{"train_loss": 1.4572656154632568, "global_step": 0, "epoch": 0} {"train_loss": 1.4363834857940674, "global_step": 1, "epoch": 0} {"train_loss": 1.4010169506072998, "global_step": 2, "epoch": 0} {"train_loss": 1.4137487411499023, "global_step": 3, "epoch": 0} {"train_loss": 1.4708596467971802, "global_step": 4, "epoch": 0} {"train_loss": 1.4130618572235107, "global_step": 5, "epoch": 0} {"train_loss": 1.446223497390747, "global_step": 6, "epoch": 0} {"train_loss": 1.4277117252349854, "global_step": 7, "epoch": 0} {"train_loss": 1.4047727584838867, "global_step": 8, "epoch": 0} {"train_loss": 1.4219249486923218, "global_step": 9, "epoch": 0} {"train_loss": 1.3971220254898071, "global_step": 10, "epoch": 0} {"train_loss": 1.4069974422454834, "global_step": 11, "epoch": 0} {"train_loss": 1.4186451435089111, "global_step": 12, "epoch": 0} {"train_loss": 1.3802493810653687, "global_step": 13, "epoch": 0} {"train_loss": 1.3841495513916016, "global_step": 14, "epoch": 0} {"train_loss": 1.3877366781234741, "global_step": 15, "epoch": 0} {"train_loss": 1.3625291585922241, "global_step": 16, "epoch": 0} {"train_loss": 1.3827130794525146, "global_step": 17, "epoch": 0} {"train_loss": 1.355515480041504, "global_step": 18, "epoch": 0} {"train_loss": 1.3559541702270508, "global_step": 19, "epoch": 0} {"train_loss": 1.3676447868347168, "global_step": 20, "epoch": 0} {"train_loss": 1.3581606149673462, "global_step": 21, "epoch": 0} {"train_loss": 1.3287193775177002, "global_step": 22, "epoch": 0} {"train_loss": 1.310462474822998, "global_step": 23, "epoch": 0} {"train_loss": 1.3392229080200195, "global_step": 24, "epoch": 0} {"train_loss": 1.3260939121246338, "global_step": 25, "epoch": 0} {"train_loss": 1.2994966506958008, "global_step": 26, "epoch": 0} {"train_loss": 1.3123793601989746, "global_step": 27, "epoch": 0} {"train_loss": 1.2499372959136963, "global_step": 28, "epoch": 0} {"train_loss": 1.2722861766815186, "global_step": 29, "epoch": 0} {"train_loss": 1.2882102727890015, "global_step": 30, "epoch": 0} {"train_loss": 1.2431923151016235, "global_step": 31, "epoch": 0} {"train_loss": 1.218435525894165, "global_step": 32, "epoch": 0} {"train_loss": 1.2138926982879639, "global_step": 33, "epoch": 0} {"train_loss": 1.2210673093795776, "global_step": 34, "epoch": 0} {"train_loss": 1.183135986328125, "global_step": 35, "epoch": 0} {"train_loss": 1.1747660636901855, "global_step": 36, "epoch": 0} {"train_loss": 1.1374133825302124, "global_step": 37, "epoch": 0} {"train_loss": 1.1271082162857056, "global_step": 38, "epoch": 0} {"train_loss": 1.1293532848358154, "global_step": 39, "epoch": 0} {"train_loss": 1.1102396249771118, "global_step": 40, "epoch": 0} {"train_loss": 1.3187636789821444, "global_step": 41, "epoch": 0, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.08473578745799996, "train/sim_max_reward_3": 0.10563019665542064, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.5497637593087155, "test/sim_max_reward_4500000": 0.31897924536482425, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.13455503383487172, "test/sim_max_reward_4500005": 0.1573857327028191, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.05409991255358192, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.059829530371475606, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.29829629030580695, "test/sim_max_reward_4500014": 0.16561182130584123, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.004249031229020703, "test/sim_max_reward_4500019": 0.39963147321879794, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.14861511220147822, "test/sim_max_reward_4500022": 0.3649989234231669, "test/sim_max_reward_4500023": 0.431168964091752, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.0, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.05325832318431668, "test/sim_max_reward_4500030": 0.2417637357732031, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0765272247743186, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.04882485170691779, "test/sim_max_reward_4500035": 0.08498010786302829, "test/sim_max_reward_4500036": 0.02257956182935472, "test/sim_max_reward_4500037": 0.0, "test/sim_max_reward_4500038": 0.1606878553606089, "test/sim_max_reward_4500039": 0.0, "test/sim_max_reward_4500040": 0.1607172078074504, "test/sim_max_reward_4500041": 0.0, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.1175735103924684, "test/sim_max_reward_4500046": 0.4209705501928377, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.15676767147011947, "test/mean_score": 0.08311111429610461, "val_loss": 10677596.0} {"train_loss": 1.068413496017456, "global_step": 42, "epoch": 1} {"train_loss": 1.0160552263259888, "global_step": 43, "epoch": 1} {"train_loss": 1.036121129989624, "global_step": 44, "epoch": 1} {"train_loss": 0.9352086782455444, "global_step": 45, "epoch": 1} {"train_loss": 0.919755220413208, "global_step": 46, "epoch": 1} {"train_loss": 0.9618508815765381, "global_step": 47, "epoch": 1} {"train_loss": 0.8641872406005859, "global_step": 48, "epoch": 1} {"train_loss": 0.8846880197525024, "global_step": 49, "epoch": 1} {"train_loss": 0.8432630896568298, "global_step": 50, "epoch": 1} {"train_loss": 0.9060846567153931, "global_step": 51, "epoch": 1} {"train_loss": 0.8438621163368225, "global_step": 52, "epoch": 1} {"train_loss": 0.8133804202079773, "global_step": 53, "epoch": 1} {"train_loss": 0.8416123390197754, "global_step": 54, "epoch": 1} {"train_loss": 0.741999626159668, "global_step": 55, "epoch": 1} {"train_loss": 0.6554780006408691, "global_step": 56, "epoch": 1} {"train_loss": 0.7390834093093872, "global_step": 57, "epoch": 1} {"train_loss": 0.7215222120285034, "global_step": 58, "epoch": 1} {"train_loss": 0.660125195980072, "global_step": 59, "epoch": 1} {"train_loss": 0.6587433815002441, "global_step": 60, "epoch": 1} {"train_loss": 0.6129822134971619, "global_step": 61, "epoch": 1} {"train_loss": 0.5588707327842712, "global_step": 62, "epoch": 1} {"train_loss": 0.521044135093689, "global_step": 63, "epoch": 1} {"train_loss": 0.6072341203689575, "global_step": 64, "epoch": 1} {"train_loss": 0.5200592279434204, "global_step": 65, "epoch": 1} {"train_loss": 0.4903531074523926, "global_step": 66, "epoch": 1} {"train_loss": 0.5260235667228699, "global_step": 67, "epoch": 1} {"train_loss": 0.44022130966186523, "global_step": 68, "epoch": 1} {"train_loss": 0.4506395757198334, "global_step": 69, "epoch": 1} {"train_loss": 0.4579158425331116, "global_step": 70, "epoch": 1} {"train_loss": 0.38993212580680847, "global_step": 71, "epoch": 1} {"train_loss": 0.38641977310180664, "global_step": 72, "epoch": 1} {"train_loss": 0.3394935131072998, "global_step": 73, "epoch": 1} {"train_loss": 0.3213428556919098, "global_step": 74, "epoch": 1} {"train_loss": 0.37692317366600037, "global_step": 75, "epoch": 1} {"train_loss": 0.3380257487297058, "global_step": 76, "epoch": 1} {"train_loss": 0.30301082134246826, "global_step": 77, "epoch": 1} {"train_loss": 0.3651536703109741, "global_step": 78, "epoch": 1} {"train_loss": 0.3044227361679077, "global_step": 79, "epoch": 1} {"train_loss": 0.2831657826900482, "global_step": 80, "epoch": 1} {"train_loss": 0.3352728486061096, "global_step": 81, "epoch": 1} {"train_loss": 0.2765437960624695, "global_step": 82, "epoch": 1} {"train_loss": 0.6071164941503888, "global_step": 83, "epoch": 1, "val_loss": 6052997.0} {"train_loss": 0.25597724318504333, "global_step": 84, "epoch": 2} {"train_loss": 0.20029039680957794, "global_step": 85, "epoch": 2} {"train_loss": 0.24169574677944183, "global_step": 86, "epoch": 2} {"train_loss": 0.24345678091049194, "global_step": 87, "epoch": 2} {"train_loss": 0.16863584518432617, "global_step": 88, "epoch": 2} {"train_loss": 0.16111567616462708, "global_step": 89, "epoch": 2} {"train_loss": 0.1340661197900772, "global_step": 90, "epoch": 2} {"train_loss": 0.23969003558158875, "global_step": 91, "epoch": 2} {"train_loss": 0.1431591808795929, "global_step": 92, "epoch": 2} {"train_loss": 0.13223350048065186, "global_step": 93, "epoch": 2} {"train_loss": 0.1234169751405716, "global_step": 94, "epoch": 2} {"train_loss": 0.08800087869167328, "global_step": 95, "epoch": 2} {"train_loss": 0.0997501015663147, "global_step": 96, "epoch": 2} {"train_loss": 0.1398436427116394, "global_step": 97, "epoch": 2} {"train_loss": 0.1430899053812027, "global_step": 98, "epoch": 2} {"train_loss": 0.16330179572105408, "global_step": 99, "epoch": 2} {"train_loss": 0.15733718872070312, "global_step": 100, "epoch": 2} {"train_loss": 0.08159197121858597, "global_step": 101, "epoch": 2} {"train_loss": 0.13245630264282227, "global_step": 102, "epoch": 2} {"train_loss": 0.11643414944410324, "global_step": 103, "epoch": 2} {"train_loss": 0.017564978450536728, "global_step": 104, "epoch": 2} {"train_loss": 0.0891382247209549, "global_step": 105, "epoch": 2} {"train_loss": 0.13172508776187897, "global_step": 106, "epoch": 2} {"train_loss": 0.029747426509857178, "global_step": 107, "epoch": 2} {"train_loss": 0.1159982904791832, "global_step": 108, "epoch": 2} {"train_loss": 0.034039489924907684, "global_step": 109, "epoch": 2} {"train_loss": 0.004029035568237305, "global_step": 110, "epoch": 2} {"train_loss": -0.02816496416926384, "global_step": 111, "epoch": 2} {"train_loss": -0.0004825834184885025, "global_step": 112, "epoch": 2} {"train_loss": 0.015549691393971443, "global_step": 113, "epoch": 2} {"train_loss": -0.04419530928134918, "global_step": 114, "epoch": 2} {"train_loss": 0.043120987713336945, "global_step": 115, "epoch": 2} {"train_loss": -0.10541769862174988, "global_step": 116, "epoch": 2} {"train_loss": -0.1194201409816742, "global_step": 117, "epoch": 2} {"train_loss": 0.05560368672013283, "global_step": 118, "epoch": 2} {"train_loss": 0.007925761863589287, "global_step": 119, "epoch": 2} {"train_loss": 0.04125615209341049, "global_step": 120, "epoch": 2} {"train_loss": -0.11072565615177155, "global_step": 121, "epoch": 2} {"train_loss": -0.12026317417621613, "global_step": 122, "epoch": 2} {"train_loss": -0.09908302128314972, "global_step": 123, "epoch": 2} {"train_loss": -0.061576418578624725, "global_step": 124, "epoch": 2} {"train_loss": 0.06943396234973556, "global_step": 125, "epoch": 2, "val_loss": 4771897.5} {"train_loss": -0.12721846997737885, "global_step": 126, "epoch": 3} {"train_loss": -0.1927415132522583, "global_step": 127, "epoch": 3} {"train_loss": -0.17494109272956848, "global_step": 128, "epoch": 3} {"train_loss": -0.04778730869293213, "global_step": 129, "epoch": 3} {"train_loss": -0.12710493803024292, "global_step": 130, "epoch": 3} {"train_loss": -0.2308109700679779, "global_step": 131, "epoch": 3} {"train_loss": -0.15680724382400513, "global_step": 132, "epoch": 3} {"train_loss": -0.15724554657936096, "global_step": 133, "epoch": 3} {"train_loss": -0.23844453692436218, "global_step": 134, "epoch": 3} {"train_loss": -0.23049801588058472, "global_step": 135, "epoch": 3} {"train_loss": -0.2486470639705658, "global_step": 136, "epoch": 3} {"train_loss": -0.23545603454113007, "global_step": 137, "epoch": 3} {"train_loss": -0.1499391496181488, "global_step": 138, "epoch": 3} {"train_loss": -0.12685103714466095, "global_step": 139, "epoch": 3} {"train_loss": -0.22952057421207428, "global_step": 140, "epoch": 3} {"train_loss": -0.24305598437786102, "global_step": 141, "epoch": 3} {"train_loss": -0.09797893464565277, "global_step": 142, "epoch": 3} {"train_loss": -0.23294320702552795, "global_step": 143, "epoch": 3} {"train_loss": -0.3023698627948761, "global_step": 144, "epoch": 3} {"train_loss": -0.18326792120933533, "global_step": 145, "epoch": 3} {"train_loss": -0.30201756954193115, "global_step": 146, "epoch": 3} {"train_loss": -0.22723382711410522, "global_step": 147, "epoch": 3} {"train_loss": -0.25769296288490295, "global_step": 148, "epoch": 3} {"train_loss": -0.21232596039772034, "global_step": 149, "epoch": 3} {"train_loss": -0.24165567755699158, "global_step": 150, "epoch": 3} {"train_loss": -0.24859488010406494, "global_step": 151, "epoch": 3} {"train_loss": -0.32185518741607666, "global_step": 152, "epoch": 3} {"train_loss": -0.3626176118850708, "global_step": 153, "epoch": 3} {"train_loss": -0.22514504194259644, "global_step": 154, "epoch": 3} {"train_loss": -0.31603050231933594, "global_step": 155, "epoch": 3} {"train_loss": -0.3664112091064453, "global_step": 156, "epoch": 3} {"train_loss": -0.2495046854019165, "global_step": 157, "epoch": 3} {"train_loss": -0.3758988082408905, "global_step": 158, "epoch": 3} {"train_loss": -0.39045172929763794, "global_step": 159, "epoch": 3} {"train_loss": -0.38187259435653687, "global_step": 160, "epoch": 3} {"train_loss": -0.4493595063686371, "global_step": 161, "epoch": 3} {"train_loss": -0.3871935307979584, "global_step": 162, "epoch": 3} {"train_loss": -0.3436901569366455, "global_step": 163, "epoch": 3} {"train_loss": -0.40728116035461426, "global_step": 164, "epoch": 3} {"train_loss": -0.33375391364097595, "global_step": 165, "epoch": 3} {"train_loss": -0.41554784774780273, "global_step": 166, "epoch": 3} {"train_loss": -0.2615595956643422, "global_step": 167, "epoch": 3, "val_loss": 4010861.25} {"train_loss": -0.28081852197647095, "global_step": 168, "epoch": 4} {"train_loss": -0.4250592291355133, "global_step": 169, "epoch": 4} {"train_loss": -0.39407089352607727, "global_step": 170, "epoch": 4} {"train_loss": -0.3764399290084839, "global_step": 171, "epoch": 4} {"train_loss": -0.43691709637641907, "global_step": 172, "epoch": 4} {"train_loss": -0.46423763036727905, "global_step": 173, "epoch": 4} {"train_loss": -0.4270005226135254, "global_step": 174, "epoch": 4} {"train_loss": -0.3936954736709595, "global_step": 175, "epoch": 4} {"train_loss": -0.47021520137786865, "global_step": 176, "epoch": 4} {"train_loss": -0.45499566197395325, "global_step": 177, "epoch": 4} {"train_loss": -0.49863576889038086, "global_step": 178, "epoch": 4} {"train_loss": -0.4677329659461975, "global_step": 179, "epoch": 4} {"train_loss": -0.4963003396987915, "global_step": 180, "epoch": 4} {"train_loss": -0.498598575592041, "global_step": 181, "epoch": 4} {"train_loss": -0.43269532918930054, "global_step": 182, "epoch": 4} {"train_loss": -0.48076292872428894, "global_step": 183, "epoch": 4} {"train_loss": -0.43105122447013855, "global_step": 184, "epoch": 4} {"train_loss": -0.47250181436538696, "global_step": 185, "epoch": 4} {"train_loss": -0.5189785957336426, "global_step": 186, "epoch": 4} {"train_loss": -0.44597819447517395, "global_step": 187, "epoch": 4} {"train_loss": -0.4435339570045471, "global_step": 188, "epoch": 4} {"train_loss": -0.45718497037887573, "global_step": 189, "epoch": 4} {"train_loss": -0.5440772771835327, "global_step": 190, "epoch": 4} {"train_loss": -0.5691732168197632, "global_step": 191, "epoch": 4} {"train_loss": -0.369911253452301, "global_step": 192, "epoch": 4} {"train_loss": -0.5761997103691101, "global_step": 193, "epoch": 4} {"train_loss": -0.6362578272819519, "global_step": 194, "epoch": 4} {"train_loss": -0.5568141937255859, "global_step": 195, "epoch": 4} {"train_loss": -0.5507619380950928, "global_step": 196, "epoch": 4} {"train_loss": -0.4715857207775116, "global_step": 197, "epoch": 4} {"train_loss": -0.4916246831417084, "global_step": 198, "epoch": 4} {"train_loss": -0.44767042994499207, "global_step": 199, "epoch": 4} {"train_loss": -0.46196281909942627, "global_step": 200, "epoch": 4} {"train_loss": -0.5419946908950806, "global_step": 201, "epoch": 4} {"train_loss": -0.6130273938179016, "global_step": 202, "epoch": 4} {"train_loss": -0.5776535868644714, "global_step": 203, "epoch": 4} {"train_loss": -0.5085811018943787, "global_step": 204, "epoch": 4} {"train_loss": -0.5431872606277466, "global_step": 205, "epoch": 4} {"train_loss": -0.5358278751373291, "global_step": 206, "epoch": 4} {"train_loss": -0.5127536654472351, "global_step": 207, "epoch": 4} {"train_loss": -0.49056950211524963, "global_step": 208, "epoch": 4} {"train_loss": -0.4826331472113019, "global_step": 209, "epoch": 4, "val_loss": 3560094.75} {"train_loss": -0.5457041263580322, "global_step": 210, "epoch": 5} {"train_loss": -0.6398467421531677, "global_step": 211, "epoch": 5} {"train_loss": -0.5784754157066345, "global_step": 212, "epoch": 5} {"train_loss": -0.5867937803268433, "global_step": 213, "epoch": 5} {"train_loss": -0.647496223449707, "global_step": 214, "epoch": 5} {"train_loss": -0.555328369140625, "global_step": 215, "epoch": 5} {"train_loss": -0.6084862947463989, "global_step": 216, "epoch": 5} {"train_loss": -0.5712878704071045, "global_step": 217, "epoch": 5} {"train_loss": -0.633490800857544, "global_step": 218, "epoch": 5} {"train_loss": -0.7138739228248596, "global_step": 219, "epoch": 5} {"train_loss": -0.6361250877380371, "global_step": 220, "epoch": 5} {"train_loss": -0.5829614996910095, "global_step": 221, "epoch": 5} {"train_loss": -0.6993433237075806, "global_step": 222, "epoch": 5} {"train_loss": -0.6336575150489807, "global_step": 223, "epoch": 5} {"train_loss": -0.6412909626960754, "global_step": 224, "epoch": 5} {"train_loss": -0.5166287422180176, "global_step": 225, "epoch": 5} {"train_loss": -0.6241491436958313, "global_step": 226, "epoch": 5} {"train_loss": -0.5281595587730408, "global_step": 227, "epoch": 5} {"train_loss": -0.6487100124359131, "global_step": 228, "epoch": 5} {"train_loss": -0.5784342885017395, "global_step": 229, "epoch": 5} {"train_loss": -0.7088286876678467, "global_step": 230, "epoch": 5} {"train_loss": -0.5970427989959717, "global_step": 231, "epoch": 5} {"train_loss": -0.7137181758880615, "global_step": 232, "epoch": 5} {"train_loss": -0.6717183589935303, "global_step": 233, "epoch": 5} {"train_loss": -0.6416304111480713, "global_step": 234, "epoch": 5} {"train_loss": -0.6459037661552429, "global_step": 235, "epoch": 5} {"train_loss": -0.655677080154419, "global_step": 236, "epoch": 5} {"train_loss": -0.63250732421875, "global_step": 237, "epoch": 5} {"train_loss": -0.6250151991844177, "global_step": 238, "epoch": 5} {"train_loss": -0.7341912984848022, "global_step": 239, "epoch": 5} {"train_loss": -0.682749330997467, "global_step": 240, "epoch": 5} {"train_loss": -0.760655403137207, "global_step": 241, "epoch": 5} {"train_loss": -0.6860860586166382, "global_step": 242, "epoch": 5} {"train_loss": -0.622266411781311, "global_step": 243, "epoch": 5} {"train_loss": -0.638081431388855, "global_step": 244, "epoch": 5} {"train_loss": -0.6726775169372559, "global_step": 245, "epoch": 5} {"train_loss": -0.7274169325828552, "global_step": 246, "epoch": 5} {"train_loss": -0.7261841297149658, "global_step": 247, "epoch": 5} {"train_loss": -0.6595166325569153, "global_step": 248, "epoch": 5} {"train_loss": -0.7430359125137329, "global_step": 249, "epoch": 5} {"train_loss": -0.7514811158180237, "global_step": 250, "epoch": 5} {"train_loss": -0.6488963521662212, "global_step": 251, "epoch": 5, "val_loss": 3187844.0} {"train_loss": -0.630021333694458, "global_step": 252, "epoch": 6} {"train_loss": -0.728559136390686, "global_step": 253, "epoch": 6} {"train_loss": -0.6759467124938965, "global_step": 254, "epoch": 6} {"train_loss": -0.7625508904457092, "global_step": 255, "epoch": 6} {"train_loss": -0.7483608722686768, "global_step": 256, "epoch": 6} {"train_loss": -0.7395157217979431, "global_step": 257, "epoch": 6} {"train_loss": -0.6883770823478699, "global_step": 258, "epoch": 6} {"train_loss": -0.8109569549560547, "global_step": 259, "epoch": 6} {"train_loss": -0.827411413192749, "global_step": 260, "epoch": 6} {"train_loss": -0.8041545152664185, "global_step": 261, "epoch": 6} {"train_loss": -0.7629643082618713, "global_step": 262, "epoch": 6} {"train_loss": -0.7451766729354858, "global_step": 263, "epoch": 6} {"train_loss": -0.7362369894981384, "global_step": 264, "epoch": 6} {"train_loss": -0.6440396308898926, "global_step": 265, "epoch": 6} {"train_loss": -0.782768726348877, "global_step": 266, "epoch": 6} {"train_loss": -0.8624649047851562, "global_step": 267, "epoch": 6} {"train_loss": -0.6823355555534363, "global_step": 268, "epoch": 6} {"train_loss": -0.8053005933761597, "global_step": 269, "epoch": 6} {"train_loss": -0.7775360345840454, "global_step": 270, "epoch": 6} {"train_loss": -0.6996023058891296, "global_step": 271, "epoch": 6} {"train_loss": -0.762649655342102, "global_step": 272, "epoch": 6} {"train_loss": -0.8047295808792114, "global_step": 273, "epoch": 6} {"train_loss": -0.7706664800643921, "global_step": 274, "epoch": 6} {"train_loss": -0.8747255206108093, "global_step": 275, "epoch": 6} {"train_loss": -0.7508838772773743, "global_step": 276, "epoch": 6} {"train_loss": -0.7873512506484985, "global_step": 277, "epoch": 6} {"train_loss": -0.7720284461975098, "global_step": 278, "epoch": 6} {"train_loss": -0.8590406775474548, "global_step": 279, "epoch": 6} {"train_loss": -0.7640962600708008, "global_step": 280, "epoch": 6} {"train_loss": -0.7317185401916504, "global_step": 281, "epoch": 6} {"train_loss": -0.8231194019317627, "global_step": 282, "epoch": 6} {"train_loss": -0.6891331672668457, "global_step": 283, "epoch": 6} {"train_loss": -0.8948837518692017, "global_step": 284, "epoch": 6} {"train_loss": -0.8380776643753052, "global_step": 285, "epoch": 6} {"train_loss": -0.7157060503959656, "global_step": 286, "epoch": 6} {"train_loss": -0.8274310827255249, "global_step": 287, "epoch": 6} {"train_loss": -0.9902694225311279, "global_step": 288, "epoch": 6} {"train_loss": -0.9072065949440002, "global_step": 289, "epoch": 6} {"train_loss": -0.8064782619476318, "global_step": 290, "epoch": 6} {"train_loss": -0.8287267684936523, "global_step": 291, "epoch": 6} {"train_loss": -0.8103715181350708, "global_step": 292, "epoch": 6} {"train_loss": -0.7783902883529663, "global_step": 293, "epoch": 6, "val_loss": 2841386.25} {"train_loss": -0.9204243421554565, "global_step": 294, "epoch": 7} {"train_loss": -0.8534953594207764, "global_step": 295, "epoch": 7} {"train_loss": -0.833771824836731, "global_step": 296, "epoch": 7} {"train_loss": -0.8026966452598572, "global_step": 297, "epoch": 7} {"train_loss": -0.7206050157546997, "global_step": 298, "epoch": 7} {"train_loss": -0.8457832336425781, "global_step": 299, "epoch": 7} {"train_loss": -0.8618469834327698, "global_step": 300, "epoch": 7} {"train_loss": -0.9107682108879089, "global_step": 301, "epoch": 7} {"train_loss": -0.8185899257659912, "global_step": 302, "epoch": 7} {"train_loss": -0.9098381996154785, "global_step": 303, "epoch": 7} {"train_loss": -0.8790614604949951, "global_step": 304, "epoch": 7} {"train_loss": -0.8867684006690979, "global_step": 305, "epoch": 7} {"train_loss": -0.8509162664413452, "global_step": 306, "epoch": 7} {"train_loss": -0.864453136920929, "global_step": 307, "epoch": 7} {"train_loss": -0.807287335395813, "global_step": 308, "epoch": 7} {"train_loss": -0.8591313362121582, "global_step": 309, "epoch": 7} {"train_loss": -0.9632092118263245, "global_step": 310, "epoch": 7} {"train_loss": -0.9992783069610596, "global_step": 311, "epoch": 7} {"train_loss": -0.8211715817451477, "global_step": 312, "epoch": 7} {"train_loss": -0.9463396072387695, "global_step": 313, "epoch": 7} {"train_loss": -0.7921940088272095, "global_step": 314, "epoch": 7} {"train_loss": -0.8720898628234863, "global_step": 315, "epoch": 7} {"train_loss": -0.9230958223342896, "global_step": 316, "epoch": 7} {"train_loss": -0.9993016123771667, "global_step": 317, "epoch": 7} {"train_loss": -0.775231122970581, "global_step": 318, "epoch": 7} {"train_loss": -0.9093807339668274, "global_step": 319, "epoch": 7} {"train_loss": -0.9107550382614136, "global_step": 320, "epoch": 7} {"train_loss": -0.8588912487030029, "global_step": 321, "epoch": 7} {"train_loss": -0.9060624241828918, "global_step": 322, "epoch": 7} {"train_loss": -0.9796351194381714, "global_step": 323, "epoch": 7} {"train_loss": -0.9327845573425293, "global_step": 324, "epoch": 7} {"train_loss": -0.8656593561172485, "global_step": 325, "epoch": 7} {"train_loss": -0.8891656398773193, "global_step": 326, "epoch": 7} {"train_loss": -0.935044527053833, "global_step": 327, "epoch": 7} {"train_loss": -0.8734742403030396, "global_step": 328, "epoch": 7} {"train_loss": -0.8717700242996216, "global_step": 329, "epoch": 7} {"train_loss": -0.8858970403671265, "global_step": 330, "epoch": 7} {"train_loss": -0.9724137783050537, "global_step": 331, "epoch": 7} {"train_loss": -0.7856473922729492, "global_step": 332, "epoch": 7} {"train_loss": -0.9461232423782349, "global_step": 333, "epoch": 7} {"train_loss": -0.8932236433029175, "global_step": 334, "epoch": 7} {"train_loss": -0.883931998695646, "global_step": 335, "epoch": 7, "val_loss": 2670844.0} {"train_loss": -0.9184783697128296, "global_step": 336, "epoch": 8} {"train_loss": -0.9541781544685364, "global_step": 337, "epoch": 8} {"train_loss": -0.9184645414352417, "global_step": 338, "epoch": 8} {"train_loss": -0.9222306609153748, "global_step": 339, "epoch": 8} {"train_loss": -0.9627135992050171, "global_step": 340, "epoch": 8} {"train_loss": -0.924983024597168, "global_step": 341, "epoch": 8} {"train_loss": -0.9823310375213623, "global_step": 342, "epoch": 8} {"train_loss": -1.0218515396118164, "global_step": 343, "epoch": 8} {"train_loss": -0.9809960722923279, "global_step": 344, "epoch": 8} {"train_loss": -1.0386834144592285, "global_step": 345, "epoch": 8} {"train_loss": -0.9005860686302185, "global_step": 346, "epoch": 8} {"train_loss": -0.9038363695144653, "global_step": 347, "epoch": 8} {"train_loss": -1.0306158065795898, "global_step": 348, "epoch": 8} {"train_loss": -0.9745512008666992, "global_step": 349, "epoch": 8} {"train_loss": -0.9724183678627014, "global_step": 350, "epoch": 8} {"train_loss": -0.9316740036010742, "global_step": 351, "epoch": 8} {"train_loss": -0.9927611947059631, "global_step": 352, "epoch": 8} {"train_loss": -0.9453691244125366, "global_step": 353, "epoch": 8} {"train_loss": -1.0888755321502686, "global_step": 354, "epoch": 8} {"train_loss": -0.9773695468902588, "global_step": 355, "epoch": 8} {"train_loss": -1.0077846050262451, "global_step": 356, "epoch": 8} {"train_loss": -1.0580048561096191, "global_step": 357, "epoch": 8} {"train_loss": -0.9872399568557739, "global_step": 358, "epoch": 8} {"train_loss": -1.0423128604888916, "global_step": 359, "epoch": 8} {"train_loss": -1.0478253364562988, "global_step": 360, "epoch": 8} {"train_loss": -1.0435631275177002, "global_step": 361, "epoch": 8} {"train_loss": -0.948617696762085, "global_step": 362, "epoch": 8} {"train_loss": -1.0161550045013428, "global_step": 363, "epoch": 8} {"train_loss": -1.0415334701538086, "global_step": 364, "epoch": 8} {"train_loss": -1.1165952682495117, "global_step": 365, "epoch": 8} {"train_loss": -1.0783604383468628, "global_step": 366, "epoch": 8} {"train_loss": -1.1721365451812744, "global_step": 367, "epoch": 8} {"train_loss": -0.9673988819122314, "global_step": 368, "epoch": 8} {"train_loss": -1.1428184509277344, "global_step": 369, "epoch": 8} {"train_loss": -1.0849568843841553, "global_step": 370, "epoch": 8} {"train_loss": -0.958265483379364, "global_step": 371, "epoch": 8} {"train_loss": -1.1806894540786743, "global_step": 372, "epoch": 8} {"train_loss": -1.154358148574829, "global_step": 373, "epoch": 8} {"train_loss": -1.0677434206008911, "global_step": 374, "epoch": 8} {"train_loss": -1.0506535768508911, "global_step": 375, "epoch": 8} {"train_loss": -1.1577625274658203, "global_step": 376, "epoch": 8} {"train_loss": -1.0168632992676325, "global_step": 377, "epoch": 8, "val_loss": 2375735.75} {"train_loss": -1.0912044048309326, "global_step": 378, "epoch": 9} {"train_loss": -1.1413764953613281, "global_step": 379, "epoch": 9} {"train_loss": -1.145896315574646, "global_step": 380, "epoch": 9} {"train_loss": -1.1094145774841309, "global_step": 381, "epoch": 9} {"train_loss": -1.0746701955795288, "global_step": 382, "epoch": 9} {"train_loss": -1.0063679218292236, "global_step": 383, "epoch": 9} {"train_loss": -1.1284208297729492, "global_step": 384, "epoch": 9} {"train_loss": -0.9938114881515503, "global_step": 385, "epoch": 9} {"train_loss": -1.030914545059204, "global_step": 386, "epoch": 9} {"train_loss": -0.9988372325897217, "global_step": 387, "epoch": 9} {"train_loss": -0.9610198736190796, "global_step": 388, "epoch": 9} {"train_loss": -1.0176594257354736, "global_step": 389, "epoch": 9} {"train_loss": -1.0992203950881958, "global_step": 390, "epoch": 9} {"train_loss": -1.075628399848938, "global_step": 391, "epoch": 9} {"train_loss": -1.1550285816192627, "global_step": 392, "epoch": 9} {"train_loss": -1.1055867671966553, "global_step": 393, "epoch": 9} {"train_loss": -1.0771846771240234, "global_step": 394, "epoch": 9} {"train_loss": -1.1868451833724976, "global_step": 395, "epoch": 9} {"train_loss": -1.0908830165863037, "global_step": 396, "epoch": 9} {"train_loss": -1.147984266281128, "global_step": 397, "epoch": 9} {"train_loss": -1.0892176628112793, "global_step": 398, "epoch": 9} {"train_loss": -1.1634858846664429, "global_step": 399, "epoch": 9} {"train_loss": -1.04301118850708, "global_step": 400, "epoch": 9} {"train_loss": -1.2688714265823364, "global_step": 401, "epoch": 9} {"train_loss": -1.1199651956558228, "global_step": 402, "epoch": 9} {"train_loss": -1.1602314710617065, "global_step": 403, "epoch": 9} {"train_loss": -1.073707103729248, "global_step": 404, "epoch": 9} {"train_loss": -1.162550687789917, "global_step": 405, "epoch": 9} {"train_loss": -1.201859712600708, "global_step": 406, "epoch": 9} {"train_loss": -1.152083396911621, "global_step": 407, "epoch": 9} {"train_loss": -1.21690034866333, "global_step": 408, "epoch": 9} {"train_loss": -1.2521779537200928, "global_step": 409, "epoch": 9} {"train_loss": -1.3253235816955566, "global_step": 410, "epoch": 9} {"train_loss": -1.1360387802124023, "global_step": 411, "epoch": 9} {"train_loss": -1.2840096950531006, "global_step": 412, "epoch": 9} {"train_loss": -1.0368938446044922, "global_step": 413, "epoch": 9} {"train_loss": -1.1835219860076904, "global_step": 414, "epoch": 9} {"train_loss": -1.241450309753418, "global_step": 415, "epoch": 9} {"train_loss": -1.2201584577560425, "global_step": 416, "epoch": 9} {"train_loss": -1.2001879215240479, "global_step": 417, "epoch": 9} {"train_loss": -1.230785608291626, "global_step": 418, "epoch": 9} {"train_loss": -1.1357617520150685, "global_step": 419, "epoch": 9, "val_loss": 2190040.25} {"train_loss": -1.1737980842590332, "global_step": 420, "epoch": 10} {"train_loss": -1.2709097862243652, "global_step": 421, "epoch": 10} {"train_loss": -1.2479430437088013, "global_step": 422, "epoch": 10} {"train_loss": -1.0696790218353271, "global_step": 423, "epoch": 10} {"train_loss": -1.2288105487823486, "global_step": 424, "epoch": 10} {"train_loss": -1.2292062044143677, "global_step": 425, "epoch": 10} {"train_loss": -1.2036879062652588, "global_step": 426, "epoch": 10} {"train_loss": -1.2061173915863037, "global_step": 427, "epoch": 10} {"train_loss": -1.20943021774292, "global_step": 428, "epoch": 10} {"train_loss": -1.1933151483535767, "global_step": 429, "epoch": 10} {"train_loss": -1.143475890159607, "global_step": 430, "epoch": 10} {"train_loss": -1.2302956581115723, "global_step": 431, "epoch": 10} {"train_loss": -1.324418306350708, "global_step": 432, "epoch": 10} {"train_loss": -1.391840934753418, "global_step": 433, "epoch": 10} {"train_loss": -1.1707179546356201, "global_step": 434, "epoch": 10} {"train_loss": -1.2728632688522339, "global_step": 435, "epoch": 10} {"train_loss": -1.1732712984085083, "global_step": 436, "epoch": 10} {"train_loss": -1.335423469543457, "global_step": 437, "epoch": 10} {"train_loss": -1.1743992567062378, "global_step": 438, "epoch": 10} {"train_loss": -1.3515909910202026, "global_step": 439, "epoch": 10} {"train_loss": -1.2293370962142944, "global_step": 440, "epoch": 10} {"train_loss": -1.337411880493164, "global_step": 441, "epoch": 10} {"train_loss": -1.2524945735931396, "global_step": 442, "epoch": 10} {"train_loss": -1.1995413303375244, "global_step": 443, "epoch": 10} {"train_loss": -1.2210439443588257, "global_step": 444, "epoch": 10} {"train_loss": -1.2422106266021729, "global_step": 445, "epoch": 10} {"train_loss": -1.4186557531356812, "global_step": 446, "epoch": 10} {"train_loss": -1.1364424228668213, "global_step": 447, "epoch": 10} {"train_loss": -1.3848798274993896, "global_step": 448, "epoch": 10} {"train_loss": -1.183443546295166, "global_step": 449, "epoch": 10} {"train_loss": -1.2738749980926514, "global_step": 450, "epoch": 10} {"train_loss": -1.314563512802124, "global_step": 451, "epoch": 10} {"train_loss": -1.2993539571762085, "global_step": 452, "epoch": 10} {"train_loss": -1.2683885097503662, "global_step": 453, "epoch": 10} {"train_loss": -1.334357738494873, "global_step": 454, "epoch": 10} {"train_loss": -1.2819957733154297, "global_step": 455, "epoch": 10} {"train_loss": -1.305543065071106, "global_step": 456, "epoch": 10} {"train_loss": -1.290880799293518, "global_step": 457, "epoch": 10} {"train_loss": -1.3235394954681396, "global_step": 458, "epoch": 10} {"train_loss": -1.3115899562835693, "global_step": 459, "epoch": 10} {"train_loss": -1.3509857654571533, "global_step": 460, "epoch": 10} {"train_loss": -1.2589180554662431, "global_step": 461, "epoch": 10, "val_loss": 1997508.125} {"train_loss": -1.4134931564331055, "global_step": 462, "epoch": 11} {"train_loss": -1.3712773323059082, "global_step": 463, "epoch": 11} {"train_loss": -1.3945361375808716, "global_step": 464, "epoch": 11} {"train_loss": -1.4589064121246338, "global_step": 465, "epoch": 11} {"train_loss": -1.3328883647918701, "global_step": 466, "epoch": 11} {"train_loss": -1.4454689025878906, "global_step": 467, "epoch": 11} {"train_loss": -1.361480951309204, "global_step": 468, "epoch": 11} {"train_loss": -1.2596750259399414, "global_step": 469, "epoch": 11} {"train_loss": -1.388948678970337, "global_step": 470, "epoch": 11} {"train_loss": -1.3867942094802856, "global_step": 471, "epoch": 11} {"train_loss": -1.3825021982192993, "global_step": 472, "epoch": 11} {"train_loss": -1.2405304908752441, "global_step": 473, "epoch": 11} {"train_loss": -1.3090789318084717, "global_step": 474, "epoch": 11} {"train_loss": -1.3793176412582397, "global_step": 475, "epoch": 11} {"train_loss": -1.4210695028305054, "global_step": 476, "epoch": 11} {"train_loss": -1.271228313446045, "global_step": 477, "epoch": 11} {"train_loss": -1.3977305889129639, "global_step": 478, "epoch": 11} {"train_loss": -1.367912769317627, "global_step": 479, "epoch": 11} {"train_loss": -1.3245718479156494, "global_step": 480, "epoch": 11} {"train_loss": -1.366316795349121, "global_step": 481, "epoch": 11} {"train_loss": -1.245725154876709, "global_step": 482, "epoch": 11} {"train_loss": -1.4376468658447266, "global_step": 483, "epoch": 11} {"train_loss": -1.430909276008606, "global_step": 484, "epoch": 11} {"train_loss": -1.3761895895004272, "global_step": 485, "epoch": 11} {"train_loss": -1.351822853088379, "global_step": 486, "epoch": 11} {"train_loss": -1.5133068561553955, "global_step": 487, "epoch": 11} {"train_loss": -1.4459726810455322, "global_step": 488, "epoch": 11} {"train_loss": -1.3697772026062012, "global_step": 489, "epoch": 11} {"train_loss": -1.374312162399292, "global_step": 490, "epoch": 11} {"train_loss": -1.3820902109146118, "global_step": 491, "epoch": 11} {"train_loss": -1.418996810913086, "global_step": 492, "epoch": 11} {"train_loss": -1.388988733291626, "global_step": 493, "epoch": 11} {"train_loss": -1.420466661453247, "global_step": 494, "epoch": 11} {"train_loss": -1.396146297454834, "global_step": 495, "epoch": 11} {"train_loss": -1.4630563259124756, "global_step": 496, "epoch": 11} {"train_loss": -1.3677964210510254, "global_step": 497, "epoch": 11} {"train_loss": -1.365706205368042, "global_step": 498, "epoch": 11} {"train_loss": -1.3782964944839478, "global_step": 499, "epoch": 11} {"train_loss": -1.354827642440796, "global_step": 500, "epoch": 11} {"train_loss": -1.3730249404907227, "global_step": 501, "epoch": 11} {"train_loss": -1.4610137939453125, "global_step": 502, "epoch": 11} {"train_loss": -1.3790372269494193, "global_step": 503, "epoch": 11, "val_loss": 1847793.625} {"train_loss": -1.4427987337112427, "global_step": 504, "epoch": 12} {"train_loss": -1.4495052099227905, "global_step": 505, "epoch": 12} {"train_loss": -1.388993740081787, "global_step": 506, "epoch": 12} {"train_loss": -1.449143886566162, "global_step": 507, "epoch": 12} {"train_loss": -1.3772143125534058, "global_step": 508, "epoch": 12} {"train_loss": -1.4107098579406738, "global_step": 509, "epoch": 12} {"train_loss": -1.3616783618927002, "global_step": 510, "epoch": 12} {"train_loss": -1.4887714385986328, "global_step": 511, "epoch": 12} {"train_loss": -1.4432973861694336, "global_step": 512, "epoch": 12} {"train_loss": -1.53090500831604, "global_step": 513, "epoch": 12} {"train_loss": -1.5184015035629272, "global_step": 514, "epoch": 12} {"train_loss": -1.4591057300567627, "global_step": 515, "epoch": 12} {"train_loss": -1.5027947425842285, "global_step": 516, "epoch": 12} {"train_loss": -1.3322805166244507, "global_step": 517, "epoch": 12} {"train_loss": -1.5576436519622803, "global_step": 518, "epoch": 12} {"train_loss": -1.5609560012817383, "global_step": 519, "epoch": 12} {"train_loss": -1.4486870765686035, "global_step": 520, "epoch": 12} {"train_loss": -1.405320167541504, "global_step": 521, "epoch": 12} {"train_loss": -1.4370543956756592, "global_step": 522, "epoch": 12} {"train_loss": -1.3861513137817383, "global_step": 523, "epoch": 12} {"train_loss": -1.497320294380188, "global_step": 524, "epoch": 12} {"train_loss": -1.4659438133239746, "global_step": 525, "epoch": 12} {"train_loss": -1.53172767162323, "global_step": 526, "epoch": 12} {"train_loss": -1.5012335777282715, "global_step": 527, "epoch": 12} {"train_loss": -1.5749591588974, "global_step": 528, "epoch": 12} {"train_loss": -1.563673496246338, "global_step": 529, "epoch": 12} {"train_loss": -1.4840378761291504, "global_step": 530, "epoch": 12} {"train_loss": -1.575014591217041, "global_step": 531, "epoch": 12} {"train_loss": -1.5474050045013428, "global_step": 532, "epoch": 12} {"train_loss": -1.3684238195419312, "global_step": 533, "epoch": 12} {"train_loss": -1.4444752931594849, "global_step": 534, "epoch": 12} {"train_loss": -1.524468183517456, "global_step": 535, "epoch": 12} {"train_loss": -1.5926740169525146, "global_step": 536, "epoch": 12} {"train_loss": -1.6585726737976074, "global_step": 537, "epoch": 12} {"train_loss": -1.4226067066192627, "global_step": 538, "epoch": 12} {"train_loss": -1.5456278324127197, "global_step": 539, "epoch": 12} {"train_loss": -1.5380339622497559, "global_step": 540, "epoch": 12} {"train_loss": -1.4668428897857666, "global_step": 541, "epoch": 12} {"train_loss": -1.544877052307129, "global_step": 542, "epoch": 12} {"train_loss": -1.2760796546936035, "global_step": 543, "epoch": 12} {"train_loss": -1.447304368019104, "global_step": 544, "epoch": 12} {"train_loss": -1.476463877019428, "global_step": 545, "epoch": 12, "val_loss": 1714513.75} {"train_loss": -1.4767193794250488, "global_step": 546, "epoch": 13} {"train_loss": -1.4796788692474365, "global_step": 547, "epoch": 13} {"train_loss": -1.541247844696045, "global_step": 548, "epoch": 13} {"train_loss": -1.5443977117538452, "global_step": 549, "epoch": 13} {"train_loss": -1.702791690826416, "global_step": 550, "epoch": 13} {"train_loss": -1.484226107597351, "global_step": 551, "epoch": 13} {"train_loss": -1.4778629541397095, "global_step": 552, "epoch": 13} {"train_loss": -1.4979976415634155, "global_step": 553, "epoch": 13} {"train_loss": -1.5552594661712646, "global_step": 554, "epoch": 13} {"train_loss": -1.5757877826690674, "global_step": 555, "epoch": 13} {"train_loss": -1.6436775922775269, "global_step": 556, "epoch": 13} {"train_loss": -1.608447551727295, "global_step": 557, "epoch": 13} {"train_loss": -1.5084466934204102, "global_step": 558, "epoch": 13} {"train_loss": -1.594562292098999, "global_step": 559, "epoch": 13} {"train_loss": -1.6550103425979614, "global_step": 560, "epoch": 13} {"train_loss": -1.5633420944213867, "global_step": 561, "epoch": 13} {"train_loss": -1.5317068099975586, "global_step": 562, "epoch": 13} {"train_loss": -1.5835907459259033, "global_step": 563, "epoch": 13} {"train_loss": -1.6780524253845215, "global_step": 564, "epoch": 13} {"train_loss": -1.6580580472946167, "global_step": 565, "epoch": 13} {"train_loss": -1.5408589839935303, "global_step": 566, "epoch": 13} {"train_loss": -1.56592857837677, "global_step": 567, "epoch": 13} {"train_loss": -1.5864005088806152, "global_step": 568, "epoch": 13} {"train_loss": -1.6663107872009277, "global_step": 569, "epoch": 13} {"train_loss": -1.6589219570159912, "global_step": 570, "epoch": 13} {"train_loss": -1.4665316343307495, "global_step": 571, "epoch": 13} {"train_loss": -1.4670054912567139, "global_step": 572, "epoch": 13} {"train_loss": -1.4837745428085327, "global_step": 573, "epoch": 13} {"train_loss": -1.650519847869873, "global_step": 574, "epoch": 13} {"train_loss": -1.5785162448883057, "global_step": 575, "epoch": 13} {"train_loss": -1.4732575416564941, "global_step": 576, "epoch": 13} {"train_loss": -1.696449875831604, "global_step": 577, "epoch": 13} {"train_loss": -1.516872525215149, "global_step": 578, "epoch": 13} {"train_loss": -1.5675547122955322, "global_step": 579, "epoch": 13} {"train_loss": -1.519345760345459, "global_step": 580, "epoch": 13} {"train_loss": -1.6374971866607666, "global_step": 581, "epoch": 13} {"train_loss": -1.5679090023040771, "global_step": 582, "epoch": 13} {"train_loss": -1.632666826248169, "global_step": 583, "epoch": 13} {"train_loss": -1.501176118850708, "global_step": 584, "epoch": 13} {"train_loss": -1.5533922910690308, "global_step": 585, "epoch": 13} {"train_loss": -1.5319725275039673, "global_step": 586, "epoch": 13} {"train_loss": -1.5658338240214758, "global_step": 587, "epoch": 13, "val_loss": 1585850.875} {"train_loss": -1.6882513761520386, "global_step": 588, "epoch": 14} {"train_loss": -1.5072654485702515, "global_step": 589, "epoch": 14} {"train_loss": -1.3837004899978638, "global_step": 590, "epoch": 14} {"train_loss": -1.7827434539794922, "global_step": 591, "epoch": 14} {"train_loss": -1.6084649562835693, "global_step": 592, "epoch": 14} {"train_loss": -1.7418001890182495, "global_step": 593, "epoch": 14} {"train_loss": -1.5508698225021362, "global_step": 594, "epoch": 14} {"train_loss": -1.6627261638641357, "global_step": 595, "epoch": 14} {"train_loss": -1.7194117307662964, "global_step": 596, "epoch": 14} {"train_loss": -1.6176503896713257, "global_step": 597, "epoch": 14} {"train_loss": -1.5954768657684326, "global_step": 598, "epoch": 14} {"train_loss": -1.7023727893829346, "global_step": 599, "epoch": 14} {"train_loss": -1.703554630279541, "global_step": 600, "epoch": 14} {"train_loss": -1.5757843255996704, "global_step": 601, "epoch": 14} {"train_loss": -1.6888794898986816, "global_step": 602, "epoch": 14} {"train_loss": -1.7265498638153076, "global_step": 603, "epoch": 14} {"train_loss": -1.6560572385787964, "global_step": 604, "epoch": 14} {"train_loss": -1.6312369108200073, "global_step": 605, "epoch": 14} {"train_loss": -1.5895297527313232, "global_step": 606, "epoch": 14} {"train_loss": -1.76718270778656, "global_step": 607, "epoch": 14} {"train_loss": -1.7563759088516235, "global_step": 608, "epoch": 14} {"train_loss": -1.739025354385376, "global_step": 609, "epoch": 14} {"train_loss": -1.7276477813720703, "global_step": 610, "epoch": 14} {"train_loss": -1.6451668739318848, "global_step": 611, "epoch": 14} {"train_loss": -1.540320873260498, "global_step": 612, "epoch": 14} {"train_loss": -1.6603655815124512, "global_step": 613, "epoch": 14} {"train_loss": -1.6191205978393555, "global_step": 614, "epoch": 14} {"train_loss": -1.6684601306915283, "global_step": 615, "epoch": 14} {"train_loss": -1.5200953483581543, "global_step": 616, "epoch": 14} {"train_loss": -1.8104455471038818, "global_step": 617, "epoch": 14} {"train_loss": -1.591054916381836, "global_step": 618, "epoch": 14} {"train_loss": -1.6952166557312012, "global_step": 619, "epoch": 14} {"train_loss": -1.7231733798980713, "global_step": 620, "epoch": 14} {"train_loss": -1.7512154579162598, "global_step": 621, "epoch": 14} {"train_loss": -1.8155081272125244, "global_step": 622, "epoch": 14} {"train_loss": -1.7900753021240234, "global_step": 623, "epoch": 14} {"train_loss": -1.6467549800872803, "global_step": 624, "epoch": 14} {"train_loss": -1.6880825757980347, "global_step": 625, "epoch": 14} {"train_loss": -1.600337266921997, "global_step": 626, "epoch": 14} {"train_loss": -1.7631912231445312, "global_step": 627, "epoch": 14} {"train_loss": -1.772573709487915, "global_step": 628, "epoch": 14} {"train_loss": -1.667915253412156, "global_step": 629, "epoch": 14, "val_loss": 1486319.25} {"train_loss": -1.5702928304672241, "global_step": 630, "epoch": 15} {"train_loss": -1.6601088047027588, "global_step": 631, "epoch": 15} {"train_loss": -1.6803350448608398, "global_step": 632, "epoch": 15} {"train_loss": -1.6742221117019653, "global_step": 633, "epoch": 15} {"train_loss": -1.8224315643310547, "global_step": 634, "epoch": 15} {"train_loss": -1.7314218282699585, "global_step": 635, "epoch": 15} {"train_loss": -1.7883343696594238, "global_step": 636, "epoch": 15} {"train_loss": -1.7649686336517334, "global_step": 637, "epoch": 15} {"train_loss": -1.9228078126907349, "global_step": 638, "epoch": 15} {"train_loss": -1.728508710861206, "global_step": 639, "epoch": 15} {"train_loss": -1.974314570426941, "global_step": 640, "epoch": 15} {"train_loss": -1.6698627471923828, "global_step": 641, "epoch": 15} {"train_loss": -1.6541602611541748, "global_step": 642, "epoch": 15} {"train_loss": -1.6158058643341064, "global_step": 643, "epoch": 15} {"train_loss": -1.7579755783081055, "global_step": 644, "epoch": 15} {"train_loss": -1.7261435985565186, "global_step": 645, "epoch": 15} {"train_loss": -1.6911485195159912, "global_step": 646, "epoch": 15} {"train_loss": -1.8926421403884888, "global_step": 647, "epoch": 15} {"train_loss": -1.7370734214782715, "global_step": 648, "epoch": 15} {"train_loss": -1.9532712697982788, "global_step": 649, "epoch": 15} {"train_loss": -1.776824712753296, "global_step": 650, "epoch": 15} {"train_loss": -1.8584644794464111, "global_step": 651, "epoch": 15} {"train_loss": -1.7062149047851562, "global_step": 652, "epoch": 15} {"train_loss": -1.79475998878479, "global_step": 653, "epoch": 15} {"train_loss": -1.8919649124145508, "global_step": 654, "epoch": 15} {"train_loss": -1.8465051651000977, "global_step": 655, "epoch": 15} {"train_loss": -1.808308482170105, "global_step": 656, "epoch": 15} {"train_loss": -1.7225399017333984, "global_step": 657, "epoch": 15} {"train_loss": -1.775397539138794, "global_step": 658, "epoch": 15} {"train_loss": -1.749333143234253, "global_step": 659, "epoch": 15} {"train_loss": -1.709395170211792, "global_step": 660, "epoch": 15} {"train_loss": -1.7841265201568604, "global_step": 661, "epoch": 15} {"train_loss": -1.8196749687194824, "global_step": 662, "epoch": 15} {"train_loss": -1.7798371315002441, "global_step": 663, "epoch": 15} {"train_loss": -1.7601656913757324, "global_step": 664, "epoch": 15} {"train_loss": -1.6926934719085693, "global_step": 665, "epoch": 15} {"train_loss": -1.9018659591674805, "global_step": 666, "epoch": 15} {"train_loss": -1.7864995002746582, "global_step": 667, "epoch": 15} {"train_loss": -1.601047158241272, "global_step": 668, "epoch": 15} {"train_loss": -1.660801649093628, "global_step": 669, "epoch": 15} {"train_loss": -1.6824918985366821, "global_step": 670, "epoch": 15} {"train_loss": -1.7579769690831502, "global_step": 671, "epoch": 15, "val_loss": 1364967.875} {"train_loss": -1.8625762462615967, "global_step": 672, "epoch": 16} {"train_loss": -1.8507789373397827, "global_step": 673, "epoch": 16} {"train_loss": -1.883939266204834, "global_step": 674, "epoch": 16} {"train_loss": -1.632570505142212, "global_step": 675, "epoch": 16} {"train_loss": -1.7138276100158691, "global_step": 676, "epoch": 16} {"train_loss": -1.7501556873321533, "global_step": 677, "epoch": 16} {"train_loss": -1.8842686414718628, "global_step": 678, "epoch": 16} {"train_loss": -1.7859737873077393, "global_step": 679, "epoch": 16} {"train_loss": -1.8328750133514404, "global_step": 680, "epoch": 16} {"train_loss": -1.7041922807693481, "global_step": 681, "epoch": 16} {"train_loss": -1.8324636220932007, "global_step": 682, "epoch": 16} {"train_loss": -1.784350872039795, "global_step": 683, "epoch": 16} {"train_loss": -1.8331239223480225, "global_step": 684, "epoch": 16} {"train_loss": -1.717649221420288, "global_step": 685, "epoch": 16} {"train_loss": -1.6647659540176392, "global_step": 686, "epoch": 16} {"train_loss": -1.6699508428573608, "global_step": 687, "epoch": 16} {"train_loss": -1.7940815687179565, "global_step": 688, "epoch": 16} {"train_loss": -1.7997381687164307, "global_step": 689, "epoch": 16} {"train_loss": -1.650001049041748, "global_step": 690, "epoch": 16} {"train_loss": -1.844759464263916, "global_step": 691, "epoch": 16} {"train_loss": -1.7524691820144653, "global_step": 692, "epoch": 16} {"train_loss": -1.8034696578979492, "global_step": 693, "epoch": 16} {"train_loss": -1.6527493000030518, "global_step": 694, "epoch": 16} {"train_loss": -1.7889132499694824, "global_step": 695, "epoch": 16} {"train_loss": -1.8722009658813477, "global_step": 696, "epoch": 16} {"train_loss": -1.7806532382965088, "global_step": 697, "epoch": 16} {"train_loss": -1.8541724681854248, "global_step": 698, "epoch": 16} {"train_loss": -1.7554253339767456, "global_step": 699, "epoch": 16} {"train_loss": -1.7005746364593506, "global_step": 700, "epoch": 16} {"train_loss": -1.8142123222351074, "global_step": 701, "epoch": 16} {"train_loss": -1.8451393842697144, "global_step": 702, "epoch": 16} {"train_loss": -1.8248662948608398, "global_step": 703, "epoch": 16} {"train_loss": -1.8215272426605225, "global_step": 704, "epoch": 16} {"train_loss": -1.8161531686782837, "global_step": 705, "epoch": 16} {"train_loss": -1.8415827751159668, "global_step": 706, "epoch": 16} {"train_loss": -1.8018836975097656, "global_step": 707, "epoch": 16} {"train_loss": -1.8833661079406738, "global_step": 708, "epoch": 16} {"train_loss": -1.9233160018920898, "global_step": 709, "epoch": 16} {"train_loss": -1.8022572994232178, "global_step": 710, "epoch": 16} {"train_loss": -1.933853030204773, "global_step": 711, "epoch": 16} {"train_loss": -1.8178791999816895, "global_step": 712, "epoch": 16} {"train_loss": -1.7985026325498308, "global_step": 713, "epoch": 16, "val_loss": 1270623.25} {"train_loss": -1.8947652578353882, "global_step": 714, "epoch": 17} {"train_loss": -1.8996111154556274, "global_step": 715, "epoch": 17} {"train_loss": -1.7726414203643799, "global_step": 716, "epoch": 17} {"train_loss": -1.8511203527450562, "global_step": 717, "epoch": 17} {"train_loss": -1.820847511291504, "global_step": 718, "epoch": 17} {"train_loss": -1.8728408813476562, "global_step": 719, "epoch": 17} {"train_loss": -1.9006515741348267, "global_step": 720, "epoch": 17} {"train_loss": -1.8932666778564453, "global_step": 721, "epoch": 17} {"train_loss": -1.8922873735427856, "global_step": 722, "epoch": 17} {"train_loss": -1.9181511402130127, "global_step": 723, "epoch": 17} {"train_loss": -1.9251465797424316, "global_step": 724, "epoch": 17} {"train_loss": -1.8667893409729004, "global_step": 725, "epoch": 17} {"train_loss": -1.8808975219726562, "global_step": 726, "epoch": 17} {"train_loss": -1.8288798332214355, "global_step": 727, "epoch": 17} {"train_loss": -1.9011855125427246, "global_step": 728, "epoch": 17} {"train_loss": -1.9582780599594116, "global_step": 729, "epoch": 17} {"train_loss": -1.9714269638061523, "global_step": 730, "epoch": 17} {"train_loss": -1.8180010318756104, "global_step": 731, "epoch": 17} {"train_loss": -1.8579174280166626, "global_step": 732, "epoch": 17} {"train_loss": -2.0121796131134033, "global_step": 733, "epoch": 17} {"train_loss": -1.9519433975219727, "global_step": 734, "epoch": 17} {"train_loss": -1.9268078804016113, "global_step": 735, "epoch": 17} {"train_loss": -2.138388156890869, "global_step": 736, "epoch": 17} {"train_loss": -1.909921646118164, "global_step": 737, "epoch": 17} {"train_loss": -1.8790192604064941, "global_step": 738, "epoch": 17} {"train_loss": -1.9607930183410645, "global_step": 739, "epoch": 17} {"train_loss": -1.9826138019561768, "global_step": 740, "epoch": 17} {"train_loss": -1.872455358505249, "global_step": 741, "epoch": 17} {"train_loss": -1.973993182182312, "global_step": 742, "epoch": 17} {"train_loss": -2.001899242401123, "global_step": 743, "epoch": 17} {"train_loss": -1.9411685466766357, "global_step": 744, "epoch": 17} {"train_loss": -1.7614383697509766, "global_step": 745, "epoch": 17} {"train_loss": -1.9898895025253296, "global_step": 746, "epoch": 17} {"train_loss": -1.893988847732544, "global_step": 747, "epoch": 17} {"train_loss": -1.7421894073486328, "global_step": 748, "epoch": 17} {"train_loss": -1.9254577159881592, "global_step": 749, "epoch": 17} {"train_loss": -1.9209990501403809, "global_step": 750, "epoch": 17} {"train_loss": -1.9128358364105225, "global_step": 751, "epoch": 17} {"train_loss": -1.9491641521453857, "global_step": 752, "epoch": 17} {"train_loss": -1.940932273864746, "global_step": 753, "epoch": 17} {"train_loss": -2.0302679538726807, "global_step": 754, "epoch": 17} {"train_loss": -1.9113971307164146, "global_step": 755, "epoch": 17, "val_loss": 1183108.125} {"train_loss": -1.9211084842681885, "global_step": 756, "epoch": 18} {"train_loss": -1.9141781330108643, "global_step": 757, "epoch": 18} {"train_loss": -1.9433417320251465, "global_step": 758, "epoch": 18} {"train_loss": -1.907694697380066, "global_step": 759, "epoch": 18} {"train_loss": -2.120218276977539, "global_step": 760, "epoch": 18} {"train_loss": -1.9616611003875732, "global_step": 761, "epoch": 18} {"train_loss": -1.9969778060913086, "global_step": 762, "epoch": 18} {"train_loss": -2.02191162109375, "global_step": 763, "epoch": 18} {"train_loss": -1.9916794300079346, "global_step": 764, "epoch": 18} {"train_loss": -2.0492069721221924, "global_step": 765, "epoch": 18} {"train_loss": -1.8650341033935547, "global_step": 766, "epoch": 18} {"train_loss": -1.8819355964660645, "global_step": 767, "epoch": 18} {"train_loss": -1.9683001041412354, "global_step": 768, "epoch": 18} {"train_loss": -1.9980909824371338, "global_step": 769, "epoch": 18} {"train_loss": -1.9341951608657837, "global_step": 770, "epoch": 18} {"train_loss": -1.8960280418395996, "global_step": 771, "epoch": 18} {"train_loss": -1.9428547620773315, "global_step": 772, "epoch": 18} {"train_loss": -1.9251593351364136, "global_step": 773, "epoch": 18} {"train_loss": -2.018838405609131, "global_step": 774, "epoch": 18} {"train_loss": -1.8628675937652588, "global_step": 775, "epoch": 18} {"train_loss": -2.0232272148132324, "global_step": 776, "epoch": 18} {"train_loss": -1.88930344581604, "global_step": 777, "epoch": 18} {"train_loss": -1.9417331218719482, "global_step": 778, "epoch": 18} {"train_loss": -1.938330888748169, "global_step": 779, "epoch": 18} {"train_loss": -1.8679388761520386, "global_step": 780, "epoch": 18} {"train_loss": -1.926408290863037, "global_step": 781, "epoch": 18} {"train_loss": -2.0311086177825928, "global_step": 782, "epoch": 18} {"train_loss": -1.9301958084106445, "global_step": 783, "epoch": 18} {"train_loss": -1.9517061710357666, "global_step": 784, "epoch": 18} {"train_loss": -1.9089605808258057, "global_step": 785, "epoch": 18} {"train_loss": -1.8908991813659668, "global_step": 786, "epoch": 18} {"train_loss": -1.9957756996154785, "global_step": 787, "epoch": 18} {"train_loss": -1.9945878982543945, "global_step": 788, "epoch": 18} {"train_loss": -1.92852783203125, "global_step": 789, "epoch": 18} {"train_loss": -2.0032453536987305, "global_step": 790, "epoch": 18} {"train_loss": -1.8958840370178223, "global_step": 791, "epoch": 18} {"train_loss": -2.0029759407043457, "global_step": 792, "epoch": 18} {"train_loss": -2.0915017127990723, "global_step": 793, "epoch": 18} {"train_loss": -2.003002643585205, "global_step": 794, "epoch": 18} {"train_loss": -2.0043630599975586, "global_step": 795, "epoch": 18} {"train_loss": -1.91475248336792, "global_step": 796, "epoch": 18} {"train_loss": -1.9618314589772905, "global_step": 797, "epoch": 18, "val_loss": 1132393.125} {"train_loss": -1.9394510984420776, "global_step": 798, "epoch": 19} {"train_loss": -1.9512596130371094, "global_step": 799, "epoch": 19} {"train_loss": -2.071925163269043, "global_step": 800, "epoch": 19} {"train_loss": -2.029475212097168, "global_step": 801, "epoch": 19} {"train_loss": -1.9737656116485596, "global_step": 802, "epoch": 19} {"train_loss": -2.064009189605713, "global_step": 803, "epoch": 19} {"train_loss": -2.040128231048584, "global_step": 804, "epoch": 19} {"train_loss": -2.012105703353882, "global_step": 805, "epoch": 19} {"train_loss": -1.8169312477111816, "global_step": 806, "epoch": 19} {"train_loss": -1.9249117374420166, "global_step": 807, "epoch": 19} {"train_loss": -2.037188768386841, "global_step": 808, "epoch": 19} {"train_loss": -2.0959582328796387, "global_step": 809, "epoch": 19} {"train_loss": -1.9235481023788452, "global_step": 810, "epoch": 19} {"train_loss": -2.1289072036743164, "global_step": 811, "epoch": 19} {"train_loss": -2.065446138381958, "global_step": 812, "epoch": 19} {"train_loss": -2.036081552505493, "global_step": 813, "epoch": 19} {"train_loss": -2.1379661560058594, "global_step": 814, "epoch": 19} {"train_loss": -2.1042912006378174, "global_step": 815, "epoch": 19} {"train_loss": -2.1117939949035645, "global_step": 816, "epoch": 19} {"train_loss": -2.0171728134155273, "global_step": 817, "epoch": 19} {"train_loss": -2.0758535861968994, "global_step": 818, "epoch": 19} {"train_loss": -1.9493591785430908, "global_step": 819, "epoch": 19} {"train_loss": -2.0631325244903564, "global_step": 820, "epoch": 19} {"train_loss": -1.972569465637207, "global_step": 821, "epoch": 19} {"train_loss": -2.104722023010254, "global_step": 822, "epoch": 19} {"train_loss": -1.8710280656814575, "global_step": 823, "epoch": 19} {"train_loss": -2.0890307426452637, "global_step": 824, "epoch": 19} {"train_loss": -1.9293935298919678, "global_step": 825, "epoch": 19} {"train_loss": -1.999126672744751, "global_step": 826, "epoch": 19} {"train_loss": -2.2574827671051025, "global_step": 827, "epoch": 19} {"train_loss": -2.1441879272460938, "global_step": 828, "epoch": 19} {"train_loss": -2.034208297729492, "global_step": 829, "epoch": 19} {"train_loss": -2.13777494430542, "global_step": 830, "epoch": 19} {"train_loss": -2.154247760772705, "global_step": 831, "epoch": 19} {"train_loss": -1.8989872932434082, "global_step": 832, "epoch": 19} {"train_loss": -2.0800766944885254, "global_step": 833, "epoch": 19} {"train_loss": -1.9931488037109375, "global_step": 834, "epoch": 19} {"train_loss": -2.020874500274658, "global_step": 835, "epoch": 19} {"train_loss": -2.1280322074890137, "global_step": 836, "epoch": 19} {"train_loss": -1.9779956340789795, "global_step": 837, "epoch": 19} {"train_loss": -2.0716443061828613, "global_step": 838, "epoch": 19} {"train_loss": -2.0374408818426586, "global_step": 839, "epoch": 19, "val_loss": 1067108.375} {"train_loss": -1.9803465604782104, "global_step": 840, "epoch": 20} {"train_loss": -2.237555503845215, "global_step": 841, "epoch": 20} {"train_loss": -2.1822376251220703, "global_step": 842, "epoch": 20} {"train_loss": -2.0949368476867676, "global_step": 843, "epoch": 20} {"train_loss": -1.9961974620819092, "global_step": 844, "epoch": 20} {"train_loss": -2.1446170806884766, "global_step": 845, "epoch": 20} {"train_loss": -2.1225786209106445, "global_step": 846, "epoch": 20} {"train_loss": -2.0444693565368652, "global_step": 847, "epoch": 20} {"train_loss": -2.0283665657043457, "global_step": 848, "epoch": 20} {"train_loss": -2.054100513458252, "global_step": 849, "epoch": 20} {"train_loss": -2.0394175052642822, "global_step": 850, "epoch": 20} {"train_loss": -2.050325393676758, "global_step": 851, "epoch": 20} {"train_loss": -2.093513011932373, "global_step": 852, "epoch": 20} {"train_loss": -2.1452202796936035, "global_step": 853, "epoch": 20} {"train_loss": -2.1838996410369873, "global_step": 854, "epoch": 20} {"train_loss": -2.159424304962158, "global_step": 855, "epoch": 20} {"train_loss": -1.9339640140533447, "global_step": 856, "epoch": 20} {"train_loss": -2.20045804977417, "global_step": 857, "epoch": 20} {"train_loss": -2.1963303089141846, "global_step": 858, "epoch": 20} {"train_loss": -2.029984712600708, "global_step": 859, "epoch": 20} {"train_loss": -2.0331757068634033, "global_step": 860, "epoch": 20} {"train_loss": -2.011983871459961, "global_step": 861, "epoch": 20} {"train_loss": -2.2143173217773438, "global_step": 862, "epoch": 20} {"train_loss": -2.077937364578247, "global_step": 863, "epoch": 20} {"train_loss": -2.128683090209961, "global_step": 864, "epoch": 20} {"train_loss": -2.0604937076568604, "global_step": 865, "epoch": 20} {"train_loss": -2.1374504566192627, "global_step": 866, "epoch": 20} {"train_loss": -2.0685946941375732, "global_step": 867, "epoch": 20} {"train_loss": -2.0833802223205566, "global_step": 868, "epoch": 20} {"train_loss": -2.166090726852417, "global_step": 869, "epoch": 20} {"train_loss": -2.1528432369232178, "global_step": 870, "epoch": 20} {"train_loss": -2.104203939437866, "global_step": 871, "epoch": 20} {"train_loss": -2.105001926422119, "global_step": 872, "epoch": 20} {"train_loss": -2.0066933631896973, "global_step": 873, "epoch": 20} {"train_loss": -2.1890368461608887, "global_step": 874, "epoch": 20} {"train_loss": -2.2003421783447266, "global_step": 875, "epoch": 20} {"train_loss": -2.1265082359313965, "global_step": 876, "epoch": 20} {"train_loss": -2.225414276123047, "global_step": 877, "epoch": 20} {"train_loss": -2.0545883178710938, "global_step": 878, "epoch": 20} {"train_loss": -2.1424121856689453, "global_step": 879, "epoch": 20} {"train_loss": -2.187305450439453, "global_step": 880, "epoch": 20} {"train_loss": -2.1064044322286333, "global_step": 881, "epoch": 20, "val_loss": 1006382.25} {"train_loss": -2.2571067810058594, "global_step": 882, "epoch": 21} {"train_loss": -2.2217884063720703, "global_step": 883, "epoch": 21} {"train_loss": -2.191958427429199, "global_step": 884, "epoch": 21} {"train_loss": -2.2516326904296875, "global_step": 885, "epoch": 21} {"train_loss": -2.234462261199951, "global_step": 886, "epoch": 21} {"train_loss": -2.0529956817626953, "global_step": 887, "epoch": 21} {"train_loss": -2.126858711242676, "global_step": 888, "epoch": 21} {"train_loss": -2.2134406566619873, "global_step": 889, "epoch": 21} {"train_loss": -2.1120080947875977, "global_step": 890, "epoch": 21} {"train_loss": -2.0185675621032715, "global_step": 891, "epoch": 21} {"train_loss": -2.110422372817993, "global_step": 892, "epoch": 21} {"train_loss": -2.2035207748413086, "global_step": 893, "epoch": 21} {"train_loss": -2.178699016571045, "global_step": 894, "epoch": 21} {"train_loss": -2.0790505409240723, "global_step": 895, "epoch": 21} {"train_loss": -2.1229372024536133, "global_step": 896, "epoch": 21} {"train_loss": -2.1984848976135254, "global_step": 897, "epoch": 21} {"train_loss": -2.203640937805176, "global_step": 898, "epoch": 21} {"train_loss": -2.2294998168945312, "global_step": 899, "epoch": 21} {"train_loss": -2.2447237968444824, "global_step": 900, "epoch": 21} {"train_loss": -2.079657554626465, "global_step": 901, "epoch": 21} {"train_loss": -2.0978000164031982, "global_step": 902, "epoch": 21} {"train_loss": -2.265687942504883, "global_step": 903, "epoch": 21} {"train_loss": -2.18888783454895, "global_step": 904, "epoch": 21} {"train_loss": -2.095440626144409, "global_step": 905, "epoch": 21} {"train_loss": -2.269537925720215, "global_step": 906, "epoch": 21} {"train_loss": -2.1559925079345703, "global_step": 907, "epoch": 21} {"train_loss": -2.2015719413757324, "global_step": 908, "epoch": 21} {"train_loss": -2.186034679412842, "global_step": 909, "epoch": 21} {"train_loss": -2.3116674423217773, "global_step": 910, "epoch": 21} {"train_loss": -2.1129252910614014, "global_step": 911, "epoch": 21} {"train_loss": -2.2126331329345703, "global_step": 912, "epoch": 21} {"train_loss": -2.2551352977752686, "global_step": 913, "epoch": 21} {"train_loss": -2.158806085586548, "global_step": 914, "epoch": 21} {"train_loss": -2.239461660385132, "global_step": 915, "epoch": 21} {"train_loss": -2.208904981613159, "global_step": 916, "epoch": 21} {"train_loss": -2.043194532394409, "global_step": 917, "epoch": 21} {"train_loss": -2.3344662189483643, "global_step": 918, "epoch": 21} {"train_loss": -2.272976875305176, "global_step": 919, "epoch": 21} {"train_loss": -2.3292980194091797, "global_step": 920, "epoch": 21} {"train_loss": -2.034661293029785, "global_step": 921, "epoch": 21} {"train_loss": -2.1085104942321777, "global_step": 922, "epoch": 21} {"train_loss": -2.180882221176511, "global_step": 923, "epoch": 21, "val_loss": 958535.0} {"train_loss": -1.9796173572540283, "global_step": 924, "epoch": 22} {"train_loss": -2.088848114013672, "global_step": 925, "epoch": 22} {"train_loss": -1.9982922077178955, "global_step": 926, "epoch": 22} {"train_loss": -2.1422431468963623, "global_step": 927, "epoch": 22} {"train_loss": -2.153398036956787, "global_step": 928, "epoch": 22} {"train_loss": -2.232358932495117, "global_step": 929, "epoch": 22} {"train_loss": -1.9314801692962646, "global_step": 930, "epoch": 22} {"train_loss": -2.0350170135498047, "global_step": 931, "epoch": 22} {"train_loss": -2.0031800270080566, "global_step": 932, "epoch": 22} {"train_loss": -2.0410478115081787, "global_step": 933, "epoch": 22} {"train_loss": -2.305494785308838, "global_step": 934, "epoch": 22} {"train_loss": -1.9825425148010254, "global_step": 935, "epoch": 22} {"train_loss": -2.401881694793701, "global_step": 936, "epoch": 22} {"train_loss": -2.0814545154571533, "global_step": 937, "epoch": 22} {"train_loss": -2.2108330726623535, "global_step": 938, "epoch": 22} {"train_loss": -2.2016091346740723, "global_step": 939, "epoch": 22} {"train_loss": -2.203298807144165, "global_step": 940, "epoch": 22} {"train_loss": -2.2167603969573975, "global_step": 941, "epoch": 22} {"train_loss": -2.0860211849212646, "global_step": 942, "epoch": 22} {"train_loss": -2.1877493858337402, "global_step": 943, "epoch": 22} {"train_loss": -2.1463539600372314, "global_step": 944, "epoch": 22} {"train_loss": -2.2752246856689453, "global_step": 945, "epoch": 22} {"train_loss": -2.313964366912842, "global_step": 946, "epoch": 22} {"train_loss": -2.377434730529785, "global_step": 947, "epoch": 22} {"train_loss": -2.224388599395752, "global_step": 948, "epoch": 22} {"train_loss": -2.349085569381714, "global_step": 949, "epoch": 22} {"train_loss": -2.216038227081299, "global_step": 950, "epoch": 22} {"train_loss": -2.227572441101074, "global_step": 951, "epoch": 22} {"train_loss": -2.2879157066345215, "global_step": 952, "epoch": 22} {"train_loss": -2.2999000549316406, "global_step": 953, "epoch": 22} {"train_loss": -2.3062541484832764, "global_step": 954, "epoch": 22} {"train_loss": -2.0625319480895996, "global_step": 955, "epoch": 22} {"train_loss": -2.310479164123535, "global_step": 956, "epoch": 22} {"train_loss": -2.319871425628662, "global_step": 957, "epoch": 22} {"train_loss": -2.151139736175537, "global_step": 958, "epoch": 22} {"train_loss": -2.18182110786438, "global_step": 959, "epoch": 22} {"train_loss": -2.183441400527954, "global_step": 960, "epoch": 22} {"train_loss": -2.23944091796875, "global_step": 961, "epoch": 22} {"train_loss": -2.26961612701416, "global_step": 962, "epoch": 22} {"train_loss": -2.3416032791137695, "global_step": 963, "epoch": 22} {"train_loss": -2.319246768951416, "global_step": 964, "epoch": 22} {"train_loss": -2.190891668910072, "global_step": 965, "epoch": 22, "val_loss": 911081.75} {"train_loss": -2.2001237869262695, "global_step": 966, "epoch": 23} {"train_loss": -2.326982021331787, "global_step": 967, "epoch": 23} {"train_loss": -2.2221274375915527, "global_step": 968, "epoch": 23} {"train_loss": -2.379171371459961, "global_step": 969, "epoch": 23} {"train_loss": -2.3172380924224854, "global_step": 970, "epoch": 23} {"train_loss": -2.229254722595215, "global_step": 971, "epoch": 23} {"train_loss": -2.094437599182129, "global_step": 972, "epoch": 23} {"train_loss": -2.3144545555114746, "global_step": 973, "epoch": 23} {"train_loss": -2.3169350624084473, "global_step": 974, "epoch": 23} {"train_loss": -2.305901527404785, "global_step": 975, "epoch": 23} {"train_loss": -2.295490026473999, "global_step": 976, "epoch": 23} {"train_loss": -2.2493627071380615, "global_step": 977, "epoch": 23} {"train_loss": -2.290187358856201, "global_step": 978, "epoch": 23} {"train_loss": -2.267625093460083, "global_step": 979, "epoch": 23} {"train_loss": -2.2939772605895996, "global_step": 980, "epoch": 23} {"train_loss": -2.3891022205352783, "global_step": 981, "epoch": 23} {"train_loss": -2.330681324005127, "global_step": 982, "epoch": 23} {"train_loss": -2.000352621078491, "global_step": 983, "epoch": 23} {"train_loss": -2.0410890579223633, "global_step": 984, "epoch": 23} {"train_loss": -2.250588893890381, "global_step": 985, "epoch": 23} {"train_loss": -2.159001350402832, "global_step": 986, "epoch": 23} {"train_loss": -2.108382225036621, "global_step": 987, "epoch": 23} {"train_loss": -1.9590753316879272, "global_step": 988, "epoch": 23} {"train_loss": -2.1755619049072266, "global_step": 989, "epoch": 23} {"train_loss": -1.8750741481781006, "global_step": 990, "epoch": 23} {"train_loss": -2.0740089416503906, "global_step": 991, "epoch": 23} {"train_loss": -2.0120363235473633, "global_step": 992, "epoch": 23} {"train_loss": -1.9406343698501587, "global_step": 993, "epoch": 23} {"train_loss": -2.21958065032959, "global_step": 994, "epoch": 23} {"train_loss": -2.0590591430664062, "global_step": 995, "epoch": 23} {"train_loss": -1.9974795579910278, "global_step": 996, "epoch": 23} {"train_loss": -2.226053237915039, "global_step": 997, "epoch": 23} {"train_loss": -2.0720438957214355, "global_step": 998, "epoch": 23} {"train_loss": -2.212887763977051, "global_step": 999, "epoch": 23} {"train_loss": -2.164778709411621, "global_step": 1000, "epoch": 23} {"train_loss": -1.9569473266601562, "global_step": 1001, "epoch": 23} {"train_loss": -2.2935800552368164, "global_step": 1002, "epoch": 23} {"train_loss": -2.255148410797119, "global_step": 1003, "epoch": 23} {"train_loss": -2.1201608180999756, "global_step": 1004, "epoch": 23} {"train_loss": -2.221834182739258, "global_step": 1005, "epoch": 23} {"train_loss": -2.2262704372406006, "global_step": 1006, "epoch": 23} {"train_loss": -2.1835947178658985, "global_step": 1007, "epoch": 23, "val_loss": 892163.3125} {"train_loss": -2.3039157390594482, "global_step": 1008, "epoch": 24} {"train_loss": -2.299639940261841, "global_step": 1009, "epoch": 24} {"train_loss": -2.315162181854248, "global_step": 1010, "epoch": 24} {"train_loss": -2.249044418334961, "global_step": 1011, "epoch": 24} {"train_loss": -2.3502979278564453, "global_step": 1012, "epoch": 24} {"train_loss": -2.4106810092926025, "global_step": 1013, "epoch": 24} {"train_loss": -2.32916259765625, "global_step": 1014, "epoch": 24} {"train_loss": -2.4340362548828125, "global_step": 1015, "epoch": 24} {"train_loss": -2.275225877761841, "global_step": 1016, "epoch": 24} {"train_loss": -2.326991081237793, "global_step": 1017, "epoch": 24} {"train_loss": -2.2718257904052734, "global_step": 1018, "epoch": 24} {"train_loss": -2.4045751094818115, "global_step": 1019, "epoch": 24} {"train_loss": -2.3163771629333496, "global_step": 1020, "epoch": 24} {"train_loss": -2.153952121734619, "global_step": 1021, "epoch": 24} {"train_loss": -2.198882579803467, "global_step": 1022, "epoch": 24} {"train_loss": -2.3673646450042725, "global_step": 1023, "epoch": 24} {"train_loss": -2.329620599746704, "global_step": 1024, "epoch": 24} {"train_loss": -2.3347651958465576, "global_step": 1025, "epoch": 24} {"train_loss": -2.375275135040283, "global_step": 1026, "epoch": 24} {"train_loss": -2.3734586238861084, "global_step": 1027, "epoch": 24} {"train_loss": -2.2566075325012207, "global_step": 1028, "epoch": 24} {"train_loss": -2.3672871589660645, "global_step": 1029, "epoch": 24} {"train_loss": -2.3493852615356445, "global_step": 1030, "epoch": 24} {"train_loss": -2.370479106903076, "global_step": 1031, "epoch": 24} {"train_loss": -2.3859379291534424, "global_step": 1032, "epoch": 24} {"train_loss": -2.3126258850097656, "global_step": 1033, "epoch": 24} {"train_loss": -2.2330188751220703, "global_step": 1034, "epoch": 24} {"train_loss": -2.2931480407714844, "global_step": 1035, "epoch": 24} {"train_loss": -2.243377208709717, "global_step": 1036, "epoch": 24} {"train_loss": -2.2744228839874268, "global_step": 1037, "epoch": 24} {"train_loss": -2.0006470680236816, "global_step": 1038, "epoch": 24} {"train_loss": -2.343360424041748, "global_step": 1039, "epoch": 24} {"train_loss": -2.0432868003845215, "global_step": 1040, "epoch": 24} {"train_loss": -2.2054128646850586, "global_step": 1041, "epoch": 24} {"train_loss": -2.224351644515991, "global_step": 1042, "epoch": 24} {"train_loss": -2.1828293800354004, "global_step": 1043, "epoch": 24} {"train_loss": -2.3622512817382812, "global_step": 1044, "epoch": 24} {"train_loss": -2.2195796966552734, "global_step": 1045, "epoch": 24} {"train_loss": -2.205535888671875, "global_step": 1046, "epoch": 24} {"train_loss": -2.4119207859039307, "global_step": 1047, "epoch": 24} {"train_loss": -2.0211284160614014, "global_step": 1048, "epoch": 24} {"train_loss": -2.28718638420105, "global_step": 1049, "epoch": 24, "val_loss": 867624.375} {"train_loss": -2.1191294193267822, "global_step": 1050, "epoch": 25} {"train_loss": -2.2889013290405273, "global_step": 1051, "epoch": 25} {"train_loss": -2.177116632461548, "global_step": 1052, "epoch": 25} {"train_loss": -2.0800466537475586, "global_step": 1053, "epoch": 25} {"train_loss": -2.3143534660339355, "global_step": 1054, "epoch": 25} {"train_loss": -2.2456905841827393, "global_step": 1055, "epoch": 25} {"train_loss": -2.3512206077575684, "global_step": 1056, "epoch": 25} {"train_loss": -2.3082382678985596, "global_step": 1057, "epoch": 25} {"train_loss": -2.2228121757507324, "global_step": 1058, "epoch": 25} {"train_loss": -2.2215781211853027, "global_step": 1059, "epoch": 25} {"train_loss": -2.260727882385254, "global_step": 1060, "epoch": 25} {"train_loss": -2.3054065704345703, "global_step": 1061, "epoch": 25} {"train_loss": -2.376722812652588, "global_step": 1062, "epoch": 25} {"train_loss": -2.2604355812072754, "global_step": 1063, "epoch": 25} {"train_loss": -2.2200770378112793, "global_step": 1064, "epoch": 25} {"train_loss": -2.3962697982788086, "global_step": 1065, "epoch": 25} {"train_loss": -2.330385684967041, "global_step": 1066, "epoch": 25} {"train_loss": -2.3969497680664062, "global_step": 1067, "epoch": 25} {"train_loss": -2.4284579753875732, "global_step": 1068, "epoch": 25} {"train_loss": -2.413538932800293, "global_step": 1069, "epoch": 25} {"train_loss": -2.3795790672302246, "global_step": 1070, "epoch": 25} {"train_loss": -2.3970868587493896, "global_step": 1071, "epoch": 25} {"train_loss": -2.3633370399475098, "global_step": 1072, "epoch": 25} {"train_loss": -2.296281576156616, "global_step": 1073, "epoch": 25} {"train_loss": -2.2054390907287598, "global_step": 1074, "epoch": 25} {"train_loss": -2.3002090454101562, "global_step": 1075, "epoch": 25} {"train_loss": -2.255235195159912, "global_step": 1076, "epoch": 25} {"train_loss": -2.2378690242767334, "global_step": 1077, "epoch": 25} {"train_loss": -2.329355478286743, "global_step": 1078, "epoch": 25} {"train_loss": -2.213615894317627, "global_step": 1079, "epoch": 25} {"train_loss": -2.3290553092956543, "global_step": 1080, "epoch": 25} {"train_loss": -2.187244176864624, "global_step": 1081, "epoch": 25} {"train_loss": -2.344539165496826, "global_step": 1082, "epoch": 25} {"train_loss": -2.2345380783081055, "global_step": 1083, "epoch": 25} {"train_loss": -2.2194674015045166, "global_step": 1084, "epoch": 25} {"train_loss": -2.2094264030456543, "global_step": 1085, "epoch": 25} {"train_loss": -2.43173885345459, "global_step": 1086, "epoch": 25} {"train_loss": -2.2732410430908203, "global_step": 1087, "epoch": 25} {"train_loss": -2.4442508220672607, "global_step": 1088, "epoch": 25} {"train_loss": -2.299724817276001, "global_step": 1089, "epoch": 25} {"train_loss": -2.386629343032837, "global_step": 1090, "epoch": 25} {"train_loss": -2.2959655977430797, "global_step": 1091, "epoch": 25, "val_loss": 803432.0625} {"train_loss": -2.3828516006469727, "global_step": 1092, "epoch": 26} {"train_loss": -2.2723183631896973, "global_step": 1093, "epoch": 26} {"train_loss": -2.4881134033203125, "global_step": 1094, "epoch": 26} {"train_loss": -2.455656051635742, "global_step": 1095, "epoch": 26} {"train_loss": -2.280233383178711, "global_step": 1096, "epoch": 26} {"train_loss": -2.4537835121154785, "global_step": 1097, "epoch": 26} {"train_loss": -2.3649299144744873, "global_step": 1098, "epoch": 26} {"train_loss": -2.418994426727295, "global_step": 1099, "epoch": 26} {"train_loss": -2.439401149749756, "global_step": 1100, "epoch": 26} {"train_loss": -2.4098124504089355, "global_step": 1101, "epoch": 26} {"train_loss": -2.493232488632202, "global_step": 1102, "epoch": 26} {"train_loss": -2.3511672019958496, "global_step": 1103, "epoch": 26} {"train_loss": -2.4674386978149414, "global_step": 1104, "epoch": 26} {"train_loss": -2.493201494216919, "global_step": 1105, "epoch": 26} {"train_loss": -2.3130760192871094, "global_step": 1106, "epoch": 26} {"train_loss": -2.3270530700683594, "global_step": 1107, "epoch": 26} {"train_loss": -2.5145366191864014, "global_step": 1108, "epoch": 26} {"train_loss": -2.511319637298584, "global_step": 1109, "epoch": 26} {"train_loss": -2.4323787689208984, "global_step": 1110, "epoch": 26} {"train_loss": -2.3134305477142334, "global_step": 1111, "epoch": 26} {"train_loss": -2.4249963760375977, "global_step": 1112, "epoch": 26} {"train_loss": -2.420729398727417, "global_step": 1113, "epoch": 26} {"train_loss": -2.2863240242004395, "global_step": 1114, "epoch": 26} {"train_loss": -2.38625431060791, "global_step": 1115, "epoch": 26} {"train_loss": -2.4760758876800537, "global_step": 1116, "epoch": 26} {"train_loss": -2.405768871307373, "global_step": 1117, "epoch": 26} {"train_loss": -2.4251251220703125, "global_step": 1118, "epoch": 26} {"train_loss": -2.500361919403076, "global_step": 1119, "epoch": 26} {"train_loss": -2.4133129119873047, "global_step": 1120, "epoch": 26} {"train_loss": -2.4481778144836426, "global_step": 1121, "epoch": 26} {"train_loss": -2.5040464401245117, "global_step": 1122, "epoch": 26} {"train_loss": -2.383558750152588, "global_step": 1123, "epoch": 26} {"train_loss": -2.5207624435424805, "global_step": 1124, "epoch": 26} {"train_loss": -2.4590930938720703, "global_step": 1125, "epoch": 26} {"train_loss": -2.412008762359619, "global_step": 1126, "epoch": 26} {"train_loss": -2.5491995811462402, "global_step": 1127, "epoch": 26} {"train_loss": -2.540271520614624, "global_step": 1128, "epoch": 26} {"train_loss": -2.3951330184936523, "global_step": 1129, "epoch": 26} {"train_loss": -2.43160080909729, "global_step": 1130, "epoch": 26} {"train_loss": -2.5220394134521484, "global_step": 1131, "epoch": 26} {"train_loss": -2.5821306705474854, "global_step": 1132, "epoch": 26} {"train_loss": -2.431633920896621, "global_step": 1133, "epoch": 26, "val_loss": 762527.9375} {"train_loss": -2.4651074409484863, "global_step": 1134, "epoch": 27} {"train_loss": -2.4559195041656494, "global_step": 1135, "epoch": 27} {"train_loss": -2.5824732780456543, "global_step": 1136, "epoch": 27} {"train_loss": -2.5065271854400635, "global_step": 1137, "epoch": 27} {"train_loss": -2.4227120876312256, "global_step": 1138, "epoch": 27} {"train_loss": -2.4185681343078613, "global_step": 1139, "epoch": 27} {"train_loss": -2.3857171535491943, "global_step": 1140, "epoch": 27} {"train_loss": -2.5715744495391846, "global_step": 1141, "epoch": 27} {"train_loss": -2.4782092571258545, "global_step": 1142, "epoch": 27} {"train_loss": -2.5337464809417725, "global_step": 1143, "epoch": 27} {"train_loss": -2.462038040161133, "global_step": 1144, "epoch": 27} {"train_loss": -2.58253812789917, "global_step": 1145, "epoch": 27} {"train_loss": -2.2910985946655273, "global_step": 1146, "epoch": 27} {"train_loss": -2.430542469024658, "global_step": 1147, "epoch": 27} {"train_loss": -2.483797550201416, "global_step": 1148, "epoch": 27} {"train_loss": -2.6703898906707764, "global_step": 1149, "epoch": 27} {"train_loss": -2.519774913787842, "global_step": 1150, "epoch": 27} {"train_loss": -2.438901901245117, "global_step": 1151, "epoch": 27} {"train_loss": -2.403324842453003, "global_step": 1152, "epoch": 27} {"train_loss": -2.4618587493896484, "global_step": 1153, "epoch": 27} {"train_loss": -2.5788373947143555, "global_step": 1154, "epoch": 27} {"train_loss": -2.391575336456299, "global_step": 1155, "epoch": 27} {"train_loss": -2.551426887512207, "global_step": 1156, "epoch": 27} {"train_loss": -2.5410995483398438, "global_step": 1157, "epoch": 27} {"train_loss": -2.270853042602539, "global_step": 1158, "epoch": 27} {"train_loss": -2.475114107131958, "global_step": 1159, "epoch": 27} {"train_loss": -2.3695075511932373, "global_step": 1160, "epoch": 27} {"train_loss": -2.560189723968506, "global_step": 1161, "epoch": 27} {"train_loss": -2.2820301055908203, "global_step": 1162, "epoch": 27} {"train_loss": -2.5974578857421875, "global_step": 1163, "epoch": 27} {"train_loss": -2.028852939605713, "global_step": 1164, "epoch": 27} {"train_loss": -2.3287200927734375, "global_step": 1165, "epoch": 27} {"train_loss": -2.234445810317993, "global_step": 1166, "epoch": 27} {"train_loss": -2.4634299278259277, "global_step": 1167, "epoch": 27} {"train_loss": -2.4691576957702637, "global_step": 1168, "epoch": 27} {"train_loss": -2.553565502166748, "global_step": 1169, "epoch": 27} {"train_loss": -2.4188952445983887, "global_step": 1170, "epoch": 27} {"train_loss": -2.442075252532959, "global_step": 1171, "epoch": 27} {"train_loss": -2.4651758670806885, "global_step": 1172, "epoch": 27} {"train_loss": -2.5161547660827637, "global_step": 1173, "epoch": 27} {"train_loss": -2.5795111656188965, "global_step": 1174, "epoch": 27} {"train_loss": -2.454659734453474, "global_step": 1175, "epoch": 27, "val_loss": 686424.3125} {"train_loss": -2.4188363552093506, "global_step": 1176, "epoch": 28} {"train_loss": -2.588268756866455, "global_step": 1177, "epoch": 28} {"train_loss": -2.5660746097564697, "global_step": 1178, "epoch": 28} {"train_loss": -2.411578893661499, "global_step": 1179, "epoch": 28} {"train_loss": -2.5191650390625, "global_step": 1180, "epoch": 28} {"train_loss": -2.581299304962158, "global_step": 1181, "epoch": 28} {"train_loss": -2.4858970642089844, "global_step": 1182, "epoch": 28} {"train_loss": -2.5556983947753906, "global_step": 1183, "epoch": 28} {"train_loss": -2.616647720336914, "global_step": 1184, "epoch": 28} {"train_loss": -2.6345276832580566, "global_step": 1185, "epoch": 28} {"train_loss": -2.4853131771087646, "global_step": 1186, "epoch": 28} {"train_loss": -2.5648908615112305, "global_step": 1187, "epoch": 28} {"train_loss": -2.560974597930908, "global_step": 1188, "epoch": 28} {"train_loss": -2.5279102325439453, "global_step": 1189, "epoch": 28} {"train_loss": -2.6549720764160156, "global_step": 1190, "epoch": 28} {"train_loss": -2.4911694526672363, "global_step": 1191, "epoch": 28} {"train_loss": -2.5352752208709717, "global_step": 1192, "epoch": 28} {"train_loss": -2.4136688709259033, "global_step": 1193, "epoch": 28} {"train_loss": -2.411341667175293, "global_step": 1194, "epoch": 28} {"train_loss": -2.4794764518737793, "global_step": 1195, "epoch": 28} {"train_loss": -2.4630587100982666, "global_step": 1196, "epoch": 28} {"train_loss": -2.5825629234313965, "global_step": 1197, "epoch": 28} {"train_loss": -2.475090742111206, "global_step": 1198, "epoch": 28} {"train_loss": -2.5312728881835938, "global_step": 1199, "epoch": 28} {"train_loss": -2.5620436668395996, "global_step": 1200, "epoch": 28} {"train_loss": -2.715928316116333, "global_step": 1201, "epoch": 28} {"train_loss": -2.3406918048858643, "global_step": 1202, "epoch": 28} {"train_loss": -2.4918620586395264, "global_step": 1203, "epoch": 28} {"train_loss": -2.5669407844543457, "global_step": 1204, "epoch": 28} {"train_loss": -2.4522202014923096, "global_step": 1205, "epoch": 28} {"train_loss": -2.540191411972046, "global_step": 1206, "epoch": 28} {"train_loss": -2.628448247909546, "global_step": 1207, "epoch": 28} {"train_loss": -2.645287036895752, "global_step": 1208, "epoch": 28} {"train_loss": -2.5110888481140137, "global_step": 1209, "epoch": 28} {"train_loss": -2.4456357955932617, "global_step": 1210, "epoch": 28} {"train_loss": -2.6265206336975098, "global_step": 1211, "epoch": 28} {"train_loss": -2.5660314559936523, "global_step": 1212, "epoch": 28} {"train_loss": -2.5179996490478516, "global_step": 1213, "epoch": 28} {"train_loss": -2.407680034637451, "global_step": 1214, "epoch": 28} {"train_loss": -2.631268262863159, "global_step": 1215, "epoch": 28} {"train_loss": -2.3144803047180176, "global_step": 1216, "epoch": 28} {"train_loss": -2.522061512583778, "global_step": 1217, "epoch": 28, "val_loss": 688067.25} {"train_loss": -2.2480807304382324, "global_step": 1218, "epoch": 29} {"train_loss": -2.3917717933654785, "global_step": 1219, "epoch": 29} {"train_loss": -2.200014114379883, "global_step": 1220, "epoch": 29} {"train_loss": -2.3583714962005615, "global_step": 1221, "epoch": 29} {"train_loss": -2.320535182952881, "global_step": 1222, "epoch": 29} {"train_loss": -2.381657600402832, "global_step": 1223, "epoch": 29} {"train_loss": -2.303586959838867, "global_step": 1224, "epoch": 29} {"train_loss": -2.2281155586242676, "global_step": 1225, "epoch": 29} {"train_loss": -2.412128448486328, "global_step": 1226, "epoch": 29} {"train_loss": -2.4167985916137695, "global_step": 1227, "epoch": 29} {"train_loss": -2.2244338989257812, "global_step": 1228, "epoch": 29} {"train_loss": -2.4852395057678223, "global_step": 1229, "epoch": 29} {"train_loss": -2.3979461193084717, "global_step": 1230, "epoch": 29} {"train_loss": -2.356462240219116, "global_step": 1231, "epoch": 29} {"train_loss": -2.525503635406494, "global_step": 1232, "epoch": 29} {"train_loss": -2.433257579803467, "global_step": 1233, "epoch": 29} {"train_loss": -2.533329963684082, "global_step": 1234, "epoch": 29} {"train_loss": -2.5236005783081055, "global_step": 1235, "epoch": 29} {"train_loss": -2.5037472248077393, "global_step": 1236, "epoch": 29} {"train_loss": -2.3823938369750977, "global_step": 1237, "epoch": 29} {"train_loss": -2.485548973083496, "global_step": 1238, "epoch": 29} {"train_loss": -2.5627858638763428, "global_step": 1239, "epoch": 29} {"train_loss": -2.36476469039917, "global_step": 1240, "epoch": 29} {"train_loss": -2.5482258796691895, "global_step": 1241, "epoch": 29} {"train_loss": -2.6645467281341553, "global_step": 1242, "epoch": 29} {"train_loss": -2.5542187690734863, "global_step": 1243, "epoch": 29} {"train_loss": -2.6845197677612305, "global_step": 1244, "epoch": 29} {"train_loss": -2.549851894378662, "global_step": 1245, "epoch": 29} {"train_loss": -2.618640661239624, "global_step": 1246, "epoch": 29} {"train_loss": -2.582843542098999, "global_step": 1247, "epoch": 29} {"train_loss": -2.567782402038574, "global_step": 1248, "epoch": 29} {"train_loss": -2.608916759490967, "global_step": 1249, "epoch": 29} {"train_loss": -2.5195627212524414, "global_step": 1250, "epoch": 29} {"train_loss": -2.486905574798584, "global_step": 1251, "epoch": 29} {"train_loss": -2.5152828693389893, "global_step": 1252, "epoch": 29} {"train_loss": -2.443418025970459, "global_step": 1253, "epoch": 29} {"train_loss": -2.4824657440185547, "global_step": 1254, "epoch": 29} {"train_loss": -2.327486991882324, "global_step": 1255, "epoch": 29} {"train_loss": -2.5232324600219727, "global_step": 1256, "epoch": 29} {"train_loss": -2.296712875366211, "global_step": 1257, "epoch": 29} {"train_loss": -2.57125186920166, "global_step": 1258, "epoch": 29} {"train_loss": -2.452982715197972, "global_step": 1259, "epoch": 29, "val_loss": 635007.1875} {"train_loss": -2.6256747245788574, "global_step": 1260, "epoch": 30} {"train_loss": -2.3629701137542725, "global_step": 1261, "epoch": 30} {"train_loss": -2.4655349254608154, "global_step": 1262, "epoch": 30} {"train_loss": -2.577476978302002, "global_step": 1263, "epoch": 30} {"train_loss": -2.4269485473632812, "global_step": 1264, "epoch": 30} {"train_loss": -2.553706645965576, "global_step": 1265, "epoch": 30} {"train_loss": -2.376741409301758, "global_step": 1266, "epoch": 30} {"train_loss": -2.574538230895996, "global_step": 1267, "epoch": 30} {"train_loss": -2.522181510925293, "global_step": 1268, "epoch": 30} {"train_loss": -2.4014716148376465, "global_step": 1269, "epoch": 30} {"train_loss": -2.5930838584899902, "global_step": 1270, "epoch": 30} {"train_loss": -2.4337902069091797, "global_step": 1271, "epoch": 30} {"train_loss": -2.58518123626709, "global_step": 1272, "epoch": 30} {"train_loss": -2.585911750793457, "global_step": 1273, "epoch": 30} {"train_loss": -2.5880749225616455, "global_step": 1274, "epoch": 30} {"train_loss": -2.595529794692993, "global_step": 1275, "epoch": 30} {"train_loss": -2.6520233154296875, "global_step": 1276, "epoch": 30} {"train_loss": -2.655785083770752, "global_step": 1277, "epoch": 30} {"train_loss": -2.5609610080718994, "global_step": 1278, "epoch": 30} {"train_loss": -2.614175796508789, "global_step": 1279, "epoch": 30} {"train_loss": -2.565398693084717, "global_step": 1280, "epoch": 30} {"train_loss": -2.633704662322998, "global_step": 1281, "epoch": 30} {"train_loss": -2.6644225120544434, "global_step": 1282, "epoch": 30} {"train_loss": -2.6813137531280518, "global_step": 1283, "epoch": 30} {"train_loss": -2.643167495727539, "global_step": 1284, "epoch": 30} {"train_loss": -2.5791056156158447, "global_step": 1285, "epoch": 30} {"train_loss": -2.6551671028137207, "global_step": 1286, "epoch": 30} {"train_loss": -2.5324840545654297, "global_step": 1287, "epoch": 30} {"train_loss": -2.62223219871521, "global_step": 1288, "epoch": 30} {"train_loss": -2.754640579223633, "global_step": 1289, "epoch": 30} {"train_loss": -2.465217113494873, "global_step": 1290, "epoch": 30} {"train_loss": -2.5906453132629395, "global_step": 1291, "epoch": 30} {"train_loss": -2.713036298751831, "global_step": 1292, "epoch": 30} {"train_loss": -2.52838134765625, "global_step": 1293, "epoch": 30} {"train_loss": -2.5872106552124023, "global_step": 1294, "epoch": 30} {"train_loss": -2.7824039459228516, "global_step": 1295, "epoch": 30} {"train_loss": -2.571298599243164, "global_step": 1296, "epoch": 30} {"train_loss": -2.62322998046875, "global_step": 1297, "epoch": 30} {"train_loss": -2.604541778564453, "global_step": 1298, "epoch": 30} {"train_loss": -2.659768581390381, "global_step": 1299, "epoch": 30} {"train_loss": -2.4501595497131348, "global_step": 1300, "epoch": 30} {"train_loss": -2.5797283365612937, "global_step": 1301, "epoch": 30, "val_loss": 580412.125} {"train_loss": -2.6223068237304688, "global_step": 1302, "epoch": 31} {"train_loss": -2.403402090072632, "global_step": 1303, "epoch": 31} {"train_loss": -2.5939536094665527, "global_step": 1304, "epoch": 31} {"train_loss": -2.450777530670166, "global_step": 1305, "epoch": 31} {"train_loss": -2.6094579696655273, "global_step": 1306, "epoch": 31} {"train_loss": -2.558302402496338, "global_step": 1307, "epoch": 31} {"train_loss": -2.4928579330444336, "global_step": 1308, "epoch": 31} {"train_loss": -2.5968329906463623, "global_step": 1309, "epoch": 31} {"train_loss": -2.671006202697754, "global_step": 1310, "epoch": 31} {"train_loss": -2.5082204341888428, "global_step": 1311, "epoch": 31} {"train_loss": -2.759972095489502, "global_step": 1312, "epoch": 31} {"train_loss": -2.5722286701202393, "global_step": 1313, "epoch": 31} {"train_loss": -2.731992721557617, "global_step": 1314, "epoch": 31} {"train_loss": -2.7152693271636963, "global_step": 1315, "epoch": 31} {"train_loss": -2.6404664516448975, "global_step": 1316, "epoch": 31} {"train_loss": -2.6570916175842285, "global_step": 1317, "epoch": 31} {"train_loss": -2.6233773231506348, "global_step": 1318, "epoch": 31} {"train_loss": -2.760361671447754, "global_step": 1319, "epoch": 31} {"train_loss": -2.8354320526123047, "global_step": 1320, "epoch": 31} {"train_loss": -2.8064355850219727, "global_step": 1321, "epoch": 31} {"train_loss": -2.7842278480529785, "global_step": 1322, "epoch": 31} {"train_loss": -2.6753907203674316, "global_step": 1323, "epoch": 31} {"train_loss": -2.739835023880005, "global_step": 1324, "epoch": 31} {"train_loss": -2.6452345848083496, "global_step": 1325, "epoch": 31} {"train_loss": -2.787541151046753, "global_step": 1326, "epoch": 31} {"train_loss": -2.7464256286621094, "global_step": 1327, "epoch": 31} {"train_loss": -2.688239097595215, "global_step": 1328, "epoch": 31} {"train_loss": -2.4927685260772705, "global_step": 1329, "epoch": 31} {"train_loss": -2.627883195877075, "global_step": 1330, "epoch": 31} {"train_loss": -2.715585231781006, "global_step": 1331, "epoch": 31} {"train_loss": -2.4348297119140625, "global_step": 1332, "epoch": 31} {"train_loss": -2.6384031772613525, "global_step": 1333, "epoch": 31} {"train_loss": -2.62858510017395, "global_step": 1334, "epoch": 31} {"train_loss": -2.7227394580841064, "global_step": 1335, "epoch": 31} {"train_loss": -2.7736563682556152, "global_step": 1336, "epoch": 31} {"train_loss": -2.366243362426758, "global_step": 1337, "epoch": 31} {"train_loss": -2.6922097206115723, "global_step": 1338, "epoch": 31} {"train_loss": -2.378300666809082, "global_step": 1339, "epoch": 31} {"train_loss": -2.6131410598754883, "global_step": 1340, "epoch": 31} {"train_loss": -2.4014272689819336, "global_step": 1341, "epoch": 31} {"train_loss": -2.4391448497772217, "global_step": 1342, "epoch": 31} {"train_loss": -2.6234112126486644, "global_step": 1343, "epoch": 31, "val_loss": 578639.6875} {"train_loss": -2.254378318786621, "global_step": 1344, "epoch": 32} {"train_loss": -2.558379650115967, "global_step": 1345, "epoch": 32} {"train_loss": -2.4403648376464844, "global_step": 1346, "epoch": 32} {"train_loss": -2.5828609466552734, "global_step": 1347, "epoch": 32} {"train_loss": -2.436222553253174, "global_step": 1348, "epoch": 32} {"train_loss": -2.3099522590637207, "global_step": 1349, "epoch": 32} {"train_loss": -2.587985038757324, "global_step": 1350, "epoch": 32} {"train_loss": -2.4512033462524414, "global_step": 1351, "epoch": 32} {"train_loss": -2.4173412322998047, "global_step": 1352, "epoch": 32} {"train_loss": -2.5479912757873535, "global_step": 1353, "epoch": 32} {"train_loss": -2.3965039253234863, "global_step": 1354, "epoch": 32} {"train_loss": -2.5324554443359375, "global_step": 1355, "epoch": 32} {"train_loss": -2.67004656791687, "global_step": 1356, "epoch": 32} {"train_loss": -2.4907422065734863, "global_step": 1357, "epoch": 32} {"train_loss": -2.5827696323394775, "global_step": 1358, "epoch": 32} {"train_loss": -2.6701090335845947, "global_step": 1359, "epoch": 32} {"train_loss": -2.697518825531006, "global_step": 1360, "epoch": 32} {"train_loss": -2.6623172760009766, "global_step": 1361, "epoch": 32} {"train_loss": -2.664613723754883, "global_step": 1362, "epoch": 32} {"train_loss": -2.6568875312805176, "global_step": 1363, "epoch": 32} {"train_loss": -2.6021275520324707, "global_step": 1364, "epoch": 32} {"train_loss": -2.751098155975342, "global_step": 1365, "epoch": 32} {"train_loss": -2.639669418334961, "global_step": 1366, "epoch": 32} {"train_loss": -2.6225943565368652, "global_step": 1367, "epoch": 32} {"train_loss": -2.648663282394409, "global_step": 1368, "epoch": 32} {"train_loss": -2.7204694747924805, "global_step": 1369, "epoch": 32} {"train_loss": -2.722687244415283, "global_step": 1370, "epoch": 32} {"train_loss": -2.896538734436035, "global_step": 1371, "epoch": 32} {"train_loss": -2.5960264205932617, "global_step": 1372, "epoch": 32} {"train_loss": -2.7643165588378906, "global_step": 1373, "epoch": 32} {"train_loss": -2.7694039344787598, "global_step": 1374, "epoch": 32} {"train_loss": -2.567507266998291, "global_step": 1375, "epoch": 32} {"train_loss": -2.7672648429870605, "global_step": 1376, "epoch": 32} {"train_loss": -2.716061592102051, "global_step": 1377, "epoch": 32} {"train_loss": -2.7244722843170166, "global_step": 1378, "epoch": 32} {"train_loss": -2.711059808731079, "global_step": 1379, "epoch": 32} {"train_loss": -2.8226866722106934, "global_step": 1380, "epoch": 32} {"train_loss": -2.6454057693481445, "global_step": 1381, "epoch": 32} {"train_loss": -2.855377674102783, "global_step": 1382, "epoch": 32} {"train_loss": -2.841728925704956, "global_step": 1383, "epoch": 32} {"train_loss": -2.6913511753082275, "global_step": 1384, "epoch": 32} {"train_loss": -2.6308547939573015, "global_step": 1385, "epoch": 32, "val_loss": 517876.4375} {"train_loss": -2.593977451324463, "global_step": 1386, "epoch": 33} {"train_loss": -2.551818370819092, "global_step": 1387, "epoch": 33} {"train_loss": -2.745677947998047, "global_step": 1388, "epoch": 33} {"train_loss": -2.6835777759552, "global_step": 1389, "epoch": 33} {"train_loss": -2.484405517578125, "global_step": 1390, "epoch": 33} {"train_loss": -2.7464749813079834, "global_step": 1391, "epoch": 33} {"train_loss": -2.4022533893585205, "global_step": 1392, "epoch": 33} {"train_loss": -2.7325992584228516, "global_step": 1393, "epoch": 33} {"train_loss": -2.222001075744629, "global_step": 1394, "epoch": 33} {"train_loss": -2.5193357467651367, "global_step": 1395, "epoch": 33} {"train_loss": -2.2464356422424316, "global_step": 1396, "epoch": 33} {"train_loss": -2.4645915031433105, "global_step": 1397, "epoch": 33} {"train_loss": -2.50710391998291, "global_step": 1398, "epoch": 33} {"train_loss": -2.3216423988342285, "global_step": 1399, "epoch": 33} {"train_loss": -2.551100969314575, "global_step": 1400, "epoch": 33} {"train_loss": -2.652863025665283, "global_step": 1401, "epoch": 33} {"train_loss": -2.4645755290985107, "global_step": 1402, "epoch": 33} {"train_loss": -2.639274835586548, "global_step": 1403, "epoch": 33} {"train_loss": -2.658010959625244, "global_step": 1404, "epoch": 33} {"train_loss": -2.4137115478515625, "global_step": 1405, "epoch": 33} {"train_loss": -2.7758233547210693, "global_step": 1406, "epoch": 33} {"train_loss": -2.5269317626953125, "global_step": 1407, "epoch": 33} {"train_loss": -2.7416903972625732, "global_step": 1408, "epoch": 33} {"train_loss": -2.7241907119750977, "global_step": 1409, "epoch": 33} {"train_loss": -2.6724765300750732, "global_step": 1410, "epoch": 33} {"train_loss": -2.698793888092041, "global_step": 1411, "epoch": 33} {"train_loss": -2.7276954650878906, "global_step": 1412, "epoch": 33} {"train_loss": -2.7426276206970215, "global_step": 1413, "epoch": 33} {"train_loss": -2.748384952545166, "global_step": 1414, "epoch": 33} {"train_loss": -2.6347975730895996, "global_step": 1415, "epoch": 33} {"train_loss": -2.8041863441467285, "global_step": 1416, "epoch": 33} {"train_loss": -2.7405593395233154, "global_step": 1417, "epoch": 33} {"train_loss": -2.651766061782837, "global_step": 1418, "epoch": 33} {"train_loss": -2.813077926635742, "global_step": 1419, "epoch": 33} {"train_loss": -2.7905068397521973, "global_step": 1420, "epoch": 33} {"train_loss": -2.759028911590576, "global_step": 1421, "epoch": 33} {"train_loss": -2.7697360515594482, "global_step": 1422, "epoch": 33} {"train_loss": -2.7625558376312256, "global_step": 1423, "epoch": 33} {"train_loss": -2.6554903984069824, "global_step": 1424, "epoch": 33} {"train_loss": -2.874572277069092, "global_step": 1425, "epoch": 33} {"train_loss": -2.7654027938842773, "global_step": 1426, "epoch": 33} {"train_loss": -2.6346353462764194, "global_step": 1427, "epoch": 33, "val_loss": 481259.625} {"train_loss": -2.6564557552337646, "global_step": 1428, "epoch": 34} {"train_loss": -2.794220447540283, "global_step": 1429, "epoch": 34} {"train_loss": -2.879425287246704, "global_step": 1430, "epoch": 34} {"train_loss": -2.8403525352478027, "global_step": 1431, "epoch": 34} {"train_loss": -2.748910427093506, "global_step": 1432, "epoch": 34} {"train_loss": -2.820248603820801, "global_step": 1433, "epoch": 34} {"train_loss": -2.7738819122314453, "global_step": 1434, "epoch": 34} {"train_loss": -2.788472890853882, "global_step": 1435, "epoch": 34} {"train_loss": -2.792168140411377, "global_step": 1436, "epoch": 34} {"train_loss": -2.7741622924804688, "global_step": 1437, "epoch": 34} {"train_loss": -2.690678834915161, "global_step": 1438, "epoch": 34} {"train_loss": -2.8405466079711914, "global_step": 1439, "epoch": 34} {"train_loss": -2.8579611778259277, "global_step": 1440, "epoch": 34} {"train_loss": -2.598433017730713, "global_step": 1441, "epoch": 34} {"train_loss": -2.848381996154785, "global_step": 1442, "epoch": 34} {"train_loss": -2.421971082687378, "global_step": 1443, "epoch": 34} {"train_loss": -2.8891055583953857, "global_step": 1444, "epoch": 34} {"train_loss": -2.313666343688965, "global_step": 1445, "epoch": 34} {"train_loss": -2.713468074798584, "global_step": 1446, "epoch": 34} {"train_loss": -2.1449942588806152, "global_step": 1447, "epoch": 34} {"train_loss": -2.6765823364257812, "global_step": 1448, "epoch": 34} {"train_loss": -2.2268428802490234, "global_step": 1449, "epoch": 34} {"train_loss": -2.2064590454101562, "global_step": 1450, "epoch": 34} {"train_loss": -2.4647908210754395, "global_step": 1451, "epoch": 34} {"train_loss": -2.5414998531341553, "global_step": 1452, "epoch": 34} {"train_loss": -2.585825204849243, "global_step": 1453, "epoch": 34} {"train_loss": -2.6942782402038574, "global_step": 1454, "epoch": 34} {"train_loss": -2.6010396480560303, "global_step": 1455, "epoch": 34} {"train_loss": -2.5838305950164795, "global_step": 1456, "epoch": 34} {"train_loss": -2.6777098178863525, "global_step": 1457, "epoch": 34} {"train_loss": -2.5840423107147217, "global_step": 1458, "epoch": 34} {"train_loss": -2.747936725616455, "global_step": 1459, "epoch": 34} {"train_loss": -2.6609673500061035, "global_step": 1460, "epoch": 34} {"train_loss": -2.7619738578796387, "global_step": 1461, "epoch": 34} {"train_loss": -2.789638042449951, "global_step": 1462, "epoch": 34} {"train_loss": -2.6677093505859375, "global_step": 1463, "epoch": 34} {"train_loss": -2.7571001052856445, "global_step": 1464, "epoch": 34} {"train_loss": -2.7294583320617676, "global_step": 1465, "epoch": 34} {"train_loss": -2.697645664215088, "global_step": 1466, "epoch": 34} {"train_loss": -2.752523183822632, "global_step": 1467, "epoch": 34} {"train_loss": -2.704193115234375, "global_step": 1468, "epoch": 34} {"train_loss": -2.665498966262454, "global_step": 1469, "epoch": 34, "val_loss": 448039.3125} {"train_loss": -2.927730083465576, "global_step": 1470, "epoch": 35} {"train_loss": -2.814061164855957, "global_step": 1471, "epoch": 35} {"train_loss": -2.886404037475586, "global_step": 1472, "epoch": 35} {"train_loss": -2.6910712718963623, "global_step": 1473, "epoch": 35} {"train_loss": -2.8150854110717773, "global_step": 1474, "epoch": 35} {"train_loss": -2.8026480674743652, "global_step": 1475, "epoch": 35} {"train_loss": -2.9618868827819824, "global_step": 1476, "epoch": 35} {"train_loss": -2.8566980361938477, "global_step": 1477, "epoch": 35} {"train_loss": -2.6363940238952637, "global_step": 1478, "epoch": 35} {"train_loss": -2.7913424968719482, "global_step": 1479, "epoch": 35} {"train_loss": -2.73812198638916, "global_step": 1480, "epoch": 35} {"train_loss": -2.8398430347442627, "global_step": 1481, "epoch": 35} {"train_loss": -2.8250670433044434, "global_step": 1482, "epoch": 35} {"train_loss": -2.866532802581787, "global_step": 1483, "epoch": 35} {"train_loss": -2.6128063201904297, "global_step": 1484, "epoch": 35} {"train_loss": -2.857548952102661, "global_step": 1485, "epoch": 35} {"train_loss": -2.5441651344299316, "global_step": 1486, "epoch": 35} {"train_loss": -2.742724895477295, "global_step": 1487, "epoch": 35} {"train_loss": -2.85178279876709, "global_step": 1488, "epoch": 35} {"train_loss": -2.725759267807007, "global_step": 1489, "epoch": 35} {"train_loss": -2.816985845565796, "global_step": 1490, "epoch": 35} {"train_loss": -2.8138933181762695, "global_step": 1491, "epoch": 35} {"train_loss": -2.799814224243164, "global_step": 1492, "epoch": 35} {"train_loss": -2.7823495864868164, "global_step": 1493, "epoch": 35} {"train_loss": -2.7580480575561523, "global_step": 1494, "epoch": 35} {"train_loss": -2.879918098449707, "global_step": 1495, "epoch": 35} {"train_loss": -2.656468152999878, "global_step": 1496, "epoch": 35} {"train_loss": -2.763774871826172, "global_step": 1497, "epoch": 35} {"train_loss": -2.833651065826416, "global_step": 1498, "epoch": 35} {"train_loss": -2.8056020736694336, "global_step": 1499, "epoch": 35} {"train_loss": -2.782532215118408, "global_step": 1500, "epoch": 35} {"train_loss": -2.763629913330078, "global_step": 1501, "epoch": 35} {"train_loss": -2.825589418411255, "global_step": 1502, "epoch": 35} {"train_loss": -2.68048095703125, "global_step": 1503, "epoch": 35} {"train_loss": -2.8179068565368652, "global_step": 1504, "epoch": 35} {"train_loss": -2.7570042610168457, "global_step": 1505, "epoch": 35} {"train_loss": -2.9029388427734375, "global_step": 1506, "epoch": 35} {"train_loss": -2.827333450317383, "global_step": 1507, "epoch": 35} {"train_loss": -2.725621461868286, "global_step": 1508, "epoch": 35} {"train_loss": -2.805858850479126, "global_step": 1509, "epoch": 35} {"train_loss": -2.857769250869751, "global_step": 1510, "epoch": 35} {"train_loss": -2.7928349404107955, "global_step": 1511, "epoch": 35, "val_loss": 419274.0625} {"train_loss": -2.885606050491333, "global_step": 1512, "epoch": 36} {"train_loss": -2.87013578414917, "global_step": 1513, "epoch": 36} {"train_loss": -2.7854971885681152, "global_step": 1514, "epoch": 36} {"train_loss": -2.873500108718872, "global_step": 1515, "epoch": 36} {"train_loss": -2.9133591651916504, "global_step": 1516, "epoch": 36} {"train_loss": -2.8051204681396484, "global_step": 1517, "epoch": 36} {"train_loss": -2.8614883422851562, "global_step": 1518, "epoch": 36} {"train_loss": -2.877488851547241, "global_step": 1519, "epoch": 36} {"train_loss": -2.8343539237976074, "global_step": 1520, "epoch": 36} {"train_loss": -2.9819087982177734, "global_step": 1521, "epoch": 36} {"train_loss": -2.884366989135742, "global_step": 1522, "epoch": 36} {"train_loss": -2.890094041824341, "global_step": 1523, "epoch": 36} {"train_loss": -2.8581504821777344, "global_step": 1524, "epoch": 36} {"train_loss": -2.866464376449585, "global_step": 1525, "epoch": 36} {"train_loss": -2.9281749725341797, "global_step": 1526, "epoch": 36} {"train_loss": -2.9194655418395996, "global_step": 1527, "epoch": 36} {"train_loss": -2.799907684326172, "global_step": 1528, "epoch": 36} {"train_loss": -2.9096641540527344, "global_step": 1529, "epoch": 36} {"train_loss": -3.027325391769409, "global_step": 1530, "epoch": 36} {"train_loss": -2.826904296875, "global_step": 1531, "epoch": 36} {"train_loss": -2.8194427490234375, "global_step": 1532, "epoch": 36} {"train_loss": -2.8735764026641846, "global_step": 1533, "epoch": 36} {"train_loss": -2.843003511428833, "global_step": 1534, "epoch": 36} {"train_loss": -2.9410228729248047, "global_step": 1535, "epoch": 36} {"train_loss": -2.747953176498413, "global_step": 1536, "epoch": 36} {"train_loss": -2.9822285175323486, "global_step": 1537, "epoch": 36} {"train_loss": -2.712897539138794, "global_step": 1538, "epoch": 36} {"train_loss": -2.859370470046997, "global_step": 1539, "epoch": 36} {"train_loss": -2.9342048168182373, "global_step": 1540, "epoch": 36} {"train_loss": -2.9480514526367188, "global_step": 1541, "epoch": 36} {"train_loss": -2.8893823623657227, "global_step": 1542, "epoch": 36} {"train_loss": -2.8096208572387695, "global_step": 1543, "epoch": 36} {"train_loss": -2.893467903137207, "global_step": 1544, "epoch": 36} {"train_loss": -2.867426633834839, "global_step": 1545, "epoch": 36} {"train_loss": -3.0123343467712402, "global_step": 1546, "epoch": 36} {"train_loss": -2.882899761199951, "global_step": 1547, "epoch": 36} {"train_loss": -2.9660463333129883, "global_step": 1548, "epoch": 36} {"train_loss": -2.968647003173828, "global_step": 1549, "epoch": 36} {"train_loss": -2.792393445968628, "global_step": 1550, "epoch": 36} {"train_loss": -2.925586700439453, "global_step": 1551, "epoch": 36} {"train_loss": -2.7826573848724365, "global_step": 1552, "epoch": 36} {"train_loss": -2.8813615242640176, "global_step": 1553, "epoch": 36, "val_loss": 375685.8125} {"train_loss": -2.983888626098633, "global_step": 1554, "epoch": 37} {"train_loss": -2.9154536724090576, "global_step": 1555, "epoch": 37} {"train_loss": -3.0588855743408203, "global_step": 1556, "epoch": 37} {"train_loss": -2.9375619888305664, "global_step": 1557, "epoch": 37} {"train_loss": -2.914923667907715, "global_step": 1558, "epoch": 37} {"train_loss": -2.997019052505493, "global_step": 1559, "epoch": 37} {"train_loss": -2.7711973190307617, "global_step": 1560, "epoch": 37} {"train_loss": -2.978652000427246, "global_step": 1561, "epoch": 37} {"train_loss": -2.826702833175659, "global_step": 1562, "epoch": 37} {"train_loss": -2.873023748397827, "global_step": 1563, "epoch": 37} {"train_loss": -2.9055752754211426, "global_step": 1564, "epoch": 37} {"train_loss": -2.901294231414795, "global_step": 1565, "epoch": 37} {"train_loss": -2.7873971462249756, "global_step": 1566, "epoch": 37} {"train_loss": -2.9475135803222656, "global_step": 1567, "epoch": 37} {"train_loss": -2.9496631622314453, "global_step": 1568, "epoch": 37} {"train_loss": -2.968411922454834, "global_step": 1569, "epoch": 37} {"train_loss": -3.005866050720215, "global_step": 1570, "epoch": 37} {"train_loss": -2.9562597274780273, "global_step": 1571, "epoch": 37} {"train_loss": -3.0041215419769287, "global_step": 1572, "epoch": 37} {"train_loss": -3.046691417694092, "global_step": 1573, "epoch": 37} {"train_loss": -2.948427438735962, "global_step": 1574, "epoch": 37} {"train_loss": -2.8921773433685303, "global_step": 1575, "epoch": 37} {"train_loss": -3.0869574546813965, "global_step": 1576, "epoch": 37} {"train_loss": -2.9688363075256348, "global_step": 1577, "epoch": 37} {"train_loss": -2.9611287117004395, "global_step": 1578, "epoch": 37} {"train_loss": -3.0281426906585693, "global_step": 1579, "epoch": 37} {"train_loss": -2.874314785003662, "global_step": 1580, "epoch": 37} {"train_loss": -2.8181583881378174, "global_step": 1581, "epoch": 37} {"train_loss": -2.981196165084839, "global_step": 1582, "epoch": 37} {"train_loss": -2.8491272926330566, "global_step": 1583, "epoch": 37} {"train_loss": -2.8766894340515137, "global_step": 1584, "epoch": 37} {"train_loss": -2.9463863372802734, "global_step": 1585, "epoch": 37} {"train_loss": -2.9142844676971436, "global_step": 1586, "epoch": 37} {"train_loss": -2.9874119758605957, "global_step": 1587, "epoch": 37} {"train_loss": -2.9383740425109863, "global_step": 1588, "epoch": 37} {"train_loss": -2.8682563304901123, "global_step": 1589, "epoch": 37} {"train_loss": -2.939791202545166, "global_step": 1590, "epoch": 37} {"train_loss": -2.8877437114715576, "global_step": 1591, "epoch": 37} {"train_loss": -2.8699421882629395, "global_step": 1592, "epoch": 37} {"train_loss": -2.837228298187256, "global_step": 1593, "epoch": 37} {"train_loss": -2.8968892097473145, "global_step": 1594, "epoch": 37} {"train_loss": -2.9274358408791676, "global_step": 1595, "epoch": 37, "val_loss": 350969.03125} {"train_loss": -3.049049139022827, "global_step": 1596, "epoch": 38} {"train_loss": -2.9634358882904053, "global_step": 1597, "epoch": 38} {"train_loss": -3.062750816345215, "global_step": 1598, "epoch": 38} {"train_loss": -2.9347774982452393, "global_step": 1599, "epoch": 38} {"train_loss": -2.9924774169921875, "global_step": 1600, "epoch": 38} {"train_loss": -2.939887523651123, "global_step": 1601, "epoch": 38} {"train_loss": -2.9466285705566406, "global_step": 1602, "epoch": 38} {"train_loss": -2.963724374771118, "global_step": 1603, "epoch": 38} {"train_loss": -3.11553955078125, "global_step": 1604, "epoch": 38} {"train_loss": -3.144257068634033, "global_step": 1605, "epoch": 38} {"train_loss": -2.9200758934020996, "global_step": 1606, "epoch": 38} {"train_loss": -2.968787670135498, "global_step": 1607, "epoch": 38} {"train_loss": -3.0819921493530273, "global_step": 1608, "epoch": 38} {"train_loss": -2.886833906173706, "global_step": 1609, "epoch": 38} {"train_loss": -2.9479525089263916, "global_step": 1610, "epoch": 38} {"train_loss": -3.0306670665740967, "global_step": 1611, "epoch": 38} {"train_loss": -2.8758583068847656, "global_step": 1612, "epoch": 38} {"train_loss": -3.073988199234009, "global_step": 1613, "epoch": 38} {"train_loss": -2.6810078620910645, "global_step": 1614, "epoch": 38} {"train_loss": -2.9849958419799805, "global_step": 1615, "epoch": 38} {"train_loss": -2.87911319732666, "global_step": 1616, "epoch": 38} {"train_loss": -2.7948837280273438, "global_step": 1617, "epoch": 38} {"train_loss": -3.0285677909851074, "global_step": 1618, "epoch": 38} {"train_loss": -2.622339963912964, "global_step": 1619, "epoch": 38} {"train_loss": -2.9019317626953125, "global_step": 1620, "epoch": 38} {"train_loss": -2.6964359283447266, "global_step": 1621, "epoch": 38} {"train_loss": -2.6709399223327637, "global_step": 1622, "epoch": 38} {"train_loss": -2.8801474571228027, "global_step": 1623, "epoch": 38} {"train_loss": -2.8215298652648926, "global_step": 1624, "epoch": 38} {"train_loss": -2.8461008071899414, "global_step": 1625, "epoch": 38} {"train_loss": -2.801011085510254, "global_step": 1626, "epoch": 38} {"train_loss": -3.074497699737549, "global_step": 1627, "epoch": 38} {"train_loss": -2.7285470962524414, "global_step": 1628, "epoch": 38} {"train_loss": -2.9185051918029785, "global_step": 1629, "epoch": 38} {"train_loss": -2.894859790802002, "global_step": 1630, "epoch": 38} {"train_loss": -2.994337797164917, "global_step": 1631, "epoch": 38} {"train_loss": -2.9738974571228027, "global_step": 1632, "epoch": 38} {"train_loss": -2.9753475189208984, "global_step": 1633, "epoch": 38} {"train_loss": -2.8574352264404297, "global_step": 1634, "epoch": 38} {"train_loss": -2.974754810333252, "global_step": 1635, "epoch": 38} {"train_loss": -2.889193058013916, "global_step": 1636, "epoch": 38} {"train_loss": -2.921401710737319, "global_step": 1637, "epoch": 38, "val_loss": 316374.25} {"train_loss": -2.97507905960083, "global_step": 1638, "epoch": 39} {"train_loss": -2.918732166290283, "global_step": 1639, "epoch": 39} {"train_loss": -3.091766834259033, "global_step": 1640, "epoch": 39} {"train_loss": -2.996267557144165, "global_step": 1641, "epoch": 39} {"train_loss": -3.073293924331665, "global_step": 1642, "epoch": 39} {"train_loss": -2.971240282058716, "global_step": 1643, "epoch": 39} {"train_loss": -3.0822079181671143, "global_step": 1644, "epoch": 39} {"train_loss": -3.164930820465088, "global_step": 1645, "epoch": 39} {"train_loss": -2.9417693614959717, "global_step": 1646, "epoch": 39} {"train_loss": -3.06504225730896, "global_step": 1647, "epoch": 39} {"train_loss": -2.9984872341156006, "global_step": 1648, "epoch": 39} {"train_loss": -3.1562812328338623, "global_step": 1649, "epoch": 39} {"train_loss": -2.8909385204315186, "global_step": 1650, "epoch": 39} {"train_loss": -2.9654369354248047, "global_step": 1651, "epoch": 39} {"train_loss": -3.1665172576904297, "global_step": 1652, "epoch": 39} {"train_loss": -3.132800579071045, "global_step": 1653, "epoch": 39} {"train_loss": -2.8609182834625244, "global_step": 1654, "epoch": 39} {"train_loss": -2.9807510375976562, "global_step": 1655, "epoch": 39} {"train_loss": -2.8497531414031982, "global_step": 1656, "epoch": 39} {"train_loss": -3.047333240509033, "global_step": 1657, "epoch": 39} {"train_loss": -2.9445436000823975, "global_step": 1658, "epoch": 39} {"train_loss": -2.944430351257324, "global_step": 1659, "epoch": 39} {"train_loss": -3.0241246223449707, "global_step": 1660, "epoch": 39} {"train_loss": -2.739410400390625, "global_step": 1661, "epoch": 39} {"train_loss": -2.9812583923339844, "global_step": 1662, "epoch": 39} {"train_loss": -2.8902385234832764, "global_step": 1663, "epoch": 39} {"train_loss": -3.0174665451049805, "global_step": 1664, "epoch": 39} {"train_loss": -2.851210117340088, "global_step": 1665, "epoch": 39} {"train_loss": -2.9519519805908203, "global_step": 1666, "epoch": 39} {"train_loss": -2.820915937423706, "global_step": 1667, "epoch": 39} {"train_loss": -3.0002455711364746, "global_step": 1668, "epoch": 39} {"train_loss": -2.881749153137207, "global_step": 1669, "epoch": 39} {"train_loss": -3.150860548019409, "global_step": 1670, "epoch": 39} {"train_loss": -2.894721031188965, "global_step": 1671, "epoch": 39} {"train_loss": -2.972904682159424, "global_step": 1672, "epoch": 39} {"train_loss": -3.122084379196167, "global_step": 1673, "epoch": 39} {"train_loss": -3.047985553741455, "global_step": 1674, "epoch": 39} {"train_loss": -3.075594425201416, "global_step": 1675, "epoch": 39} {"train_loss": -3.0610694885253906, "global_step": 1676, "epoch": 39} {"train_loss": -3.0495810508728027, "global_step": 1677, "epoch": 39} {"train_loss": -2.846090793609619, "global_step": 1678, "epoch": 39} {"train_loss": -2.9893429960523332, "global_step": 1679, "epoch": 39, "val_loss": 304607.96875} {"train_loss": -3.1009325981140137, "global_step": 1680, "epoch": 40} {"train_loss": -2.917801856994629, "global_step": 1681, "epoch": 40} {"train_loss": -3.025327205657959, "global_step": 1682, "epoch": 40} {"train_loss": -3.1070735454559326, "global_step": 1683, "epoch": 40} {"train_loss": -2.896871328353882, "global_step": 1684, "epoch": 40} {"train_loss": -3.035515785217285, "global_step": 1685, "epoch": 40} {"train_loss": -2.810471534729004, "global_step": 1686, "epoch": 40} {"train_loss": -2.906177043914795, "global_step": 1687, "epoch": 40} {"train_loss": -3.063528060913086, "global_step": 1688, "epoch": 40} {"train_loss": -3.0241715908050537, "global_step": 1689, "epoch": 40} {"train_loss": -3.147883415222168, "global_step": 1690, "epoch": 40} {"train_loss": -3.1332201957702637, "global_step": 1691, "epoch": 40} {"train_loss": -3.0428168773651123, "global_step": 1692, "epoch": 40} {"train_loss": -3.102860927581787, "global_step": 1693, "epoch": 40} {"train_loss": -2.9803411960601807, "global_step": 1694, "epoch": 40} {"train_loss": -3.053196430206299, "global_step": 1695, "epoch": 40} {"train_loss": -3.144707679748535, "global_step": 1696, "epoch": 40} {"train_loss": -2.941166400909424, "global_step": 1697, "epoch": 40} {"train_loss": -3.0566396713256836, "global_step": 1698, "epoch": 40} {"train_loss": -3.0726265907287598, "global_step": 1699, "epoch": 40} {"train_loss": -3.117312431335449, "global_step": 1700, "epoch": 40} {"train_loss": -3.0252084732055664, "global_step": 1701, "epoch": 40} {"train_loss": -3.093614339828491, "global_step": 1702, "epoch": 40} {"train_loss": -3.09307861328125, "global_step": 1703, "epoch": 40} {"train_loss": -3.1369307041168213, "global_step": 1704, "epoch": 40} {"train_loss": -3.0395517349243164, "global_step": 1705, "epoch": 40} {"train_loss": -3.082395315170288, "global_step": 1706, "epoch": 40} {"train_loss": -3.13810658454895, "global_step": 1707, "epoch": 40} {"train_loss": -3.0554261207580566, "global_step": 1708, "epoch": 40} {"train_loss": -3.051698684692383, "global_step": 1709, "epoch": 40} {"train_loss": -3.1036159992218018, "global_step": 1710, "epoch": 40} {"train_loss": -3.14148211479187, "global_step": 1711, "epoch": 40} {"train_loss": -3.0365359783172607, "global_step": 1712, "epoch": 40} {"train_loss": -3.166672945022583, "global_step": 1713, "epoch": 40} {"train_loss": -3.0320334434509277, "global_step": 1714, "epoch": 40} {"train_loss": -3.015854597091675, "global_step": 1715, "epoch": 40} {"train_loss": -3.076231002807617, "global_step": 1716, "epoch": 40} {"train_loss": -3.001455783843994, "global_step": 1717, "epoch": 40} {"train_loss": -2.980184555053711, "global_step": 1718, "epoch": 40} {"train_loss": -3.0557565689086914, "global_step": 1719, "epoch": 40} {"train_loss": -3.156877279281616, "global_step": 1720, "epoch": 40} {"train_loss": -3.0539912382761636, "global_step": 1721, "epoch": 40, "val_loss": 290714.15625} {"train_loss": -3.005424976348877, "global_step": 1722, "epoch": 41} {"train_loss": -3.068819522857666, "global_step": 1723, "epoch": 41} {"train_loss": -3.194004535675049, "global_step": 1724, "epoch": 41} {"train_loss": -3.039351224899292, "global_step": 1725, "epoch": 41} {"train_loss": -3.2418370246887207, "global_step": 1726, "epoch": 41} {"train_loss": -3.0367789268493652, "global_step": 1727, "epoch": 41} {"train_loss": -3.1092424392700195, "global_step": 1728, "epoch": 41} {"train_loss": -3.185576915740967, "global_step": 1729, "epoch": 41} {"train_loss": -3.1724114418029785, "global_step": 1730, "epoch": 41} {"train_loss": -3.152090311050415, "global_step": 1731, "epoch": 41} {"train_loss": -2.969216823577881, "global_step": 1732, "epoch": 41} {"train_loss": -3.1305289268493652, "global_step": 1733, "epoch": 41} {"train_loss": -3.099886417388916, "global_step": 1734, "epoch": 41} {"train_loss": -3.2610952854156494, "global_step": 1735, "epoch": 41} {"train_loss": -3.2564518451690674, "global_step": 1736, "epoch": 41} {"train_loss": -3.035135269165039, "global_step": 1737, "epoch": 41} {"train_loss": -3.2304067611694336, "global_step": 1738, "epoch": 41} {"train_loss": -3.1427040100097656, "global_step": 1739, "epoch": 41} {"train_loss": -3.0404090881347656, "global_step": 1740, "epoch": 41} {"train_loss": -3.24191951751709, "global_step": 1741, "epoch": 41} {"train_loss": -3.0330452919006348, "global_step": 1742, "epoch": 41} {"train_loss": -3.036979913711548, "global_step": 1743, "epoch": 41} {"train_loss": -3.2195708751678467, "global_step": 1744, "epoch": 41} {"train_loss": -3.2292723655700684, "global_step": 1745, "epoch": 41} {"train_loss": -3.045361042022705, "global_step": 1746, "epoch": 41} {"train_loss": -3.1632397174835205, "global_step": 1747, "epoch": 41} {"train_loss": -3.063839912414551, "global_step": 1748, "epoch": 41} {"train_loss": -3.1624245643615723, "global_step": 1749, "epoch": 41} {"train_loss": -3.0008511543273926, "global_step": 1750, "epoch": 41} {"train_loss": -3.099789619445801, "global_step": 1751, "epoch": 41} {"train_loss": -3.089344024658203, "global_step": 1752, "epoch": 41} {"train_loss": -2.9628517627716064, "global_step": 1753, "epoch": 41} {"train_loss": -3.1317145824432373, "global_step": 1754, "epoch": 41} {"train_loss": -3.2104315757751465, "global_step": 1755, "epoch": 41} {"train_loss": -3.177206516265869, "global_step": 1756, "epoch": 41} {"train_loss": -3.0890233516693115, "global_step": 1757, "epoch": 41} {"train_loss": -3.015028953552246, "global_step": 1758, "epoch": 41} {"train_loss": -3.1799468994140625, "global_step": 1759, "epoch": 41} {"train_loss": -3.141725778579712, "global_step": 1760, "epoch": 41} {"train_loss": -3.075617790222168, "global_step": 1761, "epoch": 41} {"train_loss": -3.160172462463379, "global_step": 1762, "epoch": 41} {"train_loss": -3.119730302265712, "global_step": 1763, "epoch": 41, "val_loss": 296935.78125} {"train_loss": -3.1804237365722656, "global_step": 1764, "epoch": 42} {"train_loss": -3.0243773460388184, "global_step": 1765, "epoch": 42} {"train_loss": -3.1281380653381348, "global_step": 1766, "epoch": 42} {"train_loss": -3.1067545413970947, "global_step": 1767, "epoch": 42} {"train_loss": -3.1897411346435547, "global_step": 1768, "epoch": 42} {"train_loss": -3.16874623298645, "global_step": 1769, "epoch": 42} {"train_loss": -3.0393614768981934, "global_step": 1770, "epoch": 42} {"train_loss": -3.0755257606506348, "global_step": 1771, "epoch": 42} {"train_loss": -3.0201151371002197, "global_step": 1772, "epoch": 42} {"train_loss": -3.143616199493408, "global_step": 1773, "epoch": 42} {"train_loss": -2.981268882751465, "global_step": 1774, "epoch": 42} {"train_loss": -3.1464390754699707, "global_step": 1775, "epoch": 42} {"train_loss": -3.097538471221924, "global_step": 1776, "epoch": 42} {"train_loss": -3.0237154960632324, "global_step": 1777, "epoch": 42} {"train_loss": -3.243669271469116, "global_step": 1778, "epoch": 42} {"train_loss": -2.8722944259643555, "global_step": 1779, "epoch": 42} {"train_loss": -3.0805373191833496, "global_step": 1780, "epoch": 42} {"train_loss": -2.827180862426758, "global_step": 1781, "epoch": 42} {"train_loss": -3.130328893661499, "global_step": 1782, "epoch": 42} {"train_loss": -2.821772575378418, "global_step": 1783, "epoch": 42} {"train_loss": -2.999133586883545, "global_step": 1784, "epoch": 42} {"train_loss": -2.9012129306793213, "global_step": 1785, "epoch": 42} {"train_loss": -3.1783671379089355, "global_step": 1786, "epoch": 42} {"train_loss": -3.0334339141845703, "global_step": 1787, "epoch": 42} {"train_loss": -3.1990416049957275, "global_step": 1788, "epoch": 42} {"train_loss": -2.9006476402282715, "global_step": 1789, "epoch": 42} {"train_loss": -3.164918899536133, "global_step": 1790, "epoch": 42} {"train_loss": -2.8892898559570312, "global_step": 1791, "epoch": 42} {"train_loss": -3.0898356437683105, "global_step": 1792, "epoch": 42} {"train_loss": -3.1876654624938965, "global_step": 1793, "epoch": 42} {"train_loss": -3.0821282863616943, "global_step": 1794, "epoch": 42} {"train_loss": -3.127546787261963, "global_step": 1795, "epoch": 42} {"train_loss": -3.080348014831543, "global_step": 1796, "epoch": 42} {"train_loss": -3.0509984493255615, "global_step": 1797, "epoch": 42} {"train_loss": -3.0931854248046875, "global_step": 1798, "epoch": 42} {"train_loss": -3.2094104290008545, "global_step": 1799, "epoch": 42} {"train_loss": -3.1322498321533203, "global_step": 1800, "epoch": 42} {"train_loss": -3.0977962017059326, "global_step": 1801, "epoch": 42} {"train_loss": -3.1182875633239746, "global_step": 1802, "epoch": 42} {"train_loss": -3.2060046195983887, "global_step": 1803, "epoch": 42} {"train_loss": -3.0127835273742676, "global_step": 1804, "epoch": 42} {"train_loss": -3.0793299958819436, "global_step": 1805, "epoch": 42, "val_loss": 278986.40625} {"train_loss": -3.220881938934326, "global_step": 1806, "epoch": 43} {"train_loss": -3.0909199714660645, "global_step": 1807, "epoch": 43} {"train_loss": -3.1701979637145996, "global_step": 1808, "epoch": 43} {"train_loss": -3.1426472663879395, "global_step": 1809, "epoch": 43} {"train_loss": -3.1746504306793213, "global_step": 1810, "epoch": 43} {"train_loss": -3.100374221801758, "global_step": 1811, "epoch": 43} {"train_loss": -3.0617613792419434, "global_step": 1812, "epoch": 43} {"train_loss": -3.2082059383392334, "global_step": 1813, "epoch": 43} {"train_loss": -3.0512373447418213, "global_step": 1814, "epoch": 43} {"train_loss": -3.0939903259277344, "global_step": 1815, "epoch": 43} {"train_loss": -3.214777708053589, "global_step": 1816, "epoch": 43} {"train_loss": -3.1367805004119873, "global_step": 1817, "epoch": 43} {"train_loss": -3.0710067749023438, "global_step": 1818, "epoch": 43} {"train_loss": -3.1903269290924072, "global_step": 1819, "epoch": 43} {"train_loss": -3.0930967330932617, "global_step": 1820, "epoch": 43} {"train_loss": -3.2195754051208496, "global_step": 1821, "epoch": 43} {"train_loss": -3.1349668502807617, "global_step": 1822, "epoch": 43} {"train_loss": -3.1182682514190674, "global_step": 1823, "epoch": 43} {"train_loss": -3.2089123725891113, "global_step": 1824, "epoch": 43} {"train_loss": -3.1962037086486816, "global_step": 1825, "epoch": 43} {"train_loss": -3.1597609519958496, "global_step": 1826, "epoch": 43} {"train_loss": -3.2604470252990723, "global_step": 1827, "epoch": 43} {"train_loss": -3.127941131591797, "global_step": 1828, "epoch": 43} {"train_loss": -3.2088992595672607, "global_step": 1829, "epoch": 43} {"train_loss": -3.1660027503967285, "global_step": 1830, "epoch": 43} {"train_loss": -3.1756997108459473, "global_step": 1831, "epoch": 43} {"train_loss": -3.192389488220215, "global_step": 1832, "epoch": 43} {"train_loss": -3.230987071990967, "global_step": 1833, "epoch": 43} {"train_loss": -3.2092156410217285, "global_step": 1834, "epoch": 43} {"train_loss": -3.055935859680176, "global_step": 1835, "epoch": 43} {"train_loss": -3.2841572761535645, "global_step": 1836, "epoch": 43} {"train_loss": -3.235980987548828, "global_step": 1837, "epoch": 43} {"train_loss": -3.1686933040618896, "global_step": 1838, "epoch": 43} {"train_loss": -3.3137474060058594, "global_step": 1839, "epoch": 43} {"train_loss": -3.24788236618042, "global_step": 1840, "epoch": 43} {"train_loss": -3.1324892044067383, "global_step": 1841, "epoch": 43} {"train_loss": -3.2277121543884277, "global_step": 1842, "epoch": 43} {"train_loss": -3.1725001335144043, "global_step": 1843, "epoch": 43} {"train_loss": -3.1473875045776367, "global_step": 1844, "epoch": 43} {"train_loss": -3.0760703086853027, "global_step": 1845, "epoch": 43} {"train_loss": -3.1269278526306152, "global_step": 1846, "epoch": 43} {"train_loss": -3.164785856292361, "global_step": 1847, "epoch": 43, "val_loss": 278865.84375} {"train_loss": -2.9795913696289062, "global_step": 1848, "epoch": 44} {"train_loss": -3.18830943107605, "global_step": 1849, "epoch": 44} {"train_loss": -2.772616386413574, "global_step": 1850, "epoch": 44} {"train_loss": -2.99019193649292, "global_step": 1851, "epoch": 44} {"train_loss": -2.731666088104248, "global_step": 1852, "epoch": 44} {"train_loss": -3.253117799758911, "global_step": 1853, "epoch": 44} {"train_loss": -2.9956459999084473, "global_step": 1854, "epoch": 44} {"train_loss": -2.9602155685424805, "global_step": 1855, "epoch": 44} {"train_loss": -2.9844553470611572, "global_step": 1856, "epoch": 44} {"train_loss": -3.1347713470458984, "global_step": 1857, "epoch": 44} {"train_loss": -3.0986976623535156, "global_step": 1858, "epoch": 44} {"train_loss": -3.171621799468994, "global_step": 1859, "epoch": 44} {"train_loss": -3.0131072998046875, "global_step": 1860, "epoch": 44} {"train_loss": -3.262984275817871, "global_step": 1861, "epoch": 44} {"train_loss": -3.153656482696533, "global_step": 1862, "epoch": 44} {"train_loss": -3.1259632110595703, "global_step": 1863, "epoch": 44} {"train_loss": -3.1793012619018555, "global_step": 1864, "epoch": 44} {"train_loss": -3.2084903717041016, "global_step": 1865, "epoch": 44} {"train_loss": -3.1682491302490234, "global_step": 1866, "epoch": 44} {"train_loss": -3.153012275695801, "global_step": 1867, "epoch": 44} {"train_loss": -3.218390941619873, "global_step": 1868, "epoch": 44} {"train_loss": -3.209989309310913, "global_step": 1869, "epoch": 44} {"train_loss": -3.157042980194092, "global_step": 1870, "epoch": 44} {"train_loss": -3.139646530151367, "global_step": 1871, "epoch": 44} {"train_loss": -3.2962307929992676, "global_step": 1872, "epoch": 44} {"train_loss": -3.2751457691192627, "global_step": 1873, "epoch": 44} {"train_loss": -3.308042526245117, "global_step": 1874, "epoch": 44} {"train_loss": -3.283202648162842, "global_step": 1875, "epoch": 44} {"train_loss": -3.174546003341675, "global_step": 1876, "epoch": 44} {"train_loss": -3.221518039703369, "global_step": 1877, "epoch": 44} {"train_loss": -3.3098742961883545, "global_step": 1878, "epoch": 44} {"train_loss": -3.2216360569000244, "global_step": 1879, "epoch": 44} {"train_loss": -3.3737003803253174, "global_step": 1880, "epoch": 44} {"train_loss": -3.2995734214782715, "global_step": 1881, "epoch": 44} {"train_loss": -3.2638278007507324, "global_step": 1882, "epoch": 44} {"train_loss": -3.287594795227051, "global_step": 1883, "epoch": 44} {"train_loss": -3.263504981994629, "global_step": 1884, "epoch": 44} {"train_loss": -3.178834915161133, "global_step": 1885, "epoch": 44} {"train_loss": -3.2657957077026367, "global_step": 1886, "epoch": 44} {"train_loss": -3.3213870525360107, "global_step": 1887, "epoch": 44} {"train_loss": -3.1046090126037598, "global_step": 1888, "epoch": 44} {"train_loss": -3.1704168092636835, "global_step": 1889, "epoch": 44, "val_loss": 263949.15625} {"train_loss": -3.1226649284362793, "global_step": 1890, "epoch": 45} {"train_loss": -3.117013931274414, "global_step": 1891, "epoch": 45} {"train_loss": -3.0608632564544678, "global_step": 1892, "epoch": 45} {"train_loss": -3.467644214630127, "global_step": 1893, "epoch": 45} {"train_loss": -3.2997164726257324, "global_step": 1894, "epoch": 45} {"train_loss": -3.2597289085388184, "global_step": 1895, "epoch": 45} {"train_loss": -3.1122334003448486, "global_step": 1896, "epoch": 45} {"train_loss": -3.1984410285949707, "global_step": 1897, "epoch": 45} {"train_loss": -3.2561392784118652, "global_step": 1898, "epoch": 45} {"train_loss": -3.260037422180176, "global_step": 1899, "epoch": 45} {"train_loss": -3.246448516845703, "global_step": 1900, "epoch": 45} {"train_loss": -3.152153968811035, "global_step": 1901, "epoch": 45} {"train_loss": -3.2940688133239746, "global_step": 1902, "epoch": 45} {"train_loss": -3.157893419265747, "global_step": 1903, "epoch": 45} {"train_loss": -3.2241244316101074, "global_step": 1904, "epoch": 45} {"train_loss": -3.2595176696777344, "global_step": 1905, "epoch": 45} {"train_loss": -3.3066256046295166, "global_step": 1906, "epoch": 45} {"train_loss": -3.2238540649414062, "global_step": 1907, "epoch": 45} {"train_loss": -3.2713639736175537, "global_step": 1908, "epoch": 45} {"train_loss": -3.2236688137054443, "global_step": 1909, "epoch": 45} {"train_loss": -3.2563705444335938, "global_step": 1910, "epoch": 45} {"train_loss": -3.3327178955078125, "global_step": 1911, "epoch": 45} {"train_loss": -3.0919504165649414, "global_step": 1912, "epoch": 45} {"train_loss": -3.147944450378418, "global_step": 1913, "epoch": 45} {"train_loss": -3.228259563446045, "global_step": 1914, "epoch": 45} {"train_loss": -3.374326705932617, "global_step": 1915, "epoch": 45} {"train_loss": -3.275547504425049, "global_step": 1916, "epoch": 45} {"train_loss": -3.187971591949463, "global_step": 1917, "epoch": 45} {"train_loss": -3.368360996246338, "global_step": 1918, "epoch": 45} {"train_loss": -3.2675106525421143, "global_step": 1919, "epoch": 45} {"train_loss": -3.3141825199127197, "global_step": 1920, "epoch": 45} {"train_loss": -3.177353858947754, "global_step": 1921, "epoch": 45} {"train_loss": -3.1640565395355225, "global_step": 1922, "epoch": 45} {"train_loss": -3.292815685272217, "global_step": 1923, "epoch": 45} {"train_loss": -3.125732898712158, "global_step": 1924, "epoch": 45} {"train_loss": -3.348806858062744, "global_step": 1925, "epoch": 45} {"train_loss": -3.256812334060669, "global_step": 1926, "epoch": 45} {"train_loss": -3.330988645553589, "global_step": 1927, "epoch": 45} {"train_loss": -3.263594627380371, "global_step": 1928, "epoch": 45} {"train_loss": -3.1936912536621094, "global_step": 1929, "epoch": 45} {"train_loss": -3.1722021102905273, "global_step": 1930, "epoch": 45} {"train_loss": -3.236712694168091, "global_step": 1931, "epoch": 45, "val_loss": 265185.1875} {"train_loss": -3.3085010051727295, "global_step": 1932, "epoch": 46} {"train_loss": -3.189631938934326, "global_step": 1933, "epoch": 46} {"train_loss": -3.2651638984680176, "global_step": 1934, "epoch": 46} {"train_loss": -3.116215944290161, "global_step": 1935, "epoch": 46} {"train_loss": -3.3218846321105957, "global_step": 1936, "epoch": 46} {"train_loss": -3.3361172676086426, "global_step": 1937, "epoch": 46} {"train_loss": -3.3362631797790527, "global_step": 1938, "epoch": 46} {"train_loss": -3.180290699005127, "global_step": 1939, "epoch": 46} {"train_loss": -3.2500500679016113, "global_step": 1940, "epoch": 46} {"train_loss": -3.2786951065063477, "global_step": 1941, "epoch": 46} {"train_loss": -3.325294017791748, "global_step": 1942, "epoch": 46} {"train_loss": -3.373331308364868, "global_step": 1943, "epoch": 46} {"train_loss": -3.305387496948242, "global_step": 1944, "epoch": 46} {"train_loss": -3.2606000900268555, "global_step": 1945, "epoch": 46} {"train_loss": -3.28658127784729, "global_step": 1946, "epoch": 46} {"train_loss": -3.169192314147949, "global_step": 1947, "epoch": 46} {"train_loss": -3.2892343997955322, "global_step": 1948, "epoch": 46} {"train_loss": -3.286508798599243, "global_step": 1949, "epoch": 46} {"train_loss": -3.174933671951294, "global_step": 1950, "epoch": 46} {"train_loss": -3.1971616744995117, "global_step": 1951, "epoch": 46} {"train_loss": -3.2861878871917725, "global_step": 1952, "epoch": 46} {"train_loss": -3.285884380340576, "global_step": 1953, "epoch": 46} {"train_loss": -3.205338954925537, "global_step": 1954, "epoch": 46} {"train_loss": -3.3372292518615723, "global_step": 1955, "epoch": 46} {"train_loss": -3.1618118286132812, "global_step": 1956, "epoch": 46} {"train_loss": -3.266355037689209, "global_step": 1957, "epoch": 46} {"train_loss": -3.2906947135925293, "global_step": 1958, "epoch": 46} {"train_loss": -3.126518487930298, "global_step": 1959, "epoch": 46} {"train_loss": -3.300018310546875, "global_step": 1960, "epoch": 46} {"train_loss": -3.453693151473999, "global_step": 1961, "epoch": 46} {"train_loss": -3.400663375854492, "global_step": 1962, "epoch": 46} {"train_loss": -3.2743988037109375, "global_step": 1963, "epoch": 46} {"train_loss": -3.341695547103882, "global_step": 1964, "epoch": 46} {"train_loss": -3.1961700916290283, "global_step": 1965, "epoch": 46} {"train_loss": -3.317342758178711, "global_step": 1966, "epoch": 46} {"train_loss": -3.2826595306396484, "global_step": 1967, "epoch": 46} {"train_loss": -3.235105514526367, "global_step": 1968, "epoch": 46} {"train_loss": -3.1464169025421143, "global_step": 1969, "epoch": 46} {"train_loss": -3.171548366546631, "global_step": 1970, "epoch": 46} {"train_loss": -3.1741998195648193, "global_step": 1971, "epoch": 46} {"train_loss": -3.186589241027832, "global_step": 1972, "epoch": 46} {"train_loss": -3.2616291159675237, "global_step": 1973, "epoch": 46, "val_loss": 254904.90625} {"train_loss": -3.16336727142334, "global_step": 1974, "epoch": 47} {"train_loss": -3.3716318607330322, "global_step": 1975, "epoch": 47} {"train_loss": -3.16610050201416, "global_step": 1976, "epoch": 47} {"train_loss": -3.264345645904541, "global_step": 1977, "epoch": 47} {"train_loss": -3.284222364425659, "global_step": 1978, "epoch": 47} {"train_loss": -3.2022624015808105, "global_step": 1979, "epoch": 47} {"train_loss": -3.4365649223327637, "global_step": 1980, "epoch": 47} {"train_loss": -3.4010496139526367, "global_step": 1981, "epoch": 47} {"train_loss": -3.2540879249572754, "global_step": 1982, "epoch": 47} {"train_loss": -3.340120553970337, "global_step": 1983, "epoch": 47} {"train_loss": -3.330500841140747, "global_step": 1984, "epoch": 47} {"train_loss": -3.3515784740448, "global_step": 1985, "epoch": 47} {"train_loss": -3.262363910675049, "global_step": 1986, "epoch": 47} {"train_loss": -3.3477346897125244, "global_step": 1987, "epoch": 47} {"train_loss": -3.213210344314575, "global_step": 1988, "epoch": 47} {"train_loss": -3.43031644821167, "global_step": 1989, "epoch": 47} {"train_loss": -3.351807117462158, "global_step": 1990, "epoch": 47} {"train_loss": -3.3564748764038086, "global_step": 1991, "epoch": 47} {"train_loss": -3.4435501098632812, "global_step": 1992, "epoch": 47} {"train_loss": -3.3082714080810547, "global_step": 1993, "epoch": 47} {"train_loss": -3.3247859477996826, "global_step": 1994, "epoch": 47} {"train_loss": -3.336172342300415, "global_step": 1995, "epoch": 47} {"train_loss": -3.37760853767395, "global_step": 1996, "epoch": 47} {"train_loss": -3.1997663974761963, "global_step": 1997, "epoch": 47} {"train_loss": -3.3353989124298096, "global_step": 1998, "epoch": 47} {"train_loss": -3.0511226654052734, "global_step": 1999, "epoch": 47} {"train_loss": -3.24922251701355, "global_step": 2000, "epoch": 47} {"train_loss": -3.2710697650909424, "global_step": 2001, "epoch": 47} {"train_loss": -3.1753921508789062, "global_step": 2002, "epoch": 47} {"train_loss": -3.2394461631774902, "global_step": 2003, "epoch": 47} {"train_loss": -2.9352498054504395, "global_step": 2004, "epoch": 47} {"train_loss": -3.280884265899658, "global_step": 2005, "epoch": 47} {"train_loss": -3.0189881324768066, "global_step": 2006, "epoch": 47} {"train_loss": -3.3194503784179688, "global_step": 2007, "epoch": 47} {"train_loss": -2.9082751274108887, "global_step": 2008, "epoch": 47} {"train_loss": -3.3584184646606445, "global_step": 2009, "epoch": 47} {"train_loss": -2.917046070098877, "global_step": 2010, "epoch": 47} {"train_loss": -3.4498257637023926, "global_step": 2011, "epoch": 47} {"train_loss": -3.014333963394165, "global_step": 2012, "epoch": 47} {"train_loss": -3.3344898223876953, "global_step": 2013, "epoch": 47} {"train_loss": -2.980612277984619, "global_step": 2014, "epoch": 47} {"train_loss": -3.252238387153262, "global_step": 2015, "epoch": 47, "val_loss": 254496.46875} {"train_loss": -3.0613977909088135, "global_step": 2016, "epoch": 48} {"train_loss": -3.2522199153900146, "global_step": 2017, "epoch": 48} {"train_loss": -3.107811450958252, "global_step": 2018, "epoch": 48} {"train_loss": -3.163935661315918, "global_step": 2019, "epoch": 48} {"train_loss": -3.2312698364257812, "global_step": 2020, "epoch": 48} {"train_loss": -3.1978201866149902, "global_step": 2021, "epoch": 48} {"train_loss": -3.370990037918091, "global_step": 2022, "epoch": 48} {"train_loss": -3.1720738410949707, "global_step": 2023, "epoch": 48} {"train_loss": -3.2637195587158203, "global_step": 2024, "epoch": 48} {"train_loss": -3.2764737606048584, "global_step": 2025, "epoch": 48} {"train_loss": -3.2894439697265625, "global_step": 2026, "epoch": 48} {"train_loss": -3.2296009063720703, "global_step": 2027, "epoch": 48} {"train_loss": -3.2906992435455322, "global_step": 2028, "epoch": 48} {"train_loss": -3.256091833114624, "global_step": 2029, "epoch": 48} {"train_loss": -3.3823442459106445, "global_step": 2030, "epoch": 48} {"train_loss": -3.268620014190674, "global_step": 2031, "epoch": 48} {"train_loss": -3.367060422897339, "global_step": 2032, "epoch": 48} {"train_loss": -3.351205825805664, "global_step": 2033, "epoch": 48} {"train_loss": -3.342538833618164, "global_step": 2034, "epoch": 48} {"train_loss": -3.2654531002044678, "global_step": 2035, "epoch": 48} {"train_loss": -3.285989761352539, "global_step": 2036, "epoch": 48} {"train_loss": -3.4489176273345947, "global_step": 2037, "epoch": 48} {"train_loss": -3.270066738128662, "global_step": 2038, "epoch": 48} {"train_loss": -3.293398380279541, "global_step": 2039, "epoch": 48} {"train_loss": -3.2469515800476074, "global_step": 2040, "epoch": 48} {"train_loss": -3.453042984008789, "global_step": 2041, "epoch": 48} {"train_loss": -3.290341377258301, "global_step": 2042, "epoch": 48} {"train_loss": -3.3316311836242676, "global_step": 2043, "epoch": 48} {"train_loss": -3.3439574241638184, "global_step": 2044, "epoch": 48} {"train_loss": -3.3603169918060303, "global_step": 2045, "epoch": 48} {"train_loss": -3.373854637145996, "global_step": 2046, "epoch": 48} {"train_loss": -3.302337408065796, "global_step": 2047, "epoch": 48} {"train_loss": -3.3458824157714844, "global_step": 2048, "epoch": 48} {"train_loss": -3.253998041152954, "global_step": 2049, "epoch": 48} {"train_loss": -3.038090467453003, "global_step": 2050, "epoch": 48} {"train_loss": -3.4099764823913574, "global_step": 2051, "epoch": 48} {"train_loss": -3.060976266860962, "global_step": 2052, "epoch": 48} {"train_loss": -3.323697566986084, "global_step": 2053, "epoch": 48} {"train_loss": -3.2224621772766113, "global_step": 2054, "epoch": 48} {"train_loss": -3.2768161296844482, "global_step": 2055, "epoch": 48} {"train_loss": -3.4064643383026123, "global_step": 2056, "epoch": 48} {"train_loss": -3.2826349962325323, "global_step": 2057, "epoch": 48, "val_loss": 244479.96875} {"train_loss": -3.2826528549194336, "global_step": 2058, "epoch": 49} {"train_loss": -3.2382774353027344, "global_step": 2059, "epoch": 49} {"train_loss": -3.4562065601348877, "global_step": 2060, "epoch": 49} {"train_loss": -3.38037371635437, "global_step": 2061, "epoch": 49} {"train_loss": -3.4759163856506348, "global_step": 2062, "epoch": 49} {"train_loss": -3.4535698890686035, "global_step": 2063, "epoch": 49} {"train_loss": -3.3014187812805176, "global_step": 2064, "epoch": 49} {"train_loss": -3.314980983734131, "global_step": 2065, "epoch": 49} {"train_loss": -3.427201747894287, "global_step": 2066, "epoch": 49} {"train_loss": -3.3531546592712402, "global_step": 2067, "epoch": 49} {"train_loss": -3.377415180206299, "global_step": 2068, "epoch": 49} {"train_loss": -3.3367767333984375, "global_step": 2069, "epoch": 49} {"train_loss": -3.059943437576294, "global_step": 2070, "epoch": 49} {"train_loss": -3.4037117958068848, "global_step": 2071, "epoch": 49} {"train_loss": -3.37192440032959, "global_step": 2072, "epoch": 49} {"train_loss": -3.3247344493865967, "global_step": 2073, "epoch": 49} {"train_loss": -3.280474901199341, "global_step": 2074, "epoch": 49} {"train_loss": -3.447000026702881, "global_step": 2075, "epoch": 49} {"train_loss": -3.228065013885498, "global_step": 2076, "epoch": 49} {"train_loss": -3.4686756134033203, "global_step": 2077, "epoch": 49} {"train_loss": -3.3035426139831543, "global_step": 2078, "epoch": 49} {"train_loss": -3.4525952339172363, "global_step": 2079, "epoch": 49} {"train_loss": -3.4882211685180664, "global_step": 2080, "epoch": 49} {"train_loss": -3.3455681800842285, "global_step": 2081, "epoch": 49} {"train_loss": -3.3722963333129883, "global_step": 2082, "epoch": 49} {"train_loss": -3.382697105407715, "global_step": 2083, "epoch": 49} {"train_loss": -3.4841997623443604, "global_step": 2084, "epoch": 49} {"train_loss": -3.4185025691986084, "global_step": 2085, "epoch": 49} {"train_loss": -3.394577741622925, "global_step": 2086, "epoch": 49} {"train_loss": -3.459057331085205, "global_step": 2087, "epoch": 49} {"train_loss": -3.370692729949951, "global_step": 2088, "epoch": 49} {"train_loss": -3.401768684387207, "global_step": 2089, "epoch": 49} {"train_loss": -3.3268237113952637, "global_step": 2090, "epoch": 49} {"train_loss": -3.3333210945129395, "global_step": 2091, "epoch": 49} {"train_loss": -3.3292815685272217, "global_step": 2092, "epoch": 49} {"train_loss": -3.236377716064453, "global_step": 2093, "epoch": 49} {"train_loss": -3.4256110191345215, "global_step": 2094, "epoch": 49} {"train_loss": -3.4127678871154785, "global_step": 2095, "epoch": 49} {"train_loss": -3.4159114360809326, "global_step": 2096, "epoch": 49} {"train_loss": -3.3885722160339355, "global_step": 2097, "epoch": 49} {"train_loss": -3.348443031311035, "global_step": 2098, "epoch": 49} {"train_loss": -3.369043707847595, "global_step": 2099, "epoch": 49, "val_loss": 237172.78125} {"train_loss": -3.3295116424560547, "global_step": 2100, "epoch": 50} {"train_loss": -3.2583587169647217, "global_step": 2101, "epoch": 50} {"train_loss": -3.3034603595733643, "global_step": 2102, "epoch": 50} {"train_loss": -3.322970390319824, "global_step": 2103, "epoch": 50} {"train_loss": -3.447798728942871, "global_step": 2104, "epoch": 50} {"train_loss": -3.4986963272094727, "global_step": 2105, "epoch": 50} {"train_loss": -3.40971040725708, "global_step": 2106, "epoch": 50} {"train_loss": -3.479665756225586, "global_step": 2107, "epoch": 50} {"train_loss": -3.4494810104370117, "global_step": 2108, "epoch": 50} {"train_loss": -3.2974181175231934, "global_step": 2109, "epoch": 50} {"train_loss": -3.369079113006592, "global_step": 2110, "epoch": 50} {"train_loss": -3.411484718322754, "global_step": 2111, "epoch": 50} {"train_loss": -3.454699993133545, "global_step": 2112, "epoch": 50} {"train_loss": -3.4146242141723633, "global_step": 2113, "epoch": 50} {"train_loss": -3.523159980773926, "global_step": 2114, "epoch": 50} {"train_loss": -3.4509944915771484, "global_step": 2115, "epoch": 50} {"train_loss": -3.315136671066284, "global_step": 2116, "epoch": 50} {"train_loss": -3.3436858654022217, "global_step": 2117, "epoch": 50} {"train_loss": -3.4138622283935547, "global_step": 2118, "epoch": 50} {"train_loss": -3.2932488918304443, "global_step": 2119, "epoch": 50} {"train_loss": -3.404540538787842, "global_step": 2120, "epoch": 50} {"train_loss": -3.4125819206237793, "global_step": 2121, "epoch": 50} {"train_loss": -3.1890645027160645, "global_step": 2122, "epoch": 50} {"train_loss": -3.4378151893615723, "global_step": 2123, "epoch": 50} {"train_loss": -3.082095146179199, "global_step": 2124, "epoch": 50} {"train_loss": -3.3968348503112793, "global_step": 2125, "epoch": 50} {"train_loss": -2.974506378173828, "global_step": 2126, "epoch": 50} {"train_loss": -3.3912835121154785, "global_step": 2127, "epoch": 50} {"train_loss": -3.244825601577759, "global_step": 2128, "epoch": 50} {"train_loss": -3.2598352432250977, "global_step": 2129, "epoch": 50} {"train_loss": -3.0920493602752686, "global_step": 2130, "epoch": 50} {"train_loss": -3.2866599559783936, "global_step": 2131, "epoch": 50} {"train_loss": -3.130866050720215, "global_step": 2132, "epoch": 50} {"train_loss": -3.423762321472168, "global_step": 2133, "epoch": 50} {"train_loss": -3.1833159923553467, "global_step": 2134, "epoch": 50} {"train_loss": -3.533895492553711, "global_step": 2135, "epoch": 50} {"train_loss": -3.2245800495147705, "global_step": 2136, "epoch": 50} {"train_loss": -3.41314959526062, "global_step": 2137, "epoch": 50} {"train_loss": -3.244904041290283, "global_step": 2138, "epoch": 50} {"train_loss": -3.358947277069092, "global_step": 2139, "epoch": 50} {"train_loss": -3.3305301666259766, "global_step": 2140, "epoch": 50} {"train_loss": -3.33815868695577, "global_step": 2141, "epoch": 50, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.14481227047244885, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.2032837009859434, "test/sim_max_reward_4500000": 0.3306764201402872, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.08407624377311251, "test/sim_max_reward_4500005": 0.15726088871160182, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.022042664417251497, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.10494072644630777, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.059829530371475606, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0014229503881936034, "test/sim_max_reward_4500014": 0.16561182130584123, "test/sim_max_reward_4500015": 0.2068740991695013, "test/sim_max_reward_4500016": 0.014673951444623072, "test/sim_max_reward_4500017": 0.0005088640794565039, "test/sim_max_reward_4500018": 0.05709363961726909, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.633957324714304, "test/sim_max_reward_4500022": 0.4425348548675989, "test/sim_max_reward_4500023": 0.4450546492313242, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.05793061050651459, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.47520456521848425, "test/sim_max_reward_4500028": 0.3491665144579656, "test/sim_max_reward_4500029": 0.0789463994481237, "test/sim_max_reward_4500030": 0.3827990034651407, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.4062027966194239, "test/sim_max_reward_4500035": 0.0779606034003907, "test/sim_max_reward_4500036": 0.2508149116011357, "test/sim_max_reward_4500037": 0.0019583881496629102, "test/sim_max_reward_4500038": 0.2905453636705766, "test/sim_max_reward_4500039": 0.24150201944448685, "test/sim_max_reward_4500040": 0.0, "test/sim_max_reward_4500041": 0.0, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.11835209524473915, "test/sim_max_reward_4500046": 0.5980930049698718, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.09142870947616215, "test/mean_score": 0.13044084242663032, "val_loss": 235127.46875} {"train_loss": -3.4651031494140625, "global_step": 2142, "epoch": 51} {"train_loss": -3.441573143005371, "global_step": 2143, "epoch": 51} {"train_loss": -3.5367608070373535, "global_step": 2144, "epoch": 51} {"train_loss": -3.509164333343506, "global_step": 2145, "epoch": 51} {"train_loss": -3.4460530281066895, "global_step": 2146, "epoch": 51} {"train_loss": -3.4505109786987305, "global_step": 2147, "epoch": 51} {"train_loss": -3.3477015495300293, "global_step": 2148, "epoch": 51} {"train_loss": -3.5632851123809814, "global_step": 2149, "epoch": 51} {"train_loss": -3.5587143898010254, "global_step": 2150, "epoch": 51} {"train_loss": -3.3994925022125244, "global_step": 2151, "epoch": 51} {"train_loss": -3.457643747329712, "global_step": 2152, "epoch": 51} {"train_loss": -3.4729509353637695, "global_step": 2153, "epoch": 51} {"train_loss": -3.253415107727051, "global_step": 2154, "epoch": 51} {"train_loss": -3.274855375289917, "global_step": 2155, "epoch": 51} {"train_loss": -3.539903163909912, "global_step": 2156, "epoch": 51} {"train_loss": -3.341473340988159, "global_step": 2157, "epoch": 51} {"train_loss": -3.578429698944092, "global_step": 2158, "epoch": 51} {"train_loss": -3.4672915935516357, "global_step": 2159, "epoch": 51} {"train_loss": -3.3222954273223877, "global_step": 2160, "epoch": 51} {"train_loss": -3.4646525382995605, "global_step": 2161, "epoch": 51} {"train_loss": -3.4944231510162354, "global_step": 2162, "epoch": 51} {"train_loss": -3.202343702316284, "global_step": 2163, "epoch": 51} {"train_loss": -3.367187738418579, "global_step": 2164, "epoch": 51} {"train_loss": -3.388556957244873, "global_step": 2165, "epoch": 51} {"train_loss": -3.2859816551208496, "global_step": 2166, "epoch": 51} {"train_loss": -3.4734578132629395, "global_step": 2167, "epoch": 51} {"train_loss": -3.468163013458252, "global_step": 2168, "epoch": 51} {"train_loss": -3.3142917156219482, "global_step": 2169, "epoch": 51} {"train_loss": -3.318087100982666, "global_step": 2170, "epoch": 51} {"train_loss": -3.346489429473877, "global_step": 2171, "epoch": 51} {"train_loss": -3.3076977729797363, "global_step": 2172, "epoch": 51} {"train_loss": -3.4750919342041016, "global_step": 2173, "epoch": 51} {"train_loss": -3.343489170074463, "global_step": 2174, "epoch": 51} {"train_loss": -3.39920711517334, "global_step": 2175, "epoch": 51} {"train_loss": -3.0965261459350586, "global_step": 2176, "epoch": 51} {"train_loss": -3.4286201000213623, "global_step": 2177, "epoch": 51} {"train_loss": -3.2404892444610596, "global_step": 2178, "epoch": 51} {"train_loss": -3.3755664825439453, "global_step": 2179, "epoch": 51} {"train_loss": -3.298821449279785, "global_step": 2180, "epoch": 51} {"train_loss": -3.3493165969848633, "global_step": 2181, "epoch": 51} {"train_loss": -3.3400356769561768, "global_step": 2182, "epoch": 51} {"train_loss": -3.396148000444685, "global_step": 2183, "epoch": 51, "val_loss": 226804.125} {"train_loss": -3.43060564994812, "global_step": 2184, "epoch": 52} {"train_loss": -3.4844703674316406, "global_step": 2185, "epoch": 52} {"train_loss": -3.5072946548461914, "global_step": 2186, "epoch": 52} {"train_loss": -3.282123327255249, "global_step": 2187, "epoch": 52} {"train_loss": -3.4532361030578613, "global_step": 2188, "epoch": 52} {"train_loss": -3.4352543354034424, "global_step": 2189, "epoch": 52} {"train_loss": -3.3431782722473145, "global_step": 2190, "epoch": 52} {"train_loss": -3.4283976554870605, "global_step": 2191, "epoch": 52} {"train_loss": -3.457556962966919, "global_step": 2192, "epoch": 52} {"train_loss": -3.342165231704712, "global_step": 2193, "epoch": 52} {"train_loss": -3.440944194793701, "global_step": 2194, "epoch": 52} {"train_loss": -3.376351833343506, "global_step": 2195, "epoch": 52} {"train_loss": -3.617342233657837, "global_step": 2196, "epoch": 52} {"train_loss": -3.4382450580596924, "global_step": 2197, "epoch": 52} {"train_loss": -3.569976806640625, "global_step": 2198, "epoch": 52} {"train_loss": -3.521867036819458, "global_step": 2199, "epoch": 52} {"train_loss": -3.4094526767730713, "global_step": 2200, "epoch": 52} {"train_loss": -3.4731318950653076, "global_step": 2201, "epoch": 52} {"train_loss": -3.528944492340088, "global_step": 2202, "epoch": 52} {"train_loss": -3.4818286895751953, "global_step": 2203, "epoch": 52} {"train_loss": -3.502561092376709, "global_step": 2204, "epoch": 52} {"train_loss": -3.5539069175720215, "global_step": 2205, "epoch": 52} {"train_loss": -3.5194919109344482, "global_step": 2206, "epoch": 52} {"train_loss": -3.2972705364227295, "global_step": 2207, "epoch": 52} {"train_loss": -3.500514030456543, "global_step": 2208, "epoch": 52} {"train_loss": -3.4167592525482178, "global_step": 2209, "epoch": 52} {"train_loss": -3.236800193786621, "global_step": 2210, "epoch": 52} {"train_loss": -3.6635828018188477, "global_step": 2211, "epoch": 52} {"train_loss": -3.395904064178467, "global_step": 2212, "epoch": 52} {"train_loss": -3.408661365509033, "global_step": 2213, "epoch": 52} {"train_loss": -3.3916962146759033, "global_step": 2214, "epoch": 52} {"train_loss": -3.5446596145629883, "global_step": 2215, "epoch": 52} {"train_loss": -3.342592716217041, "global_step": 2216, "epoch": 52} {"train_loss": -3.2248287200927734, "global_step": 2217, "epoch": 52} {"train_loss": -3.4238076210021973, "global_step": 2218, "epoch": 52} {"train_loss": -3.3759007453918457, "global_step": 2219, "epoch": 52} {"train_loss": -3.188933849334717, "global_step": 2220, "epoch": 52} {"train_loss": -3.614572048187256, "global_step": 2221, "epoch": 52} {"train_loss": -3.443067789077759, "global_step": 2222, "epoch": 52} {"train_loss": -3.2852981090545654, "global_step": 2223, "epoch": 52} {"train_loss": -3.4867868423461914, "global_step": 2224, "epoch": 52} {"train_loss": -3.4327982720874606, "global_step": 2225, "epoch": 52, "val_loss": 223486.984375} {"train_loss": -3.547656774520874, "global_step": 2226, "epoch": 53} {"train_loss": -3.268252372741699, "global_step": 2227, "epoch": 53} {"train_loss": -3.422844171524048, "global_step": 2228, "epoch": 53} {"train_loss": -3.366994857788086, "global_step": 2229, "epoch": 53} {"train_loss": -3.5926012992858887, "global_step": 2230, "epoch": 53} {"train_loss": -3.3671882152557373, "global_step": 2231, "epoch": 53} {"train_loss": -3.535700798034668, "global_step": 2232, "epoch": 53} {"train_loss": -3.434098243713379, "global_step": 2233, "epoch": 53} {"train_loss": -3.2860865592956543, "global_step": 2234, "epoch": 53} {"train_loss": -3.633152723312378, "global_step": 2235, "epoch": 53} {"train_loss": -3.3260276317596436, "global_step": 2236, "epoch": 53} {"train_loss": -3.513538122177124, "global_step": 2237, "epoch": 53} {"train_loss": -3.386321544647217, "global_step": 2238, "epoch": 53} {"train_loss": -3.4440035820007324, "global_step": 2239, "epoch": 53} {"train_loss": -3.3406448364257812, "global_step": 2240, "epoch": 53} {"train_loss": -3.4181246757507324, "global_step": 2241, "epoch": 53} {"train_loss": -3.48319411277771, "global_step": 2242, "epoch": 53} {"train_loss": -3.345393419265747, "global_step": 2243, "epoch": 53} {"train_loss": -3.316295623779297, "global_step": 2244, "epoch": 53} {"train_loss": -3.3657779693603516, "global_step": 2245, "epoch": 53} {"train_loss": -3.4575979709625244, "global_step": 2246, "epoch": 53} {"train_loss": -3.2705299854278564, "global_step": 2247, "epoch": 53} {"train_loss": -3.502516746520996, "global_step": 2248, "epoch": 53} {"train_loss": -3.4760947227478027, "global_step": 2249, "epoch": 53} {"train_loss": -3.333946704864502, "global_step": 2250, "epoch": 53} {"train_loss": -3.56472110748291, "global_step": 2251, "epoch": 53} {"train_loss": -3.405792474746704, "global_step": 2252, "epoch": 53} {"train_loss": -3.455505847930908, "global_step": 2253, "epoch": 53} {"train_loss": -3.464284896850586, "global_step": 2254, "epoch": 53} {"train_loss": -3.541018486022949, "global_step": 2255, "epoch": 53} {"train_loss": -3.3163704872131348, "global_step": 2256, "epoch": 53} {"train_loss": -3.477004051208496, "global_step": 2257, "epoch": 53} {"train_loss": -3.5534110069274902, "global_step": 2258, "epoch": 53} {"train_loss": -3.4821722507476807, "global_step": 2259, "epoch": 53} {"train_loss": -3.4450416564941406, "global_step": 2260, "epoch": 53} {"train_loss": -3.5887794494628906, "global_step": 2261, "epoch": 53} {"train_loss": -3.505032539367676, "global_step": 2262, "epoch": 53} {"train_loss": -3.5089316368103027, "global_step": 2263, "epoch": 53} {"train_loss": -3.496817111968994, "global_step": 2264, "epoch": 53} {"train_loss": -3.458327531814575, "global_step": 2265, "epoch": 53} {"train_loss": -3.5539824962615967, "global_step": 2266, "epoch": 53} {"train_loss": -3.445517755690075, "global_step": 2267, "epoch": 53, "val_loss": 223438.609375} {"train_loss": -3.50203800201416, "global_step": 2268, "epoch": 54} {"train_loss": -3.50813627243042, "global_step": 2269, "epoch": 54} {"train_loss": -3.4596505165100098, "global_step": 2270, "epoch": 54} {"train_loss": -3.479684352874756, "global_step": 2271, "epoch": 54} {"train_loss": -3.42238712310791, "global_step": 2272, "epoch": 54} {"train_loss": -3.54323673248291, "global_step": 2273, "epoch": 54} {"train_loss": -3.621662139892578, "global_step": 2274, "epoch": 54} {"train_loss": -3.5965609550476074, "global_step": 2275, "epoch": 54} {"train_loss": -3.4370415210723877, "global_step": 2276, "epoch": 54} {"train_loss": -3.5706427097320557, "global_step": 2277, "epoch": 54} {"train_loss": -3.629136800765991, "global_step": 2278, "epoch": 54} {"train_loss": -3.5122363567352295, "global_step": 2279, "epoch": 54} {"train_loss": -3.4784889221191406, "global_step": 2280, "epoch": 54} {"train_loss": -3.4600255489349365, "global_step": 2281, "epoch": 54} {"train_loss": -3.4784514904022217, "global_step": 2282, "epoch": 54} {"train_loss": -3.4437320232391357, "global_step": 2283, "epoch": 54} {"train_loss": -3.578348159790039, "global_step": 2284, "epoch": 54} {"train_loss": -3.656492233276367, "global_step": 2285, "epoch": 54} {"train_loss": -3.5841362476348877, "global_step": 2286, "epoch": 54} {"train_loss": -3.4913992881774902, "global_step": 2287, "epoch": 54} {"train_loss": -3.4822468757629395, "global_step": 2288, "epoch": 54} {"train_loss": -3.416146993637085, "global_step": 2289, "epoch": 54} {"train_loss": -3.572052240371704, "global_step": 2290, "epoch": 54} {"train_loss": -3.6116080284118652, "global_step": 2291, "epoch": 54} {"train_loss": -3.503002643585205, "global_step": 2292, "epoch": 54} {"train_loss": -3.5914745330810547, "global_step": 2293, "epoch": 54} {"train_loss": -3.342741012573242, "global_step": 2294, "epoch": 54} {"train_loss": -3.3647990226745605, "global_step": 2295, "epoch": 54} {"train_loss": -3.468280792236328, "global_step": 2296, "epoch": 54} {"train_loss": -3.3819727897644043, "global_step": 2297, "epoch": 54} {"train_loss": -3.5410194396972656, "global_step": 2298, "epoch": 54} {"train_loss": -3.3988566398620605, "global_step": 2299, "epoch": 54} {"train_loss": -3.647205352783203, "global_step": 2300, "epoch": 54} {"train_loss": -3.547926902770996, "global_step": 2301, "epoch": 54} {"train_loss": -3.4861245155334473, "global_step": 2302, "epoch": 54} {"train_loss": -3.4259090423583984, "global_step": 2303, "epoch": 54} {"train_loss": -3.472564697265625, "global_step": 2304, "epoch": 54} {"train_loss": -3.421926498413086, "global_step": 2305, "epoch": 54} {"train_loss": -3.535079002380371, "global_step": 2306, "epoch": 54} {"train_loss": -3.560037612915039, "global_step": 2307, "epoch": 54} {"train_loss": -3.417285442352295, "global_step": 2308, "epoch": 54} {"train_loss": -3.5059000310443698, "global_step": 2309, "epoch": 54, "val_loss": 223831.9375} {"train_loss": -3.345893383026123, "global_step": 2310, "epoch": 55} {"train_loss": -3.392518997192383, "global_step": 2311, "epoch": 55} {"train_loss": -3.3395283222198486, "global_step": 2312, "epoch": 55} {"train_loss": -3.5444278717041016, "global_step": 2313, "epoch": 55} {"train_loss": -3.5595436096191406, "global_step": 2314, "epoch": 55} {"train_loss": -3.4079580307006836, "global_step": 2315, "epoch": 55} {"train_loss": -3.419595241546631, "global_step": 2316, "epoch": 55} {"train_loss": -3.503520965576172, "global_step": 2317, "epoch": 55} {"train_loss": -3.516176700592041, "global_step": 2318, "epoch": 55} {"train_loss": -3.343578815460205, "global_step": 2319, "epoch": 55} {"train_loss": -3.4563918113708496, "global_step": 2320, "epoch": 55} {"train_loss": -3.245856523513794, "global_step": 2321, "epoch": 55} {"train_loss": -3.441200017929077, "global_step": 2322, "epoch": 55} {"train_loss": -3.4154114723205566, "global_step": 2323, "epoch": 55} {"train_loss": -3.502777338027954, "global_step": 2324, "epoch": 55} {"train_loss": -3.429941177368164, "global_step": 2325, "epoch": 55} {"train_loss": -3.4024498462677, "global_step": 2326, "epoch": 55} {"train_loss": -3.603689193725586, "global_step": 2327, "epoch": 55} {"train_loss": -3.501616954803467, "global_step": 2328, "epoch": 55} {"train_loss": -3.5676305294036865, "global_step": 2329, "epoch": 55} {"train_loss": -3.5317177772521973, "global_step": 2330, "epoch": 55} {"train_loss": -3.483396530151367, "global_step": 2331, "epoch": 55} {"train_loss": -3.476107358932495, "global_step": 2332, "epoch": 55} {"train_loss": -3.5265612602233887, "global_step": 2333, "epoch": 55} {"train_loss": -3.510998249053955, "global_step": 2334, "epoch": 55} {"train_loss": -3.522256851196289, "global_step": 2335, "epoch": 55} {"train_loss": -3.4600887298583984, "global_step": 2336, "epoch": 55} {"train_loss": -3.5871481895446777, "global_step": 2337, "epoch": 55} {"train_loss": -3.532299041748047, "global_step": 2338, "epoch": 55} {"train_loss": -3.5034265518188477, "global_step": 2339, "epoch": 55} {"train_loss": -3.5378267765045166, "global_step": 2340, "epoch": 55} {"train_loss": -3.4306743144989014, "global_step": 2341, "epoch": 55} {"train_loss": -3.4916443824768066, "global_step": 2342, "epoch": 55} {"train_loss": -3.5579099655151367, "global_step": 2343, "epoch": 55} {"train_loss": -3.593806266784668, "global_step": 2344, "epoch": 55} {"train_loss": -3.567028284072876, "global_step": 2345, "epoch": 55} {"train_loss": -3.563889503479004, "global_step": 2346, "epoch": 55} {"train_loss": -3.5775299072265625, "global_step": 2347, "epoch": 55} {"train_loss": -3.4685473442077637, "global_step": 2348, "epoch": 55} {"train_loss": -3.726846933364868, "global_step": 2349, "epoch": 55} {"train_loss": -3.512042760848999, "global_step": 2350, "epoch": 55} {"train_loss": -3.49143347853706, "global_step": 2351, "epoch": 55, "val_loss": 211075.609375} {"train_loss": -3.4899609088897705, "global_step": 2352, "epoch": 56} {"train_loss": -3.55104923248291, "global_step": 2353, "epoch": 56} {"train_loss": -3.59885311126709, "global_step": 2354, "epoch": 56} {"train_loss": -3.610973834991455, "global_step": 2355, "epoch": 56} {"train_loss": -3.5726120471954346, "global_step": 2356, "epoch": 56} {"train_loss": -3.549899101257324, "global_step": 2357, "epoch": 56} {"train_loss": -3.5145483016967773, "global_step": 2358, "epoch": 56} {"train_loss": -3.674776077270508, "global_step": 2359, "epoch": 56} {"train_loss": -3.5916898250579834, "global_step": 2360, "epoch": 56} {"train_loss": -3.609055995941162, "global_step": 2361, "epoch": 56} {"train_loss": -3.569096565246582, "global_step": 2362, "epoch": 56} {"train_loss": -3.694293975830078, "global_step": 2363, "epoch": 56} {"train_loss": -3.565108299255371, "global_step": 2364, "epoch": 56} {"train_loss": -3.498168468475342, "global_step": 2365, "epoch": 56} {"train_loss": -3.6202263832092285, "global_step": 2366, "epoch": 56} {"train_loss": -3.6000447273254395, "global_step": 2367, "epoch": 56} {"train_loss": -3.627077579498291, "global_step": 2368, "epoch": 56} {"train_loss": -3.57291579246521, "global_step": 2369, "epoch": 56} {"train_loss": -3.62404727935791, "global_step": 2370, "epoch": 56} {"train_loss": -3.5552268028259277, "global_step": 2371, "epoch": 56} {"train_loss": -3.6176514625549316, "global_step": 2372, "epoch": 56} {"train_loss": -3.621002197265625, "global_step": 2373, "epoch": 56} {"train_loss": -3.621760129928589, "global_step": 2374, "epoch": 56} {"train_loss": -3.4427437782287598, "global_step": 2375, "epoch": 56} {"train_loss": -3.5611748695373535, "global_step": 2376, "epoch": 56} {"train_loss": -3.466101884841919, "global_step": 2377, "epoch": 56} {"train_loss": -3.489243984222412, "global_step": 2378, "epoch": 56} {"train_loss": -3.4301657676696777, "global_step": 2379, "epoch": 56} {"train_loss": -3.3702566623687744, "global_step": 2380, "epoch": 56} {"train_loss": -3.7164831161499023, "global_step": 2381, "epoch": 56} {"train_loss": -3.3562514781951904, "global_step": 2382, "epoch": 56} {"train_loss": -3.6147379875183105, "global_step": 2383, "epoch": 56} {"train_loss": -3.3498072624206543, "global_step": 2384, "epoch": 56} {"train_loss": -3.5769500732421875, "global_step": 2385, "epoch": 56} {"train_loss": -3.482663869857788, "global_step": 2386, "epoch": 56} {"train_loss": -3.253901958465576, "global_step": 2387, "epoch": 56} {"train_loss": -3.5241990089416504, "global_step": 2388, "epoch": 56} {"train_loss": -3.402700662612915, "global_step": 2389, "epoch": 56} {"train_loss": -3.500967025756836, "global_step": 2390, "epoch": 56} {"train_loss": -3.4857378005981445, "global_step": 2391, "epoch": 56} {"train_loss": -3.599954128265381, "global_step": 2392, "epoch": 56} {"train_loss": -3.5408873501278104, "global_step": 2393, "epoch": 56, "val_loss": 211961.265625} {"train_loss": -3.4525389671325684, "global_step": 2394, "epoch": 57} {"train_loss": -3.624042510986328, "global_step": 2395, "epoch": 57} {"train_loss": -3.577333927154541, "global_step": 2396, "epoch": 57} {"train_loss": -3.5192246437072754, "global_step": 2397, "epoch": 57} {"train_loss": -3.6144144535064697, "global_step": 2398, "epoch": 57} {"train_loss": -3.6558380126953125, "global_step": 2399, "epoch": 57} {"train_loss": -3.580782413482666, "global_step": 2400, "epoch": 57} {"train_loss": -3.5811963081359863, "global_step": 2401, "epoch": 57} {"train_loss": -3.5048861503601074, "global_step": 2402, "epoch": 57} {"train_loss": -3.474008083343506, "global_step": 2403, "epoch": 57} {"train_loss": -3.547229290008545, "global_step": 2404, "epoch": 57} {"train_loss": -3.603612184524536, "global_step": 2405, "epoch": 57} {"train_loss": -3.3125834465026855, "global_step": 2406, "epoch": 57} {"train_loss": -3.5180912017822266, "global_step": 2407, "epoch": 57} {"train_loss": -3.653599262237549, "global_step": 2408, "epoch": 57} {"train_loss": -3.4514007568359375, "global_step": 2409, "epoch": 57} {"train_loss": -3.566185235977173, "global_step": 2410, "epoch": 57} {"train_loss": -3.451131820678711, "global_step": 2411, "epoch": 57} {"train_loss": -3.5935049057006836, "global_step": 2412, "epoch": 57} {"train_loss": -3.6804840564727783, "global_step": 2413, "epoch": 57} {"train_loss": -3.5626301765441895, "global_step": 2414, "epoch": 57} {"train_loss": -3.651146173477173, "global_step": 2415, "epoch": 57} {"train_loss": -3.505765199661255, "global_step": 2416, "epoch": 57} {"train_loss": -3.4714810848236084, "global_step": 2417, "epoch": 57} {"train_loss": -3.311215877532959, "global_step": 2418, "epoch": 57} {"train_loss": -3.652400016784668, "global_step": 2419, "epoch": 57} {"train_loss": -3.542222499847412, "global_step": 2420, "epoch": 57} {"train_loss": -3.6171419620513916, "global_step": 2421, "epoch": 57} {"train_loss": -3.5889523029327393, "global_step": 2422, "epoch": 57} {"train_loss": -3.5240659713745117, "global_step": 2423, "epoch": 57} {"train_loss": -3.556697368621826, "global_step": 2424, "epoch": 57} {"train_loss": -3.5873453617095947, "global_step": 2425, "epoch": 57} {"train_loss": -3.709711790084839, "global_step": 2426, "epoch": 57} {"train_loss": -3.7079567909240723, "global_step": 2427, "epoch": 57} {"train_loss": -3.6778793334960938, "global_step": 2428, "epoch": 57} {"train_loss": -3.826592445373535, "global_step": 2429, "epoch": 57} {"train_loss": -3.6876602172851562, "global_step": 2430, "epoch": 57} {"train_loss": -3.620957374572754, "global_step": 2431, "epoch": 57} {"train_loss": -3.6553432941436768, "global_step": 2432, "epoch": 57} {"train_loss": -3.640718936920166, "global_step": 2433, "epoch": 57} {"train_loss": -3.5753989219665527, "global_step": 2434, "epoch": 57} {"train_loss": -3.575354746409825, "global_step": 2435, "epoch": 57, "val_loss": 206473.203125} {"train_loss": -3.654806137084961, "global_step": 2436, "epoch": 58} {"train_loss": -3.689243793487549, "global_step": 2437, "epoch": 58} {"train_loss": -3.5653767585754395, "global_step": 2438, "epoch": 58} {"train_loss": -3.58842396736145, "global_step": 2439, "epoch": 58} {"train_loss": -3.568726062774658, "global_step": 2440, "epoch": 58} {"train_loss": -3.545529842376709, "global_step": 2441, "epoch": 58} {"train_loss": -3.509309768676758, "global_step": 2442, "epoch": 58} {"train_loss": -3.6319282054901123, "global_step": 2443, "epoch": 58} {"train_loss": -3.7503509521484375, "global_step": 2444, "epoch": 58} {"train_loss": -3.6009087562561035, "global_step": 2445, "epoch": 58} {"train_loss": -3.495176076889038, "global_step": 2446, "epoch": 58} {"train_loss": -3.47127366065979, "global_step": 2447, "epoch": 58} {"train_loss": -3.6902570724487305, "global_step": 2448, "epoch": 58} {"train_loss": -3.7301249504089355, "global_step": 2449, "epoch": 58} {"train_loss": -3.6210427284240723, "global_step": 2450, "epoch": 58} {"train_loss": -3.5740582942962646, "global_step": 2451, "epoch": 58} {"train_loss": -3.7031333446502686, "global_step": 2452, "epoch": 58} {"train_loss": -3.5809690952301025, "global_step": 2453, "epoch": 58} {"train_loss": -3.5771007537841797, "global_step": 2454, "epoch": 58} {"train_loss": -3.604501724243164, "global_step": 2455, "epoch": 58} {"train_loss": -3.5672783851623535, "global_step": 2456, "epoch": 58} {"train_loss": -3.555712938308716, "global_step": 2457, "epoch": 58} {"train_loss": -3.6657254695892334, "global_step": 2458, "epoch": 58} {"train_loss": -3.644115686416626, "global_step": 2459, "epoch": 58} {"train_loss": -3.7616970539093018, "global_step": 2460, "epoch": 58} {"train_loss": -3.6878583431243896, "global_step": 2461, "epoch": 58} {"train_loss": -3.667901039123535, "global_step": 2462, "epoch": 58} {"train_loss": -3.609149694442749, "global_step": 2463, "epoch": 58} {"train_loss": -3.695620536804199, "global_step": 2464, "epoch": 58} {"train_loss": -3.6172943115234375, "global_step": 2465, "epoch": 58} {"train_loss": -3.7322192192077637, "global_step": 2466, "epoch": 58} {"train_loss": -3.726262331008911, "global_step": 2467, "epoch": 58} {"train_loss": -3.5778720378875732, "global_step": 2468, "epoch": 58} {"train_loss": -3.6635172367095947, "global_step": 2469, "epoch": 58} {"train_loss": -3.663219451904297, "global_step": 2470, "epoch": 58} {"train_loss": -3.741626024246216, "global_step": 2471, "epoch": 58} {"train_loss": -3.56320858001709, "global_step": 2472, "epoch": 58} {"train_loss": -3.5298805236816406, "global_step": 2473, "epoch": 58} {"train_loss": -3.5528626441955566, "global_step": 2474, "epoch": 58} {"train_loss": -3.70361590385437, "global_step": 2475, "epoch": 58} {"train_loss": -3.5001943111419678, "global_step": 2476, "epoch": 58} {"train_loss": -3.62460188070933, "global_step": 2477, "epoch": 58, "val_loss": 205193.78125} {"train_loss": -3.691258192062378, "global_step": 2478, "epoch": 59} {"train_loss": -3.5379109382629395, "global_step": 2479, "epoch": 59} {"train_loss": -3.595322847366333, "global_step": 2480, "epoch": 59} {"train_loss": -3.5731682777404785, "global_step": 2481, "epoch": 59} {"train_loss": -3.6668877601623535, "global_step": 2482, "epoch": 59} {"train_loss": -3.621272563934326, "global_step": 2483, "epoch": 59} {"train_loss": -3.5039784908294678, "global_step": 2484, "epoch": 59} {"train_loss": -3.658083915710449, "global_step": 2485, "epoch": 59} {"train_loss": -3.5041143894195557, "global_step": 2486, "epoch": 59} {"train_loss": -3.370284080505371, "global_step": 2487, "epoch": 59} {"train_loss": -3.759507894515991, "global_step": 2488, "epoch": 59} {"train_loss": -3.461973190307617, "global_step": 2489, "epoch": 59} {"train_loss": -3.5826034545898438, "global_step": 2490, "epoch": 59} {"train_loss": -3.484586238861084, "global_step": 2491, "epoch": 59} {"train_loss": -3.6908349990844727, "global_step": 2492, "epoch": 59} {"train_loss": -3.5568478107452393, "global_step": 2493, "epoch": 59} {"train_loss": -3.658855676651001, "global_step": 2494, "epoch": 59} {"train_loss": -3.447892427444458, "global_step": 2495, "epoch": 59} {"train_loss": -3.5683140754699707, "global_step": 2496, "epoch": 59} {"train_loss": -3.5231165885925293, "global_step": 2497, "epoch": 59} {"train_loss": -3.5659494400024414, "global_step": 2498, "epoch": 59} {"train_loss": -3.722946882247925, "global_step": 2499, "epoch": 59} {"train_loss": -3.430305242538452, "global_step": 2500, "epoch": 59} {"train_loss": -3.5274393558502197, "global_step": 2501, "epoch": 59} {"train_loss": -3.6735401153564453, "global_step": 2502, "epoch": 59} {"train_loss": -3.384390115737915, "global_step": 2503, "epoch": 59} {"train_loss": -3.6449620723724365, "global_step": 2504, "epoch": 59} {"train_loss": -3.4663589000701904, "global_step": 2505, "epoch": 59} {"train_loss": -3.5193591117858887, "global_step": 2506, "epoch": 59} {"train_loss": -3.4280126094818115, "global_step": 2507, "epoch": 59} {"train_loss": -3.3751769065856934, "global_step": 2508, "epoch": 59} {"train_loss": -3.778041362762451, "global_step": 2509, "epoch": 59} {"train_loss": -3.4389843940734863, "global_step": 2510, "epoch": 59} {"train_loss": -3.5989766120910645, "global_step": 2511, "epoch": 59} {"train_loss": -3.5498008728027344, "global_step": 2512, "epoch": 59} {"train_loss": -3.595799684524536, "global_step": 2513, "epoch": 59} {"train_loss": -3.5936810970306396, "global_step": 2514, "epoch": 59} {"train_loss": -3.533425807952881, "global_step": 2515, "epoch": 59} {"train_loss": -3.6053476333618164, "global_step": 2516, "epoch": 59} {"train_loss": -3.5490198135375977, "global_step": 2517, "epoch": 59} {"train_loss": -3.5939230918884277, "global_step": 2518, "epoch": 59} {"train_loss": -3.559626233010065, "global_step": 2519, "epoch": 59, "val_loss": 199586.265625} {"train_loss": -3.6218276023864746, "global_step": 2520, "epoch": 60} {"train_loss": -3.477548122406006, "global_step": 2521, "epoch": 60} {"train_loss": -3.7095999717712402, "global_step": 2522, "epoch": 60} {"train_loss": -3.427830696105957, "global_step": 2523, "epoch": 60} {"train_loss": -3.500591278076172, "global_step": 2524, "epoch": 60} {"train_loss": -3.636214017868042, "global_step": 2525, "epoch": 60} {"train_loss": -3.660790205001831, "global_step": 2526, "epoch": 60} {"train_loss": -3.724057912826538, "global_step": 2527, "epoch": 60} {"train_loss": -3.676858901977539, "global_step": 2528, "epoch": 60} {"train_loss": -3.7200474739074707, "global_step": 2529, "epoch": 60} {"train_loss": -3.7482733726501465, "global_step": 2530, "epoch": 60} {"train_loss": -3.6284594535827637, "global_step": 2531, "epoch": 60} {"train_loss": -3.7451348304748535, "global_step": 2532, "epoch": 60} {"train_loss": -3.657982349395752, "global_step": 2533, "epoch": 60} {"train_loss": -3.7015633583068848, "global_step": 2534, "epoch": 60} {"train_loss": -3.73828387260437, "global_step": 2535, "epoch": 60} {"train_loss": -3.716358184814453, "global_step": 2536, "epoch": 60} {"train_loss": -3.6223886013031006, "global_step": 2537, "epoch": 60} {"train_loss": -3.6364834308624268, "global_step": 2538, "epoch": 60} {"train_loss": -3.5592634677886963, "global_step": 2539, "epoch": 60} {"train_loss": -3.647700309753418, "global_step": 2540, "epoch": 60} {"train_loss": -3.6067492961883545, "global_step": 2541, "epoch": 60} {"train_loss": -3.4020161628723145, "global_step": 2542, "epoch": 60} {"train_loss": -3.637773036956787, "global_step": 2543, "epoch": 60} {"train_loss": -3.611685276031494, "global_step": 2544, "epoch": 60} {"train_loss": -3.477931022644043, "global_step": 2545, "epoch": 60} {"train_loss": -3.534463405609131, "global_step": 2546, "epoch": 60} {"train_loss": -3.6486425399780273, "global_step": 2547, "epoch": 60} {"train_loss": -3.4892354011535645, "global_step": 2548, "epoch": 60} {"train_loss": -3.6827900409698486, "global_step": 2549, "epoch": 60} {"train_loss": -3.2110483646392822, "global_step": 2550, "epoch": 60} {"train_loss": -3.5064659118652344, "global_step": 2551, "epoch": 60} {"train_loss": -3.0115413665771484, "global_step": 2552, "epoch": 60} {"train_loss": -3.5600991249084473, "global_step": 2553, "epoch": 60} {"train_loss": -3.242711067199707, "global_step": 2554, "epoch": 60} {"train_loss": -3.6569876670837402, "global_step": 2555, "epoch": 60} {"train_loss": -3.137160301208496, "global_step": 2556, "epoch": 60} {"train_loss": -3.495032548904419, "global_step": 2557, "epoch": 60} {"train_loss": -3.383195161819458, "global_step": 2558, "epoch": 60} {"train_loss": -3.3617775440216064, "global_step": 2559, "epoch": 60} {"train_loss": -3.661004066467285, "global_step": 2560, "epoch": 60} {"train_loss": -3.5515493268058416, "global_step": 2561, "epoch": 60, "val_loss": 196318.65625} {"train_loss": -3.4467177391052246, "global_step": 2562, "epoch": 61} {"train_loss": -3.462785243988037, "global_step": 2563, "epoch": 61} {"train_loss": -3.4621753692626953, "global_step": 2564, "epoch": 61} {"train_loss": -3.508086681365967, "global_step": 2565, "epoch": 61} {"train_loss": -3.5753238201141357, "global_step": 2566, "epoch": 61} {"train_loss": -3.6131742000579834, "global_step": 2567, "epoch": 61} {"train_loss": -3.566415786743164, "global_step": 2568, "epoch": 61} {"train_loss": -3.4878931045532227, "global_step": 2569, "epoch": 61} {"train_loss": -3.5925068855285645, "global_step": 2570, "epoch": 61} {"train_loss": -3.5433621406555176, "global_step": 2571, "epoch": 61} {"train_loss": -3.594852924346924, "global_step": 2572, "epoch": 61} {"train_loss": -3.57454252243042, "global_step": 2573, "epoch": 61} {"train_loss": -3.573714256286621, "global_step": 2574, "epoch": 61} {"train_loss": -3.6802148818969727, "global_step": 2575, "epoch": 61} {"train_loss": -3.586507797241211, "global_step": 2576, "epoch": 61} {"train_loss": -3.7288150787353516, "global_step": 2577, "epoch": 61} {"train_loss": -3.4569947719573975, "global_step": 2578, "epoch": 61} {"train_loss": -3.6062707901000977, "global_step": 2579, "epoch": 61} {"train_loss": -3.6345067024230957, "global_step": 2580, "epoch": 61} {"train_loss": -3.629565715789795, "global_step": 2581, "epoch": 61} {"train_loss": -3.6780126094818115, "global_step": 2582, "epoch": 61} {"train_loss": -3.4825518131256104, "global_step": 2583, "epoch": 61} {"train_loss": -3.757040500640869, "global_step": 2584, "epoch": 61} {"train_loss": -3.75665545463562, "global_step": 2585, "epoch": 61} {"train_loss": -3.7517502307891846, "global_step": 2586, "epoch": 61} {"train_loss": -3.620664596557617, "global_step": 2587, "epoch": 61} {"train_loss": -3.5652103424072266, "global_step": 2588, "epoch": 61} {"train_loss": -3.6903979778289795, "global_step": 2589, "epoch": 61} {"train_loss": -3.8859288692474365, "global_step": 2590, "epoch": 61} {"train_loss": -3.657675266265869, "global_step": 2591, "epoch": 61} {"train_loss": -3.6698670387268066, "global_step": 2592, "epoch": 61} {"train_loss": -3.5966739654541016, "global_step": 2593, "epoch": 61} {"train_loss": -3.4991390705108643, "global_step": 2594, "epoch": 61} {"train_loss": -3.7709600925445557, "global_step": 2595, "epoch": 61} {"train_loss": -3.5376152992248535, "global_step": 2596, "epoch": 61} {"train_loss": -3.847118854522705, "global_step": 2597, "epoch": 61} {"train_loss": -3.6462059020996094, "global_step": 2598, "epoch": 61} {"train_loss": -3.495357036590576, "global_step": 2599, "epoch": 61} {"train_loss": -3.613798141479492, "global_step": 2600, "epoch": 61} {"train_loss": -3.6437370777130127, "global_step": 2601, "epoch": 61} {"train_loss": -3.6902732849121094, "global_step": 2602, "epoch": 61} {"train_loss": -3.614328378722781, "global_step": 2603, "epoch": 61, "val_loss": 193122.1875} {"train_loss": -3.685807943344116, "global_step": 2604, "epoch": 62} {"train_loss": -3.6510486602783203, "global_step": 2605, "epoch": 62} {"train_loss": -3.550961494445801, "global_step": 2606, "epoch": 62} {"train_loss": -3.771756649017334, "global_step": 2607, "epoch": 62} {"train_loss": -3.6103501319885254, "global_step": 2608, "epoch": 62} {"train_loss": -3.6498565673828125, "global_step": 2609, "epoch": 62} {"train_loss": -3.6403748989105225, "global_step": 2610, "epoch": 62} {"train_loss": -3.581974744796753, "global_step": 2611, "epoch": 62} {"train_loss": -3.7079849243164062, "global_step": 2612, "epoch": 62} {"train_loss": -3.540496349334717, "global_step": 2613, "epoch": 62} {"train_loss": -3.6940126419067383, "global_step": 2614, "epoch": 62} {"train_loss": -3.6415395736694336, "global_step": 2615, "epoch": 62} {"train_loss": -3.5260608196258545, "global_step": 2616, "epoch": 62} {"train_loss": -3.6065027713775635, "global_step": 2617, "epoch": 62} {"train_loss": -3.623563766479492, "global_step": 2618, "epoch": 62} {"train_loss": -3.624171733856201, "global_step": 2619, "epoch": 62} {"train_loss": -3.708233594894409, "global_step": 2620, "epoch": 62} {"train_loss": -3.598613739013672, "global_step": 2621, "epoch": 62} {"train_loss": -3.6887943744659424, "global_step": 2622, "epoch": 62} {"train_loss": -3.68808650970459, "global_step": 2623, "epoch": 62} {"train_loss": -3.7604832649230957, "global_step": 2624, "epoch": 62} {"train_loss": -3.6299734115600586, "global_step": 2625, "epoch": 62} {"train_loss": -3.797926425933838, "global_step": 2626, "epoch": 62} {"train_loss": -3.633042812347412, "global_step": 2627, "epoch": 62} {"train_loss": -3.7225050926208496, "global_step": 2628, "epoch": 62} {"train_loss": -3.7440755367279053, "global_step": 2629, "epoch": 62} {"train_loss": -3.8141441345214844, "global_step": 2630, "epoch": 62} {"train_loss": -3.667825698852539, "global_step": 2631, "epoch": 62} {"train_loss": -3.8380210399627686, "global_step": 2632, "epoch": 62} {"train_loss": -3.615866184234619, "global_step": 2633, "epoch": 62} {"train_loss": -3.8143012523651123, "global_step": 2634, "epoch": 62} {"train_loss": -3.7994871139526367, "global_step": 2635, "epoch": 62} {"train_loss": -3.8182365894317627, "global_step": 2636, "epoch": 62} {"train_loss": -3.7577784061431885, "global_step": 2637, "epoch": 62} {"train_loss": -3.7309374809265137, "global_step": 2638, "epoch": 62} {"train_loss": -3.7725491523742676, "global_step": 2639, "epoch": 62} {"train_loss": -3.8287858963012695, "global_step": 2640, "epoch": 62} {"train_loss": -3.698756694793701, "global_step": 2641, "epoch": 62} {"train_loss": -3.7357139587402344, "global_step": 2642, "epoch": 62} {"train_loss": -3.765293598175049, "global_step": 2643, "epoch": 62} {"train_loss": -3.8618907928466797, "global_step": 2644, "epoch": 62} {"train_loss": -3.6991041614895774, "global_step": 2645, "epoch": 62, "val_loss": 188284.25} {"train_loss": -3.8321785926818848, "global_step": 2646, "epoch": 63} {"train_loss": -3.639101028442383, "global_step": 2647, "epoch": 63} {"train_loss": -3.84647274017334, "global_step": 2648, "epoch": 63} {"train_loss": -3.801486015319824, "global_step": 2649, "epoch": 63} {"train_loss": -3.488697052001953, "global_step": 2650, "epoch": 63} {"train_loss": -3.642740488052368, "global_step": 2651, "epoch": 63} {"train_loss": -3.733320713043213, "global_step": 2652, "epoch": 63} {"train_loss": -3.7026455402374268, "global_step": 2653, "epoch": 63} {"train_loss": -3.8235511779785156, "global_step": 2654, "epoch": 63} {"train_loss": -3.661418914794922, "global_step": 2655, "epoch": 63} {"train_loss": -3.722134828567505, "global_step": 2656, "epoch": 63} {"train_loss": -3.810547113418579, "global_step": 2657, "epoch": 63} {"train_loss": -3.7980337142944336, "global_step": 2658, "epoch": 63} {"train_loss": -3.7346644401550293, "global_step": 2659, "epoch": 63} {"train_loss": -3.8889307975769043, "global_step": 2660, "epoch": 63} {"train_loss": -3.666766405105591, "global_step": 2661, "epoch": 63} {"train_loss": -3.5500617027282715, "global_step": 2662, "epoch": 63} {"train_loss": -3.8175830841064453, "global_step": 2663, "epoch": 63} {"train_loss": -3.7466776371002197, "global_step": 2664, "epoch": 63} {"train_loss": -3.835636615753174, "global_step": 2665, "epoch": 63} {"train_loss": -3.7272417545318604, "global_step": 2666, "epoch": 63} {"train_loss": -3.528665542602539, "global_step": 2667, "epoch": 63} {"train_loss": -3.639251232147217, "global_step": 2668, "epoch": 63} {"train_loss": -3.704097032546997, "global_step": 2669, "epoch": 63} {"train_loss": -3.773512840270996, "global_step": 2670, "epoch": 63} {"train_loss": -3.7340879440307617, "global_step": 2671, "epoch": 63} {"train_loss": -3.797029972076416, "global_step": 2672, "epoch": 63} {"train_loss": -3.737504243850708, "global_step": 2673, "epoch": 63} {"train_loss": -3.83354115486145, "global_step": 2674, "epoch": 63} {"train_loss": -3.7811179161071777, "global_step": 2675, "epoch": 63} {"train_loss": -3.7031755447387695, "global_step": 2676, "epoch": 63} {"train_loss": -3.685234308242798, "global_step": 2677, "epoch": 63} {"train_loss": -3.636521100997925, "global_step": 2678, "epoch": 63} {"train_loss": -3.8046369552612305, "global_step": 2679, "epoch": 63} {"train_loss": -3.532337188720703, "global_step": 2680, "epoch": 63} {"train_loss": -3.7922043800354004, "global_step": 2681, "epoch": 63} {"train_loss": -3.8522603511810303, "global_step": 2682, "epoch": 63} {"train_loss": -3.461338996887207, "global_step": 2683, "epoch": 63} {"train_loss": -3.8514981269836426, "global_step": 2684, "epoch": 63} {"train_loss": -3.3715503215789795, "global_step": 2685, "epoch": 63} {"train_loss": -3.607259511947632, "global_step": 2686, "epoch": 63} {"train_loss": -3.709325052443005, "global_step": 2687, "epoch": 63, "val_loss": 186680.53125} {"train_loss": -3.5689399242401123, "global_step": 2688, "epoch": 64} {"train_loss": -3.535404682159424, "global_step": 2689, "epoch": 64} {"train_loss": -3.579118251800537, "global_step": 2690, "epoch": 64} {"train_loss": -3.7988035678863525, "global_step": 2691, "epoch": 64} {"train_loss": -3.6488265991210938, "global_step": 2692, "epoch": 64} {"train_loss": -3.892721176147461, "global_step": 2693, "epoch": 64} {"train_loss": -3.642404317855835, "global_step": 2694, "epoch": 64} {"train_loss": -3.8456318378448486, "global_step": 2695, "epoch": 64} {"train_loss": -3.8242340087890625, "global_step": 2696, "epoch": 64} {"train_loss": -3.7117857933044434, "global_step": 2697, "epoch": 64} {"train_loss": -3.815572738647461, "global_step": 2698, "epoch": 64} {"train_loss": -3.770190954208374, "global_step": 2699, "epoch": 64} {"train_loss": -3.706970453262329, "global_step": 2700, "epoch": 64} {"train_loss": -3.6773974895477295, "global_step": 2701, "epoch": 64} {"train_loss": -3.6280808448791504, "global_step": 2702, "epoch": 64} {"train_loss": -3.7138209342956543, "global_step": 2703, "epoch": 64} {"train_loss": -3.745168447494507, "global_step": 2704, "epoch": 64} {"train_loss": -3.590083122253418, "global_step": 2705, "epoch": 64} {"train_loss": -3.731107711791992, "global_step": 2706, "epoch": 64} {"train_loss": -3.6606082916259766, "global_step": 2707, "epoch": 64} {"train_loss": -3.8451175689697266, "global_step": 2708, "epoch": 64} {"train_loss": -3.683729648590088, "global_step": 2709, "epoch": 64} {"train_loss": -3.572291851043701, "global_step": 2710, "epoch": 64} {"train_loss": -3.7833330631256104, "global_step": 2711, "epoch": 64} {"train_loss": -3.67445707321167, "global_step": 2712, "epoch": 64} {"train_loss": -3.8545167446136475, "global_step": 2713, "epoch": 64} {"train_loss": -3.789602279663086, "global_step": 2714, "epoch": 64} {"train_loss": -3.6969592571258545, "global_step": 2715, "epoch": 64} {"train_loss": -3.8531057834625244, "global_step": 2716, "epoch": 64} {"train_loss": -3.7107162475585938, "global_step": 2717, "epoch": 64} {"train_loss": -3.8037991523742676, "global_step": 2718, "epoch": 64} {"train_loss": -3.5906600952148438, "global_step": 2719, "epoch": 64} {"train_loss": -3.778700590133667, "global_step": 2720, "epoch": 64} {"train_loss": -3.7058844566345215, "global_step": 2721, "epoch": 64} {"train_loss": -3.708645820617676, "global_step": 2722, "epoch": 64} {"train_loss": -3.7819695472717285, "global_step": 2723, "epoch": 64} {"train_loss": -3.7036590576171875, "global_step": 2724, "epoch": 64} {"train_loss": -3.7821805477142334, "global_step": 2725, "epoch": 64} {"train_loss": -3.727174758911133, "global_step": 2726, "epoch": 64} {"train_loss": -3.8849728107452393, "global_step": 2727, "epoch": 64} {"train_loss": -3.743513822555542, "global_step": 2728, "epoch": 64} {"train_loss": -3.728250055086045, "global_step": 2729, "epoch": 64, "val_loss": 183544.65625} {"train_loss": -3.8255951404571533, "global_step": 2730, "epoch": 65} {"train_loss": -3.623488187789917, "global_step": 2731, "epoch": 65} {"train_loss": -3.777100086212158, "global_step": 2732, "epoch": 65} {"train_loss": -3.803581714630127, "global_step": 2733, "epoch": 65} {"train_loss": -3.786013126373291, "global_step": 2734, "epoch": 65} {"train_loss": -3.522160053253174, "global_step": 2735, "epoch": 65} {"train_loss": -3.7366368770599365, "global_step": 2736, "epoch": 65} {"train_loss": -3.643738269805908, "global_step": 2737, "epoch": 65} {"train_loss": -3.6868972778320312, "global_step": 2738, "epoch": 65} {"train_loss": -3.8206653594970703, "global_step": 2739, "epoch": 65} {"train_loss": -3.565525531768799, "global_step": 2740, "epoch": 65} {"train_loss": -3.8163976669311523, "global_step": 2741, "epoch": 65} {"train_loss": -3.8178789615631104, "global_step": 2742, "epoch": 65} {"train_loss": -3.781064033508301, "global_step": 2743, "epoch": 65} {"train_loss": -3.797905445098877, "global_step": 2744, "epoch": 65} {"train_loss": -3.7134976387023926, "global_step": 2745, "epoch": 65} {"train_loss": -3.6642322540283203, "global_step": 2746, "epoch": 65} {"train_loss": -3.81668758392334, "global_step": 2747, "epoch": 65} {"train_loss": -3.8164587020874023, "global_step": 2748, "epoch": 65} {"train_loss": -3.603311061859131, "global_step": 2749, "epoch": 65} {"train_loss": -3.729640245437622, "global_step": 2750, "epoch": 65} {"train_loss": -3.7566819190979004, "global_step": 2751, "epoch": 65} {"train_loss": -3.6238226890563965, "global_step": 2752, "epoch": 65} {"train_loss": -3.7742652893066406, "global_step": 2753, "epoch": 65} {"train_loss": -3.5714757442474365, "global_step": 2754, "epoch": 65} {"train_loss": -3.721099615097046, "global_step": 2755, "epoch": 65} {"train_loss": -3.7479074001312256, "global_step": 2756, "epoch": 65} {"train_loss": -3.637767791748047, "global_step": 2757, "epoch": 65} {"train_loss": -3.7400963306427, "global_step": 2758, "epoch": 65} {"train_loss": -3.605844736099243, "global_step": 2759, "epoch": 65} {"train_loss": -3.7883262634277344, "global_step": 2760, "epoch": 65} {"train_loss": -3.6611740589141846, "global_step": 2761, "epoch": 65} {"train_loss": -3.6414523124694824, "global_step": 2762, "epoch": 65} {"train_loss": -3.8566172122955322, "global_step": 2763, "epoch": 65} {"train_loss": -3.6453909873962402, "global_step": 2764, "epoch": 65} {"train_loss": -3.8088912963867188, "global_step": 2765, "epoch": 65} {"train_loss": -3.733003616333008, "global_step": 2766, "epoch": 65} {"train_loss": -3.8531336784362793, "global_step": 2767, "epoch": 65} {"train_loss": -3.8635668754577637, "global_step": 2768, "epoch": 65} {"train_loss": -3.847728729248047, "global_step": 2769, "epoch": 65} {"train_loss": -3.7740166187286377, "global_step": 2770, "epoch": 65} {"train_loss": -3.735955482437497, "global_step": 2771, "epoch": 65, "val_loss": 182862.125} {"train_loss": -3.7628605365753174, "global_step": 2772, "epoch": 66} {"train_loss": -3.545375347137451, "global_step": 2773, "epoch": 66} {"train_loss": -3.7007381916046143, "global_step": 2774, "epoch": 66} {"train_loss": -3.71059513092041, "global_step": 2775, "epoch": 66} {"train_loss": -3.8613719940185547, "global_step": 2776, "epoch": 66} {"train_loss": -3.6822874546051025, "global_step": 2777, "epoch": 66} {"train_loss": -3.7911131381988525, "global_step": 2778, "epoch": 66} {"train_loss": -3.765749454498291, "global_step": 2779, "epoch": 66} {"train_loss": -3.847672939300537, "global_step": 2780, "epoch": 66} {"train_loss": -3.7020492553710938, "global_step": 2781, "epoch": 66} {"train_loss": -3.8470675945281982, "global_step": 2782, "epoch": 66} {"train_loss": -3.879150390625, "global_step": 2783, "epoch": 66} {"train_loss": -3.802870273590088, "global_step": 2784, "epoch": 66} {"train_loss": -3.8107926845550537, "global_step": 2785, "epoch": 66} {"train_loss": -3.7118070125579834, "global_step": 2786, "epoch": 66} {"train_loss": -3.8154196739196777, "global_step": 2787, "epoch": 66} {"train_loss": -3.8009371757507324, "global_step": 2788, "epoch": 66} {"train_loss": -3.7143125534057617, "global_step": 2789, "epoch": 66} {"train_loss": -3.751980781555176, "global_step": 2790, "epoch": 66} {"train_loss": -3.791104555130005, "global_step": 2791, "epoch": 66} {"train_loss": -3.543728828430176, "global_step": 2792, "epoch": 66} {"train_loss": -3.769314765930176, "global_step": 2793, "epoch": 66} {"train_loss": -3.8098092079162598, "global_step": 2794, "epoch": 66} {"train_loss": -3.560032606124878, "global_step": 2795, "epoch": 66} {"train_loss": -3.7540011405944824, "global_step": 2796, "epoch": 66} {"train_loss": -3.8489151000976562, "global_step": 2797, "epoch": 66} {"train_loss": -3.6814842224121094, "global_step": 2798, "epoch": 66} {"train_loss": -3.5810935497283936, "global_step": 2799, "epoch": 66} {"train_loss": -3.853627920150757, "global_step": 2800, "epoch": 66} {"train_loss": -3.565965414047241, "global_step": 2801, "epoch": 66} {"train_loss": -3.7031197547912598, "global_step": 2802, "epoch": 66} {"train_loss": -3.5351333618164062, "global_step": 2803, "epoch": 66} {"train_loss": -3.6187548637390137, "global_step": 2804, "epoch": 66} {"train_loss": -3.4587411880493164, "global_step": 2805, "epoch": 66} {"train_loss": -3.4844024181365967, "global_step": 2806, "epoch": 66} {"train_loss": -3.808311939239502, "global_step": 2807, "epoch": 66} {"train_loss": -3.5828659534454346, "global_step": 2808, "epoch": 66} {"train_loss": -3.690181016921997, "global_step": 2809, "epoch": 66} {"train_loss": -3.5045011043548584, "global_step": 2810, "epoch": 66} {"train_loss": -3.6862404346466064, "global_step": 2811, "epoch": 66} {"train_loss": -3.557684898376465, "global_step": 2812, "epoch": 66} {"train_loss": -3.70479953289032, "global_step": 2813, "epoch": 66, "val_loss": 185885.53125} {"train_loss": -3.5566720962524414, "global_step": 2814, "epoch": 67} {"train_loss": -3.8685054779052734, "global_step": 2815, "epoch": 67} {"train_loss": -3.756021499633789, "global_step": 2816, "epoch": 67} {"train_loss": -3.861927032470703, "global_step": 2817, "epoch": 67} {"train_loss": -3.8024139404296875, "global_step": 2818, "epoch": 67} {"train_loss": -3.786180019378662, "global_step": 2819, "epoch": 67} {"train_loss": -3.777463436126709, "global_step": 2820, "epoch": 67} {"train_loss": -3.638800621032715, "global_step": 2821, "epoch": 67} {"train_loss": -3.633112668991089, "global_step": 2822, "epoch": 67} {"train_loss": -3.907797336578369, "global_step": 2823, "epoch": 67} {"train_loss": -3.6761717796325684, "global_step": 2824, "epoch": 67} {"train_loss": -3.8824379444122314, "global_step": 2825, "epoch": 67} {"train_loss": -3.7988452911376953, "global_step": 2826, "epoch": 67} {"train_loss": -3.852170944213867, "global_step": 2827, "epoch": 67} {"train_loss": -3.765258550643921, "global_step": 2828, "epoch": 67} {"train_loss": -3.930204153060913, "global_step": 2829, "epoch": 67} {"train_loss": -3.743231773376465, "global_step": 2830, "epoch": 67} {"train_loss": -3.639927387237549, "global_step": 2831, "epoch": 67} {"train_loss": -3.7596402168273926, "global_step": 2832, "epoch": 67} {"train_loss": -3.9232192039489746, "global_step": 2833, "epoch": 67} {"train_loss": -3.8467698097229004, "global_step": 2834, "epoch": 67} {"train_loss": -3.7583508491516113, "global_step": 2835, "epoch": 67} {"train_loss": -3.8348071575164795, "global_step": 2836, "epoch": 67} {"train_loss": -3.684865951538086, "global_step": 2837, "epoch": 67} {"train_loss": -3.6606502532958984, "global_step": 2838, "epoch": 67} {"train_loss": -3.674741268157959, "global_step": 2839, "epoch": 67} {"train_loss": -3.7156834602355957, "global_step": 2840, "epoch": 67} {"train_loss": -3.8099217414855957, "global_step": 2841, "epoch": 67} {"train_loss": -3.8017144203186035, "global_step": 2842, "epoch": 67} {"train_loss": -3.8102424144744873, "global_step": 2843, "epoch": 67} {"train_loss": -3.8200247287750244, "global_step": 2844, "epoch": 67} {"train_loss": -3.7390079498291016, "global_step": 2845, "epoch": 67} {"train_loss": -3.7281036376953125, "global_step": 2846, "epoch": 67} {"train_loss": -3.8156890869140625, "global_step": 2847, "epoch": 67} {"train_loss": -3.916914701461792, "global_step": 2848, "epoch": 67} {"train_loss": -3.925057888031006, "global_step": 2849, "epoch": 67} {"train_loss": -3.881730556488037, "global_step": 2850, "epoch": 67} {"train_loss": -3.7037453651428223, "global_step": 2851, "epoch": 67} {"train_loss": -3.7144713401794434, "global_step": 2852, "epoch": 67} {"train_loss": -3.616230010986328, "global_step": 2853, "epoch": 67} {"train_loss": -3.7600035667419434, "global_step": 2854, "epoch": 67} {"train_loss": -3.7714425779524303, "global_step": 2855, "epoch": 67, "val_loss": 176347.625} {"train_loss": -3.821845054626465, "global_step": 2856, "epoch": 68} {"train_loss": -3.802691698074341, "global_step": 2857, "epoch": 68} {"train_loss": -3.8017539978027344, "global_step": 2858, "epoch": 68} {"train_loss": -3.9900879859924316, "global_step": 2859, "epoch": 68} {"train_loss": -3.6836907863616943, "global_step": 2860, "epoch": 68} {"train_loss": -3.7828917503356934, "global_step": 2861, "epoch": 68} {"train_loss": -3.801666259765625, "global_step": 2862, "epoch": 68} {"train_loss": -3.6882784366607666, "global_step": 2863, "epoch": 68} {"train_loss": -3.794341802597046, "global_step": 2864, "epoch": 68} {"train_loss": -3.8095543384552, "global_step": 2865, "epoch": 68} {"train_loss": -3.716287851333618, "global_step": 2866, "epoch": 68} {"train_loss": -3.653427839279175, "global_step": 2867, "epoch": 68} {"train_loss": -3.700537919998169, "global_step": 2868, "epoch": 68} {"train_loss": -3.7315940856933594, "global_step": 2869, "epoch": 68} {"train_loss": -3.895763874053955, "global_step": 2870, "epoch": 68} {"train_loss": -3.7887866497039795, "global_step": 2871, "epoch": 68} {"train_loss": -3.6452040672302246, "global_step": 2872, "epoch": 68} {"train_loss": -3.676731586456299, "global_step": 2873, "epoch": 68} {"train_loss": -3.6821463108062744, "global_step": 2874, "epoch": 68} {"train_loss": -3.711966037750244, "global_step": 2875, "epoch": 68} {"train_loss": -3.9301211833953857, "global_step": 2876, "epoch": 68} {"train_loss": -3.694058656692505, "global_step": 2877, "epoch": 68} {"train_loss": -3.7613463401794434, "global_step": 2878, "epoch": 68} {"train_loss": -3.9062447547912598, "global_step": 2879, "epoch": 68} {"train_loss": -3.923396348953247, "global_step": 2880, "epoch": 68} {"train_loss": -3.745906352996826, "global_step": 2881, "epoch": 68} {"train_loss": -3.845242977142334, "global_step": 2882, "epoch": 68} {"train_loss": -3.8381905555725098, "global_step": 2883, "epoch": 68} {"train_loss": -3.735323905944824, "global_step": 2884, "epoch": 68} {"train_loss": -3.8176543712615967, "global_step": 2885, "epoch": 68} {"train_loss": -3.8404159545898438, "global_step": 2886, "epoch": 68} {"train_loss": -3.7969791889190674, "global_step": 2887, "epoch": 68} {"train_loss": -3.819589614868164, "global_step": 2888, "epoch": 68} {"train_loss": -3.9048566818237305, "global_step": 2889, "epoch": 68} {"train_loss": -3.7487070560455322, "global_step": 2890, "epoch": 68} {"train_loss": -3.770212173461914, "global_step": 2891, "epoch": 68} {"train_loss": -3.820354700088501, "global_step": 2892, "epoch": 68} {"train_loss": -3.8337244987487793, "global_step": 2893, "epoch": 68} {"train_loss": -3.93259334564209, "global_step": 2894, "epoch": 68} {"train_loss": -3.786461591720581, "global_step": 2895, "epoch": 68} {"train_loss": -3.903766632080078, "global_step": 2896, "epoch": 68} {"train_loss": -3.795369551295326, "global_step": 2897, "epoch": 68, "val_loss": 172733.203125} {"train_loss": -3.7078380584716797, "global_step": 2898, "epoch": 69} {"train_loss": -3.7009899616241455, "global_step": 2899, "epoch": 69} {"train_loss": -3.6851999759674072, "global_step": 2900, "epoch": 69} {"train_loss": -3.9172682762145996, "global_step": 2901, "epoch": 69} {"train_loss": -3.778798818588257, "global_step": 2902, "epoch": 69} {"train_loss": -3.708866596221924, "global_step": 2903, "epoch": 69} {"train_loss": -3.732339859008789, "global_step": 2904, "epoch": 69} {"train_loss": -3.7744131088256836, "global_step": 2905, "epoch": 69} {"train_loss": -3.9156432151794434, "global_step": 2906, "epoch": 69} {"train_loss": -3.9046387672424316, "global_step": 2907, "epoch": 69} {"train_loss": -3.5197243690490723, "global_step": 2908, "epoch": 69} {"train_loss": -3.8033461570739746, "global_step": 2909, "epoch": 69} {"train_loss": -3.901533603668213, "global_step": 2910, "epoch": 69} {"train_loss": -3.8162834644317627, "global_step": 2911, "epoch": 69} {"train_loss": -3.9017138481140137, "global_step": 2912, "epoch": 69} {"train_loss": -3.856933832168579, "global_step": 2913, "epoch": 69} {"train_loss": -3.8141732215881348, "global_step": 2914, "epoch": 69} {"train_loss": -3.8265886306762695, "global_step": 2915, "epoch": 69} {"train_loss": -3.7208313941955566, "global_step": 2916, "epoch": 69} {"train_loss": -4.001545429229736, "global_step": 2917, "epoch": 69} {"train_loss": -3.9677367210388184, "global_step": 2918, "epoch": 69} {"train_loss": -3.9644346237182617, "global_step": 2919, "epoch": 69} {"train_loss": -3.837542772293091, "global_step": 2920, "epoch": 69} {"train_loss": -3.738399028778076, "global_step": 2921, "epoch": 69} {"train_loss": -3.8769426345825195, "global_step": 2922, "epoch": 69} {"train_loss": -3.839444637298584, "global_step": 2923, "epoch": 69} {"train_loss": -3.9467291831970215, "global_step": 2924, "epoch": 69} {"train_loss": -3.9412882328033447, "global_step": 2925, "epoch": 69} {"train_loss": -3.7857699394226074, "global_step": 2926, "epoch": 69} {"train_loss": -3.956493854522705, "global_step": 2927, "epoch": 69} {"train_loss": -4.075468063354492, "global_step": 2928, "epoch": 69} {"train_loss": -3.8071866035461426, "global_step": 2929, "epoch": 69} {"train_loss": -3.784719944000244, "global_step": 2930, "epoch": 69} {"train_loss": -3.9629855155944824, "global_step": 2931, "epoch": 69} {"train_loss": -3.8099400997161865, "global_step": 2932, "epoch": 69} {"train_loss": -3.862919807434082, "global_step": 2933, "epoch": 69} {"train_loss": -3.794218063354492, "global_step": 2934, "epoch": 69} {"train_loss": -3.9695825576782227, "global_step": 2935, "epoch": 69} {"train_loss": -3.766655921936035, "global_step": 2936, "epoch": 69} {"train_loss": -3.8323984146118164, "global_step": 2937, "epoch": 69} {"train_loss": -3.8889822959899902, "global_step": 2938, "epoch": 69} {"train_loss": -3.8386611370813277, "global_step": 2939, "epoch": 69, "val_loss": 171710.328125} {"train_loss": -3.7146573066711426, "global_step": 2940, "epoch": 70} {"train_loss": -3.9767043590545654, "global_step": 2941, "epoch": 70} {"train_loss": -3.7752678394317627, "global_step": 2942, "epoch": 70} {"train_loss": -3.814267158508301, "global_step": 2943, "epoch": 70} {"train_loss": -3.675766706466675, "global_step": 2944, "epoch": 70} {"train_loss": -3.9224300384521484, "global_step": 2945, "epoch": 70} {"train_loss": -3.853574275970459, "global_step": 2946, "epoch": 70} {"train_loss": -3.751314878463745, "global_step": 2947, "epoch": 70} {"train_loss": -3.739410877227783, "global_step": 2948, "epoch": 70} {"train_loss": -3.686856269836426, "global_step": 2949, "epoch": 70} {"train_loss": -3.7191429138183594, "global_step": 2950, "epoch": 70} {"train_loss": -3.7529518604278564, "global_step": 2951, "epoch": 70} {"train_loss": -3.6259963512420654, "global_step": 2952, "epoch": 70} {"train_loss": -3.8403096199035645, "global_step": 2953, "epoch": 70} {"train_loss": -3.5757484436035156, "global_step": 2954, "epoch": 70} {"train_loss": -3.8234615325927734, "global_step": 2955, "epoch": 70} {"train_loss": -3.80056095123291, "global_step": 2956, "epoch": 70} {"train_loss": -3.7283287048339844, "global_step": 2957, "epoch": 70} {"train_loss": -3.7846250534057617, "global_step": 2958, "epoch": 70} {"train_loss": -3.836019515991211, "global_step": 2959, "epoch": 70} {"train_loss": -3.8041625022888184, "global_step": 2960, "epoch": 70} {"train_loss": -3.8536574840545654, "global_step": 2961, "epoch": 70} {"train_loss": -3.8476686477661133, "global_step": 2962, "epoch": 70} {"train_loss": -3.8006672859191895, "global_step": 2963, "epoch": 70} {"train_loss": -3.933232307434082, "global_step": 2964, "epoch": 70} {"train_loss": -3.7092299461364746, "global_step": 2965, "epoch": 70} {"train_loss": -3.8704967498779297, "global_step": 2966, "epoch": 70} {"train_loss": -3.7274160385131836, "global_step": 2967, "epoch": 70} {"train_loss": -3.7251715660095215, "global_step": 2968, "epoch": 70} {"train_loss": -3.925337553024292, "global_step": 2969, "epoch": 70} {"train_loss": -3.787336587905884, "global_step": 2970, "epoch": 70} {"train_loss": -3.8510499000549316, "global_step": 2971, "epoch": 70} {"train_loss": -3.7444868087768555, "global_step": 2972, "epoch": 70} {"train_loss": -3.8608531951904297, "global_step": 2973, "epoch": 70} {"train_loss": -3.6529955863952637, "global_step": 2974, "epoch": 70} {"train_loss": -3.838834285736084, "global_step": 2975, "epoch": 70} {"train_loss": -3.8891077041625977, "global_step": 2976, "epoch": 70} {"train_loss": -3.804996967315674, "global_step": 2977, "epoch": 70} {"train_loss": -3.9575300216674805, "global_step": 2978, "epoch": 70} {"train_loss": -3.7882156372070312, "global_step": 2979, "epoch": 70} {"train_loss": -3.85367488861084, "global_step": 2980, "epoch": 70} {"train_loss": -3.797471670877366, "global_step": 2981, "epoch": 70, "val_loss": 171490.28125} {"train_loss": -3.801889657974243, "global_step": 2982, "epoch": 71} {"train_loss": -3.9534568786621094, "global_step": 2983, "epoch": 71} {"train_loss": -3.7477686405181885, "global_step": 2984, "epoch": 71} {"train_loss": -3.8299946784973145, "global_step": 2985, "epoch": 71} {"train_loss": -3.9377505779266357, "global_step": 2986, "epoch": 71} {"train_loss": -3.852294445037842, "global_step": 2987, "epoch": 71} {"train_loss": -3.81537127494812, "global_step": 2988, "epoch": 71} {"train_loss": -3.8646411895751953, "global_step": 2989, "epoch": 71} {"train_loss": -3.849442481994629, "global_step": 2990, "epoch": 71} {"train_loss": -3.881842851638794, "global_step": 2991, "epoch": 71} {"train_loss": -3.8233070373535156, "global_step": 2992, "epoch": 71} {"train_loss": -3.858448028564453, "global_step": 2993, "epoch": 71} {"train_loss": -3.8567824363708496, "global_step": 2994, "epoch": 71} {"train_loss": -3.8926889896392822, "global_step": 2995, "epoch": 71} {"train_loss": -3.8454370498657227, "global_step": 2996, "epoch": 71} {"train_loss": -3.977144241333008, "global_step": 2997, "epoch": 71} {"train_loss": -3.891998291015625, "global_step": 2998, "epoch": 71} {"train_loss": -3.9400718212127686, "global_step": 2999, "epoch": 71} {"train_loss": -3.9265694618225098, "global_step": 3000, "epoch": 71} {"train_loss": -3.8936076164245605, "global_step": 3001, "epoch": 71} {"train_loss": -3.7878456115722656, "global_step": 3002, "epoch": 71} {"train_loss": -3.8104004859924316, "global_step": 3003, "epoch": 71} {"train_loss": -3.926140069961548, "global_step": 3004, "epoch": 71} {"train_loss": -3.844822406768799, "global_step": 3005, "epoch": 71} {"train_loss": -4.009031772613525, "global_step": 3006, "epoch": 71} {"train_loss": -3.816107749938965, "global_step": 3007, "epoch": 71} {"train_loss": -3.8575000762939453, "global_step": 3008, "epoch": 71} {"train_loss": -3.960543155670166, "global_step": 3009, "epoch": 71} {"train_loss": -3.939552068710327, "global_step": 3010, "epoch": 71} {"train_loss": -4.006620407104492, "global_step": 3011, "epoch": 71} {"train_loss": -3.833134174346924, "global_step": 3012, "epoch": 71} {"train_loss": -3.9689903259277344, "global_step": 3013, "epoch": 71} {"train_loss": -3.847538709640503, "global_step": 3014, "epoch": 71} {"train_loss": -3.916938066482544, "global_step": 3015, "epoch": 71} {"train_loss": -3.9198663234710693, "global_step": 3016, "epoch": 71} {"train_loss": -3.971973419189453, "global_step": 3017, "epoch": 71} {"train_loss": -3.7464144229888916, "global_step": 3018, "epoch": 71} {"train_loss": -3.8513267040252686, "global_step": 3019, "epoch": 71} {"train_loss": -3.6803274154663086, "global_step": 3020, "epoch": 71} {"train_loss": -3.88981556892395, "global_step": 3021, "epoch": 71} {"train_loss": -3.8769681453704834, "global_step": 3022, "epoch": 71} {"train_loss": -3.874543553306943, "global_step": 3023, "epoch": 71, "val_loss": 165434.265625} {"train_loss": -4.045194625854492, "global_step": 3024, "epoch": 72} {"train_loss": -3.7598366737365723, "global_step": 3025, "epoch": 72} {"train_loss": -3.853771686553955, "global_step": 3026, "epoch": 72} {"train_loss": -3.742377996444702, "global_step": 3027, "epoch": 72} {"train_loss": -3.8301196098327637, "global_step": 3028, "epoch": 72} {"train_loss": -3.9773788452148438, "global_step": 3029, "epoch": 72} {"train_loss": -3.797391891479492, "global_step": 3030, "epoch": 72} {"train_loss": -3.8544530868530273, "global_step": 3031, "epoch": 72} {"train_loss": -3.8616857528686523, "global_step": 3032, "epoch": 72} {"train_loss": -3.754301071166992, "global_step": 3033, "epoch": 72} {"train_loss": -3.9019155502319336, "global_step": 3034, "epoch": 72} {"train_loss": -3.736624240875244, "global_step": 3035, "epoch": 72} {"train_loss": -3.6299796104431152, "global_step": 3036, "epoch": 72} {"train_loss": -3.9087119102478027, "global_step": 3037, "epoch": 72} {"train_loss": -3.755218029022217, "global_step": 3038, "epoch": 72} {"train_loss": -3.8656463623046875, "global_step": 3039, "epoch": 72} {"train_loss": -4.001551628112793, "global_step": 3040, "epoch": 72} {"train_loss": -3.6801276206970215, "global_step": 3041, "epoch": 72} {"train_loss": -3.8058080673217773, "global_step": 3042, "epoch": 72} {"train_loss": -3.911496639251709, "global_step": 3043, "epoch": 72} {"train_loss": -3.714353561401367, "global_step": 3044, "epoch": 72} {"train_loss": -3.892997980117798, "global_step": 3045, "epoch": 72} {"train_loss": -3.925767421722412, "global_step": 3046, "epoch": 72} {"train_loss": -3.767064332962036, "global_step": 3047, "epoch": 72} {"train_loss": -3.809849262237549, "global_step": 3048, "epoch": 72} {"train_loss": -3.9084248542785645, "global_step": 3049, "epoch": 72} {"train_loss": -4.045401096343994, "global_step": 3050, "epoch": 72} {"train_loss": -3.8652849197387695, "global_step": 3051, "epoch": 72} {"train_loss": -3.9036200046539307, "global_step": 3052, "epoch": 72} {"train_loss": -3.91416597366333, "global_step": 3053, "epoch": 72} {"train_loss": -3.8617746829986572, "global_step": 3054, "epoch": 72} {"train_loss": -3.8890864849090576, "global_step": 3055, "epoch": 72} {"train_loss": -3.9201369285583496, "global_step": 3056, "epoch": 72} {"train_loss": -4.0146636962890625, "global_step": 3057, "epoch": 72} {"train_loss": -3.922820568084717, "global_step": 3058, "epoch": 72} {"train_loss": -3.8579518795013428, "global_step": 3059, "epoch": 72} {"train_loss": -4.018465042114258, "global_step": 3060, "epoch": 72} {"train_loss": -3.9361984729766846, "global_step": 3061, "epoch": 72} {"train_loss": -3.7935140132904053, "global_step": 3062, "epoch": 72} {"train_loss": -4.011602878570557, "global_step": 3063, "epoch": 72} {"train_loss": -3.944187641143799, "global_step": 3064, "epoch": 72} {"train_loss": -3.8670792068753923, "global_step": 3065, "epoch": 72, "val_loss": 164642.1875} {"train_loss": -3.8459205627441406, "global_step": 3066, "epoch": 73} {"train_loss": -4.137401580810547, "global_step": 3067, "epoch": 73} {"train_loss": -3.82542085647583, "global_step": 3068, "epoch": 73} {"train_loss": -3.939542531967163, "global_step": 3069, "epoch": 73} {"train_loss": -3.8854570388793945, "global_step": 3070, "epoch": 73} {"train_loss": -3.9174020290374756, "global_step": 3071, "epoch": 73} {"train_loss": -3.8516721725463867, "global_step": 3072, "epoch": 73} {"train_loss": -3.8205182552337646, "global_step": 3073, "epoch": 73} {"train_loss": -3.9141244888305664, "global_step": 3074, "epoch": 73} {"train_loss": -3.927255868911743, "global_step": 3075, "epoch": 73} {"train_loss": -3.923781633377075, "global_step": 3076, "epoch": 73} {"train_loss": -3.7788279056549072, "global_step": 3077, "epoch": 73} {"train_loss": -3.8715097904205322, "global_step": 3078, "epoch": 73} {"train_loss": -3.7239718437194824, "global_step": 3079, "epoch": 73} {"train_loss": -3.8812685012817383, "global_step": 3080, "epoch": 73} {"train_loss": -3.9078850746154785, "global_step": 3081, "epoch": 73} {"train_loss": -3.765042543411255, "global_step": 3082, "epoch": 73} {"train_loss": -3.9886765480041504, "global_step": 3083, "epoch": 73} {"train_loss": -3.8022871017456055, "global_step": 3084, "epoch": 73} {"train_loss": -3.6691372394561768, "global_step": 3085, "epoch": 73} {"train_loss": -3.8114137649536133, "global_step": 3086, "epoch": 73} {"train_loss": -3.870272397994995, "global_step": 3087, "epoch": 73} {"train_loss": -3.784956216812134, "global_step": 3088, "epoch": 73} {"train_loss": -3.838691473007202, "global_step": 3089, "epoch": 73} {"train_loss": -3.93127703666687, "global_step": 3090, "epoch": 73} {"train_loss": -3.943460464477539, "global_step": 3091, "epoch": 73} {"train_loss": -3.846302032470703, "global_step": 3092, "epoch": 73} {"train_loss": -4.003022193908691, "global_step": 3093, "epoch": 73} {"train_loss": -3.894627809524536, "global_step": 3094, "epoch": 73} {"train_loss": -3.9558181762695312, "global_step": 3095, "epoch": 73} {"train_loss": -3.808718204498291, "global_step": 3096, "epoch": 73} {"train_loss": -3.9484500885009766, "global_step": 3097, "epoch": 73} {"train_loss": -4.057443618774414, "global_step": 3098, "epoch": 73} {"train_loss": -3.8429417610168457, "global_step": 3099, "epoch": 73} {"train_loss": -3.941283702850342, "global_step": 3100, "epoch": 73} {"train_loss": -3.838310718536377, "global_step": 3101, "epoch": 73} {"train_loss": -4.017670154571533, "global_step": 3102, "epoch": 73} {"train_loss": -3.8182504177093506, "global_step": 3103, "epoch": 73} {"train_loss": -4.106575965881348, "global_step": 3104, "epoch": 73} {"train_loss": -3.9498391151428223, "global_step": 3105, "epoch": 73} {"train_loss": -3.8478636741638184, "global_step": 3106, "epoch": 73} {"train_loss": -3.8934041602270946, "global_step": 3107, "epoch": 73, "val_loss": 162206.09375} {"train_loss": -3.9634339809417725, "global_step": 3108, "epoch": 74} {"train_loss": -4.006547927856445, "global_step": 3109, "epoch": 74} {"train_loss": -3.8402936458587646, "global_step": 3110, "epoch": 74} {"train_loss": -3.989722728729248, "global_step": 3111, "epoch": 74} {"train_loss": -3.8671326637268066, "global_step": 3112, "epoch": 74} {"train_loss": -3.854565143585205, "global_step": 3113, "epoch": 74} {"train_loss": -3.861281394958496, "global_step": 3114, "epoch": 74} {"train_loss": -3.861269474029541, "global_step": 3115, "epoch": 74} {"train_loss": -3.9652719497680664, "global_step": 3116, "epoch": 74} {"train_loss": -3.9230451583862305, "global_step": 3117, "epoch": 74} {"train_loss": -3.922487735748291, "global_step": 3118, "epoch": 74} {"train_loss": -3.9433434009552, "global_step": 3119, "epoch": 74} {"train_loss": -4.040691375732422, "global_step": 3120, "epoch": 74} {"train_loss": -3.8230643272399902, "global_step": 3121, "epoch": 74} {"train_loss": -3.807790994644165, "global_step": 3122, "epoch": 74} {"train_loss": -3.8915936946868896, "global_step": 3123, "epoch": 74} {"train_loss": -3.823697328567505, "global_step": 3124, "epoch": 74} {"train_loss": -3.859762191772461, "global_step": 3125, "epoch": 74} {"train_loss": -4.000253200531006, "global_step": 3126, "epoch": 74} {"train_loss": -3.9252753257751465, "global_step": 3127, "epoch": 74} {"train_loss": -3.8363828659057617, "global_step": 3128, "epoch": 74} {"train_loss": -3.8908772468566895, "global_step": 3129, "epoch": 74} {"train_loss": -4.1108222007751465, "global_step": 3130, "epoch": 74} {"train_loss": -3.8565711975097656, "global_step": 3131, "epoch": 74} {"train_loss": -3.8712635040283203, "global_step": 3132, "epoch": 74} {"train_loss": -3.9909605979919434, "global_step": 3133, "epoch": 74} {"train_loss": -3.9291484355926514, "global_step": 3134, "epoch": 74} {"train_loss": -3.939591407775879, "global_step": 3135, "epoch": 74} {"train_loss": -4.098004341125488, "global_step": 3136, "epoch": 74} {"train_loss": -3.914964437484741, "global_step": 3137, "epoch": 74} {"train_loss": -3.840303897857666, "global_step": 3138, "epoch": 74} {"train_loss": -3.9820804595947266, "global_step": 3139, "epoch": 74} {"train_loss": -3.865662097930908, "global_step": 3140, "epoch": 74} {"train_loss": -3.885104179382324, "global_step": 3141, "epoch": 74} {"train_loss": -3.870255470275879, "global_step": 3142, "epoch": 74} {"train_loss": -3.8928561210632324, "global_step": 3143, "epoch": 74} {"train_loss": -4.063942909240723, "global_step": 3144, "epoch": 74} {"train_loss": -3.786238670349121, "global_step": 3145, "epoch": 74} {"train_loss": -3.9410946369171143, "global_step": 3146, "epoch": 74} {"train_loss": -3.9517769813537598, "global_step": 3147, "epoch": 74} {"train_loss": -4.076889991760254, "global_step": 3148, "epoch": 74} {"train_loss": -3.921869885353815, "global_step": 3149, "epoch": 74, "val_loss": 160147.828125} {"train_loss": -4.02273416519165, "global_step": 3150, "epoch": 75} {"train_loss": -3.9207935333251953, "global_step": 3151, "epoch": 75} {"train_loss": -3.7815017700195312, "global_step": 3152, "epoch": 75} {"train_loss": -4.010299205780029, "global_step": 3153, "epoch": 75} {"train_loss": -4.090207099914551, "global_step": 3154, "epoch": 75} {"train_loss": -3.875765800476074, "global_step": 3155, "epoch": 75} {"train_loss": -3.936699867248535, "global_step": 3156, "epoch": 75} {"train_loss": -4.103611469268799, "global_step": 3157, "epoch": 75} {"train_loss": -3.8461828231811523, "global_step": 3158, "epoch": 75} {"train_loss": -4.073427677154541, "global_step": 3159, "epoch": 75} {"train_loss": -3.9697835445404053, "global_step": 3160, "epoch": 75} {"train_loss": -3.989990472793579, "global_step": 3161, "epoch": 75} {"train_loss": -3.997607707977295, "global_step": 3162, "epoch": 75} {"train_loss": -4.138167381286621, "global_step": 3163, "epoch": 75} {"train_loss": -4.016631126403809, "global_step": 3164, "epoch": 75} {"train_loss": -3.977686882019043, "global_step": 3165, "epoch": 75} {"train_loss": -3.9271738529205322, "global_step": 3166, "epoch": 75} {"train_loss": -4.12183141708374, "global_step": 3167, "epoch": 75} {"train_loss": -3.9882800579071045, "global_step": 3168, "epoch": 75} {"train_loss": -3.840275526046753, "global_step": 3169, "epoch": 75} {"train_loss": -3.994429349899292, "global_step": 3170, "epoch": 75} {"train_loss": -3.8868942260742188, "global_step": 3171, "epoch": 75} {"train_loss": -3.973064422607422, "global_step": 3172, "epoch": 75} {"train_loss": -3.951439619064331, "global_step": 3173, "epoch": 75} {"train_loss": -4.14455509185791, "global_step": 3174, "epoch": 75} {"train_loss": -3.9176228046417236, "global_step": 3175, "epoch": 75} {"train_loss": -3.9438767433166504, "global_step": 3176, "epoch": 75} {"train_loss": -4.013721466064453, "global_step": 3177, "epoch": 75} {"train_loss": -4.003859519958496, "global_step": 3178, "epoch": 75} {"train_loss": -3.8380415439605713, "global_step": 3179, "epoch": 75} {"train_loss": -3.8213045597076416, "global_step": 3180, "epoch": 75} {"train_loss": -4.062952041625977, "global_step": 3181, "epoch": 75} {"train_loss": -3.910308599472046, "global_step": 3182, "epoch": 75} {"train_loss": -3.8819663524627686, "global_step": 3183, "epoch": 75} {"train_loss": -3.9658102989196777, "global_step": 3184, "epoch": 75} {"train_loss": -3.946124792098999, "global_step": 3185, "epoch": 75} {"train_loss": -3.9376397132873535, "global_step": 3186, "epoch": 75} {"train_loss": -3.9153101444244385, "global_step": 3187, "epoch": 75} {"train_loss": -3.909708261489868, "global_step": 3188, "epoch": 75} {"train_loss": -3.9634480476379395, "global_step": 3189, "epoch": 75} {"train_loss": -4.053298473358154, "global_step": 3190, "epoch": 75} {"train_loss": -3.9634139935175576, "global_step": 3191, "epoch": 75, "val_loss": 157063.828125} {"train_loss": -3.9002065658569336, "global_step": 3192, "epoch": 76} {"train_loss": -4.07194709777832, "global_step": 3193, "epoch": 76} {"train_loss": -3.9828317165374756, "global_step": 3194, "epoch": 76} {"train_loss": -3.9877114295959473, "global_step": 3195, "epoch": 76} {"train_loss": -3.8757920265197754, "global_step": 3196, "epoch": 76} {"train_loss": -3.8337693214416504, "global_step": 3197, "epoch": 76} {"train_loss": -4.109434127807617, "global_step": 3198, "epoch": 76} {"train_loss": -3.9132113456726074, "global_step": 3199, "epoch": 76} {"train_loss": -3.9620842933654785, "global_step": 3200, "epoch": 76} {"train_loss": -3.7805838584899902, "global_step": 3201, "epoch": 76} {"train_loss": -4.053553104400635, "global_step": 3202, "epoch": 76} {"train_loss": -4.172019004821777, "global_step": 3203, "epoch": 76} {"train_loss": -4.011404991149902, "global_step": 3204, "epoch": 76} {"train_loss": -3.7383315563201904, "global_step": 3205, "epoch": 76} {"train_loss": -4.143802642822266, "global_step": 3206, "epoch": 76} {"train_loss": -4.038983345031738, "global_step": 3207, "epoch": 76} {"train_loss": -3.9100356101989746, "global_step": 3208, "epoch": 76} {"train_loss": -3.7961533069610596, "global_step": 3209, "epoch": 76} {"train_loss": -3.99965238571167, "global_step": 3210, "epoch": 76} {"train_loss": -3.915821075439453, "global_step": 3211, "epoch": 76} {"train_loss": -3.7636935710906982, "global_step": 3212, "epoch": 76} {"train_loss": -3.920788049697876, "global_step": 3213, "epoch": 76} {"train_loss": -3.954956531524658, "global_step": 3214, "epoch": 76} {"train_loss": -3.822080612182617, "global_step": 3215, "epoch": 76} {"train_loss": -3.9897093772888184, "global_step": 3216, "epoch": 76} {"train_loss": -3.8455586433410645, "global_step": 3217, "epoch": 76} {"train_loss": -3.9432122707366943, "global_step": 3218, "epoch": 76} {"train_loss": -3.9552056789398193, "global_step": 3219, "epoch": 76} {"train_loss": -3.9998855590820312, "global_step": 3220, "epoch": 76} {"train_loss": -4.072603225708008, "global_step": 3221, "epoch": 76} {"train_loss": -4.115198612213135, "global_step": 3222, "epoch": 76} {"train_loss": -4.076165676116943, "global_step": 3223, "epoch": 76} {"train_loss": -3.878352165222168, "global_step": 3224, "epoch": 76} {"train_loss": -3.880763530731201, "global_step": 3225, "epoch": 76} {"train_loss": -3.939265251159668, "global_step": 3226, "epoch": 76} {"train_loss": -4.0328216552734375, "global_step": 3227, "epoch": 76} {"train_loss": -3.923064708709717, "global_step": 3228, "epoch": 76} {"train_loss": -3.8881235122680664, "global_step": 3229, "epoch": 76} {"train_loss": -4.001586437225342, "global_step": 3230, "epoch": 76} {"train_loss": -3.963812828063965, "global_step": 3231, "epoch": 76} {"train_loss": -3.946471929550171, "global_step": 3232, "epoch": 76} {"train_loss": -3.951759707360041, "global_step": 3233, "epoch": 76, "val_loss": 154372.21875} {"train_loss": -3.9973864555358887, "global_step": 3234, "epoch": 77} {"train_loss": -4.048018455505371, "global_step": 3235, "epoch": 77} {"train_loss": -3.8409693241119385, "global_step": 3236, "epoch": 77} {"train_loss": -3.9141807556152344, "global_step": 3237, "epoch": 77} {"train_loss": -4.055620193481445, "global_step": 3238, "epoch": 77} {"train_loss": -4.006946563720703, "global_step": 3239, "epoch": 77} {"train_loss": -3.9485292434692383, "global_step": 3240, "epoch": 77} {"train_loss": -3.8261656761169434, "global_step": 3241, "epoch": 77} {"train_loss": -4.016286849975586, "global_step": 3242, "epoch": 77} {"train_loss": -4.001258850097656, "global_step": 3243, "epoch": 77} {"train_loss": -3.8528523445129395, "global_step": 3244, "epoch": 77} {"train_loss": -3.9569814205169678, "global_step": 3245, "epoch": 77} {"train_loss": -3.9689629077911377, "global_step": 3246, "epoch": 77} {"train_loss": -3.7050793170928955, "global_step": 3247, "epoch": 77} {"train_loss": -3.9042458534240723, "global_step": 3248, "epoch": 77} {"train_loss": -3.773167371749878, "global_step": 3249, "epoch": 77} {"train_loss": -3.967637777328491, "global_step": 3250, "epoch": 77} {"train_loss": -4.033627510070801, "global_step": 3251, "epoch": 77} {"train_loss": -3.9316821098327637, "global_step": 3252, "epoch": 77} {"train_loss": -4.031373023986816, "global_step": 3253, "epoch": 77} {"train_loss": -3.9911205768585205, "global_step": 3254, "epoch": 77} {"train_loss": -4.008404731750488, "global_step": 3255, "epoch": 77} {"train_loss": -3.8574376106262207, "global_step": 3256, "epoch": 77} {"train_loss": -3.984731674194336, "global_step": 3257, "epoch": 77} {"train_loss": -3.8126258850097656, "global_step": 3258, "epoch": 77} {"train_loss": -3.959066152572632, "global_step": 3259, "epoch": 77} {"train_loss": -3.986851692199707, "global_step": 3260, "epoch": 77} {"train_loss": -3.9373764991760254, "global_step": 3261, "epoch": 77} {"train_loss": -4.051294803619385, "global_step": 3262, "epoch": 77} {"train_loss": -4.092846870422363, "global_step": 3263, "epoch": 77} {"train_loss": -4.038963317871094, "global_step": 3264, "epoch": 77} {"train_loss": -3.914172410964966, "global_step": 3265, "epoch": 77} {"train_loss": -4.072516918182373, "global_step": 3266, "epoch": 77} {"train_loss": -3.9647269248962402, "global_step": 3267, "epoch": 77} {"train_loss": -4.084808349609375, "global_step": 3268, "epoch": 77} {"train_loss": -4.141745567321777, "global_step": 3269, "epoch": 77} {"train_loss": -4.091434478759766, "global_step": 3270, "epoch": 77} {"train_loss": -3.960524082183838, "global_step": 3271, "epoch": 77} {"train_loss": -3.9754691123962402, "global_step": 3272, "epoch": 77} {"train_loss": -4.022747039794922, "global_step": 3273, "epoch": 77} {"train_loss": -4.062639236450195, "global_step": 3274, "epoch": 77} {"train_loss": -3.971295089948745, "global_step": 3275, "epoch": 77, "val_loss": 151041.296875} {"train_loss": -4.096334457397461, "global_step": 3276, "epoch": 78} {"train_loss": -3.896794319152832, "global_step": 3277, "epoch": 78} {"train_loss": -3.912118434906006, "global_step": 3278, "epoch": 78} {"train_loss": -3.9387576580047607, "global_step": 3279, "epoch": 78} {"train_loss": -3.801588535308838, "global_step": 3280, "epoch": 78} {"train_loss": -3.958486318588257, "global_step": 3281, "epoch": 78} {"train_loss": -4.01992130279541, "global_step": 3282, "epoch": 78} {"train_loss": -3.7256991863250732, "global_step": 3283, "epoch": 78} {"train_loss": -3.9011788368225098, "global_step": 3284, "epoch": 78} {"train_loss": -3.9071102142333984, "global_step": 3285, "epoch": 78} {"train_loss": -3.8105785846710205, "global_step": 3286, "epoch": 78} {"train_loss": -3.884469509124756, "global_step": 3287, "epoch": 78} {"train_loss": -3.895228862762451, "global_step": 3288, "epoch": 78} {"train_loss": -3.726243495941162, "global_step": 3289, "epoch": 78} {"train_loss": -4.100485324859619, "global_step": 3290, "epoch": 78} {"train_loss": -3.828310489654541, "global_step": 3291, "epoch": 78} {"train_loss": -3.8425145149230957, "global_step": 3292, "epoch": 78} {"train_loss": -3.9598217010498047, "global_step": 3293, "epoch": 78} {"train_loss": -3.7055811882019043, "global_step": 3294, "epoch": 78} {"train_loss": -4.05995512008667, "global_step": 3295, "epoch": 78} {"train_loss": -3.862415075302124, "global_step": 3296, "epoch": 78} {"train_loss": -3.8706955909729004, "global_step": 3297, "epoch": 78} {"train_loss": -4.04699182510376, "global_step": 3298, "epoch": 78} {"train_loss": -3.9460813999176025, "global_step": 3299, "epoch": 78} {"train_loss": -4.183938980102539, "global_step": 3300, "epoch": 78} {"train_loss": -4.075620651245117, "global_step": 3301, "epoch": 78} {"train_loss": -4.038424491882324, "global_step": 3302, "epoch": 78} {"train_loss": -3.9467697143554688, "global_step": 3303, "epoch": 78} {"train_loss": -3.904151439666748, "global_step": 3304, "epoch": 78} {"train_loss": -4.031048774719238, "global_step": 3305, "epoch": 78} {"train_loss": -3.88291335105896, "global_step": 3306, "epoch": 78} {"train_loss": -3.9746508598327637, "global_step": 3307, "epoch": 78} {"train_loss": -3.7457408905029297, "global_step": 3308, "epoch": 78} {"train_loss": -4.112873077392578, "global_step": 3309, "epoch": 78} {"train_loss": -3.92633056640625, "global_step": 3310, "epoch": 78} {"train_loss": -4.003822326660156, "global_step": 3311, "epoch": 78} {"train_loss": -3.93973445892334, "global_step": 3312, "epoch": 78} {"train_loss": -4.031502723693848, "global_step": 3313, "epoch": 78} {"train_loss": -3.821284294128418, "global_step": 3314, "epoch": 78} {"train_loss": -3.9257521629333496, "global_step": 3315, "epoch": 78} {"train_loss": -3.9012632369995117, "global_step": 3316, "epoch": 78} {"train_loss": -3.931221541904268, "global_step": 3317, "epoch": 78, "val_loss": 149110.296875} {"train_loss": -4.014558792114258, "global_step": 3318, "epoch": 79} {"train_loss": -3.9556241035461426, "global_step": 3319, "epoch": 79} {"train_loss": -4.082651138305664, "global_step": 3320, "epoch": 79} {"train_loss": -4.112235069274902, "global_step": 3321, "epoch": 79} {"train_loss": -4.039344310760498, "global_step": 3322, "epoch": 79} {"train_loss": -3.9240059852600098, "global_step": 3323, "epoch": 79} {"train_loss": -4.033092975616455, "global_step": 3324, "epoch": 79} {"train_loss": -4.025105953216553, "global_step": 3325, "epoch": 79} {"train_loss": -3.996610403060913, "global_step": 3326, "epoch": 79} {"train_loss": -3.9622740745544434, "global_step": 3327, "epoch": 79} {"train_loss": -4.0539350509643555, "global_step": 3328, "epoch": 79} {"train_loss": -4.085812568664551, "global_step": 3329, "epoch": 79} {"train_loss": -3.9707651138305664, "global_step": 3330, "epoch": 79} {"train_loss": -3.9072277545928955, "global_step": 3331, "epoch": 79} {"train_loss": -3.9652419090270996, "global_step": 3332, "epoch": 79} {"train_loss": -3.999640941619873, "global_step": 3333, "epoch": 79} {"train_loss": -4.073427200317383, "global_step": 3334, "epoch": 79} {"train_loss": -4.046489715576172, "global_step": 3335, "epoch": 79} {"train_loss": -3.9403319358825684, "global_step": 3336, "epoch": 79} {"train_loss": -4.044090747833252, "global_step": 3337, "epoch": 79} {"train_loss": -3.937274932861328, "global_step": 3338, "epoch": 79} {"train_loss": -4.001867294311523, "global_step": 3339, "epoch": 79} {"train_loss": -3.8908848762512207, "global_step": 3340, "epoch": 79} {"train_loss": -4.093928337097168, "global_step": 3341, "epoch": 79} {"train_loss": -3.829564094543457, "global_step": 3342, "epoch": 79} {"train_loss": -3.869935989379883, "global_step": 3343, "epoch": 79} {"train_loss": -3.846989870071411, "global_step": 3344, "epoch": 79} {"train_loss": -4.097062110900879, "global_step": 3345, "epoch": 79} {"train_loss": -4.130441665649414, "global_step": 3346, "epoch": 79} {"train_loss": -4.015998840332031, "global_step": 3347, "epoch": 79} {"train_loss": -4.054679870605469, "global_step": 3348, "epoch": 79} {"train_loss": -4.019678115844727, "global_step": 3349, "epoch": 79} {"train_loss": -3.9650535583496094, "global_step": 3350, "epoch": 79} {"train_loss": -4.086261749267578, "global_step": 3351, "epoch": 79} {"train_loss": -4.027224063873291, "global_step": 3352, "epoch": 79} {"train_loss": -3.990976333618164, "global_step": 3353, "epoch": 79} {"train_loss": -3.983447790145874, "global_step": 3354, "epoch": 79} {"train_loss": -4.1398234367370605, "global_step": 3355, "epoch": 79} {"train_loss": -4.104691028594971, "global_step": 3356, "epoch": 79} {"train_loss": -4.029716968536377, "global_step": 3357, "epoch": 79} {"train_loss": -4.200678825378418, "global_step": 3358, "epoch": 79} {"train_loss": -4.012190370332627, "global_step": 3359, "epoch": 79, "val_loss": 150319.703125} {"train_loss": -3.9208860397338867, "global_step": 3360, "epoch": 80} {"train_loss": -4.204799175262451, "global_step": 3361, "epoch": 80} {"train_loss": -4.000444412231445, "global_step": 3362, "epoch": 80} {"train_loss": -4.183907508850098, "global_step": 3363, "epoch": 80} {"train_loss": -4.023304462432861, "global_step": 3364, "epoch": 80} {"train_loss": -3.90643310546875, "global_step": 3365, "epoch": 80} {"train_loss": -4.1018171310424805, "global_step": 3366, "epoch": 80} {"train_loss": -4.22300910949707, "global_step": 3367, "epoch": 80} {"train_loss": -4.047539710998535, "global_step": 3368, "epoch": 80} {"train_loss": -4.183497428894043, "global_step": 3369, "epoch": 80} {"train_loss": -4.167102813720703, "global_step": 3370, "epoch": 80} {"train_loss": -4.004555702209473, "global_step": 3371, "epoch": 80} {"train_loss": -3.9583358764648438, "global_step": 3372, "epoch": 80} {"train_loss": -4.062806129455566, "global_step": 3373, "epoch": 80} {"train_loss": -4.0453596115112305, "global_step": 3374, "epoch": 80} {"train_loss": -4.122768402099609, "global_step": 3375, "epoch": 80} {"train_loss": -3.877406120300293, "global_step": 3376, "epoch": 80} {"train_loss": -4.033287048339844, "global_step": 3377, "epoch": 80} {"train_loss": -3.939950466156006, "global_step": 3378, "epoch": 80} {"train_loss": -3.770801305770874, "global_step": 3379, "epoch": 80} {"train_loss": -4.065325736999512, "global_step": 3380, "epoch": 80} {"train_loss": -3.99086332321167, "global_step": 3381, "epoch": 80} {"train_loss": -3.94657826423645, "global_step": 3382, "epoch": 80} {"train_loss": -4.062471389770508, "global_step": 3383, "epoch": 80} {"train_loss": -4.016053199768066, "global_step": 3384, "epoch": 80} {"train_loss": -3.91614031791687, "global_step": 3385, "epoch": 80} {"train_loss": -4.05638313293457, "global_step": 3386, "epoch": 80} {"train_loss": -4.028426170349121, "global_step": 3387, "epoch": 80} {"train_loss": -3.8745837211608887, "global_step": 3388, "epoch": 80} {"train_loss": -4.146249771118164, "global_step": 3389, "epoch": 80} {"train_loss": -4.034609794616699, "global_step": 3390, "epoch": 80} {"train_loss": -4.048892498016357, "global_step": 3391, "epoch": 80} {"train_loss": -4.01588773727417, "global_step": 3392, "epoch": 80} {"train_loss": -4.114740371704102, "global_step": 3393, "epoch": 80} {"train_loss": -4.176440715789795, "global_step": 3394, "epoch": 80} {"train_loss": -4.119531154632568, "global_step": 3395, "epoch": 80} {"train_loss": -4.084037780761719, "global_step": 3396, "epoch": 80} {"train_loss": -4.158436298370361, "global_step": 3397, "epoch": 80} {"train_loss": -4.161543846130371, "global_step": 3398, "epoch": 80} {"train_loss": -4.0006537437438965, "global_step": 3399, "epoch": 80} {"train_loss": -4.151880264282227, "global_step": 3400, "epoch": 80} {"train_loss": -4.0447962284088135, "global_step": 3401, "epoch": 80, "val_loss": 145842.4375} {"train_loss": -4.065984725952148, "global_step": 3402, "epoch": 81} {"train_loss": -4.155872344970703, "global_step": 3403, "epoch": 81} {"train_loss": -4.079916954040527, "global_step": 3404, "epoch": 81} {"train_loss": -4.05922794342041, "global_step": 3405, "epoch": 81} {"train_loss": -4.084498882293701, "global_step": 3406, "epoch": 81} {"train_loss": -4.025890350341797, "global_step": 3407, "epoch": 81} {"train_loss": -4.000369548797607, "global_step": 3408, "epoch": 81} {"train_loss": -3.9061763286590576, "global_step": 3409, "epoch": 81} {"train_loss": -4.0121636390686035, "global_step": 3410, "epoch": 81} {"train_loss": -4.205554962158203, "global_step": 3411, "epoch": 81} {"train_loss": -4.020791053771973, "global_step": 3412, "epoch": 81} {"train_loss": -3.735382080078125, "global_step": 3413, "epoch": 81} {"train_loss": -4.073420524597168, "global_step": 3414, "epoch": 81} {"train_loss": -3.7503976821899414, "global_step": 3415, "epoch": 81} {"train_loss": -3.8151376247406006, "global_step": 3416, "epoch": 81} {"train_loss": -3.9115395545959473, "global_step": 3417, "epoch": 81} {"train_loss": -3.9704957008361816, "global_step": 3418, "epoch": 81} {"train_loss": -3.849705219268799, "global_step": 3419, "epoch": 81} {"train_loss": -3.918262004852295, "global_step": 3420, "epoch": 81} {"train_loss": -3.9320898056030273, "global_step": 3421, "epoch": 81} {"train_loss": -3.937284469604492, "global_step": 3422, "epoch": 81} {"train_loss": -4.117985248565674, "global_step": 3423, "epoch": 81} {"train_loss": -4.0174174308776855, "global_step": 3424, "epoch": 81} {"train_loss": -3.9690418243408203, "global_step": 3425, "epoch": 81} {"train_loss": -4.104223728179932, "global_step": 3426, "epoch": 81} {"train_loss": -3.9877891540527344, "global_step": 3427, "epoch": 81} {"train_loss": -3.9903268814086914, "global_step": 3428, "epoch": 81} {"train_loss": -4.13908576965332, "global_step": 3429, "epoch": 81} {"train_loss": -3.973560333251953, "global_step": 3430, "epoch": 81} {"train_loss": -4.096138954162598, "global_step": 3431, "epoch": 81} {"train_loss": -4.125976085662842, "global_step": 3432, "epoch": 81} {"train_loss": -4.202443599700928, "global_step": 3433, "epoch": 81} {"train_loss": -4.086187362670898, "global_step": 3434, "epoch": 81} {"train_loss": -4.000292778015137, "global_step": 3435, "epoch": 81} {"train_loss": -4.029666900634766, "global_step": 3436, "epoch": 81} {"train_loss": -3.968191146850586, "global_step": 3437, "epoch": 81} {"train_loss": -4.033058166503906, "global_step": 3438, "epoch": 81} {"train_loss": -4.0279364585876465, "global_step": 3439, "epoch": 81} {"train_loss": -4.064545154571533, "global_step": 3440, "epoch": 81} {"train_loss": -3.946300983428955, "global_step": 3441, "epoch": 81} {"train_loss": -4.060967445373535, "global_step": 3442, "epoch": 81} {"train_loss": -4.012124742780413, "global_step": 3443, "epoch": 81, "val_loss": 144008.8125} {"train_loss": -4.130003929138184, "global_step": 3444, "epoch": 82} {"train_loss": -4.096743583679199, "global_step": 3445, "epoch": 82} {"train_loss": -4.2361040115356445, "global_step": 3446, "epoch": 82} {"train_loss": -4.165003776550293, "global_step": 3447, "epoch": 82} {"train_loss": -4.042545318603516, "global_step": 3448, "epoch": 82} {"train_loss": -4.101326942443848, "global_step": 3449, "epoch": 82} {"train_loss": -4.129812717437744, "global_step": 3450, "epoch": 82} {"train_loss": -4.168810844421387, "global_step": 3451, "epoch": 82} {"train_loss": -4.099702835083008, "global_step": 3452, "epoch": 82} {"train_loss": -4.055069446563721, "global_step": 3453, "epoch": 82} {"train_loss": -4.079679012298584, "global_step": 3454, "epoch": 82} {"train_loss": -4.1977362632751465, "global_step": 3455, "epoch": 82} {"train_loss": -4.204715251922607, "global_step": 3456, "epoch": 82} {"train_loss": -3.9329066276550293, "global_step": 3457, "epoch": 82} {"train_loss": -4.109081268310547, "global_step": 3458, "epoch": 82} {"train_loss": -4.021383285522461, "global_step": 3459, "epoch": 82} {"train_loss": -4.110529899597168, "global_step": 3460, "epoch": 82} {"train_loss": -4.063258171081543, "global_step": 3461, "epoch": 82} {"train_loss": -4.013962745666504, "global_step": 3462, "epoch": 82} {"train_loss": -4.051730155944824, "global_step": 3463, "epoch": 82} {"train_loss": -4.182350158691406, "global_step": 3464, "epoch": 82} {"train_loss": -4.192351341247559, "global_step": 3465, "epoch": 82} {"train_loss": -3.948538303375244, "global_step": 3466, "epoch": 82} {"train_loss": -4.142511367797852, "global_step": 3467, "epoch": 82} {"train_loss": -4.193838119506836, "global_step": 3468, "epoch": 82} {"train_loss": -4.046740531921387, "global_step": 3469, "epoch": 82} {"train_loss": -3.8951492309570312, "global_step": 3470, "epoch": 82} {"train_loss": -4.045788288116455, "global_step": 3471, "epoch": 82} {"train_loss": -3.792362689971924, "global_step": 3472, "epoch": 82} {"train_loss": -3.928297281265259, "global_step": 3473, "epoch": 82} {"train_loss": -3.6977410316467285, "global_step": 3474, "epoch": 82} {"train_loss": -3.7919256687164307, "global_step": 3475, "epoch": 82} {"train_loss": -3.896766185760498, "global_step": 3476, "epoch": 82} {"train_loss": -3.8449854850769043, "global_step": 3477, "epoch": 82} {"train_loss": -4.140746593475342, "global_step": 3478, "epoch": 82} {"train_loss": -3.979511260986328, "global_step": 3479, "epoch": 82} {"train_loss": -3.929746627807617, "global_step": 3480, "epoch": 82} {"train_loss": -3.968524217605591, "global_step": 3481, "epoch": 82} {"train_loss": -4.07114315032959, "global_step": 3482, "epoch": 82} {"train_loss": -3.7272534370422363, "global_step": 3483, "epoch": 82} {"train_loss": -3.7963099479675293, "global_step": 3484, "epoch": 82} {"train_loss": -4.027109969229925, "global_step": 3485, "epoch": 82, "val_loss": 140815.21875} {"train_loss": -4.045537948608398, "global_step": 3486, "epoch": 83} {"train_loss": -3.911594867706299, "global_step": 3487, "epoch": 83} {"train_loss": -3.878115653991699, "global_step": 3488, "epoch": 83} {"train_loss": -4.102810382843018, "global_step": 3489, "epoch": 83} {"train_loss": -3.8774874210357666, "global_step": 3490, "epoch": 83} {"train_loss": -4.055609226226807, "global_step": 3491, "epoch": 83} {"train_loss": -3.960500955581665, "global_step": 3492, "epoch": 83} {"train_loss": -4.096461296081543, "global_step": 3493, "epoch": 83} {"train_loss": -3.914466381072998, "global_step": 3494, "epoch": 83} {"train_loss": -4.033182144165039, "global_step": 3495, "epoch": 83} {"train_loss": -4.050567626953125, "global_step": 3496, "epoch": 83} {"train_loss": -4.053793430328369, "global_step": 3497, "epoch": 83} {"train_loss": -4.148321151733398, "global_step": 3498, "epoch": 83} {"train_loss": -4.201623916625977, "global_step": 3499, "epoch": 83} {"train_loss": -4.064133644104004, "global_step": 3500, "epoch": 83} {"train_loss": -4.159634590148926, "global_step": 3501, "epoch": 83} {"train_loss": -4.128408432006836, "global_step": 3502, "epoch": 83} {"train_loss": -3.9618515968322754, "global_step": 3503, "epoch": 83} {"train_loss": -4.033189296722412, "global_step": 3504, "epoch": 83} {"train_loss": -4.136495590209961, "global_step": 3505, "epoch": 83} {"train_loss": -4.139928340911865, "global_step": 3506, "epoch": 83} {"train_loss": -4.00340461730957, "global_step": 3507, "epoch": 83} {"train_loss": -4.089973449707031, "global_step": 3508, "epoch": 83} {"train_loss": -3.9496984481811523, "global_step": 3509, "epoch": 83} {"train_loss": -4.058547019958496, "global_step": 3510, "epoch": 83} {"train_loss": -4.050239086151123, "global_step": 3511, "epoch": 83} {"train_loss": -4.09390115737915, "global_step": 3512, "epoch": 83} {"train_loss": -4.211182117462158, "global_step": 3513, "epoch": 83} {"train_loss": -4.1571044921875, "global_step": 3514, "epoch": 83} {"train_loss": -4.12269401550293, "global_step": 3515, "epoch": 83} {"train_loss": -4.12394905090332, "global_step": 3516, "epoch": 83} {"train_loss": -4.11287784576416, "global_step": 3517, "epoch": 83} {"train_loss": -4.10316276550293, "global_step": 3518, "epoch": 83} {"train_loss": -4.0062479972839355, "global_step": 3519, "epoch": 83} {"train_loss": -4.060945510864258, "global_step": 3520, "epoch": 83} {"train_loss": -4.105226993560791, "global_step": 3521, "epoch": 83} {"train_loss": -4.072848796844482, "global_step": 3522, "epoch": 83} {"train_loss": -4.093873023986816, "global_step": 3523, "epoch": 83} {"train_loss": -4.230842590332031, "global_step": 3524, "epoch": 83} {"train_loss": -4.164633750915527, "global_step": 3525, "epoch": 83} {"train_loss": -4.1388349533081055, "global_step": 3526, "epoch": 83} {"train_loss": -4.072455099650791, "global_step": 3527, "epoch": 83, "val_loss": 141840.8125} {"train_loss": -3.9207663536071777, "global_step": 3528, "epoch": 84} {"train_loss": -4.007041931152344, "global_step": 3529, "epoch": 84} {"train_loss": -4.171733856201172, "global_step": 3530, "epoch": 84} {"train_loss": -4.089969635009766, "global_step": 3531, "epoch": 84} {"train_loss": -3.971226215362549, "global_step": 3532, "epoch": 84} {"train_loss": -4.116776943206787, "global_step": 3533, "epoch": 84} {"train_loss": -4.296178817749023, "global_step": 3534, "epoch": 84} {"train_loss": -4.000627517700195, "global_step": 3535, "epoch": 84} {"train_loss": -4.222142219543457, "global_step": 3536, "epoch": 84} {"train_loss": -4.103794574737549, "global_step": 3537, "epoch": 84} {"train_loss": -4.156866073608398, "global_step": 3538, "epoch": 84} {"train_loss": -3.986884593963623, "global_step": 3539, "epoch": 84} {"train_loss": -4.109976768493652, "global_step": 3540, "epoch": 84} {"train_loss": -4.05836296081543, "global_step": 3541, "epoch": 84} {"train_loss": -4.03500509262085, "global_step": 3542, "epoch": 84} {"train_loss": -4.13760232925415, "global_step": 3543, "epoch": 84} {"train_loss": -4.157925605773926, "global_step": 3544, "epoch": 84} {"train_loss": -4.077005386352539, "global_step": 3545, "epoch": 84} {"train_loss": -4.153469085693359, "global_step": 3546, "epoch": 84} {"train_loss": -4.0775146484375, "global_step": 3547, "epoch": 84} {"train_loss": -4.159991264343262, "global_step": 3548, "epoch": 84} {"train_loss": -4.204523086547852, "global_step": 3549, "epoch": 84} {"train_loss": -4.283637523651123, "global_step": 3550, "epoch": 84} {"train_loss": -4.008852005004883, "global_step": 3551, "epoch": 84} {"train_loss": -4.12646484375, "global_step": 3552, "epoch": 84} {"train_loss": -3.9746227264404297, "global_step": 3553, "epoch": 84} {"train_loss": -3.8975672721862793, "global_step": 3554, "epoch": 84} {"train_loss": -3.9405994415283203, "global_step": 3555, "epoch": 84} {"train_loss": -3.68131160736084, "global_step": 3556, "epoch": 84} {"train_loss": -4.144237041473389, "global_step": 3557, "epoch": 84} {"train_loss": -3.7584853172302246, "global_step": 3558, "epoch": 84} {"train_loss": -3.765763282775879, "global_step": 3559, "epoch": 84} {"train_loss": -3.9270918369293213, "global_step": 3560, "epoch": 84} {"train_loss": -3.682887554168701, "global_step": 3561, "epoch": 84} {"train_loss": -4.218186378479004, "global_step": 3562, "epoch": 84} {"train_loss": -3.803039073944092, "global_step": 3563, "epoch": 84} {"train_loss": -3.901156425476074, "global_step": 3564, "epoch": 84} {"train_loss": -4.032822132110596, "global_step": 3565, "epoch": 84} {"train_loss": -3.9705967903137207, "global_step": 3566, "epoch": 84} {"train_loss": -3.884117841720581, "global_step": 3567, "epoch": 84} {"train_loss": -4.151669979095459, "global_step": 3568, "epoch": 84} {"train_loss": -4.034433523813884, "global_step": 3569, "epoch": 84, "val_loss": 137456.734375} {"train_loss": -4.021965503692627, "global_step": 3570, "epoch": 85} {"train_loss": -4.089001178741455, "global_step": 3571, "epoch": 85} {"train_loss": -4.067987442016602, "global_step": 3572, "epoch": 85} {"train_loss": -4.00662899017334, "global_step": 3573, "epoch": 85} {"train_loss": -4.078144073486328, "global_step": 3574, "epoch": 85} {"train_loss": -3.9449076652526855, "global_step": 3575, "epoch": 85} {"train_loss": -4.142618179321289, "global_step": 3576, "epoch": 85} {"train_loss": -4.088958740234375, "global_step": 3577, "epoch": 85} {"train_loss": -4.075421333312988, "global_step": 3578, "epoch": 85} {"train_loss": -3.979240894317627, "global_step": 3579, "epoch": 85} {"train_loss": -4.092352867126465, "global_step": 3580, "epoch": 85} {"train_loss": -4.067595481872559, "global_step": 3581, "epoch": 85} {"train_loss": -4.088387489318848, "global_step": 3582, "epoch": 85} {"train_loss": -4.029313564300537, "global_step": 3583, "epoch": 85} {"train_loss": -4.2822346687316895, "global_step": 3584, "epoch": 85} {"train_loss": -4.060782432556152, "global_step": 3585, "epoch": 85} {"train_loss": -4.210351943969727, "global_step": 3586, "epoch": 85} {"train_loss": -4.277290344238281, "global_step": 3587, "epoch": 85} {"train_loss": -3.9444384574890137, "global_step": 3588, "epoch": 85} {"train_loss": -4.263014793395996, "global_step": 3589, "epoch": 85} {"train_loss": -4.080853462219238, "global_step": 3590, "epoch": 85} {"train_loss": -4.2325849533081055, "global_step": 3591, "epoch": 85} {"train_loss": -4.0885396003723145, "global_step": 3592, "epoch": 85} {"train_loss": -4.277548313140869, "global_step": 3593, "epoch": 85} {"train_loss": -4.123493671417236, "global_step": 3594, "epoch": 85} {"train_loss": -4.23887825012207, "global_step": 3595, "epoch": 85} {"train_loss": -4.266295433044434, "global_step": 3596, "epoch": 85} {"train_loss": -4.22591495513916, "global_step": 3597, "epoch": 85} {"train_loss": -4.186826229095459, "global_step": 3598, "epoch": 85} {"train_loss": -4.153422832489014, "global_step": 3599, "epoch": 85} {"train_loss": -4.134028434753418, "global_step": 3600, "epoch": 85} {"train_loss": -4.183955192565918, "global_step": 3601, "epoch": 85} {"train_loss": -4.155077934265137, "global_step": 3602, "epoch": 85} {"train_loss": -3.9285330772399902, "global_step": 3603, "epoch": 85} {"train_loss": -4.193531036376953, "global_step": 3604, "epoch": 85} {"train_loss": -4.124396324157715, "global_step": 3605, "epoch": 85} {"train_loss": -4.1891913414001465, "global_step": 3606, "epoch": 85} {"train_loss": -3.987067461013794, "global_step": 3607, "epoch": 85} {"train_loss": -3.9958102703094482, "global_step": 3608, "epoch": 85} {"train_loss": -4.200353145599365, "global_step": 3609, "epoch": 85} {"train_loss": -4.197672367095947, "global_step": 3610, "epoch": 85} {"train_loss": -4.1157251709983464, "global_step": 3611, "epoch": 85, "val_loss": 134315.28125} {"train_loss": -4.113140106201172, "global_step": 3612, "epoch": 86} {"train_loss": -4.002702713012695, "global_step": 3613, "epoch": 86} {"train_loss": -3.918466329574585, "global_step": 3614, "epoch": 86} {"train_loss": -4.040369033813477, "global_step": 3615, "epoch": 86} {"train_loss": -4.122132301330566, "global_step": 3616, "epoch": 86} {"train_loss": -4.10858678817749, "global_step": 3617, "epoch": 86} {"train_loss": -3.991598606109619, "global_step": 3618, "epoch": 86} {"train_loss": -4.110602378845215, "global_step": 3619, "epoch": 86} {"train_loss": -4.160182952880859, "global_step": 3620, "epoch": 86} {"train_loss": -4.075512886047363, "global_step": 3621, "epoch": 86} {"train_loss": -4.106540679931641, "global_step": 3622, "epoch": 86} {"train_loss": -4.112349510192871, "global_step": 3623, "epoch": 86} {"train_loss": -3.9804701805114746, "global_step": 3624, "epoch": 86} {"train_loss": -4.1388773918151855, "global_step": 3625, "epoch": 86} {"train_loss": -4.13505744934082, "global_step": 3626, "epoch": 86} {"train_loss": -4.339931011199951, "global_step": 3627, "epoch": 86} {"train_loss": -4.0098724365234375, "global_step": 3628, "epoch": 86} {"train_loss": -4.157097816467285, "global_step": 3629, "epoch": 86} {"train_loss": -4.21433162689209, "global_step": 3630, "epoch": 86} {"train_loss": -4.20842170715332, "global_step": 3631, "epoch": 86} {"train_loss": -4.138664245605469, "global_step": 3632, "epoch": 86} {"train_loss": -4.28233003616333, "global_step": 3633, "epoch": 86} {"train_loss": -3.9839677810668945, "global_step": 3634, "epoch": 86} {"train_loss": -3.955171585083008, "global_step": 3635, "epoch": 86} {"train_loss": -4.045052528381348, "global_step": 3636, "epoch": 86} {"train_loss": -3.917224884033203, "global_step": 3637, "epoch": 86} {"train_loss": -3.9748809337615967, "global_step": 3638, "epoch": 86} {"train_loss": -4.037992477416992, "global_step": 3639, "epoch": 86} {"train_loss": -3.907517433166504, "global_step": 3640, "epoch": 86} {"train_loss": -4.128808975219727, "global_step": 3641, "epoch": 86} {"train_loss": -4.066502571105957, "global_step": 3642, "epoch": 86} {"train_loss": -4.159564971923828, "global_step": 3643, "epoch": 86} {"train_loss": -4.007218360900879, "global_step": 3644, "epoch": 86} {"train_loss": -4.1011061668396, "global_step": 3645, "epoch": 86} {"train_loss": -3.9989311695098877, "global_step": 3646, "epoch": 86} {"train_loss": -3.835822105407715, "global_step": 3647, "epoch": 86} {"train_loss": -4.05914306640625, "global_step": 3648, "epoch": 86} {"train_loss": -3.9572157859802246, "global_step": 3649, "epoch": 86} {"train_loss": -4.1771063804626465, "global_step": 3650, "epoch": 86} {"train_loss": -4.21213960647583, "global_step": 3651, "epoch": 86} {"train_loss": -4.154272079467773, "global_step": 3652, "epoch": 86} {"train_loss": -4.078871516954331, "global_step": 3653, "epoch": 86, "val_loss": 134588.796875} {"train_loss": -4.0304975509643555, "global_step": 3654, "epoch": 87} {"train_loss": -4.148573875427246, "global_step": 3655, "epoch": 87} {"train_loss": -4.015907287597656, "global_step": 3656, "epoch": 87} {"train_loss": -3.98470401763916, "global_step": 3657, "epoch": 87} {"train_loss": -4.0854811668396, "global_step": 3658, "epoch": 87} {"train_loss": -4.076774597167969, "global_step": 3659, "epoch": 87} {"train_loss": -4.209404945373535, "global_step": 3660, "epoch": 87} {"train_loss": -4.125401496887207, "global_step": 3661, "epoch": 87} {"train_loss": -4.162526607513428, "global_step": 3662, "epoch": 87} {"train_loss": -4.130400657653809, "global_step": 3663, "epoch": 87} {"train_loss": -4.171680450439453, "global_step": 3664, "epoch": 87} {"train_loss": -4.248856544494629, "global_step": 3665, "epoch": 87} {"train_loss": -4.270938873291016, "global_step": 3666, "epoch": 87} {"train_loss": -4.165943145751953, "global_step": 3667, "epoch": 87} {"train_loss": -4.222261428833008, "global_step": 3668, "epoch": 87} {"train_loss": -4.2372589111328125, "global_step": 3669, "epoch": 87} {"train_loss": -4.108763217926025, "global_step": 3670, "epoch": 87} {"train_loss": -4.1901750564575195, "global_step": 3671, "epoch": 87} {"train_loss": -4.140787601470947, "global_step": 3672, "epoch": 87} {"train_loss": -3.9840636253356934, "global_step": 3673, "epoch": 87} {"train_loss": -4.2267303466796875, "global_step": 3674, "epoch": 87} {"train_loss": -4.088798522949219, "global_step": 3675, "epoch": 87} {"train_loss": -4.194990158081055, "global_step": 3676, "epoch": 87} {"train_loss": -4.252561092376709, "global_step": 3677, "epoch": 87} {"train_loss": -4.144855499267578, "global_step": 3678, "epoch": 87} {"train_loss": -4.263649940490723, "global_step": 3679, "epoch": 87} {"train_loss": -4.21854305267334, "global_step": 3680, "epoch": 87} {"train_loss": -4.210452079772949, "global_step": 3681, "epoch": 87} {"train_loss": -4.0706987380981445, "global_step": 3682, "epoch": 87} {"train_loss": -4.164285659790039, "global_step": 3683, "epoch": 87} {"train_loss": -4.2428107261657715, "global_step": 3684, "epoch": 87} {"train_loss": -4.143083572387695, "global_step": 3685, "epoch": 87} {"train_loss": -4.195558071136475, "global_step": 3686, "epoch": 87} {"train_loss": -4.123958587646484, "global_step": 3687, "epoch": 87} {"train_loss": -3.98492693901062, "global_step": 3688, "epoch": 87} {"train_loss": -4.160614967346191, "global_step": 3689, "epoch": 87} {"train_loss": -4.186592102050781, "global_step": 3690, "epoch": 87} {"train_loss": -4.190225124359131, "global_step": 3691, "epoch": 87} {"train_loss": -4.275279998779297, "global_step": 3692, "epoch": 87} {"train_loss": -4.025839805603027, "global_step": 3693, "epoch": 87} {"train_loss": -4.034451484680176, "global_step": 3694, "epoch": 87} {"train_loss": -4.151969597453163, "global_step": 3695, "epoch": 87, "val_loss": 131012.5859375} {"train_loss": -4.228623867034912, "global_step": 3696, "epoch": 88} {"train_loss": -4.023117542266846, "global_step": 3697, "epoch": 88} {"train_loss": -4.18776798248291, "global_step": 3698, "epoch": 88} {"train_loss": -4.245423793792725, "global_step": 3699, "epoch": 88} {"train_loss": -4.0498151779174805, "global_step": 3700, "epoch": 88} {"train_loss": -4.120987892150879, "global_step": 3701, "epoch": 88} {"train_loss": -4.0155839920043945, "global_step": 3702, "epoch": 88} {"train_loss": -4.108151435852051, "global_step": 3703, "epoch": 88} {"train_loss": -4.015822410583496, "global_step": 3704, "epoch": 88} {"train_loss": -4.17398738861084, "global_step": 3705, "epoch": 88} {"train_loss": -3.893742561340332, "global_step": 3706, "epoch": 88} {"train_loss": -4.09110164642334, "global_step": 3707, "epoch": 88} {"train_loss": -4.160205841064453, "global_step": 3708, "epoch": 88} {"train_loss": -3.790349006652832, "global_step": 3709, "epoch": 88} {"train_loss": -4.213335037231445, "global_step": 3710, "epoch": 88} {"train_loss": -3.8799166679382324, "global_step": 3711, "epoch": 88} {"train_loss": -3.910037040710449, "global_step": 3712, "epoch": 88} {"train_loss": -3.991025686264038, "global_step": 3713, "epoch": 88} {"train_loss": -4.144832611083984, "global_step": 3714, "epoch": 88} {"train_loss": -4.050413608551025, "global_step": 3715, "epoch": 88} {"train_loss": -3.823951005935669, "global_step": 3716, "epoch": 88} {"train_loss": -4.011609077453613, "global_step": 3717, "epoch": 88} {"train_loss": -3.9909424781799316, "global_step": 3718, "epoch": 88} {"train_loss": -3.9187676906585693, "global_step": 3719, "epoch": 88} {"train_loss": -4.109785079956055, "global_step": 3720, "epoch": 88} {"train_loss": -3.9014596939086914, "global_step": 3721, "epoch": 88} {"train_loss": -3.9399452209472656, "global_step": 3722, "epoch": 88} {"train_loss": -4.020339012145996, "global_step": 3723, "epoch": 88} {"train_loss": -4.132238864898682, "global_step": 3724, "epoch": 88} {"train_loss": -4.022992134094238, "global_step": 3725, "epoch": 88} {"train_loss": -3.993445634841919, "global_step": 3726, "epoch": 88} {"train_loss": -4.033862113952637, "global_step": 3727, "epoch": 88} {"train_loss": -4.130865097045898, "global_step": 3728, "epoch": 88} {"train_loss": -4.0876851081848145, "global_step": 3729, "epoch": 88} {"train_loss": -4.170098304748535, "global_step": 3730, "epoch": 88} {"train_loss": -4.286136627197266, "global_step": 3731, "epoch": 88} {"train_loss": -4.152281761169434, "global_step": 3732, "epoch": 88} {"train_loss": -4.084259986877441, "global_step": 3733, "epoch": 88} {"train_loss": -4.205783367156982, "global_step": 3734, "epoch": 88} {"train_loss": -4.112741470336914, "global_step": 3735, "epoch": 88} {"train_loss": -4.169217109680176, "global_step": 3736, "epoch": 88} {"train_loss": -4.066278400875273, "global_step": 3737, "epoch": 88, "val_loss": 128074.484375} {"train_loss": -4.321070671081543, "global_step": 3738, "epoch": 89} {"train_loss": -4.314050674438477, "global_step": 3739, "epoch": 89} {"train_loss": -4.291769981384277, "global_step": 3740, "epoch": 89} {"train_loss": -4.134585380554199, "global_step": 3741, "epoch": 89} {"train_loss": -4.216440200805664, "global_step": 3742, "epoch": 89} {"train_loss": -4.157288551330566, "global_step": 3743, "epoch": 89} {"train_loss": -4.108904838562012, "global_step": 3744, "epoch": 89} {"train_loss": -4.058405876159668, "global_step": 3745, "epoch": 89} {"train_loss": -4.225080490112305, "global_step": 3746, "epoch": 89} {"train_loss": -4.017697811126709, "global_step": 3747, "epoch": 89} {"train_loss": -4.147089958190918, "global_step": 3748, "epoch": 89} {"train_loss": -4.192609786987305, "global_step": 3749, "epoch": 89} {"train_loss": -4.020113945007324, "global_step": 3750, "epoch": 89} {"train_loss": -3.976365566253662, "global_step": 3751, "epoch": 89} {"train_loss": -4.262446880340576, "global_step": 3752, "epoch": 89} {"train_loss": -4.159673690795898, "global_step": 3753, "epoch": 89} {"train_loss": -3.972506046295166, "global_step": 3754, "epoch": 89} {"train_loss": -4.054112911224365, "global_step": 3755, "epoch": 89} {"train_loss": -4.051078796386719, "global_step": 3756, "epoch": 89} {"train_loss": -4.150845050811768, "global_step": 3757, "epoch": 89} {"train_loss": -4.175825119018555, "global_step": 3758, "epoch": 89} {"train_loss": -4.21270751953125, "global_step": 3759, "epoch": 89} {"train_loss": -4.078347682952881, "global_step": 3760, "epoch": 89} {"train_loss": -4.252413749694824, "global_step": 3761, "epoch": 89} {"train_loss": -4.026093006134033, "global_step": 3762, "epoch": 89} {"train_loss": -4.246060371398926, "global_step": 3763, "epoch": 89} {"train_loss": -4.206286430358887, "global_step": 3764, "epoch": 89} {"train_loss": -4.155723571777344, "global_step": 3765, "epoch": 89} {"train_loss": -4.1994547843933105, "global_step": 3766, "epoch": 89} {"train_loss": -4.121013641357422, "global_step": 3767, "epoch": 89} {"train_loss": -4.158448219299316, "global_step": 3768, "epoch": 89} {"train_loss": -4.403385162353516, "global_step": 3769, "epoch": 89} {"train_loss": -4.264936447143555, "global_step": 3770, "epoch": 89} {"train_loss": -4.240138053894043, "global_step": 3771, "epoch": 89} {"train_loss": -4.178124904632568, "global_step": 3772, "epoch": 89} {"train_loss": -4.320652008056641, "global_step": 3773, "epoch": 89} {"train_loss": -4.231298446655273, "global_step": 3774, "epoch": 89} {"train_loss": -4.159909248352051, "global_step": 3775, "epoch": 89} {"train_loss": -4.284832000732422, "global_step": 3776, "epoch": 89} {"train_loss": -4.110688209533691, "global_step": 3777, "epoch": 89} {"train_loss": -4.085343837738037, "global_step": 3778, "epoch": 89} {"train_loss": -4.169173388254075, "global_step": 3779, "epoch": 89, "val_loss": 127520.9375} {"train_loss": -4.184289932250977, "global_step": 3780, "epoch": 90} {"train_loss": -4.105766296386719, "global_step": 3781, "epoch": 90} {"train_loss": -4.273341178894043, "global_step": 3782, "epoch": 90} {"train_loss": -4.350881099700928, "global_step": 3783, "epoch": 90} {"train_loss": -4.227780818939209, "global_step": 3784, "epoch": 90} {"train_loss": -4.042617321014404, "global_step": 3785, "epoch": 90} {"train_loss": -4.118473052978516, "global_step": 3786, "epoch": 90} {"train_loss": -3.9691989421844482, "global_step": 3787, "epoch": 90} {"train_loss": -4.22524881362915, "global_step": 3788, "epoch": 90} {"train_loss": -4.3132853507995605, "global_step": 3789, "epoch": 90} {"train_loss": -4.116313457489014, "global_step": 3790, "epoch": 90} {"train_loss": -4.1371893882751465, "global_step": 3791, "epoch": 90} {"train_loss": -4.2317938804626465, "global_step": 3792, "epoch": 90} {"train_loss": -4.258901596069336, "global_step": 3793, "epoch": 90} {"train_loss": -4.147401809692383, "global_step": 3794, "epoch": 90} {"train_loss": -4.180586814880371, "global_step": 3795, "epoch": 90} {"train_loss": -4.144598007202148, "global_step": 3796, "epoch": 90} {"train_loss": -4.187930107116699, "global_step": 3797, "epoch": 90} {"train_loss": -4.239217758178711, "global_step": 3798, "epoch": 90} {"train_loss": -4.32613468170166, "global_step": 3799, "epoch": 90} {"train_loss": -4.2451581954956055, "global_step": 3800, "epoch": 90} {"train_loss": -4.260207176208496, "global_step": 3801, "epoch": 90} {"train_loss": -4.057165145874023, "global_step": 3802, "epoch": 90} {"train_loss": -4.117961406707764, "global_step": 3803, "epoch": 90} {"train_loss": -4.089069366455078, "global_step": 3804, "epoch": 90} {"train_loss": -4.04434061050415, "global_step": 3805, "epoch": 90} {"train_loss": -4.243866920471191, "global_step": 3806, "epoch": 90} {"train_loss": -4.172670364379883, "global_step": 3807, "epoch": 90} {"train_loss": -4.198403358459473, "global_step": 3808, "epoch": 90} {"train_loss": -4.138216972351074, "global_step": 3809, "epoch": 90} {"train_loss": -4.238149642944336, "global_step": 3810, "epoch": 90} {"train_loss": -3.9612045288085938, "global_step": 3811, "epoch": 90} {"train_loss": -4.1554388999938965, "global_step": 3812, "epoch": 90} {"train_loss": -4.313912868499756, "global_step": 3813, "epoch": 90} {"train_loss": -4.225424766540527, "global_step": 3814, "epoch": 90} {"train_loss": -4.200347900390625, "global_step": 3815, "epoch": 90} {"train_loss": -4.2150187492370605, "global_step": 3816, "epoch": 90} {"train_loss": -4.199873447418213, "global_step": 3817, "epoch": 90} {"train_loss": -4.168639183044434, "global_step": 3818, "epoch": 90} {"train_loss": -4.215150356292725, "global_step": 3819, "epoch": 90} {"train_loss": -4.138108730316162, "global_step": 3820, "epoch": 90} {"train_loss": -4.1824050687608265, "global_step": 3821, "epoch": 90, "val_loss": 125818.046875} {"train_loss": -4.196976184844971, "global_step": 3822, "epoch": 91} {"train_loss": -4.193768501281738, "global_step": 3823, "epoch": 91} {"train_loss": -4.2718963623046875, "global_step": 3824, "epoch": 91} {"train_loss": -4.156281471252441, "global_step": 3825, "epoch": 91} {"train_loss": -4.172811031341553, "global_step": 3826, "epoch": 91} {"train_loss": -4.355823516845703, "global_step": 3827, "epoch": 91} {"train_loss": -4.266201019287109, "global_step": 3828, "epoch": 91} {"train_loss": -4.196977138519287, "global_step": 3829, "epoch": 91} {"train_loss": -4.225063323974609, "global_step": 3830, "epoch": 91} {"train_loss": -4.272173881530762, "global_step": 3831, "epoch": 91} {"train_loss": -4.20991325378418, "global_step": 3832, "epoch": 91} {"train_loss": -4.404261589050293, "global_step": 3833, "epoch": 91} {"train_loss": -4.142669677734375, "global_step": 3834, "epoch": 91} {"train_loss": -4.351049423217773, "global_step": 3835, "epoch": 91} {"train_loss": -4.2200164794921875, "global_step": 3836, "epoch": 91} {"train_loss": -4.048423767089844, "global_step": 3837, "epoch": 91} {"train_loss": -4.272890567779541, "global_step": 3838, "epoch": 91} {"train_loss": -4.26032018661499, "global_step": 3839, "epoch": 91} {"train_loss": -4.268730163574219, "global_step": 3840, "epoch": 91} {"train_loss": -4.168206214904785, "global_step": 3841, "epoch": 91} {"train_loss": -4.265009880065918, "global_step": 3842, "epoch": 91} {"train_loss": -4.1430344581604, "global_step": 3843, "epoch": 91} {"train_loss": -4.291637420654297, "global_step": 3844, "epoch": 91} {"train_loss": -4.092022895812988, "global_step": 3845, "epoch": 91} {"train_loss": -4.078024387359619, "global_step": 3846, "epoch": 91} {"train_loss": -4.1998701095581055, "global_step": 3847, "epoch": 91} {"train_loss": -4.174269199371338, "global_step": 3848, "epoch": 91} {"train_loss": -4.239679336547852, "global_step": 3849, "epoch": 91} {"train_loss": -4.107466220855713, "global_step": 3850, "epoch": 91} {"train_loss": -4.282257080078125, "global_step": 3851, "epoch": 91} {"train_loss": -4.1204657554626465, "global_step": 3852, "epoch": 91} {"train_loss": -4.010932922363281, "global_step": 3853, "epoch": 91} {"train_loss": -4.243175983428955, "global_step": 3854, "epoch": 91} {"train_loss": -4.1379828453063965, "global_step": 3855, "epoch": 91} {"train_loss": -4.2420806884765625, "global_step": 3856, "epoch": 91} {"train_loss": -4.092065334320068, "global_step": 3857, "epoch": 91} {"train_loss": -4.169131278991699, "global_step": 3858, "epoch": 91} {"train_loss": -4.191446304321289, "global_step": 3859, "epoch": 91} {"train_loss": -4.0848002433776855, "global_step": 3860, "epoch": 91} {"train_loss": -4.254711151123047, "global_step": 3861, "epoch": 91} {"train_loss": -4.303600311279297, "global_step": 3862, "epoch": 91} {"train_loss": -4.20554578871954, "global_step": 3863, "epoch": 91, "val_loss": 123044.03125} {"train_loss": -4.384573936462402, "global_step": 3864, "epoch": 92} {"train_loss": -4.207705497741699, "global_step": 3865, "epoch": 92} {"train_loss": -4.284856796264648, "global_step": 3866, "epoch": 92} {"train_loss": -4.299345970153809, "global_step": 3867, "epoch": 92} {"train_loss": -4.317581653594971, "global_step": 3868, "epoch": 92} {"train_loss": -4.165998935699463, "global_step": 3869, "epoch": 92} {"train_loss": -4.416915416717529, "global_step": 3870, "epoch": 92} {"train_loss": -4.4259352684021, "global_step": 3871, "epoch": 92} {"train_loss": -4.354462146759033, "global_step": 3872, "epoch": 92} {"train_loss": -4.0603346824646, "global_step": 3873, "epoch": 92} {"train_loss": -4.232431888580322, "global_step": 3874, "epoch": 92} {"train_loss": -4.370920181274414, "global_step": 3875, "epoch": 92} {"train_loss": -4.278743743896484, "global_step": 3876, "epoch": 92} {"train_loss": -4.1851701736450195, "global_step": 3877, "epoch": 92} {"train_loss": -4.124756813049316, "global_step": 3878, "epoch": 92} {"train_loss": -4.249674320220947, "global_step": 3879, "epoch": 92} {"train_loss": -4.103940010070801, "global_step": 3880, "epoch": 92} {"train_loss": -4.133718490600586, "global_step": 3881, "epoch": 92} {"train_loss": -4.318815231323242, "global_step": 3882, "epoch": 92} {"train_loss": -4.069053649902344, "global_step": 3883, "epoch": 92} {"train_loss": -3.8999342918395996, "global_step": 3884, "epoch": 92} {"train_loss": -4.290492534637451, "global_step": 3885, "epoch": 92} {"train_loss": -4.2613630294799805, "global_step": 3886, "epoch": 92} {"train_loss": -4.036925315856934, "global_step": 3887, "epoch": 92} {"train_loss": -4.026360511779785, "global_step": 3888, "epoch": 92} {"train_loss": -4.321715354919434, "global_step": 3889, "epoch": 92} {"train_loss": -4.257421970367432, "global_step": 3890, "epoch": 92} {"train_loss": -4.232223987579346, "global_step": 3891, "epoch": 92} {"train_loss": -4.150583267211914, "global_step": 3892, "epoch": 92} {"train_loss": -4.279949188232422, "global_step": 3893, "epoch": 92} {"train_loss": -4.162012577056885, "global_step": 3894, "epoch": 92} {"train_loss": -4.277773857116699, "global_step": 3895, "epoch": 92} {"train_loss": -4.185683250427246, "global_step": 3896, "epoch": 92} {"train_loss": -4.112602710723877, "global_step": 3897, "epoch": 92} {"train_loss": -4.2702741622924805, "global_step": 3898, "epoch": 92} {"train_loss": -4.148024559020996, "global_step": 3899, "epoch": 92} {"train_loss": -4.033154487609863, "global_step": 3900, "epoch": 92} {"train_loss": -4.293353080749512, "global_step": 3901, "epoch": 92} {"train_loss": -4.313733100891113, "global_step": 3902, "epoch": 92} {"train_loss": -4.1534013748168945, "global_step": 3903, "epoch": 92} {"train_loss": -4.36896276473999, "global_step": 3904, "epoch": 92} {"train_loss": -4.222926548549107, "global_step": 3905, "epoch": 92, "val_loss": 122242.40625} {"train_loss": -4.073643684387207, "global_step": 3906, "epoch": 93} {"train_loss": -4.2317047119140625, "global_step": 3907, "epoch": 93} {"train_loss": -4.217628479003906, "global_step": 3908, "epoch": 93} {"train_loss": -4.292011260986328, "global_step": 3909, "epoch": 93} {"train_loss": -4.156890869140625, "global_step": 3910, "epoch": 93} {"train_loss": -4.253725051879883, "global_step": 3911, "epoch": 93} {"train_loss": -4.36556339263916, "global_step": 3912, "epoch": 93} {"train_loss": -4.236685276031494, "global_step": 3913, "epoch": 93} {"train_loss": -4.307065486907959, "global_step": 3914, "epoch": 93} {"train_loss": -4.288568496704102, "global_step": 3915, "epoch": 93} {"train_loss": -4.281476020812988, "global_step": 3916, "epoch": 93} {"train_loss": -4.320758819580078, "global_step": 3917, "epoch": 93} {"train_loss": -4.265267372131348, "global_step": 3918, "epoch": 93} {"train_loss": -4.281187057495117, "global_step": 3919, "epoch": 93} {"train_loss": -4.151628494262695, "global_step": 3920, "epoch": 93} {"train_loss": -4.171119689941406, "global_step": 3921, "epoch": 93} {"train_loss": -4.342541217803955, "global_step": 3922, "epoch": 93} {"train_loss": -4.129692077636719, "global_step": 3923, "epoch": 93} {"train_loss": -4.180882453918457, "global_step": 3924, "epoch": 93} {"train_loss": -4.041976451873779, "global_step": 3925, "epoch": 93} {"train_loss": -4.045292854309082, "global_step": 3926, "epoch": 93} {"train_loss": -4.305587291717529, "global_step": 3927, "epoch": 93} {"train_loss": -4.339191436767578, "global_step": 3928, "epoch": 93} {"train_loss": -4.039663314819336, "global_step": 3929, "epoch": 93} {"train_loss": -4.238218307495117, "global_step": 3930, "epoch": 93} {"train_loss": -4.220746040344238, "global_step": 3931, "epoch": 93} {"train_loss": -4.349259376525879, "global_step": 3932, "epoch": 93} {"train_loss": -4.341299057006836, "global_step": 3933, "epoch": 93} {"train_loss": -4.312735557556152, "global_step": 3934, "epoch": 93} {"train_loss": -4.262152671813965, "global_step": 3935, "epoch": 93} {"train_loss": -4.340395927429199, "global_step": 3936, "epoch": 93} {"train_loss": -4.386977195739746, "global_step": 3937, "epoch": 93} {"train_loss": -4.308932781219482, "global_step": 3938, "epoch": 93} {"train_loss": -4.240036964416504, "global_step": 3939, "epoch": 93} {"train_loss": -4.201416015625, "global_step": 3940, "epoch": 93} {"train_loss": -4.298459053039551, "global_step": 3941, "epoch": 93} {"train_loss": -4.1576948165893555, "global_step": 3942, "epoch": 93} {"train_loss": -4.401125907897949, "global_step": 3943, "epoch": 93} {"train_loss": -4.2999467849731445, "global_step": 3944, "epoch": 93} {"train_loss": -4.243281841278076, "global_step": 3945, "epoch": 93} {"train_loss": -4.318451404571533, "global_step": 3946, "epoch": 93} {"train_loss": -4.25088407879784, "global_step": 3947, "epoch": 93, "val_loss": 120116.1796875} {"train_loss": -4.147240161895752, "global_step": 3948, "epoch": 94} {"train_loss": -4.277776718139648, "global_step": 3949, "epoch": 94} {"train_loss": -4.335940361022949, "global_step": 3950, "epoch": 94} {"train_loss": -4.295714378356934, "global_step": 3951, "epoch": 94} {"train_loss": -4.287336349487305, "global_step": 3952, "epoch": 94} {"train_loss": -4.175309181213379, "global_step": 3953, "epoch": 94} {"train_loss": -4.384227752685547, "global_step": 3954, "epoch": 94} {"train_loss": -4.330651760101318, "global_step": 3955, "epoch": 94} {"train_loss": -4.317572593688965, "global_step": 3956, "epoch": 94} {"train_loss": -4.398951053619385, "global_step": 3957, "epoch": 94} {"train_loss": -4.452712059020996, "global_step": 3958, "epoch": 94} {"train_loss": -4.259552955627441, "global_step": 3959, "epoch": 94} {"train_loss": -4.350911617279053, "global_step": 3960, "epoch": 94} {"train_loss": -4.433927536010742, "global_step": 3961, "epoch": 94} {"train_loss": -4.14454460144043, "global_step": 3962, "epoch": 94} {"train_loss": -4.1604905128479, "global_step": 3963, "epoch": 94} {"train_loss": -4.235564231872559, "global_step": 3964, "epoch": 94} {"train_loss": -4.082674026489258, "global_step": 3965, "epoch": 94} {"train_loss": -4.409700393676758, "global_step": 3966, "epoch": 94} {"train_loss": -4.221386432647705, "global_step": 3967, "epoch": 94} {"train_loss": -4.124683856964111, "global_step": 3968, "epoch": 94} {"train_loss": -4.295235633850098, "global_step": 3969, "epoch": 94} {"train_loss": -4.318792343139648, "global_step": 3970, "epoch": 94} {"train_loss": -4.065147876739502, "global_step": 3971, "epoch": 94} {"train_loss": -4.1472063064575195, "global_step": 3972, "epoch": 94} {"train_loss": -4.282538890838623, "global_step": 3973, "epoch": 94} {"train_loss": -4.195523262023926, "global_step": 3974, "epoch": 94} {"train_loss": -4.403044700622559, "global_step": 3975, "epoch": 94} {"train_loss": -4.3125104904174805, "global_step": 3976, "epoch": 94} {"train_loss": -4.28095817565918, "global_step": 3977, "epoch": 94} {"train_loss": -4.209425926208496, "global_step": 3978, "epoch": 94} {"train_loss": -4.212735652923584, "global_step": 3979, "epoch": 94} {"train_loss": -4.066710948944092, "global_step": 3980, "epoch": 94} {"train_loss": -4.177491664886475, "global_step": 3981, "epoch": 94} {"train_loss": -4.2072858810424805, "global_step": 3982, "epoch": 94} {"train_loss": -4.1749467849731445, "global_step": 3983, "epoch": 94} {"train_loss": -4.163854598999023, "global_step": 3984, "epoch": 94} {"train_loss": -4.273677349090576, "global_step": 3985, "epoch": 94} {"train_loss": -4.236215114593506, "global_step": 3986, "epoch": 94} {"train_loss": -4.121648788452148, "global_step": 3987, "epoch": 94} {"train_loss": -4.321048736572266, "global_step": 3988, "epoch": 94} {"train_loss": -4.2509850433894565, "global_step": 3989, "epoch": 94, "val_loss": 117963.1796875} {"train_loss": -4.33573055267334, "global_step": 3990, "epoch": 95} {"train_loss": -4.304322719573975, "global_step": 3991, "epoch": 95} {"train_loss": -4.47532844543457, "global_step": 3992, "epoch": 95} {"train_loss": -4.241968631744385, "global_step": 3993, "epoch": 95} {"train_loss": -4.1893439292907715, "global_step": 3994, "epoch": 95} {"train_loss": -4.406378746032715, "global_step": 3995, "epoch": 95} {"train_loss": -4.291284561157227, "global_step": 3996, "epoch": 95} {"train_loss": -4.257447719573975, "global_step": 3997, "epoch": 95} {"train_loss": -4.221013069152832, "global_step": 3998, "epoch": 95} {"train_loss": -4.367663383483887, "global_step": 3999, "epoch": 95} {"train_loss": -4.375005722045898, "global_step": 4000, "epoch": 95} {"train_loss": -4.191229343414307, "global_step": 4001, "epoch": 95} {"train_loss": -4.340143203735352, "global_step": 4002, "epoch": 95} {"train_loss": -4.38880729675293, "global_step": 4003, "epoch": 95} {"train_loss": -4.157992362976074, "global_step": 4004, "epoch": 95} {"train_loss": -4.090550422668457, "global_step": 4005, "epoch": 95} {"train_loss": -4.305907249450684, "global_step": 4006, "epoch": 95} {"train_loss": -4.322625637054443, "global_step": 4007, "epoch": 95} {"train_loss": -4.053752899169922, "global_step": 4008, "epoch": 95} {"train_loss": -4.1815948486328125, "global_step": 4009, "epoch": 95} {"train_loss": -4.3539347648620605, "global_step": 4010, "epoch": 95} {"train_loss": -4.247827529907227, "global_step": 4011, "epoch": 95} {"train_loss": -4.229150772094727, "global_step": 4012, "epoch": 95} {"train_loss": -4.250401020050049, "global_step": 4013, "epoch": 95} {"train_loss": -4.0008721351623535, "global_step": 4014, "epoch": 95} {"train_loss": -4.175220489501953, "global_step": 4015, "epoch": 95} {"train_loss": -3.9482810497283936, "global_step": 4016, "epoch": 95} {"train_loss": -4.215845108032227, "global_step": 4017, "epoch": 95} {"train_loss": -4.143522262573242, "global_step": 4018, "epoch": 95} {"train_loss": -3.9530975818634033, "global_step": 4019, "epoch": 95} {"train_loss": -4.2871294021606445, "global_step": 4020, "epoch": 95} {"train_loss": -4.0698957443237305, "global_step": 4021, "epoch": 95} {"train_loss": -4.2475762367248535, "global_step": 4022, "epoch": 95} {"train_loss": -4.11457633972168, "global_step": 4023, "epoch": 95} {"train_loss": -4.180270195007324, "global_step": 4024, "epoch": 95} {"train_loss": -4.209861755371094, "global_step": 4025, "epoch": 95} {"train_loss": -4.341881275177002, "global_step": 4026, "epoch": 95} {"train_loss": -4.048837184906006, "global_step": 4027, "epoch": 95} {"train_loss": -4.171478271484375, "global_step": 4028, "epoch": 95} {"train_loss": -4.128547668457031, "global_step": 4029, "epoch": 95} {"train_loss": -4.238085746765137, "global_step": 4030, "epoch": 95} {"train_loss": -4.222051654543195, "global_step": 4031, "epoch": 95, "val_loss": 118544.21875} {"train_loss": -4.247763633728027, "global_step": 4032, "epoch": 96} {"train_loss": -4.250659465789795, "global_step": 4033, "epoch": 96} {"train_loss": -4.14674186706543, "global_step": 4034, "epoch": 96} {"train_loss": -4.255883693695068, "global_step": 4035, "epoch": 96} {"train_loss": -4.219622611999512, "global_step": 4036, "epoch": 96} {"train_loss": -4.367826461791992, "global_step": 4037, "epoch": 96} {"train_loss": -4.181748390197754, "global_step": 4038, "epoch": 96} {"train_loss": -4.211395263671875, "global_step": 4039, "epoch": 96} {"train_loss": -4.204726696014404, "global_step": 4040, "epoch": 96} {"train_loss": -4.227119445800781, "global_step": 4041, "epoch": 96} {"train_loss": -4.314413547515869, "global_step": 4042, "epoch": 96} {"train_loss": -4.294227123260498, "global_step": 4043, "epoch": 96} {"train_loss": -4.4676737785339355, "global_step": 4044, "epoch": 96} {"train_loss": -4.111234664916992, "global_step": 4045, "epoch": 96} {"train_loss": -4.382843971252441, "global_step": 4046, "epoch": 96} {"train_loss": -4.1780524253845215, "global_step": 4047, "epoch": 96} {"train_loss": -4.297052383422852, "global_step": 4048, "epoch": 96} {"train_loss": -4.241767406463623, "global_step": 4049, "epoch": 96} {"train_loss": -4.254138946533203, "global_step": 4050, "epoch": 96} {"train_loss": -4.303668975830078, "global_step": 4051, "epoch": 96} {"train_loss": -4.205896377563477, "global_step": 4052, "epoch": 96} {"train_loss": -4.213224411010742, "global_step": 4053, "epoch": 96} {"train_loss": -4.19075870513916, "global_step": 4054, "epoch": 96} {"train_loss": -4.27706241607666, "global_step": 4055, "epoch": 96} {"train_loss": -4.164063453674316, "global_step": 4056, "epoch": 96} {"train_loss": -4.311635971069336, "global_step": 4057, "epoch": 96} {"train_loss": -4.411149978637695, "global_step": 4058, "epoch": 96} {"train_loss": -4.258646011352539, "global_step": 4059, "epoch": 96} {"train_loss": -4.438816070556641, "global_step": 4060, "epoch": 96} {"train_loss": -4.266271591186523, "global_step": 4061, "epoch": 96} {"train_loss": -4.320780277252197, "global_step": 4062, "epoch": 96} {"train_loss": -4.389034271240234, "global_step": 4063, "epoch": 96} {"train_loss": -4.236358165740967, "global_step": 4064, "epoch": 96} {"train_loss": -4.374697685241699, "global_step": 4065, "epoch": 96} {"train_loss": -4.340961456298828, "global_step": 4066, "epoch": 96} {"train_loss": -4.239034175872803, "global_step": 4067, "epoch": 96} {"train_loss": -4.2694315910339355, "global_step": 4068, "epoch": 96} {"train_loss": -4.286874771118164, "global_step": 4069, "epoch": 96} {"train_loss": -4.373813629150391, "global_step": 4070, "epoch": 96} {"train_loss": -4.4230475425720215, "global_step": 4071, "epoch": 96} {"train_loss": -4.46860408782959, "global_step": 4072, "epoch": 96} {"train_loss": -4.287459475653512, "global_step": 4073, "epoch": 96, "val_loss": 114513.859375} {"train_loss": -4.466293811798096, "global_step": 4074, "epoch": 97} {"train_loss": -4.402215003967285, "global_step": 4075, "epoch": 97} {"train_loss": -4.293398857116699, "global_step": 4076, "epoch": 97} {"train_loss": -4.392988204956055, "global_step": 4077, "epoch": 97} {"train_loss": -4.387102127075195, "global_step": 4078, "epoch": 97} {"train_loss": -4.485600471496582, "global_step": 4079, "epoch": 97} {"train_loss": -4.313101768493652, "global_step": 4080, "epoch": 97} {"train_loss": -4.495165824890137, "global_step": 4081, "epoch": 97} {"train_loss": -4.353271484375, "global_step": 4082, "epoch": 97} {"train_loss": -4.424097537994385, "global_step": 4083, "epoch": 97} {"train_loss": -4.359238624572754, "global_step": 4084, "epoch": 97} {"train_loss": -4.237144470214844, "global_step": 4085, "epoch": 97} {"train_loss": -4.2953948974609375, "global_step": 4086, "epoch": 97} {"train_loss": -4.093377590179443, "global_step": 4087, "epoch": 97} {"train_loss": -4.117080211639404, "global_step": 4088, "epoch": 97} {"train_loss": -4.099895477294922, "global_step": 4089, "epoch": 97} {"train_loss": -4.422450065612793, "global_step": 4090, "epoch": 97} {"train_loss": -4.151117324829102, "global_step": 4091, "epoch": 97} {"train_loss": -3.9428954124450684, "global_step": 4092, "epoch": 97} {"train_loss": -4.107902526855469, "global_step": 4093, "epoch": 97} {"train_loss": -3.694859027862549, "global_step": 4094, "epoch": 97} {"train_loss": -4.094162940979004, "global_step": 4095, "epoch": 97} {"train_loss": -4.221042156219482, "global_step": 4096, "epoch": 97} {"train_loss": -4.364900588989258, "global_step": 4097, "epoch": 97} {"train_loss": -4.20633602142334, "global_step": 4098, "epoch": 97} {"train_loss": -4.271533966064453, "global_step": 4099, "epoch": 97} {"train_loss": -4.283337593078613, "global_step": 4100, "epoch": 97} {"train_loss": -4.144036769866943, "global_step": 4101, "epoch": 97} {"train_loss": -4.213393688201904, "global_step": 4102, "epoch": 97} {"train_loss": -4.084561347961426, "global_step": 4103, "epoch": 97} {"train_loss": -4.290496826171875, "global_step": 4104, "epoch": 97} {"train_loss": -4.299322128295898, "global_step": 4105, "epoch": 97} {"train_loss": -4.227807998657227, "global_step": 4106, "epoch": 97} {"train_loss": -4.346203804016113, "global_step": 4107, "epoch": 97} {"train_loss": -4.310561656951904, "global_step": 4108, "epoch": 97} {"train_loss": -4.269272804260254, "global_step": 4109, "epoch": 97} {"train_loss": -4.378874778747559, "global_step": 4110, "epoch": 97} {"train_loss": -4.266918182373047, "global_step": 4111, "epoch": 97} {"train_loss": -4.1950154304504395, "global_step": 4112, "epoch": 97} {"train_loss": -4.424831390380859, "global_step": 4113, "epoch": 97} {"train_loss": -4.315894603729248, "global_step": 4114, "epoch": 97} {"train_loss": -4.261176847276234, "global_step": 4115, "epoch": 97, "val_loss": 114193.671875} {"train_loss": -4.387615203857422, "global_step": 4116, "epoch": 98} {"train_loss": -4.3127031326293945, "global_step": 4117, "epoch": 98} {"train_loss": -4.338340759277344, "global_step": 4118, "epoch": 98} {"train_loss": -4.239347457885742, "global_step": 4119, "epoch": 98} {"train_loss": -4.444817543029785, "global_step": 4120, "epoch": 98} {"train_loss": -4.40138053894043, "global_step": 4121, "epoch": 98} {"train_loss": -4.294441223144531, "global_step": 4122, "epoch": 98} {"train_loss": -4.223076343536377, "global_step": 4123, "epoch": 98} {"train_loss": -4.299312591552734, "global_step": 4124, "epoch": 98} {"train_loss": -4.400691032409668, "global_step": 4125, "epoch": 98} {"train_loss": -4.202513694763184, "global_step": 4126, "epoch": 98} {"train_loss": -4.2461395263671875, "global_step": 4127, "epoch": 98} {"train_loss": -4.427544593811035, "global_step": 4128, "epoch": 98} {"train_loss": -4.475122451782227, "global_step": 4129, "epoch": 98} {"train_loss": -4.368854522705078, "global_step": 4130, "epoch": 98} {"train_loss": -4.3653669357299805, "global_step": 4131, "epoch": 98} {"train_loss": -4.404059410095215, "global_step": 4132, "epoch": 98} {"train_loss": -4.373176574707031, "global_step": 4133, "epoch": 98} {"train_loss": -4.393580436706543, "global_step": 4134, "epoch": 98} {"train_loss": -3.9707109928131104, "global_step": 4135, "epoch": 98} {"train_loss": -4.210206985473633, "global_step": 4136, "epoch": 98} {"train_loss": -4.238256931304932, "global_step": 4137, "epoch": 98} {"train_loss": -4.380109786987305, "global_step": 4138, "epoch": 98} {"train_loss": -4.275809288024902, "global_step": 4139, "epoch": 98} {"train_loss": -4.151738166809082, "global_step": 4140, "epoch": 98} {"train_loss": -4.2827863693237305, "global_step": 4141, "epoch": 98} {"train_loss": -4.357813835144043, "global_step": 4142, "epoch": 98} {"train_loss": -4.373620986938477, "global_step": 4143, "epoch": 98} {"train_loss": -4.216701030731201, "global_step": 4144, "epoch": 98} {"train_loss": -4.184658050537109, "global_step": 4145, "epoch": 98} {"train_loss": -4.240367889404297, "global_step": 4146, "epoch": 98} {"train_loss": -4.260961055755615, "global_step": 4147, "epoch": 98} {"train_loss": -4.132553577423096, "global_step": 4148, "epoch": 98} {"train_loss": -4.3661651611328125, "global_step": 4149, "epoch": 98} {"train_loss": -4.159641265869141, "global_step": 4150, "epoch": 98} {"train_loss": -4.220695495605469, "global_step": 4151, "epoch": 98} {"train_loss": -4.383162021636963, "global_step": 4152, "epoch": 98} {"train_loss": -4.160454273223877, "global_step": 4153, "epoch": 98} {"train_loss": -4.243842124938965, "global_step": 4154, "epoch": 98} {"train_loss": -4.378652572631836, "global_step": 4155, "epoch": 98} {"train_loss": -4.2744340896606445, "global_step": 4156, "epoch": 98} {"train_loss": -4.296801300275893, "global_step": 4157, "epoch": 98, "val_loss": 113187.0859375} {"train_loss": -4.332178592681885, "global_step": 4158, "epoch": 99} {"train_loss": -4.242803573608398, "global_step": 4159, "epoch": 99} {"train_loss": -4.166049003601074, "global_step": 4160, "epoch": 99} {"train_loss": -4.317179203033447, "global_step": 4161, "epoch": 99} {"train_loss": -4.472346782684326, "global_step": 4162, "epoch": 99} {"train_loss": -4.3998823165893555, "global_step": 4163, "epoch": 99} {"train_loss": -4.3142924308776855, "global_step": 4164, "epoch": 99} {"train_loss": -4.325029373168945, "global_step": 4165, "epoch": 99} {"train_loss": -4.303600311279297, "global_step": 4166, "epoch": 99} {"train_loss": -4.221958160400391, "global_step": 4167, "epoch": 99} {"train_loss": -4.507458209991455, "global_step": 4168, "epoch": 99} {"train_loss": -4.263749599456787, "global_step": 4169, "epoch": 99} {"train_loss": -4.362865447998047, "global_step": 4170, "epoch": 99} {"train_loss": -4.356876373291016, "global_step": 4171, "epoch": 99} {"train_loss": -4.141979694366455, "global_step": 4172, "epoch": 99} {"train_loss": -4.335803031921387, "global_step": 4173, "epoch": 99} {"train_loss": -4.361721992492676, "global_step": 4174, "epoch": 99} {"train_loss": -4.078439712524414, "global_step": 4175, "epoch": 99} {"train_loss": -4.322586536407471, "global_step": 4176, "epoch": 99} {"train_loss": -4.116490364074707, "global_step": 4177, "epoch": 99} {"train_loss": -4.202427864074707, "global_step": 4178, "epoch": 99} {"train_loss": -4.283735275268555, "global_step": 4179, "epoch": 99} {"train_loss": -4.137050628662109, "global_step": 4180, "epoch": 99} {"train_loss": -4.418952941894531, "global_step": 4181, "epoch": 99} {"train_loss": -4.318734169006348, "global_step": 4182, "epoch": 99} {"train_loss": -4.200114727020264, "global_step": 4183, "epoch": 99} {"train_loss": -4.182376861572266, "global_step": 4184, "epoch": 99} {"train_loss": -4.266633987426758, "global_step": 4185, "epoch": 99} {"train_loss": -4.224920749664307, "global_step": 4186, "epoch": 99} {"train_loss": -4.267208099365234, "global_step": 4187, "epoch": 99} {"train_loss": -4.34591007232666, "global_step": 4188, "epoch": 99} {"train_loss": -4.099595546722412, "global_step": 4189, "epoch": 99} {"train_loss": -4.166568279266357, "global_step": 4190, "epoch": 99} {"train_loss": -4.31767463684082, "global_step": 4191, "epoch": 99} {"train_loss": -4.153242111206055, "global_step": 4192, "epoch": 99} {"train_loss": -4.218204021453857, "global_step": 4193, "epoch": 99} {"train_loss": -4.326290130615234, "global_step": 4194, "epoch": 99} {"train_loss": -4.153170585632324, "global_step": 4195, "epoch": 99} {"train_loss": -4.1451826095581055, "global_step": 4196, "epoch": 99} {"train_loss": -4.2368316650390625, "global_step": 4197, "epoch": 99} {"train_loss": -4.423398017883301, "global_step": 4198, "epoch": 99} {"train_loss": -4.267536958058675, "global_step": 4199, "epoch": 99, "val_loss": 110773.875} {"train_loss": -4.414962291717529, "global_step": 4200, "epoch": 100} {"train_loss": -4.266417980194092, "global_step": 4201, "epoch": 100} {"train_loss": -4.342520713806152, "global_step": 4202, "epoch": 100} {"train_loss": -4.365178108215332, "global_step": 4203, "epoch": 100} {"train_loss": -4.377875328063965, "global_step": 4204, "epoch": 100} {"train_loss": -4.327979564666748, "global_step": 4205, "epoch": 100} {"train_loss": -4.277118682861328, "global_step": 4206, "epoch": 100} {"train_loss": -4.464987754821777, "global_step": 4207, "epoch": 100} {"train_loss": -4.3359785079956055, "global_step": 4208, "epoch": 100} {"train_loss": -4.42625617980957, "global_step": 4209, "epoch": 100} {"train_loss": -4.33038854598999, "global_step": 4210, "epoch": 100} {"train_loss": -4.217290878295898, "global_step": 4211, "epoch": 100} {"train_loss": -4.460305213928223, "global_step": 4212, "epoch": 100} {"train_loss": -4.354920387268066, "global_step": 4213, "epoch": 100} {"train_loss": -4.357452392578125, "global_step": 4214, "epoch": 100} {"train_loss": -4.345464706420898, "global_step": 4215, "epoch": 100} {"train_loss": -4.297527313232422, "global_step": 4216, "epoch": 100} {"train_loss": -4.316716194152832, "global_step": 4217, "epoch": 100} {"train_loss": -4.3000946044921875, "global_step": 4218, "epoch": 100} {"train_loss": -4.304777145385742, "global_step": 4219, "epoch": 100} {"train_loss": -4.442777633666992, "global_step": 4220, "epoch": 100} {"train_loss": -4.321110725402832, "global_step": 4221, "epoch": 100} {"train_loss": -4.404496669769287, "global_step": 4222, "epoch": 100} {"train_loss": -4.404919147491455, "global_step": 4223, "epoch": 100} {"train_loss": -4.316874027252197, "global_step": 4224, "epoch": 100} {"train_loss": -4.45053768157959, "global_step": 4225, "epoch": 100} {"train_loss": -4.347598552703857, "global_step": 4226, "epoch": 100} {"train_loss": -4.405960559844971, "global_step": 4227, "epoch": 100} {"train_loss": -4.40246057510376, "global_step": 4228, "epoch": 100} {"train_loss": -4.3568572998046875, "global_step": 4229, "epoch": 100} {"train_loss": -4.271426200866699, "global_step": 4230, "epoch": 100} {"train_loss": -4.271237373352051, "global_step": 4231, "epoch": 100} {"train_loss": -4.34146785736084, "global_step": 4232, "epoch": 100} {"train_loss": -4.4612555503845215, "global_step": 4233, "epoch": 100} {"train_loss": -4.0927557945251465, "global_step": 4234, "epoch": 100} {"train_loss": -4.519995212554932, "global_step": 4235, "epoch": 100} {"train_loss": -4.264257907867432, "global_step": 4236, "epoch": 100} {"train_loss": -4.131773948669434, "global_step": 4237, "epoch": 100} {"train_loss": -4.346307754516602, "global_step": 4238, "epoch": 100} {"train_loss": -4.198936462402344, "global_step": 4239, "epoch": 100} {"train_loss": -4.251832008361816, "global_step": 4240, "epoch": 100} {"train_loss": -4.334789752960205, "global_step": 4241, "epoch": 100, "train/sim_max_reward_0": 0.2663184084241821, "train/sim_max_reward_1": 0.0006754812217992413, "train/sim_max_reward_2": 0.05073832239570286, "train/sim_max_reward_3": 0.13769413585118084, "train/sim_max_reward_4": 0.2033812624107625, "train/sim_max_reward_5": 0.5754598474433827, "test/sim_max_reward_4500000": 0.3400451299650631, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.22039670142419063, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.2811617100750341, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.059829530371475606, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.13551956320027128, "test/sim_max_reward_4500014": 0.16561182130584123, "test/sim_max_reward_4500015": 0.062209148951694965, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.32124641078587135, "test/sim_max_reward_4500018": 0.004249031229020703, "test/sim_max_reward_4500019": 0.39496762743265895, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.35046980546662604, "test/sim_max_reward_4500022": 0.33035368716497726, "test/sim_max_reward_4500023": 0.4535015697313158, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.5413558040758131, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.04163460642148004, "test/sim_max_reward_4500030": 0.2501613533633418, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.00018337792502951656, "test/sim_max_reward_4500034": 0.08044736633806474, "test/sim_max_reward_4500035": 0.0779606034003907, "test/sim_max_reward_4500036": 0.02257956182935472, "test/sim_max_reward_4500037": 0.1449618251191584, "test/sim_max_reward_4500038": 0.5151334427258505, "test/sim_max_reward_4500039": 0.02236379928361599, "test/sim_max_reward_4500040": 0.19959554609322575, "test/sim_max_reward_4500041": 0.4551139684788236, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.1175735103924684, "test/sim_max_reward_4500046": 0.24261987744140182, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.20571124295783505, "test/mean_score": 0.12324929052794852, "val_loss": 113667.0546875} {"train_loss": -4.068650722503662, "global_step": 4242, "epoch": 101} {"train_loss": -4.319967746734619, "global_step": 4243, "epoch": 101} {"train_loss": -4.355038642883301, "global_step": 4244, "epoch": 101} {"train_loss": -4.07024621963501, "global_step": 4245, "epoch": 101} {"train_loss": -4.3313751220703125, "global_step": 4246, "epoch": 101} {"train_loss": -4.239645957946777, "global_step": 4247, "epoch": 101} {"train_loss": -4.311656475067139, "global_step": 4248, "epoch": 101} {"train_loss": -4.325130462646484, "global_step": 4249, "epoch": 101} {"train_loss": -4.262801647186279, "global_step": 4250, "epoch": 101} {"train_loss": -4.412492752075195, "global_step": 4251, "epoch": 101} {"train_loss": -4.285222053527832, "global_step": 4252, "epoch": 101} {"train_loss": -4.376177787780762, "global_step": 4253, "epoch": 101} {"train_loss": -4.3734869956970215, "global_step": 4254, "epoch": 101} {"train_loss": -4.408099174499512, "global_step": 4255, "epoch": 101} {"train_loss": -4.306443214416504, "global_step": 4256, "epoch": 101} {"train_loss": -4.362790107727051, "global_step": 4257, "epoch": 101} {"train_loss": -4.398306846618652, "global_step": 4258, "epoch": 101} {"train_loss": -4.303153038024902, "global_step": 4259, "epoch": 101} {"train_loss": -4.332643508911133, "global_step": 4260, "epoch": 101} {"train_loss": -4.512664794921875, "global_step": 4261, "epoch": 101} {"train_loss": -4.427881240844727, "global_step": 4262, "epoch": 101} {"train_loss": -4.337841987609863, "global_step": 4263, "epoch": 101} {"train_loss": -4.4807000160217285, "global_step": 4264, "epoch": 101} {"train_loss": -4.407229423522949, "global_step": 4265, "epoch": 101} {"train_loss": -4.2971086502075195, "global_step": 4266, "epoch": 101} {"train_loss": -4.463112831115723, "global_step": 4267, "epoch": 101} {"train_loss": -4.401123046875, "global_step": 4268, "epoch": 101} {"train_loss": -4.349592208862305, "global_step": 4269, "epoch": 101} {"train_loss": -4.371822357177734, "global_step": 4270, "epoch": 101} {"train_loss": -4.356986045837402, "global_step": 4271, "epoch": 101} {"train_loss": -4.48937463760376, "global_step": 4272, "epoch": 101} {"train_loss": -4.457100868225098, "global_step": 4273, "epoch": 101} {"train_loss": -4.404147148132324, "global_step": 4274, "epoch": 101} {"train_loss": -4.3754048347473145, "global_step": 4275, "epoch": 101} {"train_loss": -4.241237640380859, "global_step": 4276, "epoch": 101} {"train_loss": -4.380240440368652, "global_step": 4277, "epoch": 101} {"train_loss": -4.455766677856445, "global_step": 4278, "epoch": 101} {"train_loss": -4.360827445983887, "global_step": 4279, "epoch": 101} {"train_loss": -4.406035900115967, "global_step": 4280, "epoch": 101} {"train_loss": -4.427863597869873, "global_step": 4281, "epoch": 101} {"train_loss": -4.507411003112793, "global_step": 4282, "epoch": 101} {"train_loss": -4.360403946467808, "global_step": 4283, "epoch": 101, "val_loss": 108837.7578125} {"train_loss": -4.4139180183410645, "global_step": 4284, "epoch": 102} {"train_loss": -4.504177093505859, "global_step": 4285, "epoch": 102} {"train_loss": -4.37690544128418, "global_step": 4286, "epoch": 102} {"train_loss": -4.319903373718262, "global_step": 4287, "epoch": 102} {"train_loss": -4.445312023162842, "global_step": 4288, "epoch": 102} {"train_loss": -4.469334125518799, "global_step": 4289, "epoch": 102} {"train_loss": -4.400343894958496, "global_step": 4290, "epoch": 102} {"train_loss": -4.382494926452637, "global_step": 4291, "epoch": 102} {"train_loss": -4.49956750869751, "global_step": 4292, "epoch": 102} {"train_loss": -4.247615337371826, "global_step": 4293, "epoch": 102} {"train_loss": -4.337298393249512, "global_step": 4294, "epoch": 102} {"train_loss": -4.453156471252441, "global_step": 4295, "epoch": 102} {"train_loss": -4.338076114654541, "global_step": 4296, "epoch": 102} {"train_loss": -4.112781524658203, "global_step": 4297, "epoch": 102} {"train_loss": -4.307662487030029, "global_step": 4298, "epoch": 102} {"train_loss": -4.286373138427734, "global_step": 4299, "epoch": 102} {"train_loss": -4.333226680755615, "global_step": 4300, "epoch": 102} {"train_loss": -4.3267011642456055, "global_step": 4301, "epoch": 102} {"train_loss": -4.1157989501953125, "global_step": 4302, "epoch": 102} {"train_loss": -4.25456428527832, "global_step": 4303, "epoch": 102} {"train_loss": -4.195069313049316, "global_step": 4304, "epoch": 102} {"train_loss": -4.2350568771362305, "global_step": 4305, "epoch": 102} {"train_loss": -4.120817184448242, "global_step": 4306, "epoch": 102} {"train_loss": -4.2722930908203125, "global_step": 4307, "epoch": 102} {"train_loss": -4.196898460388184, "global_step": 4308, "epoch": 102} {"train_loss": -4.402352333068848, "global_step": 4309, "epoch": 102} {"train_loss": -4.133965492248535, "global_step": 4310, "epoch": 102} {"train_loss": -4.086488246917725, "global_step": 4311, "epoch": 102} {"train_loss": -4.284870147705078, "global_step": 4312, "epoch": 102} {"train_loss": -4.470330238342285, "global_step": 4313, "epoch": 102} {"train_loss": -4.180004596710205, "global_step": 4314, "epoch": 102} {"train_loss": -4.267208099365234, "global_step": 4315, "epoch": 102} {"train_loss": -4.253145217895508, "global_step": 4316, "epoch": 102} {"train_loss": -4.407959938049316, "global_step": 4317, "epoch": 102} {"train_loss": -4.44283390045166, "global_step": 4318, "epoch": 102} {"train_loss": -4.334457874298096, "global_step": 4319, "epoch": 102} {"train_loss": -4.288177490234375, "global_step": 4320, "epoch": 102} {"train_loss": -4.261499881744385, "global_step": 4321, "epoch": 102} {"train_loss": -4.452881813049316, "global_step": 4322, "epoch": 102} {"train_loss": -4.294241905212402, "global_step": 4323, "epoch": 102} {"train_loss": -4.2979512214660645, "global_step": 4324, "epoch": 102} {"train_loss": -4.314279420035226, "global_step": 4325, "epoch": 102, "val_loss": 107137.5859375} {"train_loss": -4.4534759521484375, "global_step": 4326, "epoch": 103} {"train_loss": -4.485310077667236, "global_step": 4327, "epoch": 103} {"train_loss": -4.3698601722717285, "global_step": 4328, "epoch": 103} {"train_loss": -4.400821685791016, "global_step": 4329, "epoch": 103} {"train_loss": -4.362351894378662, "global_step": 4330, "epoch": 103} {"train_loss": -4.369605541229248, "global_step": 4331, "epoch": 103} {"train_loss": -4.449521064758301, "global_step": 4332, "epoch": 103} {"train_loss": -4.522451400756836, "global_step": 4333, "epoch": 103} {"train_loss": -4.274741172790527, "global_step": 4334, "epoch": 103} {"train_loss": -4.357815742492676, "global_step": 4335, "epoch": 103} {"train_loss": -4.463715076446533, "global_step": 4336, "epoch": 103} {"train_loss": -4.343783855438232, "global_step": 4337, "epoch": 103} {"train_loss": -4.328460693359375, "global_step": 4338, "epoch": 103} {"train_loss": -4.291324138641357, "global_step": 4339, "epoch": 103} {"train_loss": -4.2500152587890625, "global_step": 4340, "epoch": 103} {"train_loss": -4.098027229309082, "global_step": 4341, "epoch": 103} {"train_loss": -4.026252269744873, "global_step": 4342, "epoch": 103} {"train_loss": -3.819016933441162, "global_step": 4343, "epoch": 103} {"train_loss": -3.740225315093994, "global_step": 4344, "epoch": 103} {"train_loss": -4.274260520935059, "global_step": 4345, "epoch": 103} {"train_loss": -4.089034080505371, "global_step": 4346, "epoch": 103} {"train_loss": -3.985853672027588, "global_step": 4347, "epoch": 103} {"train_loss": -4.298860549926758, "global_step": 4348, "epoch": 103} {"train_loss": -4.0026655197143555, "global_step": 4349, "epoch": 103} {"train_loss": -4.221590042114258, "global_step": 4350, "epoch": 103} {"train_loss": -4.084667205810547, "global_step": 4351, "epoch": 103} {"train_loss": -4.354851722717285, "global_step": 4352, "epoch": 103} {"train_loss": -4.282071590423584, "global_step": 4353, "epoch": 103} {"train_loss": -4.155622959136963, "global_step": 4354, "epoch": 103} {"train_loss": -4.437464237213135, "global_step": 4355, "epoch": 103} {"train_loss": -4.2470245361328125, "global_step": 4356, "epoch": 103} {"train_loss": -4.393327713012695, "global_step": 4357, "epoch": 103} {"train_loss": -4.241221904754639, "global_step": 4358, "epoch": 103} {"train_loss": -4.443076133728027, "global_step": 4359, "epoch": 103} {"train_loss": -4.245379447937012, "global_step": 4360, "epoch": 103} {"train_loss": -4.192007064819336, "global_step": 4361, "epoch": 103} {"train_loss": -4.265608787536621, "global_step": 4362, "epoch": 103} {"train_loss": -4.377934455871582, "global_step": 4363, "epoch": 103} {"train_loss": -4.208850860595703, "global_step": 4364, "epoch": 103} {"train_loss": -4.390469551086426, "global_step": 4365, "epoch": 103} {"train_loss": -4.230630397796631, "global_step": 4366, "epoch": 103} {"train_loss": -4.268906093779064, "global_step": 4367, "epoch": 103, "val_loss": 106463.0546875} {"train_loss": -4.303318500518799, "global_step": 4368, "epoch": 104} {"train_loss": -4.431926727294922, "global_step": 4369, "epoch": 104} {"train_loss": -4.300702095031738, "global_step": 4370, "epoch": 104} {"train_loss": -4.37790584564209, "global_step": 4371, "epoch": 104} {"train_loss": -4.434905052185059, "global_step": 4372, "epoch": 104} {"train_loss": -4.424961090087891, "global_step": 4373, "epoch": 104} {"train_loss": -4.370822429656982, "global_step": 4374, "epoch": 104} {"train_loss": -4.527637004852295, "global_step": 4375, "epoch": 104} {"train_loss": -4.503321647644043, "global_step": 4376, "epoch": 104} {"train_loss": -4.434131622314453, "global_step": 4377, "epoch": 104} {"train_loss": -4.412565231323242, "global_step": 4378, "epoch": 104} {"train_loss": -4.570271015167236, "global_step": 4379, "epoch": 104} {"train_loss": -4.5724778175354, "global_step": 4380, "epoch": 104} {"train_loss": -4.394484519958496, "global_step": 4381, "epoch": 104} {"train_loss": -4.575883865356445, "global_step": 4382, "epoch": 104} {"train_loss": -4.432959079742432, "global_step": 4383, "epoch": 104} {"train_loss": -4.4647932052612305, "global_step": 4384, "epoch": 104} {"train_loss": -4.398107051849365, "global_step": 4385, "epoch": 104} {"train_loss": -4.49698543548584, "global_step": 4386, "epoch": 104} {"train_loss": -4.350090026855469, "global_step": 4387, "epoch": 104} {"train_loss": -4.368890762329102, "global_step": 4388, "epoch": 104} {"train_loss": -4.492504596710205, "global_step": 4389, "epoch": 104} {"train_loss": -4.406003475189209, "global_step": 4390, "epoch": 104} {"train_loss": -4.304690361022949, "global_step": 4391, "epoch": 104} {"train_loss": -4.369724750518799, "global_step": 4392, "epoch": 104} {"train_loss": -4.42520809173584, "global_step": 4393, "epoch": 104} {"train_loss": -4.526843070983887, "global_step": 4394, "epoch": 104} {"train_loss": -4.433736801147461, "global_step": 4395, "epoch": 104} {"train_loss": -4.450597286224365, "global_step": 4396, "epoch": 104} {"train_loss": -4.454183578491211, "global_step": 4397, "epoch": 104} {"train_loss": -4.359230041503906, "global_step": 4398, "epoch": 104} {"train_loss": -4.39040994644165, "global_step": 4399, "epoch": 104} {"train_loss": -4.575472831726074, "global_step": 4400, "epoch": 104} {"train_loss": -4.34913969039917, "global_step": 4401, "epoch": 104} {"train_loss": -4.518741607666016, "global_step": 4402, "epoch": 104} {"train_loss": -4.454244136810303, "global_step": 4403, "epoch": 104} {"train_loss": -4.373262405395508, "global_step": 4404, "epoch": 104} {"train_loss": -4.421415328979492, "global_step": 4405, "epoch": 104} {"train_loss": -4.488829612731934, "global_step": 4406, "epoch": 104} {"train_loss": -4.319012641906738, "global_step": 4407, "epoch": 104} {"train_loss": -4.444944381713867, "global_step": 4408, "epoch": 104} {"train_loss": -4.43396578516279, "global_step": 4409, "epoch": 104, "val_loss": 105841.109375} {"train_loss": -4.52997350692749, "global_step": 4410, "epoch": 105} {"train_loss": -4.459052085876465, "global_step": 4411, "epoch": 105} {"train_loss": -4.558811187744141, "global_step": 4412, "epoch": 105} {"train_loss": -4.491910934448242, "global_step": 4413, "epoch": 105} {"train_loss": -4.578478813171387, "global_step": 4414, "epoch": 105} {"train_loss": -4.390750885009766, "global_step": 4415, "epoch": 105} {"train_loss": -4.470806121826172, "global_step": 4416, "epoch": 105} {"train_loss": -4.410403728485107, "global_step": 4417, "epoch": 105} {"train_loss": -4.425538063049316, "global_step": 4418, "epoch": 105} {"train_loss": -4.439126014709473, "global_step": 4419, "epoch": 105} {"train_loss": -4.524707794189453, "global_step": 4420, "epoch": 105} {"train_loss": -4.4048027992248535, "global_step": 4421, "epoch": 105} {"train_loss": -4.471146583557129, "global_step": 4422, "epoch": 105} {"train_loss": -4.417089462280273, "global_step": 4423, "epoch": 105} {"train_loss": -4.551982402801514, "global_step": 4424, "epoch": 105} {"train_loss": -4.5629167556762695, "global_step": 4425, "epoch": 105} {"train_loss": -4.619641304016113, "global_step": 4426, "epoch": 105} {"train_loss": -4.389245986938477, "global_step": 4427, "epoch": 105} {"train_loss": -4.481908798217773, "global_step": 4428, "epoch": 105} {"train_loss": -4.496614933013916, "global_step": 4429, "epoch": 105} {"train_loss": -4.47084903717041, "global_step": 4430, "epoch": 105} {"train_loss": -4.393388748168945, "global_step": 4431, "epoch": 105} {"train_loss": -4.451375961303711, "global_step": 4432, "epoch": 105} {"train_loss": -4.399710655212402, "global_step": 4433, "epoch": 105} {"train_loss": -4.018028259277344, "global_step": 4434, "epoch": 105} {"train_loss": -4.268385410308838, "global_step": 4435, "epoch": 105} {"train_loss": -4.29042387008667, "global_step": 4436, "epoch": 105} {"train_loss": -3.878025770187378, "global_step": 4437, "epoch": 105} {"train_loss": -4.373294830322266, "global_step": 4438, "epoch": 105} {"train_loss": -3.6673483848571777, "global_step": 4439, "epoch": 105} {"train_loss": -3.7174010276794434, "global_step": 4440, "epoch": 105} {"train_loss": -3.9917471408843994, "global_step": 4441, "epoch": 105} {"train_loss": -3.8633170127868652, "global_step": 4442, "epoch": 105} {"train_loss": -4.075868129730225, "global_step": 4443, "epoch": 105} {"train_loss": -3.8750839233398438, "global_step": 4444, "epoch": 105} {"train_loss": -4.161062717437744, "global_step": 4445, "epoch": 105} {"train_loss": -4.159489154815674, "global_step": 4446, "epoch": 105} {"train_loss": -4.023283958435059, "global_step": 4447, "epoch": 105} {"train_loss": -4.209028244018555, "global_step": 4448, "epoch": 105} {"train_loss": -4.002107620239258, "global_step": 4449, "epoch": 105} {"train_loss": -4.08920431137085, "global_step": 4450, "epoch": 105} {"train_loss": -4.290670656022572, "global_step": 4451, "epoch": 105, "val_loss": 107115.1796875} {"train_loss": -4.304608345031738, "global_step": 4452, "epoch": 106} {"train_loss": -4.023554801940918, "global_step": 4453, "epoch": 106} {"train_loss": -4.072882652282715, "global_step": 4454, "epoch": 106} {"train_loss": -4.206649303436279, "global_step": 4455, "epoch": 106} {"train_loss": -4.178978443145752, "global_step": 4456, "epoch": 106} {"train_loss": -4.218651294708252, "global_step": 4457, "epoch": 106} {"train_loss": -4.456329345703125, "global_step": 4458, "epoch": 106} {"train_loss": -4.349186897277832, "global_step": 4459, "epoch": 106} {"train_loss": -4.298890113830566, "global_step": 4460, "epoch": 106} {"train_loss": -4.427435874938965, "global_step": 4461, "epoch": 106} {"train_loss": -4.345110893249512, "global_step": 4462, "epoch": 106} {"train_loss": -4.227513313293457, "global_step": 4463, "epoch": 106} {"train_loss": -4.46075439453125, "global_step": 4464, "epoch": 106} {"train_loss": -4.403800964355469, "global_step": 4465, "epoch": 106} {"train_loss": -4.354704856872559, "global_step": 4466, "epoch": 106} {"train_loss": -4.456019878387451, "global_step": 4467, "epoch": 106} {"train_loss": -4.424694061279297, "global_step": 4468, "epoch": 106} {"train_loss": -4.438009262084961, "global_step": 4469, "epoch": 106} {"train_loss": -4.368664741516113, "global_step": 4470, "epoch": 106} {"train_loss": -4.190727710723877, "global_step": 4471, "epoch": 106} {"train_loss": -4.001279354095459, "global_step": 4472, "epoch": 106} {"train_loss": -4.16799259185791, "global_step": 4473, "epoch": 106} {"train_loss": -4.371262550354004, "global_step": 4474, "epoch": 106} {"train_loss": -4.366457939147949, "global_step": 4475, "epoch": 106} {"train_loss": -4.172102928161621, "global_step": 4476, "epoch": 106} {"train_loss": -4.399722099304199, "global_step": 4477, "epoch": 106} {"train_loss": -4.476668357849121, "global_step": 4478, "epoch": 106} {"train_loss": -4.263313293457031, "global_step": 4479, "epoch": 106} {"train_loss": -4.446545600891113, "global_step": 4480, "epoch": 106} {"train_loss": -4.477693557739258, "global_step": 4481, "epoch": 106} {"train_loss": -4.293022155761719, "global_step": 4482, "epoch": 106} {"train_loss": -4.301218032836914, "global_step": 4483, "epoch": 106} {"train_loss": -4.4296674728393555, "global_step": 4484, "epoch": 106} {"train_loss": -4.382106781005859, "global_step": 4485, "epoch": 106} {"train_loss": -4.355788230895996, "global_step": 4486, "epoch": 106} {"train_loss": -4.352081775665283, "global_step": 4487, "epoch": 106} {"train_loss": -4.368686199188232, "global_step": 4488, "epoch": 106} {"train_loss": -4.366530418395996, "global_step": 4489, "epoch": 106} {"train_loss": -4.427138328552246, "global_step": 4490, "epoch": 106} {"train_loss": -4.4614787101745605, "global_step": 4491, "epoch": 106} {"train_loss": -4.49027156829834, "global_step": 4492, "epoch": 106} {"train_loss": -4.335403533208938, "global_step": 4493, "epoch": 106, "val_loss": 104936.6640625} {"train_loss": -4.4948835372924805, "global_step": 4494, "epoch": 107} {"train_loss": -4.348404884338379, "global_step": 4495, "epoch": 107} {"train_loss": -4.299173831939697, "global_step": 4496, "epoch": 107} {"train_loss": -4.401371002197266, "global_step": 4497, "epoch": 107} {"train_loss": -4.521778583526611, "global_step": 4498, "epoch": 107} {"train_loss": -4.6086931228637695, "global_step": 4499, "epoch": 107} {"train_loss": -4.484133720397949, "global_step": 4500, "epoch": 107} {"train_loss": -4.507976531982422, "global_step": 4501, "epoch": 107} {"train_loss": -4.5245161056518555, "global_step": 4502, "epoch": 107} {"train_loss": -4.442105293273926, "global_step": 4503, "epoch": 107} {"train_loss": -4.342135429382324, "global_step": 4504, "epoch": 107} {"train_loss": -4.377936840057373, "global_step": 4505, "epoch": 107} {"train_loss": -4.228343486785889, "global_step": 4506, "epoch": 107} {"train_loss": -4.338652610778809, "global_step": 4507, "epoch": 107} {"train_loss": -4.434749126434326, "global_step": 4508, "epoch": 107} {"train_loss": -4.223334312438965, "global_step": 4509, "epoch": 107} {"train_loss": -4.285384178161621, "global_step": 4510, "epoch": 107} {"train_loss": -4.454267501831055, "global_step": 4511, "epoch": 107} {"train_loss": -4.411782264709473, "global_step": 4512, "epoch": 107} {"train_loss": -4.3386993408203125, "global_step": 4513, "epoch": 107} {"train_loss": -4.552486419677734, "global_step": 4514, "epoch": 107} {"train_loss": -4.474907398223877, "global_step": 4515, "epoch": 107} {"train_loss": -4.251307487487793, "global_step": 4516, "epoch": 107} {"train_loss": -4.602914810180664, "global_step": 4517, "epoch": 107} {"train_loss": -4.475488662719727, "global_step": 4518, "epoch": 107} {"train_loss": -4.442606449127197, "global_step": 4519, "epoch": 107} {"train_loss": -4.470538139343262, "global_step": 4520, "epoch": 107} {"train_loss": -4.292407989501953, "global_step": 4521, "epoch": 107} {"train_loss": -4.423810958862305, "global_step": 4522, "epoch": 107} {"train_loss": -4.348711013793945, "global_step": 4523, "epoch": 107} {"train_loss": -4.515915870666504, "global_step": 4524, "epoch": 107} {"train_loss": -4.40472412109375, "global_step": 4525, "epoch": 107} {"train_loss": -4.51445198059082, "global_step": 4526, "epoch": 107} {"train_loss": -4.525157928466797, "global_step": 4527, "epoch": 107} {"train_loss": -4.386408805847168, "global_step": 4528, "epoch": 107} {"train_loss": -4.399094104766846, "global_step": 4529, "epoch": 107} {"train_loss": -4.435925483703613, "global_step": 4530, "epoch": 107} {"train_loss": -4.394952297210693, "global_step": 4531, "epoch": 107} {"train_loss": -4.634720802307129, "global_step": 4532, "epoch": 107} {"train_loss": -4.4369306564331055, "global_step": 4533, "epoch": 107} {"train_loss": -4.537715911865234, "global_step": 4534, "epoch": 107} {"train_loss": -4.427355720883324, "global_step": 4535, "epoch": 107, "val_loss": 105278.921875} {"train_loss": -4.445321559906006, "global_step": 4536, "epoch": 108} {"train_loss": -4.349799156188965, "global_step": 4537, "epoch": 108} {"train_loss": -4.525378704071045, "global_step": 4538, "epoch": 108} {"train_loss": -4.454082489013672, "global_step": 4539, "epoch": 108} {"train_loss": -4.481988906860352, "global_step": 4540, "epoch": 108} {"train_loss": -4.496259689331055, "global_step": 4541, "epoch": 108} {"train_loss": -4.5374603271484375, "global_step": 4542, "epoch": 108} {"train_loss": -4.338997840881348, "global_step": 4543, "epoch": 108} {"train_loss": -4.53218412399292, "global_step": 4544, "epoch": 108} {"train_loss": -4.581354141235352, "global_step": 4545, "epoch": 108} {"train_loss": -4.437273025512695, "global_step": 4546, "epoch": 108} {"train_loss": -4.501913547515869, "global_step": 4547, "epoch": 108} {"train_loss": -4.392333030700684, "global_step": 4548, "epoch": 108} {"train_loss": -4.457432746887207, "global_step": 4549, "epoch": 108} {"train_loss": -4.422147750854492, "global_step": 4550, "epoch": 108} {"train_loss": -4.341790676116943, "global_step": 4551, "epoch": 108} {"train_loss": -4.594130039215088, "global_step": 4552, "epoch": 108} {"train_loss": -4.505214691162109, "global_step": 4553, "epoch": 108} {"train_loss": -4.210762977600098, "global_step": 4554, "epoch": 108} {"train_loss": -4.456520080566406, "global_step": 4555, "epoch": 108} {"train_loss": -4.4012064933776855, "global_step": 4556, "epoch": 108} {"train_loss": -4.557553768157959, "global_step": 4557, "epoch": 108} {"train_loss": -4.537727355957031, "global_step": 4558, "epoch": 108} {"train_loss": -4.461601257324219, "global_step": 4559, "epoch": 108} {"train_loss": -4.430294036865234, "global_step": 4560, "epoch": 108} {"train_loss": -4.418514251708984, "global_step": 4561, "epoch": 108} {"train_loss": -4.634796619415283, "global_step": 4562, "epoch": 108} {"train_loss": -4.4279375076293945, "global_step": 4563, "epoch": 108} {"train_loss": -4.679048538208008, "global_step": 4564, "epoch": 108} {"train_loss": -4.450263500213623, "global_step": 4565, "epoch": 108} {"train_loss": -4.476982116699219, "global_step": 4566, "epoch": 108} {"train_loss": -4.454640865325928, "global_step": 4567, "epoch": 108} {"train_loss": -4.447399616241455, "global_step": 4568, "epoch": 108} {"train_loss": -4.4871721267700195, "global_step": 4569, "epoch": 108} {"train_loss": -4.578248023986816, "global_step": 4570, "epoch": 108} {"train_loss": -4.513570308685303, "global_step": 4571, "epoch": 108} {"train_loss": -4.607394218444824, "global_step": 4572, "epoch": 108} {"train_loss": -4.399522304534912, "global_step": 4573, "epoch": 108} {"train_loss": -4.500582695007324, "global_step": 4574, "epoch": 108} {"train_loss": -4.6058197021484375, "global_step": 4575, "epoch": 108} {"train_loss": -4.4689788818359375, "global_step": 4576, "epoch": 108} {"train_loss": -4.477233784539359, "global_step": 4577, "epoch": 108, "val_loss": 102525.6796875} {"train_loss": -4.505548477172852, "global_step": 4578, "epoch": 109} {"train_loss": -4.518166542053223, "global_step": 4579, "epoch": 109} {"train_loss": -4.563798904418945, "global_step": 4580, "epoch": 109} {"train_loss": -4.622604846954346, "global_step": 4581, "epoch": 109} {"train_loss": -4.640883445739746, "global_step": 4582, "epoch": 109} {"train_loss": -4.602309226989746, "global_step": 4583, "epoch": 109} {"train_loss": -4.618821144104004, "global_step": 4584, "epoch": 109} {"train_loss": -4.446070671081543, "global_step": 4585, "epoch": 109} {"train_loss": -4.504189491271973, "global_step": 4586, "epoch": 109} {"train_loss": -4.483331680297852, "global_step": 4587, "epoch": 109} {"train_loss": -4.271803855895996, "global_step": 4588, "epoch": 109} {"train_loss": -4.287168979644775, "global_step": 4589, "epoch": 109} {"train_loss": -4.564492225646973, "global_step": 4590, "epoch": 109} {"train_loss": -4.590965270996094, "global_step": 4591, "epoch": 109} {"train_loss": -4.541803359985352, "global_step": 4592, "epoch": 109} {"train_loss": -4.5252227783203125, "global_step": 4593, "epoch": 109} {"train_loss": -4.465056896209717, "global_step": 4594, "epoch": 109} {"train_loss": -4.512686729431152, "global_step": 4595, "epoch": 109} {"train_loss": -4.512598991394043, "global_step": 4596, "epoch": 109} {"train_loss": -4.587233543395996, "global_step": 4597, "epoch": 109} {"train_loss": -4.547531604766846, "global_step": 4598, "epoch": 109} {"train_loss": -4.446133613586426, "global_step": 4599, "epoch": 109} {"train_loss": -4.377003192901611, "global_step": 4600, "epoch": 109} {"train_loss": -4.597023963928223, "global_step": 4601, "epoch": 109} {"train_loss": -4.533343315124512, "global_step": 4602, "epoch": 109} {"train_loss": -4.393085956573486, "global_step": 4603, "epoch": 109} {"train_loss": -4.6599884033203125, "global_step": 4604, "epoch": 109} {"train_loss": -4.5157060623168945, "global_step": 4605, "epoch": 109} {"train_loss": -4.510139465332031, "global_step": 4606, "epoch": 109} {"train_loss": -4.575163841247559, "global_step": 4607, "epoch": 109} {"train_loss": -4.50778865814209, "global_step": 4608, "epoch": 109} {"train_loss": -4.404392242431641, "global_step": 4609, "epoch": 109} {"train_loss": -4.367218017578125, "global_step": 4610, "epoch": 109} {"train_loss": -4.337251663208008, "global_step": 4611, "epoch": 109} {"train_loss": -4.471832275390625, "global_step": 4612, "epoch": 109} {"train_loss": -4.359772205352783, "global_step": 4613, "epoch": 109} {"train_loss": -4.349639415740967, "global_step": 4614, "epoch": 109} {"train_loss": -4.369855880737305, "global_step": 4615, "epoch": 109} {"train_loss": -4.435564041137695, "global_step": 4616, "epoch": 109} {"train_loss": -4.407846450805664, "global_step": 4617, "epoch": 109} {"train_loss": -4.4165940284729, "global_step": 4618, "epoch": 109} {"train_loss": -4.483220384234474, "global_step": 4619, "epoch": 109, "val_loss": 100953.3359375} {"train_loss": -4.655296802520752, "global_step": 4620, "epoch": 110} {"train_loss": -4.3105788230896, "global_step": 4621, "epoch": 110} {"train_loss": -4.548229694366455, "global_step": 4622, "epoch": 110} {"train_loss": -4.563350677490234, "global_step": 4623, "epoch": 110} {"train_loss": -4.439994812011719, "global_step": 4624, "epoch": 110} {"train_loss": -4.5627570152282715, "global_step": 4625, "epoch": 110} {"train_loss": -4.527427673339844, "global_step": 4626, "epoch": 110} {"train_loss": -4.601102828979492, "global_step": 4627, "epoch": 110} {"train_loss": -4.438028335571289, "global_step": 4628, "epoch": 110} {"train_loss": -4.358248710632324, "global_step": 4629, "epoch": 110} {"train_loss": -4.421746253967285, "global_step": 4630, "epoch": 110} {"train_loss": -4.381598472595215, "global_step": 4631, "epoch": 110} {"train_loss": -4.5557026863098145, "global_step": 4632, "epoch": 110} {"train_loss": -4.584450721740723, "global_step": 4633, "epoch": 110} {"train_loss": -4.4995880126953125, "global_step": 4634, "epoch": 110} {"train_loss": -4.512444496154785, "global_step": 4635, "epoch": 110} {"train_loss": -4.489938735961914, "global_step": 4636, "epoch": 110} {"train_loss": -4.53095817565918, "global_step": 4637, "epoch": 110} {"train_loss": -4.71371603012085, "global_step": 4638, "epoch": 110} {"train_loss": -4.545891761779785, "global_step": 4639, "epoch": 110} {"train_loss": -4.469343185424805, "global_step": 4640, "epoch": 110} {"train_loss": -4.5334014892578125, "global_step": 4641, "epoch": 110} {"train_loss": -4.604116916656494, "global_step": 4642, "epoch": 110} {"train_loss": -4.565896987915039, "global_step": 4643, "epoch": 110} {"train_loss": -4.519880294799805, "global_step": 4644, "epoch": 110} {"train_loss": -4.443259239196777, "global_step": 4645, "epoch": 110} {"train_loss": -4.5383992195129395, "global_step": 4646, "epoch": 110} {"train_loss": -4.463795185089111, "global_step": 4647, "epoch": 110} {"train_loss": -4.583894729614258, "global_step": 4648, "epoch": 110} {"train_loss": -4.589181900024414, "global_step": 4649, "epoch": 110} {"train_loss": -4.514007568359375, "global_step": 4650, "epoch": 110} {"train_loss": -4.468563079833984, "global_step": 4651, "epoch": 110} {"train_loss": -4.401776313781738, "global_step": 4652, "epoch": 110} {"train_loss": -4.16210412979126, "global_step": 4653, "epoch": 110} {"train_loss": -4.259832859039307, "global_step": 4654, "epoch": 110} {"train_loss": -4.411225318908691, "global_step": 4655, "epoch": 110} {"train_loss": -3.8391947746276855, "global_step": 4656, "epoch": 110} {"train_loss": -4.257882118225098, "global_step": 4657, "epoch": 110} {"train_loss": -4.146981716156006, "global_step": 4658, "epoch": 110} {"train_loss": -4.3661651611328125, "global_step": 4659, "epoch": 110} {"train_loss": -4.0503129959106445, "global_step": 4660, "epoch": 110} {"train_loss": -4.43528417746226, "global_step": 4661, "epoch": 110, "val_loss": 103925.2109375} {"train_loss": -4.084845542907715, "global_step": 4662, "epoch": 111} {"train_loss": -3.9198241233825684, "global_step": 4663, "epoch": 111} {"train_loss": -4.1724653244018555, "global_step": 4664, "epoch": 111} {"train_loss": -4.069527626037598, "global_step": 4665, "epoch": 111} {"train_loss": -4.15036678314209, "global_step": 4666, "epoch": 111} {"train_loss": -4.1904988288879395, "global_step": 4667, "epoch": 111} {"train_loss": -4.223424434661865, "global_step": 4668, "epoch": 111} {"train_loss": -4.310063362121582, "global_step": 4669, "epoch": 111} {"train_loss": -4.159353733062744, "global_step": 4670, "epoch": 111} {"train_loss": -4.266810417175293, "global_step": 4671, "epoch": 111} {"train_loss": -4.3232831954956055, "global_step": 4672, "epoch": 111} {"train_loss": -4.307304859161377, "global_step": 4673, "epoch": 111} {"train_loss": -4.3966569900512695, "global_step": 4674, "epoch": 111} {"train_loss": -4.257233142852783, "global_step": 4675, "epoch": 111} {"train_loss": -4.264604568481445, "global_step": 4676, "epoch": 111} {"train_loss": -4.408867835998535, "global_step": 4677, "epoch": 111} {"train_loss": -4.320077419281006, "global_step": 4678, "epoch": 111} {"train_loss": -4.520174026489258, "global_step": 4679, "epoch": 111} {"train_loss": -4.371073246002197, "global_step": 4680, "epoch": 111} {"train_loss": -4.439898490905762, "global_step": 4681, "epoch": 111} {"train_loss": -4.508580207824707, "global_step": 4682, "epoch": 111} {"train_loss": -4.382333755493164, "global_step": 4683, "epoch": 111} {"train_loss": -4.4291582107543945, "global_step": 4684, "epoch": 111} {"train_loss": -4.47310733795166, "global_step": 4685, "epoch": 111} {"train_loss": -4.393418312072754, "global_step": 4686, "epoch": 111} {"train_loss": -4.538257598876953, "global_step": 4687, "epoch": 111} {"train_loss": -4.541311264038086, "global_step": 4688, "epoch": 111} {"train_loss": -4.446367263793945, "global_step": 4689, "epoch": 111} {"train_loss": -4.48574686050415, "global_step": 4690, "epoch": 111} {"train_loss": -4.70267391204834, "global_step": 4691, "epoch": 111} {"train_loss": -4.393104076385498, "global_step": 4692, "epoch": 111} {"train_loss": -4.496442794799805, "global_step": 4693, "epoch": 111} {"train_loss": -4.449187755584717, "global_step": 4694, "epoch": 111} {"train_loss": -4.5188140869140625, "global_step": 4695, "epoch": 111} {"train_loss": -4.413825035095215, "global_step": 4696, "epoch": 111} {"train_loss": -4.409862518310547, "global_step": 4697, "epoch": 111} {"train_loss": -4.5661420822143555, "global_step": 4698, "epoch": 111} {"train_loss": -4.455243110656738, "global_step": 4699, "epoch": 111} {"train_loss": -4.513401985168457, "global_step": 4700, "epoch": 111} {"train_loss": -4.511537551879883, "global_step": 4701, "epoch": 111} {"train_loss": -4.474981307983398, "global_step": 4702, "epoch": 111} {"train_loss": -4.376623744056339, "global_step": 4703, "epoch": 111, "val_loss": 101280.953125} {"train_loss": -4.60002326965332, "global_step": 4704, "epoch": 112} {"train_loss": -4.277918338775635, "global_step": 4705, "epoch": 112} {"train_loss": -4.530928611755371, "global_step": 4706, "epoch": 112} {"train_loss": -4.765979766845703, "global_step": 4707, "epoch": 112} {"train_loss": -4.347562789916992, "global_step": 4708, "epoch": 112} {"train_loss": -4.292994976043701, "global_step": 4709, "epoch": 112} {"train_loss": -4.570356369018555, "global_step": 4710, "epoch": 112} {"train_loss": -4.550998687744141, "global_step": 4711, "epoch": 112} {"train_loss": -4.403568267822266, "global_step": 4712, "epoch": 112} {"train_loss": -4.4913330078125, "global_step": 4713, "epoch": 112} {"train_loss": -4.3918070793151855, "global_step": 4714, "epoch": 112} {"train_loss": -4.204835891723633, "global_step": 4715, "epoch": 112} {"train_loss": -4.445587158203125, "global_step": 4716, "epoch": 112} {"train_loss": -4.371844291687012, "global_step": 4717, "epoch": 112} {"train_loss": -4.5392656326293945, "global_step": 4718, "epoch": 112} {"train_loss": -4.618608474731445, "global_step": 4719, "epoch": 112} {"train_loss": -4.405397891998291, "global_step": 4720, "epoch": 112} {"train_loss": -4.559788227081299, "global_step": 4721, "epoch": 112} {"train_loss": -4.525014877319336, "global_step": 4722, "epoch": 112} {"train_loss": -4.415915489196777, "global_step": 4723, "epoch": 112} {"train_loss": -4.498403549194336, "global_step": 4724, "epoch": 112} {"train_loss": -4.59343957901001, "global_step": 4725, "epoch": 112} {"train_loss": -4.616307258605957, "global_step": 4726, "epoch": 112} {"train_loss": -4.50660514831543, "global_step": 4727, "epoch": 112} {"train_loss": -4.5273118019104, "global_step": 4728, "epoch": 112} {"train_loss": -4.800943374633789, "global_step": 4729, "epoch": 112} {"train_loss": -4.506519794464111, "global_step": 4730, "epoch": 112} {"train_loss": -4.525202751159668, "global_step": 4731, "epoch": 112} {"train_loss": -4.605173587799072, "global_step": 4732, "epoch": 112} {"train_loss": -4.5234293937683105, "global_step": 4733, "epoch": 112} {"train_loss": -4.4196248054504395, "global_step": 4734, "epoch": 112} {"train_loss": -4.561631202697754, "global_step": 4735, "epoch": 112} {"train_loss": -4.575078010559082, "global_step": 4736, "epoch": 112} {"train_loss": -4.476226329803467, "global_step": 4737, "epoch": 112} {"train_loss": -4.4944257736206055, "global_step": 4738, "epoch": 112} {"train_loss": -4.469544410705566, "global_step": 4739, "epoch": 112} {"train_loss": -4.587645530700684, "global_step": 4740, "epoch": 112} {"train_loss": -4.410056114196777, "global_step": 4741, "epoch": 112} {"train_loss": -4.560633659362793, "global_step": 4742, "epoch": 112} {"train_loss": -4.63072395324707, "global_step": 4743, "epoch": 112} {"train_loss": -4.561356544494629, "global_step": 4744, "epoch": 112} {"train_loss": -4.506544328871227, "global_step": 4745, "epoch": 112, "val_loss": 99496.2734375} {"train_loss": -4.547691345214844, "global_step": 4746, "epoch": 113} {"train_loss": -4.561485767364502, "global_step": 4747, "epoch": 113} {"train_loss": -4.453078269958496, "global_step": 4748, "epoch": 113} {"train_loss": -4.587928771972656, "global_step": 4749, "epoch": 113} {"train_loss": -4.641801357269287, "global_step": 4750, "epoch": 113} {"train_loss": -4.631083011627197, "global_step": 4751, "epoch": 113} {"train_loss": -4.545707702636719, "global_step": 4752, "epoch": 113} {"train_loss": -4.3619890213012695, "global_step": 4753, "epoch": 113} {"train_loss": -4.6485371589660645, "global_step": 4754, "epoch": 113} {"train_loss": -4.632133483886719, "global_step": 4755, "epoch": 113} {"train_loss": -4.5706281661987305, "global_step": 4756, "epoch": 113} {"train_loss": -4.534735679626465, "global_step": 4757, "epoch": 113} {"train_loss": -4.573631286621094, "global_step": 4758, "epoch": 113} {"train_loss": -4.543647766113281, "global_step": 4759, "epoch": 113} {"train_loss": -4.562563896179199, "global_step": 4760, "epoch": 113} {"train_loss": -4.520956993103027, "global_step": 4761, "epoch": 113} {"train_loss": -4.548007965087891, "global_step": 4762, "epoch": 113} {"train_loss": -4.398728847503662, "global_step": 4763, "epoch": 113} {"train_loss": -4.367183685302734, "global_step": 4764, "epoch": 113} {"train_loss": -4.546834468841553, "global_step": 4765, "epoch": 113} {"train_loss": -4.536780834197998, "global_step": 4766, "epoch": 113} {"train_loss": -4.359491348266602, "global_step": 4767, "epoch": 113} {"train_loss": -4.37796688079834, "global_step": 4768, "epoch": 113} {"train_loss": -4.436073303222656, "global_step": 4769, "epoch": 113} {"train_loss": -4.49980354309082, "global_step": 4770, "epoch": 113} {"train_loss": -4.500429153442383, "global_step": 4771, "epoch": 113} {"train_loss": -4.515852451324463, "global_step": 4772, "epoch": 113} {"train_loss": -4.257584571838379, "global_step": 4773, "epoch": 113} {"train_loss": -4.346783638000488, "global_step": 4774, "epoch": 113} {"train_loss": -4.369202136993408, "global_step": 4775, "epoch": 113} {"train_loss": -4.412970542907715, "global_step": 4776, "epoch": 113} {"train_loss": -4.464018821716309, "global_step": 4777, "epoch": 113} {"train_loss": -4.0390472412109375, "global_step": 4778, "epoch": 113} {"train_loss": -4.393679618835449, "global_step": 4779, "epoch": 113} {"train_loss": -4.629854202270508, "global_step": 4780, "epoch": 113} {"train_loss": -4.322504043579102, "global_step": 4781, "epoch": 113} {"train_loss": -4.544510841369629, "global_step": 4782, "epoch": 113} {"train_loss": -4.434568881988525, "global_step": 4783, "epoch": 113} {"train_loss": -4.455188751220703, "global_step": 4784, "epoch": 113} {"train_loss": -4.602754592895508, "global_step": 4785, "epoch": 113} {"train_loss": -4.415344715118408, "global_step": 4786, "epoch": 113} {"train_loss": -4.483837502343314, "global_step": 4787, "epoch": 113, "val_loss": 98749.859375} {"train_loss": -4.653962135314941, "global_step": 4788, "epoch": 114} {"train_loss": -4.412755966186523, "global_step": 4789, "epoch": 114} {"train_loss": -4.573543548583984, "global_step": 4790, "epoch": 114} {"train_loss": -4.426597595214844, "global_step": 4791, "epoch": 114} {"train_loss": -4.3912129402160645, "global_step": 4792, "epoch": 114} {"train_loss": -4.398158073425293, "global_step": 4793, "epoch": 114} {"train_loss": -4.583846092224121, "global_step": 4794, "epoch": 114} {"train_loss": -4.521025657653809, "global_step": 4795, "epoch": 114} {"train_loss": -4.476408004760742, "global_step": 4796, "epoch": 114} {"train_loss": -4.6413140296936035, "global_step": 4797, "epoch": 114} {"train_loss": -4.341041088104248, "global_step": 4798, "epoch": 114} {"train_loss": -4.572719573974609, "global_step": 4799, "epoch": 114} {"train_loss": -4.603658676147461, "global_step": 4800, "epoch": 114} {"train_loss": -4.502192497253418, "global_step": 4801, "epoch": 114} {"train_loss": -4.563780784606934, "global_step": 4802, "epoch": 114} {"train_loss": -4.4768900871276855, "global_step": 4803, "epoch": 114} {"train_loss": -4.567238807678223, "global_step": 4804, "epoch": 114} {"train_loss": -4.298595428466797, "global_step": 4805, "epoch": 114} {"train_loss": -4.548874855041504, "global_step": 4806, "epoch": 114} {"train_loss": -4.580123424530029, "global_step": 4807, "epoch": 114} {"train_loss": -4.52290153503418, "global_step": 4808, "epoch": 114} {"train_loss": -4.57313346862793, "global_step": 4809, "epoch": 114} {"train_loss": -4.561266899108887, "global_step": 4810, "epoch": 114} {"train_loss": -4.578339576721191, "global_step": 4811, "epoch": 114} {"train_loss": -4.637102127075195, "global_step": 4812, "epoch": 114} {"train_loss": -4.511202812194824, "global_step": 4813, "epoch": 114} {"train_loss": -4.36919641494751, "global_step": 4814, "epoch": 114} {"train_loss": -4.512953758239746, "global_step": 4815, "epoch": 114} {"train_loss": -4.764762878417969, "global_step": 4816, "epoch": 114} {"train_loss": -4.56655216217041, "global_step": 4817, "epoch": 114} {"train_loss": -4.463105201721191, "global_step": 4818, "epoch": 114} {"train_loss": -4.538702011108398, "global_step": 4819, "epoch": 114} {"train_loss": -4.505457878112793, "global_step": 4820, "epoch": 114} {"train_loss": -4.731459617614746, "global_step": 4821, "epoch": 114} {"train_loss": -4.637355804443359, "global_step": 4822, "epoch": 114} {"train_loss": -4.583844184875488, "global_step": 4823, "epoch": 114} {"train_loss": -4.454995632171631, "global_step": 4824, "epoch": 114} {"train_loss": -4.463431358337402, "global_step": 4825, "epoch": 114} {"train_loss": -4.727237224578857, "global_step": 4826, "epoch": 114} {"train_loss": -4.6510539054870605, "global_step": 4827, "epoch": 114} {"train_loss": -4.588539123535156, "global_step": 4828, "epoch": 114} {"train_loss": -4.544336182730539, "global_step": 4829, "epoch": 114, "val_loss": 97602.984375} {"train_loss": -4.483148097991943, "global_step": 4830, "epoch": 115} {"train_loss": -4.5324554443359375, "global_step": 4831, "epoch": 115} {"train_loss": -4.551464080810547, "global_step": 4832, "epoch": 115} {"train_loss": -4.731136322021484, "global_step": 4833, "epoch": 115} {"train_loss": -4.538203239440918, "global_step": 4834, "epoch": 115} {"train_loss": -4.405782222747803, "global_step": 4835, "epoch": 115} {"train_loss": -4.504773139953613, "global_step": 4836, "epoch": 115} {"train_loss": -4.7055206298828125, "global_step": 4837, "epoch": 115} {"train_loss": -4.617849349975586, "global_step": 4838, "epoch": 115} {"train_loss": -4.4277472496032715, "global_step": 4839, "epoch": 115} {"train_loss": -4.490147113800049, "global_step": 4840, "epoch": 115} {"train_loss": -4.556001663208008, "global_step": 4841, "epoch": 115} {"train_loss": -4.4203691482543945, "global_step": 4842, "epoch": 115} {"train_loss": -4.580266952514648, "global_step": 4843, "epoch": 115} {"train_loss": -4.46914005279541, "global_step": 4844, "epoch": 115} {"train_loss": -4.319658279418945, "global_step": 4845, "epoch": 115} {"train_loss": -4.4930830001831055, "global_step": 4846, "epoch": 115} {"train_loss": -4.52335262298584, "global_step": 4847, "epoch": 115} {"train_loss": -4.406317710876465, "global_step": 4848, "epoch": 115} {"train_loss": -4.5587382316589355, "global_step": 4849, "epoch": 115} {"train_loss": -4.4116339683532715, "global_step": 4850, "epoch": 115} {"train_loss": -4.552389621734619, "global_step": 4851, "epoch": 115} {"train_loss": -4.527797222137451, "global_step": 4852, "epoch": 115} {"train_loss": -4.560704231262207, "global_step": 4853, "epoch": 115} {"train_loss": -4.439375877380371, "global_step": 4854, "epoch": 115} {"train_loss": -4.581961631774902, "global_step": 4855, "epoch": 115} {"train_loss": -4.473424911499023, "global_step": 4856, "epoch": 115} {"train_loss": -4.318990707397461, "global_step": 4857, "epoch": 115} {"train_loss": -4.502230167388916, "global_step": 4858, "epoch": 115} {"train_loss": -4.538271903991699, "global_step": 4859, "epoch": 115} {"train_loss": -4.28125, "global_step": 4860, "epoch": 115} {"train_loss": -4.381227016448975, "global_step": 4861, "epoch": 115} {"train_loss": -4.586576461791992, "global_step": 4862, "epoch": 115} {"train_loss": -4.355069160461426, "global_step": 4863, "epoch": 115} {"train_loss": -4.549955368041992, "global_step": 4864, "epoch": 115} {"train_loss": -4.495358467102051, "global_step": 4865, "epoch": 115} {"train_loss": -4.582873821258545, "global_step": 4866, "epoch": 115} {"train_loss": -4.602815628051758, "global_step": 4867, "epoch": 115} {"train_loss": -4.679152488708496, "global_step": 4868, "epoch": 115} {"train_loss": -4.5658063888549805, "global_step": 4869, "epoch": 115} {"train_loss": -4.561799049377441, "global_step": 4870, "epoch": 115} {"train_loss": -4.5101103101457864, "global_step": 4871, "epoch": 115, "val_loss": 97592.2109375} {"train_loss": -4.606661796569824, "global_step": 4872, "epoch": 116} {"train_loss": -4.697528839111328, "global_step": 4873, "epoch": 116} {"train_loss": -4.500395774841309, "global_step": 4874, "epoch": 116} {"train_loss": -4.727417945861816, "global_step": 4875, "epoch": 116} {"train_loss": -4.579286575317383, "global_step": 4876, "epoch": 116} {"train_loss": -4.607834815979004, "global_step": 4877, "epoch": 116} {"train_loss": -4.831191062927246, "global_step": 4878, "epoch": 116} {"train_loss": -4.614687919616699, "global_step": 4879, "epoch": 116} {"train_loss": -4.664607524871826, "global_step": 4880, "epoch": 116} {"train_loss": -4.742379188537598, "global_step": 4881, "epoch": 116} {"train_loss": -4.4521660804748535, "global_step": 4882, "epoch": 116} {"train_loss": -4.5500078201293945, "global_step": 4883, "epoch": 116} {"train_loss": -4.486304759979248, "global_step": 4884, "epoch": 116} {"train_loss": -4.6355085372924805, "global_step": 4885, "epoch": 116} {"train_loss": -4.651942253112793, "global_step": 4886, "epoch": 116} {"train_loss": -4.648370742797852, "global_step": 4887, "epoch": 116} {"train_loss": -4.405101776123047, "global_step": 4888, "epoch": 116} {"train_loss": -4.421618461608887, "global_step": 4889, "epoch": 116} {"train_loss": -4.67641544342041, "global_step": 4890, "epoch": 116} {"train_loss": -4.480010986328125, "global_step": 4891, "epoch": 116} {"train_loss": -4.269588470458984, "global_step": 4892, "epoch": 116} {"train_loss": -4.550848960876465, "global_step": 4893, "epoch": 116} {"train_loss": -4.571216583251953, "global_step": 4894, "epoch": 116} {"train_loss": -4.440518379211426, "global_step": 4895, "epoch": 116} {"train_loss": -4.5802531242370605, "global_step": 4896, "epoch": 116} {"train_loss": -4.429898262023926, "global_step": 4897, "epoch": 116} {"train_loss": -4.591968059539795, "global_step": 4898, "epoch": 116} {"train_loss": -4.382057189941406, "global_step": 4899, "epoch": 116} {"train_loss": -4.353872299194336, "global_step": 4900, "epoch": 116} {"train_loss": -4.544351577758789, "global_step": 4901, "epoch": 116} {"train_loss": -4.328806400299072, "global_step": 4902, "epoch": 116} {"train_loss": -4.656159400939941, "global_step": 4903, "epoch": 116} {"train_loss": -4.413685321807861, "global_step": 4904, "epoch": 116} {"train_loss": -4.50606632232666, "global_step": 4905, "epoch": 116} {"train_loss": -4.32460880279541, "global_step": 4906, "epoch": 116} {"train_loss": -4.258327007293701, "global_step": 4907, "epoch": 116} {"train_loss": -4.214107036590576, "global_step": 4908, "epoch": 116} {"train_loss": -4.586962699890137, "global_step": 4909, "epoch": 116} {"train_loss": -4.465788841247559, "global_step": 4910, "epoch": 116} {"train_loss": -4.451192855834961, "global_step": 4911, "epoch": 116} {"train_loss": -4.581742286682129, "global_step": 4912, "epoch": 116} {"train_loss": -4.517736877713885, "global_step": 4913, "epoch": 116, "val_loss": 98324.4453125} {"train_loss": -4.587933540344238, "global_step": 4914, "epoch": 117} {"train_loss": -4.556057929992676, "global_step": 4915, "epoch": 117} {"train_loss": -4.581878662109375, "global_step": 4916, "epoch": 117} {"train_loss": -4.564446449279785, "global_step": 4917, "epoch": 117} {"train_loss": -4.524230003356934, "global_step": 4918, "epoch": 117} {"train_loss": -4.558422565460205, "global_step": 4919, "epoch": 117} {"train_loss": -4.580470085144043, "global_step": 4920, "epoch": 117} {"train_loss": -4.476647853851318, "global_step": 4921, "epoch": 117} {"train_loss": -4.527597427368164, "global_step": 4922, "epoch": 117} {"train_loss": -4.565873146057129, "global_step": 4923, "epoch": 117} {"train_loss": -4.671764373779297, "global_step": 4924, "epoch": 117} {"train_loss": -4.614230632781982, "global_step": 4925, "epoch": 117} {"train_loss": -4.5955023765563965, "global_step": 4926, "epoch": 117} {"train_loss": -4.433206558227539, "global_step": 4927, "epoch": 117} {"train_loss": -4.646123886108398, "global_step": 4928, "epoch": 117} {"train_loss": -4.441471099853516, "global_step": 4929, "epoch": 117} {"train_loss": -4.551900863647461, "global_step": 4930, "epoch": 117} {"train_loss": -4.744266510009766, "global_step": 4931, "epoch": 117} {"train_loss": -4.559164047241211, "global_step": 4932, "epoch": 117} {"train_loss": -4.657046318054199, "global_step": 4933, "epoch": 117} {"train_loss": -4.66290283203125, "global_step": 4934, "epoch": 117} {"train_loss": -4.64473819732666, "global_step": 4935, "epoch": 117} {"train_loss": -4.555759429931641, "global_step": 4936, "epoch": 117} {"train_loss": -4.4519805908203125, "global_step": 4937, "epoch": 117} {"train_loss": -4.637487888336182, "global_step": 4938, "epoch": 117} {"train_loss": -4.4685587882995605, "global_step": 4939, "epoch": 117} {"train_loss": -4.507714748382568, "global_step": 4940, "epoch": 117} {"train_loss": -4.63695764541626, "global_step": 4941, "epoch": 117} {"train_loss": -4.595575332641602, "global_step": 4942, "epoch": 117} {"train_loss": -4.493585109710693, "global_step": 4943, "epoch": 117} {"train_loss": -4.605923652648926, "global_step": 4944, "epoch": 117} {"train_loss": -4.563962459564209, "global_step": 4945, "epoch": 117} {"train_loss": -4.525257587432861, "global_step": 4946, "epoch": 117} {"train_loss": -4.634476184844971, "global_step": 4947, "epoch": 117} {"train_loss": -4.6172356605529785, "global_step": 4948, "epoch": 117} {"train_loss": -4.447535514831543, "global_step": 4949, "epoch": 117} {"train_loss": -4.268065452575684, "global_step": 4950, "epoch": 117} {"train_loss": -4.643702983856201, "global_step": 4951, "epoch": 117} {"train_loss": -4.382417678833008, "global_step": 4952, "epoch": 117} {"train_loss": -4.550826072692871, "global_step": 4953, "epoch": 117} {"train_loss": -4.598452091217041, "global_step": 4954, "epoch": 117} {"train_loss": -4.5586699304126554, "global_step": 4955, "epoch": 117, "val_loss": 96590.21875} {"train_loss": -4.512969493865967, "global_step": 4956, "epoch": 118} {"train_loss": -4.489710330963135, "global_step": 4957, "epoch": 118} {"train_loss": -4.480959415435791, "global_step": 4958, "epoch": 118} {"train_loss": -4.619842529296875, "global_step": 4959, "epoch": 118} {"train_loss": -4.518977165222168, "global_step": 4960, "epoch": 118} {"train_loss": -4.471634387969971, "global_step": 4961, "epoch": 118} {"train_loss": -4.489363670349121, "global_step": 4962, "epoch": 118} {"train_loss": -4.425870895385742, "global_step": 4963, "epoch": 118} {"train_loss": -4.702058792114258, "global_step": 4964, "epoch": 118} {"train_loss": -4.474087238311768, "global_step": 4965, "epoch": 118} {"train_loss": -4.383705139160156, "global_step": 4966, "epoch": 118} {"train_loss": -4.598961353302002, "global_step": 4967, "epoch": 118} {"train_loss": -4.635886192321777, "global_step": 4968, "epoch": 118} {"train_loss": -4.548952102661133, "global_step": 4969, "epoch": 118} {"train_loss": -4.584707260131836, "global_step": 4970, "epoch": 118} {"train_loss": -4.561363220214844, "global_step": 4971, "epoch": 118} {"train_loss": -4.645633697509766, "global_step": 4972, "epoch": 118} {"train_loss": -4.622906684875488, "global_step": 4973, "epoch": 118} {"train_loss": -4.45761251449585, "global_step": 4974, "epoch": 118} {"train_loss": -4.455760478973389, "global_step": 4975, "epoch": 118} {"train_loss": -4.633291244506836, "global_step": 4976, "epoch": 118} {"train_loss": -4.474740982055664, "global_step": 4977, "epoch": 118} {"train_loss": -4.526163101196289, "global_step": 4978, "epoch": 118} {"train_loss": -4.664863109588623, "global_step": 4979, "epoch": 118} {"train_loss": -4.582162857055664, "global_step": 4980, "epoch": 118} {"train_loss": -4.712186813354492, "global_step": 4981, "epoch": 118} {"train_loss": -4.653412342071533, "global_step": 4982, "epoch": 118} {"train_loss": -4.687613487243652, "global_step": 4983, "epoch": 118} {"train_loss": -4.793797016143799, "global_step": 4984, "epoch": 118} {"train_loss": -4.564117908477783, "global_step": 4985, "epoch": 118} {"train_loss": -4.639993667602539, "global_step": 4986, "epoch": 118} {"train_loss": -4.6061859130859375, "global_step": 4987, "epoch": 118} {"train_loss": -4.618577480316162, "global_step": 4988, "epoch": 118} {"train_loss": -4.482189655303955, "global_step": 4989, "epoch": 118} {"train_loss": -4.548603057861328, "global_step": 4990, "epoch": 118} {"train_loss": -4.777798652648926, "global_step": 4991, "epoch": 118} {"train_loss": -4.724349021911621, "global_step": 4992, "epoch": 118} {"train_loss": -4.5694661140441895, "global_step": 4993, "epoch": 118} {"train_loss": -4.6146039962768555, "global_step": 4994, "epoch": 118} {"train_loss": -4.6641716957092285, "global_step": 4995, "epoch": 118} {"train_loss": -4.682009220123291, "global_step": 4996, "epoch": 118} {"train_loss": -4.588628473735991, "global_step": 4997, "epoch": 118, "val_loss": 95046.5625} {"train_loss": -4.7326555252075195, "global_step": 4998, "epoch": 119} {"train_loss": -4.692866325378418, "global_step": 4999, "epoch": 119} {"train_loss": -4.637650012969971, "global_step": 5000, "epoch": 119} {"train_loss": -4.737184524536133, "global_step": 5001, "epoch": 119} {"train_loss": -4.707306385040283, "global_step": 5002, "epoch": 119} {"train_loss": -4.645503044128418, "global_step": 5003, "epoch": 119} {"train_loss": -4.632172584533691, "global_step": 5004, "epoch": 119} {"train_loss": -4.509676933288574, "global_step": 5005, "epoch": 119} {"train_loss": -4.6914567947387695, "global_step": 5006, "epoch": 119} {"train_loss": -4.7804765701293945, "global_step": 5007, "epoch": 119} {"train_loss": -4.583095550537109, "global_step": 5008, "epoch": 119} {"train_loss": -4.602301597595215, "global_step": 5009, "epoch": 119} {"train_loss": -4.666769027709961, "global_step": 5010, "epoch": 119} {"train_loss": -4.560941696166992, "global_step": 5011, "epoch": 119} {"train_loss": -4.660027027130127, "global_step": 5012, "epoch": 119} {"train_loss": -4.716917991638184, "global_step": 5013, "epoch": 119} {"train_loss": -4.572040557861328, "global_step": 5014, "epoch": 119} {"train_loss": -4.527129173278809, "global_step": 5015, "epoch": 119} {"train_loss": -4.750038146972656, "global_step": 5016, "epoch": 119} {"train_loss": -4.521245956420898, "global_step": 5017, "epoch": 119} {"train_loss": -4.433091163635254, "global_step": 5018, "epoch": 119} {"train_loss": -4.648953437805176, "global_step": 5019, "epoch": 119} {"train_loss": -4.39556884765625, "global_step": 5020, "epoch": 119} {"train_loss": -4.512234687805176, "global_step": 5021, "epoch": 119} {"train_loss": -4.689127445220947, "global_step": 5022, "epoch": 119} {"train_loss": -4.442849636077881, "global_step": 5023, "epoch": 119} {"train_loss": -4.577821254730225, "global_step": 5024, "epoch": 119} {"train_loss": -4.389622688293457, "global_step": 5025, "epoch": 119} {"train_loss": -4.373045921325684, "global_step": 5026, "epoch": 119} {"train_loss": -4.418726921081543, "global_step": 5027, "epoch": 119} {"train_loss": -4.482919692993164, "global_step": 5028, "epoch": 119} {"train_loss": -4.280981063842773, "global_step": 5029, "epoch": 119} {"train_loss": -4.142645835876465, "global_step": 5030, "epoch": 119} {"train_loss": -4.5025129318237305, "global_step": 5031, "epoch": 119} {"train_loss": -4.439452171325684, "global_step": 5032, "epoch": 119} {"train_loss": -4.453168869018555, "global_step": 5033, "epoch": 119} {"train_loss": -4.374675273895264, "global_step": 5034, "epoch": 119} {"train_loss": -4.496890544891357, "global_step": 5035, "epoch": 119} {"train_loss": -4.402929306030273, "global_step": 5036, "epoch": 119} {"train_loss": -4.418733596801758, "global_step": 5037, "epoch": 119} {"train_loss": -4.345367431640625, "global_step": 5038, "epoch": 119} {"train_loss": -4.539287249247233, "global_step": 5039, "epoch": 119, "val_loss": 97192.546875} {"train_loss": -4.437250137329102, "global_step": 5040, "epoch": 120} {"train_loss": -4.505014419555664, "global_step": 5041, "epoch": 120} {"train_loss": -4.385851860046387, "global_step": 5042, "epoch": 120} {"train_loss": -4.530878067016602, "global_step": 5043, "epoch": 120} {"train_loss": -4.547336578369141, "global_step": 5044, "epoch": 120} {"train_loss": -4.4766998291015625, "global_step": 5045, "epoch": 120} {"train_loss": -4.472103118896484, "global_step": 5046, "epoch": 120} {"train_loss": -4.568951606750488, "global_step": 5047, "epoch": 120} {"train_loss": -4.618160247802734, "global_step": 5048, "epoch": 120} {"train_loss": -4.719970226287842, "global_step": 5049, "epoch": 120} {"train_loss": -4.671147346496582, "global_step": 5050, "epoch": 120} {"train_loss": -4.617228984832764, "global_step": 5051, "epoch": 120} {"train_loss": -4.659131050109863, "global_step": 5052, "epoch": 120} {"train_loss": -4.7355546951293945, "global_step": 5053, "epoch": 120} {"train_loss": -4.586000919342041, "global_step": 5054, "epoch": 120} {"train_loss": -4.529732704162598, "global_step": 5055, "epoch": 120} {"train_loss": -4.819215774536133, "global_step": 5056, "epoch": 120} {"train_loss": -4.687238693237305, "global_step": 5057, "epoch": 120} {"train_loss": -4.672904968261719, "global_step": 5058, "epoch": 120} {"train_loss": -4.488589763641357, "global_step": 5059, "epoch": 120} {"train_loss": -4.646327018737793, "global_step": 5060, "epoch": 120} {"train_loss": -4.705928325653076, "global_step": 5061, "epoch": 120} {"train_loss": -4.551736831665039, "global_step": 5062, "epoch": 120} {"train_loss": -4.582354545593262, "global_step": 5063, "epoch": 120} {"train_loss": -4.726031303405762, "global_step": 5064, "epoch": 120} {"train_loss": -4.547510147094727, "global_step": 5065, "epoch": 120} {"train_loss": -4.755714416503906, "global_step": 5066, "epoch": 120} {"train_loss": -4.494367599487305, "global_step": 5067, "epoch": 120} {"train_loss": -4.563116550445557, "global_step": 5068, "epoch": 120} {"train_loss": -4.611459732055664, "global_step": 5069, "epoch": 120} {"train_loss": -4.357736587524414, "global_step": 5070, "epoch": 120} {"train_loss": -4.514133930206299, "global_step": 5071, "epoch": 120} {"train_loss": -4.7516937255859375, "global_step": 5072, "epoch": 120} {"train_loss": -4.631744384765625, "global_step": 5073, "epoch": 120} {"train_loss": -4.633707046508789, "global_step": 5074, "epoch": 120} {"train_loss": -4.505594730377197, "global_step": 5075, "epoch": 120} {"train_loss": -4.613081932067871, "global_step": 5076, "epoch": 120} {"train_loss": -4.734496116638184, "global_step": 5077, "epoch": 120} {"train_loss": -4.735020637512207, "global_step": 5078, "epoch": 120} {"train_loss": -4.566240310668945, "global_step": 5079, "epoch": 120} {"train_loss": -4.542088508605957, "global_step": 5080, "epoch": 120} {"train_loss": -4.599642821720669, "global_step": 5081, "epoch": 120, "val_loss": 95740.578125} {"train_loss": -4.545419692993164, "global_step": 5082, "epoch": 121} {"train_loss": -4.557078838348389, "global_step": 5083, "epoch": 121} {"train_loss": -4.6158952713012695, "global_step": 5084, "epoch": 121} {"train_loss": -4.423169136047363, "global_step": 5085, "epoch": 121} {"train_loss": -4.483501434326172, "global_step": 5086, "epoch": 121} {"train_loss": -4.5169267654418945, "global_step": 5087, "epoch": 121} {"train_loss": -4.662367820739746, "global_step": 5088, "epoch": 121} {"train_loss": -4.585505485534668, "global_step": 5089, "epoch": 121} {"train_loss": -4.559433460235596, "global_step": 5090, "epoch": 121} {"train_loss": -4.382550239562988, "global_step": 5091, "epoch": 121} {"train_loss": -4.647234916687012, "global_step": 5092, "epoch": 121} {"train_loss": -4.64907169342041, "global_step": 5093, "epoch": 121} {"train_loss": -4.570845603942871, "global_step": 5094, "epoch": 121} {"train_loss": -4.7683916091918945, "global_step": 5095, "epoch": 121} {"train_loss": -4.600511074066162, "global_step": 5096, "epoch": 121} {"train_loss": -4.517940521240234, "global_step": 5097, "epoch": 121} {"train_loss": -4.618149757385254, "global_step": 5098, "epoch": 121} {"train_loss": -4.665012359619141, "global_step": 5099, "epoch": 121} {"train_loss": -4.669244766235352, "global_step": 5100, "epoch": 121} {"train_loss": -4.572479248046875, "global_step": 5101, "epoch": 121} {"train_loss": -4.639728546142578, "global_step": 5102, "epoch": 121} {"train_loss": -4.683595657348633, "global_step": 5103, "epoch": 121} {"train_loss": -4.497440814971924, "global_step": 5104, "epoch": 121} {"train_loss": -4.500269889831543, "global_step": 5105, "epoch": 121} {"train_loss": -4.678990840911865, "global_step": 5106, "epoch": 121} {"train_loss": -4.54595947265625, "global_step": 5107, "epoch": 121} {"train_loss": -4.47466516494751, "global_step": 5108, "epoch": 121} {"train_loss": -4.678685188293457, "global_step": 5109, "epoch": 121} {"train_loss": -4.632034778594971, "global_step": 5110, "epoch": 121} {"train_loss": -4.506325721740723, "global_step": 5111, "epoch": 121} {"train_loss": -4.6319122314453125, "global_step": 5112, "epoch": 121} {"train_loss": -4.762925624847412, "global_step": 5113, "epoch": 121} {"train_loss": -4.523085594177246, "global_step": 5114, "epoch": 121} {"train_loss": -4.666463851928711, "global_step": 5115, "epoch": 121} {"train_loss": -4.655215263366699, "global_step": 5116, "epoch": 121} {"train_loss": -4.655501365661621, "global_step": 5117, "epoch": 121} {"train_loss": -4.69761848449707, "global_step": 5118, "epoch": 121} {"train_loss": -4.674307823181152, "global_step": 5119, "epoch": 121} {"train_loss": -4.731537818908691, "global_step": 5120, "epoch": 121} {"train_loss": -4.728639125823975, "global_step": 5121, "epoch": 121} {"train_loss": -4.689474105834961, "global_step": 5122, "epoch": 121} {"train_loss": -4.608143772397723, "global_step": 5123, "epoch": 121, "val_loss": 94936.0} {"train_loss": -4.542654991149902, "global_step": 5124, "epoch": 122} {"train_loss": -4.627864837646484, "global_step": 5125, "epoch": 122} {"train_loss": -4.582056999206543, "global_step": 5126, "epoch": 122} {"train_loss": -4.594379425048828, "global_step": 5127, "epoch": 122} {"train_loss": -4.5169501304626465, "global_step": 5128, "epoch": 122} {"train_loss": -4.6785078048706055, "global_step": 5129, "epoch": 122} {"train_loss": -4.746734142303467, "global_step": 5130, "epoch": 122} {"train_loss": -4.565727233886719, "global_step": 5131, "epoch": 122} {"train_loss": -4.805041790008545, "global_step": 5132, "epoch": 122} {"train_loss": -4.662372589111328, "global_step": 5133, "epoch": 122} {"train_loss": -4.510725021362305, "global_step": 5134, "epoch": 122} {"train_loss": -4.665835380554199, "global_step": 5135, "epoch": 122} {"train_loss": -4.608982563018799, "global_step": 5136, "epoch": 122} {"train_loss": -4.608868598937988, "global_step": 5137, "epoch": 122} {"train_loss": -4.596758842468262, "global_step": 5138, "epoch": 122} {"train_loss": -4.481754302978516, "global_step": 5139, "epoch": 122} {"train_loss": -4.754073143005371, "global_step": 5140, "epoch": 122} {"train_loss": -4.526767253875732, "global_step": 5141, "epoch": 122} {"train_loss": -4.611033916473389, "global_step": 5142, "epoch": 122} {"train_loss": -4.634222030639648, "global_step": 5143, "epoch": 122} {"train_loss": -4.656749725341797, "global_step": 5144, "epoch": 122} {"train_loss": -4.098979473114014, "global_step": 5145, "epoch": 122} {"train_loss": -4.352025032043457, "global_step": 5146, "epoch": 122} {"train_loss": -4.417998313903809, "global_step": 5147, "epoch": 122} {"train_loss": -4.117303848266602, "global_step": 5148, "epoch": 122} {"train_loss": -4.576692581176758, "global_step": 5149, "epoch": 122} {"train_loss": -4.700620651245117, "global_step": 5150, "epoch": 122} {"train_loss": -4.4418559074401855, "global_step": 5151, "epoch": 122} {"train_loss": -4.569762229919434, "global_step": 5152, "epoch": 122} {"train_loss": -4.610569953918457, "global_step": 5153, "epoch": 122} {"train_loss": -4.621431827545166, "global_step": 5154, "epoch": 122} {"train_loss": -4.598324775695801, "global_step": 5155, "epoch": 122} {"train_loss": -4.529490947723389, "global_step": 5156, "epoch": 122} {"train_loss": -4.532026290893555, "global_step": 5157, "epoch": 122} {"train_loss": -4.573770523071289, "global_step": 5158, "epoch": 122} {"train_loss": -4.5320353507995605, "global_step": 5159, "epoch": 122} {"train_loss": -4.700084209442139, "global_step": 5160, "epoch": 122} {"train_loss": -4.571983337402344, "global_step": 5161, "epoch": 122} {"train_loss": -4.639432907104492, "global_step": 5162, "epoch": 122} {"train_loss": -4.677577972412109, "global_step": 5163, "epoch": 122} {"train_loss": -4.63560676574707, "global_step": 5164, "epoch": 122} {"train_loss": -4.573085183189029, "global_step": 5165, "epoch": 122, "val_loss": 95369.5859375} {"train_loss": -4.556543827056885, "global_step": 5166, "epoch": 123} {"train_loss": -4.762701034545898, "global_step": 5167, "epoch": 123} {"train_loss": -4.56369686126709, "global_step": 5168, "epoch": 123} {"train_loss": -4.499333381652832, "global_step": 5169, "epoch": 123} {"train_loss": -4.583645820617676, "global_step": 5170, "epoch": 123} {"train_loss": -4.800779342651367, "global_step": 5171, "epoch": 123} {"train_loss": -4.454288005828857, "global_step": 5172, "epoch": 123} {"train_loss": -4.561118125915527, "global_step": 5173, "epoch": 123} {"train_loss": -4.614439487457275, "global_step": 5174, "epoch": 123} {"train_loss": -4.55426025390625, "global_step": 5175, "epoch": 123} {"train_loss": -4.699892044067383, "global_step": 5176, "epoch": 123} {"train_loss": -4.697361946105957, "global_step": 5177, "epoch": 123} {"train_loss": -4.607279300689697, "global_step": 5178, "epoch": 123} {"train_loss": -4.808803558349609, "global_step": 5179, "epoch": 123} {"train_loss": -4.68021297454834, "global_step": 5180, "epoch": 123} {"train_loss": -4.6705121994018555, "global_step": 5181, "epoch": 123} {"train_loss": -4.638260841369629, "global_step": 5182, "epoch": 123} {"train_loss": -4.636890888214111, "global_step": 5183, "epoch": 123} {"train_loss": -4.644218921661377, "global_step": 5184, "epoch": 123} {"train_loss": -4.5470404624938965, "global_step": 5185, "epoch": 123} {"train_loss": -4.616208076477051, "global_step": 5186, "epoch": 123} {"train_loss": -4.504756450653076, "global_step": 5187, "epoch": 123} {"train_loss": -4.432888984680176, "global_step": 5188, "epoch": 123} {"train_loss": -4.655882358551025, "global_step": 5189, "epoch": 123} {"train_loss": -4.540509223937988, "global_step": 5190, "epoch": 123} {"train_loss": -4.718288421630859, "global_step": 5191, "epoch": 123} {"train_loss": -4.736659049987793, "global_step": 5192, "epoch": 123} {"train_loss": -4.730893135070801, "global_step": 5193, "epoch": 123} {"train_loss": -4.648036479949951, "global_step": 5194, "epoch": 123} {"train_loss": -4.62749719619751, "global_step": 5195, "epoch": 123} {"train_loss": -4.738619804382324, "global_step": 5196, "epoch": 123} {"train_loss": -4.635502815246582, "global_step": 5197, "epoch": 123} {"train_loss": -4.660804271697998, "global_step": 5198, "epoch": 123} {"train_loss": -4.596918106079102, "global_step": 5199, "epoch": 123} {"train_loss": -4.578545093536377, "global_step": 5200, "epoch": 123} {"train_loss": -4.670855522155762, "global_step": 5201, "epoch": 123} {"train_loss": -4.770438194274902, "global_step": 5202, "epoch": 123} {"train_loss": -4.577515602111816, "global_step": 5203, "epoch": 123} {"train_loss": -4.638623237609863, "global_step": 5204, "epoch": 123} {"train_loss": -4.561367988586426, "global_step": 5205, "epoch": 123} {"train_loss": -4.514712333679199, "global_step": 5206, "epoch": 123} {"train_loss": -4.6273612181345625, "global_step": 5207, "epoch": 123, "val_loss": 92705.7890625} {"train_loss": -4.739480495452881, "global_step": 5208, "epoch": 124} {"train_loss": -4.688698768615723, "global_step": 5209, "epoch": 124} {"train_loss": -4.668713092803955, "global_step": 5210, "epoch": 124} {"train_loss": -4.656161308288574, "global_step": 5211, "epoch": 124} {"train_loss": -4.630622386932373, "global_step": 5212, "epoch": 124} {"train_loss": -4.644012451171875, "global_step": 5213, "epoch": 124} {"train_loss": -4.727100372314453, "global_step": 5214, "epoch": 124} {"train_loss": -4.791213035583496, "global_step": 5215, "epoch": 124} {"train_loss": -4.796046257019043, "global_step": 5216, "epoch": 124} {"train_loss": -4.611593246459961, "global_step": 5217, "epoch": 124} {"train_loss": -4.685321807861328, "global_step": 5218, "epoch": 124} {"train_loss": -4.764916896820068, "global_step": 5219, "epoch": 124} {"train_loss": -4.644131660461426, "global_step": 5220, "epoch": 124} {"train_loss": -4.628878593444824, "global_step": 5221, "epoch": 124} {"train_loss": -4.747042179107666, "global_step": 5222, "epoch": 124} {"train_loss": -4.738356113433838, "global_step": 5223, "epoch": 124} {"train_loss": -4.627240180969238, "global_step": 5224, "epoch": 124} {"train_loss": -4.671354293823242, "global_step": 5225, "epoch": 124} {"train_loss": -4.809998512268066, "global_step": 5226, "epoch": 124} {"train_loss": -4.778034687042236, "global_step": 5227, "epoch": 124} {"train_loss": -4.727793216705322, "global_step": 5228, "epoch": 124} {"train_loss": -4.796923637390137, "global_step": 5229, "epoch": 124} {"train_loss": -4.59509801864624, "global_step": 5230, "epoch": 124} {"train_loss": -4.731262683868408, "global_step": 5231, "epoch": 124} {"train_loss": -4.678519248962402, "global_step": 5232, "epoch": 124} {"train_loss": -4.748239517211914, "global_step": 5233, "epoch": 124} {"train_loss": -4.6092529296875, "global_step": 5234, "epoch": 124} {"train_loss": -4.595795154571533, "global_step": 5235, "epoch": 124} {"train_loss": -4.6810503005981445, "global_step": 5236, "epoch": 124} {"train_loss": -4.877798080444336, "global_step": 5237, "epoch": 124} {"train_loss": -4.617902755737305, "global_step": 5238, "epoch": 124} {"train_loss": -4.541881084442139, "global_step": 5239, "epoch": 124} {"train_loss": -4.366987228393555, "global_step": 5240, "epoch": 124} {"train_loss": -4.6048383712768555, "global_step": 5241, "epoch": 124} {"train_loss": -4.588303565979004, "global_step": 5242, "epoch": 124} {"train_loss": -4.506376266479492, "global_step": 5243, "epoch": 124} {"train_loss": -4.61235237121582, "global_step": 5244, "epoch": 124} {"train_loss": -4.724226474761963, "global_step": 5245, "epoch": 124} {"train_loss": -4.210353851318359, "global_step": 5246, "epoch": 124} {"train_loss": -4.258910179138184, "global_step": 5247, "epoch": 124} {"train_loss": -4.909412860870361, "global_step": 5248, "epoch": 124} {"train_loss": -4.6598953519548685, "global_step": 5249, "epoch": 124, "val_loss": 93700.6875} {"train_loss": -4.726316452026367, "global_step": 5250, "epoch": 125} {"train_loss": -4.6393303871154785, "global_step": 5251, "epoch": 125} {"train_loss": -4.694118499755859, "global_step": 5252, "epoch": 125} {"train_loss": -4.666103839874268, "global_step": 5253, "epoch": 125} {"train_loss": -4.656349182128906, "global_step": 5254, "epoch": 125} {"train_loss": -4.617690086364746, "global_step": 5255, "epoch": 125} {"train_loss": -4.637360572814941, "global_step": 5256, "epoch": 125} {"train_loss": -4.550267219543457, "global_step": 5257, "epoch": 125} {"train_loss": -4.679067611694336, "global_step": 5258, "epoch": 125} {"train_loss": -4.711941719055176, "global_step": 5259, "epoch": 125} {"train_loss": -4.560324668884277, "global_step": 5260, "epoch": 125} {"train_loss": -4.682932376861572, "global_step": 5261, "epoch": 125} {"train_loss": -4.753700256347656, "global_step": 5262, "epoch": 125} {"train_loss": -4.629039764404297, "global_step": 5263, "epoch": 125} {"train_loss": -4.61894416809082, "global_step": 5264, "epoch": 125} {"train_loss": -4.781309127807617, "global_step": 5265, "epoch": 125} {"train_loss": -4.6703691482543945, "global_step": 5266, "epoch": 125} {"train_loss": -4.76062536239624, "global_step": 5267, "epoch": 125} {"train_loss": -4.59504508972168, "global_step": 5268, "epoch": 125} {"train_loss": -4.699474334716797, "global_step": 5269, "epoch": 125} {"train_loss": -4.5191240310668945, "global_step": 5270, "epoch": 125} {"train_loss": -4.746335983276367, "global_step": 5271, "epoch": 125} {"train_loss": -4.724222660064697, "global_step": 5272, "epoch": 125} {"train_loss": -4.677034854888916, "global_step": 5273, "epoch": 125} {"train_loss": -4.665635108947754, "global_step": 5274, "epoch": 125} {"train_loss": -4.692991256713867, "global_step": 5275, "epoch": 125} {"train_loss": -4.6722412109375, "global_step": 5276, "epoch": 125} {"train_loss": -4.695273399353027, "global_step": 5277, "epoch": 125} {"train_loss": -4.661670207977295, "global_step": 5278, "epoch": 125} {"train_loss": -4.70982551574707, "global_step": 5279, "epoch": 125} {"train_loss": -4.77787971496582, "global_step": 5280, "epoch": 125} {"train_loss": -4.75719690322876, "global_step": 5281, "epoch": 125} {"train_loss": -4.7294721603393555, "global_step": 5282, "epoch": 125} {"train_loss": -4.832457542419434, "global_step": 5283, "epoch": 125} {"train_loss": -4.837191581726074, "global_step": 5284, "epoch": 125} {"train_loss": -4.576482772827148, "global_step": 5285, "epoch": 125} {"train_loss": -4.674895286560059, "global_step": 5286, "epoch": 125} {"train_loss": -4.730823516845703, "global_step": 5287, "epoch": 125} {"train_loss": -4.808938026428223, "global_step": 5288, "epoch": 125} {"train_loss": -4.7533955574035645, "global_step": 5289, "epoch": 125} {"train_loss": -4.459434986114502, "global_step": 5290, "epoch": 125} {"train_loss": -4.680143719627743, "global_step": 5291, "epoch": 125, "val_loss": 93826.7890625} {"train_loss": -4.604191303253174, "global_step": 5292, "epoch": 126} {"train_loss": -4.75065279006958, "global_step": 5293, "epoch": 126} {"train_loss": -4.791380882263184, "global_step": 5294, "epoch": 126} {"train_loss": -4.332830905914307, "global_step": 5295, "epoch": 126} {"train_loss": -4.582423686981201, "global_step": 5296, "epoch": 126} {"train_loss": -4.4867143630981445, "global_step": 5297, "epoch": 126} {"train_loss": -4.264935493469238, "global_step": 5298, "epoch": 126} {"train_loss": -4.552523612976074, "global_step": 5299, "epoch": 126} {"train_loss": -4.092838287353516, "global_step": 5300, "epoch": 126} {"train_loss": -4.224277019500732, "global_step": 5301, "epoch": 126} {"train_loss": -4.423946380615234, "global_step": 5302, "epoch": 126} {"train_loss": -4.3290910720825195, "global_step": 5303, "epoch": 126} {"train_loss": -4.576103210449219, "global_step": 5304, "epoch": 126} {"train_loss": -4.453866481781006, "global_step": 5305, "epoch": 126} {"train_loss": -4.637369155883789, "global_step": 5306, "epoch": 126} {"train_loss": -4.4279279708862305, "global_step": 5307, "epoch": 126} {"train_loss": -4.362457275390625, "global_step": 5308, "epoch": 126} {"train_loss": -4.532693862915039, "global_step": 5309, "epoch": 126} {"train_loss": -4.524359226226807, "global_step": 5310, "epoch": 126} {"train_loss": -4.606115341186523, "global_step": 5311, "epoch": 126} {"train_loss": -4.56418514251709, "global_step": 5312, "epoch": 126} {"train_loss": -4.457009315490723, "global_step": 5313, "epoch": 126} {"train_loss": -4.767287731170654, "global_step": 5314, "epoch": 126} {"train_loss": -4.639766693115234, "global_step": 5315, "epoch": 126} {"train_loss": -4.544403553009033, "global_step": 5316, "epoch": 126} {"train_loss": -4.734551429748535, "global_step": 5317, "epoch": 126} {"train_loss": -4.574423789978027, "global_step": 5318, "epoch": 126} {"train_loss": -4.658515930175781, "global_step": 5319, "epoch": 126} {"train_loss": -4.6808695793151855, "global_step": 5320, "epoch": 126} {"train_loss": -4.607310771942139, "global_step": 5321, "epoch": 126} {"train_loss": -4.593334197998047, "global_step": 5322, "epoch": 126} {"train_loss": -4.7193708419799805, "global_step": 5323, "epoch": 126} {"train_loss": -4.913054943084717, "global_step": 5324, "epoch": 126} {"train_loss": -4.675060272216797, "global_step": 5325, "epoch": 126} {"train_loss": -4.634958744049072, "global_step": 5326, "epoch": 126} {"train_loss": -4.710498332977295, "global_step": 5327, "epoch": 126} {"train_loss": -4.617207050323486, "global_step": 5328, "epoch": 126} {"train_loss": -4.806334972381592, "global_step": 5329, "epoch": 126} {"train_loss": -4.698080539703369, "global_step": 5330, "epoch": 126} {"train_loss": -4.774188041687012, "global_step": 5331, "epoch": 126} {"train_loss": -4.6522393226623535, "global_step": 5332, "epoch": 126} {"train_loss": -4.57746916725522, "global_step": 5333, "epoch": 126, "val_loss": 92016.1796875} {"train_loss": -4.624220848083496, "global_step": 5334, "epoch": 127} {"train_loss": -4.7403740882873535, "global_step": 5335, "epoch": 127} {"train_loss": -4.7788848876953125, "global_step": 5336, "epoch": 127} {"train_loss": -4.5888519287109375, "global_step": 5337, "epoch": 127} {"train_loss": -4.653794288635254, "global_step": 5338, "epoch": 127} {"train_loss": -4.712730407714844, "global_step": 5339, "epoch": 127} {"train_loss": -4.614995002746582, "global_step": 5340, "epoch": 127} {"train_loss": -4.664037704467773, "global_step": 5341, "epoch": 127} {"train_loss": -4.6736955642700195, "global_step": 5342, "epoch": 127} {"train_loss": -4.564138889312744, "global_step": 5343, "epoch": 127} {"train_loss": -4.69240140914917, "global_step": 5344, "epoch": 127} {"train_loss": -4.684436798095703, "global_step": 5345, "epoch": 127} {"train_loss": -4.721747398376465, "global_step": 5346, "epoch": 127} {"train_loss": -4.6255879402160645, "global_step": 5347, "epoch": 127} {"train_loss": -4.668951034545898, "global_step": 5348, "epoch": 127} {"train_loss": -4.5944623947143555, "global_step": 5349, "epoch": 127} {"train_loss": -4.63056755065918, "global_step": 5350, "epoch": 127} {"train_loss": -4.6526055335998535, "global_step": 5351, "epoch": 127} {"train_loss": -4.60763692855835, "global_step": 5352, "epoch": 127} {"train_loss": -4.703150272369385, "global_step": 5353, "epoch": 127} {"train_loss": -4.542757987976074, "global_step": 5354, "epoch": 127} {"train_loss": -4.585079669952393, "global_step": 5355, "epoch": 127} {"train_loss": -4.523120880126953, "global_step": 5356, "epoch": 127} {"train_loss": -4.399830341339111, "global_step": 5357, "epoch": 127} {"train_loss": -4.540872573852539, "global_step": 5358, "epoch": 127} {"train_loss": -4.656118392944336, "global_step": 5359, "epoch": 127} {"train_loss": -4.487111568450928, "global_step": 5360, "epoch": 127} {"train_loss": -4.634198188781738, "global_step": 5361, "epoch": 127} {"train_loss": -4.791925430297852, "global_step": 5362, "epoch": 127} {"train_loss": -4.859827041625977, "global_step": 5363, "epoch": 127} {"train_loss": -4.790229320526123, "global_step": 5364, "epoch": 127} {"train_loss": -4.808445453643799, "global_step": 5365, "epoch": 127} {"train_loss": -4.587708473205566, "global_step": 5366, "epoch": 127} {"train_loss": -4.805631160736084, "global_step": 5367, "epoch": 127} {"train_loss": -4.831220626831055, "global_step": 5368, "epoch": 127} {"train_loss": -4.789349555969238, "global_step": 5369, "epoch": 127} {"train_loss": -4.787782669067383, "global_step": 5370, "epoch": 127} {"train_loss": -4.756726264953613, "global_step": 5371, "epoch": 127} {"train_loss": -4.543874740600586, "global_step": 5372, "epoch": 127} {"train_loss": -4.812867164611816, "global_step": 5373, "epoch": 127} {"train_loss": -4.856456756591797, "global_step": 5374, "epoch": 127} {"train_loss": -4.6757980074201315, "global_step": 5375, "epoch": 127, "val_loss": 92021.234375} {"train_loss": -4.675505638122559, "global_step": 5376, "epoch": 128} {"train_loss": -4.849212646484375, "global_step": 5377, "epoch": 128} {"train_loss": -4.645814895629883, "global_step": 5378, "epoch": 128} {"train_loss": -4.791004657745361, "global_step": 5379, "epoch": 128} {"train_loss": -4.7938032150268555, "global_step": 5380, "epoch": 128} {"train_loss": -4.820089817047119, "global_step": 5381, "epoch": 128} {"train_loss": -4.7387237548828125, "global_step": 5382, "epoch": 128} {"train_loss": -4.581053256988525, "global_step": 5383, "epoch": 128} {"train_loss": -4.687301158905029, "global_step": 5384, "epoch": 128} {"train_loss": -4.848440647125244, "global_step": 5385, "epoch": 128} {"train_loss": -4.62025260925293, "global_step": 5386, "epoch": 128} {"train_loss": -4.674957275390625, "global_step": 5387, "epoch": 128} {"train_loss": -4.6692938804626465, "global_step": 5388, "epoch": 128} {"train_loss": -4.668877124786377, "global_step": 5389, "epoch": 128} {"train_loss": -4.751396179199219, "global_step": 5390, "epoch": 128} {"train_loss": -4.501426696777344, "global_step": 5391, "epoch": 128} {"train_loss": -4.695117950439453, "global_step": 5392, "epoch": 128} {"train_loss": -4.587333679199219, "global_step": 5393, "epoch": 128} {"train_loss": -4.436808109283447, "global_step": 5394, "epoch": 128} {"train_loss": -4.760492324829102, "global_step": 5395, "epoch": 128} {"train_loss": -4.615085124969482, "global_step": 5396, "epoch": 128} {"train_loss": -4.330259323120117, "global_step": 5397, "epoch": 128} {"train_loss": -4.566827297210693, "global_step": 5398, "epoch": 128} {"train_loss": -4.678297996520996, "global_step": 5399, "epoch": 128} {"train_loss": -4.454156398773193, "global_step": 5400, "epoch": 128} {"train_loss": -4.806162357330322, "global_step": 5401, "epoch": 128} {"train_loss": -4.664425849914551, "global_step": 5402, "epoch": 128} {"train_loss": -4.629911422729492, "global_step": 5403, "epoch": 128} {"train_loss": -4.767333984375, "global_step": 5404, "epoch": 128} {"train_loss": -4.684384346008301, "global_step": 5405, "epoch": 128} {"train_loss": -4.602786064147949, "global_step": 5406, "epoch": 128} {"train_loss": -4.472587585449219, "global_step": 5407, "epoch": 128} {"train_loss": -4.672847747802734, "global_step": 5408, "epoch": 128} {"train_loss": -4.678110122680664, "global_step": 5409, "epoch": 128} {"train_loss": -4.553952693939209, "global_step": 5410, "epoch": 128} {"train_loss": -4.692348480224609, "global_step": 5411, "epoch": 128} {"train_loss": -4.836685657501221, "global_step": 5412, "epoch": 128} {"train_loss": -4.592021465301514, "global_step": 5413, "epoch": 128} {"train_loss": -4.586260795593262, "global_step": 5414, "epoch": 128} {"train_loss": -4.691725730895996, "global_step": 5415, "epoch": 128} {"train_loss": -4.748290061950684, "global_step": 5416, "epoch": 128} {"train_loss": -4.661964314324515, "global_step": 5417, "epoch": 128, "val_loss": 92236.7578125} {"train_loss": -4.741244316101074, "global_step": 5418, "epoch": 129} {"train_loss": -4.635977268218994, "global_step": 5419, "epoch": 129} {"train_loss": -4.485841751098633, "global_step": 5420, "epoch": 129} {"train_loss": -4.790242671966553, "global_step": 5421, "epoch": 129} {"train_loss": -4.7157368659973145, "global_step": 5422, "epoch": 129} {"train_loss": -4.628070831298828, "global_step": 5423, "epoch": 129} {"train_loss": -4.754734516143799, "global_step": 5424, "epoch": 129} {"train_loss": -4.487293243408203, "global_step": 5425, "epoch": 129} {"train_loss": -4.602046012878418, "global_step": 5426, "epoch": 129} {"train_loss": -4.727078914642334, "global_step": 5427, "epoch": 129} {"train_loss": -4.575455188751221, "global_step": 5428, "epoch": 129} {"train_loss": -4.6678972244262695, "global_step": 5429, "epoch": 129} {"train_loss": -4.703362464904785, "global_step": 5430, "epoch": 129} {"train_loss": -4.5702080726623535, "global_step": 5431, "epoch": 129} {"train_loss": -4.592392921447754, "global_step": 5432, "epoch": 129} {"train_loss": -4.738149642944336, "global_step": 5433, "epoch": 129} {"train_loss": -4.6405134201049805, "global_step": 5434, "epoch": 129} {"train_loss": -4.636373519897461, "global_step": 5435, "epoch": 129} {"train_loss": -4.801698684692383, "global_step": 5436, "epoch": 129} {"train_loss": -4.765922546386719, "global_step": 5437, "epoch": 129} {"train_loss": -4.542717933654785, "global_step": 5438, "epoch": 129} {"train_loss": -4.638675689697266, "global_step": 5439, "epoch": 129} {"train_loss": -4.6689982414245605, "global_step": 5440, "epoch": 129} {"train_loss": -4.682194232940674, "global_step": 5441, "epoch": 129} {"train_loss": -4.657586097717285, "global_step": 5442, "epoch": 129} {"train_loss": -4.707502365112305, "global_step": 5443, "epoch": 129} {"train_loss": -4.71533203125, "global_step": 5444, "epoch": 129} {"train_loss": -4.635953903198242, "global_step": 5445, "epoch": 129} {"train_loss": -4.609383583068848, "global_step": 5446, "epoch": 129} {"train_loss": -4.902661323547363, "global_step": 5447, "epoch": 129} {"train_loss": -4.814223289489746, "global_step": 5448, "epoch": 129} {"train_loss": -4.5560712814331055, "global_step": 5449, "epoch": 129} {"train_loss": -4.7122931480407715, "global_step": 5450, "epoch": 129} {"train_loss": -4.73833703994751, "global_step": 5451, "epoch": 129} {"train_loss": -4.782113075256348, "global_step": 5452, "epoch": 129} {"train_loss": -4.769064903259277, "global_step": 5453, "epoch": 129} {"train_loss": -4.802534103393555, "global_step": 5454, "epoch": 129} {"train_loss": -4.819839954376221, "global_step": 5455, "epoch": 129} {"train_loss": -4.814016819000244, "global_step": 5456, "epoch": 129} {"train_loss": -4.659784317016602, "global_step": 5457, "epoch": 129} {"train_loss": -4.657331466674805, "global_step": 5458, "epoch": 129} {"train_loss": -4.688267889476958, "global_step": 5459, "epoch": 129, "val_loss": 91663.640625} {"train_loss": -4.596566677093506, "global_step": 5460, "epoch": 130} {"train_loss": -4.534148693084717, "global_step": 5461, "epoch": 130} {"train_loss": -4.619836330413818, "global_step": 5462, "epoch": 130} {"train_loss": -4.566773414611816, "global_step": 5463, "epoch": 130} {"train_loss": -4.734983921051025, "global_step": 5464, "epoch": 130} {"train_loss": -4.8045783042907715, "global_step": 5465, "epoch": 130} {"train_loss": -4.698012828826904, "global_step": 5466, "epoch": 130} {"train_loss": -4.653379440307617, "global_step": 5467, "epoch": 130} {"train_loss": -4.738365173339844, "global_step": 5468, "epoch": 130} {"train_loss": -4.779535293579102, "global_step": 5469, "epoch": 130} {"train_loss": -4.647853851318359, "global_step": 5470, "epoch": 130} {"train_loss": -4.735103130340576, "global_step": 5471, "epoch": 130} {"train_loss": -4.742318153381348, "global_step": 5472, "epoch": 130} {"train_loss": -4.682976722717285, "global_step": 5473, "epoch": 130} {"train_loss": -4.608659744262695, "global_step": 5474, "epoch": 130} {"train_loss": -4.710812091827393, "global_step": 5475, "epoch": 130} {"train_loss": -4.71169900894165, "global_step": 5476, "epoch": 130} {"train_loss": -4.655259132385254, "global_step": 5477, "epoch": 130} {"train_loss": -4.650916576385498, "global_step": 5478, "epoch": 130} {"train_loss": -4.734773635864258, "global_step": 5479, "epoch": 130} {"train_loss": -4.684659004211426, "global_step": 5480, "epoch": 130} {"train_loss": -4.833928108215332, "global_step": 5481, "epoch": 130} {"train_loss": -4.690690517425537, "global_step": 5482, "epoch": 130} {"train_loss": -4.707861423492432, "global_step": 5483, "epoch": 130} {"train_loss": -4.637392044067383, "global_step": 5484, "epoch": 130} {"train_loss": -4.698996067047119, "global_step": 5485, "epoch": 130} {"train_loss": -4.610788822174072, "global_step": 5486, "epoch": 130} {"train_loss": -4.671446800231934, "global_step": 5487, "epoch": 130} {"train_loss": -4.729642868041992, "global_step": 5488, "epoch": 130} {"train_loss": -4.578972339630127, "global_step": 5489, "epoch": 130} {"train_loss": -4.707058906555176, "global_step": 5490, "epoch": 130} {"train_loss": -4.672945976257324, "global_step": 5491, "epoch": 130} {"train_loss": -4.702431678771973, "global_step": 5492, "epoch": 130} {"train_loss": -4.7964606285095215, "global_step": 5493, "epoch": 130} {"train_loss": -4.787917137145996, "global_step": 5494, "epoch": 130} {"train_loss": -4.75874662399292, "global_step": 5495, "epoch": 130} {"train_loss": -4.770130634307861, "global_step": 5496, "epoch": 130} {"train_loss": -4.779649257659912, "global_step": 5497, "epoch": 130} {"train_loss": -4.954071521759033, "global_step": 5498, "epoch": 130} {"train_loss": -4.850159645080566, "global_step": 5499, "epoch": 130} {"train_loss": -4.7015380859375, "global_step": 5500, "epoch": 130} {"train_loss": -4.704976047788348, "global_step": 5501, "epoch": 130, "val_loss": 90955.421875} {"train_loss": -4.831125736236572, "global_step": 5502, "epoch": 131} {"train_loss": -4.719468116760254, "global_step": 5503, "epoch": 131} {"train_loss": -4.689054489135742, "global_step": 5504, "epoch": 131} {"train_loss": -4.772442817687988, "global_step": 5505, "epoch": 131} {"train_loss": -4.606063365936279, "global_step": 5506, "epoch": 131} {"train_loss": -4.794748306274414, "global_step": 5507, "epoch": 131} {"train_loss": -4.718502998352051, "global_step": 5508, "epoch": 131} {"train_loss": -4.666077613830566, "global_step": 5509, "epoch": 131} {"train_loss": -4.709591865539551, "global_step": 5510, "epoch": 131} {"train_loss": -4.805105209350586, "global_step": 5511, "epoch": 131} {"train_loss": -4.670907497406006, "global_step": 5512, "epoch": 131} {"train_loss": -4.650934219360352, "global_step": 5513, "epoch": 131} {"train_loss": -4.793703079223633, "global_step": 5514, "epoch": 131} {"train_loss": -4.751005172729492, "global_step": 5515, "epoch": 131} {"train_loss": -4.870408058166504, "global_step": 5516, "epoch": 131} {"train_loss": -4.70851993560791, "global_step": 5517, "epoch": 131} {"train_loss": -4.770390510559082, "global_step": 5518, "epoch": 131} {"train_loss": -4.819488525390625, "global_step": 5519, "epoch": 131} {"train_loss": -4.805265426635742, "global_step": 5520, "epoch": 131} {"train_loss": -4.721177101135254, "global_step": 5521, "epoch": 131} {"train_loss": -4.703497886657715, "global_step": 5522, "epoch": 131} {"train_loss": -4.473536014556885, "global_step": 5523, "epoch": 131} {"train_loss": -4.80073881149292, "global_step": 5524, "epoch": 131} {"train_loss": -4.635980129241943, "global_step": 5525, "epoch": 131} {"train_loss": -4.625276565551758, "global_step": 5526, "epoch": 131} {"train_loss": -4.650748252868652, "global_step": 5527, "epoch": 131} {"train_loss": -4.858044624328613, "global_step": 5528, "epoch": 131} {"train_loss": -4.758792877197266, "global_step": 5529, "epoch": 131} {"train_loss": -4.59492301940918, "global_step": 5530, "epoch": 131} {"train_loss": -4.590032577514648, "global_step": 5531, "epoch": 131} {"train_loss": -4.706540107727051, "global_step": 5532, "epoch": 131} {"train_loss": -4.596677780151367, "global_step": 5533, "epoch": 131} {"train_loss": -4.493603229522705, "global_step": 5534, "epoch": 131} {"train_loss": -4.585376262664795, "global_step": 5535, "epoch": 131} {"train_loss": -4.382739543914795, "global_step": 5536, "epoch": 131} {"train_loss": -4.64094352722168, "global_step": 5537, "epoch": 131} {"train_loss": -4.643786430358887, "global_step": 5538, "epoch": 131} {"train_loss": -4.665775299072266, "global_step": 5539, "epoch": 131} {"train_loss": -4.801880836486816, "global_step": 5540, "epoch": 131} {"train_loss": -4.676061630249023, "global_step": 5541, "epoch": 131} {"train_loss": -4.667065620422363, "global_step": 5542, "epoch": 131} {"train_loss": -4.694679544085548, "global_step": 5543, "epoch": 131, "val_loss": 94655.0} {"train_loss": -4.590059757232666, "global_step": 5544, "epoch": 132} {"train_loss": -4.593262672424316, "global_step": 5545, "epoch": 132} {"train_loss": -4.568665981292725, "global_step": 5546, "epoch": 132} {"train_loss": -4.696384429931641, "global_step": 5547, "epoch": 132} {"train_loss": -4.674901962280273, "global_step": 5548, "epoch": 132} {"train_loss": -4.62291145324707, "global_step": 5549, "epoch": 132} {"train_loss": -4.682389736175537, "global_step": 5550, "epoch": 132} {"train_loss": -4.7513227462768555, "global_step": 5551, "epoch": 132} {"train_loss": -4.6992645263671875, "global_step": 5552, "epoch": 132} {"train_loss": -4.665258407592773, "global_step": 5553, "epoch": 132} {"train_loss": -4.604626178741455, "global_step": 5554, "epoch": 132} {"train_loss": -4.5418243408203125, "global_step": 5555, "epoch": 132} {"train_loss": -4.789668560028076, "global_step": 5556, "epoch": 132} {"train_loss": -4.623878002166748, "global_step": 5557, "epoch": 132} {"train_loss": -4.85707950592041, "global_step": 5558, "epoch": 132} {"train_loss": -4.698798179626465, "global_step": 5559, "epoch": 132} {"train_loss": -4.70498514175415, "global_step": 5560, "epoch": 132} {"train_loss": -4.744756698608398, "global_step": 5561, "epoch": 132} {"train_loss": -4.610813140869141, "global_step": 5562, "epoch": 132} {"train_loss": -4.793028831481934, "global_step": 5563, "epoch": 132} {"train_loss": -4.624467372894287, "global_step": 5564, "epoch": 132} {"train_loss": -4.661970615386963, "global_step": 5565, "epoch": 132} {"train_loss": -4.506287574768066, "global_step": 5566, "epoch": 132} {"train_loss": -4.390732765197754, "global_step": 5567, "epoch": 132} {"train_loss": -4.639821529388428, "global_step": 5568, "epoch": 132} {"train_loss": -4.727286338806152, "global_step": 5569, "epoch": 132} {"train_loss": -4.628639221191406, "global_step": 5570, "epoch": 132} {"train_loss": -4.552083969116211, "global_step": 5571, "epoch": 132} {"train_loss": -4.522764205932617, "global_step": 5572, "epoch": 132} {"train_loss": -4.652416229248047, "global_step": 5573, "epoch": 132} {"train_loss": -4.810481071472168, "global_step": 5574, "epoch": 132} {"train_loss": -4.673835754394531, "global_step": 5575, "epoch": 132} {"train_loss": -4.83768367767334, "global_step": 5576, "epoch": 132} {"train_loss": -4.652161598205566, "global_step": 5577, "epoch": 132} {"train_loss": -4.77299690246582, "global_step": 5578, "epoch": 132} {"train_loss": -4.66005277633667, "global_step": 5579, "epoch": 132} {"train_loss": -4.718592166900635, "global_step": 5580, "epoch": 132} {"train_loss": -4.754255294799805, "global_step": 5581, "epoch": 132} {"train_loss": -4.540319919586182, "global_step": 5582, "epoch": 132} {"train_loss": -4.788039207458496, "global_step": 5583, "epoch": 132} {"train_loss": -4.685711860656738, "global_step": 5584, "epoch": 132} {"train_loss": -4.669343301228115, "global_step": 5585, "epoch": 132, "val_loss": 90922.4140625} {"train_loss": -4.930330276489258, "global_step": 5586, "epoch": 133} {"train_loss": -4.721315383911133, "global_step": 5587, "epoch": 133} {"train_loss": -4.623378753662109, "global_step": 5588, "epoch": 133} {"train_loss": -4.661567211151123, "global_step": 5589, "epoch": 133} {"train_loss": -4.8224945068359375, "global_step": 5590, "epoch": 133} {"train_loss": -4.749516010284424, "global_step": 5591, "epoch": 133} {"train_loss": -4.578316688537598, "global_step": 5592, "epoch": 133} {"train_loss": -4.734436511993408, "global_step": 5593, "epoch": 133} {"train_loss": -4.852206230163574, "global_step": 5594, "epoch": 133} {"train_loss": -4.772724628448486, "global_step": 5595, "epoch": 133} {"train_loss": -4.6458282470703125, "global_step": 5596, "epoch": 133} {"train_loss": -4.753006458282471, "global_step": 5597, "epoch": 133} {"train_loss": -4.76975154876709, "global_step": 5598, "epoch": 133} {"train_loss": -4.756505012512207, "global_step": 5599, "epoch": 133} {"train_loss": -4.655147552490234, "global_step": 5600, "epoch": 133} {"train_loss": -4.829410076141357, "global_step": 5601, "epoch": 133} {"train_loss": -4.676181316375732, "global_step": 5602, "epoch": 133} {"train_loss": -4.8065080642700195, "global_step": 5603, "epoch": 133} {"train_loss": -4.73096227645874, "global_step": 5604, "epoch": 133} {"train_loss": -4.803741455078125, "global_step": 5605, "epoch": 133} {"train_loss": -4.727999687194824, "global_step": 5606, "epoch": 133} {"train_loss": -4.7905473709106445, "global_step": 5607, "epoch": 133} {"train_loss": -4.880866527557373, "global_step": 5608, "epoch": 133} {"train_loss": -4.772443771362305, "global_step": 5609, "epoch": 133} {"train_loss": -4.80927848815918, "global_step": 5610, "epoch": 133} {"train_loss": -4.674205780029297, "global_step": 5611, "epoch": 133} {"train_loss": -4.791210174560547, "global_step": 5612, "epoch": 133} {"train_loss": -4.798511028289795, "global_step": 5613, "epoch": 133} {"train_loss": -4.757702350616455, "global_step": 5614, "epoch": 133} {"train_loss": -4.690805912017822, "global_step": 5615, "epoch": 133} {"train_loss": -4.694512367248535, "global_step": 5616, "epoch": 133} {"train_loss": -4.529642581939697, "global_step": 5617, "epoch": 133} {"train_loss": -4.807795524597168, "global_step": 5618, "epoch": 133} {"train_loss": -4.755043029785156, "global_step": 5619, "epoch": 133} {"train_loss": -4.620673179626465, "global_step": 5620, "epoch": 133} {"train_loss": -4.6978864669799805, "global_step": 5621, "epoch": 133} {"train_loss": -4.789331912994385, "global_step": 5622, "epoch": 133} {"train_loss": -4.91654109954834, "global_step": 5623, "epoch": 133} {"train_loss": -4.82365608215332, "global_step": 5624, "epoch": 133} {"train_loss": -4.634899139404297, "global_step": 5625, "epoch": 133} {"train_loss": -4.757180690765381, "global_step": 5626, "epoch": 133} {"train_loss": -4.744204725537982, "global_step": 5627, "epoch": 133, "val_loss": 90027.6953125} {"train_loss": -4.792272567749023, "global_step": 5628, "epoch": 134} {"train_loss": -4.649054527282715, "global_step": 5629, "epoch": 134} {"train_loss": -4.81848669052124, "global_step": 5630, "epoch": 134} {"train_loss": -4.887479782104492, "global_step": 5631, "epoch": 134} {"train_loss": -4.721070766448975, "global_step": 5632, "epoch": 134} {"train_loss": -4.717439651489258, "global_step": 5633, "epoch": 134} {"train_loss": -4.831650733947754, "global_step": 5634, "epoch": 134} {"train_loss": -4.843006134033203, "global_step": 5635, "epoch": 134} {"train_loss": -4.872165679931641, "global_step": 5636, "epoch": 134} {"train_loss": -4.689911842346191, "global_step": 5637, "epoch": 134} {"train_loss": -4.625035285949707, "global_step": 5638, "epoch": 134} {"train_loss": -4.627085208892822, "global_step": 5639, "epoch": 134} {"train_loss": -4.657242774963379, "global_step": 5640, "epoch": 134} {"train_loss": -4.795960426330566, "global_step": 5641, "epoch": 134} {"train_loss": -4.816262245178223, "global_step": 5642, "epoch": 134} {"train_loss": -4.577871799468994, "global_step": 5643, "epoch": 134} {"train_loss": -4.729523658752441, "global_step": 5644, "epoch": 134} {"train_loss": -4.780428886413574, "global_step": 5645, "epoch": 134} {"train_loss": -4.827458381652832, "global_step": 5646, "epoch": 134} {"train_loss": -4.760984897613525, "global_step": 5647, "epoch": 134} {"train_loss": -4.833887100219727, "global_step": 5648, "epoch": 134} {"train_loss": -4.57407283782959, "global_step": 5649, "epoch": 134} {"train_loss": -4.826813697814941, "global_step": 5650, "epoch": 134} {"train_loss": -4.9275312423706055, "global_step": 5651, "epoch": 134} {"train_loss": -4.709529876708984, "global_step": 5652, "epoch": 134} {"train_loss": -4.624939918518066, "global_step": 5653, "epoch": 134} {"train_loss": -4.734209060668945, "global_step": 5654, "epoch": 134} {"train_loss": -4.834368705749512, "global_step": 5655, "epoch": 134} {"train_loss": -4.6415934562683105, "global_step": 5656, "epoch": 134} {"train_loss": -4.571681976318359, "global_step": 5657, "epoch": 134} {"train_loss": -4.78078556060791, "global_step": 5658, "epoch": 134} {"train_loss": -4.483774185180664, "global_step": 5659, "epoch": 134} {"train_loss": -4.387186050415039, "global_step": 5660, "epoch": 134} {"train_loss": -4.606499671936035, "global_step": 5661, "epoch": 134} {"train_loss": -4.620916366577148, "global_step": 5662, "epoch": 134} {"train_loss": -4.666180610656738, "global_step": 5663, "epoch": 134} {"train_loss": -4.644117832183838, "global_step": 5664, "epoch": 134} {"train_loss": -4.705950736999512, "global_step": 5665, "epoch": 134} {"train_loss": -4.664700031280518, "global_step": 5666, "epoch": 134} {"train_loss": -4.600569725036621, "global_step": 5667, "epoch": 134} {"train_loss": -4.798854827880859, "global_step": 5668, "epoch": 134} {"train_loss": -4.713909376235235, "global_step": 5669, "epoch": 134, "val_loss": 91616.515625} {"train_loss": -4.535788536071777, "global_step": 5670, "epoch": 135} {"train_loss": -4.8240180015563965, "global_step": 5671, "epoch": 135} {"train_loss": -4.9531683921813965, "global_step": 5672, "epoch": 135} {"train_loss": -4.721286773681641, "global_step": 5673, "epoch": 135} {"train_loss": -4.829387187957764, "global_step": 5674, "epoch": 135} {"train_loss": -4.7103681564331055, "global_step": 5675, "epoch": 135} {"train_loss": -4.824077606201172, "global_step": 5676, "epoch": 135} {"train_loss": -4.822742462158203, "global_step": 5677, "epoch": 135} {"train_loss": -4.847128868103027, "global_step": 5678, "epoch": 135} {"train_loss": -4.773438930511475, "global_step": 5679, "epoch": 135} {"train_loss": -4.514493942260742, "global_step": 5680, "epoch": 135} {"train_loss": -4.588638782501221, "global_step": 5681, "epoch": 135} {"train_loss": -4.773174285888672, "global_step": 5682, "epoch": 135} {"train_loss": -4.792191505432129, "global_step": 5683, "epoch": 135} {"train_loss": -4.66236686706543, "global_step": 5684, "epoch": 135} {"train_loss": -4.604429721832275, "global_step": 5685, "epoch": 135} {"train_loss": -4.795775413513184, "global_step": 5686, "epoch": 135} {"train_loss": -4.710420608520508, "global_step": 5687, "epoch": 135} {"train_loss": -4.418535232543945, "global_step": 5688, "epoch": 135} {"train_loss": -4.651171684265137, "global_step": 5689, "epoch": 135} {"train_loss": -4.6360368728637695, "global_step": 5690, "epoch": 135} {"train_loss": -4.569685935974121, "global_step": 5691, "epoch": 135} {"train_loss": -4.6618852615356445, "global_step": 5692, "epoch": 135} {"train_loss": -4.550995826721191, "global_step": 5693, "epoch": 135} {"train_loss": -4.541419982910156, "global_step": 5694, "epoch": 135} {"train_loss": -4.642971992492676, "global_step": 5695, "epoch": 135} {"train_loss": -4.690399169921875, "global_step": 5696, "epoch": 135} {"train_loss": -4.637395858764648, "global_step": 5697, "epoch": 135} {"train_loss": -4.802241325378418, "global_step": 5698, "epoch": 135} {"train_loss": -4.604649543762207, "global_step": 5699, "epoch": 135} {"train_loss": -4.672741413116455, "global_step": 5700, "epoch": 135} {"train_loss": -4.904407978057861, "global_step": 5701, "epoch": 135} {"train_loss": -4.7431535720825195, "global_step": 5702, "epoch": 135} {"train_loss": -4.839597702026367, "global_step": 5703, "epoch": 135} {"train_loss": -4.759279251098633, "global_step": 5704, "epoch": 135} {"train_loss": -4.6991167068481445, "global_step": 5705, "epoch": 135} {"train_loss": -4.807032585144043, "global_step": 5706, "epoch": 135} {"train_loss": -4.785426139831543, "global_step": 5707, "epoch": 135} {"train_loss": -4.77036190032959, "global_step": 5708, "epoch": 135} {"train_loss": -4.707584857940674, "global_step": 5709, "epoch": 135} {"train_loss": -4.7556610107421875, "global_step": 5710, "epoch": 135} {"train_loss": -4.70662614277431, "global_step": 5711, "epoch": 135, "val_loss": 90235.4453125} {"train_loss": -4.690529823303223, "global_step": 5712, "epoch": 136} {"train_loss": -4.685000419616699, "global_step": 5713, "epoch": 136} {"train_loss": -4.562382221221924, "global_step": 5714, "epoch": 136} {"train_loss": -4.747303009033203, "global_step": 5715, "epoch": 136} {"train_loss": -4.7166595458984375, "global_step": 5716, "epoch": 136} {"train_loss": -4.447661399841309, "global_step": 5717, "epoch": 136} {"train_loss": -4.668247222900391, "global_step": 5718, "epoch": 136} {"train_loss": -4.684986114501953, "global_step": 5719, "epoch": 136} {"train_loss": -4.650882720947266, "global_step": 5720, "epoch": 136} {"train_loss": -4.728200912475586, "global_step": 5721, "epoch": 136} {"train_loss": -4.786804676055908, "global_step": 5722, "epoch": 136} {"train_loss": -4.571591377258301, "global_step": 5723, "epoch": 136} {"train_loss": -4.812468528747559, "global_step": 5724, "epoch": 136} {"train_loss": -4.715645790100098, "global_step": 5725, "epoch": 136} {"train_loss": -4.509296894073486, "global_step": 5726, "epoch": 136} {"train_loss": -4.7022600173950195, "global_step": 5727, "epoch": 136} {"train_loss": -4.628532886505127, "global_step": 5728, "epoch": 136} {"train_loss": -4.688729286193848, "global_step": 5729, "epoch": 136} {"train_loss": -4.709181785583496, "global_step": 5730, "epoch": 136} {"train_loss": -4.811306953430176, "global_step": 5731, "epoch": 136} {"train_loss": -4.778040409088135, "global_step": 5732, "epoch": 136} {"train_loss": -4.76895809173584, "global_step": 5733, "epoch": 136} {"train_loss": -4.854681968688965, "global_step": 5734, "epoch": 136} {"train_loss": -5.02065372467041, "global_step": 5735, "epoch": 136} {"train_loss": -4.872895240783691, "global_step": 5736, "epoch": 136} {"train_loss": -4.800233840942383, "global_step": 5737, "epoch": 136} {"train_loss": -4.7010345458984375, "global_step": 5738, "epoch": 136} {"train_loss": -4.742682456970215, "global_step": 5739, "epoch": 136} {"train_loss": -4.916984558105469, "global_step": 5740, "epoch": 136} {"train_loss": -4.7586212158203125, "global_step": 5741, "epoch": 136} {"train_loss": -4.636739730834961, "global_step": 5742, "epoch": 136} {"train_loss": -4.921106338500977, "global_step": 5743, "epoch": 136} {"train_loss": -4.799141883850098, "global_step": 5744, "epoch": 136} {"train_loss": -4.830209732055664, "global_step": 5745, "epoch": 136} {"train_loss": -4.786346435546875, "global_step": 5746, "epoch": 136} {"train_loss": -4.841014862060547, "global_step": 5747, "epoch": 136} {"train_loss": -4.568762302398682, "global_step": 5748, "epoch": 136} {"train_loss": -4.9231367111206055, "global_step": 5749, "epoch": 136} {"train_loss": -4.703209400177002, "global_step": 5750, "epoch": 136} {"train_loss": -4.767424583435059, "global_step": 5751, "epoch": 136} {"train_loss": -4.777957439422607, "global_step": 5752, "epoch": 136} {"train_loss": -4.7371426196325395, "global_step": 5753, "epoch": 136, "val_loss": 89509.4375} {"train_loss": -4.764805793762207, "global_step": 5754, "epoch": 137} {"train_loss": -4.682100296020508, "global_step": 5755, "epoch": 137} {"train_loss": -4.770869255065918, "global_step": 5756, "epoch": 137} {"train_loss": -4.843077659606934, "global_step": 5757, "epoch": 137} {"train_loss": -4.908857345581055, "global_step": 5758, "epoch": 137} {"train_loss": -4.787955284118652, "global_step": 5759, "epoch": 137} {"train_loss": -4.813592910766602, "global_step": 5760, "epoch": 137} {"train_loss": -4.772584438323975, "global_step": 5761, "epoch": 137} {"train_loss": -4.788382530212402, "global_step": 5762, "epoch": 137} {"train_loss": -4.805300712585449, "global_step": 5763, "epoch": 137} {"train_loss": -4.956151962280273, "global_step": 5764, "epoch": 137} {"train_loss": -4.804237365722656, "global_step": 5765, "epoch": 137} {"train_loss": -4.593832969665527, "global_step": 5766, "epoch": 137} {"train_loss": -4.653966903686523, "global_step": 5767, "epoch": 137} {"train_loss": -4.86762809753418, "global_step": 5768, "epoch": 137} {"train_loss": -4.624202728271484, "global_step": 5769, "epoch": 137} {"train_loss": -4.612710952758789, "global_step": 5770, "epoch": 137} {"train_loss": -4.726593494415283, "global_step": 5771, "epoch": 137} {"train_loss": -4.708373069763184, "global_step": 5772, "epoch": 137} {"train_loss": -4.587675094604492, "global_step": 5773, "epoch": 137} {"train_loss": -4.6679182052612305, "global_step": 5774, "epoch": 137} {"train_loss": -4.6648359298706055, "global_step": 5775, "epoch": 137} {"train_loss": -4.848813056945801, "global_step": 5776, "epoch": 137} {"train_loss": -4.623664855957031, "global_step": 5777, "epoch": 137} {"train_loss": -4.735714435577393, "global_step": 5778, "epoch": 137} {"train_loss": -4.613717079162598, "global_step": 5779, "epoch": 137} {"train_loss": -4.599207878112793, "global_step": 5780, "epoch": 137} {"train_loss": -4.620118141174316, "global_step": 5781, "epoch": 137} {"train_loss": -4.674942970275879, "global_step": 5782, "epoch": 137} {"train_loss": -4.834395408630371, "global_step": 5783, "epoch": 137} {"train_loss": -4.718261241912842, "global_step": 5784, "epoch": 137} {"train_loss": -4.771506309509277, "global_step": 5785, "epoch": 137} {"train_loss": -4.649837017059326, "global_step": 5786, "epoch": 137} {"train_loss": -4.6666154861450195, "global_step": 5787, "epoch": 137} {"train_loss": -4.584997177124023, "global_step": 5788, "epoch": 137} {"train_loss": -4.612161159515381, "global_step": 5789, "epoch": 137} {"train_loss": -4.676736831665039, "global_step": 5790, "epoch": 137} {"train_loss": -4.846445083618164, "global_step": 5791, "epoch": 137} {"train_loss": -4.870429039001465, "global_step": 5792, "epoch": 137} {"train_loss": -4.765259742736816, "global_step": 5793, "epoch": 137} {"train_loss": -4.802125930786133, "global_step": 5794, "epoch": 137} {"train_loss": -4.731554576328823, "global_step": 5795, "epoch": 137, "val_loss": 89416.8203125} {"train_loss": -4.670763969421387, "global_step": 5796, "epoch": 138} {"train_loss": -4.886056900024414, "global_step": 5797, "epoch": 138} {"train_loss": -4.86472749710083, "global_step": 5798, "epoch": 138} {"train_loss": -4.917184829711914, "global_step": 5799, "epoch": 138} {"train_loss": -4.81494140625, "global_step": 5800, "epoch": 138} {"train_loss": -4.897582054138184, "global_step": 5801, "epoch": 138} {"train_loss": -4.79827880859375, "global_step": 5802, "epoch": 138} {"train_loss": -4.749380588531494, "global_step": 5803, "epoch": 138} {"train_loss": -4.588192462921143, "global_step": 5804, "epoch": 138} {"train_loss": -4.832703590393066, "global_step": 5805, "epoch": 138} {"train_loss": -4.545977592468262, "global_step": 5806, "epoch": 138} {"train_loss": -4.643244743347168, "global_step": 5807, "epoch": 138} {"train_loss": -4.716351509094238, "global_step": 5808, "epoch": 138} {"train_loss": -4.883694171905518, "global_step": 5809, "epoch": 138} {"train_loss": -4.593099594116211, "global_step": 5810, "epoch": 138} {"train_loss": -4.780204772949219, "global_step": 5811, "epoch": 138} {"train_loss": -4.848552227020264, "global_step": 5812, "epoch": 138} {"train_loss": -4.768798828125, "global_step": 5813, "epoch": 138} {"train_loss": -4.823724746704102, "global_step": 5814, "epoch": 138} {"train_loss": -4.748058795928955, "global_step": 5815, "epoch": 138} {"train_loss": -4.739290237426758, "global_step": 5816, "epoch": 138} {"train_loss": -4.596558094024658, "global_step": 5817, "epoch": 138} {"train_loss": -4.80466365814209, "global_step": 5818, "epoch": 138} {"train_loss": -4.810454368591309, "global_step": 5819, "epoch": 138} {"train_loss": -4.8346147537231445, "global_step": 5820, "epoch": 138} {"train_loss": -4.747221946716309, "global_step": 5821, "epoch": 138} {"train_loss": -4.7615556716918945, "global_step": 5822, "epoch": 138} {"train_loss": -4.890224456787109, "global_step": 5823, "epoch": 138} {"train_loss": -4.852514266967773, "global_step": 5824, "epoch": 138} {"train_loss": -4.790626525878906, "global_step": 5825, "epoch": 138} {"train_loss": -4.782938480377197, "global_step": 5826, "epoch": 138} {"train_loss": -4.720519065856934, "global_step": 5827, "epoch": 138} {"train_loss": -4.713074207305908, "global_step": 5828, "epoch": 138} {"train_loss": -4.8478498458862305, "global_step": 5829, "epoch": 138} {"train_loss": -4.710634231567383, "global_step": 5830, "epoch": 138} {"train_loss": -4.600305557250977, "global_step": 5831, "epoch": 138} {"train_loss": -4.720303535461426, "global_step": 5832, "epoch": 138} {"train_loss": -4.908262252807617, "global_step": 5833, "epoch": 138} {"train_loss": -4.560930252075195, "global_step": 5834, "epoch": 138} {"train_loss": -4.7310991287231445, "global_step": 5835, "epoch": 138} {"train_loss": -4.820428371429443, "global_step": 5836, "epoch": 138} {"train_loss": -4.764103401274908, "global_step": 5837, "epoch": 138, "val_loss": 90459.21875} {"train_loss": -4.79340934753418, "global_step": 5838, "epoch": 139} {"train_loss": -4.633041858673096, "global_step": 5839, "epoch": 139} {"train_loss": -4.710866928100586, "global_step": 5840, "epoch": 139} {"train_loss": -4.653985977172852, "global_step": 5841, "epoch": 139} {"train_loss": -4.949516296386719, "global_step": 5842, "epoch": 139} {"train_loss": -4.646970748901367, "global_step": 5843, "epoch": 139} {"train_loss": -4.592099189758301, "global_step": 5844, "epoch": 139} {"train_loss": -4.531659126281738, "global_step": 5845, "epoch": 139} {"train_loss": -4.795704364776611, "global_step": 5846, "epoch": 139} {"train_loss": -4.757940292358398, "global_step": 5847, "epoch": 139} {"train_loss": -4.722359657287598, "global_step": 5848, "epoch": 139} {"train_loss": -4.680367469787598, "global_step": 5849, "epoch": 139} {"train_loss": -4.916815280914307, "global_step": 5850, "epoch": 139} {"train_loss": -4.776263236999512, "global_step": 5851, "epoch": 139} {"train_loss": -4.627463340759277, "global_step": 5852, "epoch": 139} {"train_loss": -4.729621410369873, "global_step": 5853, "epoch": 139} {"train_loss": -4.6714019775390625, "global_step": 5854, "epoch": 139} {"train_loss": -4.628792762756348, "global_step": 5855, "epoch": 139} {"train_loss": -4.600080490112305, "global_step": 5856, "epoch": 139} {"train_loss": -4.625677108764648, "global_step": 5857, "epoch": 139} {"train_loss": -4.756291389465332, "global_step": 5858, "epoch": 139} {"train_loss": -4.741241931915283, "global_step": 5859, "epoch": 139} {"train_loss": -4.743813514709473, "global_step": 5860, "epoch": 139} {"train_loss": -4.704767227172852, "global_step": 5861, "epoch": 139} {"train_loss": -4.888738632202148, "global_step": 5862, "epoch": 139} {"train_loss": -4.78749942779541, "global_step": 5863, "epoch": 139} {"train_loss": -4.759568214416504, "global_step": 5864, "epoch": 139} {"train_loss": -4.714156150817871, "global_step": 5865, "epoch": 139} {"train_loss": -4.784529685974121, "global_step": 5866, "epoch": 139} {"train_loss": -4.849291801452637, "global_step": 5867, "epoch": 139} {"train_loss": -4.850798606872559, "global_step": 5868, "epoch": 139} {"train_loss": -4.725925445556641, "global_step": 5869, "epoch": 139} {"train_loss": -4.746232032775879, "global_step": 5870, "epoch": 139} {"train_loss": -4.926484107971191, "global_step": 5871, "epoch": 139} {"train_loss": -4.608548164367676, "global_step": 5872, "epoch": 139} {"train_loss": -4.611066818237305, "global_step": 5873, "epoch": 139} {"train_loss": -4.7680511474609375, "global_step": 5874, "epoch": 139} {"train_loss": -4.81236457824707, "global_step": 5875, "epoch": 139} {"train_loss": -4.572786808013916, "global_step": 5876, "epoch": 139} {"train_loss": -4.787920951843262, "global_step": 5877, "epoch": 139} {"train_loss": -4.699179649353027, "global_step": 5878, "epoch": 139} {"train_loss": -4.7262267158145, "global_step": 5879, "epoch": 139, "val_loss": 88765.40625} {"train_loss": -4.734658718109131, "global_step": 5880, "epoch": 140} {"train_loss": -4.772613525390625, "global_step": 5881, "epoch": 140} {"train_loss": -4.473282814025879, "global_step": 5882, "epoch": 140} {"train_loss": -4.7570366859436035, "global_step": 5883, "epoch": 140} {"train_loss": -4.933351516723633, "global_step": 5884, "epoch": 140} {"train_loss": -4.707989692687988, "global_step": 5885, "epoch": 140} {"train_loss": -4.726228713989258, "global_step": 5886, "epoch": 140} {"train_loss": -4.6764678955078125, "global_step": 5887, "epoch": 140} {"train_loss": -4.722626686096191, "global_step": 5888, "epoch": 140} {"train_loss": -4.887603282928467, "global_step": 5889, "epoch": 140} {"train_loss": -4.733013153076172, "global_step": 5890, "epoch": 140} {"train_loss": -4.765418529510498, "global_step": 5891, "epoch": 140} {"train_loss": -4.776924133300781, "global_step": 5892, "epoch": 140} {"train_loss": -4.948594570159912, "global_step": 5893, "epoch": 140} {"train_loss": -4.747028350830078, "global_step": 5894, "epoch": 140} {"train_loss": -4.712092399597168, "global_step": 5895, "epoch": 140} {"train_loss": -4.849343299865723, "global_step": 5896, "epoch": 140} {"train_loss": -4.889352798461914, "global_step": 5897, "epoch": 140} {"train_loss": -4.662087917327881, "global_step": 5898, "epoch": 140} {"train_loss": -4.788573265075684, "global_step": 5899, "epoch": 140} {"train_loss": -4.7434797286987305, "global_step": 5900, "epoch": 140} {"train_loss": -4.874137878417969, "global_step": 5901, "epoch": 140} {"train_loss": -4.692688941955566, "global_step": 5902, "epoch": 140} {"train_loss": -4.775521278381348, "global_step": 5903, "epoch": 140} {"train_loss": -4.659946441650391, "global_step": 5904, "epoch": 140} {"train_loss": -4.768185615539551, "global_step": 5905, "epoch": 140} {"train_loss": -4.575279235839844, "global_step": 5906, "epoch": 140} {"train_loss": -4.641173362731934, "global_step": 5907, "epoch": 140} {"train_loss": -4.641783714294434, "global_step": 5908, "epoch": 140} {"train_loss": -4.701410293579102, "global_step": 5909, "epoch": 140} {"train_loss": -4.613356590270996, "global_step": 5910, "epoch": 140} {"train_loss": -4.59033203125, "global_step": 5911, "epoch": 140} {"train_loss": -4.6991682052612305, "global_step": 5912, "epoch": 140} {"train_loss": -4.63077974319458, "global_step": 5913, "epoch": 140} {"train_loss": -4.709809303283691, "global_step": 5914, "epoch": 140} {"train_loss": -4.811710357666016, "global_step": 5915, "epoch": 140} {"train_loss": -4.695797920227051, "global_step": 5916, "epoch": 140} {"train_loss": -4.455477714538574, "global_step": 5917, "epoch": 140} {"train_loss": -4.743183612823486, "global_step": 5918, "epoch": 140} {"train_loss": -4.705592632293701, "global_step": 5919, "epoch": 140} {"train_loss": -4.715570449829102, "global_step": 5920, "epoch": 140} {"train_loss": -4.725516750698998, "global_step": 5921, "epoch": 140, "val_loss": 88782.3046875} {"train_loss": -4.745348930358887, "global_step": 5922, "epoch": 141} {"train_loss": -4.850318908691406, "global_step": 5923, "epoch": 141} {"train_loss": -4.843132019042969, "global_step": 5924, "epoch": 141} {"train_loss": -4.810428619384766, "global_step": 5925, "epoch": 141} {"train_loss": -4.746060371398926, "global_step": 5926, "epoch": 141} {"train_loss": -4.809167861938477, "global_step": 5927, "epoch": 141} {"train_loss": -4.777303218841553, "global_step": 5928, "epoch": 141} {"train_loss": -4.759090423583984, "global_step": 5929, "epoch": 141} {"train_loss": -4.757877349853516, "global_step": 5930, "epoch": 141} {"train_loss": -4.598160743713379, "global_step": 5931, "epoch": 141} {"train_loss": -4.83763313293457, "global_step": 5932, "epoch": 141} {"train_loss": -4.796823501586914, "global_step": 5933, "epoch": 141} {"train_loss": -4.808494567871094, "global_step": 5934, "epoch": 141} {"train_loss": -4.82165002822876, "global_step": 5935, "epoch": 141} {"train_loss": -4.703815460205078, "global_step": 5936, "epoch": 141} {"train_loss": -4.746968746185303, "global_step": 5937, "epoch": 141} {"train_loss": -4.742155075073242, "global_step": 5938, "epoch": 141} {"train_loss": -4.912408351898193, "global_step": 5939, "epoch": 141} {"train_loss": -4.869037628173828, "global_step": 5940, "epoch": 141} {"train_loss": -4.74804162979126, "global_step": 5941, "epoch": 141} {"train_loss": -4.854762554168701, "global_step": 5942, "epoch": 141} {"train_loss": -4.800243377685547, "global_step": 5943, "epoch": 141} {"train_loss": -4.815149307250977, "global_step": 5944, "epoch": 141} {"train_loss": -4.818576812744141, "global_step": 5945, "epoch": 141} {"train_loss": -4.7719221115112305, "global_step": 5946, "epoch": 141} {"train_loss": -4.911993026733398, "global_step": 5947, "epoch": 141} {"train_loss": -4.748437881469727, "global_step": 5948, "epoch": 141} {"train_loss": -4.76478385925293, "global_step": 5949, "epoch": 141} {"train_loss": -4.737196922302246, "global_step": 5950, "epoch": 141} {"train_loss": -4.728634834289551, "global_step": 5951, "epoch": 141} {"train_loss": -4.8657026290893555, "global_step": 5952, "epoch": 141} {"train_loss": -4.951044082641602, "global_step": 5953, "epoch": 141} {"train_loss": -4.697678565979004, "global_step": 5954, "epoch": 141} {"train_loss": -4.948360919952393, "global_step": 5955, "epoch": 141} {"train_loss": -4.708710670471191, "global_step": 5956, "epoch": 141} {"train_loss": -4.802583694458008, "global_step": 5957, "epoch": 141} {"train_loss": -4.74188232421875, "global_step": 5958, "epoch": 141} {"train_loss": -4.5403971672058105, "global_step": 5959, "epoch": 141} {"train_loss": -4.495272636413574, "global_step": 5960, "epoch": 141} {"train_loss": -4.792184352874756, "global_step": 5961, "epoch": 141} {"train_loss": -4.506046772003174, "global_step": 5962, "epoch": 141} {"train_loss": -4.772721710659209, "global_step": 5963, "epoch": 141, "val_loss": 88848.1953125} {"train_loss": -4.829751968383789, "global_step": 5964, "epoch": 142} {"train_loss": -4.654442310333252, "global_step": 5965, "epoch": 142} {"train_loss": -4.80252742767334, "global_step": 5966, "epoch": 142} {"train_loss": -4.787909507751465, "global_step": 5967, "epoch": 142} {"train_loss": -4.905295372009277, "global_step": 5968, "epoch": 142} {"train_loss": -4.783164978027344, "global_step": 5969, "epoch": 142} {"train_loss": -4.755385398864746, "global_step": 5970, "epoch": 142} {"train_loss": -4.744095325469971, "global_step": 5971, "epoch": 142} {"train_loss": -4.679422378540039, "global_step": 5972, "epoch": 142} {"train_loss": -4.777225494384766, "global_step": 5973, "epoch": 142} {"train_loss": -4.799624443054199, "global_step": 5974, "epoch": 142} {"train_loss": -4.803775787353516, "global_step": 5975, "epoch": 142} {"train_loss": -4.861127853393555, "global_step": 5976, "epoch": 142} {"train_loss": -4.914176940917969, "global_step": 5977, "epoch": 142} {"train_loss": -4.718573093414307, "global_step": 5978, "epoch": 142} {"train_loss": -4.845330715179443, "global_step": 5979, "epoch": 142} {"train_loss": -4.875187873840332, "global_step": 5980, "epoch": 142} {"train_loss": -4.865711212158203, "global_step": 5981, "epoch": 142} {"train_loss": -4.930882453918457, "global_step": 5982, "epoch": 142} {"train_loss": -4.698264122009277, "global_step": 5983, "epoch": 142} {"train_loss": -4.826075077056885, "global_step": 5984, "epoch": 142} {"train_loss": -4.889719009399414, "global_step": 5985, "epoch": 142} {"train_loss": -4.8249006271362305, "global_step": 5986, "epoch": 142} {"train_loss": -4.730886459350586, "global_step": 5987, "epoch": 142} {"train_loss": -4.860683917999268, "global_step": 5988, "epoch": 142} {"train_loss": -4.7834930419921875, "global_step": 5989, "epoch": 142} {"train_loss": -4.7655863761901855, "global_step": 5990, "epoch": 142} {"train_loss": -4.842922210693359, "global_step": 5991, "epoch": 142} {"train_loss": -4.644308567047119, "global_step": 5992, "epoch": 142} {"train_loss": -4.567966461181641, "global_step": 5993, "epoch": 142} {"train_loss": -4.665164470672607, "global_step": 5994, "epoch": 142} {"train_loss": -4.556695938110352, "global_step": 5995, "epoch": 142} {"train_loss": -4.7365007400512695, "global_step": 5996, "epoch": 142} {"train_loss": -4.834142684936523, "global_step": 5997, "epoch": 142} {"train_loss": -4.507004261016846, "global_step": 5998, "epoch": 142} {"train_loss": -4.315488815307617, "global_step": 5999, "epoch": 142} {"train_loss": -4.7059125900268555, "global_step": 6000, "epoch": 142} {"train_loss": -4.643960952758789, "global_step": 6001, "epoch": 142} {"train_loss": -4.501757621765137, "global_step": 6002, "epoch": 142} {"train_loss": -4.864893913269043, "global_step": 6003, "epoch": 142} {"train_loss": -4.5433454513549805, "global_step": 6004, "epoch": 142} {"train_loss": -4.749782789321173, "global_step": 6005, "epoch": 142, "val_loss": 91087.359375} {"train_loss": -4.589654922485352, "global_step": 6006, "epoch": 143} {"train_loss": -4.646432399749756, "global_step": 6007, "epoch": 143} {"train_loss": -4.715716361999512, "global_step": 6008, "epoch": 143} {"train_loss": -4.593212604522705, "global_step": 6009, "epoch": 143} {"train_loss": -4.8429718017578125, "global_step": 6010, "epoch": 143} {"train_loss": -4.64222526550293, "global_step": 6011, "epoch": 143} {"train_loss": -4.754709243774414, "global_step": 6012, "epoch": 143} {"train_loss": -4.719213485717773, "global_step": 6013, "epoch": 143} {"train_loss": -4.709082126617432, "global_step": 6014, "epoch": 143} {"train_loss": -4.480440139770508, "global_step": 6015, "epoch": 143} {"train_loss": -4.74049711227417, "global_step": 6016, "epoch": 143} {"train_loss": -4.628061294555664, "global_step": 6017, "epoch": 143} {"train_loss": -4.759525299072266, "global_step": 6018, "epoch": 143} {"train_loss": -4.643007278442383, "global_step": 6019, "epoch": 143} {"train_loss": -4.544631481170654, "global_step": 6020, "epoch": 143} {"train_loss": -4.568953514099121, "global_step": 6021, "epoch": 143} {"train_loss": -4.450873374938965, "global_step": 6022, "epoch": 143} {"train_loss": -4.774879455566406, "global_step": 6023, "epoch": 143} {"train_loss": -4.53096866607666, "global_step": 6024, "epoch": 143} {"train_loss": -4.598548889160156, "global_step": 6025, "epoch": 143} {"train_loss": -4.65946102142334, "global_step": 6026, "epoch": 143} {"train_loss": -4.66412353515625, "global_step": 6027, "epoch": 143} {"train_loss": -4.725324630737305, "global_step": 6028, "epoch": 143} {"train_loss": -4.563880920410156, "global_step": 6029, "epoch": 143} {"train_loss": -4.559579372406006, "global_step": 6030, "epoch": 143} {"train_loss": -4.815728187561035, "global_step": 6031, "epoch": 143} {"train_loss": -4.585514068603516, "global_step": 6032, "epoch": 143} {"train_loss": -4.650455951690674, "global_step": 6033, "epoch": 143} {"train_loss": -4.587794780731201, "global_step": 6034, "epoch": 143} {"train_loss": -4.496551513671875, "global_step": 6035, "epoch": 143} {"train_loss": -4.722837448120117, "global_step": 6036, "epoch": 143} {"train_loss": -4.531105041503906, "global_step": 6037, "epoch": 143} {"train_loss": -4.676844120025635, "global_step": 6038, "epoch": 143} {"train_loss": -4.9440016746521, "global_step": 6039, "epoch": 143} {"train_loss": -4.743855953216553, "global_step": 6040, "epoch": 143} {"train_loss": -4.713809967041016, "global_step": 6041, "epoch": 143} {"train_loss": -4.6525983810424805, "global_step": 6042, "epoch": 143} {"train_loss": -4.578520774841309, "global_step": 6043, "epoch": 143} {"train_loss": -4.298025131225586, "global_step": 6044, "epoch": 143} {"train_loss": -4.222787380218506, "global_step": 6045, "epoch": 143} {"train_loss": -4.674037933349609, "global_step": 6046, "epoch": 143} {"train_loss": -4.633480015255156, "global_step": 6047, "epoch": 143, "val_loss": 92709.3671875} {"train_loss": -4.3101887702941895, "global_step": 6048, "epoch": 144} {"train_loss": -4.714732646942139, "global_step": 6049, "epoch": 144} {"train_loss": -4.6685028076171875, "global_step": 6050, "epoch": 144} {"train_loss": -4.662590026855469, "global_step": 6051, "epoch": 144} {"train_loss": -4.680462837219238, "global_step": 6052, "epoch": 144} {"train_loss": -4.696114540100098, "global_step": 6053, "epoch": 144} {"train_loss": -4.742307662963867, "global_step": 6054, "epoch": 144} {"train_loss": -4.650844573974609, "global_step": 6055, "epoch": 144} {"train_loss": -4.804141044616699, "global_step": 6056, "epoch": 144} {"train_loss": -4.722698211669922, "global_step": 6057, "epoch": 144} {"train_loss": -4.772491455078125, "global_step": 6058, "epoch": 144} {"train_loss": -4.82272481918335, "global_step": 6059, "epoch": 144} {"train_loss": -4.706530570983887, "global_step": 6060, "epoch": 144} {"train_loss": -4.890242576599121, "global_step": 6061, "epoch": 144} {"train_loss": -4.820350170135498, "global_step": 6062, "epoch": 144} {"train_loss": -4.799958229064941, "global_step": 6063, "epoch": 144} {"train_loss": -4.77729606628418, "global_step": 6064, "epoch": 144} {"train_loss": -4.826104640960693, "global_step": 6065, "epoch": 144} {"train_loss": -4.761084079742432, "global_step": 6066, "epoch": 144} {"train_loss": -4.8476104736328125, "global_step": 6067, "epoch": 144} {"train_loss": -4.814205169677734, "global_step": 6068, "epoch": 144} {"train_loss": -4.812957763671875, "global_step": 6069, "epoch": 144} {"train_loss": -4.728884696960449, "global_step": 6070, "epoch": 144} {"train_loss": -4.710522651672363, "global_step": 6071, "epoch": 144} {"train_loss": -4.857195854187012, "global_step": 6072, "epoch": 144} {"train_loss": -4.726254940032959, "global_step": 6073, "epoch": 144} {"train_loss": -4.8301591873168945, "global_step": 6074, "epoch": 144} {"train_loss": -4.844815731048584, "global_step": 6075, "epoch": 144} {"train_loss": -4.920076370239258, "global_step": 6076, "epoch": 144} {"train_loss": -4.833930969238281, "global_step": 6077, "epoch": 144} {"train_loss": -4.904618740081787, "global_step": 6078, "epoch": 144} {"train_loss": -4.840063571929932, "global_step": 6079, "epoch": 144} {"train_loss": -4.7731032371521, "global_step": 6080, "epoch": 144} {"train_loss": -4.903069019317627, "global_step": 6081, "epoch": 144} {"train_loss": -4.759556770324707, "global_step": 6082, "epoch": 144} {"train_loss": -4.731686592102051, "global_step": 6083, "epoch": 144} {"train_loss": -4.657676696777344, "global_step": 6084, "epoch": 144} {"train_loss": -4.839205265045166, "global_step": 6085, "epoch": 144} {"train_loss": -4.995933532714844, "global_step": 6086, "epoch": 144} {"train_loss": -4.876181602478027, "global_step": 6087, "epoch": 144} {"train_loss": -4.725344181060791, "global_step": 6088, "epoch": 144} {"train_loss": -4.773294937042963, "global_step": 6089, "epoch": 144, "val_loss": 87648.46875} {"train_loss": -4.921535491943359, "global_step": 6090, "epoch": 145} {"train_loss": -4.925943851470947, "global_step": 6091, "epoch": 145} {"train_loss": -4.815088272094727, "global_step": 6092, "epoch": 145} {"train_loss": -4.6232428550720215, "global_step": 6093, "epoch": 145} {"train_loss": -4.7978410720825195, "global_step": 6094, "epoch": 145} {"train_loss": -4.841997146606445, "global_step": 6095, "epoch": 145} {"train_loss": -4.71533203125, "global_step": 6096, "epoch": 145} {"train_loss": -4.672449111938477, "global_step": 6097, "epoch": 145} {"train_loss": -4.681238174438477, "global_step": 6098, "epoch": 145} {"train_loss": -4.681060791015625, "global_step": 6099, "epoch": 145} {"train_loss": -4.850875377655029, "global_step": 6100, "epoch": 145} {"train_loss": -4.766361236572266, "global_step": 6101, "epoch": 145} {"train_loss": -4.778703689575195, "global_step": 6102, "epoch": 145} {"train_loss": -4.723201274871826, "global_step": 6103, "epoch": 145} {"train_loss": -4.863819599151611, "global_step": 6104, "epoch": 145} {"train_loss": -4.924838542938232, "global_step": 6105, "epoch": 145} {"train_loss": -4.7652764320373535, "global_step": 6106, "epoch": 145} {"train_loss": -4.788932800292969, "global_step": 6107, "epoch": 145} {"train_loss": -4.781067848205566, "global_step": 6108, "epoch": 145} {"train_loss": -4.849311351776123, "global_step": 6109, "epoch": 145} {"train_loss": -4.890474319458008, "global_step": 6110, "epoch": 145} {"train_loss": -4.707440376281738, "global_step": 6111, "epoch": 145} {"train_loss": -4.769104957580566, "global_step": 6112, "epoch": 145} {"train_loss": -4.946489334106445, "global_step": 6113, "epoch": 145} {"train_loss": -4.934812545776367, "global_step": 6114, "epoch": 145} {"train_loss": -4.960952281951904, "global_step": 6115, "epoch": 145} {"train_loss": -4.886297702789307, "global_step": 6116, "epoch": 145} {"train_loss": -4.759826183319092, "global_step": 6117, "epoch": 145} {"train_loss": -4.718482494354248, "global_step": 6118, "epoch": 145} {"train_loss": -4.750324249267578, "global_step": 6119, "epoch": 145} {"train_loss": -5.032790184020996, "global_step": 6120, "epoch": 145} {"train_loss": -4.872899055480957, "global_step": 6121, "epoch": 145} {"train_loss": -4.806473731994629, "global_step": 6122, "epoch": 145} {"train_loss": -4.857120037078857, "global_step": 6123, "epoch": 145} {"train_loss": -4.922310829162598, "global_step": 6124, "epoch": 145} {"train_loss": -4.728472709655762, "global_step": 6125, "epoch": 145} {"train_loss": -4.731121063232422, "global_step": 6126, "epoch": 145} {"train_loss": -4.773907661437988, "global_step": 6127, "epoch": 145} {"train_loss": -4.955681800842285, "global_step": 6128, "epoch": 145} {"train_loss": -4.832983493804932, "global_step": 6129, "epoch": 145} {"train_loss": -4.580434799194336, "global_step": 6130, "epoch": 145} {"train_loss": -4.805242107028053, "global_step": 6131, "epoch": 145, "val_loss": 88111.21875} {"train_loss": -4.788853645324707, "global_step": 6132, "epoch": 146} {"train_loss": -4.720475673675537, "global_step": 6133, "epoch": 146} {"train_loss": -4.609685897827148, "global_step": 6134, "epoch": 146} {"train_loss": -4.871504783630371, "global_step": 6135, "epoch": 146} {"train_loss": -4.639547348022461, "global_step": 6136, "epoch": 146} {"train_loss": -4.806055545806885, "global_step": 6137, "epoch": 146} {"train_loss": -4.7364935874938965, "global_step": 6138, "epoch": 146} {"train_loss": -4.36068058013916, "global_step": 6139, "epoch": 146} {"train_loss": -4.617527961730957, "global_step": 6140, "epoch": 146} {"train_loss": -4.701371669769287, "global_step": 6141, "epoch": 146} {"train_loss": -4.756113052368164, "global_step": 6142, "epoch": 146} {"train_loss": -4.623887538909912, "global_step": 6143, "epoch": 146} {"train_loss": -4.711263656616211, "global_step": 6144, "epoch": 146} {"train_loss": -4.775702476501465, "global_step": 6145, "epoch": 146} {"train_loss": -4.76776123046875, "global_step": 6146, "epoch": 146} {"train_loss": -4.775362014770508, "global_step": 6147, "epoch": 146} {"train_loss": -4.824224472045898, "global_step": 6148, "epoch": 146} {"train_loss": -4.854565620422363, "global_step": 6149, "epoch": 146} {"train_loss": -4.709247589111328, "global_step": 6150, "epoch": 146} {"train_loss": -4.775124549865723, "global_step": 6151, "epoch": 146} {"train_loss": -4.965494155883789, "global_step": 6152, "epoch": 146} {"train_loss": -4.767841339111328, "global_step": 6153, "epoch": 146} {"train_loss": -4.889625549316406, "global_step": 6154, "epoch": 146} {"train_loss": -4.795482635498047, "global_step": 6155, "epoch": 146} {"train_loss": -4.855015277862549, "global_step": 6156, "epoch": 146} {"train_loss": -4.894003868103027, "global_step": 6157, "epoch": 146} {"train_loss": -4.82432746887207, "global_step": 6158, "epoch": 146} {"train_loss": -4.763034820556641, "global_step": 6159, "epoch": 146} {"train_loss": -4.796738147735596, "global_step": 6160, "epoch": 146} {"train_loss": -4.781548500061035, "global_step": 6161, "epoch": 146} {"train_loss": -4.786653518676758, "global_step": 6162, "epoch": 146} {"train_loss": -4.958752155303955, "global_step": 6163, "epoch": 146} {"train_loss": -4.887149333953857, "global_step": 6164, "epoch": 146} {"train_loss": -4.873601913452148, "global_step": 6165, "epoch": 146} {"train_loss": -4.711037635803223, "global_step": 6166, "epoch": 146} {"train_loss": -4.7891340255737305, "global_step": 6167, "epoch": 146} {"train_loss": -4.722143173217773, "global_step": 6168, "epoch": 146} {"train_loss": -4.82525634765625, "global_step": 6169, "epoch": 146} {"train_loss": -4.8885178565979, "global_step": 6170, "epoch": 146} {"train_loss": -4.7273173332214355, "global_step": 6171, "epoch": 146} {"train_loss": -4.621175289154053, "global_step": 6172, "epoch": 146} {"train_loss": -4.7687897228059315, "global_step": 6173, "epoch": 146, "val_loss": 87603.1875} {"train_loss": -4.802096366882324, "global_step": 6174, "epoch": 147} {"train_loss": -4.845457077026367, "global_step": 6175, "epoch": 147} {"train_loss": -4.83180046081543, "global_step": 6176, "epoch": 147} {"train_loss": -4.773859024047852, "global_step": 6177, "epoch": 147} {"train_loss": -4.791632652282715, "global_step": 6178, "epoch": 147} {"train_loss": -4.786096572875977, "global_step": 6179, "epoch": 147} {"train_loss": -4.738922595977783, "global_step": 6180, "epoch": 147} {"train_loss": -4.881718635559082, "global_step": 6181, "epoch": 147} {"train_loss": -4.769064903259277, "global_step": 6182, "epoch": 147} {"train_loss": -4.917165279388428, "global_step": 6183, "epoch": 147} {"train_loss": -4.783827781677246, "global_step": 6184, "epoch": 147} {"train_loss": -4.6403937339782715, "global_step": 6185, "epoch": 147} {"train_loss": -4.716164588928223, "global_step": 6186, "epoch": 147} {"train_loss": -4.866291046142578, "global_step": 6187, "epoch": 147} {"train_loss": -4.806265830993652, "global_step": 6188, "epoch": 147} {"train_loss": -4.766159534454346, "global_step": 6189, "epoch": 147} {"train_loss": -4.605378150939941, "global_step": 6190, "epoch": 147} {"train_loss": -4.824283123016357, "global_step": 6191, "epoch": 147} {"train_loss": -5.008651256561279, "global_step": 6192, "epoch": 147} {"train_loss": -4.734622955322266, "global_step": 6193, "epoch": 147} {"train_loss": -4.581111431121826, "global_step": 6194, "epoch": 147} {"train_loss": -4.798425674438477, "global_step": 6195, "epoch": 147} {"train_loss": -4.794219970703125, "global_step": 6196, "epoch": 147} {"train_loss": -4.759152412414551, "global_step": 6197, "epoch": 147} {"train_loss": -4.655888557434082, "global_step": 6198, "epoch": 147} {"train_loss": -4.756285667419434, "global_step": 6199, "epoch": 147} {"train_loss": -4.796834468841553, "global_step": 6200, "epoch": 147} {"train_loss": -4.731416702270508, "global_step": 6201, "epoch": 147} {"train_loss": -4.829998970031738, "global_step": 6202, "epoch": 147} {"train_loss": -4.598079681396484, "global_step": 6203, "epoch": 147} {"train_loss": -4.514644622802734, "global_step": 6204, "epoch": 147} {"train_loss": -4.605215549468994, "global_step": 6205, "epoch": 147} {"train_loss": -4.542577266693115, "global_step": 6206, "epoch": 147} {"train_loss": -4.323501110076904, "global_step": 6207, "epoch": 147} {"train_loss": -4.478826522827148, "global_step": 6208, "epoch": 147} {"train_loss": -4.710397720336914, "global_step": 6209, "epoch": 147} {"train_loss": -4.628725051879883, "global_step": 6210, "epoch": 147} {"train_loss": -4.638334274291992, "global_step": 6211, "epoch": 147} {"train_loss": -4.847803115844727, "global_step": 6212, "epoch": 147} {"train_loss": -4.522883415222168, "global_step": 6213, "epoch": 147} {"train_loss": -4.753930568695068, "global_step": 6214, "epoch": 147} {"train_loss": -4.72797341573806, "global_step": 6215, "epoch": 147, "val_loss": 89634.6875} {"train_loss": -4.5677313804626465, "global_step": 6216, "epoch": 148} {"train_loss": -4.917852878570557, "global_step": 6217, "epoch": 148} {"train_loss": -4.776798248291016, "global_step": 6218, "epoch": 148} {"train_loss": -4.795822620391846, "global_step": 6219, "epoch": 148} {"train_loss": -4.846543312072754, "global_step": 6220, "epoch": 148} {"train_loss": -4.777710914611816, "global_step": 6221, "epoch": 148} {"train_loss": -4.829163551330566, "global_step": 6222, "epoch": 148} {"train_loss": -4.741147994995117, "global_step": 6223, "epoch": 148} {"train_loss": -4.8076066970825195, "global_step": 6224, "epoch": 148} {"train_loss": -4.722522735595703, "global_step": 6225, "epoch": 148} {"train_loss": -4.7899274826049805, "global_step": 6226, "epoch": 148} {"train_loss": -4.923620223999023, "global_step": 6227, "epoch": 148} {"train_loss": -4.8234734535217285, "global_step": 6228, "epoch": 148} {"train_loss": -4.7533159255981445, "global_step": 6229, "epoch": 148} {"train_loss": -4.909712791442871, "global_step": 6230, "epoch": 148} {"train_loss": -4.709738254547119, "global_step": 6231, "epoch": 148} {"train_loss": -4.894651889801025, "global_step": 6232, "epoch": 148} {"train_loss": -4.944211483001709, "global_step": 6233, "epoch": 148} {"train_loss": -4.80084753036499, "global_step": 6234, "epoch": 148} {"train_loss": -4.869533538818359, "global_step": 6235, "epoch": 148} {"train_loss": -4.71806526184082, "global_step": 6236, "epoch": 148} {"train_loss": -4.902751445770264, "global_step": 6237, "epoch": 148} {"train_loss": -4.798956871032715, "global_step": 6238, "epoch": 148} {"train_loss": -4.904600143432617, "global_step": 6239, "epoch": 148} {"train_loss": -4.69879674911499, "global_step": 6240, "epoch": 148} {"train_loss": -4.741700649261475, "global_step": 6241, "epoch": 148} {"train_loss": -4.672851085662842, "global_step": 6242, "epoch": 148} {"train_loss": -4.796133518218994, "global_step": 6243, "epoch": 148} {"train_loss": -4.911231994628906, "global_step": 6244, "epoch": 148} {"train_loss": -4.79969596862793, "global_step": 6245, "epoch": 148} {"train_loss": -4.619721412658691, "global_step": 6246, "epoch": 148} {"train_loss": -4.894489288330078, "global_step": 6247, "epoch": 148} {"train_loss": -4.818885326385498, "global_step": 6248, "epoch": 148} {"train_loss": -4.767860412597656, "global_step": 6249, "epoch": 148} {"train_loss": -4.8267598152160645, "global_step": 6250, "epoch": 148} {"train_loss": -4.720876693725586, "global_step": 6251, "epoch": 148} {"train_loss": -4.823531150817871, "global_step": 6252, "epoch": 148} {"train_loss": -4.845762729644775, "global_step": 6253, "epoch": 148} {"train_loss": -4.761772632598877, "global_step": 6254, "epoch": 148} {"train_loss": -4.985447883605957, "global_step": 6255, "epoch": 148} {"train_loss": -4.750053882598877, "global_step": 6256, "epoch": 148} {"train_loss": -4.803098020099458, "global_step": 6257, "epoch": 148, "val_loss": 87507.546875} {"train_loss": -5.0023908615112305, "global_step": 6258, "epoch": 149} {"train_loss": -4.872756481170654, "global_step": 6259, "epoch": 149} {"train_loss": -4.8820905685424805, "global_step": 6260, "epoch": 149} {"train_loss": -4.853140830993652, "global_step": 6261, "epoch": 149} {"train_loss": -4.980594635009766, "global_step": 6262, "epoch": 149} {"train_loss": -4.904301643371582, "global_step": 6263, "epoch": 149} {"train_loss": -4.755764007568359, "global_step": 6264, "epoch": 149} {"train_loss": -5.020444869995117, "global_step": 6265, "epoch": 149} {"train_loss": -4.9507904052734375, "global_step": 6266, "epoch": 149} {"train_loss": -4.801185607910156, "global_step": 6267, "epoch": 149} {"train_loss": -4.564614772796631, "global_step": 6268, "epoch": 149} {"train_loss": -4.623561859130859, "global_step": 6269, "epoch": 149} {"train_loss": -4.7710747718811035, "global_step": 6270, "epoch": 149} {"train_loss": -4.806522369384766, "global_step": 6271, "epoch": 149} {"train_loss": -4.750316619873047, "global_step": 6272, "epoch": 149} {"train_loss": -4.590388298034668, "global_step": 6273, "epoch": 149} {"train_loss": -4.909477710723877, "global_step": 6274, "epoch": 149} {"train_loss": -4.868776798248291, "global_step": 6275, "epoch": 149} {"train_loss": -4.8535919189453125, "global_step": 6276, "epoch": 149} {"train_loss": -4.7272796630859375, "global_step": 6277, "epoch": 149} {"train_loss": -4.784468173980713, "global_step": 6278, "epoch": 149} {"train_loss": -4.894585609436035, "global_step": 6279, "epoch": 149} {"train_loss": -4.894018173217773, "global_step": 6280, "epoch": 149} {"train_loss": -4.877306938171387, "global_step": 6281, "epoch": 149} {"train_loss": -4.877435207366943, "global_step": 6282, "epoch": 149} {"train_loss": -4.789734840393066, "global_step": 6283, "epoch": 149} {"train_loss": -4.835324287414551, "global_step": 6284, "epoch": 149} {"train_loss": -4.797904014587402, "global_step": 6285, "epoch": 149} {"train_loss": -4.611508846282959, "global_step": 6286, "epoch": 149} {"train_loss": -4.809455871582031, "global_step": 6287, "epoch": 149} {"train_loss": -4.818312644958496, "global_step": 6288, "epoch": 149} {"train_loss": -4.839895725250244, "global_step": 6289, "epoch": 149} {"train_loss": -4.72639799118042, "global_step": 6290, "epoch": 149} {"train_loss": -4.798556327819824, "global_step": 6291, "epoch": 149} {"train_loss": -4.877168655395508, "global_step": 6292, "epoch": 149} {"train_loss": -4.82741641998291, "global_step": 6293, "epoch": 149} {"train_loss": -4.763069152832031, "global_step": 6294, "epoch": 149} {"train_loss": -4.711908340454102, "global_step": 6295, "epoch": 149} {"train_loss": -4.811588764190674, "global_step": 6296, "epoch": 149} {"train_loss": -4.779636383056641, "global_step": 6297, "epoch": 149} {"train_loss": -4.691104888916016, "global_step": 6298, "epoch": 149} {"train_loss": -4.814472993214925, "global_step": 6299, "epoch": 149, "val_loss": 88239.1015625} {"train_loss": -4.862859725952148, "global_step": 6300, "epoch": 150} {"train_loss": -4.797651767730713, "global_step": 6301, "epoch": 150} {"train_loss": -4.884458541870117, "global_step": 6302, "epoch": 150} {"train_loss": -4.888747692108154, "global_step": 6303, "epoch": 150} {"train_loss": -4.781177520751953, "global_step": 6304, "epoch": 150} {"train_loss": -4.924322128295898, "global_step": 6305, "epoch": 150} {"train_loss": -4.825659275054932, "global_step": 6306, "epoch": 150} {"train_loss": -4.9415435791015625, "global_step": 6307, "epoch": 150} {"train_loss": -4.782758712768555, "global_step": 6308, "epoch": 150} {"train_loss": -4.660737037658691, "global_step": 6309, "epoch": 150} {"train_loss": -4.566107749938965, "global_step": 6310, "epoch": 150} {"train_loss": -4.815520763397217, "global_step": 6311, "epoch": 150} {"train_loss": -4.478769302368164, "global_step": 6312, "epoch": 150} {"train_loss": -4.7859649658203125, "global_step": 6313, "epoch": 150} {"train_loss": -4.731574058532715, "global_step": 6314, "epoch": 150} {"train_loss": -4.625588893890381, "global_step": 6315, "epoch": 150} {"train_loss": -4.657888412475586, "global_step": 6316, "epoch": 150} {"train_loss": -4.771684646606445, "global_step": 6317, "epoch": 150} {"train_loss": -4.7603230476379395, "global_step": 6318, "epoch": 150} {"train_loss": -4.780925750732422, "global_step": 6319, "epoch": 150} {"train_loss": -4.7795209884643555, "global_step": 6320, "epoch": 150} {"train_loss": -4.858965873718262, "global_step": 6321, "epoch": 150} {"train_loss": -4.784104347229004, "global_step": 6322, "epoch": 150} {"train_loss": -4.696897029876709, "global_step": 6323, "epoch": 150} {"train_loss": -4.904531478881836, "global_step": 6324, "epoch": 150} {"train_loss": -4.726093769073486, "global_step": 6325, "epoch": 150} {"train_loss": -4.751169681549072, "global_step": 6326, "epoch": 150} {"train_loss": -4.911667823791504, "global_step": 6327, "epoch": 150} {"train_loss": -4.78614616394043, "global_step": 6328, "epoch": 150} {"train_loss": -4.925875663757324, "global_step": 6329, "epoch": 150} {"train_loss": -4.793564796447754, "global_step": 6330, "epoch": 150} {"train_loss": -4.970770835876465, "global_step": 6331, "epoch": 150} {"train_loss": -4.856877326965332, "global_step": 6332, "epoch": 150} {"train_loss": -4.836854934692383, "global_step": 6333, "epoch": 150} {"train_loss": -4.9511308670043945, "global_step": 6334, "epoch": 150} {"train_loss": -4.842844009399414, "global_step": 6335, "epoch": 150} {"train_loss": -4.874210357666016, "global_step": 6336, "epoch": 150} {"train_loss": -4.740846633911133, "global_step": 6337, "epoch": 150} {"train_loss": -4.941093921661377, "global_step": 6338, "epoch": 150} {"train_loss": -4.894275188446045, "global_step": 6339, "epoch": 150} {"train_loss": -4.5406718254089355, "global_step": 6340, "epoch": 150} {"train_loss": -4.787387643541608, "global_step": 6341, "epoch": 150, "train/sim_max_reward_0": 0.21325103660534642, "train/sim_max_reward_1": 0.4103395139276148, "train/sim_max_reward_2": 0.0, "train/sim_max_reward_3": 0.06861576431134164, "train/sim_max_reward_4": 0.04938687401813976, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4500000": 0.33163505174200103, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 4.4198787184752127e-07, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.16797540324195048, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.05317574936726585, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.47930557987234185, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.5000684787350512, "test/sim_max_reward_4500015": 0.07136275466934977, "test/sim_max_reward_4500016": 0.016675763131935927, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.004249031229020703, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.3752085824140955, "test/sim_max_reward_4500022": 0.33035368716497726, "test/sim_max_reward_4500023": 0.5453055366789884, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.02635084550610397, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.48353801904864757, "test/sim_max_reward_4500028": 0.2770796558787026, "test/sim_max_reward_4500029": 0.04163460642148004, "test/sim_max_reward_4500030": 0.10314191947648461, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.09394670751391468, "test/sim_max_reward_4500035": 0.0943819760266492, "test/sim_max_reward_4500036": 0.40651615293262744, "test/sim_max_reward_4500037": 0.15817835675983746, "test/sim_max_reward_4500038": 0.1606878553606089, "test/sim_max_reward_4500039": 0.3645468431978834, "test/sim_max_reward_4500040": 0.013039280895794533, "test/sim_max_reward_4500041": 0.0, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.43341007942680854, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.11862867072865349, "test/sim_max_reward_4500046": 0.4795838903645092, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.05659722449734764, "train/mean_score": 0.15576299137077168, "test/mean_score": 0.1336945155506968, "val_loss": 88143.828125} {"train_loss": -4.723602771759033, "global_step": 6342, "epoch": 151} {"train_loss": -4.664151191711426, "global_step": 6343, "epoch": 151} {"train_loss": -4.513375282287598, "global_step": 6344, "epoch": 151} {"train_loss": -4.880579948425293, "global_step": 6345, "epoch": 151} {"train_loss": -4.775722980499268, "global_step": 6346, "epoch": 151} {"train_loss": -4.533194541931152, "global_step": 6347, "epoch": 151} {"train_loss": -4.5068206787109375, "global_step": 6348, "epoch": 151} {"train_loss": -4.589454650878906, "global_step": 6349, "epoch": 151} {"train_loss": -4.755970001220703, "global_step": 6350, "epoch": 151} {"train_loss": -4.717257499694824, "global_step": 6351, "epoch": 151} {"train_loss": -4.679717063903809, "global_step": 6352, "epoch": 151} {"train_loss": -4.703308582305908, "global_step": 6353, "epoch": 151} {"train_loss": -4.611715316772461, "global_step": 6354, "epoch": 151} {"train_loss": -4.769198894500732, "global_step": 6355, "epoch": 151} {"train_loss": -4.73845100402832, "global_step": 6356, "epoch": 151} {"train_loss": -4.740557670593262, "global_step": 6357, "epoch": 151} {"train_loss": -4.774103164672852, "global_step": 6358, "epoch": 151} {"train_loss": -4.882871627807617, "global_step": 6359, "epoch": 151} {"train_loss": -4.870719909667969, "global_step": 6360, "epoch": 151} {"train_loss": -4.788477897644043, "global_step": 6361, "epoch": 151} {"train_loss": -4.782061576843262, "global_step": 6362, "epoch": 151} {"train_loss": -4.789787292480469, "global_step": 6363, "epoch": 151} {"train_loss": -4.73520565032959, "global_step": 6364, "epoch": 151} {"train_loss": -4.910802841186523, "global_step": 6365, "epoch": 151} {"train_loss": -4.6804609298706055, "global_step": 6366, "epoch": 151} {"train_loss": -4.850997447967529, "global_step": 6367, "epoch": 151} {"train_loss": -4.871545791625977, "global_step": 6368, "epoch": 151} {"train_loss": -4.844436168670654, "global_step": 6369, "epoch": 151} {"train_loss": -4.798928737640381, "global_step": 6370, "epoch": 151} {"train_loss": -4.9814229011535645, "global_step": 6371, "epoch": 151} {"train_loss": -4.887171745300293, "global_step": 6372, "epoch": 151} {"train_loss": -4.729612827301025, "global_step": 6373, "epoch": 151} {"train_loss": -4.983769416809082, "global_step": 6374, "epoch": 151} {"train_loss": -4.798802375793457, "global_step": 6375, "epoch": 151} {"train_loss": -4.797813415527344, "global_step": 6376, "epoch": 151} {"train_loss": -4.736975193023682, "global_step": 6377, "epoch": 151} {"train_loss": -4.809910774230957, "global_step": 6378, "epoch": 151} {"train_loss": -5.005985736846924, "global_step": 6379, "epoch": 151} {"train_loss": -4.880368232727051, "global_step": 6380, "epoch": 151} {"train_loss": -4.802337646484375, "global_step": 6381, "epoch": 151} {"train_loss": -4.860012054443359, "global_step": 6382, "epoch": 151} {"train_loss": -4.774064949580601, "global_step": 6383, "epoch": 151, "val_loss": 88012.5390625} {"train_loss": -4.75468635559082, "global_step": 6384, "epoch": 152} {"train_loss": -4.819291114807129, "global_step": 6385, "epoch": 152} {"train_loss": -4.9970550537109375, "global_step": 6386, "epoch": 152} {"train_loss": -4.908005714416504, "global_step": 6387, "epoch": 152} {"train_loss": -4.776081562042236, "global_step": 6388, "epoch": 152} {"train_loss": -4.963131904602051, "global_step": 6389, "epoch": 152} {"train_loss": -4.910204887390137, "global_step": 6390, "epoch": 152} {"train_loss": -4.918752670288086, "global_step": 6391, "epoch": 152} {"train_loss": -4.884616851806641, "global_step": 6392, "epoch": 152} {"train_loss": -4.890700340270996, "global_step": 6393, "epoch": 152} {"train_loss": -4.814323902130127, "global_step": 6394, "epoch": 152} {"train_loss": -4.9638519287109375, "global_step": 6395, "epoch": 152} {"train_loss": -4.631976127624512, "global_step": 6396, "epoch": 152} {"train_loss": -4.708881378173828, "global_step": 6397, "epoch": 152} {"train_loss": -4.727447986602783, "global_step": 6398, "epoch": 152} {"train_loss": -5.013890266418457, "global_step": 6399, "epoch": 152} {"train_loss": -4.866410255432129, "global_step": 6400, "epoch": 152} {"train_loss": -4.768012046813965, "global_step": 6401, "epoch": 152} {"train_loss": -4.754243850708008, "global_step": 6402, "epoch": 152} {"train_loss": -4.8518290519714355, "global_step": 6403, "epoch": 152} {"train_loss": -4.893193244934082, "global_step": 6404, "epoch": 152} {"train_loss": -4.794004917144775, "global_step": 6405, "epoch": 152} {"train_loss": -4.707970142364502, "global_step": 6406, "epoch": 152} {"train_loss": -4.674691200256348, "global_step": 6407, "epoch": 152} {"train_loss": -4.760890960693359, "global_step": 6408, "epoch": 152} {"train_loss": -4.835437774658203, "global_step": 6409, "epoch": 152} {"train_loss": -4.765379905700684, "global_step": 6410, "epoch": 152} {"train_loss": -4.883195877075195, "global_step": 6411, "epoch": 152} {"train_loss": -4.681306838989258, "global_step": 6412, "epoch": 152} {"train_loss": -4.647228240966797, "global_step": 6413, "epoch": 152} {"train_loss": -4.7507405281066895, "global_step": 6414, "epoch": 152} {"train_loss": -4.745125770568848, "global_step": 6415, "epoch": 152} {"train_loss": -4.668251991271973, "global_step": 6416, "epoch": 152} {"train_loss": -4.646869659423828, "global_step": 6417, "epoch": 152} {"train_loss": -4.697823524475098, "global_step": 6418, "epoch": 152} {"train_loss": -4.824291229248047, "global_step": 6419, "epoch": 152} {"train_loss": -4.437837600708008, "global_step": 6420, "epoch": 152} {"train_loss": -4.726443767547607, "global_step": 6421, "epoch": 152} {"train_loss": -4.874418258666992, "global_step": 6422, "epoch": 152} {"train_loss": -4.5981268882751465, "global_step": 6423, "epoch": 152} {"train_loss": -4.861151695251465, "global_step": 6424, "epoch": 152} {"train_loss": -4.786639667692638, "global_step": 6425, "epoch": 152, "val_loss": 87472.6796875} {"train_loss": -4.718806743621826, "global_step": 6426, "epoch": 153} {"train_loss": -4.911339282989502, "global_step": 6427, "epoch": 153} {"train_loss": -4.7248945236206055, "global_step": 6428, "epoch": 153} {"train_loss": -4.7105913162231445, "global_step": 6429, "epoch": 153} {"train_loss": -4.889647483825684, "global_step": 6430, "epoch": 153} {"train_loss": -4.806064605712891, "global_step": 6431, "epoch": 153} {"train_loss": -4.79749870300293, "global_step": 6432, "epoch": 153} {"train_loss": -4.931880950927734, "global_step": 6433, "epoch": 153} {"train_loss": -4.80867338180542, "global_step": 6434, "epoch": 153} {"train_loss": -4.894458770751953, "global_step": 6435, "epoch": 153} {"train_loss": -4.940263748168945, "global_step": 6436, "epoch": 153} {"train_loss": -4.724386215209961, "global_step": 6437, "epoch": 153} {"train_loss": -4.743812561035156, "global_step": 6438, "epoch": 153} {"train_loss": -4.963677406311035, "global_step": 6439, "epoch": 153} {"train_loss": -4.696028709411621, "global_step": 6440, "epoch": 153} {"train_loss": -4.808852195739746, "global_step": 6441, "epoch": 153} {"train_loss": -4.95046854019165, "global_step": 6442, "epoch": 153} {"train_loss": -4.80683708190918, "global_step": 6443, "epoch": 153} {"train_loss": -4.812208652496338, "global_step": 6444, "epoch": 153} {"train_loss": -4.879082679748535, "global_step": 6445, "epoch": 153} {"train_loss": -4.893521785736084, "global_step": 6446, "epoch": 153} {"train_loss": -4.797200679779053, "global_step": 6447, "epoch": 153} {"train_loss": -4.9607648849487305, "global_step": 6448, "epoch": 153} {"train_loss": -4.827319145202637, "global_step": 6449, "epoch": 153} {"train_loss": -4.961897373199463, "global_step": 6450, "epoch": 153} {"train_loss": -4.863519668579102, "global_step": 6451, "epoch": 153} {"train_loss": -4.787425994873047, "global_step": 6452, "epoch": 153} {"train_loss": -4.892454624176025, "global_step": 6453, "epoch": 153} {"train_loss": -4.975707054138184, "global_step": 6454, "epoch": 153} {"train_loss": -4.906355857849121, "global_step": 6455, "epoch": 153} {"train_loss": -4.761652946472168, "global_step": 6456, "epoch": 153} {"train_loss": -4.846149444580078, "global_step": 6457, "epoch": 153} {"train_loss": -4.765401840209961, "global_step": 6458, "epoch": 153} {"train_loss": -5.030805587768555, "global_step": 6459, "epoch": 153} {"train_loss": -5.056558609008789, "global_step": 6460, "epoch": 153} {"train_loss": -4.7562761306762695, "global_step": 6461, "epoch": 153} {"train_loss": -4.674609184265137, "global_step": 6462, "epoch": 153} {"train_loss": -4.804764270782471, "global_step": 6463, "epoch": 153} {"train_loss": -4.830259799957275, "global_step": 6464, "epoch": 153} {"train_loss": -4.841358184814453, "global_step": 6465, "epoch": 153} {"train_loss": -4.704778671264648, "global_step": 6466, "epoch": 153} {"train_loss": -4.837998810268584, "global_step": 6467, "epoch": 153, "val_loss": 87179.2890625} {"train_loss": -4.802960395812988, "global_step": 6468, "epoch": 154} {"train_loss": -4.751581192016602, "global_step": 6469, "epoch": 154} {"train_loss": -4.568045616149902, "global_step": 6470, "epoch": 154} {"train_loss": -4.736382484436035, "global_step": 6471, "epoch": 154} {"train_loss": -4.80138635635376, "global_step": 6472, "epoch": 154} {"train_loss": -4.8636369705200195, "global_step": 6473, "epoch": 154} {"train_loss": -4.843637466430664, "global_step": 6474, "epoch": 154} {"train_loss": -4.9031829833984375, "global_step": 6475, "epoch": 154} {"train_loss": -4.960674285888672, "global_step": 6476, "epoch": 154} {"train_loss": -4.876692771911621, "global_step": 6477, "epoch": 154} {"train_loss": -4.730158805847168, "global_step": 6478, "epoch": 154} {"train_loss": -4.7337965965271, "global_step": 6479, "epoch": 154} {"train_loss": -4.778369903564453, "global_step": 6480, "epoch": 154} {"train_loss": -4.705246925354004, "global_step": 6481, "epoch": 154} {"train_loss": -4.77225399017334, "global_step": 6482, "epoch": 154} {"train_loss": -4.9382476806640625, "global_step": 6483, "epoch": 154} {"train_loss": -4.960304260253906, "global_step": 6484, "epoch": 154} {"train_loss": -4.847315788269043, "global_step": 6485, "epoch": 154} {"train_loss": -4.907883644104004, "global_step": 6486, "epoch": 154} {"train_loss": -4.87705659866333, "global_step": 6487, "epoch": 154} {"train_loss": -4.799872875213623, "global_step": 6488, "epoch": 154} {"train_loss": -4.809826850891113, "global_step": 6489, "epoch": 154} {"train_loss": -4.950532913208008, "global_step": 6490, "epoch": 154} {"train_loss": -4.734767913818359, "global_step": 6491, "epoch": 154} {"train_loss": -4.818357467651367, "global_step": 6492, "epoch": 154} {"train_loss": -4.896581172943115, "global_step": 6493, "epoch": 154} {"train_loss": -5.031850337982178, "global_step": 6494, "epoch": 154} {"train_loss": -4.808608055114746, "global_step": 6495, "epoch": 154} {"train_loss": -4.8543500900268555, "global_step": 6496, "epoch": 154} {"train_loss": -4.846491813659668, "global_step": 6497, "epoch": 154} {"train_loss": -4.8007121086120605, "global_step": 6498, "epoch": 154} {"train_loss": -4.822685718536377, "global_step": 6499, "epoch": 154} {"train_loss": -5.003798484802246, "global_step": 6500, "epoch": 154} {"train_loss": -4.781564712524414, "global_step": 6501, "epoch": 154} {"train_loss": -4.903701305389404, "global_step": 6502, "epoch": 154} {"train_loss": -4.885076522827148, "global_step": 6503, "epoch": 154} {"train_loss": -4.9450602531433105, "global_step": 6504, "epoch": 154} {"train_loss": -4.810049533843994, "global_step": 6505, "epoch": 154} {"train_loss": -4.5900421142578125, "global_step": 6506, "epoch": 154} {"train_loss": -4.719600677490234, "global_step": 6507, "epoch": 154} {"train_loss": -5.032293796539307, "global_step": 6508, "epoch": 154} {"train_loss": -4.831404708680653, "global_step": 6509, "epoch": 154, "val_loss": 86826.0390625} {"train_loss": -4.668663501739502, "global_step": 6510, "epoch": 155} {"train_loss": -4.808736801147461, "global_step": 6511, "epoch": 155} {"train_loss": -4.732110500335693, "global_step": 6512, "epoch": 155} {"train_loss": -4.761602401733398, "global_step": 6513, "epoch": 155} {"train_loss": -4.934258460998535, "global_step": 6514, "epoch": 155} {"train_loss": -4.636938095092773, "global_step": 6515, "epoch": 155} {"train_loss": -4.801364898681641, "global_step": 6516, "epoch": 155} {"train_loss": -4.712973594665527, "global_step": 6517, "epoch": 155} {"train_loss": -4.760641098022461, "global_step": 6518, "epoch": 155} {"train_loss": -4.836606979370117, "global_step": 6519, "epoch": 155} {"train_loss": -4.7977800369262695, "global_step": 6520, "epoch": 155} {"train_loss": -4.850505352020264, "global_step": 6521, "epoch": 155} {"train_loss": -4.854090690612793, "global_step": 6522, "epoch": 155} {"train_loss": -4.716064453125, "global_step": 6523, "epoch": 155} {"train_loss": -4.889751434326172, "global_step": 6524, "epoch": 155} {"train_loss": -4.8043622970581055, "global_step": 6525, "epoch": 155} {"train_loss": -4.829723358154297, "global_step": 6526, "epoch": 155} {"train_loss": -4.697196006774902, "global_step": 6527, "epoch": 155} {"train_loss": -4.772325038909912, "global_step": 6528, "epoch": 155} {"train_loss": -4.8708415031433105, "global_step": 6529, "epoch": 155} {"train_loss": -4.959986686706543, "global_step": 6530, "epoch": 155} {"train_loss": -4.918421268463135, "global_step": 6531, "epoch": 155} {"train_loss": -4.753944396972656, "global_step": 6532, "epoch": 155} {"train_loss": -4.82234525680542, "global_step": 6533, "epoch": 155} {"train_loss": -4.94287633895874, "global_step": 6534, "epoch": 155} {"train_loss": -4.941338539123535, "global_step": 6535, "epoch": 155} {"train_loss": -4.842201232910156, "global_step": 6536, "epoch": 155} {"train_loss": -4.896804332733154, "global_step": 6537, "epoch": 155} {"train_loss": -4.82515287399292, "global_step": 6538, "epoch": 155} {"train_loss": -4.87584114074707, "global_step": 6539, "epoch": 155} {"train_loss": -4.882695198059082, "global_step": 6540, "epoch": 155} {"train_loss": -4.895532131195068, "global_step": 6541, "epoch": 155} {"train_loss": -4.749607086181641, "global_step": 6542, "epoch": 155} {"train_loss": -4.820165634155273, "global_step": 6543, "epoch": 155} {"train_loss": -4.914442539215088, "global_step": 6544, "epoch": 155} {"train_loss": -4.713517665863037, "global_step": 6545, "epoch": 155} {"train_loss": -4.930373191833496, "global_step": 6546, "epoch": 155} {"train_loss": -4.838993549346924, "global_step": 6547, "epoch": 155} {"train_loss": -4.985420227050781, "global_step": 6548, "epoch": 155} {"train_loss": -4.975945472717285, "global_step": 6549, "epoch": 155} {"train_loss": -4.672545909881592, "global_step": 6550, "epoch": 155} {"train_loss": -4.819831201008388, "global_step": 6551, "epoch": 155, "val_loss": 86336.109375} {"train_loss": -4.659440040588379, "global_step": 6552, "epoch": 156} {"train_loss": -4.561517715454102, "global_step": 6553, "epoch": 156} {"train_loss": -4.884355545043945, "global_step": 6554, "epoch": 156} {"train_loss": -4.870810031890869, "global_step": 6555, "epoch": 156} {"train_loss": -4.664983749389648, "global_step": 6556, "epoch": 156} {"train_loss": -4.798352241516113, "global_step": 6557, "epoch": 156} {"train_loss": -4.860177993774414, "global_step": 6558, "epoch": 156} {"train_loss": -4.843531608581543, "global_step": 6559, "epoch": 156} {"train_loss": -4.672077178955078, "global_step": 6560, "epoch": 156} {"train_loss": -4.846467971801758, "global_step": 6561, "epoch": 156} {"train_loss": -4.837808132171631, "global_step": 6562, "epoch": 156} {"train_loss": -4.829642295837402, "global_step": 6563, "epoch": 156} {"train_loss": -4.8674421310424805, "global_step": 6564, "epoch": 156} {"train_loss": -4.767714977264404, "global_step": 6565, "epoch": 156} {"train_loss": -4.830160140991211, "global_step": 6566, "epoch": 156} {"train_loss": -4.9634809494018555, "global_step": 6567, "epoch": 156} {"train_loss": -4.772668838500977, "global_step": 6568, "epoch": 156} {"train_loss": -4.722598075866699, "global_step": 6569, "epoch": 156} {"train_loss": -4.833653926849365, "global_step": 6570, "epoch": 156} {"train_loss": -4.9016523361206055, "global_step": 6571, "epoch": 156} {"train_loss": -4.936621189117432, "global_step": 6572, "epoch": 156} {"train_loss": -4.604427814483643, "global_step": 6573, "epoch": 156} {"train_loss": -4.8518781661987305, "global_step": 6574, "epoch": 156} {"train_loss": -4.93520975112915, "global_step": 6575, "epoch": 156} {"train_loss": -4.683094024658203, "global_step": 6576, "epoch": 156} {"train_loss": -4.808856010437012, "global_step": 6577, "epoch": 156} {"train_loss": -4.733205795288086, "global_step": 6578, "epoch": 156} {"train_loss": -4.804534912109375, "global_step": 6579, "epoch": 156} {"train_loss": -4.892333984375, "global_step": 6580, "epoch": 156} {"train_loss": -4.8816986083984375, "global_step": 6581, "epoch": 156} {"train_loss": -4.897921562194824, "global_step": 6582, "epoch": 156} {"train_loss": -4.905518054962158, "global_step": 6583, "epoch": 156} {"train_loss": -4.799542427062988, "global_step": 6584, "epoch": 156} {"train_loss": -4.894535064697266, "global_step": 6585, "epoch": 156} {"train_loss": -5.03490686416626, "global_step": 6586, "epoch": 156} {"train_loss": -4.887263298034668, "global_step": 6587, "epoch": 156} {"train_loss": -4.964412212371826, "global_step": 6588, "epoch": 156} {"train_loss": -4.9136857986450195, "global_step": 6589, "epoch": 156} {"train_loss": -4.829311370849609, "global_step": 6590, "epoch": 156} {"train_loss": -5.1343865394592285, "global_step": 6591, "epoch": 156} {"train_loss": -4.817528247833252, "global_step": 6592, "epoch": 156} {"train_loss": -4.835667859940302, "global_step": 6593, "epoch": 156, "val_loss": 86210.640625} {"train_loss": -4.820006370544434, "global_step": 6594, "epoch": 157} {"train_loss": -4.807187557220459, "global_step": 6595, "epoch": 157} {"train_loss": -4.681349754333496, "global_step": 6596, "epoch": 157} {"train_loss": -4.801601409912109, "global_step": 6597, "epoch": 157} {"train_loss": -4.6572065353393555, "global_step": 6598, "epoch": 157} {"train_loss": -4.924079895019531, "global_step": 6599, "epoch": 157} {"train_loss": -4.808411121368408, "global_step": 6600, "epoch": 157} {"train_loss": -4.667792320251465, "global_step": 6601, "epoch": 157} {"train_loss": -4.823721885681152, "global_step": 6602, "epoch": 157} {"train_loss": -4.877475738525391, "global_step": 6603, "epoch": 157} {"train_loss": -4.767474174499512, "global_step": 6604, "epoch": 157} {"train_loss": -4.7934112548828125, "global_step": 6605, "epoch": 157} {"train_loss": -4.894783973693848, "global_step": 6606, "epoch": 157} {"train_loss": -4.7618408203125, "global_step": 6607, "epoch": 157} {"train_loss": -4.822582244873047, "global_step": 6608, "epoch": 157} {"train_loss": -4.867085933685303, "global_step": 6609, "epoch": 157} {"train_loss": -4.8456034660339355, "global_step": 6610, "epoch": 157} {"train_loss": -4.918117046356201, "global_step": 6611, "epoch": 157} {"train_loss": -4.904780387878418, "global_step": 6612, "epoch": 157} {"train_loss": -4.771801948547363, "global_step": 6613, "epoch": 157} {"train_loss": -4.7961835861206055, "global_step": 6614, "epoch": 157} {"train_loss": -4.900860786437988, "global_step": 6615, "epoch": 157} {"train_loss": -4.7657151222229, "global_step": 6616, "epoch": 157} {"train_loss": -4.972661972045898, "global_step": 6617, "epoch": 157} {"train_loss": -4.875389099121094, "global_step": 6618, "epoch": 157} {"train_loss": -4.895669937133789, "global_step": 6619, "epoch": 157} {"train_loss": -5.006678581237793, "global_step": 6620, "epoch": 157} {"train_loss": -4.895078182220459, "global_step": 6621, "epoch": 157} {"train_loss": -4.9657511711120605, "global_step": 6622, "epoch": 157} {"train_loss": -4.87528133392334, "global_step": 6623, "epoch": 157} {"train_loss": -4.884572982788086, "global_step": 6624, "epoch": 157} {"train_loss": -4.795804977416992, "global_step": 6625, "epoch": 157} {"train_loss": -4.891904830932617, "global_step": 6626, "epoch": 157} {"train_loss": -4.893425464630127, "global_step": 6627, "epoch": 157} {"train_loss": -4.908102512359619, "global_step": 6628, "epoch": 157} {"train_loss": -5.028660774230957, "global_step": 6629, "epoch": 157} {"train_loss": -4.707027435302734, "global_step": 6630, "epoch": 157} {"train_loss": -4.821962833404541, "global_step": 6631, "epoch": 157} {"train_loss": -4.570448875427246, "global_step": 6632, "epoch": 157} {"train_loss": -4.73544454574585, "global_step": 6633, "epoch": 157} {"train_loss": -4.840322494506836, "global_step": 6634, "epoch": 157} {"train_loss": -4.829318977537609, "global_step": 6635, "epoch": 157, "val_loss": 89209.1875} {"train_loss": -4.569549560546875, "global_step": 6636, "epoch": 158} {"train_loss": -4.6896820068359375, "global_step": 6637, "epoch": 158} {"train_loss": -4.685721397399902, "global_step": 6638, "epoch": 158} {"train_loss": -4.523655891418457, "global_step": 6639, "epoch": 158} {"train_loss": -4.575963020324707, "global_step": 6640, "epoch": 158} {"train_loss": -4.78900146484375, "global_step": 6641, "epoch": 158} {"train_loss": -4.783830642700195, "global_step": 6642, "epoch": 158} {"train_loss": -4.783728122711182, "global_step": 6643, "epoch": 158} {"train_loss": -4.860355854034424, "global_step": 6644, "epoch": 158} {"train_loss": -4.686762809753418, "global_step": 6645, "epoch": 158} {"train_loss": -4.7464599609375, "global_step": 6646, "epoch": 158} {"train_loss": -4.590769290924072, "global_step": 6647, "epoch": 158} {"train_loss": -4.8794755935668945, "global_step": 6648, "epoch": 158} {"train_loss": -4.869601249694824, "global_step": 6649, "epoch": 158} {"train_loss": -4.620948791503906, "global_step": 6650, "epoch": 158} {"train_loss": -4.705571174621582, "global_step": 6651, "epoch": 158} {"train_loss": -4.620577812194824, "global_step": 6652, "epoch": 158} {"train_loss": -4.680974960327148, "global_step": 6653, "epoch": 158} {"train_loss": -4.586341857910156, "global_step": 6654, "epoch": 158} {"train_loss": -4.704614639282227, "global_step": 6655, "epoch": 158} {"train_loss": -4.620083808898926, "global_step": 6656, "epoch": 158} {"train_loss": -4.888522624969482, "global_step": 6657, "epoch": 158} {"train_loss": -4.688222885131836, "global_step": 6658, "epoch": 158} {"train_loss": -4.858499050140381, "global_step": 6659, "epoch": 158} {"train_loss": -4.739912986755371, "global_step": 6660, "epoch": 158} {"train_loss": -4.9598917961120605, "global_step": 6661, "epoch": 158} {"train_loss": -4.650855541229248, "global_step": 6662, "epoch": 158} {"train_loss": -4.877449989318848, "global_step": 6663, "epoch": 158} {"train_loss": -4.962444305419922, "global_step": 6664, "epoch": 158} {"train_loss": -4.863941669464111, "global_step": 6665, "epoch": 158} {"train_loss": -4.969478607177734, "global_step": 6666, "epoch": 158} {"train_loss": -4.713115692138672, "global_step": 6667, "epoch": 158} {"train_loss": -4.943469524383545, "global_step": 6668, "epoch": 158} {"train_loss": -4.691614627838135, "global_step": 6669, "epoch": 158} {"train_loss": -4.877823829650879, "global_step": 6670, "epoch": 158} {"train_loss": -4.79349422454834, "global_step": 6671, "epoch": 158} {"train_loss": -4.850942134857178, "global_step": 6672, "epoch": 158} {"train_loss": -5.010626792907715, "global_step": 6673, "epoch": 158} {"train_loss": -4.748615741729736, "global_step": 6674, "epoch": 158} {"train_loss": -4.8246750831604, "global_step": 6675, "epoch": 158} {"train_loss": -4.990420341491699, "global_step": 6676, "epoch": 158} {"train_loss": -4.772367829368228, "global_step": 6677, "epoch": 158, "val_loss": 85821.7734375} {"train_loss": -4.917420387268066, "global_step": 6678, "epoch": 159} {"train_loss": -4.8652119636535645, "global_step": 6679, "epoch": 159} {"train_loss": -4.972316741943359, "global_step": 6680, "epoch": 159} {"train_loss": -5.030209541320801, "global_step": 6681, "epoch": 159} {"train_loss": -4.927366256713867, "global_step": 6682, "epoch": 159} {"train_loss": -4.769007205963135, "global_step": 6683, "epoch": 159} {"train_loss": -4.949614524841309, "global_step": 6684, "epoch": 159} {"train_loss": -5.011136054992676, "global_step": 6685, "epoch": 159} {"train_loss": -4.925225257873535, "global_step": 6686, "epoch": 159} {"train_loss": -4.860640525817871, "global_step": 6687, "epoch": 159} {"train_loss": -4.7336626052856445, "global_step": 6688, "epoch": 159} {"train_loss": -4.807058334350586, "global_step": 6689, "epoch": 159} {"train_loss": -4.862207889556885, "global_step": 6690, "epoch": 159} {"train_loss": -4.717865467071533, "global_step": 6691, "epoch": 159} {"train_loss": -4.758711338043213, "global_step": 6692, "epoch": 159} {"train_loss": -4.862971305847168, "global_step": 6693, "epoch": 159} {"train_loss": -4.773609638214111, "global_step": 6694, "epoch": 159} {"train_loss": -4.800467491149902, "global_step": 6695, "epoch": 159} {"train_loss": -4.869497299194336, "global_step": 6696, "epoch": 159} {"train_loss": -4.78240966796875, "global_step": 6697, "epoch": 159} {"train_loss": -4.6696367263793945, "global_step": 6698, "epoch": 159} {"train_loss": -4.7663421630859375, "global_step": 6699, "epoch": 159} {"train_loss": -4.866697788238525, "global_step": 6700, "epoch": 159} {"train_loss": -4.679340362548828, "global_step": 6701, "epoch": 159} {"train_loss": -4.819082260131836, "global_step": 6702, "epoch": 159} {"train_loss": -4.657999038696289, "global_step": 6703, "epoch": 159} {"train_loss": -4.78256893157959, "global_step": 6704, "epoch": 159} {"train_loss": -4.830665111541748, "global_step": 6705, "epoch": 159} {"train_loss": -4.710989952087402, "global_step": 6706, "epoch": 159} {"train_loss": -4.753489971160889, "global_step": 6707, "epoch": 159} {"train_loss": -4.867050647735596, "global_step": 6708, "epoch": 159} {"train_loss": -4.847460746765137, "global_step": 6709, "epoch": 159} {"train_loss": -4.641921043395996, "global_step": 6710, "epoch": 159} {"train_loss": -4.761445999145508, "global_step": 6711, "epoch": 159} {"train_loss": -5.1091718673706055, "global_step": 6712, "epoch": 159} {"train_loss": -4.699954032897949, "global_step": 6713, "epoch": 159} {"train_loss": -4.594027519226074, "global_step": 6714, "epoch": 159} {"train_loss": -4.707309246063232, "global_step": 6715, "epoch": 159} {"train_loss": -4.862538814544678, "global_step": 6716, "epoch": 159} {"train_loss": -4.847362518310547, "global_step": 6717, "epoch": 159} {"train_loss": -4.65680456161499, "global_step": 6718, "epoch": 159} {"train_loss": -4.81315187045506, "global_step": 6719, "epoch": 159, "val_loss": 85430.7578125} {"train_loss": -4.691525459289551, "global_step": 6720, "epoch": 160} {"train_loss": -4.874294281005859, "global_step": 6721, "epoch": 160} {"train_loss": -4.919955253601074, "global_step": 6722, "epoch": 160} {"train_loss": -4.679523468017578, "global_step": 6723, "epoch": 160} {"train_loss": -4.738335132598877, "global_step": 6724, "epoch": 160} {"train_loss": -4.806633949279785, "global_step": 6725, "epoch": 160} {"train_loss": -4.767629623413086, "global_step": 6726, "epoch": 160} {"train_loss": -4.859264373779297, "global_step": 6727, "epoch": 160} {"train_loss": -4.898104667663574, "global_step": 6728, "epoch": 160} {"train_loss": -4.779542922973633, "global_step": 6729, "epoch": 160} {"train_loss": -4.880786895751953, "global_step": 6730, "epoch": 160} {"train_loss": -4.943035125732422, "global_step": 6731, "epoch": 160} {"train_loss": -4.687929153442383, "global_step": 6732, "epoch": 160} {"train_loss": -4.87507438659668, "global_step": 6733, "epoch": 160} {"train_loss": -4.675936222076416, "global_step": 6734, "epoch": 160} {"train_loss": -4.824069976806641, "global_step": 6735, "epoch": 160} {"train_loss": -4.933957099914551, "global_step": 6736, "epoch": 160} {"train_loss": -4.851411819458008, "global_step": 6737, "epoch": 160} {"train_loss": -4.775816440582275, "global_step": 6738, "epoch": 160} {"train_loss": -4.941839218139648, "global_step": 6739, "epoch": 160} {"train_loss": -4.918240070343018, "global_step": 6740, "epoch": 160} {"train_loss": -4.914393424987793, "global_step": 6741, "epoch": 160} {"train_loss": -4.904501914978027, "global_step": 6742, "epoch": 160} {"train_loss": -4.889217376708984, "global_step": 6743, "epoch": 160} {"train_loss": -4.708481788635254, "global_step": 6744, "epoch": 160} {"train_loss": -4.907318115234375, "global_step": 6745, "epoch": 160} {"train_loss": -4.864415168762207, "global_step": 6746, "epoch": 160} {"train_loss": -4.739048004150391, "global_step": 6747, "epoch": 160} {"train_loss": -4.989804267883301, "global_step": 6748, "epoch": 160} {"train_loss": -4.773519992828369, "global_step": 6749, "epoch": 160} {"train_loss": -4.917177200317383, "global_step": 6750, "epoch": 160} {"train_loss": -4.942241668701172, "global_step": 6751, "epoch": 160} {"train_loss": -4.751509189605713, "global_step": 6752, "epoch": 160} {"train_loss": -4.924901962280273, "global_step": 6753, "epoch": 160} {"train_loss": -4.833920955657959, "global_step": 6754, "epoch": 160} {"train_loss": -4.840219974517822, "global_step": 6755, "epoch": 160} {"train_loss": -4.915438652038574, "global_step": 6756, "epoch": 160} {"train_loss": -4.887202262878418, "global_step": 6757, "epoch": 160} {"train_loss": -4.818962097167969, "global_step": 6758, "epoch": 160} {"train_loss": -4.837906837463379, "global_step": 6759, "epoch": 160} {"train_loss": -4.877058029174805, "global_step": 6760, "epoch": 160} {"train_loss": -4.84371755236671, "global_step": 6761, "epoch": 160, "val_loss": 85891.3984375} {"train_loss": -5.002114295959473, "global_step": 6762, "epoch": 161} {"train_loss": -4.812837600708008, "global_step": 6763, "epoch": 161} {"train_loss": -4.6153950691223145, "global_step": 6764, "epoch": 161} {"train_loss": -4.882665634155273, "global_step": 6765, "epoch": 161} {"train_loss": -4.902441024780273, "global_step": 6766, "epoch": 161} {"train_loss": -4.962636470794678, "global_step": 6767, "epoch": 161} {"train_loss": -5.117886543273926, "global_step": 6768, "epoch": 161} {"train_loss": -4.675985813140869, "global_step": 6769, "epoch": 161} {"train_loss": -4.86919641494751, "global_step": 6770, "epoch": 161} {"train_loss": -4.978639125823975, "global_step": 6771, "epoch": 161} {"train_loss": -4.723803520202637, "global_step": 6772, "epoch": 161} {"train_loss": -4.936573028564453, "global_step": 6773, "epoch": 161} {"train_loss": -4.823675155639648, "global_step": 6774, "epoch": 161} {"train_loss": -4.866974830627441, "global_step": 6775, "epoch": 161} {"train_loss": -4.840085983276367, "global_step": 6776, "epoch": 161} {"train_loss": -4.867796897888184, "global_step": 6777, "epoch": 161} {"train_loss": -4.900743007659912, "global_step": 6778, "epoch": 161} {"train_loss": -4.933412551879883, "global_step": 6779, "epoch": 161} {"train_loss": -4.951300621032715, "global_step": 6780, "epoch": 161} {"train_loss": -4.866819381713867, "global_step": 6781, "epoch": 161} {"train_loss": -4.750303268432617, "global_step": 6782, "epoch": 161} {"train_loss": -4.7386932373046875, "global_step": 6783, "epoch": 161} {"train_loss": -4.977949142456055, "global_step": 6784, "epoch": 161} {"train_loss": -4.994955062866211, "global_step": 6785, "epoch": 161} {"train_loss": -4.793830871582031, "global_step": 6786, "epoch": 161} {"train_loss": -4.966118335723877, "global_step": 6787, "epoch": 161} {"train_loss": -4.845117568969727, "global_step": 6788, "epoch": 161} {"train_loss": -5.006488800048828, "global_step": 6789, "epoch": 161} {"train_loss": -5.005047798156738, "global_step": 6790, "epoch": 161} {"train_loss": -4.9740447998046875, "global_step": 6791, "epoch": 161} {"train_loss": -4.865522384643555, "global_step": 6792, "epoch": 161} {"train_loss": -4.810545921325684, "global_step": 6793, "epoch": 161} {"train_loss": -4.883652210235596, "global_step": 6794, "epoch": 161} {"train_loss": -4.917726993560791, "global_step": 6795, "epoch": 161} {"train_loss": -4.904263496398926, "global_step": 6796, "epoch": 161} {"train_loss": -4.973667621612549, "global_step": 6797, "epoch": 161} {"train_loss": -4.918830394744873, "global_step": 6798, "epoch": 161} {"train_loss": -4.813148021697998, "global_step": 6799, "epoch": 161} {"train_loss": -4.960259437561035, "global_step": 6800, "epoch": 161} {"train_loss": -4.872218132019043, "global_step": 6801, "epoch": 161} {"train_loss": -4.916936874389648, "global_step": 6802, "epoch": 161} {"train_loss": -4.886406705493019, "global_step": 6803, "epoch": 161, "val_loss": 86203.0} {"train_loss": -4.87351655960083, "global_step": 6804, "epoch": 162} {"train_loss": -4.799424648284912, "global_step": 6805, "epoch": 162} {"train_loss": -4.92311954498291, "global_step": 6806, "epoch": 162} {"train_loss": -5.100743293762207, "global_step": 6807, "epoch": 162} {"train_loss": -4.956952095031738, "global_step": 6808, "epoch": 162} {"train_loss": -4.779467582702637, "global_step": 6809, "epoch": 162} {"train_loss": -4.786591053009033, "global_step": 6810, "epoch": 162} {"train_loss": -4.862803936004639, "global_step": 6811, "epoch": 162} {"train_loss": -4.95496940612793, "global_step": 6812, "epoch": 162} {"train_loss": -4.870289325714111, "global_step": 6813, "epoch": 162} {"train_loss": -4.867326736450195, "global_step": 6814, "epoch": 162} {"train_loss": -4.8818864822387695, "global_step": 6815, "epoch": 162} {"train_loss": -4.868677616119385, "global_step": 6816, "epoch": 162} {"train_loss": -4.787128448486328, "global_step": 6817, "epoch": 162} {"train_loss": -4.957143306732178, "global_step": 6818, "epoch": 162} {"train_loss": -4.897115230560303, "global_step": 6819, "epoch": 162} {"train_loss": -4.844850540161133, "global_step": 6820, "epoch": 162} {"train_loss": -4.838467597961426, "global_step": 6821, "epoch": 162} {"train_loss": -4.981629371643066, "global_step": 6822, "epoch": 162} {"train_loss": -4.7571001052856445, "global_step": 6823, "epoch": 162} {"train_loss": -4.779130935668945, "global_step": 6824, "epoch": 162} {"train_loss": -4.699728012084961, "global_step": 6825, "epoch": 162} {"train_loss": -4.9148054122924805, "global_step": 6826, "epoch": 162} {"train_loss": -4.943218231201172, "global_step": 6827, "epoch": 162} {"train_loss": -4.985714435577393, "global_step": 6828, "epoch": 162} {"train_loss": -4.935606956481934, "global_step": 6829, "epoch": 162} {"train_loss": -4.699767112731934, "global_step": 6830, "epoch": 162} {"train_loss": -4.854501724243164, "global_step": 6831, "epoch": 162} {"train_loss": -4.847048759460449, "global_step": 6832, "epoch": 162} {"train_loss": -4.832439422607422, "global_step": 6833, "epoch": 162} {"train_loss": -4.958756446838379, "global_step": 6834, "epoch": 162} {"train_loss": -4.846851348876953, "global_step": 6835, "epoch": 162} {"train_loss": -4.875175952911377, "global_step": 6836, "epoch": 162} {"train_loss": -4.856878280639648, "global_step": 6837, "epoch": 162} {"train_loss": -4.897875785827637, "global_step": 6838, "epoch": 162} {"train_loss": -4.9326629638671875, "global_step": 6839, "epoch": 162} {"train_loss": -4.768203258514404, "global_step": 6840, "epoch": 162} {"train_loss": -4.939994812011719, "global_step": 6841, "epoch": 162} {"train_loss": -4.940707206726074, "global_step": 6842, "epoch": 162} {"train_loss": -4.84854793548584, "global_step": 6843, "epoch": 162} {"train_loss": -4.990189552307129, "global_step": 6844, "epoch": 162} {"train_loss": -4.877150512876964, "global_step": 6845, "epoch": 162, "val_loss": 85694.0625} {"train_loss": -4.9711995124816895, "global_step": 6846, "epoch": 163} {"train_loss": -4.852825164794922, "global_step": 6847, "epoch": 163} {"train_loss": -4.801629066467285, "global_step": 6848, "epoch": 163} {"train_loss": -4.922503471374512, "global_step": 6849, "epoch": 163} {"train_loss": -4.985732078552246, "global_step": 6850, "epoch": 163} {"train_loss": -4.8994598388671875, "global_step": 6851, "epoch": 163} {"train_loss": -4.994808197021484, "global_step": 6852, "epoch": 163} {"train_loss": -4.943110466003418, "global_step": 6853, "epoch": 163} {"train_loss": -4.907397270202637, "global_step": 6854, "epoch": 163} {"train_loss": -4.927669048309326, "global_step": 6855, "epoch": 163} {"train_loss": -5.021031856536865, "global_step": 6856, "epoch": 163} {"train_loss": -4.860132217407227, "global_step": 6857, "epoch": 163} {"train_loss": -4.675592422485352, "global_step": 6858, "epoch": 163} {"train_loss": -4.794230937957764, "global_step": 6859, "epoch": 163} {"train_loss": -4.96579647064209, "global_step": 6860, "epoch": 163} {"train_loss": -4.404449939727783, "global_step": 6861, "epoch": 163} {"train_loss": -4.6929779052734375, "global_step": 6862, "epoch": 163} {"train_loss": -4.634400367736816, "global_step": 6863, "epoch": 163} {"train_loss": -4.473154067993164, "global_step": 6864, "epoch": 163} {"train_loss": -4.48452091217041, "global_step": 6865, "epoch": 163} {"train_loss": -3.9737634658813477, "global_step": 6866, "epoch": 163} {"train_loss": -4.423031806945801, "global_step": 6867, "epoch": 163} {"train_loss": -4.6425089836120605, "global_step": 6868, "epoch": 163} {"train_loss": -4.778190612792969, "global_step": 6869, "epoch": 163} {"train_loss": -4.721136093139648, "global_step": 6870, "epoch": 163} {"train_loss": -4.562347888946533, "global_step": 6871, "epoch": 163} {"train_loss": -4.630336761474609, "global_step": 6872, "epoch": 163} {"train_loss": -4.627321243286133, "global_step": 6873, "epoch": 163} {"train_loss": -4.730749130249023, "global_step": 6874, "epoch": 163} {"train_loss": -4.839661598205566, "global_step": 6875, "epoch": 163} {"train_loss": -4.749258995056152, "global_step": 6876, "epoch": 163} {"train_loss": -4.726449012756348, "global_step": 6877, "epoch": 163} {"train_loss": -4.785146236419678, "global_step": 6878, "epoch": 163} {"train_loss": -4.747230529785156, "global_step": 6879, "epoch": 163} {"train_loss": -4.816524028778076, "global_step": 6880, "epoch": 163} {"train_loss": -4.782304286956787, "global_step": 6881, "epoch": 163} {"train_loss": -4.9051127433776855, "global_step": 6882, "epoch": 163} {"train_loss": -4.772905349731445, "global_step": 6883, "epoch": 163} {"train_loss": -4.80573844909668, "global_step": 6884, "epoch": 163} {"train_loss": -4.827917098999023, "global_step": 6885, "epoch": 163} {"train_loss": -4.864127159118652, "global_step": 6886, "epoch": 163} {"train_loss": -4.7573559284210205, "global_step": 6887, "epoch": 163, "val_loss": 86620.2734375} {"train_loss": -4.754450798034668, "global_step": 6888, "epoch": 164} {"train_loss": -4.806351661682129, "global_step": 6889, "epoch": 164} {"train_loss": -4.9822187423706055, "global_step": 6890, "epoch": 164} {"train_loss": -4.855445384979248, "global_step": 6891, "epoch": 164} {"train_loss": -4.83843994140625, "global_step": 6892, "epoch": 164} {"train_loss": -4.962167263031006, "global_step": 6893, "epoch": 164} {"train_loss": -4.6706743240356445, "global_step": 6894, "epoch": 164} {"train_loss": -4.8110761642456055, "global_step": 6895, "epoch": 164} {"train_loss": -4.917623519897461, "global_step": 6896, "epoch": 164} {"train_loss": -4.913419723510742, "global_step": 6897, "epoch": 164} {"train_loss": -4.875702857971191, "global_step": 6898, "epoch": 164} {"train_loss": -4.954434394836426, "global_step": 6899, "epoch": 164} {"train_loss": -4.906350135803223, "global_step": 6900, "epoch": 164} {"train_loss": -4.920499801635742, "global_step": 6901, "epoch": 164} {"train_loss": -4.692391872406006, "global_step": 6902, "epoch": 164} {"train_loss": -5.061018943786621, "global_step": 6903, "epoch": 164} {"train_loss": -4.789980411529541, "global_step": 6904, "epoch": 164} {"train_loss": -4.9724321365356445, "global_step": 6905, "epoch": 164} {"train_loss": -5.02068567276001, "global_step": 6906, "epoch": 164} {"train_loss": -4.798705101013184, "global_step": 6907, "epoch": 164} {"train_loss": -4.922994136810303, "global_step": 6908, "epoch": 164} {"train_loss": -4.924907684326172, "global_step": 6909, "epoch": 164} {"train_loss": -4.718835353851318, "global_step": 6910, "epoch": 164} {"train_loss": -4.762042045593262, "global_step": 6911, "epoch": 164} {"train_loss": -4.792304992675781, "global_step": 6912, "epoch": 164} {"train_loss": -4.893638610839844, "global_step": 6913, "epoch": 164} {"train_loss": -4.804359436035156, "global_step": 6914, "epoch": 164} {"train_loss": -4.698668956756592, "global_step": 6915, "epoch": 164} {"train_loss": -4.835709095001221, "global_step": 6916, "epoch": 164} {"train_loss": -4.934183120727539, "global_step": 6917, "epoch": 164} {"train_loss": -4.846775054931641, "global_step": 6918, "epoch": 164} {"train_loss": -4.803539276123047, "global_step": 6919, "epoch": 164} {"train_loss": -4.818378448486328, "global_step": 6920, "epoch": 164} {"train_loss": -4.89013671875, "global_step": 6921, "epoch": 164} {"train_loss": -4.782881259918213, "global_step": 6922, "epoch": 164} {"train_loss": -4.845123291015625, "global_step": 6923, "epoch": 164} {"train_loss": -4.813051700592041, "global_step": 6924, "epoch": 164} {"train_loss": -4.672295570373535, "global_step": 6925, "epoch": 164} {"train_loss": -4.716732025146484, "global_step": 6926, "epoch": 164} {"train_loss": -4.709016799926758, "global_step": 6927, "epoch": 164} {"train_loss": -4.788860321044922, "global_step": 6928, "epoch": 164} {"train_loss": -4.839897223881313, "global_step": 6929, "epoch": 164, "val_loss": 85664.0390625} {"train_loss": -4.836277484893799, "global_step": 6930, "epoch": 165} {"train_loss": -4.768575191497803, "global_step": 6931, "epoch": 165} {"train_loss": -4.662389755249023, "global_step": 6932, "epoch": 165} {"train_loss": -4.800800323486328, "global_step": 6933, "epoch": 165} {"train_loss": -4.742269992828369, "global_step": 6934, "epoch": 165} {"train_loss": -4.660245418548584, "global_step": 6935, "epoch": 165} {"train_loss": -4.809850692749023, "global_step": 6936, "epoch": 165} {"train_loss": -4.668878078460693, "global_step": 6937, "epoch": 165} {"train_loss": -4.726532459259033, "global_step": 6938, "epoch": 165} {"train_loss": -4.864673614501953, "global_step": 6939, "epoch": 165} {"train_loss": -4.954676628112793, "global_step": 6940, "epoch": 165} {"train_loss": -4.833267688751221, "global_step": 6941, "epoch": 165} {"train_loss": -4.960566997528076, "global_step": 6942, "epoch": 165} {"train_loss": -4.856836795806885, "global_step": 6943, "epoch": 165} {"train_loss": -4.788278579711914, "global_step": 6944, "epoch": 165} {"train_loss": -4.933222770690918, "global_step": 6945, "epoch": 165} {"train_loss": -4.858004570007324, "global_step": 6946, "epoch": 165} {"train_loss": -4.858156204223633, "global_step": 6947, "epoch": 165} {"train_loss": -4.875418663024902, "global_step": 6948, "epoch": 165} {"train_loss": -4.934327602386475, "global_step": 6949, "epoch": 165} {"train_loss": -4.929836273193359, "global_step": 6950, "epoch": 165} {"train_loss": -4.783302307128906, "global_step": 6951, "epoch": 165} {"train_loss": -4.811960220336914, "global_step": 6952, "epoch": 165} {"train_loss": -4.9084248542785645, "global_step": 6953, "epoch": 165} {"train_loss": -5.007711410522461, "global_step": 6954, "epoch": 165} {"train_loss": -4.821430206298828, "global_step": 6955, "epoch": 165} {"train_loss": -4.850550651550293, "global_step": 6956, "epoch": 165} {"train_loss": -4.8942551612854, "global_step": 6957, "epoch": 165} {"train_loss": -4.950717926025391, "global_step": 6958, "epoch": 165} {"train_loss": -4.8944196701049805, "global_step": 6959, "epoch": 165} {"train_loss": -4.918584823608398, "global_step": 6960, "epoch": 165} {"train_loss": -4.946642875671387, "global_step": 6961, "epoch": 165} {"train_loss": -4.8654279708862305, "global_step": 6962, "epoch": 165} {"train_loss": -4.936112403869629, "global_step": 6963, "epoch": 165} {"train_loss": -4.963030815124512, "global_step": 6964, "epoch": 165} {"train_loss": -4.9295148849487305, "global_step": 6965, "epoch": 165} {"train_loss": -4.885066986083984, "global_step": 6966, "epoch": 165} {"train_loss": -4.869579315185547, "global_step": 6967, "epoch": 165} {"train_loss": -4.928705215454102, "global_step": 6968, "epoch": 165} {"train_loss": -4.967825889587402, "global_step": 6969, "epoch": 165} {"train_loss": -4.930327415466309, "global_step": 6970, "epoch": 165} {"train_loss": -4.863826501937139, "global_step": 6971, "epoch": 165, "val_loss": 85129.6796875} {"train_loss": -4.931728839874268, "global_step": 6972, "epoch": 166} {"train_loss": -4.871108055114746, "global_step": 6973, "epoch": 166} {"train_loss": -4.9779815673828125, "global_step": 6974, "epoch": 166} {"train_loss": -4.904483795166016, "global_step": 6975, "epoch": 166} {"train_loss": -4.892189979553223, "global_step": 6976, "epoch": 166} {"train_loss": -4.9401960372924805, "global_step": 6977, "epoch": 166} {"train_loss": -4.876920700073242, "global_step": 6978, "epoch": 166} {"train_loss": -4.750705718994141, "global_step": 6979, "epoch": 166} {"train_loss": -4.680659770965576, "global_step": 6980, "epoch": 166} {"train_loss": -4.908276557922363, "global_step": 6981, "epoch": 166} {"train_loss": -5.000527381896973, "global_step": 6982, "epoch": 166} {"train_loss": -4.808612823486328, "global_step": 6983, "epoch": 166} {"train_loss": -4.978150844573975, "global_step": 6984, "epoch": 166} {"train_loss": -4.992972373962402, "global_step": 6985, "epoch": 166} {"train_loss": -4.942240238189697, "global_step": 6986, "epoch": 166} {"train_loss": -4.736713409423828, "global_step": 6987, "epoch": 166} {"train_loss": -4.718712329864502, "global_step": 6988, "epoch": 166} {"train_loss": -4.891575813293457, "global_step": 6989, "epoch": 166} {"train_loss": -4.85008430480957, "global_step": 6990, "epoch": 166} {"train_loss": -4.86932373046875, "global_step": 6991, "epoch": 166} {"train_loss": -4.598196983337402, "global_step": 6992, "epoch": 166} {"train_loss": -4.777444362640381, "global_step": 6993, "epoch": 166} {"train_loss": -4.530308723449707, "global_step": 6994, "epoch": 166} {"train_loss": -4.552882194519043, "global_step": 6995, "epoch": 166} {"train_loss": -4.458294868469238, "global_step": 6996, "epoch": 166} {"train_loss": -4.436553955078125, "global_step": 6997, "epoch": 166} {"train_loss": -4.635441780090332, "global_step": 6998, "epoch": 166} {"train_loss": -4.72774600982666, "global_step": 6999, "epoch": 166} {"train_loss": -4.560788154602051, "global_step": 7000, "epoch": 166} {"train_loss": -4.698579788208008, "global_step": 7001, "epoch": 166} {"train_loss": -4.427964210510254, "global_step": 7002, "epoch": 166} {"train_loss": -4.754480361938477, "global_step": 7003, "epoch": 166} {"train_loss": -4.608950614929199, "global_step": 7004, "epoch": 166} {"train_loss": -4.811832904815674, "global_step": 7005, "epoch": 166} {"train_loss": -4.805947303771973, "global_step": 7006, "epoch": 166} {"train_loss": -4.766054153442383, "global_step": 7007, "epoch": 166} {"train_loss": -4.848079681396484, "global_step": 7008, "epoch": 166} {"train_loss": -4.721857070922852, "global_step": 7009, "epoch": 166} {"train_loss": -4.912508964538574, "global_step": 7010, "epoch": 166} {"train_loss": -4.773536682128906, "global_step": 7011, "epoch": 166} {"train_loss": -4.947080612182617, "global_step": 7012, "epoch": 166} {"train_loss": -4.777531748726254, "global_step": 7013, "epoch": 166, "val_loss": 85130.375} {"train_loss": -4.882803916931152, "global_step": 7014, "epoch": 167} {"train_loss": -4.913633346557617, "global_step": 7015, "epoch": 167} {"train_loss": -4.7926459312438965, "global_step": 7016, "epoch": 167} {"train_loss": -4.759220123291016, "global_step": 7017, "epoch": 167} {"train_loss": -4.825961112976074, "global_step": 7018, "epoch": 167} {"train_loss": -4.831355571746826, "global_step": 7019, "epoch": 167} {"train_loss": -4.841473579406738, "global_step": 7020, "epoch": 167} {"train_loss": -4.767515182495117, "global_step": 7021, "epoch": 167} {"train_loss": -4.982298851013184, "global_step": 7022, "epoch": 167} {"train_loss": -4.928344249725342, "global_step": 7023, "epoch": 167} {"train_loss": -4.945582389831543, "global_step": 7024, "epoch": 167} {"train_loss": -4.917714595794678, "global_step": 7025, "epoch": 167} {"train_loss": -4.773008346557617, "global_step": 7026, "epoch": 167} {"train_loss": -4.912165641784668, "global_step": 7027, "epoch": 167} {"train_loss": -4.898444175720215, "global_step": 7028, "epoch": 167} {"train_loss": -4.898554801940918, "global_step": 7029, "epoch": 167} {"train_loss": -4.870199203491211, "global_step": 7030, "epoch": 167} {"train_loss": -4.949680328369141, "global_step": 7031, "epoch": 167} {"train_loss": -4.809149742126465, "global_step": 7032, "epoch": 167} {"train_loss": -5.06167459487915, "global_step": 7033, "epoch": 167} {"train_loss": -4.886094570159912, "global_step": 7034, "epoch": 167} {"train_loss": -5.002328872680664, "global_step": 7035, "epoch": 167} {"train_loss": -4.789443016052246, "global_step": 7036, "epoch": 167} {"train_loss": -4.833563327789307, "global_step": 7037, "epoch": 167} {"train_loss": -4.957220077514648, "global_step": 7038, "epoch": 167} {"train_loss": -4.773813247680664, "global_step": 7039, "epoch": 167} {"train_loss": -4.934177398681641, "global_step": 7040, "epoch": 167} {"train_loss": -4.914834976196289, "global_step": 7041, "epoch": 167} {"train_loss": -4.849331378936768, "global_step": 7042, "epoch": 167} {"train_loss": -4.778183460235596, "global_step": 7043, "epoch": 167} {"train_loss": -4.934332847595215, "global_step": 7044, "epoch": 167} {"train_loss": -5.0075154304504395, "global_step": 7045, "epoch": 167} {"train_loss": -4.960050582885742, "global_step": 7046, "epoch": 167} {"train_loss": -4.9830474853515625, "global_step": 7047, "epoch": 167} {"train_loss": -5.067492485046387, "global_step": 7048, "epoch": 167} {"train_loss": -4.797374725341797, "global_step": 7049, "epoch": 167} {"train_loss": -4.9085774421691895, "global_step": 7050, "epoch": 167} {"train_loss": -4.844714164733887, "global_step": 7051, "epoch": 167} {"train_loss": -4.848816871643066, "global_step": 7052, "epoch": 167} {"train_loss": -5.084198951721191, "global_step": 7053, "epoch": 167} {"train_loss": -5.093038558959961, "global_step": 7054, "epoch": 167} {"train_loss": -4.899848313558669, "global_step": 7055, "epoch": 167, "val_loss": 85407.125} {"train_loss": -4.8590989112854, "global_step": 7056, "epoch": 168} {"train_loss": -4.8715500831604, "global_step": 7057, "epoch": 168} {"train_loss": -4.915825366973877, "global_step": 7058, "epoch": 168} {"train_loss": -4.792169570922852, "global_step": 7059, "epoch": 168} {"train_loss": -4.855495929718018, "global_step": 7060, "epoch": 168} {"train_loss": -4.905981063842773, "global_step": 7061, "epoch": 168} {"train_loss": -5.068413257598877, "global_step": 7062, "epoch": 168} {"train_loss": -4.895572662353516, "global_step": 7063, "epoch": 168} {"train_loss": -4.909961700439453, "global_step": 7064, "epoch": 168} {"train_loss": -4.936513423919678, "global_step": 7065, "epoch": 168} {"train_loss": -4.9554123878479, "global_step": 7066, "epoch": 168} {"train_loss": -4.706683158874512, "global_step": 7067, "epoch": 168} {"train_loss": -4.624930381774902, "global_step": 7068, "epoch": 168} {"train_loss": -4.914114475250244, "global_step": 7069, "epoch": 168} {"train_loss": -4.910956382751465, "global_step": 7070, "epoch": 168} {"train_loss": -4.7221479415893555, "global_step": 7071, "epoch": 168} {"train_loss": -4.74086856842041, "global_step": 7072, "epoch": 168} {"train_loss": -4.844488143920898, "global_step": 7073, "epoch": 168} {"train_loss": -4.807302474975586, "global_step": 7074, "epoch": 168} {"train_loss": -4.799891948699951, "global_step": 7075, "epoch": 168} {"train_loss": -4.7381157875061035, "global_step": 7076, "epoch": 168} {"train_loss": -4.764429092407227, "global_step": 7077, "epoch": 168} {"train_loss": -4.698360443115234, "global_step": 7078, "epoch": 168} {"train_loss": -4.450862884521484, "global_step": 7079, "epoch": 168} {"train_loss": -4.681003570556641, "global_step": 7080, "epoch": 168} {"train_loss": -4.524670124053955, "global_step": 7081, "epoch": 168} {"train_loss": -4.595664024353027, "global_step": 7082, "epoch": 168} {"train_loss": -4.760966777801514, "global_step": 7083, "epoch": 168} {"train_loss": -4.623564720153809, "global_step": 7084, "epoch": 168} {"train_loss": -4.532930850982666, "global_step": 7085, "epoch": 168} {"train_loss": -4.796246528625488, "global_step": 7086, "epoch": 168} {"train_loss": -4.623176574707031, "global_step": 7087, "epoch": 168} {"train_loss": -4.7117767333984375, "global_step": 7088, "epoch": 168} {"train_loss": -4.759207725524902, "global_step": 7089, "epoch": 168} {"train_loss": -4.694647789001465, "global_step": 7090, "epoch": 168} {"train_loss": -4.814992904663086, "global_step": 7091, "epoch": 168} {"train_loss": -4.800973892211914, "global_step": 7092, "epoch": 168} {"train_loss": -4.880020618438721, "global_step": 7093, "epoch": 168} {"train_loss": -4.7893476486206055, "global_step": 7094, "epoch": 168} {"train_loss": -4.782578945159912, "global_step": 7095, "epoch": 168} {"train_loss": -4.735016822814941, "global_step": 7096, "epoch": 168} {"train_loss": -4.776335421062651, "global_step": 7097, "epoch": 168, "val_loss": 86920.265625} {"train_loss": -4.759254455566406, "global_step": 7098, "epoch": 169} {"train_loss": -4.8257598876953125, "global_step": 7099, "epoch": 169} {"train_loss": -4.850390434265137, "global_step": 7100, "epoch": 169} {"train_loss": -4.812515735626221, "global_step": 7101, "epoch": 169} {"train_loss": -4.905941963195801, "global_step": 7102, "epoch": 169} {"train_loss": -4.951310157775879, "global_step": 7103, "epoch": 169} {"train_loss": -4.8298540115356445, "global_step": 7104, "epoch": 169} {"train_loss": -4.838257789611816, "global_step": 7105, "epoch": 169} {"train_loss": -4.976016998291016, "global_step": 7106, "epoch": 169} {"train_loss": -4.821571350097656, "global_step": 7107, "epoch": 169} {"train_loss": -4.767153263092041, "global_step": 7108, "epoch": 169} {"train_loss": -4.9496541023254395, "global_step": 7109, "epoch": 169} {"train_loss": -4.856795310974121, "global_step": 7110, "epoch": 169} {"train_loss": -4.640214920043945, "global_step": 7111, "epoch": 169} {"train_loss": -4.83172607421875, "global_step": 7112, "epoch": 169} {"train_loss": -4.71368408203125, "global_step": 7113, "epoch": 169} {"train_loss": -4.773679733276367, "global_step": 7114, "epoch": 169} {"train_loss": -4.592836380004883, "global_step": 7115, "epoch": 169} {"train_loss": -4.963810920715332, "global_step": 7116, "epoch": 169} {"train_loss": -4.761074542999268, "global_step": 7117, "epoch": 169} {"train_loss": -4.867432594299316, "global_step": 7118, "epoch": 169} {"train_loss": -4.726707935333252, "global_step": 7119, "epoch": 169} {"train_loss": -4.877493858337402, "global_step": 7120, "epoch": 169} {"train_loss": -4.879222869873047, "global_step": 7121, "epoch": 169} {"train_loss": -4.879097938537598, "global_step": 7122, "epoch": 169} {"train_loss": -4.883188724517822, "global_step": 7123, "epoch": 169} {"train_loss": -4.7505292892456055, "global_step": 7124, "epoch": 169} {"train_loss": -4.827406883239746, "global_step": 7125, "epoch": 169} {"train_loss": -5.000885963439941, "global_step": 7126, "epoch": 169} {"train_loss": -4.8952317237854, "global_step": 7127, "epoch": 169} {"train_loss": -4.97421932220459, "global_step": 7128, "epoch": 169} {"train_loss": -4.949446678161621, "global_step": 7129, "epoch": 169} {"train_loss": -4.973970413208008, "global_step": 7130, "epoch": 169} {"train_loss": -4.8973469734191895, "global_step": 7131, "epoch": 169} {"train_loss": -4.810235977172852, "global_step": 7132, "epoch": 169} {"train_loss": -4.8354644775390625, "global_step": 7133, "epoch": 169} {"train_loss": -4.833137035369873, "global_step": 7134, "epoch": 169} {"train_loss": -4.903347492218018, "global_step": 7135, "epoch": 169} {"train_loss": -4.769147872924805, "global_step": 7136, "epoch": 169} {"train_loss": -5.0350446701049805, "global_step": 7137, "epoch": 169} {"train_loss": -4.847125053405762, "global_step": 7138, "epoch": 169} {"train_loss": -4.8490699245816185, "global_step": 7139, "epoch": 169, "val_loss": 84890.8046875} {"train_loss": -4.9078474044799805, "global_step": 7140, "epoch": 170} {"train_loss": -4.907627105712891, "global_step": 7141, "epoch": 170} {"train_loss": -4.892988681793213, "global_step": 7142, "epoch": 170} {"train_loss": -4.868109226226807, "global_step": 7143, "epoch": 170} {"train_loss": -4.781605243682861, "global_step": 7144, "epoch": 170} {"train_loss": -4.906965255737305, "global_step": 7145, "epoch": 170} {"train_loss": -4.734204292297363, "global_step": 7146, "epoch": 170} {"train_loss": -4.515351295471191, "global_step": 7147, "epoch": 170} {"train_loss": -4.85272216796875, "global_step": 7148, "epoch": 170} {"train_loss": -4.902314186096191, "global_step": 7149, "epoch": 170} {"train_loss": -4.764357089996338, "global_step": 7150, "epoch": 170} {"train_loss": -4.716394901275635, "global_step": 7151, "epoch": 170} {"train_loss": -4.720995903015137, "global_step": 7152, "epoch": 170} {"train_loss": -4.784943580627441, "global_step": 7153, "epoch": 170} {"train_loss": -4.767651557922363, "global_step": 7154, "epoch": 170} {"train_loss": -4.7848100662231445, "global_step": 7155, "epoch": 170} {"train_loss": -4.7927703857421875, "global_step": 7156, "epoch": 170} {"train_loss": -4.77808141708374, "global_step": 7157, "epoch": 170} {"train_loss": -4.832208633422852, "global_step": 7158, "epoch": 170} {"train_loss": -4.91771125793457, "global_step": 7159, "epoch": 170} {"train_loss": -4.816464424133301, "global_step": 7160, "epoch": 170} {"train_loss": -4.862888336181641, "global_step": 7161, "epoch": 170} {"train_loss": -4.9683942794799805, "global_step": 7162, "epoch": 170} {"train_loss": -4.788459777832031, "global_step": 7163, "epoch": 170} {"train_loss": -4.80741548538208, "global_step": 7164, "epoch": 170} {"train_loss": -4.902201175689697, "global_step": 7165, "epoch": 170} {"train_loss": -4.765257835388184, "global_step": 7166, "epoch": 170} {"train_loss": -4.8615217208862305, "global_step": 7167, "epoch": 170} {"train_loss": -4.918398857116699, "global_step": 7168, "epoch": 170} {"train_loss": -4.711730480194092, "global_step": 7169, "epoch": 170} {"train_loss": -5.025243759155273, "global_step": 7170, "epoch": 170} {"train_loss": -4.772397994995117, "global_step": 7171, "epoch": 170} {"train_loss": -4.83156681060791, "global_step": 7172, "epoch": 170} {"train_loss": -4.861915588378906, "global_step": 7173, "epoch": 170} {"train_loss": -4.762668609619141, "global_step": 7174, "epoch": 170} {"train_loss": -4.899946212768555, "global_step": 7175, "epoch": 170} {"train_loss": -4.797334671020508, "global_step": 7176, "epoch": 170} {"train_loss": -4.894424915313721, "global_step": 7177, "epoch": 170} {"train_loss": -4.91567325592041, "global_step": 7178, "epoch": 170} {"train_loss": -4.703742027282715, "global_step": 7179, "epoch": 170} {"train_loss": -4.801652908325195, "global_step": 7180, "epoch": 170} {"train_loss": -4.829262097676595, "global_step": 7181, "epoch": 170, "val_loss": 85028.9609375} {"train_loss": -4.914013862609863, "global_step": 7182, "epoch": 171} {"train_loss": -4.9176812171936035, "global_step": 7183, "epoch": 171} {"train_loss": -5.019892692565918, "global_step": 7184, "epoch": 171} {"train_loss": -4.859982490539551, "global_step": 7185, "epoch": 171} {"train_loss": -4.896934509277344, "global_step": 7186, "epoch": 171} {"train_loss": -4.910025596618652, "global_step": 7187, "epoch": 171} {"train_loss": -5.026885032653809, "global_step": 7188, "epoch": 171} {"train_loss": -4.9022536277771, "global_step": 7189, "epoch": 171} {"train_loss": -4.884136199951172, "global_step": 7190, "epoch": 171} {"train_loss": -4.811184883117676, "global_step": 7191, "epoch": 171} {"train_loss": -4.878194332122803, "global_step": 7192, "epoch": 171} {"train_loss": -4.925392150878906, "global_step": 7193, "epoch": 171} {"train_loss": -4.979535102844238, "global_step": 7194, "epoch": 171} {"train_loss": -4.860559463500977, "global_step": 7195, "epoch": 171} {"train_loss": -4.865533351898193, "global_step": 7196, "epoch": 171} {"train_loss": -4.895870208740234, "global_step": 7197, "epoch": 171} {"train_loss": -4.93131685256958, "global_step": 7198, "epoch": 171} {"train_loss": -4.868317127227783, "global_step": 7199, "epoch": 171} {"train_loss": -4.966291427612305, "global_step": 7200, "epoch": 171} {"train_loss": -4.985175609588623, "global_step": 7201, "epoch": 171} {"train_loss": -4.878922462463379, "global_step": 7202, "epoch": 171} {"train_loss": -4.754293918609619, "global_step": 7203, "epoch": 171} {"train_loss": -4.860705852508545, "global_step": 7204, "epoch": 171} {"train_loss": -4.963522911071777, "global_step": 7205, "epoch": 171} {"train_loss": -4.948626518249512, "global_step": 7206, "epoch": 171} {"train_loss": -4.925922393798828, "global_step": 7207, "epoch": 171} {"train_loss": -5.016693115234375, "global_step": 7208, "epoch": 171} {"train_loss": -4.797276020050049, "global_step": 7209, "epoch": 171} {"train_loss": -4.778540134429932, "global_step": 7210, "epoch": 171} {"train_loss": -4.905031204223633, "global_step": 7211, "epoch": 171} {"train_loss": -4.848992347717285, "global_step": 7212, "epoch": 171} {"train_loss": -4.90278434753418, "global_step": 7213, "epoch": 171} {"train_loss": -4.773506164550781, "global_step": 7214, "epoch": 171} {"train_loss": -4.898841857910156, "global_step": 7215, "epoch": 171} {"train_loss": -4.97628927230835, "global_step": 7216, "epoch": 171} {"train_loss": -4.782926559448242, "global_step": 7217, "epoch": 171} {"train_loss": -4.771214962005615, "global_step": 7218, "epoch": 171} {"train_loss": -4.9117302894592285, "global_step": 7219, "epoch": 171} {"train_loss": -4.960881233215332, "global_step": 7220, "epoch": 171} {"train_loss": -4.946826457977295, "global_step": 7221, "epoch": 171} {"train_loss": -4.9672627449035645, "global_step": 7222, "epoch": 171} {"train_loss": -4.89907109169733, "global_step": 7223, "epoch": 171, "val_loss": 84495.28125} {"train_loss": -4.9155192375183105, "global_step": 7224, "epoch": 172} {"train_loss": -4.935118675231934, "global_step": 7225, "epoch": 172} {"train_loss": -4.904506683349609, "global_step": 7226, "epoch": 172} {"train_loss": -4.902107238769531, "global_step": 7227, "epoch": 172} {"train_loss": -4.9306793212890625, "global_step": 7228, "epoch": 172} {"train_loss": -4.776366710662842, "global_step": 7229, "epoch": 172} {"train_loss": -4.739010810852051, "global_step": 7230, "epoch": 172} {"train_loss": -4.9319000244140625, "global_step": 7231, "epoch": 172} {"train_loss": -4.781002521514893, "global_step": 7232, "epoch": 172} {"train_loss": -4.995325565338135, "global_step": 7233, "epoch": 172} {"train_loss": -4.925457000732422, "global_step": 7234, "epoch": 172} {"train_loss": -4.819662094116211, "global_step": 7235, "epoch": 172} {"train_loss": -4.815908432006836, "global_step": 7236, "epoch": 172} {"train_loss": -5.022213935852051, "global_step": 7237, "epoch": 172} {"train_loss": -4.777508735656738, "global_step": 7238, "epoch": 172} {"train_loss": -4.8356828689575195, "global_step": 7239, "epoch": 172} {"train_loss": -5.002256870269775, "global_step": 7240, "epoch": 172} {"train_loss": -4.871822834014893, "global_step": 7241, "epoch": 172} {"train_loss": -4.927927017211914, "global_step": 7242, "epoch": 172} {"train_loss": -4.933635711669922, "global_step": 7243, "epoch": 172} {"train_loss": -5.04002571105957, "global_step": 7244, "epoch": 172} {"train_loss": -4.801797866821289, "global_step": 7245, "epoch": 172} {"train_loss": -4.983445167541504, "global_step": 7246, "epoch": 172} {"train_loss": -4.883105278015137, "global_step": 7247, "epoch": 172} {"train_loss": -4.87477970123291, "global_step": 7248, "epoch": 172} {"train_loss": -4.979700088500977, "global_step": 7249, "epoch": 172} {"train_loss": -4.920269012451172, "global_step": 7250, "epoch": 172} {"train_loss": -5.003537178039551, "global_step": 7251, "epoch": 172} {"train_loss": -4.9625678062438965, "global_step": 7252, "epoch": 172} {"train_loss": -4.86993408203125, "global_step": 7253, "epoch": 172} {"train_loss": -4.950264930725098, "global_step": 7254, "epoch": 172} {"train_loss": -4.900862216949463, "global_step": 7255, "epoch": 172} {"train_loss": -4.983388900756836, "global_step": 7256, "epoch": 172} {"train_loss": -4.784017562866211, "global_step": 7257, "epoch": 172} {"train_loss": -4.891196250915527, "global_step": 7258, "epoch": 172} {"train_loss": -4.860442161560059, "global_step": 7259, "epoch": 172} {"train_loss": -4.699346542358398, "global_step": 7260, "epoch": 172} {"train_loss": -4.842017650604248, "global_step": 7261, "epoch": 172} {"train_loss": -4.7101545333862305, "global_step": 7262, "epoch": 172} {"train_loss": -4.754280090332031, "global_step": 7263, "epoch": 172} {"train_loss": -5.0020670890808105, "global_step": 7264, "epoch": 172} {"train_loss": -4.889625083832514, "global_step": 7265, "epoch": 172, "val_loss": 85203.0078125} {"train_loss": -4.894131660461426, "global_step": 7266, "epoch": 173} {"train_loss": -4.902567386627197, "global_step": 7267, "epoch": 173} {"train_loss": -4.8440470695495605, "global_step": 7268, "epoch": 173} {"train_loss": -4.99498176574707, "global_step": 7269, "epoch": 173} {"train_loss": -4.85228157043457, "global_step": 7270, "epoch": 173} {"train_loss": -5.0517168045043945, "global_step": 7271, "epoch": 173} {"train_loss": -4.860043525695801, "global_step": 7272, "epoch": 173} {"train_loss": -5.009199142456055, "global_step": 7273, "epoch": 173} {"train_loss": -4.847461700439453, "global_step": 7274, "epoch": 173} {"train_loss": -4.955392360687256, "global_step": 7275, "epoch": 173} {"train_loss": -4.916950702667236, "global_step": 7276, "epoch": 173} {"train_loss": -4.783834934234619, "global_step": 7277, "epoch": 173} {"train_loss": -4.875065803527832, "global_step": 7278, "epoch": 173} {"train_loss": -4.907330513000488, "global_step": 7279, "epoch": 173} {"train_loss": -4.68005895614624, "global_step": 7280, "epoch": 173} {"train_loss": -4.737244606018066, "global_step": 7281, "epoch": 173} {"train_loss": -4.858891010284424, "global_step": 7282, "epoch": 173} {"train_loss": -4.842100143432617, "global_step": 7283, "epoch": 173} {"train_loss": -4.904355049133301, "global_step": 7284, "epoch": 173} {"train_loss": -4.966355800628662, "global_step": 7285, "epoch": 173} {"train_loss": -4.897165775299072, "global_step": 7286, "epoch": 173} {"train_loss": -4.929586410522461, "global_step": 7287, "epoch": 173} {"train_loss": -4.773638725280762, "global_step": 7288, "epoch": 173} {"train_loss": -4.844347953796387, "global_step": 7289, "epoch": 173} {"train_loss": -4.970351219177246, "global_step": 7290, "epoch": 173} {"train_loss": -4.7044830322265625, "global_step": 7291, "epoch": 173} {"train_loss": -4.989239692687988, "global_step": 7292, "epoch": 173} {"train_loss": -4.889298439025879, "global_step": 7293, "epoch": 173} {"train_loss": -4.7700653076171875, "global_step": 7294, "epoch": 173} {"train_loss": -4.927832126617432, "global_step": 7295, "epoch": 173} {"train_loss": -5.03450345993042, "global_step": 7296, "epoch": 173} {"train_loss": -4.938035488128662, "global_step": 7297, "epoch": 173} {"train_loss": -4.787144660949707, "global_step": 7298, "epoch": 173} {"train_loss": -4.837099075317383, "global_step": 7299, "epoch": 173} {"train_loss": -4.8613457679748535, "global_step": 7300, "epoch": 173} {"train_loss": -4.808402061462402, "global_step": 7301, "epoch": 173} {"train_loss": -4.885051727294922, "global_step": 7302, "epoch": 173} {"train_loss": -4.82765007019043, "global_step": 7303, "epoch": 173} {"train_loss": -5.001086235046387, "global_step": 7304, "epoch": 173} {"train_loss": -4.828413486480713, "global_step": 7305, "epoch": 173} {"train_loss": -4.816801071166992, "global_step": 7306, "epoch": 173} {"train_loss": -4.878122636250088, "global_step": 7307, "epoch": 173, "val_loss": 84552.9375} {"train_loss": -4.791120529174805, "global_step": 7308, "epoch": 174} {"train_loss": -4.800498008728027, "global_step": 7309, "epoch": 174} {"train_loss": -4.917379856109619, "global_step": 7310, "epoch": 174} {"train_loss": -4.787177085876465, "global_step": 7311, "epoch": 174} {"train_loss": -4.827370643615723, "global_step": 7312, "epoch": 174} {"train_loss": -4.814157485961914, "global_step": 7313, "epoch": 174} {"train_loss": -4.994087219238281, "global_step": 7314, "epoch": 174} {"train_loss": -4.874566078186035, "global_step": 7315, "epoch": 174} {"train_loss": -4.974537372589111, "global_step": 7316, "epoch": 174} {"train_loss": -4.934547424316406, "global_step": 7317, "epoch": 174} {"train_loss": -4.984871864318848, "global_step": 7318, "epoch": 174} {"train_loss": -4.898187637329102, "global_step": 7319, "epoch": 174} {"train_loss": -4.906055927276611, "global_step": 7320, "epoch": 174} {"train_loss": -4.760716438293457, "global_step": 7321, "epoch": 174} {"train_loss": -4.912118911743164, "global_step": 7322, "epoch": 174} {"train_loss": -4.772217273712158, "global_step": 7323, "epoch": 174} {"train_loss": -4.827878475189209, "global_step": 7324, "epoch": 174} {"train_loss": -5.0380449295043945, "global_step": 7325, "epoch": 174} {"train_loss": -4.8398590087890625, "global_step": 7326, "epoch": 174} {"train_loss": -4.873103141784668, "global_step": 7327, "epoch": 174} {"train_loss": -4.982257843017578, "global_step": 7328, "epoch": 174} {"train_loss": -4.7324538230896, "global_step": 7329, "epoch": 174} {"train_loss": -4.7798004150390625, "global_step": 7330, "epoch": 174} {"train_loss": -4.838065147399902, "global_step": 7331, "epoch": 174} {"train_loss": -5.039752960205078, "global_step": 7332, "epoch": 174} {"train_loss": -4.777879238128662, "global_step": 7333, "epoch": 174} {"train_loss": -4.6501312255859375, "global_step": 7334, "epoch": 174} {"train_loss": -4.920811653137207, "global_step": 7335, "epoch": 174} {"train_loss": -4.6767168045043945, "global_step": 7336, "epoch": 174} {"train_loss": -4.887932777404785, "global_step": 7337, "epoch": 174} {"train_loss": -4.843091011047363, "global_step": 7338, "epoch": 174} {"train_loss": -4.746416091918945, "global_step": 7339, "epoch": 174} {"train_loss": -5.019903182983398, "global_step": 7340, "epoch": 174} {"train_loss": -4.921322822570801, "global_step": 7341, "epoch": 174} {"train_loss": -4.636842250823975, "global_step": 7342, "epoch": 174} {"train_loss": -4.988675117492676, "global_step": 7343, "epoch": 174} {"train_loss": -4.918744087219238, "global_step": 7344, "epoch": 174} {"train_loss": -4.779421329498291, "global_step": 7345, "epoch": 174} {"train_loss": -4.898233413696289, "global_step": 7346, "epoch": 174} {"train_loss": -4.9310455322265625, "global_step": 7347, "epoch": 174} {"train_loss": -4.878931522369385, "global_step": 7348, "epoch": 174} {"train_loss": -4.865231445857456, "global_step": 7349, "epoch": 174, "val_loss": 85573.890625} {"train_loss": -4.880621910095215, "global_step": 7350, "epoch": 175} {"train_loss": -4.9333343505859375, "global_step": 7351, "epoch": 175} {"train_loss": -4.984490394592285, "global_step": 7352, "epoch": 175} {"train_loss": -4.872847080230713, "global_step": 7353, "epoch": 175} {"train_loss": -4.908529281616211, "global_step": 7354, "epoch": 175} {"train_loss": -4.80379581451416, "global_step": 7355, "epoch": 175} {"train_loss": -4.877985954284668, "global_step": 7356, "epoch": 175} {"train_loss": -4.96895694732666, "global_step": 7357, "epoch": 175} {"train_loss": -4.889678955078125, "global_step": 7358, "epoch": 175} {"train_loss": -4.951979637145996, "global_step": 7359, "epoch": 175} {"train_loss": -4.7986955642700195, "global_step": 7360, "epoch": 175} {"train_loss": -4.845527172088623, "global_step": 7361, "epoch": 175} {"train_loss": -4.803456783294678, "global_step": 7362, "epoch": 175} {"train_loss": -4.942534446716309, "global_step": 7363, "epoch": 175} {"train_loss": -4.935560703277588, "global_step": 7364, "epoch": 175} {"train_loss": -4.959901809692383, "global_step": 7365, "epoch": 175} {"train_loss": -4.978721618652344, "global_step": 7366, "epoch": 175} {"train_loss": -4.88939094543457, "global_step": 7367, "epoch": 175} {"train_loss": -4.961063385009766, "global_step": 7368, "epoch": 175} {"train_loss": -4.9545087814331055, "global_step": 7369, "epoch": 175} {"train_loss": -4.9354567527771, "global_step": 7370, "epoch": 175} {"train_loss": -5.002071380615234, "global_step": 7371, "epoch": 175} {"train_loss": -4.930987358093262, "global_step": 7372, "epoch": 175} {"train_loss": -4.850677490234375, "global_step": 7373, "epoch": 175} {"train_loss": -4.8966875076293945, "global_step": 7374, "epoch": 175} {"train_loss": -4.899751663208008, "global_step": 7375, "epoch": 175} {"train_loss": -4.843992233276367, "global_step": 7376, "epoch": 175} {"train_loss": -4.772270202636719, "global_step": 7377, "epoch": 175} {"train_loss": -4.969287872314453, "global_step": 7378, "epoch": 175} {"train_loss": -4.983038902282715, "global_step": 7379, "epoch": 175} {"train_loss": -4.927913188934326, "global_step": 7380, "epoch": 175} {"train_loss": -4.891417503356934, "global_step": 7381, "epoch": 175} {"train_loss": -4.944500923156738, "global_step": 7382, "epoch": 175} {"train_loss": -4.692275524139404, "global_step": 7383, "epoch": 175} {"train_loss": -4.808678150177002, "global_step": 7384, "epoch": 175} {"train_loss": -4.934784889221191, "global_step": 7385, "epoch": 175} {"train_loss": -4.989035129547119, "global_step": 7386, "epoch": 175} {"train_loss": -4.802196502685547, "global_step": 7387, "epoch": 175} {"train_loss": -4.751236915588379, "global_step": 7388, "epoch": 175} {"train_loss": -4.940705299377441, "global_step": 7389, "epoch": 175} {"train_loss": -4.786988258361816, "global_step": 7390, "epoch": 175} {"train_loss": -4.893727495556786, "global_step": 7391, "epoch": 175, "val_loss": 84258.4453125} {"train_loss": -4.9260993003845215, "global_step": 7392, "epoch": 176} {"train_loss": -5.033912181854248, "global_step": 7393, "epoch": 176} {"train_loss": -4.85211181640625, "global_step": 7394, "epoch": 176} {"train_loss": -4.75105619430542, "global_step": 7395, "epoch": 176} {"train_loss": -5.008376121520996, "global_step": 7396, "epoch": 176} {"train_loss": -4.901091575622559, "global_step": 7397, "epoch": 176} {"train_loss": -4.91696310043335, "global_step": 7398, "epoch": 176} {"train_loss": -4.941688537597656, "global_step": 7399, "epoch": 176} {"train_loss": -4.839946746826172, "global_step": 7400, "epoch": 176} {"train_loss": -4.765211582183838, "global_step": 7401, "epoch": 176} {"train_loss": -4.840714454650879, "global_step": 7402, "epoch": 176} {"train_loss": -4.926884651184082, "global_step": 7403, "epoch": 176} {"train_loss": -4.858586311340332, "global_step": 7404, "epoch": 176} {"train_loss": -4.92938232421875, "global_step": 7405, "epoch": 176} {"train_loss": -5.093451023101807, "global_step": 7406, "epoch": 176} {"train_loss": -4.999068260192871, "global_step": 7407, "epoch": 176} {"train_loss": -4.979168891906738, "global_step": 7408, "epoch": 176} {"train_loss": -4.90825891494751, "global_step": 7409, "epoch": 176} {"train_loss": -4.933534622192383, "global_step": 7410, "epoch": 176} {"train_loss": -4.981377601623535, "global_step": 7411, "epoch": 176} {"train_loss": -4.933915138244629, "global_step": 7412, "epoch": 176} {"train_loss": -5.002429008483887, "global_step": 7413, "epoch": 176} {"train_loss": -4.856217384338379, "global_step": 7414, "epoch": 176} {"train_loss": -5.028393745422363, "global_step": 7415, "epoch": 176} {"train_loss": -4.898425579071045, "global_step": 7416, "epoch": 176} {"train_loss": -4.698402404785156, "global_step": 7417, "epoch": 176} {"train_loss": -4.8342671394348145, "global_step": 7418, "epoch": 176} {"train_loss": -4.884446144104004, "global_step": 7419, "epoch": 176} {"train_loss": -4.735669136047363, "global_step": 7420, "epoch": 176} {"train_loss": -4.804959297180176, "global_step": 7421, "epoch": 176} {"train_loss": -4.718642234802246, "global_step": 7422, "epoch": 176} {"train_loss": -4.5628814697265625, "global_step": 7423, "epoch": 176} {"train_loss": -4.7862443923950195, "global_step": 7424, "epoch": 176} {"train_loss": -4.676002502441406, "global_step": 7425, "epoch": 176} {"train_loss": -4.719155311584473, "global_step": 7426, "epoch": 176} {"train_loss": -4.275003433227539, "global_step": 7427, "epoch": 176} {"train_loss": -4.618574142456055, "global_step": 7428, "epoch": 176} {"train_loss": -4.703649044036865, "global_step": 7429, "epoch": 176} {"train_loss": -4.728841781616211, "global_step": 7430, "epoch": 176} {"train_loss": -4.857995510101318, "global_step": 7431, "epoch": 176} {"train_loss": -4.821732044219971, "global_step": 7432, "epoch": 176} {"train_loss": -4.842249450229463, "global_step": 7433, "epoch": 176, "val_loss": 84872.1484375} {"train_loss": -4.8120503425598145, "global_step": 7434, "epoch": 177} {"train_loss": -4.904533386230469, "global_step": 7435, "epoch": 177} {"train_loss": -4.7993059158325195, "global_step": 7436, "epoch": 177} {"train_loss": -4.800479888916016, "global_step": 7437, "epoch": 177} {"train_loss": -4.820520877838135, "global_step": 7438, "epoch": 177} {"train_loss": -4.8353118896484375, "global_step": 7439, "epoch": 177} {"train_loss": -4.837420463562012, "global_step": 7440, "epoch": 177} {"train_loss": -4.825738906860352, "global_step": 7441, "epoch": 177} {"train_loss": -4.862685680389404, "global_step": 7442, "epoch": 177} {"train_loss": -4.8415679931640625, "global_step": 7443, "epoch": 177} {"train_loss": -4.860747337341309, "global_step": 7444, "epoch": 177} {"train_loss": -4.931401252746582, "global_step": 7445, "epoch": 177} {"train_loss": -4.811094284057617, "global_step": 7446, "epoch": 177} {"train_loss": -4.769980430603027, "global_step": 7447, "epoch": 177} {"train_loss": -4.949510097503662, "global_step": 7448, "epoch": 177} {"train_loss": -4.980173587799072, "global_step": 7449, "epoch": 177} {"train_loss": -4.887619972229004, "global_step": 7450, "epoch": 177} {"train_loss": -4.959561824798584, "global_step": 7451, "epoch": 177} {"train_loss": -5.003955841064453, "global_step": 7452, "epoch": 177} {"train_loss": -4.889499664306641, "global_step": 7453, "epoch": 177} {"train_loss": -4.942837238311768, "global_step": 7454, "epoch": 177} {"train_loss": -4.8768510818481445, "global_step": 7455, "epoch": 177} {"train_loss": -4.89491081237793, "global_step": 7456, "epoch": 177} {"train_loss": -4.966217041015625, "global_step": 7457, "epoch": 177} {"train_loss": -4.776304721832275, "global_step": 7458, "epoch": 177} {"train_loss": -4.943294525146484, "global_step": 7459, "epoch": 177} {"train_loss": -5.044309139251709, "global_step": 7460, "epoch": 177} {"train_loss": -4.652573585510254, "global_step": 7461, "epoch": 177} {"train_loss": -4.7177863121032715, "global_step": 7462, "epoch": 177} {"train_loss": -4.983193874359131, "global_step": 7463, "epoch": 177} {"train_loss": -4.8861470222473145, "global_step": 7464, "epoch": 177} {"train_loss": -4.807473659515381, "global_step": 7465, "epoch": 177} {"train_loss": -4.777785301208496, "global_step": 7466, "epoch": 177} {"train_loss": -4.913853645324707, "global_step": 7467, "epoch": 177} {"train_loss": -4.751914978027344, "global_step": 7468, "epoch": 177} {"train_loss": -4.93784236907959, "global_step": 7469, "epoch": 177} {"train_loss": -4.889296054840088, "global_step": 7470, "epoch": 177} {"train_loss": -4.623931884765625, "global_step": 7471, "epoch": 177} {"train_loss": -4.963756084442139, "global_step": 7472, "epoch": 177} {"train_loss": -4.849299907684326, "global_step": 7473, "epoch": 177} {"train_loss": -4.6972503662109375, "global_step": 7474, "epoch": 177} {"train_loss": -4.861063298724947, "global_step": 7475, "epoch": 177, "val_loss": 84398.8515625} {"train_loss": -4.824285984039307, "global_step": 7476, "epoch": 178} {"train_loss": -4.975003242492676, "global_step": 7477, "epoch": 178} {"train_loss": -4.806251525878906, "global_step": 7478, "epoch": 178} {"train_loss": -4.831019401550293, "global_step": 7479, "epoch": 178} {"train_loss": -4.854923248291016, "global_step": 7480, "epoch": 178} {"train_loss": -4.71401834487915, "global_step": 7481, "epoch": 178} {"train_loss": -4.723493576049805, "global_step": 7482, "epoch": 178} {"train_loss": -4.8301286697387695, "global_step": 7483, "epoch": 178} {"train_loss": -4.858498573303223, "global_step": 7484, "epoch": 178} {"train_loss": -4.84752893447876, "global_step": 7485, "epoch": 178} {"train_loss": -4.902735710144043, "global_step": 7486, "epoch": 178} {"train_loss": -4.803406238555908, "global_step": 7487, "epoch": 178} {"train_loss": -4.801668643951416, "global_step": 7488, "epoch": 178} {"train_loss": -4.755799293518066, "global_step": 7489, "epoch": 178} {"train_loss": -4.998291969299316, "global_step": 7490, "epoch": 178} {"train_loss": -4.790901184082031, "global_step": 7491, "epoch": 178} {"train_loss": -5.028369903564453, "global_step": 7492, "epoch": 178} {"train_loss": -4.940629005432129, "global_step": 7493, "epoch": 178} {"train_loss": -4.963263511657715, "global_step": 7494, "epoch": 178} {"train_loss": -4.917675971984863, "global_step": 7495, "epoch": 178} {"train_loss": -4.979353904724121, "global_step": 7496, "epoch": 178} {"train_loss": -4.904915809631348, "global_step": 7497, "epoch": 178} {"train_loss": -4.95150089263916, "global_step": 7498, "epoch": 178} {"train_loss": -4.830785274505615, "global_step": 7499, "epoch": 178} {"train_loss": -4.808853626251221, "global_step": 7500, "epoch": 178} {"train_loss": -4.77054500579834, "global_step": 7501, "epoch": 178} {"train_loss": -4.825446605682373, "global_step": 7502, "epoch": 178} {"train_loss": -5.100982189178467, "global_step": 7503, "epoch": 178} {"train_loss": -4.901241779327393, "global_step": 7504, "epoch": 178} {"train_loss": -4.9135613441467285, "global_step": 7505, "epoch": 178} {"train_loss": -4.933945655822754, "global_step": 7506, "epoch": 178} {"train_loss": -5.029915809631348, "global_step": 7507, "epoch": 178} {"train_loss": -4.873548984527588, "global_step": 7508, "epoch": 178} {"train_loss": -4.901645660400391, "global_step": 7509, "epoch": 178} {"train_loss": -4.918572425842285, "global_step": 7510, "epoch": 178} {"train_loss": -4.831863880157471, "global_step": 7511, "epoch": 178} {"train_loss": -4.882482528686523, "global_step": 7512, "epoch": 178} {"train_loss": -4.937211513519287, "global_step": 7513, "epoch": 178} {"train_loss": -4.939600467681885, "global_step": 7514, "epoch": 178} {"train_loss": -4.7870893478393555, "global_step": 7515, "epoch": 178} {"train_loss": -4.905675888061523, "global_step": 7516, "epoch": 178} {"train_loss": -4.881964274815151, "global_step": 7517, "epoch": 178, "val_loss": 84437.546875} {"train_loss": -4.96524715423584, "global_step": 7518, "epoch": 179} {"train_loss": -5.0519256591796875, "global_step": 7519, "epoch": 179} {"train_loss": -4.908669471740723, "global_step": 7520, "epoch": 179} {"train_loss": -4.897442817687988, "global_step": 7521, "epoch": 179} {"train_loss": -4.705739498138428, "global_step": 7522, "epoch": 179} {"train_loss": -4.824450492858887, "global_step": 7523, "epoch": 179} {"train_loss": -4.7437286376953125, "global_step": 7524, "epoch": 179} {"train_loss": -4.986784934997559, "global_step": 7525, "epoch": 179} {"train_loss": -4.760189533233643, "global_step": 7526, "epoch": 179} {"train_loss": -4.80649471282959, "global_step": 7527, "epoch": 179} {"train_loss": -4.772679328918457, "global_step": 7528, "epoch": 179} {"train_loss": -4.934574604034424, "global_step": 7529, "epoch": 179} {"train_loss": -4.898261070251465, "global_step": 7530, "epoch": 179} {"train_loss": -4.6382551193237305, "global_step": 7531, "epoch": 179} {"train_loss": -4.757850170135498, "global_step": 7532, "epoch": 179} {"train_loss": -4.826667785644531, "global_step": 7533, "epoch": 179} {"train_loss": -4.779072284698486, "global_step": 7534, "epoch": 179} {"train_loss": -4.846685409545898, "global_step": 7535, "epoch": 179} {"train_loss": -4.574399948120117, "global_step": 7536, "epoch": 179} {"train_loss": -4.793056488037109, "global_step": 7537, "epoch": 179} {"train_loss": -4.8903279304504395, "global_step": 7538, "epoch": 179} {"train_loss": -4.821626663208008, "global_step": 7539, "epoch": 179} {"train_loss": -4.790894031524658, "global_step": 7540, "epoch": 179} {"train_loss": -4.839677810668945, "global_step": 7541, "epoch": 179} {"train_loss": -4.829514503479004, "global_step": 7542, "epoch": 179} {"train_loss": -4.847866535186768, "global_step": 7543, "epoch": 179} {"train_loss": -4.836493015289307, "global_step": 7544, "epoch": 179} {"train_loss": -4.798242092132568, "global_step": 7545, "epoch": 179} {"train_loss": -4.928713798522949, "global_step": 7546, "epoch": 179} {"train_loss": -4.883218765258789, "global_step": 7547, "epoch": 179} {"train_loss": -4.919261932373047, "global_step": 7548, "epoch": 179} {"train_loss": -5.017710208892822, "global_step": 7549, "epoch": 179} {"train_loss": -5.039575576782227, "global_step": 7550, "epoch": 179} {"train_loss": -5.079050064086914, "global_step": 7551, "epoch": 179} {"train_loss": -4.940307140350342, "global_step": 7552, "epoch": 179} {"train_loss": -5.079714298248291, "global_step": 7553, "epoch": 179} {"train_loss": -4.940627574920654, "global_step": 7554, "epoch": 179} {"train_loss": -4.881705284118652, "global_step": 7555, "epoch": 179} {"train_loss": -5.059988021850586, "global_step": 7556, "epoch": 179} {"train_loss": -4.800158977508545, "global_step": 7557, "epoch": 179} {"train_loss": -4.8779706954956055, "global_step": 7558, "epoch": 179} {"train_loss": -4.871638093675886, "global_step": 7559, "epoch": 179, "val_loss": 82939.9453125} {"train_loss": -4.988987922668457, "global_step": 7560, "epoch": 180} {"train_loss": -4.9024834632873535, "global_step": 7561, "epoch": 180} {"train_loss": -4.85902738571167, "global_step": 7562, "epoch": 180} {"train_loss": -4.893820762634277, "global_step": 7563, "epoch": 180} {"train_loss": -5.013527870178223, "global_step": 7564, "epoch": 180} {"train_loss": -4.942023754119873, "global_step": 7565, "epoch": 180} {"train_loss": -4.8057708740234375, "global_step": 7566, "epoch": 180} {"train_loss": -4.820622444152832, "global_step": 7567, "epoch": 180} {"train_loss": -4.924524307250977, "global_step": 7568, "epoch": 180} {"train_loss": -4.898759841918945, "global_step": 7569, "epoch": 180} {"train_loss": -4.749406337738037, "global_step": 7570, "epoch": 180} {"train_loss": -4.868528366088867, "global_step": 7571, "epoch": 180} {"train_loss": -4.953707695007324, "global_step": 7572, "epoch": 180} {"train_loss": -4.487576484680176, "global_step": 7573, "epoch": 180} {"train_loss": -4.99154806137085, "global_step": 7574, "epoch": 180} {"train_loss": -4.8359222412109375, "global_step": 7575, "epoch": 180} {"train_loss": -4.676545143127441, "global_step": 7576, "epoch": 180} {"train_loss": -4.936960697174072, "global_step": 7577, "epoch": 180} {"train_loss": -4.7903923988342285, "global_step": 7578, "epoch": 180} {"train_loss": -4.746057987213135, "global_step": 7579, "epoch": 180} {"train_loss": -5.05377197265625, "global_step": 7580, "epoch": 180} {"train_loss": -4.841101169586182, "global_step": 7581, "epoch": 180} {"train_loss": -4.749539852142334, "global_step": 7582, "epoch": 180} {"train_loss": -4.973160743713379, "global_step": 7583, "epoch": 180} {"train_loss": -4.834159851074219, "global_step": 7584, "epoch": 180} {"train_loss": -4.973703861236572, "global_step": 7585, "epoch": 180} {"train_loss": -4.894474983215332, "global_step": 7586, "epoch": 180} {"train_loss": -4.996922016143799, "global_step": 7587, "epoch": 180} {"train_loss": -5.012002944946289, "global_step": 7588, "epoch": 180} {"train_loss": -4.944890975952148, "global_step": 7589, "epoch": 180} {"train_loss": -4.93807315826416, "global_step": 7590, "epoch": 180} {"train_loss": -4.9331512451171875, "global_step": 7591, "epoch": 180} {"train_loss": -5.050013065338135, "global_step": 7592, "epoch": 180} {"train_loss": -4.793047904968262, "global_step": 7593, "epoch": 180} {"train_loss": -4.865506649017334, "global_step": 7594, "epoch": 180} {"train_loss": -5.0323686599731445, "global_step": 7595, "epoch": 180} {"train_loss": -4.917384624481201, "global_step": 7596, "epoch": 180} {"train_loss": -4.921154975891113, "global_step": 7597, "epoch": 180} {"train_loss": -4.835256576538086, "global_step": 7598, "epoch": 180} {"train_loss": -4.791228294372559, "global_step": 7599, "epoch": 180} {"train_loss": -4.769587516784668, "global_step": 7600, "epoch": 180} {"train_loss": -4.879723401296706, "global_step": 7601, "epoch": 180, "val_loss": 85122.984375} {"train_loss": -4.79698371887207, "global_step": 7602, "epoch": 181} {"train_loss": -4.906002998352051, "global_step": 7603, "epoch": 181} {"train_loss": -4.914182662963867, "global_step": 7604, "epoch": 181} {"train_loss": -4.841273784637451, "global_step": 7605, "epoch": 181} {"train_loss": -4.946682453155518, "global_step": 7606, "epoch": 181} {"train_loss": -4.979857444763184, "global_step": 7607, "epoch": 181} {"train_loss": -4.85174560546875, "global_step": 7608, "epoch": 181} {"train_loss": -4.844616889953613, "global_step": 7609, "epoch": 181} {"train_loss": -4.7710747718811035, "global_step": 7610, "epoch": 181} {"train_loss": -4.943144798278809, "global_step": 7611, "epoch": 181} {"train_loss": -4.877192974090576, "global_step": 7612, "epoch": 181} {"train_loss": -4.974756240844727, "global_step": 7613, "epoch": 181} {"train_loss": -4.922665596008301, "global_step": 7614, "epoch": 181} {"train_loss": -4.987980842590332, "global_step": 7615, "epoch": 181} {"train_loss": -4.876652240753174, "global_step": 7616, "epoch": 181} {"train_loss": -4.752306938171387, "global_step": 7617, "epoch": 181} {"train_loss": -4.957733154296875, "global_step": 7618, "epoch": 181} {"train_loss": -4.656397819519043, "global_step": 7619, "epoch": 181} {"train_loss": -4.897826194763184, "global_step": 7620, "epoch": 181} {"train_loss": -4.963881492614746, "global_step": 7621, "epoch": 181} {"train_loss": -4.839437484741211, "global_step": 7622, "epoch": 181} {"train_loss": -4.905093193054199, "global_step": 7623, "epoch": 181} {"train_loss": -5.0529937744140625, "global_step": 7624, "epoch": 181} {"train_loss": -4.967859745025635, "global_step": 7625, "epoch": 181} {"train_loss": -4.925198554992676, "global_step": 7626, "epoch": 181} {"train_loss": -4.918291091918945, "global_step": 7627, "epoch": 181} {"train_loss": -5.094000816345215, "global_step": 7628, "epoch": 181} {"train_loss": -4.996286392211914, "global_step": 7629, "epoch": 181} {"train_loss": -5.005504131317139, "global_step": 7630, "epoch": 181} {"train_loss": -4.960968494415283, "global_step": 7631, "epoch": 181} {"train_loss": -4.885408401489258, "global_step": 7632, "epoch": 181} {"train_loss": -4.813277244567871, "global_step": 7633, "epoch": 181} {"train_loss": -4.725324630737305, "global_step": 7634, "epoch": 181} {"train_loss": -4.895175933837891, "global_step": 7635, "epoch": 181} {"train_loss": -4.631823539733887, "global_step": 7636, "epoch": 181} {"train_loss": -4.758332252502441, "global_step": 7637, "epoch": 181} {"train_loss": -4.387576580047607, "global_step": 7638, "epoch": 181} {"train_loss": -4.665472030639648, "global_step": 7639, "epoch": 181} {"train_loss": -4.788674354553223, "global_step": 7640, "epoch": 181} {"train_loss": -4.596665382385254, "global_step": 7641, "epoch": 181} {"train_loss": -4.890448093414307, "global_step": 7642, "epoch": 181} {"train_loss": -4.858488502956572, "global_step": 7643, "epoch": 181, "val_loss": 86642.125} {"train_loss": -4.607754230499268, "global_step": 7644, "epoch": 182} {"train_loss": -4.8510942459106445, "global_step": 7645, "epoch": 182} {"train_loss": -4.653905868530273, "global_step": 7646, "epoch": 182} {"train_loss": -4.865199089050293, "global_step": 7647, "epoch": 182} {"train_loss": -4.632248401641846, "global_step": 7648, "epoch": 182} {"train_loss": -4.830421447753906, "global_step": 7649, "epoch": 182} {"train_loss": -4.808929443359375, "global_step": 7650, "epoch": 182} {"train_loss": -4.9156341552734375, "global_step": 7651, "epoch": 182} {"train_loss": -4.885746955871582, "global_step": 7652, "epoch": 182} {"train_loss": -4.759566307067871, "global_step": 7653, "epoch": 182} {"train_loss": -4.772216320037842, "global_step": 7654, "epoch": 182} {"train_loss": -4.812689781188965, "global_step": 7655, "epoch": 182} {"train_loss": -4.864489555358887, "global_step": 7656, "epoch": 182} {"train_loss": -4.989002227783203, "global_step": 7657, "epoch": 182} {"train_loss": -4.8338303565979, "global_step": 7658, "epoch": 182} {"train_loss": -4.867206573486328, "global_step": 7659, "epoch": 182} {"train_loss": -4.925771713256836, "global_step": 7660, "epoch": 182} {"train_loss": -4.9524030685424805, "global_step": 7661, "epoch": 182} {"train_loss": -4.932727813720703, "global_step": 7662, "epoch": 182} {"train_loss": -4.977160453796387, "global_step": 7663, "epoch": 182} {"train_loss": -4.992410659790039, "global_step": 7664, "epoch": 182} {"train_loss": -4.969590187072754, "global_step": 7665, "epoch": 182} {"train_loss": -4.9952311515808105, "global_step": 7666, "epoch": 182} {"train_loss": -4.921970844268799, "global_step": 7667, "epoch": 182} {"train_loss": -5.08186149597168, "global_step": 7668, "epoch": 182} {"train_loss": -4.868896484375, "global_step": 7669, "epoch": 182} {"train_loss": -4.983671188354492, "global_step": 7670, "epoch": 182} {"train_loss": -4.967710971832275, "global_step": 7671, "epoch": 182} {"train_loss": -4.973134994506836, "global_step": 7672, "epoch": 182} {"train_loss": -4.868350505828857, "global_step": 7673, "epoch": 182} {"train_loss": -4.951119422912598, "global_step": 7674, "epoch": 182} {"train_loss": -4.938176155090332, "global_step": 7675, "epoch": 182} {"train_loss": -4.961108207702637, "global_step": 7676, "epoch": 182} {"train_loss": -4.730134010314941, "global_step": 7677, "epoch": 182} {"train_loss": -4.896947860717773, "global_step": 7678, "epoch": 182} {"train_loss": -4.90254020690918, "global_step": 7679, "epoch": 182} {"train_loss": -4.851691246032715, "global_step": 7680, "epoch": 182} {"train_loss": -4.909351825714111, "global_step": 7681, "epoch": 182} {"train_loss": -4.83317232131958, "global_step": 7682, "epoch": 182} {"train_loss": -4.962584495544434, "global_step": 7683, "epoch": 182} {"train_loss": -4.839850425720215, "global_step": 7684, "epoch": 182} {"train_loss": -4.88162864957537, "global_step": 7685, "epoch": 182, "val_loss": 85117.375} {"train_loss": -4.948622703552246, "global_step": 7686, "epoch": 183} {"train_loss": -5.036555767059326, "global_step": 7687, "epoch": 183} {"train_loss": -4.8472819328308105, "global_step": 7688, "epoch": 183} {"train_loss": -4.902413368225098, "global_step": 7689, "epoch": 183} {"train_loss": -4.835846424102783, "global_step": 7690, "epoch": 183} {"train_loss": -4.873950004577637, "global_step": 7691, "epoch": 183} {"train_loss": -4.948177337646484, "global_step": 7692, "epoch": 183} {"train_loss": -4.947244644165039, "global_step": 7693, "epoch": 183} {"train_loss": -4.939021587371826, "global_step": 7694, "epoch": 183} {"train_loss": -4.889297008514404, "global_step": 7695, "epoch": 183} {"train_loss": -5.1034674644470215, "global_step": 7696, "epoch": 183} {"train_loss": -5.039377212524414, "global_step": 7697, "epoch": 183} {"train_loss": -4.881853103637695, "global_step": 7698, "epoch": 183} {"train_loss": -4.97506046295166, "global_step": 7699, "epoch": 183} {"train_loss": -4.991668224334717, "global_step": 7700, "epoch": 183} {"train_loss": -4.938908100128174, "global_step": 7701, "epoch": 183} {"train_loss": -4.930575847625732, "global_step": 7702, "epoch": 183} {"train_loss": -4.877898693084717, "global_step": 7703, "epoch": 183} {"train_loss": -4.911059379577637, "global_step": 7704, "epoch": 183} {"train_loss": -4.900137901306152, "global_step": 7705, "epoch": 183} {"train_loss": -4.970396518707275, "global_step": 7706, "epoch": 183} {"train_loss": -4.822771072387695, "global_step": 7707, "epoch": 183} {"train_loss": -4.888901710510254, "global_step": 7708, "epoch": 183} {"train_loss": -4.96600341796875, "global_step": 7709, "epoch": 183} {"train_loss": -4.8378801345825195, "global_step": 7710, "epoch": 183} {"train_loss": -4.879665851593018, "global_step": 7711, "epoch": 183} {"train_loss": -5.07097053527832, "global_step": 7712, "epoch": 183} {"train_loss": -4.948940277099609, "global_step": 7713, "epoch": 183} {"train_loss": -4.923790454864502, "global_step": 7714, "epoch": 183} {"train_loss": -5.025918006896973, "global_step": 7715, "epoch": 183} {"train_loss": -4.872882843017578, "global_step": 7716, "epoch": 183} {"train_loss": -4.97218132019043, "global_step": 7717, "epoch": 183} {"train_loss": -5.015202522277832, "global_step": 7718, "epoch": 183} {"train_loss": -4.881711959838867, "global_step": 7719, "epoch": 183} {"train_loss": -4.841897010803223, "global_step": 7720, "epoch": 183} {"train_loss": -4.886164665222168, "global_step": 7721, "epoch": 183} {"train_loss": -4.8086042404174805, "global_step": 7722, "epoch": 183} {"train_loss": -5.071977615356445, "global_step": 7723, "epoch": 183} {"train_loss": -5.04773473739624, "global_step": 7724, "epoch": 183} {"train_loss": -4.822508811950684, "global_step": 7725, "epoch": 183} {"train_loss": -4.873538017272949, "global_step": 7726, "epoch": 183} {"train_loss": -4.931205999283564, "global_step": 7727, "epoch": 183, "val_loss": 87968.5625} {"train_loss": -4.384183406829834, "global_step": 7728, "epoch": 184} {"train_loss": -4.788002967834473, "global_step": 7729, "epoch": 184} {"train_loss": -4.86020565032959, "global_step": 7730, "epoch": 184} {"train_loss": -4.749285697937012, "global_step": 7731, "epoch": 184} {"train_loss": -4.79421854019165, "global_step": 7732, "epoch": 184} {"train_loss": -4.939826965332031, "global_step": 7733, "epoch": 184} {"train_loss": -4.60773229598999, "global_step": 7734, "epoch": 184} {"train_loss": -4.865131855010986, "global_step": 7735, "epoch": 184} {"train_loss": -4.895777702331543, "global_step": 7736, "epoch": 184} {"train_loss": -5.018430709838867, "global_step": 7737, "epoch": 184} {"train_loss": -4.934928894042969, "global_step": 7738, "epoch": 184} {"train_loss": -4.940868854522705, "global_step": 7739, "epoch": 184} {"train_loss": -4.785299777984619, "global_step": 7740, "epoch": 184} {"train_loss": -5.018537521362305, "global_step": 7741, "epoch": 184} {"train_loss": -5.023622035980225, "global_step": 7742, "epoch": 184} {"train_loss": -5.001893997192383, "global_step": 7743, "epoch": 184} {"train_loss": -4.874180793762207, "global_step": 7744, "epoch": 184} {"train_loss": -5.044438362121582, "global_step": 7745, "epoch": 184} {"train_loss": -4.990574836730957, "global_step": 7746, "epoch": 184} {"train_loss": -4.897329807281494, "global_step": 7747, "epoch": 184} {"train_loss": -4.975374221801758, "global_step": 7748, "epoch": 184} {"train_loss": -5.001715183258057, "global_step": 7749, "epoch": 184} {"train_loss": -5.043795585632324, "global_step": 7750, "epoch": 184} {"train_loss": -4.860262870788574, "global_step": 7751, "epoch": 184} {"train_loss": -4.886889457702637, "global_step": 7752, "epoch": 184} {"train_loss": -4.990582466125488, "global_step": 7753, "epoch": 184} {"train_loss": -4.8810954093933105, "global_step": 7754, "epoch": 184} {"train_loss": -5.042179107666016, "global_step": 7755, "epoch": 184} {"train_loss": -4.902735710144043, "global_step": 7756, "epoch": 184} {"train_loss": -4.960858345031738, "global_step": 7757, "epoch": 184} {"train_loss": -4.8813018798828125, "global_step": 7758, "epoch": 184} {"train_loss": -4.931751251220703, "global_step": 7759, "epoch": 184} {"train_loss": -4.998896598815918, "global_step": 7760, "epoch": 184} {"train_loss": -5.115029335021973, "global_step": 7761, "epoch": 184} {"train_loss": -4.987748146057129, "global_step": 7762, "epoch": 184} {"train_loss": -4.845287799835205, "global_step": 7763, "epoch": 184} {"train_loss": -5.082889556884766, "global_step": 7764, "epoch": 184} {"train_loss": -4.978696823120117, "global_step": 7765, "epoch": 184} {"train_loss": -5.060501575469971, "global_step": 7766, "epoch": 184} {"train_loss": -4.875592231750488, "global_step": 7767, "epoch": 184} {"train_loss": -4.945202827453613, "global_step": 7768, "epoch": 184} {"train_loss": -4.917664868491037, "global_step": 7769, "epoch": 184, "val_loss": 83552.8359375} {"train_loss": -5.098567962646484, "global_step": 7770, "epoch": 185} {"train_loss": -4.942367076873779, "global_step": 7771, "epoch": 185} {"train_loss": -4.977323055267334, "global_step": 7772, "epoch": 185} {"train_loss": -4.926947116851807, "global_step": 7773, "epoch": 185} {"train_loss": -4.795355796813965, "global_step": 7774, "epoch": 185} {"train_loss": -4.632946968078613, "global_step": 7775, "epoch": 185} {"train_loss": -4.84242057800293, "global_step": 7776, "epoch": 185} {"train_loss": -4.615747451782227, "global_step": 7777, "epoch": 185} {"train_loss": -4.908443450927734, "global_step": 7778, "epoch": 185} {"train_loss": -4.900294303894043, "global_step": 7779, "epoch": 185} {"train_loss": -4.796210289001465, "global_step": 7780, "epoch": 185} {"train_loss": -5.036823272705078, "global_step": 7781, "epoch": 185} {"train_loss": -4.833474636077881, "global_step": 7782, "epoch": 185} {"train_loss": -4.895120620727539, "global_step": 7783, "epoch": 185} {"train_loss": -4.902286529541016, "global_step": 7784, "epoch": 185} {"train_loss": -4.797895908355713, "global_step": 7785, "epoch": 185} {"train_loss": -4.776437759399414, "global_step": 7786, "epoch": 185} {"train_loss": -4.665807723999023, "global_step": 7787, "epoch": 185} {"train_loss": -4.9356794357299805, "global_step": 7788, "epoch": 185} {"train_loss": -4.714576244354248, "global_step": 7789, "epoch": 185} {"train_loss": -4.845200538635254, "global_step": 7790, "epoch": 185} {"train_loss": -4.989326477050781, "global_step": 7791, "epoch": 185} {"train_loss": -4.713872909545898, "global_step": 7792, "epoch": 185} {"train_loss": -5.027347564697266, "global_step": 7793, "epoch": 185} {"train_loss": -4.737452030181885, "global_step": 7794, "epoch": 185} {"train_loss": -4.888637542724609, "global_step": 7795, "epoch": 185} {"train_loss": -4.755624771118164, "global_step": 7796, "epoch": 185} {"train_loss": -4.824102401733398, "global_step": 7797, "epoch": 185} {"train_loss": -4.872824668884277, "global_step": 7798, "epoch": 185} {"train_loss": -4.866844654083252, "global_step": 7799, "epoch": 185} {"train_loss": -4.775895118713379, "global_step": 7800, "epoch": 185} {"train_loss": -4.916936874389648, "global_step": 7801, "epoch": 185} {"train_loss": -4.973929405212402, "global_step": 7802, "epoch": 185} {"train_loss": -5.012358665466309, "global_step": 7803, "epoch": 185} {"train_loss": -4.989129543304443, "global_step": 7804, "epoch": 185} {"train_loss": -4.949100971221924, "global_step": 7805, "epoch": 185} {"train_loss": -5.005462646484375, "global_step": 7806, "epoch": 185} {"train_loss": -4.807682514190674, "global_step": 7807, "epoch": 185} {"train_loss": -4.909671783447266, "global_step": 7808, "epoch": 185} {"train_loss": -4.890303134918213, "global_step": 7809, "epoch": 185} {"train_loss": -4.912199020385742, "global_step": 7810, "epoch": 185} {"train_loss": -4.870089916955857, "global_step": 7811, "epoch": 185, "val_loss": 84556.7734375} {"train_loss": -4.91815710067749, "global_step": 7812, "epoch": 186} {"train_loss": -4.981656074523926, "global_step": 7813, "epoch": 186} {"train_loss": -4.739011764526367, "global_step": 7814, "epoch": 186} {"train_loss": -4.89376974105835, "global_step": 7815, "epoch": 186} {"train_loss": -4.986507415771484, "global_step": 7816, "epoch": 186} {"train_loss": -5.028549671173096, "global_step": 7817, "epoch": 186} {"train_loss": -4.683859348297119, "global_step": 7818, "epoch": 186} {"train_loss": -5.012251853942871, "global_step": 7819, "epoch": 186} {"train_loss": -4.7976603507995605, "global_step": 7820, "epoch": 186} {"train_loss": -4.366761207580566, "global_step": 7821, "epoch": 186} {"train_loss": -4.951049327850342, "global_step": 7822, "epoch": 186} {"train_loss": -4.597307205200195, "global_step": 7823, "epoch": 186} {"train_loss": -4.670665264129639, "global_step": 7824, "epoch": 186} {"train_loss": -4.922661304473877, "global_step": 7825, "epoch": 186} {"train_loss": -4.614812850952148, "global_step": 7826, "epoch": 186} {"train_loss": -4.933797836303711, "global_step": 7827, "epoch": 186} {"train_loss": -4.80851936340332, "global_step": 7828, "epoch": 186} {"train_loss": -4.807376861572266, "global_step": 7829, "epoch": 186} {"train_loss": -4.74272346496582, "global_step": 7830, "epoch": 186} {"train_loss": -4.921363353729248, "global_step": 7831, "epoch": 186} {"train_loss": -4.860857963562012, "global_step": 7832, "epoch": 186} {"train_loss": -5.088901519775391, "global_step": 7833, "epoch": 186} {"train_loss": -4.850724220275879, "global_step": 7834, "epoch": 186} {"train_loss": -4.954697608947754, "global_step": 7835, "epoch": 186} {"train_loss": -4.689525604248047, "global_step": 7836, "epoch": 186} {"train_loss": -4.876391410827637, "global_step": 7837, "epoch": 186} {"train_loss": -4.78535270690918, "global_step": 7838, "epoch": 186} {"train_loss": -4.828639507293701, "global_step": 7839, "epoch": 186} {"train_loss": -4.8470916748046875, "global_step": 7840, "epoch": 186} {"train_loss": -4.951037883758545, "global_step": 7841, "epoch": 186} {"train_loss": -4.906799793243408, "global_step": 7842, "epoch": 186} {"train_loss": -4.927946090698242, "global_step": 7843, "epoch": 186} {"train_loss": -4.92226505279541, "global_step": 7844, "epoch": 186} {"train_loss": -4.961331367492676, "global_step": 7845, "epoch": 186} {"train_loss": -4.989129066467285, "global_step": 7846, "epoch": 186} {"train_loss": -5.008392333984375, "global_step": 7847, "epoch": 186} {"train_loss": -4.967955589294434, "global_step": 7848, "epoch": 186} {"train_loss": -4.902704238891602, "global_step": 7849, "epoch": 186} {"train_loss": -4.836146354675293, "global_step": 7850, "epoch": 186} {"train_loss": -4.9467668533325195, "global_step": 7851, "epoch": 186} {"train_loss": -4.895675182342529, "global_step": 7852, "epoch": 186} {"train_loss": -4.864896853764852, "global_step": 7853, "epoch": 186, "val_loss": 83815.859375} {"train_loss": -4.866809844970703, "global_step": 7854, "epoch": 187} {"train_loss": -4.856881618499756, "global_step": 7855, "epoch": 187} {"train_loss": -4.996307373046875, "global_step": 7856, "epoch": 187} {"train_loss": -4.9502153396606445, "global_step": 7857, "epoch": 187} {"train_loss": -4.878761291503906, "global_step": 7858, "epoch": 187} {"train_loss": -4.889714241027832, "global_step": 7859, "epoch": 187} {"train_loss": -4.954069137573242, "global_step": 7860, "epoch": 187} {"train_loss": -4.767681121826172, "global_step": 7861, "epoch": 187} {"train_loss": -4.878386497497559, "global_step": 7862, "epoch": 187} {"train_loss": -4.9157915115356445, "global_step": 7863, "epoch": 187} {"train_loss": -4.802078723907471, "global_step": 7864, "epoch": 187} {"train_loss": -4.912527084350586, "global_step": 7865, "epoch": 187} {"train_loss": -5.029969692230225, "global_step": 7866, "epoch": 187} {"train_loss": -4.8923821449279785, "global_step": 7867, "epoch": 187} {"train_loss": -4.819143295288086, "global_step": 7868, "epoch": 187} {"train_loss": -4.833904266357422, "global_step": 7869, "epoch": 187} {"train_loss": -4.952032089233398, "global_step": 7870, "epoch": 187} {"train_loss": -4.8764801025390625, "global_step": 7871, "epoch": 187} {"train_loss": -4.8921403884887695, "global_step": 7872, "epoch": 187} {"train_loss": -4.95277214050293, "global_step": 7873, "epoch": 187} {"train_loss": -4.88950777053833, "global_step": 7874, "epoch": 187} {"train_loss": -4.849023342132568, "global_step": 7875, "epoch": 187} {"train_loss": -4.956268310546875, "global_step": 7876, "epoch": 187} {"train_loss": -4.857455253601074, "global_step": 7877, "epoch": 187} {"train_loss": -4.908023357391357, "global_step": 7878, "epoch": 187} {"train_loss": -4.997036457061768, "global_step": 7879, "epoch": 187} {"train_loss": -4.904794216156006, "global_step": 7880, "epoch": 187} {"train_loss": -5.015067100524902, "global_step": 7881, "epoch": 187} {"train_loss": -5.108590126037598, "global_step": 7882, "epoch": 187} {"train_loss": -5.12508487701416, "global_step": 7883, "epoch": 187} {"train_loss": -4.940213203430176, "global_step": 7884, "epoch": 187} {"train_loss": -4.946725845336914, "global_step": 7885, "epoch": 187} {"train_loss": -5.193654537200928, "global_step": 7886, "epoch": 187} {"train_loss": -4.8972673416137695, "global_step": 7887, "epoch": 187} {"train_loss": -5.01688289642334, "global_step": 7888, "epoch": 187} {"train_loss": -5.084959983825684, "global_step": 7889, "epoch": 187} {"train_loss": -5.022330284118652, "global_step": 7890, "epoch": 187} {"train_loss": -4.948459625244141, "global_step": 7891, "epoch": 187} {"train_loss": -4.999936103820801, "global_step": 7892, "epoch": 187} {"train_loss": -4.949268817901611, "global_step": 7893, "epoch": 187} {"train_loss": -4.922100067138672, "global_step": 7894, "epoch": 187} {"train_loss": -4.941508985701061, "global_step": 7895, "epoch": 187, "val_loss": 82980.9921875} {"train_loss": -4.966135025024414, "global_step": 7896, "epoch": 188} {"train_loss": -4.857141017913818, "global_step": 7897, "epoch": 188} {"train_loss": -4.992809295654297, "global_step": 7898, "epoch": 188} {"train_loss": -5.072404861450195, "global_step": 7899, "epoch": 188} {"train_loss": -4.934317111968994, "global_step": 7900, "epoch": 188} {"train_loss": -5.0715742111206055, "global_step": 7901, "epoch": 188} {"train_loss": -4.925328254699707, "global_step": 7902, "epoch": 188} {"train_loss": -4.996359348297119, "global_step": 7903, "epoch": 188} {"train_loss": -4.853429317474365, "global_step": 7904, "epoch": 188} {"train_loss": -4.8177008628845215, "global_step": 7905, "epoch": 188} {"train_loss": -4.777780532836914, "global_step": 7906, "epoch": 188} {"train_loss": -4.920401096343994, "global_step": 7907, "epoch": 188} {"train_loss": -4.862627029418945, "global_step": 7908, "epoch": 188} {"train_loss": -4.803713798522949, "global_step": 7909, "epoch": 188} {"train_loss": -4.777698516845703, "global_step": 7910, "epoch": 188} {"train_loss": -4.938682556152344, "global_step": 7911, "epoch": 188} {"train_loss": -4.6928606033325195, "global_step": 7912, "epoch": 188} {"train_loss": -4.905149459838867, "global_step": 7913, "epoch": 188} {"train_loss": -4.812351226806641, "global_step": 7914, "epoch": 188} {"train_loss": -4.850505828857422, "global_step": 7915, "epoch": 188} {"train_loss": -4.853353500366211, "global_step": 7916, "epoch": 188} {"train_loss": -4.825248718261719, "global_step": 7917, "epoch": 188} {"train_loss": -4.795589447021484, "global_step": 7918, "epoch": 188} {"train_loss": -4.919057846069336, "global_step": 7919, "epoch": 188} {"train_loss": -4.927687644958496, "global_step": 7920, "epoch": 188} {"train_loss": -4.99163818359375, "global_step": 7921, "epoch": 188} {"train_loss": -4.95779275894165, "global_step": 7922, "epoch": 188} {"train_loss": -4.99329948425293, "global_step": 7923, "epoch": 188} {"train_loss": -4.9678473472595215, "global_step": 7924, "epoch": 188} {"train_loss": -4.902524948120117, "global_step": 7925, "epoch": 188} {"train_loss": -4.928935527801514, "global_step": 7926, "epoch": 188} {"train_loss": -5.029682159423828, "global_step": 7927, "epoch": 188} {"train_loss": -4.948532581329346, "global_step": 7928, "epoch": 188} {"train_loss": -4.787814140319824, "global_step": 7929, "epoch": 188} {"train_loss": -4.924896717071533, "global_step": 7930, "epoch": 188} {"train_loss": -4.877915382385254, "global_step": 7931, "epoch": 188} {"train_loss": -4.923649787902832, "global_step": 7932, "epoch": 188} {"train_loss": -4.930121898651123, "global_step": 7933, "epoch": 188} {"train_loss": -4.891848564147949, "global_step": 7934, "epoch": 188} {"train_loss": -5.00937557220459, "global_step": 7935, "epoch": 188} {"train_loss": -4.979852676391602, "global_step": 7936, "epoch": 188} {"train_loss": -4.913429793857393, "global_step": 7937, "epoch": 188, "val_loss": 84015.6640625} {"train_loss": -4.888835906982422, "global_step": 7938, "epoch": 189} {"train_loss": -5.082378387451172, "global_step": 7939, "epoch": 189} {"train_loss": -4.961404800415039, "global_step": 7940, "epoch": 189} {"train_loss": -4.935137748718262, "global_step": 7941, "epoch": 189} {"train_loss": -4.983572959899902, "global_step": 7942, "epoch": 189} {"train_loss": -4.787191867828369, "global_step": 7943, "epoch": 189} {"train_loss": -4.842621326446533, "global_step": 7944, "epoch": 189} {"train_loss": -4.992532253265381, "global_step": 7945, "epoch": 189} {"train_loss": -5.012534141540527, "global_step": 7946, "epoch": 189} {"train_loss": -4.942858695983887, "global_step": 7947, "epoch": 189} {"train_loss": -5.026666164398193, "global_step": 7948, "epoch": 189} {"train_loss": -5.047538757324219, "global_step": 7949, "epoch": 189} {"train_loss": -4.822820663452148, "global_step": 7950, "epoch": 189} {"train_loss": -4.94257926940918, "global_step": 7951, "epoch": 189} {"train_loss": -5.130188941955566, "global_step": 7952, "epoch": 189} {"train_loss": -4.813553333282471, "global_step": 7953, "epoch": 189} {"train_loss": -5.048006057739258, "global_step": 7954, "epoch": 189} {"train_loss": -4.950963973999023, "global_step": 7955, "epoch": 189} {"train_loss": -4.916460990905762, "global_step": 7956, "epoch": 189} {"train_loss": -5.032825469970703, "global_step": 7957, "epoch": 189} {"train_loss": -4.999595642089844, "global_step": 7958, "epoch": 189} {"train_loss": -4.87545108795166, "global_step": 7959, "epoch": 189} {"train_loss": -4.905574321746826, "global_step": 7960, "epoch": 189} {"train_loss": -4.900264739990234, "global_step": 7961, "epoch": 189} {"train_loss": -4.697834014892578, "global_step": 7962, "epoch": 189} {"train_loss": -4.865960121154785, "global_step": 7963, "epoch": 189} {"train_loss": -5.030899524688721, "global_step": 7964, "epoch": 189} {"train_loss": -4.9776153564453125, "global_step": 7965, "epoch": 189} {"train_loss": -4.965143203735352, "global_step": 7966, "epoch": 189} {"train_loss": -4.870963096618652, "global_step": 7967, "epoch": 189} {"train_loss": -4.95713996887207, "global_step": 7968, "epoch": 189} {"train_loss": -4.900354385375977, "global_step": 7969, "epoch": 189} {"train_loss": -5.0015411376953125, "global_step": 7970, "epoch": 189} {"train_loss": -4.824897289276123, "global_step": 7971, "epoch": 189} {"train_loss": -4.998614311218262, "global_step": 7972, "epoch": 189} {"train_loss": -5.005838394165039, "global_step": 7973, "epoch": 189} {"train_loss": -4.849508285522461, "global_step": 7974, "epoch": 189} {"train_loss": -4.869212627410889, "global_step": 7975, "epoch": 189} {"train_loss": -4.84999942779541, "global_step": 7976, "epoch": 189} {"train_loss": -4.98574161529541, "global_step": 7977, "epoch": 189} {"train_loss": -5.023419380187988, "global_step": 7978, "epoch": 189} {"train_loss": -4.940859102067494, "global_step": 7979, "epoch": 189, "val_loss": 83527.5859375} {"train_loss": -4.9881744384765625, "global_step": 7980, "epoch": 190} {"train_loss": -4.8778862953186035, "global_step": 7981, "epoch": 190} {"train_loss": -4.910627365112305, "global_step": 7982, "epoch": 190} {"train_loss": -5.017266273498535, "global_step": 7983, "epoch": 190} {"train_loss": -4.931537628173828, "global_step": 7984, "epoch": 190} {"train_loss": -4.9277801513671875, "global_step": 7985, "epoch": 190} {"train_loss": -5.083391189575195, "global_step": 7986, "epoch": 190} {"train_loss": -5.053027629852295, "global_step": 7987, "epoch": 190} {"train_loss": -5.020393371582031, "global_step": 7988, "epoch": 190} {"train_loss": -4.999418258666992, "global_step": 7989, "epoch": 190} {"train_loss": -5.020152568817139, "global_step": 7990, "epoch": 190} {"train_loss": -5.03994083404541, "global_step": 7991, "epoch": 190} {"train_loss": -5.07282829284668, "global_step": 7992, "epoch": 190} {"train_loss": -4.95681095123291, "global_step": 7993, "epoch": 190} {"train_loss": -4.7528228759765625, "global_step": 7994, "epoch": 190} {"train_loss": -4.8309125900268555, "global_step": 7995, "epoch": 190} {"train_loss": -4.882652282714844, "global_step": 7996, "epoch": 190} {"train_loss": -4.957763671875, "global_step": 7997, "epoch": 190} {"train_loss": -4.664149761199951, "global_step": 7998, "epoch": 190} {"train_loss": -4.935574531555176, "global_step": 7999, "epoch": 190} {"train_loss": -5.049676418304443, "global_step": 8000, "epoch": 190} {"train_loss": -4.885527610778809, "global_step": 8001, "epoch": 190} {"train_loss": -4.763114929199219, "global_step": 8002, "epoch": 190} {"train_loss": -4.922086715698242, "global_step": 8003, "epoch": 190} {"train_loss": -4.76836633682251, "global_step": 8004, "epoch": 190} {"train_loss": -4.905768871307373, "global_step": 8005, "epoch": 190} {"train_loss": -4.909524917602539, "global_step": 8006, "epoch": 190} {"train_loss": -4.957463264465332, "global_step": 8007, "epoch": 190} {"train_loss": -5.064647197723389, "global_step": 8008, "epoch": 190} {"train_loss": -4.783517360687256, "global_step": 8009, "epoch": 190} {"train_loss": -4.798905372619629, "global_step": 8010, "epoch": 190} {"train_loss": -4.832998275756836, "global_step": 8011, "epoch": 190} {"train_loss": -4.951952934265137, "global_step": 8012, "epoch": 190} {"train_loss": -5.037274360656738, "global_step": 8013, "epoch": 190} {"train_loss": -4.71826696395874, "global_step": 8014, "epoch": 190} {"train_loss": -4.975930213928223, "global_step": 8015, "epoch": 190} {"train_loss": -4.750302791595459, "global_step": 8016, "epoch": 190} {"train_loss": -4.766080856323242, "global_step": 8017, "epoch": 190} {"train_loss": -4.986368179321289, "global_step": 8018, "epoch": 190} {"train_loss": -4.769110679626465, "global_step": 8019, "epoch": 190} {"train_loss": -5.100639343261719, "global_step": 8020, "epoch": 190} {"train_loss": -4.918428682145619, "global_step": 8021, "epoch": 190, "val_loss": 84265.4921875} {"train_loss": -4.931900978088379, "global_step": 8022, "epoch": 191} {"train_loss": -4.877620220184326, "global_step": 8023, "epoch": 191} {"train_loss": -4.578370094299316, "global_step": 8024, "epoch": 191} {"train_loss": -4.850655555725098, "global_step": 8025, "epoch": 191} {"train_loss": -4.758517742156982, "global_step": 8026, "epoch": 191} {"train_loss": -4.737971305847168, "global_step": 8027, "epoch": 191} {"train_loss": -4.733097076416016, "global_step": 8028, "epoch": 191} {"train_loss": -4.905365943908691, "global_step": 8029, "epoch": 191} {"train_loss": -4.568428039550781, "global_step": 8030, "epoch": 191} {"train_loss": -4.840987205505371, "global_step": 8031, "epoch": 191} {"train_loss": -4.846973896026611, "global_step": 8032, "epoch": 191} {"train_loss": -4.945895671844482, "global_step": 8033, "epoch": 191} {"train_loss": -4.776976585388184, "global_step": 8034, "epoch": 191} {"train_loss": -4.913266181945801, "global_step": 8035, "epoch": 191} {"train_loss": -4.715192794799805, "global_step": 8036, "epoch": 191} {"train_loss": -4.843410015106201, "global_step": 8037, "epoch": 191} {"train_loss": -4.830719947814941, "global_step": 8038, "epoch": 191} {"train_loss": -4.806488037109375, "global_step": 8039, "epoch": 191} {"train_loss": -4.914071083068848, "global_step": 8040, "epoch": 191} {"train_loss": -4.91317892074585, "global_step": 8041, "epoch": 191} {"train_loss": -4.907153129577637, "global_step": 8042, "epoch": 191} {"train_loss": -5.048601150512695, "global_step": 8043, "epoch": 191} {"train_loss": -5.06752347946167, "global_step": 8044, "epoch": 191} {"train_loss": -4.972929000854492, "global_step": 8045, "epoch": 191} {"train_loss": -4.9451446533203125, "global_step": 8046, "epoch": 191} {"train_loss": -5.159295558929443, "global_step": 8047, "epoch": 191} {"train_loss": -4.99666690826416, "global_step": 8048, "epoch": 191} {"train_loss": -4.967832565307617, "global_step": 8049, "epoch": 191} {"train_loss": -4.9640607833862305, "global_step": 8050, "epoch": 191} {"train_loss": -4.9375505447387695, "global_step": 8051, "epoch": 191} {"train_loss": -4.9987335205078125, "global_step": 8052, "epoch": 191} {"train_loss": -4.993666172027588, "global_step": 8053, "epoch": 191} {"train_loss": -4.961938858032227, "global_step": 8054, "epoch": 191} {"train_loss": -4.969259262084961, "global_step": 8055, "epoch": 191} {"train_loss": -4.93051815032959, "global_step": 8056, "epoch": 191} {"train_loss": -5.058746814727783, "global_step": 8057, "epoch": 191} {"train_loss": -4.934525966644287, "global_step": 8058, "epoch": 191} {"train_loss": -4.909207344055176, "global_step": 8059, "epoch": 191} {"train_loss": -4.998113632202148, "global_step": 8060, "epoch": 191} {"train_loss": -4.801136493682861, "global_step": 8061, "epoch": 191} {"train_loss": -4.932020664215088, "global_step": 8062, "epoch": 191} {"train_loss": -4.898835886092413, "global_step": 8063, "epoch": 191, "val_loss": 84686.4921875} {"train_loss": -4.7635931968688965, "global_step": 8064, "epoch": 192} {"train_loss": -4.872808456420898, "global_step": 8065, "epoch": 192} {"train_loss": -4.785482406616211, "global_step": 8066, "epoch": 192} {"train_loss": -4.8006744384765625, "global_step": 8067, "epoch": 192} {"train_loss": -5.000866889953613, "global_step": 8068, "epoch": 192} {"train_loss": -4.782687187194824, "global_step": 8069, "epoch": 192} {"train_loss": -4.870221138000488, "global_step": 8070, "epoch": 192} {"train_loss": -4.818341255187988, "global_step": 8071, "epoch": 192} {"train_loss": -4.761204719543457, "global_step": 8072, "epoch": 192} {"train_loss": -4.617623805999756, "global_step": 8073, "epoch": 192} {"train_loss": -4.622059345245361, "global_step": 8074, "epoch": 192} {"train_loss": -4.661947250366211, "global_step": 8075, "epoch": 192} {"train_loss": -4.728843688964844, "global_step": 8076, "epoch": 192} {"train_loss": -4.661250114440918, "global_step": 8077, "epoch": 192} {"train_loss": -4.863027572631836, "global_step": 8078, "epoch": 192} {"train_loss": -4.707690238952637, "global_step": 8079, "epoch": 192} {"train_loss": -4.756200313568115, "global_step": 8080, "epoch": 192} {"train_loss": -4.844766616821289, "global_step": 8081, "epoch": 192} {"train_loss": -4.831221580505371, "global_step": 8082, "epoch": 192} {"train_loss": -4.905694007873535, "global_step": 8083, "epoch": 192} {"train_loss": -4.837259292602539, "global_step": 8084, "epoch": 192} {"train_loss": -4.816141128540039, "global_step": 8085, "epoch": 192} {"train_loss": -4.960007190704346, "global_step": 8086, "epoch": 192} {"train_loss": -4.822181701660156, "global_step": 8087, "epoch": 192} {"train_loss": -4.9587531089782715, "global_step": 8088, "epoch": 192} {"train_loss": -5.004187107086182, "global_step": 8089, "epoch": 192} {"train_loss": -4.9513750076293945, "global_step": 8090, "epoch": 192} {"train_loss": -4.8559675216674805, "global_step": 8091, "epoch": 192} {"train_loss": -5.000378608703613, "global_step": 8092, "epoch": 192} {"train_loss": -5.012426853179932, "global_step": 8093, "epoch": 192} {"train_loss": -4.848211288452148, "global_step": 8094, "epoch": 192} {"train_loss": -4.971644401550293, "global_step": 8095, "epoch": 192} {"train_loss": -4.9159135818481445, "global_step": 8096, "epoch": 192} {"train_loss": -5.027143478393555, "global_step": 8097, "epoch": 192} {"train_loss": -4.865455627441406, "global_step": 8098, "epoch": 192} {"train_loss": -5.050497055053711, "global_step": 8099, "epoch": 192} {"train_loss": -4.982132911682129, "global_step": 8100, "epoch": 192} {"train_loss": -4.944169998168945, "global_step": 8101, "epoch": 192} {"train_loss": -4.99111270904541, "global_step": 8102, "epoch": 192} {"train_loss": -5.015161514282227, "global_step": 8103, "epoch": 192} {"train_loss": -4.961790084838867, "global_step": 8104, "epoch": 192} {"train_loss": -4.869085209710257, "global_step": 8105, "epoch": 192, "val_loss": 83668.3359375} {"train_loss": -5.0720720291137695, "global_step": 8106, "epoch": 193} {"train_loss": -4.991524696350098, "global_step": 8107, "epoch": 193} {"train_loss": -4.9037604331970215, "global_step": 8108, "epoch": 193} {"train_loss": -5.016419410705566, "global_step": 8109, "epoch": 193} {"train_loss": -4.783178329467773, "global_step": 8110, "epoch": 193} {"train_loss": -4.892385005950928, "global_step": 8111, "epoch": 193} {"train_loss": -5.112727165222168, "global_step": 8112, "epoch": 193} {"train_loss": -5.007296562194824, "global_step": 8113, "epoch": 193} {"train_loss": -5.006350040435791, "global_step": 8114, "epoch": 193} {"train_loss": -4.933196067810059, "global_step": 8115, "epoch": 193} {"train_loss": -4.963048934936523, "global_step": 8116, "epoch": 193} {"train_loss": -5.021759510040283, "global_step": 8117, "epoch": 193} {"train_loss": -4.979997634887695, "global_step": 8118, "epoch": 193} {"train_loss": -4.839340686798096, "global_step": 8119, "epoch": 193} {"train_loss": -4.934971809387207, "global_step": 8120, "epoch": 193} {"train_loss": -5.0706610679626465, "global_step": 8121, "epoch": 193} {"train_loss": -5.042391777038574, "global_step": 8122, "epoch": 193} {"train_loss": -4.90360689163208, "global_step": 8123, "epoch": 193} {"train_loss": -4.952181816101074, "global_step": 8124, "epoch": 193} {"train_loss": -4.837800025939941, "global_step": 8125, "epoch": 193} {"train_loss": -4.994078636169434, "global_step": 8126, "epoch": 193} {"train_loss": -4.826074600219727, "global_step": 8127, "epoch": 193} {"train_loss": -4.953690528869629, "global_step": 8128, "epoch": 193} {"train_loss": -5.021523475646973, "global_step": 8129, "epoch": 193} {"train_loss": -5.0308380126953125, "global_step": 8130, "epoch": 193} {"train_loss": -5.051412105560303, "global_step": 8131, "epoch": 193} {"train_loss": -4.908723831176758, "global_step": 8132, "epoch": 193} {"train_loss": -4.988466739654541, "global_step": 8133, "epoch": 193} {"train_loss": -4.901273250579834, "global_step": 8134, "epoch": 193} {"train_loss": -4.919425964355469, "global_step": 8135, "epoch": 193} {"train_loss": -5.034233093261719, "global_step": 8136, "epoch": 193} {"train_loss": -5.003961563110352, "global_step": 8137, "epoch": 193} {"train_loss": -5.050544738769531, "global_step": 8138, "epoch": 193} {"train_loss": -5.123755931854248, "global_step": 8139, "epoch": 193} {"train_loss": -4.965279579162598, "global_step": 8140, "epoch": 193} {"train_loss": -4.866081237792969, "global_step": 8141, "epoch": 193} {"train_loss": -4.752590656280518, "global_step": 8142, "epoch": 193} {"train_loss": -4.833390235900879, "global_step": 8143, "epoch": 193} {"train_loss": -4.934687614440918, "global_step": 8144, "epoch": 193} {"train_loss": -5.003811836242676, "global_step": 8145, "epoch": 193} {"train_loss": -4.864918231964111, "global_step": 8146, "epoch": 193} {"train_loss": -4.955126319612775, "global_step": 8147, "epoch": 193, "val_loss": 85678.015625} {"train_loss": -4.7264909744262695, "global_step": 8148, "epoch": 194} {"train_loss": -4.873488903045654, "global_step": 8149, "epoch": 194} {"train_loss": -4.904849052429199, "global_step": 8150, "epoch": 194} {"train_loss": -4.465289115905762, "global_step": 8151, "epoch": 194} {"train_loss": -4.805914402008057, "global_step": 8152, "epoch": 194} {"train_loss": -4.533404350280762, "global_step": 8153, "epoch": 194} {"train_loss": -4.447239875793457, "global_step": 8154, "epoch": 194} {"train_loss": -4.792176246643066, "global_step": 8155, "epoch": 194} {"train_loss": -4.7761688232421875, "global_step": 8156, "epoch": 194} {"train_loss": -4.796045780181885, "global_step": 8157, "epoch": 194} {"train_loss": -4.921850204467773, "global_step": 8158, "epoch": 194} {"train_loss": -4.904404640197754, "global_step": 8159, "epoch": 194} {"train_loss": -4.8755269050598145, "global_step": 8160, "epoch": 194} {"train_loss": -4.853483200073242, "global_step": 8161, "epoch": 194} {"train_loss": -4.976393699645996, "global_step": 8162, "epoch": 194} {"train_loss": -4.979506969451904, "global_step": 8163, "epoch": 194} {"train_loss": -4.884245872497559, "global_step": 8164, "epoch": 194} {"train_loss": -4.923500061035156, "global_step": 8165, "epoch": 194} {"train_loss": -4.872542381286621, "global_step": 8166, "epoch": 194} {"train_loss": -4.942743301391602, "global_step": 8167, "epoch": 194} {"train_loss": -4.906560897827148, "global_step": 8168, "epoch": 194} {"train_loss": -4.974373817443848, "global_step": 8169, "epoch": 194} {"train_loss": -4.978857040405273, "global_step": 8170, "epoch": 194} {"train_loss": -4.95482873916626, "global_step": 8171, "epoch": 194} {"train_loss": -5.038610458374023, "global_step": 8172, "epoch": 194} {"train_loss": -4.971220970153809, "global_step": 8173, "epoch": 194} {"train_loss": -4.9514055252075195, "global_step": 8174, "epoch": 194} {"train_loss": -4.929763317108154, "global_step": 8175, "epoch": 194} {"train_loss": -4.801799774169922, "global_step": 8176, "epoch": 194} {"train_loss": -5.047344207763672, "global_step": 8177, "epoch": 194} {"train_loss": -4.836310386657715, "global_step": 8178, "epoch": 194} {"train_loss": -4.937753200531006, "global_step": 8179, "epoch": 194} {"train_loss": -4.918177604675293, "global_step": 8180, "epoch": 194} {"train_loss": -5.013585090637207, "global_step": 8181, "epoch": 194} {"train_loss": -4.984561920166016, "global_step": 8182, "epoch": 194} {"train_loss": -4.926760196685791, "global_step": 8183, "epoch": 194} {"train_loss": -4.96236515045166, "global_step": 8184, "epoch": 194} {"train_loss": -4.9937357902526855, "global_step": 8185, "epoch": 194} {"train_loss": -4.909073829650879, "global_step": 8186, "epoch": 194} {"train_loss": -4.9588117599487305, "global_step": 8187, "epoch": 194} {"train_loss": -5.065116882324219, "global_step": 8188, "epoch": 194} {"train_loss": -4.887255714053199, "global_step": 8189, "epoch": 194, "val_loss": 84241.28125} {"train_loss": -4.812853813171387, "global_step": 8190, "epoch": 195} {"train_loss": -5.062656402587891, "global_step": 8191, "epoch": 195} {"train_loss": -4.935546875, "global_step": 8192, "epoch": 195} {"train_loss": -4.841871738433838, "global_step": 8193, "epoch": 195} {"train_loss": -4.804606914520264, "global_step": 8194, "epoch": 195} {"train_loss": -5.044502258300781, "global_step": 8195, "epoch": 195} {"train_loss": -4.821813583374023, "global_step": 8196, "epoch": 195} {"train_loss": -4.743721961975098, "global_step": 8197, "epoch": 195} {"train_loss": -4.820878982543945, "global_step": 8198, "epoch": 195} {"train_loss": -4.9087114334106445, "global_step": 8199, "epoch": 195} {"train_loss": -4.954607963562012, "global_step": 8200, "epoch": 195} {"train_loss": -4.962186813354492, "global_step": 8201, "epoch": 195} {"train_loss": -4.956256866455078, "global_step": 8202, "epoch": 195} {"train_loss": -4.8750319480896, "global_step": 8203, "epoch": 195} {"train_loss": -4.95387601852417, "global_step": 8204, "epoch": 195} {"train_loss": -4.967472076416016, "global_step": 8205, "epoch": 195} {"train_loss": -5.019697666168213, "global_step": 8206, "epoch": 195} {"train_loss": -4.939842700958252, "global_step": 8207, "epoch": 195} {"train_loss": -4.823042869567871, "global_step": 8208, "epoch": 195} {"train_loss": -4.987298488616943, "global_step": 8209, "epoch": 195} {"train_loss": -5.000060081481934, "global_step": 8210, "epoch": 195} {"train_loss": -4.9788408279418945, "global_step": 8211, "epoch": 195} {"train_loss": -4.963356971740723, "global_step": 8212, "epoch": 195} {"train_loss": -4.943083763122559, "global_step": 8213, "epoch": 195} {"train_loss": -4.912127494812012, "global_step": 8214, "epoch": 195} {"train_loss": -4.921958923339844, "global_step": 8215, "epoch": 195} {"train_loss": -4.809111595153809, "global_step": 8216, "epoch": 195} {"train_loss": -5.025909423828125, "global_step": 8217, "epoch": 195} {"train_loss": -4.910117149353027, "global_step": 8218, "epoch": 195} {"train_loss": -4.957278251647949, "global_step": 8219, "epoch": 195} {"train_loss": -5.035397052764893, "global_step": 8220, "epoch": 195} {"train_loss": -4.808568000793457, "global_step": 8221, "epoch": 195} {"train_loss": -4.9092302322387695, "global_step": 8222, "epoch": 195} {"train_loss": -4.926775932312012, "global_step": 8223, "epoch": 195} {"train_loss": -4.853894233703613, "global_step": 8224, "epoch": 195} {"train_loss": -4.900847911834717, "global_step": 8225, "epoch": 195} {"train_loss": -5.0688629150390625, "global_step": 8226, "epoch": 195} {"train_loss": -4.92202091217041, "global_step": 8227, "epoch": 195} {"train_loss": -4.893546104431152, "global_step": 8228, "epoch": 195} {"train_loss": -4.934161186218262, "global_step": 8229, "epoch": 195} {"train_loss": -4.778464317321777, "global_step": 8230, "epoch": 195} {"train_loss": -4.921331973302932, "global_step": 8231, "epoch": 195, "val_loss": 83030.5078125} {"train_loss": -4.915807247161865, "global_step": 8232, "epoch": 196} {"train_loss": -4.929361820220947, "global_step": 8233, "epoch": 196} {"train_loss": -4.963957786560059, "global_step": 8234, "epoch": 196} {"train_loss": -4.823154449462891, "global_step": 8235, "epoch": 196} {"train_loss": -4.880207538604736, "global_step": 8236, "epoch": 196} {"train_loss": -4.951938629150391, "global_step": 8237, "epoch": 196} {"train_loss": -4.972600936889648, "global_step": 8238, "epoch": 196} {"train_loss": -5.023883819580078, "global_step": 8239, "epoch": 196} {"train_loss": -4.945523262023926, "global_step": 8240, "epoch": 196} {"train_loss": -4.9101481437683105, "global_step": 8241, "epoch": 196} {"train_loss": -5.0936665534973145, "global_step": 8242, "epoch": 196} {"train_loss": -4.966359615325928, "global_step": 8243, "epoch": 196} {"train_loss": -4.954249382019043, "global_step": 8244, "epoch": 196} {"train_loss": -4.9945292472839355, "global_step": 8245, "epoch": 196} {"train_loss": -5.011924743652344, "global_step": 8246, "epoch": 196} {"train_loss": -4.884563446044922, "global_step": 8247, "epoch": 196} {"train_loss": -5.068317890167236, "global_step": 8248, "epoch": 196} {"train_loss": -5.029439926147461, "global_step": 8249, "epoch": 196} {"train_loss": -4.9451799392700195, "global_step": 8250, "epoch": 196} {"train_loss": -5.026144504547119, "global_step": 8251, "epoch": 196} {"train_loss": -5.033339023590088, "global_step": 8252, "epoch": 196} {"train_loss": -5.066737174987793, "global_step": 8253, "epoch": 196} {"train_loss": -5.019067287445068, "global_step": 8254, "epoch": 196} {"train_loss": -5.027777671813965, "global_step": 8255, "epoch": 196} {"train_loss": -5.055100440979004, "global_step": 8256, "epoch": 196} {"train_loss": -5.004262924194336, "global_step": 8257, "epoch": 196} {"train_loss": -4.932410717010498, "global_step": 8258, "epoch": 196} {"train_loss": -4.934727191925049, "global_step": 8259, "epoch": 196} {"train_loss": -5.0343217849731445, "global_step": 8260, "epoch": 196} {"train_loss": -5.064309120178223, "global_step": 8261, "epoch": 196} {"train_loss": -5.076946258544922, "global_step": 8262, "epoch": 196} {"train_loss": -5.057430267333984, "global_step": 8263, "epoch": 196} {"train_loss": -5.000189781188965, "global_step": 8264, "epoch": 196} {"train_loss": -4.931053638458252, "global_step": 8265, "epoch": 196} {"train_loss": -4.866225242614746, "global_step": 8266, "epoch": 196} {"train_loss": -4.984057903289795, "global_step": 8267, "epoch": 196} {"train_loss": -4.882045745849609, "global_step": 8268, "epoch": 196} {"train_loss": -4.917325973510742, "global_step": 8269, "epoch": 196} {"train_loss": -5.046418190002441, "global_step": 8270, "epoch": 196} {"train_loss": -4.879430770874023, "global_step": 8271, "epoch": 196} {"train_loss": -4.870632171630859, "global_step": 8272, "epoch": 196} {"train_loss": -4.974433331262498, "global_step": 8273, "epoch": 196, "val_loss": 82243.5546875} {"train_loss": -4.9988250732421875, "global_step": 8274, "epoch": 197} {"train_loss": -4.994860649108887, "global_step": 8275, "epoch": 197} {"train_loss": -4.827796936035156, "global_step": 8276, "epoch": 197} {"train_loss": -4.912807464599609, "global_step": 8277, "epoch": 197} {"train_loss": -5.049051284790039, "global_step": 8278, "epoch": 197} {"train_loss": -4.868706226348877, "global_step": 8279, "epoch": 197} {"train_loss": -4.8931708335876465, "global_step": 8280, "epoch": 197} {"train_loss": -4.930892467498779, "global_step": 8281, "epoch": 197} {"train_loss": -4.9178571701049805, "global_step": 8282, "epoch": 197} {"train_loss": -5.068103790283203, "global_step": 8283, "epoch": 197} {"train_loss": -4.972660064697266, "global_step": 8284, "epoch": 197} {"train_loss": -5.057981491088867, "global_step": 8285, "epoch": 197} {"train_loss": -5.0511369705200195, "global_step": 8286, "epoch": 197} {"train_loss": -4.960000991821289, "global_step": 8287, "epoch": 197} {"train_loss": -4.900010108947754, "global_step": 8288, "epoch": 197} {"train_loss": -4.930059432983398, "global_step": 8289, "epoch": 197} {"train_loss": -4.974777698516846, "global_step": 8290, "epoch": 197} {"train_loss": -4.816015243530273, "global_step": 8291, "epoch": 197} {"train_loss": -4.817146301269531, "global_step": 8292, "epoch": 197} {"train_loss": -4.991494655609131, "global_step": 8293, "epoch": 197} {"train_loss": -4.871307373046875, "global_step": 8294, "epoch": 197} {"train_loss": -4.9602203369140625, "global_step": 8295, "epoch": 197} {"train_loss": -4.969624042510986, "global_step": 8296, "epoch": 197} {"train_loss": -4.894126892089844, "global_step": 8297, "epoch": 197} {"train_loss": -5.121640205383301, "global_step": 8298, "epoch": 197} {"train_loss": -4.776817321777344, "global_step": 8299, "epoch": 197} {"train_loss": -4.727116584777832, "global_step": 8300, "epoch": 197} {"train_loss": -4.819528579711914, "global_step": 8301, "epoch": 197} {"train_loss": -4.782601356506348, "global_step": 8302, "epoch": 197} {"train_loss": -4.7679524421691895, "global_step": 8303, "epoch": 197} {"train_loss": -4.774220943450928, "global_step": 8304, "epoch": 197} {"train_loss": -4.848339080810547, "global_step": 8305, "epoch": 197} {"train_loss": -4.714414596557617, "global_step": 8306, "epoch": 197} {"train_loss": -4.525402069091797, "global_step": 8307, "epoch": 197} {"train_loss": -5.083588600158691, "global_step": 8308, "epoch": 197} {"train_loss": -4.708581447601318, "global_step": 8309, "epoch": 197} {"train_loss": -4.864569187164307, "global_step": 8310, "epoch": 197} {"train_loss": -4.820307731628418, "global_step": 8311, "epoch": 197} {"train_loss": -4.837063789367676, "global_step": 8312, "epoch": 197} {"train_loss": -5.132704257965088, "global_step": 8313, "epoch": 197} {"train_loss": -4.810162544250488, "global_step": 8314, "epoch": 197} {"train_loss": -4.900778089250837, "global_step": 8315, "epoch": 197, "val_loss": 83571.6015625} {"train_loss": -4.8186774253845215, "global_step": 8316, "epoch": 198} {"train_loss": -4.765010356903076, "global_step": 8317, "epoch": 198} {"train_loss": -4.849452018737793, "global_step": 8318, "epoch": 198} {"train_loss": -4.807844161987305, "global_step": 8319, "epoch": 198} {"train_loss": -4.925724029541016, "global_step": 8320, "epoch": 198} {"train_loss": -4.972757339477539, "global_step": 8321, "epoch": 198} {"train_loss": -4.982144832611084, "global_step": 8322, "epoch": 198} {"train_loss": -4.933594703674316, "global_step": 8323, "epoch": 198} {"train_loss": -4.931124687194824, "global_step": 8324, "epoch": 198} {"train_loss": -4.893768310546875, "global_step": 8325, "epoch": 198} {"train_loss": -5.019495010375977, "global_step": 8326, "epoch": 198} {"train_loss": -4.973203659057617, "global_step": 8327, "epoch": 198} {"train_loss": -5.054003715515137, "global_step": 8328, "epoch": 198} {"train_loss": -4.838850975036621, "global_step": 8329, "epoch": 198} {"train_loss": -5.100991725921631, "global_step": 8330, "epoch": 198} {"train_loss": -4.931244850158691, "global_step": 8331, "epoch": 198} {"train_loss": -5.036721229553223, "global_step": 8332, "epoch": 198} {"train_loss": -4.991363525390625, "global_step": 8333, "epoch": 198} {"train_loss": -4.953243255615234, "global_step": 8334, "epoch": 198} {"train_loss": -5.044008255004883, "global_step": 8335, "epoch": 198} {"train_loss": -4.939843654632568, "global_step": 8336, "epoch": 198} {"train_loss": -5.047565460205078, "global_step": 8337, "epoch": 198} {"train_loss": -4.934006690979004, "global_step": 8338, "epoch": 198} {"train_loss": -4.940199851989746, "global_step": 8339, "epoch": 198} {"train_loss": -4.903992176055908, "global_step": 8340, "epoch": 198} {"train_loss": -4.986945152282715, "global_step": 8341, "epoch": 198} {"train_loss": -4.918837547302246, "global_step": 8342, "epoch": 198} {"train_loss": -5.048297882080078, "global_step": 8343, "epoch": 198} {"train_loss": -4.871187210083008, "global_step": 8344, "epoch": 198} {"train_loss": -4.901817321777344, "global_step": 8345, "epoch": 198} {"train_loss": -5.0385050773620605, "global_step": 8346, "epoch": 198} {"train_loss": -4.956805229187012, "global_step": 8347, "epoch": 198} {"train_loss": -4.857968807220459, "global_step": 8348, "epoch": 198} {"train_loss": -4.933717250823975, "global_step": 8349, "epoch": 198} {"train_loss": -4.882961273193359, "global_step": 8350, "epoch": 198} {"train_loss": -4.852889060974121, "global_step": 8351, "epoch": 198} {"train_loss": -4.868521690368652, "global_step": 8352, "epoch": 198} {"train_loss": -4.921567440032959, "global_step": 8353, "epoch": 198} {"train_loss": -4.898433685302734, "global_step": 8354, "epoch": 198} {"train_loss": -4.988168239593506, "global_step": 8355, "epoch": 198} {"train_loss": -4.921751976013184, "global_step": 8356, "epoch": 198} {"train_loss": -4.9338546480451315, "global_step": 8357, "epoch": 198, "val_loss": 83141.2890625} {"train_loss": -5.015389919281006, "global_step": 8358, "epoch": 199} {"train_loss": -4.937260627746582, "global_step": 8359, "epoch": 199} {"train_loss": -4.903750419616699, "global_step": 8360, "epoch": 199} {"train_loss": -5.094859600067139, "global_step": 8361, "epoch": 199} {"train_loss": -5.066516876220703, "global_step": 8362, "epoch": 199} {"train_loss": -5.0006184577941895, "global_step": 8363, "epoch": 199} {"train_loss": -4.974479675292969, "global_step": 8364, "epoch": 199} {"train_loss": -5.032625675201416, "global_step": 8365, "epoch": 199} {"train_loss": -5.053308486938477, "global_step": 8366, "epoch": 199} {"train_loss": -5.072746276855469, "global_step": 8367, "epoch": 199} {"train_loss": -5.016514778137207, "global_step": 8368, "epoch": 199} {"train_loss": -5.093156814575195, "global_step": 8369, "epoch": 199} {"train_loss": -4.968295097351074, "global_step": 8370, "epoch": 199} {"train_loss": -4.837864875793457, "global_step": 8371, "epoch": 199} {"train_loss": -5.043568134307861, "global_step": 8372, "epoch": 199} {"train_loss": -4.973039150238037, "global_step": 8373, "epoch": 199} {"train_loss": -5.141610622406006, "global_step": 8374, "epoch": 199} {"train_loss": -4.931157112121582, "global_step": 8375, "epoch": 199} {"train_loss": -4.931843280792236, "global_step": 8376, "epoch": 199} {"train_loss": -4.936091899871826, "global_step": 8377, "epoch": 199} {"train_loss": -5.020190238952637, "global_step": 8378, "epoch": 199} {"train_loss": -4.915754318237305, "global_step": 8379, "epoch": 199} {"train_loss": -5.057822227478027, "global_step": 8380, "epoch": 199} {"train_loss": -4.993490219116211, "global_step": 8381, "epoch": 199} {"train_loss": -4.860656261444092, "global_step": 8382, "epoch": 199} {"train_loss": -4.778478622436523, "global_step": 8383, "epoch": 199} {"train_loss": -4.881952285766602, "global_step": 8384, "epoch": 199} {"train_loss": -4.973145961761475, "global_step": 8385, "epoch": 199} {"train_loss": -4.93658447265625, "global_step": 8386, "epoch": 199} {"train_loss": -4.836456298828125, "global_step": 8387, "epoch": 199} {"train_loss": -4.873434543609619, "global_step": 8388, "epoch": 199} {"train_loss": -4.89321231842041, "global_step": 8389, "epoch": 199} {"train_loss": -4.82295036315918, "global_step": 8390, "epoch": 199} {"train_loss": -4.844104290008545, "global_step": 8391, "epoch": 199} {"train_loss": -5.041782379150391, "global_step": 8392, "epoch": 199} {"train_loss": -4.747411727905273, "global_step": 8393, "epoch": 199} {"train_loss": -5.092865943908691, "global_step": 8394, "epoch": 199} {"train_loss": -4.959511756896973, "global_step": 8395, "epoch": 199} {"train_loss": -4.922689437866211, "global_step": 8396, "epoch": 199} {"train_loss": -4.972936630249023, "global_step": 8397, "epoch": 199} {"train_loss": -4.969614028930664, "global_step": 8398, "epoch": 199} {"train_loss": -4.962100063051496, "global_step": 8399, "epoch": 199, "val_loss": 83745.953125} {"train_loss": -4.919867515563965, "global_step": 8400, "epoch": 200} {"train_loss": -5.061779975891113, "global_step": 8401, "epoch": 200} {"train_loss": -4.731265068054199, "global_step": 8402, "epoch": 200} {"train_loss": -4.975192546844482, "global_step": 8403, "epoch": 200} {"train_loss": -4.897829055786133, "global_step": 8404, "epoch": 200} {"train_loss": -4.977653503417969, "global_step": 8405, "epoch": 200} {"train_loss": -5.184797763824463, "global_step": 8406, "epoch": 200} {"train_loss": -5.012242317199707, "global_step": 8407, "epoch": 200} {"train_loss": -4.997673034667969, "global_step": 8408, "epoch": 200} {"train_loss": -4.937980651855469, "global_step": 8409, "epoch": 200} {"train_loss": -4.859468460083008, "global_step": 8410, "epoch": 200} {"train_loss": -4.917570114135742, "global_step": 8411, "epoch": 200} {"train_loss": -5.0248589515686035, "global_step": 8412, "epoch": 200} {"train_loss": -4.868950843811035, "global_step": 8413, "epoch": 200} {"train_loss": -5.009964942932129, "global_step": 8414, "epoch": 200} {"train_loss": -4.918286323547363, "global_step": 8415, "epoch": 200} {"train_loss": -4.948503494262695, "global_step": 8416, "epoch": 200} {"train_loss": -4.978030204772949, "global_step": 8417, "epoch": 200} {"train_loss": -4.92317533493042, "global_step": 8418, "epoch": 200} {"train_loss": -5.1265869140625, "global_step": 8419, "epoch": 200} {"train_loss": -4.744726181030273, "global_step": 8420, "epoch": 200} {"train_loss": -4.950754642486572, "global_step": 8421, "epoch": 200} {"train_loss": -5.151773452758789, "global_step": 8422, "epoch": 200} {"train_loss": -4.897040367126465, "global_step": 8423, "epoch": 200} {"train_loss": -4.8011932373046875, "global_step": 8424, "epoch": 200} {"train_loss": -4.895193099975586, "global_step": 8425, "epoch": 200} {"train_loss": -4.788394927978516, "global_step": 8426, "epoch": 200} {"train_loss": -4.8657307624816895, "global_step": 8427, "epoch": 200} {"train_loss": -5.027683258056641, "global_step": 8428, "epoch": 200} {"train_loss": -4.868644714355469, "global_step": 8429, "epoch": 200} {"train_loss": -4.959277153015137, "global_step": 8430, "epoch": 200} {"train_loss": -4.862044334411621, "global_step": 8431, "epoch": 200} {"train_loss": -4.866499900817871, "global_step": 8432, "epoch": 200} {"train_loss": -5.041619300842285, "global_step": 8433, "epoch": 200} {"train_loss": -4.825716972351074, "global_step": 8434, "epoch": 200} {"train_loss": -4.9286651611328125, "global_step": 8435, "epoch": 200} {"train_loss": -4.955567359924316, "global_step": 8436, "epoch": 200} {"train_loss": -4.902441024780273, "global_step": 8437, "epoch": 200} {"train_loss": -5.102917671203613, "global_step": 8438, "epoch": 200} {"train_loss": -5.027741432189941, "global_step": 8439, "epoch": 200} {"train_loss": -4.959847450256348, "global_step": 8440, "epoch": 200} {"train_loss": -4.943816854840233, "global_step": 8441, "epoch": 200, "train/sim_max_reward_0": 0.19317848549133732, "train/sim_max_reward_1": 0.05216598429182595, "train/sim_max_reward_2": 0.17320919230391837, "train/sim_max_reward_3": 0.0053467998742405525, "train/sim_max_reward_4": 0.009503307570729362, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4500000": 0.3282875348841493, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0011067380474561546, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.16063735747739583, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.045796851765227804, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.30125231282121706, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.36819088894457896, "test/sim_max_reward_4500015": 0.05918341727318116, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.004249031229020703, "test/sim_max_reward_4500019": 0.39496762743265895, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.14861511220147822, "test/sim_max_reward_4500022": 0.3829095003427856, "test/sim_max_reward_4500023": 0.431168964091752, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.25805179707497994, "test/sim_max_reward_4500026": 0.04185147830665218, "test/sim_max_reward_4500027": 6.208385506367412e-05, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.04163460642148004, "test/sim_max_reward_4500030": 0.14927800189130747, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.41669666656436133, "test/sim_max_reward_4500034": 0.054792514429858254, "test/sim_max_reward_4500035": 0.0779606034003907, "test/sim_max_reward_4500036": 0.4494254557169702, "test/sim_max_reward_4500037": 0.17979637744087887, "test/sim_max_reward_4500038": 0.3762439844299418, "test/sim_max_reward_4500039": 0.32065169361694035, "test/sim_max_reward_4500040": 0.0, "test/sim_max_reward_4500041": 0.0, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.30559560267848423, "test/sim_max_reward_4500044": 0.01055345468867214, "test/sim_max_reward_4500045": 0.1175735103924684, "test/sim_max_reward_4500046": 0.16290866370711915, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.10439808814903984, "test/mean_score": 0.11841319955063671, "val_loss": 82622.4453125} {"train_loss": -4.917853355407715, "global_step": 8442, "epoch": 201} {"train_loss": -4.800518035888672, "global_step": 8443, "epoch": 201} {"train_loss": -4.979132175445557, "global_step": 8444, "epoch": 201} {"train_loss": -5.030860900878906, "global_step": 8445, "epoch": 201} {"train_loss": -4.907280921936035, "global_step": 8446, "epoch": 201} {"train_loss": -5.034879684448242, "global_step": 8447, "epoch": 201} {"train_loss": -4.991371154785156, "global_step": 8448, "epoch": 201} {"train_loss": -4.835893630981445, "global_step": 8449, "epoch": 201} {"train_loss": -4.971795082092285, "global_step": 8450, "epoch": 201} {"train_loss": -4.952040195465088, "global_step": 8451, "epoch": 201} {"train_loss": -4.958412170410156, "global_step": 8452, "epoch": 201} {"train_loss": -5.020603179931641, "global_step": 8453, "epoch": 201} {"train_loss": -4.923252105712891, "global_step": 8454, "epoch": 201} {"train_loss": -4.9247517585754395, "global_step": 8455, "epoch": 201} {"train_loss": -5.083965301513672, "global_step": 8456, "epoch": 201} {"train_loss": -5.0731353759765625, "global_step": 8457, "epoch": 201} {"train_loss": -4.89663028717041, "global_step": 8458, "epoch": 201} {"train_loss": -4.839293479919434, "global_step": 8459, "epoch": 201} {"train_loss": -5.067363739013672, "global_step": 8460, "epoch": 201} {"train_loss": -5.027098655700684, "global_step": 8461, "epoch": 201} {"train_loss": -4.995957851409912, "global_step": 8462, "epoch": 201} {"train_loss": -4.937438011169434, "global_step": 8463, "epoch": 201} {"train_loss": -5.038875579833984, "global_step": 8464, "epoch": 201} {"train_loss": -5.005793571472168, "global_step": 8465, "epoch": 201} {"train_loss": -5.012630462646484, "global_step": 8466, "epoch": 201} {"train_loss": -5.0286149978637695, "global_step": 8467, "epoch": 201} {"train_loss": -4.975046157836914, "global_step": 8468, "epoch": 201} {"train_loss": -5.089366436004639, "global_step": 8469, "epoch": 201} {"train_loss": -5.006546974182129, "global_step": 8470, "epoch": 201} {"train_loss": -5.004439353942871, "global_step": 8471, "epoch": 201} {"train_loss": -4.964132785797119, "global_step": 8472, "epoch": 201} {"train_loss": -4.889542579650879, "global_step": 8473, "epoch": 201} {"train_loss": -5.009882926940918, "global_step": 8474, "epoch": 201} {"train_loss": -5.044700622558594, "global_step": 8475, "epoch": 201} {"train_loss": -5.031267166137695, "global_step": 8476, "epoch": 201} {"train_loss": -5.07865047454834, "global_step": 8477, "epoch": 201} {"train_loss": -4.976158618927002, "global_step": 8478, "epoch": 201} {"train_loss": -4.928071975708008, "global_step": 8479, "epoch": 201} {"train_loss": -4.825246334075928, "global_step": 8480, "epoch": 201} {"train_loss": -4.8892645835876465, "global_step": 8481, "epoch": 201} {"train_loss": -4.874822616577148, "global_step": 8482, "epoch": 201} {"train_loss": -4.971301328568232, "global_step": 8483, "epoch": 201, "val_loss": 82761.7890625} {"train_loss": -4.967177867889404, "global_step": 8484, "epoch": 202} {"train_loss": -4.806340217590332, "global_step": 8485, "epoch": 202} {"train_loss": -4.9637956619262695, "global_step": 8486, "epoch": 202} {"train_loss": -4.82680606842041, "global_step": 8487, "epoch": 202} {"train_loss": -4.8350982666015625, "global_step": 8488, "epoch": 202} {"train_loss": -4.894101142883301, "global_step": 8489, "epoch": 202} {"train_loss": -4.926087379455566, "global_step": 8490, "epoch": 202} {"train_loss": -4.79352331161499, "global_step": 8491, "epoch": 202} {"train_loss": -4.824517250061035, "global_step": 8492, "epoch": 202} {"train_loss": -4.855213165283203, "global_step": 8493, "epoch": 202} {"train_loss": -4.715970039367676, "global_step": 8494, "epoch": 202} {"train_loss": -4.784239292144775, "global_step": 8495, "epoch": 202} {"train_loss": -4.801487922668457, "global_step": 8496, "epoch": 202} {"train_loss": -4.661594867706299, "global_step": 8497, "epoch": 202} {"train_loss": -4.945346832275391, "global_step": 8498, "epoch": 202} {"train_loss": -4.922575950622559, "global_step": 8499, "epoch": 202} {"train_loss": -4.902827739715576, "global_step": 8500, "epoch": 202} {"train_loss": -4.904896259307861, "global_step": 8501, "epoch": 202} {"train_loss": -4.9492573738098145, "global_step": 8502, "epoch": 202} {"train_loss": -4.826109886169434, "global_step": 8503, "epoch": 202} {"train_loss": -4.852453231811523, "global_step": 8504, "epoch": 202} {"train_loss": -4.800751686096191, "global_step": 8505, "epoch": 202} {"train_loss": -4.867997169494629, "global_step": 8506, "epoch": 202} {"train_loss": -4.818820953369141, "global_step": 8507, "epoch": 202} {"train_loss": -5.0757317543029785, "global_step": 8508, "epoch": 202} {"train_loss": -4.907594680786133, "global_step": 8509, "epoch": 202} {"train_loss": -4.876856803894043, "global_step": 8510, "epoch": 202} {"train_loss": -5.021054744720459, "global_step": 8511, "epoch": 202} {"train_loss": -4.923222064971924, "global_step": 8512, "epoch": 202} {"train_loss": -5.13295841217041, "global_step": 8513, "epoch": 202} {"train_loss": -4.948117256164551, "global_step": 8514, "epoch": 202} {"train_loss": -4.916259765625, "global_step": 8515, "epoch": 202} {"train_loss": -5.011385917663574, "global_step": 8516, "epoch": 202} {"train_loss": -4.98270845413208, "global_step": 8517, "epoch": 202} {"train_loss": -4.889082908630371, "global_step": 8518, "epoch": 202} {"train_loss": -5.030760765075684, "global_step": 8519, "epoch": 202} {"train_loss": -4.9080328941345215, "global_step": 8520, "epoch": 202} {"train_loss": -4.9549241065979, "global_step": 8521, "epoch": 202} {"train_loss": -4.957847595214844, "global_step": 8522, "epoch": 202} {"train_loss": -4.954092979431152, "global_step": 8523, "epoch": 202} {"train_loss": -4.979987144470215, "global_step": 8524, "epoch": 202} {"train_loss": -4.902287994112287, "global_step": 8525, "epoch": 202, "val_loss": 82172.5390625} {"train_loss": -5.008955001831055, "global_step": 8526, "epoch": 203} {"train_loss": -4.870498180389404, "global_step": 8527, "epoch": 203} {"train_loss": -5.010187149047852, "global_step": 8528, "epoch": 203} {"train_loss": -4.903409004211426, "global_step": 8529, "epoch": 203} {"train_loss": -5.060807228088379, "global_step": 8530, "epoch": 203} {"train_loss": -4.910372734069824, "global_step": 8531, "epoch": 203} {"train_loss": -5.232173919677734, "global_step": 8532, "epoch": 203} {"train_loss": -5.068589210510254, "global_step": 8533, "epoch": 203} {"train_loss": -4.927398204803467, "global_step": 8534, "epoch": 203} {"train_loss": -5.0133562088012695, "global_step": 8535, "epoch": 203} {"train_loss": -4.878989219665527, "global_step": 8536, "epoch": 203} {"train_loss": -5.028012275695801, "global_step": 8537, "epoch": 203} {"train_loss": -4.879645347595215, "global_step": 8538, "epoch": 203} {"train_loss": -5.028043746948242, "global_step": 8539, "epoch": 203} {"train_loss": -5.0003156661987305, "global_step": 8540, "epoch": 203} {"train_loss": -4.998873710632324, "global_step": 8541, "epoch": 203} {"train_loss": -5.157353401184082, "global_step": 8542, "epoch": 203} {"train_loss": -5.123293876647949, "global_step": 8543, "epoch": 203} {"train_loss": -5.044083118438721, "global_step": 8544, "epoch": 203} {"train_loss": -5.021766185760498, "global_step": 8545, "epoch": 203} {"train_loss": -5.032891273498535, "global_step": 8546, "epoch": 203} {"train_loss": -5.0786848068237305, "global_step": 8547, "epoch": 203} {"train_loss": -4.89077091217041, "global_step": 8548, "epoch": 203} {"train_loss": -5.149254322052002, "global_step": 8549, "epoch": 203} {"train_loss": -5.074828147888184, "global_step": 8550, "epoch": 203} {"train_loss": -5.120286464691162, "global_step": 8551, "epoch": 203} {"train_loss": -4.934517860412598, "global_step": 8552, "epoch": 203} {"train_loss": -4.987022399902344, "global_step": 8553, "epoch": 203} {"train_loss": -4.975862503051758, "global_step": 8554, "epoch": 203} {"train_loss": -5.065601825714111, "global_step": 8555, "epoch": 203} {"train_loss": -5.107734680175781, "global_step": 8556, "epoch": 203} {"train_loss": -4.995898723602295, "global_step": 8557, "epoch": 203} {"train_loss": -4.898212432861328, "global_step": 8558, "epoch": 203} {"train_loss": -4.933173179626465, "global_step": 8559, "epoch": 203} {"train_loss": -5.052215576171875, "global_step": 8560, "epoch": 203} {"train_loss": -4.918505668640137, "global_step": 8561, "epoch": 203} {"train_loss": -4.879174709320068, "global_step": 8562, "epoch": 203} {"train_loss": -4.796064376831055, "global_step": 8563, "epoch": 203} {"train_loss": -4.913930892944336, "global_step": 8564, "epoch": 203} {"train_loss": -4.961597442626953, "global_step": 8565, "epoch": 203} {"train_loss": -4.945802688598633, "global_step": 8566, "epoch": 203} {"train_loss": -4.995707250776745, "global_step": 8567, "epoch": 203, "val_loss": 83056.171875} {"train_loss": -5.0089592933654785, "global_step": 8568, "epoch": 204} {"train_loss": -4.991535186767578, "global_step": 8569, "epoch": 204} {"train_loss": -4.673121452331543, "global_step": 8570, "epoch": 204} {"train_loss": -4.775588512420654, "global_step": 8571, "epoch": 204} {"train_loss": -4.796561241149902, "global_step": 8572, "epoch": 204} {"train_loss": -4.757084369659424, "global_step": 8573, "epoch": 204} {"train_loss": -5.032331466674805, "global_step": 8574, "epoch": 204} {"train_loss": -4.670208930969238, "global_step": 8575, "epoch": 204} {"train_loss": -4.845893859863281, "global_step": 8576, "epoch": 204} {"train_loss": -4.611082553863525, "global_step": 8577, "epoch": 204} {"train_loss": -4.669491291046143, "global_step": 8578, "epoch": 204} {"train_loss": -4.73064661026001, "global_step": 8579, "epoch": 204} {"train_loss": -4.8669939041137695, "global_step": 8580, "epoch": 204} {"train_loss": -4.789514541625977, "global_step": 8581, "epoch": 204} {"train_loss": -4.784296035766602, "global_step": 8582, "epoch": 204} {"train_loss": -4.712872505187988, "global_step": 8583, "epoch": 204} {"train_loss": -4.785793781280518, "global_step": 8584, "epoch": 204} {"train_loss": -4.811271667480469, "global_step": 8585, "epoch": 204} {"train_loss": -4.779568672180176, "global_step": 8586, "epoch": 204} {"train_loss": -4.811151504516602, "global_step": 8587, "epoch": 204} {"train_loss": -4.97917366027832, "global_step": 8588, "epoch": 204} {"train_loss": -4.705735206604004, "global_step": 8589, "epoch": 204} {"train_loss": -4.931136131286621, "global_step": 8590, "epoch": 204} {"train_loss": -4.7485456466674805, "global_step": 8591, "epoch": 204} {"train_loss": -4.995110988616943, "global_step": 8592, "epoch": 204} {"train_loss": -4.957281589508057, "global_step": 8593, "epoch": 204} {"train_loss": -4.89511775970459, "global_step": 8594, "epoch": 204} {"train_loss": -4.930744171142578, "global_step": 8595, "epoch": 204} {"train_loss": -4.946140289306641, "global_step": 8596, "epoch": 204} {"train_loss": -4.856366157531738, "global_step": 8597, "epoch": 204} {"train_loss": -4.897133827209473, "global_step": 8598, "epoch": 204} {"train_loss": -4.986390113830566, "global_step": 8599, "epoch": 204} {"train_loss": -4.96998405456543, "global_step": 8600, "epoch": 204} {"train_loss": -4.909641742706299, "global_step": 8601, "epoch": 204} {"train_loss": -4.975836277008057, "global_step": 8602, "epoch": 204} {"train_loss": -4.912246227264404, "global_step": 8603, "epoch": 204} {"train_loss": -4.951016902923584, "global_step": 8604, "epoch": 204} {"train_loss": -4.896222114562988, "global_step": 8605, "epoch": 204} {"train_loss": -4.983053684234619, "global_step": 8606, "epoch": 204} {"train_loss": -4.881550312042236, "global_step": 8607, "epoch": 204} {"train_loss": -4.99109411239624, "global_step": 8608, "epoch": 204} {"train_loss": -4.861917348135085, "global_step": 8609, "epoch": 204, "val_loss": 82015.9453125} {"train_loss": -4.942578315734863, "global_step": 8610, "epoch": 205} {"train_loss": -5.029595375061035, "global_step": 8611, "epoch": 205} {"train_loss": -4.823464393615723, "global_step": 8612, "epoch": 205} {"train_loss": -4.991449356079102, "global_step": 8613, "epoch": 205} {"train_loss": -5.0189385414123535, "global_step": 8614, "epoch": 205} {"train_loss": -4.814990997314453, "global_step": 8615, "epoch": 205} {"train_loss": -5.006978988647461, "global_step": 8616, "epoch": 205} {"train_loss": -4.992768287658691, "global_step": 8617, "epoch": 205} {"train_loss": -5.088077545166016, "global_step": 8618, "epoch": 205} {"train_loss": -5.068583011627197, "global_step": 8619, "epoch": 205} {"train_loss": -4.919100284576416, "global_step": 8620, "epoch": 205} {"train_loss": -4.89097785949707, "global_step": 8621, "epoch": 205} {"train_loss": -4.914361476898193, "global_step": 8622, "epoch": 205} {"train_loss": -4.911797523498535, "global_step": 8623, "epoch": 205} {"train_loss": -4.827852249145508, "global_step": 8624, "epoch": 205} {"train_loss": -4.993351459503174, "global_step": 8625, "epoch": 205} {"train_loss": -5.023521423339844, "global_step": 8626, "epoch": 205} {"train_loss": -5.083131313323975, "global_step": 8627, "epoch": 205} {"train_loss": -5.067400932312012, "global_step": 8628, "epoch": 205} {"train_loss": -4.936966419219971, "global_step": 8629, "epoch": 205} {"train_loss": -5.001826286315918, "global_step": 8630, "epoch": 205} {"train_loss": -4.867124557495117, "global_step": 8631, "epoch": 205} {"train_loss": -4.865819931030273, "global_step": 8632, "epoch": 205} {"train_loss": -5.102464199066162, "global_step": 8633, "epoch": 205} {"train_loss": -5.009676933288574, "global_step": 8634, "epoch": 205} {"train_loss": -4.764715194702148, "global_step": 8635, "epoch": 205} {"train_loss": -4.9925432205200195, "global_step": 8636, "epoch": 205} {"train_loss": -4.864003658294678, "global_step": 8637, "epoch": 205} {"train_loss": -4.812806129455566, "global_step": 8638, "epoch": 205} {"train_loss": -4.932158946990967, "global_step": 8639, "epoch": 205} {"train_loss": -5.088024616241455, "global_step": 8640, "epoch": 205} {"train_loss": -4.974065780639648, "global_step": 8641, "epoch": 205} {"train_loss": -4.967473030090332, "global_step": 8642, "epoch": 205} {"train_loss": -5.097658634185791, "global_step": 8643, "epoch": 205} {"train_loss": -4.913652420043945, "global_step": 8644, "epoch": 205} {"train_loss": -5.030455589294434, "global_step": 8645, "epoch": 205} {"train_loss": -4.879184722900391, "global_step": 8646, "epoch": 205} {"train_loss": -4.878215312957764, "global_step": 8647, "epoch": 205} {"train_loss": -5.16123104095459, "global_step": 8648, "epoch": 205} {"train_loss": -4.987565994262695, "global_step": 8649, "epoch": 205} {"train_loss": -4.958271503448486, "global_step": 8650, "epoch": 205} {"train_loss": -4.962523176556542, "global_step": 8651, "epoch": 205, "val_loss": 82434.71875} {"train_loss": -4.9259748458862305, "global_step": 8652, "epoch": 206} {"train_loss": -4.974971771240234, "global_step": 8653, "epoch": 206} {"train_loss": -4.937623023986816, "global_step": 8654, "epoch": 206} {"train_loss": -5.075206756591797, "global_step": 8655, "epoch": 206} {"train_loss": -4.871967315673828, "global_step": 8656, "epoch": 206} {"train_loss": -4.883630752563477, "global_step": 8657, "epoch": 206} {"train_loss": -5.187407493591309, "global_step": 8658, "epoch": 206} {"train_loss": -5.016454219818115, "global_step": 8659, "epoch": 206} {"train_loss": -4.908329010009766, "global_step": 8660, "epoch": 206} {"train_loss": -4.930697917938232, "global_step": 8661, "epoch": 206} {"train_loss": -4.886238098144531, "global_step": 8662, "epoch": 206} {"train_loss": -4.9587788581848145, "global_step": 8663, "epoch": 206} {"train_loss": -5.013139247894287, "global_step": 8664, "epoch": 206} {"train_loss": -4.8991804122924805, "global_step": 8665, "epoch": 206} {"train_loss": -5.076931476593018, "global_step": 8666, "epoch": 206} {"train_loss": -4.976530075073242, "global_step": 8667, "epoch": 206} {"train_loss": -4.910951614379883, "global_step": 8668, "epoch": 206} {"train_loss": -4.9716081619262695, "global_step": 8669, "epoch": 206} {"train_loss": -5.038044452667236, "global_step": 8670, "epoch": 206} {"train_loss": -5.0316009521484375, "global_step": 8671, "epoch": 206} {"train_loss": -5.024625778198242, "global_step": 8672, "epoch": 206} {"train_loss": -5.153644561767578, "global_step": 8673, "epoch": 206} {"train_loss": -5.091413497924805, "global_step": 8674, "epoch": 206} {"train_loss": -5.001617431640625, "global_step": 8675, "epoch": 206} {"train_loss": -4.884756088256836, "global_step": 8676, "epoch": 206} {"train_loss": -4.964934825897217, "global_step": 8677, "epoch": 206} {"train_loss": -5.000776767730713, "global_step": 8678, "epoch": 206} {"train_loss": -4.835847854614258, "global_step": 8679, "epoch": 206} {"train_loss": -4.930295944213867, "global_step": 8680, "epoch": 206} {"train_loss": -4.871434211730957, "global_step": 8681, "epoch": 206} {"train_loss": -4.842390060424805, "global_step": 8682, "epoch": 206} {"train_loss": -5.086669921875, "global_step": 8683, "epoch": 206} {"train_loss": -4.996733665466309, "global_step": 8684, "epoch": 206} {"train_loss": -4.963616371154785, "global_step": 8685, "epoch": 206} {"train_loss": -5.100357532501221, "global_step": 8686, "epoch": 206} {"train_loss": -5.049651622772217, "global_step": 8687, "epoch": 206} {"train_loss": -5.212883472442627, "global_step": 8688, "epoch": 206} {"train_loss": -5.1184773445129395, "global_step": 8689, "epoch": 206} {"train_loss": -4.988205909729004, "global_step": 8690, "epoch": 206} {"train_loss": -4.947902679443359, "global_step": 8691, "epoch": 206} {"train_loss": -5.215859413146973, "global_step": 8692, "epoch": 206} {"train_loss": -4.9953709329877585, "global_step": 8693, "epoch": 206, "val_loss": 82836.046875} {"train_loss": -4.812982559204102, "global_step": 8694, "epoch": 207} {"train_loss": -5.059998035430908, "global_step": 8695, "epoch": 207} {"train_loss": -5.0425286293029785, "global_step": 8696, "epoch": 207} {"train_loss": -5.024351119995117, "global_step": 8697, "epoch": 207} {"train_loss": -4.992648124694824, "global_step": 8698, "epoch": 207} {"train_loss": -4.953428268432617, "global_step": 8699, "epoch": 207} {"train_loss": -4.9894561767578125, "global_step": 8700, "epoch": 207} {"train_loss": -5.024716377258301, "global_step": 8701, "epoch": 207} {"train_loss": -4.915895462036133, "global_step": 8702, "epoch": 207} {"train_loss": -4.778797626495361, "global_step": 8703, "epoch": 207} {"train_loss": -5.061362266540527, "global_step": 8704, "epoch": 207} {"train_loss": -4.9153337478637695, "global_step": 8705, "epoch": 207} {"train_loss": -4.9448466300964355, "global_step": 8706, "epoch": 207} {"train_loss": -5.097039699554443, "global_step": 8707, "epoch": 207} {"train_loss": -5.023871421813965, "global_step": 8708, "epoch": 207} {"train_loss": -4.931743144989014, "global_step": 8709, "epoch": 207} {"train_loss": -4.915402889251709, "global_step": 8710, "epoch": 207} {"train_loss": -4.952393531799316, "global_step": 8711, "epoch": 207} {"train_loss": -5.1210222244262695, "global_step": 8712, "epoch": 207} {"train_loss": -4.919539451599121, "global_step": 8713, "epoch": 207} {"train_loss": -4.9241743087768555, "global_step": 8714, "epoch": 207} {"train_loss": -5.059722423553467, "global_step": 8715, "epoch": 207} {"train_loss": -4.923263072967529, "global_step": 8716, "epoch": 207} {"train_loss": -4.815456390380859, "global_step": 8717, "epoch": 207} {"train_loss": -4.979461193084717, "global_step": 8718, "epoch": 207} {"train_loss": -5.026607513427734, "global_step": 8719, "epoch": 207} {"train_loss": -5.104508399963379, "global_step": 8720, "epoch": 207} {"train_loss": -5.065979957580566, "global_step": 8721, "epoch": 207} {"train_loss": -5.117117881774902, "global_step": 8722, "epoch": 207} {"train_loss": -5.078893184661865, "global_step": 8723, "epoch": 207} {"train_loss": -4.91793966293335, "global_step": 8724, "epoch": 207} {"train_loss": -5.013331413269043, "global_step": 8725, "epoch": 207} {"train_loss": -5.103662490844727, "global_step": 8726, "epoch": 207} {"train_loss": -5.073371887207031, "global_step": 8727, "epoch": 207} {"train_loss": -4.975476264953613, "global_step": 8728, "epoch": 207} {"train_loss": -5.033359527587891, "global_step": 8729, "epoch": 207} {"train_loss": -4.855854034423828, "global_step": 8730, "epoch": 207} {"train_loss": -5.011257648468018, "global_step": 8731, "epoch": 207} {"train_loss": -4.934845924377441, "global_step": 8732, "epoch": 207} {"train_loss": -4.945502281188965, "global_step": 8733, "epoch": 207} {"train_loss": -5.055441856384277, "global_step": 8734, "epoch": 207} {"train_loss": -4.9853401865277975, "global_step": 8735, "epoch": 207, "val_loss": 82002.078125} {"train_loss": -4.91613245010376, "global_step": 8736, "epoch": 208} {"train_loss": -4.863771915435791, "global_step": 8737, "epoch": 208} {"train_loss": -5.000702857971191, "global_step": 8738, "epoch": 208} {"train_loss": -4.634389877319336, "global_step": 8739, "epoch": 208} {"train_loss": -4.949676990509033, "global_step": 8740, "epoch": 208} {"train_loss": -4.966382026672363, "global_step": 8741, "epoch": 208} {"train_loss": -4.598476409912109, "global_step": 8742, "epoch": 208} {"train_loss": -5.002897262573242, "global_step": 8743, "epoch": 208} {"train_loss": -4.943215370178223, "global_step": 8744, "epoch": 208} {"train_loss": -4.703896999359131, "global_step": 8745, "epoch": 208} {"train_loss": -5.0213446617126465, "global_step": 8746, "epoch": 208} {"train_loss": -4.852736473083496, "global_step": 8747, "epoch": 208} {"train_loss": -4.806516170501709, "global_step": 8748, "epoch": 208} {"train_loss": -5.035280227661133, "global_step": 8749, "epoch": 208} {"train_loss": -4.957706451416016, "global_step": 8750, "epoch": 208} {"train_loss": -4.984471321105957, "global_step": 8751, "epoch": 208} {"train_loss": -5.028268337249756, "global_step": 8752, "epoch": 208} {"train_loss": -5.01738977432251, "global_step": 8753, "epoch": 208} {"train_loss": -4.900808334350586, "global_step": 8754, "epoch": 208} {"train_loss": -4.912883758544922, "global_step": 8755, "epoch": 208} {"train_loss": -4.966341972351074, "global_step": 8756, "epoch": 208} {"train_loss": -4.727334976196289, "global_step": 8757, "epoch": 208} {"train_loss": -5.042510509490967, "global_step": 8758, "epoch": 208} {"train_loss": -4.809562683105469, "global_step": 8759, "epoch": 208} {"train_loss": -5.118684768676758, "global_step": 8760, "epoch": 208} {"train_loss": -4.881618976593018, "global_step": 8761, "epoch": 208} {"train_loss": -5.0062432289123535, "global_step": 8762, "epoch": 208} {"train_loss": -5.078503608703613, "global_step": 8763, "epoch": 208} {"train_loss": -4.816915512084961, "global_step": 8764, "epoch": 208} {"train_loss": -4.916896820068359, "global_step": 8765, "epoch": 208} {"train_loss": -5.051342964172363, "global_step": 8766, "epoch": 208} {"train_loss": -4.976431846618652, "global_step": 8767, "epoch": 208} {"train_loss": -4.874752044677734, "global_step": 8768, "epoch": 208} {"train_loss": -5.077019691467285, "global_step": 8769, "epoch": 208} {"train_loss": -5.086038112640381, "global_step": 8770, "epoch": 208} {"train_loss": -5.023387908935547, "global_step": 8771, "epoch": 208} {"train_loss": -5.034566402435303, "global_step": 8772, "epoch": 208} {"train_loss": -4.936488151550293, "global_step": 8773, "epoch": 208} {"train_loss": -4.969570159912109, "global_step": 8774, "epoch": 208} {"train_loss": -5.161252975463867, "global_step": 8775, "epoch": 208} {"train_loss": -4.873378753662109, "global_step": 8776, "epoch": 208} {"train_loss": -4.943471181960333, "global_step": 8777, "epoch": 208, "val_loss": 82128.4140625} {"train_loss": -4.99282169342041, "global_step": 8778, "epoch": 209} {"train_loss": -5.038632392883301, "global_step": 8779, "epoch": 209} {"train_loss": -5.03488302230835, "global_step": 8780, "epoch": 209} {"train_loss": -5.004533767700195, "global_step": 8781, "epoch": 209} {"train_loss": -5.044522285461426, "global_step": 8782, "epoch": 209} {"train_loss": -5.025806427001953, "global_step": 8783, "epoch": 209} {"train_loss": -5.079120635986328, "global_step": 8784, "epoch": 209} {"train_loss": -4.866130828857422, "global_step": 8785, "epoch": 209} {"train_loss": -4.993314266204834, "global_step": 8786, "epoch": 209} {"train_loss": -5.1808319091796875, "global_step": 8787, "epoch": 209} {"train_loss": -5.011621475219727, "global_step": 8788, "epoch": 209} {"train_loss": -4.889584064483643, "global_step": 8789, "epoch": 209} {"train_loss": -4.887785911560059, "global_step": 8790, "epoch": 209} {"train_loss": -4.967678070068359, "global_step": 8791, "epoch": 209} {"train_loss": -5.000570297241211, "global_step": 8792, "epoch": 209} {"train_loss": -5.101933002471924, "global_step": 8793, "epoch": 209} {"train_loss": -4.990708827972412, "global_step": 8794, "epoch": 209} {"train_loss": -5.142711639404297, "global_step": 8795, "epoch": 209} {"train_loss": -5.005071640014648, "global_step": 8796, "epoch": 209} {"train_loss": -4.994143486022949, "global_step": 8797, "epoch": 209} {"train_loss": -4.901263236999512, "global_step": 8798, "epoch": 209} {"train_loss": -5.111417293548584, "global_step": 8799, "epoch": 209} {"train_loss": -4.997196197509766, "global_step": 8800, "epoch": 209} {"train_loss": -4.947523593902588, "global_step": 8801, "epoch": 209} {"train_loss": -4.899730682373047, "global_step": 8802, "epoch": 209} {"train_loss": -5.014873504638672, "global_step": 8803, "epoch": 209} {"train_loss": -4.930963039398193, "global_step": 8804, "epoch": 209} {"train_loss": -4.968111991882324, "global_step": 8805, "epoch": 209} {"train_loss": -5.074906826019287, "global_step": 8806, "epoch": 209} {"train_loss": -4.988858222961426, "global_step": 8807, "epoch": 209} {"train_loss": -4.954312324523926, "global_step": 8808, "epoch": 209} {"train_loss": -5.025737762451172, "global_step": 8809, "epoch": 209} {"train_loss": -5.056993007659912, "global_step": 8810, "epoch": 209} {"train_loss": -4.8781819343566895, "global_step": 8811, "epoch": 209} {"train_loss": -4.926077842712402, "global_step": 8812, "epoch": 209} {"train_loss": -5.098740577697754, "global_step": 8813, "epoch": 209} {"train_loss": -5.027555465698242, "global_step": 8814, "epoch": 209} {"train_loss": -5.019730091094971, "global_step": 8815, "epoch": 209} {"train_loss": -5.116231441497803, "global_step": 8816, "epoch": 209} {"train_loss": -5.177799224853516, "global_step": 8817, "epoch": 209} {"train_loss": -4.861246109008789, "global_step": 8818, "epoch": 209} {"train_loss": -5.007701737540109, "global_step": 8819, "epoch": 209, "val_loss": 81657.03125} {"train_loss": -5.075874328613281, "global_step": 8820, "epoch": 210} {"train_loss": -5.029410362243652, "global_step": 8821, "epoch": 210} {"train_loss": -4.828823089599609, "global_step": 8822, "epoch": 210} {"train_loss": -4.939446449279785, "global_step": 8823, "epoch": 210} {"train_loss": -5.105570316314697, "global_step": 8824, "epoch": 210} {"train_loss": -5.012890815734863, "global_step": 8825, "epoch": 210} {"train_loss": -4.860626220703125, "global_step": 8826, "epoch": 210} {"train_loss": -4.942330360412598, "global_step": 8827, "epoch": 210} {"train_loss": -5.006645679473877, "global_step": 8828, "epoch": 210} {"train_loss": -5.067601203918457, "global_step": 8829, "epoch": 210} {"train_loss": -5.079708099365234, "global_step": 8830, "epoch": 210} {"train_loss": -5.0289306640625, "global_step": 8831, "epoch": 210} {"train_loss": -4.956178188323975, "global_step": 8832, "epoch": 210} {"train_loss": -5.093754291534424, "global_step": 8833, "epoch": 210} {"train_loss": -4.912662029266357, "global_step": 8834, "epoch": 210} {"train_loss": -4.950631141662598, "global_step": 8835, "epoch": 210} {"train_loss": -4.959134101867676, "global_step": 8836, "epoch": 210} {"train_loss": -5.020392894744873, "global_step": 8837, "epoch": 210} {"train_loss": -4.938900470733643, "global_step": 8838, "epoch": 210} {"train_loss": -4.968042373657227, "global_step": 8839, "epoch": 210} {"train_loss": -5.039144515991211, "global_step": 8840, "epoch": 210} {"train_loss": -4.9334330558776855, "global_step": 8841, "epoch": 210} {"train_loss": -4.983648300170898, "global_step": 8842, "epoch": 210} {"train_loss": -4.90402889251709, "global_step": 8843, "epoch": 210} {"train_loss": -4.86412239074707, "global_step": 8844, "epoch": 210} {"train_loss": -4.819968223571777, "global_step": 8845, "epoch": 210} {"train_loss": -5.0235795974731445, "global_step": 8846, "epoch": 210} {"train_loss": -4.9778242111206055, "global_step": 8847, "epoch": 210} {"train_loss": -4.674564361572266, "global_step": 8848, "epoch": 210} {"train_loss": -5.050922393798828, "global_step": 8849, "epoch": 210} {"train_loss": -4.826009750366211, "global_step": 8850, "epoch": 210} {"train_loss": -4.84918212890625, "global_step": 8851, "epoch": 210} {"train_loss": -5.017147541046143, "global_step": 8852, "epoch": 210} {"train_loss": -4.960082054138184, "global_step": 8853, "epoch": 210} {"train_loss": -4.882368564605713, "global_step": 8854, "epoch": 210} {"train_loss": -4.932436466217041, "global_step": 8855, "epoch": 210} {"train_loss": -4.933992385864258, "global_step": 8856, "epoch": 210} {"train_loss": -4.817863464355469, "global_step": 8857, "epoch": 210} {"train_loss": -4.905774116516113, "global_step": 8858, "epoch": 210} {"train_loss": -4.995345115661621, "global_step": 8859, "epoch": 210} {"train_loss": -5.04830265045166, "global_step": 8860, "epoch": 210} {"train_loss": -4.9598381746382945, "global_step": 8861, "epoch": 210, "val_loss": 81379.7421875} {"train_loss": -5.047853469848633, "global_step": 8862, "epoch": 211} {"train_loss": -5.008581638336182, "global_step": 8863, "epoch": 211} {"train_loss": -5.03718376159668, "global_step": 8864, "epoch": 211} {"train_loss": -4.9967498779296875, "global_step": 8865, "epoch": 211} {"train_loss": -5.045368671417236, "global_step": 8866, "epoch": 211} {"train_loss": -5.004598617553711, "global_step": 8867, "epoch": 211} {"train_loss": -4.936762809753418, "global_step": 8868, "epoch": 211} {"train_loss": -4.828045845031738, "global_step": 8869, "epoch": 211} {"train_loss": -5.023439407348633, "global_step": 8870, "epoch": 211} {"train_loss": -4.94293212890625, "global_step": 8871, "epoch": 211} {"train_loss": -5.020437717437744, "global_step": 8872, "epoch": 211} {"train_loss": -4.987635135650635, "global_step": 8873, "epoch": 211} {"train_loss": -5.084725379943848, "global_step": 8874, "epoch": 211} {"train_loss": -4.868710517883301, "global_step": 8875, "epoch": 211} {"train_loss": -4.847424507141113, "global_step": 8876, "epoch": 211} {"train_loss": -5.082415580749512, "global_step": 8877, "epoch": 211} {"train_loss": -4.949963569641113, "global_step": 8878, "epoch": 211} {"train_loss": -4.917139053344727, "global_step": 8879, "epoch": 211} {"train_loss": -5.055389881134033, "global_step": 8880, "epoch": 211} {"train_loss": -4.873085021972656, "global_step": 8881, "epoch": 211} {"train_loss": -4.928795337677002, "global_step": 8882, "epoch": 211} {"train_loss": -5.062575817108154, "global_step": 8883, "epoch": 211} {"train_loss": -4.881803035736084, "global_step": 8884, "epoch": 211} {"train_loss": -4.915937423706055, "global_step": 8885, "epoch": 211} {"train_loss": -4.908845901489258, "global_step": 8886, "epoch": 211} {"train_loss": -4.967370986938477, "global_step": 8887, "epoch": 211} {"train_loss": -5.107359886169434, "global_step": 8888, "epoch": 211} {"train_loss": -4.951807022094727, "global_step": 8889, "epoch": 211} {"train_loss": -4.861997127532959, "global_step": 8890, "epoch": 211} {"train_loss": -5.0320281982421875, "global_step": 8891, "epoch": 211} {"train_loss": -5.068599700927734, "global_step": 8892, "epoch": 211} {"train_loss": -4.803709030151367, "global_step": 8893, "epoch": 211} {"train_loss": -4.970515251159668, "global_step": 8894, "epoch": 211} {"train_loss": -4.937358856201172, "global_step": 8895, "epoch": 211} {"train_loss": -4.933724880218506, "global_step": 8896, "epoch": 211} {"train_loss": -4.865621566772461, "global_step": 8897, "epoch": 211} {"train_loss": -4.978017807006836, "global_step": 8898, "epoch": 211} {"train_loss": -4.865530967712402, "global_step": 8899, "epoch": 211} {"train_loss": -4.888500213623047, "global_step": 8900, "epoch": 211} {"train_loss": -5.055408477783203, "global_step": 8901, "epoch": 211} {"train_loss": -4.862914085388184, "global_step": 8902, "epoch": 211} {"train_loss": -4.960630087625413, "global_step": 8903, "epoch": 211, "val_loss": 81281.0546875} {"train_loss": -4.956195831298828, "global_step": 8904, "epoch": 212} {"train_loss": -4.934296607971191, "global_step": 8905, "epoch": 212} {"train_loss": -4.942047595977783, "global_step": 8906, "epoch": 212} {"train_loss": -5.069918155670166, "global_step": 8907, "epoch": 212} {"train_loss": -5.072544097900391, "global_step": 8908, "epoch": 212} {"train_loss": -5.109097957611084, "global_step": 8909, "epoch": 212} {"train_loss": -4.985171318054199, "global_step": 8910, "epoch": 212} {"train_loss": -5.049727916717529, "global_step": 8911, "epoch": 212} {"train_loss": -5.0808868408203125, "global_step": 8912, "epoch": 212} {"train_loss": -5.016221046447754, "global_step": 8913, "epoch": 212} {"train_loss": -4.898406982421875, "global_step": 8914, "epoch": 212} {"train_loss": -4.995352745056152, "global_step": 8915, "epoch": 212} {"train_loss": -5.005380630493164, "global_step": 8916, "epoch": 212} {"train_loss": -4.967889785766602, "global_step": 8917, "epoch": 212} {"train_loss": -4.922499656677246, "global_step": 8918, "epoch": 212} {"train_loss": -5.202953815460205, "global_step": 8919, "epoch": 212} {"train_loss": -4.896750450134277, "global_step": 8920, "epoch": 212} {"train_loss": -4.844574928283691, "global_step": 8921, "epoch": 212} {"train_loss": -4.874480724334717, "global_step": 8922, "epoch": 212} {"train_loss": -4.799445629119873, "global_step": 8923, "epoch": 212} {"train_loss": -5.026402473449707, "global_step": 8924, "epoch": 212} {"train_loss": -5.0302276611328125, "global_step": 8925, "epoch": 212} {"train_loss": -4.859919548034668, "global_step": 8926, "epoch": 212} {"train_loss": -5.022194862365723, "global_step": 8927, "epoch": 212} {"train_loss": -4.798174858093262, "global_step": 8928, "epoch": 212} {"train_loss": -4.896538734436035, "global_step": 8929, "epoch": 212} {"train_loss": -5.080676555633545, "global_step": 8930, "epoch": 212} {"train_loss": -4.874349117279053, "global_step": 8931, "epoch": 212} {"train_loss": -4.980500221252441, "global_step": 8932, "epoch": 212} {"train_loss": -4.846198558807373, "global_step": 8933, "epoch": 212} {"train_loss": -4.903891086578369, "global_step": 8934, "epoch": 212} {"train_loss": -4.880502700805664, "global_step": 8935, "epoch": 212} {"train_loss": -4.915379524230957, "global_step": 8936, "epoch": 212} {"train_loss": -4.857773780822754, "global_step": 8937, "epoch": 212} {"train_loss": -4.906735897064209, "global_step": 8938, "epoch": 212} {"train_loss": -4.930685043334961, "global_step": 8939, "epoch": 212} {"train_loss": -4.984830379486084, "global_step": 8940, "epoch": 212} {"train_loss": -5.099610805511475, "global_step": 8941, "epoch": 212} {"train_loss": -4.904212474822998, "global_step": 8942, "epoch": 212} {"train_loss": -4.957056999206543, "global_step": 8943, "epoch": 212} {"train_loss": -4.975332260131836, "global_step": 8944, "epoch": 212} {"train_loss": -4.957496824718657, "global_step": 8945, "epoch": 212, "val_loss": 81397.7265625} {"train_loss": -4.929845333099365, "global_step": 8946, "epoch": 213} {"train_loss": -4.876590728759766, "global_step": 8947, "epoch": 213} {"train_loss": -5.135186195373535, "global_step": 8948, "epoch": 213} {"train_loss": -4.8356451988220215, "global_step": 8949, "epoch": 213} {"train_loss": -4.915791988372803, "global_step": 8950, "epoch": 213} {"train_loss": -4.932474136352539, "global_step": 8951, "epoch": 213} {"train_loss": -4.947181701660156, "global_step": 8952, "epoch": 213} {"train_loss": -5.030719757080078, "global_step": 8953, "epoch": 213} {"train_loss": -4.846330642700195, "global_step": 8954, "epoch": 213} {"train_loss": -5.062160015106201, "global_step": 8955, "epoch": 213} {"train_loss": -5.008035182952881, "global_step": 8956, "epoch": 213} {"train_loss": -4.8599748611450195, "global_step": 8957, "epoch": 213} {"train_loss": -4.946352958679199, "global_step": 8958, "epoch": 213} {"train_loss": -4.936527729034424, "global_step": 8959, "epoch": 213} {"train_loss": -5.028062343597412, "global_step": 8960, "epoch": 213} {"train_loss": -4.892524719238281, "global_step": 8961, "epoch": 213} {"train_loss": -4.8196868896484375, "global_step": 8962, "epoch": 213} {"train_loss": -4.990891456604004, "global_step": 8963, "epoch": 213} {"train_loss": -4.843791961669922, "global_step": 8964, "epoch": 213} {"train_loss": -4.870122909545898, "global_step": 8965, "epoch": 213} {"train_loss": -4.8239827156066895, "global_step": 8966, "epoch": 213} {"train_loss": -4.888397216796875, "global_step": 8967, "epoch": 213} {"train_loss": -4.972149848937988, "global_step": 8968, "epoch": 213} {"train_loss": -5.134400367736816, "global_step": 8969, "epoch": 213} {"train_loss": -5.06453275680542, "global_step": 8970, "epoch": 213} {"train_loss": -4.889570236206055, "global_step": 8971, "epoch": 213} {"train_loss": -4.912148475646973, "global_step": 8972, "epoch": 213} {"train_loss": -5.112400054931641, "global_step": 8973, "epoch": 213} {"train_loss": -4.762635231018066, "global_step": 8974, "epoch": 213} {"train_loss": -4.950486183166504, "global_step": 8975, "epoch": 213} {"train_loss": -5.054717540740967, "global_step": 8976, "epoch": 213} {"train_loss": -5.082172393798828, "global_step": 8977, "epoch": 213} {"train_loss": -5.040576934814453, "global_step": 8978, "epoch": 213} {"train_loss": -4.943634986877441, "global_step": 8979, "epoch": 213} {"train_loss": -5.165742874145508, "global_step": 8980, "epoch": 213} {"train_loss": -5.003596305847168, "global_step": 8981, "epoch": 213} {"train_loss": -4.943002700805664, "global_step": 8982, "epoch": 213} {"train_loss": -5.125870704650879, "global_step": 8983, "epoch": 213} {"train_loss": -5.066625118255615, "global_step": 8984, "epoch": 213} {"train_loss": -5.124619483947754, "global_step": 8985, "epoch": 213} {"train_loss": -4.999242305755615, "global_step": 8986, "epoch": 213} {"train_loss": -4.9743271214621405, "global_step": 8987, "epoch": 213, "val_loss": 81567.3046875} {"train_loss": -4.930324077606201, "global_step": 8988, "epoch": 214} {"train_loss": -4.95062255859375, "global_step": 8989, "epoch": 214} {"train_loss": -5.050106048583984, "global_step": 8990, "epoch": 214} {"train_loss": -4.975456714630127, "global_step": 8991, "epoch": 214} {"train_loss": -5.134329795837402, "global_step": 8992, "epoch": 214} {"train_loss": -4.942910194396973, "global_step": 8993, "epoch": 214} {"train_loss": -5.210387229919434, "global_step": 8994, "epoch": 214} {"train_loss": -5.067561149597168, "global_step": 8995, "epoch": 214} {"train_loss": -5.083542346954346, "global_step": 8996, "epoch": 214} {"train_loss": -4.935568809509277, "global_step": 8997, "epoch": 214} {"train_loss": -4.714097499847412, "global_step": 8998, "epoch": 214} {"train_loss": -5.0183000564575195, "global_step": 8999, "epoch": 214} {"train_loss": -4.804203033447266, "global_step": 9000, "epoch": 214} {"train_loss": -4.611501216888428, "global_step": 9001, "epoch": 214} {"train_loss": -4.861115455627441, "global_step": 9002, "epoch": 214} {"train_loss": -5.001639366149902, "global_step": 9003, "epoch": 214} {"train_loss": -4.827089786529541, "global_step": 9004, "epoch": 214} {"train_loss": -5.006519317626953, "global_step": 9005, "epoch": 214} {"train_loss": -4.884733200073242, "global_step": 9006, "epoch": 214} {"train_loss": -4.887528896331787, "global_step": 9007, "epoch": 214} {"train_loss": -5.0363006591796875, "global_step": 9008, "epoch": 214} {"train_loss": -4.881511211395264, "global_step": 9009, "epoch": 214} {"train_loss": -4.9575018882751465, "global_step": 9010, "epoch": 214} {"train_loss": -4.901949882507324, "global_step": 9011, "epoch": 214} {"train_loss": -4.786072254180908, "global_step": 9012, "epoch": 214} {"train_loss": -4.969613552093506, "global_step": 9013, "epoch": 214} {"train_loss": -4.767237663269043, "global_step": 9014, "epoch": 214} {"train_loss": -4.760973930358887, "global_step": 9015, "epoch": 214} {"train_loss": -4.609236717224121, "global_step": 9016, "epoch": 214} {"train_loss": -4.597312927246094, "global_step": 9017, "epoch": 214} {"train_loss": -4.712892055511475, "global_step": 9018, "epoch": 214} {"train_loss": -4.616682052612305, "global_step": 9019, "epoch": 214} {"train_loss": -4.667453765869141, "global_step": 9020, "epoch": 214} {"train_loss": -4.805639266967773, "global_step": 9021, "epoch": 214} {"train_loss": -4.742047309875488, "global_step": 9022, "epoch": 214} {"train_loss": -4.811568260192871, "global_step": 9023, "epoch": 214} {"train_loss": -4.787220001220703, "global_step": 9024, "epoch": 214} {"train_loss": -4.634763240814209, "global_step": 9025, "epoch": 214} {"train_loss": -4.828506946563721, "global_step": 9026, "epoch": 214} {"train_loss": -4.670570373535156, "global_step": 9027, "epoch": 214} {"train_loss": -4.7432098388671875, "global_step": 9028, "epoch": 214} {"train_loss": -4.856836602801368, "global_step": 9029, "epoch": 214, "val_loss": 82310.265625} {"train_loss": -4.825023174285889, "global_step": 9030, "epoch": 215} {"train_loss": -4.808257579803467, "global_step": 9031, "epoch": 215} {"train_loss": -4.978475570678711, "global_step": 9032, "epoch": 215} {"train_loss": -4.919327259063721, "global_step": 9033, "epoch": 215} {"train_loss": -4.963631629943848, "global_step": 9034, "epoch": 215} {"train_loss": -4.945121765136719, "global_step": 9035, "epoch": 215} {"train_loss": -4.992281913757324, "global_step": 9036, "epoch": 215} {"train_loss": -5.08199405670166, "global_step": 9037, "epoch": 215} {"train_loss": -4.912657737731934, "global_step": 9038, "epoch": 215} {"train_loss": -4.892752647399902, "global_step": 9039, "epoch": 215} {"train_loss": -4.888511657714844, "global_step": 9040, "epoch": 215} {"train_loss": -4.984099864959717, "global_step": 9041, "epoch": 215} {"train_loss": -5.025816917419434, "global_step": 9042, "epoch": 215} {"train_loss": -4.9923176765441895, "global_step": 9043, "epoch": 215} {"train_loss": -5.160799503326416, "global_step": 9044, "epoch": 215} {"train_loss": -4.929010391235352, "global_step": 9045, "epoch": 215} {"train_loss": -4.886711597442627, "global_step": 9046, "epoch": 215} {"train_loss": -4.87613582611084, "global_step": 9047, "epoch": 215} {"train_loss": -5.005346298217773, "global_step": 9048, "epoch": 215} {"train_loss": -5.015997886657715, "global_step": 9049, "epoch": 215} {"train_loss": -4.954914093017578, "global_step": 9050, "epoch": 215} {"train_loss": -5.067993640899658, "global_step": 9051, "epoch": 215} {"train_loss": -4.849401950836182, "global_step": 9052, "epoch": 215} {"train_loss": -4.863395690917969, "global_step": 9053, "epoch": 215} {"train_loss": -5.089537620544434, "global_step": 9054, "epoch": 215} {"train_loss": -4.873088359832764, "global_step": 9055, "epoch": 215} {"train_loss": -4.973274230957031, "global_step": 9056, "epoch": 215} {"train_loss": -5.018719673156738, "global_step": 9057, "epoch": 215} {"train_loss": -5.047353744506836, "global_step": 9058, "epoch": 215} {"train_loss": -4.879631519317627, "global_step": 9059, "epoch": 215} {"train_loss": -4.974301815032959, "global_step": 9060, "epoch": 215} {"train_loss": -5.015771865844727, "global_step": 9061, "epoch": 215} {"train_loss": -5.037700176239014, "global_step": 9062, "epoch": 215} {"train_loss": -5.031167984008789, "global_step": 9063, "epoch": 215} {"train_loss": -5.028023719787598, "global_step": 9064, "epoch": 215} {"train_loss": -5.058891296386719, "global_step": 9065, "epoch": 215} {"train_loss": -5.111247539520264, "global_step": 9066, "epoch": 215} {"train_loss": -5.031815052032471, "global_step": 9067, "epoch": 215} {"train_loss": -4.912358283996582, "global_step": 9068, "epoch": 215} {"train_loss": -5.097527980804443, "global_step": 9069, "epoch": 215} {"train_loss": -5.008455753326416, "global_step": 9070, "epoch": 215} {"train_loss": -4.977579593658447, "global_step": 9071, "epoch": 215, "val_loss": 81734.03125} {"train_loss": -4.809553623199463, "global_step": 9072, "epoch": 216} {"train_loss": -4.985601425170898, "global_step": 9073, "epoch": 216} {"train_loss": -5.032279014587402, "global_step": 9074, "epoch": 216} {"train_loss": -5.166611194610596, "global_step": 9075, "epoch": 216} {"train_loss": -4.941317081451416, "global_step": 9076, "epoch": 216} {"train_loss": -5.026986122131348, "global_step": 9077, "epoch": 216} {"train_loss": -4.950794696807861, "global_step": 9078, "epoch": 216} {"train_loss": -5.13450813293457, "global_step": 9079, "epoch": 216} {"train_loss": -4.958497524261475, "global_step": 9080, "epoch": 216} {"train_loss": -4.8325276374816895, "global_step": 9081, "epoch": 216} {"train_loss": -4.978788375854492, "global_step": 9082, "epoch": 216} {"train_loss": -4.999042510986328, "global_step": 9083, "epoch": 216} {"train_loss": -4.802206039428711, "global_step": 9084, "epoch": 216} {"train_loss": -4.783777236938477, "global_step": 9085, "epoch": 216} {"train_loss": -4.944158554077148, "global_step": 9086, "epoch": 216} {"train_loss": -4.887390613555908, "global_step": 9087, "epoch": 216} {"train_loss": -4.927437782287598, "global_step": 9088, "epoch": 216} {"train_loss": -5.037219524383545, "global_step": 9089, "epoch": 216} {"train_loss": -4.845007419586182, "global_step": 9090, "epoch": 216} {"train_loss": -4.961130142211914, "global_step": 9091, "epoch": 216} {"train_loss": -4.855834007263184, "global_step": 9092, "epoch": 216} {"train_loss": -4.982670783996582, "global_step": 9093, "epoch": 216} {"train_loss": -4.924755573272705, "global_step": 9094, "epoch": 216} {"train_loss": -5.066221714019775, "global_step": 9095, "epoch": 216} {"train_loss": -5.0605082511901855, "global_step": 9096, "epoch": 216} {"train_loss": -4.888654708862305, "global_step": 9097, "epoch": 216} {"train_loss": -4.961181640625, "global_step": 9098, "epoch": 216} {"train_loss": -4.824968338012695, "global_step": 9099, "epoch": 216} {"train_loss": -4.896467685699463, "global_step": 9100, "epoch": 216} {"train_loss": -4.905558109283447, "global_step": 9101, "epoch": 216} {"train_loss": -4.8510236740112305, "global_step": 9102, "epoch": 216} {"train_loss": -4.860903263092041, "global_step": 9103, "epoch": 216} {"train_loss": -4.9571428298950195, "global_step": 9104, "epoch": 216} {"train_loss": -5.1538262367248535, "global_step": 9105, "epoch": 216} {"train_loss": -4.850534439086914, "global_step": 9106, "epoch": 216} {"train_loss": -4.930323600769043, "global_step": 9107, "epoch": 216} {"train_loss": -5.027463912963867, "global_step": 9108, "epoch": 216} {"train_loss": -4.993361949920654, "global_step": 9109, "epoch": 216} {"train_loss": -4.960990905761719, "global_step": 9110, "epoch": 216} {"train_loss": -4.927438735961914, "global_step": 9111, "epoch": 216} {"train_loss": -5.135514259338379, "global_step": 9112, "epoch": 216} {"train_loss": -4.949136086872646, "global_step": 9113, "epoch": 216, "val_loss": 83233.625} {"train_loss": -4.827303409576416, "global_step": 9114, "epoch": 217} {"train_loss": -4.9674835205078125, "global_step": 9115, "epoch": 217} {"train_loss": -4.8279619216918945, "global_step": 9116, "epoch": 217} {"train_loss": -4.946925163269043, "global_step": 9117, "epoch": 217} {"train_loss": -4.959263801574707, "global_step": 9118, "epoch": 217} {"train_loss": -4.730800151824951, "global_step": 9119, "epoch": 217} {"train_loss": -4.913811683654785, "global_step": 9120, "epoch": 217} {"train_loss": -4.937556743621826, "global_step": 9121, "epoch": 217} {"train_loss": -4.889493465423584, "global_step": 9122, "epoch": 217} {"train_loss": -4.95810604095459, "global_step": 9123, "epoch": 217} {"train_loss": -4.985789775848389, "global_step": 9124, "epoch": 217} {"train_loss": -4.992944717407227, "global_step": 9125, "epoch": 217} {"train_loss": -4.967233657836914, "global_step": 9126, "epoch": 217} {"train_loss": -4.937083721160889, "global_step": 9127, "epoch": 217} {"train_loss": -4.853420257568359, "global_step": 9128, "epoch": 217} {"train_loss": -4.911332607269287, "global_step": 9129, "epoch": 217} {"train_loss": -5.0002055168151855, "global_step": 9130, "epoch": 217} {"train_loss": -4.985445022583008, "global_step": 9131, "epoch": 217} {"train_loss": -5.057583332061768, "global_step": 9132, "epoch": 217} {"train_loss": -5.0354719161987305, "global_step": 9133, "epoch": 217} {"train_loss": -4.993666648864746, "global_step": 9134, "epoch": 217} {"train_loss": -5.048583984375, "global_step": 9135, "epoch": 217} {"train_loss": -5.0197248458862305, "global_step": 9136, "epoch": 217} {"train_loss": -4.803386688232422, "global_step": 9137, "epoch": 217} {"train_loss": -4.914546012878418, "global_step": 9138, "epoch": 217} {"train_loss": -4.84588623046875, "global_step": 9139, "epoch": 217} {"train_loss": -4.751045227050781, "global_step": 9140, "epoch": 217} {"train_loss": -5.08863639831543, "global_step": 9141, "epoch": 217} {"train_loss": -4.898366928100586, "global_step": 9142, "epoch": 217} {"train_loss": -4.890618324279785, "global_step": 9143, "epoch": 217} {"train_loss": -4.913187026977539, "global_step": 9144, "epoch": 217} {"train_loss": -5.022058486938477, "global_step": 9145, "epoch": 217} {"train_loss": -4.927575588226318, "global_step": 9146, "epoch": 217} {"train_loss": -4.9339599609375, "global_step": 9147, "epoch": 217} {"train_loss": -5.012741565704346, "global_step": 9148, "epoch": 217} {"train_loss": -4.918830871582031, "global_step": 9149, "epoch": 217} {"train_loss": -4.937605381011963, "global_step": 9150, "epoch": 217} {"train_loss": -5.0469512939453125, "global_step": 9151, "epoch": 217} {"train_loss": -4.918618202209473, "global_step": 9152, "epoch": 217} {"train_loss": -5.033239364624023, "global_step": 9153, "epoch": 217} {"train_loss": -4.805181980133057, "global_step": 9154, "epoch": 217} {"train_loss": -4.938191357113066, "global_step": 9155, "epoch": 217, "val_loss": 81955.734375} {"train_loss": -5.086334228515625, "global_step": 9156, "epoch": 218} {"train_loss": -4.766251564025879, "global_step": 9157, "epoch": 218} {"train_loss": -5.077834129333496, "global_step": 9158, "epoch": 218} {"train_loss": -4.860494613647461, "global_step": 9159, "epoch": 218} {"train_loss": -4.9121904373168945, "global_step": 9160, "epoch": 218} {"train_loss": -5.143404960632324, "global_step": 9161, "epoch": 218} {"train_loss": -4.962672233581543, "global_step": 9162, "epoch": 218} {"train_loss": -5.018689155578613, "global_step": 9163, "epoch": 218} {"train_loss": -5.046703338623047, "global_step": 9164, "epoch": 218} {"train_loss": -4.838066101074219, "global_step": 9165, "epoch": 218} {"train_loss": -5.110678672790527, "global_step": 9166, "epoch": 218} {"train_loss": -4.946863651275635, "global_step": 9167, "epoch": 218} {"train_loss": -4.9348955154418945, "global_step": 9168, "epoch": 218} {"train_loss": -5.092801570892334, "global_step": 9169, "epoch": 218} {"train_loss": -4.985860824584961, "global_step": 9170, "epoch": 218} {"train_loss": -4.933066368103027, "global_step": 9171, "epoch": 218} {"train_loss": -4.9601969718933105, "global_step": 9172, "epoch": 218} {"train_loss": -4.986017227172852, "global_step": 9173, "epoch": 218} {"train_loss": -4.919435501098633, "global_step": 9174, "epoch": 218} {"train_loss": -5.039590835571289, "global_step": 9175, "epoch": 218} {"train_loss": -5.024587631225586, "global_step": 9176, "epoch": 218} {"train_loss": -5.0814032554626465, "global_step": 9177, "epoch": 218} {"train_loss": -5.065299034118652, "global_step": 9178, "epoch": 218} {"train_loss": -5.059569358825684, "global_step": 9179, "epoch": 218} {"train_loss": -5.052520275115967, "global_step": 9180, "epoch": 218} {"train_loss": -4.939450740814209, "global_step": 9181, "epoch": 218} {"train_loss": -5.177801132202148, "global_step": 9182, "epoch": 218} {"train_loss": -4.893918991088867, "global_step": 9183, "epoch": 218} {"train_loss": -5.019700050354004, "global_step": 9184, "epoch": 218} {"train_loss": -5.1069769859313965, "global_step": 9185, "epoch": 218} {"train_loss": -4.971750736236572, "global_step": 9186, "epoch": 218} {"train_loss": -5.087657928466797, "global_step": 9187, "epoch": 218} {"train_loss": -5.112084865570068, "global_step": 9188, "epoch": 218} {"train_loss": -5.06907844543457, "global_step": 9189, "epoch": 218} {"train_loss": -5.081245422363281, "global_step": 9190, "epoch": 218} {"train_loss": -5.011580944061279, "global_step": 9191, "epoch": 218} {"train_loss": -4.91231107711792, "global_step": 9192, "epoch": 218} {"train_loss": -4.896528244018555, "global_step": 9193, "epoch": 218} {"train_loss": -4.985125541687012, "global_step": 9194, "epoch": 218} {"train_loss": -4.996579647064209, "global_step": 9195, "epoch": 218} {"train_loss": -5.080631256103516, "global_step": 9196, "epoch": 218} {"train_loss": -5.005431901840937, "global_step": 9197, "epoch": 218, "val_loss": 80684.4140625} {"train_loss": -5.043254852294922, "global_step": 9198, "epoch": 219} {"train_loss": -4.889555931091309, "global_step": 9199, "epoch": 219} {"train_loss": -4.905248641967773, "global_step": 9200, "epoch": 219} {"train_loss": -5.047000885009766, "global_step": 9201, "epoch": 219} {"train_loss": -5.015260696411133, "global_step": 9202, "epoch": 219} {"train_loss": -4.983558654785156, "global_step": 9203, "epoch": 219} {"train_loss": -4.920181751251221, "global_step": 9204, "epoch": 219} {"train_loss": -5.020831108093262, "global_step": 9205, "epoch": 219} {"train_loss": -4.918174743652344, "global_step": 9206, "epoch": 219} {"train_loss": -5.098764419555664, "global_step": 9207, "epoch": 219} {"train_loss": -4.877117156982422, "global_step": 9208, "epoch": 219} {"train_loss": -4.954005241394043, "global_step": 9209, "epoch": 219} {"train_loss": -4.917940616607666, "global_step": 9210, "epoch": 219} {"train_loss": -4.965907096862793, "global_step": 9211, "epoch": 219} {"train_loss": -5.072051048278809, "global_step": 9212, "epoch": 219} {"train_loss": -5.098257064819336, "global_step": 9213, "epoch": 219} {"train_loss": -5.116340160369873, "global_step": 9214, "epoch": 219} {"train_loss": -4.991697788238525, "global_step": 9215, "epoch": 219} {"train_loss": -5.043308258056641, "global_step": 9216, "epoch": 219} {"train_loss": -5.138537406921387, "global_step": 9217, "epoch": 219} {"train_loss": -4.968845367431641, "global_step": 9218, "epoch": 219} {"train_loss": -5.037996292114258, "global_step": 9219, "epoch": 219} {"train_loss": -5.029141426086426, "global_step": 9220, "epoch": 219} {"train_loss": -4.845406532287598, "global_step": 9221, "epoch": 219} {"train_loss": -4.9253339767456055, "global_step": 9222, "epoch": 219} {"train_loss": -5.090500831604004, "global_step": 9223, "epoch": 219} {"train_loss": -4.9187421798706055, "global_step": 9224, "epoch": 219} {"train_loss": -4.914616584777832, "global_step": 9225, "epoch": 219} {"train_loss": -5.062965393066406, "global_step": 9226, "epoch": 219} {"train_loss": -5.095832824707031, "global_step": 9227, "epoch": 219} {"train_loss": -4.910815238952637, "global_step": 9228, "epoch": 219} {"train_loss": -5.00572395324707, "global_step": 9229, "epoch": 219} {"train_loss": -5.028545379638672, "global_step": 9230, "epoch": 219} {"train_loss": -4.932028770446777, "global_step": 9231, "epoch": 219} {"train_loss": -4.928003787994385, "global_step": 9232, "epoch": 219} {"train_loss": -5.133326530456543, "global_step": 9233, "epoch": 219} {"train_loss": -5.086733818054199, "global_step": 9234, "epoch": 219} {"train_loss": -4.961086273193359, "global_step": 9235, "epoch": 219} {"train_loss": -4.992664337158203, "global_step": 9236, "epoch": 219} {"train_loss": -4.9137091636657715, "global_step": 9237, "epoch": 219} {"train_loss": -5.0403151512146, "global_step": 9238, "epoch": 219} {"train_loss": -4.997769333067394, "global_step": 9239, "epoch": 219, "val_loss": 81168.2421875} {"train_loss": -4.919752597808838, "global_step": 9240, "epoch": 220} {"train_loss": -5.131164073944092, "global_step": 9241, "epoch": 220} {"train_loss": -5.266193389892578, "global_step": 9242, "epoch": 220} {"train_loss": -4.864692687988281, "global_step": 9243, "epoch": 220} {"train_loss": -5.058679103851318, "global_step": 9244, "epoch": 220} {"train_loss": -4.934921741485596, "global_step": 9245, "epoch": 220} {"train_loss": -4.987926006317139, "global_step": 9246, "epoch": 220} {"train_loss": -5.017180442810059, "global_step": 9247, "epoch": 220} {"train_loss": -5.086601734161377, "global_step": 9248, "epoch": 220} {"train_loss": -5.008449554443359, "global_step": 9249, "epoch": 220} {"train_loss": -4.988288879394531, "global_step": 9250, "epoch": 220} {"train_loss": -4.974258899688721, "global_step": 9251, "epoch": 220} {"train_loss": -5.000157833099365, "global_step": 9252, "epoch": 220} {"train_loss": -4.929640293121338, "global_step": 9253, "epoch": 220} {"train_loss": -4.928648471832275, "global_step": 9254, "epoch": 220} {"train_loss": -4.759866237640381, "global_step": 9255, "epoch": 220} {"train_loss": -4.9398651123046875, "global_step": 9256, "epoch": 220} {"train_loss": -4.9547529220581055, "global_step": 9257, "epoch": 220} {"train_loss": -4.986697196960449, "global_step": 9258, "epoch": 220} {"train_loss": -4.977787971496582, "global_step": 9259, "epoch": 220} {"train_loss": -5.037943363189697, "global_step": 9260, "epoch": 220} {"train_loss": -4.922672271728516, "global_step": 9261, "epoch": 220} {"train_loss": -5.001532077789307, "global_step": 9262, "epoch": 220} {"train_loss": -4.917311668395996, "global_step": 9263, "epoch": 220} {"train_loss": -4.94293737411499, "global_step": 9264, "epoch": 220} {"train_loss": -5.080039978027344, "global_step": 9265, "epoch": 220} {"train_loss": -5.062041282653809, "global_step": 9266, "epoch": 220} {"train_loss": -5.065791130065918, "global_step": 9267, "epoch": 220} {"train_loss": -4.915445327758789, "global_step": 9268, "epoch": 220} {"train_loss": -4.998905658721924, "global_step": 9269, "epoch": 220} {"train_loss": -4.886703968048096, "global_step": 9270, "epoch": 220} {"train_loss": -4.914078712463379, "global_step": 9271, "epoch": 220} {"train_loss": -5.05534553527832, "global_step": 9272, "epoch": 220} {"train_loss": -5.17955207824707, "global_step": 9273, "epoch": 220} {"train_loss": -5.051258087158203, "global_step": 9274, "epoch": 220} {"train_loss": -5.055819988250732, "global_step": 9275, "epoch": 220} {"train_loss": -4.961926460266113, "global_step": 9276, "epoch": 220} {"train_loss": -4.946789741516113, "global_step": 9277, "epoch": 220} {"train_loss": -4.999615669250488, "global_step": 9278, "epoch": 220} {"train_loss": -4.879485130310059, "global_step": 9279, "epoch": 220} {"train_loss": -4.9587016105651855, "global_step": 9280, "epoch": 220} {"train_loss": -4.99100044795445, "global_step": 9281, "epoch": 220, "val_loss": 81776.109375} {"train_loss": -4.819169044494629, "global_step": 9282, "epoch": 221} {"train_loss": -5.06397819519043, "global_step": 9283, "epoch": 221} {"train_loss": -4.949202537536621, "global_step": 9284, "epoch": 221} {"train_loss": -5.009737014770508, "global_step": 9285, "epoch": 221} {"train_loss": -5.047459602355957, "global_step": 9286, "epoch": 221} {"train_loss": -5.062765121459961, "global_step": 9287, "epoch": 221} {"train_loss": -5.0275068283081055, "global_step": 9288, "epoch": 221} {"train_loss": -4.999555587768555, "global_step": 9289, "epoch": 221} {"train_loss": -5.012324810028076, "global_step": 9290, "epoch": 221} {"train_loss": -4.919094562530518, "global_step": 9291, "epoch": 221} {"train_loss": -4.966974258422852, "global_step": 9292, "epoch": 221} {"train_loss": -4.904251575469971, "global_step": 9293, "epoch": 221} {"train_loss": -5.068397045135498, "global_step": 9294, "epoch": 221} {"train_loss": -4.9963531494140625, "global_step": 9295, "epoch": 221} {"train_loss": -4.941084861755371, "global_step": 9296, "epoch": 221} {"train_loss": -4.9833173751831055, "global_step": 9297, "epoch": 221} {"train_loss": -5.112387657165527, "global_step": 9298, "epoch": 221} {"train_loss": -4.928417205810547, "global_step": 9299, "epoch": 221} {"train_loss": -5.0642595291137695, "global_step": 9300, "epoch": 221} {"train_loss": -4.93133544921875, "global_step": 9301, "epoch": 221} {"train_loss": -5.040561676025391, "global_step": 9302, "epoch": 221} {"train_loss": -5.009145736694336, "global_step": 9303, "epoch": 221} {"train_loss": -5.021399021148682, "global_step": 9304, "epoch": 221} {"train_loss": -5.082195281982422, "global_step": 9305, "epoch": 221} {"train_loss": -5.057730197906494, "global_step": 9306, "epoch": 221} {"train_loss": -5.01643180847168, "global_step": 9307, "epoch": 221} {"train_loss": -4.97141170501709, "global_step": 9308, "epoch": 221} {"train_loss": -5.010982036590576, "global_step": 9309, "epoch": 221} {"train_loss": -4.985446929931641, "global_step": 9310, "epoch": 221} {"train_loss": -5.029819488525391, "global_step": 9311, "epoch": 221} {"train_loss": -4.9919233322143555, "global_step": 9312, "epoch": 221} {"train_loss": -5.055023193359375, "global_step": 9313, "epoch": 221} {"train_loss": -4.918274879455566, "global_step": 9314, "epoch": 221} {"train_loss": -4.9190216064453125, "global_step": 9315, "epoch": 221} {"train_loss": -4.9902663230896, "global_step": 9316, "epoch": 221} {"train_loss": -5.020522117614746, "global_step": 9317, "epoch": 221} {"train_loss": -4.944012641906738, "global_step": 9318, "epoch": 221} {"train_loss": -4.981198310852051, "global_step": 9319, "epoch": 221} {"train_loss": -4.989276885986328, "global_step": 9320, "epoch": 221} {"train_loss": -4.924469470977783, "global_step": 9321, "epoch": 221} {"train_loss": -4.897233963012695, "global_step": 9322, "epoch": 221} {"train_loss": -4.995360431217012, "global_step": 9323, "epoch": 221, "val_loss": 81035.6484375} {"train_loss": -5.013290882110596, "global_step": 9324, "epoch": 222} {"train_loss": -4.718166828155518, "global_step": 9325, "epoch": 222} {"train_loss": -5.047052383422852, "global_step": 9326, "epoch": 222} {"train_loss": -5.084473609924316, "global_step": 9327, "epoch": 222} {"train_loss": -4.821397304534912, "global_step": 9328, "epoch": 222} {"train_loss": -5.162010669708252, "global_step": 9329, "epoch": 222} {"train_loss": -5.085411548614502, "global_step": 9330, "epoch": 222} {"train_loss": -4.934234142303467, "global_step": 9331, "epoch": 222} {"train_loss": -4.935932636260986, "global_step": 9332, "epoch": 222} {"train_loss": -4.7491254806518555, "global_step": 9333, "epoch": 222} {"train_loss": -4.908005714416504, "global_step": 9334, "epoch": 222} {"train_loss": -4.927310943603516, "global_step": 9335, "epoch": 222} {"train_loss": -4.792159080505371, "global_step": 9336, "epoch": 222} {"train_loss": -4.97701358795166, "global_step": 9337, "epoch": 222} {"train_loss": -4.843291282653809, "global_step": 9338, "epoch": 222} {"train_loss": -4.883066177368164, "global_step": 9339, "epoch": 222} {"train_loss": -4.9406280517578125, "global_step": 9340, "epoch": 222} {"train_loss": -5.003183841705322, "global_step": 9341, "epoch": 222} {"train_loss": -4.940481662750244, "global_step": 9342, "epoch": 222} {"train_loss": -5.029386520385742, "global_step": 9343, "epoch": 222} {"train_loss": -5.0646772384643555, "global_step": 9344, "epoch": 222} {"train_loss": -4.886730194091797, "global_step": 9345, "epoch": 222} {"train_loss": -4.987752914428711, "global_step": 9346, "epoch": 222} {"train_loss": -4.9650678634643555, "global_step": 9347, "epoch": 222} {"train_loss": -4.9444966316223145, "global_step": 9348, "epoch": 222} {"train_loss": -5.057730674743652, "global_step": 9349, "epoch": 222} {"train_loss": -5.227145195007324, "global_step": 9350, "epoch": 222} {"train_loss": -5.11511754989624, "global_step": 9351, "epoch": 222} {"train_loss": -5.0603928565979, "global_step": 9352, "epoch": 222} {"train_loss": -4.989431858062744, "global_step": 9353, "epoch": 222} {"train_loss": -5.161989688873291, "global_step": 9354, "epoch": 222} {"train_loss": -4.895455837249756, "global_step": 9355, "epoch": 222} {"train_loss": -5.068074703216553, "global_step": 9356, "epoch": 222} {"train_loss": -5.1188459396362305, "global_step": 9357, "epoch": 222} {"train_loss": -5.004612922668457, "global_step": 9358, "epoch": 222} {"train_loss": -5.031864166259766, "global_step": 9359, "epoch": 222} {"train_loss": -5.11569881439209, "global_step": 9360, "epoch": 222} {"train_loss": -4.959677696228027, "global_step": 9361, "epoch": 222} {"train_loss": -4.913967132568359, "global_step": 9362, "epoch": 222} {"train_loss": -5.0042572021484375, "global_step": 9363, "epoch": 222} {"train_loss": -4.830898284912109, "global_step": 9364, "epoch": 222} {"train_loss": -4.976406415303548, "global_step": 9365, "epoch": 222, "val_loss": 82299.859375} {"train_loss": -5.110414505004883, "global_step": 9366, "epoch": 223} {"train_loss": -4.875830173492432, "global_step": 9367, "epoch": 223} {"train_loss": -4.8809099197387695, "global_step": 9368, "epoch": 223} {"train_loss": -4.951085090637207, "global_step": 9369, "epoch": 223} {"train_loss": -4.948019981384277, "global_step": 9370, "epoch": 223} {"train_loss": -5.017161846160889, "global_step": 9371, "epoch": 223} {"train_loss": -4.852701187133789, "global_step": 9372, "epoch": 223} {"train_loss": -4.881231784820557, "global_step": 9373, "epoch": 223} {"train_loss": -4.884013652801514, "global_step": 9374, "epoch": 223} {"train_loss": -5.061859130859375, "global_step": 9375, "epoch": 223} {"train_loss": -5.013665676116943, "global_step": 9376, "epoch": 223} {"train_loss": -4.997954368591309, "global_step": 9377, "epoch": 223} {"train_loss": -5.1037211418151855, "global_step": 9378, "epoch": 223} {"train_loss": -4.897544860839844, "global_step": 9379, "epoch": 223} {"train_loss": -4.9770636558532715, "global_step": 9380, "epoch": 223} {"train_loss": -5.220787525177002, "global_step": 9381, "epoch": 223} {"train_loss": -5.018204212188721, "global_step": 9382, "epoch": 223} {"train_loss": -4.902956008911133, "global_step": 9383, "epoch": 223} {"train_loss": -4.9334516525268555, "global_step": 9384, "epoch": 223} {"train_loss": -5.095218181610107, "global_step": 9385, "epoch": 223} {"train_loss": -4.917545318603516, "global_step": 9386, "epoch": 223} {"train_loss": -4.9294257164001465, "global_step": 9387, "epoch": 223} {"train_loss": -5.132441520690918, "global_step": 9388, "epoch": 223} {"train_loss": -4.981299877166748, "global_step": 9389, "epoch": 223} {"train_loss": -4.949916839599609, "global_step": 9390, "epoch": 223} {"train_loss": -4.852919101715088, "global_step": 9391, "epoch": 223} {"train_loss": -5.030368804931641, "global_step": 9392, "epoch": 223} {"train_loss": -5.021422386169434, "global_step": 9393, "epoch": 223} {"train_loss": -4.964022636413574, "global_step": 9394, "epoch": 223} {"train_loss": -5.059140682220459, "global_step": 9395, "epoch": 223} {"train_loss": -5.111659049987793, "global_step": 9396, "epoch": 223} {"train_loss": -5.089966297149658, "global_step": 9397, "epoch": 223} {"train_loss": -5.158493995666504, "global_step": 9398, "epoch": 223} {"train_loss": -5.116648197174072, "global_step": 9399, "epoch": 223} {"train_loss": -5.049443244934082, "global_step": 9400, "epoch": 223} {"train_loss": -5.174639701843262, "global_step": 9401, "epoch": 223} {"train_loss": -4.9885149002075195, "global_step": 9402, "epoch": 223} {"train_loss": -5.099844932556152, "global_step": 9403, "epoch": 223} {"train_loss": -5.028261184692383, "global_step": 9404, "epoch": 223} {"train_loss": -4.902068138122559, "global_step": 9405, "epoch": 223} {"train_loss": -5.0950822830200195, "global_step": 9406, "epoch": 223} {"train_loss": -5.0063337825593495, "global_step": 9407, "epoch": 223, "val_loss": 82708.6875} {"train_loss": -5.087690353393555, "global_step": 9408, "epoch": 224} {"train_loss": -5.0996551513671875, "global_step": 9409, "epoch": 224} {"train_loss": -5.09271240234375, "global_step": 9410, "epoch": 224} {"train_loss": -5.141008377075195, "global_step": 9411, "epoch": 224} {"train_loss": -5.047948837280273, "global_step": 9412, "epoch": 224} {"train_loss": -5.00158166885376, "global_step": 9413, "epoch": 224} {"train_loss": -4.930269718170166, "global_step": 9414, "epoch": 224} {"train_loss": -4.742836952209473, "global_step": 9415, "epoch": 224} {"train_loss": -4.967245578765869, "global_step": 9416, "epoch": 224} {"train_loss": -5.078582763671875, "global_step": 9417, "epoch": 224} {"train_loss": -4.967037200927734, "global_step": 9418, "epoch": 224} {"train_loss": -4.824957847595215, "global_step": 9419, "epoch": 224} {"train_loss": -4.860810279846191, "global_step": 9420, "epoch": 224} {"train_loss": -4.724020957946777, "global_step": 9421, "epoch": 224} {"train_loss": -4.841224193572998, "global_step": 9422, "epoch": 224} {"train_loss": -4.986847877502441, "global_step": 9423, "epoch": 224} {"train_loss": -5.062127113342285, "global_step": 9424, "epoch": 224} {"train_loss": -4.930220603942871, "global_step": 9425, "epoch": 224} {"train_loss": -4.882589817047119, "global_step": 9426, "epoch": 224} {"train_loss": -4.978113174438477, "global_step": 9427, "epoch": 224} {"train_loss": -4.915764331817627, "global_step": 9428, "epoch": 224} {"train_loss": -4.838381290435791, "global_step": 9429, "epoch": 224} {"train_loss": -5.051877975463867, "global_step": 9430, "epoch": 224} {"train_loss": -4.897520065307617, "global_step": 9431, "epoch": 224} {"train_loss": -4.742387771606445, "global_step": 9432, "epoch": 224} {"train_loss": -4.881443023681641, "global_step": 9433, "epoch": 224} {"train_loss": -4.991226673126221, "global_step": 9434, "epoch": 224} {"train_loss": -5.035565376281738, "global_step": 9435, "epoch": 224} {"train_loss": -4.989612102508545, "global_step": 9436, "epoch": 224} {"train_loss": -4.832206726074219, "global_step": 9437, "epoch": 224} {"train_loss": -4.950392723083496, "global_step": 9438, "epoch": 224} {"train_loss": -4.913483142852783, "global_step": 9439, "epoch": 224} {"train_loss": -4.970366477966309, "global_step": 9440, "epoch": 224} {"train_loss": -4.948951721191406, "global_step": 9441, "epoch": 224} {"train_loss": -4.959737777709961, "global_step": 9442, "epoch": 224} {"train_loss": -4.985426425933838, "global_step": 9443, "epoch": 224} {"train_loss": -5.07094669342041, "global_step": 9444, "epoch": 224} {"train_loss": -5.022162437438965, "global_step": 9445, "epoch": 224} {"train_loss": -4.993229866027832, "global_step": 9446, "epoch": 224} {"train_loss": -5.014554977416992, "global_step": 9447, "epoch": 224} {"train_loss": -5.0779876708984375, "global_step": 9448, "epoch": 224} {"train_loss": -4.958578234627133, "global_step": 9449, "epoch": 224, "val_loss": 82376.9375} {"train_loss": -5.021355628967285, "global_step": 9450, "epoch": 225} {"train_loss": -4.986345291137695, "global_step": 9451, "epoch": 225} {"train_loss": -5.025465965270996, "global_step": 9452, "epoch": 225} {"train_loss": -5.0042405128479, "global_step": 9453, "epoch": 225} {"train_loss": -5.229817867279053, "global_step": 9454, "epoch": 225} {"train_loss": -4.908546447753906, "global_step": 9455, "epoch": 225} {"train_loss": -5.096010208129883, "global_step": 9456, "epoch": 225} {"train_loss": -4.8641815185546875, "global_step": 9457, "epoch": 225} {"train_loss": -4.884897232055664, "global_step": 9458, "epoch": 225} {"train_loss": -5.044079780578613, "global_step": 9459, "epoch": 225} {"train_loss": -4.970880508422852, "global_step": 9460, "epoch": 225} {"train_loss": -5.046725273132324, "global_step": 9461, "epoch": 225} {"train_loss": -5.00120735168457, "global_step": 9462, "epoch": 225} {"train_loss": -5.036508560180664, "global_step": 9463, "epoch": 225} {"train_loss": -5.038191795349121, "global_step": 9464, "epoch": 225} {"train_loss": -5.073805332183838, "global_step": 9465, "epoch": 225} {"train_loss": -5.001134872436523, "global_step": 9466, "epoch": 225} {"train_loss": -5.134759902954102, "global_step": 9467, "epoch": 225} {"train_loss": -4.965887546539307, "global_step": 9468, "epoch": 225} {"train_loss": -4.971631050109863, "global_step": 9469, "epoch": 225} {"train_loss": -5.036285877227783, "global_step": 9470, "epoch": 225} {"train_loss": -4.946198463439941, "global_step": 9471, "epoch": 225} {"train_loss": -4.9907331466674805, "global_step": 9472, "epoch": 225} {"train_loss": -5.149687767028809, "global_step": 9473, "epoch": 225} {"train_loss": -5.051031112670898, "global_step": 9474, "epoch": 225} {"train_loss": -4.991372108459473, "global_step": 9475, "epoch": 225} {"train_loss": -5.158576488494873, "global_step": 9476, "epoch": 225} {"train_loss": -5.140955924987793, "global_step": 9477, "epoch": 225} {"train_loss": -5.0277910232543945, "global_step": 9478, "epoch": 225} {"train_loss": -5.008007049560547, "global_step": 9479, "epoch": 225} {"train_loss": -5.082831382751465, "global_step": 9480, "epoch": 225} {"train_loss": -5.095441818237305, "global_step": 9481, "epoch": 225} {"train_loss": -5.008447170257568, "global_step": 9482, "epoch": 225} {"train_loss": -4.993902206420898, "global_step": 9483, "epoch": 225} {"train_loss": -4.940834045410156, "global_step": 9484, "epoch": 225} {"train_loss": -4.887373447418213, "global_step": 9485, "epoch": 225} {"train_loss": -5.018619537353516, "global_step": 9486, "epoch": 225} {"train_loss": -5.0966796875, "global_step": 9487, "epoch": 225} {"train_loss": -5.160373687744141, "global_step": 9488, "epoch": 225} {"train_loss": -4.994977951049805, "global_step": 9489, "epoch": 225} {"train_loss": -5.033958435058594, "global_step": 9490, "epoch": 225} {"train_loss": -5.0241422426132925, "global_step": 9491, "epoch": 225, "val_loss": 82660.8046875} {"train_loss": -4.93427848815918, "global_step": 9492, "epoch": 226} {"train_loss": -4.933310031890869, "global_step": 9493, "epoch": 226} {"train_loss": -4.998812675476074, "global_step": 9494, "epoch": 226} {"train_loss": -4.943979263305664, "global_step": 9495, "epoch": 226} {"train_loss": -5.04559326171875, "global_step": 9496, "epoch": 226} {"train_loss": -4.900376319885254, "global_step": 9497, "epoch": 226} {"train_loss": -5.037801265716553, "global_step": 9498, "epoch": 226} {"train_loss": -5.081032752990723, "global_step": 9499, "epoch": 226} {"train_loss": -4.956945419311523, "global_step": 9500, "epoch": 226} {"train_loss": -5.202363967895508, "global_step": 9501, "epoch": 226} {"train_loss": -4.913195610046387, "global_step": 9502, "epoch": 226} {"train_loss": -4.890561580657959, "global_step": 9503, "epoch": 226} {"train_loss": -5.0452728271484375, "global_step": 9504, "epoch": 226} {"train_loss": -5.015778064727783, "global_step": 9505, "epoch": 226} {"train_loss": -4.93953800201416, "global_step": 9506, "epoch": 226} {"train_loss": -4.949695587158203, "global_step": 9507, "epoch": 226} {"train_loss": -4.877535820007324, "global_step": 9508, "epoch": 226} {"train_loss": -4.855369567871094, "global_step": 9509, "epoch": 226} {"train_loss": -5.008467674255371, "global_step": 9510, "epoch": 226} {"train_loss": -5.081943988800049, "global_step": 9511, "epoch": 226} {"train_loss": -4.985756874084473, "global_step": 9512, "epoch": 226} {"train_loss": -5.009504318237305, "global_step": 9513, "epoch": 226} {"train_loss": -4.9233012199401855, "global_step": 9514, "epoch": 226} {"train_loss": -4.943325996398926, "global_step": 9515, "epoch": 226} {"train_loss": -4.862079620361328, "global_step": 9516, "epoch": 226} {"train_loss": -4.899020671844482, "global_step": 9517, "epoch": 226} {"train_loss": -4.932300567626953, "global_step": 9518, "epoch": 226} {"train_loss": -4.911766052246094, "global_step": 9519, "epoch": 226} {"train_loss": -5.021162033081055, "global_step": 9520, "epoch": 226} {"train_loss": -4.890973091125488, "global_step": 9521, "epoch": 226} {"train_loss": -4.9946608543396, "global_step": 9522, "epoch": 226} {"train_loss": -5.092856407165527, "global_step": 9523, "epoch": 226} {"train_loss": -4.872099876403809, "global_step": 9524, "epoch": 226} {"train_loss": -4.893357276916504, "global_step": 9525, "epoch": 226} {"train_loss": -4.841194152832031, "global_step": 9526, "epoch": 226} {"train_loss": -4.938691139221191, "global_step": 9527, "epoch": 226} {"train_loss": -5.053984642028809, "global_step": 9528, "epoch": 226} {"train_loss": -4.985857963562012, "global_step": 9529, "epoch": 226} {"train_loss": -5.14813232421875, "global_step": 9530, "epoch": 226} {"train_loss": -4.875436782836914, "global_step": 9531, "epoch": 226} {"train_loss": -5.084785461425781, "global_step": 9532, "epoch": 226} {"train_loss": -4.9690880661919, "global_step": 9533, "epoch": 226, "val_loss": 82253.1875} {"train_loss": -4.951084613800049, "global_step": 9534, "epoch": 227} {"train_loss": -4.935527324676514, "global_step": 9535, "epoch": 227} {"train_loss": -5.089151382446289, "global_step": 9536, "epoch": 227} {"train_loss": -5.091148376464844, "global_step": 9537, "epoch": 227} {"train_loss": -4.918234348297119, "global_step": 9538, "epoch": 227} {"train_loss": -5.081323146820068, "global_step": 9539, "epoch": 227} {"train_loss": -5.115758895874023, "global_step": 9540, "epoch": 227} {"train_loss": -5.0955986976623535, "global_step": 9541, "epoch": 227} {"train_loss": -4.925527572631836, "global_step": 9542, "epoch": 227} {"train_loss": -4.9266276359558105, "global_step": 9543, "epoch": 227} {"train_loss": -4.942569732666016, "global_step": 9544, "epoch": 227} {"train_loss": -4.860927581787109, "global_step": 9545, "epoch": 227} {"train_loss": -4.754822254180908, "global_step": 9546, "epoch": 227} {"train_loss": -5.0320539474487305, "global_step": 9547, "epoch": 227} {"train_loss": -4.869396209716797, "global_step": 9548, "epoch": 227} {"train_loss": -4.659633636474609, "global_step": 9549, "epoch": 227} {"train_loss": -5.110639572143555, "global_step": 9550, "epoch": 227} {"train_loss": -4.911660671234131, "global_step": 9551, "epoch": 227} {"train_loss": -4.870569229125977, "global_step": 9552, "epoch": 227} {"train_loss": -4.889078617095947, "global_step": 9553, "epoch": 227} {"train_loss": -4.751591205596924, "global_step": 9554, "epoch": 227} {"train_loss": -4.9669976234436035, "global_step": 9555, "epoch": 227} {"train_loss": -4.958123207092285, "global_step": 9556, "epoch": 227} {"train_loss": -4.928554058074951, "global_step": 9557, "epoch": 227} {"train_loss": -4.899656295776367, "global_step": 9558, "epoch": 227} {"train_loss": -5.054745674133301, "global_step": 9559, "epoch": 227} {"train_loss": -5.180340766906738, "global_step": 9560, "epoch": 227} {"train_loss": -4.945531845092773, "global_step": 9561, "epoch": 227} {"train_loss": -5.043941497802734, "global_step": 9562, "epoch": 227} {"train_loss": -5.148312568664551, "global_step": 9563, "epoch": 227} {"train_loss": -4.976212978363037, "global_step": 9564, "epoch": 227} {"train_loss": -4.842097282409668, "global_step": 9565, "epoch": 227} {"train_loss": -5.10394287109375, "global_step": 9566, "epoch": 227} {"train_loss": -5.07411003112793, "global_step": 9567, "epoch": 227} {"train_loss": -4.909724235534668, "global_step": 9568, "epoch": 227} {"train_loss": -4.783557891845703, "global_step": 9569, "epoch": 227} {"train_loss": -4.990107536315918, "global_step": 9570, "epoch": 227} {"train_loss": -4.914105415344238, "global_step": 9571, "epoch": 227} {"train_loss": -4.966740608215332, "global_step": 9572, "epoch": 227} {"train_loss": -5.0304718017578125, "global_step": 9573, "epoch": 227} {"train_loss": -5.013006210327148, "global_step": 9574, "epoch": 227} {"train_loss": -4.966279620216007, "global_step": 9575, "epoch": 227, "val_loss": 81673.21875} {"train_loss": -4.830061912536621, "global_step": 9576, "epoch": 228} {"train_loss": -4.910394191741943, "global_step": 9577, "epoch": 228} {"train_loss": -5.1524457931518555, "global_step": 9578, "epoch": 228} {"train_loss": -4.936244010925293, "global_step": 9579, "epoch": 228} {"train_loss": -4.97072696685791, "global_step": 9580, "epoch": 228} {"train_loss": -4.9152607917785645, "global_step": 9581, "epoch": 228} {"train_loss": -5.0803303718566895, "global_step": 9582, "epoch": 228} {"train_loss": -5.056732177734375, "global_step": 9583, "epoch": 228} {"train_loss": -5.10700798034668, "global_step": 9584, "epoch": 228} {"train_loss": -5.023833274841309, "global_step": 9585, "epoch": 228} {"train_loss": -4.938223361968994, "global_step": 9586, "epoch": 228} {"train_loss": -5.1097564697265625, "global_step": 9587, "epoch": 228} {"train_loss": -5.010830402374268, "global_step": 9588, "epoch": 228} {"train_loss": -4.8274688720703125, "global_step": 9589, "epoch": 228} {"train_loss": -4.8872761726379395, "global_step": 9590, "epoch": 228} {"train_loss": -5.044777870178223, "global_step": 9591, "epoch": 228} {"train_loss": -4.852872848510742, "global_step": 9592, "epoch": 228} {"train_loss": -4.88564395904541, "global_step": 9593, "epoch": 228} {"train_loss": -4.899078369140625, "global_step": 9594, "epoch": 228} {"train_loss": -5.035340309143066, "global_step": 9595, "epoch": 228} {"train_loss": -4.878289699554443, "global_step": 9596, "epoch": 228} {"train_loss": -4.997198104858398, "global_step": 9597, "epoch": 228} {"train_loss": -4.971584320068359, "global_step": 9598, "epoch": 228} {"train_loss": -5.183396339416504, "global_step": 9599, "epoch": 228} {"train_loss": -4.863653659820557, "global_step": 9600, "epoch": 228} {"train_loss": -4.980154037475586, "global_step": 9601, "epoch": 228} {"train_loss": -4.922623157501221, "global_step": 9602, "epoch": 228} {"train_loss": -5.0487565994262695, "global_step": 9603, "epoch": 228} {"train_loss": -5.070526599884033, "global_step": 9604, "epoch": 228} {"train_loss": -4.8564229011535645, "global_step": 9605, "epoch": 228} {"train_loss": -4.955212116241455, "global_step": 9606, "epoch": 228} {"train_loss": -4.896733283996582, "global_step": 9607, "epoch": 228} {"train_loss": -4.939711570739746, "global_step": 9608, "epoch": 228} {"train_loss": -4.969727516174316, "global_step": 9609, "epoch": 228} {"train_loss": -4.979905128479004, "global_step": 9610, "epoch": 228} {"train_loss": -4.943528175354004, "global_step": 9611, "epoch": 228} {"train_loss": -5.092025279998779, "global_step": 9612, "epoch": 228} {"train_loss": -4.995821952819824, "global_step": 9613, "epoch": 228} {"train_loss": -4.986602306365967, "global_step": 9614, "epoch": 228} {"train_loss": -5.132652282714844, "global_step": 9615, "epoch": 228} {"train_loss": -5.055706024169922, "global_step": 9616, "epoch": 228} {"train_loss": -4.981707504817417, "global_step": 9617, "epoch": 228, "val_loss": 81593.625} {"train_loss": -4.955575466156006, "global_step": 9618, "epoch": 229} {"train_loss": -5.053386211395264, "global_step": 9619, "epoch": 229} {"train_loss": -5.013548851013184, "global_step": 9620, "epoch": 229} {"train_loss": -5.023110866546631, "global_step": 9621, "epoch": 229} {"train_loss": -5.08547306060791, "global_step": 9622, "epoch": 229} {"train_loss": -5.075318336486816, "global_step": 9623, "epoch": 229} {"train_loss": -5.11647891998291, "global_step": 9624, "epoch": 229} {"train_loss": -5.0398478507995605, "global_step": 9625, "epoch": 229} {"train_loss": -5.028729438781738, "global_step": 9626, "epoch": 229} {"train_loss": -5.017874717712402, "global_step": 9627, "epoch": 229} {"train_loss": -5.0011749267578125, "global_step": 9628, "epoch": 229} {"train_loss": -5.008411407470703, "global_step": 9629, "epoch": 229} {"train_loss": -4.883707523345947, "global_step": 9630, "epoch": 229} {"train_loss": -4.889158248901367, "global_step": 9631, "epoch": 229} {"train_loss": -4.9579267501831055, "global_step": 9632, "epoch": 229} {"train_loss": -4.968956470489502, "global_step": 9633, "epoch": 229} {"train_loss": -5.040650367736816, "global_step": 9634, "epoch": 229} {"train_loss": -4.850407600402832, "global_step": 9635, "epoch": 229} {"train_loss": -4.822797775268555, "global_step": 9636, "epoch": 229} {"train_loss": -4.862599849700928, "global_step": 9637, "epoch": 229} {"train_loss": -4.7911787033081055, "global_step": 9638, "epoch": 229} {"train_loss": -4.9107513427734375, "global_step": 9639, "epoch": 229} {"train_loss": -4.898067951202393, "global_step": 9640, "epoch": 229} {"train_loss": -5.007421493530273, "global_step": 9641, "epoch": 229} {"train_loss": -4.949512481689453, "global_step": 9642, "epoch": 229} {"train_loss": -5.04958438873291, "global_step": 9643, "epoch": 229} {"train_loss": -5.046834945678711, "global_step": 9644, "epoch": 229} {"train_loss": -5.01521110534668, "global_step": 9645, "epoch": 229} {"train_loss": -4.868995666503906, "global_step": 9646, "epoch": 229} {"train_loss": -5.003174304962158, "global_step": 9647, "epoch": 229} {"train_loss": -4.854107856750488, "global_step": 9648, "epoch": 229} {"train_loss": -4.730365753173828, "global_step": 9649, "epoch": 229} {"train_loss": -5.03846549987793, "global_step": 9650, "epoch": 229} {"train_loss": -4.91533899307251, "global_step": 9651, "epoch": 229} {"train_loss": -4.907709121704102, "global_step": 9652, "epoch": 229} {"train_loss": -5.0360283851623535, "global_step": 9653, "epoch": 229} {"train_loss": -5.0062255859375, "global_step": 9654, "epoch": 229} {"train_loss": -5.027711868286133, "global_step": 9655, "epoch": 229} {"train_loss": -5.08204984664917, "global_step": 9656, "epoch": 229} {"train_loss": -5.0192365646362305, "global_step": 9657, "epoch": 229} {"train_loss": -5.006391525268555, "global_step": 9658, "epoch": 229} {"train_loss": -4.970711617242722, "global_step": 9659, "epoch": 229, "val_loss": 81101.1484375} {"train_loss": -5.000945091247559, "global_step": 9660, "epoch": 230} {"train_loss": -4.96304988861084, "global_step": 9661, "epoch": 230} {"train_loss": -5.014191150665283, "global_step": 9662, "epoch": 230} {"train_loss": -4.984299659729004, "global_step": 9663, "epoch": 230} {"train_loss": -4.952086448669434, "global_step": 9664, "epoch": 230} {"train_loss": -4.915958404541016, "global_step": 9665, "epoch": 230} {"train_loss": -5.047608852386475, "global_step": 9666, "epoch": 230} {"train_loss": -5.18405294418335, "global_step": 9667, "epoch": 230} {"train_loss": -5.030052185058594, "global_step": 9668, "epoch": 230} {"train_loss": -4.983424186706543, "global_step": 9669, "epoch": 230} {"train_loss": -5.089320182800293, "global_step": 9670, "epoch": 230} {"train_loss": -4.978298187255859, "global_step": 9671, "epoch": 230} {"train_loss": -4.9780731201171875, "global_step": 9672, "epoch": 230} {"train_loss": -5.113618850708008, "global_step": 9673, "epoch": 230} {"train_loss": -4.97695255279541, "global_step": 9674, "epoch": 230} {"train_loss": -5.206467151641846, "global_step": 9675, "epoch": 230} {"train_loss": -5.113302230834961, "global_step": 9676, "epoch": 230} {"train_loss": -5.107870101928711, "global_step": 9677, "epoch": 230} {"train_loss": -4.989627361297607, "global_step": 9678, "epoch": 230} {"train_loss": -5.039709091186523, "global_step": 9679, "epoch": 230} {"train_loss": -5.012870788574219, "global_step": 9680, "epoch": 230} {"train_loss": -5.0811052322387695, "global_step": 9681, "epoch": 230} {"train_loss": -5.03500509262085, "global_step": 9682, "epoch": 230} {"train_loss": -5.155646324157715, "global_step": 9683, "epoch": 230} {"train_loss": -5.0573296546936035, "global_step": 9684, "epoch": 230} {"train_loss": -5.123518943786621, "global_step": 9685, "epoch": 230} {"train_loss": -5.008450508117676, "global_step": 9686, "epoch": 230} {"train_loss": -5.143903732299805, "global_step": 9687, "epoch": 230} {"train_loss": -5.172792434692383, "global_step": 9688, "epoch": 230} {"train_loss": -4.833892822265625, "global_step": 9689, "epoch": 230} {"train_loss": -4.92714262008667, "global_step": 9690, "epoch": 230} {"train_loss": -5.040340423583984, "global_step": 9691, "epoch": 230} {"train_loss": -5.118643760681152, "global_step": 9692, "epoch": 230} {"train_loss": -5.132134437561035, "global_step": 9693, "epoch": 230} {"train_loss": -5.161036014556885, "global_step": 9694, "epoch": 230} {"train_loss": -4.999392032623291, "global_step": 9695, "epoch": 230} {"train_loss": -4.960574626922607, "global_step": 9696, "epoch": 230} {"train_loss": -4.99064302444458, "global_step": 9697, "epoch": 230} {"train_loss": -5.167054176330566, "global_step": 9698, "epoch": 230} {"train_loss": -5.135510444641113, "global_step": 9699, "epoch": 230} {"train_loss": -5.106193542480469, "global_step": 9700, "epoch": 230} {"train_loss": -5.046673445474534, "global_step": 9701, "epoch": 230, "val_loss": 81562.5625} {"train_loss": -4.978265762329102, "global_step": 9702, "epoch": 231} {"train_loss": -4.990456581115723, "global_step": 9703, "epoch": 231} {"train_loss": -4.994480133056641, "global_step": 9704, "epoch": 231} {"train_loss": -5.0886101722717285, "global_step": 9705, "epoch": 231} {"train_loss": -4.911808967590332, "global_step": 9706, "epoch": 231} {"train_loss": -5.151778221130371, "global_step": 9707, "epoch": 231} {"train_loss": -4.847150802612305, "global_step": 9708, "epoch": 231} {"train_loss": -4.961248874664307, "global_step": 9709, "epoch": 231} {"train_loss": -4.833207130432129, "global_step": 9710, "epoch": 231} {"train_loss": -5.021380424499512, "global_step": 9711, "epoch": 231} {"train_loss": -4.901993751525879, "global_step": 9712, "epoch": 231} {"train_loss": -4.831002235412598, "global_step": 9713, "epoch": 231} {"train_loss": -4.75004768371582, "global_step": 9714, "epoch": 231} {"train_loss": -4.528496742248535, "global_step": 9715, "epoch": 231} {"train_loss": -4.865255355834961, "global_step": 9716, "epoch": 231} {"train_loss": -4.63635778427124, "global_step": 9717, "epoch": 231} {"train_loss": -4.509982109069824, "global_step": 9718, "epoch": 231} {"train_loss": -4.817237377166748, "global_step": 9719, "epoch": 231} {"train_loss": -4.693103790283203, "global_step": 9720, "epoch": 231} {"train_loss": -4.710848331451416, "global_step": 9721, "epoch": 231} {"train_loss": -4.764627456665039, "global_step": 9722, "epoch": 231} {"train_loss": -4.699066162109375, "global_step": 9723, "epoch": 231} {"train_loss": -4.798684597015381, "global_step": 9724, "epoch": 231} {"train_loss": -4.897326469421387, "global_step": 9725, "epoch": 231} {"train_loss": -4.77203893661499, "global_step": 9726, "epoch": 231} {"train_loss": -4.886300086975098, "global_step": 9727, "epoch": 231} {"train_loss": -4.948890209197998, "global_step": 9728, "epoch": 231} {"train_loss": -4.869121074676514, "global_step": 9729, "epoch": 231} {"train_loss": -5.002710342407227, "global_step": 9730, "epoch": 231} {"train_loss": -4.840468406677246, "global_step": 9731, "epoch": 231} {"train_loss": -4.869529724121094, "global_step": 9732, "epoch": 231} {"train_loss": -4.951816558837891, "global_step": 9733, "epoch": 231} {"train_loss": -4.892331123352051, "global_step": 9734, "epoch": 231} {"train_loss": -4.936992645263672, "global_step": 9735, "epoch": 231} {"train_loss": -5.007046699523926, "global_step": 9736, "epoch": 231} {"train_loss": -4.9014129638671875, "global_step": 9737, "epoch": 231} {"train_loss": -4.88789176940918, "global_step": 9738, "epoch": 231} {"train_loss": -5.0647382736206055, "global_step": 9739, "epoch": 231} {"train_loss": -4.900964736938477, "global_step": 9740, "epoch": 231} {"train_loss": -4.861262798309326, "global_step": 9741, "epoch": 231} {"train_loss": -5.045035362243652, "global_step": 9742, "epoch": 231} {"train_loss": -4.878569557553246, "global_step": 9743, "epoch": 231, "val_loss": 82000.890625} {"train_loss": -4.993125915527344, "global_step": 9744, "epoch": 232} {"train_loss": -5.000575065612793, "global_step": 9745, "epoch": 232} {"train_loss": -4.924825668334961, "global_step": 9746, "epoch": 232} {"train_loss": -5.094140529632568, "global_step": 9747, "epoch": 232} {"train_loss": -5.109811305999756, "global_step": 9748, "epoch": 232} {"train_loss": -4.90767765045166, "global_step": 9749, "epoch": 232} {"train_loss": -4.9267425537109375, "global_step": 9750, "epoch": 232} {"train_loss": -5.051999568939209, "global_step": 9751, "epoch": 232} {"train_loss": -4.9400315284729, "global_step": 9752, "epoch": 232} {"train_loss": -5.093767166137695, "global_step": 9753, "epoch": 232} {"train_loss": -5.117022514343262, "global_step": 9754, "epoch": 232} {"train_loss": -5.073697090148926, "global_step": 9755, "epoch": 232} {"train_loss": -4.913637161254883, "global_step": 9756, "epoch": 232} {"train_loss": -4.906856536865234, "global_step": 9757, "epoch": 232} {"train_loss": -4.890138626098633, "global_step": 9758, "epoch": 232} {"train_loss": -5.004561901092529, "global_step": 9759, "epoch": 232} {"train_loss": -4.978399276733398, "global_step": 9760, "epoch": 232} {"train_loss": -5.062830924987793, "global_step": 9761, "epoch": 232} {"train_loss": -5.098010063171387, "global_step": 9762, "epoch": 232} {"train_loss": -5.137388706207275, "global_step": 9763, "epoch": 232} {"train_loss": -4.977331161499023, "global_step": 9764, "epoch": 232} {"train_loss": -5.0938239097595215, "global_step": 9765, "epoch": 232} {"train_loss": -5.065478801727295, "global_step": 9766, "epoch": 232} {"train_loss": -5.121082305908203, "global_step": 9767, "epoch": 232} {"train_loss": -5.063017845153809, "global_step": 9768, "epoch": 232} {"train_loss": -4.997134685516357, "global_step": 9769, "epoch": 232} {"train_loss": -5.018439292907715, "global_step": 9770, "epoch": 232} {"train_loss": -4.854979515075684, "global_step": 9771, "epoch": 232} {"train_loss": -5.091702461242676, "global_step": 9772, "epoch": 232} {"train_loss": -5.067948818206787, "global_step": 9773, "epoch": 232} {"train_loss": -4.986269950866699, "global_step": 9774, "epoch": 232} {"train_loss": -5.032848358154297, "global_step": 9775, "epoch": 232} {"train_loss": -5.169200897216797, "global_step": 9776, "epoch": 232} {"train_loss": -5.027297019958496, "global_step": 9777, "epoch": 232} {"train_loss": -4.918098449707031, "global_step": 9778, "epoch": 232} {"train_loss": -5.0990142822265625, "global_step": 9779, "epoch": 232} {"train_loss": -4.914756774902344, "global_step": 9780, "epoch": 232} {"train_loss": -4.9846343994140625, "global_step": 9781, "epoch": 232} {"train_loss": -4.918493270874023, "global_step": 9782, "epoch": 232} {"train_loss": -4.668071746826172, "global_step": 9783, "epoch": 232} {"train_loss": -4.902464866638184, "global_step": 9784, "epoch": 232} {"train_loss": -5.0022351287660145, "global_step": 9785, "epoch": 232, "val_loss": 82181.671875} {"train_loss": -4.862682342529297, "global_step": 9786, "epoch": 233} {"train_loss": -4.99085807800293, "global_step": 9787, "epoch": 233} {"train_loss": -4.831752777099609, "global_step": 9788, "epoch": 233} {"train_loss": -4.845556735992432, "global_step": 9789, "epoch": 233} {"train_loss": -4.8429131507873535, "global_step": 9790, "epoch": 233} {"train_loss": -4.822957992553711, "global_step": 9791, "epoch": 233} {"train_loss": -4.9879150390625, "global_step": 9792, "epoch": 233} {"train_loss": -4.716043472290039, "global_step": 9793, "epoch": 233} {"train_loss": -4.952533721923828, "global_step": 9794, "epoch": 233} {"train_loss": -4.9171953201293945, "global_step": 9795, "epoch": 233} {"train_loss": -5.081390380859375, "global_step": 9796, "epoch": 233} {"train_loss": -4.9837141036987305, "global_step": 9797, "epoch": 233} {"train_loss": -4.981202125549316, "global_step": 9798, "epoch": 233} {"train_loss": -4.953571319580078, "global_step": 9799, "epoch": 233} {"train_loss": -4.987886905670166, "global_step": 9800, "epoch": 233} {"train_loss": -4.894690990447998, "global_step": 9801, "epoch": 233} {"train_loss": -4.900649070739746, "global_step": 9802, "epoch": 233} {"train_loss": -5.068365097045898, "global_step": 9803, "epoch": 233} {"train_loss": -4.872049808502197, "global_step": 9804, "epoch": 233} {"train_loss": -4.922025680541992, "global_step": 9805, "epoch": 233} {"train_loss": -4.996598720550537, "global_step": 9806, "epoch": 233} {"train_loss": -5.028415679931641, "global_step": 9807, "epoch": 233} {"train_loss": -4.945693016052246, "global_step": 9808, "epoch": 233} {"train_loss": -5.030165672302246, "global_step": 9809, "epoch": 233} {"train_loss": -5.07620906829834, "global_step": 9810, "epoch": 233} {"train_loss": -4.926691055297852, "global_step": 9811, "epoch": 233} {"train_loss": -5.065463066101074, "global_step": 9812, "epoch": 233} {"train_loss": -4.9622955322265625, "global_step": 9813, "epoch": 233} {"train_loss": -5.076552867889404, "global_step": 9814, "epoch": 233} {"train_loss": -5.030299186706543, "global_step": 9815, "epoch": 233} {"train_loss": -5.075308799743652, "global_step": 9816, "epoch": 233} {"train_loss": -4.948278903961182, "global_step": 9817, "epoch": 233} {"train_loss": -5.0237345695495605, "global_step": 9818, "epoch": 233} {"train_loss": -4.965176582336426, "global_step": 9819, "epoch": 233} {"train_loss": -5.165956497192383, "global_step": 9820, "epoch": 233} {"train_loss": -4.976218223571777, "global_step": 9821, "epoch": 233} {"train_loss": -5.066856384277344, "global_step": 9822, "epoch": 233} {"train_loss": -5.030977249145508, "global_step": 9823, "epoch": 233} {"train_loss": -4.98375129699707, "global_step": 9824, "epoch": 233} {"train_loss": -5.164609432220459, "global_step": 9825, "epoch": 233} {"train_loss": -5.000412464141846, "global_step": 9826, "epoch": 233} {"train_loss": -4.972616820108323, "global_step": 9827, "epoch": 233, "val_loss": 81550.140625} {"train_loss": -5.115859508514404, "global_step": 9828, "epoch": 234} {"train_loss": -4.927892208099365, "global_step": 9829, "epoch": 234} {"train_loss": -5.0098958015441895, "global_step": 9830, "epoch": 234} {"train_loss": -5.035552978515625, "global_step": 9831, "epoch": 234} {"train_loss": -4.898778438568115, "global_step": 9832, "epoch": 234} {"train_loss": -5.0723137855529785, "global_step": 9833, "epoch": 234} {"train_loss": -5.097943305969238, "global_step": 9834, "epoch": 234} {"train_loss": -4.717023849487305, "global_step": 9835, "epoch": 234} {"train_loss": -4.9280571937561035, "global_step": 9836, "epoch": 234} {"train_loss": -4.979711055755615, "global_step": 9837, "epoch": 234} {"train_loss": -4.92657470703125, "global_step": 9838, "epoch": 234} {"train_loss": -4.831201076507568, "global_step": 9839, "epoch": 234} {"train_loss": -5.153120040893555, "global_step": 9840, "epoch": 234} {"train_loss": -4.8615498542785645, "global_step": 9841, "epoch": 234} {"train_loss": -4.977358341217041, "global_step": 9842, "epoch": 234} {"train_loss": -5.007570266723633, "global_step": 9843, "epoch": 234} {"train_loss": -4.937722682952881, "global_step": 9844, "epoch": 234} {"train_loss": -4.992630958557129, "global_step": 9845, "epoch": 234} {"train_loss": -5.0238261222839355, "global_step": 9846, "epoch": 234} {"train_loss": -4.904504776000977, "global_step": 9847, "epoch": 234} {"train_loss": -5.152716159820557, "global_step": 9848, "epoch": 234} {"train_loss": -4.9861979484558105, "global_step": 9849, "epoch": 234} {"train_loss": -5.0055251121521, "global_step": 9850, "epoch": 234} {"train_loss": -5.064165115356445, "global_step": 9851, "epoch": 234} {"train_loss": -4.896280288696289, "global_step": 9852, "epoch": 234} {"train_loss": -5.017540454864502, "global_step": 9853, "epoch": 234} {"train_loss": -4.993622303009033, "global_step": 9854, "epoch": 234} {"train_loss": -5.041117191314697, "global_step": 9855, "epoch": 234} {"train_loss": -5.1035475730896, "global_step": 9856, "epoch": 234} {"train_loss": -4.983377456665039, "global_step": 9857, "epoch": 234} {"train_loss": -5.103582382202148, "global_step": 9858, "epoch": 234} {"train_loss": -4.957915782928467, "global_step": 9859, "epoch": 234} {"train_loss": -5.042459964752197, "global_step": 9860, "epoch": 234} {"train_loss": -5.092766761779785, "global_step": 9861, "epoch": 234} {"train_loss": -5.074777126312256, "global_step": 9862, "epoch": 234} {"train_loss": -5.024872779846191, "global_step": 9863, "epoch": 234} {"train_loss": -5.009742259979248, "global_step": 9864, "epoch": 234} {"train_loss": -5.109676361083984, "global_step": 9865, "epoch": 234} {"train_loss": -5.040788173675537, "global_step": 9866, "epoch": 234} {"train_loss": -5.067719459533691, "global_step": 9867, "epoch": 234} {"train_loss": -5.091001510620117, "global_step": 9868, "epoch": 234} {"train_loss": -5.006355013166155, "global_step": 9869, "epoch": 234, "val_loss": 81401.9453125} {"train_loss": -5.226570129394531, "global_step": 9870, "epoch": 235} {"train_loss": -4.943024635314941, "global_step": 9871, "epoch": 235} {"train_loss": -5.17280387878418, "global_step": 9872, "epoch": 235} {"train_loss": -5.101408004760742, "global_step": 9873, "epoch": 235} {"train_loss": -5.01530122756958, "global_step": 9874, "epoch": 235} {"train_loss": -4.942465782165527, "global_step": 9875, "epoch": 235} {"train_loss": -5.023455619812012, "global_step": 9876, "epoch": 235} {"train_loss": -5.095066547393799, "global_step": 9877, "epoch": 235} {"train_loss": -4.885476112365723, "global_step": 9878, "epoch": 235} {"train_loss": -4.995745658874512, "global_step": 9879, "epoch": 235} {"train_loss": -5.201014041900635, "global_step": 9880, "epoch": 235} {"train_loss": -4.995456695556641, "global_step": 9881, "epoch": 235} {"train_loss": -4.928842067718506, "global_step": 9882, "epoch": 235} {"train_loss": -4.912562370300293, "global_step": 9883, "epoch": 235} {"train_loss": -4.895376205444336, "global_step": 9884, "epoch": 235} {"train_loss": -4.994762897491455, "global_step": 9885, "epoch": 235} {"train_loss": -4.716722011566162, "global_step": 9886, "epoch": 235} {"train_loss": -5.013649940490723, "global_step": 9887, "epoch": 235} {"train_loss": -4.933149337768555, "global_step": 9888, "epoch": 235} {"train_loss": -4.648261547088623, "global_step": 9889, "epoch": 235} {"train_loss": -4.991829872131348, "global_step": 9890, "epoch": 235} {"train_loss": -4.95084285736084, "global_step": 9891, "epoch": 235} {"train_loss": -4.870845317840576, "global_step": 9892, "epoch": 235} {"train_loss": -5.055940628051758, "global_step": 9893, "epoch": 235} {"train_loss": -4.967923164367676, "global_step": 9894, "epoch": 235} {"train_loss": -4.983658313751221, "global_step": 9895, "epoch": 235} {"train_loss": -4.913215160369873, "global_step": 9896, "epoch": 235} {"train_loss": -4.757415294647217, "global_step": 9897, "epoch": 235} {"train_loss": -5.108760833740234, "global_step": 9898, "epoch": 235} {"train_loss": -4.73109769821167, "global_step": 9899, "epoch": 235} {"train_loss": -4.861414909362793, "global_step": 9900, "epoch": 235} {"train_loss": -4.8010945320129395, "global_step": 9901, "epoch": 235} {"train_loss": -5.052032947540283, "global_step": 9902, "epoch": 235} {"train_loss": -5.09527587890625, "global_step": 9903, "epoch": 235} {"train_loss": -5.002593517303467, "global_step": 9904, "epoch": 235} {"train_loss": -4.973529815673828, "global_step": 9905, "epoch": 235} {"train_loss": -4.900135040283203, "global_step": 9906, "epoch": 235} {"train_loss": -4.9629058837890625, "global_step": 9907, "epoch": 235} {"train_loss": -4.96712064743042, "global_step": 9908, "epoch": 235} {"train_loss": -5.174722194671631, "global_step": 9909, "epoch": 235} {"train_loss": -5.004202842712402, "global_step": 9910, "epoch": 235} {"train_loss": -4.970104047230312, "global_step": 9911, "epoch": 235, "val_loss": 81120.7734375} {"train_loss": -5.018192291259766, "global_step": 9912, "epoch": 236} {"train_loss": -4.8924970626831055, "global_step": 9913, "epoch": 236} {"train_loss": -4.91609001159668, "global_step": 9914, "epoch": 236} {"train_loss": -4.9517621994018555, "global_step": 9915, "epoch": 236} {"train_loss": -4.955930709838867, "global_step": 9916, "epoch": 236} {"train_loss": -5.0598883628845215, "global_step": 9917, "epoch": 236} {"train_loss": -4.813241004943848, "global_step": 9918, "epoch": 236} {"train_loss": -5.116846084594727, "global_step": 9919, "epoch": 236} {"train_loss": -4.883966445922852, "global_step": 9920, "epoch": 236} {"train_loss": -5.024240970611572, "global_step": 9921, "epoch": 236} {"train_loss": -4.978023052215576, "global_step": 9922, "epoch": 236} {"train_loss": -4.944003105163574, "global_step": 9923, "epoch": 236} {"train_loss": -4.941935062408447, "global_step": 9924, "epoch": 236} {"train_loss": -5.009665012359619, "global_step": 9925, "epoch": 236} {"train_loss": -4.9966888427734375, "global_step": 9926, "epoch": 236} {"train_loss": -4.930364608764648, "global_step": 9927, "epoch": 236} {"train_loss": -4.942063331604004, "global_step": 9928, "epoch": 236} {"train_loss": -5.154370307922363, "global_step": 9929, "epoch": 236} {"train_loss": -5.014516353607178, "global_step": 9930, "epoch": 236} {"train_loss": -5.057640552520752, "global_step": 9931, "epoch": 236} {"train_loss": -5.077976703643799, "global_step": 9932, "epoch": 236} {"train_loss": -5.110796928405762, "global_step": 9933, "epoch": 236} {"train_loss": -4.814594745635986, "global_step": 9934, "epoch": 236} {"train_loss": -5.152584075927734, "global_step": 9935, "epoch": 236} {"train_loss": -5.07070255279541, "global_step": 9936, "epoch": 236} {"train_loss": -5.0532636642456055, "global_step": 9937, "epoch": 236} {"train_loss": -5.104929447174072, "global_step": 9938, "epoch": 236} {"train_loss": -5.041186332702637, "global_step": 9939, "epoch": 236} {"train_loss": -5.055127143859863, "global_step": 9940, "epoch": 236} {"train_loss": -4.947588920593262, "global_step": 9941, "epoch": 236} {"train_loss": -4.853035926818848, "global_step": 9942, "epoch": 236} {"train_loss": -5.012395858764648, "global_step": 9943, "epoch": 236} {"train_loss": -4.855977535247803, "global_step": 9944, "epoch": 236} {"train_loss": -5.033503532409668, "global_step": 9945, "epoch": 236} {"train_loss": -4.769017219543457, "global_step": 9946, "epoch": 236} {"train_loss": -4.6744256019592285, "global_step": 9947, "epoch": 236} {"train_loss": -4.990455150604248, "global_step": 9948, "epoch": 236} {"train_loss": -4.656017303466797, "global_step": 9949, "epoch": 236} {"train_loss": -4.942320346832275, "global_step": 9950, "epoch": 236} {"train_loss": -4.876523017883301, "global_step": 9951, "epoch": 236} {"train_loss": -4.936641693115234, "global_step": 9952, "epoch": 236} {"train_loss": -4.968637182599022, "global_step": 9953, "epoch": 236, "val_loss": 84131.0859375} {"train_loss": -4.672390937805176, "global_step": 9954, "epoch": 237} {"train_loss": -4.767121315002441, "global_step": 9955, "epoch": 237} {"train_loss": -4.839142322540283, "global_step": 9956, "epoch": 237} {"train_loss": -4.8948564529418945, "global_step": 9957, "epoch": 237} {"train_loss": -4.8853302001953125, "global_step": 9958, "epoch": 237} {"train_loss": -4.8991546630859375, "global_step": 9959, "epoch": 237} {"train_loss": -4.829845428466797, "global_step": 9960, "epoch": 237} {"train_loss": -4.852197647094727, "global_step": 9961, "epoch": 237} {"train_loss": -4.947382926940918, "global_step": 9962, "epoch": 237} {"train_loss": -5.041486740112305, "global_step": 9963, "epoch": 237} {"train_loss": -5.127384185791016, "global_step": 9964, "epoch": 237} {"train_loss": -5.0022382736206055, "global_step": 9965, "epoch": 237} {"train_loss": -4.945832252502441, "global_step": 9966, "epoch": 237} {"train_loss": -4.892805099487305, "global_step": 9967, "epoch": 237} {"train_loss": -4.813977241516113, "global_step": 9968, "epoch": 237} {"train_loss": -4.971377372741699, "global_step": 9969, "epoch": 237} {"train_loss": -4.939453125, "global_step": 9970, "epoch": 237} {"train_loss": -5.151052951812744, "global_step": 9971, "epoch": 237} {"train_loss": -4.864555358886719, "global_step": 9972, "epoch": 237} {"train_loss": -5.009287357330322, "global_step": 9973, "epoch": 237} {"train_loss": -4.9433817863464355, "global_step": 9974, "epoch": 237} {"train_loss": -4.721532821655273, "global_step": 9975, "epoch": 237} {"train_loss": -4.884948253631592, "global_step": 9976, "epoch": 237} {"train_loss": -4.900687217712402, "global_step": 9977, "epoch": 237} {"train_loss": -4.957434177398682, "global_step": 9978, "epoch": 237} {"train_loss": -4.952262878417969, "global_step": 9979, "epoch": 237} {"train_loss": -5.01645565032959, "global_step": 9980, "epoch": 237} {"train_loss": -4.890267372131348, "global_step": 9981, "epoch": 237} {"train_loss": -4.965707778930664, "global_step": 9982, "epoch": 237} {"train_loss": -4.788122177124023, "global_step": 9983, "epoch": 237} {"train_loss": -4.779958724975586, "global_step": 9984, "epoch": 237} {"train_loss": -4.968713283538818, "global_step": 9985, "epoch": 237} {"train_loss": -4.893160820007324, "global_step": 9986, "epoch": 237} {"train_loss": -4.969562530517578, "global_step": 9987, "epoch": 237} {"train_loss": -5.0012311935424805, "global_step": 9988, "epoch": 237} {"train_loss": -5.137877941131592, "global_step": 9989, "epoch": 237} {"train_loss": -5.057343482971191, "global_step": 9990, "epoch": 237} {"train_loss": -5.16510009765625, "global_step": 9991, "epoch": 237} {"train_loss": -5.071686267852783, "global_step": 9992, "epoch": 237} {"train_loss": -5.177041530609131, "global_step": 9993, "epoch": 237} {"train_loss": -5.104220867156982, "global_step": 9994, "epoch": 237} {"train_loss": -4.943582239605131, "global_step": 9995, "epoch": 237, "val_loss": 81756.8046875} {"train_loss": -4.8935980796813965, "global_step": 9996, "epoch": 238} {"train_loss": -4.967554092407227, "global_step": 9997, "epoch": 238} {"train_loss": -5.05485725402832, "global_step": 9998, "epoch": 238} {"train_loss": -4.9513444900512695, "global_step": 9999, "epoch": 238} {"train_loss": -5.0024309158325195, "global_step": 10000, "epoch": 238} {"train_loss": -5.043847560882568, "global_step": 10001, "epoch": 238} {"train_loss": -4.990313529968262, "global_step": 10002, "epoch": 238} {"train_loss": -4.979118824005127, "global_step": 10003, "epoch": 238} {"train_loss": -5.131958484649658, "global_step": 10004, "epoch": 238} {"train_loss": -4.997138023376465, "global_step": 10005, "epoch": 238} {"train_loss": -5.038571357727051, "global_step": 10006, "epoch": 238} {"train_loss": -5.025387763977051, "global_step": 10007, "epoch": 238} {"train_loss": -4.9767045974731445, "global_step": 10008, "epoch": 238} {"train_loss": -5.041095733642578, "global_step": 10009, "epoch": 238} {"train_loss": -5.0864129066467285, "global_step": 10010, "epoch": 238} {"train_loss": -4.984438419342041, "global_step": 10011, "epoch": 238} {"train_loss": -4.909148216247559, "global_step": 10012, "epoch": 238} {"train_loss": -4.884920120239258, "global_step": 10013, "epoch": 238} {"train_loss": -4.944293022155762, "global_step": 10014, "epoch": 238} {"train_loss": -4.973916530609131, "global_step": 10015, "epoch": 238} {"train_loss": -5.160294055938721, "global_step": 10016, "epoch": 238} {"train_loss": -5.063480377197266, "global_step": 10017, "epoch": 238} {"train_loss": -5.046338081359863, "global_step": 10018, "epoch": 238} {"train_loss": -5.016995906829834, "global_step": 10019, "epoch": 238} {"train_loss": -5.1567182540893555, "global_step": 10020, "epoch": 238} {"train_loss": -5.242580890655518, "global_step": 10021, "epoch": 238} {"train_loss": -4.9557204246521, "global_step": 10022, "epoch": 238} {"train_loss": -5.103928565979004, "global_step": 10023, "epoch": 238} {"train_loss": -5.08522891998291, "global_step": 10024, "epoch": 238} {"train_loss": -5.204960346221924, "global_step": 10025, "epoch": 238} {"train_loss": -4.828159332275391, "global_step": 10026, "epoch": 238} {"train_loss": -5.049989700317383, "global_step": 10027, "epoch": 238} {"train_loss": -4.886702537536621, "global_step": 10028, "epoch": 238} {"train_loss": -4.8458943367004395, "global_step": 10029, "epoch": 238} {"train_loss": -5.166933536529541, "global_step": 10030, "epoch": 238} {"train_loss": -5.015712261199951, "global_step": 10031, "epoch": 238} {"train_loss": -5.063236236572266, "global_step": 10032, "epoch": 238} {"train_loss": -5.052013397216797, "global_step": 10033, "epoch": 238} {"train_loss": -5.079981327056885, "global_step": 10034, "epoch": 238} {"train_loss": -5.056552886962891, "global_step": 10035, "epoch": 238} {"train_loss": -4.882748603820801, "global_step": 10036, "epoch": 238} {"train_loss": -5.022945733297439, "global_step": 10037, "epoch": 238, "val_loss": 82323.9140625} {"train_loss": -4.963195323944092, "global_step": 10038, "epoch": 239} {"train_loss": -5.138654708862305, "global_step": 10039, "epoch": 239} {"train_loss": -4.905801296234131, "global_step": 10040, "epoch": 239} {"train_loss": -4.9810791015625, "global_step": 10041, "epoch": 239} {"train_loss": -5.076625347137451, "global_step": 10042, "epoch": 239} {"train_loss": -5.139098167419434, "global_step": 10043, "epoch": 239} {"train_loss": -5.056890487670898, "global_step": 10044, "epoch": 239} {"train_loss": -5.178773880004883, "global_step": 10045, "epoch": 239} {"train_loss": -4.863224983215332, "global_step": 10046, "epoch": 239} {"train_loss": -4.9777374267578125, "global_step": 10047, "epoch": 239} {"train_loss": -4.970937252044678, "global_step": 10048, "epoch": 239} {"train_loss": -4.960165977478027, "global_step": 10049, "epoch": 239} {"train_loss": -4.963836193084717, "global_step": 10050, "epoch": 239} {"train_loss": -5.064798831939697, "global_step": 10051, "epoch": 239} {"train_loss": -4.940313816070557, "global_step": 10052, "epoch": 239} {"train_loss": -4.963058948516846, "global_step": 10053, "epoch": 239} {"train_loss": -4.986209869384766, "global_step": 10054, "epoch": 239} {"train_loss": -5.053593635559082, "global_step": 10055, "epoch": 239} {"train_loss": -5.06269645690918, "global_step": 10056, "epoch": 239} {"train_loss": -4.929963111877441, "global_step": 10057, "epoch": 239} {"train_loss": -5.059174537658691, "global_step": 10058, "epoch": 239} {"train_loss": -4.971944332122803, "global_step": 10059, "epoch": 239} {"train_loss": -4.998940467834473, "global_step": 10060, "epoch": 239} {"train_loss": -4.880677700042725, "global_step": 10061, "epoch": 239} {"train_loss": -4.954494953155518, "global_step": 10062, "epoch": 239} {"train_loss": -4.9601359367370605, "global_step": 10063, "epoch": 239} {"train_loss": -4.952707290649414, "global_step": 10064, "epoch": 239} {"train_loss": -5.0486602783203125, "global_step": 10065, "epoch": 239} {"train_loss": -4.913309097290039, "global_step": 10066, "epoch": 239} {"train_loss": -5.077070713043213, "global_step": 10067, "epoch": 239} {"train_loss": -4.909546852111816, "global_step": 10068, "epoch": 239} {"train_loss": -4.962686061859131, "global_step": 10069, "epoch": 239} {"train_loss": -4.943500518798828, "global_step": 10070, "epoch": 239} {"train_loss": -4.981827735900879, "global_step": 10071, "epoch": 239} {"train_loss": -4.974084854125977, "global_step": 10072, "epoch": 239} {"train_loss": -4.985629558563232, "global_step": 10073, "epoch": 239} {"train_loss": -5.022686958312988, "global_step": 10074, "epoch": 239} {"train_loss": -4.949568748474121, "global_step": 10075, "epoch": 239} {"train_loss": -5.091801643371582, "global_step": 10076, "epoch": 239} {"train_loss": -4.877359390258789, "global_step": 10077, "epoch": 239} {"train_loss": -4.926414489746094, "global_step": 10078, "epoch": 239} {"train_loss": -4.99295837538583, "global_step": 10079, "epoch": 239, "val_loss": 81763.421875} {"train_loss": -5.004522323608398, "global_step": 10080, "epoch": 240} {"train_loss": -5.149702548980713, "global_step": 10081, "epoch": 240} {"train_loss": -5.127874851226807, "global_step": 10082, "epoch": 240} {"train_loss": -5.056591510772705, "global_step": 10083, "epoch": 240} {"train_loss": -4.901585102081299, "global_step": 10084, "epoch": 240} {"train_loss": -5.1063032150268555, "global_step": 10085, "epoch": 240} {"train_loss": -4.946558952331543, "global_step": 10086, "epoch": 240} {"train_loss": -4.976420879364014, "global_step": 10087, "epoch": 240} {"train_loss": -4.937952518463135, "global_step": 10088, "epoch": 240} {"train_loss": -5.074273109436035, "global_step": 10089, "epoch": 240} {"train_loss": -5.093023777008057, "global_step": 10090, "epoch": 240} {"train_loss": -5.066546440124512, "global_step": 10091, "epoch": 240} {"train_loss": -5.097609996795654, "global_step": 10092, "epoch": 240} {"train_loss": -5.052216529846191, "global_step": 10093, "epoch": 240} {"train_loss": -5.166967391967773, "global_step": 10094, "epoch": 240} {"train_loss": -4.975152969360352, "global_step": 10095, "epoch": 240} {"train_loss": -4.863796710968018, "global_step": 10096, "epoch": 240} {"train_loss": -5.002053260803223, "global_step": 10097, "epoch": 240} {"train_loss": -5.0733232498168945, "global_step": 10098, "epoch": 240} {"train_loss": -4.976828098297119, "global_step": 10099, "epoch": 240} {"train_loss": -4.978712558746338, "global_step": 10100, "epoch": 240} {"train_loss": -5.140120506286621, "global_step": 10101, "epoch": 240} {"train_loss": -4.978257179260254, "global_step": 10102, "epoch": 240} {"train_loss": -4.985860824584961, "global_step": 10103, "epoch": 240} {"train_loss": -4.976728439331055, "global_step": 10104, "epoch": 240} {"train_loss": -5.104318618774414, "global_step": 10105, "epoch": 240} {"train_loss": -5.104644298553467, "global_step": 10106, "epoch": 240} {"train_loss": -5.136157989501953, "global_step": 10107, "epoch": 240} {"train_loss": -4.822126388549805, "global_step": 10108, "epoch": 240} {"train_loss": -4.994431972503662, "global_step": 10109, "epoch": 240} {"train_loss": -4.988978385925293, "global_step": 10110, "epoch": 240} {"train_loss": -4.942915439605713, "global_step": 10111, "epoch": 240} {"train_loss": -4.925415515899658, "global_step": 10112, "epoch": 240} {"train_loss": -4.9245076179504395, "global_step": 10113, "epoch": 240} {"train_loss": -5.054657936096191, "global_step": 10114, "epoch": 240} {"train_loss": -4.98572301864624, "global_step": 10115, "epoch": 240} {"train_loss": -5.064736366271973, "global_step": 10116, "epoch": 240} {"train_loss": -5.037649154663086, "global_step": 10117, "epoch": 240} {"train_loss": -5.050395965576172, "global_step": 10118, "epoch": 240} {"train_loss": -5.004524230957031, "global_step": 10119, "epoch": 240} {"train_loss": -5.062294006347656, "global_step": 10120, "epoch": 240} {"train_loss": -5.023093348457699, "global_step": 10121, "epoch": 240, "val_loss": 81916.4140625} {"train_loss": -4.937211990356445, "global_step": 10122, "epoch": 241} {"train_loss": -5.108346939086914, "global_step": 10123, "epoch": 241} {"train_loss": -5.111488342285156, "global_step": 10124, "epoch": 241} {"train_loss": -4.941155433654785, "global_step": 10125, "epoch": 241} {"train_loss": -5.1114606857299805, "global_step": 10126, "epoch": 241} {"train_loss": -5.036978721618652, "global_step": 10127, "epoch": 241} {"train_loss": -5.044229507446289, "global_step": 10128, "epoch": 241} {"train_loss": -5.106404781341553, "global_step": 10129, "epoch": 241} {"train_loss": -4.994307518005371, "global_step": 10130, "epoch": 241} {"train_loss": -5.007465362548828, "global_step": 10131, "epoch": 241} {"train_loss": -5.117407321929932, "global_step": 10132, "epoch": 241} {"train_loss": -4.955724239349365, "global_step": 10133, "epoch": 241} {"train_loss": -5.178775787353516, "global_step": 10134, "epoch": 241} {"train_loss": -5.142500877380371, "global_step": 10135, "epoch": 241} {"train_loss": -5.046817779541016, "global_step": 10136, "epoch": 241} {"train_loss": -4.931417942047119, "global_step": 10137, "epoch": 241} {"train_loss": -5.163249969482422, "global_step": 10138, "epoch": 241} {"train_loss": -5.008639812469482, "global_step": 10139, "epoch": 241} {"train_loss": -4.890185356140137, "global_step": 10140, "epoch": 241} {"train_loss": -5.186548233032227, "global_step": 10141, "epoch": 241} {"train_loss": -5.121133804321289, "global_step": 10142, "epoch": 241} {"train_loss": -4.983715057373047, "global_step": 10143, "epoch": 241} {"train_loss": -5.048101425170898, "global_step": 10144, "epoch": 241} {"train_loss": -5.2957377433776855, "global_step": 10145, "epoch": 241} {"train_loss": -5.0993242263793945, "global_step": 10146, "epoch": 241} {"train_loss": -4.9671125411987305, "global_step": 10147, "epoch": 241} {"train_loss": -5.002810478210449, "global_step": 10148, "epoch": 241} {"train_loss": -4.978791236877441, "global_step": 10149, "epoch": 241} {"train_loss": -5.233186721801758, "global_step": 10150, "epoch": 241} {"train_loss": -4.883082866668701, "global_step": 10151, "epoch": 241} {"train_loss": -4.815847396850586, "global_step": 10152, "epoch": 241} {"train_loss": -5.036715030670166, "global_step": 10153, "epoch": 241} {"train_loss": -5.018307685852051, "global_step": 10154, "epoch": 241} {"train_loss": -5.059040069580078, "global_step": 10155, "epoch": 241} {"train_loss": -4.735287189483643, "global_step": 10156, "epoch": 241} {"train_loss": -5.141439437866211, "global_step": 10157, "epoch": 241} {"train_loss": -4.858907222747803, "global_step": 10158, "epoch": 241} {"train_loss": -5.0144572257995605, "global_step": 10159, "epoch": 241} {"train_loss": -5.1250715255737305, "global_step": 10160, "epoch": 241} {"train_loss": -5.078975677490234, "global_step": 10161, "epoch": 241} {"train_loss": -4.971246719360352, "global_step": 10162, "epoch": 241} {"train_loss": -5.034646601904006, "global_step": 10163, "epoch": 241, "val_loss": 82052.4921875} {"train_loss": -4.96376371383667, "global_step": 10164, "epoch": 242} {"train_loss": -5.1397013664245605, "global_step": 10165, "epoch": 242} {"train_loss": -5.052774429321289, "global_step": 10166, "epoch": 242} {"train_loss": -5.069851875305176, "global_step": 10167, "epoch": 242} {"train_loss": -5.2000555992126465, "global_step": 10168, "epoch": 242} {"train_loss": -5.128790378570557, "global_step": 10169, "epoch": 242} {"train_loss": -4.986355304718018, "global_step": 10170, "epoch": 242} {"train_loss": -5.217691421508789, "global_step": 10171, "epoch": 242} {"train_loss": -5.143759250640869, "global_step": 10172, "epoch": 242} {"train_loss": -5.027125358581543, "global_step": 10173, "epoch": 242} {"train_loss": -5.153470993041992, "global_step": 10174, "epoch": 242} {"train_loss": -5.096386909484863, "global_step": 10175, "epoch": 242} {"train_loss": -4.998630046844482, "global_step": 10176, "epoch": 242} {"train_loss": -5.1008620262146, "global_step": 10177, "epoch": 242} {"train_loss": -5.0822858810424805, "global_step": 10178, "epoch": 242} {"train_loss": -5.135397434234619, "global_step": 10179, "epoch": 242} {"train_loss": -5.077582836151123, "global_step": 10180, "epoch": 242} {"train_loss": -5.166643142700195, "global_step": 10181, "epoch": 242} {"train_loss": -5.080314636230469, "global_step": 10182, "epoch": 242} {"train_loss": -4.9437055587768555, "global_step": 10183, "epoch": 242} {"train_loss": -5.041019916534424, "global_step": 10184, "epoch": 242} {"train_loss": -5.100893020629883, "global_step": 10185, "epoch": 242} {"train_loss": -5.016015529632568, "global_step": 10186, "epoch": 242} {"train_loss": -5.0296430587768555, "global_step": 10187, "epoch": 242} {"train_loss": -5.027132987976074, "global_step": 10188, "epoch": 242} {"train_loss": -4.996874809265137, "global_step": 10189, "epoch": 242} {"train_loss": -5.030255317687988, "global_step": 10190, "epoch": 242} {"train_loss": -5.04805850982666, "global_step": 10191, "epoch": 242} {"train_loss": -4.980266571044922, "global_step": 10192, "epoch": 242} {"train_loss": -4.994194984436035, "global_step": 10193, "epoch": 242} {"train_loss": -5.1430511474609375, "global_step": 10194, "epoch": 242} {"train_loss": -5.123600006103516, "global_step": 10195, "epoch": 242} {"train_loss": -4.960997104644775, "global_step": 10196, "epoch": 242} {"train_loss": -5.031744003295898, "global_step": 10197, "epoch": 242} {"train_loss": -5.088738918304443, "global_step": 10198, "epoch": 242} {"train_loss": -4.819767951965332, "global_step": 10199, "epoch": 242} {"train_loss": -5.097498893737793, "global_step": 10200, "epoch": 242} {"train_loss": -5.064836025238037, "global_step": 10201, "epoch": 242} {"train_loss": -4.922863960266113, "global_step": 10202, "epoch": 242} {"train_loss": -4.868386268615723, "global_step": 10203, "epoch": 242} {"train_loss": -4.997953414916992, "global_step": 10204, "epoch": 242} {"train_loss": -5.04797489302499, "global_step": 10205, "epoch": 242, "val_loss": 82890.984375} {"train_loss": -4.9234113693237305, "global_step": 10206, "epoch": 243} {"train_loss": -5.051700592041016, "global_step": 10207, "epoch": 243} {"train_loss": -5.114987850189209, "global_step": 10208, "epoch": 243} {"train_loss": -4.905728816986084, "global_step": 10209, "epoch": 243} {"train_loss": -5.045868873596191, "global_step": 10210, "epoch": 243} {"train_loss": -4.935823917388916, "global_step": 10211, "epoch": 243} {"train_loss": -5.012454032897949, "global_step": 10212, "epoch": 243} {"train_loss": -5.039411544799805, "global_step": 10213, "epoch": 243} {"train_loss": -4.894604682922363, "global_step": 10214, "epoch": 243} {"train_loss": -5.104340553283691, "global_step": 10215, "epoch": 243} {"train_loss": -5.0145263671875, "global_step": 10216, "epoch": 243} {"train_loss": -5.007397174835205, "global_step": 10217, "epoch": 243} {"train_loss": -5.098586559295654, "global_step": 10218, "epoch": 243} {"train_loss": -4.985637187957764, "global_step": 10219, "epoch": 243} {"train_loss": -4.917943954467773, "global_step": 10220, "epoch": 243} {"train_loss": -4.996600151062012, "global_step": 10221, "epoch": 243} {"train_loss": -4.982694149017334, "global_step": 10222, "epoch": 243} {"train_loss": -5.09196138381958, "global_step": 10223, "epoch": 243} {"train_loss": -5.052951335906982, "global_step": 10224, "epoch": 243} {"train_loss": -4.935054302215576, "global_step": 10225, "epoch": 243} {"train_loss": -5.024080753326416, "global_step": 10226, "epoch": 243} {"train_loss": -5.151673316955566, "global_step": 10227, "epoch": 243} {"train_loss": -5.121081352233887, "global_step": 10228, "epoch": 243} {"train_loss": -4.965497970581055, "global_step": 10229, "epoch": 243} {"train_loss": -5.026864051818848, "global_step": 10230, "epoch": 243} {"train_loss": -5.1495161056518555, "global_step": 10231, "epoch": 243} {"train_loss": -4.993564605712891, "global_step": 10232, "epoch": 243} {"train_loss": -5.167937278747559, "global_step": 10233, "epoch": 243} {"train_loss": -4.9723405838012695, "global_step": 10234, "epoch": 243} {"train_loss": -5.067014694213867, "global_step": 10235, "epoch": 243} {"train_loss": -4.953819274902344, "global_step": 10236, "epoch": 243} {"train_loss": -5.0545430183410645, "global_step": 10237, "epoch": 243} {"train_loss": -5.120589256286621, "global_step": 10238, "epoch": 243} {"train_loss": -4.876834869384766, "global_step": 10239, "epoch": 243} {"train_loss": -5.004446029663086, "global_step": 10240, "epoch": 243} {"train_loss": -5.105563163757324, "global_step": 10241, "epoch": 243} {"train_loss": -5.007004261016846, "global_step": 10242, "epoch": 243} {"train_loss": -5.106503009796143, "global_step": 10243, "epoch": 243} {"train_loss": -5.060080528259277, "global_step": 10244, "epoch": 243} {"train_loss": -5.1258134841918945, "global_step": 10245, "epoch": 243} {"train_loss": -4.922662734985352, "global_step": 10246, "epoch": 243} {"train_loss": -5.0256526583716985, "global_step": 10247, "epoch": 243, "val_loss": 81054.921875} {"train_loss": -4.92758846282959, "global_step": 10248, "epoch": 244} {"train_loss": -5.08552360534668, "global_step": 10249, "epoch": 244} {"train_loss": -5.005057334899902, "global_step": 10250, "epoch": 244} {"train_loss": -4.8171491622924805, "global_step": 10251, "epoch": 244} {"train_loss": -4.964791297912598, "global_step": 10252, "epoch": 244} {"train_loss": -5.187277317047119, "global_step": 10253, "epoch": 244} {"train_loss": -5.108189582824707, "global_step": 10254, "epoch": 244} {"train_loss": -4.928426265716553, "global_step": 10255, "epoch": 244} {"train_loss": -5.137222766876221, "global_step": 10256, "epoch": 244} {"train_loss": -5.04232120513916, "global_step": 10257, "epoch": 244} {"train_loss": -5.031808853149414, "global_step": 10258, "epoch": 244} {"train_loss": -5.1639509201049805, "global_step": 10259, "epoch": 244} {"train_loss": -4.9742937088012695, "global_step": 10260, "epoch": 244} {"train_loss": -5.154448509216309, "global_step": 10261, "epoch": 244} {"train_loss": -5.124946594238281, "global_step": 10262, "epoch": 244} {"train_loss": -5.040719032287598, "global_step": 10263, "epoch": 244} {"train_loss": -5.054597854614258, "global_step": 10264, "epoch": 244} {"train_loss": -5.181073188781738, "global_step": 10265, "epoch": 244} {"train_loss": -5.1754021644592285, "global_step": 10266, "epoch": 244} {"train_loss": -5.082812309265137, "global_step": 10267, "epoch": 244} {"train_loss": -5.16756534576416, "global_step": 10268, "epoch": 244} {"train_loss": -4.871148586273193, "global_step": 10269, "epoch": 244} {"train_loss": -4.978121757507324, "global_step": 10270, "epoch": 244} {"train_loss": -5.026771068572998, "global_step": 10271, "epoch": 244} {"train_loss": -5.097888946533203, "global_step": 10272, "epoch": 244} {"train_loss": -4.991186141967773, "global_step": 10273, "epoch": 244} {"train_loss": -5.09398889541626, "global_step": 10274, "epoch": 244} {"train_loss": -4.965612411499023, "global_step": 10275, "epoch": 244} {"train_loss": -5.047328948974609, "global_step": 10276, "epoch": 244} {"train_loss": -5.041886806488037, "global_step": 10277, "epoch": 244} {"train_loss": -5.113892555236816, "global_step": 10278, "epoch": 244} {"train_loss": -5.007599830627441, "global_step": 10279, "epoch": 244} {"train_loss": -5.09121036529541, "global_step": 10280, "epoch": 244} {"train_loss": -5.003196716308594, "global_step": 10281, "epoch": 244} {"train_loss": -4.9336771965026855, "global_step": 10282, "epoch": 244} {"train_loss": -4.97162389755249, "global_step": 10283, "epoch": 244} {"train_loss": -4.948826789855957, "global_step": 10284, "epoch": 244} {"train_loss": -5.0205841064453125, "global_step": 10285, "epoch": 244} {"train_loss": -5.170464992523193, "global_step": 10286, "epoch": 244} {"train_loss": -5.238008499145508, "global_step": 10287, "epoch": 244} {"train_loss": -5.074326515197754, "global_step": 10288, "epoch": 244} {"train_loss": -5.0511193161919, "global_step": 10289, "epoch": 244, "val_loss": 80774.015625} {"train_loss": -4.976251125335693, "global_step": 10290, "epoch": 245} {"train_loss": -4.897651672363281, "global_step": 10291, "epoch": 245} {"train_loss": -5.140556335449219, "global_step": 10292, "epoch": 245} {"train_loss": -5.088996887207031, "global_step": 10293, "epoch": 245} {"train_loss": -5.184993267059326, "global_step": 10294, "epoch": 245} {"train_loss": -5.1655073165893555, "global_step": 10295, "epoch": 245} {"train_loss": -5.041559219360352, "global_step": 10296, "epoch": 245} {"train_loss": -4.905699729919434, "global_step": 10297, "epoch": 245} {"train_loss": -5.050363540649414, "global_step": 10298, "epoch": 245} {"train_loss": -5.053047180175781, "global_step": 10299, "epoch": 245} {"train_loss": -5.088140487670898, "global_step": 10300, "epoch": 245} {"train_loss": -4.993011474609375, "global_step": 10301, "epoch": 245} {"train_loss": -4.923398494720459, "global_step": 10302, "epoch": 245} {"train_loss": -5.044355392456055, "global_step": 10303, "epoch": 245} {"train_loss": -5.280844688415527, "global_step": 10304, "epoch": 245} {"train_loss": -4.969341278076172, "global_step": 10305, "epoch": 245} {"train_loss": -5.072900772094727, "global_step": 10306, "epoch": 245} {"train_loss": -4.973910331726074, "global_step": 10307, "epoch": 245} {"train_loss": -5.087917327880859, "global_step": 10308, "epoch": 245} {"train_loss": -5.074603080749512, "global_step": 10309, "epoch": 245} {"train_loss": -5.069058895111084, "global_step": 10310, "epoch": 245} {"train_loss": -5.116976261138916, "global_step": 10311, "epoch": 245} {"train_loss": -5.035320281982422, "global_step": 10312, "epoch": 245} {"train_loss": -5.071991920471191, "global_step": 10313, "epoch": 245} {"train_loss": -4.938860893249512, "global_step": 10314, "epoch": 245} {"train_loss": -5.060417175292969, "global_step": 10315, "epoch": 245} {"train_loss": -5.081214904785156, "global_step": 10316, "epoch": 245} {"train_loss": -5.152368545532227, "global_step": 10317, "epoch": 245} {"train_loss": -5.052183628082275, "global_step": 10318, "epoch": 245} {"train_loss": -5.069409370422363, "global_step": 10319, "epoch": 245} {"train_loss": -5.005380630493164, "global_step": 10320, "epoch": 245} {"train_loss": -5.079472541809082, "global_step": 10321, "epoch": 245} {"train_loss": -5.187150955200195, "global_step": 10322, "epoch": 245} {"train_loss": -4.96121883392334, "global_step": 10323, "epoch": 245} {"train_loss": -5.074517250061035, "global_step": 10324, "epoch": 245} {"train_loss": -5.134625434875488, "global_step": 10325, "epoch": 245} {"train_loss": -4.84549617767334, "global_step": 10326, "epoch": 245} {"train_loss": -5.047158241271973, "global_step": 10327, "epoch": 245} {"train_loss": -5.008803367614746, "global_step": 10328, "epoch": 245} {"train_loss": -4.989245414733887, "global_step": 10329, "epoch": 245} {"train_loss": -5.034946441650391, "global_step": 10330, "epoch": 245} {"train_loss": -5.049392643428984, "global_step": 10331, "epoch": 245, "val_loss": 81502.9140625} {"train_loss": -4.971460342407227, "global_step": 10332, "epoch": 246} {"train_loss": -5.014151573181152, "global_step": 10333, "epoch": 246} {"train_loss": -5.019985675811768, "global_step": 10334, "epoch": 246} {"train_loss": -4.939584732055664, "global_step": 10335, "epoch": 246} {"train_loss": -4.963789463043213, "global_step": 10336, "epoch": 246} {"train_loss": -5.016941070556641, "global_step": 10337, "epoch": 246} {"train_loss": -4.987521648406982, "global_step": 10338, "epoch": 246} {"train_loss": -4.875667572021484, "global_step": 10339, "epoch": 246} {"train_loss": -4.944859981536865, "global_step": 10340, "epoch": 246} {"train_loss": -4.883780479431152, "global_step": 10341, "epoch": 246} {"train_loss": -5.1243085861206055, "global_step": 10342, "epoch": 246} {"train_loss": -5.0021562576293945, "global_step": 10343, "epoch": 246} {"train_loss": -5.007942199707031, "global_step": 10344, "epoch": 246} {"train_loss": -5.075547218322754, "global_step": 10345, "epoch": 246} {"train_loss": -5.059032440185547, "global_step": 10346, "epoch": 246} {"train_loss": -4.90880012512207, "global_step": 10347, "epoch": 246} {"train_loss": -5.193852424621582, "global_step": 10348, "epoch": 246} {"train_loss": -4.9667840003967285, "global_step": 10349, "epoch": 246} {"train_loss": -5.118253707885742, "global_step": 10350, "epoch": 246} {"train_loss": -5.165426254272461, "global_step": 10351, "epoch": 246} {"train_loss": -5.061344146728516, "global_step": 10352, "epoch": 246} {"train_loss": -5.02122163772583, "global_step": 10353, "epoch": 246} {"train_loss": -5.111223220825195, "global_step": 10354, "epoch": 246} {"train_loss": -4.908250331878662, "global_step": 10355, "epoch": 246} {"train_loss": -5.045506477355957, "global_step": 10356, "epoch": 246} {"train_loss": -4.875749588012695, "global_step": 10357, "epoch": 246} {"train_loss": -4.816883563995361, "global_step": 10358, "epoch": 246} {"train_loss": -4.971024036407471, "global_step": 10359, "epoch": 246} {"train_loss": -5.0475006103515625, "global_step": 10360, "epoch": 246} {"train_loss": -4.986414909362793, "global_step": 10361, "epoch": 246} {"train_loss": -5.008116245269775, "global_step": 10362, "epoch": 246} {"train_loss": -4.841828346252441, "global_step": 10363, "epoch": 246} {"train_loss": -5.045214653015137, "global_step": 10364, "epoch": 246} {"train_loss": -5.122707366943359, "global_step": 10365, "epoch": 246} {"train_loss": -4.9163970947265625, "global_step": 10366, "epoch": 246} {"train_loss": -5.072006702423096, "global_step": 10367, "epoch": 246} {"train_loss": -4.946554660797119, "global_step": 10368, "epoch": 246} {"train_loss": -4.978387832641602, "global_step": 10369, "epoch": 246} {"train_loss": -4.881537914276123, "global_step": 10370, "epoch": 246} {"train_loss": -4.975126266479492, "global_step": 10371, "epoch": 246} {"train_loss": -5.067005157470703, "global_step": 10372, "epoch": 246} {"train_loss": -4.998110498700823, "global_step": 10373, "epoch": 246, "val_loss": 81831.421875} {"train_loss": -4.99676513671875, "global_step": 10374, "epoch": 247} {"train_loss": -5.124654293060303, "global_step": 10375, "epoch": 247} {"train_loss": -4.918334007263184, "global_step": 10376, "epoch": 247} {"train_loss": -4.944583415985107, "global_step": 10377, "epoch": 247} {"train_loss": -5.137616157531738, "global_step": 10378, "epoch": 247} {"train_loss": -5.097277641296387, "global_step": 10379, "epoch": 247} {"train_loss": -4.949163436889648, "global_step": 10380, "epoch": 247} {"train_loss": -5.013190746307373, "global_step": 10381, "epoch": 247} {"train_loss": -4.992793560028076, "global_step": 10382, "epoch": 247} {"train_loss": -5.002614974975586, "global_step": 10383, "epoch": 247} {"train_loss": -5.059547424316406, "global_step": 10384, "epoch": 247} {"train_loss": -5.145210266113281, "global_step": 10385, "epoch": 247} {"train_loss": -5.052300930023193, "global_step": 10386, "epoch": 247} {"train_loss": -5.124309539794922, "global_step": 10387, "epoch": 247} {"train_loss": -5.197538375854492, "global_step": 10388, "epoch": 247} {"train_loss": -5.064410209655762, "global_step": 10389, "epoch": 247} {"train_loss": -5.123170375823975, "global_step": 10390, "epoch": 247} {"train_loss": -4.941532135009766, "global_step": 10391, "epoch": 247} {"train_loss": -5.022090435028076, "global_step": 10392, "epoch": 247} {"train_loss": -5.077333450317383, "global_step": 10393, "epoch": 247} {"train_loss": -5.113492965698242, "global_step": 10394, "epoch": 247} {"train_loss": -4.967740535736084, "global_step": 10395, "epoch": 247} {"train_loss": -5.129229545593262, "global_step": 10396, "epoch": 247} {"train_loss": -5.160323143005371, "global_step": 10397, "epoch": 247} {"train_loss": -5.110854148864746, "global_step": 10398, "epoch": 247} {"train_loss": -5.051137447357178, "global_step": 10399, "epoch": 247} {"train_loss": -5.0410661697387695, "global_step": 10400, "epoch": 247} {"train_loss": -5.219570636749268, "global_step": 10401, "epoch": 247} {"train_loss": -4.968491077423096, "global_step": 10402, "epoch": 247} {"train_loss": -5.194006443023682, "global_step": 10403, "epoch": 247} {"train_loss": -5.110151290893555, "global_step": 10404, "epoch": 247} {"train_loss": -4.994115829467773, "global_step": 10405, "epoch": 247} {"train_loss": -4.984967231750488, "global_step": 10406, "epoch": 247} {"train_loss": -5.129583358764648, "global_step": 10407, "epoch": 247} {"train_loss": -5.122305870056152, "global_step": 10408, "epoch": 247} {"train_loss": -5.098199844360352, "global_step": 10409, "epoch": 247} {"train_loss": -5.179198265075684, "global_step": 10410, "epoch": 247} {"train_loss": -5.025623798370361, "global_step": 10411, "epoch": 247} {"train_loss": -5.1067633628845215, "global_step": 10412, "epoch": 247} {"train_loss": -5.073150634765625, "global_step": 10413, "epoch": 247} {"train_loss": -4.989341735839844, "global_step": 10414, "epoch": 247} {"train_loss": -5.070020039876302, "global_step": 10415, "epoch": 247, "val_loss": 80902.5546875} {"train_loss": -5.002089500427246, "global_step": 10416, "epoch": 248} {"train_loss": -5.024385929107666, "global_step": 10417, "epoch": 248} {"train_loss": -5.186585426330566, "global_step": 10418, "epoch": 248} {"train_loss": -5.1443891525268555, "global_step": 10419, "epoch": 248} {"train_loss": -5.022812366485596, "global_step": 10420, "epoch": 248} {"train_loss": -5.150068283081055, "global_step": 10421, "epoch": 248} {"train_loss": -4.990550994873047, "global_step": 10422, "epoch": 248} {"train_loss": -4.760636329650879, "global_step": 10423, "epoch": 248} {"train_loss": -4.932002544403076, "global_step": 10424, "epoch": 248} {"train_loss": -4.585125923156738, "global_step": 10425, "epoch": 248} {"train_loss": -4.702026844024658, "global_step": 10426, "epoch": 248} {"train_loss": -4.751558780670166, "global_step": 10427, "epoch": 248} {"train_loss": -4.494266033172607, "global_step": 10428, "epoch": 248} {"train_loss": -4.914353847503662, "global_step": 10429, "epoch": 248} {"train_loss": -4.589164733886719, "global_step": 10430, "epoch": 248} {"train_loss": -4.923224449157715, "global_step": 10431, "epoch": 248} {"train_loss": -4.624554634094238, "global_step": 10432, "epoch": 248} {"train_loss": -4.955211639404297, "global_step": 10433, "epoch": 248} {"train_loss": -4.772021293640137, "global_step": 10434, "epoch": 248} {"train_loss": -4.966953754425049, "global_step": 10435, "epoch": 248} {"train_loss": -4.897024631500244, "global_step": 10436, "epoch": 248} {"train_loss": -4.823967933654785, "global_step": 10437, "epoch": 248} {"train_loss": -4.787899017333984, "global_step": 10438, "epoch": 248} {"train_loss": -4.838559627532959, "global_step": 10439, "epoch": 248} {"train_loss": -4.964810371398926, "global_step": 10440, "epoch": 248} {"train_loss": -4.900021076202393, "global_step": 10441, "epoch": 248} {"train_loss": -4.847095489501953, "global_step": 10442, "epoch": 248} {"train_loss": -4.9525322914123535, "global_step": 10443, "epoch": 248} {"train_loss": -5.032026767730713, "global_step": 10444, "epoch": 248} {"train_loss": -5.090981483459473, "global_step": 10445, "epoch": 248} {"train_loss": -5.016024589538574, "global_step": 10446, "epoch": 248} {"train_loss": -5.100426197052002, "global_step": 10447, "epoch": 248} {"train_loss": -5.10512113571167, "global_step": 10448, "epoch": 248} {"train_loss": -5.001324653625488, "global_step": 10449, "epoch": 248} {"train_loss": -4.908941268920898, "global_step": 10450, "epoch": 248} {"train_loss": -5.030302047729492, "global_step": 10451, "epoch": 248} {"train_loss": -5.051140785217285, "global_step": 10452, "epoch": 248} {"train_loss": -5.125682830810547, "global_step": 10453, "epoch": 248} {"train_loss": -5.14653205871582, "global_step": 10454, "epoch": 248} {"train_loss": -5.110511779785156, "global_step": 10455, "epoch": 248} {"train_loss": -4.946507930755615, "global_step": 10456, "epoch": 248} {"train_loss": -4.932834659303937, "global_step": 10457, "epoch": 248, "val_loss": 81447.53125} {"train_loss": -5.02172327041626, "global_step": 10458, "epoch": 249} {"train_loss": -5.131004333496094, "global_step": 10459, "epoch": 249} {"train_loss": -4.90616512298584, "global_step": 10460, "epoch": 249} {"train_loss": -5.057991027832031, "global_step": 10461, "epoch": 249} {"train_loss": -5.202343940734863, "global_step": 10462, "epoch": 249} {"train_loss": -5.030087471008301, "global_step": 10463, "epoch": 249} {"train_loss": -5.133256912231445, "global_step": 10464, "epoch": 249} {"train_loss": -5.161731719970703, "global_step": 10465, "epoch": 249} {"train_loss": -5.211346626281738, "global_step": 10466, "epoch": 249} {"train_loss": -5.117509841918945, "global_step": 10467, "epoch": 249} {"train_loss": -4.991657257080078, "global_step": 10468, "epoch": 249} {"train_loss": -5.155628681182861, "global_step": 10469, "epoch": 249} {"train_loss": -4.969511985778809, "global_step": 10470, "epoch": 249} {"train_loss": -4.747661590576172, "global_step": 10471, "epoch": 249} {"train_loss": -5.18209171295166, "global_step": 10472, "epoch": 249} {"train_loss": -4.9026312828063965, "global_step": 10473, "epoch": 249} {"train_loss": -4.988055229187012, "global_step": 10474, "epoch": 249} {"train_loss": -5.079154014587402, "global_step": 10475, "epoch": 249} {"train_loss": -4.988099098205566, "global_step": 10476, "epoch": 249} {"train_loss": -4.944640159606934, "global_step": 10477, "epoch": 249} {"train_loss": -5.225262641906738, "global_step": 10478, "epoch": 249} {"train_loss": -4.867359161376953, "global_step": 10479, "epoch": 249} {"train_loss": -4.994668006896973, "global_step": 10480, "epoch": 249} {"train_loss": -5.057465076446533, "global_step": 10481, "epoch": 249} {"train_loss": -4.8988752365112305, "global_step": 10482, "epoch": 249} {"train_loss": -4.937040328979492, "global_step": 10483, "epoch": 249} {"train_loss": -5.02370023727417, "global_step": 10484, "epoch": 249} {"train_loss": -5.079351425170898, "global_step": 10485, "epoch": 249} {"train_loss": -4.987449645996094, "global_step": 10486, "epoch": 249} {"train_loss": -4.945761680603027, "global_step": 10487, "epoch": 249} {"train_loss": -4.9394025802612305, "global_step": 10488, "epoch": 249} {"train_loss": -5.005634307861328, "global_step": 10489, "epoch": 249} {"train_loss": -4.974950790405273, "global_step": 10490, "epoch": 249} {"train_loss": -4.993979454040527, "global_step": 10491, "epoch": 249} {"train_loss": -4.974392890930176, "global_step": 10492, "epoch": 249} {"train_loss": -4.965073108673096, "global_step": 10493, "epoch": 249} {"train_loss": -5.0015869140625, "global_step": 10494, "epoch": 249} {"train_loss": -5.10319709777832, "global_step": 10495, "epoch": 249} {"train_loss": -5.264097690582275, "global_step": 10496, "epoch": 249} {"train_loss": -5.000665664672852, "global_step": 10497, "epoch": 249} {"train_loss": -5.154231071472168, "global_step": 10498, "epoch": 249} {"train_loss": -5.03067794300261, "global_step": 10499, "epoch": 249, "val_loss": 81035.2734375} {"train_loss": -4.909755706787109, "global_step": 10500, "epoch": 250} {"train_loss": -5.055337905883789, "global_step": 10501, "epoch": 250} {"train_loss": -5.06821346282959, "global_step": 10502, "epoch": 250} {"train_loss": -5.035974502563477, "global_step": 10503, "epoch": 250} {"train_loss": -5.017138481140137, "global_step": 10504, "epoch": 250} {"train_loss": -5.033252716064453, "global_step": 10505, "epoch": 250} {"train_loss": -5.093930244445801, "global_step": 10506, "epoch": 250} {"train_loss": -5.0261430740356445, "global_step": 10507, "epoch": 250} {"train_loss": -5.0309157371521, "global_step": 10508, "epoch": 250} {"train_loss": -5.096897125244141, "global_step": 10509, "epoch": 250} {"train_loss": -4.958823204040527, "global_step": 10510, "epoch": 250} {"train_loss": -4.8143415451049805, "global_step": 10511, "epoch": 250} {"train_loss": -4.8691558837890625, "global_step": 10512, "epoch": 250} {"train_loss": -4.821655750274658, "global_step": 10513, "epoch": 250} {"train_loss": -4.957140922546387, "global_step": 10514, "epoch": 250} {"train_loss": -4.975320816040039, "global_step": 10515, "epoch": 250} {"train_loss": -5.047907829284668, "global_step": 10516, "epoch": 250} {"train_loss": -4.9773454666137695, "global_step": 10517, "epoch": 250} {"train_loss": -4.912302017211914, "global_step": 10518, "epoch": 250} {"train_loss": -5.10338020324707, "global_step": 10519, "epoch": 250} {"train_loss": -4.928342342376709, "global_step": 10520, "epoch": 250} {"train_loss": -5.113866329193115, "global_step": 10521, "epoch": 250} {"train_loss": -5.058670520782471, "global_step": 10522, "epoch": 250} {"train_loss": -5.0562424659729, "global_step": 10523, "epoch": 250} {"train_loss": -4.8614935874938965, "global_step": 10524, "epoch": 250} {"train_loss": -5.09467887878418, "global_step": 10525, "epoch": 250} {"train_loss": -5.103228569030762, "global_step": 10526, "epoch": 250} {"train_loss": -5.038214206695557, "global_step": 10527, "epoch": 250} {"train_loss": -5.003890037536621, "global_step": 10528, "epoch": 250} {"train_loss": -5.1533203125, "global_step": 10529, "epoch": 250} {"train_loss": -5.0148396492004395, "global_step": 10530, "epoch": 250} {"train_loss": -5.032609939575195, "global_step": 10531, "epoch": 250} {"train_loss": -5.075992107391357, "global_step": 10532, "epoch": 250} {"train_loss": -4.967482566833496, "global_step": 10533, "epoch": 250} {"train_loss": -5.035764694213867, "global_step": 10534, "epoch": 250} {"train_loss": -5.0599212646484375, "global_step": 10535, "epoch": 250} {"train_loss": -5.107194900512695, "global_step": 10536, "epoch": 250} {"train_loss": -5.169897079467773, "global_step": 10537, "epoch": 250} {"train_loss": -5.119968891143799, "global_step": 10538, "epoch": 250} {"train_loss": -5.025209426879883, "global_step": 10539, "epoch": 250} {"train_loss": -5.107950210571289, "global_step": 10540, "epoch": 250} {"train_loss": -5.022812071300688, "global_step": 10541, "epoch": 250, "train/sim_max_reward_0": 0.3177739338884784, "train/sim_max_reward_1": 0.16338559012808407, "train/sim_max_reward_2": 0.2867612927031864, "train/sim_max_reward_3": 0.09822119382192075, "train/sim_max_reward_4": 0.28319669575783724, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4500000": 0.37924929303067, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.0793336438708821, "test/sim_max_reward_4500005": 0.16126585610851837, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.1690980021571838, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.05302488737159811, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.17263041716979716, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.16561182130584123, "test/sim_max_reward_4500015": 0.1673833329240443, "test/sim_max_reward_4500016": 0.373120698770775, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.35621041945866005, "test/sim_max_reward_4500019": 0.39496762743265895, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.14861511220147822, "test/sim_max_reward_4500022": 0.33035368716497726, "test/sim_max_reward_4500023": 0.48696958417206077, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.13497255592037247, "test/sim_max_reward_4500026": 0.01145002834560718, "test/sim_max_reward_4500027": 0.637594518284529, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.38273425387368304, "test/sim_max_reward_4500030": 0.21069127958234216, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.32683567869035945, "test/sim_max_reward_4500033": 0.15090441448692346, "test/sim_max_reward_4500034": 0.4315141829731471, "test/sim_max_reward_4500035": 0.5321580580030912, "test/sim_max_reward_4500036": 0.20712726033432347, "test/sim_max_reward_4500037": 0.2944170873108199, "test/sim_max_reward_4500038": 0.29076655582942373, "test/sim_max_reward_4500039": 0.07392643431743294, "test/sim_max_reward_4500040": 0.1658525870361414, "test/sim_max_reward_4500041": 0.6309834026369943, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.1763995204006517, "test/sim_max_reward_4500044": 0.08833493873583917, "test/sim_max_reward_4500045": 0.1175735103924684, "test/sim_max_reward_4500046": 0.6855419438395708, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.22372057761028238, "test/mean_score": 0.18400394052016616, "val_loss": 80833.875} {"train_loss": -4.940462112426758, "global_step": 10542, "epoch": 251} {"train_loss": -4.942299842834473, "global_step": 10543, "epoch": 251} {"train_loss": -4.918816089630127, "global_step": 10544, "epoch": 251} {"train_loss": -4.937835693359375, "global_step": 10545, "epoch": 251} {"train_loss": -5.182748317718506, "global_step": 10546, "epoch": 251} {"train_loss": -5.03856086730957, "global_step": 10547, "epoch": 251} {"train_loss": -4.800986289978027, "global_step": 10548, "epoch": 251} {"train_loss": -5.0640950202941895, "global_step": 10549, "epoch": 251} {"train_loss": -4.911849498748779, "global_step": 10550, "epoch": 251} {"train_loss": -4.92356014251709, "global_step": 10551, "epoch": 251} {"train_loss": -5.1070122718811035, "global_step": 10552, "epoch": 251} {"train_loss": -5.030685901641846, "global_step": 10553, "epoch": 251} {"train_loss": -5.080488681793213, "global_step": 10554, "epoch": 251} {"train_loss": -5.126849174499512, "global_step": 10555, "epoch": 251} {"train_loss": -5.13226842880249, "global_step": 10556, "epoch": 251} {"train_loss": -4.8121232986450195, "global_step": 10557, "epoch": 251} {"train_loss": -5.06241512298584, "global_step": 10558, "epoch": 251} {"train_loss": -5.033740997314453, "global_step": 10559, "epoch": 251} {"train_loss": -5.073965549468994, "global_step": 10560, "epoch": 251} {"train_loss": -5.050848960876465, "global_step": 10561, "epoch": 251} {"train_loss": -5.138360023498535, "global_step": 10562, "epoch": 251} {"train_loss": -4.942476272583008, "global_step": 10563, "epoch": 251} {"train_loss": -5.012694358825684, "global_step": 10564, "epoch": 251} {"train_loss": -5.008518695831299, "global_step": 10565, "epoch": 251} {"train_loss": -4.998847961425781, "global_step": 10566, "epoch": 251} {"train_loss": -4.967947959899902, "global_step": 10567, "epoch": 251} {"train_loss": -4.94950008392334, "global_step": 10568, "epoch": 251} {"train_loss": -4.957439422607422, "global_step": 10569, "epoch": 251} {"train_loss": -5.069612503051758, "global_step": 10570, "epoch": 251} {"train_loss": -5.037395477294922, "global_step": 10571, "epoch": 251} {"train_loss": -5.043406009674072, "global_step": 10572, "epoch": 251} {"train_loss": -5.138423442840576, "global_step": 10573, "epoch": 251} {"train_loss": -4.915651321411133, "global_step": 10574, "epoch": 251} {"train_loss": -4.949969291687012, "global_step": 10575, "epoch": 251} {"train_loss": -5.000078201293945, "global_step": 10576, "epoch": 251} {"train_loss": -5.003340244293213, "global_step": 10577, "epoch": 251} {"train_loss": -5.114984035491943, "global_step": 10578, "epoch": 251} {"train_loss": -5.018996238708496, "global_step": 10579, "epoch": 251} {"train_loss": -5.138493061065674, "global_step": 10580, "epoch": 251} {"train_loss": -5.0276994705200195, "global_step": 10581, "epoch": 251} {"train_loss": -5.064817428588867, "global_step": 10582, "epoch": 251} {"train_loss": -5.017155579158238, "global_step": 10583, "epoch": 251, "val_loss": 81546.3515625} {"train_loss": -5.092394828796387, "global_step": 10584, "epoch": 252} {"train_loss": -5.0786895751953125, "global_step": 10585, "epoch": 252} {"train_loss": -5.073143005371094, "global_step": 10586, "epoch": 252} {"train_loss": -5.182514190673828, "global_step": 10587, "epoch": 252} {"train_loss": -4.984360694885254, "global_step": 10588, "epoch": 252} {"train_loss": -5.020686626434326, "global_step": 10589, "epoch": 252} {"train_loss": -5.068801403045654, "global_step": 10590, "epoch": 252} {"train_loss": -4.998725891113281, "global_step": 10591, "epoch": 252} {"train_loss": -5.109119892120361, "global_step": 10592, "epoch": 252} {"train_loss": -5.055977821350098, "global_step": 10593, "epoch": 252} {"train_loss": -4.950188636779785, "global_step": 10594, "epoch": 252} {"train_loss": -4.9710259437561035, "global_step": 10595, "epoch": 252} {"train_loss": -4.98837947845459, "global_step": 10596, "epoch": 252} {"train_loss": -4.9585371017456055, "global_step": 10597, "epoch": 252} {"train_loss": -5.1378607749938965, "global_step": 10598, "epoch": 252} {"train_loss": -5.0174336433410645, "global_step": 10599, "epoch": 252} {"train_loss": -5.13169002532959, "global_step": 10600, "epoch": 252} {"train_loss": -5.090906143188477, "global_step": 10601, "epoch": 252} {"train_loss": -5.0706787109375, "global_step": 10602, "epoch": 252} {"train_loss": -5.059368133544922, "global_step": 10603, "epoch": 252} {"train_loss": -5.125287055969238, "global_step": 10604, "epoch": 252} {"train_loss": -5.015820026397705, "global_step": 10605, "epoch": 252} {"train_loss": -5.100316524505615, "global_step": 10606, "epoch": 252} {"train_loss": -5.023481369018555, "global_step": 10607, "epoch": 252} {"train_loss": -4.977178573608398, "global_step": 10608, "epoch": 252} {"train_loss": -5.02081298828125, "global_step": 10609, "epoch": 252} {"train_loss": -5.05189847946167, "global_step": 10610, "epoch": 252} {"train_loss": -5.043474197387695, "global_step": 10611, "epoch": 252} {"train_loss": -5.041459083557129, "global_step": 10612, "epoch": 252} {"train_loss": -5.098320960998535, "global_step": 10613, "epoch": 252} {"train_loss": -5.026119232177734, "global_step": 10614, "epoch": 252} {"train_loss": -4.988879203796387, "global_step": 10615, "epoch": 252} {"train_loss": -5.167428970336914, "global_step": 10616, "epoch": 252} {"train_loss": -4.921171188354492, "global_step": 10617, "epoch": 252} {"train_loss": -4.931714057922363, "global_step": 10618, "epoch": 252} {"train_loss": -5.024213790893555, "global_step": 10619, "epoch": 252} {"train_loss": -4.946395397186279, "global_step": 10620, "epoch": 252} {"train_loss": -5.1854047775268555, "global_step": 10621, "epoch": 252} {"train_loss": -5.116156578063965, "global_step": 10622, "epoch": 252} {"train_loss": -5.012652397155762, "global_step": 10623, "epoch": 252} {"train_loss": -4.994963645935059, "global_step": 10624, "epoch": 252} {"train_loss": -5.04404141789391, "global_step": 10625, "epoch": 252, "val_loss": 81484.96875} {"train_loss": -4.988397598266602, "global_step": 10626, "epoch": 253} {"train_loss": -5.150024890899658, "global_step": 10627, "epoch": 253} {"train_loss": -5.0277557373046875, "global_step": 10628, "epoch": 253} {"train_loss": -5.126456260681152, "global_step": 10629, "epoch": 253} {"train_loss": -4.911287784576416, "global_step": 10630, "epoch": 253} {"train_loss": -5.009826183319092, "global_step": 10631, "epoch": 253} {"train_loss": -5.169783592224121, "global_step": 10632, "epoch": 253} {"train_loss": -4.955458641052246, "global_step": 10633, "epoch": 253} {"train_loss": -5.0692009925842285, "global_step": 10634, "epoch": 253} {"train_loss": -5.099277973175049, "global_step": 10635, "epoch": 253} {"train_loss": -4.955013275146484, "global_step": 10636, "epoch": 253} {"train_loss": -5.070204257965088, "global_step": 10637, "epoch": 253} {"train_loss": -5.119077682495117, "global_step": 10638, "epoch": 253} {"train_loss": -4.996837615966797, "global_step": 10639, "epoch": 253} {"train_loss": -5.059281826019287, "global_step": 10640, "epoch": 253} {"train_loss": -4.99124002456665, "global_step": 10641, "epoch": 253} {"train_loss": -5.054914951324463, "global_step": 10642, "epoch": 253} {"train_loss": -5.139181137084961, "global_step": 10643, "epoch": 253} {"train_loss": -5.05370569229126, "global_step": 10644, "epoch": 253} {"train_loss": -5.161240577697754, "global_step": 10645, "epoch": 253} {"train_loss": -5.063328742980957, "global_step": 10646, "epoch": 253} {"train_loss": -5.032101631164551, "global_step": 10647, "epoch": 253} {"train_loss": -5.125957489013672, "global_step": 10648, "epoch": 253} {"train_loss": -5.065486431121826, "global_step": 10649, "epoch": 253} {"train_loss": -5.106257915496826, "global_step": 10650, "epoch": 253} {"train_loss": -5.085762023925781, "global_step": 10651, "epoch": 253} {"train_loss": -5.053139686584473, "global_step": 10652, "epoch": 253} {"train_loss": -5.29255485534668, "global_step": 10653, "epoch": 253} {"train_loss": -5.033344745635986, "global_step": 10654, "epoch": 253} {"train_loss": -5.031321048736572, "global_step": 10655, "epoch": 253} {"train_loss": -5.170881271362305, "global_step": 10656, "epoch": 253} {"train_loss": -5.048937797546387, "global_step": 10657, "epoch": 253} {"train_loss": -5.057888984680176, "global_step": 10658, "epoch": 253} {"train_loss": -5.089982986450195, "global_step": 10659, "epoch": 253} {"train_loss": -4.833526611328125, "global_step": 10660, "epoch": 253} {"train_loss": -5.06538724899292, "global_step": 10661, "epoch": 253} {"train_loss": -4.906480312347412, "global_step": 10662, "epoch": 253} {"train_loss": -4.943388938903809, "global_step": 10663, "epoch": 253} {"train_loss": -4.96226692199707, "global_step": 10664, "epoch": 253} {"train_loss": -5.072088718414307, "global_step": 10665, "epoch": 253} {"train_loss": -5.03114128112793, "global_step": 10666, "epoch": 253} {"train_loss": -5.051107122784569, "global_step": 10667, "epoch": 253, "val_loss": 81115.4375} {"train_loss": -5.098967552185059, "global_step": 10668, "epoch": 254} {"train_loss": -4.919118881225586, "global_step": 10669, "epoch": 254} {"train_loss": -4.948842525482178, "global_step": 10670, "epoch": 254} {"train_loss": -5.134846210479736, "global_step": 10671, "epoch": 254} {"train_loss": -4.91547966003418, "global_step": 10672, "epoch": 254} {"train_loss": -5.133520126342773, "global_step": 10673, "epoch": 254} {"train_loss": -5.134727478027344, "global_step": 10674, "epoch": 254} {"train_loss": -5.088593482971191, "global_step": 10675, "epoch": 254} {"train_loss": -4.954323768615723, "global_step": 10676, "epoch": 254} {"train_loss": -4.9867777824401855, "global_step": 10677, "epoch": 254} {"train_loss": -4.984367370605469, "global_step": 10678, "epoch": 254} {"train_loss": -4.901244640350342, "global_step": 10679, "epoch": 254} {"train_loss": -5.073535442352295, "global_step": 10680, "epoch": 254} {"train_loss": -5.090029716491699, "global_step": 10681, "epoch": 254} {"train_loss": -4.884316444396973, "global_step": 10682, "epoch": 254} {"train_loss": -4.894390106201172, "global_step": 10683, "epoch": 254} {"train_loss": -5.075134754180908, "global_step": 10684, "epoch": 254} {"train_loss": -5.052324295043945, "global_step": 10685, "epoch": 254} {"train_loss": -4.999627113342285, "global_step": 10686, "epoch": 254} {"train_loss": -5.136606693267822, "global_step": 10687, "epoch": 254} {"train_loss": -5.178759574890137, "global_step": 10688, "epoch": 254} {"train_loss": -5.118770599365234, "global_step": 10689, "epoch": 254} {"train_loss": -5.187065124511719, "global_step": 10690, "epoch": 254} {"train_loss": -5.074756622314453, "global_step": 10691, "epoch": 254} {"train_loss": -5.131482124328613, "global_step": 10692, "epoch": 254} {"train_loss": -5.004530906677246, "global_step": 10693, "epoch": 254} {"train_loss": -5.197044372558594, "global_step": 10694, "epoch": 254} {"train_loss": -5.022286415100098, "global_step": 10695, "epoch": 254} {"train_loss": -5.153660774230957, "global_step": 10696, "epoch": 254} {"train_loss": -5.013189315795898, "global_step": 10697, "epoch": 254} {"train_loss": -5.018157482147217, "global_step": 10698, "epoch": 254} {"train_loss": -5.122157096862793, "global_step": 10699, "epoch": 254} {"train_loss": -5.203759670257568, "global_step": 10700, "epoch": 254} {"train_loss": -5.122471809387207, "global_step": 10701, "epoch": 254} {"train_loss": -4.958042144775391, "global_step": 10702, "epoch": 254} {"train_loss": -4.983773708343506, "global_step": 10703, "epoch": 254} {"train_loss": -5.090231895446777, "global_step": 10704, "epoch": 254} {"train_loss": -5.071236610412598, "global_step": 10705, "epoch": 254} {"train_loss": -5.118440628051758, "global_step": 10706, "epoch": 254} {"train_loss": -5.0487213134765625, "global_step": 10707, "epoch": 254} {"train_loss": -5.246620178222656, "global_step": 10708, "epoch": 254} {"train_loss": -5.05947824886867, "global_step": 10709, "epoch": 254, "val_loss": 82035.7578125} {"train_loss": -4.913691520690918, "global_step": 10710, "epoch": 255} {"train_loss": -4.992455005645752, "global_step": 10711, "epoch": 255} {"train_loss": -5.1255693435668945, "global_step": 10712, "epoch": 255} {"train_loss": -5.01582145690918, "global_step": 10713, "epoch": 255} {"train_loss": -5.1711554527282715, "global_step": 10714, "epoch": 255} {"train_loss": -4.923633098602295, "global_step": 10715, "epoch": 255} {"train_loss": -4.9969377517700195, "global_step": 10716, "epoch": 255} {"train_loss": -4.9887003898620605, "global_step": 10717, "epoch": 255} {"train_loss": -5.0659332275390625, "global_step": 10718, "epoch": 255} {"train_loss": -4.879464626312256, "global_step": 10719, "epoch": 255} {"train_loss": -5.07460880279541, "global_step": 10720, "epoch": 255} {"train_loss": -5.006864547729492, "global_step": 10721, "epoch": 255} {"train_loss": -5.00803279876709, "global_step": 10722, "epoch": 255} {"train_loss": -5.12486457824707, "global_step": 10723, "epoch": 255} {"train_loss": -5.070276260375977, "global_step": 10724, "epoch": 255} {"train_loss": -5.094437599182129, "global_step": 10725, "epoch": 255} {"train_loss": -4.956960678100586, "global_step": 10726, "epoch": 255} {"train_loss": -5.07423210144043, "global_step": 10727, "epoch": 255} {"train_loss": -4.940536975860596, "global_step": 10728, "epoch": 255} {"train_loss": -4.971310615539551, "global_step": 10729, "epoch": 255} {"train_loss": -4.892509460449219, "global_step": 10730, "epoch": 255} {"train_loss": -4.935750961303711, "global_step": 10731, "epoch": 255} {"train_loss": -5.031858444213867, "global_step": 10732, "epoch": 255} {"train_loss": -5.069586753845215, "global_step": 10733, "epoch": 255} {"train_loss": -5.021103858947754, "global_step": 10734, "epoch": 255} {"train_loss": -5.2346601486206055, "global_step": 10735, "epoch": 255} {"train_loss": -4.947196960449219, "global_step": 10736, "epoch": 255} {"train_loss": -5.071086406707764, "global_step": 10737, "epoch": 255} {"train_loss": -5.044702053070068, "global_step": 10738, "epoch": 255} {"train_loss": -5.069311618804932, "global_step": 10739, "epoch": 255} {"train_loss": -5.065495491027832, "global_step": 10740, "epoch": 255} {"train_loss": -5.061767578125, "global_step": 10741, "epoch": 255} {"train_loss": -5.110458850860596, "global_step": 10742, "epoch": 255} {"train_loss": -5.122547149658203, "global_step": 10743, "epoch": 255} {"train_loss": -5.024086952209473, "global_step": 10744, "epoch": 255} {"train_loss": -4.996525764465332, "global_step": 10745, "epoch": 255} {"train_loss": -4.916229248046875, "global_step": 10746, "epoch": 255} {"train_loss": -5.180080890655518, "global_step": 10747, "epoch": 255} {"train_loss": -5.119277477264404, "global_step": 10748, "epoch": 255} {"train_loss": -5.090383529663086, "global_step": 10749, "epoch": 255} {"train_loss": -5.023216247558594, "global_step": 10750, "epoch": 255} {"train_loss": -5.038378636042277, "global_step": 10751, "epoch": 255, "val_loss": 80702.4609375} {"train_loss": -5.083837032318115, "global_step": 10752, "epoch": 256} {"train_loss": -5.143023490905762, "global_step": 10753, "epoch": 256} {"train_loss": -5.187141418457031, "global_step": 10754, "epoch": 256} {"train_loss": -5.127216339111328, "global_step": 10755, "epoch": 256} {"train_loss": -5.091954231262207, "global_step": 10756, "epoch": 256} {"train_loss": -4.987787246704102, "global_step": 10757, "epoch": 256} {"train_loss": -5.0344438552856445, "global_step": 10758, "epoch": 256} {"train_loss": -5.060375213623047, "global_step": 10759, "epoch": 256} {"train_loss": -4.958890914916992, "global_step": 10760, "epoch": 256} {"train_loss": -4.9922590255737305, "global_step": 10761, "epoch": 256} {"train_loss": -5.180768966674805, "global_step": 10762, "epoch": 256} {"train_loss": -5.043883800506592, "global_step": 10763, "epoch": 256} {"train_loss": -4.853996276855469, "global_step": 10764, "epoch": 256} {"train_loss": -5.110942363739014, "global_step": 10765, "epoch": 256} {"train_loss": -4.767402172088623, "global_step": 10766, "epoch": 256} {"train_loss": -4.63848876953125, "global_step": 10767, "epoch": 256} {"train_loss": -5.012054443359375, "global_step": 10768, "epoch": 256} {"train_loss": -4.93569803237915, "global_step": 10769, "epoch": 256} {"train_loss": -4.907742500305176, "global_step": 10770, "epoch": 256} {"train_loss": -5.134661674499512, "global_step": 10771, "epoch": 256} {"train_loss": -4.828603744506836, "global_step": 10772, "epoch": 256} {"train_loss": -5.0270185470581055, "global_step": 10773, "epoch": 256} {"train_loss": -5.143451690673828, "global_step": 10774, "epoch": 256} {"train_loss": -4.823215007781982, "global_step": 10775, "epoch": 256} {"train_loss": -4.953714370727539, "global_step": 10776, "epoch": 256} {"train_loss": -5.05070161819458, "global_step": 10777, "epoch": 256} {"train_loss": -5.069990158081055, "global_step": 10778, "epoch": 256} {"train_loss": -5.091631889343262, "global_step": 10779, "epoch": 256} {"train_loss": -5.100687026977539, "global_step": 10780, "epoch": 256} {"train_loss": -4.888064384460449, "global_step": 10781, "epoch": 256} {"train_loss": -5.0708909034729, "global_step": 10782, "epoch": 256} {"train_loss": -5.224178314208984, "global_step": 10783, "epoch": 256} {"train_loss": -5.095802307128906, "global_step": 10784, "epoch": 256} {"train_loss": -5.230093002319336, "global_step": 10785, "epoch": 256} {"train_loss": -5.00578498840332, "global_step": 10786, "epoch": 256} {"train_loss": -5.0774312019348145, "global_step": 10787, "epoch": 256} {"train_loss": -5.001880645751953, "global_step": 10788, "epoch": 256} {"train_loss": -4.961490154266357, "global_step": 10789, "epoch": 256} {"train_loss": -4.926725387573242, "global_step": 10790, "epoch": 256} {"train_loss": -4.960262775421143, "global_step": 10791, "epoch": 256} {"train_loss": -5.3578596115112305, "global_step": 10792, "epoch": 256} {"train_loss": -5.026233900161016, "global_step": 10793, "epoch": 256, "val_loss": 80398.765625} {"train_loss": -5.1034698486328125, "global_step": 10794, "epoch": 257} {"train_loss": -5.16324520111084, "global_step": 10795, "epoch": 257} {"train_loss": -5.155591011047363, "global_step": 10796, "epoch": 257} {"train_loss": -5.1428375244140625, "global_step": 10797, "epoch": 257} {"train_loss": -5.050569534301758, "global_step": 10798, "epoch": 257} {"train_loss": -4.90582799911499, "global_step": 10799, "epoch": 257} {"train_loss": -5.078392028808594, "global_step": 10800, "epoch": 257} {"train_loss": -4.956564903259277, "global_step": 10801, "epoch": 257} {"train_loss": -5.078296661376953, "global_step": 10802, "epoch": 257} {"train_loss": -5.006364822387695, "global_step": 10803, "epoch": 257} {"train_loss": -4.797240734100342, "global_step": 10804, "epoch": 257} {"train_loss": -4.912785530090332, "global_step": 10805, "epoch": 257} {"train_loss": -4.988391399383545, "global_step": 10806, "epoch": 257} {"train_loss": -4.842648506164551, "global_step": 10807, "epoch": 257} {"train_loss": -4.961816310882568, "global_step": 10808, "epoch": 257} {"train_loss": -4.964448928833008, "global_step": 10809, "epoch": 257} {"train_loss": -4.642190933227539, "global_step": 10810, "epoch": 257} {"train_loss": -5.002410888671875, "global_step": 10811, "epoch": 257} {"train_loss": -4.942863464355469, "global_step": 10812, "epoch": 257} {"train_loss": -4.937464714050293, "global_step": 10813, "epoch": 257} {"train_loss": -5.030585289001465, "global_step": 10814, "epoch": 257} {"train_loss": -4.878235340118408, "global_step": 10815, "epoch": 257} {"train_loss": -5.036545276641846, "global_step": 10816, "epoch": 257} {"train_loss": -4.9698591232299805, "global_step": 10817, "epoch": 257} {"train_loss": -5.182502269744873, "global_step": 10818, "epoch": 257} {"train_loss": -4.878787994384766, "global_step": 10819, "epoch": 257} {"train_loss": -5.102983474731445, "global_step": 10820, "epoch": 257} {"train_loss": -5.068484306335449, "global_step": 10821, "epoch": 257} {"train_loss": -5.143699645996094, "global_step": 10822, "epoch": 257} {"train_loss": -5.155207633972168, "global_step": 10823, "epoch": 257} {"train_loss": -4.830868721008301, "global_step": 10824, "epoch": 257} {"train_loss": -5.095982074737549, "global_step": 10825, "epoch": 257} {"train_loss": -5.1055192947387695, "global_step": 10826, "epoch": 257} {"train_loss": -5.055422782897949, "global_step": 10827, "epoch": 257} {"train_loss": -5.08899450302124, "global_step": 10828, "epoch": 257} {"train_loss": -5.074560165405273, "global_step": 10829, "epoch": 257} {"train_loss": -5.060961723327637, "global_step": 10830, "epoch": 257} {"train_loss": -5.054308891296387, "global_step": 10831, "epoch": 257} {"train_loss": -5.033729553222656, "global_step": 10832, "epoch": 257} {"train_loss": -4.998295783996582, "global_step": 10833, "epoch": 257} {"train_loss": -5.0048418045043945, "global_step": 10834, "epoch": 257} {"train_loss": -5.0122567017873125, "global_step": 10835, "epoch": 257, "val_loss": 81360.171875} {"train_loss": -5.012551307678223, "global_step": 10836, "epoch": 258} {"train_loss": -4.99672794342041, "global_step": 10837, "epoch": 258} {"train_loss": -5.020440101623535, "global_step": 10838, "epoch": 258} {"train_loss": -5.009016036987305, "global_step": 10839, "epoch": 258} {"train_loss": -5.078125476837158, "global_step": 10840, "epoch": 258} {"train_loss": -5.046479225158691, "global_step": 10841, "epoch": 258} {"train_loss": -4.912728786468506, "global_step": 10842, "epoch": 258} {"train_loss": -4.942902565002441, "global_step": 10843, "epoch": 258} {"train_loss": -5.150401592254639, "global_step": 10844, "epoch": 258} {"train_loss": -4.879165172576904, "global_step": 10845, "epoch": 258} {"train_loss": -5.08324670791626, "global_step": 10846, "epoch": 258} {"train_loss": -4.808012962341309, "global_step": 10847, "epoch": 258} {"train_loss": -4.955777645111084, "global_step": 10848, "epoch": 258} {"train_loss": -4.965001106262207, "global_step": 10849, "epoch": 258} {"train_loss": -5.054815769195557, "global_step": 10850, "epoch": 258} {"train_loss": -5.0625410079956055, "global_step": 10851, "epoch": 258} {"train_loss": -4.973875522613525, "global_step": 10852, "epoch": 258} {"train_loss": -5.004865646362305, "global_step": 10853, "epoch": 258} {"train_loss": -5.077859878540039, "global_step": 10854, "epoch": 258} {"train_loss": -5.011061668395996, "global_step": 10855, "epoch": 258} {"train_loss": -5.039201736450195, "global_step": 10856, "epoch": 258} {"train_loss": -5.106828689575195, "global_step": 10857, "epoch": 258} {"train_loss": -5.023797988891602, "global_step": 10858, "epoch": 258} {"train_loss": -5.1361188888549805, "global_step": 10859, "epoch": 258} {"train_loss": -5.1555705070495605, "global_step": 10860, "epoch": 258} {"train_loss": -5.087335586547852, "global_step": 10861, "epoch": 258} {"train_loss": -5.01571798324585, "global_step": 10862, "epoch": 258} {"train_loss": -5.056173801422119, "global_step": 10863, "epoch": 258} {"train_loss": -5.259085178375244, "global_step": 10864, "epoch": 258} {"train_loss": -5.15393590927124, "global_step": 10865, "epoch": 258} {"train_loss": -5.1829681396484375, "global_step": 10866, "epoch": 258} {"train_loss": -5.159127712249756, "global_step": 10867, "epoch": 258} {"train_loss": -5.027641296386719, "global_step": 10868, "epoch": 258} {"train_loss": -5.009190559387207, "global_step": 10869, "epoch": 258} {"train_loss": -5.149559497833252, "global_step": 10870, "epoch": 258} {"train_loss": -5.012989044189453, "global_step": 10871, "epoch": 258} {"train_loss": -4.897674560546875, "global_step": 10872, "epoch": 258} {"train_loss": -5.04223108291626, "global_step": 10873, "epoch": 258} {"train_loss": -4.953925132751465, "global_step": 10874, "epoch": 258} {"train_loss": -5.056131362915039, "global_step": 10875, "epoch": 258} {"train_loss": -5.22622013092041, "global_step": 10876, "epoch": 258} {"train_loss": -5.045818215324765, "global_step": 10877, "epoch": 258, "val_loss": 80507.28125} {"train_loss": -4.980960845947266, "global_step": 10878, "epoch": 259} {"train_loss": -5.195870399475098, "global_step": 10879, "epoch": 259} {"train_loss": -4.896243095397949, "global_step": 10880, "epoch": 259} {"train_loss": -4.866294860839844, "global_step": 10881, "epoch": 259} {"train_loss": -4.9945549964904785, "global_step": 10882, "epoch": 259} {"train_loss": -5.005198001861572, "global_step": 10883, "epoch": 259} {"train_loss": -4.986142158508301, "global_step": 10884, "epoch": 259} {"train_loss": -4.974376201629639, "global_step": 10885, "epoch": 259} {"train_loss": -5.143911361694336, "global_step": 10886, "epoch": 259} {"train_loss": -5.034213066101074, "global_step": 10887, "epoch": 259} {"train_loss": -4.992302894592285, "global_step": 10888, "epoch": 259} {"train_loss": -4.7991437911987305, "global_step": 10889, "epoch": 259} {"train_loss": -5.042715072631836, "global_step": 10890, "epoch": 259} {"train_loss": -5.060614585876465, "global_step": 10891, "epoch": 259} {"train_loss": -4.870796203613281, "global_step": 10892, "epoch": 259} {"train_loss": -4.957150936126709, "global_step": 10893, "epoch": 259} {"train_loss": -5.025147438049316, "global_step": 10894, "epoch": 259} {"train_loss": -4.830992698669434, "global_step": 10895, "epoch": 259} {"train_loss": -5.137680530548096, "global_step": 10896, "epoch": 259} {"train_loss": -4.914305686950684, "global_step": 10897, "epoch": 259} {"train_loss": -4.796187877655029, "global_step": 10898, "epoch": 259} {"train_loss": -5.083083629608154, "global_step": 10899, "epoch": 259} {"train_loss": -4.912615776062012, "global_step": 10900, "epoch": 259} {"train_loss": -4.816591739654541, "global_step": 10901, "epoch": 259} {"train_loss": -5.056665897369385, "global_step": 10902, "epoch": 259} {"train_loss": -4.799107074737549, "global_step": 10903, "epoch": 259} {"train_loss": -5.013676643371582, "global_step": 10904, "epoch": 259} {"train_loss": -4.896193504333496, "global_step": 10905, "epoch": 259} {"train_loss": -5.154653549194336, "global_step": 10906, "epoch": 259} {"train_loss": -4.899171829223633, "global_step": 10907, "epoch": 259} {"train_loss": -5.101496696472168, "global_step": 10908, "epoch": 259} {"train_loss": -5.088071823120117, "global_step": 10909, "epoch": 259} {"train_loss": -5.071052551269531, "global_step": 10910, "epoch": 259} {"train_loss": -4.978192329406738, "global_step": 10911, "epoch": 259} {"train_loss": -4.923044204711914, "global_step": 10912, "epoch": 259} {"train_loss": -5.100369453430176, "global_step": 10913, "epoch": 259} {"train_loss": -4.9770612716674805, "global_step": 10914, "epoch": 259} {"train_loss": -4.9893717765808105, "global_step": 10915, "epoch": 259} {"train_loss": -5.053491592407227, "global_step": 10916, "epoch": 259} {"train_loss": -5.118075370788574, "global_step": 10917, "epoch": 259} {"train_loss": -5.138308525085449, "global_step": 10918, "epoch": 259} {"train_loss": -4.991011017844791, "global_step": 10919, "epoch": 259, "val_loss": 80355.3671875} {"train_loss": -5.021984577178955, "global_step": 10920, "epoch": 260} {"train_loss": -5.2595014572143555, "global_step": 10921, "epoch": 260} {"train_loss": -5.157130241394043, "global_step": 10922, "epoch": 260} {"train_loss": -5.0500288009643555, "global_step": 10923, "epoch": 260} {"train_loss": -5.174080848693848, "global_step": 10924, "epoch": 260} {"train_loss": -5.127110004425049, "global_step": 10925, "epoch": 260} {"train_loss": -5.163133144378662, "global_step": 10926, "epoch": 260} {"train_loss": -5.082164287567139, "global_step": 10927, "epoch": 260} {"train_loss": -5.013245582580566, "global_step": 10928, "epoch": 260} {"train_loss": -5.047848701477051, "global_step": 10929, "epoch": 260} {"train_loss": -5.133863925933838, "global_step": 10930, "epoch": 260} {"train_loss": -5.110918045043945, "global_step": 10931, "epoch": 260} {"train_loss": -5.131548881530762, "global_step": 10932, "epoch": 260} {"train_loss": -5.107246398925781, "global_step": 10933, "epoch": 260} {"train_loss": -5.122060298919678, "global_step": 10934, "epoch": 260} {"train_loss": -5.042821884155273, "global_step": 10935, "epoch": 260} {"train_loss": -5.077406883239746, "global_step": 10936, "epoch": 260} {"train_loss": -5.123020172119141, "global_step": 10937, "epoch": 260} {"train_loss": -5.10836935043335, "global_step": 10938, "epoch": 260} {"train_loss": -4.966277122497559, "global_step": 10939, "epoch": 260} {"train_loss": -5.088282585144043, "global_step": 10940, "epoch": 260} {"train_loss": -5.103999614715576, "global_step": 10941, "epoch": 260} {"train_loss": -5.301688194274902, "global_step": 10942, "epoch": 260} {"train_loss": -4.94260835647583, "global_step": 10943, "epoch": 260} {"train_loss": -5.055721282958984, "global_step": 10944, "epoch": 260} {"train_loss": -5.008754730224609, "global_step": 10945, "epoch": 260} {"train_loss": -5.012823104858398, "global_step": 10946, "epoch": 260} {"train_loss": -5.04966926574707, "global_step": 10947, "epoch": 260} {"train_loss": -5.030729293823242, "global_step": 10948, "epoch": 260} {"train_loss": -5.169990539550781, "global_step": 10949, "epoch": 260} {"train_loss": -5.109711170196533, "global_step": 10950, "epoch": 260} {"train_loss": -5.015969753265381, "global_step": 10951, "epoch": 260} {"train_loss": -5.229402542114258, "global_step": 10952, "epoch": 260} {"train_loss": -5.127141952514648, "global_step": 10953, "epoch": 260} {"train_loss": -5.088050842285156, "global_step": 10954, "epoch": 260} {"train_loss": -5.103239059448242, "global_step": 10955, "epoch": 260} {"train_loss": -4.991206169128418, "global_step": 10956, "epoch": 260} {"train_loss": -5.022172927856445, "global_step": 10957, "epoch": 260} {"train_loss": -5.1497602462768555, "global_step": 10958, "epoch": 260} {"train_loss": -5.2341413497924805, "global_step": 10959, "epoch": 260} {"train_loss": -4.8967814445495605, "global_step": 10960, "epoch": 260} {"train_loss": -5.089873268490746, "global_step": 10961, "epoch": 260, "val_loss": 80907.578125} {"train_loss": -4.973109245300293, "global_step": 10962, "epoch": 261} {"train_loss": -5.053686141967773, "global_step": 10963, "epoch": 261} {"train_loss": -5.082474231719971, "global_step": 10964, "epoch": 261} {"train_loss": -4.98757266998291, "global_step": 10965, "epoch": 261} {"train_loss": -5.221833229064941, "global_step": 10966, "epoch": 261} {"train_loss": -5.221589088439941, "global_step": 10967, "epoch": 261} {"train_loss": -5.08270788192749, "global_step": 10968, "epoch": 261} {"train_loss": -5.018248558044434, "global_step": 10969, "epoch": 261} {"train_loss": -5.0649094581604, "global_step": 10970, "epoch": 261} {"train_loss": -5.082675933837891, "global_step": 10971, "epoch": 261} {"train_loss": -5.046283721923828, "global_step": 10972, "epoch": 261} {"train_loss": -5.037551403045654, "global_step": 10973, "epoch": 261} {"train_loss": -4.985107421875, "global_step": 10974, "epoch": 261} {"train_loss": -5.0194549560546875, "global_step": 10975, "epoch": 261} {"train_loss": -5.056117057800293, "global_step": 10976, "epoch": 261} {"train_loss": -5.0062150955200195, "global_step": 10977, "epoch": 261} {"train_loss": -5.059604167938232, "global_step": 10978, "epoch": 261} {"train_loss": -4.798304080963135, "global_step": 10979, "epoch": 261} {"train_loss": -4.95641565322876, "global_step": 10980, "epoch": 261} {"train_loss": -5.047473430633545, "global_step": 10981, "epoch": 261} {"train_loss": -4.798331260681152, "global_step": 10982, "epoch": 261} {"train_loss": -5.151309013366699, "global_step": 10983, "epoch": 261} {"train_loss": -5.0350542068481445, "global_step": 10984, "epoch": 261} {"train_loss": -5.013993263244629, "global_step": 10985, "epoch": 261} {"train_loss": -5.180323123931885, "global_step": 10986, "epoch": 261} {"train_loss": -5.114190101623535, "global_step": 10987, "epoch": 261} {"train_loss": -5.11707878112793, "global_step": 10988, "epoch": 261} {"train_loss": -5.082101345062256, "global_step": 10989, "epoch": 261} {"train_loss": -5.049833297729492, "global_step": 10990, "epoch": 261} {"train_loss": -5.047819137573242, "global_step": 10991, "epoch": 261} {"train_loss": -4.965754508972168, "global_step": 10992, "epoch": 261} {"train_loss": -5.190543174743652, "global_step": 10993, "epoch": 261} {"train_loss": -4.995092391967773, "global_step": 10994, "epoch": 261} {"train_loss": -5.118666172027588, "global_step": 10995, "epoch": 261} {"train_loss": -5.0633931159973145, "global_step": 10996, "epoch": 261} {"train_loss": -4.964778900146484, "global_step": 10997, "epoch": 261} {"train_loss": -5.062313079833984, "global_step": 10998, "epoch": 261} {"train_loss": -5.005583763122559, "global_step": 10999, "epoch": 261} {"train_loss": -5.054413795471191, "global_step": 11000, "epoch": 261} {"train_loss": -5.023716926574707, "global_step": 11001, "epoch": 261} {"train_loss": -4.872644901275635, "global_step": 11002, "epoch": 261} {"train_loss": -5.039331163678851, "global_step": 11003, "epoch": 261, "val_loss": 80272.8671875} {"train_loss": -5.126811504364014, "global_step": 11004, "epoch": 262} {"train_loss": -5.073081970214844, "global_step": 11005, "epoch": 262} {"train_loss": -5.068495750427246, "global_step": 11006, "epoch": 262} {"train_loss": -4.976231575012207, "global_step": 11007, "epoch": 262} {"train_loss": -5.016287803649902, "global_step": 11008, "epoch": 262} {"train_loss": -5.196639537811279, "global_step": 11009, "epoch": 262} {"train_loss": -4.887965202331543, "global_step": 11010, "epoch": 262} {"train_loss": -5.0160017013549805, "global_step": 11011, "epoch": 262} {"train_loss": -4.979987144470215, "global_step": 11012, "epoch": 262} {"train_loss": -4.862758159637451, "global_step": 11013, "epoch": 262} {"train_loss": -4.908546447753906, "global_step": 11014, "epoch": 262} {"train_loss": -5.153916358947754, "global_step": 11015, "epoch": 262} {"train_loss": -4.793993949890137, "global_step": 11016, "epoch": 262} {"train_loss": -4.970273494720459, "global_step": 11017, "epoch": 262} {"train_loss": -5.023011207580566, "global_step": 11018, "epoch": 262} {"train_loss": -4.999236106872559, "global_step": 11019, "epoch": 262} {"train_loss": -4.9220290184021, "global_step": 11020, "epoch": 262} {"train_loss": -4.800075531005859, "global_step": 11021, "epoch": 262} {"train_loss": -5.043293476104736, "global_step": 11022, "epoch": 262} {"train_loss": -4.826945781707764, "global_step": 11023, "epoch": 262} {"train_loss": -5.023309707641602, "global_step": 11024, "epoch": 262} {"train_loss": -4.995067596435547, "global_step": 11025, "epoch": 262} {"train_loss": -4.979733467102051, "global_step": 11026, "epoch": 262} {"train_loss": -5.045195579528809, "global_step": 11027, "epoch": 262} {"train_loss": -4.865677833557129, "global_step": 11028, "epoch": 262} {"train_loss": -5.0144805908203125, "global_step": 11029, "epoch": 262} {"train_loss": -5.033997058868408, "global_step": 11030, "epoch": 262} {"train_loss": -4.976963520050049, "global_step": 11031, "epoch": 262} {"train_loss": -5.060486793518066, "global_step": 11032, "epoch": 262} {"train_loss": -4.9373016357421875, "global_step": 11033, "epoch": 262} {"train_loss": -4.931495666503906, "global_step": 11034, "epoch": 262} {"train_loss": -5.0475263595581055, "global_step": 11035, "epoch": 262} {"train_loss": -5.00543737411499, "global_step": 11036, "epoch": 262} {"train_loss": -5.206245422363281, "global_step": 11037, "epoch": 262} {"train_loss": -5.122664451599121, "global_step": 11038, "epoch": 262} {"train_loss": -5.001134872436523, "global_step": 11039, "epoch": 262} {"train_loss": -5.039529323577881, "global_step": 11040, "epoch": 262} {"train_loss": -5.198554992675781, "global_step": 11041, "epoch": 262} {"train_loss": -4.989289283752441, "global_step": 11042, "epoch": 262} {"train_loss": -5.140328407287598, "global_step": 11043, "epoch": 262} {"train_loss": -5.170144081115723, "global_step": 11044, "epoch": 262} {"train_loss": -5.009821471713838, "global_step": 11045, "epoch": 262, "val_loss": 81122.21875} {"train_loss": -5.083653450012207, "global_step": 11046, "epoch": 263} {"train_loss": -5.237856864929199, "global_step": 11047, "epoch": 263} {"train_loss": -4.966324806213379, "global_step": 11048, "epoch": 263} {"train_loss": -5.273234844207764, "global_step": 11049, "epoch": 263} {"train_loss": -5.100341796875, "global_step": 11050, "epoch": 263} {"train_loss": -5.042447566986084, "global_step": 11051, "epoch": 263} {"train_loss": -5.10923957824707, "global_step": 11052, "epoch": 263} {"train_loss": -5.034278392791748, "global_step": 11053, "epoch": 263} {"train_loss": -5.0632524490356445, "global_step": 11054, "epoch": 263} {"train_loss": -5.1554155349731445, "global_step": 11055, "epoch": 263} {"train_loss": -4.983138084411621, "global_step": 11056, "epoch": 263} {"train_loss": -5.013822555541992, "global_step": 11057, "epoch": 263} {"train_loss": -5.120694637298584, "global_step": 11058, "epoch": 263} {"train_loss": -5.052530288696289, "global_step": 11059, "epoch": 263} {"train_loss": -5.061581134796143, "global_step": 11060, "epoch": 263} {"train_loss": -5.010169982910156, "global_step": 11061, "epoch": 263} {"train_loss": -5.170295238494873, "global_step": 11062, "epoch": 263} {"train_loss": -5.074704647064209, "global_step": 11063, "epoch": 263} {"train_loss": -4.9589948654174805, "global_step": 11064, "epoch": 263} {"train_loss": -5.0358357429504395, "global_step": 11065, "epoch": 263} {"train_loss": -5.15117073059082, "global_step": 11066, "epoch": 263} {"train_loss": -4.9460129737854, "global_step": 11067, "epoch": 263} {"train_loss": -5.131983757019043, "global_step": 11068, "epoch": 263} {"train_loss": -4.966324329376221, "global_step": 11069, "epoch": 263} {"train_loss": -4.972116470336914, "global_step": 11070, "epoch": 263} {"train_loss": -4.972539901733398, "global_step": 11071, "epoch": 263} {"train_loss": -4.983174800872803, "global_step": 11072, "epoch": 263} {"train_loss": -5.131573677062988, "global_step": 11073, "epoch": 263} {"train_loss": -5.02895975112915, "global_step": 11074, "epoch": 263} {"train_loss": -5.09489107131958, "global_step": 11075, "epoch": 263} {"train_loss": -5.037434101104736, "global_step": 11076, "epoch": 263} {"train_loss": -4.826920986175537, "global_step": 11077, "epoch": 263} {"train_loss": -5.175107955932617, "global_step": 11078, "epoch": 263} {"train_loss": -5.016495704650879, "global_step": 11079, "epoch": 263} {"train_loss": -4.949735641479492, "global_step": 11080, "epoch": 263} {"train_loss": -5.038140296936035, "global_step": 11081, "epoch": 263} {"train_loss": -4.9268012046813965, "global_step": 11082, "epoch": 263} {"train_loss": -4.737059116363525, "global_step": 11083, "epoch": 263} {"train_loss": -5.034323692321777, "global_step": 11084, "epoch": 263} {"train_loss": -5.113269329071045, "global_step": 11085, "epoch": 263} {"train_loss": -4.989972114562988, "global_step": 11086, "epoch": 263} {"train_loss": -5.04304187638419, "global_step": 11087, "epoch": 263, "val_loss": 80880.4609375} {"train_loss": -4.917470455169678, "global_step": 11088, "epoch": 264} {"train_loss": -4.954082489013672, "global_step": 11089, "epoch": 264} {"train_loss": -5.056540012359619, "global_step": 11090, "epoch": 264} {"train_loss": -5.098979949951172, "global_step": 11091, "epoch": 264} {"train_loss": -5.104026794433594, "global_step": 11092, "epoch": 264} {"train_loss": -5.154890060424805, "global_step": 11093, "epoch": 264} {"train_loss": -5.036601543426514, "global_step": 11094, "epoch": 264} {"train_loss": -5.154653549194336, "global_step": 11095, "epoch": 264} {"train_loss": -5.13551139831543, "global_step": 11096, "epoch": 264} {"train_loss": -5.1126708984375, "global_step": 11097, "epoch": 264} {"train_loss": -5.089987754821777, "global_step": 11098, "epoch": 264} {"train_loss": -5.143127918243408, "global_step": 11099, "epoch": 264} {"train_loss": -5.1806745529174805, "global_step": 11100, "epoch": 264} {"train_loss": -5.153426170349121, "global_step": 11101, "epoch": 264} {"train_loss": -5.197741508483887, "global_step": 11102, "epoch": 264} {"train_loss": -5.12408447265625, "global_step": 11103, "epoch": 264} {"train_loss": -5.091335773468018, "global_step": 11104, "epoch": 264} {"train_loss": -4.993127822875977, "global_step": 11105, "epoch": 264} {"train_loss": -5.113476753234863, "global_step": 11106, "epoch": 264} {"train_loss": -5.203886032104492, "global_step": 11107, "epoch": 264} {"train_loss": -5.1421661376953125, "global_step": 11108, "epoch": 264} {"train_loss": -5.103426456451416, "global_step": 11109, "epoch": 264} {"train_loss": -4.984020233154297, "global_step": 11110, "epoch": 264} {"train_loss": -5.135149955749512, "global_step": 11111, "epoch": 264} {"train_loss": -4.979912757873535, "global_step": 11112, "epoch": 264} {"train_loss": -5.103767395019531, "global_step": 11113, "epoch": 264} {"train_loss": -5.035887718200684, "global_step": 11114, "epoch": 264} {"train_loss": -5.033030033111572, "global_step": 11115, "epoch": 264} {"train_loss": -5.061520099639893, "global_step": 11116, "epoch": 264} {"train_loss": -5.007438659667969, "global_step": 11117, "epoch": 264} {"train_loss": -5.198315620422363, "global_step": 11118, "epoch": 264} {"train_loss": -5.0517377853393555, "global_step": 11119, "epoch": 264} {"train_loss": -5.133197784423828, "global_step": 11120, "epoch": 264} {"train_loss": -4.9591755867004395, "global_step": 11121, "epoch": 264} {"train_loss": -4.895267486572266, "global_step": 11122, "epoch": 264} {"train_loss": -5.146336555480957, "global_step": 11123, "epoch": 264} {"train_loss": -5.220412254333496, "global_step": 11124, "epoch": 264} {"train_loss": -5.032507419586182, "global_step": 11125, "epoch": 264} {"train_loss": -5.060544013977051, "global_step": 11126, "epoch": 264} {"train_loss": -5.149037837982178, "global_step": 11127, "epoch": 264} {"train_loss": -5.106563568115234, "global_step": 11128, "epoch": 264} {"train_loss": -5.089957861673264, "global_step": 11129, "epoch": 264, "val_loss": 80271.828125} {"train_loss": -5.116219520568848, "global_step": 11130, "epoch": 265} {"train_loss": -5.0057783126831055, "global_step": 11131, "epoch": 265} {"train_loss": -5.162014007568359, "global_step": 11132, "epoch": 265} {"train_loss": -5.064534664154053, "global_step": 11133, "epoch": 265} {"train_loss": -5.019336700439453, "global_step": 11134, "epoch": 265} {"train_loss": -5.102373123168945, "global_step": 11135, "epoch": 265} {"train_loss": -4.996888637542725, "global_step": 11136, "epoch": 265} {"train_loss": -5.005727767944336, "global_step": 11137, "epoch": 265} {"train_loss": -4.984482765197754, "global_step": 11138, "epoch": 265} {"train_loss": -5.1057658195495605, "global_step": 11139, "epoch": 265} {"train_loss": -5.144067764282227, "global_step": 11140, "epoch": 265} {"train_loss": -4.986578941345215, "global_step": 11141, "epoch": 265} {"train_loss": -5.173654079437256, "global_step": 11142, "epoch": 265} {"train_loss": -5.04616641998291, "global_step": 11143, "epoch": 265} {"train_loss": -5.084572792053223, "global_step": 11144, "epoch": 265} {"train_loss": -5.072878837585449, "global_step": 11145, "epoch": 265} {"train_loss": -5.049036026000977, "global_step": 11146, "epoch": 265} {"train_loss": -5.100982666015625, "global_step": 11147, "epoch": 265} {"train_loss": -5.094455718994141, "global_step": 11148, "epoch": 265} {"train_loss": -5.199322700500488, "global_step": 11149, "epoch": 265} {"train_loss": -5.034655570983887, "global_step": 11150, "epoch": 265} {"train_loss": -5.157920837402344, "global_step": 11151, "epoch": 265} {"train_loss": -5.142338752746582, "global_step": 11152, "epoch": 265} {"train_loss": -5.072760581970215, "global_step": 11153, "epoch": 265} {"train_loss": -5.092317581176758, "global_step": 11154, "epoch": 265} {"train_loss": -5.0441389083862305, "global_step": 11155, "epoch": 265} {"train_loss": -5.007984161376953, "global_step": 11156, "epoch": 265} {"train_loss": -5.077239036560059, "global_step": 11157, "epoch": 265} {"train_loss": -5.041688919067383, "global_step": 11158, "epoch": 265} {"train_loss": -5.174581050872803, "global_step": 11159, "epoch": 265} {"train_loss": -5.088401794433594, "global_step": 11160, "epoch": 265} {"train_loss": -5.118983268737793, "global_step": 11161, "epoch": 265} {"train_loss": -5.083806037902832, "global_step": 11162, "epoch": 265} {"train_loss": -5.050588130950928, "global_step": 11163, "epoch": 265} {"train_loss": -5.151172637939453, "global_step": 11164, "epoch": 265} {"train_loss": -5.116941452026367, "global_step": 11165, "epoch": 265} {"train_loss": -5.167150497436523, "global_step": 11166, "epoch": 265} {"train_loss": -5.058922290802002, "global_step": 11167, "epoch": 265} {"train_loss": -5.008508682250977, "global_step": 11168, "epoch": 265} {"train_loss": -5.16672420501709, "global_step": 11169, "epoch": 265} {"train_loss": -4.9839653968811035, "global_step": 11170, "epoch": 265} {"train_loss": -5.0793850762503485, "global_step": 11171, "epoch": 265, "val_loss": 80062.5390625} {"train_loss": -5.116222381591797, "global_step": 11172, "epoch": 266} {"train_loss": -4.9102983474731445, "global_step": 11173, "epoch": 266} {"train_loss": -5.163822174072266, "global_step": 11174, "epoch": 266} {"train_loss": -5.129812240600586, "global_step": 11175, "epoch": 266} {"train_loss": -5.128800392150879, "global_step": 11176, "epoch": 266} {"train_loss": -5.016789436340332, "global_step": 11177, "epoch": 266} {"train_loss": -5.122100830078125, "global_step": 11178, "epoch": 266} {"train_loss": -5.072969436645508, "global_step": 11179, "epoch": 266} {"train_loss": -5.072196960449219, "global_step": 11180, "epoch": 266} {"train_loss": -5.063875198364258, "global_step": 11181, "epoch": 266} {"train_loss": -5.006870269775391, "global_step": 11182, "epoch": 266} {"train_loss": -4.9973907470703125, "global_step": 11183, "epoch": 266} {"train_loss": -5.223540782928467, "global_step": 11184, "epoch": 266} {"train_loss": -5.097832679748535, "global_step": 11185, "epoch": 266} {"train_loss": -5.09591817855835, "global_step": 11186, "epoch": 266} {"train_loss": -5.073493480682373, "global_step": 11187, "epoch": 266} {"train_loss": -5.066461086273193, "global_step": 11188, "epoch": 266} {"train_loss": -5.1149749755859375, "global_step": 11189, "epoch": 266} {"train_loss": -5.031608581542969, "global_step": 11190, "epoch": 266} {"train_loss": -4.9822096824646, "global_step": 11191, "epoch": 266} {"train_loss": -5.136420249938965, "global_step": 11192, "epoch": 266} {"train_loss": -5.072099685668945, "global_step": 11193, "epoch": 266} {"train_loss": -5.062575340270996, "global_step": 11194, "epoch": 266} {"train_loss": -5.169133186340332, "global_step": 11195, "epoch": 266} {"train_loss": -5.063409805297852, "global_step": 11196, "epoch": 266} {"train_loss": -5.146145343780518, "global_step": 11197, "epoch": 266} {"train_loss": -5.01043701171875, "global_step": 11198, "epoch": 266} {"train_loss": -5.1567182540893555, "global_step": 11199, "epoch": 266} {"train_loss": -5.106794834136963, "global_step": 11200, "epoch": 266} {"train_loss": -5.20407772064209, "global_step": 11201, "epoch": 266} {"train_loss": -5.215156555175781, "global_step": 11202, "epoch": 266} {"train_loss": -4.971429347991943, "global_step": 11203, "epoch": 266} {"train_loss": -4.920668125152588, "global_step": 11204, "epoch": 266} {"train_loss": -5.104546070098877, "global_step": 11205, "epoch": 266} {"train_loss": -4.845682621002197, "global_step": 11206, "epoch": 266} {"train_loss": -4.937480926513672, "global_step": 11207, "epoch": 266} {"train_loss": -5.077596664428711, "global_step": 11208, "epoch": 266} {"train_loss": -5.000063419342041, "global_step": 11209, "epoch": 266} {"train_loss": -4.993681907653809, "global_step": 11210, "epoch": 266} {"train_loss": -5.0650410652160645, "global_step": 11211, "epoch": 266} {"train_loss": -4.900646686553955, "global_step": 11212, "epoch": 266} {"train_loss": -5.064065263384864, "global_step": 11213, "epoch": 266, "val_loss": 80429.0} {"train_loss": -4.926772117614746, "global_step": 11214, "epoch": 267} {"train_loss": -4.966391563415527, "global_step": 11215, "epoch": 267} {"train_loss": -4.998728275299072, "global_step": 11216, "epoch": 267} {"train_loss": -4.959817409515381, "global_step": 11217, "epoch": 267} {"train_loss": -4.896142959594727, "global_step": 11218, "epoch": 267} {"train_loss": -5.027242660522461, "global_step": 11219, "epoch": 267} {"train_loss": -5.007194519042969, "global_step": 11220, "epoch": 267} {"train_loss": -4.857816696166992, "global_step": 11221, "epoch": 267} {"train_loss": -5.124314308166504, "global_step": 11222, "epoch": 267} {"train_loss": -4.983750820159912, "global_step": 11223, "epoch": 267} {"train_loss": -5.177543640136719, "global_step": 11224, "epoch": 267} {"train_loss": -5.0923027992248535, "global_step": 11225, "epoch": 267} {"train_loss": -4.984072685241699, "global_step": 11226, "epoch": 267} {"train_loss": -5.099045753479004, "global_step": 11227, "epoch": 267} {"train_loss": -4.97114372253418, "global_step": 11228, "epoch": 267} {"train_loss": -5.179842948913574, "global_step": 11229, "epoch": 267} {"train_loss": -4.912899017333984, "global_step": 11230, "epoch": 267} {"train_loss": -5.026789665222168, "global_step": 11231, "epoch": 267} {"train_loss": -4.881782531738281, "global_step": 11232, "epoch": 267} {"train_loss": -4.989164352416992, "global_step": 11233, "epoch": 267} {"train_loss": -5.153031349182129, "global_step": 11234, "epoch": 267} {"train_loss": -4.902701377868652, "global_step": 11235, "epoch": 267} {"train_loss": -5.033969879150391, "global_step": 11236, "epoch": 267} {"train_loss": -4.90286111831665, "global_step": 11237, "epoch": 267} {"train_loss": -5.0427985191345215, "global_step": 11238, "epoch": 267} {"train_loss": -4.8426055908203125, "global_step": 11239, "epoch": 267} {"train_loss": -5.056921005249023, "global_step": 11240, "epoch": 267} {"train_loss": -5.061040878295898, "global_step": 11241, "epoch": 267} {"train_loss": -5.090762138366699, "global_step": 11242, "epoch": 267} {"train_loss": -5.17264461517334, "global_step": 11243, "epoch": 267} {"train_loss": -5.102337837219238, "global_step": 11244, "epoch": 267} {"train_loss": -5.036402702331543, "global_step": 11245, "epoch": 267} {"train_loss": -5.205716133117676, "global_step": 11246, "epoch": 267} {"train_loss": -5.2337117195129395, "global_step": 11247, "epoch": 267} {"train_loss": -4.998037338256836, "global_step": 11248, "epoch": 267} {"train_loss": -4.932380199432373, "global_step": 11249, "epoch": 267} {"train_loss": -4.869990348815918, "global_step": 11250, "epoch": 267} {"train_loss": -5.1181640625, "global_step": 11251, "epoch": 267} {"train_loss": -5.019449234008789, "global_step": 11252, "epoch": 267} {"train_loss": -4.977788925170898, "global_step": 11253, "epoch": 267} {"train_loss": -4.925764083862305, "global_step": 11254, "epoch": 267} {"train_loss": -5.016772031784058, "global_step": 11255, "epoch": 267, "val_loss": 81145.90625} {"train_loss": -4.9715681076049805, "global_step": 11256, "epoch": 268} {"train_loss": -5.119292259216309, "global_step": 11257, "epoch": 268} {"train_loss": -5.227843284606934, "global_step": 11258, "epoch": 268} {"train_loss": -5.020516395568848, "global_step": 11259, "epoch": 268} {"train_loss": -4.910901069641113, "global_step": 11260, "epoch": 268} {"train_loss": -5.217769145965576, "global_step": 11261, "epoch": 268} {"train_loss": -5.060879707336426, "global_step": 11262, "epoch": 268} {"train_loss": -5.099514484405518, "global_step": 11263, "epoch": 268} {"train_loss": -5.11367130279541, "global_step": 11264, "epoch": 268} {"train_loss": -5.144119739532471, "global_step": 11265, "epoch": 268} {"train_loss": -5.095887660980225, "global_step": 11266, "epoch": 268} {"train_loss": -5.081639766693115, "global_step": 11267, "epoch": 268} {"train_loss": -5.093105792999268, "global_step": 11268, "epoch": 268} {"train_loss": -4.99821662902832, "global_step": 11269, "epoch": 268} {"train_loss": -5.011419773101807, "global_step": 11270, "epoch": 268} {"train_loss": -5.15775203704834, "global_step": 11271, "epoch": 268} {"train_loss": -5.05091667175293, "global_step": 11272, "epoch": 268} {"train_loss": -5.046960830688477, "global_step": 11273, "epoch": 268} {"train_loss": -4.967432022094727, "global_step": 11274, "epoch": 268} {"train_loss": -5.081974506378174, "global_step": 11275, "epoch": 268} {"train_loss": -5.142182350158691, "global_step": 11276, "epoch": 268} {"train_loss": -5.06326150894165, "global_step": 11277, "epoch": 268} {"train_loss": -4.989295482635498, "global_step": 11278, "epoch": 268} {"train_loss": -5.023870944976807, "global_step": 11279, "epoch": 268} {"train_loss": -5.183529853820801, "global_step": 11280, "epoch": 268} {"train_loss": -5.090789794921875, "global_step": 11281, "epoch": 268} {"train_loss": -5.0461530685424805, "global_step": 11282, "epoch": 268} {"train_loss": -5.084202289581299, "global_step": 11283, "epoch": 268} {"train_loss": -5.108624458312988, "global_step": 11284, "epoch": 268} {"train_loss": -4.934372425079346, "global_step": 11285, "epoch": 268} {"train_loss": -5.058947563171387, "global_step": 11286, "epoch": 268} {"train_loss": -5.149807929992676, "global_step": 11287, "epoch": 268} {"train_loss": -5.070096969604492, "global_step": 11288, "epoch": 268} {"train_loss": -4.903282642364502, "global_step": 11289, "epoch": 268} {"train_loss": -5.0874528884887695, "global_step": 11290, "epoch": 268} {"train_loss": -5.220730781555176, "global_step": 11291, "epoch": 268} {"train_loss": -5.193347930908203, "global_step": 11292, "epoch": 268} {"train_loss": -5.096609115600586, "global_step": 11293, "epoch": 268} {"train_loss": -5.073090553283691, "global_step": 11294, "epoch": 268} {"train_loss": -5.093834400177002, "global_step": 11295, "epoch": 268} {"train_loss": -5.300469875335693, "global_step": 11296, "epoch": 268} {"train_loss": -5.080298696245466, "global_step": 11297, "epoch": 268, "val_loss": 79789.8046875} {"train_loss": -4.981307506561279, "global_step": 11298, "epoch": 269} {"train_loss": -5.12587833404541, "global_step": 11299, "epoch": 269} {"train_loss": -5.066862106323242, "global_step": 11300, "epoch": 269} {"train_loss": -5.083614349365234, "global_step": 11301, "epoch": 269} {"train_loss": -5.106194019317627, "global_step": 11302, "epoch": 269} {"train_loss": -5.107571601867676, "global_step": 11303, "epoch": 269} {"train_loss": -5.181879997253418, "global_step": 11304, "epoch": 269} {"train_loss": -5.046080589294434, "global_step": 11305, "epoch": 269} {"train_loss": -5.231883525848389, "global_step": 11306, "epoch": 269} {"train_loss": -5.016324043273926, "global_step": 11307, "epoch": 269} {"train_loss": -5.144384384155273, "global_step": 11308, "epoch": 269} {"train_loss": -5.113877296447754, "global_step": 11309, "epoch": 269} {"train_loss": -5.112011432647705, "global_step": 11310, "epoch": 269} {"train_loss": -5.123208999633789, "global_step": 11311, "epoch": 269} {"train_loss": -5.128735065460205, "global_step": 11312, "epoch": 269} {"train_loss": -5.091821193695068, "global_step": 11313, "epoch": 269} {"train_loss": -4.905557155609131, "global_step": 11314, "epoch": 269} {"train_loss": -4.8695387840271, "global_step": 11315, "epoch": 269} {"train_loss": -5.034282684326172, "global_step": 11316, "epoch": 269} {"train_loss": -5.016260147094727, "global_step": 11317, "epoch": 269} {"train_loss": -4.967912197113037, "global_step": 11318, "epoch": 269} {"train_loss": -5.127687454223633, "global_step": 11319, "epoch": 269} {"train_loss": -5.140398979187012, "global_step": 11320, "epoch": 269} {"train_loss": -5.067905426025391, "global_step": 11321, "epoch": 269} {"train_loss": -5.0026140213012695, "global_step": 11322, "epoch": 269} {"train_loss": -4.9782586097717285, "global_step": 11323, "epoch": 269} {"train_loss": -5.000807762145996, "global_step": 11324, "epoch": 269} {"train_loss": -5.188292503356934, "global_step": 11325, "epoch": 269} {"train_loss": -5.108193397521973, "global_step": 11326, "epoch": 269} {"train_loss": -5.020333766937256, "global_step": 11327, "epoch": 269} {"train_loss": -5.074541091918945, "global_step": 11328, "epoch": 269} {"train_loss": -5.148711204528809, "global_step": 11329, "epoch": 269} {"train_loss": -4.876592636108398, "global_step": 11330, "epoch": 269} {"train_loss": -4.854055404663086, "global_step": 11331, "epoch": 269} {"train_loss": -5.0419158935546875, "global_step": 11332, "epoch": 269} {"train_loss": -5.081230163574219, "global_step": 11333, "epoch": 269} {"train_loss": -5.032741546630859, "global_step": 11334, "epoch": 269} {"train_loss": -5.122244834899902, "global_step": 11335, "epoch": 269} {"train_loss": -5.028395175933838, "global_step": 11336, "epoch": 269} {"train_loss": -5.0935516357421875, "global_step": 11337, "epoch": 269} {"train_loss": -5.148157119750977, "global_step": 11338, "epoch": 269} {"train_loss": -5.062627236048381, "global_step": 11339, "epoch": 269, "val_loss": 79545.8046875} {"train_loss": -5.08900260925293, "global_step": 11340, "epoch": 270} {"train_loss": -4.985323905944824, "global_step": 11341, "epoch": 270} {"train_loss": -4.970287799835205, "global_step": 11342, "epoch": 270} {"train_loss": -5.160797595977783, "global_step": 11343, "epoch": 270} {"train_loss": -5.0571794509887695, "global_step": 11344, "epoch": 270} {"train_loss": -5.032871723175049, "global_step": 11345, "epoch": 270} {"train_loss": -5.119483947753906, "global_step": 11346, "epoch": 270} {"train_loss": -5.10523796081543, "global_step": 11347, "epoch": 270} {"train_loss": -5.074191093444824, "global_step": 11348, "epoch": 270} {"train_loss": -5.012487888336182, "global_step": 11349, "epoch": 270} {"train_loss": -5.088762283325195, "global_step": 11350, "epoch": 270} {"train_loss": -5.222806930541992, "global_step": 11351, "epoch": 270} {"train_loss": -5.08310604095459, "global_step": 11352, "epoch": 270} {"train_loss": -4.953714370727539, "global_step": 11353, "epoch": 270} {"train_loss": -5.067690849304199, "global_step": 11354, "epoch": 270} {"train_loss": -5.0617475509643555, "global_step": 11355, "epoch": 270} {"train_loss": -5.223751068115234, "global_step": 11356, "epoch": 270} {"train_loss": -5.047832489013672, "global_step": 11357, "epoch": 270} {"train_loss": -4.949517726898193, "global_step": 11358, "epoch": 270} {"train_loss": -5.069516181945801, "global_step": 11359, "epoch": 270} {"train_loss": -4.957385063171387, "global_step": 11360, "epoch": 270} {"train_loss": -5.109841346740723, "global_step": 11361, "epoch": 270} {"train_loss": -4.887137413024902, "global_step": 11362, "epoch": 270} {"train_loss": -5.198853492736816, "global_step": 11363, "epoch": 270} {"train_loss": -5.046666145324707, "global_step": 11364, "epoch": 270} {"train_loss": -5.105131149291992, "global_step": 11365, "epoch": 270} {"train_loss": -5.058547496795654, "global_step": 11366, "epoch": 270} {"train_loss": -5.305885314941406, "global_step": 11367, "epoch": 270} {"train_loss": -5.178793430328369, "global_step": 11368, "epoch": 270} {"train_loss": -5.035080909729004, "global_step": 11369, "epoch": 270} {"train_loss": -5.16361141204834, "global_step": 11370, "epoch": 270} {"train_loss": -5.220681190490723, "global_step": 11371, "epoch": 270} {"train_loss": -5.138588905334473, "global_step": 11372, "epoch": 270} {"train_loss": -5.063888072967529, "global_step": 11373, "epoch": 270} {"train_loss": -5.189316272735596, "global_step": 11374, "epoch": 270} {"train_loss": -5.148625373840332, "global_step": 11375, "epoch": 270} {"train_loss": -5.087641716003418, "global_step": 11376, "epoch": 270} {"train_loss": -5.260782718658447, "global_step": 11377, "epoch": 270} {"train_loss": -5.129520893096924, "global_step": 11378, "epoch": 270} {"train_loss": -5.062544345855713, "global_step": 11379, "epoch": 270} {"train_loss": -4.91988468170166, "global_step": 11380, "epoch": 270} {"train_loss": -5.088840564092, "global_step": 11381, "epoch": 270, "val_loss": 79935.3046875} {"train_loss": -5.0872955322265625, "global_step": 11382, "epoch": 271} {"train_loss": -5.069605827331543, "global_step": 11383, "epoch": 271} {"train_loss": -5.052984714508057, "global_step": 11384, "epoch": 271} {"train_loss": -5.180032253265381, "global_step": 11385, "epoch": 271} {"train_loss": -5.12163782119751, "global_step": 11386, "epoch": 271} {"train_loss": -5.266622066497803, "global_step": 11387, "epoch": 271} {"train_loss": -5.211699962615967, "global_step": 11388, "epoch": 271} {"train_loss": -4.822505474090576, "global_step": 11389, "epoch": 271} {"train_loss": -5.1149492263793945, "global_step": 11390, "epoch": 271} {"train_loss": -5.112209796905518, "global_step": 11391, "epoch": 271} {"train_loss": -5.141885757446289, "global_step": 11392, "epoch": 271} {"train_loss": -5.054529190063477, "global_step": 11393, "epoch": 271} {"train_loss": -4.914579391479492, "global_step": 11394, "epoch": 271} {"train_loss": -5.122256755828857, "global_step": 11395, "epoch": 271} {"train_loss": -5.1174702644348145, "global_step": 11396, "epoch": 271} {"train_loss": -5.0072784423828125, "global_step": 11397, "epoch": 271} {"train_loss": -4.970941543579102, "global_step": 11398, "epoch": 271} {"train_loss": -5.183011531829834, "global_step": 11399, "epoch": 271} {"train_loss": -5.072713851928711, "global_step": 11400, "epoch": 271} {"train_loss": -5.033909797668457, "global_step": 11401, "epoch": 271} {"train_loss": -5.083629131317139, "global_step": 11402, "epoch": 271} {"train_loss": -5.216937065124512, "global_step": 11403, "epoch": 271} {"train_loss": -5.119322299957275, "global_step": 11404, "epoch": 271} {"train_loss": -5.043827056884766, "global_step": 11405, "epoch": 271} {"train_loss": -4.9573974609375, "global_step": 11406, "epoch": 271} {"train_loss": -5.198272705078125, "global_step": 11407, "epoch": 271} {"train_loss": -5.207637310028076, "global_step": 11408, "epoch": 271} {"train_loss": -5.160341262817383, "global_step": 11409, "epoch": 271} {"train_loss": -5.214136123657227, "global_step": 11410, "epoch": 271} {"train_loss": -5.053645610809326, "global_step": 11411, "epoch": 271} {"train_loss": -5.056399345397949, "global_step": 11412, "epoch": 271} {"train_loss": -4.859035491943359, "global_step": 11413, "epoch": 271} {"train_loss": -5.12380313873291, "global_step": 11414, "epoch": 271} {"train_loss": -4.572948455810547, "global_step": 11415, "epoch": 271} {"train_loss": -4.8445916175842285, "global_step": 11416, "epoch": 271} {"train_loss": -4.481019496917725, "global_step": 11417, "epoch": 271} {"train_loss": -4.437915802001953, "global_step": 11418, "epoch": 271} {"train_loss": -4.774604320526123, "global_step": 11419, "epoch": 271} {"train_loss": -4.63985538482666, "global_step": 11420, "epoch": 271} {"train_loss": -4.730931282043457, "global_step": 11421, "epoch": 271} {"train_loss": -4.8599371910095215, "global_step": 11422, "epoch": 271} {"train_loss": -4.995226178850446, "global_step": 11423, "epoch": 271, "val_loss": 80651.5} {"train_loss": -5.0345611572265625, "global_step": 11424, "epoch": 272} {"train_loss": -4.557405471801758, "global_step": 11425, "epoch": 272} {"train_loss": -4.771265029907227, "global_step": 11426, "epoch": 272} {"train_loss": -4.799644947052002, "global_step": 11427, "epoch": 272} {"train_loss": -4.714155197143555, "global_step": 11428, "epoch": 272} {"train_loss": -5.058710098266602, "global_step": 11429, "epoch": 272} {"train_loss": -4.640531539916992, "global_step": 11430, "epoch": 272} {"train_loss": -4.990168571472168, "global_step": 11431, "epoch": 272} {"train_loss": -4.855297565460205, "global_step": 11432, "epoch": 272} {"train_loss": -4.736517906188965, "global_step": 11433, "epoch": 272} {"train_loss": -4.994501113891602, "global_step": 11434, "epoch": 272} {"train_loss": -4.782776832580566, "global_step": 11435, "epoch": 272} {"train_loss": -4.758210182189941, "global_step": 11436, "epoch": 272} {"train_loss": -4.999458312988281, "global_step": 11437, "epoch": 272} {"train_loss": -4.920563220977783, "global_step": 11438, "epoch": 272} {"train_loss": -4.875669002532959, "global_step": 11439, "epoch": 272} {"train_loss": -5.026290416717529, "global_step": 11440, "epoch": 272} {"train_loss": -4.781745910644531, "global_step": 11441, "epoch": 272} {"train_loss": -5.1076459884643555, "global_step": 11442, "epoch": 272} {"train_loss": -4.96640682220459, "global_step": 11443, "epoch": 272} {"train_loss": -4.979317665100098, "global_step": 11444, "epoch": 272} {"train_loss": -5.0276384353637695, "global_step": 11445, "epoch": 272} {"train_loss": -5.080838680267334, "global_step": 11446, "epoch": 272} {"train_loss": -5.085468769073486, "global_step": 11447, "epoch": 272} {"train_loss": -5.001786231994629, "global_step": 11448, "epoch": 272} {"train_loss": -5.025784015655518, "global_step": 11449, "epoch": 272} {"train_loss": -5.059199333190918, "global_step": 11450, "epoch": 272} {"train_loss": -5.128295421600342, "global_step": 11451, "epoch": 272} {"train_loss": -5.122370719909668, "global_step": 11452, "epoch": 272} {"train_loss": -4.990632057189941, "global_step": 11453, "epoch": 272} {"train_loss": -4.860700607299805, "global_step": 11454, "epoch": 272} {"train_loss": -5.043884754180908, "global_step": 11455, "epoch": 272} {"train_loss": -4.8391008377075195, "global_step": 11456, "epoch": 272} {"train_loss": -5.014039039611816, "global_step": 11457, "epoch": 272} {"train_loss": -5.037107467651367, "global_step": 11458, "epoch": 272} {"train_loss": -5.085431098937988, "global_step": 11459, "epoch": 272} {"train_loss": -5.085483074188232, "global_step": 11460, "epoch": 272} {"train_loss": -5.163623809814453, "global_step": 11461, "epoch": 272} {"train_loss": -5.071787357330322, "global_step": 11462, "epoch": 272} {"train_loss": -5.010523796081543, "global_step": 11463, "epoch": 272} {"train_loss": -5.079979419708252, "global_step": 11464, "epoch": 272} {"train_loss": -4.9574936003912065, "global_step": 11465, "epoch": 272, "val_loss": 79929.125} {"train_loss": -5.0921478271484375, "global_step": 11466, "epoch": 273} {"train_loss": -5.119400978088379, "global_step": 11467, "epoch": 273} {"train_loss": -5.130273818969727, "global_step": 11468, "epoch": 273} {"train_loss": -5.047611236572266, "global_step": 11469, "epoch": 273} {"train_loss": -5.025605201721191, "global_step": 11470, "epoch": 273} {"train_loss": -5.069448471069336, "global_step": 11471, "epoch": 273} {"train_loss": -5.2407331466674805, "global_step": 11472, "epoch": 273} {"train_loss": -5.125243186950684, "global_step": 11473, "epoch": 273} {"train_loss": -5.105666160583496, "global_step": 11474, "epoch": 273} {"train_loss": -5.135904788970947, "global_step": 11475, "epoch": 273} {"train_loss": -5.157382011413574, "global_step": 11476, "epoch": 273} {"train_loss": -5.075295448303223, "global_step": 11477, "epoch": 273} {"train_loss": -5.155697822570801, "global_step": 11478, "epoch": 273} {"train_loss": -5.119043350219727, "global_step": 11479, "epoch": 273} {"train_loss": -5.073809623718262, "global_step": 11480, "epoch": 273} {"train_loss": -5.098836421966553, "global_step": 11481, "epoch": 273} {"train_loss": -5.172189712524414, "global_step": 11482, "epoch": 273} {"train_loss": -5.196254730224609, "global_step": 11483, "epoch": 273} {"train_loss": -5.249550819396973, "global_step": 11484, "epoch": 273} {"train_loss": -5.063606262207031, "global_step": 11485, "epoch": 273} {"train_loss": -5.197643756866455, "global_step": 11486, "epoch": 273} {"train_loss": -5.102315902709961, "global_step": 11487, "epoch": 273} {"train_loss": -5.067665100097656, "global_step": 11488, "epoch": 273} {"train_loss": -5.087162017822266, "global_step": 11489, "epoch": 273} {"train_loss": -5.191771030426025, "global_step": 11490, "epoch": 273} {"train_loss": -5.157621383666992, "global_step": 11491, "epoch": 273} {"train_loss": -5.126002788543701, "global_step": 11492, "epoch": 273} {"train_loss": -5.104864120483398, "global_step": 11493, "epoch": 273} {"train_loss": -5.043622970581055, "global_step": 11494, "epoch": 273} {"train_loss": -5.088191986083984, "global_step": 11495, "epoch": 273} {"train_loss": -5.029349327087402, "global_step": 11496, "epoch": 273} {"train_loss": -5.155841827392578, "global_step": 11497, "epoch": 273} {"train_loss": -5.175661087036133, "global_step": 11498, "epoch": 273} {"train_loss": -4.929523468017578, "global_step": 11499, "epoch": 273} {"train_loss": -4.988324165344238, "global_step": 11500, "epoch": 273} {"train_loss": -5.075108051300049, "global_step": 11501, "epoch": 273} {"train_loss": -4.9340386390686035, "global_step": 11502, "epoch": 273} {"train_loss": -4.897781848907471, "global_step": 11503, "epoch": 273} {"train_loss": -5.003747940063477, "global_step": 11504, "epoch": 273} {"train_loss": -4.8857831954956055, "global_step": 11505, "epoch": 273} {"train_loss": -5.0049824714660645, "global_step": 11506, "epoch": 273} {"train_loss": -5.0886254878271195, "global_step": 11507, "epoch": 273, "val_loss": 81347.0} {"train_loss": -4.9365129470825195, "global_step": 11508, "epoch": 274} {"train_loss": -5.139750003814697, "global_step": 11509, "epoch": 274} {"train_loss": -5.001121997833252, "global_step": 11510, "epoch": 274} {"train_loss": -5.001978874206543, "global_step": 11511, "epoch": 274} {"train_loss": -4.917783737182617, "global_step": 11512, "epoch": 274} {"train_loss": -4.950713157653809, "global_step": 11513, "epoch": 274} {"train_loss": -5.107283592224121, "global_step": 11514, "epoch": 274} {"train_loss": -5.0350518226623535, "global_step": 11515, "epoch": 274} {"train_loss": -4.981726169586182, "global_step": 11516, "epoch": 274} {"train_loss": -5.067876815795898, "global_step": 11517, "epoch": 274} {"train_loss": -5.0764851570129395, "global_step": 11518, "epoch": 274} {"train_loss": -4.974606513977051, "global_step": 11519, "epoch": 274} {"train_loss": -5.0948920249938965, "global_step": 11520, "epoch": 274} {"train_loss": -5.115056991577148, "global_step": 11521, "epoch": 274} {"train_loss": -5.109361171722412, "global_step": 11522, "epoch": 274} {"train_loss": -4.8815083503723145, "global_step": 11523, "epoch": 274} {"train_loss": -5.032115459442139, "global_step": 11524, "epoch": 274} {"train_loss": -5.045039176940918, "global_step": 11525, "epoch": 274} {"train_loss": -5.027026176452637, "global_step": 11526, "epoch": 274} {"train_loss": -5.127712249755859, "global_step": 11527, "epoch": 274} {"train_loss": -5.114989757537842, "global_step": 11528, "epoch": 274} {"train_loss": -5.06113862991333, "global_step": 11529, "epoch": 274} {"train_loss": -5.102293014526367, "global_step": 11530, "epoch": 274} {"train_loss": -5.095338821411133, "global_step": 11531, "epoch": 274} {"train_loss": -5.088831901550293, "global_step": 11532, "epoch": 274} {"train_loss": -4.923616409301758, "global_step": 11533, "epoch": 274} {"train_loss": -5.084643363952637, "global_step": 11534, "epoch": 274} {"train_loss": -4.981991767883301, "global_step": 11535, "epoch": 274} {"train_loss": -5.1105241775512695, "global_step": 11536, "epoch": 274} {"train_loss": -5.147312164306641, "global_step": 11537, "epoch": 274} {"train_loss": -5.133668899536133, "global_step": 11538, "epoch": 274} {"train_loss": -5.086867332458496, "global_step": 11539, "epoch": 274} {"train_loss": -5.096710681915283, "global_step": 11540, "epoch": 274} {"train_loss": -5.020242691040039, "global_step": 11541, "epoch": 274} {"train_loss": -5.100841045379639, "global_step": 11542, "epoch": 274} {"train_loss": -4.966197967529297, "global_step": 11543, "epoch": 274} {"train_loss": -5.156507968902588, "global_step": 11544, "epoch": 274} {"train_loss": -4.965210914611816, "global_step": 11545, "epoch": 274} {"train_loss": -5.107205390930176, "global_step": 11546, "epoch": 274} {"train_loss": -5.05643367767334, "global_step": 11547, "epoch": 274} {"train_loss": -5.08969783782959, "global_step": 11548, "epoch": 274} {"train_loss": -5.050549087070284, "global_step": 11549, "epoch": 274, "val_loss": 79289.7734375} {"train_loss": -4.9900078773498535, "global_step": 11550, "epoch": 275} {"train_loss": -5.057065010070801, "global_step": 11551, "epoch": 275} {"train_loss": -5.123827934265137, "global_step": 11552, "epoch": 275} {"train_loss": -5.238884925842285, "global_step": 11553, "epoch": 275} {"train_loss": -4.951083183288574, "global_step": 11554, "epoch": 275} {"train_loss": -5.087015151977539, "global_step": 11555, "epoch": 275} {"train_loss": -5.073641300201416, "global_step": 11556, "epoch": 275} {"train_loss": -4.934765815734863, "global_step": 11557, "epoch": 275} {"train_loss": -5.189143657684326, "global_step": 11558, "epoch": 275} {"train_loss": -5.149262428283691, "global_step": 11559, "epoch": 275} {"train_loss": -5.113753795623779, "global_step": 11560, "epoch": 275} {"train_loss": -5.098559379577637, "global_step": 11561, "epoch": 275} {"train_loss": -5.242509841918945, "global_step": 11562, "epoch": 275} {"train_loss": -5.165207862854004, "global_step": 11563, "epoch": 275} {"train_loss": -4.879499435424805, "global_step": 11564, "epoch": 275} {"train_loss": -5.015051364898682, "global_step": 11565, "epoch": 275} {"train_loss": -5.195172309875488, "global_step": 11566, "epoch": 275} {"train_loss": -5.017271995544434, "global_step": 11567, "epoch": 275} {"train_loss": -4.9446330070495605, "global_step": 11568, "epoch": 275} {"train_loss": -5.089296340942383, "global_step": 11569, "epoch": 275} {"train_loss": -5.163178443908691, "global_step": 11570, "epoch": 275} {"train_loss": -5.019918441772461, "global_step": 11571, "epoch": 275} {"train_loss": -4.974851608276367, "global_step": 11572, "epoch": 275} {"train_loss": -5.036682605743408, "global_step": 11573, "epoch": 275} {"train_loss": -5.002946376800537, "global_step": 11574, "epoch": 275} {"train_loss": -5.091608047485352, "global_step": 11575, "epoch": 275} {"train_loss": -5.060752868652344, "global_step": 11576, "epoch": 275} {"train_loss": -5.093863487243652, "global_step": 11577, "epoch": 275} {"train_loss": -4.90115213394165, "global_step": 11578, "epoch": 275} {"train_loss": -5.217967510223389, "global_step": 11579, "epoch": 275} {"train_loss": -5.109716892242432, "global_step": 11580, "epoch": 275} {"train_loss": -5.006409645080566, "global_step": 11581, "epoch": 275} {"train_loss": -5.095486640930176, "global_step": 11582, "epoch": 275} {"train_loss": -5.249831199645996, "global_step": 11583, "epoch": 275} {"train_loss": -5.134992599487305, "global_step": 11584, "epoch": 275} {"train_loss": -5.0748372077941895, "global_step": 11585, "epoch": 275} {"train_loss": -5.047747611999512, "global_step": 11586, "epoch": 275} {"train_loss": -5.018438339233398, "global_step": 11587, "epoch": 275} {"train_loss": -5.201467514038086, "global_step": 11588, "epoch": 275} {"train_loss": -5.118183135986328, "global_step": 11589, "epoch": 275} {"train_loss": -5.149908065795898, "global_step": 11590, "epoch": 275} {"train_loss": -5.080930709838867, "global_step": 11591, "epoch": 275, "val_loss": 80197.6953125} {"train_loss": -5.146997928619385, "global_step": 11592, "epoch": 276} {"train_loss": -5.10047721862793, "global_step": 11593, "epoch": 276} {"train_loss": -5.098044395446777, "global_step": 11594, "epoch": 276} {"train_loss": -5.086197853088379, "global_step": 11595, "epoch": 276} {"train_loss": -4.952670574188232, "global_step": 11596, "epoch": 276} {"train_loss": -5.104706764221191, "global_step": 11597, "epoch": 276} {"train_loss": -5.288619041442871, "global_step": 11598, "epoch": 276} {"train_loss": -5.18269157409668, "global_step": 11599, "epoch": 276} {"train_loss": -5.1702880859375, "global_step": 11600, "epoch": 276} {"train_loss": -5.179089546203613, "global_step": 11601, "epoch": 276} {"train_loss": -5.163803577423096, "global_step": 11602, "epoch": 276} {"train_loss": -4.991673469543457, "global_step": 11603, "epoch": 276} {"train_loss": -5.0501389503479, "global_step": 11604, "epoch": 276} {"train_loss": -5.162249565124512, "global_step": 11605, "epoch": 276} {"train_loss": -4.822934150695801, "global_step": 11606, "epoch": 276} {"train_loss": -4.821743965148926, "global_step": 11607, "epoch": 276} {"train_loss": -5.006488800048828, "global_step": 11608, "epoch": 276} {"train_loss": -4.915549278259277, "global_step": 11609, "epoch": 276} {"train_loss": -4.688708782196045, "global_step": 11610, "epoch": 276} {"train_loss": -5.005014419555664, "global_step": 11611, "epoch": 276} {"train_loss": -4.829282760620117, "global_step": 11612, "epoch": 276} {"train_loss": -4.933706283569336, "global_step": 11613, "epoch": 276} {"train_loss": -4.797275543212891, "global_step": 11614, "epoch": 276} {"train_loss": -4.8866472244262695, "global_step": 11615, "epoch": 276} {"train_loss": -5.01680850982666, "global_step": 11616, "epoch": 276} {"train_loss": -4.782609462738037, "global_step": 11617, "epoch": 276} {"train_loss": -5.07598876953125, "global_step": 11618, "epoch": 276} {"train_loss": -4.818535804748535, "global_step": 11619, "epoch": 276} {"train_loss": -4.919293403625488, "global_step": 11620, "epoch": 276} {"train_loss": -5.042574882507324, "global_step": 11621, "epoch": 276} {"train_loss": -5.015191555023193, "global_step": 11622, "epoch": 276} {"train_loss": -5.185266017913818, "global_step": 11623, "epoch": 276} {"train_loss": -4.969204902648926, "global_step": 11624, "epoch": 276} {"train_loss": -5.033815860748291, "global_step": 11625, "epoch": 276} {"train_loss": -4.987909317016602, "global_step": 11626, "epoch": 276} {"train_loss": -5.075448513031006, "global_step": 11627, "epoch": 276} {"train_loss": -5.059351444244385, "global_step": 11628, "epoch": 276} {"train_loss": -5.108344554901123, "global_step": 11629, "epoch": 276} {"train_loss": -4.983335018157959, "global_step": 11630, "epoch": 276} {"train_loss": -4.945926666259766, "global_step": 11631, "epoch": 276} {"train_loss": -5.133044242858887, "global_step": 11632, "epoch": 276} {"train_loss": -5.012666974748884, "global_step": 11633, "epoch": 276, "val_loss": 80043.3203125} {"train_loss": -5.090766906738281, "global_step": 11634, "epoch": 277} {"train_loss": -5.062438488006592, "global_step": 11635, "epoch": 277} {"train_loss": -5.122995853424072, "global_step": 11636, "epoch": 277} {"train_loss": -4.83880615234375, "global_step": 11637, "epoch": 277} {"train_loss": -5.1294403076171875, "global_step": 11638, "epoch": 277} {"train_loss": -4.956507205963135, "global_step": 11639, "epoch": 277} {"train_loss": -5.237339019775391, "global_step": 11640, "epoch": 277} {"train_loss": -5.169565200805664, "global_step": 11641, "epoch": 277} {"train_loss": -5.170949459075928, "global_step": 11642, "epoch": 277} {"train_loss": -5.0967583656311035, "global_step": 11643, "epoch": 277} {"train_loss": -5.057616710662842, "global_step": 11644, "epoch": 277} {"train_loss": -5.160717010498047, "global_step": 11645, "epoch": 277} {"train_loss": -4.94859504699707, "global_step": 11646, "epoch": 277} {"train_loss": -5.036818027496338, "global_step": 11647, "epoch": 277} {"train_loss": -5.1096577644348145, "global_step": 11648, "epoch": 277} {"train_loss": -5.178128719329834, "global_step": 11649, "epoch": 277} {"train_loss": -4.984676361083984, "global_step": 11650, "epoch": 277} {"train_loss": -5.187236785888672, "global_step": 11651, "epoch": 277} {"train_loss": -5.212320327758789, "global_step": 11652, "epoch": 277} {"train_loss": -5.228762626647949, "global_step": 11653, "epoch": 277} {"train_loss": -5.17490291595459, "global_step": 11654, "epoch": 277} {"train_loss": -5.119359493255615, "global_step": 11655, "epoch": 277} {"train_loss": -4.9390716552734375, "global_step": 11656, "epoch": 277} {"train_loss": -5.195256233215332, "global_step": 11657, "epoch": 277} {"train_loss": -5.053994178771973, "global_step": 11658, "epoch": 277} {"train_loss": -4.758611679077148, "global_step": 11659, "epoch": 277} {"train_loss": -4.979487419128418, "global_step": 11660, "epoch": 277} {"train_loss": -4.846053123474121, "global_step": 11661, "epoch": 277} {"train_loss": -4.970288276672363, "global_step": 11662, "epoch": 277} {"train_loss": -4.76771354675293, "global_step": 11663, "epoch": 277} {"train_loss": -4.987390518188477, "global_step": 11664, "epoch": 277} {"train_loss": -4.910057067871094, "global_step": 11665, "epoch": 277} {"train_loss": -4.900293827056885, "global_step": 11666, "epoch": 277} {"train_loss": -5.027630805969238, "global_step": 11667, "epoch": 277} {"train_loss": -5.097896099090576, "global_step": 11668, "epoch": 277} {"train_loss": -4.97614860534668, "global_step": 11669, "epoch": 277} {"train_loss": -5.08428955078125, "global_step": 11670, "epoch": 277} {"train_loss": -4.99990177154541, "global_step": 11671, "epoch": 277} {"train_loss": -4.897270679473877, "global_step": 11672, "epoch": 277} {"train_loss": -4.970154762268066, "global_step": 11673, "epoch": 277} {"train_loss": -5.094165325164795, "global_step": 11674, "epoch": 277} {"train_loss": -5.044351668584914, "global_step": 11675, "epoch": 277, "val_loss": 79693.0} {"train_loss": -5.079010009765625, "global_step": 11676, "epoch": 278} {"train_loss": -5.116055488586426, "global_step": 11677, "epoch": 278} {"train_loss": -5.0434088706970215, "global_step": 11678, "epoch": 278} {"train_loss": -5.155450344085693, "global_step": 11679, "epoch": 278} {"train_loss": -5.156645774841309, "global_step": 11680, "epoch": 278} {"train_loss": -4.99186372756958, "global_step": 11681, "epoch": 278} {"train_loss": -5.001157760620117, "global_step": 11682, "epoch": 278} {"train_loss": -5.139211654663086, "global_step": 11683, "epoch": 278} {"train_loss": -5.130970001220703, "global_step": 11684, "epoch": 278} {"train_loss": -5.104915142059326, "global_step": 11685, "epoch": 278} {"train_loss": -5.095169544219971, "global_step": 11686, "epoch": 278} {"train_loss": -5.217623710632324, "global_step": 11687, "epoch": 278} {"train_loss": -5.085036277770996, "global_step": 11688, "epoch": 278} {"train_loss": -5.189515113830566, "global_step": 11689, "epoch": 278} {"train_loss": -4.9698805809021, "global_step": 11690, "epoch": 278} {"train_loss": -5.063965320587158, "global_step": 11691, "epoch": 278} {"train_loss": -5.168374538421631, "global_step": 11692, "epoch": 278} {"train_loss": -5.00884485244751, "global_step": 11693, "epoch": 278} {"train_loss": -5.068243026733398, "global_step": 11694, "epoch": 278} {"train_loss": -5.049252510070801, "global_step": 11695, "epoch": 278} {"train_loss": -5.035458087921143, "global_step": 11696, "epoch": 278} {"train_loss": -5.176661491394043, "global_step": 11697, "epoch": 278} {"train_loss": -4.981526851654053, "global_step": 11698, "epoch": 278} {"train_loss": -4.896421432495117, "global_step": 11699, "epoch": 278} {"train_loss": -4.939859390258789, "global_step": 11700, "epoch": 278} {"train_loss": -4.958520889282227, "global_step": 11701, "epoch": 278} {"train_loss": -5.027413368225098, "global_step": 11702, "epoch": 278} {"train_loss": -4.993295669555664, "global_step": 11703, "epoch": 278} {"train_loss": -5.09408712387085, "global_step": 11704, "epoch": 278} {"train_loss": -5.12529182434082, "global_step": 11705, "epoch": 278} {"train_loss": -5.076076507568359, "global_step": 11706, "epoch": 278} {"train_loss": -5.139720916748047, "global_step": 11707, "epoch": 278} {"train_loss": -5.062166213989258, "global_step": 11708, "epoch": 278} {"train_loss": -5.126609802246094, "global_step": 11709, "epoch": 278} {"train_loss": -4.972216606140137, "global_step": 11710, "epoch": 278} {"train_loss": -5.007258415222168, "global_step": 11711, "epoch": 278} {"train_loss": -5.059209823608398, "global_step": 11712, "epoch": 278} {"train_loss": -4.989933967590332, "global_step": 11713, "epoch": 278} {"train_loss": -4.977085113525391, "global_step": 11714, "epoch": 278} {"train_loss": -5.144650459289551, "global_step": 11715, "epoch": 278} {"train_loss": -4.9136762619018555, "global_step": 11716, "epoch": 278} {"train_loss": -5.062558843975975, "global_step": 11717, "epoch": 278, "val_loss": 80891.6328125} {"train_loss": -5.003354072570801, "global_step": 11718, "epoch": 279} {"train_loss": -5.027843475341797, "global_step": 11719, "epoch": 279} {"train_loss": -5.162097930908203, "global_step": 11720, "epoch": 279} {"train_loss": -5.13275146484375, "global_step": 11721, "epoch": 279} {"train_loss": -5.0856499671936035, "global_step": 11722, "epoch": 279} {"train_loss": -4.980636119842529, "global_step": 11723, "epoch": 279} {"train_loss": -5.294787883758545, "global_step": 11724, "epoch": 279} {"train_loss": -5.056396484375, "global_step": 11725, "epoch": 279} {"train_loss": -5.180030822753906, "global_step": 11726, "epoch": 279} {"train_loss": -5.0612287521362305, "global_step": 11727, "epoch": 279} {"train_loss": -5.175470352172852, "global_step": 11728, "epoch": 279} {"train_loss": -5.140324592590332, "global_step": 11729, "epoch": 279} {"train_loss": -5.135122299194336, "global_step": 11730, "epoch": 279} {"train_loss": -4.964237213134766, "global_step": 11731, "epoch": 279} {"train_loss": -5.022686004638672, "global_step": 11732, "epoch": 279} {"train_loss": -5.13359260559082, "global_step": 11733, "epoch": 279} {"train_loss": -5.035311698913574, "global_step": 11734, "epoch": 279} {"train_loss": -5.168725967407227, "global_step": 11735, "epoch": 279} {"train_loss": -5.058278560638428, "global_step": 11736, "epoch": 279} {"train_loss": -5.204988479614258, "global_step": 11737, "epoch": 279} {"train_loss": -5.154941082000732, "global_step": 11738, "epoch": 279} {"train_loss": -5.198420524597168, "global_step": 11739, "epoch": 279} {"train_loss": -5.159040451049805, "global_step": 11740, "epoch": 279} {"train_loss": -4.933777809143066, "global_step": 11741, "epoch": 279} {"train_loss": -4.99770450592041, "global_step": 11742, "epoch": 279} {"train_loss": -5.096537113189697, "global_step": 11743, "epoch": 279} {"train_loss": -5.096312046051025, "global_step": 11744, "epoch": 279} {"train_loss": -5.039644241333008, "global_step": 11745, "epoch": 279} {"train_loss": -5.043753623962402, "global_step": 11746, "epoch": 279} {"train_loss": -5.0082597732543945, "global_step": 11747, "epoch": 279} {"train_loss": -5.152775764465332, "global_step": 11748, "epoch": 279} {"train_loss": -5.016786098480225, "global_step": 11749, "epoch": 279} {"train_loss": -5.0692009925842285, "global_step": 11750, "epoch": 279} {"train_loss": -5.111661434173584, "global_step": 11751, "epoch": 279} {"train_loss": -5.045751571655273, "global_step": 11752, "epoch": 279} {"train_loss": -5.072803497314453, "global_step": 11753, "epoch": 279} {"train_loss": -5.047483444213867, "global_step": 11754, "epoch": 279} {"train_loss": -5.187411308288574, "global_step": 11755, "epoch": 279} {"train_loss": -5.034421443939209, "global_step": 11756, "epoch": 279} {"train_loss": -5.050383567810059, "global_step": 11757, "epoch": 279} {"train_loss": -5.066969394683838, "global_step": 11758, "epoch": 279} {"train_loss": -5.087211574826922, "global_step": 11759, "epoch": 279, "val_loss": 80405.2890625} {"train_loss": -4.969086647033691, "global_step": 11760, "epoch": 280} {"train_loss": -5.026446342468262, "global_step": 11761, "epoch": 280} {"train_loss": -4.971771240234375, "global_step": 11762, "epoch": 280} {"train_loss": -5.102114677429199, "global_step": 11763, "epoch": 280} {"train_loss": -4.923303127288818, "global_step": 11764, "epoch": 280} {"train_loss": -4.946821689605713, "global_step": 11765, "epoch": 280} {"train_loss": -4.797904968261719, "global_step": 11766, "epoch": 280} {"train_loss": -5.073504447937012, "global_step": 11767, "epoch": 280} {"train_loss": -4.844018936157227, "global_step": 11768, "epoch": 280} {"train_loss": -4.9974365234375, "global_step": 11769, "epoch": 280} {"train_loss": -5.148022651672363, "global_step": 11770, "epoch": 280} {"train_loss": -4.973357200622559, "global_step": 11771, "epoch": 280} {"train_loss": -5.13808012008667, "global_step": 11772, "epoch": 280} {"train_loss": -5.126930236816406, "global_step": 11773, "epoch": 280} {"train_loss": -5.115926742553711, "global_step": 11774, "epoch": 280} {"train_loss": -5.198293685913086, "global_step": 11775, "epoch": 280} {"train_loss": -4.978768348693848, "global_step": 11776, "epoch": 280} {"train_loss": -4.952056407928467, "global_step": 11777, "epoch": 280} {"train_loss": -5.1453962326049805, "global_step": 11778, "epoch": 280} {"train_loss": -5.046979904174805, "global_step": 11779, "epoch": 280} {"train_loss": -5.1137518882751465, "global_step": 11780, "epoch": 280} {"train_loss": -5.062250137329102, "global_step": 11781, "epoch": 280} {"train_loss": -5.0715837478637695, "global_step": 11782, "epoch": 280} {"train_loss": -5.216925621032715, "global_step": 11783, "epoch": 280} {"train_loss": -5.101155757904053, "global_step": 11784, "epoch": 280} {"train_loss": -4.941025733947754, "global_step": 11785, "epoch": 280} {"train_loss": -5.150795936584473, "global_step": 11786, "epoch": 280} {"train_loss": -5.110772609710693, "global_step": 11787, "epoch": 280} {"train_loss": -5.134549140930176, "global_step": 11788, "epoch": 280} {"train_loss": -5.026968955993652, "global_step": 11789, "epoch": 280} {"train_loss": -5.006744384765625, "global_step": 11790, "epoch": 280} {"train_loss": -5.095196723937988, "global_step": 11791, "epoch": 280} {"train_loss": -5.058350563049316, "global_step": 11792, "epoch": 280} {"train_loss": -5.158825874328613, "global_step": 11793, "epoch": 280} {"train_loss": -5.1106038093566895, "global_step": 11794, "epoch": 280} {"train_loss": -5.029136657714844, "global_step": 11795, "epoch": 280} {"train_loss": -5.1530609130859375, "global_step": 11796, "epoch": 280} {"train_loss": -5.179017543792725, "global_step": 11797, "epoch": 280} {"train_loss": -5.178655624389648, "global_step": 11798, "epoch": 280} {"train_loss": -5.104825019836426, "global_step": 11799, "epoch": 280} {"train_loss": -5.176926136016846, "global_step": 11800, "epoch": 280} {"train_loss": -5.066941772188459, "global_step": 11801, "epoch": 280, "val_loss": 79212.2734375} {"train_loss": -5.1263251304626465, "global_step": 11802, "epoch": 281} {"train_loss": -4.966670036315918, "global_step": 11803, "epoch": 281} {"train_loss": -5.104278564453125, "global_step": 11804, "epoch": 281} {"train_loss": -5.078896522521973, "global_step": 11805, "epoch": 281} {"train_loss": -5.1516313552856445, "global_step": 11806, "epoch": 281} {"train_loss": -5.056110382080078, "global_step": 11807, "epoch": 281} {"train_loss": -5.184548377990723, "global_step": 11808, "epoch": 281} {"train_loss": -5.139442443847656, "global_step": 11809, "epoch": 281} {"train_loss": -5.064305305480957, "global_step": 11810, "epoch": 281} {"train_loss": -4.956846237182617, "global_step": 11811, "epoch": 281} {"train_loss": -5.179632663726807, "global_step": 11812, "epoch": 281} {"train_loss": -5.129601001739502, "global_step": 11813, "epoch": 281} {"train_loss": -4.972473621368408, "global_step": 11814, "epoch": 281} {"train_loss": -5.084029197692871, "global_step": 11815, "epoch": 281} {"train_loss": -5.078991889953613, "global_step": 11816, "epoch": 281} {"train_loss": -5.025600433349609, "global_step": 11817, "epoch": 281} {"train_loss": -5.012887477874756, "global_step": 11818, "epoch": 281} {"train_loss": -4.922357082366943, "global_step": 11819, "epoch": 281} {"train_loss": -5.0678911209106445, "global_step": 11820, "epoch": 281} {"train_loss": -5.143432140350342, "global_step": 11821, "epoch": 281} {"train_loss": -5.0933990478515625, "global_step": 11822, "epoch": 281} {"train_loss": -5.09404182434082, "global_step": 11823, "epoch": 281} {"train_loss": -5.1170172691345215, "global_step": 11824, "epoch": 281} {"train_loss": -4.963130950927734, "global_step": 11825, "epoch": 281} {"train_loss": -4.982418060302734, "global_step": 11826, "epoch": 281} {"train_loss": -5.069558620452881, "global_step": 11827, "epoch": 281} {"train_loss": -5.174318313598633, "global_step": 11828, "epoch": 281} {"train_loss": -5.049094200134277, "global_step": 11829, "epoch": 281} {"train_loss": -5.00075626373291, "global_step": 11830, "epoch": 281} {"train_loss": -5.241724967956543, "global_step": 11831, "epoch": 281} {"train_loss": -5.052416801452637, "global_step": 11832, "epoch": 281} {"train_loss": -5.0517072677612305, "global_step": 11833, "epoch": 281} {"train_loss": -5.056126594543457, "global_step": 11834, "epoch": 281} {"train_loss": -5.012609481811523, "global_step": 11835, "epoch": 281} {"train_loss": -5.067529201507568, "global_step": 11836, "epoch": 281} {"train_loss": -5.161648750305176, "global_step": 11837, "epoch": 281} {"train_loss": -5.158225059509277, "global_step": 11838, "epoch": 281} {"train_loss": -5.176115036010742, "global_step": 11839, "epoch": 281} {"train_loss": -5.13093376159668, "global_step": 11840, "epoch": 281} {"train_loss": -5.211659908294678, "global_step": 11841, "epoch": 281} {"train_loss": -5.149834632873535, "global_step": 11842, "epoch": 281} {"train_loss": -5.083496218635922, "global_step": 11843, "epoch": 281, "val_loss": 79967.3125} {"train_loss": -4.842072486877441, "global_step": 11844, "epoch": 282} {"train_loss": -4.978227138519287, "global_step": 11845, "epoch": 282} {"train_loss": -4.900872230529785, "global_step": 11846, "epoch": 282} {"train_loss": -5.13487434387207, "global_step": 11847, "epoch": 282} {"train_loss": -5.066714763641357, "global_step": 11848, "epoch": 282} {"train_loss": -4.954768180847168, "global_step": 11849, "epoch": 282} {"train_loss": -4.909137725830078, "global_step": 11850, "epoch": 282} {"train_loss": -4.995630264282227, "global_step": 11851, "epoch": 282} {"train_loss": -5.094968318939209, "global_step": 11852, "epoch": 282} {"train_loss": -5.146563529968262, "global_step": 11853, "epoch": 282} {"train_loss": -5.106876373291016, "global_step": 11854, "epoch": 282} {"train_loss": -5.204253196716309, "global_step": 11855, "epoch": 282} {"train_loss": -5.077583312988281, "global_step": 11856, "epoch": 282} {"train_loss": -5.041510581970215, "global_step": 11857, "epoch": 282} {"train_loss": -5.047145843505859, "global_step": 11858, "epoch": 282} {"train_loss": -5.092687606811523, "global_step": 11859, "epoch": 282} {"train_loss": -5.1359405517578125, "global_step": 11860, "epoch": 282} {"train_loss": -4.982763290405273, "global_step": 11861, "epoch": 282} {"train_loss": -5.066854476928711, "global_step": 11862, "epoch": 282} {"train_loss": -5.077438831329346, "global_step": 11863, "epoch": 282} {"train_loss": -5.184504508972168, "global_step": 11864, "epoch": 282} {"train_loss": -5.0299906730651855, "global_step": 11865, "epoch": 282} {"train_loss": -4.997345447540283, "global_step": 11866, "epoch": 282} {"train_loss": -5.1154961585998535, "global_step": 11867, "epoch": 282} {"train_loss": -5.031961441040039, "global_step": 11868, "epoch": 282} {"train_loss": -4.994599342346191, "global_step": 11869, "epoch": 282} {"train_loss": -5.08201789855957, "global_step": 11870, "epoch": 282} {"train_loss": -5.019362449645996, "global_step": 11871, "epoch": 282} {"train_loss": -5.230053901672363, "global_step": 11872, "epoch": 282} {"train_loss": -5.096899032592773, "global_step": 11873, "epoch": 282} {"train_loss": -5.1521830558776855, "global_step": 11874, "epoch": 282} {"train_loss": -5.075389385223389, "global_step": 11875, "epoch": 282} {"train_loss": -5.127570152282715, "global_step": 11876, "epoch": 282} {"train_loss": -5.151790618896484, "global_step": 11877, "epoch": 282} {"train_loss": -5.13698673248291, "global_step": 11878, "epoch": 282} {"train_loss": -5.054213523864746, "global_step": 11879, "epoch": 282} {"train_loss": -5.0759806632995605, "global_step": 11880, "epoch": 282} {"train_loss": -5.136654853820801, "global_step": 11881, "epoch": 282} {"train_loss": -5.099300861358643, "global_step": 11882, "epoch": 282} {"train_loss": -4.971025466918945, "global_step": 11883, "epoch": 282} {"train_loss": -5.261374473571777, "global_step": 11884, "epoch": 282} {"train_loss": -5.067649296351841, "global_step": 11885, "epoch": 282, "val_loss": 79824.59375} {"train_loss": -5.184258460998535, "global_step": 11886, "epoch": 283} {"train_loss": -5.069930076599121, "global_step": 11887, "epoch": 283} {"train_loss": -5.06546688079834, "global_step": 11888, "epoch": 283} {"train_loss": -5.228586196899414, "global_step": 11889, "epoch": 283} {"train_loss": -5.128433704376221, "global_step": 11890, "epoch": 283} {"train_loss": -5.045082092285156, "global_step": 11891, "epoch": 283} {"train_loss": -4.953932762145996, "global_step": 11892, "epoch": 283} {"train_loss": -4.846334457397461, "global_step": 11893, "epoch": 283} {"train_loss": -4.932495594024658, "global_step": 11894, "epoch": 283} {"train_loss": -5.120411396026611, "global_step": 11895, "epoch": 283} {"train_loss": -4.972542762756348, "global_step": 11896, "epoch": 283} {"train_loss": -5.092357635498047, "global_step": 11897, "epoch": 283} {"train_loss": -5.068243980407715, "global_step": 11898, "epoch": 283} {"train_loss": -5.005947589874268, "global_step": 11899, "epoch": 283} {"train_loss": -4.938745498657227, "global_step": 11900, "epoch": 283} {"train_loss": -5.051098346710205, "global_step": 11901, "epoch": 283} {"train_loss": -5.127647876739502, "global_step": 11902, "epoch": 283} {"train_loss": -5.006467342376709, "global_step": 11903, "epoch": 283} {"train_loss": -4.9749755859375, "global_step": 11904, "epoch": 283} {"train_loss": -5.117282390594482, "global_step": 11905, "epoch": 283} {"train_loss": -5.071943283081055, "global_step": 11906, "epoch": 283} {"train_loss": -5.210192680358887, "global_step": 11907, "epoch": 283} {"train_loss": -5.0985493659973145, "global_step": 11908, "epoch": 283} {"train_loss": -5.063946723937988, "global_step": 11909, "epoch": 283} {"train_loss": -5.04982852935791, "global_step": 11910, "epoch": 283} {"train_loss": -5.152454376220703, "global_step": 11911, "epoch": 283} {"train_loss": -5.008012771606445, "global_step": 11912, "epoch": 283} {"train_loss": -4.992286682128906, "global_step": 11913, "epoch": 283} {"train_loss": -5.060450553894043, "global_step": 11914, "epoch": 283} {"train_loss": -5.0191874504089355, "global_step": 11915, "epoch": 283} {"train_loss": -5.093562126159668, "global_step": 11916, "epoch": 283} {"train_loss": -5.056005477905273, "global_step": 11917, "epoch": 283} {"train_loss": -5.114609241485596, "global_step": 11918, "epoch": 283} {"train_loss": -5.135128498077393, "global_step": 11919, "epoch": 283} {"train_loss": -5.138457775115967, "global_step": 11920, "epoch": 283} {"train_loss": -5.04664421081543, "global_step": 11921, "epoch": 283} {"train_loss": -4.973026275634766, "global_step": 11922, "epoch": 283} {"train_loss": -5.067212104797363, "global_step": 11923, "epoch": 283} {"train_loss": -5.134427070617676, "global_step": 11924, "epoch": 283} {"train_loss": -5.048551559448242, "global_step": 11925, "epoch": 283} {"train_loss": -5.053665637969971, "global_step": 11926, "epoch": 283} {"train_loss": -5.063220818837483, "global_step": 11927, "epoch": 283, "val_loss": 79637.4609375} {"train_loss": -5.141379356384277, "global_step": 11928, "epoch": 284} {"train_loss": -5.153384208679199, "global_step": 11929, "epoch": 284} {"train_loss": -5.127586364746094, "global_step": 11930, "epoch": 284} {"train_loss": -4.988490104675293, "global_step": 11931, "epoch": 284} {"train_loss": -5.1497063636779785, "global_step": 11932, "epoch": 284} {"train_loss": -5.230263710021973, "global_step": 11933, "epoch": 284} {"train_loss": -5.070647239685059, "global_step": 11934, "epoch": 284} {"train_loss": -4.994548320770264, "global_step": 11935, "epoch": 284} {"train_loss": -5.172418117523193, "global_step": 11936, "epoch": 284} {"train_loss": -5.020449638366699, "global_step": 11937, "epoch": 284} {"train_loss": -5.112715721130371, "global_step": 11938, "epoch": 284} {"train_loss": -4.9343180656433105, "global_step": 11939, "epoch": 284} {"train_loss": -4.976200103759766, "global_step": 11940, "epoch": 284} {"train_loss": -5.23340368270874, "global_step": 11941, "epoch": 284} {"train_loss": -5.0603227615356445, "global_step": 11942, "epoch": 284} {"train_loss": -5.168073654174805, "global_step": 11943, "epoch": 284} {"train_loss": -5.033547401428223, "global_step": 11944, "epoch": 284} {"train_loss": -5.0200676918029785, "global_step": 11945, "epoch": 284} {"train_loss": -5.028644561767578, "global_step": 11946, "epoch": 284} {"train_loss": -5.125592231750488, "global_step": 11947, "epoch": 284} {"train_loss": -4.768426895141602, "global_step": 11948, "epoch": 284} {"train_loss": -5.159974098205566, "global_step": 11949, "epoch": 284} {"train_loss": -4.842985153198242, "global_step": 11950, "epoch": 284} {"train_loss": -4.978367805480957, "global_step": 11951, "epoch": 284} {"train_loss": -4.925417900085449, "global_step": 11952, "epoch": 284} {"train_loss": -4.917790412902832, "global_step": 11953, "epoch": 284} {"train_loss": -5.102180480957031, "global_step": 11954, "epoch": 284} {"train_loss": -4.995749473571777, "global_step": 11955, "epoch": 284} {"train_loss": -4.985167503356934, "global_step": 11956, "epoch": 284} {"train_loss": -5.229452133178711, "global_step": 11957, "epoch": 284} {"train_loss": -4.855073928833008, "global_step": 11958, "epoch": 284} {"train_loss": -4.991014003753662, "global_step": 11959, "epoch": 284} {"train_loss": -4.699968338012695, "global_step": 11960, "epoch": 284} {"train_loss": -5.099813938140869, "global_step": 11961, "epoch": 284} {"train_loss": -4.917274475097656, "global_step": 11962, "epoch": 284} {"train_loss": -4.842362403869629, "global_step": 11963, "epoch": 284} {"train_loss": -4.882726669311523, "global_step": 11964, "epoch": 284} {"train_loss": -5.105487823486328, "global_step": 11965, "epoch": 284} {"train_loss": -4.780156135559082, "global_step": 11966, "epoch": 284} {"train_loss": -5.127815246582031, "global_step": 11967, "epoch": 284} {"train_loss": -4.890993595123291, "global_step": 11968, "epoch": 284} {"train_loss": -5.019139392035348, "global_step": 11969, "epoch": 284, "val_loss": 81059.78125} {"train_loss": -4.915494918823242, "global_step": 11970, "epoch": 285} {"train_loss": -5.125837326049805, "global_step": 11971, "epoch": 285} {"train_loss": -5.076679229736328, "global_step": 11972, "epoch": 285} {"train_loss": -5.128851890563965, "global_step": 11973, "epoch": 285} {"train_loss": -5.065042972564697, "global_step": 11974, "epoch": 285} {"train_loss": -5.008724212646484, "global_step": 11975, "epoch": 285} {"train_loss": -5.11272668838501, "global_step": 11976, "epoch": 285} {"train_loss": -5.213696479797363, "global_step": 11977, "epoch": 285} {"train_loss": -4.928114891052246, "global_step": 11978, "epoch": 285} {"train_loss": -5.273951530456543, "global_step": 11979, "epoch": 285} {"train_loss": -5.091107368469238, "global_step": 11980, "epoch": 285} {"train_loss": -5.219599723815918, "global_step": 11981, "epoch": 285} {"train_loss": -5.089347839355469, "global_step": 11982, "epoch": 285} {"train_loss": -5.249331474304199, "global_step": 11983, "epoch": 285} {"train_loss": -4.930961608886719, "global_step": 11984, "epoch": 285} {"train_loss": -5.066998481750488, "global_step": 11985, "epoch": 285} {"train_loss": -5.205143928527832, "global_step": 11986, "epoch": 285} {"train_loss": -4.9993367195129395, "global_step": 11987, "epoch": 285} {"train_loss": -5.088369369506836, "global_step": 11988, "epoch": 285} {"train_loss": -5.082269191741943, "global_step": 11989, "epoch": 285} {"train_loss": -5.021053791046143, "global_step": 11990, "epoch": 285} {"train_loss": -5.011514186859131, "global_step": 11991, "epoch": 285} {"train_loss": -5.192595958709717, "global_step": 11992, "epoch": 285} {"train_loss": -4.854476451873779, "global_step": 11993, "epoch": 285} {"train_loss": -5.175539493560791, "global_step": 11994, "epoch": 285} {"train_loss": -5.307889938354492, "global_step": 11995, "epoch": 285} {"train_loss": -5.195457935333252, "global_step": 11996, "epoch": 285} {"train_loss": -4.978499412536621, "global_step": 11997, "epoch": 285} {"train_loss": -5.129240989685059, "global_step": 11998, "epoch": 285} {"train_loss": -5.059496879577637, "global_step": 11999, "epoch": 285} {"train_loss": -5.053345203399658, "global_step": 12000, "epoch": 285} {"train_loss": -5.18397331237793, "global_step": 12001, "epoch": 285} {"train_loss": -5.0987982749938965, "global_step": 12002, "epoch": 285} {"train_loss": -5.090110778808594, "global_step": 12003, "epoch": 285} {"train_loss": -4.976954460144043, "global_step": 12004, "epoch": 285} {"train_loss": -5.004864692687988, "global_step": 12005, "epoch": 285} {"train_loss": -4.954270362854004, "global_step": 12006, "epoch": 285} {"train_loss": -5.088059902191162, "global_step": 12007, "epoch": 285} {"train_loss": -4.9392595291137695, "global_step": 12008, "epoch": 285} {"train_loss": -4.898684501647949, "global_step": 12009, "epoch": 285} {"train_loss": -4.932838439941406, "global_step": 12010, "epoch": 285} {"train_loss": -5.064979746228173, "global_step": 12011, "epoch": 285, "val_loss": 80916.2265625} {"train_loss": -5.001613140106201, "global_step": 12012, "epoch": 286} {"train_loss": -5.00662899017334, "global_step": 12013, "epoch": 286} {"train_loss": -5.035890102386475, "global_step": 12014, "epoch": 286} {"train_loss": -5.019622802734375, "global_step": 12015, "epoch": 286} {"train_loss": -5.179652690887451, "global_step": 12016, "epoch": 286} {"train_loss": -4.964517116546631, "global_step": 12017, "epoch": 286} {"train_loss": -5.038372039794922, "global_step": 12018, "epoch": 286} {"train_loss": -4.92911434173584, "global_step": 12019, "epoch": 286} {"train_loss": -5.058518409729004, "global_step": 12020, "epoch": 286} {"train_loss": -5.175612449645996, "global_step": 12021, "epoch": 286} {"train_loss": -4.9742631912231445, "global_step": 12022, "epoch": 286} {"train_loss": -5.096686363220215, "global_step": 12023, "epoch": 286} {"train_loss": -4.920132637023926, "global_step": 12024, "epoch": 286} {"train_loss": -4.997113227844238, "global_step": 12025, "epoch": 286} {"train_loss": -4.933297157287598, "global_step": 12026, "epoch": 286} {"train_loss": -4.878278732299805, "global_step": 12027, "epoch": 286} {"train_loss": -5.002396583557129, "global_step": 12028, "epoch": 286} {"train_loss": -5.12877082824707, "global_step": 12029, "epoch": 286} {"train_loss": -5.1108174324035645, "global_step": 12030, "epoch": 286} {"train_loss": -5.13536262512207, "global_step": 12031, "epoch": 286} {"train_loss": -4.9535298347473145, "global_step": 12032, "epoch": 286} {"train_loss": -5.073263168334961, "global_step": 12033, "epoch": 286} {"train_loss": -5.161232948303223, "global_step": 12034, "epoch": 286} {"train_loss": -5.177890300750732, "global_step": 12035, "epoch": 286} {"train_loss": -5.122490882873535, "global_step": 12036, "epoch": 286} {"train_loss": -5.2095842361450195, "global_step": 12037, "epoch": 286} {"train_loss": -5.01826810836792, "global_step": 12038, "epoch": 286} {"train_loss": -5.144869804382324, "global_step": 12039, "epoch": 286} {"train_loss": -5.18702507019043, "global_step": 12040, "epoch": 286} {"train_loss": -5.199190139770508, "global_step": 12041, "epoch": 286} {"train_loss": -5.241788864135742, "global_step": 12042, "epoch": 286} {"train_loss": -5.023345947265625, "global_step": 12043, "epoch": 286} {"train_loss": -5.127225875854492, "global_step": 12044, "epoch": 286} {"train_loss": -5.050887107849121, "global_step": 12045, "epoch": 286} {"train_loss": -5.048069000244141, "global_step": 12046, "epoch": 286} {"train_loss": -5.185618877410889, "global_step": 12047, "epoch": 286} {"train_loss": -5.152502536773682, "global_step": 12048, "epoch": 286} {"train_loss": -4.848989963531494, "global_step": 12049, "epoch": 286} {"train_loss": -4.845645427703857, "global_step": 12050, "epoch": 286} {"train_loss": -4.998131275177002, "global_step": 12051, "epoch": 286} {"train_loss": -4.827281951904297, "global_step": 12052, "epoch": 286} {"train_loss": -5.051091557457333, "global_step": 12053, "epoch": 286, "val_loss": 79816.6953125} {"train_loss": -5.19046688079834, "global_step": 12054, "epoch": 287} {"train_loss": -5.049519062042236, "global_step": 12055, "epoch": 287} {"train_loss": -5.0304107666015625, "global_step": 12056, "epoch": 287} {"train_loss": -5.139472007751465, "global_step": 12057, "epoch": 287} {"train_loss": -5.055039882659912, "global_step": 12058, "epoch": 287} {"train_loss": -5.106657981872559, "global_step": 12059, "epoch": 287} {"train_loss": -5.054405212402344, "global_step": 12060, "epoch": 287} {"train_loss": -5.026088714599609, "global_step": 12061, "epoch": 287} {"train_loss": -5.033786773681641, "global_step": 12062, "epoch": 287} {"train_loss": -5.145776748657227, "global_step": 12063, "epoch": 287} {"train_loss": -5.138405799865723, "global_step": 12064, "epoch": 287} {"train_loss": -5.1514434814453125, "global_step": 12065, "epoch": 287} {"train_loss": -5.000335693359375, "global_step": 12066, "epoch": 287} {"train_loss": -5.200860977172852, "global_step": 12067, "epoch": 287} {"train_loss": -5.16218376159668, "global_step": 12068, "epoch": 287} {"train_loss": -5.173499584197998, "global_step": 12069, "epoch": 287} {"train_loss": -5.159305572509766, "global_step": 12070, "epoch": 287} {"train_loss": -5.04624080657959, "global_step": 12071, "epoch": 287} {"train_loss": -5.113994121551514, "global_step": 12072, "epoch": 287} {"train_loss": -5.129050254821777, "global_step": 12073, "epoch": 287} {"train_loss": -5.145800590515137, "global_step": 12074, "epoch": 287} {"train_loss": -5.136075496673584, "global_step": 12075, "epoch": 287} {"train_loss": -5.125974178314209, "global_step": 12076, "epoch": 287} {"train_loss": -4.825486660003662, "global_step": 12077, "epoch": 287} {"train_loss": -5.076929092407227, "global_step": 12078, "epoch": 287} {"train_loss": -5.072772979736328, "global_step": 12079, "epoch": 287} {"train_loss": -5.062738418579102, "global_step": 12080, "epoch": 287} {"train_loss": -5.023935317993164, "global_step": 12081, "epoch": 287} {"train_loss": -5.259703636169434, "global_step": 12082, "epoch": 287} {"train_loss": -5.185022354125977, "global_step": 12083, "epoch": 287} {"train_loss": -5.1170759201049805, "global_step": 12084, "epoch": 287} {"train_loss": -5.039916038513184, "global_step": 12085, "epoch": 287} {"train_loss": -4.939405918121338, "global_step": 12086, "epoch": 287} {"train_loss": -5.0868425369262695, "global_step": 12087, "epoch": 287} {"train_loss": -5.1167402267456055, "global_step": 12088, "epoch": 287} {"train_loss": -5.197240352630615, "global_step": 12089, "epoch": 287} {"train_loss": -5.263787746429443, "global_step": 12090, "epoch": 287} {"train_loss": -5.210421085357666, "global_step": 12091, "epoch": 287} {"train_loss": -5.077948570251465, "global_step": 12092, "epoch": 287} {"train_loss": -5.041215896606445, "global_step": 12093, "epoch": 287} {"train_loss": -4.981103897094727, "global_step": 12094, "epoch": 287} {"train_loss": -5.10217607588995, "global_step": 12095, "epoch": 287, "val_loss": 79892.453125} {"train_loss": -5.060201644897461, "global_step": 12096, "epoch": 288} {"train_loss": -5.118868827819824, "global_step": 12097, "epoch": 288} {"train_loss": -5.139648914337158, "global_step": 12098, "epoch": 288} {"train_loss": -4.986728668212891, "global_step": 12099, "epoch": 288} {"train_loss": -5.229344367980957, "global_step": 12100, "epoch": 288} {"train_loss": -5.057330131530762, "global_step": 12101, "epoch": 288} {"train_loss": -5.209575653076172, "global_step": 12102, "epoch": 288} {"train_loss": -5.057856559753418, "global_step": 12103, "epoch": 288} {"train_loss": -5.096179962158203, "global_step": 12104, "epoch": 288} {"train_loss": -5.166962146759033, "global_step": 12105, "epoch": 288} {"train_loss": -5.17356538772583, "global_step": 12106, "epoch": 288} {"train_loss": -5.109549045562744, "global_step": 12107, "epoch": 288} {"train_loss": -4.981452465057373, "global_step": 12108, "epoch": 288} {"train_loss": -5.136216163635254, "global_step": 12109, "epoch": 288} {"train_loss": -5.021449089050293, "global_step": 12110, "epoch": 288} {"train_loss": -5.114030361175537, "global_step": 12111, "epoch": 288} {"train_loss": -5.182461738586426, "global_step": 12112, "epoch": 288} {"train_loss": -5.117114067077637, "global_step": 12113, "epoch": 288} {"train_loss": -4.9021711349487305, "global_step": 12114, "epoch": 288} {"train_loss": -5.0893964767456055, "global_step": 12115, "epoch": 288} {"train_loss": -5.082542896270752, "global_step": 12116, "epoch": 288} {"train_loss": -5.032364845275879, "global_step": 12117, "epoch": 288} {"train_loss": -5.157326698303223, "global_step": 12118, "epoch": 288} {"train_loss": -5.216095924377441, "global_step": 12119, "epoch": 288} {"train_loss": -5.047575950622559, "global_step": 12120, "epoch": 288} {"train_loss": -5.270134925842285, "global_step": 12121, "epoch": 288} {"train_loss": -5.128590106964111, "global_step": 12122, "epoch": 288} {"train_loss": -5.16660213470459, "global_step": 12123, "epoch": 288} {"train_loss": -5.13478946685791, "global_step": 12124, "epoch": 288} {"train_loss": -5.041329383850098, "global_step": 12125, "epoch": 288} {"train_loss": -4.902393341064453, "global_step": 12126, "epoch": 288} {"train_loss": -5.125205039978027, "global_step": 12127, "epoch": 288} {"train_loss": -4.892910003662109, "global_step": 12128, "epoch": 288} {"train_loss": -4.965804100036621, "global_step": 12129, "epoch": 288} {"train_loss": -4.993762016296387, "global_step": 12130, "epoch": 288} {"train_loss": -5.0176825523376465, "global_step": 12131, "epoch": 288} {"train_loss": -5.186270236968994, "global_step": 12132, "epoch": 288} {"train_loss": -4.965622901916504, "global_step": 12133, "epoch": 288} {"train_loss": -5.1597490310668945, "global_step": 12134, "epoch": 288} {"train_loss": -4.996029853820801, "global_step": 12135, "epoch": 288} {"train_loss": -4.943824768066406, "global_step": 12136, "epoch": 288} {"train_loss": -5.084735109692528, "global_step": 12137, "epoch": 288, "val_loss": 79472.7578125} {"train_loss": -5.0061540603637695, "global_step": 12138, "epoch": 289} {"train_loss": -5.141509056091309, "global_step": 12139, "epoch": 289} {"train_loss": -5.347970008850098, "global_step": 12140, "epoch": 289} {"train_loss": -5.245662689208984, "global_step": 12141, "epoch": 289} {"train_loss": -5.03278923034668, "global_step": 12142, "epoch": 289} {"train_loss": -5.016487121582031, "global_step": 12143, "epoch": 289} {"train_loss": -5.13264274597168, "global_step": 12144, "epoch": 289} {"train_loss": -5.027687072753906, "global_step": 12145, "epoch": 289} {"train_loss": -5.057427406311035, "global_step": 12146, "epoch": 289} {"train_loss": -5.079783916473389, "global_step": 12147, "epoch": 289} {"train_loss": -5.184204578399658, "global_step": 12148, "epoch": 289} {"train_loss": -5.245479106903076, "global_step": 12149, "epoch": 289} {"train_loss": -5.216180801391602, "global_step": 12150, "epoch": 289} {"train_loss": -5.127963066101074, "global_step": 12151, "epoch": 289} {"train_loss": -5.143510818481445, "global_step": 12152, "epoch": 289} {"train_loss": -5.026557922363281, "global_step": 12153, "epoch": 289} {"train_loss": -5.093435287475586, "global_step": 12154, "epoch": 289} {"train_loss": -5.127928733825684, "global_step": 12155, "epoch": 289} {"train_loss": -5.283452987670898, "global_step": 12156, "epoch": 289} {"train_loss": -5.079744338989258, "global_step": 12157, "epoch": 289} {"train_loss": -5.048856735229492, "global_step": 12158, "epoch": 289} {"train_loss": -5.056357383728027, "global_step": 12159, "epoch": 289} {"train_loss": -5.250227451324463, "global_step": 12160, "epoch": 289} {"train_loss": -5.10552453994751, "global_step": 12161, "epoch": 289} {"train_loss": -5.151893138885498, "global_step": 12162, "epoch": 289} {"train_loss": -5.002634525299072, "global_step": 12163, "epoch": 289} {"train_loss": -5.244956970214844, "global_step": 12164, "epoch": 289} {"train_loss": -5.103995323181152, "global_step": 12165, "epoch": 289} {"train_loss": -5.238874435424805, "global_step": 12166, "epoch": 289} {"train_loss": -5.042236328125, "global_step": 12167, "epoch": 289} {"train_loss": -5.014853477478027, "global_step": 12168, "epoch": 289} {"train_loss": -5.221249580383301, "global_step": 12169, "epoch": 289} {"train_loss": -5.15694522857666, "global_step": 12170, "epoch": 289} {"train_loss": -4.997272491455078, "global_step": 12171, "epoch": 289} {"train_loss": -5.205198287963867, "global_step": 12172, "epoch": 289} {"train_loss": -5.1560869216918945, "global_step": 12173, "epoch": 289} {"train_loss": -5.128561019897461, "global_step": 12174, "epoch": 289} {"train_loss": -5.070400714874268, "global_step": 12175, "epoch": 289} {"train_loss": -5.055682182312012, "global_step": 12176, "epoch": 289} {"train_loss": -5.144472599029541, "global_step": 12177, "epoch": 289} {"train_loss": -4.8756279945373535, "global_step": 12178, "epoch": 289} {"train_loss": -5.121132475989206, "global_step": 12179, "epoch": 289, "val_loss": 79152.1328125} {"train_loss": -5.092477321624756, "global_step": 12180, "epoch": 290} {"train_loss": -5.19922399520874, "global_step": 12181, "epoch": 290} {"train_loss": -5.019356727600098, "global_step": 12182, "epoch": 290} {"train_loss": -5.125791549682617, "global_step": 12183, "epoch": 290} {"train_loss": -5.041952133178711, "global_step": 12184, "epoch": 290} {"train_loss": -5.1328301429748535, "global_step": 12185, "epoch": 290} {"train_loss": -5.104572296142578, "global_step": 12186, "epoch": 290} {"train_loss": -4.920235633850098, "global_step": 12187, "epoch": 290} {"train_loss": -5.117727279663086, "global_step": 12188, "epoch": 290} {"train_loss": -4.98723030090332, "global_step": 12189, "epoch": 290} {"train_loss": -4.9098005294799805, "global_step": 12190, "epoch": 290} {"train_loss": -4.961523056030273, "global_step": 12191, "epoch": 290} {"train_loss": -4.82423210144043, "global_step": 12192, "epoch": 290} {"train_loss": -5.0476508140563965, "global_step": 12193, "epoch": 290} {"train_loss": -4.813884735107422, "global_step": 12194, "epoch": 290} {"train_loss": -4.811244010925293, "global_step": 12195, "epoch": 290} {"train_loss": -4.636752605438232, "global_step": 12196, "epoch": 290} {"train_loss": -4.725852966308594, "global_step": 12197, "epoch": 290} {"train_loss": -4.885996341705322, "global_step": 12198, "epoch": 290} {"train_loss": -4.731296062469482, "global_step": 12199, "epoch": 290} {"train_loss": -4.989964485168457, "global_step": 12200, "epoch": 290} {"train_loss": -4.721897125244141, "global_step": 12201, "epoch": 290} {"train_loss": -4.870914459228516, "global_step": 12202, "epoch": 290} {"train_loss": -4.987523078918457, "global_step": 12203, "epoch": 290} {"train_loss": -4.774960041046143, "global_step": 12204, "epoch": 290} {"train_loss": -4.7873029708862305, "global_step": 12205, "epoch": 290} {"train_loss": -4.969112873077393, "global_step": 12206, "epoch": 290} {"train_loss": -4.985052108764648, "global_step": 12207, "epoch": 290} {"train_loss": -4.932539939880371, "global_step": 12208, "epoch": 290} {"train_loss": -4.881723403930664, "global_step": 12209, "epoch": 290} {"train_loss": -5.006392478942871, "global_step": 12210, "epoch": 290} {"train_loss": -5.107657432556152, "global_step": 12211, "epoch": 290} {"train_loss": -5.0269317626953125, "global_step": 12212, "epoch": 290} {"train_loss": -5.041383743286133, "global_step": 12213, "epoch": 290} {"train_loss": -5.113185405731201, "global_step": 12214, "epoch": 290} {"train_loss": -4.96157169342041, "global_step": 12215, "epoch": 290} {"train_loss": -5.133090972900391, "global_step": 12216, "epoch": 290} {"train_loss": -4.972136497497559, "global_step": 12217, "epoch": 290} {"train_loss": -5.017002582550049, "global_step": 12218, "epoch": 290} {"train_loss": -4.9931440353393555, "global_step": 12219, "epoch": 290} {"train_loss": -5.185046195983887, "global_step": 12220, "epoch": 290} {"train_loss": -4.967669782184419, "global_step": 12221, "epoch": 290, "val_loss": 80388.609375} {"train_loss": -5.0093584060668945, "global_step": 12222, "epoch": 291} {"train_loss": -5.107062339782715, "global_step": 12223, "epoch": 291} {"train_loss": -5.162224292755127, "global_step": 12224, "epoch": 291} {"train_loss": -5.176479339599609, "global_step": 12225, "epoch": 291} {"train_loss": -5.0041327476501465, "global_step": 12226, "epoch": 291} {"train_loss": -4.97636604309082, "global_step": 12227, "epoch": 291} {"train_loss": -5.0294189453125, "global_step": 12228, "epoch": 291} {"train_loss": -5.076099395751953, "global_step": 12229, "epoch": 291} {"train_loss": -5.095624923706055, "global_step": 12230, "epoch": 291} {"train_loss": -5.145188331604004, "global_step": 12231, "epoch": 291} {"train_loss": -5.135953903198242, "global_step": 12232, "epoch": 291} {"train_loss": -5.110116481781006, "global_step": 12233, "epoch": 291} {"train_loss": -5.009660720825195, "global_step": 12234, "epoch": 291} {"train_loss": -5.108913421630859, "global_step": 12235, "epoch": 291} {"train_loss": -5.2345051765441895, "global_step": 12236, "epoch": 291} {"train_loss": -5.105149269104004, "global_step": 12237, "epoch": 291} {"train_loss": -5.204481601715088, "global_step": 12238, "epoch": 291} {"train_loss": -5.112093925476074, "global_step": 12239, "epoch": 291} {"train_loss": -5.155997276306152, "global_step": 12240, "epoch": 291} {"train_loss": -5.100157737731934, "global_step": 12241, "epoch": 291} {"train_loss": -5.094942092895508, "global_step": 12242, "epoch": 291} {"train_loss": -5.166908264160156, "global_step": 12243, "epoch": 291} {"train_loss": -5.042724609375, "global_step": 12244, "epoch": 291} {"train_loss": -5.118508815765381, "global_step": 12245, "epoch": 291} {"train_loss": -5.13568115234375, "global_step": 12246, "epoch": 291} {"train_loss": -5.056088924407959, "global_step": 12247, "epoch": 291} {"train_loss": -5.2470197677612305, "global_step": 12248, "epoch": 291} {"train_loss": -5.141868591308594, "global_step": 12249, "epoch": 291} {"train_loss": -5.077510356903076, "global_step": 12250, "epoch": 291} {"train_loss": -5.003299713134766, "global_step": 12251, "epoch": 291} {"train_loss": -5.134217262268066, "global_step": 12252, "epoch": 291} {"train_loss": -5.1696977615356445, "global_step": 12253, "epoch": 291} {"train_loss": -5.138798713684082, "global_step": 12254, "epoch": 291} {"train_loss": -5.0574188232421875, "global_step": 12255, "epoch": 291} {"train_loss": -5.040269374847412, "global_step": 12256, "epoch": 291} {"train_loss": -5.2820515632629395, "global_step": 12257, "epoch": 291} {"train_loss": -5.029134750366211, "global_step": 12258, "epoch": 291} {"train_loss": -5.118999481201172, "global_step": 12259, "epoch": 291} {"train_loss": -5.270112037658691, "global_step": 12260, "epoch": 291} {"train_loss": -5.190345764160156, "global_step": 12261, "epoch": 291} {"train_loss": -5.172652721405029, "global_step": 12262, "epoch": 291} {"train_loss": -5.1167462439764115, "global_step": 12263, "epoch": 291, "val_loss": 79101.421875} {"train_loss": -5.086206912994385, "global_step": 12264, "epoch": 292} {"train_loss": -5.21767520904541, "global_step": 12265, "epoch": 292} {"train_loss": -5.242425441741943, "global_step": 12266, "epoch": 292} {"train_loss": -5.004730224609375, "global_step": 12267, "epoch": 292} {"train_loss": -5.045346736907959, "global_step": 12268, "epoch": 292} {"train_loss": -5.023077964782715, "global_step": 12269, "epoch": 292} {"train_loss": -5.052029132843018, "global_step": 12270, "epoch": 292} {"train_loss": -5.116917133331299, "global_step": 12271, "epoch": 292} {"train_loss": -5.137757778167725, "global_step": 12272, "epoch": 292} {"train_loss": -5.185694694519043, "global_step": 12273, "epoch": 292} {"train_loss": -5.229004383087158, "global_step": 12274, "epoch": 292} {"train_loss": -5.116054058074951, "global_step": 12275, "epoch": 292} {"train_loss": -5.152451038360596, "global_step": 12276, "epoch": 292} {"train_loss": -5.176827430725098, "global_step": 12277, "epoch": 292} {"train_loss": -5.071892738342285, "global_step": 12278, "epoch": 292} {"train_loss": -5.157788276672363, "global_step": 12279, "epoch": 292} {"train_loss": -5.033939361572266, "global_step": 12280, "epoch": 292} {"train_loss": -5.070256233215332, "global_step": 12281, "epoch": 292} {"train_loss": -5.057827472686768, "global_step": 12282, "epoch": 292} {"train_loss": -5.234245300292969, "global_step": 12283, "epoch": 292} {"train_loss": -5.101217746734619, "global_step": 12284, "epoch": 292} {"train_loss": -5.212615966796875, "global_step": 12285, "epoch": 292} {"train_loss": -5.202110290527344, "global_step": 12286, "epoch": 292} {"train_loss": -5.1616129875183105, "global_step": 12287, "epoch": 292} {"train_loss": -5.133840560913086, "global_step": 12288, "epoch": 292} {"train_loss": -5.125345230102539, "global_step": 12289, "epoch": 292} {"train_loss": -5.241847038269043, "global_step": 12290, "epoch": 292} {"train_loss": -5.185486316680908, "global_step": 12291, "epoch": 292} {"train_loss": -5.221627712249756, "global_step": 12292, "epoch": 292} {"train_loss": -5.20580530166626, "global_step": 12293, "epoch": 292} {"train_loss": -5.074947834014893, "global_step": 12294, "epoch": 292} {"train_loss": -5.0388617515563965, "global_step": 12295, "epoch": 292} {"train_loss": -4.9838361740112305, "global_step": 12296, "epoch": 292} {"train_loss": -5.231332302093506, "global_step": 12297, "epoch": 292} {"train_loss": -5.176731109619141, "global_step": 12298, "epoch": 292} {"train_loss": -4.937138557434082, "global_step": 12299, "epoch": 292} {"train_loss": -4.969371795654297, "global_step": 12300, "epoch": 292} {"train_loss": -5.141390800476074, "global_step": 12301, "epoch": 292} {"train_loss": -5.166231155395508, "global_step": 12302, "epoch": 292} {"train_loss": -4.970947265625, "global_step": 12303, "epoch": 292} {"train_loss": -5.198979377746582, "global_step": 12304, "epoch": 292} {"train_loss": -5.122250261760893, "global_step": 12305, "epoch": 292, "val_loss": 79854.1328125} {"train_loss": -5.001139163970947, "global_step": 12306, "epoch": 293} {"train_loss": -5.014352798461914, "global_step": 12307, "epoch": 293} {"train_loss": -4.983696937561035, "global_step": 12308, "epoch": 293} {"train_loss": -4.966179847717285, "global_step": 12309, "epoch": 293} {"train_loss": -5.107276439666748, "global_step": 12310, "epoch": 293} {"train_loss": -4.89456844329834, "global_step": 12311, "epoch": 293} {"train_loss": -4.950955867767334, "global_step": 12312, "epoch": 293} {"train_loss": -5.1489458084106445, "global_step": 12313, "epoch": 293} {"train_loss": -5.033998489379883, "global_step": 12314, "epoch": 293} {"train_loss": -4.8794097900390625, "global_step": 12315, "epoch": 293} {"train_loss": -5.216970443725586, "global_step": 12316, "epoch": 293} {"train_loss": -4.960907459259033, "global_step": 12317, "epoch": 293} {"train_loss": -5.0904316902160645, "global_step": 12318, "epoch": 293} {"train_loss": -5.038116931915283, "global_step": 12319, "epoch": 293} {"train_loss": -4.965585708618164, "global_step": 12320, "epoch": 293} {"train_loss": -5.234201908111572, "global_step": 12321, "epoch": 293} {"train_loss": -5.072357177734375, "global_step": 12322, "epoch": 293} {"train_loss": -5.211113929748535, "global_step": 12323, "epoch": 293} {"train_loss": -5.0892744064331055, "global_step": 12324, "epoch": 293} {"train_loss": -5.128576755523682, "global_step": 12325, "epoch": 293} {"train_loss": -5.159501075744629, "global_step": 12326, "epoch": 293} {"train_loss": -5.074519634246826, "global_step": 12327, "epoch": 293} {"train_loss": -5.022963523864746, "global_step": 12328, "epoch": 293} {"train_loss": -5.118851661682129, "global_step": 12329, "epoch": 293} {"train_loss": -5.136699676513672, "global_step": 12330, "epoch": 293} {"train_loss": -5.104086399078369, "global_step": 12331, "epoch": 293} {"train_loss": -5.174403667449951, "global_step": 12332, "epoch": 293} {"train_loss": -5.071362018585205, "global_step": 12333, "epoch": 293} {"train_loss": -5.148321151733398, "global_step": 12334, "epoch": 293} {"train_loss": -5.191267967224121, "global_step": 12335, "epoch": 293} {"train_loss": -5.178352355957031, "global_step": 12336, "epoch": 293} {"train_loss": -5.2086944580078125, "global_step": 12337, "epoch": 293} {"train_loss": -5.188389301300049, "global_step": 12338, "epoch": 293} {"train_loss": -5.126850605010986, "global_step": 12339, "epoch": 293} {"train_loss": -5.108532905578613, "global_step": 12340, "epoch": 293} {"train_loss": -4.977956295013428, "global_step": 12341, "epoch": 293} {"train_loss": -5.146350860595703, "global_step": 12342, "epoch": 293} {"train_loss": -5.090929985046387, "global_step": 12343, "epoch": 293} {"train_loss": -5.174304008483887, "global_step": 12344, "epoch": 293} {"train_loss": -4.978358745574951, "global_step": 12345, "epoch": 293} {"train_loss": -5.132146835327148, "global_step": 12346, "epoch": 293} {"train_loss": -5.0808023271106535, "global_step": 12347, "epoch": 293, "val_loss": 80696.1875} {"train_loss": -4.848126411437988, "global_step": 12348, "epoch": 294} {"train_loss": -5.016395568847656, "global_step": 12349, "epoch": 294} {"train_loss": -5.212602138519287, "global_step": 12350, "epoch": 294} {"train_loss": -4.947359085083008, "global_step": 12351, "epoch": 294} {"train_loss": -5.11000919342041, "global_step": 12352, "epoch": 294} {"train_loss": -4.963006973266602, "global_step": 12353, "epoch": 294} {"train_loss": -4.925449371337891, "global_step": 12354, "epoch": 294} {"train_loss": -5.110942840576172, "global_step": 12355, "epoch": 294} {"train_loss": -5.106639862060547, "global_step": 12356, "epoch": 294} {"train_loss": -5.140131950378418, "global_step": 12357, "epoch": 294} {"train_loss": -5.065608501434326, "global_step": 12358, "epoch": 294} {"train_loss": -5.0158538818359375, "global_step": 12359, "epoch": 294} {"train_loss": -5.124058723449707, "global_step": 12360, "epoch": 294} {"train_loss": -5.211658954620361, "global_step": 12361, "epoch": 294} {"train_loss": -5.330122470855713, "global_step": 12362, "epoch": 294} {"train_loss": -4.989289283752441, "global_step": 12363, "epoch": 294} {"train_loss": -4.994474411010742, "global_step": 12364, "epoch": 294} {"train_loss": -5.064359664916992, "global_step": 12365, "epoch": 294} {"train_loss": -5.118020057678223, "global_step": 12366, "epoch": 294} {"train_loss": -5.180511951446533, "global_step": 12367, "epoch": 294} {"train_loss": -5.013586044311523, "global_step": 12368, "epoch": 294} {"train_loss": -5.127375602722168, "global_step": 12369, "epoch": 294} {"train_loss": -5.078983783721924, "global_step": 12370, "epoch": 294} {"train_loss": -5.130363464355469, "global_step": 12371, "epoch": 294} {"train_loss": -5.054596900939941, "global_step": 12372, "epoch": 294} {"train_loss": -5.145878791809082, "global_step": 12373, "epoch": 294} {"train_loss": -5.104636192321777, "global_step": 12374, "epoch": 294} {"train_loss": -4.925412178039551, "global_step": 12375, "epoch": 294} {"train_loss": -5.107954025268555, "global_step": 12376, "epoch": 294} {"train_loss": -4.981810569763184, "global_step": 12377, "epoch": 294} {"train_loss": -5.123388290405273, "global_step": 12378, "epoch": 294} {"train_loss": -4.880771160125732, "global_step": 12379, "epoch": 294} {"train_loss": -5.064867973327637, "global_step": 12380, "epoch": 294} {"train_loss": -5.084831714630127, "global_step": 12381, "epoch": 294} {"train_loss": -5.152886390686035, "global_step": 12382, "epoch": 294} {"train_loss": -5.15775728225708, "global_step": 12383, "epoch": 294} {"train_loss": -4.945615768432617, "global_step": 12384, "epoch": 294} {"train_loss": -5.109931468963623, "global_step": 12385, "epoch": 294} {"train_loss": -5.1789350509643555, "global_step": 12386, "epoch": 294} {"train_loss": -5.164667129516602, "global_step": 12387, "epoch": 294} {"train_loss": -5.05825138092041, "global_step": 12388, "epoch": 294} {"train_loss": -5.07568393434797, "global_step": 12389, "epoch": 294, "val_loss": 79552.6796875} {"train_loss": -5.1930646896362305, "global_step": 12390, "epoch": 295} {"train_loss": -5.182748794555664, "global_step": 12391, "epoch": 295} {"train_loss": -5.209804534912109, "global_step": 12392, "epoch": 295} {"train_loss": -5.0761542320251465, "global_step": 12393, "epoch": 295} {"train_loss": -5.192620277404785, "global_step": 12394, "epoch": 295} {"train_loss": -5.035126686096191, "global_step": 12395, "epoch": 295} {"train_loss": -5.034499168395996, "global_step": 12396, "epoch": 295} {"train_loss": -5.154547691345215, "global_step": 12397, "epoch": 295} {"train_loss": -5.164511680603027, "global_step": 12398, "epoch": 295} {"train_loss": -5.144477844238281, "global_step": 12399, "epoch": 295} {"train_loss": -4.982169151306152, "global_step": 12400, "epoch": 295} {"train_loss": -5.20388126373291, "global_step": 12401, "epoch": 295} {"train_loss": -5.13116979598999, "global_step": 12402, "epoch": 295} {"train_loss": -5.074213027954102, "global_step": 12403, "epoch": 295} {"train_loss": -5.070587158203125, "global_step": 12404, "epoch": 295} {"train_loss": -5.045076370239258, "global_step": 12405, "epoch": 295} {"train_loss": -5.179104804992676, "global_step": 12406, "epoch": 295} {"train_loss": -5.2084269523620605, "global_step": 12407, "epoch": 295} {"train_loss": -5.131551742553711, "global_step": 12408, "epoch": 295} {"train_loss": -5.146408557891846, "global_step": 12409, "epoch": 295} {"train_loss": -5.309372425079346, "global_step": 12410, "epoch": 295} {"train_loss": -5.0406575202941895, "global_step": 12411, "epoch": 295} {"train_loss": -5.248429298400879, "global_step": 12412, "epoch": 295} {"train_loss": -5.150634765625, "global_step": 12413, "epoch": 295} {"train_loss": -4.990585803985596, "global_step": 12414, "epoch": 295} {"train_loss": -4.946081638336182, "global_step": 12415, "epoch": 295} {"train_loss": -5.181140899658203, "global_step": 12416, "epoch": 295} {"train_loss": -5.183162212371826, "global_step": 12417, "epoch": 295} {"train_loss": -5.151577949523926, "global_step": 12418, "epoch": 295} {"train_loss": -5.051873207092285, "global_step": 12419, "epoch": 295} {"train_loss": -4.998064994812012, "global_step": 12420, "epoch": 295} {"train_loss": -4.9927778244018555, "global_step": 12421, "epoch": 295} {"train_loss": -5.087827682495117, "global_step": 12422, "epoch": 295} {"train_loss": -5.112374305725098, "global_step": 12423, "epoch": 295} {"train_loss": -5.143904209136963, "global_step": 12424, "epoch": 295} {"train_loss": -5.209113121032715, "global_step": 12425, "epoch": 295} {"train_loss": -5.1483869552612305, "global_step": 12426, "epoch": 295} {"train_loss": -5.147549152374268, "global_step": 12427, "epoch": 295} {"train_loss": -5.1744208335876465, "global_step": 12428, "epoch": 295} {"train_loss": -5.21499490737915, "global_step": 12429, "epoch": 295} {"train_loss": -5.083909034729004, "global_step": 12430, "epoch": 295} {"train_loss": -5.124673979622977, "global_step": 12431, "epoch": 295, "val_loss": 79626.0859375} {"train_loss": -5.081629276275635, "global_step": 12432, "epoch": 296} {"train_loss": -5.161990642547607, "global_step": 12433, "epoch": 296} {"train_loss": -4.993191719055176, "global_step": 12434, "epoch": 296} {"train_loss": -5.064107894897461, "global_step": 12435, "epoch": 296} {"train_loss": -4.917820930480957, "global_step": 12436, "epoch": 296} {"train_loss": -5.039944648742676, "global_step": 12437, "epoch": 296} {"train_loss": -5.182389259338379, "global_step": 12438, "epoch": 296} {"train_loss": -5.129786968231201, "global_step": 12439, "epoch": 296} {"train_loss": -5.011828422546387, "global_step": 12440, "epoch": 296} {"train_loss": -5.127462387084961, "global_step": 12441, "epoch": 296} {"train_loss": -5.063393592834473, "global_step": 12442, "epoch": 296} {"train_loss": -4.9348649978637695, "global_step": 12443, "epoch": 296} {"train_loss": -5.039281845092773, "global_step": 12444, "epoch": 296} {"train_loss": -5.078036308288574, "global_step": 12445, "epoch": 296} {"train_loss": -5.1006598472595215, "global_step": 12446, "epoch": 296} {"train_loss": -5.181087493896484, "global_step": 12447, "epoch": 296} {"train_loss": -5.099788665771484, "global_step": 12448, "epoch": 296} {"train_loss": -5.126181602478027, "global_step": 12449, "epoch": 296} {"train_loss": -5.136662483215332, "global_step": 12450, "epoch": 296} {"train_loss": -5.102618217468262, "global_step": 12451, "epoch": 296} {"train_loss": -4.994234085083008, "global_step": 12452, "epoch": 296} {"train_loss": -4.968784809112549, "global_step": 12453, "epoch": 296} {"train_loss": -5.190543174743652, "global_step": 12454, "epoch": 296} {"train_loss": -5.1088972091674805, "global_step": 12455, "epoch": 296} {"train_loss": -5.051754951477051, "global_step": 12456, "epoch": 296} {"train_loss": -4.961040019989014, "global_step": 12457, "epoch": 296} {"train_loss": -5.085081100463867, "global_step": 12458, "epoch": 296} {"train_loss": -4.804135799407959, "global_step": 12459, "epoch": 296} {"train_loss": -5.059756755828857, "global_step": 12460, "epoch": 296} {"train_loss": -5.013271331787109, "global_step": 12461, "epoch": 296} {"train_loss": -5.081991195678711, "global_step": 12462, "epoch": 296} {"train_loss": -5.077939510345459, "global_step": 12463, "epoch": 296} {"train_loss": -4.958514213562012, "global_step": 12464, "epoch": 296} {"train_loss": -5.005617141723633, "global_step": 12465, "epoch": 296} {"train_loss": -4.976157188415527, "global_step": 12466, "epoch": 296} {"train_loss": -5.121058464050293, "global_step": 12467, "epoch": 296} {"train_loss": -4.897091865539551, "global_step": 12468, "epoch": 296} {"train_loss": -5.095417022705078, "global_step": 12469, "epoch": 296} {"train_loss": -5.002163410186768, "global_step": 12470, "epoch": 296} {"train_loss": -4.967879772186279, "global_step": 12471, "epoch": 296} {"train_loss": -5.129600524902344, "global_step": 12472, "epoch": 296} {"train_loss": -5.051173573448544, "global_step": 12473, "epoch": 296, "val_loss": 79096.375} {"train_loss": -5.133635520935059, "global_step": 12474, "epoch": 297} {"train_loss": -5.179290294647217, "global_step": 12475, "epoch": 297} {"train_loss": -5.100379467010498, "global_step": 12476, "epoch": 297} {"train_loss": -5.170280456542969, "global_step": 12477, "epoch": 297} {"train_loss": -5.125809669494629, "global_step": 12478, "epoch": 297} {"train_loss": -5.120481014251709, "global_step": 12479, "epoch": 297} {"train_loss": -5.221117973327637, "global_step": 12480, "epoch": 297} {"train_loss": -5.07631778717041, "global_step": 12481, "epoch": 297} {"train_loss": -5.091614246368408, "global_step": 12482, "epoch": 297} {"train_loss": -5.120767593383789, "global_step": 12483, "epoch": 297} {"train_loss": -5.300503730773926, "global_step": 12484, "epoch": 297} {"train_loss": -5.055327415466309, "global_step": 12485, "epoch": 297} {"train_loss": -5.281094551086426, "global_step": 12486, "epoch": 297} {"train_loss": -5.22310733795166, "global_step": 12487, "epoch": 297} {"train_loss": -5.309060096740723, "global_step": 12488, "epoch": 297} {"train_loss": -5.041630744934082, "global_step": 12489, "epoch": 297} {"train_loss": -5.0787553787231445, "global_step": 12490, "epoch": 297} {"train_loss": -5.152437210083008, "global_step": 12491, "epoch": 297} {"train_loss": -5.148592948913574, "global_step": 12492, "epoch": 297} {"train_loss": -5.005832672119141, "global_step": 12493, "epoch": 297} {"train_loss": -5.0255632400512695, "global_step": 12494, "epoch": 297} {"train_loss": -5.186949729919434, "global_step": 12495, "epoch": 297} {"train_loss": -4.969013690948486, "global_step": 12496, "epoch": 297} {"train_loss": -5.00653600692749, "global_step": 12497, "epoch": 297} {"train_loss": -4.985079288482666, "global_step": 12498, "epoch": 297} {"train_loss": -5.003997802734375, "global_step": 12499, "epoch": 297} {"train_loss": -5.208132743835449, "global_step": 12500, "epoch": 297} {"train_loss": -5.1744489669799805, "global_step": 12501, "epoch": 297} {"train_loss": -5.210859775543213, "global_step": 12502, "epoch": 297} {"train_loss": -5.101570129394531, "global_step": 12503, "epoch": 297} {"train_loss": -5.063708782196045, "global_step": 12504, "epoch": 297} {"train_loss": -4.977618217468262, "global_step": 12505, "epoch": 297} {"train_loss": -5.03963565826416, "global_step": 12506, "epoch": 297} {"train_loss": -5.0278730392456055, "global_step": 12507, "epoch": 297} {"train_loss": -5.070220947265625, "global_step": 12508, "epoch": 297} {"train_loss": -5.061472415924072, "global_step": 12509, "epoch": 297} {"train_loss": -5.040909767150879, "global_step": 12510, "epoch": 297} {"train_loss": -5.146097183227539, "global_step": 12511, "epoch": 297} {"train_loss": -5.112239837646484, "global_step": 12512, "epoch": 297} {"train_loss": -5.2054667472839355, "global_step": 12513, "epoch": 297} {"train_loss": -5.145596027374268, "global_step": 12514, "epoch": 297} {"train_loss": -5.112755627859206, "global_step": 12515, "epoch": 297, "val_loss": 79629.7734375} {"train_loss": -5.088143825531006, "global_step": 12516, "epoch": 298} {"train_loss": -5.123249053955078, "global_step": 12517, "epoch": 298} {"train_loss": -5.10845422744751, "global_step": 12518, "epoch": 298} {"train_loss": -5.037729263305664, "global_step": 12519, "epoch": 298} {"train_loss": -5.028288841247559, "global_step": 12520, "epoch": 298} {"train_loss": -5.112392425537109, "global_step": 12521, "epoch": 298} {"train_loss": -5.227533340454102, "global_step": 12522, "epoch": 298} {"train_loss": -5.05501651763916, "global_step": 12523, "epoch": 298} {"train_loss": -5.14063835144043, "global_step": 12524, "epoch": 298} {"train_loss": -5.16450309753418, "global_step": 12525, "epoch": 298} {"train_loss": -5.139096260070801, "global_step": 12526, "epoch": 298} {"train_loss": -5.202511787414551, "global_step": 12527, "epoch": 298} {"train_loss": -5.043378829956055, "global_step": 12528, "epoch": 298} {"train_loss": -5.190423011779785, "global_step": 12529, "epoch": 298} {"train_loss": -5.156480312347412, "global_step": 12530, "epoch": 298} {"train_loss": -5.105012893676758, "global_step": 12531, "epoch": 298} {"train_loss": -5.111238956451416, "global_step": 12532, "epoch": 298} {"train_loss": -5.0962748527526855, "global_step": 12533, "epoch": 298} {"train_loss": -5.131285667419434, "global_step": 12534, "epoch": 298} {"train_loss": -5.182883262634277, "global_step": 12535, "epoch": 298} {"train_loss": -5.081324577331543, "global_step": 12536, "epoch": 298} {"train_loss": -5.11617374420166, "global_step": 12537, "epoch": 298} {"train_loss": -5.079811096191406, "global_step": 12538, "epoch": 298} {"train_loss": -5.206380844116211, "global_step": 12539, "epoch": 298} {"train_loss": -5.2318115234375, "global_step": 12540, "epoch": 298} {"train_loss": -5.069772720336914, "global_step": 12541, "epoch": 298} {"train_loss": -5.169573783874512, "global_step": 12542, "epoch": 298} {"train_loss": -5.163987159729004, "global_step": 12543, "epoch": 298} {"train_loss": -5.128388404846191, "global_step": 12544, "epoch": 298} {"train_loss": -5.203736305236816, "global_step": 12545, "epoch": 298} {"train_loss": -5.132948398590088, "global_step": 12546, "epoch": 298} {"train_loss": -5.091109752655029, "global_step": 12547, "epoch": 298} {"train_loss": -5.213020324707031, "global_step": 12548, "epoch": 298} {"train_loss": -5.232076168060303, "global_step": 12549, "epoch": 298} {"train_loss": -4.986408710479736, "global_step": 12550, "epoch": 298} {"train_loss": -5.194824695587158, "global_step": 12551, "epoch": 298} {"train_loss": -4.993860244750977, "global_step": 12552, "epoch": 298} {"train_loss": -5.268798828125, "global_step": 12553, "epoch": 298} {"train_loss": -5.177699565887451, "global_step": 12554, "epoch": 298} {"train_loss": -5.256610870361328, "global_step": 12555, "epoch": 298} {"train_loss": -5.055397987365723, "global_step": 12556, "epoch": 298} {"train_loss": -5.131798653375535, "global_step": 12557, "epoch": 298, "val_loss": 79571.828125} {"train_loss": -5.163114070892334, "global_step": 12558, "epoch": 299} {"train_loss": -4.956954002380371, "global_step": 12559, "epoch": 299} {"train_loss": -5.075259208679199, "global_step": 12560, "epoch": 299} {"train_loss": -5.163829803466797, "global_step": 12561, "epoch": 299} {"train_loss": -5.175113677978516, "global_step": 12562, "epoch": 299} {"train_loss": -4.888188362121582, "global_step": 12563, "epoch": 299} {"train_loss": -5.100307941436768, "global_step": 12564, "epoch": 299} {"train_loss": -5.234259605407715, "global_step": 12565, "epoch": 299} {"train_loss": -5.131715297698975, "global_step": 12566, "epoch": 299} {"train_loss": -5.099660396575928, "global_step": 12567, "epoch": 299} {"train_loss": -5.17124080657959, "global_step": 12568, "epoch": 299} {"train_loss": -5.028280735015869, "global_step": 12569, "epoch": 299} {"train_loss": -4.999379634857178, "global_step": 12570, "epoch": 299} {"train_loss": -5.1277971267700195, "global_step": 12571, "epoch": 299} {"train_loss": -4.828995704650879, "global_step": 12572, "epoch": 299} {"train_loss": -5.032374858856201, "global_step": 12573, "epoch": 299} {"train_loss": -5.153048515319824, "global_step": 12574, "epoch": 299} {"train_loss": -4.998844146728516, "global_step": 12575, "epoch": 299} {"train_loss": -5.025286674499512, "global_step": 12576, "epoch": 299} {"train_loss": -5.0996270179748535, "global_step": 12577, "epoch": 299} {"train_loss": -4.988635063171387, "global_step": 12578, "epoch": 299} {"train_loss": -5.07646369934082, "global_step": 12579, "epoch": 299} {"train_loss": -4.98414421081543, "global_step": 12580, "epoch": 299} {"train_loss": -5.072187423706055, "global_step": 12581, "epoch": 299} {"train_loss": -4.812933444976807, "global_step": 12582, "epoch": 299} {"train_loss": -5.129338264465332, "global_step": 12583, "epoch": 299} {"train_loss": -5.051650524139404, "global_step": 12584, "epoch": 299} {"train_loss": -5.01746940612793, "global_step": 12585, "epoch": 299} {"train_loss": -4.956990718841553, "global_step": 12586, "epoch": 299} {"train_loss": -5.187949180603027, "global_step": 12587, "epoch": 299} {"train_loss": -5.105356693267822, "global_step": 12588, "epoch": 299} {"train_loss": -5.065979480743408, "global_step": 12589, "epoch": 299} {"train_loss": -5.070594787597656, "global_step": 12590, "epoch": 299} {"train_loss": -5.062582015991211, "global_step": 12591, "epoch": 299} {"train_loss": -5.11472749710083, "global_step": 12592, "epoch": 299} {"train_loss": -4.942321300506592, "global_step": 12593, "epoch": 299} {"train_loss": -5.056184768676758, "global_step": 12594, "epoch": 299} {"train_loss": -5.0565996170043945, "global_step": 12595, "epoch": 299} {"train_loss": -5.0395636558532715, "global_step": 12596, "epoch": 299} {"train_loss": -5.045060634613037, "global_step": 12597, "epoch": 299} {"train_loss": -4.96243953704834, "global_step": 12598, "epoch": 299} {"train_loss": -5.054759241285778, "global_step": 12599, "epoch": 299, "val_loss": 79242.171875} {"train_loss": -5.050714492797852, "global_step": 12600, "epoch": 300} {"train_loss": -5.1827850341796875, "global_step": 12601, "epoch": 300} {"train_loss": -5.0202484130859375, "global_step": 12602, "epoch": 300} {"train_loss": -5.066347122192383, "global_step": 12603, "epoch": 300} {"train_loss": -5.03856086730957, "global_step": 12604, "epoch": 300} {"train_loss": -5.15196418762207, "global_step": 12605, "epoch": 300} {"train_loss": -5.115391254425049, "global_step": 12606, "epoch": 300} {"train_loss": -5.045490264892578, "global_step": 12607, "epoch": 300} {"train_loss": -5.192324161529541, "global_step": 12608, "epoch": 300} {"train_loss": -5.096538543701172, "global_step": 12609, "epoch": 300} {"train_loss": -5.093278884887695, "global_step": 12610, "epoch": 300} {"train_loss": -5.175471305847168, "global_step": 12611, "epoch": 300} {"train_loss": -5.225879669189453, "global_step": 12612, "epoch": 300} {"train_loss": -5.052388668060303, "global_step": 12613, "epoch": 300} {"train_loss": -5.214130878448486, "global_step": 12614, "epoch": 300} {"train_loss": -5.076972007751465, "global_step": 12615, "epoch": 300} {"train_loss": -5.0029096603393555, "global_step": 12616, "epoch": 300} {"train_loss": -5.035211086273193, "global_step": 12617, "epoch": 300} {"train_loss": -5.152889251708984, "global_step": 12618, "epoch": 300} {"train_loss": -5.190646648406982, "global_step": 12619, "epoch": 300} {"train_loss": -5.216099739074707, "global_step": 12620, "epoch": 300} {"train_loss": -5.091766357421875, "global_step": 12621, "epoch": 300} {"train_loss": -5.107745170593262, "global_step": 12622, "epoch": 300} {"train_loss": -5.1569623947143555, "global_step": 12623, "epoch": 300} {"train_loss": -5.193335056304932, "global_step": 12624, "epoch": 300} {"train_loss": -5.19802188873291, "global_step": 12625, "epoch": 300} {"train_loss": -5.140650749206543, "global_step": 12626, "epoch": 300} {"train_loss": -5.189582824707031, "global_step": 12627, "epoch": 300} {"train_loss": -5.2423553466796875, "global_step": 12628, "epoch": 300} {"train_loss": -4.974747657775879, "global_step": 12629, "epoch": 300} {"train_loss": -5.186129093170166, "global_step": 12630, "epoch": 300} {"train_loss": -5.087040424346924, "global_step": 12631, "epoch": 300} {"train_loss": -5.162506580352783, "global_step": 12632, "epoch": 300} {"train_loss": -5.02984619140625, "global_step": 12633, "epoch": 300} {"train_loss": -5.063905715942383, "global_step": 12634, "epoch": 300} {"train_loss": -5.120997905731201, "global_step": 12635, "epoch": 300} {"train_loss": -5.166623115539551, "global_step": 12636, "epoch": 300} {"train_loss": -5.1257219314575195, "global_step": 12637, "epoch": 300} {"train_loss": -5.2330780029296875, "global_step": 12638, "epoch": 300} {"train_loss": -5.048933982849121, "global_step": 12639, "epoch": 300} {"train_loss": -4.958162307739258, "global_step": 12640, "epoch": 300} {"train_loss": -5.11764365150815, "global_step": 12641, "epoch": 300, "train/sim_max_reward_0": 0.3856584242489447, "train/sim_max_reward_1": 0.11745892542653562, "train/sim_max_reward_2": 0.2553194011945249, "train/sim_max_reward_3": 0.04172918737066105, "train/sim_max_reward_4": 0.24190608395547808, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4500000": 0.32943935577003675, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.1587760023573772, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.04528876879792907, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.4039533700709793, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.3163612195490487, "test/sim_max_reward_4500015": 0.02068400304565784, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.004249031229020703, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.5614369445327488, "test/sim_max_reward_4500022": 0.33035368716497726, "test/sim_max_reward_4500023": 0.5738031060989612, "test/sim_max_reward_4500024": 0.0781455179872621, "test/sim_max_reward_4500025": 0.24123209033178936, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.09757978428023686, "test/sim_max_reward_4500028": 0.6483697860362397, "test/sim_max_reward_4500029": 0.1382392035874872, "test/sim_max_reward_4500030": 0.1751176508209356, "test/sim_max_reward_4500031": 0.0474092174560433, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.042918425004986244, "test/sim_max_reward_4500034": 0.3637851109642093, "test/sim_max_reward_4500035": 0.5667206174176174, "test/sim_max_reward_4500036": 0.48368043212864753, "test/sim_max_reward_4500037": 0.24050710361129465, "test/sim_max_reward_4500038": 0.3178607800877572, "test/sim_max_reward_4500039": 0.10285289293167214, "test/sim_max_reward_4500040": 0.0, "test/sim_max_reward_4500041": 0.3184982285319475, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.4049808868280884, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.12596001799724207, "test/sim_max_reward_4500046": 0.07983069219241903, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.2058427969263886, "test/mean_score": 0.15512084482547936, "val_loss": 78916.0234375} {"train_loss": -5.280527114868164, "global_step": 12642, "epoch": 301} {"train_loss": -5.1501569747924805, "global_step": 12643, "epoch": 301} {"train_loss": -4.985682487487793, "global_step": 12644, "epoch": 301} {"train_loss": -5.012077331542969, "global_step": 12645, "epoch": 301} {"train_loss": -5.158818244934082, "global_step": 12646, "epoch": 301} {"train_loss": -5.158943176269531, "global_step": 12647, "epoch": 301} {"train_loss": -4.945037841796875, "global_step": 12648, "epoch": 301} {"train_loss": -5.351306438446045, "global_step": 12649, "epoch": 301} {"train_loss": -5.104417324066162, "global_step": 12650, "epoch": 301} {"train_loss": -5.1099853515625, "global_step": 12651, "epoch": 301} {"train_loss": -5.188872337341309, "global_step": 12652, "epoch": 301} {"train_loss": -5.168399810791016, "global_step": 12653, "epoch": 301} {"train_loss": -5.183479309082031, "global_step": 12654, "epoch": 301} {"train_loss": -5.067748546600342, "global_step": 12655, "epoch": 301} {"train_loss": -4.968881607055664, "global_step": 12656, "epoch": 301} {"train_loss": -5.153022766113281, "global_step": 12657, "epoch": 301} {"train_loss": -5.152955532073975, "global_step": 12658, "epoch": 301} {"train_loss": -5.020252227783203, "global_step": 12659, "epoch": 301} {"train_loss": -5.021707057952881, "global_step": 12660, "epoch": 301} {"train_loss": -5.070474624633789, "global_step": 12661, "epoch": 301} {"train_loss": -4.968044757843018, "global_step": 12662, "epoch": 301} {"train_loss": -5.023030757904053, "global_step": 12663, "epoch": 301} {"train_loss": -5.021860122680664, "global_step": 12664, "epoch": 301} {"train_loss": -5.076874732971191, "global_step": 12665, "epoch": 301} {"train_loss": -4.967467308044434, "global_step": 12666, "epoch": 301} {"train_loss": -5.057598114013672, "global_step": 12667, "epoch": 301} {"train_loss": -5.215388774871826, "global_step": 12668, "epoch": 301} {"train_loss": -5.134509086608887, "global_step": 12669, "epoch": 301} {"train_loss": -5.171169757843018, "global_step": 12670, "epoch": 301} {"train_loss": -4.982816696166992, "global_step": 12671, "epoch": 301} {"train_loss": -5.021170139312744, "global_step": 12672, "epoch": 301} {"train_loss": -5.091276168823242, "global_step": 12673, "epoch": 301} {"train_loss": -5.0656843185424805, "global_step": 12674, "epoch": 301} {"train_loss": -5.066110134124756, "global_step": 12675, "epoch": 301} {"train_loss": -4.868132591247559, "global_step": 12676, "epoch": 301} {"train_loss": -4.982029914855957, "global_step": 12677, "epoch": 301} {"train_loss": -5.095322608947754, "global_step": 12678, "epoch": 301} {"train_loss": -4.867692947387695, "global_step": 12679, "epoch": 301} {"train_loss": -5.128172874450684, "global_step": 12680, "epoch": 301} {"train_loss": -4.8167572021484375, "global_step": 12681, "epoch": 301} {"train_loss": -5.145010948181152, "global_step": 12682, "epoch": 301} {"train_loss": -5.0713192621866865, "global_step": 12683, "epoch": 301, "val_loss": 79150.625} {"train_loss": -4.99658203125, "global_step": 12684, "epoch": 302} {"train_loss": -5.037569522857666, "global_step": 12685, "epoch": 302} {"train_loss": -5.0921220779418945, "global_step": 12686, "epoch": 302} {"train_loss": -4.9323930740356445, "global_step": 12687, "epoch": 302} {"train_loss": -5.103003025054932, "global_step": 12688, "epoch": 302} {"train_loss": -5.052969455718994, "global_step": 12689, "epoch": 302} {"train_loss": -4.915184020996094, "global_step": 12690, "epoch": 302} {"train_loss": -5.038397789001465, "global_step": 12691, "epoch": 302} {"train_loss": -4.9078521728515625, "global_step": 12692, "epoch": 302} {"train_loss": -5.149984359741211, "global_step": 12693, "epoch": 302} {"train_loss": -4.9119553565979, "global_step": 12694, "epoch": 302} {"train_loss": -5.011837959289551, "global_step": 12695, "epoch": 302} {"train_loss": -5.146785736083984, "global_step": 12696, "epoch": 302} {"train_loss": -5.012274742126465, "global_step": 12697, "epoch": 302} {"train_loss": -5.151998043060303, "global_step": 12698, "epoch": 302} {"train_loss": -5.199855804443359, "global_step": 12699, "epoch": 302} {"train_loss": -5.153927803039551, "global_step": 12700, "epoch": 302} {"train_loss": -5.053295135498047, "global_step": 12701, "epoch": 302} {"train_loss": -5.170089244842529, "global_step": 12702, "epoch": 302} {"train_loss": -5.073781967163086, "global_step": 12703, "epoch": 302} {"train_loss": -5.102389812469482, "global_step": 12704, "epoch": 302} {"train_loss": -5.090494632720947, "global_step": 12705, "epoch": 302} {"train_loss": -5.1625471115112305, "global_step": 12706, "epoch": 302} {"train_loss": -5.089871883392334, "global_step": 12707, "epoch": 302} {"train_loss": -5.229954719543457, "global_step": 12708, "epoch": 302} {"train_loss": -5.2148356437683105, "global_step": 12709, "epoch": 302} {"train_loss": -5.150804042816162, "global_step": 12710, "epoch": 302} {"train_loss": -5.175601005554199, "global_step": 12711, "epoch": 302} {"train_loss": -5.123285293579102, "global_step": 12712, "epoch": 302} {"train_loss": -5.162294387817383, "global_step": 12713, "epoch": 302} {"train_loss": -5.131964683532715, "global_step": 12714, "epoch": 302} {"train_loss": -5.050675868988037, "global_step": 12715, "epoch": 302} {"train_loss": -4.976790428161621, "global_step": 12716, "epoch": 302} {"train_loss": -5.00288724899292, "global_step": 12717, "epoch": 302} {"train_loss": -5.097933292388916, "global_step": 12718, "epoch": 302} {"train_loss": -4.9554924964904785, "global_step": 12719, "epoch": 302} {"train_loss": -5.18866491317749, "global_step": 12720, "epoch": 302} {"train_loss": -5.063459873199463, "global_step": 12721, "epoch": 302} {"train_loss": -5.092866897583008, "global_step": 12722, "epoch": 302} {"train_loss": -5.192022323608398, "global_step": 12723, "epoch": 302} {"train_loss": -4.9727020263671875, "global_step": 12724, "epoch": 302} {"train_loss": -5.082035541534424, "global_step": 12725, "epoch": 302, "val_loss": 79320.4375} {"train_loss": -4.967472553253174, "global_step": 12726, "epoch": 303} {"train_loss": -5.07633113861084, "global_step": 12727, "epoch": 303} {"train_loss": -5.0043230056762695, "global_step": 12728, "epoch": 303} {"train_loss": -4.978041648864746, "global_step": 12729, "epoch": 303} {"train_loss": -5.025713920593262, "global_step": 12730, "epoch": 303} {"train_loss": -4.972405433654785, "global_step": 12731, "epoch": 303} {"train_loss": -5.029702186584473, "global_step": 12732, "epoch": 303} {"train_loss": -5.077280521392822, "global_step": 12733, "epoch": 303} {"train_loss": -5.107526779174805, "global_step": 12734, "epoch": 303} {"train_loss": -5.0880937576293945, "global_step": 12735, "epoch": 303} {"train_loss": -5.2067365646362305, "global_step": 12736, "epoch": 303} {"train_loss": -5.153328895568848, "global_step": 12737, "epoch": 303} {"train_loss": -5.141463756561279, "global_step": 12738, "epoch": 303} {"train_loss": -5.255855560302734, "global_step": 12739, "epoch": 303} {"train_loss": -5.034151077270508, "global_step": 12740, "epoch": 303} {"train_loss": -5.141510963439941, "global_step": 12741, "epoch": 303} {"train_loss": -4.935695171356201, "global_step": 12742, "epoch": 303} {"train_loss": -5.054963111877441, "global_step": 12743, "epoch": 303} {"train_loss": -5.149700164794922, "global_step": 12744, "epoch": 303} {"train_loss": -5.110267162322998, "global_step": 12745, "epoch": 303} {"train_loss": -5.07651424407959, "global_step": 12746, "epoch": 303} {"train_loss": -5.096242904663086, "global_step": 12747, "epoch": 303} {"train_loss": -5.140310764312744, "global_step": 12748, "epoch": 303} {"train_loss": -5.202243804931641, "global_step": 12749, "epoch": 303} {"train_loss": -5.341821193695068, "global_step": 12750, "epoch": 303} {"train_loss": -5.187743186950684, "global_step": 12751, "epoch": 303} {"train_loss": -5.105095863342285, "global_step": 12752, "epoch": 303} {"train_loss": -5.102353096008301, "global_step": 12753, "epoch": 303} {"train_loss": -5.029454231262207, "global_step": 12754, "epoch": 303} {"train_loss": -4.952136516571045, "global_step": 12755, "epoch": 303} {"train_loss": -5.237781047821045, "global_step": 12756, "epoch": 303} {"train_loss": -5.233994007110596, "global_step": 12757, "epoch": 303} {"train_loss": -5.245634078979492, "global_step": 12758, "epoch": 303} {"train_loss": -5.1047587394714355, "global_step": 12759, "epoch": 303} {"train_loss": -5.104362487792969, "global_step": 12760, "epoch": 303} {"train_loss": -5.08317756652832, "global_step": 12761, "epoch": 303} {"train_loss": -5.15305233001709, "global_step": 12762, "epoch": 303} {"train_loss": -5.177348613739014, "global_step": 12763, "epoch": 303} {"train_loss": -5.0595927238464355, "global_step": 12764, "epoch": 303} {"train_loss": -5.167782306671143, "global_step": 12765, "epoch": 303} {"train_loss": -5.161493301391602, "global_step": 12766, "epoch": 303} {"train_loss": -5.106672888710385, "global_step": 12767, "epoch": 303, "val_loss": 78911.609375} {"train_loss": -4.935595512390137, "global_step": 12768, "epoch": 304} {"train_loss": -5.111418724060059, "global_step": 12769, "epoch": 304} {"train_loss": -4.851788520812988, "global_step": 12770, "epoch": 304} {"train_loss": -5.263604164123535, "global_step": 12771, "epoch": 304} {"train_loss": -5.139634609222412, "global_step": 12772, "epoch": 304} {"train_loss": -5.134791374206543, "global_step": 12773, "epoch": 304} {"train_loss": -5.1279449462890625, "global_step": 12774, "epoch": 304} {"train_loss": -5.236270904541016, "global_step": 12775, "epoch": 304} {"train_loss": -5.081733703613281, "global_step": 12776, "epoch": 304} {"train_loss": -5.132704734802246, "global_step": 12777, "epoch": 304} {"train_loss": -5.324525356292725, "global_step": 12778, "epoch": 304} {"train_loss": -5.172842979431152, "global_step": 12779, "epoch": 304} {"train_loss": -5.111179351806641, "global_step": 12780, "epoch": 304} {"train_loss": -5.141979217529297, "global_step": 12781, "epoch": 304} {"train_loss": -5.141697406768799, "global_step": 12782, "epoch": 304} {"train_loss": -5.092169761657715, "global_step": 12783, "epoch": 304} {"train_loss": -5.021463394165039, "global_step": 12784, "epoch": 304} {"train_loss": -5.252040863037109, "global_step": 12785, "epoch": 304} {"train_loss": -5.110322952270508, "global_step": 12786, "epoch": 304} {"train_loss": -5.008634090423584, "global_step": 12787, "epoch": 304} {"train_loss": -5.17406702041626, "global_step": 12788, "epoch": 304} {"train_loss": -5.1203718185424805, "global_step": 12789, "epoch": 304} {"train_loss": -5.040136337280273, "global_step": 12790, "epoch": 304} {"train_loss": -5.235716819763184, "global_step": 12791, "epoch": 304} {"train_loss": -5.140895843505859, "global_step": 12792, "epoch": 304} {"train_loss": -5.152824401855469, "global_step": 12793, "epoch": 304} {"train_loss": -5.096900939941406, "global_step": 12794, "epoch": 304} {"train_loss": -5.155682563781738, "global_step": 12795, "epoch": 304} {"train_loss": -5.141312599182129, "global_step": 12796, "epoch": 304} {"train_loss": -5.117238998413086, "global_step": 12797, "epoch": 304} {"train_loss": -5.142948627471924, "global_step": 12798, "epoch": 304} {"train_loss": -4.953686714172363, "global_step": 12799, "epoch": 304} {"train_loss": -5.037003517150879, "global_step": 12800, "epoch": 304} {"train_loss": -5.240073204040527, "global_step": 12801, "epoch": 304} {"train_loss": -5.100736618041992, "global_step": 12802, "epoch": 304} {"train_loss": -5.072009086608887, "global_step": 12803, "epoch": 304} {"train_loss": -5.183998107910156, "global_step": 12804, "epoch": 304} {"train_loss": -5.111939907073975, "global_step": 12805, "epoch": 304} {"train_loss": -5.206595420837402, "global_step": 12806, "epoch": 304} {"train_loss": -5.160691261291504, "global_step": 12807, "epoch": 304} {"train_loss": -5.286508560180664, "global_step": 12808, "epoch": 304} {"train_loss": -5.128026769274757, "global_step": 12809, "epoch": 304, "val_loss": 79007.734375} {"train_loss": -4.961801052093506, "global_step": 12810, "epoch": 305} {"train_loss": -5.137879371643066, "global_step": 12811, "epoch": 305} {"train_loss": -5.275060176849365, "global_step": 12812, "epoch": 305} {"train_loss": -4.9850897789001465, "global_step": 12813, "epoch": 305} {"train_loss": -5.048918724060059, "global_step": 12814, "epoch": 305} {"train_loss": -5.117336273193359, "global_step": 12815, "epoch": 305} {"train_loss": -5.123679161071777, "global_step": 12816, "epoch": 305} {"train_loss": -5.133496284484863, "global_step": 12817, "epoch": 305} {"train_loss": -5.128525257110596, "global_step": 12818, "epoch": 305} {"train_loss": -5.104537487030029, "global_step": 12819, "epoch": 305} {"train_loss": -5.020771026611328, "global_step": 12820, "epoch": 305} {"train_loss": -5.155987739562988, "global_step": 12821, "epoch": 305} {"train_loss": -4.981987953186035, "global_step": 12822, "epoch": 305} {"train_loss": -5.176450252532959, "global_step": 12823, "epoch": 305} {"train_loss": -5.146401882171631, "global_step": 12824, "epoch": 305} {"train_loss": -5.145357131958008, "global_step": 12825, "epoch": 305} {"train_loss": -5.117108345031738, "global_step": 12826, "epoch": 305} {"train_loss": -5.094621658325195, "global_step": 12827, "epoch": 305} {"train_loss": -5.163284778594971, "global_step": 12828, "epoch": 305} {"train_loss": -5.061118125915527, "global_step": 12829, "epoch": 305} {"train_loss": -5.121540069580078, "global_step": 12830, "epoch": 305} {"train_loss": -5.133463382720947, "global_step": 12831, "epoch": 305} {"train_loss": -4.91287088394165, "global_step": 12832, "epoch": 305} {"train_loss": -5.2226104736328125, "global_step": 12833, "epoch": 305} {"train_loss": -5.028476238250732, "global_step": 12834, "epoch": 305} {"train_loss": -5.196000099182129, "global_step": 12835, "epoch": 305} {"train_loss": -5.05699348449707, "global_step": 12836, "epoch": 305} {"train_loss": -5.0837907791137695, "global_step": 12837, "epoch": 305} {"train_loss": -5.100874900817871, "global_step": 12838, "epoch": 305} {"train_loss": -5.111020565032959, "global_step": 12839, "epoch": 305} {"train_loss": -5.130758762359619, "global_step": 12840, "epoch": 305} {"train_loss": -5.208219528198242, "global_step": 12841, "epoch": 305} {"train_loss": -5.1176042556762695, "global_step": 12842, "epoch": 305} {"train_loss": -5.038235664367676, "global_step": 12843, "epoch": 305} {"train_loss": -5.015440940856934, "global_step": 12844, "epoch": 305} {"train_loss": -5.171627521514893, "global_step": 12845, "epoch": 305} {"train_loss": -5.227964401245117, "global_step": 12846, "epoch": 305} {"train_loss": -5.05848503112793, "global_step": 12847, "epoch": 305} {"train_loss": -5.1560845375061035, "global_step": 12848, "epoch": 305} {"train_loss": -5.144563674926758, "global_step": 12849, "epoch": 305} {"train_loss": -5.10444450378418, "global_step": 12850, "epoch": 305} {"train_loss": -5.109422263644991, "global_step": 12851, "epoch": 305, "val_loss": 80434.9453125} {"train_loss": -5.067943572998047, "global_step": 12852, "epoch": 306} {"train_loss": -5.0986409187316895, "global_step": 12853, "epoch": 306} {"train_loss": -5.244478702545166, "global_step": 12854, "epoch": 306} {"train_loss": -5.146453380584717, "global_step": 12855, "epoch": 306} {"train_loss": -5.172179222106934, "global_step": 12856, "epoch": 306} {"train_loss": -5.051434516906738, "global_step": 12857, "epoch": 306} {"train_loss": -5.226016521453857, "global_step": 12858, "epoch": 306} {"train_loss": -5.007352828979492, "global_step": 12859, "epoch": 306} {"train_loss": -5.044437408447266, "global_step": 12860, "epoch": 306} {"train_loss": -5.139003753662109, "global_step": 12861, "epoch": 306} {"train_loss": -5.1313323974609375, "global_step": 12862, "epoch": 306} {"train_loss": -5.17690372467041, "global_step": 12863, "epoch": 306} {"train_loss": -5.071494102478027, "global_step": 12864, "epoch": 306} {"train_loss": -5.1826043128967285, "global_step": 12865, "epoch": 306} {"train_loss": -5.07871150970459, "global_step": 12866, "epoch": 306} {"train_loss": -4.897512912750244, "global_step": 12867, "epoch": 306} {"train_loss": -5.051702499389648, "global_step": 12868, "epoch": 306} {"train_loss": -4.957020282745361, "global_step": 12869, "epoch": 306} {"train_loss": -5.027685165405273, "global_step": 12870, "epoch": 306} {"train_loss": -5.285673141479492, "global_step": 12871, "epoch": 306} {"train_loss": -5.034089088439941, "global_step": 12872, "epoch": 306} {"train_loss": -5.055954933166504, "global_step": 12873, "epoch": 306} {"train_loss": -5.285900115966797, "global_step": 12874, "epoch": 306} {"train_loss": -5.211629867553711, "global_step": 12875, "epoch": 306} {"train_loss": -5.226108074188232, "global_step": 12876, "epoch": 306} {"train_loss": -5.170034408569336, "global_step": 12877, "epoch": 306} {"train_loss": -5.1914896965026855, "global_step": 12878, "epoch": 306} {"train_loss": -5.046200752258301, "global_step": 12879, "epoch": 306} {"train_loss": -5.188175678253174, "global_step": 12880, "epoch": 306} {"train_loss": -5.181503772735596, "global_step": 12881, "epoch": 306} {"train_loss": -5.01954460144043, "global_step": 12882, "epoch": 306} {"train_loss": -5.193549156188965, "global_step": 12883, "epoch": 306} {"train_loss": -5.022202491760254, "global_step": 12884, "epoch": 306} {"train_loss": -4.9518327713012695, "global_step": 12885, "epoch": 306} {"train_loss": -5.180246829986572, "global_step": 12886, "epoch": 306} {"train_loss": -5.135458946228027, "global_step": 12887, "epoch": 306} {"train_loss": -5.106233596801758, "global_step": 12888, "epoch": 306} {"train_loss": -5.062596321105957, "global_step": 12889, "epoch": 306} {"train_loss": -5.007267475128174, "global_step": 12890, "epoch": 306} {"train_loss": -5.033108234405518, "global_step": 12891, "epoch": 306} {"train_loss": -4.90833854675293, "global_step": 12892, "epoch": 306} {"train_loss": -5.101322866621471, "global_step": 12893, "epoch": 306, "val_loss": 78109.6875} {"train_loss": -5.145888805389404, "global_step": 12894, "epoch": 307} {"train_loss": -5.235715389251709, "global_step": 12895, "epoch": 307} {"train_loss": -4.946113586425781, "global_step": 12896, "epoch": 307} {"train_loss": -5.135859966278076, "global_step": 12897, "epoch": 307} {"train_loss": -4.959529876708984, "global_step": 12898, "epoch": 307} {"train_loss": -5.091207981109619, "global_step": 12899, "epoch": 307} {"train_loss": -5.198465347290039, "global_step": 12900, "epoch": 307} {"train_loss": -5.035925388336182, "global_step": 12901, "epoch": 307} {"train_loss": -5.014437675476074, "global_step": 12902, "epoch": 307} {"train_loss": -5.038088321685791, "global_step": 12903, "epoch": 307} {"train_loss": -4.9705963134765625, "global_step": 12904, "epoch": 307} {"train_loss": -5.155691146850586, "global_step": 12905, "epoch": 307} {"train_loss": -5.228911399841309, "global_step": 12906, "epoch": 307} {"train_loss": -5.0576982498168945, "global_step": 12907, "epoch": 307} {"train_loss": -5.091691017150879, "global_step": 12908, "epoch": 307} {"train_loss": -5.16166877746582, "global_step": 12909, "epoch": 307} {"train_loss": -5.209556579589844, "global_step": 12910, "epoch": 307} {"train_loss": -5.272469520568848, "global_step": 12911, "epoch": 307} {"train_loss": -4.988987445831299, "global_step": 12912, "epoch": 307} {"train_loss": -5.061654090881348, "global_step": 12913, "epoch": 307} {"train_loss": -5.078598976135254, "global_step": 12914, "epoch": 307} {"train_loss": -5.141160011291504, "global_step": 12915, "epoch": 307} {"train_loss": -5.176246643066406, "global_step": 12916, "epoch": 307} {"train_loss": -5.089198112487793, "global_step": 12917, "epoch": 307} {"train_loss": -5.0208539962768555, "global_step": 12918, "epoch": 307} {"train_loss": -5.076411247253418, "global_step": 12919, "epoch": 307} {"train_loss": -5.042187213897705, "global_step": 12920, "epoch": 307} {"train_loss": -5.174924850463867, "global_step": 12921, "epoch": 307} {"train_loss": -5.093486785888672, "global_step": 12922, "epoch": 307} {"train_loss": -5.0831708908081055, "global_step": 12923, "epoch": 307} {"train_loss": -5.116840362548828, "global_step": 12924, "epoch": 307} {"train_loss": -5.047240257263184, "global_step": 12925, "epoch": 307} {"train_loss": -5.0331292152404785, "global_step": 12926, "epoch": 307} {"train_loss": -5.162685394287109, "global_step": 12927, "epoch": 307} {"train_loss": -5.19317626953125, "global_step": 12928, "epoch": 307} {"train_loss": -5.140887260437012, "global_step": 12929, "epoch": 307} {"train_loss": -5.168204307556152, "global_step": 12930, "epoch": 307} {"train_loss": -5.222006797790527, "global_step": 12931, "epoch": 307} {"train_loss": -5.169991970062256, "global_step": 12932, "epoch": 307} {"train_loss": -4.966642379760742, "global_step": 12933, "epoch": 307} {"train_loss": -5.1616058349609375, "global_step": 12934, "epoch": 307} {"train_loss": -5.104035048257737, "global_step": 12935, "epoch": 307, "val_loss": 78063.7421875} {"train_loss": -5.294818878173828, "global_step": 12936, "epoch": 308} {"train_loss": -5.239146709442139, "global_step": 12937, "epoch": 308} {"train_loss": -5.09583854675293, "global_step": 12938, "epoch": 308} {"train_loss": -5.210689067840576, "global_step": 12939, "epoch": 308} {"train_loss": -5.045449733734131, "global_step": 12940, "epoch": 308} {"train_loss": -5.198172569274902, "global_step": 12941, "epoch": 308} {"train_loss": -5.277684211730957, "global_step": 12942, "epoch": 308} {"train_loss": -5.115591049194336, "global_step": 12943, "epoch": 308} {"train_loss": -5.1577253341674805, "global_step": 12944, "epoch": 308} {"train_loss": -5.165637969970703, "global_step": 12945, "epoch": 308} {"train_loss": -5.117972373962402, "global_step": 12946, "epoch": 308} {"train_loss": -5.288989067077637, "global_step": 12947, "epoch": 308} {"train_loss": -5.063535690307617, "global_step": 12948, "epoch": 308} {"train_loss": -5.185826301574707, "global_step": 12949, "epoch": 308} {"train_loss": -5.042076587677002, "global_step": 12950, "epoch": 308} {"train_loss": -4.844945907592773, "global_step": 12951, "epoch": 308} {"train_loss": -5.159488677978516, "global_step": 12952, "epoch": 308} {"train_loss": -5.102173328399658, "global_step": 12953, "epoch": 308} {"train_loss": -5.154834747314453, "global_step": 12954, "epoch": 308} {"train_loss": -5.133028507232666, "global_step": 12955, "epoch": 308} {"train_loss": -5.130321979522705, "global_step": 12956, "epoch": 308} {"train_loss": -5.252493858337402, "global_step": 12957, "epoch": 308} {"train_loss": -5.016191482543945, "global_step": 12958, "epoch": 308} {"train_loss": -5.007357120513916, "global_step": 12959, "epoch": 308} {"train_loss": -5.061430931091309, "global_step": 12960, "epoch": 308} {"train_loss": -5.0117926597595215, "global_step": 12961, "epoch": 308} {"train_loss": -5.076920509338379, "global_step": 12962, "epoch": 308} {"train_loss": -5.208300590515137, "global_step": 12963, "epoch": 308} {"train_loss": -5.109621047973633, "global_step": 12964, "epoch": 308} {"train_loss": -5.069669723510742, "global_step": 12965, "epoch": 308} {"train_loss": -5.029352188110352, "global_step": 12966, "epoch": 308} {"train_loss": -5.104787826538086, "global_step": 12967, "epoch": 308} {"train_loss": -5.139718055725098, "global_step": 12968, "epoch": 308} {"train_loss": -4.940457344055176, "global_step": 12969, "epoch": 308} {"train_loss": -5.07760763168335, "global_step": 12970, "epoch": 308} {"train_loss": -5.104888916015625, "global_step": 12971, "epoch": 308} {"train_loss": -5.161525726318359, "global_step": 12972, "epoch": 308} {"train_loss": -5.11579704284668, "global_step": 12973, "epoch": 308} {"train_loss": -5.192744731903076, "global_step": 12974, "epoch": 308} {"train_loss": -5.08091926574707, "global_step": 12975, "epoch": 308} {"train_loss": -5.176375389099121, "global_step": 12976, "epoch": 308} {"train_loss": -5.12174882207598, "global_step": 12977, "epoch": 308, "val_loss": 80012.1953125} {"train_loss": -5.020165920257568, "global_step": 12978, "epoch": 309} {"train_loss": -5.117367744445801, "global_step": 12979, "epoch": 309} {"train_loss": -5.079061508178711, "global_step": 12980, "epoch": 309} {"train_loss": -5.124375820159912, "global_step": 12981, "epoch": 309} {"train_loss": -5.260611534118652, "global_step": 12982, "epoch": 309} {"train_loss": -5.215845108032227, "global_step": 12983, "epoch": 309} {"train_loss": -5.08364200592041, "global_step": 12984, "epoch": 309} {"train_loss": -5.269160747528076, "global_step": 12985, "epoch": 309} {"train_loss": -5.1382856369018555, "global_step": 12986, "epoch": 309} {"train_loss": -5.267646789550781, "global_step": 12987, "epoch": 309} {"train_loss": -5.039612770080566, "global_step": 12988, "epoch": 309} {"train_loss": -5.166970252990723, "global_step": 12989, "epoch": 309} {"train_loss": -5.198894500732422, "global_step": 12990, "epoch": 309} {"train_loss": -5.106695652008057, "global_step": 12991, "epoch": 309} {"train_loss": -5.220715522766113, "global_step": 12992, "epoch": 309} {"train_loss": -5.16316032409668, "global_step": 12993, "epoch": 309} {"train_loss": -5.239480972290039, "global_step": 12994, "epoch": 309} {"train_loss": -5.072983741760254, "global_step": 12995, "epoch": 309} {"train_loss": -5.009853363037109, "global_step": 12996, "epoch": 309} {"train_loss": -5.226389408111572, "global_step": 12997, "epoch": 309} {"train_loss": -5.099836349487305, "global_step": 12998, "epoch": 309} {"train_loss": -5.2155866622924805, "global_step": 12999, "epoch": 309} {"train_loss": -4.970644950866699, "global_step": 13000, "epoch": 309} {"train_loss": -4.929220676422119, "global_step": 13001, "epoch": 309} {"train_loss": -5.011319160461426, "global_step": 13002, "epoch": 309} {"train_loss": -4.996618270874023, "global_step": 13003, "epoch": 309} {"train_loss": -5.090249538421631, "global_step": 13004, "epoch": 309} {"train_loss": -5.176618576049805, "global_step": 13005, "epoch": 309} {"train_loss": -4.97398567199707, "global_step": 13006, "epoch": 309} {"train_loss": -5.029862403869629, "global_step": 13007, "epoch": 309} {"train_loss": -4.99884033203125, "global_step": 13008, "epoch": 309} {"train_loss": -5.071168899536133, "global_step": 13009, "epoch": 309} {"train_loss": -4.923441410064697, "global_step": 13010, "epoch": 309} {"train_loss": -5.085756301879883, "global_step": 13011, "epoch": 309} {"train_loss": -5.027773380279541, "global_step": 13012, "epoch": 309} {"train_loss": -5.040295124053955, "global_step": 13013, "epoch": 309} {"train_loss": -5.133428573608398, "global_step": 13014, "epoch": 309} {"train_loss": -4.984382629394531, "global_step": 13015, "epoch": 309} {"train_loss": -5.080099105834961, "global_step": 13016, "epoch": 309} {"train_loss": -5.1844048500061035, "global_step": 13017, "epoch": 309} {"train_loss": -5.0746307373046875, "global_step": 13018, "epoch": 309} {"train_loss": -5.10075010572161, "global_step": 13019, "epoch": 309, "val_loss": 78660.46875} {"train_loss": -5.088411331176758, "global_step": 13020, "epoch": 310} {"train_loss": -5.111874580383301, "global_step": 13021, "epoch": 310} {"train_loss": -4.984284400939941, "global_step": 13022, "epoch": 310} {"train_loss": -5.111443519592285, "global_step": 13023, "epoch": 310} {"train_loss": -5.126995086669922, "global_step": 13024, "epoch": 310} {"train_loss": -5.103745460510254, "global_step": 13025, "epoch": 310} {"train_loss": -5.0442423820495605, "global_step": 13026, "epoch": 310} {"train_loss": -5.110689163208008, "global_step": 13027, "epoch": 310} {"train_loss": -5.005238056182861, "global_step": 13028, "epoch": 310} {"train_loss": -5.06314754486084, "global_step": 13029, "epoch": 310} {"train_loss": -5.003375053405762, "global_step": 13030, "epoch": 310} {"train_loss": -5.090925216674805, "global_step": 13031, "epoch": 310} {"train_loss": -5.12455940246582, "global_step": 13032, "epoch": 310} {"train_loss": -5.152871131896973, "global_step": 13033, "epoch": 310} {"train_loss": -5.171955108642578, "global_step": 13034, "epoch": 310} {"train_loss": -4.980338096618652, "global_step": 13035, "epoch": 310} {"train_loss": -5.079122543334961, "global_step": 13036, "epoch": 310} {"train_loss": -5.186010360717773, "global_step": 13037, "epoch": 310} {"train_loss": -5.125952243804932, "global_step": 13038, "epoch": 310} {"train_loss": -5.15956974029541, "global_step": 13039, "epoch": 310} {"train_loss": -5.190942764282227, "global_step": 13040, "epoch": 310} {"train_loss": -5.121771335601807, "global_step": 13041, "epoch": 310} {"train_loss": -5.055232524871826, "global_step": 13042, "epoch": 310} {"train_loss": -5.181827545166016, "global_step": 13043, "epoch": 310} {"train_loss": -5.242208480834961, "global_step": 13044, "epoch": 310} {"train_loss": -5.118579864501953, "global_step": 13045, "epoch": 310} {"train_loss": -5.309323310852051, "global_step": 13046, "epoch": 310} {"train_loss": -4.995014190673828, "global_step": 13047, "epoch": 310} {"train_loss": -5.0592451095581055, "global_step": 13048, "epoch": 310} {"train_loss": -5.153502464294434, "global_step": 13049, "epoch": 310} {"train_loss": -5.115667819976807, "global_step": 13050, "epoch": 310} {"train_loss": -5.082228660583496, "global_step": 13051, "epoch": 310} {"train_loss": -5.128553867340088, "global_step": 13052, "epoch": 310} {"train_loss": -5.1625752449035645, "global_step": 13053, "epoch": 310} {"train_loss": -5.153530597686768, "global_step": 13054, "epoch": 310} {"train_loss": -5.324076175689697, "global_step": 13055, "epoch": 310} {"train_loss": -5.112565994262695, "global_step": 13056, "epoch": 310} {"train_loss": -5.146667003631592, "global_step": 13057, "epoch": 310} {"train_loss": -5.003242492675781, "global_step": 13058, "epoch": 310} {"train_loss": -5.2498393058776855, "global_step": 13059, "epoch": 310} {"train_loss": -5.1976447105407715, "global_step": 13060, "epoch": 310} {"train_loss": -5.1176499752771285, "global_step": 13061, "epoch": 310, "val_loss": 79008.1640625} {"train_loss": -5.1493425369262695, "global_step": 13062, "epoch": 311} {"train_loss": -5.209878921508789, "global_step": 13063, "epoch": 311} {"train_loss": -5.022364139556885, "global_step": 13064, "epoch": 311} {"train_loss": -4.950457572937012, "global_step": 13065, "epoch": 311} {"train_loss": -5.18282413482666, "global_step": 13066, "epoch": 311} {"train_loss": -5.023630619049072, "global_step": 13067, "epoch": 311} {"train_loss": -4.983062744140625, "global_step": 13068, "epoch": 311} {"train_loss": -5.215176582336426, "global_step": 13069, "epoch": 311} {"train_loss": -4.986148834228516, "global_step": 13070, "epoch": 311} {"train_loss": -4.985710144042969, "global_step": 13071, "epoch": 311} {"train_loss": -5.105378150939941, "global_step": 13072, "epoch": 311} {"train_loss": -5.008610248565674, "global_step": 13073, "epoch": 311} {"train_loss": -5.126882553100586, "global_step": 13074, "epoch": 311} {"train_loss": -5.173571586608887, "global_step": 13075, "epoch": 311} {"train_loss": -4.915915012359619, "global_step": 13076, "epoch": 311} {"train_loss": -5.202141284942627, "global_step": 13077, "epoch": 311} {"train_loss": -5.078649997711182, "global_step": 13078, "epoch": 311} {"train_loss": -5.068615913391113, "global_step": 13079, "epoch": 311} {"train_loss": -5.149435043334961, "global_step": 13080, "epoch": 311} {"train_loss": -5.182324409484863, "global_step": 13081, "epoch": 311} {"train_loss": -5.146695137023926, "global_step": 13082, "epoch": 311} {"train_loss": -5.082401275634766, "global_step": 13083, "epoch": 311} {"train_loss": -5.158844947814941, "global_step": 13084, "epoch": 311} {"train_loss": -5.0824737548828125, "global_step": 13085, "epoch": 311} {"train_loss": -5.14349365234375, "global_step": 13086, "epoch": 311} {"train_loss": -5.266093730926514, "global_step": 13087, "epoch": 311} {"train_loss": -5.1645331382751465, "global_step": 13088, "epoch": 311} {"train_loss": -5.124482154846191, "global_step": 13089, "epoch": 311} {"train_loss": -5.128604888916016, "global_step": 13090, "epoch": 311} {"train_loss": -5.213983535766602, "global_step": 13091, "epoch": 311} {"train_loss": -5.058188438415527, "global_step": 13092, "epoch": 311} {"train_loss": -5.1503190994262695, "global_step": 13093, "epoch": 311} {"train_loss": -4.978904724121094, "global_step": 13094, "epoch": 311} {"train_loss": -5.181332588195801, "global_step": 13095, "epoch": 311} {"train_loss": -5.117678642272949, "global_step": 13096, "epoch": 311} {"train_loss": -4.927142143249512, "global_step": 13097, "epoch": 311} {"train_loss": -5.114485263824463, "global_step": 13098, "epoch": 311} {"train_loss": -4.898913383483887, "global_step": 13099, "epoch": 311} {"train_loss": -4.895697593688965, "global_step": 13100, "epoch": 311} {"train_loss": -5.118497848510742, "global_step": 13101, "epoch": 311} {"train_loss": -4.991209030151367, "global_step": 13102, "epoch": 311} {"train_loss": -5.084052846545265, "global_step": 13103, "epoch": 311, "val_loss": 78754.4375} {"train_loss": -5.168734550476074, "global_step": 13104, "epoch": 312} {"train_loss": -4.980256080627441, "global_step": 13105, "epoch": 312} {"train_loss": -4.997358322143555, "global_step": 13106, "epoch": 312} {"train_loss": -5.1092376708984375, "global_step": 13107, "epoch": 312} {"train_loss": -5.056456089019775, "global_step": 13108, "epoch": 312} {"train_loss": -4.966609954833984, "global_step": 13109, "epoch": 312} {"train_loss": -5.061453342437744, "global_step": 13110, "epoch": 312} {"train_loss": -5.1491804122924805, "global_step": 13111, "epoch": 312} {"train_loss": -5.195147514343262, "global_step": 13112, "epoch": 312} {"train_loss": -5.010677337646484, "global_step": 13113, "epoch": 312} {"train_loss": -5.066390037536621, "global_step": 13114, "epoch": 312} {"train_loss": -5.097651958465576, "global_step": 13115, "epoch": 312} {"train_loss": -5.247803688049316, "global_step": 13116, "epoch": 312} {"train_loss": -5.173519134521484, "global_step": 13117, "epoch": 312} {"train_loss": -5.255393028259277, "global_step": 13118, "epoch": 312} {"train_loss": -4.974142074584961, "global_step": 13119, "epoch": 312} {"train_loss": -4.887175559997559, "global_step": 13120, "epoch": 312} {"train_loss": -5.138701438903809, "global_step": 13121, "epoch": 312} {"train_loss": -5.0637359619140625, "global_step": 13122, "epoch": 312} {"train_loss": -5.206161975860596, "global_step": 13123, "epoch": 312} {"train_loss": -5.086843490600586, "global_step": 13124, "epoch": 312} {"train_loss": -5.071436882019043, "global_step": 13125, "epoch": 312} {"train_loss": -5.183187484741211, "global_step": 13126, "epoch": 312} {"train_loss": -5.118886947631836, "global_step": 13127, "epoch": 312} {"train_loss": -5.086765289306641, "global_step": 13128, "epoch": 312} {"train_loss": -5.147331237792969, "global_step": 13129, "epoch": 312} {"train_loss": -5.072809219360352, "global_step": 13130, "epoch": 312} {"train_loss": -5.11494255065918, "global_step": 13131, "epoch": 312} {"train_loss": -5.093996524810791, "global_step": 13132, "epoch": 312} {"train_loss": -5.063292980194092, "global_step": 13133, "epoch": 312} {"train_loss": -5.2186479568481445, "global_step": 13134, "epoch": 312} {"train_loss": -4.957075595855713, "global_step": 13135, "epoch": 312} {"train_loss": -5.019992828369141, "global_step": 13136, "epoch": 312} {"train_loss": -5.273883819580078, "global_step": 13137, "epoch": 312} {"train_loss": -5.114129066467285, "global_step": 13138, "epoch": 312} {"train_loss": -5.191714286804199, "global_step": 13139, "epoch": 312} {"train_loss": -5.036504745483398, "global_step": 13140, "epoch": 312} {"train_loss": -5.142389297485352, "global_step": 13141, "epoch": 312} {"train_loss": -5.135008811950684, "global_step": 13142, "epoch": 312} {"train_loss": -5.104596138000488, "global_step": 13143, "epoch": 312} {"train_loss": -5.168745517730713, "global_step": 13144, "epoch": 312} {"train_loss": -5.104440053304036, "global_step": 13145, "epoch": 312, "val_loss": 79890.1015625} {"train_loss": -5.105275630950928, "global_step": 13146, "epoch": 313} {"train_loss": -5.154724597930908, "global_step": 13147, "epoch": 313} {"train_loss": -5.171873092651367, "global_step": 13148, "epoch": 313} {"train_loss": -5.077176570892334, "global_step": 13149, "epoch": 313} {"train_loss": -5.20527458190918, "global_step": 13150, "epoch": 313} {"train_loss": -5.070865154266357, "global_step": 13151, "epoch": 313} {"train_loss": -5.203180313110352, "global_step": 13152, "epoch": 313} {"train_loss": -5.012895107269287, "global_step": 13153, "epoch": 313} {"train_loss": -5.142275810241699, "global_step": 13154, "epoch": 313} {"train_loss": -5.0653977394104, "global_step": 13155, "epoch": 313} {"train_loss": -5.1162214279174805, "global_step": 13156, "epoch": 313} {"train_loss": -5.149040222167969, "global_step": 13157, "epoch": 313} {"train_loss": -5.232497215270996, "global_step": 13158, "epoch": 313} {"train_loss": -5.184811115264893, "global_step": 13159, "epoch": 313} {"train_loss": -5.203981876373291, "global_step": 13160, "epoch": 313} {"train_loss": -5.156085968017578, "global_step": 13161, "epoch": 313} {"train_loss": -5.063693046569824, "global_step": 13162, "epoch": 313} {"train_loss": -5.192193984985352, "global_step": 13163, "epoch": 313} {"train_loss": -4.979004383087158, "global_step": 13164, "epoch": 313} {"train_loss": -5.20562219619751, "global_step": 13165, "epoch": 313} {"train_loss": -5.027058124542236, "global_step": 13166, "epoch": 313} {"train_loss": -5.005906105041504, "global_step": 13167, "epoch": 313} {"train_loss": -4.954138278961182, "global_step": 13168, "epoch": 313} {"train_loss": -5.239473342895508, "global_step": 13169, "epoch": 313} {"train_loss": -4.8605499267578125, "global_step": 13170, "epoch": 313} {"train_loss": -5.041078090667725, "global_step": 13171, "epoch": 313} {"train_loss": -5.205904006958008, "global_step": 13172, "epoch": 313} {"train_loss": -4.915791988372803, "global_step": 13173, "epoch": 313} {"train_loss": -5.188311576843262, "global_step": 13174, "epoch": 313} {"train_loss": -5.107625961303711, "global_step": 13175, "epoch": 313} {"train_loss": -5.094874382019043, "global_step": 13176, "epoch": 313} {"train_loss": -5.136112213134766, "global_step": 13177, "epoch": 313} {"train_loss": -5.09374475479126, "global_step": 13178, "epoch": 313} {"train_loss": -5.156569480895996, "global_step": 13179, "epoch": 313} {"train_loss": -5.144103050231934, "global_step": 13180, "epoch": 313} {"train_loss": -5.216620445251465, "global_step": 13181, "epoch": 313} {"train_loss": -5.233262062072754, "global_step": 13182, "epoch": 313} {"train_loss": -5.055483818054199, "global_step": 13183, "epoch": 313} {"train_loss": -4.951929092407227, "global_step": 13184, "epoch": 313} {"train_loss": -5.100973129272461, "global_step": 13185, "epoch": 313} {"train_loss": -5.292905807495117, "global_step": 13186, "epoch": 313} {"train_loss": -5.115140165601458, "global_step": 13187, "epoch": 313, "val_loss": 78950.40625} {"train_loss": -5.148181915283203, "global_step": 13188, "epoch": 314} {"train_loss": -5.152927398681641, "global_step": 13189, "epoch": 314} {"train_loss": -5.094865798950195, "global_step": 13190, "epoch": 314} {"train_loss": -5.129364967346191, "global_step": 13191, "epoch": 314} {"train_loss": -5.18491268157959, "global_step": 13192, "epoch": 314} {"train_loss": -5.255500793457031, "global_step": 13193, "epoch": 314} {"train_loss": -5.046782493591309, "global_step": 13194, "epoch": 314} {"train_loss": -5.198958396911621, "global_step": 13195, "epoch": 314} {"train_loss": -5.277666091918945, "global_step": 13196, "epoch": 314} {"train_loss": -4.990758895874023, "global_step": 13197, "epoch": 314} {"train_loss": -5.034998893737793, "global_step": 13198, "epoch": 314} {"train_loss": -5.126332759857178, "global_step": 13199, "epoch": 314} {"train_loss": -5.132033824920654, "global_step": 13200, "epoch": 314} {"train_loss": -5.126164436340332, "global_step": 13201, "epoch": 314} {"train_loss": -5.170808792114258, "global_step": 13202, "epoch": 314} {"train_loss": -5.0913238525390625, "global_step": 13203, "epoch": 314} {"train_loss": -5.232342720031738, "global_step": 13204, "epoch": 314} {"train_loss": -5.210683345794678, "global_step": 13205, "epoch": 314} {"train_loss": -5.181821823120117, "global_step": 13206, "epoch": 314} {"train_loss": -5.180554389953613, "global_step": 13207, "epoch": 314} {"train_loss": -5.236988067626953, "global_step": 13208, "epoch": 314} {"train_loss": -5.209185600280762, "global_step": 13209, "epoch": 314} {"train_loss": -5.09700870513916, "global_step": 13210, "epoch": 314} {"train_loss": -5.231595516204834, "global_step": 13211, "epoch": 314} {"train_loss": -5.174261093139648, "global_step": 13212, "epoch": 314} {"train_loss": -5.04443883895874, "global_step": 13213, "epoch": 314} {"train_loss": -5.161526203155518, "global_step": 13214, "epoch": 314} {"train_loss": -5.0563836097717285, "global_step": 13215, "epoch": 314} {"train_loss": -5.368356227874756, "global_step": 13216, "epoch": 314} {"train_loss": -5.136615753173828, "global_step": 13217, "epoch": 314} {"train_loss": -5.121321678161621, "global_step": 13218, "epoch": 314} {"train_loss": -5.163434982299805, "global_step": 13219, "epoch": 314} {"train_loss": -5.023995399475098, "global_step": 13220, "epoch": 314} {"train_loss": -5.218618392944336, "global_step": 13221, "epoch": 314} {"train_loss": -5.144537925720215, "global_step": 13222, "epoch": 314} {"train_loss": -4.985140800476074, "global_step": 13223, "epoch": 314} {"train_loss": -5.144519805908203, "global_step": 13224, "epoch": 314} {"train_loss": -5.187022686004639, "global_step": 13225, "epoch": 314} {"train_loss": -5.149909019470215, "global_step": 13226, "epoch": 314} {"train_loss": -5.11051082611084, "global_step": 13227, "epoch": 314} {"train_loss": -5.065878391265869, "global_step": 13228, "epoch": 314} {"train_loss": -5.147832677477882, "global_step": 13229, "epoch": 314, "val_loss": 79962.9921875} {"train_loss": -5.059781074523926, "global_step": 13230, "epoch": 315} {"train_loss": -5.1643147468566895, "global_step": 13231, "epoch": 315} {"train_loss": -4.983954906463623, "global_step": 13232, "epoch": 315} {"train_loss": -5.0302414894104, "global_step": 13233, "epoch": 315} {"train_loss": -4.985006809234619, "global_step": 13234, "epoch": 315} {"train_loss": -4.854179382324219, "global_step": 13235, "epoch": 315} {"train_loss": -5.017169952392578, "global_step": 13236, "epoch": 315} {"train_loss": -5.251395225524902, "global_step": 13237, "epoch": 315} {"train_loss": -5.05855655670166, "global_step": 13238, "epoch": 315} {"train_loss": -5.063821792602539, "global_step": 13239, "epoch": 315} {"train_loss": -4.8487019538879395, "global_step": 13240, "epoch": 315} {"train_loss": -5.052794933319092, "global_step": 13241, "epoch": 315} {"train_loss": -4.865133285522461, "global_step": 13242, "epoch": 315} {"train_loss": -5.076242446899414, "global_step": 13243, "epoch": 315} {"train_loss": -4.979524612426758, "global_step": 13244, "epoch": 315} {"train_loss": -4.88556432723999, "global_step": 13245, "epoch": 315} {"train_loss": -5.078273296356201, "global_step": 13246, "epoch": 315} {"train_loss": -5.062819480895996, "global_step": 13247, "epoch": 315} {"train_loss": -5.131958484649658, "global_step": 13248, "epoch": 315} {"train_loss": -5.202127456665039, "global_step": 13249, "epoch": 315} {"train_loss": -5.184092998504639, "global_step": 13250, "epoch": 315} {"train_loss": -5.064079761505127, "global_step": 13251, "epoch": 315} {"train_loss": -5.080183506011963, "global_step": 13252, "epoch": 315} {"train_loss": -5.160128116607666, "global_step": 13253, "epoch": 315} {"train_loss": -5.142569541931152, "global_step": 13254, "epoch": 315} {"train_loss": -5.135336875915527, "global_step": 13255, "epoch": 315} {"train_loss": -5.157658576965332, "global_step": 13256, "epoch": 315} {"train_loss": -5.166038513183594, "global_step": 13257, "epoch": 315} {"train_loss": -5.201493740081787, "global_step": 13258, "epoch": 315} {"train_loss": -5.113442420959473, "global_step": 13259, "epoch": 315} {"train_loss": -5.060919761657715, "global_step": 13260, "epoch": 315} {"train_loss": -5.1541218757629395, "global_step": 13261, "epoch": 315} {"train_loss": -5.260766983032227, "global_step": 13262, "epoch": 315} {"train_loss": -5.109330177307129, "global_step": 13263, "epoch": 315} {"train_loss": -5.153308391571045, "global_step": 13264, "epoch": 315} {"train_loss": -5.282864570617676, "global_step": 13265, "epoch": 315} {"train_loss": -5.148344993591309, "global_step": 13266, "epoch": 315} {"train_loss": -5.17496395111084, "global_step": 13267, "epoch": 315} {"train_loss": -5.282275199890137, "global_step": 13268, "epoch": 315} {"train_loss": -5.181100845336914, "global_step": 13269, "epoch": 315} {"train_loss": -5.052494049072266, "global_step": 13270, "epoch": 315} {"train_loss": -5.096918276378086, "global_step": 13271, "epoch": 315, "val_loss": 78920.640625} {"train_loss": -5.0405426025390625, "global_step": 13272, "epoch": 316} {"train_loss": -5.218596458435059, "global_step": 13273, "epoch": 316} {"train_loss": -5.037674903869629, "global_step": 13274, "epoch": 316} {"train_loss": -5.111616134643555, "global_step": 13275, "epoch": 316} {"train_loss": -5.185879230499268, "global_step": 13276, "epoch": 316} {"train_loss": -5.04669189453125, "global_step": 13277, "epoch": 316} {"train_loss": -4.936699867248535, "global_step": 13278, "epoch": 316} {"train_loss": -4.912575721740723, "global_step": 13279, "epoch": 316} {"train_loss": -4.991663932800293, "global_step": 13280, "epoch": 316} {"train_loss": -5.015698432922363, "global_step": 13281, "epoch": 316} {"train_loss": -5.086905479431152, "global_step": 13282, "epoch": 316} {"train_loss": -4.997347831726074, "global_step": 13283, "epoch": 316} {"train_loss": -5.138940811157227, "global_step": 13284, "epoch": 316} {"train_loss": -5.18721866607666, "global_step": 13285, "epoch": 316} {"train_loss": -5.114256858825684, "global_step": 13286, "epoch": 316} {"train_loss": -5.002300262451172, "global_step": 13287, "epoch": 316} {"train_loss": -5.078218460083008, "global_step": 13288, "epoch": 316} {"train_loss": -5.100185871124268, "global_step": 13289, "epoch": 316} {"train_loss": -5.124682426452637, "global_step": 13290, "epoch": 316} {"train_loss": -5.1263747215271, "global_step": 13291, "epoch": 316} {"train_loss": -5.2790327072143555, "global_step": 13292, "epoch": 316} {"train_loss": -5.0836334228515625, "global_step": 13293, "epoch": 316} {"train_loss": -5.172353744506836, "global_step": 13294, "epoch": 316} {"train_loss": -5.173872947692871, "global_step": 13295, "epoch": 316} {"train_loss": -5.182993412017822, "global_step": 13296, "epoch": 316} {"train_loss": -5.1697468757629395, "global_step": 13297, "epoch": 316} {"train_loss": -5.245359897613525, "global_step": 13298, "epoch": 316} {"train_loss": -5.092166900634766, "global_step": 13299, "epoch": 316} {"train_loss": -5.20099401473999, "global_step": 13300, "epoch": 316} {"train_loss": -5.198607921600342, "global_step": 13301, "epoch": 316} {"train_loss": -5.183443069458008, "global_step": 13302, "epoch": 316} {"train_loss": -5.243623733520508, "global_step": 13303, "epoch": 316} {"train_loss": -5.263924598693848, "global_step": 13304, "epoch": 316} {"train_loss": -5.096283435821533, "global_step": 13305, "epoch": 316} {"train_loss": -5.034544944763184, "global_step": 13306, "epoch": 316} {"train_loss": -5.133753776550293, "global_step": 13307, "epoch": 316} {"train_loss": -5.121878623962402, "global_step": 13308, "epoch": 316} {"train_loss": -5.108516693115234, "global_step": 13309, "epoch": 316} {"train_loss": -5.16851806640625, "global_step": 13310, "epoch": 316} {"train_loss": -5.207393646240234, "global_step": 13311, "epoch": 316} {"train_loss": -5.172919750213623, "global_step": 13312, "epoch": 316} {"train_loss": -5.116505191439674, "global_step": 13313, "epoch": 316, "val_loss": 79092.7109375} {"train_loss": -5.0842390060424805, "global_step": 13314, "epoch": 317} {"train_loss": -4.9809465408325195, "global_step": 13315, "epoch": 317} {"train_loss": -5.075437545776367, "global_step": 13316, "epoch": 317} {"train_loss": -5.1131439208984375, "global_step": 13317, "epoch": 317} {"train_loss": -5.059994697570801, "global_step": 13318, "epoch": 317} {"train_loss": -5.351131439208984, "global_step": 13319, "epoch": 317} {"train_loss": -4.9568657875061035, "global_step": 13320, "epoch": 317} {"train_loss": -5.20414924621582, "global_step": 13321, "epoch": 317} {"train_loss": -5.197808265686035, "global_step": 13322, "epoch": 317} {"train_loss": -5.056334495544434, "global_step": 13323, "epoch": 317} {"train_loss": -5.120765686035156, "global_step": 13324, "epoch": 317} {"train_loss": -5.14427375793457, "global_step": 13325, "epoch": 317} {"train_loss": -5.078089237213135, "global_step": 13326, "epoch": 317} {"train_loss": -5.0970659255981445, "global_step": 13327, "epoch": 317} {"train_loss": -5.334650039672852, "global_step": 13328, "epoch": 317} {"train_loss": -5.236956596374512, "global_step": 13329, "epoch": 317} {"train_loss": -5.137762069702148, "global_step": 13330, "epoch": 317} {"train_loss": -5.223562240600586, "global_step": 13331, "epoch": 317} {"train_loss": -4.895508766174316, "global_step": 13332, "epoch": 317} {"train_loss": -5.168309211730957, "global_step": 13333, "epoch": 317} {"train_loss": -5.142891883850098, "global_step": 13334, "epoch": 317} {"train_loss": -5.107783317565918, "global_step": 13335, "epoch": 317} {"train_loss": -5.113071918487549, "global_step": 13336, "epoch": 317} {"train_loss": -5.027044296264648, "global_step": 13337, "epoch": 317} {"train_loss": -5.226222991943359, "global_step": 13338, "epoch": 317} {"train_loss": -5.003835678100586, "global_step": 13339, "epoch": 317} {"train_loss": -5.290739059448242, "global_step": 13340, "epoch": 317} {"train_loss": -5.12340784072876, "global_step": 13341, "epoch": 317} {"train_loss": -5.0175628662109375, "global_step": 13342, "epoch": 317} {"train_loss": -5.127190589904785, "global_step": 13343, "epoch": 317} {"train_loss": -5.2157392501831055, "global_step": 13344, "epoch": 317} {"train_loss": -5.185604572296143, "global_step": 13345, "epoch": 317} {"train_loss": -5.2803192138671875, "global_step": 13346, "epoch": 317} {"train_loss": -5.11650276184082, "global_step": 13347, "epoch": 317} {"train_loss": -5.274308204650879, "global_step": 13348, "epoch": 317} {"train_loss": -5.191681385040283, "global_step": 13349, "epoch": 317} {"train_loss": -5.212706565856934, "global_step": 13350, "epoch": 317} {"train_loss": -5.214690208435059, "global_step": 13351, "epoch": 317} {"train_loss": -5.249526023864746, "global_step": 13352, "epoch": 317} {"train_loss": -5.139700412750244, "global_step": 13353, "epoch": 317} {"train_loss": -5.1410627365112305, "global_step": 13354, "epoch": 317} {"train_loss": -5.1443844976879305, "global_step": 13355, "epoch": 317, "val_loss": 79331.1953125} {"train_loss": -5.169078826904297, "global_step": 13356, "epoch": 318} {"train_loss": -5.266031265258789, "global_step": 13357, "epoch": 318} {"train_loss": -5.3343353271484375, "global_step": 13358, "epoch": 318} {"train_loss": -5.024350166320801, "global_step": 13359, "epoch": 318} {"train_loss": -5.035427570343018, "global_step": 13360, "epoch": 318} {"train_loss": -5.165610313415527, "global_step": 13361, "epoch": 318} {"train_loss": -5.1235127449035645, "global_step": 13362, "epoch": 318} {"train_loss": -5.319045066833496, "global_step": 13363, "epoch": 318} {"train_loss": -5.087107181549072, "global_step": 13364, "epoch": 318} {"train_loss": -5.090343475341797, "global_step": 13365, "epoch": 318} {"train_loss": -5.140676021575928, "global_step": 13366, "epoch": 318} {"train_loss": -5.150568008422852, "global_step": 13367, "epoch": 318} {"train_loss": -5.090027809143066, "global_step": 13368, "epoch": 318} {"train_loss": -5.2932820320129395, "global_step": 13369, "epoch": 318} {"train_loss": -5.108220100402832, "global_step": 13370, "epoch": 318} {"train_loss": -5.040589809417725, "global_step": 13371, "epoch": 318} {"train_loss": -5.170648574829102, "global_step": 13372, "epoch": 318} {"train_loss": -5.0008320808410645, "global_step": 13373, "epoch": 318} {"train_loss": -5.017273902893066, "global_step": 13374, "epoch": 318} {"train_loss": -5.25866174697876, "global_step": 13375, "epoch": 318} {"train_loss": -5.103545188903809, "global_step": 13376, "epoch": 318} {"train_loss": -4.8758368492126465, "global_step": 13377, "epoch": 318} {"train_loss": -5.116014003753662, "global_step": 13378, "epoch": 318} {"train_loss": -4.959781169891357, "global_step": 13379, "epoch": 318} {"train_loss": -4.986861705780029, "global_step": 13380, "epoch": 318} {"train_loss": -4.950848579406738, "global_step": 13381, "epoch": 318} {"train_loss": -5.27824592590332, "global_step": 13382, "epoch": 318} {"train_loss": -4.96138858795166, "global_step": 13383, "epoch": 318} {"train_loss": -5.192399024963379, "global_step": 13384, "epoch": 318} {"train_loss": -5.170151233673096, "global_step": 13385, "epoch": 318} {"train_loss": -5.020963191986084, "global_step": 13386, "epoch": 318} {"train_loss": -5.199126243591309, "global_step": 13387, "epoch": 318} {"train_loss": -5.182886600494385, "global_step": 13388, "epoch": 318} {"train_loss": -5.04609489440918, "global_step": 13389, "epoch": 318} {"train_loss": -5.17972469329834, "global_step": 13390, "epoch": 318} {"train_loss": -5.0848798751831055, "global_step": 13391, "epoch": 318} {"train_loss": -5.194527626037598, "global_step": 13392, "epoch": 318} {"train_loss": -5.145604610443115, "global_step": 13393, "epoch": 318} {"train_loss": -5.167705535888672, "global_step": 13394, "epoch": 318} {"train_loss": -5.052416801452637, "global_step": 13395, "epoch": 318} {"train_loss": -5.051609039306641, "global_step": 13396, "epoch": 318} {"train_loss": -5.1181471574874156, "global_step": 13397, "epoch": 318, "val_loss": 79061.4765625} {"train_loss": -4.965653419494629, "global_step": 13398, "epoch": 319} {"train_loss": -5.126682758331299, "global_step": 13399, "epoch": 319} {"train_loss": -5.2394866943359375, "global_step": 13400, "epoch": 319} {"train_loss": -5.175199508666992, "global_step": 13401, "epoch": 319} {"train_loss": -5.207653045654297, "global_step": 13402, "epoch": 319} {"train_loss": -5.219417572021484, "global_step": 13403, "epoch": 319} {"train_loss": -5.042966365814209, "global_step": 13404, "epoch": 319} {"train_loss": -5.186683654785156, "global_step": 13405, "epoch": 319} {"train_loss": -5.128756046295166, "global_step": 13406, "epoch": 319} {"train_loss": -5.097342491149902, "global_step": 13407, "epoch": 319} {"train_loss": -5.090733528137207, "global_step": 13408, "epoch": 319} {"train_loss": -5.061143398284912, "global_step": 13409, "epoch": 319} {"train_loss": -5.011580944061279, "global_step": 13410, "epoch": 319} {"train_loss": -5.175529479980469, "global_step": 13411, "epoch": 319} {"train_loss": -5.1776123046875, "global_step": 13412, "epoch": 319} {"train_loss": -5.26696252822876, "global_step": 13413, "epoch": 319} {"train_loss": -5.090035438537598, "global_step": 13414, "epoch": 319} {"train_loss": -5.030945301055908, "global_step": 13415, "epoch": 319} {"train_loss": -5.080258369445801, "global_step": 13416, "epoch": 319} {"train_loss": -5.080080986022949, "global_step": 13417, "epoch": 319} {"train_loss": -5.433619499206543, "global_step": 13418, "epoch": 319} {"train_loss": -5.116542816162109, "global_step": 13419, "epoch": 319} {"train_loss": -5.263714790344238, "global_step": 13420, "epoch": 319} {"train_loss": -5.12957763671875, "global_step": 13421, "epoch": 319} {"train_loss": -5.117695331573486, "global_step": 13422, "epoch": 319} {"train_loss": -5.222408294677734, "global_step": 13423, "epoch": 319} {"train_loss": -4.9640278816223145, "global_step": 13424, "epoch": 319} {"train_loss": -5.275172710418701, "global_step": 13425, "epoch": 319} {"train_loss": -4.960492134094238, "global_step": 13426, "epoch": 319} {"train_loss": -5.225493907928467, "global_step": 13427, "epoch": 319} {"train_loss": -5.159171104431152, "global_step": 13428, "epoch": 319} {"train_loss": -5.311225891113281, "global_step": 13429, "epoch": 319} {"train_loss": -5.212297439575195, "global_step": 13430, "epoch": 319} {"train_loss": -5.111321449279785, "global_step": 13431, "epoch": 319} {"train_loss": -5.081355571746826, "global_step": 13432, "epoch": 319} {"train_loss": -5.22001314163208, "global_step": 13433, "epoch": 319} {"train_loss": -5.120802879333496, "global_step": 13434, "epoch": 319} {"train_loss": -5.080844879150391, "global_step": 13435, "epoch": 319} {"train_loss": -5.046374797821045, "global_step": 13436, "epoch": 319} {"train_loss": -5.137888431549072, "global_step": 13437, "epoch": 319} {"train_loss": -5.018510818481445, "global_step": 13438, "epoch": 319} {"train_loss": -5.1399796690259665, "global_step": 13439, "epoch": 319, "val_loss": 80178.5859375} {"train_loss": -5.133347034454346, "global_step": 13440, "epoch": 320} {"train_loss": -5.021933555603027, "global_step": 13441, "epoch": 320} {"train_loss": -5.135312080383301, "global_step": 13442, "epoch": 320} {"train_loss": -5.210582733154297, "global_step": 13443, "epoch": 320} {"train_loss": -5.088230133056641, "global_step": 13444, "epoch": 320} {"train_loss": -5.011579990386963, "global_step": 13445, "epoch": 320} {"train_loss": -5.133937835693359, "global_step": 13446, "epoch": 320} {"train_loss": -5.200972557067871, "global_step": 13447, "epoch": 320} {"train_loss": -5.076591491699219, "global_step": 13448, "epoch": 320} {"train_loss": -5.204697608947754, "global_step": 13449, "epoch": 320} {"train_loss": -4.797689437866211, "global_step": 13450, "epoch": 320} {"train_loss": -5.015151023864746, "global_step": 13451, "epoch": 320} {"train_loss": -4.951326370239258, "global_step": 13452, "epoch": 320} {"train_loss": -5.0682525634765625, "global_step": 13453, "epoch": 320} {"train_loss": -5.012862205505371, "global_step": 13454, "epoch": 320} {"train_loss": -5.003851890563965, "global_step": 13455, "epoch": 320} {"train_loss": -5.055971622467041, "global_step": 13456, "epoch": 320} {"train_loss": -4.921766757965088, "global_step": 13457, "epoch": 320} {"train_loss": -5.185469150543213, "global_step": 13458, "epoch": 320} {"train_loss": -5.0307207107543945, "global_step": 13459, "epoch": 320} {"train_loss": -5.10189962387085, "global_step": 13460, "epoch": 320} {"train_loss": -5.1974029541015625, "global_step": 13461, "epoch": 320} {"train_loss": -5.019896507263184, "global_step": 13462, "epoch": 320} {"train_loss": -5.134326934814453, "global_step": 13463, "epoch": 320} {"train_loss": -5.146634578704834, "global_step": 13464, "epoch": 320} {"train_loss": -5.162940979003906, "global_step": 13465, "epoch": 320} {"train_loss": -5.078017234802246, "global_step": 13466, "epoch": 320} {"train_loss": -5.2026519775390625, "global_step": 13467, "epoch": 320} {"train_loss": -5.1432671546936035, "global_step": 13468, "epoch": 320} {"train_loss": -5.182900428771973, "global_step": 13469, "epoch": 320} {"train_loss": -5.093778133392334, "global_step": 13470, "epoch": 320} {"train_loss": -5.213010787963867, "global_step": 13471, "epoch": 320} {"train_loss": -5.058030128479004, "global_step": 13472, "epoch": 320} {"train_loss": -5.006137371063232, "global_step": 13473, "epoch": 320} {"train_loss": -5.1675944328308105, "global_step": 13474, "epoch": 320} {"train_loss": -5.163895606994629, "global_step": 13475, "epoch": 320} {"train_loss": -5.208234786987305, "global_step": 13476, "epoch": 320} {"train_loss": -5.173810958862305, "global_step": 13477, "epoch": 320} {"train_loss": -5.120481491088867, "global_step": 13478, "epoch": 320} {"train_loss": -5.101930141448975, "global_step": 13479, "epoch": 320} {"train_loss": -5.141598701477051, "global_step": 13480, "epoch": 320} {"train_loss": -5.098767927714756, "global_step": 13481, "epoch": 320, "val_loss": 79180.8203125} {"train_loss": -5.177244186401367, "global_step": 13482, "epoch": 321} {"train_loss": -5.111663818359375, "global_step": 13483, "epoch": 321} {"train_loss": -5.126070022583008, "global_step": 13484, "epoch": 321} {"train_loss": -5.048415660858154, "global_step": 13485, "epoch": 321} {"train_loss": -5.169745445251465, "global_step": 13486, "epoch": 321} {"train_loss": -5.289806842803955, "global_step": 13487, "epoch": 321} {"train_loss": -5.080347537994385, "global_step": 13488, "epoch": 321} {"train_loss": -5.199341773986816, "global_step": 13489, "epoch": 321} {"train_loss": -5.085172653198242, "global_step": 13490, "epoch": 321} {"train_loss": -5.0761518478393555, "global_step": 13491, "epoch": 321} {"train_loss": -5.08950662612915, "global_step": 13492, "epoch": 321} {"train_loss": -5.084331035614014, "global_step": 13493, "epoch": 321} {"train_loss": -5.2648749351501465, "global_step": 13494, "epoch": 321} {"train_loss": -5.198647499084473, "global_step": 13495, "epoch": 321} {"train_loss": -5.217080116271973, "global_step": 13496, "epoch": 321} {"train_loss": -5.238458633422852, "global_step": 13497, "epoch": 321} {"train_loss": -5.152730941772461, "global_step": 13498, "epoch": 321} {"train_loss": -5.148542881011963, "global_step": 13499, "epoch": 321} {"train_loss": -5.128075122833252, "global_step": 13500, "epoch": 321} {"train_loss": -5.037946701049805, "global_step": 13501, "epoch": 321} {"train_loss": -5.083804130554199, "global_step": 13502, "epoch": 321} {"train_loss": -5.191705226898193, "global_step": 13503, "epoch": 321} {"train_loss": -5.043305397033691, "global_step": 13504, "epoch": 321} {"train_loss": -5.134755611419678, "global_step": 13505, "epoch": 321} {"train_loss": -5.1261491775512695, "global_step": 13506, "epoch": 321} {"train_loss": -5.105663299560547, "global_step": 13507, "epoch": 321} {"train_loss": -5.311251640319824, "global_step": 13508, "epoch": 321} {"train_loss": -5.193957805633545, "global_step": 13509, "epoch": 321} {"train_loss": -5.179665565490723, "global_step": 13510, "epoch": 321} {"train_loss": -5.224329471588135, "global_step": 13511, "epoch": 321} {"train_loss": -5.224503517150879, "global_step": 13512, "epoch": 321} {"train_loss": -5.297077178955078, "global_step": 13513, "epoch": 321} {"train_loss": -5.059116840362549, "global_step": 13514, "epoch": 321} {"train_loss": -5.0516767501831055, "global_step": 13515, "epoch": 321} {"train_loss": -5.23443603515625, "global_step": 13516, "epoch": 321} {"train_loss": -5.250289440155029, "global_step": 13517, "epoch": 321} {"train_loss": -5.046679496765137, "global_step": 13518, "epoch": 321} {"train_loss": -5.159238815307617, "global_step": 13519, "epoch": 321} {"train_loss": -5.282369613647461, "global_step": 13520, "epoch": 321} {"train_loss": -5.129004001617432, "global_step": 13521, "epoch": 321} {"train_loss": -5.1033477783203125, "global_step": 13522, "epoch": 321} {"train_loss": -5.156173762821016, "global_step": 13523, "epoch": 321, "val_loss": 78680.6640625} {"train_loss": -5.168530464172363, "global_step": 13524, "epoch": 322} {"train_loss": -5.250292778015137, "global_step": 13525, "epoch": 322} {"train_loss": -5.30029821395874, "global_step": 13526, "epoch": 322} {"train_loss": -5.106746673583984, "global_step": 13527, "epoch": 322} {"train_loss": -5.0607123374938965, "global_step": 13528, "epoch": 322} {"train_loss": -5.015927314758301, "global_step": 13529, "epoch": 322} {"train_loss": -5.125636577606201, "global_step": 13530, "epoch": 322} {"train_loss": -5.212162017822266, "global_step": 13531, "epoch": 322} {"train_loss": -5.030485153198242, "global_step": 13532, "epoch": 322} {"train_loss": -4.984450340270996, "global_step": 13533, "epoch": 322} {"train_loss": -5.026857376098633, "global_step": 13534, "epoch": 322} {"train_loss": -4.9354352951049805, "global_step": 13535, "epoch": 322} {"train_loss": -4.884210586547852, "global_step": 13536, "epoch": 322} {"train_loss": -5.138031005859375, "global_step": 13537, "epoch": 322} {"train_loss": -4.990262031555176, "global_step": 13538, "epoch": 322} {"train_loss": -4.983266830444336, "global_step": 13539, "epoch": 322} {"train_loss": -5.1279473304748535, "global_step": 13540, "epoch": 322} {"train_loss": -4.892874717712402, "global_step": 13541, "epoch": 322} {"train_loss": -5.046166896820068, "global_step": 13542, "epoch": 322} {"train_loss": -4.947116851806641, "global_step": 13543, "epoch": 322} {"train_loss": -5.173830986022949, "global_step": 13544, "epoch": 322} {"train_loss": -4.812930107116699, "global_step": 13545, "epoch": 322} {"train_loss": -5.1091532707214355, "global_step": 13546, "epoch": 322} {"train_loss": -5.00468635559082, "global_step": 13547, "epoch": 322} {"train_loss": -5.104281425476074, "global_step": 13548, "epoch": 322} {"train_loss": -5.031432628631592, "global_step": 13549, "epoch": 322} {"train_loss": -5.003580093383789, "global_step": 13550, "epoch": 322} {"train_loss": -5.076572418212891, "global_step": 13551, "epoch": 322} {"train_loss": -5.046555519104004, "global_step": 13552, "epoch": 322} {"train_loss": -5.150966644287109, "global_step": 13553, "epoch": 322} {"train_loss": -5.097271919250488, "global_step": 13554, "epoch": 322} {"train_loss": -5.056973934173584, "global_step": 13555, "epoch": 322} {"train_loss": -5.105159759521484, "global_step": 13556, "epoch": 322} {"train_loss": -5.011927604675293, "global_step": 13557, "epoch": 322} {"train_loss": -5.047525405883789, "global_step": 13558, "epoch": 322} {"train_loss": -5.013086795806885, "global_step": 13559, "epoch": 322} {"train_loss": -5.144932270050049, "global_step": 13560, "epoch": 322} {"train_loss": -5.107512474060059, "global_step": 13561, "epoch": 322} {"train_loss": -5.08079719543457, "global_step": 13562, "epoch": 322} {"train_loss": -5.133399486541748, "global_step": 13563, "epoch": 322} {"train_loss": -5.048397064208984, "global_step": 13564, "epoch": 322} {"train_loss": -5.06931978180295, "global_step": 13565, "epoch": 322, "val_loss": 79037.234375} {"train_loss": -5.16869592666626, "global_step": 13566, "epoch": 323} {"train_loss": -5.104718208312988, "global_step": 13567, "epoch": 323} {"train_loss": -5.112349510192871, "global_step": 13568, "epoch": 323} {"train_loss": -5.210312843322754, "global_step": 13569, "epoch": 323} {"train_loss": -5.228029251098633, "global_step": 13570, "epoch": 323} {"train_loss": -5.344566345214844, "global_step": 13571, "epoch": 323} {"train_loss": -5.304534912109375, "global_step": 13572, "epoch": 323} {"train_loss": -5.117728233337402, "global_step": 13573, "epoch": 323} {"train_loss": -5.023094177246094, "global_step": 13574, "epoch": 323} {"train_loss": -5.2105536460876465, "global_step": 13575, "epoch": 323} {"train_loss": -5.143328666687012, "global_step": 13576, "epoch": 323} {"train_loss": -5.098761558532715, "global_step": 13577, "epoch": 323} {"train_loss": -5.10897159576416, "global_step": 13578, "epoch": 323} {"train_loss": -5.258798599243164, "global_step": 13579, "epoch": 323} {"train_loss": -5.097951889038086, "global_step": 13580, "epoch": 323} {"train_loss": -5.003021240234375, "global_step": 13581, "epoch": 323} {"train_loss": -5.132884979248047, "global_step": 13582, "epoch": 323} {"train_loss": -5.035455703735352, "global_step": 13583, "epoch": 323} {"train_loss": -4.971837997436523, "global_step": 13584, "epoch": 323} {"train_loss": -5.085680961608887, "global_step": 13585, "epoch": 323} {"train_loss": -5.107844352722168, "global_step": 13586, "epoch": 323} {"train_loss": -5.04915714263916, "global_step": 13587, "epoch": 323} {"train_loss": -5.182667255401611, "global_step": 13588, "epoch": 323} {"train_loss": -5.116554260253906, "global_step": 13589, "epoch": 323} {"train_loss": -5.179616928100586, "global_step": 13590, "epoch": 323} {"train_loss": -5.031619071960449, "global_step": 13591, "epoch": 323} {"train_loss": -5.075606822967529, "global_step": 13592, "epoch": 323} {"train_loss": -5.157773971557617, "global_step": 13593, "epoch": 323} {"train_loss": -5.142797470092773, "global_step": 13594, "epoch": 323} {"train_loss": -5.120309829711914, "global_step": 13595, "epoch": 323} {"train_loss": -5.121204376220703, "global_step": 13596, "epoch": 323} {"train_loss": -5.119977951049805, "global_step": 13597, "epoch": 323} {"train_loss": -5.1891584396362305, "global_step": 13598, "epoch": 323} {"train_loss": -5.12989616394043, "global_step": 13599, "epoch": 323} {"train_loss": -5.14620304107666, "global_step": 13600, "epoch": 323} {"train_loss": -5.009209632873535, "global_step": 13601, "epoch": 323} {"train_loss": -5.131141185760498, "global_step": 13602, "epoch": 323} {"train_loss": -5.052752494812012, "global_step": 13603, "epoch": 323} {"train_loss": -5.090653419494629, "global_step": 13604, "epoch": 323} {"train_loss": -5.131405830383301, "global_step": 13605, "epoch": 323} {"train_loss": -5.026505470275879, "global_step": 13606, "epoch": 323} {"train_loss": -5.128266879490444, "global_step": 13607, "epoch": 323, "val_loss": 78898.1953125} {"train_loss": -5.184584140777588, "global_step": 13608, "epoch": 324} {"train_loss": -5.249085903167725, "global_step": 13609, "epoch": 324} {"train_loss": -5.06010627746582, "global_step": 13610, "epoch": 324} {"train_loss": -5.0772294998168945, "global_step": 13611, "epoch": 324} {"train_loss": -4.9283342361450195, "global_step": 13612, "epoch": 324} {"train_loss": -4.923220634460449, "global_step": 13613, "epoch": 324} {"train_loss": -4.961291313171387, "global_step": 13614, "epoch": 324} {"train_loss": -5.063724517822266, "global_step": 13615, "epoch": 324} {"train_loss": -5.012667179107666, "global_step": 13616, "epoch": 324} {"train_loss": -4.815310478210449, "global_step": 13617, "epoch": 324} {"train_loss": -4.849022388458252, "global_step": 13618, "epoch": 324} {"train_loss": -5.115232467651367, "global_step": 13619, "epoch": 324} {"train_loss": -4.862579345703125, "global_step": 13620, "epoch": 324} {"train_loss": -5.0510711669921875, "global_step": 13621, "epoch": 324} {"train_loss": -5.0950798988342285, "global_step": 13622, "epoch": 324} {"train_loss": -4.911109924316406, "global_step": 13623, "epoch": 324} {"train_loss": -5.077598571777344, "global_step": 13624, "epoch": 324} {"train_loss": -4.96497917175293, "global_step": 13625, "epoch": 324} {"train_loss": -5.046921730041504, "global_step": 13626, "epoch": 324} {"train_loss": -5.08057165145874, "global_step": 13627, "epoch": 324} {"train_loss": -5.176274299621582, "global_step": 13628, "epoch": 324} {"train_loss": -4.930303573608398, "global_step": 13629, "epoch": 324} {"train_loss": -5.031282424926758, "global_step": 13630, "epoch": 324} {"train_loss": -5.071237564086914, "global_step": 13631, "epoch": 324} {"train_loss": -5.078125, "global_step": 13632, "epoch": 324} {"train_loss": -5.017627239227295, "global_step": 13633, "epoch": 324} {"train_loss": -5.153141498565674, "global_step": 13634, "epoch": 324} {"train_loss": -5.055127143859863, "global_step": 13635, "epoch": 324} {"train_loss": -5.053283214569092, "global_step": 13636, "epoch": 324} {"train_loss": -5.05400276184082, "global_step": 13637, "epoch": 324} {"train_loss": -5.254519462585449, "global_step": 13638, "epoch": 324} {"train_loss": -5.041738510131836, "global_step": 13639, "epoch": 324} {"train_loss": -5.215087413787842, "global_step": 13640, "epoch": 324} {"train_loss": -5.090185165405273, "global_step": 13641, "epoch": 324} {"train_loss": -5.258489608764648, "global_step": 13642, "epoch": 324} {"train_loss": -5.095993518829346, "global_step": 13643, "epoch": 324} {"train_loss": -5.156097412109375, "global_step": 13644, "epoch": 324} {"train_loss": -5.110583305358887, "global_step": 13645, "epoch": 324} {"train_loss": -5.216053009033203, "global_step": 13646, "epoch": 324} {"train_loss": -5.038138389587402, "global_step": 13647, "epoch": 324} {"train_loss": -5.015613079071045, "global_step": 13648, "epoch": 324} {"train_loss": -5.059317407153902, "global_step": 13649, "epoch": 324, "val_loss": 78318.984375} {"train_loss": -5.190746307373047, "global_step": 13650, "epoch": 325} {"train_loss": -4.964019775390625, "global_step": 13651, "epoch": 325} {"train_loss": -5.049740314483643, "global_step": 13652, "epoch": 325} {"train_loss": -5.111588478088379, "global_step": 13653, "epoch": 325} {"train_loss": -4.888351917266846, "global_step": 13654, "epoch": 325} {"train_loss": -5.074478626251221, "global_step": 13655, "epoch": 325} {"train_loss": -4.960267066955566, "global_step": 13656, "epoch": 325} {"train_loss": -5.132523536682129, "global_step": 13657, "epoch": 325} {"train_loss": -5.115027904510498, "global_step": 13658, "epoch": 325} {"train_loss": -5.079854965209961, "global_step": 13659, "epoch": 325} {"train_loss": -5.148024559020996, "global_step": 13660, "epoch": 325} {"train_loss": -5.03494119644165, "global_step": 13661, "epoch": 325} {"train_loss": -5.137648582458496, "global_step": 13662, "epoch": 325} {"train_loss": -5.228992462158203, "global_step": 13663, "epoch": 325} {"train_loss": -5.123640060424805, "global_step": 13664, "epoch": 325} {"train_loss": -5.124659061431885, "global_step": 13665, "epoch": 325} {"train_loss": -5.127720832824707, "global_step": 13666, "epoch": 325} {"train_loss": -5.225164890289307, "global_step": 13667, "epoch": 325} {"train_loss": -5.144344806671143, "global_step": 13668, "epoch": 325} {"train_loss": -5.196932792663574, "global_step": 13669, "epoch": 325} {"train_loss": -5.090167045593262, "global_step": 13670, "epoch": 325} {"train_loss": -5.1184797286987305, "global_step": 13671, "epoch": 325} {"train_loss": -5.118007659912109, "global_step": 13672, "epoch": 325} {"train_loss": -5.1375555992126465, "global_step": 13673, "epoch": 325} {"train_loss": -5.054568767547607, "global_step": 13674, "epoch": 325} {"train_loss": -5.2294111251831055, "global_step": 13675, "epoch": 325} {"train_loss": -5.073816299438477, "global_step": 13676, "epoch": 325} {"train_loss": -5.323414325714111, "global_step": 13677, "epoch": 325} {"train_loss": -5.075658321380615, "global_step": 13678, "epoch": 325} {"train_loss": -5.102676868438721, "global_step": 13679, "epoch": 325} {"train_loss": -5.240182399749756, "global_step": 13680, "epoch": 325} {"train_loss": -5.16925573348999, "global_step": 13681, "epoch": 325} {"train_loss": -5.078114032745361, "global_step": 13682, "epoch": 325} {"train_loss": -5.215648174285889, "global_step": 13683, "epoch": 325} {"train_loss": -5.137413024902344, "global_step": 13684, "epoch": 325} {"train_loss": -5.09604549407959, "global_step": 13685, "epoch": 325} {"train_loss": -5.264941215515137, "global_step": 13686, "epoch": 325} {"train_loss": -5.00761604309082, "global_step": 13687, "epoch": 325} {"train_loss": -5.227869987487793, "global_step": 13688, "epoch": 325} {"train_loss": -5.226692199707031, "global_step": 13689, "epoch": 325} {"train_loss": -5.048826217651367, "global_step": 13690, "epoch": 325} {"train_loss": -5.121538355236962, "global_step": 13691, "epoch": 325, "val_loss": 78628.5390625} {"train_loss": -5.216256141662598, "global_step": 13692, "epoch": 326} {"train_loss": -5.074387550354004, "global_step": 13693, "epoch": 326} {"train_loss": -5.129573822021484, "global_step": 13694, "epoch": 326} {"train_loss": -5.1303510665893555, "global_step": 13695, "epoch": 326} {"train_loss": -5.227452278137207, "global_step": 13696, "epoch": 326} {"train_loss": -5.3215532302856445, "global_step": 13697, "epoch": 326} {"train_loss": -5.1883697509765625, "global_step": 13698, "epoch": 326} {"train_loss": -5.27789306640625, "global_step": 13699, "epoch": 326} {"train_loss": -5.159836769104004, "global_step": 13700, "epoch": 326} {"train_loss": -5.196483135223389, "global_step": 13701, "epoch": 326} {"train_loss": -5.2269158363342285, "global_step": 13702, "epoch": 326} {"train_loss": -5.12015962600708, "global_step": 13703, "epoch": 326} {"train_loss": -5.310255527496338, "global_step": 13704, "epoch": 326} {"train_loss": -5.045907497406006, "global_step": 13705, "epoch": 326} {"train_loss": -4.9886040687561035, "global_step": 13706, "epoch": 326} {"train_loss": -5.212937355041504, "global_step": 13707, "epoch": 326} {"train_loss": -5.141656398773193, "global_step": 13708, "epoch": 326} {"train_loss": -5.0851311683654785, "global_step": 13709, "epoch": 326} {"train_loss": -5.364150047302246, "global_step": 13710, "epoch": 326} {"train_loss": -5.163428783416748, "global_step": 13711, "epoch": 326} {"train_loss": -5.113613128662109, "global_step": 13712, "epoch": 326} {"train_loss": -5.189940452575684, "global_step": 13713, "epoch": 326} {"train_loss": -5.183450222015381, "global_step": 13714, "epoch": 326} {"train_loss": -5.1418914794921875, "global_step": 13715, "epoch": 326} {"train_loss": -5.23580265045166, "global_step": 13716, "epoch": 326} {"train_loss": -5.032741546630859, "global_step": 13717, "epoch": 326} {"train_loss": -5.079046249389648, "global_step": 13718, "epoch": 326} {"train_loss": -5.156040191650391, "global_step": 13719, "epoch": 326} {"train_loss": -5.17041540145874, "global_step": 13720, "epoch": 326} {"train_loss": -5.090693473815918, "global_step": 13721, "epoch": 326} {"train_loss": -5.2338547706604, "global_step": 13722, "epoch": 326} {"train_loss": -5.260793685913086, "global_step": 13723, "epoch": 326} {"train_loss": -5.173211097717285, "global_step": 13724, "epoch": 326} {"train_loss": -5.044419288635254, "global_step": 13725, "epoch": 326} {"train_loss": -5.099715232849121, "global_step": 13726, "epoch": 326} {"train_loss": -5.232632637023926, "global_step": 13727, "epoch": 326} {"train_loss": -5.051427841186523, "global_step": 13728, "epoch": 326} {"train_loss": -5.136041164398193, "global_step": 13729, "epoch": 326} {"train_loss": -5.165951728820801, "global_step": 13730, "epoch": 326} {"train_loss": -5.044190406799316, "global_step": 13731, "epoch": 326} {"train_loss": -5.194016456604004, "global_step": 13732, "epoch": 326} {"train_loss": -5.163824660437448, "global_step": 13733, "epoch": 326, "val_loss": 78734.7578125} {"train_loss": -5.108377933502197, "global_step": 13734, "epoch": 327} {"train_loss": -5.067012786865234, "global_step": 13735, "epoch": 327} {"train_loss": -4.9901909828186035, "global_step": 13736, "epoch": 327} {"train_loss": -5.171109676361084, "global_step": 13737, "epoch": 327} {"train_loss": -5.076215744018555, "global_step": 13738, "epoch": 327} {"train_loss": -5.014816761016846, "global_step": 13739, "epoch": 327} {"train_loss": -5.177528381347656, "global_step": 13740, "epoch": 327} {"train_loss": -5.141288757324219, "global_step": 13741, "epoch": 327} {"train_loss": -5.152410507202148, "global_step": 13742, "epoch": 327} {"train_loss": -5.130475997924805, "global_step": 13743, "epoch": 327} {"train_loss": -5.113245010375977, "global_step": 13744, "epoch": 327} {"train_loss": -5.075726509094238, "global_step": 13745, "epoch": 327} {"train_loss": -5.229665756225586, "global_step": 13746, "epoch": 327} {"train_loss": -4.889773368835449, "global_step": 13747, "epoch": 327} {"train_loss": -5.242918968200684, "global_step": 13748, "epoch": 327} {"train_loss": -4.946009635925293, "global_step": 13749, "epoch": 327} {"train_loss": -5.082333564758301, "global_step": 13750, "epoch": 327} {"train_loss": -5.200797080993652, "global_step": 13751, "epoch": 327} {"train_loss": -5.0916948318481445, "global_step": 13752, "epoch": 327} {"train_loss": -5.185544967651367, "global_step": 13753, "epoch": 327} {"train_loss": -5.356781959533691, "global_step": 13754, "epoch": 327} {"train_loss": -5.241175651550293, "global_step": 13755, "epoch": 327} {"train_loss": -5.281664848327637, "global_step": 13756, "epoch": 327} {"train_loss": -5.115400314331055, "global_step": 13757, "epoch": 327} {"train_loss": -5.110123157501221, "global_step": 13758, "epoch": 327} {"train_loss": -5.185152530670166, "global_step": 13759, "epoch": 327} {"train_loss": -5.08900260925293, "global_step": 13760, "epoch": 327} {"train_loss": -5.153165817260742, "global_step": 13761, "epoch": 327} {"train_loss": -5.222907066345215, "global_step": 13762, "epoch": 327} {"train_loss": -5.007809638977051, "global_step": 13763, "epoch": 327} {"train_loss": -5.3126540184021, "global_step": 13764, "epoch": 327} {"train_loss": -5.1847991943359375, "global_step": 13765, "epoch": 327} {"train_loss": -5.198700904846191, "global_step": 13766, "epoch": 327} {"train_loss": -5.018171310424805, "global_step": 13767, "epoch": 327} {"train_loss": -5.146450042724609, "global_step": 13768, "epoch": 327} {"train_loss": -5.308126449584961, "global_step": 13769, "epoch": 327} {"train_loss": -5.179757118225098, "global_step": 13770, "epoch": 327} {"train_loss": -5.237321853637695, "global_step": 13771, "epoch": 327} {"train_loss": -5.068706512451172, "global_step": 13772, "epoch": 327} {"train_loss": -5.0454511642456055, "global_step": 13773, "epoch": 327} {"train_loss": -5.131551742553711, "global_step": 13774, "epoch": 327} {"train_loss": -5.138267744155157, "global_step": 13775, "epoch": 327, "val_loss": 78907.4140625} {"train_loss": -5.222749710083008, "global_step": 13776, "epoch": 328} {"train_loss": -5.204905033111572, "global_step": 13777, "epoch": 328} {"train_loss": -5.156344413757324, "global_step": 13778, "epoch": 328} {"train_loss": -5.158639907836914, "global_step": 13779, "epoch": 328} {"train_loss": -5.254367828369141, "global_step": 13780, "epoch": 328} {"train_loss": -5.078740119934082, "global_step": 13781, "epoch": 328} {"train_loss": -5.143523216247559, "global_step": 13782, "epoch": 328} {"train_loss": -5.204425811767578, "global_step": 13783, "epoch": 328} {"train_loss": -5.232107162475586, "global_step": 13784, "epoch": 328} {"train_loss": -5.209199905395508, "global_step": 13785, "epoch": 328} {"train_loss": -5.266166687011719, "global_step": 13786, "epoch": 328} {"train_loss": -5.237217426300049, "global_step": 13787, "epoch": 328} {"train_loss": -5.202622413635254, "global_step": 13788, "epoch": 328} {"train_loss": -5.147843360900879, "global_step": 13789, "epoch": 328} {"train_loss": -5.270484924316406, "global_step": 13790, "epoch": 328} {"train_loss": -5.113871097564697, "global_step": 13791, "epoch": 328} {"train_loss": -5.102710247039795, "global_step": 13792, "epoch": 328} {"train_loss": -5.084014892578125, "global_step": 13793, "epoch": 328} {"train_loss": -5.173391342163086, "global_step": 13794, "epoch": 328} {"train_loss": -5.1646928787231445, "global_step": 13795, "epoch": 328} {"train_loss": -5.24125337600708, "global_step": 13796, "epoch": 328} {"train_loss": -5.149012565612793, "global_step": 13797, "epoch": 328} {"train_loss": -5.192970275878906, "global_step": 13798, "epoch": 328} {"train_loss": -5.134072303771973, "global_step": 13799, "epoch": 328} {"train_loss": -5.1903076171875, "global_step": 13800, "epoch": 328} {"train_loss": -4.975736141204834, "global_step": 13801, "epoch": 328} {"train_loss": -4.971501350402832, "global_step": 13802, "epoch": 328} {"train_loss": -5.094738006591797, "global_step": 13803, "epoch": 328} {"train_loss": -5.112849235534668, "global_step": 13804, "epoch": 328} {"train_loss": -4.949655532836914, "global_step": 13805, "epoch": 328} {"train_loss": -5.021396636962891, "global_step": 13806, "epoch": 328} {"train_loss": -5.088241100311279, "global_step": 13807, "epoch": 328} {"train_loss": -5.141498565673828, "global_step": 13808, "epoch": 328} {"train_loss": -4.9342875480651855, "global_step": 13809, "epoch": 328} {"train_loss": -5.070501327514648, "global_step": 13810, "epoch": 328} {"train_loss": -5.056621074676514, "global_step": 13811, "epoch": 328} {"train_loss": -4.964077949523926, "global_step": 13812, "epoch": 328} {"train_loss": -5.031216621398926, "global_step": 13813, "epoch": 328} {"train_loss": -4.90155029296875, "global_step": 13814, "epoch": 328} {"train_loss": -5.054264068603516, "global_step": 13815, "epoch": 328} {"train_loss": -5.041468620300293, "global_step": 13816, "epoch": 328} {"train_loss": -5.123650857380459, "global_step": 13817, "epoch": 328, "val_loss": 79910.828125} {"train_loss": -4.931015968322754, "global_step": 13818, "epoch": 329} {"train_loss": -5.0345282554626465, "global_step": 13819, "epoch": 329} {"train_loss": -5.06365442276001, "global_step": 13820, "epoch": 329} {"train_loss": -5.105433464050293, "global_step": 13821, "epoch": 329} {"train_loss": -5.178985595703125, "global_step": 13822, "epoch": 329} {"train_loss": -5.074795722961426, "global_step": 13823, "epoch": 329} {"train_loss": -5.123196125030518, "global_step": 13824, "epoch": 329} {"train_loss": -5.048155307769775, "global_step": 13825, "epoch": 329} {"train_loss": -5.154195785522461, "global_step": 13826, "epoch": 329} {"train_loss": -5.038119316101074, "global_step": 13827, "epoch": 329} {"train_loss": -5.0937933921813965, "global_step": 13828, "epoch": 329} {"train_loss": -5.069221496582031, "global_step": 13829, "epoch": 329} {"train_loss": -5.1311540603637695, "global_step": 13830, "epoch": 329} {"train_loss": -5.068612575531006, "global_step": 13831, "epoch": 329} {"train_loss": -5.2087860107421875, "global_step": 13832, "epoch": 329} {"train_loss": -5.2389726638793945, "global_step": 13833, "epoch": 329} {"train_loss": -5.259465217590332, "global_step": 13834, "epoch": 329} {"train_loss": -5.1388959884643555, "global_step": 13835, "epoch": 329} {"train_loss": -5.090733528137207, "global_step": 13836, "epoch": 329} {"train_loss": -5.117005348205566, "global_step": 13837, "epoch": 329} {"train_loss": -5.205386161804199, "global_step": 13838, "epoch": 329} {"train_loss": -5.165508270263672, "global_step": 13839, "epoch": 329} {"train_loss": -5.148251533508301, "global_step": 13840, "epoch": 329} {"train_loss": -5.099172592163086, "global_step": 13841, "epoch": 329} {"train_loss": -5.150130271911621, "global_step": 13842, "epoch": 329} {"train_loss": -5.013561248779297, "global_step": 13843, "epoch": 329} {"train_loss": -5.0879716873168945, "global_step": 13844, "epoch": 329} {"train_loss": -5.171943664550781, "global_step": 13845, "epoch": 329} {"train_loss": -5.083115577697754, "global_step": 13846, "epoch": 329} {"train_loss": -5.023321151733398, "global_step": 13847, "epoch": 329} {"train_loss": -5.248702526092529, "global_step": 13848, "epoch": 329} {"train_loss": -5.201223850250244, "global_step": 13849, "epoch": 329} {"train_loss": -5.11490535736084, "global_step": 13850, "epoch": 329} {"train_loss": -5.24013614654541, "global_step": 13851, "epoch": 329} {"train_loss": -5.275607109069824, "global_step": 13852, "epoch": 329} {"train_loss": -5.258164405822754, "global_step": 13853, "epoch": 329} {"train_loss": -5.174761772155762, "global_step": 13854, "epoch": 329} {"train_loss": -5.125275611877441, "global_step": 13855, "epoch": 329} {"train_loss": -5.244533538818359, "global_step": 13856, "epoch": 329} {"train_loss": -5.197378158569336, "global_step": 13857, "epoch": 329} {"train_loss": -5.204618453979492, "global_step": 13858, "epoch": 329} {"train_loss": -5.141232921963646, "global_step": 13859, "epoch": 329, "val_loss": 78699.2421875} {"train_loss": -5.048344612121582, "global_step": 13860, "epoch": 330} {"train_loss": -5.118988037109375, "global_step": 13861, "epoch": 330} {"train_loss": -5.1713151931762695, "global_step": 13862, "epoch": 330} {"train_loss": -5.092235565185547, "global_step": 13863, "epoch": 330} {"train_loss": -5.051778793334961, "global_step": 13864, "epoch": 330} {"train_loss": -5.110106468200684, "global_step": 13865, "epoch": 330} {"train_loss": -5.333431243896484, "global_step": 13866, "epoch": 330} {"train_loss": -5.027894020080566, "global_step": 13867, "epoch": 330} {"train_loss": -5.121919631958008, "global_step": 13868, "epoch": 330} {"train_loss": -5.146039009094238, "global_step": 13869, "epoch": 330} {"train_loss": -5.275310039520264, "global_step": 13870, "epoch": 330} {"train_loss": -5.185437202453613, "global_step": 13871, "epoch": 330} {"train_loss": -5.111827850341797, "global_step": 13872, "epoch": 330} {"train_loss": -5.148458003997803, "global_step": 13873, "epoch": 330} {"train_loss": -5.202668190002441, "global_step": 13874, "epoch": 330} {"train_loss": -5.244958877563477, "global_step": 13875, "epoch": 330} {"train_loss": -4.898124694824219, "global_step": 13876, "epoch": 330} {"train_loss": -5.133601665496826, "global_step": 13877, "epoch": 330} {"train_loss": -5.183901786804199, "global_step": 13878, "epoch": 330} {"train_loss": -5.106163024902344, "global_step": 13879, "epoch": 330} {"train_loss": -5.145042419433594, "global_step": 13880, "epoch": 330} {"train_loss": -5.2076849937438965, "global_step": 13881, "epoch": 330} {"train_loss": -5.158079624176025, "global_step": 13882, "epoch": 330} {"train_loss": -5.1909565925598145, "global_step": 13883, "epoch": 330} {"train_loss": -5.082204341888428, "global_step": 13884, "epoch": 330} {"train_loss": -5.334084510803223, "global_step": 13885, "epoch": 330} {"train_loss": -5.183231353759766, "global_step": 13886, "epoch": 330} {"train_loss": -5.054713249206543, "global_step": 13887, "epoch": 330} {"train_loss": -5.260119438171387, "global_step": 13888, "epoch": 330} {"train_loss": -5.120790481567383, "global_step": 13889, "epoch": 330} {"train_loss": -5.107641220092773, "global_step": 13890, "epoch": 330} {"train_loss": -5.184211730957031, "global_step": 13891, "epoch": 330} {"train_loss": -5.276341438293457, "global_step": 13892, "epoch": 330} {"train_loss": -5.151801109313965, "global_step": 13893, "epoch": 330} {"train_loss": -5.143398761749268, "global_step": 13894, "epoch": 330} {"train_loss": -5.106267929077148, "global_step": 13895, "epoch": 330} {"train_loss": -5.237146377563477, "global_step": 13896, "epoch": 330} {"train_loss": -5.164895057678223, "global_step": 13897, "epoch": 330} {"train_loss": -5.164027214050293, "global_step": 13898, "epoch": 330} {"train_loss": -5.384485721588135, "global_step": 13899, "epoch": 330} {"train_loss": -5.226553916931152, "global_step": 13900, "epoch": 330} {"train_loss": -5.16176962852478, "global_step": 13901, "epoch": 330, "val_loss": 78343.734375} {"train_loss": -5.182023048400879, "global_step": 13902, "epoch": 331} {"train_loss": -5.224336624145508, "global_step": 13903, "epoch": 331} {"train_loss": -5.077081680297852, "global_step": 13904, "epoch": 331} {"train_loss": -5.173288345336914, "global_step": 13905, "epoch": 331} {"train_loss": -5.094198226928711, "global_step": 13906, "epoch": 331} {"train_loss": -5.365029335021973, "global_step": 13907, "epoch": 331} {"train_loss": -5.082533359527588, "global_step": 13908, "epoch": 331} {"train_loss": -5.3158769607543945, "global_step": 13909, "epoch": 331} {"train_loss": -5.28678035736084, "global_step": 13910, "epoch": 331} {"train_loss": -5.023655414581299, "global_step": 13911, "epoch": 331} {"train_loss": -5.188905715942383, "global_step": 13912, "epoch": 331} {"train_loss": -5.167173385620117, "global_step": 13913, "epoch": 331} {"train_loss": -5.065649032592773, "global_step": 13914, "epoch": 331} {"train_loss": -5.189400672912598, "global_step": 13915, "epoch": 331} {"train_loss": -5.140570640563965, "global_step": 13916, "epoch": 331} {"train_loss": -5.157997131347656, "global_step": 13917, "epoch": 331} {"train_loss": -5.0568084716796875, "global_step": 13918, "epoch": 331} {"train_loss": -5.175159454345703, "global_step": 13919, "epoch": 331} {"train_loss": -5.305547714233398, "global_step": 13920, "epoch": 331} {"train_loss": -5.251194477081299, "global_step": 13921, "epoch": 331} {"train_loss": -4.948932647705078, "global_step": 13922, "epoch": 331} {"train_loss": -5.28861141204834, "global_step": 13923, "epoch": 331} {"train_loss": -5.126111030578613, "global_step": 13924, "epoch": 331} {"train_loss": -5.146291732788086, "global_step": 13925, "epoch": 331} {"train_loss": -5.096357345581055, "global_step": 13926, "epoch": 331} {"train_loss": -4.9842376708984375, "global_step": 13927, "epoch": 331} {"train_loss": -5.133575916290283, "global_step": 13928, "epoch": 331} {"train_loss": -5.091677665710449, "global_step": 13929, "epoch": 331} {"train_loss": -5.055638313293457, "global_step": 13930, "epoch": 331} {"train_loss": -5.106891632080078, "global_step": 13931, "epoch": 331} {"train_loss": -5.1865973472595215, "global_step": 13932, "epoch": 331} {"train_loss": -5.082067489624023, "global_step": 13933, "epoch": 331} {"train_loss": -5.064370155334473, "global_step": 13934, "epoch": 331} {"train_loss": -4.967172622680664, "global_step": 13935, "epoch": 331} {"train_loss": -4.89567756652832, "global_step": 13936, "epoch": 331} {"train_loss": -5.202332019805908, "global_step": 13937, "epoch": 331} {"train_loss": -4.862873077392578, "global_step": 13938, "epoch": 331} {"train_loss": -5.056781768798828, "global_step": 13939, "epoch": 331} {"train_loss": -4.994332313537598, "global_step": 13940, "epoch": 331} {"train_loss": -4.974305152893066, "global_step": 13941, "epoch": 331} {"train_loss": -5.1239013671875, "global_step": 13942, "epoch": 331} {"train_loss": -5.115187747137887, "global_step": 13943, "epoch": 331, "val_loss": 79069.515625} {"train_loss": -5.095146179199219, "global_step": 13944, "epoch": 332} {"train_loss": -5.199816703796387, "global_step": 13945, "epoch": 332} {"train_loss": -5.030007839202881, "global_step": 13946, "epoch": 332} {"train_loss": -5.208948135375977, "global_step": 13947, "epoch": 332} {"train_loss": -4.9978251457214355, "global_step": 13948, "epoch": 332} {"train_loss": -5.32559061050415, "global_step": 13949, "epoch": 332} {"train_loss": -5.171397686004639, "global_step": 13950, "epoch": 332} {"train_loss": -5.203592300415039, "global_step": 13951, "epoch": 332} {"train_loss": -5.204013824462891, "global_step": 13952, "epoch": 332} {"train_loss": -5.258887767791748, "global_step": 13953, "epoch": 332} {"train_loss": -5.301849365234375, "global_step": 13954, "epoch": 332} {"train_loss": -5.164001941680908, "global_step": 13955, "epoch": 332} {"train_loss": -5.084047317504883, "global_step": 13956, "epoch": 332} {"train_loss": -5.132416725158691, "global_step": 13957, "epoch": 332} {"train_loss": -5.256053924560547, "global_step": 13958, "epoch": 332} {"train_loss": -5.272826194763184, "global_step": 13959, "epoch": 332} {"train_loss": -5.18606424331665, "global_step": 13960, "epoch": 332} {"train_loss": -5.145031929016113, "global_step": 13961, "epoch": 332} {"train_loss": -5.1234130859375, "global_step": 13962, "epoch": 332} {"train_loss": -5.134632110595703, "global_step": 13963, "epoch": 332} {"train_loss": -5.17683219909668, "global_step": 13964, "epoch": 332} {"train_loss": -5.2430291175842285, "global_step": 13965, "epoch": 332} {"train_loss": -5.06071662902832, "global_step": 13966, "epoch": 332} {"train_loss": -5.139924049377441, "global_step": 13967, "epoch": 332} {"train_loss": -5.07071590423584, "global_step": 13968, "epoch": 332} {"train_loss": -5.128137588500977, "global_step": 13969, "epoch": 332} {"train_loss": -5.127834320068359, "global_step": 13970, "epoch": 332} {"train_loss": -5.124427795410156, "global_step": 13971, "epoch": 332} {"train_loss": -4.975516319274902, "global_step": 13972, "epoch": 332} {"train_loss": -5.204344272613525, "global_step": 13973, "epoch": 332} {"train_loss": -5.128150463104248, "global_step": 13974, "epoch": 332} {"train_loss": -5.132758140563965, "global_step": 13975, "epoch": 332} {"train_loss": -5.3318939208984375, "global_step": 13976, "epoch": 332} {"train_loss": -5.224466800689697, "global_step": 13977, "epoch": 332} {"train_loss": -5.334232330322266, "global_step": 13978, "epoch": 332} {"train_loss": -5.146133899688721, "global_step": 13979, "epoch": 332} {"train_loss": -5.1686224937438965, "global_step": 13980, "epoch": 332} {"train_loss": -4.985248565673828, "global_step": 13981, "epoch": 332} {"train_loss": -5.119198322296143, "global_step": 13982, "epoch": 332} {"train_loss": -5.16943359375, "global_step": 13983, "epoch": 332} {"train_loss": -5.139261245727539, "global_step": 13984, "epoch": 332} {"train_loss": -5.161926530656361, "global_step": 13985, "epoch": 332, "val_loss": 78318.7578125} {"train_loss": -5.275109767913818, "global_step": 13986, "epoch": 333} {"train_loss": -5.037839889526367, "global_step": 13987, "epoch": 333} {"train_loss": -5.191708087921143, "global_step": 13988, "epoch": 333} {"train_loss": -5.179224967956543, "global_step": 13989, "epoch": 333} {"train_loss": -5.262157440185547, "global_step": 13990, "epoch": 333} {"train_loss": -5.180482387542725, "global_step": 13991, "epoch": 333} {"train_loss": -5.178393840789795, "global_step": 13992, "epoch": 333} {"train_loss": -5.2794694900512695, "global_step": 13993, "epoch": 333} {"train_loss": -5.200979232788086, "global_step": 13994, "epoch": 333} {"train_loss": -5.220222473144531, "global_step": 13995, "epoch": 333} {"train_loss": -5.19998025894165, "global_step": 13996, "epoch": 333} {"train_loss": -5.101043701171875, "global_step": 13997, "epoch": 333} {"train_loss": -5.070618152618408, "global_step": 13998, "epoch": 333} {"train_loss": -5.031133651733398, "global_step": 13999, "epoch": 333} {"train_loss": -5.1011643409729, "global_step": 14000, "epoch": 333} {"train_loss": -5.131663799285889, "global_step": 14001, "epoch": 333} {"train_loss": -5.047431468963623, "global_step": 14002, "epoch": 333} {"train_loss": -5.3096923828125, "global_step": 14003, "epoch": 333} {"train_loss": -5.151322364807129, "global_step": 14004, "epoch": 333} {"train_loss": -5.075366497039795, "global_step": 14005, "epoch": 333} {"train_loss": -5.081883430480957, "global_step": 14006, "epoch": 333} {"train_loss": -5.1247944831848145, "global_step": 14007, "epoch": 333} {"train_loss": -4.969944477081299, "global_step": 14008, "epoch": 333} {"train_loss": -5.136201858520508, "global_step": 14009, "epoch": 333} {"train_loss": -5.076231002807617, "global_step": 14010, "epoch": 333} {"train_loss": -5.167813777923584, "global_step": 14011, "epoch": 333} {"train_loss": -5.187806129455566, "global_step": 14012, "epoch": 333} {"train_loss": -5.104091644287109, "global_step": 14013, "epoch": 333} {"train_loss": -5.20725154876709, "global_step": 14014, "epoch": 333} {"train_loss": -5.080672740936279, "global_step": 14015, "epoch": 333} {"train_loss": -5.162255764007568, "global_step": 14016, "epoch": 333} {"train_loss": -5.268309116363525, "global_step": 14017, "epoch": 333} {"train_loss": -5.018294334411621, "global_step": 14018, "epoch": 333} {"train_loss": -5.034436225891113, "global_step": 14019, "epoch": 333} {"train_loss": -5.2732954025268555, "global_step": 14020, "epoch": 333} {"train_loss": -5.220819473266602, "global_step": 14021, "epoch": 333} {"train_loss": -5.094505786895752, "global_step": 14022, "epoch": 333} {"train_loss": -5.1564483642578125, "global_step": 14023, "epoch": 333} {"train_loss": -5.071379661560059, "global_step": 14024, "epoch": 333} {"train_loss": -5.192046165466309, "global_step": 14025, "epoch": 333} {"train_loss": -5.166144371032715, "global_step": 14026, "epoch": 333} {"train_loss": -5.148133652550833, "global_step": 14027, "epoch": 333, "val_loss": 78393.609375} {"train_loss": -5.200618743896484, "global_step": 14028, "epoch": 334} {"train_loss": -5.118146896362305, "global_step": 14029, "epoch": 334} {"train_loss": -5.104355335235596, "global_step": 14030, "epoch": 334} {"train_loss": -5.264766693115234, "global_step": 14031, "epoch": 334} {"train_loss": -5.170292377471924, "global_step": 14032, "epoch": 334} {"train_loss": -5.167129993438721, "global_step": 14033, "epoch": 334} {"train_loss": -5.176374435424805, "global_step": 14034, "epoch": 334} {"train_loss": -5.063439846038818, "global_step": 14035, "epoch": 334} {"train_loss": -5.222015380859375, "global_step": 14036, "epoch": 334} {"train_loss": -5.071955680847168, "global_step": 14037, "epoch": 334} {"train_loss": -5.208204746246338, "global_step": 14038, "epoch": 334} {"train_loss": -5.094114303588867, "global_step": 14039, "epoch": 334} {"train_loss": -5.1269917488098145, "global_step": 14040, "epoch": 334} {"train_loss": -5.233856678009033, "global_step": 14041, "epoch": 334} {"train_loss": -5.156586647033691, "global_step": 14042, "epoch": 334} {"train_loss": -5.179657459259033, "global_step": 14043, "epoch": 334} {"train_loss": -5.3220672607421875, "global_step": 14044, "epoch": 334} {"train_loss": -5.091207027435303, "global_step": 14045, "epoch": 334} {"train_loss": -5.14339017868042, "global_step": 14046, "epoch": 334} {"train_loss": -5.362607479095459, "global_step": 14047, "epoch": 334} {"train_loss": -5.156405448913574, "global_step": 14048, "epoch": 334} {"train_loss": -5.182677268981934, "global_step": 14049, "epoch": 334} {"train_loss": -5.1931304931640625, "global_step": 14050, "epoch": 334} {"train_loss": -5.141317367553711, "global_step": 14051, "epoch": 334} {"train_loss": -5.134344100952148, "global_step": 14052, "epoch": 334} {"train_loss": -5.161650657653809, "global_step": 14053, "epoch": 334} {"train_loss": -5.016924858093262, "global_step": 14054, "epoch": 334} {"train_loss": -4.951623916625977, "global_step": 14055, "epoch": 334} {"train_loss": -5.32713508605957, "global_step": 14056, "epoch": 334} {"train_loss": -5.1836652755737305, "global_step": 14057, "epoch": 334} {"train_loss": -5.172425746917725, "global_step": 14058, "epoch": 334} {"train_loss": -5.074776649475098, "global_step": 14059, "epoch": 334} {"train_loss": -5.124680519104004, "global_step": 14060, "epoch": 334} {"train_loss": -5.148874282836914, "global_step": 14061, "epoch": 334} {"train_loss": -4.961361408233643, "global_step": 14062, "epoch": 334} {"train_loss": -5.255230903625488, "global_step": 14063, "epoch": 334} {"train_loss": -5.118542671203613, "global_step": 14064, "epoch": 334} {"train_loss": -5.066987991333008, "global_step": 14065, "epoch": 334} {"train_loss": -5.0023698806762695, "global_step": 14066, "epoch": 334} {"train_loss": -5.116169452667236, "global_step": 14067, "epoch": 334} {"train_loss": -5.132875442504883, "global_step": 14068, "epoch": 334} {"train_loss": -5.1465526421864825, "global_step": 14069, "epoch": 334, "val_loss": 78799.1484375} {"train_loss": -5.075429916381836, "global_step": 14070, "epoch": 335} {"train_loss": -4.998502731323242, "global_step": 14071, "epoch": 335} {"train_loss": -5.189536094665527, "global_step": 14072, "epoch": 335} {"train_loss": -5.239621162414551, "global_step": 14073, "epoch": 335} {"train_loss": -5.008548259735107, "global_step": 14074, "epoch": 335} {"train_loss": -5.2506422996521, "global_step": 14075, "epoch": 335} {"train_loss": -5.044546127319336, "global_step": 14076, "epoch": 335} {"train_loss": -5.201699256896973, "global_step": 14077, "epoch": 335} {"train_loss": -5.180413246154785, "global_step": 14078, "epoch": 335} {"train_loss": -5.164319038391113, "global_step": 14079, "epoch": 335} {"train_loss": -5.106586456298828, "global_step": 14080, "epoch": 335} {"train_loss": -5.316083908081055, "global_step": 14081, "epoch": 335} {"train_loss": -4.998023986816406, "global_step": 14082, "epoch": 335} {"train_loss": -5.10849666595459, "global_step": 14083, "epoch": 335} {"train_loss": -5.056825637817383, "global_step": 14084, "epoch": 335} {"train_loss": -5.018937110900879, "global_step": 14085, "epoch": 335} {"train_loss": -5.110723495483398, "global_step": 14086, "epoch": 335} {"train_loss": -4.992461681365967, "global_step": 14087, "epoch": 335} {"train_loss": -5.147431373596191, "global_step": 14088, "epoch": 335} {"train_loss": -4.994429588317871, "global_step": 14089, "epoch": 335} {"train_loss": -5.082859516143799, "global_step": 14090, "epoch": 335} {"train_loss": -5.15587043762207, "global_step": 14091, "epoch": 335} {"train_loss": -5.200047969818115, "global_step": 14092, "epoch": 335} {"train_loss": -5.140203475952148, "global_step": 14093, "epoch": 335} {"train_loss": -5.2150654792785645, "global_step": 14094, "epoch": 335} {"train_loss": -5.165623664855957, "global_step": 14095, "epoch": 335} {"train_loss": -5.08933162689209, "global_step": 14096, "epoch": 335} {"train_loss": -5.219797134399414, "global_step": 14097, "epoch": 335} {"train_loss": -5.221059799194336, "global_step": 14098, "epoch": 335} {"train_loss": -5.181917667388916, "global_step": 14099, "epoch": 335} {"train_loss": -5.035399436950684, "global_step": 14100, "epoch": 335} {"train_loss": -5.160948753356934, "global_step": 14101, "epoch": 335} {"train_loss": -5.2124505043029785, "global_step": 14102, "epoch": 335} {"train_loss": -5.038760185241699, "global_step": 14103, "epoch": 335} {"train_loss": -5.107039451599121, "global_step": 14104, "epoch": 335} {"train_loss": -5.181776523590088, "global_step": 14105, "epoch": 335} {"train_loss": -5.189371109008789, "global_step": 14106, "epoch": 335} {"train_loss": -5.199643135070801, "global_step": 14107, "epoch": 335} {"train_loss": -4.991630554199219, "global_step": 14108, "epoch": 335} {"train_loss": -5.1538543701171875, "global_step": 14109, "epoch": 335} {"train_loss": -5.218686103820801, "global_step": 14110, "epoch": 335} {"train_loss": -5.1351364226568315, "global_step": 14111, "epoch": 335, "val_loss": 78920.4296875} {"train_loss": -5.114950656890869, "global_step": 14112, "epoch": 336} {"train_loss": -5.169746398925781, "global_step": 14113, "epoch": 336} {"train_loss": -5.076887130737305, "global_step": 14114, "epoch": 336} {"train_loss": -5.217929840087891, "global_step": 14115, "epoch": 336} {"train_loss": -5.216940879821777, "global_step": 14116, "epoch": 336} {"train_loss": -5.092820167541504, "global_step": 14117, "epoch": 336} {"train_loss": -5.172396183013916, "global_step": 14118, "epoch": 336} {"train_loss": -5.107698440551758, "global_step": 14119, "epoch": 336} {"train_loss": -5.369920253753662, "global_step": 14120, "epoch": 336} {"train_loss": -5.289585113525391, "global_step": 14121, "epoch": 336} {"train_loss": -5.139747619628906, "global_step": 14122, "epoch": 336} {"train_loss": -5.342947006225586, "global_step": 14123, "epoch": 336} {"train_loss": -5.1976542472839355, "global_step": 14124, "epoch": 336} {"train_loss": -5.124536514282227, "global_step": 14125, "epoch": 336} {"train_loss": -5.0783891677856445, "global_step": 14126, "epoch": 336} {"train_loss": -5.181369781494141, "global_step": 14127, "epoch": 336} {"train_loss": -5.1927924156188965, "global_step": 14128, "epoch": 336} {"train_loss": -5.040229797363281, "global_step": 14129, "epoch": 336} {"train_loss": -5.050744533538818, "global_step": 14130, "epoch": 336} {"train_loss": -5.159051895141602, "global_step": 14131, "epoch": 336} {"train_loss": -5.1013360023498535, "global_step": 14132, "epoch": 336} {"train_loss": -5.046319007873535, "global_step": 14133, "epoch": 336} {"train_loss": -5.0760884284973145, "global_step": 14134, "epoch": 336} {"train_loss": -5.0796709060668945, "global_step": 14135, "epoch": 336} {"train_loss": -5.280544757843018, "global_step": 14136, "epoch": 336} {"train_loss": -5.104581356048584, "global_step": 14137, "epoch": 336} {"train_loss": -5.1035966873168945, "global_step": 14138, "epoch": 336} {"train_loss": -5.2709550857543945, "global_step": 14139, "epoch": 336} {"train_loss": -5.120748996734619, "global_step": 14140, "epoch": 336} {"train_loss": -5.174574375152588, "global_step": 14141, "epoch": 336} {"train_loss": -5.136127948760986, "global_step": 14142, "epoch": 336} {"train_loss": -5.175546646118164, "global_step": 14143, "epoch": 336} {"train_loss": -5.080254554748535, "global_step": 14144, "epoch": 336} {"train_loss": -5.1673903465271, "global_step": 14145, "epoch": 336} {"train_loss": -5.177885055541992, "global_step": 14146, "epoch": 336} {"train_loss": -5.0509843826293945, "global_step": 14147, "epoch": 336} {"train_loss": -5.1320085525512695, "global_step": 14148, "epoch": 336} {"train_loss": -5.007763385772705, "global_step": 14149, "epoch": 336} {"train_loss": -5.157432556152344, "global_step": 14150, "epoch": 336} {"train_loss": -5.127158164978027, "global_step": 14151, "epoch": 336} {"train_loss": -5.150354385375977, "global_step": 14152, "epoch": 336} {"train_loss": -5.1472949641091486, "global_step": 14153, "epoch": 336, "val_loss": 78177.265625} {"train_loss": -5.2176432609558105, "global_step": 14154, "epoch": 337} {"train_loss": -5.147913932800293, "global_step": 14155, "epoch": 337} {"train_loss": -5.104692459106445, "global_step": 14156, "epoch": 337} {"train_loss": -5.240996837615967, "global_step": 14157, "epoch": 337} {"train_loss": -5.100129127502441, "global_step": 14158, "epoch": 337} {"train_loss": -5.111453056335449, "global_step": 14159, "epoch": 337} {"train_loss": -5.113152503967285, "global_step": 14160, "epoch": 337} {"train_loss": -5.010519027709961, "global_step": 14161, "epoch": 337} {"train_loss": -5.114941596984863, "global_step": 14162, "epoch": 337} {"train_loss": -5.04981803894043, "global_step": 14163, "epoch": 337} {"train_loss": -5.001909255981445, "global_step": 14164, "epoch": 337} {"train_loss": -5.006679534912109, "global_step": 14165, "epoch": 337} {"train_loss": -5.075303077697754, "global_step": 14166, "epoch": 337} {"train_loss": -5.025014400482178, "global_step": 14167, "epoch": 337} {"train_loss": -5.134089946746826, "global_step": 14168, "epoch": 337} {"train_loss": -5.009579658508301, "global_step": 14169, "epoch": 337} {"train_loss": -5.02289342880249, "global_step": 14170, "epoch": 337} {"train_loss": -5.236784934997559, "global_step": 14171, "epoch": 337} {"train_loss": -4.981694221496582, "global_step": 14172, "epoch": 337} {"train_loss": -5.078525066375732, "global_step": 14173, "epoch": 337} {"train_loss": -5.025546073913574, "global_step": 14174, "epoch": 337} {"train_loss": -5.022883892059326, "global_step": 14175, "epoch": 337} {"train_loss": -5.2982683181762695, "global_step": 14176, "epoch": 337} {"train_loss": -5.017999649047852, "global_step": 14177, "epoch": 337} {"train_loss": -5.12363862991333, "global_step": 14178, "epoch": 337} {"train_loss": -4.873713970184326, "global_step": 14179, "epoch": 337} {"train_loss": -5.080752849578857, "global_step": 14180, "epoch": 337} {"train_loss": -4.936952590942383, "global_step": 14181, "epoch": 337} {"train_loss": -5.11906099319458, "global_step": 14182, "epoch": 337} {"train_loss": -5.066901683807373, "global_step": 14183, "epoch": 337} {"train_loss": -5.225728988647461, "global_step": 14184, "epoch": 337} {"train_loss": -5.117428779602051, "global_step": 14185, "epoch": 337} {"train_loss": -5.067500114440918, "global_step": 14186, "epoch": 337} {"train_loss": -5.214849948883057, "global_step": 14187, "epoch": 337} {"train_loss": -5.191834926605225, "global_step": 14188, "epoch": 337} {"train_loss": -5.117196083068848, "global_step": 14189, "epoch": 337} {"train_loss": -5.234478950500488, "global_step": 14190, "epoch": 337} {"train_loss": -5.111337661743164, "global_step": 14191, "epoch": 337} {"train_loss": -4.905641555786133, "global_step": 14192, "epoch": 337} {"train_loss": -5.187355041503906, "global_step": 14193, "epoch": 337} {"train_loss": -5.071841239929199, "global_step": 14194, "epoch": 337} {"train_loss": -5.093143508547828, "global_step": 14195, "epoch": 337, "val_loss": 79132.0625} {"train_loss": -5.108711242675781, "global_step": 14196, "epoch": 338} {"train_loss": -5.052011966705322, "global_step": 14197, "epoch": 338} {"train_loss": -5.0007734298706055, "global_step": 14198, "epoch": 338} {"train_loss": -5.147075653076172, "global_step": 14199, "epoch": 338} {"train_loss": -5.174087047576904, "global_step": 14200, "epoch": 338} {"train_loss": -5.101773262023926, "global_step": 14201, "epoch": 338} {"train_loss": -5.263151168823242, "global_step": 14202, "epoch": 338} {"train_loss": -5.242505073547363, "global_step": 14203, "epoch": 338} {"train_loss": -5.089482307434082, "global_step": 14204, "epoch": 338} {"train_loss": -5.156426429748535, "global_step": 14205, "epoch": 338} {"train_loss": -5.149325847625732, "global_step": 14206, "epoch": 338} {"train_loss": -5.0050225257873535, "global_step": 14207, "epoch": 338} {"train_loss": -5.100052356719971, "global_step": 14208, "epoch": 338} {"train_loss": -5.10626220703125, "global_step": 14209, "epoch": 338} {"train_loss": -5.3264007568359375, "global_step": 14210, "epoch": 338} {"train_loss": -5.198615550994873, "global_step": 14211, "epoch": 338} {"train_loss": -5.312024116516113, "global_step": 14212, "epoch": 338} {"train_loss": -5.283884048461914, "global_step": 14213, "epoch": 338} {"train_loss": -5.041947364807129, "global_step": 14214, "epoch": 338} {"train_loss": -4.928452491760254, "global_step": 14215, "epoch": 338} {"train_loss": -5.169200897216797, "global_step": 14216, "epoch": 338} {"train_loss": -5.106512069702148, "global_step": 14217, "epoch": 338} {"train_loss": -5.020071029663086, "global_step": 14218, "epoch": 338} {"train_loss": -5.102501392364502, "global_step": 14219, "epoch": 338} {"train_loss": -4.942119598388672, "global_step": 14220, "epoch": 338} {"train_loss": -5.089306831359863, "global_step": 14221, "epoch": 338} {"train_loss": -5.060752868652344, "global_step": 14222, "epoch": 338} {"train_loss": -5.045028209686279, "global_step": 14223, "epoch": 338} {"train_loss": -5.3038010597229, "global_step": 14224, "epoch": 338} {"train_loss": -4.992759704589844, "global_step": 14225, "epoch": 338} {"train_loss": -5.1212944984436035, "global_step": 14226, "epoch": 338} {"train_loss": -5.210149765014648, "global_step": 14227, "epoch": 338} {"train_loss": -5.033653259277344, "global_step": 14228, "epoch": 338} {"train_loss": -5.17242431640625, "global_step": 14229, "epoch": 338} {"train_loss": -5.093137741088867, "global_step": 14230, "epoch": 338} {"train_loss": -5.160069465637207, "global_step": 14231, "epoch": 338} {"train_loss": -5.07186222076416, "global_step": 14232, "epoch": 338} {"train_loss": -5.186871528625488, "global_step": 14233, "epoch": 338} {"train_loss": -5.192168235778809, "global_step": 14234, "epoch": 338} {"train_loss": -5.092127323150635, "global_step": 14235, "epoch": 338} {"train_loss": -5.192315101623535, "global_step": 14236, "epoch": 338} {"train_loss": -5.126078037988572, "global_step": 14237, "epoch": 338, "val_loss": 79116.921875} {"train_loss": -5.0373334884643555, "global_step": 14238, "epoch": 339} {"train_loss": -5.237813949584961, "global_step": 14239, "epoch": 339} {"train_loss": -5.15532112121582, "global_step": 14240, "epoch": 339} {"train_loss": -5.093332290649414, "global_step": 14241, "epoch": 339} {"train_loss": -5.070358753204346, "global_step": 14242, "epoch": 339} {"train_loss": -5.16093635559082, "global_step": 14243, "epoch": 339} {"train_loss": -5.277762413024902, "global_step": 14244, "epoch": 339} {"train_loss": -5.1265153884887695, "global_step": 14245, "epoch": 339} {"train_loss": -5.159191131591797, "global_step": 14246, "epoch": 339} {"train_loss": -5.199435234069824, "global_step": 14247, "epoch": 339} {"train_loss": -5.140056133270264, "global_step": 14248, "epoch": 339} {"train_loss": -4.96193790435791, "global_step": 14249, "epoch": 339} {"train_loss": -5.070220947265625, "global_step": 14250, "epoch": 339} {"train_loss": -5.070115089416504, "global_step": 14251, "epoch": 339} {"train_loss": -5.253418445587158, "global_step": 14252, "epoch": 339} {"train_loss": -5.109293460845947, "global_step": 14253, "epoch": 339} {"train_loss": -5.060074806213379, "global_step": 14254, "epoch": 339} {"train_loss": -5.219264030456543, "global_step": 14255, "epoch": 339} {"train_loss": -5.129533767700195, "global_step": 14256, "epoch": 339} {"train_loss": -5.262957572937012, "global_step": 14257, "epoch": 339} {"train_loss": -5.15673828125, "global_step": 14258, "epoch": 339} {"train_loss": -5.101329803466797, "global_step": 14259, "epoch": 339} {"train_loss": -4.9635138511657715, "global_step": 14260, "epoch": 339} {"train_loss": -5.012564659118652, "global_step": 14261, "epoch": 339} {"train_loss": -5.107837200164795, "global_step": 14262, "epoch": 339} {"train_loss": -5.1575703620910645, "global_step": 14263, "epoch": 339} {"train_loss": -5.115652084350586, "global_step": 14264, "epoch": 339} {"train_loss": -5.212507247924805, "global_step": 14265, "epoch": 339} {"train_loss": -5.030485153198242, "global_step": 14266, "epoch": 339} {"train_loss": -5.1149702072143555, "global_step": 14267, "epoch": 339} {"train_loss": -5.116306781768799, "global_step": 14268, "epoch": 339} {"train_loss": -5.068975925445557, "global_step": 14269, "epoch": 339} {"train_loss": -5.21269416809082, "global_step": 14270, "epoch": 339} {"train_loss": -5.150942802429199, "global_step": 14271, "epoch": 339} {"train_loss": -5.18458366394043, "global_step": 14272, "epoch": 339} {"train_loss": -5.155084133148193, "global_step": 14273, "epoch": 339} {"train_loss": -5.091166019439697, "global_step": 14274, "epoch": 339} {"train_loss": -5.117880344390869, "global_step": 14275, "epoch": 339} {"train_loss": -5.208202838897705, "global_step": 14276, "epoch": 339} {"train_loss": -5.164342403411865, "global_step": 14277, "epoch": 339} {"train_loss": -5.036533832550049, "global_step": 14278, "epoch": 339} {"train_loss": -5.131874220711844, "global_step": 14279, "epoch": 339, "val_loss": 79094.734375} {"train_loss": -5.194026947021484, "global_step": 14280, "epoch": 340} {"train_loss": -5.080569267272949, "global_step": 14281, "epoch": 340} {"train_loss": -5.120187759399414, "global_step": 14282, "epoch": 340} {"train_loss": -5.215853691101074, "global_step": 14283, "epoch": 340} {"train_loss": -5.046897888183594, "global_step": 14284, "epoch": 340} {"train_loss": -5.237246513366699, "global_step": 14285, "epoch": 340} {"train_loss": -5.277220726013184, "global_step": 14286, "epoch": 340} {"train_loss": -5.132781505584717, "global_step": 14287, "epoch": 340} {"train_loss": -4.998276710510254, "global_step": 14288, "epoch": 340} {"train_loss": -5.231688499450684, "global_step": 14289, "epoch": 340} {"train_loss": -5.257122039794922, "global_step": 14290, "epoch": 340} {"train_loss": -5.024791240692139, "global_step": 14291, "epoch": 340} {"train_loss": -5.043859958648682, "global_step": 14292, "epoch": 340} {"train_loss": -5.045505523681641, "global_step": 14293, "epoch": 340} {"train_loss": -5.095788955688477, "global_step": 14294, "epoch": 340} {"train_loss": -5.216005802154541, "global_step": 14295, "epoch": 340} {"train_loss": -5.147129535675049, "global_step": 14296, "epoch": 340} {"train_loss": -5.095335483551025, "global_step": 14297, "epoch": 340} {"train_loss": -5.0245747566223145, "global_step": 14298, "epoch": 340} {"train_loss": -5.067592144012451, "global_step": 14299, "epoch": 340} {"train_loss": -5.230367183685303, "global_step": 14300, "epoch": 340} {"train_loss": -5.215699195861816, "global_step": 14301, "epoch": 340} {"train_loss": -5.1751179695129395, "global_step": 14302, "epoch": 340} {"train_loss": -5.185670852661133, "global_step": 14303, "epoch": 340} {"train_loss": -5.00809383392334, "global_step": 14304, "epoch": 340} {"train_loss": -5.083140850067139, "global_step": 14305, "epoch": 340} {"train_loss": -5.302629470825195, "global_step": 14306, "epoch": 340} {"train_loss": -5.18698263168335, "global_step": 14307, "epoch": 340} {"train_loss": -5.319429397583008, "global_step": 14308, "epoch": 340} {"train_loss": -5.126101493835449, "global_step": 14309, "epoch": 340} {"train_loss": -5.063743591308594, "global_step": 14310, "epoch": 340} {"train_loss": -5.134182453155518, "global_step": 14311, "epoch": 340} {"train_loss": -5.179408073425293, "global_step": 14312, "epoch": 340} {"train_loss": -5.148373603820801, "global_step": 14313, "epoch": 340} {"train_loss": -5.1748247146606445, "global_step": 14314, "epoch": 340} {"train_loss": -5.213676452636719, "global_step": 14315, "epoch": 340} {"train_loss": -5.164389610290527, "global_step": 14316, "epoch": 340} {"train_loss": -5.181512832641602, "global_step": 14317, "epoch": 340} {"train_loss": -5.244749069213867, "global_step": 14318, "epoch": 340} {"train_loss": -5.177288055419922, "global_step": 14319, "epoch": 340} {"train_loss": -5.226722717285156, "global_step": 14320, "epoch": 340} {"train_loss": -5.1556613218216665, "global_step": 14321, "epoch": 340, "val_loss": 79833.328125} {"train_loss": -5.282365322113037, "global_step": 14322, "epoch": 341} {"train_loss": -5.055355548858643, "global_step": 14323, "epoch": 341} {"train_loss": -5.159253120422363, "global_step": 14324, "epoch": 341} {"train_loss": -5.144716262817383, "global_step": 14325, "epoch": 341} {"train_loss": -5.18165397644043, "global_step": 14326, "epoch": 341} {"train_loss": -5.293223857879639, "global_step": 14327, "epoch": 341} {"train_loss": -5.202968597412109, "global_step": 14328, "epoch": 341} {"train_loss": -5.09765625, "global_step": 14329, "epoch": 341} {"train_loss": -5.242743015289307, "global_step": 14330, "epoch": 341} {"train_loss": -5.1281633377075195, "global_step": 14331, "epoch": 341} {"train_loss": -5.190546989440918, "global_step": 14332, "epoch": 341} {"train_loss": -5.156627655029297, "global_step": 14333, "epoch": 341} {"train_loss": -5.093975067138672, "global_step": 14334, "epoch": 341} {"train_loss": -5.197078704833984, "global_step": 14335, "epoch": 341} {"train_loss": -5.059786796569824, "global_step": 14336, "epoch": 341} {"train_loss": -4.880778789520264, "global_step": 14337, "epoch": 341} {"train_loss": -5.0670166015625, "global_step": 14338, "epoch": 341} {"train_loss": -5.1785688400268555, "global_step": 14339, "epoch": 341} {"train_loss": -4.853461742401123, "global_step": 14340, "epoch": 341} {"train_loss": -4.944647789001465, "global_step": 14341, "epoch": 341} {"train_loss": -4.977463722229004, "global_step": 14342, "epoch": 341} {"train_loss": -4.846160888671875, "global_step": 14343, "epoch": 341} {"train_loss": -5.103163719177246, "global_step": 14344, "epoch": 341} {"train_loss": -4.899173736572266, "global_step": 14345, "epoch": 341} {"train_loss": -5.057047367095947, "global_step": 14346, "epoch": 341} {"train_loss": -5.010290622711182, "global_step": 14347, "epoch": 341} {"train_loss": -5.139593601226807, "global_step": 14348, "epoch": 341} {"train_loss": -5.044407367706299, "global_step": 14349, "epoch": 341} {"train_loss": -5.073429584503174, "global_step": 14350, "epoch": 341} {"train_loss": -5.142215728759766, "global_step": 14351, "epoch": 341} {"train_loss": -5.187414169311523, "global_step": 14352, "epoch": 341} {"train_loss": -5.200624465942383, "global_step": 14353, "epoch": 341} {"train_loss": -5.119288444519043, "global_step": 14354, "epoch": 341} {"train_loss": -4.990367889404297, "global_step": 14355, "epoch": 341} {"train_loss": -5.085746765136719, "global_step": 14356, "epoch": 341} {"train_loss": -5.048322677612305, "global_step": 14357, "epoch": 341} {"train_loss": -5.086483001708984, "global_step": 14358, "epoch": 341} {"train_loss": -5.221349239349365, "global_step": 14359, "epoch": 341} {"train_loss": -5.080582618713379, "global_step": 14360, "epoch": 341} {"train_loss": -5.058414459228516, "global_step": 14361, "epoch": 341} {"train_loss": -5.16886043548584, "global_step": 14362, "epoch": 341} {"train_loss": -5.099574906485421, "global_step": 14363, "epoch": 341, "val_loss": 78915.625} {"train_loss": -5.077935695648193, "global_step": 14364, "epoch": 342} {"train_loss": -5.1829514503479, "global_step": 14365, "epoch": 342} {"train_loss": -5.23441219329834, "global_step": 14366, "epoch": 342} {"train_loss": -5.085237503051758, "global_step": 14367, "epoch": 342} {"train_loss": -5.32618522644043, "global_step": 14368, "epoch": 342} {"train_loss": -5.17357063293457, "global_step": 14369, "epoch": 342} {"train_loss": -5.152495384216309, "global_step": 14370, "epoch": 342} {"train_loss": -5.255026817321777, "global_step": 14371, "epoch": 342} {"train_loss": -5.2029876708984375, "global_step": 14372, "epoch": 342} {"train_loss": -5.293350696563721, "global_step": 14373, "epoch": 342} {"train_loss": -5.266944408416748, "global_step": 14374, "epoch": 342} {"train_loss": -5.188057899475098, "global_step": 14375, "epoch": 342} {"train_loss": -5.243414402008057, "global_step": 14376, "epoch": 342} {"train_loss": -5.176626682281494, "global_step": 14377, "epoch": 342} {"train_loss": -5.102968692779541, "global_step": 14378, "epoch": 342} {"train_loss": -5.171742916107178, "global_step": 14379, "epoch": 342} {"train_loss": -5.116992473602295, "global_step": 14380, "epoch": 342} {"train_loss": -5.1345744132995605, "global_step": 14381, "epoch": 342} {"train_loss": -5.126251697540283, "global_step": 14382, "epoch": 342} {"train_loss": -5.254323959350586, "global_step": 14383, "epoch": 342} {"train_loss": -5.2184858322143555, "global_step": 14384, "epoch": 342} {"train_loss": -5.068788528442383, "global_step": 14385, "epoch": 342} {"train_loss": -5.065183639526367, "global_step": 14386, "epoch": 342} {"train_loss": -5.310739517211914, "global_step": 14387, "epoch": 342} {"train_loss": -5.322159767150879, "global_step": 14388, "epoch": 342} {"train_loss": -5.2580766677856445, "global_step": 14389, "epoch": 342} {"train_loss": -5.276729583740234, "global_step": 14390, "epoch": 342} {"train_loss": -5.1175642013549805, "global_step": 14391, "epoch": 342} {"train_loss": -5.12232780456543, "global_step": 14392, "epoch": 342} {"train_loss": -5.277015686035156, "global_step": 14393, "epoch": 342} {"train_loss": -5.176599502563477, "global_step": 14394, "epoch": 342} {"train_loss": -4.979422569274902, "global_step": 14395, "epoch": 342} {"train_loss": -4.983600616455078, "global_step": 14396, "epoch": 342} {"train_loss": -5.166508674621582, "global_step": 14397, "epoch": 342} {"train_loss": -5.017886638641357, "global_step": 14398, "epoch": 342} {"train_loss": -5.111513137817383, "global_step": 14399, "epoch": 342} {"train_loss": -5.012107849121094, "global_step": 14400, "epoch": 342} {"train_loss": -5.0948615074157715, "global_step": 14401, "epoch": 342} {"train_loss": -5.180367469787598, "global_step": 14402, "epoch": 342} {"train_loss": -5.115542411804199, "global_step": 14403, "epoch": 342} {"train_loss": -5.170341968536377, "global_step": 14404, "epoch": 342} {"train_loss": -5.164600349607921, "global_step": 14405, "epoch": 342, "val_loss": 79183.9375} {"train_loss": -5.138526916503906, "global_step": 14406, "epoch": 343} {"train_loss": -5.170608997344971, "global_step": 14407, "epoch": 343} {"train_loss": -5.076547622680664, "global_step": 14408, "epoch": 343} {"train_loss": -5.094317436218262, "global_step": 14409, "epoch": 343} {"train_loss": -5.158006191253662, "global_step": 14410, "epoch": 343} {"train_loss": -5.030993461608887, "global_step": 14411, "epoch": 343} {"train_loss": -5.158177852630615, "global_step": 14412, "epoch": 343} {"train_loss": -5.260232448577881, "global_step": 14413, "epoch": 343} {"train_loss": -5.204078674316406, "global_step": 14414, "epoch": 343} {"train_loss": -5.104504585266113, "global_step": 14415, "epoch": 343} {"train_loss": -5.3870134353637695, "global_step": 14416, "epoch": 343} {"train_loss": -5.125190734863281, "global_step": 14417, "epoch": 343} {"train_loss": -5.259821891784668, "global_step": 14418, "epoch": 343} {"train_loss": -5.179798126220703, "global_step": 14419, "epoch": 343} {"train_loss": -5.1640825271606445, "global_step": 14420, "epoch": 343} {"train_loss": -5.13272762298584, "global_step": 14421, "epoch": 343} {"train_loss": -5.259181976318359, "global_step": 14422, "epoch": 343} {"train_loss": -5.312813758850098, "global_step": 14423, "epoch": 343} {"train_loss": -5.198176383972168, "global_step": 14424, "epoch": 343} {"train_loss": -5.229567527770996, "global_step": 14425, "epoch": 343} {"train_loss": -5.1967339515686035, "global_step": 14426, "epoch": 343} {"train_loss": -5.170216083526611, "global_step": 14427, "epoch": 343} {"train_loss": -5.1158270835876465, "global_step": 14428, "epoch": 343} {"train_loss": -5.067299842834473, "global_step": 14429, "epoch": 343} {"train_loss": -5.169129848480225, "global_step": 14430, "epoch": 343} {"train_loss": -5.142684459686279, "global_step": 14431, "epoch": 343} {"train_loss": -5.133551120758057, "global_step": 14432, "epoch": 343} {"train_loss": -5.344104766845703, "global_step": 14433, "epoch": 343} {"train_loss": -5.062313079833984, "global_step": 14434, "epoch": 343} {"train_loss": -5.185415267944336, "global_step": 14435, "epoch": 343} {"train_loss": -5.261777400970459, "global_step": 14436, "epoch": 343} {"train_loss": -5.1682586669921875, "global_step": 14437, "epoch": 343} {"train_loss": -5.223528861999512, "global_step": 14438, "epoch": 343} {"train_loss": -5.156953811645508, "global_step": 14439, "epoch": 343} {"train_loss": -5.191082954406738, "global_step": 14440, "epoch": 343} {"train_loss": -5.3156538009643555, "global_step": 14441, "epoch": 343} {"train_loss": -5.1744842529296875, "global_step": 14442, "epoch": 343} {"train_loss": -5.221434593200684, "global_step": 14443, "epoch": 343} {"train_loss": -5.215199947357178, "global_step": 14444, "epoch": 343} {"train_loss": -5.114653587341309, "global_step": 14445, "epoch": 343} {"train_loss": -5.2137651443481445, "global_step": 14446, "epoch": 343} {"train_loss": -5.180789220900762, "global_step": 14447, "epoch": 343, "val_loss": 80011.5859375} {"train_loss": -5.186999320983887, "global_step": 14448, "epoch": 344} {"train_loss": -5.0457539558410645, "global_step": 14449, "epoch": 344} {"train_loss": -5.265440940856934, "global_step": 14450, "epoch": 344} {"train_loss": -5.2692108154296875, "global_step": 14451, "epoch": 344} {"train_loss": -5.312062740325928, "global_step": 14452, "epoch": 344} {"train_loss": -5.226401329040527, "global_step": 14453, "epoch": 344} {"train_loss": -5.11129093170166, "global_step": 14454, "epoch": 344} {"train_loss": -5.288407325744629, "global_step": 14455, "epoch": 344} {"train_loss": -5.059637069702148, "global_step": 14456, "epoch": 344} {"train_loss": -5.263308525085449, "global_step": 14457, "epoch": 344} {"train_loss": -5.314638137817383, "global_step": 14458, "epoch": 344} {"train_loss": -5.289002895355225, "global_step": 14459, "epoch": 344} {"train_loss": -5.271433353424072, "global_step": 14460, "epoch": 344} {"train_loss": -5.127349853515625, "global_step": 14461, "epoch": 344} {"train_loss": -5.1909499168396, "global_step": 14462, "epoch": 344} {"train_loss": -5.217496871948242, "global_step": 14463, "epoch": 344} {"train_loss": -5.162989616394043, "global_step": 14464, "epoch": 344} {"train_loss": -5.184751510620117, "global_step": 14465, "epoch": 344} {"train_loss": -5.100919723510742, "global_step": 14466, "epoch": 344} {"train_loss": -5.213447570800781, "global_step": 14467, "epoch": 344} {"train_loss": -5.332579612731934, "global_step": 14468, "epoch": 344} {"train_loss": -5.297107696533203, "global_step": 14469, "epoch": 344} {"train_loss": -5.137683868408203, "global_step": 14470, "epoch": 344} {"train_loss": -5.210919380187988, "global_step": 14471, "epoch": 344} {"train_loss": -5.026615142822266, "global_step": 14472, "epoch": 344} {"train_loss": -5.038644790649414, "global_step": 14473, "epoch": 344} {"train_loss": -5.132923126220703, "global_step": 14474, "epoch": 344} {"train_loss": -5.14521598815918, "global_step": 14475, "epoch": 344} {"train_loss": -5.226930141448975, "global_step": 14476, "epoch": 344} {"train_loss": -4.928189277648926, "global_step": 14477, "epoch": 344} {"train_loss": -5.056094646453857, "global_step": 14478, "epoch": 344} {"train_loss": -5.216241836547852, "global_step": 14479, "epoch": 344} {"train_loss": -4.886448860168457, "global_step": 14480, "epoch": 344} {"train_loss": -5.038956165313721, "global_step": 14481, "epoch": 344} {"train_loss": -5.058306694030762, "global_step": 14482, "epoch": 344} {"train_loss": -5.04645299911499, "global_step": 14483, "epoch": 344} {"train_loss": -5.1072001457214355, "global_step": 14484, "epoch": 344} {"train_loss": -5.146738052368164, "global_step": 14485, "epoch": 344} {"train_loss": -5.162511825561523, "global_step": 14486, "epoch": 344} {"train_loss": -5.180739879608154, "global_step": 14487, "epoch": 344} {"train_loss": -5.183361053466797, "global_step": 14488, "epoch": 344} {"train_loss": -5.159488712038312, "global_step": 14489, "epoch": 344, "val_loss": 79475.09375} {"train_loss": -5.168729305267334, "global_step": 14490, "epoch": 345} {"train_loss": -5.030287742614746, "global_step": 14491, "epoch": 345} {"train_loss": -5.085733413696289, "global_step": 14492, "epoch": 345} {"train_loss": -5.110130786895752, "global_step": 14493, "epoch": 345} {"train_loss": -5.244045257568359, "global_step": 14494, "epoch": 345} {"train_loss": -5.240482330322266, "global_step": 14495, "epoch": 345} {"train_loss": -5.1984663009643555, "global_step": 14496, "epoch": 345} {"train_loss": -5.119974136352539, "global_step": 14497, "epoch": 345} {"train_loss": -5.171501636505127, "global_step": 14498, "epoch": 345} {"train_loss": -4.961452484130859, "global_step": 14499, "epoch": 345} {"train_loss": -5.240100860595703, "global_step": 14500, "epoch": 345} {"train_loss": -5.038928031921387, "global_step": 14501, "epoch": 345} {"train_loss": -5.148602485656738, "global_step": 14502, "epoch": 345} {"train_loss": -5.268708229064941, "global_step": 14503, "epoch": 345} {"train_loss": -5.122917175292969, "global_step": 14504, "epoch": 345} {"train_loss": -5.2813897132873535, "global_step": 14505, "epoch": 345} {"train_loss": -5.221622467041016, "global_step": 14506, "epoch": 345} {"train_loss": -5.15587043762207, "global_step": 14507, "epoch": 345} {"train_loss": -5.203165054321289, "global_step": 14508, "epoch": 345} {"train_loss": -5.115235328674316, "global_step": 14509, "epoch": 345} {"train_loss": -5.094191551208496, "global_step": 14510, "epoch": 345} {"train_loss": -5.063738822937012, "global_step": 14511, "epoch": 345} {"train_loss": -5.093121528625488, "global_step": 14512, "epoch": 345} {"train_loss": -5.097017765045166, "global_step": 14513, "epoch": 345} {"train_loss": -5.126517295837402, "global_step": 14514, "epoch": 345} {"train_loss": -5.263322353363037, "global_step": 14515, "epoch": 345} {"train_loss": -5.119652271270752, "global_step": 14516, "epoch": 345} {"train_loss": -5.210363864898682, "global_step": 14517, "epoch": 345} {"train_loss": -4.979072570800781, "global_step": 14518, "epoch": 345} {"train_loss": -5.0870771408081055, "global_step": 14519, "epoch": 345} {"train_loss": -5.27442741394043, "global_step": 14520, "epoch": 345} {"train_loss": -5.042994499206543, "global_step": 14521, "epoch": 345} {"train_loss": -4.8628339767456055, "global_step": 14522, "epoch": 345} {"train_loss": -5.133650302886963, "global_step": 14523, "epoch": 345} {"train_loss": -5.259774208068848, "global_step": 14524, "epoch": 345} {"train_loss": -5.0858964920043945, "global_step": 14525, "epoch": 345} {"train_loss": -5.139287948608398, "global_step": 14526, "epoch": 345} {"train_loss": -5.0537214279174805, "global_step": 14527, "epoch": 345} {"train_loss": -5.181160926818848, "global_step": 14528, "epoch": 345} {"train_loss": -5.185301303863525, "global_step": 14529, "epoch": 345} {"train_loss": -5.290968894958496, "global_step": 14530, "epoch": 345} {"train_loss": -5.141423588707333, "global_step": 14531, "epoch": 345, "val_loss": 78201.640625} {"train_loss": -5.124849796295166, "global_step": 14532, "epoch": 346} {"train_loss": -5.112123966217041, "global_step": 14533, "epoch": 346} {"train_loss": -5.083925247192383, "global_step": 14534, "epoch": 346} {"train_loss": -5.060352325439453, "global_step": 14535, "epoch": 346} {"train_loss": -5.108503341674805, "global_step": 14536, "epoch": 346} {"train_loss": -5.140864372253418, "global_step": 14537, "epoch": 346} {"train_loss": -5.075448036193848, "global_step": 14538, "epoch": 346} {"train_loss": -5.180615425109863, "global_step": 14539, "epoch": 346} {"train_loss": -5.2804179191589355, "global_step": 14540, "epoch": 346} {"train_loss": -5.250553131103516, "global_step": 14541, "epoch": 346} {"train_loss": -5.188055992126465, "global_step": 14542, "epoch": 346} {"train_loss": -5.099637031555176, "global_step": 14543, "epoch": 346} {"train_loss": -5.261517524719238, "global_step": 14544, "epoch": 346} {"train_loss": -5.1482648849487305, "global_step": 14545, "epoch": 346} {"train_loss": -5.281963348388672, "global_step": 14546, "epoch": 346} {"train_loss": -5.1749267578125, "global_step": 14547, "epoch": 346} {"train_loss": -5.1444196701049805, "global_step": 14548, "epoch": 346} {"train_loss": -5.172393321990967, "global_step": 14549, "epoch": 346} {"train_loss": -5.3296003341674805, "global_step": 14550, "epoch": 346} {"train_loss": -5.168351650238037, "global_step": 14551, "epoch": 346} {"train_loss": -5.094414710998535, "global_step": 14552, "epoch": 346} {"train_loss": -5.223247528076172, "global_step": 14553, "epoch": 346} {"train_loss": -5.248049259185791, "global_step": 14554, "epoch": 346} {"train_loss": -5.117643356323242, "global_step": 14555, "epoch": 346} {"train_loss": -5.278580665588379, "global_step": 14556, "epoch": 346} {"train_loss": -5.150631427764893, "global_step": 14557, "epoch": 346} {"train_loss": -5.33206844329834, "global_step": 14558, "epoch": 346} {"train_loss": -5.128536224365234, "global_step": 14559, "epoch": 346} {"train_loss": -5.110844612121582, "global_step": 14560, "epoch": 346} {"train_loss": -5.327673435211182, "global_step": 14561, "epoch": 346} {"train_loss": -5.3101701736450195, "global_step": 14562, "epoch": 346} {"train_loss": -5.092569351196289, "global_step": 14563, "epoch": 346} {"train_loss": -5.132643699645996, "global_step": 14564, "epoch": 346} {"train_loss": -5.217023849487305, "global_step": 14565, "epoch": 346} {"train_loss": -5.108644008636475, "global_step": 14566, "epoch": 346} {"train_loss": -5.126696586608887, "global_step": 14567, "epoch": 346} {"train_loss": -5.160208702087402, "global_step": 14568, "epoch": 346} {"train_loss": -5.193231582641602, "global_step": 14569, "epoch": 346} {"train_loss": -5.057512283325195, "global_step": 14570, "epoch": 346} {"train_loss": -5.101619720458984, "global_step": 14571, "epoch": 346} {"train_loss": -5.142085552215576, "global_step": 14572, "epoch": 346} {"train_loss": -5.1703822158631825, "global_step": 14573, "epoch": 346, "val_loss": 79220.40625} {"train_loss": -5.137159824371338, "global_step": 14574, "epoch": 347} {"train_loss": -5.0064592361450195, "global_step": 14575, "epoch": 347} {"train_loss": -5.212238311767578, "global_step": 14576, "epoch": 347} {"train_loss": -5.268118381500244, "global_step": 14577, "epoch": 347} {"train_loss": -5.2868452072143555, "global_step": 14578, "epoch": 347} {"train_loss": -5.195784568786621, "global_step": 14579, "epoch": 347} {"train_loss": -5.16700553894043, "global_step": 14580, "epoch": 347} {"train_loss": -5.252607822418213, "global_step": 14581, "epoch": 347} {"train_loss": -5.061945915222168, "global_step": 14582, "epoch": 347} {"train_loss": -5.206063270568848, "global_step": 14583, "epoch": 347} {"train_loss": -5.188509941101074, "global_step": 14584, "epoch": 347} {"train_loss": -5.198531150817871, "global_step": 14585, "epoch": 347} {"train_loss": -5.135357856750488, "global_step": 14586, "epoch": 347} {"train_loss": -5.215541839599609, "global_step": 14587, "epoch": 347} {"train_loss": -5.162764549255371, "global_step": 14588, "epoch": 347} {"train_loss": -5.165347099304199, "global_step": 14589, "epoch": 347} {"train_loss": -5.04429292678833, "global_step": 14590, "epoch": 347} {"train_loss": -5.331787109375, "global_step": 14591, "epoch": 347} {"train_loss": -5.146032333374023, "global_step": 14592, "epoch": 347} {"train_loss": -5.18359899520874, "global_step": 14593, "epoch": 347} {"train_loss": -5.252279758453369, "global_step": 14594, "epoch": 347} {"train_loss": -5.203221321105957, "global_step": 14595, "epoch": 347} {"train_loss": -5.147030353546143, "global_step": 14596, "epoch": 347} {"train_loss": -5.209461212158203, "global_step": 14597, "epoch": 347} {"train_loss": -5.166505813598633, "global_step": 14598, "epoch": 347} {"train_loss": -5.150276184082031, "global_step": 14599, "epoch": 347} {"train_loss": -5.071998596191406, "global_step": 14600, "epoch": 347} {"train_loss": -5.243019104003906, "global_step": 14601, "epoch": 347} {"train_loss": -5.098567008972168, "global_step": 14602, "epoch": 347} {"train_loss": -5.142244338989258, "global_step": 14603, "epoch": 347} {"train_loss": -5.113746643066406, "global_step": 14604, "epoch": 347} {"train_loss": -5.249353408813477, "global_step": 14605, "epoch": 347} {"train_loss": -5.337462902069092, "global_step": 14606, "epoch": 347} {"train_loss": -5.042685031890869, "global_step": 14607, "epoch": 347} {"train_loss": -5.109128952026367, "global_step": 14608, "epoch": 347} {"train_loss": -5.106549263000488, "global_step": 14609, "epoch": 347} {"train_loss": -5.1111040115356445, "global_step": 14610, "epoch": 347} {"train_loss": -5.167936325073242, "global_step": 14611, "epoch": 347} {"train_loss": -5.207337856292725, "global_step": 14612, "epoch": 347} {"train_loss": -5.097202301025391, "global_step": 14613, "epoch": 347} {"train_loss": -5.150498867034912, "global_step": 14614, "epoch": 347} {"train_loss": -5.167358160018921, "global_step": 14615, "epoch": 347, "val_loss": 79131.8984375} {"train_loss": -5.135368347167969, "global_step": 14616, "epoch": 348} {"train_loss": -5.223179340362549, "global_step": 14617, "epoch": 348} {"train_loss": -5.318073272705078, "global_step": 14618, "epoch": 348} {"train_loss": -5.163012504577637, "global_step": 14619, "epoch": 348} {"train_loss": -5.175436019897461, "global_step": 14620, "epoch": 348} {"train_loss": -5.3934831619262695, "global_step": 14621, "epoch": 348} {"train_loss": -5.043021202087402, "global_step": 14622, "epoch": 348} {"train_loss": -5.053168773651123, "global_step": 14623, "epoch": 348} {"train_loss": -5.204504013061523, "global_step": 14624, "epoch": 348} {"train_loss": -5.137713432312012, "global_step": 14625, "epoch": 348} {"train_loss": -5.188762187957764, "global_step": 14626, "epoch": 348} {"train_loss": -5.140859603881836, "global_step": 14627, "epoch": 348} {"train_loss": -5.01521110534668, "global_step": 14628, "epoch": 348} {"train_loss": -5.099100112915039, "global_step": 14629, "epoch": 348} {"train_loss": -5.118924617767334, "global_step": 14630, "epoch": 348} {"train_loss": -5.195614337921143, "global_step": 14631, "epoch": 348} {"train_loss": -5.10205078125, "global_step": 14632, "epoch": 348} {"train_loss": -5.285800933837891, "global_step": 14633, "epoch": 348} {"train_loss": -5.247219085693359, "global_step": 14634, "epoch": 348} {"train_loss": -5.225229263305664, "global_step": 14635, "epoch": 348} {"train_loss": -5.150516510009766, "global_step": 14636, "epoch": 348} {"train_loss": -5.098587512969971, "global_step": 14637, "epoch": 348} {"train_loss": -5.133918285369873, "global_step": 14638, "epoch": 348} {"train_loss": -5.164722442626953, "global_step": 14639, "epoch": 348} {"train_loss": -5.167685508728027, "global_step": 14640, "epoch": 348} {"train_loss": -5.083992958068848, "global_step": 14641, "epoch": 348} {"train_loss": -5.113800048828125, "global_step": 14642, "epoch": 348} {"train_loss": -5.343924522399902, "global_step": 14643, "epoch": 348} {"train_loss": -4.925439357757568, "global_step": 14644, "epoch": 348} {"train_loss": -5.204553604125977, "global_step": 14645, "epoch": 348} {"train_loss": -5.212850570678711, "global_step": 14646, "epoch": 348} {"train_loss": -5.134468078613281, "global_step": 14647, "epoch": 348} {"train_loss": -5.122392654418945, "global_step": 14648, "epoch": 348} {"train_loss": -5.129912853240967, "global_step": 14649, "epoch": 348} {"train_loss": -5.312256813049316, "global_step": 14650, "epoch": 348} {"train_loss": -5.280667304992676, "global_step": 14651, "epoch": 348} {"train_loss": -5.166919708251953, "global_step": 14652, "epoch": 348} {"train_loss": -5.269266605377197, "global_step": 14653, "epoch": 348} {"train_loss": -5.100263595581055, "global_step": 14654, "epoch": 348} {"train_loss": -5.005046844482422, "global_step": 14655, "epoch": 348} {"train_loss": -5.179333686828613, "global_step": 14656, "epoch": 348} {"train_loss": -5.165366831279936, "global_step": 14657, "epoch": 348, "val_loss": 78084.0078125} {"train_loss": -5.123356342315674, "global_step": 14658, "epoch": 349} {"train_loss": -5.088218688964844, "global_step": 14659, "epoch": 349} {"train_loss": -5.118019104003906, "global_step": 14660, "epoch": 349} {"train_loss": -5.174299240112305, "global_step": 14661, "epoch": 349} {"train_loss": -5.210012435913086, "global_step": 14662, "epoch": 349} {"train_loss": -5.15080451965332, "global_step": 14663, "epoch": 349} {"train_loss": -5.140546798706055, "global_step": 14664, "epoch": 349} {"train_loss": -5.1604719161987305, "global_step": 14665, "epoch": 349} {"train_loss": -5.143945693969727, "global_step": 14666, "epoch": 349} {"train_loss": -5.202216148376465, "global_step": 14667, "epoch": 349} {"train_loss": -5.222874641418457, "global_step": 14668, "epoch": 349} {"train_loss": -5.073447227478027, "global_step": 14669, "epoch": 349} {"train_loss": -5.118152618408203, "global_step": 14670, "epoch": 349} {"train_loss": -5.2300920486450195, "global_step": 14671, "epoch": 349} {"train_loss": -5.134793281555176, "global_step": 14672, "epoch": 349} {"train_loss": -5.231505870819092, "global_step": 14673, "epoch": 349} {"train_loss": -5.29319953918457, "global_step": 14674, "epoch": 349} {"train_loss": -5.225650310516357, "global_step": 14675, "epoch": 349} {"train_loss": -5.2410888671875, "global_step": 14676, "epoch": 349} {"train_loss": -5.043307781219482, "global_step": 14677, "epoch": 349} {"train_loss": -5.352025985717773, "global_step": 14678, "epoch": 349} {"train_loss": -5.242875099182129, "global_step": 14679, "epoch": 349} {"train_loss": -5.12891149520874, "global_step": 14680, "epoch": 349} {"train_loss": -5.172104835510254, "global_step": 14681, "epoch": 349} {"train_loss": -5.093278884887695, "global_step": 14682, "epoch": 349} {"train_loss": -5.3227410316467285, "global_step": 14683, "epoch": 349} {"train_loss": -5.184117317199707, "global_step": 14684, "epoch": 349} {"train_loss": -5.075279235839844, "global_step": 14685, "epoch": 349} {"train_loss": -5.184422492980957, "global_step": 14686, "epoch": 349} {"train_loss": -5.352215766906738, "global_step": 14687, "epoch": 349} {"train_loss": -5.158587455749512, "global_step": 14688, "epoch": 349} {"train_loss": -5.013887405395508, "global_step": 14689, "epoch": 349} {"train_loss": -5.169114112854004, "global_step": 14690, "epoch": 349} {"train_loss": -4.9783711433410645, "global_step": 14691, "epoch": 349} {"train_loss": -5.310252666473389, "global_step": 14692, "epoch": 349} {"train_loss": -5.100194931030273, "global_step": 14693, "epoch": 349} {"train_loss": -5.120031833648682, "global_step": 14694, "epoch": 349} {"train_loss": -5.159605979919434, "global_step": 14695, "epoch": 349} {"train_loss": -5.3109025955200195, "global_step": 14696, "epoch": 349} {"train_loss": -5.121059894561768, "global_step": 14697, "epoch": 349} {"train_loss": -5.142026901245117, "global_step": 14698, "epoch": 349} {"train_loss": -5.1717449596949985, "global_step": 14699, "epoch": 349, "val_loss": 79010.3359375} {"train_loss": -5.2417449951171875, "global_step": 14700, "epoch": 350} {"train_loss": -5.162283897399902, "global_step": 14701, "epoch": 350} {"train_loss": -5.170958995819092, "global_step": 14702, "epoch": 350} {"train_loss": -5.232152938842773, "global_step": 14703, "epoch": 350} {"train_loss": -5.23818302154541, "global_step": 14704, "epoch": 350} {"train_loss": -5.1873674392700195, "global_step": 14705, "epoch": 350} {"train_loss": -5.279541015625, "global_step": 14706, "epoch": 350} {"train_loss": -5.191915512084961, "global_step": 14707, "epoch": 350} {"train_loss": -5.262042045593262, "global_step": 14708, "epoch": 350} {"train_loss": -5.203987121582031, "global_step": 14709, "epoch": 350} {"train_loss": -5.053554534912109, "global_step": 14710, "epoch": 350} {"train_loss": -5.17540168762207, "global_step": 14711, "epoch": 350} {"train_loss": -5.1650190353393555, "global_step": 14712, "epoch": 350} {"train_loss": -5.110321044921875, "global_step": 14713, "epoch": 350} {"train_loss": -5.180316925048828, "global_step": 14714, "epoch": 350} {"train_loss": -5.0961103439331055, "global_step": 14715, "epoch": 350} {"train_loss": -5.146849632263184, "global_step": 14716, "epoch": 350} {"train_loss": -5.078841209411621, "global_step": 14717, "epoch": 350} {"train_loss": -5.415872097015381, "global_step": 14718, "epoch": 350} {"train_loss": -5.159224987030029, "global_step": 14719, "epoch": 350} {"train_loss": -5.135194778442383, "global_step": 14720, "epoch": 350} {"train_loss": -5.058074951171875, "global_step": 14721, "epoch": 350} {"train_loss": -5.2031354904174805, "global_step": 14722, "epoch": 350} {"train_loss": -5.085697174072266, "global_step": 14723, "epoch": 350} {"train_loss": -5.088598251342773, "global_step": 14724, "epoch": 350} {"train_loss": -5.0323591232299805, "global_step": 14725, "epoch": 350} {"train_loss": -5.083778381347656, "global_step": 14726, "epoch": 350} {"train_loss": -5.235272407531738, "global_step": 14727, "epoch": 350} {"train_loss": -5.064879417419434, "global_step": 14728, "epoch": 350} {"train_loss": -5.146400451660156, "global_step": 14729, "epoch": 350} {"train_loss": -5.0753560066223145, "global_step": 14730, "epoch": 350} {"train_loss": -5.187257766723633, "global_step": 14731, "epoch": 350} {"train_loss": -5.21666145324707, "global_step": 14732, "epoch": 350} {"train_loss": -5.344967365264893, "global_step": 14733, "epoch": 350} {"train_loss": -5.1405181884765625, "global_step": 14734, "epoch": 350} {"train_loss": -4.92848539352417, "global_step": 14735, "epoch": 350} {"train_loss": -5.115296363830566, "global_step": 14736, "epoch": 350} {"train_loss": -5.275057792663574, "global_step": 14737, "epoch": 350} {"train_loss": -4.89424991607666, "global_step": 14738, "epoch": 350} {"train_loss": -5.137546539306641, "global_step": 14739, "epoch": 350} {"train_loss": -5.124863624572754, "global_step": 14740, "epoch": 350} {"train_loss": -5.154064553124564, "global_step": 14741, "epoch": 350, "train/sim_max_reward_0": 0.20155798736878786, "train/sim_max_reward_1": 0.8319332584911003, "train/sim_max_reward_2": 0.16043272427109517, "train/sim_max_reward_3": 0.08542434526555376, "train/sim_max_reward_4": 0.21661654300023397, "train/sim_max_reward_5": 0.41206915963965907, "test/sim_max_reward_4500000": 0.36509209322940506, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.16309185586563354, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.04494433411836119, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.31272473510720394, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.8776848888804532, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.39442991740527683, "test/sim_max_reward_4500019": 0.3995954542462446, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.7396326922789079, "test/sim_max_reward_4500022": 0.6389053725894333, "test/sim_max_reward_4500023": 0.5964394057688768, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.725340833833341, "test/sim_max_reward_4500026": 0.047489279384058794, "test/sim_max_reward_4500027": 0.3227677123748227, "test/sim_max_reward_4500028": 0.34425643148996105, "test/sim_max_reward_4500029": 0.04163460642148004, "test/sim_max_reward_4500030": 0.15619776996694795, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.26503523266299833, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.3653125193771619, "test/sim_max_reward_4500035": 0.0815124915767583, "test/sim_max_reward_4500036": 0.777209811487055, "test/sim_max_reward_4500037": 0.0, "test/sim_max_reward_4500038": 0.3567070223442179, "test/sim_max_reward_4500039": 0.2371276905497067, "test/sim_max_reward_4500040": 0.1519229644941731, "test/sim_max_reward_4500041": 0.0, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.6028398631565942, "test/sim_max_reward_4500045": 0.1175735103924684, "test/sim_max_reward_4500046": 0.1904599965434631, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.09073976362894809, "train/mean_score": 0.31800566967273836, "test/mean_score": 0.18961765843843315, "val_loss": 79008.671875} {"train_loss": -5.210547924041748, "global_step": 14742, "epoch": 351} {"train_loss": -5.131840705871582, "global_step": 14743, "epoch": 351} {"train_loss": -5.184258460998535, "global_step": 14744, "epoch": 351} {"train_loss": -5.026473045349121, "global_step": 14745, "epoch": 351} {"train_loss": -5.214141845703125, "global_step": 14746, "epoch": 351} {"train_loss": -5.257054328918457, "global_step": 14747, "epoch": 351} {"train_loss": -5.031586170196533, "global_step": 14748, "epoch": 351} {"train_loss": -5.065178871154785, "global_step": 14749, "epoch": 351} {"train_loss": -5.246294975280762, "global_step": 14750, "epoch": 351} {"train_loss": -5.116175651550293, "global_step": 14751, "epoch": 351} {"train_loss": -5.2857818603515625, "global_step": 14752, "epoch": 351} {"train_loss": -5.064123630523682, "global_step": 14753, "epoch": 351} {"train_loss": -5.091673374176025, "global_step": 14754, "epoch": 351} {"train_loss": -5.181373596191406, "global_step": 14755, "epoch": 351} {"train_loss": -5.177520275115967, "global_step": 14756, "epoch": 351} {"train_loss": -5.030265808105469, "global_step": 14757, "epoch": 351} {"train_loss": -5.157137870788574, "global_step": 14758, "epoch": 351} {"train_loss": -5.196521282196045, "global_step": 14759, "epoch": 351} {"train_loss": -5.237968444824219, "global_step": 14760, "epoch": 351} {"train_loss": -5.113680839538574, "global_step": 14761, "epoch": 351} {"train_loss": -5.256468772888184, "global_step": 14762, "epoch": 351} {"train_loss": -5.111861228942871, "global_step": 14763, "epoch": 351} {"train_loss": -5.288091659545898, "global_step": 14764, "epoch": 351} {"train_loss": -5.240287780761719, "global_step": 14765, "epoch": 351} {"train_loss": -5.343937873840332, "global_step": 14766, "epoch": 351} {"train_loss": -5.231259346008301, "global_step": 14767, "epoch": 351} {"train_loss": -5.197382926940918, "global_step": 14768, "epoch": 351} {"train_loss": -5.2134575843811035, "global_step": 14769, "epoch": 351} {"train_loss": -5.195680618286133, "global_step": 14770, "epoch": 351} {"train_loss": -5.253653526306152, "global_step": 14771, "epoch": 351} {"train_loss": -5.135037422180176, "global_step": 14772, "epoch": 351} {"train_loss": -5.169004917144775, "global_step": 14773, "epoch": 351} {"train_loss": -5.244996070861816, "global_step": 14774, "epoch": 351} {"train_loss": -5.204607963562012, "global_step": 14775, "epoch": 351} {"train_loss": -5.116403102874756, "global_step": 14776, "epoch": 351} {"train_loss": -5.172597885131836, "global_step": 14777, "epoch": 351} {"train_loss": -5.302116394042969, "global_step": 14778, "epoch": 351} {"train_loss": -4.956159591674805, "global_step": 14779, "epoch": 351} {"train_loss": -5.150815486907959, "global_step": 14780, "epoch": 351} {"train_loss": -5.197461128234863, "global_step": 14781, "epoch": 351} {"train_loss": -5.281087875366211, "global_step": 14782, "epoch": 351} {"train_loss": -5.175067050116403, "global_step": 14783, "epoch": 351, "val_loss": 78632.46875} {"train_loss": -5.032279968261719, "global_step": 14784, "epoch": 352} {"train_loss": -5.2374444007873535, "global_step": 14785, "epoch": 352} {"train_loss": -5.239656448364258, "global_step": 14786, "epoch": 352} {"train_loss": -5.093207359313965, "global_step": 14787, "epoch": 352} {"train_loss": -5.14372444152832, "global_step": 14788, "epoch": 352} {"train_loss": -5.21573543548584, "global_step": 14789, "epoch": 352} {"train_loss": -5.245809555053711, "global_step": 14790, "epoch": 352} {"train_loss": -5.115909099578857, "global_step": 14791, "epoch": 352} {"train_loss": -5.228623390197754, "global_step": 14792, "epoch": 352} {"train_loss": -5.233682632446289, "global_step": 14793, "epoch": 352} {"train_loss": -5.286897659301758, "global_step": 14794, "epoch": 352} {"train_loss": -5.248403549194336, "global_step": 14795, "epoch": 352} {"train_loss": -5.233636856079102, "global_step": 14796, "epoch": 352} {"train_loss": -5.269958019256592, "global_step": 14797, "epoch": 352} {"train_loss": -5.099132537841797, "global_step": 14798, "epoch": 352} {"train_loss": -5.332026481628418, "global_step": 14799, "epoch": 352} {"train_loss": -5.2608642578125, "global_step": 14800, "epoch": 352} {"train_loss": -5.157544136047363, "global_step": 14801, "epoch": 352} {"train_loss": -5.249393463134766, "global_step": 14802, "epoch": 352} {"train_loss": -5.142976760864258, "global_step": 14803, "epoch": 352} {"train_loss": -5.117944717407227, "global_step": 14804, "epoch": 352} {"train_loss": -5.284066200256348, "global_step": 14805, "epoch": 352} {"train_loss": -5.179037570953369, "global_step": 14806, "epoch": 352} {"train_loss": -4.919768333435059, "global_step": 14807, "epoch": 352} {"train_loss": -5.11478328704834, "global_step": 14808, "epoch": 352} {"train_loss": -5.064167499542236, "global_step": 14809, "epoch": 352} {"train_loss": -4.9990763664245605, "global_step": 14810, "epoch": 352} {"train_loss": -5.218514442443848, "global_step": 14811, "epoch": 352} {"train_loss": -5.135732173919678, "global_step": 14812, "epoch": 352} {"train_loss": -5.06721305847168, "global_step": 14813, "epoch": 352} {"train_loss": -5.192103385925293, "global_step": 14814, "epoch": 352} {"train_loss": -5.244373798370361, "global_step": 14815, "epoch": 352} {"train_loss": -5.191055774688721, "global_step": 14816, "epoch": 352} {"train_loss": -5.254120826721191, "global_step": 14817, "epoch": 352} {"train_loss": -5.108087539672852, "global_step": 14818, "epoch": 352} {"train_loss": -5.291539192199707, "global_step": 14819, "epoch": 352} {"train_loss": -5.163900852203369, "global_step": 14820, "epoch": 352} {"train_loss": -5.140904426574707, "global_step": 14821, "epoch": 352} {"train_loss": -5.023131370544434, "global_step": 14822, "epoch": 352} {"train_loss": -5.082233428955078, "global_step": 14823, "epoch": 352} {"train_loss": -5.136189937591553, "global_step": 14824, "epoch": 352} {"train_loss": -5.171001286733718, "global_step": 14825, "epoch": 352, "val_loss": 78613.1484375} {"train_loss": -5.265563488006592, "global_step": 14826, "epoch": 353} {"train_loss": -5.067276954650879, "global_step": 14827, "epoch": 353} {"train_loss": -5.092616081237793, "global_step": 14828, "epoch": 353} {"train_loss": -5.232189178466797, "global_step": 14829, "epoch": 353} {"train_loss": -5.126945495605469, "global_step": 14830, "epoch": 353} {"train_loss": -5.312380790710449, "global_step": 14831, "epoch": 353} {"train_loss": -5.090542316436768, "global_step": 14832, "epoch": 353} {"train_loss": -5.153510093688965, "global_step": 14833, "epoch": 353} {"train_loss": -5.139875411987305, "global_step": 14834, "epoch": 353} {"train_loss": -5.148288726806641, "global_step": 14835, "epoch": 353} {"train_loss": -5.226898670196533, "global_step": 14836, "epoch": 353} {"train_loss": -5.1190714836120605, "global_step": 14837, "epoch": 353} {"train_loss": -5.060123443603516, "global_step": 14838, "epoch": 353} {"train_loss": -5.127481460571289, "global_step": 14839, "epoch": 353} {"train_loss": -5.188241004943848, "global_step": 14840, "epoch": 353} {"train_loss": -5.00581693649292, "global_step": 14841, "epoch": 353} {"train_loss": -5.145810604095459, "global_step": 14842, "epoch": 353} {"train_loss": -5.240418434143066, "global_step": 14843, "epoch": 353} {"train_loss": -5.150291442871094, "global_step": 14844, "epoch": 353} {"train_loss": -5.233401298522949, "global_step": 14845, "epoch": 353} {"train_loss": -5.188711643218994, "global_step": 14846, "epoch": 353} {"train_loss": -5.159231185913086, "global_step": 14847, "epoch": 353} {"train_loss": -5.208446979522705, "global_step": 14848, "epoch": 353} {"train_loss": -5.281323432922363, "global_step": 14849, "epoch": 353} {"train_loss": -5.204361438751221, "global_step": 14850, "epoch": 353} {"train_loss": -5.113231658935547, "global_step": 14851, "epoch": 353} {"train_loss": -5.122271537780762, "global_step": 14852, "epoch": 353} {"train_loss": -5.142775058746338, "global_step": 14853, "epoch": 353} {"train_loss": -5.126554489135742, "global_step": 14854, "epoch": 353} {"train_loss": -5.272463798522949, "global_step": 14855, "epoch": 353} {"train_loss": -5.24657678604126, "global_step": 14856, "epoch": 353} {"train_loss": -5.2068047523498535, "global_step": 14857, "epoch": 353} {"train_loss": -5.172120094299316, "global_step": 14858, "epoch": 353} {"train_loss": -5.1689982414245605, "global_step": 14859, "epoch": 353} {"train_loss": -5.235607147216797, "global_step": 14860, "epoch": 353} {"train_loss": -5.048523426055908, "global_step": 14861, "epoch": 353} {"train_loss": -5.303208827972412, "global_step": 14862, "epoch": 353} {"train_loss": -5.241715431213379, "global_step": 14863, "epoch": 353} {"train_loss": -5.183943271636963, "global_step": 14864, "epoch": 353} {"train_loss": -5.202658653259277, "global_step": 14865, "epoch": 353} {"train_loss": -5.172943115234375, "global_step": 14866, "epoch": 353} {"train_loss": -5.174636693227859, "global_step": 14867, "epoch": 353, "val_loss": 79109.8515625} {"train_loss": -5.110170364379883, "global_step": 14868, "epoch": 354} {"train_loss": -5.272768020629883, "global_step": 14869, "epoch": 354} {"train_loss": -5.255420684814453, "global_step": 14870, "epoch": 354} {"train_loss": -5.312692642211914, "global_step": 14871, "epoch": 354} {"train_loss": -5.313412666320801, "global_step": 14872, "epoch": 354} {"train_loss": -5.098005294799805, "global_step": 14873, "epoch": 354} {"train_loss": -5.101188659667969, "global_step": 14874, "epoch": 354} {"train_loss": -5.273858070373535, "global_step": 14875, "epoch": 354} {"train_loss": -5.031702518463135, "global_step": 14876, "epoch": 354} {"train_loss": -5.146845817565918, "global_step": 14877, "epoch": 354} {"train_loss": -5.013683795928955, "global_step": 14878, "epoch": 354} {"train_loss": -5.247582912445068, "global_step": 14879, "epoch": 354} {"train_loss": -5.318702697753906, "global_step": 14880, "epoch": 354} {"train_loss": -4.8556060791015625, "global_step": 14881, "epoch": 354} {"train_loss": -4.788017749786377, "global_step": 14882, "epoch": 354} {"train_loss": -5.185502052307129, "global_step": 14883, "epoch": 354} {"train_loss": -4.941313743591309, "global_step": 14884, "epoch": 354} {"train_loss": -4.891826629638672, "global_step": 14885, "epoch": 354} {"train_loss": -5.221879959106445, "global_step": 14886, "epoch": 354} {"train_loss": -4.917037487030029, "global_step": 14887, "epoch": 354} {"train_loss": -5.162018775939941, "global_step": 14888, "epoch": 354} {"train_loss": -5.115161895751953, "global_step": 14889, "epoch": 354} {"train_loss": -5.072210311889648, "global_step": 14890, "epoch": 354} {"train_loss": -5.075794219970703, "global_step": 14891, "epoch": 354} {"train_loss": -5.099361896514893, "global_step": 14892, "epoch": 354} {"train_loss": -5.041913986206055, "global_step": 14893, "epoch": 354} {"train_loss": -5.14309024810791, "global_step": 14894, "epoch": 354} {"train_loss": -5.1819353103637695, "global_step": 14895, "epoch": 354} {"train_loss": -5.120625019073486, "global_step": 14896, "epoch": 354} {"train_loss": -5.053461074829102, "global_step": 14897, "epoch": 354} {"train_loss": -5.074577331542969, "global_step": 14898, "epoch": 354} {"train_loss": -5.166759490966797, "global_step": 14899, "epoch": 354} {"train_loss": -5.129458427429199, "global_step": 14900, "epoch": 354} {"train_loss": -5.290308475494385, "global_step": 14901, "epoch": 354} {"train_loss": -5.095559120178223, "global_step": 14902, "epoch": 354} {"train_loss": -5.179536819458008, "global_step": 14903, "epoch": 354} {"train_loss": -5.055139064788818, "global_step": 14904, "epoch": 354} {"train_loss": -5.081853866577148, "global_step": 14905, "epoch": 354} {"train_loss": -5.086705207824707, "global_step": 14906, "epoch": 354} {"train_loss": -5.24708366394043, "global_step": 14907, "epoch": 354} {"train_loss": -5.1703386306762695, "global_step": 14908, "epoch": 354} {"train_loss": -5.123318672180176, "global_step": 14909, "epoch": 354, "val_loss": 78465.40625} {"train_loss": -5.258602142333984, "global_step": 14910, "epoch": 355} {"train_loss": -5.06243896484375, "global_step": 14911, "epoch": 355} {"train_loss": -5.1799702644348145, "global_step": 14912, "epoch": 355} {"train_loss": -5.208896160125732, "global_step": 14913, "epoch": 355} {"train_loss": -5.225654602050781, "global_step": 14914, "epoch": 355} {"train_loss": -5.328924655914307, "global_step": 14915, "epoch": 355} {"train_loss": -5.102324485778809, "global_step": 14916, "epoch": 355} {"train_loss": -5.225466728210449, "global_step": 14917, "epoch": 355} {"train_loss": -5.324679851531982, "global_step": 14918, "epoch": 355} {"train_loss": -5.278082847595215, "global_step": 14919, "epoch": 355} {"train_loss": -5.218028545379639, "global_step": 14920, "epoch": 355} {"train_loss": -5.142365455627441, "global_step": 14921, "epoch": 355} {"train_loss": -5.23007869720459, "global_step": 14922, "epoch": 355} {"train_loss": -5.1961669921875, "global_step": 14923, "epoch": 355} {"train_loss": -5.148921012878418, "global_step": 14924, "epoch": 355} {"train_loss": -5.119535446166992, "global_step": 14925, "epoch": 355} {"train_loss": -5.17020320892334, "global_step": 14926, "epoch": 355} {"train_loss": -5.221498489379883, "global_step": 14927, "epoch": 355} {"train_loss": -4.980511665344238, "global_step": 14928, "epoch": 355} {"train_loss": -5.245075225830078, "global_step": 14929, "epoch": 355} {"train_loss": -5.263116836547852, "global_step": 14930, "epoch": 355} {"train_loss": -5.2901201248168945, "global_step": 14931, "epoch": 355} {"train_loss": -5.289135932922363, "global_step": 14932, "epoch": 355} {"train_loss": -5.164446830749512, "global_step": 14933, "epoch": 355} {"train_loss": -5.086996078491211, "global_step": 14934, "epoch": 355} {"train_loss": -5.2999348640441895, "global_step": 14935, "epoch": 355} {"train_loss": -5.252981185913086, "global_step": 14936, "epoch": 355} {"train_loss": -5.150906562805176, "global_step": 14937, "epoch": 355} {"train_loss": -5.291485786437988, "global_step": 14938, "epoch": 355} {"train_loss": -5.175289630889893, "global_step": 14939, "epoch": 355} {"train_loss": -5.170866966247559, "global_step": 14940, "epoch": 355} {"train_loss": -5.125698089599609, "global_step": 14941, "epoch": 355} {"train_loss": -5.052194118499756, "global_step": 14942, "epoch": 355} {"train_loss": -5.0595855712890625, "global_step": 14943, "epoch": 355} {"train_loss": -5.2251152992248535, "global_step": 14944, "epoch": 355} {"train_loss": -5.374422073364258, "global_step": 14945, "epoch": 355} {"train_loss": -5.202678680419922, "global_step": 14946, "epoch": 355} {"train_loss": -5.123846054077148, "global_step": 14947, "epoch": 355} {"train_loss": -5.141613006591797, "global_step": 14948, "epoch": 355} {"train_loss": -5.155989646911621, "global_step": 14949, "epoch": 355} {"train_loss": -5.147280693054199, "global_step": 14950, "epoch": 355} {"train_loss": -5.192950770968483, "global_step": 14951, "epoch": 355, "val_loss": 77739.28125} {"train_loss": -5.338268280029297, "global_step": 14952, "epoch": 356} {"train_loss": -5.087875843048096, "global_step": 14953, "epoch": 356} {"train_loss": -5.061740875244141, "global_step": 14954, "epoch": 356} {"train_loss": -5.1713056564331055, "global_step": 14955, "epoch": 356} {"train_loss": -5.1162495613098145, "global_step": 14956, "epoch": 356} {"train_loss": -5.257919788360596, "global_step": 14957, "epoch": 356} {"train_loss": -5.1542887687683105, "global_step": 14958, "epoch": 356} {"train_loss": -5.192370414733887, "global_step": 14959, "epoch": 356} {"train_loss": -5.2422661781311035, "global_step": 14960, "epoch": 356} {"train_loss": -5.207972526550293, "global_step": 14961, "epoch": 356} {"train_loss": -5.127685070037842, "global_step": 14962, "epoch": 356} {"train_loss": -5.127804279327393, "global_step": 14963, "epoch": 356} {"train_loss": -5.101414680480957, "global_step": 14964, "epoch": 356} {"train_loss": -5.191672325134277, "global_step": 14965, "epoch": 356} {"train_loss": -5.198925018310547, "global_step": 14966, "epoch": 356} {"train_loss": -5.236633777618408, "global_step": 14967, "epoch": 356} {"train_loss": -5.201479911804199, "global_step": 14968, "epoch": 356} {"train_loss": -5.203469276428223, "global_step": 14969, "epoch": 356} {"train_loss": -5.150562763214111, "global_step": 14970, "epoch": 356} {"train_loss": -5.100249290466309, "global_step": 14971, "epoch": 356} {"train_loss": -5.214146614074707, "global_step": 14972, "epoch": 356} {"train_loss": -5.139158725738525, "global_step": 14973, "epoch": 356} {"train_loss": -5.096650123596191, "global_step": 14974, "epoch": 356} {"train_loss": -5.262531280517578, "global_step": 14975, "epoch": 356} {"train_loss": -5.155123710632324, "global_step": 14976, "epoch": 356} {"train_loss": -5.222569465637207, "global_step": 14977, "epoch": 356} {"train_loss": -5.181486129760742, "global_step": 14978, "epoch": 356} {"train_loss": -5.274757385253906, "global_step": 14979, "epoch": 356} {"train_loss": -5.214242935180664, "global_step": 14980, "epoch": 356} {"train_loss": -5.222166061401367, "global_step": 14981, "epoch": 356} {"train_loss": -5.226016998291016, "global_step": 14982, "epoch": 356} {"train_loss": -5.270995616912842, "global_step": 14983, "epoch": 356} {"train_loss": -5.297544002532959, "global_step": 14984, "epoch": 356} {"train_loss": -5.087930679321289, "global_step": 14985, "epoch": 356} {"train_loss": -5.180218696594238, "global_step": 14986, "epoch": 356} {"train_loss": -5.179108619689941, "global_step": 14987, "epoch": 356} {"train_loss": -5.134115219116211, "global_step": 14988, "epoch": 356} {"train_loss": -5.158164024353027, "global_step": 14989, "epoch": 356} {"train_loss": -5.079399108886719, "global_step": 14990, "epoch": 356} {"train_loss": -5.311370372772217, "global_step": 14991, "epoch": 356} {"train_loss": -5.177124977111816, "global_step": 14992, "epoch": 356} {"train_loss": -5.1857201144808815, "global_step": 14993, "epoch": 356, "val_loss": 78395.4296875} {"train_loss": -5.227232456207275, "global_step": 14994, "epoch": 357} {"train_loss": -5.157367706298828, "global_step": 14995, "epoch": 357} {"train_loss": -5.187500476837158, "global_step": 14996, "epoch": 357} {"train_loss": -5.083127975463867, "global_step": 14997, "epoch": 357} {"train_loss": -5.315000534057617, "global_step": 14998, "epoch": 357} {"train_loss": -5.1017351150512695, "global_step": 14999, "epoch": 357} {"train_loss": -5.313836574554443, "global_step": 15000, "epoch": 357} {"train_loss": -5.263751983642578, "global_step": 15001, "epoch": 357} {"train_loss": -5.147012710571289, "global_step": 15002, "epoch": 357} {"train_loss": -5.132930755615234, "global_step": 15003, "epoch": 357} {"train_loss": -5.150733947753906, "global_step": 15004, "epoch": 357} {"train_loss": -5.245918273925781, "global_step": 15005, "epoch": 357} {"train_loss": -5.16184139251709, "global_step": 15006, "epoch": 357} {"train_loss": -5.194805145263672, "global_step": 15007, "epoch": 357} {"train_loss": -5.187467575073242, "global_step": 15008, "epoch": 357} {"train_loss": -5.242338180541992, "global_step": 15009, "epoch": 357} {"train_loss": -5.281826019287109, "global_step": 15010, "epoch": 357} {"train_loss": -5.205806732177734, "global_step": 15011, "epoch": 357} {"train_loss": -5.282331466674805, "global_step": 15012, "epoch": 357} {"train_loss": -5.1531524658203125, "global_step": 15013, "epoch": 357} {"train_loss": -5.202360153198242, "global_step": 15014, "epoch": 357} {"train_loss": -5.1471052169799805, "global_step": 15015, "epoch": 357} {"train_loss": -5.154542922973633, "global_step": 15016, "epoch": 357} {"train_loss": -5.245593070983887, "global_step": 15017, "epoch": 357} {"train_loss": -5.161908149719238, "global_step": 15018, "epoch": 357} {"train_loss": -5.132660388946533, "global_step": 15019, "epoch": 357} {"train_loss": -5.123744010925293, "global_step": 15020, "epoch": 357} {"train_loss": -5.209588050842285, "global_step": 15021, "epoch": 357} {"train_loss": -5.172277450561523, "global_step": 15022, "epoch": 357} {"train_loss": -5.179492950439453, "global_step": 15023, "epoch": 357} {"train_loss": -5.108599662780762, "global_step": 15024, "epoch": 357} {"train_loss": -5.2516374588012695, "global_step": 15025, "epoch": 357} {"train_loss": -5.249951362609863, "global_step": 15026, "epoch": 357} {"train_loss": -5.278189659118652, "global_step": 15027, "epoch": 357} {"train_loss": -5.236847400665283, "global_step": 15028, "epoch": 357} {"train_loss": -5.294389247894287, "global_step": 15029, "epoch": 357} {"train_loss": -5.147005081176758, "global_step": 15030, "epoch": 357} {"train_loss": -5.136102676391602, "global_step": 15031, "epoch": 357} {"train_loss": -5.292208671569824, "global_step": 15032, "epoch": 357} {"train_loss": -5.3291015625, "global_step": 15033, "epoch": 357} {"train_loss": -5.222280025482178, "global_step": 15034, "epoch": 357} {"train_loss": -5.2017689773014615, "global_step": 15035, "epoch": 357, "val_loss": 78327.1953125} {"train_loss": -5.123605728149414, "global_step": 15036, "epoch": 358} {"train_loss": -5.182973861694336, "global_step": 15037, "epoch": 358} {"train_loss": -5.034985542297363, "global_step": 15038, "epoch": 358} {"train_loss": -5.118758678436279, "global_step": 15039, "epoch": 358} {"train_loss": -5.207376480102539, "global_step": 15040, "epoch": 358} {"train_loss": -5.160973072052002, "global_step": 15041, "epoch": 358} {"train_loss": -5.002098083496094, "global_step": 15042, "epoch": 358} {"train_loss": -5.409717559814453, "global_step": 15043, "epoch": 358} {"train_loss": -5.194550514221191, "global_step": 15044, "epoch": 358} {"train_loss": -5.241805076599121, "global_step": 15045, "epoch": 358} {"train_loss": -5.147104263305664, "global_step": 15046, "epoch": 358} {"train_loss": -5.154732704162598, "global_step": 15047, "epoch": 358} {"train_loss": -5.284037113189697, "global_step": 15048, "epoch": 358} {"train_loss": -5.142751693725586, "global_step": 15049, "epoch": 358} {"train_loss": -5.058797836303711, "global_step": 15050, "epoch": 358} {"train_loss": -5.180968284606934, "global_step": 15051, "epoch": 358} {"train_loss": -5.21820068359375, "global_step": 15052, "epoch": 358} {"train_loss": -5.139213562011719, "global_step": 15053, "epoch": 358} {"train_loss": -5.0977630615234375, "global_step": 15054, "epoch": 358} {"train_loss": -5.052837371826172, "global_step": 15055, "epoch": 358} {"train_loss": -5.080896854400635, "global_step": 15056, "epoch": 358} {"train_loss": -5.10008430480957, "global_step": 15057, "epoch": 358} {"train_loss": -5.170677185058594, "global_step": 15058, "epoch": 358} {"train_loss": -5.125253200531006, "global_step": 15059, "epoch": 358} {"train_loss": -5.073966026306152, "global_step": 15060, "epoch": 358} {"train_loss": -5.16054630279541, "global_step": 15061, "epoch": 358} {"train_loss": -5.105007648468018, "global_step": 15062, "epoch": 358} {"train_loss": -5.051569938659668, "global_step": 15063, "epoch": 358} {"train_loss": -5.1322174072265625, "global_step": 15064, "epoch": 358} {"train_loss": -5.145417213439941, "global_step": 15065, "epoch": 358} {"train_loss": -5.238775253295898, "global_step": 15066, "epoch": 358} {"train_loss": -5.3425445556640625, "global_step": 15067, "epoch": 358} {"train_loss": -5.187302589416504, "global_step": 15068, "epoch": 358} {"train_loss": -5.202644348144531, "global_step": 15069, "epoch": 358} {"train_loss": -5.192200183868408, "global_step": 15070, "epoch": 358} {"train_loss": -5.226250171661377, "global_step": 15071, "epoch": 358} {"train_loss": -5.233563423156738, "global_step": 15072, "epoch": 358} {"train_loss": -5.180877208709717, "global_step": 15073, "epoch": 358} {"train_loss": -5.149621486663818, "global_step": 15074, "epoch": 358} {"train_loss": -5.119386672973633, "global_step": 15075, "epoch": 358} {"train_loss": -5.120721340179443, "global_step": 15076, "epoch": 358} {"train_loss": -5.160342171078637, "global_step": 15077, "epoch": 358, "val_loss": 79248.859375} {"train_loss": -5.190305709838867, "global_step": 15078, "epoch": 359} {"train_loss": -5.144942283630371, "global_step": 15079, "epoch": 359} {"train_loss": -5.270451068878174, "global_step": 15080, "epoch": 359} {"train_loss": -5.08302116394043, "global_step": 15081, "epoch": 359} {"train_loss": -5.333438873291016, "global_step": 15082, "epoch": 359} {"train_loss": -5.168071746826172, "global_step": 15083, "epoch": 359} {"train_loss": -5.1181440353393555, "global_step": 15084, "epoch": 359} {"train_loss": -5.166545867919922, "global_step": 15085, "epoch": 359} {"train_loss": -5.2111101150512695, "global_step": 15086, "epoch": 359} {"train_loss": -5.188558578491211, "global_step": 15087, "epoch": 359} {"train_loss": -5.200247287750244, "global_step": 15088, "epoch": 359} {"train_loss": -5.157966613769531, "global_step": 15089, "epoch": 359} {"train_loss": -4.878990173339844, "global_step": 15090, "epoch": 359} {"train_loss": -5.1907830238342285, "global_step": 15091, "epoch": 359} {"train_loss": -5.192722797393799, "global_step": 15092, "epoch": 359} {"train_loss": -5.1770524978637695, "global_step": 15093, "epoch": 359} {"train_loss": -5.298073768615723, "global_step": 15094, "epoch": 359} {"train_loss": -5.225314140319824, "global_step": 15095, "epoch": 359} {"train_loss": -5.219829082489014, "global_step": 15096, "epoch": 359} {"train_loss": -5.251404762268066, "global_step": 15097, "epoch": 359} {"train_loss": -5.0506591796875, "global_step": 15098, "epoch": 359} {"train_loss": -5.203707218170166, "global_step": 15099, "epoch": 359} {"train_loss": -5.104636192321777, "global_step": 15100, "epoch": 359} {"train_loss": -5.144154071807861, "global_step": 15101, "epoch": 359} {"train_loss": -5.186835289001465, "global_step": 15102, "epoch": 359} {"train_loss": -5.078373908996582, "global_step": 15103, "epoch": 359} {"train_loss": -5.335143089294434, "global_step": 15104, "epoch": 359} {"train_loss": -5.26498556137085, "global_step": 15105, "epoch": 359} {"train_loss": -5.316471576690674, "global_step": 15106, "epoch": 359} {"train_loss": -5.128993511199951, "global_step": 15107, "epoch": 359} {"train_loss": -5.314872741699219, "global_step": 15108, "epoch": 359} {"train_loss": -5.17146110534668, "global_step": 15109, "epoch": 359} {"train_loss": -5.13299560546875, "global_step": 15110, "epoch": 359} {"train_loss": -5.170163154602051, "global_step": 15111, "epoch": 359} {"train_loss": -5.252568244934082, "global_step": 15112, "epoch": 359} {"train_loss": -5.198141574859619, "global_step": 15113, "epoch": 359} {"train_loss": -5.224168300628662, "global_step": 15114, "epoch": 359} {"train_loss": -5.267207145690918, "global_step": 15115, "epoch": 359} {"train_loss": -5.160874366760254, "global_step": 15116, "epoch": 359} {"train_loss": -5.019460678100586, "global_step": 15117, "epoch": 359} {"train_loss": -5.188126564025879, "global_step": 15118, "epoch": 359} {"train_loss": -5.179656426111857, "global_step": 15119, "epoch": 359, "val_loss": 78978.609375} {"train_loss": -5.10537052154541, "global_step": 15120, "epoch": 360} {"train_loss": -5.037877559661865, "global_step": 15121, "epoch": 360} {"train_loss": -4.977416038513184, "global_step": 15122, "epoch": 360} {"train_loss": -5.139621734619141, "global_step": 15123, "epoch": 360} {"train_loss": -5.049744606018066, "global_step": 15124, "epoch": 360} {"train_loss": -5.099667549133301, "global_step": 15125, "epoch": 360} {"train_loss": -5.1198625564575195, "global_step": 15126, "epoch": 360} {"train_loss": -5.183416366577148, "global_step": 15127, "epoch": 360} {"train_loss": -5.065834045410156, "global_step": 15128, "epoch": 360} {"train_loss": -5.047538757324219, "global_step": 15129, "epoch": 360} {"train_loss": -5.195092678070068, "global_step": 15130, "epoch": 360} {"train_loss": -4.988447189331055, "global_step": 15131, "epoch": 360} {"train_loss": -4.99648904800415, "global_step": 15132, "epoch": 360} {"train_loss": -4.958694934844971, "global_step": 15133, "epoch": 360} {"train_loss": -5.204899787902832, "global_step": 15134, "epoch": 360} {"train_loss": -5.252262115478516, "global_step": 15135, "epoch": 360} {"train_loss": -4.9752092361450195, "global_step": 15136, "epoch": 360} {"train_loss": -5.113526344299316, "global_step": 15137, "epoch": 360} {"train_loss": -5.034651279449463, "global_step": 15138, "epoch": 360} {"train_loss": -5.083982944488525, "global_step": 15139, "epoch": 360} {"train_loss": -4.969330310821533, "global_step": 15140, "epoch": 360} {"train_loss": -5.139828205108643, "global_step": 15141, "epoch": 360} {"train_loss": -5.070349216461182, "global_step": 15142, "epoch": 360} {"train_loss": -5.212603569030762, "global_step": 15143, "epoch": 360} {"train_loss": -5.009714126586914, "global_step": 15144, "epoch": 360} {"train_loss": -5.16322135925293, "global_step": 15145, "epoch": 360} {"train_loss": -5.145979881286621, "global_step": 15146, "epoch": 360} {"train_loss": -5.133449077606201, "global_step": 15147, "epoch": 360} {"train_loss": -5.149445056915283, "global_step": 15148, "epoch": 360} {"train_loss": -5.195712566375732, "global_step": 15149, "epoch": 360} {"train_loss": -5.151479721069336, "global_step": 15150, "epoch": 360} {"train_loss": -5.183472633361816, "global_step": 15151, "epoch": 360} {"train_loss": -5.20650577545166, "global_step": 15152, "epoch": 360} {"train_loss": -5.363664627075195, "global_step": 15153, "epoch": 360} {"train_loss": -5.23773193359375, "global_step": 15154, "epoch": 360} {"train_loss": -5.1736836433410645, "global_step": 15155, "epoch": 360} {"train_loss": -5.257627964019775, "global_step": 15156, "epoch": 360} {"train_loss": -5.15018367767334, "global_step": 15157, "epoch": 360} {"train_loss": -5.16294002532959, "global_step": 15158, "epoch": 360} {"train_loss": -5.249076843261719, "global_step": 15159, "epoch": 360} {"train_loss": -5.165592670440674, "global_step": 15160, "epoch": 360} {"train_loss": -5.1261484282357355, "global_step": 15161, "epoch": 360, "val_loss": 78376.4453125} {"train_loss": -5.109541416168213, "global_step": 15162, "epoch": 361} {"train_loss": -5.319003105163574, "global_step": 15163, "epoch": 361} {"train_loss": -5.3316330909729, "global_step": 15164, "epoch": 361} {"train_loss": -5.2098283767700195, "global_step": 15165, "epoch": 361} {"train_loss": -5.111720085144043, "global_step": 15166, "epoch": 361} {"train_loss": -5.299749374389648, "global_step": 15167, "epoch": 361} {"train_loss": -5.308523178100586, "global_step": 15168, "epoch": 361} {"train_loss": -5.274447441101074, "global_step": 15169, "epoch": 361} {"train_loss": -5.193685531616211, "global_step": 15170, "epoch": 361} {"train_loss": -5.1981401443481445, "global_step": 15171, "epoch": 361} {"train_loss": -5.22490119934082, "global_step": 15172, "epoch": 361} {"train_loss": -5.204658508300781, "global_step": 15173, "epoch": 361} {"train_loss": -5.250421047210693, "global_step": 15174, "epoch": 361} {"train_loss": -5.202882766723633, "global_step": 15175, "epoch": 361} {"train_loss": -5.174067974090576, "global_step": 15176, "epoch": 361} {"train_loss": -5.100759506225586, "global_step": 15177, "epoch": 361} {"train_loss": -5.188793659210205, "global_step": 15178, "epoch": 361} {"train_loss": -5.091459274291992, "global_step": 15179, "epoch": 361} {"train_loss": -5.180609226226807, "global_step": 15180, "epoch": 361} {"train_loss": -5.202050685882568, "global_step": 15181, "epoch": 361} {"train_loss": -5.191603660583496, "global_step": 15182, "epoch": 361} {"train_loss": -5.196341037750244, "global_step": 15183, "epoch": 361} {"train_loss": -5.150522232055664, "global_step": 15184, "epoch": 361} {"train_loss": -5.100307941436768, "global_step": 15185, "epoch": 361} {"train_loss": -5.286153793334961, "global_step": 15186, "epoch": 361} {"train_loss": -5.266392707824707, "global_step": 15187, "epoch": 361} {"train_loss": -5.230303764343262, "global_step": 15188, "epoch": 361} {"train_loss": -5.144801139831543, "global_step": 15189, "epoch": 361} {"train_loss": -5.090933322906494, "global_step": 15190, "epoch": 361} {"train_loss": -5.063989639282227, "global_step": 15191, "epoch": 361} {"train_loss": -5.135078430175781, "global_step": 15192, "epoch": 361} {"train_loss": -5.144593238830566, "global_step": 15193, "epoch": 361} {"train_loss": -5.036048889160156, "global_step": 15194, "epoch": 361} {"train_loss": -5.269941329956055, "global_step": 15195, "epoch": 361} {"train_loss": -5.205799102783203, "global_step": 15196, "epoch": 361} {"train_loss": -5.253378868103027, "global_step": 15197, "epoch": 361} {"train_loss": -5.104208946228027, "global_step": 15198, "epoch": 361} {"train_loss": -5.166323661804199, "global_step": 15199, "epoch": 361} {"train_loss": -5.260282039642334, "global_step": 15200, "epoch": 361} {"train_loss": -5.217213153839111, "global_step": 15201, "epoch": 361} {"train_loss": -5.284727096557617, "global_step": 15202, "epoch": 361} {"train_loss": -5.1939155374254495, "global_step": 15203, "epoch": 361, "val_loss": 78409.140625} {"train_loss": -5.189394950866699, "global_step": 15204, "epoch": 362} {"train_loss": -5.256004333496094, "global_step": 15205, "epoch": 362} {"train_loss": -5.335200786590576, "global_step": 15206, "epoch": 362} {"train_loss": -5.274874687194824, "global_step": 15207, "epoch": 362} {"train_loss": -5.0345563888549805, "global_step": 15208, "epoch": 362} {"train_loss": -5.2163848876953125, "global_step": 15209, "epoch": 362} {"train_loss": -5.144360542297363, "global_step": 15210, "epoch": 362} {"train_loss": -5.029156684875488, "global_step": 15211, "epoch": 362} {"train_loss": -5.119988441467285, "global_step": 15212, "epoch": 362} {"train_loss": -5.25223445892334, "global_step": 15213, "epoch": 362} {"train_loss": -5.153621673583984, "global_step": 15214, "epoch": 362} {"train_loss": -5.17649507522583, "global_step": 15215, "epoch": 362} {"train_loss": -5.163261413574219, "global_step": 15216, "epoch": 362} {"train_loss": -5.105602264404297, "global_step": 15217, "epoch": 362} {"train_loss": -5.216318130493164, "global_step": 15218, "epoch": 362} {"train_loss": -5.144674777984619, "global_step": 15219, "epoch": 362} {"train_loss": -5.04314661026001, "global_step": 15220, "epoch": 362} {"train_loss": -5.1697773933410645, "global_step": 15221, "epoch": 362} {"train_loss": -5.0482401847839355, "global_step": 15222, "epoch": 362} {"train_loss": -5.203706741333008, "global_step": 15223, "epoch": 362} {"train_loss": -5.254353046417236, "global_step": 15224, "epoch": 362} {"train_loss": -5.220394134521484, "global_step": 15225, "epoch": 362} {"train_loss": -4.969815254211426, "global_step": 15226, "epoch": 362} {"train_loss": -5.21571683883667, "global_step": 15227, "epoch": 362} {"train_loss": -5.087782382965088, "global_step": 15228, "epoch": 362} {"train_loss": -5.030150413513184, "global_step": 15229, "epoch": 362} {"train_loss": -5.239193916320801, "global_step": 15230, "epoch": 362} {"train_loss": -4.894839286804199, "global_step": 15231, "epoch": 362} {"train_loss": -5.201262474060059, "global_step": 15232, "epoch": 362} {"train_loss": -5.187902450561523, "global_step": 15233, "epoch": 362} {"train_loss": -5.169007301330566, "global_step": 15234, "epoch": 362} {"train_loss": -5.126971244812012, "global_step": 15235, "epoch": 362} {"train_loss": -5.265897750854492, "global_step": 15236, "epoch": 362} {"train_loss": -5.203770637512207, "global_step": 15237, "epoch": 362} {"train_loss": -5.109040260314941, "global_step": 15238, "epoch": 362} {"train_loss": -5.146278381347656, "global_step": 15239, "epoch": 362} {"train_loss": -5.103166103363037, "global_step": 15240, "epoch": 362} {"train_loss": -5.113626003265381, "global_step": 15241, "epoch": 362} {"train_loss": -5.270998001098633, "global_step": 15242, "epoch": 362} {"train_loss": -5.214726448059082, "global_step": 15243, "epoch": 362} {"train_loss": -5.088089942932129, "global_step": 15244, "epoch": 362} {"train_loss": -5.156088840393793, "global_step": 15245, "epoch": 362, "val_loss": 78402.28125} {"train_loss": -5.002228260040283, "global_step": 15246, "epoch": 363} {"train_loss": -5.126091957092285, "global_step": 15247, "epoch": 363} {"train_loss": -5.31608772277832, "global_step": 15248, "epoch": 363} {"train_loss": -5.065295219421387, "global_step": 15249, "epoch": 363} {"train_loss": -4.981113433837891, "global_step": 15250, "epoch": 363} {"train_loss": -5.046494960784912, "global_step": 15251, "epoch": 363} {"train_loss": -5.1257781982421875, "global_step": 15252, "epoch": 363} {"train_loss": -5.040392875671387, "global_step": 15253, "epoch": 363} {"train_loss": -5.147514820098877, "global_step": 15254, "epoch": 363} {"train_loss": -5.1629743576049805, "global_step": 15255, "epoch": 363} {"train_loss": -5.317925453186035, "global_step": 15256, "epoch": 363} {"train_loss": -5.140280246734619, "global_step": 15257, "epoch": 363} {"train_loss": -5.197567939758301, "global_step": 15258, "epoch": 363} {"train_loss": -5.139584064483643, "global_step": 15259, "epoch": 363} {"train_loss": -5.104589462280273, "global_step": 15260, "epoch": 363} {"train_loss": -5.265049934387207, "global_step": 15261, "epoch": 363} {"train_loss": -5.145308017730713, "global_step": 15262, "epoch": 363} {"train_loss": -5.122211456298828, "global_step": 15263, "epoch": 363} {"train_loss": -5.27336311340332, "global_step": 15264, "epoch": 363} {"train_loss": -5.266275882720947, "global_step": 15265, "epoch": 363} {"train_loss": -5.143950462341309, "global_step": 15266, "epoch": 363} {"train_loss": -5.081783294677734, "global_step": 15267, "epoch": 363} {"train_loss": -5.280501365661621, "global_step": 15268, "epoch": 363} {"train_loss": -5.244319438934326, "global_step": 15269, "epoch": 363} {"train_loss": -5.33872127532959, "global_step": 15270, "epoch": 363} {"train_loss": -5.156092643737793, "global_step": 15271, "epoch": 363} {"train_loss": -5.108834266662598, "global_step": 15272, "epoch": 363} {"train_loss": -5.15822696685791, "global_step": 15273, "epoch": 363} {"train_loss": -5.257510185241699, "global_step": 15274, "epoch": 363} {"train_loss": -5.304403305053711, "global_step": 15275, "epoch": 363} {"train_loss": -5.054086208343506, "global_step": 15276, "epoch": 363} {"train_loss": -5.334842681884766, "global_step": 15277, "epoch": 363} {"train_loss": -5.277013778686523, "global_step": 15278, "epoch": 363} {"train_loss": -5.117297172546387, "global_step": 15279, "epoch": 363} {"train_loss": -5.037525653839111, "global_step": 15280, "epoch": 363} {"train_loss": -5.201050281524658, "global_step": 15281, "epoch": 363} {"train_loss": -5.207699775695801, "global_step": 15282, "epoch": 363} {"train_loss": -5.075408935546875, "global_step": 15283, "epoch": 363} {"train_loss": -5.180821895599365, "global_step": 15284, "epoch": 363} {"train_loss": -5.242673873901367, "global_step": 15285, "epoch": 363} {"train_loss": -5.170698165893555, "global_step": 15286, "epoch": 363} {"train_loss": -5.165745587576003, "global_step": 15287, "epoch": 363, "val_loss": 77799.140625} {"train_loss": -5.218563079833984, "global_step": 15288, "epoch": 364} {"train_loss": -5.170821189880371, "global_step": 15289, "epoch": 364} {"train_loss": -5.208901882171631, "global_step": 15290, "epoch": 364} {"train_loss": -5.201770782470703, "global_step": 15291, "epoch": 364} {"train_loss": -5.198733329772949, "global_step": 15292, "epoch": 364} {"train_loss": -5.226424217224121, "global_step": 15293, "epoch": 364} {"train_loss": -5.286257266998291, "global_step": 15294, "epoch": 364} {"train_loss": -5.14804744720459, "global_step": 15295, "epoch": 364} {"train_loss": -5.193559169769287, "global_step": 15296, "epoch": 364} {"train_loss": -5.312371253967285, "global_step": 15297, "epoch": 364} {"train_loss": -5.20670223236084, "global_step": 15298, "epoch": 364} {"train_loss": -5.198268890380859, "global_step": 15299, "epoch": 364} {"train_loss": -5.273507118225098, "global_step": 15300, "epoch": 364} {"train_loss": -5.371794700622559, "global_step": 15301, "epoch": 364} {"train_loss": -5.11306095123291, "global_step": 15302, "epoch": 364} {"train_loss": -5.220340728759766, "global_step": 15303, "epoch": 364} {"train_loss": -5.3765668869018555, "global_step": 15304, "epoch": 364} {"train_loss": -5.2753682136535645, "global_step": 15305, "epoch": 364} {"train_loss": -5.210482597351074, "global_step": 15306, "epoch": 364} {"train_loss": -5.242136001586914, "global_step": 15307, "epoch": 364} {"train_loss": -5.116872787475586, "global_step": 15308, "epoch": 364} {"train_loss": -5.127932071685791, "global_step": 15309, "epoch": 364} {"train_loss": -5.091183185577393, "global_step": 15310, "epoch": 364} {"train_loss": -5.218461990356445, "global_step": 15311, "epoch": 364} {"train_loss": -5.312459945678711, "global_step": 15312, "epoch": 364} {"train_loss": -5.068855285644531, "global_step": 15313, "epoch": 364} {"train_loss": -5.175288200378418, "global_step": 15314, "epoch": 364} {"train_loss": -5.118043422698975, "global_step": 15315, "epoch": 364} {"train_loss": -5.261935234069824, "global_step": 15316, "epoch": 364} {"train_loss": -5.149056911468506, "global_step": 15317, "epoch": 364} {"train_loss": -5.022741794586182, "global_step": 15318, "epoch": 364} {"train_loss": -5.075369358062744, "global_step": 15319, "epoch": 364} {"train_loss": -5.000397682189941, "global_step": 15320, "epoch": 364} {"train_loss": -4.8926897048950195, "global_step": 15321, "epoch": 364} {"train_loss": -4.996279716491699, "global_step": 15322, "epoch": 364} {"train_loss": -5.019841194152832, "global_step": 15323, "epoch": 364} {"train_loss": -4.935103416442871, "global_step": 15324, "epoch": 364} {"train_loss": -4.951507568359375, "global_step": 15325, "epoch": 364} {"train_loss": -4.987949371337891, "global_step": 15326, "epoch": 364} {"train_loss": -5.00670862197876, "global_step": 15327, "epoch": 364} {"train_loss": -4.872389793395996, "global_step": 15328, "epoch": 364} {"train_loss": -5.145477567400251, "global_step": 15329, "epoch": 364, "val_loss": 78856.484375} {"train_loss": -5.008459091186523, "global_step": 15330, "epoch": 365} {"train_loss": -5.002155303955078, "global_step": 15331, "epoch": 365} {"train_loss": -5.04680871963501, "global_step": 15332, "epoch": 365} {"train_loss": -5.184962749481201, "global_step": 15333, "epoch": 365} {"train_loss": -5.145905017852783, "global_step": 15334, "epoch": 365} {"train_loss": -5.079412460327148, "global_step": 15335, "epoch": 365} {"train_loss": -5.08506441116333, "global_step": 15336, "epoch": 365} {"train_loss": -4.979436874389648, "global_step": 15337, "epoch": 365} {"train_loss": -5.085323810577393, "global_step": 15338, "epoch": 365} {"train_loss": -5.284379959106445, "global_step": 15339, "epoch": 365} {"train_loss": -5.204227924346924, "global_step": 15340, "epoch": 365} {"train_loss": -5.153191566467285, "global_step": 15341, "epoch": 365} {"train_loss": -5.244693279266357, "global_step": 15342, "epoch": 365} {"train_loss": -5.106426239013672, "global_step": 15343, "epoch": 365} {"train_loss": -5.27749490737915, "global_step": 15344, "epoch": 365} {"train_loss": -5.109165668487549, "global_step": 15345, "epoch": 365} {"train_loss": -5.267256736755371, "global_step": 15346, "epoch": 365} {"train_loss": -5.4026641845703125, "global_step": 15347, "epoch": 365} {"train_loss": -5.085390090942383, "global_step": 15348, "epoch": 365} {"train_loss": -5.223132610321045, "global_step": 15349, "epoch": 365} {"train_loss": -5.142626762390137, "global_step": 15350, "epoch": 365} {"train_loss": -5.150913238525391, "global_step": 15351, "epoch": 365} {"train_loss": -5.077075958251953, "global_step": 15352, "epoch": 365} {"train_loss": -5.045591354370117, "global_step": 15353, "epoch": 365} {"train_loss": -5.27708101272583, "global_step": 15354, "epoch": 365} {"train_loss": -5.219387531280518, "global_step": 15355, "epoch": 365} {"train_loss": -5.115684986114502, "global_step": 15356, "epoch": 365} {"train_loss": -5.199003219604492, "global_step": 15357, "epoch": 365} {"train_loss": -5.033640384674072, "global_step": 15358, "epoch": 365} {"train_loss": -5.108333587646484, "global_step": 15359, "epoch": 365} {"train_loss": -5.244716644287109, "global_step": 15360, "epoch": 365} {"train_loss": -5.087030410766602, "global_step": 15361, "epoch": 365} {"train_loss": -5.258859634399414, "global_step": 15362, "epoch": 365} {"train_loss": -5.1672043800354, "global_step": 15363, "epoch": 365} {"train_loss": -5.107053756713867, "global_step": 15364, "epoch": 365} {"train_loss": -5.154524803161621, "global_step": 15365, "epoch": 365} {"train_loss": -5.250646591186523, "global_step": 15366, "epoch": 365} {"train_loss": -5.239175796508789, "global_step": 15367, "epoch": 365} {"train_loss": -5.227313041687012, "global_step": 15368, "epoch": 365} {"train_loss": -5.2406086921691895, "global_step": 15369, "epoch": 365} {"train_loss": -5.176235198974609, "global_step": 15370, "epoch": 365} {"train_loss": -5.162371056420462, "global_step": 15371, "epoch": 365, "val_loss": 78418.3203125} {"train_loss": -5.157685279846191, "global_step": 15372, "epoch": 366} {"train_loss": -5.215227127075195, "global_step": 15373, "epoch": 366} {"train_loss": -5.184185028076172, "global_step": 15374, "epoch": 366} {"train_loss": -5.189823150634766, "global_step": 15375, "epoch": 366} {"train_loss": -5.2004075050354, "global_step": 15376, "epoch": 366} {"train_loss": -5.265852928161621, "global_step": 15377, "epoch": 366} {"train_loss": -5.060596466064453, "global_step": 15378, "epoch": 366} {"train_loss": -5.00193977355957, "global_step": 15379, "epoch": 366} {"train_loss": -5.12880802154541, "global_step": 15380, "epoch": 366} {"train_loss": -5.30363655090332, "global_step": 15381, "epoch": 366} {"train_loss": -5.197955131530762, "global_step": 15382, "epoch": 366} {"train_loss": -5.2021942138671875, "global_step": 15383, "epoch": 366} {"train_loss": -5.291136741638184, "global_step": 15384, "epoch": 366} {"train_loss": -5.034397125244141, "global_step": 15385, "epoch": 366} {"train_loss": -5.202454566955566, "global_step": 15386, "epoch": 366} {"train_loss": -5.201192855834961, "global_step": 15387, "epoch": 366} {"train_loss": -5.1785407066345215, "global_step": 15388, "epoch": 366} {"train_loss": -5.180890083312988, "global_step": 15389, "epoch": 366} {"train_loss": -5.162674903869629, "global_step": 15390, "epoch": 366} {"train_loss": -5.20543098449707, "global_step": 15391, "epoch": 366} {"train_loss": -5.281369209289551, "global_step": 15392, "epoch": 366} {"train_loss": -5.1956000328063965, "global_step": 15393, "epoch": 366} {"train_loss": -5.1750640869140625, "global_step": 15394, "epoch": 366} {"train_loss": -5.1505842208862305, "global_step": 15395, "epoch": 366} {"train_loss": -5.020366191864014, "global_step": 15396, "epoch": 366} {"train_loss": -5.347568511962891, "global_step": 15397, "epoch": 366} {"train_loss": -5.095521926879883, "global_step": 15398, "epoch": 366} {"train_loss": -5.158587455749512, "global_step": 15399, "epoch": 366} {"train_loss": -5.234370231628418, "global_step": 15400, "epoch": 366} {"train_loss": -5.210719108581543, "global_step": 15401, "epoch": 366} {"train_loss": -5.042055130004883, "global_step": 15402, "epoch": 366} {"train_loss": -5.2446136474609375, "global_step": 15403, "epoch": 366} {"train_loss": -5.035923004150391, "global_step": 15404, "epoch": 366} {"train_loss": -5.041205406188965, "global_step": 15405, "epoch": 366} {"train_loss": -5.157532691955566, "global_step": 15406, "epoch": 366} {"train_loss": -5.133270740509033, "global_step": 15407, "epoch": 366} {"train_loss": -5.228381156921387, "global_step": 15408, "epoch": 366} {"train_loss": -5.24729061126709, "global_step": 15409, "epoch": 366} {"train_loss": -5.036245346069336, "global_step": 15410, "epoch": 366} {"train_loss": -5.179300308227539, "global_step": 15411, "epoch": 366} {"train_loss": -5.107410430908203, "global_step": 15412, "epoch": 366} {"train_loss": -5.166668051765079, "global_step": 15413, "epoch": 366, "val_loss": 78243.7421875} {"train_loss": -5.116593360900879, "global_step": 15414, "epoch": 367} {"train_loss": -5.04880428314209, "global_step": 15415, "epoch": 367} {"train_loss": -5.1957550048828125, "global_step": 15416, "epoch": 367} {"train_loss": -5.234482765197754, "global_step": 15417, "epoch": 367} {"train_loss": -5.180150985717773, "global_step": 15418, "epoch": 367} {"train_loss": -5.259768486022949, "global_step": 15419, "epoch": 367} {"train_loss": -5.172272682189941, "global_step": 15420, "epoch": 367} {"train_loss": -5.178482532501221, "global_step": 15421, "epoch": 367} {"train_loss": -5.289818286895752, "global_step": 15422, "epoch": 367} {"train_loss": -5.060423851013184, "global_step": 15423, "epoch": 367} {"train_loss": -5.164697647094727, "global_step": 15424, "epoch": 367} {"train_loss": -5.363748550415039, "global_step": 15425, "epoch": 367} {"train_loss": -5.0835041999816895, "global_step": 15426, "epoch": 367} {"train_loss": -5.196015357971191, "global_step": 15427, "epoch": 367} {"train_loss": -5.095541954040527, "global_step": 15428, "epoch": 367} {"train_loss": -5.019979476928711, "global_step": 15429, "epoch": 367} {"train_loss": -5.184162139892578, "global_step": 15430, "epoch": 367} {"train_loss": -5.046885967254639, "global_step": 15431, "epoch": 367} {"train_loss": -5.094167232513428, "global_step": 15432, "epoch": 367} {"train_loss": -5.286764144897461, "global_step": 15433, "epoch": 367} {"train_loss": -5.137324333190918, "global_step": 15434, "epoch": 367} {"train_loss": -5.103110313415527, "global_step": 15435, "epoch": 367} {"train_loss": -5.325000286102295, "global_step": 15436, "epoch": 367} {"train_loss": -5.117602825164795, "global_step": 15437, "epoch": 367} {"train_loss": -5.187523365020752, "global_step": 15438, "epoch": 367} {"train_loss": -5.141523361206055, "global_step": 15439, "epoch": 367} {"train_loss": -5.126462936401367, "global_step": 15440, "epoch": 367} {"train_loss": -5.298851013183594, "global_step": 15441, "epoch": 367} {"train_loss": -5.150489807128906, "global_step": 15442, "epoch": 367} {"train_loss": -5.060187816619873, "global_step": 15443, "epoch": 367} {"train_loss": -5.241892337799072, "global_step": 15444, "epoch": 367} {"train_loss": -5.229039192199707, "global_step": 15445, "epoch": 367} {"train_loss": -5.1935529708862305, "global_step": 15446, "epoch": 367} {"train_loss": -5.226291179656982, "global_step": 15447, "epoch": 367} {"train_loss": -5.278160095214844, "global_step": 15448, "epoch": 367} {"train_loss": -5.362643718719482, "global_step": 15449, "epoch": 367} {"train_loss": -5.166345596313477, "global_step": 15450, "epoch": 367} {"train_loss": -5.06486701965332, "global_step": 15451, "epoch": 367} {"train_loss": -5.256955146789551, "global_step": 15452, "epoch": 367} {"train_loss": -5.255153656005859, "global_step": 15453, "epoch": 367} {"train_loss": -5.027732849121094, "global_step": 15454, "epoch": 367} {"train_loss": -5.17631181081136, "global_step": 15455, "epoch": 367, "val_loss": 78561.28125} {"train_loss": -5.0528435707092285, "global_step": 15456, "epoch": 368} {"train_loss": -5.066580772399902, "global_step": 15457, "epoch": 368} {"train_loss": -5.252840042114258, "global_step": 15458, "epoch": 368} {"train_loss": -5.058755874633789, "global_step": 15459, "epoch": 368} {"train_loss": -5.027853965759277, "global_step": 15460, "epoch": 368} {"train_loss": -5.073641300201416, "global_step": 15461, "epoch": 368} {"train_loss": -5.035193920135498, "global_step": 15462, "epoch": 368} {"train_loss": -5.057858467102051, "global_step": 15463, "epoch": 368} {"train_loss": -5.3091959953308105, "global_step": 15464, "epoch": 368} {"train_loss": -5.101031303405762, "global_step": 15465, "epoch": 368} {"train_loss": -5.224787712097168, "global_step": 15466, "epoch": 368} {"train_loss": -5.099709510803223, "global_step": 15467, "epoch": 368} {"train_loss": -5.081934928894043, "global_step": 15468, "epoch": 368} {"train_loss": -5.2016730308532715, "global_step": 15469, "epoch": 368} {"train_loss": -5.024044513702393, "global_step": 15470, "epoch": 368} {"train_loss": -5.15368127822876, "global_step": 15471, "epoch": 368} {"train_loss": -5.2420125007629395, "global_step": 15472, "epoch": 368} {"train_loss": -5.039210319519043, "global_step": 15473, "epoch": 368} {"train_loss": -5.216249465942383, "global_step": 15474, "epoch": 368} {"train_loss": -5.183744430541992, "global_step": 15475, "epoch": 368} {"train_loss": -5.260122299194336, "global_step": 15476, "epoch": 368} {"train_loss": -5.266744136810303, "global_step": 15477, "epoch": 368} {"train_loss": -5.168893814086914, "global_step": 15478, "epoch": 368} {"train_loss": -5.194785118103027, "global_step": 15479, "epoch": 368} {"train_loss": -5.124304294586182, "global_step": 15480, "epoch": 368} {"train_loss": -5.110760688781738, "global_step": 15481, "epoch": 368} {"train_loss": -5.17538595199585, "global_step": 15482, "epoch": 368} {"train_loss": -5.329302787780762, "global_step": 15483, "epoch": 368} {"train_loss": -5.220340251922607, "global_step": 15484, "epoch": 368} {"train_loss": -5.396246910095215, "global_step": 15485, "epoch": 368} {"train_loss": -5.254756927490234, "global_step": 15486, "epoch": 368} {"train_loss": -5.260615348815918, "global_step": 15487, "epoch": 368} {"train_loss": -5.170266628265381, "global_step": 15488, "epoch": 368} {"train_loss": -5.168466567993164, "global_step": 15489, "epoch": 368} {"train_loss": -5.05870246887207, "global_step": 15490, "epoch": 368} {"train_loss": -5.108818054199219, "global_step": 15491, "epoch": 368} {"train_loss": -5.270503044128418, "global_step": 15492, "epoch": 368} {"train_loss": -5.230342864990234, "global_step": 15493, "epoch": 368} {"train_loss": -5.030490875244141, "global_step": 15494, "epoch": 368} {"train_loss": -5.197364807128906, "global_step": 15495, "epoch": 368} {"train_loss": -5.168695449829102, "global_step": 15496, "epoch": 368} {"train_loss": -5.161827325820923, "global_step": 15497, "epoch": 368, "val_loss": 78456.5859375} {"train_loss": -5.209301948547363, "global_step": 15498, "epoch": 369} {"train_loss": -5.295474052429199, "global_step": 15499, "epoch": 369} {"train_loss": -5.15187931060791, "global_step": 15500, "epoch": 369} {"train_loss": -5.179917335510254, "global_step": 15501, "epoch": 369} {"train_loss": -5.177753448486328, "global_step": 15502, "epoch": 369} {"train_loss": -5.328317642211914, "global_step": 15503, "epoch": 369} {"train_loss": -5.207177639007568, "global_step": 15504, "epoch": 369} {"train_loss": -5.353790283203125, "global_step": 15505, "epoch": 369} {"train_loss": -5.257082462310791, "global_step": 15506, "epoch": 369} {"train_loss": -5.241931438446045, "global_step": 15507, "epoch": 369} {"train_loss": -5.16847038269043, "global_step": 15508, "epoch": 369} {"train_loss": -5.002774715423584, "global_step": 15509, "epoch": 369} {"train_loss": -5.227797031402588, "global_step": 15510, "epoch": 369} {"train_loss": -5.266475677490234, "global_step": 15511, "epoch": 369} {"train_loss": -5.22522497177124, "global_step": 15512, "epoch": 369} {"train_loss": -5.236702919006348, "global_step": 15513, "epoch": 369} {"train_loss": -5.189707279205322, "global_step": 15514, "epoch": 369} {"train_loss": -5.306704044342041, "global_step": 15515, "epoch": 369} {"train_loss": -5.17466926574707, "global_step": 15516, "epoch": 369} {"train_loss": -5.216235637664795, "global_step": 15517, "epoch": 369} {"train_loss": -5.237452507019043, "global_step": 15518, "epoch": 369} {"train_loss": -5.258596897125244, "global_step": 15519, "epoch": 369} {"train_loss": -5.124688148498535, "global_step": 15520, "epoch": 369} {"train_loss": -5.405500411987305, "global_step": 15521, "epoch": 369} {"train_loss": -5.213886260986328, "global_step": 15522, "epoch": 369} {"train_loss": -5.1143951416015625, "global_step": 15523, "epoch": 369} {"train_loss": -5.0525007247924805, "global_step": 15524, "epoch": 369} {"train_loss": -5.195346832275391, "global_step": 15525, "epoch": 369} {"train_loss": -5.326592445373535, "global_step": 15526, "epoch": 369} {"train_loss": -5.219315528869629, "global_step": 15527, "epoch": 369} {"train_loss": -5.137859344482422, "global_step": 15528, "epoch": 369} {"train_loss": -5.285712242126465, "global_step": 15529, "epoch": 369} {"train_loss": -5.259370803833008, "global_step": 15530, "epoch": 369} {"train_loss": -5.302107810974121, "global_step": 15531, "epoch": 369} {"train_loss": -5.138093948364258, "global_step": 15532, "epoch": 369} {"train_loss": -5.252536773681641, "global_step": 15533, "epoch": 369} {"train_loss": -5.1103057861328125, "global_step": 15534, "epoch": 369} {"train_loss": -5.152941703796387, "global_step": 15535, "epoch": 369} {"train_loss": -5.256387710571289, "global_step": 15536, "epoch": 369} {"train_loss": -5.205052375793457, "global_step": 15537, "epoch": 369} {"train_loss": -5.360265731811523, "global_step": 15538, "epoch": 369} {"train_loss": -5.221982365562802, "global_step": 15539, "epoch": 369, "val_loss": 78331.7578125} {"train_loss": -5.194366455078125, "global_step": 15540, "epoch": 370} {"train_loss": -5.2233991622924805, "global_step": 15541, "epoch": 370} {"train_loss": -5.232521057128906, "global_step": 15542, "epoch": 370} {"train_loss": -5.152465343475342, "global_step": 15543, "epoch": 370} {"train_loss": -5.118430137634277, "global_step": 15544, "epoch": 370} {"train_loss": -5.042581558227539, "global_step": 15545, "epoch": 370} {"train_loss": -5.306529998779297, "global_step": 15546, "epoch": 370} {"train_loss": -5.228748321533203, "global_step": 15547, "epoch": 370} {"train_loss": -5.222458839416504, "global_step": 15548, "epoch": 370} {"train_loss": -5.140611171722412, "global_step": 15549, "epoch": 370} {"train_loss": -5.300909042358398, "global_step": 15550, "epoch": 370} {"train_loss": -5.347939968109131, "global_step": 15551, "epoch": 370} {"train_loss": -5.188644886016846, "global_step": 15552, "epoch": 370} {"train_loss": -5.256592273712158, "global_step": 15553, "epoch": 370} {"train_loss": -5.232428550720215, "global_step": 15554, "epoch": 370} {"train_loss": -5.30670166015625, "global_step": 15555, "epoch": 370} {"train_loss": -5.200573921203613, "global_step": 15556, "epoch": 370} {"train_loss": -5.162120819091797, "global_step": 15557, "epoch": 370} {"train_loss": -5.082405090332031, "global_step": 15558, "epoch": 370} {"train_loss": -5.267294883728027, "global_step": 15559, "epoch": 370} {"train_loss": -5.176370620727539, "global_step": 15560, "epoch": 370} {"train_loss": -5.250688552856445, "global_step": 15561, "epoch": 370} {"train_loss": -5.273808479309082, "global_step": 15562, "epoch": 370} {"train_loss": -5.101822853088379, "global_step": 15563, "epoch": 370} {"train_loss": -5.199282169342041, "global_step": 15564, "epoch": 370} {"train_loss": -5.180635929107666, "global_step": 15565, "epoch": 370} {"train_loss": -5.156113147735596, "global_step": 15566, "epoch": 370} {"train_loss": -5.220238208770752, "global_step": 15567, "epoch": 370} {"train_loss": -5.208830833435059, "global_step": 15568, "epoch": 370} {"train_loss": -5.1624579429626465, "global_step": 15569, "epoch": 370} {"train_loss": -5.037318229675293, "global_step": 15570, "epoch": 370} {"train_loss": -5.121725082397461, "global_step": 15571, "epoch": 370} {"train_loss": -5.2476396560668945, "global_step": 15572, "epoch": 370} {"train_loss": -5.24589729309082, "global_step": 15573, "epoch": 370} {"train_loss": -5.040531158447266, "global_step": 15574, "epoch": 370} {"train_loss": -5.225898742675781, "global_step": 15575, "epoch": 370} {"train_loss": -5.3083391189575195, "global_step": 15576, "epoch": 370} {"train_loss": -5.151932716369629, "global_step": 15577, "epoch": 370} {"train_loss": -5.332485198974609, "global_step": 15578, "epoch": 370} {"train_loss": -5.224269866943359, "global_step": 15579, "epoch": 370} {"train_loss": -5.274725914001465, "global_step": 15580, "epoch": 370} {"train_loss": -5.203088363011678, "global_step": 15581, "epoch": 370, "val_loss": 78492.6640625} {"train_loss": -5.21577262878418, "global_step": 15582, "epoch": 371} {"train_loss": -5.29050350189209, "global_step": 15583, "epoch": 371} {"train_loss": -5.216031074523926, "global_step": 15584, "epoch": 371} {"train_loss": -5.289426803588867, "global_step": 15585, "epoch": 371} {"train_loss": -5.302660942077637, "global_step": 15586, "epoch": 371} {"train_loss": -5.268406391143799, "global_step": 15587, "epoch": 371} {"train_loss": -5.141660690307617, "global_step": 15588, "epoch": 371} {"train_loss": -5.15866756439209, "global_step": 15589, "epoch": 371} {"train_loss": -5.159690856933594, "global_step": 15590, "epoch": 371} {"train_loss": -5.165840148925781, "global_step": 15591, "epoch": 371} {"train_loss": -5.300912857055664, "global_step": 15592, "epoch": 371} {"train_loss": -5.129342079162598, "global_step": 15593, "epoch": 371} {"train_loss": -5.259735107421875, "global_step": 15594, "epoch": 371} {"train_loss": -5.241596698760986, "global_step": 15595, "epoch": 371} {"train_loss": -5.339687347412109, "global_step": 15596, "epoch": 371} {"train_loss": -5.173455238342285, "global_step": 15597, "epoch": 371} {"train_loss": -5.133164882659912, "global_step": 15598, "epoch": 371} {"train_loss": -5.134739875793457, "global_step": 15599, "epoch": 371} {"train_loss": -5.212337493896484, "global_step": 15600, "epoch": 371} {"train_loss": -5.200980186462402, "global_step": 15601, "epoch": 371} {"train_loss": -5.182406902313232, "global_step": 15602, "epoch": 371} {"train_loss": -5.06775426864624, "global_step": 15603, "epoch": 371} {"train_loss": -5.276795387268066, "global_step": 15604, "epoch": 371} {"train_loss": -5.369891166687012, "global_step": 15605, "epoch": 371} {"train_loss": -5.228984355926514, "global_step": 15606, "epoch": 371} {"train_loss": -5.100688457489014, "global_step": 15607, "epoch": 371} {"train_loss": -5.270263671875, "global_step": 15608, "epoch": 371} {"train_loss": -5.1128010749816895, "global_step": 15609, "epoch": 371} {"train_loss": -4.996495723724365, "global_step": 15610, "epoch": 371} {"train_loss": -5.102234840393066, "global_step": 15611, "epoch": 371} {"train_loss": -5.218305587768555, "global_step": 15612, "epoch": 371} {"train_loss": -5.090309143066406, "global_step": 15613, "epoch": 371} {"train_loss": -5.1951751708984375, "global_step": 15614, "epoch": 371} {"train_loss": -5.272547721862793, "global_step": 15615, "epoch": 371} {"train_loss": -5.070217132568359, "global_step": 15616, "epoch": 371} {"train_loss": -5.111937522888184, "global_step": 15617, "epoch": 371} {"train_loss": -5.388184070587158, "global_step": 15618, "epoch": 371} {"train_loss": -5.166626930236816, "global_step": 15619, "epoch": 371} {"train_loss": -5.137441635131836, "global_step": 15620, "epoch": 371} {"train_loss": -5.184658050537109, "global_step": 15621, "epoch": 371} {"train_loss": -5.167187690734863, "global_step": 15622, "epoch": 371} {"train_loss": -5.19267970039731, "global_step": 15623, "epoch": 371, "val_loss": 78784.09375} {"train_loss": -5.200193405151367, "global_step": 15624, "epoch": 372} {"train_loss": -5.0187602043151855, "global_step": 15625, "epoch": 372} {"train_loss": -5.194023132324219, "global_step": 15626, "epoch": 372} {"train_loss": -5.094565391540527, "global_step": 15627, "epoch": 372} {"train_loss": -5.1311750411987305, "global_step": 15628, "epoch": 372} {"train_loss": -5.164771556854248, "global_step": 15629, "epoch": 372} {"train_loss": -5.016246795654297, "global_step": 15630, "epoch": 372} {"train_loss": -5.168063640594482, "global_step": 15631, "epoch": 372} {"train_loss": -5.0479631423950195, "global_step": 15632, "epoch": 372} {"train_loss": -5.204160690307617, "global_step": 15633, "epoch": 372} {"train_loss": -5.1421966552734375, "global_step": 15634, "epoch": 372} {"train_loss": -5.030252933502197, "global_step": 15635, "epoch": 372} {"train_loss": -5.355834007263184, "global_step": 15636, "epoch": 372} {"train_loss": -5.196358680725098, "global_step": 15637, "epoch": 372} {"train_loss": -5.145346641540527, "global_step": 15638, "epoch": 372} {"train_loss": -5.201589584350586, "global_step": 15639, "epoch": 372} {"train_loss": -5.282639503479004, "global_step": 15640, "epoch": 372} {"train_loss": -5.200708389282227, "global_step": 15641, "epoch": 372} {"train_loss": -5.232303619384766, "global_step": 15642, "epoch": 372} {"train_loss": -5.212136268615723, "global_step": 15643, "epoch": 372} {"train_loss": -5.191450595855713, "global_step": 15644, "epoch": 372} {"train_loss": -5.264986991882324, "global_step": 15645, "epoch": 372} {"train_loss": -5.18959903717041, "global_step": 15646, "epoch": 372} {"train_loss": -5.19241189956665, "global_step": 15647, "epoch": 372} {"train_loss": -5.196628570556641, "global_step": 15648, "epoch": 372} {"train_loss": -5.260304927825928, "global_step": 15649, "epoch": 372} {"train_loss": -5.271312713623047, "global_step": 15650, "epoch": 372} {"train_loss": -5.199204921722412, "global_step": 15651, "epoch": 372} {"train_loss": -5.232028484344482, "global_step": 15652, "epoch": 372} {"train_loss": -5.1432952880859375, "global_step": 15653, "epoch": 372} {"train_loss": -5.264450550079346, "global_step": 15654, "epoch": 372} {"train_loss": -5.261338233947754, "global_step": 15655, "epoch": 372} {"train_loss": -5.294023513793945, "global_step": 15656, "epoch": 372} {"train_loss": -5.30619478225708, "global_step": 15657, "epoch": 372} {"train_loss": -5.146036148071289, "global_step": 15658, "epoch": 372} {"train_loss": -5.264970779418945, "global_step": 15659, "epoch": 372} {"train_loss": -5.181390285491943, "global_step": 15660, "epoch": 372} {"train_loss": -5.047859191894531, "global_step": 15661, "epoch": 372} {"train_loss": -5.315369606018066, "global_step": 15662, "epoch": 372} {"train_loss": -5.0733418464660645, "global_step": 15663, "epoch": 372} {"train_loss": -5.0992536544799805, "global_step": 15664, "epoch": 372} {"train_loss": -5.186499277750651, "global_step": 15665, "epoch": 372, "val_loss": 79173.96875} {"train_loss": -5.154553413391113, "global_step": 15666, "epoch": 373} {"train_loss": -5.158334255218506, "global_step": 15667, "epoch": 373} {"train_loss": -5.271676063537598, "global_step": 15668, "epoch": 373} {"train_loss": -5.265093803405762, "global_step": 15669, "epoch": 373} {"train_loss": -5.210419654846191, "global_step": 15670, "epoch": 373} {"train_loss": -5.144863128662109, "global_step": 15671, "epoch": 373} {"train_loss": -5.29160213470459, "global_step": 15672, "epoch": 373} {"train_loss": -5.133874893188477, "global_step": 15673, "epoch": 373} {"train_loss": -5.135627269744873, "global_step": 15674, "epoch": 373} {"train_loss": -5.2868757247924805, "global_step": 15675, "epoch": 373} {"train_loss": -5.239415168762207, "global_step": 15676, "epoch": 373} {"train_loss": -5.174190044403076, "global_step": 15677, "epoch": 373} {"train_loss": -5.160494804382324, "global_step": 15678, "epoch": 373} {"train_loss": -5.232876777648926, "global_step": 15679, "epoch": 373} {"train_loss": -5.048643112182617, "global_step": 15680, "epoch": 373} {"train_loss": -5.053355693817139, "global_step": 15681, "epoch": 373} {"train_loss": -5.287461757659912, "global_step": 15682, "epoch": 373} {"train_loss": -5.156192779541016, "global_step": 15683, "epoch": 373} {"train_loss": -4.983788013458252, "global_step": 15684, "epoch": 373} {"train_loss": -5.194775104522705, "global_step": 15685, "epoch": 373} {"train_loss": -5.199008941650391, "global_step": 15686, "epoch": 373} {"train_loss": -5.146300792694092, "global_step": 15687, "epoch": 373} {"train_loss": -5.19151496887207, "global_step": 15688, "epoch": 373} {"train_loss": -5.207550525665283, "global_step": 15689, "epoch": 373} {"train_loss": -5.132601737976074, "global_step": 15690, "epoch": 373} {"train_loss": -5.209851264953613, "global_step": 15691, "epoch": 373} {"train_loss": -5.131315231323242, "global_step": 15692, "epoch": 373} {"train_loss": -5.13987922668457, "global_step": 15693, "epoch": 373} {"train_loss": -5.346458435058594, "global_step": 15694, "epoch": 373} {"train_loss": -5.297427177429199, "global_step": 15695, "epoch": 373} {"train_loss": -5.3040313720703125, "global_step": 15696, "epoch": 373} {"train_loss": -5.237517356872559, "global_step": 15697, "epoch": 373} {"train_loss": -5.262820720672607, "global_step": 15698, "epoch": 373} {"train_loss": -5.183626651763916, "global_step": 15699, "epoch": 373} {"train_loss": -5.311746120452881, "global_step": 15700, "epoch": 373} {"train_loss": -5.266924858093262, "global_step": 15701, "epoch": 373} {"train_loss": -5.310003757476807, "global_step": 15702, "epoch": 373} {"train_loss": -5.1479082107543945, "global_step": 15703, "epoch": 373} {"train_loss": -5.1399641036987305, "global_step": 15704, "epoch": 373} {"train_loss": -5.14030647277832, "global_step": 15705, "epoch": 373} {"train_loss": -5.10919713973999, "global_step": 15706, "epoch": 373} {"train_loss": -5.195648340951829, "global_step": 15707, "epoch": 373, "val_loss": 78532.34375} {"train_loss": -5.230283737182617, "global_step": 15708, "epoch": 374} {"train_loss": -5.1846089363098145, "global_step": 15709, "epoch": 374} {"train_loss": -5.138059139251709, "global_step": 15710, "epoch": 374} {"train_loss": -5.124803066253662, "global_step": 15711, "epoch": 374} {"train_loss": -4.9721269607543945, "global_step": 15712, "epoch": 374} {"train_loss": -5.161898612976074, "global_step": 15713, "epoch": 374} {"train_loss": -5.040823459625244, "global_step": 15714, "epoch": 374} {"train_loss": -5.168516159057617, "global_step": 15715, "epoch": 374} {"train_loss": -5.20139217376709, "global_step": 15716, "epoch": 374} {"train_loss": -5.046722888946533, "global_step": 15717, "epoch": 374} {"train_loss": -5.149735450744629, "global_step": 15718, "epoch": 374} {"train_loss": -5.062796592712402, "global_step": 15719, "epoch": 374} {"train_loss": -5.181917190551758, "global_step": 15720, "epoch": 374} {"train_loss": -5.143360137939453, "global_step": 15721, "epoch": 374} {"train_loss": -5.233272552490234, "global_step": 15722, "epoch": 374} {"train_loss": -5.004997730255127, "global_step": 15723, "epoch": 374} {"train_loss": -5.131601333618164, "global_step": 15724, "epoch": 374} {"train_loss": -5.313229560852051, "global_step": 15725, "epoch": 374} {"train_loss": -5.173443794250488, "global_step": 15726, "epoch": 374} {"train_loss": -5.175566673278809, "global_step": 15727, "epoch": 374} {"train_loss": -5.242044448852539, "global_step": 15728, "epoch": 374} {"train_loss": -5.143124580383301, "global_step": 15729, "epoch": 374} {"train_loss": -5.332908630371094, "global_step": 15730, "epoch": 374} {"train_loss": -5.209423542022705, "global_step": 15731, "epoch": 374} {"train_loss": -5.214325904846191, "global_step": 15732, "epoch": 374} {"train_loss": -5.251996040344238, "global_step": 15733, "epoch": 374} {"train_loss": -5.307236671447754, "global_step": 15734, "epoch": 374} {"train_loss": -5.1850481033325195, "global_step": 15735, "epoch": 374} {"train_loss": -5.170101165771484, "global_step": 15736, "epoch": 374} {"train_loss": -5.359984874725342, "global_step": 15737, "epoch": 374} {"train_loss": -5.0858893394470215, "global_step": 15738, "epoch": 374} {"train_loss": -5.115234375, "global_step": 15739, "epoch": 374} {"train_loss": -5.193441867828369, "global_step": 15740, "epoch": 374} {"train_loss": -5.150215148925781, "global_step": 15741, "epoch": 374} {"train_loss": -5.139252185821533, "global_step": 15742, "epoch": 374} {"train_loss": -5.173076629638672, "global_step": 15743, "epoch": 374} {"train_loss": -5.371991157531738, "global_step": 15744, "epoch": 374} {"train_loss": -5.080451011657715, "global_step": 15745, "epoch": 374} {"train_loss": -5.194099426269531, "global_step": 15746, "epoch": 374} {"train_loss": -5.193943023681641, "global_step": 15747, "epoch": 374} {"train_loss": -5.088918685913086, "global_step": 15748, "epoch": 374} {"train_loss": -5.169511045728411, "global_step": 15749, "epoch": 374, "val_loss": 78986.7109375} {"train_loss": -5.194154739379883, "global_step": 15750, "epoch": 375} {"train_loss": -5.183429718017578, "global_step": 15751, "epoch": 375} {"train_loss": -5.180376052856445, "global_step": 15752, "epoch": 375} {"train_loss": -5.22914457321167, "global_step": 15753, "epoch": 375} {"train_loss": -5.058609962463379, "global_step": 15754, "epoch": 375} {"train_loss": -5.225022315979004, "global_step": 15755, "epoch": 375} {"train_loss": -5.171938419342041, "global_step": 15756, "epoch": 375} {"train_loss": -5.007620811462402, "global_step": 15757, "epoch": 375} {"train_loss": -5.341648101806641, "global_step": 15758, "epoch": 375} {"train_loss": -5.10658073425293, "global_step": 15759, "epoch": 375} {"train_loss": -5.119747161865234, "global_step": 15760, "epoch": 375} {"train_loss": -5.205195426940918, "global_step": 15761, "epoch": 375} {"train_loss": -5.183629989624023, "global_step": 15762, "epoch": 375} {"train_loss": -5.280413627624512, "global_step": 15763, "epoch": 375} {"train_loss": -5.106445789337158, "global_step": 15764, "epoch": 375} {"train_loss": -5.289705276489258, "global_step": 15765, "epoch": 375} {"train_loss": -5.288815498352051, "global_step": 15766, "epoch": 375} {"train_loss": -4.950068473815918, "global_step": 15767, "epoch": 375} {"train_loss": -5.318507194519043, "global_step": 15768, "epoch": 375} {"train_loss": -5.280993461608887, "global_step": 15769, "epoch": 375} {"train_loss": -5.118154525756836, "global_step": 15770, "epoch": 375} {"train_loss": -5.275823593139648, "global_step": 15771, "epoch": 375} {"train_loss": -5.1283674240112305, "global_step": 15772, "epoch": 375} {"train_loss": -5.0774688720703125, "global_step": 15773, "epoch": 375} {"train_loss": -5.125495433807373, "global_step": 15774, "epoch": 375} {"train_loss": -5.168663501739502, "global_step": 15775, "epoch": 375} {"train_loss": -5.217462539672852, "global_step": 15776, "epoch": 375} {"train_loss": -5.233490467071533, "global_step": 15777, "epoch": 375} {"train_loss": -5.165947437286377, "global_step": 15778, "epoch": 375} {"train_loss": -5.185561180114746, "global_step": 15779, "epoch": 375} {"train_loss": -5.184345722198486, "global_step": 15780, "epoch": 375} {"train_loss": -5.179596900939941, "global_step": 15781, "epoch": 375} {"train_loss": -5.095586776733398, "global_step": 15782, "epoch": 375} {"train_loss": -5.246594429016113, "global_step": 15783, "epoch": 375} {"train_loss": -5.2243547439575195, "global_step": 15784, "epoch": 375} {"train_loss": -5.197576522827148, "global_step": 15785, "epoch": 375} {"train_loss": -5.267621994018555, "global_step": 15786, "epoch": 375} {"train_loss": -5.2293267250061035, "global_step": 15787, "epoch": 375} {"train_loss": -5.1158976554870605, "global_step": 15788, "epoch": 375} {"train_loss": -5.298898696899414, "global_step": 15789, "epoch": 375} {"train_loss": -5.38831901550293, "global_step": 15790, "epoch": 375} {"train_loss": -5.193543797447568, "global_step": 15791, "epoch": 375, "val_loss": 78380.2890625} {"train_loss": -5.1259965896606445, "global_step": 15792, "epoch": 376} {"train_loss": -5.239543437957764, "global_step": 15793, "epoch": 376} {"train_loss": -5.369922161102295, "global_step": 15794, "epoch": 376} {"train_loss": -5.245150089263916, "global_step": 15795, "epoch": 376} {"train_loss": -5.075465679168701, "global_step": 15796, "epoch": 376} {"train_loss": -5.341212272644043, "global_step": 15797, "epoch": 376} {"train_loss": -5.269112586975098, "global_step": 15798, "epoch": 376} {"train_loss": -4.981667995452881, "global_step": 15799, "epoch": 376} {"train_loss": -5.30622673034668, "global_step": 15800, "epoch": 376} {"train_loss": -5.199728965759277, "global_step": 15801, "epoch": 376} {"train_loss": -4.851290225982666, "global_step": 15802, "epoch": 376} {"train_loss": -5.154680252075195, "global_step": 15803, "epoch": 376} {"train_loss": -4.969033718109131, "global_step": 15804, "epoch": 376} {"train_loss": -4.880139350891113, "global_step": 15805, "epoch": 376} {"train_loss": -5.052339553833008, "global_step": 15806, "epoch": 376} {"train_loss": -5.080007076263428, "global_step": 15807, "epoch": 376} {"train_loss": -5.204812049865723, "global_step": 15808, "epoch": 376} {"train_loss": -4.982213973999023, "global_step": 15809, "epoch": 376} {"train_loss": -5.1845903396606445, "global_step": 15810, "epoch": 376} {"train_loss": -5.235256195068359, "global_step": 15811, "epoch": 376} {"train_loss": -5.122556686401367, "global_step": 15812, "epoch": 376} {"train_loss": -5.298795700073242, "global_step": 15813, "epoch": 376} {"train_loss": -5.004264831542969, "global_step": 15814, "epoch": 376} {"train_loss": -5.077773094177246, "global_step": 15815, "epoch": 376} {"train_loss": -5.134764671325684, "global_step": 15816, "epoch": 376} {"train_loss": -5.128865718841553, "global_step": 15817, "epoch": 376} {"train_loss": -5.170389175415039, "global_step": 15818, "epoch": 376} {"train_loss": -5.223008632659912, "global_step": 15819, "epoch": 376} {"train_loss": -5.2091569900512695, "global_step": 15820, "epoch": 376} {"train_loss": -5.125471115112305, "global_step": 15821, "epoch": 376} {"train_loss": -5.2605133056640625, "global_step": 15822, "epoch": 376} {"train_loss": -5.108282089233398, "global_step": 15823, "epoch": 376} {"train_loss": -5.155940055847168, "global_step": 15824, "epoch": 376} {"train_loss": -5.239360332489014, "global_step": 15825, "epoch": 376} {"train_loss": -5.170809745788574, "global_step": 15826, "epoch": 376} {"train_loss": -5.278903007507324, "global_step": 15827, "epoch": 376} {"train_loss": -5.135166168212891, "global_step": 15828, "epoch": 376} {"train_loss": -5.292444229125977, "global_step": 15829, "epoch": 376} {"train_loss": -5.032973289489746, "global_step": 15830, "epoch": 376} {"train_loss": -5.2786993980407715, "global_step": 15831, "epoch": 376} {"train_loss": -5.1721086502075195, "global_step": 15832, "epoch": 376} {"train_loss": -5.155609233038766, "global_step": 15833, "epoch": 376, "val_loss": 77619.4140625} {"train_loss": -5.257147789001465, "global_step": 15834, "epoch": 377} {"train_loss": -5.17958402633667, "global_step": 15835, "epoch": 377} {"train_loss": -5.267288684844971, "global_step": 15836, "epoch": 377} {"train_loss": -5.200098514556885, "global_step": 15837, "epoch": 377} {"train_loss": -5.358119964599609, "global_step": 15838, "epoch": 377} {"train_loss": -5.138460159301758, "global_step": 15839, "epoch": 377} {"train_loss": -5.19972038269043, "global_step": 15840, "epoch": 377} {"train_loss": -5.077375411987305, "global_step": 15841, "epoch": 377} {"train_loss": -5.182324409484863, "global_step": 15842, "epoch": 377} {"train_loss": -5.14176082611084, "global_step": 15843, "epoch": 377} {"train_loss": -5.134722709655762, "global_step": 15844, "epoch": 377} {"train_loss": -5.191766738891602, "global_step": 15845, "epoch": 377} {"train_loss": -5.0705084800720215, "global_step": 15846, "epoch": 377} {"train_loss": -5.260369300842285, "global_step": 15847, "epoch": 377} {"train_loss": -4.9830121994018555, "global_step": 15848, "epoch": 377} {"train_loss": -5.018332004547119, "global_step": 15849, "epoch": 377} {"train_loss": -5.167399883270264, "global_step": 15850, "epoch": 377} {"train_loss": -5.1499433517456055, "global_step": 15851, "epoch": 377} {"train_loss": -5.200130462646484, "global_step": 15852, "epoch": 377} {"train_loss": -5.204465866088867, "global_step": 15853, "epoch": 377} {"train_loss": -5.164797782897949, "global_step": 15854, "epoch": 377} {"train_loss": -5.100544452667236, "global_step": 15855, "epoch": 377} {"train_loss": -5.214961051940918, "global_step": 15856, "epoch": 377} {"train_loss": -5.156125068664551, "global_step": 15857, "epoch": 377} {"train_loss": -5.236725807189941, "global_step": 15858, "epoch": 377} {"train_loss": -5.214980125427246, "global_step": 15859, "epoch": 377} {"train_loss": -5.233980178833008, "global_step": 15860, "epoch": 377} {"train_loss": -5.212014198303223, "global_step": 15861, "epoch": 377} {"train_loss": -5.245307922363281, "global_step": 15862, "epoch": 377} {"train_loss": -5.040150165557861, "global_step": 15863, "epoch": 377} {"train_loss": -5.200475692749023, "global_step": 15864, "epoch": 377} {"train_loss": -5.274226188659668, "global_step": 15865, "epoch": 377} {"train_loss": -5.161856651306152, "global_step": 15866, "epoch": 377} {"train_loss": -5.050043106079102, "global_step": 15867, "epoch": 377} {"train_loss": -5.083045959472656, "global_step": 15868, "epoch": 377} {"train_loss": -5.1546549797058105, "global_step": 15869, "epoch": 377} {"train_loss": -4.998175144195557, "global_step": 15870, "epoch": 377} {"train_loss": -5.252720832824707, "global_step": 15871, "epoch": 377} {"train_loss": -5.186770915985107, "global_step": 15872, "epoch": 377} {"train_loss": -5.046156883239746, "global_step": 15873, "epoch": 377} {"train_loss": -5.1157331466674805, "global_step": 15874, "epoch": 377} {"train_loss": -5.1630606424240835, "global_step": 15875, "epoch": 377, "val_loss": 78091.8828125} {"train_loss": -5.1093363761901855, "global_step": 15876, "epoch": 378} {"train_loss": -5.226669788360596, "global_step": 15877, "epoch": 378} {"train_loss": -5.067060470581055, "global_step": 15878, "epoch": 378} {"train_loss": -5.257787227630615, "global_step": 15879, "epoch": 378} {"train_loss": -5.0478363037109375, "global_step": 15880, "epoch": 378} {"train_loss": -5.233582496643066, "global_step": 15881, "epoch": 378} {"train_loss": -5.264062404632568, "global_step": 15882, "epoch": 378} {"train_loss": -5.186509609222412, "global_step": 15883, "epoch": 378} {"train_loss": -5.134355545043945, "global_step": 15884, "epoch": 378} {"train_loss": -5.145205497741699, "global_step": 15885, "epoch": 378} {"train_loss": -5.341851234436035, "global_step": 15886, "epoch": 378} {"train_loss": -5.249031066894531, "global_step": 15887, "epoch": 378} {"train_loss": -5.065600872039795, "global_step": 15888, "epoch": 378} {"train_loss": -5.199028015136719, "global_step": 15889, "epoch": 378} {"train_loss": -5.195723533630371, "global_step": 15890, "epoch": 378} {"train_loss": -5.311990737915039, "global_step": 15891, "epoch": 378} {"train_loss": -5.2274580001831055, "global_step": 15892, "epoch": 378} {"train_loss": -5.233449935913086, "global_step": 15893, "epoch": 378} {"train_loss": -5.2405548095703125, "global_step": 15894, "epoch": 378} {"train_loss": -5.121553421020508, "global_step": 15895, "epoch": 378} {"train_loss": -5.156747817993164, "global_step": 15896, "epoch": 378} {"train_loss": -5.375758171081543, "global_step": 15897, "epoch": 378} {"train_loss": -5.257636070251465, "global_step": 15898, "epoch": 378} {"train_loss": -5.1547322273254395, "global_step": 15899, "epoch": 378} {"train_loss": -5.2121262550354, "global_step": 15900, "epoch": 378} {"train_loss": -5.213226318359375, "global_step": 15901, "epoch": 378} {"train_loss": -5.1721577644348145, "global_step": 15902, "epoch": 378} {"train_loss": -5.297191143035889, "global_step": 15903, "epoch": 378} {"train_loss": -5.1952362060546875, "global_step": 15904, "epoch": 378} {"train_loss": -5.230217933654785, "global_step": 15905, "epoch": 378} {"train_loss": -5.125016212463379, "global_step": 15906, "epoch": 378} {"train_loss": -5.315375804901123, "global_step": 15907, "epoch": 378} {"train_loss": -5.078659534454346, "global_step": 15908, "epoch": 378} {"train_loss": -5.178096771240234, "global_step": 15909, "epoch": 378} {"train_loss": -5.094451904296875, "global_step": 15910, "epoch": 378} {"train_loss": -5.245617389678955, "global_step": 15911, "epoch": 378} {"train_loss": -5.22540283203125, "global_step": 15912, "epoch": 378} {"train_loss": -5.065132141113281, "global_step": 15913, "epoch": 378} {"train_loss": -5.221073627471924, "global_step": 15914, "epoch": 378} {"train_loss": -5.183600425720215, "global_step": 15915, "epoch": 378} {"train_loss": -5.096834182739258, "global_step": 15916, "epoch": 378} {"train_loss": -5.1957316398620605, "global_step": 15917, "epoch": 378, "val_loss": 77993.390625} {"train_loss": -5.2216901779174805, "global_step": 15918, "epoch": 379} {"train_loss": -5.227967262268066, "global_step": 15919, "epoch": 379} {"train_loss": -5.141173362731934, "global_step": 15920, "epoch": 379} {"train_loss": -5.1101813316345215, "global_step": 15921, "epoch": 379} {"train_loss": -5.138185501098633, "global_step": 15922, "epoch": 379} {"train_loss": -5.1127495765686035, "global_step": 15923, "epoch": 379} {"train_loss": -5.223025321960449, "global_step": 15924, "epoch": 379} {"train_loss": -5.115591049194336, "global_step": 15925, "epoch": 379} {"train_loss": -5.07020902633667, "global_step": 15926, "epoch": 379} {"train_loss": -5.0921831130981445, "global_step": 15927, "epoch": 379} {"train_loss": -5.205402374267578, "global_step": 15928, "epoch": 379} {"train_loss": -5.12673807144165, "global_step": 15929, "epoch": 379} {"train_loss": -5.260466575622559, "global_step": 15930, "epoch": 379} {"train_loss": -5.2281880378723145, "global_step": 15931, "epoch": 379} {"train_loss": -5.189261436462402, "global_step": 15932, "epoch": 379} {"train_loss": -5.166387557983398, "global_step": 15933, "epoch": 379} {"train_loss": -5.221853256225586, "global_step": 15934, "epoch": 379} {"train_loss": -5.2433671951293945, "global_step": 15935, "epoch": 379} {"train_loss": -5.282398223876953, "global_step": 15936, "epoch": 379} {"train_loss": -5.20859432220459, "global_step": 15937, "epoch": 379} {"train_loss": -5.264684677124023, "global_step": 15938, "epoch": 379} {"train_loss": -5.186349868774414, "global_step": 15939, "epoch": 379} {"train_loss": -5.278463840484619, "global_step": 15940, "epoch": 379} {"train_loss": -5.315519332885742, "global_step": 15941, "epoch": 379} {"train_loss": -5.118600368499756, "global_step": 15942, "epoch": 379} {"train_loss": -5.325221061706543, "global_step": 15943, "epoch": 379} {"train_loss": -5.211352348327637, "global_step": 15944, "epoch": 379} {"train_loss": -5.211313247680664, "global_step": 15945, "epoch": 379} {"train_loss": -5.1297430992126465, "global_step": 15946, "epoch": 379} {"train_loss": -5.309077262878418, "global_step": 15947, "epoch": 379} {"train_loss": -5.261772155761719, "global_step": 15948, "epoch": 379} {"train_loss": -5.267106533050537, "global_step": 15949, "epoch": 379} {"train_loss": -5.248282432556152, "global_step": 15950, "epoch": 379} {"train_loss": -5.196279048919678, "global_step": 15951, "epoch": 379} {"train_loss": -5.248287200927734, "global_step": 15952, "epoch": 379} {"train_loss": -5.225275039672852, "global_step": 15953, "epoch": 379} {"train_loss": -5.123297691345215, "global_step": 15954, "epoch": 379} {"train_loss": -5.014265537261963, "global_step": 15955, "epoch": 379} {"train_loss": -5.206263542175293, "global_step": 15956, "epoch": 379} {"train_loss": -5.121600151062012, "global_step": 15957, "epoch": 379} {"train_loss": -5.065415382385254, "global_step": 15958, "epoch": 379} {"train_loss": -5.1937358265831355, "global_step": 15959, "epoch": 379, "val_loss": 78280.515625} {"train_loss": -5.171250343322754, "global_step": 15960, "epoch": 380} {"train_loss": -5.140309810638428, "global_step": 15961, "epoch": 380} {"train_loss": -5.271512985229492, "global_step": 15962, "epoch": 380} {"train_loss": -5.071091651916504, "global_step": 15963, "epoch": 380} {"train_loss": -5.251260757446289, "global_step": 15964, "epoch": 380} {"train_loss": -5.162631511688232, "global_step": 15965, "epoch": 380} {"train_loss": -5.169075965881348, "global_step": 15966, "epoch": 380} {"train_loss": -5.177178382873535, "global_step": 15967, "epoch": 380} {"train_loss": -5.1832427978515625, "global_step": 15968, "epoch": 380} {"train_loss": -5.286169052124023, "global_step": 15969, "epoch": 380} {"train_loss": -5.2443671226501465, "global_step": 15970, "epoch": 380} {"train_loss": -5.408426761627197, "global_step": 15971, "epoch": 380} {"train_loss": -5.235726356506348, "global_step": 15972, "epoch": 380} {"train_loss": -5.259324073791504, "global_step": 15973, "epoch": 380} {"train_loss": -5.240751266479492, "global_step": 15974, "epoch": 380} {"train_loss": -5.139789581298828, "global_step": 15975, "epoch": 380} {"train_loss": -5.252862453460693, "global_step": 15976, "epoch": 380} {"train_loss": -5.2002458572387695, "global_step": 15977, "epoch": 380} {"train_loss": -5.202218532562256, "global_step": 15978, "epoch": 380} {"train_loss": -5.075047492980957, "global_step": 15979, "epoch": 380} {"train_loss": -5.19028377532959, "global_step": 15980, "epoch": 380} {"train_loss": -5.066825866699219, "global_step": 15981, "epoch": 380} {"train_loss": -4.832218170166016, "global_step": 15982, "epoch": 380} {"train_loss": -5.175868034362793, "global_step": 15983, "epoch": 380} {"train_loss": -5.174421787261963, "global_step": 15984, "epoch": 380} {"train_loss": -5.044844150543213, "global_step": 15985, "epoch": 380} {"train_loss": -4.9962849617004395, "global_step": 15986, "epoch": 380} {"train_loss": -5.074704170227051, "global_step": 15987, "epoch": 380} {"train_loss": -5.073822498321533, "global_step": 15988, "epoch": 380} {"train_loss": -5.18516731262207, "global_step": 15989, "epoch": 380} {"train_loss": -4.983590126037598, "global_step": 15990, "epoch": 380} {"train_loss": -5.227362155914307, "global_step": 15991, "epoch": 380} {"train_loss": -5.204957008361816, "global_step": 15992, "epoch": 380} {"train_loss": -5.226157188415527, "global_step": 15993, "epoch": 380} {"train_loss": -5.054244041442871, "global_step": 15994, "epoch": 380} {"train_loss": -5.110306739807129, "global_step": 15995, "epoch": 380} {"train_loss": -5.2132158279418945, "global_step": 15996, "epoch": 380} {"train_loss": -5.169719696044922, "global_step": 15997, "epoch": 380} {"train_loss": -5.207467079162598, "global_step": 15998, "epoch": 380} {"train_loss": -5.081737518310547, "global_step": 15999, "epoch": 380} {"train_loss": -5.123271942138672, "global_step": 16000, "epoch": 380} {"train_loss": -5.158116772061303, "global_step": 16001, "epoch": 380, "val_loss": 78107.7421875} {"train_loss": -5.134483337402344, "global_step": 16002, "epoch": 381} {"train_loss": -5.013110160827637, "global_step": 16003, "epoch": 381} {"train_loss": -5.072084426879883, "global_step": 16004, "epoch": 381} {"train_loss": -5.209770202636719, "global_step": 16005, "epoch": 381} {"train_loss": -5.120055198669434, "global_step": 16006, "epoch": 381} {"train_loss": -5.1353325843811035, "global_step": 16007, "epoch": 381} {"train_loss": -5.321163654327393, "global_step": 16008, "epoch": 381} {"train_loss": -5.256566047668457, "global_step": 16009, "epoch": 381} {"train_loss": -5.19835090637207, "global_step": 16010, "epoch": 381} {"train_loss": -5.14315128326416, "global_step": 16011, "epoch": 381} {"train_loss": -5.314833164215088, "global_step": 16012, "epoch": 381} {"train_loss": -5.246885299682617, "global_step": 16013, "epoch": 381} {"train_loss": -5.253710746765137, "global_step": 16014, "epoch": 381} {"train_loss": -4.935080528259277, "global_step": 16015, "epoch": 381} {"train_loss": -5.251670837402344, "global_step": 16016, "epoch": 381} {"train_loss": -5.22560977935791, "global_step": 16017, "epoch": 381} {"train_loss": -5.244359493255615, "global_step": 16018, "epoch": 381} {"train_loss": -5.303681373596191, "global_step": 16019, "epoch": 381} {"train_loss": -5.212734222412109, "global_step": 16020, "epoch": 381} {"train_loss": -5.191893100738525, "global_step": 16021, "epoch": 381} {"train_loss": -5.165826320648193, "global_step": 16022, "epoch": 381} {"train_loss": -5.370120048522949, "global_step": 16023, "epoch": 381} {"train_loss": -5.322805404663086, "global_step": 16024, "epoch": 381} {"train_loss": -5.223959922790527, "global_step": 16025, "epoch": 381} {"train_loss": -5.127367973327637, "global_step": 16026, "epoch": 381} {"train_loss": -5.190800666809082, "global_step": 16027, "epoch": 381} {"train_loss": -5.306600093841553, "global_step": 16028, "epoch": 381} {"train_loss": -5.154642581939697, "global_step": 16029, "epoch": 381} {"train_loss": -5.277478218078613, "global_step": 16030, "epoch": 381} {"train_loss": -5.132891654968262, "global_step": 16031, "epoch": 381} {"train_loss": -5.203658580780029, "global_step": 16032, "epoch": 381} {"train_loss": -5.192814826965332, "global_step": 16033, "epoch": 381} {"train_loss": -5.294685363769531, "global_step": 16034, "epoch": 381} {"train_loss": -5.223616600036621, "global_step": 16035, "epoch": 381} {"train_loss": -5.324435234069824, "global_step": 16036, "epoch": 381} {"train_loss": -5.192451000213623, "global_step": 16037, "epoch": 381} {"train_loss": -5.169882774353027, "global_step": 16038, "epoch": 381} {"train_loss": -5.151053428649902, "global_step": 16039, "epoch": 381} {"train_loss": -5.2311906814575195, "global_step": 16040, "epoch": 381} {"train_loss": -5.1160173416137695, "global_step": 16041, "epoch": 381} {"train_loss": -5.2883620262146, "global_step": 16042, "epoch": 381} {"train_loss": -5.207991702216012, "global_step": 16043, "epoch": 381, "val_loss": 77875.09375} {"train_loss": -5.185406684875488, "global_step": 16044, "epoch": 382} {"train_loss": -5.189118385314941, "global_step": 16045, "epoch": 382} {"train_loss": -5.234304428100586, "global_step": 16046, "epoch": 382} {"train_loss": -5.186727523803711, "global_step": 16047, "epoch": 382} {"train_loss": -5.154308319091797, "global_step": 16048, "epoch": 382} {"train_loss": -5.1731767654418945, "global_step": 16049, "epoch": 382} {"train_loss": -5.1912031173706055, "global_step": 16050, "epoch": 382} {"train_loss": -5.23227596282959, "global_step": 16051, "epoch": 382} {"train_loss": -5.169095039367676, "global_step": 16052, "epoch": 382} {"train_loss": -5.283967971801758, "global_step": 16053, "epoch": 382} {"train_loss": -5.286736011505127, "global_step": 16054, "epoch": 382} {"train_loss": -5.187126159667969, "global_step": 16055, "epoch": 382} {"train_loss": -5.238722801208496, "global_step": 16056, "epoch": 382} {"train_loss": -5.293854713439941, "global_step": 16057, "epoch": 382} {"train_loss": -5.146992206573486, "global_step": 16058, "epoch": 382} {"train_loss": -5.058962821960449, "global_step": 16059, "epoch": 382} {"train_loss": -5.09921932220459, "global_step": 16060, "epoch": 382} {"train_loss": -5.043966293334961, "global_step": 16061, "epoch": 382} {"train_loss": -5.169358253479004, "global_step": 16062, "epoch": 382} {"train_loss": -5.192011833190918, "global_step": 16063, "epoch": 382} {"train_loss": -5.191497802734375, "global_step": 16064, "epoch": 382} {"train_loss": -5.13448429107666, "global_step": 16065, "epoch": 382} {"train_loss": -5.236985206604004, "global_step": 16066, "epoch": 382} {"train_loss": -4.978860855102539, "global_step": 16067, "epoch": 382} {"train_loss": -5.086404800415039, "global_step": 16068, "epoch": 382} {"train_loss": -4.969839572906494, "global_step": 16069, "epoch": 382} {"train_loss": -5.013156890869141, "global_step": 16070, "epoch": 382} {"train_loss": -5.042662620544434, "global_step": 16071, "epoch": 382} {"train_loss": -5.154416084289551, "global_step": 16072, "epoch": 382} {"train_loss": -5.077425003051758, "global_step": 16073, "epoch": 382} {"train_loss": -5.137672424316406, "global_step": 16074, "epoch": 382} {"train_loss": -5.25574254989624, "global_step": 16075, "epoch": 382} {"train_loss": -4.933372497558594, "global_step": 16076, "epoch": 382} {"train_loss": -5.076767921447754, "global_step": 16077, "epoch": 382} {"train_loss": -5.365035057067871, "global_step": 16078, "epoch": 382} {"train_loss": -5.152581691741943, "global_step": 16079, "epoch": 382} {"train_loss": -5.246111869812012, "global_step": 16080, "epoch": 382} {"train_loss": -5.36059045791626, "global_step": 16081, "epoch": 382} {"train_loss": -5.199127674102783, "global_step": 16082, "epoch": 382} {"train_loss": -5.191756248474121, "global_step": 16083, "epoch": 382} {"train_loss": -5.122137069702148, "global_step": 16084, "epoch": 382} {"train_loss": -5.1617840358189175, "global_step": 16085, "epoch": 382, "val_loss": 78068.5859375} {"train_loss": -5.238179683685303, "global_step": 16086, "epoch": 383} {"train_loss": -5.238486289978027, "global_step": 16087, "epoch": 383} {"train_loss": -5.250113487243652, "global_step": 16088, "epoch": 383} {"train_loss": -5.223674774169922, "global_step": 16089, "epoch": 383} {"train_loss": -5.15281867980957, "global_step": 16090, "epoch": 383} {"train_loss": -5.303095817565918, "global_step": 16091, "epoch": 383} {"train_loss": -5.290484428405762, "global_step": 16092, "epoch": 383} {"train_loss": -5.150629997253418, "global_step": 16093, "epoch": 383} {"train_loss": -5.221932411193848, "global_step": 16094, "epoch": 383} {"train_loss": -5.310831069946289, "global_step": 16095, "epoch": 383} {"train_loss": -5.072239398956299, "global_step": 16096, "epoch": 383} {"train_loss": -5.261052131652832, "global_step": 16097, "epoch": 383} {"train_loss": -5.086448669433594, "global_step": 16098, "epoch": 383} {"train_loss": -5.190709114074707, "global_step": 16099, "epoch": 383} {"train_loss": -5.1745829582214355, "global_step": 16100, "epoch": 383} {"train_loss": -5.23807430267334, "global_step": 16101, "epoch": 383} {"train_loss": -5.1113786697387695, "global_step": 16102, "epoch": 383} {"train_loss": -5.172182083129883, "global_step": 16103, "epoch": 383} {"train_loss": -5.15998649597168, "global_step": 16104, "epoch": 383} {"train_loss": -5.226846694946289, "global_step": 16105, "epoch": 383} {"train_loss": -5.214010238647461, "global_step": 16106, "epoch": 383} {"train_loss": -5.247559547424316, "global_step": 16107, "epoch": 383} {"train_loss": -5.050804138183594, "global_step": 16108, "epoch": 383} {"train_loss": -5.242276668548584, "global_step": 16109, "epoch": 383} {"train_loss": -5.213994026184082, "global_step": 16110, "epoch": 383} {"train_loss": -5.11945915222168, "global_step": 16111, "epoch": 383} {"train_loss": -5.1381378173828125, "global_step": 16112, "epoch": 383} {"train_loss": -5.218873977661133, "global_step": 16113, "epoch": 383} {"train_loss": -5.118030548095703, "global_step": 16114, "epoch": 383} {"train_loss": -5.21232795715332, "global_step": 16115, "epoch": 383} {"train_loss": -5.247699737548828, "global_step": 16116, "epoch": 383} {"train_loss": -5.184417724609375, "global_step": 16117, "epoch": 383} {"train_loss": -5.237199783325195, "global_step": 16118, "epoch": 383} {"train_loss": -5.210458278656006, "global_step": 16119, "epoch": 383} {"train_loss": -5.159384727478027, "global_step": 16120, "epoch": 383} {"train_loss": -5.153907775878906, "global_step": 16121, "epoch": 383} {"train_loss": -5.364253520965576, "global_step": 16122, "epoch": 383} {"train_loss": -5.20102071762085, "global_step": 16123, "epoch": 383} {"train_loss": -5.184540748596191, "global_step": 16124, "epoch": 383} {"train_loss": -5.273397445678711, "global_step": 16125, "epoch": 383} {"train_loss": -5.152650356292725, "global_step": 16126, "epoch": 383} {"train_loss": -5.203363418579102, "global_step": 16127, "epoch": 383, "val_loss": 78458.8203125} {"train_loss": -5.332383632659912, "global_step": 16128, "epoch": 384} {"train_loss": -5.082995891571045, "global_step": 16129, "epoch": 384} {"train_loss": -5.138222694396973, "global_step": 16130, "epoch": 384} {"train_loss": -5.284085273742676, "global_step": 16131, "epoch": 384} {"train_loss": -5.152828216552734, "global_step": 16132, "epoch": 384} {"train_loss": -5.088474273681641, "global_step": 16133, "epoch": 384} {"train_loss": -5.238622665405273, "global_step": 16134, "epoch": 384} {"train_loss": -5.05009126663208, "global_step": 16135, "epoch": 384} {"train_loss": -5.243447303771973, "global_step": 16136, "epoch": 384} {"train_loss": -5.125423431396484, "global_step": 16137, "epoch": 384} {"train_loss": -5.214449405670166, "global_step": 16138, "epoch": 384} {"train_loss": -5.237889766693115, "global_step": 16139, "epoch": 384} {"train_loss": -5.033018589019775, "global_step": 16140, "epoch": 384} {"train_loss": -5.19019889831543, "global_step": 16141, "epoch": 384} {"train_loss": -5.128677845001221, "global_step": 16142, "epoch": 384} {"train_loss": -5.164858341217041, "global_step": 16143, "epoch": 384} {"train_loss": -5.32014274597168, "global_step": 16144, "epoch": 384} {"train_loss": -5.02540397644043, "global_step": 16145, "epoch": 384} {"train_loss": -5.20277214050293, "global_step": 16146, "epoch": 384} {"train_loss": -5.077853202819824, "global_step": 16147, "epoch": 384} {"train_loss": -5.255866527557373, "global_step": 16148, "epoch": 384} {"train_loss": -5.257805824279785, "global_step": 16149, "epoch": 384} {"train_loss": -5.287588596343994, "global_step": 16150, "epoch": 384} {"train_loss": -5.202211380004883, "global_step": 16151, "epoch": 384} {"train_loss": -5.234641075134277, "global_step": 16152, "epoch": 384} {"train_loss": -5.1824445724487305, "global_step": 16153, "epoch": 384} {"train_loss": -5.123848915100098, "global_step": 16154, "epoch": 384} {"train_loss": -4.995499610900879, "global_step": 16155, "epoch": 384} {"train_loss": -5.250083923339844, "global_step": 16156, "epoch": 384} {"train_loss": -4.99830961227417, "global_step": 16157, "epoch": 384} {"train_loss": -5.189748764038086, "global_step": 16158, "epoch": 384} {"train_loss": -5.230727195739746, "global_step": 16159, "epoch": 384} {"train_loss": -4.975114345550537, "global_step": 16160, "epoch": 384} {"train_loss": -5.032665252685547, "global_step": 16161, "epoch": 384} {"train_loss": -5.197080612182617, "global_step": 16162, "epoch": 384} {"train_loss": -5.115589141845703, "global_step": 16163, "epoch": 384} {"train_loss": -5.14073371887207, "global_step": 16164, "epoch": 384} {"train_loss": -5.1677703857421875, "global_step": 16165, "epoch": 384} {"train_loss": -5.229883193969727, "global_step": 16166, "epoch": 384} {"train_loss": -5.219041347503662, "global_step": 16167, "epoch": 384} {"train_loss": -5.248795509338379, "global_step": 16168, "epoch": 384} {"train_loss": -5.1721720695495605, "global_step": 16169, "epoch": 384, "val_loss": 78172.7421875} {"train_loss": -5.195289134979248, "global_step": 16170, "epoch": 385} {"train_loss": -5.33908224105835, "global_step": 16171, "epoch": 385} {"train_loss": -5.179998397827148, "global_step": 16172, "epoch": 385} {"train_loss": -5.2536773681640625, "global_step": 16173, "epoch": 385} {"train_loss": -5.258050918579102, "global_step": 16174, "epoch": 385} {"train_loss": -5.220581531524658, "global_step": 16175, "epoch": 385} {"train_loss": -5.138961315155029, "global_step": 16176, "epoch": 385} {"train_loss": -5.214202880859375, "global_step": 16177, "epoch": 385} {"train_loss": -5.1077070236206055, "global_step": 16178, "epoch": 385} {"train_loss": -5.167717456817627, "global_step": 16179, "epoch": 385} {"train_loss": -5.376125335693359, "global_step": 16180, "epoch": 385} {"train_loss": -5.10410737991333, "global_step": 16181, "epoch": 385} {"train_loss": -5.081671714782715, "global_step": 16182, "epoch": 385} {"train_loss": -5.263451099395752, "global_step": 16183, "epoch": 385} {"train_loss": -5.1175432205200195, "global_step": 16184, "epoch": 385} {"train_loss": -5.257218837738037, "global_step": 16185, "epoch": 385} {"train_loss": -5.2185540199279785, "global_step": 16186, "epoch": 385} {"train_loss": -5.009454727172852, "global_step": 16187, "epoch": 385} {"train_loss": -5.328149318695068, "global_step": 16188, "epoch": 385} {"train_loss": -5.097417831420898, "global_step": 16189, "epoch": 385} {"train_loss": -5.1661272048950195, "global_step": 16190, "epoch": 385} {"train_loss": -5.249083518981934, "global_step": 16191, "epoch": 385} {"train_loss": -5.240773677825928, "global_step": 16192, "epoch": 385} {"train_loss": -5.200387001037598, "global_step": 16193, "epoch": 385} {"train_loss": -5.240355491638184, "global_step": 16194, "epoch": 385} {"train_loss": -5.2153544425964355, "global_step": 16195, "epoch": 385} {"train_loss": -5.127385139465332, "global_step": 16196, "epoch": 385} {"train_loss": -5.166849136352539, "global_step": 16197, "epoch": 385} {"train_loss": -5.327737808227539, "global_step": 16198, "epoch": 385} {"train_loss": -5.265596389770508, "global_step": 16199, "epoch": 385} {"train_loss": -5.221954345703125, "global_step": 16200, "epoch": 385} {"train_loss": -5.223968982696533, "global_step": 16201, "epoch": 385} {"train_loss": -5.125850677490234, "global_step": 16202, "epoch": 385} {"train_loss": -5.249174118041992, "global_step": 16203, "epoch": 385} {"train_loss": -5.131488800048828, "global_step": 16204, "epoch": 385} {"train_loss": -5.322412967681885, "global_step": 16205, "epoch": 385} {"train_loss": -5.099527359008789, "global_step": 16206, "epoch": 385} {"train_loss": -5.165078163146973, "global_step": 16207, "epoch": 385} {"train_loss": -5.270911693572998, "global_step": 16208, "epoch": 385} {"train_loss": -5.23723030090332, "global_step": 16209, "epoch": 385} {"train_loss": -5.180020332336426, "global_step": 16210, "epoch": 385} {"train_loss": -5.202751114254906, "global_step": 16211, "epoch": 385, "val_loss": 77853.0859375} {"train_loss": -5.162741661071777, "global_step": 16212, "epoch": 386} {"train_loss": -5.351500511169434, "global_step": 16213, "epoch": 386} {"train_loss": -5.204123497009277, "global_step": 16214, "epoch": 386} {"train_loss": -5.3822855949401855, "global_step": 16215, "epoch": 386} {"train_loss": -5.222752571105957, "global_step": 16216, "epoch": 386} {"train_loss": -5.105033874511719, "global_step": 16217, "epoch": 386} {"train_loss": -5.21453332901001, "global_step": 16218, "epoch": 386} {"train_loss": -5.18058967590332, "global_step": 16219, "epoch": 386} {"train_loss": -5.074833393096924, "global_step": 16220, "epoch": 386} {"train_loss": -5.294852256774902, "global_step": 16221, "epoch": 386} {"train_loss": -5.245095252990723, "global_step": 16222, "epoch": 386} {"train_loss": -5.227859020233154, "global_step": 16223, "epoch": 386} {"train_loss": -5.123284339904785, "global_step": 16224, "epoch": 386} {"train_loss": -5.182557582855225, "global_step": 16225, "epoch": 386} {"train_loss": -5.341718673706055, "global_step": 16226, "epoch": 386} {"train_loss": -5.208627223968506, "global_step": 16227, "epoch": 386} {"train_loss": -5.199253559112549, "global_step": 16228, "epoch": 386} {"train_loss": -5.308032989501953, "global_step": 16229, "epoch": 386} {"train_loss": -5.147804260253906, "global_step": 16230, "epoch": 386} {"train_loss": -5.342907905578613, "global_step": 16231, "epoch": 386} {"train_loss": -5.184806823730469, "global_step": 16232, "epoch": 386} {"train_loss": -5.1353349685668945, "global_step": 16233, "epoch": 386} {"train_loss": -5.339635848999023, "global_step": 16234, "epoch": 386} {"train_loss": -5.119869709014893, "global_step": 16235, "epoch": 386} {"train_loss": -5.286726474761963, "global_step": 16236, "epoch": 386} {"train_loss": -5.319068908691406, "global_step": 16237, "epoch": 386} {"train_loss": -5.165831089019775, "global_step": 16238, "epoch": 386} {"train_loss": -5.261624336242676, "global_step": 16239, "epoch": 386} {"train_loss": -5.323884963989258, "global_step": 16240, "epoch": 386} {"train_loss": -5.212742805480957, "global_step": 16241, "epoch": 386} {"train_loss": -5.205900192260742, "global_step": 16242, "epoch": 386} {"train_loss": -5.152374267578125, "global_step": 16243, "epoch": 386} {"train_loss": -5.300361633300781, "global_step": 16244, "epoch": 386} {"train_loss": -5.242411136627197, "global_step": 16245, "epoch": 386} {"train_loss": -5.185811996459961, "global_step": 16246, "epoch": 386} {"train_loss": -5.2823405265808105, "global_step": 16247, "epoch": 386} {"train_loss": -5.152034759521484, "global_step": 16248, "epoch": 386} {"train_loss": -5.161759853363037, "global_step": 16249, "epoch": 386} {"train_loss": -5.082928657531738, "global_step": 16250, "epoch": 386} {"train_loss": -5.2600908279418945, "global_step": 16251, "epoch": 386} {"train_loss": -5.13925838470459, "global_step": 16252, "epoch": 386} {"train_loss": -5.219709112530663, "global_step": 16253, "epoch": 386, "val_loss": 78266.5546875} {"train_loss": -5.204817295074463, "global_step": 16254, "epoch": 387} {"train_loss": -5.097296714782715, "global_step": 16255, "epoch": 387} {"train_loss": -5.158540725708008, "global_step": 16256, "epoch": 387} {"train_loss": -5.2071533203125, "global_step": 16257, "epoch": 387} {"train_loss": -5.325702667236328, "global_step": 16258, "epoch": 387} {"train_loss": -5.280490875244141, "global_step": 16259, "epoch": 387} {"train_loss": -5.211921691894531, "global_step": 16260, "epoch": 387} {"train_loss": -5.193962097167969, "global_step": 16261, "epoch": 387} {"train_loss": -5.138972282409668, "global_step": 16262, "epoch": 387} {"train_loss": -5.136898994445801, "global_step": 16263, "epoch": 387} {"train_loss": -5.312130928039551, "global_step": 16264, "epoch": 387} {"train_loss": -5.120375156402588, "global_step": 16265, "epoch": 387} {"train_loss": -5.150067329406738, "global_step": 16266, "epoch": 387} {"train_loss": -5.223416328430176, "global_step": 16267, "epoch": 387} {"train_loss": -5.252270221710205, "global_step": 16268, "epoch": 387} {"train_loss": -5.142364025115967, "global_step": 16269, "epoch": 387} {"train_loss": -5.221170902252197, "global_step": 16270, "epoch": 387} {"train_loss": -5.247954368591309, "global_step": 16271, "epoch": 387} {"train_loss": -5.279725074768066, "global_step": 16272, "epoch": 387} {"train_loss": -5.269760608673096, "global_step": 16273, "epoch": 387} {"train_loss": -5.244952201843262, "global_step": 16274, "epoch": 387} {"train_loss": -5.253912448883057, "global_step": 16275, "epoch": 387} {"train_loss": -5.325625896453857, "global_step": 16276, "epoch": 387} {"train_loss": -5.279464244842529, "global_step": 16277, "epoch": 387} {"train_loss": -5.252842426300049, "global_step": 16278, "epoch": 387} {"train_loss": -5.210526943206787, "global_step": 16279, "epoch": 387} {"train_loss": -5.253839492797852, "global_step": 16280, "epoch": 387} {"train_loss": -5.254725456237793, "global_step": 16281, "epoch": 387} {"train_loss": -5.2730393409729, "global_step": 16282, "epoch": 387} {"train_loss": -5.257809162139893, "global_step": 16283, "epoch": 387} {"train_loss": -5.298063278198242, "global_step": 16284, "epoch": 387} {"train_loss": -5.278316497802734, "global_step": 16285, "epoch": 387} {"train_loss": -5.262676239013672, "global_step": 16286, "epoch": 387} {"train_loss": -5.151012420654297, "global_step": 16287, "epoch": 387} {"train_loss": -5.1947760581970215, "global_step": 16288, "epoch": 387} {"train_loss": -5.153172969818115, "global_step": 16289, "epoch": 387} {"train_loss": -5.384814739227295, "global_step": 16290, "epoch": 387} {"train_loss": -5.239163398742676, "global_step": 16291, "epoch": 387} {"train_loss": -5.1160993576049805, "global_step": 16292, "epoch": 387} {"train_loss": -5.211840629577637, "global_step": 16293, "epoch": 387} {"train_loss": -5.303773880004883, "global_step": 16294, "epoch": 387} {"train_loss": -5.227382523672921, "global_step": 16295, "epoch": 387, "val_loss": 78366.0078125} {"train_loss": -5.222211837768555, "global_step": 16296, "epoch": 388} {"train_loss": -5.188675880432129, "global_step": 16297, "epoch": 388} {"train_loss": -5.212543487548828, "global_step": 16298, "epoch": 388} {"train_loss": -5.308182716369629, "global_step": 16299, "epoch": 388} {"train_loss": -5.089938640594482, "global_step": 16300, "epoch": 388} {"train_loss": -5.282486915588379, "global_step": 16301, "epoch": 388} {"train_loss": -5.197751998901367, "global_step": 16302, "epoch": 388} {"train_loss": -5.186367511749268, "global_step": 16303, "epoch": 388} {"train_loss": -5.243406295776367, "global_step": 16304, "epoch": 388} {"train_loss": -5.118478775024414, "global_step": 16305, "epoch": 388} {"train_loss": -5.243937015533447, "global_step": 16306, "epoch": 388} {"train_loss": -5.189110279083252, "global_step": 16307, "epoch": 388} {"train_loss": -5.3726348876953125, "global_step": 16308, "epoch": 388} {"train_loss": -5.306219100952148, "global_step": 16309, "epoch": 388} {"train_loss": -5.229556083679199, "global_step": 16310, "epoch": 388} {"train_loss": -5.378420829772949, "global_step": 16311, "epoch": 388} {"train_loss": -5.220287799835205, "global_step": 16312, "epoch": 388} {"train_loss": -5.129853248596191, "global_step": 16313, "epoch": 388} {"train_loss": -5.279073715209961, "global_step": 16314, "epoch": 388} {"train_loss": -5.209784984588623, "global_step": 16315, "epoch": 388} {"train_loss": -5.1273298263549805, "global_step": 16316, "epoch": 388} {"train_loss": -5.338895797729492, "global_step": 16317, "epoch": 388} {"train_loss": -5.17694091796875, "global_step": 16318, "epoch": 388} {"train_loss": -5.294345855712891, "global_step": 16319, "epoch": 388} {"train_loss": -5.196678638458252, "global_step": 16320, "epoch": 388} {"train_loss": -5.150335788726807, "global_step": 16321, "epoch": 388} {"train_loss": -5.2677507400512695, "global_step": 16322, "epoch": 388} {"train_loss": -5.190232276916504, "global_step": 16323, "epoch": 388} {"train_loss": -5.21381950378418, "global_step": 16324, "epoch": 388} {"train_loss": -5.2978668212890625, "global_step": 16325, "epoch": 388} {"train_loss": -5.223537921905518, "global_step": 16326, "epoch": 388} {"train_loss": -5.338682651519775, "global_step": 16327, "epoch": 388} {"train_loss": -5.246127128601074, "global_step": 16328, "epoch": 388} {"train_loss": -5.115565299987793, "global_step": 16329, "epoch": 388} {"train_loss": -5.124335289001465, "global_step": 16330, "epoch": 388} {"train_loss": -5.3410258293151855, "global_step": 16331, "epoch": 388} {"train_loss": -5.334815979003906, "global_step": 16332, "epoch": 388} {"train_loss": -5.272459983825684, "global_step": 16333, "epoch": 388} {"train_loss": -5.209627628326416, "global_step": 16334, "epoch": 388} {"train_loss": -5.1474127769470215, "global_step": 16335, "epoch": 388} {"train_loss": -5.146416664123535, "global_step": 16336, "epoch": 388} {"train_loss": -5.2260618550436835, "global_step": 16337, "epoch": 388, "val_loss": 77412.8828125} {"train_loss": -5.241655349731445, "global_step": 16338, "epoch": 389} {"train_loss": -5.271506309509277, "global_step": 16339, "epoch": 389} {"train_loss": -5.2650146484375, "global_step": 16340, "epoch": 389} {"train_loss": -5.33899450302124, "global_step": 16341, "epoch": 389} {"train_loss": -5.223337173461914, "global_step": 16342, "epoch": 389} {"train_loss": -5.2176713943481445, "global_step": 16343, "epoch": 389} {"train_loss": -5.156790256500244, "global_step": 16344, "epoch": 389} {"train_loss": -5.156167030334473, "global_step": 16345, "epoch": 389} {"train_loss": -5.360373497009277, "global_step": 16346, "epoch": 389} {"train_loss": -5.320281505584717, "global_step": 16347, "epoch": 389} {"train_loss": -5.177590370178223, "global_step": 16348, "epoch": 389} {"train_loss": -5.155012130737305, "global_step": 16349, "epoch": 389} {"train_loss": -5.148402214050293, "global_step": 16350, "epoch": 389} {"train_loss": -5.302011489868164, "global_step": 16351, "epoch": 389} {"train_loss": -5.131919860839844, "global_step": 16352, "epoch": 389} {"train_loss": -5.204554080963135, "global_step": 16353, "epoch": 389} {"train_loss": -5.140585899353027, "global_step": 16354, "epoch": 389} {"train_loss": -5.292922019958496, "global_step": 16355, "epoch": 389} {"train_loss": -5.231010437011719, "global_step": 16356, "epoch": 389} {"train_loss": -5.009161949157715, "global_step": 16357, "epoch": 389} {"train_loss": -5.1850738525390625, "global_step": 16358, "epoch": 389} {"train_loss": -5.279570579528809, "global_step": 16359, "epoch": 389} {"train_loss": -5.319069862365723, "global_step": 16360, "epoch": 389} {"train_loss": -5.27119255065918, "global_step": 16361, "epoch": 389} {"train_loss": -5.219832420349121, "global_step": 16362, "epoch": 389} {"train_loss": -5.1730451583862305, "global_step": 16363, "epoch": 389} {"train_loss": -5.179025173187256, "global_step": 16364, "epoch": 389} {"train_loss": -5.204761981964111, "global_step": 16365, "epoch": 389} {"train_loss": -5.16383695602417, "global_step": 16366, "epoch": 389} {"train_loss": -5.193107604980469, "global_step": 16367, "epoch": 389} {"train_loss": -5.137411594390869, "global_step": 16368, "epoch": 389} {"train_loss": -5.177799224853516, "global_step": 16369, "epoch": 389} {"train_loss": -5.257224082946777, "global_step": 16370, "epoch": 389} {"train_loss": -5.288546562194824, "global_step": 16371, "epoch": 389} {"train_loss": -5.258444786071777, "global_step": 16372, "epoch": 389} {"train_loss": -5.17520809173584, "global_step": 16373, "epoch": 389} {"train_loss": -5.213295936584473, "global_step": 16374, "epoch": 389} {"train_loss": -5.069003105163574, "global_step": 16375, "epoch": 389} {"train_loss": -5.141213893890381, "global_step": 16376, "epoch": 389} {"train_loss": -5.211617469787598, "global_step": 16377, "epoch": 389} {"train_loss": -5.198594570159912, "global_step": 16378, "epoch": 389} {"train_loss": -5.2092695917402, "global_step": 16379, "epoch": 389, "val_loss": 78170.3984375} {"train_loss": -5.158968925476074, "global_step": 16380, "epoch": 390} {"train_loss": -5.124277114868164, "global_step": 16381, "epoch": 390} {"train_loss": -5.120159149169922, "global_step": 16382, "epoch": 390} {"train_loss": -5.310365676879883, "global_step": 16383, "epoch": 390} {"train_loss": -5.179426193237305, "global_step": 16384, "epoch": 390} {"train_loss": -5.179559230804443, "global_step": 16385, "epoch": 390} {"train_loss": -5.249903678894043, "global_step": 16386, "epoch": 390} {"train_loss": -5.23917293548584, "global_step": 16387, "epoch": 390} {"train_loss": -5.192343235015869, "global_step": 16388, "epoch": 390} {"train_loss": -5.245635032653809, "global_step": 16389, "epoch": 390} {"train_loss": -5.060521125793457, "global_step": 16390, "epoch": 390} {"train_loss": -5.269015789031982, "global_step": 16391, "epoch": 390} {"train_loss": -5.197065353393555, "global_step": 16392, "epoch": 390} {"train_loss": -5.156599998474121, "global_step": 16393, "epoch": 390} {"train_loss": -5.019821643829346, "global_step": 16394, "epoch": 390} {"train_loss": -5.256763458251953, "global_step": 16395, "epoch": 390} {"train_loss": -5.113664627075195, "global_step": 16396, "epoch": 390} {"train_loss": -5.181464195251465, "global_step": 16397, "epoch": 390} {"train_loss": -5.230944633483887, "global_step": 16398, "epoch": 390} {"train_loss": -5.09276008605957, "global_step": 16399, "epoch": 390} {"train_loss": -5.18341064453125, "global_step": 16400, "epoch": 390} {"train_loss": -5.212665557861328, "global_step": 16401, "epoch": 390} {"train_loss": -5.205276012420654, "global_step": 16402, "epoch": 390} {"train_loss": -5.011028289794922, "global_step": 16403, "epoch": 390} {"train_loss": -5.370330810546875, "global_step": 16404, "epoch": 390} {"train_loss": -5.115396499633789, "global_step": 16405, "epoch": 390} {"train_loss": -5.254019737243652, "global_step": 16406, "epoch": 390} {"train_loss": -5.202362060546875, "global_step": 16407, "epoch": 390} {"train_loss": -5.198969841003418, "global_step": 16408, "epoch": 390} {"train_loss": -5.152549743652344, "global_step": 16409, "epoch": 390} {"train_loss": -5.211367607116699, "global_step": 16410, "epoch": 390} {"train_loss": -5.154888153076172, "global_step": 16411, "epoch": 390} {"train_loss": -5.222150802612305, "global_step": 16412, "epoch": 390} {"train_loss": -5.237367630004883, "global_step": 16413, "epoch": 390} {"train_loss": -5.189610004425049, "global_step": 16414, "epoch": 390} {"train_loss": -5.290340423583984, "global_step": 16415, "epoch": 390} {"train_loss": -5.138564109802246, "global_step": 16416, "epoch": 390} {"train_loss": -5.266488552093506, "global_step": 16417, "epoch": 390} {"train_loss": -5.376947402954102, "global_step": 16418, "epoch": 390} {"train_loss": -5.187910079956055, "global_step": 16419, "epoch": 390} {"train_loss": -5.314939022064209, "global_step": 16420, "epoch": 390} {"train_loss": -5.198698077883039, "global_step": 16421, "epoch": 390, "val_loss": 78922.109375} {"train_loss": -5.25997257232666, "global_step": 16422, "epoch": 391} {"train_loss": -5.127089500427246, "global_step": 16423, "epoch": 391} {"train_loss": -5.176901817321777, "global_step": 16424, "epoch": 391} {"train_loss": -5.0542707443237305, "global_step": 16425, "epoch": 391} {"train_loss": -5.126764297485352, "global_step": 16426, "epoch": 391} {"train_loss": -4.973158836364746, "global_step": 16427, "epoch": 391} {"train_loss": -5.160941123962402, "global_step": 16428, "epoch": 391} {"train_loss": -5.225153923034668, "global_step": 16429, "epoch": 391} {"train_loss": -5.084565162658691, "global_step": 16430, "epoch": 391} {"train_loss": -5.300691604614258, "global_step": 16431, "epoch": 391} {"train_loss": -5.2888641357421875, "global_step": 16432, "epoch": 391} {"train_loss": -5.158317565917969, "global_step": 16433, "epoch": 391} {"train_loss": -5.080632209777832, "global_step": 16434, "epoch": 391} {"train_loss": -5.181573390960693, "global_step": 16435, "epoch": 391} {"train_loss": -5.209606647491455, "global_step": 16436, "epoch": 391} {"train_loss": -5.295642852783203, "global_step": 16437, "epoch": 391} {"train_loss": -5.375769138336182, "global_step": 16438, "epoch": 391} {"train_loss": -5.1984639167785645, "global_step": 16439, "epoch": 391} {"train_loss": -5.093531131744385, "global_step": 16440, "epoch": 391} {"train_loss": -5.087422847747803, "global_step": 16441, "epoch": 391} {"train_loss": -5.312680244445801, "global_step": 16442, "epoch": 391} {"train_loss": -5.072048187255859, "global_step": 16443, "epoch": 391} {"train_loss": -5.223396301269531, "global_step": 16444, "epoch": 391} {"train_loss": -5.342688083648682, "global_step": 16445, "epoch": 391} {"train_loss": -5.115268707275391, "global_step": 16446, "epoch": 391} {"train_loss": -5.206207752227783, "global_step": 16447, "epoch": 391} {"train_loss": -5.219691276550293, "global_step": 16448, "epoch": 391} {"train_loss": -5.288331985473633, "global_step": 16449, "epoch": 391} {"train_loss": -5.196812152862549, "global_step": 16450, "epoch": 391} {"train_loss": -5.139989852905273, "global_step": 16451, "epoch": 391} {"train_loss": -5.261316776275635, "global_step": 16452, "epoch": 391} {"train_loss": -5.068269729614258, "global_step": 16453, "epoch": 391} {"train_loss": -5.221485614776611, "global_step": 16454, "epoch": 391} {"train_loss": -5.150235652923584, "global_step": 16455, "epoch": 391} {"train_loss": -5.232778549194336, "global_step": 16456, "epoch": 391} {"train_loss": -5.292094707489014, "global_step": 16457, "epoch": 391} {"train_loss": -5.201973915100098, "global_step": 16458, "epoch": 391} {"train_loss": -5.153057098388672, "global_step": 16459, "epoch": 391} {"train_loss": -5.082365036010742, "global_step": 16460, "epoch": 391} {"train_loss": -5.21075439453125, "global_step": 16461, "epoch": 391} {"train_loss": -5.218724727630615, "global_step": 16462, "epoch": 391} {"train_loss": -5.191384020305815, "global_step": 16463, "epoch": 391, "val_loss": 77757.1015625} {"train_loss": -5.319819927215576, "global_step": 16464, "epoch": 392} {"train_loss": -5.2704010009765625, "global_step": 16465, "epoch": 392} {"train_loss": -5.292088985443115, "global_step": 16466, "epoch": 392} {"train_loss": -5.2269134521484375, "global_step": 16467, "epoch": 392} {"train_loss": -5.2220611572265625, "global_step": 16468, "epoch": 392} {"train_loss": -5.2200236320495605, "global_step": 16469, "epoch": 392} {"train_loss": -5.299434661865234, "global_step": 16470, "epoch": 392} {"train_loss": -5.262219429016113, "global_step": 16471, "epoch": 392} {"train_loss": -5.22020149230957, "global_step": 16472, "epoch": 392} {"train_loss": -5.247684478759766, "global_step": 16473, "epoch": 392} {"train_loss": -5.10630989074707, "global_step": 16474, "epoch": 392} {"train_loss": -5.259639739990234, "global_step": 16475, "epoch": 392} {"train_loss": -5.221970558166504, "global_step": 16476, "epoch": 392} {"train_loss": -5.172131538391113, "global_step": 16477, "epoch": 392} {"train_loss": -5.0529327392578125, "global_step": 16478, "epoch": 392} {"train_loss": -5.189424991607666, "global_step": 16479, "epoch": 392} {"train_loss": -5.317682266235352, "global_step": 16480, "epoch": 392} {"train_loss": -5.275121688842773, "global_step": 16481, "epoch": 392} {"train_loss": -5.079919815063477, "global_step": 16482, "epoch": 392} {"train_loss": -5.214298248291016, "global_step": 16483, "epoch": 392} {"train_loss": -5.315505027770996, "global_step": 16484, "epoch": 392} {"train_loss": -5.042552947998047, "global_step": 16485, "epoch": 392} {"train_loss": -5.14449405670166, "global_step": 16486, "epoch": 392} {"train_loss": -5.32411003112793, "global_step": 16487, "epoch": 392} {"train_loss": -5.1880340576171875, "global_step": 16488, "epoch": 392} {"train_loss": -5.151405334472656, "global_step": 16489, "epoch": 392} {"train_loss": -5.250370025634766, "global_step": 16490, "epoch": 392} {"train_loss": -5.172276973724365, "global_step": 16491, "epoch": 392} {"train_loss": -5.160465240478516, "global_step": 16492, "epoch": 392} {"train_loss": -5.176177978515625, "global_step": 16493, "epoch": 392} {"train_loss": -5.26866340637207, "global_step": 16494, "epoch": 392} {"train_loss": -5.169921875, "global_step": 16495, "epoch": 392} {"train_loss": -5.082163333892822, "global_step": 16496, "epoch": 392} {"train_loss": -5.294328689575195, "global_step": 16497, "epoch": 392} {"train_loss": -5.140588283538818, "global_step": 16498, "epoch": 392} {"train_loss": -5.1758832931518555, "global_step": 16499, "epoch": 392} {"train_loss": -5.137373447418213, "global_step": 16500, "epoch": 392} {"train_loss": -5.3161163330078125, "global_step": 16501, "epoch": 392} {"train_loss": -5.172890663146973, "global_step": 16502, "epoch": 392} {"train_loss": -5.111481189727783, "global_step": 16503, "epoch": 392} {"train_loss": -5.047248363494873, "global_step": 16504, "epoch": 392} {"train_loss": -5.204464787528629, "global_step": 16505, "epoch": 392, "val_loss": 78678.65625} {"train_loss": -5.177800178527832, "global_step": 16506, "epoch": 393} {"train_loss": -5.14005184173584, "global_step": 16507, "epoch": 393} {"train_loss": -5.154349327087402, "global_step": 16508, "epoch": 393} {"train_loss": -5.329801559448242, "global_step": 16509, "epoch": 393} {"train_loss": -5.094449520111084, "global_step": 16510, "epoch": 393} {"train_loss": -5.311409950256348, "global_step": 16511, "epoch": 393} {"train_loss": -5.266788959503174, "global_step": 16512, "epoch": 393} {"train_loss": -5.21753454208374, "global_step": 16513, "epoch": 393} {"train_loss": -5.265920162200928, "global_step": 16514, "epoch": 393} {"train_loss": -5.16533088684082, "global_step": 16515, "epoch": 393} {"train_loss": -5.221647262573242, "global_step": 16516, "epoch": 393} {"train_loss": -5.257185459136963, "global_step": 16517, "epoch": 393} {"train_loss": -5.088544845581055, "global_step": 16518, "epoch": 393} {"train_loss": -5.26807165145874, "global_step": 16519, "epoch": 393} {"train_loss": -5.234177589416504, "global_step": 16520, "epoch": 393} {"train_loss": -5.244974613189697, "global_step": 16521, "epoch": 393} {"train_loss": -5.166204929351807, "global_step": 16522, "epoch": 393} {"train_loss": -5.2276411056518555, "global_step": 16523, "epoch": 393} {"train_loss": -5.039422988891602, "global_step": 16524, "epoch": 393} {"train_loss": -5.173770904541016, "global_step": 16525, "epoch": 393} {"train_loss": -5.078742027282715, "global_step": 16526, "epoch": 393} {"train_loss": -5.101796627044678, "global_step": 16527, "epoch": 393} {"train_loss": -5.293034553527832, "global_step": 16528, "epoch": 393} {"train_loss": -5.261678695678711, "global_step": 16529, "epoch": 393} {"train_loss": -5.3242645263671875, "global_step": 16530, "epoch": 393} {"train_loss": -5.257656097412109, "global_step": 16531, "epoch": 393} {"train_loss": -5.251378059387207, "global_step": 16532, "epoch": 393} {"train_loss": -5.174382209777832, "global_step": 16533, "epoch": 393} {"train_loss": -5.240697383880615, "global_step": 16534, "epoch": 393} {"train_loss": -5.217820167541504, "global_step": 16535, "epoch": 393} {"train_loss": -5.059381484985352, "global_step": 16536, "epoch": 393} {"train_loss": -5.124809741973877, "global_step": 16537, "epoch": 393} {"train_loss": -5.219270706176758, "global_step": 16538, "epoch": 393} {"train_loss": -5.127936363220215, "global_step": 16539, "epoch": 393} {"train_loss": -5.242166519165039, "global_step": 16540, "epoch": 393} {"train_loss": -5.1592559814453125, "global_step": 16541, "epoch": 393} {"train_loss": -5.1123762130737305, "global_step": 16542, "epoch": 393} {"train_loss": -5.0783772468566895, "global_step": 16543, "epoch": 393} {"train_loss": -5.196147441864014, "global_step": 16544, "epoch": 393} {"train_loss": -5.245210647583008, "global_step": 16545, "epoch": 393} {"train_loss": -5.1816253662109375, "global_step": 16546, "epoch": 393} {"train_loss": -5.193254152933757, "global_step": 16547, "epoch": 393, "val_loss": 77750.6875} {"train_loss": -5.328489780426025, "global_step": 16548, "epoch": 394} {"train_loss": -5.033102035522461, "global_step": 16549, "epoch": 394} {"train_loss": -4.975461006164551, "global_step": 16550, "epoch": 394} {"train_loss": -5.131589889526367, "global_step": 16551, "epoch": 394} {"train_loss": -5.135698318481445, "global_step": 16552, "epoch": 394} {"train_loss": -5.214818000793457, "global_step": 16553, "epoch": 394} {"train_loss": -5.30096435546875, "global_step": 16554, "epoch": 394} {"train_loss": -5.2267656326293945, "global_step": 16555, "epoch": 394} {"train_loss": -5.246057510375977, "global_step": 16556, "epoch": 394} {"train_loss": -5.3177971839904785, "global_step": 16557, "epoch": 394} {"train_loss": -5.134148597717285, "global_step": 16558, "epoch": 394} {"train_loss": -5.134481906890869, "global_step": 16559, "epoch": 394} {"train_loss": -5.3573222160339355, "global_step": 16560, "epoch": 394} {"train_loss": -5.199962139129639, "global_step": 16561, "epoch": 394} {"train_loss": -5.1304612159729, "global_step": 16562, "epoch": 394} {"train_loss": -5.053653240203857, "global_step": 16563, "epoch": 394} {"train_loss": -5.160456657409668, "global_step": 16564, "epoch": 394} {"train_loss": -4.986818313598633, "global_step": 16565, "epoch": 394} {"train_loss": -5.159849166870117, "global_step": 16566, "epoch": 394} {"train_loss": -5.1592698097229, "global_step": 16567, "epoch": 394} {"train_loss": -5.124452590942383, "global_step": 16568, "epoch": 394} {"train_loss": -5.201571464538574, "global_step": 16569, "epoch": 394} {"train_loss": -5.092418670654297, "global_step": 16570, "epoch": 394} {"train_loss": -5.191486835479736, "global_step": 16571, "epoch": 394} {"train_loss": -5.124031066894531, "global_step": 16572, "epoch": 394} {"train_loss": -5.204710483551025, "global_step": 16573, "epoch": 394} {"train_loss": -5.17645788192749, "global_step": 16574, "epoch": 394} {"train_loss": -5.253156661987305, "global_step": 16575, "epoch": 394} {"train_loss": -5.167904853820801, "global_step": 16576, "epoch": 394} {"train_loss": -5.1966352462768555, "global_step": 16577, "epoch": 394} {"train_loss": -5.196869850158691, "global_step": 16578, "epoch": 394} {"train_loss": -5.153537750244141, "global_step": 16579, "epoch": 394} {"train_loss": -5.194402694702148, "global_step": 16580, "epoch": 394} {"train_loss": -5.389731407165527, "global_step": 16581, "epoch": 394} {"train_loss": -5.280287265777588, "global_step": 16582, "epoch": 394} {"train_loss": -5.207483291625977, "global_step": 16583, "epoch": 394} {"train_loss": -5.3329596519470215, "global_step": 16584, "epoch": 394} {"train_loss": -5.225202560424805, "global_step": 16585, "epoch": 394} {"train_loss": -5.213052272796631, "global_step": 16586, "epoch": 394} {"train_loss": -5.190199851989746, "global_step": 16587, "epoch": 394} {"train_loss": -5.277268409729004, "global_step": 16588, "epoch": 394} {"train_loss": -5.190201997756958, "global_step": 16589, "epoch": 394, "val_loss": 77410.7890625} {"train_loss": -5.260266304016113, "global_step": 16590, "epoch": 395} {"train_loss": -5.321808338165283, "global_step": 16591, "epoch": 395} {"train_loss": -5.371026515960693, "global_step": 16592, "epoch": 395} {"train_loss": -5.29890251159668, "global_step": 16593, "epoch": 395} {"train_loss": -5.221296310424805, "global_step": 16594, "epoch": 395} {"train_loss": -5.206106185913086, "global_step": 16595, "epoch": 395} {"train_loss": -5.147701740264893, "global_step": 16596, "epoch": 395} {"train_loss": -5.352320671081543, "global_step": 16597, "epoch": 395} {"train_loss": -5.2691264152526855, "global_step": 16598, "epoch": 395} {"train_loss": -5.055809020996094, "global_step": 16599, "epoch": 395} {"train_loss": -5.105818748474121, "global_step": 16600, "epoch": 395} {"train_loss": -5.214713096618652, "global_step": 16601, "epoch": 395} {"train_loss": -5.078121185302734, "global_step": 16602, "epoch": 395} {"train_loss": -5.303365707397461, "global_step": 16603, "epoch": 395} {"train_loss": -5.293020248413086, "global_step": 16604, "epoch": 395} {"train_loss": -5.055707931518555, "global_step": 16605, "epoch": 395} {"train_loss": -5.214370250701904, "global_step": 16606, "epoch": 395} {"train_loss": -5.120612144470215, "global_step": 16607, "epoch": 395} {"train_loss": -5.173333168029785, "global_step": 16608, "epoch": 395} {"train_loss": -5.0868024826049805, "global_step": 16609, "epoch": 395} {"train_loss": -5.172832012176514, "global_step": 16610, "epoch": 395} {"train_loss": -5.159874439239502, "global_step": 16611, "epoch": 395} {"train_loss": -5.351438522338867, "global_step": 16612, "epoch": 395} {"train_loss": -5.238642692565918, "global_step": 16613, "epoch": 395} {"train_loss": -5.200930595397949, "global_step": 16614, "epoch": 395} {"train_loss": -5.181501388549805, "global_step": 16615, "epoch": 395} {"train_loss": -5.115180015563965, "global_step": 16616, "epoch": 395} {"train_loss": -5.1904377937316895, "global_step": 16617, "epoch": 395} {"train_loss": -5.196813583374023, "global_step": 16618, "epoch": 395} {"train_loss": -5.202049255371094, "global_step": 16619, "epoch": 395} {"train_loss": -5.087873935699463, "global_step": 16620, "epoch": 395} {"train_loss": -5.283968925476074, "global_step": 16621, "epoch": 395} {"train_loss": -5.200138092041016, "global_step": 16622, "epoch": 395} {"train_loss": -5.299077987670898, "global_step": 16623, "epoch": 395} {"train_loss": -5.248445510864258, "global_step": 16624, "epoch": 395} {"train_loss": -5.1569318771362305, "global_step": 16625, "epoch": 395} {"train_loss": -5.16046667098999, "global_step": 16626, "epoch": 395} {"train_loss": -5.266706943511963, "global_step": 16627, "epoch": 395} {"train_loss": -5.301156044006348, "global_step": 16628, "epoch": 395} {"train_loss": -5.253722190856934, "global_step": 16629, "epoch": 395} {"train_loss": -5.145298957824707, "global_step": 16630, "epoch": 395} {"train_loss": -5.206361350559053, "global_step": 16631, "epoch": 395, "val_loss": 77687.3984375} {"train_loss": -5.302074909210205, "global_step": 16632, "epoch": 396} {"train_loss": -5.285586357116699, "global_step": 16633, "epoch": 396} {"train_loss": -5.293546676635742, "global_step": 16634, "epoch": 396} {"train_loss": -5.338006019592285, "global_step": 16635, "epoch": 396} {"train_loss": -5.268270969390869, "global_step": 16636, "epoch": 396} {"train_loss": -5.258289337158203, "global_step": 16637, "epoch": 396} {"train_loss": -5.304644584655762, "global_step": 16638, "epoch": 396} {"train_loss": -5.286137580871582, "global_step": 16639, "epoch": 396} {"train_loss": -5.229901313781738, "global_step": 16640, "epoch": 396} {"train_loss": -5.307504177093506, "global_step": 16641, "epoch": 396} {"train_loss": -5.168761253356934, "global_step": 16642, "epoch": 396} {"train_loss": -5.311314582824707, "global_step": 16643, "epoch": 396} {"train_loss": -5.170327186584473, "global_step": 16644, "epoch": 396} {"train_loss": -5.129522800445557, "global_step": 16645, "epoch": 396} {"train_loss": -5.2331671714782715, "global_step": 16646, "epoch": 396} {"train_loss": -5.278843402862549, "global_step": 16647, "epoch": 396} {"train_loss": -5.134671211242676, "global_step": 16648, "epoch": 396} {"train_loss": -5.341816425323486, "global_step": 16649, "epoch": 396} {"train_loss": -5.201316833496094, "global_step": 16650, "epoch": 396} {"train_loss": -5.137628555297852, "global_step": 16651, "epoch": 396} {"train_loss": -5.1024980545043945, "global_step": 16652, "epoch": 396} {"train_loss": -5.254709243774414, "global_step": 16653, "epoch": 396} {"train_loss": -5.176311492919922, "global_step": 16654, "epoch": 396} {"train_loss": -5.225039958953857, "global_step": 16655, "epoch": 396} {"train_loss": -5.067913055419922, "global_step": 16656, "epoch": 396} {"train_loss": -5.251322269439697, "global_step": 16657, "epoch": 396} {"train_loss": -5.143869400024414, "global_step": 16658, "epoch": 396} {"train_loss": -5.075071334838867, "global_step": 16659, "epoch": 396} {"train_loss": -5.083080291748047, "global_step": 16660, "epoch": 396} {"train_loss": -5.199673175811768, "global_step": 16661, "epoch": 396} {"train_loss": -5.164693832397461, "global_step": 16662, "epoch": 396} {"train_loss": -5.138893127441406, "global_step": 16663, "epoch": 396} {"train_loss": -5.226369857788086, "global_step": 16664, "epoch": 396} {"train_loss": -5.045173645019531, "global_step": 16665, "epoch": 396} {"train_loss": -5.011200904846191, "global_step": 16666, "epoch": 396} {"train_loss": -5.002756118774414, "global_step": 16667, "epoch": 396} {"train_loss": -5.236363410949707, "global_step": 16668, "epoch": 396} {"train_loss": -5.091427803039551, "global_step": 16669, "epoch": 396} {"train_loss": -5.234966278076172, "global_step": 16670, "epoch": 396} {"train_loss": -5.209812164306641, "global_step": 16671, "epoch": 396} {"train_loss": -5.06562614440918, "global_step": 16672, "epoch": 396} {"train_loss": -5.194934129714966, "global_step": 16673, "epoch": 396, "val_loss": 78343.09375} {"train_loss": -5.259601593017578, "global_step": 16674, "epoch": 397} {"train_loss": -5.150442123413086, "global_step": 16675, "epoch": 397} {"train_loss": -5.215714454650879, "global_step": 16676, "epoch": 397} {"train_loss": -5.297706604003906, "global_step": 16677, "epoch": 397} {"train_loss": -5.1662187576293945, "global_step": 16678, "epoch": 397} {"train_loss": -5.201040267944336, "global_step": 16679, "epoch": 397} {"train_loss": -5.161983966827393, "global_step": 16680, "epoch": 397} {"train_loss": -5.2143402099609375, "global_step": 16681, "epoch": 397} {"train_loss": -5.151183605194092, "global_step": 16682, "epoch": 397} {"train_loss": -5.2548370361328125, "global_step": 16683, "epoch": 397} {"train_loss": -5.1614789962768555, "global_step": 16684, "epoch": 397} {"train_loss": -5.144536972045898, "global_step": 16685, "epoch": 397} {"train_loss": -5.145298480987549, "global_step": 16686, "epoch": 397} {"train_loss": -5.214264392852783, "global_step": 16687, "epoch": 397} {"train_loss": -5.27284574508667, "global_step": 16688, "epoch": 397} {"train_loss": -5.251730918884277, "global_step": 16689, "epoch": 397} {"train_loss": -5.30973482131958, "global_step": 16690, "epoch": 397} {"train_loss": -5.292046546936035, "global_step": 16691, "epoch": 397} {"train_loss": -5.150333881378174, "global_step": 16692, "epoch": 397} {"train_loss": -5.286638259887695, "global_step": 16693, "epoch": 397} {"train_loss": -5.352764129638672, "global_step": 16694, "epoch": 397} {"train_loss": -5.250243663787842, "global_step": 16695, "epoch": 397} {"train_loss": -5.274996757507324, "global_step": 16696, "epoch": 397} {"train_loss": -5.315717697143555, "global_step": 16697, "epoch": 397} {"train_loss": -5.134565830230713, "global_step": 16698, "epoch": 397} {"train_loss": -5.242220401763916, "global_step": 16699, "epoch": 397} {"train_loss": -5.3132643699646, "global_step": 16700, "epoch": 397} {"train_loss": -5.0863423347473145, "global_step": 16701, "epoch": 397} {"train_loss": -5.259478569030762, "global_step": 16702, "epoch": 397} {"train_loss": -5.195905685424805, "global_step": 16703, "epoch": 397} {"train_loss": -5.1574296951293945, "global_step": 16704, "epoch": 397} {"train_loss": -5.297663688659668, "global_step": 16705, "epoch": 397} {"train_loss": -5.122806549072266, "global_step": 16706, "epoch": 397} {"train_loss": -5.260182857513428, "global_step": 16707, "epoch": 397} {"train_loss": -4.980381965637207, "global_step": 16708, "epoch": 397} {"train_loss": -5.309837341308594, "global_step": 16709, "epoch": 397} {"train_loss": -5.163201332092285, "global_step": 16710, "epoch": 397} {"train_loss": -5.13253927230835, "global_step": 16711, "epoch": 397} {"train_loss": -5.261410236358643, "global_step": 16712, "epoch": 397} {"train_loss": -5.248143196105957, "global_step": 16713, "epoch": 397} {"train_loss": -5.12032413482666, "global_step": 16714, "epoch": 397} {"train_loss": -5.214033694494338, "global_step": 16715, "epoch": 397, "val_loss": 77876.1796875} {"train_loss": -5.254009246826172, "global_step": 16716, "epoch": 398} {"train_loss": -5.300867080688477, "global_step": 16717, "epoch": 398} {"train_loss": -5.265048027038574, "global_step": 16718, "epoch": 398} {"train_loss": -5.226739883422852, "global_step": 16719, "epoch": 398} {"train_loss": -5.210622787475586, "global_step": 16720, "epoch": 398} {"train_loss": -5.234908103942871, "global_step": 16721, "epoch": 398} {"train_loss": -5.230899810791016, "global_step": 16722, "epoch": 398} {"train_loss": -5.215971946716309, "global_step": 16723, "epoch": 398} {"train_loss": -5.277161121368408, "global_step": 16724, "epoch": 398} {"train_loss": -5.280182361602783, "global_step": 16725, "epoch": 398} {"train_loss": -5.193107604980469, "global_step": 16726, "epoch": 398} {"train_loss": -5.136651039123535, "global_step": 16727, "epoch": 398} {"train_loss": -5.223354339599609, "global_step": 16728, "epoch": 398} {"train_loss": -5.170299530029297, "global_step": 16729, "epoch": 398} {"train_loss": -5.105932712554932, "global_step": 16730, "epoch": 398} {"train_loss": -5.3177170753479, "global_step": 16731, "epoch": 398} {"train_loss": -5.112009048461914, "global_step": 16732, "epoch": 398} {"train_loss": -5.12525749206543, "global_step": 16733, "epoch": 398} {"train_loss": -5.212457180023193, "global_step": 16734, "epoch": 398} {"train_loss": -5.223167896270752, "global_step": 16735, "epoch": 398} {"train_loss": -5.117793083190918, "global_step": 16736, "epoch": 398} {"train_loss": -5.1906256675720215, "global_step": 16737, "epoch": 398} {"train_loss": -5.173996925354004, "global_step": 16738, "epoch": 398} {"train_loss": -5.223529815673828, "global_step": 16739, "epoch": 398} {"train_loss": -5.151554584503174, "global_step": 16740, "epoch": 398} {"train_loss": -5.170893669128418, "global_step": 16741, "epoch": 398} {"train_loss": -5.285053253173828, "global_step": 16742, "epoch": 398} {"train_loss": -5.174169540405273, "global_step": 16743, "epoch": 398} {"train_loss": -5.153381824493408, "global_step": 16744, "epoch": 398} {"train_loss": -5.370882987976074, "global_step": 16745, "epoch": 398} {"train_loss": -5.126993656158447, "global_step": 16746, "epoch": 398} {"train_loss": -5.105199813842773, "global_step": 16747, "epoch": 398} {"train_loss": -5.239651679992676, "global_step": 16748, "epoch": 398} {"train_loss": -5.118587493896484, "global_step": 16749, "epoch": 398} {"train_loss": -5.066478729248047, "global_step": 16750, "epoch": 398} {"train_loss": -5.250373840332031, "global_step": 16751, "epoch": 398} {"train_loss": -5.163120269775391, "global_step": 16752, "epoch": 398} {"train_loss": -5.191628456115723, "global_step": 16753, "epoch": 398} {"train_loss": -5.202834129333496, "global_step": 16754, "epoch": 398} {"train_loss": -5.192305564880371, "global_step": 16755, "epoch": 398} {"train_loss": -5.134836673736572, "global_step": 16756, "epoch": 398} {"train_loss": -5.201104107357207, "global_step": 16757, "epoch": 398, "val_loss": 78325.3984375} {"train_loss": -5.240959167480469, "global_step": 16758, "epoch": 399} {"train_loss": -5.160172462463379, "global_step": 16759, "epoch": 399} {"train_loss": -5.167776107788086, "global_step": 16760, "epoch": 399} {"train_loss": -5.205831527709961, "global_step": 16761, "epoch": 399} {"train_loss": -5.1914567947387695, "global_step": 16762, "epoch": 399} {"train_loss": -5.097294807434082, "global_step": 16763, "epoch": 399} {"train_loss": -5.120978355407715, "global_step": 16764, "epoch": 399} {"train_loss": -5.226974010467529, "global_step": 16765, "epoch": 399} {"train_loss": -5.281966209411621, "global_step": 16766, "epoch": 399} {"train_loss": -5.216719627380371, "global_step": 16767, "epoch": 399} {"train_loss": -5.126345634460449, "global_step": 16768, "epoch": 399} {"train_loss": -5.119661331176758, "global_step": 16769, "epoch": 399} {"train_loss": -5.197331428527832, "global_step": 16770, "epoch": 399} {"train_loss": -5.146068572998047, "global_step": 16771, "epoch": 399} {"train_loss": -5.221773624420166, "global_step": 16772, "epoch": 399} {"train_loss": -5.279351234436035, "global_step": 16773, "epoch": 399} {"train_loss": -5.109038829803467, "global_step": 16774, "epoch": 399} {"train_loss": -5.209681510925293, "global_step": 16775, "epoch": 399} {"train_loss": -5.324551582336426, "global_step": 16776, "epoch": 399} {"train_loss": -4.9648895263671875, "global_step": 16777, "epoch": 399} {"train_loss": -5.257803916931152, "global_step": 16778, "epoch": 399} {"train_loss": -5.214737892150879, "global_step": 16779, "epoch": 399} {"train_loss": -5.056784629821777, "global_step": 16780, "epoch": 399} {"train_loss": -5.250924587249756, "global_step": 16781, "epoch": 399} {"train_loss": -5.233858108520508, "global_step": 16782, "epoch": 399} {"train_loss": -5.285279750823975, "global_step": 16783, "epoch": 399} {"train_loss": -5.187638282775879, "global_step": 16784, "epoch": 399} {"train_loss": -5.022217750549316, "global_step": 16785, "epoch": 399} {"train_loss": -5.349782466888428, "global_step": 16786, "epoch": 399} {"train_loss": -5.141084671020508, "global_step": 16787, "epoch": 399} {"train_loss": -5.288854598999023, "global_step": 16788, "epoch": 399} {"train_loss": -5.213515281677246, "global_step": 16789, "epoch": 399} {"train_loss": -5.23313570022583, "global_step": 16790, "epoch": 399} {"train_loss": -5.3397746086120605, "global_step": 16791, "epoch": 399} {"train_loss": -5.2465434074401855, "global_step": 16792, "epoch": 399} {"train_loss": -5.193480491638184, "global_step": 16793, "epoch": 399} {"train_loss": -5.092050075531006, "global_step": 16794, "epoch": 399} {"train_loss": -5.214235782623291, "global_step": 16795, "epoch": 399} {"train_loss": -5.305129051208496, "global_step": 16796, "epoch": 399} {"train_loss": -5.122352600097656, "global_step": 16797, "epoch": 399} {"train_loss": -5.205183029174805, "global_step": 16798, "epoch": 399} {"train_loss": -5.196913662410918, "global_step": 16799, "epoch": 399, "val_loss": 78130.265625} {"train_loss": -5.339183807373047, "global_step": 16800, "epoch": 400} {"train_loss": -5.142227649688721, "global_step": 16801, "epoch": 400} {"train_loss": -5.242915630340576, "global_step": 16802, "epoch": 400} {"train_loss": -5.22795295715332, "global_step": 16803, "epoch": 400} {"train_loss": -5.379476070404053, "global_step": 16804, "epoch": 400} {"train_loss": -5.215709209442139, "global_step": 16805, "epoch": 400} {"train_loss": -5.117074966430664, "global_step": 16806, "epoch": 400} {"train_loss": -5.206313133239746, "global_step": 16807, "epoch": 400} {"train_loss": -5.2903900146484375, "global_step": 16808, "epoch": 400} {"train_loss": -5.323089599609375, "global_step": 16809, "epoch": 400} {"train_loss": -5.082129001617432, "global_step": 16810, "epoch": 400} {"train_loss": -5.108310699462891, "global_step": 16811, "epoch": 400} {"train_loss": -5.218099117279053, "global_step": 16812, "epoch": 400} {"train_loss": -5.206035614013672, "global_step": 16813, "epoch": 400} {"train_loss": -5.372854232788086, "global_step": 16814, "epoch": 400} {"train_loss": -5.25853157043457, "global_step": 16815, "epoch": 400} {"train_loss": -5.295290946960449, "global_step": 16816, "epoch": 400} {"train_loss": -5.204142093658447, "global_step": 16817, "epoch": 400} {"train_loss": -5.307526111602783, "global_step": 16818, "epoch": 400} {"train_loss": -5.264781951904297, "global_step": 16819, "epoch": 400} {"train_loss": -5.1336870193481445, "global_step": 16820, "epoch": 400} {"train_loss": -5.205550670623779, "global_step": 16821, "epoch": 400} {"train_loss": -5.180756568908691, "global_step": 16822, "epoch": 400} {"train_loss": -5.066407203674316, "global_step": 16823, "epoch": 400} {"train_loss": -5.188871383666992, "global_step": 16824, "epoch": 400} {"train_loss": -5.349480628967285, "global_step": 16825, "epoch": 400} {"train_loss": -5.216405868530273, "global_step": 16826, "epoch": 400} {"train_loss": -5.106688022613525, "global_step": 16827, "epoch": 400} {"train_loss": -5.20323371887207, "global_step": 16828, "epoch": 400} {"train_loss": -5.2810163497924805, "global_step": 16829, "epoch": 400} {"train_loss": -5.162528038024902, "global_step": 16830, "epoch": 400} {"train_loss": -5.324063301086426, "global_step": 16831, "epoch": 400} {"train_loss": -5.2029128074646, "global_step": 16832, "epoch": 400} {"train_loss": -5.167058944702148, "global_step": 16833, "epoch": 400} {"train_loss": -5.164243221282959, "global_step": 16834, "epoch": 400} {"train_loss": -5.217641353607178, "global_step": 16835, "epoch": 400} {"train_loss": -5.0522990226745605, "global_step": 16836, "epoch": 400} {"train_loss": -5.227266311645508, "global_step": 16837, "epoch": 400} {"train_loss": -5.190528869628906, "global_step": 16838, "epoch": 400} {"train_loss": -5.100949764251709, "global_step": 16839, "epoch": 400} {"train_loss": -5.140163421630859, "global_step": 16840, "epoch": 400} {"train_loss": -5.2079287597111295, "global_step": 16841, "epoch": 400, "train/sim_max_reward_0": 0.1922025055884831, "train/sim_max_reward_1": 0.7673076273543588, "train/sim_max_reward_2": 0.2880133644874099, "train/sim_max_reward_3": 0.07216634607184604, "train/sim_max_reward_4": 0.27652106563850926, "train/sim_max_reward_5": 0.5394116883232399, "test/sim_max_reward_4500000": 0.33545001878982844, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.12478492811296969, "test/sim_max_reward_4500006": 0.030557247257457787, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.04485101166080106, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.42957354962300054, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.6708916423156588, "test/sim_max_reward_4500015": 0.0015612969227477046, "test/sim_max_reward_4500016": 0.016831089196532173, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.16639279695728687, "test/sim_max_reward_4500019": 0.39496762743265895, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.43645387941070074, "test/sim_max_reward_4500022": 0.7444104344088994, "test/sim_max_reward_4500023": 0.9656273902360754, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.4679378684866362, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.7053138004740157, "test/sim_max_reward_4500028": 0.5857400388324212, "test/sim_max_reward_4500029": 0.04163460642148004, "test/sim_max_reward_4500030": 0.20496486565028932, "test/sim_max_reward_4500031": 0.004274515809097813, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.7399685540125306, "test/sim_max_reward_4500035": 0.7332948211497775, "test/sim_max_reward_4500036": 0.5320459650691253, "test/sim_max_reward_4500037": 0.5264109022377542, "test/sim_max_reward_4500038": 0.5778309075703435, "test/sim_max_reward_4500039": 0.764250165271056, "test/sim_max_reward_4500040": 0.29262577930404615, "test/sim_max_reward_4500041": 0.0, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.1175735103924684, "test/sim_max_reward_4500046": 0.08043583468793974, "test/sim_max_reward_4500047": 0.012889389629723542, "test/sim_max_reward_4500048": 0.0073919700154363955, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.35593709957730785, "test/mean_score": 0.21765112123360253, "val_loss": 77607.953125} {"train_loss": -5.303586006164551, "global_step": 16842, "epoch": 401} {"train_loss": -5.204882621765137, "global_step": 16843, "epoch": 401} {"train_loss": -5.13062858581543, "global_step": 16844, "epoch": 401} {"train_loss": -5.148103713989258, "global_step": 16845, "epoch": 401} {"train_loss": -5.150456428527832, "global_step": 16846, "epoch": 401} {"train_loss": -5.2071051597595215, "global_step": 16847, "epoch": 401} {"train_loss": -5.182771682739258, "global_step": 16848, "epoch": 401} {"train_loss": -5.3025102615356445, "global_step": 16849, "epoch": 401} {"train_loss": -5.256984233856201, "global_step": 16850, "epoch": 401} {"train_loss": -5.297150135040283, "global_step": 16851, "epoch": 401} {"train_loss": -5.050752639770508, "global_step": 16852, "epoch": 401} {"train_loss": -5.097265243530273, "global_step": 16853, "epoch": 401} {"train_loss": -5.109759330749512, "global_step": 16854, "epoch": 401} {"train_loss": -5.119234085083008, "global_step": 16855, "epoch": 401} {"train_loss": -5.219633102416992, "global_step": 16856, "epoch": 401} {"train_loss": -5.301267147064209, "global_step": 16857, "epoch": 401} {"train_loss": -5.002651214599609, "global_step": 16858, "epoch": 401} {"train_loss": -5.382798194885254, "global_step": 16859, "epoch": 401} {"train_loss": -5.242814540863037, "global_step": 16860, "epoch": 401} {"train_loss": -5.231002330780029, "global_step": 16861, "epoch": 401} {"train_loss": -5.23695707321167, "global_step": 16862, "epoch": 401} {"train_loss": -5.2217183113098145, "global_step": 16863, "epoch": 401} {"train_loss": -5.241153717041016, "global_step": 16864, "epoch": 401} {"train_loss": -5.304046154022217, "global_step": 16865, "epoch": 401} {"train_loss": -5.280768394470215, "global_step": 16866, "epoch": 401} {"train_loss": -5.235074043273926, "global_step": 16867, "epoch": 401} {"train_loss": -5.053009986877441, "global_step": 16868, "epoch": 401} {"train_loss": -5.320804595947266, "global_step": 16869, "epoch": 401} {"train_loss": -5.2773332595825195, "global_step": 16870, "epoch": 401} {"train_loss": -5.159469127655029, "global_step": 16871, "epoch": 401} {"train_loss": -5.216619491577148, "global_step": 16872, "epoch": 401} {"train_loss": -5.256852149963379, "global_step": 16873, "epoch": 401} {"train_loss": -5.2029314041137695, "global_step": 16874, "epoch": 401} {"train_loss": -5.2884392738342285, "global_step": 16875, "epoch": 401} {"train_loss": -5.268157958984375, "global_step": 16876, "epoch": 401} {"train_loss": -5.310665607452393, "global_step": 16877, "epoch": 401} {"train_loss": -5.224198341369629, "global_step": 16878, "epoch": 401} {"train_loss": -5.237127304077148, "global_step": 16879, "epoch": 401} {"train_loss": -5.297232627868652, "global_step": 16880, "epoch": 401} {"train_loss": -5.370795726776123, "global_step": 16881, "epoch": 401} {"train_loss": -5.2439117431640625, "global_step": 16882, "epoch": 401} {"train_loss": -5.224713893163772, "global_step": 16883, "epoch": 401, "val_loss": 78652.3515625} {"train_loss": -5.287242889404297, "global_step": 16884, "epoch": 402} {"train_loss": -5.171997547149658, "global_step": 16885, "epoch": 402} {"train_loss": -5.241868019104004, "global_step": 16886, "epoch": 402} {"train_loss": -5.2982072830200195, "global_step": 16887, "epoch": 402} {"train_loss": -5.296304702758789, "global_step": 16888, "epoch": 402} {"train_loss": -5.028834819793701, "global_step": 16889, "epoch": 402} {"train_loss": -5.206271171569824, "global_step": 16890, "epoch": 402} {"train_loss": -5.143292427062988, "global_step": 16891, "epoch": 402} {"train_loss": -5.195215225219727, "global_step": 16892, "epoch": 402} {"train_loss": -5.258060932159424, "global_step": 16893, "epoch": 402} {"train_loss": -5.140087604522705, "global_step": 16894, "epoch": 402} {"train_loss": -5.370439529418945, "global_step": 16895, "epoch": 402} {"train_loss": -5.306792259216309, "global_step": 16896, "epoch": 402} {"train_loss": -5.324462890625, "global_step": 16897, "epoch": 402} {"train_loss": -5.325457572937012, "global_step": 16898, "epoch": 402} {"train_loss": -5.229826927185059, "global_step": 16899, "epoch": 402} {"train_loss": -5.182201385498047, "global_step": 16900, "epoch": 402} {"train_loss": -5.226922512054443, "global_step": 16901, "epoch": 402} {"train_loss": -5.239790439605713, "global_step": 16902, "epoch": 402} {"train_loss": -5.141013145446777, "global_step": 16903, "epoch": 402} {"train_loss": -5.280330657958984, "global_step": 16904, "epoch": 402} {"train_loss": -5.2651047706604, "global_step": 16905, "epoch": 402} {"train_loss": -5.349100112915039, "global_step": 16906, "epoch": 402} {"train_loss": -5.2322893142700195, "global_step": 16907, "epoch": 402} {"train_loss": -5.216854095458984, "global_step": 16908, "epoch": 402} {"train_loss": -5.310480117797852, "global_step": 16909, "epoch": 402} {"train_loss": -5.184617519378662, "global_step": 16910, "epoch": 402} {"train_loss": -5.106927394866943, "global_step": 16911, "epoch": 402} {"train_loss": -5.1526689529418945, "global_step": 16912, "epoch": 402} {"train_loss": -5.237087249755859, "global_step": 16913, "epoch": 402} {"train_loss": -5.269265651702881, "global_step": 16914, "epoch": 402} {"train_loss": -5.169069766998291, "global_step": 16915, "epoch": 402} {"train_loss": -5.151697158813477, "global_step": 16916, "epoch": 402} {"train_loss": -5.176757335662842, "global_step": 16917, "epoch": 402} {"train_loss": -5.103043556213379, "global_step": 16918, "epoch": 402} {"train_loss": -5.2357072830200195, "global_step": 16919, "epoch": 402} {"train_loss": -4.998697280883789, "global_step": 16920, "epoch": 402} {"train_loss": -5.371311187744141, "global_step": 16921, "epoch": 402} {"train_loss": -5.010647773742676, "global_step": 16922, "epoch": 402} {"train_loss": -5.134345054626465, "global_step": 16923, "epoch": 402} {"train_loss": -5.215935230255127, "global_step": 16924, "epoch": 402} {"train_loss": -5.212888649531773, "global_step": 16925, "epoch": 402, "val_loss": 77772.3046875} {"train_loss": -5.2496232986450195, "global_step": 16926, "epoch": 403} {"train_loss": -5.164221286773682, "global_step": 16927, "epoch": 403} {"train_loss": -4.995824337005615, "global_step": 16928, "epoch": 403} {"train_loss": -4.9952898025512695, "global_step": 16929, "epoch": 403} {"train_loss": -5.136911392211914, "global_step": 16930, "epoch": 403} {"train_loss": -5.07243013381958, "global_step": 16931, "epoch": 403} {"train_loss": -5.081451416015625, "global_step": 16932, "epoch": 403} {"train_loss": -5.094645977020264, "global_step": 16933, "epoch": 403} {"train_loss": -5.2739105224609375, "global_step": 16934, "epoch": 403} {"train_loss": -5.0363359451293945, "global_step": 16935, "epoch": 403} {"train_loss": -5.115056991577148, "global_step": 16936, "epoch": 403} {"train_loss": -5.225311279296875, "global_step": 16937, "epoch": 403} {"train_loss": -5.042792797088623, "global_step": 16938, "epoch": 403} {"train_loss": -5.205028057098389, "global_step": 16939, "epoch": 403} {"train_loss": -5.099588394165039, "global_step": 16940, "epoch": 403} {"train_loss": -5.106681823730469, "global_step": 16941, "epoch": 403} {"train_loss": -5.104771614074707, "global_step": 16942, "epoch": 403} {"train_loss": -5.2227630615234375, "global_step": 16943, "epoch": 403} {"train_loss": -5.2924885749816895, "global_step": 16944, "epoch": 403} {"train_loss": -5.2086968421936035, "global_step": 16945, "epoch": 403} {"train_loss": -5.152253150939941, "global_step": 16946, "epoch": 403} {"train_loss": -5.266144752502441, "global_step": 16947, "epoch": 403} {"train_loss": -5.198702812194824, "global_step": 16948, "epoch": 403} {"train_loss": -5.086455345153809, "global_step": 16949, "epoch": 403} {"train_loss": -5.235901832580566, "global_step": 16950, "epoch": 403} {"train_loss": -5.153547763824463, "global_step": 16951, "epoch": 403} {"train_loss": -5.146274089813232, "global_step": 16952, "epoch": 403} {"train_loss": -5.226690292358398, "global_step": 16953, "epoch": 403} {"train_loss": -5.097500324249268, "global_step": 16954, "epoch": 403} {"train_loss": -5.197393417358398, "global_step": 16955, "epoch": 403} {"train_loss": -5.282297611236572, "global_step": 16956, "epoch": 403} {"train_loss": -5.1195573806762695, "global_step": 16957, "epoch": 403} {"train_loss": -5.276237487792969, "global_step": 16958, "epoch": 403} {"train_loss": -5.178323745727539, "global_step": 16959, "epoch": 403} {"train_loss": -5.071466445922852, "global_step": 16960, "epoch": 403} {"train_loss": -5.345881462097168, "global_step": 16961, "epoch": 403} {"train_loss": -5.226953983306885, "global_step": 16962, "epoch": 403} {"train_loss": -5.181385040283203, "global_step": 16963, "epoch": 403} {"train_loss": -5.226518630981445, "global_step": 16964, "epoch": 403} {"train_loss": -5.232205390930176, "global_step": 16965, "epoch": 403} {"train_loss": -5.166550159454346, "global_step": 16966, "epoch": 403} {"train_loss": -5.165504898343768, "global_step": 16967, "epoch": 403, "val_loss": 78488.34375} {"train_loss": -5.253275394439697, "global_step": 16968, "epoch": 404} {"train_loss": -5.1568427085876465, "global_step": 16969, "epoch": 404} {"train_loss": -5.184250831604004, "global_step": 16970, "epoch": 404} {"train_loss": -5.1152448654174805, "global_step": 16971, "epoch": 404} {"train_loss": -5.250514984130859, "global_step": 16972, "epoch": 404} {"train_loss": -5.1921844482421875, "global_step": 16973, "epoch": 404} {"train_loss": -5.183599948883057, "global_step": 16974, "epoch": 404} {"train_loss": -5.167135238647461, "global_step": 16975, "epoch": 404} {"train_loss": -5.321341514587402, "global_step": 16976, "epoch": 404} {"train_loss": -5.2611517906188965, "global_step": 16977, "epoch": 404} {"train_loss": -5.245428562164307, "global_step": 16978, "epoch": 404} {"train_loss": -5.171431541442871, "global_step": 16979, "epoch": 404} {"train_loss": -5.1743974685668945, "global_step": 16980, "epoch": 404} {"train_loss": -5.292296409606934, "global_step": 16981, "epoch": 404} {"train_loss": -5.176080703735352, "global_step": 16982, "epoch": 404} {"train_loss": -5.112957000732422, "global_step": 16983, "epoch": 404} {"train_loss": -5.163618087768555, "global_step": 16984, "epoch": 404} {"train_loss": -5.176052093505859, "global_step": 16985, "epoch": 404} {"train_loss": -5.166534423828125, "global_step": 16986, "epoch": 404} {"train_loss": -5.2766876220703125, "global_step": 16987, "epoch": 404} {"train_loss": -5.213024139404297, "global_step": 16988, "epoch": 404} {"train_loss": -5.19276237487793, "global_step": 16989, "epoch": 404} {"train_loss": -5.268377304077148, "global_step": 16990, "epoch": 404} {"train_loss": -5.347201347351074, "global_step": 16991, "epoch": 404} {"train_loss": -5.015067100524902, "global_step": 16992, "epoch": 404} {"train_loss": -5.175970077514648, "global_step": 16993, "epoch": 404} {"train_loss": -5.218207359313965, "global_step": 16994, "epoch": 404} {"train_loss": -5.156134605407715, "global_step": 16995, "epoch": 404} {"train_loss": -5.231796741485596, "global_step": 16996, "epoch": 404} {"train_loss": -5.154813766479492, "global_step": 16997, "epoch": 404} {"train_loss": -5.201179504394531, "global_step": 16998, "epoch": 404} {"train_loss": -5.338109970092773, "global_step": 16999, "epoch": 404} {"train_loss": -5.241605758666992, "global_step": 17000, "epoch": 404} {"train_loss": -5.186185359954834, "global_step": 17001, "epoch": 404} {"train_loss": -5.284136772155762, "global_step": 17002, "epoch": 404} {"train_loss": -5.337617874145508, "global_step": 17003, "epoch": 404} {"train_loss": -5.234892845153809, "global_step": 17004, "epoch": 404} {"train_loss": -5.376776695251465, "global_step": 17005, "epoch": 404} {"train_loss": -5.237470626831055, "global_step": 17006, "epoch": 404} {"train_loss": -5.264410972595215, "global_step": 17007, "epoch": 404} {"train_loss": -5.218817710876465, "global_step": 17008, "epoch": 404} {"train_loss": -5.21896311214992, "global_step": 17009, "epoch": 404, "val_loss": 78540.375} {"train_loss": -5.305751800537109, "global_step": 17010, "epoch": 405} {"train_loss": -5.286307334899902, "global_step": 17011, "epoch": 405} {"train_loss": -5.248703956604004, "global_step": 17012, "epoch": 405} {"train_loss": -5.220582008361816, "global_step": 17013, "epoch": 405} {"train_loss": -5.267663955688477, "global_step": 17014, "epoch": 405} {"train_loss": -4.983353614807129, "global_step": 17015, "epoch": 405} {"train_loss": -5.338849067687988, "global_step": 17016, "epoch": 405} {"train_loss": -5.331068515777588, "global_step": 17017, "epoch": 405} {"train_loss": -5.090018272399902, "global_step": 17018, "epoch": 405} {"train_loss": -5.189873695373535, "global_step": 17019, "epoch": 405} {"train_loss": -5.202070236206055, "global_step": 17020, "epoch": 405} {"train_loss": -5.168832302093506, "global_step": 17021, "epoch": 405} {"train_loss": -5.269719123840332, "global_step": 17022, "epoch": 405} {"train_loss": -5.241875648498535, "global_step": 17023, "epoch": 405} {"train_loss": -5.264379978179932, "global_step": 17024, "epoch": 405} {"train_loss": -5.156406402587891, "global_step": 17025, "epoch": 405} {"train_loss": -5.228668212890625, "global_step": 17026, "epoch": 405} {"train_loss": -5.247768402099609, "global_step": 17027, "epoch": 405} {"train_loss": -4.962989807128906, "global_step": 17028, "epoch": 405} {"train_loss": -5.201647758483887, "global_step": 17029, "epoch": 405} {"train_loss": -5.231243133544922, "global_step": 17030, "epoch": 405} {"train_loss": -5.040858745574951, "global_step": 17031, "epoch": 405} {"train_loss": -5.170656204223633, "global_step": 17032, "epoch": 405} {"train_loss": -5.138819694519043, "global_step": 17033, "epoch": 405} {"train_loss": -5.228322505950928, "global_step": 17034, "epoch": 405} {"train_loss": -5.256546974182129, "global_step": 17035, "epoch": 405} {"train_loss": -5.2708659172058105, "global_step": 17036, "epoch": 405} {"train_loss": -5.417503356933594, "global_step": 17037, "epoch": 405} {"train_loss": -5.126916885375977, "global_step": 17038, "epoch": 405} {"train_loss": -5.133843421936035, "global_step": 17039, "epoch": 405} {"train_loss": -5.137696266174316, "global_step": 17040, "epoch": 405} {"train_loss": -5.337942600250244, "global_step": 17041, "epoch": 405} {"train_loss": -5.141483306884766, "global_step": 17042, "epoch": 405} {"train_loss": -5.209469795227051, "global_step": 17043, "epoch": 405} {"train_loss": -5.336522102355957, "global_step": 17044, "epoch": 405} {"train_loss": -5.068482875823975, "global_step": 17045, "epoch": 405} {"train_loss": -5.132992267608643, "global_step": 17046, "epoch": 405} {"train_loss": -5.311866760253906, "global_step": 17047, "epoch": 405} {"train_loss": -5.180546283721924, "global_step": 17048, "epoch": 405} {"train_loss": -5.180812835693359, "global_step": 17049, "epoch": 405} {"train_loss": -5.217822074890137, "global_step": 17050, "epoch": 405} {"train_loss": -5.206433477855864, "global_step": 17051, "epoch": 405, "val_loss": 78506.2421875} {"train_loss": -5.151535987854004, "global_step": 17052, "epoch": 406} {"train_loss": -5.022541522979736, "global_step": 17053, "epoch": 406} {"train_loss": -5.210086822509766, "global_step": 17054, "epoch": 406} {"train_loss": -5.120203018188477, "global_step": 17055, "epoch": 406} {"train_loss": -5.267765998840332, "global_step": 17056, "epoch": 406} {"train_loss": -5.163564682006836, "global_step": 17057, "epoch": 406} {"train_loss": -5.129521369934082, "global_step": 17058, "epoch": 406} {"train_loss": -5.305083274841309, "global_step": 17059, "epoch": 406} {"train_loss": -5.117430686950684, "global_step": 17060, "epoch": 406} {"train_loss": -5.110939025878906, "global_step": 17061, "epoch": 406} {"train_loss": -5.135322570800781, "global_step": 17062, "epoch": 406} {"train_loss": -5.245833396911621, "global_step": 17063, "epoch": 406} {"train_loss": -5.17759895324707, "global_step": 17064, "epoch": 406} {"train_loss": -5.246853828430176, "global_step": 17065, "epoch": 406} {"train_loss": -5.2805891036987305, "global_step": 17066, "epoch": 406} {"train_loss": -5.252261161804199, "global_step": 17067, "epoch": 406} {"train_loss": -5.3986287117004395, "global_step": 17068, "epoch": 406} {"train_loss": -5.1966376304626465, "global_step": 17069, "epoch": 406} {"train_loss": -5.246532440185547, "global_step": 17070, "epoch": 406} {"train_loss": -5.256500244140625, "global_step": 17071, "epoch": 406} {"train_loss": -5.208524227142334, "global_step": 17072, "epoch": 406} {"train_loss": -5.188473701477051, "global_step": 17073, "epoch": 406} {"train_loss": -5.275581359863281, "global_step": 17074, "epoch": 406} {"train_loss": -5.06566858291626, "global_step": 17075, "epoch": 406} {"train_loss": -5.26310396194458, "global_step": 17076, "epoch": 406} {"train_loss": -5.198189735412598, "global_step": 17077, "epoch": 406} {"train_loss": -5.170339584350586, "global_step": 17078, "epoch": 406} {"train_loss": -5.123678207397461, "global_step": 17079, "epoch": 406} {"train_loss": -5.365120887756348, "global_step": 17080, "epoch": 406} {"train_loss": -5.164808750152588, "global_step": 17081, "epoch": 406} {"train_loss": -5.173854351043701, "global_step": 17082, "epoch": 406} {"train_loss": -5.321046829223633, "global_step": 17083, "epoch": 406} {"train_loss": -5.154422760009766, "global_step": 17084, "epoch": 406} {"train_loss": -5.266101837158203, "global_step": 17085, "epoch": 406} {"train_loss": -5.1134233474731445, "global_step": 17086, "epoch": 406} {"train_loss": -5.212368011474609, "global_step": 17087, "epoch": 406} {"train_loss": -5.378645896911621, "global_step": 17088, "epoch": 406} {"train_loss": -5.279862403869629, "global_step": 17089, "epoch": 406} {"train_loss": -5.270230293273926, "global_step": 17090, "epoch": 406} {"train_loss": -5.327191352844238, "global_step": 17091, "epoch": 406} {"train_loss": -5.227448463439941, "global_step": 17092, "epoch": 406} {"train_loss": -5.2139802660260886, "global_step": 17093, "epoch": 406, "val_loss": 78047.6640625} {"train_loss": -5.394411087036133, "global_step": 17094, "epoch": 407} {"train_loss": -5.321126937866211, "global_step": 17095, "epoch": 407} {"train_loss": -5.32277250289917, "global_step": 17096, "epoch": 407} {"train_loss": -5.185081958770752, "global_step": 17097, "epoch": 407} {"train_loss": -5.246329307556152, "global_step": 17098, "epoch": 407} {"train_loss": -5.225823402404785, "global_step": 17099, "epoch": 407} {"train_loss": -5.241183280944824, "global_step": 17100, "epoch": 407} {"train_loss": -5.081727981567383, "global_step": 17101, "epoch": 407} {"train_loss": -5.200674533843994, "global_step": 17102, "epoch": 407} {"train_loss": -5.301563262939453, "global_step": 17103, "epoch": 407} {"train_loss": -5.183160781860352, "global_step": 17104, "epoch": 407} {"train_loss": -5.176369667053223, "global_step": 17105, "epoch": 407} {"train_loss": -5.2931132316589355, "global_step": 17106, "epoch": 407} {"train_loss": -5.2092180252075195, "global_step": 17107, "epoch": 407} {"train_loss": -5.266841888427734, "global_step": 17108, "epoch": 407} {"train_loss": -5.0890703201293945, "global_step": 17109, "epoch": 407} {"train_loss": -5.285550594329834, "global_step": 17110, "epoch": 407} {"train_loss": -5.209327697753906, "global_step": 17111, "epoch": 407} {"train_loss": -5.184013366699219, "global_step": 17112, "epoch": 407} {"train_loss": -5.123752593994141, "global_step": 17113, "epoch": 407} {"train_loss": -5.229328155517578, "global_step": 17114, "epoch": 407} {"train_loss": -5.049583435058594, "global_step": 17115, "epoch": 407} {"train_loss": -5.2004714012146, "global_step": 17116, "epoch": 407} {"train_loss": -4.9701642990112305, "global_step": 17117, "epoch": 407} {"train_loss": -5.225677490234375, "global_step": 17118, "epoch": 407} {"train_loss": -5.167759418487549, "global_step": 17119, "epoch": 407} {"train_loss": -5.005478858947754, "global_step": 17120, "epoch": 407} {"train_loss": -5.40162992477417, "global_step": 17121, "epoch": 407} {"train_loss": -5.070488452911377, "global_step": 17122, "epoch": 407} {"train_loss": -5.120848655700684, "global_step": 17123, "epoch": 407} {"train_loss": -4.995032787322998, "global_step": 17124, "epoch": 407} {"train_loss": -5.243474006652832, "global_step": 17125, "epoch": 407} {"train_loss": -5.031982421875, "global_step": 17126, "epoch": 407} {"train_loss": -5.093020439147949, "global_step": 17127, "epoch": 407} {"train_loss": -5.242040157318115, "global_step": 17128, "epoch": 407} {"train_loss": -5.155349254608154, "global_step": 17129, "epoch": 407} {"train_loss": -5.17978572845459, "global_step": 17130, "epoch": 407} {"train_loss": -5.018579483032227, "global_step": 17131, "epoch": 407} {"train_loss": -5.1330180168151855, "global_step": 17132, "epoch": 407} {"train_loss": -5.184285640716553, "global_step": 17133, "epoch": 407} {"train_loss": -5.104718208312988, "global_step": 17134, "epoch": 407} {"train_loss": -5.179220710481916, "global_step": 17135, "epoch": 407, "val_loss": 78152.140625} {"train_loss": -5.035970687866211, "global_step": 17136, "epoch": 408} {"train_loss": -5.1282806396484375, "global_step": 17137, "epoch": 408} {"train_loss": -5.185199737548828, "global_step": 17138, "epoch": 408} {"train_loss": -5.316015720367432, "global_step": 17139, "epoch": 408} {"train_loss": -5.241379737854004, "global_step": 17140, "epoch": 408} {"train_loss": -5.159943103790283, "global_step": 17141, "epoch": 408} {"train_loss": -5.365819931030273, "global_step": 17142, "epoch": 408} {"train_loss": -5.142556190490723, "global_step": 17143, "epoch": 408} {"train_loss": -5.309992790222168, "global_step": 17144, "epoch": 408} {"train_loss": -5.310327529907227, "global_step": 17145, "epoch": 408} {"train_loss": -5.2910871505737305, "global_step": 17146, "epoch": 408} {"train_loss": -5.273935794830322, "global_step": 17147, "epoch": 408} {"train_loss": -5.234973907470703, "global_step": 17148, "epoch": 408} {"train_loss": -5.229418754577637, "global_step": 17149, "epoch": 408} {"train_loss": -5.28237247467041, "global_step": 17150, "epoch": 408} {"train_loss": -5.307831764221191, "global_step": 17151, "epoch": 408} {"train_loss": -5.257743835449219, "global_step": 17152, "epoch": 408} {"train_loss": -5.187739372253418, "global_step": 17153, "epoch": 408} {"train_loss": -5.311814785003662, "global_step": 17154, "epoch": 408} {"train_loss": -5.0939435958862305, "global_step": 17155, "epoch": 408} {"train_loss": -5.156929969787598, "global_step": 17156, "epoch": 408} {"train_loss": -5.292296409606934, "global_step": 17157, "epoch": 408} {"train_loss": -5.192791938781738, "global_step": 17158, "epoch": 408} {"train_loss": -5.292758941650391, "global_step": 17159, "epoch": 408} {"train_loss": -5.239985942840576, "global_step": 17160, "epoch": 408} {"train_loss": -5.176814079284668, "global_step": 17161, "epoch": 408} {"train_loss": -5.29136848449707, "global_step": 17162, "epoch": 408} {"train_loss": -5.318025588989258, "global_step": 17163, "epoch": 408} {"train_loss": -5.146115779876709, "global_step": 17164, "epoch": 408} {"train_loss": -5.227571964263916, "global_step": 17165, "epoch": 408} {"train_loss": -5.1169633865356445, "global_step": 17166, "epoch": 408} {"train_loss": -5.139084815979004, "global_step": 17167, "epoch": 408} {"train_loss": -5.2274651527404785, "global_step": 17168, "epoch": 408} {"train_loss": -5.342432975769043, "global_step": 17169, "epoch": 408} {"train_loss": -5.137075424194336, "global_step": 17170, "epoch": 408} {"train_loss": -5.2212748527526855, "global_step": 17171, "epoch": 408} {"train_loss": -5.067849159240723, "global_step": 17172, "epoch": 408} {"train_loss": -5.146397590637207, "global_step": 17173, "epoch": 408} {"train_loss": -5.1024041175842285, "global_step": 17174, "epoch": 408} {"train_loss": -5.376230239868164, "global_step": 17175, "epoch": 408} {"train_loss": -5.234916687011719, "global_step": 17176, "epoch": 408} {"train_loss": -5.221858115423293, "global_step": 17177, "epoch": 408, "val_loss": 77521.3515625} {"train_loss": -5.30368709564209, "global_step": 17178, "epoch": 409} {"train_loss": -5.040388107299805, "global_step": 17179, "epoch": 409} {"train_loss": -5.112967491149902, "global_step": 17180, "epoch": 409} {"train_loss": -5.181238174438477, "global_step": 17181, "epoch": 409} {"train_loss": -5.220298767089844, "global_step": 17182, "epoch": 409} {"train_loss": -5.2617998123168945, "global_step": 17183, "epoch": 409} {"train_loss": -5.292008876800537, "global_step": 17184, "epoch": 409} {"train_loss": -5.122209548950195, "global_step": 17185, "epoch": 409} {"train_loss": -5.229828357696533, "global_step": 17186, "epoch": 409} {"train_loss": -5.2718186378479, "global_step": 17187, "epoch": 409} {"train_loss": -5.187741756439209, "global_step": 17188, "epoch": 409} {"train_loss": -5.240817546844482, "global_step": 17189, "epoch": 409} {"train_loss": -5.19193696975708, "global_step": 17190, "epoch": 409} {"train_loss": -5.195009231567383, "global_step": 17191, "epoch": 409} {"train_loss": -5.274883270263672, "global_step": 17192, "epoch": 409} {"train_loss": -5.2615814208984375, "global_step": 17193, "epoch": 409} {"train_loss": -5.286492347717285, "global_step": 17194, "epoch": 409} {"train_loss": -5.281250953674316, "global_step": 17195, "epoch": 409} {"train_loss": -5.305940628051758, "global_step": 17196, "epoch": 409} {"train_loss": -5.161808013916016, "global_step": 17197, "epoch": 409} {"train_loss": -5.227154731750488, "global_step": 17198, "epoch": 409} {"train_loss": -5.216137886047363, "global_step": 17199, "epoch": 409} {"train_loss": -5.164369583129883, "global_step": 17200, "epoch": 409} {"train_loss": -5.296614170074463, "global_step": 17201, "epoch": 409} {"train_loss": -5.245256423950195, "global_step": 17202, "epoch": 409} {"train_loss": -5.280445098876953, "global_step": 17203, "epoch": 409} {"train_loss": -5.320966720581055, "global_step": 17204, "epoch": 409} {"train_loss": -5.2528395652771, "global_step": 17205, "epoch": 409} {"train_loss": -5.234128475189209, "global_step": 17206, "epoch": 409} {"train_loss": -5.3792009353637695, "global_step": 17207, "epoch": 409} {"train_loss": -5.24832010269165, "global_step": 17208, "epoch": 409} {"train_loss": -5.172667503356934, "global_step": 17209, "epoch": 409} {"train_loss": -5.20515775680542, "global_step": 17210, "epoch": 409} {"train_loss": -5.342069625854492, "global_step": 17211, "epoch": 409} {"train_loss": -5.176156997680664, "global_step": 17212, "epoch": 409} {"train_loss": -5.314404010772705, "global_step": 17213, "epoch": 409} {"train_loss": -5.292487144470215, "global_step": 17214, "epoch": 409} {"train_loss": -5.262218952178955, "global_step": 17215, "epoch": 409} {"train_loss": -5.29602575302124, "global_step": 17216, "epoch": 409} {"train_loss": -5.1417036056518555, "global_step": 17217, "epoch": 409} {"train_loss": -5.27572774887085, "global_step": 17218, "epoch": 409} {"train_loss": -5.236981153488159, "global_step": 17219, "epoch": 409, "val_loss": 78319.3125} {"train_loss": -5.220052719116211, "global_step": 17220, "epoch": 410} {"train_loss": -5.177947044372559, "global_step": 17221, "epoch": 410} {"train_loss": -5.219369888305664, "global_step": 17222, "epoch": 410} {"train_loss": -5.206908226013184, "global_step": 17223, "epoch": 410} {"train_loss": -5.143495559692383, "global_step": 17224, "epoch": 410} {"train_loss": -5.185039520263672, "global_step": 17225, "epoch": 410} {"train_loss": -5.22537088394165, "global_step": 17226, "epoch": 410} {"train_loss": -5.242363929748535, "global_step": 17227, "epoch": 410} {"train_loss": -5.2254791259765625, "global_step": 17228, "epoch": 410} {"train_loss": -5.239428997039795, "global_step": 17229, "epoch": 410} {"train_loss": -5.280361175537109, "global_step": 17230, "epoch": 410} {"train_loss": -5.185820579528809, "global_step": 17231, "epoch": 410} {"train_loss": -5.2744879722595215, "global_step": 17232, "epoch": 410} {"train_loss": -5.23514461517334, "global_step": 17233, "epoch": 410} {"train_loss": -5.306354522705078, "global_step": 17234, "epoch": 410} {"train_loss": -5.070206642150879, "global_step": 17235, "epoch": 410} {"train_loss": -5.109923362731934, "global_step": 17236, "epoch": 410} {"train_loss": -5.151267051696777, "global_step": 17237, "epoch": 410} {"train_loss": -5.239748477935791, "global_step": 17238, "epoch": 410} {"train_loss": -5.286907196044922, "global_step": 17239, "epoch": 410} {"train_loss": -5.1457366943359375, "global_step": 17240, "epoch": 410} {"train_loss": -5.254199028015137, "global_step": 17241, "epoch": 410} {"train_loss": -5.183915138244629, "global_step": 17242, "epoch": 410} {"train_loss": -5.153141975402832, "global_step": 17243, "epoch": 410} {"train_loss": -5.1145806312561035, "global_step": 17244, "epoch": 410} {"train_loss": -5.413762092590332, "global_step": 17245, "epoch": 410} {"train_loss": -5.162225723266602, "global_step": 17246, "epoch": 410} {"train_loss": -4.803018569946289, "global_step": 17247, "epoch": 410} {"train_loss": -5.202215671539307, "global_step": 17248, "epoch": 410} {"train_loss": -5.199686527252197, "global_step": 17249, "epoch": 410} {"train_loss": -5.156606674194336, "global_step": 17250, "epoch": 410} {"train_loss": -5.2530107498168945, "global_step": 17251, "epoch": 410} {"train_loss": -5.267316818237305, "global_step": 17252, "epoch": 410} {"train_loss": -5.091996669769287, "global_step": 17253, "epoch": 410} {"train_loss": -5.344169616699219, "global_step": 17254, "epoch": 410} {"train_loss": -5.2083892822265625, "global_step": 17255, "epoch": 410} {"train_loss": -5.15179967880249, "global_step": 17256, "epoch": 410} {"train_loss": -5.31071662902832, "global_step": 17257, "epoch": 410} {"train_loss": -5.271692276000977, "global_step": 17258, "epoch": 410} {"train_loss": -5.170569896697998, "global_step": 17259, "epoch": 410} {"train_loss": -5.215333938598633, "global_step": 17260, "epoch": 410} {"train_loss": -5.202381610870361, "global_step": 17261, "epoch": 410, "val_loss": 78152.0546875} {"train_loss": -5.309353351593018, "global_step": 17262, "epoch": 411} {"train_loss": -5.186992645263672, "global_step": 17263, "epoch": 411} {"train_loss": -5.166370868682861, "global_step": 17264, "epoch": 411} {"train_loss": -5.239402770996094, "global_step": 17265, "epoch": 411} {"train_loss": -5.3162713050842285, "global_step": 17266, "epoch": 411} {"train_loss": -5.115268230438232, "global_step": 17267, "epoch": 411} {"train_loss": -5.188443183898926, "global_step": 17268, "epoch": 411} {"train_loss": -5.215439319610596, "global_step": 17269, "epoch": 411} {"train_loss": -5.1845598220825195, "global_step": 17270, "epoch": 411} {"train_loss": -5.169530391693115, "global_step": 17271, "epoch": 411} {"train_loss": -5.170071601867676, "global_step": 17272, "epoch": 411} {"train_loss": -5.145852088928223, "global_step": 17273, "epoch": 411} {"train_loss": -4.992566108703613, "global_step": 17274, "epoch": 411} {"train_loss": -5.1996169090271, "global_step": 17275, "epoch": 411} {"train_loss": -5.3026323318481445, "global_step": 17276, "epoch": 411} {"train_loss": -5.146437644958496, "global_step": 17277, "epoch": 411} {"train_loss": -5.199235916137695, "global_step": 17278, "epoch": 411} {"train_loss": -5.233636379241943, "global_step": 17279, "epoch": 411} {"train_loss": -5.228706359863281, "global_step": 17280, "epoch": 411} {"train_loss": -5.27595329284668, "global_step": 17281, "epoch": 411} {"train_loss": -5.183643341064453, "global_step": 17282, "epoch": 411} {"train_loss": -5.2245774269104, "global_step": 17283, "epoch": 411} {"train_loss": -5.208392143249512, "global_step": 17284, "epoch": 411} {"train_loss": -5.2235002517700195, "global_step": 17285, "epoch": 411} {"train_loss": -5.304568290710449, "global_step": 17286, "epoch": 411} {"train_loss": -5.28133487701416, "global_step": 17287, "epoch": 411} {"train_loss": -5.266107082366943, "global_step": 17288, "epoch": 411} {"train_loss": -5.38493537902832, "global_step": 17289, "epoch": 411} {"train_loss": -5.339217185974121, "global_step": 17290, "epoch": 411} {"train_loss": -5.150847911834717, "global_step": 17291, "epoch": 411} {"train_loss": -5.24560546875, "global_step": 17292, "epoch": 411} {"train_loss": -5.284870147705078, "global_step": 17293, "epoch": 411} {"train_loss": -5.268979072570801, "global_step": 17294, "epoch": 411} {"train_loss": -5.25048828125, "global_step": 17295, "epoch": 411} {"train_loss": -5.234452247619629, "global_step": 17296, "epoch": 411} {"train_loss": -5.313356876373291, "global_step": 17297, "epoch": 411} {"train_loss": -5.196106433868408, "global_step": 17298, "epoch": 411} {"train_loss": -5.058314800262451, "global_step": 17299, "epoch": 411} {"train_loss": -5.105393409729004, "global_step": 17300, "epoch": 411} {"train_loss": -5.250240325927734, "global_step": 17301, "epoch": 411} {"train_loss": -5.350866317749023, "global_step": 17302, "epoch": 411} {"train_loss": -5.219345921561832, "global_step": 17303, "epoch": 411, "val_loss": 78286.9609375} {"train_loss": -5.185910224914551, "global_step": 17304, "epoch": 412} {"train_loss": -5.267717361450195, "global_step": 17305, "epoch": 412} {"train_loss": -5.193475723266602, "global_step": 17306, "epoch": 412} {"train_loss": -5.256504535675049, "global_step": 17307, "epoch": 412} {"train_loss": -5.264802932739258, "global_step": 17308, "epoch": 412} {"train_loss": -5.241244316101074, "global_step": 17309, "epoch": 412} {"train_loss": -5.245700359344482, "global_step": 17310, "epoch": 412} {"train_loss": -5.112997055053711, "global_step": 17311, "epoch": 412} {"train_loss": -5.1257405281066895, "global_step": 17312, "epoch": 412} {"train_loss": -5.230132102966309, "global_step": 17313, "epoch": 412} {"train_loss": -5.221663951873779, "global_step": 17314, "epoch": 412} {"train_loss": -5.239091873168945, "global_step": 17315, "epoch": 412} {"train_loss": -5.218608856201172, "global_step": 17316, "epoch": 412} {"train_loss": -5.274521350860596, "global_step": 17317, "epoch": 412} {"train_loss": -5.262981414794922, "global_step": 17318, "epoch": 412} {"train_loss": -5.137077808380127, "global_step": 17319, "epoch": 412} {"train_loss": -5.236209392547607, "global_step": 17320, "epoch": 412} {"train_loss": -5.350727081298828, "global_step": 17321, "epoch": 412} {"train_loss": -5.206013202667236, "global_step": 17322, "epoch": 412} {"train_loss": -5.263972282409668, "global_step": 17323, "epoch": 412} {"train_loss": -5.214494705200195, "global_step": 17324, "epoch": 412} {"train_loss": -5.16700553894043, "global_step": 17325, "epoch": 412} {"train_loss": -5.230453014373779, "global_step": 17326, "epoch": 412} {"train_loss": -5.242222785949707, "global_step": 17327, "epoch": 412} {"train_loss": -5.345122814178467, "global_step": 17328, "epoch": 412} {"train_loss": -5.21558952331543, "global_step": 17329, "epoch": 412} {"train_loss": -5.321475028991699, "global_step": 17330, "epoch": 412} {"train_loss": -5.33123779296875, "global_step": 17331, "epoch": 412} {"train_loss": -5.3119730949401855, "global_step": 17332, "epoch": 412} {"train_loss": -5.171788215637207, "global_step": 17333, "epoch": 412} {"train_loss": -5.151165008544922, "global_step": 17334, "epoch": 412} {"train_loss": -5.314291000366211, "global_step": 17335, "epoch": 412} {"train_loss": -5.076210021972656, "global_step": 17336, "epoch": 412} {"train_loss": -5.025256633758545, "global_step": 17337, "epoch": 412} {"train_loss": -5.303136825561523, "global_step": 17338, "epoch": 412} {"train_loss": -5.213325023651123, "global_step": 17339, "epoch": 412} {"train_loss": -5.218785285949707, "global_step": 17340, "epoch": 412} {"train_loss": -5.172116279602051, "global_step": 17341, "epoch": 412} {"train_loss": -5.057466506958008, "global_step": 17342, "epoch": 412} {"train_loss": -5.099637985229492, "global_step": 17343, "epoch": 412} {"train_loss": -5.325827121734619, "global_step": 17344, "epoch": 412} {"train_loss": -5.218483981632051, "global_step": 17345, "epoch": 412, "val_loss": 78108.9296875} {"train_loss": -5.286638259887695, "global_step": 17346, "epoch": 413} {"train_loss": -5.321951389312744, "global_step": 17347, "epoch": 413} {"train_loss": -5.202439308166504, "global_step": 17348, "epoch": 413} {"train_loss": -5.2570013999938965, "global_step": 17349, "epoch": 413} {"train_loss": -5.37210750579834, "global_step": 17350, "epoch": 413} {"train_loss": -5.16016149520874, "global_step": 17351, "epoch": 413} {"train_loss": -5.100637912750244, "global_step": 17352, "epoch": 413} {"train_loss": -5.271540641784668, "global_step": 17353, "epoch": 413} {"train_loss": -5.227436542510986, "global_step": 17354, "epoch": 413} {"train_loss": -5.194199562072754, "global_step": 17355, "epoch": 413} {"train_loss": -5.278694152832031, "global_step": 17356, "epoch": 413} {"train_loss": -5.390012264251709, "global_step": 17357, "epoch": 413} {"train_loss": -5.351940155029297, "global_step": 17358, "epoch": 413} {"train_loss": -5.342813491821289, "global_step": 17359, "epoch": 413} {"train_loss": -5.352846145629883, "global_step": 17360, "epoch": 413} {"train_loss": -5.249762535095215, "global_step": 17361, "epoch": 413} {"train_loss": -5.247642517089844, "global_step": 17362, "epoch": 413} {"train_loss": -5.209632396697998, "global_step": 17363, "epoch": 413} {"train_loss": -5.19581413269043, "global_step": 17364, "epoch": 413} {"train_loss": -5.258392333984375, "global_step": 17365, "epoch": 413} {"train_loss": -5.044383525848389, "global_step": 17366, "epoch": 413} {"train_loss": -5.232536315917969, "global_step": 17367, "epoch": 413} {"train_loss": -4.873200416564941, "global_step": 17368, "epoch": 413} {"train_loss": -4.647281169891357, "global_step": 17369, "epoch": 413} {"train_loss": -4.87760066986084, "global_step": 17370, "epoch": 413} {"train_loss": -4.821813583374023, "global_step": 17371, "epoch": 413} {"train_loss": -5.139688014984131, "global_step": 17372, "epoch": 413} {"train_loss": -4.913416862487793, "global_step": 17373, "epoch": 413} {"train_loss": -5.141122817993164, "global_step": 17374, "epoch": 413} {"train_loss": -5.006973743438721, "global_step": 17375, "epoch": 413} {"train_loss": -5.087397575378418, "global_step": 17376, "epoch": 413} {"train_loss": -4.977478504180908, "global_step": 17377, "epoch": 413} {"train_loss": -5.191822052001953, "global_step": 17378, "epoch": 413} {"train_loss": -5.022616386413574, "global_step": 17379, "epoch": 413} {"train_loss": -5.13118839263916, "global_step": 17380, "epoch": 413} {"train_loss": -5.1382293701171875, "global_step": 17381, "epoch": 413} {"train_loss": -5.192132949829102, "global_step": 17382, "epoch": 413} {"train_loss": -5.168686866760254, "global_step": 17383, "epoch": 413} {"train_loss": -5.206418514251709, "global_step": 17384, "epoch": 413} {"train_loss": -5.098698139190674, "global_step": 17385, "epoch": 413} {"train_loss": -5.053463935852051, "global_step": 17386, "epoch": 413} {"train_loss": -5.150199458712623, "global_step": 17387, "epoch": 413, "val_loss": 78432.1875} {"train_loss": -5.2377095222473145, "global_step": 17388, "epoch": 414} {"train_loss": -5.1138715744018555, "global_step": 17389, "epoch": 414} {"train_loss": -5.201268672943115, "global_step": 17390, "epoch": 414} {"train_loss": -5.191592693328857, "global_step": 17391, "epoch": 414} {"train_loss": -5.30019474029541, "global_step": 17392, "epoch": 414} {"train_loss": -5.385389804840088, "global_step": 17393, "epoch": 414} {"train_loss": -5.217798709869385, "global_step": 17394, "epoch": 414} {"train_loss": -5.3473663330078125, "global_step": 17395, "epoch": 414} {"train_loss": -5.287877082824707, "global_step": 17396, "epoch": 414} {"train_loss": -5.259902477264404, "global_step": 17397, "epoch": 414} {"train_loss": -5.049476146697998, "global_step": 17398, "epoch": 414} {"train_loss": -5.320570945739746, "global_step": 17399, "epoch": 414} {"train_loss": -5.135509490966797, "global_step": 17400, "epoch": 414} {"train_loss": -5.27085018157959, "global_step": 17401, "epoch": 414} {"train_loss": -5.184451103210449, "global_step": 17402, "epoch": 414} {"train_loss": -5.256992816925049, "global_step": 17403, "epoch": 414} {"train_loss": -5.288935661315918, "global_step": 17404, "epoch": 414} {"train_loss": -5.296139717102051, "global_step": 17405, "epoch": 414} {"train_loss": -5.240752220153809, "global_step": 17406, "epoch": 414} {"train_loss": -5.091644763946533, "global_step": 17407, "epoch": 414} {"train_loss": -5.185747146606445, "global_step": 17408, "epoch": 414} {"train_loss": -5.111800193786621, "global_step": 17409, "epoch": 414} {"train_loss": -5.2883710861206055, "global_step": 17410, "epoch": 414} {"train_loss": -5.379982948303223, "global_step": 17411, "epoch": 414} {"train_loss": -5.164141654968262, "global_step": 17412, "epoch": 414} {"train_loss": -5.220871925354004, "global_step": 17413, "epoch": 414} {"train_loss": -5.314694881439209, "global_step": 17414, "epoch": 414} {"train_loss": -5.2001142501831055, "global_step": 17415, "epoch": 414} {"train_loss": -5.199487686157227, "global_step": 17416, "epoch": 414} {"train_loss": -5.270199775695801, "global_step": 17417, "epoch": 414} {"train_loss": -5.239343643188477, "global_step": 17418, "epoch": 414} {"train_loss": -5.413280963897705, "global_step": 17419, "epoch": 414} {"train_loss": -5.1699676513671875, "global_step": 17420, "epoch": 414} {"train_loss": -5.146154880523682, "global_step": 17421, "epoch": 414} {"train_loss": -5.279532432556152, "global_step": 17422, "epoch": 414} {"train_loss": -5.205099582672119, "global_step": 17423, "epoch": 414} {"train_loss": -5.144351959228516, "global_step": 17424, "epoch": 414} {"train_loss": -5.249724388122559, "global_step": 17425, "epoch": 414} {"train_loss": -5.334949493408203, "global_step": 17426, "epoch": 414} {"train_loss": -5.288760185241699, "global_step": 17427, "epoch": 414} {"train_loss": -5.186769485473633, "global_step": 17428, "epoch": 414} {"train_loss": -5.2338081655048185, "global_step": 17429, "epoch": 414, "val_loss": 77767.3046875} {"train_loss": -5.205676555633545, "global_step": 17430, "epoch": 415} {"train_loss": -5.235233783721924, "global_step": 17431, "epoch": 415} {"train_loss": -5.140913963317871, "global_step": 17432, "epoch": 415} {"train_loss": -5.368296146392822, "global_step": 17433, "epoch": 415} {"train_loss": -5.33972692489624, "global_step": 17434, "epoch": 415} {"train_loss": -5.281647682189941, "global_step": 17435, "epoch": 415} {"train_loss": -5.2690629959106445, "global_step": 17436, "epoch": 415} {"train_loss": -5.2375383377075195, "global_step": 17437, "epoch": 415} {"train_loss": -5.337642192840576, "global_step": 17438, "epoch": 415} {"train_loss": -5.194511413574219, "global_step": 17439, "epoch": 415} {"train_loss": -5.315128326416016, "global_step": 17440, "epoch": 415} {"train_loss": -5.258254051208496, "global_step": 17441, "epoch": 415} {"train_loss": -5.219795227050781, "global_step": 17442, "epoch": 415} {"train_loss": -5.286473274230957, "global_step": 17443, "epoch": 415} {"train_loss": -5.266385555267334, "global_step": 17444, "epoch": 415} {"train_loss": -5.212204933166504, "global_step": 17445, "epoch": 415} {"train_loss": -5.209572792053223, "global_step": 17446, "epoch": 415} {"train_loss": -5.367036819458008, "global_step": 17447, "epoch": 415} {"train_loss": -5.326850414276123, "global_step": 17448, "epoch": 415} {"train_loss": -5.165246963500977, "global_step": 17449, "epoch": 415} {"train_loss": -5.26451301574707, "global_step": 17450, "epoch": 415} {"train_loss": -5.178274631500244, "global_step": 17451, "epoch": 415} {"train_loss": -5.1776275634765625, "global_step": 17452, "epoch": 415} {"train_loss": -5.381806373596191, "global_step": 17453, "epoch": 415} {"train_loss": -5.194232940673828, "global_step": 17454, "epoch": 415} {"train_loss": -5.231866359710693, "global_step": 17455, "epoch": 415} {"train_loss": -5.426885604858398, "global_step": 17456, "epoch": 415} {"train_loss": -5.104861259460449, "global_step": 17457, "epoch": 415} {"train_loss": -5.241359710693359, "global_step": 17458, "epoch": 415} {"train_loss": -5.3115081787109375, "global_step": 17459, "epoch": 415} {"train_loss": -5.182642459869385, "global_step": 17460, "epoch": 415} {"train_loss": -5.164890766143799, "global_step": 17461, "epoch": 415} {"train_loss": -5.146624565124512, "global_step": 17462, "epoch": 415} {"train_loss": -5.134844779968262, "global_step": 17463, "epoch": 415} {"train_loss": -5.226884841918945, "global_step": 17464, "epoch": 415} {"train_loss": -5.146777629852295, "global_step": 17465, "epoch": 415} {"train_loss": -5.21027946472168, "global_step": 17466, "epoch": 415} {"train_loss": -5.242712020874023, "global_step": 17467, "epoch": 415} {"train_loss": -5.104082107543945, "global_step": 17468, "epoch": 415} {"train_loss": -5.291862487792969, "global_step": 17469, "epoch": 415} {"train_loss": -5.222625732421875, "global_step": 17470, "epoch": 415} {"train_loss": -5.237555776323591, "global_step": 17471, "epoch": 415, "val_loss": 76843.5} {"train_loss": -5.332711219787598, "global_step": 17472, "epoch": 416} {"train_loss": -5.191250324249268, "global_step": 17473, "epoch": 416} {"train_loss": -5.187231063842773, "global_step": 17474, "epoch": 416} {"train_loss": -5.359479904174805, "global_step": 17475, "epoch": 416} {"train_loss": -5.385407447814941, "global_step": 17476, "epoch": 416} {"train_loss": -5.185800552368164, "global_step": 17477, "epoch": 416} {"train_loss": -5.150512218475342, "global_step": 17478, "epoch": 416} {"train_loss": -5.260307312011719, "global_step": 17479, "epoch": 416} {"train_loss": -5.227165222167969, "global_step": 17480, "epoch": 416} {"train_loss": -5.235227108001709, "global_step": 17481, "epoch": 416} {"train_loss": -5.222706317901611, "global_step": 17482, "epoch": 416} {"train_loss": -5.307711124420166, "global_step": 17483, "epoch": 416} {"train_loss": -5.141175270080566, "global_step": 17484, "epoch": 416} {"train_loss": -5.14182710647583, "global_step": 17485, "epoch": 416} {"train_loss": -5.3808183670043945, "global_step": 17486, "epoch": 416} {"train_loss": -5.214404106140137, "global_step": 17487, "epoch": 416} {"train_loss": -5.164312362670898, "global_step": 17488, "epoch": 416} {"train_loss": -5.109107971191406, "global_step": 17489, "epoch": 416} {"train_loss": -5.158143997192383, "global_step": 17490, "epoch": 416} {"train_loss": -5.327610015869141, "global_step": 17491, "epoch": 416} {"train_loss": -5.365077972412109, "global_step": 17492, "epoch": 416} {"train_loss": -5.226958274841309, "global_step": 17493, "epoch": 416} {"train_loss": -5.226970672607422, "global_step": 17494, "epoch": 416} {"train_loss": -5.115579605102539, "global_step": 17495, "epoch": 416} {"train_loss": -5.371769905090332, "global_step": 17496, "epoch": 416} {"train_loss": -5.243408679962158, "global_step": 17497, "epoch": 416} {"train_loss": -5.341602325439453, "global_step": 17498, "epoch": 416} {"train_loss": -5.270648002624512, "global_step": 17499, "epoch": 416} {"train_loss": -5.360691070556641, "global_step": 17500, "epoch": 416} {"train_loss": -5.228658676147461, "global_step": 17501, "epoch": 416} {"train_loss": -5.04646110534668, "global_step": 17502, "epoch": 416} {"train_loss": -5.2312092781066895, "global_step": 17503, "epoch": 416} {"train_loss": -5.173125743865967, "global_step": 17504, "epoch": 416} {"train_loss": -5.2281694412231445, "global_step": 17505, "epoch": 416} {"train_loss": -5.340320587158203, "global_step": 17506, "epoch": 416} {"train_loss": -5.223173141479492, "global_step": 17507, "epoch": 416} {"train_loss": -5.3679914474487305, "global_step": 17508, "epoch": 416} {"train_loss": -5.0678510665893555, "global_step": 17509, "epoch": 416} {"train_loss": -5.257486343383789, "global_step": 17510, "epoch": 416} {"train_loss": -5.219057083129883, "global_step": 17511, "epoch": 416} {"train_loss": -5.108341217041016, "global_step": 17512, "epoch": 416} {"train_loss": -5.235449393590291, "global_step": 17513, "epoch": 416, "val_loss": 78087.015625} {"train_loss": -5.207355976104736, "global_step": 17514, "epoch": 417} {"train_loss": -5.253298759460449, "global_step": 17515, "epoch": 417} {"train_loss": -5.2839436531066895, "global_step": 17516, "epoch": 417} {"train_loss": -5.1742706298828125, "global_step": 17517, "epoch": 417} {"train_loss": -5.327308177947998, "global_step": 17518, "epoch": 417} {"train_loss": -5.203052997589111, "global_step": 17519, "epoch": 417} {"train_loss": -5.302524566650391, "global_step": 17520, "epoch": 417} {"train_loss": -5.366026878356934, "global_step": 17521, "epoch": 417} {"train_loss": -5.2591094970703125, "global_step": 17522, "epoch": 417} {"train_loss": -5.253292560577393, "global_step": 17523, "epoch": 417} {"train_loss": -5.323195457458496, "global_step": 17524, "epoch": 417} {"train_loss": -5.2251691818237305, "global_step": 17525, "epoch": 417} {"train_loss": -5.3242340087890625, "global_step": 17526, "epoch": 417} {"train_loss": -5.231515884399414, "global_step": 17527, "epoch": 417} {"train_loss": -5.076382160186768, "global_step": 17528, "epoch": 417} {"train_loss": -5.316580772399902, "global_step": 17529, "epoch": 417} {"train_loss": -5.346236228942871, "global_step": 17530, "epoch": 417} {"train_loss": -5.2425432205200195, "global_step": 17531, "epoch": 417} {"train_loss": -5.230792045593262, "global_step": 17532, "epoch": 417} {"train_loss": -5.321653366088867, "global_step": 17533, "epoch": 417} {"train_loss": -5.293980598449707, "global_step": 17534, "epoch": 417} {"train_loss": -5.361067771911621, "global_step": 17535, "epoch": 417} {"train_loss": -5.191132068634033, "global_step": 17536, "epoch": 417} {"train_loss": -5.191436767578125, "global_step": 17537, "epoch": 417} {"train_loss": -5.363760948181152, "global_step": 17538, "epoch": 417} {"train_loss": -5.264037132263184, "global_step": 17539, "epoch": 417} {"train_loss": -5.237699031829834, "global_step": 17540, "epoch": 417} {"train_loss": -5.256889343261719, "global_step": 17541, "epoch": 417} {"train_loss": -5.2277913093566895, "global_step": 17542, "epoch": 417} {"train_loss": -5.009243011474609, "global_step": 17543, "epoch": 417} {"train_loss": -5.305010795593262, "global_step": 17544, "epoch": 417} {"train_loss": -5.162778377532959, "global_step": 17545, "epoch": 417} {"train_loss": -5.338540077209473, "global_step": 17546, "epoch": 417} {"train_loss": -5.3056230545043945, "global_step": 17547, "epoch": 417} {"train_loss": -5.381598949432373, "global_step": 17548, "epoch": 417} {"train_loss": -5.296774387359619, "global_step": 17549, "epoch": 417} {"train_loss": -5.279440879821777, "global_step": 17550, "epoch": 417} {"train_loss": -5.1682586669921875, "global_step": 17551, "epoch": 417} {"train_loss": -5.269723415374756, "global_step": 17552, "epoch": 417} {"train_loss": -5.2150115966796875, "global_step": 17553, "epoch": 417} {"train_loss": -5.247041702270508, "global_step": 17554, "epoch": 417} {"train_loss": -5.258595943450928, "global_step": 17555, "epoch": 417, "val_loss": 77388.6015625} {"train_loss": -5.15207576751709, "global_step": 17556, "epoch": 418} {"train_loss": -5.377102851867676, "global_step": 17557, "epoch": 418} {"train_loss": -5.3169169425964355, "global_step": 17558, "epoch": 418} {"train_loss": -5.139937877655029, "global_step": 17559, "epoch": 418} {"train_loss": -5.278129577636719, "global_step": 17560, "epoch": 418} {"train_loss": -5.244607925415039, "global_step": 17561, "epoch": 418} {"train_loss": -5.17885684967041, "global_step": 17562, "epoch": 418} {"train_loss": -5.11195182800293, "global_step": 17563, "epoch": 418} {"train_loss": -5.34426212310791, "global_step": 17564, "epoch": 418} {"train_loss": -5.304215431213379, "global_step": 17565, "epoch": 418} {"train_loss": -5.103643894195557, "global_step": 17566, "epoch": 418} {"train_loss": -5.183706283569336, "global_step": 17567, "epoch": 418} {"train_loss": -5.175310134887695, "global_step": 17568, "epoch": 418} {"train_loss": -5.219539642333984, "global_step": 17569, "epoch": 418} {"train_loss": -5.11663818359375, "global_step": 17570, "epoch": 418} {"train_loss": -5.05445671081543, "global_step": 17571, "epoch": 418} {"train_loss": -5.212559223175049, "global_step": 17572, "epoch": 418} {"train_loss": -5.3987932205200195, "global_step": 17573, "epoch": 418} {"train_loss": -5.303427696228027, "global_step": 17574, "epoch": 418} {"train_loss": -5.19044828414917, "global_step": 17575, "epoch": 418} {"train_loss": -5.167899131774902, "global_step": 17576, "epoch": 418} {"train_loss": -5.275020599365234, "global_step": 17577, "epoch": 418} {"train_loss": -5.244977951049805, "global_step": 17578, "epoch": 418} {"train_loss": -5.302701950073242, "global_step": 17579, "epoch": 418} {"train_loss": -5.289484977722168, "global_step": 17580, "epoch": 418} {"train_loss": -5.273920059204102, "global_step": 17581, "epoch": 418} {"train_loss": -5.228338718414307, "global_step": 17582, "epoch": 418} {"train_loss": -5.281742572784424, "global_step": 17583, "epoch": 418} {"train_loss": -5.144476890563965, "global_step": 17584, "epoch": 418} {"train_loss": -5.099679470062256, "global_step": 17585, "epoch": 418} {"train_loss": -5.209921836853027, "global_step": 17586, "epoch": 418} {"train_loss": -5.262856483459473, "global_step": 17587, "epoch": 418} {"train_loss": -5.279397010803223, "global_step": 17588, "epoch": 418} {"train_loss": -5.216012001037598, "global_step": 17589, "epoch": 418} {"train_loss": -5.2111005783081055, "global_step": 17590, "epoch": 418} {"train_loss": -5.111293792724609, "global_step": 17591, "epoch": 418} {"train_loss": -5.266776084899902, "global_step": 17592, "epoch": 418} {"train_loss": -5.170933246612549, "global_step": 17593, "epoch": 418} {"train_loss": -5.054360866546631, "global_step": 17594, "epoch": 418} {"train_loss": -5.317085266113281, "global_step": 17595, "epoch": 418} {"train_loss": -5.168910026550293, "global_step": 17596, "epoch": 418} {"train_loss": -5.224192312785557, "global_step": 17597, "epoch": 418, "val_loss": 77431.2578125} {"train_loss": -5.324939250946045, "global_step": 17598, "epoch": 419} {"train_loss": -5.161012172698975, "global_step": 17599, "epoch": 419} {"train_loss": -5.186647415161133, "global_step": 17600, "epoch": 419} {"train_loss": -5.233182430267334, "global_step": 17601, "epoch": 419} {"train_loss": -5.1630120277404785, "global_step": 17602, "epoch": 419} {"train_loss": -5.223546981811523, "global_step": 17603, "epoch": 419} {"train_loss": -5.176642417907715, "global_step": 17604, "epoch": 419} {"train_loss": -5.223110675811768, "global_step": 17605, "epoch": 419} {"train_loss": -5.256662368774414, "global_step": 17606, "epoch": 419} {"train_loss": -5.2610039710998535, "global_step": 17607, "epoch": 419} {"train_loss": -5.154238700866699, "global_step": 17608, "epoch": 419} {"train_loss": -5.125977039337158, "global_step": 17609, "epoch": 419} {"train_loss": -5.241937160491943, "global_step": 17610, "epoch": 419} {"train_loss": -5.254114151000977, "global_step": 17611, "epoch": 419} {"train_loss": -5.212174415588379, "global_step": 17612, "epoch": 419} {"train_loss": -5.20953369140625, "global_step": 17613, "epoch": 419} {"train_loss": -5.0847320556640625, "global_step": 17614, "epoch": 419} {"train_loss": -5.371614456176758, "global_step": 17615, "epoch": 419} {"train_loss": -5.085424900054932, "global_step": 17616, "epoch": 419} {"train_loss": -5.288601875305176, "global_step": 17617, "epoch": 419} {"train_loss": -5.3668999671936035, "global_step": 17618, "epoch": 419} {"train_loss": -5.142388343811035, "global_step": 17619, "epoch": 419} {"train_loss": -5.167818069458008, "global_step": 17620, "epoch": 419} {"train_loss": -5.152439594268799, "global_step": 17621, "epoch": 419} {"train_loss": -5.0920305252075195, "global_step": 17622, "epoch": 419} {"train_loss": -5.224681377410889, "global_step": 17623, "epoch": 419} {"train_loss": -5.267551422119141, "global_step": 17624, "epoch": 419} {"train_loss": -5.1431779861450195, "global_step": 17625, "epoch": 419} {"train_loss": -5.060327053070068, "global_step": 17626, "epoch": 419} {"train_loss": -5.219132423400879, "global_step": 17627, "epoch": 419} {"train_loss": -5.282826900482178, "global_step": 17628, "epoch": 419} {"train_loss": -5.148441314697266, "global_step": 17629, "epoch": 419} {"train_loss": -5.249024391174316, "global_step": 17630, "epoch": 419} {"train_loss": -5.302666664123535, "global_step": 17631, "epoch": 419} {"train_loss": -5.198781967163086, "global_step": 17632, "epoch": 419} {"train_loss": -5.201178550720215, "global_step": 17633, "epoch": 419} {"train_loss": -5.207622051239014, "global_step": 17634, "epoch": 419} {"train_loss": -5.189791679382324, "global_step": 17635, "epoch": 419} {"train_loss": -5.199129581451416, "global_step": 17636, "epoch": 419} {"train_loss": -5.255481719970703, "global_step": 17637, "epoch": 419} {"train_loss": -5.264467239379883, "global_step": 17638, "epoch": 419} {"train_loss": -5.209476448240734, "global_step": 17639, "epoch": 419, "val_loss": 77209.5703125} {"train_loss": -5.16349458694458, "global_step": 17640, "epoch": 420} {"train_loss": -5.233304023742676, "global_step": 17641, "epoch": 420} {"train_loss": -5.2280073165893555, "global_step": 17642, "epoch": 420} {"train_loss": -5.339753150939941, "global_step": 17643, "epoch": 420} {"train_loss": -5.381130218505859, "global_step": 17644, "epoch": 420} {"train_loss": -5.198816299438477, "global_step": 17645, "epoch": 420} {"train_loss": -5.168847560882568, "global_step": 17646, "epoch": 420} {"train_loss": -5.120744705200195, "global_step": 17647, "epoch": 420} {"train_loss": -5.197146892547607, "global_step": 17648, "epoch": 420} {"train_loss": -5.274138450622559, "global_step": 17649, "epoch": 420} {"train_loss": -5.244017124176025, "global_step": 17650, "epoch": 420} {"train_loss": -5.212158679962158, "global_step": 17651, "epoch": 420} {"train_loss": -5.467929840087891, "global_step": 17652, "epoch": 420} {"train_loss": -5.40237283706665, "global_step": 17653, "epoch": 420} {"train_loss": -5.178442478179932, "global_step": 17654, "epoch": 420} {"train_loss": -5.2551679611206055, "global_step": 17655, "epoch": 420} {"train_loss": -5.241151809692383, "global_step": 17656, "epoch": 420} {"train_loss": -5.308516025543213, "global_step": 17657, "epoch": 420} {"train_loss": -5.294704437255859, "global_step": 17658, "epoch": 420} {"train_loss": -5.0568366050720215, "global_step": 17659, "epoch": 420} {"train_loss": -5.145224571228027, "global_step": 17660, "epoch": 420} {"train_loss": -5.436464309692383, "global_step": 17661, "epoch": 420} {"train_loss": -5.2378740310668945, "global_step": 17662, "epoch": 420} {"train_loss": -5.18363094329834, "global_step": 17663, "epoch": 420} {"train_loss": -5.250997066497803, "global_step": 17664, "epoch": 420} {"train_loss": -5.138370990753174, "global_step": 17665, "epoch": 420} {"train_loss": -5.273704528808594, "global_step": 17666, "epoch": 420} {"train_loss": -5.259635925292969, "global_step": 17667, "epoch": 420} {"train_loss": -5.156211853027344, "global_step": 17668, "epoch": 420} {"train_loss": -5.207298278808594, "global_step": 17669, "epoch": 420} {"train_loss": -5.261405944824219, "global_step": 17670, "epoch": 420} {"train_loss": -5.102771759033203, "global_step": 17671, "epoch": 420} {"train_loss": -5.176973342895508, "global_step": 17672, "epoch": 420} {"train_loss": -5.0694708824157715, "global_step": 17673, "epoch": 420} {"train_loss": -5.162712097167969, "global_step": 17674, "epoch": 420} {"train_loss": -5.346200942993164, "global_step": 17675, "epoch": 420} {"train_loss": -5.175677299499512, "global_step": 17676, "epoch": 420} {"train_loss": -5.341792106628418, "global_step": 17677, "epoch": 420} {"train_loss": -5.23742151260376, "global_step": 17678, "epoch": 420} {"train_loss": -5.213796615600586, "global_step": 17679, "epoch": 420} {"train_loss": -5.327507495880127, "global_step": 17680, "epoch": 420} {"train_loss": -5.2327843734196255, "global_step": 17681, "epoch": 420, "val_loss": 78169.953125} {"train_loss": -5.07078218460083, "global_step": 17682, "epoch": 421} {"train_loss": -5.252664566040039, "global_step": 17683, "epoch": 421} {"train_loss": -5.182369232177734, "global_step": 17684, "epoch": 421} {"train_loss": -5.3383917808532715, "global_step": 17685, "epoch": 421} {"train_loss": -5.238320827484131, "global_step": 17686, "epoch": 421} {"train_loss": -5.164689064025879, "global_step": 17687, "epoch": 421} {"train_loss": -5.199052810668945, "global_step": 17688, "epoch": 421} {"train_loss": -5.178311824798584, "global_step": 17689, "epoch": 421} {"train_loss": -5.2020087242126465, "global_step": 17690, "epoch": 421} {"train_loss": -5.335380554199219, "global_step": 17691, "epoch": 421} {"train_loss": -5.14755392074585, "global_step": 17692, "epoch": 421} {"train_loss": -5.125212669372559, "global_step": 17693, "epoch": 421} {"train_loss": -5.160517692565918, "global_step": 17694, "epoch": 421} {"train_loss": -5.116707801818848, "global_step": 17695, "epoch": 421} {"train_loss": -5.188601493835449, "global_step": 17696, "epoch": 421} {"train_loss": -5.163546562194824, "global_step": 17697, "epoch": 421} {"train_loss": -5.174108505249023, "global_step": 17698, "epoch": 421} {"train_loss": -5.148434162139893, "global_step": 17699, "epoch": 421} {"train_loss": -5.130790710449219, "global_step": 17700, "epoch": 421} {"train_loss": -5.267884254455566, "global_step": 17701, "epoch": 421} {"train_loss": -5.168967247009277, "global_step": 17702, "epoch": 421} {"train_loss": -5.314566612243652, "global_step": 17703, "epoch": 421} {"train_loss": -5.305278778076172, "global_step": 17704, "epoch": 421} {"train_loss": -5.3951520919799805, "global_step": 17705, "epoch": 421} {"train_loss": -5.285802841186523, "global_step": 17706, "epoch": 421} {"train_loss": -5.301090240478516, "global_step": 17707, "epoch": 421} {"train_loss": -5.277868747711182, "global_step": 17708, "epoch": 421} {"train_loss": -5.216855525970459, "global_step": 17709, "epoch": 421} {"train_loss": -5.289585590362549, "global_step": 17710, "epoch": 421} {"train_loss": -5.155558109283447, "global_step": 17711, "epoch": 421} {"train_loss": -5.306909561157227, "global_step": 17712, "epoch": 421} {"train_loss": -5.297740936279297, "global_step": 17713, "epoch": 421} {"train_loss": -5.284345626831055, "global_step": 17714, "epoch": 421} {"train_loss": -5.196539878845215, "global_step": 17715, "epoch": 421} {"train_loss": -5.372332572937012, "global_step": 17716, "epoch": 421} {"train_loss": -5.261239051818848, "global_step": 17717, "epoch": 421} {"train_loss": -5.284784317016602, "global_step": 17718, "epoch": 421} {"train_loss": -5.404175758361816, "global_step": 17719, "epoch": 421} {"train_loss": -5.258756637573242, "global_step": 17720, "epoch": 421} {"train_loss": -5.19819450378418, "global_step": 17721, "epoch": 421} {"train_loss": -5.221989154815674, "global_step": 17722, "epoch": 421} {"train_loss": -5.23408968108041, "global_step": 17723, "epoch": 421, "val_loss": 77831.7578125} {"train_loss": -5.326248645782471, "global_step": 17724, "epoch": 422} {"train_loss": -5.257621765136719, "global_step": 17725, "epoch": 422} {"train_loss": -5.112556457519531, "global_step": 17726, "epoch": 422} {"train_loss": -5.272016525268555, "global_step": 17727, "epoch": 422} {"train_loss": -5.252072334289551, "global_step": 17728, "epoch": 422} {"train_loss": -5.0557661056518555, "global_step": 17729, "epoch": 422} {"train_loss": -5.279175281524658, "global_step": 17730, "epoch": 422} {"train_loss": -5.193343162536621, "global_step": 17731, "epoch": 422} {"train_loss": -5.181294918060303, "global_step": 17732, "epoch": 422} {"train_loss": -5.153861045837402, "global_step": 17733, "epoch": 422} {"train_loss": -5.2769293785095215, "global_step": 17734, "epoch": 422} {"train_loss": -5.250779628753662, "global_step": 17735, "epoch": 422} {"train_loss": -5.276336669921875, "global_step": 17736, "epoch": 422} {"train_loss": -5.034431457519531, "global_step": 17737, "epoch": 422} {"train_loss": -5.17378568649292, "global_step": 17738, "epoch": 422} {"train_loss": -5.282684326171875, "global_step": 17739, "epoch": 422} {"train_loss": -5.221117973327637, "global_step": 17740, "epoch": 422} {"train_loss": -5.096254348754883, "global_step": 17741, "epoch": 422} {"train_loss": -5.145669937133789, "global_step": 17742, "epoch": 422} {"train_loss": -5.289700508117676, "global_step": 17743, "epoch": 422} {"train_loss": -5.227565765380859, "global_step": 17744, "epoch": 422} {"train_loss": -5.252111434936523, "global_step": 17745, "epoch": 422} {"train_loss": -5.34405517578125, "global_step": 17746, "epoch": 422} {"train_loss": -5.1469268798828125, "global_step": 17747, "epoch": 422} {"train_loss": -5.108280181884766, "global_step": 17748, "epoch": 422} {"train_loss": -5.245078086853027, "global_step": 17749, "epoch": 422} {"train_loss": -5.29726505279541, "global_step": 17750, "epoch": 422} {"train_loss": -5.208663463592529, "global_step": 17751, "epoch": 422} {"train_loss": -5.235970497131348, "global_step": 17752, "epoch": 422} {"train_loss": -5.189489364624023, "global_step": 17753, "epoch": 422} {"train_loss": -5.447204113006592, "global_step": 17754, "epoch": 422} {"train_loss": -5.301519393920898, "global_step": 17755, "epoch": 422} {"train_loss": -5.117159366607666, "global_step": 17756, "epoch": 422} {"train_loss": -5.223027229309082, "global_step": 17757, "epoch": 422} {"train_loss": -5.237874984741211, "global_step": 17758, "epoch": 422} {"train_loss": -5.28449821472168, "global_step": 17759, "epoch": 422} {"train_loss": -5.2166266441345215, "global_step": 17760, "epoch": 422} {"train_loss": -5.3397979736328125, "global_step": 17761, "epoch": 422} {"train_loss": -5.159708023071289, "global_step": 17762, "epoch": 422} {"train_loss": -5.1136860847473145, "global_step": 17763, "epoch": 422} {"train_loss": -5.332765102386475, "global_step": 17764, "epoch": 422} {"train_loss": -5.228412174043202, "global_step": 17765, "epoch": 422, "val_loss": 77846.4609375} {"train_loss": -5.2965545654296875, "global_step": 17766, "epoch": 423} {"train_loss": -5.136192798614502, "global_step": 17767, "epoch": 423} {"train_loss": -5.205369472503662, "global_step": 17768, "epoch": 423} {"train_loss": -5.23010778427124, "global_step": 17769, "epoch": 423} {"train_loss": -5.267027854919434, "global_step": 17770, "epoch": 423} {"train_loss": -5.283452033996582, "global_step": 17771, "epoch": 423} {"train_loss": -5.245851039886475, "global_step": 17772, "epoch": 423} {"train_loss": -5.160366058349609, "global_step": 17773, "epoch": 423} {"train_loss": -5.496921062469482, "global_step": 17774, "epoch": 423} {"train_loss": -5.1563262939453125, "global_step": 17775, "epoch": 423} {"train_loss": -5.0662689208984375, "global_step": 17776, "epoch": 423} {"train_loss": -5.384382724761963, "global_step": 17777, "epoch": 423} {"train_loss": -5.217554092407227, "global_step": 17778, "epoch": 423} {"train_loss": -5.246012210845947, "global_step": 17779, "epoch": 423} {"train_loss": -5.311503887176514, "global_step": 17780, "epoch": 423} {"train_loss": -5.50666618347168, "global_step": 17781, "epoch": 423} {"train_loss": -5.299427509307861, "global_step": 17782, "epoch": 423} {"train_loss": -5.255649566650391, "global_step": 17783, "epoch": 423} {"train_loss": -5.259387016296387, "global_step": 17784, "epoch": 423} {"train_loss": -5.2546772956848145, "global_step": 17785, "epoch": 423} {"train_loss": -5.319729804992676, "global_step": 17786, "epoch": 423} {"train_loss": -5.19299840927124, "global_step": 17787, "epoch": 423} {"train_loss": -5.187069892883301, "global_step": 17788, "epoch": 423} {"train_loss": -5.239415168762207, "global_step": 17789, "epoch": 423} {"train_loss": -5.269257545471191, "global_step": 17790, "epoch": 423} {"train_loss": -5.216239929199219, "global_step": 17791, "epoch": 423} {"train_loss": -5.164900779724121, "global_step": 17792, "epoch": 423} {"train_loss": -5.155806541442871, "global_step": 17793, "epoch": 423} {"train_loss": -5.2488603591918945, "global_step": 17794, "epoch": 423} {"train_loss": -5.2226972579956055, "global_step": 17795, "epoch": 423} {"train_loss": -5.158020496368408, "global_step": 17796, "epoch": 423} {"train_loss": -5.436138153076172, "global_step": 17797, "epoch": 423} {"train_loss": -5.07586669921875, "global_step": 17798, "epoch": 423} {"train_loss": -5.2726850509643555, "global_step": 17799, "epoch": 423} {"train_loss": -5.334431171417236, "global_step": 17800, "epoch": 423} {"train_loss": -5.038468360900879, "global_step": 17801, "epoch": 423} {"train_loss": -5.250674724578857, "global_step": 17802, "epoch": 423} {"train_loss": -5.170344352722168, "global_step": 17803, "epoch": 423} {"train_loss": -5.117128372192383, "global_step": 17804, "epoch": 423} {"train_loss": -5.346125602722168, "global_step": 17805, "epoch": 423} {"train_loss": -5.115961074829102, "global_step": 17806, "epoch": 423} {"train_loss": -5.237600360597883, "global_step": 17807, "epoch": 423, "val_loss": 79504.0859375} {"train_loss": -5.1750946044921875, "global_step": 17808, "epoch": 424} {"train_loss": -5.186810493469238, "global_step": 17809, "epoch": 424} {"train_loss": -5.18251371383667, "global_step": 17810, "epoch": 424} {"train_loss": -5.001712799072266, "global_step": 17811, "epoch": 424} {"train_loss": -5.272359371185303, "global_step": 17812, "epoch": 424} {"train_loss": -5.125386714935303, "global_step": 17813, "epoch": 424} {"train_loss": -5.270126819610596, "global_step": 17814, "epoch": 424} {"train_loss": -5.252636909484863, "global_step": 17815, "epoch": 424} {"train_loss": -5.061043739318848, "global_step": 17816, "epoch": 424} {"train_loss": -5.231017112731934, "global_step": 17817, "epoch": 424} {"train_loss": -5.208343029022217, "global_step": 17818, "epoch": 424} {"train_loss": -5.154102325439453, "global_step": 17819, "epoch": 424} {"train_loss": -5.08531379699707, "global_step": 17820, "epoch": 424} {"train_loss": -5.350281715393066, "global_step": 17821, "epoch": 424} {"train_loss": -5.089848041534424, "global_step": 17822, "epoch": 424} {"train_loss": -5.261557102203369, "global_step": 17823, "epoch": 424} {"train_loss": -5.224620819091797, "global_step": 17824, "epoch": 424} {"train_loss": -5.2660017013549805, "global_step": 17825, "epoch": 424} {"train_loss": -5.304344177246094, "global_step": 17826, "epoch": 424} {"train_loss": -5.169027328491211, "global_step": 17827, "epoch": 424} {"train_loss": -5.2646942138671875, "global_step": 17828, "epoch": 424} {"train_loss": -5.271770477294922, "global_step": 17829, "epoch": 424} {"train_loss": -5.225440502166748, "global_step": 17830, "epoch": 424} {"train_loss": -5.323639869689941, "global_step": 17831, "epoch": 424} {"train_loss": -5.207921981811523, "global_step": 17832, "epoch": 424} {"train_loss": -5.195085525512695, "global_step": 17833, "epoch": 424} {"train_loss": -5.336294651031494, "global_step": 17834, "epoch": 424} {"train_loss": -5.324594497680664, "global_step": 17835, "epoch": 424} {"train_loss": -5.283949375152588, "global_step": 17836, "epoch": 424} {"train_loss": -5.260875701904297, "global_step": 17837, "epoch": 424} {"train_loss": -5.09854793548584, "global_step": 17838, "epoch": 424} {"train_loss": -5.336764335632324, "global_step": 17839, "epoch": 424} {"train_loss": -5.3291215896606445, "global_step": 17840, "epoch": 424} {"train_loss": -5.304531097412109, "global_step": 17841, "epoch": 424} {"train_loss": -5.24554967880249, "global_step": 17842, "epoch": 424} {"train_loss": -5.2422099113464355, "global_step": 17843, "epoch": 424} {"train_loss": -5.1880693435668945, "global_step": 17844, "epoch": 424} {"train_loss": -5.200498580932617, "global_step": 17845, "epoch": 424} {"train_loss": -5.292880535125732, "global_step": 17846, "epoch": 424} {"train_loss": -5.226482391357422, "global_step": 17847, "epoch": 424} {"train_loss": -5.221015930175781, "global_step": 17848, "epoch": 424} {"train_loss": -5.223545187995548, "global_step": 17849, "epoch": 424, "val_loss": 77885.4453125} {"train_loss": -5.065052509307861, "global_step": 17850, "epoch": 425} {"train_loss": -5.35699462890625, "global_step": 17851, "epoch": 425} {"train_loss": -5.274072647094727, "global_step": 17852, "epoch": 425} {"train_loss": -5.304682731628418, "global_step": 17853, "epoch": 425} {"train_loss": -5.253530025482178, "global_step": 17854, "epoch": 425} {"train_loss": -5.184988975524902, "global_step": 17855, "epoch": 425} {"train_loss": -5.319890022277832, "global_step": 17856, "epoch": 425} {"train_loss": -5.182344913482666, "global_step": 17857, "epoch": 425} {"train_loss": -5.345478534698486, "global_step": 17858, "epoch": 425} {"train_loss": -5.239658832550049, "global_step": 17859, "epoch": 425} {"train_loss": -5.362017631530762, "global_step": 17860, "epoch": 425} {"train_loss": -5.183701515197754, "global_step": 17861, "epoch": 425} {"train_loss": -5.216538429260254, "global_step": 17862, "epoch": 425} {"train_loss": -5.226581573486328, "global_step": 17863, "epoch": 425} {"train_loss": -5.188516616821289, "global_step": 17864, "epoch": 425} {"train_loss": -5.417323112487793, "global_step": 17865, "epoch": 425} {"train_loss": -5.02780818939209, "global_step": 17866, "epoch": 425} {"train_loss": -5.054173469543457, "global_step": 17867, "epoch": 425} {"train_loss": -5.349031448364258, "global_step": 17868, "epoch": 425} {"train_loss": -5.1258416175842285, "global_step": 17869, "epoch": 425} {"train_loss": -5.170770645141602, "global_step": 17870, "epoch": 425} {"train_loss": -5.2549920082092285, "global_step": 17871, "epoch": 425} {"train_loss": -5.014308929443359, "global_step": 17872, "epoch": 425} {"train_loss": -5.236666679382324, "global_step": 17873, "epoch": 425} {"train_loss": -5.267355442047119, "global_step": 17874, "epoch": 425} {"train_loss": -5.388566017150879, "global_step": 17875, "epoch": 425} {"train_loss": -5.161299228668213, "global_step": 17876, "epoch": 425} {"train_loss": -5.363855361938477, "global_step": 17877, "epoch": 425} {"train_loss": -4.940145492553711, "global_step": 17878, "epoch": 425} {"train_loss": -5.037201881408691, "global_step": 17879, "epoch": 425} {"train_loss": -5.327667713165283, "global_step": 17880, "epoch": 425} {"train_loss": -5.059966087341309, "global_step": 17881, "epoch": 425} {"train_loss": -5.24653959274292, "global_step": 17882, "epoch": 425} {"train_loss": -5.271851062774658, "global_step": 17883, "epoch": 425} {"train_loss": -5.364294528961182, "global_step": 17884, "epoch": 425} {"train_loss": -5.258214473724365, "global_step": 17885, "epoch": 425} {"train_loss": -5.376551628112793, "global_step": 17886, "epoch": 425} {"train_loss": -5.150662422180176, "global_step": 17887, "epoch": 425} {"train_loss": -5.295952796936035, "global_step": 17888, "epoch": 425} {"train_loss": -5.30872917175293, "global_step": 17889, "epoch": 425} {"train_loss": -5.41273307800293, "global_step": 17890, "epoch": 425} {"train_loss": -5.2321163813273115, "global_step": 17891, "epoch": 425, "val_loss": 77435.9921875} {"train_loss": -5.277279853820801, "global_step": 17892, "epoch": 426} {"train_loss": -5.164563179016113, "global_step": 17893, "epoch": 426} {"train_loss": -5.223186492919922, "global_step": 17894, "epoch": 426} {"train_loss": -5.212654113769531, "global_step": 17895, "epoch": 426} {"train_loss": -5.2767839431762695, "global_step": 17896, "epoch": 426} {"train_loss": -5.371412754058838, "global_step": 17897, "epoch": 426} {"train_loss": -5.123457908630371, "global_step": 17898, "epoch": 426} {"train_loss": -5.296644687652588, "global_step": 17899, "epoch": 426} {"train_loss": -5.185334205627441, "global_step": 17900, "epoch": 426} {"train_loss": -5.214340686798096, "global_step": 17901, "epoch": 426} {"train_loss": -5.2808332443237305, "global_step": 17902, "epoch": 426} {"train_loss": -5.326409339904785, "global_step": 17903, "epoch": 426} {"train_loss": -5.27981424331665, "global_step": 17904, "epoch": 426} {"train_loss": -5.200937747955322, "global_step": 17905, "epoch": 426} {"train_loss": -5.162562847137451, "global_step": 17906, "epoch": 426} {"train_loss": -5.282353401184082, "global_step": 17907, "epoch": 426} {"train_loss": -5.21623420715332, "global_step": 17908, "epoch": 426} {"train_loss": -5.288544178009033, "global_step": 17909, "epoch": 426} {"train_loss": -5.239740371704102, "global_step": 17910, "epoch": 426} {"train_loss": -5.3486480712890625, "global_step": 17911, "epoch": 426} {"train_loss": -5.259965896606445, "global_step": 17912, "epoch": 426} {"train_loss": -5.417960166931152, "global_step": 17913, "epoch": 426} {"train_loss": -5.255697727203369, "global_step": 17914, "epoch": 426} {"train_loss": -5.209621429443359, "global_step": 17915, "epoch": 426} {"train_loss": -5.249698638916016, "global_step": 17916, "epoch": 426} {"train_loss": -5.34565544128418, "global_step": 17917, "epoch": 426} {"train_loss": -5.327516078948975, "global_step": 17918, "epoch": 426} {"train_loss": -5.189847946166992, "global_step": 17919, "epoch": 426} {"train_loss": -5.151630878448486, "global_step": 17920, "epoch": 426} {"train_loss": -5.198863506317139, "global_step": 17921, "epoch": 426} {"train_loss": -5.182929992675781, "global_step": 17922, "epoch": 426} {"train_loss": -5.18181037902832, "global_step": 17923, "epoch": 426} {"train_loss": -5.368874549865723, "global_step": 17924, "epoch": 426} {"train_loss": -5.21783447265625, "global_step": 17925, "epoch": 426} {"train_loss": -5.141465187072754, "global_step": 17926, "epoch": 426} {"train_loss": -5.333863735198975, "global_step": 17927, "epoch": 426} {"train_loss": -5.178421974182129, "global_step": 17928, "epoch": 426} {"train_loss": -5.114483833312988, "global_step": 17929, "epoch": 426} {"train_loss": -5.15983772277832, "global_step": 17930, "epoch": 426} {"train_loss": -5.21138858795166, "global_step": 17931, "epoch": 426} {"train_loss": -5.2140374183654785, "global_step": 17932, "epoch": 426} {"train_loss": -5.23830441066197, "global_step": 17933, "epoch": 426, "val_loss": 77284.671875} {"train_loss": -5.195340156555176, "global_step": 17934, "epoch": 427} {"train_loss": -5.19096040725708, "global_step": 17935, "epoch": 427} {"train_loss": -5.320632457733154, "global_step": 17936, "epoch": 427} {"train_loss": -5.4010701179504395, "global_step": 17937, "epoch": 427} {"train_loss": -5.125962257385254, "global_step": 17938, "epoch": 427} {"train_loss": -5.329183578491211, "global_step": 17939, "epoch": 427} {"train_loss": -5.178520202636719, "global_step": 17940, "epoch": 427} {"train_loss": -5.269311428070068, "global_step": 17941, "epoch": 427} {"train_loss": -5.267733573913574, "global_step": 17942, "epoch": 427} {"train_loss": -5.264461517333984, "global_step": 17943, "epoch": 427} {"train_loss": -5.20458984375, "global_step": 17944, "epoch": 427} {"train_loss": -5.262576103210449, "global_step": 17945, "epoch": 427} {"train_loss": -5.244892120361328, "global_step": 17946, "epoch": 427} {"train_loss": -5.164020538330078, "global_step": 17947, "epoch": 427} {"train_loss": -5.272251605987549, "global_step": 17948, "epoch": 427} {"train_loss": -5.274960517883301, "global_step": 17949, "epoch": 427} {"train_loss": -5.27071475982666, "global_step": 17950, "epoch": 427} {"train_loss": -5.4477691650390625, "global_step": 17951, "epoch": 427} {"train_loss": -5.254234313964844, "global_step": 17952, "epoch": 427} {"train_loss": -5.224445343017578, "global_step": 17953, "epoch": 427} {"train_loss": -5.337241172790527, "global_step": 17954, "epoch": 427} {"train_loss": -5.136317253112793, "global_step": 17955, "epoch": 427} {"train_loss": -5.302186965942383, "global_step": 17956, "epoch": 427} {"train_loss": -5.113880157470703, "global_step": 17957, "epoch": 427} {"train_loss": -5.222649574279785, "global_step": 17958, "epoch": 427} {"train_loss": -5.211013317108154, "global_step": 17959, "epoch": 427} {"train_loss": -5.212743759155273, "global_step": 17960, "epoch": 427} {"train_loss": -5.2748823165893555, "global_step": 17961, "epoch": 427} {"train_loss": -5.139455795288086, "global_step": 17962, "epoch": 427} {"train_loss": -5.1440534591674805, "global_step": 17963, "epoch": 427} {"train_loss": -5.217069149017334, "global_step": 17964, "epoch": 427} {"train_loss": -5.15024471282959, "global_step": 17965, "epoch": 427} {"train_loss": -5.262627601623535, "global_step": 17966, "epoch": 427} {"train_loss": -5.297769069671631, "global_step": 17967, "epoch": 427} {"train_loss": -5.14497709274292, "global_step": 17968, "epoch": 427} {"train_loss": -5.164057731628418, "global_step": 17969, "epoch": 427} {"train_loss": -5.247341632843018, "global_step": 17970, "epoch": 427} {"train_loss": -5.32918643951416, "global_step": 17971, "epoch": 427} {"train_loss": -5.289216041564941, "global_step": 17972, "epoch": 427} {"train_loss": -5.341409683227539, "global_step": 17973, "epoch": 427} {"train_loss": -5.311656951904297, "global_step": 17974, "epoch": 427} {"train_loss": -5.242530890873501, "global_step": 17975, "epoch": 427, "val_loss": 77198.5390625} {"train_loss": -5.252530097961426, "global_step": 17976, "epoch": 428} {"train_loss": -5.331155776977539, "global_step": 17977, "epoch": 428} {"train_loss": -5.392487525939941, "global_step": 17978, "epoch": 428} {"train_loss": -5.31892728805542, "global_step": 17979, "epoch": 428} {"train_loss": -5.436474323272705, "global_step": 17980, "epoch": 428} {"train_loss": -5.2857513427734375, "global_step": 17981, "epoch": 428} {"train_loss": -5.251378059387207, "global_step": 17982, "epoch": 428} {"train_loss": -5.345233917236328, "global_step": 17983, "epoch": 428} {"train_loss": -5.221715450286865, "global_step": 17984, "epoch": 428} {"train_loss": -5.336864948272705, "global_step": 17985, "epoch": 428} {"train_loss": -5.289059638977051, "global_step": 17986, "epoch": 428} {"train_loss": -5.182457447052002, "global_step": 17987, "epoch": 428} {"train_loss": -5.1090192794799805, "global_step": 17988, "epoch": 428} {"train_loss": -5.351822853088379, "global_step": 17989, "epoch": 428} {"train_loss": -5.075462818145752, "global_step": 17990, "epoch": 428} {"train_loss": -5.176923751831055, "global_step": 17991, "epoch": 428} {"train_loss": -5.169798374176025, "global_step": 17992, "epoch": 428} {"train_loss": -5.145668983459473, "global_step": 17993, "epoch": 428} {"train_loss": -5.256538391113281, "global_step": 17994, "epoch": 428} {"train_loss": -5.1474409103393555, "global_step": 17995, "epoch": 428} {"train_loss": -5.345227241516113, "global_step": 17996, "epoch": 428} {"train_loss": -5.132155418395996, "global_step": 17997, "epoch": 428} {"train_loss": -5.189828395843506, "global_step": 17998, "epoch": 428} {"train_loss": -5.219389915466309, "global_step": 17999, "epoch": 428} {"train_loss": -5.261051654815674, "global_step": 18000, "epoch": 428} {"train_loss": -5.110467433929443, "global_step": 18001, "epoch": 428} {"train_loss": -5.090561389923096, "global_step": 18002, "epoch": 428} {"train_loss": -5.2417988777160645, "global_step": 18003, "epoch": 428} {"train_loss": -5.275337219238281, "global_step": 18004, "epoch": 428} {"train_loss": -5.212881088256836, "global_step": 18005, "epoch": 428} {"train_loss": -5.245974540710449, "global_step": 18006, "epoch": 428} {"train_loss": -5.183732032775879, "global_step": 18007, "epoch": 428} {"train_loss": -5.226222991943359, "global_step": 18008, "epoch": 428} {"train_loss": -5.188119888305664, "global_step": 18009, "epoch": 428} {"train_loss": -5.2086567878723145, "global_step": 18010, "epoch": 428} {"train_loss": -5.308944225311279, "global_step": 18011, "epoch": 428} {"train_loss": -5.158407211303711, "global_step": 18012, "epoch": 428} {"train_loss": -5.203771114349365, "global_step": 18013, "epoch": 428} {"train_loss": -5.197044849395752, "global_step": 18014, "epoch": 428} {"train_loss": -5.069624900817871, "global_step": 18015, "epoch": 428} {"train_loss": -5.288851737976074, "global_step": 18016, "epoch": 428} {"train_loss": -5.230486404328119, "global_step": 18017, "epoch": 428, "val_loss": 78491.1171875} {"train_loss": -5.099474906921387, "global_step": 18018, "epoch": 429} {"train_loss": -5.281821250915527, "global_step": 18019, "epoch": 429} {"train_loss": -5.261023044586182, "global_step": 18020, "epoch": 429} {"train_loss": -5.274865627288818, "global_step": 18021, "epoch": 429} {"train_loss": -5.247694492340088, "global_step": 18022, "epoch": 429} {"train_loss": -5.230644702911377, "global_step": 18023, "epoch": 429} {"train_loss": -5.182756423950195, "global_step": 18024, "epoch": 429} {"train_loss": -5.363461494445801, "global_step": 18025, "epoch": 429} {"train_loss": -5.144202709197998, "global_step": 18026, "epoch": 429} {"train_loss": -5.183018684387207, "global_step": 18027, "epoch": 429} {"train_loss": -5.235196113586426, "global_step": 18028, "epoch": 429} {"train_loss": -5.322614669799805, "global_step": 18029, "epoch": 429} {"train_loss": -5.134627342224121, "global_step": 18030, "epoch": 429} {"train_loss": -5.4636054039001465, "global_step": 18031, "epoch": 429} {"train_loss": -5.266847610473633, "global_step": 18032, "epoch": 429} {"train_loss": -5.251610279083252, "global_step": 18033, "epoch": 429} {"train_loss": -5.213423252105713, "global_step": 18034, "epoch": 429} {"train_loss": -5.209250450134277, "global_step": 18035, "epoch": 429} {"train_loss": -5.107170104980469, "global_step": 18036, "epoch": 429} {"train_loss": -5.234317779541016, "global_step": 18037, "epoch": 429} {"train_loss": -5.205078601837158, "global_step": 18038, "epoch": 429} {"train_loss": -5.197030067443848, "global_step": 18039, "epoch": 429} {"train_loss": -5.201091766357422, "global_step": 18040, "epoch": 429} {"train_loss": -5.130324363708496, "global_step": 18041, "epoch": 429} {"train_loss": -5.123342037200928, "global_step": 18042, "epoch": 429} {"train_loss": -5.275252819061279, "global_step": 18043, "epoch": 429} {"train_loss": -5.187424659729004, "global_step": 18044, "epoch": 429} {"train_loss": -5.103227615356445, "global_step": 18045, "epoch": 429} {"train_loss": -5.0973663330078125, "global_step": 18046, "epoch": 429} {"train_loss": -5.305118560791016, "global_step": 18047, "epoch": 429} {"train_loss": -5.103451728820801, "global_step": 18048, "epoch": 429} {"train_loss": -5.076839447021484, "global_step": 18049, "epoch": 429} {"train_loss": -5.131241798400879, "global_step": 18050, "epoch": 429} {"train_loss": -5.221061706542969, "global_step": 18051, "epoch": 429} {"train_loss": -5.255793571472168, "global_step": 18052, "epoch": 429} {"train_loss": -5.258336067199707, "global_step": 18053, "epoch": 429} {"train_loss": -5.198995590209961, "global_step": 18054, "epoch": 429} {"train_loss": -5.155081748962402, "global_step": 18055, "epoch": 429} {"train_loss": -5.328253746032715, "global_step": 18056, "epoch": 429} {"train_loss": -5.2502617835998535, "global_step": 18057, "epoch": 429} {"train_loss": -5.214158058166504, "global_step": 18058, "epoch": 429} {"train_loss": -5.212258145922706, "global_step": 18059, "epoch": 429, "val_loss": 77787.09375} {"train_loss": -5.280642509460449, "global_step": 18060, "epoch": 430} {"train_loss": -5.299022197723389, "global_step": 18061, "epoch": 430} {"train_loss": -5.197127819061279, "global_step": 18062, "epoch": 430} {"train_loss": -5.2013139724731445, "global_step": 18063, "epoch": 430} {"train_loss": -5.291027069091797, "global_step": 18064, "epoch": 430} {"train_loss": -5.143329620361328, "global_step": 18065, "epoch": 430} {"train_loss": -5.218261241912842, "global_step": 18066, "epoch": 430} {"train_loss": -5.241253852844238, "global_step": 18067, "epoch": 430} {"train_loss": -5.350125312805176, "global_step": 18068, "epoch": 430} {"train_loss": -5.227630615234375, "global_step": 18069, "epoch": 430} {"train_loss": -5.185376167297363, "global_step": 18070, "epoch": 430} {"train_loss": -5.20650577545166, "global_step": 18071, "epoch": 430} {"train_loss": -5.307048797607422, "global_step": 18072, "epoch": 430} {"train_loss": -5.279640197753906, "global_step": 18073, "epoch": 430} {"train_loss": -5.205950736999512, "global_step": 18074, "epoch": 430} {"train_loss": -5.284336090087891, "global_step": 18075, "epoch": 430} {"train_loss": -5.325366020202637, "global_step": 18076, "epoch": 430} {"train_loss": -5.224788188934326, "global_step": 18077, "epoch": 430} {"train_loss": -5.237767696380615, "global_step": 18078, "epoch": 430} {"train_loss": -5.196201801300049, "global_step": 18079, "epoch": 430} {"train_loss": -5.208719730377197, "global_step": 18080, "epoch": 430} {"train_loss": -5.187021255493164, "global_step": 18081, "epoch": 430} {"train_loss": -5.2790045738220215, "global_step": 18082, "epoch": 430} {"train_loss": -5.224847793579102, "global_step": 18083, "epoch": 430} {"train_loss": -5.276651382446289, "global_step": 18084, "epoch": 430} {"train_loss": -5.257737159729004, "global_step": 18085, "epoch": 430} {"train_loss": -5.407562255859375, "global_step": 18086, "epoch": 430} {"train_loss": -5.362724304199219, "global_step": 18087, "epoch": 430} {"train_loss": -5.235782623291016, "global_step": 18088, "epoch": 430} {"train_loss": -5.262211799621582, "global_step": 18089, "epoch": 430} {"train_loss": -5.21337366104126, "global_step": 18090, "epoch": 430} {"train_loss": -5.403263092041016, "global_step": 18091, "epoch": 430} {"train_loss": -5.220680236816406, "global_step": 18092, "epoch": 430} {"train_loss": -5.254117965698242, "global_step": 18093, "epoch": 430} {"train_loss": -5.17186164855957, "global_step": 18094, "epoch": 430} {"train_loss": -5.220666408538818, "global_step": 18095, "epoch": 430} {"train_loss": -5.4067230224609375, "global_step": 18096, "epoch": 430} {"train_loss": -5.065591812133789, "global_step": 18097, "epoch": 430} {"train_loss": -5.188652038574219, "global_step": 18098, "epoch": 430} {"train_loss": -5.235193252563477, "global_step": 18099, "epoch": 430} {"train_loss": -5.284170150756836, "global_step": 18100, "epoch": 430} {"train_loss": -5.248068468911307, "global_step": 18101, "epoch": 430, "val_loss": 77506.53125} {"train_loss": -5.019268989562988, "global_step": 18102, "epoch": 431} {"train_loss": -5.256796836853027, "global_step": 18103, "epoch": 431} {"train_loss": -5.242596626281738, "global_step": 18104, "epoch": 431} {"train_loss": -5.292994499206543, "global_step": 18105, "epoch": 431} {"train_loss": -5.261582374572754, "global_step": 18106, "epoch": 431} {"train_loss": -5.285135269165039, "global_step": 18107, "epoch": 431} {"train_loss": -5.327395439147949, "global_step": 18108, "epoch": 431} {"train_loss": -5.197978496551514, "global_step": 18109, "epoch": 431} {"train_loss": -5.259720802307129, "global_step": 18110, "epoch": 431} {"train_loss": -5.310032844543457, "global_step": 18111, "epoch": 431} {"train_loss": -5.1300458908081055, "global_step": 18112, "epoch": 431} {"train_loss": -5.325868606567383, "global_step": 18113, "epoch": 431} {"train_loss": -5.408473014831543, "global_step": 18114, "epoch": 431} {"train_loss": -5.187982559204102, "global_step": 18115, "epoch": 431} {"train_loss": -5.194684982299805, "global_step": 18116, "epoch": 431} {"train_loss": -5.176729202270508, "global_step": 18117, "epoch": 431} {"train_loss": -5.159726142883301, "global_step": 18118, "epoch": 431} {"train_loss": -5.247048377990723, "global_step": 18119, "epoch": 431} {"train_loss": -5.195076942443848, "global_step": 18120, "epoch": 431} {"train_loss": -5.157495498657227, "global_step": 18121, "epoch": 431} {"train_loss": -5.375046730041504, "global_step": 18122, "epoch": 431} {"train_loss": -5.00522518157959, "global_step": 18123, "epoch": 431} {"train_loss": -5.308236122131348, "global_step": 18124, "epoch": 431} {"train_loss": -5.13533878326416, "global_step": 18125, "epoch": 431} {"train_loss": -5.137202262878418, "global_step": 18126, "epoch": 431} {"train_loss": -5.204726219177246, "global_step": 18127, "epoch": 431} {"train_loss": -5.2209978103637695, "global_step": 18128, "epoch": 431} {"train_loss": -5.068752288818359, "global_step": 18129, "epoch": 431} {"train_loss": -5.1565656661987305, "global_step": 18130, "epoch": 431} {"train_loss": -5.2173261642456055, "global_step": 18131, "epoch": 431} {"train_loss": -5.076243877410889, "global_step": 18132, "epoch": 431} {"train_loss": -5.134399890899658, "global_step": 18133, "epoch": 431} {"train_loss": -5.143328666687012, "global_step": 18134, "epoch": 431} {"train_loss": -5.163203239440918, "global_step": 18135, "epoch": 431} {"train_loss": -5.239609241485596, "global_step": 18136, "epoch": 431} {"train_loss": -5.160196304321289, "global_step": 18137, "epoch": 431} {"train_loss": -5.261439800262451, "global_step": 18138, "epoch": 431} {"train_loss": -5.172122955322266, "global_step": 18139, "epoch": 431} {"train_loss": -5.132913112640381, "global_step": 18140, "epoch": 431} {"train_loss": -5.375329971313477, "global_step": 18141, "epoch": 431} {"train_loss": -5.195201396942139, "global_step": 18142, "epoch": 431} {"train_loss": -5.2050658748263405, "global_step": 18143, "epoch": 431, "val_loss": 77556.71875} {"train_loss": -5.242781162261963, "global_step": 18144, "epoch": 432} {"train_loss": -5.230597496032715, "global_step": 18145, "epoch": 432} {"train_loss": -5.183209419250488, "global_step": 18146, "epoch": 432} {"train_loss": -5.286005973815918, "global_step": 18147, "epoch": 432} {"train_loss": -5.2669830322265625, "global_step": 18148, "epoch": 432} {"train_loss": -5.142139434814453, "global_step": 18149, "epoch": 432} {"train_loss": -5.211777687072754, "global_step": 18150, "epoch": 432} {"train_loss": -5.212298393249512, "global_step": 18151, "epoch": 432} {"train_loss": -5.210722923278809, "global_step": 18152, "epoch": 432} {"train_loss": -5.208083629608154, "global_step": 18153, "epoch": 432} {"train_loss": -5.087453842163086, "global_step": 18154, "epoch": 432} {"train_loss": -5.209323883056641, "global_step": 18155, "epoch": 432} {"train_loss": -5.303565979003906, "global_step": 18156, "epoch": 432} {"train_loss": -5.162397384643555, "global_step": 18157, "epoch": 432} {"train_loss": -5.218999862670898, "global_step": 18158, "epoch": 432} {"train_loss": -5.08812141418457, "global_step": 18159, "epoch": 432} {"train_loss": -5.195558547973633, "global_step": 18160, "epoch": 432} {"train_loss": -5.341458320617676, "global_step": 18161, "epoch": 432} {"train_loss": -5.241244316101074, "global_step": 18162, "epoch": 432} {"train_loss": -5.255786895751953, "global_step": 18163, "epoch": 432} {"train_loss": -5.237898826599121, "global_step": 18164, "epoch": 432} {"train_loss": -5.240235328674316, "global_step": 18165, "epoch": 432} {"train_loss": -5.432167053222656, "global_step": 18166, "epoch": 432} {"train_loss": -5.196056365966797, "global_step": 18167, "epoch": 432} {"train_loss": -5.3737664222717285, "global_step": 18168, "epoch": 432} {"train_loss": -5.34562873840332, "global_step": 18169, "epoch": 432} {"train_loss": -5.4287004470825195, "global_step": 18170, "epoch": 432} {"train_loss": -5.264740467071533, "global_step": 18171, "epoch": 432} {"train_loss": -5.236292839050293, "global_step": 18172, "epoch": 432} {"train_loss": -5.36201286315918, "global_step": 18173, "epoch": 432} {"train_loss": -5.317923069000244, "global_step": 18174, "epoch": 432} {"train_loss": -5.1811113357543945, "global_step": 18175, "epoch": 432} {"train_loss": -5.3002753257751465, "global_step": 18176, "epoch": 432} {"train_loss": -5.177172660827637, "global_step": 18177, "epoch": 432} {"train_loss": -5.136776447296143, "global_step": 18178, "epoch": 432} {"train_loss": -5.29455041885376, "global_step": 18179, "epoch": 432} {"train_loss": -5.285545825958252, "global_step": 18180, "epoch": 432} {"train_loss": -5.291536331176758, "global_step": 18181, "epoch": 432} {"train_loss": -5.214043617248535, "global_step": 18182, "epoch": 432} {"train_loss": -5.186385154724121, "global_step": 18183, "epoch": 432} {"train_loss": -5.195098876953125, "global_step": 18184, "epoch": 432} {"train_loss": -5.242543799536569, "global_step": 18185, "epoch": 432, "val_loss": 78012.28125} {"train_loss": -5.242650985717773, "global_step": 18186, "epoch": 433} {"train_loss": -5.224841117858887, "global_step": 18187, "epoch": 433} {"train_loss": -5.303388595581055, "global_step": 18188, "epoch": 433} {"train_loss": -5.261298179626465, "global_step": 18189, "epoch": 433} {"train_loss": -5.2288618087768555, "global_step": 18190, "epoch": 433} {"train_loss": -5.321502685546875, "global_step": 18191, "epoch": 433} {"train_loss": -5.196310520172119, "global_step": 18192, "epoch": 433} {"train_loss": -5.160551071166992, "global_step": 18193, "epoch": 433} {"train_loss": -5.257658004760742, "global_step": 18194, "epoch": 433} {"train_loss": -5.260382652282715, "global_step": 18195, "epoch": 433} {"train_loss": -5.188726902008057, "global_step": 18196, "epoch": 433} {"train_loss": -5.343049049377441, "global_step": 18197, "epoch": 433} {"train_loss": -5.14864444732666, "global_step": 18198, "epoch": 433} {"train_loss": -5.1848955154418945, "global_step": 18199, "epoch": 433} {"train_loss": -5.115385055541992, "global_step": 18200, "epoch": 433} {"train_loss": -5.260659217834473, "global_step": 18201, "epoch": 433} {"train_loss": -5.065162181854248, "global_step": 18202, "epoch": 433} {"train_loss": -5.373284339904785, "global_step": 18203, "epoch": 433} {"train_loss": -5.169887542724609, "global_step": 18204, "epoch": 433} {"train_loss": -5.284003257751465, "global_step": 18205, "epoch": 433} {"train_loss": -5.160630226135254, "global_step": 18206, "epoch": 433} {"train_loss": -5.191488742828369, "global_step": 18207, "epoch": 433} {"train_loss": -5.117988586425781, "global_step": 18208, "epoch": 433} {"train_loss": -5.275430679321289, "global_step": 18209, "epoch": 433} {"train_loss": -5.389700889587402, "global_step": 18210, "epoch": 433} {"train_loss": -5.171782493591309, "global_step": 18211, "epoch": 433} {"train_loss": -5.220302581787109, "global_step": 18212, "epoch": 433} {"train_loss": -5.151853084564209, "global_step": 18213, "epoch": 433} {"train_loss": -5.261888027191162, "global_step": 18214, "epoch": 433} {"train_loss": -5.265742778778076, "global_step": 18215, "epoch": 433} {"train_loss": -5.23645544052124, "global_step": 18216, "epoch": 433} {"train_loss": -5.2538042068481445, "global_step": 18217, "epoch": 433} {"train_loss": -5.359960556030273, "global_step": 18218, "epoch": 433} {"train_loss": -4.952775955200195, "global_step": 18219, "epoch": 433} {"train_loss": -5.130592346191406, "global_step": 18220, "epoch": 433} {"train_loss": -5.328152656555176, "global_step": 18221, "epoch": 433} {"train_loss": -5.158238410949707, "global_step": 18222, "epoch": 433} {"train_loss": -4.92672872543335, "global_step": 18223, "epoch": 433} {"train_loss": -5.275744438171387, "global_step": 18224, "epoch": 433} {"train_loss": -5.234569549560547, "global_step": 18225, "epoch": 433} {"train_loss": -5.160019874572754, "global_step": 18226, "epoch": 433} {"train_loss": -5.212976546514602, "global_step": 18227, "epoch": 433, "val_loss": 79021.71875} {"train_loss": -5.093141078948975, "global_step": 18228, "epoch": 434} {"train_loss": -5.2002668380737305, "global_step": 18229, "epoch": 434} {"train_loss": -5.1935529708862305, "global_step": 18230, "epoch": 434} {"train_loss": -5.25346565246582, "global_step": 18231, "epoch": 434} {"train_loss": -5.195718288421631, "global_step": 18232, "epoch": 434} {"train_loss": -4.993143558502197, "global_step": 18233, "epoch": 434} {"train_loss": -5.232887268066406, "global_step": 18234, "epoch": 434} {"train_loss": -5.372002601623535, "global_step": 18235, "epoch": 434} {"train_loss": -5.139191627502441, "global_step": 18236, "epoch": 434} {"train_loss": -5.267393589019775, "global_step": 18237, "epoch": 434} {"train_loss": -5.208147048950195, "global_step": 18238, "epoch": 434} {"train_loss": -5.254157543182373, "global_step": 18239, "epoch": 434} {"train_loss": -5.123785972595215, "global_step": 18240, "epoch": 434} {"train_loss": -5.329626083374023, "global_step": 18241, "epoch": 434} {"train_loss": -5.236824989318848, "global_step": 18242, "epoch": 434} {"train_loss": -5.244385719299316, "global_step": 18243, "epoch": 434} {"train_loss": -5.248815536499023, "global_step": 18244, "epoch": 434} {"train_loss": -5.111356735229492, "global_step": 18245, "epoch": 434} {"train_loss": -5.173567295074463, "global_step": 18246, "epoch": 434} {"train_loss": -5.1065473556518555, "global_step": 18247, "epoch": 434} {"train_loss": -5.286301612854004, "global_step": 18248, "epoch": 434} {"train_loss": -5.091680526733398, "global_step": 18249, "epoch": 434} {"train_loss": -5.376973628997803, "global_step": 18250, "epoch": 434} {"train_loss": -5.224339485168457, "global_step": 18251, "epoch": 434} {"train_loss": -5.129647254943848, "global_step": 18252, "epoch": 434} {"train_loss": -5.281808853149414, "global_step": 18253, "epoch": 434} {"train_loss": -5.251711368560791, "global_step": 18254, "epoch": 434} {"train_loss": -5.253757476806641, "global_step": 18255, "epoch": 434} {"train_loss": -5.130728721618652, "global_step": 18256, "epoch": 434} {"train_loss": -5.3015031814575195, "global_step": 18257, "epoch": 434} {"train_loss": -5.23273229598999, "global_step": 18258, "epoch": 434} {"train_loss": -5.22490119934082, "global_step": 18259, "epoch": 434} {"train_loss": -5.37110710144043, "global_step": 18260, "epoch": 434} {"train_loss": -5.340758323669434, "global_step": 18261, "epoch": 434} {"train_loss": -5.26344633102417, "global_step": 18262, "epoch": 434} {"train_loss": -5.332262992858887, "global_step": 18263, "epoch": 434} {"train_loss": -5.333513259887695, "global_step": 18264, "epoch": 434} {"train_loss": -5.2735700607299805, "global_step": 18265, "epoch": 434} {"train_loss": -5.187567710876465, "global_step": 18266, "epoch": 434} {"train_loss": -5.264525413513184, "global_step": 18267, "epoch": 434} {"train_loss": -5.183725357055664, "global_step": 18268, "epoch": 434} {"train_loss": -5.228738024121239, "global_step": 18269, "epoch": 434, "val_loss": 77692.2734375} {"train_loss": -5.274013519287109, "global_step": 18270, "epoch": 435} {"train_loss": -5.31048583984375, "global_step": 18271, "epoch": 435} {"train_loss": -5.1918182373046875, "global_step": 18272, "epoch": 435} {"train_loss": -5.236133575439453, "global_step": 18273, "epoch": 435} {"train_loss": -5.255206108093262, "global_step": 18274, "epoch": 435} {"train_loss": -5.242917060852051, "global_step": 18275, "epoch": 435} {"train_loss": -5.239885330200195, "global_step": 18276, "epoch": 435} {"train_loss": -5.277256488800049, "global_step": 18277, "epoch": 435} {"train_loss": -5.238576889038086, "global_step": 18278, "epoch": 435} {"train_loss": -5.2871575355529785, "global_step": 18279, "epoch": 435} {"train_loss": -5.173112869262695, "global_step": 18280, "epoch": 435} {"train_loss": -5.251125812530518, "global_step": 18281, "epoch": 435} {"train_loss": -5.2669358253479, "global_step": 18282, "epoch": 435} {"train_loss": -5.371281623840332, "global_step": 18283, "epoch": 435} {"train_loss": -5.153522491455078, "global_step": 18284, "epoch": 435} {"train_loss": -5.2672224044799805, "global_step": 18285, "epoch": 435} {"train_loss": -5.236764907836914, "global_step": 18286, "epoch": 435} {"train_loss": -5.336111545562744, "global_step": 18287, "epoch": 435} {"train_loss": -5.287287712097168, "global_step": 18288, "epoch": 435} {"train_loss": -5.312915802001953, "global_step": 18289, "epoch": 435} {"train_loss": -5.168344497680664, "global_step": 18290, "epoch": 435} {"train_loss": -5.357544898986816, "global_step": 18291, "epoch": 435} {"train_loss": -5.214057922363281, "global_step": 18292, "epoch": 435} {"train_loss": -5.174428939819336, "global_step": 18293, "epoch": 435} {"train_loss": -5.279030799865723, "global_step": 18294, "epoch": 435} {"train_loss": -5.186656951904297, "global_step": 18295, "epoch": 435} {"train_loss": -5.274050712585449, "global_step": 18296, "epoch": 435} {"train_loss": -5.254866123199463, "global_step": 18297, "epoch": 435} {"train_loss": -5.235814094543457, "global_step": 18298, "epoch": 435} {"train_loss": -5.108606815338135, "global_step": 18299, "epoch": 435} {"train_loss": -5.231978893280029, "global_step": 18300, "epoch": 435} {"train_loss": -5.315970420837402, "global_step": 18301, "epoch": 435} {"train_loss": -5.060085296630859, "global_step": 18302, "epoch": 435} {"train_loss": -5.219426155090332, "global_step": 18303, "epoch": 435} {"train_loss": -5.450966835021973, "global_step": 18304, "epoch": 435} {"train_loss": -5.233206748962402, "global_step": 18305, "epoch": 435} {"train_loss": -5.276481628417969, "global_step": 18306, "epoch": 435} {"train_loss": -5.327092170715332, "global_step": 18307, "epoch": 435} {"train_loss": -5.287443161010742, "global_step": 18308, "epoch": 435} {"train_loss": -5.186061859130859, "global_step": 18309, "epoch": 435} {"train_loss": -5.217775344848633, "global_step": 18310, "epoch": 435} {"train_loss": -5.25026577994937, "global_step": 18311, "epoch": 435, "val_loss": 77260.0859375} {"train_loss": -5.204739093780518, "global_step": 18312, "epoch": 436} {"train_loss": -5.228292465209961, "global_step": 18313, "epoch": 436} {"train_loss": -5.318077087402344, "global_step": 18314, "epoch": 436} {"train_loss": -5.301545143127441, "global_step": 18315, "epoch": 436} {"train_loss": -5.23640251159668, "global_step": 18316, "epoch": 436} {"train_loss": -5.344517230987549, "global_step": 18317, "epoch": 436} {"train_loss": -5.33268928527832, "global_step": 18318, "epoch": 436} {"train_loss": -5.337284088134766, "global_step": 18319, "epoch": 436} {"train_loss": -5.325716018676758, "global_step": 18320, "epoch": 436} {"train_loss": -5.328003883361816, "global_step": 18321, "epoch": 436} {"train_loss": -5.241870880126953, "global_step": 18322, "epoch": 436} {"train_loss": -5.103482246398926, "global_step": 18323, "epoch": 436} {"train_loss": -5.172908782958984, "global_step": 18324, "epoch": 436} {"train_loss": -5.186219692230225, "global_step": 18325, "epoch": 436} {"train_loss": -5.235194206237793, "global_step": 18326, "epoch": 436} {"train_loss": -5.117066383361816, "global_step": 18327, "epoch": 436} {"train_loss": -5.282829761505127, "global_step": 18328, "epoch": 436} {"train_loss": -5.190192222595215, "global_step": 18329, "epoch": 436} {"train_loss": -5.168337821960449, "global_step": 18330, "epoch": 436} {"train_loss": -5.253961563110352, "global_step": 18331, "epoch": 436} {"train_loss": -5.292978286743164, "global_step": 18332, "epoch": 436} {"train_loss": -5.213773250579834, "global_step": 18333, "epoch": 436} {"train_loss": -5.28595495223999, "global_step": 18334, "epoch": 436} {"train_loss": -5.257956504821777, "global_step": 18335, "epoch": 436} {"train_loss": -5.210239410400391, "global_step": 18336, "epoch": 436} {"train_loss": -5.255642890930176, "global_step": 18337, "epoch": 436} {"train_loss": -5.403433322906494, "global_step": 18338, "epoch": 436} {"train_loss": -5.202584266662598, "global_step": 18339, "epoch": 436} {"train_loss": -5.231719017028809, "global_step": 18340, "epoch": 436} {"train_loss": -5.279489517211914, "global_step": 18341, "epoch": 436} {"train_loss": -5.187805652618408, "global_step": 18342, "epoch": 436} {"train_loss": -5.1518449783325195, "global_step": 18343, "epoch": 436} {"train_loss": -5.24769401550293, "global_step": 18344, "epoch": 436} {"train_loss": -5.353863716125488, "global_step": 18345, "epoch": 436} {"train_loss": -5.414357662200928, "global_step": 18346, "epoch": 436} {"train_loss": -5.2555694580078125, "global_step": 18347, "epoch": 436} {"train_loss": -5.2133965492248535, "global_step": 18348, "epoch": 436} {"train_loss": -5.218031883239746, "global_step": 18349, "epoch": 436} {"train_loss": -5.337586402893066, "global_step": 18350, "epoch": 436} {"train_loss": -5.260732650756836, "global_step": 18351, "epoch": 436} {"train_loss": -5.307503700256348, "global_step": 18352, "epoch": 436} {"train_loss": -5.259267148517427, "global_step": 18353, "epoch": 436, "val_loss": 78013.21875} {"train_loss": -5.258850574493408, "global_step": 18354, "epoch": 437} {"train_loss": -5.237789154052734, "global_step": 18355, "epoch": 437} {"train_loss": -5.1615190505981445, "global_step": 18356, "epoch": 437} {"train_loss": -5.343900680541992, "global_step": 18357, "epoch": 437} {"train_loss": -5.13401985168457, "global_step": 18358, "epoch": 437} {"train_loss": -5.294063568115234, "global_step": 18359, "epoch": 437} {"train_loss": -5.278130531311035, "global_step": 18360, "epoch": 437} {"train_loss": -5.194349765777588, "global_step": 18361, "epoch": 437} {"train_loss": -5.28458309173584, "global_step": 18362, "epoch": 437} {"train_loss": -5.246066093444824, "global_step": 18363, "epoch": 437} {"train_loss": -5.3900651931762695, "global_step": 18364, "epoch": 437} {"train_loss": -5.19509220123291, "global_step": 18365, "epoch": 437} {"train_loss": -5.424444198608398, "global_step": 18366, "epoch": 437} {"train_loss": -5.244394302368164, "global_step": 18367, "epoch": 437} {"train_loss": -5.233634948730469, "global_step": 18368, "epoch": 437} {"train_loss": -5.181262969970703, "global_step": 18369, "epoch": 437} {"train_loss": -5.237373352050781, "global_step": 18370, "epoch": 437} {"train_loss": -5.084615707397461, "global_step": 18371, "epoch": 437} {"train_loss": -5.273797988891602, "global_step": 18372, "epoch": 437} {"train_loss": -5.318126678466797, "global_step": 18373, "epoch": 437} {"train_loss": -5.273682594299316, "global_step": 18374, "epoch": 437} {"train_loss": -5.279890060424805, "global_step": 18375, "epoch": 437} {"train_loss": -5.300349712371826, "global_step": 18376, "epoch": 437} {"train_loss": -5.346560478210449, "global_step": 18377, "epoch": 437} {"train_loss": -5.264130115509033, "global_step": 18378, "epoch": 437} {"train_loss": -5.287014484405518, "global_step": 18379, "epoch": 437} {"train_loss": -5.142584800720215, "global_step": 18380, "epoch": 437} {"train_loss": -5.180403709411621, "global_step": 18381, "epoch": 437} {"train_loss": -5.292472839355469, "global_step": 18382, "epoch": 437} {"train_loss": -5.1641716957092285, "global_step": 18383, "epoch": 437} {"train_loss": -5.268862724304199, "global_step": 18384, "epoch": 437} {"train_loss": -5.154720783233643, "global_step": 18385, "epoch": 437} {"train_loss": -5.23819637298584, "global_step": 18386, "epoch": 437} {"train_loss": -5.157788276672363, "global_step": 18387, "epoch": 437} {"train_loss": -5.1242852210998535, "global_step": 18388, "epoch": 437} {"train_loss": -5.3349609375, "global_step": 18389, "epoch": 437} {"train_loss": -5.041276931762695, "global_step": 18390, "epoch": 437} {"train_loss": -5.153926372528076, "global_step": 18391, "epoch": 437} {"train_loss": -5.283522605895996, "global_step": 18392, "epoch": 437} {"train_loss": -5.211803913116455, "global_step": 18393, "epoch": 437} {"train_loss": -5.2967529296875, "global_step": 18394, "epoch": 437} {"train_loss": -5.2361276263282415, "global_step": 18395, "epoch": 437, "val_loss": 77780.984375} {"train_loss": -5.353033065795898, "global_step": 18396, "epoch": 438} {"train_loss": -5.25599479675293, "global_step": 18397, "epoch": 438} {"train_loss": -5.199903964996338, "global_step": 18398, "epoch": 438} {"train_loss": -5.332268238067627, "global_step": 18399, "epoch": 438} {"train_loss": -5.236293792724609, "global_step": 18400, "epoch": 438} {"train_loss": -5.302654266357422, "global_step": 18401, "epoch": 438} {"train_loss": -5.289087772369385, "global_step": 18402, "epoch": 438} {"train_loss": -5.460961818695068, "global_step": 18403, "epoch": 438} {"train_loss": -5.356324195861816, "global_step": 18404, "epoch": 438} {"train_loss": -5.197287559509277, "global_step": 18405, "epoch": 438} {"train_loss": -5.302525520324707, "global_step": 18406, "epoch": 438} {"train_loss": -5.328888893127441, "global_step": 18407, "epoch": 438} {"train_loss": -5.125030994415283, "global_step": 18408, "epoch": 438} {"train_loss": -5.220737457275391, "global_step": 18409, "epoch": 438} {"train_loss": -4.99339485168457, "global_step": 18410, "epoch": 438} {"train_loss": -5.28708028793335, "global_step": 18411, "epoch": 438} {"train_loss": -5.277356147766113, "global_step": 18412, "epoch": 438} {"train_loss": -5.178807258605957, "global_step": 18413, "epoch": 438} {"train_loss": -5.18409538269043, "global_step": 18414, "epoch": 438} {"train_loss": -5.177391052246094, "global_step": 18415, "epoch": 438} {"train_loss": -5.175234794616699, "global_step": 18416, "epoch": 438} {"train_loss": -5.29094934463501, "global_step": 18417, "epoch": 438} {"train_loss": -5.161619186401367, "global_step": 18418, "epoch": 438} {"train_loss": -5.310103416442871, "global_step": 18419, "epoch": 438} {"train_loss": -5.042740821838379, "global_step": 18420, "epoch": 438} {"train_loss": -5.262648582458496, "global_step": 18421, "epoch": 438} {"train_loss": -5.0781965255737305, "global_step": 18422, "epoch": 438} {"train_loss": -5.1771955490112305, "global_step": 18423, "epoch": 438} {"train_loss": -5.265695571899414, "global_step": 18424, "epoch": 438} {"train_loss": -5.214572906494141, "global_step": 18425, "epoch": 438} {"train_loss": -5.301943778991699, "global_step": 18426, "epoch": 438} {"train_loss": -5.163897514343262, "global_step": 18427, "epoch": 438} {"train_loss": -5.259586334228516, "global_step": 18428, "epoch": 438} {"train_loss": -5.263443470001221, "global_step": 18429, "epoch": 438} {"train_loss": -5.31755256652832, "global_step": 18430, "epoch": 438} {"train_loss": -5.139804840087891, "global_step": 18431, "epoch": 438} {"train_loss": -5.266932964324951, "global_step": 18432, "epoch": 438} {"train_loss": -5.250738620758057, "global_step": 18433, "epoch": 438} {"train_loss": -5.218919277191162, "global_step": 18434, "epoch": 438} {"train_loss": -5.371157646179199, "global_step": 18435, "epoch": 438} {"train_loss": -5.2583394050598145, "global_step": 18436, "epoch": 438} {"train_loss": -5.237433842250279, "global_step": 18437, "epoch": 438, "val_loss": 76873.9375} {"train_loss": -5.248208045959473, "global_step": 18438, "epoch": 439} {"train_loss": -5.110990524291992, "global_step": 18439, "epoch": 439} {"train_loss": -5.137014389038086, "global_step": 18440, "epoch": 439} {"train_loss": -5.173908233642578, "global_step": 18441, "epoch": 439} {"train_loss": -5.138363361358643, "global_step": 18442, "epoch": 439} {"train_loss": -5.27385950088501, "global_step": 18443, "epoch": 439} {"train_loss": -5.261473655700684, "global_step": 18444, "epoch": 439} {"train_loss": -5.32916259765625, "global_step": 18445, "epoch": 439} {"train_loss": -5.211575984954834, "global_step": 18446, "epoch": 439} {"train_loss": -5.280246734619141, "global_step": 18447, "epoch": 439} {"train_loss": -5.29415225982666, "global_step": 18448, "epoch": 439} {"train_loss": -5.4561567306518555, "global_step": 18449, "epoch": 439} {"train_loss": -5.356374740600586, "global_step": 18450, "epoch": 439} {"train_loss": -5.164307117462158, "global_step": 18451, "epoch": 439} {"train_loss": -5.339042663574219, "global_step": 18452, "epoch": 439} {"train_loss": -5.216001510620117, "global_step": 18453, "epoch": 439} {"train_loss": -5.252472400665283, "global_step": 18454, "epoch": 439} {"train_loss": -5.17754602432251, "global_step": 18455, "epoch": 439} {"train_loss": -5.278552055358887, "global_step": 18456, "epoch": 439} {"train_loss": -5.231093406677246, "global_step": 18457, "epoch": 439} {"train_loss": -5.379976272583008, "global_step": 18458, "epoch": 439} {"train_loss": -5.103952407836914, "global_step": 18459, "epoch": 439} {"train_loss": -5.2848711013793945, "global_step": 18460, "epoch": 439} {"train_loss": -5.042984962463379, "global_step": 18461, "epoch": 439} {"train_loss": -5.325096607208252, "global_step": 18462, "epoch": 439} {"train_loss": -5.241355895996094, "global_step": 18463, "epoch": 439} {"train_loss": -4.992870330810547, "global_step": 18464, "epoch": 439} {"train_loss": -5.28564977645874, "global_step": 18465, "epoch": 439} {"train_loss": -5.160909175872803, "global_step": 18466, "epoch": 439} {"train_loss": -5.133584976196289, "global_step": 18467, "epoch": 439} {"train_loss": -5.393838405609131, "global_step": 18468, "epoch": 439} {"train_loss": -5.116201400756836, "global_step": 18469, "epoch": 439} {"train_loss": -5.214203357696533, "global_step": 18470, "epoch": 439} {"train_loss": -5.082300186157227, "global_step": 18471, "epoch": 439} {"train_loss": -5.154712200164795, "global_step": 18472, "epoch": 439} {"train_loss": -5.179413318634033, "global_step": 18473, "epoch": 439} {"train_loss": -5.246496200561523, "global_step": 18474, "epoch": 439} {"train_loss": -5.3432722091674805, "global_step": 18475, "epoch": 439} {"train_loss": -5.146672248840332, "global_step": 18476, "epoch": 439} {"train_loss": -5.242528438568115, "global_step": 18477, "epoch": 439} {"train_loss": -5.219816207885742, "global_step": 18478, "epoch": 439} {"train_loss": -5.225315956842332, "global_step": 18479, "epoch": 439, "val_loss": 77524.140625} {"train_loss": -5.255615234375, "global_step": 18480, "epoch": 440} {"train_loss": -5.311450958251953, "global_step": 18481, "epoch": 440} {"train_loss": -5.218135833740234, "global_step": 18482, "epoch": 440} {"train_loss": -5.256667613983154, "global_step": 18483, "epoch": 440} {"train_loss": -5.227704048156738, "global_step": 18484, "epoch": 440} {"train_loss": -5.424886703491211, "global_step": 18485, "epoch": 440} {"train_loss": -5.048549652099609, "global_step": 18486, "epoch": 440} {"train_loss": -5.199719429016113, "global_step": 18487, "epoch": 440} {"train_loss": -5.166170120239258, "global_step": 18488, "epoch": 440} {"train_loss": -5.262367248535156, "global_step": 18489, "epoch": 440} {"train_loss": -5.279239177703857, "global_step": 18490, "epoch": 440} {"train_loss": -5.2804718017578125, "global_step": 18491, "epoch": 440} {"train_loss": -5.258969783782959, "global_step": 18492, "epoch": 440} {"train_loss": -5.177098274230957, "global_step": 18493, "epoch": 440} {"train_loss": -5.144506454467773, "global_step": 18494, "epoch": 440} {"train_loss": -5.411111831665039, "global_step": 18495, "epoch": 440} {"train_loss": -5.232308387756348, "global_step": 18496, "epoch": 440} {"train_loss": -5.429841995239258, "global_step": 18497, "epoch": 440} {"train_loss": -5.214900970458984, "global_step": 18498, "epoch": 440} {"train_loss": -5.162348747253418, "global_step": 18499, "epoch": 440} {"train_loss": -5.302769184112549, "global_step": 18500, "epoch": 440} {"train_loss": -5.129836082458496, "global_step": 18501, "epoch": 440} {"train_loss": -5.476122856140137, "global_step": 18502, "epoch": 440} {"train_loss": -5.289708137512207, "global_step": 18503, "epoch": 440} {"train_loss": -5.224822998046875, "global_step": 18504, "epoch": 440} {"train_loss": -5.232331275939941, "global_step": 18505, "epoch": 440} {"train_loss": -5.228858947753906, "global_step": 18506, "epoch": 440} {"train_loss": -5.112820625305176, "global_step": 18507, "epoch": 440} {"train_loss": -5.309627056121826, "global_step": 18508, "epoch": 440} {"train_loss": -5.28877592086792, "global_step": 18509, "epoch": 440} {"train_loss": -5.1714372634887695, "global_step": 18510, "epoch": 440} {"train_loss": -5.332340240478516, "global_step": 18511, "epoch": 440} {"train_loss": -5.296538352966309, "global_step": 18512, "epoch": 440} {"train_loss": -5.319413185119629, "global_step": 18513, "epoch": 440} {"train_loss": -5.298378944396973, "global_step": 18514, "epoch": 440} {"train_loss": -5.191737651824951, "global_step": 18515, "epoch": 440} {"train_loss": -5.272231101989746, "global_step": 18516, "epoch": 440} {"train_loss": -5.3161516189575195, "global_step": 18517, "epoch": 440} {"train_loss": -5.274003028869629, "global_step": 18518, "epoch": 440} {"train_loss": -5.310355186462402, "global_step": 18519, "epoch": 440} {"train_loss": -5.244237899780273, "global_step": 18520, "epoch": 440} {"train_loss": -5.257607516788301, "global_step": 18521, "epoch": 440, "val_loss": 76908.1796875} {"train_loss": -5.13637638092041, "global_step": 18522, "epoch": 441} {"train_loss": -5.23895263671875, "global_step": 18523, "epoch": 441} {"train_loss": -5.303764343261719, "global_step": 18524, "epoch": 441} {"train_loss": -5.2469682693481445, "global_step": 18525, "epoch": 441} {"train_loss": -5.240689754486084, "global_step": 18526, "epoch": 441} {"train_loss": -5.265847206115723, "global_step": 18527, "epoch": 441} {"train_loss": -5.169086456298828, "global_step": 18528, "epoch": 441} {"train_loss": -5.420173645019531, "global_step": 18529, "epoch": 441} {"train_loss": -5.237062931060791, "global_step": 18530, "epoch": 441} {"train_loss": -5.200302600860596, "global_step": 18531, "epoch": 441} {"train_loss": -5.255899429321289, "global_step": 18532, "epoch": 441} {"train_loss": -5.228124618530273, "global_step": 18533, "epoch": 441} {"train_loss": -5.361244201660156, "global_step": 18534, "epoch": 441} {"train_loss": -5.1751627922058105, "global_step": 18535, "epoch": 441} {"train_loss": -5.068428993225098, "global_step": 18536, "epoch": 441} {"train_loss": -5.282858371734619, "global_step": 18537, "epoch": 441} {"train_loss": -5.157698631286621, "global_step": 18538, "epoch": 441} {"train_loss": -5.1597514152526855, "global_step": 18539, "epoch": 441} {"train_loss": -5.279996871948242, "global_step": 18540, "epoch": 441} {"train_loss": -5.219204902648926, "global_step": 18541, "epoch": 441} {"train_loss": -5.251950263977051, "global_step": 18542, "epoch": 441} {"train_loss": -5.170748710632324, "global_step": 18543, "epoch": 441} {"train_loss": -5.212827682495117, "global_step": 18544, "epoch": 441} {"train_loss": -5.098257541656494, "global_step": 18545, "epoch": 441} {"train_loss": -5.135077953338623, "global_step": 18546, "epoch": 441} {"train_loss": -5.265721321105957, "global_step": 18547, "epoch": 441} {"train_loss": -5.147873878479004, "global_step": 18548, "epoch": 441} {"train_loss": -5.238022804260254, "global_step": 18549, "epoch": 441} {"train_loss": -5.261098384857178, "global_step": 18550, "epoch": 441} {"train_loss": -5.252720832824707, "global_step": 18551, "epoch": 441} {"train_loss": -5.253820419311523, "global_step": 18552, "epoch": 441} {"train_loss": -5.2501325607299805, "global_step": 18553, "epoch": 441} {"train_loss": -5.252982139587402, "global_step": 18554, "epoch": 441} {"train_loss": -5.233608245849609, "global_step": 18555, "epoch": 441} {"train_loss": -5.184723854064941, "global_step": 18556, "epoch": 441} {"train_loss": -5.28148889541626, "global_step": 18557, "epoch": 441} {"train_loss": -5.19857120513916, "global_step": 18558, "epoch": 441} {"train_loss": -5.208189010620117, "global_step": 18559, "epoch": 441} {"train_loss": -5.327262878417969, "global_step": 18560, "epoch": 441} {"train_loss": -5.2231035232543945, "global_step": 18561, "epoch": 441} {"train_loss": -5.163906574249268, "global_step": 18562, "epoch": 441} {"train_loss": -5.225762798672631, "global_step": 18563, "epoch": 441, "val_loss": 77066.984375} {"train_loss": -5.354599952697754, "global_step": 18564, "epoch": 442} {"train_loss": -5.203974723815918, "global_step": 18565, "epoch": 442} {"train_loss": -5.296941757202148, "global_step": 18566, "epoch": 442} {"train_loss": -5.152594566345215, "global_step": 18567, "epoch": 442} {"train_loss": -5.30201530456543, "global_step": 18568, "epoch": 442} {"train_loss": -5.233659267425537, "global_step": 18569, "epoch": 442} {"train_loss": -4.99552059173584, "global_step": 18570, "epoch": 442} {"train_loss": -5.159759521484375, "global_step": 18571, "epoch": 442} {"train_loss": -5.23558235168457, "global_step": 18572, "epoch": 442} {"train_loss": -5.183061599731445, "global_step": 18573, "epoch": 442} {"train_loss": -5.103841304779053, "global_step": 18574, "epoch": 442} {"train_loss": -5.208309650421143, "global_step": 18575, "epoch": 442} {"train_loss": -5.181300163269043, "global_step": 18576, "epoch": 442} {"train_loss": -5.209882736206055, "global_step": 18577, "epoch": 442} {"train_loss": -5.235170364379883, "global_step": 18578, "epoch": 442} {"train_loss": -5.108902454376221, "global_step": 18579, "epoch": 442} {"train_loss": -5.372008323669434, "global_step": 18580, "epoch": 442} {"train_loss": -5.173542499542236, "global_step": 18581, "epoch": 442} {"train_loss": -5.233453750610352, "global_step": 18582, "epoch": 442} {"train_loss": -5.264288902282715, "global_step": 18583, "epoch": 442} {"train_loss": -5.135318756103516, "global_step": 18584, "epoch": 442} {"train_loss": -5.30252742767334, "global_step": 18585, "epoch": 442} {"train_loss": -5.171690464019775, "global_step": 18586, "epoch": 442} {"train_loss": -5.326297760009766, "global_step": 18587, "epoch": 442} {"train_loss": -5.258090019226074, "global_step": 18588, "epoch": 442} {"train_loss": -5.327851295471191, "global_step": 18589, "epoch": 442} {"train_loss": -5.2809367179870605, "global_step": 18590, "epoch": 442} {"train_loss": -5.216178894042969, "global_step": 18591, "epoch": 442} {"train_loss": -5.293442726135254, "global_step": 18592, "epoch": 442} {"train_loss": -5.222897529602051, "global_step": 18593, "epoch": 442} {"train_loss": -5.109269142150879, "global_step": 18594, "epoch": 442} {"train_loss": -5.312734127044678, "global_step": 18595, "epoch": 442} {"train_loss": -5.237720489501953, "global_step": 18596, "epoch": 442} {"train_loss": -5.288103103637695, "global_step": 18597, "epoch": 442} {"train_loss": -5.228828430175781, "global_step": 18598, "epoch": 442} {"train_loss": -5.194009780883789, "global_step": 18599, "epoch": 442} {"train_loss": -5.196313381195068, "global_step": 18600, "epoch": 442} {"train_loss": -5.285943508148193, "global_step": 18601, "epoch": 442} {"train_loss": -5.17693567276001, "global_step": 18602, "epoch": 442} {"train_loss": -5.134220600128174, "global_step": 18603, "epoch": 442} {"train_loss": -5.263228416442871, "global_step": 18604, "epoch": 442} {"train_loss": -5.224343765349615, "global_step": 18605, "epoch": 442, "val_loss": 77378.75} {"train_loss": -5.120662689208984, "global_step": 18606, "epoch": 443} {"train_loss": -5.320730686187744, "global_step": 18607, "epoch": 443} {"train_loss": -5.1617889404296875, "global_step": 18608, "epoch": 443} {"train_loss": -5.213420867919922, "global_step": 18609, "epoch": 443} {"train_loss": -5.181818008422852, "global_step": 18610, "epoch": 443} {"train_loss": -5.288008689880371, "global_step": 18611, "epoch": 443} {"train_loss": -5.333812713623047, "global_step": 18612, "epoch": 443} {"train_loss": -5.187995910644531, "global_step": 18613, "epoch": 443} {"train_loss": -5.232081413269043, "global_step": 18614, "epoch": 443} {"train_loss": -5.2063703536987305, "global_step": 18615, "epoch": 443} {"train_loss": -5.317744255065918, "global_step": 18616, "epoch": 443} {"train_loss": -5.3449201583862305, "global_step": 18617, "epoch": 443} {"train_loss": -5.158472061157227, "global_step": 18618, "epoch": 443} {"train_loss": -5.334702968597412, "global_step": 18619, "epoch": 443} {"train_loss": -5.255886554718018, "global_step": 18620, "epoch": 443} {"train_loss": -5.1154279708862305, "global_step": 18621, "epoch": 443} {"train_loss": -5.2992095947265625, "global_step": 18622, "epoch": 443} {"train_loss": -5.301494598388672, "global_step": 18623, "epoch": 443} {"train_loss": -5.373757362365723, "global_step": 18624, "epoch": 443} {"train_loss": -5.344808101654053, "global_step": 18625, "epoch": 443} {"train_loss": -5.361883163452148, "global_step": 18626, "epoch": 443} {"train_loss": -5.2607526779174805, "global_step": 18627, "epoch": 443} {"train_loss": -5.29444694519043, "global_step": 18628, "epoch": 443} {"train_loss": -5.245278358459473, "global_step": 18629, "epoch": 443} {"train_loss": -5.254620552062988, "global_step": 18630, "epoch": 443} {"train_loss": -5.18602180480957, "global_step": 18631, "epoch": 443} {"train_loss": -5.336691856384277, "global_step": 18632, "epoch": 443} {"train_loss": -5.229482650756836, "global_step": 18633, "epoch": 443} {"train_loss": -5.16931676864624, "global_step": 18634, "epoch": 443} {"train_loss": -5.268965721130371, "global_step": 18635, "epoch": 443} {"train_loss": -5.256792068481445, "global_step": 18636, "epoch": 443} {"train_loss": -5.357261657714844, "global_step": 18637, "epoch": 443} {"train_loss": -5.1880364418029785, "global_step": 18638, "epoch": 443} {"train_loss": -5.374260902404785, "global_step": 18639, "epoch": 443} {"train_loss": -5.278024673461914, "global_step": 18640, "epoch": 443} {"train_loss": -5.257752418518066, "global_step": 18641, "epoch": 443} {"train_loss": -5.275714874267578, "global_step": 18642, "epoch": 443} {"train_loss": -5.0963873863220215, "global_step": 18643, "epoch": 443} {"train_loss": -5.324505805969238, "global_step": 18644, "epoch": 443} {"train_loss": -5.307480335235596, "global_step": 18645, "epoch": 443} {"train_loss": -5.244023323059082, "global_step": 18646, "epoch": 443} {"train_loss": -5.262880813507807, "global_step": 18647, "epoch": 443, "val_loss": 77092.53125} {"train_loss": -5.315851211547852, "global_step": 18648, "epoch": 444} {"train_loss": -5.248701095581055, "global_step": 18649, "epoch": 444} {"train_loss": -5.336408615112305, "global_step": 18650, "epoch": 444} {"train_loss": -5.197839736938477, "global_step": 18651, "epoch": 444} {"train_loss": -5.2332916259765625, "global_step": 18652, "epoch": 444} {"train_loss": -5.164759635925293, "global_step": 18653, "epoch": 444} {"train_loss": -5.334176540374756, "global_step": 18654, "epoch": 444} {"train_loss": -5.221898555755615, "global_step": 18655, "epoch": 444} {"train_loss": -5.262118816375732, "global_step": 18656, "epoch": 444} {"train_loss": -5.290043830871582, "global_step": 18657, "epoch": 444} {"train_loss": -5.239152908325195, "global_step": 18658, "epoch": 444} {"train_loss": -5.241784572601318, "global_step": 18659, "epoch": 444} {"train_loss": -5.330996990203857, "global_step": 18660, "epoch": 444} {"train_loss": -5.2889509201049805, "global_step": 18661, "epoch": 444} {"train_loss": -5.376935958862305, "global_step": 18662, "epoch": 444} {"train_loss": -5.28491735458374, "global_step": 18663, "epoch": 444} {"train_loss": -5.27419900894165, "global_step": 18664, "epoch": 444} {"train_loss": -5.382154941558838, "global_step": 18665, "epoch": 444} {"train_loss": -5.20338249206543, "global_step": 18666, "epoch": 444} {"train_loss": -5.263433456420898, "global_step": 18667, "epoch": 444} {"train_loss": -5.270668983459473, "global_step": 18668, "epoch": 444} {"train_loss": -5.322506904602051, "global_step": 18669, "epoch": 444} {"train_loss": -5.306153297424316, "global_step": 18670, "epoch": 444} {"train_loss": -5.368805885314941, "global_step": 18671, "epoch": 444} {"train_loss": -5.280339241027832, "global_step": 18672, "epoch": 444} {"train_loss": -5.3377509117126465, "global_step": 18673, "epoch": 444} {"train_loss": -5.266756057739258, "global_step": 18674, "epoch": 444} {"train_loss": -5.276454925537109, "global_step": 18675, "epoch": 444} {"train_loss": -5.282526969909668, "global_step": 18676, "epoch": 444} {"train_loss": -5.182939529418945, "global_step": 18677, "epoch": 444} {"train_loss": -5.160869598388672, "global_step": 18678, "epoch": 444} {"train_loss": -5.3943610191345215, "global_step": 18679, "epoch": 444} {"train_loss": -5.225457191467285, "global_step": 18680, "epoch": 444} {"train_loss": -5.197027206420898, "global_step": 18681, "epoch": 444} {"train_loss": -5.160762310028076, "global_step": 18682, "epoch": 444} {"train_loss": -5.34757137298584, "global_step": 18683, "epoch": 444} {"train_loss": -5.393526077270508, "global_step": 18684, "epoch": 444} {"train_loss": -5.283681869506836, "global_step": 18685, "epoch": 444} {"train_loss": -5.438424110412598, "global_step": 18686, "epoch": 444} {"train_loss": -5.063910484313965, "global_step": 18687, "epoch": 444} {"train_loss": -5.2813401222229, "global_step": 18688, "epoch": 444} {"train_loss": -5.2702202796936035, "global_step": 18689, "epoch": 444, "val_loss": 77004.1171875} {"train_loss": -5.294816970825195, "global_step": 18690, "epoch": 445} {"train_loss": -5.299432754516602, "global_step": 18691, "epoch": 445} {"train_loss": -5.2956624031066895, "global_step": 18692, "epoch": 445} {"train_loss": -5.296868324279785, "global_step": 18693, "epoch": 445} {"train_loss": -5.371573448181152, "global_step": 18694, "epoch": 445} {"train_loss": -5.3413872718811035, "global_step": 18695, "epoch": 445} {"train_loss": -5.20361328125, "global_step": 18696, "epoch": 445} {"train_loss": -5.440957069396973, "global_step": 18697, "epoch": 445} {"train_loss": -5.332225322723389, "global_step": 18698, "epoch": 445} {"train_loss": -5.177924633026123, "global_step": 18699, "epoch": 445} {"train_loss": -5.41481876373291, "global_step": 18700, "epoch": 445} {"train_loss": -5.233926773071289, "global_step": 18701, "epoch": 445} {"train_loss": -5.2477240562438965, "global_step": 18702, "epoch": 445} {"train_loss": -5.276497840881348, "global_step": 18703, "epoch": 445} {"train_loss": -5.378312110900879, "global_step": 18704, "epoch": 445} {"train_loss": -5.1961822509765625, "global_step": 18705, "epoch": 445} {"train_loss": -5.255255222320557, "global_step": 18706, "epoch": 445} {"train_loss": -5.282893180847168, "global_step": 18707, "epoch": 445} {"train_loss": -5.266304969787598, "global_step": 18708, "epoch": 445} {"train_loss": -5.329320907592773, "global_step": 18709, "epoch": 445} {"train_loss": -5.219829082489014, "global_step": 18710, "epoch": 445} {"train_loss": -5.265180587768555, "global_step": 18711, "epoch": 445} {"train_loss": -5.2536163330078125, "global_step": 18712, "epoch": 445} {"train_loss": -5.0950927734375, "global_step": 18713, "epoch": 445} {"train_loss": -5.173061370849609, "global_step": 18714, "epoch": 445} {"train_loss": -5.219690322875977, "global_step": 18715, "epoch": 445} {"train_loss": -5.1436920166015625, "global_step": 18716, "epoch": 445} {"train_loss": -5.26939058303833, "global_step": 18717, "epoch": 445} {"train_loss": -5.264301300048828, "global_step": 18718, "epoch": 445} {"train_loss": -5.29245662689209, "global_step": 18719, "epoch": 445} {"train_loss": -5.340034484863281, "global_step": 18720, "epoch": 445} {"train_loss": -5.2359619140625, "global_step": 18721, "epoch": 445} {"train_loss": -5.382663726806641, "global_step": 18722, "epoch": 445} {"train_loss": -5.161002159118652, "global_step": 18723, "epoch": 445} {"train_loss": -5.279396057128906, "global_step": 18724, "epoch": 445} {"train_loss": -5.21415901184082, "global_step": 18725, "epoch": 445} {"train_loss": -5.3824052810668945, "global_step": 18726, "epoch": 445} {"train_loss": -5.158000946044922, "global_step": 18727, "epoch": 445} {"train_loss": -5.142354965209961, "global_step": 18728, "epoch": 445} {"train_loss": -5.237972259521484, "global_step": 18729, "epoch": 445} {"train_loss": -5.145960807800293, "global_step": 18730, "epoch": 445} {"train_loss": -5.26478522164481, "global_step": 18731, "epoch": 445, "val_loss": 77089.7421875} {"train_loss": -5.160110950469971, "global_step": 18732, "epoch": 446} {"train_loss": -5.221331596374512, "global_step": 18733, "epoch": 446} {"train_loss": -5.280280113220215, "global_step": 18734, "epoch": 446} {"train_loss": -5.163722038269043, "global_step": 18735, "epoch": 446} {"train_loss": -5.222264289855957, "global_step": 18736, "epoch": 446} {"train_loss": -5.266063690185547, "global_step": 18737, "epoch": 446} {"train_loss": -5.117431640625, "global_step": 18738, "epoch": 446} {"train_loss": -5.19593620300293, "global_step": 18739, "epoch": 446} {"train_loss": -5.289278507232666, "global_step": 18740, "epoch": 446} {"train_loss": -5.14731502532959, "global_step": 18741, "epoch": 446} {"train_loss": -5.419807434082031, "global_step": 18742, "epoch": 446} {"train_loss": -5.3801445960998535, "global_step": 18743, "epoch": 446} {"train_loss": -5.116320610046387, "global_step": 18744, "epoch": 446} {"train_loss": -5.229907035827637, "global_step": 18745, "epoch": 446} {"train_loss": -5.3189191818237305, "global_step": 18746, "epoch": 446} {"train_loss": -5.275084018707275, "global_step": 18747, "epoch": 446} {"train_loss": -5.263944625854492, "global_step": 18748, "epoch": 446} {"train_loss": -5.272089958190918, "global_step": 18749, "epoch": 446} {"train_loss": -5.168122291564941, "global_step": 18750, "epoch": 446} {"train_loss": -5.3439836502075195, "global_step": 18751, "epoch": 446} {"train_loss": -5.366735458374023, "global_step": 18752, "epoch": 446} {"train_loss": -5.275564193725586, "global_step": 18753, "epoch": 446} {"train_loss": -5.192119598388672, "global_step": 18754, "epoch": 446} {"train_loss": -5.270329475402832, "global_step": 18755, "epoch": 446} {"train_loss": -5.106630802154541, "global_step": 18756, "epoch": 446} {"train_loss": -5.204705238342285, "global_step": 18757, "epoch": 446} {"train_loss": -5.358623504638672, "global_step": 18758, "epoch": 446} {"train_loss": -5.2123942375183105, "global_step": 18759, "epoch": 446} {"train_loss": -5.273978233337402, "global_step": 18760, "epoch": 446} {"train_loss": -5.324288845062256, "global_step": 18761, "epoch": 446} {"train_loss": -5.143030643463135, "global_step": 18762, "epoch": 446} {"train_loss": -5.25361442565918, "global_step": 18763, "epoch": 446} {"train_loss": -5.397437572479248, "global_step": 18764, "epoch": 446} {"train_loss": -5.325034141540527, "global_step": 18765, "epoch": 446} {"train_loss": -5.321702003479004, "global_step": 18766, "epoch": 446} {"train_loss": -5.306100845336914, "global_step": 18767, "epoch": 446} {"train_loss": -5.188046455383301, "global_step": 18768, "epoch": 446} {"train_loss": -5.276368141174316, "global_step": 18769, "epoch": 446} {"train_loss": -5.327138900756836, "global_step": 18770, "epoch": 446} {"train_loss": -5.2455058097839355, "global_step": 18771, "epoch": 446} {"train_loss": -5.18609619140625, "global_step": 18772, "epoch": 446} {"train_loss": -5.255929231643677, "global_step": 18773, "epoch": 446, "val_loss": 76197.4140625} {"train_loss": -5.242679595947266, "global_step": 18774, "epoch": 447} {"train_loss": -5.341056823730469, "global_step": 18775, "epoch": 447} {"train_loss": -5.170146465301514, "global_step": 18776, "epoch": 447} {"train_loss": -5.160662651062012, "global_step": 18777, "epoch": 447} {"train_loss": -5.2526960372924805, "global_step": 18778, "epoch": 447} {"train_loss": -5.283941268920898, "global_step": 18779, "epoch": 447} {"train_loss": -5.229895114898682, "global_step": 18780, "epoch": 447} {"train_loss": -5.365151405334473, "global_step": 18781, "epoch": 447} {"train_loss": -5.314271450042725, "global_step": 18782, "epoch": 447} {"train_loss": -5.2897515296936035, "global_step": 18783, "epoch": 447} {"train_loss": -5.257750988006592, "global_step": 18784, "epoch": 447} {"train_loss": -5.3383331298828125, "global_step": 18785, "epoch": 447} {"train_loss": -5.344661235809326, "global_step": 18786, "epoch": 447} {"train_loss": -5.399426460266113, "global_step": 18787, "epoch": 447} {"train_loss": -5.277777671813965, "global_step": 18788, "epoch": 447} {"train_loss": -5.32772159576416, "global_step": 18789, "epoch": 447} {"train_loss": -5.253609657287598, "global_step": 18790, "epoch": 447} {"train_loss": -5.246450424194336, "global_step": 18791, "epoch": 447} {"train_loss": -5.1744160652160645, "global_step": 18792, "epoch": 447} {"train_loss": -5.325869083404541, "global_step": 18793, "epoch": 447} {"train_loss": -5.164927005767822, "global_step": 18794, "epoch": 447} {"train_loss": -5.28189754486084, "global_step": 18795, "epoch": 447} {"train_loss": -5.4610161781311035, "global_step": 18796, "epoch": 447} {"train_loss": -5.200753211975098, "global_step": 18797, "epoch": 447} {"train_loss": -5.076637268066406, "global_step": 18798, "epoch": 447} {"train_loss": -5.172823905944824, "global_step": 18799, "epoch": 447} {"train_loss": -5.250171661376953, "global_step": 18800, "epoch": 447} {"train_loss": -5.176567077636719, "global_step": 18801, "epoch": 447} {"train_loss": -5.259476661682129, "global_step": 18802, "epoch": 447} {"train_loss": -5.189223289489746, "global_step": 18803, "epoch": 447} {"train_loss": -5.268009185791016, "global_step": 18804, "epoch": 447} {"train_loss": -5.4135541915893555, "global_step": 18805, "epoch": 447} {"train_loss": -5.122633934020996, "global_step": 18806, "epoch": 447} {"train_loss": -5.20944881439209, "global_step": 18807, "epoch": 447} {"train_loss": -5.2115888595581055, "global_step": 18808, "epoch": 447} {"train_loss": -5.2649641036987305, "global_step": 18809, "epoch": 447} {"train_loss": -5.321843147277832, "global_step": 18810, "epoch": 447} {"train_loss": -5.120013236999512, "global_step": 18811, "epoch": 447} {"train_loss": -5.356416702270508, "global_step": 18812, "epoch": 447} {"train_loss": -5.180374622344971, "global_step": 18813, "epoch": 447} {"train_loss": -5.184823036193848, "global_step": 18814, "epoch": 447} {"train_loss": -5.256916977110363, "global_step": 18815, "epoch": 447, "val_loss": 76815.890625} {"train_loss": -5.200160026550293, "global_step": 18816, "epoch": 448} {"train_loss": -5.228518486022949, "global_step": 18817, "epoch": 448} {"train_loss": -5.222306251525879, "global_step": 18818, "epoch": 448} {"train_loss": -5.335502624511719, "global_step": 18819, "epoch": 448} {"train_loss": -5.214866638183594, "global_step": 18820, "epoch": 448} {"train_loss": -5.294402122497559, "global_step": 18821, "epoch": 448} {"train_loss": -5.415398597717285, "global_step": 18822, "epoch": 448} {"train_loss": -5.313093185424805, "global_step": 18823, "epoch": 448} {"train_loss": -5.2067155838012695, "global_step": 18824, "epoch": 448} {"train_loss": -5.295738220214844, "global_step": 18825, "epoch": 448} {"train_loss": -5.267635822296143, "global_step": 18826, "epoch": 448} {"train_loss": -5.253122329711914, "global_step": 18827, "epoch": 448} {"train_loss": -5.233585357666016, "global_step": 18828, "epoch": 448} {"train_loss": -5.234845161437988, "global_step": 18829, "epoch": 448} {"train_loss": -5.2155046463012695, "global_step": 18830, "epoch": 448} {"train_loss": -5.298292636871338, "global_step": 18831, "epoch": 448} {"train_loss": -5.214090347290039, "global_step": 18832, "epoch": 448} {"train_loss": -5.126556396484375, "global_step": 18833, "epoch": 448} {"train_loss": -5.470412254333496, "global_step": 18834, "epoch": 448} {"train_loss": -5.282436370849609, "global_step": 18835, "epoch": 448} {"train_loss": -5.283746719360352, "global_step": 18836, "epoch": 448} {"train_loss": -5.340348720550537, "global_step": 18837, "epoch": 448} {"train_loss": -5.175047874450684, "global_step": 18838, "epoch": 448} {"train_loss": -5.205220699310303, "global_step": 18839, "epoch": 448} {"train_loss": -5.220517635345459, "global_step": 18840, "epoch": 448} {"train_loss": -5.32598876953125, "global_step": 18841, "epoch": 448} {"train_loss": -5.398220062255859, "global_step": 18842, "epoch": 448} {"train_loss": -5.3194074630737305, "global_step": 18843, "epoch": 448} {"train_loss": -5.2788214683532715, "global_step": 18844, "epoch": 448} {"train_loss": -5.258257865905762, "global_step": 18845, "epoch": 448} {"train_loss": -5.21197509765625, "global_step": 18846, "epoch": 448} {"train_loss": -5.2544097900390625, "global_step": 18847, "epoch": 448} {"train_loss": -5.312200546264648, "global_step": 18848, "epoch": 448} {"train_loss": -5.216536521911621, "global_step": 18849, "epoch": 448} {"train_loss": -5.314666748046875, "global_step": 18850, "epoch": 448} {"train_loss": -5.189114570617676, "global_step": 18851, "epoch": 448} {"train_loss": -5.273594379425049, "global_step": 18852, "epoch": 448} {"train_loss": -5.211871147155762, "global_step": 18853, "epoch": 448} {"train_loss": -5.230403900146484, "global_step": 18854, "epoch": 448} {"train_loss": -5.319668769836426, "global_step": 18855, "epoch": 448} {"train_loss": -5.322871208190918, "global_step": 18856, "epoch": 448} {"train_loss": -5.264222621917725, "global_step": 18857, "epoch": 448, "val_loss": 76966.6796875} {"train_loss": -5.248598098754883, "global_step": 18858, "epoch": 449} {"train_loss": -5.489668846130371, "global_step": 18859, "epoch": 449} {"train_loss": -5.255448341369629, "global_step": 18860, "epoch": 449} {"train_loss": -5.363768100738525, "global_step": 18861, "epoch": 449} {"train_loss": -5.316237449645996, "global_step": 18862, "epoch": 449} {"train_loss": -5.351076602935791, "global_step": 18863, "epoch": 449} {"train_loss": -5.449812889099121, "global_step": 18864, "epoch": 449} {"train_loss": -5.249684810638428, "global_step": 18865, "epoch": 449} {"train_loss": -5.387315273284912, "global_step": 18866, "epoch": 449} {"train_loss": -5.219817638397217, "global_step": 18867, "epoch": 449} {"train_loss": -5.104258060455322, "global_step": 18868, "epoch": 449} {"train_loss": -5.2626190185546875, "global_step": 18869, "epoch": 449} {"train_loss": -5.223072052001953, "global_step": 18870, "epoch": 449} {"train_loss": -5.223060607910156, "global_step": 18871, "epoch": 449} {"train_loss": -5.258498191833496, "global_step": 18872, "epoch": 449} {"train_loss": -5.209930419921875, "global_step": 18873, "epoch": 449} {"train_loss": -5.245704650878906, "global_step": 18874, "epoch": 449} {"train_loss": -5.275968551635742, "global_step": 18875, "epoch": 449} {"train_loss": -5.253915786743164, "global_step": 18876, "epoch": 449} {"train_loss": -5.212116718292236, "global_step": 18877, "epoch": 449} {"train_loss": -5.291146755218506, "global_step": 18878, "epoch": 449} {"train_loss": -5.119634628295898, "global_step": 18879, "epoch": 449} {"train_loss": -5.268918037414551, "global_step": 18880, "epoch": 449} {"train_loss": -5.382606506347656, "global_step": 18881, "epoch": 449} {"train_loss": -5.242256164550781, "global_step": 18882, "epoch": 449} {"train_loss": -5.26310920715332, "global_step": 18883, "epoch": 449} {"train_loss": -5.361682891845703, "global_step": 18884, "epoch": 449} {"train_loss": -5.287941932678223, "global_step": 18885, "epoch": 449} {"train_loss": -5.317752361297607, "global_step": 18886, "epoch": 449} {"train_loss": -5.203817844390869, "global_step": 18887, "epoch": 449} {"train_loss": -5.195932865142822, "global_step": 18888, "epoch": 449} {"train_loss": -5.337874889373779, "global_step": 18889, "epoch": 449} {"train_loss": -5.24346399307251, "global_step": 18890, "epoch": 449} {"train_loss": -5.337607383728027, "global_step": 18891, "epoch": 449} {"train_loss": -5.138310432434082, "global_step": 18892, "epoch": 449} {"train_loss": -5.2551774978637695, "global_step": 18893, "epoch": 449} {"train_loss": -5.299718856811523, "global_step": 18894, "epoch": 449} {"train_loss": -5.275514602661133, "global_step": 18895, "epoch": 449} {"train_loss": -5.314896583557129, "global_step": 18896, "epoch": 449} {"train_loss": -5.2749505043029785, "global_step": 18897, "epoch": 449} {"train_loss": -5.261935234069824, "global_step": 18898, "epoch": 449} {"train_loss": -5.274659701756069, "global_step": 18899, "epoch": 449, "val_loss": 78084.953125} {"train_loss": -5.242433547973633, "global_step": 18900, "epoch": 450} {"train_loss": -5.3841552734375, "global_step": 18901, "epoch": 450} {"train_loss": -5.312581539154053, "global_step": 18902, "epoch": 450} {"train_loss": -5.269453048706055, "global_step": 18903, "epoch": 450} {"train_loss": -5.388260841369629, "global_step": 18904, "epoch": 450} {"train_loss": -5.330680847167969, "global_step": 18905, "epoch": 450} {"train_loss": -5.346199035644531, "global_step": 18906, "epoch": 450} {"train_loss": -5.260926246643066, "global_step": 18907, "epoch": 450} {"train_loss": -5.161799907684326, "global_step": 18908, "epoch": 450} {"train_loss": -5.285277366638184, "global_step": 18909, "epoch": 450} {"train_loss": -5.240028381347656, "global_step": 18910, "epoch": 450} {"train_loss": -5.230820655822754, "global_step": 18911, "epoch": 450} {"train_loss": -5.322342872619629, "global_step": 18912, "epoch": 450} {"train_loss": -5.402111053466797, "global_step": 18913, "epoch": 450} {"train_loss": -5.308337211608887, "global_step": 18914, "epoch": 450} {"train_loss": -5.190857410430908, "global_step": 18915, "epoch": 450} {"train_loss": -5.168097496032715, "global_step": 18916, "epoch": 450} {"train_loss": -5.348555564880371, "global_step": 18917, "epoch": 450} {"train_loss": -5.153327941894531, "global_step": 18918, "epoch": 450} {"train_loss": -5.2336578369140625, "global_step": 18919, "epoch": 450} {"train_loss": -5.3784894943237305, "global_step": 18920, "epoch": 450} {"train_loss": -5.237479209899902, "global_step": 18921, "epoch": 450} {"train_loss": -5.384514808654785, "global_step": 18922, "epoch": 450} {"train_loss": -5.17120361328125, "global_step": 18923, "epoch": 450} {"train_loss": -5.2210235595703125, "global_step": 18924, "epoch": 450} {"train_loss": -5.343071937561035, "global_step": 18925, "epoch": 450} {"train_loss": -5.202756881713867, "global_step": 18926, "epoch": 450} {"train_loss": -5.2688446044921875, "global_step": 18927, "epoch": 450} {"train_loss": -5.415924549102783, "global_step": 18928, "epoch": 450} {"train_loss": -5.319149017333984, "global_step": 18929, "epoch": 450} {"train_loss": -5.28887939453125, "global_step": 18930, "epoch": 450} {"train_loss": -5.378653049468994, "global_step": 18931, "epoch": 450} {"train_loss": -5.367686748504639, "global_step": 18932, "epoch": 450} {"train_loss": -5.352657794952393, "global_step": 18933, "epoch": 450} {"train_loss": -5.138448715209961, "global_step": 18934, "epoch": 450} {"train_loss": -5.195931434631348, "global_step": 18935, "epoch": 450} {"train_loss": -5.191205024719238, "global_step": 18936, "epoch": 450} {"train_loss": -5.240190505981445, "global_step": 18937, "epoch": 450} {"train_loss": -5.2788801193237305, "global_step": 18938, "epoch": 450} {"train_loss": -5.20001220703125, "global_step": 18939, "epoch": 450} {"train_loss": -5.284003257751465, "global_step": 18940, "epoch": 450} {"train_loss": -5.279877424240112, "global_step": 18941, "epoch": 450, "train/sim_max_reward_0": 0.2843567187766178, "train/sim_max_reward_1": 0.1562568212211859, "train/sim_max_reward_2": 0.5645767723232075, "train/sim_max_reward_3": 0.16923852512674972, "train/sim_max_reward_4": 0.3638214303153523, "train/sim_max_reward_5": 0.5551095672567117, "test/sim_max_reward_4500000": 0.7088564437349774, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.160049812360806, "test/sim_max_reward_4500005": 0.1679019526983328, "test/sim_max_reward_4500006": 0.38649024340088023, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.04450914194831958, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.3974939928306241, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.9192658355674054, "test/sim_max_reward_4500015": 0.08031408504575692, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.15102933445603067, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.44346346897472777, "test/sim_max_reward_4500022": 0.6618005861009488, "test/sim_max_reward_4500023": 0.7325807330342629, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.34453704945637276, "test/sim_max_reward_4500026": 0.11521756486129969, "test/sim_max_reward_4500027": 0.5668792809970107, "test/sim_max_reward_4500028": 0.4349166980267949, "test/sim_max_reward_4500029": 0.060864551517243896, "test/sim_max_reward_4500030": 0.5842424565440543, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.29886526660635, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.2280074508052495, "test/sim_max_reward_4500035": 0.46284911973535947, "test/sim_max_reward_4500036": 0.35455763727555273, "test/sim_max_reward_4500037": 0.4404501490060284, "test/sim_max_reward_4500038": 0.36657744107437273, "test/sim_max_reward_4500039": 0.767165112650508, "test/sim_max_reward_4500040": 0.1544940542150255, "test/sim_max_reward_4500041": 0.0, "test/sim_max_reward_4500042": 0.006176609952930741, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.1340557845055027, "test/sim_max_reward_4500045": 0.1175735103924684, "test/sim_max_reward_4500046": 0.060011891639559764, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.0605495794694939, "train/mean_score": 0.34889330583663747, "test/mean_score": 0.21652698147494875, "val_loss": 75809.6015625} {"train_loss": -5.3186750411987305, "global_step": 18942, "epoch": 451} {"train_loss": -5.3661370277404785, "global_step": 18943, "epoch": 451} {"train_loss": -5.182541847229004, "global_step": 18944, "epoch": 451} {"train_loss": -5.187382221221924, "global_step": 18945, "epoch": 451} {"train_loss": -5.276559352874756, "global_step": 18946, "epoch": 451} {"train_loss": -5.306149005889893, "global_step": 18947, "epoch": 451} {"train_loss": -5.152139186859131, "global_step": 18948, "epoch": 451} {"train_loss": -5.341306686401367, "global_step": 18949, "epoch": 451} {"train_loss": -5.200201034545898, "global_step": 18950, "epoch": 451} {"train_loss": -5.251407623291016, "global_step": 18951, "epoch": 451} {"train_loss": -5.327190399169922, "global_step": 18952, "epoch": 451} {"train_loss": -5.333065986633301, "global_step": 18953, "epoch": 451} {"train_loss": -5.331164360046387, "global_step": 18954, "epoch": 451} {"train_loss": -5.217316150665283, "global_step": 18955, "epoch": 451} {"train_loss": -5.331890106201172, "global_step": 18956, "epoch": 451} {"train_loss": -5.26743221282959, "global_step": 18957, "epoch": 451} {"train_loss": -5.242581367492676, "global_step": 18958, "epoch": 451} {"train_loss": -5.230655670166016, "global_step": 18959, "epoch": 451} {"train_loss": -5.207420825958252, "global_step": 18960, "epoch": 451} {"train_loss": -5.261478424072266, "global_step": 18961, "epoch": 451} {"train_loss": -5.2686896324157715, "global_step": 18962, "epoch": 451} {"train_loss": -5.343986511230469, "global_step": 18963, "epoch": 451} {"train_loss": -5.303473949432373, "global_step": 18964, "epoch": 451} {"train_loss": -5.217365741729736, "global_step": 18965, "epoch": 451} {"train_loss": -5.384417533874512, "global_step": 18966, "epoch": 451} {"train_loss": -5.166194915771484, "global_step": 18967, "epoch": 451} {"train_loss": -5.268934726715088, "global_step": 18968, "epoch": 451} {"train_loss": -5.187837600708008, "global_step": 18969, "epoch": 451} {"train_loss": -5.298783302307129, "global_step": 18970, "epoch": 451} {"train_loss": -5.318005084991455, "global_step": 18971, "epoch": 451} {"train_loss": -5.274958610534668, "global_step": 18972, "epoch": 451} {"train_loss": -5.331795692443848, "global_step": 18973, "epoch": 451} {"train_loss": -5.256208419799805, "global_step": 18974, "epoch": 451} {"train_loss": -5.218311309814453, "global_step": 18975, "epoch": 451} {"train_loss": -5.215688705444336, "global_step": 18976, "epoch": 451} {"train_loss": -5.332121849060059, "global_step": 18977, "epoch": 451} {"train_loss": -5.315887451171875, "global_step": 18978, "epoch": 451} {"train_loss": -5.19972038269043, "global_step": 18979, "epoch": 451} {"train_loss": -5.372274398803711, "global_step": 18980, "epoch": 451} {"train_loss": -5.199103355407715, "global_step": 18981, "epoch": 451} {"train_loss": -5.266772270202637, "global_step": 18982, "epoch": 451} {"train_loss": -5.268853687104725, "global_step": 18983, "epoch": 451, "val_loss": 76306.84375} {"train_loss": -5.29063081741333, "global_step": 18984, "epoch": 452} {"train_loss": -5.402484893798828, "global_step": 18985, "epoch": 452} {"train_loss": -5.349326133728027, "global_step": 18986, "epoch": 452} {"train_loss": -5.307808876037598, "global_step": 18987, "epoch": 452} {"train_loss": -5.262905120849609, "global_step": 18988, "epoch": 452} {"train_loss": -5.2437357902526855, "global_step": 18989, "epoch": 452} {"train_loss": -5.27039098739624, "global_step": 18990, "epoch": 452} {"train_loss": -5.298673152923584, "global_step": 18991, "epoch": 452} {"train_loss": -5.276103973388672, "global_step": 18992, "epoch": 452} {"train_loss": -5.3663506507873535, "global_step": 18993, "epoch": 452} {"train_loss": -5.145040035247803, "global_step": 18994, "epoch": 452} {"train_loss": -5.304347038269043, "global_step": 18995, "epoch": 452} {"train_loss": -5.355579376220703, "global_step": 18996, "epoch": 452} {"train_loss": -5.0689377784729, "global_step": 18997, "epoch": 452} {"train_loss": -5.175017356872559, "global_step": 18998, "epoch": 452} {"train_loss": -5.2962846755981445, "global_step": 18999, "epoch": 452} {"train_loss": -5.243792533874512, "global_step": 19000, "epoch": 452} {"train_loss": -5.276032447814941, "global_step": 19001, "epoch": 452} {"train_loss": -5.4162492752075195, "global_step": 19002, "epoch": 452} {"train_loss": -5.170464515686035, "global_step": 19003, "epoch": 452} {"train_loss": -5.224996566772461, "global_step": 19004, "epoch": 452} {"train_loss": -5.283422470092773, "global_step": 19005, "epoch": 452} {"train_loss": -5.132686614990234, "global_step": 19006, "epoch": 452} {"train_loss": -5.25486946105957, "global_step": 19007, "epoch": 452} {"train_loss": -5.149989128112793, "global_step": 19008, "epoch": 452} {"train_loss": -5.213306427001953, "global_step": 19009, "epoch": 452} {"train_loss": -5.283891677856445, "global_step": 19010, "epoch": 452} {"train_loss": -5.297089576721191, "global_step": 19011, "epoch": 452} {"train_loss": -5.361353874206543, "global_step": 19012, "epoch": 452} {"train_loss": -5.326339244842529, "global_step": 19013, "epoch": 452} {"train_loss": -5.279053688049316, "global_step": 19014, "epoch": 452} {"train_loss": -5.142796993255615, "global_step": 19015, "epoch": 452} {"train_loss": -5.254414081573486, "global_step": 19016, "epoch": 452} {"train_loss": -5.347871780395508, "global_step": 19017, "epoch": 452} {"train_loss": -5.265316009521484, "global_step": 19018, "epoch": 452} {"train_loss": -5.249752998352051, "global_step": 19019, "epoch": 452} {"train_loss": -5.1672234535217285, "global_step": 19020, "epoch": 452} {"train_loss": -5.313840389251709, "global_step": 19021, "epoch": 452} {"train_loss": -5.182819843292236, "global_step": 19022, "epoch": 452} {"train_loss": -5.243038177490234, "global_step": 19023, "epoch": 452} {"train_loss": -5.253765106201172, "global_step": 19024, "epoch": 452} {"train_loss": -5.263335409618559, "global_step": 19025, "epoch": 452, "val_loss": 77069.6640625} {"train_loss": -5.2275710105896, "global_step": 19026, "epoch": 453} {"train_loss": -5.270373344421387, "global_step": 19027, "epoch": 453} {"train_loss": -5.343601703643799, "global_step": 19028, "epoch": 453} {"train_loss": -5.357584476470947, "global_step": 19029, "epoch": 453} {"train_loss": -5.24403715133667, "global_step": 19030, "epoch": 453} {"train_loss": -5.17055606842041, "global_step": 19031, "epoch": 453} {"train_loss": -5.307836532592773, "global_step": 19032, "epoch": 453} {"train_loss": -5.144185543060303, "global_step": 19033, "epoch": 453} {"train_loss": -5.219026565551758, "global_step": 19034, "epoch": 453} {"train_loss": -5.421048164367676, "global_step": 19035, "epoch": 453} {"train_loss": -5.206578254699707, "global_step": 19036, "epoch": 453} {"train_loss": -5.140279769897461, "global_step": 19037, "epoch": 453} {"train_loss": -5.440700531005859, "global_step": 19038, "epoch": 453} {"train_loss": -5.075607776641846, "global_step": 19039, "epoch": 453} {"train_loss": -5.021080493927002, "global_step": 19040, "epoch": 453} {"train_loss": -4.997972011566162, "global_step": 19041, "epoch": 453} {"train_loss": -5.0690388679504395, "global_step": 19042, "epoch": 453} {"train_loss": -4.752941131591797, "global_step": 19043, "epoch": 453} {"train_loss": -5.211640357971191, "global_step": 19044, "epoch": 453} {"train_loss": -5.188499450683594, "global_step": 19045, "epoch": 453} {"train_loss": -5.059191703796387, "global_step": 19046, "epoch": 453} {"train_loss": -5.099091529846191, "global_step": 19047, "epoch": 453} {"train_loss": -5.247642993927002, "global_step": 19048, "epoch": 453} {"train_loss": -5.121912956237793, "global_step": 19049, "epoch": 453} {"train_loss": -5.188359260559082, "global_step": 19050, "epoch": 453} {"train_loss": -5.16301965713501, "global_step": 19051, "epoch": 453} {"train_loss": -5.220452308654785, "global_step": 19052, "epoch": 453} {"train_loss": -5.240795135498047, "global_step": 19053, "epoch": 453} {"train_loss": -5.263123035430908, "global_step": 19054, "epoch": 453} {"train_loss": -5.092672348022461, "global_step": 19055, "epoch": 453} {"train_loss": -5.205440044403076, "global_step": 19056, "epoch": 453} {"train_loss": -5.346687316894531, "global_step": 19057, "epoch": 453} {"train_loss": -5.1087164878845215, "global_step": 19058, "epoch": 453} {"train_loss": -5.223759651184082, "global_step": 19059, "epoch": 453} {"train_loss": -5.165252685546875, "global_step": 19060, "epoch": 453} {"train_loss": -5.263458728790283, "global_step": 19061, "epoch": 453} {"train_loss": -5.222658157348633, "global_step": 19062, "epoch": 453} {"train_loss": -5.329584121704102, "global_step": 19063, "epoch": 453} {"train_loss": -5.170253753662109, "global_step": 19064, "epoch": 453} {"train_loss": -5.243491172790527, "global_step": 19065, "epoch": 453} {"train_loss": -5.214970588684082, "global_step": 19066, "epoch": 453} {"train_loss": -5.197579383850098, "global_step": 19067, "epoch": 453, "val_loss": 76620.7578125} {"train_loss": -5.247374534606934, "global_step": 19068, "epoch": 454} {"train_loss": -5.280691623687744, "global_step": 19069, "epoch": 454} {"train_loss": -5.177840232849121, "global_step": 19070, "epoch": 454} {"train_loss": -5.389369487762451, "global_step": 19071, "epoch": 454} {"train_loss": -5.25076961517334, "global_step": 19072, "epoch": 454} {"train_loss": -5.286561965942383, "global_step": 19073, "epoch": 454} {"train_loss": -5.201481342315674, "global_step": 19074, "epoch": 454} {"train_loss": -5.242728233337402, "global_step": 19075, "epoch": 454} {"train_loss": -5.351174354553223, "global_step": 19076, "epoch": 454} {"train_loss": -5.2943949699401855, "global_step": 19077, "epoch": 454} {"train_loss": -5.316889762878418, "global_step": 19078, "epoch": 454} {"train_loss": -5.2928466796875, "global_step": 19079, "epoch": 454} {"train_loss": -5.4194536209106445, "global_step": 19080, "epoch": 454} {"train_loss": -5.2956223487854, "global_step": 19081, "epoch": 454} {"train_loss": -5.2419514656066895, "global_step": 19082, "epoch": 454} {"train_loss": -5.259901523590088, "global_step": 19083, "epoch": 454} {"train_loss": -5.43635368347168, "global_step": 19084, "epoch": 454} {"train_loss": -5.264002799987793, "global_step": 19085, "epoch": 454} {"train_loss": -5.339612007141113, "global_step": 19086, "epoch": 454} {"train_loss": -5.447183609008789, "global_step": 19087, "epoch": 454} {"train_loss": -5.230734348297119, "global_step": 19088, "epoch": 454} {"train_loss": -5.407243251800537, "global_step": 19089, "epoch": 454} {"train_loss": -5.164490699768066, "global_step": 19090, "epoch": 454} {"train_loss": -5.401758193969727, "global_step": 19091, "epoch": 454} {"train_loss": -5.252414226531982, "global_step": 19092, "epoch": 454} {"train_loss": -5.089879989624023, "global_step": 19093, "epoch": 454} {"train_loss": -5.310846328735352, "global_step": 19094, "epoch": 454} {"train_loss": -5.329809188842773, "global_step": 19095, "epoch": 454} {"train_loss": -5.232847213745117, "global_step": 19096, "epoch": 454} {"train_loss": -5.092398643493652, "global_step": 19097, "epoch": 454} {"train_loss": -5.227287292480469, "global_step": 19098, "epoch": 454} {"train_loss": -5.150655746459961, "global_step": 19099, "epoch": 454} {"train_loss": -5.065240383148193, "global_step": 19100, "epoch": 454} {"train_loss": -5.171792030334473, "global_step": 19101, "epoch": 454} {"train_loss": -5.2169952392578125, "global_step": 19102, "epoch": 454} {"train_loss": -5.193569660186768, "global_step": 19103, "epoch": 454} {"train_loss": -5.28110933303833, "global_step": 19104, "epoch": 454} {"train_loss": -5.167121887207031, "global_step": 19105, "epoch": 454} {"train_loss": -5.276439189910889, "global_step": 19106, "epoch": 454} {"train_loss": -5.333843231201172, "global_step": 19107, "epoch": 454} {"train_loss": -5.072706699371338, "global_step": 19108, "epoch": 454} {"train_loss": -5.2630313123975485, "global_step": 19109, "epoch": 454, "val_loss": 76729.2890625} {"train_loss": -5.355751991271973, "global_step": 19110, "epoch": 455} {"train_loss": -5.145228862762451, "global_step": 19111, "epoch": 455} {"train_loss": -5.213644027709961, "global_step": 19112, "epoch": 455} {"train_loss": -5.123412132263184, "global_step": 19113, "epoch": 455} {"train_loss": -5.2639265060424805, "global_step": 19114, "epoch": 455} {"train_loss": -5.014761924743652, "global_step": 19115, "epoch": 455} {"train_loss": -5.30229377746582, "global_step": 19116, "epoch": 455} {"train_loss": -5.068078994750977, "global_step": 19117, "epoch": 455} {"train_loss": -5.18961238861084, "global_step": 19118, "epoch": 455} {"train_loss": -5.280328750610352, "global_step": 19119, "epoch": 455} {"train_loss": -5.315009117126465, "global_step": 19120, "epoch": 455} {"train_loss": -5.336267948150635, "global_step": 19121, "epoch": 455} {"train_loss": -5.288661003112793, "global_step": 19122, "epoch": 455} {"train_loss": -5.209538459777832, "global_step": 19123, "epoch": 455} {"train_loss": -5.124853134155273, "global_step": 19124, "epoch": 455} {"train_loss": -5.328739643096924, "global_step": 19125, "epoch": 455} {"train_loss": -5.238498210906982, "global_step": 19126, "epoch": 455} {"train_loss": -5.230931758880615, "global_step": 19127, "epoch": 455} {"train_loss": -5.150187015533447, "global_step": 19128, "epoch": 455} {"train_loss": -5.213761329650879, "global_step": 19129, "epoch": 455} {"train_loss": -5.302663326263428, "global_step": 19130, "epoch": 455} {"train_loss": -5.344781875610352, "global_step": 19131, "epoch": 455} {"train_loss": -5.203726768493652, "global_step": 19132, "epoch": 455} {"train_loss": -5.30594539642334, "global_step": 19133, "epoch": 455} {"train_loss": -5.232076168060303, "global_step": 19134, "epoch": 455} {"train_loss": -5.143048286437988, "global_step": 19135, "epoch": 455} {"train_loss": -5.366098403930664, "global_step": 19136, "epoch": 455} {"train_loss": -5.286123275756836, "global_step": 19137, "epoch": 455} {"train_loss": -5.152121543884277, "global_step": 19138, "epoch": 455} {"train_loss": -5.28774881362915, "global_step": 19139, "epoch": 455} {"train_loss": -5.331536293029785, "global_step": 19140, "epoch": 455} {"train_loss": -5.283890724182129, "global_step": 19141, "epoch": 455} {"train_loss": -5.372427463531494, "global_step": 19142, "epoch": 455} {"train_loss": -5.314239025115967, "global_step": 19143, "epoch": 455} {"train_loss": -5.187914848327637, "global_step": 19144, "epoch": 455} {"train_loss": -5.332397937774658, "global_step": 19145, "epoch": 455} {"train_loss": -5.296117782592773, "global_step": 19146, "epoch": 455} {"train_loss": -5.295929908752441, "global_step": 19147, "epoch": 455} {"train_loss": -5.403446197509766, "global_step": 19148, "epoch": 455} {"train_loss": -5.349747657775879, "global_step": 19149, "epoch": 455} {"train_loss": -5.237276077270508, "global_step": 19150, "epoch": 455} {"train_loss": -5.253280060631888, "global_step": 19151, "epoch": 455, "val_loss": 76202.2265625} {"train_loss": -5.3372321128845215, "global_step": 19152, "epoch": 456} {"train_loss": -5.319359302520752, "global_step": 19153, "epoch": 456} {"train_loss": -5.235532760620117, "global_step": 19154, "epoch": 456} {"train_loss": -5.28529167175293, "global_step": 19155, "epoch": 456} {"train_loss": -5.085448265075684, "global_step": 19156, "epoch": 456} {"train_loss": -5.271417617797852, "global_step": 19157, "epoch": 456} {"train_loss": -5.06949520111084, "global_step": 19158, "epoch": 456} {"train_loss": -5.344526767730713, "global_step": 19159, "epoch": 456} {"train_loss": -5.1087422370910645, "global_step": 19160, "epoch": 456} {"train_loss": -5.18447208404541, "global_step": 19161, "epoch": 456} {"train_loss": -5.252127647399902, "global_step": 19162, "epoch": 456} {"train_loss": -5.345304012298584, "global_step": 19163, "epoch": 456} {"train_loss": -5.149510383605957, "global_step": 19164, "epoch": 456} {"train_loss": -5.069657325744629, "global_step": 19165, "epoch": 456} {"train_loss": -5.317388534545898, "global_step": 19166, "epoch": 456} {"train_loss": -5.076601028442383, "global_step": 19167, "epoch": 456} {"train_loss": -5.241918563842773, "global_step": 19168, "epoch": 456} {"train_loss": -5.160211563110352, "global_step": 19169, "epoch": 456} {"train_loss": -5.294551849365234, "global_step": 19170, "epoch": 456} {"train_loss": -5.135953426361084, "global_step": 19171, "epoch": 456} {"train_loss": -5.3068037033081055, "global_step": 19172, "epoch": 456} {"train_loss": -5.284080505371094, "global_step": 19173, "epoch": 456} {"train_loss": -5.293773174285889, "global_step": 19174, "epoch": 456} {"train_loss": -5.264143943786621, "global_step": 19175, "epoch": 456} {"train_loss": -5.244863510131836, "global_step": 19176, "epoch": 456} {"train_loss": -5.265679359436035, "global_step": 19177, "epoch": 456} {"train_loss": -5.283048629760742, "global_step": 19178, "epoch": 456} {"train_loss": -5.248394012451172, "global_step": 19179, "epoch": 456} {"train_loss": -5.244435787200928, "global_step": 19180, "epoch": 456} {"train_loss": -5.283343315124512, "global_step": 19181, "epoch": 456} {"train_loss": -5.419966697692871, "global_step": 19182, "epoch": 456} {"train_loss": -5.27097225189209, "global_step": 19183, "epoch": 456} {"train_loss": -5.413823127746582, "global_step": 19184, "epoch": 456} {"train_loss": -5.270177841186523, "global_step": 19185, "epoch": 456} {"train_loss": -5.268638610839844, "global_step": 19186, "epoch": 456} {"train_loss": -5.363441467285156, "global_step": 19187, "epoch": 456} {"train_loss": -5.318046569824219, "global_step": 19188, "epoch": 456} {"train_loss": -5.274582862854004, "global_step": 19189, "epoch": 456} {"train_loss": -5.356245994567871, "global_step": 19190, "epoch": 456} {"train_loss": -5.250922203063965, "global_step": 19191, "epoch": 456} {"train_loss": -5.385088920593262, "global_step": 19192, "epoch": 456} {"train_loss": -5.258649167560396, "global_step": 19193, "epoch": 456, "val_loss": 76931.28125} {"train_loss": -5.359790802001953, "global_step": 19194, "epoch": 457} {"train_loss": -5.218153953552246, "global_step": 19195, "epoch": 457} {"train_loss": -5.349938869476318, "global_step": 19196, "epoch": 457} {"train_loss": -5.339239120483398, "global_step": 19197, "epoch": 457} {"train_loss": -5.298543453216553, "global_step": 19198, "epoch": 457} {"train_loss": -5.235032558441162, "global_step": 19199, "epoch": 457} {"train_loss": -5.280981063842773, "global_step": 19200, "epoch": 457} {"train_loss": -5.307897090911865, "global_step": 19201, "epoch": 457} {"train_loss": -5.236352920532227, "global_step": 19202, "epoch": 457} {"train_loss": -5.200894832611084, "global_step": 19203, "epoch": 457} {"train_loss": -5.115002632141113, "global_step": 19204, "epoch": 457} {"train_loss": -5.372108459472656, "global_step": 19205, "epoch": 457} {"train_loss": -5.506462097167969, "global_step": 19206, "epoch": 457} {"train_loss": -5.184704780578613, "global_step": 19207, "epoch": 457} {"train_loss": -5.1606950759887695, "global_step": 19208, "epoch": 457} {"train_loss": -5.31455135345459, "global_step": 19209, "epoch": 457} {"train_loss": -5.2144927978515625, "global_step": 19210, "epoch": 457} {"train_loss": -5.271757125854492, "global_step": 19211, "epoch": 457} {"train_loss": -5.40178918838501, "global_step": 19212, "epoch": 457} {"train_loss": -5.20009183883667, "global_step": 19213, "epoch": 457} {"train_loss": -5.2158026695251465, "global_step": 19214, "epoch": 457} {"train_loss": -5.211611270904541, "global_step": 19215, "epoch": 457} {"train_loss": -5.153273582458496, "global_step": 19216, "epoch": 457} {"train_loss": -5.13980770111084, "global_step": 19217, "epoch": 457} {"train_loss": -5.171017646789551, "global_step": 19218, "epoch": 457} {"train_loss": -5.201955795288086, "global_step": 19219, "epoch": 457} {"train_loss": -5.377166748046875, "global_step": 19220, "epoch": 457} {"train_loss": -5.305675983428955, "global_step": 19221, "epoch": 457} {"train_loss": -5.32094144821167, "global_step": 19222, "epoch": 457} {"train_loss": -5.209049224853516, "global_step": 19223, "epoch": 457} {"train_loss": -5.2556023597717285, "global_step": 19224, "epoch": 457} {"train_loss": -5.2057905197143555, "global_step": 19225, "epoch": 457} {"train_loss": -5.219151973724365, "global_step": 19226, "epoch": 457} {"train_loss": -5.2713727951049805, "global_step": 19227, "epoch": 457} {"train_loss": -5.199649333953857, "global_step": 19228, "epoch": 457} {"train_loss": -5.255494117736816, "global_step": 19229, "epoch": 457} {"train_loss": -5.405381679534912, "global_step": 19230, "epoch": 457} {"train_loss": -5.360954284667969, "global_step": 19231, "epoch": 457} {"train_loss": -5.4268646240234375, "global_step": 19232, "epoch": 457} {"train_loss": -5.124876976013184, "global_step": 19233, "epoch": 457} {"train_loss": -5.255660533905029, "global_step": 19234, "epoch": 457} {"train_loss": -5.265473377136957, "global_step": 19235, "epoch": 457, "val_loss": 76702.78125} {"train_loss": -5.168759346008301, "global_step": 19236, "epoch": 458} {"train_loss": -5.252340793609619, "global_step": 19237, "epoch": 458} {"train_loss": -5.161725997924805, "global_step": 19238, "epoch": 458} {"train_loss": -5.126847267150879, "global_step": 19239, "epoch": 458} {"train_loss": -5.170726776123047, "global_step": 19240, "epoch": 458} {"train_loss": -5.191722869873047, "global_step": 19241, "epoch": 458} {"train_loss": -5.199281692504883, "global_step": 19242, "epoch": 458} {"train_loss": -5.425276756286621, "global_step": 19243, "epoch": 458} {"train_loss": -5.243967056274414, "global_step": 19244, "epoch": 458} {"train_loss": -5.1900634765625, "global_step": 19245, "epoch": 458} {"train_loss": -5.1215057373046875, "global_step": 19246, "epoch": 458} {"train_loss": -5.096316337585449, "global_step": 19247, "epoch": 458} {"train_loss": -5.213212490081787, "global_step": 19248, "epoch": 458} {"train_loss": -5.203945159912109, "global_step": 19249, "epoch": 458} {"train_loss": -5.14716911315918, "global_step": 19250, "epoch": 458} {"train_loss": -5.168325424194336, "global_step": 19251, "epoch": 458} {"train_loss": -5.125622749328613, "global_step": 19252, "epoch": 458} {"train_loss": -5.369879245758057, "global_step": 19253, "epoch": 458} {"train_loss": -5.115215301513672, "global_step": 19254, "epoch": 458} {"train_loss": -5.3114094734191895, "global_step": 19255, "epoch": 458} {"train_loss": -5.18964958190918, "global_step": 19256, "epoch": 458} {"train_loss": -5.373802185058594, "global_step": 19257, "epoch": 458} {"train_loss": -5.288653373718262, "global_step": 19258, "epoch": 458} {"train_loss": -5.343131065368652, "global_step": 19259, "epoch": 458} {"train_loss": -5.366645812988281, "global_step": 19260, "epoch": 458} {"train_loss": -5.230040073394775, "global_step": 19261, "epoch": 458} {"train_loss": -5.216381072998047, "global_step": 19262, "epoch": 458} {"train_loss": -5.248237133026123, "global_step": 19263, "epoch": 458} {"train_loss": -5.115926742553711, "global_step": 19264, "epoch": 458} {"train_loss": -5.274693489074707, "global_step": 19265, "epoch": 458} {"train_loss": -5.281383991241455, "global_step": 19266, "epoch": 458} {"train_loss": -5.2749924659729, "global_step": 19267, "epoch": 458} {"train_loss": -5.265917778015137, "global_step": 19268, "epoch": 458} {"train_loss": -5.365030288696289, "global_step": 19269, "epoch": 458} {"train_loss": -5.279303550720215, "global_step": 19270, "epoch": 458} {"train_loss": -5.339250564575195, "global_step": 19271, "epoch": 458} {"train_loss": -5.358031272888184, "global_step": 19272, "epoch": 458} {"train_loss": -5.332649230957031, "global_step": 19273, "epoch": 458} {"train_loss": -5.210121154785156, "global_step": 19274, "epoch": 458} {"train_loss": -5.280644416809082, "global_step": 19275, "epoch": 458} {"train_loss": -5.353641510009766, "global_step": 19276, "epoch": 458} {"train_loss": -5.24600997425261, "global_step": 19277, "epoch": 458, "val_loss": 76775.3203125} {"train_loss": -5.208678245544434, "global_step": 19278, "epoch": 459} {"train_loss": -5.300387382507324, "global_step": 19279, "epoch": 459} {"train_loss": -5.276682376861572, "global_step": 19280, "epoch": 459} {"train_loss": -5.2279276847839355, "global_step": 19281, "epoch": 459} {"train_loss": -5.22873067855835, "global_step": 19282, "epoch": 459} {"train_loss": -5.3437604904174805, "global_step": 19283, "epoch": 459} {"train_loss": -5.318021297454834, "global_step": 19284, "epoch": 459} {"train_loss": -5.067080497741699, "global_step": 19285, "epoch": 459} {"train_loss": -5.354499816894531, "global_step": 19286, "epoch": 459} {"train_loss": -5.50653076171875, "global_step": 19287, "epoch": 459} {"train_loss": -5.417365074157715, "global_step": 19288, "epoch": 459} {"train_loss": -5.282789707183838, "global_step": 19289, "epoch": 459} {"train_loss": -5.172399520874023, "global_step": 19290, "epoch": 459} {"train_loss": -5.372767925262451, "global_step": 19291, "epoch": 459} {"train_loss": -5.069406509399414, "global_step": 19292, "epoch": 459} {"train_loss": -5.2292046546936035, "global_step": 19293, "epoch": 459} {"train_loss": -5.237331867218018, "global_step": 19294, "epoch": 459} {"train_loss": -5.208166599273682, "global_step": 19295, "epoch": 459} {"train_loss": -5.245666027069092, "global_step": 19296, "epoch": 459} {"train_loss": -5.276157379150391, "global_step": 19297, "epoch": 459} {"train_loss": -5.255547523498535, "global_step": 19298, "epoch": 459} {"train_loss": -5.187278747558594, "global_step": 19299, "epoch": 459} {"train_loss": -5.27827262878418, "global_step": 19300, "epoch": 459} {"train_loss": -5.198942184448242, "global_step": 19301, "epoch": 459} {"train_loss": -5.311191558837891, "global_step": 19302, "epoch": 459} {"train_loss": -5.264693260192871, "global_step": 19303, "epoch": 459} {"train_loss": -5.041201114654541, "global_step": 19304, "epoch": 459} {"train_loss": -5.265798568725586, "global_step": 19305, "epoch": 459} {"train_loss": -5.268521785736084, "global_step": 19306, "epoch": 459} {"train_loss": -5.172675132751465, "global_step": 19307, "epoch": 459} {"train_loss": -5.2619781494140625, "global_step": 19308, "epoch": 459} {"train_loss": -5.253977298736572, "global_step": 19309, "epoch": 459} {"train_loss": -5.297233581542969, "global_step": 19310, "epoch": 459} {"train_loss": -5.306121826171875, "global_step": 19311, "epoch": 459} {"train_loss": -5.245814323425293, "global_step": 19312, "epoch": 459} {"train_loss": -5.332807540893555, "global_step": 19313, "epoch": 459} {"train_loss": -5.2056660652160645, "global_step": 19314, "epoch": 459} {"train_loss": -5.182221412658691, "global_step": 19315, "epoch": 459} {"train_loss": -5.221622467041016, "global_step": 19316, "epoch": 459} {"train_loss": -5.2741312980651855, "global_step": 19317, "epoch": 459} {"train_loss": -5.438745498657227, "global_step": 19318, "epoch": 459} {"train_loss": -5.256960414704823, "global_step": 19319, "epoch": 459, "val_loss": 76783.765625} {"train_loss": -5.306209564208984, "global_step": 19320, "epoch": 460} {"train_loss": -5.293839931488037, "global_step": 19321, "epoch": 460} {"train_loss": -5.1769022941589355, "global_step": 19322, "epoch": 460} {"train_loss": -5.209429740905762, "global_step": 19323, "epoch": 460} {"train_loss": -5.11259651184082, "global_step": 19324, "epoch": 460} {"train_loss": -5.215121746063232, "global_step": 19325, "epoch": 460} {"train_loss": -5.383141040802002, "global_step": 19326, "epoch": 460} {"train_loss": -5.240747451782227, "global_step": 19327, "epoch": 460} {"train_loss": -5.304169178009033, "global_step": 19328, "epoch": 460} {"train_loss": -5.400387763977051, "global_step": 19329, "epoch": 460} {"train_loss": -5.270511627197266, "global_step": 19330, "epoch": 460} {"train_loss": -5.344634532928467, "global_step": 19331, "epoch": 460} {"train_loss": -5.327129364013672, "global_step": 19332, "epoch": 460} {"train_loss": -5.298672676086426, "global_step": 19333, "epoch": 460} {"train_loss": -5.272083282470703, "global_step": 19334, "epoch": 460} {"train_loss": -5.316618919372559, "global_step": 19335, "epoch": 460} {"train_loss": -5.176715850830078, "global_step": 19336, "epoch": 460} {"train_loss": -5.130630970001221, "global_step": 19337, "epoch": 460} {"train_loss": -5.3540754318237305, "global_step": 19338, "epoch": 460} {"train_loss": -5.353560447692871, "global_step": 19339, "epoch": 460} {"train_loss": -5.308210372924805, "global_step": 19340, "epoch": 460} {"train_loss": -5.21351432800293, "global_step": 19341, "epoch": 460} {"train_loss": -5.216366767883301, "global_step": 19342, "epoch": 460} {"train_loss": -5.321051597595215, "global_step": 19343, "epoch": 460} {"train_loss": -5.36830997467041, "global_step": 19344, "epoch": 460} {"train_loss": -5.327469348907471, "global_step": 19345, "epoch": 460} {"train_loss": -5.217166900634766, "global_step": 19346, "epoch": 460} {"train_loss": -5.3263444900512695, "global_step": 19347, "epoch": 460} {"train_loss": -5.283712387084961, "global_step": 19348, "epoch": 460} {"train_loss": -5.14773416519165, "global_step": 19349, "epoch": 460} {"train_loss": -5.176506996154785, "global_step": 19350, "epoch": 460} {"train_loss": -5.249701499938965, "global_step": 19351, "epoch": 460} {"train_loss": -5.2380051612854, "global_step": 19352, "epoch": 460} {"train_loss": -5.237390041351318, "global_step": 19353, "epoch": 460} {"train_loss": -5.288360595703125, "global_step": 19354, "epoch": 460} {"train_loss": -5.172917366027832, "global_step": 19355, "epoch": 460} {"train_loss": -5.395602226257324, "global_step": 19356, "epoch": 460} {"train_loss": -5.238089561462402, "global_step": 19357, "epoch": 460} {"train_loss": -5.323773384094238, "global_step": 19358, "epoch": 460} {"train_loss": -5.331332683563232, "global_step": 19359, "epoch": 460} {"train_loss": -5.219851970672607, "global_step": 19360, "epoch": 460} {"train_loss": -5.268469708306449, "global_step": 19361, "epoch": 460, "val_loss": 76429.0} {"train_loss": -5.252394676208496, "global_step": 19362, "epoch": 461} {"train_loss": -5.270941734313965, "global_step": 19363, "epoch": 461} {"train_loss": -5.317168712615967, "global_step": 19364, "epoch": 461} {"train_loss": -5.264925003051758, "global_step": 19365, "epoch": 461} {"train_loss": -5.189950942993164, "global_step": 19366, "epoch": 461} {"train_loss": -5.251412391662598, "global_step": 19367, "epoch": 461} {"train_loss": -5.219138145446777, "global_step": 19368, "epoch": 461} {"train_loss": -5.285643577575684, "global_step": 19369, "epoch": 461} {"train_loss": -5.30605411529541, "global_step": 19370, "epoch": 461} {"train_loss": -5.134671211242676, "global_step": 19371, "epoch": 461} {"train_loss": -5.291223526000977, "global_step": 19372, "epoch": 461} {"train_loss": -5.10146427154541, "global_step": 19373, "epoch": 461} {"train_loss": -5.104673385620117, "global_step": 19374, "epoch": 461} {"train_loss": -5.341907024383545, "global_step": 19375, "epoch": 461} {"train_loss": -5.0686140060424805, "global_step": 19376, "epoch": 461} {"train_loss": -5.251185894012451, "global_step": 19377, "epoch": 461} {"train_loss": -5.054811477661133, "global_step": 19378, "epoch": 461} {"train_loss": -5.1088690757751465, "global_step": 19379, "epoch": 461} {"train_loss": -5.269461631774902, "global_step": 19380, "epoch": 461} {"train_loss": -5.073763847351074, "global_step": 19381, "epoch": 461} {"train_loss": -5.1653289794921875, "global_step": 19382, "epoch": 461} {"train_loss": -5.171885013580322, "global_step": 19383, "epoch": 461} {"train_loss": -5.023099899291992, "global_step": 19384, "epoch": 461} {"train_loss": -5.313959121704102, "global_step": 19385, "epoch": 461} {"train_loss": -5.035305976867676, "global_step": 19386, "epoch": 461} {"train_loss": -5.241583824157715, "global_step": 19387, "epoch": 461} {"train_loss": -5.164187431335449, "global_step": 19388, "epoch": 461} {"train_loss": -5.147686958312988, "global_step": 19389, "epoch": 461} {"train_loss": -5.323406219482422, "global_step": 19390, "epoch": 461} {"train_loss": -5.088369369506836, "global_step": 19391, "epoch": 461} {"train_loss": -5.218225002288818, "global_step": 19392, "epoch": 461} {"train_loss": -5.182216167449951, "global_step": 19393, "epoch": 461} {"train_loss": -5.347446918487549, "global_step": 19394, "epoch": 461} {"train_loss": -5.2795634269714355, "global_step": 19395, "epoch": 461} {"train_loss": -5.251254558563232, "global_step": 19396, "epoch": 461} {"train_loss": -5.292039394378662, "global_step": 19397, "epoch": 461} {"train_loss": -5.345501899719238, "global_step": 19398, "epoch": 461} {"train_loss": -5.3528361320495605, "global_step": 19399, "epoch": 461} {"train_loss": -5.214966773986816, "global_step": 19400, "epoch": 461} {"train_loss": -5.266716003417969, "global_step": 19401, "epoch": 461} {"train_loss": -5.18594217300415, "global_step": 19402, "epoch": 461} {"train_loss": -5.218148924055553, "global_step": 19403, "epoch": 461, "val_loss": 76328.671875} {"train_loss": -5.158751964569092, "global_step": 19404, "epoch": 462} {"train_loss": -5.430394172668457, "global_step": 19405, "epoch": 462} {"train_loss": -5.168676376342773, "global_step": 19406, "epoch": 462} {"train_loss": -5.334268569946289, "global_step": 19407, "epoch": 462} {"train_loss": -5.314273834228516, "global_step": 19408, "epoch": 462} {"train_loss": -5.230997085571289, "global_step": 19409, "epoch": 462} {"train_loss": -5.315652370452881, "global_step": 19410, "epoch": 462} {"train_loss": -5.29721736907959, "global_step": 19411, "epoch": 462} {"train_loss": -5.211785793304443, "global_step": 19412, "epoch": 462} {"train_loss": -5.256072044372559, "global_step": 19413, "epoch": 462} {"train_loss": -5.322238922119141, "global_step": 19414, "epoch": 462} {"train_loss": -5.355447292327881, "global_step": 19415, "epoch": 462} {"train_loss": -5.384531021118164, "global_step": 19416, "epoch": 462} {"train_loss": -5.207773685455322, "global_step": 19417, "epoch": 462} {"train_loss": -5.411308765411377, "global_step": 19418, "epoch": 462} {"train_loss": -5.322972297668457, "global_step": 19419, "epoch": 462} {"train_loss": -5.375152587890625, "global_step": 19420, "epoch": 462} {"train_loss": -5.195730686187744, "global_step": 19421, "epoch": 462} {"train_loss": -5.211536407470703, "global_step": 19422, "epoch": 462} {"train_loss": -5.3170881271362305, "global_step": 19423, "epoch": 462} {"train_loss": -5.142611026763916, "global_step": 19424, "epoch": 462} {"train_loss": -5.167780876159668, "global_step": 19425, "epoch": 462} {"train_loss": -5.392005920410156, "global_step": 19426, "epoch": 462} {"train_loss": -5.30226993560791, "global_step": 19427, "epoch": 462} {"train_loss": -5.38299036026001, "global_step": 19428, "epoch": 462} {"train_loss": -5.251188278198242, "global_step": 19429, "epoch": 462} {"train_loss": -5.216494083404541, "global_step": 19430, "epoch": 462} {"train_loss": -5.339236736297607, "global_step": 19431, "epoch": 462} {"train_loss": -5.3382368087768555, "global_step": 19432, "epoch": 462} {"train_loss": -5.409496784210205, "global_step": 19433, "epoch": 462} {"train_loss": -5.228435516357422, "global_step": 19434, "epoch": 462} {"train_loss": -5.3437113761901855, "global_step": 19435, "epoch": 462} {"train_loss": -5.2164506912231445, "global_step": 19436, "epoch": 462} {"train_loss": -5.25506591796875, "global_step": 19437, "epoch": 462} {"train_loss": -5.32023811340332, "global_step": 19438, "epoch": 462} {"train_loss": -5.054813385009766, "global_step": 19439, "epoch": 462} {"train_loss": -5.381361484527588, "global_step": 19440, "epoch": 462} {"train_loss": -5.313126564025879, "global_step": 19441, "epoch": 462} {"train_loss": -5.074239730834961, "global_step": 19442, "epoch": 462} {"train_loss": -5.215496063232422, "global_step": 19443, "epoch": 462} {"train_loss": -5.380947113037109, "global_step": 19444, "epoch": 462} {"train_loss": -5.277941942214966, "global_step": 19445, "epoch": 462, "val_loss": 75814.4453125} {"train_loss": -5.300698280334473, "global_step": 19446, "epoch": 463} {"train_loss": -5.291311264038086, "global_step": 19447, "epoch": 463} {"train_loss": -5.106100559234619, "global_step": 19448, "epoch": 463} {"train_loss": -5.357141494750977, "global_step": 19449, "epoch": 463} {"train_loss": -5.131049156188965, "global_step": 19450, "epoch": 463} {"train_loss": -5.378556251525879, "global_step": 19451, "epoch": 463} {"train_loss": -5.235246658325195, "global_step": 19452, "epoch": 463} {"train_loss": -5.204217910766602, "global_step": 19453, "epoch": 463} {"train_loss": -5.269805908203125, "global_step": 19454, "epoch": 463} {"train_loss": -5.160355091094971, "global_step": 19455, "epoch": 463} {"train_loss": -5.272525787353516, "global_step": 19456, "epoch": 463} {"train_loss": -5.206859588623047, "global_step": 19457, "epoch": 463} {"train_loss": -5.0789875984191895, "global_step": 19458, "epoch": 463} {"train_loss": -5.135488033294678, "global_step": 19459, "epoch": 463} {"train_loss": -5.010561943054199, "global_step": 19460, "epoch": 463} {"train_loss": -5.220816135406494, "global_step": 19461, "epoch": 463} {"train_loss": -5.149815559387207, "global_step": 19462, "epoch": 463} {"train_loss": -5.2057695388793945, "global_step": 19463, "epoch": 463} {"train_loss": -5.126270294189453, "global_step": 19464, "epoch": 463} {"train_loss": -5.29434871673584, "global_step": 19465, "epoch": 463} {"train_loss": -5.201274871826172, "global_step": 19466, "epoch": 463} {"train_loss": -5.07638692855835, "global_step": 19467, "epoch": 463} {"train_loss": -5.116522312164307, "global_step": 19468, "epoch": 463} {"train_loss": -5.299405097961426, "global_step": 19469, "epoch": 463} {"train_loss": -5.145783424377441, "global_step": 19470, "epoch": 463} {"train_loss": -5.305464744567871, "global_step": 19471, "epoch": 463} {"train_loss": -5.2024407386779785, "global_step": 19472, "epoch": 463} {"train_loss": -5.153175354003906, "global_step": 19473, "epoch": 463} {"train_loss": -5.249715805053711, "global_step": 19474, "epoch": 463} {"train_loss": -5.357522010803223, "global_step": 19475, "epoch": 463} {"train_loss": -5.200839042663574, "global_step": 19476, "epoch": 463} {"train_loss": -5.290639400482178, "global_step": 19477, "epoch": 463} {"train_loss": -5.2748003005981445, "global_step": 19478, "epoch": 463} {"train_loss": -5.094012260437012, "global_step": 19479, "epoch": 463} {"train_loss": -5.364787578582764, "global_step": 19480, "epoch": 463} {"train_loss": -5.191244125366211, "global_step": 19481, "epoch": 463} {"train_loss": -5.300759315490723, "global_step": 19482, "epoch": 463} {"train_loss": -5.1947784423828125, "global_step": 19483, "epoch": 463} {"train_loss": -5.196597099304199, "global_step": 19484, "epoch": 463} {"train_loss": -5.34261417388916, "global_step": 19485, "epoch": 463} {"train_loss": -5.244427680969238, "global_step": 19486, "epoch": 463} {"train_loss": -5.221317155020578, "global_step": 19487, "epoch": 463, "val_loss": 76828.390625} {"train_loss": -5.161140441894531, "global_step": 19488, "epoch": 464} {"train_loss": -5.344537258148193, "global_step": 19489, "epoch": 464} {"train_loss": -5.183834075927734, "global_step": 19490, "epoch": 464} {"train_loss": -5.2282514572143555, "global_step": 19491, "epoch": 464} {"train_loss": -5.278214454650879, "global_step": 19492, "epoch": 464} {"train_loss": -5.23490571975708, "global_step": 19493, "epoch": 464} {"train_loss": -5.1691436767578125, "global_step": 19494, "epoch": 464} {"train_loss": -5.299136161804199, "global_step": 19495, "epoch": 464} {"train_loss": -5.210799217224121, "global_step": 19496, "epoch": 464} {"train_loss": -5.275095462799072, "global_step": 19497, "epoch": 464} {"train_loss": -5.271693229675293, "global_step": 19498, "epoch": 464} {"train_loss": -5.237146854400635, "global_step": 19499, "epoch": 464} {"train_loss": -5.401915550231934, "global_step": 19500, "epoch": 464} {"train_loss": -5.225476264953613, "global_step": 19501, "epoch": 464} {"train_loss": -5.1801252365112305, "global_step": 19502, "epoch": 464} {"train_loss": -5.173157691955566, "global_step": 19503, "epoch": 464} {"train_loss": -5.403266906738281, "global_step": 19504, "epoch": 464} {"train_loss": -5.309833526611328, "global_step": 19505, "epoch": 464} {"train_loss": -5.288924694061279, "global_step": 19506, "epoch": 464} {"train_loss": -5.240522861480713, "global_step": 19507, "epoch": 464} {"train_loss": -5.156408309936523, "global_step": 19508, "epoch": 464} {"train_loss": -5.370655059814453, "global_step": 19509, "epoch": 464} {"train_loss": -5.327040672302246, "global_step": 19510, "epoch": 464} {"train_loss": -5.2915544509887695, "global_step": 19511, "epoch": 464} {"train_loss": -5.32399845123291, "global_step": 19512, "epoch": 464} {"train_loss": -5.249748229980469, "global_step": 19513, "epoch": 464} {"train_loss": -5.327785491943359, "global_step": 19514, "epoch": 464} {"train_loss": -5.321472644805908, "global_step": 19515, "epoch": 464} {"train_loss": -5.378849983215332, "global_step": 19516, "epoch": 464} {"train_loss": -5.3282599449157715, "global_step": 19517, "epoch": 464} {"train_loss": -5.295424461364746, "global_step": 19518, "epoch": 464} {"train_loss": -5.408803462982178, "global_step": 19519, "epoch": 464} {"train_loss": -5.453944683074951, "global_step": 19520, "epoch": 464} {"train_loss": -5.170453071594238, "global_step": 19521, "epoch": 464} {"train_loss": -5.267754554748535, "global_step": 19522, "epoch": 464} {"train_loss": -5.258331775665283, "global_step": 19523, "epoch": 464} {"train_loss": -5.148571014404297, "global_step": 19524, "epoch": 464} {"train_loss": -5.232357025146484, "global_step": 19525, "epoch": 464} {"train_loss": -5.384312629699707, "global_step": 19526, "epoch": 464} {"train_loss": -5.198516845703125, "global_step": 19527, "epoch": 464} {"train_loss": -5.321261405944824, "global_step": 19528, "epoch": 464} {"train_loss": -5.279135102317447, "global_step": 19529, "epoch": 464, "val_loss": 76039.0078125} {"train_loss": -5.306436538696289, "global_step": 19530, "epoch": 465} {"train_loss": -5.18495512008667, "global_step": 19531, "epoch": 465} {"train_loss": -5.336517810821533, "global_step": 19532, "epoch": 465} {"train_loss": -5.065798759460449, "global_step": 19533, "epoch": 465} {"train_loss": -5.267330169677734, "global_step": 19534, "epoch": 465} {"train_loss": -5.289186954498291, "global_step": 19535, "epoch": 465} {"train_loss": -5.317295551300049, "global_step": 19536, "epoch": 465} {"train_loss": -5.322476387023926, "global_step": 19537, "epoch": 465} {"train_loss": -5.373748302459717, "global_step": 19538, "epoch": 465} {"train_loss": -5.24863862991333, "global_step": 19539, "epoch": 465} {"train_loss": -5.257060527801514, "global_step": 19540, "epoch": 465} {"train_loss": -5.4289045333862305, "global_step": 19541, "epoch": 465} {"train_loss": -5.3391242027282715, "global_step": 19542, "epoch": 465} {"train_loss": -5.287307262420654, "global_step": 19543, "epoch": 465} {"train_loss": -5.245334625244141, "global_step": 19544, "epoch": 465} {"train_loss": -5.17136287689209, "global_step": 19545, "epoch": 465} {"train_loss": -5.3090620040893555, "global_step": 19546, "epoch": 465} {"train_loss": -5.188621997833252, "global_step": 19547, "epoch": 465} {"train_loss": -5.315860748291016, "global_step": 19548, "epoch": 465} {"train_loss": -5.256723403930664, "global_step": 19549, "epoch": 465} {"train_loss": -5.348746299743652, "global_step": 19550, "epoch": 465} {"train_loss": -5.235387802124023, "global_step": 19551, "epoch": 465} {"train_loss": -5.31845760345459, "global_step": 19552, "epoch": 465} {"train_loss": -5.385354995727539, "global_step": 19553, "epoch": 465} {"train_loss": -5.385955810546875, "global_step": 19554, "epoch": 465} {"train_loss": -5.181623935699463, "global_step": 19555, "epoch": 465} {"train_loss": -5.359826564788818, "global_step": 19556, "epoch": 465} {"train_loss": -5.328585147857666, "global_step": 19557, "epoch": 465} {"train_loss": -5.218466758728027, "global_step": 19558, "epoch": 465} {"train_loss": -5.205218315124512, "global_step": 19559, "epoch": 465} {"train_loss": -5.16813850402832, "global_step": 19560, "epoch": 465} {"train_loss": -5.232410430908203, "global_step": 19561, "epoch": 465} {"train_loss": -5.353518486022949, "global_step": 19562, "epoch": 465} {"train_loss": -5.227800369262695, "global_step": 19563, "epoch": 465} {"train_loss": -5.213642597198486, "global_step": 19564, "epoch": 465} {"train_loss": -5.243821620941162, "global_step": 19565, "epoch": 465} {"train_loss": -5.34273624420166, "global_step": 19566, "epoch": 465} {"train_loss": -5.169637203216553, "global_step": 19567, "epoch": 465} {"train_loss": -5.175004005432129, "global_step": 19568, "epoch": 465} {"train_loss": -5.304471969604492, "global_step": 19569, "epoch": 465} {"train_loss": -5.068005084991455, "global_step": 19570, "epoch": 465} {"train_loss": -5.266834542864845, "global_step": 19571, "epoch": 465, "val_loss": 77048.40625} {"train_loss": -5.235511779785156, "global_step": 19572, "epoch": 466} {"train_loss": -5.228213310241699, "global_step": 19573, "epoch": 466} {"train_loss": -5.187858581542969, "global_step": 19574, "epoch": 466} {"train_loss": -5.206014156341553, "global_step": 19575, "epoch": 466} {"train_loss": -5.152652740478516, "global_step": 19576, "epoch": 466} {"train_loss": -5.237964630126953, "global_step": 19577, "epoch": 466} {"train_loss": -5.224733352661133, "global_step": 19578, "epoch": 466} {"train_loss": -5.278507232666016, "global_step": 19579, "epoch": 466} {"train_loss": -5.19075345993042, "global_step": 19580, "epoch": 466} {"train_loss": -5.21626091003418, "global_step": 19581, "epoch": 466} {"train_loss": -5.344405651092529, "global_step": 19582, "epoch": 466} {"train_loss": -5.275529861450195, "global_step": 19583, "epoch": 466} {"train_loss": -5.217559814453125, "global_step": 19584, "epoch": 466} {"train_loss": -5.355600833892822, "global_step": 19585, "epoch": 466} {"train_loss": -5.344277381896973, "global_step": 19586, "epoch": 466} {"train_loss": -5.29107666015625, "global_step": 19587, "epoch": 466} {"train_loss": -5.293422698974609, "global_step": 19588, "epoch": 466} {"train_loss": -5.136731147766113, "global_step": 19589, "epoch": 466} {"train_loss": -5.350922584533691, "global_step": 19590, "epoch": 466} {"train_loss": -5.209449768066406, "global_step": 19591, "epoch": 466} {"train_loss": -5.276297092437744, "global_step": 19592, "epoch": 466} {"train_loss": -5.352349758148193, "global_step": 19593, "epoch": 466} {"train_loss": -5.095677375793457, "global_step": 19594, "epoch": 466} {"train_loss": -5.30523681640625, "global_step": 19595, "epoch": 466} {"train_loss": -5.273397445678711, "global_step": 19596, "epoch": 466} {"train_loss": -5.185126781463623, "global_step": 19597, "epoch": 466} {"train_loss": -5.271413803100586, "global_step": 19598, "epoch": 466} {"train_loss": -5.3255815505981445, "global_step": 19599, "epoch": 466} {"train_loss": -5.339168548583984, "global_step": 19600, "epoch": 466} {"train_loss": -5.337821960449219, "global_step": 19601, "epoch": 466} {"train_loss": -5.20198917388916, "global_step": 19602, "epoch": 466} {"train_loss": -5.432101249694824, "global_step": 19603, "epoch": 466} {"train_loss": -5.28270959854126, "global_step": 19604, "epoch": 466} {"train_loss": -5.194255352020264, "global_step": 19605, "epoch": 466} {"train_loss": -5.18233585357666, "global_step": 19606, "epoch": 466} {"train_loss": -5.211816310882568, "global_step": 19607, "epoch": 466} {"train_loss": -5.363870620727539, "global_step": 19608, "epoch": 466} {"train_loss": -5.2585930824279785, "global_step": 19609, "epoch": 466} {"train_loss": -5.227805137634277, "global_step": 19610, "epoch": 466} {"train_loss": -5.163127422332764, "global_step": 19611, "epoch": 466} {"train_loss": -5.12750244140625, "global_step": 19612, "epoch": 466} {"train_loss": -5.252246663683937, "global_step": 19613, "epoch": 466, "val_loss": 75846.8671875} {"train_loss": -5.254709720611572, "global_step": 19614, "epoch": 467} {"train_loss": -5.206297874450684, "global_step": 19615, "epoch": 467} {"train_loss": -5.1576313972473145, "global_step": 19616, "epoch": 467} {"train_loss": -5.382599830627441, "global_step": 19617, "epoch": 467} {"train_loss": -5.284360408782959, "global_step": 19618, "epoch": 467} {"train_loss": -5.420408248901367, "global_step": 19619, "epoch": 467} {"train_loss": -5.243466854095459, "global_step": 19620, "epoch": 467} {"train_loss": -5.346776485443115, "global_step": 19621, "epoch": 467} {"train_loss": -5.330200672149658, "global_step": 19622, "epoch": 467} {"train_loss": -5.3357086181640625, "global_step": 19623, "epoch": 467} {"train_loss": -5.321515083312988, "global_step": 19624, "epoch": 467} {"train_loss": -5.202473163604736, "global_step": 19625, "epoch": 467} {"train_loss": -5.199684143066406, "global_step": 19626, "epoch": 467} {"train_loss": -5.368274688720703, "global_step": 19627, "epoch": 467} {"train_loss": -5.36442756652832, "global_step": 19628, "epoch": 467} {"train_loss": -5.268733978271484, "global_step": 19629, "epoch": 467} {"train_loss": -5.361259460449219, "global_step": 19630, "epoch": 467} {"train_loss": -5.116948127746582, "global_step": 19631, "epoch": 467} {"train_loss": -5.283590316772461, "global_step": 19632, "epoch": 467} {"train_loss": -5.285238265991211, "global_step": 19633, "epoch": 467} {"train_loss": -5.1094160079956055, "global_step": 19634, "epoch": 467} {"train_loss": -5.236589431762695, "global_step": 19635, "epoch": 467} {"train_loss": -5.288849830627441, "global_step": 19636, "epoch": 467} {"train_loss": -5.196905136108398, "global_step": 19637, "epoch": 467} {"train_loss": -5.273617744445801, "global_step": 19638, "epoch": 467} {"train_loss": -5.158469200134277, "global_step": 19639, "epoch": 467} {"train_loss": -5.4249491691589355, "global_step": 19640, "epoch": 467} {"train_loss": -5.337589740753174, "global_step": 19641, "epoch": 467} {"train_loss": -5.381361961364746, "global_step": 19642, "epoch": 467} {"train_loss": -5.296645641326904, "global_step": 19643, "epoch": 467} {"train_loss": -5.250218391418457, "global_step": 19644, "epoch": 467} {"train_loss": -5.246917724609375, "global_step": 19645, "epoch": 467} {"train_loss": -5.354043960571289, "global_step": 19646, "epoch": 467} {"train_loss": -5.232935905456543, "global_step": 19647, "epoch": 467} {"train_loss": -5.287437438964844, "global_step": 19648, "epoch": 467} {"train_loss": -5.269862651824951, "global_step": 19649, "epoch": 467} {"train_loss": -5.296714782714844, "global_step": 19650, "epoch": 467} {"train_loss": -5.200079917907715, "global_step": 19651, "epoch": 467} {"train_loss": -5.108938694000244, "global_step": 19652, "epoch": 467} {"train_loss": -5.183938026428223, "global_step": 19653, "epoch": 467} {"train_loss": -5.30992317199707, "global_step": 19654, "epoch": 467} {"train_loss": -5.272218170620146, "global_step": 19655, "epoch": 467, "val_loss": 76752.7109375} {"train_loss": -5.2701520919799805, "global_step": 19656, "epoch": 468} {"train_loss": -5.318061828613281, "global_step": 19657, "epoch": 468} {"train_loss": -5.156215667724609, "global_step": 19658, "epoch": 468} {"train_loss": -5.271385669708252, "global_step": 19659, "epoch": 468} {"train_loss": -5.113309860229492, "global_step": 19660, "epoch": 468} {"train_loss": -5.155033111572266, "global_step": 19661, "epoch": 468} {"train_loss": -5.364816665649414, "global_step": 19662, "epoch": 468} {"train_loss": -5.112665176391602, "global_step": 19663, "epoch": 468} {"train_loss": -5.3490400314331055, "global_step": 19664, "epoch": 468} {"train_loss": -5.313452243804932, "global_step": 19665, "epoch": 468} {"train_loss": -5.30119514465332, "global_step": 19666, "epoch": 468} {"train_loss": -5.3260345458984375, "global_step": 19667, "epoch": 468} {"train_loss": -5.290879726409912, "global_step": 19668, "epoch": 468} {"train_loss": -5.30831241607666, "global_step": 19669, "epoch": 468} {"train_loss": -5.19582462310791, "global_step": 19670, "epoch": 468} {"train_loss": -5.339298248291016, "global_step": 19671, "epoch": 468} {"train_loss": -5.309431076049805, "global_step": 19672, "epoch": 468} {"train_loss": -5.371417045593262, "global_step": 19673, "epoch": 468} {"train_loss": -5.401534080505371, "global_step": 19674, "epoch": 468} {"train_loss": -5.311704635620117, "global_step": 19675, "epoch": 468} {"train_loss": -5.241083145141602, "global_step": 19676, "epoch": 468} {"train_loss": -5.263376712799072, "global_step": 19677, "epoch": 468} {"train_loss": -5.270937919616699, "global_step": 19678, "epoch": 468} {"train_loss": -5.226461410522461, "global_step": 19679, "epoch": 468} {"train_loss": -5.356094837188721, "global_step": 19680, "epoch": 468} {"train_loss": -5.279550552368164, "global_step": 19681, "epoch": 468} {"train_loss": -5.370429992675781, "global_step": 19682, "epoch": 468} {"train_loss": -5.15753173828125, "global_step": 19683, "epoch": 468} {"train_loss": -5.047496318817139, "global_step": 19684, "epoch": 468} {"train_loss": -5.337489128112793, "global_step": 19685, "epoch": 468} {"train_loss": -5.394325256347656, "global_step": 19686, "epoch": 468} {"train_loss": -5.277228355407715, "global_step": 19687, "epoch": 468} {"train_loss": -5.198522567749023, "global_step": 19688, "epoch": 468} {"train_loss": -5.30316686630249, "global_step": 19689, "epoch": 468} {"train_loss": -5.167230129241943, "global_step": 19690, "epoch": 468} {"train_loss": -5.412518501281738, "global_step": 19691, "epoch": 468} {"train_loss": -5.44677734375, "global_step": 19692, "epoch": 468} {"train_loss": -5.4177045822143555, "global_step": 19693, "epoch": 468} {"train_loss": -5.329410552978516, "global_step": 19694, "epoch": 468} {"train_loss": -5.358776092529297, "global_step": 19695, "epoch": 468} {"train_loss": -5.287311553955078, "global_step": 19696, "epoch": 468} {"train_loss": -5.286437897455125, "global_step": 19697, "epoch": 468, "val_loss": 76324.3046875} {"train_loss": -5.421860694885254, "global_step": 19698, "epoch": 469} {"train_loss": -5.302972793579102, "global_step": 19699, "epoch": 469} {"train_loss": -5.3499908447265625, "global_step": 19700, "epoch": 469} {"train_loss": -5.318441867828369, "global_step": 19701, "epoch": 469} {"train_loss": -5.3369598388671875, "global_step": 19702, "epoch": 469} {"train_loss": -5.452872276306152, "global_step": 19703, "epoch": 469} {"train_loss": -5.334562301635742, "global_step": 19704, "epoch": 469} {"train_loss": -5.258378505706787, "global_step": 19705, "epoch": 469} {"train_loss": -5.2799482345581055, "global_step": 19706, "epoch": 469} {"train_loss": -5.273775100708008, "global_step": 19707, "epoch": 469} {"train_loss": -5.304869651794434, "global_step": 19708, "epoch": 469} {"train_loss": -5.191283226013184, "global_step": 19709, "epoch": 469} {"train_loss": -5.299858093261719, "global_step": 19710, "epoch": 469} {"train_loss": -5.321885108947754, "global_step": 19711, "epoch": 469} {"train_loss": -5.228430271148682, "global_step": 19712, "epoch": 469} {"train_loss": -5.346438407897949, "global_step": 19713, "epoch": 469} {"train_loss": -5.231184959411621, "global_step": 19714, "epoch": 469} {"train_loss": -5.404356002807617, "global_step": 19715, "epoch": 469} {"train_loss": -5.379190444946289, "global_step": 19716, "epoch": 469} {"train_loss": -5.289822578430176, "global_step": 19717, "epoch": 469} {"train_loss": -5.35501766204834, "global_step": 19718, "epoch": 469} {"train_loss": -5.355982780456543, "global_step": 19719, "epoch": 469} {"train_loss": -5.233539581298828, "global_step": 19720, "epoch": 469} {"train_loss": -5.2387542724609375, "global_step": 19721, "epoch": 469} {"train_loss": -5.308977127075195, "global_step": 19722, "epoch": 469} {"train_loss": -5.293654441833496, "global_step": 19723, "epoch": 469} {"train_loss": -5.137326717376709, "global_step": 19724, "epoch": 469} {"train_loss": -5.3706955909729, "global_step": 19725, "epoch": 469} {"train_loss": -5.263188362121582, "global_step": 19726, "epoch": 469} {"train_loss": -5.201794147491455, "global_step": 19727, "epoch": 469} {"train_loss": -5.361532211303711, "global_step": 19728, "epoch": 469} {"train_loss": -5.327295303344727, "global_step": 19729, "epoch": 469} {"train_loss": -5.287073135375977, "global_step": 19730, "epoch": 469} {"train_loss": -5.280035018920898, "global_step": 19731, "epoch": 469} {"train_loss": -5.303179740905762, "global_step": 19732, "epoch": 469} {"train_loss": -5.2287187576293945, "global_step": 19733, "epoch": 469} {"train_loss": -5.21608304977417, "global_step": 19734, "epoch": 469} {"train_loss": -5.322035789489746, "global_step": 19735, "epoch": 469} {"train_loss": -5.334316253662109, "global_step": 19736, "epoch": 469} {"train_loss": -5.352686405181885, "global_step": 19737, "epoch": 469} {"train_loss": -5.28133487701416, "global_step": 19738, "epoch": 469} {"train_loss": -5.300956464949108, "global_step": 19739, "epoch": 469, "val_loss": 75995.1171875} {"train_loss": -5.337606430053711, "global_step": 19740, "epoch": 470} {"train_loss": -5.276401042938232, "global_step": 19741, "epoch": 470} {"train_loss": -5.255441665649414, "global_step": 19742, "epoch": 470} {"train_loss": -5.322072505950928, "global_step": 19743, "epoch": 470} {"train_loss": -5.3610100746154785, "global_step": 19744, "epoch": 470} {"train_loss": -5.285036087036133, "global_step": 19745, "epoch": 470} {"train_loss": -5.328383445739746, "global_step": 19746, "epoch": 470} {"train_loss": -5.218585014343262, "global_step": 19747, "epoch": 470} {"train_loss": -5.312859535217285, "global_step": 19748, "epoch": 470} {"train_loss": -5.17153263092041, "global_step": 19749, "epoch": 470} {"train_loss": -5.288800239562988, "global_step": 19750, "epoch": 470} {"train_loss": -5.219200611114502, "global_step": 19751, "epoch": 470} {"train_loss": -5.252533912658691, "global_step": 19752, "epoch": 470} {"train_loss": -5.346549987792969, "global_step": 19753, "epoch": 470} {"train_loss": -5.2741618156433105, "global_step": 19754, "epoch": 470} {"train_loss": -5.210657119750977, "global_step": 19755, "epoch": 470} {"train_loss": -5.322786331176758, "global_step": 19756, "epoch": 470} {"train_loss": -5.448069095611572, "global_step": 19757, "epoch": 470} {"train_loss": -5.381413459777832, "global_step": 19758, "epoch": 470} {"train_loss": -5.434425354003906, "global_step": 19759, "epoch": 470} {"train_loss": -5.236881256103516, "global_step": 19760, "epoch": 470} {"train_loss": -5.352946758270264, "global_step": 19761, "epoch": 470} {"train_loss": -5.177649974822998, "global_step": 19762, "epoch": 470} {"train_loss": -5.1680498123168945, "global_step": 19763, "epoch": 470} {"train_loss": -5.026852607727051, "global_step": 19764, "epoch": 470} {"train_loss": -5.299744129180908, "global_step": 19765, "epoch": 470} {"train_loss": -5.125474452972412, "global_step": 19766, "epoch": 470} {"train_loss": -5.244977951049805, "global_step": 19767, "epoch": 470} {"train_loss": -5.376906871795654, "global_step": 19768, "epoch": 470} {"train_loss": -5.224501609802246, "global_step": 19769, "epoch": 470} {"train_loss": -5.279577255249023, "global_step": 19770, "epoch": 470} {"train_loss": -5.348789215087891, "global_step": 19771, "epoch": 470} {"train_loss": -5.218803882598877, "global_step": 19772, "epoch": 470} {"train_loss": -5.2621636390686035, "global_step": 19773, "epoch": 470} {"train_loss": -5.293112754821777, "global_step": 19774, "epoch": 470} {"train_loss": -5.25078010559082, "global_step": 19775, "epoch": 470} {"train_loss": -5.237513542175293, "global_step": 19776, "epoch": 470} {"train_loss": -5.185988426208496, "global_step": 19777, "epoch": 470} {"train_loss": -5.260253429412842, "global_step": 19778, "epoch": 470} {"train_loss": -5.303643226623535, "global_step": 19779, "epoch": 470} {"train_loss": -5.224519729614258, "global_step": 19780, "epoch": 470} {"train_loss": -5.27293002037775, "global_step": 19781, "epoch": 470, "val_loss": 76155.046875} {"train_loss": -5.380932807922363, "global_step": 19782, "epoch": 471} {"train_loss": -5.181756019592285, "global_step": 19783, "epoch": 471} {"train_loss": -5.391300201416016, "global_step": 19784, "epoch": 471} {"train_loss": -5.3179121017456055, "global_step": 19785, "epoch": 471} {"train_loss": -5.105091571807861, "global_step": 19786, "epoch": 471} {"train_loss": -5.3584794998168945, "global_step": 19787, "epoch": 471} {"train_loss": -5.34996223449707, "global_step": 19788, "epoch": 471} {"train_loss": -5.051919460296631, "global_step": 19789, "epoch": 471} {"train_loss": -5.355912685394287, "global_step": 19790, "epoch": 471} {"train_loss": -5.209603309631348, "global_step": 19791, "epoch": 471} {"train_loss": -5.301653861999512, "global_step": 19792, "epoch": 471} {"train_loss": -5.415887832641602, "global_step": 19793, "epoch": 471} {"train_loss": -5.35386323928833, "global_step": 19794, "epoch": 471} {"train_loss": -5.118467330932617, "global_step": 19795, "epoch": 471} {"train_loss": -5.201016426086426, "global_step": 19796, "epoch": 471} {"train_loss": -5.2460222244262695, "global_step": 19797, "epoch": 471} {"train_loss": -5.285542011260986, "global_step": 19798, "epoch": 471} {"train_loss": -5.375400543212891, "global_step": 19799, "epoch": 471} {"train_loss": -5.316378593444824, "global_step": 19800, "epoch": 471} {"train_loss": -5.350011825561523, "global_step": 19801, "epoch": 471} {"train_loss": -5.361786842346191, "global_step": 19802, "epoch": 471} {"train_loss": -5.269263744354248, "global_step": 19803, "epoch": 471} {"train_loss": -5.312292098999023, "global_step": 19804, "epoch": 471} {"train_loss": -5.234060287475586, "global_step": 19805, "epoch": 471} {"train_loss": -5.194238662719727, "global_step": 19806, "epoch": 471} {"train_loss": -5.33287239074707, "global_step": 19807, "epoch": 471} {"train_loss": -5.232935428619385, "global_step": 19808, "epoch": 471} {"train_loss": -5.257251739501953, "global_step": 19809, "epoch": 471} {"train_loss": -5.31746768951416, "global_step": 19810, "epoch": 471} {"train_loss": -5.331453323364258, "global_step": 19811, "epoch": 471} {"train_loss": -5.2764811515808105, "global_step": 19812, "epoch": 471} {"train_loss": -5.352384090423584, "global_step": 19813, "epoch": 471} {"train_loss": -5.188083648681641, "global_step": 19814, "epoch": 471} {"train_loss": -5.210414886474609, "global_step": 19815, "epoch": 471} {"train_loss": -5.3614501953125, "global_step": 19816, "epoch": 471} {"train_loss": -5.269039154052734, "global_step": 19817, "epoch": 471} {"train_loss": -5.419686794281006, "global_step": 19818, "epoch": 471} {"train_loss": -5.289793014526367, "global_step": 19819, "epoch": 471} {"train_loss": -5.504158973693848, "global_step": 19820, "epoch": 471} {"train_loss": -5.381889820098877, "global_step": 19821, "epoch": 471} {"train_loss": -5.250504493713379, "global_step": 19822, "epoch": 471} {"train_loss": -5.291700226919992, "global_step": 19823, "epoch": 471, "val_loss": 76178.515625} {"train_loss": -5.422066688537598, "global_step": 19824, "epoch": 472} {"train_loss": -5.307521820068359, "global_step": 19825, "epoch": 472} {"train_loss": -5.2321014404296875, "global_step": 19826, "epoch": 472} {"train_loss": -5.239804267883301, "global_step": 19827, "epoch": 472} {"train_loss": -5.306818962097168, "global_step": 19828, "epoch": 472} {"train_loss": -5.26969575881958, "global_step": 19829, "epoch": 472} {"train_loss": -5.32234525680542, "global_step": 19830, "epoch": 472} {"train_loss": -5.260995864868164, "global_step": 19831, "epoch": 472} {"train_loss": -5.22322940826416, "global_step": 19832, "epoch": 472} {"train_loss": -5.335255146026611, "global_step": 19833, "epoch": 472} {"train_loss": -5.3082356452941895, "global_step": 19834, "epoch": 472} {"train_loss": -5.366350173950195, "global_step": 19835, "epoch": 472} {"train_loss": -5.394237995147705, "global_step": 19836, "epoch": 472} {"train_loss": -5.199554443359375, "global_step": 19837, "epoch": 472} {"train_loss": -5.11268949508667, "global_step": 19838, "epoch": 472} {"train_loss": -5.4672465324401855, "global_step": 19839, "epoch": 472} {"train_loss": -5.208657264709473, "global_step": 19840, "epoch": 472} {"train_loss": -5.424017906188965, "global_step": 19841, "epoch": 472} {"train_loss": -5.334146499633789, "global_step": 19842, "epoch": 472} {"train_loss": -5.298865795135498, "global_step": 19843, "epoch": 472} {"train_loss": -5.308294296264648, "global_step": 19844, "epoch": 472} {"train_loss": -5.324987411499023, "global_step": 19845, "epoch": 472} {"train_loss": -5.222280502319336, "global_step": 19846, "epoch": 472} {"train_loss": -5.2707366943359375, "global_step": 19847, "epoch": 472} {"train_loss": -5.312901496887207, "global_step": 19848, "epoch": 472} {"train_loss": -5.2450151443481445, "global_step": 19849, "epoch": 472} {"train_loss": -5.3815693855285645, "global_step": 19850, "epoch": 472} {"train_loss": -5.370187759399414, "global_step": 19851, "epoch": 472} {"train_loss": -5.322083950042725, "global_step": 19852, "epoch": 472} {"train_loss": -5.39219856262207, "global_step": 19853, "epoch": 472} {"train_loss": -5.380368232727051, "global_step": 19854, "epoch": 472} {"train_loss": -5.180224895477295, "global_step": 19855, "epoch": 472} {"train_loss": -5.198823928833008, "global_step": 19856, "epoch": 472} {"train_loss": -5.352209091186523, "global_step": 19857, "epoch": 472} {"train_loss": -5.3065185546875, "global_step": 19858, "epoch": 472} {"train_loss": -5.181812286376953, "global_step": 19859, "epoch": 472} {"train_loss": -5.236244201660156, "global_step": 19860, "epoch": 472} {"train_loss": -5.262384414672852, "global_step": 19861, "epoch": 472} {"train_loss": -5.243309020996094, "global_step": 19862, "epoch": 472} {"train_loss": -5.078268051147461, "global_step": 19863, "epoch": 472} {"train_loss": -5.279317855834961, "global_step": 19864, "epoch": 472} {"train_loss": -5.290345566613333, "global_step": 19865, "epoch": 472, "val_loss": 77127.328125} {"train_loss": -5.122664928436279, "global_step": 19866, "epoch": 473} {"train_loss": -5.40949010848999, "global_step": 19867, "epoch": 473} {"train_loss": -5.369368076324463, "global_step": 19868, "epoch": 473} {"train_loss": -5.2398529052734375, "global_step": 19869, "epoch": 473} {"train_loss": -5.36774206161499, "global_step": 19870, "epoch": 473} {"train_loss": -5.168358325958252, "global_step": 19871, "epoch": 473} {"train_loss": -5.356599807739258, "global_step": 19872, "epoch": 473} {"train_loss": -5.176938533782959, "global_step": 19873, "epoch": 473} {"train_loss": -5.256863117218018, "global_step": 19874, "epoch": 473} {"train_loss": -5.397084712982178, "global_step": 19875, "epoch": 473} {"train_loss": -5.269579887390137, "global_step": 19876, "epoch": 473} {"train_loss": -5.256418228149414, "global_step": 19877, "epoch": 473} {"train_loss": -5.334161758422852, "global_step": 19878, "epoch": 473} {"train_loss": -5.192485809326172, "global_step": 19879, "epoch": 473} {"train_loss": -5.400022506713867, "global_step": 19880, "epoch": 473} {"train_loss": -5.300701141357422, "global_step": 19881, "epoch": 473} {"train_loss": -5.26706075668335, "global_step": 19882, "epoch": 473} {"train_loss": -5.224111080169678, "global_step": 19883, "epoch": 473} {"train_loss": -5.133604049682617, "global_step": 19884, "epoch": 473} {"train_loss": -5.262554168701172, "global_step": 19885, "epoch": 473} {"train_loss": -5.2505784034729, "global_step": 19886, "epoch": 473} {"train_loss": -5.3045806884765625, "global_step": 19887, "epoch": 473} {"train_loss": -5.2181243896484375, "global_step": 19888, "epoch": 473} {"train_loss": -5.2326178550720215, "global_step": 19889, "epoch": 473} {"train_loss": -5.3020243644714355, "global_step": 19890, "epoch": 473} {"train_loss": -5.379417419433594, "global_step": 19891, "epoch": 473} {"train_loss": -5.288647651672363, "global_step": 19892, "epoch": 473} {"train_loss": -5.291440010070801, "global_step": 19893, "epoch": 473} {"train_loss": -5.145831108093262, "global_step": 19894, "epoch": 473} {"train_loss": -5.224862098693848, "global_step": 19895, "epoch": 473} {"train_loss": -5.16349983215332, "global_step": 19896, "epoch": 473} {"train_loss": -5.139016628265381, "global_step": 19897, "epoch": 473} {"train_loss": -5.238814353942871, "global_step": 19898, "epoch": 473} {"train_loss": -5.30753755569458, "global_step": 19899, "epoch": 473} {"train_loss": -5.196182727813721, "global_step": 19900, "epoch": 473} {"train_loss": -5.143028259277344, "global_step": 19901, "epoch": 473} {"train_loss": -5.2939958572387695, "global_step": 19902, "epoch": 473} {"train_loss": -5.174264907836914, "global_step": 19903, "epoch": 473} {"train_loss": -5.160074710845947, "global_step": 19904, "epoch": 473} {"train_loss": -5.206068992614746, "global_step": 19905, "epoch": 473} {"train_loss": -5.264549255371094, "global_step": 19906, "epoch": 473} {"train_loss": -5.256676401410784, "global_step": 19907, "epoch": 473, "val_loss": 76247.875} {"train_loss": -5.291672229766846, "global_step": 19908, "epoch": 474} {"train_loss": -5.305781841278076, "global_step": 19909, "epoch": 474} {"train_loss": -5.211496353149414, "global_step": 19910, "epoch": 474} {"train_loss": -5.202351093292236, "global_step": 19911, "epoch": 474} {"train_loss": -5.220524787902832, "global_step": 19912, "epoch": 474} {"train_loss": -5.369402885437012, "global_step": 19913, "epoch": 474} {"train_loss": -5.244514465332031, "global_step": 19914, "epoch": 474} {"train_loss": -5.307547569274902, "global_step": 19915, "epoch": 474} {"train_loss": -5.239776611328125, "global_step": 19916, "epoch": 474} {"train_loss": -5.206390380859375, "global_step": 19917, "epoch": 474} {"train_loss": -5.257543563842773, "global_step": 19918, "epoch": 474} {"train_loss": -5.344015121459961, "global_step": 19919, "epoch": 474} {"train_loss": -5.300751209259033, "global_step": 19920, "epoch": 474} {"train_loss": -5.243569374084473, "global_step": 19921, "epoch": 474} {"train_loss": -5.382915496826172, "global_step": 19922, "epoch": 474} {"train_loss": -5.223188400268555, "global_step": 19923, "epoch": 474} {"train_loss": -5.295690536499023, "global_step": 19924, "epoch": 474} {"train_loss": -5.396860599517822, "global_step": 19925, "epoch": 474} {"train_loss": -5.246147155761719, "global_step": 19926, "epoch": 474} {"train_loss": -5.268139362335205, "global_step": 19927, "epoch": 474} {"train_loss": -5.22809362411499, "global_step": 19928, "epoch": 474} {"train_loss": -5.294269561767578, "global_step": 19929, "epoch": 474} {"train_loss": -5.309149265289307, "global_step": 19930, "epoch": 474} {"train_loss": -5.273038387298584, "global_step": 19931, "epoch": 474} {"train_loss": -5.304522514343262, "global_step": 19932, "epoch": 474} {"train_loss": -5.253044128417969, "global_step": 19933, "epoch": 474} {"train_loss": -5.291200637817383, "global_step": 19934, "epoch": 474} {"train_loss": -5.286081314086914, "global_step": 19935, "epoch": 474} {"train_loss": -5.321166038513184, "global_step": 19936, "epoch": 474} {"train_loss": -5.327033996582031, "global_step": 19937, "epoch": 474} {"train_loss": -5.298200607299805, "global_step": 19938, "epoch": 474} {"train_loss": -5.376378059387207, "global_step": 19939, "epoch": 474} {"train_loss": -5.348857879638672, "global_step": 19940, "epoch": 474} {"train_loss": -5.3031110763549805, "global_step": 19941, "epoch": 474} {"train_loss": -5.140533447265625, "global_step": 19942, "epoch": 474} {"train_loss": -5.447079658508301, "global_step": 19943, "epoch": 474} {"train_loss": -5.327558517456055, "global_step": 19944, "epoch": 474} {"train_loss": -5.0620012283325195, "global_step": 19945, "epoch": 474} {"train_loss": -5.183276653289795, "global_step": 19946, "epoch": 474} {"train_loss": -5.191370010375977, "global_step": 19947, "epoch": 474} {"train_loss": -5.208148956298828, "global_step": 19948, "epoch": 474} {"train_loss": -5.275689227240426, "global_step": 19949, "epoch": 474, "val_loss": 77539.1015625} {"train_loss": -4.910179138183594, "global_step": 19950, "epoch": 475} {"train_loss": -5.239742279052734, "global_step": 19951, "epoch": 475} {"train_loss": -4.90002965927124, "global_step": 19952, "epoch": 475} {"train_loss": -5.147245407104492, "global_step": 19953, "epoch": 475} {"train_loss": -5.240435600280762, "global_step": 19954, "epoch": 475} {"train_loss": -5.08181095123291, "global_step": 19955, "epoch": 475} {"train_loss": -5.333315372467041, "global_step": 19956, "epoch": 475} {"train_loss": -4.982494831085205, "global_step": 19957, "epoch": 475} {"train_loss": -5.329583168029785, "global_step": 19958, "epoch": 475} {"train_loss": -4.989112854003906, "global_step": 19959, "epoch": 475} {"train_loss": -5.3174638748168945, "global_step": 19960, "epoch": 475} {"train_loss": -5.037482261657715, "global_step": 19961, "epoch": 475} {"train_loss": -5.148362159729004, "global_step": 19962, "epoch": 475} {"train_loss": -5.148348331451416, "global_step": 19963, "epoch": 475} {"train_loss": -5.304806709289551, "global_step": 19964, "epoch": 475} {"train_loss": -5.107827663421631, "global_step": 19965, "epoch": 475} {"train_loss": -5.237583160400391, "global_step": 19966, "epoch": 475} {"train_loss": -4.985219478607178, "global_step": 19967, "epoch": 475} {"train_loss": -5.238123893737793, "global_step": 19968, "epoch": 475} {"train_loss": -5.24105978012085, "global_step": 19969, "epoch": 475} {"train_loss": -5.359538555145264, "global_step": 19970, "epoch": 475} {"train_loss": -5.001337051391602, "global_step": 19971, "epoch": 475} {"train_loss": -5.357297897338867, "global_step": 19972, "epoch": 475} {"train_loss": -5.103585243225098, "global_step": 19973, "epoch": 475} {"train_loss": -5.151100158691406, "global_step": 19974, "epoch": 475} {"train_loss": -5.156149387359619, "global_step": 19975, "epoch": 475} {"train_loss": -5.285496711730957, "global_step": 19976, "epoch": 475} {"train_loss": -5.060460090637207, "global_step": 19977, "epoch": 475} {"train_loss": -5.252655029296875, "global_step": 19978, "epoch": 475} {"train_loss": -5.298360347747803, "global_step": 19979, "epoch": 475} {"train_loss": -5.372192859649658, "global_step": 19980, "epoch": 475} {"train_loss": -5.192165374755859, "global_step": 19981, "epoch": 475} {"train_loss": -5.2639970779418945, "global_step": 19982, "epoch": 475} {"train_loss": -5.2465362548828125, "global_step": 19983, "epoch": 475} {"train_loss": -5.327886581420898, "global_step": 19984, "epoch": 475} {"train_loss": -5.1548309326171875, "global_step": 19985, "epoch": 475} {"train_loss": -5.341028690338135, "global_step": 19986, "epoch": 475} {"train_loss": -5.347749710083008, "global_step": 19987, "epoch": 475} {"train_loss": -5.138267517089844, "global_step": 19988, "epoch": 475} {"train_loss": -5.2789082527160645, "global_step": 19989, "epoch": 475} {"train_loss": -5.0489501953125, "global_step": 19990, "epoch": 475} {"train_loss": -5.1844680195762995, "global_step": 19991, "epoch": 475, "val_loss": 77036.8203125} {"train_loss": -5.189953804016113, "global_step": 19992, "epoch": 476} {"train_loss": -5.215770721435547, "global_step": 19993, "epoch": 476} {"train_loss": -5.230762958526611, "global_step": 19994, "epoch": 476} {"train_loss": -5.189643859863281, "global_step": 19995, "epoch": 476} {"train_loss": -5.187350749969482, "global_step": 19996, "epoch": 476} {"train_loss": -5.268571853637695, "global_step": 19997, "epoch": 476} {"train_loss": -5.257325172424316, "global_step": 19998, "epoch": 476} {"train_loss": -5.154277801513672, "global_step": 19999, "epoch": 476} {"train_loss": -5.153243064880371, "global_step": 20000, "epoch": 476} {"train_loss": -5.3226470947265625, "global_step": 20001, "epoch": 476} {"train_loss": -5.3929243087768555, "global_step": 20002, "epoch": 476} {"train_loss": -5.207791805267334, "global_step": 20003, "epoch": 476} {"train_loss": -5.361401557922363, "global_step": 20004, "epoch": 476} {"train_loss": -5.188340663909912, "global_step": 20005, "epoch": 476} {"train_loss": -5.2466864585876465, "global_step": 20006, "epoch": 476} {"train_loss": -5.362770080566406, "global_step": 20007, "epoch": 476} {"train_loss": -5.246444225311279, "global_step": 20008, "epoch": 476} {"train_loss": -5.348233699798584, "global_step": 20009, "epoch": 476} {"train_loss": -5.414189338684082, "global_step": 20010, "epoch": 476} {"train_loss": -5.2790117263793945, "global_step": 20011, "epoch": 476} {"train_loss": -5.354252815246582, "global_step": 20012, "epoch": 476} {"train_loss": -5.357220649719238, "global_step": 20013, "epoch": 476} {"train_loss": -5.36026668548584, "global_step": 20014, "epoch": 476} {"train_loss": -5.271482467651367, "global_step": 20015, "epoch": 476} {"train_loss": -5.259940147399902, "global_step": 20016, "epoch": 476} {"train_loss": -5.242253303527832, "global_step": 20017, "epoch": 476} {"train_loss": -5.279323577880859, "global_step": 20018, "epoch": 476} {"train_loss": -5.2407073974609375, "global_step": 20019, "epoch": 476} {"train_loss": -5.28046178817749, "global_step": 20020, "epoch": 476} {"train_loss": -5.330740928649902, "global_step": 20021, "epoch": 476} {"train_loss": -5.2511701583862305, "global_step": 20022, "epoch": 476} {"train_loss": -5.437536239624023, "global_step": 20023, "epoch": 476} {"train_loss": -5.188796043395996, "global_step": 20024, "epoch": 476} {"train_loss": -5.395914554595947, "global_step": 20025, "epoch": 476} {"train_loss": -5.342860221862793, "global_step": 20026, "epoch": 476} {"train_loss": -5.262677192687988, "global_step": 20027, "epoch": 476} {"train_loss": -5.38173770904541, "global_step": 20028, "epoch": 476} {"train_loss": -5.234514236450195, "global_step": 20029, "epoch": 476} {"train_loss": -5.287485122680664, "global_step": 20030, "epoch": 476} {"train_loss": -5.243191242218018, "global_step": 20031, "epoch": 476} {"train_loss": -5.283859729766846, "global_step": 20032, "epoch": 476} {"train_loss": -5.2794369629451205, "global_step": 20033, "epoch": 476, "val_loss": 76049.875} {"train_loss": -5.337552547454834, "global_step": 20034, "epoch": 477} {"train_loss": -5.082716941833496, "global_step": 20035, "epoch": 477} {"train_loss": -5.3403167724609375, "global_step": 20036, "epoch": 477} {"train_loss": -5.252660751342773, "global_step": 20037, "epoch": 477} {"train_loss": -5.420557975769043, "global_step": 20038, "epoch": 477} {"train_loss": -5.2601213455200195, "global_step": 20039, "epoch": 477} {"train_loss": -5.261226654052734, "global_step": 20040, "epoch": 477} {"train_loss": -5.227316856384277, "global_step": 20041, "epoch": 477} {"train_loss": -5.275331497192383, "global_step": 20042, "epoch": 477} {"train_loss": -5.239887237548828, "global_step": 20043, "epoch": 477} {"train_loss": -5.292963027954102, "global_step": 20044, "epoch": 477} {"train_loss": -5.32778263092041, "global_step": 20045, "epoch": 477} {"train_loss": -5.391078472137451, "global_step": 20046, "epoch": 477} {"train_loss": -5.264941692352295, "global_step": 20047, "epoch": 477} {"train_loss": -5.308977127075195, "global_step": 20048, "epoch": 477} {"train_loss": -5.215113162994385, "global_step": 20049, "epoch": 477} {"train_loss": -5.360849857330322, "global_step": 20050, "epoch": 477} {"train_loss": -5.229917526245117, "global_step": 20051, "epoch": 477} {"train_loss": -5.2458086013793945, "global_step": 20052, "epoch": 477} {"train_loss": -5.2671918869018555, "global_step": 20053, "epoch": 477} {"train_loss": -5.458254814147949, "global_step": 20054, "epoch": 477} {"train_loss": -5.286720275878906, "global_step": 20055, "epoch": 477} {"train_loss": -5.342336654663086, "global_step": 20056, "epoch": 477} {"train_loss": -5.273322105407715, "global_step": 20057, "epoch": 477} {"train_loss": -5.290962219238281, "global_step": 20058, "epoch": 477} {"train_loss": -5.297223091125488, "global_step": 20059, "epoch": 477} {"train_loss": -5.241721153259277, "global_step": 20060, "epoch": 477} {"train_loss": -5.434996604919434, "global_step": 20061, "epoch": 477} {"train_loss": -5.279405117034912, "global_step": 20062, "epoch": 477} {"train_loss": -5.3227996826171875, "global_step": 20063, "epoch": 477} {"train_loss": -5.308237075805664, "global_step": 20064, "epoch": 477} {"train_loss": -5.1617512702941895, "global_step": 20065, "epoch": 477} {"train_loss": -5.287804126739502, "global_step": 20066, "epoch": 477} {"train_loss": -5.163420677185059, "global_step": 20067, "epoch": 477} {"train_loss": -5.334409713745117, "global_step": 20068, "epoch": 477} {"train_loss": -5.299670696258545, "global_step": 20069, "epoch": 477} {"train_loss": -5.241073131561279, "global_step": 20070, "epoch": 477} {"train_loss": -5.240576267242432, "global_step": 20071, "epoch": 477} {"train_loss": -5.168539047241211, "global_step": 20072, "epoch": 477} {"train_loss": -5.295994758605957, "global_step": 20073, "epoch": 477} {"train_loss": -5.316501617431641, "global_step": 20074, "epoch": 477} {"train_loss": -5.282805772054763, "global_step": 20075, "epoch": 477, "val_loss": 76822.875} {"train_loss": -5.256665229797363, "global_step": 20076, "epoch": 478} {"train_loss": -5.235837936401367, "global_step": 20077, "epoch": 478} {"train_loss": -5.452587604522705, "global_step": 20078, "epoch": 478} {"train_loss": -5.258162498474121, "global_step": 20079, "epoch": 478} {"train_loss": -5.247352600097656, "global_step": 20080, "epoch": 478} {"train_loss": -5.327306747436523, "global_step": 20081, "epoch": 478} {"train_loss": -5.225366592407227, "global_step": 20082, "epoch": 478} {"train_loss": -5.331242561340332, "global_step": 20083, "epoch": 478} {"train_loss": -5.312578201293945, "global_step": 20084, "epoch": 478} {"train_loss": -5.187068462371826, "global_step": 20085, "epoch": 478} {"train_loss": -5.3848724365234375, "global_step": 20086, "epoch": 478} {"train_loss": -5.259963035583496, "global_step": 20087, "epoch": 478} {"train_loss": -5.173064231872559, "global_step": 20088, "epoch": 478} {"train_loss": -5.262304306030273, "global_step": 20089, "epoch": 478} {"train_loss": -5.17012357711792, "global_step": 20090, "epoch": 478} {"train_loss": -5.311220169067383, "global_step": 20091, "epoch": 478} {"train_loss": -5.318271636962891, "global_step": 20092, "epoch": 478} {"train_loss": -5.211660385131836, "global_step": 20093, "epoch": 478} {"train_loss": -5.2687811851501465, "global_step": 20094, "epoch": 478} {"train_loss": -5.347962856292725, "global_step": 20095, "epoch": 478} {"train_loss": -5.067336082458496, "global_step": 20096, "epoch": 478} {"train_loss": -5.233447074890137, "global_step": 20097, "epoch": 478} {"train_loss": -5.28473424911499, "global_step": 20098, "epoch": 478} {"train_loss": -5.228734016418457, "global_step": 20099, "epoch": 478} {"train_loss": -5.3660173416137695, "global_step": 20100, "epoch": 478} {"train_loss": -5.198166370391846, "global_step": 20101, "epoch": 478} {"train_loss": -5.368404388427734, "global_step": 20102, "epoch": 478} {"train_loss": -5.311794281005859, "global_step": 20103, "epoch": 478} {"train_loss": -5.090185165405273, "global_step": 20104, "epoch": 478} {"train_loss": -5.2278852462768555, "global_step": 20105, "epoch": 478} {"train_loss": -5.065715789794922, "global_step": 20106, "epoch": 478} {"train_loss": -5.277070999145508, "global_step": 20107, "epoch": 478} {"train_loss": -5.257750988006592, "global_step": 20108, "epoch": 478} {"train_loss": -5.2906951904296875, "global_step": 20109, "epoch": 478} {"train_loss": -5.222733497619629, "global_step": 20110, "epoch": 478} {"train_loss": -5.272049427032471, "global_step": 20111, "epoch": 478} {"train_loss": -5.284163475036621, "global_step": 20112, "epoch": 478} {"train_loss": -5.329031944274902, "global_step": 20113, "epoch": 478} {"train_loss": -5.176817417144775, "global_step": 20114, "epoch": 478} {"train_loss": -5.352199554443359, "global_step": 20115, "epoch": 478} {"train_loss": -5.223186492919922, "global_step": 20116, "epoch": 478} {"train_loss": -5.262438206445603, "global_step": 20117, "epoch": 478, "val_loss": 76447.328125} {"train_loss": -5.346579074859619, "global_step": 20118, "epoch": 479} {"train_loss": -5.20471715927124, "global_step": 20119, "epoch": 479} {"train_loss": -5.286293029785156, "global_step": 20120, "epoch": 479} {"train_loss": -5.143257141113281, "global_step": 20121, "epoch": 479} {"train_loss": -5.256412029266357, "global_step": 20122, "epoch": 479} {"train_loss": -5.437935829162598, "global_step": 20123, "epoch": 479} {"train_loss": -5.274535655975342, "global_step": 20124, "epoch": 479} {"train_loss": -5.150677680969238, "global_step": 20125, "epoch": 479} {"train_loss": -5.243467807769775, "global_step": 20126, "epoch": 479} {"train_loss": -5.413125038146973, "global_step": 20127, "epoch": 479} {"train_loss": -5.244668483734131, "global_step": 20128, "epoch": 479} {"train_loss": -5.206210613250732, "global_step": 20129, "epoch": 479} {"train_loss": -5.3286452293396, "global_step": 20130, "epoch": 479} {"train_loss": -5.366870880126953, "global_step": 20131, "epoch": 479} {"train_loss": -5.309055805206299, "global_step": 20132, "epoch": 479} {"train_loss": -5.269936561584473, "global_step": 20133, "epoch": 479} {"train_loss": -5.236228942871094, "global_step": 20134, "epoch": 479} {"train_loss": -5.367355823516846, "global_step": 20135, "epoch": 479} {"train_loss": -5.423112869262695, "global_step": 20136, "epoch": 479} {"train_loss": -5.34221076965332, "global_step": 20137, "epoch": 479} {"train_loss": -5.29556131362915, "global_step": 20138, "epoch": 479} {"train_loss": -5.149640083312988, "global_step": 20139, "epoch": 479} {"train_loss": -5.234762191772461, "global_step": 20140, "epoch": 479} {"train_loss": -5.296806335449219, "global_step": 20141, "epoch": 479} {"train_loss": -5.194016456604004, "global_step": 20142, "epoch": 479} {"train_loss": -5.326709270477295, "global_step": 20143, "epoch": 479} {"train_loss": -5.337880611419678, "global_step": 20144, "epoch": 479} {"train_loss": -5.370393753051758, "global_step": 20145, "epoch": 479} {"train_loss": -5.163679599761963, "global_step": 20146, "epoch": 479} {"train_loss": -5.4282121658325195, "global_step": 20147, "epoch": 479} {"train_loss": -5.405246734619141, "global_step": 20148, "epoch": 479} {"train_loss": -5.384973526000977, "global_step": 20149, "epoch": 479} {"train_loss": -5.369512557983398, "global_step": 20150, "epoch": 479} {"train_loss": -5.320664405822754, "global_step": 20151, "epoch": 479} {"train_loss": -5.441284656524658, "global_step": 20152, "epoch": 479} {"train_loss": -5.288150787353516, "global_step": 20153, "epoch": 479} {"train_loss": -5.214993953704834, "global_step": 20154, "epoch": 479} {"train_loss": -5.381601333618164, "global_step": 20155, "epoch": 479} {"train_loss": -5.278363227844238, "global_step": 20156, "epoch": 479} {"train_loss": -5.201951026916504, "global_step": 20157, "epoch": 479} {"train_loss": -5.2734456062316895, "global_step": 20158, "epoch": 479} {"train_loss": -5.297737325940814, "global_step": 20159, "epoch": 479, "val_loss": 75980.3515625} {"train_loss": -5.3717570304870605, "global_step": 20160, "epoch": 480} {"train_loss": -5.290567398071289, "global_step": 20161, "epoch": 480} {"train_loss": -5.341012001037598, "global_step": 20162, "epoch": 480} {"train_loss": -5.348785400390625, "global_step": 20163, "epoch": 480} {"train_loss": -5.296201705932617, "global_step": 20164, "epoch": 480} {"train_loss": -5.24072790145874, "global_step": 20165, "epoch": 480} {"train_loss": -5.268730163574219, "global_step": 20166, "epoch": 480} {"train_loss": -5.50039005279541, "global_step": 20167, "epoch": 480} {"train_loss": -5.204397201538086, "global_step": 20168, "epoch": 480} {"train_loss": -5.3540544509887695, "global_step": 20169, "epoch": 480} {"train_loss": -5.172456741333008, "global_step": 20170, "epoch": 480} {"train_loss": -5.508689880371094, "global_step": 20171, "epoch": 480} {"train_loss": -5.243424415588379, "global_step": 20172, "epoch": 480} {"train_loss": -5.310382843017578, "global_step": 20173, "epoch": 480} {"train_loss": -5.329480171203613, "global_step": 20174, "epoch": 480} {"train_loss": -5.413752555847168, "global_step": 20175, "epoch": 480} {"train_loss": -5.274621963500977, "global_step": 20176, "epoch": 480} {"train_loss": -5.216952323913574, "global_step": 20177, "epoch": 480} {"train_loss": -5.269552230834961, "global_step": 20178, "epoch": 480} {"train_loss": -5.278641223907471, "global_step": 20179, "epoch": 480} {"train_loss": -5.016965866088867, "global_step": 20180, "epoch": 480} {"train_loss": -5.403901100158691, "global_step": 20181, "epoch": 480} {"train_loss": -5.015746116638184, "global_step": 20182, "epoch": 480} {"train_loss": -5.219255447387695, "global_step": 20183, "epoch": 480} {"train_loss": -5.344547271728516, "global_step": 20184, "epoch": 480} {"train_loss": -5.0659098625183105, "global_step": 20185, "epoch": 480} {"train_loss": -5.28689432144165, "global_step": 20186, "epoch": 480} {"train_loss": -5.128505706787109, "global_step": 20187, "epoch": 480} {"train_loss": -5.314206123352051, "global_step": 20188, "epoch": 480} {"train_loss": -5.172121047973633, "global_step": 20189, "epoch": 480} {"train_loss": -5.1663079261779785, "global_step": 20190, "epoch": 480} {"train_loss": -5.360986232757568, "global_step": 20191, "epoch": 480} {"train_loss": -5.200172424316406, "global_step": 20192, "epoch": 480} {"train_loss": -5.169905185699463, "global_step": 20193, "epoch": 480} {"train_loss": -5.307271957397461, "global_step": 20194, "epoch": 480} {"train_loss": -5.107212066650391, "global_step": 20195, "epoch": 480} {"train_loss": -5.23996639251709, "global_step": 20196, "epoch": 480} {"train_loss": -5.157853126525879, "global_step": 20197, "epoch": 480} {"train_loss": -5.269835948944092, "global_step": 20198, "epoch": 480} {"train_loss": -5.36811637878418, "global_step": 20199, "epoch": 480} {"train_loss": -5.312398910522461, "global_step": 20200, "epoch": 480} {"train_loss": -5.2654958338964555, "global_step": 20201, "epoch": 480, "val_loss": 75879.828125} {"train_loss": -5.253224849700928, "global_step": 20202, "epoch": 481} {"train_loss": -5.18501615524292, "global_step": 20203, "epoch": 481} {"train_loss": -5.406132698059082, "global_step": 20204, "epoch": 481} {"train_loss": -5.514177322387695, "global_step": 20205, "epoch": 481} {"train_loss": -5.183805465698242, "global_step": 20206, "epoch": 481} {"train_loss": -5.407848358154297, "global_step": 20207, "epoch": 481} {"train_loss": -5.38288688659668, "global_step": 20208, "epoch": 481} {"train_loss": -5.318173408508301, "global_step": 20209, "epoch": 481} {"train_loss": -5.284537315368652, "global_step": 20210, "epoch": 481} {"train_loss": -5.155178070068359, "global_step": 20211, "epoch": 481} {"train_loss": -5.300354957580566, "global_step": 20212, "epoch": 481} {"train_loss": -5.2467942237854, "global_step": 20213, "epoch": 481} {"train_loss": -5.046491622924805, "global_step": 20214, "epoch": 481} {"train_loss": -5.334230422973633, "global_step": 20215, "epoch": 481} {"train_loss": -5.245208263397217, "global_step": 20216, "epoch": 481} {"train_loss": -5.258967876434326, "global_step": 20217, "epoch": 481} {"train_loss": -5.337132453918457, "global_step": 20218, "epoch": 481} {"train_loss": -5.277070045471191, "global_step": 20219, "epoch": 481} {"train_loss": -5.203792572021484, "global_step": 20220, "epoch": 481} {"train_loss": -5.4707441329956055, "global_step": 20221, "epoch": 481} {"train_loss": -5.262420654296875, "global_step": 20222, "epoch": 481} {"train_loss": -5.366940975189209, "global_step": 20223, "epoch": 481} {"train_loss": -5.323177814483643, "global_step": 20224, "epoch": 481} {"train_loss": -5.299581527709961, "global_step": 20225, "epoch": 481} {"train_loss": -5.269423484802246, "global_step": 20226, "epoch": 481} {"train_loss": -5.3049774169921875, "global_step": 20227, "epoch": 481} {"train_loss": -5.210641860961914, "global_step": 20228, "epoch": 481} {"train_loss": -5.218964576721191, "global_step": 20229, "epoch": 481} {"train_loss": -5.363122463226318, "global_step": 20230, "epoch": 481} {"train_loss": -5.285703659057617, "global_step": 20231, "epoch": 481} {"train_loss": -5.2332868576049805, "global_step": 20232, "epoch": 481} {"train_loss": -5.302615165710449, "global_step": 20233, "epoch": 481} {"train_loss": -5.297406196594238, "global_step": 20234, "epoch": 481} {"train_loss": -5.249734878540039, "global_step": 20235, "epoch": 481} {"train_loss": -5.341796875, "global_step": 20236, "epoch": 481} {"train_loss": -5.301551818847656, "global_step": 20237, "epoch": 481} {"train_loss": -5.325953483581543, "global_step": 20238, "epoch": 481} {"train_loss": -5.463099479675293, "global_step": 20239, "epoch": 481} {"train_loss": -5.273682594299316, "global_step": 20240, "epoch": 481} {"train_loss": -5.244711399078369, "global_step": 20241, "epoch": 481} {"train_loss": -5.369710922241211, "global_step": 20242, "epoch": 481} {"train_loss": -5.2932527632940385, "global_step": 20243, "epoch": 481, "val_loss": 75741.203125} {"train_loss": -5.360858917236328, "global_step": 20244, "epoch": 482} {"train_loss": -5.313251495361328, "global_step": 20245, "epoch": 482} {"train_loss": -5.502192497253418, "global_step": 20246, "epoch": 482} {"train_loss": -5.246362686157227, "global_step": 20247, "epoch": 482} {"train_loss": -5.370246410369873, "global_step": 20248, "epoch": 482} {"train_loss": -5.483938217163086, "global_step": 20249, "epoch": 482} {"train_loss": -5.230312347412109, "global_step": 20250, "epoch": 482} {"train_loss": -5.2781267166137695, "global_step": 20251, "epoch": 482} {"train_loss": -5.327956199645996, "global_step": 20252, "epoch": 482} {"train_loss": -5.387317657470703, "global_step": 20253, "epoch": 482} {"train_loss": -5.346014022827148, "global_step": 20254, "epoch": 482} {"train_loss": -5.30875301361084, "global_step": 20255, "epoch": 482} {"train_loss": -5.286651611328125, "global_step": 20256, "epoch": 482} {"train_loss": -5.252196788787842, "global_step": 20257, "epoch": 482} {"train_loss": -5.348345756530762, "global_step": 20258, "epoch": 482} {"train_loss": -5.2209625244140625, "global_step": 20259, "epoch": 482} {"train_loss": -5.2657856941223145, "global_step": 20260, "epoch": 482} {"train_loss": -5.314334869384766, "global_step": 20261, "epoch": 482} {"train_loss": -5.2002949714660645, "global_step": 20262, "epoch": 482} {"train_loss": -5.333505630493164, "global_step": 20263, "epoch": 482} {"train_loss": -5.160945892333984, "global_step": 20264, "epoch": 482} {"train_loss": -5.233972549438477, "global_step": 20265, "epoch": 482} {"train_loss": -5.2491960525512695, "global_step": 20266, "epoch": 482} {"train_loss": -5.17683219909668, "global_step": 20267, "epoch": 482} {"train_loss": -5.199487686157227, "global_step": 20268, "epoch": 482} {"train_loss": -5.217897415161133, "global_step": 20269, "epoch": 482} {"train_loss": -5.360671043395996, "global_step": 20270, "epoch": 482} {"train_loss": -5.245266914367676, "global_step": 20271, "epoch": 482} {"train_loss": -5.200897216796875, "global_step": 20272, "epoch": 482} {"train_loss": -5.311007976531982, "global_step": 20273, "epoch": 482} {"train_loss": -5.2739949226379395, "global_step": 20274, "epoch": 482} {"train_loss": -5.234546661376953, "global_step": 20275, "epoch": 482} {"train_loss": -5.30085563659668, "global_step": 20276, "epoch": 482} {"train_loss": -5.226739883422852, "global_step": 20277, "epoch": 482} {"train_loss": -5.345107078552246, "global_step": 20278, "epoch": 482} {"train_loss": -5.229796409606934, "global_step": 20279, "epoch": 482} {"train_loss": -5.309372425079346, "global_step": 20280, "epoch": 482} {"train_loss": -5.346698760986328, "global_step": 20281, "epoch": 482} {"train_loss": -5.329715728759766, "global_step": 20282, "epoch": 482} {"train_loss": -5.313624382019043, "global_step": 20283, "epoch": 482} {"train_loss": -5.3502516746521, "global_step": 20284, "epoch": 482} {"train_loss": -5.293317953745524, "global_step": 20285, "epoch": 482, "val_loss": 76640.4921875} {"train_loss": -5.409481525421143, "global_step": 20286, "epoch": 483} {"train_loss": -5.233879089355469, "global_step": 20287, "epoch": 483} {"train_loss": -5.345637321472168, "global_step": 20288, "epoch": 483} {"train_loss": -5.498178482055664, "global_step": 20289, "epoch": 483} {"train_loss": -5.31706428527832, "global_step": 20290, "epoch": 483} {"train_loss": -5.255357265472412, "global_step": 20291, "epoch": 483} {"train_loss": -5.376267433166504, "global_step": 20292, "epoch": 483} {"train_loss": -5.372989177703857, "global_step": 20293, "epoch": 483} {"train_loss": -5.382992267608643, "global_step": 20294, "epoch": 483} {"train_loss": -5.37031364440918, "global_step": 20295, "epoch": 483} {"train_loss": -5.254302024841309, "global_step": 20296, "epoch": 483} {"train_loss": -5.3687896728515625, "global_step": 20297, "epoch": 483} {"train_loss": -5.420529365539551, "global_step": 20298, "epoch": 483} {"train_loss": -5.424879550933838, "global_step": 20299, "epoch": 483} {"train_loss": -5.377483367919922, "global_step": 20300, "epoch": 483} {"train_loss": -5.371086120605469, "global_step": 20301, "epoch": 483} {"train_loss": -5.397646903991699, "global_step": 20302, "epoch": 483} {"train_loss": -5.316288948059082, "global_step": 20303, "epoch": 483} {"train_loss": -5.209873676300049, "global_step": 20304, "epoch": 483} {"train_loss": -5.202718734741211, "global_step": 20305, "epoch": 483} {"train_loss": -5.31117057800293, "global_step": 20306, "epoch": 483} {"train_loss": -5.306880950927734, "global_step": 20307, "epoch": 483} {"train_loss": -5.197664737701416, "global_step": 20308, "epoch": 483} {"train_loss": -5.240497589111328, "global_step": 20309, "epoch": 483} {"train_loss": -5.220328330993652, "global_step": 20310, "epoch": 483} {"train_loss": -5.025961875915527, "global_step": 20311, "epoch": 483} {"train_loss": -5.243504524230957, "global_step": 20312, "epoch": 483} {"train_loss": -5.342239856719971, "global_step": 20313, "epoch": 483} {"train_loss": -5.358587741851807, "global_step": 20314, "epoch": 483} {"train_loss": -5.215285301208496, "global_step": 20315, "epoch": 483} {"train_loss": -5.328486919403076, "global_step": 20316, "epoch": 483} {"train_loss": -5.26973819732666, "global_step": 20317, "epoch": 483} {"train_loss": -5.29075813293457, "global_step": 20318, "epoch": 483} {"train_loss": -5.231316566467285, "global_step": 20319, "epoch": 483} {"train_loss": -5.243146896362305, "global_step": 20320, "epoch": 483} {"train_loss": -5.2796149253845215, "global_step": 20321, "epoch": 483} {"train_loss": -5.219369888305664, "global_step": 20322, "epoch": 483} {"train_loss": -5.3520660400390625, "global_step": 20323, "epoch": 483} {"train_loss": -5.4208879470825195, "global_step": 20324, "epoch": 483} {"train_loss": -5.353703498840332, "global_step": 20325, "epoch": 483} {"train_loss": -5.264223098754883, "global_step": 20326, "epoch": 483} {"train_loss": -5.3056877340589255, "global_step": 20327, "epoch": 483, "val_loss": 76851.71875} {"train_loss": -5.328834533691406, "global_step": 20328, "epoch": 484} {"train_loss": -5.187997817993164, "global_step": 20329, "epoch": 484} {"train_loss": -5.31581449508667, "global_step": 20330, "epoch": 484} {"train_loss": -5.405611038208008, "global_step": 20331, "epoch": 484} {"train_loss": -5.1908793449401855, "global_step": 20332, "epoch": 484} {"train_loss": -5.263437271118164, "global_step": 20333, "epoch": 484} {"train_loss": -5.390998840332031, "global_step": 20334, "epoch": 484} {"train_loss": -5.353590965270996, "global_step": 20335, "epoch": 484} {"train_loss": -5.303698539733887, "global_step": 20336, "epoch": 484} {"train_loss": -5.2731218338012695, "global_step": 20337, "epoch": 484} {"train_loss": -5.312067985534668, "global_step": 20338, "epoch": 484} {"train_loss": -5.315585136413574, "global_step": 20339, "epoch": 484} {"train_loss": -5.358192443847656, "global_step": 20340, "epoch": 484} {"train_loss": -5.356801509857178, "global_step": 20341, "epoch": 484} {"train_loss": -5.329476356506348, "global_step": 20342, "epoch": 484} {"train_loss": -5.3115105628967285, "global_step": 20343, "epoch": 484} {"train_loss": -5.099301338195801, "global_step": 20344, "epoch": 484} {"train_loss": -5.239199638366699, "global_step": 20345, "epoch": 484} {"train_loss": -5.3094072341918945, "global_step": 20346, "epoch": 484} {"train_loss": -5.171920299530029, "global_step": 20347, "epoch": 484} {"train_loss": -5.275609016418457, "global_step": 20348, "epoch": 484} {"train_loss": -5.281150817871094, "global_step": 20349, "epoch": 484} {"train_loss": -5.193766117095947, "global_step": 20350, "epoch": 484} {"train_loss": -5.329268455505371, "global_step": 20351, "epoch": 484} {"train_loss": -5.342809677124023, "global_step": 20352, "epoch": 484} {"train_loss": -5.267174243927002, "global_step": 20353, "epoch": 484} {"train_loss": -5.164066791534424, "global_step": 20354, "epoch": 484} {"train_loss": -5.339139938354492, "global_step": 20355, "epoch": 484} {"train_loss": -5.265158653259277, "global_step": 20356, "epoch": 484} {"train_loss": -5.2023115158081055, "global_step": 20357, "epoch": 484} {"train_loss": -5.410094261169434, "global_step": 20358, "epoch": 484} {"train_loss": -5.225379943847656, "global_step": 20359, "epoch": 484} {"train_loss": -5.239592552185059, "global_step": 20360, "epoch": 484} {"train_loss": -5.339195251464844, "global_step": 20361, "epoch": 484} {"train_loss": -5.13211727142334, "global_step": 20362, "epoch": 484} {"train_loss": -5.236015319824219, "global_step": 20363, "epoch": 484} {"train_loss": -5.112035751342773, "global_step": 20364, "epoch": 484} {"train_loss": -5.297059059143066, "global_step": 20365, "epoch": 484} {"train_loss": -5.209951877593994, "global_step": 20366, "epoch": 484} {"train_loss": -5.199204921722412, "global_step": 20367, "epoch": 484} {"train_loss": -5.303450584411621, "global_step": 20368, "epoch": 484} {"train_loss": -5.275174867539179, "global_step": 20369, "epoch": 484, "val_loss": 76510.6640625} {"train_loss": -5.289445877075195, "global_step": 20370, "epoch": 485} {"train_loss": -5.3359222412109375, "global_step": 20371, "epoch": 485} {"train_loss": -5.161049842834473, "global_step": 20372, "epoch": 485} {"train_loss": -5.158799648284912, "global_step": 20373, "epoch": 485} {"train_loss": -5.119016170501709, "global_step": 20374, "epoch": 485} {"train_loss": -5.32833194732666, "global_step": 20375, "epoch": 485} {"train_loss": -5.072683334350586, "global_step": 20376, "epoch": 485} {"train_loss": -5.315679550170898, "global_step": 20377, "epoch": 485} {"train_loss": -5.179211616516113, "global_step": 20378, "epoch": 485} {"train_loss": -5.27811861038208, "global_step": 20379, "epoch": 485} {"train_loss": -5.276154518127441, "global_step": 20380, "epoch": 485} {"train_loss": -5.3830461502075195, "global_step": 20381, "epoch": 485} {"train_loss": -5.300352573394775, "global_step": 20382, "epoch": 485} {"train_loss": -5.198606014251709, "global_step": 20383, "epoch": 485} {"train_loss": -5.32907247543335, "global_step": 20384, "epoch": 485} {"train_loss": -5.308238506317139, "global_step": 20385, "epoch": 485} {"train_loss": -5.125523567199707, "global_step": 20386, "epoch": 485} {"train_loss": -5.264188766479492, "global_step": 20387, "epoch": 485} {"train_loss": -5.3917670249938965, "global_step": 20388, "epoch": 485} {"train_loss": -5.37490177154541, "global_step": 20389, "epoch": 485} {"train_loss": -5.27252197265625, "global_step": 20390, "epoch": 485} {"train_loss": -5.211627960205078, "global_step": 20391, "epoch": 485} {"train_loss": -5.387709140777588, "global_step": 20392, "epoch": 485} {"train_loss": -5.320021629333496, "global_step": 20393, "epoch": 485} {"train_loss": -5.283369541168213, "global_step": 20394, "epoch": 485} {"train_loss": -5.254184246063232, "global_step": 20395, "epoch": 485} {"train_loss": -5.16089391708374, "global_step": 20396, "epoch": 485} {"train_loss": -5.172121524810791, "global_step": 20397, "epoch": 485} {"train_loss": -5.369180679321289, "global_step": 20398, "epoch": 485} {"train_loss": -5.326182842254639, "global_step": 20399, "epoch": 485} {"train_loss": -5.290822505950928, "global_step": 20400, "epoch": 485} {"train_loss": -5.400605201721191, "global_step": 20401, "epoch": 485} {"train_loss": -5.288949966430664, "global_step": 20402, "epoch": 485} {"train_loss": -5.1481451988220215, "global_step": 20403, "epoch": 485} {"train_loss": -5.283210277557373, "global_step": 20404, "epoch": 485} {"train_loss": -5.291642189025879, "global_step": 20405, "epoch": 485} {"train_loss": -5.248657703399658, "global_step": 20406, "epoch": 485} {"train_loss": -5.399754524230957, "global_step": 20407, "epoch": 485} {"train_loss": -5.157428741455078, "global_step": 20408, "epoch": 485} {"train_loss": -5.278210163116455, "global_step": 20409, "epoch": 485} {"train_loss": -5.497597694396973, "global_step": 20410, "epoch": 485} {"train_loss": -5.273986941292172, "global_step": 20411, "epoch": 485, "val_loss": 75981.359375} {"train_loss": -5.401298522949219, "global_step": 20412, "epoch": 486} {"train_loss": -5.36213493347168, "global_step": 20413, "epoch": 486} {"train_loss": -5.332119941711426, "global_step": 20414, "epoch": 486} {"train_loss": -5.256505966186523, "global_step": 20415, "epoch": 486} {"train_loss": -5.35562801361084, "global_step": 20416, "epoch": 486} {"train_loss": -5.315960884094238, "global_step": 20417, "epoch": 486} {"train_loss": -5.436507225036621, "global_step": 20418, "epoch": 486} {"train_loss": -5.357813835144043, "global_step": 20419, "epoch": 486} {"train_loss": -5.382510185241699, "global_step": 20420, "epoch": 486} {"train_loss": -5.303373336791992, "global_step": 20421, "epoch": 486} {"train_loss": -5.470808982849121, "global_step": 20422, "epoch": 486} {"train_loss": -5.262014865875244, "global_step": 20423, "epoch": 486} {"train_loss": -5.352616310119629, "global_step": 20424, "epoch": 486} {"train_loss": -5.293741226196289, "global_step": 20425, "epoch": 486} {"train_loss": -5.409847259521484, "global_step": 20426, "epoch": 486} {"train_loss": -5.154413223266602, "global_step": 20427, "epoch": 486} {"train_loss": -5.26662540435791, "global_step": 20428, "epoch": 486} {"train_loss": -5.335052490234375, "global_step": 20429, "epoch": 486} {"train_loss": -5.295989990234375, "global_step": 20430, "epoch": 486} {"train_loss": -5.301864147186279, "global_step": 20431, "epoch": 486} {"train_loss": -5.313612937927246, "global_step": 20432, "epoch": 486} {"train_loss": -5.3488969802856445, "global_step": 20433, "epoch": 486} {"train_loss": -5.266445159912109, "global_step": 20434, "epoch": 486} {"train_loss": -5.319364547729492, "global_step": 20435, "epoch": 486} {"train_loss": -5.366730213165283, "global_step": 20436, "epoch": 486} {"train_loss": -5.2383270263671875, "global_step": 20437, "epoch": 486} {"train_loss": -5.1720380783081055, "global_step": 20438, "epoch": 486} {"train_loss": -5.313672065734863, "global_step": 20439, "epoch": 486} {"train_loss": -5.267129421234131, "global_step": 20440, "epoch": 486} {"train_loss": -5.2905659675598145, "global_step": 20441, "epoch": 486} {"train_loss": -5.33888053894043, "global_step": 20442, "epoch": 486} {"train_loss": -5.257820129394531, "global_step": 20443, "epoch": 486} {"train_loss": -5.195074558258057, "global_step": 20444, "epoch": 486} {"train_loss": -5.181666374206543, "global_step": 20445, "epoch": 486} {"train_loss": -5.302631855010986, "global_step": 20446, "epoch": 486} {"train_loss": -5.256119728088379, "global_step": 20447, "epoch": 486} {"train_loss": -5.270505905151367, "global_step": 20448, "epoch": 486} {"train_loss": -5.435263156890869, "global_step": 20449, "epoch": 486} {"train_loss": -5.335321426391602, "global_step": 20450, "epoch": 486} {"train_loss": -5.325037956237793, "global_step": 20451, "epoch": 486} {"train_loss": -5.337279319763184, "global_step": 20452, "epoch": 486} {"train_loss": -5.313974539438884, "global_step": 20453, "epoch": 486, "val_loss": 76282.1328125} {"train_loss": -5.302071571350098, "global_step": 20454, "epoch": 487} {"train_loss": -5.283018112182617, "global_step": 20455, "epoch": 487} {"train_loss": -5.216960906982422, "global_step": 20456, "epoch": 487} {"train_loss": -5.413980484008789, "global_step": 20457, "epoch": 487} {"train_loss": -5.244378089904785, "global_step": 20458, "epoch": 487} {"train_loss": -5.2438764572143555, "global_step": 20459, "epoch": 487} {"train_loss": -5.396664619445801, "global_step": 20460, "epoch": 487} {"train_loss": -5.278796195983887, "global_step": 20461, "epoch": 487} {"train_loss": -5.08351993560791, "global_step": 20462, "epoch": 487} {"train_loss": -5.413259506225586, "global_step": 20463, "epoch": 487} {"train_loss": -5.266536712646484, "global_step": 20464, "epoch": 487} {"train_loss": -5.350860595703125, "global_step": 20465, "epoch": 487} {"train_loss": -5.255987167358398, "global_step": 20466, "epoch": 487} {"train_loss": -5.293397426605225, "global_step": 20467, "epoch": 487} {"train_loss": -5.37537145614624, "global_step": 20468, "epoch": 487} {"train_loss": -5.331489086151123, "global_step": 20469, "epoch": 487} {"train_loss": -5.321747779846191, "global_step": 20470, "epoch": 487} {"train_loss": -5.2108564376831055, "global_step": 20471, "epoch": 487} {"train_loss": -5.258160591125488, "global_step": 20472, "epoch": 487} {"train_loss": -5.2432074546813965, "global_step": 20473, "epoch": 487} {"train_loss": -5.331827163696289, "global_step": 20474, "epoch": 487} {"train_loss": -5.239524841308594, "global_step": 20475, "epoch": 487} {"train_loss": -5.134377479553223, "global_step": 20476, "epoch": 487} {"train_loss": -5.35270881652832, "global_step": 20477, "epoch": 487} {"train_loss": -5.183018684387207, "global_step": 20478, "epoch": 487} {"train_loss": -5.367377281188965, "global_step": 20479, "epoch": 487} {"train_loss": -5.18736457824707, "global_step": 20480, "epoch": 487} {"train_loss": -5.304026126861572, "global_step": 20481, "epoch": 487} {"train_loss": -5.371058464050293, "global_step": 20482, "epoch": 487} {"train_loss": -5.289106845855713, "global_step": 20483, "epoch": 487} {"train_loss": -5.192008972167969, "global_step": 20484, "epoch": 487} {"train_loss": -5.399582862854004, "global_step": 20485, "epoch": 487} {"train_loss": -5.23624324798584, "global_step": 20486, "epoch": 487} {"train_loss": -5.2495927810668945, "global_step": 20487, "epoch": 487} {"train_loss": -5.3596062660217285, "global_step": 20488, "epoch": 487} {"train_loss": -5.238192558288574, "global_step": 20489, "epoch": 487} {"train_loss": -5.2361016273498535, "global_step": 20490, "epoch": 487} {"train_loss": -5.260376930236816, "global_step": 20491, "epoch": 487} {"train_loss": -5.270557403564453, "global_step": 20492, "epoch": 487} {"train_loss": -5.226541042327881, "global_step": 20493, "epoch": 487} {"train_loss": -5.224964141845703, "global_step": 20494, "epoch": 487} {"train_loss": -5.273459457215809, "global_step": 20495, "epoch": 487, "val_loss": 77646.625} {"train_loss": -5.155324935913086, "global_step": 20496, "epoch": 488} {"train_loss": -5.338892459869385, "global_step": 20497, "epoch": 488} {"train_loss": -5.186002731323242, "global_step": 20498, "epoch": 488} {"train_loss": -5.218487739562988, "global_step": 20499, "epoch": 488} {"train_loss": -5.3815131187438965, "global_step": 20500, "epoch": 488} {"train_loss": -5.2289628982543945, "global_step": 20501, "epoch": 488} {"train_loss": -5.164053916931152, "global_step": 20502, "epoch": 488} {"train_loss": -5.33286190032959, "global_step": 20503, "epoch": 488} {"train_loss": -5.457676887512207, "global_step": 20504, "epoch": 488} {"train_loss": -5.300394058227539, "global_step": 20505, "epoch": 488} {"train_loss": -5.388266563415527, "global_step": 20506, "epoch": 488} {"train_loss": -5.1652374267578125, "global_step": 20507, "epoch": 488} {"train_loss": -5.361001968383789, "global_step": 20508, "epoch": 488} {"train_loss": -5.26088285446167, "global_step": 20509, "epoch": 488} {"train_loss": -5.279475212097168, "global_step": 20510, "epoch": 488} {"train_loss": -5.251944541931152, "global_step": 20511, "epoch": 488} {"train_loss": -5.3965864181518555, "global_step": 20512, "epoch": 488} {"train_loss": -5.329535484313965, "global_step": 20513, "epoch": 488} {"train_loss": -5.375336170196533, "global_step": 20514, "epoch": 488} {"train_loss": -5.354964256286621, "global_step": 20515, "epoch": 488} {"train_loss": -5.189982891082764, "global_step": 20516, "epoch": 488} {"train_loss": -5.247642517089844, "global_step": 20517, "epoch": 488} {"train_loss": -5.413573265075684, "global_step": 20518, "epoch": 488} {"train_loss": -5.219374656677246, "global_step": 20519, "epoch": 488} {"train_loss": -5.383752346038818, "global_step": 20520, "epoch": 488} {"train_loss": -5.170332431793213, "global_step": 20521, "epoch": 488} {"train_loss": -5.291009902954102, "global_step": 20522, "epoch": 488} {"train_loss": -5.3262104988098145, "global_step": 20523, "epoch": 488} {"train_loss": -5.277256965637207, "global_step": 20524, "epoch": 488} {"train_loss": -5.304088592529297, "global_step": 20525, "epoch": 488} {"train_loss": -5.2299699783325195, "global_step": 20526, "epoch": 488} {"train_loss": -5.312692642211914, "global_step": 20527, "epoch": 488} {"train_loss": -5.270773887634277, "global_step": 20528, "epoch": 488} {"train_loss": -5.344300270080566, "global_step": 20529, "epoch": 488} {"train_loss": -5.291534423828125, "global_step": 20530, "epoch": 488} {"train_loss": -5.2621846199035645, "global_step": 20531, "epoch": 488} {"train_loss": -5.350094795227051, "global_step": 20532, "epoch": 488} {"train_loss": -5.286599159240723, "global_step": 20533, "epoch": 488} {"train_loss": -5.182072639465332, "global_step": 20534, "epoch": 488} {"train_loss": -5.350623607635498, "global_step": 20535, "epoch": 488} {"train_loss": -5.423366069793701, "global_step": 20536, "epoch": 488} {"train_loss": -5.294340281259446, "global_step": 20537, "epoch": 488, "val_loss": 75996.34375} {"train_loss": -5.3163628578186035, "global_step": 20538, "epoch": 489} {"train_loss": -5.2285871505737305, "global_step": 20539, "epoch": 489} {"train_loss": -5.148229598999023, "global_step": 20540, "epoch": 489} {"train_loss": -5.393045425415039, "global_step": 20541, "epoch": 489} {"train_loss": -5.278379440307617, "global_step": 20542, "epoch": 489} {"train_loss": -5.371039390563965, "global_step": 20543, "epoch": 489} {"train_loss": -5.2789306640625, "global_step": 20544, "epoch": 489} {"train_loss": -5.36148738861084, "global_step": 20545, "epoch": 489} {"train_loss": -5.365598678588867, "global_step": 20546, "epoch": 489} {"train_loss": -5.321850776672363, "global_step": 20547, "epoch": 489} {"train_loss": -5.2798871994018555, "global_step": 20548, "epoch": 489} {"train_loss": -5.226572036743164, "global_step": 20549, "epoch": 489} {"train_loss": -5.318042278289795, "global_step": 20550, "epoch": 489} {"train_loss": -5.29550313949585, "global_step": 20551, "epoch": 489} {"train_loss": -5.235708713531494, "global_step": 20552, "epoch": 489} {"train_loss": -5.457039833068848, "global_step": 20553, "epoch": 489} {"train_loss": -5.276081085205078, "global_step": 20554, "epoch": 489} {"train_loss": -5.299511909484863, "global_step": 20555, "epoch": 489} {"train_loss": -5.423912048339844, "global_step": 20556, "epoch": 489} {"train_loss": -5.2854413986206055, "global_step": 20557, "epoch": 489} {"train_loss": -5.344404220581055, "global_step": 20558, "epoch": 489} {"train_loss": -5.378966331481934, "global_step": 20559, "epoch": 489} {"train_loss": -5.323687553405762, "global_step": 20560, "epoch": 489} {"train_loss": -5.269279479980469, "global_step": 20561, "epoch": 489} {"train_loss": -5.2960710525512695, "global_step": 20562, "epoch": 489} {"train_loss": -5.382545471191406, "global_step": 20563, "epoch": 489} {"train_loss": -5.298285484313965, "global_step": 20564, "epoch": 489} {"train_loss": -5.251743316650391, "global_step": 20565, "epoch": 489} {"train_loss": -5.278994560241699, "global_step": 20566, "epoch": 489} {"train_loss": -5.323367595672607, "global_step": 20567, "epoch": 489} {"train_loss": -5.338387489318848, "global_step": 20568, "epoch": 489} {"train_loss": -5.2118401527404785, "global_step": 20569, "epoch": 489} {"train_loss": -5.3324174880981445, "global_step": 20570, "epoch": 489} {"train_loss": -5.2497711181640625, "global_step": 20571, "epoch": 489} {"train_loss": -5.27161979675293, "global_step": 20572, "epoch": 489} {"train_loss": -5.3222336769104, "global_step": 20573, "epoch": 489} {"train_loss": -5.371916770935059, "global_step": 20574, "epoch": 489} {"train_loss": -5.215909957885742, "global_step": 20575, "epoch": 489} {"train_loss": -5.354576110839844, "global_step": 20576, "epoch": 489} {"train_loss": -5.258185863494873, "global_step": 20577, "epoch": 489} {"train_loss": -5.405548572540283, "global_step": 20578, "epoch": 489} {"train_loss": -5.306591181528001, "global_step": 20579, "epoch": 489, "val_loss": 76284.015625} {"train_loss": -5.2632551193237305, "global_step": 20580, "epoch": 490} {"train_loss": -5.275731086730957, "global_step": 20581, "epoch": 490} {"train_loss": -5.267807960510254, "global_step": 20582, "epoch": 490} {"train_loss": -5.257604598999023, "global_step": 20583, "epoch": 490} {"train_loss": -5.31304931640625, "global_step": 20584, "epoch": 490} {"train_loss": -5.328402042388916, "global_step": 20585, "epoch": 490} {"train_loss": -5.282773971557617, "global_step": 20586, "epoch": 490} {"train_loss": -5.421754360198975, "global_step": 20587, "epoch": 490} {"train_loss": -5.313198089599609, "global_step": 20588, "epoch": 490} {"train_loss": -5.20440673828125, "global_step": 20589, "epoch": 490} {"train_loss": -5.316286087036133, "global_step": 20590, "epoch": 490} {"train_loss": -5.294398307800293, "global_step": 20591, "epoch": 490} {"train_loss": -5.346699237823486, "global_step": 20592, "epoch": 490} {"train_loss": -5.096147537231445, "global_step": 20593, "epoch": 490} {"train_loss": -5.285823345184326, "global_step": 20594, "epoch": 490} {"train_loss": -5.3707990646362305, "global_step": 20595, "epoch": 490} {"train_loss": -5.285158157348633, "global_step": 20596, "epoch": 490} {"train_loss": -5.242511749267578, "global_step": 20597, "epoch": 490} {"train_loss": -5.419639587402344, "global_step": 20598, "epoch": 490} {"train_loss": -5.2085747718811035, "global_step": 20599, "epoch": 490} {"train_loss": -5.2085065841674805, "global_step": 20600, "epoch": 490} {"train_loss": -5.253267288208008, "global_step": 20601, "epoch": 490} {"train_loss": -5.388570785522461, "global_step": 20602, "epoch": 490} {"train_loss": -5.404905319213867, "global_step": 20603, "epoch": 490} {"train_loss": -5.376976490020752, "global_step": 20604, "epoch": 490} {"train_loss": -5.387694835662842, "global_step": 20605, "epoch": 490} {"train_loss": -5.259461879730225, "global_step": 20606, "epoch": 490} {"train_loss": -5.3774919509887695, "global_step": 20607, "epoch": 490} {"train_loss": -5.195484161376953, "global_step": 20608, "epoch": 490} {"train_loss": -5.295703411102295, "global_step": 20609, "epoch": 490} {"train_loss": -5.254211902618408, "global_step": 20610, "epoch": 490} {"train_loss": -5.327417373657227, "global_step": 20611, "epoch": 490} {"train_loss": -5.346278667449951, "global_step": 20612, "epoch": 490} {"train_loss": -5.283865928649902, "global_step": 20613, "epoch": 490} {"train_loss": -5.337047100067139, "global_step": 20614, "epoch": 490} {"train_loss": -5.203303813934326, "global_step": 20615, "epoch": 490} {"train_loss": -5.26944637298584, "global_step": 20616, "epoch": 490} {"train_loss": -5.488473892211914, "global_step": 20617, "epoch": 490} {"train_loss": -5.406785011291504, "global_step": 20618, "epoch": 490} {"train_loss": -5.3331298828125, "global_step": 20619, "epoch": 490} {"train_loss": -5.277889251708984, "global_step": 20620, "epoch": 490} {"train_loss": -5.307730720156715, "global_step": 20621, "epoch": 490, "val_loss": 76188.6171875} {"train_loss": -5.33662223815918, "global_step": 20622, "epoch": 491} {"train_loss": -5.291681289672852, "global_step": 20623, "epoch": 491} {"train_loss": -5.41181755065918, "global_step": 20624, "epoch": 491} {"train_loss": -5.3457183837890625, "global_step": 20625, "epoch": 491} {"train_loss": -5.311860084533691, "global_step": 20626, "epoch": 491} {"train_loss": -5.373355388641357, "global_step": 20627, "epoch": 491} {"train_loss": -5.3599629402160645, "global_step": 20628, "epoch": 491} {"train_loss": -5.326850891113281, "global_step": 20629, "epoch": 491} {"train_loss": -5.280154228210449, "global_step": 20630, "epoch": 491} {"train_loss": -5.319787979125977, "global_step": 20631, "epoch": 491} {"train_loss": -5.340482234954834, "global_step": 20632, "epoch": 491} {"train_loss": -5.257436752319336, "global_step": 20633, "epoch": 491} {"train_loss": -5.238794803619385, "global_step": 20634, "epoch": 491} {"train_loss": -5.379424095153809, "global_step": 20635, "epoch": 491} {"train_loss": -5.424154758453369, "global_step": 20636, "epoch": 491} {"train_loss": -5.2634172439575195, "global_step": 20637, "epoch": 491} {"train_loss": -5.281702041625977, "global_step": 20638, "epoch": 491} {"train_loss": -5.2798662185668945, "global_step": 20639, "epoch": 491} {"train_loss": -5.333869934082031, "global_step": 20640, "epoch": 491} {"train_loss": -5.381304740905762, "global_step": 20641, "epoch": 491} {"train_loss": -5.308492183685303, "global_step": 20642, "epoch": 491} {"train_loss": -5.336998462677002, "global_step": 20643, "epoch": 491} {"train_loss": -5.358570098876953, "global_step": 20644, "epoch": 491} {"train_loss": -5.351092338562012, "global_step": 20645, "epoch": 491} {"train_loss": -5.280603885650635, "global_step": 20646, "epoch": 491} {"train_loss": -5.315791606903076, "global_step": 20647, "epoch": 491} {"train_loss": -5.277466773986816, "global_step": 20648, "epoch": 491} {"train_loss": -5.398947238922119, "global_step": 20649, "epoch": 491} {"train_loss": -5.272322177886963, "global_step": 20650, "epoch": 491} {"train_loss": -5.35103702545166, "global_step": 20651, "epoch": 491} {"train_loss": -5.265347480773926, "global_step": 20652, "epoch": 491} {"train_loss": -5.384411811828613, "global_step": 20653, "epoch": 491} {"train_loss": -5.113832950592041, "global_step": 20654, "epoch": 491} {"train_loss": -5.336029052734375, "global_step": 20655, "epoch": 491} {"train_loss": -5.286960601806641, "global_step": 20656, "epoch": 491} {"train_loss": -5.129393577575684, "global_step": 20657, "epoch": 491} {"train_loss": -5.228158950805664, "global_step": 20658, "epoch": 491} {"train_loss": -5.22260856628418, "global_step": 20659, "epoch": 491} {"train_loss": -5.205560684204102, "global_step": 20660, "epoch": 491} {"train_loss": -5.3940534591674805, "global_step": 20661, "epoch": 491} {"train_loss": -5.280148983001709, "global_step": 20662, "epoch": 491} {"train_loss": -5.303672904060001, "global_step": 20663, "epoch": 491, "val_loss": 76758.234375} {"train_loss": -5.234830856323242, "global_step": 20664, "epoch": 492} {"train_loss": -5.242303848266602, "global_step": 20665, "epoch": 492} {"train_loss": -5.06394100189209, "global_step": 20666, "epoch": 492} {"train_loss": -5.238037109375, "global_step": 20667, "epoch": 492} {"train_loss": -5.226665496826172, "global_step": 20668, "epoch": 492} {"train_loss": -5.037026882171631, "global_step": 20669, "epoch": 492} {"train_loss": -5.392003059387207, "global_step": 20670, "epoch": 492} {"train_loss": -5.302595138549805, "global_step": 20671, "epoch": 492} {"train_loss": -5.1209821701049805, "global_step": 20672, "epoch": 492} {"train_loss": -5.321414470672607, "global_step": 20673, "epoch": 492} {"train_loss": -5.212717056274414, "global_step": 20674, "epoch": 492} {"train_loss": -5.3044610023498535, "global_step": 20675, "epoch": 492} {"train_loss": -5.254465103149414, "global_step": 20676, "epoch": 492} {"train_loss": -5.2571635246276855, "global_step": 20677, "epoch": 492} {"train_loss": -5.2718892097473145, "global_step": 20678, "epoch": 492} {"train_loss": -5.332649230957031, "global_step": 20679, "epoch": 492} {"train_loss": -5.169600486755371, "global_step": 20680, "epoch": 492} {"train_loss": -5.257527828216553, "global_step": 20681, "epoch": 492} {"train_loss": -5.258115768432617, "global_step": 20682, "epoch": 492} {"train_loss": -5.267603397369385, "global_step": 20683, "epoch": 492} {"train_loss": -5.354135036468506, "global_step": 20684, "epoch": 492} {"train_loss": -5.091188907623291, "global_step": 20685, "epoch": 492} {"train_loss": -5.270042419433594, "global_step": 20686, "epoch": 492} {"train_loss": -5.219050407409668, "global_step": 20687, "epoch": 492} {"train_loss": -5.084427833557129, "global_step": 20688, "epoch": 492} {"train_loss": -5.189413547515869, "global_step": 20689, "epoch": 492} {"train_loss": -5.247717380523682, "global_step": 20690, "epoch": 492} {"train_loss": -5.159661293029785, "global_step": 20691, "epoch": 492} {"train_loss": -5.219974040985107, "global_step": 20692, "epoch": 492} {"train_loss": -5.333247184753418, "global_step": 20693, "epoch": 492} {"train_loss": -5.182300567626953, "global_step": 20694, "epoch": 492} {"train_loss": -5.235044479370117, "global_step": 20695, "epoch": 492} {"train_loss": -5.165504455566406, "global_step": 20696, "epoch": 492} {"train_loss": -5.362056732177734, "global_step": 20697, "epoch": 492} {"train_loss": -5.239831924438477, "global_step": 20698, "epoch": 492} {"train_loss": -5.258069038391113, "global_step": 20699, "epoch": 492} {"train_loss": -5.319046974182129, "global_step": 20700, "epoch": 492} {"train_loss": -5.253692626953125, "global_step": 20701, "epoch": 492} {"train_loss": -5.334359169006348, "global_step": 20702, "epoch": 492} {"train_loss": -5.163080215454102, "global_step": 20703, "epoch": 492} {"train_loss": -5.3431396484375, "global_step": 20704, "epoch": 492} {"train_loss": -5.239921762829735, "global_step": 20705, "epoch": 492, "val_loss": 76206.3671875} {"train_loss": -5.358348846435547, "global_step": 20706, "epoch": 493} {"train_loss": -5.15269660949707, "global_step": 20707, "epoch": 493} {"train_loss": -5.311653137207031, "global_step": 20708, "epoch": 493} {"train_loss": -5.302611827850342, "global_step": 20709, "epoch": 493} {"train_loss": -5.339293956756592, "global_step": 20710, "epoch": 493} {"train_loss": -5.162920951843262, "global_step": 20711, "epoch": 493} {"train_loss": -5.166652679443359, "global_step": 20712, "epoch": 493} {"train_loss": -5.282528877258301, "global_step": 20713, "epoch": 493} {"train_loss": -5.431615829467773, "global_step": 20714, "epoch": 493} {"train_loss": -5.276205539703369, "global_step": 20715, "epoch": 493} {"train_loss": -5.156883716583252, "global_step": 20716, "epoch": 493} {"train_loss": -5.363082408905029, "global_step": 20717, "epoch": 493} {"train_loss": -5.415816307067871, "global_step": 20718, "epoch": 493} {"train_loss": -5.322053909301758, "global_step": 20719, "epoch": 493} {"train_loss": -5.305088996887207, "global_step": 20720, "epoch": 493} {"train_loss": -5.250450134277344, "global_step": 20721, "epoch": 493} {"train_loss": -5.174031734466553, "global_step": 20722, "epoch": 493} {"train_loss": -5.317462921142578, "global_step": 20723, "epoch": 493} {"train_loss": -5.303012847900391, "global_step": 20724, "epoch": 493} {"train_loss": -5.101812839508057, "global_step": 20725, "epoch": 493} {"train_loss": -5.324040412902832, "global_step": 20726, "epoch": 493} {"train_loss": -5.333700180053711, "global_step": 20727, "epoch": 493} {"train_loss": -5.24751091003418, "global_step": 20728, "epoch": 493} {"train_loss": -5.257268905639648, "global_step": 20729, "epoch": 493} {"train_loss": -5.3643035888671875, "global_step": 20730, "epoch": 493} {"train_loss": -5.15341329574585, "global_step": 20731, "epoch": 493} {"train_loss": -5.366171360015869, "global_step": 20732, "epoch": 493} {"train_loss": -5.2891459465026855, "global_step": 20733, "epoch": 493} {"train_loss": -5.126232624053955, "global_step": 20734, "epoch": 493} {"train_loss": -5.32840633392334, "global_step": 20735, "epoch": 493} {"train_loss": -5.262267112731934, "global_step": 20736, "epoch": 493} {"train_loss": -5.271528244018555, "global_step": 20737, "epoch": 493} {"train_loss": -5.416988372802734, "global_step": 20738, "epoch": 493} {"train_loss": -5.275474548339844, "global_step": 20739, "epoch": 493} {"train_loss": -5.301142692565918, "global_step": 20740, "epoch": 493} {"train_loss": -5.30098295211792, "global_step": 20741, "epoch": 493} {"train_loss": -5.3444623947143555, "global_step": 20742, "epoch": 493} {"train_loss": -5.376605033874512, "global_step": 20743, "epoch": 493} {"train_loss": -5.425816535949707, "global_step": 20744, "epoch": 493} {"train_loss": -5.211441993713379, "global_step": 20745, "epoch": 493} {"train_loss": -5.376450061798096, "global_step": 20746, "epoch": 493} {"train_loss": -5.282063438778832, "global_step": 20747, "epoch": 493, "val_loss": 76115.234375} {"train_loss": -5.313546180725098, "global_step": 20748, "epoch": 494} {"train_loss": -5.1778717041015625, "global_step": 20749, "epoch": 494} {"train_loss": -5.345501899719238, "global_step": 20750, "epoch": 494} {"train_loss": -5.2867536544799805, "global_step": 20751, "epoch": 494} {"train_loss": -5.219675064086914, "global_step": 20752, "epoch": 494} {"train_loss": -5.147812843322754, "global_step": 20753, "epoch": 494} {"train_loss": -5.302528381347656, "global_step": 20754, "epoch": 494} {"train_loss": -5.365058898925781, "global_step": 20755, "epoch": 494} {"train_loss": -5.264865875244141, "global_step": 20756, "epoch": 494} {"train_loss": -5.188321113586426, "global_step": 20757, "epoch": 494} {"train_loss": -5.3328537940979, "global_step": 20758, "epoch": 494} {"train_loss": -5.183337688446045, "global_step": 20759, "epoch": 494} {"train_loss": -5.151371955871582, "global_step": 20760, "epoch": 494} {"train_loss": -5.1537766456604, "global_step": 20761, "epoch": 494} {"train_loss": -5.503727912902832, "global_step": 20762, "epoch": 494} {"train_loss": -5.122483253479004, "global_step": 20763, "epoch": 494} {"train_loss": -5.205890655517578, "global_step": 20764, "epoch": 494} {"train_loss": -5.2076826095581055, "global_step": 20765, "epoch": 494} {"train_loss": -5.210423946380615, "global_step": 20766, "epoch": 494} {"train_loss": -5.326455593109131, "global_step": 20767, "epoch": 494} {"train_loss": -5.208817005157471, "global_step": 20768, "epoch": 494} {"train_loss": -5.119571208953857, "global_step": 20769, "epoch": 494} {"train_loss": -5.07793664932251, "global_step": 20770, "epoch": 494} {"train_loss": -5.350914478302002, "global_step": 20771, "epoch": 494} {"train_loss": -5.158627510070801, "global_step": 20772, "epoch": 494} {"train_loss": -5.277504920959473, "global_step": 20773, "epoch": 494} {"train_loss": -5.219410419464111, "global_step": 20774, "epoch": 494} {"train_loss": -5.170331954956055, "global_step": 20775, "epoch": 494} {"train_loss": -5.358782768249512, "global_step": 20776, "epoch": 494} {"train_loss": -5.158782958984375, "global_step": 20777, "epoch": 494} {"train_loss": -5.335244178771973, "global_step": 20778, "epoch": 494} {"train_loss": -5.1524505615234375, "global_step": 20779, "epoch": 494} {"train_loss": -5.26567268371582, "global_step": 20780, "epoch": 494} {"train_loss": -5.20130729675293, "global_step": 20781, "epoch": 494} {"train_loss": -5.298130512237549, "global_step": 20782, "epoch": 494} {"train_loss": -5.245882034301758, "global_step": 20783, "epoch": 494} {"train_loss": -5.256527423858643, "global_step": 20784, "epoch": 494} {"train_loss": -5.3504133224487305, "global_step": 20785, "epoch": 494} {"train_loss": -5.241739273071289, "global_step": 20786, "epoch": 494} {"train_loss": -5.3279523849487305, "global_step": 20787, "epoch": 494} {"train_loss": -5.2332658767700195, "global_step": 20788, "epoch": 494} {"train_loss": -5.246929679598127, "global_step": 20789, "epoch": 494, "val_loss": 76366.4921875} {"train_loss": -5.25299072265625, "global_step": 20790, "epoch": 495} {"train_loss": -5.257215976715088, "global_step": 20791, "epoch": 495} {"train_loss": -5.432445526123047, "global_step": 20792, "epoch": 495} {"train_loss": -5.111747741699219, "global_step": 20793, "epoch": 495} {"train_loss": -5.253321647644043, "global_step": 20794, "epoch": 495} {"train_loss": -5.255614280700684, "global_step": 20795, "epoch": 495} {"train_loss": -5.065313339233398, "global_step": 20796, "epoch": 495} {"train_loss": -5.269235610961914, "global_step": 20797, "epoch": 495} {"train_loss": -5.096228122711182, "global_step": 20798, "epoch": 495} {"train_loss": -5.297451972961426, "global_step": 20799, "epoch": 495} {"train_loss": -5.257816314697266, "global_step": 20800, "epoch": 495} {"train_loss": -5.147132873535156, "global_step": 20801, "epoch": 495} {"train_loss": -5.366570949554443, "global_step": 20802, "epoch": 495} {"train_loss": -5.237398624420166, "global_step": 20803, "epoch": 495} {"train_loss": -5.248780250549316, "global_step": 20804, "epoch": 495} {"train_loss": -5.369128704071045, "global_step": 20805, "epoch": 495} {"train_loss": -5.239731311798096, "global_step": 20806, "epoch": 495} {"train_loss": -5.27593994140625, "global_step": 20807, "epoch": 495} {"train_loss": -5.219453811645508, "global_step": 20808, "epoch": 495} {"train_loss": -5.33413028717041, "global_step": 20809, "epoch": 495} {"train_loss": -5.27971887588501, "global_step": 20810, "epoch": 495} {"train_loss": -5.226872444152832, "global_step": 20811, "epoch": 495} {"train_loss": -5.212935447692871, "global_step": 20812, "epoch": 495} {"train_loss": -5.34687614440918, "global_step": 20813, "epoch": 495} {"train_loss": -5.123824596405029, "global_step": 20814, "epoch": 495} {"train_loss": -5.179220199584961, "global_step": 20815, "epoch": 495} {"train_loss": -5.318015098571777, "global_step": 20816, "epoch": 495} {"train_loss": -5.306760787963867, "global_step": 20817, "epoch": 495} {"train_loss": -5.393583297729492, "global_step": 20818, "epoch": 495} {"train_loss": -5.3036370277404785, "global_step": 20819, "epoch": 495} {"train_loss": -5.318008899688721, "global_step": 20820, "epoch": 495} {"train_loss": -5.4503254890441895, "global_step": 20821, "epoch": 495} {"train_loss": -5.411602973937988, "global_step": 20822, "epoch": 495} {"train_loss": -5.24951696395874, "global_step": 20823, "epoch": 495} {"train_loss": -5.478342056274414, "global_step": 20824, "epoch": 495} {"train_loss": -5.310262203216553, "global_step": 20825, "epoch": 495} {"train_loss": -5.308483600616455, "global_step": 20826, "epoch": 495} {"train_loss": -5.315735816955566, "global_step": 20827, "epoch": 495} {"train_loss": -5.232314109802246, "global_step": 20828, "epoch": 495} {"train_loss": -5.3196587562561035, "global_step": 20829, "epoch": 495} {"train_loss": -5.403013229370117, "global_step": 20830, "epoch": 495} {"train_loss": -5.2788419382912775, "global_step": 20831, "epoch": 495, "val_loss": 76046.1875} {"train_loss": -5.294534683227539, "global_step": 20832, "epoch": 496} {"train_loss": -5.336119174957275, "global_step": 20833, "epoch": 496} {"train_loss": -5.2480926513671875, "global_step": 20834, "epoch": 496} {"train_loss": -5.417786598205566, "global_step": 20835, "epoch": 496} {"train_loss": -5.232359886169434, "global_step": 20836, "epoch": 496} {"train_loss": -5.269369125366211, "global_step": 20837, "epoch": 496} {"train_loss": -5.212168216705322, "global_step": 20838, "epoch": 496} {"train_loss": -5.301820278167725, "global_step": 20839, "epoch": 496} {"train_loss": -5.052030563354492, "global_step": 20840, "epoch": 496} {"train_loss": -5.4327592849731445, "global_step": 20841, "epoch": 496} {"train_loss": -5.144865989685059, "global_step": 20842, "epoch": 496} {"train_loss": -5.205575942993164, "global_step": 20843, "epoch": 496} {"train_loss": -5.180093288421631, "global_step": 20844, "epoch": 496} {"train_loss": -5.127379894256592, "global_step": 20845, "epoch": 496} {"train_loss": -5.27194356918335, "global_step": 20846, "epoch": 496} {"train_loss": -5.230824947357178, "global_step": 20847, "epoch": 496} {"train_loss": -5.201236248016357, "global_step": 20848, "epoch": 496} {"train_loss": -5.409757137298584, "global_step": 20849, "epoch": 496} {"train_loss": -5.396097183227539, "global_step": 20850, "epoch": 496} {"train_loss": -5.289247989654541, "global_step": 20851, "epoch": 496} {"train_loss": -5.268003463745117, "global_step": 20852, "epoch": 496} {"train_loss": -5.235058307647705, "global_step": 20853, "epoch": 496} {"train_loss": -5.387031555175781, "global_step": 20854, "epoch": 496} {"train_loss": -5.232447624206543, "global_step": 20855, "epoch": 496} {"train_loss": -5.258447647094727, "global_step": 20856, "epoch": 496} {"train_loss": -5.245442867279053, "global_step": 20857, "epoch": 496} {"train_loss": -5.211292266845703, "global_step": 20858, "epoch": 496} {"train_loss": -5.345654487609863, "global_step": 20859, "epoch": 496} {"train_loss": -5.202069282531738, "global_step": 20860, "epoch": 496} {"train_loss": -5.313291072845459, "global_step": 20861, "epoch": 496} {"train_loss": -5.291006088256836, "global_step": 20862, "epoch": 496} {"train_loss": -5.2222747802734375, "global_step": 20863, "epoch": 496} {"train_loss": -5.300559997558594, "global_step": 20864, "epoch": 496} {"train_loss": -5.314192295074463, "global_step": 20865, "epoch": 496} {"train_loss": -5.346614837646484, "global_step": 20866, "epoch": 496} {"train_loss": -5.346221923828125, "global_step": 20867, "epoch": 496} {"train_loss": -5.330589294433594, "global_step": 20868, "epoch": 496} {"train_loss": -5.394651412963867, "global_step": 20869, "epoch": 496} {"train_loss": -5.233695030212402, "global_step": 20870, "epoch": 496} {"train_loss": -5.251987934112549, "global_step": 20871, "epoch": 496} {"train_loss": -5.338323593139648, "global_step": 20872, "epoch": 496} {"train_loss": -5.276739029657273, "global_step": 20873, "epoch": 496, "val_loss": 76255.4453125} {"train_loss": -5.234733581542969, "global_step": 20874, "epoch": 497} {"train_loss": -5.40177059173584, "global_step": 20875, "epoch": 497} {"train_loss": -5.315201282501221, "global_step": 20876, "epoch": 497} {"train_loss": -5.316507339477539, "global_step": 20877, "epoch": 497} {"train_loss": -5.329688549041748, "global_step": 20878, "epoch": 497} {"train_loss": -5.376163005828857, "global_step": 20879, "epoch": 497} {"train_loss": -5.336228370666504, "global_step": 20880, "epoch": 497} {"train_loss": -5.28703498840332, "global_step": 20881, "epoch": 497} {"train_loss": -5.33642578125, "global_step": 20882, "epoch": 497} {"train_loss": -5.226109504699707, "global_step": 20883, "epoch": 497} {"train_loss": -5.3382248878479, "global_step": 20884, "epoch": 497} {"train_loss": -5.351631164550781, "global_step": 20885, "epoch": 497} {"train_loss": -5.360776901245117, "global_step": 20886, "epoch": 497} {"train_loss": -5.285615921020508, "global_step": 20887, "epoch": 497} {"train_loss": -5.382626533508301, "global_step": 20888, "epoch": 497} {"train_loss": -5.323073863983154, "global_step": 20889, "epoch": 497} {"train_loss": -5.348275184631348, "global_step": 20890, "epoch": 497} {"train_loss": -5.495932102203369, "global_step": 20891, "epoch": 497} {"train_loss": -5.259904384613037, "global_step": 20892, "epoch": 497} {"train_loss": -5.292716026306152, "global_step": 20893, "epoch": 497} {"train_loss": -5.329675674438477, "global_step": 20894, "epoch": 497} {"train_loss": -5.161820411682129, "global_step": 20895, "epoch": 497} {"train_loss": -5.4739484786987305, "global_step": 20896, "epoch": 497} {"train_loss": -5.450707912445068, "global_step": 20897, "epoch": 497} {"train_loss": -5.355147361755371, "global_step": 20898, "epoch": 497} {"train_loss": -5.446709632873535, "global_step": 20899, "epoch": 497} {"train_loss": -5.264441967010498, "global_step": 20900, "epoch": 497} {"train_loss": -5.301118850708008, "global_step": 20901, "epoch": 497} {"train_loss": -5.302872657775879, "global_step": 20902, "epoch": 497} {"train_loss": -5.2316741943359375, "global_step": 20903, "epoch": 497} {"train_loss": -5.122715473175049, "global_step": 20904, "epoch": 497} {"train_loss": -5.173125267028809, "global_step": 20905, "epoch": 497} {"train_loss": -5.367830276489258, "global_step": 20906, "epoch": 497} {"train_loss": -5.213745594024658, "global_step": 20907, "epoch": 497} {"train_loss": -5.269192695617676, "global_step": 20908, "epoch": 497} {"train_loss": -5.3821024894714355, "global_step": 20909, "epoch": 497} {"train_loss": -5.1639909744262695, "global_step": 20910, "epoch": 497} {"train_loss": -5.292376518249512, "global_step": 20911, "epoch": 497} {"train_loss": -5.119346618652344, "global_step": 20912, "epoch": 497} {"train_loss": -5.213042736053467, "global_step": 20913, "epoch": 497} {"train_loss": -5.255066394805908, "global_step": 20914, "epoch": 497} {"train_loss": -5.303583077022007, "global_step": 20915, "epoch": 497, "val_loss": 76255.8203125} {"train_loss": -5.16272497177124, "global_step": 20916, "epoch": 498} {"train_loss": -5.227837562561035, "global_step": 20917, "epoch": 498} {"train_loss": -5.222747802734375, "global_step": 20918, "epoch": 498} {"train_loss": -5.247089862823486, "global_step": 20919, "epoch": 498} {"train_loss": -5.375175476074219, "global_step": 20920, "epoch": 498} {"train_loss": -5.187339782714844, "global_step": 20921, "epoch": 498} {"train_loss": -5.349358558654785, "global_step": 20922, "epoch": 498} {"train_loss": -5.21729040145874, "global_step": 20923, "epoch": 498} {"train_loss": -5.291782379150391, "global_step": 20924, "epoch": 498} {"train_loss": -5.3880133628845215, "global_step": 20925, "epoch": 498} {"train_loss": -5.31147575378418, "global_step": 20926, "epoch": 498} {"train_loss": -5.2086381912231445, "global_step": 20927, "epoch": 498} {"train_loss": -5.336337089538574, "global_step": 20928, "epoch": 498} {"train_loss": -5.352631092071533, "global_step": 20929, "epoch": 498} {"train_loss": -5.322132110595703, "global_step": 20930, "epoch": 498} {"train_loss": -5.316651344299316, "global_step": 20931, "epoch": 498} {"train_loss": -5.282109260559082, "global_step": 20932, "epoch": 498} {"train_loss": -5.325234413146973, "global_step": 20933, "epoch": 498} {"train_loss": -5.251249313354492, "global_step": 20934, "epoch": 498} {"train_loss": -5.340605735778809, "global_step": 20935, "epoch": 498} {"train_loss": -5.471938610076904, "global_step": 20936, "epoch": 498} {"train_loss": -5.334314346313477, "global_step": 20937, "epoch": 498} {"train_loss": -5.258021354675293, "global_step": 20938, "epoch": 498} {"train_loss": -5.132433891296387, "global_step": 20939, "epoch": 498} {"train_loss": -5.243027210235596, "global_step": 20940, "epoch": 498} {"train_loss": -5.3725385665893555, "global_step": 20941, "epoch": 498} {"train_loss": -5.211682319641113, "global_step": 20942, "epoch": 498} {"train_loss": -5.3199052810668945, "global_step": 20943, "epoch": 498} {"train_loss": -5.376380920410156, "global_step": 20944, "epoch": 498} {"train_loss": -5.186172008514404, "global_step": 20945, "epoch": 498} {"train_loss": -5.134792327880859, "global_step": 20946, "epoch": 498} {"train_loss": -5.276921272277832, "global_step": 20947, "epoch": 498} {"train_loss": -5.247618675231934, "global_step": 20948, "epoch": 498} {"train_loss": -5.170063018798828, "global_step": 20949, "epoch": 498} {"train_loss": -5.21864128112793, "global_step": 20950, "epoch": 498} {"train_loss": -5.255489826202393, "global_step": 20951, "epoch": 498} {"train_loss": -5.214188575744629, "global_step": 20952, "epoch": 498} {"train_loss": -5.21920108795166, "global_step": 20953, "epoch": 498} {"train_loss": -5.241972923278809, "global_step": 20954, "epoch": 498} {"train_loss": -5.280420780181885, "global_step": 20955, "epoch": 498} {"train_loss": -5.4140777587890625, "global_step": 20956, "epoch": 498} {"train_loss": -5.275300196238926, "global_step": 20957, "epoch": 498, "val_loss": 76271.8984375} {"train_loss": -5.202740669250488, "global_step": 20958, "epoch": 499} {"train_loss": -5.394832611083984, "global_step": 20959, "epoch": 499} {"train_loss": -5.35496711730957, "global_step": 20960, "epoch": 499} {"train_loss": -5.235663414001465, "global_step": 20961, "epoch": 499} {"train_loss": -5.194101810455322, "global_step": 20962, "epoch": 499} {"train_loss": -5.382075309753418, "global_step": 20963, "epoch": 499} {"train_loss": -5.158936023712158, "global_step": 20964, "epoch": 499} {"train_loss": -5.307325839996338, "global_step": 20965, "epoch": 499} {"train_loss": -5.222620010375977, "global_step": 20966, "epoch": 499} {"train_loss": -5.346223831176758, "global_step": 20967, "epoch": 499} {"train_loss": -5.388182640075684, "global_step": 20968, "epoch": 499} {"train_loss": -5.435657024383545, "global_step": 20969, "epoch": 499} {"train_loss": -5.375368118286133, "global_step": 20970, "epoch": 499} {"train_loss": -5.287808895111084, "global_step": 20971, "epoch": 499} {"train_loss": -5.37056827545166, "global_step": 20972, "epoch": 499} {"train_loss": -5.3584418296813965, "global_step": 20973, "epoch": 499} {"train_loss": -5.304832458496094, "global_step": 20974, "epoch": 499} {"train_loss": -5.444512367248535, "global_step": 20975, "epoch": 499} {"train_loss": -5.1988420486450195, "global_step": 20976, "epoch": 499} {"train_loss": -5.2141947746276855, "global_step": 20977, "epoch": 499} {"train_loss": -5.4207000732421875, "global_step": 20978, "epoch": 499} {"train_loss": -5.089552402496338, "global_step": 20979, "epoch": 499} {"train_loss": -5.342108726501465, "global_step": 20980, "epoch": 499} {"train_loss": -5.23909330368042, "global_step": 20981, "epoch": 499} {"train_loss": -5.1565961837768555, "global_step": 20982, "epoch": 499} {"train_loss": -5.260610580444336, "global_step": 20983, "epoch": 499} {"train_loss": -5.147861480712891, "global_step": 20984, "epoch": 499} {"train_loss": -5.394967079162598, "global_step": 20985, "epoch": 499} {"train_loss": -5.279430389404297, "global_step": 20986, "epoch": 499} {"train_loss": -5.124829292297363, "global_step": 20987, "epoch": 499} {"train_loss": -5.296322345733643, "global_step": 20988, "epoch": 499} {"train_loss": -5.162741184234619, "global_step": 20989, "epoch": 499} {"train_loss": -5.272245407104492, "global_step": 20990, "epoch": 499} {"train_loss": -5.2614240646362305, "global_step": 20991, "epoch": 499} {"train_loss": -5.271615982055664, "global_step": 20992, "epoch": 499} {"train_loss": -5.3742218017578125, "global_step": 20993, "epoch": 499} {"train_loss": -5.245199680328369, "global_step": 20994, "epoch": 499} {"train_loss": -5.318417549133301, "global_step": 20995, "epoch": 499} {"train_loss": -5.149784088134766, "global_step": 20996, "epoch": 499} {"train_loss": -5.335437774658203, "global_step": 20997, "epoch": 499} {"train_loss": -5.330253601074219, "global_step": 20998, "epoch": 499} {"train_loss": -5.284243901570638, "global_step": 20999, "epoch": 499, "val_loss": 76284.328125} {"train_loss": -5.4168853759765625, "global_step": 21000, "epoch": 500} {"train_loss": -5.219520568847656, "global_step": 21001, "epoch": 500} {"train_loss": -5.424531936645508, "global_step": 21002, "epoch": 500} {"train_loss": -5.256014823913574, "global_step": 21003, "epoch": 500} {"train_loss": -5.256608963012695, "global_step": 21004, "epoch": 500} {"train_loss": -5.4884443283081055, "global_step": 21005, "epoch": 500} {"train_loss": -5.132321357727051, "global_step": 21006, "epoch": 500} {"train_loss": -5.30872106552124, "global_step": 21007, "epoch": 500} {"train_loss": -5.222753524780273, "global_step": 21008, "epoch": 500} {"train_loss": -5.185450077056885, "global_step": 21009, "epoch": 500} {"train_loss": -5.4002604484558105, "global_step": 21010, "epoch": 500} {"train_loss": -5.231026649475098, "global_step": 21011, "epoch": 500} {"train_loss": -5.268362998962402, "global_step": 21012, "epoch": 500} {"train_loss": -5.256181716918945, "global_step": 21013, "epoch": 500} {"train_loss": -5.226022720336914, "global_step": 21014, "epoch": 500} {"train_loss": -5.306642055511475, "global_step": 21015, "epoch": 500} {"train_loss": -5.383430480957031, "global_step": 21016, "epoch": 500} {"train_loss": -5.403251647949219, "global_step": 21017, "epoch": 500} {"train_loss": -5.36898136138916, "global_step": 21018, "epoch": 500} {"train_loss": -5.321846008300781, "global_step": 21019, "epoch": 500} {"train_loss": -5.306933879852295, "global_step": 21020, "epoch": 500} {"train_loss": -5.230618476867676, "global_step": 21021, "epoch": 500} {"train_loss": -5.414752006530762, "global_step": 21022, "epoch": 500} {"train_loss": -5.2003350257873535, "global_step": 21023, "epoch": 500} {"train_loss": -5.234053611755371, "global_step": 21024, "epoch": 500} {"train_loss": -5.432003974914551, "global_step": 21025, "epoch": 500} {"train_loss": -5.343087196350098, "global_step": 21026, "epoch": 500} {"train_loss": -5.342536449432373, "global_step": 21027, "epoch": 500} {"train_loss": -5.388489723205566, "global_step": 21028, "epoch": 500} {"train_loss": -5.350872993469238, "global_step": 21029, "epoch": 500} {"train_loss": -5.332837104797363, "global_step": 21030, "epoch": 500} {"train_loss": -5.268986225128174, "global_step": 21031, "epoch": 500} {"train_loss": -5.305885314941406, "global_step": 21032, "epoch": 500} {"train_loss": -5.435655117034912, "global_step": 21033, "epoch": 500} {"train_loss": -5.247149467468262, "global_step": 21034, "epoch": 500} {"train_loss": -5.163297176361084, "global_step": 21035, "epoch": 500} {"train_loss": -5.279024124145508, "global_step": 21036, "epoch": 500} {"train_loss": -5.223772048950195, "global_step": 21037, "epoch": 500} {"train_loss": -5.185424327850342, "global_step": 21038, "epoch": 500} {"train_loss": -5.159355163574219, "global_step": 21039, "epoch": 500} {"train_loss": -5.369687557220459, "global_step": 21040, "epoch": 500} {"train_loss": -5.29766381354559, "global_step": 21041, "epoch": 500, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.11161541156468374, "train/sim_max_reward_2": 0.5107324024090713, "train/sim_max_reward_3": 0.16674368581109497, "train/sim_max_reward_4": 0.23378310025045063, "train/sim_max_reward_5": 0.5749085565393526, "test/sim_max_reward_4500000": 0.6741749356289136, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.2678034316810548, "test/sim_max_reward_4500004": 0.28175255924103276, "test/sim_max_reward_4500005": 0.12523014390384815, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.10406547324556019, "test/sim_max_reward_4500008": 0.0006214592050730729, "test/sim_max_reward_4500009": 0.3929454773335836, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.46763316849082004, "test/sim_max_reward_4500012": 0.22287304945200512, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.3822221066381891, "test/sim_max_reward_4500015": 0.16513252774339582, "test/sim_max_reward_4500016": 0.015903838936164746, "test/sim_max_reward_4500017": 0.9622816039143177, "test/sim_max_reward_4500018": 0.4002690482748458, "test/sim_max_reward_4500019": 0.4092574940640847, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.7730472968422837, "test/sim_max_reward_4500022": 0.35109235329280714, "test/sim_max_reward_4500023": 0.5486642938483842, "test/sim_max_reward_4500024": 0.15861069484018064, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.19663472341366076, "test/sim_max_reward_4500027": 0.5340166802360001, "test/sim_max_reward_4500028": 0.4501770298965101, "test/sim_max_reward_4500029": 0.29431158295495125, "test/sim_max_reward_4500030": 0.8311156054085647, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.25629078650726517, "test/sim_max_reward_4500033": 0.22713223985040326, "test/sim_max_reward_4500034": 0.45619282583266507, "test/sim_max_reward_4500035": 0.7632735096515716, "test/sim_max_reward_4500036": 0.43194425232100486, "test/sim_max_reward_4500037": 0.017920209501255124, "test/sim_max_reward_4500038": 0.29979795221384453, "test/sim_max_reward_4500039": 0.9250258363890949, "test/sim_max_reward_4500040": 0.22193413361553924, "test/sim_max_reward_4500041": 0.263596366571529, "test/sim_max_reward_4500042": 0.4113253693718551, "test/sim_max_reward_4500043": 0.2460247568854454, "test/sim_max_reward_4500044": 0.06224366451113711, "test/sim_max_reward_4500045": 0.11948153547807783, "test/sim_max_reward_4500046": 0.5520916043024868, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.6150824242773542, "test/sim_max_reward_4500049": 0.5804547794489241, "train/mean_score": 0.2980134421967842, "test/mean_score": 0.30919297650431365, "val_loss": 76373.8359375} {"train_loss": -5.277238845825195, "global_step": 21042, "epoch": 501} {"train_loss": -5.393247604370117, "global_step": 21043, "epoch": 501} {"train_loss": -5.254339218139648, "global_step": 21044, "epoch": 501} {"train_loss": -5.3245954513549805, "global_step": 21045, "epoch": 501} {"train_loss": -5.187352180480957, "global_step": 21046, "epoch": 501} {"train_loss": -5.2264909744262695, "global_step": 21047, "epoch": 501} {"train_loss": -5.343924522399902, "global_step": 21048, "epoch": 501} {"train_loss": -5.2235307693481445, "global_step": 21049, "epoch": 501} {"train_loss": -5.30190896987915, "global_step": 21050, "epoch": 501} {"train_loss": -5.119770050048828, "global_step": 21051, "epoch": 501} {"train_loss": -5.249585151672363, "global_step": 21052, "epoch": 501} {"train_loss": -5.363840579986572, "global_step": 21053, "epoch": 501} {"train_loss": -5.206455230712891, "global_step": 21054, "epoch": 501} {"train_loss": -5.3707780838012695, "global_step": 21055, "epoch": 501} {"train_loss": -5.135991096496582, "global_step": 21056, "epoch": 501} {"train_loss": -5.232693195343018, "global_step": 21057, "epoch": 501} {"train_loss": -5.317624092102051, "global_step": 21058, "epoch": 501} {"train_loss": -5.1845245361328125, "global_step": 21059, "epoch": 501} {"train_loss": -5.388620853424072, "global_step": 21060, "epoch": 501} {"train_loss": -5.223445892333984, "global_step": 21061, "epoch": 501} {"train_loss": -5.131932258605957, "global_step": 21062, "epoch": 501} {"train_loss": -5.24392557144165, "global_step": 21063, "epoch": 501} {"train_loss": -5.23568868637085, "global_step": 21064, "epoch": 501} {"train_loss": -5.334712028503418, "global_step": 21065, "epoch": 501} {"train_loss": -5.272465705871582, "global_step": 21066, "epoch": 501} {"train_loss": -5.333377361297607, "global_step": 21067, "epoch": 501} {"train_loss": -5.375523567199707, "global_step": 21068, "epoch": 501} {"train_loss": -5.236564636230469, "global_step": 21069, "epoch": 501} {"train_loss": -5.215968132019043, "global_step": 21070, "epoch": 501} {"train_loss": -5.316420555114746, "global_step": 21071, "epoch": 501} {"train_loss": -5.319202423095703, "global_step": 21072, "epoch": 501} {"train_loss": -5.412778854370117, "global_step": 21073, "epoch": 501} {"train_loss": -5.320311069488525, "global_step": 21074, "epoch": 501} {"train_loss": -5.462291240692139, "global_step": 21075, "epoch": 501} {"train_loss": -5.3693413734436035, "global_step": 21076, "epoch": 501} {"train_loss": -5.287042617797852, "global_step": 21077, "epoch": 501} {"train_loss": -5.304381847381592, "global_step": 21078, "epoch": 501} {"train_loss": -5.388777256011963, "global_step": 21079, "epoch": 501} {"train_loss": -5.285849571228027, "global_step": 21080, "epoch": 501} {"train_loss": -5.2397685050964355, "global_step": 21081, "epoch": 501} {"train_loss": -5.379739284515381, "global_step": 21082, "epoch": 501} {"train_loss": -5.288492441177368, "global_step": 21083, "epoch": 501, "val_loss": 76320.4921875} {"train_loss": -5.372753143310547, "global_step": 21084, "epoch": 502} {"train_loss": -5.2489519119262695, "global_step": 21085, "epoch": 502} {"train_loss": -5.3040266036987305, "global_step": 21086, "epoch": 502} {"train_loss": -5.374089241027832, "global_step": 21087, "epoch": 502} {"train_loss": -5.33728551864624, "global_step": 21088, "epoch": 502} {"train_loss": -5.296699047088623, "global_step": 21089, "epoch": 502} {"train_loss": -5.402932643890381, "global_step": 21090, "epoch": 502} {"train_loss": -5.308814525604248, "global_step": 21091, "epoch": 502} {"train_loss": -5.352148056030273, "global_step": 21092, "epoch": 502} {"train_loss": -5.178351402282715, "global_step": 21093, "epoch": 502} {"train_loss": -5.246571063995361, "global_step": 21094, "epoch": 502} {"train_loss": -5.302324295043945, "global_step": 21095, "epoch": 502} {"train_loss": -5.364657402038574, "global_step": 21096, "epoch": 502} {"train_loss": -5.430818557739258, "global_step": 21097, "epoch": 502} {"train_loss": -5.179228782653809, "global_step": 21098, "epoch": 502} {"train_loss": -5.402709007263184, "global_step": 21099, "epoch": 502} {"train_loss": -5.215126991271973, "global_step": 21100, "epoch": 502} {"train_loss": -5.381246089935303, "global_step": 21101, "epoch": 502} {"train_loss": -5.375539779663086, "global_step": 21102, "epoch": 502} {"train_loss": -5.314899444580078, "global_step": 21103, "epoch": 502} {"train_loss": -5.408599853515625, "global_step": 21104, "epoch": 502} {"train_loss": -5.365933418273926, "global_step": 21105, "epoch": 502} {"train_loss": -5.178307056427002, "global_step": 21106, "epoch": 502} {"train_loss": -5.27691650390625, "global_step": 21107, "epoch": 502} {"train_loss": -5.377497673034668, "global_step": 21108, "epoch": 502} {"train_loss": -5.207662582397461, "global_step": 21109, "epoch": 502} {"train_loss": -5.373196601867676, "global_step": 21110, "epoch": 502} {"train_loss": -5.36832332611084, "global_step": 21111, "epoch": 502} {"train_loss": -5.2696685791015625, "global_step": 21112, "epoch": 502} {"train_loss": -5.407912254333496, "global_step": 21113, "epoch": 502} {"train_loss": -5.376721382141113, "global_step": 21114, "epoch": 502} {"train_loss": -5.318443775177002, "global_step": 21115, "epoch": 502} {"train_loss": -5.338644981384277, "global_step": 21116, "epoch": 502} {"train_loss": -5.43453311920166, "global_step": 21117, "epoch": 502} {"train_loss": -5.30317497253418, "global_step": 21118, "epoch": 502} {"train_loss": -5.21796989440918, "global_step": 21119, "epoch": 502} {"train_loss": -5.3010358810424805, "global_step": 21120, "epoch": 502} {"train_loss": -5.1585845947265625, "global_step": 21121, "epoch": 502} {"train_loss": -5.219482421875, "global_step": 21122, "epoch": 502} {"train_loss": -5.383298873901367, "global_step": 21123, "epoch": 502} {"train_loss": -5.357670307159424, "global_step": 21124, "epoch": 502} {"train_loss": -5.313806125095913, "global_step": 21125, "epoch": 502, "val_loss": 76230.5390625} {"train_loss": -5.334820747375488, "global_step": 21126, "epoch": 503} {"train_loss": -5.108980178833008, "global_step": 21127, "epoch": 503} {"train_loss": -5.289437294006348, "global_step": 21128, "epoch": 503} {"train_loss": -5.414665222167969, "global_step": 21129, "epoch": 503} {"train_loss": -5.173160076141357, "global_step": 21130, "epoch": 503} {"train_loss": -5.337301254272461, "global_step": 21131, "epoch": 503} {"train_loss": -5.377081871032715, "global_step": 21132, "epoch": 503} {"train_loss": -5.318957805633545, "global_step": 21133, "epoch": 503} {"train_loss": -5.392973899841309, "global_step": 21134, "epoch": 503} {"train_loss": -5.286606788635254, "global_step": 21135, "epoch": 503} {"train_loss": -5.400339126586914, "global_step": 21136, "epoch": 503} {"train_loss": -5.226555824279785, "global_step": 21137, "epoch": 503} {"train_loss": -5.169322967529297, "global_step": 21138, "epoch": 503} {"train_loss": -5.291024208068848, "global_step": 21139, "epoch": 503} {"train_loss": -5.404020309448242, "global_step": 21140, "epoch": 503} {"train_loss": -5.266716003417969, "global_step": 21141, "epoch": 503} {"train_loss": -5.256948471069336, "global_step": 21142, "epoch": 503} {"train_loss": -5.286596775054932, "global_step": 21143, "epoch": 503} {"train_loss": -5.365421295166016, "global_step": 21144, "epoch": 503} {"train_loss": -5.2361602783203125, "global_step": 21145, "epoch": 503} {"train_loss": -5.393376350402832, "global_step": 21146, "epoch": 503} {"train_loss": -5.266507148742676, "global_step": 21147, "epoch": 503} {"train_loss": -5.351987838745117, "global_step": 21148, "epoch": 503} {"train_loss": -5.17680025100708, "global_step": 21149, "epoch": 503} {"train_loss": -5.148560523986816, "global_step": 21150, "epoch": 503} {"train_loss": -5.034642696380615, "global_step": 21151, "epoch": 503} {"train_loss": -5.064149856567383, "global_step": 21152, "epoch": 503} {"train_loss": -5.324583053588867, "global_step": 21153, "epoch": 503} {"train_loss": -5.11113166809082, "global_step": 21154, "epoch": 503} {"train_loss": -5.32376766204834, "global_step": 21155, "epoch": 503} {"train_loss": -5.216737747192383, "global_step": 21156, "epoch": 503} {"train_loss": -5.138612747192383, "global_step": 21157, "epoch": 503} {"train_loss": -5.371902942657471, "global_step": 21158, "epoch": 503} {"train_loss": -5.214804172515869, "global_step": 21159, "epoch": 503} {"train_loss": -5.3633904457092285, "global_step": 21160, "epoch": 503} {"train_loss": -5.155060291290283, "global_step": 21161, "epoch": 503} {"train_loss": -5.237811088562012, "global_step": 21162, "epoch": 503} {"train_loss": -5.33230447769165, "global_step": 21163, "epoch": 503} {"train_loss": -5.264275074005127, "global_step": 21164, "epoch": 503} {"train_loss": -5.360592842102051, "global_step": 21165, "epoch": 503} {"train_loss": -5.289161682128906, "global_step": 21166, "epoch": 503} {"train_loss": -5.271746646790278, "global_step": 21167, "epoch": 503, "val_loss": 76936.1875} {"train_loss": -5.330369472503662, "global_step": 21168, "epoch": 504} {"train_loss": -5.2029805183410645, "global_step": 21169, "epoch": 504} {"train_loss": -5.341579437255859, "global_step": 21170, "epoch": 504} {"train_loss": -5.297362327575684, "global_step": 21171, "epoch": 504} {"train_loss": -5.351225852966309, "global_step": 21172, "epoch": 504} {"train_loss": -5.304987907409668, "global_step": 21173, "epoch": 504} {"train_loss": -5.385893821716309, "global_step": 21174, "epoch": 504} {"train_loss": -5.3133158683776855, "global_step": 21175, "epoch": 504} {"train_loss": -5.3159379959106445, "global_step": 21176, "epoch": 504} {"train_loss": -5.383796691894531, "global_step": 21177, "epoch": 504} {"train_loss": -5.252727508544922, "global_step": 21178, "epoch": 504} {"train_loss": -5.276718616485596, "global_step": 21179, "epoch": 504} {"train_loss": -5.374300479888916, "global_step": 21180, "epoch": 504} {"train_loss": -5.24464225769043, "global_step": 21181, "epoch": 504} {"train_loss": -5.20145320892334, "global_step": 21182, "epoch": 504} {"train_loss": -5.270877361297607, "global_step": 21183, "epoch": 504} {"train_loss": -5.2536540031433105, "global_step": 21184, "epoch": 504} {"train_loss": -5.05979585647583, "global_step": 21185, "epoch": 504} {"train_loss": -5.452991485595703, "global_step": 21186, "epoch": 504} {"train_loss": -5.1887102127075195, "global_step": 21187, "epoch": 504} {"train_loss": -5.305450439453125, "global_step": 21188, "epoch": 504} {"train_loss": -5.274084091186523, "global_step": 21189, "epoch": 504} {"train_loss": -5.096739768981934, "global_step": 21190, "epoch": 504} {"train_loss": -5.300771713256836, "global_step": 21191, "epoch": 504} {"train_loss": -5.1331987380981445, "global_step": 21192, "epoch": 504} {"train_loss": -5.379232406616211, "global_step": 21193, "epoch": 504} {"train_loss": -5.117742538452148, "global_step": 21194, "epoch": 504} {"train_loss": -5.196734428405762, "global_step": 21195, "epoch": 504} {"train_loss": -5.456521034240723, "global_step": 21196, "epoch": 504} {"train_loss": -5.127008438110352, "global_step": 21197, "epoch": 504} {"train_loss": -5.247549533843994, "global_step": 21198, "epoch": 504} {"train_loss": -5.030314922332764, "global_step": 21199, "epoch": 504} {"train_loss": -5.274197101593018, "global_step": 21200, "epoch": 504} {"train_loss": -5.169100761413574, "global_step": 21201, "epoch": 504} {"train_loss": -5.153903961181641, "global_step": 21202, "epoch": 504} {"train_loss": -5.196314811706543, "global_step": 21203, "epoch": 504} {"train_loss": -5.401917457580566, "global_step": 21204, "epoch": 504} {"train_loss": -5.238308906555176, "global_step": 21205, "epoch": 504} {"train_loss": -5.395341873168945, "global_step": 21206, "epoch": 504} {"train_loss": -5.336718559265137, "global_step": 21207, "epoch": 504} {"train_loss": -5.273237228393555, "global_step": 21208, "epoch": 504} {"train_loss": -5.268893037523542, "global_step": 21209, "epoch": 504, "val_loss": 75863.8046875} {"train_loss": -5.394776344299316, "global_step": 21210, "epoch": 505} {"train_loss": -5.416970252990723, "global_step": 21211, "epoch": 505} {"train_loss": -5.354775428771973, "global_step": 21212, "epoch": 505} {"train_loss": -5.422703742980957, "global_step": 21213, "epoch": 505} {"train_loss": -5.245323181152344, "global_step": 21214, "epoch": 505} {"train_loss": -5.359532833099365, "global_step": 21215, "epoch": 505} {"train_loss": -5.299687385559082, "global_step": 21216, "epoch": 505} {"train_loss": -5.317941665649414, "global_step": 21217, "epoch": 505} {"train_loss": -5.316288471221924, "global_step": 21218, "epoch": 505} {"train_loss": -5.445878028869629, "global_step": 21219, "epoch": 505} {"train_loss": -5.468277931213379, "global_step": 21220, "epoch": 505} {"train_loss": -5.370834827423096, "global_step": 21221, "epoch": 505} {"train_loss": -5.3874993324279785, "global_step": 21222, "epoch": 505} {"train_loss": -5.378847122192383, "global_step": 21223, "epoch": 505} {"train_loss": -5.455023765563965, "global_step": 21224, "epoch": 505} {"train_loss": -5.366975784301758, "global_step": 21225, "epoch": 505} {"train_loss": -5.299909591674805, "global_step": 21226, "epoch": 505} {"train_loss": -5.314784526824951, "global_step": 21227, "epoch": 505} {"train_loss": -5.342506408691406, "global_step": 21228, "epoch": 505} {"train_loss": -5.214210033416748, "global_step": 21229, "epoch": 505} {"train_loss": -5.267309665679932, "global_step": 21230, "epoch": 505} {"train_loss": -5.352052211761475, "global_step": 21231, "epoch": 505} {"train_loss": -5.282869815826416, "global_step": 21232, "epoch": 505} {"train_loss": -5.30759859085083, "global_step": 21233, "epoch": 505} {"train_loss": -5.191795349121094, "global_step": 21234, "epoch": 505} {"train_loss": -5.276969909667969, "global_step": 21235, "epoch": 505} {"train_loss": -5.144225597381592, "global_step": 21236, "epoch": 505} {"train_loss": -5.335188865661621, "global_step": 21237, "epoch": 505} {"train_loss": -5.295777797698975, "global_step": 21238, "epoch": 505} {"train_loss": -5.35466194152832, "global_step": 21239, "epoch": 505} {"train_loss": -5.345455169677734, "global_step": 21240, "epoch": 505} {"train_loss": -5.257957935333252, "global_step": 21241, "epoch": 505} {"train_loss": -5.3138885498046875, "global_step": 21242, "epoch": 505} {"train_loss": -5.418576240539551, "global_step": 21243, "epoch": 505} {"train_loss": -5.230725288391113, "global_step": 21244, "epoch": 505} {"train_loss": -5.221794128417969, "global_step": 21245, "epoch": 505} {"train_loss": -5.247373104095459, "global_step": 21246, "epoch": 505} {"train_loss": -5.268031120300293, "global_step": 21247, "epoch": 505} {"train_loss": -5.400949478149414, "global_step": 21248, "epoch": 505} {"train_loss": -5.208658695220947, "global_step": 21249, "epoch": 505} {"train_loss": -5.187572002410889, "global_step": 21250, "epoch": 505} {"train_loss": -5.319505725588117, "global_step": 21251, "epoch": 505, "val_loss": 75910.4609375} {"train_loss": -5.388907432556152, "global_step": 21252, "epoch": 506} {"train_loss": -5.280667781829834, "global_step": 21253, "epoch": 506} {"train_loss": -5.44219970703125, "global_step": 21254, "epoch": 506} {"train_loss": -5.347069263458252, "global_step": 21255, "epoch": 506} {"train_loss": -5.384779930114746, "global_step": 21256, "epoch": 506} {"train_loss": -5.358670234680176, "global_step": 21257, "epoch": 506} {"train_loss": -5.19512939453125, "global_step": 21258, "epoch": 506} {"train_loss": -5.408880233764648, "global_step": 21259, "epoch": 506} {"train_loss": -5.1884355545043945, "global_step": 21260, "epoch": 506} {"train_loss": -5.263050079345703, "global_step": 21261, "epoch": 506} {"train_loss": -5.284384250640869, "global_step": 21262, "epoch": 506} {"train_loss": -5.35969352722168, "global_step": 21263, "epoch": 506} {"train_loss": -5.262106418609619, "global_step": 21264, "epoch": 506} {"train_loss": -5.393558502197266, "global_step": 21265, "epoch": 506} {"train_loss": -5.340047836303711, "global_step": 21266, "epoch": 506} {"train_loss": -5.146362781524658, "global_step": 21267, "epoch": 506} {"train_loss": -5.401843547821045, "global_step": 21268, "epoch": 506} {"train_loss": -5.221844673156738, "global_step": 21269, "epoch": 506} {"train_loss": -5.439936637878418, "global_step": 21270, "epoch": 506} {"train_loss": -5.333809852600098, "global_step": 21271, "epoch": 506} {"train_loss": -5.3068647384643555, "global_step": 21272, "epoch": 506} {"train_loss": -5.390790939331055, "global_step": 21273, "epoch": 506} {"train_loss": -5.362648963928223, "global_step": 21274, "epoch": 506} {"train_loss": -5.303007125854492, "global_step": 21275, "epoch": 506} {"train_loss": -5.347832202911377, "global_step": 21276, "epoch": 506} {"train_loss": -5.407550811767578, "global_step": 21277, "epoch": 506} {"train_loss": -5.340502738952637, "global_step": 21278, "epoch": 506} {"train_loss": -5.305421829223633, "global_step": 21279, "epoch": 506} {"train_loss": -5.187982559204102, "global_step": 21280, "epoch": 506} {"train_loss": -5.318350315093994, "global_step": 21281, "epoch": 506} {"train_loss": -5.3329596519470215, "global_step": 21282, "epoch": 506} {"train_loss": -5.383636951446533, "global_step": 21283, "epoch": 506} {"train_loss": -5.453221321105957, "global_step": 21284, "epoch": 506} {"train_loss": -5.446944236755371, "global_step": 21285, "epoch": 506} {"train_loss": -5.383489608764648, "global_step": 21286, "epoch": 506} {"train_loss": -5.310948371887207, "global_step": 21287, "epoch": 506} {"train_loss": -5.211113929748535, "global_step": 21288, "epoch": 506} {"train_loss": -5.267193794250488, "global_step": 21289, "epoch": 506} {"train_loss": -5.301520347595215, "global_step": 21290, "epoch": 506} {"train_loss": -5.326848983764648, "global_step": 21291, "epoch": 506} {"train_loss": -5.449140548706055, "global_step": 21292, "epoch": 506} {"train_loss": -5.330015159788585, "global_step": 21293, "epoch": 506, "val_loss": 77365.6015625} {"train_loss": -5.2411603927612305, "global_step": 21294, "epoch": 507} {"train_loss": -5.287595748901367, "global_step": 21295, "epoch": 507} {"train_loss": -5.368738174438477, "global_step": 21296, "epoch": 507} {"train_loss": -5.24984073638916, "global_step": 21297, "epoch": 507} {"train_loss": -5.22660493850708, "global_step": 21298, "epoch": 507} {"train_loss": -5.257599353790283, "global_step": 21299, "epoch": 507} {"train_loss": -5.278540134429932, "global_step": 21300, "epoch": 507} {"train_loss": -5.302089691162109, "global_step": 21301, "epoch": 507} {"train_loss": -5.229642391204834, "global_step": 21302, "epoch": 507} {"train_loss": -5.280086994171143, "global_step": 21303, "epoch": 507} {"train_loss": -5.393838882446289, "global_step": 21304, "epoch": 507} {"train_loss": -5.405908584594727, "global_step": 21305, "epoch": 507} {"train_loss": -5.277610778808594, "global_step": 21306, "epoch": 507} {"train_loss": -5.4313249588012695, "global_step": 21307, "epoch": 507} {"train_loss": -5.291341781616211, "global_step": 21308, "epoch": 507} {"train_loss": -5.3882341384887695, "global_step": 21309, "epoch": 507} {"train_loss": -5.347128868103027, "global_step": 21310, "epoch": 507} {"train_loss": -5.34471321105957, "global_step": 21311, "epoch": 507} {"train_loss": -5.327390670776367, "global_step": 21312, "epoch": 507} {"train_loss": -5.440194606781006, "global_step": 21313, "epoch": 507} {"train_loss": -5.322298526763916, "global_step": 21314, "epoch": 507} {"train_loss": -5.311079978942871, "global_step": 21315, "epoch": 507} {"train_loss": -5.287494659423828, "global_step": 21316, "epoch": 507} {"train_loss": -5.394720077514648, "global_step": 21317, "epoch": 507} {"train_loss": -5.257698059082031, "global_step": 21318, "epoch": 507} {"train_loss": -5.196447372436523, "global_step": 21319, "epoch": 507} {"train_loss": -5.305777072906494, "global_step": 21320, "epoch": 507} {"train_loss": -5.255145072937012, "global_step": 21321, "epoch": 507} {"train_loss": -5.373500347137451, "global_step": 21322, "epoch": 507} {"train_loss": -5.233193874359131, "global_step": 21323, "epoch": 507} {"train_loss": -5.380467414855957, "global_step": 21324, "epoch": 507} {"train_loss": -5.139839172363281, "global_step": 21325, "epoch": 507} {"train_loss": -5.379471778869629, "global_step": 21326, "epoch": 507} {"train_loss": -5.311736106872559, "global_step": 21327, "epoch": 507} {"train_loss": -5.298617839813232, "global_step": 21328, "epoch": 507} {"train_loss": -5.355340480804443, "global_step": 21329, "epoch": 507} {"train_loss": -5.338018894195557, "global_step": 21330, "epoch": 507} {"train_loss": -5.312126159667969, "global_step": 21331, "epoch": 507} {"train_loss": -5.253861427307129, "global_step": 21332, "epoch": 507} {"train_loss": -5.183755397796631, "global_step": 21333, "epoch": 507} {"train_loss": -5.286892890930176, "global_step": 21334, "epoch": 507} {"train_loss": -5.307353167306809, "global_step": 21335, "epoch": 507, "val_loss": 75998.703125} {"train_loss": -5.327676773071289, "global_step": 21336, "epoch": 508} {"train_loss": -5.385109901428223, "global_step": 21337, "epoch": 508} {"train_loss": -5.249753475189209, "global_step": 21338, "epoch": 508} {"train_loss": -5.37139892578125, "global_step": 21339, "epoch": 508} {"train_loss": -5.313509941101074, "global_step": 21340, "epoch": 508} {"train_loss": -5.414286136627197, "global_step": 21341, "epoch": 508} {"train_loss": -5.325810432434082, "global_step": 21342, "epoch": 508} {"train_loss": -5.440157890319824, "global_step": 21343, "epoch": 508} {"train_loss": -5.380982875823975, "global_step": 21344, "epoch": 508} {"train_loss": -5.3364338874816895, "global_step": 21345, "epoch": 508} {"train_loss": -5.447513580322266, "global_step": 21346, "epoch": 508} {"train_loss": -5.3717241287231445, "global_step": 21347, "epoch": 508} {"train_loss": -5.261384010314941, "global_step": 21348, "epoch": 508} {"train_loss": -5.490701675415039, "global_step": 21349, "epoch": 508} {"train_loss": -5.329350471496582, "global_step": 21350, "epoch": 508} {"train_loss": -5.2648701667785645, "global_step": 21351, "epoch": 508} {"train_loss": -5.325162887573242, "global_step": 21352, "epoch": 508} {"train_loss": -5.329614162445068, "global_step": 21353, "epoch": 508} {"train_loss": -5.063847541809082, "global_step": 21354, "epoch": 508} {"train_loss": -5.323261260986328, "global_step": 21355, "epoch": 508} {"train_loss": -5.248805046081543, "global_step": 21356, "epoch": 508} {"train_loss": -5.281222343444824, "global_step": 21357, "epoch": 508} {"train_loss": -5.1359477043151855, "global_step": 21358, "epoch": 508} {"train_loss": -5.250763416290283, "global_step": 21359, "epoch": 508} {"train_loss": -5.488479137420654, "global_step": 21360, "epoch": 508} {"train_loss": -5.2274065017700195, "global_step": 21361, "epoch": 508} {"train_loss": -5.353713035583496, "global_step": 21362, "epoch": 508} {"train_loss": -5.4152727127075195, "global_step": 21363, "epoch": 508} {"train_loss": -5.319644927978516, "global_step": 21364, "epoch": 508} {"train_loss": -5.156571388244629, "global_step": 21365, "epoch": 508} {"train_loss": -5.183689117431641, "global_step": 21366, "epoch": 508} {"train_loss": -5.26331090927124, "global_step": 21367, "epoch": 508} {"train_loss": -5.252120018005371, "global_step": 21368, "epoch": 508} {"train_loss": -5.227331638336182, "global_step": 21369, "epoch": 508} {"train_loss": -5.315841197967529, "global_step": 21370, "epoch": 508} {"train_loss": -5.275040149688721, "global_step": 21371, "epoch": 508} {"train_loss": -5.283876895904541, "global_step": 21372, "epoch": 508} {"train_loss": -5.399196624755859, "global_step": 21373, "epoch": 508} {"train_loss": -5.179067611694336, "global_step": 21374, "epoch": 508} {"train_loss": -5.285386562347412, "global_step": 21375, "epoch": 508} {"train_loss": -5.30784797668457, "global_step": 21376, "epoch": 508} {"train_loss": -5.306840113231114, "global_step": 21377, "epoch": 508, "val_loss": 75470.8671875} {"train_loss": -5.32061767578125, "global_step": 21378, "epoch": 509} {"train_loss": -5.3783769607543945, "global_step": 21379, "epoch": 509} {"train_loss": -5.391942024230957, "global_step": 21380, "epoch": 509} {"train_loss": -5.294710636138916, "global_step": 21381, "epoch": 509} {"train_loss": -5.324384689331055, "global_step": 21382, "epoch": 509} {"train_loss": -5.23074197769165, "global_step": 21383, "epoch": 509} {"train_loss": -5.378853797912598, "global_step": 21384, "epoch": 509} {"train_loss": -5.2143025398254395, "global_step": 21385, "epoch": 509} {"train_loss": -5.289233207702637, "global_step": 21386, "epoch": 509} {"train_loss": -5.409046173095703, "global_step": 21387, "epoch": 509} {"train_loss": -5.208573341369629, "global_step": 21388, "epoch": 509} {"train_loss": -5.373941898345947, "global_step": 21389, "epoch": 509} {"train_loss": -5.324235439300537, "global_step": 21390, "epoch": 509} {"train_loss": -5.268146514892578, "global_step": 21391, "epoch": 509} {"train_loss": -5.216335296630859, "global_step": 21392, "epoch": 509} {"train_loss": -5.325400352478027, "global_step": 21393, "epoch": 509} {"train_loss": -5.176314830780029, "global_step": 21394, "epoch": 509} {"train_loss": -5.349496841430664, "global_step": 21395, "epoch": 509} {"train_loss": -5.349185943603516, "global_step": 21396, "epoch": 509} {"train_loss": -5.262613773345947, "global_step": 21397, "epoch": 509} {"train_loss": -5.27325963973999, "global_step": 21398, "epoch": 509} {"train_loss": -5.3700361251831055, "global_step": 21399, "epoch": 509} {"train_loss": -5.363016128540039, "global_step": 21400, "epoch": 509} {"train_loss": -5.1454668045043945, "global_step": 21401, "epoch": 509} {"train_loss": -5.372828483581543, "global_step": 21402, "epoch": 509} {"train_loss": -5.319853782653809, "global_step": 21403, "epoch": 509} {"train_loss": -5.439994812011719, "global_step": 21404, "epoch": 509} {"train_loss": -5.391616344451904, "global_step": 21405, "epoch": 509} {"train_loss": -5.363274097442627, "global_step": 21406, "epoch": 509} {"train_loss": -5.393988609313965, "global_step": 21407, "epoch": 509} {"train_loss": -5.322549343109131, "global_step": 21408, "epoch": 509} {"train_loss": -5.334138870239258, "global_step": 21409, "epoch": 509} {"train_loss": -5.267530918121338, "global_step": 21410, "epoch": 509} {"train_loss": -5.386137962341309, "global_step": 21411, "epoch": 509} {"train_loss": -5.265746116638184, "global_step": 21412, "epoch": 509} {"train_loss": -5.295019626617432, "global_step": 21413, "epoch": 509} {"train_loss": -5.225583076477051, "global_step": 21414, "epoch": 509} {"train_loss": -5.357701301574707, "global_step": 21415, "epoch": 509} {"train_loss": -5.221193313598633, "global_step": 21416, "epoch": 509} {"train_loss": -5.392922401428223, "global_step": 21417, "epoch": 509} {"train_loss": -5.333561897277832, "global_step": 21418, "epoch": 509} {"train_loss": -5.315934396925426, "global_step": 21419, "epoch": 509, "val_loss": 75915.0703125} {"train_loss": -5.2707719802856445, "global_step": 21420, "epoch": 510} {"train_loss": -5.341606616973877, "global_step": 21421, "epoch": 510} {"train_loss": -5.206430912017822, "global_step": 21422, "epoch": 510} {"train_loss": -5.515833377838135, "global_step": 21423, "epoch": 510} {"train_loss": -5.419290065765381, "global_step": 21424, "epoch": 510} {"train_loss": -5.2747273445129395, "global_step": 21425, "epoch": 510} {"train_loss": -5.235513210296631, "global_step": 21426, "epoch": 510} {"train_loss": -5.307671546936035, "global_step": 21427, "epoch": 510} {"train_loss": -5.282382965087891, "global_step": 21428, "epoch": 510} {"train_loss": -5.399440765380859, "global_step": 21429, "epoch": 510} {"train_loss": -5.398842811584473, "global_step": 21430, "epoch": 510} {"train_loss": -5.218632221221924, "global_step": 21431, "epoch": 510} {"train_loss": -5.306153774261475, "global_step": 21432, "epoch": 510} {"train_loss": -5.19589900970459, "global_step": 21433, "epoch": 510} {"train_loss": -5.341958522796631, "global_step": 21434, "epoch": 510} {"train_loss": -5.474699020385742, "global_step": 21435, "epoch": 510} {"train_loss": -5.326294422149658, "global_step": 21436, "epoch": 510} {"train_loss": -5.260315895080566, "global_step": 21437, "epoch": 510} {"train_loss": -5.323798656463623, "global_step": 21438, "epoch": 510} {"train_loss": -5.267989635467529, "global_step": 21439, "epoch": 510} {"train_loss": -5.433839797973633, "global_step": 21440, "epoch": 510} {"train_loss": -5.304475784301758, "global_step": 21441, "epoch": 510} {"train_loss": -5.2068986892700195, "global_step": 21442, "epoch": 510} {"train_loss": -5.3542046546936035, "global_step": 21443, "epoch": 510} {"train_loss": -5.377947807312012, "global_step": 21444, "epoch": 510} {"train_loss": -5.264578342437744, "global_step": 21445, "epoch": 510} {"train_loss": -5.2921881675720215, "global_step": 21446, "epoch": 510} {"train_loss": -5.323783874511719, "global_step": 21447, "epoch": 510} {"train_loss": -5.268510818481445, "global_step": 21448, "epoch": 510} {"train_loss": -5.383708953857422, "global_step": 21449, "epoch": 510} {"train_loss": -5.4332170486450195, "global_step": 21450, "epoch": 510} {"train_loss": -5.2870612144470215, "global_step": 21451, "epoch": 510} {"train_loss": -5.3934326171875, "global_step": 21452, "epoch": 510} {"train_loss": -5.384316444396973, "global_step": 21453, "epoch": 510} {"train_loss": -5.295122146606445, "global_step": 21454, "epoch": 510} {"train_loss": -5.357366561889648, "global_step": 21455, "epoch": 510} {"train_loss": -5.286810874938965, "global_step": 21456, "epoch": 510} {"train_loss": -5.446716785430908, "global_step": 21457, "epoch": 510} {"train_loss": -5.40971565246582, "global_step": 21458, "epoch": 510} {"train_loss": -5.218832969665527, "global_step": 21459, "epoch": 510} {"train_loss": -5.301052093505859, "global_step": 21460, "epoch": 510} {"train_loss": -5.3234547319866365, "global_step": 21461, "epoch": 510, "val_loss": 76507.2421875} {"train_loss": -5.365893363952637, "global_step": 21462, "epoch": 511} {"train_loss": -5.352777004241943, "global_step": 21463, "epoch": 511} {"train_loss": -5.311850547790527, "global_step": 21464, "epoch": 511} {"train_loss": -5.334090709686279, "global_step": 21465, "epoch": 511} {"train_loss": -5.261436462402344, "global_step": 21466, "epoch": 511} {"train_loss": -5.299619674682617, "global_step": 21467, "epoch": 511} {"train_loss": -5.422176361083984, "global_step": 21468, "epoch": 511} {"train_loss": -5.225352764129639, "global_step": 21469, "epoch": 511} {"train_loss": -5.35670280456543, "global_step": 21470, "epoch": 511} {"train_loss": -5.416072368621826, "global_step": 21471, "epoch": 511} {"train_loss": -5.288760662078857, "global_step": 21472, "epoch": 511} {"train_loss": -5.344839096069336, "global_step": 21473, "epoch": 511} {"train_loss": -5.226322174072266, "global_step": 21474, "epoch": 511} {"train_loss": -5.256349563598633, "global_step": 21475, "epoch": 511} {"train_loss": -5.413236618041992, "global_step": 21476, "epoch": 511} {"train_loss": -5.168238639831543, "global_step": 21477, "epoch": 511} {"train_loss": -5.374412536621094, "global_step": 21478, "epoch": 511} {"train_loss": -5.378225803375244, "global_step": 21479, "epoch": 511} {"train_loss": -5.399360179901123, "global_step": 21480, "epoch": 511} {"train_loss": -5.2780303955078125, "global_step": 21481, "epoch": 511} {"train_loss": -5.367475986480713, "global_step": 21482, "epoch": 511} {"train_loss": -5.411772727966309, "global_step": 21483, "epoch": 511} {"train_loss": -5.3337860107421875, "global_step": 21484, "epoch": 511} {"train_loss": -5.209814071655273, "global_step": 21485, "epoch": 511} {"train_loss": -5.348628044128418, "global_step": 21486, "epoch": 511} {"train_loss": -5.426095008850098, "global_step": 21487, "epoch": 511} {"train_loss": -5.315106391906738, "global_step": 21488, "epoch": 511} {"train_loss": -5.257076263427734, "global_step": 21489, "epoch": 511} {"train_loss": -5.307761192321777, "global_step": 21490, "epoch": 511} {"train_loss": -5.264467239379883, "global_step": 21491, "epoch": 511} {"train_loss": -5.331592082977295, "global_step": 21492, "epoch": 511} {"train_loss": -5.3830413818359375, "global_step": 21493, "epoch": 511} {"train_loss": -5.391131401062012, "global_step": 21494, "epoch": 511} {"train_loss": -5.433080673217773, "global_step": 21495, "epoch": 511} {"train_loss": -5.178488254547119, "global_step": 21496, "epoch": 511} {"train_loss": -5.4338154792785645, "global_step": 21497, "epoch": 511} {"train_loss": -5.390005588531494, "global_step": 21498, "epoch": 511} {"train_loss": -5.226223468780518, "global_step": 21499, "epoch": 511} {"train_loss": -5.279872417449951, "global_step": 21500, "epoch": 511} {"train_loss": -5.40219783782959, "global_step": 21501, "epoch": 511} {"train_loss": -5.406209468841553, "global_step": 21502, "epoch": 511} {"train_loss": -5.330684003375826, "global_step": 21503, "epoch": 511, "val_loss": 75764.0625} {"train_loss": -5.367725372314453, "global_step": 21504, "epoch": 512} {"train_loss": -5.374325752258301, "global_step": 21505, "epoch": 512} {"train_loss": -5.205295085906982, "global_step": 21506, "epoch": 512} {"train_loss": -5.173827648162842, "global_step": 21507, "epoch": 512} {"train_loss": -5.5570878982543945, "global_step": 21508, "epoch": 512} {"train_loss": -5.423377990722656, "global_step": 21509, "epoch": 512} {"train_loss": -5.281195640563965, "global_step": 21510, "epoch": 512} {"train_loss": -5.241157531738281, "global_step": 21511, "epoch": 512} {"train_loss": -5.3160905838012695, "global_step": 21512, "epoch": 512} {"train_loss": -5.347498416900635, "global_step": 21513, "epoch": 512} {"train_loss": -5.44429874420166, "global_step": 21514, "epoch": 512} {"train_loss": -5.310871124267578, "global_step": 21515, "epoch": 512} {"train_loss": -5.274949073791504, "global_step": 21516, "epoch": 512} {"train_loss": -5.368282318115234, "global_step": 21517, "epoch": 512} {"train_loss": -5.206961631774902, "global_step": 21518, "epoch": 512} {"train_loss": -5.357956886291504, "global_step": 21519, "epoch": 512} {"train_loss": -5.250558376312256, "global_step": 21520, "epoch": 512} {"train_loss": -5.382536888122559, "global_step": 21521, "epoch": 512} {"train_loss": -5.191041946411133, "global_step": 21522, "epoch": 512} {"train_loss": -5.280572891235352, "global_step": 21523, "epoch": 512} {"train_loss": -5.348756790161133, "global_step": 21524, "epoch": 512} {"train_loss": -5.365457534790039, "global_step": 21525, "epoch": 512} {"train_loss": -5.362979888916016, "global_step": 21526, "epoch": 512} {"train_loss": -5.389005661010742, "global_step": 21527, "epoch": 512} {"train_loss": -5.339593887329102, "global_step": 21528, "epoch": 512} {"train_loss": -5.468592643737793, "global_step": 21529, "epoch": 512} {"train_loss": -5.291825294494629, "global_step": 21530, "epoch": 512} {"train_loss": -5.402304649353027, "global_step": 21531, "epoch": 512} {"train_loss": -5.452987194061279, "global_step": 21532, "epoch": 512} {"train_loss": -5.357242584228516, "global_step": 21533, "epoch": 512} {"train_loss": -5.154287338256836, "global_step": 21534, "epoch": 512} {"train_loss": -5.266913414001465, "global_step": 21535, "epoch": 512} {"train_loss": -5.417829990386963, "global_step": 21536, "epoch": 512} {"train_loss": -5.178922653198242, "global_step": 21537, "epoch": 512} {"train_loss": -5.344296455383301, "global_step": 21538, "epoch": 512} {"train_loss": -5.370007514953613, "global_step": 21539, "epoch": 512} {"train_loss": -5.2274274826049805, "global_step": 21540, "epoch": 512} {"train_loss": -5.295062065124512, "global_step": 21541, "epoch": 512} {"train_loss": -5.493553638458252, "global_step": 21542, "epoch": 512} {"train_loss": -5.192899227142334, "global_step": 21543, "epoch": 512} {"train_loss": -5.385551452636719, "global_step": 21544, "epoch": 512} {"train_loss": -5.329105184191749, "global_step": 21545, "epoch": 512, "val_loss": 76283.7109375} {"train_loss": -5.2407989501953125, "global_step": 21546, "epoch": 513} {"train_loss": -5.323314189910889, "global_step": 21547, "epoch": 513} {"train_loss": -5.304878234863281, "global_step": 21548, "epoch": 513} {"train_loss": -5.316254138946533, "global_step": 21549, "epoch": 513} {"train_loss": -5.373485565185547, "global_step": 21550, "epoch": 513} {"train_loss": -5.226552963256836, "global_step": 21551, "epoch": 513} {"train_loss": -5.292577743530273, "global_step": 21552, "epoch": 513} {"train_loss": -5.290450572967529, "global_step": 21553, "epoch": 513} {"train_loss": -5.203784942626953, "global_step": 21554, "epoch": 513} {"train_loss": -5.337064266204834, "global_step": 21555, "epoch": 513} {"train_loss": -5.294390678405762, "global_step": 21556, "epoch": 513} {"train_loss": -5.318304061889648, "global_step": 21557, "epoch": 513} {"train_loss": -5.19383430480957, "global_step": 21558, "epoch": 513} {"train_loss": -5.288034439086914, "global_step": 21559, "epoch": 513} {"train_loss": -5.333378791809082, "global_step": 21560, "epoch": 513} {"train_loss": -5.3209662437438965, "global_step": 21561, "epoch": 513} {"train_loss": -5.22894287109375, "global_step": 21562, "epoch": 513} {"train_loss": -5.299920082092285, "global_step": 21563, "epoch": 513} {"train_loss": -5.2861223220825195, "global_step": 21564, "epoch": 513} {"train_loss": -5.2006731033325195, "global_step": 21565, "epoch": 513} {"train_loss": -5.314770698547363, "global_step": 21566, "epoch": 513} {"train_loss": -5.314155578613281, "global_step": 21567, "epoch": 513} {"train_loss": -5.290511131286621, "global_step": 21568, "epoch": 513} {"train_loss": -5.319430351257324, "global_step": 21569, "epoch": 513} {"train_loss": -5.267380714416504, "global_step": 21570, "epoch": 513} {"train_loss": -5.37277889251709, "global_step": 21571, "epoch": 513} {"train_loss": -5.297789573669434, "global_step": 21572, "epoch": 513} {"train_loss": -5.402988433837891, "global_step": 21573, "epoch": 513} {"train_loss": -5.2755842208862305, "global_step": 21574, "epoch": 513} {"train_loss": -5.422130584716797, "global_step": 21575, "epoch": 513} {"train_loss": -5.407977104187012, "global_step": 21576, "epoch": 513} {"train_loss": -5.498560905456543, "global_step": 21577, "epoch": 513} {"train_loss": -5.282881259918213, "global_step": 21578, "epoch": 513} {"train_loss": -5.382661819458008, "global_step": 21579, "epoch": 513} {"train_loss": -5.343105316162109, "global_step": 21580, "epoch": 513} {"train_loss": -5.203514099121094, "global_step": 21581, "epoch": 513} {"train_loss": -5.378594875335693, "global_step": 21582, "epoch": 513} {"train_loss": -5.215080261230469, "global_step": 21583, "epoch": 513} {"train_loss": -5.3517255783081055, "global_step": 21584, "epoch": 513} {"train_loss": -5.262084484100342, "global_step": 21585, "epoch": 513} {"train_loss": -5.357704162597656, "global_step": 21586, "epoch": 513} {"train_loss": -5.3067938827333, "global_step": 21587, "epoch": 513, "val_loss": 76466.625} {"train_loss": -5.31545877456665, "global_step": 21588, "epoch": 514} {"train_loss": -5.37993860244751, "global_step": 21589, "epoch": 514} {"train_loss": -5.496446132659912, "global_step": 21590, "epoch": 514} {"train_loss": -5.301921367645264, "global_step": 21591, "epoch": 514} {"train_loss": -5.342067718505859, "global_step": 21592, "epoch": 514} {"train_loss": -5.323201656341553, "global_step": 21593, "epoch": 514} {"train_loss": -5.273553371429443, "global_step": 21594, "epoch": 514} {"train_loss": -5.429759979248047, "global_step": 21595, "epoch": 514} {"train_loss": -5.236432075500488, "global_step": 21596, "epoch": 514} {"train_loss": -5.335198879241943, "global_step": 21597, "epoch": 514} {"train_loss": -5.329689979553223, "global_step": 21598, "epoch": 514} {"train_loss": -5.13370418548584, "global_step": 21599, "epoch": 514} {"train_loss": -5.2184343338012695, "global_step": 21600, "epoch": 514} {"train_loss": -5.3400468826293945, "global_step": 21601, "epoch": 514} {"train_loss": -5.312751770019531, "global_step": 21602, "epoch": 514} {"train_loss": -5.507483959197998, "global_step": 21603, "epoch": 514} {"train_loss": -5.301450729370117, "global_step": 21604, "epoch": 514} {"train_loss": -5.253032684326172, "global_step": 21605, "epoch": 514} {"train_loss": -5.337053298950195, "global_step": 21606, "epoch": 514} {"train_loss": -5.345104217529297, "global_step": 21607, "epoch": 514} {"train_loss": -5.33553409576416, "global_step": 21608, "epoch": 514} {"train_loss": -5.346935272216797, "global_step": 21609, "epoch": 514} {"train_loss": -5.326626777648926, "global_step": 21610, "epoch": 514} {"train_loss": -5.276432991027832, "global_step": 21611, "epoch": 514} {"train_loss": -5.438846111297607, "global_step": 21612, "epoch": 514} {"train_loss": -5.351668357849121, "global_step": 21613, "epoch": 514} {"train_loss": -5.227895736694336, "global_step": 21614, "epoch": 514} {"train_loss": -5.266736030578613, "global_step": 21615, "epoch": 514} {"train_loss": -5.337828159332275, "global_step": 21616, "epoch": 514} {"train_loss": -5.349504470825195, "global_step": 21617, "epoch": 514} {"train_loss": -5.3882598876953125, "global_step": 21618, "epoch": 514} {"train_loss": -5.203343391418457, "global_step": 21619, "epoch": 514} {"train_loss": -5.270326614379883, "global_step": 21620, "epoch": 514} {"train_loss": -5.408052444458008, "global_step": 21621, "epoch": 514} {"train_loss": -5.221474647521973, "global_step": 21622, "epoch": 514} {"train_loss": -5.296010971069336, "global_step": 21623, "epoch": 514} {"train_loss": -5.39486026763916, "global_step": 21624, "epoch": 514} {"train_loss": -5.401257514953613, "global_step": 21625, "epoch": 514} {"train_loss": -5.381903648376465, "global_step": 21626, "epoch": 514} {"train_loss": -5.310486793518066, "global_step": 21627, "epoch": 514} {"train_loss": -5.34603214263916, "global_step": 21628, "epoch": 514} {"train_loss": -5.324137233552479, "global_step": 21629, "epoch": 514, "val_loss": 76266.6015625} {"train_loss": -5.373287200927734, "global_step": 21630, "epoch": 515} {"train_loss": -5.336190700531006, "global_step": 21631, "epoch": 515} {"train_loss": -5.13399600982666, "global_step": 21632, "epoch": 515} {"train_loss": -5.262104511260986, "global_step": 21633, "epoch": 515} {"train_loss": -5.449124336242676, "global_step": 21634, "epoch": 515} {"train_loss": -5.447671413421631, "global_step": 21635, "epoch": 515} {"train_loss": -5.375782489776611, "global_step": 21636, "epoch": 515} {"train_loss": -5.218409538269043, "global_step": 21637, "epoch": 515} {"train_loss": -5.2664031982421875, "global_step": 21638, "epoch": 515} {"train_loss": -5.432309627532959, "global_step": 21639, "epoch": 515} {"train_loss": -5.241091251373291, "global_step": 21640, "epoch": 515} {"train_loss": -5.341259002685547, "global_step": 21641, "epoch": 515} {"train_loss": -5.286479949951172, "global_step": 21642, "epoch": 515} {"train_loss": -5.422543525695801, "global_step": 21643, "epoch": 515} {"train_loss": -5.264953136444092, "global_step": 21644, "epoch": 515} {"train_loss": -5.347072601318359, "global_step": 21645, "epoch": 515} {"train_loss": -5.352508544921875, "global_step": 21646, "epoch": 515} {"train_loss": -5.334364414215088, "global_step": 21647, "epoch": 515} {"train_loss": -5.418540954589844, "global_step": 21648, "epoch": 515} {"train_loss": -5.268960952758789, "global_step": 21649, "epoch": 515} {"train_loss": -5.469456195831299, "global_step": 21650, "epoch": 515} {"train_loss": -5.460035800933838, "global_step": 21651, "epoch": 515} {"train_loss": -5.397307872772217, "global_step": 21652, "epoch": 515} {"train_loss": -5.181828498840332, "global_step": 21653, "epoch": 515} {"train_loss": -5.448010444641113, "global_step": 21654, "epoch": 515} {"train_loss": -5.391950607299805, "global_step": 21655, "epoch": 515} {"train_loss": -5.273865222930908, "global_step": 21656, "epoch": 515} {"train_loss": -5.367403030395508, "global_step": 21657, "epoch": 515} {"train_loss": -5.332332134246826, "global_step": 21658, "epoch": 515} {"train_loss": -5.296621322631836, "global_step": 21659, "epoch": 515} {"train_loss": -5.384019374847412, "global_step": 21660, "epoch": 515} {"train_loss": -5.329893112182617, "global_step": 21661, "epoch": 515} {"train_loss": -5.236048698425293, "global_step": 21662, "epoch": 515} {"train_loss": -5.390581130981445, "global_step": 21663, "epoch": 515} {"train_loss": -5.36488676071167, "global_step": 21664, "epoch": 515} {"train_loss": -5.430471897125244, "global_step": 21665, "epoch": 515} {"train_loss": -5.12410831451416, "global_step": 21666, "epoch": 515} {"train_loss": -5.405117988586426, "global_step": 21667, "epoch": 515} {"train_loss": -5.335243225097656, "global_step": 21668, "epoch": 515} {"train_loss": -5.25423526763916, "global_step": 21669, "epoch": 515} {"train_loss": -5.279527187347412, "global_step": 21670, "epoch": 515} {"train_loss": -5.332490989140102, "global_step": 21671, "epoch": 515, "val_loss": 76041.9609375} {"train_loss": -5.380697727203369, "global_step": 21672, "epoch": 516} {"train_loss": -5.324306964874268, "global_step": 21673, "epoch": 516} {"train_loss": -5.3321943283081055, "global_step": 21674, "epoch": 516} {"train_loss": -5.354180335998535, "global_step": 21675, "epoch": 516} {"train_loss": -5.3363847732543945, "global_step": 21676, "epoch": 516} {"train_loss": -5.247766494750977, "global_step": 21677, "epoch": 516} {"train_loss": -5.391678333282471, "global_step": 21678, "epoch": 516} {"train_loss": -5.425772666931152, "global_step": 21679, "epoch": 516} {"train_loss": -5.2797627449035645, "global_step": 21680, "epoch": 516} {"train_loss": -5.215500354766846, "global_step": 21681, "epoch": 516} {"train_loss": -5.316423416137695, "global_step": 21682, "epoch": 516} {"train_loss": -5.309762001037598, "global_step": 21683, "epoch": 516} {"train_loss": -5.353003978729248, "global_step": 21684, "epoch": 516} {"train_loss": -5.3551435470581055, "global_step": 21685, "epoch": 516} {"train_loss": -5.274204254150391, "global_step": 21686, "epoch": 516} {"train_loss": -5.276810646057129, "global_step": 21687, "epoch": 516} {"train_loss": -5.235003471374512, "global_step": 21688, "epoch": 516} {"train_loss": -5.169689178466797, "global_step": 21689, "epoch": 516} {"train_loss": -5.347288131713867, "global_step": 21690, "epoch": 516} {"train_loss": -5.252493858337402, "global_step": 21691, "epoch": 516} {"train_loss": -5.2073869705200195, "global_step": 21692, "epoch": 516} {"train_loss": -5.250446319580078, "global_step": 21693, "epoch": 516} {"train_loss": -5.113894462585449, "global_step": 21694, "epoch": 516} {"train_loss": -5.29047966003418, "global_step": 21695, "epoch": 516} {"train_loss": -5.336769104003906, "global_step": 21696, "epoch": 516} {"train_loss": -5.240931510925293, "global_step": 21697, "epoch": 516} {"train_loss": -5.446362018585205, "global_step": 21698, "epoch": 516} {"train_loss": -5.288557052612305, "global_step": 21699, "epoch": 516} {"train_loss": -5.24252462387085, "global_step": 21700, "epoch": 516} {"train_loss": -5.254615783691406, "global_step": 21701, "epoch": 516} {"train_loss": -5.328139305114746, "global_step": 21702, "epoch": 516} {"train_loss": -5.244708061218262, "global_step": 21703, "epoch": 516} {"train_loss": -5.2565507888793945, "global_step": 21704, "epoch": 516} {"train_loss": -5.4001970291137695, "global_step": 21705, "epoch": 516} {"train_loss": -5.262265682220459, "global_step": 21706, "epoch": 516} {"train_loss": -5.378762245178223, "global_step": 21707, "epoch": 516} {"train_loss": -5.204145908355713, "global_step": 21708, "epoch": 516} {"train_loss": -5.33229398727417, "global_step": 21709, "epoch": 516} {"train_loss": -5.276925086975098, "global_step": 21710, "epoch": 516} {"train_loss": -5.23714017868042, "global_step": 21711, "epoch": 516} {"train_loss": -5.181892395019531, "global_step": 21712, "epoch": 516} {"train_loss": -5.2927914801098055, "global_step": 21713, "epoch": 516, "val_loss": 77148.1640625} {"train_loss": -5.102330207824707, "global_step": 21714, "epoch": 517} {"train_loss": -5.331897735595703, "global_step": 21715, "epoch": 517} {"train_loss": -5.432663917541504, "global_step": 21716, "epoch": 517} {"train_loss": -5.278419494628906, "global_step": 21717, "epoch": 517} {"train_loss": -5.358054161071777, "global_step": 21718, "epoch": 517} {"train_loss": -5.328486919403076, "global_step": 21719, "epoch": 517} {"train_loss": -5.252486228942871, "global_step": 21720, "epoch": 517} {"train_loss": -5.378106117248535, "global_step": 21721, "epoch": 517} {"train_loss": -5.3088459968566895, "global_step": 21722, "epoch": 517} {"train_loss": -5.126348495483398, "global_step": 21723, "epoch": 517} {"train_loss": -5.462105751037598, "global_step": 21724, "epoch": 517} {"train_loss": -5.332489967346191, "global_step": 21725, "epoch": 517} {"train_loss": -5.0976080894470215, "global_step": 21726, "epoch": 517} {"train_loss": -5.325079917907715, "global_step": 21727, "epoch": 517} {"train_loss": -5.254366874694824, "global_step": 21728, "epoch": 517} {"train_loss": -5.268894195556641, "global_step": 21729, "epoch": 517} {"train_loss": -5.432096481323242, "global_step": 21730, "epoch": 517} {"train_loss": -5.1712212562561035, "global_step": 21731, "epoch": 517} {"train_loss": -5.165387153625488, "global_step": 21732, "epoch": 517} {"train_loss": -5.244579792022705, "global_step": 21733, "epoch": 517} {"train_loss": -5.251834869384766, "global_step": 21734, "epoch": 517} {"train_loss": -5.293929100036621, "global_step": 21735, "epoch": 517} {"train_loss": -5.231840133666992, "global_step": 21736, "epoch": 517} {"train_loss": -5.297540664672852, "global_step": 21737, "epoch": 517} {"train_loss": -5.26839017868042, "global_step": 21738, "epoch": 517} {"train_loss": -5.244420528411865, "global_step": 21739, "epoch": 517} {"train_loss": -5.329494476318359, "global_step": 21740, "epoch": 517} {"train_loss": -5.274317741394043, "global_step": 21741, "epoch": 517} {"train_loss": -5.417750835418701, "global_step": 21742, "epoch": 517} {"train_loss": -5.418705940246582, "global_step": 21743, "epoch": 517} {"train_loss": -5.185390949249268, "global_step": 21744, "epoch": 517} {"train_loss": -5.233175277709961, "global_step": 21745, "epoch": 517} {"train_loss": -5.378430366516113, "global_step": 21746, "epoch": 517} {"train_loss": -5.264392852783203, "global_step": 21747, "epoch": 517} {"train_loss": -5.320552825927734, "global_step": 21748, "epoch": 517} {"train_loss": -5.311560153961182, "global_step": 21749, "epoch": 517} {"train_loss": -5.137585639953613, "global_step": 21750, "epoch": 517} {"train_loss": -5.3504958152771, "global_step": 21751, "epoch": 517} {"train_loss": -5.390279293060303, "global_step": 21752, "epoch": 517} {"train_loss": -5.309934616088867, "global_step": 21753, "epoch": 517} {"train_loss": -5.303134918212891, "global_step": 21754, "epoch": 517} {"train_loss": -5.293347006752377, "global_step": 21755, "epoch": 517, "val_loss": 75841.3203125} {"train_loss": -5.2674360275268555, "global_step": 21756, "epoch": 518} {"train_loss": -5.408557891845703, "global_step": 21757, "epoch": 518} {"train_loss": -5.30085563659668, "global_step": 21758, "epoch": 518} {"train_loss": -5.296352863311768, "global_step": 21759, "epoch": 518} {"train_loss": -5.285525321960449, "global_step": 21760, "epoch": 518} {"train_loss": -5.466892242431641, "global_step": 21761, "epoch": 518} {"train_loss": -5.255329608917236, "global_step": 21762, "epoch": 518} {"train_loss": -5.237232685089111, "global_step": 21763, "epoch": 518} {"train_loss": -5.236050605773926, "global_step": 21764, "epoch": 518} {"train_loss": -5.330256462097168, "global_step": 21765, "epoch": 518} {"train_loss": -5.326926231384277, "global_step": 21766, "epoch": 518} {"train_loss": -5.315751552581787, "global_step": 21767, "epoch": 518} {"train_loss": -5.3354034423828125, "global_step": 21768, "epoch": 518} {"train_loss": -5.368960857391357, "global_step": 21769, "epoch": 518} {"train_loss": -5.321328163146973, "global_step": 21770, "epoch": 518} {"train_loss": -5.373215198516846, "global_step": 21771, "epoch": 518} {"train_loss": -5.456928730010986, "global_step": 21772, "epoch": 518} {"train_loss": -5.405943870544434, "global_step": 21773, "epoch": 518} {"train_loss": -5.398839950561523, "global_step": 21774, "epoch": 518} {"train_loss": -5.466464996337891, "global_step": 21775, "epoch": 518} {"train_loss": -5.368512153625488, "global_step": 21776, "epoch": 518} {"train_loss": -5.418682098388672, "global_step": 21777, "epoch": 518} {"train_loss": -5.30799674987793, "global_step": 21778, "epoch": 518} {"train_loss": -5.455181121826172, "global_step": 21779, "epoch": 518} {"train_loss": -5.428523063659668, "global_step": 21780, "epoch": 518} {"train_loss": -5.371191024780273, "global_step": 21781, "epoch": 518} {"train_loss": -5.279264450073242, "global_step": 21782, "epoch": 518} {"train_loss": -5.313376426696777, "global_step": 21783, "epoch": 518} {"train_loss": -5.294808387756348, "global_step": 21784, "epoch": 518} {"train_loss": -5.308358669281006, "global_step": 21785, "epoch": 518} {"train_loss": -5.286875247955322, "global_step": 21786, "epoch": 518} {"train_loss": -5.198181629180908, "global_step": 21787, "epoch": 518} {"train_loss": -5.321055889129639, "global_step": 21788, "epoch": 518} {"train_loss": -5.328516006469727, "global_step": 21789, "epoch": 518} {"train_loss": -5.210922718048096, "global_step": 21790, "epoch": 518} {"train_loss": -5.288524627685547, "global_step": 21791, "epoch": 518} {"train_loss": -5.250718593597412, "global_step": 21792, "epoch": 518} {"train_loss": -5.282980442047119, "global_step": 21793, "epoch": 518} {"train_loss": -5.2770304679870605, "global_step": 21794, "epoch": 518} {"train_loss": -5.278635025024414, "global_step": 21795, "epoch": 518} {"train_loss": -5.317298889160156, "global_step": 21796, "epoch": 518} {"train_loss": -5.332064276649838, "global_step": 21797, "epoch": 518, "val_loss": 77089.0546875} {"train_loss": -5.30654764175415, "global_step": 21798, "epoch": 519} {"train_loss": -5.331724643707275, "global_step": 21799, "epoch": 519} {"train_loss": -5.406579971313477, "global_step": 21800, "epoch": 519} {"train_loss": -5.279144287109375, "global_step": 21801, "epoch": 519} {"train_loss": -5.1837544441223145, "global_step": 21802, "epoch": 519} {"train_loss": -5.358189582824707, "global_step": 21803, "epoch": 519} {"train_loss": -5.475352764129639, "global_step": 21804, "epoch": 519} {"train_loss": -5.2389984130859375, "global_step": 21805, "epoch": 519} {"train_loss": -5.469692230224609, "global_step": 21806, "epoch": 519} {"train_loss": -5.357253074645996, "global_step": 21807, "epoch": 519} {"train_loss": -5.303984642028809, "global_step": 21808, "epoch": 519} {"train_loss": -5.38422966003418, "global_step": 21809, "epoch": 519} {"train_loss": -5.276628494262695, "global_step": 21810, "epoch": 519} {"train_loss": -5.31447696685791, "global_step": 21811, "epoch": 519} {"train_loss": -5.409736633300781, "global_step": 21812, "epoch": 519} {"train_loss": -5.24594783782959, "global_step": 21813, "epoch": 519} {"train_loss": -5.251957893371582, "global_step": 21814, "epoch": 519} {"train_loss": -5.32347297668457, "global_step": 21815, "epoch": 519} {"train_loss": -5.270936012268066, "global_step": 21816, "epoch": 519} {"train_loss": -5.299474239349365, "global_step": 21817, "epoch": 519} {"train_loss": -5.436473846435547, "global_step": 21818, "epoch": 519} {"train_loss": -5.271414756774902, "global_step": 21819, "epoch": 519} {"train_loss": -5.2625908851623535, "global_step": 21820, "epoch": 519} {"train_loss": -5.399345874786377, "global_step": 21821, "epoch": 519} {"train_loss": -5.383907318115234, "global_step": 21822, "epoch": 519} {"train_loss": -5.320402145385742, "global_step": 21823, "epoch": 519} {"train_loss": -5.417552471160889, "global_step": 21824, "epoch": 519} {"train_loss": -5.543164253234863, "global_step": 21825, "epoch": 519} {"train_loss": -5.3796706199646, "global_step": 21826, "epoch": 519} {"train_loss": -5.370724678039551, "global_step": 21827, "epoch": 519} {"train_loss": -5.319671154022217, "global_step": 21828, "epoch": 519} {"train_loss": -5.33903694152832, "global_step": 21829, "epoch": 519} {"train_loss": -5.353158950805664, "global_step": 21830, "epoch": 519} {"train_loss": -5.384685516357422, "global_step": 21831, "epoch": 519} {"train_loss": -5.4130401611328125, "global_step": 21832, "epoch": 519} {"train_loss": -5.277112007141113, "global_step": 21833, "epoch": 519} {"train_loss": -5.301027297973633, "global_step": 21834, "epoch": 519} {"train_loss": -5.2979912757873535, "global_step": 21835, "epoch": 519} {"train_loss": -5.297671794891357, "global_step": 21836, "epoch": 519} {"train_loss": -5.424701690673828, "global_step": 21837, "epoch": 519} {"train_loss": -5.2862067222595215, "global_step": 21838, "epoch": 519} {"train_loss": -5.342580840701149, "global_step": 21839, "epoch": 519, "val_loss": 77117.6796875} {"train_loss": -5.358647346496582, "global_step": 21840, "epoch": 520} {"train_loss": -4.781240463256836, "global_step": 21841, "epoch": 520} {"train_loss": -5.172610282897949, "global_step": 21842, "epoch": 520} {"train_loss": -5.208266258239746, "global_step": 21843, "epoch": 520} {"train_loss": -4.859334945678711, "global_step": 21844, "epoch": 520} {"train_loss": -5.039870262145996, "global_step": 21845, "epoch": 520} {"train_loss": -4.9732465744018555, "global_step": 21846, "epoch": 520} {"train_loss": -5.317812919616699, "global_step": 21847, "epoch": 520} {"train_loss": -5.070812225341797, "global_step": 21848, "epoch": 520} {"train_loss": -5.177923202514648, "global_step": 21849, "epoch": 520} {"train_loss": -5.071721076965332, "global_step": 21850, "epoch": 520} {"train_loss": -5.124640464782715, "global_step": 21851, "epoch": 520} {"train_loss": -5.143980026245117, "global_step": 21852, "epoch": 520} {"train_loss": -5.135612487792969, "global_step": 21853, "epoch": 520} {"train_loss": -5.306875228881836, "global_step": 21854, "epoch": 520} {"train_loss": -5.212823390960693, "global_step": 21855, "epoch": 520} {"train_loss": -5.338881492614746, "global_step": 21856, "epoch": 520} {"train_loss": -5.252671241760254, "global_step": 21857, "epoch": 520} {"train_loss": -5.432619094848633, "global_step": 21858, "epoch": 520} {"train_loss": -5.113651752471924, "global_step": 21859, "epoch": 520} {"train_loss": -5.208189487457275, "global_step": 21860, "epoch": 520} {"train_loss": -5.207098007202148, "global_step": 21861, "epoch": 520} {"train_loss": -5.293389320373535, "global_step": 21862, "epoch": 520} {"train_loss": -5.089141368865967, "global_step": 21863, "epoch": 520} {"train_loss": -5.199182510375977, "global_step": 21864, "epoch": 520} {"train_loss": -5.298433303833008, "global_step": 21865, "epoch": 520} {"train_loss": -5.188910484313965, "global_step": 21866, "epoch": 520} {"train_loss": -5.260641574859619, "global_step": 21867, "epoch": 520} {"train_loss": -5.392551422119141, "global_step": 21868, "epoch": 520} {"train_loss": -5.086912155151367, "global_step": 21869, "epoch": 520} {"train_loss": -5.206808090209961, "global_step": 21870, "epoch": 520} {"train_loss": -5.2722272872924805, "global_step": 21871, "epoch": 520} {"train_loss": -5.101466178894043, "global_step": 21872, "epoch": 520} {"train_loss": -5.356319427490234, "global_step": 21873, "epoch": 520} {"train_loss": -5.230127334594727, "global_step": 21874, "epoch": 520} {"train_loss": -5.371267318725586, "global_step": 21875, "epoch": 520} {"train_loss": -5.329404830932617, "global_step": 21876, "epoch": 520} {"train_loss": -5.270707130432129, "global_step": 21877, "epoch": 520} {"train_loss": -5.339481353759766, "global_step": 21878, "epoch": 520} {"train_loss": -5.206534385681152, "global_step": 21879, "epoch": 520} {"train_loss": -5.322937488555908, "global_step": 21880, "epoch": 520} {"train_loss": -5.205906572796049, "global_step": 21881, "epoch": 520, "val_loss": 76665.9140625} {"train_loss": -5.1689653396606445, "global_step": 21882, "epoch": 521} {"train_loss": -5.222084045410156, "global_step": 21883, "epoch": 521} {"train_loss": -5.269617557525635, "global_step": 21884, "epoch": 521} {"train_loss": -5.447740077972412, "global_step": 21885, "epoch": 521} {"train_loss": -5.371185302734375, "global_step": 21886, "epoch": 521} {"train_loss": -5.290508270263672, "global_step": 21887, "epoch": 521} {"train_loss": -5.104532241821289, "global_step": 21888, "epoch": 521} {"train_loss": -5.404844760894775, "global_step": 21889, "epoch": 521} {"train_loss": -5.196226119995117, "global_step": 21890, "epoch": 521} {"train_loss": -5.309131622314453, "global_step": 21891, "epoch": 521} {"train_loss": -5.277653217315674, "global_step": 21892, "epoch": 521} {"train_loss": -5.453855514526367, "global_step": 21893, "epoch": 521} {"train_loss": -5.265738487243652, "global_step": 21894, "epoch": 521} {"train_loss": -5.271560192108154, "global_step": 21895, "epoch": 521} {"train_loss": -5.405872344970703, "global_step": 21896, "epoch": 521} {"train_loss": -5.258443355560303, "global_step": 21897, "epoch": 521} {"train_loss": -5.403348922729492, "global_step": 21898, "epoch": 521} {"train_loss": -5.541036128997803, "global_step": 21899, "epoch": 521} {"train_loss": -5.276296615600586, "global_step": 21900, "epoch": 521} {"train_loss": -5.346790313720703, "global_step": 21901, "epoch": 521} {"train_loss": -5.157989501953125, "global_step": 21902, "epoch": 521} {"train_loss": -5.3868255615234375, "global_step": 21903, "epoch": 521} {"train_loss": -5.3376922607421875, "global_step": 21904, "epoch": 521} {"train_loss": -5.157936096191406, "global_step": 21905, "epoch": 521} {"train_loss": -5.388824462890625, "global_step": 21906, "epoch": 521} {"train_loss": -5.357296466827393, "global_step": 21907, "epoch": 521} {"train_loss": -5.235672950744629, "global_step": 21908, "epoch": 521} {"train_loss": -5.479989528656006, "global_step": 21909, "epoch": 521} {"train_loss": -5.271033763885498, "global_step": 21910, "epoch": 521} {"train_loss": -5.2906880378723145, "global_step": 21911, "epoch": 521} {"train_loss": -5.198963165283203, "global_step": 21912, "epoch": 521} {"train_loss": -5.146791458129883, "global_step": 21913, "epoch": 521} {"train_loss": -5.245855331420898, "global_step": 21914, "epoch": 521} {"train_loss": -5.336225986480713, "global_step": 21915, "epoch": 521} {"train_loss": -5.340691089630127, "global_step": 21916, "epoch": 521} {"train_loss": -5.403559684753418, "global_step": 21917, "epoch": 521} {"train_loss": -5.366153717041016, "global_step": 21918, "epoch": 521} {"train_loss": -5.443000793457031, "global_step": 21919, "epoch": 521} {"train_loss": -5.45188045501709, "global_step": 21920, "epoch": 521} {"train_loss": -5.300206661224365, "global_step": 21921, "epoch": 521} {"train_loss": -5.366067886352539, "global_step": 21922, "epoch": 521} {"train_loss": -5.3166420459747314, "global_step": 21923, "epoch": 521, "val_loss": 76308.875} {"train_loss": -5.317351341247559, "global_step": 21924, "epoch": 522} {"train_loss": -5.2063188552856445, "global_step": 21925, "epoch": 522} {"train_loss": -5.2111687660217285, "global_step": 21926, "epoch": 522} {"train_loss": -5.320755958557129, "global_step": 21927, "epoch": 522} {"train_loss": -5.36191463470459, "global_step": 21928, "epoch": 522} {"train_loss": -5.274075508117676, "global_step": 21929, "epoch": 522} {"train_loss": -5.478106498718262, "global_step": 21930, "epoch": 522} {"train_loss": -5.2467546463012695, "global_step": 21931, "epoch": 522} {"train_loss": -5.00760555267334, "global_step": 21932, "epoch": 522} {"train_loss": -5.423898696899414, "global_step": 21933, "epoch": 522} {"train_loss": -5.410021781921387, "global_step": 21934, "epoch": 522} {"train_loss": -5.382857322692871, "global_step": 21935, "epoch": 522} {"train_loss": -5.395166873931885, "global_step": 21936, "epoch": 522} {"train_loss": -5.277350902557373, "global_step": 21937, "epoch": 522} {"train_loss": -5.316249847412109, "global_step": 21938, "epoch": 522} {"train_loss": -5.371638298034668, "global_step": 21939, "epoch": 522} {"train_loss": -5.409967422485352, "global_step": 21940, "epoch": 522} {"train_loss": -5.1975812911987305, "global_step": 21941, "epoch": 522} {"train_loss": -5.344680309295654, "global_step": 21942, "epoch": 522} {"train_loss": -5.38605260848999, "global_step": 21943, "epoch": 522} {"train_loss": -5.220486164093018, "global_step": 21944, "epoch": 522} {"train_loss": -5.247879981994629, "global_step": 21945, "epoch": 522} {"train_loss": -5.2250261306762695, "global_step": 21946, "epoch": 522} {"train_loss": -5.315454483032227, "global_step": 21947, "epoch": 522} {"train_loss": -5.284990310668945, "global_step": 21948, "epoch": 522} {"train_loss": -5.195874214172363, "global_step": 21949, "epoch": 522} {"train_loss": -5.326532363891602, "global_step": 21950, "epoch": 522} {"train_loss": -5.351409435272217, "global_step": 21951, "epoch": 522} {"train_loss": -5.294147491455078, "global_step": 21952, "epoch": 522} {"train_loss": -5.4058685302734375, "global_step": 21953, "epoch": 522} {"train_loss": -5.406573295593262, "global_step": 21954, "epoch": 522} {"train_loss": -5.302534103393555, "global_step": 21955, "epoch": 522} {"train_loss": -5.301290512084961, "global_step": 21956, "epoch": 522} {"train_loss": -5.223359107971191, "global_step": 21957, "epoch": 522} {"train_loss": -5.297588348388672, "global_step": 21958, "epoch": 522} {"train_loss": -5.2562103271484375, "global_step": 21959, "epoch": 522} {"train_loss": -5.414679050445557, "global_step": 21960, "epoch": 522} {"train_loss": -5.351171970367432, "global_step": 21961, "epoch": 522} {"train_loss": -5.162321090698242, "global_step": 21962, "epoch": 522} {"train_loss": -5.340657711029053, "global_step": 21963, "epoch": 522} {"train_loss": -5.352382183074951, "global_step": 21964, "epoch": 522} {"train_loss": -5.306589614777338, "global_step": 21965, "epoch": 522, "val_loss": 75875.046875} {"train_loss": -5.385794639587402, "global_step": 21966, "epoch": 523} {"train_loss": -5.312806606292725, "global_step": 21967, "epoch": 523} {"train_loss": -5.4443678855896, "global_step": 21968, "epoch": 523} {"train_loss": -5.304460525512695, "global_step": 21969, "epoch": 523} {"train_loss": -5.356721878051758, "global_step": 21970, "epoch": 523} {"train_loss": -5.315291404724121, "global_step": 21971, "epoch": 523} {"train_loss": -5.348432540893555, "global_step": 21972, "epoch": 523} {"train_loss": -5.268441200256348, "global_step": 21973, "epoch": 523} {"train_loss": -5.44728946685791, "global_step": 21974, "epoch": 523} {"train_loss": -5.314875602722168, "global_step": 21975, "epoch": 523} {"train_loss": -5.296046257019043, "global_step": 21976, "epoch": 523} {"train_loss": -5.470986366271973, "global_step": 21977, "epoch": 523} {"train_loss": -5.383546352386475, "global_step": 21978, "epoch": 523} {"train_loss": -5.306333541870117, "global_step": 21979, "epoch": 523} {"train_loss": -5.3618316650390625, "global_step": 21980, "epoch": 523} {"train_loss": -5.3206892013549805, "global_step": 21981, "epoch": 523} {"train_loss": -5.38789176940918, "global_step": 21982, "epoch": 523} {"train_loss": -5.311370372772217, "global_step": 21983, "epoch": 523} {"train_loss": -5.384284496307373, "global_step": 21984, "epoch": 523} {"train_loss": -5.268865585327148, "global_step": 21985, "epoch": 523} {"train_loss": -5.306344032287598, "global_step": 21986, "epoch": 523} {"train_loss": -5.373167514801025, "global_step": 21987, "epoch": 523} {"train_loss": -5.262115478515625, "global_step": 21988, "epoch": 523} {"train_loss": -5.315845489501953, "global_step": 21989, "epoch": 523} {"train_loss": -5.308947563171387, "global_step": 21990, "epoch": 523} {"train_loss": -5.348299503326416, "global_step": 21991, "epoch": 523} {"train_loss": -5.369804382324219, "global_step": 21992, "epoch": 523} {"train_loss": -5.200464248657227, "global_step": 21993, "epoch": 523} {"train_loss": -5.410400390625, "global_step": 21994, "epoch": 523} {"train_loss": -5.236563682556152, "global_step": 21995, "epoch": 523} {"train_loss": -5.287726879119873, "global_step": 21996, "epoch": 523} {"train_loss": -5.283895969390869, "global_step": 21997, "epoch": 523} {"train_loss": -5.332520961761475, "global_step": 21998, "epoch": 523} {"train_loss": -5.352910041809082, "global_step": 21999, "epoch": 523} {"train_loss": -5.241100311279297, "global_step": 22000, "epoch": 523} {"train_loss": -5.162149906158447, "global_step": 22001, "epoch": 523} {"train_loss": -5.3199357986450195, "global_step": 22002, "epoch": 523} {"train_loss": -5.317893028259277, "global_step": 22003, "epoch": 523} {"train_loss": -5.388361930847168, "global_step": 22004, "epoch": 523} {"train_loss": -5.222482681274414, "global_step": 22005, "epoch": 523} {"train_loss": -5.293641090393066, "global_step": 22006, "epoch": 523} {"train_loss": -5.32533073425293, "global_step": 22007, "epoch": 523, "val_loss": 76594.9921875} {"train_loss": -5.363471031188965, "global_step": 22008, "epoch": 524} {"train_loss": -5.247325897216797, "global_step": 22009, "epoch": 524} {"train_loss": -5.316654682159424, "global_step": 22010, "epoch": 524} {"train_loss": -5.284178733825684, "global_step": 22011, "epoch": 524} {"train_loss": -5.338142395019531, "global_step": 22012, "epoch": 524} {"train_loss": -5.433201789855957, "global_step": 22013, "epoch": 524} {"train_loss": -5.359397888183594, "global_step": 22014, "epoch": 524} {"train_loss": -5.382435321807861, "global_step": 22015, "epoch": 524} {"train_loss": -5.36794376373291, "global_step": 22016, "epoch": 524} {"train_loss": -5.3401780128479, "global_step": 22017, "epoch": 524} {"train_loss": -5.309625625610352, "global_step": 22018, "epoch": 524} {"train_loss": -5.335155487060547, "global_step": 22019, "epoch": 524} {"train_loss": -5.293956756591797, "global_step": 22020, "epoch": 524} {"train_loss": -5.264450550079346, "global_step": 22021, "epoch": 524} {"train_loss": -5.32094669342041, "global_step": 22022, "epoch": 524} {"train_loss": -5.353281497955322, "global_step": 22023, "epoch": 524} {"train_loss": -5.268242835998535, "global_step": 22024, "epoch": 524} {"train_loss": -5.411065101623535, "global_step": 22025, "epoch": 524} {"train_loss": -5.436583518981934, "global_step": 22026, "epoch": 524} {"train_loss": -5.270373344421387, "global_step": 22027, "epoch": 524} {"train_loss": -5.388171672821045, "global_step": 22028, "epoch": 524} {"train_loss": -5.369709491729736, "global_step": 22029, "epoch": 524} {"train_loss": -5.413145542144775, "global_step": 22030, "epoch": 524} {"train_loss": -5.279684066772461, "global_step": 22031, "epoch": 524} {"train_loss": -5.391218185424805, "global_step": 22032, "epoch": 524} {"train_loss": -5.262955665588379, "global_step": 22033, "epoch": 524} {"train_loss": -5.266030311584473, "global_step": 22034, "epoch": 524} {"train_loss": -5.48657751083374, "global_step": 22035, "epoch": 524} {"train_loss": -5.352149963378906, "global_step": 22036, "epoch": 524} {"train_loss": -5.391445159912109, "global_step": 22037, "epoch": 524} {"train_loss": -5.38921594619751, "global_step": 22038, "epoch": 524} {"train_loss": -5.4242658615112305, "global_step": 22039, "epoch": 524} {"train_loss": -5.450362205505371, "global_step": 22040, "epoch": 524} {"train_loss": -5.302734851837158, "global_step": 22041, "epoch": 524} {"train_loss": -5.416223526000977, "global_step": 22042, "epoch": 524} {"train_loss": -5.349015712738037, "global_step": 22043, "epoch": 524} {"train_loss": -5.323376655578613, "global_step": 22044, "epoch": 524} {"train_loss": -5.424167633056641, "global_step": 22045, "epoch": 524} {"train_loss": -5.290190696716309, "global_step": 22046, "epoch": 524} {"train_loss": -5.246496677398682, "global_step": 22047, "epoch": 524} {"train_loss": -5.242300987243652, "global_step": 22048, "epoch": 524} {"train_loss": -5.3444090230124335, "global_step": 22049, "epoch": 524, "val_loss": 76071.4453125} {"train_loss": -5.32496452331543, "global_step": 22050, "epoch": 525} {"train_loss": -5.224370002746582, "global_step": 22051, "epoch": 525} {"train_loss": -5.334865093231201, "global_step": 22052, "epoch": 525} {"train_loss": -5.382010459899902, "global_step": 22053, "epoch": 525} {"train_loss": -5.349539756774902, "global_step": 22054, "epoch": 525} {"train_loss": -5.271795272827148, "global_step": 22055, "epoch": 525} {"train_loss": -5.329497337341309, "global_step": 22056, "epoch": 525} {"train_loss": -5.367667198181152, "global_step": 22057, "epoch": 525} {"train_loss": -5.300320625305176, "global_step": 22058, "epoch": 525} {"train_loss": -5.344127178192139, "global_step": 22059, "epoch": 525} {"train_loss": -5.352110385894775, "global_step": 22060, "epoch": 525} {"train_loss": -5.286364555358887, "global_step": 22061, "epoch": 525} {"train_loss": -5.559445858001709, "global_step": 22062, "epoch": 525} {"train_loss": -5.381992816925049, "global_step": 22063, "epoch": 525} {"train_loss": -5.3992791175842285, "global_step": 22064, "epoch": 525} {"train_loss": -5.315951347351074, "global_step": 22065, "epoch": 525} {"train_loss": -5.371177673339844, "global_step": 22066, "epoch": 525} {"train_loss": -5.331326484680176, "global_step": 22067, "epoch": 525} {"train_loss": -5.280256271362305, "global_step": 22068, "epoch": 525} {"train_loss": -5.37708854675293, "global_step": 22069, "epoch": 525} {"train_loss": -5.364758014678955, "global_step": 22070, "epoch": 525} {"train_loss": -5.22353458404541, "global_step": 22071, "epoch": 525} {"train_loss": -5.375272750854492, "global_step": 22072, "epoch": 525} {"train_loss": -5.213706970214844, "global_step": 22073, "epoch": 525} {"train_loss": -5.384856700897217, "global_step": 22074, "epoch": 525} {"train_loss": -5.261363983154297, "global_step": 22075, "epoch": 525} {"train_loss": -5.2620439529418945, "global_step": 22076, "epoch": 525} {"train_loss": -5.24349308013916, "global_step": 22077, "epoch": 525} {"train_loss": -5.427034378051758, "global_step": 22078, "epoch": 525} {"train_loss": -5.255036354064941, "global_step": 22079, "epoch": 525} {"train_loss": -5.318725109100342, "global_step": 22080, "epoch": 525} {"train_loss": -5.344023704528809, "global_step": 22081, "epoch": 525} {"train_loss": -5.438379764556885, "global_step": 22082, "epoch": 525} {"train_loss": -5.219124794006348, "global_step": 22083, "epoch": 525} {"train_loss": -5.292001724243164, "global_step": 22084, "epoch": 525} {"train_loss": -5.478646278381348, "global_step": 22085, "epoch": 525} {"train_loss": -5.274095058441162, "global_step": 22086, "epoch": 525} {"train_loss": -5.309442520141602, "global_step": 22087, "epoch": 525} {"train_loss": -5.43182373046875, "global_step": 22088, "epoch": 525} {"train_loss": -5.203782081604004, "global_step": 22089, "epoch": 525} {"train_loss": -5.380890846252441, "global_step": 22090, "epoch": 525} {"train_loss": -5.33200266247704, "global_step": 22091, "epoch": 525, "val_loss": 75906.859375} {"train_loss": -5.229032516479492, "global_step": 22092, "epoch": 526} {"train_loss": -5.311925888061523, "global_step": 22093, "epoch": 526} {"train_loss": -5.390413761138916, "global_step": 22094, "epoch": 526} {"train_loss": -5.4990620613098145, "global_step": 22095, "epoch": 526} {"train_loss": -5.190319538116455, "global_step": 22096, "epoch": 526} {"train_loss": -5.325831413269043, "global_step": 22097, "epoch": 526} {"train_loss": -5.4008708000183105, "global_step": 22098, "epoch": 526} {"train_loss": -5.241235733032227, "global_step": 22099, "epoch": 526} {"train_loss": -5.38729190826416, "global_step": 22100, "epoch": 526} {"train_loss": -5.235414505004883, "global_step": 22101, "epoch": 526} {"train_loss": -5.384129524230957, "global_step": 22102, "epoch": 526} {"train_loss": -5.382850646972656, "global_step": 22103, "epoch": 526} {"train_loss": -5.389249324798584, "global_step": 22104, "epoch": 526} {"train_loss": -5.301369667053223, "global_step": 22105, "epoch": 526} {"train_loss": -5.412946701049805, "global_step": 22106, "epoch": 526} {"train_loss": -5.325449466705322, "global_step": 22107, "epoch": 526} {"train_loss": -5.512790679931641, "global_step": 22108, "epoch": 526} {"train_loss": -5.269518852233887, "global_step": 22109, "epoch": 526} {"train_loss": -5.344095230102539, "global_step": 22110, "epoch": 526} {"train_loss": -5.3181562423706055, "global_step": 22111, "epoch": 526} {"train_loss": -5.2526936531066895, "global_step": 22112, "epoch": 526} {"train_loss": -5.2691497802734375, "global_step": 22113, "epoch": 526} {"train_loss": -5.291350841522217, "global_step": 22114, "epoch": 526} {"train_loss": -5.3838043212890625, "global_step": 22115, "epoch": 526} {"train_loss": -5.264678955078125, "global_step": 22116, "epoch": 526} {"train_loss": -5.309502601623535, "global_step": 22117, "epoch": 526} {"train_loss": -5.3278608322143555, "global_step": 22118, "epoch": 526} {"train_loss": -5.0394768714904785, "global_step": 22119, "epoch": 526} {"train_loss": -5.426873207092285, "global_step": 22120, "epoch": 526} {"train_loss": -5.265547752380371, "global_step": 22121, "epoch": 526} {"train_loss": -5.321653842926025, "global_step": 22122, "epoch": 526} {"train_loss": -5.364821434020996, "global_step": 22123, "epoch": 526} {"train_loss": -5.283778667449951, "global_step": 22124, "epoch": 526} {"train_loss": -5.255216598510742, "global_step": 22125, "epoch": 526} {"train_loss": -5.277416229248047, "global_step": 22126, "epoch": 526} {"train_loss": -5.424395561218262, "global_step": 22127, "epoch": 526} {"train_loss": -5.361515998840332, "global_step": 22128, "epoch": 526} {"train_loss": -5.351048469543457, "global_step": 22129, "epoch": 526} {"train_loss": -5.42741584777832, "global_step": 22130, "epoch": 526} {"train_loss": -5.410322189331055, "global_step": 22131, "epoch": 526} {"train_loss": -5.319705009460449, "global_step": 22132, "epoch": 526} {"train_loss": -5.3283335481371195, "global_step": 22133, "epoch": 526, "val_loss": 76345.484375} {"train_loss": -5.39669132232666, "global_step": 22134, "epoch": 527} {"train_loss": -5.3460540771484375, "global_step": 22135, "epoch": 527} {"train_loss": -5.412055969238281, "global_step": 22136, "epoch": 527} {"train_loss": -5.455991268157959, "global_step": 22137, "epoch": 527} {"train_loss": -5.335080623626709, "global_step": 22138, "epoch": 527} {"train_loss": -5.426730155944824, "global_step": 22139, "epoch": 527} {"train_loss": -5.368350505828857, "global_step": 22140, "epoch": 527} {"train_loss": -5.272434711456299, "global_step": 22141, "epoch": 527} {"train_loss": -5.357903003692627, "global_step": 22142, "epoch": 527} {"train_loss": -5.261878490447998, "global_step": 22143, "epoch": 527} {"train_loss": -5.273687362670898, "global_step": 22144, "epoch": 527} {"train_loss": -5.517437934875488, "global_step": 22145, "epoch": 527} {"train_loss": -5.195005416870117, "global_step": 22146, "epoch": 527} {"train_loss": -5.265526294708252, "global_step": 22147, "epoch": 527} {"train_loss": -5.379742622375488, "global_step": 22148, "epoch": 527} {"train_loss": -5.396344184875488, "global_step": 22149, "epoch": 527} {"train_loss": -5.281332492828369, "global_step": 22150, "epoch": 527} {"train_loss": -5.321418762207031, "global_step": 22151, "epoch": 527} {"train_loss": -5.128427505493164, "global_step": 22152, "epoch": 527} {"train_loss": -5.170131683349609, "global_step": 22153, "epoch": 527} {"train_loss": -5.259496212005615, "global_step": 22154, "epoch": 527} {"train_loss": -5.172873497009277, "global_step": 22155, "epoch": 527} {"train_loss": -5.396308422088623, "global_step": 22156, "epoch": 527} {"train_loss": -5.416966438293457, "global_step": 22157, "epoch": 527} {"train_loss": -5.215509414672852, "global_step": 22158, "epoch": 527} {"train_loss": -5.082807540893555, "global_step": 22159, "epoch": 527} {"train_loss": -5.2480854988098145, "global_step": 22160, "epoch": 527} {"train_loss": -5.279253005981445, "global_step": 22161, "epoch": 527} {"train_loss": -5.451842784881592, "global_step": 22162, "epoch": 527} {"train_loss": -5.312878608703613, "global_step": 22163, "epoch": 527} {"train_loss": -5.420614719390869, "global_step": 22164, "epoch": 527} {"train_loss": -5.456931114196777, "global_step": 22165, "epoch": 527} {"train_loss": -5.343016624450684, "global_step": 22166, "epoch": 527} {"train_loss": -5.218770980834961, "global_step": 22167, "epoch": 527} {"train_loss": -5.256275177001953, "global_step": 22168, "epoch": 527} {"train_loss": -5.237285614013672, "global_step": 22169, "epoch": 527} {"train_loss": -5.151778697967529, "global_step": 22170, "epoch": 527} {"train_loss": -5.216368675231934, "global_step": 22171, "epoch": 527} {"train_loss": -5.248579025268555, "global_step": 22172, "epoch": 527} {"train_loss": -5.285444259643555, "global_step": 22173, "epoch": 527} {"train_loss": -5.268049716949463, "global_step": 22174, "epoch": 527} {"train_loss": -5.305878707340786, "global_step": 22175, "epoch": 527, "val_loss": 76355.0703125} {"train_loss": -5.360893249511719, "global_step": 22176, "epoch": 528} {"train_loss": -5.365236282348633, "global_step": 22177, "epoch": 528} {"train_loss": -5.388628005981445, "global_step": 22178, "epoch": 528} {"train_loss": -5.180305480957031, "global_step": 22179, "epoch": 528} {"train_loss": -5.27140998840332, "global_step": 22180, "epoch": 528} {"train_loss": -5.385998249053955, "global_step": 22181, "epoch": 528} {"train_loss": -5.427259922027588, "global_step": 22182, "epoch": 528} {"train_loss": -5.203120231628418, "global_step": 22183, "epoch": 528} {"train_loss": -5.283422946929932, "global_step": 22184, "epoch": 528} {"train_loss": -5.370465278625488, "global_step": 22185, "epoch": 528} {"train_loss": -5.370495796203613, "global_step": 22186, "epoch": 528} {"train_loss": -5.225466728210449, "global_step": 22187, "epoch": 528} {"train_loss": -5.238460540771484, "global_step": 22188, "epoch": 528} {"train_loss": -5.314824104309082, "global_step": 22189, "epoch": 528} {"train_loss": -5.30340576171875, "global_step": 22190, "epoch": 528} {"train_loss": -5.1128950119018555, "global_step": 22191, "epoch": 528} {"train_loss": -5.409135341644287, "global_step": 22192, "epoch": 528} {"train_loss": -5.405905723571777, "global_step": 22193, "epoch": 528} {"train_loss": -5.245014190673828, "global_step": 22194, "epoch": 528} {"train_loss": -5.355677604675293, "global_step": 22195, "epoch": 528} {"train_loss": -5.406174659729004, "global_step": 22196, "epoch": 528} {"train_loss": -5.301220893859863, "global_step": 22197, "epoch": 528} {"train_loss": -5.296694278717041, "global_step": 22198, "epoch": 528} {"train_loss": -5.338616371154785, "global_step": 22199, "epoch": 528} {"train_loss": -5.459869384765625, "global_step": 22200, "epoch": 528} {"train_loss": -5.233099937438965, "global_step": 22201, "epoch": 528} {"train_loss": -5.218445777893066, "global_step": 22202, "epoch": 528} {"train_loss": -5.421082496643066, "global_step": 22203, "epoch": 528} {"train_loss": -5.358191013336182, "global_step": 22204, "epoch": 528} {"train_loss": -5.336130142211914, "global_step": 22205, "epoch": 528} {"train_loss": -5.377535343170166, "global_step": 22206, "epoch": 528} {"train_loss": -5.331817150115967, "global_step": 22207, "epoch": 528} {"train_loss": -5.417280197143555, "global_step": 22208, "epoch": 528} {"train_loss": -5.40527868270874, "global_step": 22209, "epoch": 528} {"train_loss": -5.323744773864746, "global_step": 22210, "epoch": 528} {"train_loss": -5.303686618804932, "global_step": 22211, "epoch": 528} {"train_loss": -5.275419235229492, "global_step": 22212, "epoch": 528} {"train_loss": -5.43607234954834, "global_step": 22213, "epoch": 528} {"train_loss": -5.3779826164245605, "global_step": 22214, "epoch": 528} {"train_loss": -5.236592769622803, "global_step": 22215, "epoch": 528} {"train_loss": -5.499752998352051, "global_step": 22216, "epoch": 528} {"train_loss": -5.331045048577445, "global_step": 22217, "epoch": 528, "val_loss": 76131.40625} {"train_loss": -5.443695068359375, "global_step": 22218, "epoch": 529} {"train_loss": -5.4900970458984375, "global_step": 22219, "epoch": 529} {"train_loss": -5.325836658477783, "global_step": 22220, "epoch": 529} {"train_loss": -5.347905158996582, "global_step": 22221, "epoch": 529} {"train_loss": -5.162346363067627, "global_step": 22222, "epoch": 529} {"train_loss": -5.297745704650879, "global_step": 22223, "epoch": 529} {"train_loss": -5.26589822769165, "global_step": 22224, "epoch": 529} {"train_loss": -5.293063163757324, "global_step": 22225, "epoch": 529} {"train_loss": -5.181319236755371, "global_step": 22226, "epoch": 529} {"train_loss": -5.384629726409912, "global_step": 22227, "epoch": 529} {"train_loss": -5.343199729919434, "global_step": 22228, "epoch": 529} {"train_loss": -5.362004280090332, "global_step": 22229, "epoch": 529} {"train_loss": -5.2810540199279785, "global_step": 22230, "epoch": 529} {"train_loss": -5.24876594543457, "global_step": 22231, "epoch": 529} {"train_loss": -5.262607574462891, "global_step": 22232, "epoch": 529} {"train_loss": -5.236626625061035, "global_step": 22233, "epoch": 529} {"train_loss": -5.323783874511719, "global_step": 22234, "epoch": 529} {"train_loss": -5.275025367736816, "global_step": 22235, "epoch": 529} {"train_loss": -5.407520294189453, "global_step": 22236, "epoch": 529} {"train_loss": -5.1532368659973145, "global_step": 22237, "epoch": 529} {"train_loss": -5.3141350746154785, "global_step": 22238, "epoch": 529} {"train_loss": -5.333313465118408, "global_step": 22239, "epoch": 529} {"train_loss": -5.189040184020996, "global_step": 22240, "epoch": 529} {"train_loss": -5.311783790588379, "global_step": 22241, "epoch": 529} {"train_loss": -5.203636646270752, "global_step": 22242, "epoch": 529} {"train_loss": -5.287600994110107, "global_step": 22243, "epoch": 529} {"train_loss": -5.280858993530273, "global_step": 22244, "epoch": 529} {"train_loss": -5.227708339691162, "global_step": 22245, "epoch": 529} {"train_loss": -5.423859119415283, "global_step": 22246, "epoch": 529} {"train_loss": -5.410534858703613, "global_step": 22247, "epoch": 529} {"train_loss": -5.457152366638184, "global_step": 22248, "epoch": 529} {"train_loss": -5.31690788269043, "global_step": 22249, "epoch": 529} {"train_loss": -5.360919952392578, "global_step": 22250, "epoch": 529} {"train_loss": -5.261607646942139, "global_step": 22251, "epoch": 529} {"train_loss": -5.208950042724609, "global_step": 22252, "epoch": 529} {"train_loss": -5.31282901763916, "global_step": 22253, "epoch": 529} {"train_loss": -5.298400402069092, "global_step": 22254, "epoch": 529} {"train_loss": -5.322099685668945, "global_step": 22255, "epoch": 529} {"train_loss": -5.376282691955566, "global_step": 22256, "epoch": 529} {"train_loss": -5.331047534942627, "global_step": 22257, "epoch": 529} {"train_loss": -5.476724624633789, "global_step": 22258, "epoch": 529} {"train_loss": -5.313748416446504, "global_step": 22259, "epoch": 529, "val_loss": 76602.109375} {"train_loss": -5.305490016937256, "global_step": 22260, "epoch": 530} {"train_loss": -5.280742645263672, "global_step": 22261, "epoch": 530} {"train_loss": -5.178567409515381, "global_step": 22262, "epoch": 530} {"train_loss": -5.411807060241699, "global_step": 22263, "epoch": 530} {"train_loss": -5.405944347381592, "global_step": 22264, "epoch": 530} {"train_loss": -5.260551452636719, "global_step": 22265, "epoch": 530} {"train_loss": -5.347203254699707, "global_step": 22266, "epoch": 530} {"train_loss": -5.268095970153809, "global_step": 22267, "epoch": 530} {"train_loss": -5.488455772399902, "global_step": 22268, "epoch": 530} {"train_loss": -5.42977237701416, "global_step": 22269, "epoch": 530} {"train_loss": -5.3817548751831055, "global_step": 22270, "epoch": 530} {"train_loss": -5.3002028465271, "global_step": 22271, "epoch": 530} {"train_loss": -5.34770393371582, "global_step": 22272, "epoch": 530} {"train_loss": -5.396928310394287, "global_step": 22273, "epoch": 530} {"train_loss": -5.322571754455566, "global_step": 22274, "epoch": 530} {"train_loss": -5.1717681884765625, "global_step": 22275, "epoch": 530} {"train_loss": -5.305102348327637, "global_step": 22276, "epoch": 530} {"train_loss": -5.4100799560546875, "global_step": 22277, "epoch": 530} {"train_loss": -5.295342445373535, "global_step": 22278, "epoch": 530} {"train_loss": -5.253258228302002, "global_step": 22279, "epoch": 530} {"train_loss": -5.38945198059082, "global_step": 22280, "epoch": 530} {"train_loss": -5.428704261779785, "global_step": 22281, "epoch": 530} {"train_loss": -5.152181148529053, "global_step": 22282, "epoch": 530} {"train_loss": -5.316450119018555, "global_step": 22283, "epoch": 530} {"train_loss": -5.488738059997559, "global_step": 22284, "epoch": 530} {"train_loss": -5.367504119873047, "global_step": 22285, "epoch": 530} {"train_loss": -5.326603889465332, "global_step": 22286, "epoch": 530} {"train_loss": -5.374019145965576, "global_step": 22287, "epoch": 530} {"train_loss": -5.294632434844971, "global_step": 22288, "epoch": 530} {"train_loss": -5.376405239105225, "global_step": 22289, "epoch": 530} {"train_loss": -5.376324653625488, "global_step": 22290, "epoch": 530} {"train_loss": -5.412178993225098, "global_step": 22291, "epoch": 530} {"train_loss": -5.3755693435668945, "global_step": 22292, "epoch": 530} {"train_loss": -5.442047119140625, "global_step": 22293, "epoch": 530} {"train_loss": -5.368405342102051, "global_step": 22294, "epoch": 530} {"train_loss": -5.389033317565918, "global_step": 22295, "epoch": 530} {"train_loss": -5.237573623657227, "global_step": 22296, "epoch": 530} {"train_loss": -5.417901992797852, "global_step": 22297, "epoch": 530} {"train_loss": -5.384429931640625, "global_step": 22298, "epoch": 530} {"train_loss": -5.293548583984375, "global_step": 22299, "epoch": 530} {"train_loss": -5.336489677429199, "global_step": 22300, "epoch": 530} {"train_loss": -5.343806141898746, "global_step": 22301, "epoch": 530, "val_loss": 76295.640625} {"train_loss": -5.179015159606934, "global_step": 22302, "epoch": 531} {"train_loss": -5.275132179260254, "global_step": 22303, "epoch": 531} {"train_loss": -5.349977493286133, "global_step": 22304, "epoch": 531} {"train_loss": -5.32939338684082, "global_step": 22305, "epoch": 531} {"train_loss": -5.044504642486572, "global_step": 22306, "epoch": 531} {"train_loss": -5.313558578491211, "global_step": 22307, "epoch": 531} {"train_loss": -5.284188270568848, "global_step": 22308, "epoch": 531} {"train_loss": -5.24772834777832, "global_step": 22309, "epoch": 531} {"train_loss": -5.432051658630371, "global_step": 22310, "epoch": 531} {"train_loss": -5.241249084472656, "global_step": 22311, "epoch": 531} {"train_loss": -5.336212158203125, "global_step": 22312, "epoch": 531} {"train_loss": -5.347428321838379, "global_step": 22313, "epoch": 531} {"train_loss": -5.2677764892578125, "global_step": 22314, "epoch": 531} {"train_loss": -5.262413024902344, "global_step": 22315, "epoch": 531} {"train_loss": -5.2692952156066895, "global_step": 22316, "epoch": 531} {"train_loss": -5.338142395019531, "global_step": 22317, "epoch": 531} {"train_loss": -5.302001953125, "global_step": 22318, "epoch": 531} {"train_loss": -5.354407787322998, "global_step": 22319, "epoch": 531} {"train_loss": -5.238692283630371, "global_step": 22320, "epoch": 531} {"train_loss": -5.309109687805176, "global_step": 22321, "epoch": 531} {"train_loss": -5.253439903259277, "global_step": 22322, "epoch": 531} {"train_loss": -5.325141429901123, "global_step": 22323, "epoch": 531} {"train_loss": -5.340244293212891, "global_step": 22324, "epoch": 531} {"train_loss": -5.223257064819336, "global_step": 22325, "epoch": 531} {"train_loss": -5.276209831237793, "global_step": 22326, "epoch": 531} {"train_loss": -5.3022637367248535, "global_step": 22327, "epoch": 531} {"train_loss": -5.047066688537598, "global_step": 22328, "epoch": 531} {"train_loss": -5.4709978103637695, "global_step": 22329, "epoch": 531} {"train_loss": -5.295221328735352, "global_step": 22330, "epoch": 531} {"train_loss": -5.373130798339844, "global_step": 22331, "epoch": 531} {"train_loss": -5.291220664978027, "global_step": 22332, "epoch": 531} {"train_loss": -5.3993706703186035, "global_step": 22333, "epoch": 531} {"train_loss": -5.11379861831665, "global_step": 22334, "epoch": 531} {"train_loss": -5.328296661376953, "global_step": 22335, "epoch": 531} {"train_loss": -5.299724578857422, "global_step": 22336, "epoch": 531} {"train_loss": -5.334436416625977, "global_step": 22337, "epoch": 531} {"train_loss": -5.241622447967529, "global_step": 22338, "epoch": 531} {"train_loss": -5.191727161407471, "global_step": 22339, "epoch": 531} {"train_loss": -5.339062690734863, "global_step": 22340, "epoch": 531} {"train_loss": -5.346354961395264, "global_step": 22341, "epoch": 531} {"train_loss": -5.456803321838379, "global_step": 22342, "epoch": 531} {"train_loss": -5.292287451880319, "global_step": 22343, "epoch": 531, "val_loss": 76598.484375} {"train_loss": -5.382801055908203, "global_step": 22344, "epoch": 532} {"train_loss": -5.25004768371582, "global_step": 22345, "epoch": 532} {"train_loss": -5.352425575256348, "global_step": 22346, "epoch": 532} {"train_loss": -5.434186935424805, "global_step": 22347, "epoch": 532} {"train_loss": -5.3114094734191895, "global_step": 22348, "epoch": 532} {"train_loss": -5.309849262237549, "global_step": 22349, "epoch": 532} {"train_loss": -5.268582344055176, "global_step": 22350, "epoch": 532} {"train_loss": -5.368490695953369, "global_step": 22351, "epoch": 532} {"train_loss": -5.290436744689941, "global_step": 22352, "epoch": 532} {"train_loss": -5.374471664428711, "global_step": 22353, "epoch": 532} {"train_loss": -5.267704010009766, "global_step": 22354, "epoch": 532} {"train_loss": -5.392892837524414, "global_step": 22355, "epoch": 532} {"train_loss": -5.229804039001465, "global_step": 22356, "epoch": 532} {"train_loss": -5.327320575714111, "global_step": 22357, "epoch": 532} {"train_loss": -5.260141372680664, "global_step": 22358, "epoch": 532} {"train_loss": -5.25946569442749, "global_step": 22359, "epoch": 532} {"train_loss": -5.269896507263184, "global_step": 22360, "epoch": 532} {"train_loss": -5.326056003570557, "global_step": 22361, "epoch": 532} {"train_loss": -5.2884979248046875, "global_step": 22362, "epoch": 532} {"train_loss": -5.372340202331543, "global_step": 22363, "epoch": 532} {"train_loss": -5.347853660583496, "global_step": 22364, "epoch": 532} {"train_loss": -5.369668960571289, "global_step": 22365, "epoch": 532} {"train_loss": -5.410521030426025, "global_step": 22366, "epoch": 532} {"train_loss": -5.385019302368164, "global_step": 22367, "epoch": 532} {"train_loss": -5.234864234924316, "global_step": 22368, "epoch": 532} {"train_loss": -5.304449558258057, "global_step": 22369, "epoch": 532} {"train_loss": -5.505051136016846, "global_step": 22370, "epoch": 532} {"train_loss": -5.234762191772461, "global_step": 22371, "epoch": 532} {"train_loss": -5.181708812713623, "global_step": 22372, "epoch": 532} {"train_loss": -5.444901466369629, "global_step": 22373, "epoch": 532} {"train_loss": -5.272853374481201, "global_step": 22374, "epoch": 532} {"train_loss": -5.125131130218506, "global_step": 22375, "epoch": 532} {"train_loss": -5.368976593017578, "global_step": 22376, "epoch": 532} {"train_loss": -5.24360466003418, "global_step": 22377, "epoch": 532} {"train_loss": -5.379711151123047, "global_step": 22378, "epoch": 532} {"train_loss": -5.299990177154541, "global_step": 22379, "epoch": 532} {"train_loss": -5.257700443267822, "global_step": 22380, "epoch": 532} {"train_loss": -5.413409233093262, "global_step": 22381, "epoch": 532} {"train_loss": -5.358674049377441, "global_step": 22382, "epoch": 532} {"train_loss": -5.27391242980957, "global_step": 22383, "epoch": 532} {"train_loss": -5.375514507293701, "global_step": 22384, "epoch": 532} {"train_loss": -5.320006109419323, "global_step": 22385, "epoch": 532, "val_loss": 76174.3984375} {"train_loss": -5.302984714508057, "global_step": 22386, "epoch": 533} {"train_loss": -5.297684669494629, "global_step": 22387, "epoch": 533} {"train_loss": -5.27125883102417, "global_step": 22388, "epoch": 533} {"train_loss": -5.356316566467285, "global_step": 22389, "epoch": 533} {"train_loss": -5.243997573852539, "global_step": 22390, "epoch": 533} {"train_loss": -5.500301361083984, "global_step": 22391, "epoch": 533} {"train_loss": -5.276832103729248, "global_step": 22392, "epoch": 533} {"train_loss": -5.430412769317627, "global_step": 22393, "epoch": 533} {"train_loss": -5.331765651702881, "global_step": 22394, "epoch": 533} {"train_loss": -5.353845596313477, "global_step": 22395, "epoch": 533} {"train_loss": -5.3553338050842285, "global_step": 22396, "epoch": 533} {"train_loss": -5.223640441894531, "global_step": 22397, "epoch": 533} {"train_loss": -5.346173286437988, "global_step": 22398, "epoch": 533} {"train_loss": -5.439021110534668, "global_step": 22399, "epoch": 533} {"train_loss": -5.4930572509765625, "global_step": 22400, "epoch": 533} {"train_loss": -5.303102493286133, "global_step": 22401, "epoch": 533} {"train_loss": -5.40613317489624, "global_step": 22402, "epoch": 533} {"train_loss": -5.377538204193115, "global_step": 22403, "epoch": 533} {"train_loss": -5.271241188049316, "global_step": 22404, "epoch": 533} {"train_loss": -5.274985313415527, "global_step": 22405, "epoch": 533} {"train_loss": -5.244363307952881, "global_step": 22406, "epoch": 533} {"train_loss": -5.274323463439941, "global_step": 22407, "epoch": 533} {"train_loss": -5.3698883056640625, "global_step": 22408, "epoch": 533} {"train_loss": -5.195727348327637, "global_step": 22409, "epoch": 533} {"train_loss": -5.2553300857543945, "global_step": 22410, "epoch": 533} {"train_loss": -5.276118755340576, "global_step": 22411, "epoch": 533} {"train_loss": -5.205777168273926, "global_step": 22412, "epoch": 533} {"train_loss": -5.310366630554199, "global_step": 22413, "epoch": 533} {"train_loss": -5.343866348266602, "global_step": 22414, "epoch": 533} {"train_loss": -5.2846574783325195, "global_step": 22415, "epoch": 533} {"train_loss": -5.1640119552612305, "global_step": 22416, "epoch": 533} {"train_loss": -5.4782328605651855, "global_step": 22417, "epoch": 533} {"train_loss": -5.331977844238281, "global_step": 22418, "epoch": 533} {"train_loss": -5.3354973793029785, "global_step": 22419, "epoch": 533} {"train_loss": -5.404302597045898, "global_step": 22420, "epoch": 533} {"train_loss": -5.298542022705078, "global_step": 22421, "epoch": 533} {"train_loss": -5.373887538909912, "global_step": 22422, "epoch": 533} {"train_loss": -5.335330963134766, "global_step": 22423, "epoch": 533} {"train_loss": -5.255520820617676, "global_step": 22424, "epoch": 533} {"train_loss": -5.231866359710693, "global_step": 22425, "epoch": 533} {"train_loss": -5.399450302124023, "global_step": 22426, "epoch": 533} {"train_loss": -5.323909282684326, "global_step": 22427, "epoch": 533, "val_loss": 76030.8671875} {"train_loss": -5.344851493835449, "global_step": 22428, "epoch": 534} {"train_loss": -5.1826982498168945, "global_step": 22429, "epoch": 534} {"train_loss": -5.244472503662109, "global_step": 22430, "epoch": 534} {"train_loss": -5.494909286499023, "global_step": 22431, "epoch": 534} {"train_loss": -5.4754486083984375, "global_step": 22432, "epoch": 534} {"train_loss": -5.316213130950928, "global_step": 22433, "epoch": 534} {"train_loss": -5.216801166534424, "global_step": 22434, "epoch": 534} {"train_loss": -5.427931785583496, "global_step": 22435, "epoch": 534} {"train_loss": -5.318454742431641, "global_step": 22436, "epoch": 534} {"train_loss": -5.289898872375488, "global_step": 22437, "epoch": 534} {"train_loss": -5.333606719970703, "global_step": 22438, "epoch": 534} {"train_loss": -5.19407844543457, "global_step": 22439, "epoch": 534} {"train_loss": -5.201832294464111, "global_step": 22440, "epoch": 534} {"train_loss": -5.272853851318359, "global_step": 22441, "epoch": 534} {"train_loss": -5.128755569458008, "global_step": 22442, "epoch": 534} {"train_loss": -5.264495372772217, "global_step": 22443, "epoch": 534} {"train_loss": -5.178962707519531, "global_step": 22444, "epoch": 534} {"train_loss": -5.12845516204834, "global_step": 22445, "epoch": 534} {"train_loss": -5.212379455566406, "global_step": 22446, "epoch": 534} {"train_loss": -5.233085632324219, "global_step": 22447, "epoch": 534} {"train_loss": -5.351341247558594, "global_step": 22448, "epoch": 534} {"train_loss": -5.161782264709473, "global_step": 22449, "epoch": 534} {"train_loss": -5.322792053222656, "global_step": 22450, "epoch": 534} {"train_loss": -5.274624347686768, "global_step": 22451, "epoch": 534} {"train_loss": -5.209366321563721, "global_step": 22452, "epoch": 534} {"train_loss": -5.288477897644043, "global_step": 22453, "epoch": 534} {"train_loss": -5.2431840896606445, "global_step": 22454, "epoch": 534} {"train_loss": -5.376053810119629, "global_step": 22455, "epoch": 534} {"train_loss": -5.245859146118164, "global_step": 22456, "epoch": 534} {"train_loss": -5.251523494720459, "global_step": 22457, "epoch": 534} {"train_loss": -5.275054931640625, "global_step": 22458, "epoch": 534} {"train_loss": -5.397728443145752, "global_step": 22459, "epoch": 534} {"train_loss": -5.269904136657715, "global_step": 22460, "epoch": 534} {"train_loss": -5.270913124084473, "global_step": 22461, "epoch": 534} {"train_loss": -5.276383399963379, "global_step": 22462, "epoch": 534} {"train_loss": -5.5067315101623535, "global_step": 22463, "epoch": 534} {"train_loss": -5.399543762207031, "global_step": 22464, "epoch": 534} {"train_loss": -5.323241710662842, "global_step": 22465, "epoch": 534} {"train_loss": -5.245027542114258, "global_step": 22466, "epoch": 534} {"train_loss": -5.285260200500488, "global_step": 22467, "epoch": 534} {"train_loss": -5.47951602935791, "global_step": 22468, "epoch": 534} {"train_loss": -5.29279146875654, "global_step": 22469, "epoch": 534, "val_loss": 76406.609375} {"train_loss": -5.306237697601318, "global_step": 22470, "epoch": 535} {"train_loss": -5.283777236938477, "global_step": 22471, "epoch": 535} {"train_loss": -5.3675432205200195, "global_step": 22472, "epoch": 535} {"train_loss": -5.259267330169678, "global_step": 22473, "epoch": 535} {"train_loss": -5.340517997741699, "global_step": 22474, "epoch": 535} {"train_loss": -5.464558124542236, "global_step": 22475, "epoch": 535} {"train_loss": -5.420426368713379, "global_step": 22476, "epoch": 535} {"train_loss": -5.347917556762695, "global_step": 22477, "epoch": 535} {"train_loss": -5.332054138183594, "global_step": 22478, "epoch": 535} {"train_loss": -5.259040355682373, "global_step": 22479, "epoch": 535} {"train_loss": -5.360463619232178, "global_step": 22480, "epoch": 535} {"train_loss": -5.143734931945801, "global_step": 22481, "epoch": 535} {"train_loss": -5.333377361297607, "global_step": 22482, "epoch": 535} {"train_loss": -5.3204498291015625, "global_step": 22483, "epoch": 535} {"train_loss": -5.325448989868164, "global_step": 22484, "epoch": 535} {"train_loss": -5.180416107177734, "global_step": 22485, "epoch": 535} {"train_loss": -5.469864845275879, "global_step": 22486, "epoch": 535} {"train_loss": -5.381496906280518, "global_step": 22487, "epoch": 535} {"train_loss": -5.41133975982666, "global_step": 22488, "epoch": 535} {"train_loss": -5.521546363830566, "global_step": 22489, "epoch": 535} {"train_loss": -5.313356399536133, "global_step": 22490, "epoch": 535} {"train_loss": -5.341656684875488, "global_step": 22491, "epoch": 535} {"train_loss": -5.309015274047852, "global_step": 22492, "epoch": 535} {"train_loss": -5.329862594604492, "global_step": 22493, "epoch": 535} {"train_loss": -5.401275634765625, "global_step": 22494, "epoch": 535} {"train_loss": -5.31455659866333, "global_step": 22495, "epoch": 535} {"train_loss": -5.452299118041992, "global_step": 22496, "epoch": 535} {"train_loss": -5.210165023803711, "global_step": 22497, "epoch": 535} {"train_loss": -5.468151092529297, "global_step": 22498, "epoch": 535} {"train_loss": -5.275322914123535, "global_step": 22499, "epoch": 535} {"train_loss": -5.4740214347839355, "global_step": 22500, "epoch": 535} {"train_loss": -5.258450508117676, "global_step": 22501, "epoch": 535} {"train_loss": -5.443272590637207, "global_step": 22502, "epoch": 535} {"train_loss": -5.224487781524658, "global_step": 22503, "epoch": 535} {"train_loss": -5.331365585327148, "global_step": 22504, "epoch": 535} {"train_loss": -5.32243013381958, "global_step": 22505, "epoch": 535} {"train_loss": -5.406874179840088, "global_step": 22506, "epoch": 535} {"train_loss": -5.31870174407959, "global_step": 22507, "epoch": 535} {"train_loss": -5.463099479675293, "global_step": 22508, "epoch": 535} {"train_loss": -5.36955451965332, "global_step": 22509, "epoch": 535} {"train_loss": -5.338101863861084, "global_step": 22510, "epoch": 535} {"train_loss": -5.34643232254755, "global_step": 22511, "epoch": 535, "val_loss": 76865.734375} {"train_loss": -5.303896903991699, "global_step": 22512, "epoch": 536} {"train_loss": -5.430970191955566, "global_step": 22513, "epoch": 536} {"train_loss": -5.37609338760376, "global_step": 22514, "epoch": 536} {"train_loss": -5.169417381286621, "global_step": 22515, "epoch": 536} {"train_loss": -5.2814531326293945, "global_step": 22516, "epoch": 536} {"train_loss": -5.343969821929932, "global_step": 22517, "epoch": 536} {"train_loss": -5.244697570800781, "global_step": 22518, "epoch": 536} {"train_loss": -5.343563079833984, "global_step": 22519, "epoch": 536} {"train_loss": -5.2973456382751465, "global_step": 22520, "epoch": 536} {"train_loss": -5.571722507476807, "global_step": 22521, "epoch": 536} {"train_loss": -5.340738296508789, "global_step": 22522, "epoch": 536} {"train_loss": -5.142966270446777, "global_step": 22523, "epoch": 536} {"train_loss": -5.573533058166504, "global_step": 22524, "epoch": 536} {"train_loss": -5.284725666046143, "global_step": 22525, "epoch": 536} {"train_loss": -5.2899298667907715, "global_step": 22526, "epoch": 536} {"train_loss": -5.248951435089111, "global_step": 22527, "epoch": 536} {"train_loss": -5.463109016418457, "global_step": 22528, "epoch": 536} {"train_loss": -5.4255547523498535, "global_step": 22529, "epoch": 536} {"train_loss": -5.304584503173828, "global_step": 22530, "epoch": 536} {"train_loss": -5.357720375061035, "global_step": 22531, "epoch": 536} {"train_loss": -5.294000148773193, "global_step": 22532, "epoch": 536} {"train_loss": -5.232423782348633, "global_step": 22533, "epoch": 536} {"train_loss": -5.4473724365234375, "global_step": 22534, "epoch": 536} {"train_loss": -5.244691371917725, "global_step": 22535, "epoch": 536} {"train_loss": -5.235123157501221, "global_step": 22536, "epoch": 536} {"train_loss": -5.330704689025879, "global_step": 22537, "epoch": 536} {"train_loss": -5.163352966308594, "global_step": 22538, "epoch": 536} {"train_loss": -5.361666679382324, "global_step": 22539, "epoch": 536} {"train_loss": -5.386745452880859, "global_step": 22540, "epoch": 536} {"train_loss": -5.2424516677856445, "global_step": 22541, "epoch": 536} {"train_loss": -5.279574394226074, "global_step": 22542, "epoch": 536} {"train_loss": -5.33100700378418, "global_step": 22543, "epoch": 536} {"train_loss": -5.263744354248047, "global_step": 22544, "epoch": 536} {"train_loss": -5.191333770751953, "global_step": 22545, "epoch": 536} {"train_loss": -5.402600288391113, "global_step": 22546, "epoch": 536} {"train_loss": -5.40582275390625, "global_step": 22547, "epoch": 536} {"train_loss": -5.37431526184082, "global_step": 22548, "epoch": 536} {"train_loss": -5.226998329162598, "global_step": 22549, "epoch": 536} {"train_loss": -5.291379928588867, "global_step": 22550, "epoch": 536} {"train_loss": -5.314340591430664, "global_step": 22551, "epoch": 536} {"train_loss": -5.336154937744141, "global_step": 22552, "epoch": 536} {"train_loss": -5.316989092599778, "global_step": 22553, "epoch": 536, "val_loss": 76213.7890625} {"train_loss": -5.3209452629089355, "global_step": 22554, "epoch": 537} {"train_loss": -5.3251729011535645, "global_step": 22555, "epoch": 537} {"train_loss": -5.389983654022217, "global_step": 22556, "epoch": 537} {"train_loss": -5.4586076736450195, "global_step": 22557, "epoch": 537} {"train_loss": -5.344356536865234, "global_step": 22558, "epoch": 537} {"train_loss": -5.397485256195068, "global_step": 22559, "epoch": 537} {"train_loss": -5.191144943237305, "global_step": 22560, "epoch": 537} {"train_loss": -5.423604965209961, "global_step": 22561, "epoch": 537} {"train_loss": -5.328791618347168, "global_step": 22562, "epoch": 537} {"train_loss": -5.256074905395508, "global_step": 22563, "epoch": 537} {"train_loss": -5.444103240966797, "global_step": 22564, "epoch": 537} {"train_loss": -5.35561466217041, "global_step": 22565, "epoch": 537} {"train_loss": -5.441919326782227, "global_step": 22566, "epoch": 537} {"train_loss": -5.499053001403809, "global_step": 22567, "epoch": 537} {"train_loss": -5.318342685699463, "global_step": 22568, "epoch": 537} {"train_loss": -5.208335876464844, "global_step": 22569, "epoch": 537} {"train_loss": -5.509273529052734, "global_step": 22570, "epoch": 537} {"train_loss": -5.283965110778809, "global_step": 22571, "epoch": 537} {"train_loss": -5.411061763763428, "global_step": 22572, "epoch": 537} {"train_loss": -5.348227500915527, "global_step": 22573, "epoch": 537} {"train_loss": -5.493781089782715, "global_step": 22574, "epoch": 537} {"train_loss": -5.35368537902832, "global_step": 22575, "epoch": 537} {"train_loss": -5.238576889038086, "global_step": 22576, "epoch": 537} {"train_loss": -5.381333351135254, "global_step": 22577, "epoch": 537} {"train_loss": -5.4184417724609375, "global_step": 22578, "epoch": 537} {"train_loss": -5.215000152587891, "global_step": 22579, "epoch": 537} {"train_loss": -5.404899597167969, "global_step": 22580, "epoch": 537} {"train_loss": -5.290831089019775, "global_step": 22581, "epoch": 537} {"train_loss": -5.194744110107422, "global_step": 22582, "epoch": 537} {"train_loss": -5.407512664794922, "global_step": 22583, "epoch": 537} {"train_loss": -5.326234817504883, "global_step": 22584, "epoch": 537} {"train_loss": -5.278731822967529, "global_step": 22585, "epoch": 537} {"train_loss": -5.329427719116211, "global_step": 22586, "epoch": 537} {"train_loss": -5.294544219970703, "global_step": 22587, "epoch": 537} {"train_loss": -5.213946342468262, "global_step": 22588, "epoch": 537} {"train_loss": -5.457658290863037, "global_step": 22589, "epoch": 537} {"train_loss": -5.405707359313965, "global_step": 22590, "epoch": 537} {"train_loss": -5.325708866119385, "global_step": 22591, "epoch": 537} {"train_loss": -5.360946178436279, "global_step": 22592, "epoch": 537} {"train_loss": -5.285250663757324, "global_step": 22593, "epoch": 537} {"train_loss": -5.526431560516357, "global_step": 22594, "epoch": 537} {"train_loss": -5.353181225912912, "global_step": 22595, "epoch": 537, "val_loss": 76219.703125} {"train_loss": -5.293552398681641, "global_step": 22596, "epoch": 538} {"train_loss": -5.448262691497803, "global_step": 22597, "epoch": 538} {"train_loss": -5.386628150939941, "global_step": 22598, "epoch": 538} {"train_loss": -5.427850723266602, "global_step": 22599, "epoch": 538} {"train_loss": -5.294189453125, "global_step": 22600, "epoch": 538} {"train_loss": -5.396313667297363, "global_step": 22601, "epoch": 538} {"train_loss": -5.284390449523926, "global_step": 22602, "epoch": 538} {"train_loss": -5.216001033782959, "global_step": 22603, "epoch": 538} {"train_loss": -5.203225135803223, "global_step": 22604, "epoch": 538} {"train_loss": -5.280508995056152, "global_step": 22605, "epoch": 538} {"train_loss": -5.261518478393555, "global_step": 22606, "epoch": 538} {"train_loss": -5.358969688415527, "global_step": 22607, "epoch": 538} {"train_loss": -5.3386125564575195, "global_step": 22608, "epoch": 538} {"train_loss": -5.3026885986328125, "global_step": 22609, "epoch": 538} {"train_loss": -5.358351707458496, "global_step": 22610, "epoch": 538} {"train_loss": -5.394770622253418, "global_step": 22611, "epoch": 538} {"train_loss": -5.424466133117676, "global_step": 22612, "epoch": 538} {"train_loss": -5.430622100830078, "global_step": 22613, "epoch": 538} {"train_loss": -5.254212379455566, "global_step": 22614, "epoch": 538} {"train_loss": -5.373924255371094, "global_step": 22615, "epoch": 538} {"train_loss": -5.381114482879639, "global_step": 22616, "epoch": 538} {"train_loss": -5.287361145019531, "global_step": 22617, "epoch": 538} {"train_loss": -5.2407331466674805, "global_step": 22618, "epoch": 538} {"train_loss": -5.257402420043945, "global_step": 22619, "epoch": 538} {"train_loss": -5.4163103103637695, "global_step": 22620, "epoch": 538} {"train_loss": -5.161219596862793, "global_step": 22621, "epoch": 538} {"train_loss": -5.343503952026367, "global_step": 22622, "epoch": 538} {"train_loss": -5.289763450622559, "global_step": 22623, "epoch": 538} {"train_loss": -5.120870590209961, "global_step": 22624, "epoch": 538} {"train_loss": -5.173087120056152, "global_step": 22625, "epoch": 538} {"train_loss": -5.104089736938477, "global_step": 22626, "epoch": 538} {"train_loss": -5.249454975128174, "global_step": 22627, "epoch": 538} {"train_loss": -5.159372329711914, "global_step": 22628, "epoch": 538} {"train_loss": -5.160256385803223, "global_step": 22629, "epoch": 538} {"train_loss": -5.23432731628418, "global_step": 22630, "epoch": 538} {"train_loss": -5.194891929626465, "global_step": 22631, "epoch": 538} {"train_loss": -5.281497955322266, "global_step": 22632, "epoch": 538} {"train_loss": -5.355980396270752, "global_step": 22633, "epoch": 538} {"train_loss": -5.241786003112793, "global_step": 22634, "epoch": 538} {"train_loss": -5.276236057281494, "global_step": 22635, "epoch": 538} {"train_loss": -5.382748126983643, "global_step": 22636, "epoch": 538} {"train_loss": -5.292437167394729, "global_step": 22637, "epoch": 538, "val_loss": 76222.3984375} {"train_loss": -5.250967025756836, "global_step": 22638, "epoch": 539} {"train_loss": -5.386713981628418, "global_step": 22639, "epoch": 539} {"train_loss": -5.304323196411133, "global_step": 22640, "epoch": 539} {"train_loss": -5.333593368530273, "global_step": 22641, "epoch": 539} {"train_loss": -5.304107666015625, "global_step": 22642, "epoch": 539} {"train_loss": -5.353206634521484, "global_step": 22643, "epoch": 539} {"train_loss": -5.353532791137695, "global_step": 22644, "epoch": 539} {"train_loss": -5.245799541473389, "global_step": 22645, "epoch": 539} {"train_loss": -5.355991363525391, "global_step": 22646, "epoch": 539} {"train_loss": -5.3054938316345215, "global_step": 22647, "epoch": 539} {"train_loss": -5.398820877075195, "global_step": 22648, "epoch": 539} {"train_loss": -5.406863689422607, "global_step": 22649, "epoch": 539} {"train_loss": -5.353899002075195, "global_step": 22650, "epoch": 539} {"train_loss": -5.2445268630981445, "global_step": 22651, "epoch": 539} {"train_loss": -5.3371710777282715, "global_step": 22652, "epoch": 539} {"train_loss": -5.346872806549072, "global_step": 22653, "epoch": 539} {"train_loss": -5.197700500488281, "global_step": 22654, "epoch": 539} {"train_loss": -5.344758987426758, "global_step": 22655, "epoch": 539} {"train_loss": -5.3015360832214355, "global_step": 22656, "epoch": 539} {"train_loss": -5.216467380523682, "global_step": 22657, "epoch": 539} {"train_loss": -5.185094833374023, "global_step": 22658, "epoch": 539} {"train_loss": -5.365386009216309, "global_step": 22659, "epoch": 539} {"train_loss": -5.261151313781738, "global_step": 22660, "epoch": 539} {"train_loss": -5.298868179321289, "global_step": 22661, "epoch": 539} {"train_loss": -5.338106155395508, "global_step": 22662, "epoch": 539} {"train_loss": -5.348060607910156, "global_step": 22663, "epoch": 539} {"train_loss": -5.255395412445068, "global_step": 22664, "epoch": 539} {"train_loss": -5.423542022705078, "global_step": 22665, "epoch": 539} {"train_loss": -5.278985023498535, "global_step": 22666, "epoch": 539} {"train_loss": -5.27720308303833, "global_step": 22667, "epoch": 539} {"train_loss": -5.408271789550781, "global_step": 22668, "epoch": 539} {"train_loss": -5.245419025421143, "global_step": 22669, "epoch": 539} {"train_loss": -5.302698135375977, "global_step": 22670, "epoch": 539} {"train_loss": -5.306375026702881, "global_step": 22671, "epoch": 539} {"train_loss": -5.503795623779297, "global_step": 22672, "epoch": 539} {"train_loss": -5.338753700256348, "global_step": 22673, "epoch": 539} {"train_loss": -5.383296966552734, "global_step": 22674, "epoch": 539} {"train_loss": -5.384321212768555, "global_step": 22675, "epoch": 539} {"train_loss": -5.275012016296387, "global_step": 22676, "epoch": 539} {"train_loss": -5.304669380187988, "global_step": 22677, "epoch": 539} {"train_loss": -5.354343414306641, "global_step": 22678, "epoch": 539} {"train_loss": -5.3230349109286355, "global_step": 22679, "epoch": 539, "val_loss": 76087.6953125} {"train_loss": -5.450547218322754, "global_step": 22680, "epoch": 540} {"train_loss": -5.294200897216797, "global_step": 22681, "epoch": 540} {"train_loss": -5.322592735290527, "global_step": 22682, "epoch": 540} {"train_loss": -5.4577226638793945, "global_step": 22683, "epoch": 540} {"train_loss": -5.298969268798828, "global_step": 22684, "epoch": 540} {"train_loss": -5.414073944091797, "global_step": 22685, "epoch": 540} {"train_loss": -5.423803806304932, "global_step": 22686, "epoch": 540} {"train_loss": -5.477867126464844, "global_step": 22687, "epoch": 540} {"train_loss": -5.251949310302734, "global_step": 22688, "epoch": 540} {"train_loss": -5.335701942443848, "global_step": 22689, "epoch": 540} {"train_loss": -5.342280387878418, "global_step": 22690, "epoch": 540} {"train_loss": -5.3761138916015625, "global_step": 22691, "epoch": 540} {"train_loss": -5.218425750732422, "global_step": 22692, "epoch": 540} {"train_loss": -5.308351039886475, "global_step": 22693, "epoch": 540} {"train_loss": -5.37788724899292, "global_step": 22694, "epoch": 540} {"train_loss": -5.372976303100586, "global_step": 22695, "epoch": 540} {"train_loss": -5.328386306762695, "global_step": 22696, "epoch": 540} {"train_loss": -5.365697860717773, "global_step": 22697, "epoch": 540} {"train_loss": -5.465704441070557, "global_step": 22698, "epoch": 540} {"train_loss": -5.422842979431152, "global_step": 22699, "epoch": 540} {"train_loss": -5.3142499923706055, "global_step": 22700, "epoch": 540} {"train_loss": -5.371837615966797, "global_step": 22701, "epoch": 540} {"train_loss": -5.210888385772705, "global_step": 22702, "epoch": 540} {"train_loss": -5.524465560913086, "global_step": 22703, "epoch": 540} {"train_loss": -5.240973472595215, "global_step": 22704, "epoch": 540} {"train_loss": -5.293634414672852, "global_step": 22705, "epoch": 540} {"train_loss": -5.378132343292236, "global_step": 22706, "epoch": 540} {"train_loss": -5.32318639755249, "global_step": 22707, "epoch": 540} {"train_loss": -5.317330837249756, "global_step": 22708, "epoch": 540} {"train_loss": -5.341503143310547, "global_step": 22709, "epoch": 540} {"train_loss": -5.110492706298828, "global_step": 22710, "epoch": 540} {"train_loss": -5.279088973999023, "global_step": 22711, "epoch": 540} {"train_loss": -5.186440944671631, "global_step": 22712, "epoch": 540} {"train_loss": -5.398185729980469, "global_step": 22713, "epoch": 540} {"train_loss": -5.232030868530273, "global_step": 22714, "epoch": 540} {"train_loss": -5.411351203918457, "global_step": 22715, "epoch": 540} {"train_loss": -5.186685562133789, "global_step": 22716, "epoch": 540} {"train_loss": -5.284817695617676, "global_step": 22717, "epoch": 540} {"train_loss": -5.4138383865356445, "global_step": 22718, "epoch": 540} {"train_loss": -5.290646553039551, "global_step": 22719, "epoch": 540} {"train_loss": -5.320969581604004, "global_step": 22720, "epoch": 540} {"train_loss": -5.334482420058477, "global_step": 22721, "epoch": 540, "val_loss": 75529.2890625} {"train_loss": -5.454084873199463, "global_step": 22722, "epoch": 541} {"train_loss": -5.351494789123535, "global_step": 22723, "epoch": 541} {"train_loss": -5.38038444519043, "global_step": 22724, "epoch": 541} {"train_loss": -5.3085832595825195, "global_step": 22725, "epoch": 541} {"train_loss": -5.429309844970703, "global_step": 22726, "epoch": 541} {"train_loss": -5.441900730133057, "global_step": 22727, "epoch": 541} {"train_loss": -5.345444679260254, "global_step": 22728, "epoch": 541} {"train_loss": -5.438477039337158, "global_step": 22729, "epoch": 541} {"train_loss": -5.362695693969727, "global_step": 22730, "epoch": 541} {"train_loss": -5.1780500411987305, "global_step": 22731, "epoch": 541} {"train_loss": -5.275537014007568, "global_step": 22732, "epoch": 541} {"train_loss": -5.393603324890137, "global_step": 22733, "epoch": 541} {"train_loss": -5.378355979919434, "global_step": 22734, "epoch": 541} {"train_loss": -5.290161609649658, "global_step": 22735, "epoch": 541} {"train_loss": -5.431162357330322, "global_step": 22736, "epoch": 541} {"train_loss": -5.46152925491333, "global_step": 22737, "epoch": 541} {"train_loss": -5.213179588317871, "global_step": 22738, "epoch": 541} {"train_loss": -5.252729415893555, "global_step": 22739, "epoch": 541} {"train_loss": -5.198022365570068, "global_step": 22740, "epoch": 541} {"train_loss": -5.401361465454102, "global_step": 22741, "epoch": 541} {"train_loss": -5.373763084411621, "global_step": 22742, "epoch": 541} {"train_loss": -5.233186721801758, "global_step": 22743, "epoch": 541} {"train_loss": -5.455117702484131, "global_step": 22744, "epoch": 541} {"train_loss": -5.163511753082275, "global_step": 22745, "epoch": 541} {"train_loss": -5.258810997009277, "global_step": 22746, "epoch": 541} {"train_loss": -5.214021682739258, "global_step": 22747, "epoch": 541} {"train_loss": -5.292858123779297, "global_step": 22748, "epoch": 541} {"train_loss": -5.316277027130127, "global_step": 22749, "epoch": 541} {"train_loss": -5.279022216796875, "global_step": 22750, "epoch": 541} {"train_loss": -5.24161434173584, "global_step": 22751, "epoch": 541} {"train_loss": -5.466586112976074, "global_step": 22752, "epoch": 541} {"train_loss": -5.305527687072754, "global_step": 22753, "epoch": 541} {"train_loss": -5.344851493835449, "global_step": 22754, "epoch": 541} {"train_loss": -5.322013854980469, "global_step": 22755, "epoch": 541} {"train_loss": -5.245153903961182, "global_step": 22756, "epoch": 541} {"train_loss": -5.303160190582275, "global_step": 22757, "epoch": 541} {"train_loss": -5.462391376495361, "global_step": 22758, "epoch": 541} {"train_loss": -5.403504371643066, "global_step": 22759, "epoch": 541} {"train_loss": -5.188117027282715, "global_step": 22760, "epoch": 541} {"train_loss": -5.350308418273926, "global_step": 22761, "epoch": 541} {"train_loss": -5.32273006439209, "global_step": 22762, "epoch": 541} {"train_loss": -5.33012935093471, "global_step": 22763, "epoch": 541, "val_loss": 75911.59375} {"train_loss": -5.411552429199219, "global_step": 22764, "epoch": 542} {"train_loss": -5.301868438720703, "global_step": 22765, "epoch": 542} {"train_loss": -5.160181999206543, "global_step": 22766, "epoch": 542} {"train_loss": -5.447183609008789, "global_step": 22767, "epoch": 542} {"train_loss": -5.31491756439209, "global_step": 22768, "epoch": 542} {"train_loss": -5.390890121459961, "global_step": 22769, "epoch": 542} {"train_loss": -5.258286476135254, "global_step": 22770, "epoch": 542} {"train_loss": -5.258626937866211, "global_step": 22771, "epoch": 542} {"train_loss": -5.259283065795898, "global_step": 22772, "epoch": 542} {"train_loss": -5.253511428833008, "global_step": 22773, "epoch": 542} {"train_loss": -5.355470657348633, "global_step": 22774, "epoch": 542} {"train_loss": -5.263915061950684, "global_step": 22775, "epoch": 542} {"train_loss": -5.326394557952881, "global_step": 22776, "epoch": 542} {"train_loss": -5.254510879516602, "global_step": 22777, "epoch": 542} {"train_loss": -5.236783027648926, "global_step": 22778, "epoch": 542} {"train_loss": -5.363475322723389, "global_step": 22779, "epoch": 542} {"train_loss": -5.326142311096191, "global_step": 22780, "epoch": 542} {"train_loss": -5.2591962814331055, "global_step": 22781, "epoch": 542} {"train_loss": -5.303682327270508, "global_step": 22782, "epoch": 542} {"train_loss": -5.278791904449463, "global_step": 22783, "epoch": 542} {"train_loss": -5.426718235015869, "global_step": 22784, "epoch": 542} {"train_loss": -5.322051048278809, "global_step": 22785, "epoch": 542} {"train_loss": -5.290953636169434, "global_step": 22786, "epoch": 542} {"train_loss": -5.216687202453613, "global_step": 22787, "epoch": 542} {"train_loss": -5.321202754974365, "global_step": 22788, "epoch": 542} {"train_loss": -5.301031589508057, "global_step": 22789, "epoch": 542} {"train_loss": -5.320692539215088, "global_step": 22790, "epoch": 542} {"train_loss": -5.274410724639893, "global_step": 22791, "epoch": 542} {"train_loss": -5.211919784545898, "global_step": 22792, "epoch": 542} {"train_loss": -5.375017166137695, "global_step": 22793, "epoch": 542} {"train_loss": -5.290533065795898, "global_step": 22794, "epoch": 542} {"train_loss": -5.165927886962891, "global_step": 22795, "epoch": 542} {"train_loss": -5.4003753662109375, "global_step": 22796, "epoch": 542} {"train_loss": -5.263403415679932, "global_step": 22797, "epoch": 542} {"train_loss": -5.17094612121582, "global_step": 22798, "epoch": 542} {"train_loss": -5.34576416015625, "global_step": 22799, "epoch": 542} {"train_loss": -5.3303632736206055, "global_step": 22800, "epoch": 542} {"train_loss": -5.3466081619262695, "global_step": 22801, "epoch": 542} {"train_loss": -5.371541976928711, "global_step": 22802, "epoch": 542} {"train_loss": -5.187194347381592, "global_step": 22803, "epoch": 542} {"train_loss": -5.25455904006958, "global_step": 22804, "epoch": 542} {"train_loss": -5.298813763118925, "global_step": 22805, "epoch": 542, "val_loss": 76104.0546875} {"train_loss": -5.428062438964844, "global_step": 22806, "epoch": 543} {"train_loss": -5.309673309326172, "global_step": 22807, "epoch": 543} {"train_loss": -5.414397716522217, "global_step": 22808, "epoch": 543} {"train_loss": -5.266148567199707, "global_step": 22809, "epoch": 543} {"train_loss": -5.263897895812988, "global_step": 22810, "epoch": 543} {"train_loss": -5.3352203369140625, "global_step": 22811, "epoch": 543} {"train_loss": -5.343992710113525, "global_step": 22812, "epoch": 543} {"train_loss": -5.199994087219238, "global_step": 22813, "epoch": 543} {"train_loss": -5.2686872482299805, "global_step": 22814, "epoch": 543} {"train_loss": -5.424882888793945, "global_step": 22815, "epoch": 543} {"train_loss": -5.495716094970703, "global_step": 22816, "epoch": 543} {"train_loss": -5.234061241149902, "global_step": 22817, "epoch": 543} {"train_loss": -5.332983016967773, "global_step": 22818, "epoch": 543} {"train_loss": -5.2610182762146, "global_step": 22819, "epoch": 543} {"train_loss": -5.297357559204102, "global_step": 22820, "epoch": 543} {"train_loss": -5.439587593078613, "global_step": 22821, "epoch": 543} {"train_loss": -5.254239559173584, "global_step": 22822, "epoch": 543} {"train_loss": -5.34384822845459, "global_step": 22823, "epoch": 543} {"train_loss": -5.450042724609375, "global_step": 22824, "epoch": 543} {"train_loss": -5.230587005615234, "global_step": 22825, "epoch": 543} {"train_loss": -5.47418212890625, "global_step": 22826, "epoch": 543} {"train_loss": -5.365666389465332, "global_step": 22827, "epoch": 543} {"train_loss": -5.423646926879883, "global_step": 22828, "epoch": 543} {"train_loss": -5.28062629699707, "global_step": 22829, "epoch": 543} {"train_loss": -5.320261001586914, "global_step": 22830, "epoch": 543} {"train_loss": -5.398647308349609, "global_step": 22831, "epoch": 543} {"train_loss": -5.325112342834473, "global_step": 22832, "epoch": 543} {"train_loss": -5.3815155029296875, "global_step": 22833, "epoch": 543} {"train_loss": -5.418201446533203, "global_step": 22834, "epoch": 543} {"train_loss": -5.349876403808594, "global_step": 22835, "epoch": 543} {"train_loss": -5.47424840927124, "global_step": 22836, "epoch": 543} {"train_loss": -5.403521537780762, "global_step": 22837, "epoch": 543} {"train_loss": -5.432979583740234, "global_step": 22838, "epoch": 543} {"train_loss": -5.144604682922363, "global_step": 22839, "epoch": 543} {"train_loss": -5.394420623779297, "global_step": 22840, "epoch": 543} {"train_loss": -5.354434967041016, "global_step": 22841, "epoch": 543} {"train_loss": -5.264989376068115, "global_step": 22842, "epoch": 543} {"train_loss": -5.33349609375, "global_step": 22843, "epoch": 543} {"train_loss": -5.3360090255737305, "global_step": 22844, "epoch": 543} {"train_loss": -5.372160911560059, "global_step": 22845, "epoch": 543} {"train_loss": -5.330545902252197, "global_step": 22846, "epoch": 543} {"train_loss": -5.344719648361206, "global_step": 22847, "epoch": 543, "val_loss": 77049.9375} {"train_loss": -5.314958095550537, "global_step": 22848, "epoch": 544} {"train_loss": -5.309389114379883, "global_step": 22849, "epoch": 544} {"train_loss": -5.369708061218262, "global_step": 22850, "epoch": 544} {"train_loss": -5.408536434173584, "global_step": 22851, "epoch": 544} {"train_loss": -5.391993999481201, "global_step": 22852, "epoch": 544} {"train_loss": -5.4278154373168945, "global_step": 22853, "epoch": 544} {"train_loss": -5.276610851287842, "global_step": 22854, "epoch": 544} {"train_loss": -5.3710455894470215, "global_step": 22855, "epoch": 544} {"train_loss": -5.370532035827637, "global_step": 22856, "epoch": 544} {"train_loss": -5.219611167907715, "global_step": 22857, "epoch": 544} {"train_loss": -5.4003424644470215, "global_step": 22858, "epoch": 544} {"train_loss": -5.255247116088867, "global_step": 22859, "epoch": 544} {"train_loss": -5.189147472381592, "global_step": 22860, "epoch": 544} {"train_loss": -5.364306449890137, "global_step": 22861, "epoch": 544} {"train_loss": -5.307967662811279, "global_step": 22862, "epoch": 544} {"train_loss": -5.250175476074219, "global_step": 22863, "epoch": 544} {"train_loss": -5.223110198974609, "global_step": 22864, "epoch": 544} {"train_loss": -5.4479780197143555, "global_step": 22865, "epoch": 544} {"train_loss": -5.389618873596191, "global_step": 22866, "epoch": 544} {"train_loss": -5.20793342590332, "global_step": 22867, "epoch": 544} {"train_loss": -5.369549751281738, "global_step": 22868, "epoch": 544} {"train_loss": -5.333330154418945, "global_step": 22869, "epoch": 544} {"train_loss": -5.398900985717773, "global_step": 22870, "epoch": 544} {"train_loss": -5.400304794311523, "global_step": 22871, "epoch": 544} {"train_loss": -5.324586868286133, "global_step": 22872, "epoch": 544} {"train_loss": -5.281734466552734, "global_step": 22873, "epoch": 544} {"train_loss": -5.296405792236328, "global_step": 22874, "epoch": 544} {"train_loss": -5.356786251068115, "global_step": 22875, "epoch": 544} {"train_loss": -5.465319633483887, "global_step": 22876, "epoch": 544} {"train_loss": -5.372137069702148, "global_step": 22877, "epoch": 544} {"train_loss": -5.415732383728027, "global_step": 22878, "epoch": 544} {"train_loss": -5.393488883972168, "global_step": 22879, "epoch": 544} {"train_loss": -5.3341779708862305, "global_step": 22880, "epoch": 544} {"train_loss": -5.472938537597656, "global_step": 22881, "epoch": 544} {"train_loss": -5.329713821411133, "global_step": 22882, "epoch": 544} {"train_loss": -5.240181922912598, "global_step": 22883, "epoch": 544} {"train_loss": -5.3346357345581055, "global_step": 22884, "epoch": 544} {"train_loss": -5.378384590148926, "global_step": 22885, "epoch": 544} {"train_loss": -5.453337669372559, "global_step": 22886, "epoch": 544} {"train_loss": -5.504929065704346, "global_step": 22887, "epoch": 544} {"train_loss": -5.480747222900391, "global_step": 22888, "epoch": 544} {"train_loss": -5.349936632882981, "global_step": 22889, "epoch": 544, "val_loss": 76325.3046875} {"train_loss": -5.255449295043945, "global_step": 22890, "epoch": 545} {"train_loss": -5.448391914367676, "global_step": 22891, "epoch": 545} {"train_loss": -5.206409931182861, "global_step": 22892, "epoch": 545} {"train_loss": -5.279475212097168, "global_step": 22893, "epoch": 545} {"train_loss": -5.398357391357422, "global_step": 22894, "epoch": 545} {"train_loss": -5.2896199226379395, "global_step": 22895, "epoch": 545} {"train_loss": -5.5006513595581055, "global_step": 22896, "epoch": 545} {"train_loss": -5.29765510559082, "global_step": 22897, "epoch": 545} {"train_loss": -5.40300989151001, "global_step": 22898, "epoch": 545} {"train_loss": -5.384476661682129, "global_step": 22899, "epoch": 545} {"train_loss": -5.529984474182129, "global_step": 22900, "epoch": 545} {"train_loss": -5.370937347412109, "global_step": 22901, "epoch": 545} {"train_loss": -5.249173641204834, "global_step": 22902, "epoch": 545} {"train_loss": -5.310609817504883, "global_step": 22903, "epoch": 545} {"train_loss": -5.349312782287598, "global_step": 22904, "epoch": 545} {"train_loss": -5.304713249206543, "global_step": 22905, "epoch": 545} {"train_loss": -5.3672027587890625, "global_step": 22906, "epoch": 545} {"train_loss": -5.266021728515625, "global_step": 22907, "epoch": 545} {"train_loss": -5.355164051055908, "global_step": 22908, "epoch": 545} {"train_loss": -5.264876842498779, "global_step": 22909, "epoch": 545} {"train_loss": -5.334139823913574, "global_step": 22910, "epoch": 545} {"train_loss": -5.240075588226318, "global_step": 22911, "epoch": 545} {"train_loss": -5.402116298675537, "global_step": 22912, "epoch": 545} {"train_loss": -5.268044948577881, "global_step": 22913, "epoch": 545} {"train_loss": -5.372228622436523, "global_step": 22914, "epoch": 545} {"train_loss": -5.530854225158691, "global_step": 22915, "epoch": 545} {"train_loss": -5.354892730712891, "global_step": 22916, "epoch": 545} {"train_loss": -5.399104118347168, "global_step": 22917, "epoch": 545} {"train_loss": -5.373088836669922, "global_step": 22918, "epoch": 545} {"train_loss": -5.359394550323486, "global_step": 22919, "epoch": 545} {"train_loss": -5.411816120147705, "global_step": 22920, "epoch": 545} {"train_loss": -5.313023567199707, "global_step": 22921, "epoch": 545} {"train_loss": -5.314044952392578, "global_step": 22922, "epoch": 545} {"train_loss": -5.381775856018066, "global_step": 22923, "epoch": 545} {"train_loss": -5.423300266265869, "global_step": 22924, "epoch": 545} {"train_loss": -5.306725025177002, "global_step": 22925, "epoch": 545} {"train_loss": -5.3960161209106445, "global_step": 22926, "epoch": 545} {"train_loss": -5.377382278442383, "global_step": 22927, "epoch": 545} {"train_loss": -5.279411315917969, "global_step": 22928, "epoch": 545} {"train_loss": -5.355704307556152, "global_step": 22929, "epoch": 545} {"train_loss": -5.269521713256836, "global_step": 22930, "epoch": 545} {"train_loss": -5.348111447833833, "global_step": 22931, "epoch": 545, "val_loss": 76155.2578125} {"train_loss": -5.385714530944824, "global_step": 22932, "epoch": 546} {"train_loss": -5.428187370300293, "global_step": 22933, "epoch": 546} {"train_loss": -5.350652694702148, "global_step": 22934, "epoch": 546} {"train_loss": -5.3010640144348145, "global_step": 22935, "epoch": 546} {"train_loss": -5.407831192016602, "global_step": 22936, "epoch": 546} {"train_loss": -5.39227819442749, "global_step": 22937, "epoch": 546} {"train_loss": -5.353111743927002, "global_step": 22938, "epoch": 546} {"train_loss": -5.393991470336914, "global_step": 22939, "epoch": 546} {"train_loss": -5.348167896270752, "global_step": 22940, "epoch": 546} {"train_loss": -5.382665634155273, "global_step": 22941, "epoch": 546} {"train_loss": -5.454519271850586, "global_step": 22942, "epoch": 546} {"train_loss": -5.334627151489258, "global_step": 22943, "epoch": 546} {"train_loss": -5.209338665008545, "global_step": 22944, "epoch": 546} {"train_loss": -5.312687873840332, "global_step": 22945, "epoch": 546} {"train_loss": -5.4095892906188965, "global_step": 22946, "epoch": 546} {"train_loss": -5.434691905975342, "global_step": 22947, "epoch": 546} {"train_loss": -5.466040134429932, "global_step": 22948, "epoch": 546} {"train_loss": -5.308732032775879, "global_step": 22949, "epoch": 546} {"train_loss": -5.468538761138916, "global_step": 22950, "epoch": 546} {"train_loss": -5.429594039916992, "global_step": 22951, "epoch": 546} {"train_loss": -5.284996032714844, "global_step": 22952, "epoch": 546} {"train_loss": -5.342304229736328, "global_step": 22953, "epoch": 546} {"train_loss": -5.386447906494141, "global_step": 22954, "epoch": 546} {"train_loss": -5.4533586502075195, "global_step": 22955, "epoch": 546} {"train_loss": -5.416162967681885, "global_step": 22956, "epoch": 546} {"train_loss": -5.370096206665039, "global_step": 22957, "epoch": 546} {"train_loss": -5.436501979827881, "global_step": 22958, "epoch": 546} {"train_loss": -5.3987603187561035, "global_step": 22959, "epoch": 546} {"train_loss": -5.237054347991943, "global_step": 22960, "epoch": 546} {"train_loss": -5.471428871154785, "global_step": 22961, "epoch": 546} {"train_loss": -5.356450080871582, "global_step": 22962, "epoch": 546} {"train_loss": -5.427250385284424, "global_step": 22963, "epoch": 546} {"train_loss": -5.315920829772949, "global_step": 22964, "epoch": 546} {"train_loss": -5.418546199798584, "global_step": 22965, "epoch": 546} {"train_loss": -5.306976795196533, "global_step": 22966, "epoch": 546} {"train_loss": -5.324943542480469, "global_step": 22967, "epoch": 546} {"train_loss": -5.240628719329834, "global_step": 22968, "epoch": 546} {"train_loss": -5.226200103759766, "global_step": 22969, "epoch": 546} {"train_loss": -5.304116725921631, "global_step": 22970, "epoch": 546} {"train_loss": -5.258214950561523, "global_step": 22971, "epoch": 546} {"train_loss": -5.2891459465026855, "global_step": 22972, "epoch": 546} {"train_loss": -5.357902163550968, "global_step": 22973, "epoch": 546, "val_loss": 76097.953125} {"train_loss": -5.28568696975708, "global_step": 22974, "epoch": 547} {"train_loss": -5.147570610046387, "global_step": 22975, "epoch": 547} {"train_loss": -5.314501762390137, "global_step": 22976, "epoch": 547} {"train_loss": -5.323791980743408, "global_step": 22977, "epoch": 547} {"train_loss": -5.198575973510742, "global_step": 22978, "epoch": 547} {"train_loss": -5.289301872253418, "global_step": 22979, "epoch": 547} {"train_loss": -5.227631568908691, "global_step": 22980, "epoch": 547} {"train_loss": -5.320886611938477, "global_step": 22981, "epoch": 547} {"train_loss": -5.280193328857422, "global_step": 22982, "epoch": 547} {"train_loss": -5.4996819496154785, "global_step": 22983, "epoch": 547} {"train_loss": -5.211645603179932, "global_step": 22984, "epoch": 547} {"train_loss": -5.232797145843506, "global_step": 22985, "epoch": 547} {"train_loss": -5.417386531829834, "global_step": 22986, "epoch": 547} {"train_loss": -5.370546340942383, "global_step": 22987, "epoch": 547} {"train_loss": -5.401094436645508, "global_step": 22988, "epoch": 547} {"train_loss": -5.4166412353515625, "global_step": 22989, "epoch": 547} {"train_loss": -5.269567012786865, "global_step": 22990, "epoch": 547} {"train_loss": -5.260326862335205, "global_step": 22991, "epoch": 547} {"train_loss": -5.42899751663208, "global_step": 22992, "epoch": 547} {"train_loss": -5.4152021408081055, "global_step": 22993, "epoch": 547} {"train_loss": -5.32153844833374, "global_step": 22994, "epoch": 547} {"train_loss": -5.336826801300049, "global_step": 22995, "epoch": 547} {"train_loss": -5.26489782333374, "global_step": 22996, "epoch": 547} {"train_loss": -5.2332258224487305, "global_step": 22997, "epoch": 547} {"train_loss": -5.419203758239746, "global_step": 22998, "epoch": 547} {"train_loss": -5.1925177574157715, "global_step": 22999, "epoch": 547} {"train_loss": -5.311772346496582, "global_step": 23000, "epoch": 547} {"train_loss": -5.323602199554443, "global_step": 23001, "epoch": 547} {"train_loss": -5.298820495605469, "global_step": 23002, "epoch": 547} {"train_loss": -5.346844673156738, "global_step": 23003, "epoch": 547} {"train_loss": -5.372607231140137, "global_step": 23004, "epoch": 547} {"train_loss": -5.331182956695557, "global_step": 23005, "epoch": 547} {"train_loss": -5.283143043518066, "global_step": 23006, "epoch": 547} {"train_loss": -5.248029708862305, "global_step": 23007, "epoch": 547} {"train_loss": -5.289555549621582, "global_step": 23008, "epoch": 547} {"train_loss": -5.332824230194092, "global_step": 23009, "epoch": 547} {"train_loss": -5.375489234924316, "global_step": 23010, "epoch": 547} {"train_loss": -5.221962928771973, "global_step": 23011, "epoch": 547} {"train_loss": -5.297475337982178, "global_step": 23012, "epoch": 547} {"train_loss": -5.315252304077148, "global_step": 23013, "epoch": 547} {"train_loss": -5.373594284057617, "global_step": 23014, "epoch": 547} {"train_loss": -5.312202499026344, "global_step": 23015, "epoch": 547, "val_loss": 75547.625} {"train_loss": -5.361611366271973, "global_step": 23016, "epoch": 548} {"train_loss": -5.384998321533203, "global_step": 23017, "epoch": 548} {"train_loss": -5.392848968505859, "global_step": 23018, "epoch": 548} {"train_loss": -5.32160758972168, "global_step": 23019, "epoch": 548} {"train_loss": -5.137249946594238, "global_step": 23020, "epoch": 548} {"train_loss": -5.25645637512207, "global_step": 23021, "epoch": 548} {"train_loss": -5.165064811706543, "global_step": 23022, "epoch": 548} {"train_loss": -5.238124370574951, "global_step": 23023, "epoch": 548} {"train_loss": -5.401268005371094, "global_step": 23024, "epoch": 548} {"train_loss": -5.420536041259766, "global_step": 23025, "epoch": 548} {"train_loss": -5.420080184936523, "global_step": 23026, "epoch": 548} {"train_loss": -5.484661102294922, "global_step": 23027, "epoch": 548} {"train_loss": -5.351752281188965, "global_step": 23028, "epoch": 548} {"train_loss": -5.307093620300293, "global_step": 23029, "epoch": 548} {"train_loss": -5.28920316696167, "global_step": 23030, "epoch": 548} {"train_loss": -5.437915325164795, "global_step": 23031, "epoch": 548} {"train_loss": -5.422231674194336, "global_step": 23032, "epoch": 548} {"train_loss": -5.265382289886475, "global_step": 23033, "epoch": 548} {"train_loss": -5.3633952140808105, "global_step": 23034, "epoch": 548} {"train_loss": -5.224931716918945, "global_step": 23035, "epoch": 548} {"train_loss": -5.243307113647461, "global_step": 23036, "epoch": 548} {"train_loss": -5.3434157371521, "global_step": 23037, "epoch": 548} {"train_loss": -5.283280372619629, "global_step": 23038, "epoch": 548} {"train_loss": -5.282456398010254, "global_step": 23039, "epoch": 548} {"train_loss": -5.4933881759643555, "global_step": 23040, "epoch": 548} {"train_loss": -5.210346221923828, "global_step": 23041, "epoch": 548} {"train_loss": -5.342962741851807, "global_step": 23042, "epoch": 548} {"train_loss": -5.173799514770508, "global_step": 23043, "epoch": 548} {"train_loss": -5.224370956420898, "global_step": 23044, "epoch": 548} {"train_loss": -5.329384803771973, "global_step": 23045, "epoch": 548} {"train_loss": -5.1776123046875, "global_step": 23046, "epoch": 548} {"train_loss": -5.3246049880981445, "global_step": 23047, "epoch": 548} {"train_loss": -5.36068058013916, "global_step": 23048, "epoch": 548} {"train_loss": -5.460572719573975, "global_step": 23049, "epoch": 548} {"train_loss": -5.294212341308594, "global_step": 23050, "epoch": 548} {"train_loss": -5.21115255355835, "global_step": 23051, "epoch": 548} {"train_loss": -5.245811462402344, "global_step": 23052, "epoch": 548} {"train_loss": -5.334351539611816, "global_step": 23053, "epoch": 548} {"train_loss": -5.2647199630737305, "global_step": 23054, "epoch": 548} {"train_loss": -5.316205978393555, "global_step": 23055, "epoch": 548} {"train_loss": -5.403496265411377, "global_step": 23056, "epoch": 548} {"train_loss": -5.319458530062721, "global_step": 23057, "epoch": 548, "val_loss": 76025.1796875} {"train_loss": -5.273204803466797, "global_step": 23058, "epoch": 549} {"train_loss": -5.368105888366699, "global_step": 23059, "epoch": 549} {"train_loss": -5.352535247802734, "global_step": 23060, "epoch": 549} {"train_loss": -5.491222858428955, "global_step": 23061, "epoch": 549} {"train_loss": -5.322155952453613, "global_step": 23062, "epoch": 549} {"train_loss": -5.429350852966309, "global_step": 23063, "epoch": 549} {"train_loss": -5.545139312744141, "global_step": 23064, "epoch": 549} {"train_loss": -5.307498931884766, "global_step": 23065, "epoch": 549} {"train_loss": -5.355135917663574, "global_step": 23066, "epoch": 549} {"train_loss": -5.404876232147217, "global_step": 23067, "epoch": 549} {"train_loss": -5.355969429016113, "global_step": 23068, "epoch": 549} {"train_loss": -5.426932334899902, "global_step": 23069, "epoch": 549} {"train_loss": -5.231696128845215, "global_step": 23070, "epoch": 549} {"train_loss": -5.383452892303467, "global_step": 23071, "epoch": 549} {"train_loss": -5.331586837768555, "global_step": 23072, "epoch": 549} {"train_loss": -5.2362494468688965, "global_step": 23073, "epoch": 549} {"train_loss": -5.313177108764648, "global_step": 23074, "epoch": 549} {"train_loss": -5.408405303955078, "global_step": 23075, "epoch": 549} {"train_loss": -5.322657585144043, "global_step": 23076, "epoch": 549} {"train_loss": -5.319614410400391, "global_step": 23077, "epoch": 549} {"train_loss": -5.311178207397461, "global_step": 23078, "epoch": 549} {"train_loss": -5.300248622894287, "global_step": 23079, "epoch": 549} {"train_loss": -5.332222938537598, "global_step": 23080, "epoch": 549} {"train_loss": -5.260781288146973, "global_step": 23081, "epoch": 549} {"train_loss": -5.302421569824219, "global_step": 23082, "epoch": 549} {"train_loss": -5.288229465484619, "global_step": 23083, "epoch": 549} {"train_loss": -5.292566299438477, "global_step": 23084, "epoch": 549} {"train_loss": -5.3542160987854, "global_step": 23085, "epoch": 549} {"train_loss": -5.25664758682251, "global_step": 23086, "epoch": 549} {"train_loss": -5.252971172332764, "global_step": 23087, "epoch": 549} {"train_loss": -5.249293327331543, "global_step": 23088, "epoch": 549} {"train_loss": -5.414398670196533, "global_step": 23089, "epoch": 549} {"train_loss": -5.48272705078125, "global_step": 23090, "epoch": 549} {"train_loss": -5.233241081237793, "global_step": 23091, "epoch": 549} {"train_loss": -5.428956508636475, "global_step": 23092, "epoch": 549} {"train_loss": -5.431791305541992, "global_step": 23093, "epoch": 549} {"train_loss": -5.193511486053467, "global_step": 23094, "epoch": 549} {"train_loss": -5.438787460327148, "global_step": 23095, "epoch": 549} {"train_loss": -5.330175399780273, "global_step": 23096, "epoch": 549} {"train_loss": -5.400405406951904, "global_step": 23097, "epoch": 549} {"train_loss": -5.298183441162109, "global_step": 23098, "epoch": 549} {"train_loss": -5.3428413186754495, "global_step": 23099, "epoch": 549, "val_loss": 76342.53125} {"train_loss": -5.346683502197266, "global_step": 23100, "epoch": 550} {"train_loss": -5.3829755783081055, "global_step": 23101, "epoch": 550} {"train_loss": -5.341222763061523, "global_step": 23102, "epoch": 550} {"train_loss": -5.320817470550537, "global_step": 23103, "epoch": 550} {"train_loss": -5.330417633056641, "global_step": 23104, "epoch": 550} {"train_loss": -5.280421733856201, "global_step": 23105, "epoch": 550} {"train_loss": -5.541154384613037, "global_step": 23106, "epoch": 550} {"train_loss": -5.432700157165527, "global_step": 23107, "epoch": 550} {"train_loss": -5.351279258728027, "global_step": 23108, "epoch": 550} {"train_loss": -5.324753761291504, "global_step": 23109, "epoch": 550} {"train_loss": -5.521979331970215, "global_step": 23110, "epoch": 550} {"train_loss": -5.3136491775512695, "global_step": 23111, "epoch": 550} {"train_loss": -5.264778137207031, "global_step": 23112, "epoch": 550} {"train_loss": -5.443094253540039, "global_step": 23113, "epoch": 550} {"train_loss": -5.388888359069824, "global_step": 23114, "epoch": 550} {"train_loss": -5.208107948303223, "global_step": 23115, "epoch": 550} {"train_loss": -5.328003406524658, "global_step": 23116, "epoch": 550} {"train_loss": -5.446974754333496, "global_step": 23117, "epoch": 550} {"train_loss": -5.307290077209473, "global_step": 23118, "epoch": 550} {"train_loss": -5.448646545410156, "global_step": 23119, "epoch": 550} {"train_loss": -5.433701038360596, "global_step": 23120, "epoch": 550} {"train_loss": -5.301250457763672, "global_step": 23121, "epoch": 550} {"train_loss": -5.3519744873046875, "global_step": 23122, "epoch": 550} {"train_loss": -5.330639839172363, "global_step": 23123, "epoch": 550} {"train_loss": -5.3920063972473145, "global_step": 23124, "epoch": 550} {"train_loss": -5.291206359863281, "global_step": 23125, "epoch": 550} {"train_loss": -5.415051460266113, "global_step": 23126, "epoch": 550} {"train_loss": -5.37636661529541, "global_step": 23127, "epoch": 550} {"train_loss": -5.288886547088623, "global_step": 23128, "epoch": 550} {"train_loss": -5.460689544677734, "global_step": 23129, "epoch": 550} {"train_loss": -5.295651435852051, "global_step": 23130, "epoch": 550} {"train_loss": -5.409625053405762, "global_step": 23131, "epoch": 550} {"train_loss": -5.4228339195251465, "global_step": 23132, "epoch": 550} {"train_loss": -5.227391242980957, "global_step": 23133, "epoch": 550} {"train_loss": -5.296710968017578, "global_step": 23134, "epoch": 550} {"train_loss": -5.292930603027344, "global_step": 23135, "epoch": 550} {"train_loss": -5.17647647857666, "global_step": 23136, "epoch": 550} {"train_loss": -5.353856086730957, "global_step": 23137, "epoch": 550} {"train_loss": -5.340083599090576, "global_step": 23138, "epoch": 550} {"train_loss": -5.161107063293457, "global_step": 23139, "epoch": 550} {"train_loss": -5.375574111938477, "global_step": 23140, "epoch": 550} {"train_loss": -5.344507739657447, "global_step": 23141, "epoch": 550, "train/sim_max_reward_0": 0.3234726857639914, "train/sim_max_reward_1": 0.14251610923813304, "train/sim_max_reward_2": 0.34905049236194935, "train/sim_max_reward_3": 0.3690989359415886, "train/sim_max_reward_4": 0.739868171064673, "train/sim_max_reward_5": 0.19298475936218748, "test/sim_max_reward_4500000": 0.7877910362703109, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.181216041969276, "test/sim_max_reward_4500005": 0.1322087129154604, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.20449310429877826, "test/sim_max_reward_4500008": 3.3661464734259636e-05, "test/sim_max_reward_4500009": 0.05358088630893471, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.12352749597495183, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.3495268123326383, "test/sim_max_reward_4500015": 0.12612185724810926, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.6149212983199585, "test/sim_max_reward_4500018": 0.15528278842711352, "test/sim_max_reward_4500019": 0.41112516484054057, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.537560755145806, "test/sim_max_reward_4500022": 0.3325456708853507, "test/sim_max_reward_4500023": 0.49797984948205976, "test/sim_max_reward_4500024": 0.3852489706385757, "test/sim_max_reward_4500025": 0.12048119717649508, "test/sim_max_reward_4500026": 0.13224427054843196, "test/sim_max_reward_4500027": 0.16054649870988597, "test/sim_max_reward_4500028": 0.40875303584589795, "test/sim_max_reward_4500029": 0.24118833133471396, "test/sim_max_reward_4500030": 0.21694335187326444, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.3114998226885722, "test/sim_max_reward_4500034": 0.39427054422721475, "test/sim_max_reward_4500035": 0.13042964280309494, "test/sim_max_reward_4500036": 0.2584676897621627, "test/sim_max_reward_4500037": 0.3086291869497915, "test/sim_max_reward_4500038": 0.2830807482487753, "test/sim_max_reward_4500039": 0.047077790489621865, "test/sim_max_reward_4500040": 0.4513939845525645, "test/sim_max_reward_4500041": 0.36799570636291884, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.36150495595457754, "test/sim_max_reward_4500044": 0.5507233170672499, "test/sim_max_reward_4500045": 0.12365513170603937, "test/sim_max_reward_4500046": 0.5037822134697711, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.1612742175377195, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.35283185895542046, "test/mean_score": 0.2103113273108576, "val_loss": 76326.5} {"train_loss": -5.24235200881958, "global_step": 23142, "epoch": 551} {"train_loss": -5.35723876953125, "global_step": 23143, "epoch": 551} {"train_loss": -5.231448173522949, "global_step": 23144, "epoch": 551} {"train_loss": -5.428934574127197, "global_step": 23145, "epoch": 551} {"train_loss": -5.293001174926758, "global_step": 23146, "epoch": 551} {"train_loss": -5.269479751586914, "global_step": 23147, "epoch": 551} {"train_loss": -5.286542892456055, "global_step": 23148, "epoch": 551} {"train_loss": -5.4457292556762695, "global_step": 23149, "epoch": 551} {"train_loss": -5.419039726257324, "global_step": 23150, "epoch": 551} {"train_loss": -5.350319862365723, "global_step": 23151, "epoch": 551} {"train_loss": -5.370818138122559, "global_step": 23152, "epoch": 551} {"train_loss": -5.279308795928955, "global_step": 23153, "epoch": 551} {"train_loss": -5.230995178222656, "global_step": 23154, "epoch": 551} {"train_loss": -5.393885135650635, "global_step": 23155, "epoch": 551} {"train_loss": -5.331698894500732, "global_step": 23156, "epoch": 551} {"train_loss": -5.351893901824951, "global_step": 23157, "epoch": 551} {"train_loss": -5.332799434661865, "global_step": 23158, "epoch": 551} {"train_loss": -5.226448059082031, "global_step": 23159, "epoch": 551} {"train_loss": -5.333068370819092, "global_step": 23160, "epoch": 551} {"train_loss": -5.310602188110352, "global_step": 23161, "epoch": 551} {"train_loss": -5.359183311462402, "global_step": 23162, "epoch": 551} {"train_loss": -5.333102226257324, "global_step": 23163, "epoch": 551} {"train_loss": -5.470248222351074, "global_step": 23164, "epoch": 551} {"train_loss": -5.18825101852417, "global_step": 23165, "epoch": 551} {"train_loss": -5.354818344116211, "global_step": 23166, "epoch": 551} {"train_loss": -5.364451885223389, "global_step": 23167, "epoch": 551} {"train_loss": -5.266157627105713, "global_step": 23168, "epoch": 551} {"train_loss": -5.22141170501709, "global_step": 23169, "epoch": 551} {"train_loss": -5.316399574279785, "global_step": 23170, "epoch": 551} {"train_loss": -5.302536964416504, "global_step": 23171, "epoch": 551} {"train_loss": -5.290376663208008, "global_step": 23172, "epoch": 551} {"train_loss": -5.380376815795898, "global_step": 23173, "epoch": 551} {"train_loss": -5.2758307456970215, "global_step": 23174, "epoch": 551} {"train_loss": -5.453641891479492, "global_step": 23175, "epoch": 551} {"train_loss": -5.378068923950195, "global_step": 23176, "epoch": 551} {"train_loss": -5.331820964813232, "global_step": 23177, "epoch": 551} {"train_loss": -5.374638557434082, "global_step": 23178, "epoch": 551} {"train_loss": -5.4064812660217285, "global_step": 23179, "epoch": 551} {"train_loss": -5.400975227355957, "global_step": 23180, "epoch": 551} {"train_loss": -5.332587242126465, "global_step": 23181, "epoch": 551} {"train_loss": -5.227175712585449, "global_step": 23182, "epoch": 551} {"train_loss": -5.332785072780791, "global_step": 23183, "epoch": 551, "val_loss": 76492.1875} {"train_loss": -5.524265289306641, "global_step": 23184, "epoch": 552} {"train_loss": -5.400345325469971, "global_step": 23185, "epoch": 552} {"train_loss": -5.473269462585449, "global_step": 23186, "epoch": 552} {"train_loss": -5.440937042236328, "global_step": 23187, "epoch": 552} {"train_loss": -5.357634544372559, "global_step": 23188, "epoch": 552} {"train_loss": -5.238793849945068, "global_step": 23189, "epoch": 552} {"train_loss": -5.340179920196533, "global_step": 23190, "epoch": 552} {"train_loss": -5.535715103149414, "global_step": 23191, "epoch": 552} {"train_loss": -5.335504531860352, "global_step": 23192, "epoch": 552} {"train_loss": -5.401727676391602, "global_step": 23193, "epoch": 552} {"train_loss": -5.559942245483398, "global_step": 23194, "epoch": 552} {"train_loss": -5.3439741134643555, "global_step": 23195, "epoch": 552} {"train_loss": -5.360058784484863, "global_step": 23196, "epoch": 552} {"train_loss": -5.3205108642578125, "global_step": 23197, "epoch": 552} {"train_loss": -5.446560859680176, "global_step": 23198, "epoch": 552} {"train_loss": -5.275381088256836, "global_step": 23199, "epoch": 552} {"train_loss": -5.349348068237305, "global_step": 23200, "epoch": 552} {"train_loss": -5.418532371520996, "global_step": 23201, "epoch": 552} {"train_loss": -5.222015380859375, "global_step": 23202, "epoch": 552} {"train_loss": -5.333660125732422, "global_step": 23203, "epoch": 552} {"train_loss": -5.398221969604492, "global_step": 23204, "epoch": 552} {"train_loss": -5.355496406555176, "global_step": 23205, "epoch": 552} {"train_loss": -5.420266628265381, "global_step": 23206, "epoch": 552} {"train_loss": -5.3515400886535645, "global_step": 23207, "epoch": 552} {"train_loss": -5.091742992401123, "global_step": 23208, "epoch": 552} {"train_loss": -5.3239240646362305, "global_step": 23209, "epoch": 552} {"train_loss": -5.298937797546387, "global_step": 23210, "epoch": 552} {"train_loss": -5.3031697273254395, "global_step": 23211, "epoch": 552} {"train_loss": -5.37624454498291, "global_step": 23212, "epoch": 552} {"train_loss": -5.334502220153809, "global_step": 23213, "epoch": 552} {"train_loss": -5.335104942321777, "global_step": 23214, "epoch": 552} {"train_loss": -5.3706769943237305, "global_step": 23215, "epoch": 552} {"train_loss": -5.441022872924805, "global_step": 23216, "epoch": 552} {"train_loss": -5.428924560546875, "global_step": 23217, "epoch": 552} {"train_loss": -5.309820652008057, "global_step": 23218, "epoch": 552} {"train_loss": -5.403392791748047, "global_step": 23219, "epoch": 552} {"train_loss": -5.308020114898682, "global_step": 23220, "epoch": 552} {"train_loss": -5.376911640167236, "global_step": 23221, "epoch": 552} {"train_loss": -5.35455846786499, "global_step": 23222, "epoch": 552} {"train_loss": -5.332198143005371, "global_step": 23223, "epoch": 552} {"train_loss": -5.144079208374023, "global_step": 23224, "epoch": 552} {"train_loss": -5.359117042450678, "global_step": 23225, "epoch": 552, "val_loss": 75733.9375} {"train_loss": -5.405399799346924, "global_step": 23226, "epoch": 553} {"train_loss": -5.400803089141846, "global_step": 23227, "epoch": 553} {"train_loss": -5.298885345458984, "global_step": 23228, "epoch": 553} {"train_loss": -5.4517974853515625, "global_step": 23229, "epoch": 553} {"train_loss": -5.393710136413574, "global_step": 23230, "epoch": 553} {"train_loss": -5.352268695831299, "global_step": 23231, "epoch": 553} {"train_loss": -5.261977672576904, "global_step": 23232, "epoch": 553} {"train_loss": -5.414484024047852, "global_step": 23233, "epoch": 553} {"train_loss": -5.449741363525391, "global_step": 23234, "epoch": 553} {"train_loss": -5.293791770935059, "global_step": 23235, "epoch": 553} {"train_loss": -5.349950313568115, "global_step": 23236, "epoch": 553} {"train_loss": -5.258026123046875, "global_step": 23237, "epoch": 553} {"train_loss": -5.340198040008545, "global_step": 23238, "epoch": 553} {"train_loss": -5.385223388671875, "global_step": 23239, "epoch": 553} {"train_loss": -5.2860822677612305, "global_step": 23240, "epoch": 553} {"train_loss": -5.365011215209961, "global_step": 23241, "epoch": 553} {"train_loss": -5.340662002563477, "global_step": 23242, "epoch": 553} {"train_loss": -5.276155471801758, "global_step": 23243, "epoch": 553} {"train_loss": -5.1120758056640625, "global_step": 23244, "epoch": 553} {"train_loss": -5.377554416656494, "global_step": 23245, "epoch": 553} {"train_loss": -5.333399295806885, "global_step": 23246, "epoch": 553} {"train_loss": -5.376319408416748, "global_step": 23247, "epoch": 553} {"train_loss": -5.419516563415527, "global_step": 23248, "epoch": 553} {"train_loss": -5.29627799987793, "global_step": 23249, "epoch": 553} {"train_loss": -5.252851486206055, "global_step": 23250, "epoch": 553} {"train_loss": -5.177305221557617, "global_step": 23251, "epoch": 553} {"train_loss": -5.3237504959106445, "global_step": 23252, "epoch": 553} {"train_loss": -5.452676296234131, "global_step": 23253, "epoch": 553} {"train_loss": -5.2013654708862305, "global_step": 23254, "epoch": 553} {"train_loss": -5.393725395202637, "global_step": 23255, "epoch": 553} {"train_loss": -5.312533855438232, "global_step": 23256, "epoch": 553} {"train_loss": -5.1930365562438965, "global_step": 23257, "epoch": 553} {"train_loss": -5.332215785980225, "global_step": 23258, "epoch": 553} {"train_loss": -5.305749416351318, "global_step": 23259, "epoch": 553} {"train_loss": -5.27913761138916, "global_step": 23260, "epoch": 553} {"train_loss": -5.354803085327148, "global_step": 23261, "epoch": 553} {"train_loss": -5.28931999206543, "global_step": 23262, "epoch": 553} {"train_loss": -5.421034812927246, "global_step": 23263, "epoch": 553} {"train_loss": -5.40743350982666, "global_step": 23264, "epoch": 553} {"train_loss": -5.293149948120117, "global_step": 23265, "epoch": 553} {"train_loss": -5.309605121612549, "global_step": 23266, "epoch": 553} {"train_loss": -5.3286679699307395, "global_step": 23267, "epoch": 553, "val_loss": 76206.4921875} {"train_loss": -5.368096351623535, "global_step": 23268, "epoch": 554} {"train_loss": -5.285853385925293, "global_step": 23269, "epoch": 554} {"train_loss": -5.350899696350098, "global_step": 23270, "epoch": 554} {"train_loss": -5.452646255493164, "global_step": 23271, "epoch": 554} {"train_loss": -5.325875759124756, "global_step": 23272, "epoch": 554} {"train_loss": -5.3563127517700195, "global_step": 23273, "epoch": 554} {"train_loss": -5.325695514678955, "global_step": 23274, "epoch": 554} {"train_loss": -5.316193580627441, "global_step": 23275, "epoch": 554} {"train_loss": -5.295184135437012, "global_step": 23276, "epoch": 554} {"train_loss": -5.363531112670898, "global_step": 23277, "epoch": 554} {"train_loss": -5.457704544067383, "global_step": 23278, "epoch": 554} {"train_loss": -5.296662330627441, "global_step": 23279, "epoch": 554} {"train_loss": -5.48524284362793, "global_step": 23280, "epoch": 554} {"train_loss": -5.256031036376953, "global_step": 23281, "epoch": 554} {"train_loss": -5.370636940002441, "global_step": 23282, "epoch": 554} {"train_loss": -5.120337009429932, "global_step": 23283, "epoch": 554} {"train_loss": -5.493755340576172, "global_step": 23284, "epoch": 554} {"train_loss": -5.429493427276611, "global_step": 23285, "epoch": 554} {"train_loss": -5.386102676391602, "global_step": 23286, "epoch": 554} {"train_loss": -5.402278423309326, "global_step": 23287, "epoch": 554} {"train_loss": -5.452844619750977, "global_step": 23288, "epoch": 554} {"train_loss": -5.233559608459473, "global_step": 23289, "epoch": 554} {"train_loss": -5.3912787437438965, "global_step": 23290, "epoch": 554} {"train_loss": -5.367519855499268, "global_step": 23291, "epoch": 554} {"train_loss": -5.5028839111328125, "global_step": 23292, "epoch": 554} {"train_loss": -5.366888046264648, "global_step": 23293, "epoch": 554} {"train_loss": -5.368613243103027, "global_step": 23294, "epoch": 554} {"train_loss": -5.352448463439941, "global_step": 23295, "epoch": 554} {"train_loss": -5.3013505935668945, "global_step": 23296, "epoch": 554} {"train_loss": -5.424468994140625, "global_step": 23297, "epoch": 554} {"train_loss": -5.372161865234375, "global_step": 23298, "epoch": 554} {"train_loss": -5.486690998077393, "global_step": 23299, "epoch": 554} {"train_loss": -5.38631534576416, "global_step": 23300, "epoch": 554} {"train_loss": -5.308759689331055, "global_step": 23301, "epoch": 554} {"train_loss": -5.382744789123535, "global_step": 23302, "epoch": 554} {"train_loss": -5.396130561828613, "global_step": 23303, "epoch": 554} {"train_loss": -5.452792644500732, "global_step": 23304, "epoch": 554} {"train_loss": -5.309805870056152, "global_step": 23305, "epoch": 554} {"train_loss": -5.278383255004883, "global_step": 23306, "epoch": 554} {"train_loss": -5.450813293457031, "global_step": 23307, "epoch": 554} {"train_loss": -5.317709922790527, "global_step": 23308, "epoch": 554} {"train_loss": -5.368017037709554, "global_step": 23309, "epoch": 554, "val_loss": 76310.234375} {"train_loss": -5.330099105834961, "global_step": 23310, "epoch": 555} {"train_loss": -5.383260726928711, "global_step": 23311, "epoch": 555} {"train_loss": -5.357960224151611, "global_step": 23312, "epoch": 555} {"train_loss": -5.405683994293213, "global_step": 23313, "epoch": 555} {"train_loss": -5.4032416343688965, "global_step": 23314, "epoch": 555} {"train_loss": -5.444268226623535, "global_step": 23315, "epoch": 555} {"train_loss": -5.476343631744385, "global_step": 23316, "epoch": 555} {"train_loss": -5.345757484436035, "global_step": 23317, "epoch": 555} {"train_loss": -5.394972324371338, "global_step": 23318, "epoch": 555} {"train_loss": -5.363556861877441, "global_step": 23319, "epoch": 555} {"train_loss": -5.326480865478516, "global_step": 23320, "epoch": 555} {"train_loss": -5.394144058227539, "global_step": 23321, "epoch": 555} {"train_loss": -5.346624374389648, "global_step": 23322, "epoch": 555} {"train_loss": -5.362730979919434, "global_step": 23323, "epoch": 555} {"train_loss": -5.317018032073975, "global_step": 23324, "epoch": 555} {"train_loss": -5.233887195587158, "global_step": 23325, "epoch": 555} {"train_loss": -5.445838451385498, "global_step": 23326, "epoch": 555} {"train_loss": -5.364337921142578, "global_step": 23327, "epoch": 555} {"train_loss": -5.303135395050049, "global_step": 23328, "epoch": 555} {"train_loss": -5.283005714416504, "global_step": 23329, "epoch": 555} {"train_loss": -5.336033344268799, "global_step": 23330, "epoch": 555} {"train_loss": -5.316589832305908, "global_step": 23331, "epoch": 555} {"train_loss": -5.416414260864258, "global_step": 23332, "epoch": 555} {"train_loss": -5.436590671539307, "global_step": 23333, "epoch": 555} {"train_loss": -5.439967155456543, "global_step": 23334, "epoch": 555} {"train_loss": -5.348834991455078, "global_step": 23335, "epoch": 555} {"train_loss": -5.206650733947754, "global_step": 23336, "epoch": 555} {"train_loss": -5.336021423339844, "global_step": 23337, "epoch": 555} {"train_loss": -5.350578308105469, "global_step": 23338, "epoch": 555} {"train_loss": -5.368481636047363, "global_step": 23339, "epoch": 555} {"train_loss": -5.333011627197266, "global_step": 23340, "epoch": 555} {"train_loss": -5.296695709228516, "global_step": 23341, "epoch": 555} {"train_loss": -5.358485221862793, "global_step": 23342, "epoch": 555} {"train_loss": -5.317254066467285, "global_step": 23343, "epoch": 555} {"train_loss": -5.256889343261719, "global_step": 23344, "epoch": 555} {"train_loss": -5.474947929382324, "global_step": 23345, "epoch": 555} {"train_loss": -5.365573883056641, "global_step": 23346, "epoch": 555} {"train_loss": -5.445960998535156, "global_step": 23347, "epoch": 555} {"train_loss": -5.3085503578186035, "global_step": 23348, "epoch": 555} {"train_loss": -5.431643009185791, "global_step": 23349, "epoch": 555} {"train_loss": -5.258996963500977, "global_step": 23350, "epoch": 555} {"train_loss": -5.358496030171712, "global_step": 23351, "epoch": 555, "val_loss": 76601.3125} {"train_loss": -5.439967155456543, "global_step": 23352, "epoch": 556} {"train_loss": -5.3102946281433105, "global_step": 23353, "epoch": 556} {"train_loss": -5.474296569824219, "global_step": 23354, "epoch": 556} {"train_loss": -5.357304573059082, "global_step": 23355, "epoch": 556} {"train_loss": -5.126238822937012, "global_step": 23356, "epoch": 556} {"train_loss": -5.340212821960449, "global_step": 23357, "epoch": 556} {"train_loss": -5.274778842926025, "global_step": 23358, "epoch": 556} {"train_loss": -5.218021869659424, "global_step": 23359, "epoch": 556} {"train_loss": -5.30177640914917, "global_step": 23360, "epoch": 556} {"train_loss": -5.360335350036621, "global_step": 23361, "epoch": 556} {"train_loss": -5.37229061126709, "global_step": 23362, "epoch": 556} {"train_loss": -5.544125556945801, "global_step": 23363, "epoch": 556} {"train_loss": -5.244333267211914, "global_step": 23364, "epoch": 556} {"train_loss": -5.363285064697266, "global_step": 23365, "epoch": 556} {"train_loss": -5.310600757598877, "global_step": 23366, "epoch": 556} {"train_loss": -5.297857284545898, "global_step": 23367, "epoch": 556} {"train_loss": -5.334785461425781, "global_step": 23368, "epoch": 556} {"train_loss": -5.486017227172852, "global_step": 23369, "epoch": 556} {"train_loss": -5.299700736999512, "global_step": 23370, "epoch": 556} {"train_loss": -5.456439971923828, "global_step": 23371, "epoch": 556} {"train_loss": -5.520720958709717, "global_step": 23372, "epoch": 556} {"train_loss": -5.320253372192383, "global_step": 23373, "epoch": 556} {"train_loss": -5.263833045959473, "global_step": 23374, "epoch": 556} {"train_loss": -5.419086456298828, "global_step": 23375, "epoch": 556} {"train_loss": -5.295539855957031, "global_step": 23376, "epoch": 556} {"train_loss": -5.321610450744629, "global_step": 23377, "epoch": 556} {"train_loss": -5.292418479919434, "global_step": 23378, "epoch": 556} {"train_loss": -5.3075103759765625, "global_step": 23379, "epoch": 556} {"train_loss": -5.387373924255371, "global_step": 23380, "epoch": 556} {"train_loss": -5.296220779418945, "global_step": 23381, "epoch": 556} {"train_loss": -5.261763095855713, "global_step": 23382, "epoch": 556} {"train_loss": -5.314783096313477, "global_step": 23383, "epoch": 556} {"train_loss": -5.482752799987793, "global_step": 23384, "epoch": 556} {"train_loss": -5.408883571624756, "global_step": 23385, "epoch": 556} {"train_loss": -5.376450061798096, "global_step": 23386, "epoch": 556} {"train_loss": -5.322757720947266, "global_step": 23387, "epoch": 556} {"train_loss": -5.40105676651001, "global_step": 23388, "epoch": 556} {"train_loss": -5.4235429763793945, "global_step": 23389, "epoch": 556} {"train_loss": -5.453452110290527, "global_step": 23390, "epoch": 556} {"train_loss": -5.2139668464660645, "global_step": 23391, "epoch": 556} {"train_loss": -5.403140068054199, "global_step": 23392, "epoch": 556} {"train_loss": -5.348690191904704, "global_step": 23393, "epoch": 556, "val_loss": 76560.96875} {"train_loss": -5.352866172790527, "global_step": 23394, "epoch": 557} {"train_loss": -5.33423376083374, "global_step": 23395, "epoch": 557} {"train_loss": -5.332469940185547, "global_step": 23396, "epoch": 557} {"train_loss": -5.316454887390137, "global_step": 23397, "epoch": 557} {"train_loss": -5.362255096435547, "global_step": 23398, "epoch": 557} {"train_loss": -5.354576110839844, "global_step": 23399, "epoch": 557} {"train_loss": -5.342501640319824, "global_step": 23400, "epoch": 557} {"train_loss": -5.3574748039245605, "global_step": 23401, "epoch": 557} {"train_loss": -5.287077903747559, "global_step": 23402, "epoch": 557} {"train_loss": -5.333136558532715, "global_step": 23403, "epoch": 557} {"train_loss": -5.287295818328857, "global_step": 23404, "epoch": 557} {"train_loss": -5.317483901977539, "global_step": 23405, "epoch": 557} {"train_loss": -5.47342586517334, "global_step": 23406, "epoch": 557} {"train_loss": -5.381209373474121, "global_step": 23407, "epoch": 557} {"train_loss": -5.377111434936523, "global_step": 23408, "epoch": 557} {"train_loss": -5.223489284515381, "global_step": 23409, "epoch": 557} {"train_loss": -5.425246715545654, "global_step": 23410, "epoch": 557} {"train_loss": -5.424480438232422, "global_step": 23411, "epoch": 557} {"train_loss": -5.366670608520508, "global_step": 23412, "epoch": 557} {"train_loss": -5.361586570739746, "global_step": 23413, "epoch": 557} {"train_loss": -5.3395843505859375, "global_step": 23414, "epoch": 557} {"train_loss": -5.366304874420166, "global_step": 23415, "epoch": 557} {"train_loss": -5.410578727722168, "global_step": 23416, "epoch": 557} {"train_loss": -5.361382484436035, "global_step": 23417, "epoch": 557} {"train_loss": -5.146636962890625, "global_step": 23418, "epoch": 557} {"train_loss": -5.349568843841553, "global_step": 23419, "epoch": 557} {"train_loss": -5.3591718673706055, "global_step": 23420, "epoch": 557} {"train_loss": -5.504990100860596, "global_step": 23421, "epoch": 557} {"train_loss": -5.253891944885254, "global_step": 23422, "epoch": 557} {"train_loss": -5.2457733154296875, "global_step": 23423, "epoch": 557} {"train_loss": -5.288321495056152, "global_step": 23424, "epoch": 557} {"train_loss": -5.408870697021484, "global_step": 23425, "epoch": 557} {"train_loss": -5.282914161682129, "global_step": 23426, "epoch": 557} {"train_loss": -5.395020484924316, "global_step": 23427, "epoch": 557} {"train_loss": -5.489889144897461, "global_step": 23428, "epoch": 557} {"train_loss": -5.178786754608154, "global_step": 23429, "epoch": 557} {"train_loss": -5.302095890045166, "global_step": 23430, "epoch": 557} {"train_loss": -5.497157096862793, "global_step": 23431, "epoch": 557} {"train_loss": -5.461696624755859, "global_step": 23432, "epoch": 557} {"train_loss": -5.453578948974609, "global_step": 23433, "epoch": 557} {"train_loss": -5.3311686515808105, "global_step": 23434, "epoch": 557} {"train_loss": -5.351601532527378, "global_step": 23435, "epoch": 557, "val_loss": 75929.5} {"train_loss": -5.34273624420166, "global_step": 23436, "epoch": 558} {"train_loss": -5.387238502502441, "global_step": 23437, "epoch": 558} {"train_loss": -5.487448692321777, "global_step": 23438, "epoch": 558} {"train_loss": -5.321124076843262, "global_step": 23439, "epoch": 558} {"train_loss": -5.156837463378906, "global_step": 23440, "epoch": 558} {"train_loss": -5.382171154022217, "global_step": 23441, "epoch": 558} {"train_loss": -5.349409580230713, "global_step": 23442, "epoch": 558} {"train_loss": -5.208402156829834, "global_step": 23443, "epoch": 558} {"train_loss": -5.287406921386719, "global_step": 23444, "epoch": 558} {"train_loss": -5.123285293579102, "global_step": 23445, "epoch": 558} {"train_loss": -5.176084995269775, "global_step": 23446, "epoch": 558} {"train_loss": -5.331602573394775, "global_step": 23447, "epoch": 558} {"train_loss": -5.219347953796387, "global_step": 23448, "epoch": 558} {"train_loss": -5.324037551879883, "global_step": 23449, "epoch": 558} {"train_loss": -5.1902055740356445, "global_step": 23450, "epoch": 558} {"train_loss": -5.196204662322998, "global_step": 23451, "epoch": 558} {"train_loss": -5.266348838806152, "global_step": 23452, "epoch": 558} {"train_loss": -5.421451568603516, "global_step": 23453, "epoch": 558} {"train_loss": -5.2680158615112305, "global_step": 23454, "epoch": 558} {"train_loss": -5.267301559448242, "global_step": 23455, "epoch": 558} {"train_loss": -5.388149261474609, "global_step": 23456, "epoch": 558} {"train_loss": -5.293290615081787, "global_step": 23457, "epoch": 558} {"train_loss": -5.23002815246582, "global_step": 23458, "epoch": 558} {"train_loss": -5.249302864074707, "global_step": 23459, "epoch": 558} {"train_loss": -5.32352352142334, "global_step": 23460, "epoch": 558} {"train_loss": -5.229442596435547, "global_step": 23461, "epoch": 558} {"train_loss": -5.234078407287598, "global_step": 23462, "epoch": 558} {"train_loss": -5.317938327789307, "global_step": 23463, "epoch": 558} {"train_loss": -5.4037299156188965, "global_step": 23464, "epoch": 558} {"train_loss": -5.300251007080078, "global_step": 23465, "epoch": 558} {"train_loss": -5.502570152282715, "global_step": 23466, "epoch": 558} {"train_loss": -5.47187614440918, "global_step": 23467, "epoch": 558} {"train_loss": -5.411454200744629, "global_step": 23468, "epoch": 558} {"train_loss": -5.203427314758301, "global_step": 23469, "epoch": 558} {"train_loss": -5.492830276489258, "global_step": 23470, "epoch": 558} {"train_loss": -5.283848762512207, "global_step": 23471, "epoch": 558} {"train_loss": -5.252763271331787, "global_step": 23472, "epoch": 558} {"train_loss": -5.463852882385254, "global_step": 23473, "epoch": 558} {"train_loss": -5.337894439697266, "global_step": 23474, "epoch": 558} {"train_loss": -5.351503372192383, "global_step": 23475, "epoch": 558} {"train_loss": -5.393488883972168, "global_step": 23476, "epoch": 558} {"train_loss": -5.314873729433332, "global_step": 23477, "epoch": 558, "val_loss": 76111.171875} {"train_loss": -5.262414932250977, "global_step": 23478, "epoch": 559} {"train_loss": -5.252287864685059, "global_step": 23479, "epoch": 559} {"train_loss": -5.390164852142334, "global_step": 23480, "epoch": 559} {"train_loss": -5.374959468841553, "global_step": 23481, "epoch": 559} {"train_loss": -5.472708702087402, "global_step": 23482, "epoch": 559} {"train_loss": -5.287101745605469, "global_step": 23483, "epoch": 559} {"train_loss": -5.37750244140625, "global_step": 23484, "epoch": 559} {"train_loss": -5.279325485229492, "global_step": 23485, "epoch": 559} {"train_loss": -5.386013984680176, "global_step": 23486, "epoch": 559} {"train_loss": -5.242988586425781, "global_step": 23487, "epoch": 559} {"train_loss": -5.285586833953857, "global_step": 23488, "epoch": 559} {"train_loss": -5.265342712402344, "global_step": 23489, "epoch": 559} {"train_loss": -5.452354907989502, "global_step": 23490, "epoch": 559} {"train_loss": -5.309959888458252, "global_step": 23491, "epoch": 559} {"train_loss": -5.3320465087890625, "global_step": 23492, "epoch": 559} {"train_loss": -5.430744171142578, "global_step": 23493, "epoch": 559} {"train_loss": -5.432917594909668, "global_step": 23494, "epoch": 559} {"train_loss": -5.4889326095581055, "global_step": 23495, "epoch": 559} {"train_loss": -5.444222450256348, "global_step": 23496, "epoch": 559} {"train_loss": -5.221475601196289, "global_step": 23497, "epoch": 559} {"train_loss": -5.3628129959106445, "global_step": 23498, "epoch": 559} {"train_loss": -5.268343448638916, "global_step": 23499, "epoch": 559} {"train_loss": -5.491235256195068, "global_step": 23500, "epoch": 559} {"train_loss": -5.306058883666992, "global_step": 23501, "epoch": 559} {"train_loss": -5.206511974334717, "global_step": 23502, "epoch": 559} {"train_loss": -5.460042953491211, "global_step": 23503, "epoch": 559} {"train_loss": -5.386507987976074, "global_step": 23504, "epoch": 559} {"train_loss": -5.338143825531006, "global_step": 23505, "epoch": 559} {"train_loss": -5.415835857391357, "global_step": 23506, "epoch": 559} {"train_loss": -5.381942272186279, "global_step": 23507, "epoch": 559} {"train_loss": -5.2725830078125, "global_step": 23508, "epoch": 559} {"train_loss": -5.307689666748047, "global_step": 23509, "epoch": 559} {"train_loss": -5.552026748657227, "global_step": 23510, "epoch": 559} {"train_loss": -5.301083087921143, "global_step": 23511, "epoch": 559} {"train_loss": -5.349415302276611, "global_step": 23512, "epoch": 559} {"train_loss": -5.390923500061035, "global_step": 23513, "epoch": 559} {"train_loss": -5.185290336608887, "global_step": 23514, "epoch": 559} {"train_loss": -5.346621513366699, "global_step": 23515, "epoch": 559} {"train_loss": -5.129002571105957, "global_step": 23516, "epoch": 559} {"train_loss": -5.078563690185547, "global_step": 23517, "epoch": 559} {"train_loss": -5.430706977844238, "global_step": 23518, "epoch": 559} {"train_loss": -5.33643837202163, "global_step": 23519, "epoch": 559, "val_loss": 75951.8828125} {"train_loss": -5.205526351928711, "global_step": 23520, "epoch": 560} {"train_loss": -5.1973676681518555, "global_step": 23521, "epoch": 560} {"train_loss": -5.384880065917969, "global_step": 23522, "epoch": 560} {"train_loss": -5.41225528717041, "global_step": 23523, "epoch": 560} {"train_loss": -5.402383804321289, "global_step": 23524, "epoch": 560} {"train_loss": -5.337298393249512, "global_step": 23525, "epoch": 560} {"train_loss": -5.339351654052734, "global_step": 23526, "epoch": 560} {"train_loss": -5.432781219482422, "global_step": 23527, "epoch": 560} {"train_loss": -5.295671463012695, "global_step": 23528, "epoch": 560} {"train_loss": -5.283544063568115, "global_step": 23529, "epoch": 560} {"train_loss": -5.395829200744629, "global_step": 23530, "epoch": 560} {"train_loss": -5.270902633666992, "global_step": 23531, "epoch": 560} {"train_loss": -5.357982635498047, "global_step": 23532, "epoch": 560} {"train_loss": -5.257139205932617, "global_step": 23533, "epoch": 560} {"train_loss": -5.313376426696777, "global_step": 23534, "epoch": 560} {"train_loss": -5.500002384185791, "global_step": 23535, "epoch": 560} {"train_loss": -5.323693752288818, "global_step": 23536, "epoch": 560} {"train_loss": -5.343165397644043, "global_step": 23537, "epoch": 560} {"train_loss": -5.4537248611450195, "global_step": 23538, "epoch": 560} {"train_loss": -5.310249328613281, "global_step": 23539, "epoch": 560} {"train_loss": -5.3412885665893555, "global_step": 23540, "epoch": 560} {"train_loss": -5.279961585998535, "global_step": 23541, "epoch": 560} {"train_loss": -5.2327880859375, "global_step": 23542, "epoch": 560} {"train_loss": -5.348944187164307, "global_step": 23543, "epoch": 560} {"train_loss": -5.300505638122559, "global_step": 23544, "epoch": 560} {"train_loss": -5.26528263092041, "global_step": 23545, "epoch": 560} {"train_loss": -5.2277679443359375, "global_step": 23546, "epoch": 560} {"train_loss": -5.30856466293335, "global_step": 23547, "epoch": 560} {"train_loss": -5.238487243652344, "global_step": 23548, "epoch": 560} {"train_loss": -5.269469261169434, "global_step": 23549, "epoch": 560} {"train_loss": -5.186144828796387, "global_step": 23550, "epoch": 560} {"train_loss": -5.259973526000977, "global_step": 23551, "epoch": 560} {"train_loss": -5.383236885070801, "global_step": 23552, "epoch": 560} {"train_loss": -5.329301834106445, "global_step": 23553, "epoch": 560} {"train_loss": -5.177274227142334, "global_step": 23554, "epoch": 560} {"train_loss": -5.214055061340332, "global_step": 23555, "epoch": 560} {"train_loss": -5.339601516723633, "global_step": 23556, "epoch": 560} {"train_loss": -5.308770179748535, "global_step": 23557, "epoch": 560} {"train_loss": -5.221565246582031, "global_step": 23558, "epoch": 560} {"train_loss": -5.278475761413574, "global_step": 23559, "epoch": 560} {"train_loss": -5.305391311645508, "global_step": 23560, "epoch": 560} {"train_loss": -5.309078591210501, "global_step": 23561, "epoch": 560, "val_loss": 76222.1953125} {"train_loss": -5.468729496002197, "global_step": 23562, "epoch": 561} {"train_loss": -5.342764854431152, "global_step": 23563, "epoch": 561} {"train_loss": -5.297123908996582, "global_step": 23564, "epoch": 561} {"train_loss": -5.249576568603516, "global_step": 23565, "epoch": 561} {"train_loss": -5.2872209548950195, "global_step": 23566, "epoch": 561} {"train_loss": -5.3515424728393555, "global_step": 23567, "epoch": 561} {"train_loss": -5.311585903167725, "global_step": 23568, "epoch": 561} {"train_loss": -5.379635810852051, "global_step": 23569, "epoch": 561} {"train_loss": -5.423225402832031, "global_step": 23570, "epoch": 561} {"train_loss": -5.3102617263793945, "global_step": 23571, "epoch": 561} {"train_loss": -5.365318298339844, "global_step": 23572, "epoch": 561} {"train_loss": -5.368792533874512, "global_step": 23573, "epoch": 561} {"train_loss": -5.364677429199219, "global_step": 23574, "epoch": 561} {"train_loss": -5.409857749938965, "global_step": 23575, "epoch": 561} {"train_loss": -5.455009460449219, "global_step": 23576, "epoch": 561} {"train_loss": -5.258813858032227, "global_step": 23577, "epoch": 561} {"train_loss": -5.354113578796387, "global_step": 23578, "epoch": 561} {"train_loss": -5.400362014770508, "global_step": 23579, "epoch": 561} {"train_loss": -5.401724815368652, "global_step": 23580, "epoch": 561} {"train_loss": -5.383597373962402, "global_step": 23581, "epoch": 561} {"train_loss": -5.465928077697754, "global_step": 23582, "epoch": 561} {"train_loss": -5.349116802215576, "global_step": 23583, "epoch": 561} {"train_loss": -5.480264663696289, "global_step": 23584, "epoch": 561} {"train_loss": -5.292393684387207, "global_step": 23585, "epoch": 561} {"train_loss": -5.328324317932129, "global_step": 23586, "epoch": 561} {"train_loss": -5.429339408874512, "global_step": 23587, "epoch": 561} {"train_loss": -5.352182388305664, "global_step": 23588, "epoch": 561} {"train_loss": -5.40850830078125, "global_step": 23589, "epoch": 561} {"train_loss": -5.345673084259033, "global_step": 23590, "epoch": 561} {"train_loss": -5.415694236755371, "global_step": 23591, "epoch": 561} {"train_loss": -5.381625175476074, "global_step": 23592, "epoch": 561} {"train_loss": -5.419462203979492, "global_step": 23593, "epoch": 561} {"train_loss": -5.476320743560791, "global_step": 23594, "epoch": 561} {"train_loss": -5.404317855834961, "global_step": 23595, "epoch": 561} {"train_loss": -5.259693145751953, "global_step": 23596, "epoch": 561} {"train_loss": -5.609314441680908, "global_step": 23597, "epoch": 561} {"train_loss": -5.438467979431152, "global_step": 23598, "epoch": 561} {"train_loss": -5.292390823364258, "global_step": 23599, "epoch": 561} {"train_loss": -5.207442283630371, "global_step": 23600, "epoch": 561} {"train_loss": -5.189840793609619, "global_step": 23601, "epoch": 561} {"train_loss": -5.411911964416504, "global_step": 23602, "epoch": 561} {"train_loss": -5.369940326327369, "global_step": 23603, "epoch": 561, "val_loss": 76371.15625} {"train_loss": -5.430858612060547, "global_step": 23604, "epoch": 562} {"train_loss": -5.375875473022461, "global_step": 23605, "epoch": 562} {"train_loss": -5.355216979980469, "global_step": 23606, "epoch": 562} {"train_loss": -5.438589096069336, "global_step": 23607, "epoch": 562} {"train_loss": -5.456571578979492, "global_step": 23608, "epoch": 562} {"train_loss": -5.285266399383545, "global_step": 23609, "epoch": 562} {"train_loss": -5.424246788024902, "global_step": 23610, "epoch": 562} {"train_loss": -5.187593936920166, "global_step": 23611, "epoch": 562} {"train_loss": -5.367897987365723, "global_step": 23612, "epoch": 562} {"train_loss": -5.379395484924316, "global_step": 23613, "epoch": 562} {"train_loss": -5.323543548583984, "global_step": 23614, "epoch": 562} {"train_loss": -5.4314374923706055, "global_step": 23615, "epoch": 562} {"train_loss": -5.397854804992676, "global_step": 23616, "epoch": 562} {"train_loss": -5.206826686859131, "global_step": 23617, "epoch": 562} {"train_loss": -5.200075149536133, "global_step": 23618, "epoch": 562} {"train_loss": -5.40887451171875, "global_step": 23619, "epoch": 562} {"train_loss": -5.299521446228027, "global_step": 23620, "epoch": 562} {"train_loss": -5.447051048278809, "global_step": 23621, "epoch": 562} {"train_loss": -5.333827018737793, "global_step": 23622, "epoch": 562} {"train_loss": -5.455007553100586, "global_step": 23623, "epoch": 562} {"train_loss": -5.281538963317871, "global_step": 23624, "epoch": 562} {"train_loss": -5.396817207336426, "global_step": 23625, "epoch": 562} {"train_loss": -5.334474563598633, "global_step": 23626, "epoch": 562} {"train_loss": -5.331732749938965, "global_step": 23627, "epoch": 562} {"train_loss": -5.356359481811523, "global_step": 23628, "epoch": 562} {"train_loss": -5.446274280548096, "global_step": 23629, "epoch": 562} {"train_loss": -5.4277663230896, "global_step": 23630, "epoch": 562} {"train_loss": -5.333730697631836, "global_step": 23631, "epoch": 562} {"train_loss": -5.2832818031311035, "global_step": 23632, "epoch": 562} {"train_loss": -5.292523384094238, "global_step": 23633, "epoch": 562} {"train_loss": -5.522871971130371, "global_step": 23634, "epoch": 562} {"train_loss": -5.401142120361328, "global_step": 23635, "epoch": 562} {"train_loss": -5.384756088256836, "global_step": 23636, "epoch": 562} {"train_loss": -5.341967582702637, "global_step": 23637, "epoch": 562} {"train_loss": -5.434947967529297, "global_step": 23638, "epoch": 562} {"train_loss": -5.465516090393066, "global_step": 23639, "epoch": 562} {"train_loss": -5.270782947540283, "global_step": 23640, "epoch": 562} {"train_loss": -5.464493751525879, "global_step": 23641, "epoch": 562} {"train_loss": -5.388400554656982, "global_step": 23642, "epoch": 562} {"train_loss": -5.31462287902832, "global_step": 23643, "epoch": 562} {"train_loss": -5.367216110229492, "global_step": 23644, "epoch": 562} {"train_loss": -5.364516973495483, "global_step": 23645, "epoch": 562, "val_loss": 76587.4453125} {"train_loss": -5.361439228057861, "global_step": 23646, "epoch": 563} {"train_loss": -5.368216037750244, "global_step": 23647, "epoch": 563} {"train_loss": -5.31745719909668, "global_step": 23648, "epoch": 563} {"train_loss": -5.413227081298828, "global_step": 23649, "epoch": 563} {"train_loss": -5.521303653717041, "global_step": 23650, "epoch": 563} {"train_loss": -5.297918796539307, "global_step": 23651, "epoch": 563} {"train_loss": -5.416028022766113, "global_step": 23652, "epoch": 563} {"train_loss": -5.291629791259766, "global_step": 23653, "epoch": 563} {"train_loss": -5.300351619720459, "global_step": 23654, "epoch": 563} {"train_loss": -5.243200302124023, "global_step": 23655, "epoch": 563} {"train_loss": -5.480689525604248, "global_step": 23656, "epoch": 563} {"train_loss": -5.235072135925293, "global_step": 23657, "epoch": 563} {"train_loss": -5.425840377807617, "global_step": 23658, "epoch": 563} {"train_loss": -5.271085739135742, "global_step": 23659, "epoch": 563} {"train_loss": -5.2414326667785645, "global_step": 23660, "epoch": 563} {"train_loss": -5.30249547958374, "global_step": 23661, "epoch": 563} {"train_loss": -5.392293453216553, "global_step": 23662, "epoch": 563} {"train_loss": -5.443427085876465, "global_step": 23663, "epoch": 563} {"train_loss": -5.380712509155273, "global_step": 23664, "epoch": 563} {"train_loss": -5.388502597808838, "global_step": 23665, "epoch": 563} {"train_loss": -5.471862316131592, "global_step": 23666, "epoch": 563} {"train_loss": -5.392431259155273, "global_step": 23667, "epoch": 563} {"train_loss": -5.335798263549805, "global_step": 23668, "epoch": 563} {"train_loss": -5.476682186126709, "global_step": 23669, "epoch": 563} {"train_loss": -5.273764133453369, "global_step": 23670, "epoch": 563} {"train_loss": -5.4374189376831055, "global_step": 23671, "epoch": 563} {"train_loss": -5.42396879196167, "global_step": 23672, "epoch": 563} {"train_loss": -5.331347465515137, "global_step": 23673, "epoch": 563} {"train_loss": -5.383831024169922, "global_step": 23674, "epoch": 563} {"train_loss": -5.450908660888672, "global_step": 23675, "epoch": 563} {"train_loss": -5.379513740539551, "global_step": 23676, "epoch": 563} {"train_loss": -5.379528522491455, "global_step": 23677, "epoch": 563} {"train_loss": -5.395637512207031, "global_step": 23678, "epoch": 563} {"train_loss": -5.366418838500977, "global_step": 23679, "epoch": 563} {"train_loss": -5.343926906585693, "global_step": 23680, "epoch": 563} {"train_loss": -5.440556049346924, "global_step": 23681, "epoch": 563} {"train_loss": -5.413507461547852, "global_step": 23682, "epoch": 563} {"train_loss": -5.316777229309082, "global_step": 23683, "epoch": 563} {"train_loss": -5.471296310424805, "global_step": 23684, "epoch": 563} {"train_loss": -5.2959394454956055, "global_step": 23685, "epoch": 563} {"train_loss": -5.447623252868652, "global_step": 23686, "epoch": 563} {"train_loss": -5.377331222806658, "global_step": 23687, "epoch": 563, "val_loss": 76216.0625} {"train_loss": -5.378891944885254, "global_step": 23688, "epoch": 564} {"train_loss": -5.225281238555908, "global_step": 23689, "epoch": 564} {"train_loss": -5.429715633392334, "global_step": 23690, "epoch": 564} {"train_loss": -5.346347808837891, "global_step": 23691, "epoch": 564} {"train_loss": -5.3011956214904785, "global_step": 23692, "epoch": 564} {"train_loss": -5.449782371520996, "global_step": 23693, "epoch": 564} {"train_loss": -5.326563835144043, "global_step": 23694, "epoch": 564} {"train_loss": -5.350521087646484, "global_step": 23695, "epoch": 564} {"train_loss": -5.294860363006592, "global_step": 23696, "epoch": 564} {"train_loss": -5.248434066772461, "global_step": 23697, "epoch": 564} {"train_loss": -5.396799087524414, "global_step": 23698, "epoch": 564} {"train_loss": -5.319584369659424, "global_step": 23699, "epoch": 564} {"train_loss": -5.311009407043457, "global_step": 23700, "epoch": 564} {"train_loss": -5.45801305770874, "global_step": 23701, "epoch": 564} {"train_loss": -5.415193557739258, "global_step": 23702, "epoch": 564} {"train_loss": -5.315827369689941, "global_step": 23703, "epoch": 564} {"train_loss": -5.42572021484375, "global_step": 23704, "epoch": 564} {"train_loss": -5.347175598144531, "global_step": 23705, "epoch": 564} {"train_loss": -5.319276809692383, "global_step": 23706, "epoch": 564} {"train_loss": -5.192168712615967, "global_step": 23707, "epoch": 564} {"train_loss": -5.344108581542969, "global_step": 23708, "epoch": 564} {"train_loss": -5.394146919250488, "global_step": 23709, "epoch": 564} {"train_loss": -5.45179557800293, "global_step": 23710, "epoch": 564} {"train_loss": -5.299442768096924, "global_step": 23711, "epoch": 564} {"train_loss": -5.429631233215332, "global_step": 23712, "epoch": 564} {"train_loss": -5.33326530456543, "global_step": 23713, "epoch": 564} {"train_loss": -5.324268341064453, "global_step": 23714, "epoch": 564} {"train_loss": -5.498159885406494, "global_step": 23715, "epoch": 564} {"train_loss": -5.462202072143555, "global_step": 23716, "epoch": 564} {"train_loss": -5.462652683258057, "global_step": 23717, "epoch": 564} {"train_loss": -5.330782890319824, "global_step": 23718, "epoch": 564} {"train_loss": -5.2842631340026855, "global_step": 23719, "epoch": 564} {"train_loss": -5.486717700958252, "global_step": 23720, "epoch": 564} {"train_loss": -5.515133380889893, "global_step": 23721, "epoch": 564} {"train_loss": -5.3225603103637695, "global_step": 23722, "epoch": 564} {"train_loss": -5.449960708618164, "global_step": 23723, "epoch": 564} {"train_loss": -5.328433513641357, "global_step": 23724, "epoch": 564} {"train_loss": -5.474255561828613, "global_step": 23725, "epoch": 564} {"train_loss": -5.357438564300537, "global_step": 23726, "epoch": 564} {"train_loss": -5.206874370574951, "global_step": 23727, "epoch": 564} {"train_loss": -5.361654281616211, "global_step": 23728, "epoch": 564} {"train_loss": -5.366369656154087, "global_step": 23729, "epoch": 564, "val_loss": 75793.921875} {"train_loss": -5.347344398498535, "global_step": 23730, "epoch": 565} {"train_loss": -5.333469867706299, "global_step": 23731, "epoch": 565} {"train_loss": -5.288997650146484, "global_step": 23732, "epoch": 565} {"train_loss": -5.363019943237305, "global_step": 23733, "epoch": 565} {"train_loss": -5.265921592712402, "global_step": 23734, "epoch": 565} {"train_loss": -5.390985488891602, "global_step": 23735, "epoch": 565} {"train_loss": -5.419001579284668, "global_step": 23736, "epoch": 565} {"train_loss": -5.360750198364258, "global_step": 23737, "epoch": 565} {"train_loss": -5.316762924194336, "global_step": 23738, "epoch": 565} {"train_loss": -5.345774173736572, "global_step": 23739, "epoch": 565} {"train_loss": -5.400712013244629, "global_step": 23740, "epoch": 565} {"train_loss": -5.429574966430664, "global_step": 23741, "epoch": 565} {"train_loss": -5.389404773712158, "global_step": 23742, "epoch": 565} {"train_loss": -5.311615467071533, "global_step": 23743, "epoch": 565} {"train_loss": -5.402190208435059, "global_step": 23744, "epoch": 565} {"train_loss": -5.389598846435547, "global_step": 23745, "epoch": 565} {"train_loss": -5.431743144989014, "global_step": 23746, "epoch": 565} {"train_loss": -5.540684700012207, "global_step": 23747, "epoch": 565} {"train_loss": -5.42319393157959, "global_step": 23748, "epoch": 565} {"train_loss": -5.32091760635376, "global_step": 23749, "epoch": 565} {"train_loss": -5.430233001708984, "global_step": 23750, "epoch": 565} {"train_loss": -5.347835540771484, "global_step": 23751, "epoch": 565} {"train_loss": -5.319159984588623, "global_step": 23752, "epoch": 565} {"train_loss": -5.4155168533325195, "global_step": 23753, "epoch": 565} {"train_loss": -5.353137969970703, "global_step": 23754, "epoch": 565} {"train_loss": -5.204262733459473, "global_step": 23755, "epoch": 565} {"train_loss": -5.3705925941467285, "global_step": 23756, "epoch": 565} {"train_loss": -5.4605560302734375, "global_step": 23757, "epoch": 565} {"train_loss": -5.262722492218018, "global_step": 23758, "epoch": 565} {"train_loss": -5.381720542907715, "global_step": 23759, "epoch": 565} {"train_loss": -5.302757740020752, "global_step": 23760, "epoch": 565} {"train_loss": -5.316733360290527, "global_step": 23761, "epoch": 565} {"train_loss": -5.420012474060059, "global_step": 23762, "epoch": 565} {"train_loss": -5.3703107833862305, "global_step": 23763, "epoch": 565} {"train_loss": -5.438080787658691, "global_step": 23764, "epoch": 565} {"train_loss": -5.380035400390625, "global_step": 23765, "epoch": 565} {"train_loss": -5.374471187591553, "global_step": 23766, "epoch": 565} {"train_loss": -5.480823516845703, "global_step": 23767, "epoch": 565} {"train_loss": -5.281824588775635, "global_step": 23768, "epoch": 565} {"train_loss": -5.416616439819336, "global_step": 23769, "epoch": 565} {"train_loss": -5.303668022155762, "global_step": 23770, "epoch": 565} {"train_loss": -5.367801813852219, "global_step": 23771, "epoch": 565, "val_loss": 76464.7421875} {"train_loss": -5.261734485626221, "global_step": 23772, "epoch": 566} {"train_loss": -5.258371829986572, "global_step": 23773, "epoch": 566} {"train_loss": -5.2784576416015625, "global_step": 23774, "epoch": 566} {"train_loss": -5.312410831451416, "global_step": 23775, "epoch": 566} {"train_loss": -5.32418155670166, "global_step": 23776, "epoch": 566} {"train_loss": -5.1678547859191895, "global_step": 23777, "epoch": 566} {"train_loss": -5.383857250213623, "global_step": 23778, "epoch": 566} {"train_loss": -5.330265045166016, "global_step": 23779, "epoch": 566} {"train_loss": -5.309206962585449, "global_step": 23780, "epoch": 566} {"train_loss": -5.427263259887695, "global_step": 23781, "epoch": 566} {"train_loss": -5.368484020233154, "global_step": 23782, "epoch": 566} {"train_loss": -5.364335536956787, "global_step": 23783, "epoch": 566} {"train_loss": -5.353569984436035, "global_step": 23784, "epoch": 566} {"train_loss": -5.374715805053711, "global_step": 23785, "epoch": 566} {"train_loss": -5.293249130249023, "global_step": 23786, "epoch": 566} {"train_loss": -5.457435607910156, "global_step": 23787, "epoch": 566} {"train_loss": -5.3040771484375, "global_step": 23788, "epoch": 566} {"train_loss": -5.348768711090088, "global_step": 23789, "epoch": 566} {"train_loss": -5.3008246421813965, "global_step": 23790, "epoch": 566} {"train_loss": -5.3937458992004395, "global_step": 23791, "epoch": 566} {"train_loss": -5.479694366455078, "global_step": 23792, "epoch": 566} {"train_loss": -5.40652322769165, "global_step": 23793, "epoch": 566} {"train_loss": -5.3882365226745605, "global_step": 23794, "epoch": 566} {"train_loss": -5.220893383026123, "global_step": 23795, "epoch": 566} {"train_loss": -5.492916107177734, "global_step": 23796, "epoch": 566} {"train_loss": -5.3490118980407715, "global_step": 23797, "epoch": 566} {"train_loss": -5.3546247482299805, "global_step": 23798, "epoch": 566} {"train_loss": -5.340461730957031, "global_step": 23799, "epoch": 566} {"train_loss": -5.386393070220947, "global_step": 23800, "epoch": 566} {"train_loss": -5.401364803314209, "global_step": 23801, "epoch": 566} {"train_loss": -5.369356632232666, "global_step": 23802, "epoch": 566} {"train_loss": -5.42303991317749, "global_step": 23803, "epoch": 566} {"train_loss": -5.261509895324707, "global_step": 23804, "epoch": 566} {"train_loss": -5.271739959716797, "global_step": 23805, "epoch": 566} {"train_loss": -5.313806533813477, "global_step": 23806, "epoch": 566} {"train_loss": -5.426382064819336, "global_step": 23807, "epoch": 566} {"train_loss": -5.277722358703613, "global_step": 23808, "epoch": 566} {"train_loss": -5.392666816711426, "global_step": 23809, "epoch": 566} {"train_loss": -5.373639106750488, "global_step": 23810, "epoch": 566} {"train_loss": -5.277920722961426, "global_step": 23811, "epoch": 566} {"train_loss": -5.233347415924072, "global_step": 23812, "epoch": 566} {"train_loss": -5.344011329469227, "global_step": 23813, "epoch": 566, "val_loss": 76189.4921875} {"train_loss": -5.17421817779541, "global_step": 23814, "epoch": 567} {"train_loss": -5.367642402648926, "global_step": 23815, "epoch": 567} {"train_loss": -5.297723770141602, "global_step": 23816, "epoch": 567} {"train_loss": -5.388184547424316, "global_step": 23817, "epoch": 567} {"train_loss": -5.431207656860352, "global_step": 23818, "epoch": 567} {"train_loss": -5.3209381103515625, "global_step": 23819, "epoch": 567} {"train_loss": -5.284781455993652, "global_step": 23820, "epoch": 567} {"train_loss": -5.415991306304932, "global_step": 23821, "epoch": 567} {"train_loss": -5.449975490570068, "global_step": 23822, "epoch": 567} {"train_loss": -5.410245895385742, "global_step": 23823, "epoch": 567} {"train_loss": -5.41947078704834, "global_step": 23824, "epoch": 567} {"train_loss": -5.47686767578125, "global_step": 23825, "epoch": 567} {"train_loss": -5.418092727661133, "global_step": 23826, "epoch": 567} {"train_loss": -5.308836936950684, "global_step": 23827, "epoch": 567} {"train_loss": -5.390378475189209, "global_step": 23828, "epoch": 567} {"train_loss": -5.368686676025391, "global_step": 23829, "epoch": 567} {"train_loss": -5.472897052764893, "global_step": 23830, "epoch": 567} {"train_loss": -5.2687859535217285, "global_step": 23831, "epoch": 567} {"train_loss": -5.474722862243652, "global_step": 23832, "epoch": 567} {"train_loss": -5.407814025878906, "global_step": 23833, "epoch": 567} {"train_loss": -5.361270904541016, "global_step": 23834, "epoch": 567} {"train_loss": -5.280940055847168, "global_step": 23835, "epoch": 567} {"train_loss": -5.347858428955078, "global_step": 23836, "epoch": 567} {"train_loss": -5.3031463623046875, "global_step": 23837, "epoch": 567} {"train_loss": -5.414162635803223, "global_step": 23838, "epoch": 567} {"train_loss": -5.383581161499023, "global_step": 23839, "epoch": 567} {"train_loss": -5.141451835632324, "global_step": 23840, "epoch": 567} {"train_loss": -5.403500080108643, "global_step": 23841, "epoch": 567} {"train_loss": -5.43064022064209, "global_step": 23842, "epoch": 567} {"train_loss": -5.412525177001953, "global_step": 23843, "epoch": 567} {"train_loss": -5.363116264343262, "global_step": 23844, "epoch": 567} {"train_loss": -5.411762237548828, "global_step": 23845, "epoch": 567} {"train_loss": -5.405814170837402, "global_step": 23846, "epoch": 567} {"train_loss": -5.3845534324646, "global_step": 23847, "epoch": 567} {"train_loss": -5.306577205657959, "global_step": 23848, "epoch": 567} {"train_loss": -5.3286590576171875, "global_step": 23849, "epoch": 567} {"train_loss": -5.358969688415527, "global_step": 23850, "epoch": 567} {"train_loss": -5.469642639160156, "global_step": 23851, "epoch": 567} {"train_loss": -5.342226028442383, "global_step": 23852, "epoch": 567} {"train_loss": -5.434738636016846, "global_step": 23853, "epoch": 567} {"train_loss": -5.518954753875732, "global_step": 23854, "epoch": 567} {"train_loss": -5.372215157463437, "global_step": 23855, "epoch": 567, "val_loss": 75683.3046875} {"train_loss": -5.422430038452148, "global_step": 23856, "epoch": 568} {"train_loss": -5.383798122406006, "global_step": 23857, "epoch": 568} {"train_loss": -5.484963417053223, "global_step": 23858, "epoch": 568} {"train_loss": -5.494422435760498, "global_step": 23859, "epoch": 568} {"train_loss": -5.480402946472168, "global_step": 23860, "epoch": 568} {"train_loss": -5.314317226409912, "global_step": 23861, "epoch": 568} {"train_loss": -5.455753326416016, "global_step": 23862, "epoch": 568} {"train_loss": -5.4372758865356445, "global_step": 23863, "epoch": 568} {"train_loss": -5.5212578773498535, "global_step": 23864, "epoch": 568} {"train_loss": -5.363292217254639, "global_step": 23865, "epoch": 568} {"train_loss": -5.308751583099365, "global_step": 23866, "epoch": 568} {"train_loss": -5.513669967651367, "global_step": 23867, "epoch": 568} {"train_loss": -5.429492950439453, "global_step": 23868, "epoch": 568} {"train_loss": -5.206658363342285, "global_step": 23869, "epoch": 568} {"train_loss": -5.4587225914001465, "global_step": 23870, "epoch": 568} {"train_loss": -5.521183013916016, "global_step": 23871, "epoch": 568} {"train_loss": -5.321987152099609, "global_step": 23872, "epoch": 568} {"train_loss": -5.532096862792969, "global_step": 23873, "epoch": 568} {"train_loss": -5.397631645202637, "global_step": 23874, "epoch": 568} {"train_loss": -5.414968490600586, "global_step": 23875, "epoch": 568} {"train_loss": -5.332527160644531, "global_step": 23876, "epoch": 568} {"train_loss": -5.334500312805176, "global_step": 23877, "epoch": 568} {"train_loss": -5.332976341247559, "global_step": 23878, "epoch": 568} {"train_loss": -5.487532615661621, "global_step": 23879, "epoch": 568} {"train_loss": -5.273002624511719, "global_step": 23880, "epoch": 568} {"train_loss": -5.26615047454834, "global_step": 23881, "epoch": 568} {"train_loss": -5.2725725173950195, "global_step": 23882, "epoch": 568} {"train_loss": -5.403329849243164, "global_step": 23883, "epoch": 568} {"train_loss": -5.188796043395996, "global_step": 23884, "epoch": 568} {"train_loss": -5.351617813110352, "global_step": 23885, "epoch": 568} {"train_loss": -5.440359115600586, "global_step": 23886, "epoch": 568} {"train_loss": -5.25383186340332, "global_step": 23887, "epoch": 568} {"train_loss": -5.204996109008789, "global_step": 23888, "epoch": 568} {"train_loss": -5.439662456512451, "global_step": 23889, "epoch": 568} {"train_loss": -5.351387023925781, "global_step": 23890, "epoch": 568} {"train_loss": -5.240978717803955, "global_step": 23891, "epoch": 568} {"train_loss": -5.474430084228516, "global_step": 23892, "epoch": 568} {"train_loss": -5.298547744750977, "global_step": 23893, "epoch": 568} {"train_loss": -5.429272651672363, "global_step": 23894, "epoch": 568} {"train_loss": -5.327370643615723, "global_step": 23895, "epoch": 568} {"train_loss": -5.44834566116333, "global_step": 23896, "epoch": 568} {"train_loss": -5.377233936673119, "global_step": 23897, "epoch": 568, "val_loss": 76455.2734375} {"train_loss": -5.358691215515137, "global_step": 23898, "epoch": 569} {"train_loss": -5.40727424621582, "global_step": 23899, "epoch": 569} {"train_loss": -5.512962818145752, "global_step": 23900, "epoch": 569} {"train_loss": -5.445075035095215, "global_step": 23901, "epoch": 569} {"train_loss": -5.3322601318359375, "global_step": 23902, "epoch": 569} {"train_loss": -5.415881156921387, "global_step": 23903, "epoch": 569} {"train_loss": -5.3164777755737305, "global_step": 23904, "epoch": 569} {"train_loss": -5.374204158782959, "global_step": 23905, "epoch": 569} {"train_loss": -5.419270992279053, "global_step": 23906, "epoch": 569} {"train_loss": -5.429220676422119, "global_step": 23907, "epoch": 569} {"train_loss": -5.488461494445801, "global_step": 23908, "epoch": 569} {"train_loss": -5.210915565490723, "global_step": 23909, "epoch": 569} {"train_loss": -5.242018699645996, "global_step": 23910, "epoch": 569} {"train_loss": -5.329977989196777, "global_step": 23911, "epoch": 569} {"train_loss": -5.2892746925354, "global_step": 23912, "epoch": 569} {"train_loss": -5.243664741516113, "global_step": 23913, "epoch": 569} {"train_loss": -5.362370491027832, "global_step": 23914, "epoch": 569} {"train_loss": -5.35600471496582, "global_step": 23915, "epoch": 569} {"train_loss": -5.298837661743164, "global_step": 23916, "epoch": 569} {"train_loss": -5.285706996917725, "global_step": 23917, "epoch": 569} {"train_loss": -5.3257856369018555, "global_step": 23918, "epoch": 569} {"train_loss": -5.341152191162109, "global_step": 23919, "epoch": 569} {"train_loss": -5.380352973937988, "global_step": 23920, "epoch": 569} {"train_loss": -5.343883037567139, "global_step": 23921, "epoch": 569} {"train_loss": -5.391927242279053, "global_step": 23922, "epoch": 569} {"train_loss": -5.3884406089782715, "global_step": 23923, "epoch": 569} {"train_loss": -5.235542297363281, "global_step": 23924, "epoch": 569} {"train_loss": -5.340754985809326, "global_step": 23925, "epoch": 569} {"train_loss": -5.347932815551758, "global_step": 23926, "epoch": 569} {"train_loss": -5.24359655380249, "global_step": 23927, "epoch": 569} {"train_loss": -5.472637176513672, "global_step": 23928, "epoch": 569} {"train_loss": -5.34596061706543, "global_step": 23929, "epoch": 569} {"train_loss": -5.39440393447876, "global_step": 23930, "epoch": 569} {"train_loss": -5.440402984619141, "global_step": 23931, "epoch": 569} {"train_loss": -5.255321025848389, "global_step": 23932, "epoch": 569} {"train_loss": -5.324525833129883, "global_step": 23933, "epoch": 569} {"train_loss": -5.310535430908203, "global_step": 23934, "epoch": 569} {"train_loss": -5.38751220703125, "global_step": 23935, "epoch": 569} {"train_loss": -5.35575008392334, "global_step": 23936, "epoch": 569} {"train_loss": -5.2470703125, "global_step": 23937, "epoch": 569} {"train_loss": -5.322858810424805, "global_step": 23938, "epoch": 569} {"train_loss": -5.347529388609386, "global_step": 23939, "epoch": 569, "val_loss": 76705.1796875} {"train_loss": -5.232692241668701, "global_step": 23940, "epoch": 570} {"train_loss": -5.295755386352539, "global_step": 23941, "epoch": 570} {"train_loss": -5.4655866622924805, "global_step": 23942, "epoch": 570} {"train_loss": -5.461231231689453, "global_step": 23943, "epoch": 570} {"train_loss": -5.366994857788086, "global_step": 23944, "epoch": 570} {"train_loss": -5.317042350769043, "global_step": 23945, "epoch": 570} {"train_loss": -5.331436634063721, "global_step": 23946, "epoch": 570} {"train_loss": -5.3186845779418945, "global_step": 23947, "epoch": 570} {"train_loss": -5.34719705581665, "global_step": 23948, "epoch": 570} {"train_loss": -5.306633472442627, "global_step": 23949, "epoch": 570} {"train_loss": -5.412880897521973, "global_step": 23950, "epoch": 570} {"train_loss": -5.333929061889648, "global_step": 23951, "epoch": 570} {"train_loss": -5.300778388977051, "global_step": 23952, "epoch": 570} {"train_loss": -5.329037666320801, "global_step": 23953, "epoch": 570} {"train_loss": -5.339521408081055, "global_step": 23954, "epoch": 570} {"train_loss": -5.371180534362793, "global_step": 23955, "epoch": 570} {"train_loss": -5.3995819091796875, "global_step": 23956, "epoch": 570} {"train_loss": -5.195866107940674, "global_step": 23957, "epoch": 570} {"train_loss": -5.321137428283691, "global_step": 23958, "epoch": 570} {"train_loss": -5.4739789962768555, "global_step": 23959, "epoch": 570} {"train_loss": -5.33613395690918, "global_step": 23960, "epoch": 570} {"train_loss": -5.354666233062744, "global_step": 23961, "epoch": 570} {"train_loss": -5.328514099121094, "global_step": 23962, "epoch": 570} {"train_loss": -5.317663192749023, "global_step": 23963, "epoch": 570} {"train_loss": -5.397375106811523, "global_step": 23964, "epoch": 570} {"train_loss": -5.3483123779296875, "global_step": 23965, "epoch": 570} {"train_loss": -5.290667533874512, "global_step": 23966, "epoch": 570} {"train_loss": -5.336221218109131, "global_step": 23967, "epoch": 570} {"train_loss": -5.344680309295654, "global_step": 23968, "epoch": 570} {"train_loss": -5.270944595336914, "global_step": 23969, "epoch": 570} {"train_loss": -5.276276588439941, "global_step": 23970, "epoch": 570} {"train_loss": -5.416595935821533, "global_step": 23971, "epoch": 570} {"train_loss": -5.317146301269531, "global_step": 23972, "epoch": 570} {"train_loss": -5.27846097946167, "global_step": 23973, "epoch": 570} {"train_loss": -5.461369514465332, "global_step": 23974, "epoch": 570} {"train_loss": -5.2782793045043945, "global_step": 23975, "epoch": 570} {"train_loss": -5.3322577476501465, "global_step": 23976, "epoch": 570} {"train_loss": -5.245838165283203, "global_step": 23977, "epoch": 570} {"train_loss": -5.463515281677246, "global_step": 23978, "epoch": 570} {"train_loss": -5.379486083984375, "global_step": 23979, "epoch": 570} {"train_loss": -5.278408050537109, "global_step": 23980, "epoch": 570} {"train_loss": -5.341445832025437, "global_step": 23981, "epoch": 570, "val_loss": 76093.5859375} {"train_loss": -5.257762432098389, "global_step": 23982, "epoch": 571} {"train_loss": -5.312155723571777, "global_step": 23983, "epoch": 571} {"train_loss": -5.343860149383545, "global_step": 23984, "epoch": 571} {"train_loss": -5.415593147277832, "global_step": 23985, "epoch": 571} {"train_loss": -5.355685234069824, "global_step": 23986, "epoch": 571} {"train_loss": -5.374810218811035, "global_step": 23987, "epoch": 571} {"train_loss": -5.352507591247559, "global_step": 23988, "epoch": 571} {"train_loss": -5.3964385986328125, "global_step": 23989, "epoch": 571} {"train_loss": -5.408199310302734, "global_step": 23990, "epoch": 571} {"train_loss": -5.289186477661133, "global_step": 23991, "epoch": 571} {"train_loss": -5.411725044250488, "global_step": 23992, "epoch": 571} {"train_loss": -5.445038318634033, "global_step": 23993, "epoch": 571} {"train_loss": -5.418066024780273, "global_step": 23994, "epoch": 571} {"train_loss": -5.366278171539307, "global_step": 23995, "epoch": 571} {"train_loss": -5.362998962402344, "global_step": 23996, "epoch": 571} {"train_loss": -5.3105316162109375, "global_step": 23997, "epoch": 571} {"train_loss": -5.372382640838623, "global_step": 23998, "epoch": 571} {"train_loss": -5.385117530822754, "global_step": 23999, "epoch": 571} {"train_loss": -5.343677520751953, "global_step": 24000, "epoch": 571} {"train_loss": -5.436470031738281, "global_step": 24001, "epoch": 571} {"train_loss": -5.4303436279296875, "global_step": 24002, "epoch": 571} {"train_loss": -5.332208633422852, "global_step": 24003, "epoch": 571} {"train_loss": -5.277702331542969, "global_step": 24004, "epoch": 571} {"train_loss": -5.398353099822998, "global_step": 24005, "epoch": 571} {"train_loss": -5.555692195892334, "global_step": 24006, "epoch": 571} {"train_loss": -5.282084941864014, "global_step": 24007, "epoch": 571} {"train_loss": -5.392395973205566, "global_step": 24008, "epoch": 571} {"train_loss": -5.362868785858154, "global_step": 24009, "epoch": 571} {"train_loss": -5.370757102966309, "global_step": 24010, "epoch": 571} {"train_loss": -5.331932544708252, "global_step": 24011, "epoch": 571} {"train_loss": -5.402742385864258, "global_step": 24012, "epoch": 571} {"train_loss": -5.312131404876709, "global_step": 24013, "epoch": 571} {"train_loss": -5.203502655029297, "global_step": 24014, "epoch": 571} {"train_loss": -5.351188659667969, "global_step": 24015, "epoch": 571} {"train_loss": -5.457524299621582, "global_step": 24016, "epoch": 571} {"train_loss": -5.382697105407715, "global_step": 24017, "epoch": 571} {"train_loss": -5.350584983825684, "global_step": 24018, "epoch": 571} {"train_loss": -5.302342414855957, "global_step": 24019, "epoch": 571} {"train_loss": -5.428070068359375, "global_step": 24020, "epoch": 571} {"train_loss": -5.412649154663086, "global_step": 24021, "epoch": 571} {"train_loss": -5.327288627624512, "global_step": 24022, "epoch": 571} {"train_loss": -5.365702436083839, "global_step": 24023, "epoch": 571, "val_loss": 76353.375} {"train_loss": -5.389317035675049, "global_step": 24024, "epoch": 572} {"train_loss": -5.328325271606445, "global_step": 24025, "epoch": 572} {"train_loss": -5.399318695068359, "global_step": 24026, "epoch": 572} {"train_loss": -5.31309175491333, "global_step": 24027, "epoch": 572} {"train_loss": -5.420105934143066, "global_step": 24028, "epoch": 572} {"train_loss": -5.36201286315918, "global_step": 24029, "epoch": 572} {"train_loss": -5.331778526306152, "global_step": 24030, "epoch": 572} {"train_loss": -5.300371170043945, "global_step": 24031, "epoch": 572} {"train_loss": -5.299632549285889, "global_step": 24032, "epoch": 572} {"train_loss": -5.275544166564941, "global_step": 24033, "epoch": 572} {"train_loss": -5.2313690185546875, "global_step": 24034, "epoch": 572} {"train_loss": -5.354790210723877, "global_step": 24035, "epoch": 572} {"train_loss": -5.351841449737549, "global_step": 24036, "epoch": 572} {"train_loss": -5.293749809265137, "global_step": 24037, "epoch": 572} {"train_loss": -5.3305745124816895, "global_step": 24038, "epoch": 572} {"train_loss": -5.325372695922852, "global_step": 24039, "epoch": 572} {"train_loss": -5.312408924102783, "global_step": 24040, "epoch": 572} {"train_loss": -5.393287658691406, "global_step": 24041, "epoch": 572} {"train_loss": -5.443263053894043, "global_step": 24042, "epoch": 572} {"train_loss": -5.253603458404541, "global_step": 24043, "epoch": 572} {"train_loss": -5.29887580871582, "global_step": 24044, "epoch": 572} {"train_loss": -5.419605731964111, "global_step": 24045, "epoch": 572} {"train_loss": -5.512451171875, "global_step": 24046, "epoch": 572} {"train_loss": -5.402366638183594, "global_step": 24047, "epoch": 572} {"train_loss": -5.336853981018066, "global_step": 24048, "epoch": 572} {"train_loss": -5.479499816894531, "global_step": 24049, "epoch": 572} {"train_loss": -5.264939308166504, "global_step": 24050, "epoch": 572} {"train_loss": -5.399331092834473, "global_step": 24051, "epoch": 572} {"train_loss": -5.352384567260742, "global_step": 24052, "epoch": 572} {"train_loss": -5.297983646392822, "global_step": 24053, "epoch": 572} {"train_loss": -5.32655143737793, "global_step": 24054, "epoch": 572} {"train_loss": -5.392073154449463, "global_step": 24055, "epoch": 572} {"train_loss": -5.257016181945801, "global_step": 24056, "epoch": 572} {"train_loss": -5.314801216125488, "global_step": 24057, "epoch": 572} {"train_loss": -5.2100324630737305, "global_step": 24058, "epoch": 572} {"train_loss": -5.407886505126953, "global_step": 24059, "epoch": 572} {"train_loss": -5.159013748168945, "global_step": 24060, "epoch": 572} {"train_loss": -5.240206718444824, "global_step": 24061, "epoch": 572} {"train_loss": -5.329954624176025, "global_step": 24062, "epoch": 572} {"train_loss": -5.3907694816589355, "global_step": 24063, "epoch": 572} {"train_loss": -5.272896766662598, "global_step": 24064, "epoch": 572} {"train_loss": -5.335381235395159, "global_step": 24065, "epoch": 572, "val_loss": 76132.46875} {"train_loss": -5.394814968109131, "global_step": 24066, "epoch": 573} {"train_loss": -5.200699806213379, "global_step": 24067, "epoch": 573} {"train_loss": -5.392279624938965, "global_step": 24068, "epoch": 573} {"train_loss": -5.3694658279418945, "global_step": 24069, "epoch": 573} {"train_loss": -5.3768110275268555, "global_step": 24070, "epoch": 573} {"train_loss": -5.233341217041016, "global_step": 24071, "epoch": 573} {"train_loss": -5.4143218994140625, "global_step": 24072, "epoch": 573} {"train_loss": -5.3486833572387695, "global_step": 24073, "epoch": 573} {"train_loss": -5.513978004455566, "global_step": 24074, "epoch": 573} {"train_loss": -5.313693046569824, "global_step": 24075, "epoch": 573} {"train_loss": -5.29852294921875, "global_step": 24076, "epoch": 573} {"train_loss": -5.308437347412109, "global_step": 24077, "epoch": 573} {"train_loss": -5.374236583709717, "global_step": 24078, "epoch": 573} {"train_loss": -5.345331192016602, "global_step": 24079, "epoch": 573} {"train_loss": -5.3563232421875, "global_step": 24080, "epoch": 573} {"train_loss": -5.358550071716309, "global_step": 24081, "epoch": 573} {"train_loss": -5.505607604980469, "global_step": 24082, "epoch": 573} {"train_loss": -5.351230144500732, "global_step": 24083, "epoch": 573} {"train_loss": -5.416195869445801, "global_step": 24084, "epoch": 573} {"train_loss": -5.521143913269043, "global_step": 24085, "epoch": 573} {"train_loss": -5.422183036804199, "global_step": 24086, "epoch": 573} {"train_loss": -5.421784400939941, "global_step": 24087, "epoch": 573} {"train_loss": -5.422446250915527, "global_step": 24088, "epoch": 573} {"train_loss": -5.343208312988281, "global_step": 24089, "epoch": 573} {"train_loss": -5.169094562530518, "global_step": 24090, "epoch": 573} {"train_loss": -5.380964756011963, "global_step": 24091, "epoch": 573} {"train_loss": -5.430747985839844, "global_step": 24092, "epoch": 573} {"train_loss": -5.387218952178955, "global_step": 24093, "epoch": 573} {"train_loss": -5.300354480743408, "global_step": 24094, "epoch": 573} {"train_loss": -5.305501937866211, "global_step": 24095, "epoch": 573} {"train_loss": -5.346155643463135, "global_step": 24096, "epoch": 573} {"train_loss": -5.4538469314575195, "global_step": 24097, "epoch": 573} {"train_loss": -5.46291446685791, "global_step": 24098, "epoch": 573} {"train_loss": -5.379661560058594, "global_step": 24099, "epoch": 573} {"train_loss": -5.357051372528076, "global_step": 24100, "epoch": 573} {"train_loss": -5.413442611694336, "global_step": 24101, "epoch": 573} {"train_loss": -5.314835071563721, "global_step": 24102, "epoch": 573} {"train_loss": -5.359897613525391, "global_step": 24103, "epoch": 573} {"train_loss": -5.410408973693848, "global_step": 24104, "epoch": 573} {"train_loss": -5.361536026000977, "global_step": 24105, "epoch": 573} {"train_loss": -5.297032833099365, "global_step": 24106, "epoch": 573} {"train_loss": -5.370611781165714, "global_step": 24107, "epoch": 573, "val_loss": 76268.6875} {"train_loss": -5.4159088134765625, "global_step": 24108, "epoch": 574} {"train_loss": -5.473938941955566, "global_step": 24109, "epoch": 574} {"train_loss": -5.357673168182373, "global_step": 24110, "epoch": 574} {"train_loss": -5.381558418273926, "global_step": 24111, "epoch": 574} {"train_loss": -5.518239498138428, "global_step": 24112, "epoch": 574} {"train_loss": -5.409841537475586, "global_step": 24113, "epoch": 574} {"train_loss": -5.26686429977417, "global_step": 24114, "epoch": 574} {"train_loss": -5.53738260269165, "global_step": 24115, "epoch": 574} {"train_loss": -5.336261749267578, "global_step": 24116, "epoch": 574} {"train_loss": -5.192679405212402, "global_step": 24117, "epoch": 574} {"train_loss": -5.3442230224609375, "global_step": 24118, "epoch": 574} {"train_loss": -5.190059185028076, "global_step": 24119, "epoch": 574} {"train_loss": -5.407631874084473, "global_step": 24120, "epoch": 574} {"train_loss": -5.47379207611084, "global_step": 24121, "epoch": 574} {"train_loss": -5.316023349761963, "global_step": 24122, "epoch": 574} {"train_loss": -5.388393402099609, "global_step": 24123, "epoch": 574} {"train_loss": -5.367364883422852, "global_step": 24124, "epoch": 574} {"train_loss": -5.334425449371338, "global_step": 24125, "epoch": 574} {"train_loss": -5.428125858306885, "global_step": 24126, "epoch": 574} {"train_loss": -5.397172927856445, "global_step": 24127, "epoch": 574} {"train_loss": -5.311267852783203, "global_step": 24128, "epoch": 574} {"train_loss": -5.371889114379883, "global_step": 24129, "epoch": 574} {"train_loss": -5.332476615905762, "global_step": 24130, "epoch": 574} {"train_loss": -5.490911483764648, "global_step": 24131, "epoch": 574} {"train_loss": -5.226789474487305, "global_step": 24132, "epoch": 574} {"train_loss": -5.336938381195068, "global_step": 24133, "epoch": 574} {"train_loss": -5.183104515075684, "global_step": 24134, "epoch": 574} {"train_loss": -5.368070602416992, "global_step": 24135, "epoch": 574} {"train_loss": -5.311234474182129, "global_step": 24136, "epoch": 574} {"train_loss": -5.222787857055664, "global_step": 24137, "epoch": 574} {"train_loss": -5.336315155029297, "global_step": 24138, "epoch": 574} {"train_loss": -5.360251426696777, "global_step": 24139, "epoch": 574} {"train_loss": -5.255475044250488, "global_step": 24140, "epoch": 574} {"train_loss": -5.443483352661133, "global_step": 24141, "epoch": 574} {"train_loss": -5.458105564117432, "global_step": 24142, "epoch": 574} {"train_loss": -5.386660099029541, "global_step": 24143, "epoch": 574} {"train_loss": -5.347388744354248, "global_step": 24144, "epoch": 574} {"train_loss": -5.320695400238037, "global_step": 24145, "epoch": 574} {"train_loss": -5.416609764099121, "global_step": 24146, "epoch": 574} {"train_loss": -5.470088958740234, "global_step": 24147, "epoch": 574} {"train_loss": -5.3634748458862305, "global_step": 24148, "epoch": 574} {"train_loss": -5.361110335304623, "global_step": 24149, "epoch": 574, "val_loss": 76347.609375} {"train_loss": -5.4009904861450195, "global_step": 24150, "epoch": 575} {"train_loss": -5.326257705688477, "global_step": 24151, "epoch": 575} {"train_loss": -5.462649822235107, "global_step": 24152, "epoch": 575} {"train_loss": -5.330291748046875, "global_step": 24153, "epoch": 575} {"train_loss": -5.307652473449707, "global_step": 24154, "epoch": 575} {"train_loss": -5.216373443603516, "global_step": 24155, "epoch": 575} {"train_loss": -5.372339725494385, "global_step": 24156, "epoch": 575} {"train_loss": -5.317306041717529, "global_step": 24157, "epoch": 575} {"train_loss": -5.432199001312256, "global_step": 24158, "epoch": 575} {"train_loss": -5.4347615242004395, "global_step": 24159, "epoch": 575} {"train_loss": -5.231839179992676, "global_step": 24160, "epoch": 575} {"train_loss": -5.354050636291504, "global_step": 24161, "epoch": 575} {"train_loss": -5.406710624694824, "global_step": 24162, "epoch": 575} {"train_loss": -5.315959453582764, "global_step": 24163, "epoch": 575} {"train_loss": -5.215582847595215, "global_step": 24164, "epoch": 575} {"train_loss": -5.460701942443848, "global_step": 24165, "epoch": 575} {"train_loss": -5.381173133850098, "global_step": 24166, "epoch": 575} {"train_loss": -5.346219062805176, "global_step": 24167, "epoch": 575} {"train_loss": -5.46113395690918, "global_step": 24168, "epoch": 575} {"train_loss": -5.366467475891113, "global_step": 24169, "epoch": 575} {"train_loss": -5.407660484313965, "global_step": 24170, "epoch": 575} {"train_loss": -5.154314041137695, "global_step": 24171, "epoch": 575} {"train_loss": -5.2909393310546875, "global_step": 24172, "epoch": 575} {"train_loss": -5.476297378540039, "global_step": 24173, "epoch": 575} {"train_loss": -5.343584060668945, "global_step": 24174, "epoch": 575} {"train_loss": -5.255239486694336, "global_step": 24175, "epoch": 575} {"train_loss": -5.276544570922852, "global_step": 24176, "epoch": 575} {"train_loss": -5.253286838531494, "global_step": 24177, "epoch": 575} {"train_loss": -5.302536964416504, "global_step": 24178, "epoch": 575} {"train_loss": -5.38700008392334, "global_step": 24179, "epoch": 575} {"train_loss": -5.220747947692871, "global_step": 24180, "epoch": 575} {"train_loss": -5.4332075119018555, "global_step": 24181, "epoch": 575} {"train_loss": -5.282047271728516, "global_step": 24182, "epoch": 575} {"train_loss": -5.431880474090576, "global_step": 24183, "epoch": 575} {"train_loss": -5.295136451721191, "global_step": 24184, "epoch": 575} {"train_loss": -5.426459789276123, "global_step": 24185, "epoch": 575} {"train_loss": -5.419035911560059, "global_step": 24186, "epoch": 575} {"train_loss": -5.217182159423828, "global_step": 24187, "epoch": 575} {"train_loss": -5.259101867675781, "global_step": 24188, "epoch": 575} {"train_loss": -5.409366607666016, "global_step": 24189, "epoch": 575} {"train_loss": -5.351988792419434, "global_step": 24190, "epoch": 575} {"train_loss": -5.341436147689819, "global_step": 24191, "epoch": 575, "val_loss": 77130.0625} {"train_loss": -5.234984397888184, "global_step": 24192, "epoch": 576} {"train_loss": -5.442337989807129, "global_step": 24193, "epoch": 576} {"train_loss": -5.300379276275635, "global_step": 24194, "epoch": 576} {"train_loss": -5.383164405822754, "global_step": 24195, "epoch": 576} {"train_loss": -5.392812728881836, "global_step": 24196, "epoch": 576} {"train_loss": -5.327754020690918, "global_step": 24197, "epoch": 576} {"train_loss": -5.50351095199585, "global_step": 24198, "epoch": 576} {"train_loss": -5.323021411895752, "global_step": 24199, "epoch": 576} {"train_loss": -5.297669887542725, "global_step": 24200, "epoch": 576} {"train_loss": -5.274747371673584, "global_step": 24201, "epoch": 576} {"train_loss": -5.26269006729126, "global_step": 24202, "epoch": 576} {"train_loss": -5.1126790046691895, "global_step": 24203, "epoch": 576} {"train_loss": -5.400585651397705, "global_step": 24204, "epoch": 576} {"train_loss": -5.0952959060668945, "global_step": 24205, "epoch": 576} {"train_loss": -5.3416900634765625, "global_step": 24206, "epoch": 576} {"train_loss": -5.2950592041015625, "global_step": 24207, "epoch": 576} {"train_loss": -5.286046981811523, "global_step": 24208, "epoch": 576} {"train_loss": -5.427845478057861, "global_step": 24209, "epoch": 576} {"train_loss": -5.279763698577881, "global_step": 24210, "epoch": 576} {"train_loss": -5.299065113067627, "global_step": 24211, "epoch": 576} {"train_loss": -5.300023078918457, "global_step": 24212, "epoch": 576} {"train_loss": -5.312623977661133, "global_step": 24213, "epoch": 576} {"train_loss": -5.303448677062988, "global_step": 24214, "epoch": 576} {"train_loss": -5.362538814544678, "global_step": 24215, "epoch": 576} {"train_loss": -5.44119930267334, "global_step": 24216, "epoch": 576} {"train_loss": -5.425419807434082, "global_step": 24217, "epoch": 576} {"train_loss": -5.301326751708984, "global_step": 24218, "epoch": 576} {"train_loss": -5.374236583709717, "global_step": 24219, "epoch": 576} {"train_loss": -5.354301929473877, "global_step": 24220, "epoch": 576} {"train_loss": -5.30002498626709, "global_step": 24221, "epoch": 576} {"train_loss": -5.258142948150635, "global_step": 24222, "epoch": 576} {"train_loss": -5.316170692443848, "global_step": 24223, "epoch": 576} {"train_loss": -5.29722785949707, "global_step": 24224, "epoch": 576} {"train_loss": -5.434968948364258, "global_step": 24225, "epoch": 576} {"train_loss": -5.527235507965088, "global_step": 24226, "epoch": 576} {"train_loss": -5.268154144287109, "global_step": 24227, "epoch": 576} {"train_loss": -5.303257942199707, "global_step": 24228, "epoch": 576} {"train_loss": -5.4252471923828125, "global_step": 24229, "epoch": 576} {"train_loss": -5.398299217224121, "global_step": 24230, "epoch": 576} {"train_loss": -5.352851867675781, "global_step": 24231, "epoch": 576} {"train_loss": -5.424224853515625, "global_step": 24232, "epoch": 576} {"train_loss": -5.3338410173143656, "global_step": 24233, "epoch": 576, "val_loss": 76177.25} {"train_loss": -5.345768451690674, "global_step": 24234, "epoch": 577} {"train_loss": -5.342977523803711, "global_step": 24235, "epoch": 577} {"train_loss": -5.3731818199157715, "global_step": 24236, "epoch": 577} {"train_loss": -5.333502292633057, "global_step": 24237, "epoch": 577} {"train_loss": -5.239324569702148, "global_step": 24238, "epoch": 577} {"train_loss": -5.31235408782959, "global_step": 24239, "epoch": 577} {"train_loss": -5.3817830085754395, "global_step": 24240, "epoch": 577} {"train_loss": -5.20286226272583, "global_step": 24241, "epoch": 577} {"train_loss": -5.365179061889648, "global_step": 24242, "epoch": 577} {"train_loss": -5.245720863342285, "global_step": 24243, "epoch": 577} {"train_loss": -5.505275726318359, "global_step": 24244, "epoch": 577} {"train_loss": -5.337933540344238, "global_step": 24245, "epoch": 577} {"train_loss": -5.412407875061035, "global_step": 24246, "epoch": 577} {"train_loss": -5.535191535949707, "global_step": 24247, "epoch": 577} {"train_loss": -5.383586883544922, "global_step": 24248, "epoch": 577} {"train_loss": -5.501273155212402, "global_step": 24249, "epoch": 577} {"train_loss": -5.497585773468018, "global_step": 24250, "epoch": 577} {"train_loss": -5.355072021484375, "global_step": 24251, "epoch": 577} {"train_loss": -5.48643684387207, "global_step": 24252, "epoch": 577} {"train_loss": -5.348263740539551, "global_step": 24253, "epoch": 577} {"train_loss": -5.368307113647461, "global_step": 24254, "epoch": 577} {"train_loss": -5.487706184387207, "global_step": 24255, "epoch": 577} {"train_loss": -5.363211631774902, "global_step": 24256, "epoch": 577} {"train_loss": -5.445002555847168, "global_step": 24257, "epoch": 577} {"train_loss": -5.281796455383301, "global_step": 24258, "epoch": 577} {"train_loss": -5.36247444152832, "global_step": 24259, "epoch": 577} {"train_loss": -5.422356605529785, "global_step": 24260, "epoch": 577} {"train_loss": -5.422612190246582, "global_step": 24261, "epoch": 577} {"train_loss": -5.414080619812012, "global_step": 24262, "epoch": 577} {"train_loss": -5.414556503295898, "global_step": 24263, "epoch": 577} {"train_loss": -5.322112083435059, "global_step": 24264, "epoch": 577} {"train_loss": -5.436446189880371, "global_step": 24265, "epoch": 577} {"train_loss": -5.384791374206543, "global_step": 24266, "epoch": 577} {"train_loss": -5.2550554275512695, "global_step": 24267, "epoch": 577} {"train_loss": -5.28708028793335, "global_step": 24268, "epoch": 577} {"train_loss": -5.375942707061768, "global_step": 24269, "epoch": 577} {"train_loss": -5.543646335601807, "global_step": 24270, "epoch": 577} {"train_loss": -5.1490797996521, "global_step": 24271, "epoch": 577} {"train_loss": -5.439978122711182, "global_step": 24272, "epoch": 577} {"train_loss": -5.335878849029541, "global_step": 24273, "epoch": 577} {"train_loss": -5.355072021484375, "global_step": 24274, "epoch": 577} {"train_loss": -5.37526814142863, "global_step": 24275, "epoch": 577, "val_loss": 77243.21875} {"train_loss": -5.461909770965576, "global_step": 24276, "epoch": 578} {"train_loss": -5.300498008728027, "global_step": 24277, "epoch": 578} {"train_loss": -5.371211051940918, "global_step": 24278, "epoch": 578} {"train_loss": -5.4125237464904785, "global_step": 24279, "epoch": 578} {"train_loss": -5.410892486572266, "global_step": 24280, "epoch": 578} {"train_loss": -5.318728923797607, "global_step": 24281, "epoch": 578} {"train_loss": -5.388242721557617, "global_step": 24282, "epoch": 578} {"train_loss": -5.395823001861572, "global_step": 24283, "epoch": 578} {"train_loss": -5.468149185180664, "global_step": 24284, "epoch": 578} {"train_loss": -5.380904674530029, "global_step": 24285, "epoch": 578} {"train_loss": -5.321147918701172, "global_step": 24286, "epoch": 578} {"train_loss": -5.4185590744018555, "global_step": 24287, "epoch": 578} {"train_loss": -5.313867092132568, "global_step": 24288, "epoch": 578} {"train_loss": -5.396378993988037, "global_step": 24289, "epoch": 578} {"train_loss": -5.352964401245117, "global_step": 24290, "epoch": 578} {"train_loss": -5.379963397979736, "global_step": 24291, "epoch": 578} {"train_loss": -5.442221641540527, "global_step": 24292, "epoch": 578} {"train_loss": -5.479806900024414, "global_step": 24293, "epoch": 578} {"train_loss": -5.503864765167236, "global_step": 24294, "epoch": 578} {"train_loss": -5.476468563079834, "global_step": 24295, "epoch": 578} {"train_loss": -5.329225063323975, "global_step": 24296, "epoch": 578} {"train_loss": -5.356387615203857, "global_step": 24297, "epoch": 578} {"train_loss": -5.352322578430176, "global_step": 24298, "epoch": 578} {"train_loss": -5.378820419311523, "global_step": 24299, "epoch": 578} {"train_loss": -5.493575096130371, "global_step": 24300, "epoch": 578} {"train_loss": -5.375723838806152, "global_step": 24301, "epoch": 578} {"train_loss": -5.314146041870117, "global_step": 24302, "epoch": 578} {"train_loss": -5.371367454528809, "global_step": 24303, "epoch": 578} {"train_loss": -5.29842472076416, "global_step": 24304, "epoch": 578} {"train_loss": -5.405539512634277, "global_step": 24305, "epoch": 578} {"train_loss": -5.4299211502075195, "global_step": 24306, "epoch": 578} {"train_loss": -5.316958427429199, "global_step": 24307, "epoch": 578} {"train_loss": -5.345244884490967, "global_step": 24308, "epoch": 578} {"train_loss": -5.353442192077637, "global_step": 24309, "epoch": 578} {"train_loss": -5.388751029968262, "global_step": 24310, "epoch": 578} {"train_loss": -5.252232551574707, "global_step": 24311, "epoch": 578} {"train_loss": -5.398294448852539, "global_step": 24312, "epoch": 578} {"train_loss": -5.310155868530273, "global_step": 24313, "epoch": 578} {"train_loss": -5.322388172149658, "global_step": 24314, "epoch": 578} {"train_loss": -5.2696075439453125, "global_step": 24315, "epoch": 578} {"train_loss": -5.237709045410156, "global_step": 24316, "epoch": 578} {"train_loss": -5.371904554821196, "global_step": 24317, "epoch": 578, "val_loss": 76232.65625} {"train_loss": -5.256932258605957, "global_step": 24318, "epoch": 579} {"train_loss": -5.347595691680908, "global_step": 24319, "epoch": 579} {"train_loss": -5.375351428985596, "global_step": 24320, "epoch": 579} {"train_loss": -5.328897953033447, "global_step": 24321, "epoch": 579} {"train_loss": -5.412544250488281, "global_step": 24322, "epoch": 579} {"train_loss": -5.416469573974609, "global_step": 24323, "epoch": 579} {"train_loss": -5.2967071533203125, "global_step": 24324, "epoch": 579} {"train_loss": -5.361822605133057, "global_step": 24325, "epoch": 579} {"train_loss": -5.468411445617676, "global_step": 24326, "epoch": 579} {"train_loss": -5.226970195770264, "global_step": 24327, "epoch": 579} {"train_loss": -5.397355556488037, "global_step": 24328, "epoch": 579} {"train_loss": -5.436890602111816, "global_step": 24329, "epoch": 579} {"train_loss": -5.400740146636963, "global_step": 24330, "epoch": 579} {"train_loss": -5.457980632781982, "global_step": 24331, "epoch": 579} {"train_loss": -5.536661148071289, "global_step": 24332, "epoch": 579} {"train_loss": -5.290950298309326, "global_step": 24333, "epoch": 579} {"train_loss": -5.399904727935791, "global_step": 24334, "epoch": 579} {"train_loss": -5.382411956787109, "global_step": 24335, "epoch": 579} {"train_loss": -5.4767608642578125, "global_step": 24336, "epoch": 579} {"train_loss": -5.332225799560547, "global_step": 24337, "epoch": 579} {"train_loss": -5.547314643859863, "global_step": 24338, "epoch": 579} {"train_loss": -5.454858303070068, "global_step": 24339, "epoch": 579} {"train_loss": -5.32867956161499, "global_step": 24340, "epoch": 579} {"train_loss": -5.418544769287109, "global_step": 24341, "epoch": 579} {"train_loss": -5.316734313964844, "global_step": 24342, "epoch": 579} {"train_loss": -5.4107561111450195, "global_step": 24343, "epoch": 579} {"train_loss": -5.325357437133789, "global_step": 24344, "epoch": 579} {"train_loss": -5.363062858581543, "global_step": 24345, "epoch": 579} {"train_loss": -5.290383338928223, "global_step": 24346, "epoch": 579} {"train_loss": -5.26953125, "global_step": 24347, "epoch": 579} {"train_loss": -5.329037666320801, "global_step": 24348, "epoch": 579} {"train_loss": -5.484877109527588, "global_step": 24349, "epoch": 579} {"train_loss": -5.417732238769531, "global_step": 24350, "epoch": 579} {"train_loss": -5.3247175216674805, "global_step": 24351, "epoch": 579} {"train_loss": -5.394529342651367, "global_step": 24352, "epoch": 579} {"train_loss": -5.436841011047363, "global_step": 24353, "epoch": 579} {"train_loss": -5.403131484985352, "global_step": 24354, "epoch": 579} {"train_loss": -5.352603912353516, "global_step": 24355, "epoch": 579} {"train_loss": -5.272546768188477, "global_step": 24356, "epoch": 579} {"train_loss": -5.613516330718994, "global_step": 24357, "epoch": 579} {"train_loss": -5.3611226081848145, "global_step": 24358, "epoch": 579} {"train_loss": -5.381094251360212, "global_step": 24359, "epoch": 579, "val_loss": 76006.5078125} {"train_loss": -5.449699401855469, "global_step": 24360, "epoch": 580} {"train_loss": -5.486854553222656, "global_step": 24361, "epoch": 580} {"train_loss": -5.396980285644531, "global_step": 24362, "epoch": 580} {"train_loss": -5.39488410949707, "global_step": 24363, "epoch": 580} {"train_loss": -5.5360236167907715, "global_step": 24364, "epoch": 580} {"train_loss": -5.379964828491211, "global_step": 24365, "epoch": 580} {"train_loss": -5.3348002433776855, "global_step": 24366, "epoch": 580} {"train_loss": -5.434364318847656, "global_step": 24367, "epoch": 580} {"train_loss": -5.289536476135254, "global_step": 24368, "epoch": 580} {"train_loss": -5.28012228012085, "global_step": 24369, "epoch": 580} {"train_loss": -5.412960052490234, "global_step": 24370, "epoch": 580} {"train_loss": -5.3518877029418945, "global_step": 24371, "epoch": 580} {"train_loss": -5.145236015319824, "global_step": 24372, "epoch": 580} {"train_loss": -5.317968368530273, "global_step": 24373, "epoch": 580} {"train_loss": -5.343052864074707, "global_step": 24374, "epoch": 580} {"train_loss": -5.3206915855407715, "global_step": 24375, "epoch": 580} {"train_loss": -5.363811492919922, "global_step": 24376, "epoch": 580} {"train_loss": -5.341269016265869, "global_step": 24377, "epoch": 580} {"train_loss": -5.469533920288086, "global_step": 24378, "epoch": 580} {"train_loss": -5.2584638595581055, "global_step": 24379, "epoch": 580} {"train_loss": -5.245698928833008, "global_step": 24380, "epoch": 580} {"train_loss": -5.589689254760742, "global_step": 24381, "epoch": 580} {"train_loss": -5.432956218719482, "global_step": 24382, "epoch": 580} {"train_loss": -5.485439300537109, "global_step": 24383, "epoch": 580} {"train_loss": -5.33927583694458, "global_step": 24384, "epoch": 580} {"train_loss": -5.456815719604492, "global_step": 24385, "epoch": 580} {"train_loss": -5.325986385345459, "global_step": 24386, "epoch": 580} {"train_loss": -5.2513580322265625, "global_step": 24387, "epoch": 580} {"train_loss": -5.350586891174316, "global_step": 24388, "epoch": 580} {"train_loss": -5.363705635070801, "global_step": 24389, "epoch": 580} {"train_loss": -5.261594772338867, "global_step": 24390, "epoch": 580} {"train_loss": -5.450239181518555, "global_step": 24391, "epoch": 580} {"train_loss": -5.311718940734863, "global_step": 24392, "epoch": 580} {"train_loss": -5.402597427368164, "global_step": 24393, "epoch": 580} {"train_loss": -5.4545745849609375, "global_step": 24394, "epoch": 580} {"train_loss": -5.394021034240723, "global_step": 24395, "epoch": 580} {"train_loss": -5.352095603942871, "global_step": 24396, "epoch": 580} {"train_loss": -5.458431243896484, "global_step": 24397, "epoch": 580} {"train_loss": -5.278787612915039, "global_step": 24398, "epoch": 580} {"train_loss": -5.3423261642456055, "global_step": 24399, "epoch": 580} {"train_loss": -5.431553840637207, "global_step": 24400, "epoch": 580} {"train_loss": -5.372551441192627, "global_step": 24401, "epoch": 580, "val_loss": 76394.078125} {"train_loss": -5.499344825744629, "global_step": 24402, "epoch": 581} {"train_loss": -5.3652238845825195, "global_step": 24403, "epoch": 581} {"train_loss": -5.333321571350098, "global_step": 24404, "epoch": 581} {"train_loss": -5.37725830078125, "global_step": 24405, "epoch": 581} {"train_loss": -5.429529190063477, "global_step": 24406, "epoch": 581} {"train_loss": -5.351791858673096, "global_step": 24407, "epoch": 581} {"train_loss": -5.3486552238464355, "global_step": 24408, "epoch": 581} {"train_loss": -5.388677597045898, "global_step": 24409, "epoch": 581} {"train_loss": -5.3224897384643555, "global_step": 24410, "epoch": 581} {"train_loss": -5.420383453369141, "global_step": 24411, "epoch": 581} {"train_loss": -5.3579487800598145, "global_step": 24412, "epoch": 581} {"train_loss": -5.312660217285156, "global_step": 24413, "epoch": 581} {"train_loss": -5.344775199890137, "global_step": 24414, "epoch": 581} {"train_loss": -5.458627700805664, "global_step": 24415, "epoch": 581} {"train_loss": -5.3348894119262695, "global_step": 24416, "epoch": 581} {"train_loss": -5.522429466247559, "global_step": 24417, "epoch": 581} {"train_loss": -5.381410598754883, "global_step": 24418, "epoch": 581} {"train_loss": -5.410935401916504, "global_step": 24419, "epoch": 581} {"train_loss": -5.428350448608398, "global_step": 24420, "epoch": 581} {"train_loss": -5.3140668869018555, "global_step": 24421, "epoch": 581} {"train_loss": -5.44305419921875, "global_step": 24422, "epoch": 581} {"train_loss": -5.307322978973389, "global_step": 24423, "epoch": 581} {"train_loss": -5.343368053436279, "global_step": 24424, "epoch": 581} {"train_loss": -5.449832439422607, "global_step": 24425, "epoch": 581} {"train_loss": -5.381715774536133, "global_step": 24426, "epoch": 581} {"train_loss": -5.300144195556641, "global_step": 24427, "epoch": 581} {"train_loss": -5.381743431091309, "global_step": 24428, "epoch": 581} {"train_loss": -5.208171367645264, "global_step": 24429, "epoch": 581} {"train_loss": -5.453307151794434, "global_step": 24430, "epoch": 581} {"train_loss": -5.418055534362793, "global_step": 24431, "epoch": 581} {"train_loss": -5.340850830078125, "global_step": 24432, "epoch": 581} {"train_loss": -5.27908992767334, "global_step": 24433, "epoch": 581} {"train_loss": -5.280174255371094, "global_step": 24434, "epoch": 581} {"train_loss": -5.324276924133301, "global_step": 24435, "epoch": 581} {"train_loss": -5.437490463256836, "global_step": 24436, "epoch": 581} {"train_loss": -5.372522354125977, "global_step": 24437, "epoch": 581} {"train_loss": -5.354438304901123, "global_step": 24438, "epoch": 581} {"train_loss": -5.408989906311035, "global_step": 24439, "epoch": 581} {"train_loss": -5.411655902862549, "global_step": 24440, "epoch": 581} {"train_loss": -5.248075485229492, "global_step": 24441, "epoch": 581} {"train_loss": -5.397645473480225, "global_step": 24442, "epoch": 581} {"train_loss": -5.371819371268863, "global_step": 24443, "epoch": 581, "val_loss": 76037.7109375} {"train_loss": -5.37120246887207, "global_step": 24444, "epoch": 582} {"train_loss": -5.327322959899902, "global_step": 24445, "epoch": 582} {"train_loss": -5.582277774810791, "global_step": 24446, "epoch": 582} {"train_loss": -5.561841011047363, "global_step": 24447, "epoch": 582} {"train_loss": -5.333975791931152, "global_step": 24448, "epoch": 582} {"train_loss": -5.364989757537842, "global_step": 24449, "epoch": 582} {"train_loss": -5.362279415130615, "global_step": 24450, "epoch": 582} {"train_loss": -5.419571876525879, "global_step": 24451, "epoch": 582} {"train_loss": -5.347033500671387, "global_step": 24452, "epoch": 582} {"train_loss": -5.42902946472168, "global_step": 24453, "epoch": 582} {"train_loss": -5.356234550476074, "global_step": 24454, "epoch": 582} {"train_loss": -5.375246047973633, "global_step": 24455, "epoch": 582} {"train_loss": -5.348788261413574, "global_step": 24456, "epoch": 582} {"train_loss": -5.447509765625, "global_step": 24457, "epoch": 582} {"train_loss": -5.397444248199463, "global_step": 24458, "epoch": 582} {"train_loss": -5.368735313415527, "global_step": 24459, "epoch": 582} {"train_loss": -5.309263229370117, "global_step": 24460, "epoch": 582} {"train_loss": -5.3690595626831055, "global_step": 24461, "epoch": 582} {"train_loss": -5.3034892082214355, "global_step": 24462, "epoch": 582} {"train_loss": -5.3505449295043945, "global_step": 24463, "epoch": 582} {"train_loss": -5.314119338989258, "global_step": 24464, "epoch": 582} {"train_loss": -5.292507171630859, "global_step": 24465, "epoch": 582} {"train_loss": -5.493995666503906, "global_step": 24466, "epoch": 582} {"train_loss": -5.446722030639648, "global_step": 24467, "epoch": 582} {"train_loss": -5.303628921508789, "global_step": 24468, "epoch": 582} {"train_loss": -5.508645534515381, "global_step": 24469, "epoch": 582} {"train_loss": -5.4980340003967285, "global_step": 24470, "epoch": 582} {"train_loss": -5.362360954284668, "global_step": 24471, "epoch": 582} {"train_loss": -5.376491069793701, "global_step": 24472, "epoch": 582} {"train_loss": -5.416627883911133, "global_step": 24473, "epoch": 582} {"train_loss": -5.4024977684021, "global_step": 24474, "epoch": 582} {"train_loss": -5.402468204498291, "global_step": 24475, "epoch": 582} {"train_loss": -5.391064643859863, "global_step": 24476, "epoch": 582} {"train_loss": -5.215085506439209, "global_step": 24477, "epoch": 582} {"train_loss": -5.340282440185547, "global_step": 24478, "epoch": 582} {"train_loss": -5.4063897132873535, "global_step": 24479, "epoch": 582} {"train_loss": -5.4207658767700195, "global_step": 24480, "epoch": 582} {"train_loss": -5.460108757019043, "global_step": 24481, "epoch": 582} {"train_loss": -5.334601402282715, "global_step": 24482, "epoch": 582} {"train_loss": -5.324069023132324, "global_step": 24483, "epoch": 582} {"train_loss": -5.310920238494873, "global_step": 24484, "epoch": 582} {"train_loss": -5.382045700436547, "global_step": 24485, "epoch": 582, "val_loss": 76744.84375} {"train_loss": -5.326689720153809, "global_step": 24486, "epoch": 583} {"train_loss": -5.4077863693237305, "global_step": 24487, "epoch": 583} {"train_loss": -5.385472297668457, "global_step": 24488, "epoch": 583} {"train_loss": -5.310451507568359, "global_step": 24489, "epoch": 583} {"train_loss": -5.436603546142578, "global_step": 24490, "epoch": 583} {"train_loss": -5.346951484680176, "global_step": 24491, "epoch": 583} {"train_loss": -5.2700886726379395, "global_step": 24492, "epoch": 583} {"train_loss": -5.308662414550781, "global_step": 24493, "epoch": 583} {"train_loss": -5.3321685791015625, "global_step": 24494, "epoch": 583} {"train_loss": -5.311574935913086, "global_step": 24495, "epoch": 583} {"train_loss": -5.215494155883789, "global_step": 24496, "epoch": 583} {"train_loss": -5.605029106140137, "global_step": 24497, "epoch": 583} {"train_loss": -5.361778259277344, "global_step": 24498, "epoch": 583} {"train_loss": -5.402215957641602, "global_step": 24499, "epoch": 583} {"train_loss": -5.548684120178223, "global_step": 24500, "epoch": 583} {"train_loss": -5.393346309661865, "global_step": 24501, "epoch": 583} {"train_loss": -5.572713851928711, "global_step": 24502, "epoch": 583} {"train_loss": -5.3120951652526855, "global_step": 24503, "epoch": 583} {"train_loss": -5.3315629959106445, "global_step": 24504, "epoch": 583} {"train_loss": -5.41326379776001, "global_step": 24505, "epoch": 583} {"train_loss": -5.285889625549316, "global_step": 24506, "epoch": 583} {"train_loss": -5.445962905883789, "global_step": 24507, "epoch": 583} {"train_loss": -5.363426685333252, "global_step": 24508, "epoch": 583} {"train_loss": -5.295598983764648, "global_step": 24509, "epoch": 583} {"train_loss": -5.2327961921691895, "global_step": 24510, "epoch": 583} {"train_loss": -5.331324577331543, "global_step": 24511, "epoch": 583} {"train_loss": -5.358128070831299, "global_step": 24512, "epoch": 583} {"train_loss": -5.3218536376953125, "global_step": 24513, "epoch": 583} {"train_loss": -5.461248397827148, "global_step": 24514, "epoch": 583} {"train_loss": -5.360932350158691, "global_step": 24515, "epoch": 583} {"train_loss": -5.264376163482666, "global_step": 24516, "epoch": 583} {"train_loss": -5.468513488769531, "global_step": 24517, "epoch": 583} {"train_loss": -5.458310127258301, "global_step": 24518, "epoch": 583} {"train_loss": -5.54572868347168, "global_step": 24519, "epoch": 583} {"train_loss": -5.522642135620117, "global_step": 24520, "epoch": 583} {"train_loss": -5.372265815734863, "global_step": 24521, "epoch": 583} {"train_loss": -5.424966335296631, "global_step": 24522, "epoch": 583} {"train_loss": -5.26438045501709, "global_step": 24523, "epoch": 583} {"train_loss": -5.372884750366211, "global_step": 24524, "epoch": 583} {"train_loss": -5.433178901672363, "global_step": 24525, "epoch": 583} {"train_loss": -5.38729190826416, "global_step": 24526, "epoch": 583} {"train_loss": -5.3768612543741865, "global_step": 24527, "epoch": 583, "val_loss": 76422.0390625} {"train_loss": -5.296667098999023, "global_step": 24528, "epoch": 584} {"train_loss": -5.453897476196289, "global_step": 24529, "epoch": 584} {"train_loss": -5.318743705749512, "global_step": 24530, "epoch": 584} {"train_loss": -5.41858434677124, "global_step": 24531, "epoch": 584} {"train_loss": -5.255096912384033, "global_step": 24532, "epoch": 584} {"train_loss": -5.510700225830078, "global_step": 24533, "epoch": 584} {"train_loss": -5.283205032348633, "global_step": 24534, "epoch": 584} {"train_loss": -5.477045059204102, "global_step": 24535, "epoch": 584} {"train_loss": -5.3141255378723145, "global_step": 24536, "epoch": 584} {"train_loss": -5.447334289550781, "global_step": 24537, "epoch": 584} {"train_loss": -5.385985374450684, "global_step": 24538, "epoch": 584} {"train_loss": -5.463018417358398, "global_step": 24539, "epoch": 584} {"train_loss": -5.503471374511719, "global_step": 24540, "epoch": 584} {"train_loss": -5.396215438842773, "global_step": 24541, "epoch": 584} {"train_loss": -5.488824367523193, "global_step": 24542, "epoch": 584} {"train_loss": -5.405712604522705, "global_step": 24543, "epoch": 584} {"train_loss": -5.428959369659424, "global_step": 24544, "epoch": 584} {"train_loss": -5.35068416595459, "global_step": 24545, "epoch": 584} {"train_loss": -5.290400505065918, "global_step": 24546, "epoch": 584} {"train_loss": -5.4318389892578125, "global_step": 24547, "epoch": 584} {"train_loss": -5.239293575286865, "global_step": 24548, "epoch": 584} {"train_loss": -5.504308700561523, "global_step": 24549, "epoch": 584} {"train_loss": -5.423590660095215, "global_step": 24550, "epoch": 584} {"train_loss": -5.4178338050842285, "global_step": 24551, "epoch": 584} {"train_loss": -5.3212127685546875, "global_step": 24552, "epoch": 584} {"train_loss": -5.311173439025879, "global_step": 24553, "epoch": 584} {"train_loss": -5.361241340637207, "global_step": 24554, "epoch": 584} {"train_loss": -5.396949291229248, "global_step": 24555, "epoch": 584} {"train_loss": -5.464958190917969, "global_step": 24556, "epoch": 584} {"train_loss": -5.475194454193115, "global_step": 24557, "epoch": 584} {"train_loss": -5.348918914794922, "global_step": 24558, "epoch": 584} {"train_loss": -5.333771705627441, "global_step": 24559, "epoch": 584} {"train_loss": -5.359650135040283, "global_step": 24560, "epoch": 584} {"train_loss": -5.49100399017334, "global_step": 24561, "epoch": 584} {"train_loss": -5.280204772949219, "global_step": 24562, "epoch": 584} {"train_loss": -5.406438827514648, "global_step": 24563, "epoch": 584} {"train_loss": -5.279580593109131, "global_step": 24564, "epoch": 584} {"train_loss": -5.495633125305176, "global_step": 24565, "epoch": 584} {"train_loss": -5.331430435180664, "global_step": 24566, "epoch": 584} {"train_loss": -5.365240097045898, "global_step": 24567, "epoch": 584} {"train_loss": -5.438015937805176, "global_step": 24568, "epoch": 584} {"train_loss": -5.389860334850493, "global_step": 24569, "epoch": 584, "val_loss": 77367.875} {"train_loss": -5.339420318603516, "global_step": 24570, "epoch": 585} {"train_loss": -5.323991298675537, "global_step": 24571, "epoch": 585} {"train_loss": -5.369494438171387, "global_step": 24572, "epoch": 585} {"train_loss": -5.391573905944824, "global_step": 24573, "epoch": 585} {"train_loss": -5.308242321014404, "global_step": 24574, "epoch": 585} {"train_loss": -5.421727657318115, "global_step": 24575, "epoch": 585} {"train_loss": -5.452115058898926, "global_step": 24576, "epoch": 585} {"train_loss": -5.378969192504883, "global_step": 24577, "epoch": 585} {"train_loss": -5.401311874389648, "global_step": 24578, "epoch": 585} {"train_loss": -5.536522388458252, "global_step": 24579, "epoch": 585} {"train_loss": -5.532630920410156, "global_step": 24580, "epoch": 585} {"train_loss": -5.384713172912598, "global_step": 24581, "epoch": 585} {"train_loss": -5.371638774871826, "global_step": 24582, "epoch": 585} {"train_loss": -5.260675430297852, "global_step": 24583, "epoch": 585} {"train_loss": -5.3659467697143555, "global_step": 24584, "epoch": 585} {"train_loss": -5.391439914703369, "global_step": 24585, "epoch": 585} {"train_loss": -5.234519004821777, "global_step": 24586, "epoch": 585} {"train_loss": -5.31148099899292, "global_step": 24587, "epoch": 585} {"train_loss": -5.333225250244141, "global_step": 24588, "epoch": 585} {"train_loss": -5.2899017333984375, "global_step": 24589, "epoch": 585} {"train_loss": -5.15941047668457, "global_step": 24590, "epoch": 585} {"train_loss": -5.321264266967773, "global_step": 24591, "epoch": 585} {"train_loss": -5.260464668273926, "global_step": 24592, "epoch": 585} {"train_loss": -5.3484272956848145, "global_step": 24593, "epoch": 585} {"train_loss": -5.429718971252441, "global_step": 24594, "epoch": 585} {"train_loss": -5.14772891998291, "global_step": 24595, "epoch": 585} {"train_loss": -5.450041770935059, "global_step": 24596, "epoch": 585} {"train_loss": -5.3273844718933105, "global_step": 24597, "epoch": 585} {"train_loss": -5.290309429168701, "global_step": 24598, "epoch": 585} {"train_loss": -5.4273786544799805, "global_step": 24599, "epoch": 585} {"train_loss": -5.2059454917907715, "global_step": 24600, "epoch": 585} {"train_loss": -5.457093715667725, "global_step": 24601, "epoch": 585} {"train_loss": -5.378024578094482, "global_step": 24602, "epoch": 585} {"train_loss": -5.402989387512207, "global_step": 24603, "epoch": 585} {"train_loss": -5.286369323730469, "global_step": 24604, "epoch": 585} {"train_loss": -5.3889312744140625, "global_step": 24605, "epoch": 585} {"train_loss": -5.471371650695801, "global_step": 24606, "epoch": 585} {"train_loss": -5.193086624145508, "global_step": 24607, "epoch": 585} {"train_loss": -5.421889305114746, "global_step": 24608, "epoch": 585} {"train_loss": -5.42844295501709, "global_step": 24609, "epoch": 585} {"train_loss": -5.250937461853027, "global_step": 24610, "epoch": 585} {"train_loss": -5.353180771782284, "global_step": 24611, "epoch": 585, "val_loss": 76361.875} {"train_loss": -5.474305152893066, "global_step": 24612, "epoch": 586} {"train_loss": -5.294662952423096, "global_step": 24613, "epoch": 586} {"train_loss": -5.5868377685546875, "global_step": 24614, "epoch": 586} {"train_loss": -5.279771327972412, "global_step": 24615, "epoch": 586} {"train_loss": -5.3941264152526855, "global_step": 24616, "epoch": 586} {"train_loss": -5.35693883895874, "global_step": 24617, "epoch": 586} {"train_loss": -5.268337249755859, "global_step": 24618, "epoch": 586} {"train_loss": -5.300339698791504, "global_step": 24619, "epoch": 586} {"train_loss": -5.347471237182617, "global_step": 24620, "epoch": 586} {"train_loss": -5.351918697357178, "global_step": 24621, "epoch": 586} {"train_loss": -5.324133396148682, "global_step": 24622, "epoch": 586} {"train_loss": -5.476417541503906, "global_step": 24623, "epoch": 586} {"train_loss": -5.404211044311523, "global_step": 24624, "epoch": 586} {"train_loss": -5.307632923126221, "global_step": 24625, "epoch": 586} {"train_loss": -5.349895477294922, "global_step": 24626, "epoch": 586} {"train_loss": -5.530277729034424, "global_step": 24627, "epoch": 586} {"train_loss": -5.242931365966797, "global_step": 24628, "epoch": 586} {"train_loss": -5.486848831176758, "global_step": 24629, "epoch": 586} {"train_loss": -5.431988716125488, "global_step": 24630, "epoch": 586} {"train_loss": -5.358635425567627, "global_step": 24631, "epoch": 586} {"train_loss": -5.382464408874512, "global_step": 24632, "epoch": 586} {"train_loss": -5.380362510681152, "global_step": 24633, "epoch": 586} {"train_loss": -5.3065266609191895, "global_step": 24634, "epoch": 586} {"train_loss": -5.28001594543457, "global_step": 24635, "epoch": 586} {"train_loss": -5.487338066101074, "global_step": 24636, "epoch": 586} {"train_loss": -5.439115047454834, "global_step": 24637, "epoch": 586} {"train_loss": -5.387476444244385, "global_step": 24638, "epoch": 586} {"train_loss": -5.341447353363037, "global_step": 24639, "epoch": 586} {"train_loss": -5.379441261291504, "global_step": 24640, "epoch": 586} {"train_loss": -5.500328063964844, "global_step": 24641, "epoch": 586} {"train_loss": -5.391262054443359, "global_step": 24642, "epoch": 586} {"train_loss": -5.565394878387451, "global_step": 24643, "epoch": 586} {"train_loss": -5.4015727043151855, "global_step": 24644, "epoch": 586} {"train_loss": -5.37662410736084, "global_step": 24645, "epoch": 586} {"train_loss": -5.424652099609375, "global_step": 24646, "epoch": 586} {"train_loss": -5.508989334106445, "global_step": 24647, "epoch": 586} {"train_loss": -5.317971706390381, "global_step": 24648, "epoch": 586} {"train_loss": -5.422545433044434, "global_step": 24649, "epoch": 586} {"train_loss": -5.450445652008057, "global_step": 24650, "epoch": 586} {"train_loss": -5.306349754333496, "global_step": 24651, "epoch": 586} {"train_loss": -5.361029148101807, "global_step": 24652, "epoch": 586} {"train_loss": -5.389631396248227, "global_step": 24653, "epoch": 586, "val_loss": 77113.390625} {"train_loss": -5.188591003417969, "global_step": 24654, "epoch": 587} {"train_loss": -5.351773262023926, "global_step": 24655, "epoch": 587} {"train_loss": -5.362884044647217, "global_step": 24656, "epoch": 587} {"train_loss": -5.264827728271484, "global_step": 24657, "epoch": 587} {"train_loss": -5.493887901306152, "global_step": 24658, "epoch": 587} {"train_loss": -5.374002933502197, "global_step": 24659, "epoch": 587} {"train_loss": -5.4531755447387695, "global_step": 24660, "epoch": 587} {"train_loss": -5.293715476989746, "global_step": 24661, "epoch": 587} {"train_loss": -5.214528560638428, "global_step": 24662, "epoch": 587} {"train_loss": -5.511842727661133, "global_step": 24663, "epoch": 587} {"train_loss": -5.366315841674805, "global_step": 24664, "epoch": 587} {"train_loss": -5.3442769050598145, "global_step": 24665, "epoch": 587} {"train_loss": -5.3747687339782715, "global_step": 24666, "epoch": 587} {"train_loss": -5.303927898406982, "global_step": 24667, "epoch": 587} {"train_loss": -5.378446578979492, "global_step": 24668, "epoch": 587} {"train_loss": -5.47950553894043, "global_step": 24669, "epoch": 587} {"train_loss": -5.395875930786133, "global_step": 24670, "epoch": 587} {"train_loss": -5.132067680358887, "global_step": 24671, "epoch": 587} {"train_loss": -5.383134841918945, "global_step": 24672, "epoch": 587} {"train_loss": -5.440647125244141, "global_step": 24673, "epoch": 587} {"train_loss": -5.428645133972168, "global_step": 24674, "epoch": 587} {"train_loss": -5.3372039794921875, "global_step": 24675, "epoch": 587} {"train_loss": -5.495408058166504, "global_step": 24676, "epoch": 587} {"train_loss": -5.283167362213135, "global_step": 24677, "epoch": 587} {"train_loss": -5.2904767990112305, "global_step": 24678, "epoch": 587} {"train_loss": -5.402963638305664, "global_step": 24679, "epoch": 587} {"train_loss": -5.417507648468018, "global_step": 24680, "epoch": 587} {"train_loss": -5.494152069091797, "global_step": 24681, "epoch": 587} {"train_loss": -5.437112331390381, "global_step": 24682, "epoch": 587} {"train_loss": -5.393556594848633, "global_step": 24683, "epoch": 587} {"train_loss": -5.322035789489746, "global_step": 24684, "epoch": 587} {"train_loss": -5.351082801818848, "global_step": 24685, "epoch": 587} {"train_loss": -5.277554512023926, "global_step": 24686, "epoch": 587} {"train_loss": -5.330781936645508, "global_step": 24687, "epoch": 587} {"train_loss": -5.459877967834473, "global_step": 24688, "epoch": 587} {"train_loss": -5.475762367248535, "global_step": 24689, "epoch": 587} {"train_loss": -5.415643692016602, "global_step": 24690, "epoch": 587} {"train_loss": -5.387727737426758, "global_step": 24691, "epoch": 587} {"train_loss": -5.369198799133301, "global_step": 24692, "epoch": 587} {"train_loss": -5.468585014343262, "global_step": 24693, "epoch": 587} {"train_loss": -5.398550033569336, "global_step": 24694, "epoch": 587} {"train_loss": -5.373976866404216, "global_step": 24695, "epoch": 587, "val_loss": 76334.9375} {"train_loss": -5.413636684417725, "global_step": 24696, "epoch": 588} {"train_loss": -5.437102317810059, "global_step": 24697, "epoch": 588} {"train_loss": -5.447951316833496, "global_step": 24698, "epoch": 588} {"train_loss": -5.391538619995117, "global_step": 24699, "epoch": 588} {"train_loss": -5.215656757354736, "global_step": 24700, "epoch": 588} {"train_loss": -5.432622909545898, "global_step": 24701, "epoch": 588} {"train_loss": -5.461367607116699, "global_step": 24702, "epoch": 588} {"train_loss": -5.38493537902832, "global_step": 24703, "epoch": 588} {"train_loss": -5.550798416137695, "global_step": 24704, "epoch": 588} {"train_loss": -5.346535682678223, "global_step": 24705, "epoch": 588} {"train_loss": -5.3633246421813965, "global_step": 24706, "epoch": 588} {"train_loss": -5.371477127075195, "global_step": 24707, "epoch": 588} {"train_loss": -5.42488431930542, "global_step": 24708, "epoch": 588} {"train_loss": -5.4927568435668945, "global_step": 24709, "epoch": 588} {"train_loss": -5.2680840492248535, "global_step": 24710, "epoch": 588} {"train_loss": -5.385625839233398, "global_step": 24711, "epoch": 588} {"train_loss": -5.37529182434082, "global_step": 24712, "epoch": 588} {"train_loss": -5.505929946899414, "global_step": 24713, "epoch": 588} {"train_loss": -5.389044761657715, "global_step": 24714, "epoch": 588} {"train_loss": -5.393446922302246, "global_step": 24715, "epoch": 588} {"train_loss": -5.29366397857666, "global_step": 24716, "epoch": 588} {"train_loss": -5.506877899169922, "global_step": 24717, "epoch": 588} {"train_loss": -5.280224800109863, "global_step": 24718, "epoch": 588} {"train_loss": -5.39883279800415, "global_step": 24719, "epoch": 588} {"train_loss": -5.376760005950928, "global_step": 24720, "epoch": 588} {"train_loss": -5.438790798187256, "global_step": 24721, "epoch": 588} {"train_loss": -5.379796028137207, "global_step": 24722, "epoch": 588} {"train_loss": -5.370340347290039, "global_step": 24723, "epoch": 588} {"train_loss": -5.258118629455566, "global_step": 24724, "epoch": 588} {"train_loss": -5.325462341308594, "global_step": 24725, "epoch": 588} {"train_loss": -5.386092185974121, "global_step": 24726, "epoch": 588} {"train_loss": -5.293852806091309, "global_step": 24727, "epoch": 588} {"train_loss": -5.361145973205566, "global_step": 24728, "epoch": 588} {"train_loss": -5.366231918334961, "global_step": 24729, "epoch": 588} {"train_loss": -5.274477958679199, "global_step": 24730, "epoch": 588} {"train_loss": -5.387403964996338, "global_step": 24731, "epoch": 588} {"train_loss": -5.2714128494262695, "global_step": 24732, "epoch": 588} {"train_loss": -5.132136344909668, "global_step": 24733, "epoch": 588} {"train_loss": -5.213198184967041, "global_step": 24734, "epoch": 588} {"train_loss": -5.155230522155762, "global_step": 24735, "epoch": 588} {"train_loss": -5.305991172790527, "global_step": 24736, "epoch": 588} {"train_loss": -5.358672959463937, "global_step": 24737, "epoch": 588, "val_loss": 77210.90625} {"train_loss": -5.414984703063965, "global_step": 24738, "epoch": 589} {"train_loss": -5.243427276611328, "global_step": 24739, "epoch": 589} {"train_loss": -5.435469150543213, "global_step": 24740, "epoch": 589} {"train_loss": -5.356110572814941, "global_step": 24741, "epoch": 589} {"train_loss": -5.346384048461914, "global_step": 24742, "epoch": 589} {"train_loss": -5.403665542602539, "global_step": 24743, "epoch": 589} {"train_loss": -5.208146572113037, "global_step": 24744, "epoch": 589} {"train_loss": -5.556051254272461, "global_step": 24745, "epoch": 589} {"train_loss": -5.418381214141846, "global_step": 24746, "epoch": 589} {"train_loss": -5.409022808074951, "global_step": 24747, "epoch": 589} {"train_loss": -5.279864311218262, "global_step": 24748, "epoch": 589} {"train_loss": -5.413447856903076, "global_step": 24749, "epoch": 589} {"train_loss": -5.382726669311523, "global_step": 24750, "epoch": 589} {"train_loss": -5.360734939575195, "global_step": 24751, "epoch": 589} {"train_loss": -5.495155334472656, "global_step": 24752, "epoch": 589} {"train_loss": -5.395847320556641, "global_step": 24753, "epoch": 589} {"train_loss": -5.426108360290527, "global_step": 24754, "epoch": 589} {"train_loss": -5.41933536529541, "global_step": 24755, "epoch": 589} {"train_loss": -5.399441242218018, "global_step": 24756, "epoch": 589} {"train_loss": -5.355824947357178, "global_step": 24757, "epoch": 589} {"train_loss": -5.459347724914551, "global_step": 24758, "epoch": 589} {"train_loss": -5.381813049316406, "global_step": 24759, "epoch": 589} {"train_loss": -5.321430206298828, "global_step": 24760, "epoch": 589} {"train_loss": -5.487885475158691, "global_step": 24761, "epoch": 589} {"train_loss": -5.285381317138672, "global_step": 24762, "epoch": 589} {"train_loss": -5.205061912536621, "global_step": 24763, "epoch": 589} {"train_loss": -5.317586898803711, "global_step": 24764, "epoch": 589} {"train_loss": -5.330178260803223, "global_step": 24765, "epoch": 589} {"train_loss": -5.3674726486206055, "global_step": 24766, "epoch": 589} {"train_loss": -5.389298915863037, "global_step": 24767, "epoch": 589} {"train_loss": -5.4192891120910645, "global_step": 24768, "epoch": 589} {"train_loss": -5.488574028015137, "global_step": 24769, "epoch": 589} {"train_loss": -5.344393730163574, "global_step": 24770, "epoch": 589} {"train_loss": -5.3015971183776855, "global_step": 24771, "epoch": 589} {"train_loss": -5.297294616699219, "global_step": 24772, "epoch": 589} {"train_loss": -5.615785598754883, "global_step": 24773, "epoch": 589} {"train_loss": -5.34096622467041, "global_step": 24774, "epoch": 589} {"train_loss": -5.414834022521973, "global_step": 24775, "epoch": 589} {"train_loss": -5.3338165283203125, "global_step": 24776, "epoch": 589} {"train_loss": -5.259825706481934, "global_step": 24777, "epoch": 589} {"train_loss": -5.326434135437012, "global_step": 24778, "epoch": 589} {"train_loss": -5.377718959535871, "global_step": 24779, "epoch": 589, "val_loss": 76424.0859375} {"train_loss": -5.430534362792969, "global_step": 24780, "epoch": 590} {"train_loss": -5.538398265838623, "global_step": 24781, "epoch": 590} {"train_loss": -5.392102241516113, "global_step": 24782, "epoch": 590} {"train_loss": -5.381828308105469, "global_step": 24783, "epoch": 590} {"train_loss": -5.3607177734375, "global_step": 24784, "epoch": 590} {"train_loss": -5.465395927429199, "global_step": 24785, "epoch": 590} {"train_loss": -5.469951629638672, "global_step": 24786, "epoch": 590} {"train_loss": -5.409083843231201, "global_step": 24787, "epoch": 590} {"train_loss": -5.437060832977295, "global_step": 24788, "epoch": 590} {"train_loss": -5.276378154754639, "global_step": 24789, "epoch": 590} {"train_loss": -5.3338847160339355, "global_step": 24790, "epoch": 590} {"train_loss": -5.368410587310791, "global_step": 24791, "epoch": 590} {"train_loss": -5.456081390380859, "global_step": 24792, "epoch": 590} {"train_loss": -5.492245674133301, "global_step": 24793, "epoch": 590} {"train_loss": -5.228129863739014, "global_step": 24794, "epoch": 590} {"train_loss": -5.259932518005371, "global_step": 24795, "epoch": 590} {"train_loss": -5.4643635749816895, "global_step": 24796, "epoch": 590} {"train_loss": -5.32420539855957, "global_step": 24797, "epoch": 590} {"train_loss": -5.349547386169434, "global_step": 24798, "epoch": 590} {"train_loss": -5.319912910461426, "global_step": 24799, "epoch": 590} {"train_loss": -5.409651756286621, "global_step": 24800, "epoch": 590} {"train_loss": -5.4343461990356445, "global_step": 24801, "epoch": 590} {"train_loss": -5.460921287536621, "global_step": 24802, "epoch": 590} {"train_loss": -5.415146350860596, "global_step": 24803, "epoch": 590} {"train_loss": -5.461872577667236, "global_step": 24804, "epoch": 590} {"train_loss": -5.497775077819824, "global_step": 24805, "epoch": 590} {"train_loss": -5.338316917419434, "global_step": 24806, "epoch": 590} {"train_loss": -5.307903289794922, "global_step": 24807, "epoch": 590} {"train_loss": -5.279057502746582, "global_step": 24808, "epoch": 590} {"train_loss": -5.3626861572265625, "global_step": 24809, "epoch": 590} {"train_loss": -5.239428520202637, "global_step": 24810, "epoch": 590} {"train_loss": -5.263236999511719, "global_step": 24811, "epoch": 590} {"train_loss": -5.376336097717285, "global_step": 24812, "epoch": 590} {"train_loss": -5.358790397644043, "global_step": 24813, "epoch": 590} {"train_loss": -5.337592601776123, "global_step": 24814, "epoch": 590} {"train_loss": -5.547856330871582, "global_step": 24815, "epoch": 590} {"train_loss": -5.194997310638428, "global_step": 24816, "epoch": 590} {"train_loss": -5.3123955726623535, "global_step": 24817, "epoch": 590} {"train_loss": -5.2285871505737305, "global_step": 24818, "epoch": 590} {"train_loss": -5.222172260284424, "global_step": 24819, "epoch": 590} {"train_loss": -5.407382011413574, "global_step": 24820, "epoch": 590} {"train_loss": -5.370463382630121, "global_step": 24821, "epoch": 590, "val_loss": 76758.3828125} {"train_loss": -5.338218688964844, "global_step": 24822, "epoch": 591} {"train_loss": -5.316316604614258, "global_step": 24823, "epoch": 591} {"train_loss": -5.202395439147949, "global_step": 24824, "epoch": 591} {"train_loss": -5.29084587097168, "global_step": 24825, "epoch": 591} {"train_loss": -5.545125961303711, "global_step": 24826, "epoch": 591} {"train_loss": -5.300387859344482, "global_step": 24827, "epoch": 591} {"train_loss": -5.4687418937683105, "global_step": 24828, "epoch": 591} {"train_loss": -5.413541316986084, "global_step": 24829, "epoch": 591} {"train_loss": -5.360494613647461, "global_step": 24830, "epoch": 591} {"train_loss": -5.3884596824646, "global_step": 24831, "epoch": 591} {"train_loss": -5.391829490661621, "global_step": 24832, "epoch": 591} {"train_loss": -5.279775619506836, "global_step": 24833, "epoch": 591} {"train_loss": -5.365161418914795, "global_step": 24834, "epoch": 591} {"train_loss": -5.336549758911133, "global_step": 24835, "epoch": 591} {"train_loss": -5.397285461425781, "global_step": 24836, "epoch": 591} {"train_loss": -5.295679092407227, "global_step": 24837, "epoch": 591} {"train_loss": -5.3754706382751465, "global_step": 24838, "epoch": 591} {"train_loss": -5.292428970336914, "global_step": 24839, "epoch": 591} {"train_loss": -5.481207370758057, "global_step": 24840, "epoch": 591} {"train_loss": -5.452072620391846, "global_step": 24841, "epoch": 591} {"train_loss": -5.315032005310059, "global_step": 24842, "epoch": 591} {"train_loss": -5.361693382263184, "global_step": 24843, "epoch": 591} {"train_loss": -5.3489155769348145, "global_step": 24844, "epoch": 591} {"train_loss": -5.316290378570557, "global_step": 24845, "epoch": 591} {"train_loss": -5.425443649291992, "global_step": 24846, "epoch": 591} {"train_loss": -5.3728251457214355, "global_step": 24847, "epoch": 591} {"train_loss": -5.294655799865723, "global_step": 24848, "epoch": 591} {"train_loss": -5.272421836853027, "global_step": 24849, "epoch": 591} {"train_loss": -5.458254337310791, "global_step": 24850, "epoch": 591} {"train_loss": -5.477526664733887, "global_step": 24851, "epoch": 591} {"train_loss": -5.369952201843262, "global_step": 24852, "epoch": 591} {"train_loss": -5.30521297454834, "global_step": 24853, "epoch": 591} {"train_loss": -5.479696750640869, "global_step": 24854, "epoch": 591} {"train_loss": -5.293511390686035, "global_step": 24855, "epoch": 591} {"train_loss": -5.429917812347412, "global_step": 24856, "epoch": 591} {"train_loss": -5.363149642944336, "global_step": 24857, "epoch": 591} {"train_loss": -5.332846164703369, "global_step": 24858, "epoch": 591} {"train_loss": -5.423349857330322, "global_step": 24859, "epoch": 591} {"train_loss": -5.329466819763184, "global_step": 24860, "epoch": 591} {"train_loss": -5.2957844734191895, "global_step": 24861, "epoch": 591} {"train_loss": -5.364426612854004, "global_step": 24862, "epoch": 591} {"train_loss": -5.365850323722476, "global_step": 24863, "epoch": 591, "val_loss": 75947.96875} {"train_loss": -5.322784423828125, "global_step": 24864, "epoch": 592} {"train_loss": -5.484749794006348, "global_step": 24865, "epoch": 592} {"train_loss": -5.203287124633789, "global_step": 24866, "epoch": 592} {"train_loss": -5.371841907501221, "global_step": 24867, "epoch": 592} {"train_loss": -5.445916175842285, "global_step": 24868, "epoch": 592} {"train_loss": -5.316890716552734, "global_step": 24869, "epoch": 592} {"train_loss": -5.208010673522949, "global_step": 24870, "epoch": 592} {"train_loss": -5.331408500671387, "global_step": 24871, "epoch": 592} {"train_loss": -5.380706787109375, "global_step": 24872, "epoch": 592} {"train_loss": -5.426049709320068, "global_step": 24873, "epoch": 592} {"train_loss": -5.485881805419922, "global_step": 24874, "epoch": 592} {"train_loss": -5.384283065795898, "global_step": 24875, "epoch": 592} {"train_loss": -5.367147445678711, "global_step": 24876, "epoch": 592} {"train_loss": -5.350471496582031, "global_step": 24877, "epoch": 592} {"train_loss": -5.346642971038818, "global_step": 24878, "epoch": 592} {"train_loss": -5.284893989562988, "global_step": 24879, "epoch": 592} {"train_loss": -5.4395551681518555, "global_step": 24880, "epoch": 592} {"train_loss": -5.380622863769531, "global_step": 24881, "epoch": 592} {"train_loss": -5.508532524108887, "global_step": 24882, "epoch": 592} {"train_loss": -5.285821437835693, "global_step": 24883, "epoch": 592} {"train_loss": -5.349203109741211, "global_step": 24884, "epoch": 592} {"train_loss": -5.457287788391113, "global_step": 24885, "epoch": 592} {"train_loss": -5.403120994567871, "global_step": 24886, "epoch": 592} {"train_loss": -5.389519691467285, "global_step": 24887, "epoch": 592} {"train_loss": -5.361129283905029, "global_step": 24888, "epoch": 592} {"train_loss": -5.378973007202148, "global_step": 24889, "epoch": 592} {"train_loss": -5.500337600708008, "global_step": 24890, "epoch": 592} {"train_loss": -5.3903913497924805, "global_step": 24891, "epoch": 592} {"train_loss": -5.461777687072754, "global_step": 24892, "epoch": 592} {"train_loss": -5.314696311950684, "global_step": 24893, "epoch": 592} {"train_loss": -5.466644763946533, "global_step": 24894, "epoch": 592} {"train_loss": -5.451186656951904, "global_step": 24895, "epoch": 592} {"train_loss": -5.330041885375977, "global_step": 24896, "epoch": 592} {"train_loss": -5.375914573669434, "global_step": 24897, "epoch": 592} {"train_loss": -5.4870991706848145, "global_step": 24898, "epoch": 592} {"train_loss": -5.3498992919921875, "global_step": 24899, "epoch": 592} {"train_loss": -5.53513240814209, "global_step": 24900, "epoch": 592} {"train_loss": -5.194298267364502, "global_step": 24901, "epoch": 592} {"train_loss": -5.3798933029174805, "global_step": 24902, "epoch": 592} {"train_loss": -5.398140907287598, "global_step": 24903, "epoch": 592} {"train_loss": -5.39639949798584, "global_step": 24904, "epoch": 592} {"train_loss": -5.382119315011161, "global_step": 24905, "epoch": 592, "val_loss": 76609.03125} {"train_loss": -5.420895576477051, "global_step": 24906, "epoch": 593} {"train_loss": -5.397811412811279, "global_step": 24907, "epoch": 593} {"train_loss": -5.312447547912598, "global_step": 24908, "epoch": 593} {"train_loss": -5.360526084899902, "global_step": 24909, "epoch": 593} {"train_loss": -5.319679260253906, "global_step": 24910, "epoch": 593} {"train_loss": -5.3265275955200195, "global_step": 24911, "epoch": 593} {"train_loss": -5.471539497375488, "global_step": 24912, "epoch": 593} {"train_loss": -5.297870635986328, "global_step": 24913, "epoch": 593} {"train_loss": -5.527942657470703, "global_step": 24914, "epoch": 593} {"train_loss": -5.432988166809082, "global_step": 24915, "epoch": 593} {"train_loss": -5.416230201721191, "global_step": 24916, "epoch": 593} {"train_loss": -5.428834438323975, "global_step": 24917, "epoch": 593} {"train_loss": -5.340845584869385, "global_step": 24918, "epoch": 593} {"train_loss": -5.444140911102295, "global_step": 24919, "epoch": 593} {"train_loss": -5.440320014953613, "global_step": 24920, "epoch": 593} {"train_loss": -5.388256072998047, "global_step": 24921, "epoch": 593} {"train_loss": -5.335304260253906, "global_step": 24922, "epoch": 593} {"train_loss": -5.436279773712158, "global_step": 24923, "epoch": 593} {"train_loss": -5.446280002593994, "global_step": 24924, "epoch": 593} {"train_loss": -5.309722900390625, "global_step": 24925, "epoch": 593} {"train_loss": -5.188384056091309, "global_step": 24926, "epoch": 593} {"train_loss": -5.376147270202637, "global_step": 24927, "epoch": 593} {"train_loss": -5.455499649047852, "global_step": 24928, "epoch": 593} {"train_loss": -5.43448543548584, "global_step": 24929, "epoch": 593} {"train_loss": -5.412517547607422, "global_step": 24930, "epoch": 593} {"train_loss": -5.414365768432617, "global_step": 24931, "epoch": 593} {"train_loss": -5.542043209075928, "global_step": 24932, "epoch": 593} {"train_loss": -5.286892890930176, "global_step": 24933, "epoch": 593} {"train_loss": -5.276799201965332, "global_step": 24934, "epoch": 593} {"train_loss": -5.331864356994629, "global_step": 24935, "epoch": 593} {"train_loss": -5.4105329513549805, "global_step": 24936, "epoch": 593} {"train_loss": -5.377704620361328, "global_step": 24937, "epoch": 593} {"train_loss": -5.509021759033203, "global_step": 24938, "epoch": 593} {"train_loss": -5.389845848083496, "global_step": 24939, "epoch": 593} {"train_loss": -5.358689308166504, "global_step": 24940, "epoch": 593} {"train_loss": -5.389712810516357, "global_step": 24941, "epoch": 593} {"train_loss": -5.393739700317383, "global_step": 24942, "epoch": 593} {"train_loss": -5.229019641876221, "global_step": 24943, "epoch": 593} {"train_loss": -5.457885265350342, "global_step": 24944, "epoch": 593} {"train_loss": -5.461543083190918, "global_step": 24945, "epoch": 593} {"train_loss": -5.456833839416504, "global_step": 24946, "epoch": 593} {"train_loss": -5.388741402398972, "global_step": 24947, "epoch": 593, "val_loss": 75610.5078125} {"train_loss": -5.339849472045898, "global_step": 24948, "epoch": 594} {"train_loss": -5.445539474487305, "global_step": 24949, "epoch": 594} {"train_loss": -5.355378150939941, "global_step": 24950, "epoch": 594} {"train_loss": -5.564875602722168, "global_step": 24951, "epoch": 594} {"train_loss": -5.301644325256348, "global_step": 24952, "epoch": 594} {"train_loss": -5.2860918045043945, "global_step": 24953, "epoch": 594} {"train_loss": -5.379742622375488, "global_step": 24954, "epoch": 594} {"train_loss": -5.358863830566406, "global_step": 24955, "epoch": 594} {"train_loss": -5.364569187164307, "global_step": 24956, "epoch": 594} {"train_loss": -5.359326362609863, "global_step": 24957, "epoch": 594} {"train_loss": -5.336323261260986, "global_step": 24958, "epoch": 594} {"train_loss": -5.391875267028809, "global_step": 24959, "epoch": 594} {"train_loss": -5.415505409240723, "global_step": 24960, "epoch": 594} {"train_loss": -5.333209991455078, "global_step": 24961, "epoch": 594} {"train_loss": -5.379018783569336, "global_step": 24962, "epoch": 594} {"train_loss": -5.390817642211914, "global_step": 24963, "epoch": 594} {"train_loss": -5.371271133422852, "global_step": 24964, "epoch": 594} {"train_loss": -5.291207313537598, "global_step": 24965, "epoch": 594} {"train_loss": -5.23049259185791, "global_step": 24966, "epoch": 594} {"train_loss": -5.38224458694458, "global_step": 24967, "epoch": 594} {"train_loss": -5.298535346984863, "global_step": 24968, "epoch": 594} {"train_loss": -5.430301189422607, "global_step": 24969, "epoch": 594} {"train_loss": -5.446883201599121, "global_step": 24970, "epoch": 594} {"train_loss": -5.367303848266602, "global_step": 24971, "epoch": 594} {"train_loss": -5.351812362670898, "global_step": 24972, "epoch": 594} {"train_loss": -5.464919090270996, "global_step": 24973, "epoch": 594} {"train_loss": -5.3787641525268555, "global_step": 24974, "epoch": 594} {"train_loss": -5.448354244232178, "global_step": 24975, "epoch": 594} {"train_loss": -5.292274475097656, "global_step": 24976, "epoch": 594} {"train_loss": -5.331814765930176, "global_step": 24977, "epoch": 594} {"train_loss": -5.324054718017578, "global_step": 24978, "epoch": 594} {"train_loss": -5.370761871337891, "global_step": 24979, "epoch": 594} {"train_loss": -5.369959831237793, "global_step": 24980, "epoch": 594} {"train_loss": -5.432952880859375, "global_step": 24981, "epoch": 594} {"train_loss": -5.433097839355469, "global_step": 24982, "epoch": 594} {"train_loss": -5.347460746765137, "global_step": 24983, "epoch": 594} {"train_loss": -5.296728134155273, "global_step": 24984, "epoch": 594} {"train_loss": -5.425317764282227, "global_step": 24985, "epoch": 594} {"train_loss": -5.369867324829102, "global_step": 24986, "epoch": 594} {"train_loss": -5.489638805389404, "global_step": 24987, "epoch": 594} {"train_loss": -5.324808120727539, "global_step": 24988, "epoch": 594} {"train_loss": -5.3742076101757235, "global_step": 24989, "epoch": 594, "val_loss": 76618.1640625} {"train_loss": -5.324377536773682, "global_step": 24990, "epoch": 595} {"train_loss": -5.207096099853516, "global_step": 24991, "epoch": 595} {"train_loss": -5.463628768920898, "global_step": 24992, "epoch": 595} {"train_loss": -5.354211330413818, "global_step": 24993, "epoch": 595} {"train_loss": -5.382262229919434, "global_step": 24994, "epoch": 595} {"train_loss": -5.3798627853393555, "global_step": 24995, "epoch": 595} {"train_loss": -5.288239002227783, "global_step": 24996, "epoch": 595} {"train_loss": -5.436600685119629, "global_step": 24997, "epoch": 595} {"train_loss": -5.407398700714111, "global_step": 24998, "epoch": 595} {"train_loss": -5.312287330627441, "global_step": 24999, "epoch": 595} {"train_loss": -5.331909656524658, "global_step": 25000, "epoch": 595} {"train_loss": -5.149906158447266, "global_step": 25001, "epoch": 595} {"train_loss": -5.399824619293213, "global_step": 25002, "epoch": 595} {"train_loss": -5.399035453796387, "global_step": 25003, "epoch": 595} {"train_loss": -5.330606460571289, "global_step": 25004, "epoch": 595} {"train_loss": -5.3105669021606445, "global_step": 25005, "epoch": 595} {"train_loss": -5.375978469848633, "global_step": 25006, "epoch": 595} {"train_loss": -5.4768266677856445, "global_step": 25007, "epoch": 595} {"train_loss": -5.3472819328308105, "global_step": 25008, "epoch": 595} {"train_loss": -5.401318073272705, "global_step": 25009, "epoch": 595} {"train_loss": -5.282095909118652, "global_step": 25010, "epoch": 595} {"train_loss": -5.3642120361328125, "global_step": 25011, "epoch": 595} {"train_loss": -5.271105766296387, "global_step": 25012, "epoch": 595} {"train_loss": -5.22243595123291, "global_step": 25013, "epoch": 595} {"train_loss": -5.4716796875, "global_step": 25014, "epoch": 595} {"train_loss": -5.347551345825195, "global_step": 25015, "epoch": 595} {"train_loss": -5.38316535949707, "global_step": 25016, "epoch": 595} {"train_loss": -5.359939098358154, "global_step": 25017, "epoch": 595} {"train_loss": -5.37453031539917, "global_step": 25018, "epoch": 595} {"train_loss": -5.406585216522217, "global_step": 25019, "epoch": 595} {"train_loss": -5.352561950683594, "global_step": 25020, "epoch": 595} {"train_loss": -5.3339433670043945, "global_step": 25021, "epoch": 595} {"train_loss": -5.365190505981445, "global_step": 25022, "epoch": 595} {"train_loss": -5.399580001831055, "global_step": 25023, "epoch": 595} {"train_loss": -5.468799114227295, "global_step": 25024, "epoch": 595} {"train_loss": -5.389673709869385, "global_step": 25025, "epoch": 595} {"train_loss": -5.4127092361450195, "global_step": 25026, "epoch": 595} {"train_loss": -5.559109687805176, "global_step": 25027, "epoch": 595} {"train_loss": -5.322225093841553, "global_step": 25028, "epoch": 595} {"train_loss": -5.39117956161499, "global_step": 25029, "epoch": 595} {"train_loss": -5.369710922241211, "global_step": 25030, "epoch": 595} {"train_loss": -5.36358228183928, "global_step": 25031, "epoch": 595, "val_loss": 76406.34375} {"train_loss": -5.461709976196289, "global_step": 25032, "epoch": 596} {"train_loss": -5.190767288208008, "global_step": 25033, "epoch": 596} {"train_loss": -5.368569374084473, "global_step": 25034, "epoch": 596} {"train_loss": -5.379376411437988, "global_step": 25035, "epoch": 596} {"train_loss": -5.299428939819336, "global_step": 25036, "epoch": 596} {"train_loss": -5.513346195220947, "global_step": 25037, "epoch": 596} {"train_loss": -5.247537612915039, "global_step": 25038, "epoch": 596} {"train_loss": -5.39462947845459, "global_step": 25039, "epoch": 596} {"train_loss": -5.321349143981934, "global_step": 25040, "epoch": 596} {"train_loss": -5.430355072021484, "global_step": 25041, "epoch": 596} {"train_loss": -5.443553924560547, "global_step": 25042, "epoch": 596} {"train_loss": -5.49068546295166, "global_step": 25043, "epoch": 596} {"train_loss": -5.42920446395874, "global_step": 25044, "epoch": 596} {"train_loss": -5.373183250427246, "global_step": 25045, "epoch": 596} {"train_loss": -5.219677925109863, "global_step": 25046, "epoch": 596} {"train_loss": -5.431405067443848, "global_step": 25047, "epoch": 596} {"train_loss": -5.443694114685059, "global_step": 25048, "epoch": 596} {"train_loss": -5.4132585525512695, "global_step": 25049, "epoch": 596} {"train_loss": -5.2478132247924805, "global_step": 25050, "epoch": 596} {"train_loss": -5.3498311042785645, "global_step": 25051, "epoch": 596} {"train_loss": -5.375550270080566, "global_step": 25052, "epoch": 596} {"train_loss": -5.338942050933838, "global_step": 25053, "epoch": 596} {"train_loss": -5.330770015716553, "global_step": 25054, "epoch": 596} {"train_loss": -5.406264305114746, "global_step": 25055, "epoch": 596} {"train_loss": -5.355058670043945, "global_step": 25056, "epoch": 596} {"train_loss": -5.3732194900512695, "global_step": 25057, "epoch": 596} {"train_loss": -5.43349027633667, "global_step": 25058, "epoch": 596} {"train_loss": -5.418939590454102, "global_step": 25059, "epoch": 596} {"train_loss": -5.461282730102539, "global_step": 25060, "epoch": 596} {"train_loss": -5.470956802368164, "global_step": 25061, "epoch": 596} {"train_loss": -5.410041809082031, "global_step": 25062, "epoch": 596} {"train_loss": -5.450125694274902, "global_step": 25063, "epoch": 596} {"train_loss": -5.4893574714660645, "global_step": 25064, "epoch": 596} {"train_loss": -5.361778259277344, "global_step": 25065, "epoch": 596} {"train_loss": -5.465715408325195, "global_step": 25066, "epoch": 596} {"train_loss": -5.368480682373047, "global_step": 25067, "epoch": 596} {"train_loss": -5.469211101531982, "global_step": 25068, "epoch": 596} {"train_loss": -5.551112651824951, "global_step": 25069, "epoch": 596} {"train_loss": -5.504132270812988, "global_step": 25070, "epoch": 596} {"train_loss": -5.343289375305176, "global_step": 25071, "epoch": 596} {"train_loss": -5.3575439453125, "global_step": 25072, "epoch": 596} {"train_loss": -5.393346434547787, "global_step": 25073, "epoch": 596, "val_loss": 76346.1640625} {"train_loss": -5.478026866912842, "global_step": 25074, "epoch": 597} {"train_loss": -5.379141807556152, "global_step": 25075, "epoch": 597} {"train_loss": -5.296608924865723, "global_step": 25076, "epoch": 597} {"train_loss": -5.397284507751465, "global_step": 25077, "epoch": 597} {"train_loss": -5.362608909606934, "global_step": 25078, "epoch": 597} {"train_loss": -5.334894180297852, "global_step": 25079, "epoch": 597} {"train_loss": -5.298523902893066, "global_step": 25080, "epoch": 597} {"train_loss": -5.218805313110352, "global_step": 25081, "epoch": 597} {"train_loss": -5.174738883972168, "global_step": 25082, "epoch": 597} {"train_loss": -5.317984580993652, "global_step": 25083, "epoch": 597} {"train_loss": -5.207544803619385, "global_step": 25084, "epoch": 597} {"train_loss": -5.49786376953125, "global_step": 25085, "epoch": 597} {"train_loss": -5.393880367279053, "global_step": 25086, "epoch": 597} {"train_loss": -5.327192306518555, "global_step": 25087, "epoch": 597} {"train_loss": -5.272382736206055, "global_step": 25088, "epoch": 597} {"train_loss": -5.380335330963135, "global_step": 25089, "epoch": 597} {"train_loss": -5.149615287780762, "global_step": 25090, "epoch": 597} {"train_loss": -5.396350860595703, "global_step": 25091, "epoch": 597} {"train_loss": -5.226789474487305, "global_step": 25092, "epoch": 597} {"train_loss": -5.413649082183838, "global_step": 25093, "epoch": 597} {"train_loss": -5.411838531494141, "global_step": 25094, "epoch": 597} {"train_loss": -5.300820350646973, "global_step": 25095, "epoch": 597} {"train_loss": -5.371427536010742, "global_step": 25096, "epoch": 597} {"train_loss": -5.544060707092285, "global_step": 25097, "epoch": 597} {"train_loss": -5.3112969398498535, "global_step": 25098, "epoch": 597} {"train_loss": -5.445228576660156, "global_step": 25099, "epoch": 597} {"train_loss": -5.454849720001221, "global_step": 25100, "epoch": 597} {"train_loss": -5.400635719299316, "global_step": 25101, "epoch": 597} {"train_loss": -5.486219882965088, "global_step": 25102, "epoch": 597} {"train_loss": -5.365958213806152, "global_step": 25103, "epoch": 597} {"train_loss": -5.38383674621582, "global_step": 25104, "epoch": 597} {"train_loss": -5.443490982055664, "global_step": 25105, "epoch": 597} {"train_loss": -5.312512397766113, "global_step": 25106, "epoch": 597} {"train_loss": -5.404016494750977, "global_step": 25107, "epoch": 597} {"train_loss": -5.429825305938721, "global_step": 25108, "epoch": 597} {"train_loss": -5.4193620681762695, "global_step": 25109, "epoch": 597} {"train_loss": -5.438100814819336, "global_step": 25110, "epoch": 597} {"train_loss": -5.357602119445801, "global_step": 25111, "epoch": 597} {"train_loss": -5.34583854675293, "global_step": 25112, "epoch": 597} {"train_loss": -5.423083305358887, "global_step": 25113, "epoch": 597} {"train_loss": -5.258862495422363, "global_step": 25114, "epoch": 597} {"train_loss": -5.361037617637997, "global_step": 25115, "epoch": 597, "val_loss": 76585.96875} {"train_loss": -5.497894287109375, "global_step": 25116, "epoch": 598} {"train_loss": -5.429102897644043, "global_step": 25117, "epoch": 598} {"train_loss": -5.448637962341309, "global_step": 25118, "epoch": 598} {"train_loss": -5.4535017013549805, "global_step": 25119, "epoch": 598} {"train_loss": -5.294188022613525, "global_step": 25120, "epoch": 598} {"train_loss": -5.381314277648926, "global_step": 25121, "epoch": 598} {"train_loss": -5.440098285675049, "global_step": 25122, "epoch": 598} {"train_loss": -5.3367156982421875, "global_step": 25123, "epoch": 598} {"train_loss": -5.498303413391113, "global_step": 25124, "epoch": 598} {"train_loss": -5.428282260894775, "global_step": 25125, "epoch": 598} {"train_loss": -5.399548530578613, "global_step": 25126, "epoch": 598} {"train_loss": -5.433481216430664, "global_step": 25127, "epoch": 598} {"train_loss": -5.364310264587402, "global_step": 25128, "epoch": 598} {"train_loss": -5.412038803100586, "global_step": 25129, "epoch": 598} {"train_loss": -5.405693531036377, "global_step": 25130, "epoch": 598} {"train_loss": -5.331416606903076, "global_step": 25131, "epoch": 598} {"train_loss": -5.442138195037842, "global_step": 25132, "epoch": 598} {"train_loss": -5.285654544830322, "global_step": 25133, "epoch": 598} {"train_loss": -5.278942584991455, "global_step": 25134, "epoch": 598} {"train_loss": -5.400669574737549, "global_step": 25135, "epoch": 598} {"train_loss": -5.28331995010376, "global_step": 25136, "epoch": 598} {"train_loss": -5.367887496948242, "global_step": 25137, "epoch": 598} {"train_loss": -5.488778114318848, "global_step": 25138, "epoch": 598} {"train_loss": -5.414172172546387, "global_step": 25139, "epoch": 598} {"train_loss": -5.545206069946289, "global_step": 25140, "epoch": 598} {"train_loss": -5.471070289611816, "global_step": 25141, "epoch": 598} {"train_loss": -5.4166717529296875, "global_step": 25142, "epoch": 598} {"train_loss": -5.407144069671631, "global_step": 25143, "epoch": 598} {"train_loss": -5.415707111358643, "global_step": 25144, "epoch": 598} {"train_loss": -5.313519477844238, "global_step": 25145, "epoch": 598} {"train_loss": -5.364382743835449, "global_step": 25146, "epoch": 598} {"train_loss": -5.342095375061035, "global_step": 25147, "epoch": 598} {"train_loss": -5.31215763092041, "global_step": 25148, "epoch": 598} {"train_loss": -5.3716535568237305, "global_step": 25149, "epoch": 598} {"train_loss": -5.323219299316406, "global_step": 25150, "epoch": 598} {"train_loss": -5.322431564331055, "global_step": 25151, "epoch": 598} {"train_loss": -5.295474052429199, "global_step": 25152, "epoch": 598} {"train_loss": -5.2554030418396, "global_step": 25153, "epoch": 598} {"train_loss": -5.507473945617676, "global_step": 25154, "epoch": 598} {"train_loss": -5.309004306793213, "global_step": 25155, "epoch": 598} {"train_loss": -5.256233215332031, "global_step": 25156, "epoch": 598} {"train_loss": -5.383943886983962, "global_step": 25157, "epoch": 598, "val_loss": 77166.78125} {"train_loss": -5.329613208770752, "global_step": 25158, "epoch": 599} {"train_loss": -5.437734603881836, "global_step": 25159, "epoch": 599} {"train_loss": -5.256591796875, "global_step": 25160, "epoch": 599} {"train_loss": -5.423990249633789, "global_step": 25161, "epoch": 599} {"train_loss": -5.1950225830078125, "global_step": 25162, "epoch": 599} {"train_loss": -5.154888153076172, "global_step": 25163, "epoch": 599} {"train_loss": -5.420632362365723, "global_step": 25164, "epoch": 599} {"train_loss": -5.25565242767334, "global_step": 25165, "epoch": 599} {"train_loss": -5.223092079162598, "global_step": 25166, "epoch": 599} {"train_loss": -5.318075180053711, "global_step": 25167, "epoch": 599} {"train_loss": -5.465564727783203, "global_step": 25168, "epoch": 599} {"train_loss": -5.395387649536133, "global_step": 25169, "epoch": 599} {"train_loss": -5.265807628631592, "global_step": 25170, "epoch": 599} {"train_loss": -5.46183443069458, "global_step": 25171, "epoch": 599} {"train_loss": -5.30685567855835, "global_step": 25172, "epoch": 599} {"train_loss": -5.513270854949951, "global_step": 25173, "epoch": 599} {"train_loss": -5.406929016113281, "global_step": 25174, "epoch": 599} {"train_loss": -5.147023677825928, "global_step": 25175, "epoch": 599} {"train_loss": -5.407029628753662, "global_step": 25176, "epoch": 599} {"train_loss": -5.276203632354736, "global_step": 25177, "epoch": 599} {"train_loss": -5.324154853820801, "global_step": 25178, "epoch": 599} {"train_loss": -5.437315940856934, "global_step": 25179, "epoch": 599} {"train_loss": -5.326981544494629, "global_step": 25180, "epoch": 599} {"train_loss": -5.490674018859863, "global_step": 25181, "epoch": 599} {"train_loss": -5.4393157958984375, "global_step": 25182, "epoch": 599} {"train_loss": -5.462952136993408, "global_step": 25183, "epoch": 599} {"train_loss": -5.253296852111816, "global_step": 25184, "epoch": 599} {"train_loss": -5.348723411560059, "global_step": 25185, "epoch": 599} {"train_loss": -5.322370529174805, "global_step": 25186, "epoch": 599} {"train_loss": -5.398928642272949, "global_step": 25187, "epoch": 599} {"train_loss": -5.399449348449707, "global_step": 25188, "epoch": 599} {"train_loss": -5.325477123260498, "global_step": 25189, "epoch": 599} {"train_loss": -5.479538917541504, "global_step": 25190, "epoch": 599} {"train_loss": -5.28922176361084, "global_step": 25191, "epoch": 599} {"train_loss": -5.433504104614258, "global_step": 25192, "epoch": 599} {"train_loss": -5.433210372924805, "global_step": 25193, "epoch": 599} {"train_loss": -5.268928527832031, "global_step": 25194, "epoch": 599} {"train_loss": -5.520091533660889, "global_step": 25195, "epoch": 599} {"train_loss": -5.375364303588867, "global_step": 25196, "epoch": 599} {"train_loss": -5.228100776672363, "global_step": 25197, "epoch": 599} {"train_loss": -5.383171081542969, "global_step": 25198, "epoch": 599} {"train_loss": -5.355764616103399, "global_step": 25199, "epoch": 599, "val_loss": 76831.09375} {"train_loss": -5.301304340362549, "global_step": 25200, "epoch": 600} {"train_loss": -5.437459945678711, "global_step": 25201, "epoch": 600} {"train_loss": -5.293288707733154, "global_step": 25202, "epoch": 600} {"train_loss": -5.42804479598999, "global_step": 25203, "epoch": 600} {"train_loss": -5.359254837036133, "global_step": 25204, "epoch": 600} {"train_loss": -5.371349334716797, "global_step": 25205, "epoch": 600} {"train_loss": -5.308083534240723, "global_step": 25206, "epoch": 600} {"train_loss": -5.313961982727051, "global_step": 25207, "epoch": 600} {"train_loss": -5.546899318695068, "global_step": 25208, "epoch": 600} {"train_loss": -5.318159580230713, "global_step": 25209, "epoch": 600} {"train_loss": -5.455899238586426, "global_step": 25210, "epoch": 600} {"train_loss": -5.386898994445801, "global_step": 25211, "epoch": 600} {"train_loss": -5.432373046875, "global_step": 25212, "epoch": 600} {"train_loss": -5.252654075622559, "global_step": 25213, "epoch": 600} {"train_loss": -5.537646293640137, "global_step": 25214, "epoch": 600} {"train_loss": -5.288434028625488, "global_step": 25215, "epoch": 600} {"train_loss": -5.32855224609375, "global_step": 25216, "epoch": 600} {"train_loss": -5.448696136474609, "global_step": 25217, "epoch": 600} {"train_loss": -5.2826690673828125, "global_step": 25218, "epoch": 600} {"train_loss": -5.509433746337891, "global_step": 25219, "epoch": 600} {"train_loss": -5.267314910888672, "global_step": 25220, "epoch": 600} {"train_loss": -5.458957672119141, "global_step": 25221, "epoch": 600} {"train_loss": -5.416788101196289, "global_step": 25222, "epoch": 600} {"train_loss": -5.531386852264404, "global_step": 25223, "epoch": 600} {"train_loss": -5.47061824798584, "global_step": 25224, "epoch": 600} {"train_loss": -5.375565528869629, "global_step": 25225, "epoch": 600} {"train_loss": -5.366090774536133, "global_step": 25226, "epoch": 600} {"train_loss": -5.474112510681152, "global_step": 25227, "epoch": 600} {"train_loss": -5.400740623474121, "global_step": 25228, "epoch": 600} {"train_loss": -5.387685298919678, "global_step": 25229, "epoch": 600} {"train_loss": -5.283173561096191, "global_step": 25230, "epoch": 600} {"train_loss": -5.334681510925293, "global_step": 25231, "epoch": 600} {"train_loss": -5.276106834411621, "global_step": 25232, "epoch": 600} {"train_loss": -5.356510162353516, "global_step": 25233, "epoch": 600} {"train_loss": -5.425013065338135, "global_step": 25234, "epoch": 600} {"train_loss": -5.343409538269043, "global_step": 25235, "epoch": 600} {"train_loss": -5.3965301513671875, "global_step": 25236, "epoch": 600} {"train_loss": -5.463518142700195, "global_step": 25237, "epoch": 600} {"train_loss": -5.401796340942383, "global_step": 25238, "epoch": 600} {"train_loss": -5.342145919799805, "global_step": 25239, "epoch": 600} {"train_loss": -5.4223198890686035, "global_step": 25240, "epoch": 600} {"train_loss": -5.383363224211193, "global_step": 25241, "epoch": 600, "train/sim_max_reward_0": 0.31749427316806206, "train/sim_max_reward_1": 0.17635673659764148, "train/sim_max_reward_2": 0.6417145404007336, "train/sim_max_reward_3": 0.5751169087663035, "train/sim_max_reward_4": 0.44388267679501253, "train/sim_max_reward_5": 0.5607238944254169, "test/sim_max_reward_4500000": 0.35418699265445064, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.24573580540728093, "test/sim_max_reward_4500004": 0.22351337140367375, "test/sim_max_reward_4500005": 0.1760240728166324, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0239754891386459, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.10576350569942682, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.4490552938247203, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.34803862603780283, "test/sim_max_reward_4500015": 0.502742159760024, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.5254721661575781, "test/sim_max_reward_4500018": 0.15146062838608967, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.14861511220147822, "test/sim_max_reward_4500022": 0.3314456633708386, "test/sim_max_reward_4500023": 0.4833227782157243, "test/sim_max_reward_4500024": 0.11671096285996899, "test/sim_max_reward_4500025": 0.353733988395521, "test/sim_max_reward_4500026": 0.2770079779994465, "test/sim_max_reward_4500027": 0.8359192441886689, "test/sim_max_reward_4500028": 0.41939199841164826, "test/sim_max_reward_4500029": 0.4962015923166092, "test/sim_max_reward_4500030": 0.2824281703934423, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.1633896737905983, "test/sim_max_reward_4500034": 0.8550428091096903, "test/sim_max_reward_4500035": 0.5214998992696748, "test/sim_max_reward_4500036": 0.41012521749773156, "test/sim_max_reward_4500037": 0.17091783148133727, "test/sim_max_reward_4500038": 0.43477786936888424, "test/sim_max_reward_4500039": 0.6540386885021097, "test/sim_max_reward_4500040": 0.2628647133142155, "test/sim_max_reward_4500041": 0.2522442225573727, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.3815041562967807, "test/sim_max_reward_4500044": 0.4907623992517566, "test/sim_max_reward_4500045": 0.13924673184993738, "test/sim_max_reward_4500046": 0.40417917268250014, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.7867400626081635, "test/sim_max_reward_4500049": 0.1919446694999719, "train/mean_score": 0.452548171692195, "test/mean_score": 0.268580899867316, "val_loss": 75746.90625} {"train_loss": -5.394077777862549, "global_step": 25242, "epoch": 601} {"train_loss": -5.393259048461914, "global_step": 25243, "epoch": 601} {"train_loss": -5.41909122467041, "global_step": 25244, "epoch": 601} {"train_loss": -5.518833160400391, "global_step": 25245, "epoch": 601} {"train_loss": -5.442493915557861, "global_step": 25246, "epoch": 601} {"train_loss": -5.362936973571777, "global_step": 25247, "epoch": 601} {"train_loss": -5.269684791564941, "global_step": 25248, "epoch": 601} {"train_loss": -5.324085235595703, "global_step": 25249, "epoch": 601} {"train_loss": -5.584636688232422, "global_step": 25250, "epoch": 601} {"train_loss": -5.426670074462891, "global_step": 25251, "epoch": 601} {"train_loss": -5.41452169418335, "global_step": 25252, "epoch": 601} {"train_loss": -5.3741068840026855, "global_step": 25253, "epoch": 601} {"train_loss": -5.440961837768555, "global_step": 25254, "epoch": 601} {"train_loss": -5.4011735916137695, "global_step": 25255, "epoch": 601} {"train_loss": -5.391114234924316, "global_step": 25256, "epoch": 601} {"train_loss": -5.608001708984375, "global_step": 25257, "epoch": 601} {"train_loss": -5.347362518310547, "global_step": 25258, "epoch": 601} {"train_loss": -5.312384605407715, "global_step": 25259, "epoch": 601} {"train_loss": -5.338742733001709, "global_step": 25260, "epoch": 601} {"train_loss": -5.399286270141602, "global_step": 25261, "epoch": 601} {"train_loss": -5.4794816970825195, "global_step": 25262, "epoch": 601} {"train_loss": -5.410967826843262, "global_step": 25263, "epoch": 601} {"train_loss": -5.424413204193115, "global_step": 25264, "epoch": 601} {"train_loss": -5.423867225646973, "global_step": 25265, "epoch": 601} {"train_loss": -5.380895614624023, "global_step": 25266, "epoch": 601} {"train_loss": -5.352471351623535, "global_step": 25267, "epoch": 601} {"train_loss": -5.3846540451049805, "global_step": 25268, "epoch": 601} {"train_loss": -5.358412742614746, "global_step": 25269, "epoch": 601} {"train_loss": -5.3433308601379395, "global_step": 25270, "epoch": 601} {"train_loss": -5.468941688537598, "global_step": 25271, "epoch": 601} {"train_loss": -5.301305294036865, "global_step": 25272, "epoch": 601} {"train_loss": -5.291082859039307, "global_step": 25273, "epoch": 601} {"train_loss": -5.495543003082275, "global_step": 25274, "epoch": 601} {"train_loss": -5.351555824279785, "global_step": 25275, "epoch": 601} {"train_loss": -5.287136077880859, "global_step": 25276, "epoch": 601} {"train_loss": -5.3729047775268555, "global_step": 25277, "epoch": 601} {"train_loss": -5.304806709289551, "global_step": 25278, "epoch": 601} {"train_loss": -5.298029899597168, "global_step": 25279, "epoch": 601} {"train_loss": -5.4105610847473145, "global_step": 25280, "epoch": 601} {"train_loss": -5.317348480224609, "global_step": 25281, "epoch": 601} {"train_loss": -5.4768548011779785, "global_step": 25282, "epoch": 601} {"train_loss": -5.3929042021433515, "global_step": 25283, "epoch": 601, "val_loss": 76195.0546875} {"train_loss": -5.377065658569336, "global_step": 25284, "epoch": 602} {"train_loss": -5.368926048278809, "global_step": 25285, "epoch": 602} {"train_loss": -5.422221660614014, "global_step": 25286, "epoch": 602} {"train_loss": -5.40315580368042, "global_step": 25287, "epoch": 602} {"train_loss": -5.4404401779174805, "global_step": 25288, "epoch": 602} {"train_loss": -5.36946439743042, "global_step": 25289, "epoch": 602} {"train_loss": -5.4309844970703125, "global_step": 25290, "epoch": 602} {"train_loss": -5.531003952026367, "global_step": 25291, "epoch": 602} {"train_loss": -5.411865234375, "global_step": 25292, "epoch": 602} {"train_loss": -5.342752933502197, "global_step": 25293, "epoch": 602} {"train_loss": -5.396610260009766, "global_step": 25294, "epoch": 602} {"train_loss": -5.432859420776367, "global_step": 25295, "epoch": 602} {"train_loss": -5.4641242027282715, "global_step": 25296, "epoch": 602} {"train_loss": -5.360982894897461, "global_step": 25297, "epoch": 602} {"train_loss": -5.311715126037598, "global_step": 25298, "epoch": 602} {"train_loss": -5.284342288970947, "global_step": 25299, "epoch": 602} {"train_loss": -5.337881088256836, "global_step": 25300, "epoch": 602} {"train_loss": -5.411022186279297, "global_step": 25301, "epoch": 602} {"train_loss": -5.335312843322754, "global_step": 25302, "epoch": 602} {"train_loss": -5.328387260437012, "global_step": 25303, "epoch": 602} {"train_loss": -5.379973411560059, "global_step": 25304, "epoch": 602} {"train_loss": -5.397447109222412, "global_step": 25305, "epoch": 602} {"train_loss": -5.425019264221191, "global_step": 25306, "epoch": 602} {"train_loss": -5.355277061462402, "global_step": 25307, "epoch": 602} {"train_loss": -5.393143653869629, "global_step": 25308, "epoch": 602} {"train_loss": -5.481897354125977, "global_step": 25309, "epoch": 602} {"train_loss": -5.494877338409424, "global_step": 25310, "epoch": 602} {"train_loss": -5.274008750915527, "global_step": 25311, "epoch": 602} {"train_loss": -5.406032562255859, "global_step": 25312, "epoch": 602} {"train_loss": -5.30905818939209, "global_step": 25313, "epoch": 602} {"train_loss": -5.387236595153809, "global_step": 25314, "epoch": 602} {"train_loss": -5.399111747741699, "global_step": 25315, "epoch": 602} {"train_loss": -5.391655921936035, "global_step": 25316, "epoch": 602} {"train_loss": -5.346453666687012, "global_step": 25317, "epoch": 602} {"train_loss": -5.386148929595947, "global_step": 25318, "epoch": 602} {"train_loss": -5.406455039978027, "global_step": 25319, "epoch": 602} {"train_loss": -5.409468173980713, "global_step": 25320, "epoch": 602} {"train_loss": -5.381248474121094, "global_step": 25321, "epoch": 602} {"train_loss": -5.35897159576416, "global_step": 25322, "epoch": 602} {"train_loss": -5.297374725341797, "global_step": 25323, "epoch": 602} {"train_loss": -5.542815208435059, "global_step": 25324, "epoch": 602} {"train_loss": -5.3900572458903, "global_step": 25325, "epoch": 602, "val_loss": 76869.203125} {"train_loss": -5.258324146270752, "global_step": 25326, "epoch": 603} {"train_loss": -5.384315013885498, "global_step": 25327, "epoch": 603} {"train_loss": -5.360179901123047, "global_step": 25328, "epoch": 603} {"train_loss": -5.269380569458008, "global_step": 25329, "epoch": 603} {"train_loss": -5.31191349029541, "global_step": 25330, "epoch": 603} {"train_loss": -5.429608345031738, "global_step": 25331, "epoch": 603} {"train_loss": -5.212743759155273, "global_step": 25332, "epoch": 603} {"train_loss": -5.427792072296143, "global_step": 25333, "epoch": 603} {"train_loss": -5.451378345489502, "global_step": 25334, "epoch": 603} {"train_loss": -5.2909746170043945, "global_step": 25335, "epoch": 603} {"train_loss": -5.3187384605407715, "global_step": 25336, "epoch": 603} {"train_loss": -5.341558456420898, "global_step": 25337, "epoch": 603} {"train_loss": -5.383347511291504, "global_step": 25338, "epoch": 603} {"train_loss": -5.513616561889648, "global_step": 25339, "epoch": 603} {"train_loss": -5.458185195922852, "global_step": 25340, "epoch": 603} {"train_loss": -5.450494289398193, "global_step": 25341, "epoch": 603} {"train_loss": -5.4839019775390625, "global_step": 25342, "epoch": 603} {"train_loss": -5.504621505737305, "global_step": 25343, "epoch": 603} {"train_loss": -5.330759048461914, "global_step": 25344, "epoch": 603} {"train_loss": -5.37539529800415, "global_step": 25345, "epoch": 603} {"train_loss": -5.433366298675537, "global_step": 25346, "epoch": 603} {"train_loss": -5.452163219451904, "global_step": 25347, "epoch": 603} {"train_loss": -5.242424488067627, "global_step": 25348, "epoch": 603} {"train_loss": -5.47066068649292, "global_step": 25349, "epoch": 603} {"train_loss": -5.407707214355469, "global_step": 25350, "epoch": 603} {"train_loss": -5.169355869293213, "global_step": 25351, "epoch": 603} {"train_loss": -5.34632682800293, "global_step": 25352, "epoch": 603} {"train_loss": -5.217529296875, "global_step": 25353, "epoch": 603} {"train_loss": -5.291319370269775, "global_step": 25354, "epoch": 603} {"train_loss": -5.398693084716797, "global_step": 25355, "epoch": 603} {"train_loss": -5.328888893127441, "global_step": 25356, "epoch": 603} {"train_loss": -5.210518836975098, "global_step": 25357, "epoch": 603} {"train_loss": -5.437011241912842, "global_step": 25358, "epoch": 603} {"train_loss": -5.288088798522949, "global_step": 25359, "epoch": 603} {"train_loss": -5.418568134307861, "global_step": 25360, "epoch": 603} {"train_loss": -5.385242938995361, "global_step": 25361, "epoch": 603} {"train_loss": -5.328118801116943, "global_step": 25362, "epoch": 603} {"train_loss": -5.324304580688477, "global_step": 25363, "epoch": 603} {"train_loss": -5.4238481521606445, "global_step": 25364, "epoch": 603} {"train_loss": -5.262918949127197, "global_step": 25365, "epoch": 603} {"train_loss": -5.360294342041016, "global_step": 25366, "epoch": 603} {"train_loss": -5.360497849328177, "global_step": 25367, "epoch": 603, "val_loss": 75775.84375} {"train_loss": -5.467972755432129, "global_step": 25368, "epoch": 604} {"train_loss": -5.478742599487305, "global_step": 25369, "epoch": 604} {"train_loss": -5.200869560241699, "global_step": 25370, "epoch": 604} {"train_loss": -5.345015525817871, "global_step": 25371, "epoch": 604} {"train_loss": -5.441534042358398, "global_step": 25372, "epoch": 604} {"train_loss": -5.380609512329102, "global_step": 25373, "epoch": 604} {"train_loss": -5.315659999847412, "global_step": 25374, "epoch": 604} {"train_loss": -5.425723075866699, "global_step": 25375, "epoch": 604} {"train_loss": -5.386088848114014, "global_step": 25376, "epoch": 604} {"train_loss": -5.244227886199951, "global_step": 25377, "epoch": 604} {"train_loss": -5.459070205688477, "global_step": 25378, "epoch": 604} {"train_loss": -5.2294182777404785, "global_step": 25379, "epoch": 604} {"train_loss": -5.243375301361084, "global_step": 25380, "epoch": 604} {"train_loss": -5.382798194885254, "global_step": 25381, "epoch": 604} {"train_loss": -5.312167167663574, "global_step": 25382, "epoch": 604} {"train_loss": -5.385805606842041, "global_step": 25383, "epoch": 604} {"train_loss": -5.372272491455078, "global_step": 25384, "epoch": 604} {"train_loss": -5.380363941192627, "global_step": 25385, "epoch": 604} {"train_loss": -5.500853061676025, "global_step": 25386, "epoch": 604} {"train_loss": -5.202394485473633, "global_step": 25387, "epoch": 604} {"train_loss": -5.374579429626465, "global_step": 25388, "epoch": 604} {"train_loss": -5.323657512664795, "global_step": 25389, "epoch": 604} {"train_loss": -5.328865051269531, "global_step": 25390, "epoch": 604} {"train_loss": -5.51214075088501, "global_step": 25391, "epoch": 604} {"train_loss": -5.395059585571289, "global_step": 25392, "epoch": 604} {"train_loss": -5.444997787475586, "global_step": 25393, "epoch": 604} {"train_loss": -5.374087333679199, "global_step": 25394, "epoch": 604} {"train_loss": -5.5044121742248535, "global_step": 25395, "epoch": 604} {"train_loss": -5.396871566772461, "global_step": 25396, "epoch": 604} {"train_loss": -5.417154312133789, "global_step": 25397, "epoch": 604} {"train_loss": -5.378608703613281, "global_step": 25398, "epoch": 604} {"train_loss": -5.432283878326416, "global_step": 25399, "epoch": 604} {"train_loss": -5.431660175323486, "global_step": 25400, "epoch": 604} {"train_loss": -5.363579273223877, "global_step": 25401, "epoch": 604} {"train_loss": -5.389665603637695, "global_step": 25402, "epoch": 604} {"train_loss": -5.33560848236084, "global_step": 25403, "epoch": 604} {"train_loss": -5.368371963500977, "global_step": 25404, "epoch": 604} {"train_loss": -5.458868026733398, "global_step": 25405, "epoch": 604} {"train_loss": -5.417153358459473, "global_step": 25406, "epoch": 604} {"train_loss": -5.404437065124512, "global_step": 25407, "epoch": 604} {"train_loss": -5.3030500411987305, "global_step": 25408, "epoch": 604} {"train_loss": -5.377258085069203, "global_step": 25409, "epoch": 604, "val_loss": 76158.140625} {"train_loss": -5.206542015075684, "global_step": 25410, "epoch": 605} {"train_loss": -5.4090776443481445, "global_step": 25411, "epoch": 605} {"train_loss": -5.385447978973389, "global_step": 25412, "epoch": 605} {"train_loss": -5.232532978057861, "global_step": 25413, "epoch": 605} {"train_loss": -5.29193115234375, "global_step": 25414, "epoch": 605} {"train_loss": -5.456539154052734, "global_step": 25415, "epoch": 605} {"train_loss": -5.308079242706299, "global_step": 25416, "epoch": 605} {"train_loss": -5.387704372406006, "global_step": 25417, "epoch": 605} {"train_loss": -5.359672546386719, "global_step": 25418, "epoch": 605} {"train_loss": -5.334332466125488, "global_step": 25419, "epoch": 605} {"train_loss": -5.348544597625732, "global_step": 25420, "epoch": 605} {"train_loss": -5.333864212036133, "global_step": 25421, "epoch": 605} {"train_loss": -5.230451583862305, "global_step": 25422, "epoch": 605} {"train_loss": -5.334981918334961, "global_step": 25423, "epoch": 605} {"train_loss": -5.342900276184082, "global_step": 25424, "epoch": 605} {"train_loss": -5.431761741638184, "global_step": 25425, "epoch": 605} {"train_loss": -5.1849870681762695, "global_step": 25426, "epoch": 605} {"train_loss": -5.3479180335998535, "global_step": 25427, "epoch": 605} {"train_loss": -5.380196571350098, "global_step": 25428, "epoch": 605} {"train_loss": -5.393657207489014, "global_step": 25429, "epoch": 605} {"train_loss": -5.414560317993164, "global_step": 25430, "epoch": 605} {"train_loss": -5.36454963684082, "global_step": 25431, "epoch": 605} {"train_loss": -5.384737491607666, "global_step": 25432, "epoch": 605} {"train_loss": -5.353052616119385, "global_step": 25433, "epoch": 605} {"train_loss": -5.302999496459961, "global_step": 25434, "epoch": 605} {"train_loss": -5.515223503112793, "global_step": 25435, "epoch": 605} {"train_loss": -5.458637237548828, "global_step": 25436, "epoch": 605} {"train_loss": -5.461621284484863, "global_step": 25437, "epoch": 605} {"train_loss": -5.426185607910156, "global_step": 25438, "epoch": 605} {"train_loss": -5.355231285095215, "global_step": 25439, "epoch": 605} {"train_loss": -5.278672218322754, "global_step": 25440, "epoch": 605} {"train_loss": -5.505301475524902, "global_step": 25441, "epoch": 605} {"train_loss": -5.5230793952941895, "global_step": 25442, "epoch": 605} {"train_loss": -5.230968475341797, "global_step": 25443, "epoch": 605} {"train_loss": -5.465715408325195, "global_step": 25444, "epoch": 605} {"train_loss": -5.463329315185547, "global_step": 25445, "epoch": 605} {"train_loss": -5.4755659103393555, "global_step": 25446, "epoch": 605} {"train_loss": -5.44998836517334, "global_step": 25447, "epoch": 605} {"train_loss": -5.344117164611816, "global_step": 25448, "epoch": 605} {"train_loss": -5.353837966918945, "global_step": 25449, "epoch": 605} {"train_loss": -5.450997352600098, "global_step": 25450, "epoch": 605} {"train_loss": -5.369445925667172, "global_step": 25451, "epoch": 605, "val_loss": 76785.6015625} {"train_loss": -5.248841285705566, "global_step": 25452, "epoch": 606} {"train_loss": -5.56020450592041, "global_step": 25453, "epoch": 606} {"train_loss": -5.528783798217773, "global_step": 25454, "epoch": 606} {"train_loss": -5.389925956726074, "global_step": 25455, "epoch": 606} {"train_loss": -5.449253559112549, "global_step": 25456, "epoch": 606} {"train_loss": -5.545600891113281, "global_step": 25457, "epoch": 606} {"train_loss": -5.396242618560791, "global_step": 25458, "epoch": 606} {"train_loss": -5.396327018737793, "global_step": 25459, "epoch": 606} {"train_loss": -5.362153053283691, "global_step": 25460, "epoch": 606} {"train_loss": -5.3198323249816895, "global_step": 25461, "epoch": 606} {"train_loss": -5.452537536621094, "global_step": 25462, "epoch": 606} {"train_loss": -5.5502777099609375, "global_step": 25463, "epoch": 606} {"train_loss": -5.29894495010376, "global_step": 25464, "epoch": 606} {"train_loss": -5.442089080810547, "global_step": 25465, "epoch": 606} {"train_loss": -5.488197326660156, "global_step": 25466, "epoch": 606} {"train_loss": -5.382534027099609, "global_step": 25467, "epoch": 606} {"train_loss": -5.505813121795654, "global_step": 25468, "epoch": 606} {"train_loss": -5.45792818069458, "global_step": 25469, "epoch": 606} {"train_loss": -5.33358097076416, "global_step": 25470, "epoch": 606} {"train_loss": -5.589920997619629, "global_step": 25471, "epoch": 606} {"train_loss": -5.4589128494262695, "global_step": 25472, "epoch": 606} {"train_loss": -5.470073699951172, "global_step": 25473, "epoch": 606} {"train_loss": -5.395613670349121, "global_step": 25474, "epoch": 606} {"train_loss": -5.391905784606934, "global_step": 25475, "epoch": 606} {"train_loss": -5.4710283279418945, "global_step": 25476, "epoch": 606} {"train_loss": -5.271130084991455, "global_step": 25477, "epoch": 606} {"train_loss": -5.396851062774658, "global_step": 25478, "epoch": 606} {"train_loss": -5.283438682556152, "global_step": 25479, "epoch": 606} {"train_loss": -5.158010482788086, "global_step": 25480, "epoch": 606} {"train_loss": -5.399356842041016, "global_step": 25481, "epoch": 606} {"train_loss": -5.297985076904297, "global_step": 25482, "epoch": 606} {"train_loss": -5.218008518218994, "global_step": 25483, "epoch": 606} {"train_loss": -5.343515872955322, "global_step": 25484, "epoch": 606} {"train_loss": -5.30507230758667, "global_step": 25485, "epoch": 606} {"train_loss": -5.231603145599365, "global_step": 25486, "epoch": 606} {"train_loss": -5.38120698928833, "global_step": 25487, "epoch": 606} {"train_loss": -5.22130012512207, "global_step": 25488, "epoch": 606} {"train_loss": -5.442017555236816, "global_step": 25489, "epoch": 606} {"train_loss": -5.2886528968811035, "global_step": 25490, "epoch": 606} {"train_loss": -5.344628810882568, "global_step": 25491, "epoch": 606} {"train_loss": -5.390407562255859, "global_step": 25492, "epoch": 606} {"train_loss": -5.384827523004441, "global_step": 25493, "epoch": 606, "val_loss": 76412.1015625} {"train_loss": -5.496922016143799, "global_step": 25494, "epoch": 607} {"train_loss": -5.311768531799316, "global_step": 25495, "epoch": 607} {"train_loss": -5.353034973144531, "global_step": 25496, "epoch": 607} {"train_loss": -5.484124183654785, "global_step": 25497, "epoch": 607} {"train_loss": -5.372204780578613, "global_step": 25498, "epoch": 607} {"train_loss": -5.43131160736084, "global_step": 25499, "epoch": 607} {"train_loss": -5.480050086975098, "global_step": 25500, "epoch": 607} {"train_loss": -5.398991107940674, "global_step": 25501, "epoch": 607} {"train_loss": -5.307728290557861, "global_step": 25502, "epoch": 607} {"train_loss": -5.380100250244141, "global_step": 25503, "epoch": 607} {"train_loss": -5.396444320678711, "global_step": 25504, "epoch": 607} {"train_loss": -5.47734260559082, "global_step": 25505, "epoch": 607} {"train_loss": -5.42234992980957, "global_step": 25506, "epoch": 607} {"train_loss": -5.386984348297119, "global_step": 25507, "epoch": 607} {"train_loss": -5.277256965637207, "global_step": 25508, "epoch": 607} {"train_loss": -5.405606269836426, "global_step": 25509, "epoch": 607} {"train_loss": -5.375256538391113, "global_step": 25510, "epoch": 607} {"train_loss": -5.047746658325195, "global_step": 25511, "epoch": 607} {"train_loss": -5.455756187438965, "global_step": 25512, "epoch": 607} {"train_loss": -5.3386335372924805, "global_step": 25513, "epoch": 607} {"train_loss": -5.363770484924316, "global_step": 25514, "epoch": 607} {"train_loss": -5.3773345947265625, "global_step": 25515, "epoch": 607} {"train_loss": -5.3785719871521, "global_step": 25516, "epoch": 607} {"train_loss": -5.274613857269287, "global_step": 25517, "epoch": 607} {"train_loss": -5.328854560852051, "global_step": 25518, "epoch": 607} {"train_loss": -5.167729377746582, "global_step": 25519, "epoch": 607} {"train_loss": -5.420281410217285, "global_step": 25520, "epoch": 607} {"train_loss": -5.523892402648926, "global_step": 25521, "epoch": 607} {"train_loss": -5.330063343048096, "global_step": 25522, "epoch": 607} {"train_loss": -5.319205284118652, "global_step": 25523, "epoch": 607} {"train_loss": -5.360880374908447, "global_step": 25524, "epoch": 607} {"train_loss": -5.406270980834961, "global_step": 25525, "epoch": 607} {"train_loss": -5.360647201538086, "global_step": 25526, "epoch": 607} {"train_loss": -5.368058681488037, "global_step": 25527, "epoch": 607} {"train_loss": -5.402028560638428, "global_step": 25528, "epoch": 607} {"train_loss": -5.361541748046875, "global_step": 25529, "epoch": 607} {"train_loss": -5.312863349914551, "global_step": 25530, "epoch": 607} {"train_loss": -5.363271713256836, "global_step": 25531, "epoch": 607} {"train_loss": -5.3304853439331055, "global_step": 25532, "epoch": 607} {"train_loss": -5.371832847595215, "global_step": 25533, "epoch": 607} {"train_loss": -5.350773334503174, "global_step": 25534, "epoch": 607} {"train_loss": -5.3659983930133635, "global_step": 25535, "epoch": 607, "val_loss": 76440.2109375} {"train_loss": -5.547694206237793, "global_step": 25536, "epoch": 608} {"train_loss": -5.322543621063232, "global_step": 25537, "epoch": 608} {"train_loss": -5.4635725021362305, "global_step": 25538, "epoch": 608} {"train_loss": -5.439409255981445, "global_step": 25539, "epoch": 608} {"train_loss": -5.374581336975098, "global_step": 25540, "epoch": 608} {"train_loss": -5.315938949584961, "global_step": 25541, "epoch": 608} {"train_loss": -5.32005500793457, "global_step": 25542, "epoch": 608} {"train_loss": -5.3518476486206055, "global_step": 25543, "epoch": 608} {"train_loss": -5.434448719024658, "global_step": 25544, "epoch": 608} {"train_loss": -5.432558536529541, "global_step": 25545, "epoch": 608} {"train_loss": -5.544902801513672, "global_step": 25546, "epoch": 608} {"train_loss": -5.460722923278809, "global_step": 25547, "epoch": 608} {"train_loss": -5.334832191467285, "global_step": 25548, "epoch": 608} {"train_loss": -5.4098219871521, "global_step": 25549, "epoch": 608} {"train_loss": -5.4513750076293945, "global_step": 25550, "epoch": 608} {"train_loss": -5.426203727722168, "global_step": 25551, "epoch": 608} {"train_loss": -5.491084575653076, "global_step": 25552, "epoch": 608} {"train_loss": -5.368744850158691, "global_step": 25553, "epoch": 608} {"train_loss": -5.2819743156433105, "global_step": 25554, "epoch": 608} {"train_loss": -5.503023147583008, "global_step": 25555, "epoch": 608} {"train_loss": -5.367483139038086, "global_step": 25556, "epoch": 608} {"train_loss": -5.377052307128906, "global_step": 25557, "epoch": 608} {"train_loss": -5.458545684814453, "global_step": 25558, "epoch": 608} {"train_loss": -5.494342803955078, "global_step": 25559, "epoch": 608} {"train_loss": -5.446076393127441, "global_step": 25560, "epoch": 608} {"train_loss": -5.335857391357422, "global_step": 25561, "epoch": 608} {"train_loss": -5.35054349899292, "global_step": 25562, "epoch": 608} {"train_loss": -5.4978346824646, "global_step": 25563, "epoch": 608} {"train_loss": -5.316766738891602, "global_step": 25564, "epoch": 608} {"train_loss": -5.4370832443237305, "global_step": 25565, "epoch": 608} {"train_loss": -5.456668853759766, "global_step": 25566, "epoch": 608} {"train_loss": -5.40650749206543, "global_step": 25567, "epoch": 608} {"train_loss": -5.408019065856934, "global_step": 25568, "epoch": 608} {"train_loss": -5.366630554199219, "global_step": 25569, "epoch": 608} {"train_loss": -5.393187522888184, "global_step": 25570, "epoch": 608} {"train_loss": -5.450686454772949, "global_step": 25571, "epoch": 608} {"train_loss": -5.385659694671631, "global_step": 25572, "epoch": 608} {"train_loss": -5.4987945556640625, "global_step": 25573, "epoch": 608} {"train_loss": -5.436289310455322, "global_step": 25574, "epoch": 608} {"train_loss": -5.390134811401367, "global_step": 25575, "epoch": 608} {"train_loss": -5.434698104858398, "global_step": 25576, "epoch": 608} {"train_loss": -5.414407275971913, "global_step": 25577, "epoch": 608, "val_loss": 75974.5859375} {"train_loss": -5.4205241203308105, "global_step": 25578, "epoch": 609} {"train_loss": -5.3193440437316895, "global_step": 25579, "epoch": 609} {"train_loss": -5.509964466094971, "global_step": 25580, "epoch": 609} {"train_loss": -5.540342330932617, "global_step": 25581, "epoch": 609} {"train_loss": -5.439213752746582, "global_step": 25582, "epoch": 609} {"train_loss": -5.510685920715332, "global_step": 25583, "epoch": 609} {"train_loss": -5.391275405883789, "global_step": 25584, "epoch": 609} {"train_loss": -5.40322208404541, "global_step": 25585, "epoch": 609} {"train_loss": -5.338074684143066, "global_step": 25586, "epoch": 609} {"train_loss": -5.43109130859375, "global_step": 25587, "epoch": 609} {"train_loss": -5.443878173828125, "global_step": 25588, "epoch": 609} {"train_loss": -5.344391345977783, "global_step": 25589, "epoch": 609} {"train_loss": -5.326925754547119, "global_step": 25590, "epoch": 609} {"train_loss": -5.433200359344482, "global_step": 25591, "epoch": 609} {"train_loss": -5.374601364135742, "global_step": 25592, "epoch": 609} {"train_loss": -5.4882493019104, "global_step": 25593, "epoch": 609} {"train_loss": -5.370609283447266, "global_step": 25594, "epoch": 609} {"train_loss": -5.366521835327148, "global_step": 25595, "epoch": 609} {"train_loss": -5.3096466064453125, "global_step": 25596, "epoch": 609} {"train_loss": -5.354578971862793, "global_step": 25597, "epoch": 609} {"train_loss": -5.374901294708252, "global_step": 25598, "epoch": 609} {"train_loss": -5.401291847229004, "global_step": 25599, "epoch": 609} {"train_loss": -5.550045013427734, "global_step": 25600, "epoch": 609} {"train_loss": -5.547783851623535, "global_step": 25601, "epoch": 609} {"train_loss": -5.2959794998168945, "global_step": 25602, "epoch": 609} {"train_loss": -5.308040618896484, "global_step": 25603, "epoch": 609} {"train_loss": -5.471329689025879, "global_step": 25604, "epoch": 609} {"train_loss": -5.4063215255737305, "global_step": 25605, "epoch": 609} {"train_loss": -5.405187606811523, "global_step": 25606, "epoch": 609} {"train_loss": -5.498025417327881, "global_step": 25607, "epoch": 609} {"train_loss": -5.342212677001953, "global_step": 25608, "epoch": 609} {"train_loss": -5.437814712524414, "global_step": 25609, "epoch": 609} {"train_loss": -5.2777509689331055, "global_step": 25610, "epoch": 609} {"train_loss": -5.5362138748168945, "global_step": 25611, "epoch": 609} {"train_loss": -5.362942218780518, "global_step": 25612, "epoch": 609} {"train_loss": -5.346698760986328, "global_step": 25613, "epoch": 609} {"train_loss": -5.440343856811523, "global_step": 25614, "epoch": 609} {"train_loss": -5.4061150550842285, "global_step": 25615, "epoch": 609} {"train_loss": -5.276793003082275, "global_step": 25616, "epoch": 609} {"train_loss": -5.307008743286133, "global_step": 25617, "epoch": 609} {"train_loss": -5.292604446411133, "global_step": 25618, "epoch": 609} {"train_loss": -5.3990850902739025, "global_step": 25619, "epoch": 609, "val_loss": 76052.8984375} {"train_loss": -5.507267951965332, "global_step": 25620, "epoch": 610} {"train_loss": -5.4058122634887695, "global_step": 25621, "epoch": 610} {"train_loss": -5.4041748046875, "global_step": 25622, "epoch": 610} {"train_loss": -5.530056476593018, "global_step": 25623, "epoch": 610} {"train_loss": -5.437104225158691, "global_step": 25624, "epoch": 610} {"train_loss": -5.3650007247924805, "global_step": 25625, "epoch": 610} {"train_loss": -5.437034606933594, "global_step": 25626, "epoch": 610} {"train_loss": -5.3610687255859375, "global_step": 25627, "epoch": 610} {"train_loss": -5.384122371673584, "global_step": 25628, "epoch": 610} {"train_loss": -5.337615013122559, "global_step": 25629, "epoch": 610} {"train_loss": -5.457470893859863, "global_step": 25630, "epoch": 610} {"train_loss": -5.4661865234375, "global_step": 25631, "epoch": 610} {"train_loss": -5.530015468597412, "global_step": 25632, "epoch": 610} {"train_loss": -5.32942008972168, "global_step": 25633, "epoch": 610} {"train_loss": -5.464781761169434, "global_step": 25634, "epoch": 610} {"train_loss": -5.383648872375488, "global_step": 25635, "epoch": 610} {"train_loss": -5.406642913818359, "global_step": 25636, "epoch": 610} {"train_loss": -5.319375991821289, "global_step": 25637, "epoch": 610} {"train_loss": -5.400808334350586, "global_step": 25638, "epoch": 610} {"train_loss": -5.5505781173706055, "global_step": 25639, "epoch": 610} {"train_loss": -5.311102867126465, "global_step": 25640, "epoch": 610} {"train_loss": -5.267487525939941, "global_step": 25641, "epoch": 610} {"train_loss": -5.447625160217285, "global_step": 25642, "epoch": 610} {"train_loss": -5.497457504272461, "global_step": 25643, "epoch": 610} {"train_loss": -5.55589485168457, "global_step": 25644, "epoch": 610} {"train_loss": -5.494095802307129, "global_step": 25645, "epoch": 610} {"train_loss": -5.4642014503479, "global_step": 25646, "epoch": 610} {"train_loss": -5.385014057159424, "global_step": 25647, "epoch": 610} {"train_loss": -5.356655120849609, "global_step": 25648, "epoch": 610} {"train_loss": -5.438228130340576, "global_step": 25649, "epoch": 610} {"train_loss": -5.363945960998535, "global_step": 25650, "epoch": 610} {"train_loss": -5.326751232147217, "global_step": 25651, "epoch": 610} {"train_loss": -5.267762660980225, "global_step": 25652, "epoch": 610} {"train_loss": -5.473549842834473, "global_step": 25653, "epoch": 610} {"train_loss": -5.317507266998291, "global_step": 25654, "epoch": 610} {"train_loss": -5.344476699829102, "global_step": 25655, "epoch": 610} {"train_loss": -5.328005790710449, "global_step": 25656, "epoch": 610} {"train_loss": -5.388776779174805, "global_step": 25657, "epoch": 610} {"train_loss": -5.381833553314209, "global_step": 25658, "epoch": 610} {"train_loss": -5.440225601196289, "global_step": 25659, "epoch": 610} {"train_loss": -5.42129373550415, "global_step": 25660, "epoch": 610} {"train_loss": -5.407717318761916, "global_step": 25661, "epoch": 610, "val_loss": 75616.734375} {"train_loss": -5.403133869171143, "global_step": 25662, "epoch": 611} {"train_loss": -5.368999481201172, "global_step": 25663, "epoch": 611} {"train_loss": -5.406219482421875, "global_step": 25664, "epoch": 611} {"train_loss": -5.479935646057129, "global_step": 25665, "epoch": 611} {"train_loss": -5.459906101226807, "global_step": 25666, "epoch": 611} {"train_loss": -5.522103309631348, "global_step": 25667, "epoch": 611} {"train_loss": -5.4057793617248535, "global_step": 25668, "epoch": 611} {"train_loss": -5.318202972412109, "global_step": 25669, "epoch": 611} {"train_loss": -5.3377685546875, "global_step": 25670, "epoch": 611} {"train_loss": -5.364680290222168, "global_step": 25671, "epoch": 611} {"train_loss": -5.322300910949707, "global_step": 25672, "epoch": 611} {"train_loss": -5.252751350402832, "global_step": 25673, "epoch": 611} {"train_loss": -5.330639362335205, "global_step": 25674, "epoch": 611} {"train_loss": -5.124631881713867, "global_step": 25675, "epoch": 611} {"train_loss": -5.18890380859375, "global_step": 25676, "epoch": 611} {"train_loss": -5.456518173217773, "global_step": 25677, "epoch": 611} {"train_loss": -5.3764543533325195, "global_step": 25678, "epoch": 611} {"train_loss": -5.275221347808838, "global_step": 25679, "epoch": 611} {"train_loss": -5.338486194610596, "global_step": 25680, "epoch": 611} {"train_loss": -5.307040214538574, "global_step": 25681, "epoch": 611} {"train_loss": -5.462223052978516, "global_step": 25682, "epoch": 611} {"train_loss": -5.3740949630737305, "global_step": 25683, "epoch": 611} {"train_loss": -5.469108581542969, "global_step": 25684, "epoch": 611} {"train_loss": -5.399768352508545, "global_step": 25685, "epoch": 611} {"train_loss": -5.418337345123291, "global_step": 25686, "epoch": 611} {"train_loss": -5.37723970413208, "global_step": 25687, "epoch": 611} {"train_loss": -5.359748363494873, "global_step": 25688, "epoch": 611} {"train_loss": -5.259419918060303, "global_step": 25689, "epoch": 611} {"train_loss": -5.352333068847656, "global_step": 25690, "epoch": 611} {"train_loss": -5.457728385925293, "global_step": 25691, "epoch": 611} {"train_loss": -5.40521240234375, "global_step": 25692, "epoch": 611} {"train_loss": -5.388546943664551, "global_step": 25693, "epoch": 611} {"train_loss": -5.330017566680908, "global_step": 25694, "epoch": 611} {"train_loss": -5.320523738861084, "global_step": 25695, "epoch": 611} {"train_loss": -5.259133338928223, "global_step": 25696, "epoch": 611} {"train_loss": -5.2582173347473145, "global_step": 25697, "epoch": 611} {"train_loss": -5.242801666259766, "global_step": 25698, "epoch": 611} {"train_loss": -5.462852478027344, "global_step": 25699, "epoch": 611} {"train_loss": -5.260650634765625, "global_step": 25700, "epoch": 611} {"train_loss": -5.355237007141113, "global_step": 25701, "epoch": 611} {"train_loss": -5.339674949645996, "global_step": 25702, "epoch": 611} {"train_loss": -5.355257000241961, "global_step": 25703, "epoch": 611, "val_loss": 76709.5078125} {"train_loss": -5.360485553741455, "global_step": 25704, "epoch": 612} {"train_loss": -5.302555084228516, "global_step": 25705, "epoch": 612} {"train_loss": -5.479389667510986, "global_step": 25706, "epoch": 612} {"train_loss": -5.235948085784912, "global_step": 25707, "epoch": 612} {"train_loss": -5.268953323364258, "global_step": 25708, "epoch": 612} {"train_loss": -5.411685943603516, "global_step": 25709, "epoch": 612} {"train_loss": -5.4313225746154785, "global_step": 25710, "epoch": 612} {"train_loss": -5.2662129402160645, "global_step": 25711, "epoch": 612} {"train_loss": -5.579075336456299, "global_step": 25712, "epoch": 612} {"train_loss": -5.335266590118408, "global_step": 25713, "epoch": 612} {"train_loss": -5.422479629516602, "global_step": 25714, "epoch": 612} {"train_loss": -5.404529571533203, "global_step": 25715, "epoch": 612} {"train_loss": -5.448760986328125, "global_step": 25716, "epoch": 612} {"train_loss": -5.331844329833984, "global_step": 25717, "epoch": 612} {"train_loss": -5.457078456878662, "global_step": 25718, "epoch": 612} {"train_loss": -5.325262069702148, "global_step": 25719, "epoch": 612} {"train_loss": -5.344208240509033, "global_step": 25720, "epoch": 612} {"train_loss": -5.2570905685424805, "global_step": 25721, "epoch": 612} {"train_loss": -5.406846046447754, "global_step": 25722, "epoch": 612} {"train_loss": -5.379219055175781, "global_step": 25723, "epoch": 612} {"train_loss": -5.397002220153809, "global_step": 25724, "epoch": 612} {"train_loss": -5.391968250274658, "global_step": 25725, "epoch": 612} {"train_loss": -5.352999210357666, "global_step": 25726, "epoch": 612} {"train_loss": -5.4221625328063965, "global_step": 25727, "epoch": 612} {"train_loss": -5.397514343261719, "global_step": 25728, "epoch": 612} {"train_loss": -5.3547587394714355, "global_step": 25729, "epoch": 612} {"train_loss": -5.376779556274414, "global_step": 25730, "epoch": 612} {"train_loss": -5.395261764526367, "global_step": 25731, "epoch": 612} {"train_loss": -5.301299095153809, "global_step": 25732, "epoch": 612} {"train_loss": -5.291520118713379, "global_step": 25733, "epoch": 612} {"train_loss": -5.464928150177002, "global_step": 25734, "epoch": 612} {"train_loss": -5.553213596343994, "global_step": 25735, "epoch": 612} {"train_loss": -5.479635238647461, "global_step": 25736, "epoch": 612} {"train_loss": -5.578915596008301, "global_step": 25737, "epoch": 612} {"train_loss": -5.3912506103515625, "global_step": 25738, "epoch": 612} {"train_loss": -5.379876136779785, "global_step": 25739, "epoch": 612} {"train_loss": -5.333703994750977, "global_step": 25740, "epoch": 612} {"train_loss": -5.326621055603027, "global_step": 25741, "epoch": 612} {"train_loss": -5.380857944488525, "global_step": 25742, "epoch": 612} {"train_loss": -5.460072040557861, "global_step": 25743, "epoch": 612} {"train_loss": -5.385359764099121, "global_step": 25744, "epoch": 612} {"train_loss": -5.384545292173113, "global_step": 25745, "epoch": 612, "val_loss": 75832.1015625} {"train_loss": -5.379548072814941, "global_step": 25746, "epoch": 613} {"train_loss": -5.2739667892456055, "global_step": 25747, "epoch": 613} {"train_loss": -5.345241069793701, "global_step": 25748, "epoch": 613} {"train_loss": -5.49606990814209, "global_step": 25749, "epoch": 613} {"train_loss": -5.437963962554932, "global_step": 25750, "epoch": 613} {"train_loss": -5.4036383628845215, "global_step": 25751, "epoch": 613} {"train_loss": -5.467059135437012, "global_step": 25752, "epoch": 613} {"train_loss": -5.311349868774414, "global_step": 25753, "epoch": 613} {"train_loss": -5.500103950500488, "global_step": 25754, "epoch": 613} {"train_loss": -5.4464945793151855, "global_step": 25755, "epoch": 613} {"train_loss": -5.397310256958008, "global_step": 25756, "epoch": 613} {"train_loss": -5.442378997802734, "global_step": 25757, "epoch": 613} {"train_loss": -5.415524482727051, "global_step": 25758, "epoch": 613} {"train_loss": -5.495068550109863, "global_step": 25759, "epoch": 613} {"train_loss": -5.325122833251953, "global_step": 25760, "epoch": 613} {"train_loss": -5.42890739440918, "global_step": 25761, "epoch": 613} {"train_loss": -5.412093639373779, "global_step": 25762, "epoch": 613} {"train_loss": -5.444580078125, "global_step": 25763, "epoch": 613} {"train_loss": -5.452387809753418, "global_step": 25764, "epoch": 613} {"train_loss": -5.459367752075195, "global_step": 25765, "epoch": 613} {"train_loss": -5.415384292602539, "global_step": 25766, "epoch": 613} {"train_loss": -5.312184810638428, "global_step": 25767, "epoch": 613} {"train_loss": -5.402217388153076, "global_step": 25768, "epoch": 613} {"train_loss": -5.35199499130249, "global_step": 25769, "epoch": 613} {"train_loss": -5.46958065032959, "global_step": 25770, "epoch": 613} {"train_loss": -5.3678083419799805, "global_step": 25771, "epoch": 613} {"train_loss": -5.355070114135742, "global_step": 25772, "epoch": 613} {"train_loss": -5.51865291595459, "global_step": 25773, "epoch": 613} {"train_loss": -5.477414131164551, "global_step": 25774, "epoch": 613} {"train_loss": -5.460864067077637, "global_step": 25775, "epoch": 613} {"train_loss": -5.502814769744873, "global_step": 25776, "epoch": 613} {"train_loss": -5.225995063781738, "global_step": 25777, "epoch": 613} {"train_loss": -5.399724006652832, "global_step": 25778, "epoch": 613} {"train_loss": -5.382691383361816, "global_step": 25779, "epoch": 613} {"train_loss": -5.444340705871582, "global_step": 25780, "epoch": 613} {"train_loss": -5.242646217346191, "global_step": 25781, "epoch": 613} {"train_loss": -5.410737037658691, "global_step": 25782, "epoch": 613} {"train_loss": -5.434929847717285, "global_step": 25783, "epoch": 613} {"train_loss": -5.178089141845703, "global_step": 25784, "epoch": 613} {"train_loss": -5.456605434417725, "global_step": 25785, "epoch": 613} {"train_loss": -5.2969794273376465, "global_step": 25786, "epoch": 613} {"train_loss": -5.39940299306597, "global_step": 25787, "epoch": 613, "val_loss": 76246.8828125} {"train_loss": -5.401168346405029, "global_step": 25788, "epoch": 614} {"train_loss": -5.418449401855469, "global_step": 25789, "epoch": 614} {"train_loss": -5.446418762207031, "global_step": 25790, "epoch": 614} {"train_loss": -5.360339641571045, "global_step": 25791, "epoch": 614} {"train_loss": -5.434848785400391, "global_step": 25792, "epoch": 614} {"train_loss": -5.47470760345459, "global_step": 25793, "epoch": 614} {"train_loss": -5.376906394958496, "global_step": 25794, "epoch": 614} {"train_loss": -5.430863380432129, "global_step": 25795, "epoch": 614} {"train_loss": -5.392073154449463, "global_step": 25796, "epoch": 614} {"train_loss": -5.300856590270996, "global_step": 25797, "epoch": 614} {"train_loss": -5.528532028198242, "global_step": 25798, "epoch": 614} {"train_loss": -5.5444841384887695, "global_step": 25799, "epoch": 614} {"train_loss": -5.551980972290039, "global_step": 25800, "epoch": 614} {"train_loss": -5.329624176025391, "global_step": 25801, "epoch": 614} {"train_loss": -5.481574535369873, "global_step": 25802, "epoch": 614} {"train_loss": -5.313662052154541, "global_step": 25803, "epoch": 614} {"train_loss": -5.270557880401611, "global_step": 25804, "epoch": 614} {"train_loss": -5.303284645080566, "global_step": 25805, "epoch": 614} {"train_loss": -5.340241432189941, "global_step": 25806, "epoch": 614} {"train_loss": -5.384310722351074, "global_step": 25807, "epoch": 614} {"train_loss": -5.569897651672363, "global_step": 25808, "epoch": 614} {"train_loss": -5.414398193359375, "global_step": 25809, "epoch": 614} {"train_loss": -5.496031284332275, "global_step": 25810, "epoch": 614} {"train_loss": -5.329594612121582, "global_step": 25811, "epoch": 614} {"train_loss": -5.388068675994873, "global_step": 25812, "epoch": 614} {"train_loss": -5.400359153747559, "global_step": 25813, "epoch": 614} {"train_loss": -5.439881801605225, "global_step": 25814, "epoch": 614} {"train_loss": -5.437552452087402, "global_step": 25815, "epoch": 614} {"train_loss": -5.414168357849121, "global_step": 25816, "epoch": 614} {"train_loss": -5.309908866882324, "global_step": 25817, "epoch": 614} {"train_loss": -5.3668928146362305, "global_step": 25818, "epoch": 614} {"train_loss": -5.410518169403076, "global_step": 25819, "epoch": 614} {"train_loss": -5.434395790100098, "global_step": 25820, "epoch": 614} {"train_loss": -5.28920841217041, "global_step": 25821, "epoch": 614} {"train_loss": -5.519526958465576, "global_step": 25822, "epoch": 614} {"train_loss": -5.275968074798584, "global_step": 25823, "epoch": 614} {"train_loss": -5.344820499420166, "global_step": 25824, "epoch": 614} {"train_loss": -5.358701705932617, "global_step": 25825, "epoch": 614} {"train_loss": -5.358633995056152, "global_step": 25826, "epoch": 614} {"train_loss": -5.360109806060791, "global_step": 25827, "epoch": 614} {"train_loss": -5.3056135177612305, "global_step": 25828, "epoch": 614} {"train_loss": -5.399101813634236, "global_step": 25829, "epoch": 614, "val_loss": 76382.6484375} {"train_loss": -5.38989782333374, "global_step": 25830, "epoch": 615} {"train_loss": -5.427823543548584, "global_step": 25831, "epoch": 615} {"train_loss": -5.3812127113342285, "global_step": 25832, "epoch": 615} {"train_loss": -5.455758094787598, "global_step": 25833, "epoch": 615} {"train_loss": -5.4810285568237305, "global_step": 25834, "epoch": 615} {"train_loss": -5.415008544921875, "global_step": 25835, "epoch": 615} {"train_loss": -5.339099407196045, "global_step": 25836, "epoch": 615} {"train_loss": -5.452282905578613, "global_step": 25837, "epoch": 615} {"train_loss": -5.401837348937988, "global_step": 25838, "epoch": 615} {"train_loss": -5.344151496887207, "global_step": 25839, "epoch": 615} {"train_loss": -5.339404106140137, "global_step": 25840, "epoch": 615} {"train_loss": -5.394232749938965, "global_step": 25841, "epoch": 615} {"train_loss": -5.496859550476074, "global_step": 25842, "epoch": 615} {"train_loss": -5.326798439025879, "global_step": 25843, "epoch": 615} {"train_loss": -5.328719615936279, "global_step": 25844, "epoch": 615} {"train_loss": -5.380760192871094, "global_step": 25845, "epoch": 615} {"train_loss": -5.402858257293701, "global_step": 25846, "epoch": 615} {"train_loss": -5.340944290161133, "global_step": 25847, "epoch": 615} {"train_loss": -5.439449310302734, "global_step": 25848, "epoch": 615} {"train_loss": -5.420029640197754, "global_step": 25849, "epoch": 615} {"train_loss": -5.426694869995117, "global_step": 25850, "epoch": 615} {"train_loss": -5.386549949645996, "global_step": 25851, "epoch": 615} {"train_loss": -5.435644149780273, "global_step": 25852, "epoch": 615} {"train_loss": -5.357695579528809, "global_step": 25853, "epoch": 615} {"train_loss": -5.552873611450195, "global_step": 25854, "epoch": 615} {"train_loss": -5.531912803649902, "global_step": 25855, "epoch": 615} {"train_loss": -5.456870079040527, "global_step": 25856, "epoch": 615} {"train_loss": -5.408448696136475, "global_step": 25857, "epoch": 615} {"train_loss": -5.3250579833984375, "global_step": 25858, "epoch": 615} {"train_loss": -5.438100814819336, "global_step": 25859, "epoch": 615} {"train_loss": -5.500885009765625, "global_step": 25860, "epoch": 615} {"train_loss": -5.350730895996094, "global_step": 25861, "epoch": 615} {"train_loss": -5.3134989738464355, "global_step": 25862, "epoch": 615} {"train_loss": -5.456557273864746, "global_step": 25863, "epoch": 615} {"train_loss": -5.38262939453125, "global_step": 25864, "epoch": 615} {"train_loss": -5.42226505279541, "global_step": 25865, "epoch": 615} {"train_loss": -5.339543342590332, "global_step": 25866, "epoch": 615} {"train_loss": -5.499186038970947, "global_step": 25867, "epoch": 615} {"train_loss": -5.353065490722656, "global_step": 25868, "epoch": 615} {"train_loss": -5.40164852142334, "global_step": 25869, "epoch": 615} {"train_loss": -5.433408737182617, "global_step": 25870, "epoch": 615} {"train_loss": -5.408240772428966, "global_step": 25871, "epoch": 615, "val_loss": 76312.2421875} {"train_loss": -5.427548885345459, "global_step": 25872, "epoch": 616} {"train_loss": -5.410892486572266, "global_step": 25873, "epoch": 616} {"train_loss": -5.411439418792725, "global_step": 25874, "epoch": 616} {"train_loss": -5.484789848327637, "global_step": 25875, "epoch": 616} {"train_loss": -5.394139289855957, "global_step": 25876, "epoch": 616} {"train_loss": -5.460291862487793, "global_step": 25877, "epoch": 616} {"train_loss": -5.451920509338379, "global_step": 25878, "epoch": 616} {"train_loss": -5.471057891845703, "global_step": 25879, "epoch": 616} {"train_loss": -5.462578773498535, "global_step": 25880, "epoch": 616} {"train_loss": -5.425248146057129, "global_step": 25881, "epoch": 616} {"train_loss": -5.366824626922607, "global_step": 25882, "epoch": 616} {"train_loss": -5.470337867736816, "global_step": 25883, "epoch": 616} {"train_loss": -5.370699405670166, "global_step": 25884, "epoch": 616} {"train_loss": -5.39000129699707, "global_step": 25885, "epoch": 616} {"train_loss": -5.4536285400390625, "global_step": 25886, "epoch": 616} {"train_loss": -5.31906795501709, "global_step": 25887, "epoch": 616} {"train_loss": -5.414920806884766, "global_step": 25888, "epoch": 616} {"train_loss": -5.533727169036865, "global_step": 25889, "epoch": 616} {"train_loss": -5.410317420959473, "global_step": 25890, "epoch": 616} {"train_loss": -5.378382682800293, "global_step": 25891, "epoch": 616} {"train_loss": -5.264697074890137, "global_step": 25892, "epoch": 616} {"train_loss": -5.275046348571777, "global_step": 25893, "epoch": 616} {"train_loss": -5.457071304321289, "global_step": 25894, "epoch": 616} {"train_loss": -5.293774127960205, "global_step": 25895, "epoch": 616} {"train_loss": -5.329986095428467, "global_step": 25896, "epoch": 616} {"train_loss": -5.515315055847168, "global_step": 25897, "epoch": 616} {"train_loss": -5.41446590423584, "global_step": 25898, "epoch": 616} {"train_loss": -5.453432083129883, "global_step": 25899, "epoch": 616} {"train_loss": -5.3771796226501465, "global_step": 25900, "epoch": 616} {"train_loss": -5.380756378173828, "global_step": 25901, "epoch": 616} {"train_loss": -5.520707130432129, "global_step": 25902, "epoch": 616} {"train_loss": -5.273701190948486, "global_step": 25903, "epoch": 616} {"train_loss": -5.293266296386719, "global_step": 25904, "epoch": 616} {"train_loss": -5.444272041320801, "global_step": 25905, "epoch": 616} {"train_loss": -5.449501991271973, "global_step": 25906, "epoch": 616} {"train_loss": -5.350468635559082, "global_step": 25907, "epoch": 616} {"train_loss": -5.3086137771606445, "global_step": 25908, "epoch": 616} {"train_loss": -5.379599571228027, "global_step": 25909, "epoch": 616} {"train_loss": -5.432649612426758, "global_step": 25910, "epoch": 616} {"train_loss": -5.320094108581543, "global_step": 25911, "epoch": 616} {"train_loss": -5.42280912399292, "global_step": 25912, "epoch": 616} {"train_loss": -5.401725848515828, "global_step": 25913, "epoch": 616, "val_loss": 76615.8125} {"train_loss": -5.357627868652344, "global_step": 25914, "epoch": 617} {"train_loss": -5.30765438079834, "global_step": 25915, "epoch": 617} {"train_loss": -5.491913795471191, "global_step": 25916, "epoch": 617} {"train_loss": -5.365211009979248, "global_step": 25917, "epoch": 617} {"train_loss": -5.539348602294922, "global_step": 25918, "epoch": 617} {"train_loss": -5.417192459106445, "global_step": 25919, "epoch": 617} {"train_loss": -5.4564714431762695, "global_step": 25920, "epoch": 617} {"train_loss": -5.488741397857666, "global_step": 25921, "epoch": 617} {"train_loss": -5.265058994293213, "global_step": 25922, "epoch": 617} {"train_loss": -5.333189964294434, "global_step": 25923, "epoch": 617} {"train_loss": -5.364442825317383, "global_step": 25924, "epoch": 617} {"train_loss": -5.507421016693115, "global_step": 25925, "epoch": 617} {"train_loss": -5.424885272979736, "global_step": 25926, "epoch": 617} {"train_loss": -5.394407272338867, "global_step": 25927, "epoch": 617} {"train_loss": -5.495662689208984, "global_step": 25928, "epoch": 617} {"train_loss": -5.4625043869018555, "global_step": 25929, "epoch": 617} {"train_loss": -5.483495235443115, "global_step": 25930, "epoch": 617} {"train_loss": -5.470021724700928, "global_step": 25931, "epoch": 617} {"train_loss": -5.517016887664795, "global_step": 25932, "epoch": 617} {"train_loss": -5.369955062866211, "global_step": 25933, "epoch": 617} {"train_loss": -5.283850193023682, "global_step": 25934, "epoch": 617} {"train_loss": -5.565375804901123, "global_step": 25935, "epoch": 617} {"train_loss": -5.507301330566406, "global_step": 25936, "epoch": 617} {"train_loss": -5.4413652420043945, "global_step": 25937, "epoch": 617} {"train_loss": -5.417240142822266, "global_step": 25938, "epoch": 617} {"train_loss": -5.437138557434082, "global_step": 25939, "epoch": 617} {"train_loss": -5.358176231384277, "global_step": 25940, "epoch": 617} {"train_loss": -5.521754264831543, "global_step": 25941, "epoch": 617} {"train_loss": -5.4351911544799805, "global_step": 25942, "epoch": 617} {"train_loss": -5.42355489730835, "global_step": 25943, "epoch": 617} {"train_loss": -5.399694442749023, "global_step": 25944, "epoch": 617} {"train_loss": -5.429608345031738, "global_step": 25945, "epoch": 617} {"train_loss": -5.260499000549316, "global_step": 25946, "epoch": 617} {"train_loss": -5.415205955505371, "global_step": 25947, "epoch": 617} {"train_loss": -5.5247273445129395, "global_step": 25948, "epoch": 617} {"train_loss": -5.32981014251709, "global_step": 25949, "epoch": 617} {"train_loss": -5.214679718017578, "global_step": 25950, "epoch": 617} {"train_loss": -5.392922401428223, "global_step": 25951, "epoch": 617} {"train_loss": -5.460838317871094, "global_step": 25952, "epoch": 617} {"train_loss": -5.546176910400391, "global_step": 25953, "epoch": 617} {"train_loss": -5.350037097930908, "global_step": 25954, "epoch": 617} {"train_loss": -5.41930966150193, "global_step": 25955, "epoch": 617, "val_loss": 76119.9140625} {"train_loss": -5.350943088531494, "global_step": 25956, "epoch": 618} {"train_loss": -5.385248184204102, "global_step": 25957, "epoch": 618} {"train_loss": -5.3817949295043945, "global_step": 25958, "epoch": 618} {"train_loss": -5.367221832275391, "global_step": 25959, "epoch": 618} {"train_loss": -5.343082904815674, "global_step": 25960, "epoch": 618} {"train_loss": -5.448240756988525, "global_step": 25961, "epoch": 618} {"train_loss": -5.181559085845947, "global_step": 25962, "epoch": 618} {"train_loss": -5.304986000061035, "global_step": 25963, "epoch": 618} {"train_loss": -5.351572036743164, "global_step": 25964, "epoch": 618} {"train_loss": -5.392057418823242, "global_step": 25965, "epoch": 618} {"train_loss": -5.401207447052002, "global_step": 25966, "epoch": 618} {"train_loss": -5.417418956756592, "global_step": 25967, "epoch": 618} {"train_loss": -5.40986442565918, "global_step": 25968, "epoch": 618} {"train_loss": -5.474048614501953, "global_step": 25969, "epoch": 618} {"train_loss": -5.388820648193359, "global_step": 25970, "epoch": 618} {"train_loss": -5.475211143493652, "global_step": 25971, "epoch": 618} {"train_loss": -5.380816459655762, "global_step": 25972, "epoch": 618} {"train_loss": -5.536849021911621, "global_step": 25973, "epoch": 618} {"train_loss": -5.421262741088867, "global_step": 25974, "epoch": 618} {"train_loss": -5.287081241607666, "global_step": 25975, "epoch": 618} {"train_loss": -5.485354900360107, "global_step": 25976, "epoch": 618} {"train_loss": -5.2950849533081055, "global_step": 25977, "epoch": 618} {"train_loss": -5.241455554962158, "global_step": 25978, "epoch": 618} {"train_loss": -5.409524440765381, "global_step": 25979, "epoch": 618} {"train_loss": -5.082249641418457, "global_step": 25980, "epoch": 618} {"train_loss": -5.465973377227783, "global_step": 25981, "epoch": 618} {"train_loss": -5.402444839477539, "global_step": 25982, "epoch": 618} {"train_loss": -5.262787818908691, "global_step": 25983, "epoch": 618} {"train_loss": -5.2280731201171875, "global_step": 25984, "epoch": 618} {"train_loss": -5.23598575592041, "global_step": 25985, "epoch": 618} {"train_loss": -5.408591270446777, "global_step": 25986, "epoch": 618} {"train_loss": -5.350193023681641, "global_step": 25987, "epoch": 618} {"train_loss": -5.422642707824707, "global_step": 25988, "epoch": 618} {"train_loss": -5.285893440246582, "global_step": 25989, "epoch": 618} {"train_loss": -5.470108985900879, "global_step": 25990, "epoch": 618} {"train_loss": -5.411738395690918, "global_step": 25991, "epoch": 618} {"train_loss": -5.330906867980957, "global_step": 25992, "epoch": 618} {"train_loss": -5.345507621765137, "global_step": 25993, "epoch": 618} {"train_loss": -5.430333137512207, "global_step": 25994, "epoch": 618} {"train_loss": -5.297051429748535, "global_step": 25995, "epoch": 618} {"train_loss": -5.37302303314209, "global_step": 25996, "epoch": 618} {"train_loss": -5.366075186502366, "global_step": 25997, "epoch": 618, "val_loss": 75807.2109375} {"train_loss": -5.386234283447266, "global_step": 25998, "epoch": 619} {"train_loss": -5.361365795135498, "global_step": 25999, "epoch": 619} {"train_loss": -5.504338264465332, "global_step": 26000, "epoch": 619} {"train_loss": -5.306500434875488, "global_step": 26001, "epoch": 619} {"train_loss": -5.481417655944824, "global_step": 26002, "epoch": 619} {"train_loss": -5.438926696777344, "global_step": 26003, "epoch": 619} {"train_loss": -5.4175238609313965, "global_step": 26004, "epoch": 619} {"train_loss": -5.321765422821045, "global_step": 26005, "epoch": 619} {"train_loss": -5.349728584289551, "global_step": 26006, "epoch": 619} {"train_loss": -5.48549222946167, "global_step": 26007, "epoch": 619} {"train_loss": -5.323827743530273, "global_step": 26008, "epoch": 619} {"train_loss": -5.458481788635254, "global_step": 26009, "epoch": 619} {"train_loss": -5.362578392028809, "global_step": 26010, "epoch": 619} {"train_loss": -5.198460578918457, "global_step": 26011, "epoch": 619} {"train_loss": -5.48878288269043, "global_step": 26012, "epoch": 619} {"train_loss": -5.574798583984375, "global_step": 26013, "epoch": 619} {"train_loss": -5.364428520202637, "global_step": 26014, "epoch": 619} {"train_loss": -5.424220085144043, "global_step": 26015, "epoch": 619} {"train_loss": -5.366578102111816, "global_step": 26016, "epoch": 619} {"train_loss": -5.4476423263549805, "global_step": 26017, "epoch": 619} {"train_loss": -5.415412902832031, "global_step": 26018, "epoch": 619} {"train_loss": -5.503705024719238, "global_step": 26019, "epoch": 619} {"train_loss": -5.3508758544921875, "global_step": 26020, "epoch": 619} {"train_loss": -5.425522327423096, "global_step": 26021, "epoch": 619} {"train_loss": -5.37042760848999, "global_step": 26022, "epoch": 619} {"train_loss": -5.218845844268799, "global_step": 26023, "epoch": 619} {"train_loss": -5.350062370300293, "global_step": 26024, "epoch": 619} {"train_loss": -5.336683750152588, "global_step": 26025, "epoch": 619} {"train_loss": -5.3961501121521, "global_step": 26026, "epoch": 619} {"train_loss": -5.417135715484619, "global_step": 26027, "epoch": 619} {"train_loss": -5.316191673278809, "global_step": 26028, "epoch": 619} {"train_loss": -5.243659019470215, "global_step": 26029, "epoch": 619} {"train_loss": -5.488463401794434, "global_step": 26030, "epoch": 619} {"train_loss": -5.249532222747803, "global_step": 26031, "epoch": 619} {"train_loss": -5.503758430480957, "global_step": 26032, "epoch": 619} {"train_loss": -5.366168022155762, "global_step": 26033, "epoch": 619} {"train_loss": -5.460372447967529, "global_step": 26034, "epoch": 619} {"train_loss": -5.31649112701416, "global_step": 26035, "epoch": 619} {"train_loss": -5.366198539733887, "global_step": 26036, "epoch": 619} {"train_loss": -5.491045951843262, "global_step": 26037, "epoch": 619} {"train_loss": -5.306013107299805, "global_step": 26038, "epoch": 619} {"train_loss": -5.3910710243951705, "global_step": 26039, "epoch": 619, "val_loss": 75998.5546875} {"train_loss": -5.424070835113525, "global_step": 26040, "epoch": 620} {"train_loss": -5.50643253326416, "global_step": 26041, "epoch": 620} {"train_loss": -5.386934757232666, "global_step": 26042, "epoch": 620} {"train_loss": -5.466231346130371, "global_step": 26043, "epoch": 620} {"train_loss": -5.322868347167969, "global_step": 26044, "epoch": 620} {"train_loss": -5.373075008392334, "global_step": 26045, "epoch": 620} {"train_loss": -5.341279983520508, "global_step": 26046, "epoch": 620} {"train_loss": -5.274083137512207, "global_step": 26047, "epoch": 620} {"train_loss": -5.4179606437683105, "global_step": 26048, "epoch": 620} {"train_loss": -5.529390811920166, "global_step": 26049, "epoch": 620} {"train_loss": -5.361632347106934, "global_step": 26050, "epoch": 620} {"train_loss": -5.301873683929443, "global_step": 26051, "epoch": 620} {"train_loss": -5.383871555328369, "global_step": 26052, "epoch": 620} {"train_loss": -5.4389495849609375, "global_step": 26053, "epoch": 620} {"train_loss": -5.474267959594727, "global_step": 26054, "epoch": 620} {"train_loss": -5.392975807189941, "global_step": 26055, "epoch": 620} {"train_loss": -5.4157514572143555, "global_step": 26056, "epoch": 620} {"train_loss": -5.362792015075684, "global_step": 26057, "epoch": 620} {"train_loss": -5.313364028930664, "global_step": 26058, "epoch": 620} {"train_loss": -5.388729572296143, "global_step": 26059, "epoch": 620} {"train_loss": -5.241178512573242, "global_step": 26060, "epoch": 620} {"train_loss": -5.213956832885742, "global_step": 26061, "epoch": 620} {"train_loss": -5.378178119659424, "global_step": 26062, "epoch": 620} {"train_loss": -5.136305809020996, "global_step": 26063, "epoch": 620} {"train_loss": -5.328282833099365, "global_step": 26064, "epoch": 620} {"train_loss": -5.305973052978516, "global_step": 26065, "epoch": 620} {"train_loss": -5.185519218444824, "global_step": 26066, "epoch": 620} {"train_loss": -5.227574825286865, "global_step": 26067, "epoch": 620} {"train_loss": -5.20155668258667, "global_step": 26068, "epoch": 620} {"train_loss": -5.236384868621826, "global_step": 26069, "epoch": 620} {"train_loss": -5.069022178649902, "global_step": 26070, "epoch": 620} {"train_loss": -5.480701446533203, "global_step": 26071, "epoch": 620} {"train_loss": -5.1032891273498535, "global_step": 26072, "epoch": 620} {"train_loss": -5.366086483001709, "global_step": 26073, "epoch": 620} {"train_loss": -5.276897430419922, "global_step": 26074, "epoch": 620} {"train_loss": -5.33286190032959, "global_step": 26075, "epoch": 620} {"train_loss": -5.485783576965332, "global_step": 26076, "epoch": 620} {"train_loss": -5.340585708618164, "global_step": 26077, "epoch": 620} {"train_loss": -5.422846794128418, "global_step": 26078, "epoch": 620} {"train_loss": -5.423989295959473, "global_step": 26079, "epoch": 620} {"train_loss": -5.364656925201416, "global_step": 26080, "epoch": 620} {"train_loss": -5.34545696349371, "global_step": 26081, "epoch": 620, "val_loss": 76070.8359375} {"train_loss": -5.374493598937988, "global_step": 26082, "epoch": 621} {"train_loss": -5.472536087036133, "global_step": 26083, "epoch": 621} {"train_loss": -5.235990524291992, "global_step": 26084, "epoch": 621} {"train_loss": -5.32868766784668, "global_step": 26085, "epoch": 621} {"train_loss": -5.550589561462402, "global_step": 26086, "epoch": 621} {"train_loss": -5.495930194854736, "global_step": 26087, "epoch": 621} {"train_loss": -5.399752140045166, "global_step": 26088, "epoch": 621} {"train_loss": -5.4690632820129395, "global_step": 26089, "epoch": 621} {"train_loss": -5.394931793212891, "global_step": 26090, "epoch": 621} {"train_loss": -5.437928676605225, "global_step": 26091, "epoch": 621} {"train_loss": -5.38236665725708, "global_step": 26092, "epoch": 621} {"train_loss": -5.445525169372559, "global_step": 26093, "epoch": 621} {"train_loss": -5.263808250427246, "global_step": 26094, "epoch": 621} {"train_loss": -5.359371185302734, "global_step": 26095, "epoch": 621} {"train_loss": -5.218935966491699, "global_step": 26096, "epoch": 621} {"train_loss": -5.243793487548828, "global_step": 26097, "epoch": 621} {"train_loss": -5.32582950592041, "global_step": 26098, "epoch": 621} {"train_loss": -5.289058685302734, "global_step": 26099, "epoch": 621} {"train_loss": -5.324619293212891, "global_step": 26100, "epoch": 621} {"train_loss": -5.353457450866699, "global_step": 26101, "epoch": 621} {"train_loss": -5.374405860900879, "global_step": 26102, "epoch": 621} {"train_loss": -5.351963996887207, "global_step": 26103, "epoch": 621} {"train_loss": -5.336824893951416, "global_step": 26104, "epoch": 621} {"train_loss": -5.282580375671387, "global_step": 26105, "epoch": 621} {"train_loss": -5.412369728088379, "global_step": 26106, "epoch": 621} {"train_loss": -5.199709415435791, "global_step": 26107, "epoch": 621} {"train_loss": -5.3369550704956055, "global_step": 26108, "epoch": 621} {"train_loss": -5.374050140380859, "global_step": 26109, "epoch": 621} {"train_loss": -5.2622480392456055, "global_step": 26110, "epoch": 621} {"train_loss": -5.340517044067383, "global_step": 26111, "epoch": 621} {"train_loss": -5.203178405761719, "global_step": 26112, "epoch": 621} {"train_loss": -5.384442329406738, "global_step": 26113, "epoch": 621} {"train_loss": -5.261092185974121, "global_step": 26114, "epoch": 621} {"train_loss": -5.357449531555176, "global_step": 26115, "epoch": 621} {"train_loss": -5.229203224182129, "global_step": 26116, "epoch": 621} {"train_loss": -5.296315670013428, "global_step": 26117, "epoch": 621} {"train_loss": -5.372931480407715, "global_step": 26118, "epoch": 621} {"train_loss": -5.352831840515137, "global_step": 26119, "epoch": 621} {"train_loss": -5.294073104858398, "global_step": 26120, "epoch": 621} {"train_loss": -5.18040657043457, "global_step": 26121, "epoch": 621} {"train_loss": -5.37421178817749, "global_step": 26122, "epoch": 621} {"train_loss": -5.340530088969639, "global_step": 26123, "epoch": 621, "val_loss": 77196.171875} {"train_loss": -5.356679439544678, "global_step": 26124, "epoch": 622} {"train_loss": -5.417057037353516, "global_step": 26125, "epoch": 622} {"train_loss": -5.507115364074707, "global_step": 26126, "epoch": 622} {"train_loss": -5.457756519317627, "global_step": 26127, "epoch": 622} {"train_loss": -5.450874328613281, "global_step": 26128, "epoch": 622} {"train_loss": -5.474177360534668, "global_step": 26129, "epoch": 622} {"train_loss": -5.269711017608643, "global_step": 26130, "epoch": 622} {"train_loss": -5.355316162109375, "global_step": 26131, "epoch": 622} {"train_loss": -5.394094467163086, "global_step": 26132, "epoch": 622} {"train_loss": -5.318624496459961, "global_step": 26133, "epoch": 622} {"train_loss": -5.3927788734436035, "global_step": 26134, "epoch": 622} {"train_loss": -5.2903642654418945, "global_step": 26135, "epoch": 622} {"train_loss": -5.267642021179199, "global_step": 26136, "epoch": 622} {"train_loss": -5.2622833251953125, "global_step": 26137, "epoch": 622} {"train_loss": -5.252685546875, "global_step": 26138, "epoch": 622} {"train_loss": -5.289732933044434, "global_step": 26139, "epoch": 622} {"train_loss": -5.195941925048828, "global_step": 26140, "epoch": 622} {"train_loss": -5.480607032775879, "global_step": 26141, "epoch": 622} {"train_loss": -5.208034992218018, "global_step": 26142, "epoch": 622} {"train_loss": -5.407659530639648, "global_step": 26143, "epoch": 622} {"train_loss": -5.409287929534912, "global_step": 26144, "epoch": 622} {"train_loss": -5.385141372680664, "global_step": 26145, "epoch": 622} {"train_loss": -5.4344096183776855, "global_step": 26146, "epoch": 622} {"train_loss": -5.386784553527832, "global_step": 26147, "epoch": 622} {"train_loss": -5.352424621582031, "global_step": 26148, "epoch": 622} {"train_loss": -5.337918758392334, "global_step": 26149, "epoch": 622} {"train_loss": -5.4787445068359375, "global_step": 26150, "epoch": 622} {"train_loss": -5.512990951538086, "global_step": 26151, "epoch": 622} {"train_loss": -5.379698753356934, "global_step": 26152, "epoch": 622} {"train_loss": -5.44483757019043, "global_step": 26153, "epoch": 622} {"train_loss": -5.471053123474121, "global_step": 26154, "epoch": 622} {"train_loss": -5.373331546783447, "global_step": 26155, "epoch": 622} {"train_loss": -5.340534210205078, "global_step": 26156, "epoch": 622} {"train_loss": -5.376044273376465, "global_step": 26157, "epoch": 622} {"train_loss": -5.400673866271973, "global_step": 26158, "epoch": 622} {"train_loss": -5.489779472351074, "global_step": 26159, "epoch": 622} {"train_loss": -5.49204158782959, "global_step": 26160, "epoch": 622} {"train_loss": -5.36491060256958, "global_step": 26161, "epoch": 622} {"train_loss": -5.382993698120117, "global_step": 26162, "epoch": 622} {"train_loss": -5.179460525512695, "global_step": 26163, "epoch": 622} {"train_loss": -5.663326263427734, "global_step": 26164, "epoch": 622} {"train_loss": -5.38357736950829, "global_step": 26165, "epoch": 622, "val_loss": 76777.140625} {"train_loss": -5.316961288452148, "global_step": 26166, "epoch": 623} {"train_loss": -5.459648132324219, "global_step": 26167, "epoch": 623} {"train_loss": -5.449196815490723, "global_step": 26168, "epoch": 623} {"train_loss": -5.454623222351074, "global_step": 26169, "epoch": 623} {"train_loss": -5.532620429992676, "global_step": 26170, "epoch": 623} {"train_loss": -5.358272075653076, "global_step": 26171, "epoch": 623} {"train_loss": -5.393618583679199, "global_step": 26172, "epoch": 623} {"train_loss": -5.366848945617676, "global_step": 26173, "epoch": 623} {"train_loss": -5.463722229003906, "global_step": 26174, "epoch": 623} {"train_loss": -5.351221561431885, "global_step": 26175, "epoch": 623} {"train_loss": -5.441983222961426, "global_step": 26176, "epoch": 623} {"train_loss": -5.576091766357422, "global_step": 26177, "epoch": 623} {"train_loss": -5.4305853843688965, "global_step": 26178, "epoch": 623} {"train_loss": -5.451774597167969, "global_step": 26179, "epoch": 623} {"train_loss": -5.378415107727051, "global_step": 26180, "epoch": 623} {"train_loss": -5.5081377029418945, "global_step": 26181, "epoch": 623} {"train_loss": -5.254929542541504, "global_step": 26182, "epoch": 623} {"train_loss": -5.514474391937256, "global_step": 26183, "epoch": 623} {"train_loss": -5.459153175354004, "global_step": 26184, "epoch": 623} {"train_loss": -5.323949813842773, "global_step": 26185, "epoch": 623} {"train_loss": -5.364009380340576, "global_step": 26186, "epoch": 623} {"train_loss": -5.336565971374512, "global_step": 26187, "epoch": 623} {"train_loss": -5.333683967590332, "global_step": 26188, "epoch": 623} {"train_loss": -5.54939079284668, "global_step": 26189, "epoch": 623} {"train_loss": -5.458322525024414, "global_step": 26190, "epoch": 623} {"train_loss": -5.393764972686768, "global_step": 26191, "epoch": 623} {"train_loss": -5.309018611907959, "global_step": 26192, "epoch": 623} {"train_loss": -5.438877105712891, "global_step": 26193, "epoch": 623} {"train_loss": -5.362725734710693, "global_step": 26194, "epoch": 623} {"train_loss": -5.453793525695801, "global_step": 26195, "epoch": 623} {"train_loss": -5.425115585327148, "global_step": 26196, "epoch": 623} {"train_loss": -5.423748016357422, "global_step": 26197, "epoch": 623} {"train_loss": -5.445633411407471, "global_step": 26198, "epoch": 623} {"train_loss": -5.388976097106934, "global_step": 26199, "epoch": 623} {"train_loss": -5.440793514251709, "global_step": 26200, "epoch": 623} {"train_loss": -5.445286750793457, "global_step": 26201, "epoch": 623} {"train_loss": -5.396764278411865, "global_step": 26202, "epoch": 623} {"train_loss": -5.369532585144043, "global_step": 26203, "epoch": 623} {"train_loss": -5.278982162475586, "global_step": 26204, "epoch": 623} {"train_loss": -5.34019660949707, "global_step": 26205, "epoch": 623} {"train_loss": -5.474046230316162, "global_step": 26206, "epoch": 623} {"train_loss": -5.414122138704572, "global_step": 26207, "epoch": 623, "val_loss": 76074.171875} {"train_loss": -5.4664154052734375, "global_step": 26208, "epoch": 624} {"train_loss": -5.334432601928711, "global_step": 26209, "epoch": 624} {"train_loss": -5.332039833068848, "global_step": 26210, "epoch": 624} {"train_loss": -5.386476993560791, "global_step": 26211, "epoch": 624} {"train_loss": -5.40199613571167, "global_step": 26212, "epoch": 624} {"train_loss": -5.313152313232422, "global_step": 26213, "epoch": 624} {"train_loss": -5.360019207000732, "global_step": 26214, "epoch": 624} {"train_loss": -5.415826320648193, "global_step": 26215, "epoch": 624} {"train_loss": -5.354021072387695, "global_step": 26216, "epoch": 624} {"train_loss": -5.370585918426514, "global_step": 26217, "epoch": 624} {"train_loss": -5.509115219116211, "global_step": 26218, "epoch": 624} {"train_loss": -5.391201972961426, "global_step": 26219, "epoch": 624} {"train_loss": -5.423190116882324, "global_step": 26220, "epoch": 624} {"train_loss": -5.3179426193237305, "global_step": 26221, "epoch": 624} {"train_loss": -5.439763069152832, "global_step": 26222, "epoch": 624} {"train_loss": -5.449766159057617, "global_step": 26223, "epoch": 624} {"train_loss": -5.624753475189209, "global_step": 26224, "epoch": 624} {"train_loss": -5.183210372924805, "global_step": 26225, "epoch": 624} {"train_loss": -5.306698799133301, "global_step": 26226, "epoch": 624} {"train_loss": -5.444819927215576, "global_step": 26227, "epoch": 624} {"train_loss": -5.527660369873047, "global_step": 26228, "epoch": 624} {"train_loss": -5.443558692932129, "global_step": 26229, "epoch": 624} {"train_loss": -5.565147876739502, "global_step": 26230, "epoch": 624} {"train_loss": -5.525679111480713, "global_step": 26231, "epoch": 624} {"train_loss": -5.362759113311768, "global_step": 26232, "epoch": 624} {"train_loss": -5.52071475982666, "global_step": 26233, "epoch": 624} {"train_loss": -5.541831016540527, "global_step": 26234, "epoch": 624} {"train_loss": -5.378829002380371, "global_step": 26235, "epoch": 624} {"train_loss": -5.385734558105469, "global_step": 26236, "epoch": 624} {"train_loss": -5.544543266296387, "global_step": 26237, "epoch": 624} {"train_loss": -5.520044803619385, "global_step": 26238, "epoch": 624} {"train_loss": -5.3424272537231445, "global_step": 26239, "epoch": 624} {"train_loss": -5.333467483520508, "global_step": 26240, "epoch": 624} {"train_loss": -5.453006744384766, "global_step": 26241, "epoch": 624} {"train_loss": -5.355862617492676, "global_step": 26242, "epoch": 624} {"train_loss": -5.49928092956543, "global_step": 26243, "epoch": 624} {"train_loss": -5.4220123291015625, "global_step": 26244, "epoch": 624} {"train_loss": -5.1054911613464355, "global_step": 26245, "epoch": 624} {"train_loss": -5.340880393981934, "global_step": 26246, "epoch": 624} {"train_loss": -5.402792930603027, "global_step": 26247, "epoch": 624} {"train_loss": -5.323350429534912, "global_step": 26248, "epoch": 624} {"train_loss": -5.4043385074252175, "global_step": 26249, "epoch": 624, "val_loss": 76569.109375} {"train_loss": -5.404851913452148, "global_step": 26250, "epoch": 625} {"train_loss": -5.168482780456543, "global_step": 26251, "epoch": 625} {"train_loss": -5.3093109130859375, "global_step": 26252, "epoch": 625} {"train_loss": -5.316278457641602, "global_step": 26253, "epoch": 625} {"train_loss": -5.329395294189453, "global_step": 26254, "epoch": 625} {"train_loss": -5.468031883239746, "global_step": 26255, "epoch": 625} {"train_loss": -5.312038421630859, "global_step": 26256, "epoch": 625} {"train_loss": -5.291075706481934, "global_step": 26257, "epoch": 625} {"train_loss": -5.406074047088623, "global_step": 26258, "epoch": 625} {"train_loss": -5.459598064422607, "global_step": 26259, "epoch": 625} {"train_loss": -5.362168788909912, "global_step": 26260, "epoch": 625} {"train_loss": -5.344142913818359, "global_step": 26261, "epoch": 625} {"train_loss": -5.333008766174316, "global_step": 26262, "epoch": 625} {"train_loss": -5.435558319091797, "global_step": 26263, "epoch": 625} {"train_loss": -5.416685104370117, "global_step": 26264, "epoch": 625} {"train_loss": -5.413318634033203, "global_step": 26265, "epoch": 625} {"train_loss": -5.5612945556640625, "global_step": 26266, "epoch": 625} {"train_loss": -5.283868312835693, "global_step": 26267, "epoch": 625} {"train_loss": -5.420214653015137, "global_step": 26268, "epoch": 625} {"train_loss": -5.342751502990723, "global_step": 26269, "epoch": 625} {"train_loss": -5.314268112182617, "global_step": 26270, "epoch": 625} {"train_loss": -5.454683780670166, "global_step": 26271, "epoch": 625} {"train_loss": -5.431462287902832, "global_step": 26272, "epoch": 625} {"train_loss": -5.474689960479736, "global_step": 26273, "epoch": 625} {"train_loss": -5.490391731262207, "global_step": 26274, "epoch": 625} {"train_loss": -5.400467395782471, "global_step": 26275, "epoch": 625} {"train_loss": -5.313852787017822, "global_step": 26276, "epoch": 625} {"train_loss": -5.432754039764404, "global_step": 26277, "epoch": 625} {"train_loss": -5.489048957824707, "global_step": 26278, "epoch": 625} {"train_loss": -5.392223358154297, "global_step": 26279, "epoch": 625} {"train_loss": -5.532410621643066, "global_step": 26280, "epoch": 625} {"train_loss": -5.424473762512207, "global_step": 26281, "epoch": 625} {"train_loss": -5.407127380371094, "global_step": 26282, "epoch": 625} {"train_loss": -5.532532691955566, "global_step": 26283, "epoch": 625} {"train_loss": -5.327776908874512, "global_step": 26284, "epoch": 625} {"train_loss": -5.353359699249268, "global_step": 26285, "epoch": 625} {"train_loss": -5.542398452758789, "global_step": 26286, "epoch": 625} {"train_loss": -5.373501777648926, "global_step": 26287, "epoch": 625} {"train_loss": -5.353160381317139, "global_step": 26288, "epoch": 625} {"train_loss": -5.429911136627197, "global_step": 26289, "epoch": 625} {"train_loss": -5.4182233810424805, "global_step": 26290, "epoch": 625} {"train_loss": -5.395932208924067, "global_step": 26291, "epoch": 625, "val_loss": 75914.453125} {"train_loss": -5.308915138244629, "global_step": 26292, "epoch": 626} {"train_loss": -5.419051170349121, "global_step": 26293, "epoch": 626} {"train_loss": -5.4963884353637695, "global_step": 26294, "epoch": 626} {"train_loss": -5.341196060180664, "global_step": 26295, "epoch": 626} {"train_loss": -5.380123138427734, "global_step": 26296, "epoch": 626} {"train_loss": -5.319391250610352, "global_step": 26297, "epoch": 626} {"train_loss": -5.375312805175781, "global_step": 26298, "epoch": 626} {"train_loss": -5.492595672607422, "global_step": 26299, "epoch": 626} {"train_loss": -5.430878639221191, "global_step": 26300, "epoch": 626} {"train_loss": -5.40447998046875, "global_step": 26301, "epoch": 626} {"train_loss": -5.409682273864746, "global_step": 26302, "epoch": 626} {"train_loss": -5.4630632400512695, "global_step": 26303, "epoch": 626} {"train_loss": -5.458800315856934, "global_step": 26304, "epoch": 626} {"train_loss": -5.385384559631348, "global_step": 26305, "epoch": 626} {"train_loss": -5.348560333251953, "global_step": 26306, "epoch": 626} {"train_loss": -5.442660331726074, "global_step": 26307, "epoch": 626} {"train_loss": -5.317414283752441, "global_step": 26308, "epoch": 626} {"train_loss": -5.482779026031494, "global_step": 26309, "epoch": 626} {"train_loss": -5.342312335968018, "global_step": 26310, "epoch": 626} {"train_loss": -5.344393730163574, "global_step": 26311, "epoch": 626} {"train_loss": -5.51921272277832, "global_step": 26312, "epoch": 626} {"train_loss": -5.379688739776611, "global_step": 26313, "epoch": 626} {"train_loss": -5.380245208740234, "global_step": 26314, "epoch": 626} {"train_loss": -5.475543022155762, "global_step": 26315, "epoch": 626} {"train_loss": -5.411347389221191, "global_step": 26316, "epoch": 626} {"train_loss": -5.512659072875977, "global_step": 26317, "epoch": 626} {"train_loss": -5.469944477081299, "global_step": 26318, "epoch": 626} {"train_loss": -5.478649139404297, "global_step": 26319, "epoch": 626} {"train_loss": -5.472958564758301, "global_step": 26320, "epoch": 626} {"train_loss": -5.307063102722168, "global_step": 26321, "epoch": 626} {"train_loss": -5.47448205947876, "global_step": 26322, "epoch": 626} {"train_loss": -5.441619396209717, "global_step": 26323, "epoch": 626} {"train_loss": -5.359338283538818, "global_step": 26324, "epoch": 626} {"train_loss": -5.362483024597168, "global_step": 26325, "epoch": 626} {"train_loss": -5.44086217880249, "global_step": 26326, "epoch": 626} {"train_loss": -5.491196632385254, "global_step": 26327, "epoch": 626} {"train_loss": -5.307258605957031, "global_step": 26328, "epoch": 626} {"train_loss": -5.440582752227783, "global_step": 26329, "epoch": 626} {"train_loss": -5.331125259399414, "global_step": 26330, "epoch": 626} {"train_loss": -5.311459541320801, "global_step": 26331, "epoch": 626} {"train_loss": -5.450037002563477, "global_step": 26332, "epoch": 626} {"train_loss": -5.408850317909604, "global_step": 26333, "epoch": 626, "val_loss": 75928.7109375} {"train_loss": -5.421605110168457, "global_step": 26334, "epoch": 627} {"train_loss": -5.372311592102051, "global_step": 26335, "epoch": 627} {"train_loss": -5.453097343444824, "global_step": 26336, "epoch": 627} {"train_loss": -5.329525947570801, "global_step": 26337, "epoch": 627} {"train_loss": -5.4572434425354, "global_step": 26338, "epoch": 627} {"train_loss": -5.40350341796875, "global_step": 26339, "epoch": 627} {"train_loss": -5.537345886230469, "global_step": 26340, "epoch": 627} {"train_loss": -5.472918510437012, "global_step": 26341, "epoch": 627} {"train_loss": -5.45705509185791, "global_step": 26342, "epoch": 627} {"train_loss": -5.451231479644775, "global_step": 26343, "epoch": 627} {"train_loss": -5.401449203491211, "global_step": 26344, "epoch": 627} {"train_loss": -5.454029083251953, "global_step": 26345, "epoch": 627} {"train_loss": -5.443700790405273, "global_step": 26346, "epoch": 627} {"train_loss": -5.430169105529785, "global_step": 26347, "epoch": 627} {"train_loss": -5.348574161529541, "global_step": 26348, "epoch": 627} {"train_loss": -5.484715938568115, "global_step": 26349, "epoch": 627} {"train_loss": -5.371688365936279, "global_step": 26350, "epoch": 627} {"train_loss": -5.440598964691162, "global_step": 26351, "epoch": 627} {"train_loss": -5.416928291320801, "global_step": 26352, "epoch": 627} {"train_loss": -5.481523513793945, "global_step": 26353, "epoch": 627} {"train_loss": -5.360907554626465, "global_step": 26354, "epoch": 627} {"train_loss": -5.342750072479248, "global_step": 26355, "epoch": 627} {"train_loss": -5.4666972160339355, "global_step": 26356, "epoch": 627} {"train_loss": -5.2889299392700195, "global_step": 26357, "epoch": 627} {"train_loss": -5.433215141296387, "global_step": 26358, "epoch": 627} {"train_loss": -5.314122200012207, "global_step": 26359, "epoch": 627} {"train_loss": -5.369419097900391, "global_step": 26360, "epoch": 627} {"train_loss": -5.4317474365234375, "global_step": 26361, "epoch": 627} {"train_loss": -5.420070648193359, "global_step": 26362, "epoch": 627} {"train_loss": -5.297947883605957, "global_step": 26363, "epoch": 627} {"train_loss": -5.389779090881348, "global_step": 26364, "epoch": 627} {"train_loss": -5.213940620422363, "global_step": 26365, "epoch": 627} {"train_loss": -5.3317718505859375, "global_step": 26366, "epoch": 627} {"train_loss": -5.397217273712158, "global_step": 26367, "epoch": 627} {"train_loss": -5.242777347564697, "global_step": 26368, "epoch": 627} {"train_loss": -5.412482738494873, "global_step": 26369, "epoch": 627} {"train_loss": -5.178425312042236, "global_step": 26370, "epoch": 627} {"train_loss": -5.455503463745117, "global_step": 26371, "epoch": 627} {"train_loss": -5.252819061279297, "global_step": 26372, "epoch": 627} {"train_loss": -5.408208847045898, "global_step": 26373, "epoch": 627} {"train_loss": -5.383906364440918, "global_step": 26374, "epoch": 627} {"train_loss": -5.386743579592023, "global_step": 26375, "epoch": 627, "val_loss": 76358.03125} {"train_loss": -5.367361545562744, "global_step": 26376, "epoch": 628} {"train_loss": -5.432290554046631, "global_step": 26377, "epoch": 628} {"train_loss": -5.396740436553955, "global_step": 26378, "epoch": 628} {"train_loss": -5.407155990600586, "global_step": 26379, "epoch": 628} {"train_loss": -5.45865535736084, "global_step": 26380, "epoch": 628} {"train_loss": -5.413617134094238, "global_step": 26381, "epoch": 628} {"train_loss": -5.513735294342041, "global_step": 26382, "epoch": 628} {"train_loss": -5.330286026000977, "global_step": 26383, "epoch": 628} {"train_loss": -5.487025260925293, "global_step": 26384, "epoch": 628} {"train_loss": -5.503020763397217, "global_step": 26385, "epoch": 628} {"train_loss": -5.313460350036621, "global_step": 26386, "epoch": 628} {"train_loss": -5.442264556884766, "global_step": 26387, "epoch": 628} {"train_loss": -5.387345314025879, "global_step": 26388, "epoch": 628} {"train_loss": -5.377678871154785, "global_step": 26389, "epoch": 628} {"train_loss": -5.401411056518555, "global_step": 26390, "epoch": 628} {"train_loss": -5.459144115447998, "global_step": 26391, "epoch": 628} {"train_loss": -5.544923782348633, "global_step": 26392, "epoch": 628} {"train_loss": -5.4076972007751465, "global_step": 26393, "epoch": 628} {"train_loss": -5.534399032592773, "global_step": 26394, "epoch": 628} {"train_loss": -5.5121378898620605, "global_step": 26395, "epoch": 628} {"train_loss": -5.393675327301025, "global_step": 26396, "epoch": 628} {"train_loss": -5.430608749389648, "global_step": 26397, "epoch": 628} {"train_loss": -5.356642723083496, "global_step": 26398, "epoch": 628} {"train_loss": -5.497502326965332, "global_step": 26399, "epoch": 628} {"train_loss": -5.394528865814209, "global_step": 26400, "epoch": 628} {"train_loss": -5.360684871673584, "global_step": 26401, "epoch": 628} {"train_loss": -5.4292449951171875, "global_step": 26402, "epoch": 628} {"train_loss": -5.3922529220581055, "global_step": 26403, "epoch": 628} {"train_loss": -5.492247581481934, "global_step": 26404, "epoch": 628} {"train_loss": -5.410421371459961, "global_step": 26405, "epoch": 628} {"train_loss": -5.541603088378906, "global_step": 26406, "epoch": 628} {"train_loss": -5.452059268951416, "global_step": 26407, "epoch": 628} {"train_loss": -5.354887962341309, "global_step": 26408, "epoch": 628} {"train_loss": -5.336760520935059, "global_step": 26409, "epoch": 628} {"train_loss": -5.488381385803223, "global_step": 26410, "epoch": 628} {"train_loss": -5.318140983581543, "global_step": 26411, "epoch": 628} {"train_loss": -5.392261505126953, "global_step": 26412, "epoch": 628} {"train_loss": -5.468669414520264, "global_step": 26413, "epoch": 628} {"train_loss": -5.405170440673828, "global_step": 26414, "epoch": 628} {"train_loss": -5.311499118804932, "global_step": 26415, "epoch": 628} {"train_loss": -5.470513343811035, "global_step": 26416, "epoch": 628} {"train_loss": -5.425967840921311, "global_step": 26417, "epoch": 628, "val_loss": 75671.4765625} {"train_loss": -5.578205108642578, "global_step": 26418, "epoch": 629} {"train_loss": -5.393479347229004, "global_step": 26419, "epoch": 629} {"train_loss": -5.279530048370361, "global_step": 26420, "epoch": 629} {"train_loss": -5.509435653686523, "global_step": 26421, "epoch": 629} {"train_loss": -5.477490425109863, "global_step": 26422, "epoch": 629} {"train_loss": -5.393113613128662, "global_step": 26423, "epoch": 629} {"train_loss": -5.389464378356934, "global_step": 26424, "epoch": 629} {"train_loss": -5.488676071166992, "global_step": 26425, "epoch": 629} {"train_loss": -5.4649658203125, "global_step": 26426, "epoch": 629} {"train_loss": -5.373863220214844, "global_step": 26427, "epoch": 629} {"train_loss": -5.430706977844238, "global_step": 26428, "epoch": 629} {"train_loss": -5.376124382019043, "global_step": 26429, "epoch": 629} {"train_loss": -5.4178009033203125, "global_step": 26430, "epoch": 629} {"train_loss": -5.456146717071533, "global_step": 26431, "epoch": 629} {"train_loss": -5.45950984954834, "global_step": 26432, "epoch": 629} {"train_loss": -5.496696472167969, "global_step": 26433, "epoch": 629} {"train_loss": -5.39139461517334, "global_step": 26434, "epoch": 629} {"train_loss": -5.379948616027832, "global_step": 26435, "epoch": 629} {"train_loss": -5.408772945404053, "global_step": 26436, "epoch": 629} {"train_loss": -5.3694915771484375, "global_step": 26437, "epoch": 629} {"train_loss": -5.321793079376221, "global_step": 26438, "epoch": 629} {"train_loss": -5.480205059051514, "global_step": 26439, "epoch": 629} {"train_loss": -5.399109840393066, "global_step": 26440, "epoch": 629} {"train_loss": -5.352246284484863, "global_step": 26441, "epoch": 629} {"train_loss": -5.496946334838867, "global_step": 26442, "epoch": 629} {"train_loss": -5.351846218109131, "global_step": 26443, "epoch": 629} {"train_loss": -5.5193963050842285, "global_step": 26444, "epoch": 629} {"train_loss": -5.428767204284668, "global_step": 26445, "epoch": 629} {"train_loss": -5.481809139251709, "global_step": 26446, "epoch": 629} {"train_loss": -5.354241371154785, "global_step": 26447, "epoch": 629} {"train_loss": -5.39713191986084, "global_step": 26448, "epoch": 629} {"train_loss": -5.3713884353637695, "global_step": 26449, "epoch": 629} {"train_loss": -5.337658882141113, "global_step": 26450, "epoch": 629} {"train_loss": -5.415932655334473, "global_step": 26451, "epoch": 629} {"train_loss": -5.3716583251953125, "global_step": 26452, "epoch": 629} {"train_loss": -5.541342735290527, "global_step": 26453, "epoch": 629} {"train_loss": -5.470522880554199, "global_step": 26454, "epoch": 629} {"train_loss": -5.567244529724121, "global_step": 26455, "epoch": 629} {"train_loss": -5.40130090713501, "global_step": 26456, "epoch": 629} {"train_loss": -5.383685111999512, "global_step": 26457, "epoch": 629} {"train_loss": -5.427018165588379, "global_step": 26458, "epoch": 629} {"train_loss": -5.42351237932841, "global_step": 26459, "epoch": 629, "val_loss": 76414.6640625} {"train_loss": -5.326886177062988, "global_step": 26460, "epoch": 630} {"train_loss": -5.407350540161133, "global_step": 26461, "epoch": 630} {"train_loss": -5.592008590698242, "global_step": 26462, "epoch": 630} {"train_loss": -5.376309394836426, "global_step": 26463, "epoch": 630} {"train_loss": -5.312276840209961, "global_step": 26464, "epoch": 630} {"train_loss": -5.4996466636657715, "global_step": 26465, "epoch": 630} {"train_loss": -5.419029235839844, "global_step": 26466, "epoch": 630} {"train_loss": -5.3173675537109375, "global_step": 26467, "epoch": 630} {"train_loss": -5.420030117034912, "global_step": 26468, "epoch": 630} {"train_loss": -5.3517632484436035, "global_step": 26469, "epoch": 630} {"train_loss": -5.396523475646973, "global_step": 26470, "epoch": 630} {"train_loss": -5.3308305740356445, "global_step": 26471, "epoch": 630} {"train_loss": -5.404229164123535, "global_step": 26472, "epoch": 630} {"train_loss": -5.351095676422119, "global_step": 26473, "epoch": 630} {"train_loss": -5.393241882324219, "global_step": 26474, "epoch": 630} {"train_loss": -5.257781028747559, "global_step": 26475, "epoch": 630} {"train_loss": -5.489256381988525, "global_step": 26476, "epoch": 630} {"train_loss": -5.420851230621338, "global_step": 26477, "epoch": 630} {"train_loss": -5.340804100036621, "global_step": 26478, "epoch": 630} {"train_loss": -5.451269149780273, "global_step": 26479, "epoch": 630} {"train_loss": -5.48788595199585, "global_step": 26480, "epoch": 630} {"train_loss": -5.339057922363281, "global_step": 26481, "epoch": 630} {"train_loss": -5.493536472320557, "global_step": 26482, "epoch": 630} {"train_loss": -5.356904983520508, "global_step": 26483, "epoch": 630} {"train_loss": -5.463581085205078, "global_step": 26484, "epoch": 630} {"train_loss": -5.385862350463867, "global_step": 26485, "epoch": 630} {"train_loss": -5.456860065460205, "global_step": 26486, "epoch": 630} {"train_loss": -5.459099769592285, "global_step": 26487, "epoch": 630} {"train_loss": -5.459417819976807, "global_step": 26488, "epoch": 630} {"train_loss": -5.522776126861572, "global_step": 26489, "epoch": 630} {"train_loss": -5.319042205810547, "global_step": 26490, "epoch": 630} {"train_loss": -5.446902275085449, "global_step": 26491, "epoch": 630} {"train_loss": -5.240631103515625, "global_step": 26492, "epoch": 630} {"train_loss": -5.159146308898926, "global_step": 26493, "epoch": 630} {"train_loss": -5.253826141357422, "global_step": 26494, "epoch": 630} {"train_loss": -5.239276885986328, "global_step": 26495, "epoch": 630} {"train_loss": -5.386163711547852, "global_step": 26496, "epoch": 630} {"train_loss": -5.204845428466797, "global_step": 26497, "epoch": 630} {"train_loss": -5.323907375335693, "global_step": 26498, "epoch": 630} {"train_loss": -5.3875555992126465, "global_step": 26499, "epoch": 630} {"train_loss": -5.150179862976074, "global_step": 26500, "epoch": 630} {"train_loss": -5.377194461368379, "global_step": 26501, "epoch": 630, "val_loss": 76264.96875} {"train_loss": -5.294960975646973, "global_step": 26502, "epoch": 631} {"train_loss": -5.373045921325684, "global_step": 26503, "epoch": 631} {"train_loss": -5.332115173339844, "global_step": 26504, "epoch": 631} {"train_loss": -5.370850086212158, "global_step": 26505, "epoch": 631} {"train_loss": -5.218326568603516, "global_step": 26506, "epoch": 631} {"train_loss": -5.4435014724731445, "global_step": 26507, "epoch": 631} {"train_loss": -5.274508476257324, "global_step": 26508, "epoch": 631} {"train_loss": -5.336883544921875, "global_step": 26509, "epoch": 631} {"train_loss": -5.451546669006348, "global_step": 26510, "epoch": 631} {"train_loss": -5.463676929473877, "global_step": 26511, "epoch": 631} {"train_loss": -5.409525394439697, "global_step": 26512, "epoch": 631} {"train_loss": -5.452682971954346, "global_step": 26513, "epoch": 631} {"train_loss": -5.347330570220947, "global_step": 26514, "epoch": 631} {"train_loss": -5.38339900970459, "global_step": 26515, "epoch": 631} {"train_loss": -5.529221057891846, "global_step": 26516, "epoch": 631} {"train_loss": -5.211263656616211, "global_step": 26517, "epoch": 631} {"train_loss": -5.392872333526611, "global_step": 26518, "epoch": 631} {"train_loss": -5.344423770904541, "global_step": 26519, "epoch": 631} {"train_loss": -5.328258514404297, "global_step": 26520, "epoch": 631} {"train_loss": -5.358372211456299, "global_step": 26521, "epoch": 631} {"train_loss": -5.32305383682251, "global_step": 26522, "epoch": 631} {"train_loss": -5.484377861022949, "global_step": 26523, "epoch": 631} {"train_loss": -5.30826473236084, "global_step": 26524, "epoch": 631} {"train_loss": -5.519265651702881, "global_step": 26525, "epoch": 631} {"train_loss": -5.372215747833252, "global_step": 26526, "epoch": 631} {"train_loss": -5.355018615722656, "global_step": 26527, "epoch": 631} {"train_loss": -5.351867198944092, "global_step": 26528, "epoch": 631} {"train_loss": -5.397589683532715, "global_step": 26529, "epoch": 631} {"train_loss": -5.45182466506958, "global_step": 26530, "epoch": 631} {"train_loss": -5.486325263977051, "global_step": 26531, "epoch": 631} {"train_loss": -5.505352973937988, "global_step": 26532, "epoch": 631} {"train_loss": -5.324043273925781, "global_step": 26533, "epoch": 631} {"train_loss": -5.450437545776367, "global_step": 26534, "epoch": 631} {"train_loss": -5.362991809844971, "global_step": 26535, "epoch": 631} {"train_loss": -5.479008674621582, "global_step": 26536, "epoch": 631} {"train_loss": -5.4091010093688965, "global_step": 26537, "epoch": 631} {"train_loss": -5.583557605743408, "global_step": 26538, "epoch": 631} {"train_loss": -5.253350257873535, "global_step": 26539, "epoch": 631} {"train_loss": -5.396777153015137, "global_step": 26540, "epoch": 631} {"train_loss": -5.400524139404297, "global_step": 26541, "epoch": 631} {"train_loss": -5.418992519378662, "global_step": 26542, "epoch": 631} {"train_loss": -5.39000449861799, "global_step": 26543, "epoch": 631, "val_loss": 76483.4609375} {"train_loss": -5.437320232391357, "global_step": 26544, "epoch": 632} {"train_loss": -5.274115562438965, "global_step": 26545, "epoch": 632} {"train_loss": -5.385693073272705, "global_step": 26546, "epoch": 632} {"train_loss": -5.504944801330566, "global_step": 26547, "epoch": 632} {"train_loss": -5.330038070678711, "global_step": 26548, "epoch": 632} {"train_loss": -5.353146076202393, "global_step": 26549, "epoch": 632} {"train_loss": -5.4202799797058105, "global_step": 26550, "epoch": 632} {"train_loss": -5.3958740234375, "global_step": 26551, "epoch": 632} {"train_loss": -5.385430335998535, "global_step": 26552, "epoch": 632} {"train_loss": -5.574634552001953, "global_step": 26553, "epoch": 632} {"train_loss": -5.414787292480469, "global_step": 26554, "epoch": 632} {"train_loss": -5.425173759460449, "global_step": 26555, "epoch": 632} {"train_loss": -5.425604343414307, "global_step": 26556, "epoch": 632} {"train_loss": -5.285182952880859, "global_step": 26557, "epoch": 632} {"train_loss": -5.379192352294922, "global_step": 26558, "epoch": 632} {"train_loss": -5.427591323852539, "global_step": 26559, "epoch": 632} {"train_loss": -5.322539329528809, "global_step": 26560, "epoch": 632} {"train_loss": -5.296776294708252, "global_step": 26561, "epoch": 632} {"train_loss": -5.4173994064331055, "global_step": 26562, "epoch": 632} {"train_loss": -5.289457321166992, "global_step": 26563, "epoch": 632} {"train_loss": -5.470605850219727, "global_step": 26564, "epoch": 632} {"train_loss": -5.3966779708862305, "global_step": 26565, "epoch": 632} {"train_loss": -5.287693023681641, "global_step": 26566, "epoch": 632} {"train_loss": -5.439069747924805, "global_step": 26567, "epoch": 632} {"train_loss": -5.476911544799805, "global_step": 26568, "epoch": 632} {"train_loss": -5.437751770019531, "global_step": 26569, "epoch": 632} {"train_loss": -5.415134429931641, "global_step": 26570, "epoch": 632} {"train_loss": -5.373058795928955, "global_step": 26571, "epoch": 632} {"train_loss": -5.469541549682617, "global_step": 26572, "epoch": 632} {"train_loss": -5.271594047546387, "global_step": 26573, "epoch": 632} {"train_loss": -5.409646034240723, "global_step": 26574, "epoch": 632} {"train_loss": -5.469245910644531, "global_step": 26575, "epoch": 632} {"train_loss": -5.344551086425781, "global_step": 26576, "epoch": 632} {"train_loss": -5.543302059173584, "global_step": 26577, "epoch": 632} {"train_loss": -5.438613414764404, "global_step": 26578, "epoch": 632} {"train_loss": -5.445335865020752, "global_step": 26579, "epoch": 632} {"train_loss": -5.365231990814209, "global_step": 26580, "epoch": 632} {"train_loss": -5.336894989013672, "global_step": 26581, "epoch": 632} {"train_loss": -5.428792476654053, "global_step": 26582, "epoch": 632} {"train_loss": -5.308284759521484, "global_step": 26583, "epoch": 632} {"train_loss": -5.4464945793151855, "global_step": 26584, "epoch": 632} {"train_loss": -5.400886456171672, "global_step": 26585, "epoch": 632, "val_loss": 76228.796875} {"train_loss": -5.563336372375488, "global_step": 26586, "epoch": 633} {"train_loss": -5.410341262817383, "global_step": 26587, "epoch": 633} {"train_loss": -5.501643657684326, "global_step": 26588, "epoch": 633} {"train_loss": -5.506950378417969, "global_step": 26589, "epoch": 633} {"train_loss": -5.369433403015137, "global_step": 26590, "epoch": 633} {"train_loss": -5.378272533416748, "global_step": 26591, "epoch": 633} {"train_loss": -5.453630447387695, "global_step": 26592, "epoch": 633} {"train_loss": -5.492551326751709, "global_step": 26593, "epoch": 633} {"train_loss": -5.397049903869629, "global_step": 26594, "epoch": 633} {"train_loss": -5.380058288574219, "global_step": 26595, "epoch": 633} {"train_loss": -5.51290225982666, "global_step": 26596, "epoch": 633} {"train_loss": -5.487804412841797, "global_step": 26597, "epoch": 633} {"train_loss": -5.402428150177002, "global_step": 26598, "epoch": 633} {"train_loss": -5.416945457458496, "global_step": 26599, "epoch": 633} {"train_loss": -5.545068264007568, "global_step": 26600, "epoch": 633} {"train_loss": -5.433723449707031, "global_step": 26601, "epoch": 633} {"train_loss": -5.355093002319336, "global_step": 26602, "epoch": 633} {"train_loss": -5.298442363739014, "global_step": 26603, "epoch": 633} {"train_loss": -5.415128707885742, "global_step": 26604, "epoch": 633} {"train_loss": -5.487876892089844, "global_step": 26605, "epoch": 633} {"train_loss": -5.402705192565918, "global_step": 26606, "epoch": 633} {"train_loss": -5.301455497741699, "global_step": 26607, "epoch": 633} {"train_loss": -5.464386463165283, "global_step": 26608, "epoch": 633} {"train_loss": -5.32242488861084, "global_step": 26609, "epoch": 633} {"train_loss": -5.372479438781738, "global_step": 26610, "epoch": 633} {"train_loss": -5.391945838928223, "global_step": 26611, "epoch": 633} {"train_loss": -5.356757164001465, "global_step": 26612, "epoch": 633} {"train_loss": -5.380209922790527, "global_step": 26613, "epoch": 633} {"train_loss": -5.478326797485352, "global_step": 26614, "epoch": 633} {"train_loss": -5.309934616088867, "global_step": 26615, "epoch": 633} {"train_loss": -5.378870487213135, "global_step": 26616, "epoch": 633} {"train_loss": -5.430314540863037, "global_step": 26617, "epoch": 633} {"train_loss": -5.3957319259643555, "global_step": 26618, "epoch": 633} {"train_loss": -5.260922431945801, "global_step": 26619, "epoch": 633} {"train_loss": -5.42143440246582, "global_step": 26620, "epoch": 633} {"train_loss": -5.318270683288574, "global_step": 26621, "epoch": 633} {"train_loss": -5.184223651885986, "global_step": 26622, "epoch": 633} {"train_loss": -5.4157633781433105, "global_step": 26623, "epoch": 633} {"train_loss": -5.4508819580078125, "global_step": 26624, "epoch": 633} {"train_loss": -5.4830098152160645, "global_step": 26625, "epoch": 633} {"train_loss": -5.376460075378418, "global_step": 26626, "epoch": 633} {"train_loss": -5.404082650230045, "global_step": 26627, "epoch": 633, "val_loss": 76511.890625} {"train_loss": -5.452627182006836, "global_step": 26628, "epoch": 634} {"train_loss": -5.454427719116211, "global_step": 26629, "epoch": 634} {"train_loss": -5.419618606567383, "global_step": 26630, "epoch": 634} {"train_loss": -5.326422691345215, "global_step": 26631, "epoch": 634} {"train_loss": -5.364438533782959, "global_step": 26632, "epoch": 634} {"train_loss": -5.43747615814209, "global_step": 26633, "epoch": 634} {"train_loss": -5.558163166046143, "global_step": 26634, "epoch": 634} {"train_loss": -5.413870811462402, "global_step": 26635, "epoch": 634} {"train_loss": -5.499353408813477, "global_step": 26636, "epoch": 634} {"train_loss": -5.39223575592041, "global_step": 26637, "epoch": 634} {"train_loss": -5.415409564971924, "global_step": 26638, "epoch": 634} {"train_loss": -5.3962812423706055, "global_step": 26639, "epoch": 634} {"train_loss": -5.489519119262695, "global_step": 26640, "epoch": 634} {"train_loss": -5.440898418426514, "global_step": 26641, "epoch": 634} {"train_loss": -5.456273078918457, "global_step": 26642, "epoch": 634} {"train_loss": -5.40371036529541, "global_step": 26643, "epoch": 634} {"train_loss": -5.401398658752441, "global_step": 26644, "epoch": 634} {"train_loss": -5.4844512939453125, "global_step": 26645, "epoch": 634} {"train_loss": -5.403728485107422, "global_step": 26646, "epoch": 634} {"train_loss": -5.363368511199951, "global_step": 26647, "epoch": 634} {"train_loss": -5.443739891052246, "global_step": 26648, "epoch": 634} {"train_loss": -5.259710311889648, "global_step": 26649, "epoch": 634} {"train_loss": -5.302480697631836, "global_step": 26650, "epoch": 634} {"train_loss": -5.462062835693359, "global_step": 26651, "epoch": 634} {"train_loss": -5.24147891998291, "global_step": 26652, "epoch": 634} {"train_loss": -5.481507301330566, "global_step": 26653, "epoch": 634} {"train_loss": -5.322409629821777, "global_step": 26654, "epoch": 634} {"train_loss": -5.3133134841918945, "global_step": 26655, "epoch": 634} {"train_loss": -5.4016008377075195, "global_step": 26656, "epoch": 634} {"train_loss": -5.370905876159668, "global_step": 26657, "epoch": 634} {"train_loss": -5.2754669189453125, "global_step": 26658, "epoch": 634} {"train_loss": -5.431778907775879, "global_step": 26659, "epoch": 634} {"train_loss": -5.401410102844238, "global_step": 26660, "epoch": 634} {"train_loss": -5.4503374099731445, "global_step": 26661, "epoch": 634} {"train_loss": -5.450691223144531, "global_step": 26662, "epoch": 634} {"train_loss": -5.369655132293701, "global_step": 26663, "epoch": 634} {"train_loss": -5.519781112670898, "global_step": 26664, "epoch": 634} {"train_loss": -5.533601760864258, "global_step": 26665, "epoch": 634} {"train_loss": -5.359895706176758, "global_step": 26666, "epoch": 634} {"train_loss": -5.354424953460693, "global_step": 26667, "epoch": 634} {"train_loss": -5.472713947296143, "global_step": 26668, "epoch": 634} {"train_loss": -5.409387758799961, "global_step": 26669, "epoch": 634, "val_loss": 76207.828125} {"train_loss": -5.408953666687012, "global_step": 26670, "epoch": 635} {"train_loss": -5.512641429901123, "global_step": 26671, "epoch": 635} {"train_loss": -5.481122016906738, "global_step": 26672, "epoch": 635} {"train_loss": -5.283515453338623, "global_step": 26673, "epoch": 635} {"train_loss": -5.419119358062744, "global_step": 26674, "epoch": 635} {"train_loss": -5.37071418762207, "global_step": 26675, "epoch": 635} {"train_loss": -5.400843620300293, "global_step": 26676, "epoch": 635} {"train_loss": -5.4069976806640625, "global_step": 26677, "epoch": 635} {"train_loss": -5.4452805519104, "global_step": 26678, "epoch": 635} {"train_loss": -5.403654098510742, "global_step": 26679, "epoch": 635} {"train_loss": -5.344743728637695, "global_step": 26680, "epoch": 635} {"train_loss": -5.55165433883667, "global_step": 26681, "epoch": 635} {"train_loss": -5.402346611022949, "global_step": 26682, "epoch": 635} {"train_loss": -5.413336753845215, "global_step": 26683, "epoch": 635} {"train_loss": -5.396621227264404, "global_step": 26684, "epoch": 635} {"train_loss": -5.442815780639648, "global_step": 26685, "epoch": 635} {"train_loss": -5.460732460021973, "global_step": 26686, "epoch": 635} {"train_loss": -5.468466758728027, "global_step": 26687, "epoch": 635} {"train_loss": -5.42755126953125, "global_step": 26688, "epoch": 635} {"train_loss": -5.467090129852295, "global_step": 26689, "epoch": 635} {"train_loss": -5.460629463195801, "global_step": 26690, "epoch": 635} {"train_loss": -5.455574989318848, "global_step": 26691, "epoch": 635} {"train_loss": -5.358821868896484, "global_step": 26692, "epoch": 635} {"train_loss": -5.3332695960998535, "global_step": 26693, "epoch": 635} {"train_loss": -5.528956413269043, "global_step": 26694, "epoch": 635} {"train_loss": -5.382215976715088, "global_step": 26695, "epoch": 635} {"train_loss": -5.340289115905762, "global_step": 26696, "epoch": 635} {"train_loss": -5.348240852355957, "global_step": 26697, "epoch": 635} {"train_loss": -5.446463108062744, "global_step": 26698, "epoch": 635} {"train_loss": -5.421627998352051, "global_step": 26699, "epoch": 635} {"train_loss": -5.422039985656738, "global_step": 26700, "epoch": 635} {"train_loss": -5.387149810791016, "global_step": 26701, "epoch": 635} {"train_loss": -5.414783477783203, "global_step": 26702, "epoch": 635} {"train_loss": -5.455660343170166, "global_step": 26703, "epoch": 635} {"train_loss": -5.306641578674316, "global_step": 26704, "epoch": 635} {"train_loss": -5.505340099334717, "global_step": 26705, "epoch": 635} {"train_loss": -5.302948474884033, "global_step": 26706, "epoch": 635} {"train_loss": -5.538041591644287, "global_step": 26707, "epoch": 635} {"train_loss": -5.490667819976807, "global_step": 26708, "epoch": 635} {"train_loss": -5.185805797576904, "global_step": 26709, "epoch": 635} {"train_loss": -5.3209228515625, "global_step": 26710, "epoch": 635} {"train_loss": -5.410445860454014, "global_step": 26711, "epoch": 635, "val_loss": 76228.9140625} {"train_loss": -5.287990093231201, "global_step": 26712, "epoch": 636} {"train_loss": -5.310342788696289, "global_step": 26713, "epoch": 636} {"train_loss": -5.3908796310424805, "global_step": 26714, "epoch": 636} {"train_loss": -5.363101959228516, "global_step": 26715, "epoch": 636} {"train_loss": -5.497398853302002, "global_step": 26716, "epoch": 636} {"train_loss": -5.453686237335205, "global_step": 26717, "epoch": 636} {"train_loss": -5.405040740966797, "global_step": 26718, "epoch": 636} {"train_loss": -5.407926559448242, "global_step": 26719, "epoch": 636} {"train_loss": -5.397228240966797, "global_step": 26720, "epoch": 636} {"train_loss": -5.384064674377441, "global_step": 26721, "epoch": 636} {"train_loss": -5.315701484680176, "global_step": 26722, "epoch": 636} {"train_loss": -5.385544776916504, "global_step": 26723, "epoch": 636} {"train_loss": -5.341965675354004, "global_step": 26724, "epoch": 636} {"train_loss": -5.286365985870361, "global_step": 26725, "epoch": 636} {"train_loss": -5.400415420532227, "global_step": 26726, "epoch": 636} {"train_loss": -5.41120719909668, "global_step": 26727, "epoch": 636} {"train_loss": -5.327917098999023, "global_step": 26728, "epoch": 636} {"train_loss": -5.324560165405273, "global_step": 26729, "epoch": 636} {"train_loss": -5.381879806518555, "global_step": 26730, "epoch": 636} {"train_loss": -5.499107360839844, "global_step": 26731, "epoch": 636} {"train_loss": -5.460843086242676, "global_step": 26732, "epoch": 636} {"train_loss": -5.294376850128174, "global_step": 26733, "epoch": 636} {"train_loss": -5.395583629608154, "global_step": 26734, "epoch": 636} {"train_loss": -5.449723243713379, "global_step": 26735, "epoch": 636} {"train_loss": -5.323098659515381, "global_step": 26736, "epoch": 636} {"train_loss": -5.536202430725098, "global_step": 26737, "epoch": 636} {"train_loss": -5.241620063781738, "global_step": 26738, "epoch": 636} {"train_loss": -5.483177185058594, "global_step": 26739, "epoch": 636} {"train_loss": -5.548497200012207, "global_step": 26740, "epoch": 636} {"train_loss": -5.466180801391602, "global_step": 26741, "epoch": 636} {"train_loss": -5.455850601196289, "global_step": 26742, "epoch": 636} {"train_loss": -5.373321533203125, "global_step": 26743, "epoch": 636} {"train_loss": -5.419397354125977, "global_step": 26744, "epoch": 636} {"train_loss": -5.3510541915893555, "global_step": 26745, "epoch": 636} {"train_loss": -5.483381271362305, "global_step": 26746, "epoch": 636} {"train_loss": -5.189562797546387, "global_step": 26747, "epoch": 636} {"train_loss": -5.415449142456055, "global_step": 26748, "epoch": 636} {"train_loss": -5.473349571228027, "global_step": 26749, "epoch": 636} {"train_loss": -5.470595359802246, "global_step": 26750, "epoch": 636} {"train_loss": -5.331500053405762, "global_step": 26751, "epoch": 636} {"train_loss": -5.373623847961426, "global_step": 26752, "epoch": 636} {"train_loss": -5.395690895262218, "global_step": 26753, "epoch": 636, "val_loss": 76268.8046875} {"train_loss": -5.317694664001465, "global_step": 26754, "epoch": 637} {"train_loss": -5.389376640319824, "global_step": 26755, "epoch": 637} {"train_loss": -5.407451629638672, "global_step": 26756, "epoch": 637} {"train_loss": -5.334494113922119, "global_step": 26757, "epoch": 637} {"train_loss": -5.420224189758301, "global_step": 26758, "epoch": 637} {"train_loss": -5.481467247009277, "global_step": 26759, "epoch": 637} {"train_loss": -5.542383670806885, "global_step": 26760, "epoch": 637} {"train_loss": -5.422723293304443, "global_step": 26761, "epoch": 637} {"train_loss": -5.267187595367432, "global_step": 26762, "epoch": 637} {"train_loss": -5.462603569030762, "global_step": 26763, "epoch": 637} {"train_loss": -5.391870498657227, "global_step": 26764, "epoch": 637} {"train_loss": -5.3930158615112305, "global_step": 26765, "epoch": 637} {"train_loss": -5.4800896644592285, "global_step": 26766, "epoch": 637} {"train_loss": -5.346814155578613, "global_step": 26767, "epoch": 637} {"train_loss": -5.564785957336426, "global_step": 26768, "epoch": 637} {"train_loss": -5.479636192321777, "global_step": 26769, "epoch": 637} {"train_loss": -5.272794723510742, "global_step": 26770, "epoch": 637} {"train_loss": -5.471193313598633, "global_step": 26771, "epoch": 637} {"train_loss": -5.437922477722168, "global_step": 26772, "epoch": 637} {"train_loss": -5.470551490783691, "global_step": 26773, "epoch": 637} {"train_loss": -5.472039222717285, "global_step": 26774, "epoch": 637} {"train_loss": -5.60312032699585, "global_step": 26775, "epoch": 637} {"train_loss": -5.51611328125, "global_step": 26776, "epoch": 637} {"train_loss": -5.527399063110352, "global_step": 26777, "epoch": 637} {"train_loss": -5.483590126037598, "global_step": 26778, "epoch": 637} {"train_loss": -5.48541784286499, "global_step": 26779, "epoch": 637} {"train_loss": -5.542316436767578, "global_step": 26780, "epoch": 637} {"train_loss": -5.392987251281738, "global_step": 26781, "epoch": 637} {"train_loss": -5.46388053894043, "global_step": 26782, "epoch": 637} {"train_loss": -5.398491859436035, "global_step": 26783, "epoch": 637} {"train_loss": -5.631828308105469, "global_step": 26784, "epoch": 637} {"train_loss": -5.561853408813477, "global_step": 26785, "epoch": 637} {"train_loss": -5.473395824432373, "global_step": 26786, "epoch": 637} {"train_loss": -5.440375804901123, "global_step": 26787, "epoch": 637} {"train_loss": -5.434830665588379, "global_step": 26788, "epoch": 637} {"train_loss": -5.2988996505737305, "global_step": 26789, "epoch": 637} {"train_loss": -5.405018329620361, "global_step": 26790, "epoch": 637} {"train_loss": -5.39141845703125, "global_step": 26791, "epoch": 637} {"train_loss": -5.388491630554199, "global_step": 26792, "epoch": 637} {"train_loss": -5.307159423828125, "global_step": 26793, "epoch": 637} {"train_loss": -5.4281463623046875, "global_step": 26794, "epoch": 637} {"train_loss": -5.434187866392589, "global_step": 26795, "epoch": 637, "val_loss": 75849.8984375} {"train_loss": -5.529970169067383, "global_step": 26796, "epoch": 638} {"train_loss": -5.4732346534729, "global_step": 26797, "epoch": 638} {"train_loss": -5.363259792327881, "global_step": 26798, "epoch": 638} {"train_loss": -5.569459915161133, "global_step": 26799, "epoch": 638} {"train_loss": -5.37530517578125, "global_step": 26800, "epoch": 638} {"train_loss": -5.51241397857666, "global_step": 26801, "epoch": 638} {"train_loss": -5.417086124420166, "global_step": 26802, "epoch": 638} {"train_loss": -5.606234550476074, "global_step": 26803, "epoch": 638} {"train_loss": -5.583298683166504, "global_step": 26804, "epoch": 638} {"train_loss": -5.396120071411133, "global_step": 26805, "epoch": 638} {"train_loss": -5.402127265930176, "global_step": 26806, "epoch": 638} {"train_loss": -5.508705139160156, "global_step": 26807, "epoch": 638} {"train_loss": -5.451230525970459, "global_step": 26808, "epoch": 638} {"train_loss": -5.449010848999023, "global_step": 26809, "epoch": 638} {"train_loss": -5.391529083251953, "global_step": 26810, "epoch": 638} {"train_loss": -5.413120269775391, "global_step": 26811, "epoch": 638} {"train_loss": -5.462735652923584, "global_step": 26812, "epoch": 638} {"train_loss": -5.3778181076049805, "global_step": 26813, "epoch": 638} {"train_loss": -5.387469291687012, "global_step": 26814, "epoch": 638} {"train_loss": -5.378227233886719, "global_step": 26815, "epoch": 638} {"train_loss": -5.357520580291748, "global_step": 26816, "epoch": 638} {"train_loss": -5.424424171447754, "global_step": 26817, "epoch": 638} {"train_loss": -5.445677757263184, "global_step": 26818, "epoch": 638} {"train_loss": -5.244800090789795, "global_step": 26819, "epoch": 638} {"train_loss": -5.343152046203613, "global_step": 26820, "epoch": 638} {"train_loss": -5.310937881469727, "global_step": 26821, "epoch": 638} {"train_loss": -5.539882659912109, "global_step": 26822, "epoch": 638} {"train_loss": -5.429611682891846, "global_step": 26823, "epoch": 638} {"train_loss": -5.567628383636475, "global_step": 26824, "epoch": 638} {"train_loss": -5.367955207824707, "global_step": 26825, "epoch": 638} {"train_loss": -5.476035118103027, "global_step": 26826, "epoch": 638} {"train_loss": -5.439424514770508, "global_step": 26827, "epoch": 638} {"train_loss": -5.303683757781982, "global_step": 26828, "epoch": 638} {"train_loss": -5.271902084350586, "global_step": 26829, "epoch": 638} {"train_loss": -5.414780616760254, "global_step": 26830, "epoch": 638} {"train_loss": -5.380313396453857, "global_step": 26831, "epoch": 638} {"train_loss": -5.464748382568359, "global_step": 26832, "epoch": 638} {"train_loss": -5.322912693023682, "global_step": 26833, "epoch": 638} {"train_loss": -5.275493621826172, "global_step": 26834, "epoch": 638} {"train_loss": -5.3677873611450195, "global_step": 26835, "epoch": 638} {"train_loss": -5.359431743621826, "global_step": 26836, "epoch": 638} {"train_loss": -5.4185604481470016, "global_step": 26837, "epoch": 638, "val_loss": 75907.6640625} {"train_loss": -5.224183082580566, "global_step": 26838, "epoch": 639} {"train_loss": -5.536907196044922, "global_step": 26839, "epoch": 639} {"train_loss": -5.340825080871582, "global_step": 26840, "epoch": 639} {"train_loss": -5.401466369628906, "global_step": 26841, "epoch": 639} {"train_loss": -5.372503757476807, "global_step": 26842, "epoch": 639} {"train_loss": -5.333810806274414, "global_step": 26843, "epoch": 639} {"train_loss": -5.519044399261475, "global_step": 26844, "epoch": 639} {"train_loss": -5.383275508880615, "global_step": 26845, "epoch": 639} {"train_loss": -5.478341102600098, "global_step": 26846, "epoch": 639} {"train_loss": -5.487826347351074, "global_step": 26847, "epoch": 639} {"train_loss": -5.388919830322266, "global_step": 26848, "epoch": 639} {"train_loss": -5.494656562805176, "global_step": 26849, "epoch": 639} {"train_loss": -5.403439044952393, "global_step": 26850, "epoch": 639} {"train_loss": -5.421901702880859, "global_step": 26851, "epoch": 639} {"train_loss": -5.401137828826904, "global_step": 26852, "epoch": 639} {"train_loss": -5.259921550750732, "global_step": 26853, "epoch": 639} {"train_loss": -5.444068431854248, "global_step": 26854, "epoch": 639} {"train_loss": -5.343491077423096, "global_step": 26855, "epoch": 639} {"train_loss": -5.312203884124756, "global_step": 26856, "epoch": 639} {"train_loss": -5.366205215454102, "global_step": 26857, "epoch": 639} {"train_loss": -5.304407596588135, "global_step": 26858, "epoch": 639} {"train_loss": -5.480863571166992, "global_step": 26859, "epoch": 639} {"train_loss": -5.320716857910156, "global_step": 26860, "epoch": 639} {"train_loss": -5.332131862640381, "global_step": 26861, "epoch": 639} {"train_loss": -5.391222953796387, "global_step": 26862, "epoch": 639} {"train_loss": -5.317099571228027, "global_step": 26863, "epoch": 639} {"train_loss": -5.378818988800049, "global_step": 26864, "epoch": 639} {"train_loss": -5.4162397384643555, "global_step": 26865, "epoch": 639} {"train_loss": -5.3318986892700195, "global_step": 26866, "epoch": 639} {"train_loss": -5.250678062438965, "global_step": 26867, "epoch": 639} {"train_loss": -5.436022758483887, "global_step": 26868, "epoch": 639} {"train_loss": -5.406105995178223, "global_step": 26869, "epoch": 639} {"train_loss": -5.373597145080566, "global_step": 26870, "epoch": 639} {"train_loss": -5.507558822631836, "global_step": 26871, "epoch": 639} {"train_loss": -5.44645881652832, "global_step": 26872, "epoch": 639} {"train_loss": -5.3551740646362305, "global_step": 26873, "epoch": 639} {"train_loss": -5.435787200927734, "global_step": 26874, "epoch": 639} {"train_loss": -5.430852890014648, "global_step": 26875, "epoch": 639} {"train_loss": -5.255982398986816, "global_step": 26876, "epoch": 639} {"train_loss": -5.36231803894043, "global_step": 26877, "epoch": 639} {"train_loss": -5.414364814758301, "global_step": 26878, "epoch": 639} {"train_loss": -5.387216545286632, "global_step": 26879, "epoch": 639, "val_loss": 75473.75} {"train_loss": -5.590083122253418, "global_step": 26880, "epoch": 640} {"train_loss": -5.420742988586426, "global_step": 26881, "epoch": 640} {"train_loss": -5.431899070739746, "global_step": 26882, "epoch": 640} {"train_loss": -5.415156841278076, "global_step": 26883, "epoch": 640} {"train_loss": -5.447277069091797, "global_step": 26884, "epoch": 640} {"train_loss": -5.27435302734375, "global_step": 26885, "epoch": 640} {"train_loss": -5.420013427734375, "global_step": 26886, "epoch": 640} {"train_loss": -5.4861860275268555, "global_step": 26887, "epoch": 640} {"train_loss": -5.534913539886475, "global_step": 26888, "epoch": 640} {"train_loss": -5.423311233520508, "global_step": 26889, "epoch": 640} {"train_loss": -5.344489574432373, "global_step": 26890, "epoch": 640} {"train_loss": -5.541030406951904, "global_step": 26891, "epoch": 640} {"train_loss": -5.419562816619873, "global_step": 26892, "epoch": 640} {"train_loss": -5.477071762084961, "global_step": 26893, "epoch": 640} {"train_loss": -5.462215423583984, "global_step": 26894, "epoch": 640} {"train_loss": -5.4027557373046875, "global_step": 26895, "epoch": 640} {"train_loss": -5.374600887298584, "global_step": 26896, "epoch": 640} {"train_loss": -5.487757682800293, "global_step": 26897, "epoch": 640} {"train_loss": -5.385556697845459, "global_step": 26898, "epoch": 640} {"train_loss": -5.408790111541748, "global_step": 26899, "epoch": 640} {"train_loss": -5.423469066619873, "global_step": 26900, "epoch": 640} {"train_loss": -5.427457809448242, "global_step": 26901, "epoch": 640} {"train_loss": -5.324771404266357, "global_step": 26902, "epoch": 640} {"train_loss": -5.431598663330078, "global_step": 26903, "epoch": 640} {"train_loss": -5.317591667175293, "global_step": 26904, "epoch": 640} {"train_loss": -5.285838603973389, "global_step": 26905, "epoch": 640} {"train_loss": -5.4998369216918945, "global_step": 26906, "epoch": 640} {"train_loss": -5.347321510314941, "global_step": 26907, "epoch": 640} {"train_loss": -5.189260482788086, "global_step": 26908, "epoch": 640} {"train_loss": -5.393664360046387, "global_step": 26909, "epoch": 640} {"train_loss": -5.26755952835083, "global_step": 26910, "epoch": 640} {"train_loss": -5.312522888183594, "global_step": 26911, "epoch": 640} {"train_loss": -5.257142066955566, "global_step": 26912, "epoch": 640} {"train_loss": -5.13499641418457, "global_step": 26913, "epoch": 640} {"train_loss": -5.245025634765625, "global_step": 26914, "epoch": 640} {"train_loss": -5.412076950073242, "global_step": 26915, "epoch": 640} {"train_loss": -5.364301681518555, "global_step": 26916, "epoch": 640} {"train_loss": -5.328550815582275, "global_step": 26917, "epoch": 640} {"train_loss": -5.465324401855469, "global_step": 26918, "epoch": 640} {"train_loss": -5.28115701675415, "global_step": 26919, "epoch": 640} {"train_loss": -5.396185874938965, "global_step": 26920, "epoch": 640} {"train_loss": -5.389676025935581, "global_step": 26921, "epoch": 640, "val_loss": 76212.890625} {"train_loss": -5.250935077667236, "global_step": 26922, "epoch": 641} {"train_loss": -5.525126934051514, "global_step": 26923, "epoch": 641} {"train_loss": -5.390522003173828, "global_step": 26924, "epoch": 641} {"train_loss": -5.265922546386719, "global_step": 26925, "epoch": 641} {"train_loss": -5.382713794708252, "global_step": 26926, "epoch": 641} {"train_loss": -5.383421897888184, "global_step": 26927, "epoch": 641} {"train_loss": -5.342538833618164, "global_step": 26928, "epoch": 641} {"train_loss": -5.41110897064209, "global_step": 26929, "epoch": 641} {"train_loss": -5.479348659515381, "global_step": 26930, "epoch": 641} {"train_loss": -5.392067909240723, "global_step": 26931, "epoch": 641} {"train_loss": -5.4486541748046875, "global_step": 26932, "epoch": 641} {"train_loss": -5.2474212646484375, "global_step": 26933, "epoch": 641} {"train_loss": -5.358213424682617, "global_step": 26934, "epoch": 641} {"train_loss": -5.432806968688965, "global_step": 26935, "epoch": 641} {"train_loss": -5.4452409744262695, "global_step": 26936, "epoch": 641} {"train_loss": -5.528079509735107, "global_step": 26937, "epoch": 641} {"train_loss": -5.505104064941406, "global_step": 26938, "epoch": 641} {"train_loss": -5.434229850769043, "global_step": 26939, "epoch": 641} {"train_loss": -5.391959190368652, "global_step": 26940, "epoch": 641} {"train_loss": -5.466538429260254, "global_step": 26941, "epoch": 641} {"train_loss": -5.457520008087158, "global_step": 26942, "epoch": 641} {"train_loss": -5.434558868408203, "global_step": 26943, "epoch": 641} {"train_loss": -5.467872142791748, "global_step": 26944, "epoch": 641} {"train_loss": -5.4678826332092285, "global_step": 26945, "epoch": 641} {"train_loss": -5.5143046379089355, "global_step": 26946, "epoch": 641} {"train_loss": -5.4717302322387695, "global_step": 26947, "epoch": 641} {"train_loss": -5.3386735916137695, "global_step": 26948, "epoch": 641} {"train_loss": -5.473491668701172, "global_step": 26949, "epoch": 641} {"train_loss": -5.413041591644287, "global_step": 26950, "epoch": 641} {"train_loss": -5.376258850097656, "global_step": 26951, "epoch": 641} {"train_loss": -5.2571024894714355, "global_step": 26952, "epoch": 641} {"train_loss": -5.4653778076171875, "global_step": 26953, "epoch": 641} {"train_loss": -5.458273887634277, "global_step": 26954, "epoch": 641} {"train_loss": -5.4873857498168945, "global_step": 26955, "epoch": 641} {"train_loss": -5.347667694091797, "global_step": 26956, "epoch": 641} {"train_loss": -5.425440788269043, "global_step": 26957, "epoch": 641} {"train_loss": -5.438425540924072, "global_step": 26958, "epoch": 641} {"train_loss": -5.390532970428467, "global_step": 26959, "epoch": 641} {"train_loss": -5.478342056274414, "global_step": 26960, "epoch": 641} {"train_loss": -5.187643051147461, "global_step": 26961, "epoch": 641} {"train_loss": -5.261265277862549, "global_step": 26962, "epoch": 641} {"train_loss": -5.4071501436687655, "global_step": 26963, "epoch": 641, "val_loss": 75801.21875} {"train_loss": -5.317721366882324, "global_step": 26964, "epoch": 642} {"train_loss": -5.233611106872559, "global_step": 26965, "epoch": 642} {"train_loss": -5.359787940979004, "global_step": 26966, "epoch": 642} {"train_loss": -5.4118804931640625, "global_step": 26967, "epoch": 642} {"train_loss": -5.308905601501465, "global_step": 26968, "epoch": 642} {"train_loss": -5.4351115226745605, "global_step": 26969, "epoch": 642} {"train_loss": -5.354576110839844, "global_step": 26970, "epoch": 642} {"train_loss": -5.408570289611816, "global_step": 26971, "epoch": 642} {"train_loss": -5.490784645080566, "global_step": 26972, "epoch": 642} {"train_loss": -5.3544206619262695, "global_step": 26973, "epoch": 642} {"train_loss": -5.470136642456055, "global_step": 26974, "epoch": 642} {"train_loss": -5.312237739562988, "global_step": 26975, "epoch": 642} {"train_loss": -5.413978099822998, "global_step": 26976, "epoch": 642} {"train_loss": -5.549945831298828, "global_step": 26977, "epoch": 642} {"train_loss": -5.363659858703613, "global_step": 26978, "epoch": 642} {"train_loss": -5.445620536804199, "global_step": 26979, "epoch": 642} {"train_loss": -5.411139488220215, "global_step": 26980, "epoch": 642} {"train_loss": -5.41307258605957, "global_step": 26981, "epoch": 642} {"train_loss": -5.397529602050781, "global_step": 26982, "epoch": 642} {"train_loss": -5.53718376159668, "global_step": 26983, "epoch": 642} {"train_loss": -5.409458160400391, "global_step": 26984, "epoch": 642} {"train_loss": -5.367974281311035, "global_step": 26985, "epoch": 642} {"train_loss": -5.5781168937683105, "global_step": 26986, "epoch": 642} {"train_loss": -5.443847179412842, "global_step": 26987, "epoch": 642} {"train_loss": -5.495069980621338, "global_step": 26988, "epoch": 642} {"train_loss": -5.434704780578613, "global_step": 26989, "epoch": 642} {"train_loss": -5.369100570678711, "global_step": 26990, "epoch": 642} {"train_loss": -5.3886542320251465, "global_step": 26991, "epoch": 642} {"train_loss": -5.425926208496094, "global_step": 26992, "epoch": 642} {"train_loss": -5.307387351989746, "global_step": 26993, "epoch": 642} {"train_loss": -5.400938034057617, "global_step": 26994, "epoch": 642} {"train_loss": -5.400575637817383, "global_step": 26995, "epoch": 642} {"train_loss": -5.3929548263549805, "global_step": 26996, "epoch": 642} {"train_loss": -5.5322980880737305, "global_step": 26997, "epoch": 642} {"train_loss": -5.444198131561279, "global_step": 26998, "epoch": 642} {"train_loss": -5.434873580932617, "global_step": 26999, "epoch": 642} {"train_loss": -5.370794296264648, "global_step": 27000, "epoch": 642} {"train_loss": -5.422362327575684, "global_step": 27001, "epoch": 642} {"train_loss": -5.332436561584473, "global_step": 27002, "epoch": 642} {"train_loss": -5.48973274230957, "global_step": 27003, "epoch": 642} {"train_loss": -5.511059761047363, "global_step": 27004, "epoch": 642} {"train_loss": -5.413121427808489, "global_step": 27005, "epoch": 642, "val_loss": 75701.0859375} {"train_loss": -5.4934563636779785, "global_step": 27006, "epoch": 643} {"train_loss": -5.391670227050781, "global_step": 27007, "epoch": 643} {"train_loss": -5.457552433013916, "global_step": 27008, "epoch": 643} {"train_loss": -5.5069146156311035, "global_step": 27009, "epoch": 643} {"train_loss": -5.3347063064575195, "global_step": 27010, "epoch": 643} {"train_loss": -5.447179794311523, "global_step": 27011, "epoch": 643} {"train_loss": -5.434728622436523, "global_step": 27012, "epoch": 643} {"train_loss": -5.3775129318237305, "global_step": 27013, "epoch": 643} {"train_loss": -5.514761447906494, "global_step": 27014, "epoch": 643} {"train_loss": -5.355332374572754, "global_step": 27015, "epoch": 643} {"train_loss": -5.474381923675537, "global_step": 27016, "epoch": 643} {"train_loss": -5.343899250030518, "global_step": 27017, "epoch": 643} {"train_loss": -5.447900772094727, "global_step": 27018, "epoch": 643} {"train_loss": -5.442721366882324, "global_step": 27019, "epoch": 643} {"train_loss": -5.26791524887085, "global_step": 27020, "epoch": 643} {"train_loss": -5.42204475402832, "global_step": 27021, "epoch": 643} {"train_loss": -5.404117584228516, "global_step": 27022, "epoch": 643} {"train_loss": -5.4167160987854, "global_step": 27023, "epoch": 643} {"train_loss": -5.387815475463867, "global_step": 27024, "epoch": 643} {"train_loss": -5.376350402832031, "global_step": 27025, "epoch": 643} {"train_loss": -5.396121501922607, "global_step": 27026, "epoch": 643} {"train_loss": -5.542688369750977, "global_step": 27027, "epoch": 643} {"train_loss": -5.432546615600586, "global_step": 27028, "epoch": 643} {"train_loss": -5.400181770324707, "global_step": 27029, "epoch": 643} {"train_loss": -5.294801235198975, "global_step": 27030, "epoch": 643} {"train_loss": -5.3593597412109375, "global_step": 27031, "epoch": 643} {"train_loss": -5.329245567321777, "global_step": 27032, "epoch": 643} {"train_loss": -5.298404216766357, "global_step": 27033, "epoch": 643} {"train_loss": -5.525152683258057, "global_step": 27034, "epoch": 643} {"train_loss": -5.3585405349731445, "global_step": 27035, "epoch": 643} {"train_loss": -5.304354667663574, "global_step": 27036, "epoch": 643} {"train_loss": -5.585874080657959, "global_step": 27037, "epoch": 643} {"train_loss": -5.37117862701416, "global_step": 27038, "epoch": 643} {"train_loss": -5.522815227508545, "global_step": 27039, "epoch": 643} {"train_loss": -5.432613372802734, "global_step": 27040, "epoch": 643} {"train_loss": -5.403939723968506, "global_step": 27041, "epoch": 643} {"train_loss": -5.4326324462890625, "global_step": 27042, "epoch": 643} {"train_loss": -5.502366065979004, "global_step": 27043, "epoch": 643} {"train_loss": -5.305665493011475, "global_step": 27044, "epoch": 643} {"train_loss": -5.3697075843811035, "global_step": 27045, "epoch": 643} {"train_loss": -5.271905899047852, "global_step": 27046, "epoch": 643} {"train_loss": -5.408225979123797, "global_step": 27047, "epoch": 643, "val_loss": 76352.578125} {"train_loss": -5.492569923400879, "global_step": 27048, "epoch": 644} {"train_loss": -5.267514228820801, "global_step": 27049, "epoch": 644} {"train_loss": -5.515959739685059, "global_step": 27050, "epoch": 644} {"train_loss": -5.293303489685059, "global_step": 27051, "epoch": 644} {"train_loss": -5.398290157318115, "global_step": 27052, "epoch": 644} {"train_loss": -5.485818386077881, "global_step": 27053, "epoch": 644} {"train_loss": -5.183572769165039, "global_step": 27054, "epoch": 644} {"train_loss": -5.124774932861328, "global_step": 27055, "epoch": 644} {"train_loss": -5.2017645835876465, "global_step": 27056, "epoch": 644} {"train_loss": -5.307868003845215, "global_step": 27057, "epoch": 644} {"train_loss": -5.428048133850098, "global_step": 27058, "epoch": 644} {"train_loss": -5.263263702392578, "global_step": 27059, "epoch": 644} {"train_loss": -5.463663101196289, "global_step": 27060, "epoch": 644} {"train_loss": -5.357553005218506, "global_step": 27061, "epoch": 644} {"train_loss": -5.398479461669922, "global_step": 27062, "epoch": 644} {"train_loss": -5.358797073364258, "global_step": 27063, "epoch": 644} {"train_loss": -5.289490699768066, "global_step": 27064, "epoch": 644} {"train_loss": -5.286884307861328, "global_step": 27065, "epoch": 644} {"train_loss": -5.410683631896973, "global_step": 27066, "epoch": 644} {"train_loss": -5.491168022155762, "global_step": 27067, "epoch": 644} {"train_loss": -5.332025527954102, "global_step": 27068, "epoch": 644} {"train_loss": -5.526889324188232, "global_step": 27069, "epoch": 644} {"train_loss": -5.442122936248779, "global_step": 27070, "epoch": 644} {"train_loss": -5.3701863288879395, "global_step": 27071, "epoch": 644} {"train_loss": -5.290269374847412, "global_step": 27072, "epoch": 644} {"train_loss": -5.336760520935059, "global_step": 27073, "epoch": 644} {"train_loss": -5.314692497253418, "global_step": 27074, "epoch": 644} {"train_loss": -5.369277000427246, "global_step": 27075, "epoch": 644} {"train_loss": -5.5509490966796875, "global_step": 27076, "epoch": 644} {"train_loss": -5.479289531707764, "global_step": 27077, "epoch": 644} {"train_loss": -5.486093521118164, "global_step": 27078, "epoch": 644} {"train_loss": -5.350490570068359, "global_step": 27079, "epoch": 644} {"train_loss": -5.267788887023926, "global_step": 27080, "epoch": 644} {"train_loss": -5.459399700164795, "global_step": 27081, "epoch": 644} {"train_loss": -5.54444694519043, "global_step": 27082, "epoch": 644} {"train_loss": -5.4896440505981445, "global_step": 27083, "epoch": 644} {"train_loss": -5.461530685424805, "global_step": 27084, "epoch": 644} {"train_loss": -5.468559265136719, "global_step": 27085, "epoch": 644} {"train_loss": -5.390547275543213, "global_step": 27086, "epoch": 644} {"train_loss": -5.293100357055664, "global_step": 27087, "epoch": 644} {"train_loss": -5.52408504486084, "global_step": 27088, "epoch": 644} {"train_loss": -5.388245877765474, "global_step": 27089, "epoch": 644, "val_loss": 76071.2578125} {"train_loss": -5.476085186004639, "global_step": 27090, "epoch": 645} {"train_loss": -5.422316551208496, "global_step": 27091, "epoch": 645} {"train_loss": -5.476199150085449, "global_step": 27092, "epoch": 645} {"train_loss": -5.3963303565979, "global_step": 27093, "epoch": 645} {"train_loss": -5.5052571296691895, "global_step": 27094, "epoch": 645} {"train_loss": -5.2914204597473145, "global_step": 27095, "epoch": 645} {"train_loss": -5.411980628967285, "global_step": 27096, "epoch": 645} {"train_loss": -5.35066556930542, "global_step": 27097, "epoch": 645} {"train_loss": -5.429026126861572, "global_step": 27098, "epoch": 645} {"train_loss": -5.339169979095459, "global_step": 27099, "epoch": 645} {"train_loss": -5.317692756652832, "global_step": 27100, "epoch": 645} {"train_loss": -5.392494201660156, "global_step": 27101, "epoch": 645} {"train_loss": -5.298402309417725, "global_step": 27102, "epoch": 645} {"train_loss": -5.197725772857666, "global_step": 27103, "epoch": 645} {"train_loss": -5.329331398010254, "global_step": 27104, "epoch": 645} {"train_loss": -5.246895790100098, "global_step": 27105, "epoch": 645} {"train_loss": -5.369929313659668, "global_step": 27106, "epoch": 645} {"train_loss": -5.405802249908447, "global_step": 27107, "epoch": 645} {"train_loss": -5.431430816650391, "global_step": 27108, "epoch": 645} {"train_loss": -5.373119354248047, "global_step": 27109, "epoch": 645} {"train_loss": -5.383570194244385, "global_step": 27110, "epoch": 645} {"train_loss": -5.393346786499023, "global_step": 27111, "epoch": 645} {"train_loss": -5.355086326599121, "global_step": 27112, "epoch": 645} {"train_loss": -5.411889553070068, "global_step": 27113, "epoch": 645} {"train_loss": -5.457296371459961, "global_step": 27114, "epoch": 645} {"train_loss": -5.463973045349121, "global_step": 27115, "epoch": 645} {"train_loss": -5.371816635131836, "global_step": 27116, "epoch": 645} {"train_loss": -5.417903900146484, "global_step": 27117, "epoch": 645} {"train_loss": -5.368731498718262, "global_step": 27118, "epoch": 645} {"train_loss": -5.376176834106445, "global_step": 27119, "epoch": 645} {"train_loss": -5.329775810241699, "global_step": 27120, "epoch": 645} {"train_loss": -5.445900917053223, "global_step": 27121, "epoch": 645} {"train_loss": -5.45797061920166, "global_step": 27122, "epoch": 645} {"train_loss": -5.296847820281982, "global_step": 27123, "epoch": 645} {"train_loss": -5.315173625946045, "global_step": 27124, "epoch": 645} {"train_loss": -5.481394290924072, "global_step": 27125, "epoch": 645} {"train_loss": -5.460574150085449, "global_step": 27126, "epoch": 645} {"train_loss": -5.540502548217773, "global_step": 27127, "epoch": 645} {"train_loss": -5.372343063354492, "global_step": 27128, "epoch": 645} {"train_loss": -5.390352249145508, "global_step": 27129, "epoch": 645} {"train_loss": -5.424996376037598, "global_step": 27130, "epoch": 645} {"train_loss": -5.392351445697603, "global_step": 27131, "epoch": 645, "val_loss": 75631.6328125} {"train_loss": -5.567223072052002, "global_step": 27132, "epoch": 646} {"train_loss": -5.298378944396973, "global_step": 27133, "epoch": 646} {"train_loss": -5.376172065734863, "global_step": 27134, "epoch": 646} {"train_loss": -5.352463722229004, "global_step": 27135, "epoch": 646} {"train_loss": -5.3338117599487305, "global_step": 27136, "epoch": 646} {"train_loss": -5.381839275360107, "global_step": 27137, "epoch": 646} {"train_loss": -5.289822101593018, "global_step": 27138, "epoch": 646} {"train_loss": -5.4198784828186035, "global_step": 27139, "epoch": 646} {"train_loss": -5.341172218322754, "global_step": 27140, "epoch": 646} {"train_loss": -5.401656150817871, "global_step": 27141, "epoch": 646} {"train_loss": -5.46258544921875, "global_step": 27142, "epoch": 646} {"train_loss": -5.24649715423584, "global_step": 27143, "epoch": 646} {"train_loss": -5.297949314117432, "global_step": 27144, "epoch": 646} {"train_loss": -5.4430694580078125, "global_step": 27145, "epoch": 646} {"train_loss": -5.274259567260742, "global_step": 27146, "epoch": 646} {"train_loss": -5.463596343994141, "global_step": 27147, "epoch": 646} {"train_loss": -5.110541343688965, "global_step": 27148, "epoch": 646} {"train_loss": -5.263261318206787, "global_step": 27149, "epoch": 646} {"train_loss": -5.251263618469238, "global_step": 27150, "epoch": 646} {"train_loss": -5.380002498626709, "global_step": 27151, "epoch": 646} {"train_loss": -5.313397407531738, "global_step": 27152, "epoch": 646} {"train_loss": -5.225898742675781, "global_step": 27153, "epoch": 646} {"train_loss": -5.4086151123046875, "global_step": 27154, "epoch": 646} {"train_loss": -5.3683061599731445, "global_step": 27155, "epoch": 646} {"train_loss": -5.490248680114746, "global_step": 27156, "epoch": 646} {"train_loss": -5.436728477478027, "global_step": 27157, "epoch": 646} {"train_loss": -5.444005966186523, "global_step": 27158, "epoch": 646} {"train_loss": -5.411223411560059, "global_step": 27159, "epoch": 646} {"train_loss": -5.318182945251465, "global_step": 27160, "epoch": 646} {"train_loss": -5.4824628829956055, "global_step": 27161, "epoch": 646} {"train_loss": -5.4593892097473145, "global_step": 27162, "epoch": 646} {"train_loss": -5.387937545776367, "global_step": 27163, "epoch": 646} {"train_loss": -5.4008636474609375, "global_step": 27164, "epoch": 646} {"train_loss": -5.396142482757568, "global_step": 27165, "epoch": 646} {"train_loss": -5.398077011108398, "global_step": 27166, "epoch": 646} {"train_loss": -5.341555595397949, "global_step": 27167, "epoch": 646} {"train_loss": -5.485403060913086, "global_step": 27168, "epoch": 646} {"train_loss": -5.391451358795166, "global_step": 27169, "epoch": 646} {"train_loss": -5.434340000152588, "global_step": 27170, "epoch": 646} {"train_loss": -5.505397796630859, "global_step": 27171, "epoch": 646} {"train_loss": -5.472306251525879, "global_step": 27172, "epoch": 646} {"train_loss": -5.380693015598116, "global_step": 27173, "epoch": 646, "val_loss": 75962.6015625} {"train_loss": -5.413175106048584, "global_step": 27174, "epoch": 647} {"train_loss": -5.309995174407959, "global_step": 27175, "epoch": 647} {"train_loss": -5.423622131347656, "global_step": 27176, "epoch": 647} {"train_loss": -5.5115461349487305, "global_step": 27177, "epoch": 647} {"train_loss": -5.399681568145752, "global_step": 27178, "epoch": 647} {"train_loss": -5.440566062927246, "global_step": 27179, "epoch": 647} {"train_loss": -5.305018901824951, "global_step": 27180, "epoch": 647} {"train_loss": -5.4849934577941895, "global_step": 27181, "epoch": 647} {"train_loss": -5.532314300537109, "global_step": 27182, "epoch": 647} {"train_loss": -5.375245094299316, "global_step": 27183, "epoch": 647} {"train_loss": -5.327392578125, "global_step": 27184, "epoch": 647} {"train_loss": -5.351398468017578, "global_step": 27185, "epoch": 647} {"train_loss": -5.260004997253418, "global_step": 27186, "epoch": 647} {"train_loss": -5.369736671447754, "global_step": 27187, "epoch": 647} {"train_loss": -5.456899166107178, "global_step": 27188, "epoch": 647} {"train_loss": -5.398836135864258, "global_step": 27189, "epoch": 647} {"train_loss": -5.521286487579346, "global_step": 27190, "epoch": 647} {"train_loss": -5.412335395812988, "global_step": 27191, "epoch": 647} {"train_loss": -5.556168556213379, "global_step": 27192, "epoch": 647} {"train_loss": -5.500848293304443, "global_step": 27193, "epoch": 647} {"train_loss": -5.4308977127075195, "global_step": 27194, "epoch": 647} {"train_loss": -5.5160603523254395, "global_step": 27195, "epoch": 647} {"train_loss": -5.419062614440918, "global_step": 27196, "epoch": 647} {"train_loss": -5.660073757171631, "global_step": 27197, "epoch": 647} {"train_loss": -5.392531394958496, "global_step": 27198, "epoch": 647} {"train_loss": -5.477471828460693, "global_step": 27199, "epoch": 647} {"train_loss": -5.45201301574707, "global_step": 27200, "epoch": 647} {"train_loss": -5.399369239807129, "global_step": 27201, "epoch": 647} {"train_loss": -5.491785049438477, "global_step": 27202, "epoch": 647} {"train_loss": -5.54325008392334, "global_step": 27203, "epoch": 647} {"train_loss": -5.535900115966797, "global_step": 27204, "epoch": 647} {"train_loss": -5.564918041229248, "global_step": 27205, "epoch": 647} {"train_loss": -5.556595325469971, "global_step": 27206, "epoch": 647} {"train_loss": -5.538996696472168, "global_step": 27207, "epoch": 647} {"train_loss": -5.402631759643555, "global_step": 27208, "epoch": 647} {"train_loss": -5.404531478881836, "global_step": 27209, "epoch": 647} {"train_loss": -5.3745927810668945, "global_step": 27210, "epoch": 647} {"train_loss": -5.573553562164307, "global_step": 27211, "epoch": 647} {"train_loss": -5.447381973266602, "global_step": 27212, "epoch": 647} {"train_loss": -5.342650890350342, "global_step": 27213, "epoch": 647} {"train_loss": -5.457659721374512, "global_step": 27214, "epoch": 647} {"train_loss": -5.443121626263573, "global_step": 27215, "epoch": 647, "val_loss": 74794.2421875} {"train_loss": -5.388136863708496, "global_step": 27216, "epoch": 648} {"train_loss": -5.2295241355896, "global_step": 27217, "epoch": 648} {"train_loss": -5.458907127380371, "global_step": 27218, "epoch": 648} {"train_loss": -5.401019096374512, "global_step": 27219, "epoch": 648} {"train_loss": -5.371725082397461, "global_step": 27220, "epoch": 648} {"train_loss": -5.463423252105713, "global_step": 27221, "epoch": 648} {"train_loss": -5.370298385620117, "global_step": 27222, "epoch": 648} {"train_loss": -5.440167427062988, "global_step": 27223, "epoch": 648} {"train_loss": -5.444221496582031, "global_step": 27224, "epoch": 648} {"train_loss": -5.436885356903076, "global_step": 27225, "epoch": 648} {"train_loss": -5.375838279724121, "global_step": 27226, "epoch": 648} {"train_loss": -5.541404724121094, "global_step": 27227, "epoch": 648} {"train_loss": -5.432072162628174, "global_step": 27228, "epoch": 648} {"train_loss": -5.3911027908325195, "global_step": 27229, "epoch": 648} {"train_loss": -5.401190280914307, "global_step": 27230, "epoch": 648} {"train_loss": -5.468480110168457, "global_step": 27231, "epoch": 648} {"train_loss": -5.357039928436279, "global_step": 27232, "epoch": 648} {"train_loss": -5.3903374671936035, "global_step": 27233, "epoch": 648} {"train_loss": -5.478979110717773, "global_step": 27234, "epoch": 648} {"train_loss": -5.376116752624512, "global_step": 27235, "epoch": 648} {"train_loss": -5.489213466644287, "global_step": 27236, "epoch": 648} {"train_loss": -5.246084213256836, "global_step": 27237, "epoch": 648} {"train_loss": -5.421173095703125, "global_step": 27238, "epoch": 648} {"train_loss": -5.386568069458008, "global_step": 27239, "epoch": 648} {"train_loss": -5.3304853439331055, "global_step": 27240, "epoch": 648} {"train_loss": -5.360637664794922, "global_step": 27241, "epoch": 648} {"train_loss": -5.474858283996582, "global_step": 27242, "epoch": 648} {"train_loss": -5.501138687133789, "global_step": 27243, "epoch": 648} {"train_loss": -5.469246864318848, "global_step": 27244, "epoch": 648} {"train_loss": -5.3950300216674805, "global_step": 27245, "epoch": 648} {"train_loss": -5.451606750488281, "global_step": 27246, "epoch": 648} {"train_loss": -5.451929092407227, "global_step": 27247, "epoch": 648} {"train_loss": -5.360552787780762, "global_step": 27248, "epoch": 648} {"train_loss": -5.551502704620361, "global_step": 27249, "epoch": 648} {"train_loss": -5.367812156677246, "global_step": 27250, "epoch": 648} {"train_loss": -5.300173282623291, "global_step": 27251, "epoch": 648} {"train_loss": -5.397951126098633, "global_step": 27252, "epoch": 648} {"train_loss": -5.494450569152832, "global_step": 27253, "epoch": 648} {"train_loss": -5.554914474487305, "global_step": 27254, "epoch": 648} {"train_loss": -5.461535453796387, "global_step": 27255, "epoch": 648} {"train_loss": -5.525777339935303, "global_step": 27256, "epoch": 648} {"train_loss": -5.419386000860305, "global_step": 27257, "epoch": 648, "val_loss": 75785.96875} {"train_loss": -5.401742935180664, "global_step": 27258, "epoch": 649} {"train_loss": -5.399324893951416, "global_step": 27259, "epoch": 649} {"train_loss": -5.4730963706970215, "global_step": 27260, "epoch": 649} {"train_loss": -5.455591678619385, "global_step": 27261, "epoch": 649} {"train_loss": -5.586635589599609, "global_step": 27262, "epoch": 649} {"train_loss": -5.485400199890137, "global_step": 27263, "epoch": 649} {"train_loss": -5.397366046905518, "global_step": 27264, "epoch": 649} {"train_loss": -5.440421104431152, "global_step": 27265, "epoch": 649} {"train_loss": -5.6316819190979, "global_step": 27266, "epoch": 649} {"train_loss": -5.556878566741943, "global_step": 27267, "epoch": 649} {"train_loss": -5.415334701538086, "global_step": 27268, "epoch": 649} {"train_loss": -5.514756202697754, "global_step": 27269, "epoch": 649} {"train_loss": -5.3152546882629395, "global_step": 27270, "epoch": 649} {"train_loss": -5.483923435211182, "global_step": 27271, "epoch": 649} {"train_loss": -5.416512489318848, "global_step": 27272, "epoch": 649} {"train_loss": -5.447972297668457, "global_step": 27273, "epoch": 649} {"train_loss": -5.54055118560791, "global_step": 27274, "epoch": 649} {"train_loss": -5.432551383972168, "global_step": 27275, "epoch": 649} {"train_loss": -5.500479221343994, "global_step": 27276, "epoch": 649} {"train_loss": -5.465321063995361, "global_step": 27277, "epoch": 649} {"train_loss": -5.351179599761963, "global_step": 27278, "epoch": 649} {"train_loss": -5.516472816467285, "global_step": 27279, "epoch": 649} {"train_loss": -5.441105842590332, "global_step": 27280, "epoch": 649} {"train_loss": -5.394853591918945, "global_step": 27281, "epoch": 649} {"train_loss": -5.459022045135498, "global_step": 27282, "epoch": 649} {"train_loss": -5.319171905517578, "global_step": 27283, "epoch": 649} {"train_loss": -5.457827091217041, "global_step": 27284, "epoch": 649} {"train_loss": -5.349375247955322, "global_step": 27285, "epoch": 649} {"train_loss": -5.40799617767334, "global_step": 27286, "epoch": 649} {"train_loss": -5.308445930480957, "global_step": 27287, "epoch": 649} {"train_loss": -5.366532325744629, "global_step": 27288, "epoch": 649} {"train_loss": -5.410348415374756, "global_step": 27289, "epoch": 649} {"train_loss": -5.3919477462768555, "global_step": 27290, "epoch": 649} {"train_loss": -5.37919282913208, "global_step": 27291, "epoch": 649} {"train_loss": -5.415433883666992, "global_step": 27292, "epoch": 649} {"train_loss": -5.412550926208496, "global_step": 27293, "epoch": 649} {"train_loss": -5.40437650680542, "global_step": 27294, "epoch": 649} {"train_loss": -5.435602188110352, "global_step": 27295, "epoch": 649} {"train_loss": -5.322412014007568, "global_step": 27296, "epoch": 649} {"train_loss": -5.289248466491699, "global_step": 27297, "epoch": 649} {"train_loss": -5.438554763793945, "global_step": 27298, "epoch": 649} {"train_loss": -5.428721348444621, "global_step": 27299, "epoch": 649, "val_loss": 75467.1640625} {"train_loss": -5.440181255340576, "global_step": 27300, "epoch": 650} {"train_loss": -5.391967296600342, "global_step": 27301, "epoch": 650} {"train_loss": -5.55484676361084, "global_step": 27302, "epoch": 650} {"train_loss": -5.3185529708862305, "global_step": 27303, "epoch": 650} {"train_loss": -5.431154727935791, "global_step": 27304, "epoch": 650} {"train_loss": -5.369963645935059, "global_step": 27305, "epoch": 650} {"train_loss": -5.187249660491943, "global_step": 27306, "epoch": 650} {"train_loss": -5.438686370849609, "global_step": 27307, "epoch": 650} {"train_loss": -5.1626996994018555, "global_step": 27308, "epoch": 650} {"train_loss": -5.326309680938721, "global_step": 27309, "epoch": 650} {"train_loss": -5.329151630401611, "global_step": 27310, "epoch": 650} {"train_loss": -5.208202362060547, "global_step": 27311, "epoch": 650} {"train_loss": -5.404064178466797, "global_step": 27312, "epoch": 650} {"train_loss": -5.331239700317383, "global_step": 27313, "epoch": 650} {"train_loss": -5.3816142082214355, "global_step": 27314, "epoch": 650} {"train_loss": -5.4400529861450195, "global_step": 27315, "epoch": 650} {"train_loss": -5.414556980133057, "global_step": 27316, "epoch": 650} {"train_loss": -5.434957027435303, "global_step": 27317, "epoch": 650} {"train_loss": -5.336735725402832, "global_step": 27318, "epoch": 650} {"train_loss": -5.418279647827148, "global_step": 27319, "epoch": 650} {"train_loss": -5.387350082397461, "global_step": 27320, "epoch": 650} {"train_loss": -5.32883882522583, "global_step": 27321, "epoch": 650} {"train_loss": -5.331158638000488, "global_step": 27322, "epoch": 650} {"train_loss": -5.443772315979004, "global_step": 27323, "epoch": 650} {"train_loss": -5.496699333190918, "global_step": 27324, "epoch": 650} {"train_loss": -5.453945636749268, "global_step": 27325, "epoch": 650} {"train_loss": -5.524320602416992, "global_step": 27326, "epoch": 650} {"train_loss": -5.392409324645996, "global_step": 27327, "epoch": 650} {"train_loss": -5.47557258605957, "global_step": 27328, "epoch": 650} {"train_loss": -5.392914295196533, "global_step": 27329, "epoch": 650} {"train_loss": -5.354442596435547, "global_step": 27330, "epoch": 650} {"train_loss": -5.538857460021973, "global_step": 27331, "epoch": 650} {"train_loss": -5.268249988555908, "global_step": 27332, "epoch": 650} {"train_loss": -5.496908187866211, "global_step": 27333, "epoch": 650} {"train_loss": -5.481348991394043, "global_step": 27334, "epoch": 650} {"train_loss": -5.384969711303711, "global_step": 27335, "epoch": 650} {"train_loss": -5.470130920410156, "global_step": 27336, "epoch": 650} {"train_loss": -5.329385757446289, "global_step": 27337, "epoch": 650} {"train_loss": -5.382267951965332, "global_step": 27338, "epoch": 650} {"train_loss": -5.482884883880615, "global_step": 27339, "epoch": 650} {"train_loss": -5.415349006652832, "global_step": 27340, "epoch": 650} {"train_loss": -5.3958441984085805, "global_step": 27341, "epoch": 650, "train/sim_max_reward_0": 0.2522498378477222, "train/sim_max_reward_1": 0.15209366586168904, "train/sim_max_reward_2": 0.9008590679831874, "train/sim_max_reward_3": 0.165893633980918, "train/sim_max_reward_4": 0.8626743005842405, "train/sim_max_reward_5": 0.30698827246420207, "test/sim_max_reward_4500000": 0.8420738603387057, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.47280999919274636, "test/sim_max_reward_4500003": 0.5650057546624806, "test/sim_max_reward_4500004": 0.057834396720529126, "test/sim_max_reward_4500005": 0.3582492878787628, "test/sim_max_reward_4500006": 0.4310462671283696, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.14010319035430777, "test/sim_max_reward_4500009": 0.7195719463166371, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.34715901630829743, "test/sim_max_reward_4500012": 0.00033874784108770537, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.3531065481394175, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.38548870782958794, "test/sim_max_reward_4500019": 0.39508153283368475, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.30084959469876804, "test/sim_max_reward_4500022": 0.6978697400239964, "test/sim_max_reward_4500023": 0.5487093740945992, "test/sim_max_reward_4500024": 0.4359498860737422, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.5205873472351571, "test/sim_max_reward_4500027": 0.7495866893428277, "test/sim_max_reward_4500028": 0.4299863828765311, "test/sim_max_reward_4500029": 0.04163460642148004, "test/sim_max_reward_4500030": 0.16481651202644143, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.31741651281790195, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.7434917268051919, "test/sim_max_reward_4500035": 0.8849955433632379, "test/sim_max_reward_4500036": 0.39328751885503144, "test/sim_max_reward_4500037": 0.20709220783936455, "test/sim_max_reward_4500038": 0.9283063578178067, "test/sim_max_reward_4500039": 0.6381344603304708, "test/sim_max_reward_4500040": 0.16098505188808257, "test/sim_max_reward_4500041": 0.1790285908032239, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.567256457278159, "test/sim_max_reward_4500044": 0.5196824030076879, "test/sim_max_reward_4500045": 0.35558620305402616, "test/sim_max_reward_4500046": 0.61931525627049, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.4807535894853694, "test/sim_max_reward_4500049": 0.02286088287471423, "train/mean_score": 0.4401264631203265, "test/mean_score": 0.3198743886854152, "val_loss": 76044.890625} {"train_loss": -5.42941951751709, "global_step": 27342, "epoch": 651} {"train_loss": -5.442346096038818, "global_step": 27343, "epoch": 651} {"train_loss": -5.42586088180542, "global_step": 27344, "epoch": 651} {"train_loss": -5.419217109680176, "global_step": 27345, "epoch": 651} {"train_loss": -5.436551094055176, "global_step": 27346, "epoch": 651} {"train_loss": -5.430487155914307, "global_step": 27347, "epoch": 651} {"train_loss": -5.459474086761475, "global_step": 27348, "epoch": 651} {"train_loss": -5.46504020690918, "global_step": 27349, "epoch": 651} {"train_loss": -5.406231880187988, "global_step": 27350, "epoch": 651} {"train_loss": -5.497830390930176, "global_step": 27351, "epoch": 651} {"train_loss": -5.409194469451904, "global_step": 27352, "epoch": 651} {"train_loss": -5.351806640625, "global_step": 27353, "epoch": 651} {"train_loss": -5.269043445587158, "global_step": 27354, "epoch": 651} {"train_loss": -5.316702842712402, "global_step": 27355, "epoch": 651} {"train_loss": -5.4845428466796875, "global_step": 27356, "epoch": 651} {"train_loss": -5.425459861755371, "global_step": 27357, "epoch": 651} {"train_loss": -5.330260753631592, "global_step": 27358, "epoch": 651} {"train_loss": -5.487382411956787, "global_step": 27359, "epoch": 651} {"train_loss": -5.516706943511963, "global_step": 27360, "epoch": 651} {"train_loss": -5.422545909881592, "global_step": 27361, "epoch": 651} {"train_loss": -5.585570335388184, "global_step": 27362, "epoch": 651} {"train_loss": -5.500890731811523, "global_step": 27363, "epoch": 651} {"train_loss": -5.543795108795166, "global_step": 27364, "epoch": 651} {"train_loss": -5.464559078216553, "global_step": 27365, "epoch": 651} {"train_loss": -5.297543525695801, "global_step": 27366, "epoch": 651} {"train_loss": -5.330592155456543, "global_step": 27367, "epoch": 651} {"train_loss": -5.3049421310424805, "global_step": 27368, "epoch": 651} {"train_loss": -5.340230941772461, "global_step": 27369, "epoch": 651} {"train_loss": -5.449580669403076, "global_step": 27370, "epoch": 651} {"train_loss": -5.477448463439941, "global_step": 27371, "epoch": 651} {"train_loss": -5.6361870765686035, "global_step": 27372, "epoch": 651} {"train_loss": -5.419743537902832, "global_step": 27373, "epoch": 651} {"train_loss": -5.385507583618164, "global_step": 27374, "epoch": 651} {"train_loss": -5.3445305824279785, "global_step": 27375, "epoch": 651} {"train_loss": -5.370111465454102, "global_step": 27376, "epoch": 651} {"train_loss": -5.380897045135498, "global_step": 27377, "epoch": 651} {"train_loss": -5.385251998901367, "global_step": 27378, "epoch": 651} {"train_loss": -5.428776741027832, "global_step": 27379, "epoch": 651} {"train_loss": -5.252224922180176, "global_step": 27380, "epoch": 651} {"train_loss": -5.534334659576416, "global_step": 27381, "epoch": 651} {"train_loss": -5.46730899810791, "global_step": 27382, "epoch": 651} {"train_loss": -5.423455056690035, "global_step": 27383, "epoch": 651, "val_loss": 75945.859375} {"train_loss": -5.4213666915893555, "global_step": 27384, "epoch": 652} {"train_loss": -5.393807411193848, "global_step": 27385, "epoch": 652} {"train_loss": -5.543778419494629, "global_step": 27386, "epoch": 652} {"train_loss": -5.4866623878479, "global_step": 27387, "epoch": 652} {"train_loss": -5.373715877532959, "global_step": 27388, "epoch": 652} {"train_loss": -5.444487571716309, "global_step": 27389, "epoch": 652} {"train_loss": -5.35916805267334, "global_step": 27390, "epoch": 652} {"train_loss": -5.471286773681641, "global_step": 27391, "epoch": 652} {"train_loss": -5.386725902557373, "global_step": 27392, "epoch": 652} {"train_loss": -5.362585067749023, "global_step": 27393, "epoch": 652} {"train_loss": -5.596749305725098, "global_step": 27394, "epoch": 652} {"train_loss": -5.420929431915283, "global_step": 27395, "epoch": 652} {"train_loss": -5.33935546875, "global_step": 27396, "epoch": 652} {"train_loss": -5.45412540435791, "global_step": 27397, "epoch": 652} {"train_loss": -5.454978942871094, "global_step": 27398, "epoch": 652} {"train_loss": -5.380875587463379, "global_step": 27399, "epoch": 652} {"train_loss": -5.471148490905762, "global_step": 27400, "epoch": 652} {"train_loss": -5.3527116775512695, "global_step": 27401, "epoch": 652} {"train_loss": -5.4641008377075195, "global_step": 27402, "epoch": 652} {"train_loss": -5.452148914337158, "global_step": 27403, "epoch": 652} {"train_loss": -5.295551300048828, "global_step": 27404, "epoch": 652} {"train_loss": -5.400718688964844, "global_step": 27405, "epoch": 652} {"train_loss": -5.574697971343994, "global_step": 27406, "epoch": 652} {"train_loss": -5.5001444816589355, "global_step": 27407, "epoch": 652} {"train_loss": -5.309040069580078, "global_step": 27408, "epoch": 652} {"train_loss": -5.333835601806641, "global_step": 27409, "epoch": 652} {"train_loss": -5.417707443237305, "global_step": 27410, "epoch": 652} {"train_loss": -5.393267631530762, "global_step": 27411, "epoch": 652} {"train_loss": -5.441210746765137, "global_step": 27412, "epoch": 652} {"train_loss": -5.534602165222168, "global_step": 27413, "epoch": 652} {"train_loss": -5.633767127990723, "global_step": 27414, "epoch": 652} {"train_loss": -5.425568580627441, "global_step": 27415, "epoch": 652} {"train_loss": -5.390259265899658, "global_step": 27416, "epoch": 652} {"train_loss": -5.549305438995361, "global_step": 27417, "epoch": 652} {"train_loss": -5.419142246246338, "global_step": 27418, "epoch": 652} {"train_loss": -5.385009288787842, "global_step": 27419, "epoch": 652} {"train_loss": -5.4750566482543945, "global_step": 27420, "epoch": 652} {"train_loss": -5.4639716148376465, "global_step": 27421, "epoch": 652} {"train_loss": -5.330172061920166, "global_step": 27422, "epoch": 652} {"train_loss": -5.417513370513916, "global_step": 27423, "epoch": 652} {"train_loss": -5.552411079406738, "global_step": 27424, "epoch": 652} {"train_loss": -5.435174680891491, "global_step": 27425, "epoch": 652, "val_loss": 75334.2265625} {"train_loss": -5.42244815826416, "global_step": 27426, "epoch": 653} {"train_loss": -5.37578010559082, "global_step": 27427, "epoch": 653} {"train_loss": -5.404078960418701, "global_step": 27428, "epoch": 653} {"train_loss": -5.310935020446777, "global_step": 27429, "epoch": 653} {"train_loss": -5.4452924728393555, "global_step": 27430, "epoch": 653} {"train_loss": -5.3091206550598145, "global_step": 27431, "epoch": 653} {"train_loss": -5.3241376876831055, "global_step": 27432, "epoch": 653} {"train_loss": -5.378775119781494, "global_step": 27433, "epoch": 653} {"train_loss": -5.326902389526367, "global_step": 27434, "epoch": 653} {"train_loss": -5.3659162521362305, "global_step": 27435, "epoch": 653} {"train_loss": -5.436152458190918, "global_step": 27436, "epoch": 653} {"train_loss": -5.245445728302002, "global_step": 27437, "epoch": 653} {"train_loss": -5.393552780151367, "global_step": 27438, "epoch": 653} {"train_loss": -5.316367149353027, "global_step": 27439, "epoch": 653} {"train_loss": -5.468172073364258, "global_step": 27440, "epoch": 653} {"train_loss": -5.263227462768555, "global_step": 27441, "epoch": 653} {"train_loss": -5.447339057922363, "global_step": 27442, "epoch": 653} {"train_loss": -5.333996772766113, "global_step": 27443, "epoch": 653} {"train_loss": -5.4161858558654785, "global_step": 27444, "epoch": 653} {"train_loss": -5.349634647369385, "global_step": 27445, "epoch": 653} {"train_loss": -5.4864935874938965, "global_step": 27446, "epoch": 653} {"train_loss": -5.486217498779297, "global_step": 27447, "epoch": 653} {"train_loss": -5.33851432800293, "global_step": 27448, "epoch": 653} {"train_loss": -5.4566144943237305, "global_step": 27449, "epoch": 653} {"train_loss": -5.368159294128418, "global_step": 27450, "epoch": 653} {"train_loss": -5.474969387054443, "global_step": 27451, "epoch": 653} {"train_loss": -5.517253875732422, "global_step": 27452, "epoch": 653} {"train_loss": -5.523888111114502, "global_step": 27453, "epoch": 653} {"train_loss": -5.415811538696289, "global_step": 27454, "epoch": 653} {"train_loss": -5.457859039306641, "global_step": 27455, "epoch": 653} {"train_loss": -5.502429008483887, "global_step": 27456, "epoch": 653} {"train_loss": -5.541787147521973, "global_step": 27457, "epoch": 653} {"train_loss": -5.442413806915283, "global_step": 27458, "epoch": 653} {"train_loss": -5.436653137207031, "global_step": 27459, "epoch": 653} {"train_loss": -5.392746925354004, "global_step": 27460, "epoch": 653} {"train_loss": -5.368036270141602, "global_step": 27461, "epoch": 653} {"train_loss": -5.409687042236328, "global_step": 27462, "epoch": 653} {"train_loss": -5.40339469909668, "global_step": 27463, "epoch": 653} {"train_loss": -5.52937650680542, "global_step": 27464, "epoch": 653} {"train_loss": -5.523504257202148, "global_step": 27465, "epoch": 653} {"train_loss": -5.3935227394104, "global_step": 27466, "epoch": 653} {"train_loss": -5.411256642568679, "global_step": 27467, "epoch": 653, "val_loss": 75483.890625} {"train_loss": -5.475679397583008, "global_step": 27468, "epoch": 654} {"train_loss": -5.429518699645996, "global_step": 27469, "epoch": 654} {"train_loss": -5.27561092376709, "global_step": 27470, "epoch": 654} {"train_loss": -5.494622230529785, "global_step": 27471, "epoch": 654} {"train_loss": -5.350029945373535, "global_step": 27472, "epoch": 654} {"train_loss": -5.420031547546387, "global_step": 27473, "epoch": 654} {"train_loss": -5.511423587799072, "global_step": 27474, "epoch": 654} {"train_loss": -5.47816801071167, "global_step": 27475, "epoch": 654} {"train_loss": -5.38385009765625, "global_step": 27476, "epoch": 654} {"train_loss": -5.529264450073242, "global_step": 27477, "epoch": 654} {"train_loss": -5.425412178039551, "global_step": 27478, "epoch": 654} {"train_loss": -5.421895980834961, "global_step": 27479, "epoch": 654} {"train_loss": -5.488525390625, "global_step": 27480, "epoch": 654} {"train_loss": -5.488772869110107, "global_step": 27481, "epoch": 654} {"train_loss": -5.316059112548828, "global_step": 27482, "epoch": 654} {"train_loss": -5.489340305328369, "global_step": 27483, "epoch": 654} {"train_loss": -5.447778701782227, "global_step": 27484, "epoch": 654} {"train_loss": -5.45890474319458, "global_step": 27485, "epoch": 654} {"train_loss": -5.414453506469727, "global_step": 27486, "epoch": 654} {"train_loss": -5.415432929992676, "global_step": 27487, "epoch": 654} {"train_loss": -5.358905792236328, "global_step": 27488, "epoch": 654} {"train_loss": -5.511989593505859, "global_step": 27489, "epoch": 654} {"train_loss": -5.332396030426025, "global_step": 27490, "epoch": 654} {"train_loss": -5.422426700592041, "global_step": 27491, "epoch": 654} {"train_loss": -5.470807075500488, "global_step": 27492, "epoch": 654} {"train_loss": -5.26822566986084, "global_step": 27493, "epoch": 654} {"train_loss": -5.285207748413086, "global_step": 27494, "epoch": 654} {"train_loss": -5.418671607971191, "global_step": 27495, "epoch": 654} {"train_loss": -5.27517032623291, "global_step": 27496, "epoch": 654} {"train_loss": -5.5174970626831055, "global_step": 27497, "epoch": 654} {"train_loss": -5.2172651290893555, "global_step": 27498, "epoch": 654} {"train_loss": -5.3993706703186035, "global_step": 27499, "epoch": 654} {"train_loss": -5.417047500610352, "global_step": 27500, "epoch": 654} {"train_loss": -5.453747749328613, "global_step": 27501, "epoch": 654} {"train_loss": -5.383514404296875, "global_step": 27502, "epoch": 654} {"train_loss": -5.279538154602051, "global_step": 27503, "epoch": 654} {"train_loss": -5.432891845703125, "global_step": 27504, "epoch": 654} {"train_loss": -5.408674240112305, "global_step": 27505, "epoch": 654} {"train_loss": -5.395264625549316, "global_step": 27506, "epoch": 654} {"train_loss": -5.4953789710998535, "global_step": 27507, "epoch": 654} {"train_loss": -5.580776214599609, "global_step": 27508, "epoch": 654} {"train_loss": -5.41657262756711, "global_step": 27509, "epoch": 654, "val_loss": 75736.1875} {"train_loss": -5.401304721832275, "global_step": 27510, "epoch": 655} {"train_loss": -5.564423084259033, "global_step": 27511, "epoch": 655} {"train_loss": -5.532228469848633, "global_step": 27512, "epoch": 655} {"train_loss": -5.437056541442871, "global_step": 27513, "epoch": 655} {"train_loss": -5.3536248207092285, "global_step": 27514, "epoch": 655} {"train_loss": -5.476920127868652, "global_step": 27515, "epoch": 655} {"train_loss": -5.318285942077637, "global_step": 27516, "epoch": 655} {"train_loss": -5.447896957397461, "global_step": 27517, "epoch": 655} {"train_loss": -5.377499103546143, "global_step": 27518, "epoch": 655} {"train_loss": -5.456484794616699, "global_step": 27519, "epoch": 655} {"train_loss": -5.424588680267334, "global_step": 27520, "epoch": 655} {"train_loss": -5.361276626586914, "global_step": 27521, "epoch": 655} {"train_loss": -5.430968761444092, "global_step": 27522, "epoch": 655} {"train_loss": -5.404278755187988, "global_step": 27523, "epoch": 655} {"train_loss": -5.359257221221924, "global_step": 27524, "epoch": 655} {"train_loss": -5.438083648681641, "global_step": 27525, "epoch": 655} {"train_loss": -5.367499828338623, "global_step": 27526, "epoch": 655} {"train_loss": -5.484334945678711, "global_step": 27527, "epoch": 655} {"train_loss": -5.527606010437012, "global_step": 27528, "epoch": 655} {"train_loss": -5.454877853393555, "global_step": 27529, "epoch": 655} {"train_loss": -5.40252685546875, "global_step": 27530, "epoch": 655} {"train_loss": -5.54990291595459, "global_step": 27531, "epoch": 655} {"train_loss": -5.46049690246582, "global_step": 27532, "epoch": 655} {"train_loss": -5.528921127319336, "global_step": 27533, "epoch": 655} {"train_loss": -5.510769844055176, "global_step": 27534, "epoch": 655} {"train_loss": -5.41747522354126, "global_step": 27535, "epoch": 655} {"train_loss": -5.373607635498047, "global_step": 27536, "epoch": 655} {"train_loss": -5.535858154296875, "global_step": 27537, "epoch": 655} {"train_loss": -5.37362003326416, "global_step": 27538, "epoch": 655} {"train_loss": -5.378604888916016, "global_step": 27539, "epoch": 655} {"train_loss": -5.333461761474609, "global_step": 27540, "epoch": 655} {"train_loss": -5.339195251464844, "global_step": 27541, "epoch": 655} {"train_loss": -5.524168968200684, "global_step": 27542, "epoch": 655} {"train_loss": -5.3374223709106445, "global_step": 27543, "epoch": 655} {"train_loss": -5.3947672843933105, "global_step": 27544, "epoch": 655} {"train_loss": -5.38806676864624, "global_step": 27545, "epoch": 655} {"train_loss": -5.4937744140625, "global_step": 27546, "epoch": 655} {"train_loss": -5.349252223968506, "global_step": 27547, "epoch": 655} {"train_loss": -5.532912254333496, "global_step": 27548, "epoch": 655} {"train_loss": -5.404202938079834, "global_step": 27549, "epoch": 655} {"train_loss": -5.348270416259766, "global_step": 27550, "epoch": 655} {"train_loss": -5.426938284011114, "global_step": 27551, "epoch": 655, "val_loss": 76554.2109375} {"train_loss": -5.4308977127075195, "global_step": 27552, "epoch": 656} {"train_loss": -5.396417617797852, "global_step": 27553, "epoch": 656} {"train_loss": -5.416550636291504, "global_step": 27554, "epoch": 656} {"train_loss": -5.2565155029296875, "global_step": 27555, "epoch": 656} {"train_loss": -5.483003616333008, "global_step": 27556, "epoch": 656} {"train_loss": -5.528716087341309, "global_step": 27557, "epoch": 656} {"train_loss": -5.320619106292725, "global_step": 27558, "epoch": 656} {"train_loss": -5.369193077087402, "global_step": 27559, "epoch": 656} {"train_loss": -5.315171718597412, "global_step": 27560, "epoch": 656} {"train_loss": -5.400573253631592, "global_step": 27561, "epoch": 656} {"train_loss": -5.4466047286987305, "global_step": 27562, "epoch": 656} {"train_loss": -5.430525779724121, "global_step": 27563, "epoch": 656} {"train_loss": -5.361440658569336, "global_step": 27564, "epoch": 656} {"train_loss": -5.386900424957275, "global_step": 27565, "epoch": 656} {"train_loss": -5.448890686035156, "global_step": 27566, "epoch": 656} {"train_loss": -5.496820449829102, "global_step": 27567, "epoch": 656} {"train_loss": -5.365233421325684, "global_step": 27568, "epoch": 656} {"train_loss": -5.310500621795654, "global_step": 27569, "epoch": 656} {"train_loss": -5.366294860839844, "global_step": 27570, "epoch": 656} {"train_loss": -5.486255645751953, "global_step": 27571, "epoch": 656} {"train_loss": -5.46888542175293, "global_step": 27572, "epoch": 656} {"train_loss": -5.481565475463867, "global_step": 27573, "epoch": 656} {"train_loss": -5.41202449798584, "global_step": 27574, "epoch": 656} {"train_loss": -5.547346115112305, "global_step": 27575, "epoch": 656} {"train_loss": -5.443636417388916, "global_step": 27576, "epoch": 656} {"train_loss": -5.51297664642334, "global_step": 27577, "epoch": 656} {"train_loss": -5.354190826416016, "global_step": 27578, "epoch": 656} {"train_loss": -5.385868549346924, "global_step": 27579, "epoch": 656} {"train_loss": -5.5160112380981445, "global_step": 27580, "epoch": 656} {"train_loss": -5.43048095703125, "global_step": 27581, "epoch": 656} {"train_loss": -5.430638313293457, "global_step": 27582, "epoch": 656} {"train_loss": -5.508251190185547, "global_step": 27583, "epoch": 656} {"train_loss": -5.4289631843566895, "global_step": 27584, "epoch": 656} {"train_loss": -5.4320969581604, "global_step": 27585, "epoch": 656} {"train_loss": -5.362424850463867, "global_step": 27586, "epoch": 656} {"train_loss": -5.405435085296631, "global_step": 27587, "epoch": 656} {"train_loss": -5.384357929229736, "global_step": 27588, "epoch": 656} {"train_loss": -5.525966644287109, "global_step": 27589, "epoch": 656} {"train_loss": -5.348714828491211, "global_step": 27590, "epoch": 656} {"train_loss": -5.313568592071533, "global_step": 27591, "epoch": 656} {"train_loss": -5.525678634643555, "global_step": 27592, "epoch": 656} {"train_loss": -5.422101895014445, "global_step": 27593, "epoch": 656, "val_loss": 75856.1640625} {"train_loss": -5.366628646850586, "global_step": 27594, "epoch": 657} {"train_loss": -5.405974864959717, "global_step": 27595, "epoch": 657} {"train_loss": -5.515169143676758, "global_step": 27596, "epoch": 657} {"train_loss": -5.3534255027771, "global_step": 27597, "epoch": 657} {"train_loss": -5.401938438415527, "global_step": 27598, "epoch": 657} {"train_loss": -5.375430583953857, "global_step": 27599, "epoch": 657} {"train_loss": -5.382848739624023, "global_step": 27600, "epoch": 657} {"train_loss": -5.569555282592773, "global_step": 27601, "epoch": 657} {"train_loss": -5.393092155456543, "global_step": 27602, "epoch": 657} {"train_loss": -5.445710182189941, "global_step": 27603, "epoch": 657} {"train_loss": -5.37310266494751, "global_step": 27604, "epoch": 657} {"train_loss": -5.367189407348633, "global_step": 27605, "epoch": 657} {"train_loss": -5.4837965965271, "global_step": 27606, "epoch": 657} {"train_loss": -5.385315895080566, "global_step": 27607, "epoch": 657} {"train_loss": -5.445162773132324, "global_step": 27608, "epoch": 657} {"train_loss": -5.527004241943359, "global_step": 27609, "epoch": 657} {"train_loss": -5.460177421569824, "global_step": 27610, "epoch": 657} {"train_loss": -5.4623517990112305, "global_step": 27611, "epoch": 657} {"train_loss": -5.5369720458984375, "global_step": 27612, "epoch": 657} {"train_loss": -5.527749061584473, "global_step": 27613, "epoch": 657} {"train_loss": -5.391079902648926, "global_step": 27614, "epoch": 657} {"train_loss": -5.456217288970947, "global_step": 27615, "epoch": 657} {"train_loss": -5.441405296325684, "global_step": 27616, "epoch": 657} {"train_loss": -5.501833915710449, "global_step": 27617, "epoch": 657} {"train_loss": -5.35066032409668, "global_step": 27618, "epoch": 657} {"train_loss": -5.608808517456055, "global_step": 27619, "epoch": 657} {"train_loss": -5.514187335968018, "global_step": 27620, "epoch": 657} {"train_loss": -5.443328857421875, "global_step": 27621, "epoch": 657} {"train_loss": -5.346627235412598, "global_step": 27622, "epoch": 657} {"train_loss": -5.397104740142822, "global_step": 27623, "epoch": 657} {"train_loss": -5.370800971984863, "global_step": 27624, "epoch": 657} {"train_loss": -5.474354267120361, "global_step": 27625, "epoch": 657} {"train_loss": -5.353904724121094, "global_step": 27626, "epoch": 657} {"train_loss": -5.593869686126709, "global_step": 27627, "epoch": 657} {"train_loss": -5.480161666870117, "global_step": 27628, "epoch": 657} {"train_loss": -5.3985090255737305, "global_step": 27629, "epoch": 657} {"train_loss": -5.403782367706299, "global_step": 27630, "epoch": 657} {"train_loss": -5.338503837585449, "global_step": 27631, "epoch": 657} {"train_loss": -5.478944778442383, "global_step": 27632, "epoch": 657} {"train_loss": -5.516571044921875, "global_step": 27633, "epoch": 657} {"train_loss": -5.48831844329834, "global_step": 27634, "epoch": 657} {"train_loss": -5.442576431092762, "global_step": 27635, "epoch": 657, "val_loss": 76221.8046875} {"train_loss": -5.371328353881836, "global_step": 27636, "epoch": 658} {"train_loss": -5.38887882232666, "global_step": 27637, "epoch": 658} {"train_loss": -5.621668815612793, "global_step": 27638, "epoch": 658} {"train_loss": -5.391000270843506, "global_step": 27639, "epoch": 658} {"train_loss": -5.388243675231934, "global_step": 27640, "epoch": 658} {"train_loss": -5.464444637298584, "global_step": 27641, "epoch": 658} {"train_loss": -5.524564743041992, "global_step": 27642, "epoch": 658} {"train_loss": -5.296599388122559, "global_step": 27643, "epoch": 658} {"train_loss": -5.419283866882324, "global_step": 27644, "epoch": 658} {"train_loss": -5.311314105987549, "global_step": 27645, "epoch": 658} {"train_loss": -5.2295637130737305, "global_step": 27646, "epoch": 658} {"train_loss": -5.536469459533691, "global_step": 27647, "epoch": 658} {"train_loss": -5.283258438110352, "global_step": 27648, "epoch": 658} {"train_loss": -5.110432147979736, "global_step": 27649, "epoch": 658} {"train_loss": -5.433048725128174, "global_step": 27650, "epoch": 658} {"train_loss": -5.526384353637695, "global_step": 27651, "epoch": 658} {"train_loss": -5.444162368774414, "global_step": 27652, "epoch": 658} {"train_loss": -5.526714324951172, "global_step": 27653, "epoch": 658} {"train_loss": -5.361445426940918, "global_step": 27654, "epoch": 658} {"train_loss": -5.438847064971924, "global_step": 27655, "epoch": 658} {"train_loss": -5.54784631729126, "global_step": 27656, "epoch": 658} {"train_loss": -5.448974609375, "global_step": 27657, "epoch": 658} {"train_loss": -5.417140960693359, "global_step": 27658, "epoch": 658} {"train_loss": -5.397007465362549, "global_step": 27659, "epoch": 658} {"train_loss": -5.438749313354492, "global_step": 27660, "epoch": 658} {"train_loss": -5.393548011779785, "global_step": 27661, "epoch": 658} {"train_loss": -5.311953544616699, "global_step": 27662, "epoch": 658} {"train_loss": -5.441536903381348, "global_step": 27663, "epoch": 658} {"train_loss": -5.477132797241211, "global_step": 27664, "epoch": 658} {"train_loss": -5.396291732788086, "global_step": 27665, "epoch": 658} {"train_loss": -5.482938766479492, "global_step": 27666, "epoch": 658} {"train_loss": -5.503081321716309, "global_step": 27667, "epoch": 658} {"train_loss": -5.448272228240967, "global_step": 27668, "epoch": 658} {"train_loss": -5.413933753967285, "global_step": 27669, "epoch": 658} {"train_loss": -5.271341323852539, "global_step": 27670, "epoch": 658} {"train_loss": -5.397202491760254, "global_step": 27671, "epoch": 658} {"train_loss": -5.451531410217285, "global_step": 27672, "epoch": 658} {"train_loss": -5.4179182052612305, "global_step": 27673, "epoch": 658} {"train_loss": -5.456280708312988, "global_step": 27674, "epoch": 658} {"train_loss": -5.304126739501953, "global_step": 27675, "epoch": 658} {"train_loss": -5.478021144866943, "global_step": 27676, "epoch": 658} {"train_loss": -5.41613507270813, "global_step": 27677, "epoch": 658, "val_loss": 75368.9453125} {"train_loss": -5.3109588623046875, "global_step": 27678, "epoch": 659} {"train_loss": -5.296018123626709, "global_step": 27679, "epoch": 659} {"train_loss": -5.494490623474121, "global_step": 27680, "epoch": 659} {"train_loss": -5.349725246429443, "global_step": 27681, "epoch": 659} {"train_loss": -5.429919242858887, "global_step": 27682, "epoch": 659} {"train_loss": -5.355070114135742, "global_step": 27683, "epoch": 659} {"train_loss": -5.4797515869140625, "global_step": 27684, "epoch": 659} {"train_loss": -5.516096115112305, "global_step": 27685, "epoch": 659} {"train_loss": -5.531591415405273, "global_step": 27686, "epoch": 659} {"train_loss": -5.549763202667236, "global_step": 27687, "epoch": 659} {"train_loss": -5.385089874267578, "global_step": 27688, "epoch": 659} {"train_loss": -5.405975341796875, "global_step": 27689, "epoch": 659} {"train_loss": -5.451796531677246, "global_step": 27690, "epoch": 659} {"train_loss": -5.552126407623291, "global_step": 27691, "epoch": 659} {"train_loss": -5.414199352264404, "global_step": 27692, "epoch": 659} {"train_loss": -5.391757488250732, "global_step": 27693, "epoch": 659} {"train_loss": -5.484718322753906, "global_step": 27694, "epoch": 659} {"train_loss": -5.300249099731445, "global_step": 27695, "epoch": 659} {"train_loss": -5.419013977050781, "global_step": 27696, "epoch": 659} {"train_loss": -5.376607894897461, "global_step": 27697, "epoch": 659} {"train_loss": -5.525959014892578, "global_step": 27698, "epoch": 659} {"train_loss": -5.596254348754883, "global_step": 27699, "epoch": 659} {"train_loss": -5.416009426116943, "global_step": 27700, "epoch": 659} {"train_loss": -5.437534809112549, "global_step": 27701, "epoch": 659} {"train_loss": -5.448512077331543, "global_step": 27702, "epoch": 659} {"train_loss": -5.413928985595703, "global_step": 27703, "epoch": 659} {"train_loss": -5.486825942993164, "global_step": 27704, "epoch": 659} {"train_loss": -5.480304718017578, "global_step": 27705, "epoch": 659} {"train_loss": -5.430450439453125, "global_step": 27706, "epoch": 659} {"train_loss": -5.367710113525391, "global_step": 27707, "epoch": 659} {"train_loss": -5.41123104095459, "global_step": 27708, "epoch": 659} {"train_loss": -5.427024841308594, "global_step": 27709, "epoch": 659} {"train_loss": -5.587230205535889, "global_step": 27710, "epoch": 659} {"train_loss": -5.395020484924316, "global_step": 27711, "epoch": 659} {"train_loss": -5.45119571685791, "global_step": 27712, "epoch": 659} {"train_loss": -5.409623146057129, "global_step": 27713, "epoch": 659} {"train_loss": -5.398305892944336, "global_step": 27714, "epoch": 659} {"train_loss": -5.479463577270508, "global_step": 27715, "epoch": 659} {"train_loss": -5.404562950134277, "global_step": 27716, "epoch": 659} {"train_loss": -5.388281345367432, "global_step": 27717, "epoch": 659} {"train_loss": -5.438420295715332, "global_step": 27718, "epoch": 659} {"train_loss": -5.437058664503551, "global_step": 27719, "epoch": 659, "val_loss": 76738.2265625} {"train_loss": -5.381274700164795, "global_step": 27720, "epoch": 660} {"train_loss": -5.40222692489624, "global_step": 27721, "epoch": 660} {"train_loss": -5.363064765930176, "global_step": 27722, "epoch": 660} {"train_loss": -5.460365295410156, "global_step": 27723, "epoch": 660} {"train_loss": -5.540199279785156, "global_step": 27724, "epoch": 660} {"train_loss": -5.286364555358887, "global_step": 27725, "epoch": 660} {"train_loss": -5.323790073394775, "global_step": 27726, "epoch": 660} {"train_loss": -5.38238525390625, "global_step": 27727, "epoch": 660} {"train_loss": -5.390935897827148, "global_step": 27728, "epoch": 660} {"train_loss": -5.436614990234375, "global_step": 27729, "epoch": 660} {"train_loss": -5.334277629852295, "global_step": 27730, "epoch": 660} {"train_loss": -5.306491374969482, "global_step": 27731, "epoch": 660} {"train_loss": -5.372610092163086, "global_step": 27732, "epoch": 660} {"train_loss": -5.235561370849609, "global_step": 27733, "epoch": 660} {"train_loss": -5.541804313659668, "global_step": 27734, "epoch": 660} {"train_loss": -5.450082302093506, "global_step": 27735, "epoch": 660} {"train_loss": -5.4031901359558105, "global_step": 27736, "epoch": 660} {"train_loss": -5.54090690612793, "global_step": 27737, "epoch": 660} {"train_loss": -5.673458099365234, "global_step": 27738, "epoch": 660} {"train_loss": -5.420383453369141, "global_step": 27739, "epoch": 660} {"train_loss": -5.503598213195801, "global_step": 27740, "epoch": 660} {"train_loss": -5.339491367340088, "global_step": 27741, "epoch": 660} {"train_loss": -5.531578540802002, "global_step": 27742, "epoch": 660} {"train_loss": -5.382691383361816, "global_step": 27743, "epoch": 660} {"train_loss": -5.412136554718018, "global_step": 27744, "epoch": 660} {"train_loss": -5.446709156036377, "global_step": 27745, "epoch": 660} {"train_loss": -5.474844932556152, "global_step": 27746, "epoch": 660} {"train_loss": -5.305547714233398, "global_step": 27747, "epoch": 660} {"train_loss": -5.321094512939453, "global_step": 27748, "epoch": 660} {"train_loss": -5.389225959777832, "global_step": 27749, "epoch": 660} {"train_loss": -5.178134918212891, "global_step": 27750, "epoch": 660} {"train_loss": -5.369861602783203, "global_step": 27751, "epoch": 660} {"train_loss": -5.468240737915039, "global_step": 27752, "epoch": 660} {"train_loss": -5.356273651123047, "global_step": 27753, "epoch": 660} {"train_loss": -5.429018974304199, "global_step": 27754, "epoch": 660} {"train_loss": -5.444713592529297, "global_step": 27755, "epoch": 660} {"train_loss": -5.445781707763672, "global_step": 27756, "epoch": 660} {"train_loss": -5.39721155166626, "global_step": 27757, "epoch": 660} {"train_loss": -5.3730010986328125, "global_step": 27758, "epoch": 660} {"train_loss": -5.49374532699585, "global_step": 27759, "epoch": 660} {"train_loss": -5.325009346008301, "global_step": 27760, "epoch": 660} {"train_loss": -5.407230320430937, "global_step": 27761, "epoch": 660, "val_loss": 75571.140625} {"train_loss": -5.421674728393555, "global_step": 27762, "epoch": 661} {"train_loss": -5.1737165451049805, "global_step": 27763, "epoch": 661} {"train_loss": -5.398616790771484, "global_step": 27764, "epoch": 661} {"train_loss": -5.435849666595459, "global_step": 27765, "epoch": 661} {"train_loss": -5.284015655517578, "global_step": 27766, "epoch": 661} {"train_loss": -5.477084159851074, "global_step": 27767, "epoch": 661} {"train_loss": -5.194971084594727, "global_step": 27768, "epoch": 661} {"train_loss": -5.455451011657715, "global_step": 27769, "epoch": 661} {"train_loss": -5.3273420333862305, "global_step": 27770, "epoch": 661} {"train_loss": -5.4003448486328125, "global_step": 27771, "epoch": 661} {"train_loss": -5.358431816101074, "global_step": 27772, "epoch": 661} {"train_loss": -5.212347030639648, "global_step": 27773, "epoch": 661} {"train_loss": -5.437490463256836, "global_step": 27774, "epoch": 661} {"train_loss": -5.23527717590332, "global_step": 27775, "epoch": 661} {"train_loss": -5.4327802658081055, "global_step": 27776, "epoch": 661} {"train_loss": -5.418865203857422, "global_step": 27777, "epoch": 661} {"train_loss": -5.457635879516602, "global_step": 27778, "epoch": 661} {"train_loss": -5.3108811378479, "global_step": 27779, "epoch": 661} {"train_loss": -5.4510722160339355, "global_step": 27780, "epoch": 661} {"train_loss": -5.391831398010254, "global_step": 27781, "epoch": 661} {"train_loss": -5.4063496589660645, "global_step": 27782, "epoch": 661} {"train_loss": -5.336232662200928, "global_step": 27783, "epoch": 661} {"train_loss": -5.343666076660156, "global_step": 27784, "epoch": 661} {"train_loss": -5.554594993591309, "global_step": 27785, "epoch": 661} {"train_loss": -5.4046630859375, "global_step": 27786, "epoch": 661} {"train_loss": -5.445610523223877, "global_step": 27787, "epoch": 661} {"train_loss": -5.4486613273620605, "global_step": 27788, "epoch": 661} {"train_loss": -5.381017684936523, "global_step": 27789, "epoch": 661} {"train_loss": -5.424291610717773, "global_step": 27790, "epoch": 661} {"train_loss": -5.495563983917236, "global_step": 27791, "epoch": 661} {"train_loss": -5.40883731842041, "global_step": 27792, "epoch": 661} {"train_loss": -5.358672142028809, "global_step": 27793, "epoch": 661} {"train_loss": -5.352424621582031, "global_step": 27794, "epoch": 661} {"train_loss": -5.404477119445801, "global_step": 27795, "epoch": 661} {"train_loss": -5.428622245788574, "global_step": 27796, "epoch": 661} {"train_loss": -5.617581367492676, "global_step": 27797, "epoch": 661} {"train_loss": -5.329471588134766, "global_step": 27798, "epoch": 661} {"train_loss": -5.363034248352051, "global_step": 27799, "epoch": 661} {"train_loss": -5.6178998947143555, "global_step": 27800, "epoch": 661} {"train_loss": -5.409578323364258, "global_step": 27801, "epoch": 661} {"train_loss": -5.498534679412842, "global_step": 27802, "epoch": 661} {"train_loss": -5.399378594898042, "global_step": 27803, "epoch": 661, "val_loss": 76079.09375} {"train_loss": -5.353579044342041, "global_step": 27804, "epoch": 662} {"train_loss": -5.439914703369141, "global_step": 27805, "epoch": 662} {"train_loss": -5.387632369995117, "global_step": 27806, "epoch": 662} {"train_loss": -5.422086238861084, "global_step": 27807, "epoch": 662} {"train_loss": -5.528985023498535, "global_step": 27808, "epoch": 662} {"train_loss": -5.4070725440979, "global_step": 27809, "epoch": 662} {"train_loss": -5.509467124938965, "global_step": 27810, "epoch": 662} {"train_loss": -5.46268892288208, "global_step": 27811, "epoch": 662} {"train_loss": -5.298043251037598, "global_step": 27812, "epoch": 662} {"train_loss": -5.374463081359863, "global_step": 27813, "epoch": 662} {"train_loss": -5.452812671661377, "global_step": 27814, "epoch": 662} {"train_loss": -5.388889312744141, "global_step": 27815, "epoch": 662} {"train_loss": -5.404998779296875, "global_step": 27816, "epoch": 662} {"train_loss": -5.454392433166504, "global_step": 27817, "epoch": 662} {"train_loss": -5.5526957511901855, "global_step": 27818, "epoch": 662} {"train_loss": -5.401517868041992, "global_step": 27819, "epoch": 662} {"train_loss": -5.61176872253418, "global_step": 27820, "epoch": 662} {"train_loss": -5.551268577575684, "global_step": 27821, "epoch": 662} {"train_loss": -5.422556400299072, "global_step": 27822, "epoch": 662} {"train_loss": -5.419195652008057, "global_step": 27823, "epoch": 662} {"train_loss": -5.511650085449219, "global_step": 27824, "epoch": 662} {"train_loss": -5.353336334228516, "global_step": 27825, "epoch": 662} {"train_loss": -5.375658988952637, "global_step": 27826, "epoch": 662} {"train_loss": -5.506550312042236, "global_step": 27827, "epoch": 662} {"train_loss": -5.325639724731445, "global_step": 27828, "epoch": 662} {"train_loss": -5.274827003479004, "global_step": 27829, "epoch": 662} {"train_loss": -5.40212345123291, "global_step": 27830, "epoch": 662} {"train_loss": -5.330970764160156, "global_step": 27831, "epoch": 662} {"train_loss": -5.471354961395264, "global_step": 27832, "epoch": 662} {"train_loss": -5.431029319763184, "global_step": 27833, "epoch": 662} {"train_loss": -5.454103469848633, "global_step": 27834, "epoch": 662} {"train_loss": -5.516160011291504, "global_step": 27835, "epoch": 662} {"train_loss": -5.285414218902588, "global_step": 27836, "epoch": 662} {"train_loss": -5.361167907714844, "global_step": 27837, "epoch": 662} {"train_loss": -5.406388759613037, "global_step": 27838, "epoch": 662} {"train_loss": -5.276364326477051, "global_step": 27839, "epoch": 662} {"train_loss": -5.329221725463867, "global_step": 27840, "epoch": 662} {"train_loss": -5.352695465087891, "global_step": 27841, "epoch": 662} {"train_loss": -5.622729301452637, "global_step": 27842, "epoch": 662} {"train_loss": -5.342432022094727, "global_step": 27843, "epoch": 662} {"train_loss": -5.4140625, "global_step": 27844, "epoch": 662} {"train_loss": -5.419316507521129, "global_step": 27845, "epoch": 662, "val_loss": 76494.2734375} {"train_loss": -5.3060126304626465, "global_step": 27846, "epoch": 663} {"train_loss": -5.351907253265381, "global_step": 27847, "epoch": 663} {"train_loss": -5.449462890625, "global_step": 27848, "epoch": 663} {"train_loss": -5.396702289581299, "global_step": 27849, "epoch": 663} {"train_loss": -5.475715160369873, "global_step": 27850, "epoch": 663} {"train_loss": -5.53331995010376, "global_step": 27851, "epoch": 663} {"train_loss": -5.470558166503906, "global_step": 27852, "epoch": 663} {"train_loss": -5.370882987976074, "global_step": 27853, "epoch": 663} {"train_loss": -5.359884262084961, "global_step": 27854, "epoch": 663} {"train_loss": -5.400803565979004, "global_step": 27855, "epoch": 663} {"train_loss": -5.4290452003479, "global_step": 27856, "epoch": 663} {"train_loss": -5.5866899490356445, "global_step": 27857, "epoch": 663} {"train_loss": -5.432441711425781, "global_step": 27858, "epoch": 663} {"train_loss": -5.500004768371582, "global_step": 27859, "epoch": 663} {"train_loss": -5.363644599914551, "global_step": 27860, "epoch": 663} {"train_loss": -5.408785343170166, "global_step": 27861, "epoch": 663} {"train_loss": -5.404725074768066, "global_step": 27862, "epoch": 663} {"train_loss": -5.42664098739624, "global_step": 27863, "epoch": 663} {"train_loss": -5.361788272857666, "global_step": 27864, "epoch": 663} {"train_loss": -5.299391746520996, "global_step": 27865, "epoch": 663} {"train_loss": -5.397791385650635, "global_step": 27866, "epoch": 663} {"train_loss": -5.459638595581055, "global_step": 27867, "epoch": 663} {"train_loss": -5.455147743225098, "global_step": 27868, "epoch": 663} {"train_loss": -5.415036201477051, "global_step": 27869, "epoch": 663} {"train_loss": -5.388949394226074, "global_step": 27870, "epoch": 663} {"train_loss": -5.494747161865234, "global_step": 27871, "epoch": 663} {"train_loss": -5.225602626800537, "global_step": 27872, "epoch": 663} {"train_loss": -5.3977813720703125, "global_step": 27873, "epoch": 663} {"train_loss": -5.331603050231934, "global_step": 27874, "epoch": 663} {"train_loss": -5.497781753540039, "global_step": 27875, "epoch": 663} {"train_loss": -5.322350025177002, "global_step": 27876, "epoch": 663} {"train_loss": -5.4020185470581055, "global_step": 27877, "epoch": 663} {"train_loss": -5.456435203552246, "global_step": 27878, "epoch": 663} {"train_loss": -5.335247993469238, "global_step": 27879, "epoch": 663} {"train_loss": -5.502621650695801, "global_step": 27880, "epoch": 663} {"train_loss": -5.454069137573242, "global_step": 27881, "epoch": 663} {"train_loss": -5.2960429191589355, "global_step": 27882, "epoch": 663} {"train_loss": -5.45423698425293, "global_step": 27883, "epoch": 663} {"train_loss": -5.2105865478515625, "global_step": 27884, "epoch": 663} {"train_loss": -5.40131950378418, "global_step": 27885, "epoch": 663} {"train_loss": -5.323541164398193, "global_step": 27886, "epoch": 663} {"train_loss": -5.400051764079502, "global_step": 27887, "epoch": 663, "val_loss": 75906.421875} {"train_loss": -5.420393943786621, "global_step": 27888, "epoch": 664} {"train_loss": -5.249256610870361, "global_step": 27889, "epoch": 664} {"train_loss": -5.361238479614258, "global_step": 27890, "epoch": 664} {"train_loss": -5.384429931640625, "global_step": 27891, "epoch": 664} {"train_loss": -5.436796188354492, "global_step": 27892, "epoch": 664} {"train_loss": -5.291614055633545, "global_step": 27893, "epoch": 664} {"train_loss": -5.435384750366211, "global_step": 27894, "epoch": 664} {"train_loss": -5.332351207733154, "global_step": 27895, "epoch": 664} {"train_loss": -5.3902435302734375, "global_step": 27896, "epoch": 664} {"train_loss": -5.538424968719482, "global_step": 27897, "epoch": 664} {"train_loss": -5.447399616241455, "global_step": 27898, "epoch": 664} {"train_loss": -5.487675666809082, "global_step": 27899, "epoch": 664} {"train_loss": -5.471600532531738, "global_step": 27900, "epoch": 664} {"train_loss": -5.410526752471924, "global_step": 27901, "epoch": 664} {"train_loss": -5.438068389892578, "global_step": 27902, "epoch": 664} {"train_loss": -5.373941898345947, "global_step": 27903, "epoch": 664} {"train_loss": -5.439071178436279, "global_step": 27904, "epoch": 664} {"train_loss": -5.49747896194458, "global_step": 27905, "epoch": 664} {"train_loss": -5.511598587036133, "global_step": 27906, "epoch": 664} {"train_loss": -5.289723873138428, "global_step": 27907, "epoch": 664} {"train_loss": -5.558187007904053, "global_step": 27908, "epoch": 664} {"train_loss": -5.484392166137695, "global_step": 27909, "epoch": 664} {"train_loss": -5.6728057861328125, "global_step": 27910, "epoch": 664} {"train_loss": -5.400331497192383, "global_step": 27911, "epoch": 664} {"train_loss": -5.459618091583252, "global_step": 27912, "epoch": 664} {"train_loss": -5.395520210266113, "global_step": 27913, "epoch": 664} {"train_loss": -5.43549919128418, "global_step": 27914, "epoch": 664} {"train_loss": -5.563913345336914, "global_step": 27915, "epoch": 664} {"train_loss": -5.371514320373535, "global_step": 27916, "epoch": 664} {"train_loss": -5.544524192810059, "global_step": 27917, "epoch": 664} {"train_loss": -5.377016067504883, "global_step": 27918, "epoch": 664} {"train_loss": -5.3931884765625, "global_step": 27919, "epoch": 664} {"train_loss": -5.543515205383301, "global_step": 27920, "epoch": 664} {"train_loss": -5.4309892654418945, "global_step": 27921, "epoch": 664} {"train_loss": -5.464743614196777, "global_step": 27922, "epoch": 664} {"train_loss": -5.3732709884643555, "global_step": 27923, "epoch": 664} {"train_loss": -5.32595682144165, "global_step": 27924, "epoch": 664} {"train_loss": -5.4519195556640625, "global_step": 27925, "epoch": 664} {"train_loss": -5.608257293701172, "global_step": 27926, "epoch": 664} {"train_loss": -5.434606552124023, "global_step": 27927, "epoch": 664} {"train_loss": -5.4938883781433105, "global_step": 27928, "epoch": 664} {"train_loss": -5.439812932695661, "global_step": 27929, "epoch": 664, "val_loss": 75271.359375} {"train_loss": -5.411087989807129, "global_step": 27930, "epoch": 665} {"train_loss": -5.583677291870117, "global_step": 27931, "epoch": 665} {"train_loss": -5.444417953491211, "global_step": 27932, "epoch": 665} {"train_loss": -5.4975786209106445, "global_step": 27933, "epoch": 665} {"train_loss": -5.461509704589844, "global_step": 27934, "epoch": 665} {"train_loss": -5.3473896980285645, "global_step": 27935, "epoch": 665} {"train_loss": -5.456266403198242, "global_step": 27936, "epoch": 665} {"train_loss": -5.509918689727783, "global_step": 27937, "epoch": 665} {"train_loss": -5.446517467498779, "global_step": 27938, "epoch": 665} {"train_loss": -5.561846733093262, "global_step": 27939, "epoch": 665} {"train_loss": -5.497996807098389, "global_step": 27940, "epoch": 665} {"train_loss": -5.54098653793335, "global_step": 27941, "epoch": 665} {"train_loss": -5.429914474487305, "global_step": 27942, "epoch": 665} {"train_loss": -5.633996963500977, "global_step": 27943, "epoch": 665} {"train_loss": -5.4680070877075195, "global_step": 27944, "epoch": 665} {"train_loss": -5.363884925842285, "global_step": 27945, "epoch": 665} {"train_loss": -5.46348762512207, "global_step": 27946, "epoch": 665} {"train_loss": -5.476775169372559, "global_step": 27947, "epoch": 665} {"train_loss": -5.457868576049805, "global_step": 27948, "epoch": 665} {"train_loss": -5.33380126953125, "global_step": 27949, "epoch": 665} {"train_loss": -5.447061061859131, "global_step": 27950, "epoch": 665} {"train_loss": -5.395628452301025, "global_step": 27951, "epoch": 665} {"train_loss": -5.479740142822266, "global_step": 27952, "epoch": 665} {"train_loss": -5.369348049163818, "global_step": 27953, "epoch": 665} {"train_loss": -5.41445255279541, "global_step": 27954, "epoch": 665} {"train_loss": -5.326688766479492, "global_step": 27955, "epoch": 665} {"train_loss": -5.446684837341309, "global_step": 27956, "epoch": 665} {"train_loss": -5.3927202224731445, "global_step": 27957, "epoch": 665} {"train_loss": -5.5072021484375, "global_step": 27958, "epoch": 665} {"train_loss": -5.35236930847168, "global_step": 27959, "epoch": 665} {"train_loss": -5.492072105407715, "global_step": 27960, "epoch": 665} {"train_loss": -5.462119102478027, "global_step": 27961, "epoch": 665} {"train_loss": -5.401938438415527, "global_step": 27962, "epoch": 665} {"train_loss": -5.479589462280273, "global_step": 27963, "epoch": 665} {"train_loss": -5.436245918273926, "global_step": 27964, "epoch": 665} {"train_loss": -5.411476135253906, "global_step": 27965, "epoch": 665} {"train_loss": -5.409069061279297, "global_step": 27966, "epoch": 665} {"train_loss": -5.388406753540039, "global_step": 27967, "epoch": 665} {"train_loss": -5.393953323364258, "global_step": 27968, "epoch": 665} {"train_loss": -5.4074931144714355, "global_step": 27969, "epoch": 665} {"train_loss": -5.354032516479492, "global_step": 27970, "epoch": 665} {"train_loss": -5.444535107839675, "global_step": 27971, "epoch": 665, "val_loss": 75582.4765625} {"train_loss": -5.278425216674805, "global_step": 27972, "epoch": 666} {"train_loss": -5.211071014404297, "global_step": 27973, "epoch": 666} {"train_loss": -5.4020280838012695, "global_step": 27974, "epoch": 666} {"train_loss": -5.324535846710205, "global_step": 27975, "epoch": 666} {"train_loss": -5.457347869873047, "global_step": 27976, "epoch": 666} {"train_loss": -5.420492172241211, "global_step": 27977, "epoch": 666} {"train_loss": -5.444897174835205, "global_step": 27978, "epoch": 666} {"train_loss": -5.375223159790039, "global_step": 27979, "epoch": 666} {"train_loss": -5.467320442199707, "global_step": 27980, "epoch": 666} {"train_loss": -5.36676025390625, "global_step": 27981, "epoch": 666} {"train_loss": -5.459411144256592, "global_step": 27982, "epoch": 666} {"train_loss": -5.350932598114014, "global_step": 27983, "epoch": 666} {"train_loss": -5.4376444816589355, "global_step": 27984, "epoch": 666} {"train_loss": -5.36851692199707, "global_step": 27985, "epoch": 666} {"train_loss": -5.436081886291504, "global_step": 27986, "epoch": 666} {"train_loss": -5.540777206420898, "global_step": 27987, "epoch": 666} {"train_loss": -5.331488609313965, "global_step": 27988, "epoch": 666} {"train_loss": -5.294508934020996, "global_step": 27989, "epoch": 666} {"train_loss": -5.397463798522949, "global_step": 27990, "epoch": 666} {"train_loss": -5.422540664672852, "global_step": 27991, "epoch": 666} {"train_loss": -5.402604103088379, "global_step": 27992, "epoch": 666} {"train_loss": -5.438694000244141, "global_step": 27993, "epoch": 666} {"train_loss": -5.511160850524902, "global_step": 27994, "epoch": 666} {"train_loss": -5.3914361000061035, "global_step": 27995, "epoch": 666} {"train_loss": -5.533646583557129, "global_step": 27996, "epoch": 666} {"train_loss": -5.4095683097839355, "global_step": 27997, "epoch": 666} {"train_loss": -5.471158981323242, "global_step": 27998, "epoch": 666} {"train_loss": -5.455387115478516, "global_step": 27999, "epoch": 666} {"train_loss": -5.328216075897217, "global_step": 28000, "epoch": 666} {"train_loss": -5.437756061553955, "global_step": 28001, "epoch": 666} {"train_loss": -5.591678619384766, "global_step": 28002, "epoch": 666} {"train_loss": -5.49266242980957, "global_step": 28003, "epoch": 666} {"train_loss": -5.537845611572266, "global_step": 28004, "epoch": 666} {"train_loss": -5.555327415466309, "global_step": 28005, "epoch": 666} {"train_loss": -5.40384578704834, "global_step": 28006, "epoch": 666} {"train_loss": -5.572511196136475, "global_step": 28007, "epoch": 666} {"train_loss": -5.297515869140625, "global_step": 28008, "epoch": 666} {"train_loss": -5.4374799728393555, "global_step": 28009, "epoch": 666} {"train_loss": -5.425754547119141, "global_step": 28010, "epoch": 666} {"train_loss": -5.382458686828613, "global_step": 28011, "epoch": 666} {"train_loss": -5.525362014770508, "global_step": 28012, "epoch": 666} {"train_loss": -5.421557301566715, "global_step": 28013, "epoch": 666, "val_loss": 76086.0625} {"train_loss": -5.451298713684082, "global_step": 28014, "epoch": 667} {"train_loss": -5.450088024139404, "global_step": 28015, "epoch": 667} {"train_loss": -5.463280200958252, "global_step": 28016, "epoch": 667} {"train_loss": -5.418594837188721, "global_step": 28017, "epoch": 667} {"train_loss": -5.450558185577393, "global_step": 28018, "epoch": 667} {"train_loss": -5.499795913696289, "global_step": 28019, "epoch": 667} {"train_loss": -5.3913984298706055, "global_step": 28020, "epoch": 667} {"train_loss": -5.567902565002441, "global_step": 28021, "epoch": 667} {"train_loss": -5.4974470138549805, "global_step": 28022, "epoch": 667} {"train_loss": -5.516558647155762, "global_step": 28023, "epoch": 667} {"train_loss": -5.2959747314453125, "global_step": 28024, "epoch": 667} {"train_loss": -5.390281677246094, "global_step": 28025, "epoch": 667} {"train_loss": -5.390031337738037, "global_step": 28026, "epoch": 667} {"train_loss": -5.416628837585449, "global_step": 28027, "epoch": 667} {"train_loss": -5.560786247253418, "global_step": 28028, "epoch": 667} {"train_loss": -5.499349594116211, "global_step": 28029, "epoch": 667} {"train_loss": -5.421573638916016, "global_step": 28030, "epoch": 667} {"train_loss": -5.496869087219238, "global_step": 28031, "epoch": 667} {"train_loss": -5.5171918869018555, "global_step": 28032, "epoch": 667} {"train_loss": -5.463343620300293, "global_step": 28033, "epoch": 667} {"train_loss": -5.50126314163208, "global_step": 28034, "epoch": 667} {"train_loss": -5.454595565795898, "global_step": 28035, "epoch": 667} {"train_loss": -5.414168357849121, "global_step": 28036, "epoch": 667} {"train_loss": -5.4233012199401855, "global_step": 28037, "epoch": 667} {"train_loss": -5.470602989196777, "global_step": 28038, "epoch": 667} {"train_loss": -5.375971794128418, "global_step": 28039, "epoch": 667} {"train_loss": -5.547619819641113, "global_step": 28040, "epoch": 667} {"train_loss": -5.536778450012207, "global_step": 28041, "epoch": 667} {"train_loss": -5.426821708679199, "global_step": 28042, "epoch": 667} {"train_loss": -5.399264335632324, "global_step": 28043, "epoch": 667} {"train_loss": -5.3853302001953125, "global_step": 28044, "epoch": 667} {"train_loss": -5.3032331466674805, "global_step": 28045, "epoch": 667} {"train_loss": -5.38153600692749, "global_step": 28046, "epoch": 667} {"train_loss": -5.259049892425537, "global_step": 28047, "epoch": 667} {"train_loss": -5.229984283447266, "global_step": 28048, "epoch": 667} {"train_loss": -5.358361721038818, "global_step": 28049, "epoch": 667} {"train_loss": -5.504756927490234, "global_step": 28050, "epoch": 667} {"train_loss": -5.328982830047607, "global_step": 28051, "epoch": 667} {"train_loss": -5.557984352111816, "global_step": 28052, "epoch": 667} {"train_loss": -5.562105655670166, "global_step": 28053, "epoch": 667} {"train_loss": -5.464046478271484, "global_step": 28054, "epoch": 667} {"train_loss": -5.439792848768688, "global_step": 28055, "epoch": 667, "val_loss": 75147.359375} {"train_loss": -5.30368709564209, "global_step": 28056, "epoch": 668} {"train_loss": -5.52970027923584, "global_step": 28057, "epoch": 668} {"train_loss": -5.531692028045654, "global_step": 28058, "epoch": 668} {"train_loss": -5.362530708312988, "global_step": 28059, "epoch": 668} {"train_loss": -5.377799034118652, "global_step": 28060, "epoch": 668} {"train_loss": -5.500685214996338, "global_step": 28061, "epoch": 668} {"train_loss": -5.494272232055664, "global_step": 28062, "epoch": 668} {"train_loss": -5.393474102020264, "global_step": 28063, "epoch": 668} {"train_loss": -5.467891693115234, "global_step": 28064, "epoch": 668} {"train_loss": -5.4578351974487305, "global_step": 28065, "epoch": 668} {"train_loss": -5.357151031494141, "global_step": 28066, "epoch": 668} {"train_loss": -5.4983110427856445, "global_step": 28067, "epoch": 668} {"train_loss": -5.550031661987305, "global_step": 28068, "epoch": 668} {"train_loss": -5.53681755065918, "global_step": 28069, "epoch": 668} {"train_loss": -5.422708511352539, "global_step": 28070, "epoch": 668} {"train_loss": -5.431423187255859, "global_step": 28071, "epoch": 668} {"train_loss": -5.555534839630127, "global_step": 28072, "epoch": 668} {"train_loss": -5.466938018798828, "global_step": 28073, "epoch": 668} {"train_loss": -5.384762287139893, "global_step": 28074, "epoch": 668} {"train_loss": -5.514168739318848, "global_step": 28075, "epoch": 668} {"train_loss": -5.463817119598389, "global_step": 28076, "epoch": 668} {"train_loss": -5.5236639976501465, "global_step": 28077, "epoch": 668} {"train_loss": -5.337574481964111, "global_step": 28078, "epoch": 668} {"train_loss": -5.405434608459473, "global_step": 28079, "epoch": 668} {"train_loss": -5.324798107147217, "global_step": 28080, "epoch": 668} {"train_loss": -5.336441993713379, "global_step": 28081, "epoch": 668} {"train_loss": -5.431109428405762, "global_step": 28082, "epoch": 668} {"train_loss": -5.419604301452637, "global_step": 28083, "epoch": 668} {"train_loss": -5.398466110229492, "global_step": 28084, "epoch": 668} {"train_loss": -5.3987956047058105, "global_step": 28085, "epoch": 668} {"train_loss": -5.410328388214111, "global_step": 28086, "epoch": 668} {"train_loss": -5.423640727996826, "global_step": 28087, "epoch": 668} {"train_loss": -5.381172180175781, "global_step": 28088, "epoch": 668} {"train_loss": -5.344326972961426, "global_step": 28089, "epoch": 668} {"train_loss": -5.247371673583984, "global_step": 28090, "epoch": 668} {"train_loss": -5.415359020233154, "global_step": 28091, "epoch": 668} {"train_loss": -5.494027614593506, "global_step": 28092, "epoch": 668} {"train_loss": -5.343937873840332, "global_step": 28093, "epoch": 668} {"train_loss": -5.52758264541626, "global_step": 28094, "epoch": 668} {"train_loss": -5.36670446395874, "global_step": 28095, "epoch": 668} {"train_loss": -5.493192672729492, "global_step": 28096, "epoch": 668} {"train_loss": -5.428483100164504, "global_step": 28097, "epoch": 668, "val_loss": 76040.8046875} {"train_loss": -5.327762603759766, "global_step": 28098, "epoch": 669} {"train_loss": -5.488711357116699, "global_step": 28099, "epoch": 669} {"train_loss": -5.369744300842285, "global_step": 28100, "epoch": 669} {"train_loss": -5.418541431427002, "global_step": 28101, "epoch": 669} {"train_loss": -5.434261322021484, "global_step": 28102, "epoch": 669} {"train_loss": -5.344066619873047, "global_step": 28103, "epoch": 669} {"train_loss": -5.374882221221924, "global_step": 28104, "epoch": 669} {"train_loss": -5.371209621429443, "global_step": 28105, "epoch": 669} {"train_loss": -5.575300216674805, "global_step": 28106, "epoch": 669} {"train_loss": -5.458345413208008, "global_step": 28107, "epoch": 669} {"train_loss": -5.274256706237793, "global_step": 28108, "epoch": 669} {"train_loss": -5.545738220214844, "global_step": 28109, "epoch": 669} {"train_loss": -5.343347549438477, "global_step": 28110, "epoch": 669} {"train_loss": -5.473754405975342, "global_step": 28111, "epoch": 669} {"train_loss": -5.494813442230225, "global_step": 28112, "epoch": 669} {"train_loss": -5.487570285797119, "global_step": 28113, "epoch": 669} {"train_loss": -5.4686150550842285, "global_step": 28114, "epoch": 669} {"train_loss": -5.590125560760498, "global_step": 28115, "epoch": 669} {"train_loss": -5.432065010070801, "global_step": 28116, "epoch": 669} {"train_loss": -5.43199348449707, "global_step": 28117, "epoch": 669} {"train_loss": -5.532613754272461, "global_step": 28118, "epoch": 669} {"train_loss": -5.404851913452148, "global_step": 28119, "epoch": 669} {"train_loss": -5.456936836242676, "global_step": 28120, "epoch": 669} {"train_loss": -5.434217929840088, "global_step": 28121, "epoch": 669} {"train_loss": -5.39469575881958, "global_step": 28122, "epoch": 669} {"train_loss": -5.436397552490234, "global_step": 28123, "epoch": 669} {"train_loss": -5.537958145141602, "global_step": 28124, "epoch": 669} {"train_loss": -5.447324752807617, "global_step": 28125, "epoch": 669} {"train_loss": -5.498621940612793, "global_step": 28126, "epoch": 669} {"train_loss": -5.434637069702148, "global_step": 28127, "epoch": 669} {"train_loss": -5.353884220123291, "global_step": 28128, "epoch": 669} {"train_loss": -5.37435245513916, "global_step": 28129, "epoch": 669} {"train_loss": -5.5508880615234375, "global_step": 28130, "epoch": 669} {"train_loss": -5.157118320465088, "global_step": 28131, "epoch": 669} {"train_loss": -5.4350385665893555, "global_step": 28132, "epoch": 669} {"train_loss": -5.392658710479736, "global_step": 28133, "epoch": 669} {"train_loss": -5.403815746307373, "global_step": 28134, "epoch": 669} {"train_loss": -5.590255260467529, "global_step": 28135, "epoch": 669} {"train_loss": -5.354915618896484, "global_step": 28136, "epoch": 669} {"train_loss": -5.413949012756348, "global_step": 28137, "epoch": 669} {"train_loss": -5.484921932220459, "global_step": 28138, "epoch": 669} {"train_loss": -5.431802102497646, "global_step": 28139, "epoch": 669, "val_loss": 75756.46875} {"train_loss": -5.355056285858154, "global_step": 28140, "epoch": 670} {"train_loss": -5.250977516174316, "global_step": 28141, "epoch": 670} {"train_loss": -5.381715774536133, "global_step": 28142, "epoch": 670} {"train_loss": -5.3766350746154785, "global_step": 28143, "epoch": 670} {"train_loss": -5.289913177490234, "global_step": 28144, "epoch": 670} {"train_loss": -5.243293762207031, "global_step": 28145, "epoch": 670} {"train_loss": -5.281070232391357, "global_step": 28146, "epoch": 670} {"train_loss": -5.495777606964111, "global_step": 28147, "epoch": 670} {"train_loss": -5.394735336303711, "global_step": 28148, "epoch": 670} {"train_loss": -5.380168914794922, "global_step": 28149, "epoch": 670} {"train_loss": -5.405360221862793, "global_step": 28150, "epoch": 670} {"train_loss": -5.389395236968994, "global_step": 28151, "epoch": 670} {"train_loss": -5.342000961303711, "global_step": 28152, "epoch": 670} {"train_loss": -5.382638931274414, "global_step": 28153, "epoch": 670} {"train_loss": -5.367517948150635, "global_step": 28154, "epoch": 670} {"train_loss": -5.404916763305664, "global_step": 28155, "epoch": 670} {"train_loss": -5.421015739440918, "global_step": 28156, "epoch": 670} {"train_loss": -5.358497619628906, "global_step": 28157, "epoch": 670} {"train_loss": -5.459006309509277, "global_step": 28158, "epoch": 670} {"train_loss": -5.439365386962891, "global_step": 28159, "epoch": 670} {"train_loss": -5.528487205505371, "global_step": 28160, "epoch": 670} {"train_loss": -5.460917949676514, "global_step": 28161, "epoch": 670} {"train_loss": -5.504907608032227, "global_step": 28162, "epoch": 670} {"train_loss": -5.384575843811035, "global_step": 28163, "epoch": 670} {"train_loss": -5.3397955894470215, "global_step": 28164, "epoch": 670} {"train_loss": -5.433550834655762, "global_step": 28165, "epoch": 670} {"train_loss": -5.415866851806641, "global_step": 28166, "epoch": 670} {"train_loss": -5.390322685241699, "global_step": 28167, "epoch": 670} {"train_loss": -5.460145950317383, "global_step": 28168, "epoch": 670} {"train_loss": -5.445554256439209, "global_step": 28169, "epoch": 670} {"train_loss": -5.5009613037109375, "global_step": 28170, "epoch": 670} {"train_loss": -5.468608856201172, "global_step": 28171, "epoch": 670} {"train_loss": -5.274162292480469, "global_step": 28172, "epoch": 670} {"train_loss": -5.648060321807861, "global_step": 28173, "epoch": 670} {"train_loss": -5.44917106628418, "global_step": 28174, "epoch": 670} {"train_loss": -5.487833023071289, "global_step": 28175, "epoch": 670} {"train_loss": -5.46559476852417, "global_step": 28176, "epoch": 670} {"train_loss": -5.381731986999512, "global_step": 28177, "epoch": 670} {"train_loss": -5.459413528442383, "global_step": 28178, "epoch": 670} {"train_loss": -5.562255859375, "global_step": 28179, "epoch": 670} {"train_loss": -5.523736953735352, "global_step": 28180, "epoch": 670} {"train_loss": -5.416989281063988, "global_step": 28181, "epoch": 670, "val_loss": 75184.46875} {"train_loss": -5.484192371368408, "global_step": 28182, "epoch": 671} {"train_loss": -5.462069034576416, "global_step": 28183, "epoch": 671} {"train_loss": -5.546098709106445, "global_step": 28184, "epoch": 671} {"train_loss": -5.51384162902832, "global_step": 28185, "epoch": 671} {"train_loss": -5.4854888916015625, "global_step": 28186, "epoch": 671} {"train_loss": -5.34954833984375, "global_step": 28187, "epoch": 671} {"train_loss": -5.432682037353516, "global_step": 28188, "epoch": 671} {"train_loss": -5.5047197341918945, "global_step": 28189, "epoch": 671} {"train_loss": -5.506026268005371, "global_step": 28190, "epoch": 671} {"train_loss": -5.455158710479736, "global_step": 28191, "epoch": 671} {"train_loss": -5.511220932006836, "global_step": 28192, "epoch": 671} {"train_loss": -5.496672630310059, "global_step": 28193, "epoch": 671} {"train_loss": -5.39219856262207, "global_step": 28194, "epoch": 671} {"train_loss": -5.4839935302734375, "global_step": 28195, "epoch": 671} {"train_loss": -5.46907901763916, "global_step": 28196, "epoch": 671} {"train_loss": -5.47482442855835, "global_step": 28197, "epoch": 671} {"train_loss": -5.447882175445557, "global_step": 28198, "epoch": 671} {"train_loss": -5.444458484649658, "global_step": 28199, "epoch": 671} {"train_loss": -5.5298285484313965, "global_step": 28200, "epoch": 671} {"train_loss": -5.485100269317627, "global_step": 28201, "epoch": 671} {"train_loss": -5.45152473449707, "global_step": 28202, "epoch": 671} {"train_loss": -5.439794540405273, "global_step": 28203, "epoch": 671} {"train_loss": -5.497766017913818, "global_step": 28204, "epoch": 671} {"train_loss": -5.405510902404785, "global_step": 28205, "epoch": 671} {"train_loss": -5.394360542297363, "global_step": 28206, "epoch": 671} {"train_loss": -5.531968116760254, "global_step": 28207, "epoch": 671} {"train_loss": -5.460908889770508, "global_step": 28208, "epoch": 671} {"train_loss": -5.411203384399414, "global_step": 28209, "epoch": 671} {"train_loss": -5.503557205200195, "global_step": 28210, "epoch": 671} {"train_loss": -5.509802341461182, "global_step": 28211, "epoch": 671} {"train_loss": -5.498027801513672, "global_step": 28212, "epoch": 671} {"train_loss": -5.416090965270996, "global_step": 28213, "epoch": 671} {"train_loss": -5.427373886108398, "global_step": 28214, "epoch": 671} {"train_loss": -5.30772066116333, "global_step": 28215, "epoch": 671} {"train_loss": -5.435755252838135, "global_step": 28216, "epoch": 671} {"train_loss": -5.280671119689941, "global_step": 28217, "epoch": 671} {"train_loss": -5.475126266479492, "global_step": 28218, "epoch": 671} {"train_loss": -5.356511116027832, "global_step": 28219, "epoch": 671} {"train_loss": -5.469483375549316, "global_step": 28220, "epoch": 671} {"train_loss": -5.349608421325684, "global_step": 28221, "epoch": 671} {"train_loss": -5.434324264526367, "global_step": 28222, "epoch": 671} {"train_loss": -5.451733430226644, "global_step": 28223, "epoch": 671, "val_loss": 75497.734375} {"train_loss": -5.406174182891846, "global_step": 28224, "epoch": 672} {"train_loss": -5.275949954986572, "global_step": 28225, "epoch": 672} {"train_loss": -5.326915264129639, "global_step": 28226, "epoch": 672} {"train_loss": -5.2999587059021, "global_step": 28227, "epoch": 672} {"train_loss": -5.30516242980957, "global_step": 28228, "epoch": 672} {"train_loss": -5.194718360900879, "global_step": 28229, "epoch": 672} {"train_loss": -5.275054454803467, "global_step": 28230, "epoch": 672} {"train_loss": -5.330252170562744, "global_step": 28231, "epoch": 672} {"train_loss": -5.12074089050293, "global_step": 28232, "epoch": 672} {"train_loss": -5.352289199829102, "global_step": 28233, "epoch": 672} {"train_loss": -5.361522674560547, "global_step": 28234, "epoch": 672} {"train_loss": -5.438976287841797, "global_step": 28235, "epoch": 672} {"train_loss": -5.295777797698975, "global_step": 28236, "epoch": 672} {"train_loss": -5.381870269775391, "global_step": 28237, "epoch": 672} {"train_loss": -5.3382086753845215, "global_step": 28238, "epoch": 672} {"train_loss": -5.508833408355713, "global_step": 28239, "epoch": 672} {"train_loss": -5.41128396987915, "global_step": 28240, "epoch": 672} {"train_loss": -5.406634330749512, "global_step": 28241, "epoch": 672} {"train_loss": -5.495348930358887, "global_step": 28242, "epoch": 672} {"train_loss": -5.413732051849365, "global_step": 28243, "epoch": 672} {"train_loss": -5.401791095733643, "global_step": 28244, "epoch": 672} {"train_loss": -5.425530433654785, "global_step": 28245, "epoch": 672} {"train_loss": -5.477975845336914, "global_step": 28246, "epoch": 672} {"train_loss": -5.4744343757629395, "global_step": 28247, "epoch": 672} {"train_loss": -5.619308948516846, "global_step": 28248, "epoch": 672} {"train_loss": -5.4893670082092285, "global_step": 28249, "epoch": 672} {"train_loss": -5.40798807144165, "global_step": 28250, "epoch": 672} {"train_loss": -5.559081077575684, "global_step": 28251, "epoch": 672} {"train_loss": -5.403254508972168, "global_step": 28252, "epoch": 672} {"train_loss": -5.360173225402832, "global_step": 28253, "epoch": 672} {"train_loss": -5.441179275512695, "global_step": 28254, "epoch": 672} {"train_loss": -5.52942419052124, "global_step": 28255, "epoch": 672} {"train_loss": -5.316546440124512, "global_step": 28256, "epoch": 672} {"train_loss": -5.541012287139893, "global_step": 28257, "epoch": 672} {"train_loss": -5.367680549621582, "global_step": 28258, "epoch": 672} {"train_loss": -5.369687080383301, "global_step": 28259, "epoch": 672} {"train_loss": -5.375783920288086, "global_step": 28260, "epoch": 672} {"train_loss": -5.5152459144592285, "global_step": 28261, "epoch": 672} {"train_loss": -5.446840286254883, "global_step": 28262, "epoch": 672} {"train_loss": -5.463970184326172, "global_step": 28263, "epoch": 672} {"train_loss": -5.407864093780518, "global_step": 28264, "epoch": 672} {"train_loss": -5.39868670418149, "global_step": 28265, "epoch": 672, "val_loss": 75800.3125} {"train_loss": -5.2948408126831055, "global_step": 28266, "epoch": 673} {"train_loss": -5.44719123840332, "global_step": 28267, "epoch": 673} {"train_loss": -5.385629653930664, "global_step": 28268, "epoch": 673} {"train_loss": -5.46686315536499, "global_step": 28269, "epoch": 673} {"train_loss": -5.447246551513672, "global_step": 28270, "epoch": 673} {"train_loss": -5.6638898849487305, "global_step": 28271, "epoch": 673} {"train_loss": -5.598582744598389, "global_step": 28272, "epoch": 673} {"train_loss": -5.489009380340576, "global_step": 28273, "epoch": 673} {"train_loss": -5.57086181640625, "global_step": 28274, "epoch": 673} {"train_loss": -5.4725141525268555, "global_step": 28275, "epoch": 673} {"train_loss": -5.4352264404296875, "global_step": 28276, "epoch": 673} {"train_loss": -5.364396095275879, "global_step": 28277, "epoch": 673} {"train_loss": -5.5256805419921875, "global_step": 28278, "epoch": 673} {"train_loss": -5.4936676025390625, "global_step": 28279, "epoch": 673} {"train_loss": -5.465615749359131, "global_step": 28280, "epoch": 673} {"train_loss": -5.566561698913574, "global_step": 28281, "epoch": 673} {"train_loss": -5.390553951263428, "global_step": 28282, "epoch": 673} {"train_loss": -5.39005184173584, "global_step": 28283, "epoch": 673} {"train_loss": -5.410935401916504, "global_step": 28284, "epoch": 673} {"train_loss": -5.441562175750732, "global_step": 28285, "epoch": 673} {"train_loss": -5.451132774353027, "global_step": 28286, "epoch": 673} {"train_loss": -5.528397083282471, "global_step": 28287, "epoch": 673} {"train_loss": -5.317864894866943, "global_step": 28288, "epoch": 673} {"train_loss": -5.438627243041992, "global_step": 28289, "epoch": 673} {"train_loss": -5.362640380859375, "global_step": 28290, "epoch": 673} {"train_loss": -5.326857566833496, "global_step": 28291, "epoch": 673} {"train_loss": -5.433602333068848, "global_step": 28292, "epoch": 673} {"train_loss": -5.4591803550720215, "global_step": 28293, "epoch": 673} {"train_loss": -5.3453826904296875, "global_step": 28294, "epoch": 673} {"train_loss": -5.471107482910156, "global_step": 28295, "epoch": 673} {"train_loss": -5.383681774139404, "global_step": 28296, "epoch": 673} {"train_loss": -5.519299030303955, "global_step": 28297, "epoch": 673} {"train_loss": -5.427785396575928, "global_step": 28298, "epoch": 673} {"train_loss": -5.455221652984619, "global_step": 28299, "epoch": 673} {"train_loss": -5.478386878967285, "global_step": 28300, "epoch": 673} {"train_loss": -5.497585773468018, "global_step": 28301, "epoch": 673} {"train_loss": -5.386909484863281, "global_step": 28302, "epoch": 673} {"train_loss": -5.472016334533691, "global_step": 28303, "epoch": 673} {"train_loss": -5.343881607055664, "global_step": 28304, "epoch": 673} {"train_loss": -5.29533576965332, "global_step": 28305, "epoch": 673} {"train_loss": -5.373505592346191, "global_step": 28306, "epoch": 673} {"train_loss": -5.4378568558465865, "global_step": 28307, "epoch": 673, "val_loss": 75896.25} {"train_loss": -5.341338157653809, "global_step": 28308, "epoch": 674} {"train_loss": -5.400505065917969, "global_step": 28309, "epoch": 674} {"train_loss": -5.4181108474731445, "global_step": 28310, "epoch": 674} {"train_loss": -5.399588584899902, "global_step": 28311, "epoch": 674} {"train_loss": -5.313984394073486, "global_step": 28312, "epoch": 674} {"train_loss": -5.513886451721191, "global_step": 28313, "epoch": 674} {"train_loss": -5.370661735534668, "global_step": 28314, "epoch": 674} {"train_loss": -5.480348110198975, "global_step": 28315, "epoch": 674} {"train_loss": -5.564888000488281, "global_step": 28316, "epoch": 674} {"train_loss": -5.438159942626953, "global_step": 28317, "epoch": 674} {"train_loss": -5.436529159545898, "global_step": 28318, "epoch": 674} {"train_loss": -5.299993991851807, "global_step": 28319, "epoch": 674} {"train_loss": -5.423445224761963, "global_step": 28320, "epoch": 674} {"train_loss": -5.491053581237793, "global_step": 28321, "epoch": 674} {"train_loss": -5.281100273132324, "global_step": 28322, "epoch": 674} {"train_loss": -5.372515678405762, "global_step": 28323, "epoch": 674} {"train_loss": -5.285465240478516, "global_step": 28324, "epoch": 674} {"train_loss": -5.515590667724609, "global_step": 28325, "epoch": 674} {"train_loss": -5.436801910400391, "global_step": 28326, "epoch": 674} {"train_loss": -5.380376815795898, "global_step": 28327, "epoch": 674} {"train_loss": -5.3026628494262695, "global_step": 28328, "epoch": 674} {"train_loss": -5.498922824859619, "global_step": 28329, "epoch": 674} {"train_loss": -5.454983711242676, "global_step": 28330, "epoch": 674} {"train_loss": -5.397284984588623, "global_step": 28331, "epoch": 674} {"train_loss": -5.487659454345703, "global_step": 28332, "epoch": 674} {"train_loss": -5.35276985168457, "global_step": 28333, "epoch": 674} {"train_loss": -5.468301773071289, "global_step": 28334, "epoch": 674} {"train_loss": -5.4952592849731445, "global_step": 28335, "epoch": 674} {"train_loss": -5.4132513999938965, "global_step": 28336, "epoch": 674} {"train_loss": -5.496123790740967, "global_step": 28337, "epoch": 674} {"train_loss": -5.587247848510742, "global_step": 28338, "epoch": 674} {"train_loss": -5.474641799926758, "global_step": 28339, "epoch": 674} {"train_loss": -5.413963317871094, "global_step": 28340, "epoch": 674} {"train_loss": -5.460178852081299, "global_step": 28341, "epoch": 674} {"train_loss": -5.452407360076904, "global_step": 28342, "epoch": 674} {"train_loss": -5.498420238494873, "global_step": 28343, "epoch": 674} {"train_loss": -5.362529754638672, "global_step": 28344, "epoch": 674} {"train_loss": -5.467937469482422, "global_step": 28345, "epoch": 674} {"train_loss": -5.424846649169922, "global_step": 28346, "epoch": 674} {"train_loss": -5.628293514251709, "global_step": 28347, "epoch": 674} {"train_loss": -5.328434944152832, "global_step": 28348, "epoch": 674} {"train_loss": -5.430795011066255, "global_step": 28349, "epoch": 674, "val_loss": 75219.3359375} {"train_loss": -5.440464019775391, "global_step": 28350, "epoch": 675} {"train_loss": -5.423065662384033, "global_step": 28351, "epoch": 675} {"train_loss": -5.32806396484375, "global_step": 28352, "epoch": 675} {"train_loss": -5.500619411468506, "global_step": 28353, "epoch": 675} {"train_loss": -5.42143440246582, "global_step": 28354, "epoch": 675} {"train_loss": -5.4141526222229, "global_step": 28355, "epoch": 675} {"train_loss": -5.378611087799072, "global_step": 28356, "epoch": 675} {"train_loss": -5.367351531982422, "global_step": 28357, "epoch": 675} {"train_loss": -5.441863059997559, "global_step": 28358, "epoch": 675} {"train_loss": -5.326011657714844, "global_step": 28359, "epoch": 675} {"train_loss": -5.393945693969727, "global_step": 28360, "epoch": 675} {"train_loss": -5.499961853027344, "global_step": 28361, "epoch": 675} {"train_loss": -5.457226276397705, "global_step": 28362, "epoch": 675} {"train_loss": -5.321658134460449, "global_step": 28363, "epoch": 675} {"train_loss": -5.374324321746826, "global_step": 28364, "epoch": 675} {"train_loss": -5.513424396514893, "global_step": 28365, "epoch": 675} {"train_loss": -5.360531330108643, "global_step": 28366, "epoch": 675} {"train_loss": -5.4409499168396, "global_step": 28367, "epoch": 675} {"train_loss": -5.474066257476807, "global_step": 28368, "epoch": 675} {"train_loss": -5.5313615798950195, "global_step": 28369, "epoch": 675} {"train_loss": -5.53057336807251, "global_step": 28370, "epoch": 675} {"train_loss": -5.662962913513184, "global_step": 28371, "epoch": 675} {"train_loss": -5.532537460327148, "global_step": 28372, "epoch": 675} {"train_loss": -5.391669273376465, "global_step": 28373, "epoch": 675} {"train_loss": -5.295727729797363, "global_step": 28374, "epoch": 675} {"train_loss": -5.529136657714844, "global_step": 28375, "epoch": 675} {"train_loss": -5.352383613586426, "global_step": 28376, "epoch": 675} {"train_loss": -5.489583969116211, "global_step": 28377, "epoch": 675} {"train_loss": -5.432939529418945, "global_step": 28378, "epoch": 675} {"train_loss": -5.504066467285156, "global_step": 28379, "epoch": 675} {"train_loss": -5.264278411865234, "global_step": 28380, "epoch": 675} {"train_loss": -5.440847396850586, "global_step": 28381, "epoch": 675} {"train_loss": -5.4114298820495605, "global_step": 28382, "epoch": 675} {"train_loss": -5.3677754402160645, "global_step": 28383, "epoch": 675} {"train_loss": -5.369133472442627, "global_step": 28384, "epoch": 675} {"train_loss": -5.328131675720215, "global_step": 28385, "epoch": 675} {"train_loss": -5.35581111907959, "global_step": 28386, "epoch": 675} {"train_loss": -5.4801764488220215, "global_step": 28387, "epoch": 675} {"train_loss": -5.2064104080200195, "global_step": 28388, "epoch": 675} {"train_loss": -5.467662811279297, "global_step": 28389, "epoch": 675} {"train_loss": -5.269089698791504, "global_step": 28390, "epoch": 675} {"train_loss": -5.417523429507301, "global_step": 28391, "epoch": 675, "val_loss": 75406.9375} {"train_loss": -5.461313247680664, "global_step": 28392, "epoch": 676} {"train_loss": -5.33400821685791, "global_step": 28393, "epoch": 676} {"train_loss": -5.513834476470947, "global_step": 28394, "epoch": 676} {"train_loss": -5.4027581214904785, "global_step": 28395, "epoch": 676} {"train_loss": -5.494452953338623, "global_step": 28396, "epoch": 676} {"train_loss": -5.405266761779785, "global_step": 28397, "epoch": 676} {"train_loss": -5.377154350280762, "global_step": 28398, "epoch": 676} {"train_loss": -5.361435890197754, "global_step": 28399, "epoch": 676} {"train_loss": -5.4405975341796875, "global_step": 28400, "epoch": 676} {"train_loss": -5.424259185791016, "global_step": 28401, "epoch": 676} {"train_loss": -5.378993988037109, "global_step": 28402, "epoch": 676} {"train_loss": -5.510822296142578, "global_step": 28403, "epoch": 676} {"train_loss": -5.480138778686523, "global_step": 28404, "epoch": 676} {"train_loss": -5.468056678771973, "global_step": 28405, "epoch": 676} {"train_loss": -5.47670841217041, "global_step": 28406, "epoch": 676} {"train_loss": -5.490497589111328, "global_step": 28407, "epoch": 676} {"train_loss": -5.3317365646362305, "global_step": 28408, "epoch": 676} {"train_loss": -5.449496269226074, "global_step": 28409, "epoch": 676} {"train_loss": -5.509240627288818, "global_step": 28410, "epoch": 676} {"train_loss": -5.468507766723633, "global_step": 28411, "epoch": 676} {"train_loss": -5.5199174880981445, "global_step": 28412, "epoch": 676} {"train_loss": -5.51188850402832, "global_step": 28413, "epoch": 676} {"train_loss": -5.633975982666016, "global_step": 28414, "epoch": 676} {"train_loss": -5.333930969238281, "global_step": 28415, "epoch": 676} {"train_loss": -5.459237098693848, "global_step": 28416, "epoch": 676} {"train_loss": -5.407575607299805, "global_step": 28417, "epoch": 676} {"train_loss": -5.64318323135376, "global_step": 28418, "epoch": 676} {"train_loss": -5.53201961517334, "global_step": 28419, "epoch": 676} {"train_loss": -5.4435505867004395, "global_step": 28420, "epoch": 676} {"train_loss": -5.46834659576416, "global_step": 28421, "epoch": 676} {"train_loss": -5.349676132202148, "global_step": 28422, "epoch": 676} {"train_loss": -5.463833808898926, "global_step": 28423, "epoch": 676} {"train_loss": -5.560760021209717, "global_step": 28424, "epoch": 676} {"train_loss": -5.42340087890625, "global_step": 28425, "epoch": 676} {"train_loss": -5.405732154846191, "global_step": 28426, "epoch": 676} {"train_loss": -5.293876647949219, "global_step": 28427, "epoch": 676} {"train_loss": -5.491466522216797, "global_step": 28428, "epoch": 676} {"train_loss": -5.451140403747559, "global_step": 28429, "epoch": 676} {"train_loss": -5.441716194152832, "global_step": 28430, "epoch": 676} {"train_loss": -5.539451599121094, "global_step": 28431, "epoch": 676} {"train_loss": -5.322271347045898, "global_step": 28432, "epoch": 676} {"train_loss": -5.448044300079346, "global_step": 28433, "epoch": 676, "val_loss": 76005.6875} {"train_loss": -5.522092819213867, "global_step": 28434, "epoch": 677} {"train_loss": -5.570023536682129, "global_step": 28435, "epoch": 677} {"train_loss": -5.42467737197876, "global_step": 28436, "epoch": 677} {"train_loss": -5.437747001647949, "global_step": 28437, "epoch": 677} {"train_loss": -5.380836486816406, "global_step": 28438, "epoch": 677} {"train_loss": -5.43125581741333, "global_step": 28439, "epoch": 677} {"train_loss": -5.521844863891602, "global_step": 28440, "epoch": 677} {"train_loss": -5.417688369750977, "global_step": 28441, "epoch": 677} {"train_loss": -5.41282844543457, "global_step": 28442, "epoch": 677} {"train_loss": -5.388261795043945, "global_step": 28443, "epoch": 677} {"train_loss": -5.453649520874023, "global_step": 28444, "epoch": 677} {"train_loss": -5.406045436859131, "global_step": 28445, "epoch": 677} {"train_loss": -5.451725006103516, "global_step": 28446, "epoch": 677} {"train_loss": -5.426596641540527, "global_step": 28447, "epoch": 677} {"train_loss": -5.504129886627197, "global_step": 28448, "epoch": 677} {"train_loss": -5.470989227294922, "global_step": 28449, "epoch": 677} {"train_loss": -5.495014667510986, "global_step": 28450, "epoch": 677} {"train_loss": -5.3237481117248535, "global_step": 28451, "epoch": 677} {"train_loss": -5.525111198425293, "global_step": 28452, "epoch": 677} {"train_loss": -5.3629536628723145, "global_step": 28453, "epoch": 677} {"train_loss": -5.419280052185059, "global_step": 28454, "epoch": 677} {"train_loss": -5.529776573181152, "global_step": 28455, "epoch": 677} {"train_loss": -5.437705039978027, "global_step": 28456, "epoch": 677} {"train_loss": -5.416311264038086, "global_step": 28457, "epoch": 677} {"train_loss": -5.496297836303711, "global_step": 28458, "epoch": 677} {"train_loss": -5.282094955444336, "global_step": 28459, "epoch": 677} {"train_loss": -5.482526779174805, "global_step": 28460, "epoch": 677} {"train_loss": -5.535239219665527, "global_step": 28461, "epoch": 677} {"train_loss": -5.376997947692871, "global_step": 28462, "epoch": 677} {"train_loss": -5.437126159667969, "global_step": 28463, "epoch": 677} {"train_loss": -5.376167297363281, "global_step": 28464, "epoch": 677} {"train_loss": -5.436574935913086, "global_step": 28465, "epoch": 677} {"train_loss": -5.424921989440918, "global_step": 28466, "epoch": 677} {"train_loss": -5.406371593475342, "global_step": 28467, "epoch": 677} {"train_loss": -5.4450788497924805, "global_step": 28468, "epoch": 677} {"train_loss": -5.4805908203125, "global_step": 28469, "epoch": 677} {"train_loss": -5.287141799926758, "global_step": 28470, "epoch": 677} {"train_loss": -5.4960150718688965, "global_step": 28471, "epoch": 677} {"train_loss": -5.43434476852417, "global_step": 28472, "epoch": 677} {"train_loss": -5.474878311157227, "global_step": 28473, "epoch": 677} {"train_loss": -5.568479061126709, "global_step": 28474, "epoch": 677} {"train_loss": -5.442971116020566, "global_step": 28475, "epoch": 677, "val_loss": 75573.21875} {"train_loss": -5.512768268585205, "global_step": 28476, "epoch": 678} {"train_loss": -5.428140640258789, "global_step": 28477, "epoch": 678} {"train_loss": -5.411833763122559, "global_step": 28478, "epoch": 678} {"train_loss": -5.492521286010742, "global_step": 28479, "epoch": 678} {"train_loss": -5.471117973327637, "global_step": 28480, "epoch": 678} {"train_loss": -5.382781028747559, "global_step": 28481, "epoch": 678} {"train_loss": -5.36541223526001, "global_step": 28482, "epoch": 678} {"train_loss": -5.371210098266602, "global_step": 28483, "epoch": 678} {"train_loss": -5.276939392089844, "global_step": 28484, "epoch": 678} {"train_loss": -5.382808208465576, "global_step": 28485, "epoch": 678} {"train_loss": -5.448581695556641, "global_step": 28486, "epoch": 678} {"train_loss": -5.291382789611816, "global_step": 28487, "epoch": 678} {"train_loss": -5.436781883239746, "global_step": 28488, "epoch": 678} {"train_loss": -5.470259666442871, "global_step": 28489, "epoch": 678} {"train_loss": -5.298781394958496, "global_step": 28490, "epoch": 678} {"train_loss": -5.409975528717041, "global_step": 28491, "epoch": 678} {"train_loss": -5.3027849197387695, "global_step": 28492, "epoch": 678} {"train_loss": -5.323613166809082, "global_step": 28493, "epoch": 678} {"train_loss": -5.253562927246094, "global_step": 28494, "epoch": 678} {"train_loss": -5.360631465911865, "global_step": 28495, "epoch": 678} {"train_loss": -5.4555253982543945, "global_step": 28496, "epoch": 678} {"train_loss": -5.42470645904541, "global_step": 28497, "epoch": 678} {"train_loss": -5.512561321258545, "global_step": 28498, "epoch": 678} {"train_loss": -5.293569564819336, "global_step": 28499, "epoch": 678} {"train_loss": -5.539236068725586, "global_step": 28500, "epoch": 678} {"train_loss": -5.441470146179199, "global_step": 28501, "epoch": 678} {"train_loss": -5.510148525238037, "global_step": 28502, "epoch": 678} {"train_loss": -5.447424411773682, "global_step": 28503, "epoch": 678} {"train_loss": -5.5766921043396, "global_step": 28504, "epoch": 678} {"train_loss": -5.554291248321533, "global_step": 28505, "epoch": 678} {"train_loss": -5.42120361328125, "global_step": 28506, "epoch": 678} {"train_loss": -5.543720245361328, "global_step": 28507, "epoch": 678} {"train_loss": -5.344235420227051, "global_step": 28508, "epoch": 678} {"train_loss": -5.5514678955078125, "global_step": 28509, "epoch": 678} {"train_loss": -5.497816562652588, "global_step": 28510, "epoch": 678} {"train_loss": -5.413857936859131, "global_step": 28511, "epoch": 678} {"train_loss": -5.491342544555664, "global_step": 28512, "epoch": 678} {"train_loss": -5.443965911865234, "global_step": 28513, "epoch": 678} {"train_loss": -5.439664840698242, "global_step": 28514, "epoch": 678} {"train_loss": -5.346282482147217, "global_step": 28515, "epoch": 678} {"train_loss": -5.404633522033691, "global_step": 28516, "epoch": 678} {"train_loss": -5.423558575766427, "global_step": 28517, "epoch": 678, "val_loss": 75204.96875} {"train_loss": -5.492319107055664, "global_step": 28518, "epoch": 679} {"train_loss": -5.404904365539551, "global_step": 28519, "epoch": 679} {"train_loss": -5.505974292755127, "global_step": 28520, "epoch": 679} {"train_loss": -5.413299560546875, "global_step": 28521, "epoch": 679} {"train_loss": -5.289975643157959, "global_step": 28522, "epoch": 679} {"train_loss": -5.37154483795166, "global_step": 28523, "epoch": 679} {"train_loss": -5.347056865692139, "global_step": 28524, "epoch": 679} {"train_loss": -5.458611965179443, "global_step": 28525, "epoch": 679} {"train_loss": -5.5885491371154785, "global_step": 28526, "epoch": 679} {"train_loss": -5.219093322753906, "global_step": 28527, "epoch": 679} {"train_loss": -5.413419723510742, "global_step": 28528, "epoch": 679} {"train_loss": -5.423679351806641, "global_step": 28529, "epoch": 679} {"train_loss": -5.500500679016113, "global_step": 28530, "epoch": 679} {"train_loss": -5.529501914978027, "global_step": 28531, "epoch": 679} {"train_loss": -5.506185531616211, "global_step": 28532, "epoch": 679} {"train_loss": -5.4312639236450195, "global_step": 28533, "epoch": 679} {"train_loss": -5.599906921386719, "global_step": 28534, "epoch": 679} {"train_loss": -5.405654430389404, "global_step": 28535, "epoch": 679} {"train_loss": -5.39808464050293, "global_step": 28536, "epoch": 679} {"train_loss": -5.494406700134277, "global_step": 28537, "epoch": 679} {"train_loss": -5.472483158111572, "global_step": 28538, "epoch": 679} {"train_loss": -5.433144569396973, "global_step": 28539, "epoch": 679} {"train_loss": -5.488245964050293, "global_step": 28540, "epoch": 679} {"train_loss": -5.44256591796875, "global_step": 28541, "epoch": 679} {"train_loss": -5.36806583404541, "global_step": 28542, "epoch": 679} {"train_loss": -5.3701605796813965, "global_step": 28543, "epoch": 679} {"train_loss": -5.641451358795166, "global_step": 28544, "epoch": 679} {"train_loss": -5.411689281463623, "global_step": 28545, "epoch": 679} {"train_loss": -5.508646011352539, "global_step": 28546, "epoch": 679} {"train_loss": -5.441871643066406, "global_step": 28547, "epoch": 679} {"train_loss": -5.434346675872803, "global_step": 28548, "epoch": 679} {"train_loss": -5.525710105895996, "global_step": 28549, "epoch": 679} {"train_loss": -5.4143571853637695, "global_step": 28550, "epoch": 679} {"train_loss": -5.336788177490234, "global_step": 28551, "epoch": 679} {"train_loss": -5.434571266174316, "global_step": 28552, "epoch": 679} {"train_loss": -5.377657890319824, "global_step": 28553, "epoch": 679} {"train_loss": -5.479994297027588, "global_step": 28554, "epoch": 679} {"train_loss": -5.576181411743164, "global_step": 28555, "epoch": 679} {"train_loss": -5.364797592163086, "global_step": 28556, "epoch": 679} {"train_loss": -5.229745864868164, "global_step": 28557, "epoch": 679} {"train_loss": -5.436941146850586, "global_step": 28558, "epoch": 679} {"train_loss": -5.438968079430716, "global_step": 28559, "epoch": 679, "val_loss": 75770.8046875} {"train_loss": -5.394896984100342, "global_step": 28560, "epoch": 680} {"train_loss": -5.400568962097168, "global_step": 28561, "epoch": 680} {"train_loss": -5.531246185302734, "global_step": 28562, "epoch": 680} {"train_loss": -5.350342273712158, "global_step": 28563, "epoch": 680} {"train_loss": -5.632134914398193, "global_step": 28564, "epoch": 680} {"train_loss": -5.52979850769043, "global_step": 28565, "epoch": 680} {"train_loss": -5.366236686706543, "global_step": 28566, "epoch": 680} {"train_loss": -5.484583854675293, "global_step": 28567, "epoch": 680} {"train_loss": -5.470660209655762, "global_step": 28568, "epoch": 680} {"train_loss": -5.425107479095459, "global_step": 28569, "epoch": 680} {"train_loss": -5.601041316986084, "global_step": 28570, "epoch": 680} {"train_loss": -5.464923858642578, "global_step": 28571, "epoch": 680} {"train_loss": -5.492412567138672, "global_step": 28572, "epoch": 680} {"train_loss": -5.56527042388916, "global_step": 28573, "epoch": 680} {"train_loss": -5.381082534790039, "global_step": 28574, "epoch": 680} {"train_loss": -5.413186550140381, "global_step": 28575, "epoch": 680} {"train_loss": -5.564482688903809, "global_step": 28576, "epoch": 680} {"train_loss": -5.405885696411133, "global_step": 28577, "epoch": 680} {"train_loss": -5.482796669006348, "global_step": 28578, "epoch": 680} {"train_loss": -5.48063850402832, "global_step": 28579, "epoch": 680} {"train_loss": -5.553450584411621, "global_step": 28580, "epoch": 680} {"train_loss": -5.321398735046387, "global_step": 28581, "epoch": 680} {"train_loss": -5.380411148071289, "global_step": 28582, "epoch": 680} {"train_loss": -5.3329973220825195, "global_step": 28583, "epoch": 680} {"train_loss": -5.503806114196777, "global_step": 28584, "epoch": 680} {"train_loss": -5.428954601287842, "global_step": 28585, "epoch": 680} {"train_loss": -5.589112281799316, "global_step": 28586, "epoch": 680} {"train_loss": -5.428830146789551, "global_step": 28587, "epoch": 680} {"train_loss": -5.432948112487793, "global_step": 28588, "epoch": 680} {"train_loss": -5.4038801193237305, "global_step": 28589, "epoch": 680} {"train_loss": -5.5346903800964355, "global_step": 28590, "epoch": 680} {"train_loss": -5.502950668334961, "global_step": 28591, "epoch": 680} {"train_loss": -5.509954452514648, "global_step": 28592, "epoch": 680} {"train_loss": -5.372725009918213, "global_step": 28593, "epoch": 680} {"train_loss": -5.436028480529785, "global_step": 28594, "epoch": 680} {"train_loss": -5.5409746170043945, "global_step": 28595, "epoch": 680} {"train_loss": -5.428330421447754, "global_step": 28596, "epoch": 680} {"train_loss": -5.420053958892822, "global_step": 28597, "epoch": 680} {"train_loss": -5.400881767272949, "global_step": 28598, "epoch": 680} {"train_loss": -5.385318756103516, "global_step": 28599, "epoch": 680} {"train_loss": -5.452540874481201, "global_step": 28600, "epoch": 680} {"train_loss": -5.458740461440313, "global_step": 28601, "epoch": 680, "val_loss": 75741.671875} {"train_loss": -5.524074554443359, "global_step": 28602, "epoch": 681} {"train_loss": -5.546018600463867, "global_step": 28603, "epoch": 681} {"train_loss": -5.501175403594971, "global_step": 28604, "epoch": 681} {"train_loss": -5.364964485168457, "global_step": 28605, "epoch": 681} {"train_loss": -5.5656633377075195, "global_step": 28606, "epoch": 681} {"train_loss": -5.449872016906738, "global_step": 28607, "epoch": 681} {"train_loss": -5.525906562805176, "global_step": 28608, "epoch": 681} {"train_loss": -5.506937026977539, "global_step": 28609, "epoch": 681} {"train_loss": -5.3102498054504395, "global_step": 28610, "epoch": 681} {"train_loss": -5.480968475341797, "global_step": 28611, "epoch": 681} {"train_loss": -5.3241119384765625, "global_step": 28612, "epoch": 681} {"train_loss": -5.528280258178711, "global_step": 28613, "epoch": 681} {"train_loss": -5.505866050720215, "global_step": 28614, "epoch": 681} {"train_loss": -5.307385444641113, "global_step": 28615, "epoch": 681} {"train_loss": -5.5594282150268555, "global_step": 28616, "epoch": 681} {"train_loss": -5.542285919189453, "global_step": 28617, "epoch": 681} {"train_loss": -5.45992374420166, "global_step": 28618, "epoch": 681} {"train_loss": -5.502408981323242, "global_step": 28619, "epoch": 681} {"train_loss": -5.424769878387451, "global_step": 28620, "epoch": 681} {"train_loss": -5.47629451751709, "global_step": 28621, "epoch": 681} {"train_loss": -5.346593856811523, "global_step": 28622, "epoch": 681} {"train_loss": -5.5213141441345215, "global_step": 28623, "epoch": 681} {"train_loss": -5.434388160705566, "global_step": 28624, "epoch": 681} {"train_loss": -5.484071731567383, "global_step": 28625, "epoch": 681} {"train_loss": -5.385453701019287, "global_step": 28626, "epoch": 681} {"train_loss": -5.359004974365234, "global_step": 28627, "epoch": 681} {"train_loss": -5.4943647384643555, "global_step": 28628, "epoch": 681} {"train_loss": -5.465256214141846, "global_step": 28629, "epoch": 681} {"train_loss": -5.482295989990234, "global_step": 28630, "epoch": 681} {"train_loss": -5.4905877113342285, "global_step": 28631, "epoch": 681} {"train_loss": -5.533158302307129, "global_step": 28632, "epoch": 681} {"train_loss": -5.33660888671875, "global_step": 28633, "epoch": 681} {"train_loss": -5.372129917144775, "global_step": 28634, "epoch": 681} {"train_loss": -5.5185112953186035, "global_step": 28635, "epoch": 681} {"train_loss": -5.530376434326172, "global_step": 28636, "epoch": 681} {"train_loss": -5.477504730224609, "global_step": 28637, "epoch": 681} {"train_loss": -5.485095977783203, "global_step": 28638, "epoch": 681} {"train_loss": -5.257199287414551, "global_step": 28639, "epoch": 681} {"train_loss": -5.4959716796875, "global_step": 28640, "epoch": 681} {"train_loss": -5.4641571044921875, "global_step": 28641, "epoch": 681} {"train_loss": -5.364677906036377, "global_step": 28642, "epoch": 681} {"train_loss": -5.452932119369507, "global_step": 28643, "epoch": 681, "val_loss": 75675.1796875} {"train_loss": -5.563867092132568, "global_step": 28644, "epoch": 682} {"train_loss": -5.424689769744873, "global_step": 28645, "epoch": 682} {"train_loss": -5.313331604003906, "global_step": 28646, "epoch": 682} {"train_loss": -5.4171295166015625, "global_step": 28647, "epoch": 682} {"train_loss": -5.541525840759277, "global_step": 28648, "epoch": 682} {"train_loss": -5.418909072875977, "global_step": 28649, "epoch": 682} {"train_loss": -5.394416809082031, "global_step": 28650, "epoch": 682} {"train_loss": -5.637810707092285, "global_step": 28651, "epoch": 682} {"train_loss": -5.486451148986816, "global_step": 28652, "epoch": 682} {"train_loss": -5.439820289611816, "global_step": 28653, "epoch": 682} {"train_loss": -5.386565208435059, "global_step": 28654, "epoch": 682} {"train_loss": -5.529725074768066, "global_step": 28655, "epoch": 682} {"train_loss": -5.619157791137695, "global_step": 28656, "epoch": 682} {"train_loss": -5.413689613342285, "global_step": 28657, "epoch": 682} {"train_loss": -5.521960735321045, "global_step": 28658, "epoch": 682} {"train_loss": -5.542888164520264, "global_step": 28659, "epoch": 682} {"train_loss": -5.470975399017334, "global_step": 28660, "epoch": 682} {"train_loss": -5.409496307373047, "global_step": 28661, "epoch": 682} {"train_loss": -5.409926891326904, "global_step": 28662, "epoch": 682} {"train_loss": -5.349155426025391, "global_step": 28663, "epoch": 682} {"train_loss": -5.508261680603027, "global_step": 28664, "epoch": 682} {"train_loss": -5.388731956481934, "global_step": 28665, "epoch": 682} {"train_loss": -5.5241570472717285, "global_step": 28666, "epoch": 682} {"train_loss": -5.416506767272949, "global_step": 28667, "epoch": 682} {"train_loss": -5.453395843505859, "global_step": 28668, "epoch": 682} {"train_loss": -5.504355430603027, "global_step": 28669, "epoch": 682} {"train_loss": -5.548415184020996, "global_step": 28670, "epoch": 682} {"train_loss": -5.466412544250488, "global_step": 28671, "epoch": 682} {"train_loss": -5.475332260131836, "global_step": 28672, "epoch": 682} {"train_loss": -5.477218151092529, "global_step": 28673, "epoch": 682} {"train_loss": -5.564043998718262, "global_step": 28674, "epoch": 682} {"train_loss": -5.416053771972656, "global_step": 28675, "epoch": 682} {"train_loss": -5.46782922744751, "global_step": 28676, "epoch": 682} {"train_loss": -5.460171699523926, "global_step": 28677, "epoch": 682} {"train_loss": -5.441641807556152, "global_step": 28678, "epoch": 682} {"train_loss": -5.442949295043945, "global_step": 28679, "epoch": 682} {"train_loss": -5.419217109680176, "global_step": 28680, "epoch": 682} {"train_loss": -5.473179817199707, "global_step": 28681, "epoch": 682} {"train_loss": -5.5192179679870605, "global_step": 28682, "epoch": 682} {"train_loss": -5.41422700881958, "global_step": 28683, "epoch": 682} {"train_loss": -5.371050834655762, "global_step": 28684, "epoch": 682} {"train_loss": -5.464507568450201, "global_step": 28685, "epoch": 682, "val_loss": 75533.1015625} {"train_loss": -5.365439414978027, "global_step": 28686, "epoch": 683} {"train_loss": -5.36503267288208, "global_step": 28687, "epoch": 683} {"train_loss": -5.3820295333862305, "global_step": 28688, "epoch": 683} {"train_loss": -5.479674816131592, "global_step": 28689, "epoch": 683} {"train_loss": -5.402405261993408, "global_step": 28690, "epoch": 683} {"train_loss": -5.369799613952637, "global_step": 28691, "epoch": 683} {"train_loss": -5.432778358459473, "global_step": 28692, "epoch": 683} {"train_loss": -5.398481845855713, "global_step": 28693, "epoch": 683} {"train_loss": -5.489378929138184, "global_step": 28694, "epoch": 683} {"train_loss": -5.425333023071289, "global_step": 28695, "epoch": 683} {"train_loss": -5.2841596603393555, "global_step": 28696, "epoch": 683} {"train_loss": -5.4094953536987305, "global_step": 28697, "epoch": 683} {"train_loss": -5.4774017333984375, "global_step": 28698, "epoch": 683} {"train_loss": -5.493724822998047, "global_step": 28699, "epoch": 683} {"train_loss": -5.419154167175293, "global_step": 28700, "epoch": 683} {"train_loss": -5.4259724617004395, "global_step": 28701, "epoch": 683} {"train_loss": -5.443863868713379, "global_step": 28702, "epoch": 683} {"train_loss": -5.475888252258301, "global_step": 28703, "epoch": 683} {"train_loss": -5.402817726135254, "global_step": 28704, "epoch": 683} {"train_loss": -5.389516830444336, "global_step": 28705, "epoch": 683} {"train_loss": -5.415579319000244, "global_step": 28706, "epoch": 683} {"train_loss": -5.592935562133789, "global_step": 28707, "epoch": 683} {"train_loss": -5.485695838928223, "global_step": 28708, "epoch": 683} {"train_loss": -5.586545944213867, "global_step": 28709, "epoch": 683} {"train_loss": -5.496442794799805, "global_step": 28710, "epoch": 683} {"train_loss": -5.4648542404174805, "global_step": 28711, "epoch": 683} {"train_loss": -5.497900009155273, "global_step": 28712, "epoch": 683} {"train_loss": -5.5373005867004395, "global_step": 28713, "epoch": 683} {"train_loss": -5.453065872192383, "global_step": 28714, "epoch": 683} {"train_loss": -5.52182674407959, "global_step": 28715, "epoch": 683} {"train_loss": -5.503510475158691, "global_step": 28716, "epoch": 683} {"train_loss": -5.510499000549316, "global_step": 28717, "epoch": 683} {"train_loss": -5.397477149963379, "global_step": 28718, "epoch": 683} {"train_loss": -5.393860816955566, "global_step": 28719, "epoch": 683} {"train_loss": -5.482647895812988, "global_step": 28720, "epoch": 683} {"train_loss": -5.4389495849609375, "global_step": 28721, "epoch": 683} {"train_loss": -5.442155838012695, "global_step": 28722, "epoch": 683} {"train_loss": -5.432331085205078, "global_step": 28723, "epoch": 683} {"train_loss": -5.345970630645752, "global_step": 28724, "epoch": 683} {"train_loss": -5.44014310836792, "global_step": 28725, "epoch": 683} {"train_loss": -5.466334342956543, "global_step": 28726, "epoch": 683} {"train_loss": -5.447059915179298, "global_step": 28727, "epoch": 683, "val_loss": 75147.4140625} {"train_loss": -5.368141174316406, "global_step": 28728, "epoch": 684} {"train_loss": -5.429452896118164, "global_step": 28729, "epoch": 684} {"train_loss": -5.415398597717285, "global_step": 28730, "epoch": 684} {"train_loss": -5.409002304077148, "global_step": 28731, "epoch": 684} {"train_loss": -5.554136276245117, "global_step": 28732, "epoch": 684} {"train_loss": -5.537341594696045, "global_step": 28733, "epoch": 684} {"train_loss": -5.303785800933838, "global_step": 28734, "epoch": 684} {"train_loss": -5.545039176940918, "global_step": 28735, "epoch": 684} {"train_loss": -5.415928363800049, "global_step": 28736, "epoch": 684} {"train_loss": -5.393937587738037, "global_step": 28737, "epoch": 684} {"train_loss": -5.442784786224365, "global_step": 28738, "epoch": 684} {"train_loss": -5.4829254150390625, "global_step": 28739, "epoch": 684} {"train_loss": -5.500894069671631, "global_step": 28740, "epoch": 684} {"train_loss": -5.506332874298096, "global_step": 28741, "epoch": 684} {"train_loss": -5.492231369018555, "global_step": 28742, "epoch": 684} {"train_loss": -5.524045944213867, "global_step": 28743, "epoch": 684} {"train_loss": -5.58734130859375, "global_step": 28744, "epoch": 684} {"train_loss": -5.448330402374268, "global_step": 28745, "epoch": 684} {"train_loss": -5.477195739746094, "global_step": 28746, "epoch": 684} {"train_loss": -5.489156723022461, "global_step": 28747, "epoch": 684} {"train_loss": -5.44820499420166, "global_step": 28748, "epoch": 684} {"train_loss": -5.491353988647461, "global_step": 28749, "epoch": 684} {"train_loss": -5.404270172119141, "global_step": 28750, "epoch": 684} {"train_loss": -5.381871223449707, "global_step": 28751, "epoch": 684} {"train_loss": -5.459806442260742, "global_step": 28752, "epoch": 684} {"train_loss": -5.487597942352295, "global_step": 28753, "epoch": 684} {"train_loss": -5.353097438812256, "global_step": 28754, "epoch": 684} {"train_loss": -5.401871681213379, "global_step": 28755, "epoch": 684} {"train_loss": -5.4413275718688965, "global_step": 28756, "epoch": 684} {"train_loss": -5.425447463989258, "global_step": 28757, "epoch": 684} {"train_loss": -5.526935577392578, "global_step": 28758, "epoch": 684} {"train_loss": -5.392658233642578, "global_step": 28759, "epoch": 684} {"train_loss": -5.41989278793335, "global_step": 28760, "epoch": 684} {"train_loss": -5.629057884216309, "global_step": 28761, "epoch": 684} {"train_loss": -5.415978908538818, "global_step": 28762, "epoch": 684} {"train_loss": -5.370975494384766, "global_step": 28763, "epoch": 684} {"train_loss": -5.4727396965026855, "global_step": 28764, "epoch": 684} {"train_loss": -5.2877373695373535, "global_step": 28765, "epoch": 684} {"train_loss": -5.505893707275391, "global_step": 28766, "epoch": 684} {"train_loss": -5.500280857086182, "global_step": 28767, "epoch": 684} {"train_loss": -5.437393665313721, "global_step": 28768, "epoch": 684} {"train_loss": -5.453060729163034, "global_step": 28769, "epoch": 684, "val_loss": 75135.4921875} {"train_loss": -5.376148223876953, "global_step": 28770, "epoch": 685} {"train_loss": -5.476465225219727, "global_step": 28771, "epoch": 685} {"train_loss": -5.585649490356445, "global_step": 28772, "epoch": 685} {"train_loss": -5.429201126098633, "global_step": 28773, "epoch": 685} {"train_loss": -5.432453155517578, "global_step": 28774, "epoch": 685} {"train_loss": -5.500025749206543, "global_step": 28775, "epoch": 685} {"train_loss": -5.494838714599609, "global_step": 28776, "epoch": 685} {"train_loss": -5.3862409591674805, "global_step": 28777, "epoch": 685} {"train_loss": -5.469727516174316, "global_step": 28778, "epoch": 685} {"train_loss": -5.459835529327393, "global_step": 28779, "epoch": 685} {"train_loss": -5.516716003417969, "global_step": 28780, "epoch": 685} {"train_loss": -5.508811950683594, "global_step": 28781, "epoch": 685} {"train_loss": -5.509644031524658, "global_step": 28782, "epoch": 685} {"train_loss": -5.51386022567749, "global_step": 28783, "epoch": 685} {"train_loss": -5.58349609375, "global_step": 28784, "epoch": 685} {"train_loss": -5.403575897216797, "global_step": 28785, "epoch": 685} {"train_loss": -5.358788013458252, "global_step": 28786, "epoch": 685} {"train_loss": -5.549807071685791, "global_step": 28787, "epoch": 685} {"train_loss": -5.495899677276611, "global_step": 28788, "epoch": 685} {"train_loss": -5.39410924911499, "global_step": 28789, "epoch": 685} {"train_loss": -5.475647926330566, "global_step": 28790, "epoch": 685} {"train_loss": -5.548792839050293, "global_step": 28791, "epoch": 685} {"train_loss": -5.48957633972168, "global_step": 28792, "epoch": 685} {"train_loss": -5.559935092926025, "global_step": 28793, "epoch": 685} {"train_loss": -5.492198944091797, "global_step": 28794, "epoch": 685} {"train_loss": -5.373149871826172, "global_step": 28795, "epoch": 685} {"train_loss": -5.439929962158203, "global_step": 28796, "epoch": 685} {"train_loss": -5.510687351226807, "global_step": 28797, "epoch": 685} {"train_loss": -5.414351463317871, "global_step": 28798, "epoch": 685} {"train_loss": -5.489151954650879, "global_step": 28799, "epoch": 685} {"train_loss": -5.39531135559082, "global_step": 28800, "epoch": 685} {"train_loss": -5.400429725646973, "global_step": 28801, "epoch": 685} {"train_loss": -5.397670269012451, "global_step": 28802, "epoch": 685} {"train_loss": -5.497727870941162, "global_step": 28803, "epoch": 685} {"train_loss": -5.487730026245117, "global_step": 28804, "epoch": 685} {"train_loss": -5.560537338256836, "global_step": 28805, "epoch": 685} {"train_loss": -5.434258460998535, "global_step": 28806, "epoch": 685} {"train_loss": -5.333174705505371, "global_step": 28807, "epoch": 685} {"train_loss": -5.4423675537109375, "global_step": 28808, "epoch": 685} {"train_loss": -5.4060468673706055, "global_step": 28809, "epoch": 685} {"train_loss": -5.3249592781066895, "global_step": 28810, "epoch": 685} {"train_loss": -5.45891801516215, "global_step": 28811, "epoch": 685, "val_loss": 75346.5859375} {"train_loss": -5.5089921951293945, "global_step": 28812, "epoch": 686} {"train_loss": -5.492559432983398, "global_step": 28813, "epoch": 686} {"train_loss": -5.4262847900390625, "global_step": 28814, "epoch": 686} {"train_loss": -5.514777183532715, "global_step": 28815, "epoch": 686} {"train_loss": -5.624969005584717, "global_step": 28816, "epoch": 686} {"train_loss": -5.347863674163818, "global_step": 28817, "epoch": 686} {"train_loss": -5.518708229064941, "global_step": 28818, "epoch": 686} {"train_loss": -5.366199493408203, "global_step": 28819, "epoch": 686} {"train_loss": -5.421824932098389, "global_step": 28820, "epoch": 686} {"train_loss": -5.416889190673828, "global_step": 28821, "epoch": 686} {"train_loss": -5.380906105041504, "global_step": 28822, "epoch": 686} {"train_loss": -5.415134429931641, "global_step": 28823, "epoch": 686} {"train_loss": -5.364445686340332, "global_step": 28824, "epoch": 686} {"train_loss": -5.480844020843506, "global_step": 28825, "epoch": 686} {"train_loss": -5.5783467292785645, "global_step": 28826, "epoch": 686} {"train_loss": -5.45289421081543, "global_step": 28827, "epoch": 686} {"train_loss": -5.475332260131836, "global_step": 28828, "epoch": 686} {"train_loss": -5.428852081298828, "global_step": 28829, "epoch": 686} {"train_loss": -5.46126651763916, "global_step": 28830, "epoch": 686} {"train_loss": -5.396414279937744, "global_step": 28831, "epoch": 686} {"train_loss": -5.399874687194824, "global_step": 28832, "epoch": 686} {"train_loss": -5.428460597991943, "global_step": 28833, "epoch": 686} {"train_loss": -5.442910194396973, "global_step": 28834, "epoch": 686} {"train_loss": -5.425534725189209, "global_step": 28835, "epoch": 686} {"train_loss": -5.5694780349731445, "global_step": 28836, "epoch": 686} {"train_loss": -5.425949573516846, "global_step": 28837, "epoch": 686} {"train_loss": -5.540051460266113, "global_step": 28838, "epoch": 686} {"train_loss": -5.542240142822266, "global_step": 28839, "epoch": 686} {"train_loss": -5.3229475021362305, "global_step": 28840, "epoch": 686} {"train_loss": -5.432796478271484, "global_step": 28841, "epoch": 686} {"train_loss": -5.538259029388428, "global_step": 28842, "epoch": 686} {"train_loss": -5.387735366821289, "global_step": 28843, "epoch": 686} {"train_loss": -5.329773902893066, "global_step": 28844, "epoch": 686} {"train_loss": -5.388745307922363, "global_step": 28845, "epoch": 686} {"train_loss": -5.387734889984131, "global_step": 28846, "epoch": 686} {"train_loss": -5.462950706481934, "global_step": 28847, "epoch": 686} {"train_loss": -5.4547834396362305, "global_step": 28848, "epoch": 686} {"train_loss": -5.445957183837891, "global_step": 28849, "epoch": 686} {"train_loss": -5.485304355621338, "global_step": 28850, "epoch": 686} {"train_loss": -5.340544700622559, "global_step": 28851, "epoch": 686} {"train_loss": -5.431707382202148, "global_step": 28852, "epoch": 686} {"train_loss": -5.44553820292155, "global_step": 28853, "epoch": 686, "val_loss": 75438.6328125} {"train_loss": -5.432483673095703, "global_step": 28854, "epoch": 687} {"train_loss": -5.4831156730651855, "global_step": 28855, "epoch": 687} {"train_loss": -5.406851768493652, "global_step": 28856, "epoch": 687} {"train_loss": -5.454329490661621, "global_step": 28857, "epoch": 687} {"train_loss": -5.499224662780762, "global_step": 28858, "epoch": 687} {"train_loss": -5.384892463684082, "global_step": 28859, "epoch": 687} {"train_loss": -5.628478050231934, "global_step": 28860, "epoch": 687} {"train_loss": -5.370321273803711, "global_step": 28861, "epoch": 687} {"train_loss": -5.4863715171813965, "global_step": 28862, "epoch": 687} {"train_loss": -5.478809356689453, "global_step": 28863, "epoch": 687} {"train_loss": -5.5290703773498535, "global_step": 28864, "epoch": 687} {"train_loss": -5.3863325119018555, "global_step": 28865, "epoch": 687} {"train_loss": -5.46214485168457, "global_step": 28866, "epoch": 687} {"train_loss": -5.403566360473633, "global_step": 28867, "epoch": 687} {"train_loss": -5.590368747711182, "global_step": 28868, "epoch": 687} {"train_loss": -5.441883087158203, "global_step": 28869, "epoch": 687} {"train_loss": -5.579008102416992, "global_step": 28870, "epoch": 687} {"train_loss": -5.410900115966797, "global_step": 28871, "epoch": 687} {"train_loss": -5.580854892730713, "global_step": 28872, "epoch": 687} {"train_loss": -5.36251163482666, "global_step": 28873, "epoch": 687} {"train_loss": -5.463717460632324, "global_step": 28874, "epoch": 687} {"train_loss": -5.4095635414123535, "global_step": 28875, "epoch": 687} {"train_loss": -5.365688800811768, "global_step": 28876, "epoch": 687} {"train_loss": -5.50282621383667, "global_step": 28877, "epoch": 687} {"train_loss": -5.383973121643066, "global_step": 28878, "epoch": 687} {"train_loss": -5.490123748779297, "global_step": 28879, "epoch": 687} {"train_loss": -5.376367092132568, "global_step": 28880, "epoch": 687} {"train_loss": -5.328896999359131, "global_step": 28881, "epoch": 687} {"train_loss": -5.470148086547852, "global_step": 28882, "epoch": 687} {"train_loss": -5.392793655395508, "global_step": 28883, "epoch": 687} {"train_loss": -5.425593852996826, "global_step": 28884, "epoch": 687} {"train_loss": -5.395130157470703, "global_step": 28885, "epoch": 687} {"train_loss": -5.412034034729004, "global_step": 28886, "epoch": 687} {"train_loss": -5.477321624755859, "global_step": 28887, "epoch": 687} {"train_loss": -5.530247688293457, "global_step": 28888, "epoch": 687} {"train_loss": -5.455108642578125, "global_step": 28889, "epoch": 687} {"train_loss": -5.514955520629883, "global_step": 28890, "epoch": 687} {"train_loss": -5.443201065063477, "global_step": 28891, "epoch": 687} {"train_loss": -5.4437761306762695, "global_step": 28892, "epoch": 687} {"train_loss": -5.383725166320801, "global_step": 28893, "epoch": 687} {"train_loss": -5.50303840637207, "global_step": 28894, "epoch": 687} {"train_loss": -5.454155853816441, "global_step": 28895, "epoch": 687, "val_loss": 75152.734375} {"train_loss": -5.474045753479004, "global_step": 28896, "epoch": 688} {"train_loss": -5.582630157470703, "global_step": 28897, "epoch": 688} {"train_loss": -5.512087821960449, "global_step": 28898, "epoch": 688} {"train_loss": -5.400324821472168, "global_step": 28899, "epoch": 688} {"train_loss": -5.468374729156494, "global_step": 28900, "epoch": 688} {"train_loss": -5.5411553382873535, "global_step": 28901, "epoch": 688} {"train_loss": -5.411070346832275, "global_step": 28902, "epoch": 688} {"train_loss": -5.602470397949219, "global_step": 28903, "epoch": 688} {"train_loss": -5.521666049957275, "global_step": 28904, "epoch": 688} {"train_loss": -5.412647724151611, "global_step": 28905, "epoch": 688} {"train_loss": -5.626556396484375, "global_step": 28906, "epoch": 688} {"train_loss": -5.3888678550720215, "global_step": 28907, "epoch": 688} {"train_loss": -5.642703056335449, "global_step": 28908, "epoch": 688} {"train_loss": -5.474213600158691, "global_step": 28909, "epoch": 688} {"train_loss": -5.468658924102783, "global_step": 28910, "epoch": 688} {"train_loss": -5.5091681480407715, "global_step": 28911, "epoch": 688} {"train_loss": -5.463006973266602, "global_step": 28912, "epoch": 688} {"train_loss": -5.392531394958496, "global_step": 28913, "epoch": 688} {"train_loss": -5.321016311645508, "global_step": 28914, "epoch": 688} {"train_loss": -5.450169086456299, "global_step": 28915, "epoch": 688} {"train_loss": -5.260699272155762, "global_step": 28916, "epoch": 688} {"train_loss": -5.330193996429443, "global_step": 28917, "epoch": 688} {"train_loss": -5.505070686340332, "global_step": 28918, "epoch": 688} {"train_loss": -5.494786262512207, "global_step": 28919, "epoch": 688} {"train_loss": -5.397886276245117, "global_step": 28920, "epoch": 688} {"train_loss": -5.238525867462158, "global_step": 28921, "epoch": 688} {"train_loss": -5.450014114379883, "global_step": 28922, "epoch": 688} {"train_loss": -5.26924991607666, "global_step": 28923, "epoch": 688} {"train_loss": -5.45298957824707, "global_step": 28924, "epoch": 688} {"train_loss": -5.439767837524414, "global_step": 28925, "epoch": 688} {"train_loss": -5.32145357131958, "global_step": 28926, "epoch": 688} {"train_loss": -5.555074691772461, "global_step": 28927, "epoch": 688} {"train_loss": -5.536501407623291, "global_step": 28928, "epoch": 688} {"train_loss": -5.4301371574401855, "global_step": 28929, "epoch": 688} {"train_loss": -5.532842636108398, "global_step": 28930, "epoch": 688} {"train_loss": -5.436028480529785, "global_step": 28931, "epoch": 688} {"train_loss": -5.274923324584961, "global_step": 28932, "epoch": 688} {"train_loss": -5.545409202575684, "global_step": 28933, "epoch": 688} {"train_loss": -5.336629390716553, "global_step": 28934, "epoch": 688} {"train_loss": -5.316171646118164, "global_step": 28935, "epoch": 688} {"train_loss": -5.587047576904297, "global_step": 28936, "epoch": 688} {"train_loss": -5.446229616800944, "global_step": 28937, "epoch": 688, "val_loss": 75615.5625} {"train_loss": -5.485799789428711, "global_step": 28938, "epoch": 689} {"train_loss": -5.364923000335693, "global_step": 28939, "epoch": 689} {"train_loss": -5.444879531860352, "global_step": 28940, "epoch": 689} {"train_loss": -5.500870704650879, "global_step": 28941, "epoch": 689} {"train_loss": -5.441000938415527, "global_step": 28942, "epoch": 689} {"train_loss": -5.348808288574219, "global_step": 28943, "epoch": 689} {"train_loss": -5.527793884277344, "global_step": 28944, "epoch": 689} {"train_loss": -5.370633125305176, "global_step": 28945, "epoch": 689} {"train_loss": -5.3968505859375, "global_step": 28946, "epoch": 689} {"train_loss": -5.551302433013916, "global_step": 28947, "epoch": 689} {"train_loss": -5.311845779418945, "global_step": 28948, "epoch": 689} {"train_loss": -5.402985095977783, "global_step": 28949, "epoch": 689} {"train_loss": -5.458293437957764, "global_step": 28950, "epoch": 689} {"train_loss": -5.39489221572876, "global_step": 28951, "epoch": 689} {"train_loss": -5.314148426055908, "global_step": 28952, "epoch": 689} {"train_loss": -5.31198787689209, "global_step": 28953, "epoch": 689} {"train_loss": -5.357169151306152, "global_step": 28954, "epoch": 689} {"train_loss": -5.395689964294434, "global_step": 28955, "epoch": 689} {"train_loss": -5.464840412139893, "global_step": 28956, "epoch": 689} {"train_loss": -5.569923400878906, "global_step": 28957, "epoch": 689} {"train_loss": -5.498568534851074, "global_step": 28958, "epoch": 689} {"train_loss": -5.519245147705078, "global_step": 28959, "epoch": 689} {"train_loss": -5.377644062042236, "global_step": 28960, "epoch": 689} {"train_loss": -5.342306137084961, "global_step": 28961, "epoch": 689} {"train_loss": -5.590486526489258, "global_step": 28962, "epoch": 689} {"train_loss": -5.5174407958984375, "global_step": 28963, "epoch": 689} {"train_loss": -5.520346641540527, "global_step": 28964, "epoch": 689} {"train_loss": -5.581093788146973, "global_step": 28965, "epoch": 689} {"train_loss": -5.47068977355957, "global_step": 28966, "epoch": 689} {"train_loss": -5.4945807456970215, "global_step": 28967, "epoch": 689} {"train_loss": -5.617674827575684, "global_step": 28968, "epoch": 689} {"train_loss": -5.4311723709106445, "global_step": 28969, "epoch": 689} {"train_loss": -5.415427207946777, "global_step": 28970, "epoch": 689} {"train_loss": -5.4653520584106445, "global_step": 28971, "epoch": 689} {"train_loss": -5.549089431762695, "global_step": 28972, "epoch": 689} {"train_loss": -5.527052402496338, "global_step": 28973, "epoch": 689} {"train_loss": -5.444180965423584, "global_step": 28974, "epoch": 689} {"train_loss": -5.522995471954346, "global_step": 28975, "epoch": 689} {"train_loss": -5.52223539352417, "global_step": 28976, "epoch": 689} {"train_loss": -5.463489532470703, "global_step": 28977, "epoch": 689} {"train_loss": -5.428177356719971, "global_step": 28978, "epoch": 689} {"train_loss": -5.453522636776879, "global_step": 28979, "epoch": 689, "val_loss": 75613.8984375} {"train_loss": -5.486237525939941, "global_step": 28980, "epoch": 690} {"train_loss": -5.538308620452881, "global_step": 28981, "epoch": 690} {"train_loss": -5.550151824951172, "global_step": 28982, "epoch": 690} {"train_loss": -5.552850723266602, "global_step": 28983, "epoch": 690} {"train_loss": -5.498137474060059, "global_step": 28984, "epoch": 690} {"train_loss": -5.443545341491699, "global_step": 28985, "epoch": 690} {"train_loss": -5.472538948059082, "global_step": 28986, "epoch": 690} {"train_loss": -5.495559215545654, "global_step": 28987, "epoch": 690} {"train_loss": -5.5392746925354, "global_step": 28988, "epoch": 690} {"train_loss": -5.571396827697754, "global_step": 28989, "epoch": 690} {"train_loss": -5.622244358062744, "global_step": 28990, "epoch": 690} {"train_loss": -5.475949764251709, "global_step": 28991, "epoch": 690} {"train_loss": -5.409626007080078, "global_step": 28992, "epoch": 690} {"train_loss": -5.552319526672363, "global_step": 28993, "epoch": 690} {"train_loss": -5.455427169799805, "global_step": 28994, "epoch": 690} {"train_loss": -5.47564172744751, "global_step": 28995, "epoch": 690} {"train_loss": -5.40980863571167, "global_step": 28996, "epoch": 690} {"train_loss": -5.388659477233887, "global_step": 28997, "epoch": 690} {"train_loss": -5.364198684692383, "global_step": 28998, "epoch": 690} {"train_loss": -5.429612636566162, "global_step": 28999, "epoch": 690} {"train_loss": -5.274846076965332, "global_step": 29000, "epoch": 690} {"train_loss": -5.666619300842285, "global_step": 29001, "epoch": 690} {"train_loss": -5.343686103820801, "global_step": 29002, "epoch": 690} {"train_loss": -5.465410232543945, "global_step": 29003, "epoch": 690} {"train_loss": -5.437932968139648, "global_step": 29004, "epoch": 690} {"train_loss": -5.403987884521484, "global_step": 29005, "epoch": 690} {"train_loss": -5.4427971839904785, "global_step": 29006, "epoch": 690} {"train_loss": -5.440302848815918, "global_step": 29007, "epoch": 690} {"train_loss": -5.421485900878906, "global_step": 29008, "epoch": 690} {"train_loss": -5.335961818695068, "global_step": 29009, "epoch": 690} {"train_loss": -5.464615345001221, "global_step": 29010, "epoch": 690} {"train_loss": -5.462471961975098, "global_step": 29011, "epoch": 690} {"train_loss": -5.438599586486816, "global_step": 29012, "epoch": 690} {"train_loss": -5.2293806076049805, "global_step": 29013, "epoch": 690} {"train_loss": -5.452700614929199, "global_step": 29014, "epoch": 690} {"train_loss": -5.402814865112305, "global_step": 29015, "epoch": 690} {"train_loss": -5.36200475692749, "global_step": 29016, "epoch": 690} {"train_loss": -5.455757141113281, "global_step": 29017, "epoch": 690} {"train_loss": -5.370729923248291, "global_step": 29018, "epoch": 690} {"train_loss": -5.276772499084473, "global_step": 29019, "epoch": 690} {"train_loss": -5.308483123779297, "global_step": 29020, "epoch": 690} {"train_loss": -5.439093351364136, "global_step": 29021, "epoch": 690, "val_loss": 75466.03125} {"train_loss": -5.434256553649902, "global_step": 29022, "epoch": 691} {"train_loss": -5.378479957580566, "global_step": 29023, "epoch": 691} {"train_loss": -5.3863959312438965, "global_step": 29024, "epoch": 691} {"train_loss": -5.5533447265625, "global_step": 29025, "epoch": 691} {"train_loss": -5.435200214385986, "global_step": 29026, "epoch": 691} {"train_loss": -5.4499993324279785, "global_step": 29027, "epoch": 691} {"train_loss": -5.42691707611084, "global_step": 29028, "epoch": 691} {"train_loss": -5.468228816986084, "global_step": 29029, "epoch": 691} {"train_loss": -5.5140533447265625, "global_step": 29030, "epoch": 691} {"train_loss": -5.411694049835205, "global_step": 29031, "epoch": 691} {"train_loss": -5.4301862716674805, "global_step": 29032, "epoch": 691} {"train_loss": -5.579192161560059, "global_step": 29033, "epoch": 691} {"train_loss": -5.3638596534729, "global_step": 29034, "epoch": 691} {"train_loss": -5.388040065765381, "global_step": 29035, "epoch": 691} {"train_loss": -5.376187324523926, "global_step": 29036, "epoch": 691} {"train_loss": -5.487643241882324, "global_step": 29037, "epoch": 691} {"train_loss": -5.317129135131836, "global_step": 29038, "epoch": 691} {"train_loss": -5.437228202819824, "global_step": 29039, "epoch": 691} {"train_loss": -5.406929016113281, "global_step": 29040, "epoch": 691} {"train_loss": -5.349594593048096, "global_step": 29041, "epoch": 691} {"train_loss": -5.399242401123047, "global_step": 29042, "epoch": 691} {"train_loss": -5.448285102844238, "global_step": 29043, "epoch": 691} {"train_loss": -5.547551155090332, "global_step": 29044, "epoch": 691} {"train_loss": -5.500034809112549, "global_step": 29045, "epoch": 691} {"train_loss": -5.369228363037109, "global_step": 29046, "epoch": 691} {"train_loss": -5.455533027648926, "global_step": 29047, "epoch": 691} {"train_loss": -5.495527267456055, "global_step": 29048, "epoch": 691} {"train_loss": -5.4273362159729, "global_step": 29049, "epoch": 691} {"train_loss": -5.542777061462402, "global_step": 29050, "epoch": 691} {"train_loss": -5.411529541015625, "global_step": 29051, "epoch": 691} {"train_loss": -5.475151062011719, "global_step": 29052, "epoch": 691} {"train_loss": -5.563655853271484, "global_step": 29053, "epoch": 691} {"train_loss": -5.377138614654541, "global_step": 29054, "epoch": 691} {"train_loss": -5.39844274520874, "global_step": 29055, "epoch": 691} {"train_loss": -5.44586706161499, "global_step": 29056, "epoch": 691} {"train_loss": -5.522521018981934, "global_step": 29057, "epoch": 691} {"train_loss": -5.4634504318237305, "global_step": 29058, "epoch": 691} {"train_loss": -5.427914619445801, "global_step": 29059, "epoch": 691} {"train_loss": -5.410401821136475, "global_step": 29060, "epoch": 691} {"train_loss": -5.363454341888428, "global_step": 29061, "epoch": 691} {"train_loss": -5.4741291999816895, "global_step": 29062, "epoch": 691} {"train_loss": -5.439198289598737, "global_step": 29063, "epoch": 691, "val_loss": 75737.1875} {"train_loss": -5.428597927093506, "global_step": 29064, "epoch": 692} {"train_loss": -5.450953960418701, "global_step": 29065, "epoch": 692} {"train_loss": -5.410375595092773, "global_step": 29066, "epoch": 692} {"train_loss": -5.465339660644531, "global_step": 29067, "epoch": 692} {"train_loss": -5.431448936462402, "global_step": 29068, "epoch": 692} {"train_loss": -5.440825462341309, "global_step": 29069, "epoch": 692} {"train_loss": -5.327662467956543, "global_step": 29070, "epoch": 692} {"train_loss": -5.399859428405762, "global_step": 29071, "epoch": 692} {"train_loss": -5.316105842590332, "global_step": 29072, "epoch": 692} {"train_loss": -5.441147804260254, "global_step": 29073, "epoch": 692} {"train_loss": -5.558967590332031, "global_step": 29074, "epoch": 692} {"train_loss": -5.304193019866943, "global_step": 29075, "epoch": 692} {"train_loss": -5.455313205718994, "global_step": 29076, "epoch": 692} {"train_loss": -5.516452789306641, "global_step": 29077, "epoch": 692} {"train_loss": -5.501284122467041, "global_step": 29078, "epoch": 692} {"train_loss": -5.340390682220459, "global_step": 29079, "epoch": 692} {"train_loss": -5.512826919555664, "global_step": 29080, "epoch": 692} {"train_loss": -5.364438056945801, "global_step": 29081, "epoch": 692} {"train_loss": -5.58266544342041, "global_step": 29082, "epoch": 692} {"train_loss": -5.354269981384277, "global_step": 29083, "epoch": 692} {"train_loss": -5.356539726257324, "global_step": 29084, "epoch": 692} {"train_loss": -5.559976577758789, "global_step": 29085, "epoch": 692} {"train_loss": -5.435496807098389, "global_step": 29086, "epoch": 692} {"train_loss": -5.463075637817383, "global_step": 29087, "epoch": 692} {"train_loss": -5.5233869552612305, "global_step": 29088, "epoch": 692} {"train_loss": -5.398788928985596, "global_step": 29089, "epoch": 692} {"train_loss": -5.442615509033203, "global_step": 29090, "epoch": 692} {"train_loss": -5.502170562744141, "global_step": 29091, "epoch": 692} {"train_loss": -5.409825325012207, "global_step": 29092, "epoch": 692} {"train_loss": -5.488731861114502, "global_step": 29093, "epoch": 692} {"train_loss": -5.5275187492370605, "global_step": 29094, "epoch": 692} {"train_loss": -5.509626388549805, "global_step": 29095, "epoch": 692} {"train_loss": -5.366421699523926, "global_step": 29096, "epoch": 692} {"train_loss": -5.409588813781738, "global_step": 29097, "epoch": 692} {"train_loss": -5.522550582885742, "global_step": 29098, "epoch": 692} {"train_loss": -5.543366432189941, "global_step": 29099, "epoch": 692} {"train_loss": -5.631328582763672, "global_step": 29100, "epoch": 692} {"train_loss": -5.632824897766113, "global_step": 29101, "epoch": 692} {"train_loss": -5.489462852478027, "global_step": 29102, "epoch": 692} {"train_loss": -5.394355773925781, "global_step": 29103, "epoch": 692} {"train_loss": -5.415712356567383, "global_step": 29104, "epoch": 692} {"train_loss": -5.45722314289638, "global_step": 29105, "epoch": 692, "val_loss": 74862.359375} {"train_loss": -5.600659370422363, "global_step": 29106, "epoch": 693} {"train_loss": -5.486664772033691, "global_step": 29107, "epoch": 693} {"train_loss": -5.418424606323242, "global_step": 29108, "epoch": 693} {"train_loss": -5.308077812194824, "global_step": 29109, "epoch": 693} {"train_loss": -5.269108295440674, "global_step": 29110, "epoch": 693} {"train_loss": -5.470163822174072, "global_step": 29111, "epoch": 693} {"train_loss": -5.522136688232422, "global_step": 29112, "epoch": 693} {"train_loss": -5.566728115081787, "global_step": 29113, "epoch": 693} {"train_loss": -5.424272060394287, "global_step": 29114, "epoch": 693} {"train_loss": -5.561723709106445, "global_step": 29115, "epoch": 693} {"train_loss": -5.391697883605957, "global_step": 29116, "epoch": 693} {"train_loss": -5.406824111938477, "global_step": 29117, "epoch": 693} {"train_loss": -5.432437896728516, "global_step": 29118, "epoch": 693} {"train_loss": -5.449828624725342, "global_step": 29119, "epoch": 693} {"train_loss": -5.400752067565918, "global_step": 29120, "epoch": 693} {"train_loss": -5.441788673400879, "global_step": 29121, "epoch": 693} {"train_loss": -5.505511283874512, "global_step": 29122, "epoch": 693} {"train_loss": -5.462543487548828, "global_step": 29123, "epoch": 693} {"train_loss": -5.424844264984131, "global_step": 29124, "epoch": 693} {"train_loss": -5.408233642578125, "global_step": 29125, "epoch": 693} {"train_loss": -5.204730987548828, "global_step": 29126, "epoch": 693} {"train_loss": -5.576606750488281, "global_step": 29127, "epoch": 693} {"train_loss": -5.443368911743164, "global_step": 29128, "epoch": 693} {"train_loss": -5.430845260620117, "global_step": 29129, "epoch": 693} {"train_loss": -5.421642303466797, "global_step": 29130, "epoch": 693} {"train_loss": -5.362288475036621, "global_step": 29131, "epoch": 693} {"train_loss": -5.384776592254639, "global_step": 29132, "epoch": 693} {"train_loss": -5.4904985427856445, "global_step": 29133, "epoch": 693} {"train_loss": -5.320537090301514, "global_step": 29134, "epoch": 693} {"train_loss": -5.412328720092773, "global_step": 29135, "epoch": 693} {"train_loss": -5.433737754821777, "global_step": 29136, "epoch": 693} {"train_loss": -5.364476680755615, "global_step": 29137, "epoch": 693} {"train_loss": -5.447822570800781, "global_step": 29138, "epoch": 693} {"train_loss": -5.3582892417907715, "global_step": 29139, "epoch": 693} {"train_loss": -5.3736701011657715, "global_step": 29140, "epoch": 693} {"train_loss": -5.378120422363281, "global_step": 29141, "epoch": 693} {"train_loss": -5.299310684204102, "global_step": 29142, "epoch": 693} {"train_loss": -5.371676445007324, "global_step": 29143, "epoch": 693} {"train_loss": -5.358370780944824, "global_step": 29144, "epoch": 693} {"train_loss": -5.269906997680664, "global_step": 29145, "epoch": 693} {"train_loss": -5.489971160888672, "global_step": 29146, "epoch": 693} {"train_loss": -5.419932683308919, "global_step": 29147, "epoch": 693, "val_loss": 75194.5859375} {"train_loss": -5.464122772216797, "global_step": 29148, "epoch": 694} {"train_loss": -5.3685126304626465, "global_step": 29149, "epoch": 694} {"train_loss": -5.432748794555664, "global_step": 29150, "epoch": 694} {"train_loss": -5.4344024658203125, "global_step": 29151, "epoch": 694} {"train_loss": -5.4465718269348145, "global_step": 29152, "epoch": 694} {"train_loss": -5.484379291534424, "global_step": 29153, "epoch": 694} {"train_loss": -5.508036136627197, "global_step": 29154, "epoch": 694} {"train_loss": -5.414276123046875, "global_step": 29155, "epoch": 694} {"train_loss": -5.228367805480957, "global_step": 29156, "epoch": 694} {"train_loss": -5.47587776184082, "global_step": 29157, "epoch": 694} {"train_loss": -5.527256011962891, "global_step": 29158, "epoch": 694} {"train_loss": -5.382428169250488, "global_step": 29159, "epoch": 694} {"train_loss": -5.445173263549805, "global_step": 29160, "epoch": 694} {"train_loss": -5.37255859375, "global_step": 29161, "epoch": 694} {"train_loss": -5.558933258056641, "global_step": 29162, "epoch": 694} {"train_loss": -5.4734296798706055, "global_step": 29163, "epoch": 694} {"train_loss": -5.46906042098999, "global_step": 29164, "epoch": 694} {"train_loss": -5.491143226623535, "global_step": 29165, "epoch": 694} {"train_loss": -5.510584831237793, "global_step": 29166, "epoch": 694} {"train_loss": -5.492542743682861, "global_step": 29167, "epoch": 694} {"train_loss": -5.54221248626709, "global_step": 29168, "epoch": 694} {"train_loss": -5.5080952644348145, "global_step": 29169, "epoch": 694} {"train_loss": -5.503814220428467, "global_step": 29170, "epoch": 694} {"train_loss": -5.416901111602783, "global_step": 29171, "epoch": 694} {"train_loss": -5.533539772033691, "global_step": 29172, "epoch": 694} {"train_loss": -5.464012145996094, "global_step": 29173, "epoch": 694} {"train_loss": -5.482488632202148, "global_step": 29174, "epoch": 694} {"train_loss": -5.396294593811035, "global_step": 29175, "epoch": 694} {"train_loss": -5.289915084838867, "global_step": 29176, "epoch": 694} {"train_loss": -5.431215286254883, "global_step": 29177, "epoch": 694} {"train_loss": -5.506597518920898, "global_step": 29178, "epoch": 694} {"train_loss": -5.456042289733887, "global_step": 29179, "epoch": 694} {"train_loss": -5.256336688995361, "global_step": 29180, "epoch": 694} {"train_loss": -5.501928806304932, "global_step": 29181, "epoch": 694} {"train_loss": -5.564919948577881, "global_step": 29182, "epoch": 694} {"train_loss": -5.235195159912109, "global_step": 29183, "epoch": 694} {"train_loss": -5.528236389160156, "global_step": 29184, "epoch": 694} {"train_loss": -5.317811965942383, "global_step": 29185, "epoch": 694} {"train_loss": -5.3291335105896, "global_step": 29186, "epoch": 694} {"train_loss": -5.377109050750732, "global_step": 29187, "epoch": 694} {"train_loss": -5.314593315124512, "global_step": 29188, "epoch": 694} {"train_loss": -5.439826908565703, "global_step": 29189, "epoch": 694, "val_loss": 75314.765625} {"train_loss": -5.312941551208496, "global_step": 29190, "epoch": 695} {"train_loss": -5.502948760986328, "global_step": 29191, "epoch": 695} {"train_loss": -5.532894134521484, "global_step": 29192, "epoch": 695} {"train_loss": -5.416317939758301, "global_step": 29193, "epoch": 695} {"train_loss": -5.523327827453613, "global_step": 29194, "epoch": 695} {"train_loss": -5.5600905418396, "global_step": 29195, "epoch": 695} {"train_loss": -5.386943817138672, "global_step": 29196, "epoch": 695} {"train_loss": -5.388592720031738, "global_step": 29197, "epoch": 695} {"train_loss": -5.465456008911133, "global_step": 29198, "epoch": 695} {"train_loss": -5.466352462768555, "global_step": 29199, "epoch": 695} {"train_loss": -5.474946022033691, "global_step": 29200, "epoch": 695} {"train_loss": -5.371067047119141, "global_step": 29201, "epoch": 695} {"train_loss": -5.505445957183838, "global_step": 29202, "epoch": 695} {"train_loss": -5.399638652801514, "global_step": 29203, "epoch": 695} {"train_loss": -5.474141597747803, "global_step": 29204, "epoch": 695} {"train_loss": -5.473696708679199, "global_step": 29205, "epoch": 695} {"train_loss": -5.2787299156188965, "global_step": 29206, "epoch": 695} {"train_loss": -5.470454216003418, "global_step": 29207, "epoch": 695} {"train_loss": -5.525822639465332, "global_step": 29208, "epoch": 695} {"train_loss": -5.278347969055176, "global_step": 29209, "epoch": 695} {"train_loss": -5.363284587860107, "global_step": 29210, "epoch": 695} {"train_loss": -5.406249046325684, "global_step": 29211, "epoch": 695} {"train_loss": -5.476999282836914, "global_step": 29212, "epoch": 695} {"train_loss": -5.366365432739258, "global_step": 29213, "epoch": 695} {"train_loss": -5.337270736694336, "global_step": 29214, "epoch": 695} {"train_loss": -5.351483345031738, "global_step": 29215, "epoch": 695} {"train_loss": -5.421187400817871, "global_step": 29216, "epoch": 695} {"train_loss": -5.582552909851074, "global_step": 29217, "epoch": 695} {"train_loss": -5.522517204284668, "global_step": 29218, "epoch": 695} {"train_loss": -5.458299160003662, "global_step": 29219, "epoch": 695} {"train_loss": -5.564846992492676, "global_step": 29220, "epoch": 695} {"train_loss": -5.480156898498535, "global_step": 29221, "epoch": 695} {"train_loss": -5.496397018432617, "global_step": 29222, "epoch": 695} {"train_loss": -5.443873405456543, "global_step": 29223, "epoch": 695} {"train_loss": -5.546488285064697, "global_step": 29224, "epoch": 695} {"train_loss": -5.425876617431641, "global_step": 29225, "epoch": 695} {"train_loss": -5.221639633178711, "global_step": 29226, "epoch": 695} {"train_loss": -5.465322971343994, "global_step": 29227, "epoch": 695} {"train_loss": -5.365924835205078, "global_step": 29228, "epoch": 695} {"train_loss": -5.279844760894775, "global_step": 29229, "epoch": 695} {"train_loss": -5.442447662353516, "global_step": 29230, "epoch": 695} {"train_loss": -5.435409137180874, "global_step": 29231, "epoch": 695, "val_loss": 75928.1875} {"train_loss": -5.402472972869873, "global_step": 29232, "epoch": 696} {"train_loss": -5.481388092041016, "global_step": 29233, "epoch": 696} {"train_loss": -5.3480448722839355, "global_step": 29234, "epoch": 696} {"train_loss": -5.441205978393555, "global_step": 29235, "epoch": 696} {"train_loss": -5.289417266845703, "global_step": 29236, "epoch": 696} {"train_loss": -5.528510570526123, "global_step": 29237, "epoch": 696} {"train_loss": -5.377691268920898, "global_step": 29238, "epoch": 696} {"train_loss": -5.3797760009765625, "global_step": 29239, "epoch": 696} {"train_loss": -5.398581504821777, "global_step": 29240, "epoch": 696} {"train_loss": -5.3726677894592285, "global_step": 29241, "epoch": 696} {"train_loss": -5.448004722595215, "global_step": 29242, "epoch": 696} {"train_loss": -5.4726243019104, "global_step": 29243, "epoch": 696} {"train_loss": -5.512923717498779, "global_step": 29244, "epoch": 696} {"train_loss": -5.476049900054932, "global_step": 29245, "epoch": 696} {"train_loss": -5.415066242218018, "global_step": 29246, "epoch": 696} {"train_loss": -5.53305721282959, "global_step": 29247, "epoch": 696} {"train_loss": -5.490054607391357, "global_step": 29248, "epoch": 696} {"train_loss": -5.506625175476074, "global_step": 29249, "epoch": 696} {"train_loss": -5.3418731689453125, "global_step": 29250, "epoch": 696} {"train_loss": -5.460470676422119, "global_step": 29251, "epoch": 696} {"train_loss": -5.4124040603637695, "global_step": 29252, "epoch": 696} {"train_loss": -5.41309928894043, "global_step": 29253, "epoch": 696} {"train_loss": -5.373225688934326, "global_step": 29254, "epoch": 696} {"train_loss": -5.491375923156738, "global_step": 29255, "epoch": 696} {"train_loss": -5.3707685470581055, "global_step": 29256, "epoch": 696} {"train_loss": -5.484616756439209, "global_step": 29257, "epoch": 696} {"train_loss": -5.474552154541016, "global_step": 29258, "epoch": 696} {"train_loss": -5.46489953994751, "global_step": 29259, "epoch": 696} {"train_loss": -5.5111188888549805, "global_step": 29260, "epoch": 696} {"train_loss": -5.390649318695068, "global_step": 29261, "epoch": 696} {"train_loss": -5.489435195922852, "global_step": 29262, "epoch": 696} {"train_loss": -5.5546650886535645, "global_step": 29263, "epoch": 696} {"train_loss": -5.368173599243164, "global_step": 29264, "epoch": 696} {"train_loss": -5.536167144775391, "global_step": 29265, "epoch": 696} {"train_loss": -5.379924774169922, "global_step": 29266, "epoch": 696} {"train_loss": -5.4610490798950195, "global_step": 29267, "epoch": 696} {"train_loss": -5.596926689147949, "global_step": 29268, "epoch": 696} {"train_loss": -5.407256126403809, "global_step": 29269, "epoch": 696} {"train_loss": -5.453486442565918, "global_step": 29270, "epoch": 696} {"train_loss": -5.326721668243408, "global_step": 29271, "epoch": 696} {"train_loss": -5.420195579528809, "global_step": 29272, "epoch": 696} {"train_loss": -5.440313543592181, "global_step": 29273, "epoch": 696, "val_loss": 75171.578125} {"train_loss": -5.447805404663086, "global_step": 29274, "epoch": 697} {"train_loss": -5.460801124572754, "global_step": 29275, "epoch": 697} {"train_loss": -5.535680770874023, "global_step": 29276, "epoch": 697} {"train_loss": -5.450826168060303, "global_step": 29277, "epoch": 697} {"train_loss": -5.493771553039551, "global_step": 29278, "epoch": 697} {"train_loss": -5.602608680725098, "global_step": 29279, "epoch": 697} {"train_loss": -5.514432907104492, "global_step": 29280, "epoch": 697} {"train_loss": -5.518249034881592, "global_step": 29281, "epoch": 697} {"train_loss": -5.528868675231934, "global_step": 29282, "epoch": 697} {"train_loss": -5.478596210479736, "global_step": 29283, "epoch": 697} {"train_loss": -5.403075218200684, "global_step": 29284, "epoch": 697} {"train_loss": -5.442759990692139, "global_step": 29285, "epoch": 697} {"train_loss": -5.5460920333862305, "global_step": 29286, "epoch": 697} {"train_loss": -5.461724281311035, "global_step": 29287, "epoch": 697} {"train_loss": -5.577637672424316, "global_step": 29288, "epoch": 697} {"train_loss": -5.360247611999512, "global_step": 29289, "epoch": 697} {"train_loss": -5.4199347496032715, "global_step": 29290, "epoch": 697} {"train_loss": -5.441427230834961, "global_step": 29291, "epoch": 697} {"train_loss": -5.434446811676025, "global_step": 29292, "epoch": 697} {"train_loss": -5.3019609451293945, "global_step": 29293, "epoch": 697} {"train_loss": -5.578939437866211, "global_step": 29294, "epoch": 697} {"train_loss": -5.458553314208984, "global_step": 29295, "epoch": 697} {"train_loss": -5.364128112792969, "global_step": 29296, "epoch": 697} {"train_loss": -5.409562110900879, "global_step": 29297, "epoch": 697} {"train_loss": -5.599861145019531, "global_step": 29298, "epoch": 697} {"train_loss": -5.461106300354004, "global_step": 29299, "epoch": 697} {"train_loss": -5.48453950881958, "global_step": 29300, "epoch": 697} {"train_loss": -5.326418876647949, "global_step": 29301, "epoch": 697} {"train_loss": -5.415553092956543, "global_step": 29302, "epoch": 697} {"train_loss": -5.51798152923584, "global_step": 29303, "epoch": 697} {"train_loss": -5.436481475830078, "global_step": 29304, "epoch": 697} {"train_loss": -5.408127784729004, "global_step": 29305, "epoch": 697} {"train_loss": -5.591795444488525, "global_step": 29306, "epoch": 697} {"train_loss": -5.374900817871094, "global_step": 29307, "epoch": 697} {"train_loss": -5.441956520080566, "global_step": 29308, "epoch": 697} {"train_loss": -5.395926475524902, "global_step": 29309, "epoch": 697} {"train_loss": -5.501218795776367, "global_step": 29310, "epoch": 697} {"train_loss": -5.499456405639648, "global_step": 29311, "epoch": 697} {"train_loss": -5.426056385040283, "global_step": 29312, "epoch": 697} {"train_loss": -5.469003200531006, "global_step": 29313, "epoch": 697} {"train_loss": -5.411955833435059, "global_step": 29314, "epoch": 697} {"train_loss": -5.4621622903006415, "global_step": 29315, "epoch": 697, "val_loss": 75977.125} {"train_loss": -5.448041915893555, "global_step": 29316, "epoch": 698} {"train_loss": -5.421923637390137, "global_step": 29317, "epoch": 698} {"train_loss": -5.544398307800293, "global_step": 29318, "epoch": 698} {"train_loss": -5.678282737731934, "global_step": 29319, "epoch": 698} {"train_loss": -5.55946683883667, "global_step": 29320, "epoch": 698} {"train_loss": -5.485745429992676, "global_step": 29321, "epoch": 698} {"train_loss": -5.463151931762695, "global_step": 29322, "epoch": 698} {"train_loss": -5.370810508728027, "global_step": 29323, "epoch": 698} {"train_loss": -5.409371376037598, "global_step": 29324, "epoch": 698} {"train_loss": -5.391545295715332, "global_step": 29325, "epoch": 698} {"train_loss": -5.377021789550781, "global_step": 29326, "epoch": 698} {"train_loss": -5.553190231323242, "global_step": 29327, "epoch": 698} {"train_loss": -5.485925674438477, "global_step": 29328, "epoch": 698} {"train_loss": -5.446488380432129, "global_step": 29329, "epoch": 698} {"train_loss": -5.448178768157959, "global_step": 29330, "epoch": 698} {"train_loss": -5.593967914581299, "global_step": 29331, "epoch": 698} {"train_loss": -5.587434768676758, "global_step": 29332, "epoch": 698} {"train_loss": -5.475423812866211, "global_step": 29333, "epoch": 698} {"train_loss": -5.318833827972412, "global_step": 29334, "epoch": 698} {"train_loss": -5.509948253631592, "global_step": 29335, "epoch": 698} {"train_loss": -5.3284101486206055, "global_step": 29336, "epoch": 698} {"train_loss": -5.365416526794434, "global_step": 29337, "epoch": 698} {"train_loss": -5.506007194519043, "global_step": 29338, "epoch": 698} {"train_loss": -5.348395347595215, "global_step": 29339, "epoch": 698} {"train_loss": -5.470585823059082, "global_step": 29340, "epoch": 698} {"train_loss": -5.4885430335998535, "global_step": 29341, "epoch": 698} {"train_loss": -5.386031627655029, "global_step": 29342, "epoch": 698} {"train_loss": -5.416108131408691, "global_step": 29343, "epoch": 698} {"train_loss": -5.515146732330322, "global_step": 29344, "epoch": 698} {"train_loss": -5.395099639892578, "global_step": 29345, "epoch": 698} {"train_loss": -5.407556056976318, "global_step": 29346, "epoch": 698} {"train_loss": -5.4444451332092285, "global_step": 29347, "epoch": 698} {"train_loss": -5.473889350891113, "global_step": 29348, "epoch": 698} {"train_loss": -5.40628719329834, "global_step": 29349, "epoch": 698} {"train_loss": -5.58360481262207, "global_step": 29350, "epoch": 698} {"train_loss": -5.372076988220215, "global_step": 29351, "epoch": 698} {"train_loss": -5.512462615966797, "global_step": 29352, "epoch": 698} {"train_loss": -5.543780326843262, "global_step": 29353, "epoch": 698} {"train_loss": -5.460388660430908, "global_step": 29354, "epoch": 698} {"train_loss": -5.368614673614502, "global_step": 29355, "epoch": 698} {"train_loss": -5.479022979736328, "global_step": 29356, "epoch": 698} {"train_loss": -5.461070038023449, "global_step": 29357, "epoch": 698, "val_loss": 75601.3125} {"train_loss": -5.419602394104004, "global_step": 29358, "epoch": 699} {"train_loss": -5.503880977630615, "global_step": 29359, "epoch": 699} {"train_loss": -5.529779434204102, "global_step": 29360, "epoch": 699} {"train_loss": -5.401108741760254, "global_step": 29361, "epoch": 699} {"train_loss": -5.528512477874756, "global_step": 29362, "epoch": 699} {"train_loss": -5.470904350280762, "global_step": 29363, "epoch": 699} {"train_loss": -5.463615417480469, "global_step": 29364, "epoch": 699} {"train_loss": -5.424952030181885, "global_step": 29365, "epoch": 699} {"train_loss": -5.4747514724731445, "global_step": 29366, "epoch": 699} {"train_loss": -5.451528072357178, "global_step": 29367, "epoch": 699} {"train_loss": -5.540457725524902, "global_step": 29368, "epoch": 699} {"train_loss": -5.473403453826904, "global_step": 29369, "epoch": 699} {"train_loss": -5.480119705200195, "global_step": 29370, "epoch": 699} {"train_loss": -5.563893795013428, "global_step": 29371, "epoch": 699} {"train_loss": -5.432059288024902, "global_step": 29372, "epoch": 699} {"train_loss": -5.32388973236084, "global_step": 29373, "epoch": 699} {"train_loss": -5.477760314941406, "global_step": 29374, "epoch": 699} {"train_loss": -5.533153533935547, "global_step": 29375, "epoch": 699} {"train_loss": -5.393691062927246, "global_step": 29376, "epoch": 699} {"train_loss": -5.5260515213012695, "global_step": 29377, "epoch": 699} {"train_loss": -5.560861587524414, "global_step": 29378, "epoch": 699} {"train_loss": -5.288823127746582, "global_step": 29379, "epoch": 699} {"train_loss": -5.4114179611206055, "global_step": 29380, "epoch": 699} {"train_loss": -5.419774532318115, "global_step": 29381, "epoch": 699} {"train_loss": -5.379727840423584, "global_step": 29382, "epoch": 699} {"train_loss": -5.558719635009766, "global_step": 29383, "epoch": 699} {"train_loss": -5.5432353019714355, "global_step": 29384, "epoch": 699} {"train_loss": -5.382314205169678, "global_step": 29385, "epoch": 699} {"train_loss": -5.487157821655273, "global_step": 29386, "epoch": 699} {"train_loss": -5.400960445404053, "global_step": 29387, "epoch": 699} {"train_loss": -5.377485275268555, "global_step": 29388, "epoch": 699} {"train_loss": -5.471164703369141, "global_step": 29389, "epoch": 699} {"train_loss": -5.311318397521973, "global_step": 29390, "epoch": 699} {"train_loss": -5.463181495666504, "global_step": 29391, "epoch": 699} {"train_loss": -5.515708923339844, "global_step": 29392, "epoch": 699} {"train_loss": -5.438215255737305, "global_step": 29393, "epoch": 699} {"train_loss": -5.505271911621094, "global_step": 29394, "epoch": 699} {"train_loss": -5.276005268096924, "global_step": 29395, "epoch": 699} {"train_loss": -5.456365585327148, "global_step": 29396, "epoch": 699} {"train_loss": -5.513775825500488, "global_step": 29397, "epoch": 699} {"train_loss": -5.450969696044922, "global_step": 29398, "epoch": 699} {"train_loss": -5.456773780641102, "global_step": 29399, "epoch": 699, "val_loss": 75723.1328125} {"train_loss": -5.54077672958374, "global_step": 29400, "epoch": 700} {"train_loss": -5.498441219329834, "global_step": 29401, "epoch": 700} {"train_loss": -5.294880390167236, "global_step": 29402, "epoch": 700} {"train_loss": -5.412060737609863, "global_step": 29403, "epoch": 700} {"train_loss": -5.426573276519775, "global_step": 29404, "epoch": 700} {"train_loss": -5.434961795806885, "global_step": 29405, "epoch": 700} {"train_loss": -5.467130661010742, "global_step": 29406, "epoch": 700} {"train_loss": -5.523448944091797, "global_step": 29407, "epoch": 700} {"train_loss": -5.431205749511719, "global_step": 29408, "epoch": 700} {"train_loss": -5.399569988250732, "global_step": 29409, "epoch": 700} {"train_loss": -5.379847526550293, "global_step": 29410, "epoch": 700} {"train_loss": -5.403494834899902, "global_step": 29411, "epoch": 700} {"train_loss": -5.52919864654541, "global_step": 29412, "epoch": 700} {"train_loss": -5.350254058837891, "global_step": 29413, "epoch": 700} {"train_loss": -5.404233932495117, "global_step": 29414, "epoch": 700} {"train_loss": -5.3891706466674805, "global_step": 29415, "epoch": 700} {"train_loss": -5.414628982543945, "global_step": 29416, "epoch": 700} {"train_loss": -5.544090270996094, "global_step": 29417, "epoch": 700} {"train_loss": -5.401835918426514, "global_step": 29418, "epoch": 700} {"train_loss": -5.281822204589844, "global_step": 29419, "epoch": 700} {"train_loss": -5.473723411560059, "global_step": 29420, "epoch": 700} {"train_loss": -5.3511457443237305, "global_step": 29421, "epoch": 700} {"train_loss": -5.503545761108398, "global_step": 29422, "epoch": 700} {"train_loss": -5.481745719909668, "global_step": 29423, "epoch": 700} {"train_loss": -5.379873752593994, "global_step": 29424, "epoch": 700} {"train_loss": -5.43887996673584, "global_step": 29425, "epoch": 700} {"train_loss": -5.395689487457275, "global_step": 29426, "epoch": 700} {"train_loss": -5.436424255371094, "global_step": 29427, "epoch": 700} {"train_loss": -5.403159141540527, "global_step": 29428, "epoch": 700} {"train_loss": -5.39518404006958, "global_step": 29429, "epoch": 700} {"train_loss": -5.556574821472168, "global_step": 29430, "epoch": 700} {"train_loss": -5.53657341003418, "global_step": 29431, "epoch": 700} {"train_loss": -5.397578239440918, "global_step": 29432, "epoch": 700} {"train_loss": -5.342817306518555, "global_step": 29433, "epoch": 700} {"train_loss": -5.494509220123291, "global_step": 29434, "epoch": 700} {"train_loss": -5.309894561767578, "global_step": 29435, "epoch": 700} {"train_loss": -5.473526954650879, "global_step": 29436, "epoch": 700} {"train_loss": -5.396023750305176, "global_step": 29437, "epoch": 700} {"train_loss": -5.3636016845703125, "global_step": 29438, "epoch": 700} {"train_loss": -5.386575698852539, "global_step": 29439, "epoch": 700} {"train_loss": -5.4636616706848145, "global_step": 29440, "epoch": 700} {"train_loss": -5.42885666801816, "global_step": 29441, "epoch": 700, "train/sim_max_reward_0": 0.4287700079836533, "train/sim_max_reward_1": 0.10946618924369984, "train/sim_max_reward_2": 0.1991416283885956, "train/sim_max_reward_3": 0.3485879526524617, "train/sim_max_reward_4": 0.690195847783713, "train/sim_max_reward_5": 0.5650628359074941, "test/sim_max_reward_4500000": 0.8046023605824123, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.44374818684137207, "test/sim_max_reward_4500003": 0.5352033359346428, "test/sim_max_reward_4500004": 0.3606459880303244, "test/sim_max_reward_4500005": 0.12478492811296969, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.2649842137600164, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.3381551513828707, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.0926828969091831, "test/sim_max_reward_4500012": 0.7807371482022704, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.4298240948894154, "test/sim_max_reward_4500015": 0.2198550698545924, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.5776177536220387, "test/sim_max_reward_4500018": 0.31660181432818774, "test/sim_max_reward_4500019": 0.9722032457343392, "test/sim_max_reward_4500020": 0.4080807146739597, "test/sim_max_reward_4500021": 0.6871832263181608, "test/sim_max_reward_4500022": 0.6799707651401182, "test/sim_max_reward_4500023": 0.8572824447550205, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.1611838577661921, "test/sim_max_reward_4500026": 0.17167799123071267, "test/sim_max_reward_4500027": 0.5998664986863216, "test/sim_max_reward_4500028": 0.6789984850937882, "test/sim_max_reward_4500029": 0.21153387036330681, "test/sim_max_reward_4500030": 0.32347421686131517, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.46748050709224254, "test/sim_max_reward_4500033": 0.30317440941777546, "test/sim_max_reward_4500034": 0.4550096121342776, "test/sim_max_reward_4500035": 0.8796120387884943, "test/sim_max_reward_4500036": 0.4640885328624085, "test/sim_max_reward_4500037": 0.3187701114939806, "test/sim_max_reward_4500038": 0.3283599933057113, "test/sim_max_reward_4500039": 0.3754748305715653, "test/sim_max_reward_4500040": 0.24045877676569652, "test/sim_max_reward_4500041": 0.2364225320059248, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.8437531987873319, "test/sim_max_reward_4500044": 0.11380621119202905, "test/sim_max_reward_4500045": 0.15561452298613362, "test/sim_max_reward_4500046": 0.31655249958913545, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.283815076578676, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.3902040769932696, "test/mean_score": 0.3372654983843919, "val_loss": 74806.3046875} {"train_loss": -5.4584503173828125, "global_step": 29442, "epoch": 701} {"train_loss": -5.553536415100098, "global_step": 29443, "epoch": 701} {"train_loss": -5.257416725158691, "global_step": 29444, "epoch": 701} {"train_loss": -5.491556167602539, "global_step": 29445, "epoch": 701} {"train_loss": -5.499370574951172, "global_step": 29446, "epoch": 701} {"train_loss": -5.565123081207275, "global_step": 29447, "epoch": 701} {"train_loss": -5.4631452560424805, "global_step": 29448, "epoch": 701} {"train_loss": -5.290270805358887, "global_step": 29449, "epoch": 701} {"train_loss": -5.353415489196777, "global_step": 29450, "epoch": 701} {"train_loss": -5.457613945007324, "global_step": 29451, "epoch": 701} {"train_loss": -5.554840564727783, "global_step": 29452, "epoch": 701} {"train_loss": -5.434408187866211, "global_step": 29453, "epoch": 701} {"train_loss": -5.431766986846924, "global_step": 29454, "epoch": 701} {"train_loss": -5.443785667419434, "global_step": 29455, "epoch": 701} {"train_loss": -5.481118202209473, "global_step": 29456, "epoch": 701} {"train_loss": -5.429267883300781, "global_step": 29457, "epoch": 701} {"train_loss": -5.443192481994629, "global_step": 29458, "epoch": 701} {"train_loss": -5.575496196746826, "global_step": 29459, "epoch": 701} {"train_loss": -5.410007476806641, "global_step": 29460, "epoch": 701} {"train_loss": -5.4389801025390625, "global_step": 29461, "epoch": 701} {"train_loss": -5.481380462646484, "global_step": 29462, "epoch": 701} {"train_loss": -5.458444595336914, "global_step": 29463, "epoch": 701} {"train_loss": -5.445413589477539, "global_step": 29464, "epoch": 701} {"train_loss": -5.517056465148926, "global_step": 29465, "epoch": 701} {"train_loss": -5.365660667419434, "global_step": 29466, "epoch": 701} {"train_loss": -5.491178512573242, "global_step": 29467, "epoch": 701} {"train_loss": -5.462655067443848, "global_step": 29468, "epoch": 701} {"train_loss": -5.507236480712891, "global_step": 29469, "epoch": 701} {"train_loss": -5.384692192077637, "global_step": 29470, "epoch": 701} {"train_loss": -5.483376502990723, "global_step": 29471, "epoch": 701} {"train_loss": -5.368250846862793, "global_step": 29472, "epoch": 701} {"train_loss": -5.397691249847412, "global_step": 29473, "epoch": 701} {"train_loss": -5.535594463348389, "global_step": 29474, "epoch": 701} {"train_loss": -5.4956865310668945, "global_step": 29475, "epoch": 701} {"train_loss": -5.585660934448242, "global_step": 29476, "epoch": 701} {"train_loss": -5.400862216949463, "global_step": 29477, "epoch": 701} {"train_loss": -5.387165546417236, "global_step": 29478, "epoch": 701} {"train_loss": -5.541759490966797, "global_step": 29479, "epoch": 701} {"train_loss": -5.402797698974609, "global_step": 29480, "epoch": 701} {"train_loss": -5.404086112976074, "global_step": 29481, "epoch": 701} {"train_loss": -5.3614397048950195, "global_step": 29482, "epoch": 701} {"train_loss": -5.450820604960124, "global_step": 29483, "epoch": 701, "val_loss": 75364.796875} {"train_loss": -5.427954196929932, "global_step": 29484, "epoch": 702} {"train_loss": -5.437717437744141, "global_step": 29485, "epoch": 702} {"train_loss": -5.370746612548828, "global_step": 29486, "epoch": 702} {"train_loss": -5.579037666320801, "global_step": 29487, "epoch": 702} {"train_loss": -5.413537979125977, "global_step": 29488, "epoch": 702} {"train_loss": -5.416495323181152, "global_step": 29489, "epoch": 702} {"train_loss": -5.537283897399902, "global_step": 29490, "epoch": 702} {"train_loss": -5.494280815124512, "global_step": 29491, "epoch": 702} {"train_loss": -5.410070896148682, "global_step": 29492, "epoch": 702} {"train_loss": -5.518434524536133, "global_step": 29493, "epoch": 702} {"train_loss": -5.429830074310303, "global_step": 29494, "epoch": 702} {"train_loss": -5.50054407119751, "global_step": 29495, "epoch": 702} {"train_loss": -5.391139507293701, "global_step": 29496, "epoch": 702} {"train_loss": -5.4190778732299805, "global_step": 29497, "epoch": 702} {"train_loss": -5.53632926940918, "global_step": 29498, "epoch": 702} {"train_loss": -5.508481979370117, "global_step": 29499, "epoch": 702} {"train_loss": -5.52590274810791, "global_step": 29500, "epoch": 702} {"train_loss": -5.444577693939209, "global_step": 29501, "epoch": 702} {"train_loss": -5.482118606567383, "global_step": 29502, "epoch": 702} {"train_loss": -5.425666809082031, "global_step": 29503, "epoch": 702} {"train_loss": -5.396289825439453, "global_step": 29504, "epoch": 702} {"train_loss": -5.305819511413574, "global_step": 29505, "epoch": 702} {"train_loss": -5.576706409454346, "global_step": 29506, "epoch": 702} {"train_loss": -5.4345622062683105, "global_step": 29507, "epoch": 702} {"train_loss": -5.43369197845459, "global_step": 29508, "epoch": 702} {"train_loss": -5.363261699676514, "global_step": 29509, "epoch": 702} {"train_loss": -5.486800193786621, "global_step": 29510, "epoch": 702} {"train_loss": -5.380598545074463, "global_step": 29511, "epoch": 702} {"train_loss": -5.381941795349121, "global_step": 29512, "epoch": 702} {"train_loss": -5.518911361694336, "global_step": 29513, "epoch": 702} {"train_loss": -5.398550510406494, "global_step": 29514, "epoch": 702} {"train_loss": -5.337587356567383, "global_step": 29515, "epoch": 702} {"train_loss": -5.410525321960449, "global_step": 29516, "epoch": 702} {"train_loss": -5.467429161071777, "global_step": 29517, "epoch": 702} {"train_loss": -5.416506767272949, "global_step": 29518, "epoch": 702} {"train_loss": -5.392793655395508, "global_step": 29519, "epoch": 702} {"train_loss": -5.354517936706543, "global_step": 29520, "epoch": 702} {"train_loss": -5.437743663787842, "global_step": 29521, "epoch": 702} {"train_loss": -5.499768257141113, "global_step": 29522, "epoch": 702} {"train_loss": -5.528318405151367, "global_step": 29523, "epoch": 702} {"train_loss": -5.319103240966797, "global_step": 29524, "epoch": 702} {"train_loss": -5.442156905219669, "global_step": 29525, "epoch": 702, "val_loss": 75419.265625} {"train_loss": -5.493556499481201, "global_step": 29526, "epoch": 703} {"train_loss": -5.5078654289245605, "global_step": 29527, "epoch": 703} {"train_loss": -5.513454437255859, "global_step": 29528, "epoch": 703} {"train_loss": -5.3710455894470215, "global_step": 29529, "epoch": 703} {"train_loss": -5.391217231750488, "global_step": 29530, "epoch": 703} {"train_loss": -5.306268692016602, "global_step": 29531, "epoch": 703} {"train_loss": -5.48574161529541, "global_step": 29532, "epoch": 703} {"train_loss": -5.3747758865356445, "global_step": 29533, "epoch": 703} {"train_loss": -5.3463134765625, "global_step": 29534, "epoch": 703} {"train_loss": -5.372951507568359, "global_step": 29535, "epoch": 703} {"train_loss": -5.424765110015869, "global_step": 29536, "epoch": 703} {"train_loss": -5.631386756896973, "global_step": 29537, "epoch": 703} {"train_loss": -5.35883903503418, "global_step": 29538, "epoch": 703} {"train_loss": -5.554325103759766, "global_step": 29539, "epoch": 703} {"train_loss": -5.425346851348877, "global_step": 29540, "epoch": 703} {"train_loss": -5.422521591186523, "global_step": 29541, "epoch": 703} {"train_loss": -5.482961654663086, "global_step": 29542, "epoch": 703} {"train_loss": -5.425721168518066, "global_step": 29543, "epoch": 703} {"train_loss": -5.478872776031494, "global_step": 29544, "epoch": 703} {"train_loss": -5.521340370178223, "global_step": 29545, "epoch": 703} {"train_loss": -5.408424377441406, "global_step": 29546, "epoch": 703} {"train_loss": -5.49727201461792, "global_step": 29547, "epoch": 703} {"train_loss": -5.514280319213867, "global_step": 29548, "epoch": 703} {"train_loss": -5.512550354003906, "global_step": 29549, "epoch": 703} {"train_loss": -5.458444595336914, "global_step": 29550, "epoch": 703} {"train_loss": -5.59094762802124, "global_step": 29551, "epoch": 703} {"train_loss": -5.398118019104004, "global_step": 29552, "epoch": 703} {"train_loss": -5.43062686920166, "global_step": 29553, "epoch": 703} {"train_loss": -5.455167770385742, "global_step": 29554, "epoch": 703} {"train_loss": -5.51214075088501, "global_step": 29555, "epoch": 703} {"train_loss": -5.542768955230713, "global_step": 29556, "epoch": 703} {"train_loss": -5.619958877563477, "global_step": 29557, "epoch": 703} {"train_loss": -5.53007698059082, "global_step": 29558, "epoch": 703} {"train_loss": -5.416118144989014, "global_step": 29559, "epoch": 703} {"train_loss": -5.410540580749512, "global_step": 29560, "epoch": 703} {"train_loss": -5.595431327819824, "global_step": 29561, "epoch": 703} {"train_loss": -5.472723960876465, "global_step": 29562, "epoch": 703} {"train_loss": -5.390793800354004, "global_step": 29563, "epoch": 703} {"train_loss": -5.445624351501465, "global_step": 29564, "epoch": 703} {"train_loss": -5.5275163650512695, "global_step": 29565, "epoch": 703} {"train_loss": -5.366683006286621, "global_step": 29566, "epoch": 703} {"train_loss": -5.4658564158848355, "global_step": 29567, "epoch": 703, "val_loss": 74788.9921875} {"train_loss": -5.514252662658691, "global_step": 29568, "epoch": 704} {"train_loss": -5.457056999206543, "global_step": 29569, "epoch": 704} {"train_loss": -5.498382568359375, "global_step": 29570, "epoch": 704} {"train_loss": -5.477167129516602, "global_step": 29571, "epoch": 704} {"train_loss": -5.346118927001953, "global_step": 29572, "epoch": 704} {"train_loss": -5.489187240600586, "global_step": 29573, "epoch": 704} {"train_loss": -5.532015800476074, "global_step": 29574, "epoch": 704} {"train_loss": -5.426860809326172, "global_step": 29575, "epoch": 704} {"train_loss": -5.588953971862793, "global_step": 29576, "epoch": 704} {"train_loss": -5.385495185852051, "global_step": 29577, "epoch": 704} {"train_loss": -5.475497245788574, "global_step": 29578, "epoch": 704} {"train_loss": -5.4882049560546875, "global_step": 29579, "epoch": 704} {"train_loss": -5.385979652404785, "global_step": 29580, "epoch": 704} {"train_loss": -5.445471286773682, "global_step": 29581, "epoch": 704} {"train_loss": -5.349321365356445, "global_step": 29582, "epoch": 704} {"train_loss": -5.530717849731445, "global_step": 29583, "epoch": 704} {"train_loss": -5.382831573486328, "global_step": 29584, "epoch": 704} {"train_loss": -5.576816558837891, "global_step": 29585, "epoch": 704} {"train_loss": -5.4687371253967285, "global_step": 29586, "epoch": 704} {"train_loss": -5.518514633178711, "global_step": 29587, "epoch": 704} {"train_loss": -5.504497528076172, "global_step": 29588, "epoch": 704} {"train_loss": -5.573853492736816, "global_step": 29589, "epoch": 704} {"train_loss": -5.475521087646484, "global_step": 29590, "epoch": 704} {"train_loss": -5.472614765167236, "global_step": 29591, "epoch": 704} {"train_loss": -5.607410907745361, "global_step": 29592, "epoch": 704} {"train_loss": -5.553421974182129, "global_step": 29593, "epoch": 704} {"train_loss": -5.506521224975586, "global_step": 29594, "epoch": 704} {"train_loss": -5.444530487060547, "global_step": 29595, "epoch": 704} {"train_loss": -5.414782524108887, "global_step": 29596, "epoch": 704} {"train_loss": -5.575249671936035, "global_step": 29597, "epoch": 704} {"train_loss": -5.418072700500488, "global_step": 29598, "epoch": 704} {"train_loss": -5.463250160217285, "global_step": 29599, "epoch": 704} {"train_loss": -5.315276145935059, "global_step": 29600, "epoch": 704} {"train_loss": -5.423089981079102, "global_step": 29601, "epoch": 704} {"train_loss": -5.339944839477539, "global_step": 29602, "epoch": 704} {"train_loss": -5.368915557861328, "global_step": 29603, "epoch": 704} {"train_loss": -5.465472221374512, "global_step": 29604, "epoch": 704} {"train_loss": -5.397367000579834, "global_step": 29605, "epoch": 704} {"train_loss": -5.323386192321777, "global_step": 29606, "epoch": 704} {"train_loss": -5.36909294128418, "global_step": 29607, "epoch": 704} {"train_loss": -5.407135486602783, "global_step": 29608, "epoch": 704} {"train_loss": -5.458815779004778, "global_step": 29609, "epoch": 704, "val_loss": 75607.625} {"train_loss": -5.2862091064453125, "global_step": 29610, "epoch": 705} {"train_loss": -5.558755874633789, "global_step": 29611, "epoch": 705} {"train_loss": -5.432486534118652, "global_step": 29612, "epoch": 705} {"train_loss": -5.350684642791748, "global_step": 29613, "epoch": 705} {"train_loss": -5.59196138381958, "global_step": 29614, "epoch": 705} {"train_loss": -5.461803436279297, "global_step": 29615, "epoch": 705} {"train_loss": -5.443934440612793, "global_step": 29616, "epoch": 705} {"train_loss": -5.432826995849609, "global_step": 29617, "epoch": 705} {"train_loss": -5.420602798461914, "global_step": 29618, "epoch": 705} {"train_loss": -5.565749645233154, "global_step": 29619, "epoch": 705} {"train_loss": -5.453263759613037, "global_step": 29620, "epoch": 705} {"train_loss": -5.5440568923950195, "global_step": 29621, "epoch": 705} {"train_loss": -5.597017288208008, "global_step": 29622, "epoch": 705} {"train_loss": -5.404840469360352, "global_step": 29623, "epoch": 705} {"train_loss": -5.566025733947754, "global_step": 29624, "epoch": 705} {"train_loss": -5.3603434562683105, "global_step": 29625, "epoch": 705} {"train_loss": -5.4018425941467285, "global_step": 29626, "epoch": 705} {"train_loss": -5.396227836608887, "global_step": 29627, "epoch": 705} {"train_loss": -5.371008396148682, "global_step": 29628, "epoch": 705} {"train_loss": -5.4621686935424805, "global_step": 29629, "epoch": 705} {"train_loss": -5.509514808654785, "global_step": 29630, "epoch": 705} {"train_loss": -5.327303886413574, "global_step": 29631, "epoch": 705} {"train_loss": -5.418573379516602, "global_step": 29632, "epoch": 705} {"train_loss": -5.411420822143555, "global_step": 29633, "epoch": 705} {"train_loss": -5.333804130554199, "global_step": 29634, "epoch": 705} {"train_loss": -5.557701110839844, "global_step": 29635, "epoch": 705} {"train_loss": -5.484796524047852, "global_step": 29636, "epoch": 705} {"train_loss": -5.307125091552734, "global_step": 29637, "epoch": 705} {"train_loss": -5.42955207824707, "global_step": 29638, "epoch": 705} {"train_loss": -5.540277481079102, "global_step": 29639, "epoch": 705} {"train_loss": -5.379294395446777, "global_step": 29640, "epoch": 705} {"train_loss": -5.404699325561523, "global_step": 29641, "epoch": 705} {"train_loss": -5.40015983581543, "global_step": 29642, "epoch": 705} {"train_loss": -5.50930118560791, "global_step": 29643, "epoch": 705} {"train_loss": -5.566884994506836, "global_step": 29644, "epoch": 705} {"train_loss": -5.540227890014648, "global_step": 29645, "epoch": 705} {"train_loss": -5.457241058349609, "global_step": 29646, "epoch": 705} {"train_loss": -5.515255928039551, "global_step": 29647, "epoch": 705} {"train_loss": -5.430549621582031, "global_step": 29648, "epoch": 705} {"train_loss": -5.494061470031738, "global_step": 29649, "epoch": 705} {"train_loss": -5.470947742462158, "global_step": 29650, "epoch": 705} {"train_loss": -5.451492207390921, "global_step": 29651, "epoch": 705, "val_loss": 75372.0859375} {"train_loss": -5.405673503875732, "global_step": 29652, "epoch": 706} {"train_loss": -5.421913146972656, "global_step": 29653, "epoch": 706} {"train_loss": -5.473023414611816, "global_step": 29654, "epoch": 706} {"train_loss": -5.459047317504883, "global_step": 29655, "epoch": 706} {"train_loss": -5.551490783691406, "global_step": 29656, "epoch": 706} {"train_loss": -5.35180139541626, "global_step": 29657, "epoch": 706} {"train_loss": -5.468988418579102, "global_step": 29658, "epoch": 706} {"train_loss": -5.306179046630859, "global_step": 29659, "epoch": 706} {"train_loss": -5.339446544647217, "global_step": 29660, "epoch": 706} {"train_loss": -5.415622711181641, "global_step": 29661, "epoch": 706} {"train_loss": -5.390097618103027, "global_step": 29662, "epoch": 706} {"train_loss": -5.40877628326416, "global_step": 29663, "epoch": 706} {"train_loss": -5.378172397613525, "global_step": 29664, "epoch": 706} {"train_loss": -5.372450351715088, "global_step": 29665, "epoch": 706} {"train_loss": -5.4721879959106445, "global_step": 29666, "epoch": 706} {"train_loss": -5.294356346130371, "global_step": 29667, "epoch": 706} {"train_loss": -5.485417366027832, "global_step": 29668, "epoch": 706} {"train_loss": -5.498732566833496, "global_step": 29669, "epoch": 706} {"train_loss": -5.425379276275635, "global_step": 29670, "epoch": 706} {"train_loss": -5.3114848136901855, "global_step": 29671, "epoch": 706} {"train_loss": -5.526350021362305, "global_step": 29672, "epoch": 706} {"train_loss": -5.470741271972656, "global_step": 29673, "epoch": 706} {"train_loss": -5.387941360473633, "global_step": 29674, "epoch": 706} {"train_loss": -5.3149333000183105, "global_step": 29675, "epoch": 706} {"train_loss": -5.448261737823486, "global_step": 29676, "epoch": 706} {"train_loss": -5.292027473449707, "global_step": 29677, "epoch": 706} {"train_loss": -5.365548610687256, "global_step": 29678, "epoch": 706} {"train_loss": -5.582324981689453, "global_step": 29679, "epoch": 706} {"train_loss": -5.450900077819824, "global_step": 29680, "epoch": 706} {"train_loss": -5.4928131103515625, "global_step": 29681, "epoch": 706} {"train_loss": -5.419397830963135, "global_step": 29682, "epoch": 706} {"train_loss": -5.4966888427734375, "global_step": 29683, "epoch": 706} {"train_loss": -5.479270935058594, "global_step": 29684, "epoch": 706} {"train_loss": -5.419044494628906, "global_step": 29685, "epoch": 706} {"train_loss": -5.432734966278076, "global_step": 29686, "epoch": 706} {"train_loss": -5.332892894744873, "global_step": 29687, "epoch": 706} {"train_loss": -5.455238342285156, "global_step": 29688, "epoch": 706} {"train_loss": -5.356110572814941, "global_step": 29689, "epoch": 706} {"train_loss": -5.3896942138671875, "global_step": 29690, "epoch": 706} {"train_loss": -5.547966003417969, "global_step": 29691, "epoch": 706} {"train_loss": -5.436379432678223, "global_step": 29692, "epoch": 706} {"train_loss": -5.42557616460891, "global_step": 29693, "epoch": 706, "val_loss": 75102.0625} {"train_loss": -5.48637580871582, "global_step": 29694, "epoch": 707} {"train_loss": -5.373551368713379, "global_step": 29695, "epoch": 707} {"train_loss": -5.49583625793457, "global_step": 29696, "epoch": 707} {"train_loss": -5.407599925994873, "global_step": 29697, "epoch": 707} {"train_loss": -5.472811698913574, "global_step": 29698, "epoch": 707} {"train_loss": -5.440300941467285, "global_step": 29699, "epoch": 707} {"train_loss": -5.282778263092041, "global_step": 29700, "epoch": 707} {"train_loss": -5.5193891525268555, "global_step": 29701, "epoch": 707} {"train_loss": -5.434837818145752, "global_step": 29702, "epoch": 707} {"train_loss": -5.315031051635742, "global_step": 29703, "epoch": 707} {"train_loss": -5.382445812225342, "global_step": 29704, "epoch": 707} {"train_loss": -5.454917907714844, "global_step": 29705, "epoch": 707} {"train_loss": -5.527700424194336, "global_step": 29706, "epoch": 707} {"train_loss": -5.448538780212402, "global_step": 29707, "epoch": 707} {"train_loss": -5.400596618652344, "global_step": 29708, "epoch": 707} {"train_loss": -5.491057395935059, "global_step": 29709, "epoch": 707} {"train_loss": -5.511235237121582, "global_step": 29710, "epoch": 707} {"train_loss": -5.439356803894043, "global_step": 29711, "epoch": 707} {"train_loss": -5.467190742492676, "global_step": 29712, "epoch": 707} {"train_loss": -5.574518203735352, "global_step": 29713, "epoch": 707} {"train_loss": -5.618913650512695, "global_step": 29714, "epoch": 707} {"train_loss": -5.427419185638428, "global_step": 29715, "epoch": 707} {"train_loss": -5.461752891540527, "global_step": 29716, "epoch": 707} {"train_loss": -5.5995612144470215, "global_step": 29717, "epoch": 707} {"train_loss": -5.449120044708252, "global_step": 29718, "epoch": 707} {"train_loss": -5.367117881774902, "global_step": 29719, "epoch": 707} {"train_loss": -5.432624340057373, "global_step": 29720, "epoch": 707} {"train_loss": -5.444528102874756, "global_step": 29721, "epoch": 707} {"train_loss": -5.600775718688965, "global_step": 29722, "epoch": 707} {"train_loss": -5.460492134094238, "global_step": 29723, "epoch": 707} {"train_loss": -5.520451545715332, "global_step": 29724, "epoch": 707} {"train_loss": -5.450010776519775, "global_step": 29725, "epoch": 707} {"train_loss": -5.458244323730469, "global_step": 29726, "epoch": 707} {"train_loss": -5.504288673400879, "global_step": 29727, "epoch": 707} {"train_loss": -5.385097503662109, "global_step": 29728, "epoch": 707} {"train_loss": -5.432678699493408, "global_step": 29729, "epoch": 707} {"train_loss": -5.528201103210449, "global_step": 29730, "epoch": 707} {"train_loss": -5.376772403717041, "global_step": 29731, "epoch": 707} {"train_loss": -5.562435150146484, "global_step": 29732, "epoch": 707} {"train_loss": -5.412834167480469, "global_step": 29733, "epoch": 707} {"train_loss": -5.495018005371094, "global_step": 29734, "epoch": 707} {"train_loss": -5.459758826664516, "global_step": 29735, "epoch": 707, "val_loss": 75043.109375} {"train_loss": -5.434177398681641, "global_step": 29736, "epoch": 708} {"train_loss": -5.554906845092773, "global_step": 29737, "epoch": 708} {"train_loss": -5.402505397796631, "global_step": 29738, "epoch": 708} {"train_loss": -5.494738578796387, "global_step": 29739, "epoch": 708} {"train_loss": -5.463648796081543, "global_step": 29740, "epoch": 708} {"train_loss": -5.465993881225586, "global_step": 29741, "epoch": 708} {"train_loss": -5.546441078186035, "global_step": 29742, "epoch": 708} {"train_loss": -5.333657264709473, "global_step": 29743, "epoch": 708} {"train_loss": -5.5019683837890625, "global_step": 29744, "epoch": 708} {"train_loss": -5.466516017913818, "global_step": 29745, "epoch": 708} {"train_loss": -5.614545822143555, "global_step": 29746, "epoch": 708} {"train_loss": -5.39610481262207, "global_step": 29747, "epoch": 708} {"train_loss": -5.441484451293945, "global_step": 29748, "epoch": 708} {"train_loss": -5.502548694610596, "global_step": 29749, "epoch": 708} {"train_loss": -5.506621360778809, "global_step": 29750, "epoch": 708} {"train_loss": -5.55240535736084, "global_step": 29751, "epoch": 708} {"train_loss": -5.393322467803955, "global_step": 29752, "epoch": 708} {"train_loss": -5.3910136222839355, "global_step": 29753, "epoch": 708} {"train_loss": -5.494786262512207, "global_step": 29754, "epoch": 708} {"train_loss": -5.406108856201172, "global_step": 29755, "epoch": 708} {"train_loss": -5.433335781097412, "global_step": 29756, "epoch": 708} {"train_loss": -5.476907730102539, "global_step": 29757, "epoch": 708} {"train_loss": -5.410238265991211, "global_step": 29758, "epoch": 708} {"train_loss": -5.4273505210876465, "global_step": 29759, "epoch": 708} {"train_loss": -5.580887794494629, "global_step": 29760, "epoch": 708} {"train_loss": -5.478972911834717, "global_step": 29761, "epoch": 708} {"train_loss": -5.457935333251953, "global_step": 29762, "epoch": 708} {"train_loss": -5.451451301574707, "global_step": 29763, "epoch": 708} {"train_loss": -5.351061820983887, "global_step": 29764, "epoch": 708} {"train_loss": -5.351889610290527, "global_step": 29765, "epoch": 708} {"train_loss": -5.3977952003479, "global_step": 29766, "epoch": 708} {"train_loss": -5.5523576736450195, "global_step": 29767, "epoch": 708} {"train_loss": -5.44158935546875, "global_step": 29768, "epoch": 708} {"train_loss": -5.438207149505615, "global_step": 29769, "epoch": 708} {"train_loss": -5.488512992858887, "global_step": 29770, "epoch": 708} {"train_loss": -5.463100910186768, "global_step": 29771, "epoch": 708} {"train_loss": -5.547329425811768, "global_step": 29772, "epoch": 708} {"train_loss": -5.47229528427124, "global_step": 29773, "epoch": 708} {"train_loss": -5.347186088562012, "global_step": 29774, "epoch": 708} {"train_loss": -5.457806587219238, "global_step": 29775, "epoch": 708} {"train_loss": -5.435116291046143, "global_step": 29776, "epoch": 708} {"train_loss": -5.459613709222703, "global_step": 29777, "epoch": 708, "val_loss": 75151.7421875} {"train_loss": -5.567998886108398, "global_step": 29778, "epoch": 709} {"train_loss": -5.6171770095825195, "global_step": 29779, "epoch": 709} {"train_loss": -5.438830375671387, "global_step": 29780, "epoch": 709} {"train_loss": -5.449380874633789, "global_step": 29781, "epoch": 709} {"train_loss": -5.430276870727539, "global_step": 29782, "epoch": 709} {"train_loss": -5.391627788543701, "global_step": 29783, "epoch": 709} {"train_loss": -5.5356550216674805, "global_step": 29784, "epoch": 709} {"train_loss": -5.349002361297607, "global_step": 29785, "epoch": 709} {"train_loss": -5.462769508361816, "global_step": 29786, "epoch": 709} {"train_loss": -5.4041748046875, "global_step": 29787, "epoch": 709} {"train_loss": -5.538269996643066, "global_step": 29788, "epoch": 709} {"train_loss": -5.526646137237549, "global_step": 29789, "epoch": 709} {"train_loss": -5.580912113189697, "global_step": 29790, "epoch": 709} {"train_loss": -5.505494117736816, "global_step": 29791, "epoch": 709} {"train_loss": -5.633573532104492, "global_step": 29792, "epoch": 709} {"train_loss": -5.452936172485352, "global_step": 29793, "epoch": 709} {"train_loss": -5.562663555145264, "global_step": 29794, "epoch": 709} {"train_loss": -5.443911552429199, "global_step": 29795, "epoch": 709} {"train_loss": -5.506237983703613, "global_step": 29796, "epoch": 709} {"train_loss": -5.508078575134277, "global_step": 29797, "epoch": 709} {"train_loss": -5.464634895324707, "global_step": 29798, "epoch": 709} {"train_loss": -5.5219879150390625, "global_step": 29799, "epoch": 709} {"train_loss": -5.482963562011719, "global_step": 29800, "epoch": 709} {"train_loss": -5.539389133453369, "global_step": 29801, "epoch": 709} {"train_loss": -5.52699089050293, "global_step": 29802, "epoch": 709} {"train_loss": -5.444977283477783, "global_step": 29803, "epoch": 709} {"train_loss": -5.3688530921936035, "global_step": 29804, "epoch": 709} {"train_loss": -5.484200477600098, "global_step": 29805, "epoch": 709} {"train_loss": -5.502384185791016, "global_step": 29806, "epoch": 709} {"train_loss": -5.432589054107666, "global_step": 29807, "epoch": 709} {"train_loss": -5.420891284942627, "global_step": 29808, "epoch": 709} {"train_loss": -5.544978618621826, "global_step": 29809, "epoch": 709} {"train_loss": -5.392186164855957, "global_step": 29810, "epoch": 709} {"train_loss": -5.387091636657715, "global_step": 29811, "epoch": 709} {"train_loss": -5.447000026702881, "global_step": 29812, "epoch": 709} {"train_loss": -5.4206414222717285, "global_step": 29813, "epoch": 709} {"train_loss": -5.5053253173828125, "global_step": 29814, "epoch": 709} {"train_loss": -5.464641094207764, "global_step": 29815, "epoch": 709} {"train_loss": -5.610576629638672, "global_step": 29816, "epoch": 709} {"train_loss": -5.417097568511963, "global_step": 29817, "epoch": 709} {"train_loss": -5.346442222595215, "global_step": 29818, "epoch": 709} {"train_loss": -5.478373118809292, "global_step": 29819, "epoch": 709, "val_loss": 75219.0859375} {"train_loss": -5.381183624267578, "global_step": 29820, "epoch": 710} {"train_loss": -5.354381561279297, "global_step": 29821, "epoch": 710} {"train_loss": -5.544356346130371, "global_step": 29822, "epoch": 710} {"train_loss": -5.389146327972412, "global_step": 29823, "epoch": 710} {"train_loss": -5.521881103515625, "global_step": 29824, "epoch": 710} {"train_loss": -5.457772254943848, "global_step": 29825, "epoch": 710} {"train_loss": -5.4571099281311035, "global_step": 29826, "epoch": 710} {"train_loss": -5.539979934692383, "global_step": 29827, "epoch": 710} {"train_loss": -5.566868782043457, "global_step": 29828, "epoch": 710} {"train_loss": -5.384941577911377, "global_step": 29829, "epoch": 710} {"train_loss": -5.486097812652588, "global_step": 29830, "epoch": 710} {"train_loss": -5.406101226806641, "global_step": 29831, "epoch": 710} {"train_loss": -5.4304399490356445, "global_step": 29832, "epoch": 710} {"train_loss": -5.274652481079102, "global_step": 29833, "epoch": 710} {"train_loss": -5.556070327758789, "global_step": 29834, "epoch": 710} {"train_loss": -5.417938709259033, "global_step": 29835, "epoch": 710} {"train_loss": -5.337162494659424, "global_step": 29836, "epoch": 710} {"train_loss": -5.470876693725586, "global_step": 29837, "epoch": 710} {"train_loss": -5.376482963562012, "global_step": 29838, "epoch": 710} {"train_loss": -5.552457332611084, "global_step": 29839, "epoch": 710} {"train_loss": -5.53085994720459, "global_step": 29840, "epoch": 710} {"train_loss": -5.575048923492432, "global_step": 29841, "epoch": 710} {"train_loss": -5.439703464508057, "global_step": 29842, "epoch": 710} {"train_loss": -5.528825759887695, "global_step": 29843, "epoch": 710} {"train_loss": -5.463853359222412, "global_step": 29844, "epoch": 710} {"train_loss": -5.429634094238281, "global_step": 29845, "epoch": 710} {"train_loss": -5.541995048522949, "global_step": 29846, "epoch": 710} {"train_loss": -5.477548122406006, "global_step": 29847, "epoch": 710} {"train_loss": -5.518266677856445, "global_step": 29848, "epoch": 710} {"train_loss": -5.586561679840088, "global_step": 29849, "epoch": 710} {"train_loss": -5.337888717651367, "global_step": 29850, "epoch": 710} {"train_loss": -5.3011322021484375, "global_step": 29851, "epoch": 710} {"train_loss": -5.568756580352783, "global_step": 29852, "epoch": 710} {"train_loss": -5.408273220062256, "global_step": 29853, "epoch": 710} {"train_loss": -5.575170516967773, "global_step": 29854, "epoch": 710} {"train_loss": -5.546994209289551, "global_step": 29855, "epoch": 710} {"train_loss": -5.411921501159668, "global_step": 29856, "epoch": 710} {"train_loss": -5.471184730529785, "global_step": 29857, "epoch": 710} {"train_loss": -5.580047607421875, "global_step": 29858, "epoch": 710} {"train_loss": -5.479412078857422, "global_step": 29859, "epoch": 710} {"train_loss": -5.392691135406494, "global_step": 29860, "epoch": 710} {"train_loss": -5.464571373803275, "global_step": 29861, "epoch": 710, "val_loss": 74937.21875} {"train_loss": -5.506735801696777, "global_step": 29862, "epoch": 711} {"train_loss": -5.429947853088379, "global_step": 29863, "epoch": 711} {"train_loss": -5.577031135559082, "global_step": 29864, "epoch": 711} {"train_loss": -5.3923540115356445, "global_step": 29865, "epoch": 711} {"train_loss": -5.475603103637695, "global_step": 29866, "epoch": 711} {"train_loss": -5.302995204925537, "global_step": 29867, "epoch": 711} {"train_loss": -5.358783721923828, "global_step": 29868, "epoch": 711} {"train_loss": -5.403501987457275, "global_step": 29869, "epoch": 711} {"train_loss": -5.449444770812988, "global_step": 29870, "epoch": 711} {"train_loss": -5.3277201652526855, "global_step": 29871, "epoch": 711} {"train_loss": -5.407502174377441, "global_step": 29872, "epoch": 711} {"train_loss": -5.494385719299316, "global_step": 29873, "epoch": 711} {"train_loss": -5.348039627075195, "global_step": 29874, "epoch": 711} {"train_loss": -5.4635772705078125, "global_step": 29875, "epoch": 711} {"train_loss": -5.3085479736328125, "global_step": 29876, "epoch": 711} {"train_loss": -5.476684093475342, "global_step": 29877, "epoch": 711} {"train_loss": -5.463702201843262, "global_step": 29878, "epoch": 711} {"train_loss": -5.305106163024902, "global_step": 29879, "epoch": 711} {"train_loss": -5.47176456451416, "global_step": 29880, "epoch": 711} {"train_loss": -5.40046501159668, "global_step": 29881, "epoch": 711} {"train_loss": -5.442134857177734, "global_step": 29882, "epoch": 711} {"train_loss": -5.411949157714844, "global_step": 29883, "epoch": 711} {"train_loss": -5.572354793548584, "global_step": 29884, "epoch": 711} {"train_loss": -5.480066776275635, "global_step": 29885, "epoch": 711} {"train_loss": -5.368804454803467, "global_step": 29886, "epoch": 711} {"train_loss": -5.506570816040039, "global_step": 29887, "epoch": 711} {"train_loss": -5.235374450683594, "global_step": 29888, "epoch": 711} {"train_loss": -5.438145637512207, "global_step": 29889, "epoch": 711} {"train_loss": -5.538279056549072, "global_step": 29890, "epoch": 711} {"train_loss": -5.504006385803223, "global_step": 29891, "epoch": 711} {"train_loss": -5.405582427978516, "global_step": 29892, "epoch": 711} {"train_loss": -5.3506059646606445, "global_step": 29893, "epoch": 711} {"train_loss": -5.542851448059082, "global_step": 29894, "epoch": 711} {"train_loss": -5.439441680908203, "global_step": 29895, "epoch": 711} {"train_loss": -5.481198310852051, "global_step": 29896, "epoch": 711} {"train_loss": -5.358490467071533, "global_step": 29897, "epoch": 711} {"train_loss": -5.45601749420166, "global_step": 29898, "epoch": 711} {"train_loss": -5.482545852661133, "global_step": 29899, "epoch": 711} {"train_loss": -5.507335662841797, "global_step": 29900, "epoch": 711} {"train_loss": -5.493452548980713, "global_step": 29901, "epoch": 711} {"train_loss": -5.583765029907227, "global_step": 29902, "epoch": 711} {"train_loss": -5.440085433778309, "global_step": 29903, "epoch": 711, "val_loss": 74895.9140625} {"train_loss": -5.428049087524414, "global_step": 29904, "epoch": 712} {"train_loss": -5.478140830993652, "global_step": 29905, "epoch": 712} {"train_loss": -5.439146041870117, "global_step": 29906, "epoch": 712} {"train_loss": -5.552548408508301, "global_step": 29907, "epoch": 712} {"train_loss": -5.483779430389404, "global_step": 29908, "epoch": 712} {"train_loss": -5.4328389167785645, "global_step": 29909, "epoch": 712} {"train_loss": -5.424283027648926, "global_step": 29910, "epoch": 712} {"train_loss": -5.622267723083496, "global_step": 29911, "epoch": 712} {"train_loss": -5.497200012207031, "global_step": 29912, "epoch": 712} {"train_loss": -5.47052001953125, "global_step": 29913, "epoch": 712} {"train_loss": -5.358386039733887, "global_step": 29914, "epoch": 712} {"train_loss": -5.39860200881958, "global_step": 29915, "epoch": 712} {"train_loss": -5.297447681427002, "global_step": 29916, "epoch": 712} {"train_loss": -5.373808860778809, "global_step": 29917, "epoch": 712} {"train_loss": -5.344546794891357, "global_step": 29918, "epoch": 712} {"train_loss": -5.416861534118652, "global_step": 29919, "epoch": 712} {"train_loss": -5.510373592376709, "global_step": 29920, "epoch": 712} {"train_loss": -5.406221866607666, "global_step": 29921, "epoch": 712} {"train_loss": -5.355547904968262, "global_step": 29922, "epoch": 712} {"train_loss": -5.421722412109375, "global_step": 29923, "epoch": 712} {"train_loss": -5.393649101257324, "global_step": 29924, "epoch": 712} {"train_loss": -5.4697184562683105, "global_step": 29925, "epoch": 712} {"train_loss": -5.357967376708984, "global_step": 29926, "epoch": 712} {"train_loss": -5.461334705352783, "global_step": 29927, "epoch": 712} {"train_loss": -5.444672584533691, "global_step": 29928, "epoch": 712} {"train_loss": -5.431876182556152, "global_step": 29929, "epoch": 712} {"train_loss": -5.463890075683594, "global_step": 29930, "epoch": 712} {"train_loss": -5.571070194244385, "global_step": 29931, "epoch": 712} {"train_loss": -5.400265216827393, "global_step": 29932, "epoch": 712} {"train_loss": -5.403711318969727, "global_step": 29933, "epoch": 712} {"train_loss": -5.457154273986816, "global_step": 29934, "epoch": 712} {"train_loss": -5.586554050445557, "global_step": 29935, "epoch": 712} {"train_loss": -5.473771095275879, "global_step": 29936, "epoch": 712} {"train_loss": -5.414588928222656, "global_step": 29937, "epoch": 712} {"train_loss": -5.389528751373291, "global_step": 29938, "epoch": 712} {"train_loss": -5.578973293304443, "global_step": 29939, "epoch": 712} {"train_loss": -5.397492408752441, "global_step": 29940, "epoch": 712} {"train_loss": -5.364105701446533, "global_step": 29941, "epoch": 712} {"train_loss": -5.532381057739258, "global_step": 29942, "epoch": 712} {"train_loss": -5.282971382141113, "global_step": 29943, "epoch": 712} {"train_loss": -5.4472761154174805, "global_step": 29944, "epoch": 712} {"train_loss": -5.438973052161081, "global_step": 29945, "epoch": 712, "val_loss": 75559.6953125} {"train_loss": -5.377585411071777, "global_step": 29946, "epoch": 713} {"train_loss": -5.508891582489014, "global_step": 29947, "epoch": 713} {"train_loss": -5.422155380249023, "global_step": 29948, "epoch": 713} {"train_loss": -5.394976615905762, "global_step": 29949, "epoch": 713} {"train_loss": -5.4486494064331055, "global_step": 29950, "epoch": 713} {"train_loss": -5.279270172119141, "global_step": 29951, "epoch": 713} {"train_loss": -5.536087989807129, "global_step": 29952, "epoch": 713} {"train_loss": -5.4217963218688965, "global_step": 29953, "epoch": 713} {"train_loss": -5.576365947723389, "global_step": 29954, "epoch": 713} {"train_loss": -5.4139227867126465, "global_step": 29955, "epoch": 713} {"train_loss": -5.492195129394531, "global_step": 29956, "epoch": 713} {"train_loss": -5.507209777832031, "global_step": 29957, "epoch": 713} {"train_loss": -5.6365766525268555, "global_step": 29958, "epoch": 713} {"train_loss": -5.516804218292236, "global_step": 29959, "epoch": 713} {"train_loss": -5.546751022338867, "global_step": 29960, "epoch": 713} {"train_loss": -5.368991851806641, "global_step": 29961, "epoch": 713} {"train_loss": -5.5909929275512695, "global_step": 29962, "epoch": 713} {"train_loss": -5.529811382293701, "global_step": 29963, "epoch": 713} {"train_loss": -5.393977165222168, "global_step": 29964, "epoch": 713} {"train_loss": -5.385445594787598, "global_step": 29965, "epoch": 713} {"train_loss": -5.4206647872924805, "global_step": 29966, "epoch": 713} {"train_loss": -5.338024139404297, "global_step": 29967, "epoch": 713} {"train_loss": -5.5712127685546875, "global_step": 29968, "epoch": 713} {"train_loss": -5.354155540466309, "global_step": 29969, "epoch": 713} {"train_loss": -5.427975177764893, "global_step": 29970, "epoch": 713} {"train_loss": -5.504095077514648, "global_step": 29971, "epoch": 713} {"train_loss": -5.2410383224487305, "global_step": 29972, "epoch": 713} {"train_loss": -5.469622611999512, "global_step": 29973, "epoch": 713} {"train_loss": -5.244941711425781, "global_step": 29974, "epoch": 713} {"train_loss": -5.3730292320251465, "global_step": 29975, "epoch": 713} {"train_loss": -5.377605438232422, "global_step": 29976, "epoch": 713} {"train_loss": -5.296600818634033, "global_step": 29977, "epoch": 713} {"train_loss": -5.517258644104004, "global_step": 29978, "epoch": 713} {"train_loss": -5.451603889465332, "global_step": 29979, "epoch": 713} {"train_loss": -5.305027484893799, "global_step": 29980, "epoch": 713} {"train_loss": -5.327262878417969, "global_step": 29981, "epoch": 713} {"train_loss": -5.485733985900879, "global_step": 29982, "epoch": 713} {"train_loss": -5.266252040863037, "global_step": 29983, "epoch": 713} {"train_loss": -5.419113636016846, "global_step": 29984, "epoch": 713} {"train_loss": -5.387156963348389, "global_step": 29985, "epoch": 713} {"train_loss": -5.469620704650879, "global_step": 29986, "epoch": 713} {"train_loss": -5.429227431615193, "global_step": 29987, "epoch": 713, "val_loss": 75785.671875} {"train_loss": -5.373885631561279, "global_step": 29988, "epoch": 714} {"train_loss": -5.362320899963379, "global_step": 29989, "epoch": 714} {"train_loss": -5.430333137512207, "global_step": 29990, "epoch": 714} {"train_loss": -5.486161231994629, "global_step": 29991, "epoch": 714} {"train_loss": -5.434009552001953, "global_step": 29992, "epoch": 714} {"train_loss": -5.4494829177856445, "global_step": 29993, "epoch": 714} {"train_loss": -5.463595390319824, "global_step": 29994, "epoch": 714} {"train_loss": -5.415462970733643, "global_step": 29995, "epoch": 714} {"train_loss": -5.457300186157227, "global_step": 29996, "epoch": 714} {"train_loss": -5.493853569030762, "global_step": 29997, "epoch": 714} {"train_loss": -5.377092361450195, "global_step": 29998, "epoch": 714} {"train_loss": -5.4642839431762695, "global_step": 29999, "epoch": 714} {"train_loss": -5.525965690612793, "global_step": 30000, "epoch": 714} {"train_loss": -5.448882102966309, "global_step": 30001, "epoch": 714} {"train_loss": -5.468935966491699, "global_step": 30002, "epoch": 714} {"train_loss": -5.3652238845825195, "global_step": 30003, "epoch": 714} {"train_loss": -5.388659477233887, "global_step": 30004, "epoch": 714} {"train_loss": -5.530060768127441, "global_step": 30005, "epoch": 714} {"train_loss": -5.451298713684082, "global_step": 30006, "epoch": 714} {"train_loss": -5.500396728515625, "global_step": 30007, "epoch": 714} {"train_loss": -5.438279628753662, "global_step": 30008, "epoch": 714} {"train_loss": -5.4406938552856445, "global_step": 30009, "epoch": 714} {"train_loss": -5.360268592834473, "global_step": 30010, "epoch": 714} {"train_loss": -5.500904083251953, "global_step": 30011, "epoch": 714} {"train_loss": -5.211279392242432, "global_step": 30012, "epoch": 714} {"train_loss": -5.451629161834717, "global_step": 30013, "epoch": 714} {"train_loss": -5.508559703826904, "global_step": 30014, "epoch": 714} {"train_loss": -5.577134609222412, "global_step": 30015, "epoch": 714} {"train_loss": -5.496218681335449, "global_step": 30016, "epoch": 714} {"train_loss": -5.466766357421875, "global_step": 30017, "epoch": 714} {"train_loss": -5.457878589630127, "global_step": 30018, "epoch": 714} {"train_loss": -5.621801376342773, "global_step": 30019, "epoch": 714} {"train_loss": -5.494193077087402, "global_step": 30020, "epoch": 714} {"train_loss": -5.497874736785889, "global_step": 30021, "epoch": 714} {"train_loss": -5.45720100402832, "global_step": 30022, "epoch": 714} {"train_loss": -5.468289375305176, "global_step": 30023, "epoch": 714} {"train_loss": -5.430233001708984, "global_step": 30024, "epoch": 714} {"train_loss": -5.381307601928711, "global_step": 30025, "epoch": 714} {"train_loss": -5.350735664367676, "global_step": 30026, "epoch": 714} {"train_loss": -5.440675735473633, "global_step": 30027, "epoch": 714} {"train_loss": -5.37424373626709, "global_step": 30028, "epoch": 714} {"train_loss": -5.447484527315412, "global_step": 30029, "epoch": 714, "val_loss": 75270.921875} {"train_loss": -5.573060989379883, "global_step": 30030, "epoch": 715} {"train_loss": -5.560629844665527, "global_step": 30031, "epoch": 715} {"train_loss": -5.46608829498291, "global_step": 30032, "epoch": 715} {"train_loss": -5.530414581298828, "global_step": 30033, "epoch": 715} {"train_loss": -5.567315101623535, "global_step": 30034, "epoch": 715} {"train_loss": -5.56205940246582, "global_step": 30035, "epoch": 715} {"train_loss": -5.4822492599487305, "global_step": 30036, "epoch": 715} {"train_loss": -5.523130893707275, "global_step": 30037, "epoch": 715} {"train_loss": -5.513992786407471, "global_step": 30038, "epoch": 715} {"train_loss": -5.505992889404297, "global_step": 30039, "epoch": 715} {"train_loss": -5.439156532287598, "global_step": 30040, "epoch": 715} {"train_loss": -5.55606746673584, "global_step": 30041, "epoch": 715} {"train_loss": -5.524645805358887, "global_step": 30042, "epoch": 715} {"train_loss": -5.373164176940918, "global_step": 30043, "epoch": 715} {"train_loss": -5.436941146850586, "global_step": 30044, "epoch": 715} {"train_loss": -5.487331390380859, "global_step": 30045, "epoch": 715} {"train_loss": -5.440906524658203, "global_step": 30046, "epoch": 715} {"train_loss": -5.6037445068359375, "global_step": 30047, "epoch": 715} {"train_loss": -5.4063568115234375, "global_step": 30048, "epoch": 715} {"train_loss": -5.371668338775635, "global_step": 30049, "epoch": 715} {"train_loss": -5.520167350769043, "global_step": 30050, "epoch": 715} {"train_loss": -5.491805076599121, "global_step": 30051, "epoch": 715} {"train_loss": -5.405450820922852, "global_step": 30052, "epoch": 715} {"train_loss": -5.3652873039245605, "global_step": 30053, "epoch": 715} {"train_loss": -5.427401065826416, "global_step": 30054, "epoch": 715} {"train_loss": -5.612473011016846, "global_step": 30055, "epoch": 715} {"train_loss": -5.6100382804870605, "global_step": 30056, "epoch": 715} {"train_loss": -5.402764320373535, "global_step": 30057, "epoch": 715} {"train_loss": -5.547060966491699, "global_step": 30058, "epoch": 715} {"train_loss": -5.2775349617004395, "global_step": 30059, "epoch": 715} {"train_loss": -5.391923904418945, "global_step": 30060, "epoch": 715} {"train_loss": -5.4981513023376465, "global_step": 30061, "epoch": 715} {"train_loss": -5.445736885070801, "global_step": 30062, "epoch": 715} {"train_loss": -5.5876922607421875, "global_step": 30063, "epoch": 715} {"train_loss": -5.458514213562012, "global_step": 30064, "epoch": 715} {"train_loss": -5.464049339294434, "global_step": 30065, "epoch": 715} {"train_loss": -5.456575393676758, "global_step": 30066, "epoch": 715} {"train_loss": -5.504096508026123, "global_step": 30067, "epoch": 715} {"train_loss": -5.629938125610352, "global_step": 30068, "epoch": 715} {"train_loss": -5.271209239959717, "global_step": 30069, "epoch": 715} {"train_loss": -5.528943061828613, "global_step": 30070, "epoch": 715} {"train_loss": -5.486956596374512, "global_step": 30071, "epoch": 715, "val_loss": 75003.421875} {"train_loss": -5.438056945800781, "global_step": 30072, "epoch": 716} {"train_loss": -5.595868110656738, "global_step": 30073, "epoch": 716} {"train_loss": -5.481409072875977, "global_step": 30074, "epoch": 716} {"train_loss": -5.356786727905273, "global_step": 30075, "epoch": 716} {"train_loss": -5.431722164154053, "global_step": 30076, "epoch": 716} {"train_loss": -5.476212501525879, "global_step": 30077, "epoch": 716} {"train_loss": -5.5807695388793945, "global_step": 30078, "epoch": 716} {"train_loss": -5.597236633300781, "global_step": 30079, "epoch": 716} {"train_loss": -5.385195732116699, "global_step": 30080, "epoch": 716} {"train_loss": -5.573746204376221, "global_step": 30081, "epoch": 716} {"train_loss": -5.405360221862793, "global_step": 30082, "epoch": 716} {"train_loss": -5.450788497924805, "global_step": 30083, "epoch": 716} {"train_loss": -5.4793291091918945, "global_step": 30084, "epoch": 716} {"train_loss": -5.326763153076172, "global_step": 30085, "epoch": 716} {"train_loss": -5.561903476715088, "global_step": 30086, "epoch": 716} {"train_loss": -5.4023566246032715, "global_step": 30087, "epoch": 716} {"train_loss": -5.406055450439453, "global_step": 30088, "epoch": 716} {"train_loss": -5.51851224899292, "global_step": 30089, "epoch": 716} {"train_loss": -5.495792388916016, "global_step": 30090, "epoch": 716} {"train_loss": -5.458950042724609, "global_step": 30091, "epoch": 716} {"train_loss": -5.495301723480225, "global_step": 30092, "epoch": 716} {"train_loss": -5.515810012817383, "global_step": 30093, "epoch": 716} {"train_loss": -5.468214988708496, "global_step": 30094, "epoch": 716} {"train_loss": -5.366422653198242, "global_step": 30095, "epoch": 716} {"train_loss": -5.321246147155762, "global_step": 30096, "epoch": 716} {"train_loss": -5.416619300842285, "global_step": 30097, "epoch": 716} {"train_loss": -5.465432167053223, "global_step": 30098, "epoch": 716} {"train_loss": -5.325906753540039, "global_step": 30099, "epoch": 716} {"train_loss": -5.376922607421875, "global_step": 30100, "epoch": 716} {"train_loss": -5.265632629394531, "global_step": 30101, "epoch": 716} {"train_loss": -5.399683952331543, "global_step": 30102, "epoch": 716} {"train_loss": -5.34222412109375, "global_step": 30103, "epoch": 716} {"train_loss": -5.405694484710693, "global_step": 30104, "epoch": 716} {"train_loss": -5.466573238372803, "global_step": 30105, "epoch": 716} {"train_loss": -5.238588333129883, "global_step": 30106, "epoch": 716} {"train_loss": -5.4191389083862305, "global_step": 30107, "epoch": 716} {"train_loss": -5.504839897155762, "global_step": 30108, "epoch": 716} {"train_loss": -5.541815280914307, "global_step": 30109, "epoch": 716} {"train_loss": -5.210319519042969, "global_step": 30110, "epoch": 716} {"train_loss": -5.562180519104004, "global_step": 30111, "epoch": 716} {"train_loss": -5.493033409118652, "global_step": 30112, "epoch": 716} {"train_loss": -5.441837310791016, "global_step": 30113, "epoch": 716, "val_loss": 74557.9140625} {"train_loss": -5.318331241607666, "global_step": 30114, "epoch": 717} {"train_loss": -5.4113545417785645, "global_step": 30115, "epoch": 717} {"train_loss": -5.4864020347595215, "global_step": 30116, "epoch": 717} {"train_loss": -5.475367069244385, "global_step": 30117, "epoch": 717} {"train_loss": -5.43491792678833, "global_step": 30118, "epoch": 717} {"train_loss": -5.579793930053711, "global_step": 30119, "epoch": 717} {"train_loss": -5.464011192321777, "global_step": 30120, "epoch": 717} {"train_loss": -5.5557169914245605, "global_step": 30121, "epoch": 717} {"train_loss": -5.520320415496826, "global_step": 30122, "epoch": 717} {"train_loss": -5.546781539916992, "global_step": 30123, "epoch": 717} {"train_loss": -5.532776832580566, "global_step": 30124, "epoch": 717} {"train_loss": -5.441883087158203, "global_step": 30125, "epoch": 717} {"train_loss": -5.371103763580322, "global_step": 30126, "epoch": 717} {"train_loss": -5.527159690856934, "global_step": 30127, "epoch": 717} {"train_loss": -5.484682083129883, "global_step": 30128, "epoch": 717} {"train_loss": -5.310538291931152, "global_step": 30129, "epoch": 717} {"train_loss": -5.517653942108154, "global_step": 30130, "epoch": 717} {"train_loss": -5.390268325805664, "global_step": 30131, "epoch": 717} {"train_loss": -5.357405662536621, "global_step": 30132, "epoch": 717} {"train_loss": -5.502562046051025, "global_step": 30133, "epoch": 717} {"train_loss": -5.4258198738098145, "global_step": 30134, "epoch": 717} {"train_loss": -5.604610919952393, "global_step": 30135, "epoch": 717} {"train_loss": -5.459285736083984, "global_step": 30136, "epoch": 717} {"train_loss": -5.428443431854248, "global_step": 30137, "epoch": 717} {"train_loss": -5.541966438293457, "global_step": 30138, "epoch": 717} {"train_loss": -5.521853446960449, "global_step": 30139, "epoch": 717} {"train_loss": -5.381866455078125, "global_step": 30140, "epoch": 717} {"train_loss": -5.455338478088379, "global_step": 30141, "epoch": 717} {"train_loss": -5.537781715393066, "global_step": 30142, "epoch": 717} {"train_loss": -5.5523247718811035, "global_step": 30143, "epoch": 717} {"train_loss": -5.461939811706543, "global_step": 30144, "epoch": 717} {"train_loss": -5.469111442565918, "global_step": 30145, "epoch": 717} {"train_loss": -5.553631782531738, "global_step": 30146, "epoch": 717} {"train_loss": -5.430744647979736, "global_step": 30147, "epoch": 717} {"train_loss": -5.537939071655273, "global_step": 30148, "epoch": 717} {"train_loss": -5.490049362182617, "global_step": 30149, "epoch": 717} {"train_loss": -5.50817346572876, "global_step": 30150, "epoch": 717} {"train_loss": -5.521821022033691, "global_step": 30151, "epoch": 717} {"train_loss": -5.508458137512207, "global_step": 30152, "epoch": 717} {"train_loss": -5.5115766525268555, "global_step": 30153, "epoch": 717} {"train_loss": -5.394118309020996, "global_step": 30154, "epoch": 717} {"train_loss": -5.475407055446079, "global_step": 30155, "epoch": 717, "val_loss": 75047.1796875} {"train_loss": -5.584178447723389, "global_step": 30156, "epoch": 718} {"train_loss": -5.5014190673828125, "global_step": 30157, "epoch": 718} {"train_loss": -5.638998031616211, "global_step": 30158, "epoch": 718} {"train_loss": -5.475983619689941, "global_step": 30159, "epoch": 718} {"train_loss": -5.390995025634766, "global_step": 30160, "epoch": 718} {"train_loss": -5.469202041625977, "global_step": 30161, "epoch": 718} {"train_loss": -5.388266563415527, "global_step": 30162, "epoch": 718} {"train_loss": -5.388735294342041, "global_step": 30163, "epoch": 718} {"train_loss": -5.544759750366211, "global_step": 30164, "epoch": 718} {"train_loss": -5.380995750427246, "global_step": 30165, "epoch": 718} {"train_loss": -5.546234130859375, "global_step": 30166, "epoch": 718} {"train_loss": -5.5313825607299805, "global_step": 30167, "epoch": 718} {"train_loss": -5.507201671600342, "global_step": 30168, "epoch": 718} {"train_loss": -5.440396308898926, "global_step": 30169, "epoch": 718} {"train_loss": -5.5514302253723145, "global_step": 30170, "epoch": 718} {"train_loss": -5.638218402862549, "global_step": 30171, "epoch": 718} {"train_loss": -5.536402702331543, "global_step": 30172, "epoch": 718} {"train_loss": -5.533844947814941, "global_step": 30173, "epoch": 718} {"train_loss": -5.4194536209106445, "global_step": 30174, "epoch": 718} {"train_loss": -5.472247123718262, "global_step": 30175, "epoch": 718} {"train_loss": -5.437147617340088, "global_step": 30176, "epoch": 718} {"train_loss": -5.400449752807617, "global_step": 30177, "epoch": 718} {"train_loss": -5.438201904296875, "global_step": 30178, "epoch": 718} {"train_loss": -5.397974014282227, "global_step": 30179, "epoch": 718} {"train_loss": -5.3745527267456055, "global_step": 30180, "epoch": 718} {"train_loss": -5.521000862121582, "global_step": 30181, "epoch": 718} {"train_loss": -5.535750389099121, "global_step": 30182, "epoch": 718} {"train_loss": -5.545661926269531, "global_step": 30183, "epoch": 718} {"train_loss": -5.373218059539795, "global_step": 30184, "epoch": 718} {"train_loss": -5.530771255493164, "global_step": 30185, "epoch": 718} {"train_loss": -5.524001121520996, "global_step": 30186, "epoch": 718} {"train_loss": -5.496618270874023, "global_step": 30187, "epoch": 718} {"train_loss": -5.409689426422119, "global_step": 30188, "epoch": 718} {"train_loss": -5.440885543823242, "global_step": 30189, "epoch": 718} {"train_loss": -5.399762153625488, "global_step": 30190, "epoch": 718} {"train_loss": -5.402645587921143, "global_step": 30191, "epoch": 718} {"train_loss": -5.478011131286621, "global_step": 30192, "epoch": 718} {"train_loss": -5.405528545379639, "global_step": 30193, "epoch": 718} {"train_loss": -5.612945556640625, "global_step": 30194, "epoch": 718} {"train_loss": -5.3823699951171875, "global_step": 30195, "epoch": 718} {"train_loss": -5.482966423034668, "global_step": 30196, "epoch": 718} {"train_loss": -5.475332237425304, "global_step": 30197, "epoch": 718, "val_loss": 74530.7734375} {"train_loss": -5.524543762207031, "global_step": 30198, "epoch": 719} {"train_loss": -5.51523494720459, "global_step": 30199, "epoch": 719} {"train_loss": -5.5982346534729, "global_step": 30200, "epoch": 719} {"train_loss": -5.577259063720703, "global_step": 30201, "epoch": 719} {"train_loss": -5.410759925842285, "global_step": 30202, "epoch": 719} {"train_loss": -5.475732326507568, "global_step": 30203, "epoch": 719} {"train_loss": -5.496734142303467, "global_step": 30204, "epoch": 719} {"train_loss": -5.48892879486084, "global_step": 30205, "epoch": 719} {"train_loss": -5.384368896484375, "global_step": 30206, "epoch": 719} {"train_loss": -5.427822589874268, "global_step": 30207, "epoch": 719} {"train_loss": -5.548479080200195, "global_step": 30208, "epoch": 719} {"train_loss": -5.509427070617676, "global_step": 30209, "epoch": 719} {"train_loss": -5.48647928237915, "global_step": 30210, "epoch": 719} {"train_loss": -5.405487060546875, "global_step": 30211, "epoch": 719} {"train_loss": -5.4758830070495605, "global_step": 30212, "epoch": 719} {"train_loss": -5.531134128570557, "global_step": 30213, "epoch": 719} {"train_loss": -5.400437355041504, "global_step": 30214, "epoch": 719} {"train_loss": -5.452549457550049, "global_step": 30215, "epoch": 719} {"train_loss": -5.454249382019043, "global_step": 30216, "epoch": 719} {"train_loss": -5.5144829750061035, "global_step": 30217, "epoch": 719} {"train_loss": -5.506202697753906, "global_step": 30218, "epoch": 719} {"train_loss": -5.600752830505371, "global_step": 30219, "epoch": 719} {"train_loss": -5.489684581756592, "global_step": 30220, "epoch": 719} {"train_loss": -5.528624534606934, "global_step": 30221, "epoch": 719} {"train_loss": -5.434614181518555, "global_step": 30222, "epoch": 719} {"train_loss": -5.479923248291016, "global_step": 30223, "epoch": 719} {"train_loss": -5.400992393493652, "global_step": 30224, "epoch": 719} {"train_loss": -5.4651384353637695, "global_step": 30225, "epoch": 719} {"train_loss": -5.427309036254883, "global_step": 30226, "epoch": 719} {"train_loss": -5.412257194519043, "global_step": 30227, "epoch": 719} {"train_loss": -5.520130634307861, "global_step": 30228, "epoch": 719} {"train_loss": -5.416067123413086, "global_step": 30229, "epoch": 719} {"train_loss": -5.4201860427856445, "global_step": 30230, "epoch": 719} {"train_loss": -5.393064498901367, "global_step": 30231, "epoch": 719} {"train_loss": -5.280061721801758, "global_step": 30232, "epoch": 719} {"train_loss": -5.322164535522461, "global_step": 30233, "epoch": 719} {"train_loss": -5.493189811706543, "global_step": 30234, "epoch": 719} {"train_loss": -5.354544162750244, "global_step": 30235, "epoch": 719} {"train_loss": -5.366241455078125, "global_step": 30236, "epoch": 719} {"train_loss": -5.453201770782471, "global_step": 30237, "epoch": 719} {"train_loss": -5.397838115692139, "global_step": 30238, "epoch": 719} {"train_loss": -5.458428496406192, "global_step": 30239, "epoch": 719, "val_loss": 75689.546875} {"train_loss": -5.271600246429443, "global_step": 30240, "epoch": 720} {"train_loss": -5.275416374206543, "global_step": 30241, "epoch": 720} {"train_loss": -5.311424255371094, "global_step": 30242, "epoch": 720} {"train_loss": -5.228784561157227, "global_step": 30243, "epoch": 720} {"train_loss": -5.447956085205078, "global_step": 30244, "epoch": 720} {"train_loss": -5.422887802124023, "global_step": 30245, "epoch": 720} {"train_loss": -5.481318473815918, "global_step": 30246, "epoch": 720} {"train_loss": -5.40931510925293, "global_step": 30247, "epoch": 720} {"train_loss": -5.46437406539917, "global_step": 30248, "epoch": 720} {"train_loss": -5.41987419128418, "global_step": 30249, "epoch": 720} {"train_loss": -5.394644260406494, "global_step": 30250, "epoch": 720} {"train_loss": -5.259456634521484, "global_step": 30251, "epoch": 720} {"train_loss": -5.492260456085205, "global_step": 30252, "epoch": 720} {"train_loss": -5.321233749389648, "global_step": 30253, "epoch": 720} {"train_loss": -5.504178047180176, "global_step": 30254, "epoch": 720} {"train_loss": -5.396742820739746, "global_step": 30255, "epoch": 720} {"train_loss": -5.40072774887085, "global_step": 30256, "epoch": 720} {"train_loss": -5.399416923522949, "global_step": 30257, "epoch": 720} {"train_loss": -5.372806072235107, "global_step": 30258, "epoch": 720} {"train_loss": -5.487221717834473, "global_step": 30259, "epoch": 720} {"train_loss": -5.501870632171631, "global_step": 30260, "epoch": 720} {"train_loss": -5.408799171447754, "global_step": 30261, "epoch": 720} {"train_loss": -5.4639892578125, "global_step": 30262, "epoch": 720} {"train_loss": -5.531431198120117, "global_step": 30263, "epoch": 720} {"train_loss": -5.441619873046875, "global_step": 30264, "epoch": 720} {"train_loss": -5.403786659240723, "global_step": 30265, "epoch": 720} {"train_loss": -5.398349761962891, "global_step": 30266, "epoch": 720} {"train_loss": -5.3123650550842285, "global_step": 30267, "epoch": 720} {"train_loss": -5.488490581512451, "global_step": 30268, "epoch": 720} {"train_loss": -5.436110973358154, "global_step": 30269, "epoch": 720} {"train_loss": -5.547641754150391, "global_step": 30270, "epoch": 720} {"train_loss": -5.436826705932617, "global_step": 30271, "epoch": 720} {"train_loss": -5.512140274047852, "global_step": 30272, "epoch": 720} {"train_loss": -5.456686019897461, "global_step": 30273, "epoch": 720} {"train_loss": -5.464984893798828, "global_step": 30274, "epoch": 720} {"train_loss": -5.573371887207031, "global_step": 30275, "epoch": 720} {"train_loss": -5.440156936645508, "global_step": 30276, "epoch": 720} {"train_loss": -5.369970321655273, "global_step": 30277, "epoch": 720} {"train_loss": -5.439059257507324, "global_step": 30278, "epoch": 720} {"train_loss": -5.383138656616211, "global_step": 30279, "epoch": 720} {"train_loss": -5.327488899230957, "global_step": 30280, "epoch": 720} {"train_loss": -5.417078177134196, "global_step": 30281, "epoch": 720, "val_loss": 74333.1640625} {"train_loss": -5.485227584838867, "global_step": 30282, "epoch": 721} {"train_loss": -5.512789726257324, "global_step": 30283, "epoch": 721} {"train_loss": -5.4696736335754395, "global_step": 30284, "epoch": 721} {"train_loss": -5.432158946990967, "global_step": 30285, "epoch": 721} {"train_loss": -5.473021507263184, "global_step": 30286, "epoch": 721} {"train_loss": -5.46127462387085, "global_step": 30287, "epoch": 721} {"train_loss": -5.371633529663086, "global_step": 30288, "epoch": 721} {"train_loss": -5.395304203033447, "global_step": 30289, "epoch": 721} {"train_loss": -5.38248872756958, "global_step": 30290, "epoch": 721} {"train_loss": -5.528363227844238, "global_step": 30291, "epoch": 721} {"train_loss": -5.412023544311523, "global_step": 30292, "epoch": 721} {"train_loss": -5.382322311401367, "global_step": 30293, "epoch": 721} {"train_loss": -5.607170104980469, "global_step": 30294, "epoch": 721} {"train_loss": -5.364750385284424, "global_step": 30295, "epoch": 721} {"train_loss": -5.477314472198486, "global_step": 30296, "epoch": 721} {"train_loss": -5.50831413269043, "global_step": 30297, "epoch": 721} {"train_loss": -5.509999752044678, "global_step": 30298, "epoch": 721} {"train_loss": -5.460630416870117, "global_step": 30299, "epoch": 721} {"train_loss": -5.358725070953369, "global_step": 30300, "epoch": 721} {"train_loss": -5.387966156005859, "global_step": 30301, "epoch": 721} {"train_loss": -5.510622501373291, "global_step": 30302, "epoch": 721} {"train_loss": -5.388590335845947, "global_step": 30303, "epoch": 721} {"train_loss": -5.471097469329834, "global_step": 30304, "epoch": 721} {"train_loss": -5.512031078338623, "global_step": 30305, "epoch": 721} {"train_loss": -5.515537261962891, "global_step": 30306, "epoch": 721} {"train_loss": -5.58573055267334, "global_step": 30307, "epoch": 721} {"train_loss": -5.4374847412109375, "global_step": 30308, "epoch": 721} {"train_loss": -5.4162468910217285, "global_step": 30309, "epoch": 721} {"train_loss": -5.467060089111328, "global_step": 30310, "epoch": 721} {"train_loss": -5.546777725219727, "global_step": 30311, "epoch": 721} {"train_loss": -5.4401140213012695, "global_step": 30312, "epoch": 721} {"train_loss": -5.404984474182129, "global_step": 30313, "epoch": 721} {"train_loss": -5.563080787658691, "global_step": 30314, "epoch": 721} {"train_loss": -5.4884796142578125, "global_step": 30315, "epoch": 721} {"train_loss": -5.586620807647705, "global_step": 30316, "epoch": 721} {"train_loss": -5.5855183601379395, "global_step": 30317, "epoch": 721} {"train_loss": -5.570812702178955, "global_step": 30318, "epoch": 721} {"train_loss": -5.527075290679932, "global_step": 30319, "epoch": 721} {"train_loss": -5.54852294921875, "global_step": 30320, "epoch": 721} {"train_loss": -5.497585773468018, "global_step": 30321, "epoch": 721} {"train_loss": -5.548374176025391, "global_step": 30322, "epoch": 721} {"train_loss": -5.4744057314736505, "global_step": 30323, "epoch": 721, "val_loss": 75565.0625} {"train_loss": -5.469925880432129, "global_step": 30324, "epoch": 722} {"train_loss": -5.570854663848877, "global_step": 30325, "epoch": 722} {"train_loss": -5.4334001541137695, "global_step": 30326, "epoch": 722} {"train_loss": -5.505637168884277, "global_step": 30327, "epoch": 722} {"train_loss": -5.560711860656738, "global_step": 30328, "epoch": 722} {"train_loss": -5.399199485778809, "global_step": 30329, "epoch": 722} {"train_loss": -5.530664443969727, "global_step": 30330, "epoch": 722} {"train_loss": -5.416213035583496, "global_step": 30331, "epoch": 722} {"train_loss": -5.402815341949463, "global_step": 30332, "epoch": 722} {"train_loss": -5.3973917961120605, "global_step": 30333, "epoch": 722} {"train_loss": -5.526644706726074, "global_step": 30334, "epoch": 722} {"train_loss": -5.507346153259277, "global_step": 30335, "epoch": 722} {"train_loss": -5.570085525512695, "global_step": 30336, "epoch": 722} {"train_loss": -5.3330583572387695, "global_step": 30337, "epoch": 722} {"train_loss": -5.504085063934326, "global_step": 30338, "epoch": 722} {"train_loss": -5.4492926597595215, "global_step": 30339, "epoch": 722} {"train_loss": -5.530263900756836, "global_step": 30340, "epoch": 722} {"train_loss": -5.436276435852051, "global_step": 30341, "epoch": 722} {"train_loss": -5.569351673126221, "global_step": 30342, "epoch": 722} {"train_loss": -5.381125450134277, "global_step": 30343, "epoch": 722} {"train_loss": -5.339684963226318, "global_step": 30344, "epoch": 722} {"train_loss": -5.62110710144043, "global_step": 30345, "epoch": 722} {"train_loss": -5.367595672607422, "global_step": 30346, "epoch": 722} {"train_loss": -5.496437072753906, "global_step": 30347, "epoch": 722} {"train_loss": -5.420675754547119, "global_step": 30348, "epoch": 722} {"train_loss": -5.434994697570801, "global_step": 30349, "epoch": 722} {"train_loss": -5.400467872619629, "global_step": 30350, "epoch": 722} {"train_loss": -5.496894359588623, "global_step": 30351, "epoch": 722} {"train_loss": -5.5202484130859375, "global_step": 30352, "epoch": 722} {"train_loss": -5.5611772537231445, "global_step": 30353, "epoch": 722} {"train_loss": -5.416852951049805, "global_step": 30354, "epoch": 722} {"train_loss": -5.451930046081543, "global_step": 30355, "epoch": 722} {"train_loss": -5.603918075561523, "global_step": 30356, "epoch": 722} {"train_loss": -5.492198944091797, "global_step": 30357, "epoch": 722} {"train_loss": -5.417518615722656, "global_step": 30358, "epoch": 722} {"train_loss": -5.508018493652344, "global_step": 30359, "epoch": 722} {"train_loss": -5.34553861618042, "global_step": 30360, "epoch": 722} {"train_loss": -5.540248870849609, "global_step": 30361, "epoch": 722} {"train_loss": -5.318219184875488, "global_step": 30362, "epoch": 722} {"train_loss": -5.564620018005371, "global_step": 30363, "epoch": 722} {"train_loss": -5.508358955383301, "global_step": 30364, "epoch": 722} {"train_loss": -5.469283626193092, "global_step": 30365, "epoch": 722, "val_loss": 74536.9609375} {"train_loss": -5.569002628326416, "global_step": 30366, "epoch": 723} {"train_loss": -5.534188270568848, "global_step": 30367, "epoch": 723} {"train_loss": -5.448848724365234, "global_step": 30368, "epoch": 723} {"train_loss": -5.4798431396484375, "global_step": 30369, "epoch": 723} {"train_loss": -5.439042091369629, "global_step": 30370, "epoch": 723} {"train_loss": -5.472009658813477, "global_step": 30371, "epoch": 723} {"train_loss": -5.553901672363281, "global_step": 30372, "epoch": 723} {"train_loss": -5.391298294067383, "global_step": 30373, "epoch": 723} {"train_loss": -5.515963077545166, "global_step": 30374, "epoch": 723} {"train_loss": -5.331778526306152, "global_step": 30375, "epoch": 723} {"train_loss": -5.532415866851807, "global_step": 30376, "epoch": 723} {"train_loss": -5.51863431930542, "global_step": 30377, "epoch": 723} {"train_loss": -5.49843692779541, "global_step": 30378, "epoch": 723} {"train_loss": -5.472814559936523, "global_step": 30379, "epoch": 723} {"train_loss": -5.577765941619873, "global_step": 30380, "epoch": 723} {"train_loss": -5.469903945922852, "global_step": 30381, "epoch": 723} {"train_loss": -5.4244537353515625, "global_step": 30382, "epoch": 723} {"train_loss": -5.430150985717773, "global_step": 30383, "epoch": 723} {"train_loss": -5.598506450653076, "global_step": 30384, "epoch": 723} {"train_loss": -5.409393310546875, "global_step": 30385, "epoch": 723} {"train_loss": -5.579856872558594, "global_step": 30386, "epoch": 723} {"train_loss": -5.4284539222717285, "global_step": 30387, "epoch": 723} {"train_loss": -5.504640102386475, "global_step": 30388, "epoch": 723} {"train_loss": -5.378194808959961, "global_step": 30389, "epoch": 723} {"train_loss": -5.447081565856934, "global_step": 30390, "epoch": 723} {"train_loss": -5.480497360229492, "global_step": 30391, "epoch": 723} {"train_loss": -5.663638591766357, "global_step": 30392, "epoch": 723} {"train_loss": -5.627983570098877, "global_step": 30393, "epoch": 723} {"train_loss": -5.604079246520996, "global_step": 30394, "epoch": 723} {"train_loss": -5.465611457824707, "global_step": 30395, "epoch": 723} {"train_loss": -5.493560314178467, "global_step": 30396, "epoch": 723} {"train_loss": -5.383176803588867, "global_step": 30397, "epoch": 723} {"train_loss": -5.559565544128418, "global_step": 30398, "epoch": 723} {"train_loss": -5.5254669189453125, "global_step": 30399, "epoch": 723} {"train_loss": -5.2443437576293945, "global_step": 30400, "epoch": 723} {"train_loss": -5.4626665115356445, "global_step": 30401, "epoch": 723} {"train_loss": -5.542963027954102, "global_step": 30402, "epoch": 723} {"train_loss": -5.4904375076293945, "global_step": 30403, "epoch": 723} {"train_loss": -5.618171691894531, "global_step": 30404, "epoch": 723} {"train_loss": -5.482919216156006, "global_step": 30405, "epoch": 723} {"train_loss": -5.510087966918945, "global_step": 30406, "epoch": 723} {"train_loss": -5.491216046469552, "global_step": 30407, "epoch": 723, "val_loss": 74837.2578125} {"train_loss": -5.510463714599609, "global_step": 30408, "epoch": 724} {"train_loss": -5.543394088745117, "global_step": 30409, "epoch": 724} {"train_loss": -5.5640668869018555, "global_step": 30410, "epoch": 724} {"train_loss": -5.474318981170654, "global_step": 30411, "epoch": 724} {"train_loss": -5.443700313568115, "global_step": 30412, "epoch": 724} {"train_loss": -5.554040908813477, "global_step": 30413, "epoch": 724} {"train_loss": -5.5990142822265625, "global_step": 30414, "epoch": 724} {"train_loss": -5.372915267944336, "global_step": 30415, "epoch": 724} {"train_loss": -5.6516852378845215, "global_step": 30416, "epoch": 724} {"train_loss": -5.419073104858398, "global_step": 30417, "epoch": 724} {"train_loss": -5.489850997924805, "global_step": 30418, "epoch": 724} {"train_loss": -5.345273017883301, "global_step": 30419, "epoch": 724} {"train_loss": -5.509984493255615, "global_step": 30420, "epoch": 724} {"train_loss": -5.392314434051514, "global_step": 30421, "epoch": 724} {"train_loss": -5.591856002807617, "global_step": 30422, "epoch": 724} {"train_loss": -5.609760761260986, "global_step": 30423, "epoch": 724} {"train_loss": -5.567295074462891, "global_step": 30424, "epoch": 724} {"train_loss": -5.434682846069336, "global_step": 30425, "epoch": 724} {"train_loss": -5.5815935134887695, "global_step": 30426, "epoch": 724} {"train_loss": -5.384354591369629, "global_step": 30427, "epoch": 724} {"train_loss": -5.443971157073975, "global_step": 30428, "epoch": 724} {"train_loss": -5.303103446960449, "global_step": 30429, "epoch": 724} {"train_loss": -5.359752655029297, "global_step": 30430, "epoch": 724} {"train_loss": -5.372952938079834, "global_step": 30431, "epoch": 724} {"train_loss": -5.354681015014648, "global_step": 30432, "epoch": 724} {"train_loss": -5.412474155426025, "global_step": 30433, "epoch": 724} {"train_loss": -5.475551605224609, "global_step": 30434, "epoch": 724} {"train_loss": -5.279581546783447, "global_step": 30435, "epoch": 724} {"train_loss": -5.451179027557373, "global_step": 30436, "epoch": 724} {"train_loss": -5.361085414886475, "global_step": 30437, "epoch": 724} {"train_loss": -5.392993927001953, "global_step": 30438, "epoch": 724} {"train_loss": -5.400290012359619, "global_step": 30439, "epoch": 724} {"train_loss": -5.4791154861450195, "global_step": 30440, "epoch": 724} {"train_loss": -5.381103515625, "global_step": 30441, "epoch": 724} {"train_loss": -5.384056568145752, "global_step": 30442, "epoch": 724} {"train_loss": -5.484427452087402, "global_step": 30443, "epoch": 724} {"train_loss": -5.482504844665527, "global_step": 30444, "epoch": 724} {"train_loss": -5.447351455688477, "global_step": 30445, "epoch": 724} {"train_loss": -5.561130523681641, "global_step": 30446, "epoch": 724} {"train_loss": -5.441331386566162, "global_step": 30447, "epoch": 724} {"train_loss": -5.465658664703369, "global_step": 30448, "epoch": 724} {"train_loss": -5.458580221448626, "global_step": 30449, "epoch": 724, "val_loss": 75063.3203125} {"train_loss": -5.383632659912109, "global_step": 30450, "epoch": 725} {"train_loss": -5.53491735458374, "global_step": 30451, "epoch": 725} {"train_loss": -5.498641014099121, "global_step": 30452, "epoch": 725} {"train_loss": -5.470934867858887, "global_step": 30453, "epoch": 725} {"train_loss": -5.5198211669921875, "global_step": 30454, "epoch": 725} {"train_loss": -5.4720778465271, "global_step": 30455, "epoch": 725} {"train_loss": -5.477423667907715, "global_step": 30456, "epoch": 725} {"train_loss": -5.526917457580566, "global_step": 30457, "epoch": 725} {"train_loss": -5.452855587005615, "global_step": 30458, "epoch": 725} {"train_loss": -5.39190149307251, "global_step": 30459, "epoch": 725} {"train_loss": -5.454277515411377, "global_step": 30460, "epoch": 725} {"train_loss": -5.564207553863525, "global_step": 30461, "epoch": 725} {"train_loss": -5.474612236022949, "global_step": 30462, "epoch": 725} {"train_loss": -5.553561687469482, "global_step": 30463, "epoch": 725} {"train_loss": -5.472445964813232, "global_step": 30464, "epoch": 725} {"train_loss": -5.412333011627197, "global_step": 30465, "epoch": 725} {"train_loss": -5.468988418579102, "global_step": 30466, "epoch": 725} {"train_loss": -5.519423961639404, "global_step": 30467, "epoch": 725} {"train_loss": -5.470457077026367, "global_step": 30468, "epoch": 725} {"train_loss": -5.492420196533203, "global_step": 30469, "epoch": 725} {"train_loss": -5.470243453979492, "global_step": 30470, "epoch": 725} {"train_loss": -5.580714702606201, "global_step": 30471, "epoch": 725} {"train_loss": -5.390159606933594, "global_step": 30472, "epoch": 725} {"train_loss": -5.460385799407959, "global_step": 30473, "epoch": 725} {"train_loss": -5.535074710845947, "global_step": 30474, "epoch": 725} {"train_loss": -5.5786662101745605, "global_step": 30475, "epoch": 725} {"train_loss": -5.437105178833008, "global_step": 30476, "epoch": 725} {"train_loss": -5.473695278167725, "global_step": 30477, "epoch": 725} {"train_loss": -5.416028022766113, "global_step": 30478, "epoch": 725} {"train_loss": -5.49525260925293, "global_step": 30479, "epoch": 725} {"train_loss": -5.33925724029541, "global_step": 30480, "epoch": 725} {"train_loss": -5.473445892333984, "global_step": 30481, "epoch": 725} {"train_loss": -5.501255989074707, "global_step": 30482, "epoch": 725} {"train_loss": -5.369329452514648, "global_step": 30483, "epoch": 725} {"train_loss": -5.464372158050537, "global_step": 30484, "epoch": 725} {"train_loss": -5.458745002746582, "global_step": 30485, "epoch": 725} {"train_loss": -5.46580696105957, "global_step": 30486, "epoch": 725} {"train_loss": -5.477207183837891, "global_step": 30487, "epoch": 725} {"train_loss": -5.37117862701416, "global_step": 30488, "epoch": 725} {"train_loss": -5.445522308349609, "global_step": 30489, "epoch": 725} {"train_loss": -5.474669456481934, "global_step": 30490, "epoch": 725} {"train_loss": -5.467087654840379, "global_step": 30491, "epoch": 725, "val_loss": 74486.625} {"train_loss": -5.670214653015137, "global_step": 30492, "epoch": 726} {"train_loss": -5.4620819091796875, "global_step": 30493, "epoch": 726} {"train_loss": -5.407604217529297, "global_step": 30494, "epoch": 726} {"train_loss": -5.491530418395996, "global_step": 30495, "epoch": 726} {"train_loss": -5.42073917388916, "global_step": 30496, "epoch": 726} {"train_loss": -5.435586929321289, "global_step": 30497, "epoch": 726} {"train_loss": -5.521881103515625, "global_step": 30498, "epoch": 726} {"train_loss": -5.447275161743164, "global_step": 30499, "epoch": 726} {"train_loss": -5.448578834533691, "global_step": 30500, "epoch": 726} {"train_loss": -5.513010501861572, "global_step": 30501, "epoch": 726} {"train_loss": -5.364474296569824, "global_step": 30502, "epoch": 726} {"train_loss": -5.4705657958984375, "global_step": 30503, "epoch": 726} {"train_loss": -5.456508636474609, "global_step": 30504, "epoch": 726} {"train_loss": -5.4411821365356445, "global_step": 30505, "epoch": 726} {"train_loss": -5.412866592407227, "global_step": 30506, "epoch": 726} {"train_loss": -5.589856147766113, "global_step": 30507, "epoch": 726} {"train_loss": -5.508838653564453, "global_step": 30508, "epoch": 726} {"train_loss": -5.454305648803711, "global_step": 30509, "epoch": 726} {"train_loss": -5.466336250305176, "global_step": 30510, "epoch": 726} {"train_loss": -5.498473167419434, "global_step": 30511, "epoch": 726} {"train_loss": -5.436860084533691, "global_step": 30512, "epoch": 726} {"train_loss": -5.617522716522217, "global_step": 30513, "epoch": 726} {"train_loss": -5.5997314453125, "global_step": 30514, "epoch": 726} {"train_loss": -5.438108444213867, "global_step": 30515, "epoch": 726} {"train_loss": -5.572092056274414, "global_step": 30516, "epoch": 726} {"train_loss": -5.431450843811035, "global_step": 30517, "epoch": 726} {"train_loss": -5.415555000305176, "global_step": 30518, "epoch": 726} {"train_loss": -5.418510437011719, "global_step": 30519, "epoch": 726} {"train_loss": -5.525134086608887, "global_step": 30520, "epoch": 726} {"train_loss": -5.513926029205322, "global_step": 30521, "epoch": 726} {"train_loss": -5.476470947265625, "global_step": 30522, "epoch": 726} {"train_loss": -5.4190216064453125, "global_step": 30523, "epoch": 726} {"train_loss": -5.507354736328125, "global_step": 30524, "epoch": 726} {"train_loss": -5.568365097045898, "global_step": 30525, "epoch": 726} {"train_loss": -5.404179573059082, "global_step": 30526, "epoch": 726} {"train_loss": -5.612364768981934, "global_step": 30527, "epoch": 726} {"train_loss": -5.530041694641113, "global_step": 30528, "epoch": 726} {"train_loss": -5.2494964599609375, "global_step": 30529, "epoch": 726} {"train_loss": -5.460049152374268, "global_step": 30530, "epoch": 726} {"train_loss": -5.312479019165039, "global_step": 30531, "epoch": 726} {"train_loss": -5.540077209472656, "global_step": 30532, "epoch": 726} {"train_loss": -5.471763837905157, "global_step": 30533, "epoch": 726, "val_loss": 74490.109375} {"train_loss": -5.536862373352051, "global_step": 30534, "epoch": 727} {"train_loss": -5.417045593261719, "global_step": 30535, "epoch": 727} {"train_loss": -5.447911262512207, "global_step": 30536, "epoch": 727} {"train_loss": -5.441458225250244, "global_step": 30537, "epoch": 727} {"train_loss": -5.513642311096191, "global_step": 30538, "epoch": 727} {"train_loss": -5.545989036560059, "global_step": 30539, "epoch": 727} {"train_loss": -5.368772983551025, "global_step": 30540, "epoch": 727} {"train_loss": -5.349420547485352, "global_step": 30541, "epoch": 727} {"train_loss": -5.5092315673828125, "global_step": 30542, "epoch": 727} {"train_loss": -5.342041015625, "global_step": 30543, "epoch": 727} {"train_loss": -5.459293365478516, "global_step": 30544, "epoch": 727} {"train_loss": -5.421872615814209, "global_step": 30545, "epoch": 727} {"train_loss": -5.5436320304870605, "global_step": 30546, "epoch": 727} {"train_loss": -5.427151679992676, "global_step": 30547, "epoch": 727} {"train_loss": -5.596823692321777, "global_step": 30548, "epoch": 727} {"train_loss": -5.491094589233398, "global_step": 30549, "epoch": 727} {"train_loss": -5.365172863006592, "global_step": 30550, "epoch": 727} {"train_loss": -5.571735858917236, "global_step": 30551, "epoch": 727} {"train_loss": -5.50885009765625, "global_step": 30552, "epoch": 727} {"train_loss": -5.487841606140137, "global_step": 30553, "epoch": 727} {"train_loss": -5.455392360687256, "global_step": 30554, "epoch": 727} {"train_loss": -5.4189772605896, "global_step": 30555, "epoch": 727} {"train_loss": -5.350595474243164, "global_step": 30556, "epoch": 727} {"train_loss": -5.503869533538818, "global_step": 30557, "epoch": 727} {"train_loss": -5.464807510375977, "global_step": 30558, "epoch": 727} {"train_loss": -5.455837726593018, "global_step": 30559, "epoch": 727} {"train_loss": -5.404040336608887, "global_step": 30560, "epoch": 727} {"train_loss": -5.303401470184326, "global_step": 30561, "epoch": 727} {"train_loss": -5.539658546447754, "global_step": 30562, "epoch": 727} {"train_loss": -5.450369358062744, "global_step": 30563, "epoch": 727} {"train_loss": -5.368192672729492, "global_step": 30564, "epoch": 727} {"train_loss": -5.401070594787598, "global_step": 30565, "epoch": 727} {"train_loss": -5.318661689758301, "global_step": 30566, "epoch": 727} {"train_loss": -5.467650413513184, "global_step": 30567, "epoch": 727} {"train_loss": -5.435826301574707, "global_step": 30568, "epoch": 727} {"train_loss": -5.44485330581665, "global_step": 30569, "epoch": 727} {"train_loss": -5.498343467712402, "global_step": 30570, "epoch": 727} {"train_loss": -5.447011470794678, "global_step": 30571, "epoch": 727} {"train_loss": -5.475545883178711, "global_step": 30572, "epoch": 727} {"train_loss": -5.616430282592773, "global_step": 30573, "epoch": 727} {"train_loss": -5.453215599060059, "global_step": 30574, "epoch": 727} {"train_loss": -5.457936865942819, "global_step": 30575, "epoch": 727, "val_loss": 74364.0546875} {"train_loss": -5.4971208572387695, "global_step": 30576, "epoch": 728} {"train_loss": -5.464820384979248, "global_step": 30577, "epoch": 728} {"train_loss": -5.484192848205566, "global_step": 30578, "epoch": 728} {"train_loss": -5.462423324584961, "global_step": 30579, "epoch": 728} {"train_loss": -5.578158855438232, "global_step": 30580, "epoch": 728} {"train_loss": -5.45297384262085, "global_step": 30581, "epoch": 728} {"train_loss": -5.440162658691406, "global_step": 30582, "epoch": 728} {"train_loss": -5.565908908843994, "global_step": 30583, "epoch": 728} {"train_loss": -5.407887935638428, "global_step": 30584, "epoch": 728} {"train_loss": -5.431013107299805, "global_step": 30585, "epoch": 728} {"train_loss": -5.519237518310547, "global_step": 30586, "epoch": 728} {"train_loss": -5.448246479034424, "global_step": 30587, "epoch": 728} {"train_loss": -5.505749225616455, "global_step": 30588, "epoch": 728} {"train_loss": -5.501996040344238, "global_step": 30589, "epoch": 728} {"train_loss": -5.408782005310059, "global_step": 30590, "epoch": 728} {"train_loss": -5.475622177124023, "global_step": 30591, "epoch": 728} {"train_loss": -5.641412734985352, "global_step": 30592, "epoch": 728} {"train_loss": -5.4994893074035645, "global_step": 30593, "epoch": 728} {"train_loss": -5.458878517150879, "global_step": 30594, "epoch": 728} {"train_loss": -5.609823226928711, "global_step": 30595, "epoch": 728} {"train_loss": -5.418169975280762, "global_step": 30596, "epoch": 728} {"train_loss": -5.50673770904541, "global_step": 30597, "epoch": 728} {"train_loss": -5.534079551696777, "global_step": 30598, "epoch": 728} {"train_loss": -5.560338973999023, "global_step": 30599, "epoch": 728} {"train_loss": -5.495604515075684, "global_step": 30600, "epoch": 728} {"train_loss": -5.468265056610107, "global_step": 30601, "epoch": 728} {"train_loss": -5.449477672576904, "global_step": 30602, "epoch": 728} {"train_loss": -5.418294429779053, "global_step": 30603, "epoch": 728} {"train_loss": -5.471378803253174, "global_step": 30604, "epoch": 728} {"train_loss": -5.402396202087402, "global_step": 30605, "epoch": 728} {"train_loss": -5.528522491455078, "global_step": 30606, "epoch": 728} {"train_loss": -5.48823356628418, "global_step": 30607, "epoch": 728} {"train_loss": -5.482419967651367, "global_step": 30608, "epoch": 728} {"train_loss": -5.5009684562683105, "global_step": 30609, "epoch": 728} {"train_loss": -5.484583854675293, "global_step": 30610, "epoch": 728} {"train_loss": -5.527788162231445, "global_step": 30611, "epoch": 728} {"train_loss": -5.518202781677246, "global_step": 30612, "epoch": 728} {"train_loss": -5.560976982116699, "global_step": 30613, "epoch": 728} {"train_loss": -5.463312149047852, "global_step": 30614, "epoch": 728} {"train_loss": -5.486649513244629, "global_step": 30615, "epoch": 728} {"train_loss": -5.388962268829346, "global_step": 30616, "epoch": 728} {"train_loss": -5.48426780246553, "global_step": 30617, "epoch": 728, "val_loss": 74882.4453125} {"train_loss": -5.574389457702637, "global_step": 30618, "epoch": 729} {"train_loss": -5.655255317687988, "global_step": 30619, "epoch": 729} {"train_loss": -5.546629428863525, "global_step": 30620, "epoch": 729} {"train_loss": -5.498950004577637, "global_step": 30621, "epoch": 729} {"train_loss": -5.526362895965576, "global_step": 30622, "epoch": 729} {"train_loss": -5.47416353225708, "global_step": 30623, "epoch": 729} {"train_loss": -5.323829650878906, "global_step": 30624, "epoch": 729} {"train_loss": -5.381488800048828, "global_step": 30625, "epoch": 729} {"train_loss": -5.5479583740234375, "global_step": 30626, "epoch": 729} {"train_loss": -5.372691631317139, "global_step": 30627, "epoch": 729} {"train_loss": -5.5275726318359375, "global_step": 30628, "epoch": 729} {"train_loss": -5.553341865539551, "global_step": 30629, "epoch": 729} {"train_loss": -5.53205680847168, "global_step": 30630, "epoch": 729} {"train_loss": -5.44921875, "global_step": 30631, "epoch": 729} {"train_loss": -5.454503059387207, "global_step": 30632, "epoch": 729} {"train_loss": -5.595709800720215, "global_step": 30633, "epoch": 729} {"train_loss": -5.52074670791626, "global_step": 30634, "epoch": 729} {"train_loss": -5.499599456787109, "global_step": 30635, "epoch": 729} {"train_loss": -5.418959140777588, "global_step": 30636, "epoch": 729} {"train_loss": -5.4349260330200195, "global_step": 30637, "epoch": 729} {"train_loss": -5.543878555297852, "global_step": 30638, "epoch": 729} {"train_loss": -5.479827880859375, "global_step": 30639, "epoch": 729} {"train_loss": -5.529093265533447, "global_step": 30640, "epoch": 729} {"train_loss": -5.473640441894531, "global_step": 30641, "epoch": 729} {"train_loss": -5.40427303314209, "global_step": 30642, "epoch": 729} {"train_loss": -5.4480061531066895, "global_step": 30643, "epoch": 729} {"train_loss": -5.442141532897949, "global_step": 30644, "epoch": 729} {"train_loss": -5.314680099487305, "global_step": 30645, "epoch": 729} {"train_loss": -5.470317363739014, "global_step": 30646, "epoch": 729} {"train_loss": -5.381687164306641, "global_step": 30647, "epoch": 729} {"train_loss": -5.411169052124023, "global_step": 30648, "epoch": 729} {"train_loss": -5.509608268737793, "global_step": 30649, "epoch": 729} {"train_loss": -5.35264778137207, "global_step": 30650, "epoch": 729} {"train_loss": -5.566394805908203, "global_step": 30651, "epoch": 729} {"train_loss": -5.512681484222412, "global_step": 30652, "epoch": 729} {"train_loss": -5.433292865753174, "global_step": 30653, "epoch": 729} {"train_loss": -5.519753456115723, "global_step": 30654, "epoch": 729} {"train_loss": -5.415477752685547, "global_step": 30655, "epoch": 729} {"train_loss": -5.434789657592773, "global_step": 30656, "epoch": 729} {"train_loss": -5.393659591674805, "global_step": 30657, "epoch": 729} {"train_loss": -5.528325080871582, "global_step": 30658, "epoch": 729} {"train_loss": -5.475227060772124, "global_step": 30659, "epoch": 729, "val_loss": 74948.265625} {"train_loss": -5.520669460296631, "global_step": 30660, "epoch": 730} {"train_loss": -5.45689058303833, "global_step": 30661, "epoch": 730} {"train_loss": -5.455812454223633, "global_step": 30662, "epoch": 730} {"train_loss": -5.422811508178711, "global_step": 30663, "epoch": 730} {"train_loss": -5.451803684234619, "global_step": 30664, "epoch": 730} {"train_loss": -5.480254650115967, "global_step": 30665, "epoch": 730} {"train_loss": -5.564187526702881, "global_step": 30666, "epoch": 730} {"train_loss": -5.557269096374512, "global_step": 30667, "epoch": 730} {"train_loss": -5.512089252471924, "global_step": 30668, "epoch": 730} {"train_loss": -5.506808280944824, "global_step": 30669, "epoch": 730} {"train_loss": -5.439007759094238, "global_step": 30670, "epoch": 730} {"train_loss": -5.350281715393066, "global_step": 30671, "epoch": 730} {"train_loss": -5.5464186668396, "global_step": 30672, "epoch": 730} {"train_loss": -5.481454849243164, "global_step": 30673, "epoch": 730} {"train_loss": -5.562723159790039, "global_step": 30674, "epoch": 730} {"train_loss": -5.511404991149902, "global_step": 30675, "epoch": 730} {"train_loss": -5.573616027832031, "global_step": 30676, "epoch": 730} {"train_loss": -5.309060573577881, "global_step": 30677, "epoch": 730} {"train_loss": -5.546266078948975, "global_step": 30678, "epoch": 730} {"train_loss": -5.3673295974731445, "global_step": 30679, "epoch": 730} {"train_loss": -5.253367900848389, "global_step": 30680, "epoch": 730} {"train_loss": -5.600261211395264, "global_step": 30681, "epoch": 730} {"train_loss": -5.602226257324219, "global_step": 30682, "epoch": 730} {"train_loss": -5.502713203430176, "global_step": 30683, "epoch": 730} {"train_loss": -5.509347915649414, "global_step": 30684, "epoch": 730} {"train_loss": -5.411154747009277, "global_step": 30685, "epoch": 730} {"train_loss": -5.443632125854492, "global_step": 30686, "epoch": 730} {"train_loss": -5.591575622558594, "global_step": 30687, "epoch": 730} {"train_loss": -5.386913299560547, "global_step": 30688, "epoch": 730} {"train_loss": -5.373651504516602, "global_step": 30689, "epoch": 730} {"train_loss": -5.4689202308654785, "global_step": 30690, "epoch": 730} {"train_loss": -5.46151876449585, "global_step": 30691, "epoch": 730} {"train_loss": -5.456447601318359, "global_step": 30692, "epoch": 730} {"train_loss": -5.5684967041015625, "global_step": 30693, "epoch": 730} {"train_loss": -5.452007293701172, "global_step": 30694, "epoch": 730} {"train_loss": -5.397176742553711, "global_step": 30695, "epoch": 730} {"train_loss": -5.3771653175354, "global_step": 30696, "epoch": 730} {"train_loss": -5.459855556488037, "global_step": 30697, "epoch": 730} {"train_loss": -5.360615253448486, "global_step": 30698, "epoch": 730} {"train_loss": -5.386953353881836, "global_step": 30699, "epoch": 730} {"train_loss": -5.469468116760254, "global_step": 30700, "epoch": 730} {"train_loss": -5.468154123851231, "global_step": 30701, "epoch": 730, "val_loss": 74769.0625} {"train_loss": -5.453269958496094, "global_step": 30702, "epoch": 731} {"train_loss": -5.514858245849609, "global_step": 30703, "epoch": 731} {"train_loss": -5.386614799499512, "global_step": 30704, "epoch": 731} {"train_loss": -5.53622579574585, "global_step": 30705, "epoch": 731} {"train_loss": -5.642999649047852, "global_step": 30706, "epoch": 731} {"train_loss": -5.5579657554626465, "global_step": 30707, "epoch": 731} {"train_loss": -5.462363243103027, "global_step": 30708, "epoch": 731} {"train_loss": -5.469810485839844, "global_step": 30709, "epoch": 731} {"train_loss": -5.558659076690674, "global_step": 30710, "epoch": 731} {"train_loss": -5.601422309875488, "global_step": 30711, "epoch": 731} {"train_loss": -5.5643720626831055, "global_step": 30712, "epoch": 731} {"train_loss": -5.5080413818359375, "global_step": 30713, "epoch": 731} {"train_loss": -5.553532600402832, "global_step": 30714, "epoch": 731} {"train_loss": -5.374044418334961, "global_step": 30715, "epoch": 731} {"train_loss": -5.4807891845703125, "global_step": 30716, "epoch": 731} {"train_loss": -5.535672664642334, "global_step": 30717, "epoch": 731} {"train_loss": -5.468922138214111, "global_step": 30718, "epoch": 731} {"train_loss": -5.49509859085083, "global_step": 30719, "epoch": 731} {"train_loss": -5.5724101066589355, "global_step": 30720, "epoch": 731} {"train_loss": -5.613436698913574, "global_step": 30721, "epoch": 731} {"train_loss": -5.44659423828125, "global_step": 30722, "epoch": 731} {"train_loss": -5.329684257507324, "global_step": 30723, "epoch": 731} {"train_loss": -5.501998424530029, "global_step": 30724, "epoch": 731} {"train_loss": -5.403351783752441, "global_step": 30725, "epoch": 731} {"train_loss": -5.484012603759766, "global_step": 30726, "epoch": 731} {"train_loss": -5.468759059906006, "global_step": 30727, "epoch": 731} {"train_loss": -5.306975364685059, "global_step": 30728, "epoch": 731} {"train_loss": -5.52921724319458, "global_step": 30729, "epoch": 731} {"train_loss": -5.50165319442749, "global_step": 30730, "epoch": 731} {"train_loss": -5.598247528076172, "global_step": 30731, "epoch": 731} {"train_loss": -5.515596389770508, "global_step": 30732, "epoch": 731} {"train_loss": -5.5164642333984375, "global_step": 30733, "epoch": 731} {"train_loss": -5.4062042236328125, "global_step": 30734, "epoch": 731} {"train_loss": -5.399513244628906, "global_step": 30735, "epoch": 731} {"train_loss": -5.514950275421143, "global_step": 30736, "epoch": 731} {"train_loss": -5.526930809020996, "global_step": 30737, "epoch": 731} {"train_loss": -5.549387454986572, "global_step": 30738, "epoch": 731} {"train_loss": -5.525224208831787, "global_step": 30739, "epoch": 731} {"train_loss": -5.369228363037109, "global_step": 30740, "epoch": 731} {"train_loss": -5.439211845397949, "global_step": 30741, "epoch": 731} {"train_loss": -5.287152290344238, "global_step": 30742, "epoch": 731} {"train_loss": -5.485522270202637, "global_step": 30743, "epoch": 731, "val_loss": 74578.90625} {"train_loss": -5.624567031860352, "global_step": 30744, "epoch": 732} {"train_loss": -5.461054801940918, "global_step": 30745, "epoch": 732} {"train_loss": -5.434067726135254, "global_step": 30746, "epoch": 732} {"train_loss": -5.4637041091918945, "global_step": 30747, "epoch": 732} {"train_loss": -5.480660438537598, "global_step": 30748, "epoch": 732} {"train_loss": -5.53294563293457, "global_step": 30749, "epoch": 732} {"train_loss": -5.478151321411133, "global_step": 30750, "epoch": 732} {"train_loss": -5.565138816833496, "global_step": 30751, "epoch": 732} {"train_loss": -5.503056526184082, "global_step": 30752, "epoch": 732} {"train_loss": -5.512111663818359, "global_step": 30753, "epoch": 732} {"train_loss": -5.355404853820801, "global_step": 30754, "epoch": 732} {"train_loss": -5.53691291809082, "global_step": 30755, "epoch": 732} {"train_loss": -5.521783828735352, "global_step": 30756, "epoch": 732} {"train_loss": -5.673116207122803, "global_step": 30757, "epoch": 732} {"train_loss": -5.436888694763184, "global_step": 30758, "epoch": 732} {"train_loss": -5.389578342437744, "global_step": 30759, "epoch": 732} {"train_loss": -5.533762454986572, "global_step": 30760, "epoch": 732} {"train_loss": -5.417557239532471, "global_step": 30761, "epoch": 732} {"train_loss": -5.496356010437012, "global_step": 30762, "epoch": 732} {"train_loss": -5.56002950668335, "global_step": 30763, "epoch": 732} {"train_loss": -5.492922782897949, "global_step": 30764, "epoch": 732} {"train_loss": -5.599858283996582, "global_step": 30765, "epoch": 732} {"train_loss": -5.353050231933594, "global_step": 30766, "epoch": 732} {"train_loss": -5.4352216720581055, "global_step": 30767, "epoch": 732} {"train_loss": -5.5294108390808105, "global_step": 30768, "epoch": 732} {"train_loss": -5.628196716308594, "global_step": 30769, "epoch": 732} {"train_loss": -5.465054035186768, "global_step": 30770, "epoch": 732} {"train_loss": -5.473241329193115, "global_step": 30771, "epoch": 732} {"train_loss": -5.544410705566406, "global_step": 30772, "epoch": 732} {"train_loss": -5.513767242431641, "global_step": 30773, "epoch": 732} {"train_loss": -5.373103141784668, "global_step": 30774, "epoch": 732} {"train_loss": -5.571990489959717, "global_step": 30775, "epoch": 732} {"train_loss": -5.405710697174072, "global_step": 30776, "epoch": 732} {"train_loss": -5.284937381744385, "global_step": 30777, "epoch": 732} {"train_loss": -5.416023254394531, "global_step": 30778, "epoch": 732} {"train_loss": -5.363138675689697, "global_step": 30779, "epoch": 732} {"train_loss": -5.426922798156738, "global_step": 30780, "epoch": 732} {"train_loss": -5.532199859619141, "global_step": 30781, "epoch": 732} {"train_loss": -5.357769012451172, "global_step": 30782, "epoch": 732} {"train_loss": -5.501612186431885, "global_step": 30783, "epoch": 732} {"train_loss": -5.473822593688965, "global_step": 30784, "epoch": 732} {"train_loss": -5.479329835800898, "global_step": 30785, "epoch": 732, "val_loss": 74586.078125} {"train_loss": -5.35825777053833, "global_step": 30786, "epoch": 733} {"train_loss": -5.493590354919434, "global_step": 30787, "epoch": 733} {"train_loss": -5.443917751312256, "global_step": 30788, "epoch": 733} {"train_loss": -5.50154972076416, "global_step": 30789, "epoch": 733} {"train_loss": -5.4163818359375, "global_step": 30790, "epoch": 733} {"train_loss": -5.291991233825684, "global_step": 30791, "epoch": 733} {"train_loss": -5.470263957977295, "global_step": 30792, "epoch": 733} {"train_loss": -5.538763046264648, "global_step": 30793, "epoch": 733} {"train_loss": -5.438887596130371, "global_step": 30794, "epoch": 733} {"train_loss": -5.389126300811768, "global_step": 30795, "epoch": 733} {"train_loss": -5.419312953948975, "global_step": 30796, "epoch": 733} {"train_loss": -5.377496242523193, "global_step": 30797, "epoch": 733} {"train_loss": -5.444718360900879, "global_step": 30798, "epoch": 733} {"train_loss": -5.516424179077148, "global_step": 30799, "epoch": 733} {"train_loss": -5.534881591796875, "global_step": 30800, "epoch": 733} {"train_loss": -5.462001800537109, "global_step": 30801, "epoch": 733} {"train_loss": -5.585375785827637, "global_step": 30802, "epoch": 733} {"train_loss": -5.440635681152344, "global_step": 30803, "epoch": 733} {"train_loss": -5.63227653503418, "global_step": 30804, "epoch": 733} {"train_loss": -5.571868896484375, "global_step": 30805, "epoch": 733} {"train_loss": -5.6221160888671875, "global_step": 30806, "epoch": 733} {"train_loss": -5.487051010131836, "global_step": 30807, "epoch": 733} {"train_loss": -5.529845714569092, "global_step": 30808, "epoch": 733} {"train_loss": -5.479884147644043, "global_step": 30809, "epoch": 733} {"train_loss": -5.5399322509765625, "global_step": 30810, "epoch": 733} {"train_loss": -5.460345268249512, "global_step": 30811, "epoch": 733} {"train_loss": -5.562771797180176, "global_step": 30812, "epoch": 733} {"train_loss": -5.455955982208252, "global_step": 30813, "epoch": 733} {"train_loss": -5.388026237487793, "global_step": 30814, "epoch": 733} {"train_loss": -5.641063690185547, "global_step": 30815, "epoch": 733} {"train_loss": -5.4820098876953125, "global_step": 30816, "epoch": 733} {"train_loss": -5.461041450500488, "global_step": 30817, "epoch": 733} {"train_loss": -5.486894607543945, "global_step": 30818, "epoch": 733} {"train_loss": -5.485077857971191, "global_step": 30819, "epoch": 733} {"train_loss": -5.483860492706299, "global_step": 30820, "epoch": 733} {"train_loss": -5.534069538116455, "global_step": 30821, "epoch": 733} {"train_loss": -5.492079734802246, "global_step": 30822, "epoch": 733} {"train_loss": -5.575010299682617, "global_step": 30823, "epoch": 733} {"train_loss": -5.312034606933594, "global_step": 30824, "epoch": 733} {"train_loss": -5.346206188201904, "global_step": 30825, "epoch": 733} {"train_loss": -5.406914710998535, "global_step": 30826, "epoch": 733} {"train_loss": -5.47615248816354, "global_step": 30827, "epoch": 733, "val_loss": 75537.3828125} {"train_loss": -5.483368396759033, "global_step": 30828, "epoch": 734} {"train_loss": -5.406588554382324, "global_step": 30829, "epoch": 734} {"train_loss": -5.563450813293457, "global_step": 30830, "epoch": 734} {"train_loss": -5.410321235656738, "global_step": 30831, "epoch": 734} {"train_loss": -5.353938102722168, "global_step": 30832, "epoch": 734} {"train_loss": -5.391546249389648, "global_step": 30833, "epoch": 734} {"train_loss": -5.484718322753906, "global_step": 30834, "epoch": 734} {"train_loss": -5.445204257965088, "global_step": 30835, "epoch": 734} {"train_loss": -5.424875259399414, "global_step": 30836, "epoch": 734} {"train_loss": -5.378650665283203, "global_step": 30837, "epoch": 734} {"train_loss": -5.469085216522217, "global_step": 30838, "epoch": 734} {"train_loss": -5.344989776611328, "global_step": 30839, "epoch": 734} {"train_loss": -5.44734001159668, "global_step": 30840, "epoch": 734} {"train_loss": -5.522538661956787, "global_step": 30841, "epoch": 734} {"train_loss": -5.267044544219971, "global_step": 30842, "epoch": 734} {"train_loss": -5.5501708984375, "global_step": 30843, "epoch": 734} {"train_loss": -5.424443244934082, "global_step": 30844, "epoch": 734} {"train_loss": -5.551953315734863, "global_step": 30845, "epoch": 734} {"train_loss": -5.526576042175293, "global_step": 30846, "epoch": 734} {"train_loss": -5.439833164215088, "global_step": 30847, "epoch": 734} {"train_loss": -5.525485992431641, "global_step": 30848, "epoch": 734} {"train_loss": -5.4921464920043945, "global_step": 30849, "epoch": 734} {"train_loss": -5.531693458557129, "global_step": 30850, "epoch": 734} {"train_loss": -5.452101707458496, "global_step": 30851, "epoch": 734} {"train_loss": -5.449196815490723, "global_step": 30852, "epoch": 734} {"train_loss": -5.454267978668213, "global_step": 30853, "epoch": 734} {"train_loss": -5.51248836517334, "global_step": 30854, "epoch": 734} {"train_loss": -5.484033107757568, "global_step": 30855, "epoch": 734} {"train_loss": -5.365630626678467, "global_step": 30856, "epoch": 734} {"train_loss": -5.379196643829346, "global_step": 30857, "epoch": 734} {"train_loss": -5.524705410003662, "global_step": 30858, "epoch": 734} {"train_loss": -5.378635406494141, "global_step": 30859, "epoch": 734} {"train_loss": -5.440032958984375, "global_step": 30860, "epoch": 734} {"train_loss": -5.511592864990234, "global_step": 30861, "epoch": 734} {"train_loss": -5.573359966278076, "global_step": 30862, "epoch": 734} {"train_loss": -5.526063919067383, "global_step": 30863, "epoch": 734} {"train_loss": -5.471493721008301, "global_step": 30864, "epoch": 734} {"train_loss": -5.522028923034668, "global_step": 30865, "epoch": 734} {"train_loss": -5.452369689941406, "global_step": 30866, "epoch": 734} {"train_loss": -5.5035176277160645, "global_step": 30867, "epoch": 734} {"train_loss": -5.4269256591796875, "global_step": 30868, "epoch": 734} {"train_loss": -5.459027642295474, "global_step": 30869, "epoch": 734, "val_loss": 75386.921875} {"train_loss": -5.395586967468262, "global_step": 30870, "epoch": 735} {"train_loss": -5.4928436279296875, "global_step": 30871, "epoch": 735} {"train_loss": -5.513507843017578, "global_step": 30872, "epoch": 735} {"train_loss": -5.417765140533447, "global_step": 30873, "epoch": 735} {"train_loss": -5.675765037536621, "global_step": 30874, "epoch": 735} {"train_loss": -5.491237640380859, "global_step": 30875, "epoch": 735} {"train_loss": -5.304921627044678, "global_step": 30876, "epoch": 735} {"train_loss": -5.402782440185547, "global_step": 30877, "epoch": 735} {"train_loss": -5.402796745300293, "global_step": 30878, "epoch": 735} {"train_loss": -5.323890686035156, "global_step": 30879, "epoch": 735} {"train_loss": -5.493096351623535, "global_step": 30880, "epoch": 735} {"train_loss": -5.4647626876831055, "global_step": 30881, "epoch": 735} {"train_loss": -5.489965915679932, "global_step": 30882, "epoch": 735} {"train_loss": -5.5590057373046875, "global_step": 30883, "epoch": 735} {"train_loss": -5.364893913269043, "global_step": 30884, "epoch": 735} {"train_loss": -5.583953380584717, "global_step": 30885, "epoch": 735} {"train_loss": -5.339468955993652, "global_step": 30886, "epoch": 735} {"train_loss": -5.539996147155762, "global_step": 30887, "epoch": 735} {"train_loss": -5.358020782470703, "global_step": 30888, "epoch": 735} {"train_loss": -5.478490829467773, "global_step": 30889, "epoch": 735} {"train_loss": -5.465304374694824, "global_step": 30890, "epoch": 735} {"train_loss": -5.49981689453125, "global_step": 30891, "epoch": 735} {"train_loss": -5.525905609130859, "global_step": 30892, "epoch": 735} {"train_loss": -5.474838733673096, "global_step": 30893, "epoch": 735} {"train_loss": -5.452812194824219, "global_step": 30894, "epoch": 735} {"train_loss": -5.533663749694824, "global_step": 30895, "epoch": 735} {"train_loss": -5.4714508056640625, "global_step": 30896, "epoch": 735} {"train_loss": -5.512363433837891, "global_step": 30897, "epoch": 735} {"train_loss": -5.4557881355285645, "global_step": 30898, "epoch": 735} {"train_loss": -5.437075614929199, "global_step": 30899, "epoch": 735} {"train_loss": -5.468901634216309, "global_step": 30900, "epoch": 735} {"train_loss": -5.498773097991943, "global_step": 30901, "epoch": 735} {"train_loss": -5.463974952697754, "global_step": 30902, "epoch": 735} {"train_loss": -5.488595962524414, "global_step": 30903, "epoch": 735} {"train_loss": -5.453737258911133, "global_step": 30904, "epoch": 735} {"train_loss": -5.461091995239258, "global_step": 30905, "epoch": 735} {"train_loss": -5.422503471374512, "global_step": 30906, "epoch": 735} {"train_loss": -5.43363618850708, "global_step": 30907, "epoch": 735} {"train_loss": -5.594703197479248, "global_step": 30908, "epoch": 735} {"train_loss": -5.4218244552612305, "global_step": 30909, "epoch": 735} {"train_loss": -5.469309329986572, "global_step": 30910, "epoch": 735} {"train_loss": -5.468298662276495, "global_step": 30911, "epoch": 735, "val_loss": 74856.8125} {"train_loss": -5.385591983795166, "global_step": 30912, "epoch": 736} {"train_loss": -5.572685241699219, "global_step": 30913, "epoch": 736} {"train_loss": -5.488064289093018, "global_step": 30914, "epoch": 736} {"train_loss": -5.492864608764648, "global_step": 30915, "epoch": 736} {"train_loss": -5.378467559814453, "global_step": 30916, "epoch": 736} {"train_loss": -5.560169219970703, "global_step": 30917, "epoch": 736} {"train_loss": -5.438992500305176, "global_step": 30918, "epoch": 736} {"train_loss": -5.455572128295898, "global_step": 30919, "epoch": 736} {"train_loss": -5.5030107498168945, "global_step": 30920, "epoch": 736} {"train_loss": -5.515378952026367, "global_step": 30921, "epoch": 736} {"train_loss": -5.470963954925537, "global_step": 30922, "epoch": 736} {"train_loss": -5.562267303466797, "global_step": 30923, "epoch": 736} {"train_loss": -5.497568607330322, "global_step": 30924, "epoch": 736} {"train_loss": -5.518415927886963, "global_step": 30925, "epoch": 736} {"train_loss": -5.322329521179199, "global_step": 30926, "epoch": 736} {"train_loss": -5.424526214599609, "global_step": 30927, "epoch": 736} {"train_loss": -5.497651100158691, "global_step": 30928, "epoch": 736} {"train_loss": -5.414221286773682, "global_step": 30929, "epoch": 736} {"train_loss": -5.5262250900268555, "global_step": 30930, "epoch": 736} {"train_loss": -5.419844627380371, "global_step": 30931, "epoch": 736} {"train_loss": -5.479026794433594, "global_step": 30932, "epoch": 736} {"train_loss": -5.487367153167725, "global_step": 30933, "epoch": 736} {"train_loss": -5.367911338806152, "global_step": 30934, "epoch": 736} {"train_loss": -5.336368560791016, "global_step": 30935, "epoch": 736} {"train_loss": -5.355196952819824, "global_step": 30936, "epoch": 736} {"train_loss": -5.38349723815918, "global_step": 30937, "epoch": 736} {"train_loss": -5.469185829162598, "global_step": 30938, "epoch": 736} {"train_loss": -5.360787868499756, "global_step": 30939, "epoch": 736} {"train_loss": -5.393100738525391, "global_step": 30940, "epoch": 736} {"train_loss": -5.3802490234375, "global_step": 30941, "epoch": 736} {"train_loss": -5.549467086791992, "global_step": 30942, "epoch": 736} {"train_loss": -5.3842573165893555, "global_step": 30943, "epoch": 736} {"train_loss": -5.482954502105713, "global_step": 30944, "epoch": 736} {"train_loss": -5.351130485534668, "global_step": 30945, "epoch": 736} {"train_loss": -5.412043571472168, "global_step": 30946, "epoch": 736} {"train_loss": -5.451814651489258, "global_step": 30947, "epoch": 736} {"train_loss": -5.510610580444336, "global_step": 30948, "epoch": 736} {"train_loss": -5.546588897705078, "global_step": 30949, "epoch": 736} {"train_loss": -5.607278823852539, "global_step": 30950, "epoch": 736} {"train_loss": -5.444745063781738, "global_step": 30951, "epoch": 736} {"train_loss": -5.400547027587891, "global_step": 30952, "epoch": 736} {"train_loss": -5.456442923772903, "global_step": 30953, "epoch": 736, "val_loss": 75312.1484375} {"train_loss": -5.356064796447754, "global_step": 30954, "epoch": 737} {"train_loss": -5.607834815979004, "global_step": 30955, "epoch": 737} {"train_loss": -5.413132667541504, "global_step": 30956, "epoch": 737} {"train_loss": -5.413769721984863, "global_step": 30957, "epoch": 737} {"train_loss": -5.445479393005371, "global_step": 30958, "epoch": 737} {"train_loss": -5.492368698120117, "global_step": 30959, "epoch": 737} {"train_loss": -5.543140411376953, "global_step": 30960, "epoch": 737} {"train_loss": -5.506368637084961, "global_step": 30961, "epoch": 737} {"train_loss": -5.514776706695557, "global_step": 30962, "epoch": 737} {"train_loss": -5.572915077209473, "global_step": 30963, "epoch": 737} {"train_loss": -5.380034446716309, "global_step": 30964, "epoch": 737} {"train_loss": -5.496237754821777, "global_step": 30965, "epoch": 737} {"train_loss": -5.464349269866943, "global_step": 30966, "epoch": 737} {"train_loss": -5.524306297302246, "global_step": 30967, "epoch": 737} {"train_loss": -5.532549858093262, "global_step": 30968, "epoch": 737} {"train_loss": -5.469969749450684, "global_step": 30969, "epoch": 737} {"train_loss": -5.43326997756958, "global_step": 30970, "epoch": 737} {"train_loss": -5.414632320404053, "global_step": 30971, "epoch": 737} {"train_loss": -5.522393226623535, "global_step": 30972, "epoch": 737} {"train_loss": -5.589346408843994, "global_step": 30973, "epoch": 737} {"train_loss": -5.531485080718994, "global_step": 30974, "epoch": 737} {"train_loss": -5.445701599121094, "global_step": 30975, "epoch": 737} {"train_loss": -5.606786727905273, "global_step": 30976, "epoch": 737} {"train_loss": -5.445157051086426, "global_step": 30977, "epoch": 737} {"train_loss": -5.578891277313232, "global_step": 30978, "epoch": 737} {"train_loss": -5.620540618896484, "global_step": 30979, "epoch": 737} {"train_loss": -5.480379104614258, "global_step": 30980, "epoch": 737} {"train_loss": -5.398924827575684, "global_step": 30981, "epoch": 737} {"train_loss": -5.5898566246032715, "global_step": 30982, "epoch": 737} {"train_loss": -5.351413726806641, "global_step": 30983, "epoch": 737} {"train_loss": -5.529149055480957, "global_step": 30984, "epoch": 737} {"train_loss": -5.5567827224731445, "global_step": 30985, "epoch": 737} {"train_loss": -5.518886566162109, "global_step": 30986, "epoch": 737} {"train_loss": -5.497189044952393, "global_step": 30987, "epoch": 737} {"train_loss": -5.518171787261963, "global_step": 30988, "epoch": 737} {"train_loss": -5.517396926879883, "global_step": 30989, "epoch": 737} {"train_loss": -5.525491714477539, "global_step": 30990, "epoch": 737} {"train_loss": -5.482747554779053, "global_step": 30991, "epoch": 737} {"train_loss": -5.4736175537109375, "global_step": 30992, "epoch": 737} {"train_loss": -5.440115928649902, "global_step": 30993, "epoch": 737} {"train_loss": -5.461960792541504, "global_step": 30994, "epoch": 737} {"train_loss": -5.495376098723638, "global_step": 30995, "epoch": 737, "val_loss": 74595.3125} {"train_loss": -5.40352725982666, "global_step": 30996, "epoch": 738} {"train_loss": -5.42087459564209, "global_step": 30997, "epoch": 738} {"train_loss": -5.468897819519043, "global_step": 30998, "epoch": 738} {"train_loss": -5.300801753997803, "global_step": 30999, "epoch": 738} {"train_loss": -5.426979064941406, "global_step": 31000, "epoch": 738} {"train_loss": -5.466581344604492, "global_step": 31001, "epoch": 738} {"train_loss": -5.399559020996094, "global_step": 31002, "epoch": 738} {"train_loss": -5.513059139251709, "global_step": 31003, "epoch": 738} {"train_loss": -5.519522666931152, "global_step": 31004, "epoch": 738} {"train_loss": -5.488414287567139, "global_step": 31005, "epoch": 738} {"train_loss": -5.576241493225098, "global_step": 31006, "epoch": 738} {"train_loss": -5.508670330047607, "global_step": 31007, "epoch": 738} {"train_loss": -5.409221649169922, "global_step": 31008, "epoch": 738} {"train_loss": -5.481119632720947, "global_step": 31009, "epoch": 738} {"train_loss": -5.460697650909424, "global_step": 31010, "epoch": 738} {"train_loss": -5.414775371551514, "global_step": 31011, "epoch": 738} {"train_loss": -5.4719696044921875, "global_step": 31012, "epoch": 738} {"train_loss": -5.530605792999268, "global_step": 31013, "epoch": 738} {"train_loss": -5.49993896484375, "global_step": 31014, "epoch": 738} {"train_loss": -5.478682994842529, "global_step": 31015, "epoch": 738} {"train_loss": -5.489436149597168, "global_step": 31016, "epoch": 738} {"train_loss": -5.488966464996338, "global_step": 31017, "epoch": 738} {"train_loss": -5.4203901290893555, "global_step": 31018, "epoch": 738} {"train_loss": -5.5346174240112305, "global_step": 31019, "epoch": 738} {"train_loss": -5.436602592468262, "global_step": 31020, "epoch": 738} {"train_loss": -5.402434349060059, "global_step": 31021, "epoch": 738} {"train_loss": -5.559108734130859, "global_step": 31022, "epoch": 738} {"train_loss": -5.457638740539551, "global_step": 31023, "epoch": 738} {"train_loss": -5.580300807952881, "global_step": 31024, "epoch": 738} {"train_loss": -5.4922194480896, "global_step": 31025, "epoch": 738} {"train_loss": -5.498348236083984, "global_step": 31026, "epoch": 738} {"train_loss": -5.62795352935791, "global_step": 31027, "epoch": 738} {"train_loss": -5.483156681060791, "global_step": 31028, "epoch": 738} {"train_loss": -5.5640997886657715, "global_step": 31029, "epoch": 738} {"train_loss": -5.453425407409668, "global_step": 31030, "epoch": 738} {"train_loss": -5.483560085296631, "global_step": 31031, "epoch": 738} {"train_loss": -5.389808654785156, "global_step": 31032, "epoch": 738} {"train_loss": -5.5724873542785645, "global_step": 31033, "epoch": 738} {"train_loss": -5.581466197967529, "global_step": 31034, "epoch": 738} {"train_loss": -5.460601329803467, "global_step": 31035, "epoch": 738} {"train_loss": -5.51215124130249, "global_step": 31036, "epoch": 738} {"train_loss": -5.483650128046672, "global_step": 31037, "epoch": 738, "val_loss": 74876.125} {"train_loss": -5.467226982116699, "global_step": 31038, "epoch": 739} {"train_loss": -5.525402069091797, "global_step": 31039, "epoch": 739} {"train_loss": -5.490603923797607, "global_step": 31040, "epoch": 739} {"train_loss": -5.626175880432129, "global_step": 31041, "epoch": 739} {"train_loss": -5.458034038543701, "global_step": 31042, "epoch": 739} {"train_loss": -5.429455757141113, "global_step": 31043, "epoch": 739} {"train_loss": -5.475261688232422, "global_step": 31044, "epoch": 739} {"train_loss": -5.458661079406738, "global_step": 31045, "epoch": 739} {"train_loss": -5.472921371459961, "global_step": 31046, "epoch": 739} {"train_loss": -5.412493705749512, "global_step": 31047, "epoch": 739} {"train_loss": -5.435452461242676, "global_step": 31048, "epoch": 739} {"train_loss": -5.406508445739746, "global_step": 31049, "epoch": 739} {"train_loss": -5.540989875793457, "global_step": 31050, "epoch": 739} {"train_loss": -5.4441914558410645, "global_step": 31051, "epoch": 739} {"train_loss": -5.457322120666504, "global_step": 31052, "epoch": 739} {"train_loss": -5.376542568206787, "global_step": 31053, "epoch": 739} {"train_loss": -5.450985908508301, "global_step": 31054, "epoch": 739} {"train_loss": -5.561160564422607, "global_step": 31055, "epoch": 739} {"train_loss": -5.579668998718262, "global_step": 31056, "epoch": 739} {"train_loss": -5.523337364196777, "global_step": 31057, "epoch": 739} {"train_loss": -5.510470390319824, "global_step": 31058, "epoch": 739} {"train_loss": -5.4831061363220215, "global_step": 31059, "epoch": 739} {"train_loss": -5.433788299560547, "global_step": 31060, "epoch": 739} {"train_loss": -5.427892684936523, "global_step": 31061, "epoch": 739} {"train_loss": -5.529256343841553, "global_step": 31062, "epoch": 739} {"train_loss": -5.403396129608154, "global_step": 31063, "epoch": 739} {"train_loss": -5.529086112976074, "global_step": 31064, "epoch": 739} {"train_loss": -5.465218544006348, "global_step": 31065, "epoch": 739} {"train_loss": -5.3707756996154785, "global_step": 31066, "epoch": 739} {"train_loss": -5.5271196365356445, "global_step": 31067, "epoch": 739} {"train_loss": -5.516615867614746, "global_step": 31068, "epoch": 739} {"train_loss": -5.3981475830078125, "global_step": 31069, "epoch": 739} {"train_loss": -5.525008678436279, "global_step": 31070, "epoch": 739} {"train_loss": -5.613787651062012, "global_step": 31071, "epoch": 739} {"train_loss": -5.530679702758789, "global_step": 31072, "epoch": 739} {"train_loss": -5.522505760192871, "global_step": 31073, "epoch": 739} {"train_loss": -5.430427074432373, "global_step": 31074, "epoch": 739} {"train_loss": -5.5208330154418945, "global_step": 31075, "epoch": 739} {"train_loss": -5.475292205810547, "global_step": 31076, "epoch": 739} {"train_loss": -5.500245571136475, "global_step": 31077, "epoch": 739} {"train_loss": -5.42958927154541, "global_step": 31078, "epoch": 739} {"train_loss": -5.4841711748214, "global_step": 31079, "epoch": 739, "val_loss": 74944.4921875} {"train_loss": -5.5133771896362305, "global_step": 31080, "epoch": 740} {"train_loss": -5.415424346923828, "global_step": 31081, "epoch": 740} {"train_loss": -5.557290554046631, "global_step": 31082, "epoch": 740} {"train_loss": -5.598626136779785, "global_step": 31083, "epoch": 740} {"train_loss": -5.471576690673828, "global_step": 31084, "epoch": 740} {"train_loss": -5.556013107299805, "global_step": 31085, "epoch": 740} {"train_loss": -5.635280132293701, "global_step": 31086, "epoch": 740} {"train_loss": -5.530673027038574, "global_step": 31087, "epoch": 740} {"train_loss": -5.435552597045898, "global_step": 31088, "epoch": 740} {"train_loss": -5.648652076721191, "global_step": 31089, "epoch": 740} {"train_loss": -5.512260437011719, "global_step": 31090, "epoch": 740} {"train_loss": -5.697690010070801, "global_step": 31091, "epoch": 740} {"train_loss": -5.445624351501465, "global_step": 31092, "epoch": 740} {"train_loss": -5.467316627502441, "global_step": 31093, "epoch": 740} {"train_loss": -5.459187984466553, "global_step": 31094, "epoch": 740} {"train_loss": -5.4247636795043945, "global_step": 31095, "epoch": 740} {"train_loss": -5.447073459625244, "global_step": 31096, "epoch": 740} {"train_loss": -5.501690864562988, "global_step": 31097, "epoch": 740} {"train_loss": -5.610038757324219, "global_step": 31098, "epoch": 740} {"train_loss": -5.371299743652344, "global_step": 31099, "epoch": 740} {"train_loss": -5.471904277801514, "global_step": 31100, "epoch": 740} {"train_loss": -5.672873497009277, "global_step": 31101, "epoch": 740} {"train_loss": -5.471569061279297, "global_step": 31102, "epoch": 740} {"train_loss": -5.479642391204834, "global_step": 31103, "epoch": 740} {"train_loss": -5.588119029998779, "global_step": 31104, "epoch": 740} {"train_loss": -5.437060356140137, "global_step": 31105, "epoch": 740} {"train_loss": -5.54808235168457, "global_step": 31106, "epoch": 740} {"train_loss": -5.553677082061768, "global_step": 31107, "epoch": 740} {"train_loss": -5.5567307472229, "global_step": 31108, "epoch": 740} {"train_loss": -5.422679424285889, "global_step": 31109, "epoch": 740} {"train_loss": -5.628873825073242, "global_step": 31110, "epoch": 740} {"train_loss": -5.405270099639893, "global_step": 31111, "epoch": 740} {"train_loss": -5.524776935577393, "global_step": 31112, "epoch": 740} {"train_loss": -5.424591541290283, "global_step": 31113, "epoch": 740} {"train_loss": -5.513205528259277, "global_step": 31114, "epoch": 740} {"train_loss": -5.430266380310059, "global_step": 31115, "epoch": 740} {"train_loss": -5.563989639282227, "global_step": 31116, "epoch": 740} {"train_loss": -5.491390705108643, "global_step": 31117, "epoch": 740} {"train_loss": -5.524668216705322, "global_step": 31118, "epoch": 740} {"train_loss": -5.506386756896973, "global_step": 31119, "epoch": 740} {"train_loss": -5.577718257904053, "global_step": 31120, "epoch": 740} {"train_loss": -5.516434839793614, "global_step": 31121, "epoch": 740, "val_loss": 75057.4296875} {"train_loss": -5.4526824951171875, "global_step": 31122, "epoch": 741} {"train_loss": -5.534608840942383, "global_step": 31123, "epoch": 741} {"train_loss": -5.499183177947998, "global_step": 31124, "epoch": 741} {"train_loss": -5.553877830505371, "global_step": 31125, "epoch": 741} {"train_loss": -5.48569393157959, "global_step": 31126, "epoch": 741} {"train_loss": -5.3833746910095215, "global_step": 31127, "epoch": 741} {"train_loss": -5.636634826660156, "global_step": 31128, "epoch": 741} {"train_loss": -5.528748512268066, "global_step": 31129, "epoch": 741} {"train_loss": -5.490185260772705, "global_step": 31130, "epoch": 741} {"train_loss": -5.46640682220459, "global_step": 31131, "epoch": 741} {"train_loss": -5.458938121795654, "global_step": 31132, "epoch": 741} {"train_loss": -5.531782150268555, "global_step": 31133, "epoch": 741} {"train_loss": -5.507192611694336, "global_step": 31134, "epoch": 741} {"train_loss": -5.5356011390686035, "global_step": 31135, "epoch": 741} {"train_loss": -5.48586368560791, "global_step": 31136, "epoch": 741} {"train_loss": -5.4074602127075195, "global_step": 31137, "epoch": 741} {"train_loss": -5.566481590270996, "global_step": 31138, "epoch": 741} {"train_loss": -5.485400199890137, "global_step": 31139, "epoch": 741} {"train_loss": -5.4978718757629395, "global_step": 31140, "epoch": 741} {"train_loss": -5.533879280090332, "global_step": 31141, "epoch": 741} {"train_loss": -5.393622398376465, "global_step": 31142, "epoch": 741} {"train_loss": -5.430489540100098, "global_step": 31143, "epoch": 741} {"train_loss": -5.466938018798828, "global_step": 31144, "epoch": 741} {"train_loss": -5.473924160003662, "global_step": 31145, "epoch": 741} {"train_loss": -5.425774574279785, "global_step": 31146, "epoch": 741} {"train_loss": -5.448855400085449, "global_step": 31147, "epoch": 741} {"train_loss": -5.5913166999816895, "global_step": 31148, "epoch": 741} {"train_loss": -5.540389060974121, "global_step": 31149, "epoch": 741} {"train_loss": -5.480245590209961, "global_step": 31150, "epoch": 741} {"train_loss": -5.398456573486328, "global_step": 31151, "epoch": 741} {"train_loss": -5.610994338989258, "global_step": 31152, "epoch": 741} {"train_loss": -5.463978290557861, "global_step": 31153, "epoch": 741} {"train_loss": -5.456031322479248, "global_step": 31154, "epoch": 741} {"train_loss": -5.548549175262451, "global_step": 31155, "epoch": 741} {"train_loss": -5.56572151184082, "global_step": 31156, "epoch": 741} {"train_loss": -5.526049613952637, "global_step": 31157, "epoch": 741} {"train_loss": -5.515381813049316, "global_step": 31158, "epoch": 741} {"train_loss": -5.5440473556518555, "global_step": 31159, "epoch": 741} {"train_loss": -5.348142623901367, "global_step": 31160, "epoch": 741} {"train_loss": -5.598941802978516, "global_step": 31161, "epoch": 741} {"train_loss": -5.551028728485107, "global_step": 31162, "epoch": 741} {"train_loss": -5.499714635667347, "global_step": 31163, "epoch": 741, "val_loss": 75215.5} {"train_loss": -5.459229469299316, "global_step": 31164, "epoch": 742} {"train_loss": -5.529596328735352, "global_step": 31165, "epoch": 742} {"train_loss": -5.573308944702148, "global_step": 31166, "epoch": 742} {"train_loss": -5.387832164764404, "global_step": 31167, "epoch": 742} {"train_loss": -5.5087890625, "global_step": 31168, "epoch": 742} {"train_loss": -5.540640830993652, "global_step": 31169, "epoch": 742} {"train_loss": -5.459589004516602, "global_step": 31170, "epoch": 742} {"train_loss": -5.473293304443359, "global_step": 31171, "epoch": 742} {"train_loss": -5.484714508056641, "global_step": 31172, "epoch": 742} {"train_loss": -5.4464945793151855, "global_step": 31173, "epoch": 742} {"train_loss": -5.347568988800049, "global_step": 31174, "epoch": 742} {"train_loss": -5.509859085083008, "global_step": 31175, "epoch": 742} {"train_loss": -5.482480525970459, "global_step": 31176, "epoch": 742} {"train_loss": -5.448850631713867, "global_step": 31177, "epoch": 742} {"train_loss": -5.506161212921143, "global_step": 31178, "epoch": 742} {"train_loss": -5.42089319229126, "global_step": 31179, "epoch": 742} {"train_loss": -5.593996047973633, "global_step": 31180, "epoch": 742} {"train_loss": -5.544926166534424, "global_step": 31181, "epoch": 742} {"train_loss": -5.56431770324707, "global_step": 31182, "epoch": 742} {"train_loss": -5.504961013793945, "global_step": 31183, "epoch": 742} {"train_loss": -5.454586982727051, "global_step": 31184, "epoch": 742} {"train_loss": -5.515960216522217, "global_step": 31185, "epoch": 742} {"train_loss": -5.504874229431152, "global_step": 31186, "epoch": 742} {"train_loss": -5.492722511291504, "global_step": 31187, "epoch": 742} {"train_loss": -5.625053882598877, "global_step": 31188, "epoch": 742} {"train_loss": -5.53427791595459, "global_step": 31189, "epoch": 742} {"train_loss": -5.47194766998291, "global_step": 31190, "epoch": 742} {"train_loss": -5.584344387054443, "global_step": 31191, "epoch": 742} {"train_loss": -5.46722412109375, "global_step": 31192, "epoch": 742} {"train_loss": -5.474673271179199, "global_step": 31193, "epoch": 742} {"train_loss": -5.423774719238281, "global_step": 31194, "epoch": 742} {"train_loss": -5.479486465454102, "global_step": 31195, "epoch": 742} {"train_loss": -5.413673400878906, "global_step": 31196, "epoch": 742} {"train_loss": -5.505090713500977, "global_step": 31197, "epoch": 742} {"train_loss": -5.452434539794922, "global_step": 31198, "epoch": 742} {"train_loss": -5.516722679138184, "global_step": 31199, "epoch": 742} {"train_loss": -5.3183393478393555, "global_step": 31200, "epoch": 742} {"train_loss": -5.4819231033325195, "global_step": 31201, "epoch": 742} {"train_loss": -5.372746467590332, "global_step": 31202, "epoch": 742} {"train_loss": -5.480093955993652, "global_step": 31203, "epoch": 742} {"train_loss": -5.509552955627441, "global_step": 31204, "epoch": 742} {"train_loss": -5.481544029145014, "global_step": 31205, "epoch": 742, "val_loss": 74565.6640625} {"train_loss": -5.465644359588623, "global_step": 31206, "epoch": 743} {"train_loss": -5.451325416564941, "global_step": 31207, "epoch": 743} {"train_loss": -5.377140045166016, "global_step": 31208, "epoch": 743} {"train_loss": -5.5633978843688965, "global_step": 31209, "epoch": 743} {"train_loss": -5.5495991706848145, "global_step": 31210, "epoch": 743} {"train_loss": -5.413750648498535, "global_step": 31211, "epoch": 743} {"train_loss": -5.486004829406738, "global_step": 31212, "epoch": 743} {"train_loss": -5.552557468414307, "global_step": 31213, "epoch": 743} {"train_loss": -5.484865188598633, "global_step": 31214, "epoch": 743} {"train_loss": -5.472263336181641, "global_step": 31215, "epoch": 743} {"train_loss": -5.636960983276367, "global_step": 31216, "epoch": 743} {"train_loss": -5.45782470703125, "global_step": 31217, "epoch": 743} {"train_loss": -5.467220783233643, "global_step": 31218, "epoch": 743} {"train_loss": -5.4479217529296875, "global_step": 31219, "epoch": 743} {"train_loss": -5.398433685302734, "global_step": 31220, "epoch": 743} {"train_loss": -5.634130954742432, "global_step": 31221, "epoch": 743} {"train_loss": -5.337223052978516, "global_step": 31222, "epoch": 743} {"train_loss": -5.481273174285889, "global_step": 31223, "epoch": 743} {"train_loss": -5.466005325317383, "global_step": 31224, "epoch": 743} {"train_loss": -5.501385688781738, "global_step": 31225, "epoch": 743} {"train_loss": -5.337972640991211, "global_step": 31226, "epoch": 743} {"train_loss": -5.669743537902832, "global_step": 31227, "epoch": 743} {"train_loss": -5.430944442749023, "global_step": 31228, "epoch": 743} {"train_loss": -5.481734275817871, "global_step": 31229, "epoch": 743} {"train_loss": -5.501115798950195, "global_step": 31230, "epoch": 743} {"train_loss": -5.274521350860596, "global_step": 31231, "epoch": 743} {"train_loss": -5.579139232635498, "global_step": 31232, "epoch": 743} {"train_loss": -5.365602493286133, "global_step": 31233, "epoch": 743} {"train_loss": -5.436295986175537, "global_step": 31234, "epoch": 743} {"train_loss": -5.433182239532471, "global_step": 31235, "epoch": 743} {"train_loss": -5.314263343811035, "global_step": 31236, "epoch": 743} {"train_loss": -5.556865692138672, "global_step": 31237, "epoch": 743} {"train_loss": -5.489732265472412, "global_step": 31238, "epoch": 743} {"train_loss": -5.3668928146362305, "global_step": 31239, "epoch": 743} {"train_loss": -5.435356616973877, "global_step": 31240, "epoch": 743} {"train_loss": -5.446465492248535, "global_step": 31241, "epoch": 743} {"train_loss": -5.575222969055176, "global_step": 31242, "epoch": 743} {"train_loss": -5.513681411743164, "global_step": 31243, "epoch": 743} {"train_loss": -5.541497230529785, "global_step": 31244, "epoch": 743} {"train_loss": -5.4012861251831055, "global_step": 31245, "epoch": 743} {"train_loss": -5.439375877380371, "global_step": 31246, "epoch": 743} {"train_loss": -5.471441654931931, "global_step": 31247, "epoch": 743, "val_loss": 74742.578125} {"train_loss": -5.441605567932129, "global_step": 31248, "epoch": 744} {"train_loss": -5.523364543914795, "global_step": 31249, "epoch": 744} {"train_loss": -5.550934791564941, "global_step": 31250, "epoch": 744} {"train_loss": -5.542124271392822, "global_step": 31251, "epoch": 744} {"train_loss": -5.429060459136963, "global_step": 31252, "epoch": 744} {"train_loss": -5.5111083984375, "global_step": 31253, "epoch": 744} {"train_loss": -5.484395980834961, "global_step": 31254, "epoch": 744} {"train_loss": -5.621458053588867, "global_step": 31255, "epoch": 744} {"train_loss": -5.580489635467529, "global_step": 31256, "epoch": 744} {"train_loss": -5.47841739654541, "global_step": 31257, "epoch": 744} {"train_loss": -5.6459550857543945, "global_step": 31258, "epoch": 744} {"train_loss": -5.487229347229004, "global_step": 31259, "epoch": 744} {"train_loss": -5.343401908874512, "global_step": 31260, "epoch": 744} {"train_loss": -5.4692277908325195, "global_step": 31261, "epoch": 744} {"train_loss": -5.552552223205566, "global_step": 31262, "epoch": 744} {"train_loss": -5.396053314208984, "global_step": 31263, "epoch": 744} {"train_loss": -5.489694595336914, "global_step": 31264, "epoch": 744} {"train_loss": -5.41959285736084, "global_step": 31265, "epoch": 744} {"train_loss": -5.450909614562988, "global_step": 31266, "epoch": 744} {"train_loss": -5.5048065185546875, "global_step": 31267, "epoch": 744} {"train_loss": -5.45111083984375, "global_step": 31268, "epoch": 744} {"train_loss": -5.546182632446289, "global_step": 31269, "epoch": 744} {"train_loss": -5.458327770233154, "global_step": 31270, "epoch": 744} {"train_loss": -5.501653671264648, "global_step": 31271, "epoch": 744} {"train_loss": -5.483776092529297, "global_step": 31272, "epoch": 744} {"train_loss": -5.422659397125244, "global_step": 31273, "epoch": 744} {"train_loss": -5.477475166320801, "global_step": 31274, "epoch": 744} {"train_loss": -5.388410568237305, "global_step": 31275, "epoch": 744} {"train_loss": -5.377674102783203, "global_step": 31276, "epoch": 744} {"train_loss": -5.386527061462402, "global_step": 31277, "epoch": 744} {"train_loss": -5.432949066162109, "global_step": 31278, "epoch": 744} {"train_loss": -5.433572292327881, "global_step": 31279, "epoch": 744} {"train_loss": -5.307991981506348, "global_step": 31280, "epoch": 744} {"train_loss": -5.471047401428223, "global_step": 31281, "epoch": 744} {"train_loss": -5.565040111541748, "global_step": 31282, "epoch": 744} {"train_loss": -5.444135665893555, "global_step": 31283, "epoch": 744} {"train_loss": -5.463986873626709, "global_step": 31284, "epoch": 744} {"train_loss": -5.532280921936035, "global_step": 31285, "epoch": 744} {"train_loss": -5.465612888336182, "global_step": 31286, "epoch": 744} {"train_loss": -5.5494794845581055, "global_step": 31287, "epoch": 744} {"train_loss": -5.610292434692383, "global_step": 31288, "epoch": 744} {"train_loss": -5.482904706682477, "global_step": 31289, "epoch": 744, "val_loss": 74877.421875} {"train_loss": -5.566572189331055, "global_step": 31290, "epoch": 745} {"train_loss": -5.549605369567871, "global_step": 31291, "epoch": 745} {"train_loss": -5.5805559158325195, "global_step": 31292, "epoch": 745} {"train_loss": -5.482361316680908, "global_step": 31293, "epoch": 745} {"train_loss": -5.628705978393555, "global_step": 31294, "epoch": 745} {"train_loss": -5.521873474121094, "global_step": 31295, "epoch": 745} {"train_loss": -5.445837497711182, "global_step": 31296, "epoch": 745} {"train_loss": -5.513008117675781, "global_step": 31297, "epoch": 745} {"train_loss": -5.511112213134766, "global_step": 31298, "epoch": 745} {"train_loss": -5.392300605773926, "global_step": 31299, "epoch": 745} {"train_loss": -5.449624061584473, "global_step": 31300, "epoch": 745} {"train_loss": -5.517671585083008, "global_step": 31301, "epoch": 745} {"train_loss": -5.363283634185791, "global_step": 31302, "epoch": 745} {"train_loss": -5.52450704574585, "global_step": 31303, "epoch": 745} {"train_loss": -5.673676490783691, "global_step": 31304, "epoch": 745} {"train_loss": -5.502546310424805, "global_step": 31305, "epoch": 745} {"train_loss": -5.570652961730957, "global_step": 31306, "epoch": 745} {"train_loss": -5.518319129943848, "global_step": 31307, "epoch": 745} {"train_loss": -5.5114922523498535, "global_step": 31308, "epoch": 745} {"train_loss": -5.563501834869385, "global_step": 31309, "epoch": 745} {"train_loss": -5.387280464172363, "global_step": 31310, "epoch": 745} {"train_loss": -5.3706889152526855, "global_step": 31311, "epoch": 745} {"train_loss": -5.518945693969727, "global_step": 31312, "epoch": 745} {"train_loss": -5.5256242752075195, "global_step": 31313, "epoch": 745} {"train_loss": -5.569639205932617, "global_step": 31314, "epoch": 745} {"train_loss": -5.508481502532959, "global_step": 31315, "epoch": 745} {"train_loss": -5.524211883544922, "global_step": 31316, "epoch": 745} {"train_loss": -5.483560562133789, "global_step": 31317, "epoch": 745} {"train_loss": -5.44339656829834, "global_step": 31318, "epoch": 745} {"train_loss": -5.511820316314697, "global_step": 31319, "epoch": 745} {"train_loss": -5.540307998657227, "global_step": 31320, "epoch": 745} {"train_loss": -5.617079734802246, "global_step": 31321, "epoch": 745} {"train_loss": -5.331761360168457, "global_step": 31322, "epoch": 745} {"train_loss": -5.44937801361084, "global_step": 31323, "epoch": 745} {"train_loss": -5.45924186706543, "global_step": 31324, "epoch": 745} {"train_loss": -5.326582908630371, "global_step": 31325, "epoch": 745} {"train_loss": -5.592886924743652, "global_step": 31326, "epoch": 745} {"train_loss": -5.390263557434082, "global_step": 31327, "epoch": 745} {"train_loss": -5.4833831787109375, "global_step": 31328, "epoch": 745} {"train_loss": -5.477590560913086, "global_step": 31329, "epoch": 745} {"train_loss": -5.4992218017578125, "global_step": 31330, "epoch": 745} {"train_loss": -5.499216443016415, "global_step": 31331, "epoch": 745, "val_loss": 74380.6953125} {"train_loss": -5.60133171081543, "global_step": 31332, "epoch": 746} {"train_loss": -5.511086940765381, "global_step": 31333, "epoch": 746} {"train_loss": -5.469927787780762, "global_step": 31334, "epoch": 746} {"train_loss": -5.454937934875488, "global_step": 31335, "epoch": 746} {"train_loss": -5.5676727294921875, "global_step": 31336, "epoch": 746} {"train_loss": -5.580480575561523, "global_step": 31337, "epoch": 746} {"train_loss": -5.364127159118652, "global_step": 31338, "epoch": 746} {"train_loss": -5.448588848114014, "global_step": 31339, "epoch": 746} {"train_loss": -5.438044548034668, "global_step": 31340, "epoch": 746} {"train_loss": -5.436091899871826, "global_step": 31341, "epoch": 746} {"train_loss": -5.652403831481934, "global_step": 31342, "epoch": 746} {"train_loss": -5.46595573425293, "global_step": 31343, "epoch": 746} {"train_loss": -5.495351314544678, "global_step": 31344, "epoch": 746} {"train_loss": -5.410887718200684, "global_step": 31345, "epoch": 746} {"train_loss": -5.41148567199707, "global_step": 31346, "epoch": 746} {"train_loss": -5.480987548828125, "global_step": 31347, "epoch": 746} {"train_loss": -5.402256965637207, "global_step": 31348, "epoch": 746} {"train_loss": -5.252159118652344, "global_step": 31349, "epoch": 746} {"train_loss": -5.484926223754883, "global_step": 31350, "epoch": 746} {"train_loss": -5.422082901000977, "global_step": 31351, "epoch": 746} {"train_loss": -5.331899642944336, "global_step": 31352, "epoch": 746} {"train_loss": -5.3467020988464355, "global_step": 31353, "epoch": 746} {"train_loss": -5.425480842590332, "global_step": 31354, "epoch": 746} {"train_loss": -5.437481880187988, "global_step": 31355, "epoch": 746} {"train_loss": -5.4256391525268555, "global_step": 31356, "epoch": 746} {"train_loss": -5.4009199142456055, "global_step": 31357, "epoch": 746} {"train_loss": -5.319999694824219, "global_step": 31358, "epoch": 746} {"train_loss": -5.43189001083374, "global_step": 31359, "epoch": 746} {"train_loss": -5.441062927246094, "global_step": 31360, "epoch": 746} {"train_loss": -5.447138786315918, "global_step": 31361, "epoch": 746} {"train_loss": -5.465719699859619, "global_step": 31362, "epoch": 746} {"train_loss": -5.458520412445068, "global_step": 31363, "epoch": 746} {"train_loss": -5.525975227355957, "global_step": 31364, "epoch": 746} {"train_loss": -5.468808174133301, "global_step": 31365, "epoch": 746} {"train_loss": -5.586348533630371, "global_step": 31366, "epoch": 746} {"train_loss": -5.479679584503174, "global_step": 31367, "epoch": 746} {"train_loss": -5.518901824951172, "global_step": 31368, "epoch": 746} {"train_loss": -5.285843849182129, "global_step": 31369, "epoch": 746} {"train_loss": -5.564095497131348, "global_step": 31370, "epoch": 746} {"train_loss": -5.430517673492432, "global_step": 31371, "epoch": 746} {"train_loss": -5.541524410247803, "global_step": 31372, "epoch": 746} {"train_loss": -5.454449403853643, "global_step": 31373, "epoch": 746, "val_loss": 74341.3203125} {"train_loss": -5.551117897033691, "global_step": 31374, "epoch": 747} {"train_loss": -5.4649834632873535, "global_step": 31375, "epoch": 747} {"train_loss": -5.4517107009887695, "global_step": 31376, "epoch": 747} {"train_loss": -5.464967727661133, "global_step": 31377, "epoch": 747} {"train_loss": -5.578591346740723, "global_step": 31378, "epoch": 747} {"train_loss": -5.49091100692749, "global_step": 31379, "epoch": 747} {"train_loss": -5.536542892456055, "global_step": 31380, "epoch": 747} {"train_loss": -5.511898517608643, "global_step": 31381, "epoch": 747} {"train_loss": -5.487205505371094, "global_step": 31382, "epoch": 747} {"train_loss": -5.50102424621582, "global_step": 31383, "epoch": 747} {"train_loss": -5.3608622550964355, "global_step": 31384, "epoch": 747} {"train_loss": -5.433902740478516, "global_step": 31385, "epoch": 747} {"train_loss": -5.560615539550781, "global_step": 31386, "epoch": 747} {"train_loss": -5.259873390197754, "global_step": 31387, "epoch": 747} {"train_loss": -5.451706886291504, "global_step": 31388, "epoch": 747} {"train_loss": -5.448448181152344, "global_step": 31389, "epoch": 747} {"train_loss": -5.518255710601807, "global_step": 31390, "epoch": 747} {"train_loss": -5.357058525085449, "global_step": 31391, "epoch": 747} {"train_loss": -5.575066566467285, "global_step": 31392, "epoch": 747} {"train_loss": -5.4828338623046875, "global_step": 31393, "epoch": 747} {"train_loss": -5.532766342163086, "global_step": 31394, "epoch": 747} {"train_loss": -5.572450637817383, "global_step": 31395, "epoch": 747} {"train_loss": -5.547741889953613, "global_step": 31396, "epoch": 747} {"train_loss": -5.513147354125977, "global_step": 31397, "epoch": 747} {"train_loss": -5.5616631507873535, "global_step": 31398, "epoch": 747} {"train_loss": -5.521639823913574, "global_step": 31399, "epoch": 747} {"train_loss": -5.447347164154053, "global_step": 31400, "epoch": 747} {"train_loss": -5.549304008483887, "global_step": 31401, "epoch": 747} {"train_loss": -5.487285614013672, "global_step": 31402, "epoch": 747} {"train_loss": -5.351153373718262, "global_step": 31403, "epoch": 747} {"train_loss": -5.492770195007324, "global_step": 31404, "epoch": 747} {"train_loss": -5.5889153480529785, "global_step": 31405, "epoch": 747} {"train_loss": -5.535117149353027, "global_step": 31406, "epoch": 747} {"train_loss": -5.464912414550781, "global_step": 31407, "epoch": 747} {"train_loss": -5.471127510070801, "global_step": 31408, "epoch": 747} {"train_loss": -5.5947065353393555, "global_step": 31409, "epoch": 747} {"train_loss": -5.539609432220459, "global_step": 31410, "epoch": 747} {"train_loss": -5.521964073181152, "global_step": 31411, "epoch": 747} {"train_loss": -5.514613151550293, "global_step": 31412, "epoch": 747} {"train_loss": -5.458436012268066, "global_step": 31413, "epoch": 747} {"train_loss": -5.4735870361328125, "global_step": 31414, "epoch": 747} {"train_loss": -5.490583624158587, "global_step": 31415, "epoch": 747, "val_loss": 74758.4921875} {"train_loss": -5.516727447509766, "global_step": 31416, "epoch": 748} {"train_loss": -5.516165256500244, "global_step": 31417, "epoch": 748} {"train_loss": -5.413814067840576, "global_step": 31418, "epoch": 748} {"train_loss": -5.408249378204346, "global_step": 31419, "epoch": 748} {"train_loss": -5.504079818725586, "global_step": 31420, "epoch": 748} {"train_loss": -5.454930305480957, "global_step": 31421, "epoch": 748} {"train_loss": -5.543792724609375, "global_step": 31422, "epoch": 748} {"train_loss": -5.5470871925354, "global_step": 31423, "epoch": 748} {"train_loss": -5.420035362243652, "global_step": 31424, "epoch": 748} {"train_loss": -5.554703712463379, "global_step": 31425, "epoch": 748} {"train_loss": -5.5288004875183105, "global_step": 31426, "epoch": 748} {"train_loss": -5.442255020141602, "global_step": 31427, "epoch": 748} {"train_loss": -5.6079511642456055, "global_step": 31428, "epoch": 748} {"train_loss": -5.523482799530029, "global_step": 31429, "epoch": 748} {"train_loss": -5.427087783813477, "global_step": 31430, "epoch": 748} {"train_loss": -5.5662312507629395, "global_step": 31431, "epoch": 748} {"train_loss": -5.3804216384887695, "global_step": 31432, "epoch": 748} {"train_loss": -5.423519611358643, "global_step": 31433, "epoch": 748} {"train_loss": -5.575841903686523, "global_step": 31434, "epoch": 748} {"train_loss": -5.450041770935059, "global_step": 31435, "epoch": 748} {"train_loss": -5.487173080444336, "global_step": 31436, "epoch": 748} {"train_loss": -5.468863487243652, "global_step": 31437, "epoch": 748} {"train_loss": -5.502954483032227, "global_step": 31438, "epoch": 748} {"train_loss": -5.47974967956543, "global_step": 31439, "epoch": 748} {"train_loss": -5.478445529937744, "global_step": 31440, "epoch": 748} {"train_loss": -5.437613010406494, "global_step": 31441, "epoch": 748} {"train_loss": -5.566743850708008, "global_step": 31442, "epoch": 748} {"train_loss": -5.489012241363525, "global_step": 31443, "epoch": 748} {"train_loss": -5.506387710571289, "global_step": 31444, "epoch": 748} {"train_loss": -5.633761882781982, "global_step": 31445, "epoch": 748} {"train_loss": -5.371517181396484, "global_step": 31446, "epoch": 748} {"train_loss": -5.532717704772949, "global_step": 31447, "epoch": 748} {"train_loss": -5.383110523223877, "global_step": 31448, "epoch": 748} {"train_loss": -5.579923629760742, "global_step": 31449, "epoch": 748} {"train_loss": -5.466998100280762, "global_step": 31450, "epoch": 748} {"train_loss": -5.540759086608887, "global_step": 31451, "epoch": 748} {"train_loss": -5.521125316619873, "global_step": 31452, "epoch": 748} {"train_loss": -5.453116416931152, "global_step": 31453, "epoch": 748} {"train_loss": -5.534599304199219, "global_step": 31454, "epoch": 748} {"train_loss": -5.65153169631958, "global_step": 31455, "epoch": 748} {"train_loss": -5.493949890136719, "global_step": 31456, "epoch": 748} {"train_loss": -5.498474904469082, "global_step": 31457, "epoch": 748, "val_loss": 74169.5546875} {"train_loss": -5.469038009643555, "global_step": 31458, "epoch": 749} {"train_loss": -5.524441719055176, "global_step": 31459, "epoch": 749} {"train_loss": -5.471060752868652, "global_step": 31460, "epoch": 749} {"train_loss": -5.536238193511963, "global_step": 31461, "epoch": 749} {"train_loss": -5.371205806732178, "global_step": 31462, "epoch": 749} {"train_loss": -5.577626705169678, "global_step": 31463, "epoch": 749} {"train_loss": -5.555863380432129, "global_step": 31464, "epoch": 749} {"train_loss": -5.562348365783691, "global_step": 31465, "epoch": 749} {"train_loss": -5.414644718170166, "global_step": 31466, "epoch": 749} {"train_loss": -5.572322845458984, "global_step": 31467, "epoch": 749} {"train_loss": -5.575560569763184, "global_step": 31468, "epoch": 749} {"train_loss": -5.407962322235107, "global_step": 31469, "epoch": 749} {"train_loss": -5.716034889221191, "global_step": 31470, "epoch": 749} {"train_loss": -5.45380973815918, "global_step": 31471, "epoch": 749} {"train_loss": -5.470280647277832, "global_step": 31472, "epoch": 749} {"train_loss": -5.588145732879639, "global_step": 31473, "epoch": 749} {"train_loss": -5.474292755126953, "global_step": 31474, "epoch": 749} {"train_loss": -5.512337684631348, "global_step": 31475, "epoch": 749} {"train_loss": -5.460034370422363, "global_step": 31476, "epoch": 749} {"train_loss": -5.470141410827637, "global_step": 31477, "epoch": 749} {"train_loss": -5.439240455627441, "global_step": 31478, "epoch": 749} {"train_loss": -5.53424596786499, "global_step": 31479, "epoch": 749} {"train_loss": -5.527362823486328, "global_step": 31480, "epoch": 749} {"train_loss": -5.461249351501465, "global_step": 31481, "epoch": 749} {"train_loss": -5.470575332641602, "global_step": 31482, "epoch": 749} {"train_loss": -5.424561500549316, "global_step": 31483, "epoch": 749} {"train_loss": -5.523900508880615, "global_step": 31484, "epoch": 749} {"train_loss": -5.5297136306762695, "global_step": 31485, "epoch": 749} {"train_loss": -5.381712913513184, "global_step": 31486, "epoch": 749} {"train_loss": -5.469633102416992, "global_step": 31487, "epoch": 749} {"train_loss": -5.5518999099731445, "global_step": 31488, "epoch": 749} {"train_loss": -5.558696269989014, "global_step": 31489, "epoch": 749} {"train_loss": -5.5825042724609375, "global_step": 31490, "epoch": 749} {"train_loss": -5.587054252624512, "global_step": 31491, "epoch": 749} {"train_loss": -5.617164611816406, "global_step": 31492, "epoch": 749} {"train_loss": -5.489400863647461, "global_step": 31493, "epoch": 749} {"train_loss": -5.480246067047119, "global_step": 31494, "epoch": 749} {"train_loss": -5.547238349914551, "global_step": 31495, "epoch": 749} {"train_loss": -5.475643634796143, "global_step": 31496, "epoch": 749} {"train_loss": -5.536764144897461, "global_step": 31497, "epoch": 749} {"train_loss": -5.568140029907227, "global_step": 31498, "epoch": 749} {"train_loss": -5.507552862167358, "global_step": 31499, "epoch": 749, "val_loss": 74001.890625} {"train_loss": -5.385312557220459, "global_step": 31500, "epoch": 750} {"train_loss": -5.501837253570557, "global_step": 31501, "epoch": 750} {"train_loss": -5.390936851501465, "global_step": 31502, "epoch": 750} {"train_loss": -5.490897178649902, "global_step": 31503, "epoch": 750} {"train_loss": -5.530359268188477, "global_step": 31504, "epoch": 750} {"train_loss": -5.344670295715332, "global_step": 31505, "epoch": 750} {"train_loss": -5.540257453918457, "global_step": 31506, "epoch": 750} {"train_loss": -5.429440975189209, "global_step": 31507, "epoch": 750} {"train_loss": -5.441860198974609, "global_step": 31508, "epoch": 750} {"train_loss": -5.623971939086914, "global_step": 31509, "epoch": 750} {"train_loss": -5.295297145843506, "global_step": 31510, "epoch": 750} {"train_loss": -5.437549591064453, "global_step": 31511, "epoch": 750} {"train_loss": -5.375228404998779, "global_step": 31512, "epoch": 750} {"train_loss": -5.380077838897705, "global_step": 31513, "epoch": 750} {"train_loss": -5.440272808074951, "global_step": 31514, "epoch": 750} {"train_loss": -5.479013442993164, "global_step": 31515, "epoch": 750} {"train_loss": -5.460206031799316, "global_step": 31516, "epoch": 750} {"train_loss": -5.458976745605469, "global_step": 31517, "epoch": 750} {"train_loss": -5.286201477050781, "global_step": 31518, "epoch": 750} {"train_loss": -5.436741828918457, "global_step": 31519, "epoch": 750} {"train_loss": -5.346449375152588, "global_step": 31520, "epoch": 750} {"train_loss": -5.502481460571289, "global_step": 31521, "epoch": 750} {"train_loss": -5.308415412902832, "global_step": 31522, "epoch": 750} {"train_loss": -5.527691841125488, "global_step": 31523, "epoch": 750} {"train_loss": -5.413737773895264, "global_step": 31524, "epoch": 750} {"train_loss": -5.600290298461914, "global_step": 31525, "epoch": 750} {"train_loss": -5.636940002441406, "global_step": 31526, "epoch": 750} {"train_loss": -5.509528160095215, "global_step": 31527, "epoch": 750} {"train_loss": -5.482474327087402, "global_step": 31528, "epoch": 750} {"train_loss": -5.4791107177734375, "global_step": 31529, "epoch": 750} {"train_loss": -5.402165412902832, "global_step": 31530, "epoch": 750} {"train_loss": -5.511431694030762, "global_step": 31531, "epoch": 750} {"train_loss": -5.491881847381592, "global_step": 31532, "epoch": 750} {"train_loss": -5.579744815826416, "global_step": 31533, "epoch": 750} {"train_loss": -5.589702606201172, "global_step": 31534, "epoch": 750} {"train_loss": -5.54908561706543, "global_step": 31535, "epoch": 750} {"train_loss": -5.570947170257568, "global_step": 31536, "epoch": 750} {"train_loss": -5.5600996017456055, "global_step": 31537, "epoch": 750} {"train_loss": -5.646965503692627, "global_step": 31538, "epoch": 750} {"train_loss": -5.57824182510376, "global_step": 31539, "epoch": 750} {"train_loss": -5.4439826011657715, "global_step": 31540, "epoch": 750} {"train_loss": -5.475460427148001, "global_step": 31541, "epoch": 750, "train/sim_max_reward_0": 0.21498038175713416, "train/sim_max_reward_1": 0.16978617619412015, "train/sim_max_reward_2": 0.41740687988026826, "train/sim_max_reward_3": 0.7462379068113686, "train/sim_max_reward_4": 0.6729801557606667, "train/sim_max_reward_5": 0.5735579452917803, "test/sim_max_reward_4500000": 0.7607222921621856, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.845501522287435, "test/sim_max_reward_4500003": 0.4971307178575256, "test/sim_max_reward_4500004": 0.06339124341367763, "test/sim_max_reward_4500005": 0.3289135162812103, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.6138791080660979, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9162791795816095, "test/sim_max_reward_4500012": 0.5800210172777336, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.8406825465407648, "test/sim_max_reward_4500015": 5.078024326943645e-05, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.14569583103710076, "test/sim_max_reward_4500019": 0.9517578732271549, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.606951243945603, "test/sim_max_reward_4500022": 0.5266948116087713, "test/sim_max_reward_4500023": 0.8963129353251726, "test/sim_max_reward_4500024": 0.24552468111680295, "test/sim_max_reward_4500025": 0.6877434022107245, "test/sim_max_reward_4500026": 0.3115229712052241, "test/sim_max_reward_4500027": 0.9121541501620004, "test/sim_max_reward_4500028": 0.4435994779301863, "test/sim_max_reward_4500029": 0.13553878481256504, "test/sim_max_reward_4500030": 0.34337874857970996, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.42306911533319147, "test/sim_max_reward_4500033": 0.11143629734871845, "test/sim_max_reward_4500034": 0.816213710460975, "test/sim_max_reward_4500035": 0.517679848668287, "test/sim_max_reward_4500036": 0.4655702054207411, "test/sim_max_reward_4500037": 0.0, "test/sim_max_reward_4500038": 0.8932878139024082, "test/sim_max_reward_4500039": 0.2656946637362819, "test/sim_max_reward_4500040": 0.25245647141338645, "test/sim_max_reward_4500041": 0.8096511860707191, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.783044217588566, "test/sim_max_reward_4500044": 0.5649855581571708, "test/sim_max_reward_4500045": 0.1820661443986155, "test/sim_max_reward_4500046": 0.6709861782631257, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.09142488353047859, "train/mean_score": 0.46582490761588974, "test/mean_score": 0.3703711457445955, "val_loss": 74539.0625} {"train_loss": -5.560914516448975, "global_step": 31542, "epoch": 751} {"train_loss": -5.573602676391602, "global_step": 31543, "epoch": 751} {"train_loss": -5.469837665557861, "global_step": 31544, "epoch": 751} {"train_loss": -5.444194316864014, "global_step": 31545, "epoch": 751} {"train_loss": -5.471706390380859, "global_step": 31546, "epoch": 751} {"train_loss": -5.343924522399902, "global_step": 31547, "epoch": 751} {"train_loss": -5.469952583312988, "global_step": 31548, "epoch": 751} {"train_loss": -5.488777160644531, "global_step": 31549, "epoch": 751} {"train_loss": -5.451547622680664, "global_step": 31550, "epoch": 751} {"train_loss": -5.4147138595581055, "global_step": 31551, "epoch": 751} {"train_loss": -5.544733047485352, "global_step": 31552, "epoch": 751} {"train_loss": -5.384871482849121, "global_step": 31553, "epoch": 751} {"train_loss": -5.39542818069458, "global_step": 31554, "epoch": 751} {"train_loss": -5.2200927734375, "global_step": 31555, "epoch": 751} {"train_loss": -5.441617012023926, "global_step": 31556, "epoch": 751} {"train_loss": -5.472350597381592, "global_step": 31557, "epoch": 751} {"train_loss": -5.508708953857422, "global_step": 31558, "epoch": 751} {"train_loss": -5.460902214050293, "global_step": 31559, "epoch": 751} {"train_loss": -5.449162483215332, "global_step": 31560, "epoch": 751} {"train_loss": -5.552504062652588, "global_step": 31561, "epoch": 751} {"train_loss": -5.457492828369141, "global_step": 31562, "epoch": 751} {"train_loss": -5.5095319747924805, "global_step": 31563, "epoch": 751} {"train_loss": -5.513091087341309, "global_step": 31564, "epoch": 751} {"train_loss": -5.406905174255371, "global_step": 31565, "epoch": 751} {"train_loss": -5.448616027832031, "global_step": 31566, "epoch": 751} {"train_loss": -5.4520111083984375, "global_step": 31567, "epoch": 751} {"train_loss": -5.491438865661621, "global_step": 31568, "epoch": 751} {"train_loss": -5.464583396911621, "global_step": 31569, "epoch": 751} {"train_loss": -5.512628555297852, "global_step": 31570, "epoch": 751} {"train_loss": -5.577657699584961, "global_step": 31571, "epoch": 751} {"train_loss": -5.4298553466796875, "global_step": 31572, "epoch": 751} {"train_loss": -5.545544624328613, "global_step": 31573, "epoch": 751} {"train_loss": -5.401851654052734, "global_step": 31574, "epoch": 751} {"train_loss": -5.406123161315918, "global_step": 31575, "epoch": 751} {"train_loss": -5.561801910400391, "global_step": 31576, "epoch": 751} {"train_loss": -5.463582992553711, "global_step": 31577, "epoch": 751} {"train_loss": -5.450132369995117, "global_step": 31578, "epoch": 751} {"train_loss": -5.535891056060791, "global_step": 31579, "epoch": 751} {"train_loss": -5.4882097244262695, "global_step": 31580, "epoch": 751} {"train_loss": -5.472634315490723, "global_step": 31581, "epoch": 751} {"train_loss": -5.605206489562988, "global_step": 31582, "epoch": 751} {"train_loss": -5.471698238736107, "global_step": 31583, "epoch": 751, "val_loss": 74800.1640625} {"train_loss": -5.519925117492676, "global_step": 31584, "epoch": 752} {"train_loss": -5.502442836761475, "global_step": 31585, "epoch": 752} {"train_loss": -5.47785758972168, "global_step": 31586, "epoch": 752} {"train_loss": -5.456949234008789, "global_step": 31587, "epoch": 752} {"train_loss": -5.511301040649414, "global_step": 31588, "epoch": 752} {"train_loss": -5.490836143493652, "global_step": 31589, "epoch": 752} {"train_loss": -5.594226837158203, "global_step": 31590, "epoch": 752} {"train_loss": -5.424267768859863, "global_step": 31591, "epoch": 752} {"train_loss": -5.454929351806641, "global_step": 31592, "epoch": 752} {"train_loss": -5.422256946563721, "global_step": 31593, "epoch": 752} {"train_loss": -5.550581932067871, "global_step": 31594, "epoch": 752} {"train_loss": -5.455690383911133, "global_step": 31595, "epoch": 752} {"train_loss": -5.516114711761475, "global_step": 31596, "epoch": 752} {"train_loss": -5.457566261291504, "global_step": 31597, "epoch": 752} {"train_loss": -5.448543071746826, "global_step": 31598, "epoch": 752} {"train_loss": -5.584290504455566, "global_step": 31599, "epoch": 752} {"train_loss": -5.3998823165893555, "global_step": 31600, "epoch": 752} {"train_loss": -5.620362281799316, "global_step": 31601, "epoch": 752} {"train_loss": -5.609959602355957, "global_step": 31602, "epoch": 752} {"train_loss": -5.505650043487549, "global_step": 31603, "epoch": 752} {"train_loss": -5.5424909591674805, "global_step": 31604, "epoch": 752} {"train_loss": -5.50136661529541, "global_step": 31605, "epoch": 752} {"train_loss": -5.337950706481934, "global_step": 31606, "epoch": 752} {"train_loss": -5.483572006225586, "global_step": 31607, "epoch": 752} {"train_loss": -5.5800371170043945, "global_step": 31608, "epoch": 752} {"train_loss": -5.461299896240234, "global_step": 31609, "epoch": 752} {"train_loss": -5.508885383605957, "global_step": 31610, "epoch": 752} {"train_loss": -5.559492588043213, "global_step": 31611, "epoch": 752} {"train_loss": -5.443614482879639, "global_step": 31612, "epoch": 752} {"train_loss": -5.489067077636719, "global_step": 31613, "epoch": 752} {"train_loss": -5.436003684997559, "global_step": 31614, "epoch": 752} {"train_loss": -5.449721813201904, "global_step": 31615, "epoch": 752} {"train_loss": -5.56751823425293, "global_step": 31616, "epoch": 752} {"train_loss": -5.451479911804199, "global_step": 31617, "epoch": 752} {"train_loss": -5.606405258178711, "global_step": 31618, "epoch": 752} {"train_loss": -5.5234055519104, "global_step": 31619, "epoch": 752} {"train_loss": -5.443682670593262, "global_step": 31620, "epoch": 752} {"train_loss": -5.492316246032715, "global_step": 31621, "epoch": 752} {"train_loss": -5.517202377319336, "global_step": 31622, "epoch": 752} {"train_loss": -5.380634307861328, "global_step": 31623, "epoch": 752} {"train_loss": -5.415148735046387, "global_step": 31624, "epoch": 752} {"train_loss": -5.491426433835711, "global_step": 31625, "epoch": 752, "val_loss": 74407.1328125} {"train_loss": -5.394979476928711, "global_step": 31626, "epoch": 753} {"train_loss": -5.573331832885742, "global_step": 31627, "epoch": 753} {"train_loss": -5.492318153381348, "global_step": 31628, "epoch": 753} {"train_loss": -5.485634803771973, "global_step": 31629, "epoch": 753} {"train_loss": -5.49541711807251, "global_step": 31630, "epoch": 753} {"train_loss": -5.520031929016113, "global_step": 31631, "epoch": 753} {"train_loss": -5.476320266723633, "global_step": 31632, "epoch": 753} {"train_loss": -5.562995433807373, "global_step": 31633, "epoch": 753} {"train_loss": -5.5087690353393555, "global_step": 31634, "epoch": 753} {"train_loss": -5.568724632263184, "global_step": 31635, "epoch": 753} {"train_loss": -5.589941501617432, "global_step": 31636, "epoch": 753} {"train_loss": -5.518982410430908, "global_step": 31637, "epoch": 753} {"train_loss": -5.43503475189209, "global_step": 31638, "epoch": 753} {"train_loss": -5.678555488586426, "global_step": 31639, "epoch": 753} {"train_loss": -5.484847068786621, "global_step": 31640, "epoch": 753} {"train_loss": -5.419992446899414, "global_step": 31641, "epoch": 753} {"train_loss": -5.347894668579102, "global_step": 31642, "epoch": 753} {"train_loss": -5.481387615203857, "global_step": 31643, "epoch": 753} {"train_loss": -5.402663707733154, "global_step": 31644, "epoch": 753} {"train_loss": -5.420405387878418, "global_step": 31645, "epoch": 753} {"train_loss": -5.466703414916992, "global_step": 31646, "epoch": 753} {"train_loss": -5.47929573059082, "global_step": 31647, "epoch": 753} {"train_loss": -5.274762153625488, "global_step": 31648, "epoch": 753} {"train_loss": -5.48183536529541, "global_step": 31649, "epoch": 753} {"train_loss": -5.4027910232543945, "global_step": 31650, "epoch": 753} {"train_loss": -5.373584747314453, "global_step": 31651, "epoch": 753} {"train_loss": -5.434704303741455, "global_step": 31652, "epoch": 753} {"train_loss": -5.367295265197754, "global_step": 31653, "epoch": 753} {"train_loss": -5.408539295196533, "global_step": 31654, "epoch": 753} {"train_loss": -5.501280784606934, "global_step": 31655, "epoch": 753} {"train_loss": -5.564417839050293, "global_step": 31656, "epoch": 753} {"train_loss": -5.383835315704346, "global_step": 31657, "epoch": 753} {"train_loss": -5.5109710693359375, "global_step": 31658, "epoch": 753} {"train_loss": -5.448822975158691, "global_step": 31659, "epoch": 753} {"train_loss": -5.59771728515625, "global_step": 31660, "epoch": 753} {"train_loss": -5.598226547241211, "global_step": 31661, "epoch": 753} {"train_loss": -5.46215295791626, "global_step": 31662, "epoch": 753} {"train_loss": -5.496438026428223, "global_step": 31663, "epoch": 753} {"train_loss": -5.514928817749023, "global_step": 31664, "epoch": 753} {"train_loss": -5.508905410766602, "global_step": 31665, "epoch": 753} {"train_loss": -5.595334053039551, "global_step": 31666, "epoch": 753} {"train_loss": -5.481918686912174, "global_step": 31667, "epoch": 753, "val_loss": 74502.3046875} {"train_loss": -5.415164947509766, "global_step": 31668, "epoch": 754} {"train_loss": -5.578490734100342, "global_step": 31669, "epoch": 754} {"train_loss": -5.444643974304199, "global_step": 31670, "epoch": 754} {"train_loss": -5.3718438148498535, "global_step": 31671, "epoch": 754} {"train_loss": -5.595676422119141, "global_step": 31672, "epoch": 754} {"train_loss": -5.543678283691406, "global_step": 31673, "epoch": 754} {"train_loss": -5.484766006469727, "global_step": 31674, "epoch": 754} {"train_loss": -5.541715145111084, "global_step": 31675, "epoch": 754} {"train_loss": -5.478768348693848, "global_step": 31676, "epoch": 754} {"train_loss": -5.585882186889648, "global_step": 31677, "epoch": 754} {"train_loss": -5.514116287231445, "global_step": 31678, "epoch": 754} {"train_loss": -5.460635185241699, "global_step": 31679, "epoch": 754} {"train_loss": -5.467850208282471, "global_step": 31680, "epoch": 754} {"train_loss": -5.514366149902344, "global_step": 31681, "epoch": 754} {"train_loss": -5.4459028244018555, "global_step": 31682, "epoch": 754} {"train_loss": -5.512994766235352, "global_step": 31683, "epoch": 754} {"train_loss": -5.434371471405029, "global_step": 31684, "epoch": 754} {"train_loss": -5.510397911071777, "global_step": 31685, "epoch": 754} {"train_loss": -5.552793025970459, "global_step": 31686, "epoch": 754} {"train_loss": -5.590513229370117, "global_step": 31687, "epoch": 754} {"train_loss": -5.551392555236816, "global_step": 31688, "epoch": 754} {"train_loss": -5.49431037902832, "global_step": 31689, "epoch": 754} {"train_loss": -5.561465263366699, "global_step": 31690, "epoch": 754} {"train_loss": -5.605966091156006, "global_step": 31691, "epoch": 754} {"train_loss": -5.507195472717285, "global_step": 31692, "epoch": 754} {"train_loss": -5.4944257736206055, "global_step": 31693, "epoch": 754} {"train_loss": -5.451052188873291, "global_step": 31694, "epoch": 754} {"train_loss": -5.497717380523682, "global_step": 31695, "epoch": 754} {"train_loss": -5.464316368103027, "global_step": 31696, "epoch": 754} {"train_loss": -5.556071758270264, "global_step": 31697, "epoch": 754} {"train_loss": -5.530529022216797, "global_step": 31698, "epoch": 754} {"train_loss": -5.58188009262085, "global_step": 31699, "epoch": 754} {"train_loss": -5.482246398925781, "global_step": 31700, "epoch": 754} {"train_loss": -5.512329578399658, "global_step": 31701, "epoch": 754} {"train_loss": -5.523149490356445, "global_step": 31702, "epoch": 754} {"train_loss": -5.574434280395508, "global_step": 31703, "epoch": 754} {"train_loss": -5.372729301452637, "global_step": 31704, "epoch": 754} {"train_loss": -5.642539024353027, "global_step": 31705, "epoch": 754} {"train_loss": -5.403428077697754, "global_step": 31706, "epoch": 754} {"train_loss": -5.452576637268066, "global_step": 31707, "epoch": 754} {"train_loss": -5.441450119018555, "global_step": 31708, "epoch": 754} {"train_loss": -5.507032224110195, "global_step": 31709, "epoch": 754, "val_loss": 74509.4921875} {"train_loss": -5.474612236022949, "global_step": 31710, "epoch": 755} {"train_loss": -5.494466781616211, "global_step": 31711, "epoch": 755} {"train_loss": -5.432930946350098, "global_step": 31712, "epoch": 755} {"train_loss": -5.55702018737793, "global_step": 31713, "epoch": 755} {"train_loss": -5.53257942199707, "global_step": 31714, "epoch": 755} {"train_loss": -5.514890670776367, "global_step": 31715, "epoch": 755} {"train_loss": -5.52511739730835, "global_step": 31716, "epoch": 755} {"train_loss": -5.515528678894043, "global_step": 31717, "epoch": 755} {"train_loss": -5.457175254821777, "global_step": 31718, "epoch": 755} {"train_loss": -5.500286102294922, "global_step": 31719, "epoch": 755} {"train_loss": -5.370370388031006, "global_step": 31720, "epoch": 755} {"train_loss": -5.624945163726807, "global_step": 31721, "epoch": 755} {"train_loss": -5.386845588684082, "global_step": 31722, "epoch": 755} {"train_loss": -5.567981243133545, "global_step": 31723, "epoch": 755} {"train_loss": -5.493858337402344, "global_step": 31724, "epoch": 755} {"train_loss": -5.294888019561768, "global_step": 31725, "epoch": 755} {"train_loss": -5.539613723754883, "global_step": 31726, "epoch": 755} {"train_loss": -5.525555610656738, "global_step": 31727, "epoch": 755} {"train_loss": -5.486139297485352, "global_step": 31728, "epoch": 755} {"train_loss": -5.390429973602295, "global_step": 31729, "epoch": 755} {"train_loss": -5.430933952331543, "global_step": 31730, "epoch": 755} {"train_loss": -5.550061225891113, "global_step": 31731, "epoch": 755} {"train_loss": -5.430497169494629, "global_step": 31732, "epoch": 755} {"train_loss": -5.5558857917785645, "global_step": 31733, "epoch": 755} {"train_loss": -5.504185676574707, "global_step": 31734, "epoch": 755} {"train_loss": -5.4640960693359375, "global_step": 31735, "epoch": 755} {"train_loss": -5.520256042480469, "global_step": 31736, "epoch": 755} {"train_loss": -5.617793083190918, "global_step": 31737, "epoch": 755} {"train_loss": -5.404662132263184, "global_step": 31738, "epoch": 755} {"train_loss": -5.5905609130859375, "global_step": 31739, "epoch": 755} {"train_loss": -5.589123249053955, "global_step": 31740, "epoch": 755} {"train_loss": -5.492435932159424, "global_step": 31741, "epoch": 755} {"train_loss": -5.632596969604492, "global_step": 31742, "epoch": 755} {"train_loss": -5.4436821937561035, "global_step": 31743, "epoch": 755} {"train_loss": -5.4956817626953125, "global_step": 31744, "epoch": 755} {"train_loss": -5.447863578796387, "global_step": 31745, "epoch": 755} {"train_loss": -5.5384416580200195, "global_step": 31746, "epoch": 755} {"train_loss": -5.6282196044921875, "global_step": 31747, "epoch": 755} {"train_loss": -5.429542541503906, "global_step": 31748, "epoch": 755} {"train_loss": -5.612123012542725, "global_step": 31749, "epoch": 755} {"train_loss": -5.489057540893555, "global_step": 31750, "epoch": 755} {"train_loss": -5.501852285294306, "global_step": 31751, "epoch": 755, "val_loss": 74371.796875} {"train_loss": -5.456396102905273, "global_step": 31752, "epoch": 756} {"train_loss": -5.517707824707031, "global_step": 31753, "epoch": 756} {"train_loss": -5.45716667175293, "global_step": 31754, "epoch": 756} {"train_loss": -5.539130210876465, "global_step": 31755, "epoch": 756} {"train_loss": -5.675161361694336, "global_step": 31756, "epoch": 756} {"train_loss": -5.477884769439697, "global_step": 31757, "epoch": 756} {"train_loss": -5.49346923828125, "global_step": 31758, "epoch": 756} {"train_loss": -5.456514835357666, "global_step": 31759, "epoch": 756} {"train_loss": -5.463727951049805, "global_step": 31760, "epoch": 756} {"train_loss": -5.476484298706055, "global_step": 31761, "epoch": 756} {"train_loss": -5.44285774230957, "global_step": 31762, "epoch": 756} {"train_loss": -5.502843856811523, "global_step": 31763, "epoch": 756} {"train_loss": -5.490194320678711, "global_step": 31764, "epoch": 756} {"train_loss": -5.592157363891602, "global_step": 31765, "epoch": 756} {"train_loss": -5.542590141296387, "global_step": 31766, "epoch": 756} {"train_loss": -5.556034564971924, "global_step": 31767, "epoch": 756} {"train_loss": -5.375778675079346, "global_step": 31768, "epoch": 756} {"train_loss": -5.384734630584717, "global_step": 31769, "epoch": 756} {"train_loss": -5.393809795379639, "global_step": 31770, "epoch": 756} {"train_loss": -5.535501480102539, "global_step": 31771, "epoch": 756} {"train_loss": -5.539188861846924, "global_step": 31772, "epoch": 756} {"train_loss": -5.5101213455200195, "global_step": 31773, "epoch": 756} {"train_loss": -5.424611568450928, "global_step": 31774, "epoch": 756} {"train_loss": -5.3511433601379395, "global_step": 31775, "epoch": 756} {"train_loss": -5.368487358093262, "global_step": 31776, "epoch": 756} {"train_loss": -5.516105651855469, "global_step": 31777, "epoch": 756} {"train_loss": -5.459020614624023, "global_step": 31778, "epoch": 756} {"train_loss": -5.414219379425049, "global_step": 31779, "epoch": 756} {"train_loss": -5.4604291915893555, "global_step": 31780, "epoch": 756} {"train_loss": -5.5345540046691895, "global_step": 31781, "epoch": 756} {"train_loss": -5.424610137939453, "global_step": 31782, "epoch": 756} {"train_loss": -5.431868553161621, "global_step": 31783, "epoch": 756} {"train_loss": -5.423404693603516, "global_step": 31784, "epoch": 756} {"train_loss": -5.366091728210449, "global_step": 31785, "epoch": 756} {"train_loss": -5.395520210266113, "global_step": 31786, "epoch": 756} {"train_loss": -5.4079790115356445, "global_step": 31787, "epoch": 756} {"train_loss": -5.443281173706055, "global_step": 31788, "epoch": 756} {"train_loss": -5.3679304122924805, "global_step": 31789, "epoch": 756} {"train_loss": -5.5204877853393555, "global_step": 31790, "epoch": 756} {"train_loss": -5.477353096008301, "global_step": 31791, "epoch": 756} {"train_loss": -5.409799575805664, "global_step": 31792, "epoch": 756} {"train_loss": -5.466636952899751, "global_step": 31793, "epoch": 756, "val_loss": 75366.8046875} {"train_loss": -5.382166385650635, "global_step": 31794, "epoch": 757} {"train_loss": -5.554591178894043, "global_step": 31795, "epoch": 757} {"train_loss": -5.588717937469482, "global_step": 31796, "epoch": 757} {"train_loss": -5.387945175170898, "global_step": 31797, "epoch": 757} {"train_loss": -5.337526321411133, "global_step": 31798, "epoch": 757} {"train_loss": -5.436788558959961, "global_step": 31799, "epoch": 757} {"train_loss": -5.494317054748535, "global_step": 31800, "epoch": 757} {"train_loss": -5.4685797691345215, "global_step": 31801, "epoch": 757} {"train_loss": -5.479730129241943, "global_step": 31802, "epoch": 757} {"train_loss": -5.362100124359131, "global_step": 31803, "epoch": 757} {"train_loss": -5.48663330078125, "global_step": 31804, "epoch": 757} {"train_loss": -5.617203712463379, "global_step": 31805, "epoch": 757} {"train_loss": -5.530028343200684, "global_step": 31806, "epoch": 757} {"train_loss": -5.499201774597168, "global_step": 31807, "epoch": 757} {"train_loss": -5.426188945770264, "global_step": 31808, "epoch": 757} {"train_loss": -5.634716033935547, "global_step": 31809, "epoch": 757} {"train_loss": -5.451130390167236, "global_step": 31810, "epoch": 757} {"train_loss": -5.505074501037598, "global_step": 31811, "epoch": 757} {"train_loss": -5.363014221191406, "global_step": 31812, "epoch": 757} {"train_loss": -5.571711540222168, "global_step": 31813, "epoch": 757} {"train_loss": -5.461887836456299, "global_step": 31814, "epoch": 757} {"train_loss": -5.484955787658691, "global_step": 31815, "epoch": 757} {"train_loss": -5.520564079284668, "global_step": 31816, "epoch": 757} {"train_loss": -5.362360000610352, "global_step": 31817, "epoch": 757} {"train_loss": -5.363059997558594, "global_step": 31818, "epoch": 757} {"train_loss": -5.51883602142334, "global_step": 31819, "epoch": 757} {"train_loss": -5.466314315795898, "global_step": 31820, "epoch": 757} {"train_loss": -5.433145046234131, "global_step": 31821, "epoch": 757} {"train_loss": -5.457183837890625, "global_step": 31822, "epoch": 757} {"train_loss": -5.366697311401367, "global_step": 31823, "epoch": 757} {"train_loss": -5.555421352386475, "global_step": 31824, "epoch": 757} {"train_loss": -5.521725654602051, "global_step": 31825, "epoch": 757} {"train_loss": -5.5201029777526855, "global_step": 31826, "epoch": 757} {"train_loss": -5.497759819030762, "global_step": 31827, "epoch": 757} {"train_loss": -5.390195369720459, "global_step": 31828, "epoch": 757} {"train_loss": -5.4362263679504395, "global_step": 31829, "epoch": 757} {"train_loss": -5.401291370391846, "global_step": 31830, "epoch": 757} {"train_loss": -5.3997578620910645, "global_step": 31831, "epoch": 757} {"train_loss": -5.563633918762207, "global_step": 31832, "epoch": 757} {"train_loss": -5.446260452270508, "global_step": 31833, "epoch": 757} {"train_loss": -5.442379951477051, "global_step": 31834, "epoch": 757} {"train_loss": -5.467791296186901, "global_step": 31835, "epoch": 757, "val_loss": 74025.3515625} {"train_loss": -5.42279577255249, "global_step": 31836, "epoch": 758} {"train_loss": -5.498824596405029, "global_step": 31837, "epoch": 758} {"train_loss": -5.4624152183532715, "global_step": 31838, "epoch": 758} {"train_loss": -5.457372665405273, "global_step": 31839, "epoch": 758} {"train_loss": -5.456676483154297, "global_step": 31840, "epoch": 758} {"train_loss": -5.480417728424072, "global_step": 31841, "epoch": 758} {"train_loss": -5.528554916381836, "global_step": 31842, "epoch": 758} {"train_loss": -5.518321990966797, "global_step": 31843, "epoch": 758} {"train_loss": -5.589447975158691, "global_step": 31844, "epoch": 758} {"train_loss": -5.501427173614502, "global_step": 31845, "epoch": 758} {"train_loss": -5.575508117675781, "global_step": 31846, "epoch": 758} {"train_loss": -5.437017440795898, "global_step": 31847, "epoch": 758} {"train_loss": -5.574185371398926, "global_step": 31848, "epoch": 758} {"train_loss": -5.422544479370117, "global_step": 31849, "epoch": 758} {"train_loss": -5.602851867675781, "global_step": 31850, "epoch": 758} {"train_loss": -5.5402936935424805, "global_step": 31851, "epoch": 758} {"train_loss": -5.528027534484863, "global_step": 31852, "epoch": 758} {"train_loss": -5.525100231170654, "global_step": 31853, "epoch": 758} {"train_loss": -5.647075653076172, "global_step": 31854, "epoch": 758} {"train_loss": -5.532261848449707, "global_step": 31855, "epoch": 758} {"train_loss": -5.514534950256348, "global_step": 31856, "epoch": 758} {"train_loss": -5.536428451538086, "global_step": 31857, "epoch": 758} {"train_loss": -5.545395851135254, "global_step": 31858, "epoch": 758} {"train_loss": -5.3352460861206055, "global_step": 31859, "epoch": 758} {"train_loss": -5.430632591247559, "global_step": 31860, "epoch": 758} {"train_loss": -5.505635738372803, "global_step": 31861, "epoch": 758} {"train_loss": -5.592176914215088, "global_step": 31862, "epoch": 758} {"train_loss": -5.499591827392578, "global_step": 31863, "epoch": 758} {"train_loss": -5.378262519836426, "global_step": 31864, "epoch": 758} {"train_loss": -5.481132984161377, "global_step": 31865, "epoch": 758} {"train_loss": -5.380626678466797, "global_step": 31866, "epoch": 758} {"train_loss": -5.3252058029174805, "global_step": 31867, "epoch": 758} {"train_loss": -5.5089592933654785, "global_step": 31868, "epoch": 758} {"train_loss": -5.378710746765137, "global_step": 31869, "epoch": 758} {"train_loss": -5.486359596252441, "global_step": 31870, "epoch": 758} {"train_loss": -5.4536943435668945, "global_step": 31871, "epoch": 758} {"train_loss": -5.360415458679199, "global_step": 31872, "epoch": 758} {"train_loss": -5.482295989990234, "global_step": 31873, "epoch": 758} {"train_loss": -5.654173851013184, "global_step": 31874, "epoch": 758} {"train_loss": -5.5226640701293945, "global_step": 31875, "epoch": 758} {"train_loss": -5.461513042449951, "global_step": 31876, "epoch": 758} {"train_loss": -5.488357646124704, "global_step": 31877, "epoch": 758, "val_loss": 74613.59375} {"train_loss": -5.439454078674316, "global_step": 31878, "epoch": 759} {"train_loss": -5.456350326538086, "global_step": 31879, "epoch": 759} {"train_loss": -5.581169605255127, "global_step": 31880, "epoch": 759} {"train_loss": -5.606621742248535, "global_step": 31881, "epoch": 759} {"train_loss": -5.525961875915527, "global_step": 31882, "epoch": 759} {"train_loss": -5.483219146728516, "global_step": 31883, "epoch": 759} {"train_loss": -5.436093330383301, "global_step": 31884, "epoch": 759} {"train_loss": -5.504206657409668, "global_step": 31885, "epoch": 759} {"train_loss": -5.501946926116943, "global_step": 31886, "epoch": 759} {"train_loss": -5.501557350158691, "global_step": 31887, "epoch": 759} {"train_loss": -5.463246822357178, "global_step": 31888, "epoch": 759} {"train_loss": -5.418309688568115, "global_step": 31889, "epoch": 759} {"train_loss": -5.533015251159668, "global_step": 31890, "epoch": 759} {"train_loss": -5.431401252746582, "global_step": 31891, "epoch": 759} {"train_loss": -5.466794013977051, "global_step": 31892, "epoch": 759} {"train_loss": -5.393072605133057, "global_step": 31893, "epoch": 759} {"train_loss": -5.527099132537842, "global_step": 31894, "epoch": 759} {"train_loss": -5.441683769226074, "global_step": 31895, "epoch": 759} {"train_loss": -5.522552013397217, "global_step": 31896, "epoch": 759} {"train_loss": -5.472052097320557, "global_step": 31897, "epoch": 759} {"train_loss": -5.502668380737305, "global_step": 31898, "epoch": 759} {"train_loss": -5.5066328048706055, "global_step": 31899, "epoch": 759} {"train_loss": -5.446906089782715, "global_step": 31900, "epoch": 759} {"train_loss": -5.464510440826416, "global_step": 31901, "epoch": 759} {"train_loss": -5.634799957275391, "global_step": 31902, "epoch": 759} {"train_loss": -5.496481895446777, "global_step": 31903, "epoch": 759} {"train_loss": -5.501374244689941, "global_step": 31904, "epoch": 759} {"train_loss": -5.523955345153809, "global_step": 31905, "epoch": 759} {"train_loss": -5.575299263000488, "global_step": 31906, "epoch": 759} {"train_loss": -5.452343940734863, "global_step": 31907, "epoch": 759} {"train_loss": -5.569026947021484, "global_step": 31908, "epoch": 759} {"train_loss": -5.57330322265625, "global_step": 31909, "epoch": 759} {"train_loss": -5.50611686706543, "global_step": 31910, "epoch": 759} {"train_loss": -5.459048271179199, "global_step": 31911, "epoch": 759} {"train_loss": -5.572617530822754, "global_step": 31912, "epoch": 759} {"train_loss": -5.610806465148926, "global_step": 31913, "epoch": 759} {"train_loss": -5.465557098388672, "global_step": 31914, "epoch": 759} {"train_loss": -5.444354057312012, "global_step": 31915, "epoch": 759} {"train_loss": -5.49355411529541, "global_step": 31916, "epoch": 759} {"train_loss": -5.408912658691406, "global_step": 31917, "epoch": 759} {"train_loss": -5.437182426452637, "global_step": 31918, "epoch": 759} {"train_loss": -5.497674442472912, "global_step": 31919, "epoch": 759, "val_loss": 74554.515625} {"train_loss": -5.583425045013428, "global_step": 31920, "epoch": 760} {"train_loss": -5.438251495361328, "global_step": 31921, "epoch": 760} {"train_loss": -5.630881309509277, "global_step": 31922, "epoch": 760} {"train_loss": -5.533682823181152, "global_step": 31923, "epoch": 760} {"train_loss": -5.463721752166748, "global_step": 31924, "epoch": 760} {"train_loss": -5.503777503967285, "global_step": 31925, "epoch": 760} {"train_loss": -5.478906631469727, "global_step": 31926, "epoch": 760} {"train_loss": -5.4333696365356445, "global_step": 31927, "epoch": 760} {"train_loss": -5.451706886291504, "global_step": 31928, "epoch": 760} {"train_loss": -5.552611351013184, "global_step": 31929, "epoch": 760} {"train_loss": -5.477108955383301, "global_step": 31930, "epoch": 760} {"train_loss": -5.532674789428711, "global_step": 31931, "epoch": 760} {"train_loss": -5.523773193359375, "global_step": 31932, "epoch": 760} {"train_loss": -5.55043363571167, "global_step": 31933, "epoch": 760} {"train_loss": -5.62974739074707, "global_step": 31934, "epoch": 760} {"train_loss": -5.462466239929199, "global_step": 31935, "epoch": 760} {"train_loss": -5.4223456382751465, "global_step": 31936, "epoch": 760} {"train_loss": -5.57969856262207, "global_step": 31937, "epoch": 760} {"train_loss": -5.613514423370361, "global_step": 31938, "epoch": 760} {"train_loss": -5.380828857421875, "global_step": 31939, "epoch": 760} {"train_loss": -5.57960319519043, "global_step": 31940, "epoch": 760} {"train_loss": -5.48267936706543, "global_step": 31941, "epoch": 760} {"train_loss": -5.601696968078613, "global_step": 31942, "epoch": 760} {"train_loss": -5.666225433349609, "global_step": 31943, "epoch": 760} {"train_loss": -5.53813362121582, "global_step": 31944, "epoch": 760} {"train_loss": -5.651334285736084, "global_step": 31945, "epoch": 760} {"train_loss": -5.516853332519531, "global_step": 31946, "epoch": 760} {"train_loss": -5.559478759765625, "global_step": 31947, "epoch": 760} {"train_loss": -5.531095504760742, "global_step": 31948, "epoch": 760} {"train_loss": -5.46921968460083, "global_step": 31949, "epoch": 760} {"train_loss": -5.4072723388671875, "global_step": 31950, "epoch": 760} {"train_loss": -5.512557029724121, "global_step": 31951, "epoch": 760} {"train_loss": -5.554863452911377, "global_step": 31952, "epoch": 760} {"train_loss": -5.440816879272461, "global_step": 31953, "epoch": 760} {"train_loss": -5.476837635040283, "global_step": 31954, "epoch": 760} {"train_loss": -5.521526336669922, "global_step": 31955, "epoch": 760} {"train_loss": -5.516426086425781, "global_step": 31956, "epoch": 760} {"train_loss": -5.464571952819824, "global_step": 31957, "epoch": 760} {"train_loss": -5.504756927490234, "global_step": 31958, "epoch": 760} {"train_loss": -5.411888122558594, "global_step": 31959, "epoch": 760} {"train_loss": -5.438481330871582, "global_step": 31960, "epoch": 760} {"train_loss": -5.516091880344209, "global_step": 31961, "epoch": 760, "val_loss": 74087.96875} {"train_loss": -5.479608535766602, "global_step": 31962, "epoch": 761} {"train_loss": -5.50411319732666, "global_step": 31963, "epoch": 761} {"train_loss": -5.474889755249023, "global_step": 31964, "epoch": 761} {"train_loss": -5.58420991897583, "global_step": 31965, "epoch": 761} {"train_loss": -5.511932849884033, "global_step": 31966, "epoch": 761} {"train_loss": -5.599245071411133, "global_step": 31967, "epoch": 761} {"train_loss": -5.541069030761719, "global_step": 31968, "epoch": 761} {"train_loss": -5.482673645019531, "global_step": 31969, "epoch": 761} {"train_loss": -5.5723185539245605, "global_step": 31970, "epoch": 761} {"train_loss": -5.600087642669678, "global_step": 31971, "epoch": 761} {"train_loss": -5.55666446685791, "global_step": 31972, "epoch": 761} {"train_loss": -5.6673383712768555, "global_step": 31973, "epoch": 761} {"train_loss": -5.449484825134277, "global_step": 31974, "epoch": 761} {"train_loss": -5.474514484405518, "global_step": 31975, "epoch": 761} {"train_loss": -5.559349536895752, "global_step": 31976, "epoch": 761} {"train_loss": -5.479496955871582, "global_step": 31977, "epoch": 761} {"train_loss": -5.491344928741455, "global_step": 31978, "epoch": 761} {"train_loss": -5.508697509765625, "global_step": 31979, "epoch": 761} {"train_loss": -5.6233978271484375, "global_step": 31980, "epoch": 761} {"train_loss": -5.496034145355225, "global_step": 31981, "epoch": 761} {"train_loss": -5.446801662445068, "global_step": 31982, "epoch": 761} {"train_loss": -5.576574802398682, "global_step": 31983, "epoch": 761} {"train_loss": -5.6153364181518555, "global_step": 31984, "epoch": 761} {"train_loss": -5.4482879638671875, "global_step": 31985, "epoch": 761} {"train_loss": -5.432875633239746, "global_step": 31986, "epoch": 761} {"train_loss": -5.369925498962402, "global_step": 31987, "epoch": 761} {"train_loss": -5.578936576843262, "global_step": 31988, "epoch": 761} {"train_loss": -5.415842056274414, "global_step": 31989, "epoch": 761} {"train_loss": -5.571528434753418, "global_step": 31990, "epoch": 761} {"train_loss": -5.49350643157959, "global_step": 31991, "epoch": 761} {"train_loss": -5.526149749755859, "global_step": 31992, "epoch": 761} {"train_loss": -5.290931701660156, "global_step": 31993, "epoch": 761} {"train_loss": -5.479728698730469, "global_step": 31994, "epoch": 761} {"train_loss": -5.4650092124938965, "global_step": 31995, "epoch": 761} {"train_loss": -5.6100616455078125, "global_step": 31996, "epoch": 761} {"train_loss": -5.447166442871094, "global_step": 31997, "epoch": 761} {"train_loss": -5.578854084014893, "global_step": 31998, "epoch": 761} {"train_loss": -5.4265217781066895, "global_step": 31999, "epoch": 761} {"train_loss": -5.637948036193848, "global_step": 32000, "epoch": 761} {"train_loss": -5.534809112548828, "global_step": 32001, "epoch": 761} {"train_loss": -5.564404487609863, "global_step": 32002, "epoch": 761} {"train_loss": -5.516726368949527, "global_step": 32003, "epoch": 761, "val_loss": 74866.6484375} {"train_loss": -5.422398090362549, "global_step": 32004, "epoch": 762} {"train_loss": -5.575119972229004, "global_step": 32005, "epoch": 762} {"train_loss": -5.595378875732422, "global_step": 32006, "epoch": 762} {"train_loss": -5.540440559387207, "global_step": 32007, "epoch": 762} {"train_loss": -5.534424781799316, "global_step": 32008, "epoch": 762} {"train_loss": -5.473911285400391, "global_step": 32009, "epoch": 762} {"train_loss": -5.539492607116699, "global_step": 32010, "epoch": 762} {"train_loss": -5.560887336730957, "global_step": 32011, "epoch": 762} {"train_loss": -5.352033615112305, "global_step": 32012, "epoch": 762} {"train_loss": -5.6388349533081055, "global_step": 32013, "epoch": 762} {"train_loss": -5.472777366638184, "global_step": 32014, "epoch": 762} {"train_loss": -5.565272331237793, "global_step": 32015, "epoch": 762} {"train_loss": -5.471741676330566, "global_step": 32016, "epoch": 762} {"train_loss": -5.347689628601074, "global_step": 32017, "epoch": 762} {"train_loss": -5.557535171508789, "global_step": 32018, "epoch": 762} {"train_loss": -5.619420051574707, "global_step": 32019, "epoch": 762} {"train_loss": -5.631740570068359, "global_step": 32020, "epoch": 762} {"train_loss": -5.545397758483887, "global_step": 32021, "epoch": 762} {"train_loss": -5.2975335121154785, "global_step": 32022, "epoch": 762} {"train_loss": -5.532001972198486, "global_step": 32023, "epoch": 762} {"train_loss": -5.495059967041016, "global_step": 32024, "epoch": 762} {"train_loss": -5.5905842781066895, "global_step": 32025, "epoch": 762} {"train_loss": -5.56702995300293, "global_step": 32026, "epoch": 762} {"train_loss": -5.413107872009277, "global_step": 32027, "epoch": 762} {"train_loss": -5.463954925537109, "global_step": 32028, "epoch": 762} {"train_loss": -5.48451042175293, "global_step": 32029, "epoch": 762} {"train_loss": -5.4199371337890625, "global_step": 32030, "epoch": 762} {"train_loss": -5.434885025024414, "global_step": 32031, "epoch": 762} {"train_loss": -5.486004829406738, "global_step": 32032, "epoch": 762} {"train_loss": -5.540688514709473, "global_step": 32033, "epoch": 762} {"train_loss": -5.558558940887451, "global_step": 32034, "epoch": 762} {"train_loss": -5.420313835144043, "global_step": 32035, "epoch": 762} {"train_loss": -5.447151184082031, "global_step": 32036, "epoch": 762} {"train_loss": -5.518439292907715, "global_step": 32037, "epoch": 762} {"train_loss": -5.482419490814209, "global_step": 32038, "epoch": 762} {"train_loss": -5.557843208312988, "global_step": 32039, "epoch": 762} {"train_loss": -5.5296711921691895, "global_step": 32040, "epoch": 762} {"train_loss": -5.389482498168945, "global_step": 32041, "epoch": 762} {"train_loss": -5.537091255187988, "global_step": 32042, "epoch": 762} {"train_loss": -5.441880226135254, "global_step": 32043, "epoch": 762} {"train_loss": -5.496463775634766, "global_step": 32044, "epoch": 762} {"train_loss": -5.503263076146443, "global_step": 32045, "epoch": 762, "val_loss": 75508.5546875} {"train_loss": -5.337891101837158, "global_step": 32046, "epoch": 763} {"train_loss": -5.487178325653076, "global_step": 32047, "epoch": 763} {"train_loss": -5.556476593017578, "global_step": 32048, "epoch": 763} {"train_loss": -5.486813545227051, "global_step": 32049, "epoch": 763} {"train_loss": -5.342135429382324, "global_step": 32050, "epoch": 763} {"train_loss": -5.560153961181641, "global_step": 32051, "epoch": 763} {"train_loss": -5.527369976043701, "global_step": 32052, "epoch": 763} {"train_loss": -5.567858695983887, "global_step": 32053, "epoch": 763} {"train_loss": -5.384579658508301, "global_step": 32054, "epoch": 763} {"train_loss": -5.394641876220703, "global_step": 32055, "epoch": 763} {"train_loss": -5.337031364440918, "global_step": 32056, "epoch": 763} {"train_loss": -5.53824520111084, "global_step": 32057, "epoch": 763} {"train_loss": -5.464616775512695, "global_step": 32058, "epoch": 763} {"train_loss": -5.469475746154785, "global_step": 32059, "epoch": 763} {"train_loss": -5.581354141235352, "global_step": 32060, "epoch": 763} {"train_loss": -5.573942184448242, "global_step": 32061, "epoch": 763} {"train_loss": -5.46563196182251, "global_step": 32062, "epoch": 763} {"train_loss": -5.573944091796875, "global_step": 32063, "epoch": 763} {"train_loss": -5.423513412475586, "global_step": 32064, "epoch": 763} {"train_loss": -5.514368057250977, "global_step": 32065, "epoch": 763} {"train_loss": -5.530031681060791, "global_step": 32066, "epoch": 763} {"train_loss": -5.47908353805542, "global_step": 32067, "epoch": 763} {"train_loss": -5.5677103996276855, "global_step": 32068, "epoch": 763} {"train_loss": -5.542564868927002, "global_step": 32069, "epoch": 763} {"train_loss": -5.497408390045166, "global_step": 32070, "epoch": 763} {"train_loss": -5.4868903160095215, "global_step": 32071, "epoch": 763} {"train_loss": -5.480866432189941, "global_step": 32072, "epoch": 763} {"train_loss": -5.60564661026001, "global_step": 32073, "epoch": 763} {"train_loss": -5.5178656578063965, "global_step": 32074, "epoch": 763} {"train_loss": -5.352196216583252, "global_step": 32075, "epoch": 763} {"train_loss": -5.455641746520996, "global_step": 32076, "epoch": 763} {"train_loss": -5.417171478271484, "global_step": 32077, "epoch": 763} {"train_loss": -5.532273292541504, "global_step": 32078, "epoch": 763} {"train_loss": -5.649545192718506, "global_step": 32079, "epoch": 763} {"train_loss": -5.548917293548584, "global_step": 32080, "epoch": 763} {"train_loss": -5.470333576202393, "global_step": 32081, "epoch": 763} {"train_loss": -5.500657081604004, "global_step": 32082, "epoch": 763} {"train_loss": -5.4316816329956055, "global_step": 32083, "epoch": 763} {"train_loss": -5.550241470336914, "global_step": 32084, "epoch": 763} {"train_loss": -5.6351447105407715, "global_step": 32085, "epoch": 763} {"train_loss": -5.536151885986328, "global_step": 32086, "epoch": 763} {"train_loss": -5.496097791762579, "global_step": 32087, "epoch": 763, "val_loss": 74386.6953125} {"train_loss": -5.368557453155518, "global_step": 32088, "epoch": 764} {"train_loss": -5.5207953453063965, "global_step": 32089, "epoch": 764} {"train_loss": -5.533111095428467, "global_step": 32090, "epoch": 764} {"train_loss": -5.4817328453063965, "global_step": 32091, "epoch": 764} {"train_loss": -5.596221446990967, "global_step": 32092, "epoch": 764} {"train_loss": -5.391010284423828, "global_step": 32093, "epoch": 764} {"train_loss": -5.4861273765563965, "global_step": 32094, "epoch": 764} {"train_loss": -5.446195602416992, "global_step": 32095, "epoch": 764} {"train_loss": -5.444358825683594, "global_step": 32096, "epoch": 764} {"train_loss": -5.531656742095947, "global_step": 32097, "epoch": 764} {"train_loss": -5.634477615356445, "global_step": 32098, "epoch": 764} {"train_loss": -5.509243965148926, "global_step": 32099, "epoch": 764} {"train_loss": -5.470665454864502, "global_step": 32100, "epoch": 764} {"train_loss": -5.502394676208496, "global_step": 32101, "epoch": 764} {"train_loss": -5.520512104034424, "global_step": 32102, "epoch": 764} {"train_loss": -5.444371223449707, "global_step": 32103, "epoch": 764} {"train_loss": -5.510623931884766, "global_step": 32104, "epoch": 764} {"train_loss": -5.514863967895508, "global_step": 32105, "epoch": 764} {"train_loss": -5.39462947845459, "global_step": 32106, "epoch": 764} {"train_loss": -5.629116535186768, "global_step": 32107, "epoch": 764} {"train_loss": -5.468583106994629, "global_step": 32108, "epoch": 764} {"train_loss": -5.470844268798828, "global_step": 32109, "epoch": 764} {"train_loss": -5.429973125457764, "global_step": 32110, "epoch": 764} {"train_loss": -5.529505252838135, "global_step": 32111, "epoch": 764} {"train_loss": -5.522378921508789, "global_step": 32112, "epoch": 764} {"train_loss": -5.546416282653809, "global_step": 32113, "epoch": 764} {"train_loss": -5.580371856689453, "global_step": 32114, "epoch": 764} {"train_loss": -5.6453142166137695, "global_step": 32115, "epoch": 764} {"train_loss": -5.49233341217041, "global_step": 32116, "epoch": 764} {"train_loss": -5.422430992126465, "global_step": 32117, "epoch": 764} {"train_loss": -5.603252410888672, "global_step": 32118, "epoch": 764} {"train_loss": -5.436616897583008, "global_step": 32119, "epoch": 764} {"train_loss": -5.558531284332275, "global_step": 32120, "epoch": 764} {"train_loss": -5.59466552734375, "global_step": 32121, "epoch": 764} {"train_loss": -5.5583086013793945, "global_step": 32122, "epoch": 764} {"train_loss": -5.457712650299072, "global_step": 32123, "epoch": 764} {"train_loss": -5.421731948852539, "global_step": 32124, "epoch": 764} {"train_loss": -5.482630252838135, "global_step": 32125, "epoch": 764} {"train_loss": -5.412684440612793, "global_step": 32126, "epoch": 764} {"train_loss": -5.480203151702881, "global_step": 32127, "epoch": 764} {"train_loss": -5.594273567199707, "global_step": 32128, "epoch": 764} {"train_loss": -5.5030079909733365, "global_step": 32129, "epoch": 764, "val_loss": 75164.8046875} {"train_loss": -5.463393211364746, "global_step": 32130, "epoch": 765} {"train_loss": -5.4520673751831055, "global_step": 32131, "epoch": 765} {"train_loss": -5.503676414489746, "global_step": 32132, "epoch": 765} {"train_loss": -5.396571159362793, "global_step": 32133, "epoch": 765} {"train_loss": -5.58319091796875, "global_step": 32134, "epoch": 765} {"train_loss": -5.464705467224121, "global_step": 32135, "epoch": 765} {"train_loss": -5.560891151428223, "global_step": 32136, "epoch": 765} {"train_loss": -5.593143463134766, "global_step": 32137, "epoch": 765} {"train_loss": -5.524251461029053, "global_step": 32138, "epoch": 765} {"train_loss": -5.528529167175293, "global_step": 32139, "epoch": 765} {"train_loss": -5.47707986831665, "global_step": 32140, "epoch": 765} {"train_loss": -5.403923511505127, "global_step": 32141, "epoch": 765} {"train_loss": -5.52878475189209, "global_step": 32142, "epoch": 765} {"train_loss": -5.475423812866211, "global_step": 32143, "epoch": 765} {"train_loss": -5.529321670532227, "global_step": 32144, "epoch": 765} {"train_loss": -5.380082607269287, "global_step": 32145, "epoch": 765} {"train_loss": -5.347103595733643, "global_step": 32146, "epoch": 765} {"train_loss": -5.566790580749512, "global_step": 32147, "epoch": 765} {"train_loss": -5.476828575134277, "global_step": 32148, "epoch": 765} {"train_loss": -5.557211875915527, "global_step": 32149, "epoch": 765} {"train_loss": -5.584043502807617, "global_step": 32150, "epoch": 765} {"train_loss": -5.387073040008545, "global_step": 32151, "epoch": 765} {"train_loss": -5.556154251098633, "global_step": 32152, "epoch": 765} {"train_loss": -5.565266132354736, "global_step": 32153, "epoch": 765} {"train_loss": -5.465173721313477, "global_step": 32154, "epoch": 765} {"train_loss": -5.460470199584961, "global_step": 32155, "epoch": 765} {"train_loss": -5.60894775390625, "global_step": 32156, "epoch": 765} {"train_loss": -5.578952312469482, "global_step": 32157, "epoch": 765} {"train_loss": -5.537260055541992, "global_step": 32158, "epoch": 765} {"train_loss": -5.577719211578369, "global_step": 32159, "epoch": 765} {"train_loss": -5.604954719543457, "global_step": 32160, "epoch": 765} {"train_loss": -5.511203289031982, "global_step": 32161, "epoch": 765} {"train_loss": -5.572537422180176, "global_step": 32162, "epoch": 765} {"train_loss": -5.619128704071045, "global_step": 32163, "epoch": 765} {"train_loss": -5.604166030883789, "global_step": 32164, "epoch": 765} {"train_loss": -5.606171607971191, "global_step": 32165, "epoch": 765} {"train_loss": -5.502573013305664, "global_step": 32166, "epoch": 765} {"train_loss": -5.564600944519043, "global_step": 32167, "epoch": 765} {"train_loss": -5.5061163902282715, "global_step": 32168, "epoch": 765} {"train_loss": -5.512426853179932, "global_step": 32169, "epoch": 765} {"train_loss": -5.458162307739258, "global_step": 32170, "epoch": 765} {"train_loss": -5.513868842806135, "global_step": 32171, "epoch": 765, "val_loss": 73961.6484375} {"train_loss": -5.5041656494140625, "global_step": 32172, "epoch": 766} {"train_loss": -5.524653434753418, "global_step": 32173, "epoch": 766} {"train_loss": -5.515740394592285, "global_step": 32174, "epoch": 766} {"train_loss": -5.497004508972168, "global_step": 32175, "epoch": 766} {"train_loss": -5.5523271560668945, "global_step": 32176, "epoch": 766} {"train_loss": -5.531704425811768, "global_step": 32177, "epoch": 766} {"train_loss": -5.589526176452637, "global_step": 32178, "epoch": 766} {"train_loss": -5.626233100891113, "global_step": 32179, "epoch": 766} {"train_loss": -5.51011323928833, "global_step": 32180, "epoch": 766} {"train_loss": -5.4869160652160645, "global_step": 32181, "epoch": 766} {"train_loss": -5.47284460067749, "global_step": 32182, "epoch": 766} {"train_loss": -5.530587673187256, "global_step": 32183, "epoch": 766} {"train_loss": -5.491786479949951, "global_step": 32184, "epoch": 766} {"train_loss": -5.576521873474121, "global_step": 32185, "epoch": 766} {"train_loss": -5.406196117401123, "global_step": 32186, "epoch": 766} {"train_loss": -5.480587959289551, "global_step": 32187, "epoch": 766} {"train_loss": -5.706969738006592, "global_step": 32188, "epoch": 766} {"train_loss": -5.559107780456543, "global_step": 32189, "epoch": 766} {"train_loss": -5.528999328613281, "global_step": 32190, "epoch": 766} {"train_loss": -5.5122480392456055, "global_step": 32191, "epoch": 766} {"train_loss": -5.371766567230225, "global_step": 32192, "epoch": 766} {"train_loss": -5.57260274887085, "global_step": 32193, "epoch": 766} {"train_loss": -5.526907444000244, "global_step": 32194, "epoch": 766} {"train_loss": -5.509446144104004, "global_step": 32195, "epoch": 766} {"train_loss": -5.490100860595703, "global_step": 32196, "epoch": 766} {"train_loss": -5.48092794418335, "global_step": 32197, "epoch": 766} {"train_loss": -5.342569828033447, "global_step": 32198, "epoch": 766} {"train_loss": -5.496143817901611, "global_step": 32199, "epoch": 766} {"train_loss": -5.398673057556152, "global_step": 32200, "epoch": 766} {"train_loss": -5.3398590087890625, "global_step": 32201, "epoch": 766} {"train_loss": -5.588503837585449, "global_step": 32202, "epoch": 766} {"train_loss": -5.377561569213867, "global_step": 32203, "epoch": 766} {"train_loss": -5.414443016052246, "global_step": 32204, "epoch": 766} {"train_loss": -5.5830583572387695, "global_step": 32205, "epoch": 766} {"train_loss": -5.506320476531982, "global_step": 32206, "epoch": 766} {"train_loss": -5.509442329406738, "global_step": 32207, "epoch": 766} {"train_loss": -5.405691146850586, "global_step": 32208, "epoch": 766} {"train_loss": -5.443215370178223, "global_step": 32209, "epoch": 766} {"train_loss": -5.413130760192871, "global_step": 32210, "epoch": 766} {"train_loss": -5.532005310058594, "global_step": 32211, "epoch": 766} {"train_loss": -5.342874050140381, "global_step": 32212, "epoch": 766} {"train_loss": -5.495105879647391, "global_step": 32213, "epoch": 766, "val_loss": 75431.5390625} {"train_loss": -5.390594482421875, "global_step": 32214, "epoch": 767} {"train_loss": -5.58441162109375, "global_step": 32215, "epoch": 767} {"train_loss": -5.540939807891846, "global_step": 32216, "epoch": 767} {"train_loss": -5.387792587280273, "global_step": 32217, "epoch": 767} {"train_loss": -5.475404262542725, "global_step": 32218, "epoch": 767} {"train_loss": -5.456974983215332, "global_step": 32219, "epoch": 767} {"train_loss": -5.60322904586792, "global_step": 32220, "epoch": 767} {"train_loss": -5.485154151916504, "global_step": 32221, "epoch": 767} {"train_loss": -5.600348472595215, "global_step": 32222, "epoch": 767} {"train_loss": -5.467160224914551, "global_step": 32223, "epoch": 767} {"train_loss": -5.539867401123047, "global_step": 32224, "epoch": 767} {"train_loss": -5.58553409576416, "global_step": 32225, "epoch": 767} {"train_loss": -5.430485725402832, "global_step": 32226, "epoch": 767} {"train_loss": -5.500637054443359, "global_step": 32227, "epoch": 767} {"train_loss": -5.604824066162109, "global_step": 32228, "epoch": 767} {"train_loss": -5.563763618469238, "global_step": 32229, "epoch": 767} {"train_loss": -5.428492546081543, "global_step": 32230, "epoch": 767} {"train_loss": -5.553584098815918, "global_step": 32231, "epoch": 767} {"train_loss": -5.277387619018555, "global_step": 32232, "epoch": 767} {"train_loss": -5.309167861938477, "global_step": 32233, "epoch": 767} {"train_loss": -5.476090431213379, "global_step": 32234, "epoch": 767} {"train_loss": -5.385385513305664, "global_step": 32235, "epoch": 767} {"train_loss": -5.264132976531982, "global_step": 32236, "epoch": 767} {"train_loss": -5.347235202789307, "global_step": 32237, "epoch": 767} {"train_loss": -5.308145523071289, "global_step": 32238, "epoch": 767} {"train_loss": -5.320062637329102, "global_step": 32239, "epoch": 767} {"train_loss": -5.391846656799316, "global_step": 32240, "epoch": 767} {"train_loss": -5.538730621337891, "global_step": 32241, "epoch": 767} {"train_loss": -5.365837574005127, "global_step": 32242, "epoch": 767} {"train_loss": -5.470026016235352, "global_step": 32243, "epoch": 767} {"train_loss": -5.481722354888916, "global_step": 32244, "epoch": 767} {"train_loss": -5.487969398498535, "global_step": 32245, "epoch": 767} {"train_loss": -5.406613349914551, "global_step": 32246, "epoch": 767} {"train_loss": -5.366500377655029, "global_step": 32247, "epoch": 767} {"train_loss": -5.32080078125, "global_step": 32248, "epoch": 767} {"train_loss": -5.574570178985596, "global_step": 32249, "epoch": 767} {"train_loss": -5.495153903961182, "global_step": 32250, "epoch": 767} {"train_loss": -5.560636520385742, "global_step": 32251, "epoch": 767} {"train_loss": -5.476904392242432, "global_step": 32252, "epoch": 767} {"train_loss": -5.444092273712158, "global_step": 32253, "epoch": 767} {"train_loss": -5.567814826965332, "global_step": 32254, "epoch": 767} {"train_loss": -5.459853229068575, "global_step": 32255, "epoch": 767, "val_loss": 75066.25} {"train_loss": -5.421651363372803, "global_step": 32256, "epoch": 768} {"train_loss": -5.46821403503418, "global_step": 32257, "epoch": 768} {"train_loss": -5.575927734375, "global_step": 32258, "epoch": 768} {"train_loss": -5.4493513107299805, "global_step": 32259, "epoch": 768} {"train_loss": -5.515496730804443, "global_step": 32260, "epoch": 768} {"train_loss": -5.489180564880371, "global_step": 32261, "epoch": 768} {"train_loss": -5.468382358551025, "global_step": 32262, "epoch": 768} {"train_loss": -5.435263633728027, "global_step": 32263, "epoch": 768} {"train_loss": -5.574115753173828, "global_step": 32264, "epoch": 768} {"train_loss": -5.5077056884765625, "global_step": 32265, "epoch": 768} {"train_loss": -5.428256511688232, "global_step": 32266, "epoch": 768} {"train_loss": -5.4536285400390625, "global_step": 32267, "epoch": 768} {"train_loss": -5.630951881408691, "global_step": 32268, "epoch": 768} {"train_loss": -5.613574981689453, "global_step": 32269, "epoch": 768} {"train_loss": -5.365225791931152, "global_step": 32270, "epoch": 768} {"train_loss": -5.487969398498535, "global_step": 32271, "epoch": 768} {"train_loss": -5.512599945068359, "global_step": 32272, "epoch": 768} {"train_loss": -5.349676132202148, "global_step": 32273, "epoch": 768} {"train_loss": -5.540186405181885, "global_step": 32274, "epoch": 768} {"train_loss": -5.591797828674316, "global_step": 32275, "epoch": 768} {"train_loss": -5.551816463470459, "global_step": 32276, "epoch": 768} {"train_loss": -5.506492614746094, "global_step": 32277, "epoch": 768} {"train_loss": -5.605599880218506, "global_step": 32278, "epoch": 768} {"train_loss": -5.5106306076049805, "global_step": 32279, "epoch": 768} {"train_loss": -5.590447902679443, "global_step": 32280, "epoch": 768} {"train_loss": -5.774840831756592, "global_step": 32281, "epoch": 768} {"train_loss": -5.465119361877441, "global_step": 32282, "epoch": 768} {"train_loss": -5.58941125869751, "global_step": 32283, "epoch": 768} {"train_loss": -5.569530487060547, "global_step": 32284, "epoch": 768} {"train_loss": -5.559661865234375, "global_step": 32285, "epoch": 768} {"train_loss": -5.433639049530029, "global_step": 32286, "epoch": 768} {"train_loss": -5.492169380187988, "global_step": 32287, "epoch": 768} {"train_loss": -5.593740940093994, "global_step": 32288, "epoch": 768} {"train_loss": -5.378994941711426, "global_step": 32289, "epoch": 768} {"train_loss": -5.41455602645874, "global_step": 32290, "epoch": 768} {"train_loss": -5.507732391357422, "global_step": 32291, "epoch": 768} {"train_loss": -5.357913970947266, "global_step": 32292, "epoch": 768} {"train_loss": -5.483515739440918, "global_step": 32293, "epoch": 768} {"train_loss": -5.559515953063965, "global_step": 32294, "epoch": 768} {"train_loss": -5.506850719451904, "global_step": 32295, "epoch": 768} {"train_loss": -5.55963134765625, "global_step": 32296, "epoch": 768} {"train_loss": -5.509058452787853, "global_step": 32297, "epoch": 768, "val_loss": 74803.53125} {"train_loss": -5.511678695678711, "global_step": 32298, "epoch": 769} {"train_loss": -5.502959728240967, "global_step": 32299, "epoch": 769} {"train_loss": -5.499449729919434, "global_step": 32300, "epoch": 769} {"train_loss": -5.4274396896362305, "global_step": 32301, "epoch": 769} {"train_loss": -5.634228706359863, "global_step": 32302, "epoch": 769} {"train_loss": -5.515942573547363, "global_step": 32303, "epoch": 769} {"train_loss": -5.407962799072266, "global_step": 32304, "epoch": 769} {"train_loss": -5.610917568206787, "global_step": 32305, "epoch": 769} {"train_loss": -5.442442893981934, "global_step": 32306, "epoch": 769} {"train_loss": -5.525559425354004, "global_step": 32307, "epoch": 769} {"train_loss": -5.552524566650391, "global_step": 32308, "epoch": 769} {"train_loss": -5.414842128753662, "global_step": 32309, "epoch": 769} {"train_loss": -5.529303550720215, "global_step": 32310, "epoch": 769} {"train_loss": -5.486717700958252, "global_step": 32311, "epoch": 769} {"train_loss": -5.650388717651367, "global_step": 32312, "epoch": 769} {"train_loss": -5.476372718811035, "global_step": 32313, "epoch": 769} {"train_loss": -5.52649450302124, "global_step": 32314, "epoch": 769} {"train_loss": -5.650603294372559, "global_step": 32315, "epoch": 769} {"train_loss": -5.427730560302734, "global_step": 32316, "epoch": 769} {"train_loss": -5.566152572631836, "global_step": 32317, "epoch": 769} {"train_loss": -5.605180740356445, "global_step": 32318, "epoch": 769} {"train_loss": -5.499311447143555, "global_step": 32319, "epoch": 769} {"train_loss": -5.424426555633545, "global_step": 32320, "epoch": 769} {"train_loss": -5.43308162689209, "global_step": 32321, "epoch": 769} {"train_loss": -5.527646064758301, "global_step": 32322, "epoch": 769} {"train_loss": -5.383823394775391, "global_step": 32323, "epoch": 769} {"train_loss": -5.470644950866699, "global_step": 32324, "epoch": 769} {"train_loss": -5.437402725219727, "global_step": 32325, "epoch": 769} {"train_loss": -5.3990373611450195, "global_step": 32326, "epoch": 769} {"train_loss": -5.5306501388549805, "global_step": 32327, "epoch": 769} {"train_loss": -5.442601203918457, "global_step": 32328, "epoch": 769} {"train_loss": -5.447550296783447, "global_step": 32329, "epoch": 769} {"train_loss": -5.5903401374816895, "global_step": 32330, "epoch": 769} {"train_loss": -5.394993782043457, "global_step": 32331, "epoch": 769} {"train_loss": -5.445094108581543, "global_step": 32332, "epoch": 769} {"train_loss": -5.456799507141113, "global_step": 32333, "epoch": 769} {"train_loss": -5.642469882965088, "global_step": 32334, "epoch": 769} {"train_loss": -5.365605354309082, "global_step": 32335, "epoch": 769} {"train_loss": -5.487488269805908, "global_step": 32336, "epoch": 769} {"train_loss": -5.426969528198242, "global_step": 32337, "epoch": 769} {"train_loss": -5.5758795738220215, "global_step": 32338, "epoch": 769} {"train_loss": -5.494836988903227, "global_step": 32339, "epoch": 769, "val_loss": 74614.9375} {"train_loss": -5.4658002853393555, "global_step": 32340, "epoch": 770} {"train_loss": -5.511282920837402, "global_step": 32341, "epoch": 770} {"train_loss": -5.412737846374512, "global_step": 32342, "epoch": 770} {"train_loss": -5.448005676269531, "global_step": 32343, "epoch": 770} {"train_loss": -5.497430801391602, "global_step": 32344, "epoch": 770} {"train_loss": -5.608249664306641, "global_step": 32345, "epoch": 770} {"train_loss": -5.301854133605957, "global_step": 32346, "epoch": 770} {"train_loss": -5.592837333679199, "global_step": 32347, "epoch": 770} {"train_loss": -5.504001617431641, "global_step": 32348, "epoch": 770} {"train_loss": -5.5520219802856445, "global_step": 32349, "epoch": 770} {"train_loss": -5.598405838012695, "global_step": 32350, "epoch": 770} {"train_loss": -5.587192058563232, "global_step": 32351, "epoch": 770} {"train_loss": -5.62459659576416, "global_step": 32352, "epoch": 770} {"train_loss": -5.593284606933594, "global_step": 32353, "epoch": 770} {"train_loss": -5.525655746459961, "global_step": 32354, "epoch": 770} {"train_loss": -5.532014846801758, "global_step": 32355, "epoch": 770} {"train_loss": -5.360618591308594, "global_step": 32356, "epoch": 770} {"train_loss": -5.483818054199219, "global_step": 32357, "epoch": 770} {"train_loss": -5.542733192443848, "global_step": 32358, "epoch": 770} {"train_loss": -5.508118152618408, "global_step": 32359, "epoch": 770} {"train_loss": -5.584029674530029, "global_step": 32360, "epoch": 770} {"train_loss": -5.525604248046875, "global_step": 32361, "epoch": 770} {"train_loss": -5.488863945007324, "global_step": 32362, "epoch": 770} {"train_loss": -5.43181848526001, "global_step": 32363, "epoch": 770} {"train_loss": -5.495582103729248, "global_step": 32364, "epoch": 770} {"train_loss": -5.543931007385254, "global_step": 32365, "epoch": 770} {"train_loss": -5.420747756958008, "global_step": 32366, "epoch": 770} {"train_loss": -5.4687886238098145, "global_step": 32367, "epoch": 770} {"train_loss": -5.379617691040039, "global_step": 32368, "epoch": 770} {"train_loss": -5.391610622406006, "global_step": 32369, "epoch": 770} {"train_loss": -5.434366226196289, "global_step": 32370, "epoch": 770} {"train_loss": -5.577836036682129, "global_step": 32371, "epoch": 770} {"train_loss": -5.497175216674805, "global_step": 32372, "epoch": 770} {"train_loss": -5.421821594238281, "global_step": 32373, "epoch": 770} {"train_loss": -5.535558700561523, "global_step": 32374, "epoch": 770} {"train_loss": -5.457335472106934, "global_step": 32375, "epoch": 770} {"train_loss": -5.489406585693359, "global_step": 32376, "epoch": 770} {"train_loss": -5.479513168334961, "global_step": 32377, "epoch": 770} {"train_loss": -5.525236129760742, "global_step": 32378, "epoch": 770} {"train_loss": -5.593679904937744, "global_step": 32379, "epoch": 770} {"train_loss": -5.5973005294799805, "global_step": 32380, "epoch": 770} {"train_loss": -5.503186021532331, "global_step": 32381, "epoch": 770, "val_loss": 74638.1640625} {"train_loss": -5.5375566482543945, "global_step": 32382, "epoch": 771} {"train_loss": -5.593783855438232, "global_step": 32383, "epoch": 771} {"train_loss": -5.563121795654297, "global_step": 32384, "epoch": 771} {"train_loss": -5.592438220977783, "global_step": 32385, "epoch": 771} {"train_loss": -5.513542652130127, "global_step": 32386, "epoch": 771} {"train_loss": -5.564126968383789, "global_step": 32387, "epoch": 771} {"train_loss": -5.57545280456543, "global_step": 32388, "epoch": 771} {"train_loss": -5.566844940185547, "global_step": 32389, "epoch": 771} {"train_loss": -5.576872825622559, "global_step": 32390, "epoch": 771} {"train_loss": -5.545671463012695, "global_step": 32391, "epoch": 771} {"train_loss": -5.550649166107178, "global_step": 32392, "epoch": 771} {"train_loss": -5.472559928894043, "global_step": 32393, "epoch": 771} {"train_loss": -5.399701118469238, "global_step": 32394, "epoch": 771} {"train_loss": -5.584651947021484, "global_step": 32395, "epoch": 771} {"train_loss": -5.652118682861328, "global_step": 32396, "epoch": 771} {"train_loss": -5.478240966796875, "global_step": 32397, "epoch": 771} {"train_loss": -5.505853176116943, "global_step": 32398, "epoch": 771} {"train_loss": -5.585909843444824, "global_step": 32399, "epoch": 771} {"train_loss": -5.506771087646484, "global_step": 32400, "epoch": 771} {"train_loss": -5.454739093780518, "global_step": 32401, "epoch": 771} {"train_loss": -5.545453071594238, "global_step": 32402, "epoch": 771} {"train_loss": -5.479650020599365, "global_step": 32403, "epoch": 771} {"train_loss": -5.486940383911133, "global_step": 32404, "epoch": 771} {"train_loss": -5.435407638549805, "global_step": 32405, "epoch": 771} {"train_loss": -5.557981491088867, "global_step": 32406, "epoch": 771} {"train_loss": -5.474062919616699, "global_step": 32407, "epoch": 771} {"train_loss": -5.432535171508789, "global_step": 32408, "epoch": 771} {"train_loss": -5.596485614776611, "global_step": 32409, "epoch": 771} {"train_loss": -5.45017147064209, "global_step": 32410, "epoch": 771} {"train_loss": -5.396425247192383, "global_step": 32411, "epoch": 771} {"train_loss": -5.461280345916748, "global_step": 32412, "epoch": 771} {"train_loss": -5.371510028839111, "global_step": 32413, "epoch": 771} {"train_loss": -5.667116165161133, "global_step": 32414, "epoch": 771} {"train_loss": -5.652707576751709, "global_step": 32415, "epoch": 771} {"train_loss": -5.496227264404297, "global_step": 32416, "epoch": 771} {"train_loss": -5.388976573944092, "global_step": 32417, "epoch": 771} {"train_loss": -5.419157981872559, "global_step": 32418, "epoch": 771} {"train_loss": -5.578802108764648, "global_step": 32419, "epoch": 771} {"train_loss": -5.391785144805908, "global_step": 32420, "epoch": 771} {"train_loss": -5.359615802764893, "global_step": 32421, "epoch": 771} {"train_loss": -5.511103630065918, "global_step": 32422, "epoch": 771} {"train_loss": -5.50743013336545, "global_step": 32423, "epoch": 771, "val_loss": 74635.0234375} {"train_loss": -5.492690563201904, "global_step": 32424, "epoch": 772} {"train_loss": -5.475793838500977, "global_step": 32425, "epoch": 772} {"train_loss": -5.487179279327393, "global_step": 32426, "epoch": 772} {"train_loss": -5.411733150482178, "global_step": 32427, "epoch": 772} {"train_loss": -5.611817359924316, "global_step": 32428, "epoch": 772} {"train_loss": -5.441801071166992, "global_step": 32429, "epoch": 772} {"train_loss": -5.549338340759277, "global_step": 32430, "epoch": 772} {"train_loss": -5.538245677947998, "global_step": 32431, "epoch": 772} {"train_loss": -5.5810546875, "global_step": 32432, "epoch": 772} {"train_loss": -5.569380760192871, "global_step": 32433, "epoch": 772} {"train_loss": -5.5802001953125, "global_step": 32434, "epoch": 772} {"train_loss": -5.483460426330566, "global_step": 32435, "epoch": 772} {"train_loss": -5.341649055480957, "global_step": 32436, "epoch": 772} {"train_loss": -5.519863128662109, "global_step": 32437, "epoch": 772} {"train_loss": -5.603856086730957, "global_step": 32438, "epoch": 772} {"train_loss": -5.461637496948242, "global_step": 32439, "epoch": 772} {"train_loss": -5.382932186126709, "global_step": 32440, "epoch": 772} {"train_loss": -5.411911964416504, "global_step": 32441, "epoch": 772} {"train_loss": -5.423410415649414, "global_step": 32442, "epoch": 772} {"train_loss": -5.373963356018066, "global_step": 32443, "epoch": 772} {"train_loss": -5.535743713378906, "global_step": 32444, "epoch": 772} {"train_loss": -5.441622257232666, "global_step": 32445, "epoch": 772} {"train_loss": -5.279528617858887, "global_step": 32446, "epoch": 772} {"train_loss": -5.559615135192871, "global_step": 32447, "epoch": 772} {"train_loss": -5.541470050811768, "global_step": 32448, "epoch": 772} {"train_loss": -5.4760637283325195, "global_step": 32449, "epoch": 772} {"train_loss": -5.379678249359131, "global_step": 32450, "epoch": 772} {"train_loss": -5.467626571655273, "global_step": 32451, "epoch": 772} {"train_loss": -5.4352312088012695, "global_step": 32452, "epoch": 772} {"train_loss": -5.4994797706604, "global_step": 32453, "epoch": 772} {"train_loss": -5.507746696472168, "global_step": 32454, "epoch": 772} {"train_loss": -5.462429046630859, "global_step": 32455, "epoch": 772} {"train_loss": -5.463881015777588, "global_step": 32456, "epoch": 772} {"train_loss": -5.516386032104492, "global_step": 32457, "epoch": 772} {"train_loss": -5.570715427398682, "global_step": 32458, "epoch": 772} {"train_loss": -5.600703239440918, "global_step": 32459, "epoch": 772} {"train_loss": -5.387441635131836, "global_step": 32460, "epoch": 772} {"train_loss": -5.480534076690674, "global_step": 32461, "epoch": 772} {"train_loss": -5.544076442718506, "global_step": 32462, "epoch": 772} {"train_loss": -5.543234348297119, "global_step": 32463, "epoch": 772} {"train_loss": -5.574488639831543, "global_step": 32464, "epoch": 772} {"train_loss": -5.489479859670003, "global_step": 32465, "epoch": 772, "val_loss": 74538.6953125} {"train_loss": -5.447822093963623, "global_step": 32466, "epoch": 773} {"train_loss": -5.61634635925293, "global_step": 32467, "epoch": 773} {"train_loss": -5.551941394805908, "global_step": 32468, "epoch": 773} {"train_loss": -5.5562520027160645, "global_step": 32469, "epoch": 773} {"train_loss": -5.494069576263428, "global_step": 32470, "epoch": 773} {"train_loss": -5.405881881713867, "global_step": 32471, "epoch": 773} {"train_loss": -5.448396682739258, "global_step": 32472, "epoch": 773} {"train_loss": -5.41941499710083, "global_step": 32473, "epoch": 773} {"train_loss": -5.580532073974609, "global_step": 32474, "epoch": 773} {"train_loss": -5.498791694641113, "global_step": 32475, "epoch": 773} {"train_loss": -5.51600980758667, "global_step": 32476, "epoch": 773} {"train_loss": -5.5465192794799805, "global_step": 32477, "epoch": 773} {"train_loss": -5.451591491699219, "global_step": 32478, "epoch": 773} {"train_loss": -5.577601432800293, "global_step": 32479, "epoch": 773} {"train_loss": -5.428822040557861, "global_step": 32480, "epoch": 773} {"train_loss": -5.555150032043457, "global_step": 32481, "epoch": 773} {"train_loss": -5.452624320983887, "global_step": 32482, "epoch": 773} {"train_loss": -5.493618965148926, "global_step": 32483, "epoch": 773} {"train_loss": -5.612820625305176, "global_step": 32484, "epoch": 773} {"train_loss": -5.475003242492676, "global_step": 32485, "epoch": 773} {"train_loss": -5.553652763366699, "global_step": 32486, "epoch": 773} {"train_loss": -5.407961368560791, "global_step": 32487, "epoch": 773} {"train_loss": -5.609238624572754, "global_step": 32488, "epoch": 773} {"train_loss": -5.3910369873046875, "global_step": 32489, "epoch": 773} {"train_loss": -5.533393859863281, "global_step": 32490, "epoch": 773} {"train_loss": -5.442841529846191, "global_step": 32491, "epoch": 773} {"train_loss": -5.450927257537842, "global_step": 32492, "epoch": 773} {"train_loss": -5.66040563583374, "global_step": 32493, "epoch": 773} {"train_loss": -5.465970993041992, "global_step": 32494, "epoch": 773} {"train_loss": -5.420071601867676, "global_step": 32495, "epoch": 773} {"train_loss": -5.510430335998535, "global_step": 32496, "epoch": 773} {"train_loss": -5.439043998718262, "global_step": 32497, "epoch": 773} {"train_loss": -5.417665958404541, "global_step": 32498, "epoch": 773} {"train_loss": -5.547780990600586, "global_step": 32499, "epoch": 773} {"train_loss": -5.530181407928467, "global_step": 32500, "epoch": 773} {"train_loss": -5.502634048461914, "global_step": 32501, "epoch": 773} {"train_loss": -5.536049842834473, "global_step": 32502, "epoch": 773} {"train_loss": -5.472099304199219, "global_step": 32503, "epoch": 773} {"train_loss": -5.512062072753906, "global_step": 32504, "epoch": 773} {"train_loss": -5.42846155166626, "global_step": 32505, "epoch": 773} {"train_loss": -5.5864033699035645, "global_step": 32506, "epoch": 773} {"train_loss": -5.504336493355887, "global_step": 32507, "epoch": 773, "val_loss": 74865.09375} {"train_loss": -5.480478286743164, "global_step": 32508, "epoch": 774} {"train_loss": -5.624455451965332, "global_step": 32509, "epoch": 774} {"train_loss": -5.505825519561768, "global_step": 32510, "epoch": 774} {"train_loss": -5.576418399810791, "global_step": 32511, "epoch": 774} {"train_loss": -5.489753246307373, "global_step": 32512, "epoch": 774} {"train_loss": -5.556796073913574, "global_step": 32513, "epoch": 774} {"train_loss": -5.70736837387085, "global_step": 32514, "epoch": 774} {"train_loss": -5.499309539794922, "global_step": 32515, "epoch": 774} {"train_loss": -5.495556831359863, "global_step": 32516, "epoch": 774} {"train_loss": -5.437658309936523, "global_step": 32517, "epoch": 774} {"train_loss": -5.3749613761901855, "global_step": 32518, "epoch": 774} {"train_loss": -5.481595039367676, "global_step": 32519, "epoch": 774} {"train_loss": -5.423050403594971, "global_step": 32520, "epoch": 774} {"train_loss": -5.444094657897949, "global_step": 32521, "epoch": 774} {"train_loss": -5.572346210479736, "global_step": 32522, "epoch": 774} {"train_loss": -5.390490531921387, "global_step": 32523, "epoch": 774} {"train_loss": -5.411303997039795, "global_step": 32524, "epoch": 774} {"train_loss": -5.5188140869140625, "global_step": 32525, "epoch": 774} {"train_loss": -5.379459381103516, "global_step": 32526, "epoch": 774} {"train_loss": -5.550121307373047, "global_step": 32527, "epoch": 774} {"train_loss": -5.478795051574707, "global_step": 32528, "epoch": 774} {"train_loss": -5.5823822021484375, "global_step": 32529, "epoch": 774} {"train_loss": -5.427145957946777, "global_step": 32530, "epoch": 774} {"train_loss": -5.421280860900879, "global_step": 32531, "epoch": 774} {"train_loss": -5.412731170654297, "global_step": 32532, "epoch": 774} {"train_loss": -5.432873725891113, "global_step": 32533, "epoch": 774} {"train_loss": -5.49959135055542, "global_step": 32534, "epoch": 774} {"train_loss": -5.304439544677734, "global_step": 32535, "epoch": 774} {"train_loss": -5.502465724945068, "global_step": 32536, "epoch": 774} {"train_loss": -5.361673831939697, "global_step": 32537, "epoch": 774} {"train_loss": -5.455023765563965, "global_step": 32538, "epoch": 774} {"train_loss": -5.382949352264404, "global_step": 32539, "epoch": 774} {"train_loss": -5.532233238220215, "global_step": 32540, "epoch": 774} {"train_loss": -5.434780597686768, "global_step": 32541, "epoch": 774} {"train_loss": -5.335070610046387, "global_step": 32542, "epoch": 774} {"train_loss": -5.48425817489624, "global_step": 32543, "epoch": 774} {"train_loss": -5.423140525817871, "global_step": 32544, "epoch": 774} {"train_loss": -5.452132225036621, "global_step": 32545, "epoch": 774} {"train_loss": -5.474189758300781, "global_step": 32546, "epoch": 774} {"train_loss": -5.440816402435303, "global_step": 32547, "epoch": 774} {"train_loss": -5.520672798156738, "global_step": 32548, "epoch": 774} {"train_loss": -5.471853108633132, "global_step": 32549, "epoch": 774, "val_loss": 75291.6015625} {"train_loss": -5.4290947914123535, "global_step": 32550, "epoch": 775} {"train_loss": -5.591726779937744, "global_step": 32551, "epoch": 775} {"train_loss": -5.532296180725098, "global_step": 32552, "epoch": 775} {"train_loss": -5.523753643035889, "global_step": 32553, "epoch": 775} {"train_loss": -5.505059719085693, "global_step": 32554, "epoch": 775} {"train_loss": -5.540628433227539, "global_step": 32555, "epoch": 775} {"train_loss": -5.560961723327637, "global_step": 32556, "epoch": 775} {"train_loss": -5.480401039123535, "global_step": 32557, "epoch": 775} {"train_loss": -5.534819602966309, "global_step": 32558, "epoch": 775} {"train_loss": -5.420284271240234, "global_step": 32559, "epoch": 775} {"train_loss": -5.472600936889648, "global_step": 32560, "epoch": 775} {"train_loss": -5.53921365737915, "global_step": 32561, "epoch": 775} {"train_loss": -5.591770172119141, "global_step": 32562, "epoch": 775} {"train_loss": -5.5118513107299805, "global_step": 32563, "epoch": 775} {"train_loss": -5.469913482666016, "global_step": 32564, "epoch": 775} {"train_loss": -5.462708473205566, "global_step": 32565, "epoch": 775} {"train_loss": -5.508894920349121, "global_step": 32566, "epoch": 775} {"train_loss": -5.4756879806518555, "global_step": 32567, "epoch": 775} {"train_loss": -5.444066524505615, "global_step": 32568, "epoch": 775} {"train_loss": -5.499012470245361, "global_step": 32569, "epoch": 775} {"train_loss": -5.548969268798828, "global_step": 32570, "epoch": 775} {"train_loss": -5.539242744445801, "global_step": 32571, "epoch": 775} {"train_loss": -5.494935989379883, "global_step": 32572, "epoch": 775} {"train_loss": -5.671351432800293, "global_step": 32573, "epoch": 775} {"train_loss": -5.597858905792236, "global_step": 32574, "epoch": 775} {"train_loss": -5.484419822692871, "global_step": 32575, "epoch": 775} {"train_loss": -5.4603590965271, "global_step": 32576, "epoch": 775} {"train_loss": -5.633185386657715, "global_step": 32577, "epoch": 775} {"train_loss": -5.448528289794922, "global_step": 32578, "epoch": 775} {"train_loss": -5.477718353271484, "global_step": 32579, "epoch": 775} {"train_loss": -5.664890766143799, "global_step": 32580, "epoch": 775} {"train_loss": -5.509620666503906, "global_step": 32581, "epoch": 775} {"train_loss": -5.462423324584961, "global_step": 32582, "epoch": 775} {"train_loss": -5.497312545776367, "global_step": 32583, "epoch": 775} {"train_loss": -5.6067705154418945, "global_step": 32584, "epoch": 775} {"train_loss": -5.54908561706543, "global_step": 32585, "epoch": 775} {"train_loss": -5.483118057250977, "global_step": 32586, "epoch": 775} {"train_loss": -5.620439529418945, "global_step": 32587, "epoch": 775} {"train_loss": -5.386263370513916, "global_step": 32588, "epoch": 775} {"train_loss": -5.554880619049072, "global_step": 32589, "epoch": 775} {"train_loss": -5.3732757568359375, "global_step": 32590, "epoch": 775} {"train_loss": -5.520646072569347, "global_step": 32591, "epoch": 775, "val_loss": 74204.7734375} {"train_loss": -5.455237865447998, "global_step": 32592, "epoch": 776} {"train_loss": -5.566661357879639, "global_step": 32593, "epoch": 776} {"train_loss": -5.483005523681641, "global_step": 32594, "epoch": 776} {"train_loss": -5.5649309158325195, "global_step": 32595, "epoch": 776} {"train_loss": -5.482489109039307, "global_step": 32596, "epoch": 776} {"train_loss": -5.556097030639648, "global_step": 32597, "epoch": 776} {"train_loss": -5.622623920440674, "global_step": 32598, "epoch": 776} {"train_loss": -5.455455303192139, "global_step": 32599, "epoch": 776} {"train_loss": -5.616462707519531, "global_step": 32600, "epoch": 776} {"train_loss": -5.641505241394043, "global_step": 32601, "epoch": 776} {"train_loss": -5.540117263793945, "global_step": 32602, "epoch": 776} {"train_loss": -5.554098129272461, "global_step": 32603, "epoch": 776} {"train_loss": -5.545313835144043, "global_step": 32604, "epoch": 776} {"train_loss": -5.660113334655762, "global_step": 32605, "epoch": 776} {"train_loss": -5.582703590393066, "global_step": 32606, "epoch": 776} {"train_loss": -5.6495361328125, "global_step": 32607, "epoch": 776} {"train_loss": -5.471594333648682, "global_step": 32608, "epoch": 776} {"train_loss": -5.514527320861816, "global_step": 32609, "epoch": 776} {"train_loss": -5.38691520690918, "global_step": 32610, "epoch": 776} {"train_loss": -5.46658992767334, "global_step": 32611, "epoch": 776} {"train_loss": -5.402009010314941, "global_step": 32612, "epoch": 776} {"train_loss": -5.466139793395996, "global_step": 32613, "epoch": 776} {"train_loss": -5.469463348388672, "global_step": 32614, "epoch": 776} {"train_loss": -5.362396240234375, "global_step": 32615, "epoch": 776} {"train_loss": -5.491264820098877, "global_step": 32616, "epoch": 776} {"train_loss": -5.572188854217529, "global_step": 32617, "epoch": 776} {"train_loss": -5.399868011474609, "global_step": 32618, "epoch": 776} {"train_loss": -5.56417989730835, "global_step": 32619, "epoch": 776} {"train_loss": -5.580607891082764, "global_step": 32620, "epoch": 776} {"train_loss": -5.5215325355529785, "global_step": 32621, "epoch": 776} {"train_loss": -5.468960762023926, "global_step": 32622, "epoch": 776} {"train_loss": -5.4840087890625, "global_step": 32623, "epoch": 776} {"train_loss": -5.4040327072143555, "global_step": 32624, "epoch": 776} {"train_loss": -5.4770331382751465, "global_step": 32625, "epoch": 776} {"train_loss": -5.480789661407471, "global_step": 32626, "epoch": 776} {"train_loss": -5.3810834884643555, "global_step": 32627, "epoch": 776} {"train_loss": -5.446684837341309, "global_step": 32628, "epoch": 776} {"train_loss": -5.455781936645508, "global_step": 32629, "epoch": 776} {"train_loss": -5.489830017089844, "global_step": 32630, "epoch": 776} {"train_loss": -5.528234481811523, "global_step": 32631, "epoch": 776} {"train_loss": -5.502196311950684, "global_step": 32632, "epoch": 776} {"train_loss": -5.508542321977162, "global_step": 32633, "epoch": 776, "val_loss": 74407.40625} {"train_loss": -5.634596347808838, "global_step": 32634, "epoch": 777} {"train_loss": -5.6190032958984375, "global_step": 32635, "epoch": 777} {"train_loss": -5.526956558227539, "global_step": 32636, "epoch": 777} {"train_loss": -5.522490501403809, "global_step": 32637, "epoch": 777} {"train_loss": -5.524824142456055, "global_step": 32638, "epoch": 777} {"train_loss": -5.581480979919434, "global_step": 32639, "epoch": 777} {"train_loss": -5.53017520904541, "global_step": 32640, "epoch": 777} {"train_loss": -5.481705665588379, "global_step": 32641, "epoch": 777} {"train_loss": -5.438776969909668, "global_step": 32642, "epoch": 777} {"train_loss": -5.525173664093018, "global_step": 32643, "epoch": 777} {"train_loss": -5.540907859802246, "global_step": 32644, "epoch": 777} {"train_loss": -5.64579439163208, "global_step": 32645, "epoch": 777} {"train_loss": -5.522723197937012, "global_step": 32646, "epoch": 777} {"train_loss": -5.644110679626465, "global_step": 32647, "epoch": 777} {"train_loss": -5.489627838134766, "global_step": 32648, "epoch": 777} {"train_loss": -5.525838851928711, "global_step": 32649, "epoch": 777} {"train_loss": -5.55771541595459, "global_step": 32650, "epoch": 777} {"train_loss": -5.468177795410156, "global_step": 32651, "epoch": 777} {"train_loss": -5.488611698150635, "global_step": 32652, "epoch": 777} {"train_loss": -5.586177825927734, "global_step": 32653, "epoch": 777} {"train_loss": -5.555614471435547, "global_step": 32654, "epoch": 777} {"train_loss": -5.36827278137207, "global_step": 32655, "epoch": 777} {"train_loss": -5.558742523193359, "global_step": 32656, "epoch": 777} {"train_loss": -5.440959930419922, "global_step": 32657, "epoch": 777} {"train_loss": -5.411426067352295, "global_step": 32658, "epoch": 777} {"train_loss": -5.494568824768066, "global_step": 32659, "epoch": 777} {"train_loss": -5.616964340209961, "global_step": 32660, "epoch": 777} {"train_loss": -5.432938575744629, "global_step": 32661, "epoch": 777} {"train_loss": -5.520718574523926, "global_step": 32662, "epoch": 777} {"train_loss": -5.482692718505859, "global_step": 32663, "epoch": 777} {"train_loss": -5.346915245056152, "global_step": 32664, "epoch": 777} {"train_loss": -5.59471321105957, "global_step": 32665, "epoch": 777} {"train_loss": -5.588292121887207, "global_step": 32666, "epoch": 777} {"train_loss": -5.548576831817627, "global_step": 32667, "epoch": 777} {"train_loss": -5.496290683746338, "global_step": 32668, "epoch": 777} {"train_loss": -5.528979778289795, "global_step": 32669, "epoch": 777} {"train_loss": -5.508909702301025, "global_step": 32670, "epoch": 777} {"train_loss": -5.429689407348633, "global_step": 32671, "epoch": 777} {"train_loss": -5.552288055419922, "global_step": 32672, "epoch": 777} {"train_loss": -5.443018913269043, "global_step": 32673, "epoch": 777} {"train_loss": -5.537172317504883, "global_step": 32674, "epoch": 777} {"train_loss": -5.516886733827137, "global_step": 32675, "epoch": 777, "val_loss": 75060.3828125} {"train_loss": -5.5126471519470215, "global_step": 32676, "epoch": 778} {"train_loss": -5.512297630310059, "global_step": 32677, "epoch": 778} {"train_loss": -5.539028167724609, "global_step": 32678, "epoch": 778} {"train_loss": -5.680630207061768, "global_step": 32679, "epoch": 778} {"train_loss": -5.466629981994629, "global_step": 32680, "epoch": 778} {"train_loss": -5.5683674812316895, "global_step": 32681, "epoch": 778} {"train_loss": -5.5225677490234375, "global_step": 32682, "epoch": 778} {"train_loss": -5.492254257202148, "global_step": 32683, "epoch": 778} {"train_loss": -5.625920295715332, "global_step": 32684, "epoch": 778} {"train_loss": -5.511784553527832, "global_step": 32685, "epoch": 778} {"train_loss": -5.54026460647583, "global_step": 32686, "epoch": 778} {"train_loss": -5.526251316070557, "global_step": 32687, "epoch": 778} {"train_loss": -5.482843399047852, "global_step": 32688, "epoch": 778} {"train_loss": -5.539461612701416, "global_step": 32689, "epoch": 778} {"train_loss": -5.421992301940918, "global_step": 32690, "epoch": 778} {"train_loss": -5.4449262619018555, "global_step": 32691, "epoch": 778} {"train_loss": -5.615649223327637, "global_step": 32692, "epoch": 778} {"train_loss": -5.558032512664795, "global_step": 32693, "epoch": 778} {"train_loss": -5.6294264793396, "global_step": 32694, "epoch": 778} {"train_loss": -5.631630897521973, "global_step": 32695, "epoch": 778} {"train_loss": -5.349081039428711, "global_step": 32696, "epoch": 778} {"train_loss": -5.513866424560547, "global_step": 32697, "epoch": 778} {"train_loss": -5.438654899597168, "global_step": 32698, "epoch": 778} {"train_loss": -5.478508472442627, "global_step": 32699, "epoch": 778} {"train_loss": -5.54671573638916, "global_step": 32700, "epoch": 778} {"train_loss": -5.636719226837158, "global_step": 32701, "epoch": 778} {"train_loss": -5.499122619628906, "global_step": 32702, "epoch": 778} {"train_loss": -5.629364490509033, "global_step": 32703, "epoch": 778} {"train_loss": -5.549478530883789, "global_step": 32704, "epoch": 778} {"train_loss": -5.502241134643555, "global_step": 32705, "epoch": 778} {"train_loss": -5.435171127319336, "global_step": 32706, "epoch": 778} {"train_loss": -5.610359191894531, "global_step": 32707, "epoch": 778} {"train_loss": -5.4328179359436035, "global_step": 32708, "epoch": 778} {"train_loss": -5.400773525238037, "global_step": 32709, "epoch": 778} {"train_loss": -5.482882976531982, "global_step": 32710, "epoch": 778} {"train_loss": -5.419436931610107, "global_step": 32711, "epoch": 778} {"train_loss": -5.455039978027344, "global_step": 32712, "epoch": 778} {"train_loss": -5.682759761810303, "global_step": 32713, "epoch": 778} {"train_loss": -5.512914657592773, "global_step": 32714, "epoch": 778} {"train_loss": -5.546424865722656, "global_step": 32715, "epoch": 778} {"train_loss": -5.533249855041504, "global_step": 32716, "epoch": 778} {"train_loss": -5.5208943003699895, "global_step": 32717, "epoch": 778, "val_loss": 74565.1875} {"train_loss": -5.677404403686523, "global_step": 32718, "epoch": 779} {"train_loss": -5.380908012390137, "global_step": 32719, "epoch": 779} {"train_loss": -5.474992752075195, "global_step": 32720, "epoch": 779} {"train_loss": -5.561277389526367, "global_step": 32721, "epoch": 779} {"train_loss": -5.495752811431885, "global_step": 32722, "epoch": 779} {"train_loss": -5.3460917472839355, "global_step": 32723, "epoch": 779} {"train_loss": -5.507037162780762, "global_step": 32724, "epoch": 779} {"train_loss": -5.488466262817383, "global_step": 32725, "epoch": 779} {"train_loss": -5.518441200256348, "global_step": 32726, "epoch": 779} {"train_loss": -5.506486892700195, "global_step": 32727, "epoch": 779} {"train_loss": -5.609827518463135, "global_step": 32728, "epoch": 779} {"train_loss": -5.5458550453186035, "global_step": 32729, "epoch": 779} {"train_loss": -5.520362377166748, "global_step": 32730, "epoch": 779} {"train_loss": -5.633033752441406, "global_step": 32731, "epoch": 779} {"train_loss": -5.686796188354492, "global_step": 32732, "epoch": 779} {"train_loss": -5.5553388595581055, "global_step": 32733, "epoch": 779} {"train_loss": -5.451639652252197, "global_step": 32734, "epoch": 779} {"train_loss": -5.5194878578186035, "global_step": 32735, "epoch": 779} {"train_loss": -5.445742130279541, "global_step": 32736, "epoch": 779} {"train_loss": -5.449288845062256, "global_step": 32737, "epoch": 779} {"train_loss": -5.561537742614746, "global_step": 32738, "epoch": 779} {"train_loss": -5.44233512878418, "global_step": 32739, "epoch": 779} {"train_loss": -5.522869110107422, "global_step": 32740, "epoch": 779} {"train_loss": -5.4107160568237305, "global_step": 32741, "epoch": 779} {"train_loss": -5.528589248657227, "global_step": 32742, "epoch": 779} {"train_loss": -5.521183967590332, "global_step": 32743, "epoch": 779} {"train_loss": -5.455050945281982, "global_step": 32744, "epoch": 779} {"train_loss": -5.547996520996094, "global_step": 32745, "epoch": 779} {"train_loss": -5.4820098876953125, "global_step": 32746, "epoch": 779} {"train_loss": -5.439344882965088, "global_step": 32747, "epoch": 779} {"train_loss": -5.525094985961914, "global_step": 32748, "epoch": 779} {"train_loss": -5.478528022766113, "global_step": 32749, "epoch": 779} {"train_loss": -5.591365337371826, "global_step": 32750, "epoch": 779} {"train_loss": -5.656491279602051, "global_step": 32751, "epoch": 779} {"train_loss": -5.357166290283203, "global_step": 32752, "epoch": 779} {"train_loss": -5.455255508422852, "global_step": 32753, "epoch": 779} {"train_loss": -5.40465784072876, "global_step": 32754, "epoch": 779} {"train_loss": -5.373983383178711, "global_step": 32755, "epoch": 779} {"train_loss": -5.41806173324585, "global_step": 32756, "epoch": 779} {"train_loss": -5.547995567321777, "global_step": 32757, "epoch": 779} {"train_loss": -5.511777877807617, "global_step": 32758, "epoch": 779} {"train_loss": -5.503710247221447, "global_step": 32759, "epoch": 779, "val_loss": 74645.296875} {"train_loss": -5.501214027404785, "global_step": 32760, "epoch": 780} {"train_loss": -5.302270412445068, "global_step": 32761, "epoch": 780} {"train_loss": -5.616876602172852, "global_step": 32762, "epoch": 780} {"train_loss": -5.504341125488281, "global_step": 32763, "epoch": 780} {"train_loss": -5.452968597412109, "global_step": 32764, "epoch": 780} {"train_loss": -5.326503753662109, "global_step": 32765, "epoch": 780} {"train_loss": -5.452597618103027, "global_step": 32766, "epoch": 780} {"train_loss": -5.1628265380859375, "global_step": 32767, "epoch": 780} {"train_loss": -5.3472771644592285, "global_step": 32768, "epoch": 780} {"train_loss": -5.440007209777832, "global_step": 32769, "epoch": 780} {"train_loss": -5.490571022033691, "global_step": 32770, "epoch": 780} {"train_loss": -5.280830383300781, "global_step": 32771, "epoch": 780} {"train_loss": -5.439905166625977, "global_step": 32772, "epoch": 780} {"train_loss": -5.442880630493164, "global_step": 32773, "epoch": 780} {"train_loss": -5.335646629333496, "global_step": 32774, "epoch": 780} {"train_loss": -5.486909866333008, "global_step": 32775, "epoch": 780} {"train_loss": -5.366739273071289, "global_step": 32776, "epoch": 780} {"train_loss": -5.436373710632324, "global_step": 32777, "epoch": 780} {"train_loss": -5.296491622924805, "global_step": 32778, "epoch": 780} {"train_loss": -5.478029251098633, "global_step": 32779, "epoch": 780} {"train_loss": -5.452746868133545, "global_step": 32780, "epoch": 780} {"train_loss": -5.400259971618652, "global_step": 32781, "epoch": 780} {"train_loss": -5.388404846191406, "global_step": 32782, "epoch": 780} {"train_loss": -5.451821327209473, "global_step": 32783, "epoch": 780} {"train_loss": -5.338417053222656, "global_step": 32784, "epoch": 780} {"train_loss": -5.477287292480469, "global_step": 32785, "epoch": 780} {"train_loss": -5.5108160972595215, "global_step": 32786, "epoch": 780} {"train_loss": -5.432539939880371, "global_step": 32787, "epoch": 780} {"train_loss": -5.385345458984375, "global_step": 32788, "epoch": 780} {"train_loss": -5.678584098815918, "global_step": 32789, "epoch": 780} {"train_loss": -5.5025858879089355, "global_step": 32790, "epoch": 780} {"train_loss": -5.5284423828125, "global_step": 32791, "epoch": 780} {"train_loss": -5.613931179046631, "global_step": 32792, "epoch": 780} {"train_loss": -5.5862717628479, "global_step": 32793, "epoch": 780} {"train_loss": -5.453742027282715, "global_step": 32794, "epoch": 780} {"train_loss": -5.5143938064575195, "global_step": 32795, "epoch": 780} {"train_loss": -5.482003211975098, "global_step": 32796, "epoch": 780} {"train_loss": -5.4789958000183105, "global_step": 32797, "epoch": 780} {"train_loss": -5.4496564865112305, "global_step": 32798, "epoch": 780} {"train_loss": -5.62934684753418, "global_step": 32799, "epoch": 780} {"train_loss": -5.449703693389893, "global_step": 32800, "epoch": 780} {"train_loss": -5.446854795728411, "global_step": 32801, "epoch": 780, "val_loss": 73799.328125} {"train_loss": -5.601766109466553, "global_step": 32802, "epoch": 781} {"train_loss": -5.50624942779541, "global_step": 32803, "epoch": 781} {"train_loss": -5.470120429992676, "global_step": 32804, "epoch": 781} {"train_loss": -5.554152011871338, "global_step": 32805, "epoch": 781} {"train_loss": -5.465568542480469, "global_step": 32806, "epoch": 781} {"train_loss": -5.585790157318115, "global_step": 32807, "epoch": 781} {"train_loss": -5.563436508178711, "global_step": 32808, "epoch": 781} {"train_loss": -5.471806526184082, "global_step": 32809, "epoch": 781} {"train_loss": -5.580313682556152, "global_step": 32810, "epoch": 781} {"train_loss": -5.430600643157959, "global_step": 32811, "epoch": 781} {"train_loss": -5.530203342437744, "global_step": 32812, "epoch": 781} {"train_loss": -5.507184028625488, "global_step": 32813, "epoch": 781} {"train_loss": -5.514618396759033, "global_step": 32814, "epoch": 781} {"train_loss": -5.490841865539551, "global_step": 32815, "epoch": 781} {"train_loss": -5.602458953857422, "global_step": 32816, "epoch": 781} {"train_loss": -5.553910732269287, "global_step": 32817, "epoch": 781} {"train_loss": -5.4665727615356445, "global_step": 32818, "epoch": 781} {"train_loss": -5.476690292358398, "global_step": 32819, "epoch": 781} {"train_loss": -5.53709077835083, "global_step": 32820, "epoch": 781} {"train_loss": -5.558743476867676, "global_step": 32821, "epoch": 781} {"train_loss": -5.507513046264648, "global_step": 32822, "epoch": 781} {"train_loss": -5.53233528137207, "global_step": 32823, "epoch": 781} {"train_loss": -5.576231002807617, "global_step": 32824, "epoch": 781} {"train_loss": -5.703451633453369, "global_step": 32825, "epoch": 781} {"train_loss": -5.448586463928223, "global_step": 32826, "epoch": 781} {"train_loss": -5.487949848175049, "global_step": 32827, "epoch": 781} {"train_loss": -5.619182586669922, "global_step": 32828, "epoch": 781} {"train_loss": -5.555505275726318, "global_step": 32829, "epoch": 781} {"train_loss": -5.435371398925781, "global_step": 32830, "epoch": 781} {"train_loss": -5.522996425628662, "global_step": 32831, "epoch": 781} {"train_loss": -5.4815673828125, "global_step": 32832, "epoch": 781} {"train_loss": -5.518782615661621, "global_step": 32833, "epoch": 781} {"train_loss": -5.524841785430908, "global_step": 32834, "epoch": 781} {"train_loss": -5.618679046630859, "global_step": 32835, "epoch": 781} {"train_loss": -5.624983787536621, "global_step": 32836, "epoch": 781} {"train_loss": -5.406345367431641, "global_step": 32837, "epoch": 781} {"train_loss": -5.513914108276367, "global_step": 32838, "epoch": 781} {"train_loss": -5.501021385192871, "global_step": 32839, "epoch": 781} {"train_loss": -5.498991966247559, "global_step": 32840, "epoch": 781} {"train_loss": -5.605964660644531, "global_step": 32841, "epoch": 781} {"train_loss": -5.488279819488525, "global_step": 32842, "epoch": 781} {"train_loss": -5.5214594432285855, "global_step": 32843, "epoch": 781, "val_loss": 74750.2578125} {"train_loss": -5.38138484954834, "global_step": 32844, "epoch": 782} {"train_loss": -5.5091376304626465, "global_step": 32845, "epoch": 782} {"train_loss": -5.31124210357666, "global_step": 32846, "epoch": 782} {"train_loss": -5.461421966552734, "global_step": 32847, "epoch": 782} {"train_loss": -5.562478065490723, "global_step": 32848, "epoch": 782} {"train_loss": -5.4346113204956055, "global_step": 32849, "epoch": 782} {"train_loss": -5.409204483032227, "global_step": 32850, "epoch": 782} {"train_loss": -5.602947235107422, "global_step": 32851, "epoch": 782} {"train_loss": -5.559922218322754, "global_step": 32852, "epoch": 782} {"train_loss": -5.600613117218018, "global_step": 32853, "epoch": 782} {"train_loss": -5.497445583343506, "global_step": 32854, "epoch": 782} {"train_loss": -5.508430480957031, "global_step": 32855, "epoch": 782} {"train_loss": -5.3927836418151855, "global_step": 32856, "epoch": 782} {"train_loss": -5.403735160827637, "global_step": 32857, "epoch": 782} {"train_loss": -5.517871856689453, "global_step": 32858, "epoch": 782} {"train_loss": -5.6110100746154785, "global_step": 32859, "epoch": 782} {"train_loss": -5.405532360076904, "global_step": 32860, "epoch": 782} {"train_loss": -5.532790184020996, "global_step": 32861, "epoch": 782} {"train_loss": -5.499190330505371, "global_step": 32862, "epoch": 782} {"train_loss": -5.468587398529053, "global_step": 32863, "epoch": 782} {"train_loss": -5.499727249145508, "global_step": 32864, "epoch": 782} {"train_loss": -5.617314338684082, "global_step": 32865, "epoch": 782} {"train_loss": -5.537985801696777, "global_step": 32866, "epoch": 782} {"train_loss": -5.533820152282715, "global_step": 32867, "epoch": 782} {"train_loss": -5.554224967956543, "global_step": 32868, "epoch": 782} {"train_loss": -5.63604211807251, "global_step": 32869, "epoch": 782} {"train_loss": -5.4343581199646, "global_step": 32870, "epoch": 782} {"train_loss": -5.541007995605469, "global_step": 32871, "epoch": 782} {"train_loss": -5.571467399597168, "global_step": 32872, "epoch": 782} {"train_loss": -5.5132527351379395, "global_step": 32873, "epoch": 782} {"train_loss": -5.44277286529541, "global_step": 32874, "epoch": 782} {"train_loss": -5.606019020080566, "global_step": 32875, "epoch": 782} {"train_loss": -5.429818153381348, "global_step": 32876, "epoch": 782} {"train_loss": -5.584355354309082, "global_step": 32877, "epoch": 782} {"train_loss": -5.493657112121582, "global_step": 32878, "epoch": 782} {"train_loss": -5.442078590393066, "global_step": 32879, "epoch": 782} {"train_loss": -5.541642189025879, "global_step": 32880, "epoch": 782} {"train_loss": -5.609628677368164, "global_step": 32881, "epoch": 782} {"train_loss": -5.555391311645508, "global_step": 32882, "epoch": 782} {"train_loss": -5.457049369812012, "global_step": 32883, "epoch": 782} {"train_loss": -5.622910499572754, "global_step": 32884, "epoch": 782} {"train_loss": -5.511813947132656, "global_step": 32885, "epoch": 782, "val_loss": 74655.6875} {"train_loss": -5.444521903991699, "global_step": 32886, "epoch": 783} {"train_loss": -5.496673583984375, "global_step": 32887, "epoch": 783} {"train_loss": -5.4710893630981445, "global_step": 32888, "epoch": 783} {"train_loss": -5.507835388183594, "global_step": 32889, "epoch": 783} {"train_loss": -5.520356178283691, "global_step": 32890, "epoch": 783} {"train_loss": -5.517899513244629, "global_step": 32891, "epoch": 783} {"train_loss": -5.426002502441406, "global_step": 32892, "epoch": 783} {"train_loss": -5.55587911605835, "global_step": 32893, "epoch": 783} {"train_loss": -5.532237529754639, "global_step": 32894, "epoch": 783} {"train_loss": -5.4841437339782715, "global_step": 32895, "epoch": 783} {"train_loss": -5.67063570022583, "global_step": 32896, "epoch": 783} {"train_loss": -5.560723304748535, "global_step": 32897, "epoch": 783} {"train_loss": -5.519391059875488, "global_step": 32898, "epoch": 783} {"train_loss": -5.530941963195801, "global_step": 32899, "epoch": 783} {"train_loss": -5.634607315063477, "global_step": 32900, "epoch": 783} {"train_loss": -5.5534820556640625, "global_step": 32901, "epoch": 783} {"train_loss": -5.367712020874023, "global_step": 32902, "epoch": 783} {"train_loss": -5.659917831420898, "global_step": 32903, "epoch": 783} {"train_loss": -5.615294456481934, "global_step": 32904, "epoch": 783} {"train_loss": -5.4368367195129395, "global_step": 32905, "epoch": 783} {"train_loss": -5.601014137268066, "global_step": 32906, "epoch": 783} {"train_loss": -5.475580215454102, "global_step": 32907, "epoch": 783} {"train_loss": -5.5900163650512695, "global_step": 32908, "epoch": 783} {"train_loss": -5.4915266036987305, "global_step": 32909, "epoch": 783} {"train_loss": -5.3990373611450195, "global_step": 32910, "epoch": 783} {"train_loss": -5.519412517547607, "global_step": 32911, "epoch": 783} {"train_loss": -5.478297710418701, "global_step": 32912, "epoch": 783} {"train_loss": -5.657370090484619, "global_step": 32913, "epoch": 783} {"train_loss": -5.59277868270874, "global_step": 32914, "epoch": 783} {"train_loss": -5.542870044708252, "global_step": 32915, "epoch": 783} {"train_loss": -5.552346229553223, "global_step": 32916, "epoch": 783} {"train_loss": -5.614846229553223, "global_step": 32917, "epoch": 783} {"train_loss": -5.583587646484375, "global_step": 32918, "epoch": 783} {"train_loss": -5.5263166427612305, "global_step": 32919, "epoch": 783} {"train_loss": -5.549208164215088, "global_step": 32920, "epoch": 783} {"train_loss": -5.639479637145996, "global_step": 32921, "epoch": 783} {"train_loss": -5.493801116943359, "global_step": 32922, "epoch": 783} {"train_loss": -5.4756975173950195, "global_step": 32923, "epoch": 783} {"train_loss": -5.537816047668457, "global_step": 32924, "epoch": 783} {"train_loss": -5.460389137268066, "global_step": 32925, "epoch": 783} {"train_loss": -5.577793598175049, "global_step": 32926, "epoch": 783} {"train_loss": -5.532860017958141, "global_step": 32927, "epoch": 783, "val_loss": 75047.1953125} {"train_loss": -5.475700855255127, "global_step": 32928, "epoch": 784} {"train_loss": -5.635310173034668, "global_step": 32929, "epoch": 784} {"train_loss": -5.470179080963135, "global_step": 32930, "epoch": 784} {"train_loss": -5.42203950881958, "global_step": 32931, "epoch": 784} {"train_loss": -5.643650054931641, "global_step": 32932, "epoch": 784} {"train_loss": -5.6598687171936035, "global_step": 32933, "epoch": 784} {"train_loss": -5.546176433563232, "global_step": 32934, "epoch": 784} {"train_loss": -5.435360431671143, "global_step": 32935, "epoch": 784} {"train_loss": -5.713332653045654, "global_step": 32936, "epoch": 784} {"train_loss": -5.541849136352539, "global_step": 32937, "epoch": 784} {"train_loss": -5.398615837097168, "global_step": 32938, "epoch": 784} {"train_loss": -5.441971778869629, "global_step": 32939, "epoch": 784} {"train_loss": -5.695903301239014, "global_step": 32940, "epoch": 784} {"train_loss": -5.452025413513184, "global_step": 32941, "epoch": 784} {"train_loss": -5.317394733428955, "global_step": 32942, "epoch": 784} {"train_loss": -5.54495906829834, "global_step": 32943, "epoch": 784} {"train_loss": -5.272187232971191, "global_step": 32944, "epoch": 784} {"train_loss": -5.618930816650391, "global_step": 32945, "epoch": 784} {"train_loss": -5.464970111846924, "global_step": 32946, "epoch": 784} {"train_loss": -5.290383815765381, "global_step": 32947, "epoch": 784} {"train_loss": -5.485500335693359, "global_step": 32948, "epoch": 784} {"train_loss": -5.373903751373291, "global_step": 32949, "epoch": 784} {"train_loss": -5.521448135375977, "global_step": 32950, "epoch": 784} {"train_loss": -5.501254081726074, "global_step": 32951, "epoch": 784} {"train_loss": -5.42611026763916, "global_step": 32952, "epoch": 784} {"train_loss": -5.612983226776123, "global_step": 32953, "epoch": 784} {"train_loss": -5.631019115447998, "global_step": 32954, "epoch": 784} {"train_loss": -5.403988838195801, "global_step": 32955, "epoch": 784} {"train_loss": -5.625615119934082, "global_step": 32956, "epoch": 784} {"train_loss": -5.371190547943115, "global_step": 32957, "epoch": 784} {"train_loss": -5.487924575805664, "global_step": 32958, "epoch": 784} {"train_loss": -5.513249397277832, "global_step": 32959, "epoch": 784} {"train_loss": -5.298474311828613, "global_step": 32960, "epoch": 784} {"train_loss": -5.5394606590271, "global_step": 32961, "epoch": 784} {"train_loss": -5.423415184020996, "global_step": 32962, "epoch": 784} {"train_loss": -5.365679740905762, "global_step": 32963, "epoch": 784} {"train_loss": -5.592529296875, "global_step": 32964, "epoch": 784} {"train_loss": -5.617945671081543, "global_step": 32965, "epoch": 784} {"train_loss": -5.517956733703613, "global_step": 32966, "epoch": 784} {"train_loss": -5.588313102722168, "global_step": 32967, "epoch": 784} {"train_loss": -5.508414268493652, "global_step": 32968, "epoch": 784} {"train_loss": -5.499927202860515, "global_step": 32969, "epoch": 784, "val_loss": 74274.7578125} {"train_loss": -5.534519672393799, "global_step": 32970, "epoch": 785} {"train_loss": -5.6453447341918945, "global_step": 32971, "epoch": 785} {"train_loss": -5.465328216552734, "global_step": 32972, "epoch": 785} {"train_loss": -5.608242034912109, "global_step": 32973, "epoch": 785} {"train_loss": -5.572767734527588, "global_step": 32974, "epoch": 785} {"train_loss": -5.5215606689453125, "global_step": 32975, "epoch": 785} {"train_loss": -5.487663745880127, "global_step": 32976, "epoch": 785} {"train_loss": -5.577070236206055, "global_step": 32977, "epoch": 785} {"train_loss": -5.533284664154053, "global_step": 32978, "epoch": 785} {"train_loss": -5.490523338317871, "global_step": 32979, "epoch": 785} {"train_loss": -5.352638244628906, "global_step": 32980, "epoch": 785} {"train_loss": -5.460234642028809, "global_step": 32981, "epoch": 785} {"train_loss": -5.462370872497559, "global_step": 32982, "epoch": 785} {"train_loss": -5.306792736053467, "global_step": 32983, "epoch": 785} {"train_loss": -5.510455131530762, "global_step": 32984, "epoch": 785} {"train_loss": -5.409686088562012, "global_step": 32985, "epoch": 785} {"train_loss": -5.415299892425537, "global_step": 32986, "epoch": 785} {"train_loss": -5.544266223907471, "global_step": 32987, "epoch": 785} {"train_loss": -5.419355392456055, "global_step": 32988, "epoch": 785} {"train_loss": -5.620477676391602, "global_step": 32989, "epoch": 785} {"train_loss": -5.39539098739624, "global_step": 32990, "epoch": 785} {"train_loss": -5.466852188110352, "global_step": 32991, "epoch": 785} {"train_loss": -5.516149997711182, "global_step": 32992, "epoch": 785} {"train_loss": -5.414848327636719, "global_step": 32993, "epoch": 785} {"train_loss": -5.565427780151367, "global_step": 32994, "epoch": 785} {"train_loss": -5.441498756408691, "global_step": 32995, "epoch": 785} {"train_loss": -5.41909122467041, "global_step": 32996, "epoch": 785} {"train_loss": -5.558966636657715, "global_step": 32997, "epoch": 785} {"train_loss": -5.627943992614746, "global_step": 32998, "epoch": 785} {"train_loss": -5.489529609680176, "global_step": 32999, "epoch": 785} {"train_loss": -5.572464466094971, "global_step": 33000, "epoch": 785} {"train_loss": -5.450756072998047, "global_step": 33001, "epoch": 785} {"train_loss": -5.399312973022461, "global_step": 33002, "epoch": 785} {"train_loss": -5.653245449066162, "global_step": 33003, "epoch": 785} {"train_loss": -5.595813751220703, "global_step": 33004, "epoch": 785} {"train_loss": -5.488829135894775, "global_step": 33005, "epoch": 785} {"train_loss": -5.522584915161133, "global_step": 33006, "epoch": 785} {"train_loss": -5.4156670570373535, "global_step": 33007, "epoch": 785} {"train_loss": -5.451570987701416, "global_step": 33008, "epoch": 785} {"train_loss": -5.591023921966553, "global_step": 33009, "epoch": 785} {"train_loss": -5.438209056854248, "global_step": 33010, "epoch": 785} {"train_loss": -5.496580680211385, "global_step": 33011, "epoch": 785, "val_loss": 74435.25} {"train_loss": -5.365148544311523, "global_step": 33012, "epoch": 786} {"train_loss": -5.495216369628906, "global_step": 33013, "epoch": 786} {"train_loss": -5.696944713592529, "global_step": 33014, "epoch": 786} {"train_loss": -5.682369232177734, "global_step": 33015, "epoch": 786} {"train_loss": -5.526954650878906, "global_step": 33016, "epoch": 786} {"train_loss": -5.353476524353027, "global_step": 33017, "epoch": 786} {"train_loss": -5.446688652038574, "global_step": 33018, "epoch": 786} {"train_loss": -5.337332248687744, "global_step": 33019, "epoch": 786} {"train_loss": -5.566158294677734, "global_step": 33020, "epoch": 786} {"train_loss": -5.422714710235596, "global_step": 33021, "epoch": 786} {"train_loss": -5.614686489105225, "global_step": 33022, "epoch": 786} {"train_loss": -5.546640396118164, "global_step": 33023, "epoch": 786} {"train_loss": -5.619740962982178, "global_step": 33024, "epoch": 786} {"train_loss": -5.615230560302734, "global_step": 33025, "epoch": 786} {"train_loss": -5.5917205810546875, "global_step": 33026, "epoch": 786} {"train_loss": -5.62399959564209, "global_step": 33027, "epoch": 786} {"train_loss": -5.466383934020996, "global_step": 33028, "epoch": 786} {"train_loss": -5.444131851196289, "global_step": 33029, "epoch": 786} {"train_loss": -5.654610633850098, "global_step": 33030, "epoch": 786} {"train_loss": -5.469498157501221, "global_step": 33031, "epoch": 786} {"train_loss": -5.381830215454102, "global_step": 33032, "epoch": 786} {"train_loss": -5.593550205230713, "global_step": 33033, "epoch": 786} {"train_loss": -5.533878803253174, "global_step": 33034, "epoch": 786} {"train_loss": -5.610568046569824, "global_step": 33035, "epoch": 786} {"train_loss": -5.43997049331665, "global_step": 33036, "epoch": 786} {"train_loss": -5.600874423980713, "global_step": 33037, "epoch": 786} {"train_loss": -5.57429313659668, "global_step": 33038, "epoch": 786} {"train_loss": -5.568259239196777, "global_step": 33039, "epoch": 786} {"train_loss": -5.5138044357299805, "global_step": 33040, "epoch": 786} {"train_loss": -5.52801513671875, "global_step": 33041, "epoch": 786} {"train_loss": -5.486309051513672, "global_step": 33042, "epoch": 786} {"train_loss": -5.454643249511719, "global_step": 33043, "epoch": 786} {"train_loss": -5.455385208129883, "global_step": 33044, "epoch": 786} {"train_loss": -5.5796098709106445, "global_step": 33045, "epoch": 786} {"train_loss": -5.628802299499512, "global_step": 33046, "epoch": 786} {"train_loss": -5.5270843505859375, "global_step": 33047, "epoch": 786} {"train_loss": -5.376582622528076, "global_step": 33048, "epoch": 786} {"train_loss": -5.489415645599365, "global_step": 33049, "epoch": 786} {"train_loss": -5.587507247924805, "global_step": 33050, "epoch": 786} {"train_loss": -5.434948444366455, "global_step": 33051, "epoch": 786} {"train_loss": -5.429859161376953, "global_step": 33052, "epoch": 786} {"train_loss": -5.521899552572341, "global_step": 33053, "epoch": 786, "val_loss": 73827.375} {"train_loss": -5.488550186157227, "global_step": 33054, "epoch": 787} {"train_loss": -5.4600830078125, "global_step": 33055, "epoch": 787} {"train_loss": -5.394388198852539, "global_step": 33056, "epoch": 787} {"train_loss": -5.636701583862305, "global_step": 33057, "epoch": 787} {"train_loss": -5.544642448425293, "global_step": 33058, "epoch": 787} {"train_loss": -5.571599006652832, "global_step": 33059, "epoch": 787} {"train_loss": -5.639786720275879, "global_step": 33060, "epoch": 787} {"train_loss": -5.437961101531982, "global_step": 33061, "epoch": 787} {"train_loss": -5.594897747039795, "global_step": 33062, "epoch": 787} {"train_loss": -5.649482250213623, "global_step": 33063, "epoch": 787} {"train_loss": -5.532268047332764, "global_step": 33064, "epoch": 787} {"train_loss": -5.576904296875, "global_step": 33065, "epoch": 787} {"train_loss": -5.485721111297607, "global_step": 33066, "epoch": 787} {"train_loss": -5.500054359436035, "global_step": 33067, "epoch": 787} {"train_loss": -5.563313961029053, "global_step": 33068, "epoch": 787} {"train_loss": -5.541409492492676, "global_step": 33069, "epoch": 787} {"train_loss": -5.521402835845947, "global_step": 33070, "epoch": 787} {"train_loss": -5.483166217803955, "global_step": 33071, "epoch": 787} {"train_loss": -5.56501579284668, "global_step": 33072, "epoch": 787} {"train_loss": -5.497683525085449, "global_step": 33073, "epoch": 787} {"train_loss": -5.581048965454102, "global_step": 33074, "epoch": 787} {"train_loss": -5.433071136474609, "global_step": 33075, "epoch": 787} {"train_loss": -5.615296840667725, "global_step": 33076, "epoch": 787} {"train_loss": -5.487412929534912, "global_step": 33077, "epoch": 787} {"train_loss": -5.454465389251709, "global_step": 33078, "epoch": 787} {"train_loss": -5.412506580352783, "global_step": 33079, "epoch": 787} {"train_loss": -5.544123649597168, "global_step": 33080, "epoch": 787} {"train_loss": -5.3621978759765625, "global_step": 33081, "epoch": 787} {"train_loss": -5.5608978271484375, "global_step": 33082, "epoch": 787} {"train_loss": -5.446758270263672, "global_step": 33083, "epoch": 787} {"train_loss": -5.340654373168945, "global_step": 33084, "epoch": 787} {"train_loss": -5.604921340942383, "global_step": 33085, "epoch": 787} {"train_loss": -5.3843231201171875, "global_step": 33086, "epoch": 787} {"train_loss": -5.460333347320557, "global_step": 33087, "epoch": 787} {"train_loss": -5.460914611816406, "global_step": 33088, "epoch": 787} {"train_loss": -5.337010860443115, "global_step": 33089, "epoch": 787} {"train_loss": -5.629289627075195, "global_step": 33090, "epoch": 787} {"train_loss": -5.506298065185547, "global_step": 33091, "epoch": 787} {"train_loss": -5.496432304382324, "global_step": 33092, "epoch": 787} {"train_loss": -5.628034591674805, "global_step": 33093, "epoch": 787} {"train_loss": -5.644894599914551, "global_step": 33094, "epoch": 787} {"train_loss": -5.517459358487811, "global_step": 33095, "epoch": 787, "val_loss": 74301.234375} {"train_loss": -5.505254745483398, "global_step": 33096, "epoch": 788} {"train_loss": -5.411370277404785, "global_step": 33097, "epoch": 788} {"train_loss": -5.61036491394043, "global_step": 33098, "epoch": 788} {"train_loss": -5.43266487121582, "global_step": 33099, "epoch": 788} {"train_loss": -5.547336101531982, "global_step": 33100, "epoch": 788} {"train_loss": -5.4570631980896, "global_step": 33101, "epoch": 788} {"train_loss": -5.5164031982421875, "global_step": 33102, "epoch": 788} {"train_loss": -5.479775428771973, "global_step": 33103, "epoch": 788} {"train_loss": -5.478410720825195, "global_step": 33104, "epoch": 788} {"train_loss": -5.478038311004639, "global_step": 33105, "epoch": 788} {"train_loss": -5.5622358322143555, "global_step": 33106, "epoch": 788} {"train_loss": -5.590136528015137, "global_step": 33107, "epoch": 788} {"train_loss": -5.504986763000488, "global_step": 33108, "epoch": 788} {"train_loss": -5.566179275512695, "global_step": 33109, "epoch": 788} {"train_loss": -5.552241802215576, "global_step": 33110, "epoch": 788} {"train_loss": -5.590765953063965, "global_step": 33111, "epoch": 788} {"train_loss": -5.614185333251953, "global_step": 33112, "epoch": 788} {"train_loss": -5.566609859466553, "global_step": 33113, "epoch": 788} {"train_loss": -5.4793572425842285, "global_step": 33114, "epoch": 788} {"train_loss": -5.50490665435791, "global_step": 33115, "epoch": 788} {"train_loss": -5.574582576751709, "global_step": 33116, "epoch": 788} {"train_loss": -5.401373863220215, "global_step": 33117, "epoch": 788} {"train_loss": -5.756454944610596, "global_step": 33118, "epoch": 788} {"train_loss": -5.387789249420166, "global_step": 33119, "epoch": 788} {"train_loss": -5.290322303771973, "global_step": 33120, "epoch": 788} {"train_loss": -5.4849395751953125, "global_step": 33121, "epoch": 788} {"train_loss": -5.415889739990234, "global_step": 33122, "epoch": 788} {"train_loss": -5.221010208129883, "global_step": 33123, "epoch": 788} {"train_loss": -5.581160545349121, "global_step": 33124, "epoch": 788} {"train_loss": -5.455479621887207, "global_step": 33125, "epoch": 788} {"train_loss": -5.327418327331543, "global_step": 33126, "epoch": 788} {"train_loss": -5.598230361938477, "global_step": 33127, "epoch": 788} {"train_loss": -5.352095603942871, "global_step": 33128, "epoch": 788} {"train_loss": -5.412448883056641, "global_step": 33129, "epoch": 788} {"train_loss": -5.326745986938477, "global_step": 33130, "epoch": 788} {"train_loss": -5.396763801574707, "global_step": 33131, "epoch": 788} {"train_loss": -5.446381568908691, "global_step": 33132, "epoch": 788} {"train_loss": -5.337991237640381, "global_step": 33133, "epoch": 788} {"train_loss": -5.5728983879089355, "global_step": 33134, "epoch": 788} {"train_loss": -5.41811466217041, "global_step": 33135, "epoch": 788} {"train_loss": -5.462878227233887, "global_step": 33136, "epoch": 788} {"train_loss": -5.479807921818325, "global_step": 33137, "epoch": 788, "val_loss": 75016.8046875} {"train_loss": -5.523303508758545, "global_step": 33138, "epoch": 789} {"train_loss": -5.448942184448242, "global_step": 33139, "epoch": 789} {"train_loss": -5.485220909118652, "global_step": 33140, "epoch": 789} {"train_loss": -5.4818034172058105, "global_step": 33141, "epoch": 789} {"train_loss": -5.565203666687012, "global_step": 33142, "epoch": 789} {"train_loss": -5.622954845428467, "global_step": 33143, "epoch": 789} {"train_loss": -5.479055404663086, "global_step": 33144, "epoch": 789} {"train_loss": -5.507116317749023, "global_step": 33145, "epoch": 789} {"train_loss": -5.539162635803223, "global_step": 33146, "epoch": 789} {"train_loss": -5.399111747741699, "global_step": 33147, "epoch": 789} {"train_loss": -5.45751953125, "global_step": 33148, "epoch": 789} {"train_loss": -5.479377746582031, "global_step": 33149, "epoch": 789} {"train_loss": -5.481086730957031, "global_step": 33150, "epoch": 789} {"train_loss": -5.551026821136475, "global_step": 33151, "epoch": 789} {"train_loss": -5.535833358764648, "global_step": 33152, "epoch": 789} {"train_loss": -5.525603294372559, "global_step": 33153, "epoch": 789} {"train_loss": -5.44441032409668, "global_step": 33154, "epoch": 789} {"train_loss": -5.550238609313965, "global_step": 33155, "epoch": 789} {"train_loss": -5.576980113983154, "global_step": 33156, "epoch": 789} {"train_loss": -5.537332534790039, "global_step": 33157, "epoch": 789} {"train_loss": -5.439288139343262, "global_step": 33158, "epoch": 789} {"train_loss": -5.640157699584961, "global_step": 33159, "epoch": 789} {"train_loss": -5.47159481048584, "global_step": 33160, "epoch": 789} {"train_loss": -5.4351043701171875, "global_step": 33161, "epoch": 789} {"train_loss": -5.536250114440918, "global_step": 33162, "epoch": 789} {"train_loss": -5.5199995040893555, "global_step": 33163, "epoch": 789} {"train_loss": -5.533552169799805, "global_step": 33164, "epoch": 789} {"train_loss": -5.598457336425781, "global_step": 33165, "epoch": 789} {"train_loss": -5.660717010498047, "global_step": 33166, "epoch": 789} {"train_loss": -5.518969535827637, "global_step": 33167, "epoch": 789} {"train_loss": -5.628358840942383, "global_step": 33168, "epoch": 789} {"train_loss": -5.529204368591309, "global_step": 33169, "epoch": 789} {"train_loss": -5.483426094055176, "global_step": 33170, "epoch": 789} {"train_loss": -5.565065383911133, "global_step": 33171, "epoch": 789} {"train_loss": -5.503727912902832, "global_step": 33172, "epoch": 789} {"train_loss": -5.661008834838867, "global_step": 33173, "epoch": 789} {"train_loss": -5.480810642242432, "global_step": 33174, "epoch": 789} {"train_loss": -5.54198694229126, "global_step": 33175, "epoch": 789} {"train_loss": -5.465387344360352, "global_step": 33176, "epoch": 789} {"train_loss": -5.447115898132324, "global_step": 33177, "epoch": 789} {"train_loss": -5.351363182067871, "global_step": 33178, "epoch": 789} {"train_loss": -5.517411322820754, "global_step": 33179, "epoch": 789, "val_loss": 74217.03125} {"train_loss": -5.619770050048828, "global_step": 33180, "epoch": 790} {"train_loss": -5.6465301513671875, "global_step": 33181, "epoch": 790} {"train_loss": -5.4199419021606445, "global_step": 33182, "epoch": 790} {"train_loss": -5.577628135681152, "global_step": 33183, "epoch": 790} {"train_loss": -5.550083637237549, "global_step": 33184, "epoch": 790} {"train_loss": -5.588046550750732, "global_step": 33185, "epoch": 790} {"train_loss": -5.49326753616333, "global_step": 33186, "epoch": 790} {"train_loss": -5.580814361572266, "global_step": 33187, "epoch": 790} {"train_loss": -5.562478065490723, "global_step": 33188, "epoch": 790} {"train_loss": -5.456312656402588, "global_step": 33189, "epoch": 790} {"train_loss": -5.5640869140625, "global_step": 33190, "epoch": 790} {"train_loss": -5.5352983474731445, "global_step": 33191, "epoch": 790} {"train_loss": -5.508581161499023, "global_step": 33192, "epoch": 790} {"train_loss": -5.501970291137695, "global_step": 33193, "epoch": 790} {"train_loss": -5.679815292358398, "global_step": 33194, "epoch": 790} {"train_loss": -5.585556983947754, "global_step": 33195, "epoch": 790} {"train_loss": -5.555741786956787, "global_step": 33196, "epoch": 790} {"train_loss": -5.554874420166016, "global_step": 33197, "epoch": 790} {"train_loss": -5.539242744445801, "global_step": 33198, "epoch": 790} {"train_loss": -5.595640659332275, "global_step": 33199, "epoch": 790} {"train_loss": -5.587677955627441, "global_step": 33200, "epoch": 790} {"train_loss": -5.565900802612305, "global_step": 33201, "epoch": 790} {"train_loss": -5.624698162078857, "global_step": 33202, "epoch": 790} {"train_loss": -5.485358238220215, "global_step": 33203, "epoch": 790} {"train_loss": -5.6249799728393555, "global_step": 33204, "epoch": 790} {"train_loss": -5.614459991455078, "global_step": 33205, "epoch": 790} {"train_loss": -5.608047008514404, "global_step": 33206, "epoch": 790} {"train_loss": -5.527694225311279, "global_step": 33207, "epoch": 790} {"train_loss": -5.436093330383301, "global_step": 33208, "epoch": 790} {"train_loss": -5.5617876052856445, "global_step": 33209, "epoch": 790} {"train_loss": -5.581694602966309, "global_step": 33210, "epoch": 790} {"train_loss": -5.3781938552856445, "global_step": 33211, "epoch": 790} {"train_loss": -5.56992769241333, "global_step": 33212, "epoch": 790} {"train_loss": -5.419647216796875, "global_step": 33213, "epoch": 790} {"train_loss": -5.466060638427734, "global_step": 33214, "epoch": 790} {"train_loss": -5.396636009216309, "global_step": 33215, "epoch": 790} {"train_loss": -5.415040493011475, "global_step": 33216, "epoch": 790} {"train_loss": -5.613035202026367, "global_step": 33217, "epoch": 790} {"train_loss": -5.496095657348633, "global_step": 33218, "epoch": 790} {"train_loss": -5.569601058959961, "global_step": 33219, "epoch": 790} {"train_loss": -5.595310688018799, "global_step": 33220, "epoch": 790} {"train_loss": -5.541278498513358, "global_step": 33221, "epoch": 790, "val_loss": 73793.46875} {"train_loss": -5.584367752075195, "global_step": 33222, "epoch": 791} {"train_loss": -5.514614105224609, "global_step": 33223, "epoch": 791} {"train_loss": -5.588794708251953, "global_step": 33224, "epoch": 791} {"train_loss": -5.5273051261901855, "global_step": 33225, "epoch": 791} {"train_loss": -5.624526023864746, "global_step": 33226, "epoch": 791} {"train_loss": -5.487260818481445, "global_step": 33227, "epoch": 791} {"train_loss": -5.619864463806152, "global_step": 33228, "epoch": 791} {"train_loss": -5.424342155456543, "global_step": 33229, "epoch": 791} {"train_loss": -5.511045455932617, "global_step": 33230, "epoch": 791} {"train_loss": -5.3897013664245605, "global_step": 33231, "epoch": 791} {"train_loss": -5.462201118469238, "global_step": 33232, "epoch": 791} {"train_loss": -5.505699634552002, "global_step": 33233, "epoch": 791} {"train_loss": -5.3997273445129395, "global_step": 33234, "epoch": 791} {"train_loss": -5.4394426345825195, "global_step": 33235, "epoch": 791} {"train_loss": -5.521953582763672, "global_step": 33236, "epoch": 791} {"train_loss": -5.392196178436279, "global_step": 33237, "epoch": 791} {"train_loss": -5.556138515472412, "global_step": 33238, "epoch": 791} {"train_loss": -5.5060319900512695, "global_step": 33239, "epoch": 791} {"train_loss": -5.450910568237305, "global_step": 33240, "epoch": 791} {"train_loss": -5.434756278991699, "global_step": 33241, "epoch": 791} {"train_loss": -5.414860725402832, "global_step": 33242, "epoch": 791} {"train_loss": -5.550266265869141, "global_step": 33243, "epoch": 791} {"train_loss": -5.382301330566406, "global_step": 33244, "epoch": 791} {"train_loss": -5.474546909332275, "global_step": 33245, "epoch": 791} {"train_loss": -5.351617336273193, "global_step": 33246, "epoch": 791} {"train_loss": -5.539030075073242, "global_step": 33247, "epoch": 791} {"train_loss": -5.600895404815674, "global_step": 33248, "epoch": 791} {"train_loss": -5.477667808532715, "global_step": 33249, "epoch": 791} {"train_loss": -5.513070583343506, "global_step": 33250, "epoch": 791} {"train_loss": -5.487021446228027, "global_step": 33251, "epoch": 791} {"train_loss": -5.493518829345703, "global_step": 33252, "epoch": 791} {"train_loss": -5.43692684173584, "global_step": 33253, "epoch": 791} {"train_loss": -5.380390167236328, "global_step": 33254, "epoch": 791} {"train_loss": -5.554594993591309, "global_step": 33255, "epoch": 791} {"train_loss": -5.423864841461182, "global_step": 33256, "epoch": 791} {"train_loss": -5.3717241287231445, "global_step": 33257, "epoch": 791} {"train_loss": -5.398929119110107, "global_step": 33258, "epoch": 791} {"train_loss": -5.4473490715026855, "global_step": 33259, "epoch": 791} {"train_loss": -5.522582054138184, "global_step": 33260, "epoch": 791} {"train_loss": -5.3995771408081055, "global_step": 33261, "epoch": 791} {"train_loss": -5.51338005065918, "global_step": 33262, "epoch": 791} {"train_loss": -5.479723158336821, "global_step": 33263, "epoch": 791, "val_loss": 74739.96875} {"train_loss": -5.4542951583862305, "global_step": 33264, "epoch": 792} {"train_loss": -5.589344024658203, "global_step": 33265, "epoch": 792} {"train_loss": -5.482390403747559, "global_step": 33266, "epoch": 792} {"train_loss": -5.385326385498047, "global_step": 33267, "epoch": 792} {"train_loss": -5.50273323059082, "global_step": 33268, "epoch": 792} {"train_loss": -5.601701736450195, "global_step": 33269, "epoch": 792} {"train_loss": -5.423715591430664, "global_step": 33270, "epoch": 792} {"train_loss": -5.442914009094238, "global_step": 33271, "epoch": 792} {"train_loss": -5.348677635192871, "global_step": 33272, "epoch": 792} {"train_loss": -5.502220153808594, "global_step": 33273, "epoch": 792} {"train_loss": -5.577221870422363, "global_step": 33274, "epoch": 792} {"train_loss": -5.495296955108643, "global_step": 33275, "epoch": 792} {"train_loss": -5.35197639465332, "global_step": 33276, "epoch": 792} {"train_loss": -5.4401750564575195, "global_step": 33277, "epoch": 792} {"train_loss": -5.4717631340026855, "global_step": 33278, "epoch": 792} {"train_loss": -5.498231887817383, "global_step": 33279, "epoch": 792} {"train_loss": -5.500746726989746, "global_step": 33280, "epoch": 792} {"train_loss": -5.540005683898926, "global_step": 33281, "epoch": 792} {"train_loss": -5.579665660858154, "global_step": 33282, "epoch": 792} {"train_loss": -5.434750556945801, "global_step": 33283, "epoch": 792} {"train_loss": -5.499465465545654, "global_step": 33284, "epoch": 792} {"train_loss": -5.578882217407227, "global_step": 33285, "epoch": 792} {"train_loss": -5.37300968170166, "global_step": 33286, "epoch": 792} {"train_loss": -5.66588020324707, "global_step": 33287, "epoch": 792} {"train_loss": -5.669689178466797, "global_step": 33288, "epoch": 792} {"train_loss": -5.431413173675537, "global_step": 33289, "epoch": 792} {"train_loss": -5.605889320373535, "global_step": 33290, "epoch": 792} {"train_loss": -5.432132720947266, "global_step": 33291, "epoch": 792} {"train_loss": -5.431779861450195, "global_step": 33292, "epoch": 792} {"train_loss": -5.477196216583252, "global_step": 33293, "epoch": 792} {"train_loss": -5.405606269836426, "global_step": 33294, "epoch": 792} {"train_loss": -5.532711505889893, "global_step": 33295, "epoch": 792} {"train_loss": -5.591605186462402, "global_step": 33296, "epoch": 792} {"train_loss": -5.581144332885742, "global_step": 33297, "epoch": 792} {"train_loss": -5.500770568847656, "global_step": 33298, "epoch": 792} {"train_loss": -5.543536186218262, "global_step": 33299, "epoch": 792} {"train_loss": -5.409087181091309, "global_step": 33300, "epoch": 792} {"train_loss": -5.613463401794434, "global_step": 33301, "epoch": 792} {"train_loss": -5.393001556396484, "global_step": 33302, "epoch": 792} {"train_loss": -5.53233528137207, "global_step": 33303, "epoch": 792} {"train_loss": -5.659970283508301, "global_step": 33304, "epoch": 792} {"train_loss": -5.500707558223179, "global_step": 33305, "epoch": 792, "val_loss": 74470.828125} {"train_loss": -5.578829765319824, "global_step": 33306, "epoch": 793} {"train_loss": -5.624905109405518, "global_step": 33307, "epoch": 793} {"train_loss": -5.52325439453125, "global_step": 33308, "epoch": 793} {"train_loss": -5.5333404541015625, "global_step": 33309, "epoch": 793} {"train_loss": -5.456413269042969, "global_step": 33310, "epoch": 793} {"train_loss": -5.545956611633301, "global_step": 33311, "epoch": 793} {"train_loss": -5.58261775970459, "global_step": 33312, "epoch": 793} {"train_loss": -5.467720985412598, "global_step": 33313, "epoch": 793} {"train_loss": -5.449574947357178, "global_step": 33314, "epoch": 793} {"train_loss": -5.436459541320801, "global_step": 33315, "epoch": 793} {"train_loss": -5.640133857727051, "global_step": 33316, "epoch": 793} {"train_loss": -5.462635517120361, "global_step": 33317, "epoch": 793} {"train_loss": -5.45066499710083, "global_step": 33318, "epoch": 793} {"train_loss": -5.550776481628418, "global_step": 33319, "epoch": 793} {"train_loss": -5.570908546447754, "global_step": 33320, "epoch": 793} {"train_loss": -5.582572937011719, "global_step": 33321, "epoch": 793} {"train_loss": -5.412432670593262, "global_step": 33322, "epoch": 793} {"train_loss": -5.592104911804199, "global_step": 33323, "epoch": 793} {"train_loss": -5.613659858703613, "global_step": 33324, "epoch": 793} {"train_loss": -5.4405951499938965, "global_step": 33325, "epoch": 793} {"train_loss": -5.546385765075684, "global_step": 33326, "epoch": 793} {"train_loss": -5.519347667694092, "global_step": 33327, "epoch": 793} {"train_loss": -5.54530668258667, "global_step": 33328, "epoch": 793} {"train_loss": -5.560288429260254, "global_step": 33329, "epoch": 793} {"train_loss": -5.463163375854492, "global_step": 33330, "epoch": 793} {"train_loss": -5.473379135131836, "global_step": 33331, "epoch": 793} {"train_loss": -5.586033821105957, "global_step": 33332, "epoch": 793} {"train_loss": -5.670668601989746, "global_step": 33333, "epoch": 793} {"train_loss": -5.4828362464904785, "global_step": 33334, "epoch": 793} {"train_loss": -5.560617923736572, "global_step": 33335, "epoch": 793} {"train_loss": -5.5388946533203125, "global_step": 33336, "epoch": 793} {"train_loss": -5.467167854309082, "global_step": 33337, "epoch": 793} {"train_loss": -5.475253582000732, "global_step": 33338, "epoch": 793} {"train_loss": -5.529664993286133, "global_step": 33339, "epoch": 793} {"train_loss": -5.57784366607666, "global_step": 33340, "epoch": 793} {"train_loss": -5.565479278564453, "global_step": 33341, "epoch": 793} {"train_loss": -5.5162529945373535, "global_step": 33342, "epoch": 793} {"train_loss": -5.555098533630371, "global_step": 33343, "epoch": 793} {"train_loss": -5.5420026779174805, "global_step": 33344, "epoch": 793} {"train_loss": -5.552907943725586, "global_step": 33345, "epoch": 793} {"train_loss": -5.526067733764648, "global_step": 33346, "epoch": 793} {"train_loss": -5.532481329781668, "global_step": 33347, "epoch": 793, "val_loss": 74590.8203125} {"train_loss": -5.608479976654053, "global_step": 33348, "epoch": 794} {"train_loss": -5.468780517578125, "global_step": 33349, "epoch": 794} {"train_loss": -5.514678955078125, "global_step": 33350, "epoch": 794} {"train_loss": -5.551421165466309, "global_step": 33351, "epoch": 794} {"train_loss": -5.609584808349609, "global_step": 33352, "epoch": 794} {"train_loss": -5.534235954284668, "global_step": 33353, "epoch": 794} {"train_loss": -5.523298740386963, "global_step": 33354, "epoch": 794} {"train_loss": -5.4104156494140625, "global_step": 33355, "epoch": 794} {"train_loss": -5.4884352684021, "global_step": 33356, "epoch": 794} {"train_loss": -5.3838653564453125, "global_step": 33357, "epoch": 794} {"train_loss": -5.513307571411133, "global_step": 33358, "epoch": 794} {"train_loss": -5.388457775115967, "global_step": 33359, "epoch": 794} {"train_loss": -5.483589172363281, "global_step": 33360, "epoch": 794} {"train_loss": -5.575131416320801, "global_step": 33361, "epoch": 794} {"train_loss": -5.474518775939941, "global_step": 33362, "epoch": 794} {"train_loss": -5.542767524719238, "global_step": 33363, "epoch": 794} {"train_loss": -5.481739521026611, "global_step": 33364, "epoch": 794} {"train_loss": -5.540103912353516, "global_step": 33365, "epoch": 794} {"train_loss": -5.484269142150879, "global_step": 33366, "epoch": 794} {"train_loss": -5.486879348754883, "global_step": 33367, "epoch": 794} {"train_loss": -5.665826320648193, "global_step": 33368, "epoch": 794} {"train_loss": -5.493773460388184, "global_step": 33369, "epoch": 794} {"train_loss": -5.495670795440674, "global_step": 33370, "epoch": 794} {"train_loss": -5.534656524658203, "global_step": 33371, "epoch": 794} {"train_loss": -5.492771148681641, "global_step": 33372, "epoch": 794} {"train_loss": -5.552031993865967, "global_step": 33373, "epoch": 794} {"train_loss": -5.573890686035156, "global_step": 33374, "epoch": 794} {"train_loss": -5.496695518493652, "global_step": 33375, "epoch": 794} {"train_loss": -5.512772083282471, "global_step": 33376, "epoch": 794} {"train_loss": -5.520115852355957, "global_step": 33377, "epoch": 794} {"train_loss": -5.60328483581543, "global_step": 33378, "epoch": 794} {"train_loss": -5.529009819030762, "global_step": 33379, "epoch": 794} {"train_loss": -5.402873516082764, "global_step": 33380, "epoch": 794} {"train_loss": -5.533459186553955, "global_step": 33381, "epoch": 794} {"train_loss": -5.518888473510742, "global_step": 33382, "epoch": 794} {"train_loss": -5.500843048095703, "global_step": 33383, "epoch": 794} {"train_loss": -5.537496566772461, "global_step": 33384, "epoch": 794} {"train_loss": -5.474583625793457, "global_step": 33385, "epoch": 794} {"train_loss": -5.449189186096191, "global_step": 33386, "epoch": 794} {"train_loss": -5.55289363861084, "global_step": 33387, "epoch": 794} {"train_loss": -5.471662521362305, "global_step": 33388, "epoch": 794} {"train_loss": -5.508734964189076, "global_step": 33389, "epoch": 794, "val_loss": 74389.75} {"train_loss": -5.559415817260742, "global_step": 33390, "epoch": 795} {"train_loss": -5.462802410125732, "global_step": 33391, "epoch": 795} {"train_loss": -5.466008186340332, "global_step": 33392, "epoch": 795} {"train_loss": -5.612613201141357, "global_step": 33393, "epoch": 795} {"train_loss": -5.522324085235596, "global_step": 33394, "epoch": 795} {"train_loss": -5.60106086730957, "global_step": 33395, "epoch": 795} {"train_loss": -5.488361358642578, "global_step": 33396, "epoch": 795} {"train_loss": -5.573657989501953, "global_step": 33397, "epoch": 795} {"train_loss": -5.516571044921875, "global_step": 33398, "epoch": 795} {"train_loss": -5.591843605041504, "global_step": 33399, "epoch": 795} {"train_loss": -5.456478118896484, "global_step": 33400, "epoch": 795} {"train_loss": -5.4585089683532715, "global_step": 33401, "epoch": 795} {"train_loss": -5.505369663238525, "global_step": 33402, "epoch": 795} {"train_loss": -5.525345325469971, "global_step": 33403, "epoch": 795} {"train_loss": -5.544685363769531, "global_step": 33404, "epoch": 795} {"train_loss": -5.494749069213867, "global_step": 33405, "epoch": 795} {"train_loss": -5.522026538848877, "global_step": 33406, "epoch": 795} {"train_loss": -5.5549163818359375, "global_step": 33407, "epoch": 795} {"train_loss": -5.471456527709961, "global_step": 33408, "epoch": 795} {"train_loss": -5.645149230957031, "global_step": 33409, "epoch": 795} {"train_loss": -5.727612495422363, "global_step": 33410, "epoch": 795} {"train_loss": -5.43450403213501, "global_step": 33411, "epoch": 795} {"train_loss": -5.564994812011719, "global_step": 33412, "epoch": 795} {"train_loss": -5.6040472984313965, "global_step": 33413, "epoch": 795} {"train_loss": -5.397097587585449, "global_step": 33414, "epoch": 795} {"train_loss": -5.552100658416748, "global_step": 33415, "epoch": 795} {"train_loss": -5.552971839904785, "global_step": 33416, "epoch": 795} {"train_loss": -5.598137855529785, "global_step": 33417, "epoch": 795} {"train_loss": -5.619718551635742, "global_step": 33418, "epoch": 795} {"train_loss": -5.575950622558594, "global_step": 33419, "epoch": 795} {"train_loss": -5.5666961669921875, "global_step": 33420, "epoch": 795} {"train_loss": -5.480414867401123, "global_step": 33421, "epoch": 795} {"train_loss": -5.594515800476074, "global_step": 33422, "epoch": 795} {"train_loss": -5.571713924407959, "global_step": 33423, "epoch": 795} {"train_loss": -5.470032691955566, "global_step": 33424, "epoch": 795} {"train_loss": -5.588078498840332, "global_step": 33425, "epoch": 795} {"train_loss": -5.50056266784668, "global_step": 33426, "epoch": 795} {"train_loss": -5.407637596130371, "global_step": 33427, "epoch": 795} {"train_loss": -5.554263114929199, "global_step": 33428, "epoch": 795} {"train_loss": -5.46126127243042, "global_step": 33429, "epoch": 795} {"train_loss": -5.583228588104248, "global_step": 33430, "epoch": 795} {"train_loss": -5.534743842624483, "global_step": 33431, "epoch": 795, "val_loss": 74406.9921875} {"train_loss": -5.545683860778809, "global_step": 33432, "epoch": 796} {"train_loss": -5.49760627746582, "global_step": 33433, "epoch": 796} {"train_loss": -5.486207962036133, "global_step": 33434, "epoch": 796} {"train_loss": -5.616130828857422, "global_step": 33435, "epoch": 796} {"train_loss": -5.623724937438965, "global_step": 33436, "epoch": 796} {"train_loss": -5.522001266479492, "global_step": 33437, "epoch": 796} {"train_loss": -5.402790069580078, "global_step": 33438, "epoch": 796} {"train_loss": -5.581212043762207, "global_step": 33439, "epoch": 796} {"train_loss": -5.59958553314209, "global_step": 33440, "epoch": 796} {"train_loss": -5.551705360412598, "global_step": 33441, "epoch": 796} {"train_loss": -5.547422885894775, "global_step": 33442, "epoch": 796} {"train_loss": -5.4813079833984375, "global_step": 33443, "epoch": 796} {"train_loss": -5.662889003753662, "global_step": 33444, "epoch": 796} {"train_loss": -5.530854225158691, "global_step": 33445, "epoch": 796} {"train_loss": -5.673553943634033, "global_step": 33446, "epoch": 796} {"train_loss": -5.674542427062988, "global_step": 33447, "epoch": 796} {"train_loss": -5.543515205383301, "global_step": 33448, "epoch": 796} {"train_loss": -5.7116780281066895, "global_step": 33449, "epoch": 796} {"train_loss": -5.504777908325195, "global_step": 33450, "epoch": 796} {"train_loss": -5.489605903625488, "global_step": 33451, "epoch": 796} {"train_loss": -5.621453285217285, "global_step": 33452, "epoch": 796} {"train_loss": -5.6193084716796875, "global_step": 33453, "epoch": 796} {"train_loss": -5.402096748352051, "global_step": 33454, "epoch": 796} {"train_loss": -5.519474983215332, "global_step": 33455, "epoch": 796} {"train_loss": -5.528566360473633, "global_step": 33456, "epoch": 796} {"train_loss": -5.485568046569824, "global_step": 33457, "epoch": 796} {"train_loss": -5.571841716766357, "global_step": 33458, "epoch": 796} {"train_loss": -5.549291610717773, "global_step": 33459, "epoch": 796} {"train_loss": -5.66046142578125, "global_step": 33460, "epoch": 796} {"train_loss": -5.592187881469727, "global_step": 33461, "epoch": 796} {"train_loss": -5.501638889312744, "global_step": 33462, "epoch": 796} {"train_loss": -5.4792962074279785, "global_step": 33463, "epoch": 796} {"train_loss": -5.541478157043457, "global_step": 33464, "epoch": 796} {"train_loss": -5.312581539154053, "global_step": 33465, "epoch": 796} {"train_loss": -5.541739463806152, "global_step": 33466, "epoch": 796} {"train_loss": -5.565561294555664, "global_step": 33467, "epoch": 796} {"train_loss": -5.400088310241699, "global_step": 33468, "epoch": 796} {"train_loss": -5.479362487792969, "global_step": 33469, "epoch": 796} {"train_loss": -5.545385837554932, "global_step": 33470, "epoch": 796} {"train_loss": -5.428783416748047, "global_step": 33471, "epoch": 796} {"train_loss": -5.437796115875244, "global_step": 33472, "epoch": 796} {"train_loss": -5.539455924715314, "global_step": 33473, "epoch": 796, "val_loss": 74023.8515625} {"train_loss": -5.423207759857178, "global_step": 33474, "epoch": 797} {"train_loss": -5.593293190002441, "global_step": 33475, "epoch": 797} {"train_loss": -5.428301811218262, "global_step": 33476, "epoch": 797} {"train_loss": -5.529962539672852, "global_step": 33477, "epoch": 797} {"train_loss": -5.514731407165527, "global_step": 33478, "epoch": 797} {"train_loss": -5.604028701782227, "global_step": 33479, "epoch": 797} {"train_loss": -5.5445451736450195, "global_step": 33480, "epoch": 797} {"train_loss": -5.53509521484375, "global_step": 33481, "epoch": 797} {"train_loss": -5.649319648742676, "global_step": 33482, "epoch": 797} {"train_loss": -5.473668098449707, "global_step": 33483, "epoch": 797} {"train_loss": -5.549304485321045, "global_step": 33484, "epoch": 797} {"train_loss": -5.564080238342285, "global_step": 33485, "epoch": 797} {"train_loss": -5.595745086669922, "global_step": 33486, "epoch": 797} {"train_loss": -5.501831531524658, "global_step": 33487, "epoch": 797} {"train_loss": -5.568568229675293, "global_step": 33488, "epoch": 797} {"train_loss": -5.605940818786621, "global_step": 33489, "epoch": 797} {"train_loss": -5.508779048919678, "global_step": 33490, "epoch": 797} {"train_loss": -5.453638553619385, "global_step": 33491, "epoch": 797} {"train_loss": -5.550989151000977, "global_step": 33492, "epoch": 797} {"train_loss": -5.550164222717285, "global_step": 33493, "epoch": 797} {"train_loss": -5.628822326660156, "global_step": 33494, "epoch": 797} {"train_loss": -5.539816856384277, "global_step": 33495, "epoch": 797} {"train_loss": -5.509239196777344, "global_step": 33496, "epoch": 797} {"train_loss": -5.567363739013672, "global_step": 33497, "epoch": 797} {"train_loss": -5.509237289428711, "global_step": 33498, "epoch": 797} {"train_loss": -5.405219078063965, "global_step": 33499, "epoch": 797} {"train_loss": -5.642668724060059, "global_step": 33500, "epoch": 797} {"train_loss": -5.511806488037109, "global_step": 33501, "epoch": 797} {"train_loss": -5.46931791305542, "global_step": 33502, "epoch": 797} {"train_loss": -5.482478618621826, "global_step": 33503, "epoch": 797} {"train_loss": -5.379617691040039, "global_step": 33504, "epoch": 797} {"train_loss": -5.5189337730407715, "global_step": 33505, "epoch": 797} {"train_loss": -5.563462257385254, "global_step": 33506, "epoch": 797} {"train_loss": -5.454963684082031, "global_step": 33507, "epoch": 797} {"train_loss": -5.454315662384033, "global_step": 33508, "epoch": 797} {"train_loss": -5.632615566253662, "global_step": 33509, "epoch": 797} {"train_loss": -5.4241743087768555, "global_step": 33510, "epoch": 797} {"train_loss": -5.536382675170898, "global_step": 33511, "epoch": 797} {"train_loss": -5.5517096519470215, "global_step": 33512, "epoch": 797} {"train_loss": -5.483748435974121, "global_step": 33513, "epoch": 797} {"train_loss": -5.61580753326416, "global_step": 33514, "epoch": 797} {"train_loss": -5.5258716855730325, "global_step": 33515, "epoch": 797, "val_loss": 73903.984375} {"train_loss": -5.705260276794434, "global_step": 33516, "epoch": 798} {"train_loss": -5.527544021606445, "global_step": 33517, "epoch": 798} {"train_loss": -5.523853302001953, "global_step": 33518, "epoch": 798} {"train_loss": -5.520625114440918, "global_step": 33519, "epoch": 798} {"train_loss": -5.5336151123046875, "global_step": 33520, "epoch": 798} {"train_loss": -5.473201751708984, "global_step": 33521, "epoch": 798} {"train_loss": -5.479754447937012, "global_step": 33522, "epoch": 798} {"train_loss": -5.575058937072754, "global_step": 33523, "epoch": 798} {"train_loss": -5.581292152404785, "global_step": 33524, "epoch": 798} {"train_loss": -5.483720302581787, "global_step": 33525, "epoch": 798} {"train_loss": -5.544699668884277, "global_step": 33526, "epoch": 798} {"train_loss": -5.461860179901123, "global_step": 33527, "epoch": 798} {"train_loss": -5.602623462677002, "global_step": 33528, "epoch": 798} {"train_loss": -5.415787696838379, "global_step": 33529, "epoch": 798} {"train_loss": -5.521850109100342, "global_step": 33530, "epoch": 798} {"train_loss": -5.488629341125488, "global_step": 33531, "epoch": 798} {"train_loss": -5.601823806762695, "global_step": 33532, "epoch": 798} {"train_loss": -5.545154571533203, "global_step": 33533, "epoch": 798} {"train_loss": -5.5037031173706055, "global_step": 33534, "epoch": 798} {"train_loss": -5.634200096130371, "global_step": 33535, "epoch": 798} {"train_loss": -5.543006896972656, "global_step": 33536, "epoch": 798} {"train_loss": -5.519757270812988, "global_step": 33537, "epoch": 798} {"train_loss": -5.631455421447754, "global_step": 33538, "epoch": 798} {"train_loss": -5.500853061676025, "global_step": 33539, "epoch": 798} {"train_loss": -5.382177352905273, "global_step": 33540, "epoch": 798} {"train_loss": -5.587121963500977, "global_step": 33541, "epoch": 798} {"train_loss": -5.465165138244629, "global_step": 33542, "epoch": 798} {"train_loss": -5.432051658630371, "global_step": 33543, "epoch": 798} {"train_loss": -5.6436238288879395, "global_step": 33544, "epoch": 798} {"train_loss": -5.470049858093262, "global_step": 33545, "epoch": 798} {"train_loss": -5.7200093269348145, "global_step": 33546, "epoch": 798} {"train_loss": -5.551825523376465, "global_step": 33547, "epoch": 798} {"train_loss": -5.408628463745117, "global_step": 33548, "epoch": 798} {"train_loss": -5.508459568023682, "global_step": 33549, "epoch": 798} {"train_loss": -5.521500587463379, "global_step": 33550, "epoch": 798} {"train_loss": -5.434228897094727, "global_step": 33551, "epoch": 798} {"train_loss": -5.656703948974609, "global_step": 33552, "epoch": 798} {"train_loss": -5.6461100578308105, "global_step": 33553, "epoch": 798} {"train_loss": -5.404404640197754, "global_step": 33554, "epoch": 798} {"train_loss": -5.383274078369141, "global_step": 33555, "epoch": 798} {"train_loss": -5.45876407623291, "global_step": 33556, "epoch": 798} {"train_loss": -5.527607872372582, "global_step": 33557, "epoch": 798, "val_loss": 74338.15625} {"train_loss": -5.659962177276611, "global_step": 33558, "epoch": 799} {"train_loss": -5.646371841430664, "global_step": 33559, "epoch": 799} {"train_loss": -5.591597557067871, "global_step": 33560, "epoch": 799} {"train_loss": -5.610557556152344, "global_step": 33561, "epoch": 799} {"train_loss": -5.645247459411621, "global_step": 33562, "epoch": 799} {"train_loss": -5.602199077606201, "global_step": 33563, "epoch": 799} {"train_loss": -5.4256792068481445, "global_step": 33564, "epoch": 799} {"train_loss": -5.534571170806885, "global_step": 33565, "epoch": 799} {"train_loss": -5.5486345291137695, "global_step": 33566, "epoch": 799} {"train_loss": -5.471579551696777, "global_step": 33567, "epoch": 799} {"train_loss": -5.600564956665039, "global_step": 33568, "epoch": 799} {"train_loss": -5.443399429321289, "global_step": 33569, "epoch": 799} {"train_loss": -5.597496032714844, "global_step": 33570, "epoch": 799} {"train_loss": -5.304412841796875, "global_step": 33571, "epoch": 799} {"train_loss": -5.510873794555664, "global_step": 33572, "epoch": 799} {"train_loss": -5.500135898590088, "global_step": 33573, "epoch": 799} {"train_loss": -5.637984752655029, "global_step": 33574, "epoch": 799} {"train_loss": -5.4064741134643555, "global_step": 33575, "epoch": 799} {"train_loss": -5.513991355895996, "global_step": 33576, "epoch": 799} {"train_loss": -5.420579433441162, "global_step": 33577, "epoch": 799} {"train_loss": -5.464686870574951, "global_step": 33578, "epoch": 799} {"train_loss": -5.472017765045166, "global_step": 33579, "epoch": 799} {"train_loss": -5.477220058441162, "global_step": 33580, "epoch": 799} {"train_loss": -5.499024391174316, "global_step": 33581, "epoch": 799} {"train_loss": -5.667086601257324, "global_step": 33582, "epoch": 799} {"train_loss": -5.501348972320557, "global_step": 33583, "epoch": 799} {"train_loss": -5.449906349182129, "global_step": 33584, "epoch": 799} {"train_loss": -5.705585479736328, "global_step": 33585, "epoch": 799} {"train_loss": -5.319671154022217, "global_step": 33586, "epoch": 799} {"train_loss": -5.412815570831299, "global_step": 33587, "epoch": 799} {"train_loss": -5.547848224639893, "global_step": 33588, "epoch": 799} {"train_loss": -5.478595733642578, "global_step": 33589, "epoch": 799} {"train_loss": -5.632606506347656, "global_step": 33590, "epoch": 799} {"train_loss": -5.477621555328369, "global_step": 33591, "epoch": 799} {"train_loss": -5.455903053283691, "global_step": 33592, "epoch": 799} {"train_loss": -5.584565162658691, "global_step": 33593, "epoch": 799} {"train_loss": -5.525834083557129, "global_step": 33594, "epoch": 799} {"train_loss": -5.675392150878906, "global_step": 33595, "epoch": 799} {"train_loss": -5.4840826988220215, "global_step": 33596, "epoch": 799} {"train_loss": -5.596793174743652, "global_step": 33597, "epoch": 799} {"train_loss": -5.444974899291992, "global_step": 33598, "epoch": 799} {"train_loss": -5.522407157080514, "global_step": 33599, "epoch": 799, "val_loss": 74087.671875} {"train_loss": -5.577579498291016, "global_step": 33600, "epoch": 800} {"train_loss": -5.528055191040039, "global_step": 33601, "epoch": 800} {"train_loss": -5.5107831954956055, "global_step": 33602, "epoch": 800} {"train_loss": -5.583698749542236, "global_step": 33603, "epoch": 800} {"train_loss": -5.485830307006836, "global_step": 33604, "epoch": 800} {"train_loss": -5.57974910736084, "global_step": 33605, "epoch": 800} {"train_loss": -5.526885032653809, "global_step": 33606, "epoch": 800} {"train_loss": -5.533581733703613, "global_step": 33607, "epoch": 800} {"train_loss": -5.537508010864258, "global_step": 33608, "epoch": 800} {"train_loss": -5.672515869140625, "global_step": 33609, "epoch": 800} {"train_loss": -5.591071605682373, "global_step": 33610, "epoch": 800} {"train_loss": -5.541042327880859, "global_step": 33611, "epoch": 800} {"train_loss": -5.451967239379883, "global_step": 33612, "epoch": 800} {"train_loss": -5.575133323669434, "global_step": 33613, "epoch": 800} {"train_loss": -5.613468170166016, "global_step": 33614, "epoch": 800} {"train_loss": -5.55642032623291, "global_step": 33615, "epoch": 800} {"train_loss": -5.516589641571045, "global_step": 33616, "epoch": 800} {"train_loss": -5.547761917114258, "global_step": 33617, "epoch": 800} {"train_loss": -5.546872615814209, "global_step": 33618, "epoch": 800} {"train_loss": -5.615739822387695, "global_step": 33619, "epoch": 800} {"train_loss": -5.563748359680176, "global_step": 33620, "epoch": 800} {"train_loss": -5.4554853439331055, "global_step": 33621, "epoch": 800} {"train_loss": -5.413942337036133, "global_step": 33622, "epoch": 800} {"train_loss": -5.599928855895996, "global_step": 33623, "epoch": 800} {"train_loss": -5.566649913787842, "global_step": 33624, "epoch": 800} {"train_loss": -5.4535980224609375, "global_step": 33625, "epoch": 800} {"train_loss": -5.499227523803711, "global_step": 33626, "epoch": 800} {"train_loss": -5.400055408477783, "global_step": 33627, "epoch": 800} {"train_loss": -5.523216247558594, "global_step": 33628, "epoch": 800} {"train_loss": -5.486931800842285, "global_step": 33629, "epoch": 800} {"train_loss": -5.525605201721191, "global_step": 33630, "epoch": 800} {"train_loss": -5.440378665924072, "global_step": 33631, "epoch": 800} {"train_loss": -5.438623428344727, "global_step": 33632, "epoch": 800} {"train_loss": -5.561199188232422, "global_step": 33633, "epoch": 800} {"train_loss": -5.532936096191406, "global_step": 33634, "epoch": 800} {"train_loss": -5.622485637664795, "global_step": 33635, "epoch": 800} {"train_loss": -5.54016637802124, "global_step": 33636, "epoch": 800} {"train_loss": -5.483855724334717, "global_step": 33637, "epoch": 800} {"train_loss": -5.562538146972656, "global_step": 33638, "epoch": 800} {"train_loss": -5.40899658203125, "global_step": 33639, "epoch": 800} {"train_loss": -5.586789131164551, "global_step": 33640, "epoch": 800} {"train_loss": -5.5315940380096436, "global_step": 33641, "epoch": 800, "train/sim_max_reward_0": 0.39914074176164077, "train/sim_max_reward_1": 0.9529057032735998, "train/sim_max_reward_2": 0.9130287469540804, "train/sim_max_reward_3": 0.22959147419906994, "train/sim_max_reward_4": 0.38196400189394736, "train/sim_max_reward_5": 0.67209857872416, "test/sim_max_reward_4500000": 0.5723817995307211, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.4089662009235051, "test/sim_max_reward_4500003": 0.7340543717494448, "test/sim_max_reward_4500004": 0.10534905360748766, "test/sim_max_reward_4500005": 0.34025366689205644, "test/sim_max_reward_4500006": 0.0, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.9286371189591398, "test/sim_max_reward_4500010": 0.6514829980748861, "test/sim_max_reward_4500011": 0.15266967440669263, "test/sim_max_reward_4500012": 0.15704056245372222, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.7828706682335398, "test/sim_max_reward_4500015": 0.4008633108626181, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.887763437956823, "test/sim_max_reward_4500018": 0.4934084438138607, "test/sim_max_reward_4500019": 0.7754544831577566, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.14861511220147822, "test/sim_max_reward_4500022": 0.38514704287101187, "test/sim_max_reward_4500023": 0.7304086511993697, "test/sim_max_reward_4500024": 0.2027601342995821, "test/sim_max_reward_4500025": 0.8830983581652947, "test/sim_max_reward_4500026": 0.18561014477962098, "test/sim_max_reward_4500027": 0.4719921154214202, "test/sim_max_reward_4500028": 0.8293110988122215, "test/sim_max_reward_4500029": 0.10031789140555361, "test/sim_max_reward_4500030": 0.3143246644427496, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.43184656177221387, "test/sim_max_reward_4500033": 0.1904918760887403, "test/sim_max_reward_4500034": 0.4312694149802904, "test/sim_max_reward_4500035": 0.8636062868268036, "test/sim_max_reward_4500036": 1.0, "test/sim_max_reward_4500037": 0.17055508896129026, "test/sim_max_reward_4500038": 0.4329500827300068, "test/sim_max_reward_4500039": 0.3799584663400418, "test/sim_max_reward_4500040": 0.19906228408131738, "test/sim_max_reward_4500041": 0.954826828837401, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.9518545305981961, "test/sim_max_reward_4500044": 0.6094488463922925, "test/sim_max_reward_4500045": 0.17311035135101446, "test/sim_max_reward_4500046": 0.2277448822306457, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.7427941958549108, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5914548744677496, "test/mean_score": 0.388845690156808, "val_loss": 74399.546875} {"train_loss": -5.607050895690918, "global_step": 33642, "epoch": 801} {"train_loss": -5.546736240386963, "global_step": 33643, "epoch": 801} {"train_loss": -5.458517074584961, "global_step": 33644, "epoch": 801} {"train_loss": -5.432277202606201, "global_step": 33645, "epoch": 801} {"train_loss": -5.508753776550293, "global_step": 33646, "epoch": 801} {"train_loss": -5.574161529541016, "global_step": 33647, "epoch": 801} {"train_loss": -5.515115737915039, "global_step": 33648, "epoch": 801} {"train_loss": -5.587855339050293, "global_step": 33649, "epoch": 801} {"train_loss": -5.520162582397461, "global_step": 33650, "epoch": 801} {"train_loss": -5.593452453613281, "global_step": 33651, "epoch": 801} {"train_loss": -5.570805549621582, "global_step": 33652, "epoch": 801} {"train_loss": -5.441036224365234, "global_step": 33653, "epoch": 801} {"train_loss": -5.523520469665527, "global_step": 33654, "epoch": 801} {"train_loss": -5.632728576660156, "global_step": 33655, "epoch": 801} {"train_loss": -5.522601127624512, "global_step": 33656, "epoch": 801} {"train_loss": -5.509727478027344, "global_step": 33657, "epoch": 801} {"train_loss": -5.567253112792969, "global_step": 33658, "epoch": 801} {"train_loss": -5.452031135559082, "global_step": 33659, "epoch": 801} {"train_loss": -5.461755752563477, "global_step": 33660, "epoch": 801} {"train_loss": -5.583578109741211, "global_step": 33661, "epoch": 801} {"train_loss": -5.432435035705566, "global_step": 33662, "epoch": 801} {"train_loss": -5.396899223327637, "global_step": 33663, "epoch": 801} {"train_loss": -5.645135879516602, "global_step": 33664, "epoch": 801} {"train_loss": -5.498959541320801, "global_step": 33665, "epoch": 801} {"train_loss": -5.510361671447754, "global_step": 33666, "epoch": 801} {"train_loss": -5.448247909545898, "global_step": 33667, "epoch": 801} {"train_loss": -5.532346248626709, "global_step": 33668, "epoch": 801} {"train_loss": -5.502574920654297, "global_step": 33669, "epoch": 801} {"train_loss": -5.5202178955078125, "global_step": 33670, "epoch": 801} {"train_loss": -5.579906940460205, "global_step": 33671, "epoch": 801} {"train_loss": -5.508323669433594, "global_step": 33672, "epoch": 801} {"train_loss": -5.494880199432373, "global_step": 33673, "epoch": 801} {"train_loss": -5.5511322021484375, "global_step": 33674, "epoch": 801} {"train_loss": -5.4630842208862305, "global_step": 33675, "epoch": 801} {"train_loss": -5.455345153808594, "global_step": 33676, "epoch": 801} {"train_loss": -5.471828460693359, "global_step": 33677, "epoch": 801} {"train_loss": -5.481316566467285, "global_step": 33678, "epoch": 801} {"train_loss": -5.50581693649292, "global_step": 33679, "epoch": 801} {"train_loss": -5.534160614013672, "global_step": 33680, "epoch": 801} {"train_loss": -5.494996547698975, "global_step": 33681, "epoch": 801} {"train_loss": -5.64157247543335, "global_step": 33682, "epoch": 801} {"train_loss": -5.5191365877787275, "global_step": 33683, "epoch": 801, "val_loss": 74585.640625} {"train_loss": -5.500591278076172, "global_step": 33684, "epoch": 802} {"train_loss": -5.601443290710449, "global_step": 33685, "epoch": 802} {"train_loss": -5.44043493270874, "global_step": 33686, "epoch": 802} {"train_loss": -5.479986190795898, "global_step": 33687, "epoch": 802} {"train_loss": -5.456491470336914, "global_step": 33688, "epoch": 802} {"train_loss": -5.53339147567749, "global_step": 33689, "epoch": 802} {"train_loss": -5.4890522956848145, "global_step": 33690, "epoch": 802} {"train_loss": -5.5826544761657715, "global_step": 33691, "epoch": 802} {"train_loss": -5.487056732177734, "global_step": 33692, "epoch": 802} {"train_loss": -5.453188419342041, "global_step": 33693, "epoch": 802} {"train_loss": -5.511265277862549, "global_step": 33694, "epoch": 802} {"train_loss": -5.605755805969238, "global_step": 33695, "epoch": 802} {"train_loss": -5.547207832336426, "global_step": 33696, "epoch": 802} {"train_loss": -5.564761161804199, "global_step": 33697, "epoch": 802} {"train_loss": -5.629021644592285, "global_step": 33698, "epoch": 802} {"train_loss": -5.490572929382324, "global_step": 33699, "epoch": 802} {"train_loss": -5.4916863441467285, "global_step": 33700, "epoch": 802} {"train_loss": -5.418664932250977, "global_step": 33701, "epoch": 802} {"train_loss": -5.5822858810424805, "global_step": 33702, "epoch": 802} {"train_loss": -5.494960784912109, "global_step": 33703, "epoch": 802} {"train_loss": -5.524952411651611, "global_step": 33704, "epoch": 802} {"train_loss": -5.461623668670654, "global_step": 33705, "epoch": 802} {"train_loss": -5.514178276062012, "global_step": 33706, "epoch": 802} {"train_loss": -5.518681526184082, "global_step": 33707, "epoch": 802} {"train_loss": -5.562436103820801, "global_step": 33708, "epoch": 802} {"train_loss": -5.503725528717041, "global_step": 33709, "epoch": 802} {"train_loss": -5.478110313415527, "global_step": 33710, "epoch": 802} {"train_loss": -5.4751129150390625, "global_step": 33711, "epoch": 802} {"train_loss": -5.304286956787109, "global_step": 33712, "epoch": 802} {"train_loss": -5.610183238983154, "global_step": 33713, "epoch": 802} {"train_loss": -5.502143859863281, "global_step": 33714, "epoch": 802} {"train_loss": -5.592153549194336, "global_step": 33715, "epoch": 802} {"train_loss": -5.463628768920898, "global_step": 33716, "epoch": 802} {"train_loss": -5.553431510925293, "global_step": 33717, "epoch": 802} {"train_loss": -5.489467620849609, "global_step": 33718, "epoch": 802} {"train_loss": -5.559527397155762, "global_step": 33719, "epoch": 802} {"train_loss": -5.428033351898193, "global_step": 33720, "epoch": 802} {"train_loss": -5.432614803314209, "global_step": 33721, "epoch": 802} {"train_loss": -5.607186317443848, "global_step": 33722, "epoch": 802} {"train_loss": -5.269452095031738, "global_step": 33723, "epoch": 802} {"train_loss": -5.489896297454834, "global_step": 33724, "epoch": 802} {"train_loss": -5.506090913500104, "global_step": 33725, "epoch": 802, "val_loss": 74842.9375} {"train_loss": -5.441143989562988, "global_step": 33726, "epoch": 803} {"train_loss": -5.517618179321289, "global_step": 33727, "epoch": 803} {"train_loss": -5.511324882507324, "global_step": 33728, "epoch": 803} {"train_loss": -5.4661149978637695, "global_step": 33729, "epoch": 803} {"train_loss": -5.586936950683594, "global_step": 33730, "epoch": 803} {"train_loss": -5.645203590393066, "global_step": 33731, "epoch": 803} {"train_loss": -5.572407245635986, "global_step": 33732, "epoch": 803} {"train_loss": -5.529512882232666, "global_step": 33733, "epoch": 803} {"train_loss": -5.507638931274414, "global_step": 33734, "epoch": 803} {"train_loss": -5.539116382598877, "global_step": 33735, "epoch": 803} {"train_loss": -5.566473007202148, "global_step": 33736, "epoch": 803} {"train_loss": -5.584956169128418, "global_step": 33737, "epoch": 803} {"train_loss": -5.453360080718994, "global_step": 33738, "epoch": 803} {"train_loss": -5.49102783203125, "global_step": 33739, "epoch": 803} {"train_loss": -5.510061740875244, "global_step": 33740, "epoch": 803} {"train_loss": -5.519372463226318, "global_step": 33741, "epoch": 803} {"train_loss": -5.534880638122559, "global_step": 33742, "epoch": 803} {"train_loss": -5.55103874206543, "global_step": 33743, "epoch": 803} {"train_loss": -5.415592193603516, "global_step": 33744, "epoch": 803} {"train_loss": -5.398369789123535, "global_step": 33745, "epoch": 803} {"train_loss": -5.471585273742676, "global_step": 33746, "epoch": 803} {"train_loss": -5.5340423583984375, "global_step": 33747, "epoch": 803} {"train_loss": -5.476284027099609, "global_step": 33748, "epoch": 803} {"train_loss": -5.380270004272461, "global_step": 33749, "epoch": 803} {"train_loss": -5.50532341003418, "global_step": 33750, "epoch": 803} {"train_loss": -5.288450241088867, "global_step": 33751, "epoch": 803} {"train_loss": -5.606874465942383, "global_step": 33752, "epoch": 803} {"train_loss": -5.557729721069336, "global_step": 33753, "epoch": 803} {"train_loss": -5.442539691925049, "global_step": 33754, "epoch": 803} {"train_loss": -5.594387054443359, "global_step": 33755, "epoch": 803} {"train_loss": -5.453529357910156, "global_step": 33756, "epoch": 803} {"train_loss": -5.732246398925781, "global_step": 33757, "epoch": 803} {"train_loss": -5.586595058441162, "global_step": 33758, "epoch": 803} {"train_loss": -5.605800151824951, "global_step": 33759, "epoch": 803} {"train_loss": -5.5142436027526855, "global_step": 33760, "epoch": 803} {"train_loss": -5.443986892700195, "global_step": 33761, "epoch": 803} {"train_loss": -5.43858003616333, "global_step": 33762, "epoch": 803} {"train_loss": -5.463257789611816, "global_step": 33763, "epoch": 803} {"train_loss": -5.433681964874268, "global_step": 33764, "epoch": 803} {"train_loss": -5.44485330581665, "global_step": 33765, "epoch": 803} {"train_loss": -5.536050796508789, "global_step": 33766, "epoch": 803} {"train_loss": -5.511227619080317, "global_step": 33767, "epoch": 803, "val_loss": 74314.875} {"train_loss": -5.55645751953125, "global_step": 33768, "epoch": 804} {"train_loss": -5.4938249588012695, "global_step": 33769, "epoch": 804} {"train_loss": -5.562594890594482, "global_step": 33770, "epoch": 804} {"train_loss": -5.561838626861572, "global_step": 33771, "epoch": 804} {"train_loss": -5.569206237792969, "global_step": 33772, "epoch": 804} {"train_loss": -5.420501232147217, "global_step": 33773, "epoch": 804} {"train_loss": -5.537213325500488, "global_step": 33774, "epoch": 804} {"train_loss": -5.630624771118164, "global_step": 33775, "epoch": 804} {"train_loss": -5.655571937561035, "global_step": 33776, "epoch": 804} {"train_loss": -5.465653419494629, "global_step": 33777, "epoch": 804} {"train_loss": -5.468264579772949, "global_step": 33778, "epoch": 804} {"train_loss": -5.602292060852051, "global_step": 33779, "epoch": 804} {"train_loss": -5.552444934844971, "global_step": 33780, "epoch": 804} {"train_loss": -5.685547828674316, "global_step": 33781, "epoch": 804} {"train_loss": -5.607512474060059, "global_step": 33782, "epoch": 804} {"train_loss": -5.434532642364502, "global_step": 33783, "epoch": 804} {"train_loss": -5.567161560058594, "global_step": 33784, "epoch": 804} {"train_loss": -5.525757789611816, "global_step": 33785, "epoch": 804} {"train_loss": -5.522351264953613, "global_step": 33786, "epoch": 804} {"train_loss": -5.437444686889648, "global_step": 33787, "epoch": 804} {"train_loss": -5.632498741149902, "global_step": 33788, "epoch": 804} {"train_loss": -5.571510314941406, "global_step": 33789, "epoch": 804} {"train_loss": -5.590777397155762, "global_step": 33790, "epoch": 804} {"train_loss": -5.531176567077637, "global_step": 33791, "epoch": 804} {"train_loss": -5.5533905029296875, "global_step": 33792, "epoch": 804} {"train_loss": -5.541133880615234, "global_step": 33793, "epoch": 804} {"train_loss": -5.466759204864502, "global_step": 33794, "epoch": 804} {"train_loss": -5.597475051879883, "global_step": 33795, "epoch": 804} {"train_loss": -5.538093566894531, "global_step": 33796, "epoch": 804} {"train_loss": -5.581820011138916, "global_step": 33797, "epoch": 804} {"train_loss": -5.462408065795898, "global_step": 33798, "epoch": 804} {"train_loss": -5.608067512512207, "global_step": 33799, "epoch": 804} {"train_loss": -5.534392356872559, "global_step": 33800, "epoch": 804} {"train_loss": -5.595412254333496, "global_step": 33801, "epoch": 804} {"train_loss": -5.604684829711914, "global_step": 33802, "epoch": 804} {"train_loss": -5.608087539672852, "global_step": 33803, "epoch": 804} {"train_loss": -5.4271440505981445, "global_step": 33804, "epoch": 804} {"train_loss": -5.4871320724487305, "global_step": 33805, "epoch": 804} {"train_loss": -5.480932712554932, "global_step": 33806, "epoch": 804} {"train_loss": -5.599153995513916, "global_step": 33807, "epoch": 804} {"train_loss": -5.483397006988525, "global_step": 33808, "epoch": 804} {"train_loss": -5.54190917242141, "global_step": 33809, "epoch": 804, "val_loss": 74234.828125} {"train_loss": -5.5102128982543945, "global_step": 33810, "epoch": 805} {"train_loss": -5.365924835205078, "global_step": 33811, "epoch": 805} {"train_loss": -5.645256042480469, "global_step": 33812, "epoch": 805} {"train_loss": -5.522721290588379, "global_step": 33813, "epoch": 805} {"train_loss": -5.5800065994262695, "global_step": 33814, "epoch": 805} {"train_loss": -5.603832721710205, "global_step": 33815, "epoch": 805} {"train_loss": -5.478488922119141, "global_step": 33816, "epoch": 805} {"train_loss": -5.610648155212402, "global_step": 33817, "epoch": 805} {"train_loss": -5.56171178817749, "global_step": 33818, "epoch": 805} {"train_loss": -5.547916889190674, "global_step": 33819, "epoch": 805} {"train_loss": -5.596432209014893, "global_step": 33820, "epoch": 805} {"train_loss": -5.382963180541992, "global_step": 33821, "epoch": 805} {"train_loss": -5.53257942199707, "global_step": 33822, "epoch": 805} {"train_loss": -5.53217887878418, "global_step": 33823, "epoch": 805} {"train_loss": -5.540214538574219, "global_step": 33824, "epoch": 805} {"train_loss": -5.332923412322998, "global_step": 33825, "epoch": 805} {"train_loss": -5.597447395324707, "global_step": 33826, "epoch": 805} {"train_loss": -5.399158954620361, "global_step": 33827, "epoch": 805} {"train_loss": -5.498232841491699, "global_step": 33828, "epoch": 805} {"train_loss": -5.629134178161621, "global_step": 33829, "epoch": 805} {"train_loss": -5.572024345397949, "global_step": 33830, "epoch": 805} {"train_loss": -5.471304893493652, "global_step": 33831, "epoch": 805} {"train_loss": -5.483654022216797, "global_step": 33832, "epoch": 805} {"train_loss": -5.458588123321533, "global_step": 33833, "epoch": 805} {"train_loss": -5.49829626083374, "global_step": 33834, "epoch": 805} {"train_loss": -5.497862815856934, "global_step": 33835, "epoch": 805} {"train_loss": -5.4854536056518555, "global_step": 33836, "epoch": 805} {"train_loss": -5.457865238189697, "global_step": 33837, "epoch": 805} {"train_loss": -5.5570292472839355, "global_step": 33838, "epoch": 805} {"train_loss": -5.615556240081787, "global_step": 33839, "epoch": 805} {"train_loss": -5.517292499542236, "global_step": 33840, "epoch": 805} {"train_loss": -5.413601398468018, "global_step": 33841, "epoch": 805} {"train_loss": -5.468392372131348, "global_step": 33842, "epoch": 805} {"train_loss": -5.5116777420043945, "global_step": 33843, "epoch": 805} {"train_loss": -5.390738010406494, "global_step": 33844, "epoch": 805} {"train_loss": -5.592844009399414, "global_step": 33845, "epoch": 805} {"train_loss": -5.480224609375, "global_step": 33846, "epoch": 805} {"train_loss": -5.585775375366211, "global_step": 33847, "epoch": 805} {"train_loss": -5.481269836425781, "global_step": 33848, "epoch": 805} {"train_loss": -5.430267333984375, "global_step": 33849, "epoch": 805} {"train_loss": -5.4215545654296875, "global_step": 33850, "epoch": 805} {"train_loss": -5.50798899786813, "global_step": 33851, "epoch": 805, "val_loss": 74140.59375} {"train_loss": -5.475371360778809, "global_step": 33852, "epoch": 806} {"train_loss": -5.586695671081543, "global_step": 33853, "epoch": 806} {"train_loss": -5.476714134216309, "global_step": 33854, "epoch": 806} {"train_loss": -5.545598983764648, "global_step": 33855, "epoch": 806} {"train_loss": -5.531069755554199, "global_step": 33856, "epoch": 806} {"train_loss": -5.596811294555664, "global_step": 33857, "epoch": 806} {"train_loss": -5.514630317687988, "global_step": 33858, "epoch": 806} {"train_loss": -5.616382122039795, "global_step": 33859, "epoch": 806} {"train_loss": -5.539700508117676, "global_step": 33860, "epoch": 806} {"train_loss": -5.6482744216918945, "global_step": 33861, "epoch": 806} {"train_loss": -5.6141357421875, "global_step": 33862, "epoch": 806} {"train_loss": -5.605165958404541, "global_step": 33863, "epoch": 806} {"train_loss": -5.512291431427002, "global_step": 33864, "epoch": 806} {"train_loss": -5.571398735046387, "global_step": 33865, "epoch": 806} {"train_loss": -5.600350379943848, "global_step": 33866, "epoch": 806} {"train_loss": -5.5941057205200195, "global_step": 33867, "epoch": 806} {"train_loss": -5.448306083679199, "global_step": 33868, "epoch": 806} {"train_loss": -5.417089462280273, "global_step": 33869, "epoch": 806} {"train_loss": -5.497806549072266, "global_step": 33870, "epoch": 806} {"train_loss": -5.551717758178711, "global_step": 33871, "epoch": 806} {"train_loss": -5.55463171005249, "global_step": 33872, "epoch": 806} {"train_loss": -5.644902229309082, "global_step": 33873, "epoch": 806} {"train_loss": -5.558793544769287, "global_step": 33874, "epoch": 806} {"train_loss": -5.4291253089904785, "global_step": 33875, "epoch": 806} {"train_loss": -5.476502418518066, "global_step": 33876, "epoch": 806} {"train_loss": -5.639966011047363, "global_step": 33877, "epoch": 806} {"train_loss": -5.578269958496094, "global_step": 33878, "epoch": 806} {"train_loss": -5.436914920806885, "global_step": 33879, "epoch": 806} {"train_loss": -5.490843296051025, "global_step": 33880, "epoch": 806} {"train_loss": -5.645246505737305, "global_step": 33881, "epoch": 806} {"train_loss": -5.416631698608398, "global_step": 33882, "epoch": 806} {"train_loss": -5.4943437576293945, "global_step": 33883, "epoch": 806} {"train_loss": -5.486153602600098, "global_step": 33884, "epoch": 806} {"train_loss": -5.61437463760376, "global_step": 33885, "epoch": 806} {"train_loss": -5.565322399139404, "global_step": 33886, "epoch": 806} {"train_loss": -5.656412124633789, "global_step": 33887, "epoch": 806} {"train_loss": -5.565880298614502, "global_step": 33888, "epoch": 806} {"train_loss": -5.557272911071777, "global_step": 33889, "epoch": 806} {"train_loss": -5.382270812988281, "global_step": 33890, "epoch": 806} {"train_loss": -5.449035167694092, "global_step": 33891, "epoch": 806} {"train_loss": -5.488122940063477, "global_step": 33892, "epoch": 806} {"train_loss": -5.539257901055472, "global_step": 33893, "epoch": 806, "val_loss": 74819.75} {"train_loss": -5.493981838226318, "global_step": 33894, "epoch": 807} {"train_loss": -5.455864906311035, "global_step": 33895, "epoch": 807} {"train_loss": -5.484226226806641, "global_step": 33896, "epoch": 807} {"train_loss": -5.462279319763184, "global_step": 33897, "epoch": 807} {"train_loss": -5.425080299377441, "global_step": 33898, "epoch": 807} {"train_loss": -5.4270524978637695, "global_step": 33899, "epoch": 807} {"train_loss": -5.497883319854736, "global_step": 33900, "epoch": 807} {"train_loss": -5.493086814880371, "global_step": 33901, "epoch": 807} {"train_loss": -5.492340564727783, "global_step": 33902, "epoch": 807} {"train_loss": -5.478726863861084, "global_step": 33903, "epoch": 807} {"train_loss": -5.50759744644165, "global_step": 33904, "epoch": 807} {"train_loss": -5.396114349365234, "global_step": 33905, "epoch": 807} {"train_loss": -5.485644340515137, "global_step": 33906, "epoch": 807} {"train_loss": -5.34536600112915, "global_step": 33907, "epoch": 807} {"train_loss": -5.467161178588867, "global_step": 33908, "epoch": 807} {"train_loss": -5.451403617858887, "global_step": 33909, "epoch": 807} {"train_loss": -5.479633331298828, "global_step": 33910, "epoch": 807} {"train_loss": -5.466741561889648, "global_step": 33911, "epoch": 807} {"train_loss": -5.476779937744141, "global_step": 33912, "epoch": 807} {"train_loss": -5.435614585876465, "global_step": 33913, "epoch": 807} {"train_loss": -5.675431251525879, "global_step": 33914, "epoch": 807} {"train_loss": -5.513104438781738, "global_step": 33915, "epoch": 807} {"train_loss": -5.495594501495361, "global_step": 33916, "epoch": 807} {"train_loss": -5.586287975311279, "global_step": 33917, "epoch": 807} {"train_loss": -5.526289939880371, "global_step": 33918, "epoch": 807} {"train_loss": -5.543912887573242, "global_step": 33919, "epoch": 807} {"train_loss": -5.634687423706055, "global_step": 33920, "epoch": 807} {"train_loss": -5.588537216186523, "global_step": 33921, "epoch": 807} {"train_loss": -5.421579360961914, "global_step": 33922, "epoch": 807} {"train_loss": -5.520011901855469, "global_step": 33923, "epoch": 807} {"train_loss": -5.4467997550964355, "global_step": 33924, "epoch": 807} {"train_loss": -5.554336071014404, "global_step": 33925, "epoch": 807} {"train_loss": -5.617656707763672, "global_step": 33926, "epoch": 807} {"train_loss": -5.521228790283203, "global_step": 33927, "epoch": 807} {"train_loss": -5.475449562072754, "global_step": 33928, "epoch": 807} {"train_loss": -5.414332389831543, "global_step": 33929, "epoch": 807} {"train_loss": -5.47782039642334, "global_step": 33930, "epoch": 807} {"train_loss": -5.52267599105835, "global_step": 33931, "epoch": 807} {"train_loss": -5.604164123535156, "global_step": 33932, "epoch": 807} {"train_loss": -5.569457530975342, "global_step": 33933, "epoch": 807} {"train_loss": -5.591621398925781, "global_step": 33934, "epoch": 807} {"train_loss": -5.500614416031611, "global_step": 33935, "epoch": 807, "val_loss": 73955.9140625} {"train_loss": -5.54405403137207, "global_step": 33936, "epoch": 808} {"train_loss": -5.398453712463379, "global_step": 33937, "epoch": 808} {"train_loss": -5.655289649963379, "global_step": 33938, "epoch": 808} {"train_loss": -5.554384231567383, "global_step": 33939, "epoch": 808} {"train_loss": -5.590096950531006, "global_step": 33940, "epoch": 808} {"train_loss": -5.515575408935547, "global_step": 33941, "epoch": 808} {"train_loss": -5.593075752258301, "global_step": 33942, "epoch": 808} {"train_loss": -5.417666435241699, "global_step": 33943, "epoch": 808} {"train_loss": -5.528378486633301, "global_step": 33944, "epoch": 808} {"train_loss": -5.584963798522949, "global_step": 33945, "epoch": 808} {"train_loss": -5.514935493469238, "global_step": 33946, "epoch": 808} {"train_loss": -5.584632396697998, "global_step": 33947, "epoch": 808} {"train_loss": -5.549266338348389, "global_step": 33948, "epoch": 808} {"train_loss": -5.4775190353393555, "global_step": 33949, "epoch": 808} {"train_loss": -5.477779388427734, "global_step": 33950, "epoch": 808} {"train_loss": -5.539746284484863, "global_step": 33951, "epoch": 808} {"train_loss": -5.456327438354492, "global_step": 33952, "epoch": 808} {"train_loss": -5.519772529602051, "global_step": 33953, "epoch": 808} {"train_loss": -5.3825860023498535, "global_step": 33954, "epoch": 808} {"train_loss": -5.3719611167907715, "global_step": 33955, "epoch": 808} {"train_loss": -5.375842094421387, "global_step": 33956, "epoch": 808} {"train_loss": -5.447971343994141, "global_step": 33957, "epoch": 808} {"train_loss": -5.363364219665527, "global_step": 33958, "epoch": 808} {"train_loss": -5.431708812713623, "global_step": 33959, "epoch": 808} {"train_loss": -5.51209020614624, "global_step": 33960, "epoch": 808} {"train_loss": -5.595304489135742, "global_step": 33961, "epoch": 808} {"train_loss": -5.438022613525391, "global_step": 33962, "epoch": 808} {"train_loss": -5.5295305252075195, "global_step": 33963, "epoch": 808} {"train_loss": -5.506120204925537, "global_step": 33964, "epoch": 808} {"train_loss": -5.533754348754883, "global_step": 33965, "epoch": 808} {"train_loss": -5.492369174957275, "global_step": 33966, "epoch": 808} {"train_loss": -5.468264579772949, "global_step": 33967, "epoch": 808} {"train_loss": -5.578276634216309, "global_step": 33968, "epoch": 808} {"train_loss": -5.486901760101318, "global_step": 33969, "epoch": 808} {"train_loss": -5.60902214050293, "global_step": 33970, "epoch": 808} {"train_loss": -5.421563148498535, "global_step": 33971, "epoch": 808} {"train_loss": -5.601743698120117, "global_step": 33972, "epoch": 808} {"train_loss": -5.456076622009277, "global_step": 33973, "epoch": 808} {"train_loss": -5.591909885406494, "global_step": 33974, "epoch": 808} {"train_loss": -5.520003318786621, "global_step": 33975, "epoch": 808} {"train_loss": -5.646888256072998, "global_step": 33976, "epoch": 808} {"train_loss": -5.509439718155634, "global_step": 33977, "epoch": 808, "val_loss": 73773.234375} {"train_loss": -5.560962200164795, "global_step": 33978, "epoch": 809} {"train_loss": -5.617063522338867, "global_step": 33979, "epoch": 809} {"train_loss": -5.413661003112793, "global_step": 33980, "epoch": 809} {"train_loss": -5.40397834777832, "global_step": 33981, "epoch": 809} {"train_loss": -5.543332099914551, "global_step": 33982, "epoch": 809} {"train_loss": -5.34981632232666, "global_step": 33983, "epoch": 809} {"train_loss": -5.526618957519531, "global_step": 33984, "epoch": 809} {"train_loss": -5.528043746948242, "global_step": 33985, "epoch": 809} {"train_loss": -5.481661796569824, "global_step": 33986, "epoch": 809} {"train_loss": -5.543234348297119, "global_step": 33987, "epoch": 809} {"train_loss": -5.522362232208252, "global_step": 33988, "epoch": 809} {"train_loss": -5.5180439949035645, "global_step": 33989, "epoch": 809} {"train_loss": -5.552818298339844, "global_step": 33990, "epoch": 809} {"train_loss": -5.676477432250977, "global_step": 33991, "epoch": 809} {"train_loss": -5.4121012687683105, "global_step": 33992, "epoch": 809} {"train_loss": -5.598957061767578, "global_step": 33993, "epoch": 809} {"train_loss": -5.46401309967041, "global_step": 33994, "epoch": 809} {"train_loss": -5.43665075302124, "global_step": 33995, "epoch": 809} {"train_loss": -5.403185844421387, "global_step": 33996, "epoch": 809} {"train_loss": -5.4404754638671875, "global_step": 33997, "epoch": 809} {"train_loss": -5.52744197845459, "global_step": 33998, "epoch": 809} {"train_loss": -5.478717803955078, "global_step": 33999, "epoch": 809} {"train_loss": -5.4994072914123535, "global_step": 34000, "epoch": 809} {"train_loss": -5.418011665344238, "global_step": 34001, "epoch": 809} {"train_loss": -5.546592712402344, "global_step": 34002, "epoch": 809} {"train_loss": -5.32660436630249, "global_step": 34003, "epoch": 809} {"train_loss": -5.468863010406494, "global_step": 34004, "epoch": 809} {"train_loss": -5.5296549797058105, "global_step": 34005, "epoch": 809} {"train_loss": -5.539009094238281, "global_step": 34006, "epoch": 809} {"train_loss": -5.478356838226318, "global_step": 34007, "epoch": 809} {"train_loss": -5.487084865570068, "global_step": 34008, "epoch": 809} {"train_loss": -5.513007164001465, "global_step": 34009, "epoch": 809} {"train_loss": -5.520304203033447, "global_step": 34010, "epoch": 809} {"train_loss": -5.750142574310303, "global_step": 34011, "epoch": 809} {"train_loss": -5.467770576477051, "global_step": 34012, "epoch": 809} {"train_loss": -5.4406538009643555, "global_step": 34013, "epoch": 809} {"train_loss": -5.56417179107666, "global_step": 34014, "epoch": 809} {"train_loss": -5.48026180267334, "global_step": 34015, "epoch": 809} {"train_loss": -5.475046157836914, "global_step": 34016, "epoch": 809} {"train_loss": -5.678296089172363, "global_step": 34017, "epoch": 809} {"train_loss": -5.60417366027832, "global_step": 34018, "epoch": 809} {"train_loss": -5.509413775943575, "global_step": 34019, "epoch": 809, "val_loss": 74671.265625} {"train_loss": -5.489899158477783, "global_step": 34020, "epoch": 810} {"train_loss": -5.53480863571167, "global_step": 34021, "epoch": 810} {"train_loss": -5.687182426452637, "global_step": 34022, "epoch": 810} {"train_loss": -5.485772132873535, "global_step": 34023, "epoch": 810} {"train_loss": -5.3997802734375, "global_step": 34024, "epoch": 810} {"train_loss": -5.59253454208374, "global_step": 34025, "epoch": 810} {"train_loss": -5.535820007324219, "global_step": 34026, "epoch": 810} {"train_loss": -5.386259078979492, "global_step": 34027, "epoch": 810} {"train_loss": -5.538005352020264, "global_step": 34028, "epoch": 810} {"train_loss": -5.415803909301758, "global_step": 34029, "epoch": 810} {"train_loss": -5.46069860458374, "global_step": 34030, "epoch": 810} {"train_loss": -5.499003887176514, "global_step": 34031, "epoch": 810} {"train_loss": -5.591264724731445, "global_step": 34032, "epoch": 810} {"train_loss": -5.647312641143799, "global_step": 34033, "epoch": 810} {"train_loss": -5.526142120361328, "global_step": 34034, "epoch": 810} {"train_loss": -5.701183795928955, "global_step": 34035, "epoch": 810} {"train_loss": -5.558539390563965, "global_step": 34036, "epoch": 810} {"train_loss": -5.509026527404785, "global_step": 34037, "epoch": 810} {"train_loss": -5.492318630218506, "global_step": 34038, "epoch": 810} {"train_loss": -5.458059310913086, "global_step": 34039, "epoch": 810} {"train_loss": -5.492380142211914, "global_step": 34040, "epoch": 810} {"train_loss": -5.5283732414245605, "global_step": 34041, "epoch": 810} {"train_loss": -5.528642654418945, "global_step": 34042, "epoch": 810} {"train_loss": -5.433070182800293, "global_step": 34043, "epoch": 810} {"train_loss": -5.508779525756836, "global_step": 34044, "epoch": 810} {"train_loss": -5.576264381408691, "global_step": 34045, "epoch": 810} {"train_loss": -5.590921401977539, "global_step": 34046, "epoch": 810} {"train_loss": -5.534104347229004, "global_step": 34047, "epoch": 810} {"train_loss": -5.538028717041016, "global_step": 34048, "epoch": 810} {"train_loss": -5.588907718658447, "global_step": 34049, "epoch": 810} {"train_loss": -5.500644683837891, "global_step": 34050, "epoch": 810} {"train_loss": -5.586000442504883, "global_step": 34051, "epoch": 810} {"train_loss": -5.500115871429443, "global_step": 34052, "epoch": 810} {"train_loss": -5.447624206542969, "global_step": 34053, "epoch": 810} {"train_loss": -5.566972732543945, "global_step": 34054, "epoch": 810} {"train_loss": -5.42154598236084, "global_step": 34055, "epoch": 810} {"train_loss": -5.495458602905273, "global_step": 34056, "epoch": 810} {"train_loss": -5.490976333618164, "global_step": 34057, "epoch": 810} {"train_loss": -5.377038955688477, "global_step": 34058, "epoch": 810} {"train_loss": -5.582821846008301, "global_step": 34059, "epoch": 810} {"train_loss": -5.6187238693237305, "global_step": 34060, "epoch": 810} {"train_loss": -5.523199762616839, "global_step": 34061, "epoch": 810, "val_loss": 73989.7890625} {"train_loss": -5.562368392944336, "global_step": 34062, "epoch": 811} {"train_loss": -5.43344259262085, "global_step": 34063, "epoch": 811} {"train_loss": -5.500097274780273, "global_step": 34064, "epoch": 811} {"train_loss": -5.581252098083496, "global_step": 34065, "epoch": 811} {"train_loss": -5.536993980407715, "global_step": 34066, "epoch": 811} {"train_loss": -5.5757060050964355, "global_step": 34067, "epoch": 811} {"train_loss": -5.5141096115112305, "global_step": 34068, "epoch": 811} {"train_loss": -5.453216075897217, "global_step": 34069, "epoch": 811} {"train_loss": -5.415060520172119, "global_step": 34070, "epoch": 811} {"train_loss": -5.525601863861084, "global_step": 34071, "epoch": 811} {"train_loss": -5.446159839630127, "global_step": 34072, "epoch": 811} {"train_loss": -5.555085182189941, "global_step": 34073, "epoch": 811} {"train_loss": -5.602224349975586, "global_step": 34074, "epoch": 811} {"train_loss": -5.564038276672363, "global_step": 34075, "epoch": 811} {"train_loss": -5.547049522399902, "global_step": 34076, "epoch": 811} {"train_loss": -5.433055877685547, "global_step": 34077, "epoch": 811} {"train_loss": -5.473045349121094, "global_step": 34078, "epoch": 811} {"train_loss": -5.471526622772217, "global_step": 34079, "epoch": 811} {"train_loss": -5.568432807922363, "global_step": 34080, "epoch": 811} {"train_loss": -5.473640441894531, "global_step": 34081, "epoch": 811} {"train_loss": -5.5351433753967285, "global_step": 34082, "epoch": 811} {"train_loss": -5.544672012329102, "global_step": 34083, "epoch": 811} {"train_loss": -5.569727897644043, "global_step": 34084, "epoch": 811} {"train_loss": -5.60034704208374, "global_step": 34085, "epoch": 811} {"train_loss": -5.581296443939209, "global_step": 34086, "epoch": 811} {"train_loss": -5.631801128387451, "global_step": 34087, "epoch": 811} {"train_loss": -5.530025959014893, "global_step": 34088, "epoch": 811} {"train_loss": -5.444303035736084, "global_step": 34089, "epoch": 811} {"train_loss": -5.6020121574401855, "global_step": 34090, "epoch": 811} {"train_loss": -5.474444389343262, "global_step": 34091, "epoch": 811} {"train_loss": -5.461729049682617, "global_step": 34092, "epoch": 811} {"train_loss": -5.4693379402160645, "global_step": 34093, "epoch": 811} {"train_loss": -5.516956329345703, "global_step": 34094, "epoch": 811} {"train_loss": -5.572719097137451, "global_step": 34095, "epoch": 811} {"train_loss": -5.559959888458252, "global_step": 34096, "epoch": 811} {"train_loss": -5.478012561798096, "global_step": 34097, "epoch": 811} {"train_loss": -5.512219429016113, "global_step": 34098, "epoch": 811} {"train_loss": -5.557096004486084, "global_step": 34099, "epoch": 811} {"train_loss": -5.575122833251953, "global_step": 34100, "epoch": 811} {"train_loss": -5.587437629699707, "global_step": 34101, "epoch": 811} {"train_loss": -5.529566764831543, "global_step": 34102, "epoch": 811} {"train_loss": -5.524786052249727, "global_step": 34103, "epoch": 811, "val_loss": 73958.2890625} {"train_loss": -5.565621852874756, "global_step": 34104, "epoch": 812} {"train_loss": -5.443509101867676, "global_step": 34105, "epoch": 812} {"train_loss": -5.679640769958496, "global_step": 34106, "epoch": 812} {"train_loss": -5.605071544647217, "global_step": 34107, "epoch": 812} {"train_loss": -5.53745174407959, "global_step": 34108, "epoch": 812} {"train_loss": -5.467935562133789, "global_step": 34109, "epoch": 812} {"train_loss": -5.591654300689697, "global_step": 34110, "epoch": 812} {"train_loss": -5.5449113845825195, "global_step": 34111, "epoch": 812} {"train_loss": -5.492091655731201, "global_step": 34112, "epoch": 812} {"train_loss": -5.491601943969727, "global_step": 34113, "epoch": 812} {"train_loss": -5.655752182006836, "global_step": 34114, "epoch": 812} {"train_loss": -5.549496650695801, "global_step": 34115, "epoch": 812} {"train_loss": -5.443960189819336, "global_step": 34116, "epoch": 812} {"train_loss": -5.562579154968262, "global_step": 34117, "epoch": 812} {"train_loss": -5.655058860778809, "global_step": 34118, "epoch": 812} {"train_loss": -5.589456081390381, "global_step": 34119, "epoch": 812} {"train_loss": -5.623526573181152, "global_step": 34120, "epoch": 812} {"train_loss": -5.666048049926758, "global_step": 34121, "epoch": 812} {"train_loss": -5.374436378479004, "global_step": 34122, "epoch": 812} {"train_loss": -5.636560440063477, "global_step": 34123, "epoch": 812} {"train_loss": -5.56492805480957, "global_step": 34124, "epoch": 812} {"train_loss": -5.434454917907715, "global_step": 34125, "epoch": 812} {"train_loss": -5.600685119628906, "global_step": 34126, "epoch": 812} {"train_loss": -5.51878547668457, "global_step": 34127, "epoch": 812} {"train_loss": -5.381111145019531, "global_step": 34128, "epoch": 812} {"train_loss": -5.621026992797852, "global_step": 34129, "epoch": 812} {"train_loss": -5.490527629852295, "global_step": 34130, "epoch": 812} {"train_loss": -5.5649237632751465, "global_step": 34131, "epoch": 812} {"train_loss": -5.445502281188965, "global_step": 34132, "epoch": 812} {"train_loss": -5.595160007476807, "global_step": 34133, "epoch": 812} {"train_loss": -5.6074628829956055, "global_step": 34134, "epoch": 812} {"train_loss": -5.576315879821777, "global_step": 34135, "epoch": 812} {"train_loss": -5.437914848327637, "global_step": 34136, "epoch": 812} {"train_loss": -5.534278869628906, "global_step": 34137, "epoch": 812} {"train_loss": -5.694310188293457, "global_step": 34138, "epoch": 812} {"train_loss": -5.601881980895996, "global_step": 34139, "epoch": 812} {"train_loss": -5.513579368591309, "global_step": 34140, "epoch": 812} {"train_loss": -5.613631248474121, "global_step": 34141, "epoch": 812} {"train_loss": -5.5911407470703125, "global_step": 34142, "epoch": 812} {"train_loss": -5.621762275695801, "global_step": 34143, "epoch": 812} {"train_loss": -5.5409698486328125, "global_step": 34144, "epoch": 812} {"train_loss": -5.5536726997012185, "global_step": 34145, "epoch": 812, "val_loss": 74128.3125} {"train_loss": -5.613468170166016, "global_step": 34146, "epoch": 813} {"train_loss": -5.682924270629883, "global_step": 34147, "epoch": 813} {"train_loss": -5.575359344482422, "global_step": 34148, "epoch": 813} {"train_loss": -5.659792900085449, "global_step": 34149, "epoch": 813} {"train_loss": -5.477292537689209, "global_step": 34150, "epoch": 813} {"train_loss": -5.465950012207031, "global_step": 34151, "epoch": 813} {"train_loss": -5.630169868469238, "global_step": 34152, "epoch": 813} {"train_loss": -5.730144500732422, "global_step": 34153, "epoch": 813} {"train_loss": -5.653225421905518, "global_step": 34154, "epoch": 813} {"train_loss": -5.513311862945557, "global_step": 34155, "epoch": 813} {"train_loss": -5.497495651245117, "global_step": 34156, "epoch": 813} {"train_loss": -5.624382972717285, "global_step": 34157, "epoch": 813} {"train_loss": -5.545531272888184, "global_step": 34158, "epoch": 813} {"train_loss": -5.6142144203186035, "global_step": 34159, "epoch": 813} {"train_loss": -5.562714576721191, "global_step": 34160, "epoch": 813} {"train_loss": -5.39960241317749, "global_step": 34161, "epoch": 813} {"train_loss": -5.482888698577881, "global_step": 34162, "epoch": 813} {"train_loss": -5.479375839233398, "global_step": 34163, "epoch": 813} {"train_loss": -5.514626502990723, "global_step": 34164, "epoch": 813} {"train_loss": -5.52897834777832, "global_step": 34165, "epoch": 813} {"train_loss": -5.571051120758057, "global_step": 34166, "epoch": 813} {"train_loss": -5.604832649230957, "global_step": 34167, "epoch": 813} {"train_loss": -5.516232967376709, "global_step": 34168, "epoch": 813} {"train_loss": -5.516458034515381, "global_step": 34169, "epoch": 813} {"train_loss": -5.570136070251465, "global_step": 34170, "epoch": 813} {"train_loss": -5.528013229370117, "global_step": 34171, "epoch": 813} {"train_loss": -5.526307106018066, "global_step": 34172, "epoch": 813} {"train_loss": -5.443986892700195, "global_step": 34173, "epoch": 813} {"train_loss": -5.6040191650390625, "global_step": 34174, "epoch": 813} {"train_loss": -5.584263801574707, "global_step": 34175, "epoch": 813} {"train_loss": -5.550061225891113, "global_step": 34176, "epoch": 813} {"train_loss": -5.60988712310791, "global_step": 34177, "epoch": 813} {"train_loss": -5.531530380249023, "global_step": 34178, "epoch": 813} {"train_loss": -5.421285629272461, "global_step": 34179, "epoch": 813} {"train_loss": -5.660137176513672, "global_step": 34180, "epoch": 813} {"train_loss": -5.668341636657715, "global_step": 34181, "epoch": 813} {"train_loss": -5.514765739440918, "global_step": 34182, "epoch": 813} {"train_loss": -5.521050453186035, "global_step": 34183, "epoch": 813} {"train_loss": -5.545177459716797, "global_step": 34184, "epoch": 813} {"train_loss": -5.452335357666016, "global_step": 34185, "epoch": 813} {"train_loss": -5.544761657714844, "global_step": 34186, "epoch": 813} {"train_loss": -5.553782167888823, "global_step": 34187, "epoch": 813, "val_loss": 74244.328125} {"train_loss": -5.589406490325928, "global_step": 34188, "epoch": 814} {"train_loss": -5.518440246582031, "global_step": 34189, "epoch": 814} {"train_loss": -5.646698951721191, "global_step": 34190, "epoch": 814} {"train_loss": -5.494035720825195, "global_step": 34191, "epoch": 814} {"train_loss": -5.634847640991211, "global_step": 34192, "epoch": 814} {"train_loss": -5.476047039031982, "global_step": 34193, "epoch": 814} {"train_loss": -5.651793479919434, "global_step": 34194, "epoch": 814} {"train_loss": -5.422835350036621, "global_step": 34195, "epoch": 814} {"train_loss": -5.61150598526001, "global_step": 34196, "epoch": 814} {"train_loss": -5.43431282043457, "global_step": 34197, "epoch": 814} {"train_loss": -5.538419246673584, "global_step": 34198, "epoch": 814} {"train_loss": -5.588796615600586, "global_step": 34199, "epoch": 814} {"train_loss": -5.503618240356445, "global_step": 34200, "epoch": 814} {"train_loss": -5.553201675415039, "global_step": 34201, "epoch": 814} {"train_loss": -5.577184677124023, "global_step": 34202, "epoch": 814} {"train_loss": -5.4997663497924805, "global_step": 34203, "epoch": 814} {"train_loss": -5.665663242340088, "global_step": 34204, "epoch": 814} {"train_loss": -5.577401161193848, "global_step": 34205, "epoch": 814} {"train_loss": -5.5012946128845215, "global_step": 34206, "epoch": 814} {"train_loss": -5.498274803161621, "global_step": 34207, "epoch": 814} {"train_loss": -5.5738725662231445, "global_step": 34208, "epoch": 814} {"train_loss": -5.636815071105957, "global_step": 34209, "epoch": 814} {"train_loss": -5.503605842590332, "global_step": 34210, "epoch": 814} {"train_loss": -5.507698059082031, "global_step": 34211, "epoch": 814} {"train_loss": -5.585869789123535, "global_step": 34212, "epoch": 814} {"train_loss": -5.473247528076172, "global_step": 34213, "epoch": 814} {"train_loss": -5.483301162719727, "global_step": 34214, "epoch": 814} {"train_loss": -5.544391632080078, "global_step": 34215, "epoch": 814} {"train_loss": -5.487520217895508, "global_step": 34216, "epoch": 814} {"train_loss": -5.540046691894531, "global_step": 34217, "epoch": 814} {"train_loss": -5.617649078369141, "global_step": 34218, "epoch": 814} {"train_loss": -5.649008750915527, "global_step": 34219, "epoch": 814} {"train_loss": -5.516943454742432, "global_step": 34220, "epoch": 814} {"train_loss": -5.507323741912842, "global_step": 34221, "epoch": 814} {"train_loss": -5.637889862060547, "global_step": 34222, "epoch": 814} {"train_loss": -5.512393951416016, "global_step": 34223, "epoch": 814} {"train_loss": -5.541561603546143, "global_step": 34224, "epoch": 814} {"train_loss": -5.548022747039795, "global_step": 34225, "epoch": 814} {"train_loss": -5.569990634918213, "global_step": 34226, "epoch": 814} {"train_loss": -5.4766130447387695, "global_step": 34227, "epoch": 814} {"train_loss": -5.473301887512207, "global_step": 34228, "epoch": 814} {"train_loss": -5.543090525127592, "global_step": 34229, "epoch": 814, "val_loss": 74738.1953125} {"train_loss": -5.483625888824463, "global_step": 34230, "epoch": 815} {"train_loss": -5.619416236877441, "global_step": 34231, "epoch": 815} {"train_loss": -5.544620990753174, "global_step": 34232, "epoch": 815} {"train_loss": -5.4157395362854, "global_step": 34233, "epoch": 815} {"train_loss": -5.568721771240234, "global_step": 34234, "epoch": 815} {"train_loss": -5.522907257080078, "global_step": 34235, "epoch": 815} {"train_loss": -5.637877464294434, "global_step": 34236, "epoch": 815} {"train_loss": -5.42155647277832, "global_step": 34237, "epoch": 815} {"train_loss": -5.693014621734619, "global_step": 34238, "epoch": 815} {"train_loss": -5.673654556274414, "global_step": 34239, "epoch": 815} {"train_loss": -5.470512866973877, "global_step": 34240, "epoch": 815} {"train_loss": -5.550729751586914, "global_step": 34241, "epoch": 815} {"train_loss": -5.576415061950684, "global_step": 34242, "epoch": 815} {"train_loss": -5.589772701263428, "global_step": 34243, "epoch": 815} {"train_loss": -5.415012359619141, "global_step": 34244, "epoch": 815} {"train_loss": -5.589170455932617, "global_step": 34245, "epoch": 815} {"train_loss": -5.490825176239014, "global_step": 34246, "epoch": 815} {"train_loss": -5.541067123413086, "global_step": 34247, "epoch": 815} {"train_loss": -5.5596208572387695, "global_step": 34248, "epoch": 815} {"train_loss": -5.540550231933594, "global_step": 34249, "epoch": 815} {"train_loss": -5.491293907165527, "global_step": 34250, "epoch": 815} {"train_loss": -5.51181697845459, "global_step": 34251, "epoch": 815} {"train_loss": -5.580743789672852, "global_step": 34252, "epoch": 815} {"train_loss": -5.678103923797607, "global_step": 34253, "epoch": 815} {"train_loss": -5.438755035400391, "global_step": 34254, "epoch": 815} {"train_loss": -5.511308670043945, "global_step": 34255, "epoch": 815} {"train_loss": -5.621563911437988, "global_step": 34256, "epoch": 815} {"train_loss": -5.480047225952148, "global_step": 34257, "epoch": 815} {"train_loss": -5.39039421081543, "global_step": 34258, "epoch": 815} {"train_loss": -5.531779766082764, "global_step": 34259, "epoch": 815} {"train_loss": -5.627602577209473, "global_step": 34260, "epoch": 815} {"train_loss": -5.628313064575195, "global_step": 34261, "epoch": 815} {"train_loss": -5.461775302886963, "global_step": 34262, "epoch": 815} {"train_loss": -5.545124053955078, "global_step": 34263, "epoch": 815} {"train_loss": -5.490476131439209, "global_step": 34264, "epoch": 815} {"train_loss": -5.510464668273926, "global_step": 34265, "epoch": 815} {"train_loss": -5.37894868850708, "global_step": 34266, "epoch": 815} {"train_loss": -5.447533130645752, "global_step": 34267, "epoch": 815} {"train_loss": -5.514462947845459, "global_step": 34268, "epoch": 815} {"train_loss": -5.544253349304199, "global_step": 34269, "epoch": 815} {"train_loss": -5.500485420227051, "global_step": 34270, "epoch": 815} {"train_loss": -5.530519746598744, "global_step": 34271, "epoch": 815, "val_loss": 74733.2578125} {"train_loss": -5.461174964904785, "global_step": 34272, "epoch": 816} {"train_loss": -5.507608413696289, "global_step": 34273, "epoch": 816} {"train_loss": -5.515720367431641, "global_step": 34274, "epoch": 816} {"train_loss": -5.557635307312012, "global_step": 34275, "epoch": 816} {"train_loss": -5.494171619415283, "global_step": 34276, "epoch": 816} {"train_loss": -5.453696250915527, "global_step": 34277, "epoch": 816} {"train_loss": -5.462090015411377, "global_step": 34278, "epoch": 816} {"train_loss": -5.5818634033203125, "global_step": 34279, "epoch": 816} {"train_loss": -5.433771133422852, "global_step": 34280, "epoch": 816} {"train_loss": -5.485711097717285, "global_step": 34281, "epoch": 816} {"train_loss": -5.452103614807129, "global_step": 34282, "epoch": 816} {"train_loss": -5.41770076751709, "global_step": 34283, "epoch": 816} {"train_loss": -5.582719326019287, "global_step": 34284, "epoch": 816} {"train_loss": -5.4643425941467285, "global_step": 34285, "epoch": 816} {"train_loss": -5.42681884765625, "global_step": 34286, "epoch": 816} {"train_loss": -5.5537495613098145, "global_step": 34287, "epoch": 816} {"train_loss": -5.422581195831299, "global_step": 34288, "epoch": 816} {"train_loss": -5.536965847015381, "global_step": 34289, "epoch": 816} {"train_loss": -5.536886692047119, "global_step": 34290, "epoch": 816} {"train_loss": -5.52742862701416, "global_step": 34291, "epoch": 816} {"train_loss": -5.605420112609863, "global_step": 34292, "epoch": 816} {"train_loss": -5.465802192687988, "global_step": 34293, "epoch": 816} {"train_loss": -5.494024276733398, "global_step": 34294, "epoch": 816} {"train_loss": -5.494051933288574, "global_step": 34295, "epoch": 816} {"train_loss": -5.479989528656006, "global_step": 34296, "epoch": 816} {"train_loss": -5.618938446044922, "global_step": 34297, "epoch": 816} {"train_loss": -5.404516220092773, "global_step": 34298, "epoch": 816} {"train_loss": -5.519755840301514, "global_step": 34299, "epoch": 816} {"train_loss": -5.4402241706848145, "global_step": 34300, "epoch": 816} {"train_loss": -5.523325443267822, "global_step": 34301, "epoch": 816} {"train_loss": -5.4777302742004395, "global_step": 34302, "epoch": 816} {"train_loss": -5.481410980224609, "global_step": 34303, "epoch": 816} {"train_loss": -5.578665733337402, "global_step": 34304, "epoch": 816} {"train_loss": -5.33896541595459, "global_step": 34305, "epoch": 816} {"train_loss": -5.455817222595215, "global_step": 34306, "epoch": 816} {"train_loss": -5.3827314376831055, "global_step": 34307, "epoch": 816} {"train_loss": -5.641308784484863, "global_step": 34308, "epoch": 816} {"train_loss": -5.5007123947143555, "global_step": 34309, "epoch": 816} {"train_loss": -5.337928771972656, "global_step": 34310, "epoch": 816} {"train_loss": -5.4890313148498535, "global_step": 34311, "epoch": 816} {"train_loss": -5.48796272277832, "global_step": 34312, "epoch": 816} {"train_loss": -5.490692660922096, "global_step": 34313, "epoch": 816, "val_loss": 74992.9921875} {"train_loss": -5.4356842041015625, "global_step": 34314, "epoch": 817} {"train_loss": -5.525732040405273, "global_step": 34315, "epoch": 817} {"train_loss": -5.510456085205078, "global_step": 34316, "epoch": 817} {"train_loss": -5.463109970092773, "global_step": 34317, "epoch": 817} {"train_loss": -5.638284206390381, "global_step": 34318, "epoch": 817} {"train_loss": -5.515994548797607, "global_step": 34319, "epoch": 817} {"train_loss": -5.524079322814941, "global_step": 34320, "epoch": 817} {"train_loss": -5.415007591247559, "global_step": 34321, "epoch": 817} {"train_loss": -5.477393627166748, "global_step": 34322, "epoch": 817} {"train_loss": -5.627007484436035, "global_step": 34323, "epoch": 817} {"train_loss": -5.492058277130127, "global_step": 34324, "epoch": 817} {"train_loss": -5.435371398925781, "global_step": 34325, "epoch": 817} {"train_loss": -5.412098407745361, "global_step": 34326, "epoch": 817} {"train_loss": -5.517581939697266, "global_step": 34327, "epoch": 817} {"train_loss": -5.3657989501953125, "global_step": 34328, "epoch": 817} {"train_loss": -5.4242987632751465, "global_step": 34329, "epoch": 817} {"train_loss": -5.6555914878845215, "global_step": 34330, "epoch": 817} {"train_loss": -5.473746299743652, "global_step": 34331, "epoch": 817} {"train_loss": -5.546227931976318, "global_step": 34332, "epoch": 817} {"train_loss": -5.457626819610596, "global_step": 34333, "epoch": 817} {"train_loss": -5.573020935058594, "global_step": 34334, "epoch": 817} {"train_loss": -5.504944801330566, "global_step": 34335, "epoch": 817} {"train_loss": -5.483336925506592, "global_step": 34336, "epoch": 817} {"train_loss": -5.457150459289551, "global_step": 34337, "epoch": 817} {"train_loss": -5.435298919677734, "global_step": 34338, "epoch": 817} {"train_loss": -5.496771812438965, "global_step": 34339, "epoch": 817} {"train_loss": -5.475351810455322, "global_step": 34340, "epoch": 817} {"train_loss": -5.489886283874512, "global_step": 34341, "epoch": 817} {"train_loss": -5.4520463943481445, "global_step": 34342, "epoch": 817} {"train_loss": -5.556405067443848, "global_step": 34343, "epoch": 817} {"train_loss": -5.646880149841309, "global_step": 34344, "epoch": 817} {"train_loss": -5.472692012786865, "global_step": 34345, "epoch": 817} {"train_loss": -5.591989517211914, "global_step": 34346, "epoch": 817} {"train_loss": -5.4795122146606445, "global_step": 34347, "epoch": 817} {"train_loss": -5.544372081756592, "global_step": 34348, "epoch": 817} {"train_loss": -5.561977386474609, "global_step": 34349, "epoch": 817} {"train_loss": -5.677616119384766, "global_step": 34350, "epoch": 817} {"train_loss": -5.527883052825928, "global_step": 34351, "epoch": 817} {"train_loss": -5.644713401794434, "global_step": 34352, "epoch": 817} {"train_loss": -5.595676422119141, "global_step": 34353, "epoch": 817} {"train_loss": -5.60235595703125, "global_step": 34354, "epoch": 817} {"train_loss": -5.5191173780532115, "global_step": 34355, "epoch": 817, "val_loss": 74741.015625} {"train_loss": -5.435032844543457, "global_step": 34356, "epoch": 818} {"train_loss": -5.5250349044799805, "global_step": 34357, "epoch": 818} {"train_loss": -5.500767707824707, "global_step": 34358, "epoch": 818} {"train_loss": -5.480242729187012, "global_step": 34359, "epoch": 818} {"train_loss": -5.640540599822998, "global_step": 34360, "epoch": 818} {"train_loss": -5.468197822570801, "global_step": 34361, "epoch": 818} {"train_loss": -5.4097113609313965, "global_step": 34362, "epoch": 818} {"train_loss": -5.558144569396973, "global_step": 34363, "epoch": 818} {"train_loss": -5.651948928833008, "global_step": 34364, "epoch": 818} {"train_loss": -5.514166831970215, "global_step": 34365, "epoch": 818} {"train_loss": -5.680398941040039, "global_step": 34366, "epoch": 818} {"train_loss": -5.501229763031006, "global_step": 34367, "epoch": 818} {"train_loss": -5.5201592445373535, "global_step": 34368, "epoch": 818} {"train_loss": -5.505148887634277, "global_step": 34369, "epoch": 818} {"train_loss": -5.503570556640625, "global_step": 34370, "epoch": 818} {"train_loss": -5.540909767150879, "global_step": 34371, "epoch": 818} {"train_loss": -5.382335662841797, "global_step": 34372, "epoch": 818} {"train_loss": -5.431059837341309, "global_step": 34373, "epoch": 818} {"train_loss": -5.628164768218994, "global_step": 34374, "epoch": 818} {"train_loss": -5.54727840423584, "global_step": 34375, "epoch": 818} {"train_loss": -5.516364574432373, "global_step": 34376, "epoch": 818} {"train_loss": -5.479470252990723, "global_step": 34377, "epoch": 818} {"train_loss": -5.498517990112305, "global_step": 34378, "epoch": 818} {"train_loss": -5.559479236602783, "global_step": 34379, "epoch": 818} {"train_loss": -5.575281143188477, "global_step": 34380, "epoch": 818} {"train_loss": -5.5644426345825195, "global_step": 34381, "epoch": 818} {"train_loss": -5.408910274505615, "global_step": 34382, "epoch": 818} {"train_loss": -5.5040106773376465, "global_step": 34383, "epoch": 818} {"train_loss": -5.594966888427734, "global_step": 34384, "epoch": 818} {"train_loss": -5.4435715675354, "global_step": 34385, "epoch": 818} {"train_loss": -5.423548698425293, "global_step": 34386, "epoch": 818} {"train_loss": -5.445237159729004, "global_step": 34387, "epoch": 818} {"train_loss": -5.578869819641113, "global_step": 34388, "epoch": 818} {"train_loss": -5.546769142150879, "global_step": 34389, "epoch": 818} {"train_loss": -5.598367691040039, "global_step": 34390, "epoch": 818} {"train_loss": -5.295177459716797, "global_step": 34391, "epoch": 818} {"train_loss": -5.596513748168945, "global_step": 34392, "epoch": 818} {"train_loss": -5.492743492126465, "global_step": 34393, "epoch": 818} {"train_loss": -5.582235813140869, "global_step": 34394, "epoch": 818} {"train_loss": -5.4069061279296875, "global_step": 34395, "epoch": 818} {"train_loss": -5.580410957336426, "global_step": 34396, "epoch": 818} {"train_loss": -5.517181180772328, "global_step": 34397, "epoch": 818, "val_loss": 74294.53125} {"train_loss": -5.552793502807617, "global_step": 34398, "epoch": 819} {"train_loss": -5.551531791687012, "global_step": 34399, "epoch": 819} {"train_loss": -5.5431671142578125, "global_step": 34400, "epoch": 819} {"train_loss": -5.6158599853515625, "global_step": 34401, "epoch": 819} {"train_loss": -5.4336748123168945, "global_step": 34402, "epoch": 819} {"train_loss": -5.617712020874023, "global_step": 34403, "epoch": 819} {"train_loss": -5.519769191741943, "global_step": 34404, "epoch": 819} {"train_loss": -5.436375617980957, "global_step": 34405, "epoch": 819} {"train_loss": -5.488310813903809, "global_step": 34406, "epoch": 819} {"train_loss": -5.52251672744751, "global_step": 34407, "epoch": 819} {"train_loss": -5.41697883605957, "global_step": 34408, "epoch": 819} {"train_loss": -5.636507034301758, "global_step": 34409, "epoch": 819} {"train_loss": -5.475878715515137, "global_step": 34410, "epoch": 819} {"train_loss": -5.506713390350342, "global_step": 34411, "epoch": 819} {"train_loss": -5.583271503448486, "global_step": 34412, "epoch": 819} {"train_loss": -5.421811103820801, "global_step": 34413, "epoch": 819} {"train_loss": -5.569853782653809, "global_step": 34414, "epoch": 819} {"train_loss": -5.5081024169921875, "global_step": 34415, "epoch": 819} {"train_loss": -5.5744476318359375, "global_step": 34416, "epoch": 819} {"train_loss": -5.520869255065918, "global_step": 34417, "epoch": 819} {"train_loss": -5.479525566101074, "global_step": 34418, "epoch": 819} {"train_loss": -5.495936393737793, "global_step": 34419, "epoch": 819} {"train_loss": -5.554275989532471, "global_step": 34420, "epoch": 819} {"train_loss": -5.477590560913086, "global_step": 34421, "epoch": 819} {"train_loss": -5.651540756225586, "global_step": 34422, "epoch": 819} {"train_loss": -5.573766708374023, "global_step": 34423, "epoch": 819} {"train_loss": -5.587893486022949, "global_step": 34424, "epoch": 819} {"train_loss": -5.539003372192383, "global_step": 34425, "epoch": 819} {"train_loss": -5.605258464813232, "global_step": 34426, "epoch": 819} {"train_loss": -5.517831325531006, "global_step": 34427, "epoch": 819} {"train_loss": -5.410862922668457, "global_step": 34428, "epoch": 819} {"train_loss": -5.439122676849365, "global_step": 34429, "epoch": 819} {"train_loss": -5.593347549438477, "global_step": 34430, "epoch": 819} {"train_loss": -5.4764509201049805, "global_step": 34431, "epoch": 819} {"train_loss": -5.748902320861816, "global_step": 34432, "epoch": 819} {"train_loss": -5.5453667640686035, "global_step": 34433, "epoch": 819} {"train_loss": -5.566769599914551, "global_step": 34434, "epoch": 819} {"train_loss": -5.65805721282959, "global_step": 34435, "epoch": 819} {"train_loss": -5.575742721557617, "global_step": 34436, "epoch": 819} {"train_loss": -5.399241924285889, "global_step": 34437, "epoch": 819} {"train_loss": -5.343682289123535, "global_step": 34438, "epoch": 819} {"train_loss": -5.530156532923381, "global_step": 34439, "epoch": 819, "val_loss": 74463.859375} {"train_loss": -5.639327049255371, "global_step": 34440, "epoch": 820} {"train_loss": -5.5270233154296875, "global_step": 34441, "epoch": 820} {"train_loss": -5.522161483764648, "global_step": 34442, "epoch": 820} {"train_loss": -5.588129997253418, "global_step": 34443, "epoch": 820} {"train_loss": -5.531214237213135, "global_step": 34444, "epoch": 820} {"train_loss": -5.492430686950684, "global_step": 34445, "epoch": 820} {"train_loss": -5.392872333526611, "global_step": 34446, "epoch": 820} {"train_loss": -5.455984592437744, "global_step": 34447, "epoch": 820} {"train_loss": -5.479047775268555, "global_step": 34448, "epoch": 820} {"train_loss": -5.440996170043945, "global_step": 34449, "epoch": 820} {"train_loss": -5.683058738708496, "global_step": 34450, "epoch": 820} {"train_loss": -5.603748321533203, "global_step": 34451, "epoch": 820} {"train_loss": -5.556013584136963, "global_step": 34452, "epoch": 820} {"train_loss": -5.515091896057129, "global_step": 34453, "epoch": 820} {"train_loss": -5.560783386230469, "global_step": 34454, "epoch": 820} {"train_loss": -5.5927557945251465, "global_step": 34455, "epoch": 820} {"train_loss": -5.569762229919434, "global_step": 34456, "epoch": 820} {"train_loss": -5.612602233886719, "global_step": 34457, "epoch": 820} {"train_loss": -5.475958824157715, "global_step": 34458, "epoch": 820} {"train_loss": -5.574112892150879, "global_step": 34459, "epoch": 820} {"train_loss": -5.507882118225098, "global_step": 34460, "epoch": 820} {"train_loss": -5.570584297180176, "global_step": 34461, "epoch": 820} {"train_loss": -5.543895244598389, "global_step": 34462, "epoch": 820} {"train_loss": -5.569157600402832, "global_step": 34463, "epoch": 820} {"train_loss": -5.564383029937744, "global_step": 34464, "epoch": 820} {"train_loss": -5.373865127563477, "global_step": 34465, "epoch": 820} {"train_loss": -5.5694050788879395, "global_step": 34466, "epoch": 820} {"train_loss": -5.588476181030273, "global_step": 34467, "epoch": 820} {"train_loss": -5.451671123504639, "global_step": 34468, "epoch": 820} {"train_loss": -5.506674766540527, "global_step": 34469, "epoch": 820} {"train_loss": -5.457363605499268, "global_step": 34470, "epoch": 820} {"train_loss": -5.529939651489258, "global_step": 34471, "epoch": 820} {"train_loss": -5.630542755126953, "global_step": 34472, "epoch": 820} {"train_loss": -5.562705039978027, "global_step": 34473, "epoch": 820} {"train_loss": -5.457293510437012, "global_step": 34474, "epoch": 820} {"train_loss": -5.6691389083862305, "global_step": 34475, "epoch": 820} {"train_loss": -5.616464138031006, "global_step": 34476, "epoch": 820} {"train_loss": -5.342789173126221, "global_step": 34477, "epoch": 820} {"train_loss": -5.538502216339111, "global_step": 34478, "epoch": 820} {"train_loss": -5.512035369873047, "global_step": 34479, "epoch": 820} {"train_loss": -5.5115461349487305, "global_step": 34480, "epoch": 820} {"train_loss": -5.53491869426909, "global_step": 34481, "epoch": 820, "val_loss": 74455.765625} {"train_loss": -5.50404167175293, "global_step": 34482, "epoch": 821} {"train_loss": -5.4635910987854, "global_step": 34483, "epoch": 821} {"train_loss": -5.5482378005981445, "global_step": 34484, "epoch": 821} {"train_loss": -5.575765609741211, "global_step": 34485, "epoch": 821} {"train_loss": -5.571953773498535, "global_step": 34486, "epoch": 821} {"train_loss": -5.5190958976745605, "global_step": 34487, "epoch": 821} {"train_loss": -5.772058963775635, "global_step": 34488, "epoch": 821} {"train_loss": -5.564837455749512, "global_step": 34489, "epoch": 821} {"train_loss": -5.529788970947266, "global_step": 34490, "epoch": 821} {"train_loss": -5.473920822143555, "global_step": 34491, "epoch": 821} {"train_loss": -5.637803077697754, "global_step": 34492, "epoch": 821} {"train_loss": -5.56636905670166, "global_step": 34493, "epoch": 821} {"train_loss": -5.5563788414001465, "global_step": 34494, "epoch": 821} {"train_loss": -5.675356864929199, "global_step": 34495, "epoch": 821} {"train_loss": -5.4937639236450195, "global_step": 34496, "epoch": 821} {"train_loss": -5.496664524078369, "global_step": 34497, "epoch": 821} {"train_loss": -5.451083660125732, "global_step": 34498, "epoch": 821} {"train_loss": -5.429033279418945, "global_step": 34499, "epoch": 821} {"train_loss": -5.668844223022461, "global_step": 34500, "epoch": 821} {"train_loss": -5.483036518096924, "global_step": 34501, "epoch": 821} {"train_loss": -5.436673641204834, "global_step": 34502, "epoch": 821} {"train_loss": -5.548992156982422, "global_step": 34503, "epoch": 821} {"train_loss": -5.615243911743164, "global_step": 34504, "epoch": 821} {"train_loss": -5.537576675415039, "global_step": 34505, "epoch": 821} {"train_loss": -5.624288082122803, "global_step": 34506, "epoch": 821} {"train_loss": -5.6310272216796875, "global_step": 34507, "epoch": 821} {"train_loss": -5.592474937438965, "global_step": 34508, "epoch": 821} {"train_loss": -5.6173996925354, "global_step": 34509, "epoch": 821} {"train_loss": -5.565200328826904, "global_step": 34510, "epoch": 821} {"train_loss": -5.625651836395264, "global_step": 34511, "epoch": 821} {"train_loss": -5.605164527893066, "global_step": 34512, "epoch": 821} {"train_loss": -5.377970218658447, "global_step": 34513, "epoch": 821} {"train_loss": -5.537186145782471, "global_step": 34514, "epoch": 821} {"train_loss": -5.610204219818115, "global_step": 34515, "epoch": 821} {"train_loss": -5.573559761047363, "global_step": 34516, "epoch": 821} {"train_loss": -5.481531143188477, "global_step": 34517, "epoch": 821} {"train_loss": -5.626158714294434, "global_step": 34518, "epoch": 821} {"train_loss": -5.610039234161377, "global_step": 34519, "epoch": 821} {"train_loss": -5.524848461151123, "global_step": 34520, "epoch": 821} {"train_loss": -5.537724494934082, "global_step": 34521, "epoch": 821} {"train_loss": -5.612648963928223, "global_step": 34522, "epoch": 821} {"train_loss": -5.55906123206729, "global_step": 34523, "epoch": 821, "val_loss": 74092.6328125} {"train_loss": -5.481479644775391, "global_step": 34524, "epoch": 822} {"train_loss": -5.534701824188232, "global_step": 34525, "epoch": 822} {"train_loss": -5.4911065101623535, "global_step": 34526, "epoch": 822} {"train_loss": -5.6171064376831055, "global_step": 34527, "epoch": 822} {"train_loss": -5.552950859069824, "global_step": 34528, "epoch": 822} {"train_loss": -5.578238487243652, "global_step": 34529, "epoch": 822} {"train_loss": -5.567431449890137, "global_step": 34530, "epoch": 822} {"train_loss": -5.581350803375244, "global_step": 34531, "epoch": 822} {"train_loss": -5.526467323303223, "global_step": 34532, "epoch": 822} {"train_loss": -5.398202896118164, "global_step": 34533, "epoch": 822} {"train_loss": -5.570941925048828, "global_step": 34534, "epoch": 822} {"train_loss": -5.562007904052734, "global_step": 34535, "epoch": 822} {"train_loss": -5.524590015411377, "global_step": 34536, "epoch": 822} {"train_loss": -5.598759651184082, "global_step": 34537, "epoch": 822} {"train_loss": -5.558062553405762, "global_step": 34538, "epoch": 822} {"train_loss": -5.628894805908203, "global_step": 34539, "epoch": 822} {"train_loss": -5.5900187492370605, "global_step": 34540, "epoch": 822} {"train_loss": -5.600371360778809, "global_step": 34541, "epoch": 822} {"train_loss": -5.480895042419434, "global_step": 34542, "epoch": 822} {"train_loss": -5.619741439819336, "global_step": 34543, "epoch": 822} {"train_loss": -5.555440425872803, "global_step": 34544, "epoch": 822} {"train_loss": -5.51104736328125, "global_step": 34545, "epoch": 822} {"train_loss": -5.584196090698242, "global_step": 34546, "epoch": 822} {"train_loss": -5.502516746520996, "global_step": 34547, "epoch": 822} {"train_loss": -5.539772987365723, "global_step": 34548, "epoch": 822} {"train_loss": -5.5879364013671875, "global_step": 34549, "epoch": 822} {"train_loss": -5.623540878295898, "global_step": 34550, "epoch": 822} {"train_loss": -5.5764384269714355, "global_step": 34551, "epoch": 822} {"train_loss": -5.56155252456665, "global_step": 34552, "epoch": 822} {"train_loss": -5.556857109069824, "global_step": 34553, "epoch": 822} {"train_loss": -5.5223236083984375, "global_step": 34554, "epoch": 822} {"train_loss": -5.519000053405762, "global_step": 34555, "epoch": 822} {"train_loss": -5.618412017822266, "global_step": 34556, "epoch": 822} {"train_loss": -5.554169654846191, "global_step": 34557, "epoch": 822} {"train_loss": -5.5351433753967285, "global_step": 34558, "epoch": 822} {"train_loss": -5.373109340667725, "global_step": 34559, "epoch": 822} {"train_loss": -5.536890506744385, "global_step": 34560, "epoch": 822} {"train_loss": -5.494252681732178, "global_step": 34561, "epoch": 822} {"train_loss": -5.469033241271973, "global_step": 34562, "epoch": 822} {"train_loss": -5.50390625, "global_step": 34563, "epoch": 822} {"train_loss": -5.522022247314453, "global_step": 34564, "epoch": 822} {"train_loss": -5.5439713682447165, "global_step": 34565, "epoch": 822, "val_loss": 73774.09375} {"train_loss": -5.557215690612793, "global_step": 34566, "epoch": 823} {"train_loss": -5.545479774475098, "global_step": 34567, "epoch": 823} {"train_loss": -5.580475330352783, "global_step": 34568, "epoch": 823} {"train_loss": -5.489253997802734, "global_step": 34569, "epoch": 823} {"train_loss": -5.513274669647217, "global_step": 34570, "epoch": 823} {"train_loss": -5.667158603668213, "global_step": 34571, "epoch": 823} {"train_loss": -5.546107292175293, "global_step": 34572, "epoch": 823} {"train_loss": -5.517574310302734, "global_step": 34573, "epoch": 823} {"train_loss": -5.630239009857178, "global_step": 34574, "epoch": 823} {"train_loss": -5.57755708694458, "global_step": 34575, "epoch": 823} {"train_loss": -5.624772071838379, "global_step": 34576, "epoch": 823} {"train_loss": -5.582893371582031, "global_step": 34577, "epoch": 823} {"train_loss": -5.448964595794678, "global_step": 34578, "epoch": 823} {"train_loss": -5.545401096343994, "global_step": 34579, "epoch": 823} {"train_loss": -5.416357040405273, "global_step": 34580, "epoch": 823} {"train_loss": -5.592741012573242, "global_step": 34581, "epoch": 823} {"train_loss": -5.570429801940918, "global_step": 34582, "epoch": 823} {"train_loss": -5.491383075714111, "global_step": 34583, "epoch": 823} {"train_loss": -5.513106346130371, "global_step": 34584, "epoch": 823} {"train_loss": -5.458815574645996, "global_step": 34585, "epoch": 823} {"train_loss": -5.600822925567627, "global_step": 34586, "epoch": 823} {"train_loss": -5.6010541915893555, "global_step": 34587, "epoch": 823} {"train_loss": -5.555825710296631, "global_step": 34588, "epoch": 823} {"train_loss": -5.513861656188965, "global_step": 34589, "epoch": 823} {"train_loss": -5.595743179321289, "global_step": 34590, "epoch": 823} {"train_loss": -5.337815761566162, "global_step": 34591, "epoch": 823} {"train_loss": -5.597960472106934, "global_step": 34592, "epoch": 823} {"train_loss": -5.610749244689941, "global_step": 34593, "epoch": 823} {"train_loss": -5.537595748901367, "global_step": 34594, "epoch": 823} {"train_loss": -5.5863752365112305, "global_step": 34595, "epoch": 823} {"train_loss": -5.52518367767334, "global_step": 34596, "epoch": 823} {"train_loss": -5.546779632568359, "global_step": 34597, "epoch": 823} {"train_loss": -5.507791042327881, "global_step": 34598, "epoch": 823} {"train_loss": -5.497263431549072, "global_step": 34599, "epoch": 823} {"train_loss": -5.526040077209473, "global_step": 34600, "epoch": 823} {"train_loss": -5.648983001708984, "global_step": 34601, "epoch": 823} {"train_loss": -5.485351085662842, "global_step": 34602, "epoch": 823} {"train_loss": -5.540774345397949, "global_step": 34603, "epoch": 823} {"train_loss": -5.536823272705078, "global_step": 34604, "epoch": 823} {"train_loss": -5.551201343536377, "global_step": 34605, "epoch": 823} {"train_loss": -5.445607662200928, "global_step": 34606, "epoch": 823} {"train_loss": -5.540252390361967, "global_step": 34607, "epoch": 823, "val_loss": 74134.8046875} {"train_loss": -5.488405704498291, "global_step": 34608, "epoch": 824} {"train_loss": -5.572833061218262, "global_step": 34609, "epoch": 824} {"train_loss": -5.524382591247559, "global_step": 34610, "epoch": 824} {"train_loss": -5.491675853729248, "global_step": 34611, "epoch": 824} {"train_loss": -5.600616455078125, "global_step": 34612, "epoch": 824} {"train_loss": -5.586865425109863, "global_step": 34613, "epoch": 824} {"train_loss": -5.626707077026367, "global_step": 34614, "epoch": 824} {"train_loss": -5.53016471862793, "global_step": 34615, "epoch": 824} {"train_loss": -5.625616550445557, "global_step": 34616, "epoch": 824} {"train_loss": -5.6307172775268555, "global_step": 34617, "epoch": 824} {"train_loss": -5.473587989807129, "global_step": 34618, "epoch": 824} {"train_loss": -5.662454605102539, "global_step": 34619, "epoch": 824} {"train_loss": -5.680437088012695, "global_step": 34620, "epoch": 824} {"train_loss": -5.549280166625977, "global_step": 34621, "epoch": 824} {"train_loss": -5.673043251037598, "global_step": 34622, "epoch": 824} {"train_loss": -5.694583892822266, "global_step": 34623, "epoch": 824} {"train_loss": -5.51597261428833, "global_step": 34624, "epoch": 824} {"train_loss": -5.623562812805176, "global_step": 34625, "epoch": 824} {"train_loss": -5.5279998779296875, "global_step": 34626, "epoch": 824} {"train_loss": -5.484570503234863, "global_step": 34627, "epoch": 824} {"train_loss": -5.538982391357422, "global_step": 34628, "epoch": 824} {"train_loss": -5.530795097351074, "global_step": 34629, "epoch": 824} {"train_loss": -5.481174945831299, "global_step": 34630, "epoch": 824} {"train_loss": -5.480541229248047, "global_step": 34631, "epoch": 824} {"train_loss": -5.592489242553711, "global_step": 34632, "epoch": 824} {"train_loss": -5.530861854553223, "global_step": 34633, "epoch": 824} {"train_loss": -5.541788578033447, "global_step": 34634, "epoch": 824} {"train_loss": -5.554913520812988, "global_step": 34635, "epoch": 824} {"train_loss": -5.611263275146484, "global_step": 34636, "epoch": 824} {"train_loss": -5.476014137268066, "global_step": 34637, "epoch": 824} {"train_loss": -5.508970737457275, "global_step": 34638, "epoch": 824} {"train_loss": -5.49052095413208, "global_step": 34639, "epoch": 824} {"train_loss": -5.52533483505249, "global_step": 34640, "epoch": 824} {"train_loss": -5.529152870178223, "global_step": 34641, "epoch": 824} {"train_loss": -5.607501983642578, "global_step": 34642, "epoch": 824} {"train_loss": -5.540867805480957, "global_step": 34643, "epoch": 824} {"train_loss": -5.685876846313477, "global_step": 34644, "epoch": 824} {"train_loss": -5.635313987731934, "global_step": 34645, "epoch": 824} {"train_loss": -5.521788597106934, "global_step": 34646, "epoch": 824} {"train_loss": -5.505524635314941, "global_step": 34647, "epoch": 824} {"train_loss": -5.665411949157715, "global_step": 34648, "epoch": 824} {"train_loss": -5.563365334556217, "global_step": 34649, "epoch": 824, "val_loss": 74553.0} {"train_loss": -5.552585601806641, "global_step": 34650, "epoch": 825} {"train_loss": -5.56019401550293, "global_step": 34651, "epoch": 825} {"train_loss": -5.660685062408447, "global_step": 34652, "epoch": 825} {"train_loss": -5.449270248413086, "global_step": 34653, "epoch": 825} {"train_loss": -5.586555480957031, "global_step": 34654, "epoch": 825} {"train_loss": -5.451471328735352, "global_step": 34655, "epoch": 825} {"train_loss": -5.518714904785156, "global_step": 34656, "epoch": 825} {"train_loss": -5.53508186340332, "global_step": 34657, "epoch": 825} {"train_loss": -5.5809454917907715, "global_step": 34658, "epoch": 825} {"train_loss": -5.520402908325195, "global_step": 34659, "epoch": 825} {"train_loss": -5.639533519744873, "global_step": 34660, "epoch": 825} {"train_loss": -5.580502033233643, "global_step": 34661, "epoch": 825} {"train_loss": -5.527987480163574, "global_step": 34662, "epoch": 825} {"train_loss": -5.583101272583008, "global_step": 34663, "epoch": 825} {"train_loss": -5.466405868530273, "global_step": 34664, "epoch": 825} {"train_loss": -5.587357044219971, "global_step": 34665, "epoch": 825} {"train_loss": -5.539336204528809, "global_step": 34666, "epoch": 825} {"train_loss": -5.503592491149902, "global_step": 34667, "epoch": 825} {"train_loss": -5.554813861846924, "global_step": 34668, "epoch": 825} {"train_loss": -5.724851131439209, "global_step": 34669, "epoch": 825} {"train_loss": -5.620477676391602, "global_step": 34670, "epoch": 825} {"train_loss": -5.512770652770996, "global_step": 34671, "epoch": 825} {"train_loss": -5.594295501708984, "global_step": 34672, "epoch": 825} {"train_loss": -5.5496320724487305, "global_step": 34673, "epoch": 825} {"train_loss": -5.476316928863525, "global_step": 34674, "epoch": 825} {"train_loss": -5.591095924377441, "global_step": 34675, "epoch": 825} {"train_loss": -5.5768890380859375, "global_step": 34676, "epoch": 825} {"train_loss": -5.524346828460693, "global_step": 34677, "epoch": 825} {"train_loss": -5.4218902587890625, "global_step": 34678, "epoch": 825} {"train_loss": -5.474242210388184, "global_step": 34679, "epoch": 825} {"train_loss": -5.479183673858643, "global_step": 34680, "epoch": 825} {"train_loss": -5.316254615783691, "global_step": 34681, "epoch": 825} {"train_loss": -5.7773003578186035, "global_step": 34682, "epoch": 825} {"train_loss": -5.51475715637207, "global_step": 34683, "epoch": 825} {"train_loss": -5.495124816894531, "global_step": 34684, "epoch": 825} {"train_loss": -5.563007354736328, "global_step": 34685, "epoch": 825} {"train_loss": -5.568446636199951, "global_step": 34686, "epoch": 825} {"train_loss": -5.43180513381958, "global_step": 34687, "epoch": 825} {"train_loss": -5.471458911895752, "global_step": 34688, "epoch": 825} {"train_loss": -5.6349382400512695, "global_step": 34689, "epoch": 825} {"train_loss": -5.527948379516602, "global_step": 34690, "epoch": 825} {"train_loss": -5.544323739551363, "global_step": 34691, "epoch": 825, "val_loss": 74584.515625} {"train_loss": -5.605431079864502, "global_step": 34692, "epoch": 826} {"train_loss": -5.633646011352539, "global_step": 34693, "epoch": 826} {"train_loss": -5.631101131439209, "global_step": 34694, "epoch": 826} {"train_loss": -5.471985816955566, "global_step": 34695, "epoch": 826} {"train_loss": -5.673946380615234, "global_step": 34696, "epoch": 826} {"train_loss": -5.452856063842773, "global_step": 34697, "epoch": 826} {"train_loss": -5.48239803314209, "global_step": 34698, "epoch": 826} {"train_loss": -5.561708927154541, "global_step": 34699, "epoch": 826} {"train_loss": -5.529447555541992, "global_step": 34700, "epoch": 826} {"train_loss": -5.506302833557129, "global_step": 34701, "epoch": 826} {"train_loss": -5.540771484375, "global_step": 34702, "epoch": 826} {"train_loss": -5.515199661254883, "global_step": 34703, "epoch": 826} {"train_loss": -5.547410011291504, "global_step": 34704, "epoch": 826} {"train_loss": -5.4878387451171875, "global_step": 34705, "epoch": 826} {"train_loss": -5.496166229248047, "global_step": 34706, "epoch": 826} {"train_loss": -5.552924156188965, "global_step": 34707, "epoch": 826} {"train_loss": -5.449495315551758, "global_step": 34708, "epoch": 826} {"train_loss": -5.52833366394043, "global_step": 34709, "epoch": 826} {"train_loss": -5.405142307281494, "global_step": 34710, "epoch": 826} {"train_loss": -5.579459190368652, "global_step": 34711, "epoch": 826} {"train_loss": -5.509515762329102, "global_step": 34712, "epoch": 826} {"train_loss": -5.469478607177734, "global_step": 34713, "epoch": 826} {"train_loss": -5.460371017456055, "global_step": 34714, "epoch": 826} {"train_loss": -5.621217727661133, "global_step": 34715, "epoch": 826} {"train_loss": -5.539035797119141, "global_step": 34716, "epoch": 826} {"train_loss": -5.637179374694824, "global_step": 34717, "epoch": 826} {"train_loss": -5.683827877044678, "global_step": 34718, "epoch": 826} {"train_loss": -5.526603698730469, "global_step": 34719, "epoch": 826} {"train_loss": -5.465440273284912, "global_step": 34720, "epoch": 826} {"train_loss": -5.474854469299316, "global_step": 34721, "epoch": 826} {"train_loss": -5.5340423583984375, "global_step": 34722, "epoch": 826} {"train_loss": -5.499523162841797, "global_step": 34723, "epoch": 826} {"train_loss": -5.334915637969971, "global_step": 34724, "epoch": 826} {"train_loss": -5.519702911376953, "global_step": 34725, "epoch": 826} {"train_loss": -5.560734748840332, "global_step": 34726, "epoch": 826} {"train_loss": -5.448352813720703, "global_step": 34727, "epoch": 826} {"train_loss": -5.503013610839844, "global_step": 34728, "epoch": 826} {"train_loss": -5.5588178634643555, "global_step": 34729, "epoch": 826} {"train_loss": -5.509635925292969, "global_step": 34730, "epoch": 826} {"train_loss": -5.355645179748535, "global_step": 34731, "epoch": 826} {"train_loss": -5.505288124084473, "global_step": 34732, "epoch": 826} {"train_loss": -5.519127448399861, "global_step": 34733, "epoch": 826, "val_loss": 74720.125} {"train_loss": -5.573521137237549, "global_step": 34734, "epoch": 827} {"train_loss": -5.535102367401123, "global_step": 34735, "epoch": 827} {"train_loss": -5.435482501983643, "global_step": 34736, "epoch": 827} {"train_loss": -5.624783039093018, "global_step": 34737, "epoch": 827} {"train_loss": -5.478199481964111, "global_step": 34738, "epoch": 827} {"train_loss": -5.546812057495117, "global_step": 34739, "epoch": 827} {"train_loss": -5.61335563659668, "global_step": 34740, "epoch": 827} {"train_loss": -5.54194450378418, "global_step": 34741, "epoch": 827} {"train_loss": -5.494514465332031, "global_step": 34742, "epoch": 827} {"train_loss": -5.524871826171875, "global_step": 34743, "epoch": 827} {"train_loss": -5.566725730895996, "global_step": 34744, "epoch": 827} {"train_loss": -5.443742752075195, "global_step": 34745, "epoch": 827} {"train_loss": -5.640020370483398, "global_step": 34746, "epoch": 827} {"train_loss": -5.531176567077637, "global_step": 34747, "epoch": 827} {"train_loss": -5.46807861328125, "global_step": 34748, "epoch": 827} {"train_loss": -5.497633934020996, "global_step": 34749, "epoch": 827} {"train_loss": -5.621596336364746, "global_step": 34750, "epoch": 827} {"train_loss": -5.600231170654297, "global_step": 34751, "epoch": 827} {"train_loss": -5.408775329589844, "global_step": 34752, "epoch": 827} {"train_loss": -5.5616350173950195, "global_step": 34753, "epoch": 827} {"train_loss": -5.590930938720703, "global_step": 34754, "epoch": 827} {"train_loss": -5.498529434204102, "global_step": 34755, "epoch": 827} {"train_loss": -5.501620769500732, "global_step": 34756, "epoch": 827} {"train_loss": -5.501445770263672, "global_step": 34757, "epoch": 827} {"train_loss": -5.5578932762146, "global_step": 34758, "epoch": 827} {"train_loss": -5.6438188552856445, "global_step": 34759, "epoch": 827} {"train_loss": -5.537936687469482, "global_step": 34760, "epoch": 827} {"train_loss": -5.453166961669922, "global_step": 34761, "epoch": 827} {"train_loss": -5.579957962036133, "global_step": 34762, "epoch": 827} {"train_loss": -5.5579423904418945, "global_step": 34763, "epoch": 827} {"train_loss": -5.641883850097656, "global_step": 34764, "epoch": 827} {"train_loss": -5.398014545440674, "global_step": 34765, "epoch": 827} {"train_loss": -5.563894271850586, "global_step": 34766, "epoch": 827} {"train_loss": -5.75028657913208, "global_step": 34767, "epoch": 827} {"train_loss": -5.548036575317383, "global_step": 34768, "epoch": 827} {"train_loss": -5.391351699829102, "global_step": 34769, "epoch": 827} {"train_loss": -5.457268714904785, "global_step": 34770, "epoch": 827} {"train_loss": -5.551288604736328, "global_step": 34771, "epoch": 827} {"train_loss": -5.5722222328186035, "global_step": 34772, "epoch": 827} {"train_loss": -5.60289192199707, "global_step": 34773, "epoch": 827} {"train_loss": -5.57688570022583, "global_step": 34774, "epoch": 827} {"train_loss": -5.542776527858916, "global_step": 34775, "epoch": 827, "val_loss": 74228.5078125} {"train_loss": -5.5952911376953125, "global_step": 34776, "epoch": 828} {"train_loss": -5.6506853103637695, "global_step": 34777, "epoch": 828} {"train_loss": -5.525538921356201, "global_step": 34778, "epoch": 828} {"train_loss": -5.457770347595215, "global_step": 34779, "epoch": 828} {"train_loss": -5.5972208976745605, "global_step": 34780, "epoch": 828} {"train_loss": -5.481603145599365, "global_step": 34781, "epoch": 828} {"train_loss": -5.678598403930664, "global_step": 34782, "epoch": 828} {"train_loss": -5.493535041809082, "global_step": 34783, "epoch": 828} {"train_loss": -5.59147310256958, "global_step": 34784, "epoch": 828} {"train_loss": -5.524569034576416, "global_step": 34785, "epoch": 828} {"train_loss": -5.665936470031738, "global_step": 34786, "epoch": 828} {"train_loss": -5.605112075805664, "global_step": 34787, "epoch": 828} {"train_loss": -5.601261138916016, "global_step": 34788, "epoch": 828} {"train_loss": -5.494906902313232, "global_step": 34789, "epoch": 828} {"train_loss": -5.581582546234131, "global_step": 34790, "epoch": 828} {"train_loss": -5.602091312408447, "global_step": 34791, "epoch": 828} {"train_loss": -5.327683925628662, "global_step": 34792, "epoch": 828} {"train_loss": -5.587676048278809, "global_step": 34793, "epoch": 828} {"train_loss": -5.570932388305664, "global_step": 34794, "epoch": 828} {"train_loss": -5.341798782348633, "global_step": 34795, "epoch": 828} {"train_loss": -5.551754951477051, "global_step": 34796, "epoch": 828} {"train_loss": -5.498044490814209, "global_step": 34797, "epoch": 828} {"train_loss": -5.545567035675049, "global_step": 34798, "epoch": 828} {"train_loss": -5.571732521057129, "global_step": 34799, "epoch": 828} {"train_loss": -5.512750625610352, "global_step": 34800, "epoch": 828} {"train_loss": -5.6036176681518555, "global_step": 34801, "epoch": 828} {"train_loss": -5.533408164978027, "global_step": 34802, "epoch": 828} {"train_loss": -5.615994453430176, "global_step": 34803, "epoch": 828} {"train_loss": -5.547747611999512, "global_step": 34804, "epoch": 828} {"train_loss": -5.546113967895508, "global_step": 34805, "epoch": 828} {"train_loss": -5.526734828948975, "global_step": 34806, "epoch": 828} {"train_loss": -5.497109413146973, "global_step": 34807, "epoch": 828} {"train_loss": -5.558718681335449, "global_step": 34808, "epoch": 828} {"train_loss": -5.444268703460693, "global_step": 34809, "epoch": 828} {"train_loss": -5.569396018981934, "global_step": 34810, "epoch": 828} {"train_loss": -5.500693321228027, "global_step": 34811, "epoch": 828} {"train_loss": -5.3996806144714355, "global_step": 34812, "epoch": 828} {"train_loss": -5.5851616859436035, "global_step": 34813, "epoch": 828} {"train_loss": -5.526019096374512, "global_step": 34814, "epoch": 828} {"train_loss": -5.569094181060791, "global_step": 34815, "epoch": 828} {"train_loss": -5.557834148406982, "global_step": 34816, "epoch": 828} {"train_loss": -5.543258757818313, "global_step": 34817, "epoch": 828, "val_loss": 74198.9609375} {"train_loss": -5.6535234451293945, "global_step": 34818, "epoch": 829} {"train_loss": -5.4901275634765625, "global_step": 34819, "epoch": 829} {"train_loss": -5.5741190910339355, "global_step": 34820, "epoch": 829} {"train_loss": -5.653594970703125, "global_step": 34821, "epoch": 829} {"train_loss": -5.492820739746094, "global_step": 34822, "epoch": 829} {"train_loss": -5.522026062011719, "global_step": 34823, "epoch": 829} {"train_loss": -5.5886688232421875, "global_step": 34824, "epoch": 829} {"train_loss": -5.497611045837402, "global_step": 34825, "epoch": 829} {"train_loss": -5.474680423736572, "global_step": 34826, "epoch": 829} {"train_loss": -5.561785697937012, "global_step": 34827, "epoch": 829} {"train_loss": -5.4590654373168945, "global_step": 34828, "epoch": 829} {"train_loss": -5.528504848480225, "global_step": 34829, "epoch": 829} {"train_loss": -5.615685939788818, "global_step": 34830, "epoch": 829} {"train_loss": -5.559649467468262, "global_step": 34831, "epoch": 829} {"train_loss": -5.482143402099609, "global_step": 34832, "epoch": 829} {"train_loss": -5.4206976890563965, "global_step": 34833, "epoch": 829} {"train_loss": -5.369801998138428, "global_step": 34834, "epoch": 829} {"train_loss": -5.474143981933594, "global_step": 34835, "epoch": 829} {"train_loss": -5.437551498413086, "global_step": 34836, "epoch": 829} {"train_loss": -5.664326190948486, "global_step": 34837, "epoch": 829} {"train_loss": -5.548880577087402, "global_step": 34838, "epoch": 829} {"train_loss": -5.625249862670898, "global_step": 34839, "epoch": 829} {"train_loss": -5.617340087890625, "global_step": 34840, "epoch": 829} {"train_loss": -5.537993431091309, "global_step": 34841, "epoch": 829} {"train_loss": -5.578266143798828, "global_step": 34842, "epoch": 829} {"train_loss": -5.583515167236328, "global_step": 34843, "epoch": 829} {"train_loss": -5.606264114379883, "global_step": 34844, "epoch": 829} {"train_loss": -5.5786261558532715, "global_step": 34845, "epoch": 829} {"train_loss": -5.426247596740723, "global_step": 34846, "epoch": 829} {"train_loss": -5.596159934997559, "global_step": 34847, "epoch": 829} {"train_loss": -5.598258972167969, "global_step": 34848, "epoch": 829} {"train_loss": -5.555132865905762, "global_step": 34849, "epoch": 829} {"train_loss": -5.535874366760254, "global_step": 34850, "epoch": 829} {"train_loss": -5.570343017578125, "global_step": 34851, "epoch": 829} {"train_loss": -5.516048908233643, "global_step": 34852, "epoch": 829} {"train_loss": -5.526909828186035, "global_step": 34853, "epoch": 829} {"train_loss": -5.529015064239502, "global_step": 34854, "epoch": 829} {"train_loss": -5.508667945861816, "global_step": 34855, "epoch": 829} {"train_loss": -5.497504711151123, "global_step": 34856, "epoch": 829} {"train_loss": -5.70944881439209, "global_step": 34857, "epoch": 829} {"train_loss": -5.504312515258789, "global_step": 34858, "epoch": 829} {"train_loss": -5.544044698987689, "global_step": 34859, "epoch": 829, "val_loss": 74505.953125} {"train_loss": -5.674101829528809, "global_step": 34860, "epoch": 830} {"train_loss": -5.542825698852539, "global_step": 34861, "epoch": 830} {"train_loss": -5.601592063903809, "global_step": 34862, "epoch": 830} {"train_loss": -5.537870407104492, "global_step": 34863, "epoch": 830} {"train_loss": -5.538068771362305, "global_step": 34864, "epoch": 830} {"train_loss": -5.665618419647217, "global_step": 34865, "epoch": 830} {"train_loss": -5.608108043670654, "global_step": 34866, "epoch": 830} {"train_loss": -5.559213161468506, "global_step": 34867, "epoch": 830} {"train_loss": -5.478967666625977, "global_step": 34868, "epoch": 830} {"train_loss": -5.598196029663086, "global_step": 34869, "epoch": 830} {"train_loss": -5.6275529861450195, "global_step": 34870, "epoch": 830} {"train_loss": -5.633378982543945, "global_step": 34871, "epoch": 830} {"train_loss": -5.622915267944336, "global_step": 34872, "epoch": 830} {"train_loss": -5.5381574630737305, "global_step": 34873, "epoch": 830} {"train_loss": -5.581742286682129, "global_step": 34874, "epoch": 830} {"train_loss": -5.574078559875488, "global_step": 34875, "epoch": 830} {"train_loss": -5.503095626831055, "global_step": 34876, "epoch": 830} {"train_loss": -5.551587104797363, "global_step": 34877, "epoch": 830} {"train_loss": -5.493646621704102, "global_step": 34878, "epoch": 830} {"train_loss": -5.530674934387207, "global_step": 34879, "epoch": 830} {"train_loss": -5.492923736572266, "global_step": 34880, "epoch": 830} {"train_loss": -5.464042663574219, "global_step": 34881, "epoch": 830} {"train_loss": -5.4808502197265625, "global_step": 34882, "epoch": 830} {"train_loss": -5.574329376220703, "global_step": 34883, "epoch": 830} {"train_loss": -5.599694728851318, "global_step": 34884, "epoch": 830} {"train_loss": -5.594315528869629, "global_step": 34885, "epoch": 830} {"train_loss": -5.526839733123779, "global_step": 34886, "epoch": 830} {"train_loss": -5.467473030090332, "global_step": 34887, "epoch": 830} {"train_loss": -5.492279052734375, "global_step": 34888, "epoch": 830} {"train_loss": -5.578161239624023, "global_step": 34889, "epoch": 830} {"train_loss": -5.656766414642334, "global_step": 34890, "epoch": 830} {"train_loss": -5.545597076416016, "global_step": 34891, "epoch": 830} {"train_loss": -5.541261672973633, "global_step": 34892, "epoch": 830} {"train_loss": -5.660428047180176, "global_step": 34893, "epoch": 830} {"train_loss": -5.583402633666992, "global_step": 34894, "epoch": 830} {"train_loss": -5.508090019226074, "global_step": 34895, "epoch": 830} {"train_loss": -5.589608192443848, "global_step": 34896, "epoch": 830} {"train_loss": -5.618152618408203, "global_step": 34897, "epoch": 830} {"train_loss": -5.5475382804870605, "global_step": 34898, "epoch": 830} {"train_loss": -5.50441837310791, "global_step": 34899, "epoch": 830} {"train_loss": -5.581883430480957, "global_step": 34900, "epoch": 830} {"train_loss": -5.564212640126546, "global_step": 34901, "epoch": 830, "val_loss": 74059.8125} {"train_loss": -5.549372673034668, "global_step": 34902, "epoch": 831} {"train_loss": -5.5235395431518555, "global_step": 34903, "epoch": 831} {"train_loss": -5.626776218414307, "global_step": 34904, "epoch": 831} {"train_loss": -5.52298641204834, "global_step": 34905, "epoch": 831} {"train_loss": -5.56611442565918, "global_step": 34906, "epoch": 831} {"train_loss": -5.654793739318848, "global_step": 34907, "epoch": 831} {"train_loss": -5.511486530303955, "global_step": 34908, "epoch": 831} {"train_loss": -5.339923858642578, "global_step": 34909, "epoch": 831} {"train_loss": -5.600983619689941, "global_step": 34910, "epoch": 831} {"train_loss": -5.4469194412231445, "global_step": 34911, "epoch": 831} {"train_loss": -5.482145309448242, "global_step": 34912, "epoch": 831} {"train_loss": -5.493730068206787, "global_step": 34913, "epoch": 831} {"train_loss": -5.674186706542969, "global_step": 34914, "epoch": 831} {"train_loss": -5.546671390533447, "global_step": 34915, "epoch": 831} {"train_loss": -5.4742431640625, "global_step": 34916, "epoch": 831} {"train_loss": -5.564403057098389, "global_step": 34917, "epoch": 831} {"train_loss": -5.607281684875488, "global_step": 34918, "epoch": 831} {"train_loss": -5.53606653213501, "global_step": 34919, "epoch": 831} {"train_loss": -5.598508834838867, "global_step": 34920, "epoch": 831} {"train_loss": -5.528271198272705, "global_step": 34921, "epoch": 831} {"train_loss": -5.525975227355957, "global_step": 34922, "epoch": 831} {"train_loss": -5.498915672302246, "global_step": 34923, "epoch": 831} {"train_loss": -5.554081439971924, "global_step": 34924, "epoch": 831} {"train_loss": -5.638009548187256, "global_step": 34925, "epoch": 831} {"train_loss": -5.470809459686279, "global_step": 34926, "epoch": 831} {"train_loss": -5.655879974365234, "global_step": 34927, "epoch": 831} {"train_loss": -5.498697757720947, "global_step": 34928, "epoch": 831} {"train_loss": -5.513152599334717, "global_step": 34929, "epoch": 831} {"train_loss": -5.526471138000488, "global_step": 34930, "epoch": 831} {"train_loss": -5.528360366821289, "global_step": 34931, "epoch": 831} {"train_loss": -5.565936088562012, "global_step": 34932, "epoch": 831} {"train_loss": -5.447519302368164, "global_step": 34933, "epoch": 831} {"train_loss": -5.49859619140625, "global_step": 34934, "epoch": 831} {"train_loss": -5.440864086151123, "global_step": 34935, "epoch": 831} {"train_loss": -5.666552543640137, "global_step": 34936, "epoch": 831} {"train_loss": -5.4859137535095215, "global_step": 34937, "epoch": 831} {"train_loss": -5.686634063720703, "global_step": 34938, "epoch": 831} {"train_loss": -5.543898105621338, "global_step": 34939, "epoch": 831} {"train_loss": -5.6401047706604, "global_step": 34940, "epoch": 831} {"train_loss": -5.638530731201172, "global_step": 34941, "epoch": 831} {"train_loss": -5.493471145629883, "global_step": 34942, "epoch": 831} {"train_loss": -5.545639140265329, "global_step": 34943, "epoch": 831, "val_loss": 73736.5390625} {"train_loss": -5.50835657119751, "global_step": 34944, "epoch": 832} {"train_loss": -5.6201629638671875, "global_step": 34945, "epoch": 832} {"train_loss": -5.53420877456665, "global_step": 34946, "epoch": 832} {"train_loss": -5.641788959503174, "global_step": 34947, "epoch": 832} {"train_loss": -5.61594820022583, "global_step": 34948, "epoch": 832} {"train_loss": -5.524295330047607, "global_step": 34949, "epoch": 832} {"train_loss": -5.637623310089111, "global_step": 34950, "epoch": 832} {"train_loss": -5.614902496337891, "global_step": 34951, "epoch": 832} {"train_loss": -5.44881534576416, "global_step": 34952, "epoch": 832} {"train_loss": -5.506463050842285, "global_step": 34953, "epoch": 832} {"train_loss": -5.576618194580078, "global_step": 34954, "epoch": 832} {"train_loss": -5.640956401824951, "global_step": 34955, "epoch": 832} {"train_loss": -5.555776596069336, "global_step": 34956, "epoch": 832} {"train_loss": -5.528446197509766, "global_step": 34957, "epoch": 832} {"train_loss": -5.588252067565918, "global_step": 34958, "epoch": 832} {"train_loss": -5.694546222686768, "global_step": 34959, "epoch": 832} {"train_loss": -5.490018844604492, "global_step": 34960, "epoch": 832} {"train_loss": -5.639672756195068, "global_step": 34961, "epoch": 832} {"train_loss": -5.561424255371094, "global_step": 34962, "epoch": 832} {"train_loss": -5.4228835105896, "global_step": 34963, "epoch": 832} {"train_loss": -5.705757141113281, "global_step": 34964, "epoch": 832} {"train_loss": -5.440907001495361, "global_step": 34965, "epoch": 832} {"train_loss": -5.570669174194336, "global_step": 34966, "epoch": 832} {"train_loss": -5.572994232177734, "global_step": 34967, "epoch": 832} {"train_loss": -5.445101737976074, "global_step": 34968, "epoch": 832} {"train_loss": -5.423234939575195, "global_step": 34969, "epoch": 832} {"train_loss": -5.618805885314941, "global_step": 34970, "epoch": 832} {"train_loss": -5.6097517013549805, "global_step": 34971, "epoch": 832} {"train_loss": -5.5587639808654785, "global_step": 34972, "epoch": 832} {"train_loss": -5.6129021644592285, "global_step": 34973, "epoch": 832} {"train_loss": -5.594667434692383, "global_step": 34974, "epoch": 832} {"train_loss": -5.5807647705078125, "global_step": 34975, "epoch": 832} {"train_loss": -5.523655414581299, "global_step": 34976, "epoch": 832} {"train_loss": -5.589722633361816, "global_step": 34977, "epoch": 832} {"train_loss": -5.648377895355225, "global_step": 34978, "epoch": 832} {"train_loss": -5.58122444152832, "global_step": 34979, "epoch": 832} {"train_loss": -5.561434745788574, "global_step": 34980, "epoch": 832} {"train_loss": -5.488781929016113, "global_step": 34981, "epoch": 832} {"train_loss": -5.550004959106445, "global_step": 34982, "epoch": 832} {"train_loss": -5.588911533355713, "global_step": 34983, "epoch": 832} {"train_loss": -5.492525577545166, "global_step": 34984, "epoch": 832} {"train_loss": -5.562914280664353, "global_step": 34985, "epoch": 832, "val_loss": 74301.640625} {"train_loss": -5.458169460296631, "global_step": 34986, "epoch": 833} {"train_loss": -5.5981245040893555, "global_step": 34987, "epoch": 833} {"train_loss": -5.704958915710449, "global_step": 34988, "epoch": 833} {"train_loss": -5.5645294189453125, "global_step": 34989, "epoch": 833} {"train_loss": -5.5977559089660645, "global_step": 34990, "epoch": 833} {"train_loss": -5.586542129516602, "global_step": 34991, "epoch": 833} {"train_loss": -5.617887496948242, "global_step": 34992, "epoch": 833} {"train_loss": -5.610620498657227, "global_step": 34993, "epoch": 833} {"train_loss": -5.484625339508057, "global_step": 34994, "epoch": 833} {"train_loss": -5.649301528930664, "global_step": 34995, "epoch": 833} {"train_loss": -5.361654281616211, "global_step": 34996, "epoch": 833} {"train_loss": -5.624698638916016, "global_step": 34997, "epoch": 833} {"train_loss": -5.48887300491333, "global_step": 34998, "epoch": 833} {"train_loss": -5.443665504455566, "global_step": 34999, "epoch": 833} {"train_loss": -5.524691581726074, "global_step": 35000, "epoch": 833} {"train_loss": -5.51896333694458, "global_step": 35001, "epoch": 833} {"train_loss": -5.434617519378662, "global_step": 35002, "epoch": 833} {"train_loss": -5.383644104003906, "global_step": 35003, "epoch": 833} {"train_loss": -5.534667491912842, "global_step": 35004, "epoch": 833} {"train_loss": -5.537806510925293, "global_step": 35005, "epoch": 833} {"train_loss": -5.61074161529541, "global_step": 35006, "epoch": 833} {"train_loss": -5.445777893066406, "global_step": 35007, "epoch": 833} {"train_loss": -5.540278434753418, "global_step": 35008, "epoch": 833} {"train_loss": -5.48499059677124, "global_step": 35009, "epoch": 833} {"train_loss": -5.408323287963867, "global_step": 35010, "epoch": 833} {"train_loss": -5.418249130249023, "global_step": 35011, "epoch": 833} {"train_loss": -5.457526206970215, "global_step": 35012, "epoch": 833} {"train_loss": -5.605436325073242, "global_step": 35013, "epoch": 833} {"train_loss": -5.466832160949707, "global_step": 35014, "epoch": 833} {"train_loss": -5.492265701293945, "global_step": 35015, "epoch": 833} {"train_loss": -5.42508602142334, "global_step": 35016, "epoch": 833} {"train_loss": -5.542296409606934, "global_step": 35017, "epoch": 833} {"train_loss": -5.561830520629883, "global_step": 35018, "epoch": 833} {"train_loss": -5.435398101806641, "global_step": 35019, "epoch": 833} {"train_loss": -5.661396026611328, "global_step": 35020, "epoch": 833} {"train_loss": -5.577852249145508, "global_step": 35021, "epoch": 833} {"train_loss": -5.647411346435547, "global_step": 35022, "epoch": 833} {"train_loss": -5.636491298675537, "global_step": 35023, "epoch": 833} {"train_loss": -5.6343913078308105, "global_step": 35024, "epoch": 833} {"train_loss": -5.466821670532227, "global_step": 35025, "epoch": 833} {"train_loss": -5.600131988525391, "global_step": 35026, "epoch": 833} {"train_loss": -5.534492424556187, "global_step": 35027, "epoch": 833, "val_loss": 74053.9609375} {"train_loss": -5.50166130065918, "global_step": 35028, "epoch": 834} {"train_loss": -5.455309867858887, "global_step": 35029, "epoch": 834} {"train_loss": -5.523405075073242, "global_step": 35030, "epoch": 834} {"train_loss": -5.653165817260742, "global_step": 35031, "epoch": 834} {"train_loss": -5.485780239105225, "global_step": 35032, "epoch": 834} {"train_loss": -5.610888481140137, "global_step": 35033, "epoch": 834} {"train_loss": -5.650656223297119, "global_step": 35034, "epoch": 834} {"train_loss": -5.516912937164307, "global_step": 35035, "epoch": 834} {"train_loss": -5.48859167098999, "global_step": 35036, "epoch": 834} {"train_loss": -5.6733808517456055, "global_step": 35037, "epoch": 834} {"train_loss": -5.488030433654785, "global_step": 35038, "epoch": 834} {"train_loss": -5.548730850219727, "global_step": 35039, "epoch": 834} {"train_loss": -5.615886688232422, "global_step": 35040, "epoch": 834} {"train_loss": -5.664499282836914, "global_step": 35041, "epoch": 834} {"train_loss": -5.7298665046691895, "global_step": 35042, "epoch": 834} {"train_loss": -5.564431667327881, "global_step": 35043, "epoch": 834} {"train_loss": -5.69434928894043, "global_step": 35044, "epoch": 834} {"train_loss": -5.539055824279785, "global_step": 35045, "epoch": 834} {"train_loss": -5.567296028137207, "global_step": 35046, "epoch": 834} {"train_loss": -5.540986061096191, "global_step": 35047, "epoch": 834} {"train_loss": -5.616596221923828, "global_step": 35048, "epoch": 834} {"train_loss": -5.60242223739624, "global_step": 35049, "epoch": 834} {"train_loss": -5.543438911437988, "global_step": 35050, "epoch": 834} {"train_loss": -5.494390487670898, "global_step": 35051, "epoch": 834} {"train_loss": -5.420853614807129, "global_step": 35052, "epoch": 834} {"train_loss": -5.48618221282959, "global_step": 35053, "epoch": 834} {"train_loss": -5.41972541809082, "global_step": 35054, "epoch": 834} {"train_loss": -5.441526412963867, "global_step": 35055, "epoch": 834} {"train_loss": -5.63857364654541, "global_step": 35056, "epoch": 834} {"train_loss": -5.490568161010742, "global_step": 35057, "epoch": 834} {"train_loss": -5.624302864074707, "global_step": 35058, "epoch": 834} {"train_loss": -5.5068254470825195, "global_step": 35059, "epoch": 834} {"train_loss": -5.356849670410156, "global_step": 35060, "epoch": 834} {"train_loss": -5.467408180236816, "global_step": 35061, "epoch": 834} {"train_loss": -5.558594226837158, "global_step": 35062, "epoch": 834} {"train_loss": -5.495358467102051, "global_step": 35063, "epoch": 834} {"train_loss": -5.509513854980469, "global_step": 35064, "epoch": 834} {"train_loss": -5.517900466918945, "global_step": 35065, "epoch": 834} {"train_loss": -5.606189250946045, "global_step": 35066, "epoch": 834} {"train_loss": -5.508960247039795, "global_step": 35067, "epoch": 834} {"train_loss": -5.578880310058594, "global_step": 35068, "epoch": 834} {"train_loss": -5.549818595250447, "global_step": 35069, "epoch": 834, "val_loss": 74626.53125} {"train_loss": -5.7146196365356445, "global_step": 35070, "epoch": 835} {"train_loss": -5.523947715759277, "global_step": 35071, "epoch": 835} {"train_loss": -5.585285186767578, "global_step": 35072, "epoch": 835} {"train_loss": -5.575024604797363, "global_step": 35073, "epoch": 835} {"train_loss": -5.645573616027832, "global_step": 35074, "epoch": 835} {"train_loss": -5.610138893127441, "global_step": 35075, "epoch": 835} {"train_loss": -5.54734992980957, "global_step": 35076, "epoch": 835} {"train_loss": -5.468536376953125, "global_step": 35077, "epoch": 835} {"train_loss": -5.579822063446045, "global_step": 35078, "epoch": 835} {"train_loss": -5.485672950744629, "global_step": 35079, "epoch": 835} {"train_loss": -5.659688472747803, "global_step": 35080, "epoch": 835} {"train_loss": -5.554035186767578, "global_step": 35081, "epoch": 835} {"train_loss": -5.517007350921631, "global_step": 35082, "epoch": 835} {"train_loss": -5.542929649353027, "global_step": 35083, "epoch": 835} {"train_loss": -5.630177974700928, "global_step": 35084, "epoch": 835} {"train_loss": -5.468200206756592, "global_step": 35085, "epoch": 835} {"train_loss": -5.496896266937256, "global_step": 35086, "epoch": 835} {"train_loss": -5.6117658615112305, "global_step": 35087, "epoch": 835} {"train_loss": -5.643134117126465, "global_step": 35088, "epoch": 835} {"train_loss": -5.485581398010254, "global_step": 35089, "epoch": 835} {"train_loss": -5.675470352172852, "global_step": 35090, "epoch": 835} {"train_loss": -5.631755828857422, "global_step": 35091, "epoch": 835} {"train_loss": -5.449055194854736, "global_step": 35092, "epoch": 835} {"train_loss": -5.556378364562988, "global_step": 35093, "epoch": 835} {"train_loss": -5.487220287322998, "global_step": 35094, "epoch": 835} {"train_loss": -5.681144714355469, "global_step": 35095, "epoch": 835} {"train_loss": -5.608903884887695, "global_step": 35096, "epoch": 835} {"train_loss": -5.5558624267578125, "global_step": 35097, "epoch": 835} {"train_loss": -5.5017242431640625, "global_step": 35098, "epoch": 835} {"train_loss": -5.484621524810791, "global_step": 35099, "epoch": 835} {"train_loss": -5.713615894317627, "global_step": 35100, "epoch": 835} {"train_loss": -5.509801864624023, "global_step": 35101, "epoch": 835} {"train_loss": -5.61362361907959, "global_step": 35102, "epoch": 835} {"train_loss": -5.641060829162598, "global_step": 35103, "epoch": 835} {"train_loss": -5.612433433532715, "global_step": 35104, "epoch": 835} {"train_loss": -5.588681221008301, "global_step": 35105, "epoch": 835} {"train_loss": -5.605257034301758, "global_step": 35106, "epoch": 835} {"train_loss": -5.531317710876465, "global_step": 35107, "epoch": 835} {"train_loss": -5.538692951202393, "global_step": 35108, "epoch": 835} {"train_loss": -5.582755088806152, "global_step": 35109, "epoch": 835} {"train_loss": -5.568150997161865, "global_step": 35110, "epoch": 835} {"train_loss": -5.57219105675107, "global_step": 35111, "epoch": 835, "val_loss": 73982.4140625} {"train_loss": -5.487626075744629, "global_step": 35112, "epoch": 836} {"train_loss": -5.538919925689697, "global_step": 35113, "epoch": 836} {"train_loss": -5.617269992828369, "global_step": 35114, "epoch": 836} {"train_loss": -5.616204738616943, "global_step": 35115, "epoch": 836} {"train_loss": -5.598313331604004, "global_step": 35116, "epoch": 836} {"train_loss": -5.631183624267578, "global_step": 35117, "epoch": 836} {"train_loss": -5.723958969116211, "global_step": 35118, "epoch": 836} {"train_loss": -5.531068325042725, "global_step": 35119, "epoch": 836} {"train_loss": -5.5230712890625, "global_step": 35120, "epoch": 836} {"train_loss": -5.648348808288574, "global_step": 35121, "epoch": 836} {"train_loss": -5.411454677581787, "global_step": 35122, "epoch": 836} {"train_loss": -5.541671276092529, "global_step": 35123, "epoch": 836} {"train_loss": -5.566454887390137, "global_step": 35124, "epoch": 836} {"train_loss": -5.536998271942139, "global_step": 35125, "epoch": 836} {"train_loss": -5.446325302124023, "global_step": 35126, "epoch": 836} {"train_loss": -5.672563552856445, "global_step": 35127, "epoch": 836} {"train_loss": -5.592976093292236, "global_step": 35128, "epoch": 836} {"train_loss": -5.423986434936523, "global_step": 35129, "epoch": 836} {"train_loss": -5.5388641357421875, "global_step": 35130, "epoch": 836} {"train_loss": -5.650550842285156, "global_step": 35131, "epoch": 836} {"train_loss": -5.546238899230957, "global_step": 35132, "epoch": 836} {"train_loss": -5.597959041595459, "global_step": 35133, "epoch": 836} {"train_loss": -5.551513195037842, "global_step": 35134, "epoch": 836} {"train_loss": -5.513246536254883, "global_step": 35135, "epoch": 836} {"train_loss": -5.513535499572754, "global_step": 35136, "epoch": 836} {"train_loss": -5.466123104095459, "global_step": 35137, "epoch": 836} {"train_loss": -5.50324010848999, "global_step": 35138, "epoch": 836} {"train_loss": -5.581239700317383, "global_step": 35139, "epoch": 836} {"train_loss": -5.513443946838379, "global_step": 35140, "epoch": 836} {"train_loss": -5.563100814819336, "global_step": 35141, "epoch": 836} {"train_loss": -5.554041862487793, "global_step": 35142, "epoch": 836} {"train_loss": -5.57319450378418, "global_step": 35143, "epoch": 836} {"train_loss": -5.289083957672119, "global_step": 35144, "epoch": 836} {"train_loss": -5.4508466720581055, "global_step": 35145, "epoch": 836} {"train_loss": -5.446061134338379, "global_step": 35146, "epoch": 836} {"train_loss": -5.293587684631348, "global_step": 35147, "epoch": 836} {"train_loss": -5.548579216003418, "global_step": 35148, "epoch": 836} {"train_loss": -5.281561851501465, "global_step": 35149, "epoch": 836} {"train_loss": -5.371603965759277, "global_step": 35150, "epoch": 836} {"train_loss": -5.456382751464844, "global_step": 35151, "epoch": 836} {"train_loss": -5.5546417236328125, "global_step": 35152, "epoch": 836} {"train_loss": -5.5248402413867765, "global_step": 35153, "epoch": 836, "val_loss": 74662.1796875} {"train_loss": -5.474645137786865, "global_step": 35154, "epoch": 837} {"train_loss": -5.4276018142700195, "global_step": 35155, "epoch": 837} {"train_loss": -5.571796417236328, "global_step": 35156, "epoch": 837} {"train_loss": -5.580671787261963, "global_step": 35157, "epoch": 837} {"train_loss": -5.46614408493042, "global_step": 35158, "epoch": 837} {"train_loss": -5.480585098266602, "global_step": 35159, "epoch": 837} {"train_loss": -5.669467449188232, "global_step": 35160, "epoch": 837} {"train_loss": -5.52219295501709, "global_step": 35161, "epoch": 837} {"train_loss": -5.465310573577881, "global_step": 35162, "epoch": 837} {"train_loss": -5.540445327758789, "global_step": 35163, "epoch": 837} {"train_loss": -5.524383544921875, "global_step": 35164, "epoch": 837} {"train_loss": -5.665632247924805, "global_step": 35165, "epoch": 837} {"train_loss": -5.463066101074219, "global_step": 35166, "epoch": 837} {"train_loss": -5.6057891845703125, "global_step": 35167, "epoch": 837} {"train_loss": -5.551822662353516, "global_step": 35168, "epoch": 837} {"train_loss": -5.34672737121582, "global_step": 35169, "epoch": 837} {"train_loss": -5.4625325202941895, "global_step": 35170, "epoch": 837} {"train_loss": -5.51457405090332, "global_step": 35171, "epoch": 837} {"train_loss": -5.6384806632995605, "global_step": 35172, "epoch": 837} {"train_loss": -5.570879936218262, "global_step": 35173, "epoch": 837} {"train_loss": -5.454384803771973, "global_step": 35174, "epoch": 837} {"train_loss": -5.553959846496582, "global_step": 35175, "epoch": 837} {"train_loss": -5.5669474601745605, "global_step": 35176, "epoch": 837} {"train_loss": -5.50367546081543, "global_step": 35177, "epoch": 837} {"train_loss": -5.5828447341918945, "global_step": 35178, "epoch": 837} {"train_loss": -5.422201156616211, "global_step": 35179, "epoch": 837} {"train_loss": -5.4113922119140625, "global_step": 35180, "epoch": 837} {"train_loss": -5.497993469238281, "global_step": 35181, "epoch": 837} {"train_loss": -5.61006498336792, "global_step": 35182, "epoch": 837} {"train_loss": -5.542530059814453, "global_step": 35183, "epoch": 837} {"train_loss": -5.508095741271973, "global_step": 35184, "epoch": 837} {"train_loss": -5.5297675132751465, "global_step": 35185, "epoch": 837} {"train_loss": -5.513390064239502, "global_step": 35186, "epoch": 837} {"train_loss": -5.55474853515625, "global_step": 35187, "epoch": 837} {"train_loss": -5.521040916442871, "global_step": 35188, "epoch": 837} {"train_loss": -5.700436592102051, "global_step": 35189, "epoch": 837} {"train_loss": -5.569450855255127, "global_step": 35190, "epoch": 837} {"train_loss": -5.402907848358154, "global_step": 35191, "epoch": 837} {"train_loss": -5.578718185424805, "global_step": 35192, "epoch": 837} {"train_loss": -5.418146133422852, "global_step": 35193, "epoch": 837} {"train_loss": -5.698112487792969, "global_step": 35194, "epoch": 837} {"train_loss": -5.528748580387661, "global_step": 35195, "epoch": 837, "val_loss": 73885.390625} {"train_loss": -5.5618181228637695, "global_step": 35196, "epoch": 838} {"train_loss": -5.497808456420898, "global_step": 35197, "epoch": 838} {"train_loss": -5.7018890380859375, "global_step": 35198, "epoch": 838} {"train_loss": -5.509398937225342, "global_step": 35199, "epoch": 838} {"train_loss": -5.504208564758301, "global_step": 35200, "epoch": 838} {"train_loss": -5.492498397827148, "global_step": 35201, "epoch": 838} {"train_loss": -5.614284515380859, "global_step": 35202, "epoch": 838} {"train_loss": -5.62656307220459, "global_step": 35203, "epoch": 838} {"train_loss": -5.618798732757568, "global_step": 35204, "epoch": 838} {"train_loss": -5.472683906555176, "global_step": 35205, "epoch": 838} {"train_loss": -5.553406238555908, "global_step": 35206, "epoch": 838} {"train_loss": -5.444150924682617, "global_step": 35207, "epoch": 838} {"train_loss": -5.514006614685059, "global_step": 35208, "epoch": 838} {"train_loss": -5.611571788787842, "global_step": 35209, "epoch": 838} {"train_loss": -5.6336669921875, "global_step": 35210, "epoch": 838} {"train_loss": -5.5034894943237305, "global_step": 35211, "epoch": 838} {"train_loss": -5.542947769165039, "global_step": 35212, "epoch": 838} {"train_loss": -5.471737861633301, "global_step": 35213, "epoch": 838} {"train_loss": -5.549080848693848, "global_step": 35214, "epoch": 838} {"train_loss": -5.45192813873291, "global_step": 35215, "epoch": 838} {"train_loss": -5.483010292053223, "global_step": 35216, "epoch": 838} {"train_loss": -5.513089179992676, "global_step": 35217, "epoch": 838} {"train_loss": -5.50041389465332, "global_step": 35218, "epoch": 838} {"train_loss": -5.563435077667236, "global_step": 35219, "epoch": 838} {"train_loss": -5.5459442138671875, "global_step": 35220, "epoch": 838} {"train_loss": -5.389583587646484, "global_step": 35221, "epoch": 838} {"train_loss": -5.545574188232422, "global_step": 35222, "epoch": 838} {"train_loss": -5.441034317016602, "global_step": 35223, "epoch": 838} {"train_loss": -5.50521993637085, "global_step": 35224, "epoch": 838} {"train_loss": -5.397073745727539, "global_step": 35225, "epoch": 838} {"train_loss": -5.462299346923828, "global_step": 35226, "epoch": 838} {"train_loss": -5.502931118011475, "global_step": 35227, "epoch": 838} {"train_loss": -5.453822612762451, "global_step": 35228, "epoch": 838} {"train_loss": -5.595963478088379, "global_step": 35229, "epoch": 838} {"train_loss": -5.5733137130737305, "global_step": 35230, "epoch": 838} {"train_loss": -5.4571380615234375, "global_step": 35231, "epoch": 838} {"train_loss": -5.571042060852051, "global_step": 35232, "epoch": 838} {"train_loss": -5.551532745361328, "global_step": 35233, "epoch": 838} {"train_loss": -5.431281089782715, "global_step": 35234, "epoch": 838} {"train_loss": -5.4241509437561035, "global_step": 35235, "epoch": 838} {"train_loss": -5.494829177856445, "global_step": 35236, "epoch": 838} {"train_loss": -5.519264947800409, "global_step": 35237, "epoch": 838, "val_loss": 74313.328125} {"train_loss": -5.602275848388672, "global_step": 35238, "epoch": 839} {"train_loss": -5.584951400756836, "global_step": 35239, "epoch": 839} {"train_loss": -5.596144676208496, "global_step": 35240, "epoch": 839} {"train_loss": -5.589729309082031, "global_step": 35241, "epoch": 839} {"train_loss": -5.609297752380371, "global_step": 35242, "epoch": 839} {"train_loss": -5.652431011199951, "global_step": 35243, "epoch": 839} {"train_loss": -5.610929012298584, "global_step": 35244, "epoch": 839} {"train_loss": -5.58719539642334, "global_step": 35245, "epoch": 839} {"train_loss": -5.60605525970459, "global_step": 35246, "epoch": 839} {"train_loss": -5.450224876403809, "global_step": 35247, "epoch": 839} {"train_loss": -5.646214485168457, "global_step": 35248, "epoch": 839} {"train_loss": -5.383720397949219, "global_step": 35249, "epoch": 839} {"train_loss": -5.620688438415527, "global_step": 35250, "epoch": 839} {"train_loss": -5.576868534088135, "global_step": 35251, "epoch": 839} {"train_loss": -5.420586109161377, "global_step": 35252, "epoch": 839} {"train_loss": -5.554852485656738, "global_step": 35253, "epoch": 839} {"train_loss": -5.560056686401367, "global_step": 35254, "epoch": 839} {"train_loss": -5.611130714416504, "global_step": 35255, "epoch": 839} {"train_loss": -5.681476593017578, "global_step": 35256, "epoch": 839} {"train_loss": -5.457187652587891, "global_step": 35257, "epoch": 839} {"train_loss": -5.468319892883301, "global_step": 35258, "epoch": 839} {"train_loss": -5.542950630187988, "global_step": 35259, "epoch": 839} {"train_loss": -5.637676239013672, "global_step": 35260, "epoch": 839} {"train_loss": -5.5659260749816895, "global_step": 35261, "epoch": 839} {"train_loss": -5.408587455749512, "global_step": 35262, "epoch": 839} {"train_loss": -5.666910171508789, "global_step": 35263, "epoch": 839} {"train_loss": -5.4600982666015625, "global_step": 35264, "epoch": 839} {"train_loss": -5.560507774353027, "global_step": 35265, "epoch": 839} {"train_loss": -5.573812484741211, "global_step": 35266, "epoch": 839} {"train_loss": -5.53137731552124, "global_step": 35267, "epoch": 839} {"train_loss": -5.604935646057129, "global_step": 35268, "epoch": 839} {"train_loss": -5.4207353591918945, "global_step": 35269, "epoch": 839} {"train_loss": -5.39755916595459, "global_step": 35270, "epoch": 839} {"train_loss": -5.655643463134766, "global_step": 35271, "epoch": 839} {"train_loss": -5.538474082946777, "global_step": 35272, "epoch": 839} {"train_loss": -5.475559711456299, "global_step": 35273, "epoch": 839} {"train_loss": -5.411127090454102, "global_step": 35274, "epoch": 839} {"train_loss": -5.504214763641357, "global_step": 35275, "epoch": 839} {"train_loss": -5.471871376037598, "global_step": 35276, "epoch": 839} {"train_loss": -5.539399147033691, "global_step": 35277, "epoch": 839} {"train_loss": -5.549652099609375, "global_step": 35278, "epoch": 839} {"train_loss": -5.544402553921654, "global_step": 35279, "epoch": 839, "val_loss": 74105.9140625} {"train_loss": -5.423569202423096, "global_step": 35280, "epoch": 840} {"train_loss": -5.417477607727051, "global_step": 35281, "epoch": 840} {"train_loss": -5.450589179992676, "global_step": 35282, "epoch": 840} {"train_loss": -5.548206329345703, "global_step": 35283, "epoch": 840} {"train_loss": -5.396636009216309, "global_step": 35284, "epoch": 840} {"train_loss": -5.586240768432617, "global_step": 35285, "epoch": 840} {"train_loss": -5.4043989181518555, "global_step": 35286, "epoch": 840} {"train_loss": -5.557018280029297, "global_step": 35287, "epoch": 840} {"train_loss": -5.463748931884766, "global_step": 35288, "epoch": 840} {"train_loss": -5.469525337219238, "global_step": 35289, "epoch": 840} {"train_loss": -5.560826301574707, "global_step": 35290, "epoch": 840} {"train_loss": -5.366052627563477, "global_step": 35291, "epoch": 840} {"train_loss": -5.564574718475342, "global_step": 35292, "epoch": 840} {"train_loss": -5.454798698425293, "global_step": 35293, "epoch": 840} {"train_loss": -5.500446796417236, "global_step": 35294, "epoch": 840} {"train_loss": -5.576810359954834, "global_step": 35295, "epoch": 840} {"train_loss": -5.524849891662598, "global_step": 35296, "epoch": 840} {"train_loss": -5.649291038513184, "global_step": 35297, "epoch": 840} {"train_loss": -5.477635860443115, "global_step": 35298, "epoch": 840} {"train_loss": -5.5370378494262695, "global_step": 35299, "epoch": 840} {"train_loss": -5.587101936340332, "global_step": 35300, "epoch": 840} {"train_loss": -5.51162576675415, "global_step": 35301, "epoch": 840} {"train_loss": -5.615605354309082, "global_step": 35302, "epoch": 840} {"train_loss": -5.642856597900391, "global_step": 35303, "epoch": 840} {"train_loss": -5.537541389465332, "global_step": 35304, "epoch": 840} {"train_loss": -5.59982442855835, "global_step": 35305, "epoch": 840} {"train_loss": -5.590523719787598, "global_step": 35306, "epoch": 840} {"train_loss": -5.586470603942871, "global_step": 35307, "epoch": 840} {"train_loss": -5.764215469360352, "global_step": 35308, "epoch": 840} {"train_loss": -5.560998916625977, "global_step": 35309, "epoch": 840} {"train_loss": -5.56764030456543, "global_step": 35310, "epoch": 840} {"train_loss": -5.605358600616455, "global_step": 35311, "epoch": 840} {"train_loss": -5.576347827911377, "global_step": 35312, "epoch": 840} {"train_loss": -5.504560470581055, "global_step": 35313, "epoch": 840} {"train_loss": -5.41593074798584, "global_step": 35314, "epoch": 840} {"train_loss": -5.721558094024658, "global_step": 35315, "epoch": 840} {"train_loss": -5.500604629516602, "global_step": 35316, "epoch": 840} {"train_loss": -5.506272315979004, "global_step": 35317, "epoch": 840} {"train_loss": -5.563671112060547, "global_step": 35318, "epoch": 840} {"train_loss": -5.664795875549316, "global_step": 35319, "epoch": 840} {"train_loss": -5.564253330230713, "global_step": 35320, "epoch": 840} {"train_loss": -5.5405331793285555, "global_step": 35321, "epoch": 840, "val_loss": 74245.96875} {"train_loss": -5.453448295593262, "global_step": 35322, "epoch": 841} {"train_loss": -5.673591136932373, "global_step": 35323, "epoch": 841} {"train_loss": -5.374007701873779, "global_step": 35324, "epoch": 841} {"train_loss": -5.583236217498779, "global_step": 35325, "epoch": 841} {"train_loss": -5.608402252197266, "global_step": 35326, "epoch": 841} {"train_loss": -5.550074577331543, "global_step": 35327, "epoch": 841} {"train_loss": -5.634267807006836, "global_step": 35328, "epoch": 841} {"train_loss": -5.445736408233643, "global_step": 35329, "epoch": 841} {"train_loss": -5.464391708374023, "global_step": 35330, "epoch": 841} {"train_loss": -5.638867378234863, "global_step": 35331, "epoch": 841} {"train_loss": -5.509197235107422, "global_step": 35332, "epoch": 841} {"train_loss": -5.542009353637695, "global_step": 35333, "epoch": 841} {"train_loss": -5.654701232910156, "global_step": 35334, "epoch": 841} {"train_loss": -5.466640949249268, "global_step": 35335, "epoch": 841} {"train_loss": -5.568767070770264, "global_step": 35336, "epoch": 841} {"train_loss": -5.465934753417969, "global_step": 35337, "epoch": 841} {"train_loss": -5.652746677398682, "global_step": 35338, "epoch": 841} {"train_loss": -5.483679294586182, "global_step": 35339, "epoch": 841} {"train_loss": -5.489355087280273, "global_step": 35340, "epoch": 841} {"train_loss": -5.544866561889648, "global_step": 35341, "epoch": 841} {"train_loss": -5.491089344024658, "global_step": 35342, "epoch": 841} {"train_loss": -5.510061264038086, "global_step": 35343, "epoch": 841} {"train_loss": -5.608428955078125, "global_step": 35344, "epoch": 841} {"train_loss": -5.470690727233887, "global_step": 35345, "epoch": 841} {"train_loss": -5.586208343505859, "global_step": 35346, "epoch": 841} {"train_loss": -5.532021522521973, "global_step": 35347, "epoch": 841} {"train_loss": -5.548632621765137, "global_step": 35348, "epoch": 841} {"train_loss": -5.592175006866455, "global_step": 35349, "epoch": 841} {"train_loss": -5.45783805847168, "global_step": 35350, "epoch": 841} {"train_loss": -5.539472579956055, "global_step": 35351, "epoch": 841} {"train_loss": -5.587475776672363, "global_step": 35352, "epoch": 841} {"train_loss": -5.515235900878906, "global_step": 35353, "epoch": 841} {"train_loss": -5.583093166351318, "global_step": 35354, "epoch": 841} {"train_loss": -5.525835037231445, "global_step": 35355, "epoch": 841} {"train_loss": -5.611461639404297, "global_step": 35356, "epoch": 841} {"train_loss": -5.517862796783447, "global_step": 35357, "epoch": 841} {"train_loss": -5.486686706542969, "global_step": 35358, "epoch": 841} {"train_loss": -5.480070114135742, "global_step": 35359, "epoch": 841} {"train_loss": -5.512560844421387, "global_step": 35360, "epoch": 841} {"train_loss": -5.5015153884887695, "global_step": 35361, "epoch": 841} {"train_loss": -5.519324779510498, "global_step": 35362, "epoch": 841} {"train_loss": -5.5335494336627775, "global_step": 35363, "epoch": 841, "val_loss": 74908.625} {"train_loss": -5.491772174835205, "global_step": 35364, "epoch": 842} {"train_loss": -5.644776344299316, "global_step": 35365, "epoch": 842} {"train_loss": -5.5700812339782715, "global_step": 35366, "epoch": 842} {"train_loss": -5.576792240142822, "global_step": 35367, "epoch": 842} {"train_loss": -5.717872619628906, "global_step": 35368, "epoch": 842} {"train_loss": -5.495457649230957, "global_step": 35369, "epoch": 842} {"train_loss": -5.488692760467529, "global_step": 35370, "epoch": 842} {"train_loss": -5.524328708648682, "global_step": 35371, "epoch": 842} {"train_loss": -5.5488996505737305, "global_step": 35372, "epoch": 842} {"train_loss": -5.551248550415039, "global_step": 35373, "epoch": 842} {"train_loss": -5.614264488220215, "global_step": 35374, "epoch": 842} {"train_loss": -5.610898017883301, "global_step": 35375, "epoch": 842} {"train_loss": -5.520526885986328, "global_step": 35376, "epoch": 842} {"train_loss": -5.6230788230896, "global_step": 35377, "epoch": 842} {"train_loss": -5.47430419921875, "global_step": 35378, "epoch": 842} {"train_loss": -5.660845756530762, "global_step": 35379, "epoch": 842} {"train_loss": -5.683550834655762, "global_step": 35380, "epoch": 842} {"train_loss": -5.377251148223877, "global_step": 35381, "epoch": 842} {"train_loss": -5.47076940536499, "global_step": 35382, "epoch": 842} {"train_loss": -5.581939697265625, "global_step": 35383, "epoch": 842} {"train_loss": -5.464387893676758, "global_step": 35384, "epoch": 842} {"train_loss": -5.504910469055176, "global_step": 35385, "epoch": 842} {"train_loss": -5.4219746589660645, "global_step": 35386, "epoch": 842} {"train_loss": -5.578148365020752, "global_step": 35387, "epoch": 842} {"train_loss": -5.441390037536621, "global_step": 35388, "epoch": 842} {"train_loss": -5.565278053283691, "global_step": 35389, "epoch": 842} {"train_loss": -5.4392313957214355, "global_step": 35390, "epoch": 842} {"train_loss": -5.622620105743408, "global_step": 35391, "epoch": 842} {"train_loss": -5.5631608963012695, "global_step": 35392, "epoch": 842} {"train_loss": -5.530759811401367, "global_step": 35393, "epoch": 842} {"train_loss": -5.398727893829346, "global_step": 35394, "epoch": 842} {"train_loss": -5.579399108886719, "global_step": 35395, "epoch": 842} {"train_loss": -5.511481761932373, "global_step": 35396, "epoch": 842} {"train_loss": -5.495392799377441, "global_step": 35397, "epoch": 842} {"train_loss": -5.51054573059082, "global_step": 35398, "epoch": 842} {"train_loss": -5.450380802154541, "global_step": 35399, "epoch": 842} {"train_loss": -5.569446563720703, "global_step": 35400, "epoch": 842} {"train_loss": -5.602913856506348, "global_step": 35401, "epoch": 842} {"train_loss": -5.673744201660156, "global_step": 35402, "epoch": 842} {"train_loss": -5.52467155456543, "global_step": 35403, "epoch": 842} {"train_loss": -5.55440092086792, "global_step": 35404, "epoch": 842} {"train_loss": -5.54176850545974, "global_step": 35405, "epoch": 842, "val_loss": 73927.8046875} {"train_loss": -5.5771684646606445, "global_step": 35406, "epoch": 843} {"train_loss": -5.633636474609375, "global_step": 35407, "epoch": 843} {"train_loss": -5.627085208892822, "global_step": 35408, "epoch": 843} {"train_loss": -5.647933006286621, "global_step": 35409, "epoch": 843} {"train_loss": -5.564184188842773, "global_step": 35410, "epoch": 843} {"train_loss": -5.597150802612305, "global_step": 35411, "epoch": 843} {"train_loss": -5.591451168060303, "global_step": 35412, "epoch": 843} {"train_loss": -5.587883472442627, "global_step": 35413, "epoch": 843} {"train_loss": -5.508105278015137, "global_step": 35414, "epoch": 843} {"train_loss": -5.654269218444824, "global_step": 35415, "epoch": 843} {"train_loss": -5.48681640625, "global_step": 35416, "epoch": 843} {"train_loss": -5.662464141845703, "global_step": 35417, "epoch": 843} {"train_loss": -5.548345565795898, "global_step": 35418, "epoch": 843} {"train_loss": -5.5747389793396, "global_step": 35419, "epoch": 843} {"train_loss": -5.496241092681885, "global_step": 35420, "epoch": 843} {"train_loss": -5.645364284515381, "global_step": 35421, "epoch": 843} {"train_loss": -5.450249671936035, "global_step": 35422, "epoch": 843} {"train_loss": -5.457078456878662, "global_step": 35423, "epoch": 843} {"train_loss": -5.466729164123535, "global_step": 35424, "epoch": 843} {"train_loss": -5.589027404785156, "global_step": 35425, "epoch": 843} {"train_loss": -5.5046186447143555, "global_step": 35426, "epoch": 843} {"train_loss": -5.569338798522949, "global_step": 35427, "epoch": 843} {"train_loss": -5.580971717834473, "global_step": 35428, "epoch": 843} {"train_loss": -5.59733772277832, "global_step": 35429, "epoch": 843} {"train_loss": -5.574314117431641, "global_step": 35430, "epoch": 843} {"train_loss": -5.5870466232299805, "global_step": 35431, "epoch": 843} {"train_loss": -5.607053756713867, "global_step": 35432, "epoch": 843} {"train_loss": -5.631982326507568, "global_step": 35433, "epoch": 843} {"train_loss": -5.467970848083496, "global_step": 35434, "epoch": 843} {"train_loss": -5.690356254577637, "global_step": 35435, "epoch": 843} {"train_loss": -5.520255088806152, "global_step": 35436, "epoch": 843} {"train_loss": -5.579418182373047, "global_step": 35437, "epoch": 843} {"train_loss": -5.472093105316162, "global_step": 35438, "epoch": 843} {"train_loss": -5.6143598556518555, "global_step": 35439, "epoch": 843} {"train_loss": -5.405059814453125, "global_step": 35440, "epoch": 843} {"train_loss": -5.566961288452148, "global_step": 35441, "epoch": 843} {"train_loss": -5.619973182678223, "global_step": 35442, "epoch": 843} {"train_loss": -5.425206661224365, "global_step": 35443, "epoch": 843} {"train_loss": -5.500615119934082, "global_step": 35444, "epoch": 843} {"train_loss": -5.674193859100342, "global_step": 35445, "epoch": 843} {"train_loss": -5.604008197784424, "global_step": 35446, "epoch": 843} {"train_loss": -5.561519418443952, "global_step": 35447, "epoch": 843, "val_loss": 73766.671875} {"train_loss": -5.459850311279297, "global_step": 35448, "epoch": 844} {"train_loss": -5.545771598815918, "global_step": 35449, "epoch": 844} {"train_loss": -5.446091651916504, "global_step": 35450, "epoch": 844} {"train_loss": -5.648663520812988, "global_step": 35451, "epoch": 844} {"train_loss": -5.476483345031738, "global_step": 35452, "epoch": 844} {"train_loss": -5.550989627838135, "global_step": 35453, "epoch": 844} {"train_loss": -5.588539123535156, "global_step": 35454, "epoch": 844} {"train_loss": -5.511899948120117, "global_step": 35455, "epoch": 844} {"train_loss": -5.453858375549316, "global_step": 35456, "epoch": 844} {"train_loss": -5.443544387817383, "global_step": 35457, "epoch": 844} {"train_loss": -5.392589092254639, "global_step": 35458, "epoch": 844} {"train_loss": -5.39726448059082, "global_step": 35459, "epoch": 844} {"train_loss": -5.6766886711120605, "global_step": 35460, "epoch": 844} {"train_loss": -5.638890266418457, "global_step": 35461, "epoch": 844} {"train_loss": -5.560273170471191, "global_step": 35462, "epoch": 844} {"train_loss": -5.593220233917236, "global_step": 35463, "epoch": 844} {"train_loss": -5.603033065795898, "global_step": 35464, "epoch": 844} {"train_loss": -5.55721378326416, "global_step": 35465, "epoch": 844} {"train_loss": -5.660749435424805, "global_step": 35466, "epoch": 844} {"train_loss": -5.7102155685424805, "global_step": 35467, "epoch": 844} {"train_loss": -5.588865756988525, "global_step": 35468, "epoch": 844} {"train_loss": -5.495356559753418, "global_step": 35469, "epoch": 844} {"train_loss": -5.575458526611328, "global_step": 35470, "epoch": 844} {"train_loss": -5.610928535461426, "global_step": 35471, "epoch": 844} {"train_loss": -5.550273895263672, "global_step": 35472, "epoch": 844} {"train_loss": -5.6680908203125, "global_step": 35473, "epoch": 844} {"train_loss": -5.702129364013672, "global_step": 35474, "epoch": 844} {"train_loss": -5.474321365356445, "global_step": 35475, "epoch": 844} {"train_loss": -5.625733852386475, "global_step": 35476, "epoch": 844} {"train_loss": -5.581934452056885, "global_step": 35477, "epoch": 844} {"train_loss": -5.691784858703613, "global_step": 35478, "epoch": 844} {"train_loss": -5.4985504150390625, "global_step": 35479, "epoch": 844} {"train_loss": -5.562265396118164, "global_step": 35480, "epoch": 844} {"train_loss": -5.452569961547852, "global_step": 35481, "epoch": 844} {"train_loss": -5.452548027038574, "global_step": 35482, "epoch": 844} {"train_loss": -5.546338081359863, "global_step": 35483, "epoch": 844} {"train_loss": -5.394650459289551, "global_step": 35484, "epoch": 844} {"train_loss": -5.5295209884643555, "global_step": 35485, "epoch": 844} {"train_loss": -5.477165222167969, "global_step": 35486, "epoch": 844} {"train_loss": -5.567508697509766, "global_step": 35487, "epoch": 844} {"train_loss": -5.498157978057861, "global_step": 35488, "epoch": 844} {"train_loss": -5.549633366721017, "global_step": 35489, "epoch": 844, "val_loss": 74342.6640625} {"train_loss": -5.627263069152832, "global_step": 35490, "epoch": 845} {"train_loss": -5.588407516479492, "global_step": 35491, "epoch": 845} {"train_loss": -5.60720157623291, "global_step": 35492, "epoch": 845} {"train_loss": -5.498691558837891, "global_step": 35493, "epoch": 845} {"train_loss": -5.560518741607666, "global_step": 35494, "epoch": 845} {"train_loss": -5.462696075439453, "global_step": 35495, "epoch": 845} {"train_loss": -5.65830135345459, "global_step": 35496, "epoch": 845} {"train_loss": -5.458320140838623, "global_step": 35497, "epoch": 845} {"train_loss": -5.47962760925293, "global_step": 35498, "epoch": 845} {"train_loss": -5.598730087280273, "global_step": 35499, "epoch": 845} {"train_loss": -5.548299789428711, "global_step": 35500, "epoch": 845} {"train_loss": -5.508398056030273, "global_step": 35501, "epoch": 845} {"train_loss": -5.519161701202393, "global_step": 35502, "epoch": 845} {"train_loss": -5.5197553634643555, "global_step": 35503, "epoch": 845} {"train_loss": -5.619336128234863, "global_step": 35504, "epoch": 845} {"train_loss": -5.537219047546387, "global_step": 35505, "epoch": 845} {"train_loss": -5.4854207038879395, "global_step": 35506, "epoch": 845} {"train_loss": -5.580000877380371, "global_step": 35507, "epoch": 845} {"train_loss": -5.511866092681885, "global_step": 35508, "epoch": 845} {"train_loss": -5.581399917602539, "global_step": 35509, "epoch": 845} {"train_loss": -5.59119176864624, "global_step": 35510, "epoch": 845} {"train_loss": -5.616805076599121, "global_step": 35511, "epoch": 845} {"train_loss": -5.643259048461914, "global_step": 35512, "epoch": 845} {"train_loss": -5.672266960144043, "global_step": 35513, "epoch": 845} {"train_loss": -5.682435989379883, "global_step": 35514, "epoch": 845} {"train_loss": -5.588443279266357, "global_step": 35515, "epoch": 845} {"train_loss": -5.629881858825684, "global_step": 35516, "epoch": 845} {"train_loss": -5.674408912658691, "global_step": 35517, "epoch": 845} {"train_loss": -5.622998237609863, "global_step": 35518, "epoch": 845} {"train_loss": -5.607796669006348, "global_step": 35519, "epoch": 845} {"train_loss": -5.475272178649902, "global_step": 35520, "epoch": 845} {"train_loss": -5.56735897064209, "global_step": 35521, "epoch": 845} {"train_loss": -5.545701026916504, "global_step": 35522, "epoch": 845} {"train_loss": -5.629279136657715, "global_step": 35523, "epoch": 845} {"train_loss": -5.605036735534668, "global_step": 35524, "epoch": 845} {"train_loss": -5.541329383850098, "global_step": 35525, "epoch": 845} {"train_loss": -5.552837371826172, "global_step": 35526, "epoch": 845} {"train_loss": -5.593854904174805, "global_step": 35527, "epoch": 845} {"train_loss": -5.65681266784668, "global_step": 35528, "epoch": 845} {"train_loss": -5.726146697998047, "global_step": 35529, "epoch": 845} {"train_loss": -5.6645121574401855, "global_step": 35530, "epoch": 845} {"train_loss": -5.579611869085403, "global_step": 35531, "epoch": 845, "val_loss": 73986.9609375} {"train_loss": -5.667171955108643, "global_step": 35532, "epoch": 846} {"train_loss": -5.6123857498168945, "global_step": 35533, "epoch": 846} {"train_loss": -5.564491271972656, "global_step": 35534, "epoch": 846} {"train_loss": -5.758035659790039, "global_step": 35535, "epoch": 846} {"train_loss": -5.555932998657227, "global_step": 35536, "epoch": 846} {"train_loss": -5.5139241218566895, "global_step": 35537, "epoch": 846} {"train_loss": -5.516684532165527, "global_step": 35538, "epoch": 846} {"train_loss": -5.464301586151123, "global_step": 35539, "epoch": 846} {"train_loss": -5.459022521972656, "global_step": 35540, "epoch": 846} {"train_loss": -5.557883262634277, "global_step": 35541, "epoch": 846} {"train_loss": -5.389999866485596, "global_step": 35542, "epoch": 846} {"train_loss": -5.553197860717773, "global_step": 35543, "epoch": 846} {"train_loss": -5.667022705078125, "global_step": 35544, "epoch": 846} {"train_loss": -5.601593494415283, "global_step": 35545, "epoch": 846} {"train_loss": -5.601631164550781, "global_step": 35546, "epoch": 846} {"train_loss": -5.649687767028809, "global_step": 35547, "epoch": 846} {"train_loss": -5.479190349578857, "global_step": 35548, "epoch": 846} {"train_loss": -5.54276180267334, "global_step": 35549, "epoch": 846} {"train_loss": -5.585869312286377, "global_step": 35550, "epoch": 846} {"train_loss": -5.64777946472168, "global_step": 35551, "epoch": 846} {"train_loss": -5.681357383728027, "global_step": 35552, "epoch": 846} {"train_loss": -5.592747688293457, "global_step": 35553, "epoch": 846} {"train_loss": -5.4762420654296875, "global_step": 35554, "epoch": 846} {"train_loss": -5.478105545043945, "global_step": 35555, "epoch": 846} {"train_loss": -5.548448085784912, "global_step": 35556, "epoch": 846} {"train_loss": -5.644649028778076, "global_step": 35557, "epoch": 846} {"train_loss": -5.660538673400879, "global_step": 35558, "epoch": 846} {"train_loss": -5.554220199584961, "global_step": 35559, "epoch": 846} {"train_loss": -5.532872200012207, "global_step": 35560, "epoch": 846} {"train_loss": -5.540354251861572, "global_step": 35561, "epoch": 846} {"train_loss": -5.613948822021484, "global_step": 35562, "epoch": 846} {"train_loss": -5.65526008605957, "global_step": 35563, "epoch": 846} {"train_loss": -5.53868293762207, "global_step": 35564, "epoch": 846} {"train_loss": -5.599809169769287, "global_step": 35565, "epoch": 846} {"train_loss": -5.6595001220703125, "global_step": 35566, "epoch": 846} {"train_loss": -5.496106147766113, "global_step": 35567, "epoch": 846} {"train_loss": -5.572876930236816, "global_step": 35568, "epoch": 846} {"train_loss": -5.6004533767700195, "global_step": 35569, "epoch": 846} {"train_loss": -5.540499687194824, "global_step": 35570, "epoch": 846} {"train_loss": -5.510318756103516, "global_step": 35571, "epoch": 846} {"train_loss": -5.637497901916504, "global_step": 35572, "epoch": 846} {"train_loss": -5.574749356224423, "global_step": 35573, "epoch": 846, "val_loss": 74160.1015625} {"train_loss": -5.613746643066406, "global_step": 35574, "epoch": 847} {"train_loss": -5.663597106933594, "global_step": 35575, "epoch": 847} {"train_loss": -5.63004207611084, "global_step": 35576, "epoch": 847} {"train_loss": -5.3416852951049805, "global_step": 35577, "epoch": 847} {"train_loss": -5.523862838745117, "global_step": 35578, "epoch": 847} {"train_loss": -5.6710100173950195, "global_step": 35579, "epoch": 847} {"train_loss": -5.494586944580078, "global_step": 35580, "epoch": 847} {"train_loss": -5.502168655395508, "global_step": 35581, "epoch": 847} {"train_loss": -5.469945907592773, "global_step": 35582, "epoch": 847} {"train_loss": -5.47390604019165, "global_step": 35583, "epoch": 847} {"train_loss": -5.541139602661133, "global_step": 35584, "epoch": 847} {"train_loss": -5.520726203918457, "global_step": 35585, "epoch": 847} {"train_loss": -5.444538593292236, "global_step": 35586, "epoch": 847} {"train_loss": -5.443867206573486, "global_step": 35587, "epoch": 847} {"train_loss": -5.4611406326293945, "global_step": 35588, "epoch": 847} {"train_loss": -5.558881759643555, "global_step": 35589, "epoch": 847} {"train_loss": -5.46470308303833, "global_step": 35590, "epoch": 847} {"train_loss": -5.47947359085083, "global_step": 35591, "epoch": 847} {"train_loss": -5.57853889465332, "global_step": 35592, "epoch": 847} {"train_loss": -5.521186828613281, "global_step": 35593, "epoch": 847} {"train_loss": -5.564696311950684, "global_step": 35594, "epoch": 847} {"train_loss": -5.40478515625, "global_step": 35595, "epoch": 847} {"train_loss": -5.553021430969238, "global_step": 35596, "epoch": 847} {"train_loss": -5.540041446685791, "global_step": 35597, "epoch": 847} {"train_loss": -5.421191215515137, "global_step": 35598, "epoch": 847} {"train_loss": -5.452689170837402, "global_step": 35599, "epoch": 847} {"train_loss": -5.557998180389404, "global_step": 35600, "epoch": 847} {"train_loss": -5.243715286254883, "global_step": 35601, "epoch": 847} {"train_loss": -5.612735748291016, "global_step": 35602, "epoch": 847} {"train_loss": -5.5123701095581055, "global_step": 35603, "epoch": 847} {"train_loss": -5.504324913024902, "global_step": 35604, "epoch": 847} {"train_loss": -5.5343451499938965, "global_step": 35605, "epoch": 847} {"train_loss": -5.476222038269043, "global_step": 35606, "epoch": 847} {"train_loss": -5.602621555328369, "global_step": 35607, "epoch": 847} {"train_loss": -5.5906476974487305, "global_step": 35608, "epoch": 847} {"train_loss": -5.524808883666992, "global_step": 35609, "epoch": 847} {"train_loss": -5.774662017822266, "global_step": 35610, "epoch": 847} {"train_loss": -5.632882595062256, "global_step": 35611, "epoch": 847} {"train_loss": -5.569826126098633, "global_step": 35612, "epoch": 847} {"train_loss": -5.594213008880615, "global_step": 35613, "epoch": 847} {"train_loss": -5.541684150695801, "global_step": 35614, "epoch": 847} {"train_loss": -5.524511768704369, "global_step": 35615, "epoch": 847, "val_loss": 74146.2890625} {"train_loss": -5.6277360916137695, "global_step": 35616, "epoch": 848} {"train_loss": -5.556836128234863, "global_step": 35617, "epoch": 848} {"train_loss": -5.374894142150879, "global_step": 35618, "epoch": 848} {"train_loss": -5.587677955627441, "global_step": 35619, "epoch": 848} {"train_loss": -5.65289306640625, "global_step": 35620, "epoch": 848} {"train_loss": -5.492101669311523, "global_step": 35621, "epoch": 848} {"train_loss": -5.55679988861084, "global_step": 35622, "epoch": 848} {"train_loss": -5.546952247619629, "global_step": 35623, "epoch": 848} {"train_loss": -5.634270668029785, "global_step": 35624, "epoch": 848} {"train_loss": -5.465965270996094, "global_step": 35625, "epoch": 848} {"train_loss": -5.499857425689697, "global_step": 35626, "epoch": 848} {"train_loss": -5.611615180969238, "global_step": 35627, "epoch": 848} {"train_loss": -5.505853652954102, "global_step": 35628, "epoch": 848} {"train_loss": -5.551896572113037, "global_step": 35629, "epoch": 848} {"train_loss": -5.556334972381592, "global_step": 35630, "epoch": 848} {"train_loss": -5.580936431884766, "global_step": 35631, "epoch": 848} {"train_loss": -5.5399394035339355, "global_step": 35632, "epoch": 848} {"train_loss": -5.593642234802246, "global_step": 35633, "epoch": 848} {"train_loss": -5.49686861038208, "global_step": 35634, "epoch": 848} {"train_loss": -5.514152526855469, "global_step": 35635, "epoch": 848} {"train_loss": -5.614416122436523, "global_step": 35636, "epoch": 848} {"train_loss": -5.455066204071045, "global_step": 35637, "epoch": 848} {"train_loss": -5.53347635269165, "global_step": 35638, "epoch": 848} {"train_loss": -5.489011764526367, "global_step": 35639, "epoch": 848} {"train_loss": -5.584405422210693, "global_step": 35640, "epoch": 848} {"train_loss": -5.560386657714844, "global_step": 35641, "epoch": 848} {"train_loss": -5.551032066345215, "global_step": 35642, "epoch": 848} {"train_loss": -5.663694381713867, "global_step": 35643, "epoch": 848} {"train_loss": -5.638791084289551, "global_step": 35644, "epoch": 848} {"train_loss": -5.529088020324707, "global_step": 35645, "epoch": 848} {"train_loss": -5.519840240478516, "global_step": 35646, "epoch": 848} {"train_loss": -5.536277770996094, "global_step": 35647, "epoch": 848} {"train_loss": -5.555757522583008, "global_step": 35648, "epoch": 848} {"train_loss": -5.423446178436279, "global_step": 35649, "epoch": 848} {"train_loss": -5.547628402709961, "global_step": 35650, "epoch": 848} {"train_loss": -5.569323539733887, "global_step": 35651, "epoch": 848} {"train_loss": -5.522917747497559, "global_step": 35652, "epoch": 848} {"train_loss": -5.487698554992676, "global_step": 35653, "epoch": 848} {"train_loss": -5.543976306915283, "global_step": 35654, "epoch": 848} {"train_loss": -5.49951696395874, "global_step": 35655, "epoch": 848} {"train_loss": -5.496582984924316, "global_step": 35656, "epoch": 848} {"train_loss": -5.544341314406622, "global_step": 35657, "epoch": 848, "val_loss": 74627.90625} {"train_loss": -5.579365253448486, "global_step": 35658, "epoch": 849} {"train_loss": -5.6181321144104, "global_step": 35659, "epoch": 849} {"train_loss": -5.642980575561523, "global_step": 35660, "epoch": 849} {"train_loss": -5.621350288391113, "global_step": 35661, "epoch": 849} {"train_loss": -5.580390453338623, "global_step": 35662, "epoch": 849} {"train_loss": -5.511466026306152, "global_step": 35663, "epoch": 849} {"train_loss": -5.462527275085449, "global_step": 35664, "epoch": 849} {"train_loss": -5.587800025939941, "global_step": 35665, "epoch": 849} {"train_loss": -5.361297130584717, "global_step": 35666, "epoch": 849} {"train_loss": -5.572832107543945, "global_step": 35667, "epoch": 849} {"train_loss": -5.551543235778809, "global_step": 35668, "epoch": 849} {"train_loss": -5.5055670738220215, "global_step": 35669, "epoch": 849} {"train_loss": -5.4870758056640625, "global_step": 35670, "epoch": 849} {"train_loss": -5.569333076477051, "global_step": 35671, "epoch": 849} {"train_loss": -5.506547927856445, "global_step": 35672, "epoch": 849} {"train_loss": -5.6224870681762695, "global_step": 35673, "epoch": 849} {"train_loss": -5.573516845703125, "global_step": 35674, "epoch": 849} {"train_loss": -5.521601676940918, "global_step": 35675, "epoch": 849} {"train_loss": -5.54226541519165, "global_step": 35676, "epoch": 849} {"train_loss": -5.69513463973999, "global_step": 35677, "epoch": 849} {"train_loss": -5.677803993225098, "global_step": 35678, "epoch": 849} {"train_loss": -5.6103057861328125, "global_step": 35679, "epoch": 849} {"train_loss": -5.611759185791016, "global_step": 35680, "epoch": 849} {"train_loss": -5.567551136016846, "global_step": 35681, "epoch": 849} {"train_loss": -5.619154930114746, "global_step": 35682, "epoch": 849} {"train_loss": -5.386521339416504, "global_step": 35683, "epoch": 849} {"train_loss": -5.46712589263916, "global_step": 35684, "epoch": 849} {"train_loss": -5.593194961547852, "global_step": 35685, "epoch": 849} {"train_loss": -5.550604820251465, "global_step": 35686, "epoch": 849} {"train_loss": -5.544379234313965, "global_step": 35687, "epoch": 849} {"train_loss": -5.657873630523682, "global_step": 35688, "epoch": 849} {"train_loss": -5.4751176834106445, "global_step": 35689, "epoch": 849} {"train_loss": -5.576963424682617, "global_step": 35690, "epoch": 849} {"train_loss": -5.581186294555664, "global_step": 35691, "epoch": 849} {"train_loss": -5.50946569442749, "global_step": 35692, "epoch": 849} {"train_loss": -5.48867654800415, "global_step": 35693, "epoch": 849} {"train_loss": -5.559096336364746, "global_step": 35694, "epoch": 849} {"train_loss": -5.585230350494385, "global_step": 35695, "epoch": 849} {"train_loss": -5.539300918579102, "global_step": 35696, "epoch": 849} {"train_loss": -5.497528553009033, "global_step": 35697, "epoch": 849} {"train_loss": -5.5520172119140625, "global_step": 35698, "epoch": 849} {"train_loss": -5.555930966422672, "global_step": 35699, "epoch": 849, "val_loss": 74114.2578125} {"train_loss": -5.624576568603516, "global_step": 35700, "epoch": 850} {"train_loss": -5.517208099365234, "global_step": 35701, "epoch": 850} {"train_loss": -5.494840621948242, "global_step": 35702, "epoch": 850} {"train_loss": -5.562273025512695, "global_step": 35703, "epoch": 850} {"train_loss": -5.441524028778076, "global_step": 35704, "epoch": 850} {"train_loss": -5.64911413192749, "global_step": 35705, "epoch": 850} {"train_loss": -5.513251304626465, "global_step": 35706, "epoch": 850} {"train_loss": -5.744714736938477, "global_step": 35707, "epoch": 850} {"train_loss": -5.532661437988281, "global_step": 35708, "epoch": 850} {"train_loss": -5.567208290100098, "global_step": 35709, "epoch": 850} {"train_loss": -5.547235488891602, "global_step": 35710, "epoch": 850} {"train_loss": -5.633106231689453, "global_step": 35711, "epoch": 850} {"train_loss": -5.5317463874816895, "global_step": 35712, "epoch": 850} {"train_loss": -5.523789405822754, "global_step": 35713, "epoch": 850} {"train_loss": -5.643959045410156, "global_step": 35714, "epoch": 850} {"train_loss": -5.672877311706543, "global_step": 35715, "epoch": 850} {"train_loss": -5.536249160766602, "global_step": 35716, "epoch": 850} {"train_loss": -5.438835144042969, "global_step": 35717, "epoch": 850} {"train_loss": -5.528045177459717, "global_step": 35718, "epoch": 850} {"train_loss": -5.463350296020508, "global_step": 35719, "epoch": 850} {"train_loss": -5.619725704193115, "global_step": 35720, "epoch": 850} {"train_loss": -5.539490699768066, "global_step": 35721, "epoch": 850} {"train_loss": -5.562050819396973, "global_step": 35722, "epoch": 850} {"train_loss": -5.502255439758301, "global_step": 35723, "epoch": 850} {"train_loss": -5.589951515197754, "global_step": 35724, "epoch": 850} {"train_loss": -5.505704879760742, "global_step": 35725, "epoch": 850} {"train_loss": -5.586972236633301, "global_step": 35726, "epoch": 850} {"train_loss": -5.527985095977783, "global_step": 35727, "epoch": 850} {"train_loss": -5.5856451988220215, "global_step": 35728, "epoch": 850} {"train_loss": -5.539234161376953, "global_step": 35729, "epoch": 850} {"train_loss": -5.526803016662598, "global_step": 35730, "epoch": 850} {"train_loss": -5.628563404083252, "global_step": 35731, "epoch": 850} {"train_loss": -5.5819244384765625, "global_step": 35732, "epoch": 850} {"train_loss": -5.5454325675964355, "global_step": 35733, "epoch": 850} {"train_loss": -5.527795791625977, "global_step": 35734, "epoch": 850} {"train_loss": -5.471053123474121, "global_step": 35735, "epoch": 850} {"train_loss": -5.510335922241211, "global_step": 35736, "epoch": 850} {"train_loss": -5.698608875274658, "global_step": 35737, "epoch": 850} {"train_loss": -5.552301406860352, "global_step": 35738, "epoch": 850} {"train_loss": -5.490812301635742, "global_step": 35739, "epoch": 850} {"train_loss": -5.495563983917236, "global_step": 35740, "epoch": 850} {"train_loss": -5.556588785988944, "global_step": 35741, "epoch": 850, "train/sim_max_reward_0": 0.5083053048256557, "train/sim_max_reward_1": 0.15384599351474626, "train/sim_max_reward_2": 0.5544640986667947, "train/sim_max_reward_3": 0.22917386941874637, "train/sim_max_reward_4": 0.5918786729171568, "train/sim_max_reward_5": 0.5070782260021237, "test/sim_max_reward_4500000": 0.751605428978055, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.0, "test/sim_max_reward_4500003": 0.6976488549203673, "test/sim_max_reward_4500004": 0.07614990421765569, "test/sim_max_reward_4500005": 0.25116569458488097, "test/sim_max_reward_4500006": 0.8486161234653461, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.028133082584471822, "test/sim_max_reward_4500009": 0.37102960951769315, "test/sim_max_reward_4500010": 0.598804696988804, "test/sim_max_reward_4500011": 0.4113991874265027, "test/sim_max_reward_4500012": 0.4539965402063578, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.3614286576078815, "test/sim_max_reward_4500015": 0.5015822711845807, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.14083997809362533, "test/sim_max_reward_4500019": 0.6359204999875665, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.42772717171156505, "test/sim_max_reward_4500022": 0.7997912139550089, "test/sim_max_reward_4500023": 0.5950431718373694, "test/sim_max_reward_4500024": 0.11444587603982995, "test/sim_max_reward_4500025": 0.6319906375874106, "test/sim_max_reward_4500026": 0.24619187547604449, "test/sim_max_reward_4500027": 0.732676577031436, "test/sim_max_reward_4500028": 0.19634285331321, "test/sim_max_reward_4500029": 0.07195900700022187, "test/sim_max_reward_4500030": 0.25394869709626444, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.10330686403747735, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.793785099862697, "test/sim_max_reward_4500035": 0.44153585349316904, "test/sim_max_reward_4500036": 0.43696553396472104, "test/sim_max_reward_4500037": 0.1684011327277173, "test/sim_max_reward_4500038": 0.34745031128947645, "test/sim_max_reward_4500039": 0.5871868352332996, "test/sim_max_reward_4500040": 0.21598692467865035, "test/sim_max_reward_4500041": 0.20876905106912136, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.5984824747684254, "test/sim_max_reward_4500044": 0.7427777247496872, "test/sim_max_reward_4500045": 0.6727537749507144, "test/sim_max_reward_4500046": 0.2771711229847297, "test/sim_max_reward_4500047": 0.662177292515498, "test/sim_max_reward_4500048": 0.27521624738763284, "test/sim_max_reward_4500049": 0.9634267024430866, "train/mean_score": 0.42412436089087063, "test/mean_score": 0.3542299568082019, "val_loss": 74281.6484375} {"train_loss": -5.546689987182617, "global_step": 35742, "epoch": 851} {"train_loss": -5.489479064941406, "global_step": 35743, "epoch": 851} {"train_loss": -5.60842227935791, "global_step": 35744, "epoch": 851} {"train_loss": -5.581083297729492, "global_step": 35745, "epoch": 851} {"train_loss": -5.584939002990723, "global_step": 35746, "epoch": 851} {"train_loss": -5.595471382141113, "global_step": 35747, "epoch": 851} {"train_loss": -5.705851078033447, "global_step": 35748, "epoch": 851} {"train_loss": -5.555472373962402, "global_step": 35749, "epoch": 851} {"train_loss": -5.5720062255859375, "global_step": 35750, "epoch": 851} {"train_loss": -5.422837257385254, "global_step": 35751, "epoch": 851} {"train_loss": -5.500434875488281, "global_step": 35752, "epoch": 851} {"train_loss": -5.5686187744140625, "global_step": 35753, "epoch": 851} {"train_loss": -5.648367881774902, "global_step": 35754, "epoch": 851} {"train_loss": -5.5533952713012695, "global_step": 35755, "epoch": 851} {"train_loss": -5.623992443084717, "global_step": 35756, "epoch": 851} {"train_loss": -5.581319332122803, "global_step": 35757, "epoch": 851} {"train_loss": -5.621424674987793, "global_step": 35758, "epoch": 851} {"train_loss": -5.765682220458984, "global_step": 35759, "epoch": 851} {"train_loss": -5.414399147033691, "global_step": 35760, "epoch": 851} {"train_loss": -5.531223297119141, "global_step": 35761, "epoch": 851} {"train_loss": -5.654882431030273, "global_step": 35762, "epoch": 851} {"train_loss": -5.590017318725586, "global_step": 35763, "epoch": 851} {"train_loss": -5.414959907531738, "global_step": 35764, "epoch": 851} {"train_loss": -5.568996906280518, "global_step": 35765, "epoch": 851} {"train_loss": -5.450044631958008, "global_step": 35766, "epoch": 851} {"train_loss": -5.521206855773926, "global_step": 35767, "epoch": 851} {"train_loss": -5.601531505584717, "global_step": 35768, "epoch": 851} {"train_loss": -5.288495063781738, "global_step": 35769, "epoch": 851} {"train_loss": -5.540040493011475, "global_step": 35770, "epoch": 851} {"train_loss": -5.418022632598877, "global_step": 35771, "epoch": 851} {"train_loss": -5.400721549987793, "global_step": 35772, "epoch": 851} {"train_loss": -5.603508949279785, "global_step": 35773, "epoch": 851} {"train_loss": -5.26167106628418, "global_step": 35774, "epoch": 851} {"train_loss": -5.494022369384766, "global_step": 35775, "epoch": 851} {"train_loss": -5.335470199584961, "global_step": 35776, "epoch": 851} {"train_loss": -5.639711856842041, "global_step": 35777, "epoch": 851} {"train_loss": -5.404331207275391, "global_step": 35778, "epoch": 851} {"train_loss": -5.471321105957031, "global_step": 35779, "epoch": 851} {"train_loss": -5.621589183807373, "global_step": 35780, "epoch": 851} {"train_loss": -5.447175979614258, "global_step": 35781, "epoch": 851} {"train_loss": -5.521059036254883, "global_step": 35782, "epoch": 851} {"train_loss": -5.5285210950034, "global_step": 35783, "epoch": 851, "val_loss": 73951.78125} {"train_loss": -5.525331497192383, "global_step": 35784, "epoch": 852} {"train_loss": -5.561774730682373, "global_step": 35785, "epoch": 852} {"train_loss": -5.502175331115723, "global_step": 35786, "epoch": 852} {"train_loss": -5.507488250732422, "global_step": 35787, "epoch": 852} {"train_loss": -5.520801544189453, "global_step": 35788, "epoch": 852} {"train_loss": -5.545989036560059, "global_step": 35789, "epoch": 852} {"train_loss": -5.504847526550293, "global_step": 35790, "epoch": 852} {"train_loss": -5.7129058837890625, "global_step": 35791, "epoch": 852} {"train_loss": -5.599926471710205, "global_step": 35792, "epoch": 852} {"train_loss": -5.650956153869629, "global_step": 35793, "epoch": 852} {"train_loss": -5.507021903991699, "global_step": 35794, "epoch": 852} {"train_loss": -5.56659460067749, "global_step": 35795, "epoch": 852} {"train_loss": -5.477743148803711, "global_step": 35796, "epoch": 852} {"train_loss": -5.628213405609131, "global_step": 35797, "epoch": 852} {"train_loss": -5.57928991317749, "global_step": 35798, "epoch": 852} {"train_loss": -5.642024993896484, "global_step": 35799, "epoch": 852} {"train_loss": -5.571491718292236, "global_step": 35800, "epoch": 852} {"train_loss": -5.567790985107422, "global_step": 35801, "epoch": 852} {"train_loss": -5.665815353393555, "global_step": 35802, "epoch": 852} {"train_loss": -5.649864196777344, "global_step": 35803, "epoch": 852} {"train_loss": -5.557904243469238, "global_step": 35804, "epoch": 852} {"train_loss": -5.539037227630615, "global_step": 35805, "epoch": 852} {"train_loss": -5.6638665199279785, "global_step": 35806, "epoch": 852} {"train_loss": -5.424016952514648, "global_step": 35807, "epoch": 852} {"train_loss": -5.633896827697754, "global_step": 35808, "epoch": 852} {"train_loss": -5.676810264587402, "global_step": 35809, "epoch": 852} {"train_loss": -5.467840194702148, "global_step": 35810, "epoch": 852} {"train_loss": -5.543793678283691, "global_step": 35811, "epoch": 852} {"train_loss": -5.643352031707764, "global_step": 35812, "epoch": 852} {"train_loss": -5.492272853851318, "global_step": 35813, "epoch": 852} {"train_loss": -5.478139877319336, "global_step": 35814, "epoch": 852} {"train_loss": -5.604616641998291, "global_step": 35815, "epoch": 852} {"train_loss": -5.535449981689453, "global_step": 35816, "epoch": 852} {"train_loss": -5.526384353637695, "global_step": 35817, "epoch": 852} {"train_loss": -5.583786964416504, "global_step": 35818, "epoch": 852} {"train_loss": -5.556639671325684, "global_step": 35819, "epoch": 852} {"train_loss": -5.487348556518555, "global_step": 35820, "epoch": 852} {"train_loss": -5.464313507080078, "global_step": 35821, "epoch": 852} {"train_loss": -5.619209289550781, "global_step": 35822, "epoch": 852} {"train_loss": -5.487433433532715, "global_step": 35823, "epoch": 852} {"train_loss": -5.445080757141113, "global_step": 35824, "epoch": 852} {"train_loss": -5.559537615094866, "global_step": 35825, "epoch": 852, "val_loss": 73947.984375} {"train_loss": -5.486800670623779, "global_step": 35826, "epoch": 853} {"train_loss": -5.658909797668457, "global_step": 35827, "epoch": 853} {"train_loss": -5.535957336425781, "global_step": 35828, "epoch": 853} {"train_loss": -5.616143226623535, "global_step": 35829, "epoch": 853} {"train_loss": -5.602510452270508, "global_step": 35830, "epoch": 853} {"train_loss": -5.609965801239014, "global_step": 35831, "epoch": 853} {"train_loss": -5.689124584197998, "global_step": 35832, "epoch": 853} {"train_loss": -5.48664665222168, "global_step": 35833, "epoch": 853} {"train_loss": -5.6116437911987305, "global_step": 35834, "epoch": 853} {"train_loss": -5.582302570343018, "global_step": 35835, "epoch": 853} {"train_loss": -5.645003318786621, "global_step": 35836, "epoch": 853} {"train_loss": -5.518733501434326, "global_step": 35837, "epoch": 853} {"train_loss": -5.496641159057617, "global_step": 35838, "epoch": 853} {"train_loss": -5.4791669845581055, "global_step": 35839, "epoch": 853} {"train_loss": -5.565004348754883, "global_step": 35840, "epoch": 853} {"train_loss": -5.515170097351074, "global_step": 35841, "epoch": 853} {"train_loss": -5.45503044128418, "global_step": 35842, "epoch": 853} {"train_loss": -5.419564723968506, "global_step": 35843, "epoch": 853} {"train_loss": -5.574925899505615, "global_step": 35844, "epoch": 853} {"train_loss": -5.534561634063721, "global_step": 35845, "epoch": 853} {"train_loss": -5.501112461090088, "global_step": 35846, "epoch": 853} {"train_loss": -5.472095489501953, "global_step": 35847, "epoch": 853} {"train_loss": -5.507948875427246, "global_step": 35848, "epoch": 853} {"train_loss": -5.538074970245361, "global_step": 35849, "epoch": 853} {"train_loss": -5.470856189727783, "global_step": 35850, "epoch": 853} {"train_loss": -5.669503688812256, "global_step": 35851, "epoch": 853} {"train_loss": -5.635340213775635, "global_step": 35852, "epoch": 853} {"train_loss": -5.63218355178833, "global_step": 35853, "epoch": 853} {"train_loss": -5.602189064025879, "global_step": 35854, "epoch": 853} {"train_loss": -5.597092628479004, "global_step": 35855, "epoch": 853} {"train_loss": -5.60127067565918, "global_step": 35856, "epoch": 853} {"train_loss": -5.458847522735596, "global_step": 35857, "epoch": 853} {"train_loss": -5.483475208282471, "global_step": 35858, "epoch": 853} {"train_loss": -5.516369819641113, "global_step": 35859, "epoch": 853} {"train_loss": -5.596421241760254, "global_step": 35860, "epoch": 853} {"train_loss": -5.513977527618408, "global_step": 35861, "epoch": 853} {"train_loss": -5.581543445587158, "global_step": 35862, "epoch": 853} {"train_loss": -5.4562530517578125, "global_step": 35863, "epoch": 853} {"train_loss": -5.539180755615234, "global_step": 35864, "epoch": 853} {"train_loss": -5.533102035522461, "global_step": 35865, "epoch": 853} {"train_loss": -5.496534824371338, "global_step": 35866, "epoch": 853} {"train_loss": -5.544093779155186, "global_step": 35867, "epoch": 853, "val_loss": 74500.3203125} {"train_loss": -5.451184272766113, "global_step": 35868, "epoch": 854} {"train_loss": -5.559602737426758, "global_step": 35869, "epoch": 854} {"train_loss": -5.499032974243164, "global_step": 35870, "epoch": 854} {"train_loss": -5.437189102172852, "global_step": 35871, "epoch": 854} {"train_loss": -5.4758195877075195, "global_step": 35872, "epoch": 854} {"train_loss": -5.608883857727051, "global_step": 35873, "epoch": 854} {"train_loss": -5.508553504943848, "global_step": 35874, "epoch": 854} {"train_loss": -5.575972557067871, "global_step": 35875, "epoch": 854} {"train_loss": -5.699638366699219, "global_step": 35876, "epoch": 854} {"train_loss": -5.670713901519775, "global_step": 35877, "epoch": 854} {"train_loss": -5.60193395614624, "global_step": 35878, "epoch": 854} {"train_loss": -5.669407367706299, "global_step": 35879, "epoch": 854} {"train_loss": -5.469376087188721, "global_step": 35880, "epoch": 854} {"train_loss": -5.647479057312012, "global_step": 35881, "epoch": 854} {"train_loss": -5.6797895431518555, "global_step": 35882, "epoch": 854} {"train_loss": -5.629459857940674, "global_step": 35883, "epoch": 854} {"train_loss": -5.667383193969727, "global_step": 35884, "epoch": 854} {"train_loss": -5.500502586364746, "global_step": 35885, "epoch": 854} {"train_loss": -5.625807285308838, "global_step": 35886, "epoch": 854} {"train_loss": -5.740505218505859, "global_step": 35887, "epoch": 854} {"train_loss": -5.598524570465088, "global_step": 35888, "epoch": 854} {"train_loss": -5.678727149963379, "global_step": 35889, "epoch": 854} {"train_loss": -5.51444149017334, "global_step": 35890, "epoch": 854} {"train_loss": -5.534207344055176, "global_step": 35891, "epoch": 854} {"train_loss": -5.62770938873291, "global_step": 35892, "epoch": 854} {"train_loss": -5.507627010345459, "global_step": 35893, "epoch": 854} {"train_loss": -5.63616418838501, "global_step": 35894, "epoch": 854} {"train_loss": -5.518747329711914, "global_step": 35895, "epoch": 854} {"train_loss": -5.533217430114746, "global_step": 35896, "epoch": 854} {"train_loss": -5.612158298492432, "global_step": 35897, "epoch": 854} {"train_loss": -5.694354057312012, "global_step": 35898, "epoch": 854} {"train_loss": -5.718839168548584, "global_step": 35899, "epoch": 854} {"train_loss": -5.494172096252441, "global_step": 35900, "epoch": 854} {"train_loss": -5.627840995788574, "global_step": 35901, "epoch": 854} {"train_loss": -5.509406566619873, "global_step": 35902, "epoch": 854} {"train_loss": -5.634590148925781, "global_step": 35903, "epoch": 854} {"train_loss": -5.496027946472168, "global_step": 35904, "epoch": 854} {"train_loss": -5.511305809020996, "global_step": 35905, "epoch": 854} {"train_loss": -5.493869781494141, "global_step": 35906, "epoch": 854} {"train_loss": -5.382996559143066, "global_step": 35907, "epoch": 854} {"train_loss": -5.565107345581055, "global_step": 35908, "epoch": 854} {"train_loss": -5.572054022834415, "global_step": 35909, "epoch": 854, "val_loss": 74520.984375} {"train_loss": -5.350727558135986, "global_step": 35910, "epoch": 855} {"train_loss": -5.698216438293457, "global_step": 35911, "epoch": 855} {"train_loss": -5.508169174194336, "global_step": 35912, "epoch": 855} {"train_loss": -5.481497764587402, "global_step": 35913, "epoch": 855} {"train_loss": -5.599169731140137, "global_step": 35914, "epoch": 855} {"train_loss": -5.643471717834473, "global_step": 35915, "epoch": 855} {"train_loss": -5.6426215171813965, "global_step": 35916, "epoch": 855} {"train_loss": -5.519957542419434, "global_step": 35917, "epoch": 855} {"train_loss": -5.6151227951049805, "global_step": 35918, "epoch": 855} {"train_loss": -5.564964294433594, "global_step": 35919, "epoch": 855} {"train_loss": -5.552587509155273, "global_step": 35920, "epoch": 855} {"train_loss": -5.592536449432373, "global_step": 35921, "epoch": 855} {"train_loss": -5.567019462585449, "global_step": 35922, "epoch": 855} {"train_loss": -5.571652412414551, "global_step": 35923, "epoch": 855} {"train_loss": -5.635738372802734, "global_step": 35924, "epoch": 855} {"train_loss": -5.451634883880615, "global_step": 35925, "epoch": 855} {"train_loss": -5.544910430908203, "global_step": 35926, "epoch": 855} {"train_loss": -5.600399017333984, "global_step": 35927, "epoch": 855} {"train_loss": -5.545969009399414, "global_step": 35928, "epoch": 855} {"train_loss": -5.507846832275391, "global_step": 35929, "epoch": 855} {"train_loss": -5.580334186553955, "global_step": 35930, "epoch": 855} {"train_loss": -5.563798427581787, "global_step": 35931, "epoch": 855} {"train_loss": -5.522994518280029, "global_step": 35932, "epoch": 855} {"train_loss": -5.603954792022705, "global_step": 35933, "epoch": 855} {"train_loss": -5.516750335693359, "global_step": 35934, "epoch": 855} {"train_loss": -5.535257816314697, "global_step": 35935, "epoch": 855} {"train_loss": -5.473888874053955, "global_step": 35936, "epoch": 855} {"train_loss": -5.529804229736328, "global_step": 35937, "epoch": 855} {"train_loss": -5.489495277404785, "global_step": 35938, "epoch": 855} {"train_loss": -5.606680393218994, "global_step": 35939, "epoch": 855} {"train_loss": -5.472657203674316, "global_step": 35940, "epoch": 855} {"train_loss": -5.550537109375, "global_step": 35941, "epoch": 855} {"train_loss": -5.576866149902344, "global_step": 35942, "epoch": 855} {"train_loss": -5.601301193237305, "global_step": 35943, "epoch": 855} {"train_loss": -5.674008369445801, "global_step": 35944, "epoch": 855} {"train_loss": -5.63018798828125, "global_step": 35945, "epoch": 855} {"train_loss": -5.5856428146362305, "global_step": 35946, "epoch": 855} {"train_loss": -5.668983459472656, "global_step": 35947, "epoch": 855} {"train_loss": -5.545223236083984, "global_step": 35948, "epoch": 855} {"train_loss": -5.69254207611084, "global_step": 35949, "epoch": 855} {"train_loss": -5.512785911560059, "global_step": 35950, "epoch": 855} {"train_loss": -5.564584516343617, "global_step": 35951, "epoch": 855, "val_loss": 74194.8203125} {"train_loss": -5.5285491943359375, "global_step": 35952, "epoch": 856} {"train_loss": -5.585514068603516, "global_step": 35953, "epoch": 856} {"train_loss": -5.65153694152832, "global_step": 35954, "epoch": 856} {"train_loss": -5.586459159851074, "global_step": 35955, "epoch": 856} {"train_loss": -5.644174575805664, "global_step": 35956, "epoch": 856} {"train_loss": -5.592895030975342, "global_step": 35957, "epoch": 856} {"train_loss": -5.5743560791015625, "global_step": 35958, "epoch": 856} {"train_loss": -5.5121307373046875, "global_step": 35959, "epoch": 856} {"train_loss": -5.64467716217041, "global_step": 35960, "epoch": 856} {"train_loss": -5.472416400909424, "global_step": 35961, "epoch": 856} {"train_loss": -5.63378381729126, "global_step": 35962, "epoch": 856} {"train_loss": -5.579207420349121, "global_step": 35963, "epoch": 856} {"train_loss": -5.507777214050293, "global_step": 35964, "epoch": 856} {"train_loss": -5.732900619506836, "global_step": 35965, "epoch": 856} {"train_loss": -5.378173828125, "global_step": 35966, "epoch": 856} {"train_loss": -5.538800239562988, "global_step": 35967, "epoch": 856} {"train_loss": -5.592578887939453, "global_step": 35968, "epoch": 856} {"train_loss": -5.348758220672607, "global_step": 35969, "epoch": 856} {"train_loss": -5.3808369636535645, "global_step": 35970, "epoch": 856} {"train_loss": -5.6205220222473145, "global_step": 35971, "epoch": 856} {"train_loss": -5.425073623657227, "global_step": 35972, "epoch": 856} {"train_loss": -5.498623847961426, "global_step": 35973, "epoch": 856} {"train_loss": -5.50706148147583, "global_step": 35974, "epoch": 856} {"train_loss": -5.563340187072754, "global_step": 35975, "epoch": 856} {"train_loss": -5.440183639526367, "global_step": 35976, "epoch": 856} {"train_loss": -5.479511260986328, "global_step": 35977, "epoch": 856} {"train_loss": -5.519720077514648, "global_step": 35978, "epoch": 856} {"train_loss": -5.523594856262207, "global_step": 35979, "epoch": 856} {"train_loss": -5.501870155334473, "global_step": 35980, "epoch": 856} {"train_loss": -5.56502103805542, "global_step": 35981, "epoch": 856} {"train_loss": -5.542994022369385, "global_step": 35982, "epoch": 856} {"train_loss": -5.551224708557129, "global_step": 35983, "epoch": 856} {"train_loss": -5.532034873962402, "global_step": 35984, "epoch": 856} {"train_loss": -5.594660758972168, "global_step": 35985, "epoch": 856} {"train_loss": -5.518421173095703, "global_step": 35986, "epoch": 856} {"train_loss": -5.506789207458496, "global_step": 35987, "epoch": 856} {"train_loss": -5.52954626083374, "global_step": 35988, "epoch": 856} {"train_loss": -5.544000148773193, "global_step": 35989, "epoch": 856} {"train_loss": -5.460955619812012, "global_step": 35990, "epoch": 856} {"train_loss": -5.754820346832275, "global_step": 35991, "epoch": 856} {"train_loss": -5.589011192321777, "global_step": 35992, "epoch": 856} {"train_loss": -5.545042446681431, "global_step": 35993, "epoch": 856, "val_loss": 73665.6484375} {"train_loss": -5.523248672485352, "global_step": 35994, "epoch": 857} {"train_loss": -5.531329154968262, "global_step": 35995, "epoch": 857} {"train_loss": -5.53000020980835, "global_step": 35996, "epoch": 857} {"train_loss": -5.603447914123535, "global_step": 35997, "epoch": 857} {"train_loss": -5.693202972412109, "global_step": 35998, "epoch": 857} {"train_loss": -5.577950477600098, "global_step": 35999, "epoch": 857} {"train_loss": -5.501011848449707, "global_step": 36000, "epoch": 857} {"train_loss": -5.59773063659668, "global_step": 36001, "epoch": 857} {"train_loss": -5.721374988555908, "global_step": 36002, "epoch": 857} {"train_loss": -5.630979061126709, "global_step": 36003, "epoch": 857} {"train_loss": -5.609275817871094, "global_step": 36004, "epoch": 857} {"train_loss": -5.559157371520996, "global_step": 36005, "epoch": 857} {"train_loss": -5.4794769287109375, "global_step": 36006, "epoch": 857} {"train_loss": -5.537177085876465, "global_step": 36007, "epoch": 857} {"train_loss": -5.633138179779053, "global_step": 36008, "epoch": 857} {"train_loss": -5.703124046325684, "global_step": 36009, "epoch": 857} {"train_loss": -5.549751281738281, "global_step": 36010, "epoch": 857} {"train_loss": -5.551009178161621, "global_step": 36011, "epoch": 857} {"train_loss": -5.487060070037842, "global_step": 36012, "epoch": 857} {"train_loss": -5.456281661987305, "global_step": 36013, "epoch": 857} {"train_loss": -5.564525604248047, "global_step": 36014, "epoch": 857} {"train_loss": -5.577796936035156, "global_step": 36015, "epoch": 857} {"train_loss": -5.646305561065674, "global_step": 36016, "epoch": 857} {"train_loss": -5.630608081817627, "global_step": 36017, "epoch": 857} {"train_loss": -5.559878349304199, "global_step": 36018, "epoch": 857} {"train_loss": -5.661683559417725, "global_step": 36019, "epoch": 857} {"train_loss": -5.6230998039245605, "global_step": 36020, "epoch": 857} {"train_loss": -5.5701704025268555, "global_step": 36021, "epoch": 857} {"train_loss": -5.638893127441406, "global_step": 36022, "epoch": 857} {"train_loss": -5.577854156494141, "global_step": 36023, "epoch": 857} {"train_loss": -5.544367790222168, "global_step": 36024, "epoch": 857} {"train_loss": -5.540343761444092, "global_step": 36025, "epoch": 857} {"train_loss": -5.580416202545166, "global_step": 36026, "epoch": 857} {"train_loss": -5.56572151184082, "global_step": 36027, "epoch": 857} {"train_loss": -5.648471832275391, "global_step": 36028, "epoch": 857} {"train_loss": -5.676571846008301, "global_step": 36029, "epoch": 857} {"train_loss": -5.556674003601074, "global_step": 36030, "epoch": 857} {"train_loss": -5.639872074127197, "global_step": 36031, "epoch": 857} {"train_loss": -5.575422286987305, "global_step": 36032, "epoch": 857} {"train_loss": -5.744812965393066, "global_step": 36033, "epoch": 857} {"train_loss": -5.490171909332275, "global_step": 36034, "epoch": 857} {"train_loss": -5.585572844459897, "global_step": 36035, "epoch": 857, "val_loss": 73564.640625} {"train_loss": -5.585309982299805, "global_step": 36036, "epoch": 858} {"train_loss": -5.651898384094238, "global_step": 36037, "epoch": 858} {"train_loss": -5.52574348449707, "global_step": 36038, "epoch": 858} {"train_loss": -5.647488117218018, "global_step": 36039, "epoch": 858} {"train_loss": -5.561544418334961, "global_step": 36040, "epoch": 858} {"train_loss": -5.5819501876831055, "global_step": 36041, "epoch": 858} {"train_loss": -5.523187637329102, "global_step": 36042, "epoch": 858} {"train_loss": -5.549202919006348, "global_step": 36043, "epoch": 858} {"train_loss": -5.528791427612305, "global_step": 36044, "epoch": 858} {"train_loss": -5.61983585357666, "global_step": 36045, "epoch": 858} {"train_loss": -5.4608564376831055, "global_step": 36046, "epoch": 858} {"train_loss": -5.4998931884765625, "global_step": 36047, "epoch": 858} {"train_loss": -5.646665573120117, "global_step": 36048, "epoch": 858} {"train_loss": -5.457603454589844, "global_step": 36049, "epoch": 858} {"train_loss": -5.560829162597656, "global_step": 36050, "epoch": 858} {"train_loss": -5.436022758483887, "global_step": 36051, "epoch": 858} {"train_loss": -5.5815534591674805, "global_step": 36052, "epoch": 858} {"train_loss": -5.680083274841309, "global_step": 36053, "epoch": 858} {"train_loss": -5.511229515075684, "global_step": 36054, "epoch": 858} {"train_loss": -5.496982574462891, "global_step": 36055, "epoch": 858} {"train_loss": -5.468480110168457, "global_step": 36056, "epoch": 858} {"train_loss": -5.5273261070251465, "global_step": 36057, "epoch": 858} {"train_loss": -5.602022171020508, "global_step": 36058, "epoch": 858} {"train_loss": -5.506646156311035, "global_step": 36059, "epoch": 858} {"train_loss": -5.490688323974609, "global_step": 36060, "epoch": 858} {"train_loss": -5.588801383972168, "global_step": 36061, "epoch": 858} {"train_loss": -5.599798202514648, "global_step": 36062, "epoch": 858} {"train_loss": -5.563007354736328, "global_step": 36063, "epoch": 858} {"train_loss": -5.614102363586426, "global_step": 36064, "epoch": 858} {"train_loss": -5.525053024291992, "global_step": 36065, "epoch": 858} {"train_loss": -5.4982194900512695, "global_step": 36066, "epoch": 858} {"train_loss": -5.568185806274414, "global_step": 36067, "epoch": 858} {"train_loss": -5.475907325744629, "global_step": 36068, "epoch": 858} {"train_loss": -5.473406791687012, "global_step": 36069, "epoch": 858} {"train_loss": -5.599813938140869, "global_step": 36070, "epoch": 858} {"train_loss": -5.521399021148682, "global_step": 36071, "epoch": 858} {"train_loss": -5.589529037475586, "global_step": 36072, "epoch": 858} {"train_loss": -5.555855751037598, "global_step": 36073, "epoch": 858} {"train_loss": -5.533846855163574, "global_step": 36074, "epoch": 858} {"train_loss": -5.5073466300964355, "global_step": 36075, "epoch": 858} {"train_loss": -5.487756729125977, "global_step": 36076, "epoch": 858} {"train_loss": -5.543640034539359, "global_step": 36077, "epoch": 858, "val_loss": 74069.921875} {"train_loss": -5.584000587463379, "global_step": 36078, "epoch": 859} {"train_loss": -5.596076011657715, "global_step": 36079, "epoch": 859} {"train_loss": -5.626808166503906, "global_step": 36080, "epoch": 859} {"train_loss": -5.553035736083984, "global_step": 36081, "epoch": 859} {"train_loss": -5.551119804382324, "global_step": 36082, "epoch": 859} {"train_loss": -5.447827339172363, "global_step": 36083, "epoch": 859} {"train_loss": -5.535921096801758, "global_step": 36084, "epoch": 859} {"train_loss": -5.4240617752075195, "global_step": 36085, "epoch": 859} {"train_loss": -5.6356425285339355, "global_step": 36086, "epoch": 859} {"train_loss": -5.582538604736328, "global_step": 36087, "epoch": 859} {"train_loss": -5.451311111450195, "global_step": 36088, "epoch": 859} {"train_loss": -5.451496124267578, "global_step": 36089, "epoch": 859} {"train_loss": -5.515759468078613, "global_step": 36090, "epoch": 859} {"train_loss": -5.585250377655029, "global_step": 36091, "epoch": 859} {"train_loss": -5.624673843383789, "global_step": 36092, "epoch": 859} {"train_loss": -5.651535987854004, "global_step": 36093, "epoch": 859} {"train_loss": -5.50723934173584, "global_step": 36094, "epoch": 859} {"train_loss": -5.574413776397705, "global_step": 36095, "epoch": 859} {"train_loss": -5.468273639678955, "global_step": 36096, "epoch": 859} {"train_loss": -5.484915256500244, "global_step": 36097, "epoch": 859} {"train_loss": -5.488913536071777, "global_step": 36098, "epoch": 859} {"train_loss": -5.519609451293945, "global_step": 36099, "epoch": 859} {"train_loss": -5.490904331207275, "global_step": 36100, "epoch": 859} {"train_loss": -5.546063423156738, "global_step": 36101, "epoch": 859} {"train_loss": -5.4984846115112305, "global_step": 36102, "epoch": 859} {"train_loss": -5.583070755004883, "global_step": 36103, "epoch": 859} {"train_loss": -5.533519268035889, "global_step": 36104, "epoch": 859} {"train_loss": -5.646544456481934, "global_step": 36105, "epoch": 859} {"train_loss": -5.560870170593262, "global_step": 36106, "epoch": 859} {"train_loss": -5.554973602294922, "global_step": 36107, "epoch": 859} {"train_loss": -5.634547233581543, "global_step": 36108, "epoch": 859} {"train_loss": -5.529693603515625, "global_step": 36109, "epoch": 859} {"train_loss": -5.472574710845947, "global_step": 36110, "epoch": 859} {"train_loss": -5.495128631591797, "global_step": 36111, "epoch": 859} {"train_loss": -5.576244354248047, "global_step": 36112, "epoch": 859} {"train_loss": -5.400437831878662, "global_step": 36113, "epoch": 859} {"train_loss": -5.668882369995117, "global_step": 36114, "epoch": 859} {"train_loss": -5.499899864196777, "global_step": 36115, "epoch": 859} {"train_loss": -5.682757377624512, "global_step": 36116, "epoch": 859} {"train_loss": -5.500382423400879, "global_step": 36117, "epoch": 859} {"train_loss": -5.558751583099365, "global_step": 36118, "epoch": 859} {"train_loss": -5.54660025097075, "global_step": 36119, "epoch": 859, "val_loss": 74415.984375} {"train_loss": -5.605783462524414, "global_step": 36120, "epoch": 860} {"train_loss": -5.602843284606934, "global_step": 36121, "epoch": 860} {"train_loss": -5.494966983795166, "global_step": 36122, "epoch": 860} {"train_loss": -5.634817123413086, "global_step": 36123, "epoch": 860} {"train_loss": -5.523272514343262, "global_step": 36124, "epoch": 860} {"train_loss": -5.447556495666504, "global_step": 36125, "epoch": 860} {"train_loss": -5.477107048034668, "global_step": 36126, "epoch": 860} {"train_loss": -5.602545738220215, "global_step": 36127, "epoch": 860} {"train_loss": -5.559548377990723, "global_step": 36128, "epoch": 860} {"train_loss": -5.581404685974121, "global_step": 36129, "epoch": 860} {"train_loss": -5.593332290649414, "global_step": 36130, "epoch": 860} {"train_loss": -5.524317741394043, "global_step": 36131, "epoch": 860} {"train_loss": -5.582633018493652, "global_step": 36132, "epoch": 860} {"train_loss": -5.615372657775879, "global_step": 36133, "epoch": 860} {"train_loss": -5.621096134185791, "global_step": 36134, "epoch": 860} {"train_loss": -5.646724700927734, "global_step": 36135, "epoch": 860} {"train_loss": -5.489955902099609, "global_step": 36136, "epoch": 860} {"train_loss": -5.61323881149292, "global_step": 36137, "epoch": 860} {"train_loss": -5.4251484870910645, "global_step": 36138, "epoch": 860} {"train_loss": -5.4820780754089355, "global_step": 36139, "epoch": 860} {"train_loss": -5.602367877960205, "global_step": 36140, "epoch": 860} {"train_loss": -5.410107135772705, "global_step": 36141, "epoch": 860} {"train_loss": -5.631551265716553, "global_step": 36142, "epoch": 860} {"train_loss": -5.695137977600098, "global_step": 36143, "epoch": 860} {"train_loss": -5.622724533081055, "global_step": 36144, "epoch": 860} {"train_loss": -5.496494293212891, "global_step": 36145, "epoch": 860} {"train_loss": -5.634853839874268, "global_step": 36146, "epoch": 860} {"train_loss": -5.619714736938477, "global_step": 36147, "epoch": 860} {"train_loss": -5.625948905944824, "global_step": 36148, "epoch": 860} {"train_loss": -5.608870983123779, "global_step": 36149, "epoch": 860} {"train_loss": -5.541013717651367, "global_step": 36150, "epoch": 860} {"train_loss": -5.5135416984558105, "global_step": 36151, "epoch": 860} {"train_loss": -5.642204284667969, "global_step": 36152, "epoch": 860} {"train_loss": -5.625682830810547, "global_step": 36153, "epoch": 860} {"train_loss": -5.5752129554748535, "global_step": 36154, "epoch": 860} {"train_loss": -5.534078598022461, "global_step": 36155, "epoch": 860} {"train_loss": -5.519830703735352, "global_step": 36156, "epoch": 860} {"train_loss": -5.535556793212891, "global_step": 36157, "epoch": 860} {"train_loss": -5.649737358093262, "global_step": 36158, "epoch": 860} {"train_loss": -5.586136341094971, "global_step": 36159, "epoch": 860} {"train_loss": -5.448493003845215, "global_step": 36160, "epoch": 860} {"train_loss": -5.568100282124111, "global_step": 36161, "epoch": 860, "val_loss": 73863.734375} {"train_loss": -5.6184515953063965, "global_step": 36162, "epoch": 861} {"train_loss": -5.518312931060791, "global_step": 36163, "epoch": 861} {"train_loss": -5.588740348815918, "global_step": 36164, "epoch": 861} {"train_loss": -5.546639442443848, "global_step": 36165, "epoch": 861} {"train_loss": -5.540838241577148, "global_step": 36166, "epoch": 861} {"train_loss": -5.638049602508545, "global_step": 36167, "epoch": 861} {"train_loss": -5.6609344482421875, "global_step": 36168, "epoch": 861} {"train_loss": -5.55330753326416, "global_step": 36169, "epoch": 861} {"train_loss": -5.627859115600586, "global_step": 36170, "epoch": 861} {"train_loss": -5.535862445831299, "global_step": 36171, "epoch": 861} {"train_loss": -5.525437355041504, "global_step": 36172, "epoch": 861} {"train_loss": -5.627934455871582, "global_step": 36173, "epoch": 861} {"train_loss": -5.652674674987793, "global_step": 36174, "epoch": 861} {"train_loss": -5.426760673522949, "global_step": 36175, "epoch": 861} {"train_loss": -5.6884541511535645, "global_step": 36176, "epoch": 861} {"train_loss": -5.554399490356445, "global_step": 36177, "epoch": 861} {"train_loss": -5.5253520011901855, "global_step": 36178, "epoch": 861} {"train_loss": -5.55492639541626, "global_step": 36179, "epoch": 861} {"train_loss": -5.595317840576172, "global_step": 36180, "epoch": 861} {"train_loss": -5.460761547088623, "global_step": 36181, "epoch": 861} {"train_loss": -5.533984661102295, "global_step": 36182, "epoch": 861} {"train_loss": -5.581225395202637, "global_step": 36183, "epoch": 861} {"train_loss": -5.530768394470215, "global_step": 36184, "epoch": 861} {"train_loss": -5.545217514038086, "global_step": 36185, "epoch": 861} {"train_loss": -5.643238067626953, "global_step": 36186, "epoch": 861} {"train_loss": -5.533209800720215, "global_step": 36187, "epoch": 861} {"train_loss": -5.642096519470215, "global_step": 36188, "epoch": 861} {"train_loss": -5.504418849945068, "global_step": 36189, "epoch": 861} {"train_loss": -5.465322494506836, "global_step": 36190, "epoch": 861} {"train_loss": -5.5173234939575195, "global_step": 36191, "epoch": 861} {"train_loss": -5.410409927368164, "global_step": 36192, "epoch": 861} {"train_loss": -5.540339946746826, "global_step": 36193, "epoch": 861} {"train_loss": -5.599510192871094, "global_step": 36194, "epoch": 861} {"train_loss": -5.684634208679199, "global_step": 36195, "epoch": 861} {"train_loss": -5.625756740570068, "global_step": 36196, "epoch": 861} {"train_loss": -5.581266403198242, "global_step": 36197, "epoch": 861} {"train_loss": -5.601767063140869, "global_step": 36198, "epoch": 861} {"train_loss": -5.478303909301758, "global_step": 36199, "epoch": 861} {"train_loss": -5.570671081542969, "global_step": 36200, "epoch": 861} {"train_loss": -5.561300277709961, "global_step": 36201, "epoch": 861} {"train_loss": -5.63458251953125, "global_step": 36202, "epoch": 861} {"train_loss": -5.568277915318807, "global_step": 36203, "epoch": 861, "val_loss": 74323.609375} {"train_loss": -5.644534111022949, "global_step": 36204, "epoch": 862} {"train_loss": -5.54074239730835, "global_step": 36205, "epoch": 862} {"train_loss": -5.573974132537842, "global_step": 36206, "epoch": 862} {"train_loss": -5.645768165588379, "global_step": 36207, "epoch": 862} {"train_loss": -5.561720848083496, "global_step": 36208, "epoch": 862} {"train_loss": -5.631233215332031, "global_step": 36209, "epoch": 862} {"train_loss": -5.605546474456787, "global_step": 36210, "epoch": 862} {"train_loss": -5.512998580932617, "global_step": 36211, "epoch": 862} {"train_loss": -5.646688461303711, "global_step": 36212, "epoch": 862} {"train_loss": -5.562814712524414, "global_step": 36213, "epoch": 862} {"train_loss": -5.671631336212158, "global_step": 36214, "epoch": 862} {"train_loss": -5.5760979652404785, "global_step": 36215, "epoch": 862} {"train_loss": -5.4635186195373535, "global_step": 36216, "epoch": 862} {"train_loss": -5.612786769866943, "global_step": 36217, "epoch": 862} {"train_loss": -5.549420356750488, "global_step": 36218, "epoch": 862} {"train_loss": -5.402807712554932, "global_step": 36219, "epoch": 862} {"train_loss": -5.5632195472717285, "global_step": 36220, "epoch": 862} {"train_loss": -5.558671951293945, "global_step": 36221, "epoch": 862} {"train_loss": -5.453248023986816, "global_step": 36222, "epoch": 862} {"train_loss": -5.590690612792969, "global_step": 36223, "epoch": 862} {"train_loss": -5.641763687133789, "global_step": 36224, "epoch": 862} {"train_loss": -5.572347640991211, "global_step": 36225, "epoch": 862} {"train_loss": -5.6600775718688965, "global_step": 36226, "epoch": 862} {"train_loss": -5.603009223937988, "global_step": 36227, "epoch": 862} {"train_loss": -5.563292503356934, "global_step": 36228, "epoch": 862} {"train_loss": -5.6274027824401855, "global_step": 36229, "epoch": 862} {"train_loss": -5.476879596710205, "global_step": 36230, "epoch": 862} {"train_loss": -5.581406593322754, "global_step": 36231, "epoch": 862} {"train_loss": -5.6236891746521, "global_step": 36232, "epoch": 862} {"train_loss": -5.596564292907715, "global_step": 36233, "epoch": 862} {"train_loss": -5.620009422302246, "global_step": 36234, "epoch": 862} {"train_loss": -5.590061664581299, "global_step": 36235, "epoch": 862} {"train_loss": -5.598576068878174, "global_step": 36236, "epoch": 862} {"train_loss": -5.49516487121582, "global_step": 36237, "epoch": 862} {"train_loss": -5.450844764709473, "global_step": 36238, "epoch": 862} {"train_loss": -5.486629486083984, "global_step": 36239, "epoch": 862} {"train_loss": -5.525997638702393, "global_step": 36240, "epoch": 862} {"train_loss": -5.562221527099609, "global_step": 36241, "epoch": 862} {"train_loss": -5.68294620513916, "global_step": 36242, "epoch": 862} {"train_loss": -5.629715919494629, "global_step": 36243, "epoch": 862} {"train_loss": -5.520618438720703, "global_step": 36244, "epoch": 862} {"train_loss": -5.570313033603487, "global_step": 36245, "epoch": 862, "val_loss": 74498.671875} {"train_loss": -5.477224349975586, "global_step": 36246, "epoch": 863} {"train_loss": -5.4449052810668945, "global_step": 36247, "epoch": 863} {"train_loss": -5.5568671226501465, "global_step": 36248, "epoch": 863} {"train_loss": -5.350582599639893, "global_step": 36249, "epoch": 863} {"train_loss": -5.623514652252197, "global_step": 36250, "epoch": 863} {"train_loss": -5.39630126953125, "global_step": 36251, "epoch": 863} {"train_loss": -5.550914764404297, "global_step": 36252, "epoch": 863} {"train_loss": -5.602007865905762, "global_step": 36253, "epoch": 863} {"train_loss": -5.5619120597839355, "global_step": 36254, "epoch": 863} {"train_loss": -5.54230260848999, "global_step": 36255, "epoch": 863} {"train_loss": -5.561453342437744, "global_step": 36256, "epoch": 863} {"train_loss": -5.635977745056152, "global_step": 36257, "epoch": 863} {"train_loss": -5.551244258880615, "global_step": 36258, "epoch": 863} {"train_loss": -5.611870765686035, "global_step": 36259, "epoch": 863} {"train_loss": -5.622005939483643, "global_step": 36260, "epoch": 863} {"train_loss": -5.519371509552002, "global_step": 36261, "epoch": 863} {"train_loss": -5.4676666259765625, "global_step": 36262, "epoch": 863} {"train_loss": -5.585603713989258, "global_step": 36263, "epoch": 863} {"train_loss": -5.646939277648926, "global_step": 36264, "epoch": 863} {"train_loss": -5.50958251953125, "global_step": 36265, "epoch": 863} {"train_loss": -5.560236930847168, "global_step": 36266, "epoch": 863} {"train_loss": -5.533221244812012, "global_step": 36267, "epoch": 863} {"train_loss": -5.539203643798828, "global_step": 36268, "epoch": 863} {"train_loss": -5.474424839019775, "global_step": 36269, "epoch": 863} {"train_loss": -5.543087959289551, "global_step": 36270, "epoch": 863} {"train_loss": -5.591678619384766, "global_step": 36271, "epoch": 863} {"train_loss": -5.522850513458252, "global_step": 36272, "epoch": 863} {"train_loss": -5.573174953460693, "global_step": 36273, "epoch": 863} {"train_loss": -5.60045051574707, "global_step": 36274, "epoch": 863} {"train_loss": -5.560272216796875, "global_step": 36275, "epoch": 863} {"train_loss": -5.551667213439941, "global_step": 36276, "epoch": 863} {"train_loss": -5.567507743835449, "global_step": 36277, "epoch": 863} {"train_loss": -5.534414291381836, "global_step": 36278, "epoch": 863} {"train_loss": -5.544799327850342, "global_step": 36279, "epoch": 863} {"train_loss": -5.574343204498291, "global_step": 36280, "epoch": 863} {"train_loss": -5.571516036987305, "global_step": 36281, "epoch": 863} {"train_loss": -5.6106977462768555, "global_step": 36282, "epoch": 863} {"train_loss": -5.578113555908203, "global_step": 36283, "epoch": 863} {"train_loss": -5.587428569793701, "global_step": 36284, "epoch": 863} {"train_loss": -5.624270439147949, "global_step": 36285, "epoch": 863} {"train_loss": -5.6216864585876465, "global_step": 36286, "epoch": 863} {"train_loss": -5.555789913449969, "global_step": 36287, "epoch": 863, "val_loss": 73920.8359375} {"train_loss": -5.516602039337158, "global_step": 36288, "epoch": 864} {"train_loss": -5.633354187011719, "global_step": 36289, "epoch": 864} {"train_loss": -5.587686538696289, "global_step": 36290, "epoch": 864} {"train_loss": -5.501590728759766, "global_step": 36291, "epoch": 864} {"train_loss": -5.585324287414551, "global_step": 36292, "epoch": 864} {"train_loss": -5.640713691711426, "global_step": 36293, "epoch": 864} {"train_loss": -5.60549259185791, "global_step": 36294, "epoch": 864} {"train_loss": -5.501076698303223, "global_step": 36295, "epoch": 864} {"train_loss": -5.632440567016602, "global_step": 36296, "epoch": 864} {"train_loss": -5.580899715423584, "global_step": 36297, "epoch": 864} {"train_loss": -5.587889671325684, "global_step": 36298, "epoch": 864} {"train_loss": -5.616519451141357, "global_step": 36299, "epoch": 864} {"train_loss": -5.563251972198486, "global_step": 36300, "epoch": 864} {"train_loss": -5.566682815551758, "global_step": 36301, "epoch": 864} {"train_loss": -5.697481155395508, "global_step": 36302, "epoch": 864} {"train_loss": -5.6951470375061035, "global_step": 36303, "epoch": 864} {"train_loss": -5.601327896118164, "global_step": 36304, "epoch": 864} {"train_loss": -5.644961357116699, "global_step": 36305, "epoch": 864} {"train_loss": -5.537042617797852, "global_step": 36306, "epoch": 864} {"train_loss": -5.657148361206055, "global_step": 36307, "epoch": 864} {"train_loss": -5.5938920974731445, "global_step": 36308, "epoch": 864} {"train_loss": -5.499749183654785, "global_step": 36309, "epoch": 864} {"train_loss": -5.55552864074707, "global_step": 36310, "epoch": 864} {"train_loss": -5.58427619934082, "global_step": 36311, "epoch": 864} {"train_loss": -5.562283039093018, "global_step": 36312, "epoch": 864} {"train_loss": -5.434150218963623, "global_step": 36313, "epoch": 864} {"train_loss": -5.491769313812256, "global_step": 36314, "epoch": 864} {"train_loss": -5.633122444152832, "global_step": 36315, "epoch": 864} {"train_loss": -5.468894004821777, "global_step": 36316, "epoch": 864} {"train_loss": -5.489284992218018, "global_step": 36317, "epoch": 864} {"train_loss": -5.523100852966309, "global_step": 36318, "epoch": 864} {"train_loss": -5.497578144073486, "global_step": 36319, "epoch": 864} {"train_loss": -5.570884704589844, "global_step": 36320, "epoch": 864} {"train_loss": -5.642151832580566, "global_step": 36321, "epoch": 864} {"train_loss": -5.553204536437988, "global_step": 36322, "epoch": 864} {"train_loss": -5.603911399841309, "global_step": 36323, "epoch": 864} {"train_loss": -5.6427693367004395, "global_step": 36324, "epoch": 864} {"train_loss": -5.471796035766602, "global_step": 36325, "epoch": 864} {"train_loss": -5.558229923248291, "global_step": 36326, "epoch": 864} {"train_loss": -5.533308029174805, "global_step": 36327, "epoch": 864} {"train_loss": -5.541469097137451, "global_step": 36328, "epoch": 864} {"train_loss": -5.5696597666967484, "global_step": 36329, "epoch": 864, "val_loss": 73807.7109375} {"train_loss": -5.591146469116211, "global_step": 36330, "epoch": 865} {"train_loss": -5.597479820251465, "global_step": 36331, "epoch": 865} {"train_loss": -5.599349021911621, "global_step": 36332, "epoch": 865} {"train_loss": -5.5842204093933105, "global_step": 36333, "epoch": 865} {"train_loss": -5.53606653213501, "global_step": 36334, "epoch": 865} {"train_loss": -5.722668647766113, "global_step": 36335, "epoch": 865} {"train_loss": -5.636898994445801, "global_step": 36336, "epoch": 865} {"train_loss": -5.584980487823486, "global_step": 36337, "epoch": 865} {"train_loss": -5.640355110168457, "global_step": 36338, "epoch": 865} {"train_loss": -5.5611467361450195, "global_step": 36339, "epoch": 865} {"train_loss": -5.585313320159912, "global_step": 36340, "epoch": 865} {"train_loss": -5.594803810119629, "global_step": 36341, "epoch": 865} {"train_loss": -5.5963263511657715, "global_step": 36342, "epoch": 865} {"train_loss": -5.6151604652404785, "global_step": 36343, "epoch": 865} {"train_loss": -5.634360313415527, "global_step": 36344, "epoch": 865} {"train_loss": -5.556832313537598, "global_step": 36345, "epoch": 865} {"train_loss": -5.703477382659912, "global_step": 36346, "epoch": 865} {"train_loss": -5.60902738571167, "global_step": 36347, "epoch": 865} {"train_loss": -5.618231773376465, "global_step": 36348, "epoch": 865} {"train_loss": -5.5509233474731445, "global_step": 36349, "epoch": 865} {"train_loss": -5.641498565673828, "global_step": 36350, "epoch": 865} {"train_loss": -5.624806880950928, "global_step": 36351, "epoch": 865} {"train_loss": -5.563618183135986, "global_step": 36352, "epoch": 865} {"train_loss": -5.497620582580566, "global_step": 36353, "epoch": 865} {"train_loss": -5.556510925292969, "global_step": 36354, "epoch": 865} {"train_loss": -5.523991584777832, "global_step": 36355, "epoch": 865} {"train_loss": -5.589151382446289, "global_step": 36356, "epoch": 865} {"train_loss": -5.66370964050293, "global_step": 36357, "epoch": 865} {"train_loss": -5.667257785797119, "global_step": 36358, "epoch": 865} {"train_loss": -5.544712066650391, "global_step": 36359, "epoch": 865} {"train_loss": -5.5106201171875, "global_step": 36360, "epoch": 865} {"train_loss": -5.657129287719727, "global_step": 36361, "epoch": 865} {"train_loss": -5.552229881286621, "global_step": 36362, "epoch": 865} {"train_loss": -5.627105236053467, "global_step": 36363, "epoch": 865} {"train_loss": -5.602449417114258, "global_step": 36364, "epoch": 865} {"train_loss": -5.662443161010742, "global_step": 36365, "epoch": 865} {"train_loss": -5.468923091888428, "global_step": 36366, "epoch": 865} {"train_loss": -5.5482282638549805, "global_step": 36367, "epoch": 865} {"train_loss": -5.547516822814941, "global_step": 36368, "epoch": 865} {"train_loss": -5.575146675109863, "global_step": 36369, "epoch": 865} {"train_loss": -5.386019229888916, "global_step": 36370, "epoch": 865} {"train_loss": -5.5854848225911455, "global_step": 36371, "epoch": 865, "val_loss": 74703.2734375} {"train_loss": -5.513003826141357, "global_step": 36372, "epoch": 866} {"train_loss": -5.608546257019043, "global_step": 36373, "epoch": 866} {"train_loss": -5.550990581512451, "global_step": 36374, "epoch": 866} {"train_loss": -5.519107818603516, "global_step": 36375, "epoch": 866} {"train_loss": -5.544563293457031, "global_step": 36376, "epoch": 866} {"train_loss": -5.542688369750977, "global_step": 36377, "epoch": 866} {"train_loss": -5.520807266235352, "global_step": 36378, "epoch": 866} {"train_loss": -5.6144304275512695, "global_step": 36379, "epoch": 866} {"train_loss": -5.470486640930176, "global_step": 36380, "epoch": 866} {"train_loss": -5.524396896362305, "global_step": 36381, "epoch": 866} {"train_loss": -5.607229232788086, "global_step": 36382, "epoch": 866} {"train_loss": -5.629134178161621, "global_step": 36383, "epoch": 866} {"train_loss": -5.571390151977539, "global_step": 36384, "epoch": 866} {"train_loss": -5.531006813049316, "global_step": 36385, "epoch": 866} {"train_loss": -5.720218658447266, "global_step": 36386, "epoch": 866} {"train_loss": -5.5006232261657715, "global_step": 36387, "epoch": 866} {"train_loss": -5.55900764465332, "global_step": 36388, "epoch": 866} {"train_loss": -5.630987167358398, "global_step": 36389, "epoch": 866} {"train_loss": -5.630251884460449, "global_step": 36390, "epoch": 866} {"train_loss": -5.626255989074707, "global_step": 36391, "epoch": 866} {"train_loss": -5.530927658081055, "global_step": 36392, "epoch": 866} {"train_loss": -5.685937881469727, "global_step": 36393, "epoch": 866} {"train_loss": -5.550125598907471, "global_step": 36394, "epoch": 866} {"train_loss": -5.571157455444336, "global_step": 36395, "epoch": 866} {"train_loss": -5.589831352233887, "global_step": 36396, "epoch": 866} {"train_loss": -5.5615010261535645, "global_step": 36397, "epoch": 866} {"train_loss": -5.489353179931641, "global_step": 36398, "epoch": 866} {"train_loss": -5.511519432067871, "global_step": 36399, "epoch": 866} {"train_loss": -5.63726806640625, "global_step": 36400, "epoch": 866} {"train_loss": -5.529327392578125, "global_step": 36401, "epoch": 866} {"train_loss": -5.627699851989746, "global_step": 36402, "epoch": 866} {"train_loss": -5.514376163482666, "global_step": 36403, "epoch": 866} {"train_loss": -5.500563621520996, "global_step": 36404, "epoch": 866} {"train_loss": -5.530888557434082, "global_step": 36405, "epoch": 866} {"train_loss": -5.682573318481445, "global_step": 36406, "epoch": 866} {"train_loss": -5.589860916137695, "global_step": 36407, "epoch": 866} {"train_loss": -5.45590877532959, "global_step": 36408, "epoch": 866} {"train_loss": -5.653313159942627, "global_step": 36409, "epoch": 866} {"train_loss": -5.580304145812988, "global_step": 36410, "epoch": 866} {"train_loss": -5.539488792419434, "global_step": 36411, "epoch": 866} {"train_loss": -5.455768585205078, "global_step": 36412, "epoch": 866} {"train_loss": -5.562904460089547, "global_step": 36413, "epoch": 866, "val_loss": 73927.5234375} {"train_loss": -5.5587005615234375, "global_step": 36414, "epoch": 867} {"train_loss": -5.621063232421875, "global_step": 36415, "epoch": 867} {"train_loss": -5.642632484436035, "global_step": 36416, "epoch": 867} {"train_loss": -5.558269023895264, "global_step": 36417, "epoch": 867} {"train_loss": -5.702780246734619, "global_step": 36418, "epoch": 867} {"train_loss": -5.639902114868164, "global_step": 36419, "epoch": 867} {"train_loss": -5.498917102813721, "global_step": 36420, "epoch": 867} {"train_loss": -5.613801002502441, "global_step": 36421, "epoch": 867} {"train_loss": -5.518005847930908, "global_step": 36422, "epoch": 867} {"train_loss": -5.577713489532471, "global_step": 36423, "epoch": 867} {"train_loss": -5.654966354370117, "global_step": 36424, "epoch": 867} {"train_loss": -5.557974815368652, "global_step": 36425, "epoch": 867} {"train_loss": -5.472526550292969, "global_step": 36426, "epoch": 867} {"train_loss": -5.632551193237305, "global_step": 36427, "epoch": 867} {"train_loss": -5.660658359527588, "global_step": 36428, "epoch": 867} {"train_loss": -5.564420223236084, "global_step": 36429, "epoch": 867} {"train_loss": -5.535268306732178, "global_step": 36430, "epoch": 867} {"train_loss": -5.539447784423828, "global_step": 36431, "epoch": 867} {"train_loss": -5.593831539154053, "global_step": 36432, "epoch": 867} {"train_loss": -5.575786590576172, "global_step": 36433, "epoch": 867} {"train_loss": -5.544332027435303, "global_step": 36434, "epoch": 867} {"train_loss": -5.662850379943848, "global_step": 36435, "epoch": 867} {"train_loss": -5.580289363861084, "global_step": 36436, "epoch": 867} {"train_loss": -5.44842529296875, "global_step": 36437, "epoch": 867} {"train_loss": -5.494220733642578, "global_step": 36438, "epoch": 867} {"train_loss": -5.699167728424072, "global_step": 36439, "epoch": 867} {"train_loss": -5.6067118644714355, "global_step": 36440, "epoch": 867} {"train_loss": -5.613680839538574, "global_step": 36441, "epoch": 867} {"train_loss": -5.605119705200195, "global_step": 36442, "epoch": 867} {"train_loss": -5.584176063537598, "global_step": 36443, "epoch": 867} {"train_loss": -5.598784446716309, "global_step": 36444, "epoch": 867} {"train_loss": -5.45134162902832, "global_step": 36445, "epoch": 867} {"train_loss": -5.6538567543029785, "global_step": 36446, "epoch": 867} {"train_loss": -5.653423309326172, "global_step": 36447, "epoch": 867} {"train_loss": -5.56820011138916, "global_step": 36448, "epoch": 867} {"train_loss": -5.502460479736328, "global_step": 36449, "epoch": 867} {"train_loss": -5.542832851409912, "global_step": 36450, "epoch": 867} {"train_loss": -5.623157501220703, "global_step": 36451, "epoch": 867} {"train_loss": -5.641500949859619, "global_step": 36452, "epoch": 867} {"train_loss": -5.656299114227295, "global_step": 36453, "epoch": 867} {"train_loss": -5.618415832519531, "global_step": 36454, "epoch": 867} {"train_loss": -5.588086650485084, "global_step": 36455, "epoch": 867, "val_loss": 74270.8125} {"train_loss": -5.527890205383301, "global_step": 36456, "epoch": 868} {"train_loss": -5.637515068054199, "global_step": 36457, "epoch": 868} {"train_loss": -5.570925712585449, "global_step": 36458, "epoch": 868} {"train_loss": -5.508896350860596, "global_step": 36459, "epoch": 868} {"train_loss": -5.6912431716918945, "global_step": 36460, "epoch": 868} {"train_loss": -5.532711029052734, "global_step": 36461, "epoch": 868} {"train_loss": -5.602246284484863, "global_step": 36462, "epoch": 868} {"train_loss": -5.647090435028076, "global_step": 36463, "epoch": 868} {"train_loss": -5.582006454467773, "global_step": 36464, "epoch": 868} {"train_loss": -5.636809349060059, "global_step": 36465, "epoch": 868} {"train_loss": -5.685248374938965, "global_step": 36466, "epoch": 868} {"train_loss": -5.54775857925415, "global_step": 36467, "epoch": 868} {"train_loss": -5.601688385009766, "global_step": 36468, "epoch": 868} {"train_loss": -5.617626190185547, "global_step": 36469, "epoch": 868} {"train_loss": -5.606324195861816, "global_step": 36470, "epoch": 868} {"train_loss": -5.5228729248046875, "global_step": 36471, "epoch": 868} {"train_loss": -5.633248329162598, "global_step": 36472, "epoch": 868} {"train_loss": -5.690920352935791, "global_step": 36473, "epoch": 868} {"train_loss": -5.554737567901611, "global_step": 36474, "epoch": 868} {"train_loss": -5.640375137329102, "global_step": 36475, "epoch": 868} {"train_loss": -5.61945915222168, "global_step": 36476, "epoch": 868} {"train_loss": -5.556203842163086, "global_step": 36477, "epoch": 868} {"train_loss": -5.577458381652832, "global_step": 36478, "epoch": 868} {"train_loss": -5.582517147064209, "global_step": 36479, "epoch": 868} {"train_loss": -5.435299873352051, "global_step": 36480, "epoch": 868} {"train_loss": -5.6470489501953125, "global_step": 36481, "epoch": 868} {"train_loss": -5.571714401245117, "global_step": 36482, "epoch": 868} {"train_loss": -5.576003074645996, "global_step": 36483, "epoch": 868} {"train_loss": -5.535689830780029, "global_step": 36484, "epoch": 868} {"train_loss": -5.522982597351074, "global_step": 36485, "epoch": 868} {"train_loss": -5.581550598144531, "global_step": 36486, "epoch": 868} {"train_loss": -5.672537326812744, "global_step": 36487, "epoch": 868} {"train_loss": -5.568179130554199, "global_step": 36488, "epoch": 868} {"train_loss": -5.580914497375488, "global_step": 36489, "epoch": 868} {"train_loss": -5.528016567230225, "global_step": 36490, "epoch": 868} {"train_loss": -5.476594924926758, "global_step": 36491, "epoch": 868} {"train_loss": -5.532891273498535, "global_step": 36492, "epoch": 868} {"train_loss": -5.506406307220459, "global_step": 36493, "epoch": 868} {"train_loss": -5.501140117645264, "global_step": 36494, "epoch": 868} {"train_loss": -5.621610164642334, "global_step": 36495, "epoch": 868} {"train_loss": -5.4531707763671875, "global_step": 36496, "epoch": 868} {"train_loss": -5.577364422026134, "global_step": 36497, "epoch": 868, "val_loss": 74342.921875} {"train_loss": -5.523110389709473, "global_step": 36498, "epoch": 869} {"train_loss": -5.313615798950195, "global_step": 36499, "epoch": 869} {"train_loss": -5.552074909210205, "global_step": 36500, "epoch": 869} {"train_loss": -5.420675277709961, "global_step": 36501, "epoch": 869} {"train_loss": -5.58625602722168, "global_step": 36502, "epoch": 869} {"train_loss": -5.609466075897217, "global_step": 36503, "epoch": 869} {"train_loss": -5.575247764587402, "global_step": 36504, "epoch": 869} {"train_loss": -5.484121322631836, "global_step": 36505, "epoch": 869} {"train_loss": -5.641110420227051, "global_step": 36506, "epoch": 869} {"train_loss": -5.4653520584106445, "global_step": 36507, "epoch": 869} {"train_loss": -5.599281311035156, "global_step": 36508, "epoch": 869} {"train_loss": -5.589669704437256, "global_step": 36509, "epoch": 869} {"train_loss": -5.542788505554199, "global_step": 36510, "epoch": 869} {"train_loss": -5.539470672607422, "global_step": 36511, "epoch": 869} {"train_loss": -5.628481388092041, "global_step": 36512, "epoch": 869} {"train_loss": -5.592349052429199, "global_step": 36513, "epoch": 869} {"train_loss": -5.537015914916992, "global_step": 36514, "epoch": 869} {"train_loss": -5.604702949523926, "global_step": 36515, "epoch": 869} {"train_loss": -5.627305030822754, "global_step": 36516, "epoch": 869} {"train_loss": -5.578530311584473, "global_step": 36517, "epoch": 869} {"train_loss": -5.642977714538574, "global_step": 36518, "epoch": 869} {"train_loss": -5.646042346954346, "global_step": 36519, "epoch": 869} {"train_loss": -5.601283073425293, "global_step": 36520, "epoch": 869} {"train_loss": -5.718014717102051, "global_step": 36521, "epoch": 869} {"train_loss": -5.540673732757568, "global_step": 36522, "epoch": 869} {"train_loss": -5.703826904296875, "global_step": 36523, "epoch": 869} {"train_loss": -5.422956943511963, "global_step": 36524, "epoch": 869} {"train_loss": -5.500805854797363, "global_step": 36525, "epoch": 869} {"train_loss": -5.435574531555176, "global_step": 36526, "epoch": 869} {"train_loss": -5.684615135192871, "global_step": 36527, "epoch": 869} {"train_loss": -5.5993146896362305, "global_step": 36528, "epoch": 869} {"train_loss": -5.487243175506592, "global_step": 36529, "epoch": 869} {"train_loss": -5.696569442749023, "global_step": 36530, "epoch": 869} {"train_loss": -5.669081687927246, "global_step": 36531, "epoch": 869} {"train_loss": -5.558773517608643, "global_step": 36532, "epoch": 869} {"train_loss": -5.642380237579346, "global_step": 36533, "epoch": 869} {"train_loss": -5.599156379699707, "global_step": 36534, "epoch": 869} {"train_loss": -5.632834434509277, "global_step": 36535, "epoch": 869} {"train_loss": -5.559685230255127, "global_step": 36536, "epoch": 869} {"train_loss": -5.711087226867676, "global_step": 36537, "epoch": 869} {"train_loss": -5.692785263061523, "global_step": 36538, "epoch": 869} {"train_loss": -5.576586598441715, "global_step": 36539, "epoch": 869, "val_loss": 74485.84375} {"train_loss": -5.560306549072266, "global_step": 36540, "epoch": 870} {"train_loss": -5.568169116973877, "global_step": 36541, "epoch": 870} {"train_loss": -5.517899036407471, "global_step": 36542, "epoch": 870} {"train_loss": -5.529476165771484, "global_step": 36543, "epoch": 870} {"train_loss": -5.550713539123535, "global_step": 36544, "epoch": 870} {"train_loss": -5.7025909423828125, "global_step": 36545, "epoch": 870} {"train_loss": -5.574494361877441, "global_step": 36546, "epoch": 870} {"train_loss": -5.607434272766113, "global_step": 36547, "epoch": 870} {"train_loss": -5.630229949951172, "global_step": 36548, "epoch": 870} {"train_loss": -5.536550521850586, "global_step": 36549, "epoch": 870} {"train_loss": -5.52461576461792, "global_step": 36550, "epoch": 870} {"train_loss": -5.647220611572266, "global_step": 36551, "epoch": 870} {"train_loss": -5.542346000671387, "global_step": 36552, "epoch": 870} {"train_loss": -5.608857154846191, "global_step": 36553, "epoch": 870} {"train_loss": -5.5988898277282715, "global_step": 36554, "epoch": 870} {"train_loss": -5.6242523193359375, "global_step": 36555, "epoch": 870} {"train_loss": -5.742519378662109, "global_step": 36556, "epoch": 870} {"train_loss": -5.536977767944336, "global_step": 36557, "epoch": 870} {"train_loss": -5.529603004455566, "global_step": 36558, "epoch": 870} {"train_loss": -5.484437942504883, "global_step": 36559, "epoch": 870} {"train_loss": -5.63759708404541, "global_step": 36560, "epoch": 870} {"train_loss": -5.519920349121094, "global_step": 36561, "epoch": 870} {"train_loss": -5.550245761871338, "global_step": 36562, "epoch": 870} {"train_loss": -5.649876594543457, "global_step": 36563, "epoch": 870} {"train_loss": -5.603553771972656, "global_step": 36564, "epoch": 870} {"train_loss": -5.537167072296143, "global_step": 36565, "epoch": 870} {"train_loss": -5.541796684265137, "global_step": 36566, "epoch": 870} {"train_loss": -5.590734481811523, "global_step": 36567, "epoch": 870} {"train_loss": -5.466102123260498, "global_step": 36568, "epoch": 870} {"train_loss": -5.642650127410889, "global_step": 36569, "epoch": 870} {"train_loss": -5.550394058227539, "global_step": 36570, "epoch": 870} {"train_loss": -5.6344733238220215, "global_step": 36571, "epoch": 870} {"train_loss": -5.55947208404541, "global_step": 36572, "epoch": 870} {"train_loss": -5.627350807189941, "global_step": 36573, "epoch": 870} {"train_loss": -5.5526604652404785, "global_step": 36574, "epoch": 870} {"train_loss": -5.575591087341309, "global_step": 36575, "epoch": 870} {"train_loss": -5.634220600128174, "global_step": 36576, "epoch": 870} {"train_loss": -5.565615177154541, "global_step": 36577, "epoch": 870} {"train_loss": -5.430948734283447, "global_step": 36578, "epoch": 870} {"train_loss": -5.4677228927612305, "global_step": 36579, "epoch": 870} {"train_loss": -5.71487283706665, "global_step": 36580, "epoch": 870} {"train_loss": -5.579490593501499, "global_step": 36581, "epoch": 870, "val_loss": 73948.8984375} {"train_loss": -5.605371475219727, "global_step": 36582, "epoch": 871} {"train_loss": -5.492626190185547, "global_step": 36583, "epoch": 871} {"train_loss": -5.549054145812988, "global_step": 36584, "epoch": 871} {"train_loss": -5.590435028076172, "global_step": 36585, "epoch": 871} {"train_loss": -5.473773956298828, "global_step": 36586, "epoch": 871} {"train_loss": -5.559221267700195, "global_step": 36587, "epoch": 871} {"train_loss": -5.427257061004639, "global_step": 36588, "epoch": 871} {"train_loss": -5.56805419921875, "global_step": 36589, "epoch": 871} {"train_loss": -5.48667049407959, "global_step": 36590, "epoch": 871} {"train_loss": -5.4643425941467285, "global_step": 36591, "epoch": 871} {"train_loss": -5.571229934692383, "global_step": 36592, "epoch": 871} {"train_loss": -5.5247931480407715, "global_step": 36593, "epoch": 871} {"train_loss": -5.533560752868652, "global_step": 36594, "epoch": 871} {"train_loss": -5.4780097007751465, "global_step": 36595, "epoch": 871} {"train_loss": -5.4859466552734375, "global_step": 36596, "epoch": 871} {"train_loss": -5.565913200378418, "global_step": 36597, "epoch": 871} {"train_loss": -5.572934627532959, "global_step": 36598, "epoch": 871} {"train_loss": -5.454294204711914, "global_step": 36599, "epoch": 871} {"train_loss": -5.536625385284424, "global_step": 36600, "epoch": 871} {"train_loss": -5.691099166870117, "global_step": 36601, "epoch": 871} {"train_loss": -5.555075645446777, "global_step": 36602, "epoch": 871} {"train_loss": -5.57921028137207, "global_step": 36603, "epoch": 871} {"train_loss": -5.581743240356445, "global_step": 36604, "epoch": 871} {"train_loss": -5.646048545837402, "global_step": 36605, "epoch": 871} {"train_loss": -5.562880992889404, "global_step": 36606, "epoch": 871} {"train_loss": -5.548942565917969, "global_step": 36607, "epoch": 871} {"train_loss": -5.689006805419922, "global_step": 36608, "epoch": 871} {"train_loss": -5.617938041687012, "global_step": 36609, "epoch": 871} {"train_loss": -5.662765026092529, "global_step": 36610, "epoch": 871} {"train_loss": -5.700865745544434, "global_step": 36611, "epoch": 871} {"train_loss": -5.713018417358398, "global_step": 36612, "epoch": 871} {"train_loss": -5.499700546264648, "global_step": 36613, "epoch": 871} {"train_loss": -5.655544281005859, "global_step": 36614, "epoch": 871} {"train_loss": -5.560982704162598, "global_step": 36615, "epoch": 871} {"train_loss": -5.519477844238281, "global_step": 36616, "epoch": 871} {"train_loss": -5.526973247528076, "global_step": 36617, "epoch": 871} {"train_loss": -5.487722873687744, "global_step": 36618, "epoch": 871} {"train_loss": -5.411571502685547, "global_step": 36619, "epoch": 871} {"train_loss": -5.524009704589844, "global_step": 36620, "epoch": 871} {"train_loss": -5.636053562164307, "global_step": 36621, "epoch": 871} {"train_loss": -5.592720985412598, "global_step": 36622, "epoch": 871} {"train_loss": -5.560983419418335, "global_step": 36623, "epoch": 871, "val_loss": 74767.5} {"train_loss": -5.563352584838867, "global_step": 36624, "epoch": 872} {"train_loss": -5.510631561279297, "global_step": 36625, "epoch": 872} {"train_loss": -5.570484161376953, "global_step": 36626, "epoch": 872} {"train_loss": -5.443222999572754, "global_step": 36627, "epoch": 872} {"train_loss": -5.557471752166748, "global_step": 36628, "epoch": 872} {"train_loss": -5.5804924964904785, "global_step": 36629, "epoch": 872} {"train_loss": -5.596474647521973, "global_step": 36630, "epoch": 872} {"train_loss": -5.596301555633545, "global_step": 36631, "epoch": 872} {"train_loss": -5.664391040802002, "global_step": 36632, "epoch": 872} {"train_loss": -5.674054145812988, "global_step": 36633, "epoch": 872} {"train_loss": -5.543529033660889, "global_step": 36634, "epoch": 872} {"train_loss": -5.522029399871826, "global_step": 36635, "epoch": 872} {"train_loss": -5.463287353515625, "global_step": 36636, "epoch": 872} {"train_loss": -5.566924095153809, "global_step": 36637, "epoch": 872} {"train_loss": -5.527952671051025, "global_step": 36638, "epoch": 872} {"train_loss": -5.570529937744141, "global_step": 36639, "epoch": 872} {"train_loss": -5.48620080947876, "global_step": 36640, "epoch": 872} {"train_loss": -5.666934967041016, "global_step": 36641, "epoch": 872} {"train_loss": -5.5141096115112305, "global_step": 36642, "epoch": 872} {"train_loss": -5.557121276855469, "global_step": 36643, "epoch": 872} {"train_loss": -5.5638885498046875, "global_step": 36644, "epoch": 872} {"train_loss": -5.5601301193237305, "global_step": 36645, "epoch": 872} {"train_loss": -5.674471855163574, "global_step": 36646, "epoch": 872} {"train_loss": -5.484973430633545, "global_step": 36647, "epoch": 872} {"train_loss": -5.387279987335205, "global_step": 36648, "epoch": 872} {"train_loss": -5.628237247467041, "global_step": 36649, "epoch": 872} {"train_loss": -5.604877948760986, "global_step": 36650, "epoch": 872} {"train_loss": -5.613075256347656, "global_step": 36651, "epoch": 872} {"train_loss": -5.509642124176025, "global_step": 36652, "epoch": 872} {"train_loss": -5.610877990722656, "global_step": 36653, "epoch": 872} {"train_loss": -5.597229480743408, "global_step": 36654, "epoch": 872} {"train_loss": -5.485624313354492, "global_step": 36655, "epoch": 872} {"train_loss": -5.622305870056152, "global_step": 36656, "epoch": 872} {"train_loss": -5.684858322143555, "global_step": 36657, "epoch": 872} {"train_loss": -5.485805511474609, "global_step": 36658, "epoch": 872} {"train_loss": -5.677595138549805, "global_step": 36659, "epoch": 872} {"train_loss": -5.621185302734375, "global_step": 36660, "epoch": 872} {"train_loss": -5.67058801651001, "global_step": 36661, "epoch": 872} {"train_loss": -5.539413928985596, "global_step": 36662, "epoch": 872} {"train_loss": -5.451760292053223, "global_step": 36663, "epoch": 872} {"train_loss": -5.4479475021362305, "global_step": 36664, "epoch": 872} {"train_loss": -5.564059677578154, "global_step": 36665, "epoch": 872, "val_loss": 74213.3515625} {"train_loss": -5.690304756164551, "global_step": 36666, "epoch": 873} {"train_loss": -5.428553104400635, "global_step": 36667, "epoch": 873} {"train_loss": -5.531441688537598, "global_step": 36668, "epoch": 873} {"train_loss": -5.657901763916016, "global_step": 36669, "epoch": 873} {"train_loss": -5.593120574951172, "global_step": 36670, "epoch": 873} {"train_loss": -5.559259414672852, "global_step": 36671, "epoch": 873} {"train_loss": -5.546648025512695, "global_step": 36672, "epoch": 873} {"train_loss": -5.6494903564453125, "global_step": 36673, "epoch": 873} {"train_loss": -5.672574043273926, "global_step": 36674, "epoch": 873} {"train_loss": -5.6406660079956055, "global_step": 36675, "epoch": 873} {"train_loss": -5.720603942871094, "global_step": 36676, "epoch": 873} {"train_loss": -5.5408430099487305, "global_step": 36677, "epoch": 873} {"train_loss": -5.5340375900268555, "global_step": 36678, "epoch": 873} {"train_loss": -5.713210105895996, "global_step": 36679, "epoch": 873} {"train_loss": -5.626351356506348, "global_step": 36680, "epoch": 873} {"train_loss": -5.623235702514648, "global_step": 36681, "epoch": 873} {"train_loss": -5.6651763916015625, "global_step": 36682, "epoch": 873} {"train_loss": -5.543060302734375, "global_step": 36683, "epoch": 873} {"train_loss": -5.659351348876953, "global_step": 36684, "epoch": 873} {"train_loss": -5.4872846603393555, "global_step": 36685, "epoch": 873} {"train_loss": -5.449170112609863, "global_step": 36686, "epoch": 873} {"train_loss": -5.486641883850098, "global_step": 36687, "epoch": 873} {"train_loss": -5.526331901550293, "global_step": 36688, "epoch": 873} {"train_loss": -5.376605987548828, "global_step": 36689, "epoch": 873} {"train_loss": -5.595869541168213, "global_step": 36690, "epoch": 873} {"train_loss": -5.573912143707275, "global_step": 36691, "epoch": 873} {"train_loss": -5.605499267578125, "global_step": 36692, "epoch": 873} {"train_loss": -5.583756446838379, "global_step": 36693, "epoch": 873} {"train_loss": -5.610320091247559, "global_step": 36694, "epoch": 873} {"train_loss": -5.625597953796387, "global_step": 36695, "epoch": 873} {"train_loss": -5.754369735717773, "global_step": 36696, "epoch": 873} {"train_loss": -5.652400970458984, "global_step": 36697, "epoch": 873} {"train_loss": -5.670401573181152, "global_step": 36698, "epoch": 873} {"train_loss": -5.563942909240723, "global_step": 36699, "epoch": 873} {"train_loss": -5.636783599853516, "global_step": 36700, "epoch": 873} {"train_loss": -5.5133490562438965, "global_step": 36701, "epoch": 873} {"train_loss": -5.629803657531738, "global_step": 36702, "epoch": 873} {"train_loss": -5.654696464538574, "global_step": 36703, "epoch": 873} {"train_loss": -5.511088848114014, "global_step": 36704, "epoch": 873} {"train_loss": -5.562682151794434, "global_step": 36705, "epoch": 873} {"train_loss": -5.414290428161621, "global_step": 36706, "epoch": 873} {"train_loss": -5.587352457500639, "global_step": 36707, "epoch": 873, "val_loss": 74649.1953125} {"train_loss": -5.6553053855896, "global_step": 36708, "epoch": 874} {"train_loss": -5.496913909912109, "global_step": 36709, "epoch": 874} {"train_loss": -5.650269508361816, "global_step": 36710, "epoch": 874} {"train_loss": -5.556179046630859, "global_step": 36711, "epoch": 874} {"train_loss": -5.55055046081543, "global_step": 36712, "epoch": 874} {"train_loss": -5.598119735717773, "global_step": 36713, "epoch": 874} {"train_loss": -5.692819118499756, "global_step": 36714, "epoch": 874} {"train_loss": -5.572484016418457, "global_step": 36715, "epoch": 874} {"train_loss": -5.623276710510254, "global_step": 36716, "epoch": 874} {"train_loss": -5.653160095214844, "global_step": 36717, "epoch": 874} {"train_loss": -5.489589691162109, "global_step": 36718, "epoch": 874} {"train_loss": -5.6056928634643555, "global_step": 36719, "epoch": 874} {"train_loss": -5.599634170532227, "global_step": 36720, "epoch": 874} {"train_loss": -5.614666938781738, "global_step": 36721, "epoch": 874} {"train_loss": -5.544703960418701, "global_step": 36722, "epoch": 874} {"train_loss": -5.75086784362793, "global_step": 36723, "epoch": 874} {"train_loss": -5.615585803985596, "global_step": 36724, "epoch": 874} {"train_loss": -5.527810573577881, "global_step": 36725, "epoch": 874} {"train_loss": -5.557064056396484, "global_step": 36726, "epoch": 874} {"train_loss": -5.597213268280029, "global_step": 36727, "epoch": 874} {"train_loss": -5.580198287963867, "global_step": 36728, "epoch": 874} {"train_loss": -5.547999382019043, "global_step": 36729, "epoch": 874} {"train_loss": -5.656692981719971, "global_step": 36730, "epoch": 874} {"train_loss": -5.558252334594727, "global_step": 36731, "epoch": 874} {"train_loss": -5.602245330810547, "global_step": 36732, "epoch": 874} {"train_loss": -5.612171173095703, "global_step": 36733, "epoch": 874} {"train_loss": -5.524160861968994, "global_step": 36734, "epoch": 874} {"train_loss": -5.573086738586426, "global_step": 36735, "epoch": 874} {"train_loss": -5.491689682006836, "global_step": 36736, "epoch": 874} {"train_loss": -5.5384016036987305, "global_step": 36737, "epoch": 874} {"train_loss": -5.518458366394043, "global_step": 36738, "epoch": 874} {"train_loss": -5.631418228149414, "global_step": 36739, "epoch": 874} {"train_loss": -5.456757068634033, "global_step": 36740, "epoch": 874} {"train_loss": -5.5901947021484375, "global_step": 36741, "epoch": 874} {"train_loss": -5.511472702026367, "global_step": 36742, "epoch": 874} {"train_loss": -5.6139726638793945, "global_step": 36743, "epoch": 874} {"train_loss": -5.674983978271484, "global_step": 36744, "epoch": 874} {"train_loss": -5.4510273933410645, "global_step": 36745, "epoch": 874} {"train_loss": -5.394216537475586, "global_step": 36746, "epoch": 874} {"train_loss": -5.657419681549072, "global_step": 36747, "epoch": 874} {"train_loss": -5.720494270324707, "global_step": 36748, "epoch": 874} {"train_loss": -5.581236827941168, "global_step": 36749, "epoch": 874, "val_loss": 74472.8984375} {"train_loss": -5.481015205383301, "global_step": 36750, "epoch": 875} {"train_loss": -5.640751838684082, "global_step": 36751, "epoch": 875} {"train_loss": -5.460874557495117, "global_step": 36752, "epoch": 875} {"train_loss": -5.654572486877441, "global_step": 36753, "epoch": 875} {"train_loss": -5.658312797546387, "global_step": 36754, "epoch": 875} {"train_loss": -5.556133270263672, "global_step": 36755, "epoch": 875} {"train_loss": -5.5226240158081055, "global_step": 36756, "epoch": 875} {"train_loss": -5.527776718139648, "global_step": 36757, "epoch": 875} {"train_loss": -5.452166557312012, "global_step": 36758, "epoch": 875} {"train_loss": -5.509161949157715, "global_step": 36759, "epoch": 875} {"train_loss": -5.562691688537598, "global_step": 36760, "epoch": 875} {"train_loss": -5.581655502319336, "global_step": 36761, "epoch": 875} {"train_loss": -5.444586753845215, "global_step": 36762, "epoch": 875} {"train_loss": -5.581164836883545, "global_step": 36763, "epoch": 875} {"train_loss": -5.472505569458008, "global_step": 36764, "epoch": 875} {"train_loss": -5.4788007736206055, "global_step": 36765, "epoch": 875} {"train_loss": -5.52455472946167, "global_step": 36766, "epoch": 875} {"train_loss": -5.625336170196533, "global_step": 36767, "epoch": 875} {"train_loss": -5.508529186248779, "global_step": 36768, "epoch": 875} {"train_loss": -5.604109287261963, "global_step": 36769, "epoch": 875} {"train_loss": -5.477930068969727, "global_step": 36770, "epoch": 875} {"train_loss": -5.550396919250488, "global_step": 36771, "epoch": 875} {"train_loss": -5.479937553405762, "global_step": 36772, "epoch": 875} {"train_loss": -5.468097686767578, "global_step": 36773, "epoch": 875} {"train_loss": -5.498325347900391, "global_step": 36774, "epoch": 875} {"train_loss": -5.431297779083252, "global_step": 36775, "epoch": 875} {"train_loss": -5.645689487457275, "global_step": 36776, "epoch": 875} {"train_loss": -5.543841361999512, "global_step": 36777, "epoch": 875} {"train_loss": -5.509561538696289, "global_step": 36778, "epoch": 875} {"train_loss": -5.654201507568359, "global_step": 36779, "epoch": 875} {"train_loss": -5.641127109527588, "global_step": 36780, "epoch": 875} {"train_loss": -5.545252323150635, "global_step": 36781, "epoch": 875} {"train_loss": -5.501428604125977, "global_step": 36782, "epoch": 875} {"train_loss": -5.732606887817383, "global_step": 36783, "epoch": 875} {"train_loss": -5.624185562133789, "global_step": 36784, "epoch": 875} {"train_loss": -5.671381950378418, "global_step": 36785, "epoch": 875} {"train_loss": -5.514169216156006, "global_step": 36786, "epoch": 875} {"train_loss": -5.443477630615234, "global_step": 36787, "epoch": 875} {"train_loss": -5.622262001037598, "global_step": 36788, "epoch": 875} {"train_loss": -5.495997905731201, "global_step": 36789, "epoch": 875} {"train_loss": -5.751613616943359, "global_step": 36790, "epoch": 875} {"train_loss": -5.556030897867112, "global_step": 36791, "epoch": 875, "val_loss": 73757.578125} {"train_loss": -5.493988037109375, "global_step": 36792, "epoch": 876} {"train_loss": -5.536327838897705, "global_step": 36793, "epoch": 876} {"train_loss": -5.523275852203369, "global_step": 36794, "epoch": 876} {"train_loss": -5.5229597091674805, "global_step": 36795, "epoch": 876} {"train_loss": -5.485301971435547, "global_step": 36796, "epoch": 876} {"train_loss": -5.526828765869141, "global_step": 36797, "epoch": 876} {"train_loss": -5.5072760581970215, "global_step": 36798, "epoch": 876} {"train_loss": -5.616944789886475, "global_step": 36799, "epoch": 876} {"train_loss": -5.548182010650635, "global_step": 36800, "epoch": 876} {"train_loss": -5.498294830322266, "global_step": 36801, "epoch": 876} {"train_loss": -5.543262004852295, "global_step": 36802, "epoch": 876} {"train_loss": -5.59255313873291, "global_step": 36803, "epoch": 876} {"train_loss": -5.510862350463867, "global_step": 36804, "epoch": 876} {"train_loss": -5.6183271408081055, "global_step": 36805, "epoch": 876} {"train_loss": -5.498388767242432, "global_step": 36806, "epoch": 876} {"train_loss": -5.60321044921875, "global_step": 36807, "epoch": 876} {"train_loss": -5.577824592590332, "global_step": 36808, "epoch": 876} {"train_loss": -5.657129287719727, "global_step": 36809, "epoch": 876} {"train_loss": -5.452573299407959, "global_step": 36810, "epoch": 876} {"train_loss": -5.685198783874512, "global_step": 36811, "epoch": 876} {"train_loss": -5.535104751586914, "global_step": 36812, "epoch": 876} {"train_loss": -5.638007164001465, "global_step": 36813, "epoch": 876} {"train_loss": -5.564227104187012, "global_step": 36814, "epoch": 876} {"train_loss": -5.6511430740356445, "global_step": 36815, "epoch": 876} {"train_loss": -5.504190921783447, "global_step": 36816, "epoch": 876} {"train_loss": -5.538630962371826, "global_step": 36817, "epoch": 876} {"train_loss": -5.717560768127441, "global_step": 36818, "epoch": 876} {"train_loss": -5.615074157714844, "global_step": 36819, "epoch": 876} {"train_loss": -5.563234806060791, "global_step": 36820, "epoch": 876} {"train_loss": -5.480841159820557, "global_step": 36821, "epoch": 876} {"train_loss": -5.640115261077881, "global_step": 36822, "epoch": 876} {"train_loss": -5.561681747436523, "global_step": 36823, "epoch": 876} {"train_loss": -5.57502555847168, "global_step": 36824, "epoch": 876} {"train_loss": -5.511465549468994, "global_step": 36825, "epoch": 876} {"train_loss": -5.636410236358643, "global_step": 36826, "epoch": 876} {"train_loss": -5.737649917602539, "global_step": 36827, "epoch": 876} {"train_loss": -5.470927715301514, "global_step": 36828, "epoch": 876} {"train_loss": -5.649206161499023, "global_step": 36829, "epoch": 876} {"train_loss": -5.5445709228515625, "global_step": 36830, "epoch": 876} {"train_loss": -5.6152238845825195, "global_step": 36831, "epoch": 876} {"train_loss": -5.6217875480651855, "global_step": 36832, "epoch": 876} {"train_loss": -5.569120100566319, "global_step": 36833, "epoch": 876, "val_loss": 74834.3671875} {"train_loss": -5.6911773681640625, "global_step": 36834, "epoch": 877} {"train_loss": -5.559591770172119, "global_step": 36835, "epoch": 877} {"train_loss": -5.471949577331543, "global_step": 36836, "epoch": 877} {"train_loss": -5.663498878479004, "global_step": 36837, "epoch": 877} {"train_loss": -5.468916893005371, "global_step": 36838, "epoch": 877} {"train_loss": -5.5452680587768555, "global_step": 36839, "epoch": 877} {"train_loss": -5.618103981018066, "global_step": 36840, "epoch": 877} {"train_loss": -5.486238479614258, "global_step": 36841, "epoch": 877} {"train_loss": -5.559620380401611, "global_step": 36842, "epoch": 877} {"train_loss": -5.6398396492004395, "global_step": 36843, "epoch": 877} {"train_loss": -5.513751983642578, "global_step": 36844, "epoch": 877} {"train_loss": -5.373266696929932, "global_step": 36845, "epoch": 877} {"train_loss": -5.637106895446777, "global_step": 36846, "epoch": 877} {"train_loss": -5.673000812530518, "global_step": 36847, "epoch": 877} {"train_loss": -5.448133945465088, "global_step": 36848, "epoch": 877} {"train_loss": -5.724699020385742, "global_step": 36849, "epoch": 877} {"train_loss": -5.598982334136963, "global_step": 36850, "epoch": 877} {"train_loss": -5.521225452423096, "global_step": 36851, "epoch": 877} {"train_loss": -5.592662811279297, "global_step": 36852, "epoch": 877} {"train_loss": -5.627684116363525, "global_step": 36853, "epoch": 877} {"train_loss": -5.574090003967285, "global_step": 36854, "epoch": 877} {"train_loss": -5.594090461730957, "global_step": 36855, "epoch": 877} {"train_loss": -5.559621810913086, "global_step": 36856, "epoch": 877} {"train_loss": -5.460467338562012, "global_step": 36857, "epoch": 877} {"train_loss": -5.660179615020752, "global_step": 36858, "epoch": 877} {"train_loss": -5.651566028594971, "global_step": 36859, "epoch": 877} {"train_loss": -5.571559906005859, "global_step": 36860, "epoch": 877} {"train_loss": -5.484203338623047, "global_step": 36861, "epoch": 877} {"train_loss": -5.551790237426758, "global_step": 36862, "epoch": 877} {"train_loss": -5.643904685974121, "global_step": 36863, "epoch": 877} {"train_loss": -5.610091209411621, "global_step": 36864, "epoch": 877} {"train_loss": -5.578825950622559, "global_step": 36865, "epoch": 877} {"train_loss": -5.599717617034912, "global_step": 36866, "epoch": 877} {"train_loss": -5.513016700744629, "global_step": 36867, "epoch": 877} {"train_loss": -5.59838342666626, "global_step": 36868, "epoch": 877} {"train_loss": -5.578380584716797, "global_step": 36869, "epoch": 877} {"train_loss": -5.410608291625977, "global_step": 36870, "epoch": 877} {"train_loss": -5.493022918701172, "global_step": 36871, "epoch": 877} {"train_loss": -5.545971393585205, "global_step": 36872, "epoch": 877} {"train_loss": -5.503190040588379, "global_step": 36873, "epoch": 877} {"train_loss": -5.575211048126221, "global_step": 36874, "epoch": 877} {"train_loss": -5.563452470870245, "global_step": 36875, "epoch": 877, "val_loss": 74804.75} {"train_loss": -5.459085464477539, "global_step": 36876, "epoch": 878} {"train_loss": -5.572380065917969, "global_step": 36877, "epoch": 878} {"train_loss": -5.49928092956543, "global_step": 36878, "epoch": 878} {"train_loss": -5.522645473480225, "global_step": 36879, "epoch": 878} {"train_loss": -5.720930576324463, "global_step": 36880, "epoch": 878} {"train_loss": -5.552109718322754, "global_step": 36881, "epoch": 878} {"train_loss": -5.70125675201416, "global_step": 36882, "epoch": 878} {"train_loss": -5.503979682922363, "global_step": 36883, "epoch": 878} {"train_loss": -5.536205291748047, "global_step": 36884, "epoch": 878} {"train_loss": -5.545042037963867, "global_step": 36885, "epoch": 878} {"train_loss": -5.582528114318848, "global_step": 36886, "epoch": 878} {"train_loss": -5.581240177154541, "global_step": 36887, "epoch": 878} {"train_loss": -5.604586124420166, "global_step": 36888, "epoch": 878} {"train_loss": -5.555100917816162, "global_step": 36889, "epoch": 878} {"train_loss": -5.40756368637085, "global_step": 36890, "epoch": 878} {"train_loss": -5.639660358428955, "global_step": 36891, "epoch": 878} {"train_loss": -5.690340042114258, "global_step": 36892, "epoch": 878} {"train_loss": -5.745927810668945, "global_step": 36893, "epoch": 878} {"train_loss": -5.575099945068359, "global_step": 36894, "epoch": 878} {"train_loss": -5.610848426818848, "global_step": 36895, "epoch": 878} {"train_loss": -5.468855381011963, "global_step": 36896, "epoch": 878} {"train_loss": -5.585376262664795, "global_step": 36897, "epoch": 878} {"train_loss": -5.530426025390625, "global_step": 36898, "epoch": 878} {"train_loss": -5.472689151763916, "global_step": 36899, "epoch": 878} {"train_loss": -5.563440322875977, "global_step": 36900, "epoch": 878} {"train_loss": -5.447041034698486, "global_step": 36901, "epoch": 878} {"train_loss": -5.406708717346191, "global_step": 36902, "epoch": 878} {"train_loss": -5.524999618530273, "global_step": 36903, "epoch": 878} {"train_loss": -5.365603923797607, "global_step": 36904, "epoch": 878} {"train_loss": -5.554218292236328, "global_step": 36905, "epoch": 878} {"train_loss": -5.396213531494141, "global_step": 36906, "epoch": 878} {"train_loss": -5.56935453414917, "global_step": 36907, "epoch": 878} {"train_loss": -5.5585856437683105, "global_step": 36908, "epoch": 878} {"train_loss": -5.4214701652526855, "global_step": 36909, "epoch": 878} {"train_loss": -5.489164352416992, "global_step": 36910, "epoch": 878} {"train_loss": -5.400559902191162, "global_step": 36911, "epoch": 878} {"train_loss": -5.5752716064453125, "global_step": 36912, "epoch": 878} {"train_loss": -5.508808135986328, "global_step": 36913, "epoch": 878} {"train_loss": -5.69647216796875, "global_step": 36914, "epoch": 878} {"train_loss": -5.508674621582031, "global_step": 36915, "epoch": 878} {"train_loss": -5.571110248565674, "global_step": 36916, "epoch": 878} {"train_loss": -5.546621992474511, "global_step": 36917, "epoch": 878, "val_loss": 74087.234375} {"train_loss": -5.542022705078125, "global_step": 36918, "epoch": 879} {"train_loss": -5.64208459854126, "global_step": 36919, "epoch": 879} {"train_loss": -5.656101226806641, "global_step": 36920, "epoch": 879} {"train_loss": -5.515102386474609, "global_step": 36921, "epoch": 879} {"train_loss": -5.5739922523498535, "global_step": 36922, "epoch": 879} {"train_loss": -5.630497932434082, "global_step": 36923, "epoch": 879} {"train_loss": -5.575181007385254, "global_step": 36924, "epoch": 879} {"train_loss": -5.580567359924316, "global_step": 36925, "epoch": 879} {"train_loss": -5.810153961181641, "global_step": 36926, "epoch": 879} {"train_loss": -5.672528266906738, "global_step": 36927, "epoch": 879} {"train_loss": -5.639339447021484, "global_step": 36928, "epoch": 879} {"train_loss": -5.5401716232299805, "global_step": 36929, "epoch": 879} {"train_loss": -5.547497272491455, "global_step": 36930, "epoch": 879} {"train_loss": -5.668849945068359, "global_step": 36931, "epoch": 879} {"train_loss": -5.575475692749023, "global_step": 36932, "epoch": 879} {"train_loss": -5.532060623168945, "global_step": 36933, "epoch": 879} {"train_loss": -5.5818562507629395, "global_step": 36934, "epoch": 879} {"train_loss": -5.592270374298096, "global_step": 36935, "epoch": 879} {"train_loss": -5.616347789764404, "global_step": 36936, "epoch": 879} {"train_loss": -5.579013824462891, "global_step": 36937, "epoch": 879} {"train_loss": -5.620926856994629, "global_step": 36938, "epoch": 879} {"train_loss": -5.707027435302734, "global_step": 36939, "epoch": 879} {"train_loss": -5.664226531982422, "global_step": 36940, "epoch": 879} {"train_loss": -5.675110816955566, "global_step": 36941, "epoch": 879} {"train_loss": -5.5812249183654785, "global_step": 36942, "epoch": 879} {"train_loss": -5.524720191955566, "global_step": 36943, "epoch": 879} {"train_loss": -5.543773651123047, "global_step": 36944, "epoch": 879} {"train_loss": -5.656821250915527, "global_step": 36945, "epoch": 879} {"train_loss": -5.652730464935303, "global_step": 36946, "epoch": 879} {"train_loss": -5.546368598937988, "global_step": 36947, "epoch": 879} {"train_loss": -5.51125431060791, "global_step": 36948, "epoch": 879} {"train_loss": -5.582110404968262, "global_step": 36949, "epoch": 879} {"train_loss": -5.6486005783081055, "global_step": 36950, "epoch": 879} {"train_loss": -5.559063911437988, "global_step": 36951, "epoch": 879} {"train_loss": -5.678140163421631, "global_step": 36952, "epoch": 879} {"train_loss": -5.567138671875, "global_step": 36953, "epoch": 879} {"train_loss": -5.653650283813477, "global_step": 36954, "epoch": 879} {"train_loss": -5.593753814697266, "global_step": 36955, "epoch": 879} {"train_loss": -5.542662620544434, "global_step": 36956, "epoch": 879} {"train_loss": -5.535335540771484, "global_step": 36957, "epoch": 879} {"train_loss": -5.470320701599121, "global_step": 36958, "epoch": 879} {"train_loss": -5.596301453454154, "global_step": 36959, "epoch": 879, "val_loss": 73897.71875} {"train_loss": -5.671865463256836, "global_step": 36960, "epoch": 880} {"train_loss": -5.650814533233643, "global_step": 36961, "epoch": 880} {"train_loss": -5.554939270019531, "global_step": 36962, "epoch": 880} {"train_loss": -5.681514739990234, "global_step": 36963, "epoch": 880} {"train_loss": -5.510220527648926, "global_step": 36964, "epoch": 880} {"train_loss": -5.71402645111084, "global_step": 36965, "epoch": 880} {"train_loss": -5.698483467102051, "global_step": 36966, "epoch": 880} {"train_loss": -5.575051307678223, "global_step": 36967, "epoch": 880} {"train_loss": -5.627931594848633, "global_step": 36968, "epoch": 880} {"train_loss": -5.577714920043945, "global_step": 36969, "epoch": 880} {"train_loss": -5.66507625579834, "global_step": 36970, "epoch": 880} {"train_loss": -5.579246520996094, "global_step": 36971, "epoch": 880} {"train_loss": -5.570618629455566, "global_step": 36972, "epoch": 880} {"train_loss": -5.550283908843994, "global_step": 36973, "epoch": 880} {"train_loss": -5.480642318725586, "global_step": 36974, "epoch": 880} {"train_loss": -5.621760368347168, "global_step": 36975, "epoch": 880} {"train_loss": -5.5069379806518555, "global_step": 36976, "epoch": 880} {"train_loss": -5.4677910804748535, "global_step": 36977, "epoch": 880} {"train_loss": -5.575355529785156, "global_step": 36978, "epoch": 880} {"train_loss": -5.608029842376709, "global_step": 36979, "epoch": 880} {"train_loss": -5.587391376495361, "global_step": 36980, "epoch": 880} {"train_loss": -5.611523628234863, "global_step": 36981, "epoch": 880} {"train_loss": -5.484384536743164, "global_step": 36982, "epoch": 880} {"train_loss": -5.618871688842773, "global_step": 36983, "epoch": 880} {"train_loss": -5.479514122009277, "global_step": 36984, "epoch": 880} {"train_loss": -5.746331214904785, "global_step": 36985, "epoch": 880} {"train_loss": -5.60636043548584, "global_step": 36986, "epoch": 880} {"train_loss": -5.483715534210205, "global_step": 36987, "epoch": 880} {"train_loss": -5.651895999908447, "global_step": 36988, "epoch": 880} {"train_loss": -5.567147254943848, "global_step": 36989, "epoch": 880} {"train_loss": -5.557429313659668, "global_step": 36990, "epoch": 880} {"train_loss": -5.507180213928223, "global_step": 36991, "epoch": 880} {"train_loss": -5.478377342224121, "global_step": 36992, "epoch": 880} {"train_loss": -5.538146018981934, "global_step": 36993, "epoch": 880} {"train_loss": -5.5504302978515625, "global_step": 36994, "epoch": 880} {"train_loss": -5.5919928550720215, "global_step": 36995, "epoch": 880} {"train_loss": -5.598963737487793, "global_step": 36996, "epoch": 880} {"train_loss": -5.618100166320801, "global_step": 36997, "epoch": 880} {"train_loss": -5.5476579666137695, "global_step": 36998, "epoch": 880} {"train_loss": -5.520211219787598, "global_step": 36999, "epoch": 880} {"train_loss": -5.574983596801758, "global_step": 37000, "epoch": 880} {"train_loss": -5.577014230546498, "global_step": 37001, "epoch": 880, "val_loss": 74097.4921875} {"train_loss": -5.621901512145996, "global_step": 37002, "epoch": 881} {"train_loss": -5.603977680206299, "global_step": 37003, "epoch": 881} {"train_loss": -5.474374294281006, "global_step": 37004, "epoch": 881} {"train_loss": -5.694768905639648, "global_step": 37005, "epoch": 881} {"train_loss": -5.609502792358398, "global_step": 37006, "epoch": 881} {"train_loss": -5.540712356567383, "global_step": 37007, "epoch": 881} {"train_loss": -5.386198997497559, "global_step": 37008, "epoch": 881} {"train_loss": -5.604434967041016, "global_step": 37009, "epoch": 881} {"train_loss": -5.51518440246582, "global_step": 37010, "epoch": 881} {"train_loss": -5.59156608581543, "global_step": 37011, "epoch": 881} {"train_loss": -5.495381832122803, "global_step": 37012, "epoch": 881} {"train_loss": -5.517319679260254, "global_step": 37013, "epoch": 881} {"train_loss": -5.655725479125977, "global_step": 37014, "epoch": 881} {"train_loss": -5.621260166168213, "global_step": 37015, "epoch": 881} {"train_loss": -5.536567687988281, "global_step": 37016, "epoch": 881} {"train_loss": -5.588128089904785, "global_step": 37017, "epoch": 881} {"train_loss": -5.53296422958374, "global_step": 37018, "epoch": 881} {"train_loss": -5.605040550231934, "global_step": 37019, "epoch": 881} {"train_loss": -5.590687274932861, "global_step": 37020, "epoch": 881} {"train_loss": -5.484270095825195, "global_step": 37021, "epoch": 881} {"train_loss": -5.566102981567383, "global_step": 37022, "epoch": 881} {"train_loss": -5.550703525543213, "global_step": 37023, "epoch": 881} {"train_loss": -5.458696365356445, "global_step": 37024, "epoch": 881} {"train_loss": -5.715234756469727, "global_step": 37025, "epoch": 881} {"train_loss": -5.509858131408691, "global_step": 37026, "epoch": 881} {"train_loss": -5.4933600425720215, "global_step": 37027, "epoch": 881} {"train_loss": -5.6479010581970215, "global_step": 37028, "epoch": 881} {"train_loss": -5.6493682861328125, "global_step": 37029, "epoch": 881} {"train_loss": -5.548070907592773, "global_step": 37030, "epoch": 881} {"train_loss": -5.623593330383301, "global_step": 37031, "epoch": 881} {"train_loss": -5.713451385498047, "global_step": 37032, "epoch": 881} {"train_loss": -5.535239219665527, "global_step": 37033, "epoch": 881} {"train_loss": -5.523766040802002, "global_step": 37034, "epoch": 881} {"train_loss": -5.536911964416504, "global_step": 37035, "epoch": 881} {"train_loss": -5.594701766967773, "global_step": 37036, "epoch": 881} {"train_loss": -5.3944292068481445, "global_step": 37037, "epoch": 881} {"train_loss": -5.473727703094482, "global_step": 37038, "epoch": 881} {"train_loss": -5.460651874542236, "global_step": 37039, "epoch": 881} {"train_loss": -5.516323089599609, "global_step": 37040, "epoch": 881} {"train_loss": -5.650940895080566, "global_step": 37041, "epoch": 881} {"train_loss": -5.471538543701172, "global_step": 37042, "epoch": 881} {"train_loss": -5.558022703443255, "global_step": 37043, "epoch": 881, "val_loss": 74205.8359375} {"train_loss": -5.753684043884277, "global_step": 37044, "epoch": 882} {"train_loss": -5.3114519119262695, "global_step": 37045, "epoch": 882} {"train_loss": -5.657846927642822, "global_step": 37046, "epoch": 882} {"train_loss": -5.499463081359863, "global_step": 37047, "epoch": 882} {"train_loss": -5.582951545715332, "global_step": 37048, "epoch": 882} {"train_loss": -5.678853988647461, "global_step": 37049, "epoch": 882} {"train_loss": -5.407520294189453, "global_step": 37050, "epoch": 882} {"train_loss": -5.6026506423950195, "global_step": 37051, "epoch": 882} {"train_loss": -5.52081298828125, "global_step": 37052, "epoch": 882} {"train_loss": -5.57088565826416, "global_step": 37053, "epoch": 882} {"train_loss": -5.573341369628906, "global_step": 37054, "epoch": 882} {"train_loss": -5.402597427368164, "global_step": 37055, "epoch": 882} {"train_loss": -5.471734046936035, "global_step": 37056, "epoch": 882} {"train_loss": -5.604811191558838, "global_step": 37057, "epoch": 882} {"train_loss": -5.607187271118164, "global_step": 37058, "epoch": 882} {"train_loss": -5.393401622772217, "global_step": 37059, "epoch": 882} {"train_loss": -5.597317695617676, "global_step": 37060, "epoch": 882} {"train_loss": -5.550870895385742, "global_step": 37061, "epoch": 882} {"train_loss": -5.589295387268066, "global_step": 37062, "epoch": 882} {"train_loss": -5.574341773986816, "global_step": 37063, "epoch": 882} {"train_loss": -5.502429008483887, "global_step": 37064, "epoch": 882} {"train_loss": -5.559317588806152, "global_step": 37065, "epoch": 882} {"train_loss": -5.619963645935059, "global_step": 37066, "epoch": 882} {"train_loss": -5.602541923522949, "global_step": 37067, "epoch": 882} {"train_loss": -5.534862518310547, "global_step": 37068, "epoch": 882} {"train_loss": -5.647993087768555, "global_step": 37069, "epoch": 882} {"train_loss": -5.570620536804199, "global_step": 37070, "epoch": 882} {"train_loss": -5.644524574279785, "global_step": 37071, "epoch": 882} {"train_loss": -5.5821146965026855, "global_step": 37072, "epoch": 882} {"train_loss": -5.591053485870361, "global_step": 37073, "epoch": 882} {"train_loss": -5.592144012451172, "global_step": 37074, "epoch": 882} {"train_loss": -5.444480895996094, "global_step": 37075, "epoch": 882} {"train_loss": -5.591411113739014, "global_step": 37076, "epoch": 882} {"train_loss": -5.5357441902160645, "global_step": 37077, "epoch": 882} {"train_loss": -5.674991130828857, "global_step": 37078, "epoch": 882} {"train_loss": -5.669217586517334, "global_step": 37079, "epoch": 882} {"train_loss": -5.603400230407715, "global_step": 37080, "epoch": 882} {"train_loss": -5.711939811706543, "global_step": 37081, "epoch": 882} {"train_loss": -5.67085075378418, "global_step": 37082, "epoch": 882} {"train_loss": -5.5718159675598145, "global_step": 37083, "epoch": 882} {"train_loss": -5.529356956481934, "global_step": 37084, "epoch": 882} {"train_loss": -5.572858674185617, "global_step": 37085, "epoch": 882, "val_loss": 73750.234375} {"train_loss": -5.590975284576416, "global_step": 37086, "epoch": 883} {"train_loss": -5.678639888763428, "global_step": 37087, "epoch": 883} {"train_loss": -5.635631084442139, "global_step": 37088, "epoch": 883} {"train_loss": -5.5997419357299805, "global_step": 37089, "epoch": 883} {"train_loss": -5.741029262542725, "global_step": 37090, "epoch": 883} {"train_loss": -5.60247802734375, "global_step": 37091, "epoch": 883} {"train_loss": -5.56445837020874, "global_step": 37092, "epoch": 883} {"train_loss": -5.642421722412109, "global_step": 37093, "epoch": 883} {"train_loss": -5.581947326660156, "global_step": 37094, "epoch": 883} {"train_loss": -5.5536394119262695, "global_step": 37095, "epoch": 883} {"train_loss": -5.592693328857422, "global_step": 37096, "epoch": 883} {"train_loss": -5.555363178253174, "global_step": 37097, "epoch": 883} {"train_loss": -5.419565677642822, "global_step": 37098, "epoch": 883} {"train_loss": -5.6306610107421875, "global_step": 37099, "epoch": 883} {"train_loss": -5.577315330505371, "global_step": 37100, "epoch": 883} {"train_loss": -5.594451904296875, "global_step": 37101, "epoch": 883} {"train_loss": -5.617003440856934, "global_step": 37102, "epoch": 883} {"train_loss": -5.538758277893066, "global_step": 37103, "epoch": 883} {"train_loss": -5.670930862426758, "global_step": 37104, "epoch": 883} {"train_loss": -5.667458534240723, "global_step": 37105, "epoch": 883} {"train_loss": -5.480118751525879, "global_step": 37106, "epoch": 883} {"train_loss": -5.46454381942749, "global_step": 37107, "epoch": 883} {"train_loss": -5.746769428253174, "global_step": 37108, "epoch": 883} {"train_loss": -5.626314163208008, "global_step": 37109, "epoch": 883} {"train_loss": -5.507625579833984, "global_step": 37110, "epoch": 883} {"train_loss": -5.534734725952148, "global_step": 37111, "epoch": 883} {"train_loss": -5.560639381408691, "global_step": 37112, "epoch": 883} {"train_loss": -5.555502891540527, "global_step": 37113, "epoch": 883} {"train_loss": -5.5073041915893555, "global_step": 37114, "epoch": 883} {"train_loss": -5.564324855804443, "global_step": 37115, "epoch": 883} {"train_loss": -5.546093463897705, "global_step": 37116, "epoch": 883} {"train_loss": -5.699902534484863, "global_step": 37117, "epoch": 883} {"train_loss": -5.5996551513671875, "global_step": 37118, "epoch": 883} {"train_loss": -5.559035778045654, "global_step": 37119, "epoch": 883} {"train_loss": -5.636292934417725, "global_step": 37120, "epoch": 883} {"train_loss": -5.553414344787598, "global_step": 37121, "epoch": 883} {"train_loss": -5.563591480255127, "global_step": 37122, "epoch": 883} {"train_loss": -5.605574607849121, "global_step": 37123, "epoch": 883} {"train_loss": -5.55856990814209, "global_step": 37124, "epoch": 883} {"train_loss": -5.526617050170898, "global_step": 37125, "epoch": 883} {"train_loss": -5.474191188812256, "global_step": 37126, "epoch": 883} {"train_loss": -5.582947004409063, "global_step": 37127, "epoch": 883, "val_loss": 73541.21875} {"train_loss": -5.612082004547119, "global_step": 37128, "epoch": 884} {"train_loss": -5.513690948486328, "global_step": 37129, "epoch": 884} {"train_loss": -5.648373603820801, "global_step": 37130, "epoch": 884} {"train_loss": -5.659595489501953, "global_step": 37131, "epoch": 884} {"train_loss": -5.534160614013672, "global_step": 37132, "epoch": 884} {"train_loss": -5.544069766998291, "global_step": 37133, "epoch": 884} {"train_loss": -5.673793315887451, "global_step": 37134, "epoch": 884} {"train_loss": -5.5661115646362305, "global_step": 37135, "epoch": 884} {"train_loss": -5.730477333068848, "global_step": 37136, "epoch": 884} {"train_loss": -5.3898701667785645, "global_step": 37137, "epoch": 884} {"train_loss": -5.5420708656311035, "global_step": 37138, "epoch": 884} {"train_loss": -5.653291702270508, "global_step": 37139, "epoch": 884} {"train_loss": -5.555545330047607, "global_step": 37140, "epoch": 884} {"train_loss": -5.43281364440918, "global_step": 37141, "epoch": 884} {"train_loss": -5.561361789703369, "global_step": 37142, "epoch": 884} {"train_loss": -5.403964996337891, "global_step": 37143, "epoch": 884} {"train_loss": -5.633821487426758, "global_step": 37144, "epoch": 884} {"train_loss": -5.61824369430542, "global_step": 37145, "epoch": 884} {"train_loss": -5.316690921783447, "global_step": 37146, "epoch": 884} {"train_loss": -5.48341178894043, "global_step": 37147, "epoch": 884} {"train_loss": -5.437748432159424, "global_step": 37148, "epoch": 884} {"train_loss": -5.528191566467285, "global_step": 37149, "epoch": 884} {"train_loss": -5.591923713684082, "global_step": 37150, "epoch": 884} {"train_loss": -5.429083824157715, "global_step": 37151, "epoch": 884} {"train_loss": -5.518576622009277, "global_step": 37152, "epoch": 884} {"train_loss": -5.485439300537109, "global_step": 37153, "epoch": 884} {"train_loss": -5.551494598388672, "global_step": 37154, "epoch": 884} {"train_loss": -5.5008697509765625, "global_step": 37155, "epoch": 884} {"train_loss": -5.582580089569092, "global_step": 37156, "epoch": 884} {"train_loss": -5.5508341789245605, "global_step": 37157, "epoch": 884} {"train_loss": -5.492889404296875, "global_step": 37158, "epoch": 884} {"train_loss": -5.481082916259766, "global_step": 37159, "epoch": 884} {"train_loss": -5.5408477783203125, "global_step": 37160, "epoch": 884} {"train_loss": -5.5435471534729, "global_step": 37161, "epoch": 884} {"train_loss": -5.426936149597168, "global_step": 37162, "epoch": 884} {"train_loss": -5.633704662322998, "global_step": 37163, "epoch": 884} {"train_loss": -5.420504570007324, "global_step": 37164, "epoch": 884} {"train_loss": -5.607268333435059, "global_step": 37165, "epoch": 884} {"train_loss": -5.6341753005981445, "global_step": 37166, "epoch": 884} {"train_loss": -5.511600494384766, "global_step": 37167, "epoch": 884} {"train_loss": -5.644326210021973, "global_step": 37168, "epoch": 884} {"train_loss": -5.541993175234113, "global_step": 37169, "epoch": 884, "val_loss": 74859.4765625} {"train_loss": -5.526028633117676, "global_step": 37170, "epoch": 885} {"train_loss": -5.516229629516602, "global_step": 37171, "epoch": 885} {"train_loss": -5.521134376525879, "global_step": 37172, "epoch": 885} {"train_loss": -5.557029724121094, "global_step": 37173, "epoch": 885} {"train_loss": -5.582700729370117, "global_step": 37174, "epoch": 885} {"train_loss": -5.6208391189575195, "global_step": 37175, "epoch": 885} {"train_loss": -5.61752986907959, "global_step": 37176, "epoch": 885} {"train_loss": -5.433421611785889, "global_step": 37177, "epoch": 885} {"train_loss": -5.462059497833252, "global_step": 37178, "epoch": 885} {"train_loss": -5.514770984649658, "global_step": 37179, "epoch": 885} {"train_loss": -5.498496055603027, "global_step": 37180, "epoch": 885} {"train_loss": -5.404023170471191, "global_step": 37181, "epoch": 885} {"train_loss": -5.666820526123047, "global_step": 37182, "epoch": 885} {"train_loss": -5.501749038696289, "global_step": 37183, "epoch": 885} {"train_loss": -5.518329620361328, "global_step": 37184, "epoch": 885} {"train_loss": -5.663606643676758, "global_step": 37185, "epoch": 885} {"train_loss": -5.568943977355957, "global_step": 37186, "epoch": 885} {"train_loss": -5.549088478088379, "global_step": 37187, "epoch": 885} {"train_loss": -5.5886125564575195, "global_step": 37188, "epoch": 885} {"train_loss": -5.5018720626831055, "global_step": 37189, "epoch": 885} {"train_loss": -5.541698455810547, "global_step": 37190, "epoch": 885} {"train_loss": -5.503313064575195, "global_step": 37191, "epoch": 885} {"train_loss": -5.554883003234863, "global_step": 37192, "epoch": 885} {"train_loss": -5.500904560089111, "global_step": 37193, "epoch": 885} {"train_loss": -5.471397399902344, "global_step": 37194, "epoch": 885} {"train_loss": -5.66226863861084, "global_step": 37195, "epoch": 885} {"train_loss": -5.610086441040039, "global_step": 37196, "epoch": 885} {"train_loss": -5.6745500564575195, "global_step": 37197, "epoch": 885} {"train_loss": -5.620170593261719, "global_step": 37198, "epoch": 885} {"train_loss": -5.5923357009887695, "global_step": 37199, "epoch": 885} {"train_loss": -5.610830307006836, "global_step": 37200, "epoch": 885} {"train_loss": -5.611630439758301, "global_step": 37201, "epoch": 885} {"train_loss": -5.579233169555664, "global_step": 37202, "epoch": 885} {"train_loss": -5.779402732849121, "global_step": 37203, "epoch": 885} {"train_loss": -5.663508892059326, "global_step": 37204, "epoch": 885} {"train_loss": -5.452336311340332, "global_step": 37205, "epoch": 885} {"train_loss": -5.569271087646484, "global_step": 37206, "epoch": 885} {"train_loss": -5.732327461242676, "global_step": 37207, "epoch": 885} {"train_loss": -5.8143510818481445, "global_step": 37208, "epoch": 885} {"train_loss": -5.679070472717285, "global_step": 37209, "epoch": 885} {"train_loss": -5.763391017913818, "global_step": 37210, "epoch": 885} {"train_loss": -5.577984071913219, "global_step": 37211, "epoch": 885, "val_loss": 73888.4140625} {"train_loss": -5.539569854736328, "global_step": 37212, "epoch": 886} {"train_loss": -5.735462188720703, "global_step": 37213, "epoch": 886} {"train_loss": -5.641294956207275, "global_step": 37214, "epoch": 886} {"train_loss": -5.546718120574951, "global_step": 37215, "epoch": 886} {"train_loss": -5.583454132080078, "global_step": 37216, "epoch": 886} {"train_loss": -5.656825065612793, "global_step": 37217, "epoch": 886} {"train_loss": -5.637172222137451, "global_step": 37218, "epoch": 886} {"train_loss": -5.46932315826416, "global_step": 37219, "epoch": 886} {"train_loss": -5.531445503234863, "global_step": 37220, "epoch": 886} {"train_loss": -5.755169868469238, "global_step": 37221, "epoch": 886} {"train_loss": -5.508523941040039, "global_step": 37222, "epoch": 886} {"train_loss": -5.4571380615234375, "global_step": 37223, "epoch": 886} {"train_loss": -5.704840660095215, "global_step": 37224, "epoch": 886} {"train_loss": -5.525599002838135, "global_step": 37225, "epoch": 886} {"train_loss": -5.679408073425293, "global_step": 37226, "epoch": 886} {"train_loss": -5.622045993804932, "global_step": 37227, "epoch": 886} {"train_loss": -5.602314472198486, "global_step": 37228, "epoch": 886} {"train_loss": -5.587955474853516, "global_step": 37229, "epoch": 886} {"train_loss": -5.726556301116943, "global_step": 37230, "epoch": 886} {"train_loss": -5.510502338409424, "global_step": 37231, "epoch": 886} {"train_loss": -5.6261773109436035, "global_step": 37232, "epoch": 886} {"train_loss": -5.61734676361084, "global_step": 37233, "epoch": 886} {"train_loss": -5.544284820556641, "global_step": 37234, "epoch": 886} {"train_loss": -5.504819869995117, "global_step": 37235, "epoch": 886} {"train_loss": -5.60854434967041, "global_step": 37236, "epoch": 886} {"train_loss": -5.610581398010254, "global_step": 37237, "epoch": 886} {"train_loss": -5.515924453735352, "global_step": 37238, "epoch": 886} {"train_loss": -5.588438034057617, "global_step": 37239, "epoch": 886} {"train_loss": -5.619778156280518, "global_step": 37240, "epoch": 886} {"train_loss": -5.4476141929626465, "global_step": 37241, "epoch": 886} {"train_loss": -5.732668876647949, "global_step": 37242, "epoch": 886} {"train_loss": -5.646263599395752, "global_step": 37243, "epoch": 886} {"train_loss": -5.503178596496582, "global_step": 37244, "epoch": 886} {"train_loss": -5.563014030456543, "global_step": 37245, "epoch": 886} {"train_loss": -5.550481796264648, "global_step": 37246, "epoch": 886} {"train_loss": -5.489518165588379, "global_step": 37247, "epoch": 886} {"train_loss": -5.564513206481934, "global_step": 37248, "epoch": 886} {"train_loss": -5.490459442138672, "global_step": 37249, "epoch": 886} {"train_loss": -5.618531227111816, "global_step": 37250, "epoch": 886} {"train_loss": -5.483857154846191, "global_step": 37251, "epoch": 886} {"train_loss": -5.529910087585449, "global_step": 37252, "epoch": 886} {"train_loss": -5.583551622572399, "global_step": 37253, "epoch": 886, "val_loss": 73976.8828125} {"train_loss": -5.579026222229004, "global_step": 37254, "epoch": 887} {"train_loss": -5.578803062438965, "global_step": 37255, "epoch": 887} {"train_loss": -5.596951484680176, "global_step": 37256, "epoch": 887} {"train_loss": -5.680468559265137, "global_step": 37257, "epoch": 887} {"train_loss": -5.567816734313965, "global_step": 37258, "epoch": 887} {"train_loss": -5.462085723876953, "global_step": 37259, "epoch": 887} {"train_loss": -5.570285320281982, "global_step": 37260, "epoch": 887} {"train_loss": -5.628535270690918, "global_step": 37261, "epoch": 887} {"train_loss": -5.547774314880371, "global_step": 37262, "epoch": 887} {"train_loss": -5.58723783493042, "global_step": 37263, "epoch": 887} {"train_loss": -5.526462554931641, "global_step": 37264, "epoch": 887} {"train_loss": -5.557764530181885, "global_step": 37265, "epoch": 887} {"train_loss": -5.599410057067871, "global_step": 37266, "epoch": 887} {"train_loss": -5.604832172393799, "global_step": 37267, "epoch": 887} {"train_loss": -5.633513927459717, "global_step": 37268, "epoch": 887} {"train_loss": -5.515085697174072, "global_step": 37269, "epoch": 887} {"train_loss": -5.5712080001831055, "global_step": 37270, "epoch": 887} {"train_loss": -5.652233123779297, "global_step": 37271, "epoch": 887} {"train_loss": -5.479876518249512, "global_step": 37272, "epoch": 887} {"train_loss": -5.656265735626221, "global_step": 37273, "epoch": 887} {"train_loss": -5.630170822143555, "global_step": 37274, "epoch": 887} {"train_loss": -5.632378578186035, "global_step": 37275, "epoch": 887} {"train_loss": -5.612319469451904, "global_step": 37276, "epoch": 887} {"train_loss": -5.655416488647461, "global_step": 37277, "epoch": 887} {"train_loss": -5.637550354003906, "global_step": 37278, "epoch": 887} {"train_loss": -5.4983062744140625, "global_step": 37279, "epoch": 887} {"train_loss": -5.618544578552246, "global_step": 37280, "epoch": 887} {"train_loss": -5.741358757019043, "global_step": 37281, "epoch": 887} {"train_loss": -5.661629676818848, "global_step": 37282, "epoch": 887} {"train_loss": -5.543565273284912, "global_step": 37283, "epoch": 887} {"train_loss": -5.627906799316406, "global_step": 37284, "epoch": 887} {"train_loss": -5.592074394226074, "global_step": 37285, "epoch": 887} {"train_loss": -5.5638017654418945, "global_step": 37286, "epoch": 887} {"train_loss": -5.53310489654541, "global_step": 37287, "epoch": 887} {"train_loss": -5.621594429016113, "global_step": 37288, "epoch": 887} {"train_loss": -5.517606735229492, "global_step": 37289, "epoch": 887} {"train_loss": -5.61870813369751, "global_step": 37290, "epoch": 887} {"train_loss": -5.644345283508301, "global_step": 37291, "epoch": 887} {"train_loss": -5.618971824645996, "global_step": 37292, "epoch": 887} {"train_loss": -5.54337739944458, "global_step": 37293, "epoch": 887} {"train_loss": -5.560931205749512, "global_step": 37294, "epoch": 887} {"train_loss": -5.591387237821307, "global_step": 37295, "epoch": 887, "val_loss": 73886.203125} {"train_loss": -5.599985122680664, "global_step": 37296, "epoch": 888} {"train_loss": -5.635256767272949, "global_step": 37297, "epoch": 888} {"train_loss": -5.575982093811035, "global_step": 37298, "epoch": 888} {"train_loss": -5.460829257965088, "global_step": 37299, "epoch": 888} {"train_loss": -5.589539527893066, "global_step": 37300, "epoch": 888} {"train_loss": -5.578479766845703, "global_step": 37301, "epoch": 888} {"train_loss": -5.600193977355957, "global_step": 37302, "epoch": 888} {"train_loss": -5.542971611022949, "global_step": 37303, "epoch": 888} {"train_loss": -5.641560077667236, "global_step": 37304, "epoch": 888} {"train_loss": -5.705747604370117, "global_step": 37305, "epoch": 888} {"train_loss": -5.623554229736328, "global_step": 37306, "epoch": 888} {"train_loss": -5.510620594024658, "global_step": 37307, "epoch": 888} {"train_loss": -5.496307373046875, "global_step": 37308, "epoch": 888} {"train_loss": -5.5586652755737305, "global_step": 37309, "epoch": 888} {"train_loss": -5.61976432800293, "global_step": 37310, "epoch": 888} {"train_loss": -5.611468315124512, "global_step": 37311, "epoch": 888} {"train_loss": -5.568296432495117, "global_step": 37312, "epoch": 888} {"train_loss": -5.593749046325684, "global_step": 37313, "epoch": 888} {"train_loss": -5.56644344329834, "global_step": 37314, "epoch": 888} {"train_loss": -5.558523178100586, "global_step": 37315, "epoch": 888} {"train_loss": -5.636775016784668, "global_step": 37316, "epoch": 888} {"train_loss": -5.565323829650879, "global_step": 37317, "epoch": 888} {"train_loss": -5.590224742889404, "global_step": 37318, "epoch": 888} {"train_loss": -5.590847969055176, "global_step": 37319, "epoch": 888} {"train_loss": -5.702357769012451, "global_step": 37320, "epoch": 888} {"train_loss": -5.606968879699707, "global_step": 37321, "epoch": 888} {"train_loss": -5.726630210876465, "global_step": 37322, "epoch": 888} {"train_loss": -5.543972492218018, "global_step": 37323, "epoch": 888} {"train_loss": -5.663154602050781, "global_step": 37324, "epoch": 888} {"train_loss": -5.608412265777588, "global_step": 37325, "epoch": 888} {"train_loss": -5.580855846405029, "global_step": 37326, "epoch": 888} {"train_loss": -5.53572940826416, "global_step": 37327, "epoch": 888} {"train_loss": -5.617012977600098, "global_step": 37328, "epoch": 888} {"train_loss": -5.646649360656738, "global_step": 37329, "epoch": 888} {"train_loss": -5.6925859451293945, "global_step": 37330, "epoch": 888} {"train_loss": -5.616968631744385, "global_step": 37331, "epoch": 888} {"train_loss": -5.66292667388916, "global_step": 37332, "epoch": 888} {"train_loss": -5.619964122772217, "global_step": 37333, "epoch": 888} {"train_loss": -5.5202317237854, "global_step": 37334, "epoch": 888} {"train_loss": -5.677992820739746, "global_step": 37335, "epoch": 888} {"train_loss": -5.712100028991699, "global_step": 37336, "epoch": 888} {"train_loss": -5.603194588706607, "global_step": 37337, "epoch": 888, "val_loss": 73904.34375} {"train_loss": -5.541730880737305, "global_step": 37338, "epoch": 889} {"train_loss": -5.6351494789123535, "global_step": 37339, "epoch": 889} {"train_loss": -5.432143211364746, "global_step": 37340, "epoch": 889} {"train_loss": -5.569145202636719, "global_step": 37341, "epoch": 889} {"train_loss": -5.523008346557617, "global_step": 37342, "epoch": 889} {"train_loss": -5.513996601104736, "global_step": 37343, "epoch": 889} {"train_loss": -5.538611888885498, "global_step": 37344, "epoch": 889} {"train_loss": -5.5270891189575195, "global_step": 37345, "epoch": 889} {"train_loss": -5.499716758728027, "global_step": 37346, "epoch": 889} {"train_loss": -5.593698024749756, "global_step": 37347, "epoch": 889} {"train_loss": -5.492707252502441, "global_step": 37348, "epoch": 889} {"train_loss": -5.6337738037109375, "global_step": 37349, "epoch": 889} {"train_loss": -5.427434921264648, "global_step": 37350, "epoch": 889} {"train_loss": -5.534760475158691, "global_step": 37351, "epoch": 889} {"train_loss": -5.506600856781006, "global_step": 37352, "epoch": 889} {"train_loss": -5.611645698547363, "global_step": 37353, "epoch": 889} {"train_loss": -5.725783348083496, "global_step": 37354, "epoch": 889} {"train_loss": -5.526944637298584, "global_step": 37355, "epoch": 889} {"train_loss": -5.615978240966797, "global_step": 37356, "epoch": 889} {"train_loss": -5.561267852783203, "global_step": 37357, "epoch": 889} {"train_loss": -5.641488075256348, "global_step": 37358, "epoch": 889} {"train_loss": -5.491671562194824, "global_step": 37359, "epoch": 889} {"train_loss": -5.524562835693359, "global_step": 37360, "epoch": 889} {"train_loss": -5.650189399719238, "global_step": 37361, "epoch": 889} {"train_loss": -5.534694194793701, "global_step": 37362, "epoch": 889} {"train_loss": -5.568939208984375, "global_step": 37363, "epoch": 889} {"train_loss": -5.6990509033203125, "global_step": 37364, "epoch": 889} {"train_loss": -5.426281452178955, "global_step": 37365, "epoch": 889} {"train_loss": -5.782042503356934, "global_step": 37366, "epoch": 889} {"train_loss": -5.489016532897949, "global_step": 37367, "epoch": 889} {"train_loss": -5.5111236572265625, "global_step": 37368, "epoch": 889} {"train_loss": -5.592925071716309, "global_step": 37369, "epoch": 889} {"train_loss": -5.614461898803711, "global_step": 37370, "epoch": 889} {"train_loss": -5.655117988586426, "global_step": 37371, "epoch": 889} {"train_loss": -5.586509704589844, "global_step": 37372, "epoch": 889} {"train_loss": -5.734936714172363, "global_step": 37373, "epoch": 889} {"train_loss": -5.585082054138184, "global_step": 37374, "epoch": 889} {"train_loss": -5.519434928894043, "global_step": 37375, "epoch": 889} {"train_loss": -5.590590000152588, "global_step": 37376, "epoch": 889} {"train_loss": -5.65622615814209, "global_step": 37377, "epoch": 889} {"train_loss": -5.591503143310547, "global_step": 37378, "epoch": 889} {"train_loss": -5.573899144218082, "global_step": 37379, "epoch": 889, "val_loss": 74727.0078125} {"train_loss": -5.440362930297852, "global_step": 37380, "epoch": 890} {"train_loss": -5.588760852813721, "global_step": 37381, "epoch": 890} {"train_loss": -5.549416542053223, "global_step": 37382, "epoch": 890} {"train_loss": -5.456900596618652, "global_step": 37383, "epoch": 890} {"train_loss": -5.50557804107666, "global_step": 37384, "epoch": 890} {"train_loss": -5.585678577423096, "global_step": 37385, "epoch": 890} {"train_loss": -5.518241882324219, "global_step": 37386, "epoch": 890} {"train_loss": -5.713381767272949, "global_step": 37387, "epoch": 890} {"train_loss": -5.7608442306518555, "global_step": 37388, "epoch": 890} {"train_loss": -5.584157943725586, "global_step": 37389, "epoch": 890} {"train_loss": -5.519863605499268, "global_step": 37390, "epoch": 890} {"train_loss": -5.653213977813721, "global_step": 37391, "epoch": 890} {"train_loss": -5.599904537200928, "global_step": 37392, "epoch": 890} {"train_loss": -5.630136489868164, "global_step": 37393, "epoch": 890} {"train_loss": -5.666547775268555, "global_step": 37394, "epoch": 890} {"train_loss": -5.583097457885742, "global_step": 37395, "epoch": 890} {"train_loss": -5.503802299499512, "global_step": 37396, "epoch": 890} {"train_loss": -5.668064594268799, "global_step": 37397, "epoch": 890} {"train_loss": -5.604559898376465, "global_step": 37398, "epoch": 890} {"train_loss": -5.573248863220215, "global_step": 37399, "epoch": 890} {"train_loss": -5.638063430786133, "global_step": 37400, "epoch": 890} {"train_loss": -5.596603870391846, "global_step": 37401, "epoch": 890} {"train_loss": -5.68202018737793, "global_step": 37402, "epoch": 890} {"train_loss": -5.607872009277344, "global_step": 37403, "epoch": 890} {"train_loss": -5.565534591674805, "global_step": 37404, "epoch": 890} {"train_loss": -5.53653621673584, "global_step": 37405, "epoch": 890} {"train_loss": -5.673806667327881, "global_step": 37406, "epoch": 890} {"train_loss": -5.548513889312744, "global_step": 37407, "epoch": 890} {"train_loss": -5.542446136474609, "global_step": 37408, "epoch": 890} {"train_loss": -5.60407829284668, "global_step": 37409, "epoch": 890} {"train_loss": -5.6614556312561035, "global_step": 37410, "epoch": 890} {"train_loss": -5.58462381362915, "global_step": 37411, "epoch": 890} {"train_loss": -5.520758152008057, "global_step": 37412, "epoch": 890} {"train_loss": -5.53883171081543, "global_step": 37413, "epoch": 890} {"train_loss": -5.5471038818359375, "global_step": 37414, "epoch": 890} {"train_loss": -5.64802360534668, "global_step": 37415, "epoch": 890} {"train_loss": -5.691025257110596, "global_step": 37416, "epoch": 890} {"train_loss": -5.504250526428223, "global_step": 37417, "epoch": 890} {"train_loss": -5.511099338531494, "global_step": 37418, "epoch": 890} {"train_loss": -5.476280212402344, "global_step": 37419, "epoch": 890} {"train_loss": -5.478191375732422, "global_step": 37420, "epoch": 890} {"train_loss": -5.582443032945905, "global_step": 37421, "epoch": 890, "val_loss": 74439.28125} {"train_loss": -5.509953498840332, "global_step": 37422, "epoch": 891} {"train_loss": -5.531224250793457, "global_step": 37423, "epoch": 891} {"train_loss": -5.469947814941406, "global_step": 37424, "epoch": 891} {"train_loss": -5.531331539154053, "global_step": 37425, "epoch": 891} {"train_loss": -5.491672515869141, "global_step": 37426, "epoch": 891} {"train_loss": -5.66229248046875, "global_step": 37427, "epoch": 891} {"train_loss": -5.620661735534668, "global_step": 37428, "epoch": 891} {"train_loss": -5.59077262878418, "global_step": 37429, "epoch": 891} {"train_loss": -5.519301891326904, "global_step": 37430, "epoch": 891} {"train_loss": -5.587718486785889, "global_step": 37431, "epoch": 891} {"train_loss": -5.567599773406982, "global_step": 37432, "epoch": 891} {"train_loss": -5.499448299407959, "global_step": 37433, "epoch": 891} {"train_loss": -5.498682975769043, "global_step": 37434, "epoch": 891} {"train_loss": -5.530684471130371, "global_step": 37435, "epoch": 891} {"train_loss": -5.537266731262207, "global_step": 37436, "epoch": 891} {"train_loss": -5.590047836303711, "global_step": 37437, "epoch": 891} {"train_loss": -5.741457939147949, "global_step": 37438, "epoch": 891} {"train_loss": -5.530925273895264, "global_step": 37439, "epoch": 891} {"train_loss": -5.579887390136719, "global_step": 37440, "epoch": 891} {"train_loss": -5.595328330993652, "global_step": 37441, "epoch": 891} {"train_loss": -5.605842113494873, "global_step": 37442, "epoch": 891} {"train_loss": -5.57083797454834, "global_step": 37443, "epoch": 891} {"train_loss": -5.585590362548828, "global_step": 37444, "epoch": 891} {"train_loss": -5.598291397094727, "global_step": 37445, "epoch": 891} {"train_loss": -5.599151611328125, "global_step": 37446, "epoch": 891} {"train_loss": -5.551342487335205, "global_step": 37447, "epoch": 891} {"train_loss": -5.663473606109619, "global_step": 37448, "epoch": 891} {"train_loss": -5.65535831451416, "global_step": 37449, "epoch": 891} {"train_loss": -5.481408596038818, "global_step": 37450, "epoch": 891} {"train_loss": -5.710191249847412, "global_step": 37451, "epoch": 891} {"train_loss": -5.653775215148926, "global_step": 37452, "epoch": 891} {"train_loss": -5.638172149658203, "global_step": 37453, "epoch": 891} {"train_loss": -5.647727966308594, "global_step": 37454, "epoch": 891} {"train_loss": -5.601439476013184, "global_step": 37455, "epoch": 891} {"train_loss": -5.47023868560791, "global_step": 37456, "epoch": 891} {"train_loss": -5.551976203918457, "global_step": 37457, "epoch": 891} {"train_loss": -5.594605445861816, "global_step": 37458, "epoch": 891} {"train_loss": -5.611894607543945, "global_step": 37459, "epoch": 891} {"train_loss": -5.647412300109863, "global_step": 37460, "epoch": 891} {"train_loss": -5.611569404602051, "global_step": 37461, "epoch": 891} {"train_loss": -5.579825401306152, "global_step": 37462, "epoch": 891} {"train_loss": -5.582805962789626, "global_step": 37463, "epoch": 891, "val_loss": 73906.3046875} {"train_loss": -5.648594856262207, "global_step": 37464, "epoch": 892} {"train_loss": -5.561568260192871, "global_step": 37465, "epoch": 892} {"train_loss": -5.581969261169434, "global_step": 37466, "epoch": 892} {"train_loss": -5.532900333404541, "global_step": 37467, "epoch": 892} {"train_loss": -5.683646202087402, "global_step": 37468, "epoch": 892} {"train_loss": -5.419780731201172, "global_step": 37469, "epoch": 892} {"train_loss": -5.584486961364746, "global_step": 37470, "epoch": 892} {"train_loss": -5.434195518493652, "global_step": 37471, "epoch": 892} {"train_loss": -5.487050533294678, "global_step": 37472, "epoch": 892} {"train_loss": -5.627681255340576, "global_step": 37473, "epoch": 892} {"train_loss": -5.463994026184082, "global_step": 37474, "epoch": 892} {"train_loss": -5.539680480957031, "global_step": 37475, "epoch": 892} {"train_loss": -5.6365814208984375, "global_step": 37476, "epoch": 892} {"train_loss": -5.582849502563477, "global_step": 37477, "epoch": 892} {"train_loss": -5.517921447753906, "global_step": 37478, "epoch": 892} {"train_loss": -5.552397727966309, "global_step": 37479, "epoch": 892} {"train_loss": -5.665965557098389, "global_step": 37480, "epoch": 892} {"train_loss": -5.5473222732543945, "global_step": 37481, "epoch": 892} {"train_loss": -5.6078200340271, "global_step": 37482, "epoch": 892} {"train_loss": -5.683684349060059, "global_step": 37483, "epoch": 892} {"train_loss": -5.6595306396484375, "global_step": 37484, "epoch": 892} {"train_loss": -5.624934196472168, "global_step": 37485, "epoch": 892} {"train_loss": -5.562260150909424, "global_step": 37486, "epoch": 892} {"train_loss": -5.547805309295654, "global_step": 37487, "epoch": 892} {"train_loss": -5.547504425048828, "global_step": 37488, "epoch": 892} {"train_loss": -5.555553436279297, "global_step": 37489, "epoch": 892} {"train_loss": -5.66146183013916, "global_step": 37490, "epoch": 892} {"train_loss": -5.465376377105713, "global_step": 37491, "epoch": 892} {"train_loss": -5.642482757568359, "global_step": 37492, "epoch": 892} {"train_loss": -5.5939621925354, "global_step": 37493, "epoch": 892} {"train_loss": -5.653678894042969, "global_step": 37494, "epoch": 892} {"train_loss": -5.707468509674072, "global_step": 37495, "epoch": 892} {"train_loss": -5.479520797729492, "global_step": 37496, "epoch": 892} {"train_loss": -5.402589797973633, "global_step": 37497, "epoch": 892} {"train_loss": -5.5283002853393555, "global_step": 37498, "epoch": 892} {"train_loss": -5.681368350982666, "global_step": 37499, "epoch": 892} {"train_loss": -5.470082759857178, "global_step": 37500, "epoch": 892} {"train_loss": -5.562640190124512, "global_step": 37501, "epoch": 892} {"train_loss": -5.571819305419922, "global_step": 37502, "epoch": 892} {"train_loss": -5.554352760314941, "global_step": 37503, "epoch": 892} {"train_loss": -5.566256046295166, "global_step": 37504, "epoch": 892} {"train_loss": -5.569904259272984, "global_step": 37505, "epoch": 892, "val_loss": 74239.0390625} {"train_loss": -5.511101722717285, "global_step": 37506, "epoch": 893} {"train_loss": -5.626583576202393, "global_step": 37507, "epoch": 893} {"train_loss": -5.597060680389404, "global_step": 37508, "epoch": 893} {"train_loss": -5.683158874511719, "global_step": 37509, "epoch": 893} {"train_loss": -5.628460884094238, "global_step": 37510, "epoch": 893} {"train_loss": -5.569180488586426, "global_step": 37511, "epoch": 893} {"train_loss": -5.690272331237793, "global_step": 37512, "epoch": 893} {"train_loss": -5.557242393493652, "global_step": 37513, "epoch": 893} {"train_loss": -5.57036018371582, "global_step": 37514, "epoch": 893} {"train_loss": -5.6411027908325195, "global_step": 37515, "epoch": 893} {"train_loss": -5.548126220703125, "global_step": 37516, "epoch": 893} {"train_loss": -5.65766716003418, "global_step": 37517, "epoch": 893} {"train_loss": -5.642566680908203, "global_step": 37518, "epoch": 893} {"train_loss": -5.639077186584473, "global_step": 37519, "epoch": 893} {"train_loss": -5.57357120513916, "global_step": 37520, "epoch": 893} {"train_loss": -5.672934055328369, "global_step": 37521, "epoch": 893} {"train_loss": -5.555728912353516, "global_step": 37522, "epoch": 893} {"train_loss": -5.592035293579102, "global_step": 37523, "epoch": 893} {"train_loss": -5.467897891998291, "global_step": 37524, "epoch": 893} {"train_loss": -5.572935581207275, "global_step": 37525, "epoch": 893} {"train_loss": -5.524717330932617, "global_step": 37526, "epoch": 893} {"train_loss": -5.518398761749268, "global_step": 37527, "epoch": 893} {"train_loss": -5.6020073890686035, "global_step": 37528, "epoch": 893} {"train_loss": -5.628959655761719, "global_step": 37529, "epoch": 893} {"train_loss": -5.418940544128418, "global_step": 37530, "epoch": 893} {"train_loss": -5.572720527648926, "global_step": 37531, "epoch": 893} {"train_loss": -5.440284729003906, "global_step": 37532, "epoch": 893} {"train_loss": -5.367259502410889, "global_step": 37533, "epoch": 893} {"train_loss": -5.540414810180664, "global_step": 37534, "epoch": 893} {"train_loss": -5.4721174240112305, "global_step": 37535, "epoch": 893} {"train_loss": -5.511898994445801, "global_step": 37536, "epoch": 893} {"train_loss": -5.506328582763672, "global_step": 37537, "epoch": 893} {"train_loss": -5.506111145019531, "global_step": 37538, "epoch": 893} {"train_loss": -5.5693159103393555, "global_step": 37539, "epoch": 893} {"train_loss": -5.533071041107178, "global_step": 37540, "epoch": 893} {"train_loss": -5.546271800994873, "global_step": 37541, "epoch": 893} {"train_loss": -5.537630081176758, "global_step": 37542, "epoch": 893} {"train_loss": -5.566770076751709, "global_step": 37543, "epoch": 893} {"train_loss": -5.723587512969971, "global_step": 37544, "epoch": 893} {"train_loss": -5.549619674682617, "global_step": 37545, "epoch": 893} {"train_loss": -5.5684003829956055, "global_step": 37546, "epoch": 893} {"train_loss": -5.564948399861653, "global_step": 37547, "epoch": 893, "val_loss": 73552.390625} {"train_loss": -5.674358367919922, "global_step": 37548, "epoch": 894} {"train_loss": -5.470413684844971, "global_step": 37549, "epoch": 894} {"train_loss": -5.637255668640137, "global_step": 37550, "epoch": 894} {"train_loss": -5.5716753005981445, "global_step": 37551, "epoch": 894} {"train_loss": -5.623599529266357, "global_step": 37552, "epoch": 894} {"train_loss": -5.626026153564453, "global_step": 37553, "epoch": 894} {"train_loss": -5.613584518432617, "global_step": 37554, "epoch": 894} {"train_loss": -5.442441940307617, "global_step": 37555, "epoch": 894} {"train_loss": -5.712738990783691, "global_step": 37556, "epoch": 894} {"train_loss": -5.613816261291504, "global_step": 37557, "epoch": 894} {"train_loss": -5.538845539093018, "global_step": 37558, "epoch": 894} {"train_loss": -5.806265830993652, "global_step": 37559, "epoch": 894} {"train_loss": -5.588541030883789, "global_step": 37560, "epoch": 894} {"train_loss": -5.425632476806641, "global_step": 37561, "epoch": 894} {"train_loss": -5.662923336029053, "global_step": 37562, "epoch": 894} {"train_loss": -5.623572826385498, "global_step": 37563, "epoch": 894} {"train_loss": -5.601195335388184, "global_step": 37564, "epoch": 894} {"train_loss": -5.618462562561035, "global_step": 37565, "epoch": 894} {"train_loss": -5.684645652770996, "global_step": 37566, "epoch": 894} {"train_loss": -5.66648530960083, "global_step": 37567, "epoch": 894} {"train_loss": -5.548800468444824, "global_step": 37568, "epoch": 894} {"train_loss": -5.564915657043457, "global_step": 37569, "epoch": 894} {"train_loss": -5.58909273147583, "global_step": 37570, "epoch": 894} {"train_loss": -5.525677680969238, "global_step": 37571, "epoch": 894} {"train_loss": -5.558897018432617, "global_step": 37572, "epoch": 894} {"train_loss": -5.451005935668945, "global_step": 37573, "epoch": 894} {"train_loss": -5.582308769226074, "global_step": 37574, "epoch": 894} {"train_loss": -5.561629295349121, "global_step": 37575, "epoch": 894} {"train_loss": -5.7036309242248535, "global_step": 37576, "epoch": 894} {"train_loss": -5.581616401672363, "global_step": 37577, "epoch": 894} {"train_loss": -5.602783203125, "global_step": 37578, "epoch": 894} {"train_loss": -5.613620281219482, "global_step": 37579, "epoch": 894} {"train_loss": -5.438527584075928, "global_step": 37580, "epoch": 894} {"train_loss": -5.578568458557129, "global_step": 37581, "epoch": 894} {"train_loss": -5.679797172546387, "global_step": 37582, "epoch": 894} {"train_loss": -5.5636491775512695, "global_step": 37583, "epoch": 894} {"train_loss": -5.561593055725098, "global_step": 37584, "epoch": 894} {"train_loss": -5.441988468170166, "global_step": 37585, "epoch": 894} {"train_loss": -5.658069610595703, "global_step": 37586, "epoch": 894} {"train_loss": -5.523222923278809, "global_step": 37587, "epoch": 894} {"train_loss": -5.587070465087891, "global_step": 37588, "epoch": 894} {"train_loss": -5.587938331422352, "global_step": 37589, "epoch": 894, "val_loss": 73911.4140625} {"train_loss": -5.5704240798950195, "global_step": 37590, "epoch": 895} {"train_loss": -5.639627456665039, "global_step": 37591, "epoch": 895} {"train_loss": -5.581602573394775, "global_step": 37592, "epoch": 895} {"train_loss": -5.448155403137207, "global_step": 37593, "epoch": 895} {"train_loss": -5.631892204284668, "global_step": 37594, "epoch": 895} {"train_loss": -5.649812698364258, "global_step": 37595, "epoch": 895} {"train_loss": -5.46694803237915, "global_step": 37596, "epoch": 895} {"train_loss": -5.533103942871094, "global_step": 37597, "epoch": 895} {"train_loss": -5.747889041900635, "global_step": 37598, "epoch": 895} {"train_loss": -5.646849155426025, "global_step": 37599, "epoch": 895} {"train_loss": -5.539070129394531, "global_step": 37600, "epoch": 895} {"train_loss": -5.427267551422119, "global_step": 37601, "epoch": 895} {"train_loss": -5.5550456047058105, "global_step": 37602, "epoch": 895} {"train_loss": -5.627957344055176, "global_step": 37603, "epoch": 895} {"train_loss": -5.635626792907715, "global_step": 37604, "epoch": 895} {"train_loss": -5.613602638244629, "global_step": 37605, "epoch": 895} {"train_loss": -5.622835636138916, "global_step": 37606, "epoch": 895} {"train_loss": -5.511238098144531, "global_step": 37607, "epoch": 895} {"train_loss": -5.655256271362305, "global_step": 37608, "epoch": 895} {"train_loss": -5.674734115600586, "global_step": 37609, "epoch": 895} {"train_loss": -5.549379348754883, "global_step": 37610, "epoch": 895} {"train_loss": -5.5764970779418945, "global_step": 37611, "epoch": 895} {"train_loss": -5.478747367858887, "global_step": 37612, "epoch": 895} {"train_loss": -5.684142112731934, "global_step": 37613, "epoch": 895} {"train_loss": -5.582205772399902, "global_step": 37614, "epoch": 895} {"train_loss": -5.59820032119751, "global_step": 37615, "epoch": 895} {"train_loss": -5.727823257446289, "global_step": 37616, "epoch": 895} {"train_loss": -5.467494010925293, "global_step": 37617, "epoch": 895} {"train_loss": -5.5611724853515625, "global_step": 37618, "epoch": 895} {"train_loss": -5.664350509643555, "global_step": 37619, "epoch": 895} {"train_loss": -5.553092956542969, "global_step": 37620, "epoch": 895} {"train_loss": -5.537032127380371, "global_step": 37621, "epoch": 895} {"train_loss": -5.530813694000244, "global_step": 37622, "epoch": 895} {"train_loss": -5.53688383102417, "global_step": 37623, "epoch": 895} {"train_loss": -5.746668815612793, "global_step": 37624, "epoch": 895} {"train_loss": -5.606216907501221, "global_step": 37625, "epoch": 895} {"train_loss": -5.470179557800293, "global_step": 37626, "epoch": 895} {"train_loss": -5.551708221435547, "global_step": 37627, "epoch": 895} {"train_loss": -5.697329521179199, "global_step": 37628, "epoch": 895} {"train_loss": -5.65576171875, "global_step": 37629, "epoch": 895} {"train_loss": -5.811368942260742, "global_step": 37630, "epoch": 895} {"train_loss": -5.594312179656256, "global_step": 37631, "epoch": 895, "val_loss": 73673.2734375} {"train_loss": -5.745062828063965, "global_step": 37632, "epoch": 896} {"train_loss": -5.613985538482666, "global_step": 37633, "epoch": 896} {"train_loss": -5.567984580993652, "global_step": 37634, "epoch": 896} {"train_loss": -5.695266246795654, "global_step": 37635, "epoch": 896} {"train_loss": -5.46734619140625, "global_step": 37636, "epoch": 896} {"train_loss": -5.534312725067139, "global_step": 37637, "epoch": 896} {"train_loss": -5.525516510009766, "global_step": 37638, "epoch": 896} {"train_loss": -5.656889915466309, "global_step": 37639, "epoch": 896} {"train_loss": -5.5755720138549805, "global_step": 37640, "epoch": 896} {"train_loss": -5.517570495605469, "global_step": 37641, "epoch": 896} {"train_loss": -5.39762020111084, "global_step": 37642, "epoch": 896} {"train_loss": -5.5799055099487305, "global_step": 37643, "epoch": 896} {"train_loss": -5.615382194519043, "global_step": 37644, "epoch": 896} {"train_loss": -5.3744025230407715, "global_step": 37645, "epoch": 896} {"train_loss": -5.708521366119385, "global_step": 37646, "epoch": 896} {"train_loss": -5.604581832885742, "global_step": 37647, "epoch": 896} {"train_loss": -5.57541561126709, "global_step": 37648, "epoch": 896} {"train_loss": -5.565542221069336, "global_step": 37649, "epoch": 896} {"train_loss": -5.617099761962891, "global_step": 37650, "epoch": 896} {"train_loss": -5.416363716125488, "global_step": 37651, "epoch": 896} {"train_loss": -5.634446620941162, "global_step": 37652, "epoch": 896} {"train_loss": -5.496101379394531, "global_step": 37653, "epoch": 896} {"train_loss": -5.572264194488525, "global_step": 37654, "epoch": 896} {"train_loss": -5.607271671295166, "global_step": 37655, "epoch": 896} {"train_loss": -5.641532897949219, "global_step": 37656, "epoch": 896} {"train_loss": -5.6467204093933105, "global_step": 37657, "epoch": 896} {"train_loss": -5.537240982055664, "global_step": 37658, "epoch": 896} {"train_loss": -5.573453903198242, "global_step": 37659, "epoch": 896} {"train_loss": -5.555876731872559, "global_step": 37660, "epoch": 896} {"train_loss": -5.630239486694336, "global_step": 37661, "epoch": 896} {"train_loss": -5.613622665405273, "global_step": 37662, "epoch": 896} {"train_loss": -5.6385369300842285, "global_step": 37663, "epoch": 896} {"train_loss": -5.649917125701904, "global_step": 37664, "epoch": 896} {"train_loss": -5.431949615478516, "global_step": 37665, "epoch": 896} {"train_loss": -5.53270149230957, "global_step": 37666, "epoch": 896} {"train_loss": -5.515081405639648, "global_step": 37667, "epoch": 896} {"train_loss": -5.697371482849121, "global_step": 37668, "epoch": 896} {"train_loss": -5.499159812927246, "global_step": 37669, "epoch": 896} {"train_loss": -5.726042747497559, "global_step": 37670, "epoch": 896} {"train_loss": -5.6698408126831055, "global_step": 37671, "epoch": 896} {"train_loss": -5.56429386138916, "global_step": 37672, "epoch": 896} {"train_loss": -5.582111131577265, "global_step": 37673, "epoch": 896, "val_loss": 73415.671875} {"train_loss": -5.478435516357422, "global_step": 37674, "epoch": 897} {"train_loss": -5.625577926635742, "global_step": 37675, "epoch": 897} {"train_loss": -5.590023040771484, "global_step": 37676, "epoch": 897} {"train_loss": -5.5978240966796875, "global_step": 37677, "epoch": 897} {"train_loss": -5.60262393951416, "global_step": 37678, "epoch": 897} {"train_loss": -5.607862949371338, "global_step": 37679, "epoch": 897} {"train_loss": -5.674480438232422, "global_step": 37680, "epoch": 897} {"train_loss": -5.60888147354126, "global_step": 37681, "epoch": 897} {"train_loss": -5.628392219543457, "global_step": 37682, "epoch": 897} {"train_loss": -5.532214164733887, "global_step": 37683, "epoch": 897} {"train_loss": -5.527891159057617, "global_step": 37684, "epoch": 897} {"train_loss": -5.549205780029297, "global_step": 37685, "epoch": 897} {"train_loss": -5.494915962219238, "global_step": 37686, "epoch": 897} {"train_loss": -5.6155781745910645, "global_step": 37687, "epoch": 897} {"train_loss": -5.664205074310303, "global_step": 37688, "epoch": 897} {"train_loss": -5.613225936889648, "global_step": 37689, "epoch": 897} {"train_loss": -5.547329902648926, "global_step": 37690, "epoch": 897} {"train_loss": -5.556612968444824, "global_step": 37691, "epoch": 897} {"train_loss": -5.6779022216796875, "global_step": 37692, "epoch": 897} {"train_loss": -5.653007984161377, "global_step": 37693, "epoch": 897} {"train_loss": -5.556009292602539, "global_step": 37694, "epoch": 897} {"train_loss": -5.622244834899902, "global_step": 37695, "epoch": 897} {"train_loss": -5.638686180114746, "global_step": 37696, "epoch": 897} {"train_loss": -5.667042255401611, "global_step": 37697, "epoch": 897} {"train_loss": -5.494135856628418, "global_step": 37698, "epoch": 897} {"train_loss": -5.652311325073242, "global_step": 37699, "epoch": 897} {"train_loss": -5.6615777015686035, "global_step": 37700, "epoch": 897} {"train_loss": -5.59388542175293, "global_step": 37701, "epoch": 897} {"train_loss": -5.629396438598633, "global_step": 37702, "epoch": 897} {"train_loss": -5.614415645599365, "global_step": 37703, "epoch": 897} {"train_loss": -5.67410945892334, "global_step": 37704, "epoch": 897} {"train_loss": -5.771416187286377, "global_step": 37705, "epoch": 897} {"train_loss": -5.583518028259277, "global_step": 37706, "epoch": 897} {"train_loss": -5.585597038269043, "global_step": 37707, "epoch": 897} {"train_loss": -5.631589412689209, "global_step": 37708, "epoch": 897} {"train_loss": -5.548369884490967, "global_step": 37709, "epoch": 897} {"train_loss": -5.539172649383545, "global_step": 37710, "epoch": 897} {"train_loss": -5.575014114379883, "global_step": 37711, "epoch": 897} {"train_loss": -5.5793585777282715, "global_step": 37712, "epoch": 897} {"train_loss": -5.632643699645996, "global_step": 37713, "epoch": 897} {"train_loss": -5.690351486206055, "global_step": 37714, "epoch": 897} {"train_loss": -5.605752456755865, "global_step": 37715, "epoch": 897, "val_loss": 73790.8046875} {"train_loss": -5.607113838195801, "global_step": 37716, "epoch": 898} {"train_loss": -5.526768207550049, "global_step": 37717, "epoch": 898} {"train_loss": -5.589829444885254, "global_step": 37718, "epoch": 898} {"train_loss": -5.622188568115234, "global_step": 37719, "epoch": 898} {"train_loss": -5.503910064697266, "global_step": 37720, "epoch": 898} {"train_loss": -5.645735740661621, "global_step": 37721, "epoch": 898} {"train_loss": -5.654080867767334, "global_step": 37722, "epoch": 898} {"train_loss": -5.523929595947266, "global_step": 37723, "epoch": 898} {"train_loss": -5.621504306793213, "global_step": 37724, "epoch": 898} {"train_loss": -5.678977012634277, "global_step": 37725, "epoch": 898} {"train_loss": -5.598026275634766, "global_step": 37726, "epoch": 898} {"train_loss": -5.542349815368652, "global_step": 37727, "epoch": 898} {"train_loss": -5.642579078674316, "global_step": 37728, "epoch": 898} {"train_loss": -5.564628601074219, "global_step": 37729, "epoch": 898} {"train_loss": -5.41471529006958, "global_step": 37730, "epoch": 898} {"train_loss": -5.651408672332764, "global_step": 37731, "epoch": 898} {"train_loss": -5.639475345611572, "global_step": 37732, "epoch": 898} {"train_loss": -5.558753967285156, "global_step": 37733, "epoch": 898} {"train_loss": -5.60667610168457, "global_step": 37734, "epoch": 898} {"train_loss": -5.601667881011963, "global_step": 37735, "epoch": 898} {"train_loss": -5.610006332397461, "global_step": 37736, "epoch": 898} {"train_loss": -5.616732597351074, "global_step": 37737, "epoch": 898} {"train_loss": -5.639115333557129, "global_step": 37738, "epoch": 898} {"train_loss": -5.6058349609375, "global_step": 37739, "epoch": 898} {"train_loss": -5.671132564544678, "global_step": 37740, "epoch": 898} {"train_loss": -5.688446998596191, "global_step": 37741, "epoch": 898} {"train_loss": -5.524298667907715, "global_step": 37742, "epoch": 898} {"train_loss": -5.559564590454102, "global_step": 37743, "epoch": 898} {"train_loss": -5.5395917892456055, "global_step": 37744, "epoch": 898} {"train_loss": -5.618917942047119, "global_step": 37745, "epoch": 898} {"train_loss": -5.570557594299316, "global_step": 37746, "epoch": 898} {"train_loss": -5.420281410217285, "global_step": 37747, "epoch": 898} {"train_loss": -5.563374042510986, "global_step": 37748, "epoch": 898} {"train_loss": -5.608927249908447, "global_step": 37749, "epoch": 898} {"train_loss": -5.485935211181641, "global_step": 37750, "epoch": 898} {"train_loss": -5.625981330871582, "global_step": 37751, "epoch": 898} {"train_loss": -5.540812969207764, "global_step": 37752, "epoch": 898} {"train_loss": -5.539247512817383, "global_step": 37753, "epoch": 898} {"train_loss": -5.518278121948242, "global_step": 37754, "epoch": 898} {"train_loss": -5.52943754196167, "global_step": 37755, "epoch": 898} {"train_loss": -5.550814628601074, "global_step": 37756, "epoch": 898} {"train_loss": -5.581156060809181, "global_step": 37757, "epoch": 898, "val_loss": 73611.1484375} {"train_loss": -5.704525947570801, "global_step": 37758, "epoch": 899} {"train_loss": -5.599100112915039, "global_step": 37759, "epoch": 899} {"train_loss": -5.530961513519287, "global_step": 37760, "epoch": 899} {"train_loss": -5.65786075592041, "global_step": 37761, "epoch": 899} {"train_loss": -5.628042221069336, "global_step": 37762, "epoch": 899} {"train_loss": -5.611104965209961, "global_step": 37763, "epoch": 899} {"train_loss": -5.66165828704834, "global_step": 37764, "epoch": 899} {"train_loss": -5.497514247894287, "global_step": 37765, "epoch": 899} {"train_loss": -5.559524059295654, "global_step": 37766, "epoch": 899} {"train_loss": -5.692157745361328, "global_step": 37767, "epoch": 899} {"train_loss": -5.552026748657227, "global_step": 37768, "epoch": 899} {"train_loss": -5.646934509277344, "global_step": 37769, "epoch": 899} {"train_loss": -5.555653095245361, "global_step": 37770, "epoch": 899} {"train_loss": -5.722413063049316, "global_step": 37771, "epoch": 899} {"train_loss": -5.611494064331055, "global_step": 37772, "epoch": 899} {"train_loss": -5.5381879806518555, "global_step": 37773, "epoch": 899} {"train_loss": -5.5323100090026855, "global_step": 37774, "epoch": 899} {"train_loss": -5.690732002258301, "global_step": 37775, "epoch": 899} {"train_loss": -5.693251609802246, "global_step": 37776, "epoch": 899} {"train_loss": -5.67848539352417, "global_step": 37777, "epoch": 899} {"train_loss": -5.757740020751953, "global_step": 37778, "epoch": 899} {"train_loss": -5.569169998168945, "global_step": 37779, "epoch": 899} {"train_loss": -5.635536193847656, "global_step": 37780, "epoch": 899} {"train_loss": -5.588146209716797, "global_step": 37781, "epoch": 899} {"train_loss": -5.574260234832764, "global_step": 37782, "epoch": 899} {"train_loss": -5.515463352203369, "global_step": 37783, "epoch": 899} {"train_loss": -5.593921184539795, "global_step": 37784, "epoch": 899} {"train_loss": -5.340527057647705, "global_step": 37785, "epoch": 899} {"train_loss": -5.6870222091674805, "global_step": 37786, "epoch": 899} {"train_loss": -5.489544868469238, "global_step": 37787, "epoch": 899} {"train_loss": -5.648436546325684, "global_step": 37788, "epoch": 899} {"train_loss": -5.557096004486084, "global_step": 37789, "epoch": 899} {"train_loss": -5.457665920257568, "global_step": 37790, "epoch": 899} {"train_loss": -5.503340721130371, "global_step": 37791, "epoch": 899} {"train_loss": -5.506618022918701, "global_step": 37792, "epoch": 899} {"train_loss": -5.601950168609619, "global_step": 37793, "epoch": 899} {"train_loss": -5.664939880371094, "global_step": 37794, "epoch": 899} {"train_loss": -5.595165252685547, "global_step": 37795, "epoch": 899} {"train_loss": -5.642368793487549, "global_step": 37796, "epoch": 899} {"train_loss": -5.648777961730957, "global_step": 37797, "epoch": 899} {"train_loss": -5.511422634124756, "global_step": 37798, "epoch": 899} {"train_loss": -5.600351628803072, "global_step": 37799, "epoch": 899, "val_loss": 73897.5078125} {"train_loss": -5.568604469299316, "global_step": 37800, "epoch": 900} {"train_loss": -5.640833854675293, "global_step": 37801, "epoch": 900} {"train_loss": -5.6516828536987305, "global_step": 37802, "epoch": 900} {"train_loss": -5.62176513671875, "global_step": 37803, "epoch": 900} {"train_loss": -5.618351936340332, "global_step": 37804, "epoch": 900} {"train_loss": -5.618320941925049, "global_step": 37805, "epoch": 900} {"train_loss": -5.473409652709961, "global_step": 37806, "epoch": 900} {"train_loss": -5.603034496307373, "global_step": 37807, "epoch": 900} {"train_loss": -5.631245136260986, "global_step": 37808, "epoch": 900} {"train_loss": -5.683744430541992, "global_step": 37809, "epoch": 900} {"train_loss": -5.561246871948242, "global_step": 37810, "epoch": 900} {"train_loss": -5.6814446449279785, "global_step": 37811, "epoch": 900} {"train_loss": -5.700896739959717, "global_step": 37812, "epoch": 900} {"train_loss": -5.619732856750488, "global_step": 37813, "epoch": 900} {"train_loss": -5.594593048095703, "global_step": 37814, "epoch": 900} {"train_loss": -5.622971534729004, "global_step": 37815, "epoch": 900} {"train_loss": -5.722253799438477, "global_step": 37816, "epoch": 900} {"train_loss": -5.555259704589844, "global_step": 37817, "epoch": 900} {"train_loss": -5.409463882446289, "global_step": 37818, "epoch": 900} {"train_loss": -5.592886924743652, "global_step": 37819, "epoch": 900} {"train_loss": -5.558357238769531, "global_step": 37820, "epoch": 900} {"train_loss": -5.585325241088867, "global_step": 37821, "epoch": 900} {"train_loss": -5.567687511444092, "global_step": 37822, "epoch": 900} {"train_loss": -5.392144203186035, "global_step": 37823, "epoch": 900} {"train_loss": -5.6522216796875, "global_step": 37824, "epoch": 900} {"train_loss": -5.627906799316406, "global_step": 37825, "epoch": 900} {"train_loss": -5.589990139007568, "global_step": 37826, "epoch": 900} {"train_loss": -5.564519882202148, "global_step": 37827, "epoch": 900} {"train_loss": -5.568358421325684, "global_step": 37828, "epoch": 900} {"train_loss": -5.616965293884277, "global_step": 37829, "epoch": 900} {"train_loss": -5.540836334228516, "global_step": 37830, "epoch": 900} {"train_loss": -5.61750602722168, "global_step": 37831, "epoch": 900} {"train_loss": -5.676257133483887, "global_step": 37832, "epoch": 900} {"train_loss": -5.544724464416504, "global_step": 37833, "epoch": 900} {"train_loss": -5.540218830108643, "global_step": 37834, "epoch": 900} {"train_loss": -5.688484191894531, "global_step": 37835, "epoch": 900} {"train_loss": -5.386847972869873, "global_step": 37836, "epoch": 900} {"train_loss": -5.512359142303467, "global_step": 37837, "epoch": 900} {"train_loss": -5.5184831619262695, "global_step": 37838, "epoch": 900} {"train_loss": -5.614969253540039, "global_step": 37839, "epoch": 900} {"train_loss": -5.591429233551025, "global_step": 37840, "epoch": 900} {"train_loss": -5.586886667069935, "global_step": 37841, "epoch": 900, "train/sim_max_reward_0": 0.4594857058200651, "train/sim_max_reward_1": 0.22835416034800476, "train/sim_max_reward_2": 0.5218646257446343, "train/sim_max_reward_3": 0.16477693996845774, "train/sim_max_reward_4": 0.3654880392677678, "train/sim_max_reward_5": 0.29435575246533474, "test/sim_max_reward_4500000": 0.3620336333032774, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.41179811031951646, "test/sim_max_reward_4500003": 0.555955857603219, "test/sim_max_reward_4500004": 0.1281057620199091, "test/sim_max_reward_4500005": 0.24236719208601035, "test/sim_max_reward_4500006": 0.4209259206263483, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.45576901514455576, "test/sim_max_reward_4500010": 0.41871486251702217, "test/sim_max_reward_4500011": 0.3863961898886225, "test/sim_max_reward_4500012": 0.3256519574395099, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.36893157829393775, "test/sim_max_reward_4500015": 0.033980620462254627, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.00023629381843596618, "test/sim_max_reward_4500018": 0.35844798970918423, "test/sim_max_reward_4500019": 0.7481085428923135, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.7382163726745021, "test/sim_max_reward_4500022": 0.35217504643252145, "test/sim_max_reward_4500023": 0.855013084034137, "test/sim_max_reward_4500024": 0.15717544171661046, "test/sim_max_reward_4500025": 0.3484781317524406, "test/sim_max_reward_4500026": 0.2554695966297123, "test/sim_max_reward_4500027": 0.6198122312808859, "test/sim_max_reward_4500028": 0.5030692190246355, "test/sim_max_reward_4500029": 0.24947316395140412, "test/sim_max_reward_4500030": 0.45305295568234305, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.7279616233718221, "test/sim_max_reward_4500033": 0.06449980291198594, "test/sim_max_reward_4500034": 0.7152587540327138, "test/sim_max_reward_4500035": 0.4812774103864851, "test/sim_max_reward_4500036": 0.37641820269157755, "test/sim_max_reward_4500037": 0.6093638435677604, "test/sim_max_reward_4500038": 0.8462415327992083, "test/sim_max_reward_4500039": 0.46079341914764127, "test/sim_max_reward_4500040": 0.7141688899221055, "test/sim_max_reward_4500041": 0.2634683485746549, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.3368571390502889, "test/sim_max_reward_4500044": 0.21902982050267378, "test/sim_max_reward_4500045": 0.12093410127977063, "test/sim_max_reward_4500046": 0.5867336694344727, "test/sim_max_reward_4500047": 0.005041475295940158, "test/sim_max_reward_4500048": 0.44202967655797154, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.33905420393571073, "test/mean_score": 0.3351884057081012, "val_loss": 74038.6015625} {"train_loss": -5.460580825805664, "global_step": 37842, "epoch": 901} {"train_loss": -5.600366592407227, "global_step": 37843, "epoch": 901} {"train_loss": -5.512199401855469, "global_step": 37844, "epoch": 901} {"train_loss": -5.554651260375977, "global_step": 37845, "epoch": 901} {"train_loss": -5.628843307495117, "global_step": 37846, "epoch": 901} {"train_loss": -5.563043117523193, "global_step": 37847, "epoch": 901} {"train_loss": -5.5578227043151855, "global_step": 37848, "epoch": 901} {"train_loss": -5.573357105255127, "global_step": 37849, "epoch": 901} {"train_loss": -5.6036577224731445, "global_step": 37850, "epoch": 901} {"train_loss": -5.545990467071533, "global_step": 37851, "epoch": 901} {"train_loss": -5.591057300567627, "global_step": 37852, "epoch": 901} {"train_loss": -5.541650295257568, "global_step": 37853, "epoch": 901} {"train_loss": -5.7014055252075195, "global_step": 37854, "epoch": 901} {"train_loss": -5.675354480743408, "global_step": 37855, "epoch": 901} {"train_loss": -5.666201591491699, "global_step": 37856, "epoch": 901} {"train_loss": -5.644394397735596, "global_step": 37857, "epoch": 901} {"train_loss": -5.572597503662109, "global_step": 37858, "epoch": 901} {"train_loss": -5.600619316101074, "global_step": 37859, "epoch": 901} {"train_loss": -5.568609237670898, "global_step": 37860, "epoch": 901} {"train_loss": -5.6000261306762695, "global_step": 37861, "epoch": 901} {"train_loss": -5.583544731140137, "global_step": 37862, "epoch": 901} {"train_loss": -5.72067928314209, "global_step": 37863, "epoch": 901} {"train_loss": -5.518377304077148, "global_step": 37864, "epoch": 901} {"train_loss": -5.5714430809021, "global_step": 37865, "epoch": 901} {"train_loss": -5.529727458953857, "global_step": 37866, "epoch": 901} {"train_loss": -5.5689473152160645, "global_step": 37867, "epoch": 901} {"train_loss": -5.701784133911133, "global_step": 37868, "epoch": 901} {"train_loss": -5.454437255859375, "global_step": 37869, "epoch": 901} {"train_loss": -5.5560173988342285, "global_step": 37870, "epoch": 901} {"train_loss": -5.558459281921387, "global_step": 37871, "epoch": 901} {"train_loss": -5.631096363067627, "global_step": 37872, "epoch": 901} {"train_loss": -5.509383678436279, "global_step": 37873, "epoch": 901} {"train_loss": -5.490150451660156, "global_step": 37874, "epoch": 901} {"train_loss": -5.717430114746094, "global_step": 37875, "epoch": 901} {"train_loss": -5.548534393310547, "global_step": 37876, "epoch": 901} {"train_loss": -5.619712829589844, "global_step": 37877, "epoch": 901} {"train_loss": -5.590236186981201, "global_step": 37878, "epoch": 901} {"train_loss": -5.547774314880371, "global_step": 37879, "epoch": 901} {"train_loss": -5.449647903442383, "global_step": 37880, "epoch": 901} {"train_loss": -5.587647914886475, "global_step": 37881, "epoch": 901} {"train_loss": -5.389530658721924, "global_step": 37882, "epoch": 901} {"train_loss": -5.576197601500011, "global_step": 37883, "epoch": 901, "val_loss": 74676.3359375} {"train_loss": -5.516613006591797, "global_step": 37884, "epoch": 902} {"train_loss": -5.702140808105469, "global_step": 37885, "epoch": 902} {"train_loss": -5.531193733215332, "global_step": 37886, "epoch": 902} {"train_loss": -5.5824432373046875, "global_step": 37887, "epoch": 902} {"train_loss": -5.716997146606445, "global_step": 37888, "epoch": 902} {"train_loss": -5.358708381652832, "global_step": 37889, "epoch": 902} {"train_loss": -5.578412055969238, "global_step": 37890, "epoch": 902} {"train_loss": -5.47151517868042, "global_step": 37891, "epoch": 902} {"train_loss": -5.769113063812256, "global_step": 37892, "epoch": 902} {"train_loss": -5.425325393676758, "global_step": 37893, "epoch": 902} {"train_loss": -5.628622055053711, "global_step": 37894, "epoch": 902} {"train_loss": -5.549538612365723, "global_step": 37895, "epoch": 902} {"train_loss": -5.488994598388672, "global_step": 37896, "epoch": 902} {"train_loss": -5.6173601150512695, "global_step": 37897, "epoch": 902} {"train_loss": -5.563417434692383, "global_step": 37898, "epoch": 902} {"train_loss": -5.656523704528809, "global_step": 37899, "epoch": 902} {"train_loss": -5.509605407714844, "global_step": 37900, "epoch": 902} {"train_loss": -5.533581256866455, "global_step": 37901, "epoch": 902} {"train_loss": -5.641566276550293, "global_step": 37902, "epoch": 902} {"train_loss": -5.5728607177734375, "global_step": 37903, "epoch": 902} {"train_loss": -5.543060302734375, "global_step": 37904, "epoch": 902} {"train_loss": -5.550500869750977, "global_step": 37905, "epoch": 902} {"train_loss": -5.5118513107299805, "global_step": 37906, "epoch": 902} {"train_loss": -5.612752914428711, "global_step": 37907, "epoch": 902} {"train_loss": -5.539206027984619, "global_step": 37908, "epoch": 902} {"train_loss": -5.630477428436279, "global_step": 37909, "epoch": 902} {"train_loss": -5.54536247253418, "global_step": 37910, "epoch": 902} {"train_loss": -5.526418685913086, "global_step": 37911, "epoch": 902} {"train_loss": -5.5849785804748535, "global_step": 37912, "epoch": 902} {"train_loss": -5.7918314933776855, "global_step": 37913, "epoch": 902} {"train_loss": -5.60539436340332, "global_step": 37914, "epoch": 902} {"train_loss": -5.626646041870117, "global_step": 37915, "epoch": 902} {"train_loss": -5.6031036376953125, "global_step": 37916, "epoch": 902} {"train_loss": -5.455745220184326, "global_step": 37917, "epoch": 902} {"train_loss": -5.642678260803223, "global_step": 37918, "epoch": 902} {"train_loss": -5.611919403076172, "global_step": 37919, "epoch": 902} {"train_loss": -5.567017078399658, "global_step": 37920, "epoch": 902} {"train_loss": -5.595832824707031, "global_step": 37921, "epoch": 902} {"train_loss": -5.657257080078125, "global_step": 37922, "epoch": 902} {"train_loss": -5.696356773376465, "global_step": 37923, "epoch": 902} {"train_loss": -5.635765552520752, "global_step": 37924, "epoch": 902} {"train_loss": -5.585700784410749, "global_step": 37925, "epoch": 902, "val_loss": 73611.5625} {"train_loss": -5.70484733581543, "global_step": 37926, "epoch": 903} {"train_loss": -5.625284671783447, "global_step": 37927, "epoch": 903} {"train_loss": -5.524320602416992, "global_step": 37928, "epoch": 903} {"train_loss": -5.702418327331543, "global_step": 37929, "epoch": 903} {"train_loss": -5.648448944091797, "global_step": 37930, "epoch": 903} {"train_loss": -5.783217430114746, "global_step": 37931, "epoch": 903} {"train_loss": -5.693156719207764, "global_step": 37932, "epoch": 903} {"train_loss": -5.683109283447266, "global_step": 37933, "epoch": 903} {"train_loss": -5.529845237731934, "global_step": 37934, "epoch": 903} {"train_loss": -5.663295269012451, "global_step": 37935, "epoch": 903} {"train_loss": -5.6071062088012695, "global_step": 37936, "epoch": 903} {"train_loss": -5.563810348510742, "global_step": 37937, "epoch": 903} {"train_loss": -5.505681991577148, "global_step": 37938, "epoch": 903} {"train_loss": -5.532050609588623, "global_step": 37939, "epoch": 903} {"train_loss": -5.66931676864624, "global_step": 37940, "epoch": 903} {"train_loss": -5.622648239135742, "global_step": 37941, "epoch": 903} {"train_loss": -5.644500255584717, "global_step": 37942, "epoch": 903} {"train_loss": -5.614924430847168, "global_step": 37943, "epoch": 903} {"train_loss": -5.683521270751953, "global_step": 37944, "epoch": 903} {"train_loss": -5.587632179260254, "global_step": 37945, "epoch": 903} {"train_loss": -5.569351673126221, "global_step": 37946, "epoch": 903} {"train_loss": -5.569379806518555, "global_step": 37947, "epoch": 903} {"train_loss": -5.615117073059082, "global_step": 37948, "epoch": 903} {"train_loss": -5.520166873931885, "global_step": 37949, "epoch": 903} {"train_loss": -5.585605144500732, "global_step": 37950, "epoch": 903} {"train_loss": -5.656553268432617, "global_step": 37951, "epoch": 903} {"train_loss": -5.573700904846191, "global_step": 37952, "epoch": 903} {"train_loss": -5.488873481750488, "global_step": 37953, "epoch": 903} {"train_loss": -5.645460605621338, "global_step": 37954, "epoch": 903} {"train_loss": -5.658782958984375, "global_step": 37955, "epoch": 903} {"train_loss": -5.376130104064941, "global_step": 37956, "epoch": 903} {"train_loss": -5.5373029708862305, "global_step": 37957, "epoch": 903} {"train_loss": -5.390023231506348, "global_step": 37958, "epoch": 903} {"train_loss": -5.5978851318359375, "global_step": 37959, "epoch": 903} {"train_loss": -5.354496955871582, "global_step": 37960, "epoch": 903} {"train_loss": -5.5045576095581055, "global_step": 37961, "epoch": 903} {"train_loss": -5.589008808135986, "global_step": 37962, "epoch": 903} {"train_loss": -5.618222713470459, "global_step": 37963, "epoch": 903} {"train_loss": -5.509908676147461, "global_step": 37964, "epoch": 903} {"train_loss": -5.582970142364502, "global_step": 37965, "epoch": 903} {"train_loss": -5.497872352600098, "global_step": 37966, "epoch": 903} {"train_loss": -5.5868571145193915, "global_step": 37967, "epoch": 903, "val_loss": 74415.609375} {"train_loss": -5.609079360961914, "global_step": 37968, "epoch": 904} {"train_loss": -5.625552177429199, "global_step": 37969, "epoch": 904} {"train_loss": -5.657657623291016, "global_step": 37970, "epoch": 904} {"train_loss": -5.630209445953369, "global_step": 37971, "epoch": 904} {"train_loss": -5.608248710632324, "global_step": 37972, "epoch": 904} {"train_loss": -5.521682262420654, "global_step": 37973, "epoch": 904} {"train_loss": -5.512322902679443, "global_step": 37974, "epoch": 904} {"train_loss": -5.635196208953857, "global_step": 37975, "epoch": 904} {"train_loss": -5.723618507385254, "global_step": 37976, "epoch": 904} {"train_loss": -5.647253513336182, "global_step": 37977, "epoch": 904} {"train_loss": -5.648958206176758, "global_step": 37978, "epoch": 904} {"train_loss": -5.66951322555542, "global_step": 37979, "epoch": 904} {"train_loss": -5.653288841247559, "global_step": 37980, "epoch": 904} {"train_loss": -5.544651508331299, "global_step": 37981, "epoch": 904} {"train_loss": -5.556796550750732, "global_step": 37982, "epoch": 904} {"train_loss": -5.684022903442383, "global_step": 37983, "epoch": 904} {"train_loss": -5.523815155029297, "global_step": 37984, "epoch": 904} {"train_loss": -5.713920593261719, "global_step": 37985, "epoch": 904} {"train_loss": -5.608611583709717, "global_step": 37986, "epoch": 904} {"train_loss": -5.550843715667725, "global_step": 37987, "epoch": 904} {"train_loss": -5.5356268882751465, "global_step": 37988, "epoch": 904} {"train_loss": -5.626983642578125, "global_step": 37989, "epoch": 904} {"train_loss": -5.614119052886963, "global_step": 37990, "epoch": 904} {"train_loss": -5.700179576873779, "global_step": 37991, "epoch": 904} {"train_loss": -5.589427947998047, "global_step": 37992, "epoch": 904} {"train_loss": -5.545510292053223, "global_step": 37993, "epoch": 904} {"train_loss": -5.680267333984375, "global_step": 37994, "epoch": 904} {"train_loss": -5.454320907592773, "global_step": 37995, "epoch": 904} {"train_loss": -5.692693710327148, "global_step": 37996, "epoch": 904} {"train_loss": -5.518628120422363, "global_step": 37997, "epoch": 904} {"train_loss": -5.501655101776123, "global_step": 37998, "epoch": 904} {"train_loss": -5.487764358520508, "global_step": 37999, "epoch": 904} {"train_loss": -5.497280597686768, "global_step": 38000, "epoch": 904} {"train_loss": -5.514528274536133, "global_step": 38001, "epoch": 904} {"train_loss": -5.51654577255249, "global_step": 38002, "epoch": 904} {"train_loss": -5.627804756164551, "global_step": 38003, "epoch": 904} {"train_loss": -5.304029941558838, "global_step": 38004, "epoch": 904} {"train_loss": -5.665247440338135, "global_step": 38005, "epoch": 904} {"train_loss": -5.334984302520752, "global_step": 38006, "epoch": 904} {"train_loss": -5.54858922958374, "global_step": 38007, "epoch": 904} {"train_loss": -5.426591396331787, "global_step": 38008, "epoch": 904} {"train_loss": -5.577026106062389, "global_step": 38009, "epoch": 904, "val_loss": 74892.3125} {"train_loss": -5.486733436584473, "global_step": 38010, "epoch": 905} {"train_loss": -5.6074018478393555, "global_step": 38011, "epoch": 905} {"train_loss": -5.572789192199707, "global_step": 38012, "epoch": 905} {"train_loss": -5.461809158325195, "global_step": 38013, "epoch": 905} {"train_loss": -5.522994041442871, "global_step": 38014, "epoch": 905} {"train_loss": -5.457660675048828, "global_step": 38015, "epoch": 905} {"train_loss": -5.594049453735352, "global_step": 38016, "epoch": 905} {"train_loss": -5.392474174499512, "global_step": 38017, "epoch": 905} {"train_loss": -5.709331512451172, "global_step": 38018, "epoch": 905} {"train_loss": -5.530754089355469, "global_step": 38019, "epoch": 905} {"train_loss": -5.6624250411987305, "global_step": 38020, "epoch": 905} {"train_loss": -5.620254039764404, "global_step": 38021, "epoch": 905} {"train_loss": -5.552201271057129, "global_step": 38022, "epoch": 905} {"train_loss": -5.533835411071777, "global_step": 38023, "epoch": 905} {"train_loss": -5.468845367431641, "global_step": 38024, "epoch": 905} {"train_loss": -5.601407527923584, "global_step": 38025, "epoch": 905} {"train_loss": -5.752130508422852, "global_step": 38026, "epoch": 905} {"train_loss": -5.610427379608154, "global_step": 38027, "epoch": 905} {"train_loss": -5.620940208435059, "global_step": 38028, "epoch": 905} {"train_loss": -5.6478471755981445, "global_step": 38029, "epoch": 905} {"train_loss": -5.596041202545166, "global_step": 38030, "epoch": 905} {"train_loss": -5.570900917053223, "global_step": 38031, "epoch": 905} {"train_loss": -5.435227870941162, "global_step": 38032, "epoch": 905} {"train_loss": -5.5914812088012695, "global_step": 38033, "epoch": 905} {"train_loss": -5.590899467468262, "global_step": 38034, "epoch": 905} {"train_loss": -5.596858978271484, "global_step": 38035, "epoch": 905} {"train_loss": -5.574618339538574, "global_step": 38036, "epoch": 905} {"train_loss": -5.7155609130859375, "global_step": 38037, "epoch": 905} {"train_loss": -5.591102600097656, "global_step": 38038, "epoch": 905} {"train_loss": -5.654298305511475, "global_step": 38039, "epoch": 905} {"train_loss": -5.644655704498291, "global_step": 38040, "epoch": 905} {"train_loss": -5.624137878417969, "global_step": 38041, "epoch": 905} {"train_loss": -5.571150779724121, "global_step": 38042, "epoch": 905} {"train_loss": -5.787174224853516, "global_step": 38043, "epoch": 905} {"train_loss": -5.6222615242004395, "global_step": 38044, "epoch": 905} {"train_loss": -5.638935089111328, "global_step": 38045, "epoch": 905} {"train_loss": -5.683263778686523, "global_step": 38046, "epoch": 905} {"train_loss": -5.487253189086914, "global_step": 38047, "epoch": 905} {"train_loss": -5.567963600158691, "global_step": 38048, "epoch": 905} {"train_loss": -5.670042991638184, "global_step": 38049, "epoch": 905} {"train_loss": -5.629199028015137, "global_step": 38050, "epoch": 905} {"train_loss": -5.592701821100144, "global_step": 38051, "epoch": 905, "val_loss": 74803.828125} {"train_loss": -5.660243988037109, "global_step": 38052, "epoch": 906} {"train_loss": -5.606900215148926, "global_step": 38053, "epoch": 906} {"train_loss": -5.5997748374938965, "global_step": 38054, "epoch": 906} {"train_loss": -5.535004615783691, "global_step": 38055, "epoch": 906} {"train_loss": -5.427465438842773, "global_step": 38056, "epoch": 906} {"train_loss": -5.569493293762207, "global_step": 38057, "epoch": 906} {"train_loss": -5.8473591804504395, "global_step": 38058, "epoch": 906} {"train_loss": -5.6148681640625, "global_step": 38059, "epoch": 906} {"train_loss": -5.572999954223633, "global_step": 38060, "epoch": 906} {"train_loss": -5.499429225921631, "global_step": 38061, "epoch": 906} {"train_loss": -5.566719055175781, "global_step": 38062, "epoch": 906} {"train_loss": -5.707849502563477, "global_step": 38063, "epoch": 906} {"train_loss": -5.595280170440674, "global_step": 38064, "epoch": 906} {"train_loss": -5.652127265930176, "global_step": 38065, "epoch": 906} {"train_loss": -5.710009574890137, "global_step": 38066, "epoch": 906} {"train_loss": -5.649986743927002, "global_step": 38067, "epoch": 906} {"train_loss": -5.509621620178223, "global_step": 38068, "epoch": 906} {"train_loss": -5.654144287109375, "global_step": 38069, "epoch": 906} {"train_loss": -5.505928039550781, "global_step": 38070, "epoch": 906} {"train_loss": -5.53876256942749, "global_step": 38071, "epoch": 906} {"train_loss": -5.59940242767334, "global_step": 38072, "epoch": 906} {"train_loss": -5.614974021911621, "global_step": 38073, "epoch": 906} {"train_loss": -5.622393608093262, "global_step": 38074, "epoch": 906} {"train_loss": -5.557460308074951, "global_step": 38075, "epoch": 906} {"train_loss": -5.605093002319336, "global_step": 38076, "epoch": 906} {"train_loss": -5.5451555252075195, "global_step": 38077, "epoch": 906} {"train_loss": -5.498980522155762, "global_step": 38078, "epoch": 906} {"train_loss": -5.66896915435791, "global_step": 38079, "epoch": 906} {"train_loss": -5.723923206329346, "global_step": 38080, "epoch": 906} {"train_loss": -5.688580513000488, "global_step": 38081, "epoch": 906} {"train_loss": -5.618962287902832, "global_step": 38082, "epoch": 906} {"train_loss": -5.698757171630859, "global_step": 38083, "epoch": 906} {"train_loss": -5.62375545501709, "global_step": 38084, "epoch": 906} {"train_loss": -5.5852508544921875, "global_step": 38085, "epoch": 906} {"train_loss": -5.682944297790527, "global_step": 38086, "epoch": 906} {"train_loss": -5.718076705932617, "global_step": 38087, "epoch": 906} {"train_loss": -5.664188385009766, "global_step": 38088, "epoch": 906} {"train_loss": -5.679671287536621, "global_step": 38089, "epoch": 906} {"train_loss": -5.663553237915039, "global_step": 38090, "epoch": 906} {"train_loss": -5.713196277618408, "global_step": 38091, "epoch": 906} {"train_loss": -5.577306747436523, "global_step": 38092, "epoch": 906} {"train_loss": -5.620344706944057, "global_step": 38093, "epoch": 906, "val_loss": 73699.2890625} {"train_loss": -5.7015533447265625, "global_step": 38094, "epoch": 907} {"train_loss": -5.647168159484863, "global_step": 38095, "epoch": 907} {"train_loss": -5.553319931030273, "global_step": 38096, "epoch": 907} {"train_loss": -5.814857482910156, "global_step": 38097, "epoch": 907} {"train_loss": -5.609012126922607, "global_step": 38098, "epoch": 907} {"train_loss": -5.587515830993652, "global_step": 38099, "epoch": 907} {"train_loss": -5.571630954742432, "global_step": 38100, "epoch": 907} {"train_loss": -5.662245750427246, "global_step": 38101, "epoch": 907} {"train_loss": -5.578184604644775, "global_step": 38102, "epoch": 907} {"train_loss": -5.589275360107422, "global_step": 38103, "epoch": 907} {"train_loss": -5.551312446594238, "global_step": 38104, "epoch": 907} {"train_loss": -5.655274391174316, "global_step": 38105, "epoch": 907} {"train_loss": -5.549346923828125, "global_step": 38106, "epoch": 907} {"train_loss": -5.602052688598633, "global_step": 38107, "epoch": 907} {"train_loss": -5.582849979400635, "global_step": 38108, "epoch": 907} {"train_loss": -5.558279037475586, "global_step": 38109, "epoch": 907} {"train_loss": -5.530867099761963, "global_step": 38110, "epoch": 907} {"train_loss": -5.544146537780762, "global_step": 38111, "epoch": 907} {"train_loss": -5.694456577301025, "global_step": 38112, "epoch": 907} {"train_loss": -5.5782928466796875, "global_step": 38113, "epoch": 907} {"train_loss": -5.641029357910156, "global_step": 38114, "epoch": 907} {"train_loss": -5.717905044555664, "global_step": 38115, "epoch": 907} {"train_loss": -5.628538608551025, "global_step": 38116, "epoch": 907} {"train_loss": -5.632164001464844, "global_step": 38117, "epoch": 907} {"train_loss": -5.589938163757324, "global_step": 38118, "epoch": 907} {"train_loss": -5.547691345214844, "global_step": 38119, "epoch": 907} {"train_loss": -5.68330192565918, "global_step": 38120, "epoch": 907} {"train_loss": -5.6111674308776855, "global_step": 38121, "epoch": 907} {"train_loss": -5.642991542816162, "global_step": 38122, "epoch": 907} {"train_loss": -5.33150053024292, "global_step": 38123, "epoch": 907} {"train_loss": -5.6908650398254395, "global_step": 38124, "epoch": 907} {"train_loss": -5.697576522827148, "global_step": 38125, "epoch": 907} {"train_loss": -5.416567802429199, "global_step": 38126, "epoch": 907} {"train_loss": -5.662696838378906, "global_step": 38127, "epoch": 907} {"train_loss": -5.424658298492432, "global_step": 38128, "epoch": 907} {"train_loss": -5.462762355804443, "global_step": 38129, "epoch": 907} {"train_loss": -5.575551986694336, "global_step": 38130, "epoch": 907} {"train_loss": -5.645596027374268, "global_step": 38131, "epoch": 907} {"train_loss": -5.557052135467529, "global_step": 38132, "epoch": 907} {"train_loss": -5.534883499145508, "global_step": 38133, "epoch": 907} {"train_loss": -5.575023651123047, "global_step": 38134, "epoch": 907} {"train_loss": -5.595702545983451, "global_step": 38135, "epoch": 907, "val_loss": 73347.5234375} {"train_loss": -5.487241744995117, "global_step": 38136, "epoch": 908} {"train_loss": -5.495610237121582, "global_step": 38137, "epoch": 908} {"train_loss": -5.4586896896362305, "global_step": 38138, "epoch": 908} {"train_loss": -5.475231647491455, "global_step": 38139, "epoch": 908} {"train_loss": -5.4993062019348145, "global_step": 38140, "epoch": 908} {"train_loss": -5.551661014556885, "global_step": 38141, "epoch": 908} {"train_loss": -5.548429012298584, "global_step": 38142, "epoch": 908} {"train_loss": -5.63737678527832, "global_step": 38143, "epoch": 908} {"train_loss": -5.511022567749023, "global_step": 38144, "epoch": 908} {"train_loss": -5.521457672119141, "global_step": 38145, "epoch": 908} {"train_loss": -5.620588302612305, "global_step": 38146, "epoch": 908} {"train_loss": -5.545039176940918, "global_step": 38147, "epoch": 908} {"train_loss": -5.520315647125244, "global_step": 38148, "epoch": 908} {"train_loss": -5.809308052062988, "global_step": 38149, "epoch": 908} {"train_loss": -5.593421936035156, "global_step": 38150, "epoch": 908} {"train_loss": -5.6071882247924805, "global_step": 38151, "epoch": 908} {"train_loss": -5.616805076599121, "global_step": 38152, "epoch": 908} {"train_loss": -5.475709438323975, "global_step": 38153, "epoch": 908} {"train_loss": -5.504462242126465, "global_step": 38154, "epoch": 908} {"train_loss": -5.5375847816467285, "global_step": 38155, "epoch": 908} {"train_loss": -5.644439220428467, "global_step": 38156, "epoch": 908} {"train_loss": -5.446608543395996, "global_step": 38157, "epoch": 908} {"train_loss": -5.620089054107666, "global_step": 38158, "epoch": 908} {"train_loss": -5.489965438842773, "global_step": 38159, "epoch": 908} {"train_loss": -5.452720642089844, "global_step": 38160, "epoch": 908} {"train_loss": -5.508719444274902, "global_step": 38161, "epoch": 908} {"train_loss": -5.579535484313965, "global_step": 38162, "epoch": 908} {"train_loss": -5.626415252685547, "global_step": 38163, "epoch": 908} {"train_loss": -5.572312831878662, "global_step": 38164, "epoch": 908} {"train_loss": -5.573545455932617, "global_step": 38165, "epoch": 908} {"train_loss": -5.493766784667969, "global_step": 38166, "epoch": 908} {"train_loss": -5.550604820251465, "global_step": 38167, "epoch": 908} {"train_loss": -5.625055313110352, "global_step": 38168, "epoch": 908} {"train_loss": -5.580260276794434, "global_step": 38169, "epoch": 908} {"train_loss": -5.611428260803223, "global_step": 38170, "epoch": 908} {"train_loss": -5.603652000427246, "global_step": 38171, "epoch": 908} {"train_loss": -5.473840713500977, "global_step": 38172, "epoch": 908} {"train_loss": -5.613045692443848, "global_step": 38173, "epoch": 908} {"train_loss": -5.644906997680664, "global_step": 38174, "epoch": 908} {"train_loss": -5.54857063293457, "global_step": 38175, "epoch": 908} {"train_loss": -5.512967586517334, "global_step": 38176, "epoch": 908} {"train_loss": -5.559568098613194, "global_step": 38177, "epoch": 908, "val_loss": 74162.203125} {"train_loss": -5.471119403839111, "global_step": 38178, "epoch": 909} {"train_loss": -5.75852632522583, "global_step": 38179, "epoch": 909} {"train_loss": -5.629467964172363, "global_step": 38180, "epoch": 909} {"train_loss": -5.610879421234131, "global_step": 38181, "epoch": 909} {"train_loss": -5.618366718292236, "global_step": 38182, "epoch": 909} {"train_loss": -5.521450996398926, "global_step": 38183, "epoch": 909} {"train_loss": -5.65665340423584, "global_step": 38184, "epoch": 909} {"train_loss": -5.654242038726807, "global_step": 38185, "epoch": 909} {"train_loss": -5.5499267578125, "global_step": 38186, "epoch": 909} {"train_loss": -5.620824813842773, "global_step": 38187, "epoch": 909} {"train_loss": -5.657044887542725, "global_step": 38188, "epoch": 909} {"train_loss": -5.683442115783691, "global_step": 38189, "epoch": 909} {"train_loss": -5.557951927185059, "global_step": 38190, "epoch": 909} {"train_loss": -5.730660438537598, "global_step": 38191, "epoch": 909} {"train_loss": -5.655416488647461, "global_step": 38192, "epoch": 909} {"train_loss": -5.60612154006958, "global_step": 38193, "epoch": 909} {"train_loss": -5.627976417541504, "global_step": 38194, "epoch": 909} {"train_loss": -5.698665142059326, "global_step": 38195, "epoch": 909} {"train_loss": -5.633432388305664, "global_step": 38196, "epoch": 909} {"train_loss": -5.617659568786621, "global_step": 38197, "epoch": 909} {"train_loss": -5.685253143310547, "global_step": 38198, "epoch": 909} {"train_loss": -5.626638412475586, "global_step": 38199, "epoch": 909} {"train_loss": -5.670217037200928, "global_step": 38200, "epoch": 909} {"train_loss": -5.653929710388184, "global_step": 38201, "epoch": 909} {"train_loss": -5.727972984313965, "global_step": 38202, "epoch": 909} {"train_loss": -5.550361633300781, "global_step": 38203, "epoch": 909} {"train_loss": -5.645880222320557, "global_step": 38204, "epoch": 909} {"train_loss": -5.588925361633301, "global_step": 38205, "epoch": 909} {"train_loss": -5.493847370147705, "global_step": 38206, "epoch": 909} {"train_loss": -5.423151016235352, "global_step": 38207, "epoch": 909} {"train_loss": -5.623071193695068, "global_step": 38208, "epoch": 909} {"train_loss": -5.655251502990723, "global_step": 38209, "epoch": 909} {"train_loss": -5.567948818206787, "global_step": 38210, "epoch": 909} {"train_loss": -5.6724138259887695, "global_step": 38211, "epoch": 909} {"train_loss": -5.610540390014648, "global_step": 38212, "epoch": 909} {"train_loss": -5.514982223510742, "global_step": 38213, "epoch": 909} {"train_loss": -5.58922004699707, "global_step": 38214, "epoch": 909} {"train_loss": -5.434323310852051, "global_step": 38215, "epoch": 909} {"train_loss": -5.670652389526367, "global_step": 38216, "epoch": 909} {"train_loss": -5.650940895080566, "global_step": 38217, "epoch": 909} {"train_loss": -5.576834678649902, "global_step": 38218, "epoch": 909} {"train_loss": -5.611933197293963, "global_step": 38219, "epoch": 909, "val_loss": 74016.015625} {"train_loss": -5.616246223449707, "global_step": 38220, "epoch": 910} {"train_loss": -5.494710445404053, "global_step": 38221, "epoch": 910} {"train_loss": -5.5410027503967285, "global_step": 38222, "epoch": 910} {"train_loss": -5.627154350280762, "global_step": 38223, "epoch": 910} {"train_loss": -5.557405471801758, "global_step": 38224, "epoch": 910} {"train_loss": -5.595859527587891, "global_step": 38225, "epoch": 910} {"train_loss": -5.635610580444336, "global_step": 38226, "epoch": 910} {"train_loss": -5.694845676422119, "global_step": 38227, "epoch": 910} {"train_loss": -5.658698081970215, "global_step": 38228, "epoch": 910} {"train_loss": -5.773542404174805, "global_step": 38229, "epoch": 910} {"train_loss": -5.58177375793457, "global_step": 38230, "epoch": 910} {"train_loss": -5.655496597290039, "global_step": 38231, "epoch": 910} {"train_loss": -5.71967887878418, "global_step": 38232, "epoch": 910} {"train_loss": -5.624701499938965, "global_step": 38233, "epoch": 910} {"train_loss": -5.51005744934082, "global_step": 38234, "epoch": 910} {"train_loss": -5.630832195281982, "global_step": 38235, "epoch": 910} {"train_loss": -5.553285121917725, "global_step": 38236, "epoch": 910} {"train_loss": -5.725619316101074, "global_step": 38237, "epoch": 910} {"train_loss": -5.610836029052734, "global_step": 38238, "epoch": 910} {"train_loss": -5.7628631591796875, "global_step": 38239, "epoch": 910} {"train_loss": -5.529653549194336, "global_step": 38240, "epoch": 910} {"train_loss": -5.477629661560059, "global_step": 38241, "epoch": 910} {"train_loss": -5.615553379058838, "global_step": 38242, "epoch": 910} {"train_loss": -5.57827091217041, "global_step": 38243, "epoch": 910} {"train_loss": -5.6071248054504395, "global_step": 38244, "epoch": 910} {"train_loss": -5.6788787841796875, "global_step": 38245, "epoch": 910} {"train_loss": -5.756986618041992, "global_step": 38246, "epoch": 910} {"train_loss": -5.621371746063232, "global_step": 38247, "epoch": 910} {"train_loss": -5.603992462158203, "global_step": 38248, "epoch": 910} {"train_loss": -5.654240608215332, "global_step": 38249, "epoch": 910} {"train_loss": -5.639418601989746, "global_step": 38250, "epoch": 910} {"train_loss": -5.641180038452148, "global_step": 38251, "epoch": 910} {"train_loss": -5.405982971191406, "global_step": 38252, "epoch": 910} {"train_loss": -5.543141841888428, "global_step": 38253, "epoch": 910} {"train_loss": -5.491103649139404, "global_step": 38254, "epoch": 910} {"train_loss": -5.691006660461426, "global_step": 38255, "epoch": 910} {"train_loss": -5.505607604980469, "global_step": 38256, "epoch": 910} {"train_loss": -5.624813556671143, "global_step": 38257, "epoch": 910} {"train_loss": -5.634335041046143, "global_step": 38258, "epoch": 910} {"train_loss": -5.6757049560546875, "global_step": 38259, "epoch": 910} {"train_loss": -5.600821495056152, "global_step": 38260, "epoch": 910} {"train_loss": -5.613600526537214, "global_step": 38261, "epoch": 910, "val_loss": 73050.515625} {"train_loss": -5.636995792388916, "global_step": 38262, "epoch": 911} {"train_loss": -5.604040622711182, "global_step": 38263, "epoch": 911} {"train_loss": -5.638344764709473, "global_step": 38264, "epoch": 911} {"train_loss": -5.592576026916504, "global_step": 38265, "epoch": 911} {"train_loss": -5.529347896575928, "global_step": 38266, "epoch": 911} {"train_loss": -5.616001129150391, "global_step": 38267, "epoch": 911} {"train_loss": -5.561825752258301, "global_step": 38268, "epoch": 911} {"train_loss": -5.615077495574951, "global_step": 38269, "epoch": 911} {"train_loss": -5.398548603057861, "global_step": 38270, "epoch": 911} {"train_loss": -5.534489154815674, "global_step": 38271, "epoch": 911} {"train_loss": -5.577409744262695, "global_step": 38272, "epoch": 911} {"train_loss": -5.506932735443115, "global_step": 38273, "epoch": 911} {"train_loss": -5.5563812255859375, "global_step": 38274, "epoch": 911} {"train_loss": -5.430131912231445, "global_step": 38275, "epoch": 911} {"train_loss": -5.596127510070801, "global_step": 38276, "epoch": 911} {"train_loss": -5.558155059814453, "global_step": 38277, "epoch": 911} {"train_loss": -5.471836090087891, "global_step": 38278, "epoch": 911} {"train_loss": -5.578768730163574, "global_step": 38279, "epoch": 911} {"train_loss": -5.731452465057373, "global_step": 38280, "epoch": 911} {"train_loss": -5.472546577453613, "global_step": 38281, "epoch": 911} {"train_loss": -5.63251256942749, "global_step": 38282, "epoch": 911} {"train_loss": -5.461338043212891, "global_step": 38283, "epoch": 911} {"train_loss": -5.621593952178955, "global_step": 38284, "epoch": 911} {"train_loss": -5.534677982330322, "global_step": 38285, "epoch": 911} {"train_loss": -5.62685489654541, "global_step": 38286, "epoch": 911} {"train_loss": -5.524749755859375, "global_step": 38287, "epoch": 911} {"train_loss": -5.469400882720947, "global_step": 38288, "epoch": 911} {"train_loss": -5.571496486663818, "global_step": 38289, "epoch": 911} {"train_loss": -5.602226734161377, "global_step": 38290, "epoch": 911} {"train_loss": -5.52378511428833, "global_step": 38291, "epoch": 911} {"train_loss": -5.672374725341797, "global_step": 38292, "epoch": 911} {"train_loss": -5.6658525466918945, "global_step": 38293, "epoch": 911} {"train_loss": -5.59230375289917, "global_step": 38294, "epoch": 911} {"train_loss": -5.681793212890625, "global_step": 38295, "epoch": 911} {"train_loss": -5.605343818664551, "global_step": 38296, "epoch": 911} {"train_loss": -5.493199348449707, "global_step": 38297, "epoch": 911} {"train_loss": -5.602148532867432, "global_step": 38298, "epoch": 911} {"train_loss": -5.541380882263184, "global_step": 38299, "epoch": 911} {"train_loss": -5.6230268478393555, "global_step": 38300, "epoch": 911} {"train_loss": -5.639095783233643, "global_step": 38301, "epoch": 911} {"train_loss": -5.54193639755249, "global_step": 38302, "epoch": 911} {"train_loss": -5.5710350558871315, "global_step": 38303, "epoch": 911, "val_loss": 74465.640625} {"train_loss": -5.648628234863281, "global_step": 38304, "epoch": 912} {"train_loss": -5.689676761627197, "global_step": 38305, "epoch": 912} {"train_loss": -5.648338794708252, "global_step": 38306, "epoch": 912} {"train_loss": -5.5051116943359375, "global_step": 38307, "epoch": 912} {"train_loss": -5.656189918518066, "global_step": 38308, "epoch": 912} {"train_loss": -5.640983581542969, "global_step": 38309, "epoch": 912} {"train_loss": -5.640002250671387, "global_step": 38310, "epoch": 912} {"train_loss": -5.61607027053833, "global_step": 38311, "epoch": 912} {"train_loss": -5.530060768127441, "global_step": 38312, "epoch": 912} {"train_loss": -5.53373384475708, "global_step": 38313, "epoch": 912} {"train_loss": -5.55985164642334, "global_step": 38314, "epoch": 912} {"train_loss": -5.656774044036865, "global_step": 38315, "epoch": 912} {"train_loss": -5.544314384460449, "global_step": 38316, "epoch": 912} {"train_loss": -5.565232753753662, "global_step": 38317, "epoch": 912} {"train_loss": -5.654987335205078, "global_step": 38318, "epoch": 912} {"train_loss": -5.623692035675049, "global_step": 38319, "epoch": 912} {"train_loss": -5.753161907196045, "global_step": 38320, "epoch": 912} {"train_loss": -5.556125640869141, "global_step": 38321, "epoch": 912} {"train_loss": -5.55855655670166, "global_step": 38322, "epoch": 912} {"train_loss": -5.524967670440674, "global_step": 38323, "epoch": 912} {"train_loss": -5.590998649597168, "global_step": 38324, "epoch": 912} {"train_loss": -5.58122444152832, "global_step": 38325, "epoch": 912} {"train_loss": -5.658949851989746, "global_step": 38326, "epoch": 912} {"train_loss": -5.636800289154053, "global_step": 38327, "epoch": 912} {"train_loss": -5.6110758781433105, "global_step": 38328, "epoch": 912} {"train_loss": -5.439868927001953, "global_step": 38329, "epoch": 912} {"train_loss": -5.61165714263916, "global_step": 38330, "epoch": 912} {"train_loss": -5.599833965301514, "global_step": 38331, "epoch": 912} {"train_loss": -5.595295429229736, "global_step": 38332, "epoch": 912} {"train_loss": -5.5650434494018555, "global_step": 38333, "epoch": 912} {"train_loss": -5.730624675750732, "global_step": 38334, "epoch": 912} {"train_loss": -5.607421875, "global_step": 38335, "epoch": 912} {"train_loss": -5.549213409423828, "global_step": 38336, "epoch": 912} {"train_loss": -5.699129104614258, "global_step": 38337, "epoch": 912} {"train_loss": -5.552583694458008, "global_step": 38338, "epoch": 912} {"train_loss": -5.532764911651611, "global_step": 38339, "epoch": 912} {"train_loss": -5.4462890625, "global_step": 38340, "epoch": 912} {"train_loss": -5.5482258796691895, "global_step": 38341, "epoch": 912} {"train_loss": -5.59909200668335, "global_step": 38342, "epoch": 912} {"train_loss": -5.533938407897949, "global_step": 38343, "epoch": 912} {"train_loss": -5.638271331787109, "global_step": 38344, "epoch": 912} {"train_loss": -5.59716610681443, "global_step": 38345, "epoch": 912, "val_loss": 74417.078125} {"train_loss": -5.583333969116211, "global_step": 38346, "epoch": 913} {"train_loss": -5.72063684463501, "global_step": 38347, "epoch": 913} {"train_loss": -5.546122074127197, "global_step": 38348, "epoch": 913} {"train_loss": -5.528731822967529, "global_step": 38349, "epoch": 913} {"train_loss": -5.624556064605713, "global_step": 38350, "epoch": 913} {"train_loss": -5.727205276489258, "global_step": 38351, "epoch": 913} {"train_loss": -5.615835189819336, "global_step": 38352, "epoch": 913} {"train_loss": -5.697561264038086, "global_step": 38353, "epoch": 913} {"train_loss": -5.580738067626953, "global_step": 38354, "epoch": 913} {"train_loss": -5.594236850738525, "global_step": 38355, "epoch": 913} {"train_loss": -5.524164199829102, "global_step": 38356, "epoch": 913} {"train_loss": -5.611520767211914, "global_step": 38357, "epoch": 913} {"train_loss": -5.554220676422119, "global_step": 38358, "epoch": 913} {"train_loss": -5.614805698394775, "global_step": 38359, "epoch": 913} {"train_loss": -5.664702415466309, "global_step": 38360, "epoch": 913} {"train_loss": -5.45441198348999, "global_step": 38361, "epoch": 913} {"train_loss": -5.66690731048584, "global_step": 38362, "epoch": 913} {"train_loss": -5.549455642700195, "global_step": 38363, "epoch": 913} {"train_loss": -5.621043682098389, "global_step": 38364, "epoch": 913} {"train_loss": -5.5131378173828125, "global_step": 38365, "epoch": 913} {"train_loss": -5.646574974060059, "global_step": 38366, "epoch": 913} {"train_loss": -5.65568208694458, "global_step": 38367, "epoch": 913} {"train_loss": -5.654596328735352, "global_step": 38368, "epoch": 913} {"train_loss": -5.637693405151367, "global_step": 38369, "epoch": 913} {"train_loss": -5.63032341003418, "global_step": 38370, "epoch": 913} {"train_loss": -5.575058937072754, "global_step": 38371, "epoch": 913} {"train_loss": -5.533257961273193, "global_step": 38372, "epoch": 913} {"train_loss": -5.520409107208252, "global_step": 38373, "epoch": 913} {"train_loss": -5.7030744552612305, "global_step": 38374, "epoch": 913} {"train_loss": -5.587392807006836, "global_step": 38375, "epoch": 913} {"train_loss": -5.6473188400268555, "global_step": 38376, "epoch": 913} {"train_loss": -5.686233043670654, "global_step": 38377, "epoch": 913} {"train_loss": -5.7001495361328125, "global_step": 38378, "epoch": 913} {"train_loss": -5.552725791931152, "global_step": 38379, "epoch": 913} {"train_loss": -5.607779026031494, "global_step": 38380, "epoch": 913} {"train_loss": -5.641695976257324, "global_step": 38381, "epoch": 913} {"train_loss": -5.659212112426758, "global_step": 38382, "epoch": 913} {"train_loss": -5.604233741760254, "global_step": 38383, "epoch": 913} {"train_loss": -5.558294296264648, "global_step": 38384, "epoch": 913} {"train_loss": -5.574190616607666, "global_step": 38385, "epoch": 913} {"train_loss": -5.597738742828369, "global_step": 38386, "epoch": 913} {"train_loss": -5.6046663125356035, "global_step": 38387, "epoch": 913, "val_loss": 73400.1171875} {"train_loss": -5.6040778160095215, "global_step": 38388, "epoch": 914} {"train_loss": -5.560585021972656, "global_step": 38389, "epoch": 914} {"train_loss": -5.417160987854004, "global_step": 38390, "epoch": 914} {"train_loss": -5.593992710113525, "global_step": 38391, "epoch": 914} {"train_loss": -5.698165416717529, "global_step": 38392, "epoch": 914} {"train_loss": -5.551975727081299, "global_step": 38393, "epoch": 914} {"train_loss": -5.6096649169921875, "global_step": 38394, "epoch": 914} {"train_loss": -5.61445426940918, "global_step": 38395, "epoch": 914} {"train_loss": -5.603823661804199, "global_step": 38396, "epoch": 914} {"train_loss": -5.639876365661621, "global_step": 38397, "epoch": 914} {"train_loss": -5.511288166046143, "global_step": 38398, "epoch": 914} {"train_loss": -5.5773162841796875, "global_step": 38399, "epoch": 914} {"train_loss": -5.609147548675537, "global_step": 38400, "epoch": 914} {"train_loss": -5.465265274047852, "global_step": 38401, "epoch": 914} {"train_loss": -5.625054836273193, "global_step": 38402, "epoch": 914} {"train_loss": -5.5604448318481445, "global_step": 38403, "epoch": 914} {"train_loss": -5.561452865600586, "global_step": 38404, "epoch": 914} {"train_loss": -5.5079755783081055, "global_step": 38405, "epoch": 914} {"train_loss": -5.645955562591553, "global_step": 38406, "epoch": 914} {"train_loss": -5.555166721343994, "global_step": 38407, "epoch": 914} {"train_loss": -5.696599960327148, "global_step": 38408, "epoch": 914} {"train_loss": -5.606851577758789, "global_step": 38409, "epoch": 914} {"train_loss": -5.599698543548584, "global_step": 38410, "epoch": 914} {"train_loss": -5.597010612487793, "global_step": 38411, "epoch": 914} {"train_loss": -5.635901927947998, "global_step": 38412, "epoch": 914} {"train_loss": -5.605940818786621, "global_step": 38413, "epoch": 914} {"train_loss": -5.650354862213135, "global_step": 38414, "epoch": 914} {"train_loss": -5.51409912109375, "global_step": 38415, "epoch": 914} {"train_loss": -5.464354515075684, "global_step": 38416, "epoch": 914} {"train_loss": -5.571236610412598, "global_step": 38417, "epoch": 914} {"train_loss": -5.600766658782959, "global_step": 38418, "epoch": 914} {"train_loss": -5.479516506195068, "global_step": 38419, "epoch": 914} {"train_loss": -5.656917572021484, "global_step": 38420, "epoch": 914} {"train_loss": -5.497181415557861, "global_step": 38421, "epoch": 914} {"train_loss": -5.557240962982178, "global_step": 38422, "epoch": 914} {"train_loss": -5.5063276290893555, "global_step": 38423, "epoch": 914} {"train_loss": -5.556488990783691, "global_step": 38424, "epoch": 914} {"train_loss": -5.610540866851807, "global_step": 38425, "epoch": 914} {"train_loss": -5.537206649780273, "global_step": 38426, "epoch": 914} {"train_loss": -5.625489234924316, "global_step": 38427, "epoch": 914} {"train_loss": -5.5371174812316895, "global_step": 38428, "epoch": 914} {"train_loss": -5.575999328068325, "global_step": 38429, "epoch": 914, "val_loss": 74614.4453125} {"train_loss": -5.685783863067627, "global_step": 38430, "epoch": 915} {"train_loss": -5.535983085632324, "global_step": 38431, "epoch": 915} {"train_loss": -5.469285011291504, "global_step": 38432, "epoch": 915} {"train_loss": -5.528866291046143, "global_step": 38433, "epoch": 915} {"train_loss": -5.5774335861206055, "global_step": 38434, "epoch": 915} {"train_loss": -5.724824905395508, "global_step": 38435, "epoch": 915} {"train_loss": -5.678149700164795, "global_step": 38436, "epoch": 915} {"train_loss": -5.497478485107422, "global_step": 38437, "epoch": 915} {"train_loss": -5.513106346130371, "global_step": 38438, "epoch": 915} {"train_loss": -5.587552070617676, "global_step": 38439, "epoch": 915} {"train_loss": -5.7237653732299805, "global_step": 38440, "epoch": 915} {"train_loss": -5.490180015563965, "global_step": 38441, "epoch": 915} {"train_loss": -5.552621841430664, "global_step": 38442, "epoch": 915} {"train_loss": -5.5508575439453125, "global_step": 38443, "epoch": 915} {"train_loss": -5.655966758728027, "global_step": 38444, "epoch": 915} {"train_loss": -5.549010753631592, "global_step": 38445, "epoch": 915} {"train_loss": -5.674976348876953, "global_step": 38446, "epoch": 915} {"train_loss": -5.628780364990234, "global_step": 38447, "epoch": 915} {"train_loss": -5.635659694671631, "global_step": 38448, "epoch": 915} {"train_loss": -5.640772819519043, "global_step": 38449, "epoch": 915} {"train_loss": -5.743973731994629, "global_step": 38450, "epoch": 915} {"train_loss": -5.584328651428223, "global_step": 38451, "epoch": 915} {"train_loss": -5.682849884033203, "global_step": 38452, "epoch": 915} {"train_loss": -5.673128604888916, "global_step": 38453, "epoch": 915} {"train_loss": -5.631610870361328, "global_step": 38454, "epoch": 915} {"train_loss": -5.671553611755371, "global_step": 38455, "epoch": 915} {"train_loss": -5.62269926071167, "global_step": 38456, "epoch": 915} {"train_loss": -5.503395080566406, "global_step": 38457, "epoch": 915} {"train_loss": -5.586986064910889, "global_step": 38458, "epoch": 915} {"train_loss": -5.562726974487305, "global_step": 38459, "epoch": 915} {"train_loss": -5.480808258056641, "global_step": 38460, "epoch": 915} {"train_loss": -5.5389790534973145, "global_step": 38461, "epoch": 915} {"train_loss": -5.6025309562683105, "global_step": 38462, "epoch": 915} {"train_loss": -5.703372001647949, "global_step": 38463, "epoch": 915} {"train_loss": -5.699670791625977, "global_step": 38464, "epoch": 915} {"train_loss": -5.751658916473389, "global_step": 38465, "epoch": 915} {"train_loss": -5.668315887451172, "global_step": 38466, "epoch": 915} {"train_loss": -5.494894027709961, "global_step": 38467, "epoch": 915} {"train_loss": -5.533407211303711, "global_step": 38468, "epoch": 915} {"train_loss": -5.631752014160156, "global_step": 38469, "epoch": 915} {"train_loss": -5.598456382751465, "global_step": 38470, "epoch": 915} {"train_loss": -5.60630152339027, "global_step": 38471, "epoch": 915, "val_loss": 73775.859375} {"train_loss": -5.6662397384643555, "global_step": 38472, "epoch": 916} {"train_loss": -5.663625240325928, "global_step": 38473, "epoch": 916} {"train_loss": -5.666623115539551, "global_step": 38474, "epoch": 916} {"train_loss": -5.451007843017578, "global_step": 38475, "epoch": 916} {"train_loss": -5.678326606750488, "global_step": 38476, "epoch": 916} {"train_loss": -5.6617536544799805, "global_step": 38477, "epoch": 916} {"train_loss": -5.624279022216797, "global_step": 38478, "epoch": 916} {"train_loss": -5.632872581481934, "global_step": 38479, "epoch": 916} {"train_loss": -5.572693824768066, "global_step": 38480, "epoch": 916} {"train_loss": -5.552519798278809, "global_step": 38481, "epoch": 916} {"train_loss": -5.634330749511719, "global_step": 38482, "epoch": 916} {"train_loss": -5.44038724899292, "global_step": 38483, "epoch": 916} {"train_loss": -5.411606311798096, "global_step": 38484, "epoch": 916} {"train_loss": -5.738391876220703, "global_step": 38485, "epoch": 916} {"train_loss": -5.369054794311523, "global_step": 38486, "epoch": 916} {"train_loss": -5.552718162536621, "global_step": 38487, "epoch": 916} {"train_loss": -5.422148704528809, "global_step": 38488, "epoch": 916} {"train_loss": -5.515057563781738, "global_step": 38489, "epoch": 916} {"train_loss": -5.643599033355713, "global_step": 38490, "epoch": 916} {"train_loss": -5.60015869140625, "global_step": 38491, "epoch": 916} {"train_loss": -5.646282196044922, "global_step": 38492, "epoch": 916} {"train_loss": -5.514638900756836, "global_step": 38493, "epoch": 916} {"train_loss": -5.594053745269775, "global_step": 38494, "epoch": 916} {"train_loss": -5.503145217895508, "global_step": 38495, "epoch": 916} {"train_loss": -5.549088478088379, "global_step": 38496, "epoch": 916} {"train_loss": -5.531427383422852, "global_step": 38497, "epoch": 916} {"train_loss": -5.595802307128906, "global_step": 38498, "epoch": 916} {"train_loss": -5.636018753051758, "global_step": 38499, "epoch": 916} {"train_loss": -5.513014316558838, "global_step": 38500, "epoch": 916} {"train_loss": -5.517976760864258, "global_step": 38501, "epoch": 916} {"train_loss": -5.425629138946533, "global_step": 38502, "epoch": 916} {"train_loss": -5.443283557891846, "global_step": 38503, "epoch": 916} {"train_loss": -5.581789016723633, "global_step": 38504, "epoch": 916} {"train_loss": -5.493157863616943, "global_step": 38505, "epoch": 916} {"train_loss": -5.659226417541504, "global_step": 38506, "epoch": 916} {"train_loss": -5.528011322021484, "global_step": 38507, "epoch": 916} {"train_loss": -5.444509506225586, "global_step": 38508, "epoch": 916} {"train_loss": -5.669262886047363, "global_step": 38509, "epoch": 916} {"train_loss": -5.599307537078857, "global_step": 38510, "epoch": 916} {"train_loss": -5.543181419372559, "global_step": 38511, "epoch": 916} {"train_loss": -5.49008846282959, "global_step": 38512, "epoch": 916} {"train_loss": -5.561814637411208, "global_step": 38513, "epoch": 916, "val_loss": 73528.359375} {"train_loss": -5.601611137390137, "global_step": 38514, "epoch": 917} {"train_loss": -5.560095310211182, "global_step": 38515, "epoch": 917} {"train_loss": -5.684464454650879, "global_step": 38516, "epoch": 917} {"train_loss": -5.511746406555176, "global_step": 38517, "epoch": 917} {"train_loss": -5.596085071563721, "global_step": 38518, "epoch": 917} {"train_loss": -5.607360363006592, "global_step": 38519, "epoch": 917} {"train_loss": -5.593878746032715, "global_step": 38520, "epoch": 917} {"train_loss": -5.687047004699707, "global_step": 38521, "epoch": 917} {"train_loss": -5.523841857910156, "global_step": 38522, "epoch": 917} {"train_loss": -5.5630083084106445, "global_step": 38523, "epoch": 917} {"train_loss": -5.570998191833496, "global_step": 38524, "epoch": 917} {"train_loss": -5.594391345977783, "global_step": 38525, "epoch": 917} {"train_loss": -5.679765701293945, "global_step": 38526, "epoch": 917} {"train_loss": -5.5179853439331055, "global_step": 38527, "epoch": 917} {"train_loss": -5.718166351318359, "global_step": 38528, "epoch": 917} {"train_loss": -5.556863784790039, "global_step": 38529, "epoch": 917} {"train_loss": -5.701052188873291, "global_step": 38530, "epoch": 917} {"train_loss": -5.634134292602539, "global_step": 38531, "epoch": 917} {"train_loss": -5.558901309967041, "global_step": 38532, "epoch": 917} {"train_loss": -5.630718231201172, "global_step": 38533, "epoch": 917} {"train_loss": -5.637104511260986, "global_step": 38534, "epoch": 917} {"train_loss": -5.532406806945801, "global_step": 38535, "epoch": 917} {"train_loss": -5.466616153717041, "global_step": 38536, "epoch": 917} {"train_loss": -5.518809795379639, "global_step": 38537, "epoch": 917} {"train_loss": -5.617993354797363, "global_step": 38538, "epoch": 917} {"train_loss": -5.5229644775390625, "global_step": 38539, "epoch": 917} {"train_loss": -5.508152008056641, "global_step": 38540, "epoch": 917} {"train_loss": -5.6714277267456055, "global_step": 38541, "epoch": 917} {"train_loss": -5.428404808044434, "global_step": 38542, "epoch": 917} {"train_loss": -5.544378280639648, "global_step": 38543, "epoch": 917} {"train_loss": -5.617893218994141, "global_step": 38544, "epoch": 917} {"train_loss": -5.594735145568848, "global_step": 38545, "epoch": 917} {"train_loss": -5.6020307540893555, "global_step": 38546, "epoch": 917} {"train_loss": -5.550411224365234, "global_step": 38547, "epoch": 917} {"train_loss": -5.540581226348877, "global_step": 38548, "epoch": 917} {"train_loss": -5.555532455444336, "global_step": 38549, "epoch": 917} {"train_loss": -5.54087495803833, "global_step": 38550, "epoch": 917} {"train_loss": -5.603900909423828, "global_step": 38551, "epoch": 917} {"train_loss": -5.495116710662842, "global_step": 38552, "epoch": 917} {"train_loss": -5.53072452545166, "global_step": 38553, "epoch": 917} {"train_loss": -5.617448806762695, "global_step": 38554, "epoch": 917} {"train_loss": -5.581411361694336, "global_step": 38555, "epoch": 917, "val_loss": 74025.2890625} {"train_loss": -5.604857921600342, "global_step": 38556, "epoch": 918} {"train_loss": -5.5100998878479, "global_step": 38557, "epoch": 918} {"train_loss": -5.527705192565918, "global_step": 38558, "epoch": 918} {"train_loss": -5.556034088134766, "global_step": 38559, "epoch": 918} {"train_loss": -5.480067253112793, "global_step": 38560, "epoch": 918} {"train_loss": -5.654091835021973, "global_step": 38561, "epoch": 918} {"train_loss": -5.461296558380127, "global_step": 38562, "epoch": 918} {"train_loss": -5.487327575683594, "global_step": 38563, "epoch": 918} {"train_loss": -5.482268333435059, "global_step": 38564, "epoch": 918} {"train_loss": -5.558216094970703, "global_step": 38565, "epoch": 918} {"train_loss": -5.486730098724365, "global_step": 38566, "epoch": 918} {"train_loss": -5.55478048324585, "global_step": 38567, "epoch": 918} {"train_loss": -5.663233280181885, "global_step": 38568, "epoch": 918} {"train_loss": -5.523519992828369, "global_step": 38569, "epoch": 918} {"train_loss": -5.703451633453369, "global_step": 38570, "epoch": 918} {"train_loss": -5.6329803466796875, "global_step": 38571, "epoch": 918} {"train_loss": -5.625161170959473, "global_step": 38572, "epoch": 918} {"train_loss": -5.677278518676758, "global_step": 38573, "epoch": 918} {"train_loss": -5.621427059173584, "global_step": 38574, "epoch": 918} {"train_loss": -5.544878959655762, "global_step": 38575, "epoch": 918} {"train_loss": -5.572669506072998, "global_step": 38576, "epoch": 918} {"train_loss": -5.546225547790527, "global_step": 38577, "epoch": 918} {"train_loss": -5.653092861175537, "global_step": 38578, "epoch": 918} {"train_loss": -5.608729839324951, "global_step": 38579, "epoch": 918} {"train_loss": -5.6542253494262695, "global_step": 38580, "epoch": 918} {"train_loss": -5.7007904052734375, "global_step": 38581, "epoch": 918} {"train_loss": -5.484795570373535, "global_step": 38582, "epoch": 918} {"train_loss": -5.693626403808594, "global_step": 38583, "epoch": 918} {"train_loss": -5.645249843597412, "global_step": 38584, "epoch": 918} {"train_loss": -5.47878360748291, "global_step": 38585, "epoch": 918} {"train_loss": -5.6091389656066895, "global_step": 38586, "epoch": 918} {"train_loss": -5.680177688598633, "global_step": 38587, "epoch": 918} {"train_loss": -5.647198677062988, "global_step": 38588, "epoch": 918} {"train_loss": -5.6172380447387695, "global_step": 38589, "epoch": 918} {"train_loss": -5.611086368560791, "global_step": 38590, "epoch": 918} {"train_loss": -5.650638580322266, "global_step": 38591, "epoch": 918} {"train_loss": -5.677700042724609, "global_step": 38592, "epoch": 918} {"train_loss": -5.679056644439697, "global_step": 38593, "epoch": 918} {"train_loss": -5.67579460144043, "global_step": 38594, "epoch": 918} {"train_loss": -5.57088041305542, "global_step": 38595, "epoch": 918} {"train_loss": -5.594821929931641, "global_step": 38596, "epoch": 918} {"train_loss": -5.598966916402181, "global_step": 38597, "epoch": 918, "val_loss": 73181.2109375} {"train_loss": -5.64386510848999, "global_step": 38598, "epoch": 919} {"train_loss": -5.683444499969482, "global_step": 38599, "epoch": 919} {"train_loss": -5.569513320922852, "global_step": 38600, "epoch": 919} {"train_loss": -5.668933868408203, "global_step": 38601, "epoch": 919} {"train_loss": -5.706329345703125, "global_step": 38602, "epoch": 919} {"train_loss": -5.669817924499512, "global_step": 38603, "epoch": 919} {"train_loss": -5.714956283569336, "global_step": 38604, "epoch": 919} {"train_loss": -5.659421920776367, "global_step": 38605, "epoch": 919} {"train_loss": -5.781414985656738, "global_step": 38606, "epoch": 919} {"train_loss": -5.516323089599609, "global_step": 38607, "epoch": 919} {"train_loss": -5.6491546630859375, "global_step": 38608, "epoch": 919} {"train_loss": -5.639010906219482, "global_step": 38609, "epoch": 919} {"train_loss": -5.671784400939941, "global_step": 38610, "epoch": 919} {"train_loss": -5.714529991149902, "global_step": 38611, "epoch": 919} {"train_loss": -5.656137466430664, "global_step": 38612, "epoch": 919} {"train_loss": -5.555463790893555, "global_step": 38613, "epoch": 919} {"train_loss": -5.556571960449219, "global_step": 38614, "epoch": 919} {"train_loss": -5.757054328918457, "global_step": 38615, "epoch": 919} {"train_loss": -5.503210067749023, "global_step": 38616, "epoch": 919} {"train_loss": -5.5557861328125, "global_step": 38617, "epoch": 919} {"train_loss": -5.576896667480469, "global_step": 38618, "epoch": 919} {"train_loss": -5.653069496154785, "global_step": 38619, "epoch": 919} {"train_loss": -5.64845609664917, "global_step": 38620, "epoch": 919} {"train_loss": -5.687745571136475, "global_step": 38621, "epoch": 919} {"train_loss": -5.540282726287842, "global_step": 38622, "epoch": 919} {"train_loss": -5.554083824157715, "global_step": 38623, "epoch": 919} {"train_loss": -5.493948936462402, "global_step": 38624, "epoch": 919} {"train_loss": -5.593499183654785, "global_step": 38625, "epoch": 919} {"train_loss": -5.534923553466797, "global_step": 38626, "epoch": 919} {"train_loss": -5.664729595184326, "global_step": 38627, "epoch": 919} {"train_loss": -5.602998733520508, "global_step": 38628, "epoch": 919} {"train_loss": -5.507353782653809, "global_step": 38629, "epoch": 919} {"train_loss": -5.630876541137695, "global_step": 38630, "epoch": 919} {"train_loss": -5.615968704223633, "global_step": 38631, "epoch": 919} {"train_loss": -5.5251312255859375, "global_step": 38632, "epoch": 919} {"train_loss": -5.697544574737549, "global_step": 38633, "epoch": 919} {"train_loss": -5.561803817749023, "global_step": 38634, "epoch": 919} {"train_loss": -5.566473007202148, "global_step": 38635, "epoch": 919} {"train_loss": -5.593607425689697, "global_step": 38636, "epoch": 919} {"train_loss": -5.627200126647949, "global_step": 38637, "epoch": 919} {"train_loss": -5.539523124694824, "global_step": 38638, "epoch": 919} {"train_loss": -5.614872989200411, "global_step": 38639, "epoch": 919, "val_loss": 73371.078125} {"train_loss": -5.69968318939209, "global_step": 38640, "epoch": 920} {"train_loss": -5.636775970458984, "global_step": 38641, "epoch": 920} {"train_loss": -5.64422607421875, "global_step": 38642, "epoch": 920} {"train_loss": -5.686964511871338, "global_step": 38643, "epoch": 920} {"train_loss": -5.692739486694336, "global_step": 38644, "epoch": 920} {"train_loss": -5.568820953369141, "global_step": 38645, "epoch": 920} {"train_loss": -5.768008232116699, "global_step": 38646, "epoch": 920} {"train_loss": -5.6998515129089355, "global_step": 38647, "epoch": 920} {"train_loss": -5.6555070877075195, "global_step": 38648, "epoch": 920} {"train_loss": -5.513564109802246, "global_step": 38649, "epoch": 920} {"train_loss": -5.626991271972656, "global_step": 38650, "epoch": 920} {"train_loss": -5.727500915527344, "global_step": 38651, "epoch": 920} {"train_loss": -5.563577651977539, "global_step": 38652, "epoch": 920} {"train_loss": -5.636344909667969, "global_step": 38653, "epoch": 920} {"train_loss": -5.659462928771973, "global_step": 38654, "epoch": 920} {"train_loss": -5.5655951499938965, "global_step": 38655, "epoch": 920} {"train_loss": -5.583722114562988, "global_step": 38656, "epoch": 920} {"train_loss": -5.538379669189453, "global_step": 38657, "epoch": 920} {"train_loss": -5.593935966491699, "global_step": 38658, "epoch": 920} {"train_loss": -5.655760765075684, "global_step": 38659, "epoch": 920} {"train_loss": -5.627333641052246, "global_step": 38660, "epoch": 920} {"train_loss": -5.650392532348633, "global_step": 38661, "epoch": 920} {"train_loss": -5.678487777709961, "global_step": 38662, "epoch": 920} {"train_loss": -5.657590866088867, "global_step": 38663, "epoch": 920} {"train_loss": -5.565536022186279, "global_step": 38664, "epoch": 920} {"train_loss": -5.669409275054932, "global_step": 38665, "epoch": 920} {"train_loss": -5.757693290710449, "global_step": 38666, "epoch": 920} {"train_loss": -5.467206954956055, "global_step": 38667, "epoch": 920} {"train_loss": -5.569948196411133, "global_step": 38668, "epoch": 920} {"train_loss": -5.5849409103393555, "global_step": 38669, "epoch": 920} {"train_loss": -5.641733169555664, "global_step": 38670, "epoch": 920} {"train_loss": -5.573166847229004, "global_step": 38671, "epoch": 920} {"train_loss": -5.55018424987793, "global_step": 38672, "epoch": 920} {"train_loss": -5.731135368347168, "global_step": 38673, "epoch": 920} {"train_loss": -5.650970458984375, "global_step": 38674, "epoch": 920} {"train_loss": -5.672102451324463, "global_step": 38675, "epoch": 920} {"train_loss": -5.586530685424805, "global_step": 38676, "epoch": 920} {"train_loss": -5.561471939086914, "global_step": 38677, "epoch": 920} {"train_loss": -5.660239219665527, "global_step": 38678, "epoch": 920} {"train_loss": -5.590762138366699, "global_step": 38679, "epoch": 920} {"train_loss": -5.633488655090332, "global_step": 38680, "epoch": 920} {"train_loss": -5.625162737710135, "global_step": 38681, "epoch": 920, "val_loss": 74328.546875} {"train_loss": -5.667377471923828, "global_step": 38682, "epoch": 921} {"train_loss": -5.6236252784729, "global_step": 38683, "epoch": 921} {"train_loss": -5.51823616027832, "global_step": 38684, "epoch": 921} {"train_loss": -5.660237789154053, "global_step": 38685, "epoch": 921} {"train_loss": -5.524236679077148, "global_step": 38686, "epoch": 921} {"train_loss": -5.673120021820068, "global_step": 38687, "epoch": 921} {"train_loss": -5.498546600341797, "global_step": 38688, "epoch": 921} {"train_loss": -5.5503153800964355, "global_step": 38689, "epoch": 921} {"train_loss": -5.582190036773682, "global_step": 38690, "epoch": 921} {"train_loss": -5.465625286102295, "global_step": 38691, "epoch": 921} {"train_loss": -5.492944717407227, "global_step": 38692, "epoch": 921} {"train_loss": -5.597912788391113, "global_step": 38693, "epoch": 921} {"train_loss": -5.503107070922852, "global_step": 38694, "epoch": 921} {"train_loss": -5.590725898742676, "global_step": 38695, "epoch": 921} {"train_loss": -5.43343448638916, "global_step": 38696, "epoch": 921} {"train_loss": -5.586150169372559, "global_step": 38697, "epoch": 921} {"train_loss": -5.50039005279541, "global_step": 38698, "epoch": 921} {"train_loss": -5.485848903656006, "global_step": 38699, "epoch": 921} {"train_loss": -5.598845481872559, "global_step": 38700, "epoch": 921} {"train_loss": -5.430585861206055, "global_step": 38701, "epoch": 921} {"train_loss": -5.686753273010254, "global_step": 38702, "epoch": 921} {"train_loss": -5.472810745239258, "global_step": 38703, "epoch": 921} {"train_loss": -5.632778644561768, "global_step": 38704, "epoch": 921} {"train_loss": -5.541345596313477, "global_step": 38705, "epoch": 921} {"train_loss": -5.500278472900391, "global_step": 38706, "epoch": 921} {"train_loss": -5.652393817901611, "global_step": 38707, "epoch": 921} {"train_loss": -5.650875091552734, "global_step": 38708, "epoch": 921} {"train_loss": -5.648061752319336, "global_step": 38709, "epoch": 921} {"train_loss": -5.653100967407227, "global_step": 38710, "epoch": 921} {"train_loss": -5.708037376403809, "global_step": 38711, "epoch": 921} {"train_loss": -5.605145454406738, "global_step": 38712, "epoch": 921} {"train_loss": -5.579133987426758, "global_step": 38713, "epoch": 921} {"train_loss": -5.490357875823975, "global_step": 38714, "epoch": 921} {"train_loss": -5.687167167663574, "global_step": 38715, "epoch": 921} {"train_loss": -5.683499813079834, "global_step": 38716, "epoch": 921} {"train_loss": -5.620596885681152, "global_step": 38717, "epoch": 921} {"train_loss": -5.717931747436523, "global_step": 38718, "epoch": 921} {"train_loss": -5.650290489196777, "global_step": 38719, "epoch": 921} {"train_loss": -5.696977615356445, "global_step": 38720, "epoch": 921} {"train_loss": -5.5372209548950195, "global_step": 38721, "epoch": 921} {"train_loss": -5.641633033752441, "global_step": 38722, "epoch": 921} {"train_loss": -5.5903457232884, "global_step": 38723, "epoch": 921, "val_loss": 73915.5546875} {"train_loss": -5.626949310302734, "global_step": 38724, "epoch": 922} {"train_loss": -5.5145769119262695, "global_step": 38725, "epoch": 922} {"train_loss": -5.620157241821289, "global_step": 38726, "epoch": 922} {"train_loss": -5.584552764892578, "global_step": 38727, "epoch": 922} {"train_loss": -5.69554328918457, "global_step": 38728, "epoch": 922} {"train_loss": -5.5680718421936035, "global_step": 38729, "epoch": 922} {"train_loss": -5.579923629760742, "global_step": 38730, "epoch": 922} {"train_loss": -5.615481853485107, "global_step": 38731, "epoch": 922} {"train_loss": -5.670750617980957, "global_step": 38732, "epoch": 922} {"train_loss": -5.602931976318359, "global_step": 38733, "epoch": 922} {"train_loss": -5.611306667327881, "global_step": 38734, "epoch": 922} {"train_loss": -5.445396423339844, "global_step": 38735, "epoch": 922} {"train_loss": -5.620235443115234, "global_step": 38736, "epoch": 922} {"train_loss": -5.625487327575684, "global_step": 38737, "epoch": 922} {"train_loss": -5.541775703430176, "global_step": 38738, "epoch": 922} {"train_loss": -5.5297346115112305, "global_step": 38739, "epoch": 922} {"train_loss": -5.760630130767822, "global_step": 38740, "epoch": 922} {"train_loss": -5.678947448730469, "global_step": 38741, "epoch": 922} {"train_loss": -5.582969665527344, "global_step": 38742, "epoch": 922} {"train_loss": -5.606533050537109, "global_step": 38743, "epoch": 922} {"train_loss": -5.613463401794434, "global_step": 38744, "epoch": 922} {"train_loss": -5.578729152679443, "global_step": 38745, "epoch": 922} {"train_loss": -5.4858527183532715, "global_step": 38746, "epoch": 922} {"train_loss": -5.701353073120117, "global_step": 38747, "epoch": 922} {"train_loss": -5.577445030212402, "global_step": 38748, "epoch": 922} {"train_loss": -5.519566059112549, "global_step": 38749, "epoch": 922} {"train_loss": -5.67392110824585, "global_step": 38750, "epoch": 922} {"train_loss": -5.631651878356934, "global_step": 38751, "epoch": 922} {"train_loss": -5.650873184204102, "global_step": 38752, "epoch": 922} {"train_loss": -5.836315155029297, "global_step": 38753, "epoch": 922} {"train_loss": -5.499896049499512, "global_step": 38754, "epoch": 922} {"train_loss": -5.6966376304626465, "global_step": 38755, "epoch": 922} {"train_loss": -5.711428165435791, "global_step": 38756, "epoch": 922} {"train_loss": -5.677151203155518, "global_step": 38757, "epoch": 922} {"train_loss": -5.5936408042907715, "global_step": 38758, "epoch": 922} {"train_loss": -5.603208065032959, "global_step": 38759, "epoch": 922} {"train_loss": -5.752549171447754, "global_step": 38760, "epoch": 922} {"train_loss": -5.561777114868164, "global_step": 38761, "epoch": 922} {"train_loss": -5.593053817749023, "global_step": 38762, "epoch": 922} {"train_loss": -5.5416154861450195, "global_step": 38763, "epoch": 922} {"train_loss": -5.502664566040039, "global_step": 38764, "epoch": 922} {"train_loss": -5.610379491533552, "global_step": 38765, "epoch": 922, "val_loss": 73794.6015625} {"train_loss": -5.530195713043213, "global_step": 38766, "epoch": 923} {"train_loss": -5.658607482910156, "global_step": 38767, "epoch": 923} {"train_loss": -5.635039329528809, "global_step": 38768, "epoch": 923} {"train_loss": -5.535741329193115, "global_step": 38769, "epoch": 923} {"train_loss": -5.44664192199707, "global_step": 38770, "epoch": 923} {"train_loss": -5.592209815979004, "global_step": 38771, "epoch": 923} {"train_loss": -5.62912654876709, "global_step": 38772, "epoch": 923} {"train_loss": -5.438834190368652, "global_step": 38773, "epoch": 923} {"train_loss": -5.551177024841309, "global_step": 38774, "epoch": 923} {"train_loss": -5.6152873039245605, "global_step": 38775, "epoch": 923} {"train_loss": -5.463469505310059, "global_step": 38776, "epoch": 923} {"train_loss": -5.506730556488037, "global_step": 38777, "epoch": 923} {"train_loss": -5.507931709289551, "global_step": 38778, "epoch": 923} {"train_loss": -5.464405536651611, "global_step": 38779, "epoch": 923} {"train_loss": -5.528550624847412, "global_step": 38780, "epoch": 923} {"train_loss": -5.550289154052734, "global_step": 38781, "epoch": 923} {"train_loss": -5.543180465698242, "global_step": 38782, "epoch": 923} {"train_loss": -5.425580024719238, "global_step": 38783, "epoch": 923} {"train_loss": -5.453305244445801, "global_step": 38784, "epoch": 923} {"train_loss": -5.583230972290039, "global_step": 38785, "epoch": 923} {"train_loss": -5.528677940368652, "global_step": 38786, "epoch": 923} {"train_loss": -5.502479076385498, "global_step": 38787, "epoch": 923} {"train_loss": -5.6215667724609375, "global_step": 38788, "epoch": 923} {"train_loss": -5.672494888305664, "global_step": 38789, "epoch": 923} {"train_loss": -5.490810871124268, "global_step": 38790, "epoch": 923} {"train_loss": -5.720745086669922, "global_step": 38791, "epoch": 923} {"train_loss": -5.574896812438965, "global_step": 38792, "epoch": 923} {"train_loss": -5.640514373779297, "global_step": 38793, "epoch": 923} {"train_loss": -5.6382527351379395, "global_step": 38794, "epoch": 923} {"train_loss": -5.653236389160156, "global_step": 38795, "epoch": 923} {"train_loss": -5.585503101348877, "global_step": 38796, "epoch": 923} {"train_loss": -5.566877365112305, "global_step": 38797, "epoch": 923} {"train_loss": -5.599128723144531, "global_step": 38798, "epoch": 923} {"train_loss": -5.659420013427734, "global_step": 38799, "epoch": 923} {"train_loss": -5.606697082519531, "global_step": 38800, "epoch": 923} {"train_loss": -5.703423023223877, "global_step": 38801, "epoch": 923} {"train_loss": -5.626189708709717, "global_step": 38802, "epoch": 923} {"train_loss": -5.6296916007995605, "global_step": 38803, "epoch": 923} {"train_loss": -5.5870490074157715, "global_step": 38804, "epoch": 923} {"train_loss": -5.723616600036621, "global_step": 38805, "epoch": 923} {"train_loss": -5.641019821166992, "global_step": 38806, "epoch": 923} {"train_loss": -5.579689150764828, "global_step": 38807, "epoch": 923, "val_loss": 73806.171875} {"train_loss": -5.654618740081787, "global_step": 38808, "epoch": 924} {"train_loss": -5.6430792808532715, "global_step": 38809, "epoch": 924} {"train_loss": -5.827204704284668, "global_step": 38810, "epoch": 924} {"train_loss": -5.623779296875, "global_step": 38811, "epoch": 924} {"train_loss": -5.607600212097168, "global_step": 38812, "epoch": 924} {"train_loss": -5.64985466003418, "global_step": 38813, "epoch": 924} {"train_loss": -5.7286248207092285, "global_step": 38814, "epoch": 924} {"train_loss": -5.55265474319458, "global_step": 38815, "epoch": 924} {"train_loss": -5.655917167663574, "global_step": 38816, "epoch": 924} {"train_loss": -5.529304504394531, "global_step": 38817, "epoch": 924} {"train_loss": -5.67091178894043, "global_step": 38818, "epoch": 924} {"train_loss": -5.478522300720215, "global_step": 38819, "epoch": 924} {"train_loss": -5.64270544052124, "global_step": 38820, "epoch": 924} {"train_loss": -5.581255912780762, "global_step": 38821, "epoch": 924} {"train_loss": -5.624860763549805, "global_step": 38822, "epoch": 924} {"train_loss": -5.563130855560303, "global_step": 38823, "epoch": 924} {"train_loss": -5.669782638549805, "global_step": 38824, "epoch": 924} {"train_loss": -5.595340251922607, "global_step": 38825, "epoch": 924} {"train_loss": -5.600865364074707, "global_step": 38826, "epoch": 924} {"train_loss": -5.629034996032715, "global_step": 38827, "epoch": 924} {"train_loss": -5.521780490875244, "global_step": 38828, "epoch": 924} {"train_loss": -5.634222984313965, "global_step": 38829, "epoch": 924} {"train_loss": -5.643061637878418, "global_step": 38830, "epoch": 924} {"train_loss": -5.543753623962402, "global_step": 38831, "epoch": 924} {"train_loss": -5.603767395019531, "global_step": 38832, "epoch": 924} {"train_loss": -5.607975006103516, "global_step": 38833, "epoch": 924} {"train_loss": -5.620062828063965, "global_step": 38834, "epoch": 924} {"train_loss": -5.586114883422852, "global_step": 38835, "epoch": 924} {"train_loss": -5.549523830413818, "global_step": 38836, "epoch": 924} {"train_loss": -5.777478218078613, "global_step": 38837, "epoch": 924} {"train_loss": -5.517114639282227, "global_step": 38838, "epoch": 924} {"train_loss": -5.478589057922363, "global_step": 38839, "epoch": 924} {"train_loss": -5.645540714263916, "global_step": 38840, "epoch": 924} {"train_loss": -5.628623008728027, "global_step": 38841, "epoch": 924} {"train_loss": -5.5890607833862305, "global_step": 38842, "epoch": 924} {"train_loss": -5.541565418243408, "global_step": 38843, "epoch": 924} {"train_loss": -5.541035175323486, "global_step": 38844, "epoch": 924} {"train_loss": -5.6324238777160645, "global_step": 38845, "epoch": 924} {"train_loss": -5.600261688232422, "global_step": 38846, "epoch": 924} {"train_loss": -5.627941131591797, "global_step": 38847, "epoch": 924} {"train_loss": -5.5902838706970215, "global_step": 38848, "epoch": 924} {"train_loss": -5.607662859417143, "global_step": 38849, "epoch": 924, "val_loss": 73898.4453125} {"train_loss": -5.64124870300293, "global_step": 38850, "epoch": 925} {"train_loss": -5.697671890258789, "global_step": 38851, "epoch": 925} {"train_loss": -5.495355606079102, "global_step": 38852, "epoch": 925} {"train_loss": -5.720981121063232, "global_step": 38853, "epoch": 925} {"train_loss": -5.646717548370361, "global_step": 38854, "epoch": 925} {"train_loss": -5.618556022644043, "global_step": 38855, "epoch": 925} {"train_loss": -5.716217041015625, "global_step": 38856, "epoch": 925} {"train_loss": -5.576336860656738, "global_step": 38857, "epoch": 925} {"train_loss": -5.429837226867676, "global_step": 38858, "epoch": 925} {"train_loss": -5.638379096984863, "global_step": 38859, "epoch": 925} {"train_loss": -5.445338249206543, "global_step": 38860, "epoch": 925} {"train_loss": -5.589539527893066, "global_step": 38861, "epoch": 925} {"train_loss": -5.552921295166016, "global_step": 38862, "epoch": 925} {"train_loss": -5.5435051918029785, "global_step": 38863, "epoch": 925} {"train_loss": -5.532983779907227, "global_step": 38864, "epoch": 925} {"train_loss": -5.440841197967529, "global_step": 38865, "epoch": 925} {"train_loss": -5.528482437133789, "global_step": 38866, "epoch": 925} {"train_loss": -5.637795448303223, "global_step": 38867, "epoch": 925} {"train_loss": -5.647091865539551, "global_step": 38868, "epoch": 925} {"train_loss": -5.628233909606934, "global_step": 38869, "epoch": 925} {"train_loss": -5.544935703277588, "global_step": 38870, "epoch": 925} {"train_loss": -5.6275177001953125, "global_step": 38871, "epoch": 925} {"train_loss": -5.571166515350342, "global_step": 38872, "epoch": 925} {"train_loss": -5.623362064361572, "global_step": 38873, "epoch": 925} {"train_loss": -5.596611499786377, "global_step": 38874, "epoch": 925} {"train_loss": -5.6030049324035645, "global_step": 38875, "epoch": 925} {"train_loss": -5.783503532409668, "global_step": 38876, "epoch": 925} {"train_loss": -5.58194637298584, "global_step": 38877, "epoch": 925} {"train_loss": -5.512179374694824, "global_step": 38878, "epoch": 925} {"train_loss": -5.4278035163879395, "global_step": 38879, "epoch": 925} {"train_loss": -5.609064102172852, "global_step": 38880, "epoch": 925} {"train_loss": -5.6120219230651855, "global_step": 38881, "epoch": 925} {"train_loss": -5.5265703201293945, "global_step": 38882, "epoch": 925} {"train_loss": -5.727817535400391, "global_step": 38883, "epoch": 925} {"train_loss": -5.6536865234375, "global_step": 38884, "epoch": 925} {"train_loss": -5.695053577423096, "global_step": 38885, "epoch": 925} {"train_loss": -5.610767364501953, "global_step": 38886, "epoch": 925} {"train_loss": -5.625919342041016, "global_step": 38887, "epoch": 925} {"train_loss": -5.617555618286133, "global_step": 38888, "epoch": 925} {"train_loss": -5.505231857299805, "global_step": 38889, "epoch": 925} {"train_loss": -5.693775177001953, "global_step": 38890, "epoch": 925} {"train_loss": -5.598437286558605, "global_step": 38891, "epoch": 925, "val_loss": 73855.90625} {"train_loss": -5.572432994842529, "global_step": 38892, "epoch": 926} {"train_loss": -5.578635215759277, "global_step": 38893, "epoch": 926} {"train_loss": -5.595550537109375, "global_step": 38894, "epoch": 926} {"train_loss": -5.490060806274414, "global_step": 38895, "epoch": 926} {"train_loss": -5.650508880615234, "global_step": 38896, "epoch": 926} {"train_loss": -5.530155658721924, "global_step": 38897, "epoch": 926} {"train_loss": -5.575118064880371, "global_step": 38898, "epoch": 926} {"train_loss": -5.619129180908203, "global_step": 38899, "epoch": 926} {"train_loss": -5.701067924499512, "global_step": 38900, "epoch": 926} {"train_loss": -5.6845269203186035, "global_step": 38901, "epoch": 926} {"train_loss": -5.621451377868652, "global_step": 38902, "epoch": 926} {"train_loss": -5.793145656585693, "global_step": 38903, "epoch": 926} {"train_loss": -5.519118309020996, "global_step": 38904, "epoch": 926} {"train_loss": -5.632575035095215, "global_step": 38905, "epoch": 926} {"train_loss": -5.568423748016357, "global_step": 38906, "epoch": 926} {"train_loss": -5.598631381988525, "global_step": 38907, "epoch": 926} {"train_loss": -5.743775367736816, "global_step": 38908, "epoch": 926} {"train_loss": -5.635719299316406, "global_step": 38909, "epoch": 926} {"train_loss": -5.56467866897583, "global_step": 38910, "epoch": 926} {"train_loss": -5.602221965789795, "global_step": 38911, "epoch": 926} {"train_loss": -5.514630317687988, "global_step": 38912, "epoch": 926} {"train_loss": -5.533082962036133, "global_step": 38913, "epoch": 926} {"train_loss": -5.618931293487549, "global_step": 38914, "epoch": 926} {"train_loss": -5.6626787185668945, "global_step": 38915, "epoch": 926} {"train_loss": -5.602983474731445, "global_step": 38916, "epoch": 926} {"train_loss": -5.5889763832092285, "global_step": 38917, "epoch": 926} {"train_loss": -5.628340721130371, "global_step": 38918, "epoch": 926} {"train_loss": -5.5662841796875, "global_step": 38919, "epoch": 926} {"train_loss": -5.609108924865723, "global_step": 38920, "epoch": 926} {"train_loss": -5.5435285568237305, "global_step": 38921, "epoch": 926} {"train_loss": -5.745424270629883, "global_step": 38922, "epoch": 926} {"train_loss": -5.663311958312988, "global_step": 38923, "epoch": 926} {"train_loss": -5.664471626281738, "global_step": 38924, "epoch": 926} {"train_loss": -5.666692733764648, "global_step": 38925, "epoch": 926} {"train_loss": -5.651644706726074, "global_step": 38926, "epoch": 926} {"train_loss": -5.731270790100098, "global_step": 38927, "epoch": 926} {"train_loss": -5.674260139465332, "global_step": 38928, "epoch": 926} {"train_loss": -5.628090858459473, "global_step": 38929, "epoch": 926} {"train_loss": -5.634669303894043, "global_step": 38930, "epoch": 926} {"train_loss": -5.455169677734375, "global_step": 38931, "epoch": 926} {"train_loss": -5.509444713592529, "global_step": 38932, "epoch": 926} {"train_loss": -5.615039507548015, "global_step": 38933, "epoch": 926, "val_loss": 73628.1015625} {"train_loss": -5.6954665184021, "global_step": 38934, "epoch": 927} {"train_loss": -5.723712921142578, "global_step": 38935, "epoch": 927} {"train_loss": -5.573751926422119, "global_step": 38936, "epoch": 927} {"train_loss": -5.613250732421875, "global_step": 38937, "epoch": 927} {"train_loss": -5.566112518310547, "global_step": 38938, "epoch": 927} {"train_loss": -5.637279987335205, "global_step": 38939, "epoch": 927} {"train_loss": -5.5638628005981445, "global_step": 38940, "epoch": 927} {"train_loss": -5.512434482574463, "global_step": 38941, "epoch": 927} {"train_loss": -5.578685760498047, "global_step": 38942, "epoch": 927} {"train_loss": -5.62283992767334, "global_step": 38943, "epoch": 927} {"train_loss": -5.458492279052734, "global_step": 38944, "epoch": 927} {"train_loss": -5.570611000061035, "global_step": 38945, "epoch": 927} {"train_loss": -5.6332597732543945, "global_step": 38946, "epoch": 927} {"train_loss": -5.586409568786621, "global_step": 38947, "epoch": 927} {"train_loss": -5.48902702331543, "global_step": 38948, "epoch": 927} {"train_loss": -5.6587653160095215, "global_step": 38949, "epoch": 927} {"train_loss": -5.464059829711914, "global_step": 38950, "epoch": 927} {"train_loss": -5.604147434234619, "global_step": 38951, "epoch": 927} {"train_loss": -5.619398593902588, "global_step": 38952, "epoch": 927} {"train_loss": -5.515480995178223, "global_step": 38953, "epoch": 927} {"train_loss": -5.641107559204102, "global_step": 38954, "epoch": 927} {"train_loss": -5.512213230133057, "global_step": 38955, "epoch": 927} {"train_loss": -5.628948211669922, "global_step": 38956, "epoch": 927} {"train_loss": -5.635085105895996, "global_step": 38957, "epoch": 927} {"train_loss": -5.504341125488281, "global_step": 38958, "epoch": 927} {"train_loss": -5.5695061683654785, "global_step": 38959, "epoch": 927} {"train_loss": -5.639232158660889, "global_step": 38960, "epoch": 927} {"train_loss": -5.547494411468506, "global_step": 38961, "epoch": 927} {"train_loss": -5.535147666931152, "global_step": 38962, "epoch": 927} {"train_loss": -5.602087020874023, "global_step": 38963, "epoch": 927} {"train_loss": -5.652096748352051, "global_step": 38964, "epoch": 927} {"train_loss": -5.849150657653809, "global_step": 38965, "epoch": 927} {"train_loss": -5.470555305480957, "global_step": 38966, "epoch": 927} {"train_loss": -5.628793239593506, "global_step": 38967, "epoch": 927} {"train_loss": -5.637035846710205, "global_step": 38968, "epoch": 927} {"train_loss": -5.466997146606445, "global_step": 38969, "epoch": 927} {"train_loss": -5.624485015869141, "global_step": 38970, "epoch": 927} {"train_loss": -5.613034725189209, "global_step": 38971, "epoch": 927} {"train_loss": -5.688841819763184, "global_step": 38972, "epoch": 927} {"train_loss": -5.644116401672363, "global_step": 38973, "epoch": 927} {"train_loss": -5.696653366088867, "global_step": 38974, "epoch": 927} {"train_loss": -5.598700103305635, "global_step": 38975, "epoch": 927, "val_loss": 73596.515625} {"train_loss": -5.724028587341309, "global_step": 38976, "epoch": 928} {"train_loss": -5.666348457336426, "global_step": 38977, "epoch": 928} {"train_loss": -5.599527835845947, "global_step": 38978, "epoch": 928} {"train_loss": -5.529215335845947, "global_step": 38979, "epoch": 928} {"train_loss": -5.622487545013428, "global_step": 38980, "epoch": 928} {"train_loss": -5.639041423797607, "global_step": 38981, "epoch": 928} {"train_loss": -5.718756675720215, "global_step": 38982, "epoch": 928} {"train_loss": -5.60598611831665, "global_step": 38983, "epoch": 928} {"train_loss": -5.574695587158203, "global_step": 38984, "epoch": 928} {"train_loss": -5.619846343994141, "global_step": 38985, "epoch": 928} {"train_loss": -5.715676307678223, "global_step": 38986, "epoch": 928} {"train_loss": -5.651208877563477, "global_step": 38987, "epoch": 928} {"train_loss": -5.627437591552734, "global_step": 38988, "epoch": 928} {"train_loss": -5.647558212280273, "global_step": 38989, "epoch": 928} {"train_loss": -5.582239151000977, "global_step": 38990, "epoch": 928} {"train_loss": -5.637850284576416, "global_step": 38991, "epoch": 928} {"train_loss": -5.677921295166016, "global_step": 38992, "epoch": 928} {"train_loss": -5.583422660827637, "global_step": 38993, "epoch": 928} {"train_loss": -5.607940673828125, "global_step": 38994, "epoch": 928} {"train_loss": -5.6726884841918945, "global_step": 38995, "epoch": 928} {"train_loss": -5.504010200500488, "global_step": 38996, "epoch": 928} {"train_loss": -5.612941265106201, "global_step": 38997, "epoch": 928} {"train_loss": -5.591075420379639, "global_step": 38998, "epoch": 928} {"train_loss": -5.740802764892578, "global_step": 38999, "epoch": 928} {"train_loss": -5.6265153884887695, "global_step": 39000, "epoch": 928} {"train_loss": -5.678921222686768, "global_step": 39001, "epoch": 928} {"train_loss": -5.507436275482178, "global_step": 39002, "epoch": 928} {"train_loss": -5.6637396812438965, "global_step": 39003, "epoch": 928} {"train_loss": -5.741690158843994, "global_step": 39004, "epoch": 928} {"train_loss": -5.598875045776367, "global_step": 39005, "epoch": 928} {"train_loss": -5.532310962677002, "global_step": 39006, "epoch": 928} {"train_loss": -5.559903621673584, "global_step": 39007, "epoch": 928} {"train_loss": -5.644762992858887, "global_step": 39008, "epoch": 928} {"train_loss": -5.552096366882324, "global_step": 39009, "epoch": 928} {"train_loss": -5.73325777053833, "global_step": 39010, "epoch": 928} {"train_loss": -5.648958683013916, "global_step": 39011, "epoch": 928} {"train_loss": -5.611270904541016, "global_step": 39012, "epoch": 928} {"train_loss": -5.710092544555664, "global_step": 39013, "epoch": 928} {"train_loss": -5.60926628112793, "global_step": 39014, "epoch": 928} {"train_loss": -5.569304466247559, "global_step": 39015, "epoch": 928} {"train_loss": -5.537083625793457, "global_step": 39016, "epoch": 928} {"train_loss": -5.62719251995995, "global_step": 39017, "epoch": 928, "val_loss": 74057.1875} {"train_loss": -5.651839733123779, "global_step": 39018, "epoch": 929} {"train_loss": -5.492746353149414, "global_step": 39019, "epoch": 929} {"train_loss": -5.543820381164551, "global_step": 39020, "epoch": 929} {"train_loss": -5.576501846313477, "global_step": 39021, "epoch": 929} {"train_loss": -5.5684404373168945, "global_step": 39022, "epoch": 929} {"train_loss": -5.527632713317871, "global_step": 39023, "epoch": 929} {"train_loss": -5.689113616943359, "global_step": 39024, "epoch": 929} {"train_loss": -5.543895244598389, "global_step": 39025, "epoch": 929} {"train_loss": -5.542089939117432, "global_step": 39026, "epoch": 929} {"train_loss": -5.564461708068848, "global_step": 39027, "epoch": 929} {"train_loss": -5.556341171264648, "global_step": 39028, "epoch": 929} {"train_loss": -5.533271312713623, "global_step": 39029, "epoch": 929} {"train_loss": -5.721566200256348, "global_step": 39030, "epoch": 929} {"train_loss": -5.567554473876953, "global_step": 39031, "epoch": 929} {"train_loss": -5.697242736816406, "global_step": 39032, "epoch": 929} {"train_loss": -5.7280731201171875, "global_step": 39033, "epoch": 929} {"train_loss": -5.753591537475586, "global_step": 39034, "epoch": 929} {"train_loss": -5.674648284912109, "global_step": 39035, "epoch": 929} {"train_loss": -5.64925479888916, "global_step": 39036, "epoch": 929} {"train_loss": -5.563413143157959, "global_step": 39037, "epoch": 929} {"train_loss": -5.640424728393555, "global_step": 39038, "epoch": 929} {"train_loss": -5.669318199157715, "global_step": 39039, "epoch": 929} {"train_loss": -5.7448320388793945, "global_step": 39040, "epoch": 929} {"train_loss": -5.641670227050781, "global_step": 39041, "epoch": 929} {"train_loss": -5.564573764801025, "global_step": 39042, "epoch": 929} {"train_loss": -5.482948303222656, "global_step": 39043, "epoch": 929} {"train_loss": -5.597792625427246, "global_step": 39044, "epoch": 929} {"train_loss": -5.561345100402832, "global_step": 39045, "epoch": 929} {"train_loss": -5.572279930114746, "global_step": 39046, "epoch": 929} {"train_loss": -5.659507751464844, "global_step": 39047, "epoch": 929} {"train_loss": -5.514719486236572, "global_step": 39048, "epoch": 929} {"train_loss": -5.5547285079956055, "global_step": 39049, "epoch": 929} {"train_loss": -5.604565620422363, "global_step": 39050, "epoch": 929} {"train_loss": -5.5755295753479, "global_step": 39051, "epoch": 929} {"train_loss": -5.72845458984375, "global_step": 39052, "epoch": 929} {"train_loss": -5.420592308044434, "global_step": 39053, "epoch": 929} {"train_loss": -5.7452921867370605, "global_step": 39054, "epoch": 929} {"train_loss": -5.578909873962402, "global_step": 39055, "epoch": 929} {"train_loss": -5.6027021408081055, "global_step": 39056, "epoch": 929} {"train_loss": -5.629345893859863, "global_step": 39057, "epoch": 929} {"train_loss": -5.4739885330200195, "global_step": 39058, "epoch": 929} {"train_loss": -5.602531614757719, "global_step": 39059, "epoch": 929, "val_loss": 74145.796875} {"train_loss": -5.504777431488037, "global_step": 39060, "epoch": 930} {"train_loss": -5.774218559265137, "global_step": 39061, "epoch": 930} {"train_loss": -5.61433219909668, "global_step": 39062, "epoch": 930} {"train_loss": -5.57917594909668, "global_step": 39063, "epoch": 930} {"train_loss": -5.543097496032715, "global_step": 39064, "epoch": 930} {"train_loss": -5.576775550842285, "global_step": 39065, "epoch": 930} {"train_loss": -5.705000877380371, "global_step": 39066, "epoch": 930} {"train_loss": -5.647946357727051, "global_step": 39067, "epoch": 930} {"train_loss": -5.611332893371582, "global_step": 39068, "epoch": 930} {"train_loss": -5.519236087799072, "global_step": 39069, "epoch": 930} {"train_loss": -5.539972305297852, "global_step": 39070, "epoch": 930} {"train_loss": -5.548888206481934, "global_step": 39071, "epoch": 930} {"train_loss": -5.67672061920166, "global_step": 39072, "epoch": 930} {"train_loss": -5.549490451812744, "global_step": 39073, "epoch": 930} {"train_loss": -5.563709259033203, "global_step": 39074, "epoch": 930} {"train_loss": -5.640586853027344, "global_step": 39075, "epoch": 930} {"train_loss": -5.506782531738281, "global_step": 39076, "epoch": 930} {"train_loss": -5.6154632568359375, "global_step": 39077, "epoch": 930} {"train_loss": -5.598457336425781, "global_step": 39078, "epoch": 930} {"train_loss": -5.433895111083984, "global_step": 39079, "epoch": 930} {"train_loss": -5.682041168212891, "global_step": 39080, "epoch": 930} {"train_loss": -5.52023458480835, "global_step": 39081, "epoch": 930} {"train_loss": -5.570825576782227, "global_step": 39082, "epoch": 930} {"train_loss": -5.487314224243164, "global_step": 39083, "epoch": 930} {"train_loss": -5.385235786437988, "global_step": 39084, "epoch": 930} {"train_loss": -5.577944755554199, "global_step": 39085, "epoch": 930} {"train_loss": -5.514444351196289, "global_step": 39086, "epoch": 930} {"train_loss": -5.61122989654541, "global_step": 39087, "epoch": 930} {"train_loss": -5.474132061004639, "global_step": 39088, "epoch": 930} {"train_loss": -5.588145732879639, "global_step": 39089, "epoch": 930} {"train_loss": -5.6666259765625, "global_step": 39090, "epoch": 930} {"train_loss": -5.512528419494629, "global_step": 39091, "epoch": 930} {"train_loss": -5.50990629196167, "global_step": 39092, "epoch": 930} {"train_loss": -5.426331996917725, "global_step": 39093, "epoch": 930} {"train_loss": -5.532549858093262, "global_step": 39094, "epoch": 930} {"train_loss": -5.584657669067383, "global_step": 39095, "epoch": 930} {"train_loss": -5.587484836578369, "global_step": 39096, "epoch": 930} {"train_loss": -5.585239887237549, "global_step": 39097, "epoch": 930} {"train_loss": -5.596997261047363, "global_step": 39098, "epoch": 930} {"train_loss": -5.609781265258789, "global_step": 39099, "epoch": 930} {"train_loss": -5.643289566040039, "global_step": 39100, "epoch": 930} {"train_loss": -5.5722114358629495, "global_step": 39101, "epoch": 930, "val_loss": 73749.59375} {"train_loss": -5.566111087799072, "global_step": 39102, "epoch": 931} {"train_loss": -5.704375743865967, "global_step": 39103, "epoch": 931} {"train_loss": -5.752159118652344, "global_step": 39104, "epoch": 931} {"train_loss": -5.5326995849609375, "global_step": 39105, "epoch": 931} {"train_loss": -5.622668266296387, "global_step": 39106, "epoch": 931} {"train_loss": -5.681478500366211, "global_step": 39107, "epoch": 931} {"train_loss": -5.483397006988525, "global_step": 39108, "epoch": 931} {"train_loss": -5.6512556076049805, "global_step": 39109, "epoch": 931} {"train_loss": -5.4887495040893555, "global_step": 39110, "epoch": 931} {"train_loss": -5.567148208618164, "global_step": 39111, "epoch": 931} {"train_loss": -5.494674205780029, "global_step": 39112, "epoch": 931} {"train_loss": -5.659295082092285, "global_step": 39113, "epoch": 931} {"train_loss": -5.6725850105285645, "global_step": 39114, "epoch": 931} {"train_loss": -5.591135025024414, "global_step": 39115, "epoch": 931} {"train_loss": -5.611940383911133, "global_step": 39116, "epoch": 931} {"train_loss": -5.675775527954102, "global_step": 39117, "epoch": 931} {"train_loss": -5.748950958251953, "global_step": 39118, "epoch": 931} {"train_loss": -5.671209335327148, "global_step": 39119, "epoch": 931} {"train_loss": -5.623234748840332, "global_step": 39120, "epoch": 931} {"train_loss": -5.5502753257751465, "global_step": 39121, "epoch": 931} {"train_loss": -5.564990043640137, "global_step": 39122, "epoch": 931} {"train_loss": -5.5251054763793945, "global_step": 39123, "epoch": 931} {"train_loss": -5.548396587371826, "global_step": 39124, "epoch": 931} {"train_loss": -5.619991302490234, "global_step": 39125, "epoch": 931} {"train_loss": -5.58187198638916, "global_step": 39126, "epoch": 931} {"train_loss": -5.646400451660156, "global_step": 39127, "epoch": 931} {"train_loss": -5.5435590744018555, "global_step": 39128, "epoch": 931} {"train_loss": -5.674675941467285, "global_step": 39129, "epoch": 931} {"train_loss": -5.622725486755371, "global_step": 39130, "epoch": 931} {"train_loss": -5.611745834350586, "global_step": 39131, "epoch": 931} {"train_loss": -5.573204517364502, "global_step": 39132, "epoch": 931} {"train_loss": -5.6402387619018555, "global_step": 39133, "epoch": 931} {"train_loss": -5.660483360290527, "global_step": 39134, "epoch": 931} {"train_loss": -5.592312335968018, "global_step": 39135, "epoch": 931} {"train_loss": -5.6033525466918945, "global_step": 39136, "epoch": 931} {"train_loss": -5.57503604888916, "global_step": 39137, "epoch": 931} {"train_loss": -5.545088768005371, "global_step": 39138, "epoch": 931} {"train_loss": -5.550687313079834, "global_step": 39139, "epoch": 931} {"train_loss": -5.670068740844727, "global_step": 39140, "epoch": 931} {"train_loss": -5.597222328186035, "global_step": 39141, "epoch": 931} {"train_loss": -5.519207000732422, "global_step": 39142, "epoch": 931} {"train_loss": -5.607948825472877, "global_step": 39143, "epoch": 931, "val_loss": 74430.7421875} {"train_loss": -5.453343868255615, "global_step": 39144, "epoch": 932} {"train_loss": -5.648832321166992, "global_step": 39145, "epoch": 932} {"train_loss": -5.564398765563965, "global_step": 39146, "epoch": 932} {"train_loss": -5.611513137817383, "global_step": 39147, "epoch": 932} {"train_loss": -5.5935187339782715, "global_step": 39148, "epoch": 932} {"train_loss": -5.718160152435303, "global_step": 39149, "epoch": 932} {"train_loss": -5.7522478103637695, "global_step": 39150, "epoch": 932} {"train_loss": -5.600874900817871, "global_step": 39151, "epoch": 932} {"train_loss": -5.646594524383545, "global_step": 39152, "epoch": 932} {"train_loss": -5.615966796875, "global_step": 39153, "epoch": 932} {"train_loss": -5.572000980377197, "global_step": 39154, "epoch": 932} {"train_loss": -5.625598430633545, "global_step": 39155, "epoch": 932} {"train_loss": -5.605088710784912, "global_step": 39156, "epoch": 932} {"train_loss": -5.664362907409668, "global_step": 39157, "epoch": 932} {"train_loss": -5.610105514526367, "global_step": 39158, "epoch": 932} {"train_loss": -5.657537460327148, "global_step": 39159, "epoch": 932} {"train_loss": -5.585552215576172, "global_step": 39160, "epoch": 932} {"train_loss": -5.563347816467285, "global_step": 39161, "epoch": 932} {"train_loss": -5.6832427978515625, "global_step": 39162, "epoch": 932} {"train_loss": -5.45435905456543, "global_step": 39163, "epoch": 932} {"train_loss": -5.531527519226074, "global_step": 39164, "epoch": 932} {"train_loss": -5.687576770782471, "global_step": 39165, "epoch": 932} {"train_loss": -5.523859977722168, "global_step": 39166, "epoch": 932} {"train_loss": -5.608716011047363, "global_step": 39167, "epoch": 932} {"train_loss": -5.493346214294434, "global_step": 39168, "epoch": 932} {"train_loss": -5.573678016662598, "global_step": 39169, "epoch": 932} {"train_loss": -5.582404136657715, "global_step": 39170, "epoch": 932} {"train_loss": -5.5402512550354, "global_step": 39171, "epoch": 932} {"train_loss": -5.678093910217285, "global_step": 39172, "epoch": 932} {"train_loss": -5.536927223205566, "global_step": 39173, "epoch": 932} {"train_loss": -5.7104926109313965, "global_step": 39174, "epoch": 932} {"train_loss": -5.465124130249023, "global_step": 39175, "epoch": 932} {"train_loss": -5.620292663574219, "global_step": 39176, "epoch": 932} {"train_loss": -5.653453826904297, "global_step": 39177, "epoch": 932} {"train_loss": -5.596153259277344, "global_step": 39178, "epoch": 932} {"train_loss": -5.609220027923584, "global_step": 39179, "epoch": 932} {"train_loss": -5.638171195983887, "global_step": 39180, "epoch": 932} {"train_loss": -5.626198768615723, "global_step": 39181, "epoch": 932} {"train_loss": -5.429030418395996, "global_step": 39182, "epoch": 932} {"train_loss": -5.689761161804199, "global_step": 39183, "epoch": 932} {"train_loss": -5.681787967681885, "global_step": 39184, "epoch": 932} {"train_loss": -5.60266637802124, "global_step": 39185, "epoch": 932, "val_loss": 73955.015625} {"train_loss": -5.51747989654541, "global_step": 39186, "epoch": 933} {"train_loss": -5.621506690979004, "global_step": 39187, "epoch": 933} {"train_loss": -5.609508991241455, "global_step": 39188, "epoch": 933} {"train_loss": -5.448724269866943, "global_step": 39189, "epoch": 933} {"train_loss": -5.522508144378662, "global_step": 39190, "epoch": 933} {"train_loss": -5.3396711349487305, "global_step": 39191, "epoch": 933} {"train_loss": -5.5742950439453125, "global_step": 39192, "epoch": 933} {"train_loss": -5.515389442443848, "global_step": 39193, "epoch": 933} {"train_loss": -5.502184867858887, "global_step": 39194, "epoch": 933} {"train_loss": -5.706533908843994, "global_step": 39195, "epoch": 933} {"train_loss": -5.437891960144043, "global_step": 39196, "epoch": 933} {"train_loss": -5.6736249923706055, "global_step": 39197, "epoch": 933} {"train_loss": -5.5061140060424805, "global_step": 39198, "epoch": 933} {"train_loss": -5.622812747955322, "global_step": 39199, "epoch": 933} {"train_loss": -5.536647796630859, "global_step": 39200, "epoch": 933} {"train_loss": -5.580810546875, "global_step": 39201, "epoch": 933} {"train_loss": -5.520348072052002, "global_step": 39202, "epoch": 933} {"train_loss": -5.547590255737305, "global_step": 39203, "epoch": 933} {"train_loss": -5.617598056793213, "global_step": 39204, "epoch": 933} {"train_loss": -5.552641868591309, "global_step": 39205, "epoch": 933} {"train_loss": -5.607270240783691, "global_step": 39206, "epoch": 933} {"train_loss": -5.634143829345703, "global_step": 39207, "epoch": 933} {"train_loss": -5.661179065704346, "global_step": 39208, "epoch": 933} {"train_loss": -5.580552101135254, "global_step": 39209, "epoch": 933} {"train_loss": -5.548267364501953, "global_step": 39210, "epoch": 933} {"train_loss": -5.629186630249023, "global_step": 39211, "epoch": 933} {"train_loss": -5.630440711975098, "global_step": 39212, "epoch": 933} {"train_loss": -5.732732772827148, "global_step": 39213, "epoch": 933} {"train_loss": -5.584393501281738, "global_step": 39214, "epoch": 933} {"train_loss": -5.602407455444336, "global_step": 39215, "epoch": 933} {"train_loss": -5.540943145751953, "global_step": 39216, "epoch": 933} {"train_loss": -5.615931510925293, "global_step": 39217, "epoch": 933} {"train_loss": -5.753802299499512, "global_step": 39218, "epoch": 933} {"train_loss": -5.589301109313965, "global_step": 39219, "epoch": 933} {"train_loss": -5.687588691711426, "global_step": 39220, "epoch": 933} {"train_loss": -5.6627197265625, "global_step": 39221, "epoch": 933} {"train_loss": -5.577378273010254, "global_step": 39222, "epoch": 933} {"train_loss": -5.744424819946289, "global_step": 39223, "epoch": 933} {"train_loss": -5.568016052246094, "global_step": 39224, "epoch": 933} {"train_loss": -5.412440299987793, "global_step": 39225, "epoch": 933} {"train_loss": -5.653011322021484, "global_step": 39226, "epoch": 933} {"train_loss": -5.5840281418391635, "global_step": 39227, "epoch": 933, "val_loss": 74804.4609375} {"train_loss": -5.413210868835449, "global_step": 39228, "epoch": 934} {"train_loss": -5.629300117492676, "global_step": 39229, "epoch": 934} {"train_loss": -5.443301200866699, "global_step": 39230, "epoch": 934} {"train_loss": -5.654793739318848, "global_step": 39231, "epoch": 934} {"train_loss": -5.563031196594238, "global_step": 39232, "epoch": 934} {"train_loss": -5.388427734375, "global_step": 39233, "epoch": 934} {"train_loss": -5.667762756347656, "global_step": 39234, "epoch": 934} {"train_loss": -5.662419319152832, "global_step": 39235, "epoch": 934} {"train_loss": -5.585238933563232, "global_step": 39236, "epoch": 934} {"train_loss": -5.441278457641602, "global_step": 39237, "epoch": 934} {"train_loss": -5.6842193603515625, "global_step": 39238, "epoch": 934} {"train_loss": -5.5315423011779785, "global_step": 39239, "epoch": 934} {"train_loss": -5.584918022155762, "global_step": 39240, "epoch": 934} {"train_loss": -5.467302322387695, "global_step": 39241, "epoch": 934} {"train_loss": -5.6836090087890625, "global_step": 39242, "epoch": 934} {"train_loss": -5.533224105834961, "global_step": 39243, "epoch": 934} {"train_loss": -5.5496416091918945, "global_step": 39244, "epoch": 934} {"train_loss": -5.536680221557617, "global_step": 39245, "epoch": 934} {"train_loss": -5.59705924987793, "global_step": 39246, "epoch": 934} {"train_loss": -5.612608909606934, "global_step": 39247, "epoch": 934} {"train_loss": -5.501718521118164, "global_step": 39248, "epoch": 934} {"train_loss": -5.519962310791016, "global_step": 39249, "epoch": 934} {"train_loss": -5.746943473815918, "global_step": 39250, "epoch": 934} {"train_loss": -5.633230209350586, "global_step": 39251, "epoch": 934} {"train_loss": -5.5817437171936035, "global_step": 39252, "epoch": 934} {"train_loss": -5.571120262145996, "global_step": 39253, "epoch": 934} {"train_loss": -5.61698579788208, "global_step": 39254, "epoch": 934} {"train_loss": -5.829677581787109, "global_step": 39255, "epoch": 934} {"train_loss": -5.65447998046875, "global_step": 39256, "epoch": 934} {"train_loss": -5.649896621704102, "global_step": 39257, "epoch": 934} {"train_loss": -5.650932312011719, "global_step": 39258, "epoch": 934} {"train_loss": -5.5252685546875, "global_step": 39259, "epoch": 934} {"train_loss": -5.572239875793457, "global_step": 39260, "epoch": 934} {"train_loss": -5.5361328125, "global_step": 39261, "epoch": 934} {"train_loss": -5.634448051452637, "global_step": 39262, "epoch": 934} {"train_loss": -5.580862522125244, "global_step": 39263, "epoch": 934} {"train_loss": -5.576903343200684, "global_step": 39264, "epoch": 934} {"train_loss": -5.612227439880371, "global_step": 39265, "epoch": 934} {"train_loss": -5.669557571411133, "global_step": 39266, "epoch": 934} {"train_loss": -5.569412708282471, "global_step": 39267, "epoch": 934} {"train_loss": -5.682145118713379, "global_step": 39268, "epoch": 934} {"train_loss": -5.589022965658279, "global_step": 39269, "epoch": 934, "val_loss": 74558.5390625} {"train_loss": -5.700501441955566, "global_step": 39270, "epoch": 935} {"train_loss": -5.65262508392334, "global_step": 39271, "epoch": 935} {"train_loss": -5.53094482421875, "global_step": 39272, "epoch": 935} {"train_loss": -5.5620927810668945, "global_step": 39273, "epoch": 935} {"train_loss": -5.641988277435303, "global_step": 39274, "epoch": 935} {"train_loss": -5.689678192138672, "global_step": 39275, "epoch": 935} {"train_loss": -5.7009687423706055, "global_step": 39276, "epoch": 935} {"train_loss": -5.570060729980469, "global_step": 39277, "epoch": 935} {"train_loss": -5.53659725189209, "global_step": 39278, "epoch": 935} {"train_loss": -5.691530227661133, "global_step": 39279, "epoch": 935} {"train_loss": -5.629299163818359, "global_step": 39280, "epoch": 935} {"train_loss": -5.531786918640137, "global_step": 39281, "epoch": 935} {"train_loss": -5.564932346343994, "global_step": 39282, "epoch": 935} {"train_loss": -5.753118515014648, "global_step": 39283, "epoch": 935} {"train_loss": -5.60804557800293, "global_step": 39284, "epoch": 935} {"train_loss": -5.622659206390381, "global_step": 39285, "epoch": 935} {"train_loss": -5.676442623138428, "global_step": 39286, "epoch": 935} {"train_loss": -5.592907428741455, "global_step": 39287, "epoch": 935} {"train_loss": -5.68776273727417, "global_step": 39288, "epoch": 935} {"train_loss": -5.607918739318848, "global_step": 39289, "epoch": 935} {"train_loss": -5.608388900756836, "global_step": 39290, "epoch": 935} {"train_loss": -5.5588579177856445, "global_step": 39291, "epoch": 935} {"train_loss": -5.541455268859863, "global_step": 39292, "epoch": 935} {"train_loss": -5.6484575271606445, "global_step": 39293, "epoch": 935} {"train_loss": -5.566270351409912, "global_step": 39294, "epoch": 935} {"train_loss": -5.669418811798096, "global_step": 39295, "epoch": 935} {"train_loss": -5.55461311340332, "global_step": 39296, "epoch": 935} {"train_loss": -5.663628101348877, "global_step": 39297, "epoch": 935} {"train_loss": -5.620643138885498, "global_step": 39298, "epoch": 935} {"train_loss": -5.642064571380615, "global_step": 39299, "epoch": 935} {"train_loss": -5.5941267013549805, "global_step": 39300, "epoch": 935} {"train_loss": -5.711731433868408, "global_step": 39301, "epoch": 935} {"train_loss": -5.58817195892334, "global_step": 39302, "epoch": 935} {"train_loss": -5.627449989318848, "global_step": 39303, "epoch": 935} {"train_loss": -5.6819257736206055, "global_step": 39304, "epoch": 935} {"train_loss": -5.656713485717773, "global_step": 39305, "epoch": 935} {"train_loss": -5.505983352661133, "global_step": 39306, "epoch": 935} {"train_loss": -5.734699249267578, "global_step": 39307, "epoch": 935} {"train_loss": -5.6159348487854, "global_step": 39308, "epoch": 935} {"train_loss": -5.601595878601074, "global_step": 39309, "epoch": 935} {"train_loss": -5.575796127319336, "global_step": 39310, "epoch": 935} {"train_loss": -5.621868757974534, "global_step": 39311, "epoch": 935, "val_loss": 74031.8984375} {"train_loss": -5.485784530639648, "global_step": 39312, "epoch": 936} {"train_loss": -5.573071479797363, "global_step": 39313, "epoch": 936} {"train_loss": -5.396248817443848, "global_step": 39314, "epoch": 936} {"train_loss": -5.638399600982666, "global_step": 39315, "epoch": 936} {"train_loss": -5.462925910949707, "global_step": 39316, "epoch": 936} {"train_loss": -5.559650897979736, "global_step": 39317, "epoch": 936} {"train_loss": -5.770354270935059, "global_step": 39318, "epoch": 936} {"train_loss": -5.542183876037598, "global_step": 39319, "epoch": 936} {"train_loss": -5.521964073181152, "global_step": 39320, "epoch": 936} {"train_loss": -5.5378828048706055, "global_step": 39321, "epoch": 936} {"train_loss": -5.581782817840576, "global_step": 39322, "epoch": 936} {"train_loss": -5.583303451538086, "global_step": 39323, "epoch": 936} {"train_loss": -5.55994176864624, "global_step": 39324, "epoch": 936} {"train_loss": -5.652004241943359, "global_step": 39325, "epoch": 936} {"train_loss": -5.578163146972656, "global_step": 39326, "epoch": 936} {"train_loss": -5.534117698669434, "global_step": 39327, "epoch": 936} {"train_loss": -5.562220573425293, "global_step": 39328, "epoch": 936} {"train_loss": -5.6389923095703125, "global_step": 39329, "epoch": 936} {"train_loss": -5.61747932434082, "global_step": 39330, "epoch": 936} {"train_loss": -5.473073959350586, "global_step": 39331, "epoch": 936} {"train_loss": -5.576284408569336, "global_step": 39332, "epoch": 936} {"train_loss": -5.56381368637085, "global_step": 39333, "epoch": 936} {"train_loss": -5.459378242492676, "global_step": 39334, "epoch": 936} {"train_loss": -5.48450231552124, "global_step": 39335, "epoch": 936} {"train_loss": -5.6143317222595215, "global_step": 39336, "epoch": 936} {"train_loss": -5.486485481262207, "global_step": 39337, "epoch": 936} {"train_loss": -5.534602165222168, "global_step": 39338, "epoch": 936} {"train_loss": -5.653988361358643, "global_step": 39339, "epoch": 936} {"train_loss": -5.5391364097595215, "global_step": 39340, "epoch": 936} {"train_loss": -5.709324836730957, "global_step": 39341, "epoch": 936} {"train_loss": -5.524080276489258, "global_step": 39342, "epoch": 936} {"train_loss": -5.552346706390381, "global_step": 39343, "epoch": 936} {"train_loss": -5.588440895080566, "global_step": 39344, "epoch": 936} {"train_loss": -5.650287628173828, "global_step": 39345, "epoch": 936} {"train_loss": -5.59359073638916, "global_step": 39346, "epoch": 936} {"train_loss": -5.703510761260986, "global_step": 39347, "epoch": 936} {"train_loss": -5.593050479888916, "global_step": 39348, "epoch": 936} {"train_loss": -5.727297306060791, "global_step": 39349, "epoch": 936} {"train_loss": -5.592675685882568, "global_step": 39350, "epoch": 936} {"train_loss": -5.542201519012451, "global_step": 39351, "epoch": 936} {"train_loss": -5.690009593963623, "global_step": 39352, "epoch": 936} {"train_loss": -5.581874960944766, "global_step": 39353, "epoch": 936, "val_loss": 73694.75} {"train_loss": -5.531536102294922, "global_step": 39354, "epoch": 937} {"train_loss": -5.524386405944824, "global_step": 39355, "epoch": 937} {"train_loss": -5.423192977905273, "global_step": 39356, "epoch": 937} {"train_loss": -5.504315376281738, "global_step": 39357, "epoch": 937} {"train_loss": -5.466440200805664, "global_step": 39358, "epoch": 937} {"train_loss": -5.580191612243652, "global_step": 39359, "epoch": 937} {"train_loss": -5.601919174194336, "global_step": 39360, "epoch": 937} {"train_loss": -5.670142650604248, "global_step": 39361, "epoch": 937} {"train_loss": -5.651278972625732, "global_step": 39362, "epoch": 937} {"train_loss": -5.549979209899902, "global_step": 39363, "epoch": 937} {"train_loss": -5.689020156860352, "global_step": 39364, "epoch": 937} {"train_loss": -5.6991682052612305, "global_step": 39365, "epoch": 937} {"train_loss": -5.578714370727539, "global_step": 39366, "epoch": 937} {"train_loss": -5.575047492980957, "global_step": 39367, "epoch": 937} {"train_loss": -5.686131477355957, "global_step": 39368, "epoch": 937} {"train_loss": -5.581308364868164, "global_step": 39369, "epoch": 937} {"train_loss": -5.570676803588867, "global_step": 39370, "epoch": 937} {"train_loss": -5.602631568908691, "global_step": 39371, "epoch": 937} {"train_loss": -5.624743461608887, "global_step": 39372, "epoch": 937} {"train_loss": -5.569604873657227, "global_step": 39373, "epoch": 937} {"train_loss": -5.638751983642578, "global_step": 39374, "epoch": 937} {"train_loss": -5.649548053741455, "global_step": 39375, "epoch": 937} {"train_loss": -5.4566426277160645, "global_step": 39376, "epoch": 937} {"train_loss": -5.671486854553223, "global_step": 39377, "epoch": 937} {"train_loss": -5.574871063232422, "global_step": 39378, "epoch": 937} {"train_loss": -5.520476818084717, "global_step": 39379, "epoch": 937} {"train_loss": -5.576837539672852, "global_step": 39380, "epoch": 937} {"train_loss": -5.568821907043457, "global_step": 39381, "epoch": 937} {"train_loss": -5.550787925720215, "global_step": 39382, "epoch": 937} {"train_loss": -5.5743727684021, "global_step": 39383, "epoch": 937} {"train_loss": -5.657671928405762, "global_step": 39384, "epoch": 937} {"train_loss": -5.645204544067383, "global_step": 39385, "epoch": 937} {"train_loss": -5.570498466491699, "global_step": 39386, "epoch": 937} {"train_loss": -5.661759376525879, "global_step": 39387, "epoch": 937} {"train_loss": -5.694343566894531, "global_step": 39388, "epoch": 937} {"train_loss": -5.677227020263672, "global_step": 39389, "epoch": 937} {"train_loss": -5.653444290161133, "global_step": 39390, "epoch": 937} {"train_loss": -5.635517597198486, "global_step": 39391, "epoch": 937} {"train_loss": -5.693912506103516, "global_step": 39392, "epoch": 937} {"train_loss": -5.597795486450195, "global_step": 39393, "epoch": 937} {"train_loss": -5.649618625640869, "global_step": 39394, "epoch": 937} {"train_loss": -5.601966540018718, "global_step": 39395, "epoch": 937, "val_loss": 73492.359375} {"train_loss": -5.665310859680176, "global_step": 39396, "epoch": 938} {"train_loss": -5.543895721435547, "global_step": 39397, "epoch": 938} {"train_loss": -5.6163458824157715, "global_step": 39398, "epoch": 938} {"train_loss": -5.720606803894043, "global_step": 39399, "epoch": 938} {"train_loss": -5.659513473510742, "global_step": 39400, "epoch": 938} {"train_loss": -5.628302097320557, "global_step": 39401, "epoch": 938} {"train_loss": -5.736743927001953, "global_step": 39402, "epoch": 938} {"train_loss": -5.509981155395508, "global_step": 39403, "epoch": 938} {"train_loss": -5.760334491729736, "global_step": 39404, "epoch": 938} {"train_loss": -5.721004486083984, "global_step": 39405, "epoch": 938} {"train_loss": -5.594815254211426, "global_step": 39406, "epoch": 938} {"train_loss": -5.608468055725098, "global_step": 39407, "epoch": 938} {"train_loss": -5.628026962280273, "global_step": 39408, "epoch": 938} {"train_loss": -5.584897518157959, "global_step": 39409, "epoch": 938} {"train_loss": -5.691561222076416, "global_step": 39410, "epoch": 938} {"train_loss": -5.501584053039551, "global_step": 39411, "epoch": 938} {"train_loss": -5.619147777557373, "global_step": 39412, "epoch": 938} {"train_loss": -5.666501045227051, "global_step": 39413, "epoch": 938} {"train_loss": -5.713428497314453, "global_step": 39414, "epoch": 938} {"train_loss": -5.65404748916626, "global_step": 39415, "epoch": 938} {"train_loss": -5.557080268859863, "global_step": 39416, "epoch": 938} {"train_loss": -5.590282440185547, "global_step": 39417, "epoch": 938} {"train_loss": -5.6394853591918945, "global_step": 39418, "epoch": 938} {"train_loss": -5.694418907165527, "global_step": 39419, "epoch": 938} {"train_loss": -5.6254377365112305, "global_step": 39420, "epoch": 938} {"train_loss": -5.6400604248046875, "global_step": 39421, "epoch": 938} {"train_loss": -5.635009765625, "global_step": 39422, "epoch": 938} {"train_loss": -5.715683937072754, "global_step": 39423, "epoch": 938} {"train_loss": -5.74911642074585, "global_step": 39424, "epoch": 938} {"train_loss": -5.659695148468018, "global_step": 39425, "epoch": 938} {"train_loss": -5.731596946716309, "global_step": 39426, "epoch": 938} {"train_loss": -5.53365421295166, "global_step": 39427, "epoch": 938} {"train_loss": -5.512092590332031, "global_step": 39428, "epoch": 938} {"train_loss": -5.727407455444336, "global_step": 39429, "epoch": 938} {"train_loss": -5.737740516662598, "global_step": 39430, "epoch": 938} {"train_loss": -5.717948913574219, "global_step": 39431, "epoch": 938} {"train_loss": -5.673149108886719, "global_step": 39432, "epoch": 938} {"train_loss": -5.608821392059326, "global_step": 39433, "epoch": 938} {"train_loss": -5.623960494995117, "global_step": 39434, "epoch": 938} {"train_loss": -5.639156341552734, "global_step": 39435, "epoch": 938} {"train_loss": -5.684752941131592, "global_step": 39436, "epoch": 938} {"train_loss": -5.645294802529471, "global_step": 39437, "epoch": 938, "val_loss": 73317.3125} {"train_loss": -5.583423137664795, "global_step": 39438, "epoch": 939} {"train_loss": -5.730484962463379, "global_step": 39439, "epoch": 939} {"train_loss": -5.506853103637695, "global_step": 39440, "epoch": 939} {"train_loss": -5.579099178314209, "global_step": 39441, "epoch": 939} {"train_loss": -5.474587440490723, "global_step": 39442, "epoch": 939} {"train_loss": -5.630151748657227, "global_step": 39443, "epoch": 939} {"train_loss": -5.640871047973633, "global_step": 39444, "epoch": 939} {"train_loss": -5.650062084197998, "global_step": 39445, "epoch": 939} {"train_loss": -5.660113334655762, "global_step": 39446, "epoch": 939} {"train_loss": -5.581345558166504, "global_step": 39447, "epoch": 939} {"train_loss": -5.604654312133789, "global_step": 39448, "epoch": 939} {"train_loss": -5.501526355743408, "global_step": 39449, "epoch": 939} {"train_loss": -5.629073619842529, "global_step": 39450, "epoch": 939} {"train_loss": -5.674080848693848, "global_step": 39451, "epoch": 939} {"train_loss": -5.643448829650879, "global_step": 39452, "epoch": 939} {"train_loss": -5.738012313842773, "global_step": 39453, "epoch": 939} {"train_loss": -5.6101531982421875, "global_step": 39454, "epoch": 939} {"train_loss": -5.6316609382629395, "global_step": 39455, "epoch": 939} {"train_loss": -5.625914573669434, "global_step": 39456, "epoch": 939} {"train_loss": -5.560729503631592, "global_step": 39457, "epoch": 939} {"train_loss": -5.658535957336426, "global_step": 39458, "epoch": 939} {"train_loss": -5.656435012817383, "global_step": 39459, "epoch": 939} {"train_loss": -5.574951171875, "global_step": 39460, "epoch": 939} {"train_loss": -5.60273551940918, "global_step": 39461, "epoch": 939} {"train_loss": -5.731632232666016, "global_step": 39462, "epoch": 939} {"train_loss": -5.540988922119141, "global_step": 39463, "epoch": 939} {"train_loss": -5.635541915893555, "global_step": 39464, "epoch": 939} {"train_loss": -5.663976669311523, "global_step": 39465, "epoch": 939} {"train_loss": -5.533788681030273, "global_step": 39466, "epoch": 939} {"train_loss": -5.591114044189453, "global_step": 39467, "epoch": 939} {"train_loss": -5.705367088317871, "global_step": 39468, "epoch": 939} {"train_loss": -5.697729587554932, "global_step": 39469, "epoch": 939} {"train_loss": -5.5529961585998535, "global_step": 39470, "epoch": 939} {"train_loss": -5.57257080078125, "global_step": 39471, "epoch": 939} {"train_loss": -5.553588390350342, "global_step": 39472, "epoch": 939} {"train_loss": -5.758490562438965, "global_step": 39473, "epoch": 939} {"train_loss": -5.722444534301758, "global_step": 39474, "epoch": 939} {"train_loss": -5.610871315002441, "global_step": 39475, "epoch": 939} {"train_loss": -5.735169410705566, "global_step": 39476, "epoch": 939} {"train_loss": -5.7353081703186035, "global_step": 39477, "epoch": 939} {"train_loss": -5.641173362731934, "global_step": 39478, "epoch": 939} {"train_loss": -5.630511635825748, "global_step": 39479, "epoch": 939, "val_loss": 73966.9140625} {"train_loss": -5.651784420013428, "global_step": 39480, "epoch": 940} {"train_loss": -5.722752094268799, "global_step": 39481, "epoch": 940} {"train_loss": -5.602586269378662, "global_step": 39482, "epoch": 940} {"train_loss": -5.637073516845703, "global_step": 39483, "epoch": 940} {"train_loss": -5.537194728851318, "global_step": 39484, "epoch": 940} {"train_loss": -5.545370578765869, "global_step": 39485, "epoch": 940} {"train_loss": -5.723267078399658, "global_step": 39486, "epoch": 940} {"train_loss": -5.678507328033447, "global_step": 39487, "epoch": 940} {"train_loss": -5.618401527404785, "global_step": 39488, "epoch": 940} {"train_loss": -5.709630966186523, "global_step": 39489, "epoch": 940} {"train_loss": -5.612244606018066, "global_step": 39490, "epoch": 940} {"train_loss": -5.668020725250244, "global_step": 39491, "epoch": 940} {"train_loss": -5.603641033172607, "global_step": 39492, "epoch": 940} {"train_loss": -5.53967809677124, "global_step": 39493, "epoch": 940} {"train_loss": -5.562686920166016, "global_step": 39494, "epoch": 940} {"train_loss": -5.620573997497559, "global_step": 39495, "epoch": 940} {"train_loss": -5.665450096130371, "global_step": 39496, "epoch": 940} {"train_loss": -5.616696357727051, "global_step": 39497, "epoch": 940} {"train_loss": -5.762993812561035, "global_step": 39498, "epoch": 940} {"train_loss": -5.673595428466797, "global_step": 39499, "epoch": 940} {"train_loss": -5.6176910400390625, "global_step": 39500, "epoch": 940} {"train_loss": -5.611831188201904, "global_step": 39501, "epoch": 940} {"train_loss": -5.686575889587402, "global_step": 39502, "epoch": 940} {"train_loss": -5.654424667358398, "global_step": 39503, "epoch": 940} {"train_loss": -5.523107528686523, "global_step": 39504, "epoch": 940} {"train_loss": -5.695876121520996, "global_step": 39505, "epoch": 940} {"train_loss": -5.568234443664551, "global_step": 39506, "epoch": 940} {"train_loss": -5.582944393157959, "global_step": 39507, "epoch": 940} {"train_loss": -5.622511863708496, "global_step": 39508, "epoch": 940} {"train_loss": -5.651055335998535, "global_step": 39509, "epoch": 940} {"train_loss": -5.49004602432251, "global_step": 39510, "epoch": 940} {"train_loss": -5.608242034912109, "global_step": 39511, "epoch": 940} {"train_loss": -5.694289207458496, "global_step": 39512, "epoch": 940} {"train_loss": -5.478096008300781, "global_step": 39513, "epoch": 940} {"train_loss": -5.594581604003906, "global_step": 39514, "epoch": 940} {"train_loss": -5.574681758880615, "global_step": 39515, "epoch": 940} {"train_loss": -5.5530171394348145, "global_step": 39516, "epoch": 940} {"train_loss": -5.619122505187988, "global_step": 39517, "epoch": 940} {"train_loss": -5.6838579177856445, "global_step": 39518, "epoch": 940} {"train_loss": -5.521752834320068, "global_step": 39519, "epoch": 940} {"train_loss": -5.664472579956055, "global_step": 39520, "epoch": 940} {"train_loss": -5.622106381825039, "global_step": 39521, "epoch": 940, "val_loss": 73696.515625} {"train_loss": -5.6766510009765625, "global_step": 39522, "epoch": 941} {"train_loss": -5.645079612731934, "global_step": 39523, "epoch": 941} {"train_loss": -5.608549118041992, "global_step": 39524, "epoch": 941} {"train_loss": -5.563084125518799, "global_step": 39525, "epoch": 941} {"train_loss": -5.723086357116699, "global_step": 39526, "epoch": 941} {"train_loss": -5.580859184265137, "global_step": 39527, "epoch": 941} {"train_loss": -5.567218780517578, "global_step": 39528, "epoch": 941} {"train_loss": -5.6373610496521, "global_step": 39529, "epoch": 941} {"train_loss": -5.684018135070801, "global_step": 39530, "epoch": 941} {"train_loss": -5.509932518005371, "global_step": 39531, "epoch": 941} {"train_loss": -5.6991095542907715, "global_step": 39532, "epoch": 941} {"train_loss": -5.612973213195801, "global_step": 39533, "epoch": 941} {"train_loss": -5.714692115783691, "global_step": 39534, "epoch": 941} {"train_loss": -5.52904748916626, "global_step": 39535, "epoch": 941} {"train_loss": -5.560833930969238, "global_step": 39536, "epoch": 941} {"train_loss": -5.533201694488525, "global_step": 39537, "epoch": 941} {"train_loss": -5.615413665771484, "global_step": 39538, "epoch": 941} {"train_loss": -5.522787094116211, "global_step": 39539, "epoch": 941} {"train_loss": -5.631287574768066, "global_step": 39540, "epoch": 941} {"train_loss": -5.442955017089844, "global_step": 39541, "epoch": 941} {"train_loss": -5.592533588409424, "global_step": 39542, "epoch": 941} {"train_loss": -5.64406681060791, "global_step": 39543, "epoch": 941} {"train_loss": -5.453183174133301, "global_step": 39544, "epoch": 941} {"train_loss": -5.697144508361816, "global_step": 39545, "epoch": 941} {"train_loss": -5.581844329833984, "global_step": 39546, "epoch": 941} {"train_loss": -5.627092361450195, "global_step": 39547, "epoch": 941} {"train_loss": -5.55928373336792, "global_step": 39548, "epoch": 941} {"train_loss": -5.616512298583984, "global_step": 39549, "epoch": 941} {"train_loss": -5.657495498657227, "global_step": 39550, "epoch": 941} {"train_loss": -5.589268684387207, "global_step": 39551, "epoch": 941} {"train_loss": -5.548964977264404, "global_step": 39552, "epoch": 941} {"train_loss": -5.554093837738037, "global_step": 39553, "epoch": 941} {"train_loss": -5.604097366333008, "global_step": 39554, "epoch": 941} {"train_loss": -5.556027412414551, "global_step": 39555, "epoch": 941} {"train_loss": -5.575894832611084, "global_step": 39556, "epoch": 941} {"train_loss": -5.7059645652771, "global_step": 39557, "epoch": 941} {"train_loss": -5.545352935791016, "global_step": 39558, "epoch": 941} {"train_loss": -5.646049976348877, "global_step": 39559, "epoch": 941} {"train_loss": -5.716169357299805, "global_step": 39560, "epoch": 941} {"train_loss": -5.591632843017578, "global_step": 39561, "epoch": 941} {"train_loss": -5.650398254394531, "global_step": 39562, "epoch": 941} {"train_loss": -5.606532040096464, "global_step": 39563, "epoch": 941, "val_loss": 73227.921875} {"train_loss": -5.718445777893066, "global_step": 39564, "epoch": 942} {"train_loss": -5.653412818908691, "global_step": 39565, "epoch": 942} {"train_loss": -5.592803478240967, "global_step": 39566, "epoch": 942} {"train_loss": -5.64655876159668, "global_step": 39567, "epoch": 942} {"train_loss": -5.564786911010742, "global_step": 39568, "epoch": 942} {"train_loss": -5.624251842498779, "global_step": 39569, "epoch": 942} {"train_loss": -5.701574325561523, "global_step": 39570, "epoch": 942} {"train_loss": -5.515576362609863, "global_step": 39571, "epoch": 942} {"train_loss": -5.7645769119262695, "global_step": 39572, "epoch": 942} {"train_loss": -5.63162899017334, "global_step": 39573, "epoch": 942} {"train_loss": -5.560652256011963, "global_step": 39574, "epoch": 942} {"train_loss": -5.698369026184082, "global_step": 39575, "epoch": 942} {"train_loss": -5.6593427658081055, "global_step": 39576, "epoch": 942} {"train_loss": -5.679200172424316, "global_step": 39577, "epoch": 942} {"train_loss": -5.6218461990356445, "global_step": 39578, "epoch": 942} {"train_loss": -5.6319355964660645, "global_step": 39579, "epoch": 942} {"train_loss": -5.770613670349121, "global_step": 39580, "epoch": 942} {"train_loss": -5.643815994262695, "global_step": 39581, "epoch": 942} {"train_loss": -5.5337233543396, "global_step": 39582, "epoch": 942} {"train_loss": -5.599143028259277, "global_step": 39583, "epoch": 942} {"train_loss": -5.523245811462402, "global_step": 39584, "epoch": 942} {"train_loss": -5.759550094604492, "global_step": 39585, "epoch": 942} {"train_loss": -5.593349456787109, "global_step": 39586, "epoch": 942} {"train_loss": -5.596900939941406, "global_step": 39587, "epoch": 942} {"train_loss": -5.661511421203613, "global_step": 39588, "epoch": 942} {"train_loss": -5.447957992553711, "global_step": 39589, "epoch": 942} {"train_loss": -5.623636245727539, "global_step": 39590, "epoch": 942} {"train_loss": -5.625510215759277, "global_step": 39591, "epoch": 942} {"train_loss": -5.754758834838867, "global_step": 39592, "epoch": 942} {"train_loss": -5.655099868774414, "global_step": 39593, "epoch": 942} {"train_loss": -5.735134601593018, "global_step": 39594, "epoch": 942} {"train_loss": -5.608891487121582, "global_step": 39595, "epoch": 942} {"train_loss": -5.716961860656738, "global_step": 39596, "epoch": 942} {"train_loss": -5.613890171051025, "global_step": 39597, "epoch": 942} {"train_loss": -5.684897422790527, "global_step": 39598, "epoch": 942} {"train_loss": -5.559874534606934, "global_step": 39599, "epoch": 942} {"train_loss": -5.6297831535339355, "global_step": 39600, "epoch": 942} {"train_loss": -5.530610084533691, "global_step": 39601, "epoch": 942} {"train_loss": -5.722315788269043, "global_step": 39602, "epoch": 942} {"train_loss": -5.684267520904541, "global_step": 39603, "epoch": 942} {"train_loss": -5.580430030822754, "global_step": 39604, "epoch": 942} {"train_loss": -5.635685580117362, "global_step": 39605, "epoch": 942, "val_loss": 73804.4375} {"train_loss": -5.552901268005371, "global_step": 39606, "epoch": 943} {"train_loss": -5.669672966003418, "global_step": 39607, "epoch": 943} {"train_loss": -5.669527530670166, "global_step": 39608, "epoch": 943} {"train_loss": -5.577850818634033, "global_step": 39609, "epoch": 943} {"train_loss": -5.67307186126709, "global_step": 39610, "epoch": 943} {"train_loss": -5.678997993469238, "global_step": 39611, "epoch": 943} {"train_loss": -5.681897163391113, "global_step": 39612, "epoch": 943} {"train_loss": -5.647998809814453, "global_step": 39613, "epoch": 943} {"train_loss": -5.633289337158203, "global_step": 39614, "epoch": 943} {"train_loss": -5.5849609375, "global_step": 39615, "epoch": 943} {"train_loss": -5.554653644561768, "global_step": 39616, "epoch": 943} {"train_loss": -5.562323093414307, "global_step": 39617, "epoch": 943} {"train_loss": -5.7461347579956055, "global_step": 39618, "epoch": 943} {"train_loss": -5.467954635620117, "global_step": 39619, "epoch": 943} {"train_loss": -5.651102066040039, "global_step": 39620, "epoch": 943} {"train_loss": -5.612124443054199, "global_step": 39621, "epoch": 943} {"train_loss": -5.508664131164551, "global_step": 39622, "epoch": 943} {"train_loss": -5.514737129211426, "global_step": 39623, "epoch": 943} {"train_loss": -5.573428153991699, "global_step": 39624, "epoch": 943} {"train_loss": -5.491434574127197, "global_step": 39625, "epoch": 943} {"train_loss": -5.5315165519714355, "global_step": 39626, "epoch": 943} {"train_loss": -5.566155433654785, "global_step": 39627, "epoch": 943} {"train_loss": -5.603291034698486, "global_step": 39628, "epoch": 943} {"train_loss": -5.591012001037598, "global_step": 39629, "epoch": 943} {"train_loss": -5.552467346191406, "global_step": 39630, "epoch": 943} {"train_loss": -5.6914472579956055, "global_step": 39631, "epoch": 943} {"train_loss": -5.645113945007324, "global_step": 39632, "epoch": 943} {"train_loss": -5.6740875244140625, "global_step": 39633, "epoch": 943} {"train_loss": -5.699960231781006, "global_step": 39634, "epoch": 943} {"train_loss": -5.683363914489746, "global_step": 39635, "epoch": 943} {"train_loss": -5.588525772094727, "global_step": 39636, "epoch": 943} {"train_loss": -5.633430480957031, "global_step": 39637, "epoch": 943} {"train_loss": -5.578062534332275, "global_step": 39638, "epoch": 943} {"train_loss": -5.650178909301758, "global_step": 39639, "epoch": 943} {"train_loss": -5.663653373718262, "global_step": 39640, "epoch": 943} {"train_loss": -5.564993858337402, "global_step": 39641, "epoch": 943} {"train_loss": -5.622179985046387, "global_step": 39642, "epoch": 943} {"train_loss": -5.690511703491211, "global_step": 39643, "epoch": 943} {"train_loss": -5.726799488067627, "global_step": 39644, "epoch": 943} {"train_loss": -5.556460380554199, "global_step": 39645, "epoch": 943} {"train_loss": -5.647129058837891, "global_step": 39646, "epoch": 943} {"train_loss": -5.6201171875, "global_step": 39647, "epoch": 943, "val_loss": 73634.6796875} {"train_loss": -5.682190895080566, "global_step": 39648, "epoch": 944} {"train_loss": -5.638564586639404, "global_step": 39649, "epoch": 944} {"train_loss": -5.558199882507324, "global_step": 39650, "epoch": 944} {"train_loss": -5.586111068725586, "global_step": 39651, "epoch": 944} {"train_loss": -5.505019664764404, "global_step": 39652, "epoch": 944} {"train_loss": -5.705689430236816, "global_step": 39653, "epoch": 944} {"train_loss": -5.759496688842773, "global_step": 39654, "epoch": 944} {"train_loss": -5.586965084075928, "global_step": 39655, "epoch": 944} {"train_loss": -5.42045783996582, "global_step": 39656, "epoch": 944} {"train_loss": -5.544472694396973, "global_step": 39657, "epoch": 944} {"train_loss": -5.738875389099121, "global_step": 39658, "epoch": 944} {"train_loss": -5.606395244598389, "global_step": 39659, "epoch": 944} {"train_loss": -5.462884902954102, "global_step": 39660, "epoch": 944} {"train_loss": -5.564764499664307, "global_step": 39661, "epoch": 944} {"train_loss": -5.569529056549072, "global_step": 39662, "epoch": 944} {"train_loss": -5.610487937927246, "global_step": 39663, "epoch": 944} {"train_loss": -5.650856971740723, "global_step": 39664, "epoch": 944} {"train_loss": -5.655470371246338, "global_step": 39665, "epoch": 944} {"train_loss": -5.641545295715332, "global_step": 39666, "epoch": 944} {"train_loss": -5.686968803405762, "global_step": 39667, "epoch": 944} {"train_loss": -5.501803398132324, "global_step": 39668, "epoch": 944} {"train_loss": -5.69239616394043, "global_step": 39669, "epoch": 944} {"train_loss": -5.545854568481445, "global_step": 39670, "epoch": 944} {"train_loss": -5.734195232391357, "global_step": 39671, "epoch": 944} {"train_loss": -5.6772918701171875, "global_step": 39672, "epoch": 944} {"train_loss": -5.473800182342529, "global_step": 39673, "epoch": 944} {"train_loss": -5.567418098449707, "global_step": 39674, "epoch": 944} {"train_loss": -5.47307825088501, "global_step": 39675, "epoch": 944} {"train_loss": -5.522146224975586, "global_step": 39676, "epoch": 944} {"train_loss": -5.610294818878174, "global_step": 39677, "epoch": 944} {"train_loss": -5.524425029754639, "global_step": 39678, "epoch": 944} {"train_loss": -5.73029899597168, "global_step": 39679, "epoch": 944} {"train_loss": -5.702369689941406, "global_step": 39680, "epoch": 944} {"train_loss": -5.739422798156738, "global_step": 39681, "epoch": 944} {"train_loss": -5.669520378112793, "global_step": 39682, "epoch": 944} {"train_loss": -5.586594581604004, "global_step": 39683, "epoch": 944} {"train_loss": -5.824031829833984, "global_step": 39684, "epoch": 944} {"train_loss": -5.728250503540039, "global_step": 39685, "epoch": 944} {"train_loss": -5.568857669830322, "global_step": 39686, "epoch": 944} {"train_loss": -5.629573822021484, "global_step": 39687, "epoch": 944} {"train_loss": -5.626765251159668, "global_step": 39688, "epoch": 944} {"train_loss": -5.615038996651059, "global_step": 39689, "epoch": 944, "val_loss": 73929.3359375} {"train_loss": -5.722967147827148, "global_step": 39690, "epoch": 945} {"train_loss": -5.659380912780762, "global_step": 39691, "epoch": 945} {"train_loss": -5.615191459655762, "global_step": 39692, "epoch": 945} {"train_loss": -5.647104740142822, "global_step": 39693, "epoch": 945} {"train_loss": -5.741785049438477, "global_step": 39694, "epoch": 945} {"train_loss": -5.742318630218506, "global_step": 39695, "epoch": 945} {"train_loss": -5.633077621459961, "global_step": 39696, "epoch": 945} {"train_loss": -5.709497451782227, "global_step": 39697, "epoch": 945} {"train_loss": -5.595961570739746, "global_step": 39698, "epoch": 945} {"train_loss": -5.60850191116333, "global_step": 39699, "epoch": 945} {"train_loss": -5.575910568237305, "global_step": 39700, "epoch": 945} {"train_loss": -5.735126495361328, "global_step": 39701, "epoch": 945} {"train_loss": -5.579678535461426, "global_step": 39702, "epoch": 945} {"train_loss": -5.689017295837402, "global_step": 39703, "epoch": 945} {"train_loss": -5.57866907119751, "global_step": 39704, "epoch": 945} {"train_loss": -5.69786262512207, "global_step": 39705, "epoch": 945} {"train_loss": -5.640936851501465, "global_step": 39706, "epoch": 945} {"train_loss": -5.629917144775391, "global_step": 39707, "epoch": 945} {"train_loss": -5.637874126434326, "global_step": 39708, "epoch": 945} {"train_loss": -5.505514144897461, "global_step": 39709, "epoch": 945} {"train_loss": -5.599472999572754, "global_step": 39710, "epoch": 945} {"train_loss": -5.630130767822266, "global_step": 39711, "epoch": 945} {"train_loss": -5.522863388061523, "global_step": 39712, "epoch": 945} {"train_loss": -5.586935043334961, "global_step": 39713, "epoch": 945} {"train_loss": -5.642495155334473, "global_step": 39714, "epoch": 945} {"train_loss": -5.623952865600586, "global_step": 39715, "epoch": 945} {"train_loss": -5.71405029296875, "global_step": 39716, "epoch": 945} {"train_loss": -5.68698263168335, "global_step": 39717, "epoch": 945} {"train_loss": -5.598698616027832, "global_step": 39718, "epoch": 945} {"train_loss": -5.641266822814941, "global_step": 39719, "epoch": 945} {"train_loss": -5.65928840637207, "global_step": 39720, "epoch": 945} {"train_loss": -5.676000118255615, "global_step": 39721, "epoch": 945} {"train_loss": -5.574625492095947, "global_step": 39722, "epoch": 945} {"train_loss": -5.657240390777588, "global_step": 39723, "epoch": 945} {"train_loss": -5.682808876037598, "global_step": 39724, "epoch": 945} {"train_loss": -5.562720775604248, "global_step": 39725, "epoch": 945} {"train_loss": -5.566001892089844, "global_step": 39726, "epoch": 945} {"train_loss": -5.69482946395874, "global_step": 39727, "epoch": 945} {"train_loss": -5.637624740600586, "global_step": 39728, "epoch": 945} {"train_loss": -5.552515506744385, "global_step": 39729, "epoch": 945} {"train_loss": -5.587314605712891, "global_step": 39730, "epoch": 945} {"train_loss": -5.6339088508061, "global_step": 39731, "epoch": 945, "val_loss": 74182.5625} {"train_loss": -5.503879547119141, "global_step": 39732, "epoch": 946} {"train_loss": -5.5750932693481445, "global_step": 39733, "epoch": 946} {"train_loss": -5.684603214263916, "global_step": 39734, "epoch": 946} {"train_loss": -5.762620449066162, "global_step": 39735, "epoch": 946} {"train_loss": -5.705455303192139, "global_step": 39736, "epoch": 946} {"train_loss": -5.6036882400512695, "global_step": 39737, "epoch": 946} {"train_loss": -5.674450874328613, "global_step": 39738, "epoch": 946} {"train_loss": -5.553466320037842, "global_step": 39739, "epoch": 946} {"train_loss": -5.483959674835205, "global_step": 39740, "epoch": 946} {"train_loss": -5.556551933288574, "global_step": 39741, "epoch": 946} {"train_loss": -5.615004539489746, "global_step": 39742, "epoch": 946} {"train_loss": -5.630470275878906, "global_step": 39743, "epoch": 946} {"train_loss": -5.5613813400268555, "global_step": 39744, "epoch": 946} {"train_loss": -5.681853294372559, "global_step": 39745, "epoch": 946} {"train_loss": -5.628012180328369, "global_step": 39746, "epoch": 946} {"train_loss": -5.701361656188965, "global_step": 39747, "epoch": 946} {"train_loss": -5.604785442352295, "global_step": 39748, "epoch": 946} {"train_loss": -5.677146911621094, "global_step": 39749, "epoch": 946} {"train_loss": -5.656513214111328, "global_step": 39750, "epoch": 946} {"train_loss": -5.544466018676758, "global_step": 39751, "epoch": 946} {"train_loss": -5.628462791442871, "global_step": 39752, "epoch": 946} {"train_loss": -5.767210960388184, "global_step": 39753, "epoch": 946} {"train_loss": -5.558164119720459, "global_step": 39754, "epoch": 946} {"train_loss": -5.766195297241211, "global_step": 39755, "epoch": 946} {"train_loss": -5.740593910217285, "global_step": 39756, "epoch": 946} {"train_loss": -5.737825393676758, "global_step": 39757, "epoch": 946} {"train_loss": -5.6514739990234375, "global_step": 39758, "epoch": 946} {"train_loss": -5.731174945831299, "global_step": 39759, "epoch": 946} {"train_loss": -5.584905624389648, "global_step": 39760, "epoch": 946} {"train_loss": -5.536927223205566, "global_step": 39761, "epoch": 946} {"train_loss": -5.555035591125488, "global_step": 39762, "epoch": 946} {"train_loss": -5.622768402099609, "global_step": 39763, "epoch": 946} {"train_loss": -5.563769817352295, "global_step": 39764, "epoch": 946} {"train_loss": -5.660149097442627, "global_step": 39765, "epoch": 946} {"train_loss": -5.662989616394043, "global_step": 39766, "epoch": 946} {"train_loss": -5.634622573852539, "global_step": 39767, "epoch": 946} {"train_loss": -5.588861465454102, "global_step": 39768, "epoch": 946} {"train_loss": -5.746417045593262, "global_step": 39769, "epoch": 946} {"train_loss": -5.566734790802002, "global_step": 39770, "epoch": 946} {"train_loss": -5.645386695861816, "global_step": 39771, "epoch": 946} {"train_loss": -5.5675153732299805, "global_step": 39772, "epoch": 946} {"train_loss": -5.6299651350293844, "global_step": 39773, "epoch": 946, "val_loss": 73879.671875} {"train_loss": -5.612104415893555, "global_step": 39774, "epoch": 947} {"train_loss": -5.617928981781006, "global_step": 39775, "epoch": 947} {"train_loss": -5.655569076538086, "global_step": 39776, "epoch": 947} {"train_loss": -5.668079376220703, "global_step": 39777, "epoch": 947} {"train_loss": -5.511327266693115, "global_step": 39778, "epoch": 947} {"train_loss": -5.636238098144531, "global_step": 39779, "epoch": 947} {"train_loss": -5.681497573852539, "global_step": 39780, "epoch": 947} {"train_loss": -5.600302696228027, "global_step": 39781, "epoch": 947} {"train_loss": -5.615389347076416, "global_step": 39782, "epoch": 947} {"train_loss": -5.711239814758301, "global_step": 39783, "epoch": 947} {"train_loss": -5.480634689331055, "global_step": 39784, "epoch": 947} {"train_loss": -5.555873870849609, "global_step": 39785, "epoch": 947} {"train_loss": -5.653693675994873, "global_step": 39786, "epoch": 947} {"train_loss": -5.54716682434082, "global_step": 39787, "epoch": 947} {"train_loss": -5.578242301940918, "global_step": 39788, "epoch": 947} {"train_loss": -5.51050329208374, "global_step": 39789, "epoch": 947} {"train_loss": -5.652656555175781, "global_step": 39790, "epoch": 947} {"train_loss": -5.727106094360352, "global_step": 39791, "epoch": 947} {"train_loss": -5.623718738555908, "global_step": 39792, "epoch": 947} {"train_loss": -5.786852836608887, "global_step": 39793, "epoch": 947} {"train_loss": -5.603936195373535, "global_step": 39794, "epoch": 947} {"train_loss": -5.573412895202637, "global_step": 39795, "epoch": 947} {"train_loss": -5.737469673156738, "global_step": 39796, "epoch": 947} {"train_loss": -5.563968658447266, "global_step": 39797, "epoch": 947} {"train_loss": -5.6320061683654785, "global_step": 39798, "epoch": 947} {"train_loss": -5.598969459533691, "global_step": 39799, "epoch": 947} {"train_loss": -5.691949844360352, "global_step": 39800, "epoch": 947} {"train_loss": -5.670536518096924, "global_step": 39801, "epoch": 947} {"train_loss": -5.670248031616211, "global_step": 39802, "epoch": 947} {"train_loss": -5.589038372039795, "global_step": 39803, "epoch": 947} {"train_loss": -5.731800556182861, "global_step": 39804, "epoch": 947} {"train_loss": -5.539431095123291, "global_step": 39805, "epoch": 947} {"train_loss": -5.702043533325195, "global_step": 39806, "epoch": 947} {"train_loss": -5.7003021240234375, "global_step": 39807, "epoch": 947} {"train_loss": -5.56226110458374, "global_step": 39808, "epoch": 947} {"train_loss": -5.714773654937744, "global_step": 39809, "epoch": 947} {"train_loss": -5.6958746910095215, "global_step": 39810, "epoch": 947} {"train_loss": -5.622964859008789, "global_step": 39811, "epoch": 947} {"train_loss": -5.574460029602051, "global_step": 39812, "epoch": 947} {"train_loss": -5.712091445922852, "global_step": 39813, "epoch": 947} {"train_loss": -5.598026275634766, "global_step": 39814, "epoch": 947} {"train_loss": -5.630402973720005, "global_step": 39815, "epoch": 947, "val_loss": 74023.53125} {"train_loss": -5.692562103271484, "global_step": 39816, "epoch": 948} {"train_loss": -5.675531387329102, "global_step": 39817, "epoch": 948} {"train_loss": -5.629040718078613, "global_step": 39818, "epoch": 948} {"train_loss": -5.714845657348633, "global_step": 39819, "epoch": 948} {"train_loss": -5.661246299743652, "global_step": 39820, "epoch": 948} {"train_loss": -5.643912315368652, "global_step": 39821, "epoch": 948} {"train_loss": -5.66254997253418, "global_step": 39822, "epoch": 948} {"train_loss": -5.800207138061523, "global_step": 39823, "epoch": 948} {"train_loss": -5.635571479797363, "global_step": 39824, "epoch": 948} {"train_loss": -5.671042442321777, "global_step": 39825, "epoch": 948} {"train_loss": -5.663802623748779, "global_step": 39826, "epoch": 948} {"train_loss": -5.66864013671875, "global_step": 39827, "epoch": 948} {"train_loss": -5.528237342834473, "global_step": 39828, "epoch": 948} {"train_loss": -5.560689926147461, "global_step": 39829, "epoch": 948} {"train_loss": -5.635909080505371, "global_step": 39830, "epoch": 948} {"train_loss": -5.680673599243164, "global_step": 39831, "epoch": 948} {"train_loss": -5.571224689483643, "global_step": 39832, "epoch": 948} {"train_loss": -5.719353199005127, "global_step": 39833, "epoch": 948} {"train_loss": -5.551899433135986, "global_step": 39834, "epoch": 948} {"train_loss": -5.714946746826172, "global_step": 39835, "epoch": 948} {"train_loss": -5.67494010925293, "global_step": 39836, "epoch": 948} {"train_loss": -5.604128837585449, "global_step": 39837, "epoch": 948} {"train_loss": -5.582023620605469, "global_step": 39838, "epoch": 948} {"train_loss": -5.601051330566406, "global_step": 39839, "epoch": 948} {"train_loss": -5.6040730476379395, "global_step": 39840, "epoch": 948} {"train_loss": -5.481837272644043, "global_step": 39841, "epoch": 948} {"train_loss": -5.6057209968566895, "global_step": 39842, "epoch": 948} {"train_loss": -5.354169845581055, "global_step": 39843, "epoch": 948} {"train_loss": -5.610377311706543, "global_step": 39844, "epoch": 948} {"train_loss": -5.741589546203613, "global_step": 39845, "epoch": 948} {"train_loss": -5.614613056182861, "global_step": 39846, "epoch": 948} {"train_loss": -5.499881744384766, "global_step": 39847, "epoch": 948} {"train_loss": -5.703545570373535, "global_step": 39848, "epoch": 948} {"train_loss": -5.659212112426758, "global_step": 39849, "epoch": 948} {"train_loss": -5.543726444244385, "global_step": 39850, "epoch": 948} {"train_loss": -5.672305107116699, "global_step": 39851, "epoch": 948} {"train_loss": -5.547732353210449, "global_step": 39852, "epoch": 948} {"train_loss": -5.637697696685791, "global_step": 39853, "epoch": 948} {"train_loss": -5.652958869934082, "global_step": 39854, "epoch": 948} {"train_loss": -5.62375020980835, "global_step": 39855, "epoch": 948} {"train_loss": -5.457612037658691, "global_step": 39856, "epoch": 948} {"train_loss": -5.623513573691959, "global_step": 39857, "epoch": 948, "val_loss": 74265.7421875} {"train_loss": -5.528413772583008, "global_step": 39858, "epoch": 949} {"train_loss": -5.460205078125, "global_step": 39859, "epoch": 949} {"train_loss": -5.686954498291016, "global_step": 39860, "epoch": 949} {"train_loss": -5.6186113357543945, "global_step": 39861, "epoch": 949} {"train_loss": -5.527482509613037, "global_step": 39862, "epoch": 949} {"train_loss": -5.726266860961914, "global_step": 39863, "epoch": 949} {"train_loss": -5.692453861236572, "global_step": 39864, "epoch": 949} {"train_loss": -5.637398719787598, "global_step": 39865, "epoch": 949} {"train_loss": -5.70826530456543, "global_step": 39866, "epoch": 949} {"train_loss": -5.721189022064209, "global_step": 39867, "epoch": 949} {"train_loss": -5.693821907043457, "global_step": 39868, "epoch": 949} {"train_loss": -5.627201080322266, "global_step": 39869, "epoch": 949} {"train_loss": -5.577579498291016, "global_step": 39870, "epoch": 949} {"train_loss": -5.69696044921875, "global_step": 39871, "epoch": 949} {"train_loss": -5.721047401428223, "global_step": 39872, "epoch": 949} {"train_loss": -5.601835250854492, "global_step": 39873, "epoch": 949} {"train_loss": -5.768075942993164, "global_step": 39874, "epoch": 949} {"train_loss": -5.730687141418457, "global_step": 39875, "epoch": 949} {"train_loss": -5.634598731994629, "global_step": 39876, "epoch": 949} {"train_loss": -5.756075859069824, "global_step": 39877, "epoch": 949} {"train_loss": -5.752455711364746, "global_step": 39878, "epoch": 949} {"train_loss": -5.634876251220703, "global_step": 39879, "epoch": 949} {"train_loss": -5.5994462966918945, "global_step": 39880, "epoch": 949} {"train_loss": -5.550091743469238, "global_step": 39881, "epoch": 949} {"train_loss": -5.691688060760498, "global_step": 39882, "epoch": 949} {"train_loss": -5.720734119415283, "global_step": 39883, "epoch": 949} {"train_loss": -5.651053428649902, "global_step": 39884, "epoch": 949} {"train_loss": -5.671685218811035, "global_step": 39885, "epoch": 949} {"train_loss": -5.605410575866699, "global_step": 39886, "epoch": 949} {"train_loss": -5.539951324462891, "global_step": 39887, "epoch": 949} {"train_loss": -5.611357688903809, "global_step": 39888, "epoch": 949} {"train_loss": -5.532597541809082, "global_step": 39889, "epoch": 949} {"train_loss": -5.53084135055542, "global_step": 39890, "epoch": 949} {"train_loss": -5.5724382400512695, "global_step": 39891, "epoch": 949} {"train_loss": -5.494284629821777, "global_step": 39892, "epoch": 949} {"train_loss": -5.713863849639893, "global_step": 39893, "epoch": 949} {"train_loss": -5.553928375244141, "global_step": 39894, "epoch": 949} {"train_loss": -5.57027530670166, "global_step": 39895, "epoch": 949} {"train_loss": -5.751898765563965, "global_step": 39896, "epoch": 949} {"train_loss": -5.644933223724365, "global_step": 39897, "epoch": 949} {"train_loss": -5.52512264251709, "global_step": 39898, "epoch": 949} {"train_loss": -5.63450042406718, "global_step": 39899, "epoch": 949, "val_loss": 74241.28125} {"train_loss": -5.547309875488281, "global_step": 39900, "epoch": 950} {"train_loss": -5.5815935134887695, "global_step": 39901, "epoch": 950} {"train_loss": -5.607775688171387, "global_step": 39902, "epoch": 950} {"train_loss": -5.408339977264404, "global_step": 39903, "epoch": 950} {"train_loss": -5.4536848068237305, "global_step": 39904, "epoch": 950} {"train_loss": -5.659944534301758, "global_step": 39905, "epoch": 950} {"train_loss": -5.610448360443115, "global_step": 39906, "epoch": 950} {"train_loss": -5.6651692390441895, "global_step": 39907, "epoch": 950} {"train_loss": -5.48908805847168, "global_step": 39908, "epoch": 950} {"train_loss": -5.70166015625, "global_step": 39909, "epoch": 950} {"train_loss": -5.560934543609619, "global_step": 39910, "epoch": 950} {"train_loss": -5.665610313415527, "global_step": 39911, "epoch": 950} {"train_loss": -5.485481262207031, "global_step": 39912, "epoch": 950} {"train_loss": -5.696794509887695, "global_step": 39913, "epoch": 950} {"train_loss": -5.673900604248047, "global_step": 39914, "epoch": 950} {"train_loss": -5.679211616516113, "global_step": 39915, "epoch": 950} {"train_loss": -5.796177864074707, "global_step": 39916, "epoch": 950} {"train_loss": -5.661630630493164, "global_step": 39917, "epoch": 950} {"train_loss": -5.627847671508789, "global_step": 39918, "epoch": 950} {"train_loss": -5.585587501525879, "global_step": 39919, "epoch": 950} {"train_loss": -5.711359024047852, "global_step": 39920, "epoch": 950} {"train_loss": -5.670260429382324, "global_step": 39921, "epoch": 950} {"train_loss": -5.668008804321289, "global_step": 39922, "epoch": 950} {"train_loss": -5.529587745666504, "global_step": 39923, "epoch": 950} {"train_loss": -5.646668434143066, "global_step": 39924, "epoch": 950} {"train_loss": -5.760777473449707, "global_step": 39925, "epoch": 950} {"train_loss": -5.605435371398926, "global_step": 39926, "epoch": 950} {"train_loss": -5.56832218170166, "global_step": 39927, "epoch": 950} {"train_loss": -5.64912748336792, "global_step": 39928, "epoch": 950} {"train_loss": -5.490157127380371, "global_step": 39929, "epoch": 950} {"train_loss": -5.574186325073242, "global_step": 39930, "epoch": 950} {"train_loss": -5.53291654586792, "global_step": 39931, "epoch": 950} {"train_loss": -5.649576187133789, "global_step": 39932, "epoch": 950} {"train_loss": -5.643326282501221, "global_step": 39933, "epoch": 950} {"train_loss": -5.485238075256348, "global_step": 39934, "epoch": 950} {"train_loss": -5.642397403717041, "global_step": 39935, "epoch": 950} {"train_loss": -5.651978969573975, "global_step": 39936, "epoch": 950} {"train_loss": -5.448101997375488, "global_step": 39937, "epoch": 950} {"train_loss": -5.608767986297607, "global_step": 39938, "epoch": 950} {"train_loss": -5.582132339477539, "global_step": 39939, "epoch": 950} {"train_loss": -5.594691276550293, "global_step": 39940, "epoch": 950} {"train_loss": -5.606842143195016, "global_step": 39941, "epoch": 950, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.7988974062140228, "train/sim_max_reward_2": 0.45926645124709436, "train/sim_max_reward_3": 0.17481105573056022, "train/sim_max_reward_4": 0.9525917247338506, "train/sim_max_reward_5": 0.5850830728942209, "test/sim_max_reward_4500000": 0.4916535568859201, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8169410788790759, "test/sim_max_reward_4500003": 0.29798471475540333, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.5161128952494929, "test/sim_max_reward_4500006": 0.8085076825125106, "test/sim_max_reward_4500007": 0.8774319713649027, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.053707604052498775, "test/sim_max_reward_4500010": 0.5691043329593395, "test/sim_max_reward_4500011": 0.9274526768545515, "test/sim_max_reward_4500012": 0.7381292646564553, "test/sim_max_reward_4500013": 2.7072809083901155e-05, "test/sim_max_reward_4500014": 0.9340691322007955, "test/sim_max_reward_4500015": 0.0016954567142534955, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.007277238216077341, "test/sim_max_reward_4500019": 0.725740801893074, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.7800721690747673, "test/sim_max_reward_4500022": 0.5274264039098879, "test/sim_max_reward_4500023": 0.9100538225710774, "test/sim_max_reward_4500024": 0.9244447819109266, "test/sim_max_reward_4500025": 0.44054444331457693, "test/sim_max_reward_4500026": 0.25494899803754734, "test/sim_max_reward_4500027": 0.7203488793053016, "test/sim_max_reward_4500028": 0.46541026133943986, "test/sim_max_reward_4500029": 0.055050955911750354, "test/sim_max_reward_4500030": 0.22013220502949704, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.6302917831686414, "test/sim_max_reward_4500034": 0.781448511067123, "test/sim_max_reward_4500035": 0.798718965467127, "test/sim_max_reward_4500036": 0.9914404693741006, "test/sim_max_reward_4500037": 0.11094066301652025, "test/sim_max_reward_4500038": 0.6756830507761876, "test/sim_max_reward_4500039": 0.21789597073115027, "test/sim_max_reward_4500040": 0.8018463766425454, "test/sim_max_reward_4500041": 0.3696779896113664, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.2215920133439607, "test/sim_max_reward_4500044": 0.3498662759315483, "test/sim_max_reward_4500045": 0.8086107417632225, "test/sim_max_reward_4500046": 0.84040340654365, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.8028510030682199, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5268245345709668, "test/mean_score": 0.43213217967907164, "val_loss": 73635.1875} {"train_loss": -5.637130260467529, "global_step": 39942, "epoch": 951} {"train_loss": -5.532588958740234, "global_step": 39943, "epoch": 951} {"train_loss": -5.564256191253662, "global_step": 39944, "epoch": 951} {"train_loss": -5.71420955657959, "global_step": 39945, "epoch": 951} {"train_loss": -5.544149398803711, "global_step": 39946, "epoch": 951} {"train_loss": -5.599625587463379, "global_step": 39947, "epoch": 951} {"train_loss": -5.520319938659668, "global_step": 39948, "epoch": 951} {"train_loss": -5.49526309967041, "global_step": 39949, "epoch": 951} {"train_loss": -5.600569725036621, "global_step": 39950, "epoch": 951} {"train_loss": -5.643100738525391, "global_step": 39951, "epoch": 951} {"train_loss": -5.545137405395508, "global_step": 39952, "epoch": 951} {"train_loss": -5.7463059425354, "global_step": 39953, "epoch": 951} {"train_loss": -5.631668567657471, "global_step": 39954, "epoch": 951} {"train_loss": -5.8351335525512695, "global_step": 39955, "epoch": 951} {"train_loss": -5.63785457611084, "global_step": 39956, "epoch": 951} {"train_loss": -5.553899765014648, "global_step": 39957, "epoch": 951} {"train_loss": -5.791976451873779, "global_step": 39958, "epoch": 951} {"train_loss": -5.52153205871582, "global_step": 39959, "epoch": 951} {"train_loss": -5.745828628540039, "global_step": 39960, "epoch": 951} {"train_loss": -5.7021636962890625, "global_step": 39961, "epoch": 951} {"train_loss": -5.595264434814453, "global_step": 39962, "epoch": 951} {"train_loss": -5.619747638702393, "global_step": 39963, "epoch": 951} {"train_loss": -5.678865432739258, "global_step": 39964, "epoch": 951} {"train_loss": -5.635249137878418, "global_step": 39965, "epoch": 951} {"train_loss": -5.638944625854492, "global_step": 39966, "epoch": 951} {"train_loss": -5.75816535949707, "global_step": 39967, "epoch": 951} {"train_loss": -5.624811172485352, "global_step": 39968, "epoch": 951} {"train_loss": -5.60876989364624, "global_step": 39969, "epoch": 951} {"train_loss": -5.715363502502441, "global_step": 39970, "epoch": 951} {"train_loss": -5.645212173461914, "global_step": 39971, "epoch": 951} {"train_loss": -5.727004051208496, "global_step": 39972, "epoch": 951} {"train_loss": -5.7665252685546875, "global_step": 39973, "epoch": 951} {"train_loss": -5.701355934143066, "global_step": 39974, "epoch": 951} {"train_loss": -5.5605549812316895, "global_step": 39975, "epoch": 951} {"train_loss": -5.664997100830078, "global_step": 39976, "epoch": 951} {"train_loss": -5.701432228088379, "global_step": 39977, "epoch": 951} {"train_loss": -5.670406341552734, "global_step": 39978, "epoch": 951} {"train_loss": -5.691240310668945, "global_step": 39979, "epoch": 951} {"train_loss": -5.551063537597656, "global_step": 39980, "epoch": 951} {"train_loss": -5.594333648681641, "global_step": 39981, "epoch": 951} {"train_loss": -5.566436767578125, "global_step": 39982, "epoch": 951} {"train_loss": -5.637061107726324, "global_step": 39983, "epoch": 951, "val_loss": 73771.25} {"train_loss": -5.651059627532959, "global_step": 39984, "epoch": 952} {"train_loss": -5.536003112792969, "global_step": 39985, "epoch": 952} {"train_loss": -5.545809745788574, "global_step": 39986, "epoch": 952} {"train_loss": -5.696691513061523, "global_step": 39987, "epoch": 952} {"train_loss": -5.569191932678223, "global_step": 39988, "epoch": 952} {"train_loss": -5.60710334777832, "global_step": 39989, "epoch": 952} {"train_loss": -5.473599433898926, "global_step": 39990, "epoch": 952} {"train_loss": -5.5789971351623535, "global_step": 39991, "epoch": 952} {"train_loss": -5.646311283111572, "global_step": 39992, "epoch": 952} {"train_loss": -5.595228672027588, "global_step": 39993, "epoch": 952} {"train_loss": -5.604134559631348, "global_step": 39994, "epoch": 952} {"train_loss": -5.464620590209961, "global_step": 39995, "epoch": 952} {"train_loss": -5.560644626617432, "global_step": 39996, "epoch": 952} {"train_loss": -5.584729194641113, "global_step": 39997, "epoch": 952} {"train_loss": -5.571953773498535, "global_step": 39998, "epoch": 952} {"train_loss": -5.582657337188721, "global_step": 39999, "epoch": 952} {"train_loss": -5.626986503601074, "global_step": 40000, "epoch": 952} {"train_loss": -5.639276504516602, "global_step": 40001, "epoch": 952} {"train_loss": -5.596829414367676, "global_step": 40002, "epoch": 952} {"train_loss": -5.596815586090088, "global_step": 40003, "epoch": 952} {"train_loss": -5.684443473815918, "global_step": 40004, "epoch": 952} {"train_loss": -5.644888401031494, "global_step": 40005, "epoch": 952} {"train_loss": -5.5692901611328125, "global_step": 40006, "epoch": 952} {"train_loss": -5.654515266418457, "global_step": 40007, "epoch": 952} {"train_loss": -5.4578857421875, "global_step": 40008, "epoch": 952} {"train_loss": -5.561371803283691, "global_step": 40009, "epoch": 952} {"train_loss": -5.671744346618652, "global_step": 40010, "epoch": 952} {"train_loss": -5.512019157409668, "global_step": 40011, "epoch": 952} {"train_loss": -5.536355495452881, "global_step": 40012, "epoch": 952} {"train_loss": -5.693761825561523, "global_step": 40013, "epoch": 952} {"train_loss": -5.738620281219482, "global_step": 40014, "epoch": 952} {"train_loss": -5.669317245483398, "global_step": 40015, "epoch": 952} {"train_loss": -5.565528869628906, "global_step": 40016, "epoch": 952} {"train_loss": -5.638696193695068, "global_step": 40017, "epoch": 952} {"train_loss": -5.613989353179932, "global_step": 40018, "epoch": 952} {"train_loss": -5.559920310974121, "global_step": 40019, "epoch": 952} {"train_loss": -5.590921401977539, "global_step": 40020, "epoch": 952} {"train_loss": -5.658702850341797, "global_step": 40021, "epoch": 952} {"train_loss": -5.530259132385254, "global_step": 40022, "epoch": 952} {"train_loss": -5.7374162673950195, "global_step": 40023, "epoch": 952} {"train_loss": -5.718717575073242, "global_step": 40024, "epoch": 952} {"train_loss": -5.604502564384823, "global_step": 40025, "epoch": 952, "val_loss": 73712.375} {"train_loss": -5.514322280883789, "global_step": 40026, "epoch": 953} {"train_loss": -5.743410110473633, "global_step": 40027, "epoch": 953} {"train_loss": -5.570554256439209, "global_step": 40028, "epoch": 953} {"train_loss": -5.517828941345215, "global_step": 40029, "epoch": 953} {"train_loss": -5.635439872741699, "global_step": 40030, "epoch": 953} {"train_loss": -5.639284133911133, "global_step": 40031, "epoch": 953} {"train_loss": -5.703243255615234, "global_step": 40032, "epoch": 953} {"train_loss": -5.605998992919922, "global_step": 40033, "epoch": 953} {"train_loss": -5.77166748046875, "global_step": 40034, "epoch": 953} {"train_loss": -5.593227386474609, "global_step": 40035, "epoch": 953} {"train_loss": -5.594187259674072, "global_step": 40036, "epoch": 953} {"train_loss": -5.569278717041016, "global_step": 40037, "epoch": 953} {"train_loss": -5.621865749359131, "global_step": 40038, "epoch": 953} {"train_loss": -5.628606796264648, "global_step": 40039, "epoch": 953} {"train_loss": -5.6703314781188965, "global_step": 40040, "epoch": 953} {"train_loss": -5.673778533935547, "global_step": 40041, "epoch": 953} {"train_loss": -5.669734001159668, "global_step": 40042, "epoch": 953} {"train_loss": -5.683443069458008, "global_step": 40043, "epoch": 953} {"train_loss": -5.554570198059082, "global_step": 40044, "epoch": 953} {"train_loss": -5.639447212219238, "global_step": 40045, "epoch": 953} {"train_loss": -5.535958290100098, "global_step": 40046, "epoch": 953} {"train_loss": -5.553751468658447, "global_step": 40047, "epoch": 953} {"train_loss": -5.654861927032471, "global_step": 40048, "epoch": 953} {"train_loss": -5.670690059661865, "global_step": 40049, "epoch": 953} {"train_loss": -5.743972301483154, "global_step": 40050, "epoch": 953} {"train_loss": -5.5648274421691895, "global_step": 40051, "epoch": 953} {"train_loss": -5.654149055480957, "global_step": 40052, "epoch": 953} {"train_loss": -5.721292972564697, "global_step": 40053, "epoch": 953} {"train_loss": -5.6720757484436035, "global_step": 40054, "epoch": 953} {"train_loss": -5.621631622314453, "global_step": 40055, "epoch": 953} {"train_loss": -5.619008541107178, "global_step": 40056, "epoch": 953} {"train_loss": -5.72139835357666, "global_step": 40057, "epoch": 953} {"train_loss": -5.581608772277832, "global_step": 40058, "epoch": 953} {"train_loss": -5.770133972167969, "global_step": 40059, "epoch": 953} {"train_loss": -5.682396411895752, "global_step": 40060, "epoch": 953} {"train_loss": -5.6290059089660645, "global_step": 40061, "epoch": 953} {"train_loss": -5.5706329345703125, "global_step": 40062, "epoch": 953} {"train_loss": -5.699960708618164, "global_step": 40063, "epoch": 953} {"train_loss": -5.601285934448242, "global_step": 40064, "epoch": 953} {"train_loss": -5.629654407501221, "global_step": 40065, "epoch": 953} {"train_loss": -5.757962226867676, "global_step": 40066, "epoch": 953} {"train_loss": -5.641513075147357, "global_step": 40067, "epoch": 953, "val_loss": 74181.796875} {"train_loss": -5.656566619873047, "global_step": 40068, "epoch": 954} {"train_loss": -5.566745281219482, "global_step": 40069, "epoch": 954} {"train_loss": -5.637556076049805, "global_step": 40070, "epoch": 954} {"train_loss": -5.555301666259766, "global_step": 40071, "epoch": 954} {"train_loss": -5.6328911781311035, "global_step": 40072, "epoch": 954} {"train_loss": -5.634217262268066, "global_step": 40073, "epoch": 954} {"train_loss": -5.565770149230957, "global_step": 40074, "epoch": 954} {"train_loss": -5.577930927276611, "global_step": 40075, "epoch": 954} {"train_loss": -5.600114822387695, "global_step": 40076, "epoch": 954} {"train_loss": -5.616413116455078, "global_step": 40077, "epoch": 954} {"train_loss": -5.457996368408203, "global_step": 40078, "epoch": 954} {"train_loss": -5.613363742828369, "global_step": 40079, "epoch": 954} {"train_loss": -5.467167854309082, "global_step": 40080, "epoch": 954} {"train_loss": -5.55537223815918, "global_step": 40081, "epoch": 954} {"train_loss": -5.556894302368164, "global_step": 40082, "epoch": 954} {"train_loss": -5.45892333984375, "global_step": 40083, "epoch": 954} {"train_loss": -5.601669788360596, "global_step": 40084, "epoch": 954} {"train_loss": -5.534391403198242, "global_step": 40085, "epoch": 954} {"train_loss": -5.463384628295898, "global_step": 40086, "epoch": 954} {"train_loss": -5.584866046905518, "global_step": 40087, "epoch": 954} {"train_loss": -5.629022598266602, "global_step": 40088, "epoch": 954} {"train_loss": -5.564164161682129, "global_step": 40089, "epoch": 954} {"train_loss": -5.563164710998535, "global_step": 40090, "epoch": 954} {"train_loss": -5.620694637298584, "global_step": 40091, "epoch": 954} {"train_loss": -5.53836727142334, "global_step": 40092, "epoch": 954} {"train_loss": -5.699820518493652, "global_step": 40093, "epoch": 954} {"train_loss": -5.457648277282715, "global_step": 40094, "epoch": 954} {"train_loss": -5.657710075378418, "global_step": 40095, "epoch": 954} {"train_loss": -5.620560646057129, "global_step": 40096, "epoch": 954} {"train_loss": -5.560799598693848, "global_step": 40097, "epoch": 954} {"train_loss": -5.567636489868164, "global_step": 40098, "epoch": 954} {"train_loss": -5.6637444496154785, "global_step": 40099, "epoch": 954} {"train_loss": -5.650640964508057, "global_step": 40100, "epoch": 954} {"train_loss": -5.583117485046387, "global_step": 40101, "epoch": 954} {"train_loss": -5.637086868286133, "global_step": 40102, "epoch": 954} {"train_loss": -5.608351230621338, "global_step": 40103, "epoch": 954} {"train_loss": -5.627248764038086, "global_step": 40104, "epoch": 954} {"train_loss": -5.6059441566467285, "global_step": 40105, "epoch": 954} {"train_loss": -5.610496520996094, "global_step": 40106, "epoch": 954} {"train_loss": -5.442487716674805, "global_step": 40107, "epoch": 954} {"train_loss": -5.525781154632568, "global_step": 40108, "epoch": 954} {"train_loss": -5.581044662566412, "global_step": 40109, "epoch": 954, "val_loss": 74554.921875} {"train_loss": -5.449009895324707, "global_step": 40110, "epoch": 955} {"train_loss": -5.581630229949951, "global_step": 40111, "epoch": 955} {"train_loss": -5.5690741539001465, "global_step": 40112, "epoch": 955} {"train_loss": -5.514072418212891, "global_step": 40113, "epoch": 955} {"train_loss": -5.51978874206543, "global_step": 40114, "epoch": 955} {"train_loss": -5.529206275939941, "global_step": 40115, "epoch": 955} {"train_loss": -5.5745368003845215, "global_step": 40116, "epoch": 955} {"train_loss": -5.688742160797119, "global_step": 40117, "epoch": 955} {"train_loss": -5.7462687492370605, "global_step": 40118, "epoch": 955} {"train_loss": -5.695785045623779, "global_step": 40119, "epoch": 955} {"train_loss": -5.553287506103516, "global_step": 40120, "epoch": 955} {"train_loss": -5.658760070800781, "global_step": 40121, "epoch": 955} {"train_loss": -5.47075891494751, "global_step": 40122, "epoch": 955} {"train_loss": -5.719412326812744, "global_step": 40123, "epoch": 955} {"train_loss": -5.4583892822265625, "global_step": 40124, "epoch": 955} {"train_loss": -5.620891094207764, "global_step": 40125, "epoch": 955} {"train_loss": -5.615365982055664, "global_step": 40126, "epoch": 955} {"train_loss": -5.649454116821289, "global_step": 40127, "epoch": 955} {"train_loss": -5.647309303283691, "global_step": 40128, "epoch": 955} {"train_loss": -5.684051513671875, "global_step": 40129, "epoch": 955} {"train_loss": -5.566156387329102, "global_step": 40130, "epoch": 955} {"train_loss": -5.690237998962402, "global_step": 40131, "epoch": 955} {"train_loss": -5.7060866355896, "global_step": 40132, "epoch": 955} {"train_loss": -5.578963279724121, "global_step": 40133, "epoch": 955} {"train_loss": -5.794418811798096, "global_step": 40134, "epoch": 955} {"train_loss": -5.764996528625488, "global_step": 40135, "epoch": 955} {"train_loss": -5.564897537231445, "global_step": 40136, "epoch": 955} {"train_loss": -5.716442108154297, "global_step": 40137, "epoch": 955} {"train_loss": -5.5272626876831055, "global_step": 40138, "epoch": 955} {"train_loss": -5.558113098144531, "global_step": 40139, "epoch": 955} {"train_loss": -5.582540512084961, "global_step": 40140, "epoch": 955} {"train_loss": -5.652412414550781, "global_step": 40141, "epoch": 955} {"train_loss": -5.6150007247924805, "global_step": 40142, "epoch": 955} {"train_loss": -5.54917049407959, "global_step": 40143, "epoch": 955} {"train_loss": -5.499876022338867, "global_step": 40144, "epoch": 955} {"train_loss": -5.655652046203613, "global_step": 40145, "epoch": 955} {"train_loss": -5.668636322021484, "global_step": 40146, "epoch": 955} {"train_loss": -5.561027526855469, "global_step": 40147, "epoch": 955} {"train_loss": -5.505004405975342, "global_step": 40148, "epoch": 955} {"train_loss": -5.743117332458496, "global_step": 40149, "epoch": 955} {"train_loss": -5.524669170379639, "global_step": 40150, "epoch": 955} {"train_loss": -5.605459304082961, "global_step": 40151, "epoch": 955, "val_loss": 73921.828125} {"train_loss": -5.594264984130859, "global_step": 40152, "epoch": 956} {"train_loss": -5.561443328857422, "global_step": 40153, "epoch": 956} {"train_loss": -5.517894744873047, "global_step": 40154, "epoch": 956} {"train_loss": -5.629927158355713, "global_step": 40155, "epoch": 956} {"train_loss": -5.634436130523682, "global_step": 40156, "epoch": 956} {"train_loss": -5.6573076248168945, "global_step": 40157, "epoch": 956} {"train_loss": -5.776267051696777, "global_step": 40158, "epoch": 956} {"train_loss": -5.613265514373779, "global_step": 40159, "epoch": 956} {"train_loss": -5.595693111419678, "global_step": 40160, "epoch": 956} {"train_loss": -5.64554500579834, "global_step": 40161, "epoch": 956} {"train_loss": -5.609269142150879, "global_step": 40162, "epoch": 956} {"train_loss": -5.631175994873047, "global_step": 40163, "epoch": 956} {"train_loss": -5.567269325256348, "global_step": 40164, "epoch": 956} {"train_loss": -5.641355037689209, "global_step": 40165, "epoch": 956} {"train_loss": -5.57830810546875, "global_step": 40166, "epoch": 956} {"train_loss": -5.696674823760986, "global_step": 40167, "epoch": 956} {"train_loss": -5.590146064758301, "global_step": 40168, "epoch": 956} {"train_loss": -5.535198211669922, "global_step": 40169, "epoch": 956} {"train_loss": -5.60990047454834, "global_step": 40170, "epoch": 956} {"train_loss": -5.550657749176025, "global_step": 40171, "epoch": 956} {"train_loss": -5.530911922454834, "global_step": 40172, "epoch": 956} {"train_loss": -5.622735977172852, "global_step": 40173, "epoch": 956} {"train_loss": -5.582011699676514, "global_step": 40174, "epoch": 956} {"train_loss": -5.68165397644043, "global_step": 40175, "epoch": 956} {"train_loss": -5.629284858703613, "global_step": 40176, "epoch": 956} {"train_loss": -5.57799768447876, "global_step": 40177, "epoch": 956} {"train_loss": -5.7792744636535645, "global_step": 40178, "epoch": 956} {"train_loss": -5.69011926651001, "global_step": 40179, "epoch": 956} {"train_loss": -5.7036590576171875, "global_step": 40180, "epoch": 956} {"train_loss": -5.671429634094238, "global_step": 40181, "epoch": 956} {"train_loss": -5.55088472366333, "global_step": 40182, "epoch": 956} {"train_loss": -5.680794715881348, "global_step": 40183, "epoch": 956} {"train_loss": -5.736525058746338, "global_step": 40184, "epoch": 956} {"train_loss": -5.634517669677734, "global_step": 40185, "epoch": 956} {"train_loss": -5.675807952880859, "global_step": 40186, "epoch": 956} {"train_loss": -5.683300971984863, "global_step": 40187, "epoch": 956} {"train_loss": -5.6649980545043945, "global_step": 40188, "epoch": 956} {"train_loss": -5.696749687194824, "global_step": 40189, "epoch": 956} {"train_loss": -5.662806034088135, "global_step": 40190, "epoch": 956} {"train_loss": -5.59963321685791, "global_step": 40191, "epoch": 956} {"train_loss": -5.651792526245117, "global_step": 40192, "epoch": 956} {"train_loss": -5.630929129464286, "global_step": 40193, "epoch": 956, "val_loss": 74371.71875} {"train_loss": -5.748861789703369, "global_step": 40194, "epoch": 957} {"train_loss": -5.599402904510498, "global_step": 40195, "epoch": 957} {"train_loss": -5.566650390625, "global_step": 40196, "epoch": 957} {"train_loss": -5.625385284423828, "global_step": 40197, "epoch": 957} {"train_loss": -5.6244893074035645, "global_step": 40198, "epoch": 957} {"train_loss": -5.711671352386475, "global_step": 40199, "epoch": 957} {"train_loss": -5.565840721130371, "global_step": 40200, "epoch": 957} {"train_loss": -5.676548957824707, "global_step": 40201, "epoch": 957} {"train_loss": -5.820167541503906, "global_step": 40202, "epoch": 957} {"train_loss": -5.732532978057861, "global_step": 40203, "epoch": 957} {"train_loss": -5.618027687072754, "global_step": 40204, "epoch": 957} {"train_loss": -5.673792362213135, "global_step": 40205, "epoch": 957} {"train_loss": -5.654871463775635, "global_step": 40206, "epoch": 957} {"train_loss": -5.713294506072998, "global_step": 40207, "epoch": 957} {"train_loss": -5.656805038452148, "global_step": 40208, "epoch": 957} {"train_loss": -5.733458042144775, "global_step": 40209, "epoch": 957} {"train_loss": -5.531889915466309, "global_step": 40210, "epoch": 957} {"train_loss": -5.683367729187012, "global_step": 40211, "epoch": 957} {"train_loss": -5.6737871170043945, "global_step": 40212, "epoch": 957} {"train_loss": -5.5449395179748535, "global_step": 40213, "epoch": 957} {"train_loss": -5.601377010345459, "global_step": 40214, "epoch": 957} {"train_loss": -5.578939437866211, "global_step": 40215, "epoch": 957} {"train_loss": -5.661925315856934, "global_step": 40216, "epoch": 957} {"train_loss": -5.722076416015625, "global_step": 40217, "epoch": 957} {"train_loss": -5.671394348144531, "global_step": 40218, "epoch": 957} {"train_loss": -5.682585716247559, "global_step": 40219, "epoch": 957} {"train_loss": -5.671424388885498, "global_step": 40220, "epoch": 957} {"train_loss": -5.579715728759766, "global_step": 40221, "epoch": 957} {"train_loss": -5.57349967956543, "global_step": 40222, "epoch": 957} {"train_loss": -5.642956733703613, "global_step": 40223, "epoch": 957} {"train_loss": -5.600296497344971, "global_step": 40224, "epoch": 957} {"train_loss": -5.6169328689575195, "global_step": 40225, "epoch": 957} {"train_loss": -5.668570041656494, "global_step": 40226, "epoch": 957} {"train_loss": -5.665852069854736, "global_step": 40227, "epoch": 957} {"train_loss": -5.458081245422363, "global_step": 40228, "epoch": 957} {"train_loss": -5.699091911315918, "global_step": 40229, "epoch": 957} {"train_loss": -5.713717460632324, "global_step": 40230, "epoch": 957} {"train_loss": -5.573604583740234, "global_step": 40231, "epoch": 957} {"train_loss": -5.584057331085205, "global_step": 40232, "epoch": 957} {"train_loss": -5.622884750366211, "global_step": 40233, "epoch": 957} {"train_loss": -5.78452205657959, "global_step": 40234, "epoch": 957} {"train_loss": -5.650176547822499, "global_step": 40235, "epoch": 957, "val_loss": 74144.140625} {"train_loss": -5.788331031799316, "global_step": 40236, "epoch": 958} {"train_loss": -5.691366195678711, "global_step": 40237, "epoch": 958} {"train_loss": -5.5486345291137695, "global_step": 40238, "epoch": 958} {"train_loss": -5.6274847984313965, "global_step": 40239, "epoch": 958} {"train_loss": -5.569336891174316, "global_step": 40240, "epoch": 958} {"train_loss": -5.769983768463135, "global_step": 40241, "epoch": 958} {"train_loss": -5.535053253173828, "global_step": 40242, "epoch": 958} {"train_loss": -5.661435127258301, "global_step": 40243, "epoch": 958} {"train_loss": -5.582796573638916, "global_step": 40244, "epoch": 958} {"train_loss": -5.6075897216796875, "global_step": 40245, "epoch": 958} {"train_loss": -5.631591320037842, "global_step": 40246, "epoch": 958} {"train_loss": -5.6050333976745605, "global_step": 40247, "epoch": 958} {"train_loss": -5.767709255218506, "global_step": 40248, "epoch": 958} {"train_loss": -5.577878952026367, "global_step": 40249, "epoch": 958} {"train_loss": -5.578115463256836, "global_step": 40250, "epoch": 958} {"train_loss": -5.652441024780273, "global_step": 40251, "epoch": 958} {"train_loss": -5.533416748046875, "global_step": 40252, "epoch": 958} {"train_loss": -5.57047176361084, "global_step": 40253, "epoch": 958} {"train_loss": -5.608664512634277, "global_step": 40254, "epoch": 958} {"train_loss": -5.508770942687988, "global_step": 40255, "epoch": 958} {"train_loss": -5.572781085968018, "global_step": 40256, "epoch": 958} {"train_loss": -5.460612773895264, "global_step": 40257, "epoch": 958} {"train_loss": -5.631634712219238, "global_step": 40258, "epoch": 958} {"train_loss": -5.551869869232178, "global_step": 40259, "epoch": 958} {"train_loss": -5.511914253234863, "global_step": 40260, "epoch": 958} {"train_loss": -5.548711776733398, "global_step": 40261, "epoch": 958} {"train_loss": -5.415079116821289, "global_step": 40262, "epoch": 958} {"train_loss": -5.583146572113037, "global_step": 40263, "epoch": 958} {"train_loss": -5.652708053588867, "global_step": 40264, "epoch": 958} {"train_loss": -5.625381946563721, "global_step": 40265, "epoch": 958} {"train_loss": -5.656182289123535, "global_step": 40266, "epoch": 958} {"train_loss": -5.5270867347717285, "global_step": 40267, "epoch": 958} {"train_loss": -5.576403617858887, "global_step": 40268, "epoch": 958} {"train_loss": -5.625208854675293, "global_step": 40269, "epoch": 958} {"train_loss": -5.648669242858887, "global_step": 40270, "epoch": 958} {"train_loss": -5.61618709564209, "global_step": 40271, "epoch": 958} {"train_loss": -5.727853775024414, "global_step": 40272, "epoch": 958} {"train_loss": -5.68047571182251, "global_step": 40273, "epoch": 958} {"train_loss": -5.584184646606445, "global_step": 40274, "epoch": 958} {"train_loss": -5.663152694702148, "global_step": 40275, "epoch": 958} {"train_loss": -5.605782508850098, "global_step": 40276, "epoch": 958} {"train_loss": -5.606367111206055, "global_step": 40277, "epoch": 958, "val_loss": 73894.7109375} {"train_loss": -5.575051307678223, "global_step": 40278, "epoch": 959} {"train_loss": -5.662262916564941, "global_step": 40279, "epoch": 959} {"train_loss": -5.631937026977539, "global_step": 40280, "epoch": 959} {"train_loss": -5.517770290374756, "global_step": 40281, "epoch": 959} {"train_loss": -5.7992634773254395, "global_step": 40282, "epoch": 959} {"train_loss": -5.663251876831055, "global_step": 40283, "epoch": 959} {"train_loss": -5.5892333984375, "global_step": 40284, "epoch": 959} {"train_loss": -5.6681809425354, "global_step": 40285, "epoch": 959} {"train_loss": -5.686882972717285, "global_step": 40286, "epoch": 959} {"train_loss": -5.568513870239258, "global_step": 40287, "epoch": 959} {"train_loss": -5.759342670440674, "global_step": 40288, "epoch": 959} {"train_loss": -5.77913761138916, "global_step": 40289, "epoch": 959} {"train_loss": -5.632926940917969, "global_step": 40290, "epoch": 959} {"train_loss": -5.565606117248535, "global_step": 40291, "epoch": 959} {"train_loss": -5.652977466583252, "global_step": 40292, "epoch": 959} {"train_loss": -5.651131629943848, "global_step": 40293, "epoch": 959} {"train_loss": -5.687156677246094, "global_step": 40294, "epoch": 959} {"train_loss": -5.661623001098633, "global_step": 40295, "epoch": 959} {"train_loss": -5.54094123840332, "global_step": 40296, "epoch": 959} {"train_loss": -5.627557754516602, "global_step": 40297, "epoch": 959} {"train_loss": -5.705460548400879, "global_step": 40298, "epoch": 959} {"train_loss": -5.710319519042969, "global_step": 40299, "epoch": 959} {"train_loss": -5.591220378875732, "global_step": 40300, "epoch": 959} {"train_loss": -5.575084686279297, "global_step": 40301, "epoch": 959} {"train_loss": -5.682226181030273, "global_step": 40302, "epoch": 959} {"train_loss": -5.4176130294799805, "global_step": 40303, "epoch": 959} {"train_loss": -5.722672462463379, "global_step": 40304, "epoch": 959} {"train_loss": -5.5396528244018555, "global_step": 40305, "epoch": 959} {"train_loss": -5.4383392333984375, "global_step": 40306, "epoch": 959} {"train_loss": -5.621234893798828, "global_step": 40307, "epoch": 959} {"train_loss": -5.521554946899414, "global_step": 40308, "epoch": 959} {"train_loss": -5.675368309020996, "global_step": 40309, "epoch": 959} {"train_loss": -5.598672866821289, "global_step": 40310, "epoch": 959} {"train_loss": -5.476674556732178, "global_step": 40311, "epoch": 959} {"train_loss": -5.5230817794799805, "global_step": 40312, "epoch": 959} {"train_loss": -5.5261359214782715, "global_step": 40313, "epoch": 959} {"train_loss": -5.7083940505981445, "global_step": 40314, "epoch": 959} {"train_loss": -5.539805889129639, "global_step": 40315, "epoch": 959} {"train_loss": -5.534680366516113, "global_step": 40316, "epoch": 959} {"train_loss": -5.541623592376709, "global_step": 40317, "epoch": 959} {"train_loss": -5.65287971496582, "global_step": 40318, "epoch": 959} {"train_loss": -5.615371522449312, "global_step": 40319, "epoch": 959, "val_loss": 74083.578125} {"train_loss": -5.702210903167725, "global_step": 40320, "epoch": 960} {"train_loss": -5.582019805908203, "global_step": 40321, "epoch": 960} {"train_loss": -5.56567907333374, "global_step": 40322, "epoch": 960} {"train_loss": -5.738068580627441, "global_step": 40323, "epoch": 960} {"train_loss": -5.605740547180176, "global_step": 40324, "epoch": 960} {"train_loss": -5.634567737579346, "global_step": 40325, "epoch": 960} {"train_loss": -5.547359466552734, "global_step": 40326, "epoch": 960} {"train_loss": -5.704460620880127, "global_step": 40327, "epoch": 960} {"train_loss": -5.608325481414795, "global_step": 40328, "epoch": 960} {"train_loss": -5.587686538696289, "global_step": 40329, "epoch": 960} {"train_loss": -5.551334381103516, "global_step": 40330, "epoch": 960} {"train_loss": -5.601346969604492, "global_step": 40331, "epoch": 960} {"train_loss": -5.744866847991943, "global_step": 40332, "epoch": 960} {"train_loss": -5.644366264343262, "global_step": 40333, "epoch": 960} {"train_loss": -5.590967178344727, "global_step": 40334, "epoch": 960} {"train_loss": -5.638716697692871, "global_step": 40335, "epoch": 960} {"train_loss": -5.477302551269531, "global_step": 40336, "epoch": 960} {"train_loss": -5.569430828094482, "global_step": 40337, "epoch": 960} {"train_loss": -5.6875529289245605, "global_step": 40338, "epoch": 960} {"train_loss": -5.559444904327393, "global_step": 40339, "epoch": 960} {"train_loss": -5.642589569091797, "global_step": 40340, "epoch": 960} {"train_loss": -5.505299091339111, "global_step": 40341, "epoch": 960} {"train_loss": -5.649475574493408, "global_step": 40342, "epoch": 960} {"train_loss": -5.680228233337402, "global_step": 40343, "epoch": 960} {"train_loss": -5.611562728881836, "global_step": 40344, "epoch": 960} {"train_loss": -5.628973960876465, "global_step": 40345, "epoch": 960} {"train_loss": -5.782468318939209, "global_step": 40346, "epoch": 960} {"train_loss": -5.636039733886719, "global_step": 40347, "epoch": 960} {"train_loss": -5.614220142364502, "global_step": 40348, "epoch": 960} {"train_loss": -5.665633678436279, "global_step": 40349, "epoch": 960} {"train_loss": -5.647261142730713, "global_step": 40350, "epoch": 960} {"train_loss": -5.705849647521973, "global_step": 40351, "epoch": 960} {"train_loss": -5.611927032470703, "global_step": 40352, "epoch": 960} {"train_loss": -5.680363178253174, "global_step": 40353, "epoch": 960} {"train_loss": -5.735400199890137, "global_step": 40354, "epoch": 960} {"train_loss": -5.537105560302734, "global_step": 40355, "epoch": 960} {"train_loss": -5.535170555114746, "global_step": 40356, "epoch": 960} {"train_loss": -5.66578483581543, "global_step": 40357, "epoch": 960} {"train_loss": -5.634524822235107, "global_step": 40358, "epoch": 960} {"train_loss": -5.595954895019531, "global_step": 40359, "epoch": 960} {"train_loss": -5.687780857086182, "global_step": 40360, "epoch": 960} {"train_loss": -5.6309645402999156, "global_step": 40361, "epoch": 960, "val_loss": 73695.3984375} {"train_loss": -5.634743690490723, "global_step": 40362, "epoch": 961} {"train_loss": -5.559680938720703, "global_step": 40363, "epoch": 961} {"train_loss": -5.647334098815918, "global_step": 40364, "epoch": 961} {"train_loss": -5.617693901062012, "global_step": 40365, "epoch": 961} {"train_loss": -5.841121673583984, "global_step": 40366, "epoch": 961} {"train_loss": -5.6422271728515625, "global_step": 40367, "epoch": 961} {"train_loss": -5.704465866088867, "global_step": 40368, "epoch": 961} {"train_loss": -5.502595901489258, "global_step": 40369, "epoch": 961} {"train_loss": -5.692626476287842, "global_step": 40370, "epoch": 961} {"train_loss": -5.739435195922852, "global_step": 40371, "epoch": 961} {"train_loss": -5.734159469604492, "global_step": 40372, "epoch": 961} {"train_loss": -5.781147003173828, "global_step": 40373, "epoch": 961} {"train_loss": -5.727675437927246, "global_step": 40374, "epoch": 961} {"train_loss": -5.578214645385742, "global_step": 40375, "epoch": 961} {"train_loss": -5.686100006103516, "global_step": 40376, "epoch": 961} {"train_loss": -5.731369495391846, "global_step": 40377, "epoch": 961} {"train_loss": -5.552837371826172, "global_step": 40378, "epoch": 961} {"train_loss": -5.498643398284912, "global_step": 40379, "epoch": 961} {"train_loss": -5.562551498413086, "global_step": 40380, "epoch": 961} {"train_loss": -5.539341926574707, "global_step": 40381, "epoch": 961} {"train_loss": -5.680666923522949, "global_step": 40382, "epoch": 961} {"train_loss": -5.525750160217285, "global_step": 40383, "epoch": 961} {"train_loss": -5.667858123779297, "global_step": 40384, "epoch": 961} {"train_loss": -5.584920883178711, "global_step": 40385, "epoch": 961} {"train_loss": -5.52083158493042, "global_step": 40386, "epoch": 961} {"train_loss": -5.554727554321289, "global_step": 40387, "epoch": 961} {"train_loss": -5.634003639221191, "global_step": 40388, "epoch": 961} {"train_loss": -5.686444282531738, "global_step": 40389, "epoch": 961} {"train_loss": -5.560296058654785, "global_step": 40390, "epoch": 961} {"train_loss": -5.686584949493408, "global_step": 40391, "epoch": 961} {"train_loss": -5.610725402832031, "global_step": 40392, "epoch": 961} {"train_loss": -5.6625285148620605, "global_step": 40393, "epoch": 961} {"train_loss": -5.704479217529297, "global_step": 40394, "epoch": 961} {"train_loss": -5.555306434631348, "global_step": 40395, "epoch": 961} {"train_loss": -5.564697742462158, "global_step": 40396, "epoch": 961} {"train_loss": -5.69799280166626, "global_step": 40397, "epoch": 961} {"train_loss": -5.576849937438965, "global_step": 40398, "epoch": 961} {"train_loss": -5.601604461669922, "global_step": 40399, "epoch": 961} {"train_loss": -5.669866561889648, "global_step": 40400, "epoch": 961} {"train_loss": -5.60984992980957, "global_step": 40401, "epoch": 961} {"train_loss": -5.63526725769043, "global_step": 40402, "epoch": 961} {"train_loss": -5.635728029977708, "global_step": 40403, "epoch": 961, "val_loss": 74086.640625} {"train_loss": -5.631619930267334, "global_step": 40404, "epoch": 962} {"train_loss": -5.697805881500244, "global_step": 40405, "epoch": 962} {"train_loss": -5.4632391929626465, "global_step": 40406, "epoch": 962} {"train_loss": -5.528136730194092, "global_step": 40407, "epoch": 962} {"train_loss": -5.567861557006836, "global_step": 40408, "epoch": 962} {"train_loss": -5.6785736083984375, "global_step": 40409, "epoch": 962} {"train_loss": -5.571126461029053, "global_step": 40410, "epoch": 962} {"train_loss": -5.72268009185791, "global_step": 40411, "epoch": 962} {"train_loss": -5.509413242340088, "global_step": 40412, "epoch": 962} {"train_loss": -5.59108304977417, "global_step": 40413, "epoch": 962} {"train_loss": -5.672833442687988, "global_step": 40414, "epoch": 962} {"train_loss": -5.55534553527832, "global_step": 40415, "epoch": 962} {"train_loss": -5.618899822235107, "global_step": 40416, "epoch": 962} {"train_loss": -5.53970193862915, "global_step": 40417, "epoch": 962} {"train_loss": -5.71980094909668, "global_step": 40418, "epoch": 962} {"train_loss": -5.519351005554199, "global_step": 40419, "epoch": 962} {"train_loss": -5.584955215454102, "global_step": 40420, "epoch": 962} {"train_loss": -5.6102094650268555, "global_step": 40421, "epoch": 962} {"train_loss": -5.570910453796387, "global_step": 40422, "epoch": 962} {"train_loss": -5.612217903137207, "global_step": 40423, "epoch": 962} {"train_loss": -5.710701942443848, "global_step": 40424, "epoch": 962} {"train_loss": -5.477551460266113, "global_step": 40425, "epoch": 962} {"train_loss": -5.622195243835449, "global_step": 40426, "epoch": 962} {"train_loss": -5.643712043762207, "global_step": 40427, "epoch": 962} {"train_loss": -5.604428291320801, "global_step": 40428, "epoch": 962} {"train_loss": -5.59214448928833, "global_step": 40429, "epoch": 962} {"train_loss": -5.635190963745117, "global_step": 40430, "epoch": 962} {"train_loss": -5.678946495056152, "global_step": 40431, "epoch": 962} {"train_loss": -5.653738021850586, "global_step": 40432, "epoch": 962} {"train_loss": -5.549480438232422, "global_step": 40433, "epoch": 962} {"train_loss": -5.81241512298584, "global_step": 40434, "epoch": 962} {"train_loss": -5.520790100097656, "global_step": 40435, "epoch": 962} {"train_loss": -5.597560882568359, "global_step": 40436, "epoch": 962} {"train_loss": -5.532294750213623, "global_step": 40437, "epoch": 962} {"train_loss": -5.540908336639404, "global_step": 40438, "epoch": 962} {"train_loss": -5.641383171081543, "global_step": 40439, "epoch": 962} {"train_loss": -5.593805313110352, "global_step": 40440, "epoch": 962} {"train_loss": -5.601277828216553, "global_step": 40441, "epoch": 962} {"train_loss": -5.667054176330566, "global_step": 40442, "epoch": 962} {"train_loss": -5.503762245178223, "global_step": 40443, "epoch": 962} {"train_loss": -5.648312091827393, "global_step": 40444, "epoch": 962} {"train_loss": -5.604517334983463, "global_step": 40445, "epoch": 962, "val_loss": 74507.5546875} {"train_loss": -5.630523204803467, "global_step": 40446, "epoch": 963} {"train_loss": -5.554999351501465, "global_step": 40447, "epoch": 963} {"train_loss": -5.720993995666504, "global_step": 40448, "epoch": 963} {"train_loss": -5.62791633605957, "global_step": 40449, "epoch": 963} {"train_loss": -5.632614612579346, "global_step": 40450, "epoch": 963} {"train_loss": -5.8255157470703125, "global_step": 40451, "epoch": 963} {"train_loss": -5.527002334594727, "global_step": 40452, "epoch": 963} {"train_loss": -5.642825603485107, "global_step": 40453, "epoch": 963} {"train_loss": -5.697836875915527, "global_step": 40454, "epoch": 963} {"train_loss": -5.555336952209473, "global_step": 40455, "epoch": 963} {"train_loss": -5.790395736694336, "global_step": 40456, "epoch": 963} {"train_loss": -5.636672019958496, "global_step": 40457, "epoch": 963} {"train_loss": -5.537947177886963, "global_step": 40458, "epoch": 963} {"train_loss": -5.765514373779297, "global_step": 40459, "epoch": 963} {"train_loss": -5.614160060882568, "global_step": 40460, "epoch": 963} {"train_loss": -5.716092109680176, "global_step": 40461, "epoch": 963} {"train_loss": -5.656404972076416, "global_step": 40462, "epoch": 963} {"train_loss": -5.530374526977539, "global_step": 40463, "epoch": 963} {"train_loss": -5.647354602813721, "global_step": 40464, "epoch": 963} {"train_loss": -5.691413879394531, "global_step": 40465, "epoch": 963} {"train_loss": -5.675074577331543, "global_step": 40466, "epoch": 963} {"train_loss": -5.6588454246521, "global_step": 40467, "epoch": 963} {"train_loss": -5.721881866455078, "global_step": 40468, "epoch": 963} {"train_loss": -5.610267162322998, "global_step": 40469, "epoch": 963} {"train_loss": -5.537444114685059, "global_step": 40470, "epoch": 963} {"train_loss": -5.626209259033203, "global_step": 40471, "epoch": 963} {"train_loss": -5.747007846832275, "global_step": 40472, "epoch": 963} {"train_loss": -5.596009254455566, "global_step": 40473, "epoch": 963} {"train_loss": -5.680202484130859, "global_step": 40474, "epoch": 963} {"train_loss": -5.5338335037231445, "global_step": 40475, "epoch": 963} {"train_loss": -5.509463787078857, "global_step": 40476, "epoch": 963} {"train_loss": -5.567300319671631, "global_step": 40477, "epoch": 963} {"train_loss": -5.459134101867676, "global_step": 40478, "epoch": 963} {"train_loss": -5.627179145812988, "global_step": 40479, "epoch": 963} {"train_loss": -5.4686126708984375, "global_step": 40480, "epoch": 963} {"train_loss": -5.588533401489258, "global_step": 40481, "epoch": 963} {"train_loss": -5.7257080078125, "global_step": 40482, "epoch": 963} {"train_loss": -5.7176008224487305, "global_step": 40483, "epoch": 963} {"train_loss": -5.608498573303223, "global_step": 40484, "epoch": 963} {"train_loss": -5.669452667236328, "global_step": 40485, "epoch": 963} {"train_loss": -5.658329963684082, "global_step": 40486, "epoch": 963} {"train_loss": -5.632428975332351, "global_step": 40487, "epoch": 963, "val_loss": 74164.3359375} {"train_loss": -5.584026336669922, "global_step": 40488, "epoch": 964} {"train_loss": -5.544974327087402, "global_step": 40489, "epoch": 964} {"train_loss": -5.611312389373779, "global_step": 40490, "epoch": 964} {"train_loss": -5.616701126098633, "global_step": 40491, "epoch": 964} {"train_loss": -5.753488540649414, "global_step": 40492, "epoch": 964} {"train_loss": -5.528312683105469, "global_step": 40493, "epoch": 964} {"train_loss": -5.695368766784668, "global_step": 40494, "epoch": 964} {"train_loss": -5.569451332092285, "global_step": 40495, "epoch": 964} {"train_loss": -5.726548671722412, "global_step": 40496, "epoch": 964} {"train_loss": -5.611000061035156, "global_step": 40497, "epoch": 964} {"train_loss": -5.552400588989258, "global_step": 40498, "epoch": 964} {"train_loss": -5.6766862869262695, "global_step": 40499, "epoch": 964} {"train_loss": -5.570581436157227, "global_step": 40500, "epoch": 964} {"train_loss": -5.83962345123291, "global_step": 40501, "epoch": 964} {"train_loss": -5.724405288696289, "global_step": 40502, "epoch": 964} {"train_loss": -5.564162254333496, "global_step": 40503, "epoch": 964} {"train_loss": -5.593454837799072, "global_step": 40504, "epoch": 964} {"train_loss": -5.655115604400635, "global_step": 40505, "epoch": 964} {"train_loss": -5.555695533752441, "global_step": 40506, "epoch": 964} {"train_loss": -5.637812614440918, "global_step": 40507, "epoch": 964} {"train_loss": -5.705194473266602, "global_step": 40508, "epoch": 964} {"train_loss": -5.6889848709106445, "global_step": 40509, "epoch": 964} {"train_loss": -5.717685699462891, "global_step": 40510, "epoch": 964} {"train_loss": -5.680291175842285, "global_step": 40511, "epoch": 964} {"train_loss": -5.566363334655762, "global_step": 40512, "epoch": 964} {"train_loss": -5.559538841247559, "global_step": 40513, "epoch": 964} {"train_loss": -5.649105548858643, "global_step": 40514, "epoch": 964} {"train_loss": -5.560144424438477, "global_step": 40515, "epoch": 964} {"train_loss": -5.667027473449707, "global_step": 40516, "epoch": 964} {"train_loss": -5.4855194091796875, "global_step": 40517, "epoch": 964} {"train_loss": -5.601223945617676, "global_step": 40518, "epoch": 964} {"train_loss": -5.601777076721191, "global_step": 40519, "epoch": 964} {"train_loss": -5.489326477050781, "global_step": 40520, "epoch": 964} {"train_loss": -5.73037052154541, "global_step": 40521, "epoch": 964} {"train_loss": -5.597115516662598, "global_step": 40522, "epoch": 964} {"train_loss": -5.707610130310059, "global_step": 40523, "epoch": 964} {"train_loss": -5.569126129150391, "global_step": 40524, "epoch": 964} {"train_loss": -5.58285665512085, "global_step": 40525, "epoch": 964} {"train_loss": -5.562463283538818, "global_step": 40526, "epoch": 964} {"train_loss": -5.584592342376709, "global_step": 40527, "epoch": 964} {"train_loss": -5.655295372009277, "global_step": 40528, "epoch": 964} {"train_loss": -5.625070481073289, "global_step": 40529, "epoch": 964, "val_loss": 74203.3828125} {"train_loss": -5.5431013107299805, "global_step": 40530, "epoch": 965} {"train_loss": -5.566531658172607, "global_step": 40531, "epoch": 965} {"train_loss": -5.6744537353515625, "global_step": 40532, "epoch": 965} {"train_loss": -5.643744468688965, "global_step": 40533, "epoch": 965} {"train_loss": -5.577073097229004, "global_step": 40534, "epoch": 965} {"train_loss": -5.730014801025391, "global_step": 40535, "epoch": 965} {"train_loss": -5.635152816772461, "global_step": 40536, "epoch": 965} {"train_loss": -5.6475114822387695, "global_step": 40537, "epoch": 965} {"train_loss": -5.622422218322754, "global_step": 40538, "epoch": 965} {"train_loss": -5.659651279449463, "global_step": 40539, "epoch": 965} {"train_loss": -5.5504350662231445, "global_step": 40540, "epoch": 965} {"train_loss": -5.483429908752441, "global_step": 40541, "epoch": 965} {"train_loss": -5.612796306610107, "global_step": 40542, "epoch": 965} {"train_loss": -5.616158485412598, "global_step": 40543, "epoch": 965} {"train_loss": -5.541345596313477, "global_step": 40544, "epoch": 965} {"train_loss": -5.645425319671631, "global_step": 40545, "epoch": 965} {"train_loss": -5.605085372924805, "global_step": 40546, "epoch": 965} {"train_loss": -5.597198486328125, "global_step": 40547, "epoch": 965} {"train_loss": -5.684506416320801, "global_step": 40548, "epoch": 965} {"train_loss": -5.655113220214844, "global_step": 40549, "epoch": 965} {"train_loss": -5.696506977081299, "global_step": 40550, "epoch": 965} {"train_loss": -5.782639503479004, "global_step": 40551, "epoch": 965} {"train_loss": -5.6124091148376465, "global_step": 40552, "epoch": 965} {"train_loss": -5.7721967697143555, "global_step": 40553, "epoch": 965} {"train_loss": -5.536680221557617, "global_step": 40554, "epoch": 965} {"train_loss": -5.613031387329102, "global_step": 40555, "epoch": 965} {"train_loss": -5.57687520980835, "global_step": 40556, "epoch": 965} {"train_loss": -5.585077285766602, "global_step": 40557, "epoch": 965} {"train_loss": -5.694643497467041, "global_step": 40558, "epoch": 965} {"train_loss": -5.683953762054443, "global_step": 40559, "epoch": 965} {"train_loss": -5.67665433883667, "global_step": 40560, "epoch": 965} {"train_loss": -5.720630645751953, "global_step": 40561, "epoch": 965} {"train_loss": -5.657681465148926, "global_step": 40562, "epoch": 965} {"train_loss": -5.594637870788574, "global_step": 40563, "epoch": 965} {"train_loss": -5.7116498947143555, "global_step": 40564, "epoch": 965} {"train_loss": -5.7699079513549805, "global_step": 40565, "epoch": 965} {"train_loss": -5.59273624420166, "global_step": 40566, "epoch": 965} {"train_loss": -5.704449653625488, "global_step": 40567, "epoch": 965} {"train_loss": -5.626218318939209, "global_step": 40568, "epoch": 965} {"train_loss": -5.608283996582031, "global_step": 40569, "epoch": 965} {"train_loss": -5.5219526290893555, "global_step": 40570, "epoch": 965} {"train_loss": -5.634702603022258, "global_step": 40571, "epoch": 965, "val_loss": 73819.8515625} {"train_loss": -5.722734451293945, "global_step": 40572, "epoch": 966} {"train_loss": -5.801301002502441, "global_step": 40573, "epoch": 966} {"train_loss": -5.605984687805176, "global_step": 40574, "epoch": 966} {"train_loss": -5.632116317749023, "global_step": 40575, "epoch": 966} {"train_loss": -5.666574001312256, "global_step": 40576, "epoch": 966} {"train_loss": -5.519420623779297, "global_step": 40577, "epoch": 966} {"train_loss": -5.737028121948242, "global_step": 40578, "epoch": 966} {"train_loss": -5.666506767272949, "global_step": 40579, "epoch": 966} {"train_loss": -5.69033145904541, "global_step": 40580, "epoch": 966} {"train_loss": -5.750515937805176, "global_step": 40581, "epoch": 966} {"train_loss": -5.69880485534668, "global_step": 40582, "epoch": 966} {"train_loss": -5.660351753234863, "global_step": 40583, "epoch": 966} {"train_loss": -5.689765930175781, "global_step": 40584, "epoch": 966} {"train_loss": -5.617688179016113, "global_step": 40585, "epoch": 966} {"train_loss": -5.628542900085449, "global_step": 40586, "epoch": 966} {"train_loss": -5.557535171508789, "global_step": 40587, "epoch": 966} {"train_loss": -5.55021858215332, "global_step": 40588, "epoch": 966} {"train_loss": -5.687259674072266, "global_step": 40589, "epoch": 966} {"train_loss": -5.672353744506836, "global_step": 40590, "epoch": 966} {"train_loss": -5.6053361892700195, "global_step": 40591, "epoch": 966} {"train_loss": -5.717709064483643, "global_step": 40592, "epoch": 966} {"train_loss": -5.677985191345215, "global_step": 40593, "epoch": 966} {"train_loss": -5.66914701461792, "global_step": 40594, "epoch": 966} {"train_loss": -5.6243791580200195, "global_step": 40595, "epoch": 966} {"train_loss": -5.581753730773926, "global_step": 40596, "epoch": 966} {"train_loss": -5.611323356628418, "global_step": 40597, "epoch": 966} {"train_loss": -5.635709762573242, "global_step": 40598, "epoch": 966} {"train_loss": -5.703805923461914, "global_step": 40599, "epoch": 966} {"train_loss": -5.680050849914551, "global_step": 40600, "epoch": 966} {"train_loss": -5.66752815246582, "global_step": 40601, "epoch": 966} {"train_loss": -5.700582027435303, "global_step": 40602, "epoch": 966} {"train_loss": -5.628344535827637, "global_step": 40603, "epoch": 966} {"train_loss": -5.492297172546387, "global_step": 40604, "epoch": 966} {"train_loss": -5.689042091369629, "global_step": 40605, "epoch": 966} {"train_loss": -5.645989418029785, "global_step": 40606, "epoch": 966} {"train_loss": -5.548039436340332, "global_step": 40607, "epoch": 966} {"train_loss": -5.676272392272949, "global_step": 40608, "epoch": 966} {"train_loss": -5.591827869415283, "global_step": 40609, "epoch": 966} {"train_loss": -5.652257442474365, "global_step": 40610, "epoch": 966} {"train_loss": -5.504653453826904, "global_step": 40611, "epoch": 966} {"train_loss": -5.7136945724487305, "global_step": 40612, "epoch": 966} {"train_loss": -5.649877332505726, "global_step": 40613, "epoch": 966, "val_loss": 74241.0546875} {"train_loss": -5.505146026611328, "global_step": 40614, "epoch": 967} {"train_loss": -5.631426811218262, "global_step": 40615, "epoch": 967} {"train_loss": -5.495039939880371, "global_step": 40616, "epoch": 967} {"train_loss": -5.4510016441345215, "global_step": 40617, "epoch": 967} {"train_loss": -5.617727279663086, "global_step": 40618, "epoch": 967} {"train_loss": -5.41596794128418, "global_step": 40619, "epoch": 967} {"train_loss": -5.552186489105225, "global_step": 40620, "epoch": 967} {"train_loss": -5.61563777923584, "global_step": 40621, "epoch": 967} {"train_loss": -5.635750770568848, "global_step": 40622, "epoch": 967} {"train_loss": -5.614880084991455, "global_step": 40623, "epoch": 967} {"train_loss": -5.546871185302734, "global_step": 40624, "epoch": 967} {"train_loss": -5.603066921234131, "global_step": 40625, "epoch": 967} {"train_loss": -5.5361785888671875, "global_step": 40626, "epoch": 967} {"train_loss": -5.594438552856445, "global_step": 40627, "epoch": 967} {"train_loss": -5.716522216796875, "global_step": 40628, "epoch": 967} {"train_loss": -5.596329689025879, "global_step": 40629, "epoch": 967} {"train_loss": -5.652426719665527, "global_step": 40630, "epoch": 967} {"train_loss": -5.6879754066467285, "global_step": 40631, "epoch": 967} {"train_loss": -5.715511322021484, "global_step": 40632, "epoch": 967} {"train_loss": -5.71104621887207, "global_step": 40633, "epoch": 967} {"train_loss": -5.596356391906738, "global_step": 40634, "epoch": 967} {"train_loss": -5.7281389236450195, "global_step": 40635, "epoch": 967} {"train_loss": -5.501018524169922, "global_step": 40636, "epoch": 967} {"train_loss": -5.482996463775635, "global_step": 40637, "epoch": 967} {"train_loss": -5.496536731719971, "global_step": 40638, "epoch": 967} {"train_loss": -5.666633129119873, "global_step": 40639, "epoch": 967} {"train_loss": -5.680243492126465, "global_step": 40640, "epoch": 967} {"train_loss": -5.693071365356445, "global_step": 40641, "epoch": 967} {"train_loss": -5.609096050262451, "global_step": 40642, "epoch": 967} {"train_loss": -5.787109375, "global_step": 40643, "epoch": 967} {"train_loss": -5.721372604370117, "global_step": 40644, "epoch": 967} {"train_loss": -5.733004570007324, "global_step": 40645, "epoch": 967} {"train_loss": -5.74587345123291, "global_step": 40646, "epoch": 967} {"train_loss": -5.5977091789245605, "global_step": 40647, "epoch": 967} {"train_loss": -5.541883945465088, "global_step": 40648, "epoch": 967} {"train_loss": -5.751508712768555, "global_step": 40649, "epoch": 967} {"train_loss": -5.7317304611206055, "global_step": 40650, "epoch": 967} {"train_loss": -5.54954719543457, "global_step": 40651, "epoch": 967} {"train_loss": -5.661602020263672, "global_step": 40652, "epoch": 967} {"train_loss": -5.683143615722656, "global_step": 40653, "epoch": 967} {"train_loss": -5.67864990234375, "global_step": 40654, "epoch": 967} {"train_loss": -5.621730338959467, "global_step": 40655, "epoch": 967, "val_loss": 73832.0234375} {"train_loss": -5.574267864227295, "global_step": 40656, "epoch": 968} {"train_loss": -5.668946743011475, "global_step": 40657, "epoch": 968} {"train_loss": -5.688596725463867, "global_step": 40658, "epoch": 968} {"train_loss": -5.463362693786621, "global_step": 40659, "epoch": 968} {"train_loss": -5.83836555480957, "global_step": 40660, "epoch": 968} {"train_loss": -5.638557434082031, "global_step": 40661, "epoch": 968} {"train_loss": -5.630549430847168, "global_step": 40662, "epoch": 968} {"train_loss": -5.709693908691406, "global_step": 40663, "epoch": 968} {"train_loss": -5.610784530639648, "global_step": 40664, "epoch": 968} {"train_loss": -5.6743268966674805, "global_step": 40665, "epoch": 968} {"train_loss": -5.573950290679932, "global_step": 40666, "epoch": 968} {"train_loss": -5.5247321128845215, "global_step": 40667, "epoch": 968} {"train_loss": -5.619300842285156, "global_step": 40668, "epoch": 968} {"train_loss": -5.381686210632324, "global_step": 40669, "epoch": 968} {"train_loss": -5.725828647613525, "global_step": 40670, "epoch": 968} {"train_loss": -5.634451866149902, "global_step": 40671, "epoch": 968} {"train_loss": -5.484831809997559, "global_step": 40672, "epoch": 968} {"train_loss": -5.674009799957275, "global_step": 40673, "epoch": 968} {"train_loss": -5.609709739685059, "global_step": 40674, "epoch": 968} {"train_loss": -5.686356067657471, "global_step": 40675, "epoch": 968} {"train_loss": -5.556514739990234, "global_step": 40676, "epoch": 968} {"train_loss": -5.563706398010254, "global_step": 40677, "epoch": 968} {"train_loss": -5.650277137756348, "global_step": 40678, "epoch": 968} {"train_loss": -5.720078945159912, "global_step": 40679, "epoch": 968} {"train_loss": -5.650796413421631, "global_step": 40680, "epoch": 968} {"train_loss": -5.693789482116699, "global_step": 40681, "epoch": 968} {"train_loss": -5.743267059326172, "global_step": 40682, "epoch": 968} {"train_loss": -5.58930778503418, "global_step": 40683, "epoch": 968} {"train_loss": -5.721515655517578, "global_step": 40684, "epoch": 968} {"train_loss": -5.654651165008545, "global_step": 40685, "epoch": 968} {"train_loss": -5.507846832275391, "global_step": 40686, "epoch": 968} {"train_loss": -5.665029525756836, "global_step": 40687, "epoch": 968} {"train_loss": -5.667862892150879, "global_step": 40688, "epoch": 968} {"train_loss": -5.656063556671143, "global_step": 40689, "epoch": 968} {"train_loss": -5.621530055999756, "global_step": 40690, "epoch": 968} {"train_loss": -5.587215423583984, "global_step": 40691, "epoch": 968} {"train_loss": -5.492342472076416, "global_step": 40692, "epoch": 968} {"train_loss": -5.572030544281006, "global_step": 40693, "epoch": 968} {"train_loss": -5.692817687988281, "global_step": 40694, "epoch": 968} {"train_loss": -5.62299108505249, "global_step": 40695, "epoch": 968} {"train_loss": -5.655391693115234, "global_step": 40696, "epoch": 968} {"train_loss": -5.626285700570969, "global_step": 40697, "epoch": 968, "val_loss": 73550.859375} {"train_loss": -5.627577304840088, "global_step": 40698, "epoch": 969} {"train_loss": -5.657773017883301, "global_step": 40699, "epoch": 969} {"train_loss": -5.677022933959961, "global_step": 40700, "epoch": 969} {"train_loss": -5.6589884757995605, "global_step": 40701, "epoch": 969} {"train_loss": -5.740192890167236, "global_step": 40702, "epoch": 969} {"train_loss": -5.6674604415893555, "global_step": 40703, "epoch": 969} {"train_loss": -5.5974650382995605, "global_step": 40704, "epoch": 969} {"train_loss": -5.810914993286133, "global_step": 40705, "epoch": 969} {"train_loss": -5.765783786773682, "global_step": 40706, "epoch": 969} {"train_loss": -5.54428243637085, "global_step": 40707, "epoch": 969} {"train_loss": -5.637636184692383, "global_step": 40708, "epoch": 969} {"train_loss": -5.573919296264648, "global_step": 40709, "epoch": 969} {"train_loss": -5.7470598220825195, "global_step": 40710, "epoch": 969} {"train_loss": -5.671385765075684, "global_step": 40711, "epoch": 969} {"train_loss": -5.770791053771973, "global_step": 40712, "epoch": 969} {"train_loss": -5.626123905181885, "global_step": 40713, "epoch": 969} {"train_loss": -5.527871131896973, "global_step": 40714, "epoch": 969} {"train_loss": -5.456272125244141, "global_step": 40715, "epoch": 969} {"train_loss": -5.627785682678223, "global_step": 40716, "epoch": 969} {"train_loss": -5.6054768562316895, "global_step": 40717, "epoch": 969} {"train_loss": -5.569557189941406, "global_step": 40718, "epoch": 969} {"train_loss": -5.620177745819092, "global_step": 40719, "epoch": 969} {"train_loss": -5.50560188293457, "global_step": 40720, "epoch": 969} {"train_loss": -5.620063304901123, "global_step": 40721, "epoch": 969} {"train_loss": -5.577395439147949, "global_step": 40722, "epoch": 969} {"train_loss": -5.799889087677002, "global_step": 40723, "epoch": 969} {"train_loss": -5.657976150512695, "global_step": 40724, "epoch": 969} {"train_loss": -5.626465797424316, "global_step": 40725, "epoch": 969} {"train_loss": -5.554247856140137, "global_step": 40726, "epoch": 969} {"train_loss": -5.555694580078125, "global_step": 40727, "epoch": 969} {"train_loss": -5.649620532989502, "global_step": 40728, "epoch": 969} {"train_loss": -5.526229381561279, "global_step": 40729, "epoch": 969} {"train_loss": -5.627641201019287, "global_step": 40730, "epoch": 969} {"train_loss": -5.65689754486084, "global_step": 40731, "epoch": 969} {"train_loss": -5.70188570022583, "global_step": 40732, "epoch": 969} {"train_loss": -5.5979461669921875, "global_step": 40733, "epoch": 969} {"train_loss": -5.557419776916504, "global_step": 40734, "epoch": 969} {"train_loss": -5.601529121398926, "global_step": 40735, "epoch": 969} {"train_loss": -5.650991439819336, "global_step": 40736, "epoch": 969} {"train_loss": -5.495545387268066, "global_step": 40737, "epoch": 969} {"train_loss": -5.497865676879883, "global_step": 40738, "epoch": 969} {"train_loss": -5.629713217417399, "global_step": 40739, "epoch": 969, "val_loss": 73930.4765625} {"train_loss": -5.514397144317627, "global_step": 40740, "epoch": 970} {"train_loss": -5.617649078369141, "global_step": 40741, "epoch": 970} {"train_loss": -5.585244655609131, "global_step": 40742, "epoch": 970} {"train_loss": -5.530297756195068, "global_step": 40743, "epoch": 970} {"train_loss": -5.597173690795898, "global_step": 40744, "epoch": 970} {"train_loss": -5.556781768798828, "global_step": 40745, "epoch": 970} {"train_loss": -5.631346702575684, "global_step": 40746, "epoch": 970} {"train_loss": -5.652580261230469, "global_step": 40747, "epoch": 970} {"train_loss": -5.557440757751465, "global_step": 40748, "epoch": 970} {"train_loss": -5.776301383972168, "global_step": 40749, "epoch": 970} {"train_loss": -5.711097240447998, "global_step": 40750, "epoch": 970} {"train_loss": -5.697643756866455, "global_step": 40751, "epoch": 970} {"train_loss": -5.754341125488281, "global_step": 40752, "epoch": 970} {"train_loss": -5.607983589172363, "global_step": 40753, "epoch": 970} {"train_loss": -5.671102523803711, "global_step": 40754, "epoch": 970} {"train_loss": -5.7125349044799805, "global_step": 40755, "epoch": 970} {"train_loss": -5.767521858215332, "global_step": 40756, "epoch": 970} {"train_loss": -5.680970668792725, "global_step": 40757, "epoch": 970} {"train_loss": -5.576170921325684, "global_step": 40758, "epoch": 970} {"train_loss": -5.667294979095459, "global_step": 40759, "epoch": 970} {"train_loss": -5.666401386260986, "global_step": 40760, "epoch": 970} {"train_loss": -5.6188459396362305, "global_step": 40761, "epoch": 970} {"train_loss": -5.630585670471191, "global_step": 40762, "epoch": 970} {"train_loss": -5.485864162445068, "global_step": 40763, "epoch": 970} {"train_loss": -5.727230072021484, "global_step": 40764, "epoch": 970} {"train_loss": -5.672263145446777, "global_step": 40765, "epoch": 970} {"train_loss": -5.677538871765137, "global_step": 40766, "epoch": 970} {"train_loss": -5.5429911613464355, "global_step": 40767, "epoch": 970} {"train_loss": -5.770540714263916, "global_step": 40768, "epoch": 970} {"train_loss": -5.45849084854126, "global_step": 40769, "epoch": 970} {"train_loss": -5.685096740722656, "global_step": 40770, "epoch": 970} {"train_loss": -5.635871410369873, "global_step": 40771, "epoch": 970} {"train_loss": -5.653035640716553, "global_step": 40772, "epoch": 970} {"train_loss": -5.631119728088379, "global_step": 40773, "epoch": 970} {"train_loss": -5.542062282562256, "global_step": 40774, "epoch": 970} {"train_loss": -5.6041107177734375, "global_step": 40775, "epoch": 970} {"train_loss": -5.5239105224609375, "global_step": 40776, "epoch": 970} {"train_loss": -5.618200302124023, "global_step": 40777, "epoch": 970} {"train_loss": -5.532994747161865, "global_step": 40778, "epoch": 970} {"train_loss": -5.572206497192383, "global_step": 40779, "epoch": 970} {"train_loss": -5.628566741943359, "global_step": 40780, "epoch": 970} {"train_loss": -5.629072563988822, "global_step": 40781, "epoch": 970, "val_loss": 73883.75} {"train_loss": -5.577761650085449, "global_step": 40782, "epoch": 971} {"train_loss": -5.587789535522461, "global_step": 40783, "epoch": 971} {"train_loss": -5.692986488342285, "global_step": 40784, "epoch": 971} {"train_loss": -5.6392316818237305, "global_step": 40785, "epoch": 971} {"train_loss": -5.5988616943359375, "global_step": 40786, "epoch": 971} {"train_loss": -5.538024425506592, "global_step": 40787, "epoch": 971} {"train_loss": -5.674082279205322, "global_step": 40788, "epoch": 971} {"train_loss": -5.510889053344727, "global_step": 40789, "epoch": 971} {"train_loss": -5.641827583312988, "global_step": 40790, "epoch": 971} {"train_loss": -5.735381126403809, "global_step": 40791, "epoch": 971} {"train_loss": -5.6650190353393555, "global_step": 40792, "epoch": 971} {"train_loss": -5.6769256591796875, "global_step": 40793, "epoch": 971} {"train_loss": -5.639666557312012, "global_step": 40794, "epoch": 971} {"train_loss": -5.639591693878174, "global_step": 40795, "epoch": 971} {"train_loss": -5.542323112487793, "global_step": 40796, "epoch": 971} {"train_loss": -5.7235565185546875, "global_step": 40797, "epoch": 971} {"train_loss": -5.570069313049316, "global_step": 40798, "epoch": 971} {"train_loss": -5.646121978759766, "global_step": 40799, "epoch": 971} {"train_loss": -5.6109113693237305, "global_step": 40800, "epoch": 971} {"train_loss": -5.583823204040527, "global_step": 40801, "epoch": 971} {"train_loss": -5.527221202850342, "global_step": 40802, "epoch": 971} {"train_loss": -5.64263391494751, "global_step": 40803, "epoch": 971} {"train_loss": -5.596986770629883, "global_step": 40804, "epoch": 971} {"train_loss": -5.5028581619262695, "global_step": 40805, "epoch": 971} {"train_loss": -5.560009002685547, "global_step": 40806, "epoch": 971} {"train_loss": -5.544317245483398, "global_step": 40807, "epoch": 971} {"train_loss": -5.531188011169434, "global_step": 40808, "epoch": 971} {"train_loss": -5.649722099304199, "global_step": 40809, "epoch": 971} {"train_loss": -5.633916854858398, "global_step": 40810, "epoch": 971} {"train_loss": -5.657880783081055, "global_step": 40811, "epoch": 971} {"train_loss": -5.641741752624512, "global_step": 40812, "epoch": 971} {"train_loss": -5.5428619384765625, "global_step": 40813, "epoch": 971} {"train_loss": -5.672546863555908, "global_step": 40814, "epoch": 971} {"train_loss": -5.669370651245117, "global_step": 40815, "epoch": 971} {"train_loss": -5.602960586547852, "global_step": 40816, "epoch": 971} {"train_loss": -5.5749382972717285, "global_step": 40817, "epoch": 971} {"train_loss": -5.6695475578308105, "global_step": 40818, "epoch": 971} {"train_loss": -5.746462821960449, "global_step": 40819, "epoch": 971} {"train_loss": -5.606324195861816, "global_step": 40820, "epoch": 971} {"train_loss": -5.640318870544434, "global_step": 40821, "epoch": 971} {"train_loss": -5.76345157623291, "global_step": 40822, "epoch": 971} {"train_loss": -5.619961409341721, "global_step": 40823, "epoch": 971, "val_loss": 73853.109375} {"train_loss": -5.719168663024902, "global_step": 40824, "epoch": 972} {"train_loss": -5.673633575439453, "global_step": 40825, "epoch": 972} {"train_loss": -5.703945159912109, "global_step": 40826, "epoch": 972} {"train_loss": -5.529339790344238, "global_step": 40827, "epoch": 972} {"train_loss": -5.510678291320801, "global_step": 40828, "epoch": 972} {"train_loss": -5.683622360229492, "global_step": 40829, "epoch": 972} {"train_loss": -5.60636568069458, "global_step": 40830, "epoch": 972} {"train_loss": -5.620211124420166, "global_step": 40831, "epoch": 972} {"train_loss": -5.62911319732666, "global_step": 40832, "epoch": 972} {"train_loss": -5.62635612487793, "global_step": 40833, "epoch": 972} {"train_loss": -5.642303466796875, "global_step": 40834, "epoch": 972} {"train_loss": -5.717992782592773, "global_step": 40835, "epoch": 972} {"train_loss": -5.766324996948242, "global_step": 40836, "epoch": 972} {"train_loss": -5.656069755554199, "global_step": 40837, "epoch": 972} {"train_loss": -5.618705749511719, "global_step": 40838, "epoch": 972} {"train_loss": -5.601856231689453, "global_step": 40839, "epoch": 972} {"train_loss": -5.676209926605225, "global_step": 40840, "epoch": 972} {"train_loss": -5.562325954437256, "global_step": 40841, "epoch": 972} {"train_loss": -5.6134819984436035, "global_step": 40842, "epoch": 972} {"train_loss": -5.63719367980957, "global_step": 40843, "epoch": 972} {"train_loss": -5.625471591949463, "global_step": 40844, "epoch": 972} {"train_loss": -5.549380302429199, "global_step": 40845, "epoch": 972} {"train_loss": -5.681233882904053, "global_step": 40846, "epoch": 972} {"train_loss": -5.524493217468262, "global_step": 40847, "epoch": 972} {"train_loss": -5.644380569458008, "global_step": 40848, "epoch": 972} {"train_loss": -5.7685227394104, "global_step": 40849, "epoch": 972} {"train_loss": -5.617286205291748, "global_step": 40850, "epoch": 972} {"train_loss": -5.749048233032227, "global_step": 40851, "epoch": 972} {"train_loss": -5.623167037963867, "global_step": 40852, "epoch": 972} {"train_loss": -5.462248802185059, "global_step": 40853, "epoch": 972} {"train_loss": -5.64849853515625, "global_step": 40854, "epoch": 972} {"train_loss": -5.496213912963867, "global_step": 40855, "epoch": 972} {"train_loss": -5.489027500152588, "global_step": 40856, "epoch": 972} {"train_loss": -5.6041669845581055, "global_step": 40857, "epoch": 972} {"train_loss": -5.607601165771484, "global_step": 40858, "epoch": 972} {"train_loss": -5.5753326416015625, "global_step": 40859, "epoch": 972} {"train_loss": -5.50467586517334, "global_step": 40860, "epoch": 972} {"train_loss": -5.565919399261475, "global_step": 40861, "epoch": 972} {"train_loss": -5.638463020324707, "global_step": 40862, "epoch": 972} {"train_loss": -5.53456449508667, "global_step": 40863, "epoch": 972} {"train_loss": -5.641073226928711, "global_step": 40864, "epoch": 972} {"train_loss": -5.618361336844308, "global_step": 40865, "epoch": 972, "val_loss": 73956.9453125} {"train_loss": -5.561825752258301, "global_step": 40866, "epoch": 973} {"train_loss": -5.534834384918213, "global_step": 40867, "epoch": 973} {"train_loss": -5.560965061187744, "global_step": 40868, "epoch": 973} {"train_loss": -5.656300067901611, "global_step": 40869, "epoch": 973} {"train_loss": -5.471362590789795, "global_step": 40870, "epoch": 973} {"train_loss": -5.69630765914917, "global_step": 40871, "epoch": 973} {"train_loss": -5.566525459289551, "global_step": 40872, "epoch": 973} {"train_loss": -5.676065444946289, "global_step": 40873, "epoch": 973} {"train_loss": -5.542849063873291, "global_step": 40874, "epoch": 973} {"train_loss": -5.624643325805664, "global_step": 40875, "epoch": 973} {"train_loss": -5.6685686111450195, "global_step": 40876, "epoch": 973} {"train_loss": -5.479698657989502, "global_step": 40877, "epoch": 973} {"train_loss": -5.613183498382568, "global_step": 40878, "epoch": 973} {"train_loss": -5.600411415100098, "global_step": 40879, "epoch": 973} {"train_loss": -5.56939697265625, "global_step": 40880, "epoch": 973} {"train_loss": -5.567997932434082, "global_step": 40881, "epoch": 973} {"train_loss": -5.573559761047363, "global_step": 40882, "epoch": 973} {"train_loss": -5.49958610534668, "global_step": 40883, "epoch": 973} {"train_loss": -5.535218715667725, "global_step": 40884, "epoch": 973} {"train_loss": -5.758663177490234, "global_step": 40885, "epoch": 973} {"train_loss": -5.712615013122559, "global_step": 40886, "epoch": 973} {"train_loss": -5.621410369873047, "global_step": 40887, "epoch": 973} {"train_loss": -5.60532808303833, "global_step": 40888, "epoch": 973} {"train_loss": -5.5651350021362305, "global_step": 40889, "epoch": 973} {"train_loss": -5.638936996459961, "global_step": 40890, "epoch": 973} {"train_loss": -5.730822563171387, "global_step": 40891, "epoch": 973} {"train_loss": -5.759231090545654, "global_step": 40892, "epoch": 973} {"train_loss": -5.649700164794922, "global_step": 40893, "epoch": 973} {"train_loss": -5.634835243225098, "global_step": 40894, "epoch": 973} {"train_loss": -5.629119873046875, "global_step": 40895, "epoch": 973} {"train_loss": -5.659879684448242, "global_step": 40896, "epoch": 973} {"train_loss": -5.627006530761719, "global_step": 40897, "epoch": 973} {"train_loss": -5.77432918548584, "global_step": 40898, "epoch": 973} {"train_loss": -5.660499572753906, "global_step": 40899, "epoch": 973} {"train_loss": -5.633774757385254, "global_step": 40900, "epoch": 973} {"train_loss": -5.814531326293945, "global_step": 40901, "epoch": 973} {"train_loss": -5.741281509399414, "global_step": 40902, "epoch": 973} {"train_loss": -5.707655906677246, "global_step": 40903, "epoch": 973} {"train_loss": -5.556802272796631, "global_step": 40904, "epoch": 973} {"train_loss": -5.712618827819824, "global_step": 40905, "epoch": 973} {"train_loss": -5.5826921463012695, "global_step": 40906, "epoch": 973} {"train_loss": -5.628456070309594, "global_step": 40907, "epoch": 973, "val_loss": 74133.0} {"train_loss": -5.583878040313721, "global_step": 40908, "epoch": 974} {"train_loss": -5.811838150024414, "global_step": 40909, "epoch": 974} {"train_loss": -5.68701696395874, "global_step": 40910, "epoch": 974} {"train_loss": -5.5822882652282715, "global_step": 40911, "epoch": 974} {"train_loss": -5.627662181854248, "global_step": 40912, "epoch": 974} {"train_loss": -5.618329048156738, "global_step": 40913, "epoch": 974} {"train_loss": -5.6180524826049805, "global_step": 40914, "epoch": 974} {"train_loss": -5.59820032119751, "global_step": 40915, "epoch": 974} {"train_loss": -5.609530448913574, "global_step": 40916, "epoch": 974} {"train_loss": -5.671342849731445, "global_step": 40917, "epoch": 974} {"train_loss": -5.815411567687988, "global_step": 40918, "epoch": 974} {"train_loss": -5.691129684448242, "global_step": 40919, "epoch": 974} {"train_loss": -5.685985565185547, "global_step": 40920, "epoch": 974} {"train_loss": -5.67100715637207, "global_step": 40921, "epoch": 974} {"train_loss": -5.70216178894043, "global_step": 40922, "epoch": 974} {"train_loss": -5.682473659515381, "global_step": 40923, "epoch": 974} {"train_loss": -5.548093795776367, "global_step": 40924, "epoch": 974} {"train_loss": -5.552204132080078, "global_step": 40925, "epoch": 974} {"train_loss": -5.659317970275879, "global_step": 40926, "epoch": 974} {"train_loss": -5.594687461853027, "global_step": 40927, "epoch": 974} {"train_loss": -5.6803998947143555, "global_step": 40928, "epoch": 974} {"train_loss": -5.820184707641602, "global_step": 40929, "epoch": 974} {"train_loss": -5.620173454284668, "global_step": 40930, "epoch": 974} {"train_loss": -5.488504409790039, "global_step": 40931, "epoch": 974} {"train_loss": -5.593188285827637, "global_step": 40932, "epoch": 974} {"train_loss": -5.589787483215332, "global_step": 40933, "epoch": 974} {"train_loss": -5.7200751304626465, "global_step": 40934, "epoch": 974} {"train_loss": -5.615835189819336, "global_step": 40935, "epoch": 974} {"train_loss": -5.732736110687256, "global_step": 40936, "epoch": 974} {"train_loss": -5.85737419128418, "global_step": 40937, "epoch": 974} {"train_loss": -5.6116132736206055, "global_step": 40938, "epoch": 974} {"train_loss": -5.625925540924072, "global_step": 40939, "epoch": 974} {"train_loss": -5.67932653427124, "global_step": 40940, "epoch": 974} {"train_loss": -5.673145294189453, "global_step": 40941, "epoch": 974} {"train_loss": -5.630194187164307, "global_step": 40942, "epoch": 974} {"train_loss": -5.6256256103515625, "global_step": 40943, "epoch": 974} {"train_loss": -5.674236297607422, "global_step": 40944, "epoch": 974} {"train_loss": -5.720640182495117, "global_step": 40945, "epoch": 974} {"train_loss": -5.667505264282227, "global_step": 40946, "epoch": 974} {"train_loss": -5.583169937133789, "global_step": 40947, "epoch": 974} {"train_loss": -5.711993217468262, "global_step": 40948, "epoch": 974} {"train_loss": -5.65904578708467, "global_step": 40949, "epoch": 974, "val_loss": 74077.5859375} {"train_loss": -5.756460666656494, "global_step": 40950, "epoch": 975} {"train_loss": -5.70706844329834, "global_step": 40951, "epoch": 975} {"train_loss": -5.580706596374512, "global_step": 40952, "epoch": 975} {"train_loss": -5.651177883148193, "global_step": 40953, "epoch": 975} {"train_loss": -5.485282897949219, "global_step": 40954, "epoch": 975} {"train_loss": -5.613392353057861, "global_step": 40955, "epoch": 975} {"train_loss": -5.641490936279297, "global_step": 40956, "epoch": 975} {"train_loss": -5.62827205657959, "global_step": 40957, "epoch": 975} {"train_loss": -5.6757097244262695, "global_step": 40958, "epoch": 975} {"train_loss": -5.562164306640625, "global_step": 40959, "epoch": 975} {"train_loss": -5.702909469604492, "global_step": 40960, "epoch": 975} {"train_loss": -5.619966506958008, "global_step": 40961, "epoch": 975} {"train_loss": -5.610075950622559, "global_step": 40962, "epoch": 975} {"train_loss": -5.699329376220703, "global_step": 40963, "epoch": 975} {"train_loss": -5.844106197357178, "global_step": 40964, "epoch": 975} {"train_loss": -5.630481719970703, "global_step": 40965, "epoch": 975} {"train_loss": -5.712037563323975, "global_step": 40966, "epoch": 975} {"train_loss": -5.600263595581055, "global_step": 40967, "epoch": 975} {"train_loss": -5.703019142150879, "global_step": 40968, "epoch": 975} {"train_loss": -5.702790260314941, "global_step": 40969, "epoch": 975} {"train_loss": -5.527212142944336, "global_step": 40970, "epoch": 975} {"train_loss": -5.696501731872559, "global_step": 40971, "epoch": 975} {"train_loss": -5.545482635498047, "global_step": 40972, "epoch": 975} {"train_loss": -5.683125972747803, "global_step": 40973, "epoch": 975} {"train_loss": -5.545810699462891, "global_step": 40974, "epoch": 975} {"train_loss": -5.7197794914245605, "global_step": 40975, "epoch": 975} {"train_loss": -5.686748504638672, "global_step": 40976, "epoch": 975} {"train_loss": -5.70548152923584, "global_step": 40977, "epoch": 975} {"train_loss": -5.770734786987305, "global_step": 40978, "epoch": 975} {"train_loss": -5.598371982574463, "global_step": 40979, "epoch": 975} {"train_loss": -5.530559062957764, "global_step": 40980, "epoch": 975} {"train_loss": -5.667442321777344, "global_step": 40981, "epoch": 975} {"train_loss": -5.672472953796387, "global_step": 40982, "epoch": 975} {"train_loss": -5.649493217468262, "global_step": 40983, "epoch": 975} {"train_loss": -5.532266616821289, "global_step": 40984, "epoch": 975} {"train_loss": -5.598847389221191, "global_step": 40985, "epoch": 975} {"train_loss": -5.625877380371094, "global_step": 40986, "epoch": 975} {"train_loss": -5.6415019035339355, "global_step": 40987, "epoch": 975} {"train_loss": -5.75228214263916, "global_step": 40988, "epoch": 975} {"train_loss": -5.61793327331543, "global_step": 40989, "epoch": 975} {"train_loss": -5.757521629333496, "global_step": 40990, "epoch": 975} {"train_loss": -5.6496178195590065, "global_step": 40991, "epoch": 975, "val_loss": 73816.90625} {"train_loss": -5.467929840087891, "global_step": 40992, "epoch": 976} {"train_loss": -5.534263610839844, "global_step": 40993, "epoch": 976} {"train_loss": -5.529898643493652, "global_step": 40994, "epoch": 976} {"train_loss": -5.672883987426758, "global_step": 40995, "epoch": 976} {"train_loss": -5.57460880279541, "global_step": 40996, "epoch": 976} {"train_loss": -5.4056549072265625, "global_step": 40997, "epoch": 976} {"train_loss": -5.606545448303223, "global_step": 40998, "epoch": 976} {"train_loss": -5.754066467285156, "global_step": 40999, "epoch": 976} {"train_loss": -5.741354942321777, "global_step": 41000, "epoch": 976} {"train_loss": -5.695418357849121, "global_step": 41001, "epoch": 976} {"train_loss": -5.712403774261475, "global_step": 41002, "epoch": 976} {"train_loss": -5.749600410461426, "global_step": 41003, "epoch": 976} {"train_loss": -5.5904436111450195, "global_step": 41004, "epoch": 976} {"train_loss": -5.711750030517578, "global_step": 41005, "epoch": 976} {"train_loss": -5.678375244140625, "global_step": 41006, "epoch": 976} {"train_loss": -5.790446758270264, "global_step": 41007, "epoch": 976} {"train_loss": -5.548148155212402, "global_step": 41008, "epoch": 976} {"train_loss": -5.548251152038574, "global_step": 41009, "epoch": 976} {"train_loss": -5.677247524261475, "global_step": 41010, "epoch": 976} {"train_loss": -5.7481489181518555, "global_step": 41011, "epoch": 976} {"train_loss": -5.747817039489746, "global_step": 41012, "epoch": 976} {"train_loss": -5.737022399902344, "global_step": 41013, "epoch": 976} {"train_loss": -5.720370292663574, "global_step": 41014, "epoch": 976} {"train_loss": -5.700791358947754, "global_step": 41015, "epoch": 976} {"train_loss": -5.615469455718994, "global_step": 41016, "epoch": 976} {"train_loss": -5.669254302978516, "global_step": 41017, "epoch": 976} {"train_loss": -5.699160575866699, "global_step": 41018, "epoch": 976} {"train_loss": -5.641561031341553, "global_step": 41019, "epoch": 976} {"train_loss": -5.674596786499023, "global_step": 41020, "epoch": 976} {"train_loss": -5.646562576293945, "global_step": 41021, "epoch": 976} {"train_loss": -5.511765480041504, "global_step": 41022, "epoch": 976} {"train_loss": -5.640054225921631, "global_step": 41023, "epoch": 976} {"train_loss": -5.638267517089844, "global_step": 41024, "epoch": 976} {"train_loss": -5.511075973510742, "global_step": 41025, "epoch": 976} {"train_loss": -5.7113237380981445, "global_step": 41026, "epoch": 976} {"train_loss": -5.757694244384766, "global_step": 41027, "epoch": 976} {"train_loss": -5.711899757385254, "global_step": 41028, "epoch": 976} {"train_loss": -5.575470924377441, "global_step": 41029, "epoch": 976} {"train_loss": -5.627542495727539, "global_step": 41030, "epoch": 976} {"train_loss": -5.563807964324951, "global_step": 41031, "epoch": 976} {"train_loss": -5.611259460449219, "global_step": 41032, "epoch": 976} {"train_loss": -5.644711494445801, "global_step": 41033, "epoch": 976, "val_loss": 74109.859375} {"train_loss": -5.537246227264404, "global_step": 41034, "epoch": 977} {"train_loss": -5.774320602416992, "global_step": 41035, "epoch": 977} {"train_loss": -5.5851545333862305, "global_step": 41036, "epoch": 977} {"train_loss": -5.700202941894531, "global_step": 41037, "epoch": 977} {"train_loss": -5.650634765625, "global_step": 41038, "epoch": 977} {"train_loss": -5.670289993286133, "global_step": 41039, "epoch": 977} {"train_loss": -5.549718856811523, "global_step": 41040, "epoch": 977} {"train_loss": -5.617062568664551, "global_step": 41041, "epoch": 977} {"train_loss": -5.675738334655762, "global_step": 41042, "epoch": 977} {"train_loss": -5.657158851623535, "global_step": 41043, "epoch": 977} {"train_loss": -5.804786682128906, "global_step": 41044, "epoch": 977} {"train_loss": -5.677726745605469, "global_step": 41045, "epoch": 977} {"train_loss": -5.765712738037109, "global_step": 41046, "epoch": 977} {"train_loss": -5.67509126663208, "global_step": 41047, "epoch": 977} {"train_loss": -5.803554534912109, "global_step": 41048, "epoch": 977} {"train_loss": -5.609748840332031, "global_step": 41049, "epoch": 977} {"train_loss": -5.745415687561035, "global_step": 41050, "epoch": 977} {"train_loss": -5.487787246704102, "global_step": 41051, "epoch": 977} {"train_loss": -5.763686180114746, "global_step": 41052, "epoch": 977} {"train_loss": -5.605518341064453, "global_step": 41053, "epoch": 977} {"train_loss": -5.568499565124512, "global_step": 41054, "epoch": 977} {"train_loss": -5.519793510437012, "global_step": 41055, "epoch": 977} {"train_loss": -5.667278289794922, "global_step": 41056, "epoch": 977} {"train_loss": -5.495765686035156, "global_step": 41057, "epoch": 977} {"train_loss": -5.65141487121582, "global_step": 41058, "epoch": 977} {"train_loss": -5.525925636291504, "global_step": 41059, "epoch": 977} {"train_loss": -5.550772666931152, "global_step": 41060, "epoch": 977} {"train_loss": -5.701534748077393, "global_step": 41061, "epoch": 977} {"train_loss": -5.688371658325195, "global_step": 41062, "epoch": 977} {"train_loss": -5.481439590454102, "global_step": 41063, "epoch": 977} {"train_loss": -5.740505218505859, "global_step": 41064, "epoch": 977} {"train_loss": -5.523540496826172, "global_step": 41065, "epoch": 977} {"train_loss": -5.534275531768799, "global_step": 41066, "epoch": 977} {"train_loss": -5.7262749671936035, "global_step": 41067, "epoch": 977} {"train_loss": -5.694085121154785, "global_step": 41068, "epoch": 977} {"train_loss": -5.537633419036865, "global_step": 41069, "epoch": 977} {"train_loss": -5.645257949829102, "global_step": 41070, "epoch": 977} {"train_loss": -5.4538116455078125, "global_step": 41071, "epoch": 977} {"train_loss": -5.685400009155273, "global_step": 41072, "epoch": 977} {"train_loss": -5.647331714630127, "global_step": 41073, "epoch": 977} {"train_loss": -5.692257881164551, "global_step": 41074, "epoch": 977} {"train_loss": -5.635182755334037, "global_step": 41075, "epoch": 977, "val_loss": 73937.9375} {"train_loss": -5.717860221862793, "global_step": 41076, "epoch": 978} {"train_loss": -5.522092819213867, "global_step": 41077, "epoch": 978} {"train_loss": -5.676301002502441, "global_step": 41078, "epoch": 978} {"train_loss": -5.739978790283203, "global_step": 41079, "epoch": 978} {"train_loss": -5.595362663269043, "global_step": 41080, "epoch": 978} {"train_loss": -5.705608367919922, "global_step": 41081, "epoch": 978} {"train_loss": -5.631364822387695, "global_step": 41082, "epoch": 978} {"train_loss": -5.743813514709473, "global_step": 41083, "epoch": 978} {"train_loss": -5.6725687980651855, "global_step": 41084, "epoch": 978} {"train_loss": -5.617609977722168, "global_step": 41085, "epoch": 978} {"train_loss": -5.630326271057129, "global_step": 41086, "epoch": 978} {"train_loss": -5.6417717933654785, "global_step": 41087, "epoch": 978} {"train_loss": -5.740044116973877, "global_step": 41088, "epoch": 978} {"train_loss": -5.557363510131836, "global_step": 41089, "epoch": 978} {"train_loss": -5.625617027282715, "global_step": 41090, "epoch": 978} {"train_loss": -5.721003532409668, "global_step": 41091, "epoch": 978} {"train_loss": -5.529271602630615, "global_step": 41092, "epoch": 978} {"train_loss": -5.539305686950684, "global_step": 41093, "epoch": 978} {"train_loss": -5.522684574127197, "global_step": 41094, "epoch": 978} {"train_loss": -5.700173377990723, "global_step": 41095, "epoch": 978} {"train_loss": -5.625002861022949, "global_step": 41096, "epoch": 978} {"train_loss": -5.674027442932129, "global_step": 41097, "epoch": 978} {"train_loss": -5.57994270324707, "global_step": 41098, "epoch": 978} {"train_loss": -5.648656368255615, "global_step": 41099, "epoch": 978} {"train_loss": -5.589963912963867, "global_step": 41100, "epoch": 978} {"train_loss": -5.6904754638671875, "global_step": 41101, "epoch": 978} {"train_loss": -5.577955722808838, "global_step": 41102, "epoch": 978} {"train_loss": -5.545389175415039, "global_step": 41103, "epoch": 978} {"train_loss": -5.675281524658203, "global_step": 41104, "epoch": 978} {"train_loss": -5.546897888183594, "global_step": 41105, "epoch": 978} {"train_loss": -5.702470779418945, "global_step": 41106, "epoch": 978} {"train_loss": -5.643835067749023, "global_step": 41107, "epoch": 978} {"train_loss": -5.645936489105225, "global_step": 41108, "epoch": 978} {"train_loss": -5.45850944519043, "global_step": 41109, "epoch": 978} {"train_loss": -5.614121437072754, "global_step": 41110, "epoch": 978} {"train_loss": -5.683442115783691, "global_step": 41111, "epoch": 978} {"train_loss": -5.664717197418213, "global_step": 41112, "epoch": 978} {"train_loss": -5.626856327056885, "global_step": 41113, "epoch": 978} {"train_loss": -5.686337471008301, "global_step": 41114, "epoch": 978} {"train_loss": -5.631538391113281, "global_step": 41115, "epoch": 978} {"train_loss": -5.688705921173096, "global_step": 41116, "epoch": 978} {"train_loss": -5.636006309872582, "global_step": 41117, "epoch": 978, "val_loss": 73976.9375} {"train_loss": -5.656737327575684, "global_step": 41118, "epoch": 979} {"train_loss": -5.688425064086914, "global_step": 41119, "epoch": 979} {"train_loss": -5.629091739654541, "global_step": 41120, "epoch": 979} {"train_loss": -5.507654190063477, "global_step": 41121, "epoch": 979} {"train_loss": -5.66823148727417, "global_step": 41122, "epoch": 979} {"train_loss": -5.485409259796143, "global_step": 41123, "epoch": 979} {"train_loss": -5.734703063964844, "global_step": 41124, "epoch": 979} {"train_loss": -5.653717041015625, "global_step": 41125, "epoch": 979} {"train_loss": -5.5506181716918945, "global_step": 41126, "epoch": 979} {"train_loss": -5.733898162841797, "global_step": 41127, "epoch": 979} {"train_loss": -5.78515625, "global_step": 41128, "epoch": 979} {"train_loss": -5.5362324714660645, "global_step": 41129, "epoch": 979} {"train_loss": -5.621978759765625, "global_step": 41130, "epoch": 979} {"train_loss": -5.687045574188232, "global_step": 41131, "epoch": 979} {"train_loss": -5.770516872406006, "global_step": 41132, "epoch": 979} {"train_loss": -5.633568286895752, "global_step": 41133, "epoch": 979} {"train_loss": -5.568386554718018, "global_step": 41134, "epoch": 979} {"train_loss": -5.713083744049072, "global_step": 41135, "epoch": 979} {"train_loss": -5.6922688484191895, "global_step": 41136, "epoch": 979} {"train_loss": -5.658868312835693, "global_step": 41137, "epoch": 979} {"train_loss": -5.5071702003479, "global_step": 41138, "epoch": 979} {"train_loss": -5.641230583190918, "global_step": 41139, "epoch": 979} {"train_loss": -5.530536651611328, "global_step": 41140, "epoch": 979} {"train_loss": -5.590490341186523, "global_step": 41141, "epoch": 979} {"train_loss": -5.492883682250977, "global_step": 41142, "epoch": 979} {"train_loss": -5.706786155700684, "global_step": 41143, "epoch": 979} {"train_loss": -5.694975852966309, "global_step": 41144, "epoch": 979} {"train_loss": -5.743902206420898, "global_step": 41145, "epoch": 979} {"train_loss": -5.617208480834961, "global_step": 41146, "epoch": 979} {"train_loss": -5.6516618728637695, "global_step": 41147, "epoch": 979} {"train_loss": -5.598380088806152, "global_step": 41148, "epoch": 979} {"train_loss": -5.723056793212891, "global_step": 41149, "epoch": 979} {"train_loss": -5.609847068786621, "global_step": 41150, "epoch": 979} {"train_loss": -5.607911109924316, "global_step": 41151, "epoch": 979} {"train_loss": -5.532320499420166, "global_step": 41152, "epoch": 979} {"train_loss": -5.614591121673584, "global_step": 41153, "epoch": 979} {"train_loss": -5.635075569152832, "global_step": 41154, "epoch": 979} {"train_loss": -5.697805404663086, "global_step": 41155, "epoch": 979} {"train_loss": -5.635551929473877, "global_step": 41156, "epoch": 979} {"train_loss": -5.543673515319824, "global_step": 41157, "epoch": 979} {"train_loss": -5.689495086669922, "global_step": 41158, "epoch": 979} {"train_loss": -5.637314558029175, "global_step": 41159, "epoch": 979, "val_loss": 73990.1015625} {"train_loss": -5.716421127319336, "global_step": 41160, "epoch": 980} {"train_loss": -5.697835922241211, "global_step": 41161, "epoch": 980} {"train_loss": -5.589095115661621, "global_step": 41162, "epoch": 980} {"train_loss": -5.7166852951049805, "global_step": 41163, "epoch": 980} {"train_loss": -5.555230617523193, "global_step": 41164, "epoch": 980} {"train_loss": -5.7152509689331055, "global_step": 41165, "epoch": 980} {"train_loss": -5.698106288909912, "global_step": 41166, "epoch": 980} {"train_loss": -5.612300872802734, "global_step": 41167, "epoch": 980} {"train_loss": -5.655567169189453, "global_step": 41168, "epoch": 980} {"train_loss": -5.70257568359375, "global_step": 41169, "epoch": 980} {"train_loss": -5.57869291305542, "global_step": 41170, "epoch": 980} {"train_loss": -5.561829566955566, "global_step": 41171, "epoch": 980} {"train_loss": -5.622983932495117, "global_step": 41172, "epoch": 980} {"train_loss": -5.624783515930176, "global_step": 41173, "epoch": 980} {"train_loss": -5.65119743347168, "global_step": 41174, "epoch": 980} {"train_loss": -5.562320232391357, "global_step": 41175, "epoch": 980} {"train_loss": -5.6014556884765625, "global_step": 41176, "epoch": 980} {"train_loss": -5.560239315032959, "global_step": 41177, "epoch": 980} {"train_loss": -5.755861282348633, "global_step": 41178, "epoch": 980} {"train_loss": -5.530364036560059, "global_step": 41179, "epoch": 980} {"train_loss": -5.636032581329346, "global_step": 41180, "epoch": 980} {"train_loss": -5.67057991027832, "global_step": 41181, "epoch": 980} {"train_loss": -5.663874626159668, "global_step": 41182, "epoch": 980} {"train_loss": -5.538260459899902, "global_step": 41183, "epoch": 980} {"train_loss": -5.764011859893799, "global_step": 41184, "epoch": 980} {"train_loss": -5.475404739379883, "global_step": 41185, "epoch": 980} {"train_loss": -5.608293056488037, "global_step": 41186, "epoch": 980} {"train_loss": -5.669806480407715, "global_step": 41187, "epoch": 980} {"train_loss": -5.574369430541992, "global_step": 41188, "epoch": 980} {"train_loss": -5.689377784729004, "global_step": 41189, "epoch": 980} {"train_loss": -5.4633283615112305, "global_step": 41190, "epoch": 980} {"train_loss": -5.685074329376221, "global_step": 41191, "epoch": 980} {"train_loss": -5.548778533935547, "global_step": 41192, "epoch": 980} {"train_loss": -5.590934753417969, "global_step": 41193, "epoch": 980} {"train_loss": -5.494063854217529, "global_step": 41194, "epoch": 980} {"train_loss": -5.669898509979248, "global_step": 41195, "epoch": 980} {"train_loss": -5.557967185974121, "global_step": 41196, "epoch": 980} {"train_loss": -5.555994033813477, "global_step": 41197, "epoch": 980} {"train_loss": -5.510271072387695, "global_step": 41198, "epoch": 980} {"train_loss": -5.670698165893555, "global_step": 41199, "epoch": 980} {"train_loss": -5.686862945556641, "global_step": 41200, "epoch": 980} {"train_loss": -5.616585504441034, "global_step": 41201, "epoch": 980, "val_loss": 73782.6796875} {"train_loss": -5.678197383880615, "global_step": 41202, "epoch": 981} {"train_loss": -5.66726016998291, "global_step": 41203, "epoch": 981} {"train_loss": -5.68873405456543, "global_step": 41204, "epoch": 981} {"train_loss": -5.669891357421875, "global_step": 41205, "epoch": 981} {"train_loss": -5.535155773162842, "global_step": 41206, "epoch": 981} {"train_loss": -5.642316818237305, "global_step": 41207, "epoch": 981} {"train_loss": -5.563059329986572, "global_step": 41208, "epoch": 981} {"train_loss": -5.661345481872559, "global_step": 41209, "epoch": 981} {"train_loss": -5.621132850646973, "global_step": 41210, "epoch": 981} {"train_loss": -5.561758041381836, "global_step": 41211, "epoch": 981} {"train_loss": -5.6422576904296875, "global_step": 41212, "epoch": 981} {"train_loss": -5.644381999969482, "global_step": 41213, "epoch": 981} {"train_loss": -5.533047676086426, "global_step": 41214, "epoch": 981} {"train_loss": -5.6305718421936035, "global_step": 41215, "epoch": 981} {"train_loss": -5.665187835693359, "global_step": 41216, "epoch": 981} {"train_loss": -5.56055212020874, "global_step": 41217, "epoch": 981} {"train_loss": -5.5378618240356445, "global_step": 41218, "epoch": 981} {"train_loss": -5.529182434082031, "global_step": 41219, "epoch": 981} {"train_loss": -5.607120990753174, "global_step": 41220, "epoch": 981} {"train_loss": -5.471160888671875, "global_step": 41221, "epoch": 981} {"train_loss": -5.710444450378418, "global_step": 41222, "epoch": 981} {"train_loss": -5.572834014892578, "global_step": 41223, "epoch": 981} {"train_loss": -5.600621223449707, "global_step": 41224, "epoch": 981} {"train_loss": -5.6616058349609375, "global_step": 41225, "epoch": 981} {"train_loss": -5.589079856872559, "global_step": 41226, "epoch": 981} {"train_loss": -5.595447540283203, "global_step": 41227, "epoch": 981} {"train_loss": -5.676088809967041, "global_step": 41228, "epoch": 981} {"train_loss": -5.6391191482543945, "global_step": 41229, "epoch": 981} {"train_loss": -5.615016937255859, "global_step": 41230, "epoch": 981} {"train_loss": -5.581382751464844, "global_step": 41231, "epoch": 981} {"train_loss": -5.631134986877441, "global_step": 41232, "epoch": 981} {"train_loss": -5.681125164031982, "global_step": 41233, "epoch": 981} {"train_loss": -5.723430156707764, "global_step": 41234, "epoch": 981} {"train_loss": -5.694252014160156, "global_step": 41235, "epoch": 981} {"train_loss": -5.5675530433654785, "global_step": 41236, "epoch": 981} {"train_loss": -5.565577507019043, "global_step": 41237, "epoch": 981} {"train_loss": -5.6169633865356445, "global_step": 41238, "epoch": 981} {"train_loss": -5.685617446899414, "global_step": 41239, "epoch": 981} {"train_loss": -5.637788772583008, "global_step": 41240, "epoch": 981} {"train_loss": -5.728013038635254, "global_step": 41241, "epoch": 981} {"train_loss": -5.680459022521973, "global_step": 41242, "epoch": 981} {"train_loss": -5.622169426509312, "global_step": 41243, "epoch": 981, "val_loss": 73980.2421875} {"train_loss": -5.606409072875977, "global_step": 41244, "epoch": 982} {"train_loss": -5.610461235046387, "global_step": 41245, "epoch": 982} {"train_loss": -5.651862144470215, "global_step": 41246, "epoch": 982} {"train_loss": -5.761280536651611, "global_step": 41247, "epoch": 982} {"train_loss": -5.4987030029296875, "global_step": 41248, "epoch": 982} {"train_loss": -5.636442184448242, "global_step": 41249, "epoch": 982} {"train_loss": -5.653735160827637, "global_step": 41250, "epoch": 982} {"train_loss": -5.653197288513184, "global_step": 41251, "epoch": 982} {"train_loss": -5.604796409606934, "global_step": 41252, "epoch": 982} {"train_loss": -5.633656024932861, "global_step": 41253, "epoch": 982} {"train_loss": -5.63267183303833, "global_step": 41254, "epoch": 982} {"train_loss": -5.664760589599609, "global_step": 41255, "epoch": 982} {"train_loss": -5.718445777893066, "global_step": 41256, "epoch": 982} {"train_loss": -5.710700511932373, "global_step": 41257, "epoch": 982} {"train_loss": -5.712642669677734, "global_step": 41258, "epoch": 982} {"train_loss": -5.52910041809082, "global_step": 41259, "epoch": 982} {"train_loss": -5.741472244262695, "global_step": 41260, "epoch": 982} {"train_loss": -5.650763034820557, "global_step": 41261, "epoch": 982} {"train_loss": -5.566490650177002, "global_step": 41262, "epoch": 982} {"train_loss": -5.73883056640625, "global_step": 41263, "epoch": 982} {"train_loss": -5.657783031463623, "global_step": 41264, "epoch": 982} {"train_loss": -5.57822322845459, "global_step": 41265, "epoch": 982} {"train_loss": -5.5345354080200195, "global_step": 41266, "epoch": 982} {"train_loss": -5.7237749099731445, "global_step": 41267, "epoch": 982} {"train_loss": -5.47628927230835, "global_step": 41268, "epoch": 982} {"train_loss": -5.645824909210205, "global_step": 41269, "epoch": 982} {"train_loss": -5.493415355682373, "global_step": 41270, "epoch": 982} {"train_loss": -5.591517448425293, "global_step": 41271, "epoch": 982} {"train_loss": -5.746458053588867, "global_step": 41272, "epoch": 982} {"train_loss": -5.473127365112305, "global_step": 41273, "epoch": 982} {"train_loss": -5.616660118103027, "global_step": 41274, "epoch": 982} {"train_loss": -5.552260398864746, "global_step": 41275, "epoch": 982} {"train_loss": -5.739346981048584, "global_step": 41276, "epoch": 982} {"train_loss": -5.565607070922852, "global_step": 41277, "epoch": 982} {"train_loss": -5.70138692855835, "global_step": 41278, "epoch": 982} {"train_loss": -5.655081748962402, "global_step": 41279, "epoch": 982} {"train_loss": -5.638375282287598, "global_step": 41280, "epoch": 982} {"train_loss": -5.611004829406738, "global_step": 41281, "epoch": 982} {"train_loss": -5.61335563659668, "global_step": 41282, "epoch": 982} {"train_loss": -5.554001808166504, "global_step": 41283, "epoch": 982} {"train_loss": -5.608230113983154, "global_step": 41284, "epoch": 982} {"train_loss": -5.629837206431797, "global_step": 41285, "epoch": 982, "val_loss": 73947.2421875} {"train_loss": -5.648092269897461, "global_step": 41286, "epoch": 983} {"train_loss": -5.606965065002441, "global_step": 41287, "epoch": 983} {"train_loss": -5.650975227355957, "global_step": 41288, "epoch": 983} {"train_loss": -5.577325820922852, "global_step": 41289, "epoch": 983} {"train_loss": -5.84747314453125, "global_step": 41290, "epoch": 983} {"train_loss": -5.681092262268066, "global_step": 41291, "epoch": 983} {"train_loss": -5.711983680725098, "global_step": 41292, "epoch": 983} {"train_loss": -5.51917028427124, "global_step": 41293, "epoch": 983} {"train_loss": -5.688494682312012, "global_step": 41294, "epoch": 983} {"train_loss": -5.690396308898926, "global_step": 41295, "epoch": 983} {"train_loss": -5.604572296142578, "global_step": 41296, "epoch": 983} {"train_loss": -5.698610782623291, "global_step": 41297, "epoch": 983} {"train_loss": -5.706812858581543, "global_step": 41298, "epoch": 983} {"train_loss": -5.787624359130859, "global_step": 41299, "epoch": 983} {"train_loss": -5.694188594818115, "global_step": 41300, "epoch": 983} {"train_loss": -5.772449016571045, "global_step": 41301, "epoch": 983} {"train_loss": -5.514409065246582, "global_step": 41302, "epoch": 983} {"train_loss": -5.6407790184021, "global_step": 41303, "epoch": 983} {"train_loss": -5.6092119216918945, "global_step": 41304, "epoch": 983} {"train_loss": -5.649393558502197, "global_step": 41305, "epoch": 983} {"train_loss": -5.72578239440918, "global_step": 41306, "epoch": 983} {"train_loss": -5.61375617980957, "global_step": 41307, "epoch": 983} {"train_loss": -5.689021110534668, "global_step": 41308, "epoch": 983} {"train_loss": -5.548689842224121, "global_step": 41309, "epoch": 983} {"train_loss": -5.758537292480469, "global_step": 41310, "epoch": 983} {"train_loss": -5.614016532897949, "global_step": 41311, "epoch": 983} {"train_loss": -5.53434944152832, "global_step": 41312, "epoch": 983} {"train_loss": -5.734086036682129, "global_step": 41313, "epoch": 983} {"train_loss": -5.544909477233887, "global_step": 41314, "epoch": 983} {"train_loss": -5.459897041320801, "global_step": 41315, "epoch": 983} {"train_loss": -5.530466079711914, "global_step": 41316, "epoch": 983} {"train_loss": -5.408335208892822, "global_step": 41317, "epoch": 983} {"train_loss": -5.697995185852051, "global_step": 41318, "epoch": 983} {"train_loss": -5.737568378448486, "global_step": 41319, "epoch": 983} {"train_loss": -5.518431186676025, "global_step": 41320, "epoch": 983} {"train_loss": -5.629228115081787, "global_step": 41321, "epoch": 983} {"train_loss": -5.614802360534668, "global_step": 41322, "epoch": 983} {"train_loss": -5.735461711883545, "global_step": 41323, "epoch": 983} {"train_loss": -5.554696083068848, "global_step": 41324, "epoch": 983} {"train_loss": -5.604636192321777, "global_step": 41325, "epoch": 983} {"train_loss": -5.588710784912109, "global_step": 41326, "epoch": 983} {"train_loss": -5.638149159295218, "global_step": 41327, "epoch": 983, "val_loss": 74026.6328125} {"train_loss": -5.653630256652832, "global_step": 41328, "epoch": 984} {"train_loss": -5.659510612487793, "global_step": 41329, "epoch": 984} {"train_loss": -5.6039137840271, "global_step": 41330, "epoch": 984} {"train_loss": -5.714369773864746, "global_step": 41331, "epoch": 984} {"train_loss": -5.568609237670898, "global_step": 41332, "epoch": 984} {"train_loss": -5.685216903686523, "global_step": 41333, "epoch": 984} {"train_loss": -5.666393280029297, "global_step": 41334, "epoch": 984} {"train_loss": -5.740516662597656, "global_step": 41335, "epoch": 984} {"train_loss": -5.696451187133789, "global_step": 41336, "epoch": 984} {"train_loss": -5.648667812347412, "global_step": 41337, "epoch": 984} {"train_loss": -5.643923759460449, "global_step": 41338, "epoch": 984} {"train_loss": -5.719162940979004, "global_step": 41339, "epoch": 984} {"train_loss": -5.603449821472168, "global_step": 41340, "epoch": 984} {"train_loss": -5.609627723693848, "global_step": 41341, "epoch": 984} {"train_loss": -5.666888236999512, "global_step": 41342, "epoch": 984} {"train_loss": -5.756287097930908, "global_step": 41343, "epoch": 984} {"train_loss": -5.553130626678467, "global_step": 41344, "epoch": 984} {"train_loss": -5.723720550537109, "global_step": 41345, "epoch": 984} {"train_loss": -5.675337314605713, "global_step": 41346, "epoch": 984} {"train_loss": -5.671735763549805, "global_step": 41347, "epoch": 984} {"train_loss": -5.734503746032715, "global_step": 41348, "epoch": 984} {"train_loss": -5.704908847808838, "global_step": 41349, "epoch": 984} {"train_loss": -5.705049514770508, "global_step": 41350, "epoch": 984} {"train_loss": -5.756030559539795, "global_step": 41351, "epoch": 984} {"train_loss": -5.678747653961182, "global_step": 41352, "epoch": 984} {"train_loss": -5.6768598556518555, "global_step": 41353, "epoch": 984} {"train_loss": -5.735050678253174, "global_step": 41354, "epoch": 984} {"train_loss": -5.723232269287109, "global_step": 41355, "epoch": 984} {"train_loss": -5.641140937805176, "global_step": 41356, "epoch": 984} {"train_loss": -5.66339111328125, "global_step": 41357, "epoch": 984} {"train_loss": -5.692915916442871, "global_step": 41358, "epoch": 984} {"train_loss": -5.6947479248046875, "global_step": 41359, "epoch": 984} {"train_loss": -5.6014628410339355, "global_step": 41360, "epoch": 984} {"train_loss": -5.692844867706299, "global_step": 41361, "epoch": 984} {"train_loss": -5.576751232147217, "global_step": 41362, "epoch": 984} {"train_loss": -5.576267719268799, "global_step": 41363, "epoch": 984} {"train_loss": -5.690944671630859, "global_step": 41364, "epoch": 984} {"train_loss": -5.6673994064331055, "global_step": 41365, "epoch": 984} {"train_loss": -5.65190315246582, "global_step": 41366, "epoch": 984} {"train_loss": -5.652417182922363, "global_step": 41367, "epoch": 984} {"train_loss": -5.555385589599609, "global_step": 41368, "epoch": 984} {"train_loss": -5.6677219186510355, "global_step": 41369, "epoch": 984, "val_loss": 74080.7265625} {"train_loss": -5.697458267211914, "global_step": 41370, "epoch": 985} {"train_loss": -5.644961357116699, "global_step": 41371, "epoch": 985} {"train_loss": -5.717252731323242, "global_step": 41372, "epoch": 985} {"train_loss": -5.703132629394531, "global_step": 41373, "epoch": 985} {"train_loss": -5.5250959396362305, "global_step": 41374, "epoch": 985} {"train_loss": -5.618459701538086, "global_step": 41375, "epoch": 985} {"train_loss": -5.599769592285156, "global_step": 41376, "epoch": 985} {"train_loss": -5.605553150177002, "global_step": 41377, "epoch": 985} {"train_loss": -5.641227722167969, "global_step": 41378, "epoch": 985} {"train_loss": -5.399895668029785, "global_step": 41379, "epoch": 985} {"train_loss": -5.653036117553711, "global_step": 41380, "epoch": 985} {"train_loss": -5.561847686767578, "global_step": 41381, "epoch": 985} {"train_loss": -5.521529197692871, "global_step": 41382, "epoch": 985} {"train_loss": -5.58345890045166, "global_step": 41383, "epoch": 985} {"train_loss": -5.69439172744751, "global_step": 41384, "epoch": 985} {"train_loss": -5.447244167327881, "global_step": 41385, "epoch": 985} {"train_loss": -5.7197370529174805, "global_step": 41386, "epoch": 985} {"train_loss": -5.606637954711914, "global_step": 41387, "epoch": 985} {"train_loss": -5.555924892425537, "global_step": 41388, "epoch": 985} {"train_loss": -5.705683708190918, "global_step": 41389, "epoch": 985} {"train_loss": -5.684135913848877, "global_step": 41390, "epoch": 985} {"train_loss": -5.434634208679199, "global_step": 41391, "epoch": 985} {"train_loss": -5.633647918701172, "global_step": 41392, "epoch": 985} {"train_loss": -5.508397102355957, "global_step": 41393, "epoch": 985} {"train_loss": -5.647381782531738, "global_step": 41394, "epoch": 985} {"train_loss": -5.563010215759277, "global_step": 41395, "epoch": 985} {"train_loss": -5.706610679626465, "global_step": 41396, "epoch": 985} {"train_loss": -5.660252571105957, "global_step": 41397, "epoch": 985} {"train_loss": -5.580869674682617, "global_step": 41398, "epoch": 985} {"train_loss": -5.733058929443359, "global_step": 41399, "epoch": 985} {"train_loss": -5.549304008483887, "global_step": 41400, "epoch": 985} {"train_loss": -5.631986618041992, "global_step": 41401, "epoch": 985} {"train_loss": -5.505671977996826, "global_step": 41402, "epoch": 985} {"train_loss": -5.726024627685547, "global_step": 41403, "epoch": 985} {"train_loss": -5.63044548034668, "global_step": 41404, "epoch": 985} {"train_loss": -5.674137115478516, "global_step": 41405, "epoch": 985} {"train_loss": -5.5570268630981445, "global_step": 41406, "epoch": 985} {"train_loss": -5.6018290519714355, "global_step": 41407, "epoch": 985} {"train_loss": -5.591355800628662, "global_step": 41408, "epoch": 985} {"train_loss": -5.571488380432129, "global_step": 41409, "epoch": 985} {"train_loss": -5.611594200134277, "global_step": 41410, "epoch": 985} {"train_loss": -5.6121674832843595, "global_step": 41411, "epoch": 985, "val_loss": 74173.09375} {"train_loss": -5.801877975463867, "global_step": 41412, "epoch": 986} {"train_loss": -5.673681259155273, "global_step": 41413, "epoch": 986} {"train_loss": -5.60482120513916, "global_step": 41414, "epoch": 986} {"train_loss": -5.573995590209961, "global_step": 41415, "epoch": 986} {"train_loss": -5.665898323059082, "global_step": 41416, "epoch": 986} {"train_loss": -5.724253177642822, "global_step": 41417, "epoch": 986} {"train_loss": -5.662448883056641, "global_step": 41418, "epoch": 986} {"train_loss": -5.608334541320801, "global_step": 41419, "epoch": 986} {"train_loss": -5.798903465270996, "global_step": 41420, "epoch": 986} {"train_loss": -5.760862350463867, "global_step": 41421, "epoch": 986} {"train_loss": -5.623318672180176, "global_step": 41422, "epoch": 986} {"train_loss": -5.672451496124268, "global_step": 41423, "epoch": 986} {"train_loss": -5.566344261169434, "global_step": 41424, "epoch": 986} {"train_loss": -5.5528411865234375, "global_step": 41425, "epoch": 986} {"train_loss": -5.610000133514404, "global_step": 41426, "epoch": 986} {"train_loss": -5.6305365562438965, "global_step": 41427, "epoch": 986} {"train_loss": -5.573417663574219, "global_step": 41428, "epoch": 986} {"train_loss": -5.636114120483398, "global_step": 41429, "epoch": 986} {"train_loss": -5.707871437072754, "global_step": 41430, "epoch": 986} {"train_loss": -5.589067459106445, "global_step": 41431, "epoch": 986} {"train_loss": -5.6376190185546875, "global_step": 41432, "epoch": 986} {"train_loss": -5.590639114379883, "global_step": 41433, "epoch": 986} {"train_loss": -5.606954097747803, "global_step": 41434, "epoch": 986} {"train_loss": -5.568209648132324, "global_step": 41435, "epoch": 986} {"train_loss": -5.745813369750977, "global_step": 41436, "epoch": 986} {"train_loss": -5.7574687004089355, "global_step": 41437, "epoch": 986} {"train_loss": -5.640752792358398, "global_step": 41438, "epoch": 986} {"train_loss": -5.612424850463867, "global_step": 41439, "epoch": 986} {"train_loss": -5.573850631713867, "global_step": 41440, "epoch": 986} {"train_loss": -5.5725860595703125, "global_step": 41441, "epoch": 986} {"train_loss": -5.612800598144531, "global_step": 41442, "epoch": 986} {"train_loss": -5.669384002685547, "global_step": 41443, "epoch": 986} {"train_loss": -5.717798233032227, "global_step": 41444, "epoch": 986} {"train_loss": -5.531876087188721, "global_step": 41445, "epoch": 986} {"train_loss": -5.6588921546936035, "global_step": 41446, "epoch": 986} {"train_loss": -5.644754409790039, "global_step": 41447, "epoch": 986} {"train_loss": -5.60462760925293, "global_step": 41448, "epoch": 986} {"train_loss": -5.738502025604248, "global_step": 41449, "epoch": 986} {"train_loss": -5.828469753265381, "global_step": 41450, "epoch": 986} {"train_loss": -5.6547465324401855, "global_step": 41451, "epoch": 986} {"train_loss": -5.619868755340576, "global_step": 41452, "epoch": 986} {"train_loss": -5.651883942740304, "global_step": 41453, "epoch": 986, "val_loss": 73486.5859375} {"train_loss": -5.791688919067383, "global_step": 41454, "epoch": 987} {"train_loss": -5.638466835021973, "global_step": 41455, "epoch": 987} {"train_loss": -5.639486789703369, "global_step": 41456, "epoch": 987} {"train_loss": -5.648212432861328, "global_step": 41457, "epoch": 987} {"train_loss": -5.7267231941223145, "global_step": 41458, "epoch": 987} {"train_loss": -5.645435810089111, "global_step": 41459, "epoch": 987} {"train_loss": -5.701277732849121, "global_step": 41460, "epoch": 987} {"train_loss": -5.602877616882324, "global_step": 41461, "epoch": 987} {"train_loss": -5.684889793395996, "global_step": 41462, "epoch": 987} {"train_loss": -5.634361267089844, "global_step": 41463, "epoch": 987} {"train_loss": -5.689371109008789, "global_step": 41464, "epoch": 987} {"train_loss": -5.6681108474731445, "global_step": 41465, "epoch": 987} {"train_loss": -5.722292423248291, "global_step": 41466, "epoch": 987} {"train_loss": -5.619884967803955, "global_step": 41467, "epoch": 987} {"train_loss": -5.571067810058594, "global_step": 41468, "epoch": 987} {"train_loss": -5.687593460083008, "global_step": 41469, "epoch": 987} {"train_loss": -5.812317848205566, "global_step": 41470, "epoch": 987} {"train_loss": -5.616203784942627, "global_step": 41471, "epoch": 987} {"train_loss": -5.724787712097168, "global_step": 41472, "epoch": 987} {"train_loss": -5.7242536544799805, "global_step": 41473, "epoch": 987} {"train_loss": -5.64539909362793, "global_step": 41474, "epoch": 987} {"train_loss": -5.5599365234375, "global_step": 41475, "epoch": 987} {"train_loss": -5.679022312164307, "global_step": 41476, "epoch": 987} {"train_loss": -5.7085161209106445, "global_step": 41477, "epoch": 987} {"train_loss": -5.515647888183594, "global_step": 41478, "epoch": 987} {"train_loss": -5.796420574188232, "global_step": 41479, "epoch": 987} {"train_loss": -5.564236640930176, "global_step": 41480, "epoch": 987} {"train_loss": -5.691904544830322, "global_step": 41481, "epoch": 987} {"train_loss": -5.613515853881836, "global_step": 41482, "epoch": 987} {"train_loss": -5.751800537109375, "global_step": 41483, "epoch": 987} {"train_loss": -5.763576507568359, "global_step": 41484, "epoch": 987} {"train_loss": -5.719623565673828, "global_step": 41485, "epoch": 987} {"train_loss": -5.6911234855651855, "global_step": 41486, "epoch": 987} {"train_loss": -5.698508262634277, "global_step": 41487, "epoch": 987} {"train_loss": -5.61759614944458, "global_step": 41488, "epoch": 987} {"train_loss": -5.750975608825684, "global_step": 41489, "epoch": 987} {"train_loss": -5.650599956512451, "global_step": 41490, "epoch": 987} {"train_loss": -5.814605712890625, "global_step": 41491, "epoch": 987} {"train_loss": -5.634710311889648, "global_step": 41492, "epoch": 987} {"train_loss": -5.64818811416626, "global_step": 41493, "epoch": 987} {"train_loss": -5.731935977935791, "global_step": 41494, "epoch": 987} {"train_loss": -5.676335743495396, "global_step": 41495, "epoch": 987, "val_loss": 73736.6328125} {"train_loss": -5.8219523429870605, "global_step": 41496, "epoch": 988} {"train_loss": -5.69711971282959, "global_step": 41497, "epoch": 988} {"train_loss": -5.664689540863037, "global_step": 41498, "epoch": 988} {"train_loss": -5.7081499099731445, "global_step": 41499, "epoch": 988} {"train_loss": -5.626351833343506, "global_step": 41500, "epoch": 988} {"train_loss": -5.768280029296875, "global_step": 41501, "epoch": 988} {"train_loss": -5.717026710510254, "global_step": 41502, "epoch": 988} {"train_loss": -5.643573760986328, "global_step": 41503, "epoch": 988} {"train_loss": -5.680398941040039, "global_step": 41504, "epoch": 988} {"train_loss": -5.686766624450684, "global_step": 41505, "epoch": 988} {"train_loss": -5.693795204162598, "global_step": 41506, "epoch": 988} {"train_loss": -5.733241081237793, "global_step": 41507, "epoch": 988} {"train_loss": -5.574974060058594, "global_step": 41508, "epoch": 988} {"train_loss": -5.687633037567139, "global_step": 41509, "epoch": 988} {"train_loss": -5.643216609954834, "global_step": 41510, "epoch": 988} {"train_loss": -5.657814025878906, "global_step": 41511, "epoch": 988} {"train_loss": -5.53736686706543, "global_step": 41512, "epoch": 988} {"train_loss": -5.6627092361450195, "global_step": 41513, "epoch": 988} {"train_loss": -5.655683517456055, "global_step": 41514, "epoch": 988} {"train_loss": -5.813436508178711, "global_step": 41515, "epoch": 988} {"train_loss": -5.754185676574707, "global_step": 41516, "epoch": 988} {"train_loss": -5.681023120880127, "global_step": 41517, "epoch": 988} {"train_loss": -5.586399078369141, "global_step": 41518, "epoch": 988} {"train_loss": -5.780767440795898, "global_step": 41519, "epoch": 988} {"train_loss": -5.728595733642578, "global_step": 41520, "epoch": 988} {"train_loss": -5.6496405601501465, "global_step": 41521, "epoch": 988} {"train_loss": -5.74852991104126, "global_step": 41522, "epoch": 988} {"train_loss": -5.619178771972656, "global_step": 41523, "epoch": 988} {"train_loss": -5.65009069442749, "global_step": 41524, "epoch": 988} {"train_loss": -5.575747489929199, "global_step": 41525, "epoch": 988} {"train_loss": -5.707357406616211, "global_step": 41526, "epoch": 988} {"train_loss": -5.505214691162109, "global_step": 41527, "epoch": 988} {"train_loss": -5.610799789428711, "global_step": 41528, "epoch": 988} {"train_loss": -5.541018009185791, "global_step": 41529, "epoch": 988} {"train_loss": -5.579621315002441, "global_step": 41530, "epoch": 988} {"train_loss": -5.575224876403809, "global_step": 41531, "epoch": 988} {"train_loss": -5.685971260070801, "global_step": 41532, "epoch": 988} {"train_loss": -5.5854387283325195, "global_step": 41533, "epoch": 988} {"train_loss": -5.427947998046875, "global_step": 41534, "epoch": 988} {"train_loss": -5.709227561950684, "global_step": 41535, "epoch": 988} {"train_loss": -5.595902442932129, "global_step": 41536, "epoch": 988} {"train_loss": -5.657764673233032, "global_step": 41537, "epoch": 988, "val_loss": 74085.4140625} {"train_loss": -5.649934768676758, "global_step": 41538, "epoch": 989} {"train_loss": -5.672859191894531, "global_step": 41539, "epoch": 989} {"train_loss": -5.656149864196777, "global_step": 41540, "epoch": 989} {"train_loss": -5.594482421875, "global_step": 41541, "epoch": 989} {"train_loss": -5.742173671722412, "global_step": 41542, "epoch": 989} {"train_loss": -5.720955848693848, "global_step": 41543, "epoch": 989} {"train_loss": -5.718363285064697, "global_step": 41544, "epoch": 989} {"train_loss": -5.721198081970215, "global_step": 41545, "epoch": 989} {"train_loss": -5.7277936935424805, "global_step": 41546, "epoch": 989} {"train_loss": -5.694884300231934, "global_step": 41547, "epoch": 989} {"train_loss": -5.616114139556885, "global_step": 41548, "epoch": 989} {"train_loss": -5.626476287841797, "global_step": 41549, "epoch": 989} {"train_loss": -5.756534576416016, "global_step": 41550, "epoch": 989} {"train_loss": -5.531598091125488, "global_step": 41551, "epoch": 989} {"train_loss": -5.684069633483887, "global_step": 41552, "epoch": 989} {"train_loss": -5.522636413574219, "global_step": 41553, "epoch": 989} {"train_loss": -5.756330490112305, "global_step": 41554, "epoch": 989} {"train_loss": -5.478099822998047, "global_step": 41555, "epoch": 989} {"train_loss": -5.6383056640625, "global_step": 41556, "epoch": 989} {"train_loss": -5.6615376472473145, "global_step": 41557, "epoch": 989} {"train_loss": -5.8088812828063965, "global_step": 41558, "epoch": 989} {"train_loss": -5.6097211837768555, "global_step": 41559, "epoch": 989} {"train_loss": -5.642793655395508, "global_step": 41560, "epoch": 989} {"train_loss": -5.672993183135986, "global_step": 41561, "epoch": 989} {"train_loss": -5.620720386505127, "global_step": 41562, "epoch": 989} {"train_loss": -5.735867977142334, "global_step": 41563, "epoch": 989} {"train_loss": -5.6924848556518555, "global_step": 41564, "epoch": 989} {"train_loss": -5.662469387054443, "global_step": 41565, "epoch": 989} {"train_loss": -5.648749351501465, "global_step": 41566, "epoch": 989} {"train_loss": -5.537588596343994, "global_step": 41567, "epoch": 989} {"train_loss": -5.743854522705078, "global_step": 41568, "epoch": 989} {"train_loss": -5.558076858520508, "global_step": 41569, "epoch": 989} {"train_loss": -5.528690814971924, "global_step": 41570, "epoch": 989} {"train_loss": -5.6006669998168945, "global_step": 41571, "epoch": 989} {"train_loss": -5.603564739227295, "global_step": 41572, "epoch": 989} {"train_loss": -5.679774284362793, "global_step": 41573, "epoch": 989} {"train_loss": -5.682559013366699, "global_step": 41574, "epoch": 989} {"train_loss": -5.589259147644043, "global_step": 41575, "epoch": 989} {"train_loss": -5.805944442749023, "global_step": 41576, "epoch": 989} {"train_loss": -5.630436420440674, "global_step": 41577, "epoch": 989} {"train_loss": -5.495804786682129, "global_step": 41578, "epoch": 989} {"train_loss": -5.651438236236572, "global_step": 41579, "epoch": 989, "val_loss": 74034.6484375} {"train_loss": -5.638564586639404, "global_step": 41580, "epoch": 990} {"train_loss": -5.600246906280518, "global_step": 41581, "epoch": 990} {"train_loss": -5.768106460571289, "global_step": 41582, "epoch": 990} {"train_loss": -5.5205583572387695, "global_step": 41583, "epoch": 990} {"train_loss": -5.694380760192871, "global_step": 41584, "epoch": 990} {"train_loss": -5.790897369384766, "global_step": 41585, "epoch": 990} {"train_loss": -5.7312750816345215, "global_step": 41586, "epoch": 990} {"train_loss": -5.586798667907715, "global_step": 41587, "epoch": 990} {"train_loss": -5.768657207489014, "global_step": 41588, "epoch": 990} {"train_loss": -5.606050968170166, "global_step": 41589, "epoch": 990} {"train_loss": -5.6178297996521, "global_step": 41590, "epoch": 990} {"train_loss": -5.674202919006348, "global_step": 41591, "epoch": 990} {"train_loss": -5.60886287689209, "global_step": 41592, "epoch": 990} {"train_loss": -5.71990966796875, "global_step": 41593, "epoch": 990} {"train_loss": -5.556463241577148, "global_step": 41594, "epoch": 990} {"train_loss": -5.546401023864746, "global_step": 41595, "epoch": 990} {"train_loss": -5.7153706550598145, "global_step": 41596, "epoch": 990} {"train_loss": -5.572608947753906, "global_step": 41597, "epoch": 990} {"train_loss": -5.62824821472168, "global_step": 41598, "epoch": 990} {"train_loss": -5.673471927642822, "global_step": 41599, "epoch": 990} {"train_loss": -5.601315498352051, "global_step": 41600, "epoch": 990} {"train_loss": -5.734904766082764, "global_step": 41601, "epoch": 990} {"train_loss": -5.7230682373046875, "global_step": 41602, "epoch": 990} {"train_loss": -5.567094326019287, "global_step": 41603, "epoch": 990} {"train_loss": -5.576722145080566, "global_step": 41604, "epoch": 990} {"train_loss": -5.773018836975098, "global_step": 41605, "epoch": 990} {"train_loss": -5.590345859527588, "global_step": 41606, "epoch": 990} {"train_loss": -5.6229143142700195, "global_step": 41607, "epoch": 990} {"train_loss": -5.666001319885254, "global_step": 41608, "epoch": 990} {"train_loss": -5.6464080810546875, "global_step": 41609, "epoch": 990} {"train_loss": -5.760610103607178, "global_step": 41610, "epoch": 990} {"train_loss": -5.523016929626465, "global_step": 41611, "epoch": 990} {"train_loss": -5.663979530334473, "global_step": 41612, "epoch": 990} {"train_loss": -5.763210296630859, "global_step": 41613, "epoch": 990} {"train_loss": -5.710358142852783, "global_step": 41614, "epoch": 990} {"train_loss": -5.612442493438721, "global_step": 41615, "epoch": 990} {"train_loss": -5.673035144805908, "global_step": 41616, "epoch": 990} {"train_loss": -5.764196395874023, "global_step": 41617, "epoch": 990} {"train_loss": -5.588078022003174, "global_step": 41618, "epoch": 990} {"train_loss": -5.5432915687561035, "global_step": 41619, "epoch": 990} {"train_loss": -5.664223670959473, "global_step": 41620, "epoch": 990} {"train_loss": -5.650996798560733, "global_step": 41621, "epoch": 990, "val_loss": 73773.578125} {"train_loss": -5.698493957519531, "global_step": 41622, "epoch": 991} {"train_loss": -5.768438339233398, "global_step": 41623, "epoch": 991} {"train_loss": -5.676665782928467, "global_step": 41624, "epoch": 991} {"train_loss": -5.744120121002197, "global_step": 41625, "epoch": 991} {"train_loss": -5.681676387786865, "global_step": 41626, "epoch": 991} {"train_loss": -5.715539932250977, "global_step": 41627, "epoch": 991} {"train_loss": -5.670823097229004, "global_step": 41628, "epoch": 991} {"train_loss": -5.675816535949707, "global_step": 41629, "epoch": 991} {"train_loss": -5.55211067199707, "global_step": 41630, "epoch": 991} {"train_loss": -5.631660461425781, "global_step": 41631, "epoch": 991} {"train_loss": -5.753705978393555, "global_step": 41632, "epoch": 991} {"train_loss": -5.697925567626953, "global_step": 41633, "epoch": 991} {"train_loss": -5.696663856506348, "global_step": 41634, "epoch": 991} {"train_loss": -5.758436679840088, "global_step": 41635, "epoch": 991} {"train_loss": -5.70351505279541, "global_step": 41636, "epoch": 991} {"train_loss": -5.694331169128418, "global_step": 41637, "epoch": 991} {"train_loss": -5.740086555480957, "global_step": 41638, "epoch": 991} {"train_loss": -5.659434795379639, "global_step": 41639, "epoch": 991} {"train_loss": -5.588872909545898, "global_step": 41640, "epoch": 991} {"train_loss": -5.75864839553833, "global_step": 41641, "epoch": 991} {"train_loss": -5.5115251541137695, "global_step": 41642, "epoch": 991} {"train_loss": -5.776337623596191, "global_step": 41643, "epoch": 991} {"train_loss": -5.699549198150635, "global_step": 41644, "epoch": 991} {"train_loss": -5.595376014709473, "global_step": 41645, "epoch": 991} {"train_loss": -5.633894920349121, "global_step": 41646, "epoch": 991} {"train_loss": -5.727837562561035, "global_step": 41647, "epoch": 991} {"train_loss": -5.4643425941467285, "global_step": 41648, "epoch": 991} {"train_loss": -5.71047306060791, "global_step": 41649, "epoch": 991} {"train_loss": -5.594019889831543, "global_step": 41650, "epoch": 991} {"train_loss": -5.596592903137207, "global_step": 41651, "epoch": 991} {"train_loss": -5.666230201721191, "global_step": 41652, "epoch": 991} {"train_loss": -5.488184928894043, "global_step": 41653, "epoch": 991} {"train_loss": -5.631982803344727, "global_step": 41654, "epoch": 991} {"train_loss": -5.602723121643066, "global_step": 41655, "epoch": 991} {"train_loss": -5.531869888305664, "global_step": 41656, "epoch": 991} {"train_loss": -5.607093811035156, "global_step": 41657, "epoch": 991} {"train_loss": -5.659428596496582, "global_step": 41658, "epoch": 991} {"train_loss": -5.548300743103027, "global_step": 41659, "epoch": 991} {"train_loss": -5.638123512268066, "global_step": 41660, "epoch": 991} {"train_loss": -5.648792266845703, "global_step": 41661, "epoch": 991} {"train_loss": -5.645040988922119, "global_step": 41662, "epoch": 991} {"train_loss": -5.655015638896397, "global_step": 41663, "epoch": 991, "val_loss": 73935.234375} {"train_loss": -5.607439041137695, "global_step": 41664, "epoch": 992} {"train_loss": -5.696074962615967, "global_step": 41665, "epoch": 992} {"train_loss": -5.6120829582214355, "global_step": 41666, "epoch": 992} {"train_loss": -5.691335201263428, "global_step": 41667, "epoch": 992} {"train_loss": -5.740616798400879, "global_step": 41668, "epoch": 992} {"train_loss": -5.600918769836426, "global_step": 41669, "epoch": 992} {"train_loss": -5.621455192565918, "global_step": 41670, "epoch": 992} {"train_loss": -5.760346412658691, "global_step": 41671, "epoch": 992} {"train_loss": -5.73294734954834, "global_step": 41672, "epoch": 992} {"train_loss": -5.658112525939941, "global_step": 41673, "epoch": 992} {"train_loss": -5.747271537780762, "global_step": 41674, "epoch": 992} {"train_loss": -5.730177879333496, "global_step": 41675, "epoch": 992} {"train_loss": -5.710972785949707, "global_step": 41676, "epoch": 992} {"train_loss": -5.729742050170898, "global_step": 41677, "epoch": 992} {"train_loss": -5.527507781982422, "global_step": 41678, "epoch": 992} {"train_loss": -5.660292625427246, "global_step": 41679, "epoch": 992} {"train_loss": -5.847081184387207, "global_step": 41680, "epoch": 992} {"train_loss": -5.645012855529785, "global_step": 41681, "epoch": 992} {"train_loss": -5.598021507263184, "global_step": 41682, "epoch": 992} {"train_loss": -5.7066755294799805, "global_step": 41683, "epoch": 992} {"train_loss": -5.693450450897217, "global_step": 41684, "epoch": 992} {"train_loss": -5.675246715545654, "global_step": 41685, "epoch": 992} {"train_loss": -5.5806803703308105, "global_step": 41686, "epoch": 992} {"train_loss": -5.617258548736572, "global_step": 41687, "epoch": 992} {"train_loss": -5.632247447967529, "global_step": 41688, "epoch": 992} {"train_loss": -5.623730659484863, "global_step": 41689, "epoch": 992} {"train_loss": -5.666182994842529, "global_step": 41690, "epoch": 992} {"train_loss": -5.615091323852539, "global_step": 41691, "epoch": 992} {"train_loss": -5.643007755279541, "global_step": 41692, "epoch": 992} {"train_loss": -5.561933994293213, "global_step": 41693, "epoch": 992} {"train_loss": -5.753114223480225, "global_step": 41694, "epoch": 992} {"train_loss": -5.575037002563477, "global_step": 41695, "epoch": 992} {"train_loss": -5.59797477722168, "global_step": 41696, "epoch": 992} {"train_loss": -5.597217082977295, "global_step": 41697, "epoch": 992} {"train_loss": -5.559093475341797, "global_step": 41698, "epoch": 992} {"train_loss": -5.656253337860107, "global_step": 41699, "epoch": 992} {"train_loss": -5.6256561279296875, "global_step": 41700, "epoch": 992} {"train_loss": -5.71828031539917, "global_step": 41701, "epoch": 992} {"train_loss": -5.64448356628418, "global_step": 41702, "epoch": 992} {"train_loss": -5.5975341796875, "global_step": 41703, "epoch": 992} {"train_loss": -5.67501163482666, "global_step": 41704, "epoch": 992} {"train_loss": -5.651965459187825, "global_step": 41705, "epoch": 992, "val_loss": 74191.890625} {"train_loss": -5.774261951446533, "global_step": 41706, "epoch": 993} {"train_loss": -5.637845516204834, "global_step": 41707, "epoch": 993} {"train_loss": -5.747766494750977, "global_step": 41708, "epoch": 993} {"train_loss": -5.583731651306152, "global_step": 41709, "epoch": 993} {"train_loss": -5.548674583435059, "global_step": 41710, "epoch": 993} {"train_loss": -5.666559219360352, "global_step": 41711, "epoch": 993} {"train_loss": -5.6544694900512695, "global_step": 41712, "epoch": 993} {"train_loss": -5.5218939781188965, "global_step": 41713, "epoch": 993} {"train_loss": -5.742987632751465, "global_step": 41714, "epoch": 993} {"train_loss": -5.630960464477539, "global_step": 41715, "epoch": 993} {"train_loss": -5.509674072265625, "global_step": 41716, "epoch": 993} {"train_loss": -5.618393898010254, "global_step": 41717, "epoch": 993} {"train_loss": -5.575298309326172, "global_step": 41718, "epoch": 993} {"train_loss": -5.555540084838867, "global_step": 41719, "epoch": 993} {"train_loss": -5.436078071594238, "global_step": 41720, "epoch": 993} {"train_loss": -5.579317092895508, "global_step": 41721, "epoch": 993} {"train_loss": -5.676934242248535, "global_step": 41722, "epoch": 993} {"train_loss": -5.520483016967773, "global_step": 41723, "epoch": 993} {"train_loss": -5.638978958129883, "global_step": 41724, "epoch": 993} {"train_loss": -5.717288017272949, "global_step": 41725, "epoch": 993} {"train_loss": -5.6009111404418945, "global_step": 41726, "epoch": 993} {"train_loss": -5.727128505706787, "global_step": 41727, "epoch": 993} {"train_loss": -5.725403785705566, "global_step": 41728, "epoch": 993} {"train_loss": -5.680824279785156, "global_step": 41729, "epoch": 993} {"train_loss": -5.6632304191589355, "global_step": 41730, "epoch": 993} {"train_loss": -5.5534210205078125, "global_step": 41731, "epoch": 993} {"train_loss": -5.649858474731445, "global_step": 41732, "epoch": 993} {"train_loss": -5.634590148925781, "global_step": 41733, "epoch": 993} {"train_loss": -5.694469928741455, "global_step": 41734, "epoch": 993} {"train_loss": -5.7050981521606445, "global_step": 41735, "epoch": 993} {"train_loss": -5.7704572677612305, "global_step": 41736, "epoch": 993} {"train_loss": -5.604757785797119, "global_step": 41737, "epoch": 993} {"train_loss": -5.64589786529541, "global_step": 41738, "epoch": 993} {"train_loss": -5.662965297698975, "global_step": 41739, "epoch": 993} {"train_loss": -5.703366279602051, "global_step": 41740, "epoch": 993} {"train_loss": -5.7015790939331055, "global_step": 41741, "epoch": 993} {"train_loss": -5.755623817443848, "global_step": 41742, "epoch": 993} {"train_loss": -5.533470153808594, "global_step": 41743, "epoch": 993} {"train_loss": -5.7027716636657715, "global_step": 41744, "epoch": 993} {"train_loss": -5.604357719421387, "global_step": 41745, "epoch": 993} {"train_loss": -5.685128211975098, "global_step": 41746, "epoch": 993} {"train_loss": -5.647053253083002, "global_step": 41747, "epoch": 993, "val_loss": 74263.09375} {"train_loss": -5.475114822387695, "global_step": 41748, "epoch": 994} {"train_loss": -5.703093528747559, "global_step": 41749, "epoch": 994} {"train_loss": -5.7170796394348145, "global_step": 41750, "epoch": 994} {"train_loss": -5.616617202758789, "global_step": 41751, "epoch": 994} {"train_loss": -5.614043235778809, "global_step": 41752, "epoch": 994} {"train_loss": -5.6089982986450195, "global_step": 41753, "epoch": 994} {"train_loss": -5.668174743652344, "global_step": 41754, "epoch": 994} {"train_loss": -5.598340034484863, "global_step": 41755, "epoch": 994} {"train_loss": -5.758643627166748, "global_step": 41756, "epoch": 994} {"train_loss": -5.63025426864624, "global_step": 41757, "epoch": 994} {"train_loss": -5.62099552154541, "global_step": 41758, "epoch": 994} {"train_loss": -5.766049861907959, "global_step": 41759, "epoch": 994} {"train_loss": -5.779216766357422, "global_step": 41760, "epoch": 994} {"train_loss": -5.63168478012085, "global_step": 41761, "epoch": 994} {"train_loss": -5.686450958251953, "global_step": 41762, "epoch": 994} {"train_loss": -5.706491470336914, "global_step": 41763, "epoch": 994} {"train_loss": -5.590224266052246, "global_step": 41764, "epoch": 994} {"train_loss": -5.679080963134766, "global_step": 41765, "epoch": 994} {"train_loss": -5.607089996337891, "global_step": 41766, "epoch": 994} {"train_loss": -5.616827011108398, "global_step": 41767, "epoch": 994} {"train_loss": -5.714809417724609, "global_step": 41768, "epoch": 994} {"train_loss": -5.624558448791504, "global_step": 41769, "epoch": 994} {"train_loss": -5.628456115722656, "global_step": 41770, "epoch": 994} {"train_loss": -5.506545066833496, "global_step": 41771, "epoch": 994} {"train_loss": -5.793678283691406, "global_step": 41772, "epoch": 994} {"train_loss": -5.820754051208496, "global_step": 41773, "epoch": 994} {"train_loss": -5.761224269866943, "global_step": 41774, "epoch": 994} {"train_loss": -5.6949262619018555, "global_step": 41775, "epoch": 994} {"train_loss": -5.589598655700684, "global_step": 41776, "epoch": 994} {"train_loss": -5.727868556976318, "global_step": 41777, "epoch": 994} {"train_loss": -5.564162254333496, "global_step": 41778, "epoch": 994} {"train_loss": -5.758750915527344, "global_step": 41779, "epoch": 994} {"train_loss": -5.651883125305176, "global_step": 41780, "epoch": 994} {"train_loss": -5.707622528076172, "global_step": 41781, "epoch": 994} {"train_loss": -5.665873050689697, "global_step": 41782, "epoch": 994} {"train_loss": -5.570381164550781, "global_step": 41783, "epoch": 994} {"train_loss": -5.6277875900268555, "global_step": 41784, "epoch": 994} {"train_loss": -5.57110595703125, "global_step": 41785, "epoch": 994} {"train_loss": -5.738471984863281, "global_step": 41786, "epoch": 994} {"train_loss": -5.540624618530273, "global_step": 41787, "epoch": 994} {"train_loss": -5.529721260070801, "global_step": 41788, "epoch": 994} {"train_loss": -5.654657738549369, "global_step": 41789, "epoch": 994, "val_loss": 73856.0625} {"train_loss": -5.649844169616699, "global_step": 41790, "epoch": 995} {"train_loss": -5.618269443511963, "global_step": 41791, "epoch": 995} {"train_loss": -5.676677703857422, "global_step": 41792, "epoch": 995} {"train_loss": -5.642661094665527, "global_step": 41793, "epoch": 995} {"train_loss": -5.757370948791504, "global_step": 41794, "epoch": 995} {"train_loss": -5.699650764465332, "global_step": 41795, "epoch": 995} {"train_loss": -5.744002819061279, "global_step": 41796, "epoch": 995} {"train_loss": -5.71373176574707, "global_step": 41797, "epoch": 995} {"train_loss": -5.672987937927246, "global_step": 41798, "epoch": 995} {"train_loss": -5.6771464347839355, "global_step": 41799, "epoch": 995} {"train_loss": -5.733301639556885, "global_step": 41800, "epoch": 995} {"train_loss": -5.547625541687012, "global_step": 41801, "epoch": 995} {"train_loss": -5.606534957885742, "global_step": 41802, "epoch": 995} {"train_loss": -5.706543445587158, "global_step": 41803, "epoch": 995} {"train_loss": -5.690398216247559, "global_step": 41804, "epoch": 995} {"train_loss": -5.516362190246582, "global_step": 41805, "epoch": 995} {"train_loss": -5.560964584350586, "global_step": 41806, "epoch": 995} {"train_loss": -5.578079700469971, "global_step": 41807, "epoch": 995} {"train_loss": -5.597522258758545, "global_step": 41808, "epoch": 995} {"train_loss": -5.779152870178223, "global_step": 41809, "epoch": 995} {"train_loss": -5.620798587799072, "global_step": 41810, "epoch": 995} {"train_loss": -5.663835525512695, "global_step": 41811, "epoch": 995} {"train_loss": -5.543489456176758, "global_step": 41812, "epoch": 995} {"train_loss": -5.633401870727539, "global_step": 41813, "epoch": 995} {"train_loss": -5.7540998458862305, "global_step": 41814, "epoch": 995} {"train_loss": -5.499096870422363, "global_step": 41815, "epoch": 995} {"train_loss": -5.556987285614014, "global_step": 41816, "epoch": 995} {"train_loss": -5.5664215087890625, "global_step": 41817, "epoch": 995} {"train_loss": -5.644601345062256, "global_step": 41818, "epoch": 995} {"train_loss": -5.648416519165039, "global_step": 41819, "epoch": 995} {"train_loss": -5.822322845458984, "global_step": 41820, "epoch": 995} {"train_loss": -5.605805397033691, "global_step": 41821, "epoch": 995} {"train_loss": -5.567554950714111, "global_step": 41822, "epoch": 995} {"train_loss": -5.666706085205078, "global_step": 41823, "epoch": 995} {"train_loss": -5.564274311065674, "global_step": 41824, "epoch": 995} {"train_loss": -5.6518144607543945, "global_step": 41825, "epoch": 995} {"train_loss": -5.549939155578613, "global_step": 41826, "epoch": 995} {"train_loss": -5.621913909912109, "global_step": 41827, "epoch": 995} {"train_loss": -5.567510604858398, "global_step": 41828, "epoch": 995} {"train_loss": -5.588254928588867, "global_step": 41829, "epoch": 995} {"train_loss": -5.479978084564209, "global_step": 41830, "epoch": 995} {"train_loss": -5.635173070998419, "global_step": 41831, "epoch": 995, "val_loss": 74279.15625} {"train_loss": -5.54844331741333, "global_step": 41832, "epoch": 996} {"train_loss": -5.57763147354126, "global_step": 41833, "epoch": 996} {"train_loss": -5.750912666320801, "global_step": 41834, "epoch": 996} {"train_loss": -5.628094673156738, "global_step": 41835, "epoch": 996} {"train_loss": -5.64862060546875, "global_step": 41836, "epoch": 996} {"train_loss": -5.600014686584473, "global_step": 41837, "epoch": 996} {"train_loss": -5.694705009460449, "global_step": 41838, "epoch": 996} {"train_loss": -5.67242956161499, "global_step": 41839, "epoch": 996} {"train_loss": -5.664252281188965, "global_step": 41840, "epoch": 996} {"train_loss": -5.7281904220581055, "global_step": 41841, "epoch": 996} {"train_loss": -5.641890048980713, "global_step": 41842, "epoch": 996} {"train_loss": -5.602481842041016, "global_step": 41843, "epoch": 996} {"train_loss": -5.596136093139648, "global_step": 41844, "epoch": 996} {"train_loss": -5.756130218505859, "global_step": 41845, "epoch": 996} {"train_loss": -5.550634384155273, "global_step": 41846, "epoch": 996} {"train_loss": -5.621434688568115, "global_step": 41847, "epoch": 996} {"train_loss": -5.781136989593506, "global_step": 41848, "epoch": 996} {"train_loss": -5.7737627029418945, "global_step": 41849, "epoch": 996} {"train_loss": -5.665408134460449, "global_step": 41850, "epoch": 996} {"train_loss": -5.619792461395264, "global_step": 41851, "epoch": 996} {"train_loss": -5.634353160858154, "global_step": 41852, "epoch": 996} {"train_loss": -5.634461879730225, "global_step": 41853, "epoch": 996} {"train_loss": -5.598320960998535, "global_step": 41854, "epoch": 996} {"train_loss": -5.627716064453125, "global_step": 41855, "epoch": 996} {"train_loss": -5.558002948760986, "global_step": 41856, "epoch": 996} {"train_loss": -5.7933430671691895, "global_step": 41857, "epoch": 996} {"train_loss": -5.534563064575195, "global_step": 41858, "epoch": 996} {"train_loss": -5.627904415130615, "global_step": 41859, "epoch": 996} {"train_loss": -5.756387233734131, "global_step": 41860, "epoch": 996} {"train_loss": -5.662667274475098, "global_step": 41861, "epoch": 996} {"train_loss": -5.7662577629089355, "global_step": 41862, "epoch": 996} {"train_loss": -5.650903701782227, "global_step": 41863, "epoch": 996} {"train_loss": -5.616216659545898, "global_step": 41864, "epoch": 996} {"train_loss": -5.496380805969238, "global_step": 41865, "epoch": 996} {"train_loss": -5.7391180992126465, "global_step": 41866, "epoch": 996} {"train_loss": -5.666965484619141, "global_step": 41867, "epoch": 996} {"train_loss": -5.598101615905762, "global_step": 41868, "epoch": 996} {"train_loss": -5.673566818237305, "global_step": 41869, "epoch": 996} {"train_loss": -5.7097272872924805, "global_step": 41870, "epoch": 996} {"train_loss": -5.638804912567139, "global_step": 41871, "epoch": 996} {"train_loss": -5.758858680725098, "global_step": 41872, "epoch": 996} {"train_loss": -5.654576732998803, "global_step": 41873, "epoch": 996, "val_loss": 74228.8125} {"train_loss": -5.604333400726318, "global_step": 41874, "epoch": 997} {"train_loss": -5.888933181762695, "global_step": 41875, "epoch": 997} {"train_loss": -5.623125076293945, "global_step": 41876, "epoch": 997} {"train_loss": -5.697826862335205, "global_step": 41877, "epoch": 997} {"train_loss": -5.735151290893555, "global_step": 41878, "epoch": 997} {"train_loss": -5.770967960357666, "global_step": 41879, "epoch": 997} {"train_loss": -5.820261001586914, "global_step": 41880, "epoch": 997} {"train_loss": -5.637414932250977, "global_step": 41881, "epoch": 997} {"train_loss": -5.67186164855957, "global_step": 41882, "epoch": 997} {"train_loss": -5.647624969482422, "global_step": 41883, "epoch": 997} {"train_loss": -5.786197662353516, "global_step": 41884, "epoch": 997} {"train_loss": -5.540678977966309, "global_step": 41885, "epoch": 997} {"train_loss": -5.677979469299316, "global_step": 41886, "epoch": 997} {"train_loss": -5.486025810241699, "global_step": 41887, "epoch": 997} {"train_loss": -5.601386070251465, "global_step": 41888, "epoch": 997} {"train_loss": -5.710038661956787, "global_step": 41889, "epoch": 997} {"train_loss": -5.481922149658203, "global_step": 41890, "epoch": 997} {"train_loss": -5.669887065887451, "global_step": 41891, "epoch": 997} {"train_loss": -5.581110000610352, "global_step": 41892, "epoch": 997} {"train_loss": -5.591424942016602, "global_step": 41893, "epoch": 997} {"train_loss": -5.618599891662598, "global_step": 41894, "epoch": 997} {"train_loss": -5.570767879486084, "global_step": 41895, "epoch": 997} {"train_loss": -5.499028205871582, "global_step": 41896, "epoch": 997} {"train_loss": -5.6068620681762695, "global_step": 41897, "epoch": 997} {"train_loss": -5.457088470458984, "global_step": 41898, "epoch": 997} {"train_loss": -5.522708415985107, "global_step": 41899, "epoch": 997} {"train_loss": -5.705724239349365, "global_step": 41900, "epoch": 997} {"train_loss": -5.65777063369751, "global_step": 41901, "epoch": 997} {"train_loss": -5.662473678588867, "global_step": 41902, "epoch": 997} {"train_loss": -5.660406589508057, "global_step": 41903, "epoch": 997} {"train_loss": -5.5590901374816895, "global_step": 41904, "epoch": 997} {"train_loss": -5.586245536804199, "global_step": 41905, "epoch": 997} {"train_loss": -5.699956893920898, "global_step": 41906, "epoch": 997} {"train_loss": -5.572470664978027, "global_step": 41907, "epoch": 997} {"train_loss": -5.711812973022461, "global_step": 41908, "epoch": 997} {"train_loss": -5.654143333435059, "global_step": 41909, "epoch": 997} {"train_loss": -5.770468711853027, "global_step": 41910, "epoch": 997} {"train_loss": -5.698134899139404, "global_step": 41911, "epoch": 997} {"train_loss": -5.548426628112793, "global_step": 41912, "epoch": 997} {"train_loss": -5.702601432800293, "global_step": 41913, "epoch": 997} {"train_loss": -5.7077202796936035, "global_step": 41914, "epoch": 997} {"train_loss": -5.641395228249686, "global_step": 41915, "epoch": 997, "val_loss": 74209.375} {"train_loss": -5.612198829650879, "global_step": 41916, "epoch": 998} {"train_loss": -5.654911041259766, "global_step": 41917, "epoch": 998} {"train_loss": -5.649981498718262, "global_step": 41918, "epoch": 998} {"train_loss": -5.628931522369385, "global_step": 41919, "epoch": 998} {"train_loss": -5.625336170196533, "global_step": 41920, "epoch": 998} {"train_loss": -5.753425598144531, "global_step": 41921, "epoch": 998} {"train_loss": -5.787386417388916, "global_step": 41922, "epoch": 998} {"train_loss": -5.753612518310547, "global_step": 41923, "epoch": 998} {"train_loss": -5.605497360229492, "global_step": 41924, "epoch": 998} {"train_loss": -5.783783912658691, "global_step": 41925, "epoch": 998} {"train_loss": -5.62571382522583, "global_step": 41926, "epoch": 998} {"train_loss": -5.7371416091918945, "global_step": 41927, "epoch": 998} {"train_loss": -5.725208282470703, "global_step": 41928, "epoch": 998} {"train_loss": -5.658344745635986, "global_step": 41929, "epoch": 998} {"train_loss": -5.659908294677734, "global_step": 41930, "epoch": 998} {"train_loss": -5.629754066467285, "global_step": 41931, "epoch": 998} {"train_loss": -5.690230369567871, "global_step": 41932, "epoch": 998} {"train_loss": -5.5503249168396, "global_step": 41933, "epoch": 998} {"train_loss": -5.626726150512695, "global_step": 41934, "epoch": 998} {"train_loss": -5.6650238037109375, "global_step": 41935, "epoch": 998} {"train_loss": -5.527231216430664, "global_step": 41936, "epoch": 998} {"train_loss": -5.67535400390625, "global_step": 41937, "epoch": 998} {"train_loss": -5.706172943115234, "global_step": 41938, "epoch": 998} {"train_loss": -5.489421844482422, "global_step": 41939, "epoch": 998} {"train_loss": -5.731626510620117, "global_step": 41940, "epoch": 998} {"train_loss": -5.689963340759277, "global_step": 41941, "epoch": 998} {"train_loss": -5.53989315032959, "global_step": 41942, "epoch": 998} {"train_loss": -5.6844635009765625, "global_step": 41943, "epoch": 998} {"train_loss": -5.7231621742248535, "global_step": 41944, "epoch": 998} {"train_loss": -5.665276527404785, "global_step": 41945, "epoch": 998} {"train_loss": -5.74001407623291, "global_step": 41946, "epoch": 998} {"train_loss": -5.541123390197754, "global_step": 41947, "epoch": 998} {"train_loss": -5.633072853088379, "global_step": 41948, "epoch": 998} {"train_loss": -5.58098030090332, "global_step": 41949, "epoch": 998} {"train_loss": -5.7555365562438965, "global_step": 41950, "epoch": 998} {"train_loss": -5.591091156005859, "global_step": 41951, "epoch": 998} {"train_loss": -5.653129577636719, "global_step": 41952, "epoch": 998} {"train_loss": -5.581109046936035, "global_step": 41953, "epoch": 998} {"train_loss": -5.520280838012695, "global_step": 41954, "epoch": 998} {"train_loss": -5.51390266418457, "global_step": 41955, "epoch": 998} {"train_loss": -5.6282758712768555, "global_step": 41956, "epoch": 998} {"train_loss": -5.648228372846331, "global_step": 41957, "epoch": 998, "val_loss": 73632.1171875} {"train_loss": -5.757857322692871, "global_step": 41958, "epoch": 999} {"train_loss": -5.65540885925293, "global_step": 41959, "epoch": 999} {"train_loss": -5.713400363922119, "global_step": 41960, "epoch": 999} {"train_loss": -5.535576820373535, "global_step": 41961, "epoch": 999} {"train_loss": -5.664455890655518, "global_step": 41962, "epoch": 999} {"train_loss": -5.597886562347412, "global_step": 41963, "epoch": 999} {"train_loss": -5.710201263427734, "global_step": 41964, "epoch": 999} {"train_loss": -5.681192398071289, "global_step": 41965, "epoch": 999} {"train_loss": -5.690393924713135, "global_step": 41966, "epoch": 999} {"train_loss": -5.652349472045898, "global_step": 41967, "epoch": 999} {"train_loss": -5.74509859085083, "global_step": 41968, "epoch": 999} {"train_loss": -5.801972389221191, "global_step": 41969, "epoch": 999} {"train_loss": -5.822475910186768, "global_step": 41970, "epoch": 999} {"train_loss": -5.693599700927734, "global_step": 41971, "epoch": 999} {"train_loss": -5.672738075256348, "global_step": 41972, "epoch": 999} {"train_loss": -5.481446266174316, "global_step": 41973, "epoch": 999} {"train_loss": -5.637132167816162, "global_step": 41974, "epoch": 999} {"train_loss": -5.658915996551514, "global_step": 41975, "epoch": 999} {"train_loss": -5.50186824798584, "global_step": 41976, "epoch": 999} {"train_loss": -5.698202610015869, "global_step": 41977, "epoch": 999} {"train_loss": -5.593784332275391, "global_step": 41978, "epoch": 999} {"train_loss": -5.501128196716309, "global_step": 41979, "epoch": 999} {"train_loss": -5.565454959869385, "global_step": 41980, "epoch": 999} {"train_loss": -5.717555046081543, "global_step": 41981, "epoch": 999} {"train_loss": -5.574366569519043, "global_step": 41982, "epoch": 999} {"train_loss": -5.650574207305908, "global_step": 41983, "epoch": 999} {"train_loss": -5.6587138175964355, "global_step": 41984, "epoch": 999} {"train_loss": -5.647726058959961, "global_step": 41985, "epoch": 999} {"train_loss": -5.736582279205322, "global_step": 41986, "epoch": 999} {"train_loss": -5.661272048950195, "global_step": 41987, "epoch": 999} {"train_loss": -5.609480857849121, "global_step": 41988, "epoch": 999} {"train_loss": -5.669422149658203, "global_step": 41989, "epoch": 999} {"train_loss": -5.720934867858887, "global_step": 41990, "epoch": 999} {"train_loss": -5.590051651000977, "global_step": 41991, "epoch": 999} {"train_loss": -5.658664226531982, "global_step": 41992, "epoch": 999} {"train_loss": -5.678184509277344, "global_step": 41993, "epoch": 999} {"train_loss": -5.715209484100342, "global_step": 41994, "epoch": 999} {"train_loss": -5.437981128692627, "global_step": 41995, "epoch": 999} {"train_loss": -5.7598724365234375, "global_step": 41996, "epoch": 999} {"train_loss": -5.812225341796875, "global_step": 41997, "epoch": 999} {"train_loss": -5.632396697998047, "global_step": 41998, "epoch": 999} {"train_loss": -5.655030080250332, "global_step": 41999, "epoch": 999, "val_loss": 74254.046875} {"train_loss": -5.740384101867676, "global_step": 42000, "epoch": 1000} {"train_loss": -5.592331886291504, "global_step": 42001, "epoch": 1000} {"train_loss": -5.629953384399414, "global_step": 42002, "epoch": 1000} {"train_loss": -5.7074785232543945, "global_step": 42003, "epoch": 1000} {"train_loss": -5.7473859786987305, "global_step": 42004, "epoch": 1000} {"train_loss": -5.637872695922852, "global_step": 42005, "epoch": 1000} {"train_loss": -5.6570539474487305, "global_step": 42006, "epoch": 1000} {"train_loss": -5.726051330566406, "global_step": 42007, "epoch": 1000} {"train_loss": -5.765831470489502, "global_step": 42008, "epoch": 1000} {"train_loss": -5.774018287658691, "global_step": 42009, "epoch": 1000} {"train_loss": -5.791610240936279, "global_step": 42010, "epoch": 1000} {"train_loss": -5.570401191711426, "global_step": 42011, "epoch": 1000} {"train_loss": -5.649087905883789, "global_step": 42012, "epoch": 1000} {"train_loss": -5.632043838500977, "global_step": 42013, "epoch": 1000} {"train_loss": -5.566915512084961, "global_step": 42014, "epoch": 1000} {"train_loss": -5.702181339263916, "global_step": 42015, "epoch": 1000} {"train_loss": -5.60307502746582, "global_step": 42016, "epoch": 1000} {"train_loss": -5.690902233123779, "global_step": 42017, "epoch": 1000} {"train_loss": -5.751777648925781, "global_step": 42018, "epoch": 1000} {"train_loss": -5.668725490570068, "global_step": 42019, "epoch": 1000} {"train_loss": -5.690738677978516, "global_step": 42020, "epoch": 1000} {"train_loss": -5.552945613861084, "global_step": 42021, "epoch": 1000} {"train_loss": -5.751734733581543, "global_step": 42022, "epoch": 1000} {"train_loss": -5.627931594848633, "global_step": 42023, "epoch": 1000} {"train_loss": -5.605712890625, "global_step": 42024, "epoch": 1000} {"train_loss": -5.585980415344238, "global_step": 42025, "epoch": 1000} {"train_loss": -5.667806148529053, "global_step": 42026, "epoch": 1000} {"train_loss": -5.389616012573242, "global_step": 42027, "epoch": 1000} {"train_loss": -5.564477920532227, "global_step": 42028, "epoch": 1000} {"train_loss": -5.618708610534668, "global_step": 42029, "epoch": 1000} {"train_loss": -5.744515895843506, "global_step": 42030, "epoch": 1000} {"train_loss": -5.551638603210449, "global_step": 42031, "epoch": 1000} {"train_loss": -5.374629974365234, "global_step": 42032, "epoch": 1000} {"train_loss": -5.603703498840332, "global_step": 42033, "epoch": 1000} {"train_loss": -5.574645042419434, "global_step": 42034, "epoch": 1000} {"train_loss": -5.50075626373291, "global_step": 42035, "epoch": 1000} {"train_loss": -5.584125995635986, "global_step": 42036, "epoch": 1000} {"train_loss": -5.520178318023682, "global_step": 42037, "epoch": 1000} {"train_loss": -5.5238776206970215, "global_step": 42038, "epoch": 1000} {"train_loss": -5.629118919372559, "global_step": 42039, "epoch": 1000} {"train_loss": -5.518956184387207, "global_step": 42040, "epoch": 1000} {"train_loss": -5.627850453058879, "global_step": 42041, "epoch": 1000, "train/sim_max_reward_0": 0.41068229851013616, "train/sim_max_reward_1": 0.3977710041384537, "train/sim_max_reward_2": 0.5910173302150681, "train/sim_max_reward_3": 0.5383089607610134, "train/sim_max_reward_4": 0.4850508169448111, "train/sim_max_reward_5": 0.5531944758985575, "test/sim_max_reward_4500000": 0.9216297623493862, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.6926761186363373, "test/sim_max_reward_4500003": 0.5850639028030629, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.6942336953961085, "test/sim_max_reward_4500006": 0.35162992669139687, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.13877151901595638, "test/sim_max_reward_4500009": 0.2136971958267994, "test/sim_max_reward_4500010": 0.3921447383294135, "test/sim_max_reward_4500011": 0.9681201670534111, "test/sim_max_reward_4500012": 0.2506877536011513, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.8130988997045789, "test/sim_max_reward_4500015": 0.6090737707947426, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.37247843816384324, "test/sim_max_reward_4500019": 0.7615899862431637, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.551204370331159, "test/sim_max_reward_4500022": 0.5937605478217479, "test/sim_max_reward_4500023": 0.859618065267892, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8814650858307259, "test/sim_max_reward_4500026": 0.15682830335809547, "test/sim_max_reward_4500027": 0.9777121216957934, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.05167089020169172, "test/sim_max_reward_4500030": 0.3277649434222934, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.4008160885969732, "test/sim_max_reward_4500033": 0.003052211634319562, "test/sim_max_reward_4500034": 0.7829123546330673, "test/sim_max_reward_4500035": 0.888257664235745, "test/sim_max_reward_4500036": 0.755644966742541, "test/sim_max_reward_4500037": 0.9229105816544813, "test/sim_max_reward_4500038": 0.19484509856831206, "test/sim_max_reward_4500039": 0.9477558137299398, "test/sim_max_reward_4500040": 0.8733492370887871, "test/sim_max_reward_4500041": 0.47518039085804004, "test/sim_max_reward_4500042": 0.15409132046204316, "test/sim_max_reward_4500043": 0.16525366166568656, "test/sim_max_reward_4500044": 0.5050334574047289, "test/sim_max_reward_4500045": 0.34772970015873866, "test/sim_max_reward_4500046": 0.6190128255290769, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9336384678550675, "test/sim_max_reward_4500049": 0.5115024853164117, "train/mean_score": 0.49600414774467333, "test/mean_score": 0.43812416422862294, "val_loss": 73874.234375} {"train_loss": -5.576715469360352, "global_step": 42042, "epoch": 1001} {"train_loss": -5.552457809448242, "global_step": 42043, "epoch": 1001} {"train_loss": -5.768886566162109, "global_step": 42044, "epoch": 1001} {"train_loss": -5.776174545288086, "global_step": 42045, "epoch": 1001} {"train_loss": -5.691913604736328, "global_step": 42046, "epoch": 1001} {"train_loss": -5.592798233032227, "global_step": 42047, "epoch": 1001} {"train_loss": -5.804682731628418, "global_step": 42048, "epoch": 1001} {"train_loss": -5.529677391052246, "global_step": 42049, "epoch": 1001} {"train_loss": -5.655163764953613, "global_step": 42050, "epoch": 1001} {"train_loss": -5.711688995361328, "global_step": 42051, "epoch": 1001} {"train_loss": -5.564033031463623, "global_step": 42052, "epoch": 1001} {"train_loss": -5.643463134765625, "global_step": 42053, "epoch": 1001} {"train_loss": -5.670097351074219, "global_step": 42054, "epoch": 1001} {"train_loss": -5.620425224304199, "global_step": 42055, "epoch": 1001} {"train_loss": -5.619654178619385, "global_step": 42056, "epoch": 1001} {"train_loss": -5.686241149902344, "global_step": 42057, "epoch": 1001} {"train_loss": -5.71274471282959, "global_step": 42058, "epoch": 1001} {"train_loss": -5.578423500061035, "global_step": 42059, "epoch": 1001} {"train_loss": -5.773586750030518, "global_step": 42060, "epoch": 1001} {"train_loss": -5.578993797302246, "global_step": 42061, "epoch": 1001} {"train_loss": -5.641517639160156, "global_step": 42062, "epoch": 1001} {"train_loss": -5.6686296463012695, "global_step": 42063, "epoch": 1001} {"train_loss": -5.688930988311768, "global_step": 42064, "epoch": 1001} {"train_loss": -5.690557479858398, "global_step": 42065, "epoch": 1001} {"train_loss": -5.645048141479492, "global_step": 42066, "epoch": 1001} {"train_loss": -5.592703819274902, "global_step": 42067, "epoch": 1001} {"train_loss": -5.712669372558594, "global_step": 42068, "epoch": 1001} {"train_loss": -5.667191982269287, "global_step": 42069, "epoch": 1001} {"train_loss": -5.684645175933838, "global_step": 42070, "epoch": 1001} {"train_loss": -5.661403656005859, "global_step": 42071, "epoch": 1001} {"train_loss": -5.6352691650390625, "global_step": 42072, "epoch": 1001} {"train_loss": -5.640592575073242, "global_step": 42073, "epoch": 1001} {"train_loss": -5.636266708374023, "global_step": 42074, "epoch": 1001} {"train_loss": -5.598806858062744, "global_step": 42075, "epoch": 1001} {"train_loss": -5.7042622566223145, "global_step": 42076, "epoch": 1001} {"train_loss": -5.695683479309082, "global_step": 42077, "epoch": 1001} {"train_loss": -5.756924629211426, "global_step": 42078, "epoch": 1001} {"train_loss": -5.753011703491211, "global_step": 42079, "epoch": 1001} {"train_loss": -5.7243242263793945, "global_step": 42080, "epoch": 1001} {"train_loss": -5.603050231933594, "global_step": 42081, "epoch": 1001} {"train_loss": -5.560751438140869, "global_step": 42082, "epoch": 1001} {"train_loss": -5.661726735887074, "global_step": 42083, "epoch": 1001, "val_loss": 74066.7421875} {"train_loss": -5.598822593688965, "global_step": 42084, "epoch": 1002} {"train_loss": -5.662628173828125, "global_step": 42085, "epoch": 1002} {"train_loss": -5.6358232498168945, "global_step": 42086, "epoch": 1002} {"train_loss": -5.570700645446777, "global_step": 42087, "epoch": 1002} {"train_loss": -5.655367374420166, "global_step": 42088, "epoch": 1002} {"train_loss": -5.710224151611328, "global_step": 42089, "epoch": 1002} {"train_loss": -5.531032562255859, "global_step": 42090, "epoch": 1002} {"train_loss": -5.652333736419678, "global_step": 42091, "epoch": 1002} {"train_loss": -5.841107368469238, "global_step": 42092, "epoch": 1002} {"train_loss": -5.701084136962891, "global_step": 42093, "epoch": 1002} {"train_loss": -5.710041046142578, "global_step": 42094, "epoch": 1002} {"train_loss": -5.660465717315674, "global_step": 42095, "epoch": 1002} {"train_loss": -5.656363487243652, "global_step": 42096, "epoch": 1002} {"train_loss": -5.705211639404297, "global_step": 42097, "epoch": 1002} {"train_loss": -5.619696617126465, "global_step": 42098, "epoch": 1002} {"train_loss": -5.544340133666992, "global_step": 42099, "epoch": 1002} {"train_loss": -5.720156669616699, "global_step": 42100, "epoch": 1002} {"train_loss": -5.686552047729492, "global_step": 42101, "epoch": 1002} {"train_loss": -5.670285224914551, "global_step": 42102, "epoch": 1002} {"train_loss": -5.766488075256348, "global_step": 42103, "epoch": 1002} {"train_loss": -5.726816654205322, "global_step": 42104, "epoch": 1002} {"train_loss": -5.672714710235596, "global_step": 42105, "epoch": 1002} {"train_loss": -5.673666954040527, "global_step": 42106, "epoch": 1002} {"train_loss": -5.8135576248168945, "global_step": 42107, "epoch": 1002} {"train_loss": -5.641189098358154, "global_step": 42108, "epoch": 1002} {"train_loss": -5.630361557006836, "global_step": 42109, "epoch": 1002} {"train_loss": -5.63330078125, "global_step": 42110, "epoch": 1002} {"train_loss": -5.705453872680664, "global_step": 42111, "epoch": 1002} {"train_loss": -5.730541229248047, "global_step": 42112, "epoch": 1002} {"train_loss": -5.468148231506348, "global_step": 42113, "epoch": 1002} {"train_loss": -5.637157440185547, "global_step": 42114, "epoch": 1002} {"train_loss": -5.600942611694336, "global_step": 42115, "epoch": 1002} {"train_loss": -5.742641925811768, "global_step": 42116, "epoch": 1002} {"train_loss": -5.568306922912598, "global_step": 42117, "epoch": 1002} {"train_loss": -5.666103363037109, "global_step": 42118, "epoch": 1002} {"train_loss": -5.66562557220459, "global_step": 42119, "epoch": 1002} {"train_loss": -5.659814834594727, "global_step": 42120, "epoch": 1002} {"train_loss": -5.56365966796875, "global_step": 42121, "epoch": 1002} {"train_loss": -5.626983642578125, "global_step": 42122, "epoch": 1002} {"train_loss": -5.607409477233887, "global_step": 42123, "epoch": 1002} {"train_loss": -5.685070991516113, "global_step": 42124, "epoch": 1002} {"train_loss": -5.659215245928083, "global_step": 42125, "epoch": 1002, "val_loss": 74391.7109375} {"train_loss": -5.588253021240234, "global_step": 42126, "epoch": 1003} {"train_loss": -5.646415710449219, "global_step": 42127, "epoch": 1003} {"train_loss": -5.640575408935547, "global_step": 42128, "epoch": 1003} {"train_loss": -5.577495574951172, "global_step": 42129, "epoch": 1003} {"train_loss": -5.725228786468506, "global_step": 42130, "epoch": 1003} {"train_loss": -5.566650390625, "global_step": 42131, "epoch": 1003} {"train_loss": -5.642181396484375, "global_step": 42132, "epoch": 1003} {"train_loss": -5.543874263763428, "global_step": 42133, "epoch": 1003} {"train_loss": -5.698542594909668, "global_step": 42134, "epoch": 1003} {"train_loss": -5.56629753112793, "global_step": 42135, "epoch": 1003} {"train_loss": -5.790740966796875, "global_step": 42136, "epoch": 1003} {"train_loss": -5.622462272644043, "global_step": 42137, "epoch": 1003} {"train_loss": -5.593788146972656, "global_step": 42138, "epoch": 1003} {"train_loss": -5.672544956207275, "global_step": 42139, "epoch": 1003} {"train_loss": -5.717310428619385, "global_step": 42140, "epoch": 1003} {"train_loss": -5.71921443939209, "global_step": 42141, "epoch": 1003} {"train_loss": -5.572025299072266, "global_step": 42142, "epoch": 1003} {"train_loss": -5.607182502746582, "global_step": 42143, "epoch": 1003} {"train_loss": -5.727870941162109, "global_step": 42144, "epoch": 1003} {"train_loss": -5.651308059692383, "global_step": 42145, "epoch": 1003} {"train_loss": -5.6438703536987305, "global_step": 42146, "epoch": 1003} {"train_loss": -5.613842487335205, "global_step": 42147, "epoch": 1003} {"train_loss": -5.648333549499512, "global_step": 42148, "epoch": 1003} {"train_loss": -5.595863342285156, "global_step": 42149, "epoch": 1003} {"train_loss": -5.719884872436523, "global_step": 42150, "epoch": 1003} {"train_loss": -5.485736846923828, "global_step": 42151, "epoch": 1003} {"train_loss": -5.676610469818115, "global_step": 42152, "epoch": 1003} {"train_loss": -5.7127227783203125, "global_step": 42153, "epoch": 1003} {"train_loss": -5.675343036651611, "global_step": 42154, "epoch": 1003} {"train_loss": -5.501800060272217, "global_step": 42155, "epoch": 1003} {"train_loss": -5.605287551879883, "global_step": 42156, "epoch": 1003} {"train_loss": -5.7673139572143555, "global_step": 42157, "epoch": 1003} {"train_loss": -5.390992164611816, "global_step": 42158, "epoch": 1003} {"train_loss": -5.631910800933838, "global_step": 42159, "epoch": 1003} {"train_loss": -5.6789960861206055, "global_step": 42160, "epoch": 1003} {"train_loss": -5.517953395843506, "global_step": 42161, "epoch": 1003} {"train_loss": -5.593850612640381, "global_step": 42162, "epoch": 1003} {"train_loss": -5.66706657409668, "global_step": 42163, "epoch": 1003} {"train_loss": -5.609105110168457, "global_step": 42164, "epoch": 1003} {"train_loss": -5.60004997253418, "global_step": 42165, "epoch": 1003} {"train_loss": -5.504818916320801, "global_step": 42166, "epoch": 1003} {"train_loss": -5.629194543475196, "global_step": 42167, "epoch": 1003, "val_loss": 74458.140625} {"train_loss": -5.538449764251709, "global_step": 42168, "epoch": 1004} {"train_loss": -5.574694633483887, "global_step": 42169, "epoch": 1004} {"train_loss": -5.566490173339844, "global_step": 42170, "epoch": 1004} {"train_loss": -5.638692855834961, "global_step": 42171, "epoch": 1004} {"train_loss": -5.564088821411133, "global_step": 42172, "epoch": 1004} {"train_loss": -5.549920558929443, "global_step": 42173, "epoch": 1004} {"train_loss": -5.687012195587158, "global_step": 42174, "epoch": 1004} {"train_loss": -5.610511779785156, "global_step": 42175, "epoch": 1004} {"train_loss": -5.542137145996094, "global_step": 42176, "epoch": 1004} {"train_loss": -5.502129554748535, "global_step": 42177, "epoch": 1004} {"train_loss": -5.648463726043701, "global_step": 42178, "epoch": 1004} {"train_loss": -5.5704193115234375, "global_step": 42179, "epoch": 1004} {"train_loss": -5.641849517822266, "global_step": 42180, "epoch": 1004} {"train_loss": -5.6750006675720215, "global_step": 42181, "epoch": 1004} {"train_loss": -5.664639472961426, "global_step": 42182, "epoch": 1004} {"train_loss": -5.707770347595215, "global_step": 42183, "epoch": 1004} {"train_loss": -5.599286079406738, "global_step": 42184, "epoch": 1004} {"train_loss": -5.633927345275879, "global_step": 42185, "epoch": 1004} {"train_loss": -5.769655704498291, "global_step": 42186, "epoch": 1004} {"train_loss": -5.629159927368164, "global_step": 42187, "epoch": 1004} {"train_loss": -5.676118850708008, "global_step": 42188, "epoch": 1004} {"train_loss": -5.766287803649902, "global_step": 42189, "epoch": 1004} {"train_loss": -5.641561508178711, "global_step": 42190, "epoch": 1004} {"train_loss": -5.599639892578125, "global_step": 42191, "epoch": 1004} {"train_loss": -5.68303108215332, "global_step": 42192, "epoch": 1004} {"train_loss": -5.740733623504639, "global_step": 42193, "epoch": 1004} {"train_loss": -5.676883220672607, "global_step": 42194, "epoch": 1004} {"train_loss": -5.544582843780518, "global_step": 42195, "epoch": 1004} {"train_loss": -5.85075044631958, "global_step": 42196, "epoch": 1004} {"train_loss": -5.6592888832092285, "global_step": 42197, "epoch": 1004} {"train_loss": -5.711711883544922, "global_step": 42198, "epoch": 1004} {"train_loss": -5.544334411621094, "global_step": 42199, "epoch": 1004} {"train_loss": -5.572722434997559, "global_step": 42200, "epoch": 1004} {"train_loss": -5.851579666137695, "global_step": 42201, "epoch": 1004} {"train_loss": -5.723871231079102, "global_step": 42202, "epoch": 1004} {"train_loss": -5.620511054992676, "global_step": 42203, "epoch": 1004} {"train_loss": -5.503355026245117, "global_step": 42204, "epoch": 1004} {"train_loss": -5.664579391479492, "global_step": 42205, "epoch": 1004} {"train_loss": -5.705644607543945, "global_step": 42206, "epoch": 1004} {"train_loss": -5.67296028137207, "global_step": 42207, "epoch": 1004} {"train_loss": -5.717324256896973, "global_step": 42208, "epoch": 1004} {"train_loss": -5.644077323731922, "global_step": 42209, "epoch": 1004, "val_loss": 74132.7734375} {"train_loss": -5.618083477020264, "global_step": 42210, "epoch": 1005} {"train_loss": -5.563074111938477, "global_step": 42211, "epoch": 1005} {"train_loss": -5.633153438568115, "global_step": 42212, "epoch": 1005} {"train_loss": -5.614671230316162, "global_step": 42213, "epoch": 1005} {"train_loss": -5.5771989822387695, "global_step": 42214, "epoch": 1005} {"train_loss": -5.665643692016602, "global_step": 42215, "epoch": 1005} {"train_loss": -5.425745010375977, "global_step": 42216, "epoch": 1005} {"train_loss": -5.697170734405518, "global_step": 42217, "epoch": 1005} {"train_loss": -5.695187568664551, "global_step": 42218, "epoch": 1005} {"train_loss": -5.700503349304199, "global_step": 42219, "epoch": 1005} {"train_loss": -5.724349021911621, "global_step": 42220, "epoch": 1005} {"train_loss": -5.637393951416016, "global_step": 42221, "epoch": 1005} {"train_loss": -5.743639945983887, "global_step": 42222, "epoch": 1005} {"train_loss": -5.680480480194092, "global_step": 42223, "epoch": 1005} {"train_loss": -5.759147644042969, "global_step": 42224, "epoch": 1005} {"train_loss": -5.543091773986816, "global_step": 42225, "epoch": 1005} {"train_loss": -5.723414897918701, "global_step": 42226, "epoch": 1005} {"train_loss": -5.672222137451172, "global_step": 42227, "epoch": 1005} {"train_loss": -5.738862037658691, "global_step": 42228, "epoch": 1005} {"train_loss": -5.526627540588379, "global_step": 42229, "epoch": 1005} {"train_loss": -5.539323329925537, "global_step": 42230, "epoch": 1005} {"train_loss": -5.594356060028076, "global_step": 42231, "epoch": 1005} {"train_loss": -5.711418151855469, "global_step": 42232, "epoch": 1005} {"train_loss": -5.593277931213379, "global_step": 42233, "epoch": 1005} {"train_loss": -5.5696516036987305, "global_step": 42234, "epoch": 1005} {"train_loss": -5.717137336730957, "global_step": 42235, "epoch": 1005} {"train_loss": -5.649079322814941, "global_step": 42236, "epoch": 1005} {"train_loss": -5.673418998718262, "global_step": 42237, "epoch": 1005} {"train_loss": -5.589132785797119, "global_step": 42238, "epoch": 1005} {"train_loss": -5.660031795501709, "global_step": 42239, "epoch": 1005} {"train_loss": -5.677997589111328, "global_step": 42240, "epoch": 1005} {"train_loss": -5.579564571380615, "global_step": 42241, "epoch": 1005} {"train_loss": -5.688551425933838, "global_step": 42242, "epoch": 1005} {"train_loss": -5.713580131530762, "global_step": 42243, "epoch": 1005} {"train_loss": -5.570916652679443, "global_step": 42244, "epoch": 1005} {"train_loss": -5.5725202560424805, "global_step": 42245, "epoch": 1005} {"train_loss": -5.806880474090576, "global_step": 42246, "epoch": 1005} {"train_loss": -5.625546455383301, "global_step": 42247, "epoch": 1005} {"train_loss": -5.765078544616699, "global_step": 42248, "epoch": 1005} {"train_loss": -5.706207275390625, "global_step": 42249, "epoch": 1005} {"train_loss": -5.639285087585449, "global_step": 42250, "epoch": 1005} {"train_loss": -5.648514384315128, "global_step": 42251, "epoch": 1005, "val_loss": 74179.3984375} {"train_loss": -5.642888069152832, "global_step": 42252, "epoch": 1006} {"train_loss": -5.685026168823242, "global_step": 42253, "epoch": 1006} {"train_loss": -5.583606719970703, "global_step": 42254, "epoch": 1006} {"train_loss": -5.794271945953369, "global_step": 42255, "epoch": 1006} {"train_loss": -5.542008399963379, "global_step": 42256, "epoch": 1006} {"train_loss": -5.651854991912842, "global_step": 42257, "epoch": 1006} {"train_loss": -5.669543743133545, "global_step": 42258, "epoch": 1006} {"train_loss": -5.6144304275512695, "global_step": 42259, "epoch": 1006} {"train_loss": -5.729910373687744, "global_step": 42260, "epoch": 1006} {"train_loss": -5.599019527435303, "global_step": 42261, "epoch": 1006} {"train_loss": -5.752344131469727, "global_step": 42262, "epoch": 1006} {"train_loss": -5.743774890899658, "global_step": 42263, "epoch": 1006} {"train_loss": -5.6047587394714355, "global_step": 42264, "epoch": 1006} {"train_loss": -5.644340515136719, "global_step": 42265, "epoch": 1006} {"train_loss": -5.6392388343811035, "global_step": 42266, "epoch": 1006} {"train_loss": -5.641483306884766, "global_step": 42267, "epoch": 1006} {"train_loss": -5.619466781616211, "global_step": 42268, "epoch": 1006} {"train_loss": -5.68836784362793, "global_step": 42269, "epoch": 1006} {"train_loss": -5.512722969055176, "global_step": 42270, "epoch": 1006} {"train_loss": -5.617724418640137, "global_step": 42271, "epoch": 1006} {"train_loss": -5.666515827178955, "global_step": 42272, "epoch": 1006} {"train_loss": -5.534851551055908, "global_step": 42273, "epoch": 1006} {"train_loss": -5.7472686767578125, "global_step": 42274, "epoch": 1006} {"train_loss": -5.557858943939209, "global_step": 42275, "epoch": 1006} {"train_loss": -5.633933067321777, "global_step": 42276, "epoch": 1006} {"train_loss": -5.554023742675781, "global_step": 42277, "epoch": 1006} {"train_loss": -5.509757041931152, "global_step": 42278, "epoch": 1006} {"train_loss": -5.648298740386963, "global_step": 42279, "epoch": 1006} {"train_loss": -5.7022857666015625, "global_step": 42280, "epoch": 1006} {"train_loss": -5.371323585510254, "global_step": 42281, "epoch": 1006} {"train_loss": -5.629964351654053, "global_step": 42282, "epoch": 1006} {"train_loss": -5.376979827880859, "global_step": 42283, "epoch": 1006} {"train_loss": -5.614069938659668, "global_step": 42284, "epoch": 1006} {"train_loss": -5.643911361694336, "global_step": 42285, "epoch": 1006} {"train_loss": -5.7436113357543945, "global_step": 42286, "epoch": 1006} {"train_loss": -5.640169143676758, "global_step": 42287, "epoch": 1006} {"train_loss": -5.576430797576904, "global_step": 42288, "epoch": 1006} {"train_loss": -5.564355850219727, "global_step": 42289, "epoch": 1006} {"train_loss": -5.522183418273926, "global_step": 42290, "epoch": 1006} {"train_loss": -5.593764305114746, "global_step": 42291, "epoch": 1006} {"train_loss": -5.7584028244018555, "global_step": 42292, "epoch": 1006} {"train_loss": -5.622402304694766, "global_step": 42293, "epoch": 1006, "val_loss": 73950.0546875} {"train_loss": -5.758349418640137, "global_step": 42294, "epoch": 1007} {"train_loss": -5.539881229400635, "global_step": 42295, "epoch": 1007} {"train_loss": -5.637641429901123, "global_step": 42296, "epoch": 1007} {"train_loss": -5.664777755737305, "global_step": 42297, "epoch": 1007} {"train_loss": -5.678806304931641, "global_step": 42298, "epoch": 1007} {"train_loss": -5.689864158630371, "global_step": 42299, "epoch": 1007} {"train_loss": -5.5945143699646, "global_step": 42300, "epoch": 1007} {"train_loss": -5.607882499694824, "global_step": 42301, "epoch": 1007} {"train_loss": -5.597792148590088, "global_step": 42302, "epoch": 1007} {"train_loss": -5.711554050445557, "global_step": 42303, "epoch": 1007} {"train_loss": -5.599609851837158, "global_step": 42304, "epoch": 1007} {"train_loss": -5.688111782073975, "global_step": 42305, "epoch": 1007} {"train_loss": -5.757697582244873, "global_step": 42306, "epoch": 1007} {"train_loss": -5.670358180999756, "global_step": 42307, "epoch": 1007} {"train_loss": -5.742768287658691, "global_step": 42308, "epoch": 1007} {"train_loss": -5.541928291320801, "global_step": 42309, "epoch": 1007} {"train_loss": -5.623361587524414, "global_step": 42310, "epoch": 1007} {"train_loss": -5.557323455810547, "global_step": 42311, "epoch": 1007} {"train_loss": -5.572183609008789, "global_step": 42312, "epoch": 1007} {"train_loss": -5.546507835388184, "global_step": 42313, "epoch": 1007} {"train_loss": -5.630219459533691, "global_step": 42314, "epoch": 1007} {"train_loss": -5.592026710510254, "global_step": 42315, "epoch": 1007} {"train_loss": -5.6158833503723145, "global_step": 42316, "epoch": 1007} {"train_loss": -5.72349214553833, "global_step": 42317, "epoch": 1007} {"train_loss": -5.676201820373535, "global_step": 42318, "epoch": 1007} {"train_loss": -5.681198596954346, "global_step": 42319, "epoch": 1007} {"train_loss": -5.537215232849121, "global_step": 42320, "epoch": 1007} {"train_loss": -5.565530776977539, "global_step": 42321, "epoch": 1007} {"train_loss": -5.554528713226318, "global_step": 42322, "epoch": 1007} {"train_loss": -5.635365009307861, "global_step": 42323, "epoch": 1007} {"train_loss": -5.504459381103516, "global_step": 42324, "epoch": 1007} {"train_loss": -5.676112174987793, "global_step": 42325, "epoch": 1007} {"train_loss": -5.6735944747924805, "global_step": 42326, "epoch": 1007} {"train_loss": -5.562206268310547, "global_step": 42327, "epoch": 1007} {"train_loss": -5.6587934494018555, "global_step": 42328, "epoch": 1007} {"train_loss": -5.6172075271606445, "global_step": 42329, "epoch": 1007} {"train_loss": -5.56624698638916, "global_step": 42330, "epoch": 1007} {"train_loss": -5.690733909606934, "global_step": 42331, "epoch": 1007} {"train_loss": -5.741881370544434, "global_step": 42332, "epoch": 1007} {"train_loss": -5.670645713806152, "global_step": 42333, "epoch": 1007} {"train_loss": -5.647160530090332, "global_step": 42334, "epoch": 1007} {"train_loss": -5.634394112087431, "global_step": 42335, "epoch": 1007, "val_loss": 73723.1953125} {"train_loss": -5.587745666503906, "global_step": 42336, "epoch": 1008} {"train_loss": -5.635528087615967, "global_step": 42337, "epoch": 1008} {"train_loss": -5.716228008270264, "global_step": 42338, "epoch": 1008} {"train_loss": -5.562591075897217, "global_step": 42339, "epoch": 1008} {"train_loss": -5.580986022949219, "global_step": 42340, "epoch": 1008} {"train_loss": -5.772707939147949, "global_step": 42341, "epoch": 1008} {"train_loss": -5.527338981628418, "global_step": 42342, "epoch": 1008} {"train_loss": -5.579968452453613, "global_step": 42343, "epoch": 1008} {"train_loss": -5.60970401763916, "global_step": 42344, "epoch": 1008} {"train_loss": -5.673979759216309, "global_step": 42345, "epoch": 1008} {"train_loss": -5.636255741119385, "global_step": 42346, "epoch": 1008} {"train_loss": -5.6829423904418945, "global_step": 42347, "epoch": 1008} {"train_loss": -5.611285209655762, "global_step": 42348, "epoch": 1008} {"train_loss": -5.485720157623291, "global_step": 42349, "epoch": 1008} {"train_loss": -5.777961730957031, "global_step": 42350, "epoch": 1008} {"train_loss": -5.646343231201172, "global_step": 42351, "epoch": 1008} {"train_loss": -5.626957893371582, "global_step": 42352, "epoch": 1008} {"train_loss": -5.609416961669922, "global_step": 42353, "epoch": 1008} {"train_loss": -5.747280597686768, "global_step": 42354, "epoch": 1008} {"train_loss": -5.786285400390625, "global_step": 42355, "epoch": 1008} {"train_loss": -5.638796806335449, "global_step": 42356, "epoch": 1008} {"train_loss": -5.702543258666992, "global_step": 42357, "epoch": 1008} {"train_loss": -5.6584320068359375, "global_step": 42358, "epoch": 1008} {"train_loss": -5.690908432006836, "global_step": 42359, "epoch": 1008} {"train_loss": -5.51465368270874, "global_step": 42360, "epoch": 1008} {"train_loss": -5.61476469039917, "global_step": 42361, "epoch": 1008} {"train_loss": -5.733426094055176, "global_step": 42362, "epoch": 1008} {"train_loss": -5.710476875305176, "global_step": 42363, "epoch": 1008} {"train_loss": -5.673433303833008, "global_step": 42364, "epoch": 1008} {"train_loss": -5.668404579162598, "global_step": 42365, "epoch": 1008} {"train_loss": -5.652415752410889, "global_step": 42366, "epoch": 1008} {"train_loss": -5.68210506439209, "global_step": 42367, "epoch": 1008} {"train_loss": -5.651234149932861, "global_step": 42368, "epoch": 1008} {"train_loss": -5.558472633361816, "global_step": 42369, "epoch": 1008} {"train_loss": -5.6788649559021, "global_step": 42370, "epoch": 1008} {"train_loss": -5.519157886505127, "global_step": 42371, "epoch": 1008} {"train_loss": -5.625412940979004, "global_step": 42372, "epoch": 1008} {"train_loss": -5.453439712524414, "global_step": 42373, "epoch": 1008} {"train_loss": -5.7841105461120605, "global_step": 42374, "epoch": 1008} {"train_loss": -5.6986083984375, "global_step": 42375, "epoch": 1008} {"train_loss": -5.566763877868652, "global_step": 42376, "epoch": 1008} {"train_loss": -5.644476595379057, "global_step": 42377, "epoch": 1008, "val_loss": 73680.3515625} {"train_loss": -5.670120716094971, "global_step": 42378, "epoch": 1009} {"train_loss": -5.611303329467773, "global_step": 42379, "epoch": 1009} {"train_loss": -5.699310779571533, "global_step": 42380, "epoch": 1009} {"train_loss": -5.610912322998047, "global_step": 42381, "epoch": 1009} {"train_loss": -5.758221626281738, "global_step": 42382, "epoch": 1009} {"train_loss": -5.738040924072266, "global_step": 42383, "epoch": 1009} {"train_loss": -5.74771785736084, "global_step": 42384, "epoch": 1009} {"train_loss": -5.631005764007568, "global_step": 42385, "epoch": 1009} {"train_loss": -5.7108659744262695, "global_step": 42386, "epoch": 1009} {"train_loss": -5.688641548156738, "global_step": 42387, "epoch": 1009} {"train_loss": -5.736071586608887, "global_step": 42388, "epoch": 1009} {"train_loss": -5.604870796203613, "global_step": 42389, "epoch": 1009} {"train_loss": -5.622046947479248, "global_step": 42390, "epoch": 1009} {"train_loss": -5.770122051239014, "global_step": 42391, "epoch": 1009} {"train_loss": -5.697078704833984, "global_step": 42392, "epoch": 1009} {"train_loss": -5.732649803161621, "global_step": 42393, "epoch": 1009} {"train_loss": -5.675256729125977, "global_step": 42394, "epoch": 1009} {"train_loss": -5.650284767150879, "global_step": 42395, "epoch": 1009} {"train_loss": -5.617217063903809, "global_step": 42396, "epoch": 1009} {"train_loss": -5.697028160095215, "global_step": 42397, "epoch": 1009} {"train_loss": -5.70682430267334, "global_step": 42398, "epoch": 1009} {"train_loss": -5.59101676940918, "global_step": 42399, "epoch": 1009} {"train_loss": -5.563263893127441, "global_step": 42400, "epoch": 1009} {"train_loss": -5.727793216705322, "global_step": 42401, "epoch": 1009} {"train_loss": -5.748198509216309, "global_step": 42402, "epoch": 1009} {"train_loss": -5.696694374084473, "global_step": 42403, "epoch": 1009} {"train_loss": -5.640477180480957, "global_step": 42404, "epoch": 1009} {"train_loss": -5.647559642791748, "global_step": 42405, "epoch": 1009} {"train_loss": -5.558685302734375, "global_step": 42406, "epoch": 1009} {"train_loss": -5.713838577270508, "global_step": 42407, "epoch": 1009} {"train_loss": -5.658307075500488, "global_step": 42408, "epoch": 1009} {"train_loss": -5.666335105895996, "global_step": 42409, "epoch": 1009} {"train_loss": -5.738777160644531, "global_step": 42410, "epoch": 1009} {"train_loss": -5.564452648162842, "global_step": 42411, "epoch": 1009} {"train_loss": -5.546990394592285, "global_step": 42412, "epoch": 1009} {"train_loss": -5.6522216796875, "global_step": 42413, "epoch": 1009} {"train_loss": -5.570042610168457, "global_step": 42414, "epoch": 1009} {"train_loss": -5.717160224914551, "global_step": 42415, "epoch": 1009} {"train_loss": -5.715014934539795, "global_step": 42416, "epoch": 1009} {"train_loss": -5.684168815612793, "global_step": 42417, "epoch": 1009} {"train_loss": -5.659375190734863, "global_step": 42418, "epoch": 1009} {"train_loss": -5.6690958340962725, "global_step": 42419, "epoch": 1009, "val_loss": 74496.8828125} {"train_loss": -5.546645164489746, "global_step": 42420, "epoch": 1010} {"train_loss": -5.629931449890137, "global_step": 42421, "epoch": 1010} {"train_loss": -5.651893615722656, "global_step": 42422, "epoch": 1010} {"train_loss": -5.787052631378174, "global_step": 42423, "epoch": 1010} {"train_loss": -5.724287986755371, "global_step": 42424, "epoch": 1010} {"train_loss": -5.662210464477539, "global_step": 42425, "epoch": 1010} {"train_loss": -5.674428939819336, "global_step": 42426, "epoch": 1010} {"train_loss": -5.621272087097168, "global_step": 42427, "epoch": 1010} {"train_loss": -5.62806510925293, "global_step": 42428, "epoch": 1010} {"train_loss": -5.602737903594971, "global_step": 42429, "epoch": 1010} {"train_loss": -5.767942428588867, "global_step": 42430, "epoch": 1010} {"train_loss": -5.713430404663086, "global_step": 42431, "epoch": 1010} {"train_loss": -5.737851142883301, "global_step": 42432, "epoch": 1010} {"train_loss": -5.756960868835449, "global_step": 42433, "epoch": 1010} {"train_loss": -5.609189987182617, "global_step": 42434, "epoch": 1010} {"train_loss": -5.750132083892822, "global_step": 42435, "epoch": 1010} {"train_loss": -5.777172088623047, "global_step": 42436, "epoch": 1010} {"train_loss": -5.678321361541748, "global_step": 42437, "epoch": 1010} {"train_loss": -5.723860740661621, "global_step": 42438, "epoch": 1010} {"train_loss": -5.843211650848389, "global_step": 42439, "epoch": 1010} {"train_loss": -5.6041717529296875, "global_step": 42440, "epoch": 1010} {"train_loss": -5.686176300048828, "global_step": 42441, "epoch": 1010} {"train_loss": -5.754171848297119, "global_step": 42442, "epoch": 1010} {"train_loss": -5.6992082595825195, "global_step": 42443, "epoch": 1010} {"train_loss": -5.683141708374023, "global_step": 42444, "epoch": 1010} {"train_loss": -5.690044403076172, "global_step": 42445, "epoch": 1010} {"train_loss": -5.53072452545166, "global_step": 42446, "epoch": 1010} {"train_loss": -5.7284698486328125, "global_step": 42447, "epoch": 1010} {"train_loss": -5.783008098602295, "global_step": 42448, "epoch": 1010} {"train_loss": -5.593951225280762, "global_step": 42449, "epoch": 1010} {"train_loss": -5.6665449142456055, "global_step": 42450, "epoch": 1010} {"train_loss": -5.621469497680664, "global_step": 42451, "epoch": 1010} {"train_loss": -5.654789924621582, "global_step": 42452, "epoch": 1010} {"train_loss": -5.745832443237305, "global_step": 42453, "epoch": 1010} {"train_loss": -5.671689033508301, "global_step": 42454, "epoch": 1010} {"train_loss": -5.611379623413086, "global_step": 42455, "epoch": 1010} {"train_loss": -5.677981376647949, "global_step": 42456, "epoch": 1010} {"train_loss": -5.7489914894104, "global_step": 42457, "epoch": 1010} {"train_loss": -5.6410017013549805, "global_step": 42458, "epoch": 1010} {"train_loss": -5.56312370300293, "global_step": 42459, "epoch": 1010} {"train_loss": -5.639154434204102, "global_step": 42460, "epoch": 1010} {"train_loss": -5.680810088203067, "global_step": 42461, "epoch": 1010, "val_loss": 73715.9140625} {"train_loss": -5.654740333557129, "global_step": 42462, "epoch": 1011} {"train_loss": -5.585814952850342, "global_step": 42463, "epoch": 1011} {"train_loss": -5.562972545623779, "global_step": 42464, "epoch": 1011} {"train_loss": -5.754701614379883, "global_step": 42465, "epoch": 1011} {"train_loss": -5.685153484344482, "global_step": 42466, "epoch": 1011} {"train_loss": -5.676670074462891, "global_step": 42467, "epoch": 1011} {"train_loss": -5.750048637390137, "global_step": 42468, "epoch": 1011} {"train_loss": -5.630245208740234, "global_step": 42469, "epoch": 1011} {"train_loss": -5.5606231689453125, "global_step": 42470, "epoch": 1011} {"train_loss": -5.668155670166016, "global_step": 42471, "epoch": 1011} {"train_loss": -5.733311653137207, "global_step": 42472, "epoch": 1011} {"train_loss": -5.631874084472656, "global_step": 42473, "epoch": 1011} {"train_loss": -5.885937213897705, "global_step": 42474, "epoch": 1011} {"train_loss": -5.70244836807251, "global_step": 42475, "epoch": 1011} {"train_loss": -5.7923583984375, "global_step": 42476, "epoch": 1011} {"train_loss": -5.699756145477295, "global_step": 42477, "epoch": 1011} {"train_loss": -5.677298545837402, "global_step": 42478, "epoch": 1011} {"train_loss": -5.619982719421387, "global_step": 42479, "epoch": 1011} {"train_loss": -5.695947647094727, "global_step": 42480, "epoch": 1011} {"train_loss": -5.565982341766357, "global_step": 42481, "epoch": 1011} {"train_loss": -5.636874198913574, "global_step": 42482, "epoch": 1011} {"train_loss": -5.6422576904296875, "global_step": 42483, "epoch": 1011} {"train_loss": -5.649420261383057, "global_step": 42484, "epoch": 1011} {"train_loss": -5.657106876373291, "global_step": 42485, "epoch": 1011} {"train_loss": -5.747698783874512, "global_step": 42486, "epoch": 1011} {"train_loss": -5.707159996032715, "global_step": 42487, "epoch": 1011} {"train_loss": -5.73184871673584, "global_step": 42488, "epoch": 1011} {"train_loss": -5.736551284790039, "global_step": 42489, "epoch": 1011} {"train_loss": -5.769550323486328, "global_step": 42490, "epoch": 1011} {"train_loss": -5.721574783325195, "global_step": 42491, "epoch": 1011} {"train_loss": -5.733664512634277, "global_step": 42492, "epoch": 1011} {"train_loss": -5.6654744148254395, "global_step": 42493, "epoch": 1011} {"train_loss": -5.782069683074951, "global_step": 42494, "epoch": 1011} {"train_loss": -5.579906940460205, "global_step": 42495, "epoch": 1011} {"train_loss": -5.615265846252441, "global_step": 42496, "epoch": 1011} {"train_loss": -5.677741527557373, "global_step": 42497, "epoch": 1011} {"train_loss": -5.648610591888428, "global_step": 42498, "epoch": 1011} {"train_loss": -5.648425579071045, "global_step": 42499, "epoch": 1011} {"train_loss": -5.755935192108154, "global_step": 42500, "epoch": 1011} {"train_loss": -5.67775821685791, "global_step": 42501, "epoch": 1011} {"train_loss": -5.753910064697266, "global_step": 42502, "epoch": 1011} {"train_loss": -5.686981133052281, "global_step": 42503, "epoch": 1011, "val_loss": 73707.1484375} {"train_loss": -5.621848106384277, "global_step": 42504, "epoch": 1012} {"train_loss": -5.716984272003174, "global_step": 42505, "epoch": 1012} {"train_loss": -5.589810371398926, "global_step": 42506, "epoch": 1012} {"train_loss": -5.76007080078125, "global_step": 42507, "epoch": 1012} {"train_loss": -5.584779739379883, "global_step": 42508, "epoch": 1012} {"train_loss": -5.62441349029541, "global_step": 42509, "epoch": 1012} {"train_loss": -5.724084854125977, "global_step": 42510, "epoch": 1012} {"train_loss": -5.651037216186523, "global_step": 42511, "epoch": 1012} {"train_loss": -5.614262580871582, "global_step": 42512, "epoch": 1012} {"train_loss": -5.805723190307617, "global_step": 42513, "epoch": 1012} {"train_loss": -5.770285606384277, "global_step": 42514, "epoch": 1012} {"train_loss": -5.757109642028809, "global_step": 42515, "epoch": 1012} {"train_loss": -5.651593208312988, "global_step": 42516, "epoch": 1012} {"train_loss": -5.73891544342041, "global_step": 42517, "epoch": 1012} {"train_loss": -5.722233772277832, "global_step": 42518, "epoch": 1012} {"train_loss": -5.702671051025391, "global_step": 42519, "epoch": 1012} {"train_loss": -5.735097885131836, "global_step": 42520, "epoch": 1012} {"train_loss": -5.822358131408691, "global_step": 42521, "epoch": 1012} {"train_loss": -5.7376508712768555, "global_step": 42522, "epoch": 1012} {"train_loss": -5.677136421203613, "global_step": 42523, "epoch": 1012} {"train_loss": -5.68022346496582, "global_step": 42524, "epoch": 1012} {"train_loss": -5.578866958618164, "global_step": 42525, "epoch": 1012} {"train_loss": -5.6386919021606445, "global_step": 42526, "epoch": 1012} {"train_loss": -5.688712120056152, "global_step": 42527, "epoch": 1012} {"train_loss": -5.73185920715332, "global_step": 42528, "epoch": 1012} {"train_loss": -5.5198822021484375, "global_step": 42529, "epoch": 1012} {"train_loss": -5.690035820007324, "global_step": 42530, "epoch": 1012} {"train_loss": -5.638523101806641, "global_step": 42531, "epoch": 1012} {"train_loss": -5.716194152832031, "global_step": 42532, "epoch": 1012} {"train_loss": -5.639126777648926, "global_step": 42533, "epoch": 1012} {"train_loss": -5.709206581115723, "global_step": 42534, "epoch": 1012} {"train_loss": -5.622804641723633, "global_step": 42535, "epoch": 1012} {"train_loss": -5.567732810974121, "global_step": 42536, "epoch": 1012} {"train_loss": -5.628468036651611, "global_step": 42537, "epoch": 1012} {"train_loss": -5.5772552490234375, "global_step": 42538, "epoch": 1012} {"train_loss": -5.532257556915283, "global_step": 42539, "epoch": 1012} {"train_loss": -5.644874572753906, "global_step": 42540, "epoch": 1012} {"train_loss": -5.645273685455322, "global_step": 42541, "epoch": 1012} {"train_loss": -5.513815402984619, "global_step": 42542, "epoch": 1012} {"train_loss": -5.582034111022949, "global_step": 42543, "epoch": 1012} {"train_loss": -5.562595367431641, "global_step": 42544, "epoch": 1012} {"train_loss": -5.659375145321801, "global_step": 42545, "epoch": 1012, "val_loss": 74385.2578125} {"train_loss": -5.386938095092773, "global_step": 42546, "epoch": 1013} {"train_loss": -5.694863319396973, "global_step": 42547, "epoch": 1013} {"train_loss": -5.627686500549316, "global_step": 42548, "epoch": 1013} {"train_loss": -5.598668098449707, "global_step": 42549, "epoch": 1013} {"train_loss": -5.695616722106934, "global_step": 42550, "epoch": 1013} {"train_loss": -5.659460067749023, "global_step": 42551, "epoch": 1013} {"train_loss": -5.639019012451172, "global_step": 42552, "epoch": 1013} {"train_loss": -5.57942008972168, "global_step": 42553, "epoch": 1013} {"train_loss": -5.569606781005859, "global_step": 42554, "epoch": 1013} {"train_loss": -5.695809364318848, "global_step": 42555, "epoch": 1013} {"train_loss": -5.6547160148620605, "global_step": 42556, "epoch": 1013} {"train_loss": -5.634591102600098, "global_step": 42557, "epoch": 1013} {"train_loss": -5.732907772064209, "global_step": 42558, "epoch": 1013} {"train_loss": -5.78355073928833, "global_step": 42559, "epoch": 1013} {"train_loss": -5.546929359436035, "global_step": 42560, "epoch": 1013} {"train_loss": -5.545021057128906, "global_step": 42561, "epoch": 1013} {"train_loss": -5.668830871582031, "global_step": 42562, "epoch": 1013} {"train_loss": -5.592006683349609, "global_step": 42563, "epoch": 1013} {"train_loss": -5.615102767944336, "global_step": 42564, "epoch": 1013} {"train_loss": -5.646984577178955, "global_step": 42565, "epoch": 1013} {"train_loss": -5.652959823608398, "global_step": 42566, "epoch": 1013} {"train_loss": -5.617264747619629, "global_step": 42567, "epoch": 1013} {"train_loss": -5.55197811126709, "global_step": 42568, "epoch": 1013} {"train_loss": -5.558971405029297, "global_step": 42569, "epoch": 1013} {"train_loss": -5.56035041809082, "global_step": 42570, "epoch": 1013} {"train_loss": -5.824866771697998, "global_step": 42571, "epoch": 1013} {"train_loss": -5.62531852722168, "global_step": 42572, "epoch": 1013} {"train_loss": -5.7605366706848145, "global_step": 42573, "epoch": 1013} {"train_loss": -5.839815139770508, "global_step": 42574, "epoch": 1013} {"train_loss": -5.743714809417725, "global_step": 42575, "epoch": 1013} {"train_loss": -5.751284599304199, "global_step": 42576, "epoch": 1013} {"train_loss": -5.672056198120117, "global_step": 42577, "epoch": 1013} {"train_loss": -5.603569984436035, "global_step": 42578, "epoch": 1013} {"train_loss": -5.699806213378906, "global_step": 42579, "epoch": 1013} {"train_loss": -5.711176872253418, "global_step": 42580, "epoch": 1013} {"train_loss": -5.753750801086426, "global_step": 42581, "epoch": 1013} {"train_loss": -5.738027095794678, "global_step": 42582, "epoch": 1013} {"train_loss": -5.653525352478027, "global_step": 42583, "epoch": 1013} {"train_loss": -5.660038948059082, "global_step": 42584, "epoch": 1013} {"train_loss": -5.616413593292236, "global_step": 42585, "epoch": 1013} {"train_loss": -5.781038761138916, "global_step": 42586, "epoch": 1013} {"train_loss": -5.659013180505662, "global_step": 42587, "epoch": 1013, "val_loss": 73565.484375} {"train_loss": -5.770347595214844, "global_step": 42588, "epoch": 1014} {"train_loss": -5.520514488220215, "global_step": 42589, "epoch": 1014} {"train_loss": -5.62446403503418, "global_step": 42590, "epoch": 1014} {"train_loss": -5.548781871795654, "global_step": 42591, "epoch": 1014} {"train_loss": -5.5738301277160645, "global_step": 42592, "epoch": 1014} {"train_loss": -5.624856948852539, "global_step": 42593, "epoch": 1014} {"train_loss": -5.812725067138672, "global_step": 42594, "epoch": 1014} {"train_loss": -5.678491592407227, "global_step": 42595, "epoch": 1014} {"train_loss": -5.57027530670166, "global_step": 42596, "epoch": 1014} {"train_loss": -5.815027236938477, "global_step": 42597, "epoch": 1014} {"train_loss": -5.712924003601074, "global_step": 42598, "epoch": 1014} {"train_loss": -5.67488956451416, "global_step": 42599, "epoch": 1014} {"train_loss": -5.662970542907715, "global_step": 42600, "epoch": 1014} {"train_loss": -5.7328596115112305, "global_step": 42601, "epoch": 1014} {"train_loss": -5.617705345153809, "global_step": 42602, "epoch": 1014} {"train_loss": -5.803749084472656, "global_step": 42603, "epoch": 1014} {"train_loss": -5.669623851776123, "global_step": 42604, "epoch": 1014} {"train_loss": -5.7639265060424805, "global_step": 42605, "epoch": 1014} {"train_loss": -5.693368911743164, "global_step": 42606, "epoch": 1014} {"train_loss": -5.61581563949585, "global_step": 42607, "epoch": 1014} {"train_loss": -5.722872257232666, "global_step": 42608, "epoch": 1014} {"train_loss": -5.729057312011719, "global_step": 42609, "epoch": 1014} {"train_loss": -5.677987098693848, "global_step": 42610, "epoch": 1014} {"train_loss": -5.676949501037598, "global_step": 42611, "epoch": 1014} {"train_loss": -5.666759490966797, "global_step": 42612, "epoch": 1014} {"train_loss": -5.654509544372559, "global_step": 42613, "epoch": 1014} {"train_loss": -5.758672714233398, "global_step": 42614, "epoch": 1014} {"train_loss": -5.652187824249268, "global_step": 42615, "epoch": 1014} {"train_loss": -5.721395492553711, "global_step": 42616, "epoch": 1014} {"train_loss": -5.60166072845459, "global_step": 42617, "epoch": 1014} {"train_loss": -5.643945693969727, "global_step": 42618, "epoch": 1014} {"train_loss": -5.6960859298706055, "global_step": 42619, "epoch": 1014} {"train_loss": -5.568519592285156, "global_step": 42620, "epoch": 1014} {"train_loss": -5.708314895629883, "global_step": 42621, "epoch": 1014} {"train_loss": -5.6282830238342285, "global_step": 42622, "epoch": 1014} {"train_loss": -5.687069892883301, "global_step": 42623, "epoch": 1014} {"train_loss": -5.747061729431152, "global_step": 42624, "epoch": 1014} {"train_loss": -5.628086566925049, "global_step": 42625, "epoch": 1014} {"train_loss": -5.707103729248047, "global_step": 42626, "epoch": 1014} {"train_loss": -5.730035781860352, "global_step": 42627, "epoch": 1014} {"train_loss": -5.677060604095459, "global_step": 42628, "epoch": 1014} {"train_loss": -5.676949183146159, "global_step": 42629, "epoch": 1014, "val_loss": 74162.9296875} {"train_loss": -5.660417556762695, "global_step": 42630, "epoch": 1015} {"train_loss": -5.75834321975708, "global_step": 42631, "epoch": 1015} {"train_loss": -5.634100914001465, "global_step": 42632, "epoch": 1015} {"train_loss": -5.750683784484863, "global_step": 42633, "epoch": 1015} {"train_loss": -5.667071342468262, "global_step": 42634, "epoch": 1015} {"train_loss": -5.643251419067383, "global_step": 42635, "epoch": 1015} {"train_loss": -5.637185573577881, "global_step": 42636, "epoch": 1015} {"train_loss": -5.603950500488281, "global_step": 42637, "epoch": 1015} {"train_loss": -5.614962577819824, "global_step": 42638, "epoch": 1015} {"train_loss": -5.618427753448486, "global_step": 42639, "epoch": 1015} {"train_loss": -5.705777168273926, "global_step": 42640, "epoch": 1015} {"train_loss": -5.50814151763916, "global_step": 42641, "epoch": 1015} {"train_loss": -5.704631805419922, "global_step": 42642, "epoch": 1015} {"train_loss": -5.504368782043457, "global_step": 42643, "epoch": 1015} {"train_loss": -5.585984230041504, "global_step": 42644, "epoch": 1015} {"train_loss": -5.66597843170166, "global_step": 42645, "epoch": 1015} {"train_loss": -5.721715450286865, "global_step": 42646, "epoch": 1015} {"train_loss": -5.617803573608398, "global_step": 42647, "epoch": 1015} {"train_loss": -5.6536970138549805, "global_step": 42648, "epoch": 1015} {"train_loss": -5.50554084777832, "global_step": 42649, "epoch": 1015} {"train_loss": -5.73280668258667, "global_step": 42650, "epoch": 1015} {"train_loss": -5.715471267700195, "global_step": 42651, "epoch": 1015} {"train_loss": -5.5623321533203125, "global_step": 42652, "epoch": 1015} {"train_loss": -5.618204116821289, "global_step": 42653, "epoch": 1015} {"train_loss": -5.607054710388184, "global_step": 42654, "epoch": 1015} {"train_loss": -5.423286437988281, "global_step": 42655, "epoch": 1015} {"train_loss": -5.6110334396362305, "global_step": 42656, "epoch": 1015} {"train_loss": -5.567839622497559, "global_step": 42657, "epoch": 1015} {"train_loss": -5.652707099914551, "global_step": 42658, "epoch": 1015} {"train_loss": -5.56643533706665, "global_step": 42659, "epoch": 1015} {"train_loss": -5.527035713195801, "global_step": 42660, "epoch": 1015} {"train_loss": -5.595730304718018, "global_step": 42661, "epoch": 1015} {"train_loss": -5.528192043304443, "global_step": 42662, "epoch": 1015} {"train_loss": -5.687857151031494, "global_step": 42663, "epoch": 1015} {"train_loss": -5.434543132781982, "global_step": 42664, "epoch": 1015} {"train_loss": -5.604773044586182, "global_step": 42665, "epoch": 1015} {"train_loss": -5.563533782958984, "global_step": 42666, "epoch": 1015} {"train_loss": -5.620367527008057, "global_step": 42667, "epoch": 1015} {"train_loss": -5.67177677154541, "global_step": 42668, "epoch": 1015} {"train_loss": -5.666885852813721, "global_step": 42669, "epoch": 1015} {"train_loss": -5.6326704025268555, "global_step": 42670, "epoch": 1015} {"train_loss": -5.6201443785712835, "global_step": 42671, "epoch": 1015, "val_loss": 73910.453125} {"train_loss": -5.55010986328125, "global_step": 42672, "epoch": 1016} {"train_loss": -5.630765914916992, "global_step": 42673, "epoch": 1016} {"train_loss": -5.638667106628418, "global_step": 42674, "epoch": 1016} {"train_loss": -5.6081953048706055, "global_step": 42675, "epoch": 1016} {"train_loss": -5.66208553314209, "global_step": 42676, "epoch": 1016} {"train_loss": -5.7488532066345215, "global_step": 42677, "epoch": 1016} {"train_loss": -5.722449779510498, "global_step": 42678, "epoch": 1016} {"train_loss": -5.726192951202393, "global_step": 42679, "epoch": 1016} {"train_loss": -5.641988754272461, "global_step": 42680, "epoch": 1016} {"train_loss": -5.6494832038879395, "global_step": 42681, "epoch": 1016} {"train_loss": -5.706806659698486, "global_step": 42682, "epoch": 1016} {"train_loss": -5.579432487487793, "global_step": 42683, "epoch": 1016} {"train_loss": -5.767119407653809, "global_step": 42684, "epoch": 1016} {"train_loss": -5.662374496459961, "global_step": 42685, "epoch": 1016} {"train_loss": -5.695905685424805, "global_step": 42686, "epoch": 1016} {"train_loss": -5.503170013427734, "global_step": 42687, "epoch": 1016} {"train_loss": -5.623025417327881, "global_step": 42688, "epoch": 1016} {"train_loss": -5.714061737060547, "global_step": 42689, "epoch": 1016} {"train_loss": -5.7189154624938965, "global_step": 42690, "epoch": 1016} {"train_loss": -5.643499374389648, "global_step": 42691, "epoch": 1016} {"train_loss": -5.70999813079834, "global_step": 42692, "epoch": 1016} {"train_loss": -5.6371169090271, "global_step": 42693, "epoch": 1016} {"train_loss": -5.59707498550415, "global_step": 42694, "epoch": 1016} {"train_loss": -5.584231853485107, "global_step": 42695, "epoch": 1016} {"train_loss": -5.70711612701416, "global_step": 42696, "epoch": 1016} {"train_loss": -5.798183917999268, "global_step": 42697, "epoch": 1016} {"train_loss": -5.524378299713135, "global_step": 42698, "epoch": 1016} {"train_loss": -5.791944980621338, "global_step": 42699, "epoch": 1016} {"train_loss": -5.691032886505127, "global_step": 42700, "epoch": 1016} {"train_loss": -5.62170934677124, "global_step": 42701, "epoch": 1016} {"train_loss": -5.643329620361328, "global_step": 42702, "epoch": 1016} {"train_loss": -5.604912757873535, "global_step": 42703, "epoch": 1016} {"train_loss": -5.684779644012451, "global_step": 42704, "epoch": 1016} {"train_loss": -5.648894309997559, "global_step": 42705, "epoch": 1016} {"train_loss": -5.740350723266602, "global_step": 42706, "epoch": 1016} {"train_loss": -5.633577346801758, "global_step": 42707, "epoch": 1016} {"train_loss": -5.677066802978516, "global_step": 42708, "epoch": 1016} {"train_loss": -5.7291059494018555, "global_step": 42709, "epoch": 1016} {"train_loss": -5.56754207611084, "global_step": 42710, "epoch": 1016} {"train_loss": -5.613911151885986, "global_step": 42711, "epoch": 1016} {"train_loss": -5.569308280944824, "global_step": 42712, "epoch": 1016} {"train_loss": -5.656158004488264, "global_step": 42713, "epoch": 1016, "val_loss": 74241.9921875} {"train_loss": -5.6724348068237305, "global_step": 42714, "epoch": 1017} {"train_loss": -5.4717183113098145, "global_step": 42715, "epoch": 1017} {"train_loss": -5.663368225097656, "global_step": 42716, "epoch": 1017} {"train_loss": -5.594932556152344, "global_step": 42717, "epoch": 1017} {"train_loss": -5.649497985839844, "global_step": 42718, "epoch": 1017} {"train_loss": -5.717526435852051, "global_step": 42719, "epoch": 1017} {"train_loss": -5.521903038024902, "global_step": 42720, "epoch": 1017} {"train_loss": -5.749881744384766, "global_step": 42721, "epoch": 1017} {"train_loss": -5.519587516784668, "global_step": 42722, "epoch": 1017} {"train_loss": -5.629518508911133, "global_step": 42723, "epoch": 1017} {"train_loss": -5.69816780090332, "global_step": 42724, "epoch": 1017} {"train_loss": -5.76816463470459, "global_step": 42725, "epoch": 1017} {"train_loss": -5.772505283355713, "global_step": 42726, "epoch": 1017} {"train_loss": -5.756025314331055, "global_step": 42727, "epoch": 1017} {"train_loss": -5.607797622680664, "global_step": 42728, "epoch": 1017} {"train_loss": -5.655735969543457, "global_step": 42729, "epoch": 1017} {"train_loss": -5.704814434051514, "global_step": 42730, "epoch": 1017} {"train_loss": -5.686468601226807, "global_step": 42731, "epoch": 1017} {"train_loss": -5.642691612243652, "global_step": 42732, "epoch": 1017} {"train_loss": -5.653566837310791, "global_step": 42733, "epoch": 1017} {"train_loss": -5.555872917175293, "global_step": 42734, "epoch": 1017} {"train_loss": -5.62187385559082, "global_step": 42735, "epoch": 1017} {"train_loss": -5.567048072814941, "global_step": 42736, "epoch": 1017} {"train_loss": -5.679960250854492, "global_step": 42737, "epoch": 1017} {"train_loss": -5.805769920349121, "global_step": 42738, "epoch": 1017} {"train_loss": -5.657582759857178, "global_step": 42739, "epoch": 1017} {"train_loss": -5.755504608154297, "global_step": 42740, "epoch": 1017} {"train_loss": -5.660384654998779, "global_step": 42741, "epoch": 1017} {"train_loss": -5.697431564331055, "global_step": 42742, "epoch": 1017} {"train_loss": -5.710253715515137, "global_step": 42743, "epoch": 1017} {"train_loss": -5.848296642303467, "global_step": 42744, "epoch": 1017} {"train_loss": -5.692409515380859, "global_step": 42745, "epoch": 1017} {"train_loss": -5.664526462554932, "global_step": 42746, "epoch": 1017} {"train_loss": -5.730018615722656, "global_step": 42747, "epoch": 1017} {"train_loss": -5.7419939041137695, "global_step": 42748, "epoch": 1017} {"train_loss": -5.653131484985352, "global_step": 42749, "epoch": 1017} {"train_loss": -5.717617988586426, "global_step": 42750, "epoch": 1017} {"train_loss": -5.630706787109375, "global_step": 42751, "epoch": 1017} {"train_loss": -5.612955570220947, "global_step": 42752, "epoch": 1017} {"train_loss": -5.549535751342773, "global_step": 42753, "epoch": 1017} {"train_loss": -5.577748775482178, "global_step": 42754, "epoch": 1017} {"train_loss": -5.6647026879446845, "global_step": 42755, "epoch": 1017, "val_loss": 73706.7578125} {"train_loss": -5.668186664581299, "global_step": 42756, "epoch": 1018} {"train_loss": -5.651285171508789, "global_step": 42757, "epoch": 1018} {"train_loss": -5.7091875076293945, "global_step": 42758, "epoch": 1018} {"train_loss": -5.665767669677734, "global_step": 42759, "epoch": 1018} {"train_loss": -5.598049163818359, "global_step": 42760, "epoch": 1018} {"train_loss": -5.569243431091309, "global_step": 42761, "epoch": 1018} {"train_loss": -5.756731986999512, "global_step": 42762, "epoch": 1018} {"train_loss": -5.6348371505737305, "global_step": 42763, "epoch": 1018} {"train_loss": -5.724481105804443, "global_step": 42764, "epoch": 1018} {"train_loss": -5.6942243576049805, "global_step": 42765, "epoch": 1018} {"train_loss": -5.558555603027344, "global_step": 42766, "epoch": 1018} {"train_loss": -5.7958083152771, "global_step": 42767, "epoch": 1018} {"train_loss": -5.6514739990234375, "global_step": 42768, "epoch": 1018} {"train_loss": -5.616629600524902, "global_step": 42769, "epoch": 1018} {"train_loss": -5.845385551452637, "global_step": 42770, "epoch": 1018} {"train_loss": -5.820831298828125, "global_step": 42771, "epoch": 1018} {"train_loss": -5.74581241607666, "global_step": 42772, "epoch": 1018} {"train_loss": -5.810502052307129, "global_step": 42773, "epoch": 1018} {"train_loss": -5.634760856628418, "global_step": 42774, "epoch": 1018} {"train_loss": -5.697298526763916, "global_step": 42775, "epoch": 1018} {"train_loss": -5.583675384521484, "global_step": 42776, "epoch": 1018} {"train_loss": -5.649139404296875, "global_step": 42777, "epoch": 1018} {"train_loss": -5.643875598907471, "global_step": 42778, "epoch": 1018} {"train_loss": -5.70815372467041, "global_step": 42779, "epoch": 1018} {"train_loss": -5.663514137268066, "global_step": 42780, "epoch": 1018} {"train_loss": -5.7546706199646, "global_step": 42781, "epoch": 1018} {"train_loss": -5.6062822341918945, "global_step": 42782, "epoch": 1018} {"train_loss": -5.676135540008545, "global_step": 42783, "epoch": 1018} {"train_loss": -5.627408027648926, "global_step": 42784, "epoch": 1018} {"train_loss": -5.743346691131592, "global_step": 42785, "epoch": 1018} {"train_loss": -5.601632118225098, "global_step": 42786, "epoch": 1018} {"train_loss": -5.726572036743164, "global_step": 42787, "epoch": 1018} {"train_loss": -5.734549045562744, "global_step": 42788, "epoch": 1018} {"train_loss": -5.5774312019348145, "global_step": 42789, "epoch": 1018} {"train_loss": -5.641420364379883, "global_step": 42790, "epoch": 1018} {"train_loss": -5.756988525390625, "global_step": 42791, "epoch": 1018} {"train_loss": -5.428117275238037, "global_step": 42792, "epoch": 1018} {"train_loss": -5.646241188049316, "global_step": 42793, "epoch": 1018} {"train_loss": -5.496784210205078, "global_step": 42794, "epoch": 1018} {"train_loss": -5.577804088592529, "global_step": 42795, "epoch": 1018} {"train_loss": -5.614482879638672, "global_step": 42796, "epoch": 1018} {"train_loss": -5.66230186961946, "global_step": 42797, "epoch": 1018, "val_loss": 74334.234375} {"train_loss": -5.520504951477051, "global_step": 42798, "epoch": 1019} {"train_loss": -5.6870598793029785, "global_step": 42799, "epoch": 1019} {"train_loss": -5.637174606323242, "global_step": 42800, "epoch": 1019} {"train_loss": -5.705818176269531, "global_step": 42801, "epoch": 1019} {"train_loss": -5.533135414123535, "global_step": 42802, "epoch": 1019} {"train_loss": -5.725574493408203, "global_step": 42803, "epoch": 1019} {"train_loss": -5.485695838928223, "global_step": 42804, "epoch": 1019} {"train_loss": -5.546449184417725, "global_step": 42805, "epoch": 1019} {"train_loss": -5.593292713165283, "global_step": 42806, "epoch": 1019} {"train_loss": -5.5518598556518555, "global_step": 42807, "epoch": 1019} {"train_loss": -5.554872512817383, "global_step": 42808, "epoch": 1019} {"train_loss": -5.636288642883301, "global_step": 42809, "epoch": 1019} {"train_loss": -5.6547040939331055, "global_step": 42810, "epoch": 1019} {"train_loss": -5.683584213256836, "global_step": 42811, "epoch": 1019} {"train_loss": -5.703559875488281, "global_step": 42812, "epoch": 1019} {"train_loss": -5.637395858764648, "global_step": 42813, "epoch": 1019} {"train_loss": -5.71082878112793, "global_step": 42814, "epoch": 1019} {"train_loss": -5.662977695465088, "global_step": 42815, "epoch": 1019} {"train_loss": -5.621973037719727, "global_step": 42816, "epoch": 1019} {"train_loss": -5.71945858001709, "global_step": 42817, "epoch": 1019} {"train_loss": -5.63623571395874, "global_step": 42818, "epoch": 1019} {"train_loss": -5.693274021148682, "global_step": 42819, "epoch": 1019} {"train_loss": -5.640946388244629, "global_step": 42820, "epoch": 1019} {"train_loss": -5.675817489624023, "global_step": 42821, "epoch": 1019} {"train_loss": -5.760236740112305, "global_step": 42822, "epoch": 1019} {"train_loss": -5.794615745544434, "global_step": 42823, "epoch": 1019} {"train_loss": -5.640139102935791, "global_step": 42824, "epoch": 1019} {"train_loss": -5.63245964050293, "global_step": 42825, "epoch": 1019} {"train_loss": -5.596964359283447, "global_step": 42826, "epoch": 1019} {"train_loss": -5.614226341247559, "global_step": 42827, "epoch": 1019} {"train_loss": -5.610930442810059, "global_step": 42828, "epoch": 1019} {"train_loss": -5.695710182189941, "global_step": 42829, "epoch": 1019} {"train_loss": -5.706186294555664, "global_step": 42830, "epoch": 1019} {"train_loss": -5.725058555603027, "global_step": 42831, "epoch": 1019} {"train_loss": -5.661747932434082, "global_step": 42832, "epoch": 1019} {"train_loss": -5.713614463806152, "global_step": 42833, "epoch": 1019} {"train_loss": -5.622829914093018, "global_step": 42834, "epoch": 1019} {"train_loss": -5.670865535736084, "global_step": 42835, "epoch": 1019} {"train_loss": -5.713117599487305, "global_step": 42836, "epoch": 1019} {"train_loss": -5.631529808044434, "global_step": 42837, "epoch": 1019} {"train_loss": -5.620593070983887, "global_step": 42838, "epoch": 1019} {"train_loss": -5.647575526010423, "global_step": 42839, "epoch": 1019, "val_loss": 73680.03125} {"train_loss": -5.667403221130371, "global_step": 42840, "epoch": 1020} {"train_loss": -5.687069416046143, "global_step": 42841, "epoch": 1020} {"train_loss": -5.645265102386475, "global_step": 42842, "epoch": 1020} {"train_loss": -5.599468231201172, "global_step": 42843, "epoch": 1020} {"train_loss": -5.669163703918457, "global_step": 42844, "epoch": 1020} {"train_loss": -5.722705841064453, "global_step": 42845, "epoch": 1020} {"train_loss": -5.669630527496338, "global_step": 42846, "epoch": 1020} {"train_loss": -5.789737701416016, "global_step": 42847, "epoch": 1020} {"train_loss": -5.684509754180908, "global_step": 42848, "epoch": 1020} {"train_loss": -5.586355209350586, "global_step": 42849, "epoch": 1020} {"train_loss": -5.585206985473633, "global_step": 42850, "epoch": 1020} {"train_loss": -5.708649158477783, "global_step": 42851, "epoch": 1020} {"train_loss": -5.771549224853516, "global_step": 42852, "epoch": 1020} {"train_loss": -5.797853469848633, "global_step": 42853, "epoch": 1020} {"train_loss": -5.718643665313721, "global_step": 42854, "epoch": 1020} {"train_loss": -5.702317237854004, "global_step": 42855, "epoch": 1020} {"train_loss": -5.762596130371094, "global_step": 42856, "epoch": 1020} {"train_loss": -5.6410112380981445, "global_step": 42857, "epoch": 1020} {"train_loss": -5.620159149169922, "global_step": 42858, "epoch": 1020} {"train_loss": -5.6378493309021, "global_step": 42859, "epoch": 1020} {"train_loss": -5.5842132568359375, "global_step": 42860, "epoch": 1020} {"train_loss": -5.7057037353515625, "global_step": 42861, "epoch": 1020} {"train_loss": -5.599884986877441, "global_step": 42862, "epoch": 1020} {"train_loss": -5.710206031799316, "global_step": 42863, "epoch": 1020} {"train_loss": -5.689607620239258, "global_step": 42864, "epoch": 1020} {"train_loss": -5.654439926147461, "global_step": 42865, "epoch": 1020} {"train_loss": -5.718375205993652, "global_step": 42866, "epoch": 1020} {"train_loss": -5.65339469909668, "global_step": 42867, "epoch": 1020} {"train_loss": -5.615715026855469, "global_step": 42868, "epoch": 1020} {"train_loss": -5.624882698059082, "global_step": 42869, "epoch": 1020} {"train_loss": -5.5622992515563965, "global_step": 42870, "epoch": 1020} {"train_loss": -5.729540824890137, "global_step": 42871, "epoch": 1020} {"train_loss": -5.608449459075928, "global_step": 42872, "epoch": 1020} {"train_loss": -5.693632125854492, "global_step": 42873, "epoch": 1020} {"train_loss": -5.6371612548828125, "global_step": 42874, "epoch": 1020} {"train_loss": -5.7020263671875, "global_step": 42875, "epoch": 1020} {"train_loss": -5.708822250366211, "global_step": 42876, "epoch": 1020} {"train_loss": -5.626702308654785, "global_step": 42877, "epoch": 1020} {"train_loss": -5.625157356262207, "global_step": 42878, "epoch": 1020} {"train_loss": -5.65303897857666, "global_step": 42879, "epoch": 1020} {"train_loss": -5.560332775115967, "global_step": 42880, "epoch": 1020} {"train_loss": -5.669699044454665, "global_step": 42881, "epoch": 1020, "val_loss": 74312.6953125} {"train_loss": -5.533586025238037, "global_step": 42882, "epoch": 1021} {"train_loss": -5.685250282287598, "global_step": 42883, "epoch": 1021} {"train_loss": -5.544044494628906, "global_step": 42884, "epoch": 1021} {"train_loss": -5.615089416503906, "global_step": 42885, "epoch": 1021} {"train_loss": -5.61735725402832, "global_step": 42886, "epoch": 1021} {"train_loss": -5.603930473327637, "global_step": 42887, "epoch": 1021} {"train_loss": -5.689146041870117, "global_step": 42888, "epoch": 1021} {"train_loss": -5.607250690460205, "global_step": 42889, "epoch": 1021} {"train_loss": -5.656310558319092, "global_step": 42890, "epoch": 1021} {"train_loss": -5.611513137817383, "global_step": 42891, "epoch": 1021} {"train_loss": -5.6074724197387695, "global_step": 42892, "epoch": 1021} {"train_loss": -5.6695637702941895, "global_step": 42893, "epoch": 1021} {"train_loss": -5.612673759460449, "global_step": 42894, "epoch": 1021} {"train_loss": -5.642175674438477, "global_step": 42895, "epoch": 1021} {"train_loss": -5.560891628265381, "global_step": 42896, "epoch": 1021} {"train_loss": -5.600118637084961, "global_step": 42897, "epoch": 1021} {"train_loss": -5.579591274261475, "global_step": 42898, "epoch": 1021} {"train_loss": -5.626808166503906, "global_step": 42899, "epoch": 1021} {"train_loss": -5.593935489654541, "global_step": 42900, "epoch": 1021} {"train_loss": -5.670672416687012, "global_step": 42901, "epoch": 1021} {"train_loss": -5.680704593658447, "global_step": 42902, "epoch": 1021} {"train_loss": -5.634711742401123, "global_step": 42903, "epoch": 1021} {"train_loss": -5.6389570236206055, "global_step": 42904, "epoch": 1021} {"train_loss": -5.693844795227051, "global_step": 42905, "epoch": 1021} {"train_loss": -5.660271644592285, "global_step": 42906, "epoch": 1021} {"train_loss": -5.673617839813232, "global_step": 42907, "epoch": 1021} {"train_loss": -5.77928352355957, "global_step": 42908, "epoch": 1021} {"train_loss": -5.63554573059082, "global_step": 42909, "epoch": 1021} {"train_loss": -5.697548866271973, "global_step": 42910, "epoch": 1021} {"train_loss": -5.673378944396973, "global_step": 42911, "epoch": 1021} {"train_loss": -5.707191467285156, "global_step": 42912, "epoch": 1021} {"train_loss": -5.697193145751953, "global_step": 42913, "epoch": 1021} {"train_loss": -5.691227436065674, "global_step": 42914, "epoch": 1021} {"train_loss": -5.6546173095703125, "global_step": 42915, "epoch": 1021} {"train_loss": -5.774447441101074, "global_step": 42916, "epoch": 1021} {"train_loss": -5.738770008087158, "global_step": 42917, "epoch": 1021} {"train_loss": -5.72659158706665, "global_step": 42918, "epoch": 1021} {"train_loss": -5.6330766677856445, "global_step": 42919, "epoch": 1021} {"train_loss": -5.7343034744262695, "global_step": 42920, "epoch": 1021} {"train_loss": -5.778964042663574, "global_step": 42921, "epoch": 1021} {"train_loss": -5.521416664123535, "global_step": 42922, "epoch": 1021} {"train_loss": -5.6546503475734164, "global_step": 42923, "epoch": 1021, "val_loss": 73505.1953125} {"train_loss": -5.669078826904297, "global_step": 42924, "epoch": 1022} {"train_loss": -5.647392272949219, "global_step": 42925, "epoch": 1022} {"train_loss": -5.616885185241699, "global_step": 42926, "epoch": 1022} {"train_loss": -5.624096393585205, "global_step": 42927, "epoch": 1022} {"train_loss": -5.633240699768066, "global_step": 42928, "epoch": 1022} {"train_loss": -5.739686965942383, "global_step": 42929, "epoch": 1022} {"train_loss": -5.781342506408691, "global_step": 42930, "epoch": 1022} {"train_loss": -5.576169967651367, "global_step": 42931, "epoch": 1022} {"train_loss": -5.716989517211914, "global_step": 42932, "epoch": 1022} {"train_loss": -5.784614562988281, "global_step": 42933, "epoch": 1022} {"train_loss": -5.581600666046143, "global_step": 42934, "epoch": 1022} {"train_loss": -5.8260955810546875, "global_step": 42935, "epoch": 1022} {"train_loss": -5.8466901779174805, "global_step": 42936, "epoch": 1022} {"train_loss": -5.636905193328857, "global_step": 42937, "epoch": 1022} {"train_loss": -5.579108238220215, "global_step": 42938, "epoch": 1022} {"train_loss": -5.7478742599487305, "global_step": 42939, "epoch": 1022} {"train_loss": -5.709938049316406, "global_step": 42940, "epoch": 1022} {"train_loss": -5.717985153198242, "global_step": 42941, "epoch": 1022} {"train_loss": -5.775402069091797, "global_step": 42942, "epoch": 1022} {"train_loss": -5.616580963134766, "global_step": 42943, "epoch": 1022} {"train_loss": -5.56234884262085, "global_step": 42944, "epoch": 1022} {"train_loss": -5.859615325927734, "global_step": 42945, "epoch": 1022} {"train_loss": -5.658463954925537, "global_step": 42946, "epoch": 1022} {"train_loss": -5.6908063888549805, "global_step": 42947, "epoch": 1022} {"train_loss": -5.7025370597839355, "global_step": 42948, "epoch": 1022} {"train_loss": -5.739645481109619, "global_step": 42949, "epoch": 1022} {"train_loss": -5.52699089050293, "global_step": 42950, "epoch": 1022} {"train_loss": -5.649994850158691, "global_step": 42951, "epoch": 1022} {"train_loss": -5.658835411071777, "global_step": 42952, "epoch": 1022} {"train_loss": -5.665131568908691, "global_step": 42953, "epoch": 1022} {"train_loss": -5.798987865447998, "global_step": 42954, "epoch": 1022} {"train_loss": -5.5179009437561035, "global_step": 42955, "epoch": 1022} {"train_loss": -5.72951078414917, "global_step": 42956, "epoch": 1022} {"train_loss": -5.81899356842041, "global_step": 42957, "epoch": 1022} {"train_loss": -5.471743583679199, "global_step": 42958, "epoch": 1022} {"train_loss": -5.620683193206787, "global_step": 42959, "epoch": 1022} {"train_loss": -5.642890930175781, "global_step": 42960, "epoch": 1022} {"train_loss": -5.716134071350098, "global_step": 42961, "epoch": 1022} {"train_loss": -5.712530136108398, "global_step": 42962, "epoch": 1022} {"train_loss": -5.81553840637207, "global_step": 42963, "epoch": 1022} {"train_loss": -5.62000036239624, "global_step": 42964, "epoch": 1022} {"train_loss": -5.6786424318949384, "global_step": 42965, "epoch": 1022, "val_loss": 73872.5078125} {"train_loss": -5.7594475746154785, "global_step": 42966, "epoch": 1023} {"train_loss": -5.617615699768066, "global_step": 42967, "epoch": 1023} {"train_loss": -5.456623077392578, "global_step": 42968, "epoch": 1023} {"train_loss": -5.718947410583496, "global_step": 42969, "epoch": 1023} {"train_loss": -5.771479606628418, "global_step": 42970, "epoch": 1023} {"train_loss": -5.588488578796387, "global_step": 42971, "epoch": 1023} {"train_loss": -5.738768577575684, "global_step": 42972, "epoch": 1023} {"train_loss": -5.675403594970703, "global_step": 42973, "epoch": 1023} {"train_loss": -5.470272064208984, "global_step": 42974, "epoch": 1023} {"train_loss": -5.634735107421875, "global_step": 42975, "epoch": 1023} {"train_loss": -5.593920707702637, "global_step": 42976, "epoch": 1023} {"train_loss": -5.5842485427856445, "global_step": 42977, "epoch": 1023} {"train_loss": -5.531839370727539, "global_step": 42978, "epoch": 1023} {"train_loss": -5.645769119262695, "global_step": 42979, "epoch": 1023} {"train_loss": -5.539377689361572, "global_step": 42980, "epoch": 1023} {"train_loss": -5.606375694274902, "global_step": 42981, "epoch": 1023} {"train_loss": -5.601009368896484, "global_step": 42982, "epoch": 1023} {"train_loss": -5.696393013000488, "global_step": 42983, "epoch": 1023} {"train_loss": -5.571977615356445, "global_step": 42984, "epoch": 1023} {"train_loss": -5.752058029174805, "global_step": 42985, "epoch": 1023} {"train_loss": -5.680601596832275, "global_step": 42986, "epoch": 1023} {"train_loss": -5.635197162628174, "global_step": 42987, "epoch": 1023} {"train_loss": -5.607193946838379, "global_step": 42988, "epoch": 1023} {"train_loss": -5.605226993560791, "global_step": 42989, "epoch": 1023} {"train_loss": -5.815858840942383, "global_step": 42990, "epoch": 1023} {"train_loss": -5.812376022338867, "global_step": 42991, "epoch": 1023} {"train_loss": -5.697300434112549, "global_step": 42992, "epoch": 1023} {"train_loss": -5.771603107452393, "global_step": 42993, "epoch": 1023} {"train_loss": -5.731873512268066, "global_step": 42994, "epoch": 1023} {"train_loss": -5.782890319824219, "global_step": 42995, "epoch": 1023} {"train_loss": -5.717191696166992, "global_step": 42996, "epoch": 1023} {"train_loss": -5.719148635864258, "global_step": 42997, "epoch": 1023} {"train_loss": -5.821277618408203, "global_step": 42998, "epoch": 1023} {"train_loss": -5.794159889221191, "global_step": 42999, "epoch": 1023} {"train_loss": -5.664702415466309, "global_step": 43000, "epoch": 1023} {"train_loss": -5.614255428314209, "global_step": 43001, "epoch": 1023} {"train_loss": -5.67558479309082, "global_step": 43002, "epoch": 1023} {"train_loss": -5.68744421005249, "global_step": 43003, "epoch": 1023} {"train_loss": -5.695735454559326, "global_step": 43004, "epoch": 1023} {"train_loss": -5.717903137207031, "global_step": 43005, "epoch": 1023} {"train_loss": -5.773638725280762, "global_step": 43006, "epoch": 1023} {"train_loss": -5.672725575310843, "global_step": 43007, "epoch": 1023, "val_loss": 73953.53125} {"train_loss": -5.735787391662598, "global_step": 43008, "epoch": 1024} {"train_loss": -5.749080657958984, "global_step": 43009, "epoch": 1024} {"train_loss": -5.824999809265137, "global_step": 43010, "epoch": 1024} {"train_loss": -5.669633865356445, "global_step": 43011, "epoch": 1024} {"train_loss": -5.559990882873535, "global_step": 43012, "epoch": 1024} {"train_loss": -5.590874195098877, "global_step": 43013, "epoch": 1024} {"train_loss": -5.544017791748047, "global_step": 43014, "epoch": 1024} {"train_loss": -5.854514122009277, "global_step": 43015, "epoch": 1024} {"train_loss": -5.602075576782227, "global_step": 43016, "epoch": 1024} {"train_loss": -5.711202144622803, "global_step": 43017, "epoch": 1024} {"train_loss": -5.65768575668335, "global_step": 43018, "epoch": 1024} {"train_loss": -5.694103717803955, "global_step": 43019, "epoch": 1024} {"train_loss": -5.566995620727539, "global_step": 43020, "epoch": 1024} {"train_loss": -5.658019542694092, "global_step": 43021, "epoch": 1024} {"train_loss": -5.828178405761719, "global_step": 43022, "epoch": 1024} {"train_loss": -5.662557601928711, "global_step": 43023, "epoch": 1024} {"train_loss": -5.756096363067627, "global_step": 43024, "epoch": 1024} {"train_loss": -5.6355438232421875, "global_step": 43025, "epoch": 1024} {"train_loss": -5.618531227111816, "global_step": 43026, "epoch": 1024} {"train_loss": -5.706927299499512, "global_step": 43027, "epoch": 1024} {"train_loss": -5.623340129852295, "global_step": 43028, "epoch": 1024} {"train_loss": -5.634244918823242, "global_step": 43029, "epoch": 1024} {"train_loss": -5.660819053649902, "global_step": 43030, "epoch": 1024} {"train_loss": -5.570292949676514, "global_step": 43031, "epoch": 1024} {"train_loss": -5.695835113525391, "global_step": 43032, "epoch": 1024} {"train_loss": -5.636381149291992, "global_step": 43033, "epoch": 1024} {"train_loss": -5.5514421463012695, "global_step": 43034, "epoch": 1024} {"train_loss": -5.74564790725708, "global_step": 43035, "epoch": 1024} {"train_loss": -5.595856666564941, "global_step": 43036, "epoch": 1024} {"train_loss": -5.626373291015625, "global_step": 43037, "epoch": 1024} {"train_loss": -5.784201622009277, "global_step": 43038, "epoch": 1024} {"train_loss": -5.637633323669434, "global_step": 43039, "epoch": 1024} {"train_loss": -5.772182464599609, "global_step": 43040, "epoch": 1024} {"train_loss": -5.618769645690918, "global_step": 43041, "epoch": 1024} {"train_loss": -5.5485639572143555, "global_step": 43042, "epoch": 1024} {"train_loss": -5.784642696380615, "global_step": 43043, "epoch": 1024} {"train_loss": -5.57773494720459, "global_step": 43044, "epoch": 1024} {"train_loss": -5.811306953430176, "global_step": 43045, "epoch": 1024} {"train_loss": -5.552164554595947, "global_step": 43046, "epoch": 1024} {"train_loss": -5.611781120300293, "global_step": 43047, "epoch": 1024} {"train_loss": -5.748257637023926, "global_step": 43048, "epoch": 1024} {"train_loss": -5.667485861551194, "global_step": 43049, "epoch": 1024, "val_loss": 74011.65625} {"train_loss": -5.718857288360596, "global_step": 43050, "epoch": 1025} {"train_loss": -5.715546607971191, "global_step": 43051, "epoch": 1025} {"train_loss": -5.762172698974609, "global_step": 43052, "epoch": 1025} {"train_loss": -5.676666259765625, "global_step": 43053, "epoch": 1025} {"train_loss": -5.719026565551758, "global_step": 43054, "epoch": 1025} {"train_loss": -5.699556350708008, "global_step": 43055, "epoch": 1025} {"train_loss": -5.615151405334473, "global_step": 43056, "epoch": 1025} {"train_loss": -5.575064659118652, "global_step": 43057, "epoch": 1025} {"train_loss": -5.538246154785156, "global_step": 43058, "epoch": 1025} {"train_loss": -5.6538543701171875, "global_step": 43059, "epoch": 1025} {"train_loss": -5.770614147186279, "global_step": 43060, "epoch": 1025} {"train_loss": -5.6013031005859375, "global_step": 43061, "epoch": 1025} {"train_loss": -5.7951812744140625, "global_step": 43062, "epoch": 1025} {"train_loss": -5.617979526519775, "global_step": 43063, "epoch": 1025} {"train_loss": -5.476533889770508, "global_step": 43064, "epoch": 1025} {"train_loss": -5.729029655456543, "global_step": 43065, "epoch": 1025} {"train_loss": -5.472151279449463, "global_step": 43066, "epoch": 1025} {"train_loss": -5.763773441314697, "global_step": 43067, "epoch": 1025} {"train_loss": -5.665188312530518, "global_step": 43068, "epoch": 1025} {"train_loss": -5.5880937576293945, "global_step": 43069, "epoch": 1025} {"train_loss": -5.65543270111084, "global_step": 43070, "epoch": 1025} {"train_loss": -5.568453311920166, "global_step": 43071, "epoch": 1025} {"train_loss": -5.52487325668335, "global_step": 43072, "epoch": 1025} {"train_loss": -5.508502006530762, "global_step": 43073, "epoch": 1025} {"train_loss": -5.522129058837891, "global_step": 43074, "epoch": 1025} {"train_loss": -5.62786340713501, "global_step": 43075, "epoch": 1025} {"train_loss": -5.669608116149902, "global_step": 43076, "epoch": 1025} {"train_loss": -5.591490268707275, "global_step": 43077, "epoch": 1025} {"train_loss": -5.64168643951416, "global_step": 43078, "epoch": 1025} {"train_loss": -5.599959373474121, "global_step": 43079, "epoch": 1025} {"train_loss": -5.571941375732422, "global_step": 43080, "epoch": 1025} {"train_loss": -5.6352620124816895, "global_step": 43081, "epoch": 1025} {"train_loss": -5.700455188751221, "global_step": 43082, "epoch": 1025} {"train_loss": -5.647556781768799, "global_step": 43083, "epoch": 1025} {"train_loss": -5.723829746246338, "global_step": 43084, "epoch": 1025} {"train_loss": -5.676451683044434, "global_step": 43085, "epoch": 1025} {"train_loss": -5.553061485290527, "global_step": 43086, "epoch": 1025} {"train_loss": -5.707433700561523, "global_step": 43087, "epoch": 1025} {"train_loss": -5.778407573699951, "global_step": 43088, "epoch": 1025} {"train_loss": -5.708442211151123, "global_step": 43089, "epoch": 1025} {"train_loss": -5.664307594299316, "global_step": 43090, "epoch": 1025} {"train_loss": -5.646888937268939, "global_step": 43091, "epoch": 1025, "val_loss": 73883.84375} {"train_loss": -5.717191219329834, "global_step": 43092, "epoch": 1026} {"train_loss": -5.765851020812988, "global_step": 43093, "epoch": 1026} {"train_loss": -5.587505340576172, "global_step": 43094, "epoch": 1026} {"train_loss": -5.5526628494262695, "global_step": 43095, "epoch": 1026} {"train_loss": -5.757472038269043, "global_step": 43096, "epoch": 1026} {"train_loss": -5.6236572265625, "global_step": 43097, "epoch": 1026} {"train_loss": -5.753971099853516, "global_step": 43098, "epoch": 1026} {"train_loss": -5.688867568969727, "global_step": 43099, "epoch": 1026} {"train_loss": -5.645811557769775, "global_step": 43100, "epoch": 1026} {"train_loss": -5.7567009925842285, "global_step": 43101, "epoch": 1026} {"train_loss": -5.603981018066406, "global_step": 43102, "epoch": 1026} {"train_loss": -5.796194553375244, "global_step": 43103, "epoch": 1026} {"train_loss": -5.727288246154785, "global_step": 43104, "epoch": 1026} {"train_loss": -5.666604995727539, "global_step": 43105, "epoch": 1026} {"train_loss": -5.709591865539551, "global_step": 43106, "epoch": 1026} {"train_loss": -5.608397483825684, "global_step": 43107, "epoch": 1026} {"train_loss": -5.662395477294922, "global_step": 43108, "epoch": 1026} {"train_loss": -5.63619327545166, "global_step": 43109, "epoch": 1026} {"train_loss": -5.694859981536865, "global_step": 43110, "epoch": 1026} {"train_loss": -5.684835433959961, "global_step": 43111, "epoch": 1026} {"train_loss": -5.7103447914123535, "global_step": 43112, "epoch": 1026} {"train_loss": -5.721870422363281, "global_step": 43113, "epoch": 1026} {"train_loss": -5.599794387817383, "global_step": 43114, "epoch": 1026} {"train_loss": -5.606828689575195, "global_step": 43115, "epoch": 1026} {"train_loss": -5.681988716125488, "global_step": 43116, "epoch": 1026} {"train_loss": -5.673102855682373, "global_step": 43117, "epoch": 1026} {"train_loss": -5.635103702545166, "global_step": 43118, "epoch": 1026} {"train_loss": -5.716738224029541, "global_step": 43119, "epoch": 1026} {"train_loss": -5.816972732543945, "global_step": 43120, "epoch": 1026} {"train_loss": -5.646397590637207, "global_step": 43121, "epoch": 1026} {"train_loss": -5.714893341064453, "global_step": 43122, "epoch": 1026} {"train_loss": -5.684427261352539, "global_step": 43123, "epoch": 1026} {"train_loss": -5.51626443862915, "global_step": 43124, "epoch": 1026} {"train_loss": -5.755819320678711, "global_step": 43125, "epoch": 1026} {"train_loss": -5.733787536621094, "global_step": 43126, "epoch": 1026} {"train_loss": -5.691778182983398, "global_step": 43127, "epoch": 1026} {"train_loss": -5.593341827392578, "global_step": 43128, "epoch": 1026} {"train_loss": -5.5088958740234375, "global_step": 43129, "epoch": 1026} {"train_loss": -5.64325475692749, "global_step": 43130, "epoch": 1026} {"train_loss": -5.669086933135986, "global_step": 43131, "epoch": 1026} {"train_loss": -5.734411716461182, "global_step": 43132, "epoch": 1026} {"train_loss": -5.675592694963727, "global_step": 43133, "epoch": 1026, "val_loss": 73550.96875} {"train_loss": -5.681144714355469, "global_step": 43134, "epoch": 1027} {"train_loss": -5.689960479736328, "global_step": 43135, "epoch": 1027} {"train_loss": -5.677447319030762, "global_step": 43136, "epoch": 1027} {"train_loss": -5.568478584289551, "global_step": 43137, "epoch": 1027} {"train_loss": -5.66929817199707, "global_step": 43138, "epoch": 1027} {"train_loss": -5.6290483474731445, "global_step": 43139, "epoch": 1027} {"train_loss": -5.736220836639404, "global_step": 43140, "epoch": 1027} {"train_loss": -5.582088470458984, "global_step": 43141, "epoch": 1027} {"train_loss": -5.594836235046387, "global_step": 43142, "epoch": 1027} {"train_loss": -5.720996379852295, "global_step": 43143, "epoch": 1027} {"train_loss": -5.677801132202148, "global_step": 43144, "epoch": 1027} {"train_loss": -5.535833358764648, "global_step": 43145, "epoch": 1027} {"train_loss": -5.717344284057617, "global_step": 43146, "epoch": 1027} {"train_loss": -5.505512237548828, "global_step": 43147, "epoch": 1027} {"train_loss": -5.6144914627075195, "global_step": 43148, "epoch": 1027} {"train_loss": -5.69261360168457, "global_step": 43149, "epoch": 1027} {"train_loss": -5.495469570159912, "global_step": 43150, "epoch": 1027} {"train_loss": -5.746689796447754, "global_step": 43151, "epoch": 1027} {"train_loss": -5.750086307525635, "global_step": 43152, "epoch": 1027} {"train_loss": -5.68179988861084, "global_step": 43153, "epoch": 1027} {"train_loss": -5.7129034996032715, "global_step": 43154, "epoch": 1027} {"train_loss": -5.565744876861572, "global_step": 43155, "epoch": 1027} {"train_loss": -5.8213090896606445, "global_step": 43156, "epoch": 1027} {"train_loss": -5.7191009521484375, "global_step": 43157, "epoch": 1027} {"train_loss": -5.633371353149414, "global_step": 43158, "epoch": 1027} {"train_loss": -5.697379112243652, "global_step": 43159, "epoch": 1027} {"train_loss": -5.616959095001221, "global_step": 43160, "epoch": 1027} {"train_loss": -5.642108917236328, "global_step": 43161, "epoch": 1027} {"train_loss": -5.738336086273193, "global_step": 43162, "epoch": 1027} {"train_loss": -5.763607978820801, "global_step": 43163, "epoch": 1027} {"train_loss": -5.703372001647949, "global_step": 43164, "epoch": 1027} {"train_loss": -5.722733497619629, "global_step": 43165, "epoch": 1027} {"train_loss": -5.521533012390137, "global_step": 43166, "epoch": 1027} {"train_loss": -5.549253940582275, "global_step": 43167, "epoch": 1027} {"train_loss": -5.693739891052246, "global_step": 43168, "epoch": 1027} {"train_loss": -5.559665203094482, "global_step": 43169, "epoch": 1027} {"train_loss": -5.680217742919922, "global_step": 43170, "epoch": 1027} {"train_loss": -5.679753303527832, "global_step": 43171, "epoch": 1027} {"train_loss": -5.76548957824707, "global_step": 43172, "epoch": 1027} {"train_loss": -5.543699741363525, "global_step": 43173, "epoch": 1027} {"train_loss": -5.731625556945801, "global_step": 43174, "epoch": 1027} {"train_loss": -5.657486416044689, "global_step": 43175, "epoch": 1027, "val_loss": 74338.4375} {"train_loss": -5.555630683898926, "global_step": 43176, "epoch": 1028} {"train_loss": -5.721139430999756, "global_step": 43177, "epoch": 1028} {"train_loss": -5.766841411590576, "global_step": 43178, "epoch": 1028} {"train_loss": -5.641742706298828, "global_step": 43179, "epoch": 1028} {"train_loss": -5.7511491775512695, "global_step": 43180, "epoch": 1028} {"train_loss": -5.683638572692871, "global_step": 43181, "epoch": 1028} {"train_loss": -5.603309154510498, "global_step": 43182, "epoch": 1028} {"train_loss": -5.7216267585754395, "global_step": 43183, "epoch": 1028} {"train_loss": -5.467297554016113, "global_step": 43184, "epoch": 1028} {"train_loss": -5.738579750061035, "global_step": 43185, "epoch": 1028} {"train_loss": -5.571555137634277, "global_step": 43186, "epoch": 1028} {"train_loss": -5.708156585693359, "global_step": 43187, "epoch": 1028} {"train_loss": -5.601901054382324, "global_step": 43188, "epoch": 1028} {"train_loss": -5.667441368103027, "global_step": 43189, "epoch": 1028} {"train_loss": -5.647421360015869, "global_step": 43190, "epoch": 1028} {"train_loss": -5.667869567871094, "global_step": 43191, "epoch": 1028} {"train_loss": -5.686063766479492, "global_step": 43192, "epoch": 1028} {"train_loss": -5.427823066711426, "global_step": 43193, "epoch": 1028} {"train_loss": -5.634765148162842, "global_step": 43194, "epoch": 1028} {"train_loss": -5.555395126342773, "global_step": 43195, "epoch": 1028} {"train_loss": -5.6580424308776855, "global_step": 43196, "epoch": 1028} {"train_loss": -5.6312713623046875, "global_step": 43197, "epoch": 1028} {"train_loss": -5.463024139404297, "global_step": 43198, "epoch": 1028} {"train_loss": -5.660343170166016, "global_step": 43199, "epoch": 1028} {"train_loss": -5.52773904800415, "global_step": 43200, "epoch": 1028} {"train_loss": -5.5597028732299805, "global_step": 43201, "epoch": 1028} {"train_loss": -5.624817848205566, "global_step": 43202, "epoch": 1028} {"train_loss": -5.531712055206299, "global_step": 43203, "epoch": 1028} {"train_loss": -5.722379684448242, "global_step": 43204, "epoch": 1028} {"train_loss": -5.490322113037109, "global_step": 43205, "epoch": 1028} {"train_loss": -5.562771797180176, "global_step": 43206, "epoch": 1028} {"train_loss": -5.541534900665283, "global_step": 43207, "epoch": 1028} {"train_loss": -5.636899948120117, "global_step": 43208, "epoch": 1028} {"train_loss": -5.654575347900391, "global_step": 43209, "epoch": 1028} {"train_loss": -5.631096839904785, "global_step": 43210, "epoch": 1028} {"train_loss": -5.565471649169922, "global_step": 43211, "epoch": 1028} {"train_loss": -5.641387462615967, "global_step": 43212, "epoch": 1028} {"train_loss": -5.646336555480957, "global_step": 43213, "epoch": 1028} {"train_loss": -5.509578704833984, "global_step": 43214, "epoch": 1028} {"train_loss": -5.5966925621032715, "global_step": 43215, "epoch": 1028} {"train_loss": -5.705504417419434, "global_step": 43216, "epoch": 1028} {"train_loss": -5.619323741822016, "global_step": 43217, "epoch": 1028, "val_loss": 74332.2578125} {"train_loss": -5.5830583572387695, "global_step": 43218, "epoch": 1029} {"train_loss": -5.572443008422852, "global_step": 43219, "epoch": 1029} {"train_loss": -5.586484909057617, "global_step": 43220, "epoch": 1029} {"train_loss": -5.548436164855957, "global_step": 43221, "epoch": 1029} {"train_loss": -5.73947811126709, "global_step": 43222, "epoch": 1029} {"train_loss": -5.610200881958008, "global_step": 43223, "epoch": 1029} {"train_loss": -5.698995113372803, "global_step": 43224, "epoch": 1029} {"train_loss": -5.697323799133301, "global_step": 43225, "epoch": 1029} {"train_loss": -5.627015113830566, "global_step": 43226, "epoch": 1029} {"train_loss": -5.6531572341918945, "global_step": 43227, "epoch": 1029} {"train_loss": -5.540844917297363, "global_step": 43228, "epoch": 1029} {"train_loss": -5.723371505737305, "global_step": 43229, "epoch": 1029} {"train_loss": -5.523906707763672, "global_step": 43230, "epoch": 1029} {"train_loss": -5.641384124755859, "global_step": 43231, "epoch": 1029} {"train_loss": -5.721678733825684, "global_step": 43232, "epoch": 1029} {"train_loss": -5.561395168304443, "global_step": 43233, "epoch": 1029} {"train_loss": -5.640383720397949, "global_step": 43234, "epoch": 1029} {"train_loss": -5.744604110717773, "global_step": 43235, "epoch": 1029} {"train_loss": -5.653958320617676, "global_step": 43236, "epoch": 1029} {"train_loss": -5.792573928833008, "global_step": 43237, "epoch": 1029} {"train_loss": -5.643400192260742, "global_step": 43238, "epoch": 1029} {"train_loss": -5.572826862335205, "global_step": 43239, "epoch": 1029} {"train_loss": -5.579272270202637, "global_step": 43240, "epoch": 1029} {"train_loss": -5.60349178314209, "global_step": 43241, "epoch": 1029} {"train_loss": -5.479952335357666, "global_step": 43242, "epoch": 1029} {"train_loss": -5.583608627319336, "global_step": 43243, "epoch": 1029} {"train_loss": -5.589450836181641, "global_step": 43244, "epoch": 1029} {"train_loss": -5.570991516113281, "global_step": 43245, "epoch": 1029} {"train_loss": -5.723751544952393, "global_step": 43246, "epoch": 1029} {"train_loss": -5.676278114318848, "global_step": 43247, "epoch": 1029} {"train_loss": -5.66215705871582, "global_step": 43248, "epoch": 1029} {"train_loss": -5.793683052062988, "global_step": 43249, "epoch": 1029} {"train_loss": -5.768463611602783, "global_step": 43250, "epoch": 1029} {"train_loss": -5.705372333526611, "global_step": 43251, "epoch": 1029} {"train_loss": -5.691293239593506, "global_step": 43252, "epoch": 1029} {"train_loss": -5.611876487731934, "global_step": 43253, "epoch": 1029} {"train_loss": -5.749440670013428, "global_step": 43254, "epoch": 1029} {"train_loss": -5.675303936004639, "global_step": 43255, "epoch": 1029} {"train_loss": -5.6578779220581055, "global_step": 43256, "epoch": 1029} {"train_loss": -5.6769232749938965, "global_step": 43257, "epoch": 1029} {"train_loss": -5.7232985496521, "global_step": 43258, "epoch": 1029} {"train_loss": -5.649631545657203, "global_step": 43259, "epoch": 1029, "val_loss": 73988.078125} {"train_loss": -5.645218849182129, "global_step": 43260, "epoch": 1030} {"train_loss": -5.716653823852539, "global_step": 43261, "epoch": 1030} {"train_loss": -5.689119815826416, "global_step": 43262, "epoch": 1030} {"train_loss": -5.670522689819336, "global_step": 43263, "epoch": 1030} {"train_loss": -5.57891321182251, "global_step": 43264, "epoch": 1030} {"train_loss": -5.617195129394531, "global_step": 43265, "epoch": 1030} {"train_loss": -5.67793083190918, "global_step": 43266, "epoch": 1030} {"train_loss": -5.674095153808594, "global_step": 43267, "epoch": 1030} {"train_loss": -5.793361663818359, "global_step": 43268, "epoch": 1030} {"train_loss": -5.608271598815918, "global_step": 43269, "epoch": 1030} {"train_loss": -5.665637969970703, "global_step": 43270, "epoch": 1030} {"train_loss": -5.650547981262207, "global_step": 43271, "epoch": 1030} {"train_loss": -5.73234748840332, "global_step": 43272, "epoch": 1030} {"train_loss": -5.684806823730469, "global_step": 43273, "epoch": 1030} {"train_loss": -5.720431327819824, "global_step": 43274, "epoch": 1030} {"train_loss": -5.667635917663574, "global_step": 43275, "epoch": 1030} {"train_loss": -5.725294589996338, "global_step": 43276, "epoch": 1030} {"train_loss": -5.751760482788086, "global_step": 43277, "epoch": 1030} {"train_loss": -5.645393371582031, "global_step": 43278, "epoch": 1030} {"train_loss": -5.588570594787598, "global_step": 43279, "epoch": 1030} {"train_loss": -5.741453647613525, "global_step": 43280, "epoch": 1030} {"train_loss": -5.565412998199463, "global_step": 43281, "epoch": 1030} {"train_loss": -5.613700866699219, "global_step": 43282, "epoch": 1030} {"train_loss": -5.785270690917969, "global_step": 43283, "epoch": 1030} {"train_loss": -5.672455787658691, "global_step": 43284, "epoch": 1030} {"train_loss": -5.763274669647217, "global_step": 43285, "epoch": 1030} {"train_loss": -5.744108200073242, "global_step": 43286, "epoch": 1030} {"train_loss": -5.702701568603516, "global_step": 43287, "epoch": 1030} {"train_loss": -5.683058738708496, "global_step": 43288, "epoch": 1030} {"train_loss": -5.831293106079102, "global_step": 43289, "epoch": 1030} {"train_loss": -5.695122241973877, "global_step": 43290, "epoch": 1030} {"train_loss": -5.781381130218506, "global_step": 43291, "epoch": 1030} {"train_loss": -5.612486362457275, "global_step": 43292, "epoch": 1030} {"train_loss": -5.731040000915527, "global_step": 43293, "epoch": 1030} {"train_loss": -5.75919246673584, "global_step": 43294, "epoch": 1030} {"train_loss": -5.7366042137146, "global_step": 43295, "epoch": 1030} {"train_loss": -5.672296524047852, "global_step": 43296, "epoch": 1030} {"train_loss": -5.688234806060791, "global_step": 43297, "epoch": 1030} {"train_loss": -5.63576602935791, "global_step": 43298, "epoch": 1030} {"train_loss": -5.762980937957764, "global_step": 43299, "epoch": 1030} {"train_loss": -5.6276960372924805, "global_step": 43300, "epoch": 1030} {"train_loss": -5.688951322010586, "global_step": 43301, "epoch": 1030, "val_loss": 73877.6875} {"train_loss": -5.64650821685791, "global_step": 43302, "epoch": 1031} {"train_loss": -5.655956745147705, "global_step": 43303, "epoch": 1031} {"train_loss": -5.731474876403809, "global_step": 43304, "epoch": 1031} {"train_loss": -5.642765045166016, "global_step": 43305, "epoch": 1031} {"train_loss": -5.69826602935791, "global_step": 43306, "epoch": 1031} {"train_loss": -5.6321258544921875, "global_step": 43307, "epoch": 1031} {"train_loss": -5.713265895843506, "global_step": 43308, "epoch": 1031} {"train_loss": -5.547033786773682, "global_step": 43309, "epoch": 1031} {"train_loss": -5.542325019836426, "global_step": 43310, "epoch": 1031} {"train_loss": -5.7676239013671875, "global_step": 43311, "epoch": 1031} {"train_loss": -5.638449192047119, "global_step": 43312, "epoch": 1031} {"train_loss": -5.72202205657959, "global_step": 43313, "epoch": 1031} {"train_loss": -5.716655731201172, "global_step": 43314, "epoch": 1031} {"train_loss": -5.6941680908203125, "global_step": 43315, "epoch": 1031} {"train_loss": -5.683973789215088, "global_step": 43316, "epoch": 1031} {"train_loss": -5.708202362060547, "global_step": 43317, "epoch": 1031} {"train_loss": -5.741045951843262, "global_step": 43318, "epoch": 1031} {"train_loss": -5.663542747497559, "global_step": 43319, "epoch": 1031} {"train_loss": -5.651764392852783, "global_step": 43320, "epoch": 1031} {"train_loss": -5.634521007537842, "global_step": 43321, "epoch": 1031} {"train_loss": -5.690303802490234, "global_step": 43322, "epoch": 1031} {"train_loss": -5.628155708312988, "global_step": 43323, "epoch": 1031} {"train_loss": -5.712589263916016, "global_step": 43324, "epoch": 1031} {"train_loss": -5.761170864105225, "global_step": 43325, "epoch": 1031} {"train_loss": -5.722782135009766, "global_step": 43326, "epoch": 1031} {"train_loss": -5.778820037841797, "global_step": 43327, "epoch": 1031} {"train_loss": -5.784590244293213, "global_step": 43328, "epoch": 1031} {"train_loss": -5.503684043884277, "global_step": 43329, "epoch": 1031} {"train_loss": -5.710554599761963, "global_step": 43330, "epoch": 1031} {"train_loss": -5.585550308227539, "global_step": 43331, "epoch": 1031} {"train_loss": -5.735897064208984, "global_step": 43332, "epoch": 1031} {"train_loss": -5.748331069946289, "global_step": 43333, "epoch": 1031} {"train_loss": -5.735472679138184, "global_step": 43334, "epoch": 1031} {"train_loss": -5.72245454788208, "global_step": 43335, "epoch": 1031} {"train_loss": -5.701772689819336, "global_step": 43336, "epoch": 1031} {"train_loss": -5.572525978088379, "global_step": 43337, "epoch": 1031} {"train_loss": -5.759966850280762, "global_step": 43338, "epoch": 1031} {"train_loss": -5.634537220001221, "global_step": 43339, "epoch": 1031} {"train_loss": -5.6804962158203125, "global_step": 43340, "epoch": 1031} {"train_loss": -5.587793827056885, "global_step": 43341, "epoch": 1031} {"train_loss": -5.678537845611572, "global_step": 43342, "epoch": 1031} {"train_loss": -5.680959043048677, "global_step": 43343, "epoch": 1031, "val_loss": 74299.546875} {"train_loss": -5.62900447845459, "global_step": 43344, "epoch": 1032} {"train_loss": -5.698784351348877, "global_step": 43345, "epoch": 1032} {"train_loss": -5.596470832824707, "global_step": 43346, "epoch": 1032} {"train_loss": -5.598324298858643, "global_step": 43347, "epoch": 1032} {"train_loss": -5.667220592498779, "global_step": 43348, "epoch": 1032} {"train_loss": -5.667736530303955, "global_step": 43349, "epoch": 1032} {"train_loss": -5.574475288391113, "global_step": 43350, "epoch": 1032} {"train_loss": -5.618768692016602, "global_step": 43351, "epoch": 1032} {"train_loss": -5.549399375915527, "global_step": 43352, "epoch": 1032} {"train_loss": -5.6420135498046875, "global_step": 43353, "epoch": 1032} {"train_loss": -5.760910987854004, "global_step": 43354, "epoch": 1032} {"train_loss": -5.575872421264648, "global_step": 43355, "epoch": 1032} {"train_loss": -5.687674522399902, "global_step": 43356, "epoch": 1032} {"train_loss": -5.683791160583496, "global_step": 43357, "epoch": 1032} {"train_loss": -5.537833213806152, "global_step": 43358, "epoch": 1032} {"train_loss": -5.690332412719727, "global_step": 43359, "epoch": 1032} {"train_loss": -5.735291481018066, "global_step": 43360, "epoch": 1032} {"train_loss": -5.615042686462402, "global_step": 43361, "epoch": 1032} {"train_loss": -5.540219783782959, "global_step": 43362, "epoch": 1032} {"train_loss": -5.697072982788086, "global_step": 43363, "epoch": 1032} {"train_loss": -5.6025166511535645, "global_step": 43364, "epoch": 1032} {"train_loss": -5.616480350494385, "global_step": 43365, "epoch": 1032} {"train_loss": -5.724671363830566, "global_step": 43366, "epoch": 1032} {"train_loss": -5.616918563842773, "global_step": 43367, "epoch": 1032} {"train_loss": -5.728488445281982, "global_step": 43368, "epoch": 1032} {"train_loss": -5.604437351226807, "global_step": 43369, "epoch": 1032} {"train_loss": -5.607995986938477, "global_step": 43370, "epoch": 1032} {"train_loss": -5.723702430725098, "global_step": 43371, "epoch": 1032} {"train_loss": -5.616486549377441, "global_step": 43372, "epoch": 1032} {"train_loss": -5.610722541809082, "global_step": 43373, "epoch": 1032} {"train_loss": -5.7008748054504395, "global_step": 43374, "epoch": 1032} {"train_loss": -5.566375732421875, "global_step": 43375, "epoch": 1032} {"train_loss": -5.647184371948242, "global_step": 43376, "epoch": 1032} {"train_loss": -5.704085350036621, "global_step": 43377, "epoch": 1032} {"train_loss": -5.690153121948242, "global_step": 43378, "epoch": 1032} {"train_loss": -5.617362976074219, "global_step": 43379, "epoch": 1032} {"train_loss": -5.6915602684021, "global_step": 43380, "epoch": 1032} {"train_loss": -5.69064998626709, "global_step": 43381, "epoch": 1032} {"train_loss": -5.683375358581543, "global_step": 43382, "epoch": 1032} {"train_loss": -5.77131986618042, "global_step": 43383, "epoch": 1032} {"train_loss": -5.7060041427612305, "global_step": 43384, "epoch": 1032} {"train_loss": -5.650807017371768, "global_step": 43385, "epoch": 1032, "val_loss": 73681.7109375} {"train_loss": -5.866823196411133, "global_step": 43386, "epoch": 1033} {"train_loss": -5.910493850708008, "global_step": 43387, "epoch": 1033} {"train_loss": -5.7584710121154785, "global_step": 43388, "epoch": 1033} {"train_loss": -5.6504011154174805, "global_step": 43389, "epoch": 1033} {"train_loss": -5.759546279907227, "global_step": 43390, "epoch": 1033} {"train_loss": -5.758966445922852, "global_step": 43391, "epoch": 1033} {"train_loss": -5.722835540771484, "global_step": 43392, "epoch": 1033} {"train_loss": -5.717866897583008, "global_step": 43393, "epoch": 1033} {"train_loss": -5.622034072875977, "global_step": 43394, "epoch": 1033} {"train_loss": -5.7294416427612305, "global_step": 43395, "epoch": 1033} {"train_loss": -5.688790798187256, "global_step": 43396, "epoch": 1033} {"train_loss": -5.766793251037598, "global_step": 43397, "epoch": 1033} {"train_loss": -5.669683456420898, "global_step": 43398, "epoch": 1033} {"train_loss": -5.531922817230225, "global_step": 43399, "epoch": 1033} {"train_loss": -5.6370649337768555, "global_step": 43400, "epoch": 1033} {"train_loss": -5.645236968994141, "global_step": 43401, "epoch": 1033} {"train_loss": -5.686995983123779, "global_step": 43402, "epoch": 1033} {"train_loss": -5.686878204345703, "global_step": 43403, "epoch": 1033} {"train_loss": -5.591161727905273, "global_step": 43404, "epoch": 1033} {"train_loss": -5.805531024932861, "global_step": 43405, "epoch": 1033} {"train_loss": -5.724300861358643, "global_step": 43406, "epoch": 1033} {"train_loss": -5.741559982299805, "global_step": 43407, "epoch": 1033} {"train_loss": -5.736217498779297, "global_step": 43408, "epoch": 1033} {"train_loss": -5.708922863006592, "global_step": 43409, "epoch": 1033} {"train_loss": -5.626545429229736, "global_step": 43410, "epoch": 1033} {"train_loss": -5.615878582000732, "global_step": 43411, "epoch": 1033} {"train_loss": -5.618881702423096, "global_step": 43412, "epoch": 1033} {"train_loss": -5.813330173492432, "global_step": 43413, "epoch": 1033} {"train_loss": -5.666149139404297, "global_step": 43414, "epoch": 1033} {"train_loss": -5.665867805480957, "global_step": 43415, "epoch": 1033} {"train_loss": -5.67677116394043, "global_step": 43416, "epoch": 1033} {"train_loss": -5.707666397094727, "global_step": 43417, "epoch": 1033} {"train_loss": -5.791984558105469, "global_step": 43418, "epoch": 1033} {"train_loss": -5.690786361694336, "global_step": 43419, "epoch": 1033} {"train_loss": -5.713596343994141, "global_step": 43420, "epoch": 1033} {"train_loss": -5.711240768432617, "global_step": 43421, "epoch": 1033} {"train_loss": -5.635207176208496, "global_step": 43422, "epoch": 1033} {"train_loss": -5.691028118133545, "global_step": 43423, "epoch": 1033} {"train_loss": -5.614076137542725, "global_step": 43424, "epoch": 1033} {"train_loss": -5.712182521820068, "global_step": 43425, "epoch": 1033} {"train_loss": -5.761678695678711, "global_step": 43426, "epoch": 1033} {"train_loss": -5.7044098150162466, "global_step": 43427, "epoch": 1033, "val_loss": 74008.9375} {"train_loss": -5.7430877685546875, "global_step": 43428, "epoch": 1034} {"train_loss": -5.6767168045043945, "global_step": 43429, "epoch": 1034} {"train_loss": -5.717260360717773, "global_step": 43430, "epoch": 1034} {"train_loss": -5.638463020324707, "global_step": 43431, "epoch": 1034} {"train_loss": -5.4594268798828125, "global_step": 43432, "epoch": 1034} {"train_loss": -5.696086406707764, "global_step": 43433, "epoch": 1034} {"train_loss": -5.5876898765563965, "global_step": 43434, "epoch": 1034} {"train_loss": -5.735976696014404, "global_step": 43435, "epoch": 1034} {"train_loss": -5.689006328582764, "global_step": 43436, "epoch": 1034} {"train_loss": -5.65457010269165, "global_step": 43437, "epoch": 1034} {"train_loss": -5.657238006591797, "global_step": 43438, "epoch": 1034} {"train_loss": -5.690600872039795, "global_step": 43439, "epoch": 1034} {"train_loss": -5.607901096343994, "global_step": 43440, "epoch": 1034} {"train_loss": -5.783320426940918, "global_step": 43441, "epoch": 1034} {"train_loss": -5.668959617614746, "global_step": 43442, "epoch": 1034} {"train_loss": -5.699292182922363, "global_step": 43443, "epoch": 1034} {"train_loss": -5.778371810913086, "global_step": 43444, "epoch": 1034} {"train_loss": -5.651407718658447, "global_step": 43445, "epoch": 1034} {"train_loss": -5.641869068145752, "global_step": 43446, "epoch": 1034} {"train_loss": -5.853452682495117, "global_step": 43447, "epoch": 1034} {"train_loss": -5.793585777282715, "global_step": 43448, "epoch": 1034} {"train_loss": -5.597686767578125, "global_step": 43449, "epoch": 1034} {"train_loss": -5.721468925476074, "global_step": 43450, "epoch": 1034} {"train_loss": -5.689296245574951, "global_step": 43451, "epoch": 1034} {"train_loss": -5.802506446838379, "global_step": 43452, "epoch": 1034} {"train_loss": -5.724647521972656, "global_step": 43453, "epoch": 1034} {"train_loss": -5.706598281860352, "global_step": 43454, "epoch": 1034} {"train_loss": -5.771842002868652, "global_step": 43455, "epoch": 1034} {"train_loss": -5.584497451782227, "global_step": 43456, "epoch": 1034} {"train_loss": -5.60100793838501, "global_step": 43457, "epoch": 1034} {"train_loss": -5.699386119842529, "global_step": 43458, "epoch": 1034} {"train_loss": -5.593181610107422, "global_step": 43459, "epoch": 1034} {"train_loss": -5.604327201843262, "global_step": 43460, "epoch": 1034} {"train_loss": -5.65757417678833, "global_step": 43461, "epoch": 1034} {"train_loss": -5.528079986572266, "global_step": 43462, "epoch": 1034} {"train_loss": -5.595391273498535, "global_step": 43463, "epoch": 1034} {"train_loss": -5.728138446807861, "global_step": 43464, "epoch": 1034} {"train_loss": -5.684792995452881, "global_step": 43465, "epoch": 1034} {"train_loss": -5.6648478507995605, "global_step": 43466, "epoch": 1034} {"train_loss": -5.586647987365723, "global_step": 43467, "epoch": 1034} {"train_loss": -5.707705497741699, "global_step": 43468, "epoch": 1034} {"train_loss": -5.6757425126575285, "global_step": 43469, "epoch": 1034, "val_loss": 74180.6484375} {"train_loss": -5.646548748016357, "global_step": 43470, "epoch": 1035} {"train_loss": -5.714734077453613, "global_step": 43471, "epoch": 1035} {"train_loss": -5.5973124504089355, "global_step": 43472, "epoch": 1035} {"train_loss": -5.702220916748047, "global_step": 43473, "epoch": 1035} {"train_loss": -5.6795549392700195, "global_step": 43474, "epoch": 1035} {"train_loss": -5.634777545928955, "global_step": 43475, "epoch": 1035} {"train_loss": -5.67800235748291, "global_step": 43476, "epoch": 1035} {"train_loss": -5.837198257446289, "global_step": 43477, "epoch": 1035} {"train_loss": -5.65277099609375, "global_step": 43478, "epoch": 1035} {"train_loss": -5.644223213195801, "global_step": 43479, "epoch": 1035} {"train_loss": -5.706336975097656, "global_step": 43480, "epoch": 1035} {"train_loss": -5.663351058959961, "global_step": 43481, "epoch": 1035} {"train_loss": -5.816865921020508, "global_step": 43482, "epoch": 1035} {"train_loss": -5.679150581359863, "global_step": 43483, "epoch": 1035} {"train_loss": -5.622641563415527, "global_step": 43484, "epoch": 1035} {"train_loss": -5.709446907043457, "global_step": 43485, "epoch": 1035} {"train_loss": -5.616307258605957, "global_step": 43486, "epoch": 1035} {"train_loss": -5.663496017456055, "global_step": 43487, "epoch": 1035} {"train_loss": -5.632510185241699, "global_step": 43488, "epoch": 1035} {"train_loss": -5.604525566101074, "global_step": 43489, "epoch": 1035} {"train_loss": -5.515905857086182, "global_step": 43490, "epoch": 1035} {"train_loss": -5.64804744720459, "global_step": 43491, "epoch": 1035} {"train_loss": -5.704404830932617, "global_step": 43492, "epoch": 1035} {"train_loss": -5.545605659484863, "global_step": 43493, "epoch": 1035} {"train_loss": -5.640529632568359, "global_step": 43494, "epoch": 1035} {"train_loss": -5.6075897216796875, "global_step": 43495, "epoch": 1035} {"train_loss": -5.621851921081543, "global_step": 43496, "epoch": 1035} {"train_loss": -5.821084499359131, "global_step": 43497, "epoch": 1035} {"train_loss": -5.636826992034912, "global_step": 43498, "epoch": 1035} {"train_loss": -5.732393741607666, "global_step": 43499, "epoch": 1035} {"train_loss": -5.716507911682129, "global_step": 43500, "epoch": 1035} {"train_loss": -5.506599426269531, "global_step": 43501, "epoch": 1035} {"train_loss": -5.6343607902526855, "global_step": 43502, "epoch": 1035} {"train_loss": -5.659566879272461, "global_step": 43503, "epoch": 1035} {"train_loss": -5.60669469833374, "global_step": 43504, "epoch": 1035} {"train_loss": -5.587336540222168, "global_step": 43505, "epoch": 1035} {"train_loss": -5.6507768630981445, "global_step": 43506, "epoch": 1035} {"train_loss": -5.712699890136719, "global_step": 43507, "epoch": 1035} {"train_loss": -5.612001419067383, "global_step": 43508, "epoch": 1035} {"train_loss": -5.685075759887695, "global_step": 43509, "epoch": 1035} {"train_loss": -5.581632614135742, "global_step": 43510, "epoch": 1035} {"train_loss": -5.65820634932745, "global_step": 43511, "epoch": 1035, "val_loss": 74403.859375} {"train_loss": -5.726474761962891, "global_step": 43512, "epoch": 1036} {"train_loss": -5.763140678405762, "global_step": 43513, "epoch": 1036} {"train_loss": -5.693275451660156, "global_step": 43514, "epoch": 1036} {"train_loss": -5.677640914916992, "global_step": 43515, "epoch": 1036} {"train_loss": -5.686366081237793, "global_step": 43516, "epoch": 1036} {"train_loss": -5.678056240081787, "global_step": 43517, "epoch": 1036} {"train_loss": -5.656157970428467, "global_step": 43518, "epoch": 1036} {"train_loss": -5.5998053550720215, "global_step": 43519, "epoch": 1036} {"train_loss": -5.655581474304199, "global_step": 43520, "epoch": 1036} {"train_loss": -5.680658340454102, "global_step": 43521, "epoch": 1036} {"train_loss": -5.703366279602051, "global_step": 43522, "epoch": 1036} {"train_loss": -5.674633026123047, "global_step": 43523, "epoch": 1036} {"train_loss": -5.706326007843018, "global_step": 43524, "epoch": 1036} {"train_loss": -5.767815589904785, "global_step": 43525, "epoch": 1036} {"train_loss": -5.590542793273926, "global_step": 43526, "epoch": 1036} {"train_loss": -5.7295918464660645, "global_step": 43527, "epoch": 1036} {"train_loss": -5.650609016418457, "global_step": 43528, "epoch": 1036} {"train_loss": -5.621596813201904, "global_step": 43529, "epoch": 1036} {"train_loss": -5.568240642547607, "global_step": 43530, "epoch": 1036} {"train_loss": -5.706863880157471, "global_step": 43531, "epoch": 1036} {"train_loss": -5.747047424316406, "global_step": 43532, "epoch": 1036} {"train_loss": -5.7034912109375, "global_step": 43533, "epoch": 1036} {"train_loss": -5.576067924499512, "global_step": 43534, "epoch": 1036} {"train_loss": -5.73565673828125, "global_step": 43535, "epoch": 1036} {"train_loss": -5.703068733215332, "global_step": 43536, "epoch": 1036} {"train_loss": -5.688292026519775, "global_step": 43537, "epoch": 1036} {"train_loss": -5.64473819732666, "global_step": 43538, "epoch": 1036} {"train_loss": -5.702852249145508, "global_step": 43539, "epoch": 1036} {"train_loss": -5.646197319030762, "global_step": 43540, "epoch": 1036} {"train_loss": -5.745697021484375, "global_step": 43541, "epoch": 1036} {"train_loss": -5.757920265197754, "global_step": 43542, "epoch": 1036} {"train_loss": -5.678606033325195, "global_step": 43543, "epoch": 1036} {"train_loss": -5.547503471374512, "global_step": 43544, "epoch": 1036} {"train_loss": -5.725898742675781, "global_step": 43545, "epoch": 1036} {"train_loss": -5.596768379211426, "global_step": 43546, "epoch": 1036} {"train_loss": -5.744387626647949, "global_step": 43547, "epoch": 1036} {"train_loss": -5.658459186553955, "global_step": 43548, "epoch": 1036} {"train_loss": -5.760891914367676, "global_step": 43549, "epoch": 1036} {"train_loss": -5.8024396896362305, "global_step": 43550, "epoch": 1036} {"train_loss": -5.728409290313721, "global_step": 43551, "epoch": 1036} {"train_loss": -5.718155860900879, "global_step": 43552, "epoch": 1036} {"train_loss": -5.684622571581886, "global_step": 43553, "epoch": 1036, "val_loss": 74077.765625} {"train_loss": -5.672357559204102, "global_step": 43554, "epoch": 1037} {"train_loss": -5.6461639404296875, "global_step": 43555, "epoch": 1037} {"train_loss": -5.6559953689575195, "global_step": 43556, "epoch": 1037} {"train_loss": -5.6550703048706055, "global_step": 43557, "epoch": 1037} {"train_loss": -5.749929904937744, "global_step": 43558, "epoch": 1037} {"train_loss": -5.723526954650879, "global_step": 43559, "epoch": 1037} {"train_loss": -5.655552864074707, "global_step": 43560, "epoch": 1037} {"train_loss": -5.709052085876465, "global_step": 43561, "epoch": 1037} {"train_loss": -5.641061782836914, "global_step": 43562, "epoch": 1037} {"train_loss": -5.6133527755737305, "global_step": 43563, "epoch": 1037} {"train_loss": -5.639089107513428, "global_step": 43564, "epoch": 1037} {"train_loss": -5.562156677246094, "global_step": 43565, "epoch": 1037} {"train_loss": -5.670905113220215, "global_step": 43566, "epoch": 1037} {"train_loss": -5.584866523742676, "global_step": 43567, "epoch": 1037} {"train_loss": -5.676858901977539, "global_step": 43568, "epoch": 1037} {"train_loss": -5.667838096618652, "global_step": 43569, "epoch": 1037} {"train_loss": -5.7262492179870605, "global_step": 43570, "epoch": 1037} {"train_loss": -5.738286972045898, "global_step": 43571, "epoch": 1037} {"train_loss": -5.614809989929199, "global_step": 43572, "epoch": 1037} {"train_loss": -5.633772850036621, "global_step": 43573, "epoch": 1037} {"train_loss": -5.734587669372559, "global_step": 43574, "epoch": 1037} {"train_loss": -5.794589042663574, "global_step": 43575, "epoch": 1037} {"train_loss": -5.766223430633545, "global_step": 43576, "epoch": 1037} {"train_loss": -5.717979907989502, "global_step": 43577, "epoch": 1037} {"train_loss": -5.696738243103027, "global_step": 43578, "epoch": 1037} {"train_loss": -5.650657653808594, "global_step": 43579, "epoch": 1037} {"train_loss": -5.786645889282227, "global_step": 43580, "epoch": 1037} {"train_loss": -5.723247528076172, "global_step": 43581, "epoch": 1037} {"train_loss": -5.729679107666016, "global_step": 43582, "epoch": 1037} {"train_loss": -5.787258148193359, "global_step": 43583, "epoch": 1037} {"train_loss": -5.581754684448242, "global_step": 43584, "epoch": 1037} {"train_loss": -5.6699395179748535, "global_step": 43585, "epoch": 1037} {"train_loss": -5.633877277374268, "global_step": 43586, "epoch": 1037} {"train_loss": -5.67494010925293, "global_step": 43587, "epoch": 1037} {"train_loss": -5.646249294281006, "global_step": 43588, "epoch": 1037} {"train_loss": -5.699102878570557, "global_step": 43589, "epoch": 1037} {"train_loss": -5.672563552856445, "global_step": 43590, "epoch": 1037} {"train_loss": -5.725500106811523, "global_step": 43591, "epoch": 1037} {"train_loss": -5.698922157287598, "global_step": 43592, "epoch": 1037} {"train_loss": -5.72003698348999, "global_step": 43593, "epoch": 1037} {"train_loss": -5.68106746673584, "global_step": 43594, "epoch": 1037} {"train_loss": -5.685330231984456, "global_step": 43595, "epoch": 1037, "val_loss": 74011.5078125} {"train_loss": -5.811244010925293, "global_step": 43596, "epoch": 1038} {"train_loss": -5.4472503662109375, "global_step": 43597, "epoch": 1038} {"train_loss": -5.605555057525635, "global_step": 43598, "epoch": 1038} {"train_loss": -5.648375034332275, "global_step": 43599, "epoch": 1038} {"train_loss": -5.494316577911377, "global_step": 43600, "epoch": 1038} {"train_loss": -5.734710693359375, "global_step": 43601, "epoch": 1038} {"train_loss": -5.8702192306518555, "global_step": 43602, "epoch": 1038} {"train_loss": -5.602710723876953, "global_step": 43603, "epoch": 1038} {"train_loss": -5.728517055511475, "global_step": 43604, "epoch": 1038} {"train_loss": -5.629922866821289, "global_step": 43605, "epoch": 1038} {"train_loss": -5.629655361175537, "global_step": 43606, "epoch": 1038} {"train_loss": -5.5910234451293945, "global_step": 43607, "epoch": 1038} {"train_loss": -5.540932655334473, "global_step": 43608, "epoch": 1038} {"train_loss": -5.743966102600098, "global_step": 43609, "epoch": 1038} {"train_loss": -5.5089616775512695, "global_step": 43610, "epoch": 1038} {"train_loss": -5.716970920562744, "global_step": 43611, "epoch": 1038} {"train_loss": -5.705012321472168, "global_step": 43612, "epoch": 1038} {"train_loss": -5.679487705230713, "global_step": 43613, "epoch": 1038} {"train_loss": -5.720553398132324, "global_step": 43614, "epoch": 1038} {"train_loss": -5.781357765197754, "global_step": 43615, "epoch": 1038} {"train_loss": -5.75948429107666, "global_step": 43616, "epoch": 1038} {"train_loss": -5.62967586517334, "global_step": 43617, "epoch": 1038} {"train_loss": -5.6441650390625, "global_step": 43618, "epoch": 1038} {"train_loss": -5.778732776641846, "global_step": 43619, "epoch": 1038} {"train_loss": -5.604059219360352, "global_step": 43620, "epoch": 1038} {"train_loss": -5.829326629638672, "global_step": 43621, "epoch": 1038} {"train_loss": -5.699318885803223, "global_step": 43622, "epoch": 1038} {"train_loss": -5.599917411804199, "global_step": 43623, "epoch": 1038} {"train_loss": -5.6268768310546875, "global_step": 43624, "epoch": 1038} {"train_loss": -5.754905700683594, "global_step": 43625, "epoch": 1038} {"train_loss": -5.639636039733887, "global_step": 43626, "epoch": 1038} {"train_loss": -5.636713981628418, "global_step": 43627, "epoch": 1038} {"train_loss": -5.651242256164551, "global_step": 43628, "epoch": 1038} {"train_loss": -5.652278900146484, "global_step": 43629, "epoch": 1038} {"train_loss": -5.813785552978516, "global_step": 43630, "epoch": 1038} {"train_loss": -5.527626037597656, "global_step": 43631, "epoch": 1038} {"train_loss": -5.557492256164551, "global_step": 43632, "epoch": 1038} {"train_loss": -5.670490741729736, "global_step": 43633, "epoch": 1038} {"train_loss": -5.483820915222168, "global_step": 43634, "epoch": 1038} {"train_loss": -5.691285133361816, "global_step": 43635, "epoch": 1038} {"train_loss": -5.653070449829102, "global_step": 43636, "epoch": 1038} {"train_loss": -5.659108025687082, "global_step": 43637, "epoch": 1038, "val_loss": 74041.125} {"train_loss": -5.7608561515808105, "global_step": 43638, "epoch": 1039} {"train_loss": -5.69946813583374, "global_step": 43639, "epoch": 1039} {"train_loss": -5.628211975097656, "global_step": 43640, "epoch": 1039} {"train_loss": -5.713152885437012, "global_step": 43641, "epoch": 1039} {"train_loss": -5.547794818878174, "global_step": 43642, "epoch": 1039} {"train_loss": -5.725902557373047, "global_step": 43643, "epoch": 1039} {"train_loss": -5.861992835998535, "global_step": 43644, "epoch": 1039} {"train_loss": -5.507074356079102, "global_step": 43645, "epoch": 1039} {"train_loss": -5.636669158935547, "global_step": 43646, "epoch": 1039} {"train_loss": -5.6687164306640625, "global_step": 43647, "epoch": 1039} {"train_loss": -5.631186485290527, "global_step": 43648, "epoch": 1039} {"train_loss": -5.6327362060546875, "global_step": 43649, "epoch": 1039} {"train_loss": -5.642230987548828, "global_step": 43650, "epoch": 1039} {"train_loss": -5.666508674621582, "global_step": 43651, "epoch": 1039} {"train_loss": -5.579869270324707, "global_step": 43652, "epoch": 1039} {"train_loss": -5.56401252746582, "global_step": 43653, "epoch": 1039} {"train_loss": -5.668671131134033, "global_step": 43654, "epoch": 1039} {"train_loss": -5.6642279624938965, "global_step": 43655, "epoch": 1039} {"train_loss": -5.765727519989014, "global_step": 43656, "epoch": 1039} {"train_loss": -5.683933734893799, "global_step": 43657, "epoch": 1039} {"train_loss": -5.626795768737793, "global_step": 43658, "epoch": 1039} {"train_loss": -5.686030864715576, "global_step": 43659, "epoch": 1039} {"train_loss": -5.640249252319336, "global_step": 43660, "epoch": 1039} {"train_loss": -5.5898518562316895, "global_step": 43661, "epoch": 1039} {"train_loss": -5.822331428527832, "global_step": 43662, "epoch": 1039} {"train_loss": -5.699348449707031, "global_step": 43663, "epoch": 1039} {"train_loss": -5.676478862762451, "global_step": 43664, "epoch": 1039} {"train_loss": -5.6794257164001465, "global_step": 43665, "epoch": 1039} {"train_loss": -5.7471923828125, "global_step": 43666, "epoch": 1039} {"train_loss": -5.601809501647949, "global_step": 43667, "epoch": 1039} {"train_loss": -5.61376428604126, "global_step": 43668, "epoch": 1039} {"train_loss": -5.655693054199219, "global_step": 43669, "epoch": 1039} {"train_loss": -5.766305923461914, "global_step": 43670, "epoch": 1039} {"train_loss": -5.652469635009766, "global_step": 43671, "epoch": 1039} {"train_loss": -5.59019660949707, "global_step": 43672, "epoch": 1039} {"train_loss": -5.730213642120361, "global_step": 43673, "epoch": 1039} {"train_loss": -5.629307270050049, "global_step": 43674, "epoch": 1039} {"train_loss": -5.620211601257324, "global_step": 43675, "epoch": 1039} {"train_loss": -5.6573920249938965, "global_step": 43676, "epoch": 1039} {"train_loss": -5.629924774169922, "global_step": 43677, "epoch": 1039} {"train_loss": -5.7929205894470215, "global_step": 43678, "epoch": 1039} {"train_loss": -5.666541837510609, "global_step": 43679, "epoch": 1039, "val_loss": 74033.609375} {"train_loss": -5.733731269836426, "global_step": 43680, "epoch": 1040} {"train_loss": -5.728167533874512, "global_step": 43681, "epoch": 1040} {"train_loss": -5.758845329284668, "global_step": 43682, "epoch": 1040} {"train_loss": -5.668603897094727, "global_step": 43683, "epoch": 1040} {"train_loss": -5.589641571044922, "global_step": 43684, "epoch": 1040} {"train_loss": -5.648855209350586, "global_step": 43685, "epoch": 1040} {"train_loss": -5.780827522277832, "global_step": 43686, "epoch": 1040} {"train_loss": -5.6532440185546875, "global_step": 43687, "epoch": 1040} {"train_loss": -5.7475128173828125, "global_step": 43688, "epoch": 1040} {"train_loss": -5.757810115814209, "global_step": 43689, "epoch": 1040} {"train_loss": -5.759535789489746, "global_step": 43690, "epoch": 1040} {"train_loss": -5.626618385314941, "global_step": 43691, "epoch": 1040} {"train_loss": -5.73255729675293, "global_step": 43692, "epoch": 1040} {"train_loss": -5.728031158447266, "global_step": 43693, "epoch": 1040} {"train_loss": -5.716235160827637, "global_step": 43694, "epoch": 1040} {"train_loss": -5.441060543060303, "global_step": 43695, "epoch": 1040} {"train_loss": -5.7371344566345215, "global_step": 43696, "epoch": 1040} {"train_loss": -5.619623184204102, "global_step": 43697, "epoch": 1040} {"train_loss": -5.642666816711426, "global_step": 43698, "epoch": 1040} {"train_loss": -5.638473987579346, "global_step": 43699, "epoch": 1040} {"train_loss": -5.6385297775268555, "global_step": 43700, "epoch": 1040} {"train_loss": -5.5561017990112305, "global_step": 43701, "epoch": 1040} {"train_loss": -5.636063575744629, "global_step": 43702, "epoch": 1040} {"train_loss": -5.610450744628906, "global_step": 43703, "epoch": 1040} {"train_loss": -5.601422309875488, "global_step": 43704, "epoch": 1040} {"train_loss": -5.5609211921691895, "global_step": 43705, "epoch": 1040} {"train_loss": -5.675073623657227, "global_step": 43706, "epoch": 1040} {"train_loss": -5.6346588134765625, "global_step": 43707, "epoch": 1040} {"train_loss": -5.587215900421143, "global_step": 43708, "epoch": 1040} {"train_loss": -5.776391983032227, "global_step": 43709, "epoch": 1040} {"train_loss": -5.696963310241699, "global_step": 43710, "epoch": 1040} {"train_loss": -5.609562873840332, "global_step": 43711, "epoch": 1040} {"train_loss": -5.699362754821777, "global_step": 43712, "epoch": 1040} {"train_loss": -5.710155487060547, "global_step": 43713, "epoch": 1040} {"train_loss": -5.719143867492676, "global_step": 43714, "epoch": 1040} {"train_loss": -5.640127658843994, "global_step": 43715, "epoch": 1040} {"train_loss": -5.735348701477051, "global_step": 43716, "epoch": 1040} {"train_loss": -5.623116493225098, "global_step": 43717, "epoch": 1040} {"train_loss": -5.732481956481934, "global_step": 43718, "epoch": 1040} {"train_loss": -5.695138931274414, "global_step": 43719, "epoch": 1040} {"train_loss": -5.708818435668945, "global_step": 43720, "epoch": 1040} {"train_loss": -5.674254020055135, "global_step": 43721, "epoch": 1040, "val_loss": 74348.859375} {"train_loss": -5.604856491088867, "global_step": 43722, "epoch": 1041} {"train_loss": -5.720535755157471, "global_step": 43723, "epoch": 1041} {"train_loss": -5.846521854400635, "global_step": 43724, "epoch": 1041} {"train_loss": -5.613944053649902, "global_step": 43725, "epoch": 1041} {"train_loss": -5.710236072540283, "global_step": 43726, "epoch": 1041} {"train_loss": -5.653900623321533, "global_step": 43727, "epoch": 1041} {"train_loss": -5.692272663116455, "global_step": 43728, "epoch": 1041} {"train_loss": -5.692079067230225, "global_step": 43729, "epoch": 1041} {"train_loss": -5.713634490966797, "global_step": 43730, "epoch": 1041} {"train_loss": -5.712980270385742, "global_step": 43731, "epoch": 1041} {"train_loss": -5.790444374084473, "global_step": 43732, "epoch": 1041} {"train_loss": -5.661290168762207, "global_step": 43733, "epoch": 1041} {"train_loss": -5.705663681030273, "global_step": 43734, "epoch": 1041} {"train_loss": -5.668575763702393, "global_step": 43735, "epoch": 1041} {"train_loss": -5.664358139038086, "global_step": 43736, "epoch": 1041} {"train_loss": -5.743175506591797, "global_step": 43737, "epoch": 1041} {"train_loss": -5.6639251708984375, "global_step": 43738, "epoch": 1041} {"train_loss": -5.516643524169922, "global_step": 43739, "epoch": 1041} {"train_loss": -5.769235134124756, "global_step": 43740, "epoch": 1041} {"train_loss": -5.549684047698975, "global_step": 43741, "epoch": 1041} {"train_loss": -5.6954240798950195, "global_step": 43742, "epoch": 1041} {"train_loss": -5.669301509857178, "global_step": 43743, "epoch": 1041} {"train_loss": -5.543519020080566, "global_step": 43744, "epoch": 1041} {"train_loss": -5.701556205749512, "global_step": 43745, "epoch": 1041} {"train_loss": -5.6784563064575195, "global_step": 43746, "epoch": 1041} {"train_loss": -5.649179935455322, "global_step": 43747, "epoch": 1041} {"train_loss": -5.6070556640625, "global_step": 43748, "epoch": 1041} {"train_loss": -5.5689778327941895, "global_step": 43749, "epoch": 1041} {"train_loss": -5.64210844039917, "global_step": 43750, "epoch": 1041} {"train_loss": -5.687132358551025, "global_step": 43751, "epoch": 1041} {"train_loss": -5.600258827209473, "global_step": 43752, "epoch": 1041} {"train_loss": -5.543563365936279, "global_step": 43753, "epoch": 1041} {"train_loss": -5.8097615242004395, "global_step": 43754, "epoch": 1041} {"train_loss": -5.702315330505371, "global_step": 43755, "epoch": 1041} {"train_loss": -5.65578556060791, "global_step": 43756, "epoch": 1041} {"train_loss": -5.714855194091797, "global_step": 43757, "epoch": 1041} {"train_loss": -5.761081695556641, "global_step": 43758, "epoch": 1041} {"train_loss": -5.557427883148193, "global_step": 43759, "epoch": 1041} {"train_loss": -5.662924766540527, "global_step": 43760, "epoch": 1041} {"train_loss": -5.642871856689453, "global_step": 43761, "epoch": 1041} {"train_loss": -5.798244476318359, "global_step": 43762, "epoch": 1041} {"train_loss": -5.672810849689302, "global_step": 43763, "epoch": 1041, "val_loss": 73978.875} {"train_loss": -5.81773042678833, "global_step": 43764, "epoch": 1042} {"train_loss": -5.666723251342773, "global_step": 43765, "epoch": 1042} {"train_loss": -5.6526689529418945, "global_step": 43766, "epoch": 1042} {"train_loss": -5.694620609283447, "global_step": 43767, "epoch": 1042} {"train_loss": -5.713561534881592, "global_step": 43768, "epoch": 1042} {"train_loss": -5.763181686401367, "global_step": 43769, "epoch": 1042} {"train_loss": -5.702530860900879, "global_step": 43770, "epoch": 1042} {"train_loss": -5.697403430938721, "global_step": 43771, "epoch": 1042} {"train_loss": -5.757391452789307, "global_step": 43772, "epoch": 1042} {"train_loss": -5.759703636169434, "global_step": 43773, "epoch": 1042} {"train_loss": -5.691416263580322, "global_step": 43774, "epoch": 1042} {"train_loss": -5.6975579261779785, "global_step": 43775, "epoch": 1042} {"train_loss": -5.695399284362793, "global_step": 43776, "epoch": 1042} {"train_loss": -5.584816932678223, "global_step": 43777, "epoch": 1042} {"train_loss": -5.687900066375732, "global_step": 43778, "epoch": 1042} {"train_loss": -5.816961765289307, "global_step": 43779, "epoch": 1042} {"train_loss": -5.671697616577148, "global_step": 43780, "epoch": 1042} {"train_loss": -5.800484657287598, "global_step": 43781, "epoch": 1042} {"train_loss": -5.780200481414795, "global_step": 43782, "epoch": 1042} {"train_loss": -5.708558082580566, "global_step": 43783, "epoch": 1042} {"train_loss": -5.643125534057617, "global_step": 43784, "epoch": 1042} {"train_loss": -5.697125434875488, "global_step": 43785, "epoch": 1042} {"train_loss": -5.619519233703613, "global_step": 43786, "epoch": 1042} {"train_loss": -5.70900821685791, "global_step": 43787, "epoch": 1042} {"train_loss": -5.832846164703369, "global_step": 43788, "epoch": 1042} {"train_loss": -5.716432571411133, "global_step": 43789, "epoch": 1042} {"train_loss": -5.673434257507324, "global_step": 43790, "epoch": 1042} {"train_loss": -5.597949981689453, "global_step": 43791, "epoch": 1042} {"train_loss": -5.619021415710449, "global_step": 43792, "epoch": 1042} {"train_loss": -5.523073673248291, "global_step": 43793, "epoch": 1042} {"train_loss": -5.708416938781738, "global_step": 43794, "epoch": 1042} {"train_loss": -5.740782737731934, "global_step": 43795, "epoch": 1042} {"train_loss": -5.743776321411133, "global_step": 43796, "epoch": 1042} {"train_loss": -5.676536560058594, "global_step": 43797, "epoch": 1042} {"train_loss": -5.706249713897705, "global_step": 43798, "epoch": 1042} {"train_loss": -5.580771446228027, "global_step": 43799, "epoch": 1042} {"train_loss": -5.668631553649902, "global_step": 43800, "epoch": 1042} {"train_loss": -5.694086074829102, "global_step": 43801, "epoch": 1042} {"train_loss": -5.634006500244141, "global_step": 43802, "epoch": 1042} {"train_loss": -5.552002429962158, "global_step": 43803, "epoch": 1042} {"train_loss": -5.74968957901001, "global_step": 43804, "epoch": 1042} {"train_loss": -5.695181483314151, "global_step": 43805, "epoch": 1042, "val_loss": 73684.359375} {"train_loss": -5.694938659667969, "global_step": 43806, "epoch": 1043} {"train_loss": -5.688170433044434, "global_step": 43807, "epoch": 1043} {"train_loss": -5.740667343139648, "global_step": 43808, "epoch": 1043} {"train_loss": -5.5709147453308105, "global_step": 43809, "epoch": 1043} {"train_loss": -5.7094926834106445, "global_step": 43810, "epoch": 1043} {"train_loss": -5.6817522048950195, "global_step": 43811, "epoch": 1043} {"train_loss": -5.6466755867004395, "global_step": 43812, "epoch": 1043} {"train_loss": -5.766227722167969, "global_step": 43813, "epoch": 1043} {"train_loss": -5.5849432945251465, "global_step": 43814, "epoch": 1043} {"train_loss": -5.600510597229004, "global_step": 43815, "epoch": 1043} {"train_loss": -5.735895156860352, "global_step": 43816, "epoch": 1043} {"train_loss": -5.514491081237793, "global_step": 43817, "epoch": 1043} {"train_loss": -5.71103572845459, "global_step": 43818, "epoch": 1043} {"train_loss": -5.48038387298584, "global_step": 43819, "epoch": 1043} {"train_loss": -5.601747512817383, "global_step": 43820, "epoch": 1043} {"train_loss": -5.659674644470215, "global_step": 43821, "epoch": 1043} {"train_loss": -5.620075225830078, "global_step": 43822, "epoch": 1043} {"train_loss": -5.847594261169434, "global_step": 43823, "epoch": 1043} {"train_loss": -5.624988555908203, "global_step": 43824, "epoch": 1043} {"train_loss": -5.756864547729492, "global_step": 43825, "epoch": 1043} {"train_loss": -5.578764915466309, "global_step": 43826, "epoch": 1043} {"train_loss": -5.809170722961426, "global_step": 43827, "epoch": 1043} {"train_loss": -5.635080337524414, "global_step": 43828, "epoch": 1043} {"train_loss": -5.690651893615723, "global_step": 43829, "epoch": 1043} {"train_loss": -5.5744829177856445, "global_step": 43830, "epoch": 1043} {"train_loss": -5.552027225494385, "global_step": 43831, "epoch": 1043} {"train_loss": -5.58514928817749, "global_step": 43832, "epoch": 1043} {"train_loss": -5.583514213562012, "global_step": 43833, "epoch": 1043} {"train_loss": -5.618208885192871, "global_step": 43834, "epoch": 1043} {"train_loss": -5.824516296386719, "global_step": 43835, "epoch": 1043} {"train_loss": -5.654184341430664, "global_step": 43836, "epoch": 1043} {"train_loss": -5.763728141784668, "global_step": 43837, "epoch": 1043} {"train_loss": -5.734593391418457, "global_step": 43838, "epoch": 1043} {"train_loss": -5.599518299102783, "global_step": 43839, "epoch": 1043} {"train_loss": -5.686485290527344, "global_step": 43840, "epoch": 1043} {"train_loss": -5.754714012145996, "global_step": 43841, "epoch": 1043} {"train_loss": -5.669463157653809, "global_step": 43842, "epoch": 1043} {"train_loss": -5.734856605529785, "global_step": 43843, "epoch": 1043} {"train_loss": -5.712680339813232, "global_step": 43844, "epoch": 1043} {"train_loss": -5.655664443969727, "global_step": 43845, "epoch": 1043} {"train_loss": -5.722878932952881, "global_step": 43846, "epoch": 1043} {"train_loss": -5.664873747598557, "global_step": 43847, "epoch": 1043, "val_loss": 74287.1953125} {"train_loss": -5.599441051483154, "global_step": 43848, "epoch": 1044} {"train_loss": -5.684475898742676, "global_step": 43849, "epoch": 1044} {"train_loss": -5.653305530548096, "global_step": 43850, "epoch": 1044} {"train_loss": -5.723230361938477, "global_step": 43851, "epoch": 1044} {"train_loss": -5.676484107971191, "global_step": 43852, "epoch": 1044} {"train_loss": -5.779994010925293, "global_step": 43853, "epoch": 1044} {"train_loss": -5.667572975158691, "global_step": 43854, "epoch": 1044} {"train_loss": -5.731132984161377, "global_step": 43855, "epoch": 1044} {"train_loss": -5.661716461181641, "global_step": 43856, "epoch": 1044} {"train_loss": -5.580357074737549, "global_step": 43857, "epoch": 1044} {"train_loss": -5.738272666931152, "global_step": 43858, "epoch": 1044} {"train_loss": -5.731770038604736, "global_step": 43859, "epoch": 1044} {"train_loss": -5.8141374588012695, "global_step": 43860, "epoch": 1044} {"train_loss": -5.5849833488464355, "global_step": 43861, "epoch": 1044} {"train_loss": -5.628692626953125, "global_step": 43862, "epoch": 1044} {"train_loss": -5.707486629486084, "global_step": 43863, "epoch": 1044} {"train_loss": -5.551258087158203, "global_step": 43864, "epoch": 1044} {"train_loss": -5.665988922119141, "global_step": 43865, "epoch": 1044} {"train_loss": -5.534534454345703, "global_step": 43866, "epoch": 1044} {"train_loss": -5.531116962432861, "global_step": 43867, "epoch": 1044} {"train_loss": -5.688259124755859, "global_step": 43868, "epoch": 1044} {"train_loss": -5.6761474609375, "global_step": 43869, "epoch": 1044} {"train_loss": -5.536030292510986, "global_step": 43870, "epoch": 1044} {"train_loss": -5.585293769836426, "global_step": 43871, "epoch": 1044} {"train_loss": -5.706964015960693, "global_step": 43872, "epoch": 1044} {"train_loss": -5.669564247131348, "global_step": 43873, "epoch": 1044} {"train_loss": -5.590480804443359, "global_step": 43874, "epoch": 1044} {"train_loss": -5.588834285736084, "global_step": 43875, "epoch": 1044} {"train_loss": -5.577631950378418, "global_step": 43876, "epoch": 1044} {"train_loss": -5.7846832275390625, "global_step": 43877, "epoch": 1044} {"train_loss": -5.68782901763916, "global_step": 43878, "epoch": 1044} {"train_loss": -5.628103256225586, "global_step": 43879, "epoch": 1044} {"train_loss": -5.7506914138793945, "global_step": 43880, "epoch": 1044} {"train_loss": -5.665859222412109, "global_step": 43881, "epoch": 1044} {"train_loss": -5.675670623779297, "global_step": 43882, "epoch": 1044} {"train_loss": -5.73237419128418, "global_step": 43883, "epoch": 1044} {"train_loss": -5.6338725090026855, "global_step": 43884, "epoch": 1044} {"train_loss": -5.630611419677734, "global_step": 43885, "epoch": 1044} {"train_loss": -5.641036033630371, "global_step": 43886, "epoch": 1044} {"train_loss": -5.7642998695373535, "global_step": 43887, "epoch": 1044} {"train_loss": -5.768263816833496, "global_step": 43888, "epoch": 1044} {"train_loss": -5.665262154170445, "global_step": 43889, "epoch": 1044, "val_loss": 74014.59375} {"train_loss": -5.719515323638916, "global_step": 43890, "epoch": 1045} {"train_loss": -5.7667131423950195, "global_step": 43891, "epoch": 1045} {"train_loss": -5.809161186218262, "global_step": 43892, "epoch": 1045} {"train_loss": -5.664769172668457, "global_step": 43893, "epoch": 1045} {"train_loss": -5.7679595947265625, "global_step": 43894, "epoch": 1045} {"train_loss": -5.677586078643799, "global_step": 43895, "epoch": 1045} {"train_loss": -5.769700527191162, "global_step": 43896, "epoch": 1045} {"train_loss": -5.691366672515869, "global_step": 43897, "epoch": 1045} {"train_loss": -5.7272748947143555, "global_step": 43898, "epoch": 1045} {"train_loss": -5.660285949707031, "global_step": 43899, "epoch": 1045} {"train_loss": -5.738254547119141, "global_step": 43900, "epoch": 1045} {"train_loss": -5.7171525955200195, "global_step": 43901, "epoch": 1045} {"train_loss": -5.537802696228027, "global_step": 43902, "epoch": 1045} {"train_loss": -5.70754861831665, "global_step": 43903, "epoch": 1045} {"train_loss": -5.688731670379639, "global_step": 43904, "epoch": 1045} {"train_loss": -5.625850200653076, "global_step": 43905, "epoch": 1045} {"train_loss": -5.633737564086914, "global_step": 43906, "epoch": 1045} {"train_loss": -5.671382904052734, "global_step": 43907, "epoch": 1045} {"train_loss": -5.635344982147217, "global_step": 43908, "epoch": 1045} {"train_loss": -5.843729496002197, "global_step": 43909, "epoch": 1045} {"train_loss": -5.621582984924316, "global_step": 43910, "epoch": 1045} {"train_loss": -5.644238471984863, "global_step": 43911, "epoch": 1045} {"train_loss": -5.5830583572387695, "global_step": 43912, "epoch": 1045} {"train_loss": -5.760444641113281, "global_step": 43913, "epoch": 1045} {"train_loss": -5.869727611541748, "global_step": 43914, "epoch": 1045} {"train_loss": -5.469758987426758, "global_step": 43915, "epoch": 1045} {"train_loss": -5.791319847106934, "global_step": 43916, "epoch": 1045} {"train_loss": -5.682611465454102, "global_step": 43917, "epoch": 1045} {"train_loss": -5.4867329597473145, "global_step": 43918, "epoch": 1045} {"train_loss": -5.596378326416016, "global_step": 43919, "epoch": 1045} {"train_loss": -5.648189544677734, "global_step": 43920, "epoch": 1045} {"train_loss": -5.65402889251709, "global_step": 43921, "epoch": 1045} {"train_loss": -5.610993385314941, "global_step": 43922, "epoch": 1045} {"train_loss": -5.598031044006348, "global_step": 43923, "epoch": 1045} {"train_loss": -5.6363935470581055, "global_step": 43924, "epoch": 1045} {"train_loss": -5.548127174377441, "global_step": 43925, "epoch": 1045} {"train_loss": -5.6611328125, "global_step": 43926, "epoch": 1045} {"train_loss": -5.555802345275879, "global_step": 43927, "epoch": 1045} {"train_loss": -5.667270660400391, "global_step": 43928, "epoch": 1045} {"train_loss": -5.416537761688232, "global_step": 43929, "epoch": 1045} {"train_loss": -5.732621192932129, "global_step": 43930, "epoch": 1045} {"train_loss": -5.666322151819865, "global_step": 43931, "epoch": 1045, "val_loss": 74037.21875} {"train_loss": -5.7123260498046875, "global_step": 43932, "epoch": 1046} {"train_loss": -5.742344856262207, "global_step": 43933, "epoch": 1046} {"train_loss": -5.664665222167969, "global_step": 43934, "epoch": 1046} {"train_loss": -5.655606269836426, "global_step": 43935, "epoch": 1046} {"train_loss": -5.47206974029541, "global_step": 43936, "epoch": 1046} {"train_loss": -5.680083274841309, "global_step": 43937, "epoch": 1046} {"train_loss": -5.742156982421875, "global_step": 43938, "epoch": 1046} {"train_loss": -5.704216957092285, "global_step": 43939, "epoch": 1046} {"train_loss": -5.67786979675293, "global_step": 43940, "epoch": 1046} {"train_loss": -5.725872993469238, "global_step": 43941, "epoch": 1046} {"train_loss": -5.728452682495117, "global_step": 43942, "epoch": 1046} {"train_loss": -5.676210403442383, "global_step": 43943, "epoch": 1046} {"train_loss": -5.7465434074401855, "global_step": 43944, "epoch": 1046} {"train_loss": -5.716867446899414, "global_step": 43945, "epoch": 1046} {"train_loss": -5.793338775634766, "global_step": 43946, "epoch": 1046} {"train_loss": -5.74691915512085, "global_step": 43947, "epoch": 1046} {"train_loss": -5.770931720733643, "global_step": 43948, "epoch": 1046} {"train_loss": -5.763037204742432, "global_step": 43949, "epoch": 1046} {"train_loss": -5.581979274749756, "global_step": 43950, "epoch": 1046} {"train_loss": -5.6536712646484375, "global_step": 43951, "epoch": 1046} {"train_loss": -5.7980756759643555, "global_step": 43952, "epoch": 1046} {"train_loss": -5.568276882171631, "global_step": 43953, "epoch": 1046} {"train_loss": -5.589138031005859, "global_step": 43954, "epoch": 1046} {"train_loss": -5.612550735473633, "global_step": 43955, "epoch": 1046} {"train_loss": -5.64622163772583, "global_step": 43956, "epoch": 1046} {"train_loss": -5.745997428894043, "global_step": 43957, "epoch": 1046} {"train_loss": -5.711999893188477, "global_step": 43958, "epoch": 1046} {"train_loss": -5.637856483459473, "global_step": 43959, "epoch": 1046} {"train_loss": -5.729036331176758, "global_step": 43960, "epoch": 1046} {"train_loss": -5.644335746765137, "global_step": 43961, "epoch": 1046} {"train_loss": -5.653676509857178, "global_step": 43962, "epoch": 1046} {"train_loss": -5.725315093994141, "global_step": 43963, "epoch": 1046} {"train_loss": -5.700780391693115, "global_step": 43964, "epoch": 1046} {"train_loss": -5.591875076293945, "global_step": 43965, "epoch": 1046} {"train_loss": -5.5841264724731445, "global_step": 43966, "epoch": 1046} {"train_loss": -5.786443710327148, "global_step": 43967, "epoch": 1046} {"train_loss": -5.511298656463623, "global_step": 43968, "epoch": 1046} {"train_loss": -5.7300124168396, "global_step": 43969, "epoch": 1046} {"train_loss": -5.4974212646484375, "global_step": 43970, "epoch": 1046} {"train_loss": -5.645357608795166, "global_step": 43971, "epoch": 1046} {"train_loss": -5.485661029815674, "global_step": 43972, "epoch": 1046} {"train_loss": -5.6694894064040415, "global_step": 43973, "epoch": 1046, "val_loss": 74335.265625} {"train_loss": -5.80696964263916, "global_step": 43974, "epoch": 1047} {"train_loss": -5.677618980407715, "global_step": 43975, "epoch": 1047} {"train_loss": -5.608654022216797, "global_step": 43976, "epoch": 1047} {"train_loss": -5.776424407958984, "global_step": 43977, "epoch": 1047} {"train_loss": -5.609883785247803, "global_step": 43978, "epoch": 1047} {"train_loss": -5.664615154266357, "global_step": 43979, "epoch": 1047} {"train_loss": -5.696962833404541, "global_step": 43980, "epoch": 1047} {"train_loss": -5.688055992126465, "global_step": 43981, "epoch": 1047} {"train_loss": -5.630897521972656, "global_step": 43982, "epoch": 1047} {"train_loss": -5.741395950317383, "global_step": 43983, "epoch": 1047} {"train_loss": -5.697204113006592, "global_step": 43984, "epoch": 1047} {"train_loss": -5.66278076171875, "global_step": 43985, "epoch": 1047} {"train_loss": -5.696240425109863, "global_step": 43986, "epoch": 1047} {"train_loss": -5.617637634277344, "global_step": 43987, "epoch": 1047} {"train_loss": -5.703505516052246, "global_step": 43988, "epoch": 1047} {"train_loss": -5.739817142486572, "global_step": 43989, "epoch": 1047} {"train_loss": -5.703861236572266, "global_step": 43990, "epoch": 1047} {"train_loss": -5.7704668045043945, "global_step": 43991, "epoch": 1047} {"train_loss": -5.6948747634887695, "global_step": 43992, "epoch": 1047} {"train_loss": -5.778042793273926, "global_step": 43993, "epoch": 1047} {"train_loss": -5.827695846557617, "global_step": 43994, "epoch": 1047} {"train_loss": -5.770890235900879, "global_step": 43995, "epoch": 1047} {"train_loss": -5.571115970611572, "global_step": 43996, "epoch": 1047} {"train_loss": -5.685811996459961, "global_step": 43997, "epoch": 1047} {"train_loss": -5.566893577575684, "global_step": 43998, "epoch": 1047} {"train_loss": -5.686452865600586, "global_step": 43999, "epoch": 1047} {"train_loss": -5.659938812255859, "global_step": 44000, "epoch": 1047} {"train_loss": -5.656393527984619, "global_step": 44001, "epoch": 1047} {"train_loss": -5.660778999328613, "global_step": 44002, "epoch": 1047} {"train_loss": -5.798650741577148, "global_step": 44003, "epoch": 1047} {"train_loss": -5.616127967834473, "global_step": 44004, "epoch": 1047} {"train_loss": -5.66090726852417, "global_step": 44005, "epoch": 1047} {"train_loss": -5.704179763793945, "global_step": 44006, "epoch": 1047} {"train_loss": -5.726914405822754, "global_step": 44007, "epoch": 1047} {"train_loss": -5.704403877258301, "global_step": 44008, "epoch": 1047} {"train_loss": -5.696322441101074, "global_step": 44009, "epoch": 1047} {"train_loss": -5.787161827087402, "global_step": 44010, "epoch": 1047} {"train_loss": -5.712344169616699, "global_step": 44011, "epoch": 1047} {"train_loss": -5.696745872497559, "global_step": 44012, "epoch": 1047} {"train_loss": -5.68209981918335, "global_step": 44013, "epoch": 1047} {"train_loss": -5.670029640197754, "global_step": 44014, "epoch": 1047} {"train_loss": -5.693444603965396, "global_step": 44015, "epoch": 1047, "val_loss": 74196.0} {"train_loss": -5.671184539794922, "global_step": 44016, "epoch": 1048} {"train_loss": -5.683935165405273, "global_step": 44017, "epoch": 1048} {"train_loss": -5.730990409851074, "global_step": 44018, "epoch": 1048} {"train_loss": -5.658857345581055, "global_step": 44019, "epoch": 1048} {"train_loss": -5.811496734619141, "global_step": 44020, "epoch": 1048} {"train_loss": -5.7490105628967285, "global_step": 44021, "epoch": 1048} {"train_loss": -5.619158744812012, "global_step": 44022, "epoch": 1048} {"train_loss": -5.84151554107666, "global_step": 44023, "epoch": 1048} {"train_loss": -5.711580276489258, "global_step": 44024, "epoch": 1048} {"train_loss": -5.703298568725586, "global_step": 44025, "epoch": 1048} {"train_loss": -5.766034126281738, "global_step": 44026, "epoch": 1048} {"train_loss": -5.702556133270264, "global_step": 44027, "epoch": 1048} {"train_loss": -5.726276874542236, "global_step": 44028, "epoch": 1048} {"train_loss": -5.697511672973633, "global_step": 44029, "epoch": 1048} {"train_loss": -5.780117988586426, "global_step": 44030, "epoch": 1048} {"train_loss": -5.610948085784912, "global_step": 44031, "epoch": 1048} {"train_loss": -5.688711166381836, "global_step": 44032, "epoch": 1048} {"train_loss": -5.712761878967285, "global_step": 44033, "epoch": 1048} {"train_loss": -5.718555450439453, "global_step": 44034, "epoch": 1048} {"train_loss": -5.77495002746582, "global_step": 44035, "epoch": 1048} {"train_loss": -5.81855583190918, "global_step": 44036, "epoch": 1048} {"train_loss": -5.649514198303223, "global_step": 44037, "epoch": 1048} {"train_loss": -5.723956108093262, "global_step": 44038, "epoch": 1048} {"train_loss": -5.658391952514648, "global_step": 44039, "epoch": 1048} {"train_loss": -5.639133453369141, "global_step": 44040, "epoch": 1048} {"train_loss": -5.732997894287109, "global_step": 44041, "epoch": 1048} {"train_loss": -5.710025787353516, "global_step": 44042, "epoch": 1048} {"train_loss": -5.733531951904297, "global_step": 44043, "epoch": 1048} {"train_loss": -5.79506778717041, "global_step": 44044, "epoch": 1048} {"train_loss": -5.611037254333496, "global_step": 44045, "epoch": 1048} {"train_loss": -5.715648651123047, "global_step": 44046, "epoch": 1048} {"train_loss": -5.624489784240723, "global_step": 44047, "epoch": 1048} {"train_loss": -5.695992469787598, "global_step": 44048, "epoch": 1048} {"train_loss": -5.650014877319336, "global_step": 44049, "epoch": 1048} {"train_loss": -5.612003803253174, "global_step": 44050, "epoch": 1048} {"train_loss": -5.735101699829102, "global_step": 44051, "epoch": 1048} {"train_loss": -5.561530113220215, "global_step": 44052, "epoch": 1048} {"train_loss": -5.70237398147583, "global_step": 44053, "epoch": 1048} {"train_loss": -5.569276809692383, "global_step": 44054, "epoch": 1048} {"train_loss": -5.696949005126953, "global_step": 44055, "epoch": 1048} {"train_loss": -5.61956787109375, "global_step": 44056, "epoch": 1048} {"train_loss": -5.696534440630958, "global_step": 44057, "epoch": 1048, "val_loss": 74072.890625} {"train_loss": -5.764159202575684, "global_step": 44058, "epoch": 1049} {"train_loss": -5.743606090545654, "global_step": 44059, "epoch": 1049} {"train_loss": -5.6568427085876465, "global_step": 44060, "epoch": 1049} {"train_loss": -5.546914100646973, "global_step": 44061, "epoch": 1049} {"train_loss": -5.773899555206299, "global_step": 44062, "epoch": 1049} {"train_loss": -5.643156051635742, "global_step": 44063, "epoch": 1049} {"train_loss": -5.696469306945801, "global_step": 44064, "epoch": 1049} {"train_loss": -5.745841026306152, "global_step": 44065, "epoch": 1049} {"train_loss": -5.742903709411621, "global_step": 44066, "epoch": 1049} {"train_loss": -5.635383129119873, "global_step": 44067, "epoch": 1049} {"train_loss": -5.663335800170898, "global_step": 44068, "epoch": 1049} {"train_loss": -5.7533721923828125, "global_step": 44069, "epoch": 1049} {"train_loss": -5.622474670410156, "global_step": 44070, "epoch": 1049} {"train_loss": -5.6892266273498535, "global_step": 44071, "epoch": 1049} {"train_loss": -5.712679862976074, "global_step": 44072, "epoch": 1049} {"train_loss": -5.704489707946777, "global_step": 44073, "epoch": 1049} {"train_loss": -5.63889217376709, "global_step": 44074, "epoch": 1049} {"train_loss": -5.655875205993652, "global_step": 44075, "epoch": 1049} {"train_loss": -5.767189025878906, "global_step": 44076, "epoch": 1049} {"train_loss": -5.631527900695801, "global_step": 44077, "epoch": 1049} {"train_loss": -5.824920654296875, "global_step": 44078, "epoch": 1049} {"train_loss": -5.654733657836914, "global_step": 44079, "epoch": 1049} {"train_loss": -5.681545257568359, "global_step": 44080, "epoch": 1049} {"train_loss": -5.796342849731445, "global_step": 44081, "epoch": 1049} {"train_loss": -5.689953327178955, "global_step": 44082, "epoch": 1049} {"train_loss": -5.6665215492248535, "global_step": 44083, "epoch": 1049} {"train_loss": -5.676979064941406, "global_step": 44084, "epoch": 1049} {"train_loss": -5.846595764160156, "global_step": 44085, "epoch": 1049} {"train_loss": -5.697768211364746, "global_step": 44086, "epoch": 1049} {"train_loss": -5.7501020431518555, "global_step": 44087, "epoch": 1049} {"train_loss": -5.785799026489258, "global_step": 44088, "epoch": 1049} {"train_loss": -5.7244696617126465, "global_step": 44089, "epoch": 1049} {"train_loss": -5.746159553527832, "global_step": 44090, "epoch": 1049} {"train_loss": -5.677444934844971, "global_step": 44091, "epoch": 1049} {"train_loss": -5.660296440124512, "global_step": 44092, "epoch": 1049} {"train_loss": -5.669747352600098, "global_step": 44093, "epoch": 1049} {"train_loss": -5.69480562210083, "global_step": 44094, "epoch": 1049} {"train_loss": -5.72310733795166, "global_step": 44095, "epoch": 1049} {"train_loss": -5.644298553466797, "global_step": 44096, "epoch": 1049} {"train_loss": -5.687636375427246, "global_step": 44097, "epoch": 1049} {"train_loss": -5.788793563842773, "global_step": 44098, "epoch": 1049} {"train_loss": -5.706439290727888, "global_step": 44099, "epoch": 1049, "val_loss": 74382.78125} {"train_loss": -5.748184680938721, "global_step": 44100, "epoch": 1050} {"train_loss": -5.699306488037109, "global_step": 44101, "epoch": 1050} {"train_loss": -5.684510707855225, "global_step": 44102, "epoch": 1050} {"train_loss": -5.675971984863281, "global_step": 44103, "epoch": 1050} {"train_loss": -5.676796913146973, "global_step": 44104, "epoch": 1050} {"train_loss": -5.634097099304199, "global_step": 44105, "epoch": 1050} {"train_loss": -5.716374397277832, "global_step": 44106, "epoch": 1050} {"train_loss": -5.791894435882568, "global_step": 44107, "epoch": 1050} {"train_loss": -5.779609680175781, "global_step": 44108, "epoch": 1050} {"train_loss": -5.741899490356445, "global_step": 44109, "epoch": 1050} {"train_loss": -5.532272815704346, "global_step": 44110, "epoch": 1050} {"train_loss": -5.569738388061523, "global_step": 44111, "epoch": 1050} {"train_loss": -5.644375801086426, "global_step": 44112, "epoch": 1050} {"train_loss": -5.6809468269348145, "global_step": 44113, "epoch": 1050} {"train_loss": -5.777832984924316, "global_step": 44114, "epoch": 1050} {"train_loss": -5.696986198425293, "global_step": 44115, "epoch": 1050} {"train_loss": -5.7079362869262695, "global_step": 44116, "epoch": 1050} {"train_loss": -5.805934906005859, "global_step": 44117, "epoch": 1050} {"train_loss": -5.741316795349121, "global_step": 44118, "epoch": 1050} {"train_loss": -5.604120254516602, "global_step": 44119, "epoch": 1050} {"train_loss": -5.714044570922852, "global_step": 44120, "epoch": 1050} {"train_loss": -5.814323425292969, "global_step": 44121, "epoch": 1050} {"train_loss": -5.692938804626465, "global_step": 44122, "epoch": 1050} {"train_loss": -5.735540866851807, "global_step": 44123, "epoch": 1050} {"train_loss": -5.750754356384277, "global_step": 44124, "epoch": 1050} {"train_loss": -5.758453369140625, "global_step": 44125, "epoch": 1050} {"train_loss": -5.6065216064453125, "global_step": 44126, "epoch": 1050} {"train_loss": -5.6634063720703125, "global_step": 44127, "epoch": 1050} {"train_loss": -5.533469200134277, "global_step": 44128, "epoch": 1050} {"train_loss": -5.703571319580078, "global_step": 44129, "epoch": 1050} {"train_loss": -5.740382194519043, "global_step": 44130, "epoch": 1050} {"train_loss": -5.585110664367676, "global_step": 44131, "epoch": 1050} {"train_loss": -5.717028617858887, "global_step": 44132, "epoch": 1050} {"train_loss": -5.584479808807373, "global_step": 44133, "epoch": 1050} {"train_loss": -5.699207782745361, "global_step": 44134, "epoch": 1050} {"train_loss": -5.709555625915527, "global_step": 44135, "epoch": 1050} {"train_loss": -5.650260925292969, "global_step": 44136, "epoch": 1050} {"train_loss": -5.82554817199707, "global_step": 44137, "epoch": 1050} {"train_loss": -5.686541557312012, "global_step": 44138, "epoch": 1050} {"train_loss": -5.679662227630615, "global_step": 44139, "epoch": 1050} {"train_loss": -5.662870407104492, "global_step": 44140, "epoch": 1050} {"train_loss": -5.691040788378034, "global_step": 44141, "epoch": 1050, "train/sim_max_reward_0": 0.5731910840813028, "train/sim_max_reward_1": 0.7577223536520278, "train/sim_max_reward_2": 0.4919324153303401, "train/sim_max_reward_3": 0.16525512355222613, "train/sim_max_reward_4": 0.3476483908979126, "train/sim_max_reward_5": 0.7078780350539081, "test/sim_max_reward_4500000": 0.33500304411042403, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8097501329476225, "test/sim_max_reward_4500003": 0.9332901223238123, "test/sim_max_reward_4500004": 0.09703926571523132, "test/sim_max_reward_4500005": 0.7016293250210237, "test/sim_max_reward_4500006": 0.8381198194550046, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.04861890432239735, "test/sim_max_reward_4500009": 0.3416585702147566, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.8694126716550628, "test/sim_max_reward_4500012": 0.9514011678894468, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.8714413226892384, "test/sim_max_reward_4500015": 0.8427301323928502, "test/sim_max_reward_4500016": 0.01530448240335299, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.004275406616992941, "test/sim_max_reward_4500019": 0.8144545211290392, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.6947014062602808, "test/sim_max_reward_4500022": 0.490194204803315, "test/sim_max_reward_4500023": 0.8874534613827911, "test/sim_max_reward_4500024": 0.7239035351129955, "test/sim_max_reward_4500025": 0.5360672186452299, "test/sim_max_reward_4500026": 0.14413689557340115, "test/sim_max_reward_4500027": 0.798057191940499, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.05008697635837085, "test/sim_max_reward_4500030": 0.26528773590532234, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.16238457252404806, "test/sim_max_reward_4500034": 0.6076531031079494, "test/sim_max_reward_4500035": 0.707972631713406, "test/sim_max_reward_4500036": 0.38220415818725056, "test/sim_max_reward_4500037": 0.4796949129479504, "test/sim_max_reward_4500038": 0.7338151711070293, "test/sim_max_reward_4500039": 0.7308572018125346, "test/sim_max_reward_4500040": 0.8823704233830922, "test/sim_max_reward_4500041": 0.36653264283939185, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.29456922788809464, "test/sim_max_reward_4500045": 0.8740326108061104, "test/sim_max_reward_4500046": 0.6642871111139504, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5072712337612862, "test/mean_score": 0.4041503576266837, "val_loss": 74471.8515625} {"train_loss": -5.596034049987793, "global_step": 44142, "epoch": 1051} {"train_loss": -5.766383171081543, "global_step": 44143, "epoch": 1051} {"train_loss": -5.670815467834473, "global_step": 44144, "epoch": 1051} {"train_loss": -5.698067665100098, "global_step": 44145, "epoch": 1051} {"train_loss": -5.6570587158203125, "global_step": 44146, "epoch": 1051} {"train_loss": -5.812762260437012, "global_step": 44147, "epoch": 1051} {"train_loss": -5.64067268371582, "global_step": 44148, "epoch": 1051} {"train_loss": -5.667071342468262, "global_step": 44149, "epoch": 1051} {"train_loss": -5.817815780639648, "global_step": 44150, "epoch": 1051} {"train_loss": -5.650629997253418, "global_step": 44151, "epoch": 1051} {"train_loss": -5.659638404846191, "global_step": 44152, "epoch": 1051} {"train_loss": -5.804405212402344, "global_step": 44153, "epoch": 1051} {"train_loss": -5.5460100173950195, "global_step": 44154, "epoch": 1051} {"train_loss": -5.65841007232666, "global_step": 44155, "epoch": 1051} {"train_loss": -5.498959064483643, "global_step": 44156, "epoch": 1051} {"train_loss": -5.618525505065918, "global_step": 44157, "epoch": 1051} {"train_loss": -5.730261325836182, "global_step": 44158, "epoch": 1051} {"train_loss": -5.708755016326904, "global_step": 44159, "epoch": 1051} {"train_loss": -5.615151882171631, "global_step": 44160, "epoch": 1051} {"train_loss": -5.666059494018555, "global_step": 44161, "epoch": 1051} {"train_loss": -5.665836811065674, "global_step": 44162, "epoch": 1051} {"train_loss": -5.679189682006836, "global_step": 44163, "epoch": 1051} {"train_loss": -5.691927909851074, "global_step": 44164, "epoch": 1051} {"train_loss": -5.696088790893555, "global_step": 44165, "epoch": 1051} {"train_loss": -5.725575923919678, "global_step": 44166, "epoch": 1051} {"train_loss": -5.6023454666137695, "global_step": 44167, "epoch": 1051} {"train_loss": -5.7166547775268555, "global_step": 44168, "epoch": 1051} {"train_loss": -5.723094940185547, "global_step": 44169, "epoch": 1051} {"train_loss": -5.707801818847656, "global_step": 44170, "epoch": 1051} {"train_loss": -5.745597839355469, "global_step": 44171, "epoch": 1051} {"train_loss": -5.754322052001953, "global_step": 44172, "epoch": 1051} {"train_loss": -5.817503452301025, "global_step": 44173, "epoch": 1051} {"train_loss": -5.695696830749512, "global_step": 44174, "epoch": 1051} {"train_loss": -5.69630241394043, "global_step": 44175, "epoch": 1051} {"train_loss": -5.711599349975586, "global_step": 44176, "epoch": 1051} {"train_loss": -5.591292381286621, "global_step": 44177, "epoch": 1051} {"train_loss": -5.578891754150391, "global_step": 44178, "epoch": 1051} {"train_loss": -5.683813571929932, "global_step": 44179, "epoch": 1051} {"train_loss": -5.709407329559326, "global_step": 44180, "epoch": 1051} {"train_loss": -5.705227851867676, "global_step": 44181, "epoch": 1051} {"train_loss": -5.628660202026367, "global_step": 44182, "epoch": 1051} {"train_loss": -5.681562537238712, "global_step": 44183, "epoch": 1051, "val_loss": 74824.421875} {"train_loss": -5.541576862335205, "global_step": 44184, "epoch": 1052} {"train_loss": -5.7166242599487305, "global_step": 44185, "epoch": 1052} {"train_loss": -5.644338607788086, "global_step": 44186, "epoch": 1052} {"train_loss": -5.678938865661621, "global_step": 44187, "epoch": 1052} {"train_loss": -5.703941345214844, "global_step": 44188, "epoch": 1052} {"train_loss": -5.7424635887146, "global_step": 44189, "epoch": 1052} {"train_loss": -5.638628959655762, "global_step": 44190, "epoch": 1052} {"train_loss": -5.6975626945495605, "global_step": 44191, "epoch": 1052} {"train_loss": -5.825194358825684, "global_step": 44192, "epoch": 1052} {"train_loss": -5.74009895324707, "global_step": 44193, "epoch": 1052} {"train_loss": -5.702813625335693, "global_step": 44194, "epoch": 1052} {"train_loss": -5.785299301147461, "global_step": 44195, "epoch": 1052} {"train_loss": -5.736934185028076, "global_step": 44196, "epoch": 1052} {"train_loss": -5.69049596786499, "global_step": 44197, "epoch": 1052} {"train_loss": -5.708653450012207, "global_step": 44198, "epoch": 1052} {"train_loss": -5.589393615722656, "global_step": 44199, "epoch": 1052} {"train_loss": -5.658779144287109, "global_step": 44200, "epoch": 1052} {"train_loss": -5.764154434204102, "global_step": 44201, "epoch": 1052} {"train_loss": -5.575561046600342, "global_step": 44202, "epoch": 1052} {"train_loss": -5.7214555740356445, "global_step": 44203, "epoch": 1052} {"train_loss": -5.556055545806885, "global_step": 44204, "epoch": 1052} {"train_loss": -5.658137798309326, "global_step": 44205, "epoch": 1052} {"train_loss": -5.813054084777832, "global_step": 44206, "epoch": 1052} {"train_loss": -5.723729610443115, "global_step": 44207, "epoch": 1052} {"train_loss": -5.614018440246582, "global_step": 44208, "epoch": 1052} {"train_loss": -5.6554155349731445, "global_step": 44209, "epoch": 1052} {"train_loss": -5.677918910980225, "global_step": 44210, "epoch": 1052} {"train_loss": -5.832631587982178, "global_step": 44211, "epoch": 1052} {"train_loss": -5.667068958282471, "global_step": 44212, "epoch": 1052} {"train_loss": -5.708612442016602, "global_step": 44213, "epoch": 1052} {"train_loss": -5.741894721984863, "global_step": 44214, "epoch": 1052} {"train_loss": -5.608985900878906, "global_step": 44215, "epoch": 1052} {"train_loss": -5.7163543701171875, "global_step": 44216, "epoch": 1052} {"train_loss": -5.743908882141113, "global_step": 44217, "epoch": 1052} {"train_loss": -5.519623756408691, "global_step": 44218, "epoch": 1052} {"train_loss": -5.7143330574035645, "global_step": 44219, "epoch": 1052} {"train_loss": -5.755009174346924, "global_step": 44220, "epoch": 1052} {"train_loss": -5.67685604095459, "global_step": 44221, "epoch": 1052} {"train_loss": -5.52590274810791, "global_step": 44222, "epoch": 1052} {"train_loss": -5.70938777923584, "global_step": 44223, "epoch": 1052} {"train_loss": -5.75282096862793, "global_step": 44224, "epoch": 1052} {"train_loss": -5.689564761661348, "global_step": 44225, "epoch": 1052, "val_loss": 73976.171875} {"train_loss": -5.653850078582764, "global_step": 44226, "epoch": 1053} {"train_loss": -5.609501838684082, "global_step": 44227, "epoch": 1053} {"train_loss": -5.726998329162598, "global_step": 44228, "epoch": 1053} {"train_loss": -5.6646528244018555, "global_step": 44229, "epoch": 1053} {"train_loss": -5.589856147766113, "global_step": 44230, "epoch": 1053} {"train_loss": -5.687727928161621, "global_step": 44231, "epoch": 1053} {"train_loss": -5.669644355773926, "global_step": 44232, "epoch": 1053} {"train_loss": -5.665301322937012, "global_step": 44233, "epoch": 1053} {"train_loss": -5.7899041175842285, "global_step": 44234, "epoch": 1053} {"train_loss": -5.706822395324707, "global_step": 44235, "epoch": 1053} {"train_loss": -5.8802080154418945, "global_step": 44236, "epoch": 1053} {"train_loss": -5.593194484710693, "global_step": 44237, "epoch": 1053} {"train_loss": -5.802751541137695, "global_step": 44238, "epoch": 1053} {"train_loss": -5.723066329956055, "global_step": 44239, "epoch": 1053} {"train_loss": -5.684672832489014, "global_step": 44240, "epoch": 1053} {"train_loss": -5.7422990798950195, "global_step": 44241, "epoch": 1053} {"train_loss": -5.6191864013671875, "global_step": 44242, "epoch": 1053} {"train_loss": -5.878122329711914, "global_step": 44243, "epoch": 1053} {"train_loss": -5.790688514709473, "global_step": 44244, "epoch": 1053} {"train_loss": -5.696676731109619, "global_step": 44245, "epoch": 1053} {"train_loss": -5.664941787719727, "global_step": 44246, "epoch": 1053} {"train_loss": -5.670629501342773, "global_step": 44247, "epoch": 1053} {"train_loss": -5.749422073364258, "global_step": 44248, "epoch": 1053} {"train_loss": -5.746355056762695, "global_step": 44249, "epoch": 1053} {"train_loss": -5.714897632598877, "global_step": 44250, "epoch": 1053} {"train_loss": -5.771511077880859, "global_step": 44251, "epoch": 1053} {"train_loss": -5.593306541442871, "global_step": 44252, "epoch": 1053} {"train_loss": -5.837221622467041, "global_step": 44253, "epoch": 1053} {"train_loss": -5.718166351318359, "global_step": 44254, "epoch": 1053} {"train_loss": -5.594176292419434, "global_step": 44255, "epoch": 1053} {"train_loss": -5.6578216552734375, "global_step": 44256, "epoch": 1053} {"train_loss": -5.856745719909668, "global_step": 44257, "epoch": 1053} {"train_loss": -5.770761966705322, "global_step": 44258, "epoch": 1053} {"train_loss": -5.730096817016602, "global_step": 44259, "epoch": 1053} {"train_loss": -5.6692118644714355, "global_step": 44260, "epoch": 1053} {"train_loss": -5.625126361846924, "global_step": 44261, "epoch": 1053} {"train_loss": -5.675457000732422, "global_step": 44262, "epoch": 1053} {"train_loss": -5.733258247375488, "global_step": 44263, "epoch": 1053} {"train_loss": -5.6349897384643555, "global_step": 44264, "epoch": 1053} {"train_loss": -5.665821552276611, "global_step": 44265, "epoch": 1053} {"train_loss": -5.6093244552612305, "global_step": 44266, "epoch": 1053} {"train_loss": -5.698902822676159, "global_step": 44267, "epoch": 1053, "val_loss": 74103.5859375} {"train_loss": -5.814017295837402, "global_step": 44268, "epoch": 1054} {"train_loss": -5.694726943969727, "global_step": 44269, "epoch": 1054} {"train_loss": -5.545821189880371, "global_step": 44270, "epoch": 1054} {"train_loss": -5.7000885009765625, "global_step": 44271, "epoch": 1054} {"train_loss": -5.6557512283325195, "global_step": 44272, "epoch": 1054} {"train_loss": -5.494543552398682, "global_step": 44273, "epoch": 1054} {"train_loss": -5.785028457641602, "global_step": 44274, "epoch": 1054} {"train_loss": -5.68958854675293, "global_step": 44275, "epoch": 1054} {"train_loss": -5.636631011962891, "global_step": 44276, "epoch": 1054} {"train_loss": -5.745339393615723, "global_step": 44277, "epoch": 1054} {"train_loss": -5.600801467895508, "global_step": 44278, "epoch": 1054} {"train_loss": -5.688035011291504, "global_step": 44279, "epoch": 1054} {"train_loss": -5.593632221221924, "global_step": 44280, "epoch": 1054} {"train_loss": -5.609661102294922, "global_step": 44281, "epoch": 1054} {"train_loss": -5.664877891540527, "global_step": 44282, "epoch": 1054} {"train_loss": -5.57436990737915, "global_step": 44283, "epoch": 1054} {"train_loss": -5.576225280761719, "global_step": 44284, "epoch": 1054} {"train_loss": -5.6903486251831055, "global_step": 44285, "epoch": 1054} {"train_loss": -5.696130752563477, "global_step": 44286, "epoch": 1054} {"train_loss": -5.541489601135254, "global_step": 44287, "epoch": 1054} {"train_loss": -5.678686618804932, "global_step": 44288, "epoch": 1054} {"train_loss": -5.589394569396973, "global_step": 44289, "epoch": 1054} {"train_loss": -5.793329238891602, "global_step": 44290, "epoch": 1054} {"train_loss": -5.645023345947266, "global_step": 44291, "epoch": 1054} {"train_loss": -5.621623992919922, "global_step": 44292, "epoch": 1054} {"train_loss": -5.622298717498779, "global_step": 44293, "epoch": 1054} {"train_loss": -5.652122497558594, "global_step": 44294, "epoch": 1054} {"train_loss": -5.621885299682617, "global_step": 44295, "epoch": 1054} {"train_loss": -5.549655437469482, "global_step": 44296, "epoch": 1054} {"train_loss": -5.7457098960876465, "global_step": 44297, "epoch": 1054} {"train_loss": -5.759080410003662, "global_step": 44298, "epoch": 1054} {"train_loss": -5.6699628829956055, "global_step": 44299, "epoch": 1054} {"train_loss": -5.664912223815918, "global_step": 44300, "epoch": 1054} {"train_loss": -5.6925368309021, "global_step": 44301, "epoch": 1054} {"train_loss": -5.7484941482543945, "global_step": 44302, "epoch": 1054} {"train_loss": -5.680105209350586, "global_step": 44303, "epoch": 1054} {"train_loss": -5.787299633026123, "global_step": 44304, "epoch": 1054} {"train_loss": -5.718088150024414, "global_step": 44305, "epoch": 1054} {"train_loss": -5.6365251541137695, "global_step": 44306, "epoch": 1054} {"train_loss": -5.619815349578857, "global_step": 44307, "epoch": 1054} {"train_loss": -5.762217044830322, "global_step": 44308, "epoch": 1054} {"train_loss": -5.662936755589077, "global_step": 44309, "epoch": 1054, "val_loss": 73803.9609375} {"train_loss": -5.767181396484375, "global_step": 44310, "epoch": 1055} {"train_loss": -5.7661004066467285, "global_step": 44311, "epoch": 1055} {"train_loss": -5.7075066566467285, "global_step": 44312, "epoch": 1055} {"train_loss": -5.7457098960876465, "global_step": 44313, "epoch": 1055} {"train_loss": -5.660545349121094, "global_step": 44314, "epoch": 1055} {"train_loss": -5.684179782867432, "global_step": 44315, "epoch": 1055} {"train_loss": -5.806452751159668, "global_step": 44316, "epoch": 1055} {"train_loss": -5.656613826751709, "global_step": 44317, "epoch": 1055} {"train_loss": -5.734129905700684, "global_step": 44318, "epoch": 1055} {"train_loss": -5.718415260314941, "global_step": 44319, "epoch": 1055} {"train_loss": -5.724468231201172, "global_step": 44320, "epoch": 1055} {"train_loss": -5.884738922119141, "global_step": 44321, "epoch": 1055} {"train_loss": -5.744851112365723, "global_step": 44322, "epoch": 1055} {"train_loss": -5.742298603057861, "global_step": 44323, "epoch": 1055} {"train_loss": -5.704106330871582, "global_step": 44324, "epoch": 1055} {"train_loss": -5.512313365936279, "global_step": 44325, "epoch": 1055} {"train_loss": -5.722788333892822, "global_step": 44326, "epoch": 1055} {"train_loss": -5.69893741607666, "global_step": 44327, "epoch": 1055} {"train_loss": -5.500474452972412, "global_step": 44328, "epoch": 1055} {"train_loss": -5.659210205078125, "global_step": 44329, "epoch": 1055} {"train_loss": -5.5847978591918945, "global_step": 44330, "epoch": 1055} {"train_loss": -5.718236923217773, "global_step": 44331, "epoch": 1055} {"train_loss": -5.631976127624512, "global_step": 44332, "epoch": 1055} {"train_loss": -5.67742919921875, "global_step": 44333, "epoch": 1055} {"train_loss": -5.727247714996338, "global_step": 44334, "epoch": 1055} {"train_loss": -5.666093826293945, "global_step": 44335, "epoch": 1055} {"train_loss": -5.601120948791504, "global_step": 44336, "epoch": 1055} {"train_loss": -5.656721591949463, "global_step": 44337, "epoch": 1055} {"train_loss": -5.736419677734375, "global_step": 44338, "epoch": 1055} {"train_loss": -5.762925148010254, "global_step": 44339, "epoch": 1055} {"train_loss": -5.579602241516113, "global_step": 44340, "epoch": 1055} {"train_loss": -5.596559524536133, "global_step": 44341, "epoch": 1055} {"train_loss": -5.6056365966796875, "global_step": 44342, "epoch": 1055} {"train_loss": -5.743330955505371, "global_step": 44343, "epoch": 1055} {"train_loss": -5.721726417541504, "global_step": 44344, "epoch": 1055} {"train_loss": -5.630343437194824, "global_step": 44345, "epoch": 1055} {"train_loss": -5.6631574630737305, "global_step": 44346, "epoch": 1055} {"train_loss": -5.762643814086914, "global_step": 44347, "epoch": 1055} {"train_loss": -5.644901752471924, "global_step": 44348, "epoch": 1055} {"train_loss": -5.639655113220215, "global_step": 44349, "epoch": 1055} {"train_loss": -5.706742763519287, "global_step": 44350, "epoch": 1055} {"train_loss": -5.688193082809448, "global_step": 44351, "epoch": 1055, "val_loss": 73917.9609375} {"train_loss": -5.630040168762207, "global_step": 44352, "epoch": 1056} {"train_loss": -5.653747081756592, "global_step": 44353, "epoch": 1056} {"train_loss": -5.738502502441406, "global_step": 44354, "epoch": 1056} {"train_loss": -5.721796035766602, "global_step": 44355, "epoch": 1056} {"train_loss": -5.748832702636719, "global_step": 44356, "epoch": 1056} {"train_loss": -5.549023628234863, "global_step": 44357, "epoch": 1056} {"train_loss": -5.707976341247559, "global_step": 44358, "epoch": 1056} {"train_loss": -5.692048072814941, "global_step": 44359, "epoch": 1056} {"train_loss": -5.744516372680664, "global_step": 44360, "epoch": 1056} {"train_loss": -5.779272079467773, "global_step": 44361, "epoch": 1056} {"train_loss": -5.69438362121582, "global_step": 44362, "epoch": 1056} {"train_loss": -5.62206506729126, "global_step": 44363, "epoch": 1056} {"train_loss": -5.480037689208984, "global_step": 44364, "epoch": 1056} {"train_loss": -5.583771228790283, "global_step": 44365, "epoch": 1056} {"train_loss": -5.618710994720459, "global_step": 44366, "epoch": 1056} {"train_loss": -5.643911838531494, "global_step": 44367, "epoch": 1056} {"train_loss": -5.735240936279297, "global_step": 44368, "epoch": 1056} {"train_loss": -5.657665252685547, "global_step": 44369, "epoch": 1056} {"train_loss": -5.653930187225342, "global_step": 44370, "epoch": 1056} {"train_loss": -5.6260175704956055, "global_step": 44371, "epoch": 1056} {"train_loss": -5.655885696411133, "global_step": 44372, "epoch": 1056} {"train_loss": -5.655620574951172, "global_step": 44373, "epoch": 1056} {"train_loss": -5.5438385009765625, "global_step": 44374, "epoch": 1056} {"train_loss": -5.7104949951171875, "global_step": 44375, "epoch": 1056} {"train_loss": -5.534316062927246, "global_step": 44376, "epoch": 1056} {"train_loss": -5.647390365600586, "global_step": 44377, "epoch": 1056} {"train_loss": -5.614096641540527, "global_step": 44378, "epoch": 1056} {"train_loss": -5.529292583465576, "global_step": 44379, "epoch": 1056} {"train_loss": -5.6388349533081055, "global_step": 44380, "epoch": 1056} {"train_loss": -5.560503005981445, "global_step": 44381, "epoch": 1056} {"train_loss": -5.873812675476074, "global_step": 44382, "epoch": 1056} {"train_loss": -5.679910659790039, "global_step": 44383, "epoch": 1056} {"train_loss": -5.772863864898682, "global_step": 44384, "epoch": 1056} {"train_loss": -5.555747985839844, "global_step": 44385, "epoch": 1056} {"train_loss": -5.635231971740723, "global_step": 44386, "epoch": 1056} {"train_loss": -5.627224922180176, "global_step": 44387, "epoch": 1056} {"train_loss": -5.760108470916748, "global_step": 44388, "epoch": 1056} {"train_loss": -5.717970848083496, "global_step": 44389, "epoch": 1056} {"train_loss": -5.769815921783447, "global_step": 44390, "epoch": 1056} {"train_loss": -5.671877861022949, "global_step": 44391, "epoch": 1056} {"train_loss": -5.76519775390625, "global_step": 44392, "epoch": 1056} {"train_loss": -5.663992518470401, "global_step": 44393, "epoch": 1056, "val_loss": 73768.78125} {"train_loss": -5.777435302734375, "global_step": 44394, "epoch": 1057} {"train_loss": -5.560650825500488, "global_step": 44395, "epoch": 1057} {"train_loss": -5.625988006591797, "global_step": 44396, "epoch": 1057} {"train_loss": -5.612595558166504, "global_step": 44397, "epoch": 1057} {"train_loss": -5.673126220703125, "global_step": 44398, "epoch": 1057} {"train_loss": -5.795485496520996, "global_step": 44399, "epoch": 1057} {"train_loss": -5.687145233154297, "global_step": 44400, "epoch": 1057} {"train_loss": -5.806208610534668, "global_step": 44401, "epoch": 1057} {"train_loss": -5.779522895812988, "global_step": 44402, "epoch": 1057} {"train_loss": -5.676388740539551, "global_step": 44403, "epoch": 1057} {"train_loss": -5.711848735809326, "global_step": 44404, "epoch": 1057} {"train_loss": -5.704531669616699, "global_step": 44405, "epoch": 1057} {"train_loss": -5.818532943725586, "global_step": 44406, "epoch": 1057} {"train_loss": -5.72434139251709, "global_step": 44407, "epoch": 1057} {"train_loss": -5.714256286621094, "global_step": 44408, "epoch": 1057} {"train_loss": -5.729966640472412, "global_step": 44409, "epoch": 1057} {"train_loss": -5.653189659118652, "global_step": 44410, "epoch": 1057} {"train_loss": -5.654102802276611, "global_step": 44411, "epoch": 1057} {"train_loss": -5.774188041687012, "global_step": 44412, "epoch": 1057} {"train_loss": -5.655151844024658, "global_step": 44413, "epoch": 1057} {"train_loss": -5.716211318969727, "global_step": 44414, "epoch": 1057} {"train_loss": -5.65322208404541, "global_step": 44415, "epoch": 1057} {"train_loss": -5.698788642883301, "global_step": 44416, "epoch": 1057} {"train_loss": -5.711780548095703, "global_step": 44417, "epoch": 1057} {"train_loss": -5.778085708618164, "global_step": 44418, "epoch": 1057} {"train_loss": -5.630034923553467, "global_step": 44419, "epoch": 1057} {"train_loss": -5.743557929992676, "global_step": 44420, "epoch": 1057} {"train_loss": -5.836062908172607, "global_step": 44421, "epoch": 1057} {"train_loss": -5.813195705413818, "global_step": 44422, "epoch": 1057} {"train_loss": -5.707833766937256, "global_step": 44423, "epoch": 1057} {"train_loss": -5.710819721221924, "global_step": 44424, "epoch": 1057} {"train_loss": -5.776079177856445, "global_step": 44425, "epoch": 1057} {"train_loss": -5.733712673187256, "global_step": 44426, "epoch": 1057} {"train_loss": -5.61097526550293, "global_step": 44427, "epoch": 1057} {"train_loss": -5.658941745758057, "global_step": 44428, "epoch": 1057} {"train_loss": -5.792635917663574, "global_step": 44429, "epoch": 1057} {"train_loss": -5.661890029907227, "global_step": 44430, "epoch": 1057} {"train_loss": -5.703659534454346, "global_step": 44431, "epoch": 1057} {"train_loss": -5.808096408843994, "global_step": 44432, "epoch": 1057} {"train_loss": -5.687680244445801, "global_step": 44433, "epoch": 1057} {"train_loss": -5.6111979484558105, "global_step": 44434, "epoch": 1057} {"train_loss": -5.711222012837728, "global_step": 44435, "epoch": 1057, "val_loss": 73544.3359375} {"train_loss": -5.793176174163818, "global_step": 44436, "epoch": 1058} {"train_loss": -5.6455230712890625, "global_step": 44437, "epoch": 1058} {"train_loss": -5.67926025390625, "global_step": 44438, "epoch": 1058} {"train_loss": -5.664449691772461, "global_step": 44439, "epoch": 1058} {"train_loss": -5.6133270263671875, "global_step": 44440, "epoch": 1058} {"train_loss": -5.684263229370117, "global_step": 44441, "epoch": 1058} {"train_loss": -5.644786834716797, "global_step": 44442, "epoch": 1058} {"train_loss": -5.720180034637451, "global_step": 44443, "epoch": 1058} {"train_loss": -5.796940803527832, "global_step": 44444, "epoch": 1058} {"train_loss": -5.7555317878723145, "global_step": 44445, "epoch": 1058} {"train_loss": -5.636617660522461, "global_step": 44446, "epoch": 1058} {"train_loss": -5.5672502517700195, "global_step": 44447, "epoch": 1058} {"train_loss": -5.828533172607422, "global_step": 44448, "epoch": 1058} {"train_loss": -5.582740783691406, "global_step": 44449, "epoch": 1058} {"train_loss": -5.682923316955566, "global_step": 44450, "epoch": 1058} {"train_loss": -5.6500420570373535, "global_step": 44451, "epoch": 1058} {"train_loss": -5.644096374511719, "global_step": 44452, "epoch": 1058} {"train_loss": -5.807183265686035, "global_step": 44453, "epoch": 1058} {"train_loss": -5.7983856201171875, "global_step": 44454, "epoch": 1058} {"train_loss": -5.642070770263672, "global_step": 44455, "epoch": 1058} {"train_loss": -5.69514274597168, "global_step": 44456, "epoch": 1058} {"train_loss": -5.750723838806152, "global_step": 44457, "epoch": 1058} {"train_loss": -5.7065629959106445, "global_step": 44458, "epoch": 1058} {"train_loss": -5.774147987365723, "global_step": 44459, "epoch": 1058} {"train_loss": -5.705874443054199, "global_step": 44460, "epoch": 1058} {"train_loss": -5.67476224899292, "global_step": 44461, "epoch": 1058} {"train_loss": -5.6640472412109375, "global_step": 44462, "epoch": 1058} {"train_loss": -5.631329536437988, "global_step": 44463, "epoch": 1058} {"train_loss": -5.780460357666016, "global_step": 44464, "epoch": 1058} {"train_loss": -5.698321342468262, "global_step": 44465, "epoch": 1058} {"train_loss": -5.643253326416016, "global_step": 44466, "epoch": 1058} {"train_loss": -5.590359687805176, "global_step": 44467, "epoch": 1058} {"train_loss": -5.619207382202148, "global_step": 44468, "epoch": 1058} {"train_loss": -5.726184844970703, "global_step": 44469, "epoch": 1058} {"train_loss": -5.7491655349731445, "global_step": 44470, "epoch": 1058} {"train_loss": -5.577129364013672, "global_step": 44471, "epoch": 1058} {"train_loss": -5.809563159942627, "global_step": 44472, "epoch": 1058} {"train_loss": -5.701436996459961, "global_step": 44473, "epoch": 1058} {"train_loss": -5.683891773223877, "global_step": 44474, "epoch": 1058} {"train_loss": -5.675878047943115, "global_step": 44475, "epoch": 1058} {"train_loss": -5.650376796722412, "global_step": 44476, "epoch": 1058} {"train_loss": -5.693417174475534, "global_step": 44477, "epoch": 1058, "val_loss": 73833.6640625} {"train_loss": -5.653894901275635, "global_step": 44478, "epoch": 1059} {"train_loss": -5.73188591003418, "global_step": 44479, "epoch": 1059} {"train_loss": -5.696155548095703, "global_step": 44480, "epoch": 1059} {"train_loss": -5.670549392700195, "global_step": 44481, "epoch": 1059} {"train_loss": -5.697734355926514, "global_step": 44482, "epoch": 1059} {"train_loss": -5.709585189819336, "global_step": 44483, "epoch": 1059} {"train_loss": -5.761991500854492, "global_step": 44484, "epoch": 1059} {"train_loss": -5.7643609046936035, "global_step": 44485, "epoch": 1059} {"train_loss": -5.610861778259277, "global_step": 44486, "epoch": 1059} {"train_loss": -5.91168737411499, "global_step": 44487, "epoch": 1059} {"train_loss": -5.756471633911133, "global_step": 44488, "epoch": 1059} {"train_loss": -5.775761604309082, "global_step": 44489, "epoch": 1059} {"train_loss": -5.794322967529297, "global_step": 44490, "epoch": 1059} {"train_loss": -5.88803768157959, "global_step": 44491, "epoch": 1059} {"train_loss": -5.684195518493652, "global_step": 44492, "epoch": 1059} {"train_loss": -5.804293155670166, "global_step": 44493, "epoch": 1059} {"train_loss": -5.698651313781738, "global_step": 44494, "epoch": 1059} {"train_loss": -5.712682723999023, "global_step": 44495, "epoch": 1059} {"train_loss": -5.812161445617676, "global_step": 44496, "epoch": 1059} {"train_loss": -5.712928771972656, "global_step": 44497, "epoch": 1059} {"train_loss": -5.578145980834961, "global_step": 44498, "epoch": 1059} {"train_loss": -5.670046329498291, "global_step": 44499, "epoch": 1059} {"train_loss": -5.772045612335205, "global_step": 44500, "epoch": 1059} {"train_loss": -5.698873519897461, "global_step": 44501, "epoch": 1059} {"train_loss": -5.663121223449707, "global_step": 44502, "epoch": 1059} {"train_loss": -5.690835952758789, "global_step": 44503, "epoch": 1059} {"train_loss": -5.743478775024414, "global_step": 44504, "epoch": 1059} {"train_loss": -5.647900581359863, "global_step": 44505, "epoch": 1059} {"train_loss": -5.676120758056641, "global_step": 44506, "epoch": 1059} {"train_loss": -5.5664167404174805, "global_step": 44507, "epoch": 1059} {"train_loss": -5.756500244140625, "global_step": 44508, "epoch": 1059} {"train_loss": -5.681872367858887, "global_step": 44509, "epoch": 1059} {"train_loss": -5.684213161468506, "global_step": 44510, "epoch": 1059} {"train_loss": -5.615232467651367, "global_step": 44511, "epoch": 1059} {"train_loss": -5.701565742492676, "global_step": 44512, "epoch": 1059} {"train_loss": -5.714111804962158, "global_step": 44513, "epoch": 1059} {"train_loss": -5.59152889251709, "global_step": 44514, "epoch": 1059} {"train_loss": -5.653903961181641, "global_step": 44515, "epoch": 1059} {"train_loss": -5.534823417663574, "global_step": 44516, "epoch": 1059} {"train_loss": -5.707420349121094, "global_step": 44517, "epoch": 1059} {"train_loss": -5.806339263916016, "global_step": 44518, "epoch": 1059} {"train_loss": -5.706080141521635, "global_step": 44519, "epoch": 1059, "val_loss": 73750.6640625} {"train_loss": -5.719008922576904, "global_step": 44520, "epoch": 1060} {"train_loss": -5.714814186096191, "global_step": 44521, "epoch": 1060} {"train_loss": -5.662609577178955, "global_step": 44522, "epoch": 1060} {"train_loss": -5.609475135803223, "global_step": 44523, "epoch": 1060} {"train_loss": -5.592337608337402, "global_step": 44524, "epoch": 1060} {"train_loss": -5.806702613830566, "global_step": 44525, "epoch": 1060} {"train_loss": -5.630760192871094, "global_step": 44526, "epoch": 1060} {"train_loss": -5.576992034912109, "global_step": 44527, "epoch": 1060} {"train_loss": -5.778497695922852, "global_step": 44528, "epoch": 1060} {"train_loss": -5.738591194152832, "global_step": 44529, "epoch": 1060} {"train_loss": -5.831870079040527, "global_step": 44530, "epoch": 1060} {"train_loss": -5.655503273010254, "global_step": 44531, "epoch": 1060} {"train_loss": -5.678703308105469, "global_step": 44532, "epoch": 1060} {"train_loss": -5.760471820831299, "global_step": 44533, "epoch": 1060} {"train_loss": -5.68607234954834, "global_step": 44534, "epoch": 1060} {"train_loss": -5.823838233947754, "global_step": 44535, "epoch": 1060} {"train_loss": -5.693339824676514, "global_step": 44536, "epoch": 1060} {"train_loss": -5.724682331085205, "global_step": 44537, "epoch": 1060} {"train_loss": -5.68935489654541, "global_step": 44538, "epoch": 1060} {"train_loss": -5.712365627288818, "global_step": 44539, "epoch": 1060} {"train_loss": -5.715224266052246, "global_step": 44540, "epoch": 1060} {"train_loss": -5.642856597900391, "global_step": 44541, "epoch": 1060} {"train_loss": -5.737709045410156, "global_step": 44542, "epoch": 1060} {"train_loss": -5.680502891540527, "global_step": 44543, "epoch": 1060} {"train_loss": -5.829282760620117, "global_step": 44544, "epoch": 1060} {"train_loss": -5.558642387390137, "global_step": 44545, "epoch": 1060} {"train_loss": -5.733473777770996, "global_step": 44546, "epoch": 1060} {"train_loss": -5.746957302093506, "global_step": 44547, "epoch": 1060} {"train_loss": -5.6267499923706055, "global_step": 44548, "epoch": 1060} {"train_loss": -5.713043689727783, "global_step": 44549, "epoch": 1060} {"train_loss": -5.623587608337402, "global_step": 44550, "epoch": 1060} {"train_loss": -5.68126106262207, "global_step": 44551, "epoch": 1060} {"train_loss": -5.716618537902832, "global_step": 44552, "epoch": 1060} {"train_loss": -5.816114902496338, "global_step": 44553, "epoch": 1060} {"train_loss": -5.901243686676025, "global_step": 44554, "epoch": 1060} {"train_loss": -5.683610439300537, "global_step": 44555, "epoch": 1060} {"train_loss": -5.6833953857421875, "global_step": 44556, "epoch": 1060} {"train_loss": -5.6781005859375, "global_step": 44557, "epoch": 1060} {"train_loss": -5.721303939819336, "global_step": 44558, "epoch": 1060} {"train_loss": -5.779204845428467, "global_step": 44559, "epoch": 1060} {"train_loss": -5.7265191078186035, "global_step": 44560, "epoch": 1060} {"train_loss": -5.7088160287766225, "global_step": 44561, "epoch": 1060, "val_loss": 74523.59375} {"train_loss": -5.633288860321045, "global_step": 44562, "epoch": 1061} {"train_loss": -5.739748001098633, "global_step": 44563, "epoch": 1061} {"train_loss": -5.755190849304199, "global_step": 44564, "epoch": 1061} {"train_loss": -5.665233135223389, "global_step": 44565, "epoch": 1061} {"train_loss": -5.784808158874512, "global_step": 44566, "epoch": 1061} {"train_loss": -5.700852870941162, "global_step": 44567, "epoch": 1061} {"train_loss": -5.704765796661377, "global_step": 44568, "epoch": 1061} {"train_loss": -5.622906684875488, "global_step": 44569, "epoch": 1061} {"train_loss": -5.538867950439453, "global_step": 44570, "epoch": 1061} {"train_loss": -5.855620861053467, "global_step": 44571, "epoch": 1061} {"train_loss": -5.725712776184082, "global_step": 44572, "epoch": 1061} {"train_loss": -5.661306381225586, "global_step": 44573, "epoch": 1061} {"train_loss": -5.782233238220215, "global_step": 44574, "epoch": 1061} {"train_loss": -5.632603168487549, "global_step": 44575, "epoch": 1061} {"train_loss": -5.670570373535156, "global_step": 44576, "epoch": 1061} {"train_loss": -5.733288764953613, "global_step": 44577, "epoch": 1061} {"train_loss": -5.560896873474121, "global_step": 44578, "epoch": 1061} {"train_loss": -5.649400234222412, "global_step": 44579, "epoch": 1061} {"train_loss": -5.589668273925781, "global_step": 44580, "epoch": 1061} {"train_loss": -5.624028205871582, "global_step": 44581, "epoch": 1061} {"train_loss": -5.551596164703369, "global_step": 44582, "epoch": 1061} {"train_loss": -5.797411918640137, "global_step": 44583, "epoch": 1061} {"train_loss": -5.684476375579834, "global_step": 44584, "epoch": 1061} {"train_loss": -5.761784553527832, "global_step": 44585, "epoch": 1061} {"train_loss": -5.497148513793945, "global_step": 44586, "epoch": 1061} {"train_loss": -5.593507766723633, "global_step": 44587, "epoch": 1061} {"train_loss": -5.6743855476379395, "global_step": 44588, "epoch": 1061} {"train_loss": -5.684953689575195, "global_step": 44589, "epoch": 1061} {"train_loss": -5.647083282470703, "global_step": 44590, "epoch": 1061} {"train_loss": -5.741002082824707, "global_step": 44591, "epoch": 1061} {"train_loss": -5.688096046447754, "global_step": 44592, "epoch": 1061} {"train_loss": -5.72718620300293, "global_step": 44593, "epoch": 1061} {"train_loss": -5.864433288574219, "global_step": 44594, "epoch": 1061} {"train_loss": -5.615849494934082, "global_step": 44595, "epoch": 1061} {"train_loss": -5.686408042907715, "global_step": 44596, "epoch": 1061} {"train_loss": -5.683956146240234, "global_step": 44597, "epoch": 1061} {"train_loss": -5.624518394470215, "global_step": 44598, "epoch": 1061} {"train_loss": -5.648353099822998, "global_step": 44599, "epoch": 1061} {"train_loss": -5.823708534240723, "global_step": 44600, "epoch": 1061} {"train_loss": -5.64840030670166, "global_step": 44601, "epoch": 1061} {"train_loss": -5.676690578460693, "global_step": 44602, "epoch": 1061} {"train_loss": -5.680422294707525, "global_step": 44603, "epoch": 1061, "val_loss": 74234.1953125} {"train_loss": -5.649199485778809, "global_step": 44604, "epoch": 1062} {"train_loss": -5.702917575836182, "global_step": 44605, "epoch": 1062} {"train_loss": -5.629288673400879, "global_step": 44606, "epoch": 1062} {"train_loss": -5.668163299560547, "global_step": 44607, "epoch": 1062} {"train_loss": -5.693533420562744, "global_step": 44608, "epoch": 1062} {"train_loss": -5.585064888000488, "global_step": 44609, "epoch": 1062} {"train_loss": -5.762998580932617, "global_step": 44610, "epoch": 1062} {"train_loss": -5.724967002868652, "global_step": 44611, "epoch": 1062} {"train_loss": -5.632917881011963, "global_step": 44612, "epoch": 1062} {"train_loss": -5.619688987731934, "global_step": 44613, "epoch": 1062} {"train_loss": -5.760315418243408, "global_step": 44614, "epoch": 1062} {"train_loss": -5.779994010925293, "global_step": 44615, "epoch": 1062} {"train_loss": -5.748457908630371, "global_step": 44616, "epoch": 1062} {"train_loss": -5.724176406860352, "global_step": 44617, "epoch": 1062} {"train_loss": -5.721334457397461, "global_step": 44618, "epoch": 1062} {"train_loss": -5.820108890533447, "global_step": 44619, "epoch": 1062} {"train_loss": -5.698385238647461, "global_step": 44620, "epoch": 1062} {"train_loss": -5.5396318435668945, "global_step": 44621, "epoch": 1062} {"train_loss": -5.6916656494140625, "global_step": 44622, "epoch": 1062} {"train_loss": -5.6816229820251465, "global_step": 44623, "epoch": 1062} {"train_loss": -5.619612693786621, "global_step": 44624, "epoch": 1062} {"train_loss": -5.918183326721191, "global_step": 44625, "epoch": 1062} {"train_loss": -5.63420295715332, "global_step": 44626, "epoch": 1062} {"train_loss": -5.635337829589844, "global_step": 44627, "epoch": 1062} {"train_loss": -5.690238952636719, "global_step": 44628, "epoch": 1062} {"train_loss": -5.594582557678223, "global_step": 44629, "epoch": 1062} {"train_loss": -5.770577430725098, "global_step": 44630, "epoch": 1062} {"train_loss": -5.677980422973633, "global_step": 44631, "epoch": 1062} {"train_loss": -5.765778541564941, "global_step": 44632, "epoch": 1062} {"train_loss": -5.8285722732543945, "global_step": 44633, "epoch": 1062} {"train_loss": -5.701371192932129, "global_step": 44634, "epoch": 1062} {"train_loss": -5.579059600830078, "global_step": 44635, "epoch": 1062} {"train_loss": -5.669491767883301, "global_step": 44636, "epoch": 1062} {"train_loss": -5.625635147094727, "global_step": 44637, "epoch": 1062} {"train_loss": -5.601421356201172, "global_step": 44638, "epoch": 1062} {"train_loss": -5.822908401489258, "global_step": 44639, "epoch": 1062} {"train_loss": -5.537411689758301, "global_step": 44640, "epoch": 1062} {"train_loss": -5.781056880950928, "global_step": 44641, "epoch": 1062} {"train_loss": -5.646426200866699, "global_step": 44642, "epoch": 1062} {"train_loss": -5.528656005859375, "global_step": 44643, "epoch": 1062} {"train_loss": -5.773898601531982, "global_step": 44644, "epoch": 1062} {"train_loss": -5.68704663004194, "global_step": 44645, "epoch": 1062, "val_loss": 73949.4765625} {"train_loss": -5.831182956695557, "global_step": 44646, "epoch": 1063} {"train_loss": -5.674697399139404, "global_step": 44647, "epoch": 1063} {"train_loss": -5.479172706604004, "global_step": 44648, "epoch": 1063} {"train_loss": -5.829147815704346, "global_step": 44649, "epoch": 1063} {"train_loss": -5.6537089347839355, "global_step": 44650, "epoch": 1063} {"train_loss": -5.719484329223633, "global_step": 44651, "epoch": 1063} {"train_loss": -5.652016639709473, "global_step": 44652, "epoch": 1063} {"train_loss": -5.738141059875488, "global_step": 44653, "epoch": 1063} {"train_loss": -5.7615861892700195, "global_step": 44654, "epoch": 1063} {"train_loss": -5.886087417602539, "global_step": 44655, "epoch": 1063} {"train_loss": -5.7135796546936035, "global_step": 44656, "epoch": 1063} {"train_loss": -5.614120006561279, "global_step": 44657, "epoch": 1063} {"train_loss": -5.723872184753418, "global_step": 44658, "epoch": 1063} {"train_loss": -5.683932304382324, "global_step": 44659, "epoch": 1063} {"train_loss": -5.709966659545898, "global_step": 44660, "epoch": 1063} {"train_loss": -5.66367244720459, "global_step": 44661, "epoch": 1063} {"train_loss": -5.817244052886963, "global_step": 44662, "epoch": 1063} {"train_loss": -5.769645690917969, "global_step": 44663, "epoch": 1063} {"train_loss": -5.670089244842529, "global_step": 44664, "epoch": 1063} {"train_loss": -5.659152984619141, "global_step": 44665, "epoch": 1063} {"train_loss": -5.608704566955566, "global_step": 44666, "epoch": 1063} {"train_loss": -5.640193462371826, "global_step": 44667, "epoch": 1063} {"train_loss": -5.808985710144043, "global_step": 44668, "epoch": 1063} {"train_loss": -5.739636421203613, "global_step": 44669, "epoch": 1063} {"train_loss": -5.714419841766357, "global_step": 44670, "epoch": 1063} {"train_loss": -5.653221130371094, "global_step": 44671, "epoch": 1063} {"train_loss": -5.562427997589111, "global_step": 44672, "epoch": 1063} {"train_loss": -5.788998126983643, "global_step": 44673, "epoch": 1063} {"train_loss": -5.629659652709961, "global_step": 44674, "epoch": 1063} {"train_loss": -5.588086128234863, "global_step": 44675, "epoch": 1063} {"train_loss": -5.78195858001709, "global_step": 44676, "epoch": 1063} {"train_loss": -5.821728706359863, "global_step": 44677, "epoch": 1063} {"train_loss": -5.662913799285889, "global_step": 44678, "epoch": 1063} {"train_loss": -5.734159469604492, "global_step": 44679, "epoch": 1063} {"train_loss": -5.70098876953125, "global_step": 44680, "epoch": 1063} {"train_loss": -5.71729850769043, "global_step": 44681, "epoch": 1063} {"train_loss": -5.6585564613342285, "global_step": 44682, "epoch": 1063} {"train_loss": -5.674124717712402, "global_step": 44683, "epoch": 1063} {"train_loss": -5.793022155761719, "global_step": 44684, "epoch": 1063} {"train_loss": -5.755398273468018, "global_step": 44685, "epoch": 1063} {"train_loss": -5.572710037231445, "global_step": 44686, "epoch": 1063} {"train_loss": -5.7026460738409135, "global_step": 44687, "epoch": 1063, "val_loss": 74137.625} {"train_loss": -5.656377792358398, "global_step": 44688, "epoch": 1064} {"train_loss": -5.802724838256836, "global_step": 44689, "epoch": 1064} {"train_loss": -5.757314682006836, "global_step": 44690, "epoch": 1064} {"train_loss": -5.77027702331543, "global_step": 44691, "epoch": 1064} {"train_loss": -5.6344780921936035, "global_step": 44692, "epoch": 1064} {"train_loss": -5.652643203735352, "global_step": 44693, "epoch": 1064} {"train_loss": -5.622711181640625, "global_step": 44694, "epoch": 1064} {"train_loss": -5.636098861694336, "global_step": 44695, "epoch": 1064} {"train_loss": -5.675377368927002, "global_step": 44696, "epoch": 1064} {"train_loss": -5.646297454833984, "global_step": 44697, "epoch": 1064} {"train_loss": -5.738734722137451, "global_step": 44698, "epoch": 1064} {"train_loss": -5.499686241149902, "global_step": 44699, "epoch": 1064} {"train_loss": -5.739151954650879, "global_step": 44700, "epoch": 1064} {"train_loss": -5.728236198425293, "global_step": 44701, "epoch": 1064} {"train_loss": -5.700402736663818, "global_step": 44702, "epoch": 1064} {"train_loss": -5.828351974487305, "global_step": 44703, "epoch": 1064} {"train_loss": -5.643738746643066, "global_step": 44704, "epoch": 1064} {"train_loss": -5.91916561126709, "global_step": 44705, "epoch": 1064} {"train_loss": -5.7896928787231445, "global_step": 44706, "epoch": 1064} {"train_loss": -5.650212287902832, "global_step": 44707, "epoch": 1064} {"train_loss": -5.732777118682861, "global_step": 44708, "epoch": 1064} {"train_loss": -5.5905914306640625, "global_step": 44709, "epoch": 1064} {"train_loss": -5.663532257080078, "global_step": 44710, "epoch": 1064} {"train_loss": -5.664472579956055, "global_step": 44711, "epoch": 1064} {"train_loss": -5.37067174911499, "global_step": 44712, "epoch": 1064} {"train_loss": -5.6390862464904785, "global_step": 44713, "epoch": 1064} {"train_loss": -5.64289665222168, "global_step": 44714, "epoch": 1064} {"train_loss": -5.554409027099609, "global_step": 44715, "epoch": 1064} {"train_loss": -5.830733299255371, "global_step": 44716, "epoch": 1064} {"train_loss": -5.627130031585693, "global_step": 44717, "epoch": 1064} {"train_loss": -5.558108806610107, "global_step": 44718, "epoch": 1064} {"train_loss": -5.549148082733154, "global_step": 44719, "epoch": 1064} {"train_loss": -5.647181987762451, "global_step": 44720, "epoch": 1064} {"train_loss": -5.640947341918945, "global_step": 44721, "epoch": 1064} {"train_loss": -5.6615753173828125, "global_step": 44722, "epoch": 1064} {"train_loss": -5.68484354019165, "global_step": 44723, "epoch": 1064} {"train_loss": -5.685320854187012, "global_step": 44724, "epoch": 1064} {"train_loss": -5.699199676513672, "global_step": 44725, "epoch": 1064} {"train_loss": -5.593059062957764, "global_step": 44726, "epoch": 1064} {"train_loss": -5.645053386688232, "global_step": 44727, "epoch": 1064} {"train_loss": -5.649623394012451, "global_step": 44728, "epoch": 1064} {"train_loss": -5.667768239974976, "global_step": 44729, "epoch": 1064, "val_loss": 74434.03125} {"train_loss": -5.614534854888916, "global_step": 44730, "epoch": 1065} {"train_loss": -5.788074493408203, "global_step": 44731, "epoch": 1065} {"train_loss": -5.660473823547363, "global_step": 44732, "epoch": 1065} {"train_loss": -5.666219711303711, "global_step": 44733, "epoch": 1065} {"train_loss": -5.637696266174316, "global_step": 44734, "epoch": 1065} {"train_loss": -5.6795525550842285, "global_step": 44735, "epoch": 1065} {"train_loss": -5.727499961853027, "global_step": 44736, "epoch": 1065} {"train_loss": -5.836199760437012, "global_step": 44737, "epoch": 1065} {"train_loss": -5.742575168609619, "global_step": 44738, "epoch": 1065} {"train_loss": -5.530129909515381, "global_step": 44739, "epoch": 1065} {"train_loss": -5.637237071990967, "global_step": 44740, "epoch": 1065} {"train_loss": -5.711020469665527, "global_step": 44741, "epoch": 1065} {"train_loss": -5.7387895584106445, "global_step": 44742, "epoch": 1065} {"train_loss": -5.729755401611328, "global_step": 44743, "epoch": 1065} {"train_loss": -5.675601005554199, "global_step": 44744, "epoch": 1065} {"train_loss": -5.730607032775879, "global_step": 44745, "epoch": 1065} {"train_loss": -5.673637390136719, "global_step": 44746, "epoch": 1065} {"train_loss": -5.7235798835754395, "global_step": 44747, "epoch": 1065} {"train_loss": -5.760544300079346, "global_step": 44748, "epoch": 1065} {"train_loss": -5.650662422180176, "global_step": 44749, "epoch": 1065} {"train_loss": -5.7261457443237305, "global_step": 44750, "epoch": 1065} {"train_loss": -5.452254295349121, "global_step": 44751, "epoch": 1065} {"train_loss": -5.807394027709961, "global_step": 44752, "epoch": 1065} {"train_loss": -5.794009208679199, "global_step": 44753, "epoch": 1065} {"train_loss": -5.674480438232422, "global_step": 44754, "epoch": 1065} {"train_loss": -5.815603256225586, "global_step": 44755, "epoch": 1065} {"train_loss": -5.809367656707764, "global_step": 44756, "epoch": 1065} {"train_loss": -5.641625881195068, "global_step": 44757, "epoch": 1065} {"train_loss": -5.828719139099121, "global_step": 44758, "epoch": 1065} {"train_loss": -5.718255996704102, "global_step": 44759, "epoch": 1065} {"train_loss": -5.6987433433532715, "global_step": 44760, "epoch": 1065} {"train_loss": -5.68558931350708, "global_step": 44761, "epoch": 1065} {"train_loss": -5.706860065460205, "global_step": 44762, "epoch": 1065} {"train_loss": -5.712004661560059, "global_step": 44763, "epoch": 1065} {"train_loss": -5.745029926300049, "global_step": 44764, "epoch": 1065} {"train_loss": -5.468456745147705, "global_step": 44765, "epoch": 1065} {"train_loss": -5.625977993011475, "global_step": 44766, "epoch": 1065} {"train_loss": -5.766692161560059, "global_step": 44767, "epoch": 1065} {"train_loss": -5.7243852615356445, "global_step": 44768, "epoch": 1065} {"train_loss": -5.775155544281006, "global_step": 44769, "epoch": 1065} {"train_loss": -5.586002349853516, "global_step": 44770, "epoch": 1065} {"train_loss": -5.6957651887621195, "global_step": 44771, "epoch": 1065, "val_loss": 74000.015625} {"train_loss": -5.738154411315918, "global_step": 44772, "epoch": 1066} {"train_loss": -5.57580041885376, "global_step": 44773, "epoch": 1066} {"train_loss": -5.58513069152832, "global_step": 44774, "epoch": 1066} {"train_loss": -5.624769687652588, "global_step": 44775, "epoch": 1066} {"train_loss": -5.6714582443237305, "global_step": 44776, "epoch": 1066} {"train_loss": -5.675075531005859, "global_step": 44777, "epoch": 1066} {"train_loss": -5.746641159057617, "global_step": 44778, "epoch": 1066} {"train_loss": -5.644899368286133, "global_step": 44779, "epoch": 1066} {"train_loss": -5.581689834594727, "global_step": 44780, "epoch": 1066} {"train_loss": -5.6675543785095215, "global_step": 44781, "epoch": 1066} {"train_loss": -5.686101913452148, "global_step": 44782, "epoch": 1066} {"train_loss": -5.754526138305664, "global_step": 44783, "epoch": 1066} {"train_loss": -5.77653169631958, "global_step": 44784, "epoch": 1066} {"train_loss": -5.605990409851074, "global_step": 44785, "epoch": 1066} {"train_loss": -5.527230262756348, "global_step": 44786, "epoch": 1066} {"train_loss": -5.695531845092773, "global_step": 44787, "epoch": 1066} {"train_loss": -5.823895454406738, "global_step": 44788, "epoch": 1066} {"train_loss": -5.723512649536133, "global_step": 44789, "epoch": 1066} {"train_loss": -5.658693313598633, "global_step": 44790, "epoch": 1066} {"train_loss": -5.658109188079834, "global_step": 44791, "epoch": 1066} {"train_loss": -5.623705863952637, "global_step": 44792, "epoch": 1066} {"train_loss": -5.690627574920654, "global_step": 44793, "epoch": 1066} {"train_loss": -5.762470722198486, "global_step": 44794, "epoch": 1066} {"train_loss": -5.681063652038574, "global_step": 44795, "epoch": 1066} {"train_loss": -5.742679595947266, "global_step": 44796, "epoch": 1066} {"train_loss": -5.611626625061035, "global_step": 44797, "epoch": 1066} {"train_loss": -5.802190780639648, "global_step": 44798, "epoch": 1066} {"train_loss": -5.630189418792725, "global_step": 44799, "epoch": 1066} {"train_loss": -5.708125114440918, "global_step": 44800, "epoch": 1066} {"train_loss": -5.685688018798828, "global_step": 44801, "epoch": 1066} {"train_loss": -5.643452167510986, "global_step": 44802, "epoch": 1066} {"train_loss": -5.640035152435303, "global_step": 44803, "epoch": 1066} {"train_loss": -5.902413368225098, "global_step": 44804, "epoch": 1066} {"train_loss": -5.810923099517822, "global_step": 44805, "epoch": 1066} {"train_loss": -5.741621971130371, "global_step": 44806, "epoch": 1066} {"train_loss": -5.711881637573242, "global_step": 44807, "epoch": 1066} {"train_loss": -5.6468353271484375, "global_step": 44808, "epoch": 1066} {"train_loss": -5.695069313049316, "global_step": 44809, "epoch": 1066} {"train_loss": -5.643086910247803, "global_step": 44810, "epoch": 1066} {"train_loss": -5.672574996948242, "global_step": 44811, "epoch": 1066} {"train_loss": -5.7354230880737305, "global_step": 44812, "epoch": 1066} {"train_loss": -5.687873942511422, "global_step": 44813, "epoch": 1066, "val_loss": 74256.3984375} {"train_loss": -5.73038387298584, "global_step": 44814, "epoch": 1067} {"train_loss": -5.693692207336426, "global_step": 44815, "epoch": 1067} {"train_loss": -5.684535980224609, "global_step": 44816, "epoch": 1067} {"train_loss": -5.680948734283447, "global_step": 44817, "epoch": 1067} {"train_loss": -5.645469665527344, "global_step": 44818, "epoch": 1067} {"train_loss": -5.62163782119751, "global_step": 44819, "epoch": 1067} {"train_loss": -5.746430397033691, "global_step": 44820, "epoch": 1067} {"train_loss": -5.623465061187744, "global_step": 44821, "epoch": 1067} {"train_loss": -5.671290397644043, "global_step": 44822, "epoch": 1067} {"train_loss": -5.699362277984619, "global_step": 44823, "epoch": 1067} {"train_loss": -5.7420573234558105, "global_step": 44824, "epoch": 1067} {"train_loss": -5.594422817230225, "global_step": 44825, "epoch": 1067} {"train_loss": -5.714269638061523, "global_step": 44826, "epoch": 1067} {"train_loss": -5.715250015258789, "global_step": 44827, "epoch": 1067} {"train_loss": -5.702958106994629, "global_step": 44828, "epoch": 1067} {"train_loss": -5.7574872970581055, "global_step": 44829, "epoch": 1067} {"train_loss": -5.641018867492676, "global_step": 44830, "epoch": 1067} {"train_loss": -5.7112908363342285, "global_step": 44831, "epoch": 1067} {"train_loss": -5.697786331176758, "global_step": 44832, "epoch": 1067} {"train_loss": -5.6534647941589355, "global_step": 44833, "epoch": 1067} {"train_loss": -5.81993293762207, "global_step": 44834, "epoch": 1067} {"train_loss": -5.601957321166992, "global_step": 44835, "epoch": 1067} {"train_loss": -5.689690589904785, "global_step": 44836, "epoch": 1067} {"train_loss": -5.617141246795654, "global_step": 44837, "epoch": 1067} {"train_loss": -5.669674873352051, "global_step": 44838, "epoch": 1067} {"train_loss": -5.484115123748779, "global_step": 44839, "epoch": 1067} {"train_loss": -5.723106861114502, "global_step": 44840, "epoch": 1067} {"train_loss": -5.4663405418396, "global_step": 44841, "epoch": 1067} {"train_loss": -5.690725326538086, "global_step": 44842, "epoch": 1067} {"train_loss": -5.702613830566406, "global_step": 44843, "epoch": 1067} {"train_loss": -5.591271877288818, "global_step": 44844, "epoch": 1067} {"train_loss": -5.539360046386719, "global_step": 44845, "epoch": 1067} {"train_loss": -5.650461196899414, "global_step": 44846, "epoch": 1067} {"train_loss": -5.457361698150635, "global_step": 44847, "epoch": 1067} {"train_loss": -5.76310920715332, "global_step": 44848, "epoch": 1067} {"train_loss": -5.517045974731445, "global_step": 44849, "epoch": 1067} {"train_loss": -5.834179401397705, "global_step": 44850, "epoch": 1067} {"train_loss": -5.472149848937988, "global_step": 44851, "epoch": 1067} {"train_loss": -5.625767707824707, "global_step": 44852, "epoch": 1067} {"train_loss": -5.743605613708496, "global_step": 44853, "epoch": 1067} {"train_loss": -5.478589057922363, "global_step": 44854, "epoch": 1067} {"train_loss": -5.653216464178903, "global_step": 44855, "epoch": 1067, "val_loss": 74917.8984375} {"train_loss": -5.560576915740967, "global_step": 44856, "epoch": 1068} {"train_loss": -5.580686092376709, "global_step": 44857, "epoch": 1068} {"train_loss": -5.514819145202637, "global_step": 44858, "epoch": 1068} {"train_loss": -5.660948276519775, "global_step": 44859, "epoch": 1068} {"train_loss": -5.611507415771484, "global_step": 44860, "epoch": 1068} {"train_loss": -5.662489891052246, "global_step": 44861, "epoch": 1068} {"train_loss": -5.750964164733887, "global_step": 44862, "epoch": 1068} {"train_loss": -5.706029891967773, "global_step": 44863, "epoch": 1068} {"train_loss": -5.7084808349609375, "global_step": 44864, "epoch": 1068} {"train_loss": -5.6540632247924805, "global_step": 44865, "epoch": 1068} {"train_loss": -5.70217227935791, "global_step": 44866, "epoch": 1068} {"train_loss": -5.749181747436523, "global_step": 44867, "epoch": 1068} {"train_loss": -5.862510681152344, "global_step": 44868, "epoch": 1068} {"train_loss": -5.613302707672119, "global_step": 44869, "epoch": 1068} {"train_loss": -5.767286777496338, "global_step": 44870, "epoch": 1068} {"train_loss": -5.618749141693115, "global_step": 44871, "epoch": 1068} {"train_loss": -5.776223182678223, "global_step": 44872, "epoch": 1068} {"train_loss": -5.760920524597168, "global_step": 44873, "epoch": 1068} {"train_loss": -5.722630977630615, "global_step": 44874, "epoch": 1068} {"train_loss": -5.74106502532959, "global_step": 44875, "epoch": 1068} {"train_loss": -5.796474456787109, "global_step": 44876, "epoch": 1068} {"train_loss": -5.611573696136475, "global_step": 44877, "epoch": 1068} {"train_loss": -5.676520347595215, "global_step": 44878, "epoch": 1068} {"train_loss": -5.710609436035156, "global_step": 44879, "epoch": 1068} {"train_loss": -5.637083530426025, "global_step": 44880, "epoch": 1068} {"train_loss": -5.6279826164245605, "global_step": 44881, "epoch": 1068} {"train_loss": -5.768075942993164, "global_step": 44882, "epoch": 1068} {"train_loss": -5.577236175537109, "global_step": 44883, "epoch": 1068} {"train_loss": -5.648053169250488, "global_step": 44884, "epoch": 1068} {"train_loss": -5.846543312072754, "global_step": 44885, "epoch": 1068} {"train_loss": -5.57122802734375, "global_step": 44886, "epoch": 1068} {"train_loss": -5.664244174957275, "global_step": 44887, "epoch": 1068} {"train_loss": -5.636157512664795, "global_step": 44888, "epoch": 1068} {"train_loss": -5.675847053527832, "global_step": 44889, "epoch": 1068} {"train_loss": -5.78696346282959, "global_step": 44890, "epoch": 1068} {"train_loss": -5.710212707519531, "global_step": 44891, "epoch": 1068} {"train_loss": -5.677424430847168, "global_step": 44892, "epoch": 1068} {"train_loss": -5.743980407714844, "global_step": 44893, "epoch": 1068} {"train_loss": -5.6742658615112305, "global_step": 44894, "epoch": 1068} {"train_loss": -5.712510108947754, "global_step": 44895, "epoch": 1068} {"train_loss": -5.756978988647461, "global_step": 44896, "epoch": 1068} {"train_loss": -5.689849853515625, "global_step": 44897, "epoch": 1068, "val_loss": 74353.4375} {"train_loss": -5.737023830413818, "global_step": 44898, "epoch": 1069} {"train_loss": -5.704195022583008, "global_step": 44899, "epoch": 1069} {"train_loss": -5.699666976928711, "global_step": 44900, "epoch": 1069} {"train_loss": -5.643181800842285, "global_step": 44901, "epoch": 1069} {"train_loss": -5.661742210388184, "global_step": 44902, "epoch": 1069} {"train_loss": -5.629036903381348, "global_step": 44903, "epoch": 1069} {"train_loss": -5.714858055114746, "global_step": 44904, "epoch": 1069} {"train_loss": -5.6748552322387695, "global_step": 44905, "epoch": 1069} {"train_loss": -5.706161022186279, "global_step": 44906, "epoch": 1069} {"train_loss": -5.612001419067383, "global_step": 44907, "epoch": 1069} {"train_loss": -5.762479782104492, "global_step": 44908, "epoch": 1069} {"train_loss": -5.755483627319336, "global_step": 44909, "epoch": 1069} {"train_loss": -5.620983123779297, "global_step": 44910, "epoch": 1069} {"train_loss": -5.631398677825928, "global_step": 44911, "epoch": 1069} {"train_loss": -5.785111427307129, "global_step": 44912, "epoch": 1069} {"train_loss": -5.60151481628418, "global_step": 44913, "epoch": 1069} {"train_loss": -5.714483737945557, "global_step": 44914, "epoch": 1069} {"train_loss": -5.68212890625, "global_step": 44915, "epoch": 1069} {"train_loss": -5.658252716064453, "global_step": 44916, "epoch": 1069} {"train_loss": -5.5945000648498535, "global_step": 44917, "epoch": 1069} {"train_loss": -5.790524005889893, "global_step": 44918, "epoch": 1069} {"train_loss": -5.841446399688721, "global_step": 44919, "epoch": 1069} {"train_loss": -5.5626020431518555, "global_step": 44920, "epoch": 1069} {"train_loss": -5.64081335067749, "global_step": 44921, "epoch": 1069} {"train_loss": -5.642469882965088, "global_step": 44922, "epoch": 1069} {"train_loss": -5.66637659072876, "global_step": 44923, "epoch": 1069} {"train_loss": -5.689775466918945, "global_step": 44924, "epoch": 1069} {"train_loss": -5.558927536010742, "global_step": 44925, "epoch": 1069} {"train_loss": -5.58839750289917, "global_step": 44926, "epoch": 1069} {"train_loss": -5.514799118041992, "global_step": 44927, "epoch": 1069} {"train_loss": -5.707479476928711, "global_step": 44928, "epoch": 1069} {"train_loss": -5.633902072906494, "global_step": 44929, "epoch": 1069} {"train_loss": -5.661030292510986, "global_step": 44930, "epoch": 1069} {"train_loss": -5.646838188171387, "global_step": 44931, "epoch": 1069} {"train_loss": -5.556183815002441, "global_step": 44932, "epoch": 1069} {"train_loss": -5.7198262214660645, "global_step": 44933, "epoch": 1069} {"train_loss": -5.6328444480896, "global_step": 44934, "epoch": 1069} {"train_loss": -5.558873176574707, "global_step": 44935, "epoch": 1069} {"train_loss": -5.793095588684082, "global_step": 44936, "epoch": 1069} {"train_loss": -5.553962707519531, "global_step": 44937, "epoch": 1069} {"train_loss": -5.70329475402832, "global_step": 44938, "epoch": 1069} {"train_loss": -5.662194706144787, "global_step": 44939, "epoch": 1069, "val_loss": 73615.6640625} {"train_loss": -5.767072677612305, "global_step": 44940, "epoch": 1070} {"train_loss": -5.651351451873779, "global_step": 44941, "epoch": 1070} {"train_loss": -5.682973861694336, "global_step": 44942, "epoch": 1070} {"train_loss": -5.67831563949585, "global_step": 44943, "epoch": 1070} {"train_loss": -5.820940971374512, "global_step": 44944, "epoch": 1070} {"train_loss": -5.836650848388672, "global_step": 44945, "epoch": 1070} {"train_loss": -5.70526123046875, "global_step": 44946, "epoch": 1070} {"train_loss": -5.717621803283691, "global_step": 44947, "epoch": 1070} {"train_loss": -5.700593948364258, "global_step": 44948, "epoch": 1070} {"train_loss": -5.849730491638184, "global_step": 44949, "epoch": 1070} {"train_loss": -5.5525665283203125, "global_step": 44950, "epoch": 1070} {"train_loss": -5.654662132263184, "global_step": 44951, "epoch": 1070} {"train_loss": -5.6748151779174805, "global_step": 44952, "epoch": 1070} {"train_loss": -5.713772773742676, "global_step": 44953, "epoch": 1070} {"train_loss": -5.6576104164123535, "global_step": 44954, "epoch": 1070} {"train_loss": -5.6891584396362305, "global_step": 44955, "epoch": 1070} {"train_loss": -5.673412322998047, "global_step": 44956, "epoch": 1070} {"train_loss": -5.568930149078369, "global_step": 44957, "epoch": 1070} {"train_loss": -5.716657638549805, "global_step": 44958, "epoch": 1070} {"train_loss": -5.658105850219727, "global_step": 44959, "epoch": 1070} {"train_loss": -5.706653594970703, "global_step": 44960, "epoch": 1070} {"train_loss": -5.725449085235596, "global_step": 44961, "epoch": 1070} {"train_loss": -5.808547019958496, "global_step": 44962, "epoch": 1070} {"train_loss": -5.683246612548828, "global_step": 44963, "epoch": 1070} {"train_loss": -5.77036190032959, "global_step": 44964, "epoch": 1070} {"train_loss": -5.779751777648926, "global_step": 44965, "epoch": 1070} {"train_loss": -5.683643817901611, "global_step": 44966, "epoch": 1070} {"train_loss": -5.567441940307617, "global_step": 44967, "epoch": 1070} {"train_loss": -5.641850471496582, "global_step": 44968, "epoch": 1070} {"train_loss": -5.633575439453125, "global_step": 44969, "epoch": 1070} {"train_loss": -5.662240028381348, "global_step": 44970, "epoch": 1070} {"train_loss": -5.646590232849121, "global_step": 44971, "epoch": 1070} {"train_loss": -5.634228229522705, "global_step": 44972, "epoch": 1070} {"train_loss": -5.803103923797607, "global_step": 44973, "epoch": 1070} {"train_loss": -5.596008777618408, "global_step": 44974, "epoch": 1070} {"train_loss": -5.745532035827637, "global_step": 44975, "epoch": 1070} {"train_loss": -5.733798980712891, "global_step": 44976, "epoch": 1070} {"train_loss": -5.670525550842285, "global_step": 44977, "epoch": 1070} {"train_loss": -5.762419700622559, "global_step": 44978, "epoch": 1070} {"train_loss": -5.617439270019531, "global_step": 44979, "epoch": 1070} {"train_loss": -5.682342529296875, "global_step": 44980, "epoch": 1070} {"train_loss": -5.6970168976556685, "global_step": 44981, "epoch": 1070, "val_loss": 73902.1796875} {"train_loss": -5.728963851928711, "global_step": 44982, "epoch": 1071} {"train_loss": -5.791000843048096, "global_step": 44983, "epoch": 1071} {"train_loss": -5.769224166870117, "global_step": 44984, "epoch": 1071} {"train_loss": -5.636342525482178, "global_step": 44985, "epoch": 1071} {"train_loss": -5.6632609367370605, "global_step": 44986, "epoch": 1071} {"train_loss": -5.894336700439453, "global_step": 44987, "epoch": 1071} {"train_loss": -5.645300388336182, "global_step": 44988, "epoch": 1071} {"train_loss": -5.714418411254883, "global_step": 44989, "epoch": 1071} {"train_loss": -5.681168556213379, "global_step": 44990, "epoch": 1071} {"train_loss": -5.703646659851074, "global_step": 44991, "epoch": 1071} {"train_loss": -5.720245361328125, "global_step": 44992, "epoch": 1071} {"train_loss": -5.682468891143799, "global_step": 44993, "epoch": 1071} {"train_loss": -5.816986083984375, "global_step": 44994, "epoch": 1071} {"train_loss": -5.738206386566162, "global_step": 44995, "epoch": 1071} {"train_loss": -5.788957595825195, "global_step": 44996, "epoch": 1071} {"train_loss": -5.735530853271484, "global_step": 44997, "epoch": 1071} {"train_loss": -5.6694440841674805, "global_step": 44998, "epoch": 1071} {"train_loss": -5.815597057342529, "global_step": 44999, "epoch": 1071} {"train_loss": -5.796053886413574, "global_step": 45000, "epoch": 1071} {"train_loss": -5.7018938064575195, "global_step": 45001, "epoch": 1071} {"train_loss": -5.723916053771973, "global_step": 45002, "epoch": 1071} {"train_loss": -5.606921672821045, "global_step": 45003, "epoch": 1071} {"train_loss": -5.71212911605835, "global_step": 45004, "epoch": 1071} {"train_loss": -5.580486297607422, "global_step": 45005, "epoch": 1071} {"train_loss": -5.641483306884766, "global_step": 45006, "epoch": 1071} {"train_loss": -5.6946563720703125, "global_step": 45007, "epoch": 1071} {"train_loss": -5.604910850524902, "global_step": 45008, "epoch": 1071} {"train_loss": -5.545710563659668, "global_step": 45009, "epoch": 1071} {"train_loss": -5.618044853210449, "global_step": 45010, "epoch": 1071} {"train_loss": -5.497403144836426, "global_step": 45011, "epoch": 1071} {"train_loss": -5.623152732849121, "global_step": 45012, "epoch": 1071} {"train_loss": -5.70349645614624, "global_step": 45013, "epoch": 1071} {"train_loss": -5.627599716186523, "global_step": 45014, "epoch": 1071} {"train_loss": -5.61759614944458, "global_step": 45015, "epoch": 1071} {"train_loss": -5.311680793762207, "global_step": 45016, "epoch": 1071} {"train_loss": -5.768560409545898, "global_step": 45017, "epoch": 1071} {"train_loss": -5.540534019470215, "global_step": 45018, "epoch": 1071} {"train_loss": -5.625773906707764, "global_step": 45019, "epoch": 1071} {"train_loss": -5.6835408210754395, "global_step": 45020, "epoch": 1071} {"train_loss": -5.673783302307129, "global_step": 45021, "epoch": 1071} {"train_loss": -5.618399620056152, "global_step": 45022, "epoch": 1071} {"train_loss": -5.677489223934355, "global_step": 45023, "epoch": 1071, "val_loss": 74355.5078125} {"train_loss": -5.58599853515625, "global_step": 45024, "epoch": 1072} {"train_loss": -5.723866939544678, "global_step": 45025, "epoch": 1072} {"train_loss": -5.655853271484375, "global_step": 45026, "epoch": 1072} {"train_loss": -5.447487831115723, "global_step": 45027, "epoch": 1072} {"train_loss": -5.703431129455566, "global_step": 45028, "epoch": 1072} {"train_loss": -5.677151679992676, "global_step": 45029, "epoch": 1072} {"train_loss": -5.63475227355957, "global_step": 45030, "epoch": 1072} {"train_loss": -5.700285911560059, "global_step": 45031, "epoch": 1072} {"train_loss": -5.6993327140808105, "global_step": 45032, "epoch": 1072} {"train_loss": -5.525129795074463, "global_step": 45033, "epoch": 1072} {"train_loss": -5.69969367980957, "global_step": 45034, "epoch": 1072} {"train_loss": -5.655730247497559, "global_step": 45035, "epoch": 1072} {"train_loss": -5.755129337310791, "global_step": 45036, "epoch": 1072} {"train_loss": -5.791480541229248, "global_step": 45037, "epoch": 1072} {"train_loss": -5.758956432342529, "global_step": 45038, "epoch": 1072} {"train_loss": -5.661870002746582, "global_step": 45039, "epoch": 1072} {"train_loss": -5.620281219482422, "global_step": 45040, "epoch": 1072} {"train_loss": -5.766928195953369, "global_step": 45041, "epoch": 1072} {"train_loss": -5.656525135040283, "global_step": 45042, "epoch": 1072} {"train_loss": -5.685098648071289, "global_step": 45043, "epoch": 1072} {"train_loss": -5.544282913208008, "global_step": 45044, "epoch": 1072} {"train_loss": -5.669422149658203, "global_step": 45045, "epoch": 1072} {"train_loss": -5.663268566131592, "global_step": 45046, "epoch": 1072} {"train_loss": -5.70738410949707, "global_step": 45047, "epoch": 1072} {"train_loss": -5.629225254058838, "global_step": 45048, "epoch": 1072} {"train_loss": -5.560406684875488, "global_step": 45049, "epoch": 1072} {"train_loss": -5.63326358795166, "global_step": 45050, "epoch": 1072} {"train_loss": -5.667285442352295, "global_step": 45051, "epoch": 1072} {"train_loss": -5.648975372314453, "global_step": 45052, "epoch": 1072} {"train_loss": -5.756899833679199, "global_step": 45053, "epoch": 1072} {"train_loss": -5.6490349769592285, "global_step": 45054, "epoch": 1072} {"train_loss": -5.741545677185059, "global_step": 45055, "epoch": 1072} {"train_loss": -5.7543487548828125, "global_step": 45056, "epoch": 1072} {"train_loss": -5.693243980407715, "global_step": 45057, "epoch": 1072} {"train_loss": -5.815357208251953, "global_step": 45058, "epoch": 1072} {"train_loss": -5.605800628662109, "global_step": 45059, "epoch": 1072} {"train_loss": -5.663776874542236, "global_step": 45060, "epoch": 1072} {"train_loss": -5.623046875, "global_step": 45061, "epoch": 1072} {"train_loss": -5.777929306030273, "global_step": 45062, "epoch": 1072} {"train_loss": -5.768387794494629, "global_step": 45063, "epoch": 1072} {"train_loss": -5.697808265686035, "global_step": 45064, "epoch": 1072} {"train_loss": -5.676825228191557, "global_step": 45065, "epoch": 1072, "val_loss": 74207.5546875} {"train_loss": -5.736025810241699, "global_step": 45066, "epoch": 1073} {"train_loss": -5.762129306793213, "global_step": 45067, "epoch": 1073} {"train_loss": -5.667628288269043, "global_step": 45068, "epoch": 1073} {"train_loss": -5.791462421417236, "global_step": 45069, "epoch": 1073} {"train_loss": -5.695843696594238, "global_step": 45070, "epoch": 1073} {"train_loss": -5.620455265045166, "global_step": 45071, "epoch": 1073} {"train_loss": -5.602687358856201, "global_step": 45072, "epoch": 1073} {"train_loss": -5.7784929275512695, "global_step": 45073, "epoch": 1073} {"train_loss": -5.710140228271484, "global_step": 45074, "epoch": 1073} {"train_loss": -5.801506996154785, "global_step": 45075, "epoch": 1073} {"train_loss": -5.653024673461914, "global_step": 45076, "epoch": 1073} {"train_loss": -5.564925193786621, "global_step": 45077, "epoch": 1073} {"train_loss": -5.722709655761719, "global_step": 45078, "epoch": 1073} {"train_loss": -5.732903003692627, "global_step": 45079, "epoch": 1073} {"train_loss": -5.795663356781006, "global_step": 45080, "epoch": 1073} {"train_loss": -5.683259010314941, "global_step": 45081, "epoch": 1073} {"train_loss": -5.723505973815918, "global_step": 45082, "epoch": 1073} {"train_loss": -5.739589691162109, "global_step": 45083, "epoch": 1073} {"train_loss": -5.753507614135742, "global_step": 45084, "epoch": 1073} {"train_loss": -5.5590620040893555, "global_step": 45085, "epoch": 1073} {"train_loss": -5.583970069885254, "global_step": 45086, "epoch": 1073} {"train_loss": -5.700572490692139, "global_step": 45087, "epoch": 1073} {"train_loss": -5.65465784072876, "global_step": 45088, "epoch": 1073} {"train_loss": -5.654289245605469, "global_step": 45089, "epoch": 1073} {"train_loss": -5.665048122406006, "global_step": 45090, "epoch": 1073} {"train_loss": -5.75356388092041, "global_step": 45091, "epoch": 1073} {"train_loss": -5.792346000671387, "global_step": 45092, "epoch": 1073} {"train_loss": -5.724871635437012, "global_step": 45093, "epoch": 1073} {"train_loss": -5.648711204528809, "global_step": 45094, "epoch": 1073} {"train_loss": -5.774111270904541, "global_step": 45095, "epoch": 1073} {"train_loss": -5.732508659362793, "global_step": 45096, "epoch": 1073} {"train_loss": -5.640800476074219, "global_step": 45097, "epoch": 1073} {"train_loss": -5.710599899291992, "global_step": 45098, "epoch": 1073} {"train_loss": -5.767902851104736, "global_step": 45099, "epoch": 1073} {"train_loss": -5.645205974578857, "global_step": 45100, "epoch": 1073} {"train_loss": -5.601949691772461, "global_step": 45101, "epoch": 1073} {"train_loss": -5.685532569885254, "global_step": 45102, "epoch": 1073} {"train_loss": -5.767876625061035, "global_step": 45103, "epoch": 1073} {"train_loss": -5.6873040199279785, "global_step": 45104, "epoch": 1073} {"train_loss": -5.646468162536621, "global_step": 45105, "epoch": 1073} {"train_loss": -5.786025047302246, "global_step": 45106, "epoch": 1073} {"train_loss": -5.699105183283488, "global_step": 45107, "epoch": 1073, "val_loss": 73873.375} {"train_loss": -5.682138442993164, "global_step": 45108, "epoch": 1074} {"train_loss": -5.576458930969238, "global_step": 45109, "epoch": 1074} {"train_loss": -5.740538597106934, "global_step": 45110, "epoch": 1074} {"train_loss": -5.625804424285889, "global_step": 45111, "epoch": 1074} {"train_loss": -5.682852268218994, "global_step": 45112, "epoch": 1074} {"train_loss": -5.801792144775391, "global_step": 45113, "epoch": 1074} {"train_loss": -5.615752220153809, "global_step": 45114, "epoch": 1074} {"train_loss": -5.699888706207275, "global_step": 45115, "epoch": 1074} {"train_loss": -5.733057022094727, "global_step": 45116, "epoch": 1074} {"train_loss": -5.782785892486572, "global_step": 45117, "epoch": 1074} {"train_loss": -5.659084796905518, "global_step": 45118, "epoch": 1074} {"train_loss": -5.557936668395996, "global_step": 45119, "epoch": 1074} {"train_loss": -5.701576232910156, "global_step": 45120, "epoch": 1074} {"train_loss": -5.6092329025268555, "global_step": 45121, "epoch": 1074} {"train_loss": -5.539735794067383, "global_step": 45122, "epoch": 1074} {"train_loss": -5.75521183013916, "global_step": 45123, "epoch": 1074} {"train_loss": -5.85648250579834, "global_step": 45124, "epoch": 1074} {"train_loss": -5.640986442565918, "global_step": 45125, "epoch": 1074} {"train_loss": -5.591891288757324, "global_step": 45126, "epoch": 1074} {"train_loss": -5.74570369720459, "global_step": 45127, "epoch": 1074} {"train_loss": -5.713404178619385, "global_step": 45128, "epoch": 1074} {"train_loss": -5.6727294921875, "global_step": 45129, "epoch": 1074} {"train_loss": -5.71079683303833, "global_step": 45130, "epoch": 1074} {"train_loss": -5.72315788269043, "global_step": 45131, "epoch": 1074} {"train_loss": -5.648316860198975, "global_step": 45132, "epoch": 1074} {"train_loss": -5.8646769523620605, "global_step": 45133, "epoch": 1074} {"train_loss": -5.663207530975342, "global_step": 45134, "epoch": 1074} {"train_loss": -5.69093132019043, "global_step": 45135, "epoch": 1074} {"train_loss": -5.824769020080566, "global_step": 45136, "epoch": 1074} {"train_loss": -5.495237827301025, "global_step": 45137, "epoch": 1074} {"train_loss": -5.657283782958984, "global_step": 45138, "epoch": 1074} {"train_loss": -5.797659397125244, "global_step": 45139, "epoch": 1074} {"train_loss": -5.7436065673828125, "global_step": 45140, "epoch": 1074} {"train_loss": -5.6136064529418945, "global_step": 45141, "epoch": 1074} {"train_loss": -5.677403450012207, "global_step": 45142, "epoch": 1074} {"train_loss": -5.540754318237305, "global_step": 45143, "epoch": 1074} {"train_loss": -5.733920097351074, "global_step": 45144, "epoch": 1074} {"train_loss": -5.620328903198242, "global_step": 45145, "epoch": 1074} {"train_loss": -5.797005653381348, "global_step": 45146, "epoch": 1074} {"train_loss": -5.438913345336914, "global_step": 45147, "epoch": 1074} {"train_loss": -5.6641387939453125, "global_step": 45148, "epoch": 1074} {"train_loss": -5.67958022299267, "global_step": 45149, "epoch": 1074, "val_loss": 75516.484375} {"train_loss": -5.3859333992004395, "global_step": 45150, "epoch": 1075} {"train_loss": -5.719579696655273, "global_step": 45151, "epoch": 1075} {"train_loss": -5.529094696044922, "global_step": 45152, "epoch": 1075} {"train_loss": -5.537949085235596, "global_step": 45153, "epoch": 1075} {"train_loss": -5.574354648590088, "global_step": 45154, "epoch": 1075} {"train_loss": -5.5217132568359375, "global_step": 45155, "epoch": 1075} {"train_loss": -5.4866228103637695, "global_step": 45156, "epoch": 1075} {"train_loss": -5.491567611694336, "global_step": 45157, "epoch": 1075} {"train_loss": -5.710788726806641, "global_step": 45158, "epoch": 1075} {"train_loss": -5.471060276031494, "global_step": 45159, "epoch": 1075} {"train_loss": -5.737255096435547, "global_step": 45160, "epoch": 1075} {"train_loss": -5.476633071899414, "global_step": 45161, "epoch": 1075} {"train_loss": -5.70089054107666, "global_step": 45162, "epoch": 1075} {"train_loss": -5.632437705993652, "global_step": 45163, "epoch": 1075} {"train_loss": -5.632121562957764, "global_step": 45164, "epoch": 1075} {"train_loss": -5.67850923538208, "global_step": 45165, "epoch": 1075} {"train_loss": -5.70658016204834, "global_step": 45166, "epoch": 1075} {"train_loss": -5.63304328918457, "global_step": 45167, "epoch": 1075} {"train_loss": -5.699481010437012, "global_step": 45168, "epoch": 1075} {"train_loss": -5.502377986907959, "global_step": 45169, "epoch": 1075} {"train_loss": -5.702449321746826, "global_step": 45170, "epoch": 1075} {"train_loss": -5.646437644958496, "global_step": 45171, "epoch": 1075} {"train_loss": -5.61488151550293, "global_step": 45172, "epoch": 1075} {"train_loss": -5.502812385559082, "global_step": 45173, "epoch": 1075} {"train_loss": -5.6098127365112305, "global_step": 45174, "epoch": 1075} {"train_loss": -5.637413501739502, "global_step": 45175, "epoch": 1075} {"train_loss": -5.68269157409668, "global_step": 45176, "epoch": 1075} {"train_loss": -5.647585868835449, "global_step": 45177, "epoch": 1075} {"train_loss": -5.580381393432617, "global_step": 45178, "epoch": 1075} {"train_loss": -5.586494445800781, "global_step": 45179, "epoch": 1075} {"train_loss": -5.663139343261719, "global_step": 45180, "epoch": 1075} {"train_loss": -5.498204231262207, "global_step": 45181, "epoch": 1075} {"train_loss": -5.648653984069824, "global_step": 45182, "epoch": 1075} {"train_loss": -5.756044387817383, "global_step": 45183, "epoch": 1075} {"train_loss": -5.6740875244140625, "global_step": 45184, "epoch": 1075} {"train_loss": -5.6425018310546875, "global_step": 45185, "epoch": 1075} {"train_loss": -5.61746883392334, "global_step": 45186, "epoch": 1075} {"train_loss": -5.760165214538574, "global_step": 45187, "epoch": 1075} {"train_loss": -5.674539566040039, "global_step": 45188, "epoch": 1075} {"train_loss": -5.710633754730225, "global_step": 45189, "epoch": 1075} {"train_loss": -5.744375228881836, "global_step": 45190, "epoch": 1075} {"train_loss": -5.6226317428407215, "global_step": 45191, "epoch": 1075, "val_loss": 73723.46875} {"train_loss": -5.800302028656006, "global_step": 45192, "epoch": 1076} {"train_loss": -5.650720596313477, "global_step": 45193, "epoch": 1076} {"train_loss": -5.662981033325195, "global_step": 45194, "epoch": 1076} {"train_loss": -5.701242446899414, "global_step": 45195, "epoch": 1076} {"train_loss": -5.61280632019043, "global_step": 45196, "epoch": 1076} {"train_loss": -5.675287246704102, "global_step": 45197, "epoch": 1076} {"train_loss": -5.78469181060791, "global_step": 45198, "epoch": 1076} {"train_loss": -5.75968074798584, "global_step": 45199, "epoch": 1076} {"train_loss": -5.725531578063965, "global_step": 45200, "epoch": 1076} {"train_loss": -5.831843376159668, "global_step": 45201, "epoch": 1076} {"train_loss": -5.496922492980957, "global_step": 45202, "epoch": 1076} {"train_loss": -5.723765850067139, "global_step": 45203, "epoch": 1076} {"train_loss": -5.695224285125732, "global_step": 45204, "epoch": 1076} {"train_loss": -5.5859880447387695, "global_step": 45205, "epoch": 1076} {"train_loss": -5.6691203117370605, "global_step": 45206, "epoch": 1076} {"train_loss": -5.673460960388184, "global_step": 45207, "epoch": 1076} {"train_loss": -5.770707607269287, "global_step": 45208, "epoch": 1076} {"train_loss": -5.753391265869141, "global_step": 45209, "epoch": 1076} {"train_loss": -5.700394630432129, "global_step": 45210, "epoch": 1076} {"train_loss": -5.7080888748168945, "global_step": 45211, "epoch": 1076} {"train_loss": -5.617915630340576, "global_step": 45212, "epoch": 1076} {"train_loss": -5.615020751953125, "global_step": 45213, "epoch": 1076} {"train_loss": -5.715921878814697, "global_step": 45214, "epoch": 1076} {"train_loss": -5.753235816955566, "global_step": 45215, "epoch": 1076} {"train_loss": -5.613513946533203, "global_step": 45216, "epoch": 1076} {"train_loss": -5.639495372772217, "global_step": 45217, "epoch": 1076} {"train_loss": -5.682327747344971, "global_step": 45218, "epoch": 1076} {"train_loss": -5.7171478271484375, "global_step": 45219, "epoch": 1076} {"train_loss": -5.779486656188965, "global_step": 45220, "epoch": 1076} {"train_loss": -5.814379692077637, "global_step": 45221, "epoch": 1076} {"train_loss": -5.518525123596191, "global_step": 45222, "epoch": 1076} {"train_loss": -5.597061634063721, "global_step": 45223, "epoch": 1076} {"train_loss": -5.623626708984375, "global_step": 45224, "epoch": 1076} {"train_loss": -5.667054176330566, "global_step": 45225, "epoch": 1076} {"train_loss": -5.706116676330566, "global_step": 45226, "epoch": 1076} {"train_loss": -5.762378692626953, "global_step": 45227, "epoch": 1076} {"train_loss": -5.584926128387451, "global_step": 45228, "epoch": 1076} {"train_loss": -5.6442179679870605, "global_step": 45229, "epoch": 1076} {"train_loss": -5.684123992919922, "global_step": 45230, "epoch": 1076} {"train_loss": -5.79274320602417, "global_step": 45231, "epoch": 1076} {"train_loss": -5.737128257751465, "global_step": 45232, "epoch": 1076} {"train_loss": -5.68960284051441, "global_step": 45233, "epoch": 1076, "val_loss": 74296.9921875} {"train_loss": -5.7403564453125, "global_step": 45234, "epoch": 1077} {"train_loss": -5.671194076538086, "global_step": 45235, "epoch": 1077} {"train_loss": -5.831278324127197, "global_step": 45236, "epoch": 1077} {"train_loss": -5.710752964019775, "global_step": 45237, "epoch": 1077} {"train_loss": -5.618688583374023, "global_step": 45238, "epoch": 1077} {"train_loss": -5.713111877441406, "global_step": 45239, "epoch": 1077} {"train_loss": -5.669228553771973, "global_step": 45240, "epoch": 1077} {"train_loss": -5.767637729644775, "global_step": 45241, "epoch": 1077} {"train_loss": -5.687923431396484, "global_step": 45242, "epoch": 1077} {"train_loss": -5.666961669921875, "global_step": 45243, "epoch": 1077} {"train_loss": -5.636782646179199, "global_step": 45244, "epoch": 1077} {"train_loss": -5.748777389526367, "global_step": 45245, "epoch": 1077} {"train_loss": -5.791692733764648, "global_step": 45246, "epoch": 1077} {"train_loss": -5.528816223144531, "global_step": 45247, "epoch": 1077} {"train_loss": -5.7541608810424805, "global_step": 45248, "epoch": 1077} {"train_loss": -5.711611747741699, "global_step": 45249, "epoch": 1077} {"train_loss": -5.556475639343262, "global_step": 45250, "epoch": 1077} {"train_loss": -5.873064994812012, "global_step": 45251, "epoch": 1077} {"train_loss": -5.733634948730469, "global_step": 45252, "epoch": 1077} {"train_loss": -5.7629313468933105, "global_step": 45253, "epoch": 1077} {"train_loss": -5.678703308105469, "global_step": 45254, "epoch": 1077} {"train_loss": -5.6478424072265625, "global_step": 45255, "epoch": 1077} {"train_loss": -5.730010509490967, "global_step": 45256, "epoch": 1077} {"train_loss": -5.714943885803223, "global_step": 45257, "epoch": 1077} {"train_loss": -5.728537082672119, "global_step": 45258, "epoch": 1077} {"train_loss": -5.728822708129883, "global_step": 45259, "epoch": 1077} {"train_loss": -5.756180763244629, "global_step": 45260, "epoch": 1077} {"train_loss": -5.850773334503174, "global_step": 45261, "epoch": 1077} {"train_loss": -5.737821578979492, "global_step": 45262, "epoch": 1077} {"train_loss": -5.696810722351074, "global_step": 45263, "epoch": 1077} {"train_loss": -5.680047988891602, "global_step": 45264, "epoch": 1077} {"train_loss": -5.796834945678711, "global_step": 45265, "epoch": 1077} {"train_loss": -5.650246620178223, "global_step": 45266, "epoch": 1077} {"train_loss": -5.747960567474365, "global_step": 45267, "epoch": 1077} {"train_loss": -5.6586689949035645, "global_step": 45268, "epoch": 1077} {"train_loss": -5.6360859870910645, "global_step": 45269, "epoch": 1077} {"train_loss": -5.659486293792725, "global_step": 45270, "epoch": 1077} {"train_loss": -5.631929397583008, "global_step": 45271, "epoch": 1077} {"train_loss": -5.732936859130859, "global_step": 45272, "epoch": 1077} {"train_loss": -5.591910362243652, "global_step": 45273, "epoch": 1077} {"train_loss": -5.6006269454956055, "global_step": 45274, "epoch": 1077} {"train_loss": -5.7032589344751266, "global_step": 45275, "epoch": 1077, "val_loss": 74476.34375} {"train_loss": -5.602624893188477, "global_step": 45276, "epoch": 1078} {"train_loss": -5.655092239379883, "global_step": 45277, "epoch": 1078} {"train_loss": -5.631975173950195, "global_step": 45278, "epoch": 1078} {"train_loss": -5.658766746520996, "global_step": 45279, "epoch": 1078} {"train_loss": -5.671442985534668, "global_step": 45280, "epoch": 1078} {"train_loss": -5.799454689025879, "global_step": 45281, "epoch": 1078} {"train_loss": -5.720293045043945, "global_step": 45282, "epoch": 1078} {"train_loss": -5.746908664703369, "global_step": 45283, "epoch": 1078} {"train_loss": -5.716683387756348, "global_step": 45284, "epoch": 1078} {"train_loss": -5.668593883514404, "global_step": 45285, "epoch": 1078} {"train_loss": -5.524435997009277, "global_step": 45286, "epoch": 1078} {"train_loss": -5.74227237701416, "global_step": 45287, "epoch": 1078} {"train_loss": -5.7858381271362305, "global_step": 45288, "epoch": 1078} {"train_loss": -5.747004508972168, "global_step": 45289, "epoch": 1078} {"train_loss": -5.760976314544678, "global_step": 45290, "epoch": 1078} {"train_loss": -5.737096786499023, "global_step": 45291, "epoch": 1078} {"train_loss": -5.622614860534668, "global_step": 45292, "epoch": 1078} {"train_loss": -5.730119705200195, "global_step": 45293, "epoch": 1078} {"train_loss": -5.729401588439941, "global_step": 45294, "epoch": 1078} {"train_loss": -5.715324878692627, "global_step": 45295, "epoch": 1078} {"train_loss": -5.683964252471924, "global_step": 45296, "epoch": 1078} {"train_loss": -5.665289402008057, "global_step": 45297, "epoch": 1078} {"train_loss": -5.666065216064453, "global_step": 45298, "epoch": 1078} {"train_loss": -5.742742538452148, "global_step": 45299, "epoch": 1078} {"train_loss": -5.654575347900391, "global_step": 45300, "epoch": 1078} {"train_loss": -5.733944416046143, "global_step": 45301, "epoch": 1078} {"train_loss": -5.59564733505249, "global_step": 45302, "epoch": 1078} {"train_loss": -5.683902740478516, "global_step": 45303, "epoch": 1078} {"train_loss": -5.679301738739014, "global_step": 45304, "epoch": 1078} {"train_loss": -5.796958923339844, "global_step": 45305, "epoch": 1078} {"train_loss": -5.627323150634766, "global_step": 45306, "epoch": 1078} {"train_loss": -5.600214004516602, "global_step": 45307, "epoch": 1078} {"train_loss": -5.603089809417725, "global_step": 45308, "epoch": 1078} {"train_loss": -5.664159774780273, "global_step": 45309, "epoch": 1078} {"train_loss": -5.79597282409668, "global_step": 45310, "epoch": 1078} {"train_loss": -5.599725246429443, "global_step": 45311, "epoch": 1078} {"train_loss": -5.613157272338867, "global_step": 45312, "epoch": 1078} {"train_loss": -5.724000930786133, "global_step": 45313, "epoch": 1078} {"train_loss": -5.672825813293457, "global_step": 45314, "epoch": 1078} {"train_loss": -5.584492206573486, "global_step": 45315, "epoch": 1078} {"train_loss": -5.702866077423096, "global_step": 45316, "epoch": 1078} {"train_loss": -5.68363322530474, "global_step": 45317, "epoch": 1078, "val_loss": 74053.03125} {"train_loss": -5.583983421325684, "global_step": 45318, "epoch": 1079} {"train_loss": -5.669195175170898, "global_step": 45319, "epoch": 1079} {"train_loss": -5.67880916595459, "global_step": 45320, "epoch": 1079} {"train_loss": -5.7503767013549805, "global_step": 45321, "epoch": 1079} {"train_loss": -5.7262187004089355, "global_step": 45322, "epoch": 1079} {"train_loss": -5.684709072113037, "global_step": 45323, "epoch": 1079} {"train_loss": -5.681330680847168, "global_step": 45324, "epoch": 1079} {"train_loss": -5.723729610443115, "global_step": 45325, "epoch": 1079} {"train_loss": -5.584321975708008, "global_step": 45326, "epoch": 1079} {"train_loss": -5.581630706787109, "global_step": 45327, "epoch": 1079} {"train_loss": -5.636641979217529, "global_step": 45328, "epoch": 1079} {"train_loss": -5.515200614929199, "global_step": 45329, "epoch": 1079} {"train_loss": -5.546662330627441, "global_step": 45330, "epoch": 1079} {"train_loss": -5.431853294372559, "global_step": 45331, "epoch": 1079} {"train_loss": -5.62286376953125, "global_step": 45332, "epoch": 1079} {"train_loss": -5.592586994171143, "global_step": 45333, "epoch": 1079} {"train_loss": -5.599844932556152, "global_step": 45334, "epoch": 1079} {"train_loss": -5.706663608551025, "global_step": 45335, "epoch": 1079} {"train_loss": -5.525086879730225, "global_step": 45336, "epoch": 1079} {"train_loss": -5.6790618896484375, "global_step": 45337, "epoch": 1079} {"train_loss": -5.69118595123291, "global_step": 45338, "epoch": 1079} {"train_loss": -5.571994781494141, "global_step": 45339, "epoch": 1079} {"train_loss": -5.665278911590576, "global_step": 45340, "epoch": 1079} {"train_loss": -5.647683143615723, "global_step": 45341, "epoch": 1079} {"train_loss": -5.6433916091918945, "global_step": 45342, "epoch": 1079} {"train_loss": -5.603938579559326, "global_step": 45343, "epoch": 1079} {"train_loss": -5.732215404510498, "global_step": 45344, "epoch": 1079} {"train_loss": -5.485713481903076, "global_step": 45345, "epoch": 1079} {"train_loss": -5.802480697631836, "global_step": 45346, "epoch": 1079} {"train_loss": -5.725905418395996, "global_step": 45347, "epoch": 1079} {"train_loss": -5.64920711517334, "global_step": 45348, "epoch": 1079} {"train_loss": -5.659810543060303, "global_step": 45349, "epoch": 1079} {"train_loss": -5.878607749938965, "global_step": 45350, "epoch": 1079} {"train_loss": -5.756252765655518, "global_step": 45351, "epoch": 1079} {"train_loss": -5.8283538818359375, "global_step": 45352, "epoch": 1079} {"train_loss": -5.799592971801758, "global_step": 45353, "epoch": 1079} {"train_loss": -5.68261194229126, "global_step": 45354, "epoch": 1079} {"train_loss": -5.840538024902344, "global_step": 45355, "epoch": 1079} {"train_loss": -5.790039539337158, "global_step": 45356, "epoch": 1079} {"train_loss": -5.717828750610352, "global_step": 45357, "epoch": 1079} {"train_loss": -5.726515769958496, "global_step": 45358, "epoch": 1079} {"train_loss": -5.669701508113316, "global_step": 45359, "epoch": 1079, "val_loss": 74165.6953125} {"train_loss": -5.767769813537598, "global_step": 45360, "epoch": 1080} {"train_loss": -5.767236232757568, "global_step": 45361, "epoch": 1080} {"train_loss": -5.690656661987305, "global_step": 45362, "epoch": 1080} {"train_loss": -5.730386734008789, "global_step": 45363, "epoch": 1080} {"train_loss": -5.7322211265563965, "global_step": 45364, "epoch": 1080} {"train_loss": -5.743927478790283, "global_step": 45365, "epoch": 1080} {"train_loss": -5.823581218719482, "global_step": 45366, "epoch": 1080} {"train_loss": -5.7351861000061035, "global_step": 45367, "epoch": 1080} {"train_loss": -5.748958587646484, "global_step": 45368, "epoch": 1080} {"train_loss": -5.7079668045043945, "global_step": 45369, "epoch": 1080} {"train_loss": -5.676253318786621, "global_step": 45370, "epoch": 1080} {"train_loss": -5.694202423095703, "global_step": 45371, "epoch": 1080} {"train_loss": -5.724972724914551, "global_step": 45372, "epoch": 1080} {"train_loss": -5.630331993103027, "global_step": 45373, "epoch": 1080} {"train_loss": -5.680538654327393, "global_step": 45374, "epoch": 1080} {"train_loss": -5.6782050132751465, "global_step": 45375, "epoch": 1080} {"train_loss": -5.836243629455566, "global_step": 45376, "epoch": 1080} {"train_loss": -5.751542568206787, "global_step": 45377, "epoch": 1080} {"train_loss": -5.659359931945801, "global_step": 45378, "epoch": 1080} {"train_loss": -5.822367191314697, "global_step": 45379, "epoch": 1080} {"train_loss": -5.740967750549316, "global_step": 45380, "epoch": 1080} {"train_loss": -5.741115093231201, "global_step": 45381, "epoch": 1080} {"train_loss": -5.835178852081299, "global_step": 45382, "epoch": 1080} {"train_loss": -5.744071960449219, "global_step": 45383, "epoch": 1080} {"train_loss": -5.790550231933594, "global_step": 45384, "epoch": 1080} {"train_loss": -5.587394714355469, "global_step": 45385, "epoch": 1080} {"train_loss": -5.81362771987915, "global_step": 45386, "epoch": 1080} {"train_loss": -5.690225601196289, "global_step": 45387, "epoch": 1080} {"train_loss": -5.59034538269043, "global_step": 45388, "epoch": 1080} {"train_loss": -5.6747541427612305, "global_step": 45389, "epoch": 1080} {"train_loss": -5.7706499099731445, "global_step": 45390, "epoch": 1080} {"train_loss": -5.8030476570129395, "global_step": 45391, "epoch": 1080} {"train_loss": -5.802031517028809, "global_step": 45392, "epoch": 1080} {"train_loss": -5.733266830444336, "global_step": 45393, "epoch": 1080} {"train_loss": -5.6265764236450195, "global_step": 45394, "epoch": 1080} {"train_loss": -5.6089277267456055, "global_step": 45395, "epoch": 1080} {"train_loss": -5.6699371337890625, "global_step": 45396, "epoch": 1080} {"train_loss": -5.738680362701416, "global_step": 45397, "epoch": 1080} {"train_loss": -5.627516269683838, "global_step": 45398, "epoch": 1080} {"train_loss": -5.8121232986450195, "global_step": 45399, "epoch": 1080} {"train_loss": -5.7556047439575195, "global_step": 45400, "epoch": 1080} {"train_loss": -5.7273078532446, "global_step": 45401, "epoch": 1080, "val_loss": 74141.1640625} {"train_loss": -5.755536079406738, "global_step": 45402, "epoch": 1081} {"train_loss": -5.735536575317383, "global_step": 45403, "epoch": 1081} {"train_loss": -5.563631057739258, "global_step": 45404, "epoch": 1081} {"train_loss": -5.571453094482422, "global_step": 45405, "epoch": 1081} {"train_loss": -5.64985466003418, "global_step": 45406, "epoch": 1081} {"train_loss": -5.694366455078125, "global_step": 45407, "epoch": 1081} {"train_loss": -5.4559407234191895, "global_step": 45408, "epoch": 1081} {"train_loss": -5.670535087585449, "global_step": 45409, "epoch": 1081} {"train_loss": -5.547996520996094, "global_step": 45410, "epoch": 1081} {"train_loss": -5.534544944763184, "global_step": 45411, "epoch": 1081} {"train_loss": -5.691643714904785, "global_step": 45412, "epoch": 1081} {"train_loss": -5.638306140899658, "global_step": 45413, "epoch": 1081} {"train_loss": -5.823843002319336, "global_step": 45414, "epoch": 1081} {"train_loss": -5.635806083679199, "global_step": 45415, "epoch": 1081} {"train_loss": -5.76090145111084, "global_step": 45416, "epoch": 1081} {"train_loss": -5.639609336853027, "global_step": 45417, "epoch": 1081} {"train_loss": -5.718109130859375, "global_step": 45418, "epoch": 1081} {"train_loss": -5.619894027709961, "global_step": 45419, "epoch": 1081} {"train_loss": -5.727206230163574, "global_step": 45420, "epoch": 1081} {"train_loss": -5.706215858459473, "global_step": 45421, "epoch": 1081} {"train_loss": -5.717487812042236, "global_step": 45422, "epoch": 1081} {"train_loss": -5.808238506317139, "global_step": 45423, "epoch": 1081} {"train_loss": -5.746568202972412, "global_step": 45424, "epoch": 1081} {"train_loss": -5.716639041900635, "global_step": 45425, "epoch": 1081} {"train_loss": -5.811361312866211, "global_step": 45426, "epoch": 1081} {"train_loss": -5.655605316162109, "global_step": 45427, "epoch": 1081} {"train_loss": -5.705389976501465, "global_step": 45428, "epoch": 1081} {"train_loss": -5.635310173034668, "global_step": 45429, "epoch": 1081} {"train_loss": -5.753835678100586, "global_step": 45430, "epoch": 1081} {"train_loss": -5.739877700805664, "global_step": 45431, "epoch": 1081} {"train_loss": -5.530716419219971, "global_step": 45432, "epoch": 1081} {"train_loss": -5.7599897384643555, "global_step": 45433, "epoch": 1081} {"train_loss": -5.700255393981934, "global_step": 45434, "epoch": 1081} {"train_loss": -5.5115966796875, "global_step": 45435, "epoch": 1081} {"train_loss": -5.731592178344727, "global_step": 45436, "epoch": 1081} {"train_loss": -5.563772201538086, "global_step": 45437, "epoch": 1081} {"train_loss": -5.706658840179443, "global_step": 45438, "epoch": 1081} {"train_loss": -5.7823100090026855, "global_step": 45439, "epoch": 1081} {"train_loss": -5.616827964782715, "global_step": 45440, "epoch": 1081} {"train_loss": -5.761523246765137, "global_step": 45441, "epoch": 1081} {"train_loss": -5.693739891052246, "global_step": 45442, "epoch": 1081} {"train_loss": -5.675767478488741, "global_step": 45443, "epoch": 1081, "val_loss": 73980.875} {"train_loss": -5.773648262023926, "global_step": 45444, "epoch": 1082} {"train_loss": -5.6723856925964355, "global_step": 45445, "epoch": 1082} {"train_loss": -5.7434282302856445, "global_step": 45446, "epoch": 1082} {"train_loss": -5.600349426269531, "global_step": 45447, "epoch": 1082} {"train_loss": -5.650846004486084, "global_step": 45448, "epoch": 1082} {"train_loss": -5.640966415405273, "global_step": 45449, "epoch": 1082} {"train_loss": -5.6621832847595215, "global_step": 45450, "epoch": 1082} {"train_loss": -5.737409591674805, "global_step": 45451, "epoch": 1082} {"train_loss": -5.743936538696289, "global_step": 45452, "epoch": 1082} {"train_loss": -5.632187843322754, "global_step": 45453, "epoch": 1082} {"train_loss": -5.6354475021362305, "global_step": 45454, "epoch": 1082} {"train_loss": -5.583751678466797, "global_step": 45455, "epoch": 1082} {"train_loss": -5.7607221603393555, "global_step": 45456, "epoch": 1082} {"train_loss": -5.664819240570068, "global_step": 45457, "epoch": 1082} {"train_loss": -5.699338912963867, "global_step": 45458, "epoch": 1082} {"train_loss": -5.663299560546875, "global_step": 45459, "epoch": 1082} {"train_loss": -5.836480140686035, "global_step": 45460, "epoch": 1082} {"train_loss": -5.816167831420898, "global_step": 45461, "epoch": 1082} {"train_loss": -5.724616050720215, "global_step": 45462, "epoch": 1082} {"train_loss": -5.757830619812012, "global_step": 45463, "epoch": 1082} {"train_loss": -5.780952453613281, "global_step": 45464, "epoch": 1082} {"train_loss": -5.683220386505127, "global_step": 45465, "epoch": 1082} {"train_loss": -5.7115983963012695, "global_step": 45466, "epoch": 1082} {"train_loss": -5.735062599182129, "global_step": 45467, "epoch": 1082} {"train_loss": -5.693044662475586, "global_step": 45468, "epoch": 1082} {"train_loss": -5.7530198097229, "global_step": 45469, "epoch": 1082} {"train_loss": -5.776717662811279, "global_step": 45470, "epoch": 1082} {"train_loss": -5.601527214050293, "global_step": 45471, "epoch": 1082} {"train_loss": -5.6492509841918945, "global_step": 45472, "epoch": 1082} {"train_loss": -5.805115699768066, "global_step": 45473, "epoch": 1082} {"train_loss": -5.596071243286133, "global_step": 45474, "epoch": 1082} {"train_loss": -5.707588195800781, "global_step": 45475, "epoch": 1082} {"train_loss": -5.7133684158325195, "global_step": 45476, "epoch": 1082} {"train_loss": -5.6997175216674805, "global_step": 45477, "epoch": 1082} {"train_loss": -5.68162202835083, "global_step": 45478, "epoch": 1082} {"train_loss": -5.751337051391602, "global_step": 45479, "epoch": 1082} {"train_loss": -5.492753028869629, "global_step": 45480, "epoch": 1082} {"train_loss": -5.794585227966309, "global_step": 45481, "epoch": 1082} {"train_loss": -5.614893913269043, "global_step": 45482, "epoch": 1082} {"train_loss": -5.512319564819336, "global_step": 45483, "epoch": 1082} {"train_loss": -5.715689182281494, "global_step": 45484, "epoch": 1082} {"train_loss": -5.6932371116819835, "global_step": 45485, "epoch": 1082, "val_loss": 74228.390625} {"train_loss": -5.593070983886719, "global_step": 45486, "epoch": 1083} {"train_loss": -5.639354705810547, "global_step": 45487, "epoch": 1083} {"train_loss": -5.7549591064453125, "global_step": 45488, "epoch": 1083} {"train_loss": -5.617920875549316, "global_step": 45489, "epoch": 1083} {"train_loss": -5.705132484436035, "global_step": 45490, "epoch": 1083} {"train_loss": -5.6245880126953125, "global_step": 45491, "epoch": 1083} {"train_loss": -5.662597179412842, "global_step": 45492, "epoch": 1083} {"train_loss": -5.560337543487549, "global_step": 45493, "epoch": 1083} {"train_loss": -5.740048408508301, "global_step": 45494, "epoch": 1083} {"train_loss": -5.752838134765625, "global_step": 45495, "epoch": 1083} {"train_loss": -5.660519599914551, "global_step": 45496, "epoch": 1083} {"train_loss": -5.753253936767578, "global_step": 45497, "epoch": 1083} {"train_loss": -5.628303527832031, "global_step": 45498, "epoch": 1083} {"train_loss": -5.728750228881836, "global_step": 45499, "epoch": 1083} {"train_loss": -5.760473251342773, "global_step": 45500, "epoch": 1083} {"train_loss": -5.682454586029053, "global_step": 45501, "epoch": 1083} {"train_loss": -5.66038703918457, "global_step": 45502, "epoch": 1083} {"train_loss": -5.692978858947754, "global_step": 45503, "epoch": 1083} {"train_loss": -5.738763809204102, "global_step": 45504, "epoch": 1083} {"train_loss": -5.701608657836914, "global_step": 45505, "epoch": 1083} {"train_loss": -5.6327972412109375, "global_step": 45506, "epoch": 1083} {"train_loss": -5.67599630355835, "global_step": 45507, "epoch": 1083} {"train_loss": -5.803656578063965, "global_step": 45508, "epoch": 1083} {"train_loss": -5.671796798706055, "global_step": 45509, "epoch": 1083} {"train_loss": -5.633476257324219, "global_step": 45510, "epoch": 1083} {"train_loss": -5.671413898468018, "global_step": 45511, "epoch": 1083} {"train_loss": -5.6265106201171875, "global_step": 45512, "epoch": 1083} {"train_loss": -5.732542037963867, "global_step": 45513, "epoch": 1083} {"train_loss": -5.7365617752075195, "global_step": 45514, "epoch": 1083} {"train_loss": -5.491128444671631, "global_step": 45515, "epoch": 1083} {"train_loss": -5.700047969818115, "global_step": 45516, "epoch": 1083} {"train_loss": -5.606750965118408, "global_step": 45517, "epoch": 1083} {"train_loss": -5.719336032867432, "global_step": 45518, "epoch": 1083} {"train_loss": -5.757563591003418, "global_step": 45519, "epoch": 1083} {"train_loss": -5.5871968269348145, "global_step": 45520, "epoch": 1083} {"train_loss": -5.718329429626465, "global_step": 45521, "epoch": 1083} {"train_loss": -5.675819396972656, "global_step": 45522, "epoch": 1083} {"train_loss": -5.763805389404297, "global_step": 45523, "epoch": 1083} {"train_loss": -5.681416988372803, "global_step": 45524, "epoch": 1083} {"train_loss": -5.707912445068359, "global_step": 45525, "epoch": 1083} {"train_loss": -5.794149398803711, "global_step": 45526, "epoch": 1083} {"train_loss": -5.684357711247036, "global_step": 45527, "epoch": 1083, "val_loss": 74260.71875} {"train_loss": -5.748805046081543, "global_step": 45528, "epoch": 1084} {"train_loss": -5.741800308227539, "global_step": 45529, "epoch": 1084} {"train_loss": -5.730029582977295, "global_step": 45530, "epoch": 1084} {"train_loss": -5.821892738342285, "global_step": 45531, "epoch": 1084} {"train_loss": -5.684657573699951, "global_step": 45532, "epoch": 1084} {"train_loss": -5.7622857093811035, "global_step": 45533, "epoch": 1084} {"train_loss": -5.757689476013184, "global_step": 45534, "epoch": 1084} {"train_loss": -5.713158130645752, "global_step": 45535, "epoch": 1084} {"train_loss": -5.734241962432861, "global_step": 45536, "epoch": 1084} {"train_loss": -5.668412685394287, "global_step": 45537, "epoch": 1084} {"train_loss": -5.7697367668151855, "global_step": 45538, "epoch": 1084} {"train_loss": -5.727174282073975, "global_step": 45539, "epoch": 1084} {"train_loss": -5.72001838684082, "global_step": 45540, "epoch": 1084} {"train_loss": -5.660983562469482, "global_step": 45541, "epoch": 1084} {"train_loss": -5.655880928039551, "global_step": 45542, "epoch": 1084} {"train_loss": -5.56947135925293, "global_step": 45543, "epoch": 1084} {"train_loss": -5.634610176086426, "global_step": 45544, "epoch": 1084} {"train_loss": -5.526027679443359, "global_step": 45545, "epoch": 1084} {"train_loss": -5.471504211425781, "global_step": 45546, "epoch": 1084} {"train_loss": -5.61194372177124, "global_step": 45547, "epoch": 1084} {"train_loss": -5.4350690841674805, "global_step": 45548, "epoch": 1084} {"train_loss": -5.617956161499023, "global_step": 45549, "epoch": 1084} {"train_loss": -5.644293785095215, "global_step": 45550, "epoch": 1084} {"train_loss": -5.520343780517578, "global_step": 45551, "epoch": 1084} {"train_loss": -5.519494533538818, "global_step": 45552, "epoch": 1084} {"train_loss": -5.544682025909424, "global_step": 45553, "epoch": 1084} {"train_loss": -5.564815998077393, "global_step": 45554, "epoch": 1084} {"train_loss": -5.607316017150879, "global_step": 45555, "epoch": 1084} {"train_loss": -5.6196088790893555, "global_step": 45556, "epoch": 1084} {"train_loss": -5.611488342285156, "global_step": 45557, "epoch": 1084} {"train_loss": -5.661808967590332, "global_step": 45558, "epoch": 1084} {"train_loss": -5.748447418212891, "global_step": 45559, "epoch": 1084} {"train_loss": -5.706308364868164, "global_step": 45560, "epoch": 1084} {"train_loss": -5.754912376403809, "global_step": 45561, "epoch": 1084} {"train_loss": -5.58577823638916, "global_step": 45562, "epoch": 1084} {"train_loss": -5.749446868896484, "global_step": 45563, "epoch": 1084} {"train_loss": -5.715578079223633, "global_step": 45564, "epoch": 1084} {"train_loss": -5.576084136962891, "global_step": 45565, "epoch": 1084} {"train_loss": -5.650400161743164, "global_step": 45566, "epoch": 1084} {"train_loss": -5.628535270690918, "global_step": 45567, "epoch": 1084} {"train_loss": -5.700746536254883, "global_step": 45568, "epoch": 1084} {"train_loss": -5.655993314016433, "global_step": 45569, "epoch": 1084, "val_loss": 73970.171875} {"train_loss": -5.615612983703613, "global_step": 45570, "epoch": 1085} {"train_loss": -5.7093706130981445, "global_step": 45571, "epoch": 1085} {"train_loss": -5.567206382751465, "global_step": 45572, "epoch": 1085} {"train_loss": -5.66386604309082, "global_step": 45573, "epoch": 1085} {"train_loss": -5.715285301208496, "global_step": 45574, "epoch": 1085} {"train_loss": -5.7591352462768555, "global_step": 45575, "epoch": 1085} {"train_loss": -5.721333026885986, "global_step": 45576, "epoch": 1085} {"train_loss": -5.888144493103027, "global_step": 45577, "epoch": 1085} {"train_loss": -5.757580757141113, "global_step": 45578, "epoch": 1085} {"train_loss": -5.7647199630737305, "global_step": 45579, "epoch": 1085} {"train_loss": -5.851831436157227, "global_step": 45580, "epoch": 1085} {"train_loss": -5.804025650024414, "global_step": 45581, "epoch": 1085} {"train_loss": -5.761755466461182, "global_step": 45582, "epoch": 1085} {"train_loss": -5.844900131225586, "global_step": 45583, "epoch": 1085} {"train_loss": -5.716647624969482, "global_step": 45584, "epoch": 1085} {"train_loss": -5.769148826599121, "global_step": 45585, "epoch": 1085} {"train_loss": -5.682450771331787, "global_step": 45586, "epoch": 1085} {"train_loss": -5.572752952575684, "global_step": 45587, "epoch": 1085} {"train_loss": -5.6577582359313965, "global_step": 45588, "epoch": 1085} {"train_loss": -5.502129554748535, "global_step": 45589, "epoch": 1085} {"train_loss": -5.691895484924316, "global_step": 45590, "epoch": 1085} {"train_loss": -5.6006669998168945, "global_step": 45591, "epoch": 1085} {"train_loss": -5.600436210632324, "global_step": 45592, "epoch": 1085} {"train_loss": -5.739420413970947, "global_step": 45593, "epoch": 1085} {"train_loss": -5.519921779632568, "global_step": 45594, "epoch": 1085} {"train_loss": -5.739986419677734, "global_step": 45595, "epoch": 1085} {"train_loss": -5.690116882324219, "global_step": 45596, "epoch": 1085} {"train_loss": -5.634819030761719, "global_step": 45597, "epoch": 1085} {"train_loss": -5.6920366287231445, "global_step": 45598, "epoch": 1085} {"train_loss": -5.645712852478027, "global_step": 45599, "epoch": 1085} {"train_loss": -5.641226768493652, "global_step": 45600, "epoch": 1085} {"train_loss": -5.744614124298096, "global_step": 45601, "epoch": 1085} {"train_loss": -5.688053131103516, "global_step": 45602, "epoch": 1085} {"train_loss": -5.719748020172119, "global_step": 45603, "epoch": 1085} {"train_loss": -5.834765434265137, "global_step": 45604, "epoch": 1085} {"train_loss": -5.640536308288574, "global_step": 45605, "epoch": 1085} {"train_loss": -5.725980758666992, "global_step": 45606, "epoch": 1085} {"train_loss": -5.715726852416992, "global_step": 45607, "epoch": 1085} {"train_loss": -5.685000419616699, "global_step": 45608, "epoch": 1085} {"train_loss": -5.706523418426514, "global_step": 45609, "epoch": 1085} {"train_loss": -5.679620742797852, "global_step": 45610, "epoch": 1085} {"train_loss": -5.703022355125064, "global_step": 45611, "epoch": 1085, "val_loss": 74486.28125} {"train_loss": -5.5551652908325195, "global_step": 45612, "epoch": 1086} {"train_loss": -5.763965606689453, "global_step": 45613, "epoch": 1086} {"train_loss": -5.7515869140625, "global_step": 45614, "epoch": 1086} {"train_loss": -5.858260154724121, "global_step": 45615, "epoch": 1086} {"train_loss": -5.664515018463135, "global_step": 45616, "epoch": 1086} {"train_loss": -5.682758331298828, "global_step": 45617, "epoch": 1086} {"train_loss": -5.701000213623047, "global_step": 45618, "epoch": 1086} {"train_loss": -5.659298896789551, "global_step": 45619, "epoch": 1086} {"train_loss": -5.66690731048584, "global_step": 45620, "epoch": 1086} {"train_loss": -5.588082313537598, "global_step": 45621, "epoch": 1086} {"train_loss": -5.657508373260498, "global_step": 45622, "epoch": 1086} {"train_loss": -5.673749923706055, "global_step": 45623, "epoch": 1086} {"train_loss": -5.647669315338135, "global_step": 45624, "epoch": 1086} {"train_loss": -5.697826385498047, "global_step": 45625, "epoch": 1086} {"train_loss": -5.511089324951172, "global_step": 45626, "epoch": 1086} {"train_loss": -5.772055149078369, "global_step": 45627, "epoch": 1086} {"train_loss": -5.590825080871582, "global_step": 45628, "epoch": 1086} {"train_loss": -5.714357852935791, "global_step": 45629, "epoch": 1086} {"train_loss": -5.75200080871582, "global_step": 45630, "epoch": 1086} {"train_loss": -5.693028450012207, "global_step": 45631, "epoch": 1086} {"train_loss": -5.7328996658325195, "global_step": 45632, "epoch": 1086} {"train_loss": -5.786814212799072, "global_step": 45633, "epoch": 1086} {"train_loss": -5.69467306137085, "global_step": 45634, "epoch": 1086} {"train_loss": -5.474330902099609, "global_step": 45635, "epoch": 1086} {"train_loss": -5.648054122924805, "global_step": 45636, "epoch": 1086} {"train_loss": -5.686732292175293, "global_step": 45637, "epoch": 1086} {"train_loss": -5.711637496948242, "global_step": 45638, "epoch": 1086} {"train_loss": -5.8043107986450195, "global_step": 45639, "epoch": 1086} {"train_loss": -5.765119552612305, "global_step": 45640, "epoch": 1086} {"train_loss": -5.727833271026611, "global_step": 45641, "epoch": 1086} {"train_loss": -5.618582725524902, "global_step": 45642, "epoch": 1086} {"train_loss": -5.6230854988098145, "global_step": 45643, "epoch": 1086} {"train_loss": -5.67999792098999, "global_step": 45644, "epoch": 1086} {"train_loss": -5.678028583526611, "global_step": 45645, "epoch": 1086} {"train_loss": -5.734714508056641, "global_step": 45646, "epoch": 1086} {"train_loss": -5.695110321044922, "global_step": 45647, "epoch": 1086} {"train_loss": -5.764780044555664, "global_step": 45648, "epoch": 1086} {"train_loss": -5.661114692687988, "global_step": 45649, "epoch": 1086} {"train_loss": -5.649608612060547, "global_step": 45650, "epoch": 1086} {"train_loss": -5.802045822143555, "global_step": 45651, "epoch": 1086} {"train_loss": -5.796395301818848, "global_step": 45652, "epoch": 1086} {"train_loss": -5.6916441803886775, "global_step": 45653, "epoch": 1086, "val_loss": 73908.8046875} {"train_loss": -5.814694404602051, "global_step": 45654, "epoch": 1087} {"train_loss": -5.719231605529785, "global_step": 45655, "epoch": 1087} {"train_loss": -5.840691089630127, "global_step": 45656, "epoch": 1087} {"train_loss": -5.846234321594238, "global_step": 45657, "epoch": 1087} {"train_loss": -5.561941146850586, "global_step": 45658, "epoch": 1087} {"train_loss": -5.870636940002441, "global_step": 45659, "epoch": 1087} {"train_loss": -5.618464469909668, "global_step": 45660, "epoch": 1087} {"train_loss": -5.695401668548584, "global_step": 45661, "epoch": 1087} {"train_loss": -5.81962776184082, "global_step": 45662, "epoch": 1087} {"train_loss": -5.796065330505371, "global_step": 45663, "epoch": 1087} {"train_loss": -5.744157791137695, "global_step": 45664, "epoch": 1087} {"train_loss": -5.747081756591797, "global_step": 45665, "epoch": 1087} {"train_loss": -5.817704200744629, "global_step": 45666, "epoch": 1087} {"train_loss": -5.797656536102295, "global_step": 45667, "epoch": 1087} {"train_loss": -5.828164577484131, "global_step": 45668, "epoch": 1087} {"train_loss": -5.6696271896362305, "global_step": 45669, "epoch": 1087} {"train_loss": -5.771051406860352, "global_step": 45670, "epoch": 1087} {"train_loss": -5.604245662689209, "global_step": 45671, "epoch": 1087} {"train_loss": -5.723577499389648, "global_step": 45672, "epoch": 1087} {"train_loss": -5.742491722106934, "global_step": 45673, "epoch": 1087} {"train_loss": -5.627798080444336, "global_step": 45674, "epoch": 1087} {"train_loss": -5.58132266998291, "global_step": 45675, "epoch": 1087} {"train_loss": -5.6477556228637695, "global_step": 45676, "epoch": 1087} {"train_loss": -5.513608932495117, "global_step": 45677, "epoch": 1087} {"train_loss": -5.705889701843262, "global_step": 45678, "epoch": 1087} {"train_loss": -5.6913161277771, "global_step": 45679, "epoch": 1087} {"train_loss": -5.677030563354492, "global_step": 45680, "epoch": 1087} {"train_loss": -5.741609573364258, "global_step": 45681, "epoch": 1087} {"train_loss": -5.780537128448486, "global_step": 45682, "epoch": 1087} {"train_loss": -5.622241020202637, "global_step": 45683, "epoch": 1087} {"train_loss": -5.852301597595215, "global_step": 45684, "epoch": 1087} {"train_loss": -5.717628002166748, "global_step": 45685, "epoch": 1087} {"train_loss": -5.821884632110596, "global_step": 45686, "epoch": 1087} {"train_loss": -5.669741153717041, "global_step": 45687, "epoch": 1087} {"train_loss": -5.73081111907959, "global_step": 45688, "epoch": 1087} {"train_loss": -5.7476019859313965, "global_step": 45689, "epoch": 1087} {"train_loss": -5.767902374267578, "global_step": 45690, "epoch": 1087} {"train_loss": -5.57429313659668, "global_step": 45691, "epoch": 1087} {"train_loss": -5.714910984039307, "global_step": 45692, "epoch": 1087} {"train_loss": -5.720300197601318, "global_step": 45693, "epoch": 1087} {"train_loss": -5.7402801513671875, "global_step": 45694, "epoch": 1087} {"train_loss": -5.722670078277588, "global_step": 45695, "epoch": 1087, "val_loss": 73909.4453125} {"train_loss": -5.8098602294921875, "global_step": 45696, "epoch": 1088} {"train_loss": -5.717598915100098, "global_step": 45697, "epoch": 1088} {"train_loss": -5.672947406768799, "global_step": 45698, "epoch": 1088} {"train_loss": -5.653761386871338, "global_step": 45699, "epoch": 1088} {"train_loss": -5.694918632507324, "global_step": 45700, "epoch": 1088} {"train_loss": -5.58631706237793, "global_step": 45701, "epoch": 1088} {"train_loss": -5.780396461486816, "global_step": 45702, "epoch": 1088} {"train_loss": -5.745790481567383, "global_step": 45703, "epoch": 1088} {"train_loss": -5.747351169586182, "global_step": 45704, "epoch": 1088} {"train_loss": -5.762383937835693, "global_step": 45705, "epoch": 1088} {"train_loss": -5.57025146484375, "global_step": 45706, "epoch": 1088} {"train_loss": -5.743871688842773, "global_step": 45707, "epoch": 1088} {"train_loss": -5.76725435256958, "global_step": 45708, "epoch": 1088} {"train_loss": -5.432389259338379, "global_step": 45709, "epoch": 1088} {"train_loss": -5.69823694229126, "global_step": 45710, "epoch": 1088} {"train_loss": -5.472570419311523, "global_step": 45711, "epoch": 1088} {"train_loss": -5.664422988891602, "global_step": 45712, "epoch": 1088} {"train_loss": -5.7883477210998535, "global_step": 45713, "epoch": 1088} {"train_loss": -5.511317253112793, "global_step": 45714, "epoch": 1088} {"train_loss": -5.616808891296387, "global_step": 45715, "epoch": 1088} {"train_loss": -5.6909003257751465, "global_step": 45716, "epoch": 1088} {"train_loss": -5.708780765533447, "global_step": 45717, "epoch": 1088} {"train_loss": -5.8075690269470215, "global_step": 45718, "epoch": 1088} {"train_loss": -5.740262508392334, "global_step": 45719, "epoch": 1088} {"train_loss": -5.620737552642822, "global_step": 45720, "epoch": 1088} {"train_loss": -5.8038835525512695, "global_step": 45721, "epoch": 1088} {"train_loss": -5.616910934448242, "global_step": 45722, "epoch": 1088} {"train_loss": -5.703261852264404, "global_step": 45723, "epoch": 1088} {"train_loss": -5.57659912109375, "global_step": 45724, "epoch": 1088} {"train_loss": -5.644528388977051, "global_step": 45725, "epoch": 1088} {"train_loss": -5.655606269836426, "global_step": 45726, "epoch": 1088} {"train_loss": -5.653690338134766, "global_step": 45727, "epoch": 1088} {"train_loss": -5.682119369506836, "global_step": 45728, "epoch": 1088} {"train_loss": -5.635341167449951, "global_step": 45729, "epoch": 1088} {"train_loss": -5.772593975067139, "global_step": 45730, "epoch": 1088} {"train_loss": -5.594076633453369, "global_step": 45731, "epoch": 1088} {"train_loss": -5.864336967468262, "global_step": 45732, "epoch": 1088} {"train_loss": -5.588627338409424, "global_step": 45733, "epoch": 1088} {"train_loss": -5.802879333496094, "global_step": 45734, "epoch": 1088} {"train_loss": -5.7918500900268555, "global_step": 45735, "epoch": 1088} {"train_loss": -5.6666646003723145, "global_step": 45736, "epoch": 1088} {"train_loss": -5.685188179924374, "global_step": 45737, "epoch": 1088, "val_loss": 74628.9140625} {"train_loss": -5.611988067626953, "global_step": 45738, "epoch": 1089} {"train_loss": -5.5599822998046875, "global_step": 45739, "epoch": 1089} {"train_loss": -5.762969017028809, "global_step": 45740, "epoch": 1089} {"train_loss": -5.657899856567383, "global_step": 45741, "epoch": 1089} {"train_loss": -5.796794414520264, "global_step": 45742, "epoch": 1089} {"train_loss": -5.742253303527832, "global_step": 45743, "epoch": 1089} {"train_loss": -5.641113758087158, "global_step": 45744, "epoch": 1089} {"train_loss": -5.8643035888671875, "global_step": 45745, "epoch": 1089} {"train_loss": -5.800511360168457, "global_step": 45746, "epoch": 1089} {"train_loss": -5.669058799743652, "global_step": 45747, "epoch": 1089} {"train_loss": -5.83607292175293, "global_step": 45748, "epoch": 1089} {"train_loss": -5.730586051940918, "global_step": 45749, "epoch": 1089} {"train_loss": -5.728470802307129, "global_step": 45750, "epoch": 1089} {"train_loss": -5.837700366973877, "global_step": 45751, "epoch": 1089} {"train_loss": -5.543347358703613, "global_step": 45752, "epoch": 1089} {"train_loss": -5.804872989654541, "global_step": 45753, "epoch": 1089} {"train_loss": -5.632271766662598, "global_step": 45754, "epoch": 1089} {"train_loss": -5.55768346786499, "global_step": 45755, "epoch": 1089} {"train_loss": -5.831161975860596, "global_step": 45756, "epoch": 1089} {"train_loss": -5.736754417419434, "global_step": 45757, "epoch": 1089} {"train_loss": -5.708707332611084, "global_step": 45758, "epoch": 1089} {"train_loss": -5.584643363952637, "global_step": 45759, "epoch": 1089} {"train_loss": -5.766384124755859, "global_step": 45760, "epoch": 1089} {"train_loss": -5.858989715576172, "global_step": 45761, "epoch": 1089} {"train_loss": -5.538592338562012, "global_step": 45762, "epoch": 1089} {"train_loss": -5.650055885314941, "global_step": 45763, "epoch": 1089} {"train_loss": -5.696999549865723, "global_step": 45764, "epoch": 1089} {"train_loss": -5.717415809631348, "global_step": 45765, "epoch": 1089} {"train_loss": -5.653899192810059, "global_step": 45766, "epoch": 1089} {"train_loss": -5.655685901641846, "global_step": 45767, "epoch": 1089} {"train_loss": -5.722418785095215, "global_step": 45768, "epoch": 1089} {"train_loss": -5.54949951171875, "global_step": 45769, "epoch": 1089} {"train_loss": -5.600616455078125, "global_step": 45770, "epoch": 1089} {"train_loss": -5.665142059326172, "global_step": 45771, "epoch": 1089} {"train_loss": -5.688117504119873, "global_step": 45772, "epoch": 1089} {"train_loss": -5.635437965393066, "global_step": 45773, "epoch": 1089} {"train_loss": -5.734744071960449, "global_step": 45774, "epoch": 1089} {"train_loss": -5.600484371185303, "global_step": 45775, "epoch": 1089} {"train_loss": -5.842350959777832, "global_step": 45776, "epoch": 1089} {"train_loss": -5.6634087562561035, "global_step": 45777, "epoch": 1089} {"train_loss": -5.618981838226318, "global_step": 45778, "epoch": 1089} {"train_loss": -5.694978339331491, "global_step": 45779, "epoch": 1089, "val_loss": 74215.34375} {"train_loss": -5.740438461303711, "global_step": 45780, "epoch": 1090} {"train_loss": -5.570075035095215, "global_step": 45781, "epoch": 1090} {"train_loss": -5.792160987854004, "global_step": 45782, "epoch": 1090} {"train_loss": -5.669754981994629, "global_step": 45783, "epoch": 1090} {"train_loss": -5.701828956604004, "global_step": 45784, "epoch": 1090} {"train_loss": -5.7614359855651855, "global_step": 45785, "epoch": 1090} {"train_loss": -5.746856689453125, "global_step": 45786, "epoch": 1090} {"train_loss": -5.824667930603027, "global_step": 45787, "epoch": 1090} {"train_loss": -5.660735130310059, "global_step": 45788, "epoch": 1090} {"train_loss": -5.77565860748291, "global_step": 45789, "epoch": 1090} {"train_loss": -5.679333209991455, "global_step": 45790, "epoch": 1090} {"train_loss": -5.725108623504639, "global_step": 45791, "epoch": 1090} {"train_loss": -5.689629554748535, "global_step": 45792, "epoch": 1090} {"train_loss": -5.80609130859375, "global_step": 45793, "epoch": 1090} {"train_loss": -5.707609176635742, "global_step": 45794, "epoch": 1090} {"train_loss": -5.798188209533691, "global_step": 45795, "epoch": 1090} {"train_loss": -5.644345283508301, "global_step": 45796, "epoch": 1090} {"train_loss": -5.668887138366699, "global_step": 45797, "epoch": 1090} {"train_loss": -5.760220527648926, "global_step": 45798, "epoch": 1090} {"train_loss": -5.772650718688965, "global_step": 45799, "epoch": 1090} {"train_loss": -5.72645378112793, "global_step": 45800, "epoch": 1090} {"train_loss": -5.685126781463623, "global_step": 45801, "epoch": 1090} {"train_loss": -5.798788547515869, "global_step": 45802, "epoch": 1090} {"train_loss": -5.73969841003418, "global_step": 45803, "epoch": 1090} {"train_loss": -5.681353569030762, "global_step": 45804, "epoch": 1090} {"train_loss": -5.681825160980225, "global_step": 45805, "epoch": 1090} {"train_loss": -5.708893775939941, "global_step": 45806, "epoch": 1090} {"train_loss": -5.680948257446289, "global_step": 45807, "epoch": 1090} {"train_loss": -5.691773414611816, "global_step": 45808, "epoch": 1090} {"train_loss": -5.741475582122803, "global_step": 45809, "epoch": 1090} {"train_loss": -5.699173450469971, "global_step": 45810, "epoch": 1090} {"train_loss": -5.741523742675781, "global_step": 45811, "epoch": 1090} {"train_loss": -5.630378723144531, "global_step": 45812, "epoch": 1090} {"train_loss": -5.7103424072265625, "global_step": 45813, "epoch": 1090} {"train_loss": -5.85040283203125, "global_step": 45814, "epoch": 1090} {"train_loss": -5.790729522705078, "global_step": 45815, "epoch": 1090} {"train_loss": -5.7327446937561035, "global_step": 45816, "epoch": 1090} {"train_loss": -5.646720886230469, "global_step": 45817, "epoch": 1090} {"train_loss": -5.775416374206543, "global_step": 45818, "epoch": 1090} {"train_loss": -5.5237860679626465, "global_step": 45819, "epoch": 1090} {"train_loss": -5.7263054847717285, "global_step": 45820, "epoch": 1090} {"train_loss": -5.71532484463283, "global_step": 45821, "epoch": 1090, "val_loss": 74021.328125} {"train_loss": -5.823965072631836, "global_step": 45822, "epoch": 1091} {"train_loss": -5.706279277801514, "global_step": 45823, "epoch": 1091} {"train_loss": -5.686251640319824, "global_step": 45824, "epoch": 1091} {"train_loss": -5.687108993530273, "global_step": 45825, "epoch": 1091} {"train_loss": -5.588112831115723, "global_step": 45826, "epoch": 1091} {"train_loss": -5.818351745605469, "global_step": 45827, "epoch": 1091} {"train_loss": -5.649938106536865, "global_step": 45828, "epoch": 1091} {"train_loss": -5.650997638702393, "global_step": 45829, "epoch": 1091} {"train_loss": -5.660951614379883, "global_step": 45830, "epoch": 1091} {"train_loss": -5.629052639007568, "global_step": 45831, "epoch": 1091} {"train_loss": -5.620565891265869, "global_step": 45832, "epoch": 1091} {"train_loss": -5.740347385406494, "global_step": 45833, "epoch": 1091} {"train_loss": -5.76317024230957, "global_step": 45834, "epoch": 1091} {"train_loss": -5.782192230224609, "global_step": 45835, "epoch": 1091} {"train_loss": -5.5894083976745605, "global_step": 45836, "epoch": 1091} {"train_loss": -5.759684085845947, "global_step": 45837, "epoch": 1091} {"train_loss": -5.6359052658081055, "global_step": 45838, "epoch": 1091} {"train_loss": -5.721076011657715, "global_step": 45839, "epoch": 1091} {"train_loss": -5.734046936035156, "global_step": 45840, "epoch": 1091} {"train_loss": -5.592779159545898, "global_step": 45841, "epoch": 1091} {"train_loss": -5.676941871643066, "global_step": 45842, "epoch": 1091} {"train_loss": -5.808063983917236, "global_step": 45843, "epoch": 1091} {"train_loss": -5.609404563903809, "global_step": 45844, "epoch": 1091} {"train_loss": -5.731160640716553, "global_step": 45845, "epoch": 1091} {"train_loss": -5.571504592895508, "global_step": 45846, "epoch": 1091} {"train_loss": -5.592307090759277, "global_step": 45847, "epoch": 1091} {"train_loss": -5.673783779144287, "global_step": 45848, "epoch": 1091} {"train_loss": -5.740650177001953, "global_step": 45849, "epoch": 1091} {"train_loss": -5.757367134094238, "global_step": 45850, "epoch": 1091} {"train_loss": -5.745388507843018, "global_step": 45851, "epoch": 1091} {"train_loss": -5.721635341644287, "global_step": 45852, "epoch": 1091} {"train_loss": -5.684577941894531, "global_step": 45853, "epoch": 1091} {"train_loss": -5.7084479331970215, "global_step": 45854, "epoch": 1091} {"train_loss": -5.622711181640625, "global_step": 45855, "epoch": 1091} {"train_loss": -5.794828414916992, "global_step": 45856, "epoch": 1091} {"train_loss": -5.721646785736084, "global_step": 45857, "epoch": 1091} {"train_loss": -5.7054972648620605, "global_step": 45858, "epoch": 1091} {"train_loss": -5.72957706451416, "global_step": 45859, "epoch": 1091} {"train_loss": -5.66071891784668, "global_step": 45860, "epoch": 1091} {"train_loss": -5.790424346923828, "global_step": 45861, "epoch": 1091} {"train_loss": -5.615697860717773, "global_step": 45862, "epoch": 1091} {"train_loss": -5.694540023803711, "global_step": 45863, "epoch": 1091, "val_loss": 73675.2734375} {"train_loss": -5.815185546875, "global_step": 45864, "epoch": 1092} {"train_loss": -5.674797058105469, "global_step": 45865, "epoch": 1092} {"train_loss": -5.707437992095947, "global_step": 45866, "epoch": 1092} {"train_loss": -5.751860618591309, "global_step": 45867, "epoch": 1092} {"train_loss": -5.666067600250244, "global_step": 45868, "epoch": 1092} {"train_loss": -5.684398651123047, "global_step": 45869, "epoch": 1092} {"train_loss": -5.618669509887695, "global_step": 45870, "epoch": 1092} {"train_loss": -5.694547176361084, "global_step": 45871, "epoch": 1092} {"train_loss": -5.686485290527344, "global_step": 45872, "epoch": 1092} {"train_loss": -5.645180702209473, "global_step": 45873, "epoch": 1092} {"train_loss": -5.714085578918457, "global_step": 45874, "epoch": 1092} {"train_loss": -5.689219951629639, "global_step": 45875, "epoch": 1092} {"train_loss": -5.632453441619873, "global_step": 45876, "epoch": 1092} {"train_loss": -5.795718669891357, "global_step": 45877, "epoch": 1092} {"train_loss": -5.638068199157715, "global_step": 45878, "epoch": 1092} {"train_loss": -5.654691696166992, "global_step": 45879, "epoch": 1092} {"train_loss": -5.70157527923584, "global_step": 45880, "epoch": 1092} {"train_loss": -5.710569381713867, "global_step": 45881, "epoch": 1092} {"train_loss": -5.70584774017334, "global_step": 45882, "epoch": 1092} {"train_loss": -5.783185958862305, "global_step": 45883, "epoch": 1092} {"train_loss": -5.825740814208984, "global_step": 45884, "epoch": 1092} {"train_loss": -5.653251647949219, "global_step": 45885, "epoch": 1092} {"train_loss": -5.670943737030029, "global_step": 45886, "epoch": 1092} {"train_loss": -5.672654151916504, "global_step": 45887, "epoch": 1092} {"train_loss": -5.7020769119262695, "global_step": 45888, "epoch": 1092} {"train_loss": -5.699222564697266, "global_step": 45889, "epoch": 1092} {"train_loss": -5.806751728057861, "global_step": 45890, "epoch": 1092} {"train_loss": -5.66420841217041, "global_step": 45891, "epoch": 1092} {"train_loss": -5.669974327087402, "global_step": 45892, "epoch": 1092} {"train_loss": -5.845465660095215, "global_step": 45893, "epoch": 1092} {"train_loss": -5.735472679138184, "global_step": 45894, "epoch": 1092} {"train_loss": -5.644415855407715, "global_step": 45895, "epoch": 1092} {"train_loss": -5.781894683837891, "global_step": 45896, "epoch": 1092} {"train_loss": -5.671239852905273, "global_step": 45897, "epoch": 1092} {"train_loss": -5.7725958824157715, "global_step": 45898, "epoch": 1092} {"train_loss": -5.698979377746582, "global_step": 45899, "epoch": 1092} {"train_loss": -5.634642124176025, "global_step": 45900, "epoch": 1092} {"train_loss": -5.818839073181152, "global_step": 45901, "epoch": 1092} {"train_loss": -5.690104961395264, "global_step": 45902, "epoch": 1092} {"train_loss": -5.795711517333984, "global_step": 45903, "epoch": 1092} {"train_loss": -5.846373558044434, "global_step": 45904, "epoch": 1092} {"train_loss": -5.713588521594093, "global_step": 45905, "epoch": 1092, "val_loss": 73962.0} {"train_loss": -5.737093925476074, "global_step": 45906, "epoch": 1093} {"train_loss": -5.753938674926758, "global_step": 45907, "epoch": 1093} {"train_loss": -5.803707122802734, "global_step": 45908, "epoch": 1093} {"train_loss": -5.536575794219971, "global_step": 45909, "epoch": 1093} {"train_loss": -5.7291107177734375, "global_step": 45910, "epoch": 1093} {"train_loss": -5.60416316986084, "global_step": 45911, "epoch": 1093} {"train_loss": -5.783170700073242, "global_step": 45912, "epoch": 1093} {"train_loss": -5.810205459594727, "global_step": 45913, "epoch": 1093} {"train_loss": -5.685036659240723, "global_step": 45914, "epoch": 1093} {"train_loss": -5.761473655700684, "global_step": 45915, "epoch": 1093} {"train_loss": -5.6642255783081055, "global_step": 45916, "epoch": 1093} {"train_loss": -5.764120101928711, "global_step": 45917, "epoch": 1093} {"train_loss": -5.916597366333008, "global_step": 45918, "epoch": 1093} {"train_loss": -5.698569297790527, "global_step": 45919, "epoch": 1093} {"train_loss": -5.656955718994141, "global_step": 45920, "epoch": 1093} {"train_loss": -5.744215488433838, "global_step": 45921, "epoch": 1093} {"train_loss": -5.611945152282715, "global_step": 45922, "epoch": 1093} {"train_loss": -5.811774253845215, "global_step": 45923, "epoch": 1093} {"train_loss": -5.7608747482299805, "global_step": 45924, "epoch": 1093} {"train_loss": -5.742629051208496, "global_step": 45925, "epoch": 1093} {"train_loss": -5.672671794891357, "global_step": 45926, "epoch": 1093} {"train_loss": -5.761345386505127, "global_step": 45927, "epoch": 1093} {"train_loss": -5.5880937576293945, "global_step": 45928, "epoch": 1093} {"train_loss": -5.779690265655518, "global_step": 45929, "epoch": 1093} {"train_loss": -5.691500663757324, "global_step": 45930, "epoch": 1093} {"train_loss": -5.799534797668457, "global_step": 45931, "epoch": 1093} {"train_loss": -5.764980316162109, "global_step": 45932, "epoch": 1093} {"train_loss": -5.7017035484313965, "global_step": 45933, "epoch": 1093} {"train_loss": -5.702157974243164, "global_step": 45934, "epoch": 1093} {"train_loss": -5.663425445556641, "global_step": 45935, "epoch": 1093} {"train_loss": -5.703405857086182, "global_step": 45936, "epoch": 1093} {"train_loss": -5.7765398025512695, "global_step": 45937, "epoch": 1093} {"train_loss": -5.769977569580078, "global_step": 45938, "epoch": 1093} {"train_loss": -5.626326560974121, "global_step": 45939, "epoch": 1093} {"train_loss": -5.753665447235107, "global_step": 45940, "epoch": 1093} {"train_loss": -5.700119495391846, "global_step": 45941, "epoch": 1093} {"train_loss": -5.712050437927246, "global_step": 45942, "epoch": 1093} {"train_loss": -5.734684467315674, "global_step": 45943, "epoch": 1093} {"train_loss": -5.762449741363525, "global_step": 45944, "epoch": 1093} {"train_loss": -5.661760330200195, "global_step": 45945, "epoch": 1093} {"train_loss": -5.708554744720459, "global_step": 45946, "epoch": 1093} {"train_loss": -5.722223735990978, "global_step": 45947, "epoch": 1093, "val_loss": 74277.7109375} {"train_loss": -5.754697322845459, "global_step": 45948, "epoch": 1094} {"train_loss": -5.764209747314453, "global_step": 45949, "epoch": 1094} {"train_loss": -5.672005653381348, "global_step": 45950, "epoch": 1094} {"train_loss": -5.839020729064941, "global_step": 45951, "epoch": 1094} {"train_loss": -5.6426310539245605, "global_step": 45952, "epoch": 1094} {"train_loss": -5.650168418884277, "global_step": 45953, "epoch": 1094} {"train_loss": -5.7454833984375, "global_step": 45954, "epoch": 1094} {"train_loss": -5.742954730987549, "global_step": 45955, "epoch": 1094} {"train_loss": -5.699724197387695, "global_step": 45956, "epoch": 1094} {"train_loss": -5.690898895263672, "global_step": 45957, "epoch": 1094} {"train_loss": -5.658169746398926, "global_step": 45958, "epoch": 1094} {"train_loss": -5.771570205688477, "global_step": 45959, "epoch": 1094} {"train_loss": -5.5838823318481445, "global_step": 45960, "epoch": 1094} {"train_loss": -5.727513313293457, "global_step": 45961, "epoch": 1094} {"train_loss": -5.862335681915283, "global_step": 45962, "epoch": 1094} {"train_loss": -5.7962493896484375, "global_step": 45963, "epoch": 1094} {"train_loss": -5.655910491943359, "global_step": 45964, "epoch": 1094} {"train_loss": -5.7427568435668945, "global_step": 45965, "epoch": 1094} {"train_loss": -5.656922817230225, "global_step": 45966, "epoch": 1094} {"train_loss": -5.703723907470703, "global_step": 45967, "epoch": 1094} {"train_loss": -5.6828413009643555, "global_step": 45968, "epoch": 1094} {"train_loss": -5.615644454956055, "global_step": 45969, "epoch": 1094} {"train_loss": -5.835687160491943, "global_step": 45970, "epoch": 1094} {"train_loss": -5.785996437072754, "global_step": 45971, "epoch": 1094} {"train_loss": -5.891451358795166, "global_step": 45972, "epoch": 1094} {"train_loss": -5.709759712219238, "global_step": 45973, "epoch": 1094} {"train_loss": -5.842582702636719, "global_step": 45974, "epoch": 1094} {"train_loss": -5.718951225280762, "global_step": 45975, "epoch": 1094} {"train_loss": -5.786188125610352, "global_step": 45976, "epoch": 1094} {"train_loss": -5.528250694274902, "global_step": 45977, "epoch": 1094} {"train_loss": -5.725671768188477, "global_step": 45978, "epoch": 1094} {"train_loss": -5.73299503326416, "global_step": 45979, "epoch": 1094} {"train_loss": -5.621212959289551, "global_step": 45980, "epoch": 1094} {"train_loss": -5.789795875549316, "global_step": 45981, "epoch": 1094} {"train_loss": -5.71138334274292, "global_step": 45982, "epoch": 1094} {"train_loss": -5.753118515014648, "global_step": 45983, "epoch": 1094} {"train_loss": -5.641942977905273, "global_step": 45984, "epoch": 1094} {"train_loss": -5.568902015686035, "global_step": 45985, "epoch": 1094} {"train_loss": -5.675559997558594, "global_step": 45986, "epoch": 1094} {"train_loss": -5.730473041534424, "global_step": 45987, "epoch": 1094} {"train_loss": -5.690814018249512, "global_step": 45988, "epoch": 1094} {"train_loss": -5.7158132167089555, "global_step": 45989, "epoch": 1094, "val_loss": 73810.1640625} {"train_loss": -5.682586193084717, "global_step": 45990, "epoch": 1095} {"train_loss": -5.921383857727051, "global_step": 45991, "epoch": 1095} {"train_loss": -5.704095840454102, "global_step": 45992, "epoch": 1095} {"train_loss": -5.779583930969238, "global_step": 45993, "epoch": 1095} {"train_loss": -5.667871952056885, "global_step": 45994, "epoch": 1095} {"train_loss": -5.611763000488281, "global_step": 45995, "epoch": 1095} {"train_loss": -5.702299118041992, "global_step": 45996, "epoch": 1095} {"train_loss": -5.597289085388184, "global_step": 45997, "epoch": 1095} {"train_loss": -5.74017858505249, "global_step": 45998, "epoch": 1095} {"train_loss": -5.817899703979492, "global_step": 45999, "epoch": 1095} {"train_loss": -5.485474586486816, "global_step": 46000, "epoch": 1095} {"train_loss": -5.762151718139648, "global_step": 46001, "epoch": 1095} {"train_loss": -5.679307460784912, "global_step": 46002, "epoch": 1095} {"train_loss": -5.684779167175293, "global_step": 46003, "epoch": 1095} {"train_loss": -5.720912933349609, "global_step": 46004, "epoch": 1095} {"train_loss": -5.770575523376465, "global_step": 46005, "epoch": 1095} {"train_loss": -5.783306121826172, "global_step": 46006, "epoch": 1095} {"train_loss": -5.521167755126953, "global_step": 46007, "epoch": 1095} {"train_loss": -5.838095664978027, "global_step": 46008, "epoch": 1095} {"train_loss": -5.720231056213379, "global_step": 46009, "epoch": 1095} {"train_loss": -5.646646499633789, "global_step": 46010, "epoch": 1095} {"train_loss": -5.751126766204834, "global_step": 46011, "epoch": 1095} {"train_loss": -5.754194259643555, "global_step": 46012, "epoch": 1095} {"train_loss": -5.713367462158203, "global_step": 46013, "epoch": 1095} {"train_loss": -5.701025009155273, "global_step": 46014, "epoch": 1095} {"train_loss": -5.5809550285339355, "global_step": 46015, "epoch": 1095} {"train_loss": -5.747331142425537, "global_step": 46016, "epoch": 1095} {"train_loss": -5.8094282150268555, "global_step": 46017, "epoch": 1095} {"train_loss": -5.794404029846191, "global_step": 46018, "epoch": 1095} {"train_loss": -5.769950866699219, "global_step": 46019, "epoch": 1095} {"train_loss": -5.730714797973633, "global_step": 46020, "epoch": 1095} {"train_loss": -5.841412544250488, "global_step": 46021, "epoch": 1095} {"train_loss": -5.7602996826171875, "global_step": 46022, "epoch": 1095} {"train_loss": -5.747400283813477, "global_step": 46023, "epoch": 1095} {"train_loss": -5.774580001831055, "global_step": 46024, "epoch": 1095} {"train_loss": -5.705606937408447, "global_step": 46025, "epoch": 1095} {"train_loss": -5.735503673553467, "global_step": 46026, "epoch": 1095} {"train_loss": -5.664511680603027, "global_step": 46027, "epoch": 1095} {"train_loss": -5.6888532638549805, "global_step": 46028, "epoch": 1095} {"train_loss": -5.67774772644043, "global_step": 46029, "epoch": 1095} {"train_loss": -5.734818935394287, "global_step": 46030, "epoch": 1095} {"train_loss": -5.719354572750273, "global_step": 46031, "epoch": 1095, "val_loss": 74092.7890625} {"train_loss": -5.690936088562012, "global_step": 46032, "epoch": 1096} {"train_loss": -5.865257263183594, "global_step": 46033, "epoch": 1096} {"train_loss": -5.786971092224121, "global_step": 46034, "epoch": 1096} {"train_loss": -5.693171501159668, "global_step": 46035, "epoch": 1096} {"train_loss": -5.717860698699951, "global_step": 46036, "epoch": 1096} {"train_loss": -5.731664180755615, "global_step": 46037, "epoch": 1096} {"train_loss": -5.799178123474121, "global_step": 46038, "epoch": 1096} {"train_loss": -5.596752643585205, "global_step": 46039, "epoch": 1096} {"train_loss": -5.669778823852539, "global_step": 46040, "epoch": 1096} {"train_loss": -5.67929220199585, "global_step": 46041, "epoch": 1096} {"train_loss": -5.783357620239258, "global_step": 46042, "epoch": 1096} {"train_loss": -5.733212471008301, "global_step": 46043, "epoch": 1096} {"train_loss": -5.742849349975586, "global_step": 46044, "epoch": 1096} {"train_loss": -5.661523818969727, "global_step": 46045, "epoch": 1096} {"train_loss": -5.668156623840332, "global_step": 46046, "epoch": 1096} {"train_loss": -5.71604061126709, "global_step": 46047, "epoch": 1096} {"train_loss": -5.722825050354004, "global_step": 46048, "epoch": 1096} {"train_loss": -5.874332427978516, "global_step": 46049, "epoch": 1096} {"train_loss": -5.659692764282227, "global_step": 46050, "epoch": 1096} {"train_loss": -5.624976634979248, "global_step": 46051, "epoch": 1096} {"train_loss": -5.802521705627441, "global_step": 46052, "epoch": 1096} {"train_loss": -5.6214141845703125, "global_step": 46053, "epoch": 1096} {"train_loss": -5.787625312805176, "global_step": 46054, "epoch": 1096} {"train_loss": -5.716679573059082, "global_step": 46055, "epoch": 1096} {"train_loss": -5.723083972930908, "global_step": 46056, "epoch": 1096} {"train_loss": -5.739499092102051, "global_step": 46057, "epoch": 1096} {"train_loss": -5.721004009246826, "global_step": 46058, "epoch": 1096} {"train_loss": -5.726850509643555, "global_step": 46059, "epoch": 1096} {"train_loss": -5.8575286865234375, "global_step": 46060, "epoch": 1096} {"train_loss": -5.6343584060668945, "global_step": 46061, "epoch": 1096} {"train_loss": -5.695219039916992, "global_step": 46062, "epoch": 1096} {"train_loss": -5.775470733642578, "global_step": 46063, "epoch": 1096} {"train_loss": -5.68306303024292, "global_step": 46064, "epoch": 1096} {"train_loss": -5.587949752807617, "global_step": 46065, "epoch": 1096} {"train_loss": -5.679477691650391, "global_step": 46066, "epoch": 1096} {"train_loss": -5.662034034729004, "global_step": 46067, "epoch": 1096} {"train_loss": -5.757676601409912, "global_step": 46068, "epoch": 1096} {"train_loss": -5.738903999328613, "global_step": 46069, "epoch": 1096} {"train_loss": -5.689261436462402, "global_step": 46070, "epoch": 1096} {"train_loss": -5.647536277770996, "global_step": 46071, "epoch": 1096} {"train_loss": -5.811141014099121, "global_step": 46072, "epoch": 1096} {"train_loss": -5.720017308280582, "global_step": 46073, "epoch": 1096, "val_loss": 74263.5859375} {"train_loss": -5.762434005737305, "global_step": 46074, "epoch": 1097} {"train_loss": -5.633846759796143, "global_step": 46075, "epoch": 1097} {"train_loss": -5.629474639892578, "global_step": 46076, "epoch": 1097} {"train_loss": -5.724222183227539, "global_step": 46077, "epoch": 1097} {"train_loss": -5.670138835906982, "global_step": 46078, "epoch": 1097} {"train_loss": -5.735711097717285, "global_step": 46079, "epoch": 1097} {"train_loss": -5.527106285095215, "global_step": 46080, "epoch": 1097} {"train_loss": -5.659544944763184, "global_step": 46081, "epoch": 1097} {"train_loss": -5.723999977111816, "global_step": 46082, "epoch": 1097} {"train_loss": -5.631324768066406, "global_step": 46083, "epoch": 1097} {"train_loss": -5.605688095092773, "global_step": 46084, "epoch": 1097} {"train_loss": -5.573935508728027, "global_step": 46085, "epoch": 1097} {"train_loss": -5.664234161376953, "global_step": 46086, "epoch": 1097} {"train_loss": -5.5996012687683105, "global_step": 46087, "epoch": 1097} {"train_loss": -5.7064127922058105, "global_step": 46088, "epoch": 1097} {"train_loss": -5.694461345672607, "global_step": 46089, "epoch": 1097} {"train_loss": -5.6880364418029785, "global_step": 46090, "epoch": 1097} {"train_loss": -5.694014549255371, "global_step": 46091, "epoch": 1097} {"train_loss": -5.712831497192383, "global_step": 46092, "epoch": 1097} {"train_loss": -5.753757476806641, "global_step": 46093, "epoch": 1097} {"train_loss": -5.736363410949707, "global_step": 46094, "epoch": 1097} {"train_loss": -5.549037933349609, "global_step": 46095, "epoch": 1097} {"train_loss": -5.7062578201293945, "global_step": 46096, "epoch": 1097} {"train_loss": -5.787665367126465, "global_step": 46097, "epoch": 1097} {"train_loss": -5.5925822257995605, "global_step": 46098, "epoch": 1097} {"train_loss": -5.762677192687988, "global_step": 46099, "epoch": 1097} {"train_loss": -5.716362953186035, "global_step": 46100, "epoch": 1097} {"train_loss": -5.683284282684326, "global_step": 46101, "epoch": 1097} {"train_loss": -5.739118576049805, "global_step": 46102, "epoch": 1097} {"train_loss": -5.671360015869141, "global_step": 46103, "epoch": 1097} {"train_loss": -5.722064018249512, "global_step": 46104, "epoch": 1097} {"train_loss": -5.633931636810303, "global_step": 46105, "epoch": 1097} {"train_loss": -5.712320327758789, "global_step": 46106, "epoch": 1097} {"train_loss": -5.695418357849121, "global_step": 46107, "epoch": 1097} {"train_loss": -5.765978813171387, "global_step": 46108, "epoch": 1097} {"train_loss": -5.731359481811523, "global_step": 46109, "epoch": 1097} {"train_loss": -5.684107780456543, "global_step": 46110, "epoch": 1097} {"train_loss": -5.694890022277832, "global_step": 46111, "epoch": 1097} {"train_loss": -5.736502170562744, "global_step": 46112, "epoch": 1097} {"train_loss": -5.7376508712768555, "global_step": 46113, "epoch": 1097} {"train_loss": -5.649839401245117, "global_step": 46114, "epoch": 1097} {"train_loss": -5.683269080661592, "global_step": 46115, "epoch": 1097, "val_loss": 73787.0078125} {"train_loss": -5.788592338562012, "global_step": 46116, "epoch": 1098} {"train_loss": -5.821708679199219, "global_step": 46117, "epoch": 1098} {"train_loss": -5.665801048278809, "global_step": 46118, "epoch": 1098} {"train_loss": -5.761794090270996, "global_step": 46119, "epoch": 1098} {"train_loss": -5.668182849884033, "global_step": 46120, "epoch": 1098} {"train_loss": -5.711250305175781, "global_step": 46121, "epoch": 1098} {"train_loss": -5.701269149780273, "global_step": 46122, "epoch": 1098} {"train_loss": -5.714097023010254, "global_step": 46123, "epoch": 1098} {"train_loss": -5.70201301574707, "global_step": 46124, "epoch": 1098} {"train_loss": -5.776780128479004, "global_step": 46125, "epoch": 1098} {"train_loss": -5.745949745178223, "global_step": 46126, "epoch": 1098} {"train_loss": -5.71138334274292, "global_step": 46127, "epoch": 1098} {"train_loss": -5.586560249328613, "global_step": 46128, "epoch": 1098} {"train_loss": -5.604043960571289, "global_step": 46129, "epoch": 1098} {"train_loss": -5.642175197601318, "global_step": 46130, "epoch": 1098} {"train_loss": -5.740092754364014, "global_step": 46131, "epoch": 1098} {"train_loss": -5.684924602508545, "global_step": 46132, "epoch": 1098} {"train_loss": -5.7661895751953125, "global_step": 46133, "epoch": 1098} {"train_loss": -5.714334487915039, "global_step": 46134, "epoch": 1098} {"train_loss": -5.702691078186035, "global_step": 46135, "epoch": 1098} {"train_loss": -5.756492614746094, "global_step": 46136, "epoch": 1098} {"train_loss": -5.678207874298096, "global_step": 46137, "epoch": 1098} {"train_loss": -5.692424774169922, "global_step": 46138, "epoch": 1098} {"train_loss": -5.829952716827393, "global_step": 46139, "epoch": 1098} {"train_loss": -5.6924147605896, "global_step": 46140, "epoch": 1098} {"train_loss": -5.715617656707764, "global_step": 46141, "epoch": 1098} {"train_loss": -5.680346965789795, "global_step": 46142, "epoch": 1098} {"train_loss": -5.700533866882324, "global_step": 46143, "epoch": 1098} {"train_loss": -5.709763050079346, "global_step": 46144, "epoch": 1098} {"train_loss": -5.688325881958008, "global_step": 46145, "epoch": 1098} {"train_loss": -5.614304542541504, "global_step": 46146, "epoch": 1098} {"train_loss": -5.637612819671631, "global_step": 46147, "epoch": 1098} {"train_loss": -5.839651584625244, "global_step": 46148, "epoch": 1098} {"train_loss": -5.64705753326416, "global_step": 46149, "epoch": 1098} {"train_loss": -5.717811107635498, "global_step": 46150, "epoch": 1098} {"train_loss": -5.671390533447266, "global_step": 46151, "epoch": 1098} {"train_loss": -5.622003555297852, "global_step": 46152, "epoch": 1098} {"train_loss": -5.762813568115234, "global_step": 46153, "epoch": 1098} {"train_loss": -5.579658508300781, "global_step": 46154, "epoch": 1098} {"train_loss": -5.7721099853515625, "global_step": 46155, "epoch": 1098} {"train_loss": -5.622488975524902, "global_step": 46156, "epoch": 1098} {"train_loss": -5.7035541988554455, "global_step": 46157, "epoch": 1098, "val_loss": 74053.6640625} {"train_loss": -5.569052219390869, "global_step": 46158, "epoch": 1099} {"train_loss": -5.734073638916016, "global_step": 46159, "epoch": 1099} {"train_loss": -5.833703994750977, "global_step": 46160, "epoch": 1099} {"train_loss": -5.68754768371582, "global_step": 46161, "epoch": 1099} {"train_loss": -5.637720108032227, "global_step": 46162, "epoch": 1099} {"train_loss": -5.747271537780762, "global_step": 46163, "epoch": 1099} {"train_loss": -5.824428558349609, "global_step": 46164, "epoch": 1099} {"train_loss": -5.77451229095459, "global_step": 46165, "epoch": 1099} {"train_loss": -5.692074298858643, "global_step": 46166, "epoch": 1099} {"train_loss": -5.660984992980957, "global_step": 46167, "epoch": 1099} {"train_loss": -5.740721702575684, "global_step": 46168, "epoch": 1099} {"train_loss": -5.768058776855469, "global_step": 46169, "epoch": 1099} {"train_loss": -5.751283645629883, "global_step": 46170, "epoch": 1099} {"train_loss": -5.727802276611328, "global_step": 46171, "epoch": 1099} {"train_loss": -5.8544721603393555, "global_step": 46172, "epoch": 1099} {"train_loss": -5.742368698120117, "global_step": 46173, "epoch": 1099} {"train_loss": -5.682231903076172, "global_step": 46174, "epoch": 1099} {"train_loss": -5.546060085296631, "global_step": 46175, "epoch": 1099} {"train_loss": -5.697831153869629, "global_step": 46176, "epoch": 1099} {"train_loss": -5.64899206161499, "global_step": 46177, "epoch": 1099} {"train_loss": -5.723935604095459, "global_step": 46178, "epoch": 1099} {"train_loss": -5.6282958984375, "global_step": 46179, "epoch": 1099} {"train_loss": -5.692765235900879, "global_step": 46180, "epoch": 1099} {"train_loss": -5.616245269775391, "global_step": 46181, "epoch": 1099} {"train_loss": -5.712494850158691, "global_step": 46182, "epoch": 1099} {"train_loss": -5.695857048034668, "global_step": 46183, "epoch": 1099} {"train_loss": -5.7411394119262695, "global_step": 46184, "epoch": 1099} {"train_loss": -5.560807704925537, "global_step": 46185, "epoch": 1099} {"train_loss": -5.706218719482422, "global_step": 46186, "epoch": 1099} {"train_loss": -5.681206703186035, "global_step": 46187, "epoch": 1099} {"train_loss": -5.861626625061035, "global_step": 46188, "epoch": 1099} {"train_loss": -5.614323139190674, "global_step": 46189, "epoch": 1099} {"train_loss": -5.752407073974609, "global_step": 46190, "epoch": 1099} {"train_loss": -5.752509117126465, "global_step": 46191, "epoch": 1099} {"train_loss": -5.714669704437256, "global_step": 46192, "epoch": 1099} {"train_loss": -5.693821430206299, "global_step": 46193, "epoch": 1099} {"train_loss": -5.735805511474609, "global_step": 46194, "epoch": 1099} {"train_loss": -5.794079303741455, "global_step": 46195, "epoch": 1099} {"train_loss": -5.7004780769348145, "global_step": 46196, "epoch": 1099} {"train_loss": -5.7388811111450195, "global_step": 46197, "epoch": 1099} {"train_loss": -5.7837724685668945, "global_step": 46198, "epoch": 1099} {"train_loss": -5.714365550449917, "global_step": 46199, "epoch": 1099, "val_loss": 74618.4296875} {"train_loss": -5.71946382522583, "global_step": 46200, "epoch": 1100} {"train_loss": -5.828854084014893, "global_step": 46201, "epoch": 1100} {"train_loss": -5.621241569519043, "global_step": 46202, "epoch": 1100} {"train_loss": -5.614483833312988, "global_step": 46203, "epoch": 1100} {"train_loss": -5.712793827056885, "global_step": 46204, "epoch": 1100} {"train_loss": -5.609204292297363, "global_step": 46205, "epoch": 1100} {"train_loss": -5.802756309509277, "global_step": 46206, "epoch": 1100} {"train_loss": -5.7315592765808105, "global_step": 46207, "epoch": 1100} {"train_loss": -5.625556468963623, "global_step": 46208, "epoch": 1100} {"train_loss": -5.742621421813965, "global_step": 46209, "epoch": 1100} {"train_loss": -5.733498573303223, "global_step": 46210, "epoch": 1100} {"train_loss": -5.542373180389404, "global_step": 46211, "epoch": 1100} {"train_loss": -5.641948699951172, "global_step": 46212, "epoch": 1100} {"train_loss": -5.751344203948975, "global_step": 46213, "epoch": 1100} {"train_loss": -5.845810890197754, "global_step": 46214, "epoch": 1100} {"train_loss": -5.729368209838867, "global_step": 46215, "epoch": 1100} {"train_loss": -5.705443382263184, "global_step": 46216, "epoch": 1100} {"train_loss": -5.749738693237305, "global_step": 46217, "epoch": 1100} {"train_loss": -5.697151184082031, "global_step": 46218, "epoch": 1100} {"train_loss": -5.664823532104492, "global_step": 46219, "epoch": 1100} {"train_loss": -5.672245979309082, "global_step": 46220, "epoch": 1100} {"train_loss": -5.76580810546875, "global_step": 46221, "epoch": 1100} {"train_loss": -5.760400295257568, "global_step": 46222, "epoch": 1100} {"train_loss": -5.793224811553955, "global_step": 46223, "epoch": 1100} {"train_loss": -5.709277153015137, "global_step": 46224, "epoch": 1100} {"train_loss": -5.801517486572266, "global_step": 46225, "epoch": 1100} {"train_loss": -5.760472774505615, "global_step": 46226, "epoch": 1100} {"train_loss": -5.689872741699219, "global_step": 46227, "epoch": 1100} {"train_loss": -5.759674072265625, "global_step": 46228, "epoch": 1100} {"train_loss": -5.8723859786987305, "global_step": 46229, "epoch": 1100} {"train_loss": -5.741522312164307, "global_step": 46230, "epoch": 1100} {"train_loss": -5.7972941398620605, "global_step": 46231, "epoch": 1100} {"train_loss": -5.7578864097595215, "global_step": 46232, "epoch": 1100} {"train_loss": -5.75779914855957, "global_step": 46233, "epoch": 1100} {"train_loss": -5.613509178161621, "global_step": 46234, "epoch": 1100} {"train_loss": -5.767003059387207, "global_step": 46235, "epoch": 1100} {"train_loss": -5.717555522918701, "global_step": 46236, "epoch": 1100} {"train_loss": -5.695234298706055, "global_step": 46237, "epoch": 1100} {"train_loss": -5.842623710632324, "global_step": 46238, "epoch": 1100} {"train_loss": -5.6456298828125, "global_step": 46239, "epoch": 1100} {"train_loss": -5.710812568664551, "global_step": 46240, "epoch": 1100} {"train_loss": -5.727283159891765, "global_step": 46241, "epoch": 1100, "train/sim_max_reward_0": 0.5609207729434496, "train/sim_max_reward_1": 0.7748882433759743, "train/sim_max_reward_2": 0.4714512359870268, "train/sim_max_reward_3": 0.15404012846353785, "train/sim_max_reward_4": 0.9063951191407963, "train/sim_max_reward_5": 0.9404000751804351, "test/sim_max_reward_4500000": 0.7252324325643741, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.6461746528616037, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.054580065317177094, "test/sim_max_reward_4500005": 0.39208435577071704, "test/sim_max_reward_4500006": 0.683106248660195, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.009461953320122885, "test/sim_max_reward_4500009": 0.2735369574750792, "test/sim_max_reward_4500010": 0.8541089101804608, "test/sim_max_reward_4500011": 0.7683600135432692, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.3787561851675076, "test/sim_max_reward_4500015": 0.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0, "test/sim_max_reward_4500018": 0.004249031229020703, "test/sim_max_reward_4500019": 0.9341031530080547, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8560741136111284, "test/sim_max_reward_4500022": 0.593736780684158, "test/sim_max_reward_4500023": 0.801079546585824, "test/sim_max_reward_4500024": 0.7460499948934725, "test/sim_max_reward_4500025": 0.3521146581626666, "test/sim_max_reward_4500026": 0.1574603243630826, "test/sim_max_reward_4500027": 0.8635661575431272, "test/sim_max_reward_4500028": 0.188886229065905, "test/sim_max_reward_4500029": 0.31130224956812685, "test/sim_max_reward_4500030": 0.9346974741900298, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.21666726707165554, "test/sim_max_reward_4500034": 0.9095410946096143, "test/sim_max_reward_4500035": 0.8043280648222568, "test/sim_max_reward_4500036": 0.3902291629442461, "test/sim_max_reward_4500037": 0.5475783878134362, "test/sim_max_reward_4500038": 0.3429887630769499, "test/sim_max_reward_4500039": 0.715291909736487, "test/sim_max_reward_4500040": 0.9125339925006309, "test/sim_max_reward_4500041": 0.3594391074682488, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.43468690072792504, "test/sim_max_reward_4500045": 0.3621919357476743, "test/sim_max_reward_4500046": 0.8604657252679974, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.7668039547313544, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6346825958485366, "test/mean_score": 0.384798567519902, "val_loss": 74281.40625} {"train_loss": -5.7080888748168945, "global_step": 46242, "epoch": 1101} {"train_loss": -5.6445465087890625, "global_step": 46243, "epoch": 1101} {"train_loss": -5.752806663513184, "global_step": 46244, "epoch": 1101} {"train_loss": -5.846263885498047, "global_step": 46245, "epoch": 1101} {"train_loss": -5.822298049926758, "global_step": 46246, "epoch": 1101} {"train_loss": -5.682621002197266, "global_step": 46247, "epoch": 1101} {"train_loss": -5.6886067390441895, "global_step": 46248, "epoch": 1101} {"train_loss": -5.649566650390625, "global_step": 46249, "epoch": 1101} {"train_loss": -5.608138084411621, "global_step": 46250, "epoch": 1101} {"train_loss": -5.7868523597717285, "global_step": 46251, "epoch": 1101} {"train_loss": -5.650417804718018, "global_step": 46252, "epoch": 1101} {"train_loss": -5.660019874572754, "global_step": 46253, "epoch": 1101} {"train_loss": -5.778337478637695, "global_step": 46254, "epoch": 1101} {"train_loss": -5.786732196807861, "global_step": 46255, "epoch": 1101} {"train_loss": -5.699580669403076, "global_step": 46256, "epoch": 1101} {"train_loss": -5.767626762390137, "global_step": 46257, "epoch": 1101} {"train_loss": -5.698860168457031, "global_step": 46258, "epoch": 1101} {"train_loss": -5.732954978942871, "global_step": 46259, "epoch": 1101} {"train_loss": -5.573386192321777, "global_step": 46260, "epoch": 1101} {"train_loss": -5.742448806762695, "global_step": 46261, "epoch": 1101} {"train_loss": -5.961809158325195, "global_step": 46262, "epoch": 1101} {"train_loss": -5.8184614181518555, "global_step": 46263, "epoch": 1101} {"train_loss": -5.73226261138916, "global_step": 46264, "epoch": 1101} {"train_loss": -5.792919158935547, "global_step": 46265, "epoch": 1101} {"train_loss": -5.792332649230957, "global_step": 46266, "epoch": 1101} {"train_loss": -5.753391742706299, "global_step": 46267, "epoch": 1101} {"train_loss": -5.832254409790039, "global_step": 46268, "epoch": 1101} {"train_loss": -5.666744709014893, "global_step": 46269, "epoch": 1101} {"train_loss": -5.70896053314209, "global_step": 46270, "epoch": 1101} {"train_loss": -5.768597602844238, "global_step": 46271, "epoch": 1101} {"train_loss": -5.756037712097168, "global_step": 46272, "epoch": 1101} {"train_loss": -5.75559139251709, "global_step": 46273, "epoch": 1101} {"train_loss": -5.712790489196777, "global_step": 46274, "epoch": 1101} {"train_loss": -5.746877193450928, "global_step": 46275, "epoch": 1101} {"train_loss": -5.661046028137207, "global_step": 46276, "epoch": 1101} {"train_loss": -5.711712837219238, "global_step": 46277, "epoch": 1101} {"train_loss": -5.745309829711914, "global_step": 46278, "epoch": 1101} {"train_loss": -5.740570068359375, "global_step": 46279, "epoch": 1101} {"train_loss": -5.75008487701416, "global_step": 46280, "epoch": 1101} {"train_loss": -5.700929164886475, "global_step": 46281, "epoch": 1101} {"train_loss": -5.714298248291016, "global_step": 46282, "epoch": 1101} {"train_loss": -5.733800524757022, "global_step": 46283, "epoch": 1101, "val_loss": 74049.4453125} {"train_loss": -5.783346652984619, "global_step": 46284, "epoch": 1102} {"train_loss": -5.711275100708008, "global_step": 46285, "epoch": 1102} {"train_loss": -5.857220649719238, "global_step": 46286, "epoch": 1102} {"train_loss": -5.855750560760498, "global_step": 46287, "epoch": 1102} {"train_loss": -5.72073221206665, "global_step": 46288, "epoch": 1102} {"train_loss": -5.734018325805664, "global_step": 46289, "epoch": 1102} {"train_loss": -5.78272819519043, "global_step": 46290, "epoch": 1102} {"train_loss": -5.6068220138549805, "global_step": 46291, "epoch": 1102} {"train_loss": -5.798894882202148, "global_step": 46292, "epoch": 1102} {"train_loss": -5.720212936401367, "global_step": 46293, "epoch": 1102} {"train_loss": -5.688665390014648, "global_step": 46294, "epoch": 1102} {"train_loss": -5.665735721588135, "global_step": 46295, "epoch": 1102} {"train_loss": -5.625919342041016, "global_step": 46296, "epoch": 1102} {"train_loss": -5.622053146362305, "global_step": 46297, "epoch": 1102} {"train_loss": -5.733407497406006, "global_step": 46298, "epoch": 1102} {"train_loss": -5.626051425933838, "global_step": 46299, "epoch": 1102} {"train_loss": -5.884007453918457, "global_step": 46300, "epoch": 1102} {"train_loss": -5.746522903442383, "global_step": 46301, "epoch": 1102} {"train_loss": -5.658490180969238, "global_step": 46302, "epoch": 1102} {"train_loss": -5.816547393798828, "global_step": 46303, "epoch": 1102} {"train_loss": -5.678924560546875, "global_step": 46304, "epoch": 1102} {"train_loss": -5.679588317871094, "global_step": 46305, "epoch": 1102} {"train_loss": -5.739828109741211, "global_step": 46306, "epoch": 1102} {"train_loss": -5.757803916931152, "global_step": 46307, "epoch": 1102} {"train_loss": -5.689557075500488, "global_step": 46308, "epoch": 1102} {"train_loss": -5.649295330047607, "global_step": 46309, "epoch": 1102} {"train_loss": -5.67604923248291, "global_step": 46310, "epoch": 1102} {"train_loss": -5.736261367797852, "global_step": 46311, "epoch": 1102} {"train_loss": -5.552634239196777, "global_step": 46312, "epoch": 1102} {"train_loss": -5.807770729064941, "global_step": 46313, "epoch": 1102} {"train_loss": -5.552609443664551, "global_step": 46314, "epoch": 1102} {"train_loss": -5.730210304260254, "global_step": 46315, "epoch": 1102} {"train_loss": -5.787445545196533, "global_step": 46316, "epoch": 1102} {"train_loss": -5.628787040710449, "global_step": 46317, "epoch": 1102} {"train_loss": -5.597734451293945, "global_step": 46318, "epoch": 1102} {"train_loss": -5.631814002990723, "global_step": 46319, "epoch": 1102} {"train_loss": -5.638965129852295, "global_step": 46320, "epoch": 1102} {"train_loss": -5.747347354888916, "global_step": 46321, "epoch": 1102} {"train_loss": -5.803482532501221, "global_step": 46322, "epoch": 1102} {"train_loss": -5.6240997314453125, "global_step": 46323, "epoch": 1102} {"train_loss": -5.643232345581055, "global_step": 46324, "epoch": 1102} {"train_loss": -5.704399619783674, "global_step": 46325, "epoch": 1102, "val_loss": 73934.9921875} {"train_loss": -5.726227760314941, "global_step": 46326, "epoch": 1103} {"train_loss": -5.548954963684082, "global_step": 46327, "epoch": 1103} {"train_loss": -5.821197509765625, "global_step": 46328, "epoch": 1103} {"train_loss": -5.69985818862915, "global_step": 46329, "epoch": 1103} {"train_loss": -5.755917549133301, "global_step": 46330, "epoch": 1103} {"train_loss": -5.684796333312988, "global_step": 46331, "epoch": 1103} {"train_loss": -5.766747951507568, "global_step": 46332, "epoch": 1103} {"train_loss": -5.60715389251709, "global_step": 46333, "epoch": 1103} {"train_loss": -5.844507217407227, "global_step": 46334, "epoch": 1103} {"train_loss": -5.763745307922363, "global_step": 46335, "epoch": 1103} {"train_loss": -5.720874309539795, "global_step": 46336, "epoch": 1103} {"train_loss": -5.762931823730469, "global_step": 46337, "epoch": 1103} {"train_loss": -5.666841506958008, "global_step": 46338, "epoch": 1103} {"train_loss": -5.830531597137451, "global_step": 46339, "epoch": 1103} {"train_loss": -5.761523246765137, "global_step": 46340, "epoch": 1103} {"train_loss": -5.715909004211426, "global_step": 46341, "epoch": 1103} {"train_loss": -5.86043119430542, "global_step": 46342, "epoch": 1103} {"train_loss": -5.699938774108887, "global_step": 46343, "epoch": 1103} {"train_loss": -5.751492500305176, "global_step": 46344, "epoch": 1103} {"train_loss": -5.864211559295654, "global_step": 46345, "epoch": 1103} {"train_loss": -5.725870132446289, "global_step": 46346, "epoch": 1103} {"train_loss": -5.5928263664245605, "global_step": 46347, "epoch": 1103} {"train_loss": -5.823971748352051, "global_step": 46348, "epoch": 1103} {"train_loss": -5.73570442199707, "global_step": 46349, "epoch": 1103} {"train_loss": -5.650353908538818, "global_step": 46350, "epoch": 1103} {"train_loss": -5.662086486816406, "global_step": 46351, "epoch": 1103} {"train_loss": -5.7993879318237305, "global_step": 46352, "epoch": 1103} {"train_loss": -5.74782657623291, "global_step": 46353, "epoch": 1103} {"train_loss": -5.715137481689453, "global_step": 46354, "epoch": 1103} {"train_loss": -5.717597007751465, "global_step": 46355, "epoch": 1103} {"train_loss": -5.805848121643066, "global_step": 46356, "epoch": 1103} {"train_loss": -5.73673677444458, "global_step": 46357, "epoch": 1103} {"train_loss": -5.756930828094482, "global_step": 46358, "epoch": 1103} {"train_loss": -5.671784400939941, "global_step": 46359, "epoch": 1103} {"train_loss": -5.649176120758057, "global_step": 46360, "epoch": 1103} {"train_loss": -5.716331481933594, "global_step": 46361, "epoch": 1103} {"train_loss": -5.757615566253662, "global_step": 46362, "epoch": 1103} {"train_loss": -5.7092204093933105, "global_step": 46363, "epoch": 1103} {"train_loss": -5.659141540527344, "global_step": 46364, "epoch": 1103} {"train_loss": -5.683832168579102, "global_step": 46365, "epoch": 1103} {"train_loss": -5.800544738769531, "global_step": 46366, "epoch": 1103} {"train_loss": -5.727918499992008, "global_step": 46367, "epoch": 1103, "val_loss": 74435.7421875} {"train_loss": -5.823827743530273, "global_step": 46368, "epoch": 1104} {"train_loss": -5.528943061828613, "global_step": 46369, "epoch": 1104} {"train_loss": -5.7072062492370605, "global_step": 46370, "epoch": 1104} {"train_loss": -5.773639678955078, "global_step": 46371, "epoch": 1104} {"train_loss": -5.8325514793396, "global_step": 46372, "epoch": 1104} {"train_loss": -5.766642093658447, "global_step": 46373, "epoch": 1104} {"train_loss": -5.720431804656982, "global_step": 46374, "epoch": 1104} {"train_loss": -5.704285144805908, "global_step": 46375, "epoch": 1104} {"train_loss": -5.7087836265563965, "global_step": 46376, "epoch": 1104} {"train_loss": -5.731657028198242, "global_step": 46377, "epoch": 1104} {"train_loss": -5.686286449432373, "global_step": 46378, "epoch": 1104} {"train_loss": -5.8098320960998535, "global_step": 46379, "epoch": 1104} {"train_loss": -5.7790846824646, "global_step": 46380, "epoch": 1104} {"train_loss": -5.785285472869873, "global_step": 46381, "epoch": 1104} {"train_loss": -5.619223594665527, "global_step": 46382, "epoch": 1104} {"train_loss": -5.783624172210693, "global_step": 46383, "epoch": 1104} {"train_loss": -5.741427421569824, "global_step": 46384, "epoch": 1104} {"train_loss": -5.7693071365356445, "global_step": 46385, "epoch": 1104} {"train_loss": -5.728575229644775, "global_step": 46386, "epoch": 1104} {"train_loss": -5.751266956329346, "global_step": 46387, "epoch": 1104} {"train_loss": -5.790590286254883, "global_step": 46388, "epoch": 1104} {"train_loss": -5.731412887573242, "global_step": 46389, "epoch": 1104} {"train_loss": -5.695840358734131, "global_step": 46390, "epoch": 1104} {"train_loss": -5.768020153045654, "global_step": 46391, "epoch": 1104} {"train_loss": -5.646535873413086, "global_step": 46392, "epoch": 1104} {"train_loss": -5.709892272949219, "global_step": 46393, "epoch": 1104} {"train_loss": -5.695630073547363, "global_step": 46394, "epoch": 1104} {"train_loss": -5.634214878082275, "global_step": 46395, "epoch": 1104} {"train_loss": -5.665339469909668, "global_step": 46396, "epoch": 1104} {"train_loss": -5.708497047424316, "global_step": 46397, "epoch": 1104} {"train_loss": -5.713401794433594, "global_step": 46398, "epoch": 1104} {"train_loss": -5.565947532653809, "global_step": 46399, "epoch": 1104} {"train_loss": -5.76953125, "global_step": 46400, "epoch": 1104} {"train_loss": -5.716827392578125, "global_step": 46401, "epoch": 1104} {"train_loss": -5.524714469909668, "global_step": 46402, "epoch": 1104} {"train_loss": -5.70295524597168, "global_step": 46403, "epoch": 1104} {"train_loss": -5.608098983764648, "global_step": 46404, "epoch": 1104} {"train_loss": -5.715244293212891, "global_step": 46405, "epoch": 1104} {"train_loss": -5.644043922424316, "global_step": 46406, "epoch": 1104} {"train_loss": -5.6945390701293945, "global_step": 46407, "epoch": 1104} {"train_loss": -5.739165306091309, "global_step": 46408, "epoch": 1104} {"train_loss": -5.711003678185599, "global_step": 46409, "epoch": 1104, "val_loss": 74323.96875} {"train_loss": -5.631487846374512, "global_step": 46410, "epoch": 1105} {"train_loss": -5.692070484161377, "global_step": 46411, "epoch": 1105} {"train_loss": -5.66862678527832, "global_step": 46412, "epoch": 1105} {"train_loss": -5.709174156188965, "global_step": 46413, "epoch": 1105} {"train_loss": -5.74286413192749, "global_step": 46414, "epoch": 1105} {"train_loss": -5.704207420349121, "global_step": 46415, "epoch": 1105} {"train_loss": -5.7155914306640625, "global_step": 46416, "epoch": 1105} {"train_loss": -5.638467788696289, "global_step": 46417, "epoch": 1105} {"train_loss": -5.615203380584717, "global_step": 46418, "epoch": 1105} {"train_loss": -5.744817733764648, "global_step": 46419, "epoch": 1105} {"train_loss": -5.852264881134033, "global_step": 46420, "epoch": 1105} {"train_loss": -5.709294319152832, "global_step": 46421, "epoch": 1105} {"train_loss": -5.757150650024414, "global_step": 46422, "epoch": 1105} {"train_loss": -5.740146636962891, "global_step": 46423, "epoch": 1105} {"train_loss": -5.631287574768066, "global_step": 46424, "epoch": 1105} {"train_loss": -5.774804592132568, "global_step": 46425, "epoch": 1105} {"train_loss": -5.60221004486084, "global_step": 46426, "epoch": 1105} {"train_loss": -5.604120254516602, "global_step": 46427, "epoch": 1105} {"train_loss": -5.70904541015625, "global_step": 46428, "epoch": 1105} {"train_loss": -5.648578643798828, "global_step": 46429, "epoch": 1105} {"train_loss": -5.685802936553955, "global_step": 46430, "epoch": 1105} {"train_loss": -5.724394798278809, "global_step": 46431, "epoch": 1105} {"train_loss": -5.785874366760254, "global_step": 46432, "epoch": 1105} {"train_loss": -5.624905586242676, "global_step": 46433, "epoch": 1105} {"train_loss": -5.656863212585449, "global_step": 46434, "epoch": 1105} {"train_loss": -5.845484256744385, "global_step": 46435, "epoch": 1105} {"train_loss": -5.813467979431152, "global_step": 46436, "epoch": 1105} {"train_loss": -5.775814056396484, "global_step": 46437, "epoch": 1105} {"train_loss": -5.744071006774902, "global_step": 46438, "epoch": 1105} {"train_loss": -5.694043159484863, "global_step": 46439, "epoch": 1105} {"train_loss": -5.732809066772461, "global_step": 46440, "epoch": 1105} {"train_loss": -5.712497711181641, "global_step": 46441, "epoch": 1105} {"train_loss": -5.709206581115723, "global_step": 46442, "epoch": 1105} {"train_loss": -5.733724117279053, "global_step": 46443, "epoch": 1105} {"train_loss": -5.732830047607422, "global_step": 46444, "epoch": 1105} {"train_loss": -5.72166633605957, "global_step": 46445, "epoch": 1105} {"train_loss": -5.55357027053833, "global_step": 46446, "epoch": 1105} {"train_loss": -5.81979513168335, "global_step": 46447, "epoch": 1105} {"train_loss": -5.576936721801758, "global_step": 46448, "epoch": 1105} {"train_loss": -5.542226791381836, "global_step": 46449, "epoch": 1105} {"train_loss": -5.66262149810791, "global_step": 46450, "epoch": 1105} {"train_loss": -5.700177885237194, "global_step": 46451, "epoch": 1105, "val_loss": 74340.390625} {"train_loss": -5.709555149078369, "global_step": 46452, "epoch": 1106} {"train_loss": -5.7885847091674805, "global_step": 46453, "epoch": 1106} {"train_loss": -5.605870246887207, "global_step": 46454, "epoch": 1106} {"train_loss": -5.684684753417969, "global_step": 46455, "epoch": 1106} {"train_loss": -5.624350547790527, "global_step": 46456, "epoch": 1106} {"train_loss": -5.710265159606934, "global_step": 46457, "epoch": 1106} {"train_loss": -5.567100524902344, "global_step": 46458, "epoch": 1106} {"train_loss": -5.6461076736450195, "global_step": 46459, "epoch": 1106} {"train_loss": -5.7636942863464355, "global_step": 46460, "epoch": 1106} {"train_loss": -5.706445217132568, "global_step": 46461, "epoch": 1106} {"train_loss": -5.744622230529785, "global_step": 46462, "epoch": 1106} {"train_loss": -5.695337295532227, "global_step": 46463, "epoch": 1106} {"train_loss": -5.7978925704956055, "global_step": 46464, "epoch": 1106} {"train_loss": -5.689919471740723, "global_step": 46465, "epoch": 1106} {"train_loss": -5.656162261962891, "global_step": 46466, "epoch": 1106} {"train_loss": -5.627828121185303, "global_step": 46467, "epoch": 1106} {"train_loss": -5.618363380432129, "global_step": 46468, "epoch": 1106} {"train_loss": -5.763691425323486, "global_step": 46469, "epoch": 1106} {"train_loss": -5.652768611907959, "global_step": 46470, "epoch": 1106} {"train_loss": -5.623706817626953, "global_step": 46471, "epoch": 1106} {"train_loss": -5.646719455718994, "global_step": 46472, "epoch": 1106} {"train_loss": -5.781327247619629, "global_step": 46473, "epoch": 1106} {"train_loss": -5.667362213134766, "global_step": 46474, "epoch": 1106} {"train_loss": -5.716362953186035, "global_step": 46475, "epoch": 1106} {"train_loss": -5.6979146003723145, "global_step": 46476, "epoch": 1106} {"train_loss": -5.775742053985596, "global_step": 46477, "epoch": 1106} {"train_loss": -5.73928165435791, "global_step": 46478, "epoch": 1106} {"train_loss": -5.640992164611816, "global_step": 46479, "epoch": 1106} {"train_loss": -5.683753967285156, "global_step": 46480, "epoch": 1106} {"train_loss": -5.787740707397461, "global_step": 46481, "epoch": 1106} {"train_loss": -5.7450408935546875, "global_step": 46482, "epoch": 1106} {"train_loss": -5.838281631469727, "global_step": 46483, "epoch": 1106} {"train_loss": -5.659000873565674, "global_step": 46484, "epoch": 1106} {"train_loss": -5.697388648986816, "global_step": 46485, "epoch": 1106} {"train_loss": -5.743349075317383, "global_step": 46486, "epoch": 1106} {"train_loss": -5.6475701332092285, "global_step": 46487, "epoch": 1106} {"train_loss": -5.836463928222656, "global_step": 46488, "epoch": 1106} {"train_loss": -5.723470687866211, "global_step": 46489, "epoch": 1106} {"train_loss": -5.766687393188477, "global_step": 46490, "epoch": 1106} {"train_loss": -5.748254776000977, "global_step": 46491, "epoch": 1106} {"train_loss": -5.687137603759766, "global_step": 46492, "epoch": 1106} {"train_loss": -5.706474951335362, "global_step": 46493, "epoch": 1106, "val_loss": 74246.640625} {"train_loss": -5.64738655090332, "global_step": 46494, "epoch": 1107} {"train_loss": -5.69462776184082, "global_step": 46495, "epoch": 1107} {"train_loss": -5.680624008178711, "global_step": 46496, "epoch": 1107} {"train_loss": -5.736752510070801, "global_step": 46497, "epoch": 1107} {"train_loss": -5.712750434875488, "global_step": 46498, "epoch": 1107} {"train_loss": -5.663716793060303, "global_step": 46499, "epoch": 1107} {"train_loss": -5.749320983886719, "global_step": 46500, "epoch": 1107} {"train_loss": -5.719249725341797, "global_step": 46501, "epoch": 1107} {"train_loss": -5.74235725402832, "global_step": 46502, "epoch": 1107} {"train_loss": -5.833981037139893, "global_step": 46503, "epoch": 1107} {"train_loss": -5.9518585205078125, "global_step": 46504, "epoch": 1107} {"train_loss": -5.856978893280029, "global_step": 46505, "epoch": 1107} {"train_loss": -5.685669898986816, "global_step": 46506, "epoch": 1107} {"train_loss": -5.725049018859863, "global_step": 46507, "epoch": 1107} {"train_loss": -5.795276641845703, "global_step": 46508, "epoch": 1107} {"train_loss": -5.703856468200684, "global_step": 46509, "epoch": 1107} {"train_loss": -5.659511566162109, "global_step": 46510, "epoch": 1107} {"train_loss": -5.7780256271362305, "global_step": 46511, "epoch": 1107} {"train_loss": -5.713754177093506, "global_step": 46512, "epoch": 1107} {"train_loss": -5.767025947570801, "global_step": 46513, "epoch": 1107} {"train_loss": -5.683794021606445, "global_step": 46514, "epoch": 1107} {"train_loss": -5.750020503997803, "global_step": 46515, "epoch": 1107} {"train_loss": -5.742566108703613, "global_step": 46516, "epoch": 1107} {"train_loss": -5.668343544006348, "global_step": 46517, "epoch": 1107} {"train_loss": -5.740959167480469, "global_step": 46518, "epoch": 1107} {"train_loss": -5.768107891082764, "global_step": 46519, "epoch": 1107} {"train_loss": -5.769787311553955, "global_step": 46520, "epoch": 1107} {"train_loss": -5.822658538818359, "global_step": 46521, "epoch": 1107} {"train_loss": -5.760363578796387, "global_step": 46522, "epoch": 1107} {"train_loss": -5.7645263671875, "global_step": 46523, "epoch": 1107} {"train_loss": -5.698195457458496, "global_step": 46524, "epoch": 1107} {"train_loss": -5.618136405944824, "global_step": 46525, "epoch": 1107} {"train_loss": -5.81593656539917, "global_step": 46526, "epoch": 1107} {"train_loss": -5.679928779602051, "global_step": 46527, "epoch": 1107} {"train_loss": -5.644130706787109, "global_step": 46528, "epoch": 1107} {"train_loss": -5.68631649017334, "global_step": 46529, "epoch": 1107} {"train_loss": -5.62632417678833, "global_step": 46530, "epoch": 1107} {"train_loss": -5.640071392059326, "global_step": 46531, "epoch": 1107} {"train_loss": -5.812560081481934, "global_step": 46532, "epoch": 1107} {"train_loss": -5.755466938018799, "global_step": 46533, "epoch": 1107} {"train_loss": -5.62241268157959, "global_step": 46534, "epoch": 1107} {"train_loss": -5.728348981766474, "global_step": 46535, "epoch": 1107, "val_loss": 74189.265625} {"train_loss": -5.606681823730469, "global_step": 46536, "epoch": 1108} {"train_loss": -5.748312950134277, "global_step": 46537, "epoch": 1108} {"train_loss": -5.7341084480285645, "global_step": 46538, "epoch": 1108} {"train_loss": -5.705488204956055, "global_step": 46539, "epoch": 1108} {"train_loss": -5.693058490753174, "global_step": 46540, "epoch": 1108} {"train_loss": -5.653409957885742, "global_step": 46541, "epoch": 1108} {"train_loss": -5.69000244140625, "global_step": 46542, "epoch": 1108} {"train_loss": -5.573990821838379, "global_step": 46543, "epoch": 1108} {"train_loss": -5.814910411834717, "global_step": 46544, "epoch": 1108} {"train_loss": -5.5805463790893555, "global_step": 46545, "epoch": 1108} {"train_loss": -5.603102684020996, "global_step": 46546, "epoch": 1108} {"train_loss": -5.668600559234619, "global_step": 46547, "epoch": 1108} {"train_loss": -5.6533660888671875, "global_step": 46548, "epoch": 1108} {"train_loss": -5.692843437194824, "global_step": 46549, "epoch": 1108} {"train_loss": -5.648797035217285, "global_step": 46550, "epoch": 1108} {"train_loss": -5.729545593261719, "global_step": 46551, "epoch": 1108} {"train_loss": -5.729997634887695, "global_step": 46552, "epoch": 1108} {"train_loss": -5.750308513641357, "global_step": 46553, "epoch": 1108} {"train_loss": -5.744772911071777, "global_step": 46554, "epoch": 1108} {"train_loss": -5.6882829666137695, "global_step": 46555, "epoch": 1108} {"train_loss": -5.83864688873291, "global_step": 46556, "epoch": 1108} {"train_loss": -5.690720558166504, "global_step": 46557, "epoch": 1108} {"train_loss": -5.720420837402344, "global_step": 46558, "epoch": 1108} {"train_loss": -5.820569038391113, "global_step": 46559, "epoch": 1108} {"train_loss": -5.640247344970703, "global_step": 46560, "epoch": 1108} {"train_loss": -5.714489936828613, "global_step": 46561, "epoch": 1108} {"train_loss": -5.709758758544922, "global_step": 46562, "epoch": 1108} {"train_loss": -5.749783515930176, "global_step": 46563, "epoch": 1108} {"train_loss": -5.72157621383667, "global_step": 46564, "epoch": 1108} {"train_loss": -5.7769317626953125, "global_step": 46565, "epoch": 1108} {"train_loss": -5.731115341186523, "global_step": 46566, "epoch": 1108} {"train_loss": -5.5934739112854, "global_step": 46567, "epoch": 1108} {"train_loss": -5.697410583496094, "global_step": 46568, "epoch": 1108} {"train_loss": -5.632928371429443, "global_step": 46569, "epoch": 1108} {"train_loss": -5.746079444885254, "global_step": 46570, "epoch": 1108} {"train_loss": -5.7398786544799805, "global_step": 46571, "epoch": 1108} {"train_loss": -5.707528114318848, "global_step": 46572, "epoch": 1108} {"train_loss": -5.657986640930176, "global_step": 46573, "epoch": 1108} {"train_loss": -5.638110160827637, "global_step": 46574, "epoch": 1108} {"train_loss": -5.62459135055542, "global_step": 46575, "epoch": 1108} {"train_loss": -5.576179504394531, "global_step": 46576, "epoch": 1108} {"train_loss": -5.695296378362746, "global_step": 46577, "epoch": 1108, "val_loss": 74309.5390625} {"train_loss": -5.575519561767578, "global_step": 46578, "epoch": 1109} {"train_loss": -5.47424840927124, "global_step": 46579, "epoch": 1109} {"train_loss": -5.769952774047852, "global_step": 46580, "epoch": 1109} {"train_loss": -5.485007286071777, "global_step": 46581, "epoch": 1109} {"train_loss": -5.716274261474609, "global_step": 46582, "epoch": 1109} {"train_loss": -5.7764739990234375, "global_step": 46583, "epoch": 1109} {"train_loss": -5.617223739624023, "global_step": 46584, "epoch": 1109} {"train_loss": -5.731454849243164, "global_step": 46585, "epoch": 1109} {"train_loss": -5.736721992492676, "global_step": 46586, "epoch": 1109} {"train_loss": -5.666886806488037, "global_step": 46587, "epoch": 1109} {"train_loss": -5.693852424621582, "global_step": 46588, "epoch": 1109} {"train_loss": -5.561369895935059, "global_step": 46589, "epoch": 1109} {"train_loss": -5.771367073059082, "global_step": 46590, "epoch": 1109} {"train_loss": -5.673317909240723, "global_step": 46591, "epoch": 1109} {"train_loss": -5.767200469970703, "global_step": 46592, "epoch": 1109} {"train_loss": -5.608654499053955, "global_step": 46593, "epoch": 1109} {"train_loss": -5.723470687866211, "global_step": 46594, "epoch": 1109} {"train_loss": -5.766643047332764, "global_step": 46595, "epoch": 1109} {"train_loss": -5.6868133544921875, "global_step": 46596, "epoch": 1109} {"train_loss": -5.822536945343018, "global_step": 46597, "epoch": 1109} {"train_loss": -5.842311859130859, "global_step": 46598, "epoch": 1109} {"train_loss": -5.780817031860352, "global_step": 46599, "epoch": 1109} {"train_loss": -5.8054304122924805, "global_step": 46600, "epoch": 1109} {"train_loss": -5.827452659606934, "global_step": 46601, "epoch": 1109} {"train_loss": -5.725111961364746, "global_step": 46602, "epoch": 1109} {"train_loss": -5.875004768371582, "global_step": 46603, "epoch": 1109} {"train_loss": -5.6500043869018555, "global_step": 46604, "epoch": 1109} {"train_loss": -5.652684211730957, "global_step": 46605, "epoch": 1109} {"train_loss": -5.748664855957031, "global_step": 46606, "epoch": 1109} {"train_loss": -5.732089996337891, "global_step": 46607, "epoch": 1109} {"train_loss": -5.689464092254639, "global_step": 46608, "epoch": 1109} {"train_loss": -5.7740678787231445, "global_step": 46609, "epoch": 1109} {"train_loss": -5.689857482910156, "global_step": 46610, "epoch": 1109} {"train_loss": -5.632565975189209, "global_step": 46611, "epoch": 1109} {"train_loss": -5.663029670715332, "global_step": 46612, "epoch": 1109} {"train_loss": -5.720949172973633, "global_step": 46613, "epoch": 1109} {"train_loss": -5.604589462280273, "global_step": 46614, "epoch": 1109} {"train_loss": -5.781835556030273, "global_step": 46615, "epoch": 1109} {"train_loss": -5.756956577301025, "global_step": 46616, "epoch": 1109} {"train_loss": -5.748838424682617, "global_step": 46617, "epoch": 1109} {"train_loss": -5.583898544311523, "global_step": 46618, "epoch": 1109} {"train_loss": -5.706470727920532, "global_step": 46619, "epoch": 1109, "val_loss": 74368.5546875} {"train_loss": -5.787683486938477, "global_step": 46620, "epoch": 1110} {"train_loss": -5.678140163421631, "global_step": 46621, "epoch": 1110} {"train_loss": -5.76322078704834, "global_step": 46622, "epoch": 1110} {"train_loss": -5.764455318450928, "global_step": 46623, "epoch": 1110} {"train_loss": -5.708853721618652, "global_step": 46624, "epoch": 1110} {"train_loss": -5.615917205810547, "global_step": 46625, "epoch": 1110} {"train_loss": -5.699204921722412, "global_step": 46626, "epoch": 1110} {"train_loss": -5.674154281616211, "global_step": 46627, "epoch": 1110} {"train_loss": -5.7098798751831055, "global_step": 46628, "epoch": 1110} {"train_loss": -5.76604700088501, "global_step": 46629, "epoch": 1110} {"train_loss": -5.72054386138916, "global_step": 46630, "epoch": 1110} {"train_loss": -5.759822845458984, "global_step": 46631, "epoch": 1110} {"train_loss": -5.672656536102295, "global_step": 46632, "epoch": 1110} {"train_loss": -5.693907260894775, "global_step": 46633, "epoch": 1110} {"train_loss": -5.721951484680176, "global_step": 46634, "epoch": 1110} {"train_loss": -5.698029518127441, "global_step": 46635, "epoch": 1110} {"train_loss": -5.657112121582031, "global_step": 46636, "epoch": 1110} {"train_loss": -5.7579145431518555, "global_step": 46637, "epoch": 1110} {"train_loss": -5.679332733154297, "global_step": 46638, "epoch": 1110} {"train_loss": -5.578275203704834, "global_step": 46639, "epoch": 1110} {"train_loss": -5.7623186111450195, "global_step": 46640, "epoch": 1110} {"train_loss": -5.917712211608887, "global_step": 46641, "epoch": 1110} {"train_loss": -5.862105369567871, "global_step": 46642, "epoch": 1110} {"train_loss": -5.794194221496582, "global_step": 46643, "epoch": 1110} {"train_loss": -5.8708815574646, "global_step": 46644, "epoch": 1110} {"train_loss": -5.7346649169921875, "global_step": 46645, "epoch": 1110} {"train_loss": -5.778650283813477, "global_step": 46646, "epoch": 1110} {"train_loss": -5.736690998077393, "global_step": 46647, "epoch": 1110} {"train_loss": -5.708475589752197, "global_step": 46648, "epoch": 1110} {"train_loss": -5.69504451751709, "global_step": 46649, "epoch": 1110} {"train_loss": -5.861967086791992, "global_step": 46650, "epoch": 1110} {"train_loss": -5.706195831298828, "global_step": 46651, "epoch": 1110} {"train_loss": -5.781710624694824, "global_step": 46652, "epoch": 1110} {"train_loss": -5.770570755004883, "global_step": 46653, "epoch": 1110} {"train_loss": -5.78605842590332, "global_step": 46654, "epoch": 1110} {"train_loss": -5.746822357177734, "global_step": 46655, "epoch": 1110} {"train_loss": -5.683826923370361, "global_step": 46656, "epoch": 1110} {"train_loss": -5.7366509437561035, "global_step": 46657, "epoch": 1110} {"train_loss": -5.5161919593811035, "global_step": 46658, "epoch": 1110} {"train_loss": -5.6488752365112305, "global_step": 46659, "epoch": 1110} {"train_loss": -5.72850227355957, "global_step": 46660, "epoch": 1110} {"train_loss": -5.7311026482355025, "global_step": 46661, "epoch": 1110, "val_loss": 74215.1328125} {"train_loss": -5.776963233947754, "global_step": 46662, "epoch": 1111} {"train_loss": -5.599538803100586, "global_step": 46663, "epoch": 1111} {"train_loss": -5.700164794921875, "global_step": 46664, "epoch": 1111} {"train_loss": -5.689032554626465, "global_step": 46665, "epoch": 1111} {"train_loss": -5.71619176864624, "global_step": 46666, "epoch": 1111} {"train_loss": -5.811823844909668, "global_step": 46667, "epoch": 1111} {"train_loss": -5.892805576324463, "global_step": 46668, "epoch": 1111} {"train_loss": -5.628154754638672, "global_step": 46669, "epoch": 1111} {"train_loss": -5.783088684082031, "global_step": 46670, "epoch": 1111} {"train_loss": -5.877784729003906, "global_step": 46671, "epoch": 1111} {"train_loss": -5.6842041015625, "global_step": 46672, "epoch": 1111} {"train_loss": -5.727054595947266, "global_step": 46673, "epoch": 1111} {"train_loss": -5.68317985534668, "global_step": 46674, "epoch": 1111} {"train_loss": -5.77412223815918, "global_step": 46675, "epoch": 1111} {"train_loss": -5.85101318359375, "global_step": 46676, "epoch": 1111} {"train_loss": -5.665975570678711, "global_step": 46677, "epoch": 1111} {"train_loss": -5.747716903686523, "global_step": 46678, "epoch": 1111} {"train_loss": -5.8102216720581055, "global_step": 46679, "epoch": 1111} {"train_loss": -5.781022071838379, "global_step": 46680, "epoch": 1111} {"train_loss": -5.882743835449219, "global_step": 46681, "epoch": 1111} {"train_loss": -5.748247146606445, "global_step": 46682, "epoch": 1111} {"train_loss": -5.755733013153076, "global_step": 46683, "epoch": 1111} {"train_loss": -5.805783271789551, "global_step": 46684, "epoch": 1111} {"train_loss": -5.814561367034912, "global_step": 46685, "epoch": 1111} {"train_loss": -5.694167613983154, "global_step": 46686, "epoch": 1111} {"train_loss": -5.589808940887451, "global_step": 46687, "epoch": 1111} {"train_loss": -5.682214736938477, "global_step": 46688, "epoch": 1111} {"train_loss": -5.731509208679199, "global_step": 46689, "epoch": 1111} {"train_loss": -5.646209239959717, "global_step": 46690, "epoch": 1111} {"train_loss": -5.678203105926514, "global_step": 46691, "epoch": 1111} {"train_loss": -5.773828506469727, "global_step": 46692, "epoch": 1111} {"train_loss": -5.724262237548828, "global_step": 46693, "epoch": 1111} {"train_loss": -5.787550926208496, "global_step": 46694, "epoch": 1111} {"train_loss": -5.7665557861328125, "global_step": 46695, "epoch": 1111} {"train_loss": -5.547966957092285, "global_step": 46696, "epoch": 1111} {"train_loss": -5.662352085113525, "global_step": 46697, "epoch": 1111} {"train_loss": -5.895678520202637, "global_step": 46698, "epoch": 1111} {"train_loss": -5.679162979125977, "global_step": 46699, "epoch": 1111} {"train_loss": -5.7978010177612305, "global_step": 46700, "epoch": 1111} {"train_loss": -5.711519241333008, "global_step": 46701, "epoch": 1111} {"train_loss": -5.633133888244629, "global_step": 46702, "epoch": 1111} {"train_loss": -5.734416155588059, "global_step": 46703, "epoch": 1111, "val_loss": 74319.1953125} {"train_loss": -5.672798156738281, "global_step": 46704, "epoch": 1112} {"train_loss": -5.744805335998535, "global_step": 46705, "epoch": 1112} {"train_loss": -5.679754734039307, "global_step": 46706, "epoch": 1112} {"train_loss": -5.6233110427856445, "global_step": 46707, "epoch": 1112} {"train_loss": -5.744233131408691, "global_step": 46708, "epoch": 1112} {"train_loss": -5.671015739440918, "global_step": 46709, "epoch": 1112} {"train_loss": -5.6875433921813965, "global_step": 46710, "epoch": 1112} {"train_loss": -5.734297275543213, "global_step": 46711, "epoch": 1112} {"train_loss": -5.706372261047363, "global_step": 46712, "epoch": 1112} {"train_loss": -5.689111709594727, "global_step": 46713, "epoch": 1112} {"train_loss": -5.646234512329102, "global_step": 46714, "epoch": 1112} {"train_loss": -5.719379901885986, "global_step": 46715, "epoch": 1112} {"train_loss": -5.758752822875977, "global_step": 46716, "epoch": 1112} {"train_loss": -5.793430328369141, "global_step": 46717, "epoch": 1112} {"train_loss": -5.796770095825195, "global_step": 46718, "epoch": 1112} {"train_loss": -5.534134864807129, "global_step": 46719, "epoch": 1112} {"train_loss": -5.508762359619141, "global_step": 46720, "epoch": 1112} {"train_loss": -5.791049003601074, "global_step": 46721, "epoch": 1112} {"train_loss": -5.547008514404297, "global_step": 46722, "epoch": 1112} {"train_loss": -5.7094879150390625, "global_step": 46723, "epoch": 1112} {"train_loss": -5.659211158752441, "global_step": 46724, "epoch": 1112} {"train_loss": -5.592866897583008, "global_step": 46725, "epoch": 1112} {"train_loss": -5.600948333740234, "global_step": 46726, "epoch": 1112} {"train_loss": -5.7471747398376465, "global_step": 46727, "epoch": 1112} {"train_loss": -5.584939956665039, "global_step": 46728, "epoch": 1112} {"train_loss": -5.538985252380371, "global_step": 46729, "epoch": 1112} {"train_loss": -5.715421199798584, "global_step": 46730, "epoch": 1112} {"train_loss": -5.66080904006958, "global_step": 46731, "epoch": 1112} {"train_loss": -5.442881107330322, "global_step": 46732, "epoch": 1112} {"train_loss": -5.72696590423584, "global_step": 46733, "epoch": 1112} {"train_loss": -5.577123641967773, "global_step": 46734, "epoch": 1112} {"train_loss": -5.764634609222412, "global_step": 46735, "epoch": 1112} {"train_loss": -5.623525619506836, "global_step": 46736, "epoch": 1112} {"train_loss": -5.599319934844971, "global_step": 46737, "epoch": 1112} {"train_loss": -5.748157501220703, "global_step": 46738, "epoch": 1112} {"train_loss": -5.676974296569824, "global_step": 46739, "epoch": 1112} {"train_loss": -5.652217864990234, "global_step": 46740, "epoch": 1112} {"train_loss": -5.735126972198486, "global_step": 46741, "epoch": 1112} {"train_loss": -5.77080774307251, "global_step": 46742, "epoch": 1112} {"train_loss": -5.711114883422852, "global_step": 46743, "epoch": 1112} {"train_loss": -5.645845890045166, "global_step": 46744, "epoch": 1112} {"train_loss": -5.673298756281535, "global_step": 46745, "epoch": 1112, "val_loss": 74449.8046875} {"train_loss": -5.606491565704346, "global_step": 46746, "epoch": 1113} {"train_loss": -5.775630950927734, "global_step": 46747, "epoch": 1113} {"train_loss": -5.681501388549805, "global_step": 46748, "epoch": 1113} {"train_loss": -5.739824295043945, "global_step": 46749, "epoch": 1113} {"train_loss": -5.7645649909973145, "global_step": 46750, "epoch": 1113} {"train_loss": -5.603498458862305, "global_step": 46751, "epoch": 1113} {"train_loss": -5.685568809509277, "global_step": 46752, "epoch": 1113} {"train_loss": -5.6782097816467285, "global_step": 46753, "epoch": 1113} {"train_loss": -5.652310371398926, "global_step": 46754, "epoch": 1113} {"train_loss": -5.49996280670166, "global_step": 46755, "epoch": 1113} {"train_loss": -5.726083278656006, "global_step": 46756, "epoch": 1113} {"train_loss": -5.688784599304199, "global_step": 46757, "epoch": 1113} {"train_loss": -5.788332939147949, "global_step": 46758, "epoch": 1113} {"train_loss": -5.670869827270508, "global_step": 46759, "epoch": 1113} {"train_loss": -5.601874828338623, "global_step": 46760, "epoch": 1113} {"train_loss": -5.615815162658691, "global_step": 46761, "epoch": 1113} {"train_loss": -5.8064446449279785, "global_step": 46762, "epoch": 1113} {"train_loss": -5.570418357849121, "global_step": 46763, "epoch": 1113} {"train_loss": -5.558504581451416, "global_step": 46764, "epoch": 1113} {"train_loss": -5.512303829193115, "global_step": 46765, "epoch": 1113} {"train_loss": -5.642337799072266, "global_step": 46766, "epoch": 1113} {"train_loss": -5.660100936889648, "global_step": 46767, "epoch": 1113} {"train_loss": -5.5569610595703125, "global_step": 46768, "epoch": 1113} {"train_loss": -5.64592170715332, "global_step": 46769, "epoch": 1113} {"train_loss": -5.534348487854004, "global_step": 46770, "epoch": 1113} {"train_loss": -5.928145408630371, "global_step": 46771, "epoch": 1113} {"train_loss": -5.708154678344727, "global_step": 46772, "epoch": 1113} {"train_loss": -5.6549072265625, "global_step": 46773, "epoch": 1113} {"train_loss": -5.735909461975098, "global_step": 46774, "epoch": 1113} {"train_loss": -5.681868076324463, "global_step": 46775, "epoch": 1113} {"train_loss": -5.785297870635986, "global_step": 46776, "epoch": 1113} {"train_loss": -5.887727737426758, "global_step": 46777, "epoch": 1113} {"train_loss": -5.723393440246582, "global_step": 46778, "epoch": 1113} {"train_loss": -5.786985397338867, "global_step": 46779, "epoch": 1113} {"train_loss": -5.750327110290527, "global_step": 46780, "epoch": 1113} {"train_loss": -5.829301834106445, "global_step": 46781, "epoch": 1113} {"train_loss": -5.751869201660156, "global_step": 46782, "epoch": 1113} {"train_loss": -5.711244106292725, "global_step": 46783, "epoch": 1113} {"train_loss": -5.8035478591918945, "global_step": 46784, "epoch": 1113} {"train_loss": -5.653434753417969, "global_step": 46785, "epoch": 1113} {"train_loss": -5.714831829071045, "global_step": 46786, "epoch": 1113} {"train_loss": -5.693978741055443, "global_step": 46787, "epoch": 1113, "val_loss": 74118.1484375} {"train_loss": -5.689054489135742, "global_step": 46788, "epoch": 1114} {"train_loss": -5.649299621582031, "global_step": 46789, "epoch": 1114} {"train_loss": -5.644740104675293, "global_step": 46790, "epoch": 1114} {"train_loss": -5.784913063049316, "global_step": 46791, "epoch": 1114} {"train_loss": -5.617987632751465, "global_step": 46792, "epoch": 1114} {"train_loss": -5.818785667419434, "global_step": 46793, "epoch": 1114} {"train_loss": -5.635140419006348, "global_step": 46794, "epoch": 1114} {"train_loss": -5.6963276863098145, "global_step": 46795, "epoch": 1114} {"train_loss": -5.644269943237305, "global_step": 46796, "epoch": 1114} {"train_loss": -5.724913120269775, "global_step": 46797, "epoch": 1114} {"train_loss": -5.807918071746826, "global_step": 46798, "epoch": 1114} {"train_loss": -5.695176601409912, "global_step": 46799, "epoch": 1114} {"train_loss": -5.646218299865723, "global_step": 46800, "epoch": 1114} {"train_loss": -5.746439456939697, "global_step": 46801, "epoch": 1114} {"train_loss": -5.669861793518066, "global_step": 46802, "epoch": 1114} {"train_loss": -5.628260612487793, "global_step": 46803, "epoch": 1114} {"train_loss": -5.65629768371582, "global_step": 46804, "epoch": 1114} {"train_loss": -5.621132850646973, "global_step": 46805, "epoch": 1114} {"train_loss": -5.7339558601379395, "global_step": 46806, "epoch": 1114} {"train_loss": -5.680551528930664, "global_step": 46807, "epoch": 1114} {"train_loss": -5.718474388122559, "global_step": 46808, "epoch": 1114} {"train_loss": -5.624663352966309, "global_step": 46809, "epoch": 1114} {"train_loss": -5.571059226989746, "global_step": 46810, "epoch": 1114} {"train_loss": -5.758776664733887, "global_step": 46811, "epoch": 1114} {"train_loss": -5.496666431427002, "global_step": 46812, "epoch": 1114} {"train_loss": -5.643192768096924, "global_step": 46813, "epoch": 1114} {"train_loss": -5.655608177185059, "global_step": 46814, "epoch": 1114} {"train_loss": -5.561783790588379, "global_step": 46815, "epoch": 1114} {"train_loss": -5.690641403198242, "global_step": 46816, "epoch": 1114} {"train_loss": -5.575732707977295, "global_step": 46817, "epoch": 1114} {"train_loss": -5.665129661560059, "global_step": 46818, "epoch": 1114} {"train_loss": -5.605624198913574, "global_step": 46819, "epoch": 1114} {"train_loss": -5.541788101196289, "global_step": 46820, "epoch": 1114} {"train_loss": -5.583956241607666, "global_step": 46821, "epoch": 1114} {"train_loss": -5.6112961769104, "global_step": 46822, "epoch": 1114} {"train_loss": -5.740113258361816, "global_step": 46823, "epoch": 1114} {"train_loss": -5.660072326660156, "global_step": 46824, "epoch": 1114} {"train_loss": -5.712789058685303, "global_step": 46825, "epoch": 1114} {"train_loss": -5.508847236633301, "global_step": 46826, "epoch": 1114} {"train_loss": -5.686676025390625, "global_step": 46827, "epoch": 1114} {"train_loss": -5.5649871826171875, "global_step": 46828, "epoch": 1114} {"train_loss": -5.656674260184879, "global_step": 46829, "epoch": 1114, "val_loss": 74122.765625} {"train_loss": -5.5093817710876465, "global_step": 46830, "epoch": 1115} {"train_loss": -5.516490459442139, "global_step": 46831, "epoch": 1115} {"train_loss": -5.689142227172852, "global_step": 46832, "epoch": 1115} {"train_loss": -5.565217971801758, "global_step": 46833, "epoch": 1115} {"train_loss": -5.699476718902588, "global_step": 46834, "epoch": 1115} {"train_loss": -5.619756698608398, "global_step": 46835, "epoch": 1115} {"train_loss": -5.675527095794678, "global_step": 46836, "epoch": 1115} {"train_loss": -5.607147693634033, "global_step": 46837, "epoch": 1115} {"train_loss": -5.749239444732666, "global_step": 46838, "epoch": 1115} {"train_loss": -5.584068298339844, "global_step": 46839, "epoch": 1115} {"train_loss": -5.630671977996826, "global_step": 46840, "epoch": 1115} {"train_loss": -5.656314849853516, "global_step": 46841, "epoch": 1115} {"train_loss": -5.636305809020996, "global_step": 46842, "epoch": 1115} {"train_loss": -5.627260208129883, "global_step": 46843, "epoch": 1115} {"train_loss": -5.698558807373047, "global_step": 46844, "epoch": 1115} {"train_loss": -5.6801581382751465, "global_step": 46845, "epoch": 1115} {"train_loss": -5.707253932952881, "global_step": 46846, "epoch": 1115} {"train_loss": -5.812285423278809, "global_step": 46847, "epoch": 1115} {"train_loss": -5.700141429901123, "global_step": 46848, "epoch": 1115} {"train_loss": -5.782500743865967, "global_step": 46849, "epoch": 1115} {"train_loss": -5.836723327636719, "global_step": 46850, "epoch": 1115} {"train_loss": -5.798419952392578, "global_step": 46851, "epoch": 1115} {"train_loss": -5.740640640258789, "global_step": 46852, "epoch": 1115} {"train_loss": -5.621715545654297, "global_step": 46853, "epoch": 1115} {"train_loss": -5.7736430168151855, "global_step": 46854, "epoch": 1115} {"train_loss": -5.665082931518555, "global_step": 46855, "epoch": 1115} {"train_loss": -5.749734878540039, "global_step": 46856, "epoch": 1115} {"train_loss": -5.729977130889893, "global_step": 46857, "epoch": 1115} {"train_loss": -5.744237899780273, "global_step": 46858, "epoch": 1115} {"train_loss": -5.81566858291626, "global_step": 46859, "epoch": 1115} {"train_loss": -5.676252365112305, "global_step": 46860, "epoch": 1115} {"train_loss": -5.613781452178955, "global_step": 46861, "epoch": 1115} {"train_loss": -5.640045642852783, "global_step": 46862, "epoch": 1115} {"train_loss": -5.774381160736084, "global_step": 46863, "epoch": 1115} {"train_loss": -5.778897285461426, "global_step": 46864, "epoch": 1115} {"train_loss": -5.675413608551025, "global_step": 46865, "epoch": 1115} {"train_loss": -5.696235656738281, "global_step": 46866, "epoch": 1115} {"train_loss": -5.688661575317383, "global_step": 46867, "epoch": 1115} {"train_loss": -5.681118488311768, "global_step": 46868, "epoch": 1115} {"train_loss": -5.764284133911133, "global_step": 46869, "epoch": 1115} {"train_loss": -5.727952480316162, "global_step": 46870, "epoch": 1115} {"train_loss": -5.691119035085042, "global_step": 46871, "epoch": 1115, "val_loss": 74005.84375} {"train_loss": -5.750510215759277, "global_step": 46872, "epoch": 1116} {"train_loss": -5.816127300262451, "global_step": 46873, "epoch": 1116} {"train_loss": -5.604565143585205, "global_step": 46874, "epoch": 1116} {"train_loss": -5.7238359451293945, "global_step": 46875, "epoch": 1116} {"train_loss": -5.803367614746094, "global_step": 46876, "epoch": 1116} {"train_loss": -5.716373920440674, "global_step": 46877, "epoch": 1116} {"train_loss": -5.685690402984619, "global_step": 46878, "epoch": 1116} {"train_loss": -5.716677665710449, "global_step": 46879, "epoch": 1116} {"train_loss": -5.671184539794922, "global_step": 46880, "epoch": 1116} {"train_loss": -5.710740566253662, "global_step": 46881, "epoch": 1116} {"train_loss": -5.767487525939941, "global_step": 46882, "epoch": 1116} {"train_loss": -5.692826747894287, "global_step": 46883, "epoch": 1116} {"train_loss": -5.808612823486328, "global_step": 46884, "epoch": 1116} {"train_loss": -5.806344985961914, "global_step": 46885, "epoch": 1116} {"train_loss": -5.6881561279296875, "global_step": 46886, "epoch": 1116} {"train_loss": -5.732666492462158, "global_step": 46887, "epoch": 1116} {"train_loss": -5.73009729385376, "global_step": 46888, "epoch": 1116} {"train_loss": -5.6703715324401855, "global_step": 46889, "epoch": 1116} {"train_loss": -5.753501892089844, "global_step": 46890, "epoch": 1116} {"train_loss": -5.689363479614258, "global_step": 46891, "epoch": 1116} {"train_loss": -5.755498886108398, "global_step": 46892, "epoch": 1116} {"train_loss": -5.75309944152832, "global_step": 46893, "epoch": 1116} {"train_loss": -5.746589660644531, "global_step": 46894, "epoch": 1116} {"train_loss": -5.631889343261719, "global_step": 46895, "epoch": 1116} {"train_loss": -5.730422496795654, "global_step": 46896, "epoch": 1116} {"train_loss": -5.7517828941345215, "global_step": 46897, "epoch": 1116} {"train_loss": -5.712677001953125, "global_step": 46898, "epoch": 1116} {"train_loss": -5.558091163635254, "global_step": 46899, "epoch": 1116} {"train_loss": -5.66916036605835, "global_step": 46900, "epoch": 1116} {"train_loss": -5.7095866203308105, "global_step": 46901, "epoch": 1116} {"train_loss": -5.763348579406738, "global_step": 46902, "epoch": 1116} {"train_loss": -5.589719772338867, "global_step": 46903, "epoch": 1116} {"train_loss": -5.738327503204346, "global_step": 46904, "epoch": 1116} {"train_loss": -5.618204116821289, "global_step": 46905, "epoch": 1116} {"train_loss": -5.683524131774902, "global_step": 46906, "epoch": 1116} {"train_loss": -5.704150199890137, "global_step": 46907, "epoch": 1116} {"train_loss": -5.7001872062683105, "global_step": 46908, "epoch": 1116} {"train_loss": -5.802079677581787, "global_step": 46909, "epoch": 1116} {"train_loss": -5.793004989624023, "global_step": 46910, "epoch": 1116} {"train_loss": -5.6689324378967285, "global_step": 46911, "epoch": 1116} {"train_loss": -5.679957866668701, "global_step": 46912, "epoch": 1116} {"train_loss": -5.709057694389706, "global_step": 46913, "epoch": 1116, "val_loss": 74421.2578125} {"train_loss": -5.609684944152832, "global_step": 46914, "epoch": 1117} {"train_loss": -5.789071559906006, "global_step": 46915, "epoch": 1117} {"train_loss": -5.668498992919922, "global_step": 46916, "epoch": 1117} {"train_loss": -5.826363563537598, "global_step": 46917, "epoch": 1117} {"train_loss": -5.546817302703857, "global_step": 46918, "epoch": 1117} {"train_loss": -5.690555572509766, "global_step": 46919, "epoch": 1117} {"train_loss": -5.606060028076172, "global_step": 46920, "epoch": 1117} {"train_loss": -5.584258079528809, "global_step": 46921, "epoch": 1117} {"train_loss": -5.736064434051514, "global_step": 46922, "epoch": 1117} {"train_loss": -5.67436408996582, "global_step": 46923, "epoch": 1117} {"train_loss": -5.702149391174316, "global_step": 46924, "epoch": 1117} {"train_loss": -5.604734897613525, "global_step": 46925, "epoch": 1117} {"train_loss": -5.638795375823975, "global_step": 46926, "epoch": 1117} {"train_loss": -5.709155082702637, "global_step": 46927, "epoch": 1117} {"train_loss": -5.61309814453125, "global_step": 46928, "epoch": 1117} {"train_loss": -5.618696212768555, "global_step": 46929, "epoch": 1117} {"train_loss": -5.768671989440918, "global_step": 46930, "epoch": 1117} {"train_loss": -5.705864906311035, "global_step": 46931, "epoch": 1117} {"train_loss": -5.797993183135986, "global_step": 46932, "epoch": 1117} {"train_loss": -5.554296016693115, "global_step": 46933, "epoch": 1117} {"train_loss": -5.749687671661377, "global_step": 46934, "epoch": 1117} {"train_loss": -5.7500176429748535, "global_step": 46935, "epoch": 1117} {"train_loss": -5.690991401672363, "global_step": 46936, "epoch": 1117} {"train_loss": -5.781064987182617, "global_step": 46937, "epoch": 1117} {"train_loss": -5.683510780334473, "global_step": 46938, "epoch": 1117} {"train_loss": -5.735781192779541, "global_step": 46939, "epoch": 1117} {"train_loss": -5.76834774017334, "global_step": 46940, "epoch": 1117} {"train_loss": -5.839895248413086, "global_step": 46941, "epoch": 1117} {"train_loss": -5.678759574890137, "global_step": 46942, "epoch": 1117} {"train_loss": -5.724761962890625, "global_step": 46943, "epoch": 1117} {"train_loss": -5.748247146606445, "global_step": 46944, "epoch": 1117} {"train_loss": -5.751332759857178, "global_step": 46945, "epoch": 1117} {"train_loss": -5.6294264793396, "global_step": 46946, "epoch": 1117} {"train_loss": -5.6464948654174805, "global_step": 46947, "epoch": 1117} {"train_loss": -5.830297470092773, "global_step": 46948, "epoch": 1117} {"train_loss": -5.716172695159912, "global_step": 46949, "epoch": 1117} {"train_loss": -5.783651351928711, "global_step": 46950, "epoch": 1117} {"train_loss": -5.765398025512695, "global_step": 46951, "epoch": 1117} {"train_loss": -5.7699480056762695, "global_step": 46952, "epoch": 1117} {"train_loss": -5.851950645446777, "global_step": 46953, "epoch": 1117} {"train_loss": -5.667703628540039, "global_step": 46954, "epoch": 1117} {"train_loss": -5.706261612120128, "global_step": 46955, "epoch": 1117, "val_loss": 73871.7109375} {"train_loss": -5.796870231628418, "global_step": 46956, "epoch": 1118} {"train_loss": -5.617918014526367, "global_step": 46957, "epoch": 1118} {"train_loss": -5.703708648681641, "global_step": 46958, "epoch": 1118} {"train_loss": -5.75364351272583, "global_step": 46959, "epoch": 1118} {"train_loss": -5.796958923339844, "global_step": 46960, "epoch": 1118} {"train_loss": -5.5060577392578125, "global_step": 46961, "epoch": 1118} {"train_loss": -5.568338394165039, "global_step": 46962, "epoch": 1118} {"train_loss": -5.7028045654296875, "global_step": 46963, "epoch": 1118} {"train_loss": -5.670316219329834, "global_step": 46964, "epoch": 1118} {"train_loss": -5.643210411071777, "global_step": 46965, "epoch": 1118} {"train_loss": -5.749248504638672, "global_step": 46966, "epoch": 1118} {"train_loss": -5.6087212562561035, "global_step": 46967, "epoch": 1118} {"train_loss": -5.730111122131348, "global_step": 46968, "epoch": 1118} {"train_loss": -5.738890647888184, "global_step": 46969, "epoch": 1118} {"train_loss": -5.580547332763672, "global_step": 46970, "epoch": 1118} {"train_loss": -5.686336517333984, "global_step": 46971, "epoch": 1118} {"train_loss": -5.6559739112854, "global_step": 46972, "epoch": 1118} {"train_loss": -5.740024089813232, "global_step": 46973, "epoch": 1118} {"train_loss": -5.560855865478516, "global_step": 46974, "epoch": 1118} {"train_loss": -5.597670555114746, "global_step": 46975, "epoch": 1118} {"train_loss": -5.69669771194458, "global_step": 46976, "epoch": 1118} {"train_loss": -5.6517839431762695, "global_step": 46977, "epoch": 1118} {"train_loss": -5.734011650085449, "global_step": 46978, "epoch": 1118} {"train_loss": -5.708099842071533, "global_step": 46979, "epoch": 1118} {"train_loss": -5.780478000640869, "global_step": 46980, "epoch": 1118} {"train_loss": -5.6443634033203125, "global_step": 46981, "epoch": 1118} {"train_loss": -5.659610748291016, "global_step": 46982, "epoch": 1118} {"train_loss": -5.714465141296387, "global_step": 46983, "epoch": 1118} {"train_loss": -5.615211009979248, "global_step": 46984, "epoch": 1118} {"train_loss": -5.739335060119629, "global_step": 46985, "epoch": 1118} {"train_loss": -5.6998748779296875, "global_step": 46986, "epoch": 1118} {"train_loss": -5.7784881591796875, "global_step": 46987, "epoch": 1118} {"train_loss": -5.689785003662109, "global_step": 46988, "epoch": 1118} {"train_loss": -5.60979700088501, "global_step": 46989, "epoch": 1118} {"train_loss": -5.78181266784668, "global_step": 46990, "epoch": 1118} {"train_loss": -5.8756256103515625, "global_step": 46991, "epoch": 1118} {"train_loss": -5.8029890060424805, "global_step": 46992, "epoch": 1118} {"train_loss": -5.709827899932861, "global_step": 46993, "epoch": 1118} {"train_loss": -5.7785515785217285, "global_step": 46994, "epoch": 1118} {"train_loss": -5.685471534729004, "global_step": 46995, "epoch": 1118} {"train_loss": -5.777873992919922, "global_step": 46996, "epoch": 1118} {"train_loss": -5.697779723576137, "global_step": 46997, "epoch": 1118, "val_loss": 74346.6328125} {"train_loss": -5.783498764038086, "global_step": 46998, "epoch": 1119} {"train_loss": -5.709410667419434, "global_step": 46999, "epoch": 1119} {"train_loss": -5.777379035949707, "global_step": 47000, "epoch": 1119} {"train_loss": -5.763309478759766, "global_step": 47001, "epoch": 1119} {"train_loss": -5.7921247482299805, "global_step": 47002, "epoch": 1119} {"train_loss": -5.760486602783203, "global_step": 47003, "epoch": 1119} {"train_loss": -5.664714813232422, "global_step": 47004, "epoch": 1119} {"train_loss": -5.8169846534729, "global_step": 47005, "epoch": 1119} {"train_loss": -5.649885654449463, "global_step": 47006, "epoch": 1119} {"train_loss": -5.752048969268799, "global_step": 47007, "epoch": 1119} {"train_loss": -5.816544055938721, "global_step": 47008, "epoch": 1119} {"train_loss": -5.766506195068359, "global_step": 47009, "epoch": 1119} {"train_loss": -5.8509674072265625, "global_step": 47010, "epoch": 1119} {"train_loss": -5.745240688323975, "global_step": 47011, "epoch": 1119} {"train_loss": -5.744415283203125, "global_step": 47012, "epoch": 1119} {"train_loss": -5.823166847229004, "global_step": 47013, "epoch": 1119} {"train_loss": -5.839766979217529, "global_step": 47014, "epoch": 1119} {"train_loss": -5.7612528800964355, "global_step": 47015, "epoch": 1119} {"train_loss": -5.694957733154297, "global_step": 47016, "epoch": 1119} {"train_loss": -5.681518077850342, "global_step": 47017, "epoch": 1119} {"train_loss": -5.87301778793335, "global_step": 47018, "epoch": 1119} {"train_loss": -5.780650615692139, "global_step": 47019, "epoch": 1119} {"train_loss": -5.731555938720703, "global_step": 47020, "epoch": 1119} {"train_loss": -5.694212436676025, "global_step": 47021, "epoch": 1119} {"train_loss": -5.695106506347656, "global_step": 47022, "epoch": 1119} {"train_loss": -5.670456886291504, "global_step": 47023, "epoch": 1119} {"train_loss": -5.825752258300781, "global_step": 47024, "epoch": 1119} {"train_loss": -5.853562831878662, "global_step": 47025, "epoch": 1119} {"train_loss": -5.666094779968262, "global_step": 47026, "epoch": 1119} {"train_loss": -5.608377456665039, "global_step": 47027, "epoch": 1119} {"train_loss": -5.6741251945495605, "global_step": 47028, "epoch": 1119} {"train_loss": -5.76896858215332, "global_step": 47029, "epoch": 1119} {"train_loss": -5.7616095542907715, "global_step": 47030, "epoch": 1119} {"train_loss": -5.778679847717285, "global_step": 47031, "epoch": 1119} {"train_loss": -5.840517044067383, "global_step": 47032, "epoch": 1119} {"train_loss": -5.775534629821777, "global_step": 47033, "epoch": 1119} {"train_loss": -5.768715858459473, "global_step": 47034, "epoch": 1119} {"train_loss": -5.668445587158203, "global_step": 47035, "epoch": 1119} {"train_loss": -5.687212944030762, "global_step": 47036, "epoch": 1119} {"train_loss": -5.830697536468506, "global_step": 47037, "epoch": 1119} {"train_loss": -5.792181968688965, "global_step": 47038, "epoch": 1119} {"train_loss": -5.753407444272723, "global_step": 47039, "epoch": 1119, "val_loss": 74113.15625} {"train_loss": -5.645257949829102, "global_step": 47040, "epoch": 1120} {"train_loss": -5.806984901428223, "global_step": 47041, "epoch": 1120} {"train_loss": -5.738414287567139, "global_step": 47042, "epoch": 1120} {"train_loss": -5.667521953582764, "global_step": 47043, "epoch": 1120} {"train_loss": -5.71230411529541, "global_step": 47044, "epoch": 1120} {"train_loss": -5.830379486083984, "global_step": 47045, "epoch": 1120} {"train_loss": -5.652266502380371, "global_step": 47046, "epoch": 1120} {"train_loss": -5.622827053070068, "global_step": 47047, "epoch": 1120} {"train_loss": -5.653764724731445, "global_step": 47048, "epoch": 1120} {"train_loss": -5.709493637084961, "global_step": 47049, "epoch": 1120} {"train_loss": -5.689411163330078, "global_step": 47050, "epoch": 1120} {"train_loss": -5.667638778686523, "global_step": 47051, "epoch": 1120} {"train_loss": -5.672306537628174, "global_step": 47052, "epoch": 1120} {"train_loss": -5.6958909034729, "global_step": 47053, "epoch": 1120} {"train_loss": -5.681140899658203, "global_step": 47054, "epoch": 1120} {"train_loss": -5.786147594451904, "global_step": 47055, "epoch": 1120} {"train_loss": -5.562900066375732, "global_step": 47056, "epoch": 1120} {"train_loss": -5.78986930847168, "global_step": 47057, "epoch": 1120} {"train_loss": -5.618247985839844, "global_step": 47058, "epoch": 1120} {"train_loss": -5.74114465713501, "global_step": 47059, "epoch": 1120} {"train_loss": -5.742408752441406, "global_step": 47060, "epoch": 1120} {"train_loss": -5.650681495666504, "global_step": 47061, "epoch": 1120} {"train_loss": -5.69687557220459, "global_step": 47062, "epoch": 1120} {"train_loss": -5.635528564453125, "global_step": 47063, "epoch": 1120} {"train_loss": -5.6625776290893555, "global_step": 47064, "epoch": 1120} {"train_loss": -5.733888626098633, "global_step": 47065, "epoch": 1120} {"train_loss": -5.614867210388184, "global_step": 47066, "epoch": 1120} {"train_loss": -5.766111373901367, "global_step": 47067, "epoch": 1120} {"train_loss": -5.673759460449219, "global_step": 47068, "epoch": 1120} {"train_loss": -5.725680351257324, "global_step": 47069, "epoch": 1120} {"train_loss": -5.70808219909668, "global_step": 47070, "epoch": 1120} {"train_loss": -5.782605171203613, "global_step": 47071, "epoch": 1120} {"train_loss": -5.651134014129639, "global_step": 47072, "epoch": 1120} {"train_loss": -5.713024139404297, "global_step": 47073, "epoch": 1120} {"train_loss": -5.703077793121338, "global_step": 47074, "epoch": 1120} {"train_loss": -5.636187553405762, "global_step": 47075, "epoch": 1120} {"train_loss": -5.862003803253174, "global_step": 47076, "epoch": 1120} {"train_loss": -5.909873008728027, "global_step": 47077, "epoch": 1120} {"train_loss": -5.835602283477783, "global_step": 47078, "epoch": 1120} {"train_loss": -5.8761491775512695, "global_step": 47079, "epoch": 1120} {"train_loss": -5.663042068481445, "global_step": 47080, "epoch": 1120} {"train_loss": -5.711172058468773, "global_step": 47081, "epoch": 1120, "val_loss": 74158.7890625} {"train_loss": -5.690503120422363, "global_step": 47082, "epoch": 1121} {"train_loss": -5.648462295532227, "global_step": 47083, "epoch": 1121} {"train_loss": -5.609353065490723, "global_step": 47084, "epoch": 1121} {"train_loss": -5.496189117431641, "global_step": 47085, "epoch": 1121} {"train_loss": -5.733059883117676, "global_step": 47086, "epoch": 1121} {"train_loss": -5.7961745262146, "global_step": 47087, "epoch": 1121} {"train_loss": -5.680777072906494, "global_step": 47088, "epoch": 1121} {"train_loss": -5.680577278137207, "global_step": 47089, "epoch": 1121} {"train_loss": -5.742733001708984, "global_step": 47090, "epoch": 1121} {"train_loss": -5.706411838531494, "global_step": 47091, "epoch": 1121} {"train_loss": -5.7656755447387695, "global_step": 47092, "epoch": 1121} {"train_loss": -5.628196716308594, "global_step": 47093, "epoch": 1121} {"train_loss": -5.751931190490723, "global_step": 47094, "epoch": 1121} {"train_loss": -5.796538352966309, "global_step": 47095, "epoch": 1121} {"train_loss": -5.806400299072266, "global_step": 47096, "epoch": 1121} {"train_loss": -5.707453727722168, "global_step": 47097, "epoch": 1121} {"train_loss": -5.641289710998535, "global_step": 47098, "epoch": 1121} {"train_loss": -5.859679222106934, "global_step": 47099, "epoch": 1121} {"train_loss": -5.697678089141846, "global_step": 47100, "epoch": 1121} {"train_loss": -5.70699405670166, "global_step": 47101, "epoch": 1121} {"train_loss": -5.851876735687256, "global_step": 47102, "epoch": 1121} {"train_loss": -5.668881416320801, "global_step": 47103, "epoch": 1121} {"train_loss": -5.686341762542725, "global_step": 47104, "epoch": 1121} {"train_loss": -5.540139675140381, "global_step": 47105, "epoch": 1121} {"train_loss": -5.723238945007324, "global_step": 47106, "epoch": 1121} {"train_loss": -5.733584403991699, "global_step": 47107, "epoch": 1121} {"train_loss": -5.784436225891113, "global_step": 47108, "epoch": 1121} {"train_loss": -5.863929748535156, "global_step": 47109, "epoch": 1121} {"train_loss": -5.878912448883057, "global_step": 47110, "epoch": 1121} {"train_loss": -5.807655334472656, "global_step": 47111, "epoch": 1121} {"train_loss": -5.7552361488342285, "global_step": 47112, "epoch": 1121} {"train_loss": -5.6531171798706055, "global_step": 47113, "epoch": 1121} {"train_loss": -5.776925563812256, "global_step": 47114, "epoch": 1121} {"train_loss": -5.625196933746338, "global_step": 47115, "epoch": 1121} {"train_loss": -5.800324440002441, "global_step": 47116, "epoch": 1121} {"train_loss": -5.7705230712890625, "global_step": 47117, "epoch": 1121} {"train_loss": -5.777301788330078, "global_step": 47118, "epoch": 1121} {"train_loss": -5.7694783210754395, "global_step": 47119, "epoch": 1121} {"train_loss": -5.662342548370361, "global_step": 47120, "epoch": 1121} {"train_loss": -5.840181827545166, "global_step": 47121, "epoch": 1121} {"train_loss": -5.756423473358154, "global_step": 47122, "epoch": 1121} {"train_loss": -5.727587370645432, "global_step": 47123, "epoch": 1121, "val_loss": 73978.421875} {"train_loss": -5.741942882537842, "global_step": 47124, "epoch": 1122} {"train_loss": -5.7632246017456055, "global_step": 47125, "epoch": 1122} {"train_loss": -5.711925506591797, "global_step": 47126, "epoch": 1122} {"train_loss": -5.811012268066406, "global_step": 47127, "epoch": 1122} {"train_loss": -5.728652000427246, "global_step": 47128, "epoch": 1122} {"train_loss": -5.671804904937744, "global_step": 47129, "epoch": 1122} {"train_loss": -5.908539295196533, "global_step": 47130, "epoch": 1122} {"train_loss": -5.824347496032715, "global_step": 47131, "epoch": 1122} {"train_loss": -5.724445819854736, "global_step": 47132, "epoch": 1122} {"train_loss": -5.8139801025390625, "global_step": 47133, "epoch": 1122} {"train_loss": -5.765985012054443, "global_step": 47134, "epoch": 1122} {"train_loss": -5.748776435852051, "global_step": 47135, "epoch": 1122} {"train_loss": -5.7326154708862305, "global_step": 47136, "epoch": 1122} {"train_loss": -5.77242374420166, "global_step": 47137, "epoch": 1122} {"train_loss": -5.925015449523926, "global_step": 47138, "epoch": 1122} {"train_loss": -5.763441562652588, "global_step": 47139, "epoch": 1122} {"train_loss": -5.7200469970703125, "global_step": 47140, "epoch": 1122} {"train_loss": -5.735707759857178, "global_step": 47141, "epoch": 1122} {"train_loss": -5.723173141479492, "global_step": 47142, "epoch": 1122} {"train_loss": -5.798171043395996, "global_step": 47143, "epoch": 1122} {"train_loss": -5.730452537536621, "global_step": 47144, "epoch": 1122} {"train_loss": -5.7154622077941895, "global_step": 47145, "epoch": 1122} {"train_loss": -5.805601119995117, "global_step": 47146, "epoch": 1122} {"train_loss": -5.798172950744629, "global_step": 47147, "epoch": 1122} {"train_loss": -5.775794506072998, "global_step": 47148, "epoch": 1122} {"train_loss": -5.73944091796875, "global_step": 47149, "epoch": 1122} {"train_loss": -5.567994594573975, "global_step": 47150, "epoch": 1122} {"train_loss": -5.700972080230713, "global_step": 47151, "epoch": 1122} {"train_loss": -5.584790229797363, "global_step": 47152, "epoch": 1122} {"train_loss": -5.688738822937012, "global_step": 47153, "epoch": 1122} {"train_loss": -5.776677131652832, "global_step": 47154, "epoch": 1122} {"train_loss": -5.758878707885742, "global_step": 47155, "epoch": 1122} {"train_loss": -5.700606346130371, "global_step": 47156, "epoch": 1122} {"train_loss": -5.714258193969727, "global_step": 47157, "epoch": 1122} {"train_loss": -5.750480651855469, "global_step": 47158, "epoch": 1122} {"train_loss": -5.752918720245361, "global_step": 47159, "epoch": 1122} {"train_loss": -5.728090763092041, "global_step": 47160, "epoch": 1122} {"train_loss": -5.694218158721924, "global_step": 47161, "epoch": 1122} {"train_loss": -5.794702053070068, "global_step": 47162, "epoch": 1122} {"train_loss": -5.803518295288086, "global_step": 47163, "epoch": 1122} {"train_loss": -5.677419185638428, "global_step": 47164, "epoch": 1122} {"train_loss": -5.748637585412888, "global_step": 47165, "epoch": 1122, "val_loss": 74083.578125} {"train_loss": -5.8956828117370605, "global_step": 47166, "epoch": 1123} {"train_loss": -5.613155841827393, "global_step": 47167, "epoch": 1123} {"train_loss": -5.727870941162109, "global_step": 47168, "epoch": 1123} {"train_loss": -5.750070571899414, "global_step": 47169, "epoch": 1123} {"train_loss": -5.647853374481201, "global_step": 47170, "epoch": 1123} {"train_loss": -5.844890594482422, "global_step": 47171, "epoch": 1123} {"train_loss": -5.831025123596191, "global_step": 47172, "epoch": 1123} {"train_loss": -5.7086615562438965, "global_step": 47173, "epoch": 1123} {"train_loss": -5.84027624130249, "global_step": 47174, "epoch": 1123} {"train_loss": -5.604227066040039, "global_step": 47175, "epoch": 1123} {"train_loss": -5.73029899597168, "global_step": 47176, "epoch": 1123} {"train_loss": -5.744061470031738, "global_step": 47177, "epoch": 1123} {"train_loss": -5.790652751922607, "global_step": 47178, "epoch": 1123} {"train_loss": -5.688032150268555, "global_step": 47179, "epoch": 1123} {"train_loss": -5.762761116027832, "global_step": 47180, "epoch": 1123} {"train_loss": -5.7363152503967285, "global_step": 47181, "epoch": 1123} {"train_loss": -5.813248157501221, "global_step": 47182, "epoch": 1123} {"train_loss": -5.7401251792907715, "global_step": 47183, "epoch": 1123} {"train_loss": -5.873325347900391, "global_step": 47184, "epoch": 1123} {"train_loss": -5.735838890075684, "global_step": 47185, "epoch": 1123} {"train_loss": -5.705876350402832, "global_step": 47186, "epoch": 1123} {"train_loss": -5.801278591156006, "global_step": 47187, "epoch": 1123} {"train_loss": -5.811594486236572, "global_step": 47188, "epoch": 1123} {"train_loss": -5.7424468994140625, "global_step": 47189, "epoch": 1123} {"train_loss": -5.747446060180664, "global_step": 47190, "epoch": 1123} {"train_loss": -5.724826812744141, "global_step": 47191, "epoch": 1123} {"train_loss": -5.862306594848633, "global_step": 47192, "epoch": 1123} {"train_loss": -5.88509464263916, "global_step": 47193, "epoch": 1123} {"train_loss": -5.711942672729492, "global_step": 47194, "epoch": 1123} {"train_loss": -5.72133731842041, "global_step": 47195, "epoch": 1123} {"train_loss": -5.755577087402344, "global_step": 47196, "epoch": 1123} {"train_loss": -5.789980888366699, "global_step": 47197, "epoch": 1123} {"train_loss": -5.7449798583984375, "global_step": 47198, "epoch": 1123} {"train_loss": -5.871585369110107, "global_step": 47199, "epoch": 1123} {"train_loss": -5.690646171569824, "global_step": 47200, "epoch": 1123} {"train_loss": -5.727077484130859, "global_step": 47201, "epoch": 1123} {"train_loss": -5.627275466918945, "global_step": 47202, "epoch": 1123} {"train_loss": -5.770356178283691, "global_step": 47203, "epoch": 1123} {"train_loss": -5.630408763885498, "global_step": 47204, "epoch": 1123} {"train_loss": -5.617100715637207, "global_step": 47205, "epoch": 1123} {"train_loss": -5.705221176147461, "global_step": 47206, "epoch": 1123} {"train_loss": -5.748090653192429, "global_step": 47207, "epoch": 1123, "val_loss": 73664.0078125} {"train_loss": -5.729382514953613, "global_step": 47208, "epoch": 1124} {"train_loss": -5.690812110900879, "global_step": 47209, "epoch": 1124} {"train_loss": -5.6566386222839355, "global_step": 47210, "epoch": 1124} {"train_loss": -5.608368873596191, "global_step": 47211, "epoch": 1124} {"train_loss": -5.697895050048828, "global_step": 47212, "epoch": 1124} {"train_loss": -5.8703765869140625, "global_step": 47213, "epoch": 1124} {"train_loss": -5.7004289627075195, "global_step": 47214, "epoch": 1124} {"train_loss": -5.863260269165039, "global_step": 47215, "epoch": 1124} {"train_loss": -5.77082633972168, "global_step": 47216, "epoch": 1124} {"train_loss": -5.733404636383057, "global_step": 47217, "epoch": 1124} {"train_loss": -5.745019912719727, "global_step": 47218, "epoch": 1124} {"train_loss": -5.806493759155273, "global_step": 47219, "epoch": 1124} {"train_loss": -5.662518501281738, "global_step": 47220, "epoch": 1124} {"train_loss": -5.790163040161133, "global_step": 47221, "epoch": 1124} {"train_loss": -5.713415145874023, "global_step": 47222, "epoch": 1124} {"train_loss": -5.8736419677734375, "global_step": 47223, "epoch": 1124} {"train_loss": -5.736900806427002, "global_step": 47224, "epoch": 1124} {"train_loss": -5.566796779632568, "global_step": 47225, "epoch": 1124} {"train_loss": -5.793842315673828, "global_step": 47226, "epoch": 1124} {"train_loss": -5.813220024108887, "global_step": 47227, "epoch": 1124} {"train_loss": -5.632514476776123, "global_step": 47228, "epoch": 1124} {"train_loss": -5.7301788330078125, "global_step": 47229, "epoch": 1124} {"train_loss": -5.91360330581665, "global_step": 47230, "epoch": 1124} {"train_loss": -5.745855808258057, "global_step": 47231, "epoch": 1124} {"train_loss": -5.668022155761719, "global_step": 47232, "epoch": 1124} {"train_loss": -5.737811088562012, "global_step": 47233, "epoch": 1124} {"train_loss": -5.741551399230957, "global_step": 47234, "epoch": 1124} {"train_loss": -5.6798930168151855, "global_step": 47235, "epoch": 1124} {"train_loss": -5.708890914916992, "global_step": 47236, "epoch": 1124} {"train_loss": -5.741491317749023, "global_step": 47237, "epoch": 1124} {"train_loss": -5.642721652984619, "global_step": 47238, "epoch": 1124} {"train_loss": -5.849312782287598, "global_step": 47239, "epoch": 1124} {"train_loss": -5.769370079040527, "global_step": 47240, "epoch": 1124} {"train_loss": -5.738865852355957, "global_step": 47241, "epoch": 1124} {"train_loss": -5.828946590423584, "global_step": 47242, "epoch": 1124} {"train_loss": -5.7893242835998535, "global_step": 47243, "epoch": 1124} {"train_loss": -5.743993282318115, "global_step": 47244, "epoch": 1124} {"train_loss": -5.782663822174072, "global_step": 47245, "epoch": 1124} {"train_loss": -5.538444519042969, "global_step": 47246, "epoch": 1124} {"train_loss": -5.690071105957031, "global_step": 47247, "epoch": 1124} {"train_loss": -5.649021148681641, "global_step": 47248, "epoch": 1124} {"train_loss": -5.73623377936227, "global_step": 47249, "epoch": 1124, "val_loss": 74168.203125} {"train_loss": -5.73776912689209, "global_step": 47250, "epoch": 1125} {"train_loss": -5.746124267578125, "global_step": 47251, "epoch": 1125} {"train_loss": -5.609205722808838, "global_step": 47252, "epoch": 1125} {"train_loss": -5.804777145385742, "global_step": 47253, "epoch": 1125} {"train_loss": -5.661806106567383, "global_step": 47254, "epoch": 1125} {"train_loss": -5.686323165893555, "global_step": 47255, "epoch": 1125} {"train_loss": -5.5990071296691895, "global_step": 47256, "epoch": 1125} {"train_loss": -5.64508056640625, "global_step": 47257, "epoch": 1125} {"train_loss": -5.663124084472656, "global_step": 47258, "epoch": 1125} {"train_loss": -5.721922397613525, "global_step": 47259, "epoch": 1125} {"train_loss": -5.887381553649902, "global_step": 47260, "epoch": 1125} {"train_loss": -5.704057693481445, "global_step": 47261, "epoch": 1125} {"train_loss": -5.6868085861206055, "global_step": 47262, "epoch": 1125} {"train_loss": -5.739751815795898, "global_step": 47263, "epoch": 1125} {"train_loss": -5.779410362243652, "global_step": 47264, "epoch": 1125} {"train_loss": -5.729676246643066, "global_step": 47265, "epoch": 1125} {"train_loss": -5.88316535949707, "global_step": 47266, "epoch": 1125} {"train_loss": -5.68220853805542, "global_step": 47267, "epoch": 1125} {"train_loss": -5.7317633628845215, "global_step": 47268, "epoch": 1125} {"train_loss": -5.839067459106445, "global_step": 47269, "epoch": 1125} {"train_loss": -5.694830894470215, "global_step": 47270, "epoch": 1125} {"train_loss": -5.646013259887695, "global_step": 47271, "epoch": 1125} {"train_loss": -5.785250663757324, "global_step": 47272, "epoch": 1125} {"train_loss": -5.670007705688477, "global_step": 47273, "epoch": 1125} {"train_loss": -5.755059719085693, "global_step": 47274, "epoch": 1125} {"train_loss": -5.606657028198242, "global_step": 47275, "epoch": 1125} {"train_loss": -5.814633369445801, "global_step": 47276, "epoch": 1125} {"train_loss": -5.604684829711914, "global_step": 47277, "epoch": 1125} {"train_loss": -5.605215072631836, "global_step": 47278, "epoch": 1125} {"train_loss": -5.701363563537598, "global_step": 47279, "epoch": 1125} {"train_loss": -5.747147560119629, "global_step": 47280, "epoch": 1125} {"train_loss": -5.682348251342773, "global_step": 47281, "epoch": 1125} {"train_loss": -5.591944217681885, "global_step": 47282, "epoch": 1125} {"train_loss": -5.709590911865234, "global_step": 47283, "epoch": 1125} {"train_loss": -5.860139846801758, "global_step": 47284, "epoch": 1125} {"train_loss": -5.6297993659973145, "global_step": 47285, "epoch": 1125} {"train_loss": -5.75697660446167, "global_step": 47286, "epoch": 1125} {"train_loss": -5.790585517883301, "global_step": 47287, "epoch": 1125} {"train_loss": -5.683579444885254, "global_step": 47288, "epoch": 1125} {"train_loss": -5.859166145324707, "global_step": 47289, "epoch": 1125} {"train_loss": -5.778510093688965, "global_step": 47290, "epoch": 1125} {"train_loss": -5.71784123920259, "global_step": 47291, "epoch": 1125, "val_loss": 74072.375} {"train_loss": -5.740649223327637, "global_step": 47292, "epoch": 1126} {"train_loss": -5.763849258422852, "global_step": 47293, "epoch": 1126} {"train_loss": -5.79511833190918, "global_step": 47294, "epoch": 1126} {"train_loss": -5.736198902130127, "global_step": 47295, "epoch": 1126} {"train_loss": -5.867250442504883, "global_step": 47296, "epoch": 1126} {"train_loss": -5.654053211212158, "global_step": 47297, "epoch": 1126} {"train_loss": -5.86850643157959, "global_step": 47298, "epoch": 1126} {"train_loss": -5.676779270172119, "global_step": 47299, "epoch": 1126} {"train_loss": -5.643125534057617, "global_step": 47300, "epoch": 1126} {"train_loss": -5.748926162719727, "global_step": 47301, "epoch": 1126} {"train_loss": -5.792818069458008, "global_step": 47302, "epoch": 1126} {"train_loss": -5.856545448303223, "global_step": 47303, "epoch": 1126} {"train_loss": -5.702025413513184, "global_step": 47304, "epoch": 1126} {"train_loss": -5.725863456726074, "global_step": 47305, "epoch": 1126} {"train_loss": -5.537492752075195, "global_step": 47306, "epoch": 1126} {"train_loss": -5.7365241050720215, "global_step": 47307, "epoch": 1126} {"train_loss": -5.807243347167969, "global_step": 47308, "epoch": 1126} {"train_loss": -5.805802345275879, "global_step": 47309, "epoch": 1126} {"train_loss": -5.615503787994385, "global_step": 47310, "epoch": 1126} {"train_loss": -5.6445183753967285, "global_step": 47311, "epoch": 1126} {"train_loss": -5.648839950561523, "global_step": 47312, "epoch": 1126} {"train_loss": -5.764616966247559, "global_step": 47313, "epoch": 1126} {"train_loss": -5.693894386291504, "global_step": 47314, "epoch": 1126} {"train_loss": -5.8086419105529785, "global_step": 47315, "epoch": 1126} {"train_loss": -5.635292053222656, "global_step": 47316, "epoch": 1126} {"train_loss": -5.659852027893066, "global_step": 47317, "epoch": 1126} {"train_loss": -5.6773552894592285, "global_step": 47318, "epoch": 1126} {"train_loss": -5.600164890289307, "global_step": 47319, "epoch": 1126} {"train_loss": -5.664648056030273, "global_step": 47320, "epoch": 1126} {"train_loss": -5.595186233520508, "global_step": 47321, "epoch": 1126} {"train_loss": -5.693714141845703, "global_step": 47322, "epoch": 1126} {"train_loss": -5.686038970947266, "global_step": 47323, "epoch": 1126} {"train_loss": -5.552453994750977, "global_step": 47324, "epoch": 1126} {"train_loss": -5.631589889526367, "global_step": 47325, "epoch": 1126} {"train_loss": -5.7445197105407715, "global_step": 47326, "epoch": 1126} {"train_loss": -5.77345085144043, "global_step": 47327, "epoch": 1126} {"train_loss": -5.553433418273926, "global_step": 47328, "epoch": 1126} {"train_loss": -5.681623935699463, "global_step": 47329, "epoch": 1126} {"train_loss": -5.745192050933838, "global_step": 47330, "epoch": 1126} {"train_loss": -5.759154796600342, "global_step": 47331, "epoch": 1126} {"train_loss": -5.810832977294922, "global_step": 47332, "epoch": 1126} {"train_loss": -5.707158451988583, "global_step": 47333, "epoch": 1126, "val_loss": 74171.9453125} {"train_loss": -5.693305015563965, "global_step": 47334, "epoch": 1127} {"train_loss": -5.683537006378174, "global_step": 47335, "epoch": 1127} {"train_loss": -5.721484661102295, "global_step": 47336, "epoch": 1127} {"train_loss": -5.654603481292725, "global_step": 47337, "epoch": 1127} {"train_loss": -5.801732063293457, "global_step": 47338, "epoch": 1127} {"train_loss": -5.856345176696777, "global_step": 47339, "epoch": 1127} {"train_loss": -5.71472692489624, "global_step": 47340, "epoch": 1127} {"train_loss": -5.764044284820557, "global_step": 47341, "epoch": 1127} {"train_loss": -5.69809627532959, "global_step": 47342, "epoch": 1127} {"train_loss": -5.688112258911133, "global_step": 47343, "epoch": 1127} {"train_loss": -5.711175441741943, "global_step": 47344, "epoch": 1127} {"train_loss": -5.768189907073975, "global_step": 47345, "epoch": 1127} {"train_loss": -5.698485374450684, "global_step": 47346, "epoch": 1127} {"train_loss": -5.746096134185791, "global_step": 47347, "epoch": 1127} {"train_loss": -5.780911445617676, "global_step": 47348, "epoch": 1127} {"train_loss": -5.764885425567627, "global_step": 47349, "epoch": 1127} {"train_loss": -5.734066009521484, "global_step": 47350, "epoch": 1127} {"train_loss": -5.875517845153809, "global_step": 47351, "epoch": 1127} {"train_loss": -5.71804141998291, "global_step": 47352, "epoch": 1127} {"train_loss": -5.8024749755859375, "global_step": 47353, "epoch": 1127} {"train_loss": -5.803218841552734, "global_step": 47354, "epoch": 1127} {"train_loss": -5.637373924255371, "global_step": 47355, "epoch": 1127} {"train_loss": -5.6781697273254395, "global_step": 47356, "epoch": 1127} {"train_loss": -5.747369289398193, "global_step": 47357, "epoch": 1127} {"train_loss": -5.682652473449707, "global_step": 47358, "epoch": 1127} {"train_loss": -5.792118072509766, "global_step": 47359, "epoch": 1127} {"train_loss": -5.745527267456055, "global_step": 47360, "epoch": 1127} {"train_loss": -5.766525745391846, "global_step": 47361, "epoch": 1127} {"train_loss": -5.65629243850708, "global_step": 47362, "epoch": 1127} {"train_loss": -5.7674689292907715, "global_step": 47363, "epoch": 1127} {"train_loss": -5.739306926727295, "global_step": 47364, "epoch": 1127} {"train_loss": -5.863339424133301, "global_step": 47365, "epoch": 1127} {"train_loss": -5.738393783569336, "global_step": 47366, "epoch": 1127} {"train_loss": -5.772923469543457, "global_step": 47367, "epoch": 1127} {"train_loss": -5.6961236000061035, "global_step": 47368, "epoch": 1127} {"train_loss": -5.523253440856934, "global_step": 47369, "epoch": 1127} {"train_loss": -5.630950927734375, "global_step": 47370, "epoch": 1127} {"train_loss": -5.6425933837890625, "global_step": 47371, "epoch": 1127} {"train_loss": -5.672292709350586, "global_step": 47372, "epoch": 1127} {"train_loss": -5.784112453460693, "global_step": 47373, "epoch": 1127} {"train_loss": -5.649662017822266, "global_step": 47374, "epoch": 1127} {"train_loss": -5.72846067519415, "global_step": 47375, "epoch": 1127, "val_loss": 73911.28125} {"train_loss": -5.618105888366699, "global_step": 47376, "epoch": 1128} {"train_loss": -5.748778343200684, "global_step": 47377, "epoch": 1128} {"train_loss": -5.715949058532715, "global_step": 47378, "epoch": 1128} {"train_loss": -5.737367153167725, "global_step": 47379, "epoch": 1128} {"train_loss": -5.762448310852051, "global_step": 47380, "epoch": 1128} {"train_loss": -5.697636604309082, "global_step": 47381, "epoch": 1128} {"train_loss": -5.6443305015563965, "global_step": 47382, "epoch": 1128} {"train_loss": -5.767905235290527, "global_step": 47383, "epoch": 1128} {"train_loss": -5.666922569274902, "global_step": 47384, "epoch": 1128} {"train_loss": -5.7536540031433105, "global_step": 47385, "epoch": 1128} {"train_loss": -5.614529609680176, "global_step": 47386, "epoch": 1128} {"train_loss": -5.77562141418457, "global_step": 47387, "epoch": 1128} {"train_loss": -5.838579177856445, "global_step": 47388, "epoch": 1128} {"train_loss": -5.716350555419922, "global_step": 47389, "epoch": 1128} {"train_loss": -5.88253927230835, "global_step": 47390, "epoch": 1128} {"train_loss": -5.668946266174316, "global_step": 47391, "epoch": 1128} {"train_loss": -5.655616760253906, "global_step": 47392, "epoch": 1128} {"train_loss": -5.6983747482299805, "global_step": 47393, "epoch": 1128} {"train_loss": -5.807575225830078, "global_step": 47394, "epoch": 1128} {"train_loss": -5.644447326660156, "global_step": 47395, "epoch": 1128} {"train_loss": -5.645679473876953, "global_step": 47396, "epoch": 1128} {"train_loss": -5.658300876617432, "global_step": 47397, "epoch": 1128} {"train_loss": -5.660512447357178, "global_step": 47398, "epoch": 1128} {"train_loss": -5.724712371826172, "global_step": 47399, "epoch": 1128} {"train_loss": -5.672654151916504, "global_step": 47400, "epoch": 1128} {"train_loss": -5.865492820739746, "global_step": 47401, "epoch": 1128} {"train_loss": -5.738508224487305, "global_step": 47402, "epoch": 1128} {"train_loss": -5.685168743133545, "global_step": 47403, "epoch": 1128} {"train_loss": -5.681209564208984, "global_step": 47404, "epoch": 1128} {"train_loss": -5.828018665313721, "global_step": 47405, "epoch": 1128} {"train_loss": -5.730893135070801, "global_step": 47406, "epoch": 1128} {"train_loss": -5.675482273101807, "global_step": 47407, "epoch": 1128} {"train_loss": -5.657979965209961, "global_step": 47408, "epoch": 1128} {"train_loss": -5.7689690589904785, "global_step": 47409, "epoch": 1128} {"train_loss": -5.615082263946533, "global_step": 47410, "epoch": 1128} {"train_loss": -5.709874153137207, "global_step": 47411, "epoch": 1128} {"train_loss": -5.668842315673828, "global_step": 47412, "epoch": 1128} {"train_loss": -5.771778106689453, "global_step": 47413, "epoch": 1128} {"train_loss": -5.767577171325684, "global_step": 47414, "epoch": 1128} {"train_loss": -5.738394737243652, "global_step": 47415, "epoch": 1128} {"train_loss": -5.7259321212768555, "global_step": 47416, "epoch": 1128} {"train_loss": -5.71628677277338, "global_step": 47417, "epoch": 1128, "val_loss": 74281.140625} {"train_loss": -5.8010382652282715, "global_step": 47418, "epoch": 1129} {"train_loss": -5.783182144165039, "global_step": 47419, "epoch": 1129} {"train_loss": -5.785642147064209, "global_step": 47420, "epoch": 1129} {"train_loss": -5.807782173156738, "global_step": 47421, "epoch": 1129} {"train_loss": -5.828691482543945, "global_step": 47422, "epoch": 1129} {"train_loss": -5.756779670715332, "global_step": 47423, "epoch": 1129} {"train_loss": -5.703823089599609, "global_step": 47424, "epoch": 1129} {"train_loss": -5.738313674926758, "global_step": 47425, "epoch": 1129} {"train_loss": -5.777385711669922, "global_step": 47426, "epoch": 1129} {"train_loss": -5.723734378814697, "global_step": 47427, "epoch": 1129} {"train_loss": -5.790501117706299, "global_step": 47428, "epoch": 1129} {"train_loss": -5.758180618286133, "global_step": 47429, "epoch": 1129} {"train_loss": -5.78306770324707, "global_step": 47430, "epoch": 1129} {"train_loss": -5.803496837615967, "global_step": 47431, "epoch": 1129} {"train_loss": -5.6393208503723145, "global_step": 47432, "epoch": 1129} {"train_loss": -5.716838836669922, "global_step": 47433, "epoch": 1129} {"train_loss": -5.751595497131348, "global_step": 47434, "epoch": 1129} {"train_loss": -5.788822174072266, "global_step": 47435, "epoch": 1129} {"train_loss": -5.861014366149902, "global_step": 47436, "epoch": 1129} {"train_loss": -5.71408224105835, "global_step": 47437, "epoch": 1129} {"train_loss": -5.815375328063965, "global_step": 47438, "epoch": 1129} {"train_loss": -5.631211757659912, "global_step": 47439, "epoch": 1129} {"train_loss": -5.726537704467773, "global_step": 47440, "epoch": 1129} {"train_loss": -5.775978088378906, "global_step": 47441, "epoch": 1129} {"train_loss": -5.686528205871582, "global_step": 47442, "epoch": 1129} {"train_loss": -5.5733842849731445, "global_step": 47443, "epoch": 1129} {"train_loss": -5.771091461181641, "global_step": 47444, "epoch": 1129} {"train_loss": -5.714359760284424, "global_step": 47445, "epoch": 1129} {"train_loss": -5.54489803314209, "global_step": 47446, "epoch": 1129} {"train_loss": -5.852871894836426, "global_step": 47447, "epoch": 1129} {"train_loss": -5.582065105438232, "global_step": 47448, "epoch": 1129} {"train_loss": -5.611049652099609, "global_step": 47449, "epoch": 1129} {"train_loss": -5.774717330932617, "global_step": 47450, "epoch": 1129} {"train_loss": -5.692564487457275, "global_step": 47451, "epoch": 1129} {"train_loss": -5.682704925537109, "global_step": 47452, "epoch": 1129} {"train_loss": -5.8011088371276855, "global_step": 47453, "epoch": 1129} {"train_loss": -5.7412309646606445, "global_step": 47454, "epoch": 1129} {"train_loss": -5.671391010284424, "global_step": 47455, "epoch": 1129} {"train_loss": -5.675304889678955, "global_step": 47456, "epoch": 1129} {"train_loss": -5.754334926605225, "global_step": 47457, "epoch": 1129} {"train_loss": -5.706502914428711, "global_step": 47458, "epoch": 1129} {"train_loss": -5.731690077554612, "global_step": 47459, "epoch": 1129, "val_loss": 74422.203125} {"train_loss": -5.8958210945129395, "global_step": 47460, "epoch": 1130} {"train_loss": -5.787683963775635, "global_step": 47461, "epoch": 1130} {"train_loss": -5.70610237121582, "global_step": 47462, "epoch": 1130} {"train_loss": -5.767004013061523, "global_step": 47463, "epoch": 1130} {"train_loss": -5.754388809204102, "global_step": 47464, "epoch": 1130} {"train_loss": -5.726329803466797, "global_step": 47465, "epoch": 1130} {"train_loss": -5.725636005401611, "global_step": 47466, "epoch": 1130} {"train_loss": -5.642597198486328, "global_step": 47467, "epoch": 1130} {"train_loss": -5.782888412475586, "global_step": 47468, "epoch": 1130} {"train_loss": -5.669646739959717, "global_step": 47469, "epoch": 1130} {"train_loss": -5.840541839599609, "global_step": 47470, "epoch": 1130} {"train_loss": -5.632523536682129, "global_step": 47471, "epoch": 1130} {"train_loss": -5.714117050170898, "global_step": 47472, "epoch": 1130} {"train_loss": -5.75802755355835, "global_step": 47473, "epoch": 1130} {"train_loss": -5.672084808349609, "global_step": 47474, "epoch": 1130} {"train_loss": -5.744381904602051, "global_step": 47475, "epoch": 1130} {"train_loss": -5.811884880065918, "global_step": 47476, "epoch": 1130} {"train_loss": -5.574932098388672, "global_step": 47477, "epoch": 1130} {"train_loss": -5.6450090408325195, "global_step": 47478, "epoch": 1130} {"train_loss": -5.720641136169434, "global_step": 47479, "epoch": 1130} {"train_loss": -5.680638313293457, "global_step": 47480, "epoch": 1130} {"train_loss": -5.62415885925293, "global_step": 47481, "epoch": 1130} {"train_loss": -5.884963035583496, "global_step": 47482, "epoch": 1130} {"train_loss": -5.700130939483643, "global_step": 47483, "epoch": 1130} {"train_loss": -5.824921607971191, "global_step": 47484, "epoch": 1130} {"train_loss": -5.654622554779053, "global_step": 47485, "epoch": 1130} {"train_loss": -5.560641288757324, "global_step": 47486, "epoch": 1130} {"train_loss": -5.888031482696533, "global_step": 47487, "epoch": 1130} {"train_loss": -5.665657043457031, "global_step": 47488, "epoch": 1130} {"train_loss": -5.640630722045898, "global_step": 47489, "epoch": 1130} {"train_loss": -5.768522262573242, "global_step": 47490, "epoch": 1130} {"train_loss": -5.755698204040527, "global_step": 47491, "epoch": 1130} {"train_loss": -5.790972709655762, "global_step": 47492, "epoch": 1130} {"train_loss": -5.763106346130371, "global_step": 47493, "epoch": 1130} {"train_loss": -5.712014198303223, "global_step": 47494, "epoch": 1130} {"train_loss": -5.726100921630859, "global_step": 47495, "epoch": 1130} {"train_loss": -5.901497840881348, "global_step": 47496, "epoch": 1130} {"train_loss": -5.679476737976074, "global_step": 47497, "epoch": 1130} {"train_loss": -5.711096286773682, "global_step": 47498, "epoch": 1130} {"train_loss": -5.81378173828125, "global_step": 47499, "epoch": 1130} {"train_loss": -5.665041446685791, "global_step": 47500, "epoch": 1130} {"train_loss": -5.731012264887492, "global_step": 47501, "epoch": 1130, "val_loss": 74199.7109375} {"train_loss": -5.647917747497559, "global_step": 47502, "epoch": 1131} {"train_loss": -5.830531597137451, "global_step": 47503, "epoch": 1131} {"train_loss": -5.733790397644043, "global_step": 47504, "epoch": 1131} {"train_loss": -5.6474080085754395, "global_step": 47505, "epoch": 1131} {"train_loss": -5.7920122146606445, "global_step": 47506, "epoch": 1131} {"train_loss": -5.898075103759766, "global_step": 47507, "epoch": 1131} {"train_loss": -5.62636661529541, "global_step": 47508, "epoch": 1131} {"train_loss": -5.676461696624756, "global_step": 47509, "epoch": 1131} {"train_loss": -5.692976951599121, "global_step": 47510, "epoch": 1131} {"train_loss": -5.722985744476318, "global_step": 47511, "epoch": 1131} {"train_loss": -5.67742919921875, "global_step": 47512, "epoch": 1131} {"train_loss": -5.549799919128418, "global_step": 47513, "epoch": 1131} {"train_loss": -5.758364677429199, "global_step": 47514, "epoch": 1131} {"train_loss": -5.696043968200684, "global_step": 47515, "epoch": 1131} {"train_loss": -5.699874401092529, "global_step": 47516, "epoch": 1131} {"train_loss": -5.746708869934082, "global_step": 47517, "epoch": 1131} {"train_loss": -5.733895301818848, "global_step": 47518, "epoch": 1131} {"train_loss": -5.707314491271973, "global_step": 47519, "epoch": 1131} {"train_loss": -5.769227981567383, "global_step": 47520, "epoch": 1131} {"train_loss": -5.693011283874512, "global_step": 47521, "epoch": 1131} {"train_loss": -5.633811950683594, "global_step": 47522, "epoch": 1131} {"train_loss": -5.7071533203125, "global_step": 47523, "epoch": 1131} {"train_loss": -5.558948516845703, "global_step": 47524, "epoch": 1131} {"train_loss": -5.65422248840332, "global_step": 47525, "epoch": 1131} {"train_loss": -5.730830192565918, "global_step": 47526, "epoch": 1131} {"train_loss": -5.674873352050781, "global_step": 47527, "epoch": 1131} {"train_loss": -5.730938911437988, "global_step": 47528, "epoch": 1131} {"train_loss": -5.6249847412109375, "global_step": 47529, "epoch": 1131} {"train_loss": -5.610330581665039, "global_step": 47530, "epoch": 1131} {"train_loss": -5.713766574859619, "global_step": 47531, "epoch": 1131} {"train_loss": -5.701138973236084, "global_step": 47532, "epoch": 1131} {"train_loss": -5.6721110343933105, "global_step": 47533, "epoch": 1131} {"train_loss": -5.59447717666626, "global_step": 47534, "epoch": 1131} {"train_loss": -5.781842231750488, "global_step": 47535, "epoch": 1131} {"train_loss": -5.655466556549072, "global_step": 47536, "epoch": 1131} {"train_loss": -5.707147598266602, "global_step": 47537, "epoch": 1131} {"train_loss": -5.852636337280273, "global_step": 47538, "epoch": 1131} {"train_loss": -5.7447967529296875, "global_step": 47539, "epoch": 1131} {"train_loss": -5.749445915222168, "global_step": 47540, "epoch": 1131} {"train_loss": -5.828136444091797, "global_step": 47541, "epoch": 1131} {"train_loss": -5.696624755859375, "global_step": 47542, "epoch": 1131} {"train_loss": -5.70865367707752, "global_step": 47543, "epoch": 1131, "val_loss": 74215.8359375} {"train_loss": -5.809048652648926, "global_step": 47544, "epoch": 1132} {"train_loss": -5.719661712646484, "global_step": 47545, "epoch": 1132} {"train_loss": -5.750470161437988, "global_step": 47546, "epoch": 1132} {"train_loss": -5.665317535400391, "global_step": 47547, "epoch": 1132} {"train_loss": -5.859407424926758, "global_step": 47548, "epoch": 1132} {"train_loss": -5.837770938873291, "global_step": 47549, "epoch": 1132} {"train_loss": -5.818395614624023, "global_step": 47550, "epoch": 1132} {"train_loss": -5.8208770751953125, "global_step": 47551, "epoch": 1132} {"train_loss": -5.670884132385254, "global_step": 47552, "epoch": 1132} {"train_loss": -5.80550479888916, "global_step": 47553, "epoch": 1132} {"train_loss": -5.676922798156738, "global_step": 47554, "epoch": 1132} {"train_loss": -5.80224084854126, "global_step": 47555, "epoch": 1132} {"train_loss": -5.836318016052246, "global_step": 47556, "epoch": 1132} {"train_loss": -5.783350944519043, "global_step": 47557, "epoch": 1132} {"train_loss": -5.687387943267822, "global_step": 47558, "epoch": 1132} {"train_loss": -5.7149858474731445, "global_step": 47559, "epoch": 1132} {"train_loss": -5.739044666290283, "global_step": 47560, "epoch": 1132} {"train_loss": -5.829361915588379, "global_step": 47561, "epoch": 1132} {"train_loss": -5.678731441497803, "global_step": 47562, "epoch": 1132} {"train_loss": -5.680009841918945, "global_step": 47563, "epoch": 1132} {"train_loss": -5.89041805267334, "global_step": 47564, "epoch": 1132} {"train_loss": -5.664127349853516, "global_step": 47565, "epoch": 1132} {"train_loss": -5.766815185546875, "global_step": 47566, "epoch": 1132} {"train_loss": -5.751125812530518, "global_step": 47567, "epoch": 1132} {"train_loss": -5.657066345214844, "global_step": 47568, "epoch": 1132} {"train_loss": -5.84065055847168, "global_step": 47569, "epoch": 1132} {"train_loss": -5.717043876647949, "global_step": 47570, "epoch": 1132} {"train_loss": -5.752408027648926, "global_step": 47571, "epoch": 1132} {"train_loss": -5.799528121948242, "global_step": 47572, "epoch": 1132} {"train_loss": -5.708961486816406, "global_step": 47573, "epoch": 1132} {"train_loss": -5.755802154541016, "global_step": 47574, "epoch": 1132} {"train_loss": -5.815450668334961, "global_step": 47575, "epoch": 1132} {"train_loss": -5.745152473449707, "global_step": 47576, "epoch": 1132} {"train_loss": -5.6785383224487305, "global_step": 47577, "epoch": 1132} {"train_loss": -5.793560028076172, "global_step": 47578, "epoch": 1132} {"train_loss": -5.730817794799805, "global_step": 47579, "epoch": 1132} {"train_loss": -5.65882682800293, "global_step": 47580, "epoch": 1132} {"train_loss": -5.729866981506348, "global_step": 47581, "epoch": 1132} {"train_loss": -5.711684226989746, "global_step": 47582, "epoch": 1132} {"train_loss": -5.655147552490234, "global_step": 47583, "epoch": 1132} {"train_loss": -5.774674415588379, "global_step": 47584, "epoch": 1132} {"train_loss": -5.748934904734294, "global_step": 47585, "epoch": 1132, "val_loss": 73720.8125} {"train_loss": -5.723024845123291, "global_step": 47586, "epoch": 1133} {"train_loss": -5.859292030334473, "global_step": 47587, "epoch": 1133} {"train_loss": -5.709131240844727, "global_step": 47588, "epoch": 1133} {"train_loss": -5.683053970336914, "global_step": 47589, "epoch": 1133} {"train_loss": -5.7306647300720215, "global_step": 47590, "epoch": 1133} {"train_loss": -5.8470354080200195, "global_step": 47591, "epoch": 1133} {"train_loss": -5.711811542510986, "global_step": 47592, "epoch": 1133} {"train_loss": -5.81059455871582, "global_step": 47593, "epoch": 1133} {"train_loss": -5.762476921081543, "global_step": 47594, "epoch": 1133} {"train_loss": -5.679661750793457, "global_step": 47595, "epoch": 1133} {"train_loss": -5.705829620361328, "global_step": 47596, "epoch": 1133} {"train_loss": -5.7740020751953125, "global_step": 47597, "epoch": 1133} {"train_loss": -5.7373528480529785, "global_step": 47598, "epoch": 1133} {"train_loss": -5.723746299743652, "global_step": 47599, "epoch": 1133} {"train_loss": -5.686040878295898, "global_step": 47600, "epoch": 1133} {"train_loss": -5.7683515548706055, "global_step": 47601, "epoch": 1133} {"train_loss": -5.754878520965576, "global_step": 47602, "epoch": 1133} {"train_loss": -5.8361921310424805, "global_step": 47603, "epoch": 1133} {"train_loss": -5.744636535644531, "global_step": 47604, "epoch": 1133} {"train_loss": -5.92006778717041, "global_step": 47605, "epoch": 1133} {"train_loss": -5.739013195037842, "global_step": 47606, "epoch": 1133} {"train_loss": -5.81851863861084, "global_step": 47607, "epoch": 1133} {"train_loss": -5.621300220489502, "global_step": 47608, "epoch": 1133} {"train_loss": -5.835633754730225, "global_step": 47609, "epoch": 1133} {"train_loss": -5.75937032699585, "global_step": 47610, "epoch": 1133} {"train_loss": -5.807865619659424, "global_step": 47611, "epoch": 1133} {"train_loss": -5.957335472106934, "global_step": 47612, "epoch": 1133} {"train_loss": -5.709173679351807, "global_step": 47613, "epoch": 1133} {"train_loss": -5.77593469619751, "global_step": 47614, "epoch": 1133} {"train_loss": -5.732373237609863, "global_step": 47615, "epoch": 1133} {"train_loss": -5.824276924133301, "global_step": 47616, "epoch": 1133} {"train_loss": -5.8082275390625, "global_step": 47617, "epoch": 1133} {"train_loss": -5.8361406326293945, "global_step": 47618, "epoch": 1133} {"train_loss": -5.763654708862305, "global_step": 47619, "epoch": 1133} {"train_loss": -5.786561489105225, "global_step": 47620, "epoch": 1133} {"train_loss": -5.737873077392578, "global_step": 47621, "epoch": 1133} {"train_loss": -5.771430969238281, "global_step": 47622, "epoch": 1133} {"train_loss": -5.694538593292236, "global_step": 47623, "epoch": 1133} {"train_loss": -5.815638542175293, "global_step": 47624, "epoch": 1133} {"train_loss": -5.746882438659668, "global_step": 47625, "epoch": 1133} {"train_loss": -5.618886470794678, "global_step": 47626, "epoch": 1133} {"train_loss": -5.761486870901925, "global_step": 47627, "epoch": 1133, "val_loss": 73963.625} {"train_loss": -5.788919448852539, "global_step": 47628, "epoch": 1134} {"train_loss": -5.8221282958984375, "global_step": 47629, "epoch": 1134} {"train_loss": -5.679570198059082, "global_step": 47630, "epoch": 1134} {"train_loss": -5.756595611572266, "global_step": 47631, "epoch": 1134} {"train_loss": -5.812745094299316, "global_step": 47632, "epoch": 1134} {"train_loss": -5.751175403594971, "global_step": 47633, "epoch": 1134} {"train_loss": -5.7016425132751465, "global_step": 47634, "epoch": 1134} {"train_loss": -5.773606777191162, "global_step": 47635, "epoch": 1134} {"train_loss": -5.764657974243164, "global_step": 47636, "epoch": 1134} {"train_loss": -5.702300071716309, "global_step": 47637, "epoch": 1134} {"train_loss": -5.8260955810546875, "global_step": 47638, "epoch": 1134} {"train_loss": -5.684171676635742, "global_step": 47639, "epoch": 1134} {"train_loss": -5.7553510665893555, "global_step": 47640, "epoch": 1134} {"train_loss": -5.691079139709473, "global_step": 47641, "epoch": 1134} {"train_loss": -5.6570658683776855, "global_step": 47642, "epoch": 1134} {"train_loss": -5.623607158660889, "global_step": 47643, "epoch": 1134} {"train_loss": -5.67228889465332, "global_step": 47644, "epoch": 1134} {"train_loss": -5.6450042724609375, "global_step": 47645, "epoch": 1134} {"train_loss": -5.61562442779541, "global_step": 47646, "epoch": 1134} {"train_loss": -5.688833236694336, "global_step": 47647, "epoch": 1134} {"train_loss": -5.722760200500488, "global_step": 47648, "epoch": 1134} {"train_loss": -5.649050712585449, "global_step": 47649, "epoch": 1134} {"train_loss": -5.722689151763916, "global_step": 47650, "epoch": 1134} {"train_loss": -5.690052509307861, "global_step": 47651, "epoch": 1134} {"train_loss": -5.647016525268555, "global_step": 47652, "epoch": 1134} {"train_loss": -5.673666477203369, "global_step": 47653, "epoch": 1134} {"train_loss": -5.718220233917236, "global_step": 47654, "epoch": 1134} {"train_loss": -5.739536285400391, "global_step": 47655, "epoch": 1134} {"train_loss": -5.714229106903076, "global_step": 47656, "epoch": 1134} {"train_loss": -5.572779655456543, "global_step": 47657, "epoch": 1134} {"train_loss": -5.764440536499023, "global_step": 47658, "epoch": 1134} {"train_loss": -5.782629489898682, "global_step": 47659, "epoch": 1134} {"train_loss": -5.803836345672607, "global_step": 47660, "epoch": 1134} {"train_loss": -5.716761589050293, "global_step": 47661, "epoch": 1134} {"train_loss": -5.793900966644287, "global_step": 47662, "epoch": 1134} {"train_loss": -5.784860610961914, "global_step": 47663, "epoch": 1134} {"train_loss": -5.719796180725098, "global_step": 47664, "epoch": 1134} {"train_loss": -5.822860240936279, "global_step": 47665, "epoch": 1134} {"train_loss": -5.805324077606201, "global_step": 47666, "epoch": 1134} {"train_loss": -5.757913589477539, "global_step": 47667, "epoch": 1134} {"train_loss": -5.688786029815674, "global_step": 47668, "epoch": 1134} {"train_loss": -5.725521984554472, "global_step": 47669, "epoch": 1134, "val_loss": 73886.3515625} {"train_loss": -5.687390327453613, "global_step": 47670, "epoch": 1135} {"train_loss": -5.6542816162109375, "global_step": 47671, "epoch": 1135} {"train_loss": -5.881789207458496, "global_step": 47672, "epoch": 1135} {"train_loss": -5.67744255065918, "global_step": 47673, "epoch": 1135} {"train_loss": -5.684139251708984, "global_step": 47674, "epoch": 1135} {"train_loss": -5.695372581481934, "global_step": 47675, "epoch": 1135} {"train_loss": -5.850703239440918, "global_step": 47676, "epoch": 1135} {"train_loss": -5.737797260284424, "global_step": 47677, "epoch": 1135} {"train_loss": -5.691774368286133, "global_step": 47678, "epoch": 1135} {"train_loss": -5.773197174072266, "global_step": 47679, "epoch": 1135} {"train_loss": -5.826547622680664, "global_step": 47680, "epoch": 1135} {"train_loss": -5.744387626647949, "global_step": 47681, "epoch": 1135} {"train_loss": -5.795327186584473, "global_step": 47682, "epoch": 1135} {"train_loss": -5.9778852462768555, "global_step": 47683, "epoch": 1135} {"train_loss": -5.811061382293701, "global_step": 47684, "epoch": 1135} {"train_loss": -5.713076114654541, "global_step": 47685, "epoch": 1135} {"train_loss": -5.681273460388184, "global_step": 47686, "epoch": 1135} {"train_loss": -5.67751407623291, "global_step": 47687, "epoch": 1135} {"train_loss": -5.690590858459473, "global_step": 47688, "epoch": 1135} {"train_loss": -5.77133846282959, "global_step": 47689, "epoch": 1135} {"train_loss": -5.6455230712890625, "global_step": 47690, "epoch": 1135} {"train_loss": -5.721950054168701, "global_step": 47691, "epoch": 1135} {"train_loss": -5.618382453918457, "global_step": 47692, "epoch": 1135} {"train_loss": -5.674028396606445, "global_step": 47693, "epoch": 1135} {"train_loss": -5.700685501098633, "global_step": 47694, "epoch": 1135} {"train_loss": -5.713292121887207, "global_step": 47695, "epoch": 1135} {"train_loss": -5.782576084136963, "global_step": 47696, "epoch": 1135} {"train_loss": -5.6979241371154785, "global_step": 47697, "epoch": 1135} {"train_loss": -5.722311019897461, "global_step": 47698, "epoch": 1135} {"train_loss": -5.6571221351623535, "global_step": 47699, "epoch": 1135} {"train_loss": -5.794356822967529, "global_step": 47700, "epoch": 1135} {"train_loss": -5.848128318786621, "global_step": 47701, "epoch": 1135} {"train_loss": -5.721505165100098, "global_step": 47702, "epoch": 1135} {"train_loss": -5.668951988220215, "global_step": 47703, "epoch": 1135} {"train_loss": -5.650648593902588, "global_step": 47704, "epoch": 1135} {"train_loss": -5.6524763107299805, "global_step": 47705, "epoch": 1135} {"train_loss": -5.512216567993164, "global_step": 47706, "epoch": 1135} {"train_loss": -5.750666618347168, "global_step": 47707, "epoch": 1135} {"train_loss": -5.907122611999512, "global_step": 47708, "epoch": 1135} {"train_loss": -5.638041019439697, "global_step": 47709, "epoch": 1135} {"train_loss": -5.691684722900391, "global_step": 47710, "epoch": 1135} {"train_loss": -5.726613169624692, "global_step": 47711, "epoch": 1135, "val_loss": 74495.0625} {"train_loss": -5.592406272888184, "global_step": 47712, "epoch": 1136} {"train_loss": -5.761030197143555, "global_step": 47713, "epoch": 1136} {"train_loss": -5.7004828453063965, "global_step": 47714, "epoch": 1136} {"train_loss": -5.550335884094238, "global_step": 47715, "epoch": 1136} {"train_loss": -5.696965217590332, "global_step": 47716, "epoch": 1136} {"train_loss": -5.655886173248291, "global_step": 47717, "epoch": 1136} {"train_loss": -5.823225021362305, "global_step": 47718, "epoch": 1136} {"train_loss": -5.720460891723633, "global_step": 47719, "epoch": 1136} {"train_loss": -5.615353107452393, "global_step": 47720, "epoch": 1136} {"train_loss": -5.776364326477051, "global_step": 47721, "epoch": 1136} {"train_loss": -5.641094207763672, "global_step": 47722, "epoch": 1136} {"train_loss": -5.748195648193359, "global_step": 47723, "epoch": 1136} {"train_loss": -5.744419097900391, "global_step": 47724, "epoch": 1136} {"train_loss": -5.812343597412109, "global_step": 47725, "epoch": 1136} {"train_loss": -5.739554405212402, "global_step": 47726, "epoch": 1136} {"train_loss": -5.745813846588135, "global_step": 47727, "epoch": 1136} {"train_loss": -5.75130558013916, "global_step": 47728, "epoch": 1136} {"train_loss": -5.762862682342529, "global_step": 47729, "epoch": 1136} {"train_loss": -5.794849395751953, "global_step": 47730, "epoch": 1136} {"train_loss": -5.740634918212891, "global_step": 47731, "epoch": 1136} {"train_loss": -5.637479782104492, "global_step": 47732, "epoch": 1136} {"train_loss": -5.632065773010254, "global_step": 47733, "epoch": 1136} {"train_loss": -5.8492231369018555, "global_step": 47734, "epoch": 1136} {"train_loss": -5.7164082527160645, "global_step": 47735, "epoch": 1136} {"train_loss": -5.790508270263672, "global_step": 47736, "epoch": 1136} {"train_loss": -5.6869683265686035, "global_step": 47737, "epoch": 1136} {"train_loss": -5.655505180358887, "global_step": 47738, "epoch": 1136} {"train_loss": -5.764382362365723, "global_step": 47739, "epoch": 1136} {"train_loss": -5.78179407119751, "global_step": 47740, "epoch": 1136} {"train_loss": -5.792418956756592, "global_step": 47741, "epoch": 1136} {"train_loss": -5.6841936111450195, "global_step": 47742, "epoch": 1136} {"train_loss": -5.775524139404297, "global_step": 47743, "epoch": 1136} {"train_loss": -5.819392681121826, "global_step": 47744, "epoch": 1136} {"train_loss": -5.74422550201416, "global_step": 47745, "epoch": 1136} {"train_loss": -5.721058368682861, "global_step": 47746, "epoch": 1136} {"train_loss": -5.598099708557129, "global_step": 47747, "epoch": 1136} {"train_loss": -5.710549354553223, "global_step": 47748, "epoch": 1136} {"train_loss": -5.599963188171387, "global_step": 47749, "epoch": 1136} {"train_loss": -5.679530143737793, "global_step": 47750, "epoch": 1136} {"train_loss": -5.670960426330566, "global_step": 47751, "epoch": 1136} {"train_loss": -5.786281585693359, "global_step": 47752, "epoch": 1136} {"train_loss": -5.716803210122245, "global_step": 47753, "epoch": 1136, "val_loss": 74421.265625} {"train_loss": -5.777284622192383, "global_step": 47754, "epoch": 1137} {"train_loss": -5.639869689941406, "global_step": 47755, "epoch": 1137} {"train_loss": -5.7353973388671875, "global_step": 47756, "epoch": 1137} {"train_loss": -5.708205223083496, "global_step": 47757, "epoch": 1137} {"train_loss": -5.8378400802612305, "global_step": 47758, "epoch": 1137} {"train_loss": -5.762730598449707, "global_step": 47759, "epoch": 1137} {"train_loss": -5.723495006561279, "global_step": 47760, "epoch": 1137} {"train_loss": -5.723597049713135, "global_step": 47761, "epoch": 1137} {"train_loss": -5.632558822631836, "global_step": 47762, "epoch": 1137} {"train_loss": -5.593001365661621, "global_step": 47763, "epoch": 1137} {"train_loss": -5.744269371032715, "global_step": 47764, "epoch": 1137} {"train_loss": -5.699579238891602, "global_step": 47765, "epoch": 1137} {"train_loss": -5.64693546295166, "global_step": 47766, "epoch": 1137} {"train_loss": -5.836982727050781, "global_step": 47767, "epoch": 1137} {"train_loss": -5.770757675170898, "global_step": 47768, "epoch": 1137} {"train_loss": -5.749810218811035, "global_step": 47769, "epoch": 1137} {"train_loss": -5.652770042419434, "global_step": 47770, "epoch": 1137} {"train_loss": -5.768791198730469, "global_step": 47771, "epoch": 1137} {"train_loss": -5.755064010620117, "global_step": 47772, "epoch": 1137} {"train_loss": -5.8170928955078125, "global_step": 47773, "epoch": 1137} {"train_loss": -5.769320011138916, "global_step": 47774, "epoch": 1137} {"train_loss": -5.789804458618164, "global_step": 47775, "epoch": 1137} {"train_loss": -5.797034740447998, "global_step": 47776, "epoch": 1137} {"train_loss": -5.77689790725708, "global_step": 47777, "epoch": 1137} {"train_loss": -5.661752700805664, "global_step": 47778, "epoch": 1137} {"train_loss": -5.65733528137207, "global_step": 47779, "epoch": 1137} {"train_loss": -5.775867462158203, "global_step": 47780, "epoch": 1137} {"train_loss": -5.6932783126831055, "global_step": 47781, "epoch": 1137} {"train_loss": -5.577064514160156, "global_step": 47782, "epoch": 1137} {"train_loss": -5.792008399963379, "global_step": 47783, "epoch": 1137} {"train_loss": -5.661229133605957, "global_step": 47784, "epoch": 1137} {"train_loss": -5.619697093963623, "global_step": 47785, "epoch": 1137} {"train_loss": -5.7779860496521, "global_step": 47786, "epoch": 1137} {"train_loss": -5.516300201416016, "global_step": 47787, "epoch": 1137} {"train_loss": -5.7967376708984375, "global_step": 47788, "epoch": 1137} {"train_loss": -5.5824785232543945, "global_step": 47789, "epoch": 1137} {"train_loss": -5.714550971984863, "global_step": 47790, "epoch": 1137} {"train_loss": -5.760655879974365, "global_step": 47791, "epoch": 1137} {"train_loss": -5.734145164489746, "global_step": 47792, "epoch": 1137} {"train_loss": -5.672741889953613, "global_step": 47793, "epoch": 1137} {"train_loss": -5.697615623474121, "global_step": 47794, "epoch": 1137} {"train_loss": -5.716929163251605, "global_step": 47795, "epoch": 1137, "val_loss": 74641.4921875} {"train_loss": -5.681976795196533, "global_step": 47796, "epoch": 1138} {"train_loss": -5.827098846435547, "global_step": 47797, "epoch": 1138} {"train_loss": -5.593346118927002, "global_step": 47798, "epoch": 1138} {"train_loss": -5.649277687072754, "global_step": 47799, "epoch": 1138} {"train_loss": -5.608241081237793, "global_step": 47800, "epoch": 1138} {"train_loss": -5.725536346435547, "global_step": 47801, "epoch": 1138} {"train_loss": -5.619785308837891, "global_step": 47802, "epoch": 1138} {"train_loss": -5.7052836418151855, "global_step": 47803, "epoch": 1138} {"train_loss": -5.768410682678223, "global_step": 47804, "epoch": 1138} {"train_loss": -5.850756645202637, "global_step": 47805, "epoch": 1138} {"train_loss": -5.736269950866699, "global_step": 47806, "epoch": 1138} {"train_loss": -5.691013336181641, "global_step": 47807, "epoch": 1138} {"train_loss": -5.827253341674805, "global_step": 47808, "epoch": 1138} {"train_loss": -5.770590782165527, "global_step": 47809, "epoch": 1138} {"train_loss": -5.693676948547363, "global_step": 47810, "epoch": 1138} {"train_loss": -5.843847274780273, "global_step": 47811, "epoch": 1138} {"train_loss": -5.634641170501709, "global_step": 47812, "epoch": 1138} {"train_loss": -5.9263505935668945, "global_step": 47813, "epoch": 1138} {"train_loss": -5.781406402587891, "global_step": 47814, "epoch": 1138} {"train_loss": -5.666382312774658, "global_step": 47815, "epoch": 1138} {"train_loss": -5.711341857910156, "global_step": 47816, "epoch": 1138} {"train_loss": -5.813655853271484, "global_step": 47817, "epoch": 1138} {"train_loss": -5.9145731925964355, "global_step": 47818, "epoch": 1138} {"train_loss": -5.6168928146362305, "global_step": 47819, "epoch": 1138} {"train_loss": -5.689404487609863, "global_step": 47820, "epoch": 1138} {"train_loss": -5.775015830993652, "global_step": 47821, "epoch": 1138} {"train_loss": -5.776307106018066, "global_step": 47822, "epoch": 1138} {"train_loss": -5.728999137878418, "global_step": 47823, "epoch": 1138} {"train_loss": -5.772420883178711, "global_step": 47824, "epoch": 1138} {"train_loss": -5.6312127113342285, "global_step": 47825, "epoch": 1138} {"train_loss": -5.672428131103516, "global_step": 47826, "epoch": 1138} {"train_loss": -5.670876502990723, "global_step": 47827, "epoch": 1138} {"train_loss": -5.6643781661987305, "global_step": 47828, "epoch": 1138} {"train_loss": -5.7170634269714355, "global_step": 47829, "epoch": 1138} {"train_loss": -5.773124694824219, "global_step": 47830, "epoch": 1138} {"train_loss": -5.675381183624268, "global_step": 47831, "epoch": 1138} {"train_loss": -5.710406303405762, "global_step": 47832, "epoch": 1138} {"train_loss": -5.784186840057373, "global_step": 47833, "epoch": 1138} {"train_loss": -5.537168502807617, "global_step": 47834, "epoch": 1138} {"train_loss": -5.6402177810668945, "global_step": 47835, "epoch": 1138} {"train_loss": -5.676513671875, "global_step": 47836, "epoch": 1138} {"train_loss": -5.721037717092605, "global_step": 47837, "epoch": 1138, "val_loss": 73954.921875} {"train_loss": -5.728264808654785, "global_step": 47838, "epoch": 1139} {"train_loss": -5.611255645751953, "global_step": 47839, "epoch": 1139} {"train_loss": -5.6965813636779785, "global_step": 47840, "epoch": 1139} {"train_loss": -5.779496669769287, "global_step": 47841, "epoch": 1139} {"train_loss": -5.814113616943359, "global_step": 47842, "epoch": 1139} {"train_loss": -5.762452125549316, "global_step": 47843, "epoch": 1139} {"train_loss": -5.702867031097412, "global_step": 47844, "epoch": 1139} {"train_loss": -5.918412208557129, "global_step": 47845, "epoch": 1139} {"train_loss": -5.75804328918457, "global_step": 47846, "epoch": 1139} {"train_loss": -5.746484279632568, "global_step": 47847, "epoch": 1139} {"train_loss": -5.767248630523682, "global_step": 47848, "epoch": 1139} {"train_loss": -5.876452922821045, "global_step": 47849, "epoch": 1139} {"train_loss": -5.734521389007568, "global_step": 47850, "epoch": 1139} {"train_loss": -5.579281806945801, "global_step": 47851, "epoch": 1139} {"train_loss": -5.833768844604492, "global_step": 47852, "epoch": 1139} {"train_loss": -5.611941814422607, "global_step": 47853, "epoch": 1139} {"train_loss": -5.737809658050537, "global_step": 47854, "epoch": 1139} {"train_loss": -5.706645488739014, "global_step": 47855, "epoch": 1139} {"train_loss": -5.735968589782715, "global_step": 47856, "epoch": 1139} {"train_loss": -5.711905479431152, "global_step": 47857, "epoch": 1139} {"train_loss": -5.804644584655762, "global_step": 47858, "epoch": 1139} {"train_loss": -5.776968002319336, "global_step": 47859, "epoch": 1139} {"train_loss": -5.827469825744629, "global_step": 47860, "epoch": 1139} {"train_loss": -5.681888580322266, "global_step": 47861, "epoch": 1139} {"train_loss": -5.72401237487793, "global_step": 47862, "epoch": 1139} {"train_loss": -5.641461372375488, "global_step": 47863, "epoch": 1139} {"train_loss": -5.800299167633057, "global_step": 47864, "epoch": 1139} {"train_loss": -5.676290035247803, "global_step": 47865, "epoch": 1139} {"train_loss": -5.726235389709473, "global_step": 47866, "epoch": 1139} {"train_loss": -5.7083916664123535, "global_step": 47867, "epoch": 1139} {"train_loss": -5.659049987792969, "global_step": 47868, "epoch": 1139} {"train_loss": -5.8167619705200195, "global_step": 47869, "epoch": 1139} {"train_loss": -5.709649562835693, "global_step": 47870, "epoch": 1139} {"train_loss": -5.827215671539307, "global_step": 47871, "epoch": 1139} {"train_loss": -5.750096321105957, "global_step": 47872, "epoch": 1139} {"train_loss": -5.784668922424316, "global_step": 47873, "epoch": 1139} {"train_loss": -5.756801128387451, "global_step": 47874, "epoch": 1139} {"train_loss": -5.94173002243042, "global_step": 47875, "epoch": 1139} {"train_loss": -5.838662147521973, "global_step": 47876, "epoch": 1139} {"train_loss": -5.780601501464844, "global_step": 47877, "epoch": 1139} {"train_loss": -5.816757678985596, "global_step": 47878, "epoch": 1139} {"train_loss": -5.7507729189736505, "global_step": 47879, "epoch": 1139, "val_loss": 74027.375} {"train_loss": -5.753421306610107, "global_step": 47880, "epoch": 1140} {"train_loss": -5.641921520233154, "global_step": 47881, "epoch": 1140} {"train_loss": -5.825768947601318, "global_step": 47882, "epoch": 1140} {"train_loss": -5.756305694580078, "global_step": 47883, "epoch": 1140} {"train_loss": -5.688579559326172, "global_step": 47884, "epoch": 1140} {"train_loss": -5.688972473144531, "global_step": 47885, "epoch": 1140} {"train_loss": -5.830845832824707, "global_step": 47886, "epoch": 1140} {"train_loss": -6.002328872680664, "global_step": 47887, "epoch": 1140} {"train_loss": -5.831751823425293, "global_step": 47888, "epoch": 1140} {"train_loss": -5.68673849105835, "global_step": 47889, "epoch": 1140} {"train_loss": -5.734949588775635, "global_step": 47890, "epoch": 1140} {"train_loss": -5.806774139404297, "global_step": 47891, "epoch": 1140} {"train_loss": -5.5959391593933105, "global_step": 47892, "epoch": 1140} {"train_loss": -5.682050704956055, "global_step": 47893, "epoch": 1140} {"train_loss": -5.846579551696777, "global_step": 47894, "epoch": 1140} {"train_loss": -5.730819225311279, "global_step": 47895, "epoch": 1140} {"train_loss": -5.566330432891846, "global_step": 47896, "epoch": 1140} {"train_loss": -5.856570243835449, "global_step": 47897, "epoch": 1140} {"train_loss": -5.779195785522461, "global_step": 47898, "epoch": 1140} {"train_loss": -5.641993522644043, "global_step": 47899, "epoch": 1140} {"train_loss": -5.720507621765137, "global_step": 47900, "epoch": 1140} {"train_loss": -5.795388221740723, "global_step": 47901, "epoch": 1140} {"train_loss": -5.818786144256592, "global_step": 47902, "epoch": 1140} {"train_loss": -5.802773475646973, "global_step": 47903, "epoch": 1140} {"train_loss": -5.704998016357422, "global_step": 47904, "epoch": 1140} {"train_loss": -5.753726005554199, "global_step": 47905, "epoch": 1140} {"train_loss": -5.684287071228027, "global_step": 47906, "epoch": 1140} {"train_loss": -5.855892181396484, "global_step": 47907, "epoch": 1140} {"train_loss": -5.5757904052734375, "global_step": 47908, "epoch": 1140} {"train_loss": -5.732184410095215, "global_step": 47909, "epoch": 1140} {"train_loss": -5.826237678527832, "global_step": 47910, "epoch": 1140} {"train_loss": -5.773891448974609, "global_step": 47911, "epoch": 1140} {"train_loss": -5.778700828552246, "global_step": 47912, "epoch": 1140} {"train_loss": -5.812613487243652, "global_step": 47913, "epoch": 1140} {"train_loss": -5.647372245788574, "global_step": 47914, "epoch": 1140} {"train_loss": -5.741472244262695, "global_step": 47915, "epoch": 1140} {"train_loss": -5.780455112457275, "global_step": 47916, "epoch": 1140} {"train_loss": -5.790630340576172, "global_step": 47917, "epoch": 1140} {"train_loss": -5.703669548034668, "global_step": 47918, "epoch": 1140} {"train_loss": -5.816373825073242, "global_step": 47919, "epoch": 1140} {"train_loss": -5.730164527893066, "global_step": 47920, "epoch": 1140} {"train_loss": -5.753202052343459, "global_step": 47921, "epoch": 1140, "val_loss": 73928.171875} {"train_loss": -5.87969970703125, "global_step": 47922, "epoch": 1141} {"train_loss": -5.911465644836426, "global_step": 47923, "epoch": 1141} {"train_loss": -5.7583770751953125, "global_step": 47924, "epoch": 1141} {"train_loss": -5.802130699157715, "global_step": 47925, "epoch": 1141} {"train_loss": -5.792262077331543, "global_step": 47926, "epoch": 1141} {"train_loss": -5.812499046325684, "global_step": 47927, "epoch": 1141} {"train_loss": -5.795572757720947, "global_step": 47928, "epoch": 1141} {"train_loss": -5.79092264175415, "global_step": 47929, "epoch": 1141} {"train_loss": -5.890193939208984, "global_step": 47930, "epoch": 1141} {"train_loss": -5.705933570861816, "global_step": 47931, "epoch": 1141} {"train_loss": -5.797678470611572, "global_step": 47932, "epoch": 1141} {"train_loss": -5.763317108154297, "global_step": 47933, "epoch": 1141} {"train_loss": -5.737099647521973, "global_step": 47934, "epoch": 1141} {"train_loss": -5.741517066955566, "global_step": 47935, "epoch": 1141} {"train_loss": -5.698589324951172, "global_step": 47936, "epoch": 1141} {"train_loss": -5.626439571380615, "global_step": 47937, "epoch": 1141} {"train_loss": -5.826510429382324, "global_step": 47938, "epoch": 1141} {"train_loss": -5.886123180389404, "global_step": 47939, "epoch": 1141} {"train_loss": -5.555088043212891, "global_step": 47940, "epoch": 1141} {"train_loss": -5.885361671447754, "global_step": 47941, "epoch": 1141} {"train_loss": -5.612332344055176, "global_step": 47942, "epoch": 1141} {"train_loss": -5.703221321105957, "global_step": 47943, "epoch": 1141} {"train_loss": -5.761753082275391, "global_step": 47944, "epoch": 1141} {"train_loss": -5.652890205383301, "global_step": 47945, "epoch": 1141} {"train_loss": -5.6206207275390625, "global_step": 47946, "epoch": 1141} {"train_loss": -5.8324079513549805, "global_step": 47947, "epoch": 1141} {"train_loss": -5.6813764572143555, "global_step": 47948, "epoch": 1141} {"train_loss": -5.594934463500977, "global_step": 47949, "epoch": 1141} {"train_loss": -5.770195007324219, "global_step": 47950, "epoch": 1141} {"train_loss": -5.669002532958984, "global_step": 47951, "epoch": 1141} {"train_loss": -5.670125961303711, "global_step": 47952, "epoch": 1141} {"train_loss": -5.664575576782227, "global_step": 47953, "epoch": 1141} {"train_loss": -5.745537757873535, "global_step": 47954, "epoch": 1141} {"train_loss": -5.753991603851318, "global_step": 47955, "epoch": 1141} {"train_loss": -5.613466262817383, "global_step": 47956, "epoch": 1141} {"train_loss": -5.724974632263184, "global_step": 47957, "epoch": 1141} {"train_loss": -5.714510440826416, "global_step": 47958, "epoch": 1141} {"train_loss": -5.731086730957031, "global_step": 47959, "epoch": 1141} {"train_loss": -5.765988349914551, "global_step": 47960, "epoch": 1141} {"train_loss": -5.803436279296875, "global_step": 47961, "epoch": 1141} {"train_loss": -5.575865268707275, "global_step": 47962, "epoch": 1141} {"train_loss": -5.7379977476029165, "global_step": 47963, "epoch": 1141, "val_loss": 74056.953125} {"train_loss": -5.703372955322266, "global_step": 47964, "epoch": 1142} {"train_loss": -5.705939769744873, "global_step": 47965, "epoch": 1142} {"train_loss": -5.744137763977051, "global_step": 47966, "epoch": 1142} {"train_loss": -5.608610153198242, "global_step": 47967, "epoch": 1142} {"train_loss": -5.74032735824585, "global_step": 47968, "epoch": 1142} {"train_loss": -5.681177616119385, "global_step": 47969, "epoch": 1142} {"train_loss": -5.817561626434326, "global_step": 47970, "epoch": 1142} {"train_loss": -5.772746562957764, "global_step": 47971, "epoch": 1142} {"train_loss": -5.818804740905762, "global_step": 47972, "epoch": 1142} {"train_loss": -5.802732944488525, "global_step": 47973, "epoch": 1142} {"train_loss": -5.773111820220947, "global_step": 47974, "epoch": 1142} {"train_loss": -5.807997226715088, "global_step": 47975, "epoch": 1142} {"train_loss": -5.695287704467773, "global_step": 47976, "epoch": 1142} {"train_loss": -5.764535903930664, "global_step": 47977, "epoch": 1142} {"train_loss": -5.702999114990234, "global_step": 47978, "epoch": 1142} {"train_loss": -5.693521022796631, "global_step": 47979, "epoch": 1142} {"train_loss": -5.731176853179932, "global_step": 47980, "epoch": 1142} {"train_loss": -5.786492824554443, "global_step": 47981, "epoch": 1142} {"train_loss": -5.663005828857422, "global_step": 47982, "epoch": 1142} {"train_loss": -5.690572261810303, "global_step": 47983, "epoch": 1142} {"train_loss": -5.713230609893799, "global_step": 47984, "epoch": 1142} {"train_loss": -5.691982269287109, "global_step": 47985, "epoch": 1142} {"train_loss": -5.701807975769043, "global_step": 47986, "epoch": 1142} {"train_loss": -5.6656975746154785, "global_step": 47987, "epoch": 1142} {"train_loss": -5.753230094909668, "global_step": 47988, "epoch": 1142} {"train_loss": -5.76281213760376, "global_step": 47989, "epoch": 1142} {"train_loss": -5.75697135925293, "global_step": 47990, "epoch": 1142} {"train_loss": -5.738781929016113, "global_step": 47991, "epoch": 1142} {"train_loss": -5.750825881958008, "global_step": 47992, "epoch": 1142} {"train_loss": -5.780303955078125, "global_step": 47993, "epoch": 1142} {"train_loss": -5.718676567077637, "global_step": 47994, "epoch": 1142} {"train_loss": -5.867009162902832, "global_step": 47995, "epoch": 1142} {"train_loss": -5.73192024230957, "global_step": 47996, "epoch": 1142} {"train_loss": -5.750802993774414, "global_step": 47997, "epoch": 1142} {"train_loss": -5.791725158691406, "global_step": 47998, "epoch": 1142} {"train_loss": -5.827917098999023, "global_step": 47999, "epoch": 1142} {"train_loss": -5.854520797729492, "global_step": 48000, "epoch": 1142} {"train_loss": -5.7724289894104, "global_step": 48001, "epoch": 1142} {"train_loss": -5.86525821685791, "global_step": 48002, "epoch": 1142} {"train_loss": -5.6710662841796875, "global_step": 48003, "epoch": 1142} {"train_loss": -5.6890106201171875, "global_step": 48004, "epoch": 1142} {"train_loss": -5.743588878994896, "global_step": 48005, "epoch": 1142, "val_loss": 73938.2890625} {"train_loss": -5.848684787750244, "global_step": 48006, "epoch": 1143} {"train_loss": -5.758091926574707, "global_step": 48007, "epoch": 1143} {"train_loss": -5.680380821228027, "global_step": 48008, "epoch": 1143} {"train_loss": -5.773940086364746, "global_step": 48009, "epoch": 1143} {"train_loss": -5.535573959350586, "global_step": 48010, "epoch": 1143} {"train_loss": -5.651368618011475, "global_step": 48011, "epoch": 1143} {"train_loss": -5.644669532775879, "global_step": 48012, "epoch": 1143} {"train_loss": -5.649415493011475, "global_step": 48013, "epoch": 1143} {"train_loss": -5.67503547668457, "global_step": 48014, "epoch": 1143} {"train_loss": -5.640813827514648, "global_step": 48015, "epoch": 1143} {"train_loss": -5.519842147827148, "global_step": 48016, "epoch": 1143} {"train_loss": -5.7367024421691895, "global_step": 48017, "epoch": 1143} {"train_loss": -5.698533535003662, "global_step": 48018, "epoch": 1143} {"train_loss": -5.639615535736084, "global_step": 48019, "epoch": 1143} {"train_loss": -5.802680969238281, "global_step": 48020, "epoch": 1143} {"train_loss": -5.505018711090088, "global_step": 48021, "epoch": 1143} {"train_loss": -5.776192665100098, "global_step": 48022, "epoch": 1143} {"train_loss": -5.628083229064941, "global_step": 48023, "epoch": 1143} {"train_loss": -5.688712120056152, "global_step": 48024, "epoch": 1143} {"train_loss": -5.62436580657959, "global_step": 48025, "epoch": 1143} {"train_loss": -5.7695441246032715, "global_step": 48026, "epoch": 1143} {"train_loss": -5.6880292892456055, "global_step": 48027, "epoch": 1143} {"train_loss": -5.752090930938721, "global_step": 48028, "epoch": 1143} {"train_loss": -5.74567174911499, "global_step": 48029, "epoch": 1143} {"train_loss": -5.648266792297363, "global_step": 48030, "epoch": 1143} {"train_loss": -5.679531097412109, "global_step": 48031, "epoch": 1143} {"train_loss": -5.808614253997803, "global_step": 48032, "epoch": 1143} {"train_loss": -5.755146026611328, "global_step": 48033, "epoch": 1143} {"train_loss": -5.582092761993408, "global_step": 48034, "epoch": 1143} {"train_loss": -5.694341659545898, "global_step": 48035, "epoch": 1143} {"train_loss": -5.763049602508545, "global_step": 48036, "epoch": 1143} {"train_loss": -5.707635879516602, "global_step": 48037, "epoch": 1143} {"train_loss": -5.699491500854492, "global_step": 48038, "epoch": 1143} {"train_loss": -5.72578763961792, "global_step": 48039, "epoch": 1143} {"train_loss": -5.710920333862305, "global_step": 48040, "epoch": 1143} {"train_loss": -5.636477947235107, "global_step": 48041, "epoch": 1143} {"train_loss": -5.634615421295166, "global_step": 48042, "epoch": 1143} {"train_loss": -5.8588738441467285, "global_step": 48043, "epoch": 1143} {"train_loss": -5.6009931564331055, "global_step": 48044, "epoch": 1143} {"train_loss": -5.845978260040283, "global_step": 48045, "epoch": 1143} {"train_loss": -5.623204231262207, "global_step": 48046, "epoch": 1143} {"train_loss": -5.695291564578102, "global_step": 48047, "epoch": 1143, "val_loss": 74619.9375} {"train_loss": -5.674299716949463, "global_step": 48048, "epoch": 1144} {"train_loss": -5.737502098083496, "global_step": 48049, "epoch": 1144} {"train_loss": -5.742706298828125, "global_step": 48050, "epoch": 1144} {"train_loss": -5.483354568481445, "global_step": 48051, "epoch": 1144} {"train_loss": -5.623844146728516, "global_step": 48052, "epoch": 1144} {"train_loss": -5.697784423828125, "global_step": 48053, "epoch": 1144} {"train_loss": -5.688492774963379, "global_step": 48054, "epoch": 1144} {"train_loss": -5.872973442077637, "global_step": 48055, "epoch": 1144} {"train_loss": -5.711358070373535, "global_step": 48056, "epoch": 1144} {"train_loss": -5.679418563842773, "global_step": 48057, "epoch": 1144} {"train_loss": -5.805917739868164, "global_step": 48058, "epoch": 1144} {"train_loss": -5.736176490783691, "global_step": 48059, "epoch": 1144} {"train_loss": -5.660446643829346, "global_step": 48060, "epoch": 1144} {"train_loss": -5.780035972595215, "global_step": 48061, "epoch": 1144} {"train_loss": -5.787649154663086, "global_step": 48062, "epoch": 1144} {"train_loss": -5.727917194366455, "global_step": 48063, "epoch": 1144} {"train_loss": -5.71665096282959, "global_step": 48064, "epoch": 1144} {"train_loss": -5.663932800292969, "global_step": 48065, "epoch": 1144} {"train_loss": -5.798802852630615, "global_step": 48066, "epoch": 1144} {"train_loss": -5.859933853149414, "global_step": 48067, "epoch": 1144} {"train_loss": -5.712244987487793, "global_step": 48068, "epoch": 1144} {"train_loss": -5.676726341247559, "global_step": 48069, "epoch": 1144} {"train_loss": -5.634573936462402, "global_step": 48070, "epoch": 1144} {"train_loss": -5.817379474639893, "global_step": 48071, "epoch": 1144} {"train_loss": -5.745410919189453, "global_step": 48072, "epoch": 1144} {"train_loss": -5.810901641845703, "global_step": 48073, "epoch": 1144} {"train_loss": -5.8026933670043945, "global_step": 48074, "epoch": 1144} {"train_loss": -5.738933086395264, "global_step": 48075, "epoch": 1144} {"train_loss": -5.689629554748535, "global_step": 48076, "epoch": 1144} {"train_loss": -5.923471450805664, "global_step": 48077, "epoch": 1144} {"train_loss": -5.818533897399902, "global_step": 48078, "epoch": 1144} {"train_loss": -5.724517822265625, "global_step": 48079, "epoch": 1144} {"train_loss": -5.731433868408203, "global_step": 48080, "epoch": 1144} {"train_loss": -5.757837295532227, "global_step": 48081, "epoch": 1144} {"train_loss": -5.673198699951172, "global_step": 48082, "epoch": 1144} {"train_loss": -5.738016605377197, "global_step": 48083, "epoch": 1144} {"train_loss": -5.728924751281738, "global_step": 48084, "epoch": 1144} {"train_loss": -5.732125759124756, "global_step": 48085, "epoch": 1144} {"train_loss": -5.693507194519043, "global_step": 48086, "epoch": 1144} {"train_loss": -5.7845563888549805, "global_step": 48087, "epoch": 1144} {"train_loss": -5.643604278564453, "global_step": 48088, "epoch": 1144} {"train_loss": -5.732516016278948, "global_step": 48089, "epoch": 1144, "val_loss": 73998.875} {"train_loss": -5.834022521972656, "global_step": 48090, "epoch": 1145} {"train_loss": -5.7291436195373535, "global_step": 48091, "epoch": 1145} {"train_loss": -5.785170555114746, "global_step": 48092, "epoch": 1145} {"train_loss": -5.670360088348389, "global_step": 48093, "epoch": 1145} {"train_loss": -5.886350631713867, "global_step": 48094, "epoch": 1145} {"train_loss": -5.835821151733398, "global_step": 48095, "epoch": 1145} {"train_loss": -5.8325934410095215, "global_step": 48096, "epoch": 1145} {"train_loss": -5.66151237487793, "global_step": 48097, "epoch": 1145} {"train_loss": -5.686458587646484, "global_step": 48098, "epoch": 1145} {"train_loss": -5.761684417724609, "global_step": 48099, "epoch": 1145} {"train_loss": -5.671760559082031, "global_step": 48100, "epoch": 1145} {"train_loss": -5.768824577331543, "global_step": 48101, "epoch": 1145} {"train_loss": -5.907378196716309, "global_step": 48102, "epoch": 1145} {"train_loss": -5.846533298492432, "global_step": 48103, "epoch": 1145} {"train_loss": -5.7852373123168945, "global_step": 48104, "epoch": 1145} {"train_loss": -5.772039413452148, "global_step": 48105, "epoch": 1145} {"train_loss": -5.824183464050293, "global_step": 48106, "epoch": 1145} {"train_loss": -5.856377601623535, "global_step": 48107, "epoch": 1145} {"train_loss": -5.6976318359375, "global_step": 48108, "epoch": 1145} {"train_loss": -5.685495376586914, "global_step": 48109, "epoch": 1145} {"train_loss": -5.796034812927246, "global_step": 48110, "epoch": 1145} {"train_loss": -5.766207695007324, "global_step": 48111, "epoch": 1145} {"train_loss": -5.782473564147949, "global_step": 48112, "epoch": 1145} {"train_loss": -5.626611709594727, "global_step": 48113, "epoch": 1145} {"train_loss": -5.674538612365723, "global_step": 48114, "epoch": 1145} {"train_loss": -5.664895057678223, "global_step": 48115, "epoch": 1145} {"train_loss": -5.740729331970215, "global_step": 48116, "epoch": 1145} {"train_loss": -5.762247085571289, "global_step": 48117, "epoch": 1145} {"train_loss": -5.70158576965332, "global_step": 48118, "epoch": 1145} {"train_loss": -5.89630651473999, "global_step": 48119, "epoch": 1145} {"train_loss": -5.670689582824707, "global_step": 48120, "epoch": 1145} {"train_loss": -5.759244918823242, "global_step": 48121, "epoch": 1145} {"train_loss": -5.767164707183838, "global_step": 48122, "epoch": 1145} {"train_loss": -5.679956436157227, "global_step": 48123, "epoch": 1145} {"train_loss": -5.71616268157959, "global_step": 48124, "epoch": 1145} {"train_loss": -5.665827751159668, "global_step": 48125, "epoch": 1145} {"train_loss": -5.57889986038208, "global_step": 48126, "epoch": 1145} {"train_loss": -5.7386474609375, "global_step": 48127, "epoch": 1145} {"train_loss": -5.70448112487793, "global_step": 48128, "epoch": 1145} {"train_loss": -5.77344274520874, "global_step": 48129, "epoch": 1145} {"train_loss": -5.883929252624512, "global_step": 48130, "epoch": 1145} {"train_loss": -5.749877475556874, "global_step": 48131, "epoch": 1145, "val_loss": 74108.5} {"train_loss": -5.826471328735352, "global_step": 48132, "epoch": 1146} {"train_loss": -5.911039352416992, "global_step": 48133, "epoch": 1146} {"train_loss": -5.680878162384033, "global_step": 48134, "epoch": 1146} {"train_loss": -5.765868186950684, "global_step": 48135, "epoch": 1146} {"train_loss": -5.702566146850586, "global_step": 48136, "epoch": 1146} {"train_loss": -5.689266204833984, "global_step": 48137, "epoch": 1146} {"train_loss": -5.671298503875732, "global_step": 48138, "epoch": 1146} {"train_loss": -5.659463405609131, "global_step": 48139, "epoch": 1146} {"train_loss": -5.689291954040527, "global_step": 48140, "epoch": 1146} {"train_loss": -5.788434982299805, "global_step": 48141, "epoch": 1146} {"train_loss": -5.750988960266113, "global_step": 48142, "epoch": 1146} {"train_loss": -5.760426044464111, "global_step": 48143, "epoch": 1146} {"train_loss": -5.8036956787109375, "global_step": 48144, "epoch": 1146} {"train_loss": -5.84578800201416, "global_step": 48145, "epoch": 1146} {"train_loss": -5.696036338806152, "global_step": 48146, "epoch": 1146} {"train_loss": -5.654212474822998, "global_step": 48147, "epoch": 1146} {"train_loss": -5.7940592765808105, "global_step": 48148, "epoch": 1146} {"train_loss": -5.832306385040283, "global_step": 48149, "epoch": 1146} {"train_loss": -5.771744251251221, "global_step": 48150, "epoch": 1146} {"train_loss": -5.756087303161621, "global_step": 48151, "epoch": 1146} {"train_loss": -5.803770065307617, "global_step": 48152, "epoch": 1146} {"train_loss": -5.677276611328125, "global_step": 48153, "epoch": 1146} {"train_loss": -5.722419738769531, "global_step": 48154, "epoch": 1146} {"train_loss": -5.678947448730469, "global_step": 48155, "epoch": 1146} {"train_loss": -5.751175403594971, "global_step": 48156, "epoch": 1146} {"train_loss": -5.808107852935791, "global_step": 48157, "epoch": 1146} {"train_loss": -5.803426265716553, "global_step": 48158, "epoch": 1146} {"train_loss": -5.559930324554443, "global_step": 48159, "epoch": 1146} {"train_loss": -5.711634635925293, "global_step": 48160, "epoch": 1146} {"train_loss": -5.659338474273682, "global_step": 48161, "epoch": 1146} {"train_loss": -5.799389839172363, "global_step": 48162, "epoch": 1146} {"train_loss": -5.812108039855957, "global_step": 48163, "epoch": 1146} {"train_loss": -5.7656378746032715, "global_step": 48164, "epoch": 1146} {"train_loss": -5.748492240905762, "global_step": 48165, "epoch": 1146} {"train_loss": -5.750937461853027, "global_step": 48166, "epoch": 1146} {"train_loss": -5.743288516998291, "global_step": 48167, "epoch": 1146} {"train_loss": -5.754586696624756, "global_step": 48168, "epoch": 1146} {"train_loss": -5.736499786376953, "global_step": 48169, "epoch": 1146} {"train_loss": -5.805232048034668, "global_step": 48170, "epoch": 1146} {"train_loss": -5.662832260131836, "global_step": 48171, "epoch": 1146} {"train_loss": -5.771416664123535, "global_step": 48172, "epoch": 1146} {"train_loss": -5.747717301050822, "global_step": 48173, "epoch": 1146, "val_loss": 73952.703125} {"train_loss": -5.692753314971924, "global_step": 48174, "epoch": 1147} {"train_loss": -5.825039863586426, "global_step": 48175, "epoch": 1147} {"train_loss": -5.694248199462891, "global_step": 48176, "epoch": 1147} {"train_loss": -5.684350967407227, "global_step": 48177, "epoch": 1147} {"train_loss": -5.762599945068359, "global_step": 48178, "epoch": 1147} {"train_loss": -5.797507286071777, "global_step": 48179, "epoch": 1147} {"train_loss": -5.7811102867126465, "global_step": 48180, "epoch": 1147} {"train_loss": -5.786917686462402, "global_step": 48181, "epoch": 1147} {"train_loss": -5.846958160400391, "global_step": 48182, "epoch": 1147} {"train_loss": -5.911365032196045, "global_step": 48183, "epoch": 1147} {"train_loss": -5.6913909912109375, "global_step": 48184, "epoch": 1147} {"train_loss": -5.753877639770508, "global_step": 48185, "epoch": 1147} {"train_loss": -5.723043441772461, "global_step": 48186, "epoch": 1147} {"train_loss": -5.886394500732422, "global_step": 48187, "epoch": 1147} {"train_loss": -5.875658988952637, "global_step": 48188, "epoch": 1147} {"train_loss": -5.568921089172363, "global_step": 48189, "epoch": 1147} {"train_loss": -5.819166660308838, "global_step": 48190, "epoch": 1147} {"train_loss": -5.732697486877441, "global_step": 48191, "epoch": 1147} {"train_loss": -5.592252731323242, "global_step": 48192, "epoch": 1147} {"train_loss": -5.86011266708374, "global_step": 48193, "epoch": 1147} {"train_loss": -5.9055070877075195, "global_step": 48194, "epoch": 1147} {"train_loss": -5.663944721221924, "global_step": 48195, "epoch": 1147} {"train_loss": -5.6975932121276855, "global_step": 48196, "epoch": 1147} {"train_loss": -5.833522796630859, "global_step": 48197, "epoch": 1147} {"train_loss": -5.792402267456055, "global_step": 48198, "epoch": 1147} {"train_loss": -5.589258193969727, "global_step": 48199, "epoch": 1147} {"train_loss": -5.694103717803955, "global_step": 48200, "epoch": 1147} {"train_loss": -5.697700023651123, "global_step": 48201, "epoch": 1147} {"train_loss": -5.648228645324707, "global_step": 48202, "epoch": 1147} {"train_loss": -5.658580780029297, "global_step": 48203, "epoch": 1147} {"train_loss": -5.8940749168396, "global_step": 48204, "epoch": 1147} {"train_loss": -5.831564903259277, "global_step": 48205, "epoch": 1147} {"train_loss": -5.71547794342041, "global_step": 48206, "epoch": 1147} {"train_loss": -5.757862567901611, "global_step": 48207, "epoch": 1147} {"train_loss": -5.846487522125244, "global_step": 48208, "epoch": 1147} {"train_loss": -5.810519695281982, "global_step": 48209, "epoch": 1147} {"train_loss": -5.721362590789795, "global_step": 48210, "epoch": 1147} {"train_loss": -5.753464698791504, "global_step": 48211, "epoch": 1147} {"train_loss": -5.660935401916504, "global_step": 48212, "epoch": 1147} {"train_loss": -5.710381031036377, "global_step": 48213, "epoch": 1147} {"train_loss": -5.821046829223633, "global_step": 48214, "epoch": 1147} {"train_loss": -5.756912379037766, "global_step": 48215, "epoch": 1147, "val_loss": 74110.6875} {"train_loss": -5.711108207702637, "global_step": 48216, "epoch": 1148} {"train_loss": -5.790766716003418, "global_step": 48217, "epoch": 1148} {"train_loss": -5.836138725280762, "global_step": 48218, "epoch": 1148} {"train_loss": -5.854013442993164, "global_step": 48219, "epoch": 1148} {"train_loss": -5.751338005065918, "global_step": 48220, "epoch": 1148} {"train_loss": -5.7969841957092285, "global_step": 48221, "epoch": 1148} {"train_loss": -5.7400803565979, "global_step": 48222, "epoch": 1148} {"train_loss": -5.7243828773498535, "global_step": 48223, "epoch": 1148} {"train_loss": -5.621278762817383, "global_step": 48224, "epoch": 1148} {"train_loss": -5.837226390838623, "global_step": 48225, "epoch": 1148} {"train_loss": -5.676344871520996, "global_step": 48226, "epoch": 1148} {"train_loss": -5.670571327209473, "global_step": 48227, "epoch": 1148} {"train_loss": -5.803640365600586, "global_step": 48228, "epoch": 1148} {"train_loss": -5.7307891845703125, "global_step": 48229, "epoch": 1148} {"train_loss": -5.732128620147705, "global_step": 48230, "epoch": 1148} {"train_loss": -5.714439392089844, "global_step": 48231, "epoch": 1148} {"train_loss": -5.757923126220703, "global_step": 48232, "epoch": 1148} {"train_loss": -5.70067024230957, "global_step": 48233, "epoch": 1148} {"train_loss": -5.845104217529297, "global_step": 48234, "epoch": 1148} {"train_loss": -5.785989761352539, "global_step": 48235, "epoch": 1148} {"train_loss": -5.714720726013184, "global_step": 48236, "epoch": 1148} {"train_loss": -5.85990571975708, "global_step": 48237, "epoch": 1148} {"train_loss": -5.817607879638672, "global_step": 48238, "epoch": 1148} {"train_loss": -5.931999206542969, "global_step": 48239, "epoch": 1148} {"train_loss": -5.776978969573975, "global_step": 48240, "epoch": 1148} {"train_loss": -5.689059257507324, "global_step": 48241, "epoch": 1148} {"train_loss": -5.726593017578125, "global_step": 48242, "epoch": 1148} {"train_loss": -5.724832534790039, "global_step": 48243, "epoch": 1148} {"train_loss": -5.80529260635376, "global_step": 48244, "epoch": 1148} {"train_loss": -5.787934303283691, "global_step": 48245, "epoch": 1148} {"train_loss": -5.667741775512695, "global_step": 48246, "epoch": 1148} {"train_loss": -5.706371784210205, "global_step": 48247, "epoch": 1148} {"train_loss": -5.790751934051514, "global_step": 48248, "epoch": 1148} {"train_loss": -5.764299392700195, "global_step": 48249, "epoch": 1148} {"train_loss": -5.709573268890381, "global_step": 48250, "epoch": 1148} {"train_loss": -5.804910659790039, "global_step": 48251, "epoch": 1148} {"train_loss": -5.653055191040039, "global_step": 48252, "epoch": 1148} {"train_loss": -5.771806716918945, "global_step": 48253, "epoch": 1148} {"train_loss": -5.74702262878418, "global_step": 48254, "epoch": 1148} {"train_loss": -5.634415149688721, "global_step": 48255, "epoch": 1148} {"train_loss": -5.776996612548828, "global_step": 48256, "epoch": 1148} {"train_loss": -5.754473073141916, "global_step": 48257, "epoch": 1148, "val_loss": 73973.6953125} {"train_loss": -5.6847920417785645, "global_step": 48258, "epoch": 1149} {"train_loss": -5.799318313598633, "global_step": 48259, "epoch": 1149} {"train_loss": -5.682302474975586, "global_step": 48260, "epoch": 1149} {"train_loss": -5.677910804748535, "global_step": 48261, "epoch": 1149} {"train_loss": -5.833367824554443, "global_step": 48262, "epoch": 1149} {"train_loss": -5.788597106933594, "global_step": 48263, "epoch": 1149} {"train_loss": -5.736105442047119, "global_step": 48264, "epoch": 1149} {"train_loss": -5.623779773712158, "global_step": 48265, "epoch": 1149} {"train_loss": -5.867282867431641, "global_step": 48266, "epoch": 1149} {"train_loss": -5.804956436157227, "global_step": 48267, "epoch": 1149} {"train_loss": -5.730581283569336, "global_step": 48268, "epoch": 1149} {"train_loss": -5.857199192047119, "global_step": 48269, "epoch": 1149} {"train_loss": -5.75417423248291, "global_step": 48270, "epoch": 1149} {"train_loss": -5.7026801109313965, "global_step": 48271, "epoch": 1149} {"train_loss": -5.625420570373535, "global_step": 48272, "epoch": 1149} {"train_loss": -5.811737060546875, "global_step": 48273, "epoch": 1149} {"train_loss": -5.866690635681152, "global_step": 48274, "epoch": 1149} {"train_loss": -5.836604118347168, "global_step": 48275, "epoch": 1149} {"train_loss": -5.774071216583252, "global_step": 48276, "epoch": 1149} {"train_loss": -5.75437593460083, "global_step": 48277, "epoch": 1149} {"train_loss": -5.790688991546631, "global_step": 48278, "epoch": 1149} {"train_loss": -5.760899543762207, "global_step": 48279, "epoch": 1149} {"train_loss": -5.760575771331787, "global_step": 48280, "epoch": 1149} {"train_loss": -5.737262725830078, "global_step": 48281, "epoch": 1149} {"train_loss": -5.733613014221191, "global_step": 48282, "epoch": 1149} {"train_loss": -5.761866569519043, "global_step": 48283, "epoch": 1149} {"train_loss": -5.70088005065918, "global_step": 48284, "epoch": 1149} {"train_loss": -5.720614433288574, "global_step": 48285, "epoch": 1149} {"train_loss": -5.818472862243652, "global_step": 48286, "epoch": 1149} {"train_loss": -5.711757659912109, "global_step": 48287, "epoch": 1149} {"train_loss": -5.823616027832031, "global_step": 48288, "epoch": 1149} {"train_loss": -5.834344863891602, "global_step": 48289, "epoch": 1149} {"train_loss": -5.606564998626709, "global_step": 48290, "epoch": 1149} {"train_loss": -5.822963714599609, "global_step": 48291, "epoch": 1149} {"train_loss": -5.672628402709961, "global_step": 48292, "epoch": 1149} {"train_loss": -5.802566051483154, "global_step": 48293, "epoch": 1149} {"train_loss": -5.880105972290039, "global_step": 48294, "epoch": 1149} {"train_loss": -5.715347766876221, "global_step": 48295, "epoch": 1149} {"train_loss": -5.696771621704102, "global_step": 48296, "epoch": 1149} {"train_loss": -5.7833147048950195, "global_step": 48297, "epoch": 1149} {"train_loss": -5.774236679077148, "global_step": 48298, "epoch": 1149} {"train_loss": -5.757231666928246, "global_step": 48299, "epoch": 1149, "val_loss": 74091.671875} {"train_loss": -5.871378421783447, "global_step": 48300, "epoch": 1150} {"train_loss": -5.781180381774902, "global_step": 48301, "epoch": 1150} {"train_loss": -5.718705177307129, "global_step": 48302, "epoch": 1150} {"train_loss": -5.788205146789551, "global_step": 48303, "epoch": 1150} {"train_loss": -5.817634582519531, "global_step": 48304, "epoch": 1150} {"train_loss": -5.658251762390137, "global_step": 48305, "epoch": 1150} {"train_loss": -5.938904762268066, "global_step": 48306, "epoch": 1150} {"train_loss": -5.832059860229492, "global_step": 48307, "epoch": 1150} {"train_loss": -5.7164788246154785, "global_step": 48308, "epoch": 1150} {"train_loss": -5.774209976196289, "global_step": 48309, "epoch": 1150} {"train_loss": -5.790410995483398, "global_step": 48310, "epoch": 1150} {"train_loss": -5.743873119354248, "global_step": 48311, "epoch": 1150} {"train_loss": -5.670048713684082, "global_step": 48312, "epoch": 1150} {"train_loss": -5.696519374847412, "global_step": 48313, "epoch": 1150} {"train_loss": -5.540474891662598, "global_step": 48314, "epoch": 1150} {"train_loss": -5.823375225067139, "global_step": 48315, "epoch": 1150} {"train_loss": -5.579479217529297, "global_step": 48316, "epoch": 1150} {"train_loss": -5.603214263916016, "global_step": 48317, "epoch": 1150} {"train_loss": -5.628210067749023, "global_step": 48318, "epoch": 1150} {"train_loss": -5.6008501052856445, "global_step": 48319, "epoch": 1150} {"train_loss": -5.81484317779541, "global_step": 48320, "epoch": 1150} {"train_loss": -5.549769401550293, "global_step": 48321, "epoch": 1150} {"train_loss": -5.733702659606934, "global_step": 48322, "epoch": 1150} {"train_loss": -5.668515205383301, "global_step": 48323, "epoch": 1150} {"train_loss": -5.607067108154297, "global_step": 48324, "epoch": 1150} {"train_loss": -5.66873836517334, "global_step": 48325, "epoch": 1150} {"train_loss": -5.687277317047119, "global_step": 48326, "epoch": 1150} {"train_loss": -5.590553283691406, "global_step": 48327, "epoch": 1150} {"train_loss": -5.609671115875244, "global_step": 48328, "epoch": 1150} {"train_loss": -5.696362495422363, "global_step": 48329, "epoch": 1150} {"train_loss": -5.708645820617676, "global_step": 48330, "epoch": 1150} {"train_loss": -5.6753034591674805, "global_step": 48331, "epoch": 1150} {"train_loss": -5.739569664001465, "global_step": 48332, "epoch": 1150} {"train_loss": -5.779318332672119, "global_step": 48333, "epoch": 1150} {"train_loss": -5.662112236022949, "global_step": 48334, "epoch": 1150} {"train_loss": -5.682682991027832, "global_step": 48335, "epoch": 1150} {"train_loss": -5.678855895996094, "global_step": 48336, "epoch": 1150} {"train_loss": -5.816034317016602, "global_step": 48337, "epoch": 1150} {"train_loss": -5.782033920288086, "global_step": 48338, "epoch": 1150} {"train_loss": -5.786120414733887, "global_step": 48339, "epoch": 1150} {"train_loss": -5.724562644958496, "global_step": 48340, "epoch": 1150} {"train_loss": -5.71486006464277, "global_step": 48341, "epoch": 1150, "train/sim_max_reward_0": 0.42534808261647833, "train/sim_max_reward_1": 0.5137263182924368, "train/sim_max_reward_2": 0.651655848978226, "train/sim_max_reward_3": 0.14823350728656523, "train/sim_max_reward_4": 0.8941425705641641, "train/sim_max_reward_5": 0.6888567830997004, "test/sim_max_reward_4500000": 0.6722720726819099, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8737420157303768, "test/sim_max_reward_4500003": 0.001967323988682413, "test/sim_max_reward_4500004": 0.0663961009827197, "test/sim_max_reward_4500005": 0.4956353249963348, "test/sim_max_reward_4500006": 0.8402542493688047, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.05364947033794582, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9267910625923509, "test/sim_max_reward_4500012": 0.8249434751724773, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.17984740546121233, "test/sim_max_reward_4500015": 0.8965022238556093, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0013415800251672392, "test/sim_max_reward_4500018": 0.23042005305833624, "test/sim_max_reward_4500019": 0.8748359270783361, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.6319392811655542, "test/sim_max_reward_4500022": 0.770460479401817, "test/sim_max_reward_4500023": 0.8575493078352681, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.10188516808467046, "test/sim_max_reward_4500027": 0.9781790553163385, "test/sim_max_reward_4500028": 0.23981034575554244, "test/sim_max_reward_4500029": 0.12889932229650397, "test/sim_max_reward_4500030": 0.8251560845590257, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04835742885081101, "test/sim_max_reward_4500033": 0.953375780751941, "test/sim_max_reward_4500034": 0.8022775685787614, "test/sim_max_reward_4500035": 0.9692752982956596, "test/sim_max_reward_4500036": 0.8868716483345256, "test/sim_max_reward_4500037": 0.8515939808768016, "test/sim_max_reward_4500038": 0.34433444520141565, "test/sim_max_reward_4500039": 0.7575770129894951, "test/sim_max_reward_4500040": 0.9206301811996546, "test/sim_max_reward_4500041": 0.4443580388082164, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.939120318505697, "test/sim_max_reward_4500044": 0.37189300025780436, "test/sim_max_reward_4500045": 0.44458718688468524, "test/sim_max_reward_4500046": 0.8752618682338787, "test/sim_max_reward_4500047": 0.6484003465505759, "test/sim_max_reward_4500048": 0.15300626517174504, "test/sim_max_reward_4500049": 0.9354558002126758, "train/mean_score": 0.5536605184729285, "test/mean_score": 0.45672795315027825, "val_loss": 73947.375} {"train_loss": -5.791961669921875, "global_step": 48342, "epoch": 1151} {"train_loss": -5.798471450805664, "global_step": 48343, "epoch": 1151} {"train_loss": -5.73938512802124, "global_step": 48344, "epoch": 1151} {"train_loss": -5.82258415222168, "global_step": 48345, "epoch": 1151} {"train_loss": -5.778367042541504, "global_step": 48346, "epoch": 1151} {"train_loss": -5.702400207519531, "global_step": 48347, "epoch": 1151} {"train_loss": -5.65003776550293, "global_step": 48348, "epoch": 1151} {"train_loss": -5.567394256591797, "global_step": 48349, "epoch": 1151} {"train_loss": -5.781339168548584, "global_step": 48350, "epoch": 1151} {"train_loss": -5.748709678649902, "global_step": 48351, "epoch": 1151} {"train_loss": -5.637399673461914, "global_step": 48352, "epoch": 1151} {"train_loss": -5.737848281860352, "global_step": 48353, "epoch": 1151} {"train_loss": -5.822354316711426, "global_step": 48354, "epoch": 1151} {"train_loss": -5.586081504821777, "global_step": 48355, "epoch": 1151} {"train_loss": -5.765152931213379, "global_step": 48356, "epoch": 1151} {"train_loss": -5.745358467102051, "global_step": 48357, "epoch": 1151} {"train_loss": -5.630122184753418, "global_step": 48358, "epoch": 1151} {"train_loss": -5.856660842895508, "global_step": 48359, "epoch": 1151} {"train_loss": -5.816190719604492, "global_step": 48360, "epoch": 1151} {"train_loss": -5.660511016845703, "global_step": 48361, "epoch": 1151} {"train_loss": -5.8274688720703125, "global_step": 48362, "epoch": 1151} {"train_loss": -5.67043399810791, "global_step": 48363, "epoch": 1151} {"train_loss": -5.721085548400879, "global_step": 48364, "epoch": 1151} {"train_loss": -5.5728254318237305, "global_step": 48365, "epoch": 1151} {"train_loss": -5.750911712646484, "global_step": 48366, "epoch": 1151} {"train_loss": -5.7836151123046875, "global_step": 48367, "epoch": 1151} {"train_loss": -5.670564651489258, "global_step": 48368, "epoch": 1151} {"train_loss": -5.827866554260254, "global_step": 48369, "epoch": 1151} {"train_loss": -5.749985694885254, "global_step": 48370, "epoch": 1151} {"train_loss": -5.735250473022461, "global_step": 48371, "epoch": 1151} {"train_loss": -5.680819511413574, "global_step": 48372, "epoch": 1151} {"train_loss": -5.734842300415039, "global_step": 48373, "epoch": 1151} {"train_loss": -5.724474906921387, "global_step": 48374, "epoch": 1151} {"train_loss": -5.7990546226501465, "global_step": 48375, "epoch": 1151} {"train_loss": -5.774170398712158, "global_step": 48376, "epoch": 1151} {"train_loss": -5.7224812507629395, "global_step": 48377, "epoch": 1151} {"train_loss": -5.709195137023926, "global_step": 48378, "epoch": 1151} {"train_loss": -5.725071907043457, "global_step": 48379, "epoch": 1151} {"train_loss": -5.717150688171387, "global_step": 48380, "epoch": 1151} {"train_loss": -5.796858787536621, "global_step": 48381, "epoch": 1151} {"train_loss": -5.707783222198486, "global_step": 48382, "epoch": 1151} {"train_loss": -5.736436287562053, "global_step": 48383, "epoch": 1151, "val_loss": 74046.8515625} {"train_loss": -5.630014419555664, "global_step": 48384, "epoch": 1152} {"train_loss": -5.750361442565918, "global_step": 48385, "epoch": 1152} {"train_loss": -5.692890167236328, "global_step": 48386, "epoch": 1152} {"train_loss": -5.724266052246094, "global_step": 48387, "epoch": 1152} {"train_loss": -5.6999406814575195, "global_step": 48388, "epoch": 1152} {"train_loss": -5.7692413330078125, "global_step": 48389, "epoch": 1152} {"train_loss": -5.604958534240723, "global_step": 48390, "epoch": 1152} {"train_loss": -5.885124683380127, "global_step": 48391, "epoch": 1152} {"train_loss": -5.784668445587158, "global_step": 48392, "epoch": 1152} {"train_loss": -5.691788196563721, "global_step": 48393, "epoch": 1152} {"train_loss": -5.5713300704956055, "global_step": 48394, "epoch": 1152} {"train_loss": -5.738781452178955, "global_step": 48395, "epoch": 1152} {"train_loss": -5.658883571624756, "global_step": 48396, "epoch": 1152} {"train_loss": -5.7678728103637695, "global_step": 48397, "epoch": 1152} {"train_loss": -5.630054950714111, "global_step": 48398, "epoch": 1152} {"train_loss": -5.833347797393799, "global_step": 48399, "epoch": 1152} {"train_loss": -5.874317646026611, "global_step": 48400, "epoch": 1152} {"train_loss": -5.733341217041016, "global_step": 48401, "epoch": 1152} {"train_loss": -5.633238315582275, "global_step": 48402, "epoch": 1152} {"train_loss": -5.674355506896973, "global_step": 48403, "epoch": 1152} {"train_loss": -5.678747177124023, "global_step": 48404, "epoch": 1152} {"train_loss": -5.828907012939453, "global_step": 48405, "epoch": 1152} {"train_loss": -5.69153356552124, "global_step": 48406, "epoch": 1152} {"train_loss": -5.813599586486816, "global_step": 48407, "epoch": 1152} {"train_loss": -5.748199462890625, "global_step": 48408, "epoch": 1152} {"train_loss": -5.592721939086914, "global_step": 48409, "epoch": 1152} {"train_loss": -5.821925163269043, "global_step": 48410, "epoch": 1152} {"train_loss": -5.706499099731445, "global_step": 48411, "epoch": 1152} {"train_loss": -5.783525466918945, "global_step": 48412, "epoch": 1152} {"train_loss": -5.7930402755737305, "global_step": 48413, "epoch": 1152} {"train_loss": -5.611810684204102, "global_step": 48414, "epoch": 1152} {"train_loss": -5.610317230224609, "global_step": 48415, "epoch": 1152} {"train_loss": -5.648262977600098, "global_step": 48416, "epoch": 1152} {"train_loss": -5.839139938354492, "global_step": 48417, "epoch": 1152} {"train_loss": -5.809853553771973, "global_step": 48418, "epoch": 1152} {"train_loss": -5.826882362365723, "global_step": 48419, "epoch": 1152} {"train_loss": -5.7536773681640625, "global_step": 48420, "epoch": 1152} {"train_loss": -5.766382217407227, "global_step": 48421, "epoch": 1152} {"train_loss": -5.846782207489014, "global_step": 48422, "epoch": 1152} {"train_loss": -5.800101280212402, "global_step": 48423, "epoch": 1152} {"train_loss": -5.952765464782715, "global_step": 48424, "epoch": 1152} {"train_loss": -5.7402559121449785, "global_step": 48425, "epoch": 1152, "val_loss": 73918.734375} {"train_loss": -5.808312892913818, "global_step": 48426, "epoch": 1153} {"train_loss": -5.769171714782715, "global_step": 48427, "epoch": 1153} {"train_loss": -5.867663383483887, "global_step": 48428, "epoch": 1153} {"train_loss": -5.740475654602051, "global_step": 48429, "epoch": 1153} {"train_loss": -5.736804962158203, "global_step": 48430, "epoch": 1153} {"train_loss": -5.72435998916626, "global_step": 48431, "epoch": 1153} {"train_loss": -5.728187561035156, "global_step": 48432, "epoch": 1153} {"train_loss": -5.610902309417725, "global_step": 48433, "epoch": 1153} {"train_loss": -5.704885959625244, "global_step": 48434, "epoch": 1153} {"train_loss": -5.763028621673584, "global_step": 48435, "epoch": 1153} {"train_loss": -5.6066436767578125, "global_step": 48436, "epoch": 1153} {"train_loss": -5.657751560211182, "global_step": 48437, "epoch": 1153} {"train_loss": -5.73488712310791, "global_step": 48438, "epoch": 1153} {"train_loss": -5.7547783851623535, "global_step": 48439, "epoch": 1153} {"train_loss": -5.67426872253418, "global_step": 48440, "epoch": 1153} {"train_loss": -5.835954666137695, "global_step": 48441, "epoch": 1153} {"train_loss": -5.708653926849365, "global_step": 48442, "epoch": 1153} {"train_loss": -5.694321632385254, "global_step": 48443, "epoch": 1153} {"train_loss": -5.800158500671387, "global_step": 48444, "epoch": 1153} {"train_loss": -5.727701187133789, "global_step": 48445, "epoch": 1153} {"train_loss": -5.799746513366699, "global_step": 48446, "epoch": 1153} {"train_loss": -5.767387390136719, "global_step": 48447, "epoch": 1153} {"train_loss": -5.772268772125244, "global_step": 48448, "epoch": 1153} {"train_loss": -5.8617753982543945, "global_step": 48449, "epoch": 1153} {"train_loss": -5.6436591148376465, "global_step": 48450, "epoch": 1153} {"train_loss": -5.632746696472168, "global_step": 48451, "epoch": 1153} {"train_loss": -5.806509017944336, "global_step": 48452, "epoch": 1153} {"train_loss": -5.710241317749023, "global_step": 48453, "epoch": 1153} {"train_loss": -5.804062366485596, "global_step": 48454, "epoch": 1153} {"train_loss": -5.831423759460449, "global_step": 48455, "epoch": 1153} {"train_loss": -5.695688247680664, "global_step": 48456, "epoch": 1153} {"train_loss": -5.526233673095703, "global_step": 48457, "epoch": 1153} {"train_loss": -5.764298439025879, "global_step": 48458, "epoch": 1153} {"train_loss": -5.867681980133057, "global_step": 48459, "epoch": 1153} {"train_loss": -5.7026448249816895, "global_step": 48460, "epoch": 1153} {"train_loss": -5.769853115081787, "global_step": 48461, "epoch": 1153} {"train_loss": -5.665606498718262, "global_step": 48462, "epoch": 1153} {"train_loss": -5.710317611694336, "global_step": 48463, "epoch": 1153} {"train_loss": -5.819080352783203, "global_step": 48464, "epoch": 1153} {"train_loss": -5.7433271408081055, "global_step": 48465, "epoch": 1153} {"train_loss": -5.7509684562683105, "global_step": 48466, "epoch": 1153} {"train_loss": -5.741127638589768, "global_step": 48467, "epoch": 1153, "val_loss": 74180.734375} {"train_loss": -5.767202854156494, "global_step": 48468, "epoch": 1154} {"train_loss": -5.849303245544434, "global_step": 48469, "epoch": 1154} {"train_loss": -5.850964546203613, "global_step": 48470, "epoch": 1154} {"train_loss": -5.615222930908203, "global_step": 48471, "epoch": 1154} {"train_loss": -5.772093772888184, "global_step": 48472, "epoch": 1154} {"train_loss": -5.732078552246094, "global_step": 48473, "epoch": 1154} {"train_loss": -5.694619178771973, "global_step": 48474, "epoch": 1154} {"train_loss": -5.820359230041504, "global_step": 48475, "epoch": 1154} {"train_loss": -5.740973472595215, "global_step": 48476, "epoch": 1154} {"train_loss": -5.761059761047363, "global_step": 48477, "epoch": 1154} {"train_loss": -5.83329439163208, "global_step": 48478, "epoch": 1154} {"train_loss": -5.695297718048096, "global_step": 48479, "epoch": 1154} {"train_loss": -5.646083354949951, "global_step": 48480, "epoch": 1154} {"train_loss": -5.683946132659912, "global_step": 48481, "epoch": 1154} {"train_loss": -5.840065956115723, "global_step": 48482, "epoch": 1154} {"train_loss": -5.654079437255859, "global_step": 48483, "epoch": 1154} {"train_loss": -5.709478855133057, "global_step": 48484, "epoch": 1154} {"train_loss": -5.722569465637207, "global_step": 48485, "epoch": 1154} {"train_loss": -5.734462738037109, "global_step": 48486, "epoch": 1154} {"train_loss": -5.769187927246094, "global_step": 48487, "epoch": 1154} {"train_loss": -5.708120346069336, "global_step": 48488, "epoch": 1154} {"train_loss": -5.810967445373535, "global_step": 48489, "epoch": 1154} {"train_loss": -5.669370651245117, "global_step": 48490, "epoch": 1154} {"train_loss": -5.736100196838379, "global_step": 48491, "epoch": 1154} {"train_loss": -5.848300457000732, "global_step": 48492, "epoch": 1154} {"train_loss": -5.719897270202637, "global_step": 48493, "epoch": 1154} {"train_loss": -5.740799903869629, "global_step": 48494, "epoch": 1154} {"train_loss": -5.707036018371582, "global_step": 48495, "epoch": 1154} {"train_loss": -5.839757919311523, "global_step": 48496, "epoch": 1154} {"train_loss": -5.709451675415039, "global_step": 48497, "epoch": 1154} {"train_loss": -5.82228946685791, "global_step": 48498, "epoch": 1154} {"train_loss": -5.755512714385986, "global_step": 48499, "epoch": 1154} {"train_loss": -5.632465362548828, "global_step": 48500, "epoch": 1154} {"train_loss": -5.817450523376465, "global_step": 48501, "epoch": 1154} {"train_loss": -5.748238563537598, "global_step": 48502, "epoch": 1154} {"train_loss": -5.7812180519104, "global_step": 48503, "epoch": 1154} {"train_loss": -5.549790382385254, "global_step": 48504, "epoch": 1154} {"train_loss": -5.698335647583008, "global_step": 48505, "epoch": 1154} {"train_loss": -5.7432146072387695, "global_step": 48506, "epoch": 1154} {"train_loss": -5.6431169509887695, "global_step": 48507, "epoch": 1154} {"train_loss": -5.704720497131348, "global_step": 48508, "epoch": 1154} {"train_loss": -5.739666643596831, "global_step": 48509, "epoch": 1154, "val_loss": 74221.1640625} {"train_loss": -5.746030807495117, "global_step": 48510, "epoch": 1155} {"train_loss": -5.787875175476074, "global_step": 48511, "epoch": 1155} {"train_loss": -5.764425277709961, "global_step": 48512, "epoch": 1155} {"train_loss": -5.764065265655518, "global_step": 48513, "epoch": 1155} {"train_loss": -5.763000011444092, "global_step": 48514, "epoch": 1155} {"train_loss": -5.690534591674805, "global_step": 48515, "epoch": 1155} {"train_loss": -5.817609786987305, "global_step": 48516, "epoch": 1155} {"train_loss": -5.626610279083252, "global_step": 48517, "epoch": 1155} {"train_loss": -5.63902473449707, "global_step": 48518, "epoch": 1155} {"train_loss": -5.756625175476074, "global_step": 48519, "epoch": 1155} {"train_loss": -5.730709075927734, "global_step": 48520, "epoch": 1155} {"train_loss": -5.79592227935791, "global_step": 48521, "epoch": 1155} {"train_loss": -5.752530097961426, "global_step": 48522, "epoch": 1155} {"train_loss": -5.7498860359191895, "global_step": 48523, "epoch": 1155} {"train_loss": -5.65341854095459, "global_step": 48524, "epoch": 1155} {"train_loss": -5.712060928344727, "global_step": 48525, "epoch": 1155} {"train_loss": -5.779172897338867, "global_step": 48526, "epoch": 1155} {"train_loss": -5.720804691314697, "global_step": 48527, "epoch": 1155} {"train_loss": -5.7685675621032715, "global_step": 48528, "epoch": 1155} {"train_loss": -5.751095771789551, "global_step": 48529, "epoch": 1155} {"train_loss": -5.880784511566162, "global_step": 48530, "epoch": 1155} {"train_loss": -5.8164873123168945, "global_step": 48531, "epoch": 1155} {"train_loss": -5.6236371994018555, "global_step": 48532, "epoch": 1155} {"train_loss": -5.838519096374512, "global_step": 48533, "epoch": 1155} {"train_loss": -5.764050006866455, "global_step": 48534, "epoch": 1155} {"train_loss": -5.705951690673828, "global_step": 48535, "epoch": 1155} {"train_loss": -5.785632133483887, "global_step": 48536, "epoch": 1155} {"train_loss": -5.793756484985352, "global_step": 48537, "epoch": 1155} {"train_loss": -5.7094573974609375, "global_step": 48538, "epoch": 1155} {"train_loss": -5.710175514221191, "global_step": 48539, "epoch": 1155} {"train_loss": -5.7697649002075195, "global_step": 48540, "epoch": 1155} {"train_loss": -5.874639511108398, "global_step": 48541, "epoch": 1155} {"train_loss": -5.836113929748535, "global_step": 48542, "epoch": 1155} {"train_loss": -5.744383811950684, "global_step": 48543, "epoch": 1155} {"train_loss": -5.799777984619141, "global_step": 48544, "epoch": 1155} {"train_loss": -5.799710273742676, "global_step": 48545, "epoch": 1155} {"train_loss": -5.655303001403809, "global_step": 48546, "epoch": 1155} {"train_loss": -5.579022407531738, "global_step": 48547, "epoch": 1155} {"train_loss": -5.758601665496826, "global_step": 48548, "epoch": 1155} {"train_loss": -5.575756072998047, "global_step": 48549, "epoch": 1155} {"train_loss": -5.62310791015625, "global_step": 48550, "epoch": 1155} {"train_loss": -5.740002904619489, "global_step": 48551, "epoch": 1155, "val_loss": 74455.5078125} {"train_loss": -5.6903557777404785, "global_step": 48552, "epoch": 1156} {"train_loss": -5.759547710418701, "global_step": 48553, "epoch": 1156} {"train_loss": -5.644768714904785, "global_step": 48554, "epoch": 1156} {"train_loss": -5.7845048904418945, "global_step": 48555, "epoch": 1156} {"train_loss": -5.632460594177246, "global_step": 48556, "epoch": 1156} {"train_loss": -5.7366533279418945, "global_step": 48557, "epoch": 1156} {"train_loss": -5.645997047424316, "global_step": 48558, "epoch": 1156} {"train_loss": -5.681063175201416, "global_step": 48559, "epoch": 1156} {"train_loss": -5.852112770080566, "global_step": 48560, "epoch": 1156} {"train_loss": -5.705129146575928, "global_step": 48561, "epoch": 1156} {"train_loss": -5.763119697570801, "global_step": 48562, "epoch": 1156} {"train_loss": -5.790996551513672, "global_step": 48563, "epoch": 1156} {"train_loss": -5.873720169067383, "global_step": 48564, "epoch": 1156} {"train_loss": -5.75506067276001, "global_step": 48565, "epoch": 1156} {"train_loss": -5.795441627502441, "global_step": 48566, "epoch": 1156} {"train_loss": -5.790876388549805, "global_step": 48567, "epoch": 1156} {"train_loss": -5.727070331573486, "global_step": 48568, "epoch": 1156} {"train_loss": -5.8074541091918945, "global_step": 48569, "epoch": 1156} {"train_loss": -5.688024520874023, "global_step": 48570, "epoch": 1156} {"train_loss": -5.788804531097412, "global_step": 48571, "epoch": 1156} {"train_loss": -5.712554454803467, "global_step": 48572, "epoch": 1156} {"train_loss": -5.726870536804199, "global_step": 48573, "epoch": 1156} {"train_loss": -5.647101402282715, "global_step": 48574, "epoch": 1156} {"train_loss": -5.711976051330566, "global_step": 48575, "epoch": 1156} {"train_loss": -5.639441013336182, "global_step": 48576, "epoch": 1156} {"train_loss": -5.7268853187561035, "global_step": 48577, "epoch": 1156} {"train_loss": -5.737614631652832, "global_step": 48578, "epoch": 1156} {"train_loss": -5.658684253692627, "global_step": 48579, "epoch": 1156} {"train_loss": -5.7789106369018555, "global_step": 48580, "epoch": 1156} {"train_loss": -5.743330001831055, "global_step": 48581, "epoch": 1156} {"train_loss": -5.508856773376465, "global_step": 48582, "epoch": 1156} {"train_loss": -5.683895587921143, "global_step": 48583, "epoch": 1156} {"train_loss": -5.815347671508789, "global_step": 48584, "epoch": 1156} {"train_loss": -5.647245407104492, "global_step": 48585, "epoch": 1156} {"train_loss": -5.754314422607422, "global_step": 48586, "epoch": 1156} {"train_loss": -5.799551010131836, "global_step": 48587, "epoch": 1156} {"train_loss": -5.791024208068848, "global_step": 48588, "epoch": 1156} {"train_loss": -5.659513473510742, "global_step": 48589, "epoch": 1156} {"train_loss": -5.7942376136779785, "global_step": 48590, "epoch": 1156} {"train_loss": -5.666057586669922, "global_step": 48591, "epoch": 1156} {"train_loss": -5.671365737915039, "global_step": 48592, "epoch": 1156} {"train_loss": -5.726018496922085, "global_step": 48593, "epoch": 1156, "val_loss": 74261.328125} {"train_loss": -5.621846675872803, "global_step": 48594, "epoch": 1157} {"train_loss": -5.863093376159668, "global_step": 48595, "epoch": 1157} {"train_loss": -5.724224090576172, "global_step": 48596, "epoch": 1157} {"train_loss": -5.722475051879883, "global_step": 48597, "epoch": 1157} {"train_loss": -5.766301155090332, "global_step": 48598, "epoch": 1157} {"train_loss": -5.614007949829102, "global_step": 48599, "epoch": 1157} {"train_loss": -5.6937994956970215, "global_step": 48600, "epoch": 1157} {"train_loss": -5.629264831542969, "global_step": 48601, "epoch": 1157} {"train_loss": -5.741752624511719, "global_step": 48602, "epoch": 1157} {"train_loss": -5.663755416870117, "global_step": 48603, "epoch": 1157} {"train_loss": -5.636748790740967, "global_step": 48604, "epoch": 1157} {"train_loss": -5.691824913024902, "global_step": 48605, "epoch": 1157} {"train_loss": -5.733640670776367, "global_step": 48606, "epoch": 1157} {"train_loss": -5.684876441955566, "global_step": 48607, "epoch": 1157} {"train_loss": -5.670382976531982, "global_step": 48608, "epoch": 1157} {"train_loss": -5.765885829925537, "global_step": 48609, "epoch": 1157} {"train_loss": -5.675995826721191, "global_step": 48610, "epoch": 1157} {"train_loss": -5.752187728881836, "global_step": 48611, "epoch": 1157} {"train_loss": -5.6238298416137695, "global_step": 48612, "epoch": 1157} {"train_loss": -5.738408088684082, "global_step": 48613, "epoch": 1157} {"train_loss": -5.760909080505371, "global_step": 48614, "epoch": 1157} {"train_loss": -5.75432014465332, "global_step": 48615, "epoch": 1157} {"train_loss": -5.685502052307129, "global_step": 48616, "epoch": 1157} {"train_loss": -5.787293434143066, "global_step": 48617, "epoch": 1157} {"train_loss": -5.679376602172852, "global_step": 48618, "epoch": 1157} {"train_loss": -5.885543346405029, "global_step": 48619, "epoch": 1157} {"train_loss": -5.679571151733398, "global_step": 48620, "epoch": 1157} {"train_loss": -5.771895408630371, "global_step": 48621, "epoch": 1157} {"train_loss": -5.708773136138916, "global_step": 48622, "epoch": 1157} {"train_loss": -5.6904449462890625, "global_step": 48623, "epoch": 1157} {"train_loss": -5.830255031585693, "global_step": 48624, "epoch": 1157} {"train_loss": -5.663666725158691, "global_step": 48625, "epoch": 1157} {"train_loss": -5.693727493286133, "global_step": 48626, "epoch": 1157} {"train_loss": -5.682254314422607, "global_step": 48627, "epoch": 1157} {"train_loss": -5.640745162963867, "global_step": 48628, "epoch": 1157} {"train_loss": -5.634041786193848, "global_step": 48629, "epoch": 1157} {"train_loss": -5.755667686462402, "global_step": 48630, "epoch": 1157} {"train_loss": -5.754917144775391, "global_step": 48631, "epoch": 1157} {"train_loss": -5.847667694091797, "global_step": 48632, "epoch": 1157} {"train_loss": -5.742283344268799, "global_step": 48633, "epoch": 1157} {"train_loss": -5.785196304321289, "global_step": 48634, "epoch": 1157} {"train_loss": -5.720550752821422, "global_step": 48635, "epoch": 1157, "val_loss": 74063.484375} {"train_loss": -5.740736484527588, "global_step": 48636, "epoch": 1158} {"train_loss": -5.768728733062744, "global_step": 48637, "epoch": 1158} {"train_loss": -5.552820205688477, "global_step": 48638, "epoch": 1158} {"train_loss": -5.780290126800537, "global_step": 48639, "epoch": 1158} {"train_loss": -5.796932220458984, "global_step": 48640, "epoch": 1158} {"train_loss": -5.82286262512207, "global_step": 48641, "epoch": 1158} {"train_loss": -5.795380592346191, "global_step": 48642, "epoch": 1158} {"train_loss": -5.701700210571289, "global_step": 48643, "epoch": 1158} {"train_loss": -5.769373893737793, "global_step": 48644, "epoch": 1158} {"train_loss": -5.636361122131348, "global_step": 48645, "epoch": 1158} {"train_loss": -5.791294097900391, "global_step": 48646, "epoch": 1158} {"train_loss": -5.799864768981934, "global_step": 48647, "epoch": 1158} {"train_loss": -5.78715705871582, "global_step": 48648, "epoch": 1158} {"train_loss": -5.735207557678223, "global_step": 48649, "epoch": 1158} {"train_loss": -5.665999412536621, "global_step": 48650, "epoch": 1158} {"train_loss": -5.621462821960449, "global_step": 48651, "epoch": 1158} {"train_loss": -5.75093936920166, "global_step": 48652, "epoch": 1158} {"train_loss": -5.887787818908691, "global_step": 48653, "epoch": 1158} {"train_loss": -5.6428141593933105, "global_step": 48654, "epoch": 1158} {"train_loss": -5.607067108154297, "global_step": 48655, "epoch": 1158} {"train_loss": -5.677968978881836, "global_step": 48656, "epoch": 1158} {"train_loss": -5.7058820724487305, "global_step": 48657, "epoch": 1158} {"train_loss": -5.789490699768066, "global_step": 48658, "epoch": 1158} {"train_loss": -5.7510600090026855, "global_step": 48659, "epoch": 1158} {"train_loss": -5.8350934982299805, "global_step": 48660, "epoch": 1158} {"train_loss": -5.846043586730957, "global_step": 48661, "epoch": 1158} {"train_loss": -5.755724906921387, "global_step": 48662, "epoch": 1158} {"train_loss": -5.766034126281738, "global_step": 48663, "epoch": 1158} {"train_loss": -5.562798023223877, "global_step": 48664, "epoch": 1158} {"train_loss": -5.815957069396973, "global_step": 48665, "epoch": 1158} {"train_loss": -5.760331630706787, "global_step": 48666, "epoch": 1158} {"train_loss": -5.7616472244262695, "global_step": 48667, "epoch": 1158} {"train_loss": -5.755092144012451, "global_step": 48668, "epoch": 1158} {"train_loss": -5.712085723876953, "global_step": 48669, "epoch": 1158} {"train_loss": -5.83219051361084, "global_step": 48670, "epoch": 1158} {"train_loss": -5.567196369171143, "global_step": 48671, "epoch": 1158} {"train_loss": -5.800286293029785, "global_step": 48672, "epoch": 1158} {"train_loss": -5.757147789001465, "global_step": 48673, "epoch": 1158} {"train_loss": -5.815039157867432, "global_step": 48674, "epoch": 1158} {"train_loss": -5.684010028839111, "global_step": 48675, "epoch": 1158} {"train_loss": -5.617115020751953, "global_step": 48676, "epoch": 1158} {"train_loss": -5.737087340581985, "global_step": 48677, "epoch": 1158, "val_loss": 73981.3359375} {"train_loss": -5.703597068786621, "global_step": 48678, "epoch": 1159} {"train_loss": -5.710901260375977, "global_step": 48679, "epoch": 1159} {"train_loss": -5.793376922607422, "global_step": 48680, "epoch": 1159} {"train_loss": -5.64539909362793, "global_step": 48681, "epoch": 1159} {"train_loss": -5.739261627197266, "global_step": 48682, "epoch": 1159} {"train_loss": -5.684811115264893, "global_step": 48683, "epoch": 1159} {"train_loss": -5.79782772064209, "global_step": 48684, "epoch": 1159} {"train_loss": -5.702780723571777, "global_step": 48685, "epoch": 1159} {"train_loss": -5.812290668487549, "global_step": 48686, "epoch": 1159} {"train_loss": -5.847480773925781, "global_step": 48687, "epoch": 1159} {"train_loss": -5.712429523468018, "global_step": 48688, "epoch": 1159} {"train_loss": -5.882565498352051, "global_step": 48689, "epoch": 1159} {"train_loss": -5.71618127822876, "global_step": 48690, "epoch": 1159} {"train_loss": -5.629753589630127, "global_step": 48691, "epoch": 1159} {"train_loss": -5.750480651855469, "global_step": 48692, "epoch": 1159} {"train_loss": -5.657843112945557, "global_step": 48693, "epoch": 1159} {"train_loss": -5.810516357421875, "global_step": 48694, "epoch": 1159} {"train_loss": -5.729623794555664, "global_step": 48695, "epoch": 1159} {"train_loss": -5.630524158477783, "global_step": 48696, "epoch": 1159} {"train_loss": -5.762401580810547, "global_step": 48697, "epoch": 1159} {"train_loss": -5.814061641693115, "global_step": 48698, "epoch": 1159} {"train_loss": -5.701817989349365, "global_step": 48699, "epoch": 1159} {"train_loss": -5.724863052368164, "global_step": 48700, "epoch": 1159} {"train_loss": -5.701437950134277, "global_step": 48701, "epoch": 1159} {"train_loss": -5.714025497436523, "global_step": 48702, "epoch": 1159} {"train_loss": -5.789582252502441, "global_step": 48703, "epoch": 1159} {"train_loss": -5.757769584655762, "global_step": 48704, "epoch": 1159} {"train_loss": -5.850330352783203, "global_step": 48705, "epoch": 1159} {"train_loss": -5.679778099060059, "global_step": 48706, "epoch": 1159} {"train_loss": -5.737912178039551, "global_step": 48707, "epoch": 1159} {"train_loss": -5.779318809509277, "global_step": 48708, "epoch": 1159} {"train_loss": -5.561391830444336, "global_step": 48709, "epoch": 1159} {"train_loss": -5.81124210357666, "global_step": 48710, "epoch": 1159} {"train_loss": -5.775570392608643, "global_step": 48711, "epoch": 1159} {"train_loss": -5.8380208015441895, "global_step": 48712, "epoch": 1159} {"train_loss": -5.69971227645874, "global_step": 48713, "epoch": 1159} {"train_loss": -5.816481590270996, "global_step": 48714, "epoch": 1159} {"train_loss": -5.745250701904297, "global_step": 48715, "epoch": 1159} {"train_loss": -5.811517715454102, "global_step": 48716, "epoch": 1159} {"train_loss": -5.879763603210449, "global_step": 48717, "epoch": 1159} {"train_loss": -5.811682224273682, "global_step": 48718, "epoch": 1159} {"train_loss": -5.749440181823004, "global_step": 48719, "epoch": 1159, "val_loss": 74148.0390625} {"train_loss": -5.673007965087891, "global_step": 48720, "epoch": 1160} {"train_loss": -5.734784126281738, "global_step": 48721, "epoch": 1160} {"train_loss": -5.725109100341797, "global_step": 48722, "epoch": 1160} {"train_loss": -5.907543659210205, "global_step": 48723, "epoch": 1160} {"train_loss": -5.581204891204834, "global_step": 48724, "epoch": 1160} {"train_loss": -5.748879432678223, "global_step": 48725, "epoch": 1160} {"train_loss": -5.759255409240723, "global_step": 48726, "epoch": 1160} {"train_loss": -5.753284454345703, "global_step": 48727, "epoch": 1160} {"train_loss": -5.7600178718566895, "global_step": 48728, "epoch": 1160} {"train_loss": -5.835223197937012, "global_step": 48729, "epoch": 1160} {"train_loss": -5.738512992858887, "global_step": 48730, "epoch": 1160} {"train_loss": -5.690245151519775, "global_step": 48731, "epoch": 1160} {"train_loss": -5.830864429473877, "global_step": 48732, "epoch": 1160} {"train_loss": -5.605428695678711, "global_step": 48733, "epoch": 1160} {"train_loss": -5.868393421173096, "global_step": 48734, "epoch": 1160} {"train_loss": -5.754060745239258, "global_step": 48735, "epoch": 1160} {"train_loss": -5.775789260864258, "global_step": 48736, "epoch": 1160} {"train_loss": -5.785472869873047, "global_step": 48737, "epoch": 1160} {"train_loss": -5.835185527801514, "global_step": 48738, "epoch": 1160} {"train_loss": -5.678280353546143, "global_step": 48739, "epoch": 1160} {"train_loss": -5.794319152832031, "global_step": 48740, "epoch": 1160} {"train_loss": -5.706969261169434, "global_step": 48741, "epoch": 1160} {"train_loss": -5.949071884155273, "global_step": 48742, "epoch": 1160} {"train_loss": -5.801146030426025, "global_step": 48743, "epoch": 1160} {"train_loss": -5.798386096954346, "global_step": 48744, "epoch": 1160} {"train_loss": -5.831547737121582, "global_step": 48745, "epoch": 1160} {"train_loss": -5.797616958618164, "global_step": 48746, "epoch": 1160} {"train_loss": -5.660457134246826, "global_step": 48747, "epoch": 1160} {"train_loss": -5.730625152587891, "global_step": 48748, "epoch": 1160} {"train_loss": -5.7422685623168945, "global_step": 48749, "epoch": 1160} {"train_loss": -5.563255786895752, "global_step": 48750, "epoch": 1160} {"train_loss": -5.719359397888184, "global_step": 48751, "epoch": 1160} {"train_loss": -5.778664588928223, "global_step": 48752, "epoch": 1160} {"train_loss": -5.808078765869141, "global_step": 48753, "epoch": 1160} {"train_loss": -5.77300500869751, "global_step": 48754, "epoch": 1160} {"train_loss": -5.807063579559326, "global_step": 48755, "epoch": 1160} {"train_loss": -5.745694160461426, "global_step": 48756, "epoch": 1160} {"train_loss": -5.855913162231445, "global_step": 48757, "epoch": 1160} {"train_loss": -5.713962554931641, "global_step": 48758, "epoch": 1160} {"train_loss": -5.802707672119141, "global_step": 48759, "epoch": 1160} {"train_loss": -5.756943702697754, "global_step": 48760, "epoch": 1160} {"train_loss": -5.760023991266887, "global_step": 48761, "epoch": 1160, "val_loss": 73951.3125} {"train_loss": -5.771415710449219, "global_step": 48762, "epoch": 1161} {"train_loss": -5.72544002532959, "global_step": 48763, "epoch": 1161} {"train_loss": -5.711538314819336, "global_step": 48764, "epoch": 1161} {"train_loss": -5.881982803344727, "global_step": 48765, "epoch": 1161} {"train_loss": -5.810975551605225, "global_step": 48766, "epoch": 1161} {"train_loss": -5.760744094848633, "global_step": 48767, "epoch": 1161} {"train_loss": -5.729867935180664, "global_step": 48768, "epoch": 1161} {"train_loss": -5.855568885803223, "global_step": 48769, "epoch": 1161} {"train_loss": -5.656407356262207, "global_step": 48770, "epoch": 1161} {"train_loss": -5.700167655944824, "global_step": 48771, "epoch": 1161} {"train_loss": -5.751692295074463, "global_step": 48772, "epoch": 1161} {"train_loss": -5.78861665725708, "global_step": 48773, "epoch": 1161} {"train_loss": -5.865966796875, "global_step": 48774, "epoch": 1161} {"train_loss": -5.858346939086914, "global_step": 48775, "epoch": 1161} {"train_loss": -5.775694847106934, "global_step": 48776, "epoch": 1161} {"train_loss": -5.756109714508057, "global_step": 48777, "epoch": 1161} {"train_loss": -5.693758010864258, "global_step": 48778, "epoch": 1161} {"train_loss": -5.578709602355957, "global_step": 48779, "epoch": 1161} {"train_loss": -5.75200080871582, "global_step": 48780, "epoch": 1161} {"train_loss": -5.810196876525879, "global_step": 48781, "epoch": 1161} {"train_loss": -5.732569694519043, "global_step": 48782, "epoch": 1161} {"train_loss": -5.749273300170898, "global_step": 48783, "epoch": 1161} {"train_loss": -5.777792930603027, "global_step": 48784, "epoch": 1161} {"train_loss": -5.747433185577393, "global_step": 48785, "epoch": 1161} {"train_loss": -5.687756061553955, "global_step": 48786, "epoch": 1161} {"train_loss": -5.7662858963012695, "global_step": 48787, "epoch": 1161} {"train_loss": -5.713860988616943, "global_step": 48788, "epoch": 1161} {"train_loss": -5.720829963684082, "global_step": 48789, "epoch": 1161} {"train_loss": -5.611842155456543, "global_step": 48790, "epoch": 1161} {"train_loss": -5.795036315917969, "global_step": 48791, "epoch": 1161} {"train_loss": -5.741499900817871, "global_step": 48792, "epoch": 1161} {"train_loss": -5.753571510314941, "global_step": 48793, "epoch": 1161} {"train_loss": -5.695215225219727, "global_step": 48794, "epoch": 1161} {"train_loss": -5.851295471191406, "global_step": 48795, "epoch": 1161} {"train_loss": -5.7930192947387695, "global_step": 48796, "epoch": 1161} {"train_loss": -5.735243320465088, "global_step": 48797, "epoch": 1161} {"train_loss": -5.761926651000977, "global_step": 48798, "epoch": 1161} {"train_loss": -5.812686920166016, "global_step": 48799, "epoch": 1161} {"train_loss": -5.6460041999816895, "global_step": 48800, "epoch": 1161} {"train_loss": -5.745698928833008, "global_step": 48801, "epoch": 1161} {"train_loss": -5.9052581787109375, "global_step": 48802, "epoch": 1161} {"train_loss": -5.759774968737648, "global_step": 48803, "epoch": 1161, "val_loss": 74334.25} {"train_loss": -5.72930908203125, "global_step": 48804, "epoch": 1162} {"train_loss": -5.752696514129639, "global_step": 48805, "epoch": 1162} {"train_loss": -5.691614151000977, "global_step": 48806, "epoch": 1162} {"train_loss": -5.72376823425293, "global_step": 48807, "epoch": 1162} {"train_loss": -5.733470439910889, "global_step": 48808, "epoch": 1162} {"train_loss": -5.6548075675964355, "global_step": 48809, "epoch": 1162} {"train_loss": -5.653130054473877, "global_step": 48810, "epoch": 1162} {"train_loss": -5.772421360015869, "global_step": 48811, "epoch": 1162} {"train_loss": -5.556580066680908, "global_step": 48812, "epoch": 1162} {"train_loss": -5.667068958282471, "global_step": 48813, "epoch": 1162} {"train_loss": -5.778658866882324, "global_step": 48814, "epoch": 1162} {"train_loss": -5.757311820983887, "global_step": 48815, "epoch": 1162} {"train_loss": -5.846896171569824, "global_step": 48816, "epoch": 1162} {"train_loss": -5.862118721008301, "global_step": 48817, "epoch": 1162} {"train_loss": -5.573911666870117, "global_step": 48818, "epoch": 1162} {"train_loss": -5.6955366134643555, "global_step": 48819, "epoch": 1162} {"train_loss": -5.710251808166504, "global_step": 48820, "epoch": 1162} {"train_loss": -5.546044826507568, "global_step": 48821, "epoch": 1162} {"train_loss": -5.702248573303223, "global_step": 48822, "epoch": 1162} {"train_loss": -5.803093433380127, "global_step": 48823, "epoch": 1162} {"train_loss": -5.622705936431885, "global_step": 48824, "epoch": 1162} {"train_loss": -5.768204689025879, "global_step": 48825, "epoch": 1162} {"train_loss": -5.800694465637207, "global_step": 48826, "epoch": 1162} {"train_loss": -5.810561656951904, "global_step": 48827, "epoch": 1162} {"train_loss": -5.831682205200195, "global_step": 48828, "epoch": 1162} {"train_loss": -5.791767120361328, "global_step": 48829, "epoch": 1162} {"train_loss": -5.675775527954102, "global_step": 48830, "epoch": 1162} {"train_loss": -5.730480194091797, "global_step": 48831, "epoch": 1162} {"train_loss": -5.612532615661621, "global_step": 48832, "epoch": 1162} {"train_loss": -5.865072250366211, "global_step": 48833, "epoch": 1162} {"train_loss": -5.8730363845825195, "global_step": 48834, "epoch": 1162} {"train_loss": -5.660938262939453, "global_step": 48835, "epoch": 1162} {"train_loss": -5.6275835037231445, "global_step": 48836, "epoch": 1162} {"train_loss": -5.80806303024292, "global_step": 48837, "epoch": 1162} {"train_loss": -5.7370476722717285, "global_step": 48838, "epoch": 1162} {"train_loss": -5.7971978187561035, "global_step": 48839, "epoch": 1162} {"train_loss": -5.736945629119873, "global_step": 48840, "epoch": 1162} {"train_loss": -5.681576728820801, "global_step": 48841, "epoch": 1162} {"train_loss": -5.662412643432617, "global_step": 48842, "epoch": 1162} {"train_loss": -5.802189826965332, "global_step": 48843, "epoch": 1162} {"train_loss": -5.704751968383789, "global_step": 48844, "epoch": 1162} {"train_loss": -5.729612702415103, "global_step": 48845, "epoch": 1162, "val_loss": 73741.3046875} {"train_loss": -5.77800178527832, "global_step": 48846, "epoch": 1163} {"train_loss": -5.869454383850098, "global_step": 48847, "epoch": 1163} {"train_loss": -5.908489227294922, "global_step": 48848, "epoch": 1163} {"train_loss": -5.829341888427734, "global_step": 48849, "epoch": 1163} {"train_loss": -5.736540794372559, "global_step": 48850, "epoch": 1163} {"train_loss": -5.8878583908081055, "global_step": 48851, "epoch": 1163} {"train_loss": -5.80695915222168, "global_step": 48852, "epoch": 1163} {"train_loss": -5.735751152038574, "global_step": 48853, "epoch": 1163} {"train_loss": -5.811755180358887, "global_step": 48854, "epoch": 1163} {"train_loss": -5.609957695007324, "global_step": 48855, "epoch": 1163} {"train_loss": -5.781580924987793, "global_step": 48856, "epoch": 1163} {"train_loss": -5.776181221008301, "global_step": 48857, "epoch": 1163} {"train_loss": -5.656926155090332, "global_step": 48858, "epoch": 1163} {"train_loss": -5.77872896194458, "global_step": 48859, "epoch": 1163} {"train_loss": -5.7369608879089355, "global_step": 48860, "epoch": 1163} {"train_loss": -5.738648414611816, "global_step": 48861, "epoch": 1163} {"train_loss": -5.757649898529053, "global_step": 48862, "epoch": 1163} {"train_loss": -5.762567043304443, "global_step": 48863, "epoch": 1163} {"train_loss": -5.750239372253418, "global_step": 48864, "epoch": 1163} {"train_loss": -5.64727258682251, "global_step": 48865, "epoch": 1163} {"train_loss": -5.557146072387695, "global_step": 48866, "epoch": 1163} {"train_loss": -5.624764442443848, "global_step": 48867, "epoch": 1163} {"train_loss": -5.704152584075928, "global_step": 48868, "epoch": 1163} {"train_loss": -5.705060005187988, "global_step": 48869, "epoch": 1163} {"train_loss": -5.688958644866943, "global_step": 48870, "epoch": 1163} {"train_loss": -5.667412757873535, "global_step": 48871, "epoch": 1163} {"train_loss": -5.735648155212402, "global_step": 48872, "epoch": 1163} {"train_loss": -5.734039783477783, "global_step": 48873, "epoch": 1163} {"train_loss": -5.777458667755127, "global_step": 48874, "epoch": 1163} {"train_loss": -5.678561210632324, "global_step": 48875, "epoch": 1163} {"train_loss": -5.691769123077393, "global_step": 48876, "epoch": 1163} {"train_loss": -5.899117469787598, "global_step": 48877, "epoch": 1163} {"train_loss": -5.755475044250488, "global_step": 48878, "epoch": 1163} {"train_loss": -5.663578987121582, "global_step": 48879, "epoch": 1163} {"train_loss": -5.7229743003845215, "global_step": 48880, "epoch": 1163} {"train_loss": -5.801163673400879, "global_step": 48881, "epoch": 1163} {"train_loss": -5.779201984405518, "global_step": 48882, "epoch": 1163} {"train_loss": -5.74191427230835, "global_step": 48883, "epoch": 1163} {"train_loss": -5.758959770202637, "global_step": 48884, "epoch": 1163} {"train_loss": -5.733147144317627, "global_step": 48885, "epoch": 1163} {"train_loss": -5.789504051208496, "global_step": 48886, "epoch": 1163} {"train_loss": -5.744128090994699, "global_step": 48887, "epoch": 1163, "val_loss": 73917.8125} {"train_loss": -5.840798854827881, "global_step": 48888, "epoch": 1164} {"train_loss": -5.789844512939453, "global_step": 48889, "epoch": 1164} {"train_loss": -5.881674766540527, "global_step": 48890, "epoch": 1164} {"train_loss": -5.727085113525391, "global_step": 48891, "epoch": 1164} {"train_loss": -5.83065128326416, "global_step": 48892, "epoch": 1164} {"train_loss": -5.878335475921631, "global_step": 48893, "epoch": 1164} {"train_loss": -5.820731163024902, "global_step": 48894, "epoch": 1164} {"train_loss": -5.773872375488281, "global_step": 48895, "epoch": 1164} {"train_loss": -5.688830375671387, "global_step": 48896, "epoch": 1164} {"train_loss": -5.653534889221191, "global_step": 48897, "epoch": 1164} {"train_loss": -5.884598731994629, "global_step": 48898, "epoch": 1164} {"train_loss": -5.682107925415039, "global_step": 48899, "epoch": 1164} {"train_loss": -5.755901336669922, "global_step": 48900, "epoch": 1164} {"train_loss": -5.6680192947387695, "global_step": 48901, "epoch": 1164} {"train_loss": -5.877391338348389, "global_step": 48902, "epoch": 1164} {"train_loss": -5.8236589431762695, "global_step": 48903, "epoch": 1164} {"train_loss": -5.733563423156738, "global_step": 48904, "epoch": 1164} {"train_loss": -5.77217960357666, "global_step": 48905, "epoch": 1164} {"train_loss": -5.756056785583496, "global_step": 48906, "epoch": 1164} {"train_loss": -5.623969554901123, "global_step": 48907, "epoch": 1164} {"train_loss": -5.7440185546875, "global_step": 48908, "epoch": 1164} {"train_loss": -5.620584964752197, "global_step": 48909, "epoch": 1164} {"train_loss": -5.735555171966553, "global_step": 48910, "epoch": 1164} {"train_loss": -5.761882781982422, "global_step": 48911, "epoch": 1164} {"train_loss": -5.721100330352783, "global_step": 48912, "epoch": 1164} {"train_loss": -5.718562126159668, "global_step": 48913, "epoch": 1164} {"train_loss": -5.758147239685059, "global_step": 48914, "epoch": 1164} {"train_loss": -5.853263854980469, "global_step": 48915, "epoch": 1164} {"train_loss": -5.767934322357178, "global_step": 48916, "epoch": 1164} {"train_loss": -5.771785736083984, "global_step": 48917, "epoch": 1164} {"train_loss": -5.853461265563965, "global_step": 48918, "epoch": 1164} {"train_loss": -5.724975109100342, "global_step": 48919, "epoch": 1164} {"train_loss": -5.840825080871582, "global_step": 48920, "epoch": 1164} {"train_loss": -5.6935834884643555, "global_step": 48921, "epoch": 1164} {"train_loss": -5.797040939331055, "global_step": 48922, "epoch": 1164} {"train_loss": -5.77651309967041, "global_step": 48923, "epoch": 1164} {"train_loss": -5.777005195617676, "global_step": 48924, "epoch": 1164} {"train_loss": -5.737714767456055, "global_step": 48925, "epoch": 1164} {"train_loss": -5.7722930908203125, "global_step": 48926, "epoch": 1164} {"train_loss": -5.723402976989746, "global_step": 48927, "epoch": 1164} {"train_loss": -5.760524749755859, "global_step": 48928, "epoch": 1164} {"train_loss": -5.765252726418631, "global_step": 48929, "epoch": 1164, "val_loss": 74004.3046875} {"train_loss": -5.768072128295898, "global_step": 48930, "epoch": 1165} {"train_loss": -5.583392143249512, "global_step": 48931, "epoch": 1165} {"train_loss": -5.684564590454102, "global_step": 48932, "epoch": 1165} {"train_loss": -5.7925214767456055, "global_step": 48933, "epoch": 1165} {"train_loss": -5.665460586547852, "global_step": 48934, "epoch": 1165} {"train_loss": -5.759394645690918, "global_step": 48935, "epoch": 1165} {"train_loss": -5.796690464019775, "global_step": 48936, "epoch": 1165} {"train_loss": -5.762109756469727, "global_step": 48937, "epoch": 1165} {"train_loss": -5.740060329437256, "global_step": 48938, "epoch": 1165} {"train_loss": -5.877270698547363, "global_step": 48939, "epoch": 1165} {"train_loss": -5.736089706420898, "global_step": 48940, "epoch": 1165} {"train_loss": -5.675601959228516, "global_step": 48941, "epoch": 1165} {"train_loss": -5.870682716369629, "global_step": 48942, "epoch": 1165} {"train_loss": -5.8563690185546875, "global_step": 48943, "epoch": 1165} {"train_loss": -5.777505874633789, "global_step": 48944, "epoch": 1165} {"train_loss": -5.87242317199707, "global_step": 48945, "epoch": 1165} {"train_loss": -5.635640621185303, "global_step": 48946, "epoch": 1165} {"train_loss": -5.767175674438477, "global_step": 48947, "epoch": 1165} {"train_loss": -5.750288963317871, "global_step": 48948, "epoch": 1165} {"train_loss": -5.604294300079346, "global_step": 48949, "epoch": 1165} {"train_loss": -5.718012809753418, "global_step": 48950, "epoch": 1165} {"train_loss": -5.762734413146973, "global_step": 48951, "epoch": 1165} {"train_loss": -5.696579933166504, "global_step": 48952, "epoch": 1165} {"train_loss": -5.692622184753418, "global_step": 48953, "epoch": 1165} {"train_loss": -5.657273292541504, "global_step": 48954, "epoch": 1165} {"train_loss": -5.627433776855469, "global_step": 48955, "epoch": 1165} {"train_loss": -5.7216362953186035, "global_step": 48956, "epoch": 1165} {"train_loss": -5.743227958679199, "global_step": 48957, "epoch": 1165} {"train_loss": -5.653266429901123, "global_step": 48958, "epoch": 1165} {"train_loss": -5.62655782699585, "global_step": 48959, "epoch": 1165} {"train_loss": -5.724214553833008, "global_step": 48960, "epoch": 1165} {"train_loss": -5.737640857696533, "global_step": 48961, "epoch": 1165} {"train_loss": -5.70966100692749, "global_step": 48962, "epoch": 1165} {"train_loss": -5.857303142547607, "global_step": 48963, "epoch": 1165} {"train_loss": -5.785641670227051, "global_step": 48964, "epoch": 1165} {"train_loss": -5.722842216491699, "global_step": 48965, "epoch": 1165} {"train_loss": -5.72610330581665, "global_step": 48966, "epoch": 1165} {"train_loss": -5.904115676879883, "global_step": 48967, "epoch": 1165} {"train_loss": -5.591392517089844, "global_step": 48968, "epoch": 1165} {"train_loss": -5.728605270385742, "global_step": 48969, "epoch": 1165} {"train_loss": -5.78630256652832, "global_step": 48970, "epoch": 1165} {"train_loss": -5.7387406258356, "global_step": 48971, "epoch": 1165, "val_loss": 73796.6484375} {"train_loss": -5.967100143432617, "global_step": 48972, "epoch": 1166} {"train_loss": -5.795539855957031, "global_step": 48973, "epoch": 1166} {"train_loss": -5.758172035217285, "global_step": 48974, "epoch": 1166} {"train_loss": -5.6065897941589355, "global_step": 48975, "epoch": 1166} {"train_loss": -5.707217216491699, "global_step": 48976, "epoch": 1166} {"train_loss": -5.791330814361572, "global_step": 48977, "epoch": 1166} {"train_loss": -5.742396831512451, "global_step": 48978, "epoch": 1166} {"train_loss": -5.746747016906738, "global_step": 48979, "epoch": 1166} {"train_loss": -5.849726676940918, "global_step": 48980, "epoch": 1166} {"train_loss": -5.711304187774658, "global_step": 48981, "epoch": 1166} {"train_loss": -5.604942321777344, "global_step": 48982, "epoch": 1166} {"train_loss": -5.697595596313477, "global_step": 48983, "epoch": 1166} {"train_loss": -5.698908805847168, "global_step": 48984, "epoch": 1166} {"train_loss": -5.690713882446289, "global_step": 48985, "epoch": 1166} {"train_loss": -5.721986770629883, "global_step": 48986, "epoch": 1166} {"train_loss": -5.666993618011475, "global_step": 48987, "epoch": 1166} {"train_loss": -5.71489143371582, "global_step": 48988, "epoch": 1166} {"train_loss": -5.726705551147461, "global_step": 48989, "epoch": 1166} {"train_loss": -5.642276763916016, "global_step": 48990, "epoch": 1166} {"train_loss": -5.747270584106445, "global_step": 48991, "epoch": 1166} {"train_loss": -5.591464042663574, "global_step": 48992, "epoch": 1166} {"train_loss": -5.709690093994141, "global_step": 48993, "epoch": 1166} {"train_loss": -5.708328723907471, "global_step": 48994, "epoch": 1166} {"train_loss": -5.694555759429932, "global_step": 48995, "epoch": 1166} {"train_loss": -5.797016143798828, "global_step": 48996, "epoch": 1166} {"train_loss": -5.674766540527344, "global_step": 48997, "epoch": 1166} {"train_loss": -5.787842750549316, "global_step": 48998, "epoch": 1166} {"train_loss": -5.819770812988281, "global_step": 48999, "epoch": 1166} {"train_loss": -5.711114406585693, "global_step": 49000, "epoch": 1166} {"train_loss": -5.876537322998047, "global_step": 49001, "epoch": 1166} {"train_loss": -5.636820316314697, "global_step": 49002, "epoch": 1166} {"train_loss": -5.617041110992432, "global_step": 49003, "epoch": 1166} {"train_loss": -5.725809097290039, "global_step": 49004, "epoch": 1166} {"train_loss": -5.835466384887695, "global_step": 49005, "epoch": 1166} {"train_loss": -5.731437683105469, "global_step": 49006, "epoch": 1166} {"train_loss": -5.849167823791504, "global_step": 49007, "epoch": 1166} {"train_loss": -5.693643093109131, "global_step": 49008, "epoch": 1166} {"train_loss": -5.761298179626465, "global_step": 49009, "epoch": 1166} {"train_loss": -5.8125739097595215, "global_step": 49010, "epoch": 1166} {"train_loss": -5.753579616546631, "global_step": 49011, "epoch": 1166} {"train_loss": -5.777415752410889, "global_step": 49012, "epoch": 1166} {"train_loss": -5.732812801996867, "global_step": 49013, "epoch": 1166, "val_loss": 74525.390625} {"train_loss": -5.7569074630737305, "global_step": 49014, "epoch": 1167} {"train_loss": -5.8010711669921875, "global_step": 49015, "epoch": 1167} {"train_loss": -5.820149898529053, "global_step": 49016, "epoch": 1167} {"train_loss": -5.685640335083008, "global_step": 49017, "epoch": 1167} {"train_loss": -5.822054862976074, "global_step": 49018, "epoch": 1167} {"train_loss": -5.781721115112305, "global_step": 49019, "epoch": 1167} {"train_loss": -5.6805009841918945, "global_step": 49020, "epoch": 1167} {"train_loss": -5.818948268890381, "global_step": 49021, "epoch": 1167} {"train_loss": -5.730847358703613, "global_step": 49022, "epoch": 1167} {"train_loss": -5.794153213500977, "global_step": 49023, "epoch": 1167} {"train_loss": -5.807098865509033, "global_step": 49024, "epoch": 1167} {"train_loss": -5.73537540435791, "global_step": 49025, "epoch": 1167} {"train_loss": -5.81768798828125, "global_step": 49026, "epoch": 1167} {"train_loss": -5.799959182739258, "global_step": 49027, "epoch": 1167} {"train_loss": -5.79764461517334, "global_step": 49028, "epoch": 1167} {"train_loss": -5.753300666809082, "global_step": 49029, "epoch": 1167} {"train_loss": -5.739789009094238, "global_step": 49030, "epoch": 1167} {"train_loss": -5.852779388427734, "global_step": 49031, "epoch": 1167} {"train_loss": -5.831610679626465, "global_step": 49032, "epoch": 1167} {"train_loss": -5.82689094543457, "global_step": 49033, "epoch": 1167} {"train_loss": -5.772336959838867, "global_step": 49034, "epoch": 1167} {"train_loss": -5.768592357635498, "global_step": 49035, "epoch": 1167} {"train_loss": -5.748786926269531, "global_step": 49036, "epoch": 1167} {"train_loss": -5.8476786613464355, "global_step": 49037, "epoch": 1167} {"train_loss": -5.734336853027344, "global_step": 49038, "epoch": 1167} {"train_loss": -5.64088773727417, "global_step": 49039, "epoch": 1167} {"train_loss": -5.6155805587768555, "global_step": 49040, "epoch": 1167} {"train_loss": -5.785650730133057, "global_step": 49041, "epoch": 1167} {"train_loss": -5.577911853790283, "global_step": 49042, "epoch": 1167} {"train_loss": -5.731359481811523, "global_step": 49043, "epoch": 1167} {"train_loss": -5.642323017120361, "global_step": 49044, "epoch": 1167} {"train_loss": -5.660297393798828, "global_step": 49045, "epoch": 1167} {"train_loss": -5.684676647186279, "global_step": 49046, "epoch": 1167} {"train_loss": -5.679022312164307, "global_step": 49047, "epoch": 1167} {"train_loss": -5.801002025604248, "global_step": 49048, "epoch": 1167} {"train_loss": -5.741250038146973, "global_step": 49049, "epoch": 1167} {"train_loss": -5.678123474121094, "global_step": 49050, "epoch": 1167} {"train_loss": -5.7681989669799805, "global_step": 49051, "epoch": 1167} {"train_loss": -5.6755475997924805, "global_step": 49052, "epoch": 1167} {"train_loss": -5.780265808105469, "global_step": 49053, "epoch": 1167} {"train_loss": -5.799491882324219, "global_step": 49054, "epoch": 1167} {"train_loss": -5.752414067586263, "global_step": 49055, "epoch": 1167, "val_loss": 74468.8515625} {"train_loss": -5.618344306945801, "global_step": 49056, "epoch": 1168} {"train_loss": -5.80082368850708, "global_step": 49057, "epoch": 1168} {"train_loss": -5.755126476287842, "global_step": 49058, "epoch": 1168} {"train_loss": -5.767998695373535, "global_step": 49059, "epoch": 1168} {"train_loss": -5.680830955505371, "global_step": 49060, "epoch": 1168} {"train_loss": -5.772540092468262, "global_step": 49061, "epoch": 1168} {"train_loss": -5.808732986450195, "global_step": 49062, "epoch": 1168} {"train_loss": -5.885969161987305, "global_step": 49063, "epoch": 1168} {"train_loss": -5.576038360595703, "global_step": 49064, "epoch": 1168} {"train_loss": -5.814697742462158, "global_step": 49065, "epoch": 1168} {"train_loss": -5.82816743850708, "global_step": 49066, "epoch": 1168} {"train_loss": -5.799984931945801, "global_step": 49067, "epoch": 1168} {"train_loss": -5.744727611541748, "global_step": 49068, "epoch": 1168} {"train_loss": -5.833451271057129, "global_step": 49069, "epoch": 1168} {"train_loss": -5.833498954772949, "global_step": 49070, "epoch": 1168} {"train_loss": -5.848919868469238, "global_step": 49071, "epoch": 1168} {"train_loss": -5.752437591552734, "global_step": 49072, "epoch": 1168} {"train_loss": -5.724973201751709, "global_step": 49073, "epoch": 1168} {"train_loss": -5.865894317626953, "global_step": 49074, "epoch": 1168} {"train_loss": -5.82257080078125, "global_step": 49075, "epoch": 1168} {"train_loss": -5.675961971282959, "global_step": 49076, "epoch": 1168} {"train_loss": -5.740464210510254, "global_step": 49077, "epoch": 1168} {"train_loss": -5.995240211486816, "global_step": 49078, "epoch": 1168} {"train_loss": -5.868800640106201, "global_step": 49079, "epoch": 1168} {"train_loss": -5.722275733947754, "global_step": 49080, "epoch": 1168} {"train_loss": -5.641646385192871, "global_step": 49081, "epoch": 1168} {"train_loss": -5.8017449378967285, "global_step": 49082, "epoch": 1168} {"train_loss": -5.804276466369629, "global_step": 49083, "epoch": 1168} {"train_loss": -5.834813117980957, "global_step": 49084, "epoch": 1168} {"train_loss": -5.780092239379883, "global_step": 49085, "epoch": 1168} {"train_loss": -5.649651527404785, "global_step": 49086, "epoch": 1168} {"train_loss": -5.760784149169922, "global_step": 49087, "epoch": 1168} {"train_loss": -5.738375663757324, "global_step": 49088, "epoch": 1168} {"train_loss": -5.82559871673584, "global_step": 49089, "epoch": 1168} {"train_loss": -5.73382568359375, "global_step": 49090, "epoch": 1168} {"train_loss": -5.8826704025268555, "global_step": 49091, "epoch": 1168} {"train_loss": -5.809944152832031, "global_step": 49092, "epoch": 1168} {"train_loss": -5.897148609161377, "global_step": 49093, "epoch": 1168} {"train_loss": -5.836014747619629, "global_step": 49094, "epoch": 1168} {"train_loss": -5.752601623535156, "global_step": 49095, "epoch": 1168} {"train_loss": -5.751012325286865, "global_step": 49096, "epoch": 1168} {"train_loss": -5.779872042792184, "global_step": 49097, "epoch": 1168, "val_loss": 74174.0078125} {"train_loss": -5.761006832122803, "global_step": 49098, "epoch": 1169} {"train_loss": -5.868110656738281, "global_step": 49099, "epoch": 1169} {"train_loss": -5.882718563079834, "global_step": 49100, "epoch": 1169} {"train_loss": -5.639874458312988, "global_step": 49101, "epoch": 1169} {"train_loss": -5.823009014129639, "global_step": 49102, "epoch": 1169} {"train_loss": -5.760871410369873, "global_step": 49103, "epoch": 1169} {"train_loss": -5.710981845855713, "global_step": 49104, "epoch": 1169} {"train_loss": -5.909317970275879, "global_step": 49105, "epoch": 1169} {"train_loss": -5.779885768890381, "global_step": 49106, "epoch": 1169} {"train_loss": -5.794573783874512, "global_step": 49107, "epoch": 1169} {"train_loss": -5.810082912445068, "global_step": 49108, "epoch": 1169} {"train_loss": -5.736443519592285, "global_step": 49109, "epoch": 1169} {"train_loss": -5.795315742492676, "global_step": 49110, "epoch": 1169} {"train_loss": -5.7966628074646, "global_step": 49111, "epoch": 1169} {"train_loss": -5.767336368560791, "global_step": 49112, "epoch": 1169} {"train_loss": -5.844964981079102, "global_step": 49113, "epoch": 1169} {"train_loss": -5.6968994140625, "global_step": 49114, "epoch": 1169} {"train_loss": -5.879924774169922, "global_step": 49115, "epoch": 1169} {"train_loss": -5.820077419281006, "global_step": 49116, "epoch": 1169} {"train_loss": -5.720510005950928, "global_step": 49117, "epoch": 1169} {"train_loss": -5.813721656799316, "global_step": 49118, "epoch": 1169} {"train_loss": -5.849235534667969, "global_step": 49119, "epoch": 1169} {"train_loss": -5.747681617736816, "global_step": 49120, "epoch": 1169} {"train_loss": -5.819675922393799, "global_step": 49121, "epoch": 1169} {"train_loss": -5.721189498901367, "global_step": 49122, "epoch": 1169} {"train_loss": -5.682422161102295, "global_step": 49123, "epoch": 1169} {"train_loss": -5.7964372634887695, "global_step": 49124, "epoch": 1169} {"train_loss": -5.84323787689209, "global_step": 49125, "epoch": 1169} {"train_loss": -5.667751312255859, "global_step": 49126, "epoch": 1169} {"train_loss": -5.75852632522583, "global_step": 49127, "epoch": 1169} {"train_loss": -5.731050968170166, "global_step": 49128, "epoch": 1169} {"train_loss": -5.8184733390808105, "global_step": 49129, "epoch": 1169} {"train_loss": -5.949069023132324, "global_step": 49130, "epoch": 1169} {"train_loss": -5.673735618591309, "global_step": 49131, "epoch": 1169} {"train_loss": -5.703629493713379, "global_step": 49132, "epoch": 1169} {"train_loss": -5.684077262878418, "global_step": 49133, "epoch": 1169} {"train_loss": -5.678930759429932, "global_step": 49134, "epoch": 1169} {"train_loss": -5.6170430183410645, "global_step": 49135, "epoch": 1169} {"train_loss": -5.776691436767578, "global_step": 49136, "epoch": 1169} {"train_loss": -5.683500289916992, "global_step": 49137, "epoch": 1169} {"train_loss": -5.5792059898376465, "global_step": 49138, "epoch": 1169} {"train_loss": -5.765146221433367, "global_step": 49139, "epoch": 1169, "val_loss": 74311.2421875} {"train_loss": -5.663478374481201, "global_step": 49140, "epoch": 1170} {"train_loss": -5.733096122741699, "global_step": 49141, "epoch": 1170} {"train_loss": -5.723753452301025, "global_step": 49142, "epoch": 1170} {"train_loss": -5.571147918701172, "global_step": 49143, "epoch": 1170} {"train_loss": -5.685400485992432, "global_step": 49144, "epoch": 1170} {"train_loss": -5.5800042152404785, "global_step": 49145, "epoch": 1170} {"train_loss": -5.7448320388793945, "global_step": 49146, "epoch": 1170} {"train_loss": -5.7176642417907715, "global_step": 49147, "epoch": 1170} {"train_loss": -5.821023941040039, "global_step": 49148, "epoch": 1170} {"train_loss": -5.6017303466796875, "global_step": 49149, "epoch": 1170} {"train_loss": -5.557197570800781, "global_step": 49150, "epoch": 1170} {"train_loss": -5.832397937774658, "global_step": 49151, "epoch": 1170} {"train_loss": -5.651133060455322, "global_step": 49152, "epoch": 1170} {"train_loss": -5.609023571014404, "global_step": 49153, "epoch": 1170} {"train_loss": -5.677145957946777, "global_step": 49154, "epoch": 1170} {"train_loss": -5.638670921325684, "global_step": 49155, "epoch": 1170} {"train_loss": -5.827958106994629, "global_step": 49156, "epoch": 1170} {"train_loss": -5.675480842590332, "global_step": 49157, "epoch": 1170} {"train_loss": -5.719173431396484, "global_step": 49158, "epoch": 1170} {"train_loss": -5.8152360916137695, "global_step": 49159, "epoch": 1170} {"train_loss": -5.800117015838623, "global_step": 49160, "epoch": 1170} {"train_loss": -5.688066482543945, "global_step": 49161, "epoch": 1170} {"train_loss": -5.732666015625, "global_step": 49162, "epoch": 1170} {"train_loss": -5.763100624084473, "global_step": 49163, "epoch": 1170} {"train_loss": -5.747953414916992, "global_step": 49164, "epoch": 1170} {"train_loss": -5.703014850616455, "global_step": 49165, "epoch": 1170} {"train_loss": -5.8077802658081055, "global_step": 49166, "epoch": 1170} {"train_loss": -5.797670364379883, "global_step": 49167, "epoch": 1170} {"train_loss": -5.622281074523926, "global_step": 49168, "epoch": 1170} {"train_loss": -5.782825469970703, "global_step": 49169, "epoch": 1170} {"train_loss": -5.807226181030273, "global_step": 49170, "epoch": 1170} {"train_loss": -5.755568504333496, "global_step": 49171, "epoch": 1170} {"train_loss": -5.7280707359313965, "global_step": 49172, "epoch": 1170} {"train_loss": -5.902259826660156, "global_step": 49173, "epoch": 1170} {"train_loss": -5.805277347564697, "global_step": 49174, "epoch": 1170} {"train_loss": -5.74870491027832, "global_step": 49175, "epoch": 1170} {"train_loss": -5.820069313049316, "global_step": 49176, "epoch": 1170} {"train_loss": -5.811857223510742, "global_step": 49177, "epoch": 1170} {"train_loss": -5.802735328674316, "global_step": 49178, "epoch": 1170} {"train_loss": -5.683600425720215, "global_step": 49179, "epoch": 1170} {"train_loss": -5.720024585723877, "global_step": 49180, "epoch": 1170} {"train_loss": -5.728926147733416, "global_step": 49181, "epoch": 1170, "val_loss": 73906.5} {"train_loss": -5.891937255859375, "global_step": 49182, "epoch": 1171} {"train_loss": -5.754582405090332, "global_step": 49183, "epoch": 1171} {"train_loss": -5.713818073272705, "global_step": 49184, "epoch": 1171} {"train_loss": -5.734951496124268, "global_step": 49185, "epoch": 1171} {"train_loss": -5.839210510253906, "global_step": 49186, "epoch": 1171} {"train_loss": -5.827205657958984, "global_step": 49187, "epoch": 1171} {"train_loss": -5.785561561584473, "global_step": 49188, "epoch": 1171} {"train_loss": -5.654443740844727, "global_step": 49189, "epoch": 1171} {"train_loss": -5.713565826416016, "global_step": 49190, "epoch": 1171} {"train_loss": -5.728785514831543, "global_step": 49191, "epoch": 1171} {"train_loss": -5.79758882522583, "global_step": 49192, "epoch": 1171} {"train_loss": -5.709906578063965, "global_step": 49193, "epoch": 1171} {"train_loss": -5.754847049713135, "global_step": 49194, "epoch": 1171} {"train_loss": -5.752806663513184, "global_step": 49195, "epoch": 1171} {"train_loss": -5.658512115478516, "global_step": 49196, "epoch": 1171} {"train_loss": -5.781011581420898, "global_step": 49197, "epoch": 1171} {"train_loss": -5.61476469039917, "global_step": 49198, "epoch": 1171} {"train_loss": -5.711764335632324, "global_step": 49199, "epoch": 1171} {"train_loss": -5.822220802307129, "global_step": 49200, "epoch": 1171} {"train_loss": -5.585351943969727, "global_step": 49201, "epoch": 1171} {"train_loss": -5.631800651550293, "global_step": 49202, "epoch": 1171} {"train_loss": -5.828621864318848, "global_step": 49203, "epoch": 1171} {"train_loss": -5.639302730560303, "global_step": 49204, "epoch": 1171} {"train_loss": -5.723217010498047, "global_step": 49205, "epoch": 1171} {"train_loss": -5.700331687927246, "global_step": 49206, "epoch": 1171} {"train_loss": -5.750985145568848, "global_step": 49207, "epoch": 1171} {"train_loss": -5.904358386993408, "global_step": 49208, "epoch": 1171} {"train_loss": -5.813791275024414, "global_step": 49209, "epoch": 1171} {"train_loss": -5.648744583129883, "global_step": 49210, "epoch": 1171} {"train_loss": -5.746020317077637, "global_step": 49211, "epoch": 1171} {"train_loss": -5.745169639587402, "global_step": 49212, "epoch": 1171} {"train_loss": -5.7284698486328125, "global_step": 49213, "epoch": 1171} {"train_loss": -5.762978553771973, "global_step": 49214, "epoch": 1171} {"train_loss": -5.730902671813965, "global_step": 49215, "epoch": 1171} {"train_loss": -5.854491233825684, "global_step": 49216, "epoch": 1171} {"train_loss": -5.757307529449463, "global_step": 49217, "epoch": 1171} {"train_loss": -5.705451011657715, "global_step": 49218, "epoch": 1171} {"train_loss": -5.893969535827637, "global_step": 49219, "epoch": 1171} {"train_loss": -5.780483245849609, "global_step": 49220, "epoch": 1171} {"train_loss": -5.625162124633789, "global_step": 49221, "epoch": 1171} {"train_loss": -5.617384910583496, "global_step": 49222, "epoch": 1171} {"train_loss": -5.740637302398682, "global_step": 49223, "epoch": 1171, "val_loss": 74475.78125} {"train_loss": -5.6665730476379395, "global_step": 49224, "epoch": 1172} {"train_loss": -5.8213396072387695, "global_step": 49225, "epoch": 1172} {"train_loss": -5.725325107574463, "global_step": 49226, "epoch": 1172} {"train_loss": -5.666505813598633, "global_step": 49227, "epoch": 1172} {"train_loss": -5.743189811706543, "global_step": 49228, "epoch": 1172} {"train_loss": -5.693116188049316, "global_step": 49229, "epoch": 1172} {"train_loss": -5.687634468078613, "global_step": 49230, "epoch": 1172} {"train_loss": -5.815661907196045, "global_step": 49231, "epoch": 1172} {"train_loss": -5.685093879699707, "global_step": 49232, "epoch": 1172} {"train_loss": -5.796382427215576, "global_step": 49233, "epoch": 1172} {"train_loss": -5.6756181716918945, "global_step": 49234, "epoch": 1172} {"train_loss": -5.861054420471191, "global_step": 49235, "epoch": 1172} {"train_loss": -5.714328289031982, "global_step": 49236, "epoch": 1172} {"train_loss": -5.776336193084717, "global_step": 49237, "epoch": 1172} {"train_loss": -5.780632019042969, "global_step": 49238, "epoch": 1172} {"train_loss": -5.894265174865723, "global_step": 49239, "epoch": 1172} {"train_loss": -5.662887096405029, "global_step": 49240, "epoch": 1172} {"train_loss": -5.797182083129883, "global_step": 49241, "epoch": 1172} {"train_loss": -5.798820495605469, "global_step": 49242, "epoch": 1172} {"train_loss": -5.757850170135498, "global_step": 49243, "epoch": 1172} {"train_loss": -5.916058540344238, "global_step": 49244, "epoch": 1172} {"train_loss": -5.708497047424316, "global_step": 49245, "epoch": 1172} {"train_loss": -5.6631669998168945, "global_step": 49246, "epoch": 1172} {"train_loss": -5.74869441986084, "global_step": 49247, "epoch": 1172} {"train_loss": -5.671980381011963, "global_step": 49248, "epoch": 1172} {"train_loss": -5.751479148864746, "global_step": 49249, "epoch": 1172} {"train_loss": -5.792688846588135, "global_step": 49250, "epoch": 1172} {"train_loss": -5.737183570861816, "global_step": 49251, "epoch": 1172} {"train_loss": -5.565326690673828, "global_step": 49252, "epoch": 1172} {"train_loss": -5.793981552124023, "global_step": 49253, "epoch": 1172} {"train_loss": -5.647278785705566, "global_step": 49254, "epoch": 1172} {"train_loss": -5.610793113708496, "global_step": 49255, "epoch": 1172} {"train_loss": -5.799046516418457, "global_step": 49256, "epoch": 1172} {"train_loss": -5.732872009277344, "global_step": 49257, "epoch": 1172} {"train_loss": -5.654548645019531, "global_step": 49258, "epoch": 1172} {"train_loss": -5.842118740081787, "global_step": 49259, "epoch": 1172} {"train_loss": -5.643367767333984, "global_step": 49260, "epoch": 1172} {"train_loss": -5.61683464050293, "global_step": 49261, "epoch": 1172} {"train_loss": -5.699677467346191, "global_step": 49262, "epoch": 1172} {"train_loss": -5.710872650146484, "global_step": 49263, "epoch": 1172} {"train_loss": -5.703732490539551, "global_step": 49264, "epoch": 1172} {"train_loss": -5.734426259994507, "global_step": 49265, "epoch": 1172, "val_loss": 74068.1953125} {"train_loss": -5.771849632263184, "global_step": 49266, "epoch": 1173} {"train_loss": -5.864136695861816, "global_step": 49267, "epoch": 1173} {"train_loss": -5.794758319854736, "global_step": 49268, "epoch": 1173} {"train_loss": -5.68716287612915, "global_step": 49269, "epoch": 1173} {"train_loss": -5.826666831970215, "global_step": 49270, "epoch": 1173} {"train_loss": -5.689959526062012, "global_step": 49271, "epoch": 1173} {"train_loss": -5.786386013031006, "global_step": 49272, "epoch": 1173} {"train_loss": -5.657051086425781, "global_step": 49273, "epoch": 1173} {"train_loss": -5.690792083740234, "global_step": 49274, "epoch": 1173} {"train_loss": -5.811079025268555, "global_step": 49275, "epoch": 1173} {"train_loss": -5.602474212646484, "global_step": 49276, "epoch": 1173} {"train_loss": -5.901389122009277, "global_step": 49277, "epoch": 1173} {"train_loss": -5.748019695281982, "global_step": 49278, "epoch": 1173} {"train_loss": -5.633411884307861, "global_step": 49279, "epoch": 1173} {"train_loss": -5.749943733215332, "global_step": 49280, "epoch": 1173} {"train_loss": -5.706335067749023, "global_step": 49281, "epoch": 1173} {"train_loss": -5.730131149291992, "global_step": 49282, "epoch": 1173} {"train_loss": -5.816130638122559, "global_step": 49283, "epoch": 1173} {"train_loss": -5.764514923095703, "global_step": 49284, "epoch": 1173} {"train_loss": -5.817348480224609, "global_step": 49285, "epoch": 1173} {"train_loss": -5.605305194854736, "global_step": 49286, "epoch": 1173} {"train_loss": -5.846166610717773, "global_step": 49287, "epoch": 1173} {"train_loss": -5.740562915802002, "global_step": 49288, "epoch": 1173} {"train_loss": -5.741507053375244, "global_step": 49289, "epoch": 1173} {"train_loss": -5.719626426696777, "global_step": 49290, "epoch": 1173} {"train_loss": -5.740152835845947, "global_step": 49291, "epoch": 1173} {"train_loss": -5.717754364013672, "global_step": 49292, "epoch": 1173} {"train_loss": -5.73474645614624, "global_step": 49293, "epoch": 1173} {"train_loss": -5.715696334838867, "global_step": 49294, "epoch": 1173} {"train_loss": -5.837729454040527, "global_step": 49295, "epoch": 1173} {"train_loss": -5.7820329666137695, "global_step": 49296, "epoch": 1173} {"train_loss": -5.725492477416992, "global_step": 49297, "epoch": 1173} {"train_loss": -5.729806900024414, "global_step": 49298, "epoch": 1173} {"train_loss": -5.691006660461426, "global_step": 49299, "epoch": 1173} {"train_loss": -5.839174270629883, "global_step": 49300, "epoch": 1173} {"train_loss": -5.85630989074707, "global_step": 49301, "epoch": 1173} {"train_loss": -5.78360652923584, "global_step": 49302, "epoch": 1173} {"train_loss": -5.780764579772949, "global_step": 49303, "epoch": 1173} {"train_loss": -5.695085048675537, "global_step": 49304, "epoch": 1173} {"train_loss": -5.770872592926025, "global_step": 49305, "epoch": 1173} {"train_loss": -5.854032039642334, "global_step": 49306, "epoch": 1173} {"train_loss": -5.757218088422503, "global_step": 49307, "epoch": 1173, "val_loss": 74227.140625} {"train_loss": -5.76556396484375, "global_step": 49308, "epoch": 1174} {"train_loss": -5.739228248596191, "global_step": 49309, "epoch": 1174} {"train_loss": -5.77940034866333, "global_step": 49310, "epoch": 1174} {"train_loss": -5.7135772705078125, "global_step": 49311, "epoch": 1174} {"train_loss": -5.75193977355957, "global_step": 49312, "epoch": 1174} {"train_loss": -5.814841270446777, "global_step": 49313, "epoch": 1174} {"train_loss": -5.758322715759277, "global_step": 49314, "epoch": 1174} {"train_loss": -5.848498344421387, "global_step": 49315, "epoch": 1174} {"train_loss": -5.82530403137207, "global_step": 49316, "epoch": 1174} {"train_loss": -5.818197250366211, "global_step": 49317, "epoch": 1174} {"train_loss": -5.6689629554748535, "global_step": 49318, "epoch": 1174} {"train_loss": -5.71769905090332, "global_step": 49319, "epoch": 1174} {"train_loss": -5.763933181762695, "global_step": 49320, "epoch": 1174} {"train_loss": -5.725894927978516, "global_step": 49321, "epoch": 1174} {"train_loss": -5.8808817863464355, "global_step": 49322, "epoch": 1174} {"train_loss": -5.789154529571533, "global_step": 49323, "epoch": 1174} {"train_loss": -5.901747226715088, "global_step": 49324, "epoch": 1174} {"train_loss": -5.805401802062988, "global_step": 49325, "epoch": 1174} {"train_loss": -5.61316442489624, "global_step": 49326, "epoch": 1174} {"train_loss": -5.732147216796875, "global_step": 49327, "epoch": 1174} {"train_loss": -5.8303680419921875, "global_step": 49328, "epoch": 1174} {"train_loss": -5.720527648925781, "global_step": 49329, "epoch": 1174} {"train_loss": -5.699706554412842, "global_step": 49330, "epoch": 1174} {"train_loss": -5.818706512451172, "global_step": 49331, "epoch": 1174} {"train_loss": -5.738624572753906, "global_step": 49332, "epoch": 1174} {"train_loss": -5.835468292236328, "global_step": 49333, "epoch": 1174} {"train_loss": -5.840163230895996, "global_step": 49334, "epoch": 1174} {"train_loss": -5.958968162536621, "global_step": 49335, "epoch": 1174} {"train_loss": -5.867349147796631, "global_step": 49336, "epoch": 1174} {"train_loss": -5.927463531494141, "global_step": 49337, "epoch": 1174} {"train_loss": -5.781729698181152, "global_step": 49338, "epoch": 1174} {"train_loss": -5.796661853790283, "global_step": 49339, "epoch": 1174} {"train_loss": -5.833103179931641, "global_step": 49340, "epoch": 1174} {"train_loss": -5.775341987609863, "global_step": 49341, "epoch": 1174} {"train_loss": -5.87086296081543, "global_step": 49342, "epoch": 1174} {"train_loss": -5.634756565093994, "global_step": 49343, "epoch": 1174} {"train_loss": -5.715600967407227, "global_step": 49344, "epoch": 1174} {"train_loss": -5.820477485656738, "global_step": 49345, "epoch": 1174} {"train_loss": -5.906473636627197, "global_step": 49346, "epoch": 1174} {"train_loss": -5.719460487365723, "global_step": 49347, "epoch": 1174} {"train_loss": -5.784084320068359, "global_step": 49348, "epoch": 1174} {"train_loss": -5.786079315912156, "global_step": 49349, "epoch": 1174, "val_loss": 74397.1171875} {"train_loss": -5.76251745223999, "global_step": 49350, "epoch": 1175} {"train_loss": -5.788360595703125, "global_step": 49351, "epoch": 1175} {"train_loss": -5.864006519317627, "global_step": 49352, "epoch": 1175} {"train_loss": -5.872501850128174, "global_step": 49353, "epoch": 1175} {"train_loss": -5.757785320281982, "global_step": 49354, "epoch": 1175} {"train_loss": -5.790390968322754, "global_step": 49355, "epoch": 1175} {"train_loss": -5.630640983581543, "global_step": 49356, "epoch": 1175} {"train_loss": -5.714184761047363, "global_step": 49357, "epoch": 1175} {"train_loss": -5.853102684020996, "global_step": 49358, "epoch": 1175} {"train_loss": -5.632913112640381, "global_step": 49359, "epoch": 1175} {"train_loss": -5.5403828620910645, "global_step": 49360, "epoch": 1175} {"train_loss": -5.755087852478027, "global_step": 49361, "epoch": 1175} {"train_loss": -5.844527721405029, "global_step": 49362, "epoch": 1175} {"train_loss": -5.737457275390625, "global_step": 49363, "epoch": 1175} {"train_loss": -5.745279788970947, "global_step": 49364, "epoch": 1175} {"train_loss": -5.727182388305664, "global_step": 49365, "epoch": 1175} {"train_loss": -5.75712776184082, "global_step": 49366, "epoch": 1175} {"train_loss": -5.918697357177734, "global_step": 49367, "epoch": 1175} {"train_loss": -5.721261978149414, "global_step": 49368, "epoch": 1175} {"train_loss": -5.790083885192871, "global_step": 49369, "epoch": 1175} {"train_loss": -5.8742289543151855, "global_step": 49370, "epoch": 1175} {"train_loss": -5.754246711730957, "global_step": 49371, "epoch": 1175} {"train_loss": -5.957213401794434, "global_step": 49372, "epoch": 1175} {"train_loss": -5.759239196777344, "global_step": 49373, "epoch": 1175} {"train_loss": -5.685114860534668, "global_step": 49374, "epoch": 1175} {"train_loss": -5.761397361755371, "global_step": 49375, "epoch": 1175} {"train_loss": -5.756712913513184, "global_step": 49376, "epoch": 1175} {"train_loss": -5.806462287902832, "global_step": 49377, "epoch": 1175} {"train_loss": -5.868083953857422, "global_step": 49378, "epoch": 1175} {"train_loss": -5.772464752197266, "global_step": 49379, "epoch": 1175} {"train_loss": -5.799783706665039, "global_step": 49380, "epoch": 1175} {"train_loss": -5.820840835571289, "global_step": 49381, "epoch": 1175} {"train_loss": -5.740852355957031, "global_step": 49382, "epoch": 1175} {"train_loss": -5.848677635192871, "global_step": 49383, "epoch": 1175} {"train_loss": -5.818452835083008, "global_step": 49384, "epoch": 1175} {"train_loss": -5.891921043395996, "global_step": 49385, "epoch": 1175} {"train_loss": -5.865046977996826, "global_step": 49386, "epoch": 1175} {"train_loss": -5.764102935791016, "global_step": 49387, "epoch": 1175} {"train_loss": -5.761656761169434, "global_step": 49388, "epoch": 1175} {"train_loss": -5.897776126861572, "global_step": 49389, "epoch": 1175} {"train_loss": -5.787240028381348, "global_step": 49390, "epoch": 1175} {"train_loss": -5.786294653302147, "global_step": 49391, "epoch": 1175, "val_loss": 74303.3359375} {"train_loss": -5.632401943206787, "global_step": 49392, "epoch": 1176} {"train_loss": -5.781619071960449, "global_step": 49393, "epoch": 1176} {"train_loss": -5.767838478088379, "global_step": 49394, "epoch": 1176} {"train_loss": -5.806398391723633, "global_step": 49395, "epoch": 1176} {"train_loss": -5.769141674041748, "global_step": 49396, "epoch": 1176} {"train_loss": -5.740170955657959, "global_step": 49397, "epoch": 1176} {"train_loss": -5.799892425537109, "global_step": 49398, "epoch": 1176} {"train_loss": -5.677189826965332, "global_step": 49399, "epoch": 1176} {"train_loss": -5.740440845489502, "global_step": 49400, "epoch": 1176} {"train_loss": -5.75210428237915, "global_step": 49401, "epoch": 1176} {"train_loss": -5.700169086456299, "global_step": 49402, "epoch": 1176} {"train_loss": -5.658805847167969, "global_step": 49403, "epoch": 1176} {"train_loss": -5.740180969238281, "global_step": 49404, "epoch": 1176} {"train_loss": -5.77186918258667, "global_step": 49405, "epoch": 1176} {"train_loss": -5.788850784301758, "global_step": 49406, "epoch": 1176} {"train_loss": -5.809466361999512, "global_step": 49407, "epoch": 1176} {"train_loss": -5.7169575691223145, "global_step": 49408, "epoch": 1176} {"train_loss": -5.876971244812012, "global_step": 49409, "epoch": 1176} {"train_loss": -5.789999961853027, "global_step": 49410, "epoch": 1176} {"train_loss": -5.705495834350586, "global_step": 49411, "epoch": 1176} {"train_loss": -5.734912872314453, "global_step": 49412, "epoch": 1176} {"train_loss": -5.682455062866211, "global_step": 49413, "epoch": 1176} {"train_loss": -5.719605445861816, "global_step": 49414, "epoch": 1176} {"train_loss": -5.765021324157715, "global_step": 49415, "epoch": 1176} {"train_loss": -5.800512313842773, "global_step": 49416, "epoch": 1176} {"train_loss": -5.810953617095947, "global_step": 49417, "epoch": 1176} {"train_loss": -5.72605562210083, "global_step": 49418, "epoch": 1176} {"train_loss": -5.916634559631348, "global_step": 49419, "epoch": 1176} {"train_loss": -5.644131660461426, "global_step": 49420, "epoch": 1176} {"train_loss": -5.713931083679199, "global_step": 49421, "epoch": 1176} {"train_loss": -5.801959991455078, "global_step": 49422, "epoch": 1176} {"train_loss": -5.702205181121826, "global_step": 49423, "epoch": 1176} {"train_loss": -5.625044822692871, "global_step": 49424, "epoch": 1176} {"train_loss": -5.852306365966797, "global_step": 49425, "epoch": 1176} {"train_loss": -5.625093460083008, "global_step": 49426, "epoch": 1176} {"train_loss": -5.749764919281006, "global_step": 49427, "epoch": 1176} {"train_loss": -5.578268051147461, "global_step": 49428, "epoch": 1176} {"train_loss": -5.584141731262207, "global_step": 49429, "epoch": 1176} {"train_loss": -5.6189470291137695, "global_step": 49430, "epoch": 1176} {"train_loss": -5.615591049194336, "global_step": 49431, "epoch": 1176} {"train_loss": -5.695433616638184, "global_step": 49432, "epoch": 1176} {"train_loss": -5.730289175396874, "global_step": 49433, "epoch": 1176, "val_loss": 74171.4921875} {"train_loss": -5.719559192657471, "global_step": 49434, "epoch": 1177} {"train_loss": -5.661997318267822, "global_step": 49435, "epoch": 1177} {"train_loss": -5.794402599334717, "global_step": 49436, "epoch": 1177} {"train_loss": -5.735114097595215, "global_step": 49437, "epoch": 1177} {"train_loss": -5.839272499084473, "global_step": 49438, "epoch": 1177} {"train_loss": -5.776792526245117, "global_step": 49439, "epoch": 1177} {"train_loss": -5.798707962036133, "global_step": 49440, "epoch": 1177} {"train_loss": -5.7242512702941895, "global_step": 49441, "epoch": 1177} {"train_loss": -5.666399955749512, "global_step": 49442, "epoch": 1177} {"train_loss": -5.752938747406006, "global_step": 49443, "epoch": 1177} {"train_loss": -5.56095027923584, "global_step": 49444, "epoch": 1177} {"train_loss": -5.670256614685059, "global_step": 49445, "epoch": 1177} {"train_loss": -5.715175151824951, "global_step": 49446, "epoch": 1177} {"train_loss": -5.81134557723999, "global_step": 49447, "epoch": 1177} {"train_loss": -5.576478958129883, "global_step": 49448, "epoch": 1177} {"train_loss": -5.756274223327637, "global_step": 49449, "epoch": 1177} {"train_loss": -5.628016948699951, "global_step": 49450, "epoch": 1177} {"train_loss": -5.533405303955078, "global_step": 49451, "epoch": 1177} {"train_loss": -5.76257848739624, "global_step": 49452, "epoch": 1177} {"train_loss": -5.551830291748047, "global_step": 49453, "epoch": 1177} {"train_loss": -5.777493476867676, "global_step": 49454, "epoch": 1177} {"train_loss": -5.648247718811035, "global_step": 49455, "epoch": 1177} {"train_loss": -5.54752254486084, "global_step": 49456, "epoch": 1177} {"train_loss": -5.676333427429199, "global_step": 49457, "epoch": 1177} {"train_loss": -5.6012654304504395, "global_step": 49458, "epoch": 1177} {"train_loss": -5.586078643798828, "global_step": 49459, "epoch": 1177} {"train_loss": -5.718803405761719, "global_step": 49460, "epoch": 1177} {"train_loss": -5.765555381774902, "global_step": 49461, "epoch": 1177} {"train_loss": -5.631109714508057, "global_step": 49462, "epoch": 1177} {"train_loss": -5.694800853729248, "global_step": 49463, "epoch": 1177} {"train_loss": -5.76053524017334, "global_step": 49464, "epoch": 1177} {"train_loss": -5.7540388107299805, "global_step": 49465, "epoch": 1177} {"train_loss": -5.703180313110352, "global_step": 49466, "epoch": 1177} {"train_loss": -5.84008264541626, "global_step": 49467, "epoch": 1177} {"train_loss": -5.598440170288086, "global_step": 49468, "epoch": 1177} {"train_loss": -5.782859802246094, "global_step": 49469, "epoch": 1177} {"train_loss": -5.764377117156982, "global_step": 49470, "epoch": 1177} {"train_loss": -5.780365943908691, "global_step": 49471, "epoch": 1177} {"train_loss": -5.7086029052734375, "global_step": 49472, "epoch": 1177} {"train_loss": -5.632168769836426, "global_step": 49473, "epoch": 1177} {"train_loss": -5.768424987792969, "global_step": 49474, "epoch": 1177} {"train_loss": -5.69891449383327, "global_step": 49475, "epoch": 1177, "val_loss": 73924.328125} {"train_loss": -5.857067108154297, "global_step": 49476, "epoch": 1178} {"train_loss": -5.692319393157959, "global_step": 49477, "epoch": 1178} {"train_loss": -5.832302093505859, "global_step": 49478, "epoch": 1178} {"train_loss": -5.833862781524658, "global_step": 49479, "epoch": 1178} {"train_loss": -5.7146897315979, "global_step": 49480, "epoch": 1178} {"train_loss": -5.89100456237793, "global_step": 49481, "epoch": 1178} {"train_loss": -5.835127830505371, "global_step": 49482, "epoch": 1178} {"train_loss": -5.819423198699951, "global_step": 49483, "epoch": 1178} {"train_loss": -5.872147560119629, "global_step": 49484, "epoch": 1178} {"train_loss": -5.797347545623779, "global_step": 49485, "epoch": 1178} {"train_loss": -5.63578987121582, "global_step": 49486, "epoch": 1178} {"train_loss": -5.721755027770996, "global_step": 49487, "epoch": 1178} {"train_loss": -5.776644706726074, "global_step": 49488, "epoch": 1178} {"train_loss": -5.827720642089844, "global_step": 49489, "epoch": 1178} {"train_loss": -5.818961143493652, "global_step": 49490, "epoch": 1178} {"train_loss": -5.7799835205078125, "global_step": 49491, "epoch": 1178} {"train_loss": -5.8540191650390625, "global_step": 49492, "epoch": 1178} {"train_loss": -5.606461524963379, "global_step": 49493, "epoch": 1178} {"train_loss": -5.802779197692871, "global_step": 49494, "epoch": 1178} {"train_loss": -5.770242691040039, "global_step": 49495, "epoch": 1178} {"train_loss": -5.792908668518066, "global_step": 49496, "epoch": 1178} {"train_loss": -5.698092460632324, "global_step": 49497, "epoch": 1178} {"train_loss": -5.720641613006592, "global_step": 49498, "epoch": 1178} {"train_loss": -5.6012725830078125, "global_step": 49499, "epoch": 1178} {"train_loss": -5.734944820404053, "global_step": 49500, "epoch": 1178} {"train_loss": -5.739146709442139, "global_step": 49501, "epoch": 1178} {"train_loss": -5.6274919509887695, "global_step": 49502, "epoch": 1178} {"train_loss": -5.705578327178955, "global_step": 49503, "epoch": 1178} {"train_loss": -5.590228080749512, "global_step": 49504, "epoch": 1178} {"train_loss": -5.74151611328125, "global_step": 49505, "epoch": 1178} {"train_loss": -5.615076541900635, "global_step": 49506, "epoch": 1178} {"train_loss": -5.781927585601807, "global_step": 49507, "epoch": 1178} {"train_loss": -5.718006134033203, "global_step": 49508, "epoch": 1178} {"train_loss": -5.665090084075928, "global_step": 49509, "epoch": 1178} {"train_loss": -5.752298831939697, "global_step": 49510, "epoch": 1178} {"train_loss": -5.69630765914917, "global_step": 49511, "epoch": 1178} {"train_loss": -5.730863571166992, "global_step": 49512, "epoch": 1178} {"train_loss": -5.616677284240723, "global_step": 49513, "epoch": 1178} {"train_loss": -5.690611839294434, "global_step": 49514, "epoch": 1178} {"train_loss": -5.630887031555176, "global_step": 49515, "epoch": 1178} {"train_loss": -5.630257606506348, "global_step": 49516, "epoch": 1178} {"train_loss": -5.73922754469372, "global_step": 49517, "epoch": 1178, "val_loss": 74481.3125} {"train_loss": -5.777152061462402, "global_step": 49518, "epoch": 1179} {"train_loss": -5.775275230407715, "global_step": 49519, "epoch": 1179} {"train_loss": -5.831898212432861, "global_step": 49520, "epoch": 1179} {"train_loss": -5.794390678405762, "global_step": 49521, "epoch": 1179} {"train_loss": -5.732721328735352, "global_step": 49522, "epoch": 1179} {"train_loss": -5.724689483642578, "global_step": 49523, "epoch": 1179} {"train_loss": -5.781795501708984, "global_step": 49524, "epoch": 1179} {"train_loss": -5.914096355438232, "global_step": 49525, "epoch": 1179} {"train_loss": -5.759831428527832, "global_step": 49526, "epoch": 1179} {"train_loss": -5.774287223815918, "global_step": 49527, "epoch": 1179} {"train_loss": -5.717604637145996, "global_step": 49528, "epoch": 1179} {"train_loss": -5.693540573120117, "global_step": 49529, "epoch": 1179} {"train_loss": -5.7578020095825195, "global_step": 49530, "epoch": 1179} {"train_loss": -5.901487350463867, "global_step": 49531, "epoch": 1179} {"train_loss": -5.739016056060791, "global_step": 49532, "epoch": 1179} {"train_loss": -6.015403747558594, "global_step": 49533, "epoch": 1179} {"train_loss": -5.775228500366211, "global_step": 49534, "epoch": 1179} {"train_loss": -5.7180585861206055, "global_step": 49535, "epoch": 1179} {"train_loss": -5.8397369384765625, "global_step": 49536, "epoch": 1179} {"train_loss": -5.750088691711426, "global_step": 49537, "epoch": 1179} {"train_loss": -5.675230026245117, "global_step": 49538, "epoch": 1179} {"train_loss": -5.699899673461914, "global_step": 49539, "epoch": 1179} {"train_loss": -5.692698955535889, "global_step": 49540, "epoch": 1179} {"train_loss": -5.735934734344482, "global_step": 49541, "epoch": 1179} {"train_loss": -5.72415828704834, "global_step": 49542, "epoch": 1179} {"train_loss": -5.757295608520508, "global_step": 49543, "epoch": 1179} {"train_loss": -5.713815689086914, "global_step": 49544, "epoch": 1179} {"train_loss": -5.626031875610352, "global_step": 49545, "epoch": 1179} {"train_loss": -5.797336578369141, "global_step": 49546, "epoch": 1179} {"train_loss": -5.78190279006958, "global_step": 49547, "epoch": 1179} {"train_loss": -5.763005256652832, "global_step": 49548, "epoch": 1179} {"train_loss": -5.789332389831543, "global_step": 49549, "epoch": 1179} {"train_loss": -5.7939863204956055, "global_step": 49550, "epoch": 1179} {"train_loss": -5.724663734436035, "global_step": 49551, "epoch": 1179} {"train_loss": -5.755073547363281, "global_step": 49552, "epoch": 1179} {"train_loss": -5.665188789367676, "global_step": 49553, "epoch": 1179} {"train_loss": -5.703951358795166, "global_step": 49554, "epoch": 1179} {"train_loss": -5.790913105010986, "global_step": 49555, "epoch": 1179} {"train_loss": -5.722467422485352, "global_step": 49556, "epoch": 1179} {"train_loss": -5.7927961349487305, "global_step": 49557, "epoch": 1179} {"train_loss": -5.85457181930542, "global_step": 49558, "epoch": 1179} {"train_loss": -5.7661007813044955, "global_step": 49559, "epoch": 1179, "val_loss": 74501.234375} {"train_loss": -5.736208915710449, "global_step": 49560, "epoch": 1180} {"train_loss": -5.711142539978027, "global_step": 49561, "epoch": 1180} {"train_loss": -5.840529441833496, "global_step": 49562, "epoch": 1180} {"train_loss": -5.694238185882568, "global_step": 49563, "epoch": 1180} {"train_loss": -5.615988254547119, "global_step": 49564, "epoch": 1180} {"train_loss": -5.778450965881348, "global_step": 49565, "epoch": 1180} {"train_loss": -5.821418285369873, "global_step": 49566, "epoch": 1180} {"train_loss": -5.7502241134643555, "global_step": 49567, "epoch": 1180} {"train_loss": -5.809601783752441, "global_step": 49568, "epoch": 1180} {"train_loss": -5.597887992858887, "global_step": 49569, "epoch": 1180} {"train_loss": -5.900252819061279, "global_step": 49570, "epoch": 1180} {"train_loss": -5.639193058013916, "global_step": 49571, "epoch": 1180} {"train_loss": -5.643285274505615, "global_step": 49572, "epoch": 1180} {"train_loss": -5.852663516998291, "global_step": 49573, "epoch": 1180} {"train_loss": -5.837396621704102, "global_step": 49574, "epoch": 1180} {"train_loss": -5.885006904602051, "global_step": 49575, "epoch": 1180} {"train_loss": -5.779059410095215, "global_step": 49576, "epoch": 1180} {"train_loss": -5.734837532043457, "global_step": 49577, "epoch": 1180} {"train_loss": -5.659753799438477, "global_step": 49578, "epoch": 1180} {"train_loss": -5.787120342254639, "global_step": 49579, "epoch": 1180} {"train_loss": -5.7194294929504395, "global_step": 49580, "epoch": 1180} {"train_loss": -5.695713043212891, "global_step": 49581, "epoch": 1180} {"train_loss": -5.718403339385986, "global_step": 49582, "epoch": 1180} {"train_loss": -5.827520847320557, "global_step": 49583, "epoch": 1180} {"train_loss": -5.7895026206970215, "global_step": 49584, "epoch": 1180} {"train_loss": -5.7308197021484375, "global_step": 49585, "epoch": 1180} {"train_loss": -5.8374223709106445, "global_step": 49586, "epoch": 1180} {"train_loss": -5.854814529418945, "global_step": 49587, "epoch": 1180} {"train_loss": -5.872792720794678, "global_step": 49588, "epoch": 1180} {"train_loss": -5.672806739807129, "global_step": 49589, "epoch": 1180} {"train_loss": -5.840731620788574, "global_step": 49590, "epoch": 1180} {"train_loss": -5.7010345458984375, "global_step": 49591, "epoch": 1180} {"train_loss": -5.768156051635742, "global_step": 49592, "epoch": 1180} {"train_loss": -5.762148857116699, "global_step": 49593, "epoch": 1180} {"train_loss": -5.843242645263672, "global_step": 49594, "epoch": 1180} {"train_loss": -5.811919689178467, "global_step": 49595, "epoch": 1180} {"train_loss": -5.737576484680176, "global_step": 49596, "epoch": 1180} {"train_loss": -5.755891799926758, "global_step": 49597, "epoch": 1180} {"train_loss": -5.796582221984863, "global_step": 49598, "epoch": 1180} {"train_loss": -5.651694297790527, "global_step": 49599, "epoch": 1180} {"train_loss": -5.813129425048828, "global_step": 49600, "epoch": 1180} {"train_loss": -5.764060304278419, "global_step": 49601, "epoch": 1180, "val_loss": 74025.9921875} {"train_loss": -5.790957450866699, "global_step": 49602, "epoch": 1181} {"train_loss": -5.775726318359375, "global_step": 49603, "epoch": 1181} {"train_loss": -5.766544818878174, "global_step": 49604, "epoch": 1181} {"train_loss": -5.810888767242432, "global_step": 49605, "epoch": 1181} {"train_loss": -6.015867710113525, "global_step": 49606, "epoch": 1181} {"train_loss": -5.810086250305176, "global_step": 49607, "epoch": 1181} {"train_loss": -5.710359573364258, "global_step": 49608, "epoch": 1181} {"train_loss": -5.8101348876953125, "global_step": 49609, "epoch": 1181} {"train_loss": -5.7357940673828125, "global_step": 49610, "epoch": 1181} {"train_loss": -5.867457866668701, "global_step": 49611, "epoch": 1181} {"train_loss": -5.800567150115967, "global_step": 49612, "epoch": 1181} {"train_loss": -5.768831253051758, "global_step": 49613, "epoch": 1181} {"train_loss": -5.685306549072266, "global_step": 49614, "epoch": 1181} {"train_loss": -5.792961597442627, "global_step": 49615, "epoch": 1181} {"train_loss": -5.652337074279785, "global_step": 49616, "epoch": 1181} {"train_loss": -5.696342468261719, "global_step": 49617, "epoch": 1181} {"train_loss": -5.682518005371094, "global_step": 49618, "epoch": 1181} {"train_loss": -5.76597261428833, "global_step": 49619, "epoch": 1181} {"train_loss": -5.866939067840576, "global_step": 49620, "epoch": 1181} {"train_loss": -5.854325294494629, "global_step": 49621, "epoch": 1181} {"train_loss": -5.7355637550354, "global_step": 49622, "epoch": 1181} {"train_loss": -5.7441325187683105, "global_step": 49623, "epoch": 1181} {"train_loss": -5.717681884765625, "global_step": 49624, "epoch": 1181} {"train_loss": -5.84351921081543, "global_step": 49625, "epoch": 1181} {"train_loss": -5.694033622741699, "global_step": 49626, "epoch": 1181} {"train_loss": -5.751954078674316, "global_step": 49627, "epoch": 1181} {"train_loss": -5.656472206115723, "global_step": 49628, "epoch": 1181} {"train_loss": -5.748315811157227, "global_step": 49629, "epoch": 1181} {"train_loss": -5.676634788513184, "global_step": 49630, "epoch": 1181} {"train_loss": -5.843197822570801, "global_step": 49631, "epoch": 1181} {"train_loss": -5.7364888191223145, "global_step": 49632, "epoch": 1181} {"train_loss": -5.728995323181152, "global_step": 49633, "epoch": 1181} {"train_loss": -5.714056491851807, "global_step": 49634, "epoch": 1181} {"train_loss": -5.714991092681885, "global_step": 49635, "epoch": 1181} {"train_loss": -5.650763988494873, "global_step": 49636, "epoch": 1181} {"train_loss": -5.667935371398926, "global_step": 49637, "epoch": 1181} {"train_loss": -5.68304443359375, "global_step": 49638, "epoch": 1181} {"train_loss": -5.7756500244140625, "global_step": 49639, "epoch": 1181} {"train_loss": -5.826433181762695, "global_step": 49640, "epoch": 1181} {"train_loss": -5.815759658813477, "global_step": 49641, "epoch": 1181} {"train_loss": -5.820137977600098, "global_step": 49642, "epoch": 1181} {"train_loss": -5.7639042763482955, "global_step": 49643, "epoch": 1181, "val_loss": 74075.3984375} {"train_loss": -5.759397506713867, "global_step": 49644, "epoch": 1182} {"train_loss": -5.8483967781066895, "global_step": 49645, "epoch": 1182} {"train_loss": -5.870693206787109, "global_step": 49646, "epoch": 1182} {"train_loss": -5.759819030761719, "global_step": 49647, "epoch": 1182} {"train_loss": -5.73828649520874, "global_step": 49648, "epoch": 1182} {"train_loss": -5.883755207061768, "global_step": 49649, "epoch": 1182} {"train_loss": -5.73043155670166, "global_step": 49650, "epoch": 1182} {"train_loss": -5.792300701141357, "global_step": 49651, "epoch": 1182} {"train_loss": -5.857927322387695, "global_step": 49652, "epoch": 1182} {"train_loss": -5.713173866271973, "global_step": 49653, "epoch": 1182} {"train_loss": -5.843379497528076, "global_step": 49654, "epoch": 1182} {"train_loss": -5.697269439697266, "global_step": 49655, "epoch": 1182} {"train_loss": -5.783931732177734, "global_step": 49656, "epoch": 1182} {"train_loss": -5.805659294128418, "global_step": 49657, "epoch": 1182} {"train_loss": -5.7111053466796875, "global_step": 49658, "epoch": 1182} {"train_loss": -5.7460222244262695, "global_step": 49659, "epoch": 1182} {"train_loss": -5.734930992126465, "global_step": 49660, "epoch": 1182} {"train_loss": -5.738940238952637, "global_step": 49661, "epoch": 1182} {"train_loss": -5.6703901290893555, "global_step": 49662, "epoch": 1182} {"train_loss": -5.783241271972656, "global_step": 49663, "epoch": 1182} {"train_loss": -5.6134185791015625, "global_step": 49664, "epoch": 1182} {"train_loss": -5.78565788269043, "global_step": 49665, "epoch": 1182} {"train_loss": -5.735980033874512, "global_step": 49666, "epoch": 1182} {"train_loss": -5.742059230804443, "global_step": 49667, "epoch": 1182} {"train_loss": -5.867799282073975, "global_step": 49668, "epoch": 1182} {"train_loss": -5.815779209136963, "global_step": 49669, "epoch": 1182} {"train_loss": -5.720808029174805, "global_step": 49670, "epoch": 1182} {"train_loss": -5.789120674133301, "global_step": 49671, "epoch": 1182} {"train_loss": -5.798274993896484, "global_step": 49672, "epoch": 1182} {"train_loss": -5.711536407470703, "global_step": 49673, "epoch": 1182} {"train_loss": -5.756050109863281, "global_step": 49674, "epoch": 1182} {"train_loss": -5.7547287940979, "global_step": 49675, "epoch": 1182} {"train_loss": -5.77855110168457, "global_step": 49676, "epoch": 1182} {"train_loss": -5.766645431518555, "global_step": 49677, "epoch": 1182} {"train_loss": -5.790812015533447, "global_step": 49678, "epoch": 1182} {"train_loss": -5.777531623840332, "global_step": 49679, "epoch": 1182} {"train_loss": -5.854788303375244, "global_step": 49680, "epoch": 1182} {"train_loss": -5.802649021148682, "global_step": 49681, "epoch": 1182} {"train_loss": -5.869428634643555, "global_step": 49682, "epoch": 1182} {"train_loss": -5.8542656898498535, "global_step": 49683, "epoch": 1182} {"train_loss": -5.778312683105469, "global_step": 49684, "epoch": 1182} {"train_loss": -5.778296243576777, "global_step": 49685, "epoch": 1182, "val_loss": 74277.1328125} {"train_loss": -5.860886573791504, "global_step": 49686, "epoch": 1183} {"train_loss": -5.729035377502441, "global_step": 49687, "epoch": 1183} {"train_loss": -5.774815559387207, "global_step": 49688, "epoch": 1183} {"train_loss": -5.805158615112305, "global_step": 49689, "epoch": 1183} {"train_loss": -5.861394882202148, "global_step": 49690, "epoch": 1183} {"train_loss": -5.8566083908081055, "global_step": 49691, "epoch": 1183} {"train_loss": -5.718135833740234, "global_step": 49692, "epoch": 1183} {"train_loss": -5.557317733764648, "global_step": 49693, "epoch": 1183} {"train_loss": -5.762418746948242, "global_step": 49694, "epoch": 1183} {"train_loss": -5.666533470153809, "global_step": 49695, "epoch": 1183} {"train_loss": -5.5161662101745605, "global_step": 49696, "epoch": 1183} {"train_loss": -5.874399185180664, "global_step": 49697, "epoch": 1183} {"train_loss": -5.717226982116699, "global_step": 49698, "epoch": 1183} {"train_loss": -5.816208839416504, "global_step": 49699, "epoch": 1183} {"train_loss": -5.758301734924316, "global_step": 49700, "epoch": 1183} {"train_loss": -5.674637317657471, "global_step": 49701, "epoch": 1183} {"train_loss": -5.692338466644287, "global_step": 49702, "epoch": 1183} {"train_loss": -5.705844879150391, "global_step": 49703, "epoch": 1183} {"train_loss": -5.739519119262695, "global_step": 49704, "epoch": 1183} {"train_loss": -5.68781042098999, "global_step": 49705, "epoch": 1183} {"train_loss": -5.683717727661133, "global_step": 49706, "epoch": 1183} {"train_loss": -5.836587905883789, "global_step": 49707, "epoch": 1183} {"train_loss": -5.755163192749023, "global_step": 49708, "epoch": 1183} {"train_loss": -5.70689582824707, "global_step": 49709, "epoch": 1183} {"train_loss": -5.839498519897461, "global_step": 49710, "epoch": 1183} {"train_loss": -5.69367790222168, "global_step": 49711, "epoch": 1183} {"train_loss": -5.789361953735352, "global_step": 49712, "epoch": 1183} {"train_loss": -5.6088175773620605, "global_step": 49713, "epoch": 1183} {"train_loss": -5.787509918212891, "global_step": 49714, "epoch": 1183} {"train_loss": -5.802302360534668, "global_step": 49715, "epoch": 1183} {"train_loss": -5.6179399490356445, "global_step": 49716, "epoch": 1183} {"train_loss": -5.830534934997559, "global_step": 49717, "epoch": 1183} {"train_loss": -5.681249141693115, "global_step": 49718, "epoch": 1183} {"train_loss": -5.669046401977539, "global_step": 49719, "epoch": 1183} {"train_loss": -5.719152450561523, "global_step": 49720, "epoch": 1183} {"train_loss": -5.754884243011475, "global_step": 49721, "epoch": 1183} {"train_loss": -5.794417381286621, "global_step": 49722, "epoch": 1183} {"train_loss": -5.777960777282715, "global_step": 49723, "epoch": 1183} {"train_loss": -5.640158653259277, "global_step": 49724, "epoch": 1183} {"train_loss": -5.892955780029297, "global_step": 49725, "epoch": 1183} {"train_loss": -5.697909355163574, "global_step": 49726, "epoch": 1183} {"train_loss": -5.742951177415394, "global_step": 49727, "epoch": 1183, "val_loss": 74125.6875} {"train_loss": -5.71095085144043, "global_step": 49728, "epoch": 1184} {"train_loss": -5.845717430114746, "global_step": 49729, "epoch": 1184} {"train_loss": -5.754947662353516, "global_step": 49730, "epoch": 1184} {"train_loss": -5.874049186706543, "global_step": 49731, "epoch": 1184} {"train_loss": -5.918093681335449, "global_step": 49732, "epoch": 1184} {"train_loss": -5.58512020111084, "global_step": 49733, "epoch": 1184} {"train_loss": -5.691256523132324, "global_step": 49734, "epoch": 1184} {"train_loss": -5.718955039978027, "global_step": 49735, "epoch": 1184} {"train_loss": -5.705312728881836, "global_step": 49736, "epoch": 1184} {"train_loss": -5.702297210693359, "global_step": 49737, "epoch": 1184} {"train_loss": -5.7640581130981445, "global_step": 49738, "epoch": 1184} {"train_loss": -5.7109375, "global_step": 49739, "epoch": 1184} {"train_loss": -5.780069351196289, "global_step": 49740, "epoch": 1184} {"train_loss": -5.77451229095459, "global_step": 49741, "epoch": 1184} {"train_loss": -5.714111804962158, "global_step": 49742, "epoch": 1184} {"train_loss": -5.816225051879883, "global_step": 49743, "epoch": 1184} {"train_loss": -5.782728672027588, "global_step": 49744, "epoch": 1184} {"train_loss": -5.833806037902832, "global_step": 49745, "epoch": 1184} {"train_loss": -5.65961217880249, "global_step": 49746, "epoch": 1184} {"train_loss": -5.780550479888916, "global_step": 49747, "epoch": 1184} {"train_loss": -5.875877857208252, "global_step": 49748, "epoch": 1184} {"train_loss": -5.6966094970703125, "global_step": 49749, "epoch": 1184} {"train_loss": -5.736138343811035, "global_step": 49750, "epoch": 1184} {"train_loss": -5.828544616699219, "global_step": 49751, "epoch": 1184} {"train_loss": -5.800722122192383, "global_step": 49752, "epoch": 1184} {"train_loss": -5.688542366027832, "global_step": 49753, "epoch": 1184} {"train_loss": -5.891875267028809, "global_step": 49754, "epoch": 1184} {"train_loss": -5.874744415283203, "global_step": 49755, "epoch": 1184} {"train_loss": -5.6915740966796875, "global_step": 49756, "epoch": 1184} {"train_loss": -5.787196159362793, "global_step": 49757, "epoch": 1184} {"train_loss": -5.7677788734436035, "global_step": 49758, "epoch": 1184} {"train_loss": -5.754436016082764, "global_step": 49759, "epoch": 1184} {"train_loss": -5.807652473449707, "global_step": 49760, "epoch": 1184} {"train_loss": -5.808420658111572, "global_step": 49761, "epoch": 1184} {"train_loss": -5.822164535522461, "global_step": 49762, "epoch": 1184} {"train_loss": -5.799907684326172, "global_step": 49763, "epoch": 1184} {"train_loss": -5.783150672912598, "global_step": 49764, "epoch": 1184} {"train_loss": -5.804210662841797, "global_step": 49765, "epoch": 1184} {"train_loss": -5.76059627532959, "global_step": 49766, "epoch": 1184} {"train_loss": -5.653757572174072, "global_step": 49767, "epoch": 1184} {"train_loss": -5.772599697113037, "global_step": 49768, "epoch": 1184} {"train_loss": -5.770898977915446, "global_step": 49769, "epoch": 1184, "val_loss": 74214.46875} {"train_loss": -5.7849202156066895, "global_step": 49770, "epoch": 1185} {"train_loss": -5.818408012390137, "global_step": 49771, "epoch": 1185} {"train_loss": -5.865544319152832, "global_step": 49772, "epoch": 1185} {"train_loss": -5.881871700286865, "global_step": 49773, "epoch": 1185} {"train_loss": -5.847508907318115, "global_step": 49774, "epoch": 1185} {"train_loss": -5.816287994384766, "global_step": 49775, "epoch": 1185} {"train_loss": -5.82930850982666, "global_step": 49776, "epoch": 1185} {"train_loss": -5.785580635070801, "global_step": 49777, "epoch": 1185} {"train_loss": -5.986717224121094, "global_step": 49778, "epoch": 1185} {"train_loss": -5.884979248046875, "global_step": 49779, "epoch": 1185} {"train_loss": -5.843262672424316, "global_step": 49780, "epoch": 1185} {"train_loss": -5.840434551239014, "global_step": 49781, "epoch": 1185} {"train_loss": -5.753054618835449, "global_step": 49782, "epoch": 1185} {"train_loss": -5.5947675704956055, "global_step": 49783, "epoch": 1185} {"train_loss": -5.811278343200684, "global_step": 49784, "epoch": 1185} {"train_loss": -5.5523271560668945, "global_step": 49785, "epoch": 1185} {"train_loss": -5.724555492401123, "global_step": 49786, "epoch": 1185} {"train_loss": -5.72832727432251, "global_step": 49787, "epoch": 1185} {"train_loss": -5.69938850402832, "global_step": 49788, "epoch": 1185} {"train_loss": -5.758028030395508, "global_step": 49789, "epoch": 1185} {"train_loss": -5.701572895050049, "global_step": 49790, "epoch": 1185} {"train_loss": -5.694515705108643, "global_step": 49791, "epoch": 1185} {"train_loss": -5.726027011871338, "global_step": 49792, "epoch": 1185} {"train_loss": -5.661351203918457, "global_step": 49793, "epoch": 1185} {"train_loss": -5.791686058044434, "global_step": 49794, "epoch": 1185} {"train_loss": -5.632416725158691, "global_step": 49795, "epoch": 1185} {"train_loss": -5.655918121337891, "global_step": 49796, "epoch": 1185} {"train_loss": -5.84686803817749, "global_step": 49797, "epoch": 1185} {"train_loss": -5.802548408508301, "global_step": 49798, "epoch": 1185} {"train_loss": -5.764840126037598, "global_step": 49799, "epoch": 1185} {"train_loss": -5.817895412445068, "global_step": 49800, "epoch": 1185} {"train_loss": -5.820742130279541, "global_step": 49801, "epoch": 1185} {"train_loss": -5.861560821533203, "global_step": 49802, "epoch": 1185} {"train_loss": -5.723443508148193, "global_step": 49803, "epoch": 1185} {"train_loss": -5.706671237945557, "global_step": 49804, "epoch": 1185} {"train_loss": -5.740962982177734, "global_step": 49805, "epoch": 1185} {"train_loss": -5.808306694030762, "global_step": 49806, "epoch": 1185} {"train_loss": -5.723909378051758, "global_step": 49807, "epoch": 1185} {"train_loss": -5.76932430267334, "global_step": 49808, "epoch": 1185} {"train_loss": -5.762511730194092, "global_step": 49809, "epoch": 1185} {"train_loss": -5.74508810043335, "global_step": 49810, "epoch": 1185} {"train_loss": -5.772067807969593, "global_step": 49811, "epoch": 1185, "val_loss": 74253.1640625} {"train_loss": -5.801597595214844, "global_step": 49812, "epoch": 1186} {"train_loss": -5.713850975036621, "global_step": 49813, "epoch": 1186} {"train_loss": -5.80805778503418, "global_step": 49814, "epoch": 1186} {"train_loss": -5.611752510070801, "global_step": 49815, "epoch": 1186} {"train_loss": -5.740508079528809, "global_step": 49816, "epoch": 1186} {"train_loss": -5.790330410003662, "global_step": 49817, "epoch": 1186} {"train_loss": -5.653736114501953, "global_step": 49818, "epoch": 1186} {"train_loss": -5.8165059089660645, "global_step": 49819, "epoch": 1186} {"train_loss": -5.742649555206299, "global_step": 49820, "epoch": 1186} {"train_loss": -5.618114948272705, "global_step": 49821, "epoch": 1186} {"train_loss": -5.804945945739746, "global_step": 49822, "epoch": 1186} {"train_loss": -5.571237564086914, "global_step": 49823, "epoch": 1186} {"train_loss": -5.680601596832275, "global_step": 49824, "epoch": 1186} {"train_loss": -5.756689548492432, "global_step": 49825, "epoch": 1186} {"train_loss": -5.741330146789551, "global_step": 49826, "epoch": 1186} {"train_loss": -5.735870361328125, "global_step": 49827, "epoch": 1186} {"train_loss": -5.672436237335205, "global_step": 49828, "epoch": 1186} {"train_loss": -5.633508682250977, "global_step": 49829, "epoch": 1186} {"train_loss": -5.587413787841797, "global_step": 49830, "epoch": 1186} {"train_loss": -5.713983535766602, "global_step": 49831, "epoch": 1186} {"train_loss": -5.67509651184082, "global_step": 49832, "epoch": 1186} {"train_loss": -5.835330009460449, "global_step": 49833, "epoch": 1186} {"train_loss": -5.858517646789551, "global_step": 49834, "epoch": 1186} {"train_loss": -5.849675178527832, "global_step": 49835, "epoch": 1186} {"train_loss": -5.78890323638916, "global_step": 49836, "epoch": 1186} {"train_loss": -5.7085347175598145, "global_step": 49837, "epoch": 1186} {"train_loss": -5.896223068237305, "global_step": 49838, "epoch": 1186} {"train_loss": -5.71242094039917, "global_step": 49839, "epoch": 1186} {"train_loss": -5.790346145629883, "global_step": 49840, "epoch": 1186} {"train_loss": -5.824525833129883, "global_step": 49841, "epoch": 1186} {"train_loss": -5.655058860778809, "global_step": 49842, "epoch": 1186} {"train_loss": -5.907040596008301, "global_step": 49843, "epoch": 1186} {"train_loss": -5.602675914764404, "global_step": 49844, "epoch": 1186} {"train_loss": -5.752650260925293, "global_step": 49845, "epoch": 1186} {"train_loss": -5.834809303283691, "global_step": 49846, "epoch": 1186} {"train_loss": -5.758281230926514, "global_step": 49847, "epoch": 1186} {"train_loss": -5.779260635375977, "global_step": 49848, "epoch": 1186} {"train_loss": -5.774352073669434, "global_step": 49849, "epoch": 1186} {"train_loss": -5.748802185058594, "global_step": 49850, "epoch": 1186} {"train_loss": -5.850652694702148, "global_step": 49851, "epoch": 1186} {"train_loss": -5.822176933288574, "global_step": 49852, "epoch": 1186} {"train_loss": -5.745715822492327, "global_step": 49853, "epoch": 1186, "val_loss": 74324.7109375} {"train_loss": -5.869866371154785, "global_step": 49854, "epoch": 1187} {"train_loss": -5.784562110900879, "global_step": 49855, "epoch": 1187} {"train_loss": -5.798554420471191, "global_step": 49856, "epoch": 1187} {"train_loss": -5.827592849731445, "global_step": 49857, "epoch": 1187} {"train_loss": -5.816351890563965, "global_step": 49858, "epoch": 1187} {"train_loss": -5.7525739669799805, "global_step": 49859, "epoch": 1187} {"train_loss": -5.646546363830566, "global_step": 49860, "epoch": 1187} {"train_loss": -5.89150333404541, "global_step": 49861, "epoch": 1187} {"train_loss": -5.850532531738281, "global_step": 49862, "epoch": 1187} {"train_loss": -5.697740077972412, "global_step": 49863, "epoch": 1187} {"train_loss": -5.838611602783203, "global_step": 49864, "epoch": 1187} {"train_loss": -5.800814628601074, "global_step": 49865, "epoch": 1187} {"train_loss": -5.768826484680176, "global_step": 49866, "epoch": 1187} {"train_loss": -5.795313835144043, "global_step": 49867, "epoch": 1187} {"train_loss": -5.6811699867248535, "global_step": 49868, "epoch": 1187} {"train_loss": -5.810223579406738, "global_step": 49869, "epoch": 1187} {"train_loss": -5.74720573425293, "global_step": 49870, "epoch": 1187} {"train_loss": -5.752923965454102, "global_step": 49871, "epoch": 1187} {"train_loss": -5.72437047958374, "global_step": 49872, "epoch": 1187} {"train_loss": -5.767467021942139, "global_step": 49873, "epoch": 1187} {"train_loss": -5.6413373947143555, "global_step": 49874, "epoch": 1187} {"train_loss": -5.70065975189209, "global_step": 49875, "epoch": 1187} {"train_loss": -5.695065975189209, "global_step": 49876, "epoch": 1187} {"train_loss": -5.662463188171387, "global_step": 49877, "epoch": 1187} {"train_loss": -5.739389896392822, "global_step": 49878, "epoch": 1187} {"train_loss": -5.641857624053955, "global_step": 49879, "epoch": 1187} {"train_loss": -5.62155294418335, "global_step": 49880, "epoch": 1187} {"train_loss": -5.694965839385986, "global_step": 49881, "epoch": 1187} {"train_loss": -5.70473575592041, "global_step": 49882, "epoch": 1187} {"train_loss": -5.753586292266846, "global_step": 49883, "epoch": 1187} {"train_loss": -5.7646660804748535, "global_step": 49884, "epoch": 1187} {"train_loss": -5.807908058166504, "global_step": 49885, "epoch": 1187} {"train_loss": -5.722716808319092, "global_step": 49886, "epoch": 1187} {"train_loss": -5.829503059387207, "global_step": 49887, "epoch": 1187} {"train_loss": -5.662569046020508, "global_step": 49888, "epoch": 1187} {"train_loss": -5.754193305969238, "global_step": 49889, "epoch": 1187} {"train_loss": -5.789765357971191, "global_step": 49890, "epoch": 1187} {"train_loss": -5.798161506652832, "global_step": 49891, "epoch": 1187} {"train_loss": -5.788407325744629, "global_step": 49892, "epoch": 1187} {"train_loss": -5.746264457702637, "global_step": 49893, "epoch": 1187} {"train_loss": -5.690395832061768, "global_step": 49894, "epoch": 1187} {"train_loss": -5.7522529647463845, "global_step": 49895, "epoch": 1187, "val_loss": 74352.1875} {"train_loss": -5.7226104736328125, "global_step": 49896, "epoch": 1188} {"train_loss": -5.778292655944824, "global_step": 49897, "epoch": 1188} {"train_loss": -5.8079094886779785, "global_step": 49898, "epoch": 1188} {"train_loss": -5.803496360778809, "global_step": 49899, "epoch": 1188} {"train_loss": -5.739959239959717, "global_step": 49900, "epoch": 1188} {"train_loss": -5.764334678649902, "global_step": 49901, "epoch": 1188} {"train_loss": -5.765840530395508, "global_step": 49902, "epoch": 1188} {"train_loss": -5.766839027404785, "global_step": 49903, "epoch": 1188} {"train_loss": -5.769773483276367, "global_step": 49904, "epoch": 1188} {"train_loss": -5.788459777832031, "global_step": 49905, "epoch": 1188} {"train_loss": -5.625247955322266, "global_step": 49906, "epoch": 1188} {"train_loss": -5.709595203399658, "global_step": 49907, "epoch": 1188} {"train_loss": -5.732113838195801, "global_step": 49908, "epoch": 1188} {"train_loss": -5.7198004722595215, "global_step": 49909, "epoch": 1188} {"train_loss": -5.721634864807129, "global_step": 49910, "epoch": 1188} {"train_loss": -5.679002285003662, "global_step": 49911, "epoch": 1188} {"train_loss": -5.641523361206055, "global_step": 49912, "epoch": 1188} {"train_loss": -5.691533088684082, "global_step": 49913, "epoch": 1188} {"train_loss": -5.6107659339904785, "global_step": 49914, "epoch": 1188} {"train_loss": -5.671072006225586, "global_step": 49915, "epoch": 1188} {"train_loss": -5.671463489532471, "global_step": 49916, "epoch": 1188} {"train_loss": -5.628692626953125, "global_step": 49917, "epoch": 1188} {"train_loss": -5.637451648712158, "global_step": 49918, "epoch": 1188} {"train_loss": -5.7486653327941895, "global_step": 49919, "epoch": 1188} {"train_loss": -5.743610382080078, "global_step": 49920, "epoch": 1188} {"train_loss": -5.649934768676758, "global_step": 49921, "epoch": 1188} {"train_loss": -5.793445110321045, "global_step": 49922, "epoch": 1188} {"train_loss": -5.636458396911621, "global_step": 49923, "epoch": 1188} {"train_loss": -5.741325378417969, "global_step": 49924, "epoch": 1188} {"train_loss": -5.695486068725586, "global_step": 49925, "epoch": 1188} {"train_loss": -5.66138219833374, "global_step": 49926, "epoch": 1188} {"train_loss": -5.77421760559082, "global_step": 49927, "epoch": 1188} {"train_loss": -5.756475925445557, "global_step": 49928, "epoch": 1188} {"train_loss": -5.675602912902832, "global_step": 49929, "epoch": 1188} {"train_loss": -5.778359413146973, "global_step": 49930, "epoch": 1188} {"train_loss": -5.8412580490112305, "global_step": 49931, "epoch": 1188} {"train_loss": -5.831881999969482, "global_step": 49932, "epoch": 1188} {"train_loss": -5.750497817993164, "global_step": 49933, "epoch": 1188} {"train_loss": -5.7600626945495605, "global_step": 49934, "epoch": 1188} {"train_loss": -5.841163158416748, "global_step": 49935, "epoch": 1188} {"train_loss": -5.723818302154541, "global_step": 49936, "epoch": 1188} {"train_loss": -5.72992315746489, "global_step": 49937, "epoch": 1188, "val_loss": 74190.8203125} {"train_loss": -5.758727073669434, "global_step": 49938, "epoch": 1189} {"train_loss": -5.712719440460205, "global_step": 49939, "epoch": 1189} {"train_loss": -5.807606220245361, "global_step": 49940, "epoch": 1189} {"train_loss": -5.758923053741455, "global_step": 49941, "epoch": 1189} {"train_loss": -5.71681022644043, "global_step": 49942, "epoch": 1189} {"train_loss": -5.708754539489746, "global_step": 49943, "epoch": 1189} {"train_loss": -5.681677341461182, "global_step": 49944, "epoch": 1189} {"train_loss": -5.786710739135742, "global_step": 49945, "epoch": 1189} {"train_loss": -5.599734306335449, "global_step": 49946, "epoch": 1189} {"train_loss": -5.8503923416137695, "global_step": 49947, "epoch": 1189} {"train_loss": -5.618134498596191, "global_step": 49948, "epoch": 1189} {"train_loss": -5.65456485748291, "global_step": 49949, "epoch": 1189} {"train_loss": -5.72926139831543, "global_step": 49950, "epoch": 1189} {"train_loss": -5.580623149871826, "global_step": 49951, "epoch": 1189} {"train_loss": -5.794216156005859, "global_step": 49952, "epoch": 1189} {"train_loss": -5.747198581695557, "global_step": 49953, "epoch": 1189} {"train_loss": -5.819227695465088, "global_step": 49954, "epoch": 1189} {"train_loss": -5.6269850730896, "global_step": 49955, "epoch": 1189} {"train_loss": -5.7006964683532715, "global_step": 49956, "epoch": 1189} {"train_loss": -5.84239387512207, "global_step": 49957, "epoch": 1189} {"train_loss": -5.738746166229248, "global_step": 49958, "epoch": 1189} {"train_loss": -5.734802722930908, "global_step": 49959, "epoch": 1189} {"train_loss": -5.774387359619141, "global_step": 49960, "epoch": 1189} {"train_loss": -5.739645957946777, "global_step": 49961, "epoch": 1189} {"train_loss": -5.753170967102051, "global_step": 49962, "epoch": 1189} {"train_loss": -5.743204116821289, "global_step": 49963, "epoch": 1189} {"train_loss": -5.786211967468262, "global_step": 49964, "epoch": 1189} {"train_loss": -5.782235622406006, "global_step": 49965, "epoch": 1189} {"train_loss": -5.707520008087158, "global_step": 49966, "epoch": 1189} {"train_loss": -5.839295387268066, "global_step": 49967, "epoch": 1189} {"train_loss": -5.737339496612549, "global_step": 49968, "epoch": 1189} {"train_loss": -5.7920942306518555, "global_step": 49969, "epoch": 1189} {"train_loss": -5.8720197677612305, "global_step": 49970, "epoch": 1189} {"train_loss": -5.716497421264648, "global_step": 49971, "epoch": 1189} {"train_loss": -5.774239540100098, "global_step": 49972, "epoch": 1189} {"train_loss": -5.720404624938965, "global_step": 49973, "epoch": 1189} {"train_loss": -5.7574992179870605, "global_step": 49974, "epoch": 1189} {"train_loss": -5.7668046951293945, "global_step": 49975, "epoch": 1189} {"train_loss": -5.744748115539551, "global_step": 49976, "epoch": 1189} {"train_loss": -5.724803924560547, "global_step": 49977, "epoch": 1189} {"train_loss": -5.949344635009766, "global_step": 49978, "epoch": 1189} {"train_loss": -5.745979036603655, "global_step": 49979, "epoch": 1189, "val_loss": 73994.140625} {"train_loss": -5.757443428039551, "global_step": 49980, "epoch": 1190} {"train_loss": -5.7737717628479, "global_step": 49981, "epoch": 1190} {"train_loss": -5.852961540222168, "global_step": 49982, "epoch": 1190} {"train_loss": -5.678689956665039, "global_step": 49983, "epoch": 1190} {"train_loss": -5.680670261383057, "global_step": 49984, "epoch": 1190} {"train_loss": -5.688311576843262, "global_step": 49985, "epoch": 1190} {"train_loss": -5.636861324310303, "global_step": 49986, "epoch": 1190} {"train_loss": -5.629847526550293, "global_step": 49987, "epoch": 1190} {"train_loss": -5.767282962799072, "global_step": 49988, "epoch": 1190} {"train_loss": -5.790596008300781, "global_step": 49989, "epoch": 1190} {"train_loss": -5.86924409866333, "global_step": 49990, "epoch": 1190} {"train_loss": -5.8192291259765625, "global_step": 49991, "epoch": 1190} {"train_loss": -5.760369300842285, "global_step": 49992, "epoch": 1190} {"train_loss": -5.661870956420898, "global_step": 49993, "epoch": 1190} {"train_loss": -5.820664882659912, "global_step": 49994, "epoch": 1190} {"train_loss": -5.7830963134765625, "global_step": 49995, "epoch": 1190} {"train_loss": -5.809375286102295, "global_step": 49996, "epoch": 1190} {"train_loss": -5.832448959350586, "global_step": 49997, "epoch": 1190} {"train_loss": -5.713977336883545, "global_step": 49998, "epoch": 1190} {"train_loss": -5.779521465301514, "global_step": 49999, "epoch": 1190} {"train_loss": -5.861364364624023, "global_step": 50000, "epoch": 1190} {"train_loss": -5.825606346130371, "global_step": 50001, "epoch": 1190} {"train_loss": -5.781658172607422, "global_step": 50002, "epoch": 1190} {"train_loss": -5.729838848114014, "global_step": 50003, "epoch": 1190} {"train_loss": -5.773313522338867, "global_step": 50004, "epoch": 1190} {"train_loss": -5.856968402862549, "global_step": 50005, "epoch": 1190} {"train_loss": -5.786467552185059, "global_step": 50006, "epoch": 1190} {"train_loss": -5.77473258972168, "global_step": 50007, "epoch": 1190} {"train_loss": -5.717109203338623, "global_step": 50008, "epoch": 1190} {"train_loss": -5.653906345367432, "global_step": 50009, "epoch": 1190} {"train_loss": -5.7429118156433105, "global_step": 50010, "epoch": 1190} {"train_loss": -5.818072319030762, "global_step": 50011, "epoch": 1190} {"train_loss": -5.831073760986328, "global_step": 50012, "epoch": 1190} {"train_loss": -5.727975845336914, "global_step": 50013, "epoch": 1190} {"train_loss": -5.78773307800293, "global_step": 50014, "epoch": 1190} {"train_loss": -5.668169021606445, "global_step": 50015, "epoch": 1190} {"train_loss": -5.7310967445373535, "global_step": 50016, "epoch": 1190} {"train_loss": -5.758022308349609, "global_step": 50017, "epoch": 1190} {"train_loss": -5.851676940917969, "global_step": 50018, "epoch": 1190} {"train_loss": -5.60877799987793, "global_step": 50019, "epoch": 1190} {"train_loss": -5.708700180053711, "global_step": 50020, "epoch": 1190} {"train_loss": -5.758595182782128, "global_step": 50021, "epoch": 1190, "val_loss": 74283.9609375} {"train_loss": -5.791001319885254, "global_step": 50022, "epoch": 1191} {"train_loss": -5.785977363586426, "global_step": 50023, "epoch": 1191} {"train_loss": -5.698305130004883, "global_step": 50024, "epoch": 1191} {"train_loss": -5.702252388000488, "global_step": 50025, "epoch": 1191} {"train_loss": -5.678417682647705, "global_step": 50026, "epoch": 1191} {"train_loss": -5.699321746826172, "global_step": 50027, "epoch": 1191} {"train_loss": -5.562013626098633, "global_step": 50028, "epoch": 1191} {"train_loss": -5.70991325378418, "global_step": 50029, "epoch": 1191} {"train_loss": -5.5920610427856445, "global_step": 50030, "epoch": 1191} {"train_loss": -5.766860008239746, "global_step": 50031, "epoch": 1191} {"train_loss": -5.830940246582031, "global_step": 50032, "epoch": 1191} {"train_loss": -5.862789154052734, "global_step": 50033, "epoch": 1191} {"train_loss": -5.653583526611328, "global_step": 50034, "epoch": 1191} {"train_loss": -5.595596790313721, "global_step": 50035, "epoch": 1191} {"train_loss": -5.64027214050293, "global_step": 50036, "epoch": 1191} {"train_loss": -5.788388729095459, "global_step": 50037, "epoch": 1191} {"train_loss": -5.722761631011963, "global_step": 50038, "epoch": 1191} {"train_loss": -5.685455322265625, "global_step": 50039, "epoch": 1191} {"train_loss": -5.723408222198486, "global_step": 50040, "epoch": 1191} {"train_loss": -5.7106122970581055, "global_step": 50041, "epoch": 1191} {"train_loss": -5.548099040985107, "global_step": 50042, "epoch": 1191} {"train_loss": -5.738284111022949, "global_step": 50043, "epoch": 1191} {"train_loss": -5.635134696960449, "global_step": 50044, "epoch": 1191} {"train_loss": -5.674164772033691, "global_step": 50045, "epoch": 1191} {"train_loss": -5.7221879959106445, "global_step": 50046, "epoch": 1191} {"train_loss": -5.686088562011719, "global_step": 50047, "epoch": 1191} {"train_loss": -5.760796546936035, "global_step": 50048, "epoch": 1191} {"train_loss": -5.6527252197265625, "global_step": 50049, "epoch": 1191} {"train_loss": -5.784054756164551, "global_step": 50050, "epoch": 1191} {"train_loss": -5.675245761871338, "global_step": 50051, "epoch": 1191} {"train_loss": -5.7867817878723145, "global_step": 50052, "epoch": 1191} {"train_loss": -5.7732391357421875, "global_step": 50053, "epoch": 1191} {"train_loss": -5.807272434234619, "global_step": 50054, "epoch": 1191} {"train_loss": -5.670126438140869, "global_step": 50055, "epoch": 1191} {"train_loss": -5.733161926269531, "global_step": 50056, "epoch": 1191} {"train_loss": -5.759140491485596, "global_step": 50057, "epoch": 1191} {"train_loss": -5.716274261474609, "global_step": 50058, "epoch": 1191} {"train_loss": -5.674552917480469, "global_step": 50059, "epoch": 1191} {"train_loss": -5.722603797912598, "global_step": 50060, "epoch": 1191} {"train_loss": -5.850712776184082, "global_step": 50061, "epoch": 1191} {"train_loss": -5.887775421142578, "global_step": 50062, "epoch": 1191} {"train_loss": -5.718346164340065, "global_step": 50063, "epoch": 1191, "val_loss": 74219.28125} {"train_loss": -5.81389856338501, "global_step": 50064, "epoch": 1192} {"train_loss": -5.6829376220703125, "global_step": 50065, "epoch": 1192} {"train_loss": -5.684635162353516, "global_step": 50066, "epoch": 1192} {"train_loss": -5.762568950653076, "global_step": 50067, "epoch": 1192} {"train_loss": -5.738289833068848, "global_step": 50068, "epoch": 1192} {"train_loss": -5.724867820739746, "global_step": 50069, "epoch": 1192} {"train_loss": -5.886772632598877, "global_step": 50070, "epoch": 1192} {"train_loss": -5.862181663513184, "global_step": 50071, "epoch": 1192} {"train_loss": -5.75096321105957, "global_step": 50072, "epoch": 1192} {"train_loss": -5.771162033081055, "global_step": 50073, "epoch": 1192} {"train_loss": -5.769969940185547, "global_step": 50074, "epoch": 1192} {"train_loss": -5.7927680015563965, "global_step": 50075, "epoch": 1192} {"train_loss": -5.825591564178467, "global_step": 50076, "epoch": 1192} {"train_loss": -5.821784019470215, "global_step": 50077, "epoch": 1192} {"train_loss": -5.687921524047852, "global_step": 50078, "epoch": 1192} {"train_loss": -5.858846664428711, "global_step": 50079, "epoch": 1192} {"train_loss": -5.767881870269775, "global_step": 50080, "epoch": 1192} {"train_loss": -5.804447650909424, "global_step": 50081, "epoch": 1192} {"train_loss": -5.953968524932861, "global_step": 50082, "epoch": 1192} {"train_loss": -5.745826721191406, "global_step": 50083, "epoch": 1192} {"train_loss": -5.749237060546875, "global_step": 50084, "epoch": 1192} {"train_loss": -5.7838053703308105, "global_step": 50085, "epoch": 1192} {"train_loss": -5.785849571228027, "global_step": 50086, "epoch": 1192} {"train_loss": -5.737140655517578, "global_step": 50087, "epoch": 1192} {"train_loss": -5.920222282409668, "global_step": 50088, "epoch": 1192} {"train_loss": -5.655868053436279, "global_step": 50089, "epoch": 1192} {"train_loss": -5.7271575927734375, "global_step": 50090, "epoch": 1192} {"train_loss": -5.854173183441162, "global_step": 50091, "epoch": 1192} {"train_loss": -5.714694976806641, "global_step": 50092, "epoch": 1192} {"train_loss": -5.578325271606445, "global_step": 50093, "epoch": 1192} {"train_loss": -5.791507244110107, "global_step": 50094, "epoch": 1192} {"train_loss": -5.687458038330078, "global_step": 50095, "epoch": 1192} {"train_loss": -5.666514873504639, "global_step": 50096, "epoch": 1192} {"train_loss": -5.568292617797852, "global_step": 50097, "epoch": 1192} {"train_loss": -5.81796932220459, "global_step": 50098, "epoch": 1192} {"train_loss": -5.783100128173828, "global_step": 50099, "epoch": 1192} {"train_loss": -5.713759422302246, "global_step": 50100, "epoch": 1192} {"train_loss": -5.896761894226074, "global_step": 50101, "epoch": 1192} {"train_loss": -5.6997270584106445, "global_step": 50102, "epoch": 1192} {"train_loss": -5.7296600341796875, "global_step": 50103, "epoch": 1192} {"train_loss": -5.750069618225098, "global_step": 50104, "epoch": 1192} {"train_loss": -5.76500601995559, "global_step": 50105, "epoch": 1192, "val_loss": 74587.5078125} {"train_loss": -5.84197473526001, "global_step": 50106, "epoch": 1193} {"train_loss": -5.7472310066223145, "global_step": 50107, "epoch": 1193} {"train_loss": -5.8620147705078125, "global_step": 50108, "epoch": 1193} {"train_loss": -5.778314590454102, "global_step": 50109, "epoch": 1193} {"train_loss": -5.795299053192139, "global_step": 50110, "epoch": 1193} {"train_loss": -5.591048240661621, "global_step": 50111, "epoch": 1193} {"train_loss": -5.830739974975586, "global_step": 50112, "epoch": 1193} {"train_loss": -5.670327186584473, "global_step": 50113, "epoch": 1193} {"train_loss": -5.781904697418213, "global_step": 50114, "epoch": 1193} {"train_loss": -5.747261047363281, "global_step": 50115, "epoch": 1193} {"train_loss": -5.875019550323486, "global_step": 50116, "epoch": 1193} {"train_loss": -5.718991756439209, "global_step": 50117, "epoch": 1193} {"train_loss": -5.913244247436523, "global_step": 50118, "epoch": 1193} {"train_loss": -5.815485954284668, "global_step": 50119, "epoch": 1193} {"train_loss": -5.773710250854492, "global_step": 50120, "epoch": 1193} {"train_loss": -5.792269706726074, "global_step": 50121, "epoch": 1193} {"train_loss": -5.792426109313965, "global_step": 50122, "epoch": 1193} {"train_loss": -5.877375602722168, "global_step": 50123, "epoch": 1193} {"train_loss": -5.899672508239746, "global_step": 50124, "epoch": 1193} {"train_loss": -5.788797378540039, "global_step": 50125, "epoch": 1193} {"train_loss": -5.7966742515563965, "global_step": 50126, "epoch": 1193} {"train_loss": -5.759147644042969, "global_step": 50127, "epoch": 1193} {"train_loss": -5.774498462677002, "global_step": 50128, "epoch": 1193} {"train_loss": -5.763868808746338, "global_step": 50129, "epoch": 1193} {"train_loss": -5.685433864593506, "global_step": 50130, "epoch": 1193} {"train_loss": -5.7261505126953125, "global_step": 50131, "epoch": 1193} {"train_loss": -5.747658729553223, "global_step": 50132, "epoch": 1193} {"train_loss": -5.764981269836426, "global_step": 50133, "epoch": 1193} {"train_loss": -5.611553192138672, "global_step": 50134, "epoch": 1193} {"train_loss": -5.834987640380859, "global_step": 50135, "epoch": 1193} {"train_loss": -5.668374061584473, "global_step": 50136, "epoch": 1193} {"train_loss": -5.826595783233643, "global_step": 50137, "epoch": 1193} {"train_loss": -5.753759384155273, "global_step": 50138, "epoch": 1193} {"train_loss": -5.957059860229492, "global_step": 50139, "epoch": 1193} {"train_loss": -5.91242790222168, "global_step": 50140, "epoch": 1193} {"train_loss": -5.743246555328369, "global_step": 50141, "epoch": 1193} {"train_loss": -5.849452972412109, "global_step": 50142, "epoch": 1193} {"train_loss": -5.858880996704102, "global_step": 50143, "epoch": 1193} {"train_loss": -5.6700592041015625, "global_step": 50144, "epoch": 1193} {"train_loss": -5.769474029541016, "global_step": 50145, "epoch": 1193} {"train_loss": -5.771799087524414, "global_step": 50146, "epoch": 1193} {"train_loss": -5.785099653970628, "global_step": 50147, "epoch": 1193, "val_loss": 73997.6953125} {"train_loss": -5.833909034729004, "global_step": 50148, "epoch": 1194} {"train_loss": -5.762084007263184, "global_step": 50149, "epoch": 1194} {"train_loss": -5.88850212097168, "global_step": 50150, "epoch": 1194} {"train_loss": -5.702992916107178, "global_step": 50151, "epoch": 1194} {"train_loss": -5.7507195472717285, "global_step": 50152, "epoch": 1194} {"train_loss": -5.833375453948975, "global_step": 50153, "epoch": 1194} {"train_loss": -5.782609462738037, "global_step": 50154, "epoch": 1194} {"train_loss": -6.04120397567749, "global_step": 50155, "epoch": 1194} {"train_loss": -5.846990585327148, "global_step": 50156, "epoch": 1194} {"train_loss": -5.832465171813965, "global_step": 50157, "epoch": 1194} {"train_loss": -5.795222759246826, "global_step": 50158, "epoch": 1194} {"train_loss": -5.85366153717041, "global_step": 50159, "epoch": 1194} {"train_loss": -5.829188823699951, "global_step": 50160, "epoch": 1194} {"train_loss": -5.866358757019043, "global_step": 50161, "epoch": 1194} {"train_loss": -5.855380535125732, "global_step": 50162, "epoch": 1194} {"train_loss": -5.800145149230957, "global_step": 50163, "epoch": 1194} {"train_loss": -5.7383880615234375, "global_step": 50164, "epoch": 1194} {"train_loss": -5.832286834716797, "global_step": 50165, "epoch": 1194} {"train_loss": -5.804999351501465, "global_step": 50166, "epoch": 1194} {"train_loss": -5.834458827972412, "global_step": 50167, "epoch": 1194} {"train_loss": -5.720734596252441, "global_step": 50168, "epoch": 1194} {"train_loss": -5.810198783874512, "global_step": 50169, "epoch": 1194} {"train_loss": -5.805339813232422, "global_step": 50170, "epoch": 1194} {"train_loss": -5.789709091186523, "global_step": 50171, "epoch": 1194} {"train_loss": -5.806395530700684, "global_step": 50172, "epoch": 1194} {"train_loss": -5.822877883911133, "global_step": 50173, "epoch": 1194} {"train_loss": -5.715094566345215, "global_step": 50174, "epoch": 1194} {"train_loss": -5.724235534667969, "global_step": 50175, "epoch": 1194} {"train_loss": -5.795397758483887, "global_step": 50176, "epoch": 1194} {"train_loss": -5.631980895996094, "global_step": 50177, "epoch": 1194} {"train_loss": -5.752137184143066, "global_step": 50178, "epoch": 1194} {"train_loss": -5.880334854125977, "global_step": 50179, "epoch": 1194} {"train_loss": -5.554178714752197, "global_step": 50180, "epoch": 1194} {"train_loss": -5.679116249084473, "global_step": 50181, "epoch": 1194} {"train_loss": -5.661870956420898, "global_step": 50182, "epoch": 1194} {"train_loss": -5.67677116394043, "global_step": 50183, "epoch": 1194} {"train_loss": -5.673750877380371, "global_step": 50184, "epoch": 1194} {"train_loss": -5.7616400718688965, "global_step": 50185, "epoch": 1194} {"train_loss": -5.579442501068115, "global_step": 50186, "epoch": 1194} {"train_loss": -5.711042404174805, "global_step": 50187, "epoch": 1194} {"train_loss": -5.624086380004883, "global_step": 50188, "epoch": 1194} {"train_loss": -5.766978706632342, "global_step": 50189, "epoch": 1194, "val_loss": 74249.140625} {"train_loss": -5.726871490478516, "global_step": 50190, "epoch": 1195} {"train_loss": -5.736629009246826, "global_step": 50191, "epoch": 1195} {"train_loss": -5.865362644195557, "global_step": 50192, "epoch": 1195} {"train_loss": -5.594182968139648, "global_step": 50193, "epoch": 1195} {"train_loss": -5.707454681396484, "global_step": 50194, "epoch": 1195} {"train_loss": -5.556385517120361, "global_step": 50195, "epoch": 1195} {"train_loss": -5.655674934387207, "global_step": 50196, "epoch": 1195} {"train_loss": -5.665158271789551, "global_step": 50197, "epoch": 1195} {"train_loss": -5.779972553253174, "global_step": 50198, "epoch": 1195} {"train_loss": -5.70479679107666, "global_step": 50199, "epoch": 1195} {"train_loss": -5.713583946228027, "global_step": 50200, "epoch": 1195} {"train_loss": -5.71538782119751, "global_step": 50201, "epoch": 1195} {"train_loss": -5.778628349304199, "global_step": 50202, "epoch": 1195} {"train_loss": -5.794745445251465, "global_step": 50203, "epoch": 1195} {"train_loss": -5.59131383895874, "global_step": 50204, "epoch": 1195} {"train_loss": -5.910040855407715, "global_step": 50205, "epoch": 1195} {"train_loss": -5.703490257263184, "global_step": 50206, "epoch": 1195} {"train_loss": -5.667357921600342, "global_step": 50207, "epoch": 1195} {"train_loss": -5.814220905303955, "global_step": 50208, "epoch": 1195} {"train_loss": -5.758446216583252, "global_step": 50209, "epoch": 1195} {"train_loss": -5.764259338378906, "global_step": 50210, "epoch": 1195} {"train_loss": -5.813225269317627, "global_step": 50211, "epoch": 1195} {"train_loss": -5.837200164794922, "global_step": 50212, "epoch": 1195} {"train_loss": -5.701198101043701, "global_step": 50213, "epoch": 1195} {"train_loss": -5.773398399353027, "global_step": 50214, "epoch": 1195} {"train_loss": -5.712741851806641, "global_step": 50215, "epoch": 1195} {"train_loss": -5.896150588989258, "global_step": 50216, "epoch": 1195} {"train_loss": -5.608270645141602, "global_step": 50217, "epoch": 1195} {"train_loss": -5.758601188659668, "global_step": 50218, "epoch": 1195} {"train_loss": -5.673255443572998, "global_step": 50219, "epoch": 1195} {"train_loss": -5.765893459320068, "global_step": 50220, "epoch": 1195} {"train_loss": -5.696315765380859, "global_step": 50221, "epoch": 1195} {"train_loss": -5.786654949188232, "global_step": 50222, "epoch": 1195} {"train_loss": -5.722265243530273, "global_step": 50223, "epoch": 1195} {"train_loss": -5.860815525054932, "global_step": 50224, "epoch": 1195} {"train_loss": -5.750337600708008, "global_step": 50225, "epoch": 1195} {"train_loss": -5.746137619018555, "global_step": 50226, "epoch": 1195} {"train_loss": -5.789900779724121, "global_step": 50227, "epoch": 1195} {"train_loss": -5.781414985656738, "global_step": 50228, "epoch": 1195} {"train_loss": -5.830631256103516, "global_step": 50229, "epoch": 1195} {"train_loss": -5.757326602935791, "global_step": 50230, "epoch": 1195} {"train_loss": -5.741718065171015, "global_step": 50231, "epoch": 1195, "val_loss": 74227.21875} {"train_loss": -5.869549751281738, "global_step": 50232, "epoch": 1196} {"train_loss": -5.872542381286621, "global_step": 50233, "epoch": 1196} {"train_loss": -5.743171691894531, "global_step": 50234, "epoch": 1196} {"train_loss": -5.907942771911621, "global_step": 50235, "epoch": 1196} {"train_loss": -5.669636249542236, "global_step": 50236, "epoch": 1196} {"train_loss": -5.817749977111816, "global_step": 50237, "epoch": 1196} {"train_loss": -5.739108085632324, "global_step": 50238, "epoch": 1196} {"train_loss": -5.826556205749512, "global_step": 50239, "epoch": 1196} {"train_loss": -5.841829776763916, "global_step": 50240, "epoch": 1196} {"train_loss": -5.694942474365234, "global_step": 50241, "epoch": 1196} {"train_loss": -5.885903835296631, "global_step": 50242, "epoch": 1196} {"train_loss": -5.622594833374023, "global_step": 50243, "epoch": 1196} {"train_loss": -5.7971954345703125, "global_step": 50244, "epoch": 1196} {"train_loss": -5.796857833862305, "global_step": 50245, "epoch": 1196} {"train_loss": -5.81028413772583, "global_step": 50246, "epoch": 1196} {"train_loss": -5.81257438659668, "global_step": 50247, "epoch": 1196} {"train_loss": -5.847227096557617, "global_step": 50248, "epoch": 1196} {"train_loss": -5.824686050415039, "global_step": 50249, "epoch": 1196} {"train_loss": -5.753225326538086, "global_step": 50250, "epoch": 1196} {"train_loss": -5.730284690856934, "global_step": 50251, "epoch": 1196} {"train_loss": -5.687165260314941, "global_step": 50252, "epoch": 1196} {"train_loss": -5.847972869873047, "global_step": 50253, "epoch": 1196} {"train_loss": -5.60697078704834, "global_step": 50254, "epoch": 1196} {"train_loss": -5.7153544425964355, "global_step": 50255, "epoch": 1196} {"train_loss": -5.736498832702637, "global_step": 50256, "epoch": 1196} {"train_loss": -5.704587936401367, "global_step": 50257, "epoch": 1196} {"train_loss": -5.799905300140381, "global_step": 50258, "epoch": 1196} {"train_loss": -5.857980728149414, "global_step": 50259, "epoch": 1196} {"train_loss": -5.655533790588379, "global_step": 50260, "epoch": 1196} {"train_loss": -5.696329116821289, "global_step": 50261, "epoch": 1196} {"train_loss": -5.836897850036621, "global_step": 50262, "epoch": 1196} {"train_loss": -5.692234992980957, "global_step": 50263, "epoch": 1196} {"train_loss": -5.828235149383545, "global_step": 50264, "epoch": 1196} {"train_loss": -5.699649810791016, "global_step": 50265, "epoch": 1196} {"train_loss": -5.832124710083008, "global_step": 50266, "epoch": 1196} {"train_loss": -5.833996772766113, "global_step": 50267, "epoch": 1196} {"train_loss": -5.706913948059082, "global_step": 50268, "epoch": 1196} {"train_loss": -5.876068115234375, "global_step": 50269, "epoch": 1196} {"train_loss": -5.864660739898682, "global_step": 50270, "epoch": 1196} {"train_loss": -5.633290767669678, "global_step": 50271, "epoch": 1196} {"train_loss": -5.7626118659973145, "global_step": 50272, "epoch": 1196} {"train_loss": -5.773168609255836, "global_step": 50273, "epoch": 1196, "val_loss": 74047.390625} {"train_loss": -5.829227447509766, "global_step": 50274, "epoch": 1197} {"train_loss": -5.78803825378418, "global_step": 50275, "epoch": 1197} {"train_loss": -5.78140926361084, "global_step": 50276, "epoch": 1197} {"train_loss": -5.78288459777832, "global_step": 50277, "epoch": 1197} {"train_loss": -5.838005065917969, "global_step": 50278, "epoch": 1197} {"train_loss": -5.834197998046875, "global_step": 50279, "epoch": 1197} {"train_loss": -5.779786586761475, "global_step": 50280, "epoch": 1197} {"train_loss": -5.836497783660889, "global_step": 50281, "epoch": 1197} {"train_loss": -5.888123989105225, "global_step": 50282, "epoch": 1197} {"train_loss": -5.812754154205322, "global_step": 50283, "epoch": 1197} {"train_loss": -5.794833183288574, "global_step": 50284, "epoch": 1197} {"train_loss": -5.906425476074219, "global_step": 50285, "epoch": 1197} {"train_loss": -5.727426528930664, "global_step": 50286, "epoch": 1197} {"train_loss": -5.806516647338867, "global_step": 50287, "epoch": 1197} {"train_loss": -5.92839241027832, "global_step": 50288, "epoch": 1197} {"train_loss": -5.84931755065918, "global_step": 50289, "epoch": 1197} {"train_loss": -5.912140846252441, "global_step": 50290, "epoch": 1197} {"train_loss": -5.798506736755371, "global_step": 50291, "epoch": 1197} {"train_loss": -5.899566650390625, "global_step": 50292, "epoch": 1197} {"train_loss": -5.742181301116943, "global_step": 50293, "epoch": 1197} {"train_loss": -5.728675365447998, "global_step": 50294, "epoch": 1197} {"train_loss": -5.856606960296631, "global_step": 50295, "epoch": 1197} {"train_loss": -5.819116592407227, "global_step": 50296, "epoch": 1197} {"train_loss": -5.689760208129883, "global_step": 50297, "epoch": 1197} {"train_loss": -5.8269147872924805, "global_step": 50298, "epoch": 1197} {"train_loss": -5.7142415046691895, "global_step": 50299, "epoch": 1197} {"train_loss": -5.766797065734863, "global_step": 50300, "epoch": 1197} {"train_loss": -5.793916702270508, "global_step": 50301, "epoch": 1197} {"train_loss": -5.709509372711182, "global_step": 50302, "epoch": 1197} {"train_loss": -5.729743957519531, "global_step": 50303, "epoch": 1197} {"train_loss": -5.793868064880371, "global_step": 50304, "epoch": 1197} {"train_loss": -5.650553226470947, "global_step": 50305, "epoch": 1197} {"train_loss": -5.654712200164795, "global_step": 50306, "epoch": 1197} {"train_loss": -5.777949333190918, "global_step": 50307, "epoch": 1197} {"train_loss": -5.709683418273926, "global_step": 50308, "epoch": 1197} {"train_loss": -5.623124122619629, "global_step": 50309, "epoch": 1197} {"train_loss": -5.8605170249938965, "global_step": 50310, "epoch": 1197} {"train_loss": -5.702689170837402, "global_step": 50311, "epoch": 1197} {"train_loss": -5.648529052734375, "global_step": 50312, "epoch": 1197} {"train_loss": -5.781705379486084, "global_step": 50313, "epoch": 1197} {"train_loss": -5.586014270782471, "global_step": 50314, "epoch": 1197} {"train_loss": -5.780745971770513, "global_step": 50315, "epoch": 1197, "val_loss": 74180.6484375} {"train_loss": -5.852066993713379, "global_step": 50316, "epoch": 1198} {"train_loss": -5.713415145874023, "global_step": 50317, "epoch": 1198} {"train_loss": -5.764110565185547, "global_step": 50318, "epoch": 1198} {"train_loss": -5.809145927429199, "global_step": 50319, "epoch": 1198} {"train_loss": -5.719020843505859, "global_step": 50320, "epoch": 1198} {"train_loss": -5.835470676422119, "global_step": 50321, "epoch": 1198} {"train_loss": -5.773860931396484, "global_step": 50322, "epoch": 1198} {"train_loss": -5.7414655685424805, "global_step": 50323, "epoch": 1198} {"train_loss": -5.859745025634766, "global_step": 50324, "epoch": 1198} {"train_loss": -5.656804084777832, "global_step": 50325, "epoch": 1198} {"train_loss": -5.677614688873291, "global_step": 50326, "epoch": 1198} {"train_loss": -5.861299991607666, "global_step": 50327, "epoch": 1198} {"train_loss": -5.760598182678223, "global_step": 50328, "epoch": 1198} {"train_loss": -5.717034816741943, "global_step": 50329, "epoch": 1198} {"train_loss": -5.7845139503479, "global_step": 50330, "epoch": 1198} {"train_loss": -5.694876194000244, "global_step": 50331, "epoch": 1198} {"train_loss": -5.797260284423828, "global_step": 50332, "epoch": 1198} {"train_loss": -5.628737926483154, "global_step": 50333, "epoch": 1198} {"train_loss": -5.6975250244140625, "global_step": 50334, "epoch": 1198} {"train_loss": -5.846548557281494, "global_step": 50335, "epoch": 1198} {"train_loss": -5.638260841369629, "global_step": 50336, "epoch": 1198} {"train_loss": -5.729971408843994, "global_step": 50337, "epoch": 1198} {"train_loss": -5.7537360191345215, "global_step": 50338, "epoch": 1198} {"train_loss": -5.660111904144287, "global_step": 50339, "epoch": 1198} {"train_loss": -5.586112976074219, "global_step": 50340, "epoch": 1198} {"train_loss": -5.655923366546631, "global_step": 50341, "epoch": 1198} {"train_loss": -5.693906784057617, "global_step": 50342, "epoch": 1198} {"train_loss": -5.660245895385742, "global_step": 50343, "epoch": 1198} {"train_loss": -5.650339126586914, "global_step": 50344, "epoch": 1198} {"train_loss": -5.780831336975098, "global_step": 50345, "epoch": 1198} {"train_loss": -5.6847076416015625, "global_step": 50346, "epoch": 1198} {"train_loss": -5.792870998382568, "global_step": 50347, "epoch": 1198} {"train_loss": -5.668367385864258, "global_step": 50348, "epoch": 1198} {"train_loss": -5.71951961517334, "global_step": 50349, "epoch": 1198} {"train_loss": -5.739071846008301, "global_step": 50350, "epoch": 1198} {"train_loss": -5.807728290557861, "global_step": 50351, "epoch": 1198} {"train_loss": -5.679551124572754, "global_step": 50352, "epoch": 1198} {"train_loss": -5.822595596313477, "global_step": 50353, "epoch": 1198} {"train_loss": -5.900266170501709, "global_step": 50354, "epoch": 1198} {"train_loss": -5.652543067932129, "global_step": 50355, "epoch": 1198} {"train_loss": -5.779461860656738, "global_step": 50356, "epoch": 1198} {"train_loss": -5.739824317750477, "global_step": 50357, "epoch": 1198, "val_loss": 74519.78125} {"train_loss": -5.847080707550049, "global_step": 50358, "epoch": 1199} {"train_loss": -5.665748596191406, "global_step": 50359, "epoch": 1199} {"train_loss": -5.705194473266602, "global_step": 50360, "epoch": 1199} {"train_loss": -5.657135009765625, "global_step": 50361, "epoch": 1199} {"train_loss": -5.851170539855957, "global_step": 50362, "epoch": 1199} {"train_loss": -5.6811323165893555, "global_step": 50363, "epoch": 1199} {"train_loss": -5.904294490814209, "global_step": 50364, "epoch": 1199} {"train_loss": -5.688019275665283, "global_step": 50365, "epoch": 1199} {"train_loss": -5.78931999206543, "global_step": 50366, "epoch": 1199} {"train_loss": -5.777555465698242, "global_step": 50367, "epoch": 1199} {"train_loss": -5.737527847290039, "global_step": 50368, "epoch": 1199} {"train_loss": -5.765403747558594, "global_step": 50369, "epoch": 1199} {"train_loss": -5.81805419921875, "global_step": 50370, "epoch": 1199} {"train_loss": -5.890169143676758, "global_step": 50371, "epoch": 1199} {"train_loss": -5.691195487976074, "global_step": 50372, "epoch": 1199} {"train_loss": -5.703702449798584, "global_step": 50373, "epoch": 1199} {"train_loss": -5.759346008300781, "global_step": 50374, "epoch": 1199} {"train_loss": -5.812930107116699, "global_step": 50375, "epoch": 1199} {"train_loss": -5.660898208618164, "global_step": 50376, "epoch": 1199} {"train_loss": -5.654031753540039, "global_step": 50377, "epoch": 1199} {"train_loss": -5.826871871948242, "global_step": 50378, "epoch": 1199} {"train_loss": -5.771018028259277, "global_step": 50379, "epoch": 1199} {"train_loss": -5.825044631958008, "global_step": 50380, "epoch": 1199} {"train_loss": -5.759933948516846, "global_step": 50381, "epoch": 1199} {"train_loss": -5.635309219360352, "global_step": 50382, "epoch": 1199} {"train_loss": -5.713974475860596, "global_step": 50383, "epoch": 1199} {"train_loss": -5.700048446655273, "global_step": 50384, "epoch": 1199} {"train_loss": -5.6201372146606445, "global_step": 50385, "epoch": 1199} {"train_loss": -5.6792144775390625, "global_step": 50386, "epoch": 1199} {"train_loss": -5.729979038238525, "global_step": 50387, "epoch": 1199} {"train_loss": -5.763606548309326, "global_step": 50388, "epoch": 1199} {"train_loss": -5.690248489379883, "global_step": 50389, "epoch": 1199} {"train_loss": -5.681723117828369, "global_step": 50390, "epoch": 1199} {"train_loss": -5.737924575805664, "global_step": 50391, "epoch": 1199} {"train_loss": -5.745731353759766, "global_step": 50392, "epoch": 1199} {"train_loss": -5.771737098693848, "global_step": 50393, "epoch": 1199} {"train_loss": -5.817234992980957, "global_step": 50394, "epoch": 1199} {"train_loss": -5.688091278076172, "global_step": 50395, "epoch": 1199} {"train_loss": -5.886840343475342, "global_step": 50396, "epoch": 1199} {"train_loss": -5.613289833068848, "global_step": 50397, "epoch": 1199} {"train_loss": -5.846044540405273, "global_step": 50398, "epoch": 1199} {"train_loss": -5.745536758786156, "global_step": 50399, "epoch": 1199, "val_loss": 74380.2578125} {"train_loss": -5.685355186462402, "global_step": 50400, "epoch": 1200} {"train_loss": -5.871748924255371, "global_step": 50401, "epoch": 1200} {"train_loss": -5.711992263793945, "global_step": 50402, "epoch": 1200} {"train_loss": -5.80118465423584, "global_step": 50403, "epoch": 1200} {"train_loss": -5.772489070892334, "global_step": 50404, "epoch": 1200} {"train_loss": -5.747095108032227, "global_step": 50405, "epoch": 1200} {"train_loss": -5.841935157775879, "global_step": 50406, "epoch": 1200} {"train_loss": -5.718710899353027, "global_step": 50407, "epoch": 1200} {"train_loss": -5.869340419769287, "global_step": 50408, "epoch": 1200} {"train_loss": -5.789488315582275, "global_step": 50409, "epoch": 1200} {"train_loss": -5.810833930969238, "global_step": 50410, "epoch": 1200} {"train_loss": -5.7582807540893555, "global_step": 50411, "epoch": 1200} {"train_loss": -5.773995876312256, "global_step": 50412, "epoch": 1200} {"train_loss": -5.876635551452637, "global_step": 50413, "epoch": 1200} {"train_loss": -5.786072254180908, "global_step": 50414, "epoch": 1200} {"train_loss": -5.7667694091796875, "global_step": 50415, "epoch": 1200} {"train_loss": -5.834807395935059, "global_step": 50416, "epoch": 1200} {"train_loss": -5.728627681732178, "global_step": 50417, "epoch": 1200} {"train_loss": -5.82570219039917, "global_step": 50418, "epoch": 1200} {"train_loss": -5.725768089294434, "global_step": 50419, "epoch": 1200} {"train_loss": -5.795762062072754, "global_step": 50420, "epoch": 1200} {"train_loss": -5.7767415046691895, "global_step": 50421, "epoch": 1200} {"train_loss": -5.891186714172363, "global_step": 50422, "epoch": 1200} {"train_loss": -5.801713466644287, "global_step": 50423, "epoch": 1200} {"train_loss": -5.791830539703369, "global_step": 50424, "epoch": 1200} {"train_loss": -5.828373908996582, "global_step": 50425, "epoch": 1200} {"train_loss": -5.63996696472168, "global_step": 50426, "epoch": 1200} {"train_loss": -5.757022857666016, "global_step": 50427, "epoch": 1200} {"train_loss": -5.804866790771484, "global_step": 50428, "epoch": 1200} {"train_loss": -5.7683210372924805, "global_step": 50429, "epoch": 1200} {"train_loss": -5.925381660461426, "global_step": 50430, "epoch": 1200} {"train_loss": -5.8791656494140625, "global_step": 50431, "epoch": 1200} {"train_loss": -5.75944709777832, "global_step": 50432, "epoch": 1200} {"train_loss": -5.7866902351379395, "global_step": 50433, "epoch": 1200} {"train_loss": -5.818559169769287, "global_step": 50434, "epoch": 1200} {"train_loss": -5.644740104675293, "global_step": 50435, "epoch": 1200} {"train_loss": -5.881770610809326, "global_step": 50436, "epoch": 1200} {"train_loss": -5.6596293449401855, "global_step": 50437, "epoch": 1200} {"train_loss": -5.652040958404541, "global_step": 50438, "epoch": 1200} {"train_loss": -5.837505340576172, "global_step": 50439, "epoch": 1200} {"train_loss": -5.752028942108154, "global_step": 50440, "epoch": 1200} {"train_loss": -5.783962158929734, "global_step": 50441, "epoch": 1200, "train/sim_max_reward_0": 0.49370765594606997, "train/sim_max_reward_1": 0.8981175870187599, "train/sim_max_reward_2": 0.8072901655358342, "train/sim_max_reward_3": 0.5891192771000892, "train/sim_max_reward_4": 0.40646917190852855, "train/sim_max_reward_5": 0.8215708236232078, "test/sim_max_reward_4500000": 0.45944262168713884, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9853568034120931, "test/sim_max_reward_4500003": 0.8637370567479064, "test/sim_max_reward_4500004": 0.08833606468241163, "test/sim_max_reward_4500005": 0.27573757883402744, "test/sim_max_reward_4500006": 0.881358841227626, "test/sim_max_reward_4500007": 0.6435562976856279, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.9724922524007061, "test/sim_max_reward_4500010": 1.0, "test/sim_max_reward_4500011": 0.8803938715506017, "test/sim_max_reward_4500012": 0.3715733969294193, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.8594258616406516, "test/sim_max_reward_4500015": 0.531814578868227, "test/sim_max_reward_4500016": 0.015089744258460179, "test/sim_max_reward_4500017": 0.029772830093719584, "test/sim_max_reward_4500018": 0.2785402871674197, "test/sim_max_reward_4500019": 0.8073713102733683, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.5827612202513733, "test/sim_max_reward_4500023": 0.8907674576939133, "test/sim_max_reward_4500024": 0.2608466235428868, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.09416926652891078, "test/sim_max_reward_4500027": 0.7579479966035362, "test/sim_max_reward_4500028": 0.45672664785576694, "test/sim_max_reward_4500029": 0.10648911112458755, "test/sim_max_reward_4500030": 0.9583942125082148, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.8179111521330892, "test/sim_max_reward_4500034": 0.7878325666547514, "test/sim_max_reward_4500035": 0.8897068467894498, "test/sim_max_reward_4500036": 0.8856693245917888, "test/sim_max_reward_4500037": 0.8579136387524684, "test/sim_max_reward_4500038": 0.35193604600499234, "test/sim_max_reward_4500039": 0.7438672158094243, "test/sim_max_reward_4500040": 0.8724002838497767, "test/sim_max_reward_4500041": 0.8551139757366507, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.36970242025103445, "test/sim_max_reward_4500044": 0.8297612923982562, "test/sim_max_reward_4500045": 0.15839140970779483, "test/sim_max_reward_4500046": 0.7613276632742604, "test/sim_max_reward_4500047": 0.6396709525833464, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6693791135220817, "test/mean_score": 0.5188451172352785, "val_loss": 74064.84375} {"train_loss": -5.799442291259766, "global_step": 50442, "epoch": 1201} {"train_loss": -5.778331756591797, "global_step": 50443, "epoch": 1201} {"train_loss": -5.795977592468262, "global_step": 50444, "epoch": 1201} {"train_loss": -5.699545860290527, "global_step": 50445, "epoch": 1201} {"train_loss": -5.763010025024414, "global_step": 50446, "epoch": 1201} {"train_loss": -5.6799750328063965, "global_step": 50447, "epoch": 1201} {"train_loss": -5.689547538757324, "global_step": 50448, "epoch": 1201} {"train_loss": -5.804269790649414, "global_step": 50449, "epoch": 1201} {"train_loss": -5.90032958984375, "global_step": 50450, "epoch": 1201} {"train_loss": -5.663315296173096, "global_step": 50451, "epoch": 1201} {"train_loss": -5.715253829956055, "global_step": 50452, "epoch": 1201} {"train_loss": -5.652803421020508, "global_step": 50453, "epoch": 1201} {"train_loss": -5.77189826965332, "global_step": 50454, "epoch": 1201} {"train_loss": -5.752288341522217, "global_step": 50455, "epoch": 1201} {"train_loss": -5.801916122436523, "global_step": 50456, "epoch": 1201} {"train_loss": -5.827689170837402, "global_step": 50457, "epoch": 1201} {"train_loss": -5.758551597595215, "global_step": 50458, "epoch": 1201} {"train_loss": -5.701061248779297, "global_step": 50459, "epoch": 1201} {"train_loss": -5.707474708557129, "global_step": 50460, "epoch": 1201} {"train_loss": -5.792961120605469, "global_step": 50461, "epoch": 1201} {"train_loss": -5.633695602416992, "global_step": 50462, "epoch": 1201} {"train_loss": -5.78181266784668, "global_step": 50463, "epoch": 1201} {"train_loss": -5.745432376861572, "global_step": 50464, "epoch": 1201} {"train_loss": -5.889894485473633, "global_step": 50465, "epoch": 1201} {"train_loss": -5.8020172119140625, "global_step": 50466, "epoch": 1201} {"train_loss": -5.805902004241943, "global_step": 50467, "epoch": 1201} {"train_loss": -5.818709373474121, "global_step": 50468, "epoch": 1201} {"train_loss": -5.767294406890869, "global_step": 50469, "epoch": 1201} {"train_loss": -5.869521141052246, "global_step": 50470, "epoch": 1201} {"train_loss": -5.896146774291992, "global_step": 50471, "epoch": 1201} {"train_loss": -5.788856506347656, "global_step": 50472, "epoch": 1201} {"train_loss": -5.638221263885498, "global_step": 50473, "epoch": 1201} {"train_loss": -5.743138313293457, "global_step": 50474, "epoch": 1201} {"train_loss": -5.733160972595215, "global_step": 50475, "epoch": 1201} {"train_loss": -5.780603408813477, "global_step": 50476, "epoch": 1201} {"train_loss": -5.691135406494141, "global_step": 50477, "epoch": 1201} {"train_loss": -5.650940895080566, "global_step": 50478, "epoch": 1201} {"train_loss": -5.766784191131592, "global_step": 50479, "epoch": 1201} {"train_loss": -5.648955345153809, "global_step": 50480, "epoch": 1201} {"train_loss": -5.666167259216309, "global_step": 50481, "epoch": 1201} {"train_loss": -5.649959087371826, "global_step": 50482, "epoch": 1201} {"train_loss": -5.749919493993123, "global_step": 50483, "epoch": 1201, "val_loss": 74619.125} {"train_loss": -5.855597496032715, "global_step": 50484, "epoch": 1202} {"train_loss": -5.629498481750488, "global_step": 50485, "epoch": 1202} {"train_loss": -5.7731547355651855, "global_step": 50486, "epoch": 1202} {"train_loss": -5.654754638671875, "global_step": 50487, "epoch": 1202} {"train_loss": -5.683379650115967, "global_step": 50488, "epoch": 1202} {"train_loss": -5.777750492095947, "global_step": 50489, "epoch": 1202} {"train_loss": -5.81954288482666, "global_step": 50490, "epoch": 1202} {"train_loss": -5.811367034912109, "global_step": 50491, "epoch": 1202} {"train_loss": -5.879208564758301, "global_step": 50492, "epoch": 1202} {"train_loss": -5.740889549255371, "global_step": 50493, "epoch": 1202} {"train_loss": -5.7323713302612305, "global_step": 50494, "epoch": 1202} {"train_loss": -5.78180456161499, "global_step": 50495, "epoch": 1202} {"train_loss": -5.8815107345581055, "global_step": 50496, "epoch": 1202} {"train_loss": -5.916744232177734, "global_step": 50497, "epoch": 1202} {"train_loss": -5.8731889724731445, "global_step": 50498, "epoch": 1202} {"train_loss": -5.784608364105225, "global_step": 50499, "epoch": 1202} {"train_loss": -5.695696830749512, "global_step": 50500, "epoch": 1202} {"train_loss": -5.7572784423828125, "global_step": 50501, "epoch": 1202} {"train_loss": -5.838560104370117, "global_step": 50502, "epoch": 1202} {"train_loss": -5.724947929382324, "global_step": 50503, "epoch": 1202} {"train_loss": -5.7511820793151855, "global_step": 50504, "epoch": 1202} {"train_loss": -5.752408027648926, "global_step": 50505, "epoch": 1202} {"train_loss": -5.728671073913574, "global_step": 50506, "epoch": 1202} {"train_loss": -5.770880699157715, "global_step": 50507, "epoch": 1202} {"train_loss": -5.734107971191406, "global_step": 50508, "epoch": 1202} {"train_loss": -5.773937702178955, "global_step": 50509, "epoch": 1202} {"train_loss": -5.738400459289551, "global_step": 50510, "epoch": 1202} {"train_loss": -5.753594875335693, "global_step": 50511, "epoch": 1202} {"train_loss": -5.796886444091797, "global_step": 50512, "epoch": 1202} {"train_loss": -5.7754950523376465, "global_step": 50513, "epoch": 1202} {"train_loss": -5.832221508026123, "global_step": 50514, "epoch": 1202} {"train_loss": -5.733088970184326, "global_step": 50515, "epoch": 1202} {"train_loss": -5.861007213592529, "global_step": 50516, "epoch": 1202} {"train_loss": -5.7959208488464355, "global_step": 50517, "epoch": 1202} {"train_loss": -5.82660436630249, "global_step": 50518, "epoch": 1202} {"train_loss": -5.797446250915527, "global_step": 50519, "epoch": 1202} {"train_loss": -5.768930912017822, "global_step": 50520, "epoch": 1202} {"train_loss": -5.688549518585205, "global_step": 50521, "epoch": 1202} {"train_loss": -5.734621047973633, "global_step": 50522, "epoch": 1202} {"train_loss": -5.848541259765625, "global_step": 50523, "epoch": 1202} {"train_loss": -5.758330821990967, "global_step": 50524, "epoch": 1202} {"train_loss": -5.777717022668748, "global_step": 50525, "epoch": 1202, "val_loss": 74050.9375} {"train_loss": -5.808378219604492, "global_step": 50526, "epoch": 1203} {"train_loss": -5.9370927810668945, "global_step": 50527, "epoch": 1203} {"train_loss": -5.74948787689209, "global_step": 50528, "epoch": 1203} {"train_loss": -5.886008262634277, "global_step": 50529, "epoch": 1203} {"train_loss": -5.712161540985107, "global_step": 50530, "epoch": 1203} {"train_loss": -5.661631107330322, "global_step": 50531, "epoch": 1203} {"train_loss": -5.848952293395996, "global_step": 50532, "epoch": 1203} {"train_loss": -5.727217674255371, "global_step": 50533, "epoch": 1203} {"train_loss": -5.918635368347168, "global_step": 50534, "epoch": 1203} {"train_loss": -5.798450469970703, "global_step": 50535, "epoch": 1203} {"train_loss": -5.81082010269165, "global_step": 50536, "epoch": 1203} {"train_loss": -5.813712120056152, "global_step": 50537, "epoch": 1203} {"train_loss": -5.823624610900879, "global_step": 50538, "epoch": 1203} {"train_loss": -5.868929386138916, "global_step": 50539, "epoch": 1203} {"train_loss": -5.761357307434082, "global_step": 50540, "epoch": 1203} {"train_loss": -5.759563446044922, "global_step": 50541, "epoch": 1203} {"train_loss": -5.8432512283325195, "global_step": 50542, "epoch": 1203} {"train_loss": -5.77340030670166, "global_step": 50543, "epoch": 1203} {"train_loss": -5.633423805236816, "global_step": 50544, "epoch": 1203} {"train_loss": -5.758757591247559, "global_step": 50545, "epoch": 1203} {"train_loss": -5.850175380706787, "global_step": 50546, "epoch": 1203} {"train_loss": -5.777320384979248, "global_step": 50547, "epoch": 1203} {"train_loss": -5.802095413208008, "global_step": 50548, "epoch": 1203} {"train_loss": -5.751041412353516, "global_step": 50549, "epoch": 1203} {"train_loss": -5.5719404220581055, "global_step": 50550, "epoch": 1203} {"train_loss": -5.751298427581787, "global_step": 50551, "epoch": 1203} {"train_loss": -5.770086288452148, "global_step": 50552, "epoch": 1203} {"train_loss": -5.857023239135742, "global_step": 50553, "epoch": 1203} {"train_loss": -5.732388019561768, "global_step": 50554, "epoch": 1203} {"train_loss": -5.851016044616699, "global_step": 50555, "epoch": 1203} {"train_loss": -5.663002967834473, "global_step": 50556, "epoch": 1203} {"train_loss": -5.846578598022461, "global_step": 50557, "epoch": 1203} {"train_loss": -5.733028411865234, "global_step": 50558, "epoch": 1203} {"train_loss": -5.831485748291016, "global_step": 50559, "epoch": 1203} {"train_loss": -5.8512420654296875, "global_step": 50560, "epoch": 1203} {"train_loss": -5.780202865600586, "global_step": 50561, "epoch": 1203} {"train_loss": -5.718598365783691, "global_step": 50562, "epoch": 1203} {"train_loss": -5.780363082885742, "global_step": 50563, "epoch": 1203} {"train_loss": -5.862271308898926, "global_step": 50564, "epoch": 1203} {"train_loss": -5.76875114440918, "global_step": 50565, "epoch": 1203} {"train_loss": -5.885276794433594, "global_step": 50566, "epoch": 1203} {"train_loss": -5.789968865258353, "global_step": 50567, "epoch": 1203, "val_loss": 74037.2890625} {"train_loss": -5.764130592346191, "global_step": 50568, "epoch": 1204} {"train_loss": -5.8916215896606445, "global_step": 50569, "epoch": 1204} {"train_loss": -5.885736465454102, "global_step": 50570, "epoch": 1204} {"train_loss": -5.877874374389648, "global_step": 50571, "epoch": 1204} {"train_loss": -5.873500823974609, "global_step": 50572, "epoch": 1204} {"train_loss": -5.886229515075684, "global_step": 50573, "epoch": 1204} {"train_loss": -5.696578502655029, "global_step": 50574, "epoch": 1204} {"train_loss": -5.838181495666504, "global_step": 50575, "epoch": 1204} {"train_loss": -5.678390979766846, "global_step": 50576, "epoch": 1204} {"train_loss": -5.642204284667969, "global_step": 50577, "epoch": 1204} {"train_loss": -5.801530838012695, "global_step": 50578, "epoch": 1204} {"train_loss": -5.810548782348633, "global_step": 50579, "epoch": 1204} {"train_loss": -5.7620954513549805, "global_step": 50580, "epoch": 1204} {"train_loss": -5.789902687072754, "global_step": 50581, "epoch": 1204} {"train_loss": -5.878835678100586, "global_step": 50582, "epoch": 1204} {"train_loss": -5.636653900146484, "global_step": 50583, "epoch": 1204} {"train_loss": -5.813732147216797, "global_step": 50584, "epoch": 1204} {"train_loss": -5.688445091247559, "global_step": 50585, "epoch": 1204} {"train_loss": -5.623584270477295, "global_step": 50586, "epoch": 1204} {"train_loss": -5.809563636779785, "global_step": 50587, "epoch": 1204} {"train_loss": -5.652461051940918, "global_step": 50588, "epoch": 1204} {"train_loss": -5.807543754577637, "global_step": 50589, "epoch": 1204} {"train_loss": -5.702941417694092, "global_step": 50590, "epoch": 1204} {"train_loss": -5.804565906524658, "global_step": 50591, "epoch": 1204} {"train_loss": -5.649802207946777, "global_step": 50592, "epoch": 1204} {"train_loss": -5.67906379699707, "global_step": 50593, "epoch": 1204} {"train_loss": -5.765951633453369, "global_step": 50594, "epoch": 1204} {"train_loss": -5.648565292358398, "global_step": 50595, "epoch": 1204} {"train_loss": -5.754421234130859, "global_step": 50596, "epoch": 1204} {"train_loss": -5.60616397857666, "global_step": 50597, "epoch": 1204} {"train_loss": -5.682500839233398, "global_step": 50598, "epoch": 1204} {"train_loss": -5.644853591918945, "global_step": 50599, "epoch": 1204} {"train_loss": -5.777494430541992, "global_step": 50600, "epoch": 1204} {"train_loss": -5.731122970581055, "global_step": 50601, "epoch": 1204} {"train_loss": -5.824145317077637, "global_step": 50602, "epoch": 1204} {"train_loss": -5.783483505249023, "global_step": 50603, "epoch": 1204} {"train_loss": -5.796494007110596, "global_step": 50604, "epoch": 1204} {"train_loss": -5.728787422180176, "global_step": 50605, "epoch": 1204} {"train_loss": -5.774713039398193, "global_step": 50606, "epoch": 1204} {"train_loss": -5.8292975425720215, "global_step": 50607, "epoch": 1204} {"train_loss": -5.799156188964844, "global_step": 50608, "epoch": 1204} {"train_loss": -5.759655884334019, "global_step": 50609, "epoch": 1204, "val_loss": 73856.9609375} {"train_loss": -5.855542182922363, "global_step": 50610, "epoch": 1205} {"train_loss": -5.753050804138184, "global_step": 50611, "epoch": 1205} {"train_loss": -5.688089370727539, "global_step": 50612, "epoch": 1205} {"train_loss": -5.696338653564453, "global_step": 50613, "epoch": 1205} {"train_loss": -5.688287734985352, "global_step": 50614, "epoch": 1205} {"train_loss": -5.824067115783691, "global_step": 50615, "epoch": 1205} {"train_loss": -5.744269371032715, "global_step": 50616, "epoch": 1205} {"train_loss": -5.799427509307861, "global_step": 50617, "epoch": 1205} {"train_loss": -5.712367534637451, "global_step": 50618, "epoch": 1205} {"train_loss": -5.8238749504089355, "global_step": 50619, "epoch": 1205} {"train_loss": -5.815655708312988, "global_step": 50620, "epoch": 1205} {"train_loss": -5.727933883666992, "global_step": 50621, "epoch": 1205} {"train_loss": -5.87797737121582, "global_step": 50622, "epoch": 1205} {"train_loss": -5.964722633361816, "global_step": 50623, "epoch": 1205} {"train_loss": -5.796292304992676, "global_step": 50624, "epoch": 1205} {"train_loss": -5.8153791427612305, "global_step": 50625, "epoch": 1205} {"train_loss": -5.700273513793945, "global_step": 50626, "epoch": 1205} {"train_loss": -5.714330673217773, "global_step": 50627, "epoch": 1205} {"train_loss": -5.788541793823242, "global_step": 50628, "epoch": 1205} {"train_loss": -5.798274517059326, "global_step": 50629, "epoch": 1205} {"train_loss": -5.841569900512695, "global_step": 50630, "epoch": 1205} {"train_loss": -5.784090042114258, "global_step": 50631, "epoch": 1205} {"train_loss": -5.688446998596191, "global_step": 50632, "epoch": 1205} {"train_loss": -5.808576583862305, "global_step": 50633, "epoch": 1205} {"train_loss": -5.794639587402344, "global_step": 50634, "epoch": 1205} {"train_loss": -5.770305633544922, "global_step": 50635, "epoch": 1205} {"train_loss": -5.821796894073486, "global_step": 50636, "epoch": 1205} {"train_loss": -5.719409942626953, "global_step": 50637, "epoch": 1205} {"train_loss": -5.761056900024414, "global_step": 50638, "epoch": 1205} {"train_loss": -5.88329553604126, "global_step": 50639, "epoch": 1205} {"train_loss": -5.680172920227051, "global_step": 50640, "epoch": 1205} {"train_loss": -5.757346153259277, "global_step": 50641, "epoch": 1205} {"train_loss": -5.745471000671387, "global_step": 50642, "epoch": 1205} {"train_loss": -5.585946559906006, "global_step": 50643, "epoch": 1205} {"train_loss": -5.741964340209961, "global_step": 50644, "epoch": 1205} {"train_loss": -5.590510845184326, "global_step": 50645, "epoch": 1205} {"train_loss": -5.8209638595581055, "global_step": 50646, "epoch": 1205} {"train_loss": -5.71960973739624, "global_step": 50647, "epoch": 1205} {"train_loss": -5.651310443878174, "global_step": 50648, "epoch": 1205} {"train_loss": -5.748726844787598, "global_step": 50649, "epoch": 1205} {"train_loss": -5.639273643493652, "global_step": 50650, "epoch": 1205} {"train_loss": -5.752972409838722, "global_step": 50651, "epoch": 1205, "val_loss": 74391.203125} {"train_loss": -5.726066589355469, "global_step": 50652, "epoch": 1206} {"train_loss": -5.692112922668457, "global_step": 50653, "epoch": 1206} {"train_loss": -5.589837551116943, "global_step": 50654, "epoch": 1206} {"train_loss": -5.685333251953125, "global_step": 50655, "epoch": 1206} {"train_loss": -5.674247741699219, "global_step": 50656, "epoch": 1206} {"train_loss": -5.715904712677002, "global_step": 50657, "epoch": 1206} {"train_loss": -5.679589748382568, "global_step": 50658, "epoch": 1206} {"train_loss": -5.686182975769043, "global_step": 50659, "epoch": 1206} {"train_loss": -5.789327621459961, "global_step": 50660, "epoch": 1206} {"train_loss": -5.596697807312012, "global_step": 50661, "epoch": 1206} {"train_loss": -5.783962249755859, "global_step": 50662, "epoch": 1206} {"train_loss": -5.761770248413086, "global_step": 50663, "epoch": 1206} {"train_loss": -5.790323257446289, "global_step": 50664, "epoch": 1206} {"train_loss": -5.711082458496094, "global_step": 50665, "epoch": 1206} {"train_loss": -5.763147830963135, "global_step": 50666, "epoch": 1206} {"train_loss": -5.772311687469482, "global_step": 50667, "epoch": 1206} {"train_loss": -5.770917892456055, "global_step": 50668, "epoch": 1206} {"train_loss": -5.716591835021973, "global_step": 50669, "epoch": 1206} {"train_loss": -5.776063919067383, "global_step": 50670, "epoch": 1206} {"train_loss": -5.809030532836914, "global_step": 50671, "epoch": 1206} {"train_loss": -5.839797019958496, "global_step": 50672, "epoch": 1206} {"train_loss": -5.8354716300964355, "global_step": 50673, "epoch": 1206} {"train_loss": -5.882437705993652, "global_step": 50674, "epoch": 1206} {"train_loss": -5.821747779846191, "global_step": 50675, "epoch": 1206} {"train_loss": -5.864247798919678, "global_step": 50676, "epoch": 1206} {"train_loss": -5.676931381225586, "global_step": 50677, "epoch": 1206} {"train_loss": -5.68388557434082, "global_step": 50678, "epoch": 1206} {"train_loss": -5.794846057891846, "global_step": 50679, "epoch": 1206} {"train_loss": -5.587200164794922, "global_step": 50680, "epoch": 1206} {"train_loss": -5.676152229309082, "global_step": 50681, "epoch": 1206} {"train_loss": -5.364719867706299, "global_step": 50682, "epoch": 1206} {"train_loss": -5.599579811096191, "global_step": 50683, "epoch": 1206} {"train_loss": -5.469573497772217, "global_step": 50684, "epoch": 1206} {"train_loss": -5.424776554107666, "global_step": 50685, "epoch": 1206} {"train_loss": -5.51352596282959, "global_step": 50686, "epoch": 1206} {"train_loss": -5.4698357582092285, "global_step": 50687, "epoch": 1206} {"train_loss": -5.475888252258301, "global_step": 50688, "epoch": 1206} {"train_loss": -5.622311592102051, "global_step": 50689, "epoch": 1206} {"train_loss": -5.52778959274292, "global_step": 50690, "epoch": 1206} {"train_loss": -5.572325229644775, "global_step": 50691, "epoch": 1206} {"train_loss": -5.686952590942383, "global_step": 50692, "epoch": 1206} {"train_loss": -5.678896608806792, "global_step": 50693, "epoch": 1206, "val_loss": 74488.859375} {"train_loss": -5.640586853027344, "global_step": 50694, "epoch": 1207} {"train_loss": -5.636353492736816, "global_step": 50695, "epoch": 1207} {"train_loss": -5.656956195831299, "global_step": 50696, "epoch": 1207} {"train_loss": -5.700967311859131, "global_step": 50697, "epoch": 1207} {"train_loss": -5.655980110168457, "global_step": 50698, "epoch": 1207} {"train_loss": -5.6936187744140625, "global_step": 50699, "epoch": 1207} {"train_loss": -5.717003345489502, "global_step": 50700, "epoch": 1207} {"train_loss": -5.667144775390625, "global_step": 50701, "epoch": 1207} {"train_loss": -5.788942813873291, "global_step": 50702, "epoch": 1207} {"train_loss": -5.926565170288086, "global_step": 50703, "epoch": 1207} {"train_loss": -5.722627639770508, "global_step": 50704, "epoch": 1207} {"train_loss": -5.763343334197998, "global_step": 50705, "epoch": 1207} {"train_loss": -5.830144882202148, "global_step": 50706, "epoch": 1207} {"train_loss": -5.781881332397461, "global_step": 50707, "epoch": 1207} {"train_loss": -5.741418838500977, "global_step": 50708, "epoch": 1207} {"train_loss": -5.889069080352783, "global_step": 50709, "epoch": 1207} {"train_loss": -5.730961799621582, "global_step": 50710, "epoch": 1207} {"train_loss": -5.721282958984375, "global_step": 50711, "epoch": 1207} {"train_loss": -5.690871238708496, "global_step": 50712, "epoch": 1207} {"train_loss": -5.72947883605957, "global_step": 50713, "epoch": 1207} {"train_loss": -5.56547737121582, "global_step": 50714, "epoch": 1207} {"train_loss": -5.5957489013671875, "global_step": 50715, "epoch": 1207} {"train_loss": -5.732785701751709, "global_step": 50716, "epoch": 1207} {"train_loss": -5.487239837646484, "global_step": 50717, "epoch": 1207} {"train_loss": -5.676460266113281, "global_step": 50718, "epoch": 1207} {"train_loss": -5.724864482879639, "global_step": 50719, "epoch": 1207} {"train_loss": -5.61089563369751, "global_step": 50720, "epoch": 1207} {"train_loss": -5.750399589538574, "global_step": 50721, "epoch": 1207} {"train_loss": -5.476361274719238, "global_step": 50722, "epoch": 1207} {"train_loss": -5.77595329284668, "global_step": 50723, "epoch": 1207} {"train_loss": -5.428021430969238, "global_step": 50724, "epoch": 1207} {"train_loss": -5.792609214782715, "global_step": 50725, "epoch": 1207} {"train_loss": -5.598494529724121, "global_step": 50726, "epoch": 1207} {"train_loss": -5.83626651763916, "global_step": 50727, "epoch": 1207} {"train_loss": -5.673459529876709, "global_step": 50728, "epoch": 1207} {"train_loss": -5.608107089996338, "global_step": 50729, "epoch": 1207} {"train_loss": -5.574377059936523, "global_step": 50730, "epoch": 1207} {"train_loss": -5.843628406524658, "global_step": 50731, "epoch": 1207} {"train_loss": -5.59843635559082, "global_step": 50732, "epoch": 1207} {"train_loss": -5.783199310302734, "global_step": 50733, "epoch": 1207} {"train_loss": -5.724991321563721, "global_step": 50734, "epoch": 1207} {"train_loss": -5.699816556203933, "global_step": 50735, "epoch": 1207, "val_loss": 74352.4609375} {"train_loss": -5.76096773147583, "global_step": 50736, "epoch": 1208} {"train_loss": -5.857088088989258, "global_step": 50737, "epoch": 1208} {"train_loss": -5.760897636413574, "global_step": 50738, "epoch": 1208} {"train_loss": -5.7004780769348145, "global_step": 50739, "epoch": 1208} {"train_loss": -5.822062969207764, "global_step": 50740, "epoch": 1208} {"train_loss": -5.830576419830322, "global_step": 50741, "epoch": 1208} {"train_loss": -5.8915181159973145, "global_step": 50742, "epoch": 1208} {"train_loss": -5.71435022354126, "global_step": 50743, "epoch": 1208} {"train_loss": -5.663008689880371, "global_step": 50744, "epoch": 1208} {"train_loss": -5.858188152313232, "global_step": 50745, "epoch": 1208} {"train_loss": -5.768031597137451, "global_step": 50746, "epoch": 1208} {"train_loss": -5.85014533996582, "global_step": 50747, "epoch": 1208} {"train_loss": -5.762564659118652, "global_step": 50748, "epoch": 1208} {"train_loss": -5.811583518981934, "global_step": 50749, "epoch": 1208} {"train_loss": -5.811685085296631, "global_step": 50750, "epoch": 1208} {"train_loss": -5.887406826019287, "global_step": 50751, "epoch": 1208} {"train_loss": -5.710351467132568, "global_step": 50752, "epoch": 1208} {"train_loss": -5.814882278442383, "global_step": 50753, "epoch": 1208} {"train_loss": -5.79340124130249, "global_step": 50754, "epoch": 1208} {"train_loss": -5.545413970947266, "global_step": 50755, "epoch": 1208} {"train_loss": -5.798901557922363, "global_step": 50756, "epoch": 1208} {"train_loss": -5.783940315246582, "global_step": 50757, "epoch": 1208} {"train_loss": -5.847385883331299, "global_step": 50758, "epoch": 1208} {"train_loss": -5.83906364440918, "global_step": 50759, "epoch": 1208} {"train_loss": -5.70757532119751, "global_step": 50760, "epoch": 1208} {"train_loss": -5.69747257232666, "global_step": 50761, "epoch": 1208} {"train_loss": -5.78877067565918, "global_step": 50762, "epoch": 1208} {"train_loss": -5.844655513763428, "global_step": 50763, "epoch": 1208} {"train_loss": -5.713192939758301, "global_step": 50764, "epoch": 1208} {"train_loss": -5.81782341003418, "global_step": 50765, "epoch": 1208} {"train_loss": -5.758002281188965, "global_step": 50766, "epoch": 1208} {"train_loss": -5.732614040374756, "global_step": 50767, "epoch": 1208} {"train_loss": -5.650843143463135, "global_step": 50768, "epoch": 1208} {"train_loss": -5.735090732574463, "global_step": 50769, "epoch": 1208} {"train_loss": -5.794668197631836, "global_step": 50770, "epoch": 1208} {"train_loss": -5.761395454406738, "global_step": 50771, "epoch": 1208} {"train_loss": -5.729030609130859, "global_step": 50772, "epoch": 1208} {"train_loss": -5.710503578186035, "global_step": 50773, "epoch": 1208} {"train_loss": -5.788344860076904, "global_step": 50774, "epoch": 1208} {"train_loss": -5.885730743408203, "global_step": 50775, "epoch": 1208} {"train_loss": -5.819618225097656, "global_step": 50776, "epoch": 1208} {"train_loss": -5.77307178860619, "global_step": 50777, "epoch": 1208, "val_loss": 74172.578125} {"train_loss": -5.7877984046936035, "global_step": 50778, "epoch": 1209} {"train_loss": -5.732703685760498, "global_step": 50779, "epoch": 1209} {"train_loss": -5.781956195831299, "global_step": 50780, "epoch": 1209} {"train_loss": -5.718976020812988, "global_step": 50781, "epoch": 1209} {"train_loss": -5.836800575256348, "global_step": 50782, "epoch": 1209} {"train_loss": -5.7739715576171875, "global_step": 50783, "epoch": 1209} {"train_loss": -5.721590042114258, "global_step": 50784, "epoch": 1209} {"train_loss": -5.762145042419434, "global_step": 50785, "epoch": 1209} {"train_loss": -5.797496795654297, "global_step": 50786, "epoch": 1209} {"train_loss": -5.781734466552734, "global_step": 50787, "epoch": 1209} {"train_loss": -5.778277397155762, "global_step": 50788, "epoch": 1209} {"train_loss": -5.871176719665527, "global_step": 50789, "epoch": 1209} {"train_loss": -5.785720348358154, "global_step": 50790, "epoch": 1209} {"train_loss": -5.840641021728516, "global_step": 50791, "epoch": 1209} {"train_loss": -5.785857677459717, "global_step": 50792, "epoch": 1209} {"train_loss": -5.6617560386657715, "global_step": 50793, "epoch": 1209} {"train_loss": -5.883289813995361, "global_step": 50794, "epoch": 1209} {"train_loss": -5.679286003112793, "global_step": 50795, "epoch": 1209} {"train_loss": -5.925018310546875, "global_step": 50796, "epoch": 1209} {"train_loss": -5.7844672203063965, "global_step": 50797, "epoch": 1209} {"train_loss": -5.718454837799072, "global_step": 50798, "epoch": 1209} {"train_loss": -5.835412979125977, "global_step": 50799, "epoch": 1209} {"train_loss": -5.802004337310791, "global_step": 50800, "epoch": 1209} {"train_loss": -5.778818130493164, "global_step": 50801, "epoch": 1209} {"train_loss": -5.695383548736572, "global_step": 50802, "epoch": 1209} {"train_loss": -5.7431488037109375, "global_step": 50803, "epoch": 1209} {"train_loss": -5.65478515625, "global_step": 50804, "epoch": 1209} {"train_loss": -5.920584678649902, "global_step": 50805, "epoch": 1209} {"train_loss": -5.809432029724121, "global_step": 50806, "epoch": 1209} {"train_loss": -5.645081520080566, "global_step": 50807, "epoch": 1209} {"train_loss": -5.818295478820801, "global_step": 50808, "epoch": 1209} {"train_loss": -5.681217193603516, "global_step": 50809, "epoch": 1209} {"train_loss": -5.923680305480957, "global_step": 50810, "epoch": 1209} {"train_loss": -5.659764766693115, "global_step": 50811, "epoch": 1209} {"train_loss": -5.919262886047363, "global_step": 50812, "epoch": 1209} {"train_loss": -5.850834369659424, "global_step": 50813, "epoch": 1209} {"train_loss": -5.8126115798950195, "global_step": 50814, "epoch": 1209} {"train_loss": -5.9039716720581055, "global_step": 50815, "epoch": 1209} {"train_loss": -5.729412078857422, "global_step": 50816, "epoch": 1209} {"train_loss": -5.8113532066345215, "global_step": 50817, "epoch": 1209} {"train_loss": -5.7169036865234375, "global_step": 50818, "epoch": 1209} {"train_loss": -5.782808065414429, "global_step": 50819, "epoch": 1209, "val_loss": 74509.6640625} {"train_loss": -5.803452491760254, "global_step": 50820, "epoch": 1210} {"train_loss": -5.743853569030762, "global_step": 50821, "epoch": 1210} {"train_loss": -5.784959316253662, "global_step": 50822, "epoch": 1210} {"train_loss": -5.703932762145996, "global_step": 50823, "epoch": 1210} {"train_loss": -5.759281158447266, "global_step": 50824, "epoch": 1210} {"train_loss": -5.70402193069458, "global_step": 50825, "epoch": 1210} {"train_loss": -5.709566116333008, "global_step": 50826, "epoch": 1210} {"train_loss": -5.778794288635254, "global_step": 50827, "epoch": 1210} {"train_loss": -5.7374372482299805, "global_step": 50828, "epoch": 1210} {"train_loss": -5.720701217651367, "global_step": 50829, "epoch": 1210} {"train_loss": -5.818092346191406, "global_step": 50830, "epoch": 1210} {"train_loss": -5.689506530761719, "global_step": 50831, "epoch": 1210} {"train_loss": -5.627008438110352, "global_step": 50832, "epoch": 1210} {"train_loss": -5.864495277404785, "global_step": 50833, "epoch": 1210} {"train_loss": -5.700739860534668, "global_step": 50834, "epoch": 1210} {"train_loss": -5.771241188049316, "global_step": 50835, "epoch": 1210} {"train_loss": -5.870687484741211, "global_step": 50836, "epoch": 1210} {"train_loss": -5.667404651641846, "global_step": 50837, "epoch": 1210} {"train_loss": -5.822955131530762, "global_step": 50838, "epoch": 1210} {"train_loss": -5.7004804611206055, "global_step": 50839, "epoch": 1210} {"train_loss": -5.870765209197998, "global_step": 50840, "epoch": 1210} {"train_loss": -5.8306498527526855, "global_step": 50841, "epoch": 1210} {"train_loss": -5.751253128051758, "global_step": 50842, "epoch": 1210} {"train_loss": -5.742527008056641, "global_step": 50843, "epoch": 1210} {"train_loss": -5.879952430725098, "global_step": 50844, "epoch": 1210} {"train_loss": -5.816659927368164, "global_step": 50845, "epoch": 1210} {"train_loss": -5.882987976074219, "global_step": 50846, "epoch": 1210} {"train_loss": -5.623808860778809, "global_step": 50847, "epoch": 1210} {"train_loss": -5.742399215698242, "global_step": 50848, "epoch": 1210} {"train_loss": -5.777202606201172, "global_step": 50849, "epoch": 1210} {"train_loss": -5.718476295471191, "global_step": 50850, "epoch": 1210} {"train_loss": -5.967019557952881, "global_step": 50851, "epoch": 1210} {"train_loss": -5.665931701660156, "global_step": 50852, "epoch": 1210} {"train_loss": -5.810832500457764, "global_step": 50853, "epoch": 1210} {"train_loss": -5.7428388595581055, "global_step": 50854, "epoch": 1210} {"train_loss": -5.754115104675293, "global_step": 50855, "epoch": 1210} {"train_loss": -5.778552532196045, "global_step": 50856, "epoch": 1210} {"train_loss": -5.842573165893555, "global_step": 50857, "epoch": 1210} {"train_loss": -5.7306227684021, "global_step": 50858, "epoch": 1210} {"train_loss": -5.862930774688721, "global_step": 50859, "epoch": 1210} {"train_loss": -5.803606986999512, "global_step": 50860, "epoch": 1210} {"train_loss": -5.768297127314976, "global_step": 50861, "epoch": 1210, "val_loss": 74088.390625} {"train_loss": -5.763274192810059, "global_step": 50862, "epoch": 1211} {"train_loss": -5.74724006652832, "global_step": 50863, "epoch": 1211} {"train_loss": -5.769777774810791, "global_step": 50864, "epoch": 1211} {"train_loss": -5.6771697998046875, "global_step": 50865, "epoch": 1211} {"train_loss": -5.784206390380859, "global_step": 50866, "epoch": 1211} {"train_loss": -5.90869140625, "global_step": 50867, "epoch": 1211} {"train_loss": -5.719834804534912, "global_step": 50868, "epoch": 1211} {"train_loss": -5.759821891784668, "global_step": 50869, "epoch": 1211} {"train_loss": -5.794821739196777, "global_step": 50870, "epoch": 1211} {"train_loss": -5.774359226226807, "global_step": 50871, "epoch": 1211} {"train_loss": -5.794924736022949, "global_step": 50872, "epoch": 1211} {"train_loss": -5.798894882202148, "global_step": 50873, "epoch": 1211} {"train_loss": -5.876806259155273, "global_step": 50874, "epoch": 1211} {"train_loss": -5.714267730712891, "global_step": 50875, "epoch": 1211} {"train_loss": -5.7102813720703125, "global_step": 50876, "epoch": 1211} {"train_loss": -5.86464786529541, "global_step": 50877, "epoch": 1211} {"train_loss": -5.735380172729492, "global_step": 50878, "epoch": 1211} {"train_loss": -5.648812294006348, "global_step": 50879, "epoch": 1211} {"train_loss": -5.75777530670166, "global_step": 50880, "epoch": 1211} {"train_loss": -5.7697858810424805, "global_step": 50881, "epoch": 1211} {"train_loss": -5.705320835113525, "global_step": 50882, "epoch": 1211} {"train_loss": -5.602685451507568, "global_step": 50883, "epoch": 1211} {"train_loss": -5.714922904968262, "global_step": 50884, "epoch": 1211} {"train_loss": -5.723270893096924, "global_step": 50885, "epoch": 1211} {"train_loss": -5.738778114318848, "global_step": 50886, "epoch": 1211} {"train_loss": -5.7842864990234375, "global_step": 50887, "epoch": 1211} {"train_loss": -5.774643898010254, "global_step": 50888, "epoch": 1211} {"train_loss": -5.794803142547607, "global_step": 50889, "epoch": 1211} {"train_loss": -5.788381099700928, "global_step": 50890, "epoch": 1211} {"train_loss": -5.745594024658203, "global_step": 50891, "epoch": 1211} {"train_loss": -5.8022284507751465, "global_step": 50892, "epoch": 1211} {"train_loss": -5.717689514160156, "global_step": 50893, "epoch": 1211} {"train_loss": -5.830385208129883, "global_step": 50894, "epoch": 1211} {"train_loss": -5.685781955718994, "global_step": 50895, "epoch": 1211} {"train_loss": -5.738583564758301, "global_step": 50896, "epoch": 1211} {"train_loss": -5.868748664855957, "global_step": 50897, "epoch": 1211} {"train_loss": -5.704185485839844, "global_step": 50898, "epoch": 1211} {"train_loss": -5.77392578125, "global_step": 50899, "epoch": 1211} {"train_loss": -5.701733589172363, "global_step": 50900, "epoch": 1211} {"train_loss": -5.84086275100708, "global_step": 50901, "epoch": 1211} {"train_loss": -5.718707084655762, "global_step": 50902, "epoch": 1211} {"train_loss": -5.761744748978388, "global_step": 50903, "epoch": 1211, "val_loss": 74149.796875} {"train_loss": -5.785307884216309, "global_step": 50904, "epoch": 1212} {"train_loss": -5.598183631896973, "global_step": 50905, "epoch": 1212} {"train_loss": -5.864706993103027, "global_step": 50906, "epoch": 1212} {"train_loss": -5.678435802459717, "global_step": 50907, "epoch": 1212} {"train_loss": -5.732169151306152, "global_step": 50908, "epoch": 1212} {"train_loss": -5.79815673828125, "global_step": 50909, "epoch": 1212} {"train_loss": -5.747859001159668, "global_step": 50910, "epoch": 1212} {"train_loss": -5.62952184677124, "global_step": 50911, "epoch": 1212} {"train_loss": -5.882983207702637, "global_step": 50912, "epoch": 1212} {"train_loss": -5.685693740844727, "global_step": 50913, "epoch": 1212} {"train_loss": -5.840738296508789, "global_step": 50914, "epoch": 1212} {"train_loss": -5.610007286071777, "global_step": 50915, "epoch": 1212} {"train_loss": -5.671558380126953, "global_step": 50916, "epoch": 1212} {"train_loss": -5.798664093017578, "global_step": 50917, "epoch": 1212} {"train_loss": -5.6988677978515625, "global_step": 50918, "epoch": 1212} {"train_loss": -5.766559600830078, "global_step": 50919, "epoch": 1212} {"train_loss": -5.733715057373047, "global_step": 50920, "epoch": 1212} {"train_loss": -5.718700408935547, "global_step": 50921, "epoch": 1212} {"train_loss": -5.674740791320801, "global_step": 50922, "epoch": 1212} {"train_loss": -5.605666637420654, "global_step": 50923, "epoch": 1212} {"train_loss": -5.718236923217773, "global_step": 50924, "epoch": 1212} {"train_loss": -5.698446273803711, "global_step": 50925, "epoch": 1212} {"train_loss": -5.829315185546875, "global_step": 50926, "epoch": 1212} {"train_loss": -5.630903244018555, "global_step": 50927, "epoch": 1212} {"train_loss": -5.734546184539795, "global_step": 50928, "epoch": 1212} {"train_loss": -5.728960037231445, "global_step": 50929, "epoch": 1212} {"train_loss": -5.708832740783691, "global_step": 50930, "epoch": 1212} {"train_loss": -5.745565414428711, "global_step": 50931, "epoch": 1212} {"train_loss": -5.734199523925781, "global_step": 50932, "epoch": 1212} {"train_loss": -5.67964506149292, "global_step": 50933, "epoch": 1212} {"train_loss": -5.802823066711426, "global_step": 50934, "epoch": 1212} {"train_loss": -5.840390205383301, "global_step": 50935, "epoch": 1212} {"train_loss": -5.659006118774414, "global_step": 50936, "epoch": 1212} {"train_loss": -5.818996429443359, "global_step": 50937, "epoch": 1212} {"train_loss": -5.835053443908691, "global_step": 50938, "epoch": 1212} {"train_loss": -5.726848602294922, "global_step": 50939, "epoch": 1212} {"train_loss": -5.669271469116211, "global_step": 50940, "epoch": 1212} {"train_loss": -5.679534912109375, "global_step": 50941, "epoch": 1212} {"train_loss": -5.695206642150879, "global_step": 50942, "epoch": 1212} {"train_loss": -5.783054828643799, "global_step": 50943, "epoch": 1212} {"train_loss": -5.784614562988281, "global_step": 50944, "epoch": 1212} {"train_loss": -5.734153225308373, "global_step": 50945, "epoch": 1212, "val_loss": 74012.921875} {"train_loss": -5.8955607414245605, "global_step": 50946, "epoch": 1213} {"train_loss": -5.777617454528809, "global_step": 50947, "epoch": 1213} {"train_loss": -5.908164978027344, "global_step": 50948, "epoch": 1213} {"train_loss": -5.848752021789551, "global_step": 50949, "epoch": 1213} {"train_loss": -5.759686470031738, "global_step": 50950, "epoch": 1213} {"train_loss": -5.8025312423706055, "global_step": 50951, "epoch": 1213} {"train_loss": -5.855512619018555, "global_step": 50952, "epoch": 1213} {"train_loss": -5.857173919677734, "global_step": 50953, "epoch": 1213} {"train_loss": -5.85685396194458, "global_step": 50954, "epoch": 1213} {"train_loss": -5.883708477020264, "global_step": 50955, "epoch": 1213} {"train_loss": -5.667994976043701, "global_step": 50956, "epoch": 1213} {"train_loss": -5.731293678283691, "global_step": 50957, "epoch": 1213} {"train_loss": -5.800098896026611, "global_step": 50958, "epoch": 1213} {"train_loss": -5.915546417236328, "global_step": 50959, "epoch": 1213} {"train_loss": -5.627752304077148, "global_step": 50960, "epoch": 1213} {"train_loss": -5.643966197967529, "global_step": 50961, "epoch": 1213} {"train_loss": -5.847459316253662, "global_step": 50962, "epoch": 1213} {"train_loss": -5.912498950958252, "global_step": 50963, "epoch": 1213} {"train_loss": -5.804007530212402, "global_step": 50964, "epoch": 1213} {"train_loss": -5.780004501342773, "global_step": 50965, "epoch": 1213} {"train_loss": -5.8846821784973145, "global_step": 50966, "epoch": 1213} {"train_loss": -5.663235664367676, "global_step": 50967, "epoch": 1213} {"train_loss": -5.793814182281494, "global_step": 50968, "epoch": 1213} {"train_loss": -5.692696571350098, "global_step": 50969, "epoch": 1213} {"train_loss": -5.817837238311768, "global_step": 50970, "epoch": 1213} {"train_loss": -5.871901512145996, "global_step": 50971, "epoch": 1213} {"train_loss": -5.858018398284912, "global_step": 50972, "epoch": 1213} {"train_loss": -5.676326751708984, "global_step": 50973, "epoch": 1213} {"train_loss": -5.624174118041992, "global_step": 50974, "epoch": 1213} {"train_loss": -5.704124927520752, "global_step": 50975, "epoch": 1213} {"train_loss": -5.8069748878479, "global_step": 50976, "epoch": 1213} {"train_loss": -5.692715644836426, "global_step": 50977, "epoch": 1213} {"train_loss": -5.72850227355957, "global_step": 50978, "epoch": 1213} {"train_loss": -5.7320098876953125, "global_step": 50979, "epoch": 1213} {"train_loss": -5.788558006286621, "global_step": 50980, "epoch": 1213} {"train_loss": -5.724859237670898, "global_step": 50981, "epoch": 1213} {"train_loss": -5.675574779510498, "global_step": 50982, "epoch": 1213} {"train_loss": -5.6034417152404785, "global_step": 50983, "epoch": 1213} {"train_loss": -5.717259407043457, "global_step": 50984, "epoch": 1213} {"train_loss": -5.835344314575195, "global_step": 50985, "epoch": 1213} {"train_loss": -5.773312091827393, "global_step": 50986, "epoch": 1213} {"train_loss": -5.777174779347011, "global_step": 50987, "epoch": 1213, "val_loss": 74133.0078125} {"train_loss": -5.807925224304199, "global_step": 50988, "epoch": 1214} {"train_loss": -5.585368633270264, "global_step": 50989, "epoch": 1214} {"train_loss": -5.742702960968018, "global_step": 50990, "epoch": 1214} {"train_loss": -5.74931526184082, "global_step": 50991, "epoch": 1214} {"train_loss": -5.7700886726379395, "global_step": 50992, "epoch": 1214} {"train_loss": -5.741237640380859, "global_step": 50993, "epoch": 1214} {"train_loss": -5.761281490325928, "global_step": 50994, "epoch": 1214} {"train_loss": -5.850105285644531, "global_step": 50995, "epoch": 1214} {"train_loss": -5.8131022453308105, "global_step": 50996, "epoch": 1214} {"train_loss": -5.7987823486328125, "global_step": 50997, "epoch": 1214} {"train_loss": -5.796197414398193, "global_step": 50998, "epoch": 1214} {"train_loss": -5.850584030151367, "global_step": 50999, "epoch": 1214} {"train_loss": -5.769290924072266, "global_step": 51000, "epoch": 1214} {"train_loss": -5.816524505615234, "global_step": 51001, "epoch": 1214} {"train_loss": -5.6651082038879395, "global_step": 51002, "epoch": 1214} {"train_loss": -5.693140983581543, "global_step": 51003, "epoch": 1214} {"train_loss": -5.804928302764893, "global_step": 51004, "epoch": 1214} {"train_loss": -5.759183883666992, "global_step": 51005, "epoch": 1214} {"train_loss": -5.828133583068848, "global_step": 51006, "epoch": 1214} {"train_loss": -5.810386657714844, "global_step": 51007, "epoch": 1214} {"train_loss": -5.875941753387451, "global_step": 51008, "epoch": 1214} {"train_loss": -5.838610649108887, "global_step": 51009, "epoch": 1214} {"train_loss": -5.928949356079102, "global_step": 51010, "epoch": 1214} {"train_loss": -5.9030961990356445, "global_step": 51011, "epoch": 1214} {"train_loss": -5.8962788581848145, "global_step": 51012, "epoch": 1214} {"train_loss": -5.780362129211426, "global_step": 51013, "epoch": 1214} {"train_loss": -5.834501266479492, "global_step": 51014, "epoch": 1214} {"train_loss": -5.95392370223999, "global_step": 51015, "epoch": 1214} {"train_loss": -5.7194695472717285, "global_step": 51016, "epoch": 1214} {"train_loss": -5.83825159072876, "global_step": 51017, "epoch": 1214} {"train_loss": -5.870947360992432, "global_step": 51018, "epoch": 1214} {"train_loss": -5.748568534851074, "global_step": 51019, "epoch": 1214} {"train_loss": -5.90572452545166, "global_step": 51020, "epoch": 1214} {"train_loss": -5.715554237365723, "global_step": 51021, "epoch": 1214} {"train_loss": -5.818047523498535, "global_step": 51022, "epoch": 1214} {"train_loss": -5.905646324157715, "global_step": 51023, "epoch": 1214} {"train_loss": -5.750097751617432, "global_step": 51024, "epoch": 1214} {"train_loss": -5.839755535125732, "global_step": 51025, "epoch": 1214} {"train_loss": -5.821541786193848, "global_step": 51026, "epoch": 1214} {"train_loss": -5.641177177429199, "global_step": 51027, "epoch": 1214} {"train_loss": -5.699230194091797, "global_step": 51028, "epoch": 1214} {"train_loss": -5.79912501289731, "global_step": 51029, "epoch": 1214, "val_loss": 74476.234375} {"train_loss": -5.916420936584473, "global_step": 51030, "epoch": 1215} {"train_loss": -5.818157196044922, "global_step": 51031, "epoch": 1215} {"train_loss": -5.790866851806641, "global_step": 51032, "epoch": 1215} {"train_loss": -5.802116394042969, "global_step": 51033, "epoch": 1215} {"train_loss": -5.76076602935791, "global_step": 51034, "epoch": 1215} {"train_loss": -5.759197235107422, "global_step": 51035, "epoch": 1215} {"train_loss": -5.7801194190979, "global_step": 51036, "epoch": 1215} {"train_loss": -5.75445556640625, "global_step": 51037, "epoch": 1215} {"train_loss": -5.8606767654418945, "global_step": 51038, "epoch": 1215} {"train_loss": -5.822342872619629, "global_step": 51039, "epoch": 1215} {"train_loss": -5.578310966491699, "global_step": 51040, "epoch": 1215} {"train_loss": -5.748939514160156, "global_step": 51041, "epoch": 1215} {"train_loss": -5.717848777770996, "global_step": 51042, "epoch": 1215} {"train_loss": -5.676556587219238, "global_step": 51043, "epoch": 1215} {"train_loss": -5.862142562866211, "global_step": 51044, "epoch": 1215} {"train_loss": -5.738415718078613, "global_step": 51045, "epoch": 1215} {"train_loss": -5.881203651428223, "global_step": 51046, "epoch": 1215} {"train_loss": -5.718152046203613, "global_step": 51047, "epoch": 1215} {"train_loss": -5.797362327575684, "global_step": 51048, "epoch": 1215} {"train_loss": -5.884157657623291, "global_step": 51049, "epoch": 1215} {"train_loss": -5.751061916351318, "global_step": 51050, "epoch": 1215} {"train_loss": -5.832983493804932, "global_step": 51051, "epoch": 1215} {"train_loss": -5.752630233764648, "global_step": 51052, "epoch": 1215} {"train_loss": -5.638087749481201, "global_step": 51053, "epoch": 1215} {"train_loss": -5.855806350708008, "global_step": 51054, "epoch": 1215} {"train_loss": -5.733126640319824, "global_step": 51055, "epoch": 1215} {"train_loss": -5.697566986083984, "global_step": 51056, "epoch": 1215} {"train_loss": -5.843557357788086, "global_step": 51057, "epoch": 1215} {"train_loss": -5.817940711975098, "global_step": 51058, "epoch": 1215} {"train_loss": -5.729104042053223, "global_step": 51059, "epoch": 1215} {"train_loss": -5.847036361694336, "global_step": 51060, "epoch": 1215} {"train_loss": -5.769614219665527, "global_step": 51061, "epoch": 1215} {"train_loss": -5.726995468139648, "global_step": 51062, "epoch": 1215} {"train_loss": -5.747727870941162, "global_step": 51063, "epoch": 1215} {"train_loss": -5.7333879470825195, "global_step": 51064, "epoch": 1215} {"train_loss": -5.738519668579102, "global_step": 51065, "epoch": 1215} {"train_loss": -5.877463340759277, "global_step": 51066, "epoch": 1215} {"train_loss": -5.636710166931152, "global_step": 51067, "epoch": 1215} {"train_loss": -5.784150123596191, "global_step": 51068, "epoch": 1215} {"train_loss": -5.620848655700684, "global_step": 51069, "epoch": 1215} {"train_loss": -5.863529205322266, "global_step": 51070, "epoch": 1215} {"train_loss": -5.772766737710862, "global_step": 51071, "epoch": 1215, "val_loss": 74249.9375} {"train_loss": -5.792035102844238, "global_step": 51072, "epoch": 1216} {"train_loss": -5.7096052169799805, "global_step": 51073, "epoch": 1216} {"train_loss": -5.704928398132324, "global_step": 51074, "epoch": 1216} {"train_loss": -5.826840877532959, "global_step": 51075, "epoch": 1216} {"train_loss": -5.67143440246582, "global_step": 51076, "epoch": 1216} {"train_loss": -5.811982154846191, "global_step": 51077, "epoch": 1216} {"train_loss": -5.828522682189941, "global_step": 51078, "epoch": 1216} {"train_loss": -5.828291893005371, "global_step": 51079, "epoch": 1216} {"train_loss": -5.750493049621582, "global_step": 51080, "epoch": 1216} {"train_loss": -5.7197160720825195, "global_step": 51081, "epoch": 1216} {"train_loss": -5.720243453979492, "global_step": 51082, "epoch": 1216} {"train_loss": -5.83416748046875, "global_step": 51083, "epoch": 1216} {"train_loss": -5.856366157531738, "global_step": 51084, "epoch": 1216} {"train_loss": -5.672092914581299, "global_step": 51085, "epoch": 1216} {"train_loss": -5.741839408874512, "global_step": 51086, "epoch": 1216} {"train_loss": -5.809374809265137, "global_step": 51087, "epoch": 1216} {"train_loss": -5.794580459594727, "global_step": 51088, "epoch": 1216} {"train_loss": -5.646164894104004, "global_step": 51089, "epoch": 1216} {"train_loss": -5.734444618225098, "global_step": 51090, "epoch": 1216} {"train_loss": -5.686184883117676, "global_step": 51091, "epoch": 1216} {"train_loss": -5.910547256469727, "global_step": 51092, "epoch": 1216} {"train_loss": -5.903367519378662, "global_step": 51093, "epoch": 1216} {"train_loss": -5.779562950134277, "global_step": 51094, "epoch": 1216} {"train_loss": -5.710133075714111, "global_step": 51095, "epoch": 1216} {"train_loss": -5.773149490356445, "global_step": 51096, "epoch": 1216} {"train_loss": -5.807003021240234, "global_step": 51097, "epoch": 1216} {"train_loss": -5.756723403930664, "global_step": 51098, "epoch": 1216} {"train_loss": -5.782903671264648, "global_step": 51099, "epoch": 1216} {"train_loss": -5.751320838928223, "global_step": 51100, "epoch": 1216} {"train_loss": -5.68263053894043, "global_step": 51101, "epoch": 1216} {"train_loss": -5.836614608764648, "global_step": 51102, "epoch": 1216} {"train_loss": -5.854544639587402, "global_step": 51103, "epoch": 1216} {"train_loss": -5.862563133239746, "global_step": 51104, "epoch": 1216} {"train_loss": -5.862306594848633, "global_step": 51105, "epoch": 1216} {"train_loss": -5.7470703125, "global_step": 51106, "epoch": 1216} {"train_loss": -5.867887496948242, "global_step": 51107, "epoch": 1216} {"train_loss": -5.86401891708374, "global_step": 51108, "epoch": 1216} {"train_loss": -5.784313201904297, "global_step": 51109, "epoch": 1216} {"train_loss": -5.813590049743652, "global_step": 51110, "epoch": 1216} {"train_loss": -5.880814075469971, "global_step": 51111, "epoch": 1216} {"train_loss": -5.822196960449219, "global_step": 51112, "epoch": 1216} {"train_loss": -5.7843299025581, "global_step": 51113, "epoch": 1216, "val_loss": 73978.609375} {"train_loss": -5.82548189163208, "global_step": 51114, "epoch": 1217} {"train_loss": -5.892184734344482, "global_step": 51115, "epoch": 1217} {"train_loss": -5.795903205871582, "global_step": 51116, "epoch": 1217} {"train_loss": -5.738750457763672, "global_step": 51117, "epoch": 1217} {"train_loss": -5.715827941894531, "global_step": 51118, "epoch": 1217} {"train_loss": -5.685623645782471, "global_step": 51119, "epoch": 1217} {"train_loss": -5.775423049926758, "global_step": 51120, "epoch": 1217} {"train_loss": -5.832202911376953, "global_step": 51121, "epoch": 1217} {"train_loss": -5.7733259201049805, "global_step": 51122, "epoch": 1217} {"train_loss": -5.883535385131836, "global_step": 51123, "epoch": 1217} {"train_loss": -5.78537654876709, "global_step": 51124, "epoch": 1217} {"train_loss": -5.852129936218262, "global_step": 51125, "epoch": 1217} {"train_loss": -5.698954105377197, "global_step": 51126, "epoch": 1217} {"train_loss": -5.841877460479736, "global_step": 51127, "epoch": 1217} {"train_loss": -5.72434139251709, "global_step": 51128, "epoch": 1217} {"train_loss": -5.580658912658691, "global_step": 51129, "epoch": 1217} {"train_loss": -5.710572242736816, "global_step": 51130, "epoch": 1217} {"train_loss": -5.755273342132568, "global_step": 51131, "epoch": 1217} {"train_loss": -5.73475456237793, "global_step": 51132, "epoch": 1217} {"train_loss": -5.81993293762207, "global_step": 51133, "epoch": 1217} {"train_loss": -5.874720573425293, "global_step": 51134, "epoch": 1217} {"train_loss": -5.786951541900635, "global_step": 51135, "epoch": 1217} {"train_loss": -5.790162086486816, "global_step": 51136, "epoch": 1217} {"train_loss": -5.855515003204346, "global_step": 51137, "epoch": 1217} {"train_loss": -5.785026550292969, "global_step": 51138, "epoch": 1217} {"train_loss": -5.695993423461914, "global_step": 51139, "epoch": 1217} {"train_loss": -5.695281505584717, "global_step": 51140, "epoch": 1217} {"train_loss": -5.9007182121276855, "global_step": 51141, "epoch": 1217} {"train_loss": -5.807103157043457, "global_step": 51142, "epoch": 1217} {"train_loss": -5.734023094177246, "global_step": 51143, "epoch": 1217} {"train_loss": -5.717162132263184, "global_step": 51144, "epoch": 1217} {"train_loss": -5.734724044799805, "global_step": 51145, "epoch": 1217} {"train_loss": -5.67222785949707, "global_step": 51146, "epoch": 1217} {"train_loss": -5.824560642242432, "global_step": 51147, "epoch": 1217} {"train_loss": -5.815424919128418, "global_step": 51148, "epoch": 1217} {"train_loss": -5.714886665344238, "global_step": 51149, "epoch": 1217} {"train_loss": -5.690567970275879, "global_step": 51150, "epoch": 1217} {"train_loss": -5.7373175621032715, "global_step": 51151, "epoch": 1217} {"train_loss": -5.792959213256836, "global_step": 51152, "epoch": 1217} {"train_loss": -5.79603385925293, "global_step": 51153, "epoch": 1217} {"train_loss": -5.655369758605957, "global_step": 51154, "epoch": 1217} {"train_loss": -5.768425237564814, "global_step": 51155, "epoch": 1217, "val_loss": 74295.8984375} {"train_loss": -5.7902727127075195, "global_step": 51156, "epoch": 1218} {"train_loss": -5.63916015625, "global_step": 51157, "epoch": 1218} {"train_loss": -5.758650779724121, "global_step": 51158, "epoch": 1218} {"train_loss": -5.793562889099121, "global_step": 51159, "epoch": 1218} {"train_loss": -5.8763427734375, "global_step": 51160, "epoch": 1218} {"train_loss": -5.825356483459473, "global_step": 51161, "epoch": 1218} {"train_loss": -5.694616794586182, "global_step": 51162, "epoch": 1218} {"train_loss": -5.752445220947266, "global_step": 51163, "epoch": 1218} {"train_loss": -5.814853191375732, "global_step": 51164, "epoch": 1218} {"train_loss": -5.730508804321289, "global_step": 51165, "epoch": 1218} {"train_loss": -5.76792049407959, "global_step": 51166, "epoch": 1218} {"train_loss": -5.7721757888793945, "global_step": 51167, "epoch": 1218} {"train_loss": -5.704211235046387, "global_step": 51168, "epoch": 1218} {"train_loss": -5.8533124923706055, "global_step": 51169, "epoch": 1218} {"train_loss": -5.763917922973633, "global_step": 51170, "epoch": 1218} {"train_loss": -5.735953330993652, "global_step": 51171, "epoch": 1218} {"train_loss": -5.802036285400391, "global_step": 51172, "epoch": 1218} {"train_loss": -5.776828289031982, "global_step": 51173, "epoch": 1218} {"train_loss": -5.834672927856445, "global_step": 51174, "epoch": 1218} {"train_loss": -5.9046711921691895, "global_step": 51175, "epoch": 1218} {"train_loss": -5.652899742126465, "global_step": 51176, "epoch": 1218} {"train_loss": -5.9010138511657715, "global_step": 51177, "epoch": 1218} {"train_loss": -5.6948676109313965, "global_step": 51178, "epoch": 1218} {"train_loss": -5.6679582595825195, "global_step": 51179, "epoch": 1218} {"train_loss": -5.7267165184021, "global_step": 51180, "epoch": 1218} {"train_loss": -5.704150676727295, "global_step": 51181, "epoch": 1218} {"train_loss": -5.7593793869018555, "global_step": 51182, "epoch": 1218} {"train_loss": -5.816991806030273, "global_step": 51183, "epoch": 1218} {"train_loss": -5.724185466766357, "global_step": 51184, "epoch": 1218} {"train_loss": -5.814774513244629, "global_step": 51185, "epoch": 1218} {"train_loss": -5.830760955810547, "global_step": 51186, "epoch": 1218} {"train_loss": -5.741837501525879, "global_step": 51187, "epoch": 1218} {"train_loss": -5.788003921508789, "global_step": 51188, "epoch": 1218} {"train_loss": -5.732237815856934, "global_step": 51189, "epoch": 1218} {"train_loss": -5.7678303718566895, "global_step": 51190, "epoch": 1218} {"train_loss": -5.975098609924316, "global_step": 51191, "epoch": 1218} {"train_loss": -5.845486640930176, "global_step": 51192, "epoch": 1218} {"train_loss": -5.949019432067871, "global_step": 51193, "epoch": 1218} {"train_loss": -5.682577133178711, "global_step": 51194, "epoch": 1218} {"train_loss": -5.872920513153076, "global_step": 51195, "epoch": 1218} {"train_loss": -5.829452037811279, "global_step": 51196, "epoch": 1218} {"train_loss": -5.785111960910616, "global_step": 51197, "epoch": 1218, "val_loss": 74170.1015625} {"train_loss": -5.752462387084961, "global_step": 51198, "epoch": 1219} {"train_loss": -5.802423477172852, "global_step": 51199, "epoch": 1219} {"train_loss": -5.76929235458374, "global_step": 51200, "epoch": 1219} {"train_loss": -5.783756732940674, "global_step": 51201, "epoch": 1219} {"train_loss": -5.786064147949219, "global_step": 51202, "epoch": 1219} {"train_loss": -5.828790664672852, "global_step": 51203, "epoch": 1219} {"train_loss": -5.720754146575928, "global_step": 51204, "epoch": 1219} {"train_loss": -5.835294723510742, "global_step": 51205, "epoch": 1219} {"train_loss": -5.719585418701172, "global_step": 51206, "epoch": 1219} {"train_loss": -5.702195167541504, "global_step": 51207, "epoch": 1219} {"train_loss": -5.798798084259033, "global_step": 51208, "epoch": 1219} {"train_loss": -5.6764421463012695, "global_step": 51209, "epoch": 1219} {"train_loss": -5.723355293273926, "global_step": 51210, "epoch": 1219} {"train_loss": -5.754217624664307, "global_step": 51211, "epoch": 1219} {"train_loss": -5.648884296417236, "global_step": 51212, "epoch": 1219} {"train_loss": -5.797060966491699, "global_step": 51213, "epoch": 1219} {"train_loss": -5.757822513580322, "global_step": 51214, "epoch": 1219} {"train_loss": -5.7073588371276855, "global_step": 51215, "epoch": 1219} {"train_loss": -5.7221527099609375, "global_step": 51216, "epoch": 1219} {"train_loss": -5.878613471984863, "global_step": 51217, "epoch": 1219} {"train_loss": -5.885318279266357, "global_step": 51218, "epoch": 1219} {"train_loss": -5.830958366394043, "global_step": 51219, "epoch": 1219} {"train_loss": -5.818639755249023, "global_step": 51220, "epoch": 1219} {"train_loss": -5.943292617797852, "global_step": 51221, "epoch": 1219} {"train_loss": -5.815492630004883, "global_step": 51222, "epoch": 1219} {"train_loss": -5.800821304321289, "global_step": 51223, "epoch": 1219} {"train_loss": -5.752765655517578, "global_step": 51224, "epoch": 1219} {"train_loss": -5.710142135620117, "global_step": 51225, "epoch": 1219} {"train_loss": -5.8656110763549805, "global_step": 51226, "epoch": 1219} {"train_loss": -5.728322982788086, "global_step": 51227, "epoch": 1219} {"train_loss": -5.7315144538879395, "global_step": 51228, "epoch": 1219} {"train_loss": -5.761977195739746, "global_step": 51229, "epoch": 1219} {"train_loss": -5.8225202560424805, "global_step": 51230, "epoch": 1219} {"train_loss": -5.744740962982178, "global_step": 51231, "epoch": 1219} {"train_loss": -5.688819408416748, "global_step": 51232, "epoch": 1219} {"train_loss": -5.838624000549316, "global_step": 51233, "epoch": 1219} {"train_loss": -5.85075569152832, "global_step": 51234, "epoch": 1219} {"train_loss": -5.717430114746094, "global_step": 51235, "epoch": 1219} {"train_loss": -5.758896827697754, "global_step": 51236, "epoch": 1219} {"train_loss": -5.758725166320801, "global_step": 51237, "epoch": 1219} {"train_loss": -5.78330135345459, "global_step": 51238, "epoch": 1219} {"train_loss": -5.775103183019729, "global_step": 51239, "epoch": 1219, "val_loss": 74213.2265625} {"train_loss": -5.8627424240112305, "global_step": 51240, "epoch": 1220} {"train_loss": -5.893479824066162, "global_step": 51241, "epoch": 1220} {"train_loss": -5.84716796875, "global_step": 51242, "epoch": 1220} {"train_loss": -5.7797040939331055, "global_step": 51243, "epoch": 1220} {"train_loss": -5.7855143547058105, "global_step": 51244, "epoch": 1220} {"train_loss": -5.807793140411377, "global_step": 51245, "epoch": 1220} {"train_loss": -5.682611465454102, "global_step": 51246, "epoch": 1220} {"train_loss": -5.725488662719727, "global_step": 51247, "epoch": 1220} {"train_loss": -5.78273868560791, "global_step": 51248, "epoch": 1220} {"train_loss": -5.691037178039551, "global_step": 51249, "epoch": 1220} {"train_loss": -5.796716690063477, "global_step": 51250, "epoch": 1220} {"train_loss": -5.756862640380859, "global_step": 51251, "epoch": 1220} {"train_loss": -5.773016452789307, "global_step": 51252, "epoch": 1220} {"train_loss": -5.804792404174805, "global_step": 51253, "epoch": 1220} {"train_loss": -5.731308937072754, "global_step": 51254, "epoch": 1220} {"train_loss": -5.816143989562988, "global_step": 51255, "epoch": 1220} {"train_loss": -5.828671932220459, "global_step": 51256, "epoch": 1220} {"train_loss": -5.8072509765625, "global_step": 51257, "epoch": 1220} {"train_loss": -5.862630844116211, "global_step": 51258, "epoch": 1220} {"train_loss": -5.8351898193359375, "global_step": 51259, "epoch": 1220} {"train_loss": -5.842113494873047, "global_step": 51260, "epoch": 1220} {"train_loss": -5.876897811889648, "global_step": 51261, "epoch": 1220} {"train_loss": -5.853955268859863, "global_step": 51262, "epoch": 1220} {"train_loss": -5.779416084289551, "global_step": 51263, "epoch": 1220} {"train_loss": -5.820433616638184, "global_step": 51264, "epoch": 1220} {"train_loss": -5.756437301635742, "global_step": 51265, "epoch": 1220} {"train_loss": -5.756442546844482, "global_step": 51266, "epoch": 1220} {"train_loss": -5.962657928466797, "global_step": 51267, "epoch": 1220} {"train_loss": -5.898050785064697, "global_step": 51268, "epoch": 1220} {"train_loss": -5.7521138191223145, "global_step": 51269, "epoch": 1220} {"train_loss": -5.824423789978027, "global_step": 51270, "epoch": 1220} {"train_loss": -5.855414390563965, "global_step": 51271, "epoch": 1220} {"train_loss": -5.644138336181641, "global_step": 51272, "epoch": 1220} {"train_loss": -5.802488327026367, "global_step": 51273, "epoch": 1220} {"train_loss": -5.953775405883789, "global_step": 51274, "epoch": 1220} {"train_loss": -5.672819137573242, "global_step": 51275, "epoch": 1220} {"train_loss": -5.755776882171631, "global_step": 51276, "epoch": 1220} {"train_loss": -5.8058671951293945, "global_step": 51277, "epoch": 1220} {"train_loss": -5.717531681060791, "global_step": 51278, "epoch": 1220} {"train_loss": -5.790994644165039, "global_step": 51279, "epoch": 1220} {"train_loss": -5.780370712280273, "global_step": 51280, "epoch": 1220} {"train_loss": -5.80011983144851, "global_step": 51281, "epoch": 1220, "val_loss": 74615.2421875} {"train_loss": -5.789440155029297, "global_step": 51282, "epoch": 1221} {"train_loss": -5.883083343505859, "global_step": 51283, "epoch": 1221} {"train_loss": -5.73513126373291, "global_step": 51284, "epoch": 1221} {"train_loss": -5.819966793060303, "global_step": 51285, "epoch": 1221} {"train_loss": -5.805375099182129, "global_step": 51286, "epoch": 1221} {"train_loss": -5.951976776123047, "global_step": 51287, "epoch": 1221} {"train_loss": -5.821639537811279, "global_step": 51288, "epoch": 1221} {"train_loss": -5.631872177124023, "global_step": 51289, "epoch": 1221} {"train_loss": -5.766541004180908, "global_step": 51290, "epoch": 1221} {"train_loss": -5.857386589050293, "global_step": 51291, "epoch": 1221} {"train_loss": -5.716536521911621, "global_step": 51292, "epoch": 1221} {"train_loss": -5.83652400970459, "global_step": 51293, "epoch": 1221} {"train_loss": -5.8488287925720215, "global_step": 51294, "epoch": 1221} {"train_loss": -5.832745552062988, "global_step": 51295, "epoch": 1221} {"train_loss": -5.902832984924316, "global_step": 51296, "epoch": 1221} {"train_loss": -5.789983749389648, "global_step": 51297, "epoch": 1221} {"train_loss": -5.887618064880371, "global_step": 51298, "epoch": 1221} {"train_loss": -5.685406684875488, "global_step": 51299, "epoch": 1221} {"train_loss": -5.78455114364624, "global_step": 51300, "epoch": 1221} {"train_loss": -5.721296310424805, "global_step": 51301, "epoch": 1221} {"train_loss": -5.771991729736328, "global_step": 51302, "epoch": 1221} {"train_loss": -5.747111797332764, "global_step": 51303, "epoch": 1221} {"train_loss": -5.7802348136901855, "global_step": 51304, "epoch": 1221} {"train_loss": -5.599820137023926, "global_step": 51305, "epoch": 1221} {"train_loss": -5.927097797393799, "global_step": 51306, "epoch": 1221} {"train_loss": -5.76583194732666, "global_step": 51307, "epoch": 1221} {"train_loss": -5.72502326965332, "global_step": 51308, "epoch": 1221} {"train_loss": -5.78382682800293, "global_step": 51309, "epoch": 1221} {"train_loss": -5.790533065795898, "global_step": 51310, "epoch": 1221} {"train_loss": -5.927879810333252, "global_step": 51311, "epoch": 1221} {"train_loss": -5.751716613769531, "global_step": 51312, "epoch": 1221} {"train_loss": -5.815484046936035, "global_step": 51313, "epoch": 1221} {"train_loss": -5.659117698669434, "global_step": 51314, "epoch": 1221} {"train_loss": -5.719359874725342, "global_step": 51315, "epoch": 1221} {"train_loss": -5.780398368835449, "global_step": 51316, "epoch": 1221} {"train_loss": -5.836300373077393, "global_step": 51317, "epoch": 1221} {"train_loss": -5.686946392059326, "global_step": 51318, "epoch": 1221} {"train_loss": -5.758233070373535, "global_step": 51319, "epoch": 1221} {"train_loss": -5.785253524780273, "global_step": 51320, "epoch": 1221} {"train_loss": -5.864212989807129, "global_step": 51321, "epoch": 1221} {"train_loss": -5.784599304199219, "global_step": 51322, "epoch": 1221} {"train_loss": -5.79185886610122, "global_step": 51323, "epoch": 1221, "val_loss": 74397.6796875} {"train_loss": -5.777430534362793, "global_step": 51324, "epoch": 1222} {"train_loss": -5.825483322143555, "global_step": 51325, "epoch": 1222} {"train_loss": -5.8830366134643555, "global_step": 51326, "epoch": 1222} {"train_loss": -5.714086055755615, "global_step": 51327, "epoch": 1222} {"train_loss": -5.939361572265625, "global_step": 51328, "epoch": 1222} {"train_loss": -5.649684429168701, "global_step": 51329, "epoch": 1222} {"train_loss": -5.812444686889648, "global_step": 51330, "epoch": 1222} {"train_loss": -5.798476219177246, "global_step": 51331, "epoch": 1222} {"train_loss": -5.8190412521362305, "global_step": 51332, "epoch": 1222} {"train_loss": -5.807991027832031, "global_step": 51333, "epoch": 1222} {"train_loss": -5.840538024902344, "global_step": 51334, "epoch": 1222} {"train_loss": -5.726710319519043, "global_step": 51335, "epoch": 1222} {"train_loss": -5.852705001831055, "global_step": 51336, "epoch": 1222} {"train_loss": -5.679620742797852, "global_step": 51337, "epoch": 1222} {"train_loss": -5.738364219665527, "global_step": 51338, "epoch": 1222} {"train_loss": -5.805865287780762, "global_step": 51339, "epoch": 1222} {"train_loss": -5.719179630279541, "global_step": 51340, "epoch": 1222} {"train_loss": -5.782772541046143, "global_step": 51341, "epoch": 1222} {"train_loss": -5.874734878540039, "global_step": 51342, "epoch": 1222} {"train_loss": -5.638138771057129, "global_step": 51343, "epoch": 1222} {"train_loss": -5.726678371429443, "global_step": 51344, "epoch": 1222} {"train_loss": -5.718930721282959, "global_step": 51345, "epoch": 1222} {"train_loss": -5.815672397613525, "global_step": 51346, "epoch": 1222} {"train_loss": -5.755814552307129, "global_step": 51347, "epoch": 1222} {"train_loss": -5.805116176605225, "global_step": 51348, "epoch": 1222} {"train_loss": -5.693545341491699, "global_step": 51349, "epoch": 1222} {"train_loss": -5.940621376037598, "global_step": 51350, "epoch": 1222} {"train_loss": -5.720129013061523, "global_step": 51351, "epoch": 1222} {"train_loss": -5.873762130737305, "global_step": 51352, "epoch": 1222} {"train_loss": -5.747709274291992, "global_step": 51353, "epoch": 1222} {"train_loss": -5.800437927246094, "global_step": 51354, "epoch": 1222} {"train_loss": -5.799252033233643, "global_step": 51355, "epoch": 1222} {"train_loss": -5.807826995849609, "global_step": 51356, "epoch": 1222} {"train_loss": -5.769584655761719, "global_step": 51357, "epoch": 1222} {"train_loss": -5.819002151489258, "global_step": 51358, "epoch": 1222} {"train_loss": -5.850556373596191, "global_step": 51359, "epoch": 1222} {"train_loss": -5.782111644744873, "global_step": 51360, "epoch": 1222} {"train_loss": -5.8455939292907715, "global_step": 51361, "epoch": 1222} {"train_loss": -5.750464916229248, "global_step": 51362, "epoch": 1222} {"train_loss": -5.902446746826172, "global_step": 51363, "epoch": 1222} {"train_loss": -5.810366630554199, "global_step": 51364, "epoch": 1222} {"train_loss": -5.791516826266334, "global_step": 51365, "epoch": 1222, "val_loss": 74090.984375} {"train_loss": -5.807297229766846, "global_step": 51366, "epoch": 1223} {"train_loss": -5.759037017822266, "global_step": 51367, "epoch": 1223} {"train_loss": -5.775357246398926, "global_step": 51368, "epoch": 1223} {"train_loss": -5.704902648925781, "global_step": 51369, "epoch": 1223} {"train_loss": -5.811217784881592, "global_step": 51370, "epoch": 1223} {"train_loss": -5.752634048461914, "global_step": 51371, "epoch": 1223} {"train_loss": -5.850135803222656, "global_step": 51372, "epoch": 1223} {"train_loss": -5.843542098999023, "global_step": 51373, "epoch": 1223} {"train_loss": -5.590946674346924, "global_step": 51374, "epoch": 1223} {"train_loss": -5.756736755371094, "global_step": 51375, "epoch": 1223} {"train_loss": -5.848508358001709, "global_step": 51376, "epoch": 1223} {"train_loss": -5.645650863647461, "global_step": 51377, "epoch": 1223} {"train_loss": -5.752035140991211, "global_step": 51378, "epoch": 1223} {"train_loss": -5.819182395935059, "global_step": 51379, "epoch": 1223} {"train_loss": -5.810157775878906, "global_step": 51380, "epoch": 1223} {"train_loss": -5.708293914794922, "global_step": 51381, "epoch": 1223} {"train_loss": -5.776035308837891, "global_step": 51382, "epoch": 1223} {"train_loss": -5.82430362701416, "global_step": 51383, "epoch": 1223} {"train_loss": -5.781205654144287, "global_step": 51384, "epoch": 1223} {"train_loss": -5.785425186157227, "global_step": 51385, "epoch": 1223} {"train_loss": -5.7763543128967285, "global_step": 51386, "epoch": 1223} {"train_loss": -5.81716251373291, "global_step": 51387, "epoch": 1223} {"train_loss": -5.822986602783203, "global_step": 51388, "epoch": 1223} {"train_loss": -5.761842727661133, "global_step": 51389, "epoch": 1223} {"train_loss": -5.845476150512695, "global_step": 51390, "epoch": 1223} {"train_loss": -5.824441432952881, "global_step": 51391, "epoch": 1223} {"train_loss": -5.737456798553467, "global_step": 51392, "epoch": 1223} {"train_loss": -5.781991004943848, "global_step": 51393, "epoch": 1223} {"train_loss": -5.751335620880127, "global_step": 51394, "epoch": 1223} {"train_loss": -5.700412750244141, "global_step": 51395, "epoch": 1223} {"train_loss": -5.770228862762451, "global_step": 51396, "epoch": 1223} {"train_loss": -5.877565860748291, "global_step": 51397, "epoch": 1223} {"train_loss": -5.797283172607422, "global_step": 51398, "epoch": 1223} {"train_loss": -5.815368175506592, "global_step": 51399, "epoch": 1223} {"train_loss": -5.772497177124023, "global_step": 51400, "epoch": 1223} {"train_loss": -5.786735534667969, "global_step": 51401, "epoch": 1223} {"train_loss": -5.806061744689941, "global_step": 51402, "epoch": 1223} {"train_loss": -5.7246413230896, "global_step": 51403, "epoch": 1223} {"train_loss": -5.852997779846191, "global_step": 51404, "epoch": 1223} {"train_loss": -5.586963653564453, "global_step": 51405, "epoch": 1223} {"train_loss": -5.886551856994629, "global_step": 51406, "epoch": 1223} {"train_loss": -5.775709118161883, "global_step": 51407, "epoch": 1223, "val_loss": 74508.640625} {"train_loss": -5.695136547088623, "global_step": 51408, "epoch": 1224} {"train_loss": -5.830471992492676, "global_step": 51409, "epoch": 1224} {"train_loss": -5.644376754760742, "global_step": 51410, "epoch": 1224} {"train_loss": -5.76796293258667, "global_step": 51411, "epoch": 1224} {"train_loss": -5.811480522155762, "global_step": 51412, "epoch": 1224} {"train_loss": -5.810710906982422, "global_step": 51413, "epoch": 1224} {"train_loss": -5.701878547668457, "global_step": 51414, "epoch": 1224} {"train_loss": -5.682602882385254, "global_step": 51415, "epoch": 1224} {"train_loss": -5.744631767272949, "global_step": 51416, "epoch": 1224} {"train_loss": -5.892570495605469, "global_step": 51417, "epoch": 1224} {"train_loss": -5.757067680358887, "global_step": 51418, "epoch": 1224} {"train_loss": -5.756040573120117, "global_step": 51419, "epoch": 1224} {"train_loss": -5.7817769050598145, "global_step": 51420, "epoch": 1224} {"train_loss": -5.761025905609131, "global_step": 51421, "epoch": 1224} {"train_loss": -5.7131500244140625, "global_step": 51422, "epoch": 1224} {"train_loss": -5.905605316162109, "global_step": 51423, "epoch": 1224} {"train_loss": -5.938478946685791, "global_step": 51424, "epoch": 1224} {"train_loss": -5.9179558753967285, "global_step": 51425, "epoch": 1224} {"train_loss": -5.816168785095215, "global_step": 51426, "epoch": 1224} {"train_loss": -5.830936431884766, "global_step": 51427, "epoch": 1224} {"train_loss": -5.73783540725708, "global_step": 51428, "epoch": 1224} {"train_loss": -5.887294292449951, "global_step": 51429, "epoch": 1224} {"train_loss": -5.778116703033447, "global_step": 51430, "epoch": 1224} {"train_loss": -5.849626541137695, "global_step": 51431, "epoch": 1224} {"train_loss": -5.809972286224365, "global_step": 51432, "epoch": 1224} {"train_loss": -5.680733680725098, "global_step": 51433, "epoch": 1224} {"train_loss": -5.796813011169434, "global_step": 51434, "epoch": 1224} {"train_loss": -5.684759616851807, "global_step": 51435, "epoch": 1224} {"train_loss": -5.714564800262451, "global_step": 51436, "epoch": 1224} {"train_loss": -5.878663539886475, "global_step": 51437, "epoch": 1224} {"train_loss": -5.776394844055176, "global_step": 51438, "epoch": 1224} {"train_loss": -5.826783180236816, "global_step": 51439, "epoch": 1224} {"train_loss": -5.845582485198975, "global_step": 51440, "epoch": 1224} {"train_loss": -5.72420072555542, "global_step": 51441, "epoch": 1224} {"train_loss": -5.829317092895508, "global_step": 51442, "epoch": 1224} {"train_loss": -5.741846084594727, "global_step": 51443, "epoch": 1224} {"train_loss": -5.733675479888916, "global_step": 51444, "epoch": 1224} {"train_loss": -5.695974826812744, "global_step": 51445, "epoch": 1224} {"train_loss": -5.851494789123535, "global_step": 51446, "epoch": 1224} {"train_loss": -5.854595184326172, "global_step": 51447, "epoch": 1224} {"train_loss": -5.83819055557251, "global_step": 51448, "epoch": 1224} {"train_loss": -5.7860605489640005, "global_step": 51449, "epoch": 1224, "val_loss": 74487.3359375} {"train_loss": -5.899784088134766, "global_step": 51450, "epoch": 1225} {"train_loss": -5.820572376251221, "global_step": 51451, "epoch": 1225} {"train_loss": -5.8297624588012695, "global_step": 51452, "epoch": 1225} {"train_loss": -5.7845258712768555, "global_step": 51453, "epoch": 1225} {"train_loss": -5.780667781829834, "global_step": 51454, "epoch": 1225} {"train_loss": -5.8004961013793945, "global_step": 51455, "epoch": 1225} {"train_loss": -5.845028400421143, "global_step": 51456, "epoch": 1225} {"train_loss": -5.736513137817383, "global_step": 51457, "epoch": 1225} {"train_loss": -5.858545303344727, "global_step": 51458, "epoch": 1225} {"train_loss": -5.816022872924805, "global_step": 51459, "epoch": 1225} {"train_loss": -5.72462272644043, "global_step": 51460, "epoch": 1225} {"train_loss": -5.870583534240723, "global_step": 51461, "epoch": 1225} {"train_loss": -5.7769036293029785, "global_step": 51462, "epoch": 1225} {"train_loss": -5.778159141540527, "global_step": 51463, "epoch": 1225} {"train_loss": -5.792364597320557, "global_step": 51464, "epoch": 1225} {"train_loss": -5.82330322265625, "global_step": 51465, "epoch": 1225} {"train_loss": -5.657801151275635, "global_step": 51466, "epoch": 1225} {"train_loss": -5.698242664337158, "global_step": 51467, "epoch": 1225} {"train_loss": -5.75899600982666, "global_step": 51468, "epoch": 1225} {"train_loss": -5.834424018859863, "global_step": 51469, "epoch": 1225} {"train_loss": -5.785968780517578, "global_step": 51470, "epoch": 1225} {"train_loss": -5.755566596984863, "global_step": 51471, "epoch": 1225} {"train_loss": -5.8037004470825195, "global_step": 51472, "epoch": 1225} {"train_loss": -5.782852649688721, "global_step": 51473, "epoch": 1225} {"train_loss": -5.78126335144043, "global_step": 51474, "epoch": 1225} {"train_loss": -5.80301570892334, "global_step": 51475, "epoch": 1225} {"train_loss": -5.850303649902344, "global_step": 51476, "epoch": 1225} {"train_loss": -5.836796760559082, "global_step": 51477, "epoch": 1225} {"train_loss": -5.770469665527344, "global_step": 51478, "epoch": 1225} {"train_loss": -5.739889144897461, "global_step": 51479, "epoch": 1225} {"train_loss": -5.910246849060059, "global_step": 51480, "epoch": 1225} {"train_loss": -5.78061056137085, "global_step": 51481, "epoch": 1225} {"train_loss": -5.777596473693848, "global_step": 51482, "epoch": 1225} {"train_loss": -5.76607608795166, "global_step": 51483, "epoch": 1225} {"train_loss": -5.80056619644165, "global_step": 51484, "epoch": 1225} {"train_loss": -5.732886791229248, "global_step": 51485, "epoch": 1225} {"train_loss": -5.967449188232422, "global_step": 51486, "epoch": 1225} {"train_loss": -5.758783340454102, "global_step": 51487, "epoch": 1225} {"train_loss": -5.896109580993652, "global_step": 51488, "epoch": 1225} {"train_loss": -5.746604919433594, "global_step": 51489, "epoch": 1225} {"train_loss": -5.7340593338012695, "global_step": 51490, "epoch": 1225} {"train_loss": -5.798987195605323, "global_step": 51491, "epoch": 1225, "val_loss": 74042.6171875} {"train_loss": -5.794822692871094, "global_step": 51492, "epoch": 1226} {"train_loss": -5.799524307250977, "global_step": 51493, "epoch": 1226} {"train_loss": -6.023176670074463, "global_step": 51494, "epoch": 1226} {"train_loss": -5.842874526977539, "global_step": 51495, "epoch": 1226} {"train_loss": -5.821927070617676, "global_step": 51496, "epoch": 1226} {"train_loss": -5.9043803215026855, "global_step": 51497, "epoch": 1226} {"train_loss": -5.8289875984191895, "global_step": 51498, "epoch": 1226} {"train_loss": -5.885276794433594, "global_step": 51499, "epoch": 1226} {"train_loss": -5.834827423095703, "global_step": 51500, "epoch": 1226} {"train_loss": -5.836320877075195, "global_step": 51501, "epoch": 1226} {"train_loss": -5.923816680908203, "global_step": 51502, "epoch": 1226} {"train_loss": -5.662289142608643, "global_step": 51503, "epoch": 1226} {"train_loss": -5.7755866050720215, "global_step": 51504, "epoch": 1226} {"train_loss": -5.797244548797607, "global_step": 51505, "epoch": 1226} {"train_loss": -5.875215530395508, "global_step": 51506, "epoch": 1226} {"train_loss": -5.825418472290039, "global_step": 51507, "epoch": 1226} {"train_loss": -5.862419128417969, "global_step": 51508, "epoch": 1226} {"train_loss": -5.833300590515137, "global_step": 51509, "epoch": 1226} {"train_loss": -5.821023941040039, "global_step": 51510, "epoch": 1226} {"train_loss": -5.641576766967773, "global_step": 51511, "epoch": 1226} {"train_loss": -5.730376243591309, "global_step": 51512, "epoch": 1226} {"train_loss": -5.807169437408447, "global_step": 51513, "epoch": 1226} {"train_loss": -5.746583938598633, "global_step": 51514, "epoch": 1226} {"train_loss": -5.784566402435303, "global_step": 51515, "epoch": 1226} {"train_loss": -5.739994049072266, "global_step": 51516, "epoch": 1226} {"train_loss": -5.6328864097595215, "global_step": 51517, "epoch": 1226} {"train_loss": -5.823618412017822, "global_step": 51518, "epoch": 1226} {"train_loss": -5.775180816650391, "global_step": 51519, "epoch": 1226} {"train_loss": -5.71155309677124, "global_step": 51520, "epoch": 1226} {"train_loss": -5.866879940032959, "global_step": 51521, "epoch": 1226} {"train_loss": -5.672837257385254, "global_step": 51522, "epoch": 1226} {"train_loss": -5.7771711349487305, "global_step": 51523, "epoch": 1226} {"train_loss": -5.868194580078125, "global_step": 51524, "epoch": 1226} {"train_loss": -5.728975296020508, "global_step": 51525, "epoch": 1226} {"train_loss": -5.708735466003418, "global_step": 51526, "epoch": 1226} {"train_loss": -5.869583606719971, "global_step": 51527, "epoch": 1226} {"train_loss": -5.786941051483154, "global_step": 51528, "epoch": 1226} {"train_loss": -5.763817310333252, "global_step": 51529, "epoch": 1226} {"train_loss": -5.729553699493408, "global_step": 51530, "epoch": 1226} {"train_loss": -5.813599586486816, "global_step": 51531, "epoch": 1226} {"train_loss": -5.8078765869140625, "global_step": 51532, "epoch": 1226} {"train_loss": -5.799466348829723, "global_step": 51533, "epoch": 1226, "val_loss": 74182.03125} {"train_loss": -5.727647304534912, "global_step": 51534, "epoch": 1227} {"train_loss": -5.851024150848389, "global_step": 51535, "epoch": 1227} {"train_loss": -5.918622970581055, "global_step": 51536, "epoch": 1227} {"train_loss": -5.864205837249756, "global_step": 51537, "epoch": 1227} {"train_loss": -5.867109298706055, "global_step": 51538, "epoch": 1227} {"train_loss": -5.734949588775635, "global_step": 51539, "epoch": 1227} {"train_loss": -5.687593460083008, "global_step": 51540, "epoch": 1227} {"train_loss": -5.833016395568848, "global_step": 51541, "epoch": 1227} {"train_loss": -5.708018779754639, "global_step": 51542, "epoch": 1227} {"train_loss": -5.767367362976074, "global_step": 51543, "epoch": 1227} {"train_loss": -5.9626007080078125, "global_step": 51544, "epoch": 1227} {"train_loss": -5.692594528198242, "global_step": 51545, "epoch": 1227} {"train_loss": -5.650243282318115, "global_step": 51546, "epoch": 1227} {"train_loss": -5.7713141441345215, "global_step": 51547, "epoch": 1227} {"train_loss": -5.829097270965576, "global_step": 51548, "epoch": 1227} {"train_loss": -5.7746262550354, "global_step": 51549, "epoch": 1227} {"train_loss": -5.810728073120117, "global_step": 51550, "epoch": 1227} {"train_loss": -5.884718894958496, "global_step": 51551, "epoch": 1227} {"train_loss": -5.733401298522949, "global_step": 51552, "epoch": 1227} {"train_loss": -5.777660369873047, "global_step": 51553, "epoch": 1227} {"train_loss": -5.764385223388672, "global_step": 51554, "epoch": 1227} {"train_loss": -5.788668632507324, "global_step": 51555, "epoch": 1227} {"train_loss": -5.820272445678711, "global_step": 51556, "epoch": 1227} {"train_loss": -5.687530517578125, "global_step": 51557, "epoch": 1227} {"train_loss": -5.7779951095581055, "global_step": 51558, "epoch": 1227} {"train_loss": -5.6879496574401855, "global_step": 51559, "epoch": 1227} {"train_loss": -5.8445611000061035, "global_step": 51560, "epoch": 1227} {"train_loss": -5.824838638305664, "global_step": 51561, "epoch": 1227} {"train_loss": -5.8589324951171875, "global_step": 51562, "epoch": 1227} {"train_loss": -5.785702705383301, "global_step": 51563, "epoch": 1227} {"train_loss": -5.77243709564209, "global_step": 51564, "epoch": 1227} {"train_loss": -5.786390781402588, "global_step": 51565, "epoch": 1227} {"train_loss": -5.775295257568359, "global_step": 51566, "epoch": 1227} {"train_loss": -5.713558673858643, "global_step": 51567, "epoch": 1227} {"train_loss": -5.740004062652588, "global_step": 51568, "epoch": 1227} {"train_loss": -5.796879768371582, "global_step": 51569, "epoch": 1227} {"train_loss": -5.823287010192871, "global_step": 51570, "epoch": 1227} {"train_loss": -5.682084083557129, "global_step": 51571, "epoch": 1227} {"train_loss": -5.772113800048828, "global_step": 51572, "epoch": 1227} {"train_loss": -5.708687782287598, "global_step": 51573, "epoch": 1227} {"train_loss": -5.851263999938965, "global_step": 51574, "epoch": 1227} {"train_loss": -5.783134437742687, "global_step": 51575, "epoch": 1227, "val_loss": 74530.53125} {"train_loss": -5.817677974700928, "global_step": 51576, "epoch": 1228} {"train_loss": -5.803696632385254, "global_step": 51577, "epoch": 1228} {"train_loss": -5.835691452026367, "global_step": 51578, "epoch": 1228} {"train_loss": -5.7501373291015625, "global_step": 51579, "epoch": 1228} {"train_loss": -5.722502708435059, "global_step": 51580, "epoch": 1228} {"train_loss": -5.8946709632873535, "global_step": 51581, "epoch": 1228} {"train_loss": -5.757480144500732, "global_step": 51582, "epoch": 1228} {"train_loss": -5.809105396270752, "global_step": 51583, "epoch": 1228} {"train_loss": -5.773354530334473, "global_step": 51584, "epoch": 1228} {"train_loss": -5.808439254760742, "global_step": 51585, "epoch": 1228} {"train_loss": -5.837224960327148, "global_step": 51586, "epoch": 1228} {"train_loss": -5.5896992683410645, "global_step": 51587, "epoch": 1228} {"train_loss": -5.690157413482666, "global_step": 51588, "epoch": 1228} {"train_loss": -5.812469482421875, "global_step": 51589, "epoch": 1228} {"train_loss": -5.8506927490234375, "global_step": 51590, "epoch": 1228} {"train_loss": -5.808428764343262, "global_step": 51591, "epoch": 1228} {"train_loss": -5.675782203674316, "global_step": 51592, "epoch": 1228} {"train_loss": -5.760616302490234, "global_step": 51593, "epoch": 1228} {"train_loss": -5.79920768737793, "global_step": 51594, "epoch": 1228} {"train_loss": -5.7539472579956055, "global_step": 51595, "epoch": 1228} {"train_loss": -5.867718696594238, "global_step": 51596, "epoch": 1228} {"train_loss": -5.766462326049805, "global_step": 51597, "epoch": 1228} {"train_loss": -5.829217433929443, "global_step": 51598, "epoch": 1228} {"train_loss": -5.912362575531006, "global_step": 51599, "epoch": 1228} {"train_loss": -5.6627607345581055, "global_step": 51600, "epoch": 1228} {"train_loss": -5.871757984161377, "global_step": 51601, "epoch": 1228} {"train_loss": -5.793230056762695, "global_step": 51602, "epoch": 1228} {"train_loss": -5.7690749168396, "global_step": 51603, "epoch": 1228} {"train_loss": -5.762073040008545, "global_step": 51604, "epoch": 1228} {"train_loss": -5.807098388671875, "global_step": 51605, "epoch": 1228} {"train_loss": -5.789437294006348, "global_step": 51606, "epoch": 1228} {"train_loss": -5.836799621582031, "global_step": 51607, "epoch": 1228} {"train_loss": -5.686349868774414, "global_step": 51608, "epoch": 1228} {"train_loss": -5.711984634399414, "global_step": 51609, "epoch": 1228} {"train_loss": -5.739065170288086, "global_step": 51610, "epoch": 1228} {"train_loss": -5.605740070343018, "global_step": 51611, "epoch": 1228} {"train_loss": -5.7816948890686035, "global_step": 51612, "epoch": 1228} {"train_loss": -5.6847686767578125, "global_step": 51613, "epoch": 1228} {"train_loss": -5.744564056396484, "global_step": 51614, "epoch": 1228} {"train_loss": -5.77391242980957, "global_step": 51615, "epoch": 1228} {"train_loss": -5.758416175842285, "global_step": 51616, "epoch": 1228} {"train_loss": -5.773072753633771, "global_step": 51617, "epoch": 1228, "val_loss": 74607.15625} {"train_loss": -5.688230514526367, "global_step": 51618, "epoch": 1229} {"train_loss": -5.874972820281982, "global_step": 51619, "epoch": 1229} {"train_loss": -5.659547328948975, "global_step": 51620, "epoch": 1229} {"train_loss": -5.663710117340088, "global_step": 51621, "epoch": 1229} {"train_loss": -5.8176469802856445, "global_step": 51622, "epoch": 1229} {"train_loss": -5.698988914489746, "global_step": 51623, "epoch": 1229} {"train_loss": -5.8188252449035645, "global_step": 51624, "epoch": 1229} {"train_loss": -5.7362213134765625, "global_step": 51625, "epoch": 1229} {"train_loss": -5.771121501922607, "global_step": 51626, "epoch": 1229} {"train_loss": -5.682648181915283, "global_step": 51627, "epoch": 1229} {"train_loss": -5.774006366729736, "global_step": 51628, "epoch": 1229} {"train_loss": -5.712968826293945, "global_step": 51629, "epoch": 1229} {"train_loss": -5.8717756271362305, "global_step": 51630, "epoch": 1229} {"train_loss": -5.791665077209473, "global_step": 51631, "epoch": 1229} {"train_loss": -5.877096652984619, "global_step": 51632, "epoch": 1229} {"train_loss": -5.876965522766113, "global_step": 51633, "epoch": 1229} {"train_loss": -5.7345781326293945, "global_step": 51634, "epoch": 1229} {"train_loss": -5.756148338317871, "global_step": 51635, "epoch": 1229} {"train_loss": -5.776569366455078, "global_step": 51636, "epoch": 1229} {"train_loss": -5.724025726318359, "global_step": 51637, "epoch": 1229} {"train_loss": -5.802220344543457, "global_step": 51638, "epoch": 1229} {"train_loss": -5.810420513153076, "global_step": 51639, "epoch": 1229} {"train_loss": -5.70134162902832, "global_step": 51640, "epoch": 1229} {"train_loss": -5.66738224029541, "global_step": 51641, "epoch": 1229} {"train_loss": -5.8648271560668945, "global_step": 51642, "epoch": 1229} {"train_loss": -5.729792594909668, "global_step": 51643, "epoch": 1229} {"train_loss": -5.836185932159424, "global_step": 51644, "epoch": 1229} {"train_loss": -5.754824161529541, "global_step": 51645, "epoch": 1229} {"train_loss": -5.724481582641602, "global_step": 51646, "epoch": 1229} {"train_loss": -5.781391620635986, "global_step": 51647, "epoch": 1229} {"train_loss": -5.768206596374512, "global_step": 51648, "epoch": 1229} {"train_loss": -5.698298454284668, "global_step": 51649, "epoch": 1229} {"train_loss": -5.676517963409424, "global_step": 51650, "epoch": 1229} {"train_loss": -5.647868633270264, "global_step": 51651, "epoch": 1229} {"train_loss": -5.719146728515625, "global_step": 51652, "epoch": 1229} {"train_loss": -5.760589599609375, "global_step": 51653, "epoch": 1229} {"train_loss": -5.740952968597412, "global_step": 51654, "epoch": 1229} {"train_loss": -5.725557327270508, "global_step": 51655, "epoch": 1229} {"train_loss": -5.761757850646973, "global_step": 51656, "epoch": 1229} {"train_loss": -5.829013347625732, "global_step": 51657, "epoch": 1229} {"train_loss": -5.844570636749268, "global_step": 51658, "epoch": 1229} {"train_loss": -5.758645511808849, "global_step": 51659, "epoch": 1229, "val_loss": 74621.515625} {"train_loss": -5.76276969909668, "global_step": 51660, "epoch": 1230} {"train_loss": -5.830146312713623, "global_step": 51661, "epoch": 1230} {"train_loss": -5.697267532348633, "global_step": 51662, "epoch": 1230} {"train_loss": -5.81276798248291, "global_step": 51663, "epoch": 1230} {"train_loss": -5.812809467315674, "global_step": 51664, "epoch": 1230} {"train_loss": -5.848475456237793, "global_step": 51665, "epoch": 1230} {"train_loss": -5.900753498077393, "global_step": 51666, "epoch": 1230} {"train_loss": -5.5912766456604, "global_step": 51667, "epoch": 1230} {"train_loss": -5.901006698608398, "global_step": 51668, "epoch": 1230} {"train_loss": -5.7781195640563965, "global_step": 51669, "epoch": 1230} {"train_loss": -5.704263210296631, "global_step": 51670, "epoch": 1230} {"train_loss": -5.834284782409668, "global_step": 51671, "epoch": 1230} {"train_loss": -5.913904190063477, "global_step": 51672, "epoch": 1230} {"train_loss": -5.804194450378418, "global_step": 51673, "epoch": 1230} {"train_loss": -5.81601619720459, "global_step": 51674, "epoch": 1230} {"train_loss": -5.7208571434021, "global_step": 51675, "epoch": 1230} {"train_loss": -5.7474188804626465, "global_step": 51676, "epoch": 1230} {"train_loss": -5.934525489807129, "global_step": 51677, "epoch": 1230} {"train_loss": -5.631080150604248, "global_step": 51678, "epoch": 1230} {"train_loss": -5.813665390014648, "global_step": 51679, "epoch": 1230} {"train_loss": -5.734842777252197, "global_step": 51680, "epoch": 1230} {"train_loss": -5.835115909576416, "global_step": 51681, "epoch": 1230} {"train_loss": -5.833415985107422, "global_step": 51682, "epoch": 1230} {"train_loss": -5.729321479797363, "global_step": 51683, "epoch": 1230} {"train_loss": -5.795407772064209, "global_step": 51684, "epoch": 1230} {"train_loss": -5.823910713195801, "global_step": 51685, "epoch": 1230} {"train_loss": -5.825735092163086, "global_step": 51686, "epoch": 1230} {"train_loss": -5.77269983291626, "global_step": 51687, "epoch": 1230} {"train_loss": -5.583420753479004, "global_step": 51688, "epoch": 1230} {"train_loss": -5.731807708740234, "global_step": 51689, "epoch": 1230} {"train_loss": -5.75521993637085, "global_step": 51690, "epoch": 1230} {"train_loss": -5.729705810546875, "global_step": 51691, "epoch": 1230} {"train_loss": -5.752995491027832, "global_step": 51692, "epoch": 1230} {"train_loss": -5.884239196777344, "global_step": 51693, "epoch": 1230} {"train_loss": -5.728977203369141, "global_step": 51694, "epoch": 1230} {"train_loss": -5.837333679199219, "global_step": 51695, "epoch": 1230} {"train_loss": -5.7363457679748535, "global_step": 51696, "epoch": 1230} {"train_loss": -5.806384563446045, "global_step": 51697, "epoch": 1230} {"train_loss": -5.67937707901001, "global_step": 51698, "epoch": 1230} {"train_loss": -5.585541248321533, "global_step": 51699, "epoch": 1230} {"train_loss": -5.762916564941406, "global_step": 51700, "epoch": 1230} {"train_loss": -5.775283734003703, "global_step": 51701, "epoch": 1230, "val_loss": 74209.5078125} {"train_loss": -5.707599639892578, "global_step": 51702, "epoch": 1231} {"train_loss": -5.8704681396484375, "global_step": 51703, "epoch": 1231} {"train_loss": -5.804009914398193, "global_step": 51704, "epoch": 1231} {"train_loss": -5.863478660583496, "global_step": 51705, "epoch": 1231} {"train_loss": -5.753035545349121, "global_step": 51706, "epoch": 1231} {"train_loss": -5.628268241882324, "global_step": 51707, "epoch": 1231} {"train_loss": -5.78596830368042, "global_step": 51708, "epoch": 1231} {"train_loss": -5.710010051727295, "global_step": 51709, "epoch": 1231} {"train_loss": -5.806895732879639, "global_step": 51710, "epoch": 1231} {"train_loss": -5.83774471282959, "global_step": 51711, "epoch": 1231} {"train_loss": -5.830150604248047, "global_step": 51712, "epoch": 1231} {"train_loss": -5.629895210266113, "global_step": 51713, "epoch": 1231} {"train_loss": -5.940756797790527, "global_step": 51714, "epoch": 1231} {"train_loss": -5.734291076660156, "global_step": 51715, "epoch": 1231} {"train_loss": -5.790849685668945, "global_step": 51716, "epoch": 1231} {"train_loss": -5.628431797027588, "global_step": 51717, "epoch": 1231} {"train_loss": -5.741739273071289, "global_step": 51718, "epoch": 1231} {"train_loss": -5.759888648986816, "global_step": 51719, "epoch": 1231} {"train_loss": -5.847403049468994, "global_step": 51720, "epoch": 1231} {"train_loss": -5.761092185974121, "global_step": 51721, "epoch": 1231} {"train_loss": -5.727155685424805, "global_step": 51722, "epoch": 1231} {"train_loss": -5.769513130187988, "global_step": 51723, "epoch": 1231} {"train_loss": -5.77889347076416, "global_step": 51724, "epoch": 1231} {"train_loss": -5.879545211791992, "global_step": 51725, "epoch": 1231} {"train_loss": -5.837250709533691, "global_step": 51726, "epoch": 1231} {"train_loss": -5.760754585266113, "global_step": 51727, "epoch": 1231} {"train_loss": -5.689872741699219, "global_step": 51728, "epoch": 1231} {"train_loss": -5.703039169311523, "global_step": 51729, "epoch": 1231} {"train_loss": -5.734127044677734, "global_step": 51730, "epoch": 1231} {"train_loss": -5.81156063079834, "global_step": 51731, "epoch": 1231} {"train_loss": -5.848092079162598, "global_step": 51732, "epoch": 1231} {"train_loss": -5.75335693359375, "global_step": 51733, "epoch": 1231} {"train_loss": -5.85181188583374, "global_step": 51734, "epoch": 1231} {"train_loss": -5.7183518409729, "global_step": 51735, "epoch": 1231} {"train_loss": -5.766273021697998, "global_step": 51736, "epoch": 1231} {"train_loss": -5.762302875518799, "global_step": 51737, "epoch": 1231} {"train_loss": -5.749367713928223, "global_step": 51738, "epoch": 1231} {"train_loss": -5.850470066070557, "global_step": 51739, "epoch": 1231} {"train_loss": -5.80658483505249, "global_step": 51740, "epoch": 1231} {"train_loss": -5.755582809448242, "global_step": 51741, "epoch": 1231} {"train_loss": -5.937911033630371, "global_step": 51742, "epoch": 1231} {"train_loss": -5.778840950557163, "global_step": 51743, "epoch": 1231, "val_loss": 74045.9375} {"train_loss": -5.773390769958496, "global_step": 51744, "epoch": 1232} {"train_loss": -5.824695587158203, "global_step": 51745, "epoch": 1232} {"train_loss": -5.781932830810547, "global_step": 51746, "epoch": 1232} {"train_loss": -5.830862522125244, "global_step": 51747, "epoch": 1232} {"train_loss": -5.923827171325684, "global_step": 51748, "epoch": 1232} {"train_loss": -5.729434967041016, "global_step": 51749, "epoch": 1232} {"train_loss": -5.852489471435547, "global_step": 51750, "epoch": 1232} {"train_loss": -5.796419143676758, "global_step": 51751, "epoch": 1232} {"train_loss": -5.823552131652832, "global_step": 51752, "epoch": 1232} {"train_loss": -5.831085205078125, "global_step": 51753, "epoch": 1232} {"train_loss": -5.821455955505371, "global_step": 51754, "epoch": 1232} {"train_loss": -5.735032081604004, "global_step": 51755, "epoch": 1232} {"train_loss": -5.79509162902832, "global_step": 51756, "epoch": 1232} {"train_loss": -5.686137676239014, "global_step": 51757, "epoch": 1232} {"train_loss": -5.997610092163086, "global_step": 51758, "epoch": 1232} {"train_loss": -5.8758649826049805, "global_step": 51759, "epoch": 1232} {"train_loss": -5.658617973327637, "global_step": 51760, "epoch": 1232} {"train_loss": -5.831851959228516, "global_step": 51761, "epoch": 1232} {"train_loss": -5.80671501159668, "global_step": 51762, "epoch": 1232} {"train_loss": -5.756357192993164, "global_step": 51763, "epoch": 1232} {"train_loss": -5.665432929992676, "global_step": 51764, "epoch": 1232} {"train_loss": -5.621601104736328, "global_step": 51765, "epoch": 1232} {"train_loss": -5.692685127258301, "global_step": 51766, "epoch": 1232} {"train_loss": -5.71272087097168, "global_step": 51767, "epoch": 1232} {"train_loss": -5.681538105010986, "global_step": 51768, "epoch": 1232} {"train_loss": -5.806544303894043, "global_step": 51769, "epoch": 1232} {"train_loss": -5.7758073806762695, "global_step": 51770, "epoch": 1232} {"train_loss": -5.645854473114014, "global_step": 51771, "epoch": 1232} {"train_loss": -5.706077575683594, "global_step": 51772, "epoch": 1232} {"train_loss": -5.743889808654785, "global_step": 51773, "epoch": 1232} {"train_loss": -5.731100082397461, "global_step": 51774, "epoch": 1232} {"train_loss": -5.73927640914917, "global_step": 51775, "epoch": 1232} {"train_loss": -5.834718704223633, "global_step": 51776, "epoch": 1232} {"train_loss": -5.683426380157471, "global_step": 51777, "epoch": 1232} {"train_loss": -5.654892444610596, "global_step": 51778, "epoch": 1232} {"train_loss": -5.831604957580566, "global_step": 51779, "epoch": 1232} {"train_loss": -5.707533359527588, "global_step": 51780, "epoch": 1232} {"train_loss": -5.711568832397461, "global_step": 51781, "epoch": 1232} {"train_loss": -5.788135528564453, "global_step": 51782, "epoch": 1232} {"train_loss": -5.776815414428711, "global_step": 51783, "epoch": 1232} {"train_loss": -5.873167514801025, "global_step": 51784, "epoch": 1232} {"train_loss": -5.7685163134620305, "global_step": 51785, "epoch": 1232, "val_loss": 74014.828125} {"train_loss": -5.885166645050049, "global_step": 51786, "epoch": 1233} {"train_loss": -5.913852691650391, "global_step": 51787, "epoch": 1233} {"train_loss": -5.712024688720703, "global_step": 51788, "epoch": 1233} {"train_loss": -5.821432113647461, "global_step": 51789, "epoch": 1233} {"train_loss": -5.838422775268555, "global_step": 51790, "epoch": 1233} {"train_loss": -5.849177837371826, "global_step": 51791, "epoch": 1233} {"train_loss": -5.78170108795166, "global_step": 51792, "epoch": 1233} {"train_loss": -5.864016532897949, "global_step": 51793, "epoch": 1233} {"train_loss": -5.721906661987305, "global_step": 51794, "epoch": 1233} {"train_loss": -5.753440856933594, "global_step": 51795, "epoch": 1233} {"train_loss": -5.648834705352783, "global_step": 51796, "epoch": 1233} {"train_loss": -5.741669178009033, "global_step": 51797, "epoch": 1233} {"train_loss": -5.836513996124268, "global_step": 51798, "epoch": 1233} {"train_loss": -5.682881832122803, "global_step": 51799, "epoch": 1233} {"train_loss": -5.666199684143066, "global_step": 51800, "epoch": 1233} {"train_loss": -5.727434158325195, "global_step": 51801, "epoch": 1233} {"train_loss": -5.663590431213379, "global_step": 51802, "epoch": 1233} {"train_loss": -5.705564022064209, "global_step": 51803, "epoch": 1233} {"train_loss": -5.671331405639648, "global_step": 51804, "epoch": 1233} {"train_loss": -5.747140407562256, "global_step": 51805, "epoch": 1233} {"train_loss": -5.710130214691162, "global_step": 51806, "epoch": 1233} {"train_loss": -5.687875747680664, "global_step": 51807, "epoch": 1233} {"train_loss": -5.673535346984863, "global_step": 51808, "epoch": 1233} {"train_loss": -5.672572135925293, "global_step": 51809, "epoch": 1233} {"train_loss": -5.69821310043335, "global_step": 51810, "epoch": 1233} {"train_loss": -5.713833808898926, "global_step": 51811, "epoch": 1233} {"train_loss": -5.74267053604126, "global_step": 51812, "epoch": 1233} {"train_loss": -5.595834732055664, "global_step": 51813, "epoch": 1233} {"train_loss": -5.7430830001831055, "global_step": 51814, "epoch": 1233} {"train_loss": -5.536368370056152, "global_step": 51815, "epoch": 1233} {"train_loss": -5.691219329833984, "global_step": 51816, "epoch": 1233} {"train_loss": -5.672957420349121, "global_step": 51817, "epoch": 1233} {"train_loss": -5.716252326965332, "global_step": 51818, "epoch": 1233} {"train_loss": -5.748152256011963, "global_step": 51819, "epoch": 1233} {"train_loss": -5.674482345581055, "global_step": 51820, "epoch": 1233} {"train_loss": -5.584934234619141, "global_step": 51821, "epoch": 1233} {"train_loss": -5.70028018951416, "global_step": 51822, "epoch": 1233} {"train_loss": -5.5607194900512695, "global_step": 51823, "epoch": 1233} {"train_loss": -5.661859512329102, "global_step": 51824, "epoch": 1233} {"train_loss": -5.693149566650391, "global_step": 51825, "epoch": 1233} {"train_loss": -5.592514514923096, "global_step": 51826, "epoch": 1233} {"train_loss": -5.715622163954235, "global_step": 51827, "epoch": 1233, "val_loss": 75657.21875} {"train_loss": -5.561359405517578, "global_step": 51828, "epoch": 1234} {"train_loss": -5.677844047546387, "global_step": 51829, "epoch": 1234} {"train_loss": -5.71695613861084, "global_step": 51830, "epoch": 1234} {"train_loss": -5.766417503356934, "global_step": 51831, "epoch": 1234} {"train_loss": -5.697713375091553, "global_step": 51832, "epoch": 1234} {"train_loss": -5.65882682800293, "global_step": 51833, "epoch": 1234} {"train_loss": -5.702350616455078, "global_step": 51834, "epoch": 1234} {"train_loss": -5.692507743835449, "global_step": 51835, "epoch": 1234} {"train_loss": -5.816971302032471, "global_step": 51836, "epoch": 1234} {"train_loss": -5.716769695281982, "global_step": 51837, "epoch": 1234} {"train_loss": -5.753861427307129, "global_step": 51838, "epoch": 1234} {"train_loss": -5.731603622436523, "global_step": 51839, "epoch": 1234} {"train_loss": -5.746367454528809, "global_step": 51840, "epoch": 1234} {"train_loss": -5.704188346862793, "global_step": 51841, "epoch": 1234} {"train_loss": -5.74770975112915, "global_step": 51842, "epoch": 1234} {"train_loss": -5.73940896987915, "global_step": 51843, "epoch": 1234} {"train_loss": -5.829341888427734, "global_step": 51844, "epoch": 1234} {"train_loss": -5.618500709533691, "global_step": 51845, "epoch": 1234} {"train_loss": -5.680957317352295, "global_step": 51846, "epoch": 1234} {"train_loss": -5.74343204498291, "global_step": 51847, "epoch": 1234} {"train_loss": -5.775625705718994, "global_step": 51848, "epoch": 1234} {"train_loss": -5.840154647827148, "global_step": 51849, "epoch": 1234} {"train_loss": -5.652616500854492, "global_step": 51850, "epoch": 1234} {"train_loss": -5.787507057189941, "global_step": 51851, "epoch": 1234} {"train_loss": -5.735705852508545, "global_step": 51852, "epoch": 1234} {"train_loss": -5.82807731628418, "global_step": 51853, "epoch": 1234} {"train_loss": -5.696053981781006, "global_step": 51854, "epoch": 1234} {"train_loss": -5.7087860107421875, "global_step": 51855, "epoch": 1234} {"train_loss": -5.90994930267334, "global_step": 51856, "epoch": 1234} {"train_loss": -5.689053058624268, "global_step": 51857, "epoch": 1234} {"train_loss": -5.825291156768799, "global_step": 51858, "epoch": 1234} {"train_loss": -5.722053527832031, "global_step": 51859, "epoch": 1234} {"train_loss": -5.749139785766602, "global_step": 51860, "epoch": 1234} {"train_loss": -5.886321067810059, "global_step": 51861, "epoch": 1234} {"train_loss": -5.870124816894531, "global_step": 51862, "epoch": 1234} {"train_loss": -5.880414009094238, "global_step": 51863, "epoch": 1234} {"train_loss": -5.83525276184082, "global_step": 51864, "epoch": 1234} {"train_loss": -5.899206161499023, "global_step": 51865, "epoch": 1234} {"train_loss": -5.895305156707764, "global_step": 51866, "epoch": 1234} {"train_loss": -5.845947265625, "global_step": 51867, "epoch": 1234} {"train_loss": -5.755865097045898, "global_step": 51868, "epoch": 1234} {"train_loss": -5.760211660748436, "global_step": 51869, "epoch": 1234, "val_loss": 74283.796875} {"train_loss": -5.78393030166626, "global_step": 51870, "epoch": 1235} {"train_loss": -5.682754039764404, "global_step": 51871, "epoch": 1235} {"train_loss": -5.726616859436035, "global_step": 51872, "epoch": 1235} {"train_loss": -5.80844783782959, "global_step": 51873, "epoch": 1235} {"train_loss": -5.698348045349121, "global_step": 51874, "epoch": 1235} {"train_loss": -5.7595109939575195, "global_step": 51875, "epoch": 1235} {"train_loss": -5.8201422691345215, "global_step": 51876, "epoch": 1235} {"train_loss": -5.582559585571289, "global_step": 51877, "epoch": 1235} {"train_loss": -5.7390336990356445, "global_step": 51878, "epoch": 1235} {"train_loss": -5.788974761962891, "global_step": 51879, "epoch": 1235} {"train_loss": -5.682738780975342, "global_step": 51880, "epoch": 1235} {"train_loss": -5.713883876800537, "global_step": 51881, "epoch": 1235} {"train_loss": -5.562406539916992, "global_step": 51882, "epoch": 1235} {"train_loss": -5.710733890533447, "global_step": 51883, "epoch": 1235} {"train_loss": -5.635989189147949, "global_step": 51884, "epoch": 1235} {"train_loss": -5.834866046905518, "global_step": 51885, "epoch": 1235} {"train_loss": -5.637584209442139, "global_step": 51886, "epoch": 1235} {"train_loss": -5.754081726074219, "global_step": 51887, "epoch": 1235} {"train_loss": -5.643694877624512, "global_step": 51888, "epoch": 1235} {"train_loss": -5.795591354370117, "global_step": 51889, "epoch": 1235} {"train_loss": -5.645488739013672, "global_step": 51890, "epoch": 1235} {"train_loss": -5.7708940505981445, "global_step": 51891, "epoch": 1235} {"train_loss": -5.643115997314453, "global_step": 51892, "epoch": 1235} {"train_loss": -5.8361921310424805, "global_step": 51893, "epoch": 1235} {"train_loss": -5.680758476257324, "global_step": 51894, "epoch": 1235} {"train_loss": -5.834141731262207, "global_step": 51895, "epoch": 1235} {"train_loss": -5.7067108154296875, "global_step": 51896, "epoch": 1235} {"train_loss": -5.727372646331787, "global_step": 51897, "epoch": 1235} {"train_loss": -5.682316780090332, "global_step": 51898, "epoch": 1235} {"train_loss": -5.770503997802734, "global_step": 51899, "epoch": 1235} {"train_loss": -5.77347469329834, "global_step": 51900, "epoch": 1235} {"train_loss": -5.8863372802734375, "global_step": 51901, "epoch": 1235} {"train_loss": -5.788069248199463, "global_step": 51902, "epoch": 1235} {"train_loss": -5.638646602630615, "global_step": 51903, "epoch": 1235} {"train_loss": -5.830690383911133, "global_step": 51904, "epoch": 1235} {"train_loss": -5.777347087860107, "global_step": 51905, "epoch": 1235} {"train_loss": -5.833461284637451, "global_step": 51906, "epoch": 1235} {"train_loss": -5.763761520385742, "global_step": 51907, "epoch": 1235} {"train_loss": -5.842836856842041, "global_step": 51908, "epoch": 1235} {"train_loss": -5.870724678039551, "global_step": 51909, "epoch": 1235} {"train_loss": -5.724752426147461, "global_step": 51910, "epoch": 1235} {"train_loss": -5.742660874412174, "global_step": 51911, "epoch": 1235, "val_loss": 74184.4609375} {"train_loss": -5.90365743637085, "global_step": 51912, "epoch": 1236} {"train_loss": -5.905875205993652, "global_step": 51913, "epoch": 1236} {"train_loss": -5.968188762664795, "global_step": 51914, "epoch": 1236} {"train_loss": -5.834964752197266, "global_step": 51915, "epoch": 1236} {"train_loss": -5.861564636230469, "global_step": 51916, "epoch": 1236} {"train_loss": -5.832381248474121, "global_step": 51917, "epoch": 1236} {"train_loss": -5.898099422454834, "global_step": 51918, "epoch": 1236} {"train_loss": -5.838480472564697, "global_step": 51919, "epoch": 1236} {"train_loss": -5.862993240356445, "global_step": 51920, "epoch": 1236} {"train_loss": -5.788775444030762, "global_step": 51921, "epoch": 1236} {"train_loss": -5.804303169250488, "global_step": 51922, "epoch": 1236} {"train_loss": -5.720733165740967, "global_step": 51923, "epoch": 1236} {"train_loss": -5.868912220001221, "global_step": 51924, "epoch": 1236} {"train_loss": -5.803234100341797, "global_step": 51925, "epoch": 1236} {"train_loss": -5.751742362976074, "global_step": 51926, "epoch": 1236} {"train_loss": -5.737288475036621, "global_step": 51927, "epoch": 1236} {"train_loss": -5.69156551361084, "global_step": 51928, "epoch": 1236} {"train_loss": -5.724409103393555, "global_step": 51929, "epoch": 1236} {"train_loss": -5.657623291015625, "global_step": 51930, "epoch": 1236} {"train_loss": -5.934404373168945, "global_step": 51931, "epoch": 1236} {"train_loss": -5.630862712860107, "global_step": 51932, "epoch": 1236} {"train_loss": -5.797133922576904, "global_step": 51933, "epoch": 1236} {"train_loss": -5.843456268310547, "global_step": 51934, "epoch": 1236} {"train_loss": -5.62169075012207, "global_step": 51935, "epoch": 1236} {"train_loss": -5.839058876037598, "global_step": 51936, "epoch": 1236} {"train_loss": -5.693127155303955, "global_step": 51937, "epoch": 1236} {"train_loss": -5.751936912536621, "global_step": 51938, "epoch": 1236} {"train_loss": -5.683341026306152, "global_step": 51939, "epoch": 1236} {"train_loss": -5.8348493576049805, "global_step": 51940, "epoch": 1236} {"train_loss": -5.794869899749756, "global_step": 51941, "epoch": 1236} {"train_loss": -5.714423179626465, "global_step": 51942, "epoch": 1236} {"train_loss": -5.807483673095703, "global_step": 51943, "epoch": 1236} {"train_loss": -5.851191997528076, "global_step": 51944, "epoch": 1236} {"train_loss": -5.741369247436523, "global_step": 51945, "epoch": 1236} {"train_loss": -5.852336883544922, "global_step": 51946, "epoch": 1236} {"train_loss": -5.69477653503418, "global_step": 51947, "epoch": 1236} {"train_loss": -5.939902305603027, "global_step": 51948, "epoch": 1236} {"train_loss": -5.895431041717529, "global_step": 51949, "epoch": 1236} {"train_loss": -5.755470275878906, "global_step": 51950, "epoch": 1236} {"train_loss": -5.872032165527344, "global_step": 51951, "epoch": 1236} {"train_loss": -5.687017440795898, "global_step": 51952, "epoch": 1236} {"train_loss": -5.796553293863933, "global_step": 51953, "epoch": 1236, "val_loss": 73923.9296875} {"train_loss": -5.917245864868164, "global_step": 51954, "epoch": 1237} {"train_loss": -5.851710319519043, "global_step": 51955, "epoch": 1237} {"train_loss": -5.865195274353027, "global_step": 51956, "epoch": 1237} {"train_loss": -5.813131332397461, "global_step": 51957, "epoch": 1237} {"train_loss": -5.761434555053711, "global_step": 51958, "epoch": 1237} {"train_loss": -5.713212966918945, "global_step": 51959, "epoch": 1237} {"train_loss": -5.834649562835693, "global_step": 51960, "epoch": 1237} {"train_loss": -5.729375839233398, "global_step": 51961, "epoch": 1237} {"train_loss": -5.88580322265625, "global_step": 51962, "epoch": 1237} {"train_loss": -5.76114559173584, "global_step": 51963, "epoch": 1237} {"train_loss": -5.732635974884033, "global_step": 51964, "epoch": 1237} {"train_loss": -5.760961055755615, "global_step": 51965, "epoch": 1237} {"train_loss": -5.804959297180176, "global_step": 51966, "epoch": 1237} {"train_loss": -5.726214408874512, "global_step": 51967, "epoch": 1237} {"train_loss": -5.847352027893066, "global_step": 51968, "epoch": 1237} {"train_loss": -5.74652624130249, "global_step": 51969, "epoch": 1237} {"train_loss": -5.75914192199707, "global_step": 51970, "epoch": 1237} {"train_loss": -5.8193464279174805, "global_step": 51971, "epoch": 1237} {"train_loss": -5.840620040893555, "global_step": 51972, "epoch": 1237} {"train_loss": -5.683393478393555, "global_step": 51973, "epoch": 1237} {"train_loss": -5.779781341552734, "global_step": 51974, "epoch": 1237} {"train_loss": -5.696372032165527, "global_step": 51975, "epoch": 1237} {"train_loss": -5.814375877380371, "global_step": 51976, "epoch": 1237} {"train_loss": -5.726064682006836, "global_step": 51977, "epoch": 1237} {"train_loss": -5.751772880554199, "global_step": 51978, "epoch": 1237} {"train_loss": -5.686861515045166, "global_step": 51979, "epoch": 1237} {"train_loss": -5.732865810394287, "global_step": 51980, "epoch": 1237} {"train_loss": -5.6833600997924805, "global_step": 51981, "epoch": 1237} {"train_loss": -5.5937910079956055, "global_step": 51982, "epoch": 1237} {"train_loss": -5.742610454559326, "global_step": 51983, "epoch": 1237} {"train_loss": -5.862526893615723, "global_step": 51984, "epoch": 1237} {"train_loss": -5.814355850219727, "global_step": 51985, "epoch": 1237} {"train_loss": -5.793087005615234, "global_step": 51986, "epoch": 1237} {"train_loss": -5.718034267425537, "global_step": 51987, "epoch": 1237} {"train_loss": -5.87199592590332, "global_step": 51988, "epoch": 1237} {"train_loss": -5.788331508636475, "global_step": 51989, "epoch": 1237} {"train_loss": -5.79022216796875, "global_step": 51990, "epoch": 1237} {"train_loss": -5.795290946960449, "global_step": 51991, "epoch": 1237} {"train_loss": -5.621857643127441, "global_step": 51992, "epoch": 1237} {"train_loss": -5.862317085266113, "global_step": 51993, "epoch": 1237} {"train_loss": -5.785582542419434, "global_step": 51994, "epoch": 1237} {"train_loss": -5.774435860770089, "global_step": 51995, "epoch": 1237, "val_loss": 74378.171875} {"train_loss": -5.8033671379089355, "global_step": 51996, "epoch": 1238} {"train_loss": -5.649101257324219, "global_step": 51997, "epoch": 1238} {"train_loss": -5.732062816619873, "global_step": 51998, "epoch": 1238} {"train_loss": -5.898771286010742, "global_step": 51999, "epoch": 1238} {"train_loss": -5.877925872802734, "global_step": 52000, "epoch": 1238} {"train_loss": -5.844790458679199, "global_step": 52001, "epoch": 1238} {"train_loss": -5.812196731567383, "global_step": 52002, "epoch": 1238} {"train_loss": -5.894521236419678, "global_step": 52003, "epoch": 1238} {"train_loss": -5.802062511444092, "global_step": 52004, "epoch": 1238} {"train_loss": -5.861700057983398, "global_step": 52005, "epoch": 1238} {"train_loss": -5.84332275390625, "global_step": 52006, "epoch": 1238} {"train_loss": -5.837514877319336, "global_step": 52007, "epoch": 1238} {"train_loss": -5.702996253967285, "global_step": 52008, "epoch": 1238} {"train_loss": -5.739540100097656, "global_step": 52009, "epoch": 1238} {"train_loss": -5.857895851135254, "global_step": 52010, "epoch": 1238} {"train_loss": -5.641602516174316, "global_step": 52011, "epoch": 1238} {"train_loss": -5.820398330688477, "global_step": 52012, "epoch": 1238} {"train_loss": -5.786990165710449, "global_step": 52013, "epoch": 1238} {"train_loss": -5.6852946281433105, "global_step": 52014, "epoch": 1238} {"train_loss": -5.833077907562256, "global_step": 52015, "epoch": 1238} {"train_loss": -5.799490451812744, "global_step": 52016, "epoch": 1238} {"train_loss": -5.859017372131348, "global_step": 52017, "epoch": 1238} {"train_loss": -5.929337501525879, "global_step": 52018, "epoch": 1238} {"train_loss": -5.812221050262451, "global_step": 52019, "epoch": 1238} {"train_loss": -5.81825590133667, "global_step": 52020, "epoch": 1238} {"train_loss": -5.8584160804748535, "global_step": 52021, "epoch": 1238} {"train_loss": -5.855278491973877, "global_step": 52022, "epoch": 1238} {"train_loss": -5.811289310455322, "global_step": 52023, "epoch": 1238} {"train_loss": -5.793998718261719, "global_step": 52024, "epoch": 1238} {"train_loss": -5.775959014892578, "global_step": 52025, "epoch": 1238} {"train_loss": -5.880959510803223, "global_step": 52026, "epoch": 1238} {"train_loss": -5.771579742431641, "global_step": 52027, "epoch": 1238} {"train_loss": -5.697997570037842, "global_step": 52028, "epoch": 1238} {"train_loss": -5.65959358215332, "global_step": 52029, "epoch": 1238} {"train_loss": -5.698630332946777, "global_step": 52030, "epoch": 1238} {"train_loss": -5.724392890930176, "global_step": 52031, "epoch": 1238} {"train_loss": -5.895520210266113, "global_step": 52032, "epoch": 1238} {"train_loss": -5.8301191329956055, "global_step": 52033, "epoch": 1238} {"train_loss": -5.814571380615234, "global_step": 52034, "epoch": 1238} {"train_loss": -5.796581745147705, "global_step": 52035, "epoch": 1238} {"train_loss": -5.726969242095947, "global_step": 52036, "epoch": 1238} {"train_loss": -5.801227580933344, "global_step": 52037, "epoch": 1238, "val_loss": 74834.90625} {"train_loss": -5.739238739013672, "global_step": 52038, "epoch": 1239} {"train_loss": -5.781003952026367, "global_step": 52039, "epoch": 1239} {"train_loss": -5.767455101013184, "global_step": 52040, "epoch": 1239} {"train_loss": -5.7956109046936035, "global_step": 52041, "epoch": 1239} {"train_loss": -5.864776611328125, "global_step": 52042, "epoch": 1239} {"train_loss": -5.836866855621338, "global_step": 52043, "epoch": 1239} {"train_loss": -5.842720031738281, "global_step": 52044, "epoch": 1239} {"train_loss": -5.862021446228027, "global_step": 52045, "epoch": 1239} {"train_loss": -5.7439446449279785, "global_step": 52046, "epoch": 1239} {"train_loss": -5.6584792137146, "global_step": 52047, "epoch": 1239} {"train_loss": -5.8029279708862305, "global_step": 52048, "epoch": 1239} {"train_loss": -5.844050407409668, "global_step": 52049, "epoch": 1239} {"train_loss": -5.68366813659668, "global_step": 52050, "epoch": 1239} {"train_loss": -5.906235694885254, "global_step": 52051, "epoch": 1239} {"train_loss": -5.729977607727051, "global_step": 52052, "epoch": 1239} {"train_loss": -5.686731338500977, "global_step": 52053, "epoch": 1239} {"train_loss": -5.741279602050781, "global_step": 52054, "epoch": 1239} {"train_loss": -5.76310920715332, "global_step": 52055, "epoch": 1239} {"train_loss": -5.784290790557861, "global_step": 52056, "epoch": 1239} {"train_loss": -5.752593994140625, "global_step": 52057, "epoch": 1239} {"train_loss": -5.6786322593688965, "global_step": 52058, "epoch": 1239} {"train_loss": -5.791526794433594, "global_step": 52059, "epoch": 1239} {"train_loss": -5.810459136962891, "global_step": 52060, "epoch": 1239} {"train_loss": -5.776273727416992, "global_step": 52061, "epoch": 1239} {"train_loss": -5.750548839569092, "global_step": 52062, "epoch": 1239} {"train_loss": -5.884734153747559, "global_step": 52063, "epoch": 1239} {"train_loss": -5.803745269775391, "global_step": 52064, "epoch": 1239} {"train_loss": -5.772174835205078, "global_step": 52065, "epoch": 1239} {"train_loss": -5.809422016143799, "global_step": 52066, "epoch": 1239} {"train_loss": -5.771602630615234, "global_step": 52067, "epoch": 1239} {"train_loss": -5.818849086761475, "global_step": 52068, "epoch": 1239} {"train_loss": -5.840810775756836, "global_step": 52069, "epoch": 1239} {"train_loss": -5.815568923950195, "global_step": 52070, "epoch": 1239} {"train_loss": -5.828609943389893, "global_step": 52071, "epoch": 1239} {"train_loss": -5.70207405090332, "global_step": 52072, "epoch": 1239} {"train_loss": -5.759270668029785, "global_step": 52073, "epoch": 1239} {"train_loss": -5.880946159362793, "global_step": 52074, "epoch": 1239} {"train_loss": -5.947307586669922, "global_step": 52075, "epoch": 1239} {"train_loss": -5.7515387535095215, "global_step": 52076, "epoch": 1239} {"train_loss": -5.832683563232422, "global_step": 52077, "epoch": 1239} {"train_loss": -5.812995433807373, "global_step": 52078, "epoch": 1239} {"train_loss": -5.791772740227835, "global_step": 52079, "epoch": 1239, "val_loss": 74602.1484375} {"train_loss": -5.780943870544434, "global_step": 52080, "epoch": 1240} {"train_loss": -5.738463401794434, "global_step": 52081, "epoch": 1240} {"train_loss": -5.8778204917907715, "global_step": 52082, "epoch": 1240} {"train_loss": -5.863918304443359, "global_step": 52083, "epoch": 1240} {"train_loss": -5.741395950317383, "global_step": 52084, "epoch": 1240} {"train_loss": -5.83447265625, "global_step": 52085, "epoch": 1240} {"train_loss": -5.7269439697265625, "global_step": 52086, "epoch": 1240} {"train_loss": -5.8790693283081055, "global_step": 52087, "epoch": 1240} {"train_loss": -5.873513698577881, "global_step": 52088, "epoch": 1240} {"train_loss": -5.757567405700684, "global_step": 52089, "epoch": 1240} {"train_loss": -5.8573150634765625, "global_step": 52090, "epoch": 1240} {"train_loss": -5.892035961151123, "global_step": 52091, "epoch": 1240} {"train_loss": -5.649662494659424, "global_step": 52092, "epoch": 1240} {"train_loss": -5.789708614349365, "global_step": 52093, "epoch": 1240} {"train_loss": -5.928712368011475, "global_step": 52094, "epoch": 1240} {"train_loss": -5.7780442237854, "global_step": 52095, "epoch": 1240} {"train_loss": -5.83156681060791, "global_step": 52096, "epoch": 1240} {"train_loss": -5.720781326293945, "global_step": 52097, "epoch": 1240} {"train_loss": -5.852070331573486, "global_step": 52098, "epoch": 1240} {"train_loss": -5.813785552978516, "global_step": 52099, "epoch": 1240} {"train_loss": -5.8357977867126465, "global_step": 52100, "epoch": 1240} {"train_loss": -5.810094833374023, "global_step": 52101, "epoch": 1240} {"train_loss": -5.697093486785889, "global_step": 52102, "epoch": 1240} {"train_loss": -5.742168426513672, "global_step": 52103, "epoch": 1240} {"train_loss": -5.861169815063477, "global_step": 52104, "epoch": 1240} {"train_loss": -5.698521137237549, "global_step": 52105, "epoch": 1240} {"train_loss": -5.778690338134766, "global_step": 52106, "epoch": 1240} {"train_loss": -5.790347099304199, "global_step": 52107, "epoch": 1240} {"train_loss": -5.804091930389404, "global_step": 52108, "epoch": 1240} {"train_loss": -5.754370212554932, "global_step": 52109, "epoch": 1240} {"train_loss": -5.822264194488525, "global_step": 52110, "epoch": 1240} {"train_loss": -5.782646179199219, "global_step": 52111, "epoch": 1240} {"train_loss": -5.636379718780518, "global_step": 52112, "epoch": 1240} {"train_loss": -5.959524631500244, "global_step": 52113, "epoch": 1240} {"train_loss": -5.802570343017578, "global_step": 52114, "epoch": 1240} {"train_loss": -5.712255477905273, "global_step": 52115, "epoch": 1240} {"train_loss": -5.8826904296875, "global_step": 52116, "epoch": 1240} {"train_loss": -5.808549404144287, "global_step": 52117, "epoch": 1240} {"train_loss": -5.954211235046387, "global_step": 52118, "epoch": 1240} {"train_loss": -5.7782511711120605, "global_step": 52119, "epoch": 1240} {"train_loss": -5.70866584777832, "global_step": 52120, "epoch": 1240} {"train_loss": -5.79921080952599, "global_step": 52121, "epoch": 1240, "val_loss": 74442.578125} {"train_loss": -5.73814582824707, "global_step": 52122, "epoch": 1241} {"train_loss": -5.776984214782715, "global_step": 52123, "epoch": 1241} {"train_loss": -5.880115509033203, "global_step": 52124, "epoch": 1241} {"train_loss": -5.757585525512695, "global_step": 52125, "epoch": 1241} {"train_loss": -5.802467346191406, "global_step": 52126, "epoch": 1241} {"train_loss": -5.894495964050293, "global_step": 52127, "epoch": 1241} {"train_loss": -5.8555450439453125, "global_step": 52128, "epoch": 1241} {"train_loss": -5.85962438583374, "global_step": 52129, "epoch": 1241} {"train_loss": -5.890139102935791, "global_step": 52130, "epoch": 1241} {"train_loss": -5.738611698150635, "global_step": 52131, "epoch": 1241} {"train_loss": -5.824336051940918, "global_step": 52132, "epoch": 1241} {"train_loss": -5.854337692260742, "global_step": 52133, "epoch": 1241} {"train_loss": -5.862421989440918, "global_step": 52134, "epoch": 1241} {"train_loss": -5.71199369430542, "global_step": 52135, "epoch": 1241} {"train_loss": -5.7359089851379395, "global_step": 52136, "epoch": 1241} {"train_loss": -5.841433525085449, "global_step": 52137, "epoch": 1241} {"train_loss": -5.687062740325928, "global_step": 52138, "epoch": 1241} {"train_loss": -5.898897171020508, "global_step": 52139, "epoch": 1241} {"train_loss": -5.826568603515625, "global_step": 52140, "epoch": 1241} {"train_loss": -5.717453956604004, "global_step": 52141, "epoch": 1241} {"train_loss": -5.85888147354126, "global_step": 52142, "epoch": 1241} {"train_loss": -5.811166763305664, "global_step": 52143, "epoch": 1241} {"train_loss": -5.9463300704956055, "global_step": 52144, "epoch": 1241} {"train_loss": -5.786066055297852, "global_step": 52145, "epoch": 1241} {"train_loss": -5.762784957885742, "global_step": 52146, "epoch": 1241} {"train_loss": -5.795736312866211, "global_step": 52147, "epoch": 1241} {"train_loss": -5.959708213806152, "global_step": 52148, "epoch": 1241} {"train_loss": -5.731307506561279, "global_step": 52149, "epoch": 1241} {"train_loss": -5.7414326667785645, "global_step": 52150, "epoch": 1241} {"train_loss": -5.829798698425293, "global_step": 52151, "epoch": 1241} {"train_loss": -5.798159122467041, "global_step": 52152, "epoch": 1241} {"train_loss": -5.741840362548828, "global_step": 52153, "epoch": 1241} {"train_loss": -5.701803207397461, "global_step": 52154, "epoch": 1241} {"train_loss": -5.77349328994751, "global_step": 52155, "epoch": 1241} {"train_loss": -5.691727638244629, "global_step": 52156, "epoch": 1241} {"train_loss": -5.765027046203613, "global_step": 52157, "epoch": 1241} {"train_loss": -5.680657863616943, "global_step": 52158, "epoch": 1241} {"train_loss": -5.8423333168029785, "global_step": 52159, "epoch": 1241} {"train_loss": -5.682835578918457, "global_step": 52160, "epoch": 1241} {"train_loss": -5.7309675216674805, "global_step": 52161, "epoch": 1241} {"train_loss": -5.758806228637695, "global_step": 52162, "epoch": 1241} {"train_loss": -5.793169180552165, "global_step": 52163, "epoch": 1241, "val_loss": 74646.421875} {"train_loss": -5.877405166625977, "global_step": 52164, "epoch": 1242} {"train_loss": -5.777421951293945, "global_step": 52165, "epoch": 1242} {"train_loss": -5.708745956420898, "global_step": 52166, "epoch": 1242} {"train_loss": -5.737003326416016, "global_step": 52167, "epoch": 1242} {"train_loss": -5.84743595123291, "global_step": 52168, "epoch": 1242} {"train_loss": -5.792810440063477, "global_step": 52169, "epoch": 1242} {"train_loss": -5.779374122619629, "global_step": 52170, "epoch": 1242} {"train_loss": -5.759646415710449, "global_step": 52171, "epoch": 1242} {"train_loss": -5.745001792907715, "global_step": 52172, "epoch": 1242} {"train_loss": -5.687973976135254, "global_step": 52173, "epoch": 1242} {"train_loss": -5.877458095550537, "global_step": 52174, "epoch": 1242} {"train_loss": -5.724061489105225, "global_step": 52175, "epoch": 1242} {"train_loss": -5.8055419921875, "global_step": 52176, "epoch": 1242} {"train_loss": -5.707158088684082, "global_step": 52177, "epoch": 1242} {"train_loss": -5.867998123168945, "global_step": 52178, "epoch": 1242} {"train_loss": -5.742529392242432, "global_step": 52179, "epoch": 1242} {"train_loss": -5.8088274002075195, "global_step": 52180, "epoch": 1242} {"train_loss": -5.825409889221191, "global_step": 52181, "epoch": 1242} {"train_loss": -5.835649013519287, "global_step": 52182, "epoch": 1242} {"train_loss": -5.920802116394043, "global_step": 52183, "epoch": 1242} {"train_loss": -5.764848709106445, "global_step": 52184, "epoch": 1242} {"train_loss": -5.671789169311523, "global_step": 52185, "epoch": 1242} {"train_loss": -5.87545108795166, "global_step": 52186, "epoch": 1242} {"train_loss": -5.8898234367370605, "global_step": 52187, "epoch": 1242} {"train_loss": -5.708071708679199, "global_step": 52188, "epoch": 1242} {"train_loss": -5.781455993652344, "global_step": 52189, "epoch": 1242} {"train_loss": -5.649007797241211, "global_step": 52190, "epoch": 1242} {"train_loss": -5.717331409454346, "global_step": 52191, "epoch": 1242} {"train_loss": -5.762063026428223, "global_step": 52192, "epoch": 1242} {"train_loss": -5.741906642913818, "global_step": 52193, "epoch": 1242} {"train_loss": -5.788939952850342, "global_step": 52194, "epoch": 1242} {"train_loss": -5.788616180419922, "global_step": 52195, "epoch": 1242} {"train_loss": -5.733590126037598, "global_step": 52196, "epoch": 1242} {"train_loss": -5.635573387145996, "global_step": 52197, "epoch": 1242} {"train_loss": -5.803471565246582, "global_step": 52198, "epoch": 1242} {"train_loss": -5.820180416107178, "global_step": 52199, "epoch": 1242} {"train_loss": -5.637347221374512, "global_step": 52200, "epoch": 1242} {"train_loss": -5.957265853881836, "global_step": 52201, "epoch": 1242} {"train_loss": -5.771756172180176, "global_step": 52202, "epoch": 1242} {"train_loss": -5.707615852355957, "global_step": 52203, "epoch": 1242} {"train_loss": -5.770232677459717, "global_step": 52204, "epoch": 1242} {"train_loss": -5.779418275469825, "global_step": 52205, "epoch": 1242, "val_loss": 74816.671875} {"train_loss": -5.7081499099731445, "global_step": 52206, "epoch": 1243} {"train_loss": -5.633932113647461, "global_step": 52207, "epoch": 1243} {"train_loss": -5.7918829917907715, "global_step": 52208, "epoch": 1243} {"train_loss": -5.78850793838501, "global_step": 52209, "epoch": 1243} {"train_loss": -5.871046543121338, "global_step": 52210, "epoch": 1243} {"train_loss": -5.798208713531494, "global_step": 52211, "epoch": 1243} {"train_loss": -5.798084259033203, "global_step": 52212, "epoch": 1243} {"train_loss": -5.876202583312988, "global_step": 52213, "epoch": 1243} {"train_loss": -5.7977118492126465, "global_step": 52214, "epoch": 1243} {"train_loss": -5.688612937927246, "global_step": 52215, "epoch": 1243} {"train_loss": -5.782527923583984, "global_step": 52216, "epoch": 1243} {"train_loss": -5.801292419433594, "global_step": 52217, "epoch": 1243} {"train_loss": -5.7698516845703125, "global_step": 52218, "epoch": 1243} {"train_loss": -5.804288864135742, "global_step": 52219, "epoch": 1243} {"train_loss": -5.860945224761963, "global_step": 52220, "epoch": 1243} {"train_loss": -5.800779819488525, "global_step": 52221, "epoch": 1243} {"train_loss": -5.849287986755371, "global_step": 52222, "epoch": 1243} {"train_loss": -5.892920970916748, "global_step": 52223, "epoch": 1243} {"train_loss": -5.950389862060547, "global_step": 52224, "epoch": 1243} {"train_loss": -5.72973108291626, "global_step": 52225, "epoch": 1243} {"train_loss": -5.706383228302002, "global_step": 52226, "epoch": 1243} {"train_loss": -5.73966646194458, "global_step": 52227, "epoch": 1243} {"train_loss": -5.780147552490234, "global_step": 52228, "epoch": 1243} {"train_loss": -5.844263553619385, "global_step": 52229, "epoch": 1243} {"train_loss": -5.809159278869629, "global_step": 52230, "epoch": 1243} {"train_loss": -5.765005588531494, "global_step": 52231, "epoch": 1243} {"train_loss": -5.685866355895996, "global_step": 52232, "epoch": 1243} {"train_loss": -5.967932224273682, "global_step": 52233, "epoch": 1243} {"train_loss": -5.779509544372559, "global_step": 52234, "epoch": 1243} {"train_loss": -5.768155097961426, "global_step": 52235, "epoch": 1243} {"train_loss": -5.7478227615356445, "global_step": 52236, "epoch": 1243} {"train_loss": -5.729355812072754, "global_step": 52237, "epoch": 1243} {"train_loss": -5.829806327819824, "global_step": 52238, "epoch": 1243} {"train_loss": -5.691612720489502, "global_step": 52239, "epoch": 1243} {"train_loss": -5.794712066650391, "global_step": 52240, "epoch": 1243} {"train_loss": -5.632426738739014, "global_step": 52241, "epoch": 1243} {"train_loss": -5.758969306945801, "global_step": 52242, "epoch": 1243} {"train_loss": -5.7275309562683105, "global_step": 52243, "epoch": 1243} {"train_loss": -5.620086193084717, "global_step": 52244, "epoch": 1243} {"train_loss": -5.722742557525635, "global_step": 52245, "epoch": 1243} {"train_loss": -5.667484283447266, "global_step": 52246, "epoch": 1243} {"train_loss": -5.772543997991653, "global_step": 52247, "epoch": 1243, "val_loss": 74410.3515625} {"train_loss": -5.808720588684082, "global_step": 52248, "epoch": 1244} {"train_loss": -5.720008373260498, "global_step": 52249, "epoch": 1244} {"train_loss": -5.913332939147949, "global_step": 52250, "epoch": 1244} {"train_loss": -5.750131607055664, "global_step": 52251, "epoch": 1244} {"train_loss": -5.6895647048950195, "global_step": 52252, "epoch": 1244} {"train_loss": -5.8337578773498535, "global_step": 52253, "epoch": 1244} {"train_loss": -5.796821594238281, "global_step": 52254, "epoch": 1244} {"train_loss": -5.727538585662842, "global_step": 52255, "epoch": 1244} {"train_loss": -5.857488632202148, "global_step": 52256, "epoch": 1244} {"train_loss": -5.6708478927612305, "global_step": 52257, "epoch": 1244} {"train_loss": -5.8028974533081055, "global_step": 52258, "epoch": 1244} {"train_loss": -5.919904708862305, "global_step": 52259, "epoch": 1244} {"train_loss": -5.794098854064941, "global_step": 52260, "epoch": 1244} {"train_loss": -5.903751373291016, "global_step": 52261, "epoch": 1244} {"train_loss": -5.712353229522705, "global_step": 52262, "epoch": 1244} {"train_loss": -5.852015495300293, "global_step": 52263, "epoch": 1244} {"train_loss": -5.78270959854126, "global_step": 52264, "epoch": 1244} {"train_loss": -5.793992519378662, "global_step": 52265, "epoch": 1244} {"train_loss": -5.817595481872559, "global_step": 52266, "epoch": 1244} {"train_loss": -5.869865417480469, "global_step": 52267, "epoch": 1244} {"train_loss": -5.798673629760742, "global_step": 52268, "epoch": 1244} {"train_loss": -5.80185604095459, "global_step": 52269, "epoch": 1244} {"train_loss": -5.839638710021973, "global_step": 52270, "epoch": 1244} {"train_loss": -5.897792816162109, "global_step": 52271, "epoch": 1244} {"train_loss": -5.860321044921875, "global_step": 52272, "epoch": 1244} {"train_loss": -5.77879524230957, "global_step": 52273, "epoch": 1244} {"train_loss": -5.893144130706787, "global_step": 52274, "epoch": 1244} {"train_loss": -5.869650840759277, "global_step": 52275, "epoch": 1244} {"train_loss": -5.721888065338135, "global_step": 52276, "epoch": 1244} {"train_loss": -5.728898048400879, "global_step": 52277, "epoch": 1244} {"train_loss": -5.738104820251465, "global_step": 52278, "epoch": 1244} {"train_loss": -5.8562822341918945, "global_step": 52279, "epoch": 1244} {"train_loss": -5.918835639953613, "global_step": 52280, "epoch": 1244} {"train_loss": -5.653064727783203, "global_step": 52281, "epoch": 1244} {"train_loss": -5.750616073608398, "global_step": 52282, "epoch": 1244} {"train_loss": -5.784853935241699, "global_step": 52283, "epoch": 1244} {"train_loss": -5.823644161224365, "global_step": 52284, "epoch": 1244} {"train_loss": -5.83035135269165, "global_step": 52285, "epoch": 1244} {"train_loss": -5.881576061248779, "global_step": 52286, "epoch": 1244} {"train_loss": -5.745430946350098, "global_step": 52287, "epoch": 1244} {"train_loss": -5.842669486999512, "global_step": 52288, "epoch": 1244} {"train_loss": -5.806334166299729, "global_step": 52289, "epoch": 1244, "val_loss": 74250.3515625} {"train_loss": -5.743175029754639, "global_step": 52290, "epoch": 1245} {"train_loss": -5.711704730987549, "global_step": 52291, "epoch": 1245} {"train_loss": -5.72072172164917, "global_step": 52292, "epoch": 1245} {"train_loss": -5.758919715881348, "global_step": 52293, "epoch": 1245} {"train_loss": -5.718616485595703, "global_step": 52294, "epoch": 1245} {"train_loss": -5.75730037689209, "global_step": 52295, "epoch": 1245} {"train_loss": -5.861652374267578, "global_step": 52296, "epoch": 1245} {"train_loss": -5.710752487182617, "global_step": 52297, "epoch": 1245} {"train_loss": -5.808704853057861, "global_step": 52298, "epoch": 1245} {"train_loss": -5.807992935180664, "global_step": 52299, "epoch": 1245} {"train_loss": -5.713062763214111, "global_step": 52300, "epoch": 1245} {"train_loss": -5.727904319763184, "global_step": 52301, "epoch": 1245} {"train_loss": -5.649043083190918, "global_step": 52302, "epoch": 1245} {"train_loss": -5.666277885437012, "global_step": 52303, "epoch": 1245} {"train_loss": -5.77932071685791, "global_step": 52304, "epoch": 1245} {"train_loss": -5.795225143432617, "global_step": 52305, "epoch": 1245} {"train_loss": -5.744778633117676, "global_step": 52306, "epoch": 1245} {"train_loss": -5.768567085266113, "global_step": 52307, "epoch": 1245} {"train_loss": -5.730662822723389, "global_step": 52308, "epoch": 1245} {"train_loss": -5.813920974731445, "global_step": 52309, "epoch": 1245} {"train_loss": -5.724565029144287, "global_step": 52310, "epoch": 1245} {"train_loss": -5.854418754577637, "global_step": 52311, "epoch": 1245} {"train_loss": -5.668445587158203, "global_step": 52312, "epoch": 1245} {"train_loss": -5.781932830810547, "global_step": 52313, "epoch": 1245} {"train_loss": -5.786947250366211, "global_step": 52314, "epoch": 1245} {"train_loss": -5.740996360778809, "global_step": 52315, "epoch": 1245} {"train_loss": -5.708049774169922, "global_step": 52316, "epoch": 1245} {"train_loss": -5.669984340667725, "global_step": 52317, "epoch": 1245} {"train_loss": -5.707116603851318, "global_step": 52318, "epoch": 1245} {"train_loss": -5.743722915649414, "global_step": 52319, "epoch": 1245} {"train_loss": -5.77017879486084, "global_step": 52320, "epoch": 1245} {"train_loss": -5.744627952575684, "global_step": 52321, "epoch": 1245} {"train_loss": -5.789542198181152, "global_step": 52322, "epoch": 1245} {"train_loss": -5.730429649353027, "global_step": 52323, "epoch": 1245} {"train_loss": -5.8121843338012695, "global_step": 52324, "epoch": 1245} {"train_loss": -5.736025333404541, "global_step": 52325, "epoch": 1245} {"train_loss": -5.861087799072266, "global_step": 52326, "epoch": 1245} {"train_loss": -5.899711608886719, "global_step": 52327, "epoch": 1245} {"train_loss": -5.752513885498047, "global_step": 52328, "epoch": 1245} {"train_loss": -5.920141220092773, "global_step": 52329, "epoch": 1245} {"train_loss": -5.716814041137695, "global_step": 52330, "epoch": 1245} {"train_loss": -5.75906152952285, "global_step": 52331, "epoch": 1245, "val_loss": 75414.625} {"train_loss": -5.76908540725708, "global_step": 52332, "epoch": 1246} {"train_loss": -5.7703537940979, "global_step": 52333, "epoch": 1246} {"train_loss": -5.826753616333008, "global_step": 52334, "epoch": 1246} {"train_loss": -5.647387981414795, "global_step": 52335, "epoch": 1246} {"train_loss": -5.842859745025635, "global_step": 52336, "epoch": 1246} {"train_loss": -5.730608940124512, "global_step": 52337, "epoch": 1246} {"train_loss": -5.656120300292969, "global_step": 52338, "epoch": 1246} {"train_loss": -5.746035575866699, "global_step": 52339, "epoch": 1246} {"train_loss": -5.783206939697266, "global_step": 52340, "epoch": 1246} {"train_loss": -5.7665510177612305, "global_step": 52341, "epoch": 1246} {"train_loss": -5.633001327514648, "global_step": 52342, "epoch": 1246} {"train_loss": -5.76075553894043, "global_step": 52343, "epoch": 1246} {"train_loss": -5.782735824584961, "global_step": 52344, "epoch": 1246} {"train_loss": -5.676877975463867, "global_step": 52345, "epoch": 1246} {"train_loss": -5.772719860076904, "global_step": 52346, "epoch": 1246} {"train_loss": -5.779252529144287, "global_step": 52347, "epoch": 1246} {"train_loss": -5.895276069641113, "global_step": 52348, "epoch": 1246} {"train_loss": -5.80820369720459, "global_step": 52349, "epoch": 1246} {"train_loss": -5.710782051086426, "global_step": 52350, "epoch": 1246} {"train_loss": -5.775932788848877, "global_step": 52351, "epoch": 1246} {"train_loss": -5.741991996765137, "global_step": 52352, "epoch": 1246} {"train_loss": -5.711885452270508, "global_step": 52353, "epoch": 1246} {"train_loss": -5.765130519866943, "global_step": 52354, "epoch": 1246} {"train_loss": -5.686935901641846, "global_step": 52355, "epoch": 1246} {"train_loss": -5.7990217208862305, "global_step": 52356, "epoch": 1246} {"train_loss": -5.8283891677856445, "global_step": 52357, "epoch": 1246} {"train_loss": -5.809473514556885, "global_step": 52358, "epoch": 1246} {"train_loss": -5.728785514831543, "global_step": 52359, "epoch": 1246} {"train_loss": -5.723575115203857, "global_step": 52360, "epoch": 1246} {"train_loss": -5.754739761352539, "global_step": 52361, "epoch": 1246} {"train_loss": -5.8649582862854, "global_step": 52362, "epoch": 1246} {"train_loss": -5.855767250061035, "global_step": 52363, "epoch": 1246} {"train_loss": -5.869917392730713, "global_step": 52364, "epoch": 1246} {"train_loss": -5.847914695739746, "global_step": 52365, "epoch": 1246} {"train_loss": -5.81669807434082, "global_step": 52366, "epoch": 1246} {"train_loss": -5.86236572265625, "global_step": 52367, "epoch": 1246} {"train_loss": -5.800772666931152, "global_step": 52368, "epoch": 1246} {"train_loss": -5.7464919090271, "global_step": 52369, "epoch": 1246} {"train_loss": -5.809884071350098, "global_step": 52370, "epoch": 1246} {"train_loss": -5.838892936706543, "global_step": 52371, "epoch": 1246} {"train_loss": -5.781864643096924, "global_step": 52372, "epoch": 1246} {"train_loss": -5.779125622340611, "global_step": 52373, "epoch": 1246, "val_loss": 74129.3671875} {"train_loss": -5.834941864013672, "global_step": 52374, "epoch": 1247} {"train_loss": -5.750898361206055, "global_step": 52375, "epoch": 1247} {"train_loss": -5.823567867279053, "global_step": 52376, "epoch": 1247} {"train_loss": -5.856410503387451, "global_step": 52377, "epoch": 1247} {"train_loss": -5.923044681549072, "global_step": 52378, "epoch": 1247} {"train_loss": -5.72472620010376, "global_step": 52379, "epoch": 1247} {"train_loss": -5.753389835357666, "global_step": 52380, "epoch": 1247} {"train_loss": -5.934103012084961, "global_step": 52381, "epoch": 1247} {"train_loss": -5.906562805175781, "global_step": 52382, "epoch": 1247} {"train_loss": -5.905901908874512, "global_step": 52383, "epoch": 1247} {"train_loss": -5.749066352844238, "global_step": 52384, "epoch": 1247} {"train_loss": -5.715307712554932, "global_step": 52385, "epoch": 1247} {"train_loss": -5.679258346557617, "global_step": 52386, "epoch": 1247} {"train_loss": -5.8806986808776855, "global_step": 52387, "epoch": 1247} {"train_loss": -5.794894695281982, "global_step": 52388, "epoch": 1247} {"train_loss": -5.659296035766602, "global_step": 52389, "epoch": 1247} {"train_loss": -5.780551910400391, "global_step": 52390, "epoch": 1247} {"train_loss": -5.743843078613281, "global_step": 52391, "epoch": 1247} {"train_loss": -5.783378601074219, "global_step": 52392, "epoch": 1247} {"train_loss": -5.907169818878174, "global_step": 52393, "epoch": 1247} {"train_loss": -5.816695213317871, "global_step": 52394, "epoch": 1247} {"train_loss": -5.828367710113525, "global_step": 52395, "epoch": 1247} {"train_loss": -5.835197448730469, "global_step": 52396, "epoch": 1247} {"train_loss": -5.678603172302246, "global_step": 52397, "epoch": 1247} {"train_loss": -5.794520378112793, "global_step": 52398, "epoch": 1247} {"train_loss": -5.7458696365356445, "global_step": 52399, "epoch": 1247} {"train_loss": -5.812378406524658, "global_step": 52400, "epoch": 1247} {"train_loss": -5.796440124511719, "global_step": 52401, "epoch": 1247} {"train_loss": -5.780925750732422, "global_step": 52402, "epoch": 1247} {"train_loss": -5.855149269104004, "global_step": 52403, "epoch": 1247} {"train_loss": -5.8069047927856445, "global_step": 52404, "epoch": 1247} {"train_loss": -5.773645401000977, "global_step": 52405, "epoch": 1247} {"train_loss": -5.759526252746582, "global_step": 52406, "epoch": 1247} {"train_loss": -5.6299285888671875, "global_step": 52407, "epoch": 1247} {"train_loss": -5.789007186889648, "global_step": 52408, "epoch": 1247} {"train_loss": -5.722225189208984, "global_step": 52409, "epoch": 1247} {"train_loss": -5.785029411315918, "global_step": 52410, "epoch": 1247} {"train_loss": -5.7085113525390625, "global_step": 52411, "epoch": 1247} {"train_loss": -5.766932487487793, "global_step": 52412, "epoch": 1247} {"train_loss": -5.892192363739014, "global_step": 52413, "epoch": 1247} {"train_loss": -5.781040668487549, "global_step": 52414, "epoch": 1247} {"train_loss": -5.791276261920021, "global_step": 52415, "epoch": 1247, "val_loss": 74471.6796875} {"train_loss": -5.774239540100098, "global_step": 52416, "epoch": 1248} {"train_loss": -5.856057167053223, "global_step": 52417, "epoch": 1248} {"train_loss": -5.795853614807129, "global_step": 52418, "epoch": 1248} {"train_loss": -5.756203651428223, "global_step": 52419, "epoch": 1248} {"train_loss": -5.741407871246338, "global_step": 52420, "epoch": 1248} {"train_loss": -5.8102264404296875, "global_step": 52421, "epoch": 1248} {"train_loss": -5.8155012130737305, "global_step": 52422, "epoch": 1248} {"train_loss": -5.835900783538818, "global_step": 52423, "epoch": 1248} {"train_loss": -5.730684280395508, "global_step": 52424, "epoch": 1248} {"train_loss": -5.794921875, "global_step": 52425, "epoch": 1248} {"train_loss": -5.829597473144531, "global_step": 52426, "epoch": 1248} {"train_loss": -6.0486650466918945, "global_step": 52427, "epoch": 1248} {"train_loss": -5.784924030303955, "global_step": 52428, "epoch": 1248} {"train_loss": -5.677712440490723, "global_step": 52429, "epoch": 1248} {"train_loss": -5.792173385620117, "global_step": 52430, "epoch": 1248} {"train_loss": -5.6900634765625, "global_step": 52431, "epoch": 1248} {"train_loss": -5.704682350158691, "global_step": 52432, "epoch": 1248} {"train_loss": -5.915287971496582, "global_step": 52433, "epoch": 1248} {"train_loss": -5.9280290603637695, "global_step": 52434, "epoch": 1248} {"train_loss": -5.715288162231445, "global_step": 52435, "epoch": 1248} {"train_loss": -5.750083923339844, "global_step": 52436, "epoch": 1248} {"train_loss": -5.791731357574463, "global_step": 52437, "epoch": 1248} {"train_loss": -5.760890007019043, "global_step": 52438, "epoch": 1248} {"train_loss": -5.744976997375488, "global_step": 52439, "epoch": 1248} {"train_loss": -5.819001197814941, "global_step": 52440, "epoch": 1248} {"train_loss": -5.691262245178223, "global_step": 52441, "epoch": 1248} {"train_loss": -5.83240270614624, "global_step": 52442, "epoch": 1248} {"train_loss": -5.683807373046875, "global_step": 52443, "epoch": 1248} {"train_loss": -5.791847229003906, "global_step": 52444, "epoch": 1248} {"train_loss": -5.833774089813232, "global_step": 52445, "epoch": 1248} {"train_loss": -5.719531059265137, "global_step": 52446, "epoch": 1248} {"train_loss": -5.661532878875732, "global_step": 52447, "epoch": 1248} {"train_loss": -5.7978644371032715, "global_step": 52448, "epoch": 1248} {"train_loss": -5.774359703063965, "global_step": 52449, "epoch": 1248} {"train_loss": -5.655246734619141, "global_step": 52450, "epoch": 1248} {"train_loss": -5.787640571594238, "global_step": 52451, "epoch": 1248} {"train_loss": -5.766049385070801, "global_step": 52452, "epoch": 1248} {"train_loss": -5.661191463470459, "global_step": 52453, "epoch": 1248} {"train_loss": -5.850834369659424, "global_step": 52454, "epoch": 1248} {"train_loss": -5.89310359954834, "global_step": 52455, "epoch": 1248} {"train_loss": -5.903685092926025, "global_step": 52456, "epoch": 1248} {"train_loss": -5.787852491651263, "global_step": 52457, "epoch": 1248, "val_loss": 74480.0859375} {"train_loss": -5.804819107055664, "global_step": 52458, "epoch": 1249} {"train_loss": -5.772920608520508, "global_step": 52459, "epoch": 1249} {"train_loss": -5.752109527587891, "global_step": 52460, "epoch": 1249} {"train_loss": -5.851981163024902, "global_step": 52461, "epoch": 1249} {"train_loss": -5.830497741699219, "global_step": 52462, "epoch": 1249} {"train_loss": -5.752861022949219, "global_step": 52463, "epoch": 1249} {"train_loss": -5.726781845092773, "global_step": 52464, "epoch": 1249} {"train_loss": -5.837403297424316, "global_step": 52465, "epoch": 1249} {"train_loss": -5.694914817810059, "global_step": 52466, "epoch": 1249} {"train_loss": -5.803949356079102, "global_step": 52467, "epoch": 1249} {"train_loss": -5.722862243652344, "global_step": 52468, "epoch": 1249} {"train_loss": -5.895059585571289, "global_step": 52469, "epoch": 1249} {"train_loss": -5.677762985229492, "global_step": 52470, "epoch": 1249} {"train_loss": -5.735273361206055, "global_step": 52471, "epoch": 1249} {"train_loss": -5.972107887268066, "global_step": 52472, "epoch": 1249} {"train_loss": -5.76829195022583, "global_step": 52473, "epoch": 1249} {"train_loss": -5.7883524894714355, "global_step": 52474, "epoch": 1249} {"train_loss": -5.782995223999023, "global_step": 52475, "epoch": 1249} {"train_loss": -5.675538063049316, "global_step": 52476, "epoch": 1249} {"train_loss": -5.886502265930176, "global_step": 52477, "epoch": 1249} {"train_loss": -5.673078536987305, "global_step": 52478, "epoch": 1249} {"train_loss": -5.79177188873291, "global_step": 52479, "epoch": 1249} {"train_loss": -5.706386566162109, "global_step": 52480, "epoch": 1249} {"train_loss": -5.6400556564331055, "global_step": 52481, "epoch": 1249} {"train_loss": -5.713061332702637, "global_step": 52482, "epoch": 1249} {"train_loss": -5.712730407714844, "global_step": 52483, "epoch": 1249} {"train_loss": -5.787655353546143, "global_step": 52484, "epoch": 1249} {"train_loss": -5.714829444885254, "global_step": 52485, "epoch": 1249} {"train_loss": -5.722692489624023, "global_step": 52486, "epoch": 1249} {"train_loss": -5.821352005004883, "global_step": 52487, "epoch": 1249} {"train_loss": -5.804862022399902, "global_step": 52488, "epoch": 1249} {"train_loss": -5.739871978759766, "global_step": 52489, "epoch": 1249} {"train_loss": -5.86885929107666, "global_step": 52490, "epoch": 1249} {"train_loss": -5.804155349731445, "global_step": 52491, "epoch": 1249} {"train_loss": -5.699108123779297, "global_step": 52492, "epoch": 1249} {"train_loss": -5.7884674072265625, "global_step": 52493, "epoch": 1249} {"train_loss": -5.795937538146973, "global_step": 52494, "epoch": 1249} {"train_loss": -5.6771721839904785, "global_step": 52495, "epoch": 1249} {"train_loss": -5.716399192810059, "global_step": 52496, "epoch": 1249} {"train_loss": -5.927467346191406, "global_step": 52497, "epoch": 1249} {"train_loss": -5.8069939613342285, "global_step": 52498, "epoch": 1249} {"train_loss": -5.769333033334641, "global_step": 52499, "epoch": 1249, "val_loss": 73915.53125} {"train_loss": -5.775150299072266, "global_step": 52500, "epoch": 1250} {"train_loss": -5.899044036865234, "global_step": 52501, "epoch": 1250} {"train_loss": -5.832876205444336, "global_step": 52502, "epoch": 1250} {"train_loss": -5.837995529174805, "global_step": 52503, "epoch": 1250} {"train_loss": -5.822233200073242, "global_step": 52504, "epoch": 1250} {"train_loss": -5.670536041259766, "global_step": 52505, "epoch": 1250} {"train_loss": -5.728912830352783, "global_step": 52506, "epoch": 1250} {"train_loss": -5.810513496398926, "global_step": 52507, "epoch": 1250} {"train_loss": -5.752970218658447, "global_step": 52508, "epoch": 1250} {"train_loss": -5.855633735656738, "global_step": 52509, "epoch": 1250} {"train_loss": -5.85613489151001, "global_step": 52510, "epoch": 1250} {"train_loss": -5.757701873779297, "global_step": 52511, "epoch": 1250} {"train_loss": -5.908812522888184, "global_step": 52512, "epoch": 1250} {"train_loss": -5.7579240798950195, "global_step": 52513, "epoch": 1250} {"train_loss": -5.9151153564453125, "global_step": 52514, "epoch": 1250} {"train_loss": -5.68508243560791, "global_step": 52515, "epoch": 1250} {"train_loss": -5.789192199707031, "global_step": 52516, "epoch": 1250} {"train_loss": -5.777099609375, "global_step": 52517, "epoch": 1250} {"train_loss": -5.799272537231445, "global_step": 52518, "epoch": 1250} {"train_loss": -5.804441452026367, "global_step": 52519, "epoch": 1250} {"train_loss": -5.765430450439453, "global_step": 52520, "epoch": 1250} {"train_loss": -5.725783348083496, "global_step": 52521, "epoch": 1250} {"train_loss": -5.805542945861816, "global_step": 52522, "epoch": 1250} {"train_loss": -5.684397220611572, "global_step": 52523, "epoch": 1250} {"train_loss": -5.830687999725342, "global_step": 52524, "epoch": 1250} {"train_loss": -5.871714115142822, "global_step": 52525, "epoch": 1250} {"train_loss": -5.665384292602539, "global_step": 52526, "epoch": 1250} {"train_loss": -5.8394775390625, "global_step": 52527, "epoch": 1250} {"train_loss": -5.735065937042236, "global_step": 52528, "epoch": 1250} {"train_loss": -5.901434898376465, "global_step": 52529, "epoch": 1250} {"train_loss": -5.917824745178223, "global_step": 52530, "epoch": 1250} {"train_loss": -5.626741409301758, "global_step": 52531, "epoch": 1250} {"train_loss": -5.877915382385254, "global_step": 52532, "epoch": 1250} {"train_loss": -5.872931003570557, "global_step": 52533, "epoch": 1250} {"train_loss": -5.696907997131348, "global_step": 52534, "epoch": 1250} {"train_loss": -5.872793197631836, "global_step": 52535, "epoch": 1250} {"train_loss": -5.812347412109375, "global_step": 52536, "epoch": 1250} {"train_loss": -5.833313941955566, "global_step": 52537, "epoch": 1250} {"train_loss": -5.765786647796631, "global_step": 52538, "epoch": 1250} {"train_loss": -5.75384521484375, "global_step": 52539, "epoch": 1250} {"train_loss": -5.833273887634277, "global_step": 52540, "epoch": 1250} {"train_loss": -5.800673076084682, "global_step": 52541, "epoch": 1250, "train/sim_max_reward_0": 0.9259781135480892, "train/sim_max_reward_1": 0.6746580938998343, "train/sim_max_reward_2": 0.5658005653574617, "train/sim_max_reward_3": 0.139431250911733, "train/sim_max_reward_4": 0.41891344779878953, "train/sim_max_reward_5": 0.8228751593256236, "test/sim_max_reward_4500000": 0.32023789377064793, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8816345214129429, "test/sim_max_reward_4500003": 0.5972237466696264, "test/sim_max_reward_4500004": 0.05468702709333585, "test/sim_max_reward_4500005": 0.3888866143425817, "test/sim_max_reward_4500006": 0.9263239097216338, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.2822435325270765, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9602953249983891, "test/sim_max_reward_4500012": 0.0, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.35893905115794306, "test/sim_max_reward_4500015": 0.08646417765588638, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0029722537904241235, "test/sim_max_reward_4500018": 0.11908052867523143, "test/sim_max_reward_4500019": 0.8431386075287456, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9270672845457446, "test/sim_max_reward_4500022": 0.8201786885463579, "test/sim_max_reward_4500023": 0.8061637961067525, "test/sim_max_reward_4500024": 0.8807443076837088, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.07957633617312626, "test/sim_max_reward_4500027": 0.9614858977247588, "test/sim_max_reward_4500028": 0.29505293749083633, "test/sim_max_reward_4500029": 0.11410017684410358, "test/sim_max_reward_4500030": 0.8118268178765659, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9499812973782211, "test/sim_max_reward_4500034": 0.7616545494564403, "test/sim_max_reward_4500035": 0.8394761055162682, "test/sim_max_reward_4500036": 0.9699966393176527, "test/sim_max_reward_4500037": 0.9435492984208298, "test/sim_max_reward_4500038": 0.29931139154823827, "test/sim_max_reward_4500039": 0.9593597848286216, "test/sim_max_reward_4500040": 0.9432075476689471, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.22728128382862545, "test/sim_max_reward_4500044": 0.05085184312018397, "test/sim_max_reward_4500045": 0.828260774958561, "test/sim_max_reward_4500046": 0.7778194602037823, "test/sim_max_reward_4500047": 0.8291207547114255, "test/sim_max_reward_4500048": 0.7616162268389777, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5912761051402552, "test/mean_score": 0.4549260737571206, "val_loss": 74124.890625} {"train_loss": -5.887612819671631, "global_step": 52542, "epoch": 1251} {"train_loss": -5.812414169311523, "global_step": 52543, "epoch": 1251} {"train_loss": -5.7581634521484375, "global_step": 52544, "epoch": 1251} {"train_loss": -5.840183258056641, "global_step": 52545, "epoch": 1251} {"train_loss": -5.906391143798828, "global_step": 52546, "epoch": 1251} {"train_loss": -5.891623497009277, "global_step": 52547, "epoch": 1251} {"train_loss": -5.858572006225586, "global_step": 52548, "epoch": 1251} {"train_loss": -5.787996292114258, "global_step": 52549, "epoch": 1251} {"train_loss": -5.752801895141602, "global_step": 52550, "epoch": 1251} {"train_loss": -5.752313613891602, "global_step": 52551, "epoch": 1251} {"train_loss": -5.834548473358154, "global_step": 52552, "epoch": 1251} {"train_loss": -5.668392181396484, "global_step": 52553, "epoch": 1251} {"train_loss": -5.840047359466553, "global_step": 52554, "epoch": 1251} {"train_loss": -5.906425952911377, "global_step": 52555, "epoch": 1251} {"train_loss": -5.812012672424316, "global_step": 52556, "epoch": 1251} {"train_loss": -5.785005569458008, "global_step": 52557, "epoch": 1251} {"train_loss": -5.89516544342041, "global_step": 52558, "epoch": 1251} {"train_loss": -5.7724833488464355, "global_step": 52559, "epoch": 1251} {"train_loss": -5.885745048522949, "global_step": 52560, "epoch": 1251} {"train_loss": -5.807048320770264, "global_step": 52561, "epoch": 1251} {"train_loss": -5.805173397064209, "global_step": 52562, "epoch": 1251} {"train_loss": -5.79918098449707, "global_step": 52563, "epoch": 1251} {"train_loss": -5.832773208618164, "global_step": 52564, "epoch": 1251} {"train_loss": -5.677822113037109, "global_step": 52565, "epoch": 1251} {"train_loss": -5.82060432434082, "global_step": 52566, "epoch": 1251} {"train_loss": -5.750310897827148, "global_step": 52567, "epoch": 1251} {"train_loss": -5.677938461303711, "global_step": 52568, "epoch": 1251} {"train_loss": -5.826013565063477, "global_step": 52569, "epoch": 1251} {"train_loss": -5.633088111877441, "global_step": 52570, "epoch": 1251} {"train_loss": -5.824942111968994, "global_step": 52571, "epoch": 1251} {"train_loss": -5.793222427368164, "global_step": 52572, "epoch": 1251} {"train_loss": -5.707457542419434, "global_step": 52573, "epoch": 1251} {"train_loss": -5.834649085998535, "global_step": 52574, "epoch": 1251} {"train_loss": -5.816475868225098, "global_step": 52575, "epoch": 1251} {"train_loss": -5.809052467346191, "global_step": 52576, "epoch": 1251} {"train_loss": -5.832827091217041, "global_step": 52577, "epoch": 1251} {"train_loss": -5.623294353485107, "global_step": 52578, "epoch": 1251} {"train_loss": -5.790487289428711, "global_step": 52579, "epoch": 1251} {"train_loss": -5.783075332641602, "global_step": 52580, "epoch": 1251} {"train_loss": -5.802873611450195, "global_step": 52581, "epoch": 1251} {"train_loss": -6.02288818359375, "global_step": 52582, "epoch": 1251} {"train_loss": -5.80671307018825, "global_step": 52583, "epoch": 1251, "val_loss": 74184.2734375} {"train_loss": -5.906764984130859, "global_step": 52584, "epoch": 1252} {"train_loss": -5.779954433441162, "global_step": 52585, "epoch": 1252} {"train_loss": -5.898232460021973, "global_step": 52586, "epoch": 1252} {"train_loss": -5.780208587646484, "global_step": 52587, "epoch": 1252} {"train_loss": -5.849605560302734, "global_step": 52588, "epoch": 1252} {"train_loss": -5.960613250732422, "global_step": 52589, "epoch": 1252} {"train_loss": -5.931591987609863, "global_step": 52590, "epoch": 1252} {"train_loss": -5.8682966232299805, "global_step": 52591, "epoch": 1252} {"train_loss": -5.592672348022461, "global_step": 52592, "epoch": 1252} {"train_loss": -5.779537200927734, "global_step": 52593, "epoch": 1252} {"train_loss": -5.8754987716674805, "global_step": 52594, "epoch": 1252} {"train_loss": -5.87879753112793, "global_step": 52595, "epoch": 1252} {"train_loss": -5.807180404663086, "global_step": 52596, "epoch": 1252} {"train_loss": -5.733381748199463, "global_step": 52597, "epoch": 1252} {"train_loss": -5.784945487976074, "global_step": 52598, "epoch": 1252} {"train_loss": -5.734097480773926, "global_step": 52599, "epoch": 1252} {"train_loss": -5.682528495788574, "global_step": 52600, "epoch": 1252} {"train_loss": -5.748736381530762, "global_step": 52601, "epoch": 1252} {"train_loss": -5.840883255004883, "global_step": 52602, "epoch": 1252} {"train_loss": -5.842272758483887, "global_step": 52603, "epoch": 1252} {"train_loss": -5.803967475891113, "global_step": 52604, "epoch": 1252} {"train_loss": -5.937936782836914, "global_step": 52605, "epoch": 1252} {"train_loss": -5.78415584564209, "global_step": 52606, "epoch": 1252} {"train_loss": -5.9203996658325195, "global_step": 52607, "epoch": 1252} {"train_loss": -5.832531929016113, "global_step": 52608, "epoch": 1252} {"train_loss": -5.689101219177246, "global_step": 52609, "epoch": 1252} {"train_loss": -5.681169509887695, "global_step": 52610, "epoch": 1252} {"train_loss": -5.731657028198242, "global_step": 52611, "epoch": 1252} {"train_loss": -5.81939697265625, "global_step": 52612, "epoch": 1252} {"train_loss": -5.829168319702148, "global_step": 52613, "epoch": 1252} {"train_loss": -5.716342926025391, "global_step": 52614, "epoch": 1252} {"train_loss": -5.894478797912598, "global_step": 52615, "epoch": 1252} {"train_loss": -5.794854640960693, "global_step": 52616, "epoch": 1252} {"train_loss": -5.789559364318848, "global_step": 52617, "epoch": 1252} {"train_loss": -5.81544828414917, "global_step": 52618, "epoch": 1252} {"train_loss": -5.853686332702637, "global_step": 52619, "epoch": 1252} {"train_loss": -5.75284481048584, "global_step": 52620, "epoch": 1252} {"train_loss": -5.832785606384277, "global_step": 52621, "epoch": 1252} {"train_loss": -5.800751686096191, "global_step": 52622, "epoch": 1252} {"train_loss": -5.760822296142578, "global_step": 52623, "epoch": 1252} {"train_loss": -5.824158668518066, "global_step": 52624, "epoch": 1252} {"train_loss": -5.8068470273699075, "global_step": 52625, "epoch": 1252, "val_loss": 74152.0546875} {"train_loss": -5.851144313812256, "global_step": 52626, "epoch": 1253} {"train_loss": -5.845974922180176, "global_step": 52627, "epoch": 1253} {"train_loss": -5.8174519538879395, "global_step": 52628, "epoch": 1253} {"train_loss": -5.87110710144043, "global_step": 52629, "epoch": 1253} {"train_loss": -5.720673561096191, "global_step": 52630, "epoch": 1253} {"train_loss": -5.816932678222656, "global_step": 52631, "epoch": 1253} {"train_loss": -5.806607246398926, "global_step": 52632, "epoch": 1253} {"train_loss": -5.77202033996582, "global_step": 52633, "epoch": 1253} {"train_loss": -5.861478805541992, "global_step": 52634, "epoch": 1253} {"train_loss": -5.722561836242676, "global_step": 52635, "epoch": 1253} {"train_loss": -5.749462127685547, "global_step": 52636, "epoch": 1253} {"train_loss": -5.766390800476074, "global_step": 52637, "epoch": 1253} {"train_loss": -5.859562873840332, "global_step": 52638, "epoch": 1253} {"train_loss": -5.758952617645264, "global_step": 52639, "epoch": 1253} {"train_loss": -5.903991222381592, "global_step": 52640, "epoch": 1253} {"train_loss": -5.8644819259643555, "global_step": 52641, "epoch": 1253} {"train_loss": -5.670930862426758, "global_step": 52642, "epoch": 1253} {"train_loss": -5.76993465423584, "global_step": 52643, "epoch": 1253} {"train_loss": -5.6051177978515625, "global_step": 52644, "epoch": 1253} {"train_loss": -5.752495288848877, "global_step": 52645, "epoch": 1253} {"train_loss": -5.787978172302246, "global_step": 52646, "epoch": 1253} {"train_loss": -5.708613395690918, "global_step": 52647, "epoch": 1253} {"train_loss": -5.842669486999512, "global_step": 52648, "epoch": 1253} {"train_loss": -5.852819442749023, "global_step": 52649, "epoch": 1253} {"train_loss": -5.8498687744140625, "global_step": 52650, "epoch": 1253} {"train_loss": -5.7298479080200195, "global_step": 52651, "epoch": 1253} {"train_loss": -5.657229423522949, "global_step": 52652, "epoch": 1253} {"train_loss": -5.714737892150879, "global_step": 52653, "epoch": 1253} {"train_loss": -5.636346817016602, "global_step": 52654, "epoch": 1253} {"train_loss": -5.8960652351379395, "global_step": 52655, "epoch": 1253} {"train_loss": -5.639030456542969, "global_step": 52656, "epoch": 1253} {"train_loss": -5.947853088378906, "global_step": 52657, "epoch": 1253} {"train_loss": -5.7616119384765625, "global_step": 52658, "epoch": 1253} {"train_loss": -5.750748634338379, "global_step": 52659, "epoch": 1253} {"train_loss": -5.713820457458496, "global_step": 52660, "epoch": 1253} {"train_loss": -5.853488922119141, "global_step": 52661, "epoch": 1253} {"train_loss": -5.694626808166504, "global_step": 52662, "epoch": 1253} {"train_loss": -5.771733283996582, "global_step": 52663, "epoch": 1253} {"train_loss": -5.780570030212402, "global_step": 52664, "epoch": 1253} {"train_loss": -5.751948356628418, "global_step": 52665, "epoch": 1253} {"train_loss": -5.738741874694824, "global_step": 52666, "epoch": 1253} {"train_loss": -5.775931732995169, "global_step": 52667, "epoch": 1253, "val_loss": 74322.34375} {"train_loss": -5.839911460876465, "global_step": 52668, "epoch": 1254} {"train_loss": -5.777858734130859, "global_step": 52669, "epoch": 1254} {"train_loss": -5.847105026245117, "global_step": 52670, "epoch": 1254} {"train_loss": -5.82060432434082, "global_step": 52671, "epoch": 1254} {"train_loss": -5.660815715789795, "global_step": 52672, "epoch": 1254} {"train_loss": -5.730849266052246, "global_step": 52673, "epoch": 1254} {"train_loss": -5.904372215270996, "global_step": 52674, "epoch": 1254} {"train_loss": -5.676146507263184, "global_step": 52675, "epoch": 1254} {"train_loss": -5.799766540527344, "global_step": 52676, "epoch": 1254} {"train_loss": -5.577389717102051, "global_step": 52677, "epoch": 1254} {"train_loss": -5.744602203369141, "global_step": 52678, "epoch": 1254} {"train_loss": -5.757044792175293, "global_step": 52679, "epoch": 1254} {"train_loss": -5.7651872634887695, "global_step": 52680, "epoch": 1254} {"train_loss": -5.824651718139648, "global_step": 52681, "epoch": 1254} {"train_loss": -5.737138271331787, "global_step": 52682, "epoch": 1254} {"train_loss": -5.680537700653076, "global_step": 52683, "epoch": 1254} {"train_loss": -5.904297828674316, "global_step": 52684, "epoch": 1254} {"train_loss": -5.717432022094727, "global_step": 52685, "epoch": 1254} {"train_loss": -5.945237636566162, "global_step": 52686, "epoch": 1254} {"train_loss": -5.853438854217529, "global_step": 52687, "epoch": 1254} {"train_loss": -5.851423263549805, "global_step": 52688, "epoch": 1254} {"train_loss": -5.695527076721191, "global_step": 52689, "epoch": 1254} {"train_loss": -5.816396236419678, "global_step": 52690, "epoch": 1254} {"train_loss": -5.696043014526367, "global_step": 52691, "epoch": 1254} {"train_loss": -5.839560508728027, "global_step": 52692, "epoch": 1254} {"train_loss": -5.740329265594482, "global_step": 52693, "epoch": 1254} {"train_loss": -5.785723686218262, "global_step": 52694, "epoch": 1254} {"train_loss": -5.730551242828369, "global_step": 52695, "epoch": 1254} {"train_loss": -5.712713718414307, "global_step": 52696, "epoch": 1254} {"train_loss": -5.696537494659424, "global_step": 52697, "epoch": 1254} {"train_loss": -5.757248878479004, "global_step": 52698, "epoch": 1254} {"train_loss": -5.7842583656311035, "global_step": 52699, "epoch": 1254} {"train_loss": -5.920763969421387, "global_step": 52700, "epoch": 1254} {"train_loss": -5.752158164978027, "global_step": 52701, "epoch": 1254} {"train_loss": -5.8366851806640625, "global_step": 52702, "epoch": 1254} {"train_loss": -5.835735321044922, "global_step": 52703, "epoch": 1254} {"train_loss": -5.7499895095825195, "global_step": 52704, "epoch": 1254} {"train_loss": -5.765061378479004, "global_step": 52705, "epoch": 1254} {"train_loss": -5.724862098693848, "global_step": 52706, "epoch": 1254} {"train_loss": -5.813640594482422, "global_step": 52707, "epoch": 1254} {"train_loss": -5.905970573425293, "global_step": 52708, "epoch": 1254} {"train_loss": -5.778699863524664, "global_step": 52709, "epoch": 1254, "val_loss": 74337.4140625} {"train_loss": -5.829613208770752, "global_step": 52710, "epoch": 1255} {"train_loss": -5.769706726074219, "global_step": 52711, "epoch": 1255} {"train_loss": -5.843110084533691, "global_step": 52712, "epoch": 1255} {"train_loss": -5.803781509399414, "global_step": 52713, "epoch": 1255} {"train_loss": -5.80810546875, "global_step": 52714, "epoch": 1255} {"train_loss": -5.874079704284668, "global_step": 52715, "epoch": 1255} {"train_loss": -5.749352931976318, "global_step": 52716, "epoch": 1255} {"train_loss": -5.798787593841553, "global_step": 52717, "epoch": 1255} {"train_loss": -5.754023551940918, "global_step": 52718, "epoch": 1255} {"train_loss": -5.799561500549316, "global_step": 52719, "epoch": 1255} {"train_loss": -6.008791923522949, "global_step": 52720, "epoch": 1255} {"train_loss": -5.80211067199707, "global_step": 52721, "epoch": 1255} {"train_loss": -5.781045436859131, "global_step": 52722, "epoch": 1255} {"train_loss": -5.860912322998047, "global_step": 52723, "epoch": 1255} {"train_loss": -5.770900726318359, "global_step": 52724, "epoch": 1255} {"train_loss": -5.8878679275512695, "global_step": 52725, "epoch": 1255} {"train_loss": -5.916914463043213, "global_step": 52726, "epoch": 1255} {"train_loss": -5.7496490478515625, "global_step": 52727, "epoch": 1255} {"train_loss": -5.7979912757873535, "global_step": 52728, "epoch": 1255} {"train_loss": -5.844226837158203, "global_step": 52729, "epoch": 1255} {"train_loss": -5.778345584869385, "global_step": 52730, "epoch": 1255} {"train_loss": -5.934726715087891, "global_step": 52731, "epoch": 1255} {"train_loss": -5.796303749084473, "global_step": 52732, "epoch": 1255} {"train_loss": -5.78245210647583, "global_step": 52733, "epoch": 1255} {"train_loss": -5.8636932373046875, "global_step": 52734, "epoch": 1255} {"train_loss": -5.8429718017578125, "global_step": 52735, "epoch": 1255} {"train_loss": -5.921907901763916, "global_step": 52736, "epoch": 1255} {"train_loss": -5.7541303634643555, "global_step": 52737, "epoch": 1255} {"train_loss": -5.795973777770996, "global_step": 52738, "epoch": 1255} {"train_loss": -5.852255821228027, "global_step": 52739, "epoch": 1255} {"train_loss": -5.797903537750244, "global_step": 52740, "epoch": 1255} {"train_loss": -5.781794548034668, "global_step": 52741, "epoch": 1255} {"train_loss": -5.635691165924072, "global_step": 52742, "epoch": 1255} {"train_loss": -5.809139251708984, "global_step": 52743, "epoch": 1255} {"train_loss": -5.948793411254883, "global_step": 52744, "epoch": 1255} {"train_loss": -5.718318462371826, "global_step": 52745, "epoch": 1255} {"train_loss": -5.734016418457031, "global_step": 52746, "epoch": 1255} {"train_loss": -5.662156105041504, "global_step": 52747, "epoch": 1255} {"train_loss": -5.877013206481934, "global_step": 52748, "epoch": 1255} {"train_loss": -5.926100730895996, "global_step": 52749, "epoch": 1255} {"train_loss": -5.8035454750061035, "global_step": 52750, "epoch": 1255} {"train_loss": -5.817718744277954, "global_step": 52751, "epoch": 1255, "val_loss": 74204.3359375} {"train_loss": -5.895636081695557, "global_step": 52752, "epoch": 1256} {"train_loss": -5.77669095993042, "global_step": 52753, "epoch": 1256} {"train_loss": -5.839158535003662, "global_step": 52754, "epoch": 1256} {"train_loss": -5.80906343460083, "global_step": 52755, "epoch": 1256} {"train_loss": -5.881885528564453, "global_step": 52756, "epoch": 1256} {"train_loss": -5.842263221740723, "global_step": 52757, "epoch": 1256} {"train_loss": -5.780035972595215, "global_step": 52758, "epoch": 1256} {"train_loss": -5.740898132324219, "global_step": 52759, "epoch": 1256} {"train_loss": -5.742278099060059, "global_step": 52760, "epoch": 1256} {"train_loss": -5.671642303466797, "global_step": 52761, "epoch": 1256} {"train_loss": -5.813026428222656, "global_step": 52762, "epoch": 1256} {"train_loss": -5.6552934646606445, "global_step": 52763, "epoch": 1256} {"train_loss": -5.657564163208008, "global_step": 52764, "epoch": 1256} {"train_loss": -5.830353736877441, "global_step": 52765, "epoch": 1256} {"train_loss": -5.771634578704834, "global_step": 52766, "epoch": 1256} {"train_loss": -5.666620254516602, "global_step": 52767, "epoch": 1256} {"train_loss": -5.726954460144043, "global_step": 52768, "epoch": 1256} {"train_loss": -5.8743062019348145, "global_step": 52769, "epoch": 1256} {"train_loss": -5.840555191040039, "global_step": 52770, "epoch": 1256} {"train_loss": -5.870394706726074, "global_step": 52771, "epoch": 1256} {"train_loss": -5.813943862915039, "global_step": 52772, "epoch": 1256} {"train_loss": -5.856819152832031, "global_step": 52773, "epoch": 1256} {"train_loss": -5.820878982543945, "global_step": 52774, "epoch": 1256} {"train_loss": -5.778321266174316, "global_step": 52775, "epoch": 1256} {"train_loss": -5.787164211273193, "global_step": 52776, "epoch": 1256} {"train_loss": -5.710814952850342, "global_step": 52777, "epoch": 1256} {"train_loss": -5.764431476593018, "global_step": 52778, "epoch": 1256} {"train_loss": -5.8014702796936035, "global_step": 52779, "epoch": 1256} {"train_loss": -5.795406341552734, "global_step": 52780, "epoch": 1256} {"train_loss": -5.890433311462402, "global_step": 52781, "epoch": 1256} {"train_loss": -5.839699745178223, "global_step": 52782, "epoch": 1256} {"train_loss": -5.815709114074707, "global_step": 52783, "epoch": 1256} {"train_loss": -5.837850570678711, "global_step": 52784, "epoch": 1256} {"train_loss": -5.849663257598877, "global_step": 52785, "epoch": 1256} {"train_loss": -5.780160903930664, "global_step": 52786, "epoch": 1256} {"train_loss": -5.871180534362793, "global_step": 52787, "epoch": 1256} {"train_loss": -5.850945472717285, "global_step": 52788, "epoch": 1256} {"train_loss": -5.8171467781066895, "global_step": 52789, "epoch": 1256} {"train_loss": -5.8529791831970215, "global_step": 52790, "epoch": 1256} {"train_loss": -5.787508964538574, "global_step": 52791, "epoch": 1256} {"train_loss": -5.876237869262695, "global_step": 52792, "epoch": 1256} {"train_loss": -5.801135483242216, "global_step": 52793, "epoch": 1256, "val_loss": 74280.3984375} {"train_loss": -5.759337902069092, "global_step": 52794, "epoch": 1257} {"train_loss": -5.796311378479004, "global_step": 52795, "epoch": 1257} {"train_loss": -5.87601375579834, "global_step": 52796, "epoch": 1257} {"train_loss": -5.860279083251953, "global_step": 52797, "epoch": 1257} {"train_loss": -5.760380744934082, "global_step": 52798, "epoch": 1257} {"train_loss": -5.873641014099121, "global_step": 52799, "epoch": 1257} {"train_loss": -5.740422248840332, "global_step": 52800, "epoch": 1257} {"train_loss": -5.895697593688965, "global_step": 52801, "epoch": 1257} {"train_loss": -5.8351030349731445, "global_step": 52802, "epoch": 1257} {"train_loss": -5.748343467712402, "global_step": 52803, "epoch": 1257} {"train_loss": -5.910130500793457, "global_step": 52804, "epoch": 1257} {"train_loss": -5.774656295776367, "global_step": 52805, "epoch": 1257} {"train_loss": -5.710004806518555, "global_step": 52806, "epoch": 1257} {"train_loss": -5.898097038269043, "global_step": 52807, "epoch": 1257} {"train_loss": -5.781588077545166, "global_step": 52808, "epoch": 1257} {"train_loss": -5.7969584465026855, "global_step": 52809, "epoch": 1257} {"train_loss": -5.847762107849121, "global_step": 52810, "epoch": 1257} {"train_loss": -5.746143341064453, "global_step": 52811, "epoch": 1257} {"train_loss": -5.8152852058410645, "global_step": 52812, "epoch": 1257} {"train_loss": -5.844273567199707, "global_step": 52813, "epoch": 1257} {"train_loss": -5.703590393066406, "global_step": 52814, "epoch": 1257} {"train_loss": -5.791842460632324, "global_step": 52815, "epoch": 1257} {"train_loss": -5.807094573974609, "global_step": 52816, "epoch": 1257} {"train_loss": -5.812064170837402, "global_step": 52817, "epoch": 1257} {"train_loss": -5.809844017028809, "global_step": 52818, "epoch": 1257} {"train_loss": -5.7029290199279785, "global_step": 52819, "epoch": 1257} {"train_loss": -5.7539777755737305, "global_step": 52820, "epoch": 1257} {"train_loss": -5.874519348144531, "global_step": 52821, "epoch": 1257} {"train_loss": -5.7178239822387695, "global_step": 52822, "epoch": 1257} {"train_loss": -5.777499198913574, "global_step": 52823, "epoch": 1257} {"train_loss": -5.836268424987793, "global_step": 52824, "epoch": 1257} {"train_loss": -5.728120803833008, "global_step": 52825, "epoch": 1257} {"train_loss": -5.74836540222168, "global_step": 52826, "epoch": 1257} {"train_loss": -5.6670732498168945, "global_step": 52827, "epoch": 1257} {"train_loss": -5.7813029289245605, "global_step": 52828, "epoch": 1257} {"train_loss": -5.785252571105957, "global_step": 52829, "epoch": 1257} {"train_loss": -5.845302581787109, "global_step": 52830, "epoch": 1257} {"train_loss": -5.77634334564209, "global_step": 52831, "epoch": 1257} {"train_loss": -5.893223285675049, "global_step": 52832, "epoch": 1257} {"train_loss": -5.80672550201416, "global_step": 52833, "epoch": 1257} {"train_loss": -5.776438236236572, "global_step": 52834, "epoch": 1257} {"train_loss": -5.798796131497338, "global_step": 52835, "epoch": 1257, "val_loss": 74948.0390625} {"train_loss": -5.677945137023926, "global_step": 52836, "epoch": 1258} {"train_loss": -5.844825267791748, "global_step": 52837, "epoch": 1258} {"train_loss": -5.835727691650391, "global_step": 52838, "epoch": 1258} {"train_loss": -5.824840545654297, "global_step": 52839, "epoch": 1258} {"train_loss": -5.746399402618408, "global_step": 52840, "epoch": 1258} {"train_loss": -5.8702521324157715, "global_step": 52841, "epoch": 1258} {"train_loss": -5.720381259918213, "global_step": 52842, "epoch": 1258} {"train_loss": -5.789330959320068, "global_step": 52843, "epoch": 1258} {"train_loss": -5.827653884887695, "global_step": 52844, "epoch": 1258} {"train_loss": -5.831900596618652, "global_step": 52845, "epoch": 1258} {"train_loss": -5.863168716430664, "global_step": 52846, "epoch": 1258} {"train_loss": -5.867565631866455, "global_step": 52847, "epoch": 1258} {"train_loss": -5.6427836418151855, "global_step": 52848, "epoch": 1258} {"train_loss": -5.784775733947754, "global_step": 52849, "epoch": 1258} {"train_loss": -5.639542579650879, "global_step": 52850, "epoch": 1258} {"train_loss": -5.863296031951904, "global_step": 52851, "epoch": 1258} {"train_loss": -5.8091630935668945, "global_step": 52852, "epoch": 1258} {"train_loss": -5.723953723907471, "global_step": 52853, "epoch": 1258} {"train_loss": -5.696993350982666, "global_step": 52854, "epoch": 1258} {"train_loss": -5.763063430786133, "global_step": 52855, "epoch": 1258} {"train_loss": -5.731306552886963, "global_step": 52856, "epoch": 1258} {"train_loss": -5.769240379333496, "global_step": 52857, "epoch": 1258} {"train_loss": -5.768572807312012, "global_step": 52858, "epoch": 1258} {"train_loss": -5.863214492797852, "global_step": 52859, "epoch": 1258} {"train_loss": -5.802480697631836, "global_step": 52860, "epoch": 1258} {"train_loss": -5.802123069763184, "global_step": 52861, "epoch": 1258} {"train_loss": -5.816062927246094, "global_step": 52862, "epoch": 1258} {"train_loss": -5.72313117980957, "global_step": 52863, "epoch": 1258} {"train_loss": -5.73909854888916, "global_step": 52864, "epoch": 1258} {"train_loss": -5.769163608551025, "global_step": 52865, "epoch": 1258} {"train_loss": -5.691287994384766, "global_step": 52866, "epoch": 1258} {"train_loss": -5.9312968254089355, "global_step": 52867, "epoch": 1258} {"train_loss": -5.75759220123291, "global_step": 52868, "epoch": 1258} {"train_loss": -5.688992023468018, "global_step": 52869, "epoch": 1258} {"train_loss": -5.8154616355896, "global_step": 52870, "epoch": 1258} {"train_loss": -5.87335729598999, "global_step": 52871, "epoch": 1258} {"train_loss": -5.700270175933838, "global_step": 52872, "epoch": 1258} {"train_loss": -5.803793907165527, "global_step": 52873, "epoch": 1258} {"train_loss": -5.779549598693848, "global_step": 52874, "epoch": 1258} {"train_loss": -5.760055065155029, "global_step": 52875, "epoch": 1258} {"train_loss": -5.8068528175354, "global_step": 52876, "epoch": 1258} {"train_loss": -5.782106399536133, "global_step": 52877, "epoch": 1258, "val_loss": 74579.734375} {"train_loss": -5.733389377593994, "global_step": 52878, "epoch": 1259} {"train_loss": -5.699698448181152, "global_step": 52879, "epoch": 1259} {"train_loss": -6.003297805786133, "global_step": 52880, "epoch": 1259} {"train_loss": -5.765451908111572, "global_step": 52881, "epoch": 1259} {"train_loss": -5.871787071228027, "global_step": 52882, "epoch": 1259} {"train_loss": -5.801225662231445, "global_step": 52883, "epoch": 1259} {"train_loss": -5.717694282531738, "global_step": 52884, "epoch": 1259} {"train_loss": -5.784366607666016, "global_step": 52885, "epoch": 1259} {"train_loss": -5.8878583908081055, "global_step": 52886, "epoch": 1259} {"train_loss": -5.795984745025635, "global_step": 52887, "epoch": 1259} {"train_loss": -5.690210819244385, "global_step": 52888, "epoch": 1259} {"train_loss": -5.786192417144775, "global_step": 52889, "epoch": 1259} {"train_loss": -5.861112594604492, "global_step": 52890, "epoch": 1259} {"train_loss": -5.819149494171143, "global_step": 52891, "epoch": 1259} {"train_loss": -5.821535110473633, "global_step": 52892, "epoch": 1259} {"train_loss": -5.924972057342529, "global_step": 52893, "epoch": 1259} {"train_loss": -5.790700912475586, "global_step": 52894, "epoch": 1259} {"train_loss": -5.7874531745910645, "global_step": 52895, "epoch": 1259} {"train_loss": -5.81712532043457, "global_step": 52896, "epoch": 1259} {"train_loss": -5.756011009216309, "global_step": 52897, "epoch": 1259} {"train_loss": -5.905611991882324, "global_step": 52898, "epoch": 1259} {"train_loss": -5.836252212524414, "global_step": 52899, "epoch": 1259} {"train_loss": -5.86622428894043, "global_step": 52900, "epoch": 1259} {"train_loss": -5.725409507751465, "global_step": 52901, "epoch": 1259} {"train_loss": -5.845520496368408, "global_step": 52902, "epoch": 1259} {"train_loss": -5.666044235229492, "global_step": 52903, "epoch": 1259} {"train_loss": -5.62496280670166, "global_step": 52904, "epoch": 1259} {"train_loss": -5.738895416259766, "global_step": 52905, "epoch": 1259} {"train_loss": -5.726404190063477, "global_step": 52906, "epoch": 1259} {"train_loss": -5.6800312995910645, "global_step": 52907, "epoch": 1259} {"train_loss": -5.817787170410156, "global_step": 52908, "epoch": 1259} {"train_loss": -5.74366569519043, "global_step": 52909, "epoch": 1259} {"train_loss": -5.776167869567871, "global_step": 52910, "epoch": 1259} {"train_loss": -5.827382564544678, "global_step": 52911, "epoch": 1259} {"train_loss": -5.877219200134277, "global_step": 52912, "epoch": 1259} {"train_loss": -5.794011116027832, "global_step": 52913, "epoch": 1259} {"train_loss": -5.887703895568848, "global_step": 52914, "epoch": 1259} {"train_loss": -5.756180763244629, "global_step": 52915, "epoch": 1259} {"train_loss": -5.76335334777832, "global_step": 52916, "epoch": 1259} {"train_loss": -5.702584266662598, "global_step": 52917, "epoch": 1259} {"train_loss": -5.828055381774902, "global_step": 52918, "epoch": 1259} {"train_loss": -5.790294556390672, "global_step": 52919, "epoch": 1259, "val_loss": 74741.6484375} {"train_loss": -5.63109827041626, "global_step": 52920, "epoch": 1260} {"train_loss": -5.851123332977295, "global_step": 52921, "epoch": 1260} {"train_loss": -5.7965521812438965, "global_step": 52922, "epoch": 1260} {"train_loss": -5.818476676940918, "global_step": 52923, "epoch": 1260} {"train_loss": -5.7062530517578125, "global_step": 52924, "epoch": 1260} {"train_loss": -5.785885334014893, "global_step": 52925, "epoch": 1260} {"train_loss": -5.833916664123535, "global_step": 52926, "epoch": 1260} {"train_loss": -5.741767883300781, "global_step": 52927, "epoch": 1260} {"train_loss": -5.777843952178955, "global_step": 52928, "epoch": 1260} {"train_loss": -5.897383689880371, "global_step": 52929, "epoch": 1260} {"train_loss": -5.845280170440674, "global_step": 52930, "epoch": 1260} {"train_loss": -5.764925956726074, "global_step": 52931, "epoch": 1260} {"train_loss": -5.830665588378906, "global_step": 52932, "epoch": 1260} {"train_loss": -5.8350934982299805, "global_step": 52933, "epoch": 1260} {"train_loss": -5.798981666564941, "global_step": 52934, "epoch": 1260} {"train_loss": -5.730210304260254, "global_step": 52935, "epoch": 1260} {"train_loss": -5.7762451171875, "global_step": 52936, "epoch": 1260} {"train_loss": -5.8650712966918945, "global_step": 52937, "epoch": 1260} {"train_loss": -5.818606376647949, "global_step": 52938, "epoch": 1260} {"train_loss": -5.7008161544799805, "global_step": 52939, "epoch": 1260} {"train_loss": -5.8794965744018555, "global_step": 52940, "epoch": 1260} {"train_loss": -5.751698970794678, "global_step": 52941, "epoch": 1260} {"train_loss": -5.835090637207031, "global_step": 52942, "epoch": 1260} {"train_loss": -5.846440315246582, "global_step": 52943, "epoch": 1260} {"train_loss": -5.795133590698242, "global_step": 52944, "epoch": 1260} {"train_loss": -5.877832412719727, "global_step": 52945, "epoch": 1260} {"train_loss": -5.820782661437988, "global_step": 52946, "epoch": 1260} {"train_loss": -5.837989330291748, "global_step": 52947, "epoch": 1260} {"train_loss": -5.81455135345459, "global_step": 52948, "epoch": 1260} {"train_loss": -5.741093635559082, "global_step": 52949, "epoch": 1260} {"train_loss": -5.9521484375, "global_step": 52950, "epoch": 1260} {"train_loss": -5.922252178192139, "global_step": 52951, "epoch": 1260} {"train_loss": -5.8170485496521, "global_step": 52952, "epoch": 1260} {"train_loss": -5.813336372375488, "global_step": 52953, "epoch": 1260} {"train_loss": -5.852834701538086, "global_step": 52954, "epoch": 1260} {"train_loss": -5.764699459075928, "global_step": 52955, "epoch": 1260} {"train_loss": -5.904763221740723, "global_step": 52956, "epoch": 1260} {"train_loss": -5.845823287963867, "global_step": 52957, "epoch": 1260} {"train_loss": -5.779102325439453, "global_step": 52958, "epoch": 1260} {"train_loss": -5.810879230499268, "global_step": 52959, "epoch": 1260} {"train_loss": -5.866032600402832, "global_step": 52960, "epoch": 1260} {"train_loss": -5.815161466598511, "global_step": 52961, "epoch": 1260, "val_loss": 74411.53125} {"train_loss": -5.844424247741699, "global_step": 52962, "epoch": 1261} {"train_loss": -5.958712577819824, "global_step": 52963, "epoch": 1261} {"train_loss": -5.735355377197266, "global_step": 52964, "epoch": 1261} {"train_loss": -5.866823673248291, "global_step": 52965, "epoch": 1261} {"train_loss": -5.8793110847473145, "global_step": 52966, "epoch": 1261} {"train_loss": -5.883143424987793, "global_step": 52967, "epoch": 1261} {"train_loss": -5.786787033081055, "global_step": 52968, "epoch": 1261} {"train_loss": -5.848881721496582, "global_step": 52969, "epoch": 1261} {"train_loss": -5.862270355224609, "global_step": 52970, "epoch": 1261} {"train_loss": -5.9259443283081055, "global_step": 52971, "epoch": 1261} {"train_loss": -5.775516510009766, "global_step": 52972, "epoch": 1261} {"train_loss": -5.862639427185059, "global_step": 52973, "epoch": 1261} {"train_loss": -5.801759719848633, "global_step": 52974, "epoch": 1261} {"train_loss": -5.814940929412842, "global_step": 52975, "epoch": 1261} {"train_loss": -5.887749671936035, "global_step": 52976, "epoch": 1261} {"train_loss": -5.779884338378906, "global_step": 52977, "epoch": 1261} {"train_loss": -5.762936115264893, "global_step": 52978, "epoch": 1261} {"train_loss": -5.889827728271484, "global_step": 52979, "epoch": 1261} {"train_loss": -5.827369689941406, "global_step": 52980, "epoch": 1261} {"train_loss": -5.891821384429932, "global_step": 52981, "epoch": 1261} {"train_loss": -5.791681289672852, "global_step": 52982, "epoch": 1261} {"train_loss": -5.813567161560059, "global_step": 52983, "epoch": 1261} {"train_loss": -5.823641300201416, "global_step": 52984, "epoch": 1261} {"train_loss": -5.902444362640381, "global_step": 52985, "epoch": 1261} {"train_loss": -5.845824241638184, "global_step": 52986, "epoch": 1261} {"train_loss": -5.736067771911621, "global_step": 52987, "epoch": 1261} {"train_loss": -5.939913272857666, "global_step": 52988, "epoch": 1261} {"train_loss": -5.754708290100098, "global_step": 52989, "epoch": 1261} {"train_loss": -5.746371269226074, "global_step": 52990, "epoch": 1261} {"train_loss": -5.81131649017334, "global_step": 52991, "epoch": 1261} {"train_loss": -5.810330390930176, "global_step": 52992, "epoch": 1261} {"train_loss": -5.813775062561035, "global_step": 52993, "epoch": 1261} {"train_loss": -5.853513717651367, "global_step": 52994, "epoch": 1261} {"train_loss": -5.842396259307861, "global_step": 52995, "epoch": 1261} {"train_loss": -5.820478439331055, "global_step": 52996, "epoch": 1261} {"train_loss": -5.82150936126709, "global_step": 52997, "epoch": 1261} {"train_loss": -5.819101333618164, "global_step": 52998, "epoch": 1261} {"train_loss": -5.827559471130371, "global_step": 52999, "epoch": 1261} {"train_loss": -5.768571853637695, "global_step": 53000, "epoch": 1261} {"train_loss": -5.861279487609863, "global_step": 53001, "epoch": 1261} {"train_loss": -5.854625225067139, "global_step": 53002, "epoch": 1261} {"train_loss": -5.829708825974238, "global_step": 53003, "epoch": 1261, "val_loss": 74634.0546875} {"train_loss": -5.819309234619141, "global_step": 53004, "epoch": 1262} {"train_loss": -5.853215217590332, "global_step": 53005, "epoch": 1262} {"train_loss": -5.879977226257324, "global_step": 53006, "epoch": 1262} {"train_loss": -5.8870015144348145, "global_step": 53007, "epoch": 1262} {"train_loss": -5.888321876525879, "global_step": 53008, "epoch": 1262} {"train_loss": -5.82635498046875, "global_step": 53009, "epoch": 1262} {"train_loss": -5.726552963256836, "global_step": 53010, "epoch": 1262} {"train_loss": -5.845925331115723, "global_step": 53011, "epoch": 1262} {"train_loss": -5.862689018249512, "global_step": 53012, "epoch": 1262} {"train_loss": -5.916641712188721, "global_step": 53013, "epoch": 1262} {"train_loss": -5.871514797210693, "global_step": 53014, "epoch": 1262} {"train_loss": -5.9023590087890625, "global_step": 53015, "epoch": 1262} {"train_loss": -5.84684419631958, "global_step": 53016, "epoch": 1262} {"train_loss": -5.894345283508301, "global_step": 53017, "epoch": 1262} {"train_loss": -5.765484809875488, "global_step": 53018, "epoch": 1262} {"train_loss": -5.756548881530762, "global_step": 53019, "epoch": 1262} {"train_loss": -5.848136901855469, "global_step": 53020, "epoch": 1262} {"train_loss": -5.836791515350342, "global_step": 53021, "epoch": 1262} {"train_loss": -5.764060974121094, "global_step": 53022, "epoch": 1262} {"train_loss": -5.8255720138549805, "global_step": 53023, "epoch": 1262} {"train_loss": -5.803585052490234, "global_step": 53024, "epoch": 1262} {"train_loss": -5.816614627838135, "global_step": 53025, "epoch": 1262} {"train_loss": -5.815072059631348, "global_step": 53026, "epoch": 1262} {"train_loss": -5.766579627990723, "global_step": 53027, "epoch": 1262} {"train_loss": -5.815647125244141, "global_step": 53028, "epoch": 1262} {"train_loss": -5.871323585510254, "global_step": 53029, "epoch": 1262} {"train_loss": -5.762644290924072, "global_step": 53030, "epoch": 1262} {"train_loss": -5.884100914001465, "global_step": 53031, "epoch": 1262} {"train_loss": -5.753216743469238, "global_step": 53032, "epoch": 1262} {"train_loss": -5.722284317016602, "global_step": 53033, "epoch": 1262} {"train_loss": -5.786850452423096, "global_step": 53034, "epoch": 1262} {"train_loss": -5.74924373626709, "global_step": 53035, "epoch": 1262} {"train_loss": -5.860939025878906, "global_step": 53036, "epoch": 1262} {"train_loss": -5.85070276260376, "global_step": 53037, "epoch": 1262} {"train_loss": -5.851208209991455, "global_step": 53038, "epoch": 1262} {"train_loss": -5.842277526855469, "global_step": 53039, "epoch": 1262} {"train_loss": -5.789463043212891, "global_step": 53040, "epoch": 1262} {"train_loss": -5.812447547912598, "global_step": 53041, "epoch": 1262} {"train_loss": -5.928402423858643, "global_step": 53042, "epoch": 1262} {"train_loss": -5.9194841384887695, "global_step": 53043, "epoch": 1262} {"train_loss": -5.738508224487305, "global_step": 53044, "epoch": 1262} {"train_loss": -5.828895932152157, "global_step": 53045, "epoch": 1262, "val_loss": 74176.828125} {"train_loss": -5.85482120513916, "global_step": 53046, "epoch": 1263} {"train_loss": -5.795498371124268, "global_step": 53047, "epoch": 1263} {"train_loss": -5.837468147277832, "global_step": 53048, "epoch": 1263} {"train_loss": -5.753638744354248, "global_step": 53049, "epoch": 1263} {"train_loss": -5.687963485717773, "global_step": 53050, "epoch": 1263} {"train_loss": -5.747561454772949, "global_step": 53051, "epoch": 1263} {"train_loss": -5.652529716491699, "global_step": 53052, "epoch": 1263} {"train_loss": -5.744584083557129, "global_step": 53053, "epoch": 1263} {"train_loss": -5.905045509338379, "global_step": 53054, "epoch": 1263} {"train_loss": -5.786120414733887, "global_step": 53055, "epoch": 1263} {"train_loss": -5.669257164001465, "global_step": 53056, "epoch": 1263} {"train_loss": -5.836730003356934, "global_step": 53057, "epoch": 1263} {"train_loss": -5.790139675140381, "global_step": 53058, "epoch": 1263} {"train_loss": -5.805853366851807, "global_step": 53059, "epoch": 1263} {"train_loss": -5.820320129394531, "global_step": 53060, "epoch": 1263} {"train_loss": -5.797305107116699, "global_step": 53061, "epoch": 1263} {"train_loss": -5.719956398010254, "global_step": 53062, "epoch": 1263} {"train_loss": -5.794084548950195, "global_step": 53063, "epoch": 1263} {"train_loss": -5.823952674865723, "global_step": 53064, "epoch": 1263} {"train_loss": -5.784512519836426, "global_step": 53065, "epoch": 1263} {"train_loss": -5.52561616897583, "global_step": 53066, "epoch": 1263} {"train_loss": -5.803016662597656, "global_step": 53067, "epoch": 1263} {"train_loss": -5.92277717590332, "global_step": 53068, "epoch": 1263} {"train_loss": -5.679523468017578, "global_step": 53069, "epoch": 1263} {"train_loss": -5.864445686340332, "global_step": 53070, "epoch": 1263} {"train_loss": -5.6731367111206055, "global_step": 53071, "epoch": 1263} {"train_loss": -5.644725799560547, "global_step": 53072, "epoch": 1263} {"train_loss": -5.760654449462891, "global_step": 53073, "epoch": 1263} {"train_loss": -5.648926734924316, "global_step": 53074, "epoch": 1263} {"train_loss": -5.854826927185059, "global_step": 53075, "epoch": 1263} {"train_loss": -5.757381439208984, "global_step": 53076, "epoch": 1263} {"train_loss": -5.7064948081970215, "global_step": 53077, "epoch": 1263} {"train_loss": -5.82546854019165, "global_step": 53078, "epoch": 1263} {"train_loss": -5.787380218505859, "global_step": 53079, "epoch": 1263} {"train_loss": -5.72205114364624, "global_step": 53080, "epoch": 1263} {"train_loss": -5.894248962402344, "global_step": 53081, "epoch": 1263} {"train_loss": -5.719160079956055, "global_step": 53082, "epoch": 1263} {"train_loss": -5.771322727203369, "global_step": 53083, "epoch": 1263} {"train_loss": -5.809462070465088, "global_step": 53084, "epoch": 1263} {"train_loss": -5.676731586456299, "global_step": 53085, "epoch": 1263} {"train_loss": -5.805929183959961, "global_step": 53086, "epoch": 1263} {"train_loss": -5.767704407374064, "global_step": 53087, "epoch": 1263, "val_loss": 74318.921875} {"train_loss": -5.769647598266602, "global_step": 53088, "epoch": 1264} {"train_loss": -5.833352088928223, "global_step": 53089, "epoch": 1264} {"train_loss": -5.847125053405762, "global_step": 53090, "epoch": 1264} {"train_loss": -5.885581016540527, "global_step": 53091, "epoch": 1264} {"train_loss": -5.731943607330322, "global_step": 53092, "epoch": 1264} {"train_loss": -5.904962539672852, "global_step": 53093, "epoch": 1264} {"train_loss": -5.780098915100098, "global_step": 53094, "epoch": 1264} {"train_loss": -5.880163192749023, "global_step": 53095, "epoch": 1264} {"train_loss": -5.783982276916504, "global_step": 53096, "epoch": 1264} {"train_loss": -5.835422039031982, "global_step": 53097, "epoch": 1264} {"train_loss": -5.769652366638184, "global_step": 53098, "epoch": 1264} {"train_loss": -5.609490394592285, "global_step": 53099, "epoch": 1264} {"train_loss": -5.941434860229492, "global_step": 53100, "epoch": 1264} {"train_loss": -5.7377729415893555, "global_step": 53101, "epoch": 1264} {"train_loss": -5.854412078857422, "global_step": 53102, "epoch": 1264} {"train_loss": -5.867198944091797, "global_step": 53103, "epoch": 1264} {"train_loss": -5.854372978210449, "global_step": 53104, "epoch": 1264} {"train_loss": -5.881259918212891, "global_step": 53105, "epoch": 1264} {"train_loss": -5.846522808074951, "global_step": 53106, "epoch": 1264} {"train_loss": -5.724727630615234, "global_step": 53107, "epoch": 1264} {"train_loss": -5.7578043937683105, "global_step": 53108, "epoch": 1264} {"train_loss": -5.8732404708862305, "global_step": 53109, "epoch": 1264} {"train_loss": -5.820087432861328, "global_step": 53110, "epoch": 1264} {"train_loss": -5.712080955505371, "global_step": 53111, "epoch": 1264} {"train_loss": -5.783759593963623, "global_step": 53112, "epoch": 1264} {"train_loss": -5.854946136474609, "global_step": 53113, "epoch": 1264} {"train_loss": -5.761756896972656, "global_step": 53114, "epoch": 1264} {"train_loss": -5.837442398071289, "global_step": 53115, "epoch": 1264} {"train_loss": -5.738526344299316, "global_step": 53116, "epoch": 1264} {"train_loss": -5.7092695236206055, "global_step": 53117, "epoch": 1264} {"train_loss": -5.770190715789795, "global_step": 53118, "epoch": 1264} {"train_loss": -5.790250778198242, "global_step": 53119, "epoch": 1264} {"train_loss": -5.8286309242248535, "global_step": 53120, "epoch": 1264} {"train_loss": -5.837000846862793, "global_step": 53121, "epoch": 1264} {"train_loss": -5.797096252441406, "global_step": 53122, "epoch": 1264} {"train_loss": -5.860332489013672, "global_step": 53123, "epoch": 1264} {"train_loss": -5.878843784332275, "global_step": 53124, "epoch": 1264} {"train_loss": -5.890894889831543, "global_step": 53125, "epoch": 1264} {"train_loss": -5.713302135467529, "global_step": 53126, "epoch": 1264} {"train_loss": -5.882597923278809, "global_step": 53127, "epoch": 1264} {"train_loss": -5.718371391296387, "global_step": 53128, "epoch": 1264} {"train_loss": -5.810233910878499, "global_step": 53129, "epoch": 1264, "val_loss": 74328.28125} {"train_loss": -5.832983016967773, "global_step": 53130, "epoch": 1265} {"train_loss": -5.731539249420166, "global_step": 53131, "epoch": 1265} {"train_loss": -5.747684001922607, "global_step": 53132, "epoch": 1265} {"train_loss": -5.819841384887695, "global_step": 53133, "epoch": 1265} {"train_loss": -5.819338798522949, "global_step": 53134, "epoch": 1265} {"train_loss": -5.831996440887451, "global_step": 53135, "epoch": 1265} {"train_loss": -5.779854774475098, "global_step": 53136, "epoch": 1265} {"train_loss": -5.86264705657959, "global_step": 53137, "epoch": 1265} {"train_loss": -5.7133355140686035, "global_step": 53138, "epoch": 1265} {"train_loss": -5.76735782623291, "global_step": 53139, "epoch": 1265} {"train_loss": -5.832904815673828, "global_step": 53140, "epoch": 1265} {"train_loss": -5.878333568572998, "global_step": 53141, "epoch": 1265} {"train_loss": -5.775103569030762, "global_step": 53142, "epoch": 1265} {"train_loss": -5.885841369628906, "global_step": 53143, "epoch": 1265} {"train_loss": -5.902806282043457, "global_step": 53144, "epoch": 1265} {"train_loss": -5.74375057220459, "global_step": 53145, "epoch": 1265} {"train_loss": -5.777511119842529, "global_step": 53146, "epoch": 1265} {"train_loss": -5.799654483795166, "global_step": 53147, "epoch": 1265} {"train_loss": -5.691441059112549, "global_step": 53148, "epoch": 1265} {"train_loss": -5.79195499420166, "global_step": 53149, "epoch": 1265} {"train_loss": -5.799249649047852, "global_step": 53150, "epoch": 1265} {"train_loss": -5.770158767700195, "global_step": 53151, "epoch": 1265} {"train_loss": -5.7772088050842285, "global_step": 53152, "epoch": 1265} {"train_loss": -5.832934379577637, "global_step": 53153, "epoch": 1265} {"train_loss": -5.780402183532715, "global_step": 53154, "epoch": 1265} {"train_loss": -5.706582069396973, "global_step": 53155, "epoch": 1265} {"train_loss": -5.813344478607178, "global_step": 53156, "epoch": 1265} {"train_loss": -5.74935245513916, "global_step": 53157, "epoch": 1265} {"train_loss": -5.761106491088867, "global_step": 53158, "epoch": 1265} {"train_loss": -5.816202163696289, "global_step": 53159, "epoch": 1265} {"train_loss": -5.803784370422363, "global_step": 53160, "epoch": 1265} {"train_loss": -5.816941261291504, "global_step": 53161, "epoch": 1265} {"train_loss": -5.781968116760254, "global_step": 53162, "epoch": 1265} {"train_loss": -5.733613967895508, "global_step": 53163, "epoch": 1265} {"train_loss": -5.756013870239258, "global_step": 53164, "epoch": 1265} {"train_loss": -5.938633441925049, "global_step": 53165, "epoch": 1265} {"train_loss": -5.744605541229248, "global_step": 53166, "epoch": 1265} {"train_loss": -5.71366024017334, "global_step": 53167, "epoch": 1265} {"train_loss": -5.743279933929443, "global_step": 53168, "epoch": 1265} {"train_loss": -5.704820156097412, "global_step": 53169, "epoch": 1265} {"train_loss": -5.828664779663086, "global_step": 53170, "epoch": 1265} {"train_loss": -5.789207787740798, "global_step": 53171, "epoch": 1265, "val_loss": 74517.1640625} {"train_loss": -5.753361225128174, "global_step": 53172, "epoch": 1266} {"train_loss": -5.8868937492370605, "global_step": 53173, "epoch": 1266} {"train_loss": -5.759106159210205, "global_step": 53174, "epoch": 1266} {"train_loss": -5.852934837341309, "global_step": 53175, "epoch": 1266} {"train_loss": -5.744458198547363, "global_step": 53176, "epoch": 1266} {"train_loss": -5.788706302642822, "global_step": 53177, "epoch": 1266} {"train_loss": -5.734196662902832, "global_step": 53178, "epoch": 1266} {"train_loss": -5.88214635848999, "global_step": 53179, "epoch": 1266} {"train_loss": -5.811697483062744, "global_step": 53180, "epoch": 1266} {"train_loss": -5.8738112449646, "global_step": 53181, "epoch": 1266} {"train_loss": -5.811866760253906, "global_step": 53182, "epoch": 1266} {"train_loss": -5.914981842041016, "global_step": 53183, "epoch": 1266} {"train_loss": -5.844794273376465, "global_step": 53184, "epoch": 1266} {"train_loss": -5.823364734649658, "global_step": 53185, "epoch": 1266} {"train_loss": -5.780786037445068, "global_step": 53186, "epoch": 1266} {"train_loss": -5.745638847351074, "global_step": 53187, "epoch": 1266} {"train_loss": -5.769669532775879, "global_step": 53188, "epoch": 1266} {"train_loss": -5.778328895568848, "global_step": 53189, "epoch": 1266} {"train_loss": -5.859622955322266, "global_step": 53190, "epoch": 1266} {"train_loss": -5.877023696899414, "global_step": 53191, "epoch": 1266} {"train_loss": -5.740665912628174, "global_step": 53192, "epoch": 1266} {"train_loss": -5.6871747970581055, "global_step": 53193, "epoch": 1266} {"train_loss": -5.767910957336426, "global_step": 53194, "epoch": 1266} {"train_loss": -5.803896903991699, "global_step": 53195, "epoch": 1266} {"train_loss": -5.7557525634765625, "global_step": 53196, "epoch": 1266} {"train_loss": -5.842950820922852, "global_step": 53197, "epoch": 1266} {"train_loss": -5.8803300857543945, "global_step": 53198, "epoch": 1266} {"train_loss": -5.839158058166504, "global_step": 53199, "epoch": 1266} {"train_loss": -5.874382972717285, "global_step": 53200, "epoch": 1266} {"train_loss": -5.848713397979736, "global_step": 53201, "epoch": 1266} {"train_loss": -5.660038471221924, "global_step": 53202, "epoch": 1266} {"train_loss": -5.731256008148193, "global_step": 53203, "epoch": 1266} {"train_loss": -5.860136985778809, "global_step": 53204, "epoch": 1266} {"train_loss": -5.89767599105835, "global_step": 53205, "epoch": 1266} {"train_loss": -5.924372673034668, "global_step": 53206, "epoch": 1266} {"train_loss": -5.930763244628906, "global_step": 53207, "epoch": 1266} {"train_loss": -5.822608947753906, "global_step": 53208, "epoch": 1266} {"train_loss": -5.7437639236450195, "global_step": 53209, "epoch": 1266} {"train_loss": -5.834263801574707, "global_step": 53210, "epoch": 1266} {"train_loss": -5.770155906677246, "global_step": 53211, "epoch": 1266} {"train_loss": -5.905981063842773, "global_step": 53212, "epoch": 1266} {"train_loss": -5.815459467115856, "global_step": 53213, "epoch": 1266, "val_loss": 74268.28125} {"train_loss": -5.865355014801025, "global_step": 53214, "epoch": 1267} {"train_loss": -5.7813286781311035, "global_step": 53215, "epoch": 1267} {"train_loss": -5.920947074890137, "global_step": 53216, "epoch": 1267} {"train_loss": -5.86024808883667, "global_step": 53217, "epoch": 1267} {"train_loss": -5.860692501068115, "global_step": 53218, "epoch": 1267} {"train_loss": -5.859157562255859, "global_step": 53219, "epoch": 1267} {"train_loss": -5.746847152709961, "global_step": 53220, "epoch": 1267} {"train_loss": -5.793919563293457, "global_step": 53221, "epoch": 1267} {"train_loss": -5.7595062255859375, "global_step": 53222, "epoch": 1267} {"train_loss": -5.745288848876953, "global_step": 53223, "epoch": 1267} {"train_loss": -5.670619964599609, "global_step": 53224, "epoch": 1267} {"train_loss": -5.8306732177734375, "global_step": 53225, "epoch": 1267} {"train_loss": -5.680060386657715, "global_step": 53226, "epoch": 1267} {"train_loss": -5.853300094604492, "global_step": 53227, "epoch": 1267} {"train_loss": -5.919899940490723, "global_step": 53228, "epoch": 1267} {"train_loss": -5.655948638916016, "global_step": 53229, "epoch": 1267} {"train_loss": -5.912885665893555, "global_step": 53230, "epoch": 1267} {"train_loss": -5.896419048309326, "global_step": 53231, "epoch": 1267} {"train_loss": -5.821040153503418, "global_step": 53232, "epoch": 1267} {"train_loss": -5.82356071472168, "global_step": 53233, "epoch": 1267} {"train_loss": -5.738006591796875, "global_step": 53234, "epoch": 1267} {"train_loss": -5.846128940582275, "global_step": 53235, "epoch": 1267} {"train_loss": -5.761443138122559, "global_step": 53236, "epoch": 1267} {"train_loss": -5.703181743621826, "global_step": 53237, "epoch": 1267} {"train_loss": -5.84271764755249, "global_step": 53238, "epoch": 1267} {"train_loss": -5.772382736206055, "global_step": 53239, "epoch": 1267} {"train_loss": -5.7214460372924805, "global_step": 53240, "epoch": 1267} {"train_loss": -5.791813850402832, "global_step": 53241, "epoch": 1267} {"train_loss": -5.630549430847168, "global_step": 53242, "epoch": 1267} {"train_loss": -5.718252182006836, "global_step": 53243, "epoch": 1267} {"train_loss": -5.708958625793457, "global_step": 53244, "epoch": 1267} {"train_loss": -5.752447128295898, "global_step": 53245, "epoch": 1267} {"train_loss": -5.780948162078857, "global_step": 53246, "epoch": 1267} {"train_loss": -5.928275108337402, "global_step": 53247, "epoch": 1267} {"train_loss": -5.742732048034668, "global_step": 53248, "epoch": 1267} {"train_loss": -5.887033462524414, "global_step": 53249, "epoch": 1267} {"train_loss": -5.699985027313232, "global_step": 53250, "epoch": 1267} {"train_loss": -5.767164707183838, "global_step": 53251, "epoch": 1267} {"train_loss": -5.77703857421875, "global_step": 53252, "epoch": 1267} {"train_loss": -5.8449177742004395, "global_step": 53253, "epoch": 1267} {"train_loss": -5.7741498947143555, "global_step": 53254, "epoch": 1267} {"train_loss": -5.793026049931844, "global_step": 53255, "epoch": 1267, "val_loss": 73946.5} {"train_loss": -5.858709812164307, "global_step": 53256, "epoch": 1268} {"train_loss": -5.829748153686523, "global_step": 53257, "epoch": 1268} {"train_loss": -5.770992755889893, "global_step": 53258, "epoch": 1268} {"train_loss": -5.878081321716309, "global_step": 53259, "epoch": 1268} {"train_loss": -5.9816999435424805, "global_step": 53260, "epoch": 1268} {"train_loss": -5.828025817871094, "global_step": 53261, "epoch": 1268} {"train_loss": -5.753487586975098, "global_step": 53262, "epoch": 1268} {"train_loss": -5.7682294845581055, "global_step": 53263, "epoch": 1268} {"train_loss": -5.70034122467041, "global_step": 53264, "epoch": 1268} {"train_loss": -5.721497058868408, "global_step": 53265, "epoch": 1268} {"train_loss": -5.803274154663086, "global_step": 53266, "epoch": 1268} {"train_loss": -5.736203193664551, "global_step": 53267, "epoch": 1268} {"train_loss": -5.74846887588501, "global_step": 53268, "epoch": 1268} {"train_loss": -5.819139003753662, "global_step": 53269, "epoch": 1268} {"train_loss": -5.714755058288574, "global_step": 53270, "epoch": 1268} {"train_loss": -5.831273078918457, "global_step": 53271, "epoch": 1268} {"train_loss": -5.757421493530273, "global_step": 53272, "epoch": 1268} {"train_loss": -5.669075012207031, "global_step": 53273, "epoch": 1268} {"train_loss": -5.873459339141846, "global_step": 53274, "epoch": 1268} {"train_loss": -5.7757463455200195, "global_step": 53275, "epoch": 1268} {"train_loss": -5.68111515045166, "global_step": 53276, "epoch": 1268} {"train_loss": -5.861920356750488, "global_step": 53277, "epoch": 1268} {"train_loss": -5.903995513916016, "global_step": 53278, "epoch": 1268} {"train_loss": -5.7389678955078125, "global_step": 53279, "epoch": 1268} {"train_loss": -5.699587821960449, "global_step": 53280, "epoch": 1268} {"train_loss": -5.879348278045654, "global_step": 53281, "epoch": 1268} {"train_loss": -5.800911903381348, "global_step": 53282, "epoch": 1268} {"train_loss": -5.745352745056152, "global_step": 53283, "epoch": 1268} {"train_loss": -5.737383842468262, "global_step": 53284, "epoch": 1268} {"train_loss": -5.732707500457764, "global_step": 53285, "epoch": 1268} {"train_loss": -5.835087299346924, "global_step": 53286, "epoch": 1268} {"train_loss": -5.78062105178833, "global_step": 53287, "epoch": 1268} {"train_loss": -5.798816680908203, "global_step": 53288, "epoch": 1268} {"train_loss": -5.823662757873535, "global_step": 53289, "epoch": 1268} {"train_loss": -5.82478141784668, "global_step": 53290, "epoch": 1268} {"train_loss": -5.892913818359375, "global_step": 53291, "epoch": 1268} {"train_loss": -5.770500659942627, "global_step": 53292, "epoch": 1268} {"train_loss": -5.772687911987305, "global_step": 53293, "epoch": 1268} {"train_loss": -5.841262340545654, "global_step": 53294, "epoch": 1268} {"train_loss": -5.8015570640563965, "global_step": 53295, "epoch": 1268} {"train_loss": -5.852390289306641, "global_step": 53296, "epoch": 1268} {"train_loss": -5.7948042551676435, "global_step": 53297, "epoch": 1268, "val_loss": 74540.6328125} {"train_loss": -5.886778831481934, "global_step": 53298, "epoch": 1269} {"train_loss": -5.790271759033203, "global_step": 53299, "epoch": 1269} {"train_loss": -5.59159517288208, "global_step": 53300, "epoch": 1269} {"train_loss": -5.876619338989258, "global_step": 53301, "epoch": 1269} {"train_loss": -5.817171096801758, "global_step": 53302, "epoch": 1269} {"train_loss": -5.798369407653809, "global_step": 53303, "epoch": 1269} {"train_loss": -5.708557605743408, "global_step": 53304, "epoch": 1269} {"train_loss": -5.79983377456665, "global_step": 53305, "epoch": 1269} {"train_loss": -5.835128307342529, "global_step": 53306, "epoch": 1269} {"train_loss": -5.697360515594482, "global_step": 53307, "epoch": 1269} {"train_loss": -5.843654632568359, "global_step": 53308, "epoch": 1269} {"train_loss": -5.8884453773498535, "global_step": 53309, "epoch": 1269} {"train_loss": -5.72721004486084, "global_step": 53310, "epoch": 1269} {"train_loss": -5.882425308227539, "global_step": 53311, "epoch": 1269} {"train_loss": -5.780555725097656, "global_step": 53312, "epoch": 1269} {"train_loss": -5.763829231262207, "global_step": 53313, "epoch": 1269} {"train_loss": -5.831849575042725, "global_step": 53314, "epoch": 1269} {"train_loss": -5.828037738800049, "global_step": 53315, "epoch": 1269} {"train_loss": -5.985480785369873, "global_step": 53316, "epoch": 1269} {"train_loss": -5.7535600662231445, "global_step": 53317, "epoch": 1269} {"train_loss": -5.782515048980713, "global_step": 53318, "epoch": 1269} {"train_loss": -5.7961883544921875, "global_step": 53319, "epoch": 1269} {"train_loss": -5.842351913452148, "global_step": 53320, "epoch": 1269} {"train_loss": -5.778002738952637, "global_step": 53321, "epoch": 1269} {"train_loss": -5.875903129577637, "global_step": 53322, "epoch": 1269} {"train_loss": -5.828947067260742, "global_step": 53323, "epoch": 1269} {"train_loss": -5.839910507202148, "global_step": 53324, "epoch": 1269} {"train_loss": -5.884830474853516, "global_step": 53325, "epoch": 1269} {"train_loss": -5.778169631958008, "global_step": 53326, "epoch": 1269} {"train_loss": -5.787508010864258, "global_step": 53327, "epoch": 1269} {"train_loss": -5.821425437927246, "global_step": 53328, "epoch": 1269} {"train_loss": -5.9060516357421875, "global_step": 53329, "epoch": 1269} {"train_loss": -5.65159797668457, "global_step": 53330, "epoch": 1269} {"train_loss": -5.938961029052734, "global_step": 53331, "epoch": 1269} {"train_loss": -5.887209892272949, "global_step": 53332, "epoch": 1269} {"train_loss": -5.716904640197754, "global_step": 53333, "epoch": 1269} {"train_loss": -5.94867467880249, "global_step": 53334, "epoch": 1269} {"train_loss": -5.898768424987793, "global_step": 53335, "epoch": 1269} {"train_loss": -5.809202671051025, "global_step": 53336, "epoch": 1269} {"train_loss": -5.741169452667236, "global_step": 53337, "epoch": 1269} {"train_loss": -5.661653518676758, "global_step": 53338, "epoch": 1269} {"train_loss": -5.815329642522903, "global_step": 53339, "epoch": 1269, "val_loss": 74290.609375} {"train_loss": -5.901303768157959, "global_step": 53340, "epoch": 1270} {"train_loss": -5.852988243103027, "global_step": 53341, "epoch": 1270} {"train_loss": -5.859532356262207, "global_step": 53342, "epoch": 1270} {"train_loss": -5.906213283538818, "global_step": 53343, "epoch": 1270} {"train_loss": -5.782098770141602, "global_step": 53344, "epoch": 1270} {"train_loss": -5.844956874847412, "global_step": 53345, "epoch": 1270} {"train_loss": -5.855501174926758, "global_step": 53346, "epoch": 1270} {"train_loss": -5.867356300354004, "global_step": 53347, "epoch": 1270} {"train_loss": -5.698266983032227, "global_step": 53348, "epoch": 1270} {"train_loss": -5.908008575439453, "global_step": 53349, "epoch": 1270} {"train_loss": -5.7788591384887695, "global_step": 53350, "epoch": 1270} {"train_loss": -5.6825032234191895, "global_step": 53351, "epoch": 1270} {"train_loss": -5.899174690246582, "global_step": 53352, "epoch": 1270} {"train_loss": -5.7171430587768555, "global_step": 53353, "epoch": 1270} {"train_loss": -5.740131378173828, "global_step": 53354, "epoch": 1270} {"train_loss": -5.809449672698975, "global_step": 53355, "epoch": 1270} {"train_loss": -5.767009735107422, "global_step": 53356, "epoch": 1270} {"train_loss": -5.875230312347412, "global_step": 53357, "epoch": 1270} {"train_loss": -5.753866195678711, "global_step": 53358, "epoch": 1270} {"train_loss": -5.92006778717041, "global_step": 53359, "epoch": 1270} {"train_loss": -5.843869686126709, "global_step": 53360, "epoch": 1270} {"train_loss": -5.839597702026367, "global_step": 53361, "epoch": 1270} {"train_loss": -5.801054954528809, "global_step": 53362, "epoch": 1270} {"train_loss": -5.922037601470947, "global_step": 53363, "epoch": 1270} {"train_loss": -5.86961030960083, "global_step": 53364, "epoch": 1270} {"train_loss": -5.961718559265137, "global_step": 53365, "epoch": 1270} {"train_loss": -5.700307846069336, "global_step": 53366, "epoch": 1270} {"train_loss": -5.7888078689575195, "global_step": 53367, "epoch": 1270} {"train_loss": -5.917938232421875, "global_step": 53368, "epoch": 1270} {"train_loss": -5.891742706298828, "global_step": 53369, "epoch": 1270} {"train_loss": -5.824070930480957, "global_step": 53370, "epoch": 1270} {"train_loss": -5.729273319244385, "global_step": 53371, "epoch": 1270} {"train_loss": -5.801684379577637, "global_step": 53372, "epoch": 1270} {"train_loss": -5.730291366577148, "global_step": 53373, "epoch": 1270} {"train_loss": -5.788636207580566, "global_step": 53374, "epoch": 1270} {"train_loss": -5.857268810272217, "global_step": 53375, "epoch": 1270} {"train_loss": -5.79701042175293, "global_step": 53376, "epoch": 1270} {"train_loss": -5.711974143981934, "global_step": 53377, "epoch": 1270} {"train_loss": -5.737351417541504, "global_step": 53378, "epoch": 1270} {"train_loss": -5.779598236083984, "global_step": 53379, "epoch": 1270} {"train_loss": -5.874316215515137, "global_step": 53380, "epoch": 1270} {"train_loss": -5.818765674318586, "global_step": 53381, "epoch": 1270, "val_loss": 74702.6015625} {"train_loss": -5.806267738342285, "global_step": 53382, "epoch": 1271} {"train_loss": -5.866874694824219, "global_step": 53383, "epoch": 1271} {"train_loss": -5.787330150604248, "global_step": 53384, "epoch": 1271} {"train_loss": -5.749238967895508, "global_step": 53385, "epoch": 1271} {"train_loss": -5.830844402313232, "global_step": 53386, "epoch": 1271} {"train_loss": -5.65257453918457, "global_step": 53387, "epoch": 1271} {"train_loss": -5.785812854766846, "global_step": 53388, "epoch": 1271} {"train_loss": -5.85116720199585, "global_step": 53389, "epoch": 1271} {"train_loss": -5.555605888366699, "global_step": 53390, "epoch": 1271} {"train_loss": -5.769756317138672, "global_step": 53391, "epoch": 1271} {"train_loss": -5.696276664733887, "global_step": 53392, "epoch": 1271} {"train_loss": -5.634535312652588, "global_step": 53393, "epoch": 1271} {"train_loss": -5.812406539916992, "global_step": 53394, "epoch": 1271} {"train_loss": -5.705206394195557, "global_step": 53395, "epoch": 1271} {"train_loss": -5.692663192749023, "global_step": 53396, "epoch": 1271} {"train_loss": -5.717353343963623, "global_step": 53397, "epoch": 1271} {"train_loss": -5.6439690589904785, "global_step": 53398, "epoch": 1271} {"train_loss": -5.764214515686035, "global_step": 53399, "epoch": 1271} {"train_loss": -5.716780662536621, "global_step": 53400, "epoch": 1271} {"train_loss": -5.8683037757873535, "global_step": 53401, "epoch": 1271} {"train_loss": -5.71356201171875, "global_step": 53402, "epoch": 1271} {"train_loss": -5.783726692199707, "global_step": 53403, "epoch": 1271} {"train_loss": -5.838326454162598, "global_step": 53404, "epoch": 1271} {"train_loss": -5.800109386444092, "global_step": 53405, "epoch": 1271} {"train_loss": -5.842198371887207, "global_step": 53406, "epoch": 1271} {"train_loss": -5.7751784324646, "global_step": 53407, "epoch": 1271} {"train_loss": -5.8507466316223145, "global_step": 53408, "epoch": 1271} {"train_loss": -5.819973945617676, "global_step": 53409, "epoch": 1271} {"train_loss": -5.846439361572266, "global_step": 53410, "epoch": 1271} {"train_loss": -5.831760406494141, "global_step": 53411, "epoch": 1271} {"train_loss": -5.693351745605469, "global_step": 53412, "epoch": 1271} {"train_loss": -5.799363136291504, "global_step": 53413, "epoch": 1271} {"train_loss": -5.796380043029785, "global_step": 53414, "epoch": 1271} {"train_loss": -5.7383904457092285, "global_step": 53415, "epoch": 1271} {"train_loss": -5.881160736083984, "global_step": 53416, "epoch": 1271} {"train_loss": -5.809154987335205, "global_step": 53417, "epoch": 1271} {"train_loss": -5.960935115814209, "global_step": 53418, "epoch": 1271} {"train_loss": -5.8876447677612305, "global_step": 53419, "epoch": 1271} {"train_loss": -5.7773942947387695, "global_step": 53420, "epoch": 1271} {"train_loss": -5.95053768157959, "global_step": 53421, "epoch": 1271} {"train_loss": -5.693005561828613, "global_step": 53422, "epoch": 1271} {"train_loss": -5.782414459046864, "global_step": 53423, "epoch": 1271, "val_loss": 73959.0546875} {"train_loss": -5.939502716064453, "global_step": 53424, "epoch": 1272} {"train_loss": -5.744938850402832, "global_step": 53425, "epoch": 1272} {"train_loss": -5.7799882888793945, "global_step": 53426, "epoch": 1272} {"train_loss": -5.810016632080078, "global_step": 53427, "epoch": 1272} {"train_loss": -5.842942237854004, "global_step": 53428, "epoch": 1272} {"train_loss": -5.824546813964844, "global_step": 53429, "epoch": 1272} {"train_loss": -5.968837738037109, "global_step": 53430, "epoch": 1272} {"train_loss": -5.827691078186035, "global_step": 53431, "epoch": 1272} {"train_loss": -5.779335975646973, "global_step": 53432, "epoch": 1272} {"train_loss": -5.820407390594482, "global_step": 53433, "epoch": 1272} {"train_loss": -5.668368816375732, "global_step": 53434, "epoch": 1272} {"train_loss": -5.705808162689209, "global_step": 53435, "epoch": 1272} {"train_loss": -5.954816818237305, "global_step": 53436, "epoch": 1272} {"train_loss": -5.653454780578613, "global_step": 53437, "epoch": 1272} {"train_loss": -5.764716148376465, "global_step": 53438, "epoch": 1272} {"train_loss": -5.803670406341553, "global_step": 53439, "epoch": 1272} {"train_loss": -5.68701696395874, "global_step": 53440, "epoch": 1272} {"train_loss": -5.754209518432617, "global_step": 53441, "epoch": 1272} {"train_loss": -5.778003215789795, "global_step": 53442, "epoch": 1272} {"train_loss": -5.890469551086426, "global_step": 53443, "epoch": 1272} {"train_loss": -5.621187686920166, "global_step": 53444, "epoch": 1272} {"train_loss": -5.843225479125977, "global_step": 53445, "epoch": 1272} {"train_loss": -5.822807312011719, "global_step": 53446, "epoch": 1272} {"train_loss": -5.855199813842773, "global_step": 53447, "epoch": 1272} {"train_loss": -5.7628045082092285, "global_step": 53448, "epoch": 1272} {"train_loss": -5.786930561065674, "global_step": 53449, "epoch": 1272} {"train_loss": -5.740848541259766, "global_step": 53450, "epoch": 1272} {"train_loss": -5.85939884185791, "global_step": 53451, "epoch": 1272} {"train_loss": -5.784638404846191, "global_step": 53452, "epoch": 1272} {"train_loss": -5.941320896148682, "global_step": 53453, "epoch": 1272} {"train_loss": -5.816915035247803, "global_step": 53454, "epoch": 1272} {"train_loss": -5.7041015625, "global_step": 53455, "epoch": 1272} {"train_loss": -5.828204154968262, "global_step": 53456, "epoch": 1272} {"train_loss": -5.801340103149414, "global_step": 53457, "epoch": 1272} {"train_loss": -5.679502010345459, "global_step": 53458, "epoch": 1272} {"train_loss": -5.8448333740234375, "global_step": 53459, "epoch": 1272} {"train_loss": -5.658982753753662, "global_step": 53460, "epoch": 1272} {"train_loss": -5.762392044067383, "global_step": 53461, "epoch": 1272} {"train_loss": -5.903926849365234, "global_step": 53462, "epoch": 1272} {"train_loss": -5.861018180847168, "global_step": 53463, "epoch": 1272} {"train_loss": -5.846248626708984, "global_step": 53464, "epoch": 1272} {"train_loss": -5.798372336796352, "global_step": 53465, "epoch": 1272, "val_loss": 74583.6328125} {"train_loss": -5.879595756530762, "global_step": 53466, "epoch": 1273} {"train_loss": -5.679276943206787, "global_step": 53467, "epoch": 1273} {"train_loss": -5.839489936828613, "global_step": 53468, "epoch": 1273} {"train_loss": -5.9229302406311035, "global_step": 53469, "epoch": 1273} {"train_loss": -5.82302188873291, "global_step": 53470, "epoch": 1273} {"train_loss": -5.927460193634033, "global_step": 53471, "epoch": 1273} {"train_loss": -5.724735736846924, "global_step": 53472, "epoch": 1273} {"train_loss": -5.819058418273926, "global_step": 53473, "epoch": 1273} {"train_loss": -5.717619895935059, "global_step": 53474, "epoch": 1273} {"train_loss": -5.694209098815918, "global_step": 53475, "epoch": 1273} {"train_loss": -5.829668045043945, "global_step": 53476, "epoch": 1273} {"train_loss": -5.832464694976807, "global_step": 53477, "epoch": 1273} {"train_loss": -5.829973220825195, "global_step": 53478, "epoch": 1273} {"train_loss": -5.879263877868652, "global_step": 53479, "epoch": 1273} {"train_loss": -5.884675025939941, "global_step": 53480, "epoch": 1273} {"train_loss": -5.877388954162598, "global_step": 53481, "epoch": 1273} {"train_loss": -5.850983142852783, "global_step": 53482, "epoch": 1273} {"train_loss": -5.780196666717529, "global_step": 53483, "epoch": 1273} {"train_loss": -5.822979927062988, "global_step": 53484, "epoch": 1273} {"train_loss": -5.811624526977539, "global_step": 53485, "epoch": 1273} {"train_loss": -5.882574558258057, "global_step": 53486, "epoch": 1273} {"train_loss": -5.925820350646973, "global_step": 53487, "epoch": 1273} {"train_loss": -5.878697395324707, "global_step": 53488, "epoch": 1273} {"train_loss": -5.7739152908325195, "global_step": 53489, "epoch": 1273} {"train_loss": -5.811018943786621, "global_step": 53490, "epoch": 1273} {"train_loss": -5.757218360900879, "global_step": 53491, "epoch": 1273} {"train_loss": -5.887556076049805, "global_step": 53492, "epoch": 1273} {"train_loss": -5.890414237976074, "global_step": 53493, "epoch": 1273} {"train_loss": -5.870777130126953, "global_step": 53494, "epoch": 1273} {"train_loss": -5.903656005859375, "global_step": 53495, "epoch": 1273} {"train_loss": -5.812381744384766, "global_step": 53496, "epoch": 1273} {"train_loss": -5.96194314956665, "global_step": 53497, "epoch": 1273} {"train_loss": -5.826635837554932, "global_step": 53498, "epoch": 1273} {"train_loss": -5.749687194824219, "global_step": 53499, "epoch": 1273} {"train_loss": -5.74356746673584, "global_step": 53500, "epoch": 1273} {"train_loss": -5.766295433044434, "global_step": 53501, "epoch": 1273} {"train_loss": -5.9268479347229, "global_step": 53502, "epoch": 1273} {"train_loss": -5.831892967224121, "global_step": 53503, "epoch": 1273} {"train_loss": -5.798078536987305, "global_step": 53504, "epoch": 1273} {"train_loss": -5.771381855010986, "global_step": 53505, "epoch": 1273} {"train_loss": -5.813753128051758, "global_step": 53506, "epoch": 1273} {"train_loss": -5.831086726415725, "global_step": 53507, "epoch": 1273, "val_loss": 74027.5078125} {"train_loss": -5.830289840698242, "global_step": 53508, "epoch": 1274} {"train_loss": -5.927242755889893, "global_step": 53509, "epoch": 1274} {"train_loss": -5.804701805114746, "global_step": 53510, "epoch": 1274} {"train_loss": -5.803884506225586, "global_step": 53511, "epoch": 1274} {"train_loss": -5.91140079498291, "global_step": 53512, "epoch": 1274} {"train_loss": -5.7899580001831055, "global_step": 53513, "epoch": 1274} {"train_loss": -5.815878391265869, "global_step": 53514, "epoch": 1274} {"train_loss": -5.776368141174316, "global_step": 53515, "epoch": 1274} {"train_loss": -5.760923385620117, "global_step": 53516, "epoch": 1274} {"train_loss": -5.860354423522949, "global_step": 53517, "epoch": 1274} {"train_loss": -5.7535624504089355, "global_step": 53518, "epoch": 1274} {"train_loss": -5.805937767028809, "global_step": 53519, "epoch": 1274} {"train_loss": -5.752175331115723, "global_step": 53520, "epoch": 1274} {"train_loss": -5.880828857421875, "global_step": 53521, "epoch": 1274} {"train_loss": -5.844738960266113, "global_step": 53522, "epoch": 1274} {"train_loss": -5.834743976593018, "global_step": 53523, "epoch": 1274} {"train_loss": -5.7381181716918945, "global_step": 53524, "epoch": 1274} {"train_loss": -5.890905857086182, "global_step": 53525, "epoch": 1274} {"train_loss": -5.896549224853516, "global_step": 53526, "epoch": 1274} {"train_loss": -5.682198524475098, "global_step": 53527, "epoch": 1274} {"train_loss": -5.818924903869629, "global_step": 53528, "epoch": 1274} {"train_loss": -5.875548362731934, "global_step": 53529, "epoch": 1274} {"train_loss": -5.720170974731445, "global_step": 53530, "epoch": 1274} {"train_loss": -5.828893184661865, "global_step": 53531, "epoch": 1274} {"train_loss": -5.697323799133301, "global_step": 53532, "epoch": 1274} {"train_loss": -5.807209014892578, "global_step": 53533, "epoch": 1274} {"train_loss": -5.896411895751953, "global_step": 53534, "epoch": 1274} {"train_loss": -5.993031024932861, "global_step": 53535, "epoch": 1274} {"train_loss": -5.791518211364746, "global_step": 53536, "epoch": 1274} {"train_loss": -5.811309337615967, "global_step": 53537, "epoch": 1274} {"train_loss": -5.869692802429199, "global_step": 53538, "epoch": 1274} {"train_loss": -5.76810359954834, "global_step": 53539, "epoch": 1274} {"train_loss": -5.875116348266602, "global_step": 53540, "epoch": 1274} {"train_loss": -5.809865951538086, "global_step": 53541, "epoch": 1274} {"train_loss": -5.7729692459106445, "global_step": 53542, "epoch": 1274} {"train_loss": -5.786515712738037, "global_step": 53543, "epoch": 1274} {"train_loss": -5.833388328552246, "global_step": 53544, "epoch": 1274} {"train_loss": -5.842640399932861, "global_step": 53545, "epoch": 1274} {"train_loss": -5.836371898651123, "global_step": 53546, "epoch": 1274} {"train_loss": -5.796753883361816, "global_step": 53547, "epoch": 1274} {"train_loss": -5.807517051696777, "global_step": 53548, "epoch": 1274} {"train_loss": -5.8140800793965655, "global_step": 53549, "epoch": 1274, "val_loss": 74039.078125} {"train_loss": -5.737435340881348, "global_step": 53550, "epoch": 1275} {"train_loss": -5.761934280395508, "global_step": 53551, "epoch": 1275} {"train_loss": -5.862417221069336, "global_step": 53552, "epoch": 1275} {"train_loss": -5.78700590133667, "global_step": 53553, "epoch": 1275} {"train_loss": -5.753143310546875, "global_step": 53554, "epoch": 1275} {"train_loss": -5.847612380981445, "global_step": 53555, "epoch": 1275} {"train_loss": -5.683719635009766, "global_step": 53556, "epoch": 1275} {"train_loss": -5.8734307289123535, "global_step": 53557, "epoch": 1275} {"train_loss": -5.696787357330322, "global_step": 53558, "epoch": 1275} {"train_loss": -5.867913246154785, "global_step": 53559, "epoch": 1275} {"train_loss": -5.87162971496582, "global_step": 53560, "epoch": 1275} {"train_loss": -5.73374080657959, "global_step": 53561, "epoch": 1275} {"train_loss": -5.802567481994629, "global_step": 53562, "epoch": 1275} {"train_loss": -5.754711151123047, "global_step": 53563, "epoch": 1275} {"train_loss": -5.816215991973877, "global_step": 53564, "epoch": 1275} {"train_loss": -5.793788433074951, "global_step": 53565, "epoch": 1275} {"train_loss": -5.87985372543335, "global_step": 53566, "epoch": 1275} {"train_loss": -5.914422035217285, "global_step": 53567, "epoch": 1275} {"train_loss": -5.81905460357666, "global_step": 53568, "epoch": 1275} {"train_loss": -5.7898783683776855, "global_step": 53569, "epoch": 1275} {"train_loss": -5.890453338623047, "global_step": 53570, "epoch": 1275} {"train_loss": -5.788827896118164, "global_step": 53571, "epoch": 1275} {"train_loss": -5.852245807647705, "global_step": 53572, "epoch": 1275} {"train_loss": -5.77752685546875, "global_step": 53573, "epoch": 1275} {"train_loss": -5.8012590408325195, "global_step": 53574, "epoch": 1275} {"train_loss": -5.873236179351807, "global_step": 53575, "epoch": 1275} {"train_loss": -5.764803409576416, "global_step": 53576, "epoch": 1275} {"train_loss": -5.700712203979492, "global_step": 53577, "epoch": 1275} {"train_loss": -5.850363254547119, "global_step": 53578, "epoch": 1275} {"train_loss": -5.87125825881958, "global_step": 53579, "epoch": 1275} {"train_loss": -5.823137283325195, "global_step": 53580, "epoch": 1275} {"train_loss": -5.811807632446289, "global_step": 53581, "epoch": 1275} {"train_loss": -5.787755012512207, "global_step": 53582, "epoch": 1275} {"train_loss": -5.864442825317383, "global_step": 53583, "epoch": 1275} {"train_loss": -5.721959590911865, "global_step": 53584, "epoch": 1275} {"train_loss": -5.929433822631836, "global_step": 53585, "epoch": 1275} {"train_loss": -5.88741397857666, "global_step": 53586, "epoch": 1275} {"train_loss": -5.800894737243652, "global_step": 53587, "epoch": 1275} {"train_loss": -5.789707660675049, "global_step": 53588, "epoch": 1275} {"train_loss": -5.766801834106445, "global_step": 53589, "epoch": 1275} {"train_loss": -5.887495517730713, "global_step": 53590, "epoch": 1275} {"train_loss": -5.812936192467099, "global_step": 53591, "epoch": 1275, "val_loss": 74449.171875} {"train_loss": -5.861253261566162, "global_step": 53592, "epoch": 1276} {"train_loss": -5.817057132720947, "global_step": 53593, "epoch": 1276} {"train_loss": -6.008474349975586, "global_step": 53594, "epoch": 1276} {"train_loss": -5.6548686027526855, "global_step": 53595, "epoch": 1276} {"train_loss": -5.816494941711426, "global_step": 53596, "epoch": 1276} {"train_loss": -5.8560051918029785, "global_step": 53597, "epoch": 1276} {"train_loss": -5.918403625488281, "global_step": 53598, "epoch": 1276} {"train_loss": -5.863703727722168, "global_step": 53599, "epoch": 1276} {"train_loss": -5.814723014831543, "global_step": 53600, "epoch": 1276} {"train_loss": -5.9097795486450195, "global_step": 53601, "epoch": 1276} {"train_loss": -5.714664936065674, "global_step": 53602, "epoch": 1276} {"train_loss": -5.857527732849121, "global_step": 53603, "epoch": 1276} {"train_loss": -5.778989791870117, "global_step": 53604, "epoch": 1276} {"train_loss": -5.853946685791016, "global_step": 53605, "epoch": 1276} {"train_loss": -5.8499979972839355, "global_step": 53606, "epoch": 1276} {"train_loss": -5.849837303161621, "global_step": 53607, "epoch": 1276} {"train_loss": -5.934271812438965, "global_step": 53608, "epoch": 1276} {"train_loss": -5.9293131828308105, "global_step": 53609, "epoch": 1276} {"train_loss": -5.8345232009887695, "global_step": 53610, "epoch": 1276} {"train_loss": -5.769403457641602, "global_step": 53611, "epoch": 1276} {"train_loss": -5.821755409240723, "global_step": 53612, "epoch": 1276} {"train_loss": -5.711485862731934, "global_step": 53613, "epoch": 1276} {"train_loss": -5.657218933105469, "global_step": 53614, "epoch": 1276} {"train_loss": -6.029043197631836, "global_step": 53615, "epoch": 1276} {"train_loss": -5.742213249206543, "global_step": 53616, "epoch": 1276} {"train_loss": -5.770925521850586, "global_step": 53617, "epoch": 1276} {"train_loss": -5.877144813537598, "global_step": 53618, "epoch": 1276} {"train_loss": -5.928143501281738, "global_step": 53619, "epoch": 1276} {"train_loss": -5.700155258178711, "global_step": 53620, "epoch": 1276} {"train_loss": -5.933189392089844, "global_step": 53621, "epoch": 1276} {"train_loss": -5.7637128829956055, "global_step": 53622, "epoch": 1276} {"train_loss": -5.718889236450195, "global_step": 53623, "epoch": 1276} {"train_loss": -5.771240711212158, "global_step": 53624, "epoch": 1276} {"train_loss": -5.913581848144531, "global_step": 53625, "epoch": 1276} {"train_loss": -5.773557186126709, "global_step": 53626, "epoch": 1276} {"train_loss": -5.8936967849731445, "global_step": 53627, "epoch": 1276} {"train_loss": -5.808112144470215, "global_step": 53628, "epoch": 1276} {"train_loss": -5.826990604400635, "global_step": 53629, "epoch": 1276} {"train_loss": -5.875724792480469, "global_step": 53630, "epoch": 1276} {"train_loss": -5.789042949676514, "global_step": 53631, "epoch": 1276} {"train_loss": -5.751171112060547, "global_step": 53632, "epoch": 1276} {"train_loss": -5.828747261138189, "global_step": 53633, "epoch": 1276, "val_loss": 74482.8828125} {"train_loss": -5.777397155761719, "global_step": 53634, "epoch": 1277} {"train_loss": -5.799962043762207, "global_step": 53635, "epoch": 1277} {"train_loss": -5.8392486572265625, "global_step": 53636, "epoch": 1277} {"train_loss": -5.857577323913574, "global_step": 53637, "epoch": 1277} {"train_loss": -5.882839202880859, "global_step": 53638, "epoch": 1277} {"train_loss": -5.813697814941406, "global_step": 53639, "epoch": 1277} {"train_loss": -5.846821308135986, "global_step": 53640, "epoch": 1277} {"train_loss": -5.832319259643555, "global_step": 53641, "epoch": 1277} {"train_loss": -5.868205547332764, "global_step": 53642, "epoch": 1277} {"train_loss": -5.718667030334473, "global_step": 53643, "epoch": 1277} {"train_loss": -5.754214286804199, "global_step": 53644, "epoch": 1277} {"train_loss": -5.840760231018066, "global_step": 53645, "epoch": 1277} {"train_loss": -5.883491516113281, "global_step": 53646, "epoch": 1277} {"train_loss": -5.8521952629089355, "global_step": 53647, "epoch": 1277} {"train_loss": -5.906139373779297, "global_step": 53648, "epoch": 1277} {"train_loss": -5.875419616699219, "global_step": 53649, "epoch": 1277} {"train_loss": -5.745203018188477, "global_step": 53650, "epoch": 1277} {"train_loss": -5.840356826782227, "global_step": 53651, "epoch": 1277} {"train_loss": -5.8714470863342285, "global_step": 53652, "epoch": 1277} {"train_loss": -5.930851936340332, "global_step": 53653, "epoch": 1277} {"train_loss": -5.799605369567871, "global_step": 53654, "epoch": 1277} {"train_loss": -5.848358631134033, "global_step": 53655, "epoch": 1277} {"train_loss": -5.892265319824219, "global_step": 53656, "epoch": 1277} {"train_loss": -5.957281112670898, "global_step": 53657, "epoch": 1277} {"train_loss": -5.825560092926025, "global_step": 53658, "epoch": 1277} {"train_loss": -5.819372653961182, "global_step": 53659, "epoch": 1277} {"train_loss": -5.8234148025512695, "global_step": 53660, "epoch": 1277} {"train_loss": -5.790127754211426, "global_step": 53661, "epoch": 1277} {"train_loss": -5.8335041999816895, "global_step": 53662, "epoch": 1277} {"train_loss": -5.844144344329834, "global_step": 53663, "epoch": 1277} {"train_loss": -5.943226337432861, "global_step": 53664, "epoch": 1277} {"train_loss": -5.785808563232422, "global_step": 53665, "epoch": 1277} {"train_loss": -5.844396591186523, "global_step": 53666, "epoch": 1277} {"train_loss": -5.771420478820801, "global_step": 53667, "epoch": 1277} {"train_loss": -5.823651313781738, "global_step": 53668, "epoch": 1277} {"train_loss": -5.713980674743652, "global_step": 53669, "epoch": 1277} {"train_loss": -5.988275527954102, "global_step": 53670, "epoch": 1277} {"train_loss": -5.875280380249023, "global_step": 53671, "epoch": 1277} {"train_loss": -5.876411437988281, "global_step": 53672, "epoch": 1277} {"train_loss": -5.903038024902344, "global_step": 53673, "epoch": 1277} {"train_loss": -5.812141418457031, "global_step": 53674, "epoch": 1277} {"train_loss": -5.840054818562099, "global_step": 53675, "epoch": 1277, "val_loss": 74305.9921875} {"train_loss": -5.798666954040527, "global_step": 53676, "epoch": 1278} {"train_loss": -5.738926887512207, "global_step": 53677, "epoch": 1278} {"train_loss": -5.76179313659668, "global_step": 53678, "epoch": 1278} {"train_loss": -5.862601280212402, "global_step": 53679, "epoch": 1278} {"train_loss": -5.718662738800049, "global_step": 53680, "epoch": 1278} {"train_loss": -5.849178314208984, "global_step": 53681, "epoch": 1278} {"train_loss": -5.813979625701904, "global_step": 53682, "epoch": 1278} {"train_loss": -5.719350814819336, "global_step": 53683, "epoch": 1278} {"train_loss": -5.853817939758301, "global_step": 53684, "epoch": 1278} {"train_loss": -5.8010334968566895, "global_step": 53685, "epoch": 1278} {"train_loss": -5.887622833251953, "global_step": 53686, "epoch": 1278} {"train_loss": -5.778237342834473, "global_step": 53687, "epoch": 1278} {"train_loss": -5.6291937828063965, "global_step": 53688, "epoch": 1278} {"train_loss": -5.754604339599609, "global_step": 53689, "epoch": 1278} {"train_loss": -5.8199262619018555, "global_step": 53690, "epoch": 1278} {"train_loss": -5.890918731689453, "global_step": 53691, "epoch": 1278} {"train_loss": -5.873163223266602, "global_step": 53692, "epoch": 1278} {"train_loss": -5.791553020477295, "global_step": 53693, "epoch": 1278} {"train_loss": -5.760538101196289, "global_step": 53694, "epoch": 1278} {"train_loss": -5.761566162109375, "global_step": 53695, "epoch": 1278} {"train_loss": -5.701009750366211, "global_step": 53696, "epoch": 1278} {"train_loss": -5.940832138061523, "global_step": 53697, "epoch": 1278} {"train_loss": -5.751792907714844, "global_step": 53698, "epoch": 1278} {"train_loss": -5.7367048263549805, "global_step": 53699, "epoch": 1278} {"train_loss": -5.702052116394043, "global_step": 53700, "epoch": 1278} {"train_loss": -5.793492794036865, "global_step": 53701, "epoch": 1278} {"train_loss": -5.850759506225586, "global_step": 53702, "epoch": 1278} {"train_loss": -5.790949821472168, "global_step": 53703, "epoch": 1278} {"train_loss": -5.639493465423584, "global_step": 53704, "epoch": 1278} {"train_loss": -5.843827247619629, "global_step": 53705, "epoch": 1278} {"train_loss": -5.789194107055664, "global_step": 53706, "epoch": 1278} {"train_loss": -5.788341045379639, "global_step": 53707, "epoch": 1278} {"train_loss": -5.901877403259277, "global_step": 53708, "epoch": 1278} {"train_loss": -5.864733695983887, "global_step": 53709, "epoch": 1278} {"train_loss": -5.754093170166016, "global_step": 53710, "epoch": 1278} {"train_loss": -5.8649396896362305, "global_step": 53711, "epoch": 1278} {"train_loss": -5.819329738616943, "global_step": 53712, "epoch": 1278} {"train_loss": -5.8529229164123535, "global_step": 53713, "epoch": 1278} {"train_loss": -5.790031433105469, "global_step": 53714, "epoch": 1278} {"train_loss": -5.898859977722168, "global_step": 53715, "epoch": 1278} {"train_loss": -5.938186168670654, "global_step": 53716, "epoch": 1278} {"train_loss": -5.799518880389986, "global_step": 53717, "epoch": 1278, "val_loss": 74229.484375} {"train_loss": -5.995113849639893, "global_step": 53718, "epoch": 1279} {"train_loss": -5.923571586608887, "global_step": 53719, "epoch": 1279} {"train_loss": -5.855788230895996, "global_step": 53720, "epoch": 1279} {"train_loss": -5.7135210037231445, "global_step": 53721, "epoch": 1279} {"train_loss": -5.862977027893066, "global_step": 53722, "epoch": 1279} {"train_loss": -5.816352844238281, "global_step": 53723, "epoch": 1279} {"train_loss": -5.935446739196777, "global_step": 53724, "epoch": 1279} {"train_loss": -5.855650424957275, "global_step": 53725, "epoch": 1279} {"train_loss": -5.777125358581543, "global_step": 53726, "epoch": 1279} {"train_loss": -5.870305061340332, "global_step": 53727, "epoch": 1279} {"train_loss": -5.72981071472168, "global_step": 53728, "epoch": 1279} {"train_loss": -5.793166160583496, "global_step": 53729, "epoch": 1279} {"train_loss": -5.921848297119141, "global_step": 53730, "epoch": 1279} {"train_loss": -5.777054786682129, "global_step": 53731, "epoch": 1279} {"train_loss": -5.771516799926758, "global_step": 53732, "epoch": 1279} {"train_loss": -5.981757640838623, "global_step": 53733, "epoch": 1279} {"train_loss": -5.838080406188965, "global_step": 53734, "epoch": 1279} {"train_loss": -5.8555803298950195, "global_step": 53735, "epoch": 1279} {"train_loss": -5.689882755279541, "global_step": 53736, "epoch": 1279} {"train_loss": -5.786157131195068, "global_step": 53737, "epoch": 1279} {"train_loss": -5.742220878601074, "global_step": 53738, "epoch": 1279} {"train_loss": -5.871211051940918, "global_step": 53739, "epoch": 1279} {"train_loss": -5.86667537689209, "global_step": 53740, "epoch": 1279} {"train_loss": -5.723775386810303, "global_step": 53741, "epoch": 1279} {"train_loss": -5.795109748840332, "global_step": 53742, "epoch": 1279} {"train_loss": -5.8672261238098145, "global_step": 53743, "epoch": 1279} {"train_loss": -5.713910102844238, "global_step": 53744, "epoch": 1279} {"train_loss": -5.754249572753906, "global_step": 53745, "epoch": 1279} {"train_loss": -5.781889915466309, "global_step": 53746, "epoch": 1279} {"train_loss": -5.706435203552246, "global_step": 53747, "epoch": 1279} {"train_loss": -5.9411492347717285, "global_step": 53748, "epoch": 1279} {"train_loss": -5.820369720458984, "global_step": 53749, "epoch": 1279} {"train_loss": -5.809869766235352, "global_step": 53750, "epoch": 1279} {"train_loss": -5.779684543609619, "global_step": 53751, "epoch": 1279} {"train_loss": -5.787755012512207, "global_step": 53752, "epoch": 1279} {"train_loss": -5.764733791351318, "global_step": 53753, "epoch": 1279} {"train_loss": -5.8390913009643555, "global_step": 53754, "epoch": 1279} {"train_loss": -5.890108585357666, "global_step": 53755, "epoch": 1279} {"train_loss": -5.868928909301758, "global_step": 53756, "epoch": 1279} {"train_loss": -5.888330459594727, "global_step": 53757, "epoch": 1279} {"train_loss": -5.795968532562256, "global_step": 53758, "epoch": 1279} {"train_loss": -5.8224662599109465, "global_step": 53759, "epoch": 1279, "val_loss": 74261.1953125} {"train_loss": -5.837039947509766, "global_step": 53760, "epoch": 1280} {"train_loss": -5.672126770019531, "global_step": 53761, "epoch": 1280} {"train_loss": -5.872675895690918, "global_step": 53762, "epoch": 1280} {"train_loss": -5.77113151550293, "global_step": 53763, "epoch": 1280} {"train_loss": -5.816097259521484, "global_step": 53764, "epoch": 1280} {"train_loss": -5.865860462188721, "global_step": 53765, "epoch": 1280} {"train_loss": -5.801523208618164, "global_step": 53766, "epoch": 1280} {"train_loss": -5.764698028564453, "global_step": 53767, "epoch": 1280} {"train_loss": -5.9791717529296875, "global_step": 53768, "epoch": 1280} {"train_loss": -5.777909755706787, "global_step": 53769, "epoch": 1280} {"train_loss": -5.786890506744385, "global_step": 53770, "epoch": 1280} {"train_loss": -5.75392484664917, "global_step": 53771, "epoch": 1280} {"train_loss": -5.843018054962158, "global_step": 53772, "epoch": 1280} {"train_loss": -5.776595115661621, "global_step": 53773, "epoch": 1280} {"train_loss": -5.739864349365234, "global_step": 53774, "epoch": 1280} {"train_loss": -5.885052680969238, "global_step": 53775, "epoch": 1280} {"train_loss": -5.901834011077881, "global_step": 53776, "epoch": 1280} {"train_loss": -5.819412708282471, "global_step": 53777, "epoch": 1280} {"train_loss": -5.834926605224609, "global_step": 53778, "epoch": 1280} {"train_loss": -5.752313613891602, "global_step": 53779, "epoch": 1280} {"train_loss": -5.8308820724487305, "global_step": 53780, "epoch": 1280} {"train_loss": -5.767965316772461, "global_step": 53781, "epoch": 1280} {"train_loss": -5.827729225158691, "global_step": 53782, "epoch": 1280} {"train_loss": -5.947662353515625, "global_step": 53783, "epoch": 1280} {"train_loss": -5.850898742675781, "global_step": 53784, "epoch": 1280} {"train_loss": -5.8553876876831055, "global_step": 53785, "epoch": 1280} {"train_loss": -5.915337085723877, "global_step": 53786, "epoch": 1280} {"train_loss": -5.750171661376953, "global_step": 53787, "epoch": 1280} {"train_loss": -5.950073719024658, "global_step": 53788, "epoch": 1280} {"train_loss": -5.750563621520996, "global_step": 53789, "epoch": 1280} {"train_loss": -5.842518329620361, "global_step": 53790, "epoch": 1280} {"train_loss": -5.853688716888428, "global_step": 53791, "epoch": 1280} {"train_loss": -5.8343095779418945, "global_step": 53792, "epoch": 1280} {"train_loss": -5.837546348571777, "global_step": 53793, "epoch": 1280} {"train_loss": -5.91600227355957, "global_step": 53794, "epoch": 1280} {"train_loss": -5.734116077423096, "global_step": 53795, "epoch": 1280} {"train_loss": -5.841184616088867, "global_step": 53796, "epoch": 1280} {"train_loss": -5.8393378257751465, "global_step": 53797, "epoch": 1280} {"train_loss": -5.91006326675415, "global_step": 53798, "epoch": 1280} {"train_loss": -5.814297676086426, "global_step": 53799, "epoch": 1280} {"train_loss": -5.872994899749756, "global_step": 53800, "epoch": 1280} {"train_loss": -5.832655543372745, "global_step": 53801, "epoch": 1280, "val_loss": 74635.90625} {"train_loss": -5.740273475646973, "global_step": 53802, "epoch": 1281} {"train_loss": -5.87509298324585, "global_step": 53803, "epoch": 1281} {"train_loss": -5.864443778991699, "global_step": 53804, "epoch": 1281} {"train_loss": -5.8711652755737305, "global_step": 53805, "epoch": 1281} {"train_loss": -5.7219557762146, "global_step": 53806, "epoch": 1281} {"train_loss": -5.723515510559082, "global_step": 53807, "epoch": 1281} {"train_loss": -5.835376739501953, "global_step": 53808, "epoch": 1281} {"train_loss": -5.86134672164917, "global_step": 53809, "epoch": 1281} {"train_loss": -5.819271087646484, "global_step": 53810, "epoch": 1281} {"train_loss": -5.863216876983643, "global_step": 53811, "epoch": 1281} {"train_loss": -5.935421943664551, "global_step": 53812, "epoch": 1281} {"train_loss": -5.952133655548096, "global_step": 53813, "epoch": 1281} {"train_loss": -5.85678243637085, "global_step": 53814, "epoch": 1281} {"train_loss": -5.817720413208008, "global_step": 53815, "epoch": 1281} {"train_loss": -5.727632522583008, "global_step": 53816, "epoch": 1281} {"train_loss": -5.823674201965332, "global_step": 53817, "epoch": 1281} {"train_loss": -5.81311559677124, "global_step": 53818, "epoch": 1281} {"train_loss": -5.783721923828125, "global_step": 53819, "epoch": 1281} {"train_loss": -5.78411865234375, "global_step": 53820, "epoch": 1281} {"train_loss": -5.8964362144470215, "global_step": 53821, "epoch": 1281} {"train_loss": -5.886415481567383, "global_step": 53822, "epoch": 1281} {"train_loss": -5.8416571617126465, "global_step": 53823, "epoch": 1281} {"train_loss": -5.91721248626709, "global_step": 53824, "epoch": 1281} {"train_loss": -5.830844402313232, "global_step": 53825, "epoch": 1281} {"train_loss": -5.925477027893066, "global_step": 53826, "epoch": 1281} {"train_loss": -5.81451416015625, "global_step": 53827, "epoch": 1281} {"train_loss": -5.860103130340576, "global_step": 53828, "epoch": 1281} {"train_loss": -5.755131721496582, "global_step": 53829, "epoch": 1281} {"train_loss": -5.744439125061035, "global_step": 53830, "epoch": 1281} {"train_loss": -6.003866672515869, "global_step": 53831, "epoch": 1281} {"train_loss": -5.828281879425049, "global_step": 53832, "epoch": 1281} {"train_loss": -5.859753608703613, "global_step": 53833, "epoch": 1281} {"train_loss": -5.676112174987793, "global_step": 53834, "epoch": 1281} {"train_loss": -5.748928546905518, "global_step": 53835, "epoch": 1281} {"train_loss": -5.8444318771362305, "global_step": 53836, "epoch": 1281} {"train_loss": -5.93074893951416, "global_step": 53837, "epoch": 1281} {"train_loss": -5.934660911560059, "global_step": 53838, "epoch": 1281} {"train_loss": -5.8679351806640625, "global_step": 53839, "epoch": 1281} {"train_loss": -5.947230339050293, "global_step": 53840, "epoch": 1281} {"train_loss": -5.751502990722656, "global_step": 53841, "epoch": 1281} {"train_loss": -5.579037666320801, "global_step": 53842, "epoch": 1281} {"train_loss": -5.834935426712036, "global_step": 53843, "epoch": 1281, "val_loss": 74272.109375} {"train_loss": -5.914276599884033, "global_step": 53844, "epoch": 1282} {"train_loss": -5.767282485961914, "global_step": 53845, "epoch": 1282} {"train_loss": -5.912468910217285, "global_step": 53846, "epoch": 1282} {"train_loss": -5.835309982299805, "global_step": 53847, "epoch": 1282} {"train_loss": -5.919703483581543, "global_step": 53848, "epoch": 1282} {"train_loss": -5.837860107421875, "global_step": 53849, "epoch": 1282} {"train_loss": -5.755862236022949, "global_step": 53850, "epoch": 1282} {"train_loss": -5.813372611999512, "global_step": 53851, "epoch": 1282} {"train_loss": -5.7404890060424805, "global_step": 53852, "epoch": 1282} {"train_loss": -5.81496524810791, "global_step": 53853, "epoch": 1282} {"train_loss": -5.645360946655273, "global_step": 53854, "epoch": 1282} {"train_loss": -5.766961574554443, "global_step": 53855, "epoch": 1282} {"train_loss": -5.736845970153809, "global_step": 53856, "epoch": 1282} {"train_loss": -5.722344875335693, "global_step": 53857, "epoch": 1282} {"train_loss": -5.797614574432373, "global_step": 53858, "epoch": 1282} {"train_loss": -5.747823238372803, "global_step": 53859, "epoch": 1282} {"train_loss": -5.841969966888428, "global_step": 53860, "epoch": 1282} {"train_loss": -5.97402811050415, "global_step": 53861, "epoch": 1282} {"train_loss": -5.809326171875, "global_step": 53862, "epoch": 1282} {"train_loss": -5.765861511230469, "global_step": 53863, "epoch": 1282} {"train_loss": -5.8491740226745605, "global_step": 53864, "epoch": 1282} {"train_loss": -5.768711566925049, "global_step": 53865, "epoch": 1282} {"train_loss": -5.887262344360352, "global_step": 53866, "epoch": 1282} {"train_loss": -5.810092449188232, "global_step": 53867, "epoch": 1282} {"train_loss": -5.943251132965088, "global_step": 53868, "epoch": 1282} {"train_loss": -5.795261383056641, "global_step": 53869, "epoch": 1282} {"train_loss": -5.876230239868164, "global_step": 53870, "epoch": 1282} {"train_loss": -5.98298454284668, "global_step": 53871, "epoch": 1282} {"train_loss": -5.789541721343994, "global_step": 53872, "epoch": 1282} {"train_loss": -5.7329888343811035, "global_step": 53873, "epoch": 1282} {"train_loss": -5.849145412445068, "global_step": 53874, "epoch": 1282} {"train_loss": -5.768000602722168, "global_step": 53875, "epoch": 1282} {"train_loss": -5.673313140869141, "global_step": 53876, "epoch": 1282} {"train_loss": -5.837603569030762, "global_step": 53877, "epoch": 1282} {"train_loss": -5.856856346130371, "global_step": 53878, "epoch": 1282} {"train_loss": -5.924497127532959, "global_step": 53879, "epoch": 1282} {"train_loss": -5.83925724029541, "global_step": 53880, "epoch": 1282} {"train_loss": -5.874515533447266, "global_step": 53881, "epoch": 1282} {"train_loss": -5.846540451049805, "global_step": 53882, "epoch": 1282} {"train_loss": -5.812511444091797, "global_step": 53883, "epoch": 1282} {"train_loss": -5.839098930358887, "global_step": 53884, "epoch": 1282} {"train_loss": -5.819021508807228, "global_step": 53885, "epoch": 1282, "val_loss": 73960.8671875} {"train_loss": -5.77168083190918, "global_step": 53886, "epoch": 1283} {"train_loss": -5.910163879394531, "global_step": 53887, "epoch": 1283} {"train_loss": -5.838508605957031, "global_step": 53888, "epoch": 1283} {"train_loss": -5.895511150360107, "global_step": 53889, "epoch": 1283} {"train_loss": -5.920278549194336, "global_step": 53890, "epoch": 1283} {"train_loss": -5.849518775939941, "global_step": 53891, "epoch": 1283} {"train_loss": -5.904574871063232, "global_step": 53892, "epoch": 1283} {"train_loss": -5.782159805297852, "global_step": 53893, "epoch": 1283} {"train_loss": -5.854221343994141, "global_step": 53894, "epoch": 1283} {"train_loss": -5.7835893630981445, "global_step": 53895, "epoch": 1283} {"train_loss": -5.763062477111816, "global_step": 53896, "epoch": 1283} {"train_loss": -5.913313865661621, "global_step": 53897, "epoch": 1283} {"train_loss": -5.775165557861328, "global_step": 53898, "epoch": 1283} {"train_loss": -5.797549247741699, "global_step": 53899, "epoch": 1283} {"train_loss": -5.675540924072266, "global_step": 53900, "epoch": 1283} {"train_loss": -5.728545188903809, "global_step": 53901, "epoch": 1283} {"train_loss": -5.70883846282959, "global_step": 53902, "epoch": 1283} {"train_loss": -5.644628047943115, "global_step": 53903, "epoch": 1283} {"train_loss": -5.8078413009643555, "global_step": 53904, "epoch": 1283} {"train_loss": -5.6242876052856445, "global_step": 53905, "epoch": 1283} {"train_loss": -5.844094276428223, "global_step": 53906, "epoch": 1283} {"train_loss": -5.678830623626709, "global_step": 53907, "epoch": 1283} {"train_loss": -5.680885314941406, "global_step": 53908, "epoch": 1283} {"train_loss": -5.935128211975098, "global_step": 53909, "epoch": 1283} {"train_loss": -5.731545448303223, "global_step": 53910, "epoch": 1283} {"train_loss": -5.826807975769043, "global_step": 53911, "epoch": 1283} {"train_loss": -5.619999885559082, "global_step": 53912, "epoch": 1283} {"train_loss": -5.748570442199707, "global_step": 53913, "epoch": 1283} {"train_loss": -5.598821640014648, "global_step": 53914, "epoch": 1283} {"train_loss": -5.752800941467285, "global_step": 53915, "epoch": 1283} {"train_loss": -5.817823886871338, "global_step": 53916, "epoch": 1283} {"train_loss": -5.981583118438721, "global_step": 53917, "epoch": 1283} {"train_loss": -5.756556510925293, "global_step": 53918, "epoch": 1283} {"train_loss": -5.63380241394043, "global_step": 53919, "epoch": 1283} {"train_loss": -5.738763809204102, "global_step": 53920, "epoch": 1283} {"train_loss": -5.718221664428711, "global_step": 53921, "epoch": 1283} {"train_loss": -5.831347942352295, "global_step": 53922, "epoch": 1283} {"train_loss": -5.78128719329834, "global_step": 53923, "epoch": 1283} {"train_loss": -5.705848693847656, "global_step": 53924, "epoch": 1283} {"train_loss": -5.652153015136719, "global_step": 53925, "epoch": 1283} {"train_loss": -5.736148357391357, "global_step": 53926, "epoch": 1283} {"train_loss": -5.774601993106661, "global_step": 53927, "epoch": 1283, "val_loss": 74448.4140625} {"train_loss": -5.786679744720459, "global_step": 53928, "epoch": 1284} {"train_loss": -5.69985294342041, "global_step": 53929, "epoch": 1284} {"train_loss": -5.713940620422363, "global_step": 53930, "epoch": 1284} {"train_loss": -5.868887901306152, "global_step": 53931, "epoch": 1284} {"train_loss": -5.883061408996582, "global_step": 53932, "epoch": 1284} {"train_loss": -5.706945419311523, "global_step": 53933, "epoch": 1284} {"train_loss": -5.661415100097656, "global_step": 53934, "epoch": 1284} {"train_loss": -5.732532501220703, "global_step": 53935, "epoch": 1284} {"train_loss": -5.863605976104736, "global_step": 53936, "epoch": 1284} {"train_loss": -5.678184509277344, "global_step": 53937, "epoch": 1284} {"train_loss": -5.774594306945801, "global_step": 53938, "epoch": 1284} {"train_loss": -5.842489242553711, "global_step": 53939, "epoch": 1284} {"train_loss": -5.683485984802246, "global_step": 53940, "epoch": 1284} {"train_loss": -5.774473667144775, "global_step": 53941, "epoch": 1284} {"train_loss": -5.8901824951171875, "global_step": 53942, "epoch": 1284} {"train_loss": -5.683870315551758, "global_step": 53943, "epoch": 1284} {"train_loss": -5.873350143432617, "global_step": 53944, "epoch": 1284} {"train_loss": -5.885274887084961, "global_step": 53945, "epoch": 1284} {"train_loss": -5.884294509887695, "global_step": 53946, "epoch": 1284} {"train_loss": -5.884305953979492, "global_step": 53947, "epoch": 1284} {"train_loss": -5.787022590637207, "global_step": 53948, "epoch": 1284} {"train_loss": -5.719504356384277, "global_step": 53949, "epoch": 1284} {"train_loss": -5.835628509521484, "global_step": 53950, "epoch": 1284} {"train_loss": -5.80537748336792, "global_step": 53951, "epoch": 1284} {"train_loss": -5.846868991851807, "global_step": 53952, "epoch": 1284} {"train_loss": -5.841485023498535, "global_step": 53953, "epoch": 1284} {"train_loss": -5.889101982116699, "global_step": 53954, "epoch": 1284} {"train_loss": -6.003607749938965, "global_step": 53955, "epoch": 1284} {"train_loss": -5.744289398193359, "global_step": 53956, "epoch": 1284} {"train_loss": -5.879129409790039, "global_step": 53957, "epoch": 1284} {"train_loss": -5.805682182312012, "global_step": 53958, "epoch": 1284} {"train_loss": -5.649712562561035, "global_step": 53959, "epoch": 1284} {"train_loss": -5.9007673263549805, "global_step": 53960, "epoch": 1284} {"train_loss": -5.770613670349121, "global_step": 53961, "epoch": 1284} {"train_loss": -5.774523735046387, "global_step": 53962, "epoch": 1284} {"train_loss": -5.838988304138184, "global_step": 53963, "epoch": 1284} {"train_loss": -5.780508041381836, "global_step": 53964, "epoch": 1284} {"train_loss": -5.783668041229248, "global_step": 53965, "epoch": 1284} {"train_loss": -5.870959758758545, "global_step": 53966, "epoch": 1284} {"train_loss": -5.623025417327881, "global_step": 53967, "epoch": 1284} {"train_loss": -5.901855945587158, "global_step": 53968, "epoch": 1284} {"train_loss": -5.799641393479847, "global_step": 53969, "epoch": 1284, "val_loss": 74586.4453125} {"train_loss": -5.765534400939941, "global_step": 53970, "epoch": 1285} {"train_loss": -5.862044811248779, "global_step": 53971, "epoch": 1285} {"train_loss": -5.736228942871094, "global_step": 53972, "epoch": 1285} {"train_loss": -5.915062427520752, "global_step": 53973, "epoch": 1285} {"train_loss": -5.7494025230407715, "global_step": 53974, "epoch": 1285} {"train_loss": -5.827493667602539, "global_step": 53975, "epoch": 1285} {"train_loss": -5.779026031494141, "global_step": 53976, "epoch": 1285} {"train_loss": -5.773422718048096, "global_step": 53977, "epoch": 1285} {"train_loss": -5.833072662353516, "global_step": 53978, "epoch": 1285} {"train_loss": -5.815881729125977, "global_step": 53979, "epoch": 1285} {"train_loss": -5.728660583496094, "global_step": 53980, "epoch": 1285} {"train_loss": -5.842562675476074, "global_step": 53981, "epoch": 1285} {"train_loss": -5.803897857666016, "global_step": 53982, "epoch": 1285} {"train_loss": -5.902818202972412, "global_step": 53983, "epoch": 1285} {"train_loss": -5.85600471496582, "global_step": 53984, "epoch": 1285} {"train_loss": -5.959612846374512, "global_step": 53985, "epoch": 1285} {"train_loss": -5.822451591491699, "global_step": 53986, "epoch": 1285} {"train_loss": -5.825909614562988, "global_step": 53987, "epoch": 1285} {"train_loss": -5.829697608947754, "global_step": 53988, "epoch": 1285} {"train_loss": -5.774763584136963, "global_step": 53989, "epoch": 1285} {"train_loss": -5.789277076721191, "global_step": 53990, "epoch": 1285} {"train_loss": -5.809883117675781, "global_step": 53991, "epoch": 1285} {"train_loss": -5.899614334106445, "global_step": 53992, "epoch": 1285} {"train_loss": -5.971085548400879, "global_step": 53993, "epoch": 1285} {"train_loss": -5.834347724914551, "global_step": 53994, "epoch": 1285} {"train_loss": -5.677237510681152, "global_step": 53995, "epoch": 1285} {"train_loss": -5.791351318359375, "global_step": 53996, "epoch": 1285} {"train_loss": -5.72166633605957, "global_step": 53997, "epoch": 1285} {"train_loss": -5.847944259643555, "global_step": 53998, "epoch": 1285} {"train_loss": -5.744997024536133, "global_step": 53999, "epoch": 1285} {"train_loss": -5.7803497314453125, "global_step": 54000, "epoch": 1285} {"train_loss": -5.721138954162598, "global_step": 54001, "epoch": 1285} {"train_loss": -5.652950286865234, "global_step": 54002, "epoch": 1285} {"train_loss": -5.755947589874268, "global_step": 54003, "epoch": 1285} {"train_loss": -5.985287666320801, "global_step": 54004, "epoch": 1285} {"train_loss": -5.746263027191162, "global_step": 54005, "epoch": 1285} {"train_loss": -5.850648880004883, "global_step": 54006, "epoch": 1285} {"train_loss": -5.833063125610352, "global_step": 54007, "epoch": 1285} {"train_loss": -5.882090091705322, "global_step": 54008, "epoch": 1285} {"train_loss": -5.861469268798828, "global_step": 54009, "epoch": 1285} {"train_loss": -5.873325824737549, "global_step": 54010, "epoch": 1285} {"train_loss": -5.814968688147409, "global_step": 54011, "epoch": 1285, "val_loss": 73851.7421875} {"train_loss": -5.963895797729492, "global_step": 54012, "epoch": 1286} {"train_loss": -5.816537857055664, "global_step": 54013, "epoch": 1286} {"train_loss": -5.869693756103516, "global_step": 54014, "epoch": 1286} {"train_loss": -5.8562726974487305, "global_step": 54015, "epoch": 1286} {"train_loss": -5.897821426391602, "global_step": 54016, "epoch": 1286} {"train_loss": -5.903134822845459, "global_step": 54017, "epoch": 1286} {"train_loss": -5.851173400878906, "global_step": 54018, "epoch": 1286} {"train_loss": -5.593895435333252, "global_step": 54019, "epoch": 1286} {"train_loss": -5.799283981323242, "global_step": 54020, "epoch": 1286} {"train_loss": -5.838022232055664, "global_step": 54021, "epoch": 1286} {"train_loss": -5.761302947998047, "global_step": 54022, "epoch": 1286} {"train_loss": -5.809684753417969, "global_step": 54023, "epoch": 1286} {"train_loss": -5.801272392272949, "global_step": 54024, "epoch": 1286} {"train_loss": -5.748916149139404, "global_step": 54025, "epoch": 1286} {"train_loss": -5.723772048950195, "global_step": 54026, "epoch": 1286} {"train_loss": -5.925279140472412, "global_step": 54027, "epoch": 1286} {"train_loss": -5.826031684875488, "global_step": 54028, "epoch": 1286} {"train_loss": -5.757069110870361, "global_step": 54029, "epoch": 1286} {"train_loss": -5.746189594268799, "global_step": 54030, "epoch": 1286} {"train_loss": -5.742453098297119, "global_step": 54031, "epoch": 1286} {"train_loss": -5.746057033538818, "global_step": 54032, "epoch": 1286} {"train_loss": -5.718981742858887, "global_step": 54033, "epoch": 1286} {"train_loss": -5.635394096374512, "global_step": 54034, "epoch": 1286} {"train_loss": -5.8436079025268555, "global_step": 54035, "epoch": 1286} {"train_loss": -5.778791427612305, "global_step": 54036, "epoch": 1286} {"train_loss": -5.79611349105835, "global_step": 54037, "epoch": 1286} {"train_loss": -5.86858606338501, "global_step": 54038, "epoch": 1286} {"train_loss": -5.815546035766602, "global_step": 54039, "epoch": 1286} {"train_loss": -5.782094955444336, "global_step": 54040, "epoch": 1286} {"train_loss": -5.665463447570801, "global_step": 54041, "epoch": 1286} {"train_loss": -5.839003562927246, "global_step": 54042, "epoch": 1286} {"train_loss": -5.906987190246582, "global_step": 54043, "epoch": 1286} {"train_loss": -5.726413726806641, "global_step": 54044, "epoch": 1286} {"train_loss": -5.795307159423828, "global_step": 54045, "epoch": 1286} {"train_loss": -5.892078399658203, "global_step": 54046, "epoch": 1286} {"train_loss": -5.861316680908203, "global_step": 54047, "epoch": 1286} {"train_loss": -5.803542137145996, "global_step": 54048, "epoch": 1286} {"train_loss": -5.915335178375244, "global_step": 54049, "epoch": 1286} {"train_loss": -5.749766826629639, "global_step": 54050, "epoch": 1286} {"train_loss": -5.807939529418945, "global_step": 54051, "epoch": 1286} {"train_loss": -5.865712642669678, "global_step": 54052, "epoch": 1286} {"train_loss": -5.807489304315476, "global_step": 54053, "epoch": 1286, "val_loss": 74217.453125} {"train_loss": -5.9017252922058105, "global_step": 54054, "epoch": 1287} {"train_loss": -5.8313164710998535, "global_step": 54055, "epoch": 1287} {"train_loss": -5.882514953613281, "global_step": 54056, "epoch": 1287} {"train_loss": -5.7260565757751465, "global_step": 54057, "epoch": 1287} {"train_loss": -5.918947219848633, "global_step": 54058, "epoch": 1287} {"train_loss": -5.7270894050598145, "global_step": 54059, "epoch": 1287} {"train_loss": -5.857306957244873, "global_step": 54060, "epoch": 1287} {"train_loss": -5.794064998626709, "global_step": 54061, "epoch": 1287} {"train_loss": -5.835378646850586, "global_step": 54062, "epoch": 1287} {"train_loss": -5.727318286895752, "global_step": 54063, "epoch": 1287} {"train_loss": -5.9150710105896, "global_step": 54064, "epoch": 1287} {"train_loss": -5.7569804191589355, "global_step": 54065, "epoch": 1287} {"train_loss": -5.886536598205566, "global_step": 54066, "epoch": 1287} {"train_loss": -5.829708099365234, "global_step": 54067, "epoch": 1287} {"train_loss": -5.768498420715332, "global_step": 54068, "epoch": 1287} {"train_loss": -5.7444257736206055, "global_step": 54069, "epoch": 1287} {"train_loss": -5.793962001800537, "global_step": 54070, "epoch": 1287} {"train_loss": -5.7580132484436035, "global_step": 54071, "epoch": 1287} {"train_loss": -5.708748817443848, "global_step": 54072, "epoch": 1287} {"train_loss": -5.64745569229126, "global_step": 54073, "epoch": 1287} {"train_loss": -5.874103546142578, "global_step": 54074, "epoch": 1287} {"train_loss": -5.778792381286621, "global_step": 54075, "epoch": 1287} {"train_loss": -5.677996635437012, "global_step": 54076, "epoch": 1287} {"train_loss": -5.860572814941406, "global_step": 54077, "epoch": 1287} {"train_loss": -5.831777095794678, "global_step": 54078, "epoch": 1287} {"train_loss": -5.816466808319092, "global_step": 54079, "epoch": 1287} {"train_loss": -5.786039352416992, "global_step": 54080, "epoch": 1287} {"train_loss": -5.573151588439941, "global_step": 54081, "epoch": 1287} {"train_loss": -5.761752605438232, "global_step": 54082, "epoch": 1287} {"train_loss": -5.768247604370117, "global_step": 54083, "epoch": 1287} {"train_loss": -5.787938117980957, "global_step": 54084, "epoch": 1287} {"train_loss": -5.683588027954102, "global_step": 54085, "epoch": 1287} {"train_loss": -5.796016216278076, "global_step": 54086, "epoch": 1287} {"train_loss": -5.661716461181641, "global_step": 54087, "epoch": 1287} {"train_loss": -5.85548210144043, "global_step": 54088, "epoch": 1287} {"train_loss": -5.741188049316406, "global_step": 54089, "epoch": 1287} {"train_loss": -5.7778096199035645, "global_step": 54090, "epoch": 1287} {"train_loss": -5.821542263031006, "global_step": 54091, "epoch": 1287} {"train_loss": -5.881876468658447, "global_step": 54092, "epoch": 1287} {"train_loss": -5.776111602783203, "global_step": 54093, "epoch": 1287} {"train_loss": -5.788660049438477, "global_step": 54094, "epoch": 1287} {"train_loss": -5.790278991063436, "global_step": 54095, "epoch": 1287, "val_loss": 74278.9921875} {"train_loss": -5.770843505859375, "global_step": 54096, "epoch": 1288} {"train_loss": -5.6739702224731445, "global_step": 54097, "epoch": 1288} {"train_loss": -5.76103401184082, "global_step": 54098, "epoch": 1288} {"train_loss": -5.703343391418457, "global_step": 54099, "epoch": 1288} {"train_loss": -5.88967227935791, "global_step": 54100, "epoch": 1288} {"train_loss": -5.820100784301758, "global_step": 54101, "epoch": 1288} {"train_loss": -5.764344215393066, "global_step": 54102, "epoch": 1288} {"train_loss": -5.925654411315918, "global_step": 54103, "epoch": 1288} {"train_loss": -5.719353675842285, "global_step": 54104, "epoch": 1288} {"train_loss": -5.799990653991699, "global_step": 54105, "epoch": 1288} {"train_loss": -5.787175178527832, "global_step": 54106, "epoch": 1288} {"train_loss": -5.832297325134277, "global_step": 54107, "epoch": 1288} {"train_loss": -5.920426368713379, "global_step": 54108, "epoch": 1288} {"train_loss": -5.947263240814209, "global_step": 54109, "epoch": 1288} {"train_loss": -5.823142051696777, "global_step": 54110, "epoch": 1288} {"train_loss": -5.878711700439453, "global_step": 54111, "epoch": 1288} {"train_loss": -5.893641948699951, "global_step": 54112, "epoch": 1288} {"train_loss": -5.8765869140625, "global_step": 54113, "epoch": 1288} {"train_loss": -5.872743606567383, "global_step": 54114, "epoch": 1288} {"train_loss": -5.8142619132995605, "global_step": 54115, "epoch": 1288} {"train_loss": -5.866369247436523, "global_step": 54116, "epoch": 1288} {"train_loss": -5.66763162612915, "global_step": 54117, "epoch": 1288} {"train_loss": -5.850965976715088, "global_step": 54118, "epoch": 1288} {"train_loss": -5.711426734924316, "global_step": 54119, "epoch": 1288} {"train_loss": -5.889128684997559, "global_step": 54120, "epoch": 1288} {"train_loss": -5.934277534484863, "global_step": 54121, "epoch": 1288} {"train_loss": -5.815518856048584, "global_step": 54122, "epoch": 1288} {"train_loss": -5.884903430938721, "global_step": 54123, "epoch": 1288} {"train_loss": -5.8207621574401855, "global_step": 54124, "epoch": 1288} {"train_loss": -5.8221235275268555, "global_step": 54125, "epoch": 1288} {"train_loss": -5.742649078369141, "global_step": 54126, "epoch": 1288} {"train_loss": -5.783336639404297, "global_step": 54127, "epoch": 1288} {"train_loss": -5.858048439025879, "global_step": 54128, "epoch": 1288} {"train_loss": -5.828231334686279, "global_step": 54129, "epoch": 1288} {"train_loss": -5.92784309387207, "global_step": 54130, "epoch": 1288} {"train_loss": -5.930995941162109, "global_step": 54131, "epoch": 1288} {"train_loss": -5.868562698364258, "global_step": 54132, "epoch": 1288} {"train_loss": -5.839679718017578, "global_step": 54133, "epoch": 1288} {"train_loss": -6.009501934051514, "global_step": 54134, "epoch": 1288} {"train_loss": -5.888138294219971, "global_step": 54135, "epoch": 1288} {"train_loss": -5.831901550292969, "global_step": 54136, "epoch": 1288} {"train_loss": -5.835804417019799, "global_step": 54137, "epoch": 1288, "val_loss": 74366.703125} {"train_loss": -5.8397016525268555, "global_step": 54138, "epoch": 1289} {"train_loss": -5.755862236022949, "global_step": 54139, "epoch": 1289} {"train_loss": -5.687396049499512, "global_step": 54140, "epoch": 1289} {"train_loss": -5.798537254333496, "global_step": 54141, "epoch": 1289} {"train_loss": -5.773284435272217, "global_step": 54142, "epoch": 1289} {"train_loss": -5.8824238777160645, "global_step": 54143, "epoch": 1289} {"train_loss": -5.788422107696533, "global_step": 54144, "epoch": 1289} {"train_loss": -5.754644393920898, "global_step": 54145, "epoch": 1289} {"train_loss": -5.765129089355469, "global_step": 54146, "epoch": 1289} {"train_loss": -5.82657527923584, "global_step": 54147, "epoch": 1289} {"train_loss": -5.8403825759887695, "global_step": 54148, "epoch": 1289} {"train_loss": -5.781454086303711, "global_step": 54149, "epoch": 1289} {"train_loss": -5.782233715057373, "global_step": 54150, "epoch": 1289} {"train_loss": -5.866324424743652, "global_step": 54151, "epoch": 1289} {"train_loss": -5.48595666885376, "global_step": 54152, "epoch": 1289} {"train_loss": -5.86668586730957, "global_step": 54153, "epoch": 1289} {"train_loss": -5.666801929473877, "global_step": 54154, "epoch": 1289} {"train_loss": -5.731550693511963, "global_step": 54155, "epoch": 1289} {"train_loss": -5.749833106994629, "global_step": 54156, "epoch": 1289} {"train_loss": -5.652745246887207, "global_step": 54157, "epoch": 1289} {"train_loss": -5.8174543380737305, "global_step": 54158, "epoch": 1289} {"train_loss": -5.671316146850586, "global_step": 54159, "epoch": 1289} {"train_loss": -5.747949600219727, "global_step": 54160, "epoch": 1289} {"train_loss": -5.820954322814941, "global_step": 54161, "epoch": 1289} {"train_loss": -5.757594108581543, "global_step": 54162, "epoch": 1289} {"train_loss": -5.748651504516602, "global_step": 54163, "epoch": 1289} {"train_loss": -5.737236022949219, "global_step": 54164, "epoch": 1289} {"train_loss": -5.759116172790527, "global_step": 54165, "epoch": 1289} {"train_loss": -5.715973854064941, "global_step": 54166, "epoch": 1289} {"train_loss": -5.815657615661621, "global_step": 54167, "epoch": 1289} {"train_loss": -5.765375137329102, "global_step": 54168, "epoch": 1289} {"train_loss": -5.710029602050781, "global_step": 54169, "epoch": 1289} {"train_loss": -5.994624137878418, "global_step": 54170, "epoch": 1289} {"train_loss": -5.695282936096191, "global_step": 54171, "epoch": 1289} {"train_loss": -5.921207427978516, "global_step": 54172, "epoch": 1289} {"train_loss": -5.76419734954834, "global_step": 54173, "epoch": 1289} {"train_loss": -5.717418670654297, "global_step": 54174, "epoch": 1289} {"train_loss": -5.734370708465576, "global_step": 54175, "epoch": 1289} {"train_loss": -5.696181297302246, "global_step": 54176, "epoch": 1289} {"train_loss": -5.822965145111084, "global_step": 54177, "epoch": 1289} {"train_loss": -5.96909236907959, "global_step": 54178, "epoch": 1289} {"train_loss": -5.774420590627761, "global_step": 54179, "epoch": 1289, "val_loss": 74288.515625} {"train_loss": -5.867765426635742, "global_step": 54180, "epoch": 1290} {"train_loss": -5.862846374511719, "global_step": 54181, "epoch": 1290} {"train_loss": -5.754294395446777, "global_step": 54182, "epoch": 1290} {"train_loss": -5.777990818023682, "global_step": 54183, "epoch": 1290} {"train_loss": -5.794437408447266, "global_step": 54184, "epoch": 1290} {"train_loss": -5.916591644287109, "global_step": 54185, "epoch": 1290} {"train_loss": -5.868917942047119, "global_step": 54186, "epoch": 1290} {"train_loss": -5.94606351852417, "global_step": 54187, "epoch": 1290} {"train_loss": -5.836302757263184, "global_step": 54188, "epoch": 1290} {"train_loss": -5.787900924682617, "global_step": 54189, "epoch": 1290} {"train_loss": -5.814205169677734, "global_step": 54190, "epoch": 1290} {"train_loss": -5.83820915222168, "global_step": 54191, "epoch": 1290} {"train_loss": -5.712969779968262, "global_step": 54192, "epoch": 1290} {"train_loss": -5.822018623352051, "global_step": 54193, "epoch": 1290} {"train_loss": -5.719585418701172, "global_step": 54194, "epoch": 1290} {"train_loss": -5.835538864135742, "global_step": 54195, "epoch": 1290} {"train_loss": -5.764181137084961, "global_step": 54196, "epoch": 1290} {"train_loss": -5.740724086761475, "global_step": 54197, "epoch": 1290} {"train_loss": -5.741432189941406, "global_step": 54198, "epoch": 1290} {"train_loss": -5.786774158477783, "global_step": 54199, "epoch": 1290} {"train_loss": -5.774290561676025, "global_step": 54200, "epoch": 1290} {"train_loss": -5.761688232421875, "global_step": 54201, "epoch": 1290} {"train_loss": -5.831681251525879, "global_step": 54202, "epoch": 1290} {"train_loss": -5.87027645111084, "global_step": 54203, "epoch": 1290} {"train_loss": -5.772948265075684, "global_step": 54204, "epoch": 1290} {"train_loss": -5.775523662567139, "global_step": 54205, "epoch": 1290} {"train_loss": -5.851570129394531, "global_step": 54206, "epoch": 1290} {"train_loss": -5.7714152336120605, "global_step": 54207, "epoch": 1290} {"train_loss": -5.896700859069824, "global_step": 54208, "epoch": 1290} {"train_loss": -5.811884880065918, "global_step": 54209, "epoch": 1290} {"train_loss": -5.7718915939331055, "global_step": 54210, "epoch": 1290} {"train_loss": -5.792527675628662, "global_step": 54211, "epoch": 1290} {"train_loss": -5.832331657409668, "global_step": 54212, "epoch": 1290} {"train_loss": -5.808114051818848, "global_step": 54213, "epoch": 1290} {"train_loss": -5.775909423828125, "global_step": 54214, "epoch": 1290} {"train_loss": -5.793196201324463, "global_step": 54215, "epoch": 1290} {"train_loss": -5.835166931152344, "global_step": 54216, "epoch": 1290} {"train_loss": -5.7101054191589355, "global_step": 54217, "epoch": 1290} {"train_loss": -5.8167266845703125, "global_step": 54218, "epoch": 1290} {"train_loss": -5.839271545410156, "global_step": 54219, "epoch": 1290} {"train_loss": -5.854959487915039, "global_step": 54220, "epoch": 1290} {"train_loss": -5.80698519661313, "global_step": 54221, "epoch": 1290, "val_loss": 74351.1875} {"train_loss": -5.815764427185059, "global_step": 54222, "epoch": 1291} {"train_loss": -5.958740711212158, "global_step": 54223, "epoch": 1291} {"train_loss": -5.92840576171875, "global_step": 54224, "epoch": 1291} {"train_loss": -5.8453521728515625, "global_step": 54225, "epoch": 1291} {"train_loss": -5.895134925842285, "global_step": 54226, "epoch": 1291} {"train_loss": -5.716917037963867, "global_step": 54227, "epoch": 1291} {"train_loss": -5.9137349128723145, "global_step": 54228, "epoch": 1291} {"train_loss": -5.747211456298828, "global_step": 54229, "epoch": 1291} {"train_loss": -5.760989189147949, "global_step": 54230, "epoch": 1291} {"train_loss": -5.800692081451416, "global_step": 54231, "epoch": 1291} {"train_loss": -5.826598167419434, "global_step": 54232, "epoch": 1291} {"train_loss": -6.0484819412231445, "global_step": 54233, "epoch": 1291} {"train_loss": -5.7672505378723145, "global_step": 54234, "epoch": 1291} {"train_loss": -5.833312034606934, "global_step": 54235, "epoch": 1291} {"train_loss": -5.830507278442383, "global_step": 54236, "epoch": 1291} {"train_loss": -5.753072738647461, "global_step": 54237, "epoch": 1291} {"train_loss": -5.737800598144531, "global_step": 54238, "epoch": 1291} {"train_loss": -5.817291259765625, "global_step": 54239, "epoch": 1291} {"train_loss": -5.7716064453125, "global_step": 54240, "epoch": 1291} {"train_loss": -5.841437816619873, "global_step": 54241, "epoch": 1291} {"train_loss": -5.859371185302734, "global_step": 54242, "epoch": 1291} {"train_loss": -5.75083065032959, "global_step": 54243, "epoch": 1291} {"train_loss": -5.676890850067139, "global_step": 54244, "epoch": 1291} {"train_loss": -5.783997058868408, "global_step": 54245, "epoch": 1291} {"train_loss": -5.847884178161621, "global_step": 54246, "epoch": 1291} {"train_loss": -5.631945610046387, "global_step": 54247, "epoch": 1291} {"train_loss": -5.906664848327637, "global_step": 54248, "epoch": 1291} {"train_loss": -5.770471572875977, "global_step": 54249, "epoch": 1291} {"train_loss": -5.854876518249512, "global_step": 54250, "epoch": 1291} {"train_loss": -5.720992565155029, "global_step": 54251, "epoch": 1291} {"train_loss": -5.832786560058594, "global_step": 54252, "epoch": 1291} {"train_loss": -5.813284873962402, "global_step": 54253, "epoch": 1291} {"train_loss": -5.865777969360352, "global_step": 54254, "epoch": 1291} {"train_loss": -5.850810527801514, "global_step": 54255, "epoch": 1291} {"train_loss": -5.86385440826416, "global_step": 54256, "epoch": 1291} {"train_loss": -5.840452671051025, "global_step": 54257, "epoch": 1291} {"train_loss": -5.883869171142578, "global_step": 54258, "epoch": 1291} {"train_loss": -5.909891128540039, "global_step": 54259, "epoch": 1291} {"train_loss": -5.812867164611816, "global_step": 54260, "epoch": 1291} {"train_loss": -5.889535903930664, "global_step": 54261, "epoch": 1291} {"train_loss": -5.8091816902160645, "global_step": 54262, "epoch": 1291} {"train_loss": -5.823419514156523, "global_step": 54263, "epoch": 1291, "val_loss": 74150.3828125} {"train_loss": -5.884634017944336, "global_step": 54264, "epoch": 1292} {"train_loss": -5.680683612823486, "global_step": 54265, "epoch": 1292} {"train_loss": -5.84809684753418, "global_step": 54266, "epoch": 1292} {"train_loss": -5.741543292999268, "global_step": 54267, "epoch": 1292} {"train_loss": -5.8943891525268555, "global_step": 54268, "epoch": 1292} {"train_loss": -5.8401594161987305, "global_step": 54269, "epoch": 1292} {"train_loss": -5.771461486816406, "global_step": 54270, "epoch": 1292} {"train_loss": -5.802690505981445, "global_step": 54271, "epoch": 1292} {"train_loss": -5.766656875610352, "global_step": 54272, "epoch": 1292} {"train_loss": -5.716222763061523, "global_step": 54273, "epoch": 1292} {"train_loss": -5.736309051513672, "global_step": 54274, "epoch": 1292} {"train_loss": -5.8665361404418945, "global_step": 54275, "epoch": 1292} {"train_loss": -5.929649829864502, "global_step": 54276, "epoch": 1292} {"train_loss": -5.804327964782715, "global_step": 54277, "epoch": 1292} {"train_loss": -5.773947715759277, "global_step": 54278, "epoch": 1292} {"train_loss": -5.756590366363525, "global_step": 54279, "epoch": 1292} {"train_loss": -5.838625907897949, "global_step": 54280, "epoch": 1292} {"train_loss": -5.85394287109375, "global_step": 54281, "epoch": 1292} {"train_loss": -5.8008832931518555, "global_step": 54282, "epoch": 1292} {"train_loss": -5.85472297668457, "global_step": 54283, "epoch": 1292} {"train_loss": -5.8949713706970215, "global_step": 54284, "epoch": 1292} {"train_loss": -5.816936016082764, "global_step": 54285, "epoch": 1292} {"train_loss": -5.89576530456543, "global_step": 54286, "epoch": 1292} {"train_loss": -5.919301509857178, "global_step": 54287, "epoch": 1292} {"train_loss": -5.886691093444824, "global_step": 54288, "epoch": 1292} {"train_loss": -5.844300270080566, "global_step": 54289, "epoch": 1292} {"train_loss": -5.810751438140869, "global_step": 54290, "epoch": 1292} {"train_loss": -5.922464370727539, "global_step": 54291, "epoch": 1292} {"train_loss": -5.80059814453125, "global_step": 54292, "epoch": 1292} {"train_loss": -5.787692546844482, "global_step": 54293, "epoch": 1292} {"train_loss": -5.8409318923950195, "global_step": 54294, "epoch": 1292} {"train_loss": -5.9398980140686035, "global_step": 54295, "epoch": 1292} {"train_loss": -5.907071113586426, "global_step": 54296, "epoch": 1292} {"train_loss": -5.885580062866211, "global_step": 54297, "epoch": 1292} {"train_loss": -5.7593183517456055, "global_step": 54298, "epoch": 1292} {"train_loss": -5.752620697021484, "global_step": 54299, "epoch": 1292} {"train_loss": -5.906824111938477, "global_step": 54300, "epoch": 1292} {"train_loss": -5.893923759460449, "global_step": 54301, "epoch": 1292} {"train_loss": -5.817988872528076, "global_step": 54302, "epoch": 1292} {"train_loss": -5.847574234008789, "global_step": 54303, "epoch": 1292} {"train_loss": -5.930086612701416, "global_step": 54304, "epoch": 1292} {"train_loss": -5.834520680563791, "global_step": 54305, "epoch": 1292, "val_loss": 74593.0859375} {"train_loss": -5.805667877197266, "global_step": 54306, "epoch": 1293} {"train_loss": -5.762259483337402, "global_step": 54307, "epoch": 1293} {"train_loss": -5.942934036254883, "global_step": 54308, "epoch": 1293} {"train_loss": -5.902232646942139, "global_step": 54309, "epoch": 1293} {"train_loss": -5.814330101013184, "global_step": 54310, "epoch": 1293} {"train_loss": -5.830690860748291, "global_step": 54311, "epoch": 1293} {"train_loss": -5.7460479736328125, "global_step": 54312, "epoch": 1293} {"train_loss": -5.933655738830566, "global_step": 54313, "epoch": 1293} {"train_loss": -5.724634170532227, "global_step": 54314, "epoch": 1293} {"train_loss": -5.913606643676758, "global_step": 54315, "epoch": 1293} {"train_loss": -5.783806800842285, "global_step": 54316, "epoch": 1293} {"train_loss": -5.856192588806152, "global_step": 54317, "epoch": 1293} {"train_loss": -5.7750420570373535, "global_step": 54318, "epoch": 1293} {"train_loss": -5.842990875244141, "global_step": 54319, "epoch": 1293} {"train_loss": -5.845349311828613, "global_step": 54320, "epoch": 1293} {"train_loss": -5.923373699188232, "global_step": 54321, "epoch": 1293} {"train_loss": -5.836490631103516, "global_step": 54322, "epoch": 1293} {"train_loss": -5.774163246154785, "global_step": 54323, "epoch": 1293} {"train_loss": -5.823127746582031, "global_step": 54324, "epoch": 1293} {"train_loss": -5.830772399902344, "global_step": 54325, "epoch": 1293} {"train_loss": -5.897419452667236, "global_step": 54326, "epoch": 1293} {"train_loss": -5.798830032348633, "global_step": 54327, "epoch": 1293} {"train_loss": -5.880734443664551, "global_step": 54328, "epoch": 1293} {"train_loss": -5.809737682342529, "global_step": 54329, "epoch": 1293} {"train_loss": -5.841510772705078, "global_step": 54330, "epoch": 1293} {"train_loss": -5.956906795501709, "global_step": 54331, "epoch": 1293} {"train_loss": -5.86743688583374, "global_step": 54332, "epoch": 1293} {"train_loss": -5.903966903686523, "global_step": 54333, "epoch": 1293} {"train_loss": -5.684293270111084, "global_step": 54334, "epoch": 1293} {"train_loss": -5.76157283782959, "global_step": 54335, "epoch": 1293} {"train_loss": -5.720494747161865, "global_step": 54336, "epoch": 1293} {"train_loss": -5.853714942932129, "global_step": 54337, "epoch": 1293} {"train_loss": -5.866164207458496, "global_step": 54338, "epoch": 1293} {"train_loss": -5.681191444396973, "global_step": 54339, "epoch": 1293} {"train_loss": -5.7816162109375, "global_step": 54340, "epoch": 1293} {"train_loss": -5.645641326904297, "global_step": 54341, "epoch": 1293} {"train_loss": -5.795630931854248, "global_step": 54342, "epoch": 1293} {"train_loss": -5.793225288391113, "global_step": 54343, "epoch": 1293} {"train_loss": -5.670554161071777, "global_step": 54344, "epoch": 1293} {"train_loss": -5.805594444274902, "global_step": 54345, "epoch": 1293} {"train_loss": -5.840381622314453, "global_step": 54346, "epoch": 1293} {"train_loss": -5.817204066685268, "global_step": 54347, "epoch": 1293, "val_loss": 74486.640625} {"train_loss": -5.880186080932617, "global_step": 54348, "epoch": 1294} {"train_loss": -5.730813503265381, "global_step": 54349, "epoch": 1294} {"train_loss": -5.747066020965576, "global_step": 54350, "epoch": 1294} {"train_loss": -5.82475471496582, "global_step": 54351, "epoch": 1294} {"train_loss": -5.733096122741699, "global_step": 54352, "epoch": 1294} {"train_loss": -5.844947814941406, "global_step": 54353, "epoch": 1294} {"train_loss": -5.9319353103637695, "global_step": 54354, "epoch": 1294} {"train_loss": -5.828123092651367, "global_step": 54355, "epoch": 1294} {"train_loss": -5.844280242919922, "global_step": 54356, "epoch": 1294} {"train_loss": -5.664751052856445, "global_step": 54357, "epoch": 1294} {"train_loss": -5.904924392700195, "global_step": 54358, "epoch": 1294} {"train_loss": -5.7855939865112305, "global_step": 54359, "epoch": 1294} {"train_loss": -5.948570251464844, "global_step": 54360, "epoch": 1294} {"train_loss": -5.806022644042969, "global_step": 54361, "epoch": 1294} {"train_loss": -5.82220983505249, "global_step": 54362, "epoch": 1294} {"train_loss": -5.820680618286133, "global_step": 54363, "epoch": 1294} {"train_loss": -5.768301010131836, "global_step": 54364, "epoch": 1294} {"train_loss": -5.83359432220459, "global_step": 54365, "epoch": 1294} {"train_loss": -5.732537269592285, "global_step": 54366, "epoch": 1294} {"train_loss": -5.815877914428711, "global_step": 54367, "epoch": 1294} {"train_loss": -5.870263576507568, "global_step": 54368, "epoch": 1294} {"train_loss": -5.905576705932617, "global_step": 54369, "epoch": 1294} {"train_loss": -5.73972225189209, "global_step": 54370, "epoch": 1294} {"train_loss": -5.801161766052246, "global_step": 54371, "epoch": 1294} {"train_loss": -5.709324836730957, "global_step": 54372, "epoch": 1294} {"train_loss": -6.0040693283081055, "global_step": 54373, "epoch": 1294} {"train_loss": -5.79619836807251, "global_step": 54374, "epoch": 1294} {"train_loss": -5.615658760070801, "global_step": 54375, "epoch": 1294} {"train_loss": -5.749042510986328, "global_step": 54376, "epoch": 1294} {"train_loss": -5.844503402709961, "global_step": 54377, "epoch": 1294} {"train_loss": -5.739063262939453, "global_step": 54378, "epoch": 1294} {"train_loss": -5.73223876953125, "global_step": 54379, "epoch": 1294} {"train_loss": -5.810239791870117, "global_step": 54380, "epoch": 1294} {"train_loss": -5.824261665344238, "global_step": 54381, "epoch": 1294} {"train_loss": -5.82405948638916, "global_step": 54382, "epoch": 1294} {"train_loss": -5.835492134094238, "global_step": 54383, "epoch": 1294} {"train_loss": -5.810671806335449, "global_step": 54384, "epoch": 1294} {"train_loss": -5.8411760330200195, "global_step": 54385, "epoch": 1294} {"train_loss": -5.828197479248047, "global_step": 54386, "epoch": 1294} {"train_loss": -5.792470455169678, "global_step": 54387, "epoch": 1294} {"train_loss": -5.868152141571045, "global_step": 54388, "epoch": 1294} {"train_loss": -5.80837326958066, "global_step": 54389, "epoch": 1294, "val_loss": 74361.0546875} {"train_loss": -5.754932403564453, "global_step": 54390, "epoch": 1295} {"train_loss": -5.811150074005127, "global_step": 54391, "epoch": 1295} {"train_loss": -5.955139636993408, "global_step": 54392, "epoch": 1295} {"train_loss": -5.804278373718262, "global_step": 54393, "epoch": 1295} {"train_loss": -5.858798980712891, "global_step": 54394, "epoch": 1295} {"train_loss": -5.896808624267578, "global_step": 54395, "epoch": 1295} {"train_loss": -5.833759307861328, "global_step": 54396, "epoch": 1295} {"train_loss": -5.836158275604248, "global_step": 54397, "epoch": 1295} {"train_loss": -5.776772499084473, "global_step": 54398, "epoch": 1295} {"train_loss": -5.752554416656494, "global_step": 54399, "epoch": 1295} {"train_loss": -5.847967624664307, "global_step": 54400, "epoch": 1295} {"train_loss": -5.9117631912231445, "global_step": 54401, "epoch": 1295} {"train_loss": -5.774488925933838, "global_step": 54402, "epoch": 1295} {"train_loss": -5.8017897605896, "global_step": 54403, "epoch": 1295} {"train_loss": -5.670372009277344, "global_step": 54404, "epoch": 1295} {"train_loss": -5.852593421936035, "global_step": 54405, "epoch": 1295} {"train_loss": -5.880017280578613, "global_step": 54406, "epoch": 1295} {"train_loss": -5.756844520568848, "global_step": 54407, "epoch": 1295} {"train_loss": -5.928384780883789, "global_step": 54408, "epoch": 1295} {"train_loss": -5.860616683959961, "global_step": 54409, "epoch": 1295} {"train_loss": -5.739903450012207, "global_step": 54410, "epoch": 1295} {"train_loss": -5.903476238250732, "global_step": 54411, "epoch": 1295} {"train_loss": -5.775153636932373, "global_step": 54412, "epoch": 1295} {"train_loss": -5.712587833404541, "global_step": 54413, "epoch": 1295} {"train_loss": -5.753562927246094, "global_step": 54414, "epoch": 1295} {"train_loss": -5.723296165466309, "global_step": 54415, "epoch": 1295} {"train_loss": -5.757678031921387, "global_step": 54416, "epoch": 1295} {"train_loss": -5.819100379943848, "global_step": 54417, "epoch": 1295} {"train_loss": -5.8053998947143555, "global_step": 54418, "epoch": 1295} {"train_loss": -5.7378435134887695, "global_step": 54419, "epoch": 1295} {"train_loss": -5.7990570068359375, "global_step": 54420, "epoch": 1295} {"train_loss": -5.627635478973389, "global_step": 54421, "epoch": 1295} {"train_loss": -5.8371992111206055, "global_step": 54422, "epoch": 1295} {"train_loss": -5.954936981201172, "global_step": 54423, "epoch": 1295} {"train_loss": -5.887770652770996, "global_step": 54424, "epoch": 1295} {"train_loss": -5.836843490600586, "global_step": 54425, "epoch": 1295} {"train_loss": -5.730298042297363, "global_step": 54426, "epoch": 1295} {"train_loss": -5.837550640106201, "global_step": 54427, "epoch": 1295} {"train_loss": -5.804142951965332, "global_step": 54428, "epoch": 1295} {"train_loss": -5.881811618804932, "global_step": 54429, "epoch": 1295} {"train_loss": -5.80295467376709, "global_step": 54430, "epoch": 1295} {"train_loss": -5.810322818301973, "global_step": 54431, "epoch": 1295, "val_loss": 74191.078125} {"train_loss": -6.010341644287109, "global_step": 54432, "epoch": 1296} {"train_loss": -5.875156402587891, "global_step": 54433, "epoch": 1296} {"train_loss": -5.852799415588379, "global_step": 54434, "epoch": 1296} {"train_loss": -5.911808967590332, "global_step": 54435, "epoch": 1296} {"train_loss": -5.96890115737915, "global_step": 54436, "epoch": 1296} {"train_loss": -5.889013290405273, "global_step": 54437, "epoch": 1296} {"train_loss": -5.915075302124023, "global_step": 54438, "epoch": 1296} {"train_loss": -5.966115951538086, "global_step": 54439, "epoch": 1296} {"train_loss": -5.850285530090332, "global_step": 54440, "epoch": 1296} {"train_loss": -5.825667381286621, "global_step": 54441, "epoch": 1296} {"train_loss": -5.8533806800842285, "global_step": 54442, "epoch": 1296} {"train_loss": -5.814822196960449, "global_step": 54443, "epoch": 1296} {"train_loss": -5.840934753417969, "global_step": 54444, "epoch": 1296} {"train_loss": -5.761277198791504, "global_step": 54445, "epoch": 1296} {"train_loss": -5.776487827301025, "global_step": 54446, "epoch": 1296} {"train_loss": -5.870718002319336, "global_step": 54447, "epoch": 1296} {"train_loss": -5.907679557800293, "global_step": 54448, "epoch": 1296} {"train_loss": -5.855452537536621, "global_step": 54449, "epoch": 1296} {"train_loss": -5.906150817871094, "global_step": 54450, "epoch": 1296} {"train_loss": -5.788557052612305, "global_step": 54451, "epoch": 1296} {"train_loss": -5.896052360534668, "global_step": 54452, "epoch": 1296} {"train_loss": -5.771872520446777, "global_step": 54453, "epoch": 1296} {"train_loss": -5.837942600250244, "global_step": 54454, "epoch": 1296} {"train_loss": -5.8240861892700195, "global_step": 54455, "epoch": 1296} {"train_loss": -5.770628929138184, "global_step": 54456, "epoch": 1296} {"train_loss": -5.858973026275635, "global_step": 54457, "epoch": 1296} {"train_loss": -5.775121688842773, "global_step": 54458, "epoch": 1296} {"train_loss": -5.8584089279174805, "global_step": 54459, "epoch": 1296} {"train_loss": -5.859422206878662, "global_step": 54460, "epoch": 1296} {"train_loss": -5.819779396057129, "global_step": 54461, "epoch": 1296} {"train_loss": -5.737990379333496, "global_step": 54462, "epoch": 1296} {"train_loss": -5.842181205749512, "global_step": 54463, "epoch": 1296} {"train_loss": -5.818904876708984, "global_step": 54464, "epoch": 1296} {"train_loss": -5.8990936279296875, "global_step": 54465, "epoch": 1296} {"train_loss": -5.763169288635254, "global_step": 54466, "epoch": 1296} {"train_loss": -5.939866065979004, "global_step": 54467, "epoch": 1296} {"train_loss": -5.806966304779053, "global_step": 54468, "epoch": 1296} {"train_loss": -5.7536492347717285, "global_step": 54469, "epoch": 1296} {"train_loss": -5.783848762512207, "global_step": 54470, "epoch": 1296} {"train_loss": -5.795952796936035, "global_step": 54471, "epoch": 1296} {"train_loss": -5.836983680725098, "global_step": 54472, "epoch": 1296} {"train_loss": -5.844921509424846, "global_step": 54473, "epoch": 1296, "val_loss": 74481.96875} {"train_loss": -5.889657974243164, "global_step": 54474, "epoch": 1297} {"train_loss": -5.8015313148498535, "global_step": 54475, "epoch": 1297} {"train_loss": -5.902191638946533, "global_step": 54476, "epoch": 1297} {"train_loss": -5.770625591278076, "global_step": 54477, "epoch": 1297} {"train_loss": -5.912545204162598, "global_step": 54478, "epoch": 1297} {"train_loss": -5.849881649017334, "global_step": 54479, "epoch": 1297} {"train_loss": -5.841041088104248, "global_step": 54480, "epoch": 1297} {"train_loss": -5.737643241882324, "global_step": 54481, "epoch": 1297} {"train_loss": -5.851093292236328, "global_step": 54482, "epoch": 1297} {"train_loss": -5.822861194610596, "global_step": 54483, "epoch": 1297} {"train_loss": -5.685271263122559, "global_step": 54484, "epoch": 1297} {"train_loss": -5.882672309875488, "global_step": 54485, "epoch": 1297} {"train_loss": -5.847291946411133, "global_step": 54486, "epoch": 1297} {"train_loss": -5.901926040649414, "global_step": 54487, "epoch": 1297} {"train_loss": -5.866237640380859, "global_step": 54488, "epoch": 1297} {"train_loss": -5.865190029144287, "global_step": 54489, "epoch": 1297} {"train_loss": -5.861317157745361, "global_step": 54490, "epoch": 1297} {"train_loss": -5.887899398803711, "global_step": 54491, "epoch": 1297} {"train_loss": -5.84427547454834, "global_step": 54492, "epoch": 1297} {"train_loss": -5.851787567138672, "global_step": 54493, "epoch": 1297} {"train_loss": -5.790843963623047, "global_step": 54494, "epoch": 1297} {"train_loss": -5.796666145324707, "global_step": 54495, "epoch": 1297} {"train_loss": -5.764667987823486, "global_step": 54496, "epoch": 1297} {"train_loss": -5.806967735290527, "global_step": 54497, "epoch": 1297} {"train_loss": -5.80703067779541, "global_step": 54498, "epoch": 1297} {"train_loss": -5.941291809082031, "global_step": 54499, "epoch": 1297} {"train_loss": -5.788752555847168, "global_step": 54500, "epoch": 1297} {"train_loss": -5.87257194519043, "global_step": 54501, "epoch": 1297} {"train_loss": -5.98311710357666, "global_step": 54502, "epoch": 1297} {"train_loss": -5.879881381988525, "global_step": 54503, "epoch": 1297} {"train_loss": -5.876314640045166, "global_step": 54504, "epoch": 1297} {"train_loss": -5.727416038513184, "global_step": 54505, "epoch": 1297} {"train_loss": -5.852248191833496, "global_step": 54506, "epoch": 1297} {"train_loss": -5.801982402801514, "global_step": 54507, "epoch": 1297} {"train_loss": -5.808039665222168, "global_step": 54508, "epoch": 1297} {"train_loss": -5.753678321838379, "global_step": 54509, "epoch": 1297} {"train_loss": -5.746885299682617, "global_step": 54510, "epoch": 1297} {"train_loss": -5.9414873123168945, "global_step": 54511, "epoch": 1297} {"train_loss": -5.713187217712402, "global_step": 54512, "epoch": 1297} {"train_loss": -5.690690040588379, "global_step": 54513, "epoch": 1297} {"train_loss": -5.7664971351623535, "global_step": 54514, "epoch": 1297} {"train_loss": -5.826961358388265, "global_step": 54515, "epoch": 1297, "val_loss": 74318.921875} {"train_loss": -5.799532890319824, "global_step": 54516, "epoch": 1298} {"train_loss": -5.624300479888916, "global_step": 54517, "epoch": 1298} {"train_loss": -5.744063377380371, "global_step": 54518, "epoch": 1298} {"train_loss": -5.833003044128418, "global_step": 54519, "epoch": 1298} {"train_loss": -5.8127946853637695, "global_step": 54520, "epoch": 1298} {"train_loss": -5.784711837768555, "global_step": 54521, "epoch": 1298} {"train_loss": -5.913091659545898, "global_step": 54522, "epoch": 1298} {"train_loss": -5.771618366241455, "global_step": 54523, "epoch": 1298} {"train_loss": -5.767813205718994, "global_step": 54524, "epoch": 1298} {"train_loss": -5.710124969482422, "global_step": 54525, "epoch": 1298} {"train_loss": -5.846945762634277, "global_step": 54526, "epoch": 1298} {"train_loss": -5.7313642501831055, "global_step": 54527, "epoch": 1298} {"train_loss": -5.7699713706970215, "global_step": 54528, "epoch": 1298} {"train_loss": -5.801536560058594, "global_step": 54529, "epoch": 1298} {"train_loss": -5.813747406005859, "global_step": 54530, "epoch": 1298} {"train_loss": -5.802038192749023, "global_step": 54531, "epoch": 1298} {"train_loss": -5.786706924438477, "global_step": 54532, "epoch": 1298} {"train_loss": -5.852485656738281, "global_step": 54533, "epoch": 1298} {"train_loss": -5.716973304748535, "global_step": 54534, "epoch": 1298} {"train_loss": -5.685155391693115, "global_step": 54535, "epoch": 1298} {"train_loss": -5.912092685699463, "global_step": 54536, "epoch": 1298} {"train_loss": -5.814818382263184, "global_step": 54537, "epoch": 1298} {"train_loss": -5.820710182189941, "global_step": 54538, "epoch": 1298} {"train_loss": -5.912657737731934, "global_step": 54539, "epoch": 1298} {"train_loss": -5.927957534790039, "global_step": 54540, "epoch": 1298} {"train_loss": -5.81599760055542, "global_step": 54541, "epoch": 1298} {"train_loss": -5.949030876159668, "global_step": 54542, "epoch": 1298} {"train_loss": -5.876437187194824, "global_step": 54543, "epoch": 1298} {"train_loss": -5.784595489501953, "global_step": 54544, "epoch": 1298} {"train_loss": -5.782960891723633, "global_step": 54545, "epoch": 1298} {"train_loss": -5.7373127937316895, "global_step": 54546, "epoch": 1298} {"train_loss": -5.922913074493408, "global_step": 54547, "epoch": 1298} {"train_loss": -5.765778541564941, "global_step": 54548, "epoch": 1298} {"train_loss": -5.890528678894043, "global_step": 54549, "epoch": 1298} {"train_loss": -5.789248466491699, "global_step": 54550, "epoch": 1298} {"train_loss": -5.74547004699707, "global_step": 54551, "epoch": 1298} {"train_loss": -5.871347427368164, "global_step": 54552, "epoch": 1298} {"train_loss": -5.913895606994629, "global_step": 54553, "epoch": 1298} {"train_loss": -6.005265235900879, "global_step": 54554, "epoch": 1298} {"train_loss": -5.810335636138916, "global_step": 54555, "epoch": 1298} {"train_loss": -5.89251708984375, "global_step": 54556, "epoch": 1298} {"train_loss": -5.8153679597945445, "global_step": 54557, "epoch": 1298, "val_loss": 74383.7890625} {"train_loss": -5.9349045753479, "global_step": 54558, "epoch": 1299} {"train_loss": -5.835675239562988, "global_step": 54559, "epoch": 1299} {"train_loss": -5.753906726837158, "global_step": 54560, "epoch": 1299} {"train_loss": -5.969645023345947, "global_step": 54561, "epoch": 1299} {"train_loss": -5.7402215003967285, "global_step": 54562, "epoch": 1299} {"train_loss": -5.607422351837158, "global_step": 54563, "epoch": 1299} {"train_loss": -5.884224891662598, "global_step": 54564, "epoch": 1299} {"train_loss": -5.761333465576172, "global_step": 54565, "epoch": 1299} {"train_loss": -5.828817367553711, "global_step": 54566, "epoch": 1299} {"train_loss": -5.685819625854492, "global_step": 54567, "epoch": 1299} {"train_loss": -5.826004981994629, "global_step": 54568, "epoch": 1299} {"train_loss": -6.00534725189209, "global_step": 54569, "epoch": 1299} {"train_loss": -5.7935471534729, "global_step": 54570, "epoch": 1299} {"train_loss": -5.877067565917969, "global_step": 54571, "epoch": 1299} {"train_loss": -5.90376091003418, "global_step": 54572, "epoch": 1299} {"train_loss": -5.885140419006348, "global_step": 54573, "epoch": 1299} {"train_loss": -5.860956192016602, "global_step": 54574, "epoch": 1299} {"train_loss": -5.810598373413086, "global_step": 54575, "epoch": 1299} {"train_loss": -5.899614334106445, "global_step": 54576, "epoch": 1299} {"train_loss": -5.792928695678711, "global_step": 54577, "epoch": 1299} {"train_loss": -5.844071388244629, "global_step": 54578, "epoch": 1299} {"train_loss": -5.908716201782227, "global_step": 54579, "epoch": 1299} {"train_loss": -5.698060035705566, "global_step": 54580, "epoch": 1299} {"train_loss": -5.919707298278809, "global_step": 54581, "epoch": 1299} {"train_loss": -5.824901580810547, "global_step": 54582, "epoch": 1299} {"train_loss": -5.788907051086426, "global_step": 54583, "epoch": 1299} {"train_loss": -5.894038200378418, "global_step": 54584, "epoch": 1299} {"train_loss": -5.773189544677734, "global_step": 54585, "epoch": 1299} {"train_loss": -5.753129005432129, "global_step": 54586, "epoch": 1299} {"train_loss": -5.864756107330322, "global_step": 54587, "epoch": 1299} {"train_loss": -5.8645429611206055, "global_step": 54588, "epoch": 1299} {"train_loss": -5.79022216796875, "global_step": 54589, "epoch": 1299} {"train_loss": -5.748382091522217, "global_step": 54590, "epoch": 1299} {"train_loss": -5.819669723510742, "global_step": 54591, "epoch": 1299} {"train_loss": -5.853409290313721, "global_step": 54592, "epoch": 1299} {"train_loss": -5.768308639526367, "global_step": 54593, "epoch": 1299} {"train_loss": -5.790533065795898, "global_step": 54594, "epoch": 1299} {"train_loss": -5.873007297515869, "global_step": 54595, "epoch": 1299} {"train_loss": -5.767755508422852, "global_step": 54596, "epoch": 1299} {"train_loss": -5.719794273376465, "global_step": 54597, "epoch": 1299} {"train_loss": -5.971922874450684, "global_step": 54598, "epoch": 1299} {"train_loss": -5.8268854050409224, "global_step": 54599, "epoch": 1299, "val_loss": 74185.953125} {"train_loss": -5.887472629547119, "global_step": 54600, "epoch": 1300} {"train_loss": -5.92861270904541, "global_step": 54601, "epoch": 1300} {"train_loss": -5.78616189956665, "global_step": 54602, "epoch": 1300} {"train_loss": -5.831473350524902, "global_step": 54603, "epoch": 1300} {"train_loss": -5.738324165344238, "global_step": 54604, "epoch": 1300} {"train_loss": -5.899434566497803, "global_step": 54605, "epoch": 1300} {"train_loss": -5.744884490966797, "global_step": 54606, "epoch": 1300} {"train_loss": -5.75390625, "global_step": 54607, "epoch": 1300} {"train_loss": -5.816229343414307, "global_step": 54608, "epoch": 1300} {"train_loss": -5.776113510131836, "global_step": 54609, "epoch": 1300} {"train_loss": -5.826693534851074, "global_step": 54610, "epoch": 1300} {"train_loss": -5.891730308532715, "global_step": 54611, "epoch": 1300} {"train_loss": -5.88395357131958, "global_step": 54612, "epoch": 1300} {"train_loss": -5.806027412414551, "global_step": 54613, "epoch": 1300} {"train_loss": -5.794341087341309, "global_step": 54614, "epoch": 1300} {"train_loss": -5.821193695068359, "global_step": 54615, "epoch": 1300} {"train_loss": -5.924007892608643, "global_step": 54616, "epoch": 1300} {"train_loss": -5.8979034423828125, "global_step": 54617, "epoch": 1300} {"train_loss": -5.788870811462402, "global_step": 54618, "epoch": 1300} {"train_loss": -5.722740173339844, "global_step": 54619, "epoch": 1300} {"train_loss": -5.9639410972595215, "global_step": 54620, "epoch": 1300} {"train_loss": -5.973549842834473, "global_step": 54621, "epoch": 1300} {"train_loss": -5.921442031860352, "global_step": 54622, "epoch": 1300} {"train_loss": -5.750129699707031, "global_step": 54623, "epoch": 1300} {"train_loss": -5.933257102966309, "global_step": 54624, "epoch": 1300} {"train_loss": -5.981231689453125, "global_step": 54625, "epoch": 1300} {"train_loss": -5.860856533050537, "global_step": 54626, "epoch": 1300} {"train_loss": -5.839567184448242, "global_step": 54627, "epoch": 1300} {"train_loss": -5.798708915710449, "global_step": 54628, "epoch": 1300} {"train_loss": -5.949746131896973, "global_step": 54629, "epoch": 1300} {"train_loss": -5.8020172119140625, "global_step": 54630, "epoch": 1300} {"train_loss": -5.801881790161133, "global_step": 54631, "epoch": 1300} {"train_loss": -5.864617347717285, "global_step": 54632, "epoch": 1300} {"train_loss": -5.728935241699219, "global_step": 54633, "epoch": 1300} {"train_loss": -5.731897354125977, "global_step": 54634, "epoch": 1300} {"train_loss": -5.758440971374512, "global_step": 54635, "epoch": 1300} {"train_loss": -5.857423305511475, "global_step": 54636, "epoch": 1300} {"train_loss": -5.853460311889648, "global_step": 54637, "epoch": 1300} {"train_loss": -5.848467826843262, "global_step": 54638, "epoch": 1300} {"train_loss": -5.784923553466797, "global_step": 54639, "epoch": 1300} {"train_loss": -5.927168369293213, "global_step": 54640, "epoch": 1300} {"train_loss": -5.839534566515968, "global_step": 54641, "epoch": 1300, "train/sim_max_reward_0": 0.41987754028793633, "train/sim_max_reward_1": 0.8577880552537903, "train/sim_max_reward_2": 0.6214802711454889, "train/sim_max_reward_3": 0.15716848129268135, "train/sim_max_reward_4": 0.3571515091011566, "train/sim_max_reward_5": 0.5572292716367394, "test/sim_max_reward_4500000": 0.34155533942112354, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.5572029974398982, "test/sim_max_reward_4500003": 0.8891931201214248, "test/sim_max_reward_4500004": 0.05957316553773981, "test/sim_max_reward_4500005": 0.9643928115030737, "test/sim_max_reward_4500006": 0.6302498114258736, "test/sim_max_reward_4500007": 0.4964434381426772, "test/sim_max_reward_4500008": 0.15339725272816054, "test/sim_max_reward_4500009": 0.7913033996182156, "test/sim_max_reward_4500010": 0.9338105821429858, "test/sim_max_reward_4500011": 0.3044197653011636, "test/sim_max_reward_4500012": 0.3300611925754333, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.36844243946177374, "test/sim_max_reward_4500015": 0.958745488105699, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.045613632157952624, "test/sim_max_reward_4500018": 0.5319842751869968, "test/sim_max_reward_4500019": 0.494891482616643, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9514629506606151, "test/sim_max_reward_4500022": 0.7650281542417908, "test/sim_max_reward_4500023": 0.8835895694296702, "test/sim_max_reward_4500024": 0.307196254722733, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.13522760353809382, "test/sim_max_reward_4500027": 0.754023157910257, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.13568527629942198, "test/sim_max_reward_4500030": 0.8887799929327568, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.43339577127661594, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.6860005690771233, "test/sim_max_reward_4500035": 0.6692022952645212, "test/sim_max_reward_4500036": 0.3638755405598461, "test/sim_max_reward_4500037": 0.8941011234028032, "test/sim_max_reward_4500038": 0.3227747901223859, "test/sim_max_reward_4500039": 0.4914042131161362, "test/sim_max_reward_4500040": 0.8963818299099151, "test/sim_max_reward_4500041": 0.8265959129365101, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.8397573599285637, "test/sim_max_reward_4500044": 0.05613865772089219, "test/sim_max_reward_4500045": 0.15076063963991898, "test/sim_max_reward_4500046": 0.2949802225513107, "test/sim_max_reward_4500047": 0.9184343748619355, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.8757586057080942, "train/mean_score": 0.4951158547862988, "test/mean_score": 0.4519535960423452, "val_loss": 74340.140625} {"train_loss": -5.80733060836792, "global_step": 54642, "epoch": 1301} {"train_loss": -5.786076545715332, "global_step": 54643, "epoch": 1301} {"train_loss": -5.803798198699951, "global_step": 54644, "epoch": 1301} {"train_loss": -5.824699401855469, "global_step": 54645, "epoch": 1301} {"train_loss": -5.691646575927734, "global_step": 54646, "epoch": 1301} {"train_loss": -5.771999359130859, "global_step": 54647, "epoch": 1301} {"train_loss": -5.793356418609619, "global_step": 54648, "epoch": 1301} {"train_loss": -5.753565788269043, "global_step": 54649, "epoch": 1301} {"train_loss": -5.791133880615234, "global_step": 54650, "epoch": 1301} {"train_loss": -5.817510604858398, "global_step": 54651, "epoch": 1301} {"train_loss": -5.750162124633789, "global_step": 54652, "epoch": 1301} {"train_loss": -5.841257572174072, "global_step": 54653, "epoch": 1301} {"train_loss": -5.6536335945129395, "global_step": 54654, "epoch": 1301} {"train_loss": -5.811318397521973, "global_step": 54655, "epoch": 1301} {"train_loss": -5.760891914367676, "global_step": 54656, "epoch": 1301} {"train_loss": -5.881032943725586, "global_step": 54657, "epoch": 1301} {"train_loss": -5.745913028717041, "global_step": 54658, "epoch": 1301} {"train_loss": -5.8741021156311035, "global_step": 54659, "epoch": 1301} {"train_loss": -5.800209999084473, "global_step": 54660, "epoch": 1301} {"train_loss": -5.744446754455566, "global_step": 54661, "epoch": 1301} {"train_loss": -5.693571090698242, "global_step": 54662, "epoch": 1301} {"train_loss": -5.78048038482666, "global_step": 54663, "epoch": 1301} {"train_loss": -5.742103576660156, "global_step": 54664, "epoch": 1301} {"train_loss": -5.731670379638672, "global_step": 54665, "epoch": 1301} {"train_loss": -5.839249610900879, "global_step": 54666, "epoch": 1301} {"train_loss": -5.89377498626709, "global_step": 54667, "epoch": 1301} {"train_loss": -5.813785076141357, "global_step": 54668, "epoch": 1301} {"train_loss": -5.878122329711914, "global_step": 54669, "epoch": 1301} {"train_loss": -5.858913421630859, "global_step": 54670, "epoch": 1301} {"train_loss": -5.915765762329102, "global_step": 54671, "epoch": 1301} {"train_loss": -5.762332916259766, "global_step": 54672, "epoch": 1301} {"train_loss": -5.784616947174072, "global_step": 54673, "epoch": 1301} {"train_loss": -5.760791778564453, "global_step": 54674, "epoch": 1301} {"train_loss": -5.893404960632324, "global_step": 54675, "epoch": 1301} {"train_loss": -5.678022384643555, "global_step": 54676, "epoch": 1301} {"train_loss": -5.784839630126953, "global_step": 54677, "epoch": 1301} {"train_loss": -5.857851982116699, "global_step": 54678, "epoch": 1301} {"train_loss": -5.7773542404174805, "global_step": 54679, "epoch": 1301} {"train_loss": -5.776663780212402, "global_step": 54680, "epoch": 1301} {"train_loss": -5.887054443359375, "global_step": 54681, "epoch": 1301} {"train_loss": -5.752617835998535, "global_step": 54682, "epoch": 1301} {"train_loss": -5.795348757789249, "global_step": 54683, "epoch": 1301, "val_loss": 74370.21875} {"train_loss": -5.73571252822876, "global_step": 54684, "epoch": 1302} {"train_loss": -5.835906505584717, "global_step": 54685, "epoch": 1302} {"train_loss": -5.819366455078125, "global_step": 54686, "epoch": 1302} {"train_loss": -5.921940803527832, "global_step": 54687, "epoch": 1302} {"train_loss": -5.803203582763672, "global_step": 54688, "epoch": 1302} {"train_loss": -5.964797019958496, "global_step": 54689, "epoch": 1302} {"train_loss": -5.7758917808532715, "global_step": 54690, "epoch": 1302} {"train_loss": -5.831124305725098, "global_step": 54691, "epoch": 1302} {"train_loss": -5.869707107543945, "global_step": 54692, "epoch": 1302} {"train_loss": -5.77518367767334, "global_step": 54693, "epoch": 1302} {"train_loss": -5.803977966308594, "global_step": 54694, "epoch": 1302} {"train_loss": -5.710244178771973, "global_step": 54695, "epoch": 1302} {"train_loss": -5.814488410949707, "global_step": 54696, "epoch": 1302} {"train_loss": -5.834621429443359, "global_step": 54697, "epoch": 1302} {"train_loss": -5.8145294189453125, "global_step": 54698, "epoch": 1302} {"train_loss": -5.8069963455200195, "global_step": 54699, "epoch": 1302} {"train_loss": -5.74737548828125, "global_step": 54700, "epoch": 1302} {"train_loss": -5.857326507568359, "global_step": 54701, "epoch": 1302} {"train_loss": -5.833000183105469, "global_step": 54702, "epoch": 1302} {"train_loss": -5.731927871704102, "global_step": 54703, "epoch": 1302} {"train_loss": -5.871908187866211, "global_step": 54704, "epoch": 1302} {"train_loss": -5.834084510803223, "global_step": 54705, "epoch": 1302} {"train_loss": -5.843701362609863, "global_step": 54706, "epoch": 1302} {"train_loss": -5.820411682128906, "global_step": 54707, "epoch": 1302} {"train_loss": -5.98361873626709, "global_step": 54708, "epoch": 1302} {"train_loss": -5.853279113769531, "global_step": 54709, "epoch": 1302} {"train_loss": -5.7518792152404785, "global_step": 54710, "epoch": 1302} {"train_loss": -5.954217433929443, "global_step": 54711, "epoch": 1302} {"train_loss": -5.804719924926758, "global_step": 54712, "epoch": 1302} {"train_loss": -5.9513750076293945, "global_step": 54713, "epoch": 1302} {"train_loss": -5.823932647705078, "global_step": 54714, "epoch": 1302} {"train_loss": -5.711319446563721, "global_step": 54715, "epoch": 1302} {"train_loss": -5.800112724304199, "global_step": 54716, "epoch": 1302} {"train_loss": -5.823969841003418, "global_step": 54717, "epoch": 1302} {"train_loss": -5.835396766662598, "global_step": 54718, "epoch": 1302} {"train_loss": -5.790142059326172, "global_step": 54719, "epoch": 1302} {"train_loss": -5.829542636871338, "global_step": 54720, "epoch": 1302} {"train_loss": -5.825601100921631, "global_step": 54721, "epoch": 1302} {"train_loss": -5.871242523193359, "global_step": 54722, "epoch": 1302} {"train_loss": -5.709712028503418, "global_step": 54723, "epoch": 1302} {"train_loss": -5.8675737380981445, "global_step": 54724, "epoch": 1302} {"train_loss": -5.822665997913906, "global_step": 54725, "epoch": 1302, "val_loss": 74237.28125} {"train_loss": -5.730710029602051, "global_step": 54726, "epoch": 1303} {"train_loss": -5.873689651489258, "global_step": 54727, "epoch": 1303} {"train_loss": -5.745964050292969, "global_step": 54728, "epoch": 1303} {"train_loss": -5.8740553855896, "global_step": 54729, "epoch": 1303} {"train_loss": -5.80448055267334, "global_step": 54730, "epoch": 1303} {"train_loss": -5.817866802215576, "global_step": 54731, "epoch": 1303} {"train_loss": -5.719786167144775, "global_step": 54732, "epoch": 1303} {"train_loss": -5.849575996398926, "global_step": 54733, "epoch": 1303} {"train_loss": -5.655561923980713, "global_step": 54734, "epoch": 1303} {"train_loss": -5.706457614898682, "global_step": 54735, "epoch": 1303} {"train_loss": -5.716080665588379, "global_step": 54736, "epoch": 1303} {"train_loss": -5.815332412719727, "global_step": 54737, "epoch": 1303} {"train_loss": -5.8157525062561035, "global_step": 54738, "epoch": 1303} {"train_loss": -5.763309478759766, "global_step": 54739, "epoch": 1303} {"train_loss": -5.859836578369141, "global_step": 54740, "epoch": 1303} {"train_loss": -5.84403657913208, "global_step": 54741, "epoch": 1303} {"train_loss": -5.71162223815918, "global_step": 54742, "epoch": 1303} {"train_loss": -5.818499565124512, "global_step": 54743, "epoch": 1303} {"train_loss": -5.793972969055176, "global_step": 54744, "epoch": 1303} {"train_loss": -5.9449663162231445, "global_step": 54745, "epoch": 1303} {"train_loss": -5.768632888793945, "global_step": 54746, "epoch": 1303} {"train_loss": -5.849052429199219, "global_step": 54747, "epoch": 1303} {"train_loss": -5.778825759887695, "global_step": 54748, "epoch": 1303} {"train_loss": -5.733542442321777, "global_step": 54749, "epoch": 1303} {"train_loss": -5.776281356811523, "global_step": 54750, "epoch": 1303} {"train_loss": -5.676745891571045, "global_step": 54751, "epoch": 1303} {"train_loss": -5.706510543823242, "global_step": 54752, "epoch": 1303} {"train_loss": -5.797119617462158, "global_step": 54753, "epoch": 1303} {"train_loss": -5.847590446472168, "global_step": 54754, "epoch": 1303} {"train_loss": -5.828532695770264, "global_step": 54755, "epoch": 1303} {"train_loss": -5.878902912139893, "global_step": 54756, "epoch": 1303} {"train_loss": -5.874208450317383, "global_step": 54757, "epoch": 1303} {"train_loss": -5.864903450012207, "global_step": 54758, "epoch": 1303} {"train_loss": -5.705377101898193, "global_step": 54759, "epoch": 1303} {"train_loss": -5.776076316833496, "global_step": 54760, "epoch": 1303} {"train_loss": -5.744898796081543, "global_step": 54761, "epoch": 1303} {"train_loss": -5.695529937744141, "global_step": 54762, "epoch": 1303} {"train_loss": -5.753479957580566, "global_step": 54763, "epoch": 1303} {"train_loss": -5.914009094238281, "global_step": 54764, "epoch": 1303} {"train_loss": -5.794493675231934, "global_step": 54765, "epoch": 1303} {"train_loss": -5.778303623199463, "global_step": 54766, "epoch": 1303} {"train_loss": -5.791695912679036, "global_step": 54767, "epoch": 1303, "val_loss": 74460.0625} {"train_loss": -5.751748085021973, "global_step": 54768, "epoch": 1304} {"train_loss": -5.9149169921875, "global_step": 54769, "epoch": 1304} {"train_loss": -5.782611846923828, "global_step": 54770, "epoch": 1304} {"train_loss": -5.895840167999268, "global_step": 54771, "epoch": 1304} {"train_loss": -5.886358261108398, "global_step": 54772, "epoch": 1304} {"train_loss": -5.746579170227051, "global_step": 54773, "epoch": 1304} {"train_loss": -5.805116653442383, "global_step": 54774, "epoch": 1304} {"train_loss": -5.808210849761963, "global_step": 54775, "epoch": 1304} {"train_loss": -5.918941497802734, "global_step": 54776, "epoch": 1304} {"train_loss": -5.775528907775879, "global_step": 54777, "epoch": 1304} {"train_loss": -5.8030853271484375, "global_step": 54778, "epoch": 1304} {"train_loss": -5.817501068115234, "global_step": 54779, "epoch": 1304} {"train_loss": -5.870719909667969, "global_step": 54780, "epoch": 1304} {"train_loss": -5.955409049987793, "global_step": 54781, "epoch": 1304} {"train_loss": -5.90424919128418, "global_step": 54782, "epoch": 1304} {"train_loss": -5.79874324798584, "global_step": 54783, "epoch": 1304} {"train_loss": -5.916727542877197, "global_step": 54784, "epoch": 1304} {"train_loss": -5.838570594787598, "global_step": 54785, "epoch": 1304} {"train_loss": -5.8130693435668945, "global_step": 54786, "epoch": 1304} {"train_loss": -5.8329925537109375, "global_step": 54787, "epoch": 1304} {"train_loss": -5.8828558921813965, "global_step": 54788, "epoch": 1304} {"train_loss": -5.826383590698242, "global_step": 54789, "epoch": 1304} {"train_loss": -5.816474914550781, "global_step": 54790, "epoch": 1304} {"train_loss": -5.914670467376709, "global_step": 54791, "epoch": 1304} {"train_loss": -5.859192848205566, "global_step": 54792, "epoch": 1304} {"train_loss": -5.94642448425293, "global_step": 54793, "epoch": 1304} {"train_loss": -5.867440223693848, "global_step": 54794, "epoch": 1304} {"train_loss": -5.8876752853393555, "global_step": 54795, "epoch": 1304} {"train_loss": -5.933884143829346, "global_step": 54796, "epoch": 1304} {"train_loss": -5.895094871520996, "global_step": 54797, "epoch": 1304} {"train_loss": -5.82163143157959, "global_step": 54798, "epoch": 1304} {"train_loss": -5.83370304107666, "global_step": 54799, "epoch": 1304} {"train_loss": -5.870312690734863, "global_step": 54800, "epoch": 1304} {"train_loss": -5.761316299438477, "global_step": 54801, "epoch": 1304} {"train_loss": -5.956889629364014, "global_step": 54802, "epoch": 1304} {"train_loss": -5.812169075012207, "global_step": 54803, "epoch": 1304} {"train_loss": -5.801935195922852, "global_step": 54804, "epoch": 1304} {"train_loss": -5.715568542480469, "global_step": 54805, "epoch": 1304} {"train_loss": -5.768840789794922, "global_step": 54806, "epoch": 1304} {"train_loss": -5.792508125305176, "global_step": 54807, "epoch": 1304} {"train_loss": -5.860250473022461, "global_step": 54808, "epoch": 1304} {"train_loss": -5.844174385070801, "global_step": 54809, "epoch": 1304, "val_loss": 74643.8046875} {"train_loss": -5.833085060119629, "global_step": 54810, "epoch": 1305} {"train_loss": -5.690521717071533, "global_step": 54811, "epoch": 1305} {"train_loss": -5.750600814819336, "global_step": 54812, "epoch": 1305} {"train_loss": -5.893052101135254, "global_step": 54813, "epoch": 1305} {"train_loss": -5.900636196136475, "global_step": 54814, "epoch": 1305} {"train_loss": -5.789246559143066, "global_step": 54815, "epoch": 1305} {"train_loss": -5.805603981018066, "global_step": 54816, "epoch": 1305} {"train_loss": -5.78809118270874, "global_step": 54817, "epoch": 1305} {"train_loss": -5.861217021942139, "global_step": 54818, "epoch": 1305} {"train_loss": -5.784175872802734, "global_step": 54819, "epoch": 1305} {"train_loss": -5.878686904907227, "global_step": 54820, "epoch": 1305} {"train_loss": -5.887687683105469, "global_step": 54821, "epoch": 1305} {"train_loss": -5.882582664489746, "global_step": 54822, "epoch": 1305} {"train_loss": -5.843771457672119, "global_step": 54823, "epoch": 1305} {"train_loss": -5.787405967712402, "global_step": 54824, "epoch": 1305} {"train_loss": -5.821806907653809, "global_step": 54825, "epoch": 1305} {"train_loss": -5.886570930480957, "global_step": 54826, "epoch": 1305} {"train_loss": -5.767792224884033, "global_step": 54827, "epoch": 1305} {"train_loss": -5.868956565856934, "global_step": 54828, "epoch": 1305} {"train_loss": -5.742151260375977, "global_step": 54829, "epoch": 1305} {"train_loss": -5.817882537841797, "global_step": 54830, "epoch": 1305} {"train_loss": -5.906353950500488, "global_step": 54831, "epoch": 1305} {"train_loss": -5.883828163146973, "global_step": 54832, "epoch": 1305} {"train_loss": -5.734196662902832, "global_step": 54833, "epoch": 1305} {"train_loss": -5.869141578674316, "global_step": 54834, "epoch": 1305} {"train_loss": -5.925694465637207, "global_step": 54835, "epoch": 1305} {"train_loss": -5.8073272705078125, "global_step": 54836, "epoch": 1305} {"train_loss": -5.892396450042725, "global_step": 54837, "epoch": 1305} {"train_loss": -5.848748207092285, "global_step": 54838, "epoch": 1305} {"train_loss": -5.696961402893066, "global_step": 54839, "epoch": 1305} {"train_loss": -5.743191719055176, "global_step": 54840, "epoch": 1305} {"train_loss": -5.672248840332031, "global_step": 54841, "epoch": 1305} {"train_loss": -5.861815452575684, "global_step": 54842, "epoch": 1305} {"train_loss": -5.837828636169434, "global_step": 54843, "epoch": 1305} {"train_loss": -5.833272457122803, "global_step": 54844, "epoch": 1305} {"train_loss": -5.870512962341309, "global_step": 54845, "epoch": 1305} {"train_loss": -5.945855140686035, "global_step": 54846, "epoch": 1305} {"train_loss": -5.796648979187012, "global_step": 54847, "epoch": 1305} {"train_loss": -5.88261079788208, "global_step": 54848, "epoch": 1305} {"train_loss": -5.8392415046691895, "global_step": 54849, "epoch": 1305} {"train_loss": -5.849310398101807, "global_step": 54850, "epoch": 1305} {"train_loss": -5.828027940931774, "global_step": 54851, "epoch": 1305, "val_loss": 74184.109375} {"train_loss": -5.852308750152588, "global_step": 54852, "epoch": 1306} {"train_loss": -5.846085548400879, "global_step": 54853, "epoch": 1306} {"train_loss": -5.907999038696289, "global_step": 54854, "epoch": 1306} {"train_loss": -5.789386749267578, "global_step": 54855, "epoch": 1306} {"train_loss": -5.760113716125488, "global_step": 54856, "epoch": 1306} {"train_loss": -5.897479057312012, "global_step": 54857, "epoch": 1306} {"train_loss": -5.867615699768066, "global_step": 54858, "epoch": 1306} {"train_loss": -5.900285720825195, "global_step": 54859, "epoch": 1306} {"train_loss": -5.9358320236206055, "global_step": 54860, "epoch": 1306} {"train_loss": -5.808913230895996, "global_step": 54861, "epoch": 1306} {"train_loss": -5.871126174926758, "global_step": 54862, "epoch": 1306} {"train_loss": -5.862815856933594, "global_step": 54863, "epoch": 1306} {"train_loss": -5.736082077026367, "global_step": 54864, "epoch": 1306} {"train_loss": -5.797680854797363, "global_step": 54865, "epoch": 1306} {"train_loss": -5.809927940368652, "global_step": 54866, "epoch": 1306} {"train_loss": -5.811454772949219, "global_step": 54867, "epoch": 1306} {"train_loss": -5.833337783813477, "global_step": 54868, "epoch": 1306} {"train_loss": -5.839230060577393, "global_step": 54869, "epoch": 1306} {"train_loss": -5.842732906341553, "global_step": 54870, "epoch": 1306} {"train_loss": -5.839077472686768, "global_step": 54871, "epoch": 1306} {"train_loss": -5.872729778289795, "global_step": 54872, "epoch": 1306} {"train_loss": -5.790390968322754, "global_step": 54873, "epoch": 1306} {"train_loss": -5.925742149353027, "global_step": 54874, "epoch": 1306} {"train_loss": -5.787266731262207, "global_step": 54875, "epoch": 1306} {"train_loss": -5.890531539916992, "global_step": 54876, "epoch": 1306} {"train_loss": -5.852376937866211, "global_step": 54877, "epoch": 1306} {"train_loss": -5.899811744689941, "global_step": 54878, "epoch": 1306} {"train_loss": -5.901223182678223, "global_step": 54879, "epoch": 1306} {"train_loss": -5.803937911987305, "global_step": 54880, "epoch": 1306} {"train_loss": -5.811824321746826, "global_step": 54881, "epoch": 1306} {"train_loss": -5.838591575622559, "global_step": 54882, "epoch": 1306} {"train_loss": -5.823000907897949, "global_step": 54883, "epoch": 1306} {"train_loss": -5.87380313873291, "global_step": 54884, "epoch": 1306} {"train_loss": -5.851688385009766, "global_step": 54885, "epoch": 1306} {"train_loss": -5.793779373168945, "global_step": 54886, "epoch": 1306} {"train_loss": -5.790775299072266, "global_step": 54887, "epoch": 1306} {"train_loss": -5.806848526000977, "global_step": 54888, "epoch": 1306} {"train_loss": -5.8478593826293945, "global_step": 54889, "epoch": 1306} {"train_loss": -5.919065952301025, "global_step": 54890, "epoch": 1306} {"train_loss": -5.772678375244141, "global_step": 54891, "epoch": 1306} {"train_loss": -5.840945243835449, "global_step": 54892, "epoch": 1306} {"train_loss": -5.841229086830502, "global_step": 54893, "epoch": 1306, "val_loss": 74462.8515625} {"train_loss": -5.8896942138671875, "global_step": 54894, "epoch": 1307} {"train_loss": -5.805919647216797, "global_step": 54895, "epoch": 1307} {"train_loss": -5.774008750915527, "global_step": 54896, "epoch": 1307} {"train_loss": -5.851413249969482, "global_step": 54897, "epoch": 1307} {"train_loss": -5.865805625915527, "global_step": 54898, "epoch": 1307} {"train_loss": -5.950697898864746, "global_step": 54899, "epoch": 1307} {"train_loss": -5.754994869232178, "global_step": 54900, "epoch": 1307} {"train_loss": -6.010839462280273, "global_step": 54901, "epoch": 1307} {"train_loss": -5.892230033874512, "global_step": 54902, "epoch": 1307} {"train_loss": -5.761508464813232, "global_step": 54903, "epoch": 1307} {"train_loss": -5.786187171936035, "global_step": 54904, "epoch": 1307} {"train_loss": -5.817370414733887, "global_step": 54905, "epoch": 1307} {"train_loss": -5.856449604034424, "global_step": 54906, "epoch": 1307} {"train_loss": -5.814174652099609, "global_step": 54907, "epoch": 1307} {"train_loss": -5.796792030334473, "global_step": 54908, "epoch": 1307} {"train_loss": -5.983465194702148, "global_step": 54909, "epoch": 1307} {"train_loss": -5.825934886932373, "global_step": 54910, "epoch": 1307} {"train_loss": -5.827873706817627, "global_step": 54911, "epoch": 1307} {"train_loss": -5.784791469573975, "global_step": 54912, "epoch": 1307} {"train_loss": -5.9054856300354, "global_step": 54913, "epoch": 1307} {"train_loss": -5.9209699630737305, "global_step": 54914, "epoch": 1307} {"train_loss": -5.817546844482422, "global_step": 54915, "epoch": 1307} {"train_loss": -5.831929683685303, "global_step": 54916, "epoch": 1307} {"train_loss": -5.925339698791504, "global_step": 54917, "epoch": 1307} {"train_loss": -5.791632652282715, "global_step": 54918, "epoch": 1307} {"train_loss": -5.88472843170166, "global_step": 54919, "epoch": 1307} {"train_loss": -5.784751892089844, "global_step": 54920, "epoch": 1307} {"train_loss": -5.757706642150879, "global_step": 54921, "epoch": 1307} {"train_loss": -5.779230117797852, "global_step": 54922, "epoch": 1307} {"train_loss": -5.893118858337402, "global_step": 54923, "epoch": 1307} {"train_loss": -5.838620185852051, "global_step": 54924, "epoch": 1307} {"train_loss": -5.884193420410156, "global_step": 54925, "epoch": 1307} {"train_loss": -5.8745036125183105, "global_step": 54926, "epoch": 1307} {"train_loss": -5.752466201782227, "global_step": 54927, "epoch": 1307} {"train_loss": -5.846020698547363, "global_step": 54928, "epoch": 1307} {"train_loss": -5.8947296142578125, "global_step": 54929, "epoch": 1307} {"train_loss": -5.724211692810059, "global_step": 54930, "epoch": 1307} {"train_loss": -5.791342735290527, "global_step": 54931, "epoch": 1307} {"train_loss": -5.797456741333008, "global_step": 54932, "epoch": 1307} {"train_loss": -5.795590400695801, "global_step": 54933, "epoch": 1307} {"train_loss": -5.7259063720703125, "global_step": 54934, "epoch": 1307} {"train_loss": -5.833504551932926, "global_step": 54935, "epoch": 1307, "val_loss": 74050.140625} {"train_loss": -5.902223587036133, "global_step": 54936, "epoch": 1308} {"train_loss": -5.993224143981934, "global_step": 54937, "epoch": 1308} {"train_loss": -5.831542491912842, "global_step": 54938, "epoch": 1308} {"train_loss": -5.943330764770508, "global_step": 54939, "epoch": 1308} {"train_loss": -5.887204170227051, "global_step": 54940, "epoch": 1308} {"train_loss": -5.956892490386963, "global_step": 54941, "epoch": 1308} {"train_loss": -6.015820026397705, "global_step": 54942, "epoch": 1308} {"train_loss": -5.786172866821289, "global_step": 54943, "epoch": 1308} {"train_loss": -5.850404262542725, "global_step": 54944, "epoch": 1308} {"train_loss": -5.952320098876953, "global_step": 54945, "epoch": 1308} {"train_loss": -5.813881874084473, "global_step": 54946, "epoch": 1308} {"train_loss": -5.926872730255127, "global_step": 54947, "epoch": 1308} {"train_loss": -5.741845607757568, "global_step": 54948, "epoch": 1308} {"train_loss": -5.865936279296875, "global_step": 54949, "epoch": 1308} {"train_loss": -5.800124645233154, "global_step": 54950, "epoch": 1308} {"train_loss": -5.9809370040893555, "global_step": 54951, "epoch": 1308} {"train_loss": -5.599595069885254, "global_step": 54952, "epoch": 1308} {"train_loss": -5.934902191162109, "global_step": 54953, "epoch": 1308} {"train_loss": -5.932948112487793, "global_step": 54954, "epoch": 1308} {"train_loss": -5.745058059692383, "global_step": 54955, "epoch": 1308} {"train_loss": -5.795888423919678, "global_step": 54956, "epoch": 1308} {"train_loss": -5.820046901702881, "global_step": 54957, "epoch": 1308} {"train_loss": -5.805051803588867, "global_step": 54958, "epoch": 1308} {"train_loss": -5.753227233886719, "global_step": 54959, "epoch": 1308} {"train_loss": -5.7861480712890625, "global_step": 54960, "epoch": 1308} {"train_loss": -5.746111869812012, "global_step": 54961, "epoch": 1308} {"train_loss": -5.781929016113281, "global_step": 54962, "epoch": 1308} {"train_loss": -5.877291679382324, "global_step": 54963, "epoch": 1308} {"train_loss": -5.805381774902344, "global_step": 54964, "epoch": 1308} {"train_loss": -5.695940971374512, "global_step": 54965, "epoch": 1308} {"train_loss": -5.9368391036987305, "global_step": 54966, "epoch": 1308} {"train_loss": -5.753504276275635, "global_step": 54967, "epoch": 1308} {"train_loss": -5.8188090324401855, "global_step": 54968, "epoch": 1308} {"train_loss": -5.816914081573486, "global_step": 54969, "epoch": 1308} {"train_loss": -5.791584014892578, "global_step": 54970, "epoch": 1308} {"train_loss": -5.729581356048584, "global_step": 54971, "epoch": 1308} {"train_loss": -5.843454360961914, "global_step": 54972, "epoch": 1308} {"train_loss": -5.710331439971924, "global_step": 54973, "epoch": 1308} {"train_loss": -5.840131759643555, "global_step": 54974, "epoch": 1308} {"train_loss": -5.778865814208984, "global_step": 54975, "epoch": 1308} {"train_loss": -5.815184116363525, "global_step": 54976, "epoch": 1308} {"train_loss": -5.833109503700619, "global_step": 54977, "epoch": 1308, "val_loss": 74268.359375} {"train_loss": -5.75224494934082, "global_step": 54978, "epoch": 1309} {"train_loss": -5.792271614074707, "global_step": 54979, "epoch": 1309} {"train_loss": -5.774394512176514, "global_step": 54980, "epoch": 1309} {"train_loss": -5.909613132476807, "global_step": 54981, "epoch": 1309} {"train_loss": -5.867615699768066, "global_step": 54982, "epoch": 1309} {"train_loss": -5.7554931640625, "global_step": 54983, "epoch": 1309} {"train_loss": -5.826169967651367, "global_step": 54984, "epoch": 1309} {"train_loss": -5.8972625732421875, "global_step": 54985, "epoch": 1309} {"train_loss": -5.743444442749023, "global_step": 54986, "epoch": 1309} {"train_loss": -5.842012882232666, "global_step": 54987, "epoch": 1309} {"train_loss": -5.712488174438477, "global_step": 54988, "epoch": 1309} {"train_loss": -5.783384799957275, "global_step": 54989, "epoch": 1309} {"train_loss": -5.816206932067871, "global_step": 54990, "epoch": 1309} {"train_loss": -5.800429344177246, "global_step": 54991, "epoch": 1309} {"train_loss": -5.890089511871338, "global_step": 54992, "epoch": 1309} {"train_loss": -5.8900146484375, "global_step": 54993, "epoch": 1309} {"train_loss": -5.856036186218262, "global_step": 54994, "epoch": 1309} {"train_loss": -5.791631698608398, "global_step": 54995, "epoch": 1309} {"train_loss": -5.836061477661133, "global_step": 54996, "epoch": 1309} {"train_loss": -5.838954925537109, "global_step": 54997, "epoch": 1309} {"train_loss": -5.820965766906738, "global_step": 54998, "epoch": 1309} {"train_loss": -5.836617469787598, "global_step": 54999, "epoch": 1309} {"train_loss": -5.909333229064941, "global_step": 55000, "epoch": 1309} {"train_loss": -5.842527866363525, "global_step": 55001, "epoch": 1309} {"train_loss": -5.745410442352295, "global_step": 55002, "epoch": 1309} {"train_loss": -5.876918792724609, "global_step": 55003, "epoch": 1309} {"train_loss": -5.741506576538086, "global_step": 55004, "epoch": 1309} {"train_loss": -5.76629638671875, "global_step": 55005, "epoch": 1309} {"train_loss": -5.8015875816345215, "global_step": 55006, "epoch": 1309} {"train_loss": -5.810494422912598, "global_step": 55007, "epoch": 1309} {"train_loss": -5.696258068084717, "global_step": 55008, "epoch": 1309} {"train_loss": -5.6755475997924805, "global_step": 55009, "epoch": 1309} {"train_loss": -5.738447189331055, "global_step": 55010, "epoch": 1309} {"train_loss": -5.888600826263428, "global_step": 55011, "epoch": 1309} {"train_loss": -5.835783958435059, "global_step": 55012, "epoch": 1309} {"train_loss": -5.819197177886963, "global_step": 55013, "epoch": 1309} {"train_loss": -5.849350929260254, "global_step": 55014, "epoch": 1309} {"train_loss": -5.7186126708984375, "global_step": 55015, "epoch": 1309} {"train_loss": -5.815192222595215, "global_step": 55016, "epoch": 1309} {"train_loss": -5.7464141845703125, "global_step": 55017, "epoch": 1309} {"train_loss": -5.837003707885742, "global_step": 55018, "epoch": 1309} {"train_loss": -5.807976824896676, "global_step": 55019, "epoch": 1309, "val_loss": 74377.8046875} {"train_loss": -5.721068859100342, "global_step": 55020, "epoch": 1310} {"train_loss": -5.755989074707031, "global_step": 55021, "epoch": 1310} {"train_loss": -5.847167491912842, "global_step": 55022, "epoch": 1310} {"train_loss": -5.710536956787109, "global_step": 55023, "epoch": 1310} {"train_loss": -5.828756332397461, "global_step": 55024, "epoch": 1310} {"train_loss": -5.769018173217773, "global_step": 55025, "epoch": 1310} {"train_loss": -5.697558403015137, "global_step": 55026, "epoch": 1310} {"train_loss": -5.7660722732543945, "global_step": 55027, "epoch": 1310} {"train_loss": -5.6146721839904785, "global_step": 55028, "epoch": 1310} {"train_loss": -5.687099456787109, "global_step": 55029, "epoch": 1310} {"train_loss": -5.895564079284668, "global_step": 55030, "epoch": 1310} {"train_loss": -5.888640403747559, "global_step": 55031, "epoch": 1310} {"train_loss": -5.844174385070801, "global_step": 55032, "epoch": 1310} {"train_loss": -5.920470237731934, "global_step": 55033, "epoch": 1310} {"train_loss": -5.835195541381836, "global_step": 55034, "epoch": 1310} {"train_loss": -5.769873142242432, "global_step": 55035, "epoch": 1310} {"train_loss": -5.792726993560791, "global_step": 55036, "epoch": 1310} {"train_loss": -5.833402633666992, "global_step": 55037, "epoch": 1310} {"train_loss": -5.743213653564453, "global_step": 55038, "epoch": 1310} {"train_loss": -5.831215858459473, "global_step": 55039, "epoch": 1310} {"train_loss": -5.726757526397705, "global_step": 55040, "epoch": 1310} {"train_loss": -5.739401817321777, "global_step": 55041, "epoch": 1310} {"train_loss": -5.9299540519714355, "global_step": 55042, "epoch": 1310} {"train_loss": -5.818547248840332, "global_step": 55043, "epoch": 1310} {"train_loss": -5.9264326095581055, "global_step": 55044, "epoch": 1310} {"train_loss": -5.816589832305908, "global_step": 55045, "epoch": 1310} {"train_loss": -5.804471969604492, "global_step": 55046, "epoch": 1310} {"train_loss": -5.83640718460083, "global_step": 55047, "epoch": 1310} {"train_loss": -5.749670028686523, "global_step": 55048, "epoch": 1310} {"train_loss": -5.865721225738525, "global_step": 55049, "epoch": 1310} {"train_loss": -5.765604496002197, "global_step": 55050, "epoch": 1310} {"train_loss": -5.79707670211792, "global_step": 55051, "epoch": 1310} {"train_loss": -5.656822681427002, "global_step": 55052, "epoch": 1310} {"train_loss": -5.784488677978516, "global_step": 55053, "epoch": 1310} {"train_loss": -5.856599807739258, "global_step": 55054, "epoch": 1310} {"train_loss": -5.829849720001221, "global_step": 55055, "epoch": 1310} {"train_loss": -5.9165239334106445, "global_step": 55056, "epoch": 1310} {"train_loss": -5.7264556884765625, "global_step": 55057, "epoch": 1310} {"train_loss": -5.803476333618164, "global_step": 55058, "epoch": 1310} {"train_loss": -5.895024299621582, "global_step": 55059, "epoch": 1310} {"train_loss": -5.912221908569336, "global_step": 55060, "epoch": 1310} {"train_loss": -5.80374398685637, "global_step": 55061, "epoch": 1310, "val_loss": 74373.4453125} {"train_loss": -5.908814430236816, "global_step": 55062, "epoch": 1311} {"train_loss": -5.900976657867432, "global_step": 55063, "epoch": 1311} {"train_loss": -5.908359527587891, "global_step": 55064, "epoch": 1311} {"train_loss": -5.876314163208008, "global_step": 55065, "epoch": 1311} {"train_loss": -5.754954814910889, "global_step": 55066, "epoch": 1311} {"train_loss": -5.867608070373535, "global_step": 55067, "epoch": 1311} {"train_loss": -5.906633377075195, "global_step": 55068, "epoch": 1311} {"train_loss": -5.896036148071289, "global_step": 55069, "epoch": 1311} {"train_loss": -5.856450080871582, "global_step": 55070, "epoch": 1311} {"train_loss": -5.846156120300293, "global_step": 55071, "epoch": 1311} {"train_loss": -5.838055610656738, "global_step": 55072, "epoch": 1311} {"train_loss": -5.868257522583008, "global_step": 55073, "epoch": 1311} {"train_loss": -5.876553058624268, "global_step": 55074, "epoch": 1311} {"train_loss": -5.686509132385254, "global_step": 55075, "epoch": 1311} {"train_loss": -5.784070014953613, "global_step": 55076, "epoch": 1311} {"train_loss": -5.791087627410889, "global_step": 55077, "epoch": 1311} {"train_loss": -5.79705810546875, "global_step": 55078, "epoch": 1311} {"train_loss": -5.895977020263672, "global_step": 55079, "epoch": 1311} {"train_loss": -5.916870594024658, "global_step": 55080, "epoch": 1311} {"train_loss": -5.846054553985596, "global_step": 55081, "epoch": 1311} {"train_loss": -5.8347015380859375, "global_step": 55082, "epoch": 1311} {"train_loss": -5.89260721206665, "global_step": 55083, "epoch": 1311} {"train_loss": -5.745737075805664, "global_step": 55084, "epoch": 1311} {"train_loss": -5.794511795043945, "global_step": 55085, "epoch": 1311} {"train_loss": -5.747934341430664, "global_step": 55086, "epoch": 1311} {"train_loss": -5.886249542236328, "global_step": 55087, "epoch": 1311} {"train_loss": -5.894306182861328, "global_step": 55088, "epoch": 1311} {"train_loss": -5.887746810913086, "global_step": 55089, "epoch": 1311} {"train_loss": -5.8756561279296875, "global_step": 55090, "epoch": 1311} {"train_loss": -5.8001227378845215, "global_step": 55091, "epoch": 1311} {"train_loss": -5.770572662353516, "global_step": 55092, "epoch": 1311} {"train_loss": -5.809120178222656, "global_step": 55093, "epoch": 1311} {"train_loss": -5.936498641967773, "global_step": 55094, "epoch": 1311} {"train_loss": -5.83978271484375, "global_step": 55095, "epoch": 1311} {"train_loss": -5.82666015625, "global_step": 55096, "epoch": 1311} {"train_loss": -5.878976821899414, "global_step": 55097, "epoch": 1311} {"train_loss": -5.848539352416992, "global_step": 55098, "epoch": 1311} {"train_loss": -5.781979560852051, "global_step": 55099, "epoch": 1311} {"train_loss": -5.927883625030518, "global_step": 55100, "epoch": 1311} {"train_loss": -5.889222145080566, "global_step": 55101, "epoch": 1311} {"train_loss": -5.794054985046387, "global_step": 55102, "epoch": 1311} {"train_loss": -5.84625194186256, "global_step": 55103, "epoch": 1311, "val_loss": 74461.0859375} {"train_loss": -5.926743507385254, "global_step": 55104, "epoch": 1312} {"train_loss": -5.9168853759765625, "global_step": 55105, "epoch": 1312} {"train_loss": -5.83394718170166, "global_step": 55106, "epoch": 1312} {"train_loss": -5.852219104766846, "global_step": 55107, "epoch": 1312} {"train_loss": -5.852076530456543, "global_step": 55108, "epoch": 1312} {"train_loss": -5.758360385894775, "global_step": 55109, "epoch": 1312} {"train_loss": -5.791142463684082, "global_step": 55110, "epoch": 1312} {"train_loss": -5.847323894500732, "global_step": 55111, "epoch": 1312} {"train_loss": -5.676242351531982, "global_step": 55112, "epoch": 1312} {"train_loss": -5.92977237701416, "global_step": 55113, "epoch": 1312} {"train_loss": -5.847757339477539, "global_step": 55114, "epoch": 1312} {"train_loss": -5.92325496673584, "global_step": 55115, "epoch": 1312} {"train_loss": -5.793553352355957, "global_step": 55116, "epoch": 1312} {"train_loss": -5.6965179443359375, "global_step": 55117, "epoch": 1312} {"train_loss": -5.687290668487549, "global_step": 55118, "epoch": 1312} {"train_loss": -5.92034912109375, "global_step": 55119, "epoch": 1312} {"train_loss": -5.830557823181152, "global_step": 55120, "epoch": 1312} {"train_loss": -5.898216247558594, "global_step": 55121, "epoch": 1312} {"train_loss": -5.804750919342041, "global_step": 55122, "epoch": 1312} {"train_loss": -5.868880271911621, "global_step": 55123, "epoch": 1312} {"train_loss": -5.927040100097656, "global_step": 55124, "epoch": 1312} {"train_loss": -5.813294410705566, "global_step": 55125, "epoch": 1312} {"train_loss": -5.811846733093262, "global_step": 55126, "epoch": 1312} {"train_loss": -5.799037933349609, "global_step": 55127, "epoch": 1312} {"train_loss": -5.925734043121338, "global_step": 55128, "epoch": 1312} {"train_loss": -5.7641801834106445, "global_step": 55129, "epoch": 1312} {"train_loss": -5.855207443237305, "global_step": 55130, "epoch": 1312} {"train_loss": -5.6790852546691895, "global_step": 55131, "epoch": 1312} {"train_loss": -5.7411956787109375, "global_step": 55132, "epoch": 1312} {"train_loss": -5.75510311126709, "global_step": 55133, "epoch": 1312} {"train_loss": -5.742241382598877, "global_step": 55134, "epoch": 1312} {"train_loss": -5.843782424926758, "global_step": 55135, "epoch": 1312} {"train_loss": -5.771045684814453, "global_step": 55136, "epoch": 1312} {"train_loss": -5.784012317657471, "global_step": 55137, "epoch": 1312} {"train_loss": -5.8353800773620605, "global_step": 55138, "epoch": 1312} {"train_loss": -5.696473121643066, "global_step": 55139, "epoch": 1312} {"train_loss": -5.720044136047363, "global_step": 55140, "epoch": 1312} {"train_loss": -5.745075225830078, "global_step": 55141, "epoch": 1312} {"train_loss": -5.8178205490112305, "global_step": 55142, "epoch": 1312} {"train_loss": -5.755108833312988, "global_step": 55143, "epoch": 1312} {"train_loss": -5.971139907836914, "global_step": 55144, "epoch": 1312} {"train_loss": -5.813431455975487, "global_step": 55145, "epoch": 1312, "val_loss": 74210.125} {"train_loss": -5.830657482147217, "global_step": 55146, "epoch": 1313} {"train_loss": -5.837026596069336, "global_step": 55147, "epoch": 1313} {"train_loss": -5.857875823974609, "global_step": 55148, "epoch": 1313} {"train_loss": -5.914316654205322, "global_step": 55149, "epoch": 1313} {"train_loss": -5.971164703369141, "global_step": 55150, "epoch": 1313} {"train_loss": -5.855860710144043, "global_step": 55151, "epoch": 1313} {"train_loss": -5.806039333343506, "global_step": 55152, "epoch": 1313} {"train_loss": -5.831604957580566, "global_step": 55153, "epoch": 1313} {"train_loss": -5.83579158782959, "global_step": 55154, "epoch": 1313} {"train_loss": -5.762709617614746, "global_step": 55155, "epoch": 1313} {"train_loss": -5.900298118591309, "global_step": 55156, "epoch": 1313} {"train_loss": -5.640437126159668, "global_step": 55157, "epoch": 1313} {"train_loss": -5.936365127563477, "global_step": 55158, "epoch": 1313} {"train_loss": -5.927266597747803, "global_step": 55159, "epoch": 1313} {"train_loss": -5.9372878074646, "global_step": 55160, "epoch": 1313} {"train_loss": -5.753694534301758, "global_step": 55161, "epoch": 1313} {"train_loss": -5.801469802856445, "global_step": 55162, "epoch": 1313} {"train_loss": -5.976945877075195, "global_step": 55163, "epoch": 1313} {"train_loss": -5.7649245262146, "global_step": 55164, "epoch": 1313} {"train_loss": -5.90335750579834, "global_step": 55165, "epoch": 1313} {"train_loss": -5.833233833312988, "global_step": 55166, "epoch": 1313} {"train_loss": -5.886519432067871, "global_step": 55167, "epoch": 1313} {"train_loss": -5.847372055053711, "global_step": 55168, "epoch": 1313} {"train_loss": -5.7508440017700195, "global_step": 55169, "epoch": 1313} {"train_loss": -5.8774027824401855, "global_step": 55170, "epoch": 1313} {"train_loss": -5.797334671020508, "global_step": 55171, "epoch": 1313} {"train_loss": -5.891538619995117, "global_step": 55172, "epoch": 1313} {"train_loss": -5.756938457489014, "global_step": 55173, "epoch": 1313} {"train_loss": -5.736629486083984, "global_step": 55174, "epoch": 1313} {"train_loss": -5.749770164489746, "global_step": 55175, "epoch": 1313} {"train_loss": -5.7372612953186035, "global_step": 55176, "epoch": 1313} {"train_loss": -5.790584564208984, "global_step": 55177, "epoch": 1313} {"train_loss": -5.918665885925293, "global_step": 55178, "epoch": 1313} {"train_loss": -5.815761566162109, "global_step": 55179, "epoch": 1313} {"train_loss": -5.904478073120117, "global_step": 55180, "epoch": 1313} {"train_loss": -5.782456398010254, "global_step": 55181, "epoch": 1313} {"train_loss": -6.01800012588501, "global_step": 55182, "epoch": 1313} {"train_loss": -5.871706485748291, "global_step": 55183, "epoch": 1313} {"train_loss": -5.773855209350586, "global_step": 55184, "epoch": 1313} {"train_loss": -5.810050964355469, "global_step": 55185, "epoch": 1313} {"train_loss": -5.774808406829834, "global_step": 55186, "epoch": 1313} {"train_loss": -5.834725629715693, "global_step": 55187, "epoch": 1313, "val_loss": 74439.53125} {"train_loss": -5.751619815826416, "global_step": 55188, "epoch": 1314} {"train_loss": -5.836432456970215, "global_step": 55189, "epoch": 1314} {"train_loss": -5.795190334320068, "global_step": 55190, "epoch": 1314} {"train_loss": -5.974092483520508, "global_step": 55191, "epoch": 1314} {"train_loss": -5.713901519775391, "global_step": 55192, "epoch": 1314} {"train_loss": -5.901529312133789, "global_step": 55193, "epoch": 1314} {"train_loss": -5.785764694213867, "global_step": 55194, "epoch": 1314} {"train_loss": -5.838505268096924, "global_step": 55195, "epoch": 1314} {"train_loss": -5.706625461578369, "global_step": 55196, "epoch": 1314} {"train_loss": -5.82345724105835, "global_step": 55197, "epoch": 1314} {"train_loss": -5.855288982391357, "global_step": 55198, "epoch": 1314} {"train_loss": -5.880740642547607, "global_step": 55199, "epoch": 1314} {"train_loss": -5.89411735534668, "global_step": 55200, "epoch": 1314} {"train_loss": -5.781685829162598, "global_step": 55201, "epoch": 1314} {"train_loss": -5.778767108917236, "global_step": 55202, "epoch": 1314} {"train_loss": -5.884208679199219, "global_step": 55203, "epoch": 1314} {"train_loss": -5.769957065582275, "global_step": 55204, "epoch": 1314} {"train_loss": -5.811500549316406, "global_step": 55205, "epoch": 1314} {"train_loss": -5.855747222900391, "global_step": 55206, "epoch": 1314} {"train_loss": -5.7929487228393555, "global_step": 55207, "epoch": 1314} {"train_loss": -5.9164347648620605, "global_step": 55208, "epoch": 1314} {"train_loss": -5.713127613067627, "global_step": 55209, "epoch": 1314} {"train_loss": -5.950233459472656, "global_step": 55210, "epoch": 1314} {"train_loss": -5.718646049499512, "global_step": 55211, "epoch": 1314} {"train_loss": -5.867087364196777, "global_step": 55212, "epoch": 1314} {"train_loss": -5.881209373474121, "global_step": 55213, "epoch": 1314} {"train_loss": -5.789138317108154, "global_step": 55214, "epoch": 1314} {"train_loss": -5.8077216148376465, "global_step": 55215, "epoch": 1314} {"train_loss": -5.823467254638672, "global_step": 55216, "epoch": 1314} {"train_loss": -5.886029243469238, "global_step": 55217, "epoch": 1314} {"train_loss": -5.86328125, "global_step": 55218, "epoch": 1314} {"train_loss": -5.781666278839111, "global_step": 55219, "epoch": 1314} {"train_loss": -5.790731430053711, "global_step": 55220, "epoch": 1314} {"train_loss": -5.883984565734863, "global_step": 55221, "epoch": 1314} {"train_loss": -5.8933563232421875, "global_step": 55222, "epoch": 1314} {"train_loss": -5.823361873626709, "global_step": 55223, "epoch": 1314} {"train_loss": -5.79965353012085, "global_step": 55224, "epoch": 1314} {"train_loss": -5.802580833435059, "global_step": 55225, "epoch": 1314} {"train_loss": -5.931208610534668, "global_step": 55226, "epoch": 1314} {"train_loss": -5.739151954650879, "global_step": 55227, "epoch": 1314} {"train_loss": -5.752857208251953, "global_step": 55228, "epoch": 1314} {"train_loss": -5.825077090944562, "global_step": 55229, "epoch": 1314, "val_loss": 74347.5859375} {"train_loss": -5.767146110534668, "global_step": 55230, "epoch": 1315} {"train_loss": -5.931149959564209, "global_step": 55231, "epoch": 1315} {"train_loss": -5.757718086242676, "global_step": 55232, "epoch": 1315} {"train_loss": -5.750335693359375, "global_step": 55233, "epoch": 1315} {"train_loss": -5.851168632507324, "global_step": 55234, "epoch": 1315} {"train_loss": -5.813844203948975, "global_step": 55235, "epoch": 1315} {"train_loss": -5.895855903625488, "global_step": 55236, "epoch": 1315} {"train_loss": -5.936907768249512, "global_step": 55237, "epoch": 1315} {"train_loss": -5.818307876586914, "global_step": 55238, "epoch": 1315} {"train_loss": -5.8595733642578125, "global_step": 55239, "epoch": 1315} {"train_loss": -5.753019332885742, "global_step": 55240, "epoch": 1315} {"train_loss": -5.838379383087158, "global_step": 55241, "epoch": 1315} {"train_loss": -5.735878944396973, "global_step": 55242, "epoch": 1315} {"train_loss": -5.814927101135254, "global_step": 55243, "epoch": 1315} {"train_loss": -5.878340721130371, "global_step": 55244, "epoch": 1315} {"train_loss": -5.73016357421875, "global_step": 55245, "epoch": 1315} {"train_loss": -5.772372245788574, "global_step": 55246, "epoch": 1315} {"train_loss": -5.928102493286133, "global_step": 55247, "epoch": 1315} {"train_loss": -5.927475929260254, "global_step": 55248, "epoch": 1315} {"train_loss": -5.867439270019531, "global_step": 55249, "epoch": 1315} {"train_loss": -5.836782932281494, "global_step": 55250, "epoch": 1315} {"train_loss": -5.807766914367676, "global_step": 55251, "epoch": 1315} {"train_loss": -5.904152870178223, "global_step": 55252, "epoch": 1315} {"train_loss": -5.817881107330322, "global_step": 55253, "epoch": 1315} {"train_loss": -5.787298202514648, "global_step": 55254, "epoch": 1315} {"train_loss": -5.797601699829102, "global_step": 55255, "epoch": 1315} {"train_loss": -5.927713871002197, "global_step": 55256, "epoch": 1315} {"train_loss": -5.775430679321289, "global_step": 55257, "epoch": 1315} {"train_loss": -5.860983848571777, "global_step": 55258, "epoch": 1315} {"train_loss": -5.871833801269531, "global_step": 55259, "epoch": 1315} {"train_loss": -5.782761573791504, "global_step": 55260, "epoch": 1315} {"train_loss": -5.74334192276001, "global_step": 55261, "epoch": 1315} {"train_loss": -5.946490287780762, "global_step": 55262, "epoch": 1315} {"train_loss": -5.780298233032227, "global_step": 55263, "epoch": 1315} {"train_loss": -5.875438690185547, "global_step": 55264, "epoch": 1315} {"train_loss": -5.88572359085083, "global_step": 55265, "epoch": 1315} {"train_loss": -5.926933288574219, "global_step": 55266, "epoch": 1315} {"train_loss": -5.8965911865234375, "global_step": 55267, "epoch": 1315} {"train_loss": -5.8246378898620605, "global_step": 55268, "epoch": 1315} {"train_loss": -5.848451137542725, "global_step": 55269, "epoch": 1315} {"train_loss": -5.871847152709961, "global_step": 55270, "epoch": 1315} {"train_loss": -5.835900863011678, "global_step": 55271, "epoch": 1315, "val_loss": 74579.7421875} {"train_loss": -5.868501663208008, "global_step": 55272, "epoch": 1316} {"train_loss": -5.722546100616455, "global_step": 55273, "epoch": 1316} {"train_loss": -5.832307815551758, "global_step": 55274, "epoch": 1316} {"train_loss": -5.771101474761963, "global_step": 55275, "epoch": 1316} {"train_loss": -5.906919479370117, "global_step": 55276, "epoch": 1316} {"train_loss": -5.782016277313232, "global_step": 55277, "epoch": 1316} {"train_loss": -5.879208564758301, "global_step": 55278, "epoch": 1316} {"train_loss": -5.924901008605957, "global_step": 55279, "epoch": 1316} {"train_loss": -5.79386568069458, "global_step": 55280, "epoch": 1316} {"train_loss": -5.798391342163086, "global_step": 55281, "epoch": 1316} {"train_loss": -5.872788429260254, "global_step": 55282, "epoch": 1316} {"train_loss": -5.83747673034668, "global_step": 55283, "epoch": 1316} {"train_loss": -5.870742321014404, "global_step": 55284, "epoch": 1316} {"train_loss": -5.834329605102539, "global_step": 55285, "epoch": 1316} {"train_loss": -5.793825149536133, "global_step": 55286, "epoch": 1316} {"train_loss": -5.934746742248535, "global_step": 55287, "epoch": 1316} {"train_loss": -5.814827919006348, "global_step": 55288, "epoch": 1316} {"train_loss": -5.816987991333008, "global_step": 55289, "epoch": 1316} {"train_loss": -5.863252639770508, "global_step": 55290, "epoch": 1316} {"train_loss": -5.831368923187256, "global_step": 55291, "epoch": 1316} {"train_loss": -5.906796932220459, "global_step": 55292, "epoch": 1316} {"train_loss": -5.731351852416992, "global_step": 55293, "epoch": 1316} {"train_loss": -5.80996036529541, "global_step": 55294, "epoch": 1316} {"train_loss": -5.820724010467529, "global_step": 55295, "epoch": 1316} {"train_loss": -5.865262031555176, "global_step": 55296, "epoch": 1316} {"train_loss": -5.73392391204834, "global_step": 55297, "epoch": 1316} {"train_loss": -5.99680233001709, "global_step": 55298, "epoch": 1316} {"train_loss": -5.879166126251221, "global_step": 55299, "epoch": 1316} {"train_loss": -5.795476913452148, "global_step": 55300, "epoch": 1316} {"train_loss": -5.839068412780762, "global_step": 55301, "epoch": 1316} {"train_loss": -5.822397232055664, "global_step": 55302, "epoch": 1316} {"train_loss": -5.8562421798706055, "global_step": 55303, "epoch": 1316} {"train_loss": -5.793735504150391, "global_step": 55304, "epoch": 1316} {"train_loss": -5.604859352111816, "global_step": 55305, "epoch": 1316} {"train_loss": -5.89071798324585, "global_step": 55306, "epoch": 1316} {"train_loss": -5.904290199279785, "global_step": 55307, "epoch": 1316} {"train_loss": -5.935001373291016, "global_step": 55308, "epoch": 1316} {"train_loss": -5.854597568511963, "global_step": 55309, "epoch": 1316} {"train_loss": -5.756073951721191, "global_step": 55310, "epoch": 1316} {"train_loss": -5.779882431030273, "global_step": 55311, "epoch": 1316} {"train_loss": -5.895622730255127, "global_step": 55312, "epoch": 1316} {"train_loss": -5.834907543091547, "global_step": 55313, "epoch": 1316, "val_loss": 74085.7578125} {"train_loss": -5.867836952209473, "global_step": 55314, "epoch": 1317} {"train_loss": -5.841681957244873, "global_step": 55315, "epoch": 1317} {"train_loss": -5.920821189880371, "global_step": 55316, "epoch": 1317} {"train_loss": -5.936896324157715, "global_step": 55317, "epoch": 1317} {"train_loss": -5.896427631378174, "global_step": 55318, "epoch": 1317} {"train_loss": -5.766788482666016, "global_step": 55319, "epoch": 1317} {"train_loss": -5.92371940612793, "global_step": 55320, "epoch": 1317} {"train_loss": -5.88001012802124, "global_step": 55321, "epoch": 1317} {"train_loss": -5.9493207931518555, "global_step": 55322, "epoch": 1317} {"train_loss": -5.809098243713379, "global_step": 55323, "epoch": 1317} {"train_loss": -5.829822063446045, "global_step": 55324, "epoch": 1317} {"train_loss": -5.91646671295166, "global_step": 55325, "epoch": 1317} {"train_loss": -5.7900848388671875, "global_step": 55326, "epoch": 1317} {"train_loss": -5.899587631225586, "global_step": 55327, "epoch": 1317} {"train_loss": -5.766156196594238, "global_step": 55328, "epoch": 1317} {"train_loss": -5.85930061340332, "global_step": 55329, "epoch": 1317} {"train_loss": -5.8167901039123535, "global_step": 55330, "epoch": 1317} {"train_loss": -5.857032299041748, "global_step": 55331, "epoch": 1317} {"train_loss": -5.920267581939697, "global_step": 55332, "epoch": 1317} {"train_loss": -5.703065872192383, "global_step": 55333, "epoch": 1317} {"train_loss": -5.870767116546631, "global_step": 55334, "epoch": 1317} {"train_loss": -5.836560249328613, "global_step": 55335, "epoch": 1317} {"train_loss": -5.879369735717773, "global_step": 55336, "epoch": 1317} {"train_loss": -5.800786972045898, "global_step": 55337, "epoch": 1317} {"train_loss": -5.854248523712158, "global_step": 55338, "epoch": 1317} {"train_loss": -5.814497947692871, "global_step": 55339, "epoch": 1317} {"train_loss": -5.800897598266602, "global_step": 55340, "epoch": 1317} {"train_loss": -5.792350769042969, "global_step": 55341, "epoch": 1317} {"train_loss": -5.633154392242432, "global_step": 55342, "epoch": 1317} {"train_loss": -5.785159111022949, "global_step": 55343, "epoch": 1317} {"train_loss": -5.824256896972656, "global_step": 55344, "epoch": 1317} {"train_loss": -5.849228858947754, "global_step": 55345, "epoch": 1317} {"train_loss": -5.941717147827148, "global_step": 55346, "epoch": 1317} {"train_loss": -5.7868804931640625, "global_step": 55347, "epoch": 1317} {"train_loss": -5.787385940551758, "global_step": 55348, "epoch": 1317} {"train_loss": -5.775200843811035, "global_step": 55349, "epoch": 1317} {"train_loss": -5.775629997253418, "global_step": 55350, "epoch": 1317} {"train_loss": -5.743115425109863, "global_step": 55351, "epoch": 1317} {"train_loss": -5.8558669090271, "global_step": 55352, "epoch": 1317} {"train_loss": -5.792551040649414, "global_step": 55353, "epoch": 1317} {"train_loss": -5.84256649017334, "global_step": 55354, "epoch": 1317} {"train_loss": -5.835185652687436, "global_step": 55355, "epoch": 1317, "val_loss": 74535.015625} {"train_loss": -5.898037910461426, "global_step": 55356, "epoch": 1318} {"train_loss": -5.8802080154418945, "global_step": 55357, "epoch": 1318} {"train_loss": -5.776766777038574, "global_step": 55358, "epoch": 1318} {"train_loss": -5.759064674377441, "global_step": 55359, "epoch": 1318} {"train_loss": -5.860293865203857, "global_step": 55360, "epoch": 1318} {"train_loss": -5.846964359283447, "global_step": 55361, "epoch": 1318} {"train_loss": -5.730384826660156, "global_step": 55362, "epoch": 1318} {"train_loss": -5.8611016273498535, "global_step": 55363, "epoch": 1318} {"train_loss": -5.833270072937012, "global_step": 55364, "epoch": 1318} {"train_loss": -5.744533538818359, "global_step": 55365, "epoch": 1318} {"train_loss": -5.8151326179504395, "global_step": 55366, "epoch": 1318} {"train_loss": -5.803472995758057, "global_step": 55367, "epoch": 1318} {"train_loss": -6.026796340942383, "global_step": 55368, "epoch": 1318} {"train_loss": -5.894205093383789, "global_step": 55369, "epoch": 1318} {"train_loss": -5.848909378051758, "global_step": 55370, "epoch": 1318} {"train_loss": -5.906623363494873, "global_step": 55371, "epoch": 1318} {"train_loss": -5.846534252166748, "global_step": 55372, "epoch": 1318} {"train_loss": -5.8943939208984375, "global_step": 55373, "epoch": 1318} {"train_loss": -5.879603385925293, "global_step": 55374, "epoch": 1318} {"train_loss": -5.81924295425415, "global_step": 55375, "epoch": 1318} {"train_loss": -5.858639717102051, "global_step": 55376, "epoch": 1318} {"train_loss": -5.9550557136535645, "global_step": 55377, "epoch": 1318} {"train_loss": -5.953711032867432, "global_step": 55378, "epoch": 1318} {"train_loss": -5.857434272766113, "global_step": 55379, "epoch": 1318} {"train_loss": -5.819684028625488, "global_step": 55380, "epoch": 1318} {"train_loss": -5.8416643142700195, "global_step": 55381, "epoch": 1318} {"train_loss": -5.8465728759765625, "global_step": 55382, "epoch": 1318} {"train_loss": -5.880527496337891, "global_step": 55383, "epoch": 1318} {"train_loss": -5.799388885498047, "global_step": 55384, "epoch": 1318} {"train_loss": -5.826111793518066, "global_step": 55385, "epoch": 1318} {"train_loss": -5.854767799377441, "global_step": 55386, "epoch": 1318} {"train_loss": -5.794178485870361, "global_step": 55387, "epoch": 1318} {"train_loss": -5.899281024932861, "global_step": 55388, "epoch": 1318} {"train_loss": -5.860101699829102, "global_step": 55389, "epoch": 1318} {"train_loss": -5.774446487426758, "global_step": 55390, "epoch": 1318} {"train_loss": -5.7547502517700195, "global_step": 55391, "epoch": 1318} {"train_loss": -5.725447654724121, "global_step": 55392, "epoch": 1318} {"train_loss": -5.824276447296143, "global_step": 55393, "epoch": 1318} {"train_loss": -5.816689968109131, "global_step": 55394, "epoch": 1318} {"train_loss": -5.794084548950195, "global_step": 55395, "epoch": 1318} {"train_loss": -5.933911323547363, "global_step": 55396, "epoch": 1318} {"train_loss": -5.841656083152408, "global_step": 55397, "epoch": 1318, "val_loss": 73886.8359375} {"train_loss": -5.868974685668945, "global_step": 55398, "epoch": 1319} {"train_loss": -5.784151077270508, "global_step": 55399, "epoch": 1319} {"train_loss": -5.94433069229126, "global_step": 55400, "epoch": 1319} {"train_loss": -6.008131504058838, "global_step": 55401, "epoch": 1319} {"train_loss": -5.823524475097656, "global_step": 55402, "epoch": 1319} {"train_loss": -5.880154132843018, "global_step": 55403, "epoch": 1319} {"train_loss": -5.890797138214111, "global_step": 55404, "epoch": 1319} {"train_loss": -5.878364562988281, "global_step": 55405, "epoch": 1319} {"train_loss": -5.810514450073242, "global_step": 55406, "epoch": 1319} {"train_loss": -5.9030537605285645, "global_step": 55407, "epoch": 1319} {"train_loss": -5.873181343078613, "global_step": 55408, "epoch": 1319} {"train_loss": -5.913602828979492, "global_step": 55409, "epoch": 1319} {"train_loss": -5.845938682556152, "global_step": 55410, "epoch": 1319} {"train_loss": -5.881117820739746, "global_step": 55411, "epoch": 1319} {"train_loss": -5.904747009277344, "global_step": 55412, "epoch": 1319} {"train_loss": -5.848576068878174, "global_step": 55413, "epoch": 1319} {"train_loss": -5.669748783111572, "global_step": 55414, "epoch": 1319} {"train_loss": -5.911149978637695, "global_step": 55415, "epoch": 1319} {"train_loss": -5.810879707336426, "global_step": 55416, "epoch": 1319} {"train_loss": -5.819435119628906, "global_step": 55417, "epoch": 1319} {"train_loss": -5.936265468597412, "global_step": 55418, "epoch": 1319} {"train_loss": -5.845589637756348, "global_step": 55419, "epoch": 1319} {"train_loss": -5.795173645019531, "global_step": 55420, "epoch": 1319} {"train_loss": -5.727953910827637, "global_step": 55421, "epoch": 1319} {"train_loss": -5.863337516784668, "global_step": 55422, "epoch": 1319} {"train_loss": -5.787349700927734, "global_step": 55423, "epoch": 1319} {"train_loss": -5.930386066436768, "global_step": 55424, "epoch": 1319} {"train_loss": -5.700494766235352, "global_step": 55425, "epoch": 1319} {"train_loss": -5.797122001647949, "global_step": 55426, "epoch": 1319} {"train_loss": -5.795321941375732, "global_step": 55427, "epoch": 1319} {"train_loss": -5.799238204956055, "global_step": 55428, "epoch": 1319} {"train_loss": -5.802852630615234, "global_step": 55429, "epoch": 1319} {"train_loss": -5.922579765319824, "global_step": 55430, "epoch": 1319} {"train_loss": -5.868627071380615, "global_step": 55431, "epoch": 1319} {"train_loss": -5.724591255187988, "global_step": 55432, "epoch": 1319} {"train_loss": -5.795053482055664, "global_step": 55433, "epoch": 1319} {"train_loss": -5.673670768737793, "global_step": 55434, "epoch": 1319} {"train_loss": -5.834560871124268, "global_step": 55435, "epoch": 1319} {"train_loss": -5.74855375289917, "global_step": 55436, "epoch": 1319} {"train_loss": -5.712868690490723, "global_step": 55437, "epoch": 1319} {"train_loss": -5.768988609313965, "global_step": 55438, "epoch": 1319} {"train_loss": -5.8303323700314476, "global_step": 55439, "epoch": 1319, "val_loss": 74374.9453125} {"train_loss": -5.861593246459961, "global_step": 55440, "epoch": 1320} {"train_loss": -5.760012626647949, "global_step": 55441, "epoch": 1320} {"train_loss": -5.809728622436523, "global_step": 55442, "epoch": 1320} {"train_loss": -5.828908920288086, "global_step": 55443, "epoch": 1320} {"train_loss": -5.752283096313477, "global_step": 55444, "epoch": 1320} {"train_loss": -5.868585109710693, "global_step": 55445, "epoch": 1320} {"train_loss": -5.926667213439941, "global_step": 55446, "epoch": 1320} {"train_loss": -5.746277809143066, "global_step": 55447, "epoch": 1320} {"train_loss": -5.690025329589844, "global_step": 55448, "epoch": 1320} {"train_loss": -5.799922466278076, "global_step": 55449, "epoch": 1320} {"train_loss": -5.925013065338135, "global_step": 55450, "epoch": 1320} {"train_loss": -5.637513637542725, "global_step": 55451, "epoch": 1320} {"train_loss": -5.769980430603027, "global_step": 55452, "epoch": 1320} {"train_loss": -5.661135673522949, "global_step": 55453, "epoch": 1320} {"train_loss": -5.8224897384643555, "global_step": 55454, "epoch": 1320} {"train_loss": -5.8301801681518555, "global_step": 55455, "epoch": 1320} {"train_loss": -5.878185749053955, "global_step": 55456, "epoch": 1320} {"train_loss": -5.784890174865723, "global_step": 55457, "epoch": 1320} {"train_loss": -5.837316513061523, "global_step": 55458, "epoch": 1320} {"train_loss": -5.922744274139404, "global_step": 55459, "epoch": 1320} {"train_loss": -5.642853736877441, "global_step": 55460, "epoch": 1320} {"train_loss": -5.919637680053711, "global_step": 55461, "epoch": 1320} {"train_loss": -5.809823989868164, "global_step": 55462, "epoch": 1320} {"train_loss": -5.868635177612305, "global_step": 55463, "epoch": 1320} {"train_loss": -5.716632843017578, "global_step": 55464, "epoch": 1320} {"train_loss": -5.895013809204102, "global_step": 55465, "epoch": 1320} {"train_loss": -5.750530242919922, "global_step": 55466, "epoch": 1320} {"train_loss": -5.7109880447387695, "global_step": 55467, "epoch": 1320} {"train_loss": -5.8978705406188965, "global_step": 55468, "epoch": 1320} {"train_loss": -5.822005748748779, "global_step": 55469, "epoch": 1320} {"train_loss": -5.847903251647949, "global_step": 55470, "epoch": 1320} {"train_loss": -5.79591178894043, "global_step": 55471, "epoch": 1320} {"train_loss": -5.917861461639404, "global_step": 55472, "epoch": 1320} {"train_loss": -5.800264358520508, "global_step": 55473, "epoch": 1320} {"train_loss": -5.869440078735352, "global_step": 55474, "epoch": 1320} {"train_loss": -5.877952575683594, "global_step": 55475, "epoch": 1320} {"train_loss": -5.86897611618042, "global_step": 55476, "epoch": 1320} {"train_loss": -5.988413333892822, "global_step": 55477, "epoch": 1320} {"train_loss": -5.9158220291137695, "global_step": 55478, "epoch": 1320} {"train_loss": -5.823026180267334, "global_step": 55479, "epoch": 1320} {"train_loss": -5.790821075439453, "global_step": 55480, "epoch": 1320} {"train_loss": -5.82175384249006, "global_step": 55481, "epoch": 1320, "val_loss": 74096.3203125} {"train_loss": -5.87999153137207, "global_step": 55482, "epoch": 1321} {"train_loss": -5.749020099639893, "global_step": 55483, "epoch": 1321} {"train_loss": -5.984311103820801, "global_step": 55484, "epoch": 1321} {"train_loss": -5.866129398345947, "global_step": 55485, "epoch": 1321} {"train_loss": -5.876865386962891, "global_step": 55486, "epoch": 1321} {"train_loss": -5.835611343383789, "global_step": 55487, "epoch": 1321} {"train_loss": -5.753449440002441, "global_step": 55488, "epoch": 1321} {"train_loss": -5.8685712814331055, "global_step": 55489, "epoch": 1321} {"train_loss": -5.667234420776367, "global_step": 55490, "epoch": 1321} {"train_loss": -5.883928298950195, "global_step": 55491, "epoch": 1321} {"train_loss": -5.892249584197998, "global_step": 55492, "epoch": 1321} {"train_loss": -5.928297519683838, "global_step": 55493, "epoch": 1321} {"train_loss": -5.878357410430908, "global_step": 55494, "epoch": 1321} {"train_loss": -5.863574028015137, "global_step": 55495, "epoch": 1321} {"train_loss": -5.877737998962402, "global_step": 55496, "epoch": 1321} {"train_loss": -5.807015895843506, "global_step": 55497, "epoch": 1321} {"train_loss": -5.925736427307129, "global_step": 55498, "epoch": 1321} {"train_loss": -5.994366645812988, "global_step": 55499, "epoch": 1321} {"train_loss": -5.865839004516602, "global_step": 55500, "epoch": 1321} {"train_loss": -5.96807861328125, "global_step": 55501, "epoch": 1321} {"train_loss": -5.856706142425537, "global_step": 55502, "epoch": 1321} {"train_loss": -5.777375221252441, "global_step": 55503, "epoch": 1321} {"train_loss": -5.930708885192871, "global_step": 55504, "epoch": 1321} {"train_loss": -5.787080764770508, "global_step": 55505, "epoch": 1321} {"train_loss": -5.718052864074707, "global_step": 55506, "epoch": 1321} {"train_loss": -5.897714614868164, "global_step": 55507, "epoch": 1321} {"train_loss": -5.939513206481934, "global_step": 55508, "epoch": 1321} {"train_loss": -5.930438995361328, "global_step": 55509, "epoch": 1321} {"train_loss": -5.823293685913086, "global_step": 55510, "epoch": 1321} {"train_loss": -5.777279853820801, "global_step": 55511, "epoch": 1321} {"train_loss": -5.8795318603515625, "global_step": 55512, "epoch": 1321} {"train_loss": -5.895450592041016, "global_step": 55513, "epoch": 1321} {"train_loss": -5.727322578430176, "global_step": 55514, "epoch": 1321} {"train_loss": -5.756612300872803, "global_step": 55515, "epoch": 1321} {"train_loss": -5.807936191558838, "global_step": 55516, "epoch": 1321} {"train_loss": -5.730191230773926, "global_step": 55517, "epoch": 1321} {"train_loss": -5.877379894256592, "global_step": 55518, "epoch": 1321} {"train_loss": -5.889652252197266, "global_step": 55519, "epoch": 1321} {"train_loss": -5.803831577301025, "global_step": 55520, "epoch": 1321} {"train_loss": -5.781495094299316, "global_step": 55521, "epoch": 1321} {"train_loss": -5.851556301116943, "global_step": 55522, "epoch": 1321} {"train_loss": -5.846755765733265, "global_step": 55523, "epoch": 1321, "val_loss": 74301.4453125} {"train_loss": -5.823052406311035, "global_step": 55524, "epoch": 1322} {"train_loss": -6.013341426849365, "global_step": 55525, "epoch": 1322} {"train_loss": -5.718673229217529, "global_step": 55526, "epoch": 1322} {"train_loss": -5.879582405090332, "global_step": 55527, "epoch": 1322} {"train_loss": -5.919893741607666, "global_step": 55528, "epoch": 1322} {"train_loss": -5.847754955291748, "global_step": 55529, "epoch": 1322} {"train_loss": -5.74172830581665, "global_step": 55530, "epoch": 1322} {"train_loss": -5.8784918785095215, "global_step": 55531, "epoch": 1322} {"train_loss": -5.909441947937012, "global_step": 55532, "epoch": 1322} {"train_loss": -5.789187431335449, "global_step": 55533, "epoch": 1322} {"train_loss": -5.943097114562988, "global_step": 55534, "epoch": 1322} {"train_loss": -5.741735458374023, "global_step": 55535, "epoch": 1322} {"train_loss": -5.890882968902588, "global_step": 55536, "epoch": 1322} {"train_loss": -5.810786247253418, "global_step": 55537, "epoch": 1322} {"train_loss": -5.857729911804199, "global_step": 55538, "epoch": 1322} {"train_loss": -5.8666229248046875, "global_step": 55539, "epoch": 1322} {"train_loss": -5.849089622497559, "global_step": 55540, "epoch": 1322} {"train_loss": -5.776988983154297, "global_step": 55541, "epoch": 1322} {"train_loss": -5.760307312011719, "global_step": 55542, "epoch": 1322} {"train_loss": -5.7959394454956055, "global_step": 55543, "epoch": 1322} {"train_loss": -5.927435874938965, "global_step": 55544, "epoch": 1322} {"train_loss": -5.749835014343262, "global_step": 55545, "epoch": 1322} {"train_loss": -5.936467170715332, "global_step": 55546, "epoch": 1322} {"train_loss": -5.980997085571289, "global_step": 55547, "epoch": 1322} {"train_loss": -5.898138999938965, "global_step": 55548, "epoch": 1322} {"train_loss": -5.862327575683594, "global_step": 55549, "epoch": 1322} {"train_loss": -5.926761150360107, "global_step": 55550, "epoch": 1322} {"train_loss": -5.808237552642822, "global_step": 55551, "epoch": 1322} {"train_loss": -5.796991348266602, "global_step": 55552, "epoch": 1322} {"train_loss": -5.8634257316589355, "global_step": 55553, "epoch": 1322} {"train_loss": -5.858264923095703, "global_step": 55554, "epoch": 1322} {"train_loss": -5.844825744628906, "global_step": 55555, "epoch": 1322} {"train_loss": -5.884632110595703, "global_step": 55556, "epoch": 1322} {"train_loss": -5.779624938964844, "global_step": 55557, "epoch": 1322} {"train_loss": -5.885526657104492, "global_step": 55558, "epoch": 1322} {"train_loss": -5.822563648223877, "global_step": 55559, "epoch": 1322} {"train_loss": -5.760176658630371, "global_step": 55560, "epoch": 1322} {"train_loss": -5.8323774337768555, "global_step": 55561, "epoch": 1322} {"train_loss": -5.91448974609375, "global_step": 55562, "epoch": 1322} {"train_loss": -5.837327480316162, "global_step": 55563, "epoch": 1322} {"train_loss": -5.935974597930908, "global_step": 55564, "epoch": 1322} {"train_loss": -5.848193668183827, "global_step": 55565, "epoch": 1322, "val_loss": 74250.59375} {"train_loss": -5.979587078094482, "global_step": 55566, "epoch": 1323} {"train_loss": -5.840481758117676, "global_step": 55567, "epoch": 1323} {"train_loss": -5.93019962310791, "global_step": 55568, "epoch": 1323} {"train_loss": -5.873522758483887, "global_step": 55569, "epoch": 1323} {"train_loss": -5.82465934753418, "global_step": 55570, "epoch": 1323} {"train_loss": -5.878112316131592, "global_step": 55571, "epoch": 1323} {"train_loss": -5.921627044677734, "global_step": 55572, "epoch": 1323} {"train_loss": -5.723777770996094, "global_step": 55573, "epoch": 1323} {"train_loss": -5.794152736663818, "global_step": 55574, "epoch": 1323} {"train_loss": -5.9300336837768555, "global_step": 55575, "epoch": 1323} {"train_loss": -5.891869068145752, "global_step": 55576, "epoch": 1323} {"train_loss": -5.860167503356934, "global_step": 55577, "epoch": 1323} {"train_loss": -5.728669166564941, "global_step": 55578, "epoch": 1323} {"train_loss": -5.83985710144043, "global_step": 55579, "epoch": 1323} {"train_loss": -5.794656753540039, "global_step": 55580, "epoch": 1323} {"train_loss": -5.745009422302246, "global_step": 55581, "epoch": 1323} {"train_loss": -5.877780914306641, "global_step": 55582, "epoch": 1323} {"train_loss": -5.865176677703857, "global_step": 55583, "epoch": 1323} {"train_loss": -5.860476493835449, "global_step": 55584, "epoch": 1323} {"train_loss": -5.775466442108154, "global_step": 55585, "epoch": 1323} {"train_loss": -5.907733917236328, "global_step": 55586, "epoch": 1323} {"train_loss": -5.963105201721191, "global_step": 55587, "epoch": 1323} {"train_loss": -5.835934638977051, "global_step": 55588, "epoch": 1323} {"train_loss": -5.9330339431762695, "global_step": 55589, "epoch": 1323} {"train_loss": -5.8560333251953125, "global_step": 55590, "epoch": 1323} {"train_loss": -5.838500499725342, "global_step": 55591, "epoch": 1323} {"train_loss": -5.8519182205200195, "global_step": 55592, "epoch": 1323} {"train_loss": -5.967116832733154, "global_step": 55593, "epoch": 1323} {"train_loss": -5.989886283874512, "global_step": 55594, "epoch": 1323} {"train_loss": -5.792231559753418, "global_step": 55595, "epoch": 1323} {"train_loss": -5.786375045776367, "global_step": 55596, "epoch": 1323} {"train_loss": -5.730739116668701, "global_step": 55597, "epoch": 1323} {"train_loss": -5.831787109375, "global_step": 55598, "epoch": 1323} {"train_loss": -5.857328414916992, "global_step": 55599, "epoch": 1323} {"train_loss": -5.943341255187988, "global_step": 55600, "epoch": 1323} {"train_loss": -5.8463592529296875, "global_step": 55601, "epoch": 1323} {"train_loss": -5.814144134521484, "global_step": 55602, "epoch": 1323} {"train_loss": -5.9573774337768555, "global_step": 55603, "epoch": 1323} {"train_loss": -5.719222068786621, "global_step": 55604, "epoch": 1323} {"train_loss": -5.853320598602295, "global_step": 55605, "epoch": 1323} {"train_loss": -5.967279434204102, "global_step": 55606, "epoch": 1323} {"train_loss": -5.857101292837234, "global_step": 55607, "epoch": 1323, "val_loss": 74342.21875} {"train_loss": -5.84012508392334, "global_step": 55608, "epoch": 1324} {"train_loss": -5.720518112182617, "global_step": 55609, "epoch": 1324} {"train_loss": -5.886113166809082, "global_step": 55610, "epoch": 1324} {"train_loss": -5.976247787475586, "global_step": 55611, "epoch": 1324} {"train_loss": -5.874408721923828, "global_step": 55612, "epoch": 1324} {"train_loss": -5.827744483947754, "global_step": 55613, "epoch": 1324} {"train_loss": -6.001585006713867, "global_step": 55614, "epoch": 1324} {"train_loss": -5.813643932342529, "global_step": 55615, "epoch": 1324} {"train_loss": -5.942577362060547, "global_step": 55616, "epoch": 1324} {"train_loss": -5.884120941162109, "global_step": 55617, "epoch": 1324} {"train_loss": -5.923492431640625, "global_step": 55618, "epoch": 1324} {"train_loss": -5.927753448486328, "global_step": 55619, "epoch": 1324} {"train_loss": -5.89976167678833, "global_step": 55620, "epoch": 1324} {"train_loss": -5.953446388244629, "global_step": 55621, "epoch": 1324} {"train_loss": -5.87577486038208, "global_step": 55622, "epoch": 1324} {"train_loss": -5.847001552581787, "global_step": 55623, "epoch": 1324} {"train_loss": -5.890804767608643, "global_step": 55624, "epoch": 1324} {"train_loss": -5.981623649597168, "global_step": 55625, "epoch": 1324} {"train_loss": -5.810114860534668, "global_step": 55626, "epoch": 1324} {"train_loss": -5.97407341003418, "global_step": 55627, "epoch": 1324} {"train_loss": -5.819744110107422, "global_step": 55628, "epoch": 1324} {"train_loss": -5.907167434692383, "global_step": 55629, "epoch": 1324} {"train_loss": -5.78574275970459, "global_step": 55630, "epoch": 1324} {"train_loss": -5.87060546875, "global_step": 55631, "epoch": 1324} {"train_loss": -5.85800313949585, "global_step": 55632, "epoch": 1324} {"train_loss": -5.797406196594238, "global_step": 55633, "epoch": 1324} {"train_loss": -5.955796241760254, "global_step": 55634, "epoch": 1324} {"train_loss": -5.843746185302734, "global_step": 55635, "epoch": 1324} {"train_loss": -5.74186897277832, "global_step": 55636, "epoch": 1324} {"train_loss": -5.933127403259277, "global_step": 55637, "epoch": 1324} {"train_loss": -5.769104480743408, "global_step": 55638, "epoch": 1324} {"train_loss": -5.8584442138671875, "global_step": 55639, "epoch": 1324} {"train_loss": -5.741180419921875, "global_step": 55640, "epoch": 1324} {"train_loss": -5.821439266204834, "global_step": 55641, "epoch": 1324} {"train_loss": -5.875000953674316, "global_step": 55642, "epoch": 1324} {"train_loss": -5.804666996002197, "global_step": 55643, "epoch": 1324} {"train_loss": -5.852442741394043, "global_step": 55644, "epoch": 1324} {"train_loss": -5.7652435302734375, "global_step": 55645, "epoch": 1324} {"train_loss": -5.762828826904297, "global_step": 55646, "epoch": 1324} {"train_loss": -5.809284687042236, "global_step": 55647, "epoch": 1324} {"train_loss": -5.7508392333984375, "global_step": 55648, "epoch": 1324} {"train_loss": -5.855938900084722, "global_step": 55649, "epoch": 1324, "val_loss": 74277.6953125} {"train_loss": -5.79588508605957, "global_step": 55650, "epoch": 1325} {"train_loss": -5.8054094314575195, "global_step": 55651, "epoch": 1325} {"train_loss": -5.8369293212890625, "global_step": 55652, "epoch": 1325} {"train_loss": -5.878449440002441, "global_step": 55653, "epoch": 1325} {"train_loss": -5.936957359313965, "global_step": 55654, "epoch": 1325} {"train_loss": -5.862216472625732, "global_step": 55655, "epoch": 1325} {"train_loss": -5.931550979614258, "global_step": 55656, "epoch": 1325} {"train_loss": -5.7548370361328125, "global_step": 55657, "epoch": 1325} {"train_loss": -5.923558712005615, "global_step": 55658, "epoch": 1325} {"train_loss": -5.783782482147217, "global_step": 55659, "epoch": 1325} {"train_loss": -5.761765480041504, "global_step": 55660, "epoch": 1325} {"train_loss": -5.72993278503418, "global_step": 55661, "epoch": 1325} {"train_loss": -5.8482136726379395, "global_step": 55662, "epoch": 1325} {"train_loss": -5.913336753845215, "global_step": 55663, "epoch": 1325} {"train_loss": -5.737301826477051, "global_step": 55664, "epoch": 1325} {"train_loss": -5.84002685546875, "global_step": 55665, "epoch": 1325} {"train_loss": -5.864596843719482, "global_step": 55666, "epoch": 1325} {"train_loss": -5.8393964767456055, "global_step": 55667, "epoch": 1325} {"train_loss": -5.821086883544922, "global_step": 55668, "epoch": 1325} {"train_loss": -5.737240791320801, "global_step": 55669, "epoch": 1325} {"train_loss": -5.8264055252075195, "global_step": 55670, "epoch": 1325} {"train_loss": -5.604517936706543, "global_step": 55671, "epoch": 1325} {"train_loss": -5.870222091674805, "global_step": 55672, "epoch": 1325} {"train_loss": -5.842118263244629, "global_step": 55673, "epoch": 1325} {"train_loss": -5.797388076782227, "global_step": 55674, "epoch": 1325} {"train_loss": -5.762746810913086, "global_step": 55675, "epoch": 1325} {"train_loss": -5.708178520202637, "global_step": 55676, "epoch": 1325} {"train_loss": -5.9476470947265625, "global_step": 55677, "epoch": 1325} {"train_loss": -5.819091796875, "global_step": 55678, "epoch": 1325} {"train_loss": -5.833893775939941, "global_step": 55679, "epoch": 1325} {"train_loss": -5.760944843292236, "global_step": 55680, "epoch": 1325} {"train_loss": -5.835533142089844, "global_step": 55681, "epoch": 1325} {"train_loss": -5.882883071899414, "global_step": 55682, "epoch": 1325} {"train_loss": -5.7873005867004395, "global_step": 55683, "epoch": 1325} {"train_loss": -5.8129448890686035, "global_step": 55684, "epoch": 1325} {"train_loss": -5.831349849700928, "global_step": 55685, "epoch": 1325} {"train_loss": -5.901699542999268, "global_step": 55686, "epoch": 1325} {"train_loss": -5.85435676574707, "global_step": 55687, "epoch": 1325} {"train_loss": -5.874317169189453, "global_step": 55688, "epoch": 1325} {"train_loss": -5.830432415008545, "global_step": 55689, "epoch": 1325} {"train_loss": -5.839311599731445, "global_step": 55690, "epoch": 1325} {"train_loss": -5.82745749609811, "global_step": 55691, "epoch": 1325, "val_loss": 74175.4765625} {"train_loss": -5.872620582580566, "global_step": 55692, "epoch": 1326} {"train_loss": -5.851279258728027, "global_step": 55693, "epoch": 1326} {"train_loss": -5.916129112243652, "global_step": 55694, "epoch": 1326} {"train_loss": -5.802271366119385, "global_step": 55695, "epoch": 1326} {"train_loss": -5.822042465209961, "global_step": 55696, "epoch": 1326} {"train_loss": -5.856846809387207, "global_step": 55697, "epoch": 1326} {"train_loss": -5.777589797973633, "global_step": 55698, "epoch": 1326} {"train_loss": -5.768744468688965, "global_step": 55699, "epoch": 1326} {"train_loss": -5.923173904418945, "global_step": 55700, "epoch": 1326} {"train_loss": -5.87639045715332, "global_step": 55701, "epoch": 1326} {"train_loss": -5.867366313934326, "global_step": 55702, "epoch": 1326} {"train_loss": -5.8292460441589355, "global_step": 55703, "epoch": 1326} {"train_loss": -5.8133225440979, "global_step": 55704, "epoch": 1326} {"train_loss": -5.8123016357421875, "global_step": 55705, "epoch": 1326} {"train_loss": -5.838765621185303, "global_step": 55706, "epoch": 1326} {"train_loss": -5.868447303771973, "global_step": 55707, "epoch": 1326} {"train_loss": -5.8874664306640625, "global_step": 55708, "epoch": 1326} {"train_loss": -5.870062828063965, "global_step": 55709, "epoch": 1326} {"train_loss": -5.815474033355713, "global_step": 55710, "epoch": 1326} {"train_loss": -5.814259052276611, "global_step": 55711, "epoch": 1326} {"train_loss": -5.879181861877441, "global_step": 55712, "epoch": 1326} {"train_loss": -5.821322917938232, "global_step": 55713, "epoch": 1326} {"train_loss": -5.779468059539795, "global_step": 55714, "epoch": 1326} {"train_loss": -5.888684272766113, "global_step": 55715, "epoch": 1326} {"train_loss": -5.864087104797363, "global_step": 55716, "epoch": 1326} {"train_loss": -5.903782367706299, "global_step": 55717, "epoch": 1326} {"train_loss": -5.993203163146973, "global_step": 55718, "epoch": 1326} {"train_loss": -5.758458137512207, "global_step": 55719, "epoch": 1326} {"train_loss": -5.905547142028809, "global_step": 55720, "epoch": 1326} {"train_loss": -5.744167327880859, "global_step": 55721, "epoch": 1326} {"train_loss": -5.82513952255249, "global_step": 55722, "epoch": 1326} {"train_loss": -5.914968490600586, "global_step": 55723, "epoch": 1326} {"train_loss": -5.856009483337402, "global_step": 55724, "epoch": 1326} {"train_loss": -5.808043479919434, "global_step": 55725, "epoch": 1326} {"train_loss": -5.800865173339844, "global_step": 55726, "epoch": 1326} {"train_loss": -5.852272987365723, "global_step": 55727, "epoch": 1326} {"train_loss": -5.921968936920166, "global_step": 55728, "epoch": 1326} {"train_loss": -5.943755626678467, "global_step": 55729, "epoch": 1326} {"train_loss": -5.9083781242370605, "global_step": 55730, "epoch": 1326} {"train_loss": -5.859884262084961, "global_step": 55731, "epoch": 1326} {"train_loss": -5.8066582679748535, "global_step": 55732, "epoch": 1326} {"train_loss": -5.851919775917416, "global_step": 55733, "epoch": 1326, "val_loss": 74629.0234375} {"train_loss": -5.731327533721924, "global_step": 55734, "epoch": 1327} {"train_loss": -5.828956604003906, "global_step": 55735, "epoch": 1327} {"train_loss": -5.943703651428223, "global_step": 55736, "epoch": 1327} {"train_loss": -5.888491630554199, "global_step": 55737, "epoch": 1327} {"train_loss": -5.770046234130859, "global_step": 55738, "epoch": 1327} {"train_loss": -5.717532157897949, "global_step": 55739, "epoch": 1327} {"train_loss": -5.7522196769714355, "global_step": 55740, "epoch": 1327} {"train_loss": -5.891705513000488, "global_step": 55741, "epoch": 1327} {"train_loss": -5.754246234893799, "global_step": 55742, "epoch": 1327} {"train_loss": -5.817748546600342, "global_step": 55743, "epoch": 1327} {"train_loss": -5.938375473022461, "global_step": 55744, "epoch": 1327} {"train_loss": -5.869314193725586, "global_step": 55745, "epoch": 1327} {"train_loss": -5.7298712730407715, "global_step": 55746, "epoch": 1327} {"train_loss": -5.798700332641602, "global_step": 55747, "epoch": 1327} {"train_loss": -5.833417892456055, "global_step": 55748, "epoch": 1327} {"train_loss": -5.823993682861328, "global_step": 55749, "epoch": 1327} {"train_loss": -5.826390266418457, "global_step": 55750, "epoch": 1327} {"train_loss": -5.821567058563232, "global_step": 55751, "epoch": 1327} {"train_loss": -5.781041145324707, "global_step": 55752, "epoch": 1327} {"train_loss": -5.940207481384277, "global_step": 55753, "epoch": 1327} {"train_loss": -5.6506876945495605, "global_step": 55754, "epoch": 1327} {"train_loss": -5.786624908447266, "global_step": 55755, "epoch": 1327} {"train_loss": -5.733402729034424, "global_step": 55756, "epoch": 1327} {"train_loss": -5.9305620193481445, "global_step": 55757, "epoch": 1327} {"train_loss": -5.840218544006348, "global_step": 55758, "epoch": 1327} {"train_loss": -5.777510643005371, "global_step": 55759, "epoch": 1327} {"train_loss": -5.899995803833008, "global_step": 55760, "epoch": 1327} {"train_loss": -5.810444355010986, "global_step": 55761, "epoch": 1327} {"train_loss": -5.709798336029053, "global_step": 55762, "epoch": 1327} {"train_loss": -5.785120010375977, "global_step": 55763, "epoch": 1327} {"train_loss": -5.814764022827148, "global_step": 55764, "epoch": 1327} {"train_loss": -5.835958480834961, "global_step": 55765, "epoch": 1327} {"train_loss": -5.9777631759643555, "global_step": 55766, "epoch": 1327} {"train_loss": -5.721962928771973, "global_step": 55767, "epoch": 1327} {"train_loss": -5.854121208190918, "global_step": 55768, "epoch": 1327} {"train_loss": -5.784645080566406, "global_step": 55769, "epoch": 1327} {"train_loss": -5.80642032623291, "global_step": 55770, "epoch": 1327} {"train_loss": -5.741483211517334, "global_step": 55771, "epoch": 1327} {"train_loss": -5.768578052520752, "global_step": 55772, "epoch": 1327} {"train_loss": -5.7604169845581055, "global_step": 55773, "epoch": 1327} {"train_loss": -5.7622480392456055, "global_step": 55774, "epoch": 1327} {"train_loss": -5.811916487557547, "global_step": 55775, "epoch": 1327, "val_loss": 74266.640625} {"train_loss": -5.822870254516602, "global_step": 55776, "epoch": 1328} {"train_loss": -5.747429847717285, "global_step": 55777, "epoch": 1328} {"train_loss": -5.743875503540039, "global_step": 55778, "epoch": 1328} {"train_loss": -5.978445053100586, "global_step": 55779, "epoch": 1328} {"train_loss": -5.750086307525635, "global_step": 55780, "epoch": 1328} {"train_loss": -5.808785438537598, "global_step": 55781, "epoch": 1328} {"train_loss": -5.821954250335693, "global_step": 55782, "epoch": 1328} {"train_loss": -5.874822616577148, "global_step": 55783, "epoch": 1328} {"train_loss": -5.933312892913818, "global_step": 55784, "epoch": 1328} {"train_loss": -5.857442855834961, "global_step": 55785, "epoch": 1328} {"train_loss": -5.857789039611816, "global_step": 55786, "epoch": 1328} {"train_loss": -5.812478065490723, "global_step": 55787, "epoch": 1328} {"train_loss": -5.817020416259766, "global_step": 55788, "epoch": 1328} {"train_loss": -5.895064830780029, "global_step": 55789, "epoch": 1328} {"train_loss": -5.998998641967773, "global_step": 55790, "epoch": 1328} {"train_loss": -5.867669105529785, "global_step": 55791, "epoch": 1328} {"train_loss": -5.846590995788574, "global_step": 55792, "epoch": 1328} {"train_loss": -5.858393669128418, "global_step": 55793, "epoch": 1328} {"train_loss": -5.88682222366333, "global_step": 55794, "epoch": 1328} {"train_loss": -5.786158561706543, "global_step": 55795, "epoch": 1328} {"train_loss": -5.755306720733643, "global_step": 55796, "epoch": 1328} {"train_loss": -5.867319107055664, "global_step": 55797, "epoch": 1328} {"train_loss": -5.933959007263184, "global_step": 55798, "epoch": 1328} {"train_loss": -5.955150604248047, "global_step": 55799, "epoch": 1328} {"train_loss": -5.861510276794434, "global_step": 55800, "epoch": 1328} {"train_loss": -5.919720649719238, "global_step": 55801, "epoch": 1328} {"train_loss": -5.819028377532959, "global_step": 55802, "epoch": 1328} {"train_loss": -5.85288667678833, "global_step": 55803, "epoch": 1328} {"train_loss": -5.870405673980713, "global_step": 55804, "epoch": 1328} {"train_loss": -5.779850482940674, "global_step": 55805, "epoch": 1328} {"train_loss": -5.856770038604736, "global_step": 55806, "epoch": 1328} {"train_loss": -5.893963813781738, "global_step": 55807, "epoch": 1328} {"train_loss": -5.874233245849609, "global_step": 55808, "epoch": 1328} {"train_loss": -5.774547576904297, "global_step": 55809, "epoch": 1328} {"train_loss": -5.962280750274658, "global_step": 55810, "epoch": 1328} {"train_loss": -5.925236225128174, "global_step": 55811, "epoch": 1328} {"train_loss": -5.875059127807617, "global_step": 55812, "epoch": 1328} {"train_loss": -5.819228172302246, "global_step": 55813, "epoch": 1328} {"train_loss": -5.898755073547363, "global_step": 55814, "epoch": 1328} {"train_loss": -5.915659427642822, "global_step": 55815, "epoch": 1328} {"train_loss": -5.960283279418945, "global_step": 55816, "epoch": 1328} {"train_loss": -5.859829244159517, "global_step": 55817, "epoch": 1328, "val_loss": 74457.09375} {"train_loss": -5.817743301391602, "global_step": 55818, "epoch": 1329} {"train_loss": -5.829476356506348, "global_step": 55819, "epoch": 1329} {"train_loss": -5.838544845581055, "global_step": 55820, "epoch": 1329} {"train_loss": -5.863984107971191, "global_step": 55821, "epoch": 1329} {"train_loss": -5.861462116241455, "global_step": 55822, "epoch": 1329} {"train_loss": -5.78839111328125, "global_step": 55823, "epoch": 1329} {"train_loss": -5.820669174194336, "global_step": 55824, "epoch": 1329} {"train_loss": -5.853362083435059, "global_step": 55825, "epoch": 1329} {"train_loss": -5.8166823387146, "global_step": 55826, "epoch": 1329} {"train_loss": -5.826801300048828, "global_step": 55827, "epoch": 1329} {"train_loss": -5.8228654861450195, "global_step": 55828, "epoch": 1329} {"train_loss": -5.812567234039307, "global_step": 55829, "epoch": 1329} {"train_loss": -5.923624038696289, "global_step": 55830, "epoch": 1329} {"train_loss": -5.935425281524658, "global_step": 55831, "epoch": 1329} {"train_loss": -5.8415422439575195, "global_step": 55832, "epoch": 1329} {"train_loss": -5.6743879318237305, "global_step": 55833, "epoch": 1329} {"train_loss": -5.724033355712891, "global_step": 55834, "epoch": 1329} {"train_loss": -5.948394775390625, "global_step": 55835, "epoch": 1329} {"train_loss": -5.661132335662842, "global_step": 55836, "epoch": 1329} {"train_loss": -5.7504167556762695, "global_step": 55837, "epoch": 1329} {"train_loss": -5.933483123779297, "global_step": 55838, "epoch": 1329} {"train_loss": -5.676583766937256, "global_step": 55839, "epoch": 1329} {"train_loss": -5.748804092407227, "global_step": 55840, "epoch": 1329} {"train_loss": -5.7176737785339355, "global_step": 55841, "epoch": 1329} {"train_loss": -5.757194519042969, "global_step": 55842, "epoch": 1329} {"train_loss": -5.708889007568359, "global_step": 55843, "epoch": 1329} {"train_loss": -5.563687801361084, "global_step": 55844, "epoch": 1329} {"train_loss": -5.77686071395874, "global_step": 55845, "epoch": 1329} {"train_loss": -5.507144927978516, "global_step": 55846, "epoch": 1329} {"train_loss": -5.828560829162598, "global_step": 55847, "epoch": 1329} {"train_loss": -5.481884002685547, "global_step": 55848, "epoch": 1329} {"train_loss": -5.757297992706299, "global_step": 55849, "epoch": 1329} {"train_loss": -5.572067737579346, "global_step": 55850, "epoch": 1329} {"train_loss": -5.693325042724609, "global_step": 55851, "epoch": 1329} {"train_loss": -5.819833278656006, "global_step": 55852, "epoch": 1329} {"train_loss": -5.833835124969482, "global_step": 55853, "epoch": 1329} {"train_loss": -5.662738800048828, "global_step": 55854, "epoch": 1329} {"train_loss": -5.811949729919434, "global_step": 55855, "epoch": 1329} {"train_loss": -5.733591079711914, "global_step": 55856, "epoch": 1329} {"train_loss": -5.834503173828125, "global_step": 55857, "epoch": 1329} {"train_loss": -5.824435234069824, "global_step": 55858, "epoch": 1329} {"train_loss": -5.772499288831439, "global_step": 55859, "epoch": 1329, "val_loss": 75116.703125} {"train_loss": -5.764703750610352, "global_step": 55860, "epoch": 1330} {"train_loss": -5.878758907318115, "global_step": 55861, "epoch": 1330} {"train_loss": -5.713566303253174, "global_step": 55862, "epoch": 1330} {"train_loss": -5.794131278991699, "global_step": 55863, "epoch": 1330} {"train_loss": -5.849157333374023, "global_step": 55864, "epoch": 1330} {"train_loss": -5.8894453048706055, "global_step": 55865, "epoch": 1330} {"train_loss": -5.735495567321777, "global_step": 55866, "epoch": 1330} {"train_loss": -5.816030979156494, "global_step": 55867, "epoch": 1330} {"train_loss": -5.891735076904297, "global_step": 55868, "epoch": 1330} {"train_loss": -5.803401470184326, "global_step": 55869, "epoch": 1330} {"train_loss": -5.857963562011719, "global_step": 55870, "epoch": 1330} {"train_loss": -5.862323760986328, "global_step": 55871, "epoch": 1330} {"train_loss": -5.986018657684326, "global_step": 55872, "epoch": 1330} {"train_loss": -5.878920555114746, "global_step": 55873, "epoch": 1330} {"train_loss": -5.87033748626709, "global_step": 55874, "epoch": 1330} {"train_loss": -5.882851600646973, "global_step": 55875, "epoch": 1330} {"train_loss": -5.839090347290039, "global_step": 55876, "epoch": 1330} {"train_loss": -5.979844093322754, "global_step": 55877, "epoch": 1330} {"train_loss": -5.923405647277832, "global_step": 55878, "epoch": 1330} {"train_loss": -5.7503342628479, "global_step": 55879, "epoch": 1330} {"train_loss": -5.814496040344238, "global_step": 55880, "epoch": 1330} {"train_loss": -5.84094762802124, "global_step": 55881, "epoch": 1330} {"train_loss": -5.795323371887207, "global_step": 55882, "epoch": 1330} {"train_loss": -5.929276466369629, "global_step": 55883, "epoch": 1330} {"train_loss": -5.730843544006348, "global_step": 55884, "epoch": 1330} {"train_loss": -5.894436836242676, "global_step": 55885, "epoch": 1330} {"train_loss": -5.862093448638916, "global_step": 55886, "epoch": 1330} {"train_loss": -5.830911159515381, "global_step": 55887, "epoch": 1330} {"train_loss": -5.749232292175293, "global_step": 55888, "epoch": 1330} {"train_loss": -5.766051292419434, "global_step": 55889, "epoch": 1330} {"train_loss": -5.82835054397583, "global_step": 55890, "epoch": 1330} {"train_loss": -5.817140579223633, "global_step": 55891, "epoch": 1330} {"train_loss": -5.944871425628662, "global_step": 55892, "epoch": 1330} {"train_loss": -5.8282389640808105, "global_step": 55893, "epoch": 1330} {"train_loss": -5.954071998596191, "global_step": 55894, "epoch": 1330} {"train_loss": -5.8276495933532715, "global_step": 55895, "epoch": 1330} {"train_loss": -5.871187210083008, "global_step": 55896, "epoch": 1330} {"train_loss": -5.766045570373535, "global_step": 55897, "epoch": 1330} {"train_loss": -6.00688362121582, "global_step": 55898, "epoch": 1330} {"train_loss": -5.8578643798828125, "global_step": 55899, "epoch": 1330} {"train_loss": -5.968358993530273, "global_step": 55900, "epoch": 1330} {"train_loss": -5.851241475059872, "global_step": 55901, "epoch": 1330, "val_loss": 74221.8125} {"train_loss": -5.984212398529053, "global_step": 55902, "epoch": 1331} {"train_loss": -5.871325969696045, "global_step": 55903, "epoch": 1331} {"train_loss": -5.825553894042969, "global_step": 55904, "epoch": 1331} {"train_loss": -5.794212818145752, "global_step": 55905, "epoch": 1331} {"train_loss": -5.780163764953613, "global_step": 55906, "epoch": 1331} {"train_loss": -5.870473384857178, "global_step": 55907, "epoch": 1331} {"train_loss": -5.887870788574219, "global_step": 55908, "epoch": 1331} {"train_loss": -5.786986827850342, "global_step": 55909, "epoch": 1331} {"train_loss": -5.820131301879883, "global_step": 55910, "epoch": 1331} {"train_loss": -5.78157901763916, "global_step": 55911, "epoch": 1331} {"train_loss": -5.877283096313477, "global_step": 55912, "epoch": 1331} {"train_loss": -5.7927141189575195, "global_step": 55913, "epoch": 1331} {"train_loss": -5.743877410888672, "global_step": 55914, "epoch": 1331} {"train_loss": -5.905868053436279, "global_step": 55915, "epoch": 1331} {"train_loss": -5.89503812789917, "global_step": 55916, "epoch": 1331} {"train_loss": -5.816364288330078, "global_step": 55917, "epoch": 1331} {"train_loss": -5.863935470581055, "global_step": 55918, "epoch": 1331} {"train_loss": -5.894231796264648, "global_step": 55919, "epoch": 1331} {"train_loss": -5.904201984405518, "global_step": 55920, "epoch": 1331} {"train_loss": -5.846439361572266, "global_step": 55921, "epoch": 1331} {"train_loss": -5.902815341949463, "global_step": 55922, "epoch": 1331} {"train_loss": -5.810932636260986, "global_step": 55923, "epoch": 1331} {"train_loss": -5.851415157318115, "global_step": 55924, "epoch": 1331} {"train_loss": -5.941307544708252, "global_step": 55925, "epoch": 1331} {"train_loss": -5.849800109863281, "global_step": 55926, "epoch": 1331} {"train_loss": -5.869631290435791, "global_step": 55927, "epoch": 1331} {"train_loss": -5.799651145935059, "global_step": 55928, "epoch": 1331} {"train_loss": -5.889122009277344, "global_step": 55929, "epoch": 1331} {"train_loss": -5.704559803009033, "global_step": 55930, "epoch": 1331} {"train_loss": -5.804853439331055, "global_step": 55931, "epoch": 1331} {"train_loss": -5.7936906814575195, "global_step": 55932, "epoch": 1331} {"train_loss": -5.883063793182373, "global_step": 55933, "epoch": 1331} {"train_loss": -5.795534610748291, "global_step": 55934, "epoch": 1331} {"train_loss": -5.953480243682861, "global_step": 55935, "epoch": 1331} {"train_loss": -5.932587623596191, "global_step": 55936, "epoch": 1331} {"train_loss": -5.776729583740234, "global_step": 55937, "epoch": 1331} {"train_loss": -5.819546699523926, "global_step": 55938, "epoch": 1331} {"train_loss": -5.67252254486084, "global_step": 55939, "epoch": 1331} {"train_loss": -5.871782302856445, "global_step": 55940, "epoch": 1331} {"train_loss": -5.829883098602295, "global_step": 55941, "epoch": 1331} {"train_loss": -5.851211071014404, "global_step": 55942, "epoch": 1331} {"train_loss": -5.8449691817874, "global_step": 55943, "epoch": 1331, "val_loss": 74173.7578125} {"train_loss": -5.677682876586914, "global_step": 55944, "epoch": 1332} {"train_loss": -5.889144420623779, "global_step": 55945, "epoch": 1332} {"train_loss": -5.982316017150879, "global_step": 55946, "epoch": 1332} {"train_loss": -5.704678535461426, "global_step": 55947, "epoch": 1332} {"train_loss": -5.731932640075684, "global_step": 55948, "epoch": 1332} {"train_loss": -5.745497226715088, "global_step": 55949, "epoch": 1332} {"train_loss": -5.813259124755859, "global_step": 55950, "epoch": 1332} {"train_loss": -5.82830810546875, "global_step": 55951, "epoch": 1332} {"train_loss": -5.941821098327637, "global_step": 55952, "epoch": 1332} {"train_loss": -5.796582221984863, "global_step": 55953, "epoch": 1332} {"train_loss": -5.790147304534912, "global_step": 55954, "epoch": 1332} {"train_loss": -5.754570960998535, "global_step": 55955, "epoch": 1332} {"train_loss": -5.7981791496276855, "global_step": 55956, "epoch": 1332} {"train_loss": -5.796074867248535, "global_step": 55957, "epoch": 1332} {"train_loss": -5.778815269470215, "global_step": 55958, "epoch": 1332} {"train_loss": -5.813507080078125, "global_step": 55959, "epoch": 1332} {"train_loss": -5.881051540374756, "global_step": 55960, "epoch": 1332} {"train_loss": -5.866888046264648, "global_step": 55961, "epoch": 1332} {"train_loss": -5.888524055480957, "global_step": 55962, "epoch": 1332} {"train_loss": -5.868393421173096, "global_step": 55963, "epoch": 1332} {"train_loss": -5.789854049682617, "global_step": 55964, "epoch": 1332} {"train_loss": -5.808808326721191, "global_step": 55965, "epoch": 1332} {"train_loss": -5.776322841644287, "global_step": 55966, "epoch": 1332} {"train_loss": -5.912588119506836, "global_step": 55967, "epoch": 1332} {"train_loss": -5.838530540466309, "global_step": 55968, "epoch": 1332} {"train_loss": -5.862423896789551, "global_step": 55969, "epoch": 1332} {"train_loss": -5.943376064300537, "global_step": 55970, "epoch": 1332} {"train_loss": -5.858726501464844, "global_step": 55971, "epoch": 1332} {"train_loss": -5.918900489807129, "global_step": 55972, "epoch": 1332} {"train_loss": -5.8135986328125, "global_step": 55973, "epoch": 1332} {"train_loss": -5.7258195877075195, "global_step": 55974, "epoch": 1332} {"train_loss": -5.897481918334961, "global_step": 55975, "epoch": 1332} {"train_loss": -5.798907279968262, "global_step": 55976, "epoch": 1332} {"train_loss": -5.786539077758789, "global_step": 55977, "epoch": 1332} {"train_loss": -5.862010955810547, "global_step": 55978, "epoch": 1332} {"train_loss": -5.81849479675293, "global_step": 55979, "epoch": 1332} {"train_loss": -5.919973373413086, "global_step": 55980, "epoch": 1332} {"train_loss": -5.750968933105469, "global_step": 55981, "epoch": 1332} {"train_loss": -5.831988334655762, "global_step": 55982, "epoch": 1332} {"train_loss": -5.873591423034668, "global_step": 55983, "epoch": 1332} {"train_loss": -5.653375625610352, "global_step": 55984, "epoch": 1332} {"train_loss": -5.823762995856149, "global_step": 55985, "epoch": 1332, "val_loss": 74355.7109375} {"train_loss": -5.998896598815918, "global_step": 55986, "epoch": 1333} {"train_loss": -5.773519515991211, "global_step": 55987, "epoch": 1333} {"train_loss": -5.924263954162598, "global_step": 55988, "epoch": 1333} {"train_loss": -5.800948619842529, "global_step": 55989, "epoch": 1333} {"train_loss": -5.846401214599609, "global_step": 55990, "epoch": 1333} {"train_loss": -5.974002838134766, "global_step": 55991, "epoch": 1333} {"train_loss": -5.741751670837402, "global_step": 55992, "epoch": 1333} {"train_loss": -5.885811805725098, "global_step": 55993, "epoch": 1333} {"train_loss": -5.792523384094238, "global_step": 55994, "epoch": 1333} {"train_loss": -5.780148029327393, "global_step": 55995, "epoch": 1333} {"train_loss": -5.8892035484313965, "global_step": 55996, "epoch": 1333} {"train_loss": -5.782346248626709, "global_step": 55997, "epoch": 1333} {"train_loss": -5.795792102813721, "global_step": 55998, "epoch": 1333} {"train_loss": -5.890851974487305, "global_step": 55999, "epoch": 1333} {"train_loss": -5.810205936431885, "global_step": 56000, "epoch": 1333} {"train_loss": -6.013978004455566, "global_step": 56001, "epoch": 1333} {"train_loss": -5.839085102081299, "global_step": 56002, "epoch": 1333} {"train_loss": -5.932493686676025, "global_step": 56003, "epoch": 1333} {"train_loss": -5.768194198608398, "global_step": 56004, "epoch": 1333} {"train_loss": -5.873931407928467, "global_step": 56005, "epoch": 1333} {"train_loss": -5.835474967956543, "global_step": 56006, "epoch": 1333} {"train_loss": -5.86580228805542, "global_step": 56007, "epoch": 1333} {"train_loss": -5.782232284545898, "global_step": 56008, "epoch": 1333} {"train_loss": -5.843070030212402, "global_step": 56009, "epoch": 1333} {"train_loss": -5.89100980758667, "global_step": 56010, "epoch": 1333} {"train_loss": -5.816366195678711, "global_step": 56011, "epoch": 1333} {"train_loss": -5.837535381317139, "global_step": 56012, "epoch": 1333} {"train_loss": -5.847005844116211, "global_step": 56013, "epoch": 1333} {"train_loss": -5.777860164642334, "global_step": 56014, "epoch": 1333} {"train_loss": -5.843475818634033, "global_step": 56015, "epoch": 1333} {"train_loss": -5.785693645477295, "global_step": 56016, "epoch": 1333} {"train_loss": -5.727423667907715, "global_step": 56017, "epoch": 1333} {"train_loss": -5.767708778381348, "global_step": 56018, "epoch": 1333} {"train_loss": -5.689620494842529, "global_step": 56019, "epoch": 1333} {"train_loss": -5.764584541320801, "global_step": 56020, "epoch": 1333} {"train_loss": -5.863641262054443, "global_step": 56021, "epoch": 1333} {"train_loss": -5.979589462280273, "global_step": 56022, "epoch": 1333} {"train_loss": -5.899353981018066, "global_step": 56023, "epoch": 1333} {"train_loss": -5.843462944030762, "global_step": 56024, "epoch": 1333} {"train_loss": -5.854404449462891, "global_step": 56025, "epoch": 1333} {"train_loss": -5.758166790008545, "global_step": 56026, "epoch": 1333} {"train_loss": -5.837816499528431, "global_step": 56027, "epoch": 1333, "val_loss": 74472.125} {"train_loss": -5.846566677093506, "global_step": 56028, "epoch": 1334} {"train_loss": -5.863788604736328, "global_step": 56029, "epoch": 1334} {"train_loss": -5.877376556396484, "global_step": 56030, "epoch": 1334} {"train_loss": -5.910823822021484, "global_step": 56031, "epoch": 1334} {"train_loss": -5.775051116943359, "global_step": 56032, "epoch": 1334} {"train_loss": -5.898859977722168, "global_step": 56033, "epoch": 1334} {"train_loss": -5.730053901672363, "global_step": 56034, "epoch": 1334} {"train_loss": -5.890813827514648, "global_step": 56035, "epoch": 1334} {"train_loss": -5.784738540649414, "global_step": 56036, "epoch": 1334} {"train_loss": -5.890453815460205, "global_step": 56037, "epoch": 1334} {"train_loss": -5.905434608459473, "global_step": 56038, "epoch": 1334} {"train_loss": -5.898202896118164, "global_step": 56039, "epoch": 1334} {"train_loss": -5.876623630523682, "global_step": 56040, "epoch": 1334} {"train_loss": -5.936405181884766, "global_step": 56041, "epoch": 1334} {"train_loss": -5.873136520385742, "global_step": 56042, "epoch": 1334} {"train_loss": -5.910691261291504, "global_step": 56043, "epoch": 1334} {"train_loss": -5.856315612792969, "global_step": 56044, "epoch": 1334} {"train_loss": -5.926769733428955, "global_step": 56045, "epoch": 1334} {"train_loss": -5.900712013244629, "global_step": 56046, "epoch": 1334} {"train_loss": -5.792679786682129, "global_step": 56047, "epoch": 1334} {"train_loss": -5.835732460021973, "global_step": 56048, "epoch": 1334} {"train_loss": -5.786526679992676, "global_step": 56049, "epoch": 1334} {"train_loss": -5.880122184753418, "global_step": 56050, "epoch": 1334} {"train_loss": -5.820125579833984, "global_step": 56051, "epoch": 1334} {"train_loss": -5.885949611663818, "global_step": 56052, "epoch": 1334} {"train_loss": -5.833603858947754, "global_step": 56053, "epoch": 1334} {"train_loss": -5.792414665222168, "global_step": 56054, "epoch": 1334} {"train_loss": -5.776386260986328, "global_step": 56055, "epoch": 1334} {"train_loss": -5.880369186401367, "global_step": 56056, "epoch": 1334} {"train_loss": -5.845091819763184, "global_step": 56057, "epoch": 1334} {"train_loss": -5.783069133758545, "global_step": 56058, "epoch": 1334} {"train_loss": -5.686385154724121, "global_step": 56059, "epoch": 1334} {"train_loss": -5.711312770843506, "global_step": 56060, "epoch": 1334} {"train_loss": -5.793420791625977, "global_step": 56061, "epoch": 1334} {"train_loss": -5.84827184677124, "global_step": 56062, "epoch": 1334} {"train_loss": -5.885008811950684, "global_step": 56063, "epoch": 1334} {"train_loss": -5.869019031524658, "global_step": 56064, "epoch": 1334} {"train_loss": -5.800912380218506, "global_step": 56065, "epoch": 1334} {"train_loss": -5.810892105102539, "global_step": 56066, "epoch": 1334} {"train_loss": -5.833248615264893, "global_step": 56067, "epoch": 1334} {"train_loss": -5.809543609619141, "global_step": 56068, "epoch": 1334} {"train_loss": -5.843456325076875, "global_step": 56069, "epoch": 1334, "val_loss": 74369.2578125} {"train_loss": -5.813694000244141, "global_step": 56070, "epoch": 1335} {"train_loss": -5.849276542663574, "global_step": 56071, "epoch": 1335} {"train_loss": -5.915852069854736, "global_step": 56072, "epoch": 1335} {"train_loss": -5.772579193115234, "global_step": 56073, "epoch": 1335} {"train_loss": -5.886081695556641, "global_step": 56074, "epoch": 1335} {"train_loss": -5.708295822143555, "global_step": 56075, "epoch": 1335} {"train_loss": -5.939947128295898, "global_step": 56076, "epoch": 1335} {"train_loss": -5.859255790710449, "global_step": 56077, "epoch": 1335} {"train_loss": -5.67917537689209, "global_step": 56078, "epoch": 1335} {"train_loss": -5.8737382888793945, "global_step": 56079, "epoch": 1335} {"train_loss": -5.82892370223999, "global_step": 56080, "epoch": 1335} {"train_loss": -5.845560073852539, "global_step": 56081, "epoch": 1335} {"train_loss": -5.924877166748047, "global_step": 56082, "epoch": 1335} {"train_loss": -5.94814920425415, "global_step": 56083, "epoch": 1335} {"train_loss": -5.779305934906006, "global_step": 56084, "epoch": 1335} {"train_loss": -5.771883010864258, "global_step": 56085, "epoch": 1335} {"train_loss": -5.887821197509766, "global_step": 56086, "epoch": 1335} {"train_loss": -5.806946277618408, "global_step": 56087, "epoch": 1335} {"train_loss": -5.802549839019775, "global_step": 56088, "epoch": 1335} {"train_loss": -5.924159049987793, "global_step": 56089, "epoch": 1335} {"train_loss": -5.7999725341796875, "global_step": 56090, "epoch": 1335} {"train_loss": -5.931815147399902, "global_step": 56091, "epoch": 1335} {"train_loss": -5.755451202392578, "global_step": 56092, "epoch": 1335} {"train_loss": -5.845557689666748, "global_step": 56093, "epoch": 1335} {"train_loss": -5.891465187072754, "global_step": 56094, "epoch": 1335} {"train_loss": -5.934018135070801, "global_step": 56095, "epoch": 1335} {"train_loss": -5.834860801696777, "global_step": 56096, "epoch": 1335} {"train_loss": -5.700267791748047, "global_step": 56097, "epoch": 1335} {"train_loss": -5.958737373352051, "global_step": 56098, "epoch": 1335} {"train_loss": -5.801276206970215, "global_step": 56099, "epoch": 1335} {"train_loss": -5.809162139892578, "global_step": 56100, "epoch": 1335} {"train_loss": -5.842761993408203, "global_step": 56101, "epoch": 1335} {"train_loss": -5.88167142868042, "global_step": 56102, "epoch": 1335} {"train_loss": -5.850783824920654, "global_step": 56103, "epoch": 1335} {"train_loss": -5.875542640686035, "global_step": 56104, "epoch": 1335} {"train_loss": -5.871301651000977, "global_step": 56105, "epoch": 1335} {"train_loss": -5.986037731170654, "global_step": 56106, "epoch": 1335} {"train_loss": -5.839086532592773, "global_step": 56107, "epoch": 1335} {"train_loss": -5.846377372741699, "global_step": 56108, "epoch": 1335} {"train_loss": -5.825414657592773, "global_step": 56109, "epoch": 1335} {"train_loss": -5.872766494750977, "global_step": 56110, "epoch": 1335} {"train_loss": -5.848108473278227, "global_step": 56111, "epoch": 1335, "val_loss": 74465.15625} {"train_loss": -5.7104644775390625, "global_step": 56112, "epoch": 1336} {"train_loss": -5.813996315002441, "global_step": 56113, "epoch": 1336} {"train_loss": -5.9017791748046875, "global_step": 56114, "epoch": 1336} {"train_loss": -5.773816108703613, "global_step": 56115, "epoch": 1336} {"train_loss": -5.799851417541504, "global_step": 56116, "epoch": 1336} {"train_loss": -5.851263999938965, "global_step": 56117, "epoch": 1336} {"train_loss": -5.835397720336914, "global_step": 56118, "epoch": 1336} {"train_loss": -5.93266487121582, "global_step": 56119, "epoch": 1336} {"train_loss": -5.88368034362793, "global_step": 56120, "epoch": 1336} {"train_loss": -5.724921226501465, "global_step": 56121, "epoch": 1336} {"train_loss": -5.916027069091797, "global_step": 56122, "epoch": 1336} {"train_loss": -5.765962600708008, "global_step": 56123, "epoch": 1336} {"train_loss": -5.749370574951172, "global_step": 56124, "epoch": 1336} {"train_loss": -5.826964855194092, "global_step": 56125, "epoch": 1336} {"train_loss": -5.801708698272705, "global_step": 56126, "epoch": 1336} {"train_loss": -5.773680686950684, "global_step": 56127, "epoch": 1336} {"train_loss": -5.798467636108398, "global_step": 56128, "epoch": 1336} {"train_loss": -5.938003063201904, "global_step": 56129, "epoch": 1336} {"train_loss": -5.763243675231934, "global_step": 56130, "epoch": 1336} {"train_loss": -5.791860580444336, "global_step": 56131, "epoch": 1336} {"train_loss": -5.852583408355713, "global_step": 56132, "epoch": 1336} {"train_loss": -5.804882049560547, "global_step": 56133, "epoch": 1336} {"train_loss": -5.783257484436035, "global_step": 56134, "epoch": 1336} {"train_loss": -5.889468193054199, "global_step": 56135, "epoch": 1336} {"train_loss": -5.781794548034668, "global_step": 56136, "epoch": 1336} {"train_loss": -5.782199859619141, "global_step": 56137, "epoch": 1336} {"train_loss": -5.910503387451172, "global_step": 56138, "epoch": 1336} {"train_loss": -5.865619659423828, "global_step": 56139, "epoch": 1336} {"train_loss": -5.759894847869873, "global_step": 56140, "epoch": 1336} {"train_loss": -5.830018043518066, "global_step": 56141, "epoch": 1336} {"train_loss": -5.794382095336914, "global_step": 56142, "epoch": 1336} {"train_loss": -5.88704776763916, "global_step": 56143, "epoch": 1336} {"train_loss": -5.928723335266113, "global_step": 56144, "epoch": 1336} {"train_loss": -5.883467674255371, "global_step": 56145, "epoch": 1336} {"train_loss": -5.857954025268555, "global_step": 56146, "epoch": 1336} {"train_loss": -5.988459587097168, "global_step": 56147, "epoch": 1336} {"train_loss": -5.764841079711914, "global_step": 56148, "epoch": 1336} {"train_loss": -5.82466459274292, "global_step": 56149, "epoch": 1336} {"train_loss": -5.8570427894592285, "global_step": 56150, "epoch": 1336} {"train_loss": -5.755641937255859, "global_step": 56151, "epoch": 1336} {"train_loss": -5.777412414550781, "global_step": 56152, "epoch": 1336} {"train_loss": -5.826161623001099, "global_step": 56153, "epoch": 1336, "val_loss": 75292.109375} {"train_loss": -5.578544616699219, "global_step": 56154, "epoch": 1337} {"train_loss": -5.776089668273926, "global_step": 56155, "epoch": 1337} {"train_loss": -5.705521106719971, "global_step": 56156, "epoch": 1337} {"train_loss": -5.813963890075684, "global_step": 56157, "epoch": 1337} {"train_loss": -5.884139537811279, "global_step": 56158, "epoch": 1337} {"train_loss": -5.852775573730469, "global_step": 56159, "epoch": 1337} {"train_loss": -5.871696472167969, "global_step": 56160, "epoch": 1337} {"train_loss": -5.711780071258545, "global_step": 56161, "epoch": 1337} {"train_loss": -5.807210445404053, "global_step": 56162, "epoch": 1337} {"train_loss": -5.64624547958374, "global_step": 56163, "epoch": 1337} {"train_loss": -5.816685199737549, "global_step": 56164, "epoch": 1337} {"train_loss": -5.833026885986328, "global_step": 56165, "epoch": 1337} {"train_loss": -5.8198771476745605, "global_step": 56166, "epoch": 1337} {"train_loss": -5.683432579040527, "global_step": 56167, "epoch": 1337} {"train_loss": -5.868784427642822, "global_step": 56168, "epoch": 1337} {"train_loss": -5.733853340148926, "global_step": 56169, "epoch": 1337} {"train_loss": -5.889512062072754, "global_step": 56170, "epoch": 1337} {"train_loss": -5.923106670379639, "global_step": 56171, "epoch": 1337} {"train_loss": -5.8525590896606445, "global_step": 56172, "epoch": 1337} {"train_loss": -5.794329643249512, "global_step": 56173, "epoch": 1337} {"train_loss": -5.929599761962891, "global_step": 56174, "epoch": 1337} {"train_loss": -5.862792491912842, "global_step": 56175, "epoch": 1337} {"train_loss": -5.928791046142578, "global_step": 56176, "epoch": 1337} {"train_loss": -5.871753215789795, "global_step": 56177, "epoch": 1337} {"train_loss": -5.8329758644104, "global_step": 56178, "epoch": 1337} {"train_loss": -5.830791473388672, "global_step": 56179, "epoch": 1337} {"train_loss": -5.862947940826416, "global_step": 56180, "epoch": 1337} {"train_loss": -5.9036455154418945, "global_step": 56181, "epoch": 1337} {"train_loss": -5.841526985168457, "global_step": 56182, "epoch": 1337} {"train_loss": -5.885308742523193, "global_step": 56183, "epoch": 1337} {"train_loss": -5.85057258605957, "global_step": 56184, "epoch": 1337} {"train_loss": -5.864774703979492, "global_step": 56185, "epoch": 1337} {"train_loss": -5.776021480560303, "global_step": 56186, "epoch": 1337} {"train_loss": -5.817405700683594, "global_step": 56187, "epoch": 1337} {"train_loss": -5.930027008056641, "global_step": 56188, "epoch": 1337} {"train_loss": -5.838913917541504, "global_step": 56189, "epoch": 1337} {"train_loss": -5.780789375305176, "global_step": 56190, "epoch": 1337} {"train_loss": -5.899028778076172, "global_step": 56191, "epoch": 1337} {"train_loss": -5.749223709106445, "global_step": 56192, "epoch": 1337} {"train_loss": -5.736512184143066, "global_step": 56193, "epoch": 1337} {"train_loss": -5.860004425048828, "global_step": 56194, "epoch": 1337} {"train_loss": -5.821364561716716, "global_step": 56195, "epoch": 1337, "val_loss": 74286.7890625} {"train_loss": -5.85477352142334, "global_step": 56196, "epoch": 1338} {"train_loss": -5.786969184875488, "global_step": 56197, "epoch": 1338} {"train_loss": -6.020411491394043, "global_step": 56198, "epoch": 1338} {"train_loss": -5.878120422363281, "global_step": 56199, "epoch": 1338} {"train_loss": -5.938852310180664, "global_step": 56200, "epoch": 1338} {"train_loss": -5.9278435707092285, "global_step": 56201, "epoch": 1338} {"train_loss": -5.952469825744629, "global_step": 56202, "epoch": 1338} {"train_loss": -5.920404434204102, "global_step": 56203, "epoch": 1338} {"train_loss": -5.830174446105957, "global_step": 56204, "epoch": 1338} {"train_loss": -5.86691427230835, "global_step": 56205, "epoch": 1338} {"train_loss": -5.859275817871094, "global_step": 56206, "epoch": 1338} {"train_loss": -5.878837585449219, "global_step": 56207, "epoch": 1338} {"train_loss": -5.8186354637146, "global_step": 56208, "epoch": 1338} {"train_loss": -5.869947910308838, "global_step": 56209, "epoch": 1338} {"train_loss": -5.834432601928711, "global_step": 56210, "epoch": 1338} {"train_loss": -5.91766357421875, "global_step": 56211, "epoch": 1338} {"train_loss": -5.859788417816162, "global_step": 56212, "epoch": 1338} {"train_loss": -5.9413628578186035, "global_step": 56213, "epoch": 1338} {"train_loss": -5.839605331420898, "global_step": 56214, "epoch": 1338} {"train_loss": -5.842842102050781, "global_step": 56215, "epoch": 1338} {"train_loss": -5.76525354385376, "global_step": 56216, "epoch": 1338} {"train_loss": -5.893036842346191, "global_step": 56217, "epoch": 1338} {"train_loss": -5.801214218139648, "global_step": 56218, "epoch": 1338} {"train_loss": -5.890508651733398, "global_step": 56219, "epoch": 1338} {"train_loss": -5.873621940612793, "global_step": 56220, "epoch": 1338} {"train_loss": -5.803158760070801, "global_step": 56221, "epoch": 1338} {"train_loss": -5.973571300506592, "global_step": 56222, "epoch": 1338} {"train_loss": -5.9326653480529785, "global_step": 56223, "epoch": 1338} {"train_loss": -5.9134626388549805, "global_step": 56224, "epoch": 1338} {"train_loss": -5.841723918914795, "global_step": 56225, "epoch": 1338} {"train_loss": -5.8900146484375, "global_step": 56226, "epoch": 1338} {"train_loss": -5.830343723297119, "global_step": 56227, "epoch": 1338} {"train_loss": -5.961270332336426, "global_step": 56228, "epoch": 1338} {"train_loss": -5.9082183837890625, "global_step": 56229, "epoch": 1338} {"train_loss": -5.924225330352783, "global_step": 56230, "epoch": 1338} {"train_loss": -5.910587310791016, "global_step": 56231, "epoch": 1338} {"train_loss": -5.779857635498047, "global_step": 56232, "epoch": 1338} {"train_loss": -5.836192607879639, "global_step": 56233, "epoch": 1338} {"train_loss": -5.784451007843018, "global_step": 56234, "epoch": 1338} {"train_loss": -5.847367286682129, "global_step": 56235, "epoch": 1338} {"train_loss": -5.777745723724365, "global_step": 56236, "epoch": 1338} {"train_loss": -5.868796223685855, "global_step": 56237, "epoch": 1338, "val_loss": 74612.9921875} {"train_loss": -5.855116844177246, "global_step": 56238, "epoch": 1339} {"train_loss": -5.928811073303223, "global_step": 56239, "epoch": 1339} {"train_loss": -5.762234687805176, "global_step": 56240, "epoch": 1339} {"train_loss": -5.904179573059082, "global_step": 56241, "epoch": 1339} {"train_loss": -5.84776496887207, "global_step": 56242, "epoch": 1339} {"train_loss": -5.828007221221924, "global_step": 56243, "epoch": 1339} {"train_loss": -5.931734085083008, "global_step": 56244, "epoch": 1339} {"train_loss": -5.858848571777344, "global_step": 56245, "epoch": 1339} {"train_loss": -5.889880180358887, "global_step": 56246, "epoch": 1339} {"train_loss": -5.902932643890381, "global_step": 56247, "epoch": 1339} {"train_loss": -5.798070430755615, "global_step": 56248, "epoch": 1339} {"train_loss": -5.784624099731445, "global_step": 56249, "epoch": 1339} {"train_loss": -5.857693672180176, "global_step": 56250, "epoch": 1339} {"train_loss": -5.8688788414001465, "global_step": 56251, "epoch": 1339} {"train_loss": -5.895598411560059, "global_step": 56252, "epoch": 1339} {"train_loss": -5.723010063171387, "global_step": 56253, "epoch": 1339} {"train_loss": -5.80650520324707, "global_step": 56254, "epoch": 1339} {"train_loss": -5.8580522537231445, "global_step": 56255, "epoch": 1339} {"train_loss": -5.8331451416015625, "global_step": 56256, "epoch": 1339} {"train_loss": -5.899162292480469, "global_step": 56257, "epoch": 1339} {"train_loss": -5.818470001220703, "global_step": 56258, "epoch": 1339} {"train_loss": -5.811152935028076, "global_step": 56259, "epoch": 1339} {"train_loss": -5.734273910522461, "global_step": 56260, "epoch": 1339} {"train_loss": -5.885217666625977, "global_step": 56261, "epoch": 1339} {"train_loss": -5.805832386016846, "global_step": 56262, "epoch": 1339} {"train_loss": -5.889891147613525, "global_step": 56263, "epoch": 1339} {"train_loss": -5.847438335418701, "global_step": 56264, "epoch": 1339} {"train_loss": -5.850066661834717, "global_step": 56265, "epoch": 1339} {"train_loss": -5.884121417999268, "global_step": 56266, "epoch": 1339} {"train_loss": -5.8529205322265625, "global_step": 56267, "epoch": 1339} {"train_loss": -5.832464218139648, "global_step": 56268, "epoch": 1339} {"train_loss": -5.919134140014648, "global_step": 56269, "epoch": 1339} {"train_loss": -5.915849208831787, "global_step": 56270, "epoch": 1339} {"train_loss": -5.803419589996338, "global_step": 56271, "epoch": 1339} {"train_loss": -5.8015031814575195, "global_step": 56272, "epoch": 1339} {"train_loss": -5.901359558105469, "global_step": 56273, "epoch": 1339} {"train_loss": -5.755154609680176, "global_step": 56274, "epoch": 1339} {"train_loss": -5.918968200683594, "global_step": 56275, "epoch": 1339} {"train_loss": -5.872424125671387, "global_step": 56276, "epoch": 1339} {"train_loss": -5.853508949279785, "global_step": 56277, "epoch": 1339} {"train_loss": -5.890751361846924, "global_step": 56278, "epoch": 1339} {"train_loss": -5.851290895825341, "global_step": 56279, "epoch": 1339, "val_loss": 74403.0859375} {"train_loss": -5.799103736877441, "global_step": 56280, "epoch": 1340} {"train_loss": -5.916608810424805, "global_step": 56281, "epoch": 1340} {"train_loss": -5.817628383636475, "global_step": 56282, "epoch": 1340} {"train_loss": -5.736112594604492, "global_step": 56283, "epoch": 1340} {"train_loss": -5.879884243011475, "global_step": 56284, "epoch": 1340} {"train_loss": -5.776588439941406, "global_step": 56285, "epoch": 1340} {"train_loss": -6.00306510925293, "global_step": 56286, "epoch": 1340} {"train_loss": -5.861406326293945, "global_step": 56287, "epoch": 1340} {"train_loss": -5.849641799926758, "global_step": 56288, "epoch": 1340} {"train_loss": -5.858699798583984, "global_step": 56289, "epoch": 1340} {"train_loss": -5.854310512542725, "global_step": 56290, "epoch": 1340} {"train_loss": -5.834785461425781, "global_step": 56291, "epoch": 1340} {"train_loss": -5.745590686798096, "global_step": 56292, "epoch": 1340} {"train_loss": -5.704211711883545, "global_step": 56293, "epoch": 1340} {"train_loss": -5.809298515319824, "global_step": 56294, "epoch": 1340} {"train_loss": -5.862931251525879, "global_step": 56295, "epoch": 1340} {"train_loss": -5.778691291809082, "global_step": 56296, "epoch": 1340} {"train_loss": -5.915871620178223, "global_step": 56297, "epoch": 1340} {"train_loss": -5.858886241912842, "global_step": 56298, "epoch": 1340} {"train_loss": -5.869721412658691, "global_step": 56299, "epoch": 1340} {"train_loss": -5.800575256347656, "global_step": 56300, "epoch": 1340} {"train_loss": -5.859570026397705, "global_step": 56301, "epoch": 1340} {"train_loss": -5.775652885437012, "global_step": 56302, "epoch": 1340} {"train_loss": -5.940483093261719, "global_step": 56303, "epoch": 1340} {"train_loss": -5.979887008666992, "global_step": 56304, "epoch": 1340} {"train_loss": -5.8464460372924805, "global_step": 56305, "epoch": 1340} {"train_loss": -5.811434745788574, "global_step": 56306, "epoch": 1340} {"train_loss": -5.767855644226074, "global_step": 56307, "epoch": 1340} {"train_loss": -5.834702491760254, "global_step": 56308, "epoch": 1340} {"train_loss": -5.873546600341797, "global_step": 56309, "epoch": 1340} {"train_loss": -5.823639869689941, "global_step": 56310, "epoch": 1340} {"train_loss": -5.855846405029297, "global_step": 56311, "epoch": 1340} {"train_loss": -5.85627555847168, "global_step": 56312, "epoch": 1340} {"train_loss": -5.939111232757568, "global_step": 56313, "epoch": 1340} {"train_loss": -5.8463239669799805, "global_step": 56314, "epoch": 1340} {"train_loss": -5.941898345947266, "global_step": 56315, "epoch": 1340} {"train_loss": -5.8404154777526855, "global_step": 56316, "epoch": 1340} {"train_loss": -5.818680763244629, "global_step": 56317, "epoch": 1340} {"train_loss": -5.787205696105957, "global_step": 56318, "epoch": 1340} {"train_loss": -5.8966474533081055, "global_step": 56319, "epoch": 1340} {"train_loss": -5.81503963470459, "global_step": 56320, "epoch": 1340} {"train_loss": -5.844976266225179, "global_step": 56321, "epoch": 1340, "val_loss": 74343.2109375} {"train_loss": -5.838945388793945, "global_step": 56322, "epoch": 1341} {"train_loss": -5.825308799743652, "global_step": 56323, "epoch": 1341} {"train_loss": -5.922369956970215, "global_step": 56324, "epoch": 1341} {"train_loss": -5.816815376281738, "global_step": 56325, "epoch": 1341} {"train_loss": -5.739797115325928, "global_step": 56326, "epoch": 1341} {"train_loss": -5.871624946594238, "global_step": 56327, "epoch": 1341} {"train_loss": -5.801244735717773, "global_step": 56328, "epoch": 1341} {"train_loss": -5.85094690322876, "global_step": 56329, "epoch": 1341} {"train_loss": -5.8297600746154785, "global_step": 56330, "epoch": 1341} {"train_loss": -5.816816329956055, "global_step": 56331, "epoch": 1341} {"train_loss": -5.854854106903076, "global_step": 56332, "epoch": 1341} {"train_loss": -5.865915298461914, "global_step": 56333, "epoch": 1341} {"train_loss": -5.839135646820068, "global_step": 56334, "epoch": 1341} {"train_loss": -5.788073539733887, "global_step": 56335, "epoch": 1341} {"train_loss": -5.8072099685668945, "global_step": 56336, "epoch": 1341} {"train_loss": -5.85874080657959, "global_step": 56337, "epoch": 1341} {"train_loss": -6.032570838928223, "global_step": 56338, "epoch": 1341} {"train_loss": -5.8021039962768555, "global_step": 56339, "epoch": 1341} {"train_loss": -5.830935001373291, "global_step": 56340, "epoch": 1341} {"train_loss": -5.898128986358643, "global_step": 56341, "epoch": 1341} {"train_loss": -5.989684104919434, "global_step": 56342, "epoch": 1341} {"train_loss": -5.959928512573242, "global_step": 56343, "epoch": 1341} {"train_loss": -5.82676887512207, "global_step": 56344, "epoch": 1341} {"train_loss": -5.832928657531738, "global_step": 56345, "epoch": 1341} {"train_loss": -5.840417385101318, "global_step": 56346, "epoch": 1341} {"train_loss": -5.857118606567383, "global_step": 56347, "epoch": 1341} {"train_loss": -5.893824577331543, "global_step": 56348, "epoch": 1341} {"train_loss": -5.822481155395508, "global_step": 56349, "epoch": 1341} {"train_loss": -5.713515281677246, "global_step": 56350, "epoch": 1341} {"train_loss": -5.773707389831543, "global_step": 56351, "epoch": 1341} {"train_loss": -5.849753379821777, "global_step": 56352, "epoch": 1341} {"train_loss": -5.842380523681641, "global_step": 56353, "epoch": 1341} {"train_loss": -5.885011672973633, "global_step": 56354, "epoch": 1341} {"train_loss": -5.8754425048828125, "global_step": 56355, "epoch": 1341} {"train_loss": -5.824437141418457, "global_step": 56356, "epoch": 1341} {"train_loss": -5.873589515686035, "global_step": 56357, "epoch": 1341} {"train_loss": -5.840448379516602, "global_step": 56358, "epoch": 1341} {"train_loss": -5.769167900085449, "global_step": 56359, "epoch": 1341} {"train_loss": -5.8040971755981445, "global_step": 56360, "epoch": 1341} {"train_loss": -5.757808685302734, "global_step": 56361, "epoch": 1341} {"train_loss": -5.8531293869018555, "global_step": 56362, "epoch": 1341} {"train_loss": -5.841788995833624, "global_step": 56363, "epoch": 1341, "val_loss": 74286.578125} {"train_loss": -5.844873428344727, "global_step": 56364, "epoch": 1342} {"train_loss": -5.78095006942749, "global_step": 56365, "epoch": 1342} {"train_loss": -5.816953659057617, "global_step": 56366, "epoch": 1342} {"train_loss": -5.795263290405273, "global_step": 56367, "epoch": 1342} {"train_loss": -5.8441009521484375, "global_step": 56368, "epoch": 1342} {"train_loss": -5.819443702697754, "global_step": 56369, "epoch": 1342} {"train_loss": -5.801187038421631, "global_step": 56370, "epoch": 1342} {"train_loss": -5.85525369644165, "global_step": 56371, "epoch": 1342} {"train_loss": -5.864178657531738, "global_step": 56372, "epoch": 1342} {"train_loss": -5.812288284301758, "global_step": 56373, "epoch": 1342} {"train_loss": -5.9261794090271, "global_step": 56374, "epoch": 1342} {"train_loss": -5.855099678039551, "global_step": 56375, "epoch": 1342} {"train_loss": -5.7973246574401855, "global_step": 56376, "epoch": 1342} {"train_loss": -5.824319839477539, "global_step": 56377, "epoch": 1342} {"train_loss": -5.778819561004639, "global_step": 56378, "epoch": 1342} {"train_loss": -5.868811130523682, "global_step": 56379, "epoch": 1342} {"train_loss": -5.858207702636719, "global_step": 56380, "epoch": 1342} {"train_loss": -5.826541423797607, "global_step": 56381, "epoch": 1342} {"train_loss": -5.90177059173584, "global_step": 56382, "epoch": 1342} {"train_loss": -5.641166687011719, "global_step": 56383, "epoch": 1342} {"train_loss": -5.876082420349121, "global_step": 56384, "epoch": 1342} {"train_loss": -5.849701881408691, "global_step": 56385, "epoch": 1342} {"train_loss": -5.804146766662598, "global_step": 56386, "epoch": 1342} {"train_loss": -5.784484386444092, "global_step": 56387, "epoch": 1342} {"train_loss": -5.73582649230957, "global_step": 56388, "epoch": 1342} {"train_loss": -5.982032775878906, "global_step": 56389, "epoch": 1342} {"train_loss": -5.8995256423950195, "global_step": 56390, "epoch": 1342} {"train_loss": -5.712701797485352, "global_step": 56391, "epoch": 1342} {"train_loss": -5.932069778442383, "global_step": 56392, "epoch": 1342} {"train_loss": -5.9438252449035645, "global_step": 56393, "epoch": 1342} {"train_loss": -5.869026184082031, "global_step": 56394, "epoch": 1342} {"train_loss": -5.918127059936523, "global_step": 56395, "epoch": 1342} {"train_loss": -5.797894477844238, "global_step": 56396, "epoch": 1342} {"train_loss": -5.846529960632324, "global_step": 56397, "epoch": 1342} {"train_loss": -5.7843732833862305, "global_step": 56398, "epoch": 1342} {"train_loss": -5.754698753356934, "global_step": 56399, "epoch": 1342} {"train_loss": -5.927761077880859, "global_step": 56400, "epoch": 1342} {"train_loss": -5.6451497077941895, "global_step": 56401, "epoch": 1342} {"train_loss": -6.04572868347168, "global_step": 56402, "epoch": 1342} {"train_loss": -5.941746234893799, "global_step": 56403, "epoch": 1342} {"train_loss": -5.879482269287109, "global_step": 56404, "epoch": 1342} {"train_loss": -5.841653596787226, "global_step": 56405, "epoch": 1342, "val_loss": 74573.234375} {"train_loss": -5.788341522216797, "global_step": 56406, "epoch": 1343} {"train_loss": -5.847531318664551, "global_step": 56407, "epoch": 1343} {"train_loss": -5.774412155151367, "global_step": 56408, "epoch": 1343} {"train_loss": -5.787393569946289, "global_step": 56409, "epoch": 1343} {"train_loss": -5.9314751625061035, "global_step": 56410, "epoch": 1343} {"train_loss": -5.875741958618164, "global_step": 56411, "epoch": 1343} {"train_loss": -5.773238658905029, "global_step": 56412, "epoch": 1343} {"train_loss": -5.830690383911133, "global_step": 56413, "epoch": 1343} {"train_loss": -5.86802864074707, "global_step": 56414, "epoch": 1343} {"train_loss": -5.812561988830566, "global_step": 56415, "epoch": 1343} {"train_loss": -5.872549057006836, "global_step": 56416, "epoch": 1343} {"train_loss": -5.805513381958008, "global_step": 56417, "epoch": 1343} {"train_loss": -5.872579097747803, "global_step": 56418, "epoch": 1343} {"train_loss": -5.858590126037598, "global_step": 56419, "epoch": 1343} {"train_loss": -5.803335666656494, "global_step": 56420, "epoch": 1343} {"train_loss": -5.854326248168945, "global_step": 56421, "epoch": 1343} {"train_loss": -5.851069927215576, "global_step": 56422, "epoch": 1343} {"train_loss": -5.864989280700684, "global_step": 56423, "epoch": 1343} {"train_loss": -5.780386924743652, "global_step": 56424, "epoch": 1343} {"train_loss": -5.786803245544434, "global_step": 56425, "epoch": 1343} {"train_loss": -5.8087158203125, "global_step": 56426, "epoch": 1343} {"train_loss": -5.682923316955566, "global_step": 56427, "epoch": 1343} {"train_loss": -5.84593391418457, "global_step": 56428, "epoch": 1343} {"train_loss": -5.833056449890137, "global_step": 56429, "epoch": 1343} {"train_loss": -5.783360004425049, "global_step": 56430, "epoch": 1343} {"train_loss": -5.826828956604004, "global_step": 56431, "epoch": 1343} {"train_loss": -5.892063140869141, "global_step": 56432, "epoch": 1343} {"train_loss": -5.716214656829834, "global_step": 56433, "epoch": 1343} {"train_loss": -5.779743671417236, "global_step": 56434, "epoch": 1343} {"train_loss": -5.781757354736328, "global_step": 56435, "epoch": 1343} {"train_loss": -5.803816795349121, "global_step": 56436, "epoch": 1343} {"train_loss": -5.879260540008545, "global_step": 56437, "epoch": 1343} {"train_loss": -5.938035011291504, "global_step": 56438, "epoch": 1343} {"train_loss": -5.934490203857422, "global_step": 56439, "epoch": 1343} {"train_loss": -5.859323978424072, "global_step": 56440, "epoch": 1343} {"train_loss": -5.718032360076904, "global_step": 56441, "epoch": 1343} {"train_loss": -5.924984455108643, "global_step": 56442, "epoch": 1343} {"train_loss": -5.803274631500244, "global_step": 56443, "epoch": 1343} {"train_loss": -5.962156295776367, "global_step": 56444, "epoch": 1343} {"train_loss": -5.926141262054443, "global_step": 56445, "epoch": 1343} {"train_loss": -5.806461811065674, "global_step": 56446, "epoch": 1343} {"train_loss": -5.833065759567988, "global_step": 56447, "epoch": 1343, "val_loss": 74325.2109375} {"train_loss": -5.832948684692383, "global_step": 56448, "epoch": 1344} {"train_loss": -5.800187110900879, "global_step": 56449, "epoch": 1344} {"train_loss": -5.795927047729492, "global_step": 56450, "epoch": 1344} {"train_loss": -5.911172866821289, "global_step": 56451, "epoch": 1344} {"train_loss": -5.863450050354004, "global_step": 56452, "epoch": 1344} {"train_loss": -5.911192893981934, "global_step": 56453, "epoch": 1344} {"train_loss": -5.921896934509277, "global_step": 56454, "epoch": 1344} {"train_loss": -5.928147792816162, "global_step": 56455, "epoch": 1344} {"train_loss": -5.8957133293151855, "global_step": 56456, "epoch": 1344} {"train_loss": -5.9147257804870605, "global_step": 56457, "epoch": 1344} {"train_loss": -5.861686706542969, "global_step": 56458, "epoch": 1344} {"train_loss": -5.8349080085754395, "global_step": 56459, "epoch": 1344} {"train_loss": -5.780067443847656, "global_step": 56460, "epoch": 1344} {"train_loss": -5.857861518859863, "global_step": 56461, "epoch": 1344} {"train_loss": -5.822518348693848, "global_step": 56462, "epoch": 1344} {"train_loss": -5.833199501037598, "global_step": 56463, "epoch": 1344} {"train_loss": -5.737849235534668, "global_step": 56464, "epoch": 1344} {"train_loss": -5.808171272277832, "global_step": 56465, "epoch": 1344} {"train_loss": -5.822709083557129, "global_step": 56466, "epoch": 1344} {"train_loss": -5.87808895111084, "global_step": 56467, "epoch": 1344} {"train_loss": -5.754946231842041, "global_step": 56468, "epoch": 1344} {"train_loss": -5.944537162780762, "global_step": 56469, "epoch": 1344} {"train_loss": -5.780322074890137, "global_step": 56470, "epoch": 1344} {"train_loss": -6.01310920715332, "global_step": 56471, "epoch": 1344} {"train_loss": -5.846680641174316, "global_step": 56472, "epoch": 1344} {"train_loss": -5.808784484863281, "global_step": 56473, "epoch": 1344} {"train_loss": -5.884764194488525, "global_step": 56474, "epoch": 1344} {"train_loss": -5.854059219360352, "global_step": 56475, "epoch": 1344} {"train_loss": -5.903356552124023, "global_step": 56476, "epoch": 1344} {"train_loss": -5.781750679016113, "global_step": 56477, "epoch": 1344} {"train_loss": -5.778515338897705, "global_step": 56478, "epoch": 1344} {"train_loss": -5.7833051681518555, "global_step": 56479, "epoch": 1344} {"train_loss": -5.704836845397949, "global_step": 56480, "epoch": 1344} {"train_loss": -5.888299942016602, "global_step": 56481, "epoch": 1344} {"train_loss": -5.778220176696777, "global_step": 56482, "epoch": 1344} {"train_loss": -5.898560523986816, "global_step": 56483, "epoch": 1344} {"train_loss": -5.7067084312438965, "global_step": 56484, "epoch": 1344} {"train_loss": -5.621822357177734, "global_step": 56485, "epoch": 1344} {"train_loss": -5.840334415435791, "global_step": 56486, "epoch": 1344} {"train_loss": -5.758029460906982, "global_step": 56487, "epoch": 1344} {"train_loss": -5.771047592163086, "global_step": 56488, "epoch": 1344} {"train_loss": -5.831637075969151, "global_step": 56489, "epoch": 1344, "val_loss": 74329.3125} {"train_loss": -5.842649936676025, "global_step": 56490, "epoch": 1345} {"train_loss": -5.788813591003418, "global_step": 56491, "epoch": 1345} {"train_loss": -5.835224151611328, "global_step": 56492, "epoch": 1345} {"train_loss": -5.745603084564209, "global_step": 56493, "epoch": 1345} {"train_loss": -5.823605060577393, "global_step": 56494, "epoch": 1345} {"train_loss": -5.798829078674316, "global_step": 56495, "epoch": 1345} {"train_loss": -5.797839641571045, "global_step": 56496, "epoch": 1345} {"train_loss": -5.815230369567871, "global_step": 56497, "epoch": 1345} {"train_loss": -5.832720756530762, "global_step": 56498, "epoch": 1345} {"train_loss": -5.7490553855896, "global_step": 56499, "epoch": 1345} {"train_loss": -5.819209098815918, "global_step": 56500, "epoch": 1345} {"train_loss": -5.8721747398376465, "global_step": 56501, "epoch": 1345} {"train_loss": -5.916234970092773, "global_step": 56502, "epoch": 1345} {"train_loss": -5.906055450439453, "global_step": 56503, "epoch": 1345} {"train_loss": -5.871368408203125, "global_step": 56504, "epoch": 1345} {"train_loss": -5.931682586669922, "global_step": 56505, "epoch": 1345} {"train_loss": -5.966263771057129, "global_step": 56506, "epoch": 1345} {"train_loss": -5.840768337249756, "global_step": 56507, "epoch": 1345} {"train_loss": -5.948232650756836, "global_step": 56508, "epoch": 1345} {"train_loss": -5.794195652008057, "global_step": 56509, "epoch": 1345} {"train_loss": -5.949357032775879, "global_step": 56510, "epoch": 1345} {"train_loss": -5.764189720153809, "global_step": 56511, "epoch": 1345} {"train_loss": -5.949691295623779, "global_step": 56512, "epoch": 1345} {"train_loss": -5.85438871383667, "global_step": 56513, "epoch": 1345} {"train_loss": -5.9353532791137695, "global_step": 56514, "epoch": 1345} {"train_loss": -5.844117641448975, "global_step": 56515, "epoch": 1345} {"train_loss": -6.017960548400879, "global_step": 56516, "epoch": 1345} {"train_loss": -5.795019149780273, "global_step": 56517, "epoch": 1345} {"train_loss": -5.810641288757324, "global_step": 56518, "epoch": 1345} {"train_loss": -5.785531044006348, "global_step": 56519, "epoch": 1345} {"train_loss": -5.825028896331787, "global_step": 56520, "epoch": 1345} {"train_loss": -5.812495231628418, "global_step": 56521, "epoch": 1345} {"train_loss": -5.915024757385254, "global_step": 56522, "epoch": 1345} {"train_loss": -5.834593772888184, "global_step": 56523, "epoch": 1345} {"train_loss": -5.768796920776367, "global_step": 56524, "epoch": 1345} {"train_loss": -5.911197185516357, "global_step": 56525, "epoch": 1345} {"train_loss": -5.843328952789307, "global_step": 56526, "epoch": 1345} {"train_loss": -5.786882400512695, "global_step": 56527, "epoch": 1345} {"train_loss": -5.83528995513916, "global_step": 56528, "epoch": 1345} {"train_loss": -5.817380905151367, "global_step": 56529, "epoch": 1345} {"train_loss": -5.826091766357422, "global_step": 56530, "epoch": 1345} {"train_loss": -5.8496204898470925, "global_step": 56531, "epoch": 1345, "val_loss": 74898.984375} {"train_loss": -5.687568664550781, "global_step": 56532, "epoch": 1346} {"train_loss": -5.792922496795654, "global_step": 56533, "epoch": 1346} {"train_loss": -5.788782119750977, "global_step": 56534, "epoch": 1346} {"train_loss": -5.883277893066406, "global_step": 56535, "epoch": 1346} {"train_loss": -5.826162338256836, "global_step": 56536, "epoch": 1346} {"train_loss": -5.750113010406494, "global_step": 56537, "epoch": 1346} {"train_loss": -5.730794906616211, "global_step": 56538, "epoch": 1346} {"train_loss": -5.863056182861328, "global_step": 56539, "epoch": 1346} {"train_loss": -5.87967586517334, "global_step": 56540, "epoch": 1346} {"train_loss": -5.864116668701172, "global_step": 56541, "epoch": 1346} {"train_loss": -5.788957595825195, "global_step": 56542, "epoch": 1346} {"train_loss": -5.915726661682129, "global_step": 56543, "epoch": 1346} {"train_loss": -5.881594657897949, "global_step": 56544, "epoch": 1346} {"train_loss": -5.807662010192871, "global_step": 56545, "epoch": 1346} {"train_loss": -5.7762370109558105, "global_step": 56546, "epoch": 1346} {"train_loss": -5.725985050201416, "global_step": 56547, "epoch": 1346} {"train_loss": -5.668581962585449, "global_step": 56548, "epoch": 1346} {"train_loss": -5.806333541870117, "global_step": 56549, "epoch": 1346} {"train_loss": -5.781655311584473, "global_step": 56550, "epoch": 1346} {"train_loss": -5.949619293212891, "global_step": 56551, "epoch": 1346} {"train_loss": -5.870919704437256, "global_step": 56552, "epoch": 1346} {"train_loss": -5.837756156921387, "global_step": 56553, "epoch": 1346} {"train_loss": -5.8525896072387695, "global_step": 56554, "epoch": 1346} {"train_loss": -5.767580032348633, "global_step": 56555, "epoch": 1346} {"train_loss": -5.887590408325195, "global_step": 56556, "epoch": 1346} {"train_loss": -5.951602935791016, "global_step": 56557, "epoch": 1346} {"train_loss": -5.946373462677002, "global_step": 56558, "epoch": 1346} {"train_loss": -5.8122429847717285, "global_step": 56559, "epoch": 1346} {"train_loss": -5.845681190490723, "global_step": 56560, "epoch": 1346} {"train_loss": -5.811294078826904, "global_step": 56561, "epoch": 1346} {"train_loss": -5.931488037109375, "global_step": 56562, "epoch": 1346} {"train_loss": -5.865243911743164, "global_step": 56563, "epoch": 1346} {"train_loss": -5.904872417449951, "global_step": 56564, "epoch": 1346} {"train_loss": -5.897276878356934, "global_step": 56565, "epoch": 1346} {"train_loss": -5.745139122009277, "global_step": 56566, "epoch": 1346} {"train_loss": -5.925500869750977, "global_step": 56567, "epoch": 1346} {"train_loss": -5.813469886779785, "global_step": 56568, "epoch": 1346} {"train_loss": -5.749948024749756, "global_step": 56569, "epoch": 1346} {"train_loss": -5.819027900695801, "global_step": 56570, "epoch": 1346} {"train_loss": -5.745718479156494, "global_step": 56571, "epoch": 1346} {"train_loss": -5.8816022872924805, "global_step": 56572, "epoch": 1346} {"train_loss": -5.831672339212327, "global_step": 56573, "epoch": 1346, "val_loss": 74214.0859375} {"train_loss": -5.846708297729492, "global_step": 56574, "epoch": 1347} {"train_loss": -5.876206398010254, "global_step": 56575, "epoch": 1347} {"train_loss": -5.910613059997559, "global_step": 56576, "epoch": 1347} {"train_loss": -5.918830394744873, "global_step": 56577, "epoch": 1347} {"train_loss": -5.922702789306641, "global_step": 56578, "epoch": 1347} {"train_loss": -5.907902717590332, "global_step": 56579, "epoch": 1347} {"train_loss": -5.9501051902771, "global_step": 56580, "epoch": 1347} {"train_loss": -5.939788818359375, "global_step": 56581, "epoch": 1347} {"train_loss": -5.868631839752197, "global_step": 56582, "epoch": 1347} {"train_loss": -5.798572063446045, "global_step": 56583, "epoch": 1347} {"train_loss": -5.763079643249512, "global_step": 56584, "epoch": 1347} {"train_loss": -5.790094375610352, "global_step": 56585, "epoch": 1347} {"train_loss": -5.820040702819824, "global_step": 56586, "epoch": 1347} {"train_loss": -5.772536754608154, "global_step": 56587, "epoch": 1347} {"train_loss": -5.981828689575195, "global_step": 56588, "epoch": 1347} {"train_loss": -5.896839618682861, "global_step": 56589, "epoch": 1347} {"train_loss": -5.819046497344971, "global_step": 56590, "epoch": 1347} {"train_loss": -5.9082207679748535, "global_step": 56591, "epoch": 1347} {"train_loss": -5.93308162689209, "global_step": 56592, "epoch": 1347} {"train_loss": -5.812622547149658, "global_step": 56593, "epoch": 1347} {"train_loss": -5.875648498535156, "global_step": 56594, "epoch": 1347} {"train_loss": -5.8564252853393555, "global_step": 56595, "epoch": 1347} {"train_loss": -5.7900800704956055, "global_step": 56596, "epoch": 1347} {"train_loss": -5.844356060028076, "global_step": 56597, "epoch": 1347} {"train_loss": -5.973282814025879, "global_step": 56598, "epoch": 1347} {"train_loss": -5.836761474609375, "global_step": 56599, "epoch": 1347} {"train_loss": -5.858637809753418, "global_step": 56600, "epoch": 1347} {"train_loss": -5.79302978515625, "global_step": 56601, "epoch": 1347} {"train_loss": -5.90195369720459, "global_step": 56602, "epoch": 1347} {"train_loss": -5.791143417358398, "global_step": 56603, "epoch": 1347} {"train_loss": -5.8991289138793945, "global_step": 56604, "epoch": 1347} {"train_loss": -5.947969436645508, "global_step": 56605, "epoch": 1347} {"train_loss": -5.866313457489014, "global_step": 56606, "epoch": 1347} {"train_loss": -5.926338195800781, "global_step": 56607, "epoch": 1347} {"train_loss": -5.7574615478515625, "global_step": 56608, "epoch": 1347} {"train_loss": -5.8725666999816895, "global_step": 56609, "epoch": 1347} {"train_loss": -5.791312217712402, "global_step": 56610, "epoch": 1347} {"train_loss": -5.764858722686768, "global_step": 56611, "epoch": 1347} {"train_loss": -5.796568870544434, "global_step": 56612, "epoch": 1347} {"train_loss": -5.791380882263184, "global_step": 56613, "epoch": 1347} {"train_loss": -5.893832206726074, "global_step": 56614, "epoch": 1347} {"train_loss": -5.857357842581613, "global_step": 56615, "epoch": 1347, "val_loss": 74433.71875} {"train_loss": -5.74437952041626, "global_step": 56616, "epoch": 1348} {"train_loss": -5.853099822998047, "global_step": 56617, "epoch": 1348} {"train_loss": -5.750757217407227, "global_step": 56618, "epoch": 1348} {"train_loss": -5.789604187011719, "global_step": 56619, "epoch": 1348} {"train_loss": -5.760191440582275, "global_step": 56620, "epoch": 1348} {"train_loss": -5.819440841674805, "global_step": 56621, "epoch": 1348} {"train_loss": -5.790582180023193, "global_step": 56622, "epoch": 1348} {"train_loss": -5.737855911254883, "global_step": 56623, "epoch": 1348} {"train_loss": -5.847085952758789, "global_step": 56624, "epoch": 1348} {"train_loss": -5.837499618530273, "global_step": 56625, "epoch": 1348} {"train_loss": -5.692584037780762, "global_step": 56626, "epoch": 1348} {"train_loss": -5.869365692138672, "global_step": 56627, "epoch": 1348} {"train_loss": -5.781224727630615, "global_step": 56628, "epoch": 1348} {"train_loss": -5.824848175048828, "global_step": 56629, "epoch": 1348} {"train_loss": -5.778517246246338, "global_step": 56630, "epoch": 1348} {"train_loss": -5.811286926269531, "global_step": 56631, "epoch": 1348} {"train_loss": -5.826543807983398, "global_step": 56632, "epoch": 1348} {"train_loss": -5.8903889656066895, "global_step": 56633, "epoch": 1348} {"train_loss": -5.862537384033203, "global_step": 56634, "epoch": 1348} {"train_loss": -5.854846954345703, "global_step": 56635, "epoch": 1348} {"train_loss": -5.692222595214844, "global_step": 56636, "epoch": 1348} {"train_loss": -5.835911273956299, "global_step": 56637, "epoch": 1348} {"train_loss": -5.894048690795898, "global_step": 56638, "epoch": 1348} {"train_loss": -5.939353942871094, "global_step": 56639, "epoch": 1348} {"train_loss": -5.842669486999512, "global_step": 56640, "epoch": 1348} {"train_loss": -5.8980512619018555, "global_step": 56641, "epoch": 1348} {"train_loss": -5.820300579071045, "global_step": 56642, "epoch": 1348} {"train_loss": -5.848894119262695, "global_step": 56643, "epoch": 1348} {"train_loss": -5.686829566955566, "global_step": 56644, "epoch": 1348} {"train_loss": -5.831894874572754, "global_step": 56645, "epoch": 1348} {"train_loss": -5.746620178222656, "global_step": 56646, "epoch": 1348} {"train_loss": -5.955693244934082, "global_step": 56647, "epoch": 1348} {"train_loss": -5.770999908447266, "global_step": 56648, "epoch": 1348} {"train_loss": -5.7852630615234375, "global_step": 56649, "epoch": 1348} {"train_loss": -5.8991594314575195, "global_step": 56650, "epoch": 1348} {"train_loss": -5.787876129150391, "global_step": 56651, "epoch": 1348} {"train_loss": -5.827247619628906, "global_step": 56652, "epoch": 1348} {"train_loss": -5.82090950012207, "global_step": 56653, "epoch": 1348} {"train_loss": -5.809618949890137, "global_step": 56654, "epoch": 1348} {"train_loss": -5.834394931793213, "global_step": 56655, "epoch": 1348} {"train_loss": -5.766860008239746, "global_step": 56656, "epoch": 1348} {"train_loss": -5.816875412350609, "global_step": 56657, "epoch": 1348, "val_loss": 74497.5859375} {"train_loss": -5.767875671386719, "global_step": 56658, "epoch": 1349} {"train_loss": -5.732402324676514, "global_step": 56659, "epoch": 1349} {"train_loss": -5.915616035461426, "global_step": 56660, "epoch": 1349} {"train_loss": -5.853643894195557, "global_step": 56661, "epoch": 1349} {"train_loss": -5.891740322113037, "global_step": 56662, "epoch": 1349} {"train_loss": -5.934453964233398, "global_step": 56663, "epoch": 1349} {"train_loss": -5.809189796447754, "global_step": 56664, "epoch": 1349} {"train_loss": -5.860036849975586, "global_step": 56665, "epoch": 1349} {"train_loss": -5.865482330322266, "global_step": 56666, "epoch": 1349} {"train_loss": -5.887448310852051, "global_step": 56667, "epoch": 1349} {"train_loss": -5.8015899658203125, "global_step": 56668, "epoch": 1349} {"train_loss": -5.89870548248291, "global_step": 56669, "epoch": 1349} {"train_loss": -5.759355545043945, "global_step": 56670, "epoch": 1349} {"train_loss": -5.948963642120361, "global_step": 56671, "epoch": 1349} {"train_loss": -5.806318759918213, "global_step": 56672, "epoch": 1349} {"train_loss": -5.885106086730957, "global_step": 56673, "epoch": 1349} {"train_loss": -5.828476905822754, "global_step": 56674, "epoch": 1349} {"train_loss": -5.968039512634277, "global_step": 56675, "epoch": 1349} {"train_loss": -5.907050132751465, "global_step": 56676, "epoch": 1349} {"train_loss": -5.880365371704102, "global_step": 56677, "epoch": 1349} {"train_loss": -5.926438331604004, "global_step": 56678, "epoch": 1349} {"train_loss": -5.864816188812256, "global_step": 56679, "epoch": 1349} {"train_loss": -5.831145286560059, "global_step": 56680, "epoch": 1349} {"train_loss": -5.72334098815918, "global_step": 56681, "epoch": 1349} {"train_loss": -5.900256156921387, "global_step": 56682, "epoch": 1349} {"train_loss": -5.708256244659424, "global_step": 56683, "epoch": 1349} {"train_loss": -5.8655595779418945, "global_step": 56684, "epoch": 1349} {"train_loss": -5.978939056396484, "global_step": 56685, "epoch": 1349} {"train_loss": -5.6573991775512695, "global_step": 56686, "epoch": 1349} {"train_loss": -5.864350318908691, "global_step": 56687, "epoch": 1349} {"train_loss": -5.752870559692383, "global_step": 56688, "epoch": 1349} {"train_loss": -5.760284423828125, "global_step": 56689, "epoch": 1349} {"train_loss": -5.8913750648498535, "global_step": 56690, "epoch": 1349} {"train_loss": -5.739955902099609, "global_step": 56691, "epoch": 1349} {"train_loss": -5.892242431640625, "global_step": 56692, "epoch": 1349} {"train_loss": -5.730585098266602, "global_step": 56693, "epoch": 1349} {"train_loss": -5.648728370666504, "global_step": 56694, "epoch": 1349} {"train_loss": -5.878066062927246, "global_step": 56695, "epoch": 1349} {"train_loss": -5.751158237457275, "global_step": 56696, "epoch": 1349} {"train_loss": -5.787384033203125, "global_step": 56697, "epoch": 1349} {"train_loss": -5.818183898925781, "global_step": 56698, "epoch": 1349} {"train_loss": -5.832753374463036, "global_step": 56699, "epoch": 1349, "val_loss": 74348.015625} {"train_loss": -5.932593822479248, "global_step": 56700, "epoch": 1350} {"train_loss": -5.849237442016602, "global_step": 56701, "epoch": 1350} {"train_loss": -5.8721113204956055, "global_step": 56702, "epoch": 1350} {"train_loss": -5.745271682739258, "global_step": 56703, "epoch": 1350} {"train_loss": -5.907303810119629, "global_step": 56704, "epoch": 1350} {"train_loss": -5.865126609802246, "global_step": 56705, "epoch": 1350} {"train_loss": -5.933567047119141, "global_step": 56706, "epoch": 1350} {"train_loss": -5.866005897521973, "global_step": 56707, "epoch": 1350} {"train_loss": -5.861508369445801, "global_step": 56708, "epoch": 1350} {"train_loss": -5.882055282592773, "global_step": 56709, "epoch": 1350} {"train_loss": -5.853953838348389, "global_step": 56710, "epoch": 1350} {"train_loss": -5.895985126495361, "global_step": 56711, "epoch": 1350} {"train_loss": -5.913257122039795, "global_step": 56712, "epoch": 1350} {"train_loss": -5.83420467376709, "global_step": 56713, "epoch": 1350} {"train_loss": -5.821533203125, "global_step": 56714, "epoch": 1350} {"train_loss": -5.888405799865723, "global_step": 56715, "epoch": 1350} {"train_loss": -5.993584632873535, "global_step": 56716, "epoch": 1350} {"train_loss": -5.911343097686768, "global_step": 56717, "epoch": 1350} {"train_loss": -5.967093467712402, "global_step": 56718, "epoch": 1350} {"train_loss": -5.8173933029174805, "global_step": 56719, "epoch": 1350} {"train_loss": -5.787088871002197, "global_step": 56720, "epoch": 1350} {"train_loss": -5.787888050079346, "global_step": 56721, "epoch": 1350} {"train_loss": -5.966082572937012, "global_step": 56722, "epoch": 1350} {"train_loss": -5.855011940002441, "global_step": 56723, "epoch": 1350} {"train_loss": -5.819190979003906, "global_step": 56724, "epoch": 1350} {"train_loss": -5.824670314788818, "global_step": 56725, "epoch": 1350} {"train_loss": -5.828312397003174, "global_step": 56726, "epoch": 1350} {"train_loss": -5.745414733886719, "global_step": 56727, "epoch": 1350} {"train_loss": -5.881561279296875, "global_step": 56728, "epoch": 1350} {"train_loss": -5.852530002593994, "global_step": 56729, "epoch": 1350} {"train_loss": -5.727107048034668, "global_step": 56730, "epoch": 1350} {"train_loss": -5.7557454109191895, "global_step": 56731, "epoch": 1350} {"train_loss": -5.959439277648926, "global_step": 56732, "epoch": 1350} {"train_loss": -5.754796981811523, "global_step": 56733, "epoch": 1350} {"train_loss": -5.977280616760254, "global_step": 56734, "epoch": 1350} {"train_loss": -5.805675029754639, "global_step": 56735, "epoch": 1350} {"train_loss": -5.736512184143066, "global_step": 56736, "epoch": 1350} {"train_loss": -5.896388530731201, "global_step": 56737, "epoch": 1350} {"train_loss": -5.752187728881836, "global_step": 56738, "epoch": 1350} {"train_loss": -5.977474212646484, "global_step": 56739, "epoch": 1350} {"train_loss": -5.867442607879639, "global_step": 56740, "epoch": 1350} {"train_loss": -5.859542869386219, "global_step": 56741, "epoch": 1350, "train/sim_max_reward_0": 0.3326479920962226, "train/sim_max_reward_1": 0.9877103452482958, "train/sim_max_reward_2": 0.7809769390524823, "train/sim_max_reward_3": 0.8241103906617551, "train/sim_max_reward_4": 0.9931073553045942, "train/sim_max_reward_5": 0.8768763926280261, "test/sim_max_reward_4500000": 0.800091119121841, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8951932002845098, "test/sim_max_reward_4500003": 0.6228212246387902, "test/sim_max_reward_4500004": 0.07271841440462942, "test/sim_max_reward_4500005": 0.3972606116958666, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.6703992237438485, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.9420318283673595, "test/sim_max_reward_4500010": 0.7576436012114706, "test/sim_max_reward_4500011": 0.9138859775003877, "test/sim_max_reward_4500012": 0.5507571871433457, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.8132340917600938, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.5811316972158064, "test/sim_max_reward_4500018": 0.08016772513289808, "test/sim_max_reward_4500019": 0.901987505572175, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.45435546201991206, "test/sim_max_reward_4500022": 0.7308017659265085, "test/sim_max_reward_4500023": 0.9014238425191927, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.8433848401128763, "test/sim_max_reward_4500027": 0.8526972688585744, "test/sim_max_reward_4500028": 0.2784616798518524, "test/sim_max_reward_4500029": 0.24129727289148717, "test/sim_max_reward_4500030": 0.9694529891944519, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04830548892594175, "test/sim_max_reward_4500033": 0.8473346635097895, "test/sim_max_reward_4500034": 0.824021329680801, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 0.41311399279937466, "test/sim_max_reward_4500037": 0.6376622018309674, "test/sim_max_reward_4500038": 0.29964246815480544, "test/sim_max_reward_4500039": 0.8274404027224231, "test/sim_max_reward_4500040": 0.964833411915802, "test/sim_max_reward_4500041": 0.9962276448198358, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.6095666866418273, "test/sim_max_reward_4500044": 0.20631230381701074, "test/sim_max_reward_4500045": 0.15989160909582434, "test/sim_max_reward_4500046": 0.6174653399855228, "test/sim_max_reward_4500047": 0.9124573179078276, "test/sim_max_reward_4500048": 0.9159844955445087, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.7992382358318961, "test/mean_score": 0.5318288338618964, "val_loss": 74312.6953125} {"train_loss": -5.812040328979492, "global_step": 56742, "epoch": 1351} {"train_loss": -5.829911708831787, "global_step": 56743, "epoch": 1351} {"train_loss": -5.911515712738037, "global_step": 56744, "epoch": 1351} {"train_loss": -5.785676002502441, "global_step": 56745, "epoch": 1351} {"train_loss": -5.751536846160889, "global_step": 56746, "epoch": 1351} {"train_loss": -5.814450740814209, "global_step": 56747, "epoch": 1351} {"train_loss": -5.928439140319824, "global_step": 56748, "epoch": 1351} {"train_loss": -5.942492961883545, "global_step": 56749, "epoch": 1351} {"train_loss": -5.99021577835083, "global_step": 56750, "epoch": 1351} {"train_loss": -5.8213276863098145, "global_step": 56751, "epoch": 1351} {"train_loss": -5.819236755371094, "global_step": 56752, "epoch": 1351} {"train_loss": -5.8458967208862305, "global_step": 56753, "epoch": 1351} {"train_loss": -5.861706733703613, "global_step": 56754, "epoch": 1351} {"train_loss": -5.7124223709106445, "global_step": 56755, "epoch": 1351} {"train_loss": -5.756172180175781, "global_step": 56756, "epoch": 1351} {"train_loss": -5.716740608215332, "global_step": 56757, "epoch": 1351} {"train_loss": -5.931972026824951, "global_step": 56758, "epoch": 1351} {"train_loss": -5.854447841644287, "global_step": 56759, "epoch": 1351} {"train_loss": -5.798613548278809, "global_step": 56760, "epoch": 1351} {"train_loss": -5.877561569213867, "global_step": 56761, "epoch": 1351} {"train_loss": -5.9120683670043945, "global_step": 56762, "epoch": 1351} {"train_loss": -5.770607948303223, "global_step": 56763, "epoch": 1351} {"train_loss": -5.856700897216797, "global_step": 56764, "epoch": 1351} {"train_loss": -5.904551982879639, "global_step": 56765, "epoch": 1351} {"train_loss": -5.85928201675415, "global_step": 56766, "epoch": 1351} {"train_loss": -5.905793190002441, "global_step": 56767, "epoch": 1351} {"train_loss": -5.862708568572998, "global_step": 56768, "epoch": 1351} {"train_loss": -5.814708709716797, "global_step": 56769, "epoch": 1351} {"train_loss": -5.851123332977295, "global_step": 56770, "epoch": 1351} {"train_loss": -5.961067199707031, "global_step": 56771, "epoch": 1351} {"train_loss": -5.963041305541992, "global_step": 56772, "epoch": 1351} {"train_loss": -5.893340110778809, "global_step": 56773, "epoch": 1351} {"train_loss": -6.0432000160217285, "global_step": 56774, "epoch": 1351} {"train_loss": -5.917473793029785, "global_step": 56775, "epoch": 1351} {"train_loss": -5.8698859214782715, "global_step": 56776, "epoch": 1351} {"train_loss": -5.829324722290039, "global_step": 56777, "epoch": 1351} {"train_loss": -5.908392906188965, "global_step": 56778, "epoch": 1351} {"train_loss": -5.885024070739746, "global_step": 56779, "epoch": 1351} {"train_loss": -5.825474262237549, "global_step": 56780, "epoch": 1351} {"train_loss": -5.815480709075928, "global_step": 56781, "epoch": 1351} {"train_loss": -5.874214172363281, "global_step": 56782, "epoch": 1351} {"train_loss": -5.861884979974656, "global_step": 56783, "epoch": 1351, "val_loss": 74439.8125} {"train_loss": -5.814040184020996, "global_step": 56784, "epoch": 1352} {"train_loss": -5.937091827392578, "global_step": 56785, "epoch": 1352} {"train_loss": -5.805541038513184, "global_step": 56786, "epoch": 1352} {"train_loss": -5.925114631652832, "global_step": 56787, "epoch": 1352} {"train_loss": -5.842042446136475, "global_step": 56788, "epoch": 1352} {"train_loss": -5.891068458557129, "global_step": 56789, "epoch": 1352} {"train_loss": -5.786712646484375, "global_step": 56790, "epoch": 1352} {"train_loss": -5.883351802825928, "global_step": 56791, "epoch": 1352} {"train_loss": -5.932474613189697, "global_step": 56792, "epoch": 1352} {"train_loss": -5.927673816680908, "global_step": 56793, "epoch": 1352} {"train_loss": -5.945394515991211, "global_step": 56794, "epoch": 1352} {"train_loss": -5.840511322021484, "global_step": 56795, "epoch": 1352} {"train_loss": -5.9753336906433105, "global_step": 56796, "epoch": 1352} {"train_loss": -5.902493953704834, "global_step": 56797, "epoch": 1352} {"train_loss": -5.7903900146484375, "global_step": 56798, "epoch": 1352} {"train_loss": -5.862157821655273, "global_step": 56799, "epoch": 1352} {"train_loss": -5.799831867218018, "global_step": 56800, "epoch": 1352} {"train_loss": -5.726008892059326, "global_step": 56801, "epoch": 1352} {"train_loss": -5.7822675704956055, "global_step": 56802, "epoch": 1352} {"train_loss": -5.683152198791504, "global_step": 56803, "epoch": 1352} {"train_loss": -5.8426618576049805, "global_step": 56804, "epoch": 1352} {"train_loss": -5.827258586883545, "global_step": 56805, "epoch": 1352} {"train_loss": -5.700104713439941, "global_step": 56806, "epoch": 1352} {"train_loss": -5.846529960632324, "global_step": 56807, "epoch": 1352} {"train_loss": -5.696451663970947, "global_step": 56808, "epoch": 1352} {"train_loss": -5.912519454956055, "global_step": 56809, "epoch": 1352} {"train_loss": -5.720235824584961, "global_step": 56810, "epoch": 1352} {"train_loss": -5.723295211791992, "global_step": 56811, "epoch": 1352} {"train_loss": -5.7217607498168945, "global_step": 56812, "epoch": 1352} {"train_loss": -5.9143171310424805, "global_step": 56813, "epoch": 1352} {"train_loss": -5.7989397048950195, "global_step": 56814, "epoch": 1352} {"train_loss": -5.8178253173828125, "global_step": 56815, "epoch": 1352} {"train_loss": -5.712270259857178, "global_step": 56816, "epoch": 1352} {"train_loss": -5.854599952697754, "global_step": 56817, "epoch": 1352} {"train_loss": -5.736320972442627, "global_step": 56818, "epoch": 1352} {"train_loss": -5.833130359649658, "global_step": 56819, "epoch": 1352} {"train_loss": -5.844358444213867, "global_step": 56820, "epoch": 1352} {"train_loss": -5.787781715393066, "global_step": 56821, "epoch": 1352} {"train_loss": -5.947037220001221, "global_step": 56822, "epoch": 1352} {"train_loss": -5.801795482635498, "global_step": 56823, "epoch": 1352} {"train_loss": -5.770310401916504, "global_step": 56824, "epoch": 1352} {"train_loss": -5.823815731775193, "global_step": 56825, "epoch": 1352, "val_loss": 74298.375} {"train_loss": -5.825815200805664, "global_step": 56826, "epoch": 1353} {"train_loss": -5.656156539916992, "global_step": 56827, "epoch": 1353} {"train_loss": -5.879702091217041, "global_step": 56828, "epoch": 1353} {"train_loss": -5.7176361083984375, "global_step": 56829, "epoch": 1353} {"train_loss": -5.826416015625, "global_step": 56830, "epoch": 1353} {"train_loss": -5.876589775085449, "global_step": 56831, "epoch": 1353} {"train_loss": -5.96523904800415, "global_step": 56832, "epoch": 1353} {"train_loss": -5.851751327514648, "global_step": 56833, "epoch": 1353} {"train_loss": -5.811555862426758, "global_step": 56834, "epoch": 1353} {"train_loss": -5.789236068725586, "global_step": 56835, "epoch": 1353} {"train_loss": -5.790599346160889, "global_step": 56836, "epoch": 1353} {"train_loss": -5.7808756828308105, "global_step": 56837, "epoch": 1353} {"train_loss": -5.81085205078125, "global_step": 56838, "epoch": 1353} {"train_loss": -5.876396179199219, "global_step": 56839, "epoch": 1353} {"train_loss": -5.924023151397705, "global_step": 56840, "epoch": 1353} {"train_loss": -6.0206193923950195, "global_step": 56841, "epoch": 1353} {"train_loss": -5.862948894500732, "global_step": 56842, "epoch": 1353} {"train_loss": -5.79744815826416, "global_step": 56843, "epoch": 1353} {"train_loss": -5.84199333190918, "global_step": 56844, "epoch": 1353} {"train_loss": -5.802886009216309, "global_step": 56845, "epoch": 1353} {"train_loss": -5.677819728851318, "global_step": 56846, "epoch": 1353} {"train_loss": -5.838102340698242, "global_step": 56847, "epoch": 1353} {"train_loss": -5.866849899291992, "global_step": 56848, "epoch": 1353} {"train_loss": -5.745729446411133, "global_step": 56849, "epoch": 1353} {"train_loss": -5.823662281036377, "global_step": 56850, "epoch": 1353} {"train_loss": -5.904306411743164, "global_step": 56851, "epoch": 1353} {"train_loss": -5.8613128662109375, "global_step": 56852, "epoch": 1353} {"train_loss": -5.914088726043701, "global_step": 56853, "epoch": 1353} {"train_loss": -5.90333366394043, "global_step": 56854, "epoch": 1353} {"train_loss": -5.824211597442627, "global_step": 56855, "epoch": 1353} {"train_loss": -5.806556224822998, "global_step": 56856, "epoch": 1353} {"train_loss": -5.8720855712890625, "global_step": 56857, "epoch": 1353} {"train_loss": -5.918868064880371, "global_step": 56858, "epoch": 1353} {"train_loss": -5.940191268920898, "global_step": 56859, "epoch": 1353} {"train_loss": -5.885834693908691, "global_step": 56860, "epoch": 1353} {"train_loss": -5.839104175567627, "global_step": 56861, "epoch": 1353} {"train_loss": -5.74455451965332, "global_step": 56862, "epoch": 1353} {"train_loss": -5.860232353210449, "global_step": 56863, "epoch": 1353} {"train_loss": -5.766892433166504, "global_step": 56864, "epoch": 1353} {"train_loss": -5.945778846740723, "global_step": 56865, "epoch": 1353} {"train_loss": -5.870952606201172, "global_step": 56866, "epoch": 1353} {"train_loss": -5.844046649478731, "global_step": 56867, "epoch": 1353, "val_loss": 74331.875} {"train_loss": -5.8229594230651855, "global_step": 56868, "epoch": 1354} {"train_loss": -5.917496204376221, "global_step": 56869, "epoch": 1354} {"train_loss": -5.9314141273498535, "global_step": 56870, "epoch": 1354} {"train_loss": -5.928650379180908, "global_step": 56871, "epoch": 1354} {"train_loss": -5.941932678222656, "global_step": 56872, "epoch": 1354} {"train_loss": -5.823588848114014, "global_step": 56873, "epoch": 1354} {"train_loss": -5.851322174072266, "global_step": 56874, "epoch": 1354} {"train_loss": -5.851009368896484, "global_step": 56875, "epoch": 1354} {"train_loss": -5.865222930908203, "global_step": 56876, "epoch": 1354} {"train_loss": -5.88470458984375, "global_step": 56877, "epoch": 1354} {"train_loss": -5.826274871826172, "global_step": 56878, "epoch": 1354} {"train_loss": -5.825271129608154, "global_step": 56879, "epoch": 1354} {"train_loss": -5.856356620788574, "global_step": 56880, "epoch": 1354} {"train_loss": -5.896068096160889, "global_step": 56881, "epoch": 1354} {"train_loss": -5.846296310424805, "global_step": 56882, "epoch": 1354} {"train_loss": -5.918951034545898, "global_step": 56883, "epoch": 1354} {"train_loss": -5.903520584106445, "global_step": 56884, "epoch": 1354} {"train_loss": -5.974482536315918, "global_step": 56885, "epoch": 1354} {"train_loss": -5.836297035217285, "global_step": 56886, "epoch": 1354} {"train_loss": -5.892516136169434, "global_step": 56887, "epoch": 1354} {"train_loss": -6.027104377746582, "global_step": 56888, "epoch": 1354} {"train_loss": -5.913870334625244, "global_step": 56889, "epoch": 1354} {"train_loss": -5.975963592529297, "global_step": 56890, "epoch": 1354} {"train_loss": -5.936640739440918, "global_step": 56891, "epoch": 1354} {"train_loss": -5.818042755126953, "global_step": 56892, "epoch": 1354} {"train_loss": -5.831334590911865, "global_step": 56893, "epoch": 1354} {"train_loss": -5.913930892944336, "global_step": 56894, "epoch": 1354} {"train_loss": -5.886387825012207, "global_step": 56895, "epoch": 1354} {"train_loss": -5.75498628616333, "global_step": 56896, "epoch": 1354} {"train_loss": -5.7344279289245605, "global_step": 56897, "epoch": 1354} {"train_loss": -5.812182903289795, "global_step": 56898, "epoch": 1354} {"train_loss": -5.857765197753906, "global_step": 56899, "epoch": 1354} {"train_loss": -5.949901103973389, "global_step": 56900, "epoch": 1354} {"train_loss": -5.916834831237793, "global_step": 56901, "epoch": 1354} {"train_loss": -5.865878105163574, "global_step": 56902, "epoch": 1354} {"train_loss": -5.909055233001709, "global_step": 56903, "epoch": 1354} {"train_loss": -6.077690601348877, "global_step": 56904, "epoch": 1354} {"train_loss": -5.811559677124023, "global_step": 56905, "epoch": 1354} {"train_loss": -5.938718795776367, "global_step": 56906, "epoch": 1354} {"train_loss": -5.842291831970215, "global_step": 56907, "epoch": 1354} {"train_loss": -5.862115859985352, "global_step": 56908, "epoch": 1354} {"train_loss": -5.882983718599592, "global_step": 56909, "epoch": 1354, "val_loss": 74383.140625} {"train_loss": -5.859457015991211, "global_step": 56910, "epoch": 1355} {"train_loss": -5.939981937408447, "global_step": 56911, "epoch": 1355} {"train_loss": -5.7958984375, "global_step": 56912, "epoch": 1355} {"train_loss": -5.823418617248535, "global_step": 56913, "epoch": 1355} {"train_loss": -5.889382839202881, "global_step": 56914, "epoch": 1355} {"train_loss": -5.8106513023376465, "global_step": 56915, "epoch": 1355} {"train_loss": -5.885313987731934, "global_step": 56916, "epoch": 1355} {"train_loss": -5.857364654541016, "global_step": 56917, "epoch": 1355} {"train_loss": -5.785435676574707, "global_step": 56918, "epoch": 1355} {"train_loss": -5.910683631896973, "global_step": 56919, "epoch": 1355} {"train_loss": -5.738230228424072, "global_step": 56920, "epoch": 1355} {"train_loss": -5.88335657119751, "global_step": 56921, "epoch": 1355} {"train_loss": -5.847138404846191, "global_step": 56922, "epoch": 1355} {"train_loss": -5.8034563064575195, "global_step": 56923, "epoch": 1355} {"train_loss": -5.780379772186279, "global_step": 56924, "epoch": 1355} {"train_loss": -5.963004112243652, "global_step": 56925, "epoch": 1355} {"train_loss": -5.852655410766602, "global_step": 56926, "epoch": 1355} {"train_loss": -5.761636734008789, "global_step": 56927, "epoch": 1355} {"train_loss": -5.904428005218506, "global_step": 56928, "epoch": 1355} {"train_loss": -5.808367729187012, "global_step": 56929, "epoch": 1355} {"train_loss": -5.77824592590332, "global_step": 56930, "epoch": 1355} {"train_loss": -5.856108665466309, "global_step": 56931, "epoch": 1355} {"train_loss": -5.915621280670166, "global_step": 56932, "epoch": 1355} {"train_loss": -5.913678169250488, "global_step": 56933, "epoch": 1355} {"train_loss": -5.859218597412109, "global_step": 56934, "epoch": 1355} {"train_loss": -5.866875648498535, "global_step": 56935, "epoch": 1355} {"train_loss": -5.893054962158203, "global_step": 56936, "epoch": 1355} {"train_loss": -5.676243782043457, "global_step": 56937, "epoch": 1355} {"train_loss": -5.745596408843994, "global_step": 56938, "epoch": 1355} {"train_loss": -5.875279426574707, "global_step": 56939, "epoch": 1355} {"train_loss": -5.802970886230469, "global_step": 56940, "epoch": 1355} {"train_loss": -5.798781394958496, "global_step": 56941, "epoch": 1355} {"train_loss": -5.707474708557129, "global_step": 56942, "epoch": 1355} {"train_loss": -5.820061206817627, "global_step": 56943, "epoch": 1355} {"train_loss": -5.901928901672363, "global_step": 56944, "epoch": 1355} {"train_loss": -5.786539554595947, "global_step": 56945, "epoch": 1355} {"train_loss": -5.826772689819336, "global_step": 56946, "epoch": 1355} {"train_loss": -5.6286773681640625, "global_step": 56947, "epoch": 1355} {"train_loss": -5.86087703704834, "global_step": 56948, "epoch": 1355} {"train_loss": -5.929625034332275, "global_step": 56949, "epoch": 1355} {"train_loss": -5.759323596954346, "global_step": 56950, "epoch": 1355} {"train_loss": -5.831482569376628, "global_step": 56951, "epoch": 1355, "val_loss": 75070.8046875} {"train_loss": -5.78204345703125, "global_step": 56952, "epoch": 1356} {"train_loss": -5.763007640838623, "global_step": 56953, "epoch": 1356} {"train_loss": -5.803653717041016, "global_step": 56954, "epoch": 1356} {"train_loss": -5.940723896026611, "global_step": 56955, "epoch": 1356} {"train_loss": -5.931473255157471, "global_step": 56956, "epoch": 1356} {"train_loss": -5.774664878845215, "global_step": 56957, "epoch": 1356} {"train_loss": -5.961940765380859, "global_step": 56958, "epoch": 1356} {"train_loss": -5.920862674713135, "global_step": 56959, "epoch": 1356} {"train_loss": -5.93195915222168, "global_step": 56960, "epoch": 1356} {"train_loss": -5.865286827087402, "global_step": 56961, "epoch": 1356} {"train_loss": -5.919159412384033, "global_step": 56962, "epoch": 1356} {"train_loss": -5.834840774536133, "global_step": 56963, "epoch": 1356} {"train_loss": -5.820750713348389, "global_step": 56964, "epoch": 1356} {"train_loss": -5.889886856079102, "global_step": 56965, "epoch": 1356} {"train_loss": -5.740594387054443, "global_step": 56966, "epoch": 1356} {"train_loss": -5.92529296875, "global_step": 56967, "epoch": 1356} {"train_loss": -5.820122241973877, "global_step": 56968, "epoch": 1356} {"train_loss": -6.016737461090088, "global_step": 56969, "epoch": 1356} {"train_loss": -5.72160530090332, "global_step": 56970, "epoch": 1356} {"train_loss": -5.963222503662109, "global_step": 56971, "epoch": 1356} {"train_loss": -5.729140281677246, "global_step": 56972, "epoch": 1356} {"train_loss": -5.8452677726745605, "global_step": 56973, "epoch": 1356} {"train_loss": -5.895768165588379, "global_step": 56974, "epoch": 1356} {"train_loss": -5.756919860839844, "global_step": 56975, "epoch": 1356} {"train_loss": -5.791900634765625, "global_step": 56976, "epoch": 1356} {"train_loss": -5.919818878173828, "global_step": 56977, "epoch": 1356} {"train_loss": -5.819611549377441, "global_step": 56978, "epoch": 1356} {"train_loss": -5.77711820602417, "global_step": 56979, "epoch": 1356} {"train_loss": -5.845161437988281, "global_step": 56980, "epoch": 1356} {"train_loss": -5.871408462524414, "global_step": 56981, "epoch": 1356} {"train_loss": -5.794897079467773, "global_step": 56982, "epoch": 1356} {"train_loss": -5.797023773193359, "global_step": 56983, "epoch": 1356} {"train_loss": -5.937807083129883, "global_step": 56984, "epoch": 1356} {"train_loss": -5.827258586883545, "global_step": 56985, "epoch": 1356} {"train_loss": -5.790363311767578, "global_step": 56986, "epoch": 1356} {"train_loss": -5.95119571685791, "global_step": 56987, "epoch": 1356} {"train_loss": -5.914828777313232, "global_step": 56988, "epoch": 1356} {"train_loss": -5.830844879150391, "global_step": 56989, "epoch": 1356} {"train_loss": -5.907745361328125, "global_step": 56990, "epoch": 1356} {"train_loss": -5.778277397155762, "global_step": 56991, "epoch": 1356} {"train_loss": -5.778564453125, "global_step": 56992, "epoch": 1356} {"train_loss": -5.8515753746032715, "global_step": 56993, "epoch": 1356, "val_loss": 74551.234375} {"train_loss": -5.943986892700195, "global_step": 56994, "epoch": 1357} {"train_loss": -5.8039655685424805, "global_step": 56995, "epoch": 1357} {"train_loss": -5.863390922546387, "global_step": 56996, "epoch": 1357} {"train_loss": -5.806290626525879, "global_step": 56997, "epoch": 1357} {"train_loss": -5.8448357582092285, "global_step": 56998, "epoch": 1357} {"train_loss": -5.862390518188477, "global_step": 56999, "epoch": 1357} {"train_loss": -5.827846050262451, "global_step": 57000, "epoch": 1357} {"train_loss": -5.825715065002441, "global_step": 57001, "epoch": 1357} {"train_loss": -5.94296407699585, "global_step": 57002, "epoch": 1357} {"train_loss": -5.837508201599121, "global_step": 57003, "epoch": 1357} {"train_loss": -5.863746643066406, "global_step": 57004, "epoch": 1357} {"train_loss": -5.956047058105469, "global_step": 57005, "epoch": 1357} {"train_loss": -5.819604396820068, "global_step": 57006, "epoch": 1357} {"train_loss": -5.97556209564209, "global_step": 57007, "epoch": 1357} {"train_loss": -5.832874298095703, "global_step": 57008, "epoch": 1357} {"train_loss": -5.8630170822143555, "global_step": 57009, "epoch": 1357} {"train_loss": -5.835399627685547, "global_step": 57010, "epoch": 1357} {"train_loss": -5.772722244262695, "global_step": 57011, "epoch": 1357} {"train_loss": -5.890110492706299, "global_step": 57012, "epoch": 1357} {"train_loss": -5.890803337097168, "global_step": 57013, "epoch": 1357} {"train_loss": -5.815122604370117, "global_step": 57014, "epoch": 1357} {"train_loss": -5.985160827636719, "global_step": 57015, "epoch": 1357} {"train_loss": -5.852911949157715, "global_step": 57016, "epoch": 1357} {"train_loss": -5.899648666381836, "global_step": 57017, "epoch": 1357} {"train_loss": -5.8870391845703125, "global_step": 57018, "epoch": 1357} {"train_loss": -5.785767555236816, "global_step": 57019, "epoch": 1357} {"train_loss": -5.9656267166137695, "global_step": 57020, "epoch": 1357} {"train_loss": -5.835893630981445, "global_step": 57021, "epoch": 1357} {"train_loss": -5.718416213989258, "global_step": 57022, "epoch": 1357} {"train_loss": -5.754379749298096, "global_step": 57023, "epoch": 1357} {"train_loss": -5.735463619232178, "global_step": 57024, "epoch": 1357} {"train_loss": -5.890871047973633, "global_step": 57025, "epoch": 1357} {"train_loss": -5.845727920532227, "global_step": 57026, "epoch": 1357} {"train_loss": -5.797060966491699, "global_step": 57027, "epoch": 1357} {"train_loss": -5.905008316040039, "global_step": 57028, "epoch": 1357} {"train_loss": -5.793988227844238, "global_step": 57029, "epoch": 1357} {"train_loss": -5.81760311126709, "global_step": 57030, "epoch": 1357} {"train_loss": -5.968201160430908, "global_step": 57031, "epoch": 1357} {"train_loss": -5.908845901489258, "global_step": 57032, "epoch": 1357} {"train_loss": -5.799532413482666, "global_step": 57033, "epoch": 1357} {"train_loss": -5.785097599029541, "global_step": 57034, "epoch": 1357} {"train_loss": -5.856326182683309, "global_step": 57035, "epoch": 1357, "val_loss": 74419.6015625} {"train_loss": -5.811736106872559, "global_step": 57036, "epoch": 1358} {"train_loss": -5.882826328277588, "global_step": 57037, "epoch": 1358} {"train_loss": -5.748007297515869, "global_step": 57038, "epoch": 1358} {"train_loss": -5.849809646606445, "global_step": 57039, "epoch": 1358} {"train_loss": -5.909301280975342, "global_step": 57040, "epoch": 1358} {"train_loss": -5.868860244750977, "global_step": 57041, "epoch": 1358} {"train_loss": -5.965572357177734, "global_step": 57042, "epoch": 1358} {"train_loss": -6.010140419006348, "global_step": 57043, "epoch": 1358} {"train_loss": -5.839506149291992, "global_step": 57044, "epoch": 1358} {"train_loss": -5.871380805969238, "global_step": 57045, "epoch": 1358} {"train_loss": -5.863443374633789, "global_step": 57046, "epoch": 1358} {"train_loss": -5.828752040863037, "global_step": 57047, "epoch": 1358} {"train_loss": -5.9000444412231445, "global_step": 57048, "epoch": 1358} {"train_loss": -5.9216132164001465, "global_step": 57049, "epoch": 1358} {"train_loss": -5.811750411987305, "global_step": 57050, "epoch": 1358} {"train_loss": -5.766395568847656, "global_step": 57051, "epoch": 1358} {"train_loss": -5.906682968139648, "global_step": 57052, "epoch": 1358} {"train_loss": -5.7985076904296875, "global_step": 57053, "epoch": 1358} {"train_loss": -5.948291778564453, "global_step": 57054, "epoch": 1358} {"train_loss": -5.967248916625977, "global_step": 57055, "epoch": 1358} {"train_loss": -5.858614921569824, "global_step": 57056, "epoch": 1358} {"train_loss": -5.951148986816406, "global_step": 57057, "epoch": 1358} {"train_loss": -5.992687225341797, "global_step": 57058, "epoch": 1358} {"train_loss": -5.943237781524658, "global_step": 57059, "epoch": 1358} {"train_loss": -5.877841949462891, "global_step": 57060, "epoch": 1358} {"train_loss": -5.912406921386719, "global_step": 57061, "epoch": 1358} {"train_loss": -5.79682731628418, "global_step": 57062, "epoch": 1358} {"train_loss": -5.792360305786133, "global_step": 57063, "epoch": 1358} {"train_loss": -5.968114852905273, "global_step": 57064, "epoch": 1358} {"train_loss": -5.910547256469727, "global_step": 57065, "epoch": 1358} {"train_loss": -5.779314994812012, "global_step": 57066, "epoch": 1358} {"train_loss": -5.947847843170166, "global_step": 57067, "epoch": 1358} {"train_loss": -5.882587432861328, "global_step": 57068, "epoch": 1358} {"train_loss": -5.8152079582214355, "global_step": 57069, "epoch": 1358} {"train_loss": -5.765493392944336, "global_step": 57070, "epoch": 1358} {"train_loss": -5.779336929321289, "global_step": 57071, "epoch": 1358} {"train_loss": -5.835289001464844, "global_step": 57072, "epoch": 1358} {"train_loss": -5.8605804443359375, "global_step": 57073, "epoch": 1358} {"train_loss": -5.998878479003906, "global_step": 57074, "epoch": 1358} {"train_loss": -5.92915153503418, "global_step": 57075, "epoch": 1358} {"train_loss": -5.859533786773682, "global_step": 57076, "epoch": 1358} {"train_loss": -5.8741399220057895, "global_step": 57077, "epoch": 1358, "val_loss": 74077.6796875} {"train_loss": -5.8706512451171875, "global_step": 57078, "epoch": 1359} {"train_loss": -5.85715389251709, "global_step": 57079, "epoch": 1359} {"train_loss": -5.88252592086792, "global_step": 57080, "epoch": 1359} {"train_loss": -5.892552852630615, "global_step": 57081, "epoch": 1359} {"train_loss": -5.950934410095215, "global_step": 57082, "epoch": 1359} {"train_loss": -5.9770307540893555, "global_step": 57083, "epoch": 1359} {"train_loss": -5.752274036407471, "global_step": 57084, "epoch": 1359} {"train_loss": -5.789037227630615, "global_step": 57085, "epoch": 1359} {"train_loss": -5.6832780838012695, "global_step": 57086, "epoch": 1359} {"train_loss": -5.889538288116455, "global_step": 57087, "epoch": 1359} {"train_loss": -5.920290946960449, "global_step": 57088, "epoch": 1359} {"train_loss": -5.861830234527588, "global_step": 57089, "epoch": 1359} {"train_loss": -5.702221393585205, "global_step": 57090, "epoch": 1359} {"train_loss": -5.923830986022949, "global_step": 57091, "epoch": 1359} {"train_loss": -5.92795467376709, "global_step": 57092, "epoch": 1359} {"train_loss": -5.9753804206848145, "global_step": 57093, "epoch": 1359} {"train_loss": -5.88175106048584, "global_step": 57094, "epoch": 1359} {"train_loss": -5.7842793464660645, "global_step": 57095, "epoch": 1359} {"train_loss": -5.999963760375977, "global_step": 57096, "epoch": 1359} {"train_loss": -5.903261184692383, "global_step": 57097, "epoch": 1359} {"train_loss": -5.925768852233887, "global_step": 57098, "epoch": 1359} {"train_loss": -5.888035774230957, "global_step": 57099, "epoch": 1359} {"train_loss": -5.893733024597168, "global_step": 57100, "epoch": 1359} {"train_loss": -5.994400501251221, "global_step": 57101, "epoch": 1359} {"train_loss": -5.66756010055542, "global_step": 57102, "epoch": 1359} {"train_loss": -5.8365960121154785, "global_step": 57103, "epoch": 1359} {"train_loss": -5.863067626953125, "global_step": 57104, "epoch": 1359} {"train_loss": -5.8439531326293945, "global_step": 57105, "epoch": 1359} {"train_loss": -5.852238655090332, "global_step": 57106, "epoch": 1359} {"train_loss": -5.935279846191406, "global_step": 57107, "epoch": 1359} {"train_loss": -5.845378398895264, "global_step": 57108, "epoch": 1359} {"train_loss": -5.9689178466796875, "global_step": 57109, "epoch": 1359} {"train_loss": -5.857222557067871, "global_step": 57110, "epoch": 1359} {"train_loss": -5.781346321105957, "global_step": 57111, "epoch": 1359} {"train_loss": -5.858601093292236, "global_step": 57112, "epoch": 1359} {"train_loss": -5.853503227233887, "global_step": 57113, "epoch": 1359} {"train_loss": -5.9867634773254395, "global_step": 57114, "epoch": 1359} {"train_loss": -5.962543487548828, "global_step": 57115, "epoch": 1359} {"train_loss": -5.7742695808410645, "global_step": 57116, "epoch": 1359} {"train_loss": -5.833987712860107, "global_step": 57117, "epoch": 1359} {"train_loss": -5.928731918334961, "global_step": 57118, "epoch": 1359} {"train_loss": -5.875414984566825, "global_step": 57119, "epoch": 1359, "val_loss": 74499.5546875} {"train_loss": -5.79042387008667, "global_step": 57120, "epoch": 1360} {"train_loss": -5.803022384643555, "global_step": 57121, "epoch": 1360} {"train_loss": -5.909562110900879, "global_step": 57122, "epoch": 1360} {"train_loss": -5.785497665405273, "global_step": 57123, "epoch": 1360} {"train_loss": -5.738582611083984, "global_step": 57124, "epoch": 1360} {"train_loss": -5.8442535400390625, "global_step": 57125, "epoch": 1360} {"train_loss": -5.861127853393555, "global_step": 57126, "epoch": 1360} {"train_loss": -5.884905815124512, "global_step": 57127, "epoch": 1360} {"train_loss": -5.71658182144165, "global_step": 57128, "epoch": 1360} {"train_loss": -5.785788059234619, "global_step": 57129, "epoch": 1360} {"train_loss": -5.950255393981934, "global_step": 57130, "epoch": 1360} {"train_loss": -5.7052321434021, "global_step": 57131, "epoch": 1360} {"train_loss": -5.801499843597412, "global_step": 57132, "epoch": 1360} {"train_loss": -5.9718017578125, "global_step": 57133, "epoch": 1360} {"train_loss": -5.725683689117432, "global_step": 57134, "epoch": 1360} {"train_loss": -5.884292125701904, "global_step": 57135, "epoch": 1360} {"train_loss": -5.846010208129883, "global_step": 57136, "epoch": 1360} {"train_loss": -5.828917503356934, "global_step": 57137, "epoch": 1360} {"train_loss": -5.800507545471191, "global_step": 57138, "epoch": 1360} {"train_loss": -5.849183082580566, "global_step": 57139, "epoch": 1360} {"train_loss": -5.90001106262207, "global_step": 57140, "epoch": 1360} {"train_loss": -5.881024360656738, "global_step": 57141, "epoch": 1360} {"train_loss": -5.895671844482422, "global_step": 57142, "epoch": 1360} {"train_loss": -5.888269424438477, "global_step": 57143, "epoch": 1360} {"train_loss": -5.856263160705566, "global_step": 57144, "epoch": 1360} {"train_loss": -5.93295955657959, "global_step": 57145, "epoch": 1360} {"train_loss": -5.902917861938477, "global_step": 57146, "epoch": 1360} {"train_loss": -5.871834754943848, "global_step": 57147, "epoch": 1360} {"train_loss": -5.82090425491333, "global_step": 57148, "epoch": 1360} {"train_loss": -5.809974193572998, "global_step": 57149, "epoch": 1360} {"train_loss": -5.910487174987793, "global_step": 57150, "epoch": 1360} {"train_loss": -5.758903503417969, "global_step": 57151, "epoch": 1360} {"train_loss": -5.922902584075928, "global_step": 57152, "epoch": 1360} {"train_loss": -5.854653358459473, "global_step": 57153, "epoch": 1360} {"train_loss": -5.835662364959717, "global_step": 57154, "epoch": 1360} {"train_loss": -5.931240081787109, "global_step": 57155, "epoch": 1360} {"train_loss": -5.883671283721924, "global_step": 57156, "epoch": 1360} {"train_loss": -5.829084873199463, "global_step": 57157, "epoch": 1360} {"train_loss": -5.877999305725098, "global_step": 57158, "epoch": 1360} {"train_loss": -5.884700298309326, "global_step": 57159, "epoch": 1360} {"train_loss": -5.880910873413086, "global_step": 57160, "epoch": 1360} {"train_loss": -5.850468590146019, "global_step": 57161, "epoch": 1360, "val_loss": 74748.4375} {"train_loss": -5.691205978393555, "global_step": 57162, "epoch": 1361} {"train_loss": -5.975638389587402, "global_step": 57163, "epoch": 1361} {"train_loss": -5.91302490234375, "global_step": 57164, "epoch": 1361} {"train_loss": -5.777520656585693, "global_step": 57165, "epoch": 1361} {"train_loss": -5.923381805419922, "global_step": 57166, "epoch": 1361} {"train_loss": -5.966561317443848, "global_step": 57167, "epoch": 1361} {"train_loss": -5.855744361877441, "global_step": 57168, "epoch": 1361} {"train_loss": -5.808492660522461, "global_step": 57169, "epoch": 1361} {"train_loss": -5.881998538970947, "global_step": 57170, "epoch": 1361} {"train_loss": -5.8673810958862305, "global_step": 57171, "epoch": 1361} {"train_loss": -5.783163070678711, "global_step": 57172, "epoch": 1361} {"train_loss": -5.9710869789123535, "global_step": 57173, "epoch": 1361} {"train_loss": -5.780984878540039, "global_step": 57174, "epoch": 1361} {"train_loss": -5.915600299835205, "global_step": 57175, "epoch": 1361} {"train_loss": -5.890695571899414, "global_step": 57176, "epoch": 1361} {"train_loss": -5.826183319091797, "global_step": 57177, "epoch": 1361} {"train_loss": -5.816906929016113, "global_step": 57178, "epoch": 1361} {"train_loss": -5.9011945724487305, "global_step": 57179, "epoch": 1361} {"train_loss": -5.8878254890441895, "global_step": 57180, "epoch": 1361} {"train_loss": -5.9395976066589355, "global_step": 57181, "epoch": 1361} {"train_loss": -5.919149398803711, "global_step": 57182, "epoch": 1361} {"train_loss": -5.691999435424805, "global_step": 57183, "epoch": 1361} {"train_loss": -5.899931907653809, "global_step": 57184, "epoch": 1361} {"train_loss": -5.737793445587158, "global_step": 57185, "epoch": 1361} {"train_loss": -5.798431396484375, "global_step": 57186, "epoch": 1361} {"train_loss": -5.927643299102783, "global_step": 57187, "epoch": 1361} {"train_loss": -5.795444488525391, "global_step": 57188, "epoch": 1361} {"train_loss": -5.866110801696777, "global_step": 57189, "epoch": 1361} {"train_loss": -5.741397857666016, "global_step": 57190, "epoch": 1361} {"train_loss": -5.869483947753906, "global_step": 57191, "epoch": 1361} {"train_loss": -5.816445350646973, "global_step": 57192, "epoch": 1361} {"train_loss": -5.870936393737793, "global_step": 57193, "epoch": 1361} {"train_loss": -5.80728006362915, "global_step": 57194, "epoch": 1361} {"train_loss": -5.759190559387207, "global_step": 57195, "epoch": 1361} {"train_loss": -5.869184494018555, "global_step": 57196, "epoch": 1361} {"train_loss": -5.9276299476623535, "global_step": 57197, "epoch": 1361} {"train_loss": -5.805940628051758, "global_step": 57198, "epoch": 1361} {"train_loss": -5.825654029846191, "global_step": 57199, "epoch": 1361} {"train_loss": -5.96928596496582, "global_step": 57200, "epoch": 1361} {"train_loss": -5.9239501953125, "global_step": 57201, "epoch": 1361} {"train_loss": -5.899110317230225, "global_step": 57202, "epoch": 1361} {"train_loss": -5.856963350659325, "global_step": 57203, "epoch": 1361, "val_loss": 74327.8515625} {"train_loss": -5.936830520629883, "global_step": 57204, "epoch": 1362} {"train_loss": -5.866727828979492, "global_step": 57205, "epoch": 1362} {"train_loss": -5.982066631317139, "global_step": 57206, "epoch": 1362} {"train_loss": -5.898184299468994, "global_step": 57207, "epoch": 1362} {"train_loss": -5.848807334899902, "global_step": 57208, "epoch": 1362} {"train_loss": -5.958472728729248, "global_step": 57209, "epoch": 1362} {"train_loss": -5.698979377746582, "global_step": 57210, "epoch": 1362} {"train_loss": -5.747404098510742, "global_step": 57211, "epoch": 1362} {"train_loss": -5.853508949279785, "global_step": 57212, "epoch": 1362} {"train_loss": -5.786141395568848, "global_step": 57213, "epoch": 1362} {"train_loss": -5.8657355308532715, "global_step": 57214, "epoch": 1362} {"train_loss": -5.7646942138671875, "global_step": 57215, "epoch": 1362} {"train_loss": -5.774471759796143, "global_step": 57216, "epoch": 1362} {"train_loss": -5.830644607543945, "global_step": 57217, "epoch": 1362} {"train_loss": -5.76997184753418, "global_step": 57218, "epoch": 1362} {"train_loss": -5.942607879638672, "global_step": 57219, "epoch": 1362} {"train_loss": -5.901211738586426, "global_step": 57220, "epoch": 1362} {"train_loss": -5.7463531494140625, "global_step": 57221, "epoch": 1362} {"train_loss": -5.8810014724731445, "global_step": 57222, "epoch": 1362} {"train_loss": -5.817295551300049, "global_step": 57223, "epoch": 1362} {"train_loss": -5.768787384033203, "global_step": 57224, "epoch": 1362} {"train_loss": -5.83817720413208, "global_step": 57225, "epoch": 1362} {"train_loss": -5.8040266036987305, "global_step": 57226, "epoch": 1362} {"train_loss": -5.816888332366943, "global_step": 57227, "epoch": 1362} {"train_loss": -5.89754581451416, "global_step": 57228, "epoch": 1362} {"train_loss": -5.823195934295654, "global_step": 57229, "epoch": 1362} {"train_loss": -5.982749938964844, "global_step": 57230, "epoch": 1362} {"train_loss": -5.803089141845703, "global_step": 57231, "epoch": 1362} {"train_loss": -5.820031642913818, "global_step": 57232, "epoch": 1362} {"train_loss": -5.763044834136963, "global_step": 57233, "epoch": 1362} {"train_loss": -5.861629009246826, "global_step": 57234, "epoch": 1362} {"train_loss": -5.733187675476074, "global_step": 57235, "epoch": 1362} {"train_loss": -5.633895397186279, "global_step": 57236, "epoch": 1362} {"train_loss": -5.8241472244262695, "global_step": 57237, "epoch": 1362} {"train_loss": -5.600480079650879, "global_step": 57238, "epoch": 1362} {"train_loss": -5.74997615814209, "global_step": 57239, "epoch": 1362} {"train_loss": -5.756892204284668, "global_step": 57240, "epoch": 1362} {"train_loss": -5.733339309692383, "global_step": 57241, "epoch": 1362} {"train_loss": -5.696320056915283, "global_step": 57242, "epoch": 1362} {"train_loss": -5.795489311218262, "global_step": 57243, "epoch": 1362} {"train_loss": -5.825654983520508, "global_step": 57244, "epoch": 1362} {"train_loss": -5.813645203908284, "global_step": 57245, "epoch": 1362, "val_loss": 74472.6953125} {"train_loss": -5.928681373596191, "global_step": 57246, "epoch": 1363} {"train_loss": -5.732011318206787, "global_step": 57247, "epoch": 1363} {"train_loss": -5.848015785217285, "global_step": 57248, "epoch": 1363} {"train_loss": -5.845773696899414, "global_step": 57249, "epoch": 1363} {"train_loss": -5.774387359619141, "global_step": 57250, "epoch": 1363} {"train_loss": -5.819735527038574, "global_step": 57251, "epoch": 1363} {"train_loss": -5.8453850746154785, "global_step": 57252, "epoch": 1363} {"train_loss": -5.833565711975098, "global_step": 57253, "epoch": 1363} {"train_loss": -5.834650039672852, "global_step": 57254, "epoch": 1363} {"train_loss": -5.892299652099609, "global_step": 57255, "epoch": 1363} {"train_loss": -5.9060516357421875, "global_step": 57256, "epoch": 1363} {"train_loss": -5.763721942901611, "global_step": 57257, "epoch": 1363} {"train_loss": -5.998637676239014, "global_step": 57258, "epoch": 1363} {"train_loss": -5.974727630615234, "global_step": 57259, "epoch": 1363} {"train_loss": -5.861029624938965, "global_step": 57260, "epoch": 1363} {"train_loss": -5.830025672912598, "global_step": 57261, "epoch": 1363} {"train_loss": -5.8819899559021, "global_step": 57262, "epoch": 1363} {"train_loss": -5.912213325500488, "global_step": 57263, "epoch": 1363} {"train_loss": -5.840429306030273, "global_step": 57264, "epoch": 1363} {"train_loss": -5.883770942687988, "global_step": 57265, "epoch": 1363} {"train_loss": -5.859796524047852, "global_step": 57266, "epoch": 1363} {"train_loss": -5.9087605476379395, "global_step": 57267, "epoch": 1363} {"train_loss": -5.890483856201172, "global_step": 57268, "epoch": 1363} {"train_loss": -5.933936595916748, "global_step": 57269, "epoch": 1363} {"train_loss": -5.7992730140686035, "global_step": 57270, "epoch": 1363} {"train_loss": -5.906432151794434, "global_step": 57271, "epoch": 1363} {"train_loss": -5.838836193084717, "global_step": 57272, "epoch": 1363} {"train_loss": -5.85269832611084, "global_step": 57273, "epoch": 1363} {"train_loss": -5.919317245483398, "global_step": 57274, "epoch": 1363} {"train_loss": -5.704821586608887, "global_step": 57275, "epoch": 1363} {"train_loss": -5.953927516937256, "global_step": 57276, "epoch": 1363} {"train_loss": -5.856643199920654, "global_step": 57277, "epoch": 1363} {"train_loss": -5.782292366027832, "global_step": 57278, "epoch": 1363} {"train_loss": -5.737786293029785, "global_step": 57279, "epoch": 1363} {"train_loss": -5.8359479904174805, "global_step": 57280, "epoch": 1363} {"train_loss": -5.817168235778809, "global_step": 57281, "epoch": 1363} {"train_loss": -5.86631965637207, "global_step": 57282, "epoch": 1363} {"train_loss": -5.778048515319824, "global_step": 57283, "epoch": 1363} {"train_loss": -5.860138416290283, "global_step": 57284, "epoch": 1363} {"train_loss": -5.7696213722229, "global_step": 57285, "epoch": 1363} {"train_loss": -5.788990020751953, "global_step": 57286, "epoch": 1363} {"train_loss": -5.85370609873817, "global_step": 57287, "epoch": 1363, "val_loss": 74101.4609375} {"train_loss": -5.793338775634766, "global_step": 57288, "epoch": 1364} {"train_loss": -5.716341972351074, "global_step": 57289, "epoch": 1364} {"train_loss": -5.779808044433594, "global_step": 57290, "epoch": 1364} {"train_loss": -5.945076942443848, "global_step": 57291, "epoch": 1364} {"train_loss": -5.969067573547363, "global_step": 57292, "epoch": 1364} {"train_loss": -5.8893585205078125, "global_step": 57293, "epoch": 1364} {"train_loss": -5.822999954223633, "global_step": 57294, "epoch": 1364} {"train_loss": -5.875572204589844, "global_step": 57295, "epoch": 1364} {"train_loss": -5.91847038269043, "global_step": 57296, "epoch": 1364} {"train_loss": -5.843026638031006, "global_step": 57297, "epoch": 1364} {"train_loss": -5.965372085571289, "global_step": 57298, "epoch": 1364} {"train_loss": -5.83638334274292, "global_step": 57299, "epoch": 1364} {"train_loss": -5.934028148651123, "global_step": 57300, "epoch": 1364} {"train_loss": -5.863719463348389, "global_step": 57301, "epoch": 1364} {"train_loss": -5.762243270874023, "global_step": 57302, "epoch": 1364} {"train_loss": -5.8984479904174805, "global_step": 57303, "epoch": 1364} {"train_loss": -5.933150291442871, "global_step": 57304, "epoch": 1364} {"train_loss": -5.924291610717773, "global_step": 57305, "epoch": 1364} {"train_loss": -5.845559597015381, "global_step": 57306, "epoch": 1364} {"train_loss": -5.974689483642578, "global_step": 57307, "epoch": 1364} {"train_loss": -5.881339073181152, "global_step": 57308, "epoch": 1364} {"train_loss": -5.853445053100586, "global_step": 57309, "epoch": 1364} {"train_loss": -5.993090629577637, "global_step": 57310, "epoch": 1364} {"train_loss": -5.951254844665527, "global_step": 57311, "epoch": 1364} {"train_loss": -5.86198091506958, "global_step": 57312, "epoch": 1364} {"train_loss": -5.939320087432861, "global_step": 57313, "epoch": 1364} {"train_loss": -5.820700168609619, "global_step": 57314, "epoch": 1364} {"train_loss": -5.847270488739014, "global_step": 57315, "epoch": 1364} {"train_loss": -5.911821365356445, "global_step": 57316, "epoch": 1364} {"train_loss": -5.911282539367676, "global_step": 57317, "epoch": 1364} {"train_loss": -5.979713439941406, "global_step": 57318, "epoch": 1364} {"train_loss": -5.905797958374023, "global_step": 57319, "epoch": 1364} {"train_loss": -5.9768853187561035, "global_step": 57320, "epoch": 1364} {"train_loss": -5.951840877532959, "global_step": 57321, "epoch": 1364} {"train_loss": -5.902719497680664, "global_step": 57322, "epoch": 1364} {"train_loss": -5.923210620880127, "global_step": 57323, "epoch": 1364} {"train_loss": -5.851872444152832, "global_step": 57324, "epoch": 1364} {"train_loss": -5.765558242797852, "global_step": 57325, "epoch": 1364} {"train_loss": -5.765700340270996, "global_step": 57326, "epoch": 1364} {"train_loss": -5.825484275817871, "global_step": 57327, "epoch": 1364} {"train_loss": -5.914973258972168, "global_step": 57328, "epoch": 1364} {"train_loss": -5.8844765822092695, "global_step": 57329, "epoch": 1364, "val_loss": 74673.390625} {"train_loss": -5.846186637878418, "global_step": 57330, "epoch": 1365} {"train_loss": -5.790665149688721, "global_step": 57331, "epoch": 1365} {"train_loss": -5.8424787521362305, "global_step": 57332, "epoch": 1365} {"train_loss": -5.899759769439697, "global_step": 57333, "epoch": 1365} {"train_loss": -5.916983127593994, "global_step": 57334, "epoch": 1365} {"train_loss": -5.881349563598633, "global_step": 57335, "epoch": 1365} {"train_loss": -5.848369598388672, "global_step": 57336, "epoch": 1365} {"train_loss": -5.900650978088379, "global_step": 57337, "epoch": 1365} {"train_loss": -5.855260372161865, "global_step": 57338, "epoch": 1365} {"train_loss": -5.946948051452637, "global_step": 57339, "epoch": 1365} {"train_loss": -5.932169437408447, "global_step": 57340, "epoch": 1365} {"train_loss": -5.977609634399414, "global_step": 57341, "epoch": 1365} {"train_loss": -5.851864814758301, "global_step": 57342, "epoch": 1365} {"train_loss": -5.970911026000977, "global_step": 57343, "epoch": 1365} {"train_loss": -5.91011381149292, "global_step": 57344, "epoch": 1365} {"train_loss": -5.751302242279053, "global_step": 57345, "epoch": 1365} {"train_loss": -5.950814723968506, "global_step": 57346, "epoch": 1365} {"train_loss": -5.862455368041992, "global_step": 57347, "epoch": 1365} {"train_loss": -5.897821426391602, "global_step": 57348, "epoch": 1365} {"train_loss": -5.942898750305176, "global_step": 57349, "epoch": 1365} {"train_loss": -5.954090595245361, "global_step": 57350, "epoch": 1365} {"train_loss": -5.918509483337402, "global_step": 57351, "epoch": 1365} {"train_loss": -5.803308486938477, "global_step": 57352, "epoch": 1365} {"train_loss": -5.982844352722168, "global_step": 57353, "epoch": 1365} {"train_loss": -5.968906402587891, "global_step": 57354, "epoch": 1365} {"train_loss": -5.895279884338379, "global_step": 57355, "epoch": 1365} {"train_loss": -5.878045558929443, "global_step": 57356, "epoch": 1365} {"train_loss": -5.974312782287598, "global_step": 57357, "epoch": 1365} {"train_loss": -5.76951789855957, "global_step": 57358, "epoch": 1365} {"train_loss": -5.855224609375, "global_step": 57359, "epoch": 1365} {"train_loss": -5.909997940063477, "global_step": 57360, "epoch": 1365} {"train_loss": -5.880954742431641, "global_step": 57361, "epoch": 1365} {"train_loss": -5.931554794311523, "global_step": 57362, "epoch": 1365} {"train_loss": -5.898635387420654, "global_step": 57363, "epoch": 1365} {"train_loss": -5.80379581451416, "global_step": 57364, "epoch": 1365} {"train_loss": -5.7441277503967285, "global_step": 57365, "epoch": 1365} {"train_loss": -5.914095878601074, "global_step": 57366, "epoch": 1365} {"train_loss": -5.864693641662598, "global_step": 57367, "epoch": 1365} {"train_loss": -5.780097007751465, "global_step": 57368, "epoch": 1365} {"train_loss": -5.880453109741211, "global_step": 57369, "epoch": 1365} {"train_loss": -5.899095058441162, "global_step": 57370, "epoch": 1365} {"train_loss": -5.882007950828189, "global_step": 57371, "epoch": 1365, "val_loss": 74200.2578125} {"train_loss": -5.866393566131592, "global_step": 57372, "epoch": 1366} {"train_loss": -5.776021480560303, "global_step": 57373, "epoch": 1366} {"train_loss": -5.877379417419434, "global_step": 57374, "epoch": 1366} {"train_loss": -5.771173477172852, "global_step": 57375, "epoch": 1366} {"train_loss": -5.817476272583008, "global_step": 57376, "epoch": 1366} {"train_loss": -5.802220344543457, "global_step": 57377, "epoch": 1366} {"train_loss": -5.881664752960205, "global_step": 57378, "epoch": 1366} {"train_loss": -5.795725345611572, "global_step": 57379, "epoch": 1366} {"train_loss": -5.913081645965576, "global_step": 57380, "epoch": 1366} {"train_loss": -5.96345329284668, "global_step": 57381, "epoch": 1366} {"train_loss": -5.785606861114502, "global_step": 57382, "epoch": 1366} {"train_loss": -5.873826503753662, "global_step": 57383, "epoch": 1366} {"train_loss": -5.8566365242004395, "global_step": 57384, "epoch": 1366} {"train_loss": -5.955465316772461, "global_step": 57385, "epoch": 1366} {"train_loss": -5.797489166259766, "global_step": 57386, "epoch": 1366} {"train_loss": -5.808380126953125, "global_step": 57387, "epoch": 1366} {"train_loss": -5.870018005371094, "global_step": 57388, "epoch": 1366} {"train_loss": -5.8581109046936035, "global_step": 57389, "epoch": 1366} {"train_loss": -5.88576602935791, "global_step": 57390, "epoch": 1366} {"train_loss": -5.8430891036987305, "global_step": 57391, "epoch": 1366} {"train_loss": -5.863699436187744, "global_step": 57392, "epoch": 1366} {"train_loss": -5.823349475860596, "global_step": 57393, "epoch": 1366} {"train_loss": -5.845779895782471, "global_step": 57394, "epoch": 1366} {"train_loss": -6.004965782165527, "global_step": 57395, "epoch": 1366} {"train_loss": -5.873692035675049, "global_step": 57396, "epoch": 1366} {"train_loss": -5.934258937835693, "global_step": 57397, "epoch": 1366} {"train_loss": -5.817933082580566, "global_step": 57398, "epoch": 1366} {"train_loss": -5.887155532836914, "global_step": 57399, "epoch": 1366} {"train_loss": -5.943096160888672, "global_step": 57400, "epoch": 1366} {"train_loss": -5.817768096923828, "global_step": 57401, "epoch": 1366} {"train_loss": -5.945071220397949, "global_step": 57402, "epoch": 1366} {"train_loss": -5.821000099182129, "global_step": 57403, "epoch": 1366} {"train_loss": -5.902823448181152, "global_step": 57404, "epoch": 1366} {"train_loss": -5.927272796630859, "global_step": 57405, "epoch": 1366} {"train_loss": -5.9739603996276855, "global_step": 57406, "epoch": 1366} {"train_loss": -5.741024971008301, "global_step": 57407, "epoch": 1366} {"train_loss": -5.837975025177002, "global_step": 57408, "epoch": 1366} {"train_loss": -5.887382507324219, "global_step": 57409, "epoch": 1366} {"train_loss": -5.861843585968018, "global_step": 57410, "epoch": 1366} {"train_loss": -5.871589660644531, "global_step": 57411, "epoch": 1366} {"train_loss": -5.885807514190674, "global_step": 57412, "epoch": 1366} {"train_loss": -5.866526058741978, "global_step": 57413, "epoch": 1366, "val_loss": 74564.3984375} {"train_loss": -5.832437515258789, "global_step": 57414, "epoch": 1367} {"train_loss": -5.925624847412109, "global_step": 57415, "epoch": 1367} {"train_loss": -5.865193843841553, "global_step": 57416, "epoch": 1367} {"train_loss": -5.857570648193359, "global_step": 57417, "epoch": 1367} {"train_loss": -5.748899936676025, "global_step": 57418, "epoch": 1367} {"train_loss": -5.92966365814209, "global_step": 57419, "epoch": 1367} {"train_loss": -5.853065490722656, "global_step": 57420, "epoch": 1367} {"train_loss": -5.8955559730529785, "global_step": 57421, "epoch": 1367} {"train_loss": -5.869423866271973, "global_step": 57422, "epoch": 1367} {"train_loss": -5.7482404708862305, "global_step": 57423, "epoch": 1367} {"train_loss": -5.616596221923828, "global_step": 57424, "epoch": 1367} {"train_loss": -5.797778129577637, "global_step": 57425, "epoch": 1367} {"train_loss": -5.8292741775512695, "global_step": 57426, "epoch": 1367} {"train_loss": -5.850703239440918, "global_step": 57427, "epoch": 1367} {"train_loss": -5.9984941482543945, "global_step": 57428, "epoch": 1367} {"train_loss": -5.734859466552734, "global_step": 57429, "epoch": 1367} {"train_loss": -5.877825736999512, "global_step": 57430, "epoch": 1367} {"train_loss": -5.808813095092773, "global_step": 57431, "epoch": 1367} {"train_loss": -5.767139434814453, "global_step": 57432, "epoch": 1367} {"train_loss": -5.792665958404541, "global_step": 57433, "epoch": 1367} {"train_loss": -5.775467872619629, "global_step": 57434, "epoch": 1367} {"train_loss": -5.82747745513916, "global_step": 57435, "epoch": 1367} {"train_loss": -5.848818302154541, "global_step": 57436, "epoch": 1367} {"train_loss": -5.784241676330566, "global_step": 57437, "epoch": 1367} {"train_loss": -5.826846122741699, "global_step": 57438, "epoch": 1367} {"train_loss": -5.879192352294922, "global_step": 57439, "epoch": 1367} {"train_loss": -5.675627708435059, "global_step": 57440, "epoch": 1367} {"train_loss": -5.871706485748291, "global_step": 57441, "epoch": 1367} {"train_loss": -5.8962907791137695, "global_step": 57442, "epoch": 1367} {"train_loss": -5.965085506439209, "global_step": 57443, "epoch": 1367} {"train_loss": -5.854784965515137, "global_step": 57444, "epoch": 1367} {"train_loss": -5.816071510314941, "global_step": 57445, "epoch": 1367} {"train_loss": -5.8175811767578125, "global_step": 57446, "epoch": 1367} {"train_loss": -5.918100357055664, "global_step": 57447, "epoch": 1367} {"train_loss": -5.855467796325684, "global_step": 57448, "epoch": 1367} {"train_loss": -5.938241481781006, "global_step": 57449, "epoch": 1367} {"train_loss": -5.844880104064941, "global_step": 57450, "epoch": 1367} {"train_loss": -5.963476181030273, "global_step": 57451, "epoch": 1367} {"train_loss": -5.7998948097229, "global_step": 57452, "epoch": 1367} {"train_loss": -5.830522537231445, "global_step": 57453, "epoch": 1367} {"train_loss": -5.975299835205078, "global_step": 57454, "epoch": 1367} {"train_loss": -5.844839073362804, "global_step": 57455, "epoch": 1367, "val_loss": 74265.0234375} {"train_loss": -5.886980056762695, "global_step": 57456, "epoch": 1368} {"train_loss": -5.953595161437988, "global_step": 57457, "epoch": 1368} {"train_loss": -5.921746253967285, "global_step": 57458, "epoch": 1368} {"train_loss": -5.804628849029541, "global_step": 57459, "epoch": 1368} {"train_loss": -5.937357425689697, "global_step": 57460, "epoch": 1368} {"train_loss": -5.910961151123047, "global_step": 57461, "epoch": 1368} {"train_loss": -5.958046913146973, "global_step": 57462, "epoch": 1368} {"train_loss": -5.924954414367676, "global_step": 57463, "epoch": 1368} {"train_loss": -5.877290725708008, "global_step": 57464, "epoch": 1368} {"train_loss": -5.905611038208008, "global_step": 57465, "epoch": 1368} {"train_loss": -5.902988433837891, "global_step": 57466, "epoch": 1368} {"train_loss": -5.738143444061279, "global_step": 57467, "epoch": 1368} {"train_loss": -6.023773670196533, "global_step": 57468, "epoch": 1368} {"train_loss": -5.894222259521484, "global_step": 57469, "epoch": 1368} {"train_loss": -5.877142906188965, "global_step": 57470, "epoch": 1368} {"train_loss": -5.855339050292969, "global_step": 57471, "epoch": 1368} {"train_loss": -5.798375606536865, "global_step": 57472, "epoch": 1368} {"train_loss": -5.953651428222656, "global_step": 57473, "epoch": 1368} {"train_loss": -5.860900402069092, "global_step": 57474, "epoch": 1368} {"train_loss": -5.866610050201416, "global_step": 57475, "epoch": 1368} {"train_loss": -5.856095314025879, "global_step": 57476, "epoch": 1368} {"train_loss": -5.876553535461426, "global_step": 57477, "epoch": 1368} {"train_loss": -5.855578899383545, "global_step": 57478, "epoch": 1368} {"train_loss": -5.759862899780273, "global_step": 57479, "epoch": 1368} {"train_loss": -5.774857521057129, "global_step": 57480, "epoch": 1368} {"train_loss": -5.860769271850586, "global_step": 57481, "epoch": 1368} {"train_loss": -5.843446731567383, "global_step": 57482, "epoch": 1368} {"train_loss": -5.881296157836914, "global_step": 57483, "epoch": 1368} {"train_loss": -5.877196788787842, "global_step": 57484, "epoch": 1368} {"train_loss": -5.778988838195801, "global_step": 57485, "epoch": 1368} {"train_loss": -5.830243110656738, "global_step": 57486, "epoch": 1368} {"train_loss": -5.779314994812012, "global_step": 57487, "epoch": 1368} {"train_loss": -5.795313835144043, "global_step": 57488, "epoch": 1368} {"train_loss": -5.85447883605957, "global_step": 57489, "epoch": 1368} {"train_loss": -5.760262489318848, "global_step": 57490, "epoch": 1368} {"train_loss": -5.946059226989746, "global_step": 57491, "epoch": 1368} {"train_loss": -5.7153000831604, "global_step": 57492, "epoch": 1368} {"train_loss": -5.803569316864014, "global_step": 57493, "epoch": 1368} {"train_loss": -5.728579521179199, "global_step": 57494, "epoch": 1368} {"train_loss": -5.759761810302734, "global_step": 57495, "epoch": 1368} {"train_loss": -5.895520210266113, "global_step": 57496, "epoch": 1368} {"train_loss": -5.8522551740918844, "global_step": 57497, "epoch": 1368, "val_loss": 74721.640625} {"train_loss": -5.873932838439941, "global_step": 57498, "epoch": 1369} {"train_loss": -5.745214462280273, "global_step": 57499, "epoch": 1369} {"train_loss": -5.811373233795166, "global_step": 57500, "epoch": 1369} {"train_loss": -5.809081554412842, "global_step": 57501, "epoch": 1369} {"train_loss": -5.6803741455078125, "global_step": 57502, "epoch": 1369} {"train_loss": -5.704535484313965, "global_step": 57503, "epoch": 1369} {"train_loss": -5.892546653747559, "global_step": 57504, "epoch": 1369} {"train_loss": -5.816900730133057, "global_step": 57505, "epoch": 1369} {"train_loss": -5.8010711669921875, "global_step": 57506, "epoch": 1369} {"train_loss": -5.802439212799072, "global_step": 57507, "epoch": 1369} {"train_loss": -5.935647487640381, "global_step": 57508, "epoch": 1369} {"train_loss": -5.846779823303223, "global_step": 57509, "epoch": 1369} {"train_loss": -5.792729377746582, "global_step": 57510, "epoch": 1369} {"train_loss": -5.930280685424805, "global_step": 57511, "epoch": 1369} {"train_loss": -5.7482523918151855, "global_step": 57512, "epoch": 1369} {"train_loss": -5.7795634269714355, "global_step": 57513, "epoch": 1369} {"train_loss": -5.8162689208984375, "global_step": 57514, "epoch": 1369} {"train_loss": -5.759368896484375, "global_step": 57515, "epoch": 1369} {"train_loss": -5.855135440826416, "global_step": 57516, "epoch": 1369} {"train_loss": -5.796896457672119, "global_step": 57517, "epoch": 1369} {"train_loss": -5.852102279663086, "global_step": 57518, "epoch": 1369} {"train_loss": -5.795363903045654, "global_step": 57519, "epoch": 1369} {"train_loss": -5.9690656661987305, "global_step": 57520, "epoch": 1369} {"train_loss": -5.821249008178711, "global_step": 57521, "epoch": 1369} {"train_loss": -5.929710388183594, "global_step": 57522, "epoch": 1369} {"train_loss": -5.793310165405273, "global_step": 57523, "epoch": 1369} {"train_loss": -5.78885555267334, "global_step": 57524, "epoch": 1369} {"train_loss": -5.793461799621582, "global_step": 57525, "epoch": 1369} {"train_loss": -5.725239276885986, "global_step": 57526, "epoch": 1369} {"train_loss": -5.873029708862305, "global_step": 57527, "epoch": 1369} {"train_loss": -5.932167053222656, "global_step": 57528, "epoch": 1369} {"train_loss": -5.792004108428955, "global_step": 57529, "epoch": 1369} {"train_loss": -5.838263511657715, "global_step": 57530, "epoch": 1369} {"train_loss": -5.816298484802246, "global_step": 57531, "epoch": 1369} {"train_loss": -5.8751654624938965, "global_step": 57532, "epoch": 1369} {"train_loss": -5.861849784851074, "global_step": 57533, "epoch": 1369} {"train_loss": -5.805950164794922, "global_step": 57534, "epoch": 1369} {"train_loss": -5.787291526794434, "global_step": 57535, "epoch": 1369} {"train_loss": -5.935650825500488, "global_step": 57536, "epoch": 1369} {"train_loss": -5.765669822692871, "global_step": 57537, "epoch": 1369} {"train_loss": -5.833386421203613, "global_step": 57538, "epoch": 1369} {"train_loss": -5.824604624793643, "global_step": 57539, "epoch": 1369, "val_loss": 74208.46875} {"train_loss": -5.9381256103515625, "global_step": 57540, "epoch": 1370} {"train_loss": -5.648593902587891, "global_step": 57541, "epoch": 1370} {"train_loss": -5.854152679443359, "global_step": 57542, "epoch": 1370} {"train_loss": -5.827540397644043, "global_step": 57543, "epoch": 1370} {"train_loss": -5.96937370300293, "global_step": 57544, "epoch": 1370} {"train_loss": -5.879141330718994, "global_step": 57545, "epoch": 1370} {"train_loss": -5.839244842529297, "global_step": 57546, "epoch": 1370} {"train_loss": -5.870837211608887, "global_step": 57547, "epoch": 1370} {"train_loss": -5.785055160522461, "global_step": 57548, "epoch": 1370} {"train_loss": -5.8605804443359375, "global_step": 57549, "epoch": 1370} {"train_loss": -5.993133544921875, "global_step": 57550, "epoch": 1370} {"train_loss": -5.825287818908691, "global_step": 57551, "epoch": 1370} {"train_loss": -5.809872627258301, "global_step": 57552, "epoch": 1370} {"train_loss": -5.979846000671387, "global_step": 57553, "epoch": 1370} {"train_loss": -5.925800323486328, "global_step": 57554, "epoch": 1370} {"train_loss": -5.822968006134033, "global_step": 57555, "epoch": 1370} {"train_loss": -5.894492149353027, "global_step": 57556, "epoch": 1370} {"train_loss": -5.954507350921631, "global_step": 57557, "epoch": 1370} {"train_loss": -5.858523368835449, "global_step": 57558, "epoch": 1370} {"train_loss": -5.85344934463501, "global_step": 57559, "epoch": 1370} {"train_loss": -5.928257942199707, "global_step": 57560, "epoch": 1370} {"train_loss": -5.878618240356445, "global_step": 57561, "epoch": 1370} {"train_loss": -5.852028846740723, "global_step": 57562, "epoch": 1370} {"train_loss": -5.886821746826172, "global_step": 57563, "epoch": 1370} {"train_loss": -5.838644504547119, "global_step": 57564, "epoch": 1370} {"train_loss": -5.9146857261657715, "global_step": 57565, "epoch": 1370} {"train_loss": -5.765302658081055, "global_step": 57566, "epoch": 1370} {"train_loss": -5.875003814697266, "global_step": 57567, "epoch": 1370} {"train_loss": -5.66355562210083, "global_step": 57568, "epoch": 1370} {"train_loss": -5.869458198547363, "global_step": 57569, "epoch": 1370} {"train_loss": -5.877507209777832, "global_step": 57570, "epoch": 1370} {"train_loss": -5.912125110626221, "global_step": 57571, "epoch": 1370} {"train_loss": -5.870388984680176, "global_step": 57572, "epoch": 1370} {"train_loss": -5.822205543518066, "global_step": 57573, "epoch": 1370} {"train_loss": -5.828188896179199, "global_step": 57574, "epoch": 1370} {"train_loss": -5.835638046264648, "global_step": 57575, "epoch": 1370} {"train_loss": -5.733974456787109, "global_step": 57576, "epoch": 1370} {"train_loss": -5.8590545654296875, "global_step": 57577, "epoch": 1370} {"train_loss": -5.811566352844238, "global_step": 57578, "epoch": 1370} {"train_loss": -5.811864852905273, "global_step": 57579, "epoch": 1370} {"train_loss": -5.850320816040039, "global_step": 57580, "epoch": 1370} {"train_loss": -5.853608653658912, "global_step": 57581, "epoch": 1370, "val_loss": 74282.2421875} {"train_loss": -5.88419246673584, "global_step": 57582, "epoch": 1371} {"train_loss": -5.853309631347656, "global_step": 57583, "epoch": 1371} {"train_loss": -5.760785102844238, "global_step": 57584, "epoch": 1371} {"train_loss": -5.934272766113281, "global_step": 57585, "epoch": 1371} {"train_loss": -5.822925567626953, "global_step": 57586, "epoch": 1371} {"train_loss": -5.767009735107422, "global_step": 57587, "epoch": 1371} {"train_loss": -5.903143882751465, "global_step": 57588, "epoch": 1371} {"train_loss": -5.865718841552734, "global_step": 57589, "epoch": 1371} {"train_loss": -5.674899578094482, "global_step": 57590, "epoch": 1371} {"train_loss": -5.734339237213135, "global_step": 57591, "epoch": 1371} {"train_loss": -5.7101030349731445, "global_step": 57592, "epoch": 1371} {"train_loss": -5.81048583984375, "global_step": 57593, "epoch": 1371} {"train_loss": -5.899523735046387, "global_step": 57594, "epoch": 1371} {"train_loss": -5.863131999969482, "global_step": 57595, "epoch": 1371} {"train_loss": -5.935232639312744, "global_step": 57596, "epoch": 1371} {"train_loss": -5.871796607971191, "global_step": 57597, "epoch": 1371} {"train_loss": -5.834683418273926, "global_step": 57598, "epoch": 1371} {"train_loss": -5.897944450378418, "global_step": 57599, "epoch": 1371} {"train_loss": -5.8396453857421875, "global_step": 57600, "epoch": 1371} {"train_loss": -5.919845104217529, "global_step": 57601, "epoch": 1371} {"train_loss": -5.950106620788574, "global_step": 57602, "epoch": 1371} {"train_loss": -5.887773513793945, "global_step": 57603, "epoch": 1371} {"train_loss": -5.879806041717529, "global_step": 57604, "epoch": 1371} {"train_loss": -5.712414264678955, "global_step": 57605, "epoch": 1371} {"train_loss": -5.9370012283325195, "global_step": 57606, "epoch": 1371} {"train_loss": -5.79338264465332, "global_step": 57607, "epoch": 1371} {"train_loss": -5.776665687561035, "global_step": 57608, "epoch": 1371} {"train_loss": -5.915082931518555, "global_step": 57609, "epoch": 1371} {"train_loss": -5.849968910217285, "global_step": 57610, "epoch": 1371} {"train_loss": -5.899119853973389, "global_step": 57611, "epoch": 1371} {"train_loss": -5.813057899475098, "global_step": 57612, "epoch": 1371} {"train_loss": -5.771394729614258, "global_step": 57613, "epoch": 1371} {"train_loss": -5.829954147338867, "global_step": 57614, "epoch": 1371} {"train_loss": -5.773731708526611, "global_step": 57615, "epoch": 1371} {"train_loss": -5.922257423400879, "global_step": 57616, "epoch": 1371} {"train_loss": -5.815645217895508, "global_step": 57617, "epoch": 1371} {"train_loss": -5.72511100769043, "global_step": 57618, "epoch": 1371} {"train_loss": -5.815858840942383, "global_step": 57619, "epoch": 1371} {"train_loss": -5.700411796569824, "global_step": 57620, "epoch": 1371} {"train_loss": -5.810956954956055, "global_step": 57621, "epoch": 1371} {"train_loss": -5.941690444946289, "global_step": 57622, "epoch": 1371} {"train_loss": -5.8377647286369685, "global_step": 57623, "epoch": 1371, "val_loss": 74619.359375} {"train_loss": -5.8170576095581055, "global_step": 57624, "epoch": 1372} {"train_loss": -5.754240989685059, "global_step": 57625, "epoch": 1372} {"train_loss": -5.822853088378906, "global_step": 57626, "epoch": 1372} {"train_loss": -5.889622688293457, "global_step": 57627, "epoch": 1372} {"train_loss": -5.84303617477417, "global_step": 57628, "epoch": 1372} {"train_loss": -5.967425346374512, "global_step": 57629, "epoch": 1372} {"train_loss": -5.7693328857421875, "global_step": 57630, "epoch": 1372} {"train_loss": -5.803866386413574, "global_step": 57631, "epoch": 1372} {"train_loss": -5.8083882331848145, "global_step": 57632, "epoch": 1372} {"train_loss": -5.921300888061523, "global_step": 57633, "epoch": 1372} {"train_loss": -5.945979118347168, "global_step": 57634, "epoch": 1372} {"train_loss": -5.766213893890381, "global_step": 57635, "epoch": 1372} {"train_loss": -5.790019512176514, "global_step": 57636, "epoch": 1372} {"train_loss": -5.8524932861328125, "global_step": 57637, "epoch": 1372} {"train_loss": -5.918918609619141, "global_step": 57638, "epoch": 1372} {"train_loss": -5.893813133239746, "global_step": 57639, "epoch": 1372} {"train_loss": -5.913904666900635, "global_step": 57640, "epoch": 1372} {"train_loss": -5.7954816818237305, "global_step": 57641, "epoch": 1372} {"train_loss": -5.947136878967285, "global_step": 57642, "epoch": 1372} {"train_loss": -5.874972820281982, "global_step": 57643, "epoch": 1372} {"train_loss": -5.881436347961426, "global_step": 57644, "epoch": 1372} {"train_loss": -5.932482719421387, "global_step": 57645, "epoch": 1372} {"train_loss": -5.868905544281006, "global_step": 57646, "epoch": 1372} {"train_loss": -5.8879170417785645, "global_step": 57647, "epoch": 1372} {"train_loss": -5.925776481628418, "global_step": 57648, "epoch": 1372} {"train_loss": -5.894763946533203, "global_step": 57649, "epoch": 1372} {"train_loss": -5.904658317565918, "global_step": 57650, "epoch": 1372} {"train_loss": -5.843319892883301, "global_step": 57651, "epoch": 1372} {"train_loss": -5.932761192321777, "global_step": 57652, "epoch": 1372} {"train_loss": -5.810547828674316, "global_step": 57653, "epoch": 1372} {"train_loss": -5.863609790802002, "global_step": 57654, "epoch": 1372} {"train_loss": -5.827692031860352, "global_step": 57655, "epoch": 1372} {"train_loss": -5.930298805236816, "global_step": 57656, "epoch": 1372} {"train_loss": -5.735982894897461, "global_step": 57657, "epoch": 1372} {"train_loss": -5.965237617492676, "global_step": 57658, "epoch": 1372} {"train_loss": -5.958601951599121, "global_step": 57659, "epoch": 1372} {"train_loss": -5.953512668609619, "global_step": 57660, "epoch": 1372} {"train_loss": -5.88284969329834, "global_step": 57661, "epoch": 1372} {"train_loss": -5.958499431610107, "global_step": 57662, "epoch": 1372} {"train_loss": -5.7773942947387695, "global_step": 57663, "epoch": 1372} {"train_loss": -5.936032772064209, "global_step": 57664, "epoch": 1372} {"train_loss": -5.871056409109206, "global_step": 57665, "epoch": 1372, "val_loss": 74667.4453125} {"train_loss": -5.805200576782227, "global_step": 57666, "epoch": 1373} {"train_loss": -5.692983627319336, "global_step": 57667, "epoch": 1373} {"train_loss": -5.79811954498291, "global_step": 57668, "epoch": 1373} {"train_loss": -5.862215995788574, "global_step": 57669, "epoch": 1373} {"train_loss": -5.783341407775879, "global_step": 57670, "epoch": 1373} {"train_loss": -5.791027069091797, "global_step": 57671, "epoch": 1373} {"train_loss": -5.8247761726379395, "global_step": 57672, "epoch": 1373} {"train_loss": -5.88961124420166, "global_step": 57673, "epoch": 1373} {"train_loss": -5.811819076538086, "global_step": 57674, "epoch": 1373} {"train_loss": -5.6625566482543945, "global_step": 57675, "epoch": 1373} {"train_loss": -5.922524929046631, "global_step": 57676, "epoch": 1373} {"train_loss": -5.845290184020996, "global_step": 57677, "epoch": 1373} {"train_loss": -5.964824199676514, "global_step": 57678, "epoch": 1373} {"train_loss": -5.86623477935791, "global_step": 57679, "epoch": 1373} {"train_loss": -5.834541320800781, "global_step": 57680, "epoch": 1373} {"train_loss": -6.0977783203125, "global_step": 57681, "epoch": 1373} {"train_loss": -5.931704998016357, "global_step": 57682, "epoch": 1373} {"train_loss": -5.935277938842773, "global_step": 57683, "epoch": 1373} {"train_loss": -5.848960876464844, "global_step": 57684, "epoch": 1373} {"train_loss": -5.844357013702393, "global_step": 57685, "epoch": 1373} {"train_loss": -5.9457244873046875, "global_step": 57686, "epoch": 1373} {"train_loss": -5.810459136962891, "global_step": 57687, "epoch": 1373} {"train_loss": -5.904491424560547, "global_step": 57688, "epoch": 1373} {"train_loss": -5.795788764953613, "global_step": 57689, "epoch": 1373} {"train_loss": -5.8792219161987305, "global_step": 57690, "epoch": 1373} {"train_loss": -5.97404146194458, "global_step": 57691, "epoch": 1373} {"train_loss": -5.823204517364502, "global_step": 57692, "epoch": 1373} {"train_loss": -5.8151655197143555, "global_step": 57693, "epoch": 1373} {"train_loss": -5.989597320556641, "global_step": 57694, "epoch": 1373} {"train_loss": -5.888430595397949, "global_step": 57695, "epoch": 1373} {"train_loss": -5.876433372497559, "global_step": 57696, "epoch": 1373} {"train_loss": -5.9152326583862305, "global_step": 57697, "epoch": 1373} {"train_loss": -5.890895366668701, "global_step": 57698, "epoch": 1373} {"train_loss": -5.920863151550293, "global_step": 57699, "epoch": 1373} {"train_loss": -6.026854515075684, "global_step": 57700, "epoch": 1373} {"train_loss": -5.973605155944824, "global_step": 57701, "epoch": 1373} {"train_loss": -5.858001708984375, "global_step": 57702, "epoch": 1373} {"train_loss": -5.905359268188477, "global_step": 57703, "epoch": 1373} {"train_loss": -5.6920342445373535, "global_step": 57704, "epoch": 1373} {"train_loss": -5.8916826248168945, "global_step": 57705, "epoch": 1373} {"train_loss": -5.882514476776123, "global_step": 57706, "epoch": 1373} {"train_loss": -5.867926415942964, "global_step": 57707, "epoch": 1373, "val_loss": 74388.859375} {"train_loss": -5.92657470703125, "global_step": 57708, "epoch": 1374} {"train_loss": -5.864360809326172, "global_step": 57709, "epoch": 1374} {"train_loss": -5.822861194610596, "global_step": 57710, "epoch": 1374} {"train_loss": -5.80601692199707, "global_step": 57711, "epoch": 1374} {"train_loss": -5.855379104614258, "global_step": 57712, "epoch": 1374} {"train_loss": -5.959159851074219, "global_step": 57713, "epoch": 1374} {"train_loss": -5.726016044616699, "global_step": 57714, "epoch": 1374} {"train_loss": -5.836188316345215, "global_step": 57715, "epoch": 1374} {"train_loss": -5.867148399353027, "global_step": 57716, "epoch": 1374} {"train_loss": -5.835665702819824, "global_step": 57717, "epoch": 1374} {"train_loss": -5.904702186584473, "global_step": 57718, "epoch": 1374} {"train_loss": -5.911243438720703, "global_step": 57719, "epoch": 1374} {"train_loss": -6.00537109375, "global_step": 57720, "epoch": 1374} {"train_loss": -5.949592590332031, "global_step": 57721, "epoch": 1374} {"train_loss": -5.796878814697266, "global_step": 57722, "epoch": 1374} {"train_loss": -5.822864055633545, "global_step": 57723, "epoch": 1374} {"train_loss": -5.825818061828613, "global_step": 57724, "epoch": 1374} {"train_loss": -5.722838401794434, "global_step": 57725, "epoch": 1374} {"train_loss": -5.73399543762207, "global_step": 57726, "epoch": 1374} {"train_loss": -5.873140335083008, "global_step": 57727, "epoch": 1374} {"train_loss": -5.727024555206299, "global_step": 57728, "epoch": 1374} {"train_loss": -5.903632164001465, "global_step": 57729, "epoch": 1374} {"train_loss": -5.722568511962891, "global_step": 57730, "epoch": 1374} {"train_loss": -5.7173237800598145, "global_step": 57731, "epoch": 1374} {"train_loss": -5.778932571411133, "global_step": 57732, "epoch": 1374} {"train_loss": -5.762157917022705, "global_step": 57733, "epoch": 1374} {"train_loss": -5.575878620147705, "global_step": 57734, "epoch": 1374} {"train_loss": -5.824847221374512, "global_step": 57735, "epoch": 1374} {"train_loss": -5.681518077850342, "global_step": 57736, "epoch": 1374} {"train_loss": -5.796676158905029, "global_step": 57737, "epoch": 1374} {"train_loss": -5.778648376464844, "global_step": 57738, "epoch": 1374} {"train_loss": -5.850711822509766, "global_step": 57739, "epoch": 1374} {"train_loss": -5.722417831420898, "global_step": 57740, "epoch": 1374} {"train_loss": -5.917617321014404, "global_step": 57741, "epoch": 1374} {"train_loss": -5.753525733947754, "global_step": 57742, "epoch": 1374} {"train_loss": -5.746111869812012, "global_step": 57743, "epoch": 1374} {"train_loss": -5.802351951599121, "global_step": 57744, "epoch": 1374} {"train_loss": -6.011005878448486, "global_step": 57745, "epoch": 1374} {"train_loss": -5.8507771492004395, "global_step": 57746, "epoch": 1374} {"train_loss": -5.929210662841797, "global_step": 57747, "epoch": 1374} {"train_loss": -5.770200729370117, "global_step": 57748, "epoch": 1374} {"train_loss": -5.823871453603108, "global_step": 57749, "epoch": 1374, "val_loss": 74683.734375} {"train_loss": -5.838618278503418, "global_step": 57750, "epoch": 1375} {"train_loss": -5.873293399810791, "global_step": 57751, "epoch": 1375} {"train_loss": -5.7678751945495605, "global_step": 57752, "epoch": 1375} {"train_loss": -5.822574615478516, "global_step": 57753, "epoch": 1375} {"train_loss": -5.973625659942627, "global_step": 57754, "epoch": 1375} {"train_loss": -5.8084635734558105, "global_step": 57755, "epoch": 1375} {"train_loss": -5.90676212310791, "global_step": 57756, "epoch": 1375} {"train_loss": -5.928043365478516, "global_step": 57757, "epoch": 1375} {"train_loss": -5.892086982727051, "global_step": 57758, "epoch": 1375} {"train_loss": -5.902935981750488, "global_step": 57759, "epoch": 1375} {"train_loss": -5.890571117401123, "global_step": 57760, "epoch": 1375} {"train_loss": -5.931766986846924, "global_step": 57761, "epoch": 1375} {"train_loss": -5.96611213684082, "global_step": 57762, "epoch": 1375} {"train_loss": -5.848209381103516, "global_step": 57763, "epoch": 1375} {"train_loss": -5.871077537536621, "global_step": 57764, "epoch": 1375} {"train_loss": -5.8611555099487305, "global_step": 57765, "epoch": 1375} {"train_loss": -5.897546768188477, "global_step": 57766, "epoch": 1375} {"train_loss": -5.878780364990234, "global_step": 57767, "epoch": 1375} {"train_loss": -5.829751968383789, "global_step": 57768, "epoch": 1375} {"train_loss": -5.995158672332764, "global_step": 57769, "epoch": 1375} {"train_loss": -5.9256181716918945, "global_step": 57770, "epoch": 1375} {"train_loss": -5.901244163513184, "global_step": 57771, "epoch": 1375} {"train_loss": -5.887603759765625, "global_step": 57772, "epoch": 1375} {"train_loss": -5.8995513916015625, "global_step": 57773, "epoch": 1375} {"train_loss": -5.869471549987793, "global_step": 57774, "epoch": 1375} {"train_loss": -5.862127304077148, "global_step": 57775, "epoch": 1375} {"train_loss": -5.836040019989014, "global_step": 57776, "epoch": 1375} {"train_loss": -5.750740051269531, "global_step": 57777, "epoch": 1375} {"train_loss": -5.882808685302734, "global_step": 57778, "epoch": 1375} {"train_loss": -5.755519866943359, "global_step": 57779, "epoch": 1375} {"train_loss": -5.938651084899902, "global_step": 57780, "epoch": 1375} {"train_loss": -5.90684700012207, "global_step": 57781, "epoch": 1375} {"train_loss": -5.831147193908691, "global_step": 57782, "epoch": 1375} {"train_loss": -5.880974769592285, "global_step": 57783, "epoch": 1375} {"train_loss": -5.910315990447998, "global_step": 57784, "epoch": 1375} {"train_loss": -5.889423847198486, "global_step": 57785, "epoch": 1375} {"train_loss": -5.8748016357421875, "global_step": 57786, "epoch": 1375} {"train_loss": -5.984994888305664, "global_step": 57787, "epoch": 1375} {"train_loss": -5.854748249053955, "global_step": 57788, "epoch": 1375} {"train_loss": -5.772672653198242, "global_step": 57789, "epoch": 1375} {"train_loss": -5.966141700744629, "global_step": 57790, "epoch": 1375} {"train_loss": -5.878335328329177, "global_step": 57791, "epoch": 1375, "val_loss": 74400.640625} {"train_loss": -5.855515480041504, "global_step": 57792, "epoch": 1376} {"train_loss": -5.7223100662231445, "global_step": 57793, "epoch": 1376} {"train_loss": -5.908884048461914, "global_step": 57794, "epoch": 1376} {"train_loss": -5.9483442306518555, "global_step": 57795, "epoch": 1376} {"train_loss": -5.845932960510254, "global_step": 57796, "epoch": 1376} {"train_loss": -5.840442657470703, "global_step": 57797, "epoch": 1376} {"train_loss": -5.925803184509277, "global_step": 57798, "epoch": 1376} {"train_loss": -5.855180263519287, "global_step": 57799, "epoch": 1376} {"train_loss": -5.772265434265137, "global_step": 57800, "epoch": 1376} {"train_loss": -5.8298492431640625, "global_step": 57801, "epoch": 1376} {"train_loss": -5.878878593444824, "global_step": 57802, "epoch": 1376} {"train_loss": -5.783171653747559, "global_step": 57803, "epoch": 1376} {"train_loss": -5.833037376403809, "global_step": 57804, "epoch": 1376} {"train_loss": -5.865106105804443, "global_step": 57805, "epoch": 1376} {"train_loss": -5.975147724151611, "global_step": 57806, "epoch": 1376} {"train_loss": -5.84477424621582, "global_step": 57807, "epoch": 1376} {"train_loss": -5.745250701904297, "global_step": 57808, "epoch": 1376} {"train_loss": -5.8964691162109375, "global_step": 57809, "epoch": 1376} {"train_loss": -5.790531635284424, "global_step": 57810, "epoch": 1376} {"train_loss": -5.903018951416016, "global_step": 57811, "epoch": 1376} {"train_loss": -5.7494683265686035, "global_step": 57812, "epoch": 1376} {"train_loss": -5.675006866455078, "global_step": 57813, "epoch": 1376} {"train_loss": -5.988749980926514, "global_step": 57814, "epoch": 1376} {"train_loss": -5.716750144958496, "global_step": 57815, "epoch": 1376} {"train_loss": -5.804584503173828, "global_step": 57816, "epoch": 1376} {"train_loss": -5.826440811157227, "global_step": 57817, "epoch": 1376} {"train_loss": -5.721903324127197, "global_step": 57818, "epoch": 1376} {"train_loss": -5.935126304626465, "global_step": 57819, "epoch": 1376} {"train_loss": -5.907070159912109, "global_step": 57820, "epoch": 1376} {"train_loss": -5.709654808044434, "global_step": 57821, "epoch": 1376} {"train_loss": -5.8174638748168945, "global_step": 57822, "epoch": 1376} {"train_loss": -5.780353546142578, "global_step": 57823, "epoch": 1376} {"train_loss": -5.866684436798096, "global_step": 57824, "epoch": 1376} {"train_loss": -5.776273250579834, "global_step": 57825, "epoch": 1376} {"train_loss": -5.855207443237305, "global_step": 57826, "epoch": 1376} {"train_loss": -5.814897060394287, "global_step": 57827, "epoch": 1376} {"train_loss": -5.905266761779785, "global_step": 57828, "epoch": 1376} {"train_loss": -5.752256393432617, "global_step": 57829, "epoch": 1376} {"train_loss": -5.88735294342041, "global_step": 57830, "epoch": 1376} {"train_loss": -5.862264633178711, "global_step": 57831, "epoch": 1376} {"train_loss": -5.857424736022949, "global_step": 57832, "epoch": 1376} {"train_loss": -5.835339761915661, "global_step": 57833, "epoch": 1376, "val_loss": 74786.953125} {"train_loss": -5.768653869628906, "global_step": 57834, "epoch": 1377} {"train_loss": -5.853187561035156, "global_step": 57835, "epoch": 1377} {"train_loss": -5.872992515563965, "global_step": 57836, "epoch": 1377} {"train_loss": -5.879605293273926, "global_step": 57837, "epoch": 1377} {"train_loss": -5.826152801513672, "global_step": 57838, "epoch": 1377} {"train_loss": -5.837566375732422, "global_step": 57839, "epoch": 1377} {"train_loss": -5.891547203063965, "global_step": 57840, "epoch": 1377} {"train_loss": -5.903975486755371, "global_step": 57841, "epoch": 1377} {"train_loss": -5.835709571838379, "global_step": 57842, "epoch": 1377} {"train_loss": -5.894678115844727, "global_step": 57843, "epoch": 1377} {"train_loss": -6.0181565284729, "global_step": 57844, "epoch": 1377} {"train_loss": -5.900875091552734, "global_step": 57845, "epoch": 1377} {"train_loss": -5.951406478881836, "global_step": 57846, "epoch": 1377} {"train_loss": -5.826164722442627, "global_step": 57847, "epoch": 1377} {"train_loss": -5.879347801208496, "global_step": 57848, "epoch": 1377} {"train_loss": -5.809764862060547, "global_step": 57849, "epoch": 1377} {"train_loss": -5.874302864074707, "global_step": 57850, "epoch": 1377} {"train_loss": -5.868983745574951, "global_step": 57851, "epoch": 1377} {"train_loss": -5.809671401977539, "global_step": 57852, "epoch": 1377} {"train_loss": -5.695440769195557, "global_step": 57853, "epoch": 1377} {"train_loss": -5.8093976974487305, "global_step": 57854, "epoch": 1377} {"train_loss": -5.87406587600708, "global_step": 57855, "epoch": 1377} {"train_loss": -5.798701286315918, "global_step": 57856, "epoch": 1377} {"train_loss": -6.023727893829346, "global_step": 57857, "epoch": 1377} {"train_loss": -5.782242774963379, "global_step": 57858, "epoch": 1377} {"train_loss": -5.779469966888428, "global_step": 57859, "epoch": 1377} {"train_loss": -5.755033016204834, "global_step": 57860, "epoch": 1377} {"train_loss": -5.832859039306641, "global_step": 57861, "epoch": 1377} {"train_loss": -5.854894161224365, "global_step": 57862, "epoch": 1377} {"train_loss": -5.92457389831543, "global_step": 57863, "epoch": 1377} {"train_loss": -5.865569591522217, "global_step": 57864, "epoch": 1377} {"train_loss": -5.852530479431152, "global_step": 57865, "epoch": 1377} {"train_loss": -5.900686264038086, "global_step": 57866, "epoch": 1377} {"train_loss": -5.920148849487305, "global_step": 57867, "epoch": 1377} {"train_loss": -6.023318290710449, "global_step": 57868, "epoch": 1377} {"train_loss": -6.003963470458984, "global_step": 57869, "epoch": 1377} {"train_loss": -5.912385940551758, "global_step": 57870, "epoch": 1377} {"train_loss": -5.896320819854736, "global_step": 57871, "epoch": 1377} {"train_loss": -5.923841953277588, "global_step": 57872, "epoch": 1377} {"train_loss": -5.921006679534912, "global_step": 57873, "epoch": 1377} {"train_loss": -6.0755391120910645, "global_step": 57874, "epoch": 1377} {"train_loss": -5.878127450034732, "global_step": 57875, "epoch": 1377, "val_loss": 74221.21875} {"train_loss": -5.891898155212402, "global_step": 57876, "epoch": 1378} {"train_loss": -5.898806571960449, "global_step": 57877, "epoch": 1378} {"train_loss": -5.822253227233887, "global_step": 57878, "epoch": 1378} {"train_loss": -5.858290672302246, "global_step": 57879, "epoch": 1378} {"train_loss": -5.92464542388916, "global_step": 57880, "epoch": 1378} {"train_loss": -5.942392349243164, "global_step": 57881, "epoch": 1378} {"train_loss": -5.827847003936768, "global_step": 57882, "epoch": 1378} {"train_loss": -5.941997051239014, "global_step": 57883, "epoch": 1378} {"train_loss": -5.916426658630371, "global_step": 57884, "epoch": 1378} {"train_loss": -5.918590545654297, "global_step": 57885, "epoch": 1378} {"train_loss": -5.807730197906494, "global_step": 57886, "epoch": 1378} {"train_loss": -5.919928550720215, "global_step": 57887, "epoch": 1378} {"train_loss": -5.8381781578063965, "global_step": 57888, "epoch": 1378} {"train_loss": -5.966740131378174, "global_step": 57889, "epoch": 1378} {"train_loss": -5.857524394989014, "global_step": 57890, "epoch": 1378} {"train_loss": -5.815879821777344, "global_step": 57891, "epoch": 1378} {"train_loss": -5.979250907897949, "global_step": 57892, "epoch": 1378} {"train_loss": -5.890606880187988, "global_step": 57893, "epoch": 1378} {"train_loss": -5.9421916007995605, "global_step": 57894, "epoch": 1378} {"train_loss": -5.931339263916016, "global_step": 57895, "epoch": 1378} {"train_loss": -5.942028999328613, "global_step": 57896, "epoch": 1378} {"train_loss": -5.90889310836792, "global_step": 57897, "epoch": 1378} {"train_loss": -5.911643981933594, "global_step": 57898, "epoch": 1378} {"train_loss": -5.869137287139893, "global_step": 57899, "epoch": 1378} {"train_loss": -5.791871070861816, "global_step": 57900, "epoch": 1378} {"train_loss": -5.808444976806641, "global_step": 57901, "epoch": 1378} {"train_loss": -5.921147346496582, "global_step": 57902, "epoch": 1378} {"train_loss": -5.82755708694458, "global_step": 57903, "epoch": 1378} {"train_loss": -5.895779132843018, "global_step": 57904, "epoch": 1378} {"train_loss": -5.879956245422363, "global_step": 57905, "epoch": 1378} {"train_loss": -5.833619117736816, "global_step": 57906, "epoch": 1378} {"train_loss": -5.942790985107422, "global_step": 57907, "epoch": 1378} {"train_loss": -5.816473007202148, "global_step": 57908, "epoch": 1378} {"train_loss": -6.011743545532227, "global_step": 57909, "epoch": 1378} {"train_loss": -5.868891716003418, "global_step": 57910, "epoch": 1378} {"train_loss": -5.832039833068848, "global_step": 57911, "epoch": 1378} {"train_loss": -5.8950042724609375, "global_step": 57912, "epoch": 1378} {"train_loss": -5.864457607269287, "global_step": 57913, "epoch": 1378} {"train_loss": -5.906250953674316, "global_step": 57914, "epoch": 1378} {"train_loss": -5.831056594848633, "global_step": 57915, "epoch": 1378} {"train_loss": -5.851285934448242, "global_step": 57916, "epoch": 1378} {"train_loss": -5.884142058236258, "global_step": 57917, "epoch": 1378, "val_loss": 74190.3359375} {"train_loss": -5.924341201782227, "global_step": 57918, "epoch": 1379} {"train_loss": -5.788393497467041, "global_step": 57919, "epoch": 1379} {"train_loss": -5.926278591156006, "global_step": 57920, "epoch": 1379} {"train_loss": -5.855269432067871, "global_step": 57921, "epoch": 1379} {"train_loss": -5.809842586517334, "global_step": 57922, "epoch": 1379} {"train_loss": -5.903613090515137, "global_step": 57923, "epoch": 1379} {"train_loss": -5.915807247161865, "global_step": 57924, "epoch": 1379} {"train_loss": -5.884784698486328, "global_step": 57925, "epoch": 1379} {"train_loss": -5.931247711181641, "global_step": 57926, "epoch": 1379} {"train_loss": -5.882386207580566, "global_step": 57927, "epoch": 1379} {"train_loss": -5.911632537841797, "global_step": 57928, "epoch": 1379} {"train_loss": -5.7749834060668945, "global_step": 57929, "epoch": 1379} {"train_loss": -5.820687294006348, "global_step": 57930, "epoch": 1379} {"train_loss": -5.914610385894775, "global_step": 57931, "epoch": 1379} {"train_loss": -5.803607940673828, "global_step": 57932, "epoch": 1379} {"train_loss": -5.8876423835754395, "global_step": 57933, "epoch": 1379} {"train_loss": -5.813640117645264, "global_step": 57934, "epoch": 1379} {"train_loss": -5.886821269989014, "global_step": 57935, "epoch": 1379} {"train_loss": -5.866990089416504, "global_step": 57936, "epoch": 1379} {"train_loss": -6.072863578796387, "global_step": 57937, "epoch": 1379} {"train_loss": -5.969522476196289, "global_step": 57938, "epoch": 1379} {"train_loss": -5.759767055511475, "global_step": 57939, "epoch": 1379} {"train_loss": -5.892140865325928, "global_step": 57940, "epoch": 1379} {"train_loss": -5.896299362182617, "global_step": 57941, "epoch": 1379} {"train_loss": -5.753434181213379, "global_step": 57942, "epoch": 1379} {"train_loss": -5.963204860687256, "global_step": 57943, "epoch": 1379} {"train_loss": -5.931060791015625, "global_step": 57944, "epoch": 1379} {"train_loss": -5.960453033447266, "global_step": 57945, "epoch": 1379} {"train_loss": -5.905609607696533, "global_step": 57946, "epoch": 1379} {"train_loss": -5.833443641662598, "global_step": 57947, "epoch": 1379} {"train_loss": -5.826690673828125, "global_step": 57948, "epoch": 1379} {"train_loss": -5.845251560211182, "global_step": 57949, "epoch": 1379} {"train_loss": -5.826169013977051, "global_step": 57950, "epoch": 1379} {"train_loss": -5.926885604858398, "global_step": 57951, "epoch": 1379} {"train_loss": -5.802031517028809, "global_step": 57952, "epoch": 1379} {"train_loss": -5.937045574188232, "global_step": 57953, "epoch": 1379} {"train_loss": -5.911079406738281, "global_step": 57954, "epoch": 1379} {"train_loss": -5.899972915649414, "global_step": 57955, "epoch": 1379} {"train_loss": -5.8297882080078125, "global_step": 57956, "epoch": 1379} {"train_loss": -5.918879508972168, "global_step": 57957, "epoch": 1379} {"train_loss": -5.824800491333008, "global_step": 57958, "epoch": 1379} {"train_loss": -5.875609817959013, "global_step": 57959, "epoch": 1379, "val_loss": 74402.140625} {"train_loss": -5.911703109741211, "global_step": 57960, "epoch": 1380} {"train_loss": -5.915826797485352, "global_step": 57961, "epoch": 1380} {"train_loss": -5.8854265213012695, "global_step": 57962, "epoch": 1380} {"train_loss": -5.881677627563477, "global_step": 57963, "epoch": 1380} {"train_loss": -5.8744096755981445, "global_step": 57964, "epoch": 1380} {"train_loss": -5.806713104248047, "global_step": 57965, "epoch": 1380} {"train_loss": -5.971858978271484, "global_step": 57966, "epoch": 1380} {"train_loss": -5.931231498718262, "global_step": 57967, "epoch": 1380} {"train_loss": -5.99782133102417, "global_step": 57968, "epoch": 1380} {"train_loss": -5.841968536376953, "global_step": 57969, "epoch": 1380} {"train_loss": -5.813482284545898, "global_step": 57970, "epoch": 1380} {"train_loss": -5.899028778076172, "global_step": 57971, "epoch": 1380} {"train_loss": -5.860175609588623, "global_step": 57972, "epoch": 1380} {"train_loss": -5.87303352355957, "global_step": 57973, "epoch": 1380} {"train_loss": -5.852212429046631, "global_step": 57974, "epoch": 1380} {"train_loss": -5.901024341583252, "global_step": 57975, "epoch": 1380} {"train_loss": -5.78482723236084, "global_step": 57976, "epoch": 1380} {"train_loss": -5.843351364135742, "global_step": 57977, "epoch": 1380} {"train_loss": -5.7668609619140625, "global_step": 57978, "epoch": 1380} {"train_loss": -5.93538761138916, "global_step": 57979, "epoch": 1380} {"train_loss": -5.882601737976074, "global_step": 57980, "epoch": 1380} {"train_loss": -5.9233245849609375, "global_step": 57981, "epoch": 1380} {"train_loss": -5.852277755737305, "global_step": 57982, "epoch": 1380} {"train_loss": -5.890753269195557, "global_step": 57983, "epoch": 1380} {"train_loss": -5.880581855773926, "global_step": 57984, "epoch": 1380} {"train_loss": -5.795414924621582, "global_step": 57985, "epoch": 1380} {"train_loss": -5.775105953216553, "global_step": 57986, "epoch": 1380} {"train_loss": -5.8424811363220215, "global_step": 57987, "epoch": 1380} {"train_loss": -5.974579334259033, "global_step": 57988, "epoch": 1380} {"train_loss": -5.719295501708984, "global_step": 57989, "epoch": 1380} {"train_loss": -5.821262359619141, "global_step": 57990, "epoch": 1380} {"train_loss": -5.821861267089844, "global_step": 57991, "epoch": 1380} {"train_loss": -5.846073627471924, "global_step": 57992, "epoch": 1380} {"train_loss": -5.8216447830200195, "global_step": 57993, "epoch": 1380} {"train_loss": -5.814027786254883, "global_step": 57994, "epoch": 1380} {"train_loss": -5.977198600769043, "global_step": 57995, "epoch": 1380} {"train_loss": -5.7953386306762695, "global_step": 57996, "epoch": 1380} {"train_loss": -5.879730701446533, "global_step": 57997, "epoch": 1380} {"train_loss": -5.799989700317383, "global_step": 57998, "epoch": 1380} {"train_loss": -5.733144283294678, "global_step": 57999, "epoch": 1380} {"train_loss": -5.947854042053223, "global_step": 58000, "epoch": 1380} {"train_loss": -5.859071935926165, "global_step": 58001, "epoch": 1380, "val_loss": 74528.0859375} {"train_loss": -5.96504020690918, "global_step": 58002, "epoch": 1381} {"train_loss": -5.821147441864014, "global_step": 58003, "epoch": 1381} {"train_loss": -5.726470947265625, "global_step": 58004, "epoch": 1381} {"train_loss": -5.813102722167969, "global_step": 58005, "epoch": 1381} {"train_loss": -5.7715325355529785, "global_step": 58006, "epoch": 1381} {"train_loss": -5.862722396850586, "global_step": 58007, "epoch": 1381} {"train_loss": -5.874819755554199, "global_step": 58008, "epoch": 1381} {"train_loss": -5.710363388061523, "global_step": 58009, "epoch": 1381} {"train_loss": -5.916242599487305, "global_step": 58010, "epoch": 1381} {"train_loss": -5.738628387451172, "global_step": 58011, "epoch": 1381} {"train_loss": -5.925622463226318, "global_step": 58012, "epoch": 1381} {"train_loss": -5.770111083984375, "global_step": 58013, "epoch": 1381} {"train_loss": -5.770798683166504, "global_step": 58014, "epoch": 1381} {"train_loss": -5.864769458770752, "global_step": 58015, "epoch": 1381} {"train_loss": -5.845888137817383, "global_step": 58016, "epoch": 1381} {"train_loss": -5.868721961975098, "global_step": 58017, "epoch": 1381} {"train_loss": -5.916254043579102, "global_step": 58018, "epoch": 1381} {"train_loss": -5.803189754486084, "global_step": 58019, "epoch": 1381} {"train_loss": -5.822356224060059, "global_step": 58020, "epoch": 1381} {"train_loss": -5.928861618041992, "global_step": 58021, "epoch": 1381} {"train_loss": -5.9059319496154785, "global_step": 58022, "epoch": 1381} {"train_loss": -5.834535121917725, "global_step": 58023, "epoch": 1381} {"train_loss": -6.012212753295898, "global_step": 58024, "epoch": 1381} {"train_loss": -5.9403815269470215, "global_step": 58025, "epoch": 1381} {"train_loss": -5.821481704711914, "global_step": 58026, "epoch": 1381} {"train_loss": -5.929826736450195, "global_step": 58027, "epoch": 1381} {"train_loss": -6.047045707702637, "global_step": 58028, "epoch": 1381} {"train_loss": -5.937256336212158, "global_step": 58029, "epoch": 1381} {"train_loss": -6.049060344696045, "global_step": 58030, "epoch": 1381} {"train_loss": -5.851974010467529, "global_step": 58031, "epoch": 1381} {"train_loss": -5.887688159942627, "global_step": 58032, "epoch": 1381} {"train_loss": -5.672398567199707, "global_step": 58033, "epoch": 1381} {"train_loss": -5.913215637207031, "global_step": 58034, "epoch": 1381} {"train_loss": -5.913853645324707, "global_step": 58035, "epoch": 1381} {"train_loss": -5.76181697845459, "global_step": 58036, "epoch": 1381} {"train_loss": -5.990396499633789, "global_step": 58037, "epoch": 1381} {"train_loss": -5.783262729644775, "global_step": 58038, "epoch": 1381} {"train_loss": -5.731110572814941, "global_step": 58039, "epoch": 1381} {"train_loss": -5.9283528327941895, "global_step": 58040, "epoch": 1381} {"train_loss": -5.870818138122559, "global_step": 58041, "epoch": 1381} {"train_loss": -5.846676826477051, "global_step": 58042, "epoch": 1381} {"train_loss": -5.85915173803057, "global_step": 58043, "epoch": 1381, "val_loss": 75062.2734375} {"train_loss": -5.666180610656738, "global_step": 58044, "epoch": 1382} {"train_loss": -5.8734540939331055, "global_step": 58045, "epoch": 1382} {"train_loss": -5.7647199630737305, "global_step": 58046, "epoch": 1382} {"train_loss": -5.714175701141357, "global_step": 58047, "epoch": 1382} {"train_loss": -5.92808723449707, "global_step": 58048, "epoch": 1382} {"train_loss": -5.67892599105835, "global_step": 58049, "epoch": 1382} {"train_loss": -5.883535385131836, "global_step": 58050, "epoch": 1382} {"train_loss": -5.8492431640625, "global_step": 58051, "epoch": 1382} {"train_loss": -5.764349937438965, "global_step": 58052, "epoch": 1382} {"train_loss": -5.902196884155273, "global_step": 58053, "epoch": 1382} {"train_loss": -5.836714267730713, "global_step": 58054, "epoch": 1382} {"train_loss": -5.734488487243652, "global_step": 58055, "epoch": 1382} {"train_loss": -5.801590919494629, "global_step": 58056, "epoch": 1382} {"train_loss": -5.788358688354492, "global_step": 58057, "epoch": 1382} {"train_loss": -5.815774917602539, "global_step": 58058, "epoch": 1382} {"train_loss": -5.745571136474609, "global_step": 58059, "epoch": 1382} {"train_loss": -6.006010055541992, "global_step": 58060, "epoch": 1382} {"train_loss": -5.740960121154785, "global_step": 58061, "epoch": 1382} {"train_loss": -5.836068153381348, "global_step": 58062, "epoch": 1382} {"train_loss": -5.763584136962891, "global_step": 58063, "epoch": 1382} {"train_loss": -5.876806259155273, "global_step": 58064, "epoch": 1382} {"train_loss": -5.785940170288086, "global_step": 58065, "epoch": 1382} {"train_loss": -5.933156490325928, "global_step": 58066, "epoch": 1382} {"train_loss": -5.95231819152832, "global_step": 58067, "epoch": 1382} {"train_loss": -5.839581489562988, "global_step": 58068, "epoch": 1382} {"train_loss": -5.823355197906494, "global_step": 58069, "epoch": 1382} {"train_loss": -5.858926773071289, "global_step": 58070, "epoch": 1382} {"train_loss": -5.95806884765625, "global_step": 58071, "epoch": 1382} {"train_loss": -5.869376182556152, "global_step": 58072, "epoch": 1382} {"train_loss": -5.820459842681885, "global_step": 58073, "epoch": 1382} {"train_loss": -5.795563220977783, "global_step": 58074, "epoch": 1382} {"train_loss": -5.746882915496826, "global_step": 58075, "epoch": 1382} {"train_loss": -5.955915927886963, "global_step": 58076, "epoch": 1382} {"train_loss": -5.918757438659668, "global_step": 58077, "epoch": 1382} {"train_loss": -5.945323944091797, "global_step": 58078, "epoch": 1382} {"train_loss": -5.913937568664551, "global_step": 58079, "epoch": 1382} {"train_loss": -5.80674934387207, "global_step": 58080, "epoch": 1382} {"train_loss": -5.859071731567383, "global_step": 58081, "epoch": 1382} {"train_loss": -5.966021537780762, "global_step": 58082, "epoch": 1382} {"train_loss": -5.876834869384766, "global_step": 58083, "epoch": 1382} {"train_loss": -5.828587055206299, "global_step": 58084, "epoch": 1382} {"train_loss": -5.83957534744626, "global_step": 58085, "epoch": 1382, "val_loss": 74683.3203125} {"train_loss": -5.856396198272705, "global_step": 58086, "epoch": 1383} {"train_loss": -5.881494998931885, "global_step": 58087, "epoch": 1383} {"train_loss": -6.006448745727539, "global_step": 58088, "epoch": 1383} {"train_loss": -5.862517356872559, "global_step": 58089, "epoch": 1383} {"train_loss": -5.8898820877075195, "global_step": 58090, "epoch": 1383} {"train_loss": -5.720798492431641, "global_step": 58091, "epoch": 1383} {"train_loss": -5.953364372253418, "global_step": 58092, "epoch": 1383} {"train_loss": -5.877531051635742, "global_step": 58093, "epoch": 1383} {"train_loss": -5.88236665725708, "global_step": 58094, "epoch": 1383} {"train_loss": -5.861105918884277, "global_step": 58095, "epoch": 1383} {"train_loss": -6.00192403793335, "global_step": 58096, "epoch": 1383} {"train_loss": -5.9191155433654785, "global_step": 58097, "epoch": 1383} {"train_loss": -5.906904220581055, "global_step": 58098, "epoch": 1383} {"train_loss": -5.999785423278809, "global_step": 58099, "epoch": 1383} {"train_loss": -6.071113586425781, "global_step": 58100, "epoch": 1383} {"train_loss": -5.875168800354004, "global_step": 58101, "epoch": 1383} {"train_loss": -5.934540271759033, "global_step": 58102, "epoch": 1383} {"train_loss": -5.865264415740967, "global_step": 58103, "epoch": 1383} {"train_loss": -6.024249076843262, "global_step": 58104, "epoch": 1383} {"train_loss": -5.867349624633789, "global_step": 58105, "epoch": 1383} {"train_loss": -5.92972469329834, "global_step": 58106, "epoch": 1383} {"train_loss": -5.814042091369629, "global_step": 58107, "epoch": 1383} {"train_loss": -5.902113914489746, "global_step": 58108, "epoch": 1383} {"train_loss": -5.846683502197266, "global_step": 58109, "epoch": 1383} {"train_loss": -5.873493671417236, "global_step": 58110, "epoch": 1383} {"train_loss": -5.815324306488037, "global_step": 58111, "epoch": 1383} {"train_loss": -5.7923359870910645, "global_step": 58112, "epoch": 1383} {"train_loss": -5.9111738204956055, "global_step": 58113, "epoch": 1383} {"train_loss": -5.8256988525390625, "global_step": 58114, "epoch": 1383} {"train_loss": -5.830450057983398, "global_step": 58115, "epoch": 1383} {"train_loss": -5.90640926361084, "global_step": 58116, "epoch": 1383} {"train_loss": -5.782844066619873, "global_step": 58117, "epoch": 1383} {"train_loss": -5.76059627532959, "global_step": 58118, "epoch": 1383} {"train_loss": -5.963384628295898, "global_step": 58119, "epoch": 1383} {"train_loss": -5.7789788246154785, "global_step": 58120, "epoch": 1383} {"train_loss": -5.760591506958008, "global_step": 58121, "epoch": 1383} {"train_loss": -5.907451629638672, "global_step": 58122, "epoch": 1383} {"train_loss": -5.822698593139648, "global_step": 58123, "epoch": 1383} {"train_loss": -5.759596347808838, "global_step": 58124, "epoch": 1383} {"train_loss": -5.865506172180176, "global_step": 58125, "epoch": 1383} {"train_loss": -5.929736137390137, "global_step": 58126, "epoch": 1383} {"train_loss": -5.87940552121117, "global_step": 58127, "epoch": 1383, "val_loss": 74300.7578125} {"train_loss": -5.89989709854126, "global_step": 58128, "epoch": 1384} {"train_loss": -5.920993804931641, "global_step": 58129, "epoch": 1384} {"train_loss": -6.011354446411133, "global_step": 58130, "epoch": 1384} {"train_loss": -5.819520473480225, "global_step": 58131, "epoch": 1384} {"train_loss": -6.008181095123291, "global_step": 58132, "epoch": 1384} {"train_loss": -5.6861090660095215, "global_step": 58133, "epoch": 1384} {"train_loss": -5.801677703857422, "global_step": 58134, "epoch": 1384} {"train_loss": -5.828413009643555, "global_step": 58135, "epoch": 1384} {"train_loss": -5.9745402336120605, "global_step": 58136, "epoch": 1384} {"train_loss": -5.830974578857422, "global_step": 58137, "epoch": 1384} {"train_loss": -5.982499599456787, "global_step": 58138, "epoch": 1384} {"train_loss": -5.9490861892700195, "global_step": 58139, "epoch": 1384} {"train_loss": -5.867696285247803, "global_step": 58140, "epoch": 1384} {"train_loss": -5.7745256423950195, "global_step": 58141, "epoch": 1384} {"train_loss": -5.80272102355957, "global_step": 58142, "epoch": 1384} {"train_loss": -5.858687400817871, "global_step": 58143, "epoch": 1384} {"train_loss": -5.764613151550293, "global_step": 58144, "epoch": 1384} {"train_loss": -5.9422101974487305, "global_step": 58145, "epoch": 1384} {"train_loss": -5.868420600891113, "global_step": 58146, "epoch": 1384} {"train_loss": -5.836042404174805, "global_step": 58147, "epoch": 1384} {"train_loss": -5.962258338928223, "global_step": 58148, "epoch": 1384} {"train_loss": -5.7673115730285645, "global_step": 58149, "epoch": 1384} {"train_loss": -5.973996162414551, "global_step": 58150, "epoch": 1384} {"train_loss": -5.896238327026367, "global_step": 58151, "epoch": 1384} {"train_loss": -5.8062896728515625, "global_step": 58152, "epoch": 1384} {"train_loss": -5.960114479064941, "global_step": 58153, "epoch": 1384} {"train_loss": -5.900632858276367, "global_step": 58154, "epoch": 1384} {"train_loss": -5.960119247436523, "global_step": 58155, "epoch": 1384} {"train_loss": -5.940485000610352, "global_step": 58156, "epoch": 1384} {"train_loss": -5.939122200012207, "global_step": 58157, "epoch": 1384} {"train_loss": -5.899544715881348, "global_step": 58158, "epoch": 1384} {"train_loss": -5.833657264709473, "global_step": 58159, "epoch": 1384} {"train_loss": -5.912156581878662, "global_step": 58160, "epoch": 1384} {"train_loss": -6.028921604156494, "global_step": 58161, "epoch": 1384} {"train_loss": -5.796877861022949, "global_step": 58162, "epoch": 1384} {"train_loss": -5.976527214050293, "global_step": 58163, "epoch": 1384} {"train_loss": -5.877503871917725, "global_step": 58164, "epoch": 1384} {"train_loss": -5.920910358428955, "global_step": 58165, "epoch": 1384} {"train_loss": -5.912843227386475, "global_step": 58166, "epoch": 1384} {"train_loss": -5.817491054534912, "global_step": 58167, "epoch": 1384} {"train_loss": -5.707026481628418, "global_step": 58168, "epoch": 1384} {"train_loss": -5.88254071417309, "global_step": 58169, "epoch": 1384, "val_loss": 74451.0078125} {"train_loss": -5.7599711418151855, "global_step": 58170, "epoch": 1385} {"train_loss": -5.873662948608398, "global_step": 58171, "epoch": 1385} {"train_loss": -5.968372344970703, "global_step": 58172, "epoch": 1385} {"train_loss": -5.708509922027588, "global_step": 58173, "epoch": 1385} {"train_loss": -5.869921684265137, "global_step": 58174, "epoch": 1385} {"train_loss": -5.739324569702148, "global_step": 58175, "epoch": 1385} {"train_loss": -5.85102653503418, "global_step": 58176, "epoch": 1385} {"train_loss": -5.882187843322754, "global_step": 58177, "epoch": 1385} {"train_loss": -5.933986663818359, "global_step": 58178, "epoch": 1385} {"train_loss": -5.838804244995117, "global_step": 58179, "epoch": 1385} {"train_loss": -5.842270851135254, "global_step": 58180, "epoch": 1385} {"train_loss": -5.7860822677612305, "global_step": 58181, "epoch": 1385} {"train_loss": -5.944794654846191, "global_step": 58182, "epoch": 1385} {"train_loss": -5.932248115539551, "global_step": 58183, "epoch": 1385} {"train_loss": -5.950742721557617, "global_step": 58184, "epoch": 1385} {"train_loss": -5.864007949829102, "global_step": 58185, "epoch": 1385} {"train_loss": -5.84220552444458, "global_step": 58186, "epoch": 1385} {"train_loss": -5.895857334136963, "global_step": 58187, "epoch": 1385} {"train_loss": -5.9041547775268555, "global_step": 58188, "epoch": 1385} {"train_loss": -5.927213191986084, "global_step": 58189, "epoch": 1385} {"train_loss": -5.759479999542236, "global_step": 58190, "epoch": 1385} {"train_loss": -5.8866472244262695, "global_step": 58191, "epoch": 1385} {"train_loss": -5.917843818664551, "global_step": 58192, "epoch": 1385} {"train_loss": -5.905552864074707, "global_step": 58193, "epoch": 1385} {"train_loss": -5.870791912078857, "global_step": 58194, "epoch": 1385} {"train_loss": -5.7818098068237305, "global_step": 58195, "epoch": 1385} {"train_loss": -5.828006744384766, "global_step": 58196, "epoch": 1385} {"train_loss": -5.953683853149414, "global_step": 58197, "epoch": 1385} {"train_loss": -6.0144453048706055, "global_step": 58198, "epoch": 1385} {"train_loss": -5.816484451293945, "global_step": 58199, "epoch": 1385} {"train_loss": -5.933638572692871, "global_step": 58200, "epoch": 1385} {"train_loss": -5.836841106414795, "global_step": 58201, "epoch": 1385} {"train_loss": -5.921822547912598, "global_step": 58202, "epoch": 1385} {"train_loss": -5.9088873863220215, "global_step": 58203, "epoch": 1385} {"train_loss": -5.90138578414917, "global_step": 58204, "epoch": 1385} {"train_loss": -5.962701797485352, "global_step": 58205, "epoch": 1385} {"train_loss": -5.9623589515686035, "global_step": 58206, "epoch": 1385} {"train_loss": -5.8739142417907715, "global_step": 58207, "epoch": 1385} {"train_loss": -5.900720119476318, "global_step": 58208, "epoch": 1385} {"train_loss": -5.946255207061768, "global_step": 58209, "epoch": 1385} {"train_loss": -5.828265190124512, "global_step": 58210, "epoch": 1385} {"train_loss": -5.879425230480376, "global_step": 58211, "epoch": 1385, "val_loss": 74098.140625} {"train_loss": -5.9601640701293945, "global_step": 58212, "epoch": 1386} {"train_loss": -5.807966232299805, "global_step": 58213, "epoch": 1386} {"train_loss": -5.868206977844238, "global_step": 58214, "epoch": 1386} {"train_loss": -5.899867057800293, "global_step": 58215, "epoch": 1386} {"train_loss": -5.918696403503418, "global_step": 58216, "epoch": 1386} {"train_loss": -5.9004411697387695, "global_step": 58217, "epoch": 1386} {"train_loss": -5.873649597167969, "global_step": 58218, "epoch": 1386} {"train_loss": -5.798748016357422, "global_step": 58219, "epoch": 1386} {"train_loss": -5.903387069702148, "global_step": 58220, "epoch": 1386} {"train_loss": -5.879571437835693, "global_step": 58221, "epoch": 1386} {"train_loss": -5.987449645996094, "global_step": 58222, "epoch": 1386} {"train_loss": -5.887546539306641, "global_step": 58223, "epoch": 1386} {"train_loss": -5.7233991622924805, "global_step": 58224, "epoch": 1386} {"train_loss": -5.794757843017578, "global_step": 58225, "epoch": 1386} {"train_loss": -5.851237773895264, "global_step": 58226, "epoch": 1386} {"train_loss": -5.769295692443848, "global_step": 58227, "epoch": 1386} {"train_loss": -5.852538108825684, "global_step": 58228, "epoch": 1386} {"train_loss": -5.759003639221191, "global_step": 58229, "epoch": 1386} {"train_loss": -5.901993274688721, "global_step": 58230, "epoch": 1386} {"train_loss": -5.9472575187683105, "global_step": 58231, "epoch": 1386} {"train_loss": -5.84047794342041, "global_step": 58232, "epoch": 1386} {"train_loss": -5.705984115600586, "global_step": 58233, "epoch": 1386} {"train_loss": -5.883964538574219, "global_step": 58234, "epoch": 1386} {"train_loss": -5.917729377746582, "global_step": 58235, "epoch": 1386} {"train_loss": -5.738070011138916, "global_step": 58236, "epoch": 1386} {"train_loss": -5.842507839202881, "global_step": 58237, "epoch": 1386} {"train_loss": -5.882209777832031, "global_step": 58238, "epoch": 1386} {"train_loss": -5.809789657592773, "global_step": 58239, "epoch": 1386} {"train_loss": -5.746628284454346, "global_step": 58240, "epoch": 1386} {"train_loss": -5.924301624298096, "global_step": 58241, "epoch": 1386} {"train_loss": -5.8314056396484375, "global_step": 58242, "epoch": 1386} {"train_loss": -5.92421817779541, "global_step": 58243, "epoch": 1386} {"train_loss": -5.966144561767578, "global_step": 58244, "epoch": 1386} {"train_loss": -5.736392021179199, "global_step": 58245, "epoch": 1386} {"train_loss": -5.813673496246338, "global_step": 58246, "epoch": 1386} {"train_loss": -5.817643642425537, "global_step": 58247, "epoch": 1386} {"train_loss": -5.7201690673828125, "global_step": 58248, "epoch": 1386} {"train_loss": -5.909985542297363, "global_step": 58249, "epoch": 1386} {"train_loss": -5.815995216369629, "global_step": 58250, "epoch": 1386} {"train_loss": -5.927290916442871, "global_step": 58251, "epoch": 1386} {"train_loss": -5.914380073547363, "global_step": 58252, "epoch": 1386} {"train_loss": -5.85512239592416, "global_step": 58253, "epoch": 1386, "val_loss": 74301.3359375} {"train_loss": -5.847935676574707, "global_step": 58254, "epoch": 1387} {"train_loss": -5.878714561462402, "global_step": 58255, "epoch": 1387} {"train_loss": -5.930363655090332, "global_step": 58256, "epoch": 1387} {"train_loss": -5.951625823974609, "global_step": 58257, "epoch": 1387} {"train_loss": -5.901247501373291, "global_step": 58258, "epoch": 1387} {"train_loss": -5.921236991882324, "global_step": 58259, "epoch": 1387} {"train_loss": -5.85077428817749, "global_step": 58260, "epoch": 1387} {"train_loss": -5.943734169006348, "global_step": 58261, "epoch": 1387} {"train_loss": -5.85574197769165, "global_step": 58262, "epoch": 1387} {"train_loss": -5.795943260192871, "global_step": 58263, "epoch": 1387} {"train_loss": -5.930662631988525, "global_step": 58264, "epoch": 1387} {"train_loss": -6.007319927215576, "global_step": 58265, "epoch": 1387} {"train_loss": -5.890042304992676, "global_step": 58266, "epoch": 1387} {"train_loss": -5.949412822723389, "global_step": 58267, "epoch": 1387} {"train_loss": -5.963460445404053, "global_step": 58268, "epoch": 1387} {"train_loss": -5.851109504699707, "global_step": 58269, "epoch": 1387} {"train_loss": -5.962185382843018, "global_step": 58270, "epoch": 1387} {"train_loss": -5.96142578125, "global_step": 58271, "epoch": 1387} {"train_loss": -5.917558670043945, "global_step": 58272, "epoch": 1387} {"train_loss": -5.8786420822143555, "global_step": 58273, "epoch": 1387} {"train_loss": -5.8479180335998535, "global_step": 58274, "epoch": 1387} {"train_loss": -5.8821258544921875, "global_step": 58275, "epoch": 1387} {"train_loss": -5.789499282836914, "global_step": 58276, "epoch": 1387} {"train_loss": -5.8736772537231445, "global_step": 58277, "epoch": 1387} {"train_loss": -5.924748420715332, "global_step": 58278, "epoch": 1387} {"train_loss": -5.853453636169434, "global_step": 58279, "epoch": 1387} {"train_loss": -5.980602264404297, "global_step": 58280, "epoch": 1387} {"train_loss": -5.951026916503906, "global_step": 58281, "epoch": 1387} {"train_loss": -5.942249298095703, "global_step": 58282, "epoch": 1387} {"train_loss": -5.739660739898682, "global_step": 58283, "epoch": 1387} {"train_loss": -5.8841400146484375, "global_step": 58284, "epoch": 1387} {"train_loss": -5.765885829925537, "global_step": 58285, "epoch": 1387} {"train_loss": -5.7688703536987305, "global_step": 58286, "epoch": 1387} {"train_loss": -5.882910251617432, "global_step": 58287, "epoch": 1387} {"train_loss": -5.832736492156982, "global_step": 58288, "epoch": 1387} {"train_loss": -5.899527549743652, "global_step": 58289, "epoch": 1387} {"train_loss": -5.902156352996826, "global_step": 58290, "epoch": 1387} {"train_loss": -5.750739574432373, "global_step": 58291, "epoch": 1387} {"train_loss": -5.894052028656006, "global_step": 58292, "epoch": 1387} {"train_loss": -5.972707748413086, "global_step": 58293, "epoch": 1387} {"train_loss": -5.905825138092041, "global_step": 58294, "epoch": 1387} {"train_loss": -5.889887843813215, "global_step": 58295, "epoch": 1387, "val_loss": 74188.09375} {"train_loss": -5.901676654815674, "global_step": 58296, "epoch": 1388} {"train_loss": -5.784904479980469, "global_step": 58297, "epoch": 1388} {"train_loss": -5.992286682128906, "global_step": 58298, "epoch": 1388} {"train_loss": -5.818708419799805, "global_step": 58299, "epoch": 1388} {"train_loss": -5.829971790313721, "global_step": 58300, "epoch": 1388} {"train_loss": -5.807130813598633, "global_step": 58301, "epoch": 1388} {"train_loss": -5.882695198059082, "global_step": 58302, "epoch": 1388} {"train_loss": -5.826876640319824, "global_step": 58303, "epoch": 1388} {"train_loss": -5.92405891418457, "global_step": 58304, "epoch": 1388} {"train_loss": -5.935486316680908, "global_step": 58305, "epoch": 1388} {"train_loss": -6.0145673751831055, "global_step": 58306, "epoch": 1388} {"train_loss": -5.761976718902588, "global_step": 58307, "epoch": 1388} {"train_loss": -5.780013084411621, "global_step": 58308, "epoch": 1388} {"train_loss": -5.865863800048828, "global_step": 58309, "epoch": 1388} {"train_loss": -5.83512020111084, "global_step": 58310, "epoch": 1388} {"train_loss": -5.7553300857543945, "global_step": 58311, "epoch": 1388} {"train_loss": -5.967022895812988, "global_step": 58312, "epoch": 1388} {"train_loss": -5.806840419769287, "global_step": 58313, "epoch": 1388} {"train_loss": -5.8404459953308105, "global_step": 58314, "epoch": 1388} {"train_loss": -5.856241703033447, "global_step": 58315, "epoch": 1388} {"train_loss": -5.92813777923584, "global_step": 58316, "epoch": 1388} {"train_loss": -5.8757548332214355, "global_step": 58317, "epoch": 1388} {"train_loss": -5.923410892486572, "global_step": 58318, "epoch": 1388} {"train_loss": -5.882582187652588, "global_step": 58319, "epoch": 1388} {"train_loss": -5.88114070892334, "global_step": 58320, "epoch": 1388} {"train_loss": -5.847352027893066, "global_step": 58321, "epoch": 1388} {"train_loss": -5.85262393951416, "global_step": 58322, "epoch": 1388} {"train_loss": -5.861013412475586, "global_step": 58323, "epoch": 1388} {"train_loss": -5.78786563873291, "global_step": 58324, "epoch": 1388} {"train_loss": -5.910732269287109, "global_step": 58325, "epoch": 1388} {"train_loss": -5.890892028808594, "global_step": 58326, "epoch": 1388} {"train_loss": -5.869140625, "global_step": 58327, "epoch": 1388} {"train_loss": -5.904788017272949, "global_step": 58328, "epoch": 1388} {"train_loss": -5.798046588897705, "global_step": 58329, "epoch": 1388} {"train_loss": -5.965944290161133, "global_step": 58330, "epoch": 1388} {"train_loss": -5.887270450592041, "global_step": 58331, "epoch": 1388} {"train_loss": -5.8529205322265625, "global_step": 58332, "epoch": 1388} {"train_loss": -5.818563461303711, "global_step": 58333, "epoch": 1388} {"train_loss": -5.811744689941406, "global_step": 58334, "epoch": 1388} {"train_loss": -5.938743591308594, "global_step": 58335, "epoch": 1388} {"train_loss": -5.767060279846191, "global_step": 58336, "epoch": 1388} {"train_loss": -5.8637715975443525, "global_step": 58337, "epoch": 1388, "val_loss": 74545.5390625} {"train_loss": -5.867624282836914, "global_step": 58338, "epoch": 1389} {"train_loss": -5.967158317565918, "global_step": 58339, "epoch": 1389} {"train_loss": -5.798367500305176, "global_step": 58340, "epoch": 1389} {"train_loss": -5.909486293792725, "global_step": 58341, "epoch": 1389} {"train_loss": -5.782529354095459, "global_step": 58342, "epoch": 1389} {"train_loss": -5.838737487792969, "global_step": 58343, "epoch": 1389} {"train_loss": -5.882196426391602, "global_step": 58344, "epoch": 1389} {"train_loss": -5.839893817901611, "global_step": 58345, "epoch": 1389} {"train_loss": -5.826507568359375, "global_step": 58346, "epoch": 1389} {"train_loss": -5.989739418029785, "global_step": 58347, "epoch": 1389} {"train_loss": -5.805801868438721, "global_step": 58348, "epoch": 1389} {"train_loss": -5.916019439697266, "global_step": 58349, "epoch": 1389} {"train_loss": -5.775649070739746, "global_step": 58350, "epoch": 1389} {"train_loss": -5.862271308898926, "global_step": 58351, "epoch": 1389} {"train_loss": -5.768383502960205, "global_step": 58352, "epoch": 1389} {"train_loss": -5.906620025634766, "global_step": 58353, "epoch": 1389} {"train_loss": -5.8238725662231445, "global_step": 58354, "epoch": 1389} {"train_loss": -5.789203643798828, "global_step": 58355, "epoch": 1389} {"train_loss": -5.936943054199219, "global_step": 58356, "epoch": 1389} {"train_loss": -5.802977561950684, "global_step": 58357, "epoch": 1389} {"train_loss": -5.887679100036621, "global_step": 58358, "epoch": 1389} {"train_loss": -5.936187744140625, "global_step": 58359, "epoch": 1389} {"train_loss": -5.738823413848877, "global_step": 58360, "epoch": 1389} {"train_loss": -5.843866348266602, "global_step": 58361, "epoch": 1389} {"train_loss": -5.850120544433594, "global_step": 58362, "epoch": 1389} {"train_loss": -5.8950886726379395, "global_step": 58363, "epoch": 1389} {"train_loss": -5.7755126953125, "global_step": 58364, "epoch": 1389} {"train_loss": -5.883002758026123, "global_step": 58365, "epoch": 1389} {"train_loss": -5.883737087249756, "global_step": 58366, "epoch": 1389} {"train_loss": -5.865655422210693, "global_step": 58367, "epoch": 1389} {"train_loss": -5.926276683807373, "global_step": 58368, "epoch": 1389} {"train_loss": -5.8458571434021, "global_step": 58369, "epoch": 1389} {"train_loss": -5.737513065338135, "global_step": 58370, "epoch": 1389} {"train_loss": -5.798737525939941, "global_step": 58371, "epoch": 1389} {"train_loss": -5.773345470428467, "global_step": 58372, "epoch": 1389} {"train_loss": -5.7288618087768555, "global_step": 58373, "epoch": 1389} {"train_loss": -6.037395477294922, "global_step": 58374, "epoch": 1389} {"train_loss": -5.8684515953063965, "global_step": 58375, "epoch": 1389} {"train_loss": -5.8690032958984375, "global_step": 58376, "epoch": 1389} {"train_loss": -5.80565071105957, "global_step": 58377, "epoch": 1389} {"train_loss": -5.964524269104004, "global_step": 58378, "epoch": 1389} {"train_loss": -5.853574480329241, "global_step": 58379, "epoch": 1389, "val_loss": 74479.875} {"train_loss": -5.894256591796875, "global_step": 58380, "epoch": 1390} {"train_loss": -5.869112491607666, "global_step": 58381, "epoch": 1390} {"train_loss": -5.92598295211792, "global_step": 58382, "epoch": 1390} {"train_loss": -5.895849227905273, "global_step": 58383, "epoch": 1390} {"train_loss": -5.762521743774414, "global_step": 58384, "epoch": 1390} {"train_loss": -5.926006317138672, "global_step": 58385, "epoch": 1390} {"train_loss": -5.783106803894043, "global_step": 58386, "epoch": 1390} {"train_loss": -5.9602556228637695, "global_step": 58387, "epoch": 1390} {"train_loss": -5.783885478973389, "global_step": 58388, "epoch": 1390} {"train_loss": -5.829174041748047, "global_step": 58389, "epoch": 1390} {"train_loss": -5.837339878082275, "global_step": 58390, "epoch": 1390} {"train_loss": -5.837996482849121, "global_step": 58391, "epoch": 1390} {"train_loss": -5.780922889709473, "global_step": 58392, "epoch": 1390} {"train_loss": -5.886077880859375, "global_step": 58393, "epoch": 1390} {"train_loss": -5.841316223144531, "global_step": 58394, "epoch": 1390} {"train_loss": -5.857715606689453, "global_step": 58395, "epoch": 1390} {"train_loss": -5.7517194747924805, "global_step": 58396, "epoch": 1390} {"train_loss": -5.901565074920654, "global_step": 58397, "epoch": 1390} {"train_loss": -5.831695556640625, "global_step": 58398, "epoch": 1390} {"train_loss": -5.879849910736084, "global_step": 58399, "epoch": 1390} {"train_loss": -5.919508934020996, "global_step": 58400, "epoch": 1390} {"train_loss": -5.917695999145508, "global_step": 58401, "epoch": 1390} {"train_loss": -5.9298787117004395, "global_step": 58402, "epoch": 1390} {"train_loss": -5.84859561920166, "global_step": 58403, "epoch": 1390} {"train_loss": -5.862194061279297, "global_step": 58404, "epoch": 1390} {"train_loss": -5.863821029663086, "global_step": 58405, "epoch": 1390} {"train_loss": -5.8652238845825195, "global_step": 58406, "epoch": 1390} {"train_loss": -5.766815185546875, "global_step": 58407, "epoch": 1390} {"train_loss": -5.791501998901367, "global_step": 58408, "epoch": 1390} {"train_loss": -5.985679626464844, "global_step": 58409, "epoch": 1390} {"train_loss": -5.792684078216553, "global_step": 58410, "epoch": 1390} {"train_loss": -5.8677825927734375, "global_step": 58411, "epoch": 1390} {"train_loss": -5.835657119750977, "global_step": 58412, "epoch": 1390} {"train_loss": -5.879967212677002, "global_step": 58413, "epoch": 1390} {"train_loss": -5.866434097290039, "global_step": 58414, "epoch": 1390} {"train_loss": -5.871686935424805, "global_step": 58415, "epoch": 1390} {"train_loss": -5.752686023712158, "global_step": 58416, "epoch": 1390} {"train_loss": -5.86952018737793, "global_step": 58417, "epoch": 1390} {"train_loss": -6.041042327880859, "global_step": 58418, "epoch": 1390} {"train_loss": -5.910742282867432, "global_step": 58419, "epoch": 1390} {"train_loss": -5.808786869049072, "global_step": 58420, "epoch": 1390} {"train_loss": -5.862833931332543, "global_step": 58421, "epoch": 1390, "val_loss": 74183.5703125} {"train_loss": -5.828418731689453, "global_step": 58422, "epoch": 1391} {"train_loss": -5.894103527069092, "global_step": 58423, "epoch": 1391} {"train_loss": -5.931436061859131, "global_step": 58424, "epoch": 1391} {"train_loss": -5.940289497375488, "global_step": 58425, "epoch": 1391} {"train_loss": -5.873608589172363, "global_step": 58426, "epoch": 1391} {"train_loss": -5.784151077270508, "global_step": 58427, "epoch": 1391} {"train_loss": -5.8779096603393555, "global_step": 58428, "epoch": 1391} {"train_loss": -5.955043792724609, "global_step": 58429, "epoch": 1391} {"train_loss": -5.908090591430664, "global_step": 58430, "epoch": 1391} {"train_loss": -5.982869625091553, "global_step": 58431, "epoch": 1391} {"train_loss": -5.879864692687988, "global_step": 58432, "epoch": 1391} {"train_loss": -5.921692848205566, "global_step": 58433, "epoch": 1391} {"train_loss": -5.929748058319092, "global_step": 58434, "epoch": 1391} {"train_loss": -5.871904373168945, "global_step": 58435, "epoch": 1391} {"train_loss": -5.939046859741211, "global_step": 58436, "epoch": 1391} {"train_loss": -5.942184925079346, "global_step": 58437, "epoch": 1391} {"train_loss": -5.966054439544678, "global_step": 58438, "epoch": 1391} {"train_loss": -5.859211444854736, "global_step": 58439, "epoch": 1391} {"train_loss": -6.022683620452881, "global_step": 58440, "epoch": 1391} {"train_loss": -5.808539867401123, "global_step": 58441, "epoch": 1391} {"train_loss": -5.8258891105651855, "global_step": 58442, "epoch": 1391} {"train_loss": -5.961079120635986, "global_step": 58443, "epoch": 1391} {"train_loss": -5.78702449798584, "global_step": 58444, "epoch": 1391} {"train_loss": -5.905606746673584, "global_step": 58445, "epoch": 1391} {"train_loss": -5.858572006225586, "global_step": 58446, "epoch": 1391} {"train_loss": -6.003790855407715, "global_step": 58447, "epoch": 1391} {"train_loss": -5.946533203125, "global_step": 58448, "epoch": 1391} {"train_loss": -5.856868743896484, "global_step": 58449, "epoch": 1391} {"train_loss": -5.887029647827148, "global_step": 58450, "epoch": 1391} {"train_loss": -5.76715087890625, "global_step": 58451, "epoch": 1391} {"train_loss": -5.850788116455078, "global_step": 58452, "epoch": 1391} {"train_loss": -5.783681869506836, "global_step": 58453, "epoch": 1391} {"train_loss": -5.933055877685547, "global_step": 58454, "epoch": 1391} {"train_loss": -5.914737701416016, "global_step": 58455, "epoch": 1391} {"train_loss": -5.882650852203369, "global_step": 58456, "epoch": 1391} {"train_loss": -5.864659309387207, "global_step": 58457, "epoch": 1391} {"train_loss": -5.788215637207031, "global_step": 58458, "epoch": 1391} {"train_loss": -5.895687580108643, "global_step": 58459, "epoch": 1391} {"train_loss": -5.821894645690918, "global_step": 58460, "epoch": 1391} {"train_loss": -5.875396251678467, "global_step": 58461, "epoch": 1391} {"train_loss": -5.980393409729004, "global_step": 58462, "epoch": 1391} {"train_loss": -5.894744963873, "global_step": 58463, "epoch": 1391, "val_loss": 74335.46875} {"train_loss": -5.951996803283691, "global_step": 58464, "epoch": 1392} {"train_loss": -5.925324440002441, "global_step": 58465, "epoch": 1392} {"train_loss": -5.947751998901367, "global_step": 58466, "epoch": 1392} {"train_loss": -5.725775718688965, "global_step": 58467, "epoch": 1392} {"train_loss": -5.934928894042969, "global_step": 58468, "epoch": 1392} {"train_loss": -5.938315391540527, "global_step": 58469, "epoch": 1392} {"train_loss": -5.9034743309021, "global_step": 58470, "epoch": 1392} {"train_loss": -5.906059265136719, "global_step": 58471, "epoch": 1392} {"train_loss": -5.923617839813232, "global_step": 58472, "epoch": 1392} {"train_loss": -5.9239325523376465, "global_step": 58473, "epoch": 1392} {"train_loss": -5.922717571258545, "global_step": 58474, "epoch": 1392} {"train_loss": -5.842121601104736, "global_step": 58475, "epoch": 1392} {"train_loss": -5.837440490722656, "global_step": 58476, "epoch": 1392} {"train_loss": -5.803733825683594, "global_step": 58477, "epoch": 1392} {"train_loss": -5.847942352294922, "global_step": 58478, "epoch": 1392} {"train_loss": -5.884573936462402, "global_step": 58479, "epoch": 1392} {"train_loss": -5.8284406661987305, "global_step": 58480, "epoch": 1392} {"train_loss": -6.005069732666016, "global_step": 58481, "epoch": 1392} {"train_loss": -5.905056953430176, "global_step": 58482, "epoch": 1392} {"train_loss": -5.873666763305664, "global_step": 58483, "epoch": 1392} {"train_loss": -5.91695499420166, "global_step": 58484, "epoch": 1392} {"train_loss": -5.914304256439209, "global_step": 58485, "epoch": 1392} {"train_loss": -5.894769191741943, "global_step": 58486, "epoch": 1392} {"train_loss": -5.843386173248291, "global_step": 58487, "epoch": 1392} {"train_loss": -5.879345417022705, "global_step": 58488, "epoch": 1392} {"train_loss": -5.756506443023682, "global_step": 58489, "epoch": 1392} {"train_loss": -5.862663269042969, "global_step": 58490, "epoch": 1392} {"train_loss": -5.822937965393066, "global_step": 58491, "epoch": 1392} {"train_loss": -5.760351181030273, "global_step": 58492, "epoch": 1392} {"train_loss": -5.887127876281738, "global_step": 58493, "epoch": 1392} {"train_loss": -5.749733924865723, "global_step": 58494, "epoch": 1392} {"train_loss": -5.946101188659668, "global_step": 58495, "epoch": 1392} {"train_loss": -5.823847770690918, "global_step": 58496, "epoch": 1392} {"train_loss": -5.910186767578125, "global_step": 58497, "epoch": 1392} {"train_loss": -5.888116836547852, "global_step": 58498, "epoch": 1392} {"train_loss": -5.823470592498779, "global_step": 58499, "epoch": 1392} {"train_loss": -5.859161376953125, "global_step": 58500, "epoch": 1392} {"train_loss": -5.85906982421875, "global_step": 58501, "epoch": 1392} {"train_loss": -5.848837852478027, "global_step": 58502, "epoch": 1392} {"train_loss": -5.788152694702148, "global_step": 58503, "epoch": 1392} {"train_loss": -5.802339553833008, "global_step": 58504, "epoch": 1392} {"train_loss": -5.869803315117245, "global_step": 58505, "epoch": 1392, "val_loss": 74270.1953125} {"train_loss": -5.790204048156738, "global_step": 58506, "epoch": 1393} {"train_loss": -5.883668422698975, "global_step": 58507, "epoch": 1393} {"train_loss": -5.772229194641113, "global_step": 58508, "epoch": 1393} {"train_loss": -5.808168411254883, "global_step": 58509, "epoch": 1393} {"train_loss": -5.85772180557251, "global_step": 58510, "epoch": 1393} {"train_loss": -5.75963020324707, "global_step": 58511, "epoch": 1393} {"train_loss": -5.876863479614258, "global_step": 58512, "epoch": 1393} {"train_loss": -5.8223676681518555, "global_step": 58513, "epoch": 1393} {"train_loss": -5.869946479797363, "global_step": 58514, "epoch": 1393} {"train_loss": -5.915956497192383, "global_step": 58515, "epoch": 1393} {"train_loss": -5.888830184936523, "global_step": 58516, "epoch": 1393} {"train_loss": -5.798216819763184, "global_step": 58517, "epoch": 1393} {"train_loss": -5.884025573730469, "global_step": 58518, "epoch": 1393} {"train_loss": -5.809510231018066, "global_step": 58519, "epoch": 1393} {"train_loss": -5.954403877258301, "global_step": 58520, "epoch": 1393} {"train_loss": -5.784336090087891, "global_step": 58521, "epoch": 1393} {"train_loss": -5.7979326248168945, "global_step": 58522, "epoch": 1393} {"train_loss": -5.90289831161499, "global_step": 58523, "epoch": 1393} {"train_loss": -5.975238800048828, "global_step": 58524, "epoch": 1393} {"train_loss": -5.91141939163208, "global_step": 58525, "epoch": 1393} {"train_loss": -5.876127243041992, "global_step": 58526, "epoch": 1393} {"train_loss": -5.916814804077148, "global_step": 58527, "epoch": 1393} {"train_loss": -5.993255615234375, "global_step": 58528, "epoch": 1393} {"train_loss": -5.764293670654297, "global_step": 58529, "epoch": 1393} {"train_loss": -5.829833030700684, "global_step": 58530, "epoch": 1393} {"train_loss": -5.798702239990234, "global_step": 58531, "epoch": 1393} {"train_loss": -5.908026218414307, "global_step": 58532, "epoch": 1393} {"train_loss": -5.6536641120910645, "global_step": 58533, "epoch": 1393} {"train_loss": -5.852090835571289, "global_step": 58534, "epoch": 1393} {"train_loss": -5.800505638122559, "global_step": 58535, "epoch": 1393} {"train_loss": -5.896838188171387, "global_step": 58536, "epoch": 1393} {"train_loss": -6.012179374694824, "global_step": 58537, "epoch": 1393} {"train_loss": -5.7194929122924805, "global_step": 58538, "epoch": 1393} {"train_loss": -5.882572174072266, "global_step": 58539, "epoch": 1393} {"train_loss": -5.848546504974365, "global_step": 58540, "epoch": 1393} {"train_loss": -5.862432479858398, "global_step": 58541, "epoch": 1393} {"train_loss": -5.811407566070557, "global_step": 58542, "epoch": 1393} {"train_loss": -5.8891191482543945, "global_step": 58543, "epoch": 1393} {"train_loss": -6.067325592041016, "global_step": 58544, "epoch": 1393} {"train_loss": -5.890664100646973, "global_step": 58545, "epoch": 1393} {"train_loss": -5.8527936935424805, "global_step": 58546, "epoch": 1393} {"train_loss": -5.859205404917399, "global_step": 58547, "epoch": 1393, "val_loss": 74306.328125} {"train_loss": -5.740931034088135, "global_step": 58548, "epoch": 1394} {"train_loss": -5.824544906616211, "global_step": 58549, "epoch": 1394} {"train_loss": -5.827134132385254, "global_step": 58550, "epoch": 1394} {"train_loss": -5.886593341827393, "global_step": 58551, "epoch": 1394} {"train_loss": -5.828073024749756, "global_step": 58552, "epoch": 1394} {"train_loss": -5.8982462882995605, "global_step": 58553, "epoch": 1394} {"train_loss": -5.848721504211426, "global_step": 58554, "epoch": 1394} {"train_loss": -5.63056755065918, "global_step": 58555, "epoch": 1394} {"train_loss": -5.867023944854736, "global_step": 58556, "epoch": 1394} {"train_loss": -5.894681930541992, "global_step": 58557, "epoch": 1394} {"train_loss": -5.939145088195801, "global_step": 58558, "epoch": 1394} {"train_loss": -5.862602233886719, "global_step": 58559, "epoch": 1394} {"train_loss": -5.940857887268066, "global_step": 58560, "epoch": 1394} {"train_loss": -5.893328666687012, "global_step": 58561, "epoch": 1394} {"train_loss": -5.9138054847717285, "global_step": 58562, "epoch": 1394} {"train_loss": -5.86406135559082, "global_step": 58563, "epoch": 1394} {"train_loss": -5.94533634185791, "global_step": 58564, "epoch": 1394} {"train_loss": -5.936561107635498, "global_step": 58565, "epoch": 1394} {"train_loss": -5.879523277282715, "global_step": 58566, "epoch": 1394} {"train_loss": -5.961058616638184, "global_step": 58567, "epoch": 1394} {"train_loss": -5.961566925048828, "global_step": 58568, "epoch": 1394} {"train_loss": -5.720008373260498, "global_step": 58569, "epoch": 1394} {"train_loss": -5.868037223815918, "global_step": 58570, "epoch": 1394} {"train_loss": -5.730855464935303, "global_step": 58571, "epoch": 1394} {"train_loss": -5.78653621673584, "global_step": 58572, "epoch": 1394} {"train_loss": -5.8227434158325195, "global_step": 58573, "epoch": 1394} {"train_loss": -5.86696720123291, "global_step": 58574, "epoch": 1394} {"train_loss": -5.788842678070068, "global_step": 58575, "epoch": 1394} {"train_loss": -5.903158664703369, "global_step": 58576, "epoch": 1394} {"train_loss": -5.928383827209473, "global_step": 58577, "epoch": 1394} {"train_loss": -5.888340473175049, "global_step": 58578, "epoch": 1394} {"train_loss": -5.962275505065918, "global_step": 58579, "epoch": 1394} {"train_loss": -5.9677019119262695, "global_step": 58580, "epoch": 1394} {"train_loss": -6.003662109375, "global_step": 58581, "epoch": 1394} {"train_loss": -5.826391220092773, "global_step": 58582, "epoch": 1394} {"train_loss": -5.898236274719238, "global_step": 58583, "epoch": 1394} {"train_loss": -5.807525634765625, "global_step": 58584, "epoch": 1394} {"train_loss": -5.821089744567871, "global_step": 58585, "epoch": 1394} {"train_loss": -5.851897239685059, "global_step": 58586, "epoch": 1394} {"train_loss": -5.909945964813232, "global_step": 58587, "epoch": 1394} {"train_loss": -5.860341548919678, "global_step": 58588, "epoch": 1394} {"train_loss": -5.868071976162138, "global_step": 58589, "epoch": 1394, "val_loss": 74317.2578125} {"train_loss": -6.003868103027344, "global_step": 58590, "epoch": 1395} {"train_loss": -5.728213310241699, "global_step": 58591, "epoch": 1395} {"train_loss": -5.867832660675049, "global_step": 58592, "epoch": 1395} {"train_loss": -5.921047210693359, "global_step": 58593, "epoch": 1395} {"train_loss": -5.854092597961426, "global_step": 58594, "epoch": 1395} {"train_loss": -5.848883628845215, "global_step": 58595, "epoch": 1395} {"train_loss": -5.9013671875, "global_step": 58596, "epoch": 1395} {"train_loss": -5.905427932739258, "global_step": 58597, "epoch": 1395} {"train_loss": -5.941861152648926, "global_step": 58598, "epoch": 1395} {"train_loss": -5.836583137512207, "global_step": 58599, "epoch": 1395} {"train_loss": -5.766522407531738, "global_step": 58600, "epoch": 1395} {"train_loss": -5.973815441131592, "global_step": 58601, "epoch": 1395} {"train_loss": -5.949548244476318, "global_step": 58602, "epoch": 1395} {"train_loss": -5.937166690826416, "global_step": 58603, "epoch": 1395} {"train_loss": -5.861785888671875, "global_step": 58604, "epoch": 1395} {"train_loss": -5.902195453643799, "global_step": 58605, "epoch": 1395} {"train_loss": -5.94600248336792, "global_step": 58606, "epoch": 1395} {"train_loss": -5.9207963943481445, "global_step": 58607, "epoch": 1395} {"train_loss": -5.975495338439941, "global_step": 58608, "epoch": 1395} {"train_loss": -5.850262641906738, "global_step": 58609, "epoch": 1395} {"train_loss": -5.988001823425293, "global_step": 58610, "epoch": 1395} {"train_loss": -5.843384265899658, "global_step": 58611, "epoch": 1395} {"train_loss": -5.798849105834961, "global_step": 58612, "epoch": 1395} {"train_loss": -5.883872985839844, "global_step": 58613, "epoch": 1395} {"train_loss": -5.773932456970215, "global_step": 58614, "epoch": 1395} {"train_loss": -5.87449836730957, "global_step": 58615, "epoch": 1395} {"train_loss": -5.980473041534424, "global_step": 58616, "epoch": 1395} {"train_loss": -5.950809478759766, "global_step": 58617, "epoch": 1395} {"train_loss": -5.884410858154297, "global_step": 58618, "epoch": 1395} {"train_loss": -5.939749717712402, "global_step": 58619, "epoch": 1395} {"train_loss": -5.933980464935303, "global_step": 58620, "epoch": 1395} {"train_loss": -5.88764762878418, "global_step": 58621, "epoch": 1395} {"train_loss": -5.725864410400391, "global_step": 58622, "epoch": 1395} {"train_loss": -5.787509918212891, "global_step": 58623, "epoch": 1395} {"train_loss": -5.798328876495361, "global_step": 58624, "epoch": 1395} {"train_loss": -5.827654838562012, "global_step": 58625, "epoch": 1395} {"train_loss": -5.918975830078125, "global_step": 58626, "epoch": 1395} {"train_loss": -5.920736789703369, "global_step": 58627, "epoch": 1395} {"train_loss": -5.986180305480957, "global_step": 58628, "epoch": 1395} {"train_loss": -5.856376647949219, "global_step": 58629, "epoch": 1395} {"train_loss": -5.894447326660156, "global_step": 58630, "epoch": 1395} {"train_loss": -5.8848404203142435, "global_step": 58631, "epoch": 1395, "val_loss": 74702.28125} {"train_loss": -5.862201690673828, "global_step": 58632, "epoch": 1396} {"train_loss": -5.845387935638428, "global_step": 58633, "epoch": 1396} {"train_loss": -5.789702415466309, "global_step": 58634, "epoch": 1396} {"train_loss": -5.962031841278076, "global_step": 58635, "epoch": 1396} {"train_loss": -5.829614162445068, "global_step": 58636, "epoch": 1396} {"train_loss": -5.95866584777832, "global_step": 58637, "epoch": 1396} {"train_loss": -5.763431549072266, "global_step": 58638, "epoch": 1396} {"train_loss": -5.812943458557129, "global_step": 58639, "epoch": 1396} {"train_loss": -5.883111476898193, "global_step": 58640, "epoch": 1396} {"train_loss": -5.8130388259887695, "global_step": 58641, "epoch": 1396} {"train_loss": -5.886699199676514, "global_step": 58642, "epoch": 1396} {"train_loss": -5.874184608459473, "global_step": 58643, "epoch": 1396} {"train_loss": -5.95354700088501, "global_step": 58644, "epoch": 1396} {"train_loss": -5.938713073730469, "global_step": 58645, "epoch": 1396} {"train_loss": -5.764504432678223, "global_step": 58646, "epoch": 1396} {"train_loss": -5.817409992218018, "global_step": 58647, "epoch": 1396} {"train_loss": -5.889030456542969, "global_step": 58648, "epoch": 1396} {"train_loss": -5.841731548309326, "global_step": 58649, "epoch": 1396} {"train_loss": -5.951384544372559, "global_step": 58650, "epoch": 1396} {"train_loss": -5.857785224914551, "global_step": 58651, "epoch": 1396} {"train_loss": -5.812108516693115, "global_step": 58652, "epoch": 1396} {"train_loss": -5.875650882720947, "global_step": 58653, "epoch": 1396} {"train_loss": -5.810969352722168, "global_step": 58654, "epoch": 1396} {"train_loss": -5.728854179382324, "global_step": 58655, "epoch": 1396} {"train_loss": -5.850155353546143, "global_step": 58656, "epoch": 1396} {"train_loss": -5.889187812805176, "global_step": 58657, "epoch": 1396} {"train_loss": -5.886172294616699, "global_step": 58658, "epoch": 1396} {"train_loss": -5.793333053588867, "global_step": 58659, "epoch": 1396} {"train_loss": -5.76629114151001, "global_step": 58660, "epoch": 1396} {"train_loss": -5.784010887145996, "global_step": 58661, "epoch": 1396} {"train_loss": -5.850783348083496, "global_step": 58662, "epoch": 1396} {"train_loss": -5.834270477294922, "global_step": 58663, "epoch": 1396} {"train_loss": -5.775808334350586, "global_step": 58664, "epoch": 1396} {"train_loss": -5.70084810256958, "global_step": 58665, "epoch": 1396} {"train_loss": -5.78287410736084, "global_step": 58666, "epoch": 1396} {"train_loss": -5.7463836669921875, "global_step": 58667, "epoch": 1396} {"train_loss": -5.633429527282715, "global_step": 58668, "epoch": 1396} {"train_loss": -5.686440467834473, "global_step": 58669, "epoch": 1396} {"train_loss": -5.648449897766113, "global_step": 58670, "epoch": 1396} {"train_loss": -5.945812225341797, "global_step": 58671, "epoch": 1396} {"train_loss": -5.75141716003418, "global_step": 58672, "epoch": 1396} {"train_loss": -5.823771170207432, "global_step": 58673, "epoch": 1396, "val_loss": 74464.875} {"train_loss": -5.723777770996094, "global_step": 58674, "epoch": 1397} {"train_loss": -5.766567707061768, "global_step": 58675, "epoch": 1397} {"train_loss": -5.7839837074279785, "global_step": 58676, "epoch": 1397} {"train_loss": -5.794214725494385, "global_step": 58677, "epoch": 1397} {"train_loss": -5.944250106811523, "global_step": 58678, "epoch": 1397} {"train_loss": -5.869377613067627, "global_step": 58679, "epoch": 1397} {"train_loss": -5.977368354797363, "global_step": 58680, "epoch": 1397} {"train_loss": -5.7576518058776855, "global_step": 58681, "epoch": 1397} {"train_loss": -5.751522541046143, "global_step": 58682, "epoch": 1397} {"train_loss": -5.872859954833984, "global_step": 58683, "epoch": 1397} {"train_loss": -5.8212995529174805, "global_step": 58684, "epoch": 1397} {"train_loss": -5.90835428237915, "global_step": 58685, "epoch": 1397} {"train_loss": -5.8255767822265625, "global_step": 58686, "epoch": 1397} {"train_loss": -5.913275241851807, "global_step": 58687, "epoch": 1397} {"train_loss": -5.852328300476074, "global_step": 58688, "epoch": 1397} {"train_loss": -5.919578552246094, "global_step": 58689, "epoch": 1397} {"train_loss": -5.820781707763672, "global_step": 58690, "epoch": 1397} {"train_loss": -5.888788223266602, "global_step": 58691, "epoch": 1397} {"train_loss": -5.950292587280273, "global_step": 58692, "epoch": 1397} {"train_loss": -5.907801151275635, "global_step": 58693, "epoch": 1397} {"train_loss": -5.895952224731445, "global_step": 58694, "epoch": 1397} {"train_loss": -5.823153972625732, "global_step": 58695, "epoch": 1397} {"train_loss": -5.915951251983643, "global_step": 58696, "epoch": 1397} {"train_loss": -5.855550289154053, "global_step": 58697, "epoch": 1397} {"train_loss": -5.848003387451172, "global_step": 58698, "epoch": 1397} {"train_loss": -5.912149429321289, "global_step": 58699, "epoch": 1397} {"train_loss": -5.963778495788574, "global_step": 58700, "epoch": 1397} {"train_loss": -5.834364891052246, "global_step": 58701, "epoch": 1397} {"train_loss": -5.856273651123047, "global_step": 58702, "epoch": 1397} {"train_loss": -5.893315315246582, "global_step": 58703, "epoch": 1397} {"train_loss": -5.869731903076172, "global_step": 58704, "epoch": 1397} {"train_loss": -5.881239891052246, "global_step": 58705, "epoch": 1397} {"train_loss": -5.848092079162598, "global_step": 58706, "epoch": 1397} {"train_loss": -5.8222150802612305, "global_step": 58707, "epoch": 1397} {"train_loss": -5.945644378662109, "global_step": 58708, "epoch": 1397} {"train_loss": -5.890927314758301, "global_step": 58709, "epoch": 1397} {"train_loss": -5.832663059234619, "global_step": 58710, "epoch": 1397} {"train_loss": -5.756186485290527, "global_step": 58711, "epoch": 1397} {"train_loss": -5.7679643630981445, "global_step": 58712, "epoch": 1397} {"train_loss": -5.876129150390625, "global_step": 58713, "epoch": 1397} {"train_loss": -5.976579666137695, "global_step": 58714, "epoch": 1397} {"train_loss": -5.861032985505604, "global_step": 58715, "epoch": 1397, "val_loss": 74315.078125} {"train_loss": -5.823863506317139, "global_step": 58716, "epoch": 1398} {"train_loss": -5.788598537445068, "global_step": 58717, "epoch": 1398} {"train_loss": -5.774717330932617, "global_step": 58718, "epoch": 1398} {"train_loss": -5.816860675811768, "global_step": 58719, "epoch": 1398} {"train_loss": -5.759066104888916, "global_step": 58720, "epoch": 1398} {"train_loss": -5.913528919219971, "global_step": 58721, "epoch": 1398} {"train_loss": -5.893021583557129, "global_step": 58722, "epoch": 1398} {"train_loss": -5.804673194885254, "global_step": 58723, "epoch": 1398} {"train_loss": -5.904438495635986, "global_step": 58724, "epoch": 1398} {"train_loss": -5.849053382873535, "global_step": 58725, "epoch": 1398} {"train_loss": -5.865832328796387, "global_step": 58726, "epoch": 1398} {"train_loss": -5.913823127746582, "global_step": 58727, "epoch": 1398} {"train_loss": -5.910826683044434, "global_step": 58728, "epoch": 1398} {"train_loss": -5.9277801513671875, "global_step": 58729, "epoch": 1398} {"train_loss": -5.916296005249023, "global_step": 58730, "epoch": 1398} {"train_loss": -5.798524379730225, "global_step": 58731, "epoch": 1398} {"train_loss": -5.930554389953613, "global_step": 58732, "epoch": 1398} {"train_loss": -5.847551345825195, "global_step": 58733, "epoch": 1398} {"train_loss": -5.779918193817139, "global_step": 58734, "epoch": 1398} {"train_loss": -5.8231096267700195, "global_step": 58735, "epoch": 1398} {"train_loss": -5.753257751464844, "global_step": 58736, "epoch": 1398} {"train_loss": -6.008289813995361, "global_step": 58737, "epoch": 1398} {"train_loss": -5.792691230773926, "global_step": 58738, "epoch": 1398} {"train_loss": -5.827786445617676, "global_step": 58739, "epoch": 1398} {"train_loss": -5.949662685394287, "global_step": 58740, "epoch": 1398} {"train_loss": -5.906303405761719, "global_step": 58741, "epoch": 1398} {"train_loss": -5.831014156341553, "global_step": 58742, "epoch": 1398} {"train_loss": -5.846188545227051, "global_step": 58743, "epoch": 1398} {"train_loss": -5.8576202392578125, "global_step": 58744, "epoch": 1398} {"train_loss": -5.878170013427734, "global_step": 58745, "epoch": 1398} {"train_loss": -5.904942512512207, "global_step": 58746, "epoch": 1398} {"train_loss": -5.884374618530273, "global_step": 58747, "epoch": 1398} {"train_loss": -5.984092712402344, "global_step": 58748, "epoch": 1398} {"train_loss": -5.772607803344727, "global_step": 58749, "epoch": 1398} {"train_loss": -5.7979936599731445, "global_step": 58750, "epoch": 1398} {"train_loss": -5.912080764770508, "global_step": 58751, "epoch": 1398} {"train_loss": -5.882161617279053, "global_step": 58752, "epoch": 1398} {"train_loss": -5.881869792938232, "global_step": 58753, "epoch": 1398} {"train_loss": -5.801656723022461, "global_step": 58754, "epoch": 1398} {"train_loss": -5.74627685546875, "global_step": 58755, "epoch": 1398} {"train_loss": -5.92079496383667, "global_step": 58756, "epoch": 1398} {"train_loss": -5.8607342810857865, "global_step": 58757, "epoch": 1398, "val_loss": 74467.515625} {"train_loss": -5.906076908111572, "global_step": 58758, "epoch": 1399} {"train_loss": -5.877820014953613, "global_step": 58759, "epoch": 1399} {"train_loss": -5.831480026245117, "global_step": 58760, "epoch": 1399} {"train_loss": -5.835350513458252, "global_step": 58761, "epoch": 1399} {"train_loss": -5.960148811340332, "global_step": 58762, "epoch": 1399} {"train_loss": -5.899825572967529, "global_step": 58763, "epoch": 1399} {"train_loss": -5.880083084106445, "global_step": 58764, "epoch": 1399} {"train_loss": -5.970900535583496, "global_step": 58765, "epoch": 1399} {"train_loss": -5.899494171142578, "global_step": 58766, "epoch": 1399} {"train_loss": -5.941316604614258, "global_step": 58767, "epoch": 1399} {"train_loss": -6.068638324737549, "global_step": 58768, "epoch": 1399} {"train_loss": -5.75146484375, "global_step": 58769, "epoch": 1399} {"train_loss": -5.915622234344482, "global_step": 58770, "epoch": 1399} {"train_loss": -5.753222465515137, "global_step": 58771, "epoch": 1399} {"train_loss": -5.813545227050781, "global_step": 58772, "epoch": 1399} {"train_loss": -6.029208660125732, "global_step": 58773, "epoch": 1399} {"train_loss": -6.025282859802246, "global_step": 58774, "epoch": 1399} {"train_loss": -5.876603126525879, "global_step": 58775, "epoch": 1399} {"train_loss": -5.902407646179199, "global_step": 58776, "epoch": 1399} {"train_loss": -5.887867450714111, "global_step": 58777, "epoch": 1399} {"train_loss": -5.795611381530762, "global_step": 58778, "epoch": 1399} {"train_loss": -5.8479695320129395, "global_step": 58779, "epoch": 1399} {"train_loss": -5.878015518188477, "global_step": 58780, "epoch": 1399} {"train_loss": -6.024491310119629, "global_step": 58781, "epoch": 1399} {"train_loss": -5.984153747558594, "global_step": 58782, "epoch": 1399} {"train_loss": -5.903525352478027, "global_step": 58783, "epoch": 1399} {"train_loss": -5.871607780456543, "global_step": 58784, "epoch": 1399} {"train_loss": -6.076408386230469, "global_step": 58785, "epoch": 1399} {"train_loss": -5.938750267028809, "global_step": 58786, "epoch": 1399} {"train_loss": -5.901615142822266, "global_step": 58787, "epoch": 1399} {"train_loss": -5.858370780944824, "global_step": 58788, "epoch": 1399} {"train_loss": -5.902795791625977, "global_step": 58789, "epoch": 1399} {"train_loss": -5.810856819152832, "global_step": 58790, "epoch": 1399} {"train_loss": -5.955084800720215, "global_step": 58791, "epoch": 1399} {"train_loss": -5.827832221984863, "global_step": 58792, "epoch": 1399} {"train_loss": -5.87662410736084, "global_step": 58793, "epoch": 1399} {"train_loss": -5.8523054122924805, "global_step": 58794, "epoch": 1399} {"train_loss": -5.736122131347656, "global_step": 58795, "epoch": 1399} {"train_loss": -5.910141944885254, "global_step": 58796, "epoch": 1399} {"train_loss": -5.917874336242676, "global_step": 58797, "epoch": 1399} {"train_loss": -5.908942699432373, "global_step": 58798, "epoch": 1399} {"train_loss": -5.893580289114089, "global_step": 58799, "epoch": 1399, "val_loss": 74497.46875} {"train_loss": -5.9586381912231445, "global_step": 58800, "epoch": 1400} {"train_loss": -5.933481216430664, "global_step": 58801, "epoch": 1400} {"train_loss": -5.985637664794922, "global_step": 58802, "epoch": 1400} {"train_loss": -5.975205421447754, "global_step": 58803, "epoch": 1400} {"train_loss": -6.020338535308838, "global_step": 58804, "epoch": 1400} {"train_loss": -5.990285873413086, "global_step": 58805, "epoch": 1400} {"train_loss": -5.831997394561768, "global_step": 58806, "epoch": 1400} {"train_loss": -5.692692756652832, "global_step": 58807, "epoch": 1400} {"train_loss": -5.972296714782715, "global_step": 58808, "epoch": 1400} {"train_loss": -5.818730354309082, "global_step": 58809, "epoch": 1400} {"train_loss": -5.737184047698975, "global_step": 58810, "epoch": 1400} {"train_loss": -5.853705883026123, "global_step": 58811, "epoch": 1400} {"train_loss": -5.749621391296387, "global_step": 58812, "epoch": 1400} {"train_loss": -5.745558738708496, "global_step": 58813, "epoch": 1400} {"train_loss": -6.018857955932617, "global_step": 58814, "epoch": 1400} {"train_loss": -6.066659450531006, "global_step": 58815, "epoch": 1400} {"train_loss": -5.796085357666016, "global_step": 58816, "epoch": 1400} {"train_loss": -5.942832946777344, "global_step": 58817, "epoch": 1400} {"train_loss": -5.893184661865234, "global_step": 58818, "epoch": 1400} {"train_loss": -5.870636463165283, "global_step": 58819, "epoch": 1400} {"train_loss": -5.942407131195068, "global_step": 58820, "epoch": 1400} {"train_loss": -5.791409492492676, "global_step": 58821, "epoch": 1400} {"train_loss": -5.7211785316467285, "global_step": 58822, "epoch": 1400} {"train_loss": -5.925883769989014, "global_step": 58823, "epoch": 1400} {"train_loss": -5.734161376953125, "global_step": 58824, "epoch": 1400} {"train_loss": -5.776562690734863, "global_step": 58825, "epoch": 1400} {"train_loss": -5.76179313659668, "global_step": 58826, "epoch": 1400} {"train_loss": -5.916695594787598, "global_step": 58827, "epoch": 1400} {"train_loss": -5.826769828796387, "global_step": 58828, "epoch": 1400} {"train_loss": -5.869409561157227, "global_step": 58829, "epoch": 1400} {"train_loss": -5.957457542419434, "global_step": 58830, "epoch": 1400} {"train_loss": -5.887408256530762, "global_step": 58831, "epoch": 1400} {"train_loss": -5.820260047912598, "global_step": 58832, "epoch": 1400} {"train_loss": -5.8467912673950195, "global_step": 58833, "epoch": 1400} {"train_loss": -5.881752014160156, "global_step": 58834, "epoch": 1400} {"train_loss": -5.996068000793457, "global_step": 58835, "epoch": 1400} {"train_loss": -5.991333484649658, "global_step": 58836, "epoch": 1400} {"train_loss": -5.954416275024414, "global_step": 58837, "epoch": 1400} {"train_loss": -5.836075782775879, "global_step": 58838, "epoch": 1400} {"train_loss": -5.901679039001465, "global_step": 58839, "epoch": 1400} {"train_loss": -5.933391571044922, "global_step": 58840, "epoch": 1400} {"train_loss": -5.880649521237328, "global_step": 58841, "epoch": 1400, "train/sim_max_reward_0": 0.5475335082301844, "train/sim_max_reward_1": 0.31205029940740525, "train/sim_max_reward_2": 0.9001797587785062, "train/sim_max_reward_3": 0.16099525598156667, "train/sim_max_reward_4": 0.5215010238526454, "train/sim_max_reward_5": 0.31632383545615556, "test/sim_max_reward_4500000": 0.7110645025813503, "test/sim_max_reward_4500001": 0.8310251053485047, "test/sim_max_reward_4500002": 0.825266813624306, "test/sim_max_reward_4500003": 0.5967643940405951, "test/sim_max_reward_4500004": 0.07998108665141815, "test/sim_max_reward_4500005": 0.31501802908725696, "test/sim_max_reward_4500006": 0.9567550645110783, "test/sim_max_reward_4500007": 0.7402815145489569, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.8985512847764692, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.5161497077470033, "test/sim_max_reward_4500012": 1.2998196217210992e-06, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.36770605220595864, "test/sim_max_reward_4500015": 7.33684522307471e-05, "test/sim_max_reward_4500016": 0.385833281836314, "test/sim_max_reward_4500017": 0.03801266595621818, "test/sim_max_reward_4500018": 0.11297983252536677, "test/sim_max_reward_4500019": 0.9312046580800593, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.8361260443089593, "test/sim_max_reward_4500023": 0.8421727569172657, "test/sim_max_reward_4500024": 0.6602603790591274, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.1229165386625927, "test/sim_max_reward_4500027": 0.9501670312598447, "test/sim_max_reward_4500028": 0.23385912230064493, "test/sim_max_reward_4500029": 0.1790928372112118, "test/sim_max_reward_4500030": 0.9204310696194179, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.052042402798202325, "test/sim_max_reward_4500033": 0.2204588222550124, "test/sim_max_reward_4500034": 0.7795972012337409, "test/sim_max_reward_4500035": 0.8662069935302255, "test/sim_max_reward_4500036": 0.47994366358387425, "test/sim_max_reward_4500037": 0.69204151932724, "test/sim_max_reward_4500038": 0.21926038455293634, "test/sim_max_reward_4500039": 0.7796593874649148, "test/sim_max_reward_4500040": 0.9191467896015695, "test/sim_max_reward_4500041": 0.9354331324820541, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.17081422419881193, "test/sim_max_reward_4500044": 0.2350910378344014, "test/sim_max_reward_4500045": 0.7500677808065347, "test/sim_max_reward_4500046": 0.8389640731901372, "test/sim_max_reward_4500047": 0.8236325078411427, "test/sim_max_reward_4500048": 0.9562677240454198, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.45976394695107725, "test/mean_score": 0.4758552346877616, "val_loss": 74681.6875} {"train_loss": -5.8695573806762695, "global_step": 58842, "epoch": 1401} {"train_loss": -5.848200798034668, "global_step": 58843, "epoch": 1401} {"train_loss": -5.906001091003418, "global_step": 58844, "epoch": 1401} {"train_loss": -5.907731056213379, "global_step": 58845, "epoch": 1401} {"train_loss": -5.885571479797363, "global_step": 58846, "epoch": 1401} {"train_loss": -5.852590560913086, "global_step": 58847, "epoch": 1401} {"train_loss": -5.962645053863525, "global_step": 58848, "epoch": 1401} {"train_loss": -5.889583587646484, "global_step": 58849, "epoch": 1401} {"train_loss": -5.957862377166748, "global_step": 58850, "epoch": 1401} {"train_loss": -5.8867292404174805, "global_step": 58851, "epoch": 1401} {"train_loss": -5.919753074645996, "global_step": 58852, "epoch": 1401} {"train_loss": -5.759599685668945, "global_step": 58853, "epoch": 1401} {"train_loss": -5.858006477355957, "global_step": 58854, "epoch": 1401} {"train_loss": -5.899840354919434, "global_step": 58855, "epoch": 1401} {"train_loss": -5.907215118408203, "global_step": 58856, "epoch": 1401} {"train_loss": -5.916791915893555, "global_step": 58857, "epoch": 1401} {"train_loss": -5.943556308746338, "global_step": 58858, "epoch": 1401} {"train_loss": -5.891884803771973, "global_step": 58859, "epoch": 1401} {"train_loss": -5.906267166137695, "global_step": 58860, "epoch": 1401} {"train_loss": -5.892889022827148, "global_step": 58861, "epoch": 1401} {"train_loss": -6.02758264541626, "global_step": 58862, "epoch": 1401} {"train_loss": -5.857261657714844, "global_step": 58863, "epoch": 1401} {"train_loss": -5.935780048370361, "global_step": 58864, "epoch": 1401} {"train_loss": -5.91600227355957, "global_step": 58865, "epoch": 1401} {"train_loss": -5.865403175354004, "global_step": 58866, "epoch": 1401} {"train_loss": -5.94617223739624, "global_step": 58867, "epoch": 1401} {"train_loss": -5.831141471862793, "global_step": 58868, "epoch": 1401} {"train_loss": -5.932555198669434, "global_step": 58869, "epoch": 1401} {"train_loss": -5.919172286987305, "global_step": 58870, "epoch": 1401} {"train_loss": -5.887979030609131, "global_step": 58871, "epoch": 1401} {"train_loss": -5.795009613037109, "global_step": 58872, "epoch": 1401} {"train_loss": -5.943314075469971, "global_step": 58873, "epoch": 1401} {"train_loss": -5.9480791091918945, "global_step": 58874, "epoch": 1401} {"train_loss": -5.736205101013184, "global_step": 58875, "epoch": 1401} {"train_loss": -5.8633527755737305, "global_step": 58876, "epoch": 1401} {"train_loss": -5.9649553298950195, "global_step": 58877, "epoch": 1401} {"train_loss": -5.957149982452393, "global_step": 58878, "epoch": 1401} {"train_loss": -5.802192687988281, "global_step": 58879, "epoch": 1401} {"train_loss": -5.940345764160156, "global_step": 58880, "epoch": 1401} {"train_loss": -5.738955497741699, "global_step": 58881, "epoch": 1401} {"train_loss": -5.714974880218506, "global_step": 58882, "epoch": 1401} {"train_loss": -5.887453624180385, "global_step": 58883, "epoch": 1401, "val_loss": 74694.1953125} {"train_loss": -5.816252708435059, "global_step": 58884, "epoch": 1402} {"train_loss": -5.741756439208984, "global_step": 58885, "epoch": 1402} {"train_loss": -5.847621440887451, "global_step": 58886, "epoch": 1402} {"train_loss": -5.728760719299316, "global_step": 58887, "epoch": 1402} {"train_loss": -5.857728481292725, "global_step": 58888, "epoch": 1402} {"train_loss": -5.868404865264893, "global_step": 58889, "epoch": 1402} {"train_loss": -5.819953918457031, "global_step": 58890, "epoch": 1402} {"train_loss": -5.885470390319824, "global_step": 58891, "epoch": 1402} {"train_loss": -5.785893440246582, "global_step": 58892, "epoch": 1402} {"train_loss": -5.923430442810059, "global_step": 58893, "epoch": 1402} {"train_loss": -5.895885467529297, "global_step": 58894, "epoch": 1402} {"train_loss": -5.856464385986328, "global_step": 58895, "epoch": 1402} {"train_loss": -5.795790672302246, "global_step": 58896, "epoch": 1402} {"train_loss": -5.799939155578613, "global_step": 58897, "epoch": 1402} {"train_loss": -5.879593849182129, "global_step": 58898, "epoch": 1402} {"train_loss": -5.937130928039551, "global_step": 58899, "epoch": 1402} {"train_loss": -5.707867622375488, "global_step": 58900, "epoch": 1402} {"train_loss": -5.855801582336426, "global_step": 58901, "epoch": 1402} {"train_loss": -5.865443229675293, "global_step": 58902, "epoch": 1402} {"train_loss": -5.881488800048828, "global_step": 58903, "epoch": 1402} {"train_loss": -5.968296527862549, "global_step": 58904, "epoch": 1402} {"train_loss": -5.879481315612793, "global_step": 58905, "epoch": 1402} {"train_loss": -5.816366195678711, "global_step": 58906, "epoch": 1402} {"train_loss": -5.817534446716309, "global_step": 58907, "epoch": 1402} {"train_loss": -5.974651336669922, "global_step": 58908, "epoch": 1402} {"train_loss": -5.782020092010498, "global_step": 58909, "epoch": 1402} {"train_loss": -5.899936676025391, "global_step": 58910, "epoch": 1402} {"train_loss": -5.795985221862793, "global_step": 58911, "epoch": 1402} {"train_loss": -5.881674766540527, "global_step": 58912, "epoch": 1402} {"train_loss": -5.9444146156311035, "global_step": 58913, "epoch": 1402} {"train_loss": -5.805932998657227, "global_step": 58914, "epoch": 1402} {"train_loss": -5.942983627319336, "global_step": 58915, "epoch": 1402} {"train_loss": -5.9643378257751465, "global_step": 58916, "epoch": 1402} {"train_loss": -5.940123558044434, "global_step": 58917, "epoch": 1402} {"train_loss": -5.864976406097412, "global_step": 58918, "epoch": 1402} {"train_loss": -5.850481986999512, "global_step": 58919, "epoch": 1402} {"train_loss": -6.011805534362793, "global_step": 58920, "epoch": 1402} {"train_loss": -5.98526668548584, "global_step": 58921, "epoch": 1402} {"train_loss": -5.971273422241211, "global_step": 58922, "epoch": 1402} {"train_loss": -5.956854820251465, "global_step": 58923, "epoch": 1402} {"train_loss": -6.069056987762451, "global_step": 58924, "epoch": 1402} {"train_loss": -5.873757453191848, "global_step": 58925, "epoch": 1402, "val_loss": 74289.8203125} {"train_loss": -5.876369953155518, "global_step": 58926, "epoch": 1403} {"train_loss": -5.895298004150391, "global_step": 58927, "epoch": 1403} {"train_loss": -5.888486862182617, "global_step": 58928, "epoch": 1403} {"train_loss": -5.889104843139648, "global_step": 58929, "epoch": 1403} {"train_loss": -5.879323959350586, "global_step": 58930, "epoch": 1403} {"train_loss": -5.954981803894043, "global_step": 58931, "epoch": 1403} {"train_loss": -5.861128807067871, "global_step": 58932, "epoch": 1403} {"train_loss": -5.763767242431641, "global_step": 58933, "epoch": 1403} {"train_loss": -5.913491249084473, "global_step": 58934, "epoch": 1403} {"train_loss": -5.855478763580322, "global_step": 58935, "epoch": 1403} {"train_loss": -5.847324371337891, "global_step": 58936, "epoch": 1403} {"train_loss": -5.843018054962158, "global_step": 58937, "epoch": 1403} {"train_loss": -5.819949150085449, "global_step": 58938, "epoch": 1403} {"train_loss": -5.865178108215332, "global_step": 58939, "epoch": 1403} {"train_loss": -5.93519926071167, "global_step": 58940, "epoch": 1403} {"train_loss": -5.844700813293457, "global_step": 58941, "epoch": 1403} {"train_loss": -5.7937331199646, "global_step": 58942, "epoch": 1403} {"train_loss": -5.895331382751465, "global_step": 58943, "epoch": 1403} {"train_loss": -5.906848430633545, "global_step": 58944, "epoch": 1403} {"train_loss": -5.807160377502441, "global_step": 58945, "epoch": 1403} {"train_loss": -5.909922122955322, "global_step": 58946, "epoch": 1403} {"train_loss": -5.833591938018799, "global_step": 58947, "epoch": 1403} {"train_loss": -5.803624629974365, "global_step": 58948, "epoch": 1403} {"train_loss": -5.858303070068359, "global_step": 58949, "epoch": 1403} {"train_loss": -5.931398868560791, "global_step": 58950, "epoch": 1403} {"train_loss": -5.8538737297058105, "global_step": 58951, "epoch": 1403} {"train_loss": -5.899333953857422, "global_step": 58952, "epoch": 1403} {"train_loss": -5.95307731628418, "global_step": 58953, "epoch": 1403} {"train_loss": -5.853598117828369, "global_step": 58954, "epoch": 1403} {"train_loss": -5.843277931213379, "global_step": 58955, "epoch": 1403} {"train_loss": -5.882022380828857, "global_step": 58956, "epoch": 1403} {"train_loss": -5.978758811950684, "global_step": 58957, "epoch": 1403} {"train_loss": -5.795641899108887, "global_step": 58958, "epoch": 1403} {"train_loss": -5.931992530822754, "global_step": 58959, "epoch": 1403} {"train_loss": -5.929522514343262, "global_step": 58960, "epoch": 1403} {"train_loss": -5.879009246826172, "global_step": 58961, "epoch": 1403} {"train_loss": -5.919972896575928, "global_step": 58962, "epoch": 1403} {"train_loss": -5.880067825317383, "global_step": 58963, "epoch": 1403} {"train_loss": -5.848028182983398, "global_step": 58964, "epoch": 1403} {"train_loss": -5.961870193481445, "global_step": 58965, "epoch": 1403} {"train_loss": -5.946074962615967, "global_step": 58966, "epoch": 1403} {"train_loss": -5.8780013266063875, "global_step": 58967, "epoch": 1403, "val_loss": 74299.3984375} {"train_loss": -5.8883161544799805, "global_step": 58968, "epoch": 1404} {"train_loss": -5.87526798248291, "global_step": 58969, "epoch": 1404} {"train_loss": -5.831079483032227, "global_step": 58970, "epoch": 1404} {"train_loss": -5.710812568664551, "global_step": 58971, "epoch": 1404} {"train_loss": -5.8718461990356445, "global_step": 58972, "epoch": 1404} {"train_loss": -5.900079727172852, "global_step": 58973, "epoch": 1404} {"train_loss": -5.771161079406738, "global_step": 58974, "epoch": 1404} {"train_loss": -5.915280818939209, "global_step": 58975, "epoch": 1404} {"train_loss": -5.9157257080078125, "global_step": 58976, "epoch": 1404} {"train_loss": -5.833499431610107, "global_step": 58977, "epoch": 1404} {"train_loss": -5.982176780700684, "global_step": 58978, "epoch": 1404} {"train_loss": -5.788948059082031, "global_step": 58979, "epoch": 1404} {"train_loss": -5.906347274780273, "global_step": 58980, "epoch": 1404} {"train_loss": -5.913660049438477, "global_step": 58981, "epoch": 1404} {"train_loss": -5.918501853942871, "global_step": 58982, "epoch": 1404} {"train_loss": -5.923093795776367, "global_step": 58983, "epoch": 1404} {"train_loss": -5.9488444328308105, "global_step": 58984, "epoch": 1404} {"train_loss": -5.8734331130981445, "global_step": 58985, "epoch": 1404} {"train_loss": -5.935968399047852, "global_step": 58986, "epoch": 1404} {"train_loss": -5.817476272583008, "global_step": 58987, "epoch": 1404} {"train_loss": -5.906075477600098, "global_step": 58988, "epoch": 1404} {"train_loss": -5.919304847717285, "global_step": 58989, "epoch": 1404} {"train_loss": -5.764838218688965, "global_step": 58990, "epoch": 1404} {"train_loss": -5.826184272766113, "global_step": 58991, "epoch": 1404} {"train_loss": -5.845243453979492, "global_step": 58992, "epoch": 1404} {"train_loss": -5.8581414222717285, "global_step": 58993, "epoch": 1404} {"train_loss": -5.742365837097168, "global_step": 58994, "epoch": 1404} {"train_loss": -5.8015289306640625, "global_step": 58995, "epoch": 1404} {"train_loss": -5.849977493286133, "global_step": 58996, "epoch": 1404} {"train_loss": -5.832231044769287, "global_step": 58997, "epoch": 1404} {"train_loss": -5.902050018310547, "global_step": 58998, "epoch": 1404} {"train_loss": -5.856137752532959, "global_step": 58999, "epoch": 1404} {"train_loss": -5.8457841873168945, "global_step": 59000, "epoch": 1404} {"train_loss": -5.872570991516113, "global_step": 59001, "epoch": 1404} {"train_loss": -5.742239952087402, "global_step": 59002, "epoch": 1404} {"train_loss": -5.926063537597656, "global_step": 59003, "epoch": 1404} {"train_loss": -5.919905662536621, "global_step": 59004, "epoch": 1404} {"train_loss": -5.951979637145996, "global_step": 59005, "epoch": 1404} {"train_loss": -5.920790195465088, "global_step": 59006, "epoch": 1404} {"train_loss": -5.852509021759033, "global_step": 59007, "epoch": 1404} {"train_loss": -5.852034568786621, "global_step": 59008, "epoch": 1404} {"train_loss": -5.866212186359224, "global_step": 59009, "epoch": 1404, "val_loss": 74552.96875} {"train_loss": -5.891411781311035, "global_step": 59010, "epoch": 1405} {"train_loss": -5.80624532699585, "global_step": 59011, "epoch": 1405} {"train_loss": -5.985759258270264, "global_step": 59012, "epoch": 1405} {"train_loss": -5.902314186096191, "global_step": 59013, "epoch": 1405} {"train_loss": -5.814231872558594, "global_step": 59014, "epoch": 1405} {"train_loss": -5.916656970977783, "global_step": 59015, "epoch": 1405} {"train_loss": -6.048858642578125, "global_step": 59016, "epoch": 1405} {"train_loss": -5.6438751220703125, "global_step": 59017, "epoch": 1405} {"train_loss": -5.835760116577148, "global_step": 59018, "epoch": 1405} {"train_loss": -5.859959125518799, "global_step": 59019, "epoch": 1405} {"train_loss": -5.898233890533447, "global_step": 59020, "epoch": 1405} {"train_loss": -5.9964423179626465, "global_step": 59021, "epoch": 1405} {"train_loss": -5.861143589019775, "global_step": 59022, "epoch": 1405} {"train_loss": -5.89487886428833, "global_step": 59023, "epoch": 1405} {"train_loss": -5.934289932250977, "global_step": 59024, "epoch": 1405} {"train_loss": -5.905779838562012, "global_step": 59025, "epoch": 1405} {"train_loss": -5.865687370300293, "global_step": 59026, "epoch": 1405} {"train_loss": -5.792858600616455, "global_step": 59027, "epoch": 1405} {"train_loss": -5.78501558303833, "global_step": 59028, "epoch": 1405} {"train_loss": -5.856563568115234, "global_step": 59029, "epoch": 1405} {"train_loss": -5.795421123504639, "global_step": 59030, "epoch": 1405} {"train_loss": -5.936148643493652, "global_step": 59031, "epoch": 1405} {"train_loss": -5.880737781524658, "global_step": 59032, "epoch": 1405} {"train_loss": -5.819305419921875, "global_step": 59033, "epoch": 1405} {"train_loss": -5.812070846557617, "global_step": 59034, "epoch": 1405} {"train_loss": -5.750341415405273, "global_step": 59035, "epoch": 1405} {"train_loss": -5.970402717590332, "global_step": 59036, "epoch": 1405} {"train_loss": -5.852130889892578, "global_step": 59037, "epoch": 1405} {"train_loss": -5.764886856079102, "global_step": 59038, "epoch": 1405} {"train_loss": -5.728096008300781, "global_step": 59039, "epoch": 1405} {"train_loss": -5.838578224182129, "global_step": 59040, "epoch": 1405} {"train_loss": -5.907523155212402, "global_step": 59041, "epoch": 1405} {"train_loss": -5.752699851989746, "global_step": 59042, "epoch": 1405} {"train_loss": -5.89051628112793, "global_step": 59043, "epoch": 1405} {"train_loss": -5.826045036315918, "global_step": 59044, "epoch": 1405} {"train_loss": -5.862394332885742, "global_step": 59045, "epoch": 1405} {"train_loss": -5.8399858474731445, "global_step": 59046, "epoch": 1405} {"train_loss": -5.868257522583008, "global_step": 59047, "epoch": 1405} {"train_loss": -5.863735675811768, "global_step": 59048, "epoch": 1405} {"train_loss": -5.688631534576416, "global_step": 59049, "epoch": 1405} {"train_loss": -5.934106349945068, "global_step": 59050, "epoch": 1405} {"train_loss": -5.853097416105724, "global_step": 59051, "epoch": 1405, "val_loss": 74770.703125} {"train_loss": -5.707146644592285, "global_step": 59052, "epoch": 1406} {"train_loss": -5.865945339202881, "global_step": 59053, "epoch": 1406} {"train_loss": -5.86400032043457, "global_step": 59054, "epoch": 1406} {"train_loss": -5.787034511566162, "global_step": 59055, "epoch": 1406} {"train_loss": -5.987524032592773, "global_step": 59056, "epoch": 1406} {"train_loss": -5.847047805786133, "global_step": 59057, "epoch": 1406} {"train_loss": -5.935718536376953, "global_step": 59058, "epoch": 1406} {"train_loss": -5.83900260925293, "global_step": 59059, "epoch": 1406} {"train_loss": -5.9362616539001465, "global_step": 59060, "epoch": 1406} {"train_loss": -5.8708343505859375, "global_step": 59061, "epoch": 1406} {"train_loss": -5.921072006225586, "global_step": 59062, "epoch": 1406} {"train_loss": -6.029907703399658, "global_step": 59063, "epoch": 1406} {"train_loss": -5.785704612731934, "global_step": 59064, "epoch": 1406} {"train_loss": -5.825418472290039, "global_step": 59065, "epoch": 1406} {"train_loss": -5.84517765045166, "global_step": 59066, "epoch": 1406} {"train_loss": -5.946630477905273, "global_step": 59067, "epoch": 1406} {"train_loss": -5.833161354064941, "global_step": 59068, "epoch": 1406} {"train_loss": -5.852534294128418, "global_step": 59069, "epoch": 1406} {"train_loss": -5.766382694244385, "global_step": 59070, "epoch": 1406} {"train_loss": -5.814101219177246, "global_step": 59071, "epoch": 1406} {"train_loss": -5.896889686584473, "global_step": 59072, "epoch": 1406} {"train_loss": -5.77730655670166, "global_step": 59073, "epoch": 1406} {"train_loss": -5.763456344604492, "global_step": 59074, "epoch": 1406} {"train_loss": -5.741112232208252, "global_step": 59075, "epoch": 1406} {"train_loss": -5.8357696533203125, "global_step": 59076, "epoch": 1406} {"train_loss": -5.811890602111816, "global_step": 59077, "epoch": 1406} {"train_loss": -5.901548385620117, "global_step": 59078, "epoch": 1406} {"train_loss": -5.894415378570557, "global_step": 59079, "epoch": 1406} {"train_loss": -5.757884979248047, "global_step": 59080, "epoch": 1406} {"train_loss": -5.932604789733887, "global_step": 59081, "epoch": 1406} {"train_loss": -5.836695194244385, "global_step": 59082, "epoch": 1406} {"train_loss": -5.90277099609375, "global_step": 59083, "epoch": 1406} {"train_loss": -5.988358020782471, "global_step": 59084, "epoch": 1406} {"train_loss": -5.919432163238525, "global_step": 59085, "epoch": 1406} {"train_loss": -5.937359809875488, "global_step": 59086, "epoch": 1406} {"train_loss": -5.849676132202148, "global_step": 59087, "epoch": 1406} {"train_loss": -5.804602146148682, "global_step": 59088, "epoch": 1406} {"train_loss": -5.93014669418335, "global_step": 59089, "epoch": 1406} {"train_loss": -5.916299819946289, "global_step": 59090, "epoch": 1406} {"train_loss": -5.795808792114258, "global_step": 59091, "epoch": 1406} {"train_loss": -5.953935623168945, "global_step": 59092, "epoch": 1406} {"train_loss": -5.86492859749567, "global_step": 59093, "epoch": 1406, "val_loss": 74909.078125} {"train_loss": -5.59409236907959, "global_step": 59094, "epoch": 1407} {"train_loss": -5.9224066734313965, "global_step": 59095, "epoch": 1407} {"train_loss": -5.763068199157715, "global_step": 59096, "epoch": 1407} {"train_loss": -5.856494903564453, "global_step": 59097, "epoch": 1407} {"train_loss": -5.854330062866211, "global_step": 59098, "epoch": 1407} {"train_loss": -5.731115818023682, "global_step": 59099, "epoch": 1407} {"train_loss": -5.754171848297119, "global_step": 59100, "epoch": 1407} {"train_loss": -5.7468366622924805, "global_step": 59101, "epoch": 1407} {"train_loss": -5.912911415100098, "global_step": 59102, "epoch": 1407} {"train_loss": -5.806698799133301, "global_step": 59103, "epoch": 1407} {"train_loss": -5.911517143249512, "global_step": 59104, "epoch": 1407} {"train_loss": -5.7881598472595215, "global_step": 59105, "epoch": 1407} {"train_loss": -5.891608238220215, "global_step": 59106, "epoch": 1407} {"train_loss": -5.869792938232422, "global_step": 59107, "epoch": 1407} {"train_loss": -5.844931602478027, "global_step": 59108, "epoch": 1407} {"train_loss": -5.833132743835449, "global_step": 59109, "epoch": 1407} {"train_loss": -5.877222061157227, "global_step": 59110, "epoch": 1407} {"train_loss": -5.795418739318848, "global_step": 59111, "epoch": 1407} {"train_loss": -5.86726188659668, "global_step": 59112, "epoch": 1407} {"train_loss": -5.917281150817871, "global_step": 59113, "epoch": 1407} {"train_loss": -5.993814468383789, "global_step": 59114, "epoch": 1407} {"train_loss": -5.948277473449707, "global_step": 59115, "epoch": 1407} {"train_loss": -5.880654811859131, "global_step": 59116, "epoch": 1407} {"train_loss": -5.936805248260498, "global_step": 59117, "epoch": 1407} {"train_loss": -5.906615734100342, "global_step": 59118, "epoch": 1407} {"train_loss": -5.840287208557129, "global_step": 59119, "epoch": 1407} {"train_loss": -5.987574577331543, "global_step": 59120, "epoch": 1407} {"train_loss": -5.912176132202148, "global_step": 59121, "epoch": 1407} {"train_loss": -6.035665035247803, "global_step": 59122, "epoch": 1407} {"train_loss": -5.865504264831543, "global_step": 59123, "epoch": 1407} {"train_loss": -5.931504249572754, "global_step": 59124, "epoch": 1407} {"train_loss": -5.949182033538818, "global_step": 59125, "epoch": 1407} {"train_loss": -5.8175554275512695, "global_step": 59126, "epoch": 1407} {"train_loss": -5.89569091796875, "global_step": 59127, "epoch": 1407} {"train_loss": -5.938244819641113, "global_step": 59128, "epoch": 1407} {"train_loss": -5.856385231018066, "global_step": 59129, "epoch": 1407} {"train_loss": -5.998233795166016, "global_step": 59130, "epoch": 1407} {"train_loss": -5.800817489624023, "global_step": 59131, "epoch": 1407} {"train_loss": -5.937263488769531, "global_step": 59132, "epoch": 1407} {"train_loss": -5.984482765197754, "global_step": 59133, "epoch": 1407} {"train_loss": -5.765808582305908, "global_step": 59134, "epoch": 1407} {"train_loss": -5.870430060795376, "global_step": 59135, "epoch": 1407, "val_loss": 74512.4921875} {"train_loss": -5.951059818267822, "global_step": 59136, "epoch": 1408} {"train_loss": -5.863390922546387, "global_step": 59137, "epoch": 1408} {"train_loss": -5.950601577758789, "global_step": 59138, "epoch": 1408} {"train_loss": -5.978070259094238, "global_step": 59139, "epoch": 1408} {"train_loss": -5.680832386016846, "global_step": 59140, "epoch": 1408} {"train_loss": -5.83702278137207, "global_step": 59141, "epoch": 1408} {"train_loss": -5.922511577606201, "global_step": 59142, "epoch": 1408} {"train_loss": -5.961083889007568, "global_step": 59143, "epoch": 1408} {"train_loss": -6.01652717590332, "global_step": 59144, "epoch": 1408} {"train_loss": -5.851664066314697, "global_step": 59145, "epoch": 1408} {"train_loss": -5.8408966064453125, "global_step": 59146, "epoch": 1408} {"train_loss": -5.8603129386901855, "global_step": 59147, "epoch": 1408} {"train_loss": -5.987156867980957, "global_step": 59148, "epoch": 1408} {"train_loss": -5.948729991912842, "global_step": 59149, "epoch": 1408} {"train_loss": -5.8450469970703125, "global_step": 59150, "epoch": 1408} {"train_loss": -5.818118095397949, "global_step": 59151, "epoch": 1408} {"train_loss": -5.885561466217041, "global_step": 59152, "epoch": 1408} {"train_loss": -5.900526523590088, "global_step": 59153, "epoch": 1408} {"train_loss": -5.855860710144043, "global_step": 59154, "epoch": 1408} {"train_loss": -5.930994510650635, "global_step": 59155, "epoch": 1408} {"train_loss": -5.835716247558594, "global_step": 59156, "epoch": 1408} {"train_loss": -5.875931739807129, "global_step": 59157, "epoch": 1408} {"train_loss": -5.953616619110107, "global_step": 59158, "epoch": 1408} {"train_loss": -6.017168045043945, "global_step": 59159, "epoch": 1408} {"train_loss": -5.863802909851074, "global_step": 59160, "epoch": 1408} {"train_loss": -5.830772876739502, "global_step": 59161, "epoch": 1408} {"train_loss": -5.8549723625183105, "global_step": 59162, "epoch": 1408} {"train_loss": -5.828573226928711, "global_step": 59163, "epoch": 1408} {"train_loss": -5.843331336975098, "global_step": 59164, "epoch": 1408} {"train_loss": -5.974709510803223, "global_step": 59165, "epoch": 1408} {"train_loss": -5.89238166809082, "global_step": 59166, "epoch": 1408} {"train_loss": -5.85375452041626, "global_step": 59167, "epoch": 1408} {"train_loss": -5.782637596130371, "global_step": 59168, "epoch": 1408} {"train_loss": -5.949001312255859, "global_step": 59169, "epoch": 1408} {"train_loss": -5.848907470703125, "global_step": 59170, "epoch": 1408} {"train_loss": -5.97646427154541, "global_step": 59171, "epoch": 1408} {"train_loss": -5.796139717102051, "global_step": 59172, "epoch": 1408} {"train_loss": -5.9849090576171875, "global_step": 59173, "epoch": 1408} {"train_loss": -5.816303253173828, "global_step": 59174, "epoch": 1408} {"train_loss": -5.8612470626831055, "global_step": 59175, "epoch": 1408} {"train_loss": -5.882776737213135, "global_step": 59176, "epoch": 1408} {"train_loss": -5.888740653083438, "global_step": 59177, "epoch": 1408, "val_loss": 74266.734375} {"train_loss": -5.868407726287842, "global_step": 59178, "epoch": 1409} {"train_loss": -5.929237365722656, "global_step": 59179, "epoch": 1409} {"train_loss": -5.919109344482422, "global_step": 59180, "epoch": 1409} {"train_loss": -5.9063005447387695, "global_step": 59181, "epoch": 1409} {"train_loss": -5.782342910766602, "global_step": 59182, "epoch": 1409} {"train_loss": -6.023586273193359, "global_step": 59183, "epoch": 1409} {"train_loss": -5.910823345184326, "global_step": 59184, "epoch": 1409} {"train_loss": -5.957469940185547, "global_step": 59185, "epoch": 1409} {"train_loss": -5.898431777954102, "global_step": 59186, "epoch": 1409} {"train_loss": -5.920868873596191, "global_step": 59187, "epoch": 1409} {"train_loss": -5.765214920043945, "global_step": 59188, "epoch": 1409} {"train_loss": -5.945491313934326, "global_step": 59189, "epoch": 1409} {"train_loss": -5.963254928588867, "global_step": 59190, "epoch": 1409} {"train_loss": -5.904196262359619, "global_step": 59191, "epoch": 1409} {"train_loss": -5.915647029876709, "global_step": 59192, "epoch": 1409} {"train_loss": -5.954601287841797, "global_step": 59193, "epoch": 1409} {"train_loss": -5.899916172027588, "global_step": 59194, "epoch": 1409} {"train_loss": -5.9633588790893555, "global_step": 59195, "epoch": 1409} {"train_loss": -5.871209144592285, "global_step": 59196, "epoch": 1409} {"train_loss": -5.9730682373046875, "global_step": 59197, "epoch": 1409} {"train_loss": -5.849956035614014, "global_step": 59198, "epoch": 1409} {"train_loss": -5.888055801391602, "global_step": 59199, "epoch": 1409} {"train_loss": -5.849812030792236, "global_step": 59200, "epoch": 1409} {"train_loss": -5.873201370239258, "global_step": 59201, "epoch": 1409} {"train_loss": -5.828763008117676, "global_step": 59202, "epoch": 1409} {"train_loss": -5.847574234008789, "global_step": 59203, "epoch": 1409} {"train_loss": -5.899632453918457, "global_step": 59204, "epoch": 1409} {"train_loss": -5.854893684387207, "global_step": 59205, "epoch": 1409} {"train_loss": -5.809246063232422, "global_step": 59206, "epoch": 1409} {"train_loss": -5.854894638061523, "global_step": 59207, "epoch": 1409} {"train_loss": -5.785600662231445, "global_step": 59208, "epoch": 1409} {"train_loss": -5.770887851715088, "global_step": 59209, "epoch": 1409} {"train_loss": -5.838061809539795, "global_step": 59210, "epoch": 1409} {"train_loss": -5.774296760559082, "global_step": 59211, "epoch": 1409} {"train_loss": -5.805166244506836, "global_step": 59212, "epoch": 1409} {"train_loss": -5.851598262786865, "global_step": 59213, "epoch": 1409} {"train_loss": -5.865842819213867, "global_step": 59214, "epoch": 1409} {"train_loss": -5.904573440551758, "global_step": 59215, "epoch": 1409} {"train_loss": -5.954115867614746, "global_step": 59216, "epoch": 1409} {"train_loss": -5.907824993133545, "global_step": 59217, "epoch": 1409} {"train_loss": -6.01411771774292, "global_step": 59218, "epoch": 1409} {"train_loss": -5.883930739902315, "global_step": 59219, "epoch": 1409, "val_loss": 74582.5234375} {"train_loss": -5.874750137329102, "global_step": 59220, "epoch": 1410} {"train_loss": -5.834625720977783, "global_step": 59221, "epoch": 1410} {"train_loss": -5.820561408996582, "global_step": 59222, "epoch": 1410} {"train_loss": -5.862752914428711, "global_step": 59223, "epoch": 1410} {"train_loss": -5.797994613647461, "global_step": 59224, "epoch": 1410} {"train_loss": -5.966769695281982, "global_step": 59225, "epoch": 1410} {"train_loss": -5.818086624145508, "global_step": 59226, "epoch": 1410} {"train_loss": -5.9361042976379395, "global_step": 59227, "epoch": 1410} {"train_loss": -5.7091779708862305, "global_step": 59228, "epoch": 1410} {"train_loss": -5.803483963012695, "global_step": 59229, "epoch": 1410} {"train_loss": -5.901242256164551, "global_step": 59230, "epoch": 1410} {"train_loss": -5.790582180023193, "global_step": 59231, "epoch": 1410} {"train_loss": -5.873880386352539, "global_step": 59232, "epoch": 1410} {"train_loss": -5.82423210144043, "global_step": 59233, "epoch": 1410} {"train_loss": -5.896914958953857, "global_step": 59234, "epoch": 1410} {"train_loss": -5.9693450927734375, "global_step": 59235, "epoch": 1410} {"train_loss": -5.837525367736816, "global_step": 59236, "epoch": 1410} {"train_loss": -5.964663505554199, "global_step": 59237, "epoch": 1410} {"train_loss": -5.912991523742676, "global_step": 59238, "epoch": 1410} {"train_loss": -5.773848533630371, "global_step": 59239, "epoch": 1410} {"train_loss": -5.8317108154296875, "global_step": 59240, "epoch": 1410} {"train_loss": -5.909101486206055, "global_step": 59241, "epoch": 1410} {"train_loss": -5.9906721115112305, "global_step": 59242, "epoch": 1410} {"train_loss": -5.95775032043457, "global_step": 59243, "epoch": 1410} {"train_loss": -5.953310012817383, "global_step": 59244, "epoch": 1410} {"train_loss": -5.918890953063965, "global_step": 59245, "epoch": 1410} {"train_loss": -5.859750747680664, "global_step": 59246, "epoch": 1410} {"train_loss": -5.944081783294678, "global_step": 59247, "epoch": 1410} {"train_loss": -5.91268253326416, "global_step": 59248, "epoch": 1410} {"train_loss": -5.824368476867676, "global_step": 59249, "epoch": 1410} {"train_loss": -5.996984958648682, "global_step": 59250, "epoch": 1410} {"train_loss": -5.844958305358887, "global_step": 59251, "epoch": 1410} {"train_loss": -5.838378429412842, "global_step": 59252, "epoch": 1410} {"train_loss": -5.904114723205566, "global_step": 59253, "epoch": 1410} {"train_loss": -5.998391628265381, "global_step": 59254, "epoch": 1410} {"train_loss": -5.850790023803711, "global_step": 59255, "epoch": 1410} {"train_loss": -5.879515647888184, "global_step": 59256, "epoch": 1410} {"train_loss": -5.872200965881348, "global_step": 59257, "epoch": 1410} {"train_loss": -5.967083930969238, "global_step": 59258, "epoch": 1410} {"train_loss": -5.8863348960876465, "global_step": 59259, "epoch": 1410} {"train_loss": -5.83397102355957, "global_step": 59260, "epoch": 1410} {"train_loss": -5.8815692492893765, "global_step": 59261, "epoch": 1410, "val_loss": 74483.375} {"train_loss": -5.84615421295166, "global_step": 59262, "epoch": 1411} {"train_loss": -5.7590107917785645, "global_step": 59263, "epoch": 1411} {"train_loss": -5.955488681793213, "global_step": 59264, "epoch": 1411} {"train_loss": -5.893251419067383, "global_step": 59265, "epoch": 1411} {"train_loss": -5.920477867126465, "global_step": 59266, "epoch": 1411} {"train_loss": -5.863011360168457, "global_step": 59267, "epoch": 1411} {"train_loss": -6.061603546142578, "global_step": 59268, "epoch": 1411} {"train_loss": -5.857471466064453, "global_step": 59269, "epoch": 1411} {"train_loss": -5.954444408416748, "global_step": 59270, "epoch": 1411} {"train_loss": -5.880352020263672, "global_step": 59271, "epoch": 1411} {"train_loss": -5.969686031341553, "global_step": 59272, "epoch": 1411} {"train_loss": -5.843921661376953, "global_step": 59273, "epoch": 1411} {"train_loss": -5.919930934906006, "global_step": 59274, "epoch": 1411} {"train_loss": -5.994324684143066, "global_step": 59275, "epoch": 1411} {"train_loss": -5.836155414581299, "global_step": 59276, "epoch": 1411} {"train_loss": -5.7931952476501465, "global_step": 59277, "epoch": 1411} {"train_loss": -5.998625755310059, "global_step": 59278, "epoch": 1411} {"train_loss": -5.783634185791016, "global_step": 59279, "epoch": 1411} {"train_loss": -5.836936950683594, "global_step": 59280, "epoch": 1411} {"train_loss": -5.90274715423584, "global_step": 59281, "epoch": 1411} {"train_loss": -5.841038703918457, "global_step": 59282, "epoch": 1411} {"train_loss": -5.7747907638549805, "global_step": 59283, "epoch": 1411} {"train_loss": -5.921930313110352, "global_step": 59284, "epoch": 1411} {"train_loss": -5.873733997344971, "global_step": 59285, "epoch": 1411} {"train_loss": -5.917560577392578, "global_step": 59286, "epoch": 1411} {"train_loss": -5.936740398406982, "global_step": 59287, "epoch": 1411} {"train_loss": -5.941359519958496, "global_step": 59288, "epoch": 1411} {"train_loss": -5.9952616691589355, "global_step": 59289, "epoch": 1411} {"train_loss": -5.876398086547852, "global_step": 59290, "epoch": 1411} {"train_loss": -6.002931594848633, "global_step": 59291, "epoch": 1411} {"train_loss": -5.9070281982421875, "global_step": 59292, "epoch": 1411} {"train_loss": -5.937558174133301, "global_step": 59293, "epoch": 1411} {"train_loss": -5.85287618637085, "global_step": 59294, "epoch": 1411} {"train_loss": -5.863409996032715, "global_step": 59295, "epoch": 1411} {"train_loss": -5.906105041503906, "global_step": 59296, "epoch": 1411} {"train_loss": -6.014826774597168, "global_step": 59297, "epoch": 1411} {"train_loss": -5.823509693145752, "global_step": 59298, "epoch": 1411} {"train_loss": -5.87907600402832, "global_step": 59299, "epoch": 1411} {"train_loss": -5.839290618896484, "global_step": 59300, "epoch": 1411} {"train_loss": -5.844980716705322, "global_step": 59301, "epoch": 1411} {"train_loss": -5.980905532836914, "global_step": 59302, "epoch": 1411} {"train_loss": -5.89774014836266, "global_step": 59303, "epoch": 1411, "val_loss": 74330.15625} {"train_loss": -5.8784379959106445, "global_step": 59304, "epoch": 1412} {"train_loss": -5.929641246795654, "global_step": 59305, "epoch": 1412} {"train_loss": -5.9160051345825195, "global_step": 59306, "epoch": 1412} {"train_loss": -5.890041351318359, "global_step": 59307, "epoch": 1412} {"train_loss": -6.003810882568359, "global_step": 59308, "epoch": 1412} {"train_loss": -5.942924499511719, "global_step": 59309, "epoch": 1412} {"train_loss": -5.922802448272705, "global_step": 59310, "epoch": 1412} {"train_loss": -5.968372821807861, "global_step": 59311, "epoch": 1412} {"train_loss": -5.836352825164795, "global_step": 59312, "epoch": 1412} {"train_loss": -5.975662708282471, "global_step": 59313, "epoch": 1412} {"train_loss": -5.894444465637207, "global_step": 59314, "epoch": 1412} {"train_loss": -5.833952903747559, "global_step": 59315, "epoch": 1412} {"train_loss": -5.895687103271484, "global_step": 59316, "epoch": 1412} {"train_loss": -5.878674030303955, "global_step": 59317, "epoch": 1412} {"train_loss": -5.991957664489746, "global_step": 59318, "epoch": 1412} {"train_loss": -5.9354352951049805, "global_step": 59319, "epoch": 1412} {"train_loss": -5.837202072143555, "global_step": 59320, "epoch": 1412} {"train_loss": -5.821935176849365, "global_step": 59321, "epoch": 1412} {"train_loss": -5.993657112121582, "global_step": 59322, "epoch": 1412} {"train_loss": -5.9517502784729, "global_step": 59323, "epoch": 1412} {"train_loss": -5.934773921966553, "global_step": 59324, "epoch": 1412} {"train_loss": -5.847049713134766, "global_step": 59325, "epoch": 1412} {"train_loss": -5.968669891357422, "global_step": 59326, "epoch": 1412} {"train_loss": -5.980435848236084, "global_step": 59327, "epoch": 1412} {"train_loss": -5.97476863861084, "global_step": 59328, "epoch": 1412} {"train_loss": -5.932394981384277, "global_step": 59329, "epoch": 1412} {"train_loss": -5.92902946472168, "global_step": 59330, "epoch": 1412} {"train_loss": -5.838201522827148, "global_step": 59331, "epoch": 1412} {"train_loss": -5.829059600830078, "global_step": 59332, "epoch": 1412} {"train_loss": -5.826545715332031, "global_step": 59333, "epoch": 1412} {"train_loss": -5.904085159301758, "global_step": 59334, "epoch": 1412} {"train_loss": -5.839557647705078, "global_step": 59335, "epoch": 1412} {"train_loss": -5.822887420654297, "global_step": 59336, "epoch": 1412} {"train_loss": -5.970897197723389, "global_step": 59337, "epoch": 1412} {"train_loss": -5.971277236938477, "global_step": 59338, "epoch": 1412} {"train_loss": -5.994653224945068, "global_step": 59339, "epoch": 1412} {"train_loss": -5.877002716064453, "global_step": 59340, "epoch": 1412} {"train_loss": -5.859663963317871, "global_step": 59341, "epoch": 1412} {"train_loss": -5.916441917419434, "global_step": 59342, "epoch": 1412} {"train_loss": -5.846344947814941, "global_step": 59343, "epoch": 1412} {"train_loss": -5.827683925628662, "global_step": 59344, "epoch": 1412} {"train_loss": -5.9048787752787275, "global_step": 59345, "epoch": 1412, "val_loss": 74536.0703125} {"train_loss": -5.864549160003662, "global_step": 59346, "epoch": 1413} {"train_loss": -5.790824890136719, "global_step": 59347, "epoch": 1413} {"train_loss": -5.863869667053223, "global_step": 59348, "epoch": 1413} {"train_loss": -6.048248291015625, "global_step": 59349, "epoch": 1413} {"train_loss": -5.977946758270264, "global_step": 59350, "epoch": 1413} {"train_loss": -5.904847145080566, "global_step": 59351, "epoch": 1413} {"train_loss": -5.863503456115723, "global_step": 59352, "epoch": 1413} {"train_loss": -5.84068489074707, "global_step": 59353, "epoch": 1413} {"train_loss": -5.818007469177246, "global_step": 59354, "epoch": 1413} {"train_loss": -5.826981544494629, "global_step": 59355, "epoch": 1413} {"train_loss": -5.902338981628418, "global_step": 59356, "epoch": 1413} {"train_loss": -6.0015764236450195, "global_step": 59357, "epoch": 1413} {"train_loss": -5.966383934020996, "global_step": 59358, "epoch": 1413} {"train_loss": -5.939607620239258, "global_step": 59359, "epoch": 1413} {"train_loss": -5.924999237060547, "global_step": 59360, "epoch": 1413} {"train_loss": -5.906756401062012, "global_step": 59361, "epoch": 1413} {"train_loss": -5.809825420379639, "global_step": 59362, "epoch": 1413} {"train_loss": -5.925352096557617, "global_step": 59363, "epoch": 1413} {"train_loss": -5.886669158935547, "global_step": 59364, "epoch": 1413} {"train_loss": -5.878204822540283, "global_step": 59365, "epoch": 1413} {"train_loss": -5.953039169311523, "global_step": 59366, "epoch": 1413} {"train_loss": -5.81782341003418, "global_step": 59367, "epoch": 1413} {"train_loss": -5.877346992492676, "global_step": 59368, "epoch": 1413} {"train_loss": -5.839999198913574, "global_step": 59369, "epoch": 1413} {"train_loss": -5.85227632522583, "global_step": 59370, "epoch": 1413} {"train_loss": -5.863205909729004, "global_step": 59371, "epoch": 1413} {"train_loss": -5.88946533203125, "global_step": 59372, "epoch": 1413} {"train_loss": -5.824991226196289, "global_step": 59373, "epoch": 1413} {"train_loss": -5.85847282409668, "global_step": 59374, "epoch": 1413} {"train_loss": -5.939482688903809, "global_step": 59375, "epoch": 1413} {"train_loss": -5.917198181152344, "global_step": 59376, "epoch": 1413} {"train_loss": -5.9221696853637695, "global_step": 59377, "epoch": 1413} {"train_loss": -5.940633296966553, "global_step": 59378, "epoch": 1413} {"train_loss": -5.950282096862793, "global_step": 59379, "epoch": 1413} {"train_loss": -5.870910167694092, "global_step": 59380, "epoch": 1413} {"train_loss": -5.918961524963379, "global_step": 59381, "epoch": 1413} {"train_loss": -5.826903343200684, "global_step": 59382, "epoch": 1413} {"train_loss": -5.8528947830200195, "global_step": 59383, "epoch": 1413} {"train_loss": -5.975693702697754, "global_step": 59384, "epoch": 1413} {"train_loss": -5.804274559020996, "global_step": 59385, "epoch": 1413} {"train_loss": -5.940143585205078, "global_step": 59386, "epoch": 1413} {"train_loss": -5.891447725750151, "global_step": 59387, "epoch": 1413, "val_loss": 74211.234375} {"train_loss": -5.9259419441223145, "global_step": 59388, "epoch": 1414} {"train_loss": -5.965144157409668, "global_step": 59389, "epoch": 1414} {"train_loss": -5.697530269622803, "global_step": 59390, "epoch": 1414} {"train_loss": -5.889875888824463, "global_step": 59391, "epoch": 1414} {"train_loss": -5.811431884765625, "global_step": 59392, "epoch": 1414} {"train_loss": -5.873783111572266, "global_step": 59393, "epoch": 1414} {"train_loss": -5.924046516418457, "global_step": 59394, "epoch": 1414} {"train_loss": -5.856727600097656, "global_step": 59395, "epoch": 1414} {"train_loss": -5.9290266036987305, "global_step": 59396, "epoch": 1414} {"train_loss": -5.835735321044922, "global_step": 59397, "epoch": 1414} {"train_loss": -5.843231678009033, "global_step": 59398, "epoch": 1414} {"train_loss": -5.875469207763672, "global_step": 59399, "epoch": 1414} {"train_loss": -5.919466495513916, "global_step": 59400, "epoch": 1414} {"train_loss": -5.896409511566162, "global_step": 59401, "epoch": 1414} {"train_loss": -5.935410499572754, "global_step": 59402, "epoch": 1414} {"train_loss": -5.8631415367126465, "global_step": 59403, "epoch": 1414} {"train_loss": -5.782289505004883, "global_step": 59404, "epoch": 1414} {"train_loss": -5.914866924285889, "global_step": 59405, "epoch": 1414} {"train_loss": -5.9167046546936035, "global_step": 59406, "epoch": 1414} {"train_loss": -5.822463035583496, "global_step": 59407, "epoch": 1414} {"train_loss": -5.807026386260986, "global_step": 59408, "epoch": 1414} {"train_loss": -5.948116779327393, "global_step": 59409, "epoch": 1414} {"train_loss": -5.917046546936035, "global_step": 59410, "epoch": 1414} {"train_loss": -5.9407734870910645, "global_step": 59411, "epoch": 1414} {"train_loss": -5.993867874145508, "global_step": 59412, "epoch": 1414} {"train_loss": -5.864295482635498, "global_step": 59413, "epoch": 1414} {"train_loss": -5.893767356872559, "global_step": 59414, "epoch": 1414} {"train_loss": -5.884992599487305, "global_step": 59415, "epoch": 1414} {"train_loss": -5.951291084289551, "global_step": 59416, "epoch": 1414} {"train_loss": -6.0523681640625, "global_step": 59417, "epoch": 1414} {"train_loss": -5.883805274963379, "global_step": 59418, "epoch": 1414} {"train_loss": -5.858656883239746, "global_step": 59419, "epoch": 1414} {"train_loss": -5.750380516052246, "global_step": 59420, "epoch": 1414} {"train_loss": -5.969078063964844, "global_step": 59421, "epoch": 1414} {"train_loss": -5.823914527893066, "global_step": 59422, "epoch": 1414} {"train_loss": -5.766030311584473, "global_step": 59423, "epoch": 1414} {"train_loss": -5.893525123596191, "global_step": 59424, "epoch": 1414} {"train_loss": -5.90550422668457, "global_step": 59425, "epoch": 1414} {"train_loss": -5.776369094848633, "global_step": 59426, "epoch": 1414} {"train_loss": -5.848056793212891, "global_step": 59427, "epoch": 1414} {"train_loss": -5.8360466957092285, "global_step": 59428, "epoch": 1414} {"train_loss": -5.8764366990044, "global_step": 59429, "epoch": 1414, "val_loss": 74402.578125} {"train_loss": -5.870436191558838, "global_step": 59430, "epoch": 1415} {"train_loss": -5.776396751403809, "global_step": 59431, "epoch": 1415} {"train_loss": -5.871018409729004, "global_step": 59432, "epoch": 1415} {"train_loss": -5.872133255004883, "global_step": 59433, "epoch": 1415} {"train_loss": -5.851596832275391, "global_step": 59434, "epoch": 1415} {"train_loss": -5.922489166259766, "global_step": 59435, "epoch": 1415} {"train_loss": -5.896327972412109, "global_step": 59436, "epoch": 1415} {"train_loss": -5.90297269821167, "global_step": 59437, "epoch": 1415} {"train_loss": -5.898232460021973, "global_step": 59438, "epoch": 1415} {"train_loss": -5.779715538024902, "global_step": 59439, "epoch": 1415} {"train_loss": -5.863169193267822, "global_step": 59440, "epoch": 1415} {"train_loss": -5.833518981933594, "global_step": 59441, "epoch": 1415} {"train_loss": -5.8966755867004395, "global_step": 59442, "epoch": 1415} {"train_loss": -5.932394981384277, "global_step": 59443, "epoch": 1415} {"train_loss": -5.844456672668457, "global_step": 59444, "epoch": 1415} {"train_loss": -5.959440231323242, "global_step": 59445, "epoch": 1415} {"train_loss": -5.839803695678711, "global_step": 59446, "epoch": 1415} {"train_loss": -5.733561992645264, "global_step": 59447, "epoch": 1415} {"train_loss": -5.851711273193359, "global_step": 59448, "epoch": 1415} {"train_loss": -5.892541885375977, "global_step": 59449, "epoch": 1415} {"train_loss": -6.0344696044921875, "global_step": 59450, "epoch": 1415} {"train_loss": -5.794517993927002, "global_step": 59451, "epoch": 1415} {"train_loss": -5.803063869476318, "global_step": 59452, "epoch": 1415} {"train_loss": -5.994786262512207, "global_step": 59453, "epoch": 1415} {"train_loss": -5.775059223175049, "global_step": 59454, "epoch": 1415} {"train_loss": -5.86020565032959, "global_step": 59455, "epoch": 1415} {"train_loss": -5.882197856903076, "global_step": 59456, "epoch": 1415} {"train_loss": -5.691406726837158, "global_step": 59457, "epoch": 1415} {"train_loss": -5.968901634216309, "global_step": 59458, "epoch": 1415} {"train_loss": -5.862744331359863, "global_step": 59459, "epoch": 1415} {"train_loss": -5.890520095825195, "global_step": 59460, "epoch": 1415} {"train_loss": -5.9969000816345215, "global_step": 59461, "epoch": 1415} {"train_loss": -5.969029426574707, "global_step": 59462, "epoch": 1415} {"train_loss": -5.859531402587891, "global_step": 59463, "epoch": 1415} {"train_loss": -5.8568196296691895, "global_step": 59464, "epoch": 1415} {"train_loss": -5.898798942565918, "global_step": 59465, "epoch": 1415} {"train_loss": -5.926059722900391, "global_step": 59466, "epoch": 1415} {"train_loss": -5.89334774017334, "global_step": 59467, "epoch": 1415} {"train_loss": -5.860876083374023, "global_step": 59468, "epoch": 1415} {"train_loss": -5.902680397033691, "global_step": 59469, "epoch": 1415} {"train_loss": -5.837307929992676, "global_step": 59470, "epoch": 1415} {"train_loss": -5.875901665006365, "global_step": 59471, "epoch": 1415, "val_loss": 74609.0} {"train_loss": -5.882218360900879, "global_step": 59472, "epoch": 1416} {"train_loss": -5.9693603515625, "global_step": 59473, "epoch": 1416} {"train_loss": -5.958939075469971, "global_step": 59474, "epoch": 1416} {"train_loss": -5.9057769775390625, "global_step": 59475, "epoch": 1416} {"train_loss": -5.968811988830566, "global_step": 59476, "epoch": 1416} {"train_loss": -5.930820465087891, "global_step": 59477, "epoch": 1416} {"train_loss": -5.936770439147949, "global_step": 59478, "epoch": 1416} {"train_loss": -5.857100009918213, "global_step": 59479, "epoch": 1416} {"train_loss": -5.905472755432129, "global_step": 59480, "epoch": 1416} {"train_loss": -5.931492805480957, "global_step": 59481, "epoch": 1416} {"train_loss": -5.943289279937744, "global_step": 59482, "epoch": 1416} {"train_loss": -5.88789176940918, "global_step": 59483, "epoch": 1416} {"train_loss": -5.818912506103516, "global_step": 59484, "epoch": 1416} {"train_loss": -6.0612921714782715, "global_step": 59485, "epoch": 1416} {"train_loss": -5.810455322265625, "global_step": 59486, "epoch": 1416} {"train_loss": -5.922776222229004, "global_step": 59487, "epoch": 1416} {"train_loss": -5.900250434875488, "global_step": 59488, "epoch": 1416} {"train_loss": -6.008686542510986, "global_step": 59489, "epoch": 1416} {"train_loss": -5.834280014038086, "global_step": 59490, "epoch": 1416} {"train_loss": -5.943533420562744, "global_step": 59491, "epoch": 1416} {"train_loss": -5.919079780578613, "global_step": 59492, "epoch": 1416} {"train_loss": -5.984643459320068, "global_step": 59493, "epoch": 1416} {"train_loss": -5.915095329284668, "global_step": 59494, "epoch": 1416} {"train_loss": -5.91356086730957, "global_step": 59495, "epoch": 1416} {"train_loss": -5.9323296546936035, "global_step": 59496, "epoch": 1416} {"train_loss": -5.9908952713012695, "global_step": 59497, "epoch": 1416} {"train_loss": -5.9657182693481445, "global_step": 59498, "epoch": 1416} {"train_loss": -5.9630022048950195, "global_step": 59499, "epoch": 1416} {"train_loss": -5.972299575805664, "global_step": 59500, "epoch": 1416} {"train_loss": -5.861724853515625, "global_step": 59501, "epoch": 1416} {"train_loss": -5.910859107971191, "global_step": 59502, "epoch": 1416} {"train_loss": -5.843942642211914, "global_step": 59503, "epoch": 1416} {"train_loss": -5.901893615722656, "global_step": 59504, "epoch": 1416} {"train_loss": -5.876858711242676, "global_step": 59505, "epoch": 1416} {"train_loss": -5.8406982421875, "global_step": 59506, "epoch": 1416} {"train_loss": -5.779219627380371, "global_step": 59507, "epoch": 1416} {"train_loss": -5.959107398986816, "global_step": 59508, "epoch": 1416} {"train_loss": -5.840929985046387, "global_step": 59509, "epoch": 1416} {"train_loss": -5.769156455993652, "global_step": 59510, "epoch": 1416} {"train_loss": -5.783438205718994, "global_step": 59511, "epoch": 1416} {"train_loss": -5.85786247253418, "global_step": 59512, "epoch": 1416} {"train_loss": -5.903074514298212, "global_step": 59513, "epoch": 1416, "val_loss": 74455.3203125} {"train_loss": -5.855208396911621, "global_step": 59514, "epoch": 1417} {"train_loss": -5.810516834259033, "global_step": 59515, "epoch": 1417} {"train_loss": -5.917189598083496, "global_step": 59516, "epoch": 1417} {"train_loss": -5.9142961502075195, "global_step": 59517, "epoch": 1417} {"train_loss": -5.832222938537598, "global_step": 59518, "epoch": 1417} {"train_loss": -5.800309658050537, "global_step": 59519, "epoch": 1417} {"train_loss": -5.904531955718994, "global_step": 59520, "epoch": 1417} {"train_loss": -5.907994270324707, "global_step": 59521, "epoch": 1417} {"train_loss": -5.936609745025635, "global_step": 59522, "epoch": 1417} {"train_loss": -5.919679641723633, "global_step": 59523, "epoch": 1417} {"train_loss": -5.892195224761963, "global_step": 59524, "epoch": 1417} {"train_loss": -5.929327487945557, "global_step": 59525, "epoch": 1417} {"train_loss": -5.792621612548828, "global_step": 59526, "epoch": 1417} {"train_loss": -5.907578468322754, "global_step": 59527, "epoch": 1417} {"train_loss": -5.975473403930664, "global_step": 59528, "epoch": 1417} {"train_loss": -5.8982343673706055, "global_step": 59529, "epoch": 1417} {"train_loss": -5.756435394287109, "global_step": 59530, "epoch": 1417} {"train_loss": -5.864339828491211, "global_step": 59531, "epoch": 1417} {"train_loss": -5.789880752563477, "global_step": 59532, "epoch": 1417} {"train_loss": -5.688477039337158, "global_step": 59533, "epoch": 1417} {"train_loss": -6.020214080810547, "global_step": 59534, "epoch": 1417} {"train_loss": -5.712911605834961, "global_step": 59535, "epoch": 1417} {"train_loss": -5.851043701171875, "global_step": 59536, "epoch": 1417} {"train_loss": -5.893287658691406, "global_step": 59537, "epoch": 1417} {"train_loss": -5.899953365325928, "global_step": 59538, "epoch": 1417} {"train_loss": -5.993974685668945, "global_step": 59539, "epoch": 1417} {"train_loss": -5.850759506225586, "global_step": 59540, "epoch": 1417} {"train_loss": -5.781380653381348, "global_step": 59541, "epoch": 1417} {"train_loss": -5.892019271850586, "global_step": 59542, "epoch": 1417} {"train_loss": -5.8932390213012695, "global_step": 59543, "epoch": 1417} {"train_loss": -5.9100847244262695, "global_step": 59544, "epoch": 1417} {"train_loss": -5.9945831298828125, "global_step": 59545, "epoch": 1417} {"train_loss": -5.751836776733398, "global_step": 59546, "epoch": 1417} {"train_loss": -5.962454795837402, "global_step": 59547, "epoch": 1417} {"train_loss": -5.816969394683838, "global_step": 59548, "epoch": 1417} {"train_loss": -5.870643615722656, "global_step": 59549, "epoch": 1417} {"train_loss": -5.969686985015869, "global_step": 59550, "epoch": 1417} {"train_loss": -5.9402055740356445, "global_step": 59551, "epoch": 1417} {"train_loss": -5.9025983810424805, "global_step": 59552, "epoch": 1417} {"train_loss": -5.848193168640137, "global_step": 59553, "epoch": 1417} {"train_loss": -6.000701904296875, "global_step": 59554, "epoch": 1417} {"train_loss": -5.87688896769569, "global_step": 59555, "epoch": 1417, "val_loss": 74637.1484375} {"train_loss": -5.949678421020508, "global_step": 59556, "epoch": 1418} {"train_loss": -5.878325939178467, "global_step": 59557, "epoch": 1418} {"train_loss": -5.925264358520508, "global_step": 59558, "epoch": 1418} {"train_loss": -5.8540472984313965, "global_step": 59559, "epoch": 1418} {"train_loss": -5.959011077880859, "global_step": 59560, "epoch": 1418} {"train_loss": -6.030252933502197, "global_step": 59561, "epoch": 1418} {"train_loss": -6.0073041915893555, "global_step": 59562, "epoch": 1418} {"train_loss": -5.923901557922363, "global_step": 59563, "epoch": 1418} {"train_loss": -5.9771647453308105, "global_step": 59564, "epoch": 1418} {"train_loss": -5.935639381408691, "global_step": 59565, "epoch": 1418} {"train_loss": -5.889589786529541, "global_step": 59566, "epoch": 1418} {"train_loss": -5.922865390777588, "global_step": 59567, "epoch": 1418} {"train_loss": -6.048802375793457, "global_step": 59568, "epoch": 1418} {"train_loss": -5.918663024902344, "global_step": 59569, "epoch": 1418} {"train_loss": -5.945797443389893, "global_step": 59570, "epoch": 1418} {"train_loss": -5.863808631896973, "global_step": 59571, "epoch": 1418} {"train_loss": -5.845608711242676, "global_step": 59572, "epoch": 1418} {"train_loss": -5.828455924987793, "global_step": 59573, "epoch": 1418} {"train_loss": -5.9500813484191895, "global_step": 59574, "epoch": 1418} {"train_loss": -5.8796491622924805, "global_step": 59575, "epoch": 1418} {"train_loss": -5.88817024230957, "global_step": 59576, "epoch": 1418} {"train_loss": -5.914966583251953, "global_step": 59577, "epoch": 1418} {"train_loss": -5.924815654754639, "global_step": 59578, "epoch": 1418} {"train_loss": -5.916448593139648, "global_step": 59579, "epoch": 1418} {"train_loss": -5.882258415222168, "global_step": 59580, "epoch": 1418} {"train_loss": -5.916115760803223, "global_step": 59581, "epoch": 1418} {"train_loss": -5.9556498527526855, "global_step": 59582, "epoch": 1418} {"train_loss": -5.887854099273682, "global_step": 59583, "epoch": 1418} {"train_loss": -5.864068031311035, "global_step": 59584, "epoch": 1418} {"train_loss": -5.801878929138184, "global_step": 59585, "epoch": 1418} {"train_loss": -5.932644844055176, "global_step": 59586, "epoch": 1418} {"train_loss": -5.772834777832031, "global_step": 59587, "epoch": 1418} {"train_loss": -5.912886142730713, "global_step": 59588, "epoch": 1418} {"train_loss": -5.923686981201172, "global_step": 59589, "epoch": 1418} {"train_loss": -5.811580657958984, "global_step": 59590, "epoch": 1418} {"train_loss": -5.874568939208984, "global_step": 59591, "epoch": 1418} {"train_loss": -6.03543758392334, "global_step": 59592, "epoch": 1418} {"train_loss": -5.7398881912231445, "global_step": 59593, "epoch": 1418} {"train_loss": -5.8147077560424805, "global_step": 59594, "epoch": 1418} {"train_loss": -5.88555908203125, "global_step": 59595, "epoch": 1418} {"train_loss": -5.90435791015625, "global_step": 59596, "epoch": 1418} {"train_loss": -5.901836088725498, "global_step": 59597, "epoch": 1418, "val_loss": 74455.1328125} {"train_loss": -5.911653995513916, "global_step": 59598, "epoch": 1419} {"train_loss": -5.931980609893799, "global_step": 59599, "epoch": 1419} {"train_loss": -5.809395790100098, "global_step": 59600, "epoch": 1419} {"train_loss": -5.832282066345215, "global_step": 59601, "epoch": 1419} {"train_loss": -5.904728889465332, "global_step": 59602, "epoch": 1419} {"train_loss": -5.73013973236084, "global_step": 59603, "epoch": 1419} {"train_loss": -5.926016330718994, "global_step": 59604, "epoch": 1419} {"train_loss": -5.889677047729492, "global_step": 59605, "epoch": 1419} {"train_loss": -5.743488788604736, "global_step": 59606, "epoch": 1419} {"train_loss": -5.915532112121582, "global_step": 59607, "epoch": 1419} {"train_loss": -5.831818580627441, "global_step": 59608, "epoch": 1419} {"train_loss": -5.880989074707031, "global_step": 59609, "epoch": 1419} {"train_loss": -5.964948654174805, "global_step": 59610, "epoch": 1419} {"train_loss": -5.786050796508789, "global_step": 59611, "epoch": 1419} {"train_loss": -5.816560745239258, "global_step": 59612, "epoch": 1419} {"train_loss": -5.915436267852783, "global_step": 59613, "epoch": 1419} {"train_loss": -5.958253860473633, "global_step": 59614, "epoch": 1419} {"train_loss": -5.947260856628418, "global_step": 59615, "epoch": 1419} {"train_loss": -5.963921546936035, "global_step": 59616, "epoch": 1419} {"train_loss": -5.89141845703125, "global_step": 59617, "epoch": 1419} {"train_loss": -5.896778583526611, "global_step": 59618, "epoch": 1419} {"train_loss": -5.9505085945129395, "global_step": 59619, "epoch": 1419} {"train_loss": -6.029085159301758, "global_step": 59620, "epoch": 1419} {"train_loss": -5.971033096313477, "global_step": 59621, "epoch": 1419} {"train_loss": -5.909111022949219, "global_step": 59622, "epoch": 1419} {"train_loss": -5.863925933837891, "global_step": 59623, "epoch": 1419} {"train_loss": -5.916284561157227, "global_step": 59624, "epoch": 1419} {"train_loss": -5.840154647827148, "global_step": 59625, "epoch": 1419} {"train_loss": -5.9095635414123535, "global_step": 59626, "epoch": 1419} {"train_loss": -5.87194299697876, "global_step": 59627, "epoch": 1419} {"train_loss": -5.898221015930176, "global_step": 59628, "epoch": 1419} {"train_loss": -5.886273384094238, "global_step": 59629, "epoch": 1419} {"train_loss": -5.829932689666748, "global_step": 59630, "epoch": 1419} {"train_loss": -5.810715675354004, "global_step": 59631, "epoch": 1419} {"train_loss": -5.735394477844238, "global_step": 59632, "epoch": 1419} {"train_loss": -5.8448333740234375, "global_step": 59633, "epoch": 1419} {"train_loss": -5.709847927093506, "global_step": 59634, "epoch": 1419} {"train_loss": -5.773323059082031, "global_step": 59635, "epoch": 1419} {"train_loss": -5.856560230255127, "global_step": 59636, "epoch": 1419} {"train_loss": -5.988037586212158, "global_step": 59637, "epoch": 1419} {"train_loss": -5.8049468994140625, "global_step": 59638, "epoch": 1419} {"train_loss": -5.873992999394734, "global_step": 59639, "epoch": 1419, "val_loss": 74529.5234375} {"train_loss": -5.818547248840332, "global_step": 59640, "epoch": 1420} {"train_loss": -5.822588920593262, "global_step": 59641, "epoch": 1420} {"train_loss": -5.829239845275879, "global_step": 59642, "epoch": 1420} {"train_loss": -5.822571754455566, "global_step": 59643, "epoch": 1420} {"train_loss": -5.853428840637207, "global_step": 59644, "epoch": 1420} {"train_loss": -5.901782035827637, "global_step": 59645, "epoch": 1420} {"train_loss": -5.939713001251221, "global_step": 59646, "epoch": 1420} {"train_loss": -5.725543975830078, "global_step": 59647, "epoch": 1420} {"train_loss": -5.877945423126221, "global_step": 59648, "epoch": 1420} {"train_loss": -5.935681343078613, "global_step": 59649, "epoch": 1420} {"train_loss": -5.9785871505737305, "global_step": 59650, "epoch": 1420} {"train_loss": -5.906637191772461, "global_step": 59651, "epoch": 1420} {"train_loss": -5.898530006408691, "global_step": 59652, "epoch": 1420} {"train_loss": -5.917962551116943, "global_step": 59653, "epoch": 1420} {"train_loss": -5.8437604904174805, "global_step": 59654, "epoch": 1420} {"train_loss": -5.935112476348877, "global_step": 59655, "epoch": 1420} {"train_loss": -5.940374851226807, "global_step": 59656, "epoch": 1420} {"train_loss": -5.848769664764404, "global_step": 59657, "epoch": 1420} {"train_loss": -5.913691520690918, "global_step": 59658, "epoch": 1420} {"train_loss": -5.895667552947998, "global_step": 59659, "epoch": 1420} {"train_loss": -5.8452959060668945, "global_step": 59660, "epoch": 1420} {"train_loss": -5.831854820251465, "global_step": 59661, "epoch": 1420} {"train_loss": -5.990690231323242, "global_step": 59662, "epoch": 1420} {"train_loss": -5.779648780822754, "global_step": 59663, "epoch": 1420} {"train_loss": -5.882204055786133, "global_step": 59664, "epoch": 1420} {"train_loss": -5.7870941162109375, "global_step": 59665, "epoch": 1420} {"train_loss": -5.92779016494751, "global_step": 59666, "epoch": 1420} {"train_loss": -5.8518476486206055, "global_step": 59667, "epoch": 1420} {"train_loss": -5.794641494750977, "global_step": 59668, "epoch": 1420} {"train_loss": -5.814550399780273, "global_step": 59669, "epoch": 1420} {"train_loss": -5.882503509521484, "global_step": 59670, "epoch": 1420} {"train_loss": -5.93134880065918, "global_step": 59671, "epoch": 1420} {"train_loss": -5.780301094055176, "global_step": 59672, "epoch": 1420} {"train_loss": -5.859038352966309, "global_step": 59673, "epoch": 1420} {"train_loss": -5.930415153503418, "global_step": 59674, "epoch": 1420} {"train_loss": -5.879168510437012, "global_step": 59675, "epoch": 1420} {"train_loss": -5.955497741699219, "global_step": 59676, "epoch": 1420} {"train_loss": -5.831377983093262, "global_step": 59677, "epoch": 1420} {"train_loss": -5.949213027954102, "global_step": 59678, "epoch": 1420} {"train_loss": -5.919336318969727, "global_step": 59679, "epoch": 1420} {"train_loss": -5.79529333114624, "global_step": 59680, "epoch": 1420} {"train_loss": -5.872344017028809, "global_step": 59681, "epoch": 1420, "val_loss": 74747.1484375} {"train_loss": -5.81638765335083, "global_step": 59682, "epoch": 1421} {"train_loss": -5.935090065002441, "global_step": 59683, "epoch": 1421} {"train_loss": -5.863277912139893, "global_step": 59684, "epoch": 1421} {"train_loss": -5.892667293548584, "global_step": 59685, "epoch": 1421} {"train_loss": -5.881214141845703, "global_step": 59686, "epoch": 1421} {"train_loss": -5.836090087890625, "global_step": 59687, "epoch": 1421} {"train_loss": -5.867025375366211, "global_step": 59688, "epoch": 1421} {"train_loss": -5.806942462921143, "global_step": 59689, "epoch": 1421} {"train_loss": -5.8076887130737305, "global_step": 59690, "epoch": 1421} {"train_loss": -5.8379011154174805, "global_step": 59691, "epoch": 1421} {"train_loss": -5.889578342437744, "global_step": 59692, "epoch": 1421} {"train_loss": -5.86566162109375, "global_step": 59693, "epoch": 1421} {"train_loss": -5.8426713943481445, "global_step": 59694, "epoch": 1421} {"train_loss": -5.9217939376831055, "global_step": 59695, "epoch": 1421} {"train_loss": -5.953003406524658, "global_step": 59696, "epoch": 1421} {"train_loss": -5.9478302001953125, "global_step": 59697, "epoch": 1421} {"train_loss": -5.900810718536377, "global_step": 59698, "epoch": 1421} {"train_loss": -5.823083400726318, "global_step": 59699, "epoch": 1421} {"train_loss": -5.794660568237305, "global_step": 59700, "epoch": 1421} {"train_loss": -5.876349925994873, "global_step": 59701, "epoch": 1421} {"train_loss": -5.833193778991699, "global_step": 59702, "epoch": 1421} {"train_loss": -5.877074718475342, "global_step": 59703, "epoch": 1421} {"train_loss": -5.839540481567383, "global_step": 59704, "epoch": 1421} {"train_loss": -5.882290840148926, "global_step": 59705, "epoch": 1421} {"train_loss": -5.876772403717041, "global_step": 59706, "epoch": 1421} {"train_loss": -5.916441440582275, "global_step": 59707, "epoch": 1421} {"train_loss": -5.95304536819458, "global_step": 59708, "epoch": 1421} {"train_loss": -5.933128356933594, "global_step": 59709, "epoch": 1421} {"train_loss": -5.989921569824219, "global_step": 59710, "epoch": 1421} {"train_loss": -5.835010528564453, "global_step": 59711, "epoch": 1421} {"train_loss": -5.838919639587402, "global_step": 59712, "epoch": 1421} {"train_loss": -5.925279140472412, "global_step": 59713, "epoch": 1421} {"train_loss": -5.799455642700195, "global_step": 59714, "epoch": 1421} {"train_loss": -5.904401779174805, "global_step": 59715, "epoch": 1421} {"train_loss": -5.915386199951172, "global_step": 59716, "epoch": 1421} {"train_loss": -5.815788269042969, "global_step": 59717, "epoch": 1421} {"train_loss": -5.893008232116699, "global_step": 59718, "epoch": 1421} {"train_loss": -5.817334175109863, "global_step": 59719, "epoch": 1421} {"train_loss": -5.984532356262207, "global_step": 59720, "epoch": 1421} {"train_loss": -5.8731160163879395, "global_step": 59721, "epoch": 1421} {"train_loss": -5.861796855926514, "global_step": 59722, "epoch": 1421} {"train_loss": -5.876227708089919, "global_step": 59723, "epoch": 1421, "val_loss": 74373.0390625} {"train_loss": -5.8706865310668945, "global_step": 59724, "epoch": 1422} {"train_loss": -5.891141891479492, "global_step": 59725, "epoch": 1422} {"train_loss": -5.963010311126709, "global_step": 59726, "epoch": 1422} {"train_loss": -5.891138553619385, "global_step": 59727, "epoch": 1422} {"train_loss": -5.907325744628906, "global_step": 59728, "epoch": 1422} {"train_loss": -5.831129550933838, "global_step": 59729, "epoch": 1422} {"train_loss": -5.880131721496582, "global_step": 59730, "epoch": 1422} {"train_loss": -5.884300231933594, "global_step": 59731, "epoch": 1422} {"train_loss": -6.0080108642578125, "global_step": 59732, "epoch": 1422} {"train_loss": -5.8235063552856445, "global_step": 59733, "epoch": 1422} {"train_loss": -5.9142608642578125, "global_step": 59734, "epoch": 1422} {"train_loss": -5.898967742919922, "global_step": 59735, "epoch": 1422} {"train_loss": -5.874285697937012, "global_step": 59736, "epoch": 1422} {"train_loss": -5.9739580154418945, "global_step": 59737, "epoch": 1422} {"train_loss": -5.810158729553223, "global_step": 59738, "epoch": 1422} {"train_loss": -5.898754596710205, "global_step": 59739, "epoch": 1422} {"train_loss": -5.976181983947754, "global_step": 59740, "epoch": 1422} {"train_loss": -5.85765266418457, "global_step": 59741, "epoch": 1422} {"train_loss": -5.873815059661865, "global_step": 59742, "epoch": 1422} {"train_loss": -5.9344987869262695, "global_step": 59743, "epoch": 1422} {"train_loss": -5.92392635345459, "global_step": 59744, "epoch": 1422} {"train_loss": -5.910605430603027, "global_step": 59745, "epoch": 1422} {"train_loss": -5.978113651275635, "global_step": 59746, "epoch": 1422} {"train_loss": -5.911837577819824, "global_step": 59747, "epoch": 1422} {"train_loss": -5.9437255859375, "global_step": 59748, "epoch": 1422} {"train_loss": -5.868412017822266, "global_step": 59749, "epoch": 1422} {"train_loss": -5.902024269104004, "global_step": 59750, "epoch": 1422} {"train_loss": -5.876946449279785, "global_step": 59751, "epoch": 1422} {"train_loss": -5.90416145324707, "global_step": 59752, "epoch": 1422} {"train_loss": -5.902585506439209, "global_step": 59753, "epoch": 1422} {"train_loss": -5.938625812530518, "global_step": 59754, "epoch": 1422} {"train_loss": -6.028669357299805, "global_step": 59755, "epoch": 1422} {"train_loss": -5.981785774230957, "global_step": 59756, "epoch": 1422} {"train_loss": -5.8185834884643555, "global_step": 59757, "epoch": 1422} {"train_loss": -5.934653282165527, "global_step": 59758, "epoch": 1422} {"train_loss": -5.872381210327148, "global_step": 59759, "epoch": 1422} {"train_loss": -5.921785831451416, "global_step": 59760, "epoch": 1422} {"train_loss": -5.96112060546875, "global_step": 59761, "epoch": 1422} {"train_loss": -5.939909934997559, "global_step": 59762, "epoch": 1422} {"train_loss": -5.93503475189209, "global_step": 59763, "epoch": 1422} {"train_loss": -5.960818290710449, "global_step": 59764, "epoch": 1422} {"train_loss": -5.913578328632173, "global_step": 59765, "epoch": 1422, "val_loss": 74323.9609375} {"train_loss": -5.998306751251221, "global_step": 59766, "epoch": 1423} {"train_loss": -5.966148853302002, "global_step": 59767, "epoch": 1423} {"train_loss": -5.84587287902832, "global_step": 59768, "epoch": 1423} {"train_loss": -6.020456790924072, "global_step": 59769, "epoch": 1423} {"train_loss": -5.822181701660156, "global_step": 59770, "epoch": 1423} {"train_loss": -5.829434871673584, "global_step": 59771, "epoch": 1423} {"train_loss": -5.827445030212402, "global_step": 59772, "epoch": 1423} {"train_loss": -5.831900596618652, "global_step": 59773, "epoch": 1423} {"train_loss": -5.889493942260742, "global_step": 59774, "epoch": 1423} {"train_loss": -5.870950698852539, "global_step": 59775, "epoch": 1423} {"train_loss": -6.0392961502075195, "global_step": 59776, "epoch": 1423} {"train_loss": -5.8936028480529785, "global_step": 59777, "epoch": 1423} {"train_loss": -5.823342323303223, "global_step": 59778, "epoch": 1423} {"train_loss": -5.9014105796813965, "global_step": 59779, "epoch": 1423} {"train_loss": -5.827378273010254, "global_step": 59780, "epoch": 1423} {"train_loss": -6.00078010559082, "global_step": 59781, "epoch": 1423} {"train_loss": -5.9644269943237305, "global_step": 59782, "epoch": 1423} {"train_loss": -5.965582847595215, "global_step": 59783, "epoch": 1423} {"train_loss": -5.8949408531188965, "global_step": 59784, "epoch": 1423} {"train_loss": -5.8766937255859375, "global_step": 59785, "epoch": 1423} {"train_loss": -5.815160274505615, "global_step": 59786, "epoch": 1423} {"train_loss": -5.846490383148193, "global_step": 59787, "epoch": 1423} {"train_loss": -5.915124893188477, "global_step": 59788, "epoch": 1423} {"train_loss": -5.970460414886475, "global_step": 59789, "epoch": 1423} {"train_loss": -5.808021545410156, "global_step": 59790, "epoch": 1423} {"train_loss": -5.892103672027588, "global_step": 59791, "epoch": 1423} {"train_loss": -5.8955488204956055, "global_step": 59792, "epoch": 1423} {"train_loss": -5.922799110412598, "global_step": 59793, "epoch": 1423} {"train_loss": -5.933778285980225, "global_step": 59794, "epoch": 1423} {"train_loss": -5.900032997131348, "global_step": 59795, "epoch": 1423} {"train_loss": -5.879478454589844, "global_step": 59796, "epoch": 1423} {"train_loss": -5.803460597991943, "global_step": 59797, "epoch": 1423} {"train_loss": -5.742315769195557, "global_step": 59798, "epoch": 1423} {"train_loss": -5.782044887542725, "global_step": 59799, "epoch": 1423} {"train_loss": -5.852992057800293, "global_step": 59800, "epoch": 1423} {"train_loss": -5.891249656677246, "global_step": 59801, "epoch": 1423} {"train_loss": -5.850546836853027, "global_step": 59802, "epoch": 1423} {"train_loss": -5.937434196472168, "global_step": 59803, "epoch": 1423} {"train_loss": -5.801392555236816, "global_step": 59804, "epoch": 1423} {"train_loss": -5.850764274597168, "global_step": 59805, "epoch": 1423} {"train_loss": -5.759011268615723, "global_step": 59806, "epoch": 1423} {"train_loss": -5.88098026457287, "global_step": 59807, "epoch": 1423, "val_loss": 74254.234375} {"train_loss": -5.960904121398926, "global_step": 59808, "epoch": 1424} {"train_loss": -5.88355016708374, "global_step": 59809, "epoch": 1424} {"train_loss": -5.8857927322387695, "global_step": 59810, "epoch": 1424} {"train_loss": -5.8438920974731445, "global_step": 59811, "epoch": 1424} {"train_loss": -5.8344244956970215, "global_step": 59812, "epoch": 1424} {"train_loss": -5.9024577140808105, "global_step": 59813, "epoch": 1424} {"train_loss": -5.829504013061523, "global_step": 59814, "epoch": 1424} {"train_loss": -5.811208248138428, "global_step": 59815, "epoch": 1424} {"train_loss": -5.957813262939453, "global_step": 59816, "epoch": 1424} {"train_loss": -5.775238037109375, "global_step": 59817, "epoch": 1424} {"train_loss": -5.939871788024902, "global_step": 59818, "epoch": 1424} {"train_loss": -5.880904674530029, "global_step": 59819, "epoch": 1424} {"train_loss": -5.946284294128418, "global_step": 59820, "epoch": 1424} {"train_loss": -5.912590026855469, "global_step": 59821, "epoch": 1424} {"train_loss": -5.863397598266602, "global_step": 59822, "epoch": 1424} {"train_loss": -5.734816551208496, "global_step": 59823, "epoch": 1424} {"train_loss": -5.9222846031188965, "global_step": 59824, "epoch": 1424} {"train_loss": -5.981629371643066, "global_step": 59825, "epoch": 1424} {"train_loss": -5.967988967895508, "global_step": 59826, "epoch": 1424} {"train_loss": -5.862704277038574, "global_step": 59827, "epoch": 1424} {"train_loss": -5.976524353027344, "global_step": 59828, "epoch": 1424} {"train_loss": -6.090183734893799, "global_step": 59829, "epoch": 1424} {"train_loss": -5.934330940246582, "global_step": 59830, "epoch": 1424} {"train_loss": -6.012927055358887, "global_step": 59831, "epoch": 1424} {"train_loss": -5.95388650894165, "global_step": 59832, "epoch": 1424} {"train_loss": -5.831098556518555, "global_step": 59833, "epoch": 1424} {"train_loss": -5.985306739807129, "global_step": 59834, "epoch": 1424} {"train_loss": -5.835909843444824, "global_step": 59835, "epoch": 1424} {"train_loss": -5.913002014160156, "global_step": 59836, "epoch": 1424} {"train_loss": -5.873652935028076, "global_step": 59837, "epoch": 1424} {"train_loss": -5.913994789123535, "global_step": 59838, "epoch": 1424} {"train_loss": -5.8238067626953125, "global_step": 59839, "epoch": 1424} {"train_loss": -5.862894535064697, "global_step": 59840, "epoch": 1424} {"train_loss": -5.954450607299805, "global_step": 59841, "epoch": 1424} {"train_loss": -5.866045951843262, "global_step": 59842, "epoch": 1424} {"train_loss": -5.8319783210754395, "global_step": 59843, "epoch": 1424} {"train_loss": -5.725405693054199, "global_step": 59844, "epoch": 1424} {"train_loss": -5.955608367919922, "global_step": 59845, "epoch": 1424} {"train_loss": -5.8422136306762695, "global_step": 59846, "epoch": 1424} {"train_loss": -5.805895805358887, "global_step": 59847, "epoch": 1424} {"train_loss": -5.832359790802002, "global_step": 59848, "epoch": 1424} {"train_loss": -5.889843339011783, "global_step": 59849, "epoch": 1424, "val_loss": 74570.53125} {"train_loss": -5.96464729309082, "global_step": 59850, "epoch": 1425} {"train_loss": -5.924320220947266, "global_step": 59851, "epoch": 1425} {"train_loss": -5.897295951843262, "global_step": 59852, "epoch": 1425} {"train_loss": -5.889601707458496, "global_step": 59853, "epoch": 1425} {"train_loss": -6.049201965332031, "global_step": 59854, "epoch": 1425} {"train_loss": -5.7771830558776855, "global_step": 59855, "epoch": 1425} {"train_loss": -5.843502998352051, "global_step": 59856, "epoch": 1425} {"train_loss": -5.997743606567383, "global_step": 59857, "epoch": 1425} {"train_loss": -5.889400482177734, "global_step": 59858, "epoch": 1425} {"train_loss": -5.876005172729492, "global_step": 59859, "epoch": 1425} {"train_loss": -5.899599075317383, "global_step": 59860, "epoch": 1425} {"train_loss": -5.9008588790893555, "global_step": 59861, "epoch": 1425} {"train_loss": -5.895904064178467, "global_step": 59862, "epoch": 1425} {"train_loss": -5.8282470703125, "global_step": 59863, "epoch": 1425} {"train_loss": -5.918489456176758, "global_step": 59864, "epoch": 1425} {"train_loss": -5.95674991607666, "global_step": 59865, "epoch": 1425} {"train_loss": -5.96568489074707, "global_step": 59866, "epoch": 1425} {"train_loss": -5.866429328918457, "global_step": 59867, "epoch": 1425} {"train_loss": -5.9109272956848145, "global_step": 59868, "epoch": 1425} {"train_loss": -5.9270429611206055, "global_step": 59869, "epoch": 1425} {"train_loss": -5.927825927734375, "global_step": 59870, "epoch": 1425} {"train_loss": -5.860469818115234, "global_step": 59871, "epoch": 1425} {"train_loss": -5.967044353485107, "global_step": 59872, "epoch": 1425} {"train_loss": -5.876525402069092, "global_step": 59873, "epoch": 1425} {"train_loss": -5.974559307098389, "global_step": 59874, "epoch": 1425} {"train_loss": -5.897276401519775, "global_step": 59875, "epoch": 1425} {"train_loss": -5.991904258728027, "global_step": 59876, "epoch": 1425} {"train_loss": -5.85390043258667, "global_step": 59877, "epoch": 1425} {"train_loss": -5.895705223083496, "global_step": 59878, "epoch": 1425} {"train_loss": -5.952092170715332, "global_step": 59879, "epoch": 1425} {"train_loss": -5.955097198486328, "global_step": 59880, "epoch": 1425} {"train_loss": -5.846392631530762, "global_step": 59881, "epoch": 1425} {"train_loss": -5.925576210021973, "global_step": 59882, "epoch": 1425} {"train_loss": -5.785444736480713, "global_step": 59883, "epoch": 1425} {"train_loss": -5.919616222381592, "global_step": 59884, "epoch": 1425} {"train_loss": -5.780538558959961, "global_step": 59885, "epoch": 1425} {"train_loss": -5.908313274383545, "global_step": 59886, "epoch": 1425} {"train_loss": -5.880810737609863, "global_step": 59887, "epoch": 1425} {"train_loss": -5.924882411956787, "global_step": 59888, "epoch": 1425} {"train_loss": -5.777898788452148, "global_step": 59889, "epoch": 1425} {"train_loss": -5.971390724182129, "global_step": 59890, "epoch": 1425} {"train_loss": -5.90159737496149, "global_step": 59891, "epoch": 1425, "val_loss": 74368.0390625} {"train_loss": -5.902327537536621, "global_step": 59892, "epoch": 1426} {"train_loss": -5.7951860427856445, "global_step": 59893, "epoch": 1426} {"train_loss": -5.9080376625061035, "global_step": 59894, "epoch": 1426} {"train_loss": -5.971729755401611, "global_step": 59895, "epoch": 1426} {"train_loss": -5.913082599639893, "global_step": 59896, "epoch": 1426} {"train_loss": -5.896533012390137, "global_step": 59897, "epoch": 1426} {"train_loss": -5.9596638679504395, "global_step": 59898, "epoch": 1426} {"train_loss": -5.897757053375244, "global_step": 59899, "epoch": 1426} {"train_loss": -5.86353874206543, "global_step": 59900, "epoch": 1426} {"train_loss": -5.858592510223389, "global_step": 59901, "epoch": 1426} {"train_loss": -5.9181623458862305, "global_step": 59902, "epoch": 1426} {"train_loss": -5.857877731323242, "global_step": 59903, "epoch": 1426} {"train_loss": -5.810370445251465, "global_step": 59904, "epoch": 1426} {"train_loss": -5.825308799743652, "global_step": 59905, "epoch": 1426} {"train_loss": -5.698506832122803, "global_step": 59906, "epoch": 1426} {"train_loss": -5.978183746337891, "global_step": 59907, "epoch": 1426} {"train_loss": -5.886818885803223, "global_step": 59908, "epoch": 1426} {"train_loss": -5.874578475952148, "global_step": 59909, "epoch": 1426} {"train_loss": -5.86761474609375, "global_step": 59910, "epoch": 1426} {"train_loss": -5.9138336181640625, "global_step": 59911, "epoch": 1426} {"train_loss": -5.9513115882873535, "global_step": 59912, "epoch": 1426} {"train_loss": -5.882576942443848, "global_step": 59913, "epoch": 1426} {"train_loss": -5.910721778869629, "global_step": 59914, "epoch": 1426} {"train_loss": -5.897175312042236, "global_step": 59915, "epoch": 1426} {"train_loss": -5.792545795440674, "global_step": 59916, "epoch": 1426} {"train_loss": -5.862998008728027, "global_step": 59917, "epoch": 1426} {"train_loss": -5.950948715209961, "global_step": 59918, "epoch": 1426} {"train_loss": -5.987168312072754, "global_step": 59919, "epoch": 1426} {"train_loss": -6.070024013519287, "global_step": 59920, "epoch": 1426} {"train_loss": -5.885581970214844, "global_step": 59921, "epoch": 1426} {"train_loss": -5.9180803298950195, "global_step": 59922, "epoch": 1426} {"train_loss": -5.945927619934082, "global_step": 59923, "epoch": 1426} {"train_loss": -6.017910003662109, "global_step": 59924, "epoch": 1426} {"train_loss": -5.935122489929199, "global_step": 59925, "epoch": 1426} {"train_loss": -5.976524353027344, "global_step": 59926, "epoch": 1426} {"train_loss": -5.9387102127075195, "global_step": 59927, "epoch": 1426} {"train_loss": -5.924470901489258, "global_step": 59928, "epoch": 1426} {"train_loss": -5.988770484924316, "global_step": 59929, "epoch": 1426} {"train_loss": -5.840792655944824, "global_step": 59930, "epoch": 1426} {"train_loss": -5.912646770477295, "global_step": 59931, "epoch": 1426} {"train_loss": -5.999607086181641, "global_step": 59932, "epoch": 1426} {"train_loss": -5.908703826722645, "global_step": 59933, "epoch": 1426, "val_loss": 74401.7421875} {"train_loss": -5.967226982116699, "global_step": 59934, "epoch": 1427} {"train_loss": -5.9885101318359375, "global_step": 59935, "epoch": 1427} {"train_loss": -6.016831398010254, "global_step": 59936, "epoch": 1427} {"train_loss": -6.017819404602051, "global_step": 59937, "epoch": 1427} {"train_loss": -5.941557884216309, "global_step": 59938, "epoch": 1427} {"train_loss": -5.8448486328125, "global_step": 59939, "epoch": 1427} {"train_loss": -5.8862199783325195, "global_step": 59940, "epoch": 1427} {"train_loss": -5.975931167602539, "global_step": 59941, "epoch": 1427} {"train_loss": -5.8003926277160645, "global_step": 59942, "epoch": 1427} {"train_loss": -5.86866569519043, "global_step": 59943, "epoch": 1427} {"train_loss": -5.79771614074707, "global_step": 59944, "epoch": 1427} {"train_loss": -5.7716145515441895, "global_step": 59945, "epoch": 1427} {"train_loss": -5.939341068267822, "global_step": 59946, "epoch": 1427} {"train_loss": -5.745649337768555, "global_step": 59947, "epoch": 1427} {"train_loss": -5.834346771240234, "global_step": 59948, "epoch": 1427} {"train_loss": -5.944838047027588, "global_step": 59949, "epoch": 1427} {"train_loss": -5.751368522644043, "global_step": 59950, "epoch": 1427} {"train_loss": -5.948144912719727, "global_step": 59951, "epoch": 1427} {"train_loss": -5.968662738800049, "global_step": 59952, "epoch": 1427} {"train_loss": -5.893294334411621, "global_step": 59953, "epoch": 1427} {"train_loss": -5.885310173034668, "global_step": 59954, "epoch": 1427} {"train_loss": -5.802469253540039, "global_step": 59955, "epoch": 1427} {"train_loss": -6.0388712882995605, "global_step": 59956, "epoch": 1427} {"train_loss": -5.856210708618164, "global_step": 59957, "epoch": 1427} {"train_loss": -5.913238525390625, "global_step": 59958, "epoch": 1427} {"train_loss": -5.876908302307129, "global_step": 59959, "epoch": 1427} {"train_loss": -5.828420162200928, "global_step": 59960, "epoch": 1427} {"train_loss": -5.844822883605957, "global_step": 59961, "epoch": 1427} {"train_loss": -5.8856048583984375, "global_step": 59962, "epoch": 1427} {"train_loss": -5.943061828613281, "global_step": 59963, "epoch": 1427} {"train_loss": -5.8497395515441895, "global_step": 59964, "epoch": 1427} {"train_loss": -5.895016670227051, "global_step": 59965, "epoch": 1427} {"train_loss": -5.825884819030762, "global_step": 59966, "epoch": 1427} {"train_loss": -5.902139186859131, "global_step": 59967, "epoch": 1427} {"train_loss": -5.875694274902344, "global_step": 59968, "epoch": 1427} {"train_loss": -5.875820636749268, "global_step": 59969, "epoch": 1427} {"train_loss": -6.012913227081299, "global_step": 59970, "epoch": 1427} {"train_loss": -5.861073970794678, "global_step": 59971, "epoch": 1427} {"train_loss": -6.014891147613525, "global_step": 59972, "epoch": 1427} {"train_loss": -5.916113376617432, "global_step": 59973, "epoch": 1427} {"train_loss": -5.912040710449219, "global_step": 59974, "epoch": 1427} {"train_loss": -5.89414584069025, "global_step": 59975, "epoch": 1427, "val_loss": 74161.671875} {"train_loss": -5.863624095916748, "global_step": 59976, "epoch": 1428} {"train_loss": -5.911941051483154, "global_step": 59977, "epoch": 1428} {"train_loss": -5.773760795593262, "global_step": 59978, "epoch": 1428} {"train_loss": -5.8859405517578125, "global_step": 59979, "epoch": 1428} {"train_loss": -5.767307758331299, "global_step": 59980, "epoch": 1428} {"train_loss": -5.83159875869751, "global_step": 59981, "epoch": 1428} {"train_loss": -5.915387153625488, "global_step": 59982, "epoch": 1428} {"train_loss": -5.789811134338379, "global_step": 59983, "epoch": 1428} {"train_loss": -5.87172794342041, "global_step": 59984, "epoch": 1428} {"train_loss": -5.869095802307129, "global_step": 59985, "epoch": 1428} {"train_loss": -5.847869873046875, "global_step": 59986, "epoch": 1428} {"train_loss": -5.907588005065918, "global_step": 59987, "epoch": 1428} {"train_loss": -5.9047722816467285, "global_step": 59988, "epoch": 1428} {"train_loss": -5.955216407775879, "global_step": 59989, "epoch": 1428} {"train_loss": -5.990556716918945, "global_step": 59990, "epoch": 1428} {"train_loss": -5.88385009765625, "global_step": 59991, "epoch": 1428} {"train_loss": -5.878891468048096, "global_step": 59992, "epoch": 1428} {"train_loss": -5.778933048248291, "global_step": 59993, "epoch": 1428} {"train_loss": -5.880359649658203, "global_step": 59994, "epoch": 1428} {"train_loss": -5.810596466064453, "global_step": 59995, "epoch": 1428} {"train_loss": -5.8100690841674805, "global_step": 59996, "epoch": 1428} {"train_loss": -5.762688636779785, "global_step": 59997, "epoch": 1428} {"train_loss": -5.874447822570801, "global_step": 59998, "epoch": 1428} {"train_loss": -5.871798038482666, "global_step": 59999, "epoch": 1428} {"train_loss": -5.955913066864014, "global_step": 60000, "epoch": 1428} {"train_loss": -5.867027282714844, "global_step": 60001, "epoch": 1428} {"train_loss": -5.839809894561768, "global_step": 60002, "epoch": 1428} {"train_loss": -5.795504570007324, "global_step": 60003, "epoch": 1428} {"train_loss": -5.803056240081787, "global_step": 60004, "epoch": 1428} {"train_loss": -5.901858329772949, "global_step": 60005, "epoch": 1428} {"train_loss": -5.907626628875732, "global_step": 60006, "epoch": 1428} {"train_loss": -5.90771484375, "global_step": 60007, "epoch": 1428} {"train_loss": -5.831578731536865, "global_step": 60008, "epoch": 1428} {"train_loss": -5.864997863769531, "global_step": 60009, "epoch": 1428} {"train_loss": -5.911978721618652, "global_step": 60010, "epoch": 1428} {"train_loss": -5.806414604187012, "global_step": 60011, "epoch": 1428} {"train_loss": -5.798089504241943, "global_step": 60012, "epoch": 1428} {"train_loss": -5.959564208984375, "global_step": 60013, "epoch": 1428} {"train_loss": -5.856823444366455, "global_step": 60014, "epoch": 1428} {"train_loss": -5.931246280670166, "global_step": 60015, "epoch": 1428} {"train_loss": -5.812459468841553, "global_step": 60016, "epoch": 1428} {"train_loss": -5.86025443531218, "global_step": 60017, "epoch": 1428, "val_loss": 74583.828125} {"train_loss": -5.8553466796875, "global_step": 60018, "epoch": 1429} {"train_loss": -5.891158580780029, "global_step": 60019, "epoch": 1429} {"train_loss": -5.884273052215576, "global_step": 60020, "epoch": 1429} {"train_loss": -5.768393516540527, "global_step": 60021, "epoch": 1429} {"train_loss": -5.788232803344727, "global_step": 60022, "epoch": 1429} {"train_loss": -5.81074857711792, "global_step": 60023, "epoch": 1429} {"train_loss": -5.930018424987793, "global_step": 60024, "epoch": 1429} {"train_loss": -5.873568534851074, "global_step": 60025, "epoch": 1429} {"train_loss": -5.699751853942871, "global_step": 60026, "epoch": 1429} {"train_loss": -5.856529712677002, "global_step": 60027, "epoch": 1429} {"train_loss": -5.918627738952637, "global_step": 60028, "epoch": 1429} {"train_loss": -5.920143127441406, "global_step": 60029, "epoch": 1429} {"train_loss": -5.866425037384033, "global_step": 60030, "epoch": 1429} {"train_loss": -5.865635871887207, "global_step": 60031, "epoch": 1429} {"train_loss": -5.898021697998047, "global_step": 60032, "epoch": 1429} {"train_loss": -5.894582748413086, "global_step": 60033, "epoch": 1429} {"train_loss": -5.919279098510742, "global_step": 60034, "epoch": 1429} {"train_loss": -6.001913547515869, "global_step": 60035, "epoch": 1429} {"train_loss": -5.849788188934326, "global_step": 60036, "epoch": 1429} {"train_loss": -5.901844024658203, "global_step": 60037, "epoch": 1429} {"train_loss": -5.909686088562012, "global_step": 60038, "epoch": 1429} {"train_loss": -5.842893123626709, "global_step": 60039, "epoch": 1429} {"train_loss": -5.937034606933594, "global_step": 60040, "epoch": 1429} {"train_loss": -5.960755348205566, "global_step": 60041, "epoch": 1429} {"train_loss": -5.784204483032227, "global_step": 60042, "epoch": 1429} {"train_loss": -5.882728576660156, "global_step": 60043, "epoch": 1429} {"train_loss": -5.873229503631592, "global_step": 60044, "epoch": 1429} {"train_loss": -5.758092880249023, "global_step": 60045, "epoch": 1429} {"train_loss": -6.01395845413208, "global_step": 60046, "epoch": 1429} {"train_loss": -5.910064697265625, "global_step": 60047, "epoch": 1429} {"train_loss": -5.915988922119141, "global_step": 60048, "epoch": 1429} {"train_loss": -5.877695083618164, "global_step": 60049, "epoch": 1429} {"train_loss": -5.951184272766113, "global_step": 60050, "epoch": 1429} {"train_loss": -5.918302536010742, "global_step": 60051, "epoch": 1429} {"train_loss": -6.0140275955200195, "global_step": 60052, "epoch": 1429} {"train_loss": -5.7436747550964355, "global_step": 60053, "epoch": 1429} {"train_loss": -5.8174052238464355, "global_step": 60054, "epoch": 1429} {"train_loss": -5.894625186920166, "global_step": 60055, "epoch": 1429} {"train_loss": -5.853912353515625, "global_step": 60056, "epoch": 1429} {"train_loss": -5.797842979431152, "global_step": 60057, "epoch": 1429} {"train_loss": -5.861374378204346, "global_step": 60058, "epoch": 1429} {"train_loss": -5.873088564191546, "global_step": 60059, "epoch": 1429, "val_loss": 74256.2109375} {"train_loss": -5.985039710998535, "global_step": 60060, "epoch": 1430} {"train_loss": -5.870457649230957, "global_step": 60061, "epoch": 1430} {"train_loss": -5.831482410430908, "global_step": 60062, "epoch": 1430} {"train_loss": -5.9231109619140625, "global_step": 60063, "epoch": 1430} {"train_loss": -5.9439616203308105, "global_step": 60064, "epoch": 1430} {"train_loss": -6.058380126953125, "global_step": 60065, "epoch": 1430} {"train_loss": -5.793641567230225, "global_step": 60066, "epoch": 1430} {"train_loss": -5.843544960021973, "global_step": 60067, "epoch": 1430} {"train_loss": -5.985302925109863, "global_step": 60068, "epoch": 1430} {"train_loss": -5.931336402893066, "global_step": 60069, "epoch": 1430} {"train_loss": -5.894094467163086, "global_step": 60070, "epoch": 1430} {"train_loss": -5.778345108032227, "global_step": 60071, "epoch": 1430} {"train_loss": -5.898100852966309, "global_step": 60072, "epoch": 1430} {"train_loss": -5.904020309448242, "global_step": 60073, "epoch": 1430} {"train_loss": -5.979019641876221, "global_step": 60074, "epoch": 1430} {"train_loss": -5.988482475280762, "global_step": 60075, "epoch": 1430} {"train_loss": -5.82288122177124, "global_step": 60076, "epoch": 1430} {"train_loss": -5.833038330078125, "global_step": 60077, "epoch": 1430} {"train_loss": -5.762612342834473, "global_step": 60078, "epoch": 1430} {"train_loss": -5.832903861999512, "global_step": 60079, "epoch": 1430} {"train_loss": -5.9696044921875, "global_step": 60080, "epoch": 1430} {"train_loss": -5.826887607574463, "global_step": 60081, "epoch": 1430} {"train_loss": -5.7926225662231445, "global_step": 60082, "epoch": 1430} {"train_loss": -5.939508438110352, "global_step": 60083, "epoch": 1430} {"train_loss": -5.620016098022461, "global_step": 60084, "epoch": 1430} {"train_loss": -5.85308837890625, "global_step": 60085, "epoch": 1430} {"train_loss": -5.816122531890869, "global_step": 60086, "epoch": 1430} {"train_loss": -5.8746232986450195, "global_step": 60087, "epoch": 1430} {"train_loss": -5.934346675872803, "global_step": 60088, "epoch": 1430} {"train_loss": -5.903074264526367, "global_step": 60089, "epoch": 1430} {"train_loss": -5.887472629547119, "global_step": 60090, "epoch": 1430} {"train_loss": -5.852086544036865, "global_step": 60091, "epoch": 1430} {"train_loss": -5.848676681518555, "global_step": 60092, "epoch": 1430} {"train_loss": -5.946234703063965, "global_step": 60093, "epoch": 1430} {"train_loss": -5.758513927459717, "global_step": 60094, "epoch": 1430} {"train_loss": -5.887145042419434, "global_step": 60095, "epoch": 1430} {"train_loss": -5.896933555603027, "global_step": 60096, "epoch": 1430} {"train_loss": -5.989103317260742, "global_step": 60097, "epoch": 1430} {"train_loss": -5.855280876159668, "global_step": 60098, "epoch": 1430} {"train_loss": -5.931175231933594, "global_step": 60099, "epoch": 1430} {"train_loss": -5.858691215515137, "global_step": 60100, "epoch": 1430} {"train_loss": -5.879690272467477, "global_step": 60101, "epoch": 1430, "val_loss": 74551.375} {"train_loss": -5.8467607498168945, "global_step": 60102, "epoch": 1431} {"train_loss": -5.928293228149414, "global_step": 60103, "epoch": 1431} {"train_loss": -6.124053001403809, "global_step": 60104, "epoch": 1431} {"train_loss": -5.9782915115356445, "global_step": 60105, "epoch": 1431} {"train_loss": -5.889582633972168, "global_step": 60106, "epoch": 1431} {"train_loss": -5.8681206703186035, "global_step": 60107, "epoch": 1431} {"train_loss": -5.919119834899902, "global_step": 60108, "epoch": 1431} {"train_loss": -5.9530158042907715, "global_step": 60109, "epoch": 1431} {"train_loss": -5.985973358154297, "global_step": 60110, "epoch": 1431} {"train_loss": -5.775022506713867, "global_step": 60111, "epoch": 1431} {"train_loss": -5.957908630371094, "global_step": 60112, "epoch": 1431} {"train_loss": -5.899889945983887, "global_step": 60113, "epoch": 1431} {"train_loss": -5.848667621612549, "global_step": 60114, "epoch": 1431} {"train_loss": -5.891234874725342, "global_step": 60115, "epoch": 1431} {"train_loss": -5.829530715942383, "global_step": 60116, "epoch": 1431} {"train_loss": -5.912863731384277, "global_step": 60117, "epoch": 1431} {"train_loss": -5.899801254272461, "global_step": 60118, "epoch": 1431} {"train_loss": -5.835743427276611, "global_step": 60119, "epoch": 1431} {"train_loss": -5.86588191986084, "global_step": 60120, "epoch": 1431} {"train_loss": -5.896956443786621, "global_step": 60121, "epoch": 1431} {"train_loss": -5.9341888427734375, "global_step": 60122, "epoch": 1431} {"train_loss": -5.99255895614624, "global_step": 60123, "epoch": 1431} {"train_loss": -5.894524097442627, "global_step": 60124, "epoch": 1431} {"train_loss": -5.969951629638672, "global_step": 60125, "epoch": 1431} {"train_loss": -5.949245452880859, "global_step": 60126, "epoch": 1431} {"train_loss": -5.948307991027832, "global_step": 60127, "epoch": 1431} {"train_loss": -5.807991027832031, "global_step": 60128, "epoch": 1431} {"train_loss": -5.9415082931518555, "global_step": 60129, "epoch": 1431} {"train_loss": -5.838274002075195, "global_step": 60130, "epoch": 1431} {"train_loss": -5.958581447601318, "global_step": 60131, "epoch": 1431} {"train_loss": -5.931368350982666, "global_step": 60132, "epoch": 1431} {"train_loss": -5.90248966217041, "global_step": 60133, "epoch": 1431} {"train_loss": -5.74123477935791, "global_step": 60134, "epoch": 1431} {"train_loss": -5.801751136779785, "global_step": 60135, "epoch": 1431} {"train_loss": -5.839635372161865, "global_step": 60136, "epoch": 1431} {"train_loss": -5.930972099304199, "global_step": 60137, "epoch": 1431} {"train_loss": -5.920401573181152, "global_step": 60138, "epoch": 1431} {"train_loss": -5.817610263824463, "global_step": 60139, "epoch": 1431} {"train_loss": -6.053625583648682, "global_step": 60140, "epoch": 1431} {"train_loss": -5.899542331695557, "global_step": 60141, "epoch": 1431} {"train_loss": -5.996047019958496, "global_step": 60142, "epoch": 1431} {"train_loss": -5.908491679600307, "global_step": 60143, "epoch": 1431, "val_loss": 74309.7578125} {"train_loss": -5.823403358459473, "global_step": 60144, "epoch": 1432} {"train_loss": -5.937453269958496, "global_step": 60145, "epoch": 1432} {"train_loss": -6.031428813934326, "global_step": 60146, "epoch": 1432} {"train_loss": -5.974905490875244, "global_step": 60147, "epoch": 1432} {"train_loss": -5.750221252441406, "global_step": 60148, "epoch": 1432} {"train_loss": -5.901118755340576, "global_step": 60149, "epoch": 1432} {"train_loss": -5.819581031799316, "global_step": 60150, "epoch": 1432} {"train_loss": -5.885639190673828, "global_step": 60151, "epoch": 1432} {"train_loss": -5.850303649902344, "global_step": 60152, "epoch": 1432} {"train_loss": -5.882098197937012, "global_step": 60153, "epoch": 1432} {"train_loss": -5.926143646240234, "global_step": 60154, "epoch": 1432} {"train_loss": -5.93914794921875, "global_step": 60155, "epoch": 1432} {"train_loss": -5.771440505981445, "global_step": 60156, "epoch": 1432} {"train_loss": -5.870208740234375, "global_step": 60157, "epoch": 1432} {"train_loss": -5.9051079750061035, "global_step": 60158, "epoch": 1432} {"train_loss": -5.833957672119141, "global_step": 60159, "epoch": 1432} {"train_loss": -5.826935768127441, "global_step": 60160, "epoch": 1432} {"train_loss": -5.969555854797363, "global_step": 60161, "epoch": 1432} {"train_loss": -5.735955715179443, "global_step": 60162, "epoch": 1432} {"train_loss": -5.882920265197754, "global_step": 60163, "epoch": 1432} {"train_loss": -5.838420867919922, "global_step": 60164, "epoch": 1432} {"train_loss": -5.973589897155762, "global_step": 60165, "epoch": 1432} {"train_loss": -5.910897731781006, "global_step": 60166, "epoch": 1432} {"train_loss": -6.028897285461426, "global_step": 60167, "epoch": 1432} {"train_loss": -5.9081010818481445, "global_step": 60168, "epoch": 1432} {"train_loss": -5.896539211273193, "global_step": 60169, "epoch": 1432} {"train_loss": -5.959212779998779, "global_step": 60170, "epoch": 1432} {"train_loss": -6.081758499145508, "global_step": 60171, "epoch": 1432} {"train_loss": -5.880951881408691, "global_step": 60172, "epoch": 1432} {"train_loss": -5.913954734802246, "global_step": 60173, "epoch": 1432} {"train_loss": -5.968575477600098, "global_step": 60174, "epoch": 1432} {"train_loss": -5.95849609375, "global_step": 60175, "epoch": 1432} {"train_loss": -5.810733318328857, "global_step": 60176, "epoch": 1432} {"train_loss": -6.028873443603516, "global_step": 60177, "epoch": 1432} {"train_loss": -5.8826823234558105, "global_step": 60178, "epoch": 1432} {"train_loss": -6.023890495300293, "global_step": 60179, "epoch": 1432} {"train_loss": -5.919061660766602, "global_step": 60180, "epoch": 1432} {"train_loss": -5.9332804679870605, "global_step": 60181, "epoch": 1432} {"train_loss": -5.979494571685791, "global_step": 60182, "epoch": 1432} {"train_loss": -5.88165283203125, "global_step": 60183, "epoch": 1432} {"train_loss": -5.927184104919434, "global_step": 60184, "epoch": 1432} {"train_loss": -5.911336864743914, "global_step": 60185, "epoch": 1432, "val_loss": 74267.859375} {"train_loss": -5.92072868347168, "global_step": 60186, "epoch": 1433} {"train_loss": -5.946595668792725, "global_step": 60187, "epoch": 1433} {"train_loss": -5.858233451843262, "global_step": 60188, "epoch": 1433} {"train_loss": -5.910873889923096, "global_step": 60189, "epoch": 1433} {"train_loss": -5.9185261726379395, "global_step": 60190, "epoch": 1433} {"train_loss": -5.942272186279297, "global_step": 60191, "epoch": 1433} {"train_loss": -5.965882301330566, "global_step": 60192, "epoch": 1433} {"train_loss": -5.935356616973877, "global_step": 60193, "epoch": 1433} {"train_loss": -5.8470587730407715, "global_step": 60194, "epoch": 1433} {"train_loss": -5.888840675354004, "global_step": 60195, "epoch": 1433} {"train_loss": -5.934190273284912, "global_step": 60196, "epoch": 1433} {"train_loss": -5.918904781341553, "global_step": 60197, "epoch": 1433} {"train_loss": -5.722833633422852, "global_step": 60198, "epoch": 1433} {"train_loss": -5.920116901397705, "global_step": 60199, "epoch": 1433} {"train_loss": -5.834568977355957, "global_step": 60200, "epoch": 1433} {"train_loss": -5.883944034576416, "global_step": 60201, "epoch": 1433} {"train_loss": -5.9059834480285645, "global_step": 60202, "epoch": 1433} {"train_loss": -5.8523712158203125, "global_step": 60203, "epoch": 1433} {"train_loss": -5.973233699798584, "global_step": 60204, "epoch": 1433} {"train_loss": -5.913420677185059, "global_step": 60205, "epoch": 1433} {"train_loss": -6.030182838439941, "global_step": 60206, "epoch": 1433} {"train_loss": -5.989175319671631, "global_step": 60207, "epoch": 1433} {"train_loss": -5.916835784912109, "global_step": 60208, "epoch": 1433} {"train_loss": -5.899194240570068, "global_step": 60209, "epoch": 1433} {"train_loss": -5.940929412841797, "global_step": 60210, "epoch": 1433} {"train_loss": -5.875348091125488, "global_step": 60211, "epoch": 1433} {"train_loss": -5.842715740203857, "global_step": 60212, "epoch": 1433} {"train_loss": -5.871455192565918, "global_step": 60213, "epoch": 1433} {"train_loss": -6.0302019119262695, "global_step": 60214, "epoch": 1433} {"train_loss": -5.927506446838379, "global_step": 60215, "epoch": 1433} {"train_loss": -5.809023380279541, "global_step": 60216, "epoch": 1433} {"train_loss": -5.971305847167969, "global_step": 60217, "epoch": 1433} {"train_loss": -5.883709907531738, "global_step": 60218, "epoch": 1433} {"train_loss": -5.811968803405762, "global_step": 60219, "epoch": 1433} {"train_loss": -5.788830280303955, "global_step": 60220, "epoch": 1433} {"train_loss": -5.838258743286133, "global_step": 60221, "epoch": 1433} {"train_loss": -5.870458602905273, "global_step": 60222, "epoch": 1433} {"train_loss": -5.760689735412598, "global_step": 60223, "epoch": 1433} {"train_loss": -5.8883256912231445, "global_step": 60224, "epoch": 1433} {"train_loss": -5.909700393676758, "global_step": 60225, "epoch": 1433} {"train_loss": -5.831022262573242, "global_step": 60226, "epoch": 1433} {"train_loss": -5.894460030964443, "global_step": 60227, "epoch": 1433, "val_loss": 74534.0703125} {"train_loss": -5.833983421325684, "global_step": 60228, "epoch": 1434} {"train_loss": -5.906774520874023, "global_step": 60229, "epoch": 1434} {"train_loss": -5.86520528793335, "global_step": 60230, "epoch": 1434} {"train_loss": -5.824099063873291, "global_step": 60231, "epoch": 1434} {"train_loss": -5.904200553894043, "global_step": 60232, "epoch": 1434} {"train_loss": -5.903971195220947, "global_step": 60233, "epoch": 1434} {"train_loss": -5.892291069030762, "global_step": 60234, "epoch": 1434} {"train_loss": -5.881168842315674, "global_step": 60235, "epoch": 1434} {"train_loss": -5.831612586975098, "global_step": 60236, "epoch": 1434} {"train_loss": -5.769204616546631, "global_step": 60237, "epoch": 1434} {"train_loss": -5.937188148498535, "global_step": 60238, "epoch": 1434} {"train_loss": -5.849915981292725, "global_step": 60239, "epoch": 1434} {"train_loss": -5.811531066894531, "global_step": 60240, "epoch": 1434} {"train_loss": -5.9820556640625, "global_step": 60241, "epoch": 1434} {"train_loss": -5.741981506347656, "global_step": 60242, "epoch": 1434} {"train_loss": -5.7573394775390625, "global_step": 60243, "epoch": 1434} {"train_loss": -5.8556060791015625, "global_step": 60244, "epoch": 1434} {"train_loss": -5.918663024902344, "global_step": 60245, "epoch": 1434} {"train_loss": -5.961846351623535, "global_step": 60246, "epoch": 1434} {"train_loss": -5.802362442016602, "global_step": 60247, "epoch": 1434} {"train_loss": -5.792295455932617, "global_step": 60248, "epoch": 1434} {"train_loss": -5.793597221374512, "global_step": 60249, "epoch": 1434} {"train_loss": -5.83066463470459, "global_step": 60250, "epoch": 1434} {"train_loss": -5.712802410125732, "global_step": 60251, "epoch": 1434} {"train_loss": -5.891239643096924, "global_step": 60252, "epoch": 1434} {"train_loss": -5.832047939300537, "global_step": 60253, "epoch": 1434} {"train_loss": -5.807852745056152, "global_step": 60254, "epoch": 1434} {"train_loss": -5.899706840515137, "global_step": 60255, "epoch": 1434} {"train_loss": -5.817652702331543, "global_step": 60256, "epoch": 1434} {"train_loss": -5.854588508605957, "global_step": 60257, "epoch": 1434} {"train_loss": -5.883215427398682, "global_step": 60258, "epoch": 1434} {"train_loss": -5.891408443450928, "global_step": 60259, "epoch": 1434} {"train_loss": -5.997968673706055, "global_step": 60260, "epoch": 1434} {"train_loss": -5.9451704025268555, "global_step": 60261, "epoch": 1434} {"train_loss": -5.898148536682129, "global_step": 60262, "epoch": 1434} {"train_loss": -6.026206970214844, "global_step": 60263, "epoch": 1434} {"train_loss": -5.852782249450684, "global_step": 60264, "epoch": 1434} {"train_loss": -5.892278671264648, "global_step": 60265, "epoch": 1434} {"train_loss": -5.9595255851745605, "global_step": 60266, "epoch": 1434} {"train_loss": -6.055837631225586, "global_step": 60267, "epoch": 1434} {"train_loss": -5.925500869750977, "global_step": 60268, "epoch": 1434} {"train_loss": -5.876375470842634, "global_step": 60269, "epoch": 1434, "val_loss": 74707.375} {"train_loss": -5.923250198364258, "global_step": 60270, "epoch": 1435} {"train_loss": -5.89239501953125, "global_step": 60271, "epoch": 1435} {"train_loss": -5.896590232849121, "global_step": 60272, "epoch": 1435} {"train_loss": -5.934789180755615, "global_step": 60273, "epoch": 1435} {"train_loss": -5.955604553222656, "global_step": 60274, "epoch": 1435} {"train_loss": -5.7628631591796875, "global_step": 60275, "epoch": 1435} {"train_loss": -5.872798442840576, "global_step": 60276, "epoch": 1435} {"train_loss": -5.865177154541016, "global_step": 60277, "epoch": 1435} {"train_loss": -5.86724328994751, "global_step": 60278, "epoch": 1435} {"train_loss": -5.797468662261963, "global_step": 60279, "epoch": 1435} {"train_loss": -6.000946044921875, "global_step": 60280, "epoch": 1435} {"train_loss": -5.726703643798828, "global_step": 60281, "epoch": 1435} {"train_loss": -5.913761138916016, "global_step": 60282, "epoch": 1435} {"train_loss": -5.813480377197266, "global_step": 60283, "epoch": 1435} {"train_loss": -5.799827575683594, "global_step": 60284, "epoch": 1435} {"train_loss": -5.766203880310059, "global_step": 60285, "epoch": 1435} {"train_loss": -5.852865219116211, "global_step": 60286, "epoch": 1435} {"train_loss": -5.84932804107666, "global_step": 60287, "epoch": 1435} {"train_loss": -5.832457542419434, "global_step": 60288, "epoch": 1435} {"train_loss": -5.939788818359375, "global_step": 60289, "epoch": 1435} {"train_loss": -5.860217571258545, "global_step": 60290, "epoch": 1435} {"train_loss": -5.917652130126953, "global_step": 60291, "epoch": 1435} {"train_loss": -5.795339584350586, "global_step": 60292, "epoch": 1435} {"train_loss": -5.813787460327148, "global_step": 60293, "epoch": 1435} {"train_loss": -5.914120197296143, "global_step": 60294, "epoch": 1435} {"train_loss": -5.875277519226074, "global_step": 60295, "epoch": 1435} {"train_loss": -5.932876110076904, "global_step": 60296, "epoch": 1435} {"train_loss": -5.8625712394714355, "global_step": 60297, "epoch": 1435} {"train_loss": -5.985383987426758, "global_step": 60298, "epoch": 1435} {"train_loss": -5.815041542053223, "global_step": 60299, "epoch": 1435} {"train_loss": -5.742218494415283, "global_step": 60300, "epoch": 1435} {"train_loss": -5.85749626159668, "global_step": 60301, "epoch": 1435} {"train_loss": -5.868386268615723, "global_step": 60302, "epoch": 1435} {"train_loss": -5.862131595611572, "global_step": 60303, "epoch": 1435} {"train_loss": -5.865067481994629, "global_step": 60304, "epoch": 1435} {"train_loss": -5.815131187438965, "global_step": 60305, "epoch": 1435} {"train_loss": -6.019687652587891, "global_step": 60306, "epoch": 1435} {"train_loss": -5.870165824890137, "global_step": 60307, "epoch": 1435} {"train_loss": -5.786980628967285, "global_step": 60308, "epoch": 1435} {"train_loss": -5.964565277099609, "global_step": 60309, "epoch": 1435} {"train_loss": -5.986839294433594, "global_step": 60310, "epoch": 1435} {"train_loss": -5.871011438823881, "global_step": 60311, "epoch": 1435, "val_loss": 74389.7109375} {"train_loss": -5.936159610748291, "global_step": 60312, "epoch": 1436} {"train_loss": -6.0006513595581055, "global_step": 60313, "epoch": 1436} {"train_loss": -5.829702377319336, "global_step": 60314, "epoch": 1436} {"train_loss": -5.846205711364746, "global_step": 60315, "epoch": 1436} {"train_loss": -5.944590091705322, "global_step": 60316, "epoch": 1436} {"train_loss": -5.855771541595459, "global_step": 60317, "epoch": 1436} {"train_loss": -6.022279739379883, "global_step": 60318, "epoch": 1436} {"train_loss": -5.878582000732422, "global_step": 60319, "epoch": 1436} {"train_loss": -5.9775495529174805, "global_step": 60320, "epoch": 1436} {"train_loss": -5.903412818908691, "global_step": 60321, "epoch": 1436} {"train_loss": -5.813647747039795, "global_step": 60322, "epoch": 1436} {"train_loss": -5.812751770019531, "global_step": 60323, "epoch": 1436} {"train_loss": -5.933480262756348, "global_step": 60324, "epoch": 1436} {"train_loss": -5.855177879333496, "global_step": 60325, "epoch": 1436} {"train_loss": -5.876204490661621, "global_step": 60326, "epoch": 1436} {"train_loss": -5.870089054107666, "global_step": 60327, "epoch": 1436} {"train_loss": -6.004103660583496, "global_step": 60328, "epoch": 1436} {"train_loss": -5.947367191314697, "global_step": 60329, "epoch": 1436} {"train_loss": -6.048193454742432, "global_step": 60330, "epoch": 1436} {"train_loss": -5.933511257171631, "global_step": 60331, "epoch": 1436} {"train_loss": -5.891302108764648, "global_step": 60332, "epoch": 1436} {"train_loss": -5.981942176818848, "global_step": 60333, "epoch": 1436} {"train_loss": -5.965069770812988, "global_step": 60334, "epoch": 1436} {"train_loss": -5.8742828369140625, "global_step": 60335, "epoch": 1436} {"train_loss": -6.001990795135498, "global_step": 60336, "epoch": 1436} {"train_loss": -5.996767044067383, "global_step": 60337, "epoch": 1436} {"train_loss": -5.86137580871582, "global_step": 60338, "epoch": 1436} {"train_loss": -5.924298286437988, "global_step": 60339, "epoch": 1436} {"train_loss": -5.805753707885742, "global_step": 60340, "epoch": 1436} {"train_loss": -5.878997802734375, "global_step": 60341, "epoch": 1436} {"train_loss": -5.938916206359863, "global_step": 60342, "epoch": 1436} {"train_loss": -5.834454536437988, "global_step": 60343, "epoch": 1436} {"train_loss": -5.880302429199219, "global_step": 60344, "epoch": 1436} {"train_loss": -5.88530158996582, "global_step": 60345, "epoch": 1436} {"train_loss": -5.855457305908203, "global_step": 60346, "epoch": 1436} {"train_loss": -5.812328815460205, "global_step": 60347, "epoch": 1436} {"train_loss": -5.9325971603393555, "global_step": 60348, "epoch": 1436} {"train_loss": -5.857541084289551, "global_step": 60349, "epoch": 1436} {"train_loss": -5.906192302703857, "global_step": 60350, "epoch": 1436} {"train_loss": -5.70064640045166, "global_step": 60351, "epoch": 1436} {"train_loss": -5.908370018005371, "global_step": 60352, "epoch": 1436} {"train_loss": -5.902325085231236, "global_step": 60353, "epoch": 1436, "val_loss": 74830.40625} {"train_loss": -5.853928565979004, "global_step": 60354, "epoch": 1437} {"train_loss": -6.011861324310303, "global_step": 60355, "epoch": 1437} {"train_loss": -5.836334705352783, "global_step": 60356, "epoch": 1437} {"train_loss": -5.924620628356934, "global_step": 60357, "epoch": 1437} {"train_loss": -5.847705364227295, "global_step": 60358, "epoch": 1437} {"train_loss": -5.885907173156738, "global_step": 60359, "epoch": 1437} {"train_loss": -5.8660783767700195, "global_step": 60360, "epoch": 1437} {"train_loss": -5.810935974121094, "global_step": 60361, "epoch": 1437} {"train_loss": -5.920475006103516, "global_step": 60362, "epoch": 1437} {"train_loss": -5.884489059448242, "global_step": 60363, "epoch": 1437} {"train_loss": -5.8533477783203125, "global_step": 60364, "epoch": 1437} {"train_loss": -5.987309455871582, "global_step": 60365, "epoch": 1437} {"train_loss": -5.89589786529541, "global_step": 60366, "epoch": 1437} {"train_loss": -5.932934284210205, "global_step": 60367, "epoch": 1437} {"train_loss": -5.838593482971191, "global_step": 60368, "epoch": 1437} {"train_loss": -5.898496150970459, "global_step": 60369, "epoch": 1437} {"train_loss": -5.880307197570801, "global_step": 60370, "epoch": 1437} {"train_loss": -5.886969566345215, "global_step": 60371, "epoch": 1437} {"train_loss": -5.9125075340271, "global_step": 60372, "epoch": 1437} {"train_loss": -5.82838249206543, "global_step": 60373, "epoch": 1437} {"train_loss": -5.868074893951416, "global_step": 60374, "epoch": 1437} {"train_loss": -5.926573753356934, "global_step": 60375, "epoch": 1437} {"train_loss": -6.048279762268066, "global_step": 60376, "epoch": 1437} {"train_loss": -6.004628658294678, "global_step": 60377, "epoch": 1437} {"train_loss": -5.893124580383301, "global_step": 60378, "epoch": 1437} {"train_loss": -5.91882848739624, "global_step": 60379, "epoch": 1437} {"train_loss": -5.883938312530518, "global_step": 60380, "epoch": 1437} {"train_loss": -5.904498100280762, "global_step": 60381, "epoch": 1437} {"train_loss": -5.9187822341918945, "global_step": 60382, "epoch": 1437} {"train_loss": -5.919835567474365, "global_step": 60383, "epoch": 1437} {"train_loss": -5.938294410705566, "global_step": 60384, "epoch": 1437} {"train_loss": -5.988877296447754, "global_step": 60385, "epoch": 1437} {"train_loss": -5.858318328857422, "global_step": 60386, "epoch": 1437} {"train_loss": -5.786505699157715, "global_step": 60387, "epoch": 1437} {"train_loss": -5.908613204956055, "global_step": 60388, "epoch": 1437} {"train_loss": -5.9984517097473145, "global_step": 60389, "epoch": 1437} {"train_loss": -5.921356201171875, "global_step": 60390, "epoch": 1437} {"train_loss": -5.879670143127441, "global_step": 60391, "epoch": 1437} {"train_loss": -5.839849472045898, "global_step": 60392, "epoch": 1437} {"train_loss": -5.9017863273620605, "global_step": 60393, "epoch": 1437} {"train_loss": -5.908725738525391, "global_step": 60394, "epoch": 1437} {"train_loss": -5.903786159697033, "global_step": 60395, "epoch": 1437, "val_loss": 74530.671875} {"train_loss": -5.898521423339844, "global_step": 60396, "epoch": 1438} {"train_loss": -5.9422197341918945, "global_step": 60397, "epoch": 1438} {"train_loss": -6.031772613525391, "global_step": 60398, "epoch": 1438} {"train_loss": -5.87144660949707, "global_step": 60399, "epoch": 1438} {"train_loss": -5.86474084854126, "global_step": 60400, "epoch": 1438} {"train_loss": -5.887692451477051, "global_step": 60401, "epoch": 1438} {"train_loss": -6.005526542663574, "global_step": 60402, "epoch": 1438} {"train_loss": -5.99592924118042, "global_step": 60403, "epoch": 1438} {"train_loss": -5.839908599853516, "global_step": 60404, "epoch": 1438} {"train_loss": -5.805291175842285, "global_step": 60405, "epoch": 1438} {"train_loss": -5.863617897033691, "global_step": 60406, "epoch": 1438} {"train_loss": -5.837650299072266, "global_step": 60407, "epoch": 1438} {"train_loss": -5.9158501625061035, "global_step": 60408, "epoch": 1438} {"train_loss": -5.977761268615723, "global_step": 60409, "epoch": 1438} {"train_loss": -6.049241065979004, "global_step": 60410, "epoch": 1438} {"train_loss": -5.952515602111816, "global_step": 60411, "epoch": 1438} {"train_loss": -5.937916278839111, "global_step": 60412, "epoch": 1438} {"train_loss": -6.010310173034668, "global_step": 60413, "epoch": 1438} {"train_loss": -6.014009952545166, "global_step": 60414, "epoch": 1438} {"train_loss": -5.851158142089844, "global_step": 60415, "epoch": 1438} {"train_loss": -5.90012264251709, "global_step": 60416, "epoch": 1438} {"train_loss": -5.845196723937988, "global_step": 60417, "epoch": 1438} {"train_loss": -5.90993595123291, "global_step": 60418, "epoch": 1438} {"train_loss": -5.860421657562256, "global_step": 60419, "epoch": 1438} {"train_loss": -5.985527992248535, "global_step": 60420, "epoch": 1438} {"train_loss": -5.821906566619873, "global_step": 60421, "epoch": 1438} {"train_loss": -5.863574028015137, "global_step": 60422, "epoch": 1438} {"train_loss": -5.851184844970703, "global_step": 60423, "epoch": 1438} {"train_loss": -5.876333236694336, "global_step": 60424, "epoch": 1438} {"train_loss": -5.966367244720459, "global_step": 60425, "epoch": 1438} {"train_loss": -5.8239593505859375, "global_step": 60426, "epoch": 1438} {"train_loss": -5.96253776550293, "global_step": 60427, "epoch": 1438} {"train_loss": -5.921735763549805, "global_step": 60428, "epoch": 1438} {"train_loss": -6.023843765258789, "global_step": 60429, "epoch": 1438} {"train_loss": -5.9169721603393555, "global_step": 60430, "epoch": 1438} {"train_loss": -5.819486141204834, "global_step": 60431, "epoch": 1438} {"train_loss": -6.06917667388916, "global_step": 60432, "epoch": 1438} {"train_loss": -5.716952323913574, "global_step": 60433, "epoch": 1438} {"train_loss": -5.901163101196289, "global_step": 60434, "epoch": 1438} {"train_loss": -5.918492317199707, "global_step": 60435, "epoch": 1438} {"train_loss": -5.95444917678833, "global_step": 60436, "epoch": 1438} {"train_loss": -5.911728836241222, "global_step": 60437, "epoch": 1438, "val_loss": 74192.7890625} {"train_loss": -5.921766757965088, "global_step": 60438, "epoch": 1439} {"train_loss": -5.937272548675537, "global_step": 60439, "epoch": 1439} {"train_loss": -5.9917120933532715, "global_step": 60440, "epoch": 1439} {"train_loss": -5.969394683837891, "global_step": 60441, "epoch": 1439} {"train_loss": -5.935964584350586, "global_step": 60442, "epoch": 1439} {"train_loss": -5.935237884521484, "global_step": 60443, "epoch": 1439} {"train_loss": -6.0386223793029785, "global_step": 60444, "epoch": 1439} {"train_loss": -5.867590427398682, "global_step": 60445, "epoch": 1439} {"train_loss": -6.052515506744385, "global_step": 60446, "epoch": 1439} {"train_loss": -5.964201927185059, "global_step": 60447, "epoch": 1439} {"train_loss": -5.859255790710449, "global_step": 60448, "epoch": 1439} {"train_loss": -5.966945648193359, "global_step": 60449, "epoch": 1439} {"train_loss": -5.923364162445068, "global_step": 60450, "epoch": 1439} {"train_loss": -6.028174877166748, "global_step": 60451, "epoch": 1439} {"train_loss": -5.7821807861328125, "global_step": 60452, "epoch": 1439} {"train_loss": -5.841936111450195, "global_step": 60453, "epoch": 1439} {"train_loss": -5.971580505371094, "global_step": 60454, "epoch": 1439} {"train_loss": -5.836896896362305, "global_step": 60455, "epoch": 1439} {"train_loss": -5.931290626525879, "global_step": 60456, "epoch": 1439} {"train_loss": -5.900860786437988, "global_step": 60457, "epoch": 1439} {"train_loss": -5.977258682250977, "global_step": 60458, "epoch": 1439} {"train_loss": -5.9525556564331055, "global_step": 60459, "epoch": 1439} {"train_loss": -5.905587673187256, "global_step": 60460, "epoch": 1439} {"train_loss": -5.963200092315674, "global_step": 60461, "epoch": 1439} {"train_loss": -5.988054275512695, "global_step": 60462, "epoch": 1439} {"train_loss": -5.842973232269287, "global_step": 60463, "epoch": 1439} {"train_loss": -5.921262264251709, "global_step": 60464, "epoch": 1439} {"train_loss": -5.885393142700195, "global_step": 60465, "epoch": 1439} {"train_loss": -5.919156074523926, "global_step": 60466, "epoch": 1439} {"train_loss": -5.996424674987793, "global_step": 60467, "epoch": 1439} {"train_loss": -5.994061470031738, "global_step": 60468, "epoch": 1439} {"train_loss": -5.964321136474609, "global_step": 60469, "epoch": 1439} {"train_loss": -5.854282379150391, "global_step": 60470, "epoch": 1439} {"train_loss": -5.865221977233887, "global_step": 60471, "epoch": 1439} {"train_loss": -5.860880374908447, "global_step": 60472, "epoch": 1439} {"train_loss": -5.906317234039307, "global_step": 60473, "epoch": 1439} {"train_loss": -5.955406188964844, "global_step": 60474, "epoch": 1439} {"train_loss": -5.649604797363281, "global_step": 60475, "epoch": 1439} {"train_loss": -5.829318046569824, "global_step": 60476, "epoch": 1439} {"train_loss": -5.816405296325684, "global_step": 60477, "epoch": 1439} {"train_loss": -5.841412544250488, "global_step": 60478, "epoch": 1439} {"train_loss": -5.915302378790719, "global_step": 60479, "epoch": 1439, "val_loss": 74391.828125} {"train_loss": -5.840710639953613, "global_step": 60480, "epoch": 1440} {"train_loss": -5.895132064819336, "global_step": 60481, "epoch": 1440} {"train_loss": -5.919614315032959, "global_step": 60482, "epoch": 1440} {"train_loss": -5.9314703941345215, "global_step": 60483, "epoch": 1440} {"train_loss": -5.849792003631592, "global_step": 60484, "epoch": 1440} {"train_loss": -5.780743598937988, "global_step": 60485, "epoch": 1440} {"train_loss": -5.89714241027832, "global_step": 60486, "epoch": 1440} {"train_loss": -5.962774276733398, "global_step": 60487, "epoch": 1440} {"train_loss": -5.920416831970215, "global_step": 60488, "epoch": 1440} {"train_loss": -5.988080024719238, "global_step": 60489, "epoch": 1440} {"train_loss": -5.887506484985352, "global_step": 60490, "epoch": 1440} {"train_loss": -5.982088088989258, "global_step": 60491, "epoch": 1440} {"train_loss": -5.810202598571777, "global_step": 60492, "epoch": 1440} {"train_loss": -5.89759635925293, "global_step": 60493, "epoch": 1440} {"train_loss": -5.938998222351074, "global_step": 60494, "epoch": 1440} {"train_loss": -5.865428924560547, "global_step": 60495, "epoch": 1440} {"train_loss": -5.918412208557129, "global_step": 60496, "epoch": 1440} {"train_loss": -5.868556022644043, "global_step": 60497, "epoch": 1440} {"train_loss": -5.965702533721924, "global_step": 60498, "epoch": 1440} {"train_loss": -5.917153358459473, "global_step": 60499, "epoch": 1440} {"train_loss": -5.865481376647949, "global_step": 60500, "epoch": 1440} {"train_loss": -5.874495506286621, "global_step": 60501, "epoch": 1440} {"train_loss": -5.934049606323242, "global_step": 60502, "epoch": 1440} {"train_loss": -5.879366397857666, "global_step": 60503, "epoch": 1440} {"train_loss": -5.882245063781738, "global_step": 60504, "epoch": 1440} {"train_loss": -5.839282989501953, "global_step": 60505, "epoch": 1440} {"train_loss": -5.857189178466797, "global_step": 60506, "epoch": 1440} {"train_loss": -5.813965797424316, "global_step": 60507, "epoch": 1440} {"train_loss": -5.789355278015137, "global_step": 60508, "epoch": 1440} {"train_loss": -5.825743198394775, "global_step": 60509, "epoch": 1440} {"train_loss": -5.890995979309082, "global_step": 60510, "epoch": 1440} {"train_loss": -5.8140950202941895, "global_step": 60511, "epoch": 1440} {"train_loss": -5.839685440063477, "global_step": 60512, "epoch": 1440} {"train_loss": -5.926391124725342, "global_step": 60513, "epoch": 1440} {"train_loss": -5.895330905914307, "global_step": 60514, "epoch": 1440} {"train_loss": -5.865204811096191, "global_step": 60515, "epoch": 1440} {"train_loss": -5.935220718383789, "global_step": 60516, "epoch": 1440} {"train_loss": -5.753167152404785, "global_step": 60517, "epoch": 1440} {"train_loss": -5.911808013916016, "global_step": 60518, "epoch": 1440} {"train_loss": -5.848709583282471, "global_step": 60519, "epoch": 1440} {"train_loss": -5.891210079193115, "global_step": 60520, "epoch": 1440} {"train_loss": -5.882686365218389, "global_step": 60521, "epoch": 1440, "val_loss": 74954.1328125} {"train_loss": -5.910129547119141, "global_step": 60522, "epoch": 1441} {"train_loss": -5.867056846618652, "global_step": 60523, "epoch": 1441} {"train_loss": -5.918525695800781, "global_step": 60524, "epoch": 1441} {"train_loss": -5.891233921051025, "global_step": 60525, "epoch": 1441} {"train_loss": -5.865070819854736, "global_step": 60526, "epoch": 1441} {"train_loss": -5.868386268615723, "global_step": 60527, "epoch": 1441} {"train_loss": -5.870482444763184, "global_step": 60528, "epoch": 1441} {"train_loss": -5.869000434875488, "global_step": 60529, "epoch": 1441} {"train_loss": -5.94346809387207, "global_step": 60530, "epoch": 1441} {"train_loss": -5.928775787353516, "global_step": 60531, "epoch": 1441} {"train_loss": -5.814302444458008, "global_step": 60532, "epoch": 1441} {"train_loss": -5.733926773071289, "global_step": 60533, "epoch": 1441} {"train_loss": -5.916991233825684, "global_step": 60534, "epoch": 1441} {"train_loss": -5.757656097412109, "global_step": 60535, "epoch": 1441} {"train_loss": -6.012863636016846, "global_step": 60536, "epoch": 1441} {"train_loss": -5.85386848449707, "global_step": 60537, "epoch": 1441} {"train_loss": -5.856154441833496, "global_step": 60538, "epoch": 1441} {"train_loss": -5.8243584632873535, "global_step": 60539, "epoch": 1441} {"train_loss": -5.813482761383057, "global_step": 60540, "epoch": 1441} {"train_loss": -5.870362281799316, "global_step": 60541, "epoch": 1441} {"train_loss": -5.881670951843262, "global_step": 60542, "epoch": 1441} {"train_loss": -5.792791366577148, "global_step": 60543, "epoch": 1441} {"train_loss": -5.903967380523682, "global_step": 60544, "epoch": 1441} {"train_loss": -5.747464179992676, "global_step": 60545, "epoch": 1441} {"train_loss": -5.916356563568115, "global_step": 60546, "epoch": 1441} {"train_loss": -5.843421936035156, "global_step": 60547, "epoch": 1441} {"train_loss": -5.91970157623291, "global_step": 60548, "epoch": 1441} {"train_loss": -5.9416093826293945, "global_step": 60549, "epoch": 1441} {"train_loss": -5.877717018127441, "global_step": 60550, "epoch": 1441} {"train_loss": -5.828705787658691, "global_step": 60551, "epoch": 1441} {"train_loss": -5.9098920822143555, "global_step": 60552, "epoch": 1441} {"train_loss": -5.877171516418457, "global_step": 60553, "epoch": 1441} {"train_loss": -5.9081878662109375, "global_step": 60554, "epoch": 1441} {"train_loss": -5.928348541259766, "global_step": 60555, "epoch": 1441} {"train_loss": -5.941502571105957, "global_step": 60556, "epoch": 1441} {"train_loss": -5.7993669509887695, "global_step": 60557, "epoch": 1441} {"train_loss": -6.004395008087158, "global_step": 60558, "epoch": 1441} {"train_loss": -5.864372253417969, "global_step": 60559, "epoch": 1441} {"train_loss": -5.9567084312438965, "global_step": 60560, "epoch": 1441} {"train_loss": -5.790473461151123, "global_step": 60561, "epoch": 1441} {"train_loss": -5.899456024169922, "global_step": 60562, "epoch": 1441} {"train_loss": -5.877025695074172, "global_step": 60563, "epoch": 1441, "val_loss": 74111.1484375} {"train_loss": -5.99245023727417, "global_step": 60564, "epoch": 1442} {"train_loss": -5.932835102081299, "global_step": 60565, "epoch": 1442} {"train_loss": -5.881898880004883, "global_step": 60566, "epoch": 1442} {"train_loss": -5.806667327880859, "global_step": 60567, "epoch": 1442} {"train_loss": -5.842759609222412, "global_step": 60568, "epoch": 1442} {"train_loss": -5.792265892028809, "global_step": 60569, "epoch": 1442} {"train_loss": -5.897693634033203, "global_step": 60570, "epoch": 1442} {"train_loss": -5.988797187805176, "global_step": 60571, "epoch": 1442} {"train_loss": -5.758596420288086, "global_step": 60572, "epoch": 1442} {"train_loss": -5.857991695404053, "global_step": 60573, "epoch": 1442} {"train_loss": -5.9131879806518555, "global_step": 60574, "epoch": 1442} {"train_loss": -5.909245014190674, "global_step": 60575, "epoch": 1442} {"train_loss": -5.868588447570801, "global_step": 60576, "epoch": 1442} {"train_loss": -5.886454105377197, "global_step": 60577, "epoch": 1442} {"train_loss": -5.907706260681152, "global_step": 60578, "epoch": 1442} {"train_loss": -5.919175148010254, "global_step": 60579, "epoch": 1442} {"train_loss": -5.944364070892334, "global_step": 60580, "epoch": 1442} {"train_loss": -5.8133544921875, "global_step": 60581, "epoch": 1442} {"train_loss": -5.81147575378418, "global_step": 60582, "epoch": 1442} {"train_loss": -5.9363813400268555, "global_step": 60583, "epoch": 1442} {"train_loss": -5.735713481903076, "global_step": 60584, "epoch": 1442} {"train_loss": -5.859255790710449, "global_step": 60585, "epoch": 1442} {"train_loss": -5.8736958503723145, "global_step": 60586, "epoch": 1442} {"train_loss": -5.6933770179748535, "global_step": 60587, "epoch": 1442} {"train_loss": -5.80885124206543, "global_step": 60588, "epoch": 1442} {"train_loss": -5.752249717712402, "global_step": 60589, "epoch": 1442} {"train_loss": -5.748998641967773, "global_step": 60590, "epoch": 1442} {"train_loss": -5.786224365234375, "global_step": 60591, "epoch": 1442} {"train_loss": -5.706843852996826, "global_step": 60592, "epoch": 1442} {"train_loss": -5.827253341674805, "global_step": 60593, "epoch": 1442} {"train_loss": -5.928927898406982, "global_step": 60594, "epoch": 1442} {"train_loss": -5.802249908447266, "global_step": 60595, "epoch": 1442} {"train_loss": -5.808399200439453, "global_step": 60596, "epoch": 1442} {"train_loss": -5.791797637939453, "global_step": 60597, "epoch": 1442} {"train_loss": -5.83584451675415, "global_step": 60598, "epoch": 1442} {"train_loss": -5.8566107749938965, "global_step": 60599, "epoch": 1442} {"train_loss": -5.8448381423950195, "global_step": 60600, "epoch": 1442} {"train_loss": -5.925475597381592, "global_step": 60601, "epoch": 1442} {"train_loss": -5.761219501495361, "global_step": 60602, "epoch": 1442} {"train_loss": -5.861616134643555, "global_step": 60603, "epoch": 1442} {"train_loss": -5.848779201507568, "global_step": 60604, "epoch": 1442} {"train_loss": -5.849582728885469, "global_step": 60605, "epoch": 1442, "val_loss": 74544.734375} {"train_loss": -5.906556129455566, "global_step": 60606, "epoch": 1443} {"train_loss": -5.8685302734375, "global_step": 60607, "epoch": 1443} {"train_loss": -5.937206745147705, "global_step": 60608, "epoch": 1443} {"train_loss": -5.9234185218811035, "global_step": 60609, "epoch": 1443} {"train_loss": -5.7721757888793945, "global_step": 60610, "epoch": 1443} {"train_loss": -5.73109769821167, "global_step": 60611, "epoch": 1443} {"train_loss": -5.968786239624023, "global_step": 60612, "epoch": 1443} {"train_loss": -5.822959899902344, "global_step": 60613, "epoch": 1443} {"train_loss": -5.901265621185303, "global_step": 60614, "epoch": 1443} {"train_loss": -5.981453895568848, "global_step": 60615, "epoch": 1443} {"train_loss": -5.97529411315918, "global_step": 60616, "epoch": 1443} {"train_loss": -5.971108436584473, "global_step": 60617, "epoch": 1443} {"train_loss": -5.8960161209106445, "global_step": 60618, "epoch": 1443} {"train_loss": -5.941859245300293, "global_step": 60619, "epoch": 1443} {"train_loss": -5.9735870361328125, "global_step": 60620, "epoch": 1443} {"train_loss": -5.951258659362793, "global_step": 60621, "epoch": 1443} {"train_loss": -5.935276031494141, "global_step": 60622, "epoch": 1443} {"train_loss": -5.891828536987305, "global_step": 60623, "epoch": 1443} {"train_loss": -5.7817277908325195, "global_step": 60624, "epoch": 1443} {"train_loss": -5.868215560913086, "global_step": 60625, "epoch": 1443} {"train_loss": -5.814083576202393, "global_step": 60626, "epoch": 1443} {"train_loss": -5.967426300048828, "global_step": 60627, "epoch": 1443} {"train_loss": -5.779560089111328, "global_step": 60628, "epoch": 1443} {"train_loss": -5.883237838745117, "global_step": 60629, "epoch": 1443} {"train_loss": -5.869606971740723, "global_step": 60630, "epoch": 1443} {"train_loss": -6.027750015258789, "global_step": 60631, "epoch": 1443} {"train_loss": -5.992471694946289, "global_step": 60632, "epoch": 1443} {"train_loss": -5.969459533691406, "global_step": 60633, "epoch": 1443} {"train_loss": -5.991202354431152, "global_step": 60634, "epoch": 1443} {"train_loss": -6.015779495239258, "global_step": 60635, "epoch": 1443} {"train_loss": -5.891373634338379, "global_step": 60636, "epoch": 1443} {"train_loss": -5.870718955993652, "global_step": 60637, "epoch": 1443} {"train_loss": -5.963443756103516, "global_step": 60638, "epoch": 1443} {"train_loss": -5.822826862335205, "global_step": 60639, "epoch": 1443} {"train_loss": -5.979305267333984, "global_step": 60640, "epoch": 1443} {"train_loss": -5.938911437988281, "global_step": 60641, "epoch": 1443} {"train_loss": -5.774326801300049, "global_step": 60642, "epoch": 1443} {"train_loss": -5.862812519073486, "global_step": 60643, "epoch": 1443} {"train_loss": -5.951210975646973, "global_step": 60644, "epoch": 1443} {"train_loss": -5.765806674957275, "global_step": 60645, "epoch": 1443} {"train_loss": -5.86976432800293, "global_step": 60646, "epoch": 1443} {"train_loss": -5.901820659637451, "global_step": 60647, "epoch": 1443, "val_loss": 74278.4296875} {"train_loss": -5.927646636962891, "global_step": 60648, "epoch": 1444} {"train_loss": -5.870813369750977, "global_step": 60649, "epoch": 1444} {"train_loss": -5.904666423797607, "global_step": 60650, "epoch": 1444} {"train_loss": -5.871613502502441, "global_step": 60651, "epoch": 1444} {"train_loss": -5.89249849319458, "global_step": 60652, "epoch": 1444} {"train_loss": -5.997518539428711, "global_step": 60653, "epoch": 1444} {"train_loss": -5.862513542175293, "global_step": 60654, "epoch": 1444} {"train_loss": -5.760645866394043, "global_step": 60655, "epoch": 1444} {"train_loss": -5.76025390625, "global_step": 60656, "epoch": 1444} {"train_loss": -5.825290679931641, "global_step": 60657, "epoch": 1444} {"train_loss": -5.800623893737793, "global_step": 60658, "epoch": 1444} {"train_loss": -5.851543426513672, "global_step": 60659, "epoch": 1444} {"train_loss": -5.869368076324463, "global_step": 60660, "epoch": 1444} {"train_loss": -5.797419548034668, "global_step": 60661, "epoch": 1444} {"train_loss": -5.889257431030273, "global_step": 60662, "epoch": 1444} {"train_loss": -5.869206428527832, "global_step": 60663, "epoch": 1444} {"train_loss": -5.898456573486328, "global_step": 60664, "epoch": 1444} {"train_loss": -5.88346004486084, "global_step": 60665, "epoch": 1444} {"train_loss": -5.89921760559082, "global_step": 60666, "epoch": 1444} {"train_loss": -5.9699811935424805, "global_step": 60667, "epoch": 1444} {"train_loss": -5.844600200653076, "global_step": 60668, "epoch": 1444} {"train_loss": -5.897695541381836, "global_step": 60669, "epoch": 1444} {"train_loss": -5.792232036590576, "global_step": 60670, "epoch": 1444} {"train_loss": -5.906973361968994, "global_step": 60671, "epoch": 1444} {"train_loss": -6.021196365356445, "global_step": 60672, "epoch": 1444} {"train_loss": -5.899677276611328, "global_step": 60673, "epoch": 1444} {"train_loss": -5.98677396774292, "global_step": 60674, "epoch": 1444} {"train_loss": -5.8095903396606445, "global_step": 60675, "epoch": 1444} {"train_loss": -5.893884658813477, "global_step": 60676, "epoch": 1444} {"train_loss": -6.0056562423706055, "global_step": 60677, "epoch": 1444} {"train_loss": -5.914904594421387, "global_step": 60678, "epoch": 1444} {"train_loss": -5.9671478271484375, "global_step": 60679, "epoch": 1444} {"train_loss": -5.930325508117676, "global_step": 60680, "epoch": 1444} {"train_loss": -5.965106964111328, "global_step": 60681, "epoch": 1444} {"train_loss": -5.857082366943359, "global_step": 60682, "epoch": 1444} {"train_loss": -5.932806968688965, "global_step": 60683, "epoch": 1444} {"train_loss": -5.966354846954346, "global_step": 60684, "epoch": 1444} {"train_loss": -6.036801338195801, "global_step": 60685, "epoch": 1444} {"train_loss": -5.916721820831299, "global_step": 60686, "epoch": 1444} {"train_loss": -5.849259376525879, "global_step": 60687, "epoch": 1444} {"train_loss": -5.981417655944824, "global_step": 60688, "epoch": 1444} {"train_loss": -5.895990780421665, "global_step": 60689, "epoch": 1444, "val_loss": 74488.0546875} {"train_loss": -5.807490825653076, "global_step": 60690, "epoch": 1445} {"train_loss": -5.960744857788086, "global_step": 60691, "epoch": 1445} {"train_loss": -5.862781524658203, "global_step": 60692, "epoch": 1445} {"train_loss": -5.866276264190674, "global_step": 60693, "epoch": 1445} {"train_loss": -5.846297264099121, "global_step": 60694, "epoch": 1445} {"train_loss": -5.835141181945801, "global_step": 60695, "epoch": 1445} {"train_loss": -5.895169258117676, "global_step": 60696, "epoch": 1445} {"train_loss": -5.898984909057617, "global_step": 60697, "epoch": 1445} {"train_loss": -5.804582595825195, "global_step": 60698, "epoch": 1445} {"train_loss": -6.019538879394531, "global_step": 60699, "epoch": 1445} {"train_loss": -5.841618061065674, "global_step": 60700, "epoch": 1445} {"train_loss": -5.8356523513793945, "global_step": 60701, "epoch": 1445} {"train_loss": -5.92119026184082, "global_step": 60702, "epoch": 1445} {"train_loss": -5.938711166381836, "global_step": 60703, "epoch": 1445} {"train_loss": -5.912445068359375, "global_step": 60704, "epoch": 1445} {"train_loss": -5.777464866638184, "global_step": 60705, "epoch": 1445} {"train_loss": -5.910566329956055, "global_step": 60706, "epoch": 1445} {"train_loss": -5.847808837890625, "global_step": 60707, "epoch": 1445} {"train_loss": -5.866336822509766, "global_step": 60708, "epoch": 1445} {"train_loss": -6.054139137268066, "global_step": 60709, "epoch": 1445} {"train_loss": -5.855829238891602, "global_step": 60710, "epoch": 1445} {"train_loss": -5.722902297973633, "global_step": 60711, "epoch": 1445} {"train_loss": -6.023905277252197, "global_step": 60712, "epoch": 1445} {"train_loss": -5.910653114318848, "global_step": 60713, "epoch": 1445} {"train_loss": -5.954146862030029, "global_step": 60714, "epoch": 1445} {"train_loss": -5.897666931152344, "global_step": 60715, "epoch": 1445} {"train_loss": -5.976883888244629, "global_step": 60716, "epoch": 1445} {"train_loss": -5.962608814239502, "global_step": 60717, "epoch": 1445} {"train_loss": -5.965024948120117, "global_step": 60718, "epoch": 1445} {"train_loss": -5.9470367431640625, "global_step": 60719, "epoch": 1445} {"train_loss": -6.004353046417236, "global_step": 60720, "epoch": 1445} {"train_loss": -5.786210060119629, "global_step": 60721, "epoch": 1445} {"train_loss": -5.947634696960449, "global_step": 60722, "epoch": 1445} {"train_loss": -5.915081977844238, "global_step": 60723, "epoch": 1445} {"train_loss": -5.871743679046631, "global_step": 60724, "epoch": 1445} {"train_loss": -5.957857608795166, "global_step": 60725, "epoch": 1445} {"train_loss": -5.81489896774292, "global_step": 60726, "epoch": 1445} {"train_loss": -5.848933219909668, "global_step": 60727, "epoch": 1445} {"train_loss": -5.762092590332031, "global_step": 60728, "epoch": 1445} {"train_loss": -5.797001838684082, "global_step": 60729, "epoch": 1445} {"train_loss": -5.800924301147461, "global_step": 60730, "epoch": 1445} {"train_loss": -5.889160508201236, "global_step": 60731, "epoch": 1445, "val_loss": 74450.5390625} {"train_loss": -5.923826217651367, "global_step": 60732, "epoch": 1446} {"train_loss": -5.890574932098389, "global_step": 60733, "epoch": 1446} {"train_loss": -5.872527122497559, "global_step": 60734, "epoch": 1446} {"train_loss": -5.927364349365234, "global_step": 60735, "epoch": 1446} {"train_loss": -5.8571882247924805, "global_step": 60736, "epoch": 1446} {"train_loss": -5.956666946411133, "global_step": 60737, "epoch": 1446} {"train_loss": -5.880797386169434, "global_step": 60738, "epoch": 1446} {"train_loss": -5.904335021972656, "global_step": 60739, "epoch": 1446} {"train_loss": -5.951325416564941, "global_step": 60740, "epoch": 1446} {"train_loss": -6.033620357513428, "global_step": 60741, "epoch": 1446} {"train_loss": -5.9265618324279785, "global_step": 60742, "epoch": 1446} {"train_loss": -5.9907684326171875, "global_step": 60743, "epoch": 1446} {"train_loss": -5.828278541564941, "global_step": 60744, "epoch": 1446} {"train_loss": -5.780819892883301, "global_step": 60745, "epoch": 1446} {"train_loss": -5.863577365875244, "global_step": 60746, "epoch": 1446} {"train_loss": -5.810562610626221, "global_step": 60747, "epoch": 1446} {"train_loss": -5.782650470733643, "global_step": 60748, "epoch": 1446} {"train_loss": -6.04160213470459, "global_step": 60749, "epoch": 1446} {"train_loss": -5.7825493812561035, "global_step": 60750, "epoch": 1446} {"train_loss": -5.948049545288086, "global_step": 60751, "epoch": 1446} {"train_loss": -5.854791164398193, "global_step": 60752, "epoch": 1446} {"train_loss": -5.881800174713135, "global_step": 60753, "epoch": 1446} {"train_loss": -5.867207050323486, "global_step": 60754, "epoch": 1446} {"train_loss": -5.842586994171143, "global_step": 60755, "epoch": 1446} {"train_loss": -5.767692565917969, "global_step": 60756, "epoch": 1446} {"train_loss": -5.955014705657959, "global_step": 60757, "epoch": 1446} {"train_loss": -5.80133056640625, "global_step": 60758, "epoch": 1446} {"train_loss": -5.915217399597168, "global_step": 60759, "epoch": 1446} {"train_loss": -5.9296722412109375, "global_step": 60760, "epoch": 1446} {"train_loss": -5.786742210388184, "global_step": 60761, "epoch": 1446} {"train_loss": -5.912891864776611, "global_step": 60762, "epoch": 1446} {"train_loss": -5.733770370483398, "global_step": 60763, "epoch": 1446} {"train_loss": -5.923047065734863, "global_step": 60764, "epoch": 1446} {"train_loss": -5.766763210296631, "global_step": 60765, "epoch": 1446} {"train_loss": -5.822482109069824, "global_step": 60766, "epoch": 1446} {"train_loss": -5.916979789733887, "global_step": 60767, "epoch": 1446} {"train_loss": -5.895028114318848, "global_step": 60768, "epoch": 1446} {"train_loss": -5.9203200340271, "global_step": 60769, "epoch": 1446} {"train_loss": -5.884307384490967, "global_step": 60770, "epoch": 1446} {"train_loss": -5.816781997680664, "global_step": 60771, "epoch": 1446} {"train_loss": -5.855325698852539, "global_step": 60772, "epoch": 1446} {"train_loss": -5.88170694169544, "global_step": 60773, "epoch": 1446, "val_loss": 74663.796875} {"train_loss": -5.878167629241943, "global_step": 60774, "epoch": 1447} {"train_loss": -5.980955600738525, "global_step": 60775, "epoch": 1447} {"train_loss": -5.916717052459717, "global_step": 60776, "epoch": 1447} {"train_loss": -5.840595722198486, "global_step": 60777, "epoch": 1447} {"train_loss": -5.899631977081299, "global_step": 60778, "epoch": 1447} {"train_loss": -5.927096843719482, "global_step": 60779, "epoch": 1447} {"train_loss": -5.929652214050293, "global_step": 60780, "epoch": 1447} {"train_loss": -5.824319839477539, "global_step": 60781, "epoch": 1447} {"train_loss": -5.9001054763793945, "global_step": 60782, "epoch": 1447} {"train_loss": -5.924041271209717, "global_step": 60783, "epoch": 1447} {"train_loss": -5.746201992034912, "global_step": 60784, "epoch": 1447} {"train_loss": -5.965117454528809, "global_step": 60785, "epoch": 1447} {"train_loss": -5.929647445678711, "global_step": 60786, "epoch": 1447} {"train_loss": -5.972248077392578, "global_step": 60787, "epoch": 1447} {"train_loss": -5.830446720123291, "global_step": 60788, "epoch": 1447} {"train_loss": -5.800046443939209, "global_step": 60789, "epoch": 1447} {"train_loss": -5.7745513916015625, "global_step": 60790, "epoch": 1447} {"train_loss": -5.907021522521973, "global_step": 60791, "epoch": 1447} {"train_loss": -5.8845648765563965, "global_step": 60792, "epoch": 1447} {"train_loss": -5.949383735656738, "global_step": 60793, "epoch": 1447} {"train_loss": -5.980418682098389, "global_step": 60794, "epoch": 1447} {"train_loss": -5.8235673904418945, "global_step": 60795, "epoch": 1447} {"train_loss": -5.884754657745361, "global_step": 60796, "epoch": 1447} {"train_loss": -6.044346809387207, "global_step": 60797, "epoch": 1447} {"train_loss": -5.799309730529785, "global_step": 60798, "epoch": 1447} {"train_loss": -5.902341842651367, "global_step": 60799, "epoch": 1447} {"train_loss": -5.852629661560059, "global_step": 60800, "epoch": 1447} {"train_loss": -5.925297737121582, "global_step": 60801, "epoch": 1447} {"train_loss": -5.919493675231934, "global_step": 60802, "epoch": 1447} {"train_loss": -5.853341102600098, "global_step": 60803, "epoch": 1447} {"train_loss": -5.942617416381836, "global_step": 60804, "epoch": 1447} {"train_loss": -5.982341766357422, "global_step": 60805, "epoch": 1447} {"train_loss": -5.827263832092285, "global_step": 60806, "epoch": 1447} {"train_loss": -5.8746137619018555, "global_step": 60807, "epoch": 1447} {"train_loss": -5.97312068939209, "global_step": 60808, "epoch": 1447} {"train_loss": -5.815057754516602, "global_step": 60809, "epoch": 1447} {"train_loss": -5.886062145233154, "global_step": 60810, "epoch": 1447} {"train_loss": -5.913926124572754, "global_step": 60811, "epoch": 1447} {"train_loss": -5.930084228515625, "global_step": 60812, "epoch": 1447} {"train_loss": -5.913344383239746, "global_step": 60813, "epoch": 1447} {"train_loss": -5.83726692199707, "global_step": 60814, "epoch": 1447} {"train_loss": -5.8932563577379495, "global_step": 60815, "epoch": 1447, "val_loss": 74263.3046875} {"train_loss": -5.909196853637695, "global_step": 60816, "epoch": 1448} {"train_loss": -6.030699253082275, "global_step": 60817, "epoch": 1448} {"train_loss": -5.837380409240723, "global_step": 60818, "epoch": 1448} {"train_loss": -5.978026390075684, "global_step": 60819, "epoch": 1448} {"train_loss": -5.855322360992432, "global_step": 60820, "epoch": 1448} {"train_loss": -5.860752105712891, "global_step": 60821, "epoch": 1448} {"train_loss": -5.853142261505127, "global_step": 60822, "epoch": 1448} {"train_loss": -5.892480850219727, "global_step": 60823, "epoch": 1448} {"train_loss": -5.955812931060791, "global_step": 60824, "epoch": 1448} {"train_loss": -5.863466262817383, "global_step": 60825, "epoch": 1448} {"train_loss": -5.879676818847656, "global_step": 60826, "epoch": 1448} {"train_loss": -5.738557815551758, "global_step": 60827, "epoch": 1448} {"train_loss": -5.8305816650390625, "global_step": 60828, "epoch": 1448} {"train_loss": -5.981193542480469, "global_step": 60829, "epoch": 1448} {"train_loss": -5.891804218292236, "global_step": 60830, "epoch": 1448} {"train_loss": -6.01059627532959, "global_step": 60831, "epoch": 1448} {"train_loss": -5.883892059326172, "global_step": 60832, "epoch": 1448} {"train_loss": -6.014742851257324, "global_step": 60833, "epoch": 1448} {"train_loss": -5.960323333740234, "global_step": 60834, "epoch": 1448} {"train_loss": -5.9061126708984375, "global_step": 60835, "epoch": 1448} {"train_loss": -5.932166576385498, "global_step": 60836, "epoch": 1448} {"train_loss": -5.84272575378418, "global_step": 60837, "epoch": 1448} {"train_loss": -6.035162448883057, "global_step": 60838, "epoch": 1448} {"train_loss": -6.0009260177612305, "global_step": 60839, "epoch": 1448} {"train_loss": -5.896026611328125, "global_step": 60840, "epoch": 1448} {"train_loss": -5.809675693511963, "global_step": 60841, "epoch": 1448} {"train_loss": -5.867808818817139, "global_step": 60842, "epoch": 1448} {"train_loss": -5.948058605194092, "global_step": 60843, "epoch": 1448} {"train_loss": -5.967685699462891, "global_step": 60844, "epoch": 1448} {"train_loss": -5.967872142791748, "global_step": 60845, "epoch": 1448} {"train_loss": -5.845699787139893, "global_step": 60846, "epoch": 1448} {"train_loss": -5.957351207733154, "global_step": 60847, "epoch": 1448} {"train_loss": -5.9339280128479, "global_step": 60848, "epoch": 1448} {"train_loss": -5.979709148406982, "global_step": 60849, "epoch": 1448} {"train_loss": -5.962634086608887, "global_step": 60850, "epoch": 1448} {"train_loss": -5.924698352813721, "global_step": 60851, "epoch": 1448} {"train_loss": -5.957191467285156, "global_step": 60852, "epoch": 1448} {"train_loss": -6.00127649307251, "global_step": 60853, "epoch": 1448} {"train_loss": -5.886460304260254, "global_step": 60854, "epoch": 1448} {"train_loss": -5.959338188171387, "global_step": 60855, "epoch": 1448} {"train_loss": -6.0396270751953125, "global_step": 60856, "epoch": 1448} {"train_loss": -5.924700805119106, "global_step": 60857, "epoch": 1448, "val_loss": 75064.3359375} {"train_loss": -5.961771011352539, "global_step": 60858, "epoch": 1449} {"train_loss": -5.87013053894043, "global_step": 60859, "epoch": 1449} {"train_loss": -5.77529239654541, "global_step": 60860, "epoch": 1449} {"train_loss": -5.954095363616943, "global_step": 60861, "epoch": 1449} {"train_loss": -5.959037780761719, "global_step": 60862, "epoch": 1449} {"train_loss": -5.855456829071045, "global_step": 60863, "epoch": 1449} {"train_loss": -5.970210075378418, "global_step": 60864, "epoch": 1449} {"train_loss": -5.927858352661133, "global_step": 60865, "epoch": 1449} {"train_loss": -5.925945281982422, "global_step": 60866, "epoch": 1449} {"train_loss": -5.910303115844727, "global_step": 60867, "epoch": 1449} {"train_loss": -5.9841413497924805, "global_step": 60868, "epoch": 1449} {"train_loss": -5.925167560577393, "global_step": 60869, "epoch": 1449} {"train_loss": -5.874987602233887, "global_step": 60870, "epoch": 1449} {"train_loss": -5.885246753692627, "global_step": 60871, "epoch": 1449} {"train_loss": -5.9139885902404785, "global_step": 60872, "epoch": 1449} {"train_loss": -5.9946370124816895, "global_step": 60873, "epoch": 1449} {"train_loss": -5.815061569213867, "global_step": 60874, "epoch": 1449} {"train_loss": -5.917457103729248, "global_step": 60875, "epoch": 1449} {"train_loss": -5.9914350509643555, "global_step": 60876, "epoch": 1449} {"train_loss": -5.994437217712402, "global_step": 60877, "epoch": 1449} {"train_loss": -5.823879241943359, "global_step": 60878, "epoch": 1449} {"train_loss": -6.007209777832031, "global_step": 60879, "epoch": 1449} {"train_loss": -5.702446937561035, "global_step": 60880, "epoch": 1449} {"train_loss": -5.762224197387695, "global_step": 60881, "epoch": 1449} {"train_loss": -5.813140869140625, "global_step": 60882, "epoch": 1449} {"train_loss": -5.7143449783325195, "global_step": 60883, "epoch": 1449} {"train_loss": -5.774775981903076, "global_step": 60884, "epoch": 1449} {"train_loss": -5.920353889465332, "global_step": 60885, "epoch": 1449} {"train_loss": -5.827423572540283, "global_step": 60886, "epoch": 1449} {"train_loss": -5.989744663238525, "global_step": 60887, "epoch": 1449} {"train_loss": -5.953805923461914, "global_step": 60888, "epoch": 1449} {"train_loss": -5.759291172027588, "global_step": 60889, "epoch": 1449} {"train_loss": -5.829496383666992, "global_step": 60890, "epoch": 1449} {"train_loss": -5.8856329917907715, "global_step": 60891, "epoch": 1449} {"train_loss": -5.927095890045166, "global_step": 60892, "epoch": 1449} {"train_loss": -5.852453231811523, "global_step": 60893, "epoch": 1449} {"train_loss": -5.7458415031433105, "global_step": 60894, "epoch": 1449} {"train_loss": -5.862043380737305, "global_step": 60895, "epoch": 1449} {"train_loss": -5.9559478759765625, "global_step": 60896, "epoch": 1449} {"train_loss": -5.903875350952148, "global_step": 60897, "epoch": 1449} {"train_loss": -5.981021881103516, "global_step": 60898, "epoch": 1449} {"train_loss": -5.886649619965326, "global_step": 60899, "epoch": 1449, "val_loss": 74446.921875} {"train_loss": -5.96397066116333, "global_step": 60900, "epoch": 1450} {"train_loss": -5.927999019622803, "global_step": 60901, "epoch": 1450} {"train_loss": -5.922318458557129, "global_step": 60902, "epoch": 1450} {"train_loss": -5.896720886230469, "global_step": 60903, "epoch": 1450} {"train_loss": -5.857823371887207, "global_step": 60904, "epoch": 1450} {"train_loss": -6.060624122619629, "global_step": 60905, "epoch": 1450} {"train_loss": -5.785989761352539, "global_step": 60906, "epoch": 1450} {"train_loss": -5.781919002532959, "global_step": 60907, "epoch": 1450} {"train_loss": -5.979180335998535, "global_step": 60908, "epoch": 1450} {"train_loss": -5.738834381103516, "global_step": 60909, "epoch": 1450} {"train_loss": -5.830723762512207, "global_step": 60910, "epoch": 1450} {"train_loss": -5.861398696899414, "global_step": 60911, "epoch": 1450} {"train_loss": -5.895270824432373, "global_step": 60912, "epoch": 1450} {"train_loss": -5.941645622253418, "global_step": 60913, "epoch": 1450} {"train_loss": -5.93329381942749, "global_step": 60914, "epoch": 1450} {"train_loss": -5.858370780944824, "global_step": 60915, "epoch": 1450} {"train_loss": -5.892488479614258, "global_step": 60916, "epoch": 1450} {"train_loss": -6.009640693664551, "global_step": 60917, "epoch": 1450} {"train_loss": -5.811890602111816, "global_step": 60918, "epoch": 1450} {"train_loss": -5.804996013641357, "global_step": 60919, "epoch": 1450} {"train_loss": -5.973921775817871, "global_step": 60920, "epoch": 1450} {"train_loss": -5.826516151428223, "global_step": 60921, "epoch": 1450} {"train_loss": -5.849305152893066, "global_step": 60922, "epoch": 1450} {"train_loss": -5.859307765960693, "global_step": 60923, "epoch": 1450} {"train_loss": -5.91763973236084, "global_step": 60924, "epoch": 1450} {"train_loss": -5.868817329406738, "global_step": 60925, "epoch": 1450} {"train_loss": -5.9302873611450195, "global_step": 60926, "epoch": 1450} {"train_loss": -5.869009971618652, "global_step": 60927, "epoch": 1450} {"train_loss": -5.805553436279297, "global_step": 60928, "epoch": 1450} {"train_loss": -5.989318370819092, "global_step": 60929, "epoch": 1450} {"train_loss": -5.904300689697266, "global_step": 60930, "epoch": 1450} {"train_loss": -5.916692733764648, "global_step": 60931, "epoch": 1450} {"train_loss": -5.810690879821777, "global_step": 60932, "epoch": 1450} {"train_loss": -5.766661643981934, "global_step": 60933, "epoch": 1450} {"train_loss": -6.032650947570801, "global_step": 60934, "epoch": 1450} {"train_loss": -5.9894514083862305, "global_step": 60935, "epoch": 1450} {"train_loss": -6.009913921356201, "global_step": 60936, "epoch": 1450} {"train_loss": -5.927474021911621, "global_step": 60937, "epoch": 1450} {"train_loss": -5.883772373199463, "global_step": 60938, "epoch": 1450} {"train_loss": -5.803837776184082, "global_step": 60939, "epoch": 1450} {"train_loss": -5.94537353515625, "global_step": 60940, "epoch": 1450} {"train_loss": -5.8942635627019975, "global_step": 60941, "epoch": 1450, "train/sim_max_reward_0": 0.7942176063860529, "train/sim_max_reward_1": 0.34185791739649757, "train/sim_max_reward_2": 0.5570807676143433, "train/sim_max_reward_3": 0.16371253915302073, "train/sim_max_reward_4": 0.9079603452663869, "train/sim_max_reward_5": 0.5744625547437809, "test/sim_max_reward_4500000": 0.8775875497895816, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8353988696811643, "test/sim_max_reward_4500003": 0.9180627430474639, "test/sim_max_reward_4500004": 0.06572861799977678, "test/sim_max_reward_4500005": 0.46945825377983547, "test/sim_max_reward_4500006": 0.9096646894272816, "test/sim_max_reward_4500007": 0.8216805483720985, "test/sim_max_reward_4500008": 0.882958608095057, "test/sim_max_reward_4500009": 0.6863293654478263, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 0.7288060935280813, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.38039944682290644, "test/sim_max_reward_4500015": 0.03021306844818846, "test/sim_max_reward_4500016": 0.82630137803382, "test/sim_max_reward_4500017": 0.0004200147066431702, "test/sim_max_reward_4500018": 0.04572241758841444, "test/sim_max_reward_4500019": 0.9722096452286367, "test/sim_max_reward_4500020": 0.0888066224083191, "test/sim_max_reward_4500021": 0.972723236965146, "test/sim_max_reward_4500022": 0.8191774900656631, "test/sim_max_reward_4500023": 0.8815642430286713, "test/sim_max_reward_4500024": 0.8426079054512988, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.921122867547703, "test/sim_max_reward_4500027": 0.5095131864642164, "test/sim_max_reward_4500028": 0.2318690751378077, "test/sim_max_reward_4500029": 0.11288245142822101, "test/sim_max_reward_4500030": 0.8585361906585935, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.07430405347813909, "test/sim_max_reward_4500033": 0.8530443737533346, "test/sim_max_reward_4500034": 0.6987562438814796, "test/sim_max_reward_4500035": 0.9847497130597113, "test/sim_max_reward_4500036": 0.3545594192667713, "test/sim_max_reward_4500037": 0.705764350369426, "test/sim_max_reward_4500038": 0.2884808424514231, "test/sim_max_reward_4500039": 0.9016431438170568, "test/sim_max_reward_4500040": 0.910535148577515, "test/sim_max_reward_4500041": 0.814344552893551, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.39998277258221354, "test/sim_max_reward_4500045": 0.16796040025287975, "test/sim_max_reward_4500046": 0.39285887687180104, "test/sim_max_reward_4500047": 0.8745680358833519, "test/sim_max_reward_4500048": 0.8901779450996024, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5565486217600139, "test/mean_score": 0.5204782819980153, "val_loss": 74202.3984375} {"train_loss": -5.989109992980957, "global_step": 60942, "epoch": 1451} {"train_loss": -5.955695152282715, "global_step": 60943, "epoch": 1451} {"train_loss": -6.043368339538574, "global_step": 60944, "epoch": 1451} {"train_loss": -5.649994850158691, "global_step": 60945, "epoch": 1451} {"train_loss": -5.879678726196289, "global_step": 60946, "epoch": 1451} {"train_loss": -5.933028221130371, "global_step": 60947, "epoch": 1451} {"train_loss": -5.928121566772461, "global_step": 60948, "epoch": 1451} {"train_loss": -5.952041149139404, "global_step": 60949, "epoch": 1451} {"train_loss": -5.951840400695801, "global_step": 60950, "epoch": 1451} {"train_loss": -5.968753337860107, "global_step": 60951, "epoch": 1451} {"train_loss": -5.719463348388672, "global_step": 60952, "epoch": 1451} {"train_loss": -5.851252555847168, "global_step": 60953, "epoch": 1451} {"train_loss": -5.731520175933838, "global_step": 60954, "epoch": 1451} {"train_loss": -5.854265213012695, "global_step": 60955, "epoch": 1451} {"train_loss": -5.870931625366211, "global_step": 60956, "epoch": 1451} {"train_loss": -5.862850189208984, "global_step": 60957, "epoch": 1451} {"train_loss": -5.888590335845947, "global_step": 60958, "epoch": 1451} {"train_loss": -5.886784553527832, "global_step": 60959, "epoch": 1451} {"train_loss": -5.999889850616455, "global_step": 60960, "epoch": 1451} {"train_loss": -5.956543922424316, "global_step": 60961, "epoch": 1451} {"train_loss": -6.001346588134766, "global_step": 60962, "epoch": 1451} {"train_loss": -5.943914413452148, "global_step": 60963, "epoch": 1451} {"train_loss": -5.903682708740234, "global_step": 60964, "epoch": 1451} {"train_loss": -5.80826473236084, "global_step": 60965, "epoch": 1451} {"train_loss": -5.8891119956970215, "global_step": 60966, "epoch": 1451} {"train_loss": -5.931547164916992, "global_step": 60967, "epoch": 1451} {"train_loss": -5.882266521453857, "global_step": 60968, "epoch": 1451} {"train_loss": -5.947124481201172, "global_step": 60969, "epoch": 1451} {"train_loss": -5.8757195472717285, "global_step": 60970, "epoch": 1451} {"train_loss": -5.838323593139648, "global_step": 60971, "epoch": 1451} {"train_loss": -5.911783218383789, "global_step": 60972, "epoch": 1451} {"train_loss": -5.92598819732666, "global_step": 60973, "epoch": 1451} {"train_loss": -5.975418567657471, "global_step": 60974, "epoch": 1451} {"train_loss": -5.8983612060546875, "global_step": 60975, "epoch": 1451} {"train_loss": -5.95577335357666, "global_step": 60976, "epoch": 1451} {"train_loss": -5.858189105987549, "global_step": 60977, "epoch": 1451} {"train_loss": -5.757328510284424, "global_step": 60978, "epoch": 1451} {"train_loss": -5.804237365722656, "global_step": 60979, "epoch": 1451} {"train_loss": -5.899771690368652, "global_step": 60980, "epoch": 1451} {"train_loss": -5.954729080200195, "global_step": 60981, "epoch": 1451} {"train_loss": -5.828325271606445, "global_step": 60982, "epoch": 1451} {"train_loss": -5.895988963899159, "global_step": 60983, "epoch": 1451, "val_loss": 74802.59375} {"train_loss": -5.835230350494385, "global_step": 60984, "epoch": 1452} {"train_loss": -5.805123329162598, "global_step": 60985, "epoch": 1452} {"train_loss": -5.864672660827637, "global_step": 60986, "epoch": 1452} {"train_loss": -5.919045448303223, "global_step": 60987, "epoch": 1452} {"train_loss": -5.841009616851807, "global_step": 60988, "epoch": 1452} {"train_loss": -5.9103546142578125, "global_step": 60989, "epoch": 1452} {"train_loss": -5.767094612121582, "global_step": 60990, "epoch": 1452} {"train_loss": -5.708589553833008, "global_step": 60991, "epoch": 1452} {"train_loss": -5.826951026916504, "global_step": 60992, "epoch": 1452} {"train_loss": -5.755674362182617, "global_step": 60993, "epoch": 1452} {"train_loss": -5.941159248352051, "global_step": 60994, "epoch": 1452} {"train_loss": -6.025979518890381, "global_step": 60995, "epoch": 1452} {"train_loss": -5.956898212432861, "global_step": 60996, "epoch": 1452} {"train_loss": -5.869473934173584, "global_step": 60997, "epoch": 1452} {"train_loss": -5.859795570373535, "global_step": 60998, "epoch": 1452} {"train_loss": -5.897164344787598, "global_step": 60999, "epoch": 1452} {"train_loss": -6.00091552734375, "global_step": 61000, "epoch": 1452} {"train_loss": -6.066005229949951, "global_step": 61001, "epoch": 1452} {"train_loss": -5.852731704711914, "global_step": 61002, "epoch": 1452} {"train_loss": -5.942907333374023, "global_step": 61003, "epoch": 1452} {"train_loss": -5.993396759033203, "global_step": 61004, "epoch": 1452} {"train_loss": -5.83504581451416, "global_step": 61005, "epoch": 1452} {"train_loss": -5.949021339416504, "global_step": 61006, "epoch": 1452} {"train_loss": -5.913568496704102, "global_step": 61007, "epoch": 1452} {"train_loss": -6.004914283752441, "global_step": 61008, "epoch": 1452} {"train_loss": -5.81015682220459, "global_step": 61009, "epoch": 1452} {"train_loss": -5.964788436889648, "global_step": 61010, "epoch": 1452} {"train_loss": -5.975083351135254, "global_step": 61011, "epoch": 1452} {"train_loss": -6.007335662841797, "global_step": 61012, "epoch": 1452} {"train_loss": -5.869174003601074, "global_step": 61013, "epoch": 1452} {"train_loss": -5.999460697174072, "global_step": 61014, "epoch": 1452} {"train_loss": -5.945401191711426, "global_step": 61015, "epoch": 1452} {"train_loss": -5.986369609832764, "global_step": 61016, "epoch": 1452} {"train_loss": -5.963133811950684, "global_step": 61017, "epoch": 1452} {"train_loss": -5.858402252197266, "global_step": 61018, "epoch": 1452} {"train_loss": -5.889509201049805, "global_step": 61019, "epoch": 1452} {"train_loss": -5.890406608581543, "global_step": 61020, "epoch": 1452} {"train_loss": -5.770107269287109, "global_step": 61021, "epoch": 1452} {"train_loss": -5.893117904663086, "global_step": 61022, "epoch": 1452} {"train_loss": -5.870919704437256, "global_step": 61023, "epoch": 1452} {"train_loss": -5.879098415374756, "global_step": 61024, "epoch": 1452} {"train_loss": -5.90302350407555, "global_step": 61025, "epoch": 1452, "val_loss": 74258.8515625} {"train_loss": -6.024991512298584, "global_step": 61026, "epoch": 1453} {"train_loss": -5.967623710632324, "global_step": 61027, "epoch": 1453} {"train_loss": -5.912761211395264, "global_step": 61028, "epoch": 1453} {"train_loss": -5.893406867980957, "global_step": 61029, "epoch": 1453} {"train_loss": -5.967309951782227, "global_step": 61030, "epoch": 1453} {"train_loss": -6.081262588500977, "global_step": 61031, "epoch": 1453} {"train_loss": -5.887053489685059, "global_step": 61032, "epoch": 1453} {"train_loss": -5.997620582580566, "global_step": 61033, "epoch": 1453} {"train_loss": -5.914708137512207, "global_step": 61034, "epoch": 1453} {"train_loss": -5.960432052612305, "global_step": 61035, "epoch": 1453} {"train_loss": -5.923284530639648, "global_step": 61036, "epoch": 1453} {"train_loss": -5.949388027191162, "global_step": 61037, "epoch": 1453} {"train_loss": -6.119511604309082, "global_step": 61038, "epoch": 1453} {"train_loss": -5.8467254638671875, "global_step": 61039, "epoch": 1453} {"train_loss": -6.049222946166992, "global_step": 61040, "epoch": 1453} {"train_loss": -5.954425811767578, "global_step": 61041, "epoch": 1453} {"train_loss": -5.916699409484863, "global_step": 61042, "epoch": 1453} {"train_loss": -5.8630876541137695, "global_step": 61043, "epoch": 1453} {"train_loss": -5.9104905128479, "global_step": 61044, "epoch": 1453} {"train_loss": -5.838091850280762, "global_step": 61045, "epoch": 1453} {"train_loss": -5.959991455078125, "global_step": 61046, "epoch": 1453} {"train_loss": -5.827176094055176, "global_step": 61047, "epoch": 1453} {"train_loss": -5.979755401611328, "global_step": 61048, "epoch": 1453} {"train_loss": -5.877964973449707, "global_step": 61049, "epoch": 1453} {"train_loss": -5.935457229614258, "global_step": 61050, "epoch": 1453} {"train_loss": -5.933849334716797, "global_step": 61051, "epoch": 1453} {"train_loss": -5.9330573081970215, "global_step": 61052, "epoch": 1453} {"train_loss": -5.919539451599121, "global_step": 61053, "epoch": 1453} {"train_loss": -5.765130043029785, "global_step": 61054, "epoch": 1453} {"train_loss": -5.917041301727295, "global_step": 61055, "epoch": 1453} {"train_loss": -5.9948272705078125, "global_step": 61056, "epoch": 1453} {"train_loss": -6.0508880615234375, "global_step": 61057, "epoch": 1453} {"train_loss": -5.949382305145264, "global_step": 61058, "epoch": 1453} {"train_loss": -5.768545627593994, "global_step": 61059, "epoch": 1453} {"train_loss": -5.9876861572265625, "global_step": 61060, "epoch": 1453} {"train_loss": -5.997518539428711, "global_step": 61061, "epoch": 1453} {"train_loss": -5.800990104675293, "global_step": 61062, "epoch": 1453} {"train_loss": -5.874417781829834, "global_step": 61063, "epoch": 1453} {"train_loss": -5.917583465576172, "global_step": 61064, "epoch": 1453} {"train_loss": -5.996232986450195, "global_step": 61065, "epoch": 1453} {"train_loss": -5.881838798522949, "global_step": 61066, "epoch": 1453} {"train_loss": -5.930680865333194, "global_step": 61067, "epoch": 1453, "val_loss": 74312.1953125} {"train_loss": -5.830397605895996, "global_step": 61068, "epoch": 1454} {"train_loss": -6.02461051940918, "global_step": 61069, "epoch": 1454} {"train_loss": -5.953915596008301, "global_step": 61070, "epoch": 1454} {"train_loss": -5.871800422668457, "global_step": 61071, "epoch": 1454} {"train_loss": -5.886008262634277, "global_step": 61072, "epoch": 1454} {"train_loss": -6.01807165145874, "global_step": 61073, "epoch": 1454} {"train_loss": -5.869226455688477, "global_step": 61074, "epoch": 1454} {"train_loss": -5.917189598083496, "global_step": 61075, "epoch": 1454} {"train_loss": -6.007526397705078, "global_step": 61076, "epoch": 1454} {"train_loss": -5.914179801940918, "global_step": 61077, "epoch": 1454} {"train_loss": -5.841214179992676, "global_step": 61078, "epoch": 1454} {"train_loss": -5.827328681945801, "global_step": 61079, "epoch": 1454} {"train_loss": -5.878615856170654, "global_step": 61080, "epoch": 1454} {"train_loss": -5.963739395141602, "global_step": 61081, "epoch": 1454} {"train_loss": -5.984875679016113, "global_step": 61082, "epoch": 1454} {"train_loss": -5.936490058898926, "global_step": 61083, "epoch": 1454} {"train_loss": -5.952497482299805, "global_step": 61084, "epoch": 1454} {"train_loss": -5.978952407836914, "global_step": 61085, "epoch": 1454} {"train_loss": -5.898298263549805, "global_step": 61086, "epoch": 1454} {"train_loss": -5.9248738288879395, "global_step": 61087, "epoch": 1454} {"train_loss": -6.00871467590332, "global_step": 61088, "epoch": 1454} {"train_loss": -5.925266265869141, "global_step": 61089, "epoch": 1454} {"train_loss": -6.04796028137207, "global_step": 61090, "epoch": 1454} {"train_loss": -6.018930435180664, "global_step": 61091, "epoch": 1454} {"train_loss": -5.912670135498047, "global_step": 61092, "epoch": 1454} {"train_loss": -5.925070762634277, "global_step": 61093, "epoch": 1454} {"train_loss": -5.830820083618164, "global_step": 61094, "epoch": 1454} {"train_loss": -5.963173866271973, "global_step": 61095, "epoch": 1454} {"train_loss": -5.841316223144531, "global_step": 61096, "epoch": 1454} {"train_loss": -5.941307067871094, "global_step": 61097, "epoch": 1454} {"train_loss": -5.811742782592773, "global_step": 61098, "epoch": 1454} {"train_loss": -5.893999099731445, "global_step": 61099, "epoch": 1454} {"train_loss": -6.068395614624023, "global_step": 61100, "epoch": 1454} {"train_loss": -5.9363932609558105, "global_step": 61101, "epoch": 1454} {"train_loss": -5.826672554016113, "global_step": 61102, "epoch": 1454} {"train_loss": -5.864409923553467, "global_step": 61103, "epoch": 1454} {"train_loss": -5.866025447845459, "global_step": 61104, "epoch": 1454} {"train_loss": -5.880119800567627, "global_step": 61105, "epoch": 1454} {"train_loss": -5.857751846313477, "global_step": 61106, "epoch": 1454} {"train_loss": -5.849551200866699, "global_step": 61107, "epoch": 1454} {"train_loss": -5.9190168380737305, "global_step": 61108, "epoch": 1454} {"train_loss": -5.917035375322614, "global_step": 61109, "epoch": 1454, "val_loss": 74629.3359375} {"train_loss": -5.793489456176758, "global_step": 61110, "epoch": 1455} {"train_loss": -5.98197603225708, "global_step": 61111, "epoch": 1455} {"train_loss": -6.027409553527832, "global_step": 61112, "epoch": 1455} {"train_loss": -5.921642303466797, "global_step": 61113, "epoch": 1455} {"train_loss": -6.0598673820495605, "global_step": 61114, "epoch": 1455} {"train_loss": -5.9482421875, "global_step": 61115, "epoch": 1455} {"train_loss": -5.8743205070495605, "global_step": 61116, "epoch": 1455} {"train_loss": -5.765867233276367, "global_step": 61117, "epoch": 1455} {"train_loss": -5.939435958862305, "global_step": 61118, "epoch": 1455} {"train_loss": -5.843116760253906, "global_step": 61119, "epoch": 1455} {"train_loss": -5.92723274230957, "global_step": 61120, "epoch": 1455} {"train_loss": -5.893269062042236, "global_step": 61121, "epoch": 1455} {"train_loss": -5.982120513916016, "global_step": 61122, "epoch": 1455} {"train_loss": -5.6861491203308105, "global_step": 61123, "epoch": 1455} {"train_loss": -5.950627326965332, "global_step": 61124, "epoch": 1455} {"train_loss": -5.951754570007324, "global_step": 61125, "epoch": 1455} {"train_loss": -5.944123268127441, "global_step": 61126, "epoch": 1455} {"train_loss": -5.916043281555176, "global_step": 61127, "epoch": 1455} {"train_loss": -5.9192891120910645, "global_step": 61128, "epoch": 1455} {"train_loss": -5.889191627502441, "global_step": 61129, "epoch": 1455} {"train_loss": -5.864031791687012, "global_step": 61130, "epoch": 1455} {"train_loss": -5.935146331787109, "global_step": 61131, "epoch": 1455} {"train_loss": -5.846705436706543, "global_step": 61132, "epoch": 1455} {"train_loss": -5.83298397064209, "global_step": 61133, "epoch": 1455} {"train_loss": -6.037019729614258, "global_step": 61134, "epoch": 1455} {"train_loss": -5.883106231689453, "global_step": 61135, "epoch": 1455} {"train_loss": -5.961260795593262, "global_step": 61136, "epoch": 1455} {"train_loss": -5.7888407707214355, "global_step": 61137, "epoch": 1455} {"train_loss": -5.7842183113098145, "global_step": 61138, "epoch": 1455} {"train_loss": -5.85087776184082, "global_step": 61139, "epoch": 1455} {"train_loss": -5.822787761688232, "global_step": 61140, "epoch": 1455} {"train_loss": -5.903141498565674, "global_step": 61141, "epoch": 1455} {"train_loss": -5.891698360443115, "global_step": 61142, "epoch": 1455} {"train_loss": -5.891142845153809, "global_step": 61143, "epoch": 1455} {"train_loss": -5.958950042724609, "global_step": 61144, "epoch": 1455} {"train_loss": -5.861364364624023, "global_step": 61145, "epoch": 1455} {"train_loss": -5.993037223815918, "global_step": 61146, "epoch": 1455} {"train_loss": -5.84031343460083, "global_step": 61147, "epoch": 1455} {"train_loss": -5.896001815795898, "global_step": 61148, "epoch": 1455} {"train_loss": -5.88754415512085, "global_step": 61149, "epoch": 1455} {"train_loss": -5.72554874420166, "global_step": 61150, "epoch": 1455} {"train_loss": -5.895774160112653, "global_step": 61151, "epoch": 1455, "val_loss": 74652.8359375} {"train_loss": -5.932387351989746, "global_step": 61152, "epoch": 1456} {"train_loss": -5.941649436950684, "global_step": 61153, "epoch": 1456} {"train_loss": -6.02336311340332, "global_step": 61154, "epoch": 1456} {"train_loss": -6.030908584594727, "global_step": 61155, "epoch": 1456} {"train_loss": -5.958505630493164, "global_step": 61156, "epoch": 1456} {"train_loss": -5.947542190551758, "global_step": 61157, "epoch": 1456} {"train_loss": -5.818310737609863, "global_step": 61158, "epoch": 1456} {"train_loss": -6.072140693664551, "global_step": 61159, "epoch": 1456} {"train_loss": -5.951845169067383, "global_step": 61160, "epoch": 1456} {"train_loss": -5.871341705322266, "global_step": 61161, "epoch": 1456} {"train_loss": -6.058002471923828, "global_step": 61162, "epoch": 1456} {"train_loss": -5.966022491455078, "global_step": 61163, "epoch": 1456} {"train_loss": -5.972029685974121, "global_step": 61164, "epoch": 1456} {"train_loss": -5.907993793487549, "global_step": 61165, "epoch": 1456} {"train_loss": -5.931720733642578, "global_step": 61166, "epoch": 1456} {"train_loss": -5.996815204620361, "global_step": 61167, "epoch": 1456} {"train_loss": -5.859979152679443, "global_step": 61168, "epoch": 1456} {"train_loss": -5.820553779602051, "global_step": 61169, "epoch": 1456} {"train_loss": -5.840458869934082, "global_step": 61170, "epoch": 1456} {"train_loss": -5.912532806396484, "global_step": 61171, "epoch": 1456} {"train_loss": -5.765545845031738, "global_step": 61172, "epoch": 1456} {"train_loss": -5.814020156860352, "global_step": 61173, "epoch": 1456} {"train_loss": -5.787844657897949, "global_step": 61174, "epoch": 1456} {"train_loss": -5.834832668304443, "global_step": 61175, "epoch": 1456} {"train_loss": -5.836062908172607, "global_step": 61176, "epoch": 1456} {"train_loss": -5.8822126388549805, "global_step": 61177, "epoch": 1456} {"train_loss": -5.8552446365356445, "global_step": 61178, "epoch": 1456} {"train_loss": -5.978862285614014, "global_step": 61179, "epoch": 1456} {"train_loss": -5.833432197570801, "global_step": 61180, "epoch": 1456} {"train_loss": -5.88864803314209, "global_step": 61181, "epoch": 1456} {"train_loss": -5.930994987487793, "global_step": 61182, "epoch": 1456} {"train_loss": -5.94280481338501, "global_step": 61183, "epoch": 1456} {"train_loss": -5.948944091796875, "global_step": 61184, "epoch": 1456} {"train_loss": -5.9657440185546875, "global_step": 61185, "epoch": 1456} {"train_loss": -5.909177780151367, "global_step": 61186, "epoch": 1456} {"train_loss": -5.8726630210876465, "global_step": 61187, "epoch": 1456} {"train_loss": -5.997879505157471, "global_step": 61188, "epoch": 1456} {"train_loss": -5.908534049987793, "global_step": 61189, "epoch": 1456} {"train_loss": -5.942227363586426, "global_step": 61190, "epoch": 1456} {"train_loss": -5.929666519165039, "global_step": 61191, "epoch": 1456} {"train_loss": -5.903226375579834, "global_step": 61192, "epoch": 1456} {"train_loss": -5.915181841169085, "global_step": 61193, "epoch": 1456, "val_loss": 74324.1015625} {"train_loss": -5.917200088500977, "global_step": 61194, "epoch": 1457} {"train_loss": -5.99655818939209, "global_step": 61195, "epoch": 1457} {"train_loss": -5.863065719604492, "global_step": 61196, "epoch": 1457} {"train_loss": -5.8459882736206055, "global_step": 61197, "epoch": 1457} {"train_loss": -5.833981037139893, "global_step": 61198, "epoch": 1457} {"train_loss": -5.867781162261963, "global_step": 61199, "epoch": 1457} {"train_loss": -5.771380424499512, "global_step": 61200, "epoch": 1457} {"train_loss": -5.913576126098633, "global_step": 61201, "epoch": 1457} {"train_loss": -5.834723472595215, "global_step": 61202, "epoch": 1457} {"train_loss": -5.824087142944336, "global_step": 61203, "epoch": 1457} {"train_loss": -5.927206516265869, "global_step": 61204, "epoch": 1457} {"train_loss": -5.811028480529785, "global_step": 61205, "epoch": 1457} {"train_loss": -5.908991813659668, "global_step": 61206, "epoch": 1457} {"train_loss": -5.895793914794922, "global_step": 61207, "epoch": 1457} {"train_loss": -5.926731109619141, "global_step": 61208, "epoch": 1457} {"train_loss": -5.864341735839844, "global_step": 61209, "epoch": 1457} {"train_loss": -5.872928619384766, "global_step": 61210, "epoch": 1457} {"train_loss": -5.913052558898926, "global_step": 61211, "epoch": 1457} {"train_loss": -5.911336898803711, "global_step": 61212, "epoch": 1457} {"train_loss": -6.016143798828125, "global_step": 61213, "epoch": 1457} {"train_loss": -6.05490255355835, "global_step": 61214, "epoch": 1457} {"train_loss": -5.9638519287109375, "global_step": 61215, "epoch": 1457} {"train_loss": -5.83955192565918, "global_step": 61216, "epoch": 1457} {"train_loss": -5.900067329406738, "global_step": 61217, "epoch": 1457} {"train_loss": -6.031620025634766, "global_step": 61218, "epoch": 1457} {"train_loss": -5.843265533447266, "global_step": 61219, "epoch": 1457} {"train_loss": -5.932823181152344, "global_step": 61220, "epoch": 1457} {"train_loss": -5.927434921264648, "global_step": 61221, "epoch": 1457} {"train_loss": -5.946957111358643, "global_step": 61222, "epoch": 1457} {"train_loss": -6.013790130615234, "global_step": 61223, "epoch": 1457} {"train_loss": -6.025571823120117, "global_step": 61224, "epoch": 1457} {"train_loss": -5.897611141204834, "global_step": 61225, "epoch": 1457} {"train_loss": -6.067926406860352, "global_step": 61226, "epoch": 1457} {"train_loss": -5.905402183532715, "global_step": 61227, "epoch": 1457} {"train_loss": -5.931430816650391, "global_step": 61228, "epoch": 1457} {"train_loss": -5.999307632446289, "global_step": 61229, "epoch": 1457} {"train_loss": -5.907773017883301, "global_step": 61230, "epoch": 1457} {"train_loss": -5.87063455581665, "global_step": 61231, "epoch": 1457} {"train_loss": -5.949001312255859, "global_step": 61232, "epoch": 1457} {"train_loss": -5.878393650054932, "global_step": 61233, "epoch": 1457} {"train_loss": -5.968292236328125, "global_step": 61234, "epoch": 1457} {"train_loss": -5.918135643005371, "global_step": 61235, "epoch": 1457, "val_loss": 74284.2578125} {"train_loss": -6.044310569763184, "global_step": 61236, "epoch": 1458} {"train_loss": -5.808444499969482, "global_step": 61237, "epoch": 1458} {"train_loss": -5.876657485961914, "global_step": 61238, "epoch": 1458} {"train_loss": -5.895859241485596, "global_step": 61239, "epoch": 1458} {"train_loss": -5.902651786804199, "global_step": 61240, "epoch": 1458} {"train_loss": -5.940068244934082, "global_step": 61241, "epoch": 1458} {"train_loss": -5.926812648773193, "global_step": 61242, "epoch": 1458} {"train_loss": -5.917388439178467, "global_step": 61243, "epoch": 1458} {"train_loss": -5.838716506958008, "global_step": 61244, "epoch": 1458} {"train_loss": -6.006951332092285, "global_step": 61245, "epoch": 1458} {"train_loss": -5.863638401031494, "global_step": 61246, "epoch": 1458} {"train_loss": -5.893162727355957, "global_step": 61247, "epoch": 1458} {"train_loss": -5.905019283294678, "global_step": 61248, "epoch": 1458} {"train_loss": -5.826928615570068, "global_step": 61249, "epoch": 1458} {"train_loss": -5.8827009201049805, "global_step": 61250, "epoch": 1458} {"train_loss": -5.9473772048950195, "global_step": 61251, "epoch": 1458} {"train_loss": -5.945718288421631, "global_step": 61252, "epoch": 1458} {"train_loss": -5.898151397705078, "global_step": 61253, "epoch": 1458} {"train_loss": -5.834267616271973, "global_step": 61254, "epoch": 1458} {"train_loss": -5.861132621765137, "global_step": 61255, "epoch": 1458} {"train_loss": -5.971418380737305, "global_step": 61256, "epoch": 1458} {"train_loss": -5.795107841491699, "global_step": 61257, "epoch": 1458} {"train_loss": -5.841180801391602, "global_step": 61258, "epoch": 1458} {"train_loss": -5.872219085693359, "global_step": 61259, "epoch": 1458} {"train_loss": -5.931985378265381, "global_step": 61260, "epoch": 1458} {"train_loss": -6.019417762756348, "global_step": 61261, "epoch": 1458} {"train_loss": -5.915408134460449, "global_step": 61262, "epoch": 1458} {"train_loss": -5.978482246398926, "global_step": 61263, "epoch": 1458} {"train_loss": -5.972338676452637, "global_step": 61264, "epoch": 1458} {"train_loss": -5.920678615570068, "global_step": 61265, "epoch": 1458} {"train_loss": -5.868991851806641, "global_step": 61266, "epoch": 1458} {"train_loss": -5.88862419128418, "global_step": 61267, "epoch": 1458} {"train_loss": -5.95379638671875, "global_step": 61268, "epoch": 1458} {"train_loss": -5.787520408630371, "global_step": 61269, "epoch": 1458} {"train_loss": -5.891160488128662, "global_step": 61270, "epoch": 1458} {"train_loss": -5.848255157470703, "global_step": 61271, "epoch": 1458} {"train_loss": -5.770552635192871, "global_step": 61272, "epoch": 1458} {"train_loss": -5.95391321182251, "global_step": 61273, "epoch": 1458} {"train_loss": -5.907866477966309, "global_step": 61274, "epoch": 1458} {"train_loss": -5.992948532104492, "global_step": 61275, "epoch": 1458} {"train_loss": -5.891162395477295, "global_step": 61276, "epoch": 1458} {"train_loss": -5.901356969560895, "global_step": 61277, "epoch": 1458, "val_loss": 74404.90625} {"train_loss": -6.007478713989258, "global_step": 61278, "epoch": 1459} {"train_loss": -6.061519622802734, "global_step": 61279, "epoch": 1459} {"train_loss": -6.008792400360107, "global_step": 61280, "epoch": 1459} {"train_loss": -5.9778523445129395, "global_step": 61281, "epoch": 1459} {"train_loss": -5.9566497802734375, "global_step": 61282, "epoch": 1459} {"train_loss": -5.992247581481934, "global_step": 61283, "epoch": 1459} {"train_loss": -5.92218542098999, "global_step": 61284, "epoch": 1459} {"train_loss": -5.877400875091553, "global_step": 61285, "epoch": 1459} {"train_loss": -6.010861396789551, "global_step": 61286, "epoch": 1459} {"train_loss": -5.879399299621582, "global_step": 61287, "epoch": 1459} {"train_loss": -5.943610191345215, "global_step": 61288, "epoch": 1459} {"train_loss": -6.019848823547363, "global_step": 61289, "epoch": 1459} {"train_loss": -5.817126750946045, "global_step": 61290, "epoch": 1459} {"train_loss": -5.9522199630737305, "global_step": 61291, "epoch": 1459} {"train_loss": -5.851895809173584, "global_step": 61292, "epoch": 1459} {"train_loss": -5.92674446105957, "global_step": 61293, "epoch": 1459} {"train_loss": -5.876720428466797, "global_step": 61294, "epoch": 1459} {"train_loss": -5.786462783813477, "global_step": 61295, "epoch": 1459} {"train_loss": -5.945296287536621, "global_step": 61296, "epoch": 1459} {"train_loss": -5.7558274269104, "global_step": 61297, "epoch": 1459} {"train_loss": -5.837810516357422, "global_step": 61298, "epoch": 1459} {"train_loss": -5.809289932250977, "global_step": 61299, "epoch": 1459} {"train_loss": -5.854969024658203, "global_step": 61300, "epoch": 1459} {"train_loss": -5.738332748413086, "global_step": 61301, "epoch": 1459} {"train_loss": -5.923727512359619, "global_step": 61302, "epoch": 1459} {"train_loss": -5.7528252601623535, "global_step": 61303, "epoch": 1459} {"train_loss": -5.8456597328186035, "global_step": 61304, "epoch": 1459} {"train_loss": -5.979016304016113, "global_step": 61305, "epoch": 1459} {"train_loss": -5.737843036651611, "global_step": 61306, "epoch": 1459} {"train_loss": -5.7652764320373535, "global_step": 61307, "epoch": 1459} {"train_loss": -5.779603481292725, "global_step": 61308, "epoch": 1459} {"train_loss": -5.901034832000732, "global_step": 61309, "epoch": 1459} {"train_loss": -5.871274471282959, "global_step": 61310, "epoch": 1459} {"train_loss": -5.816961288452148, "global_step": 61311, "epoch": 1459} {"train_loss": -5.8342695236206055, "global_step": 61312, "epoch": 1459} {"train_loss": -5.858670234680176, "global_step": 61313, "epoch": 1459} {"train_loss": -5.955471992492676, "global_step": 61314, "epoch": 1459} {"train_loss": -5.976238250732422, "global_step": 61315, "epoch": 1459} {"train_loss": -5.956488609313965, "global_step": 61316, "epoch": 1459} {"train_loss": -5.918858528137207, "global_step": 61317, "epoch": 1459} {"train_loss": -5.934395790100098, "global_step": 61318, "epoch": 1459} {"train_loss": -5.893609932490757, "global_step": 61319, "epoch": 1459, "val_loss": 74297.4375} {"train_loss": -5.81447172164917, "global_step": 61320, "epoch": 1460} {"train_loss": -6.018470764160156, "global_step": 61321, "epoch": 1460} {"train_loss": -5.85828161239624, "global_step": 61322, "epoch": 1460} {"train_loss": -5.975454330444336, "global_step": 61323, "epoch": 1460} {"train_loss": -5.871657371520996, "global_step": 61324, "epoch": 1460} {"train_loss": -5.938496112823486, "global_step": 61325, "epoch": 1460} {"train_loss": -5.8816375732421875, "global_step": 61326, "epoch": 1460} {"train_loss": -5.896412372589111, "global_step": 61327, "epoch": 1460} {"train_loss": -5.876649856567383, "global_step": 61328, "epoch": 1460} {"train_loss": -5.998391151428223, "global_step": 61329, "epoch": 1460} {"train_loss": -5.8531599044799805, "global_step": 61330, "epoch": 1460} {"train_loss": -5.78400993347168, "global_step": 61331, "epoch": 1460} {"train_loss": -5.874565601348877, "global_step": 61332, "epoch": 1460} {"train_loss": -5.845365524291992, "global_step": 61333, "epoch": 1460} {"train_loss": -5.909388542175293, "global_step": 61334, "epoch": 1460} {"train_loss": -5.930925369262695, "global_step": 61335, "epoch": 1460} {"train_loss": -6.016880512237549, "global_step": 61336, "epoch": 1460} {"train_loss": -5.9592180252075195, "global_step": 61337, "epoch": 1460} {"train_loss": -5.867999076843262, "global_step": 61338, "epoch": 1460} {"train_loss": -5.869344234466553, "global_step": 61339, "epoch": 1460} {"train_loss": -5.777440071105957, "global_step": 61340, "epoch": 1460} {"train_loss": -5.828723907470703, "global_step": 61341, "epoch": 1460} {"train_loss": -5.871407508850098, "global_step": 61342, "epoch": 1460} {"train_loss": -5.903289318084717, "global_step": 61343, "epoch": 1460} {"train_loss": -5.842668533325195, "global_step": 61344, "epoch": 1460} {"train_loss": -5.981332778930664, "global_step": 61345, "epoch": 1460} {"train_loss": -5.782552242279053, "global_step": 61346, "epoch": 1460} {"train_loss": -5.815195083618164, "global_step": 61347, "epoch": 1460} {"train_loss": -5.850655555725098, "global_step": 61348, "epoch": 1460} {"train_loss": -5.832037925720215, "global_step": 61349, "epoch": 1460} {"train_loss": -5.902260780334473, "global_step": 61350, "epoch": 1460} {"train_loss": -5.845719814300537, "global_step": 61351, "epoch": 1460} {"train_loss": -5.781200885772705, "global_step": 61352, "epoch": 1460} {"train_loss": -5.883768081665039, "global_step": 61353, "epoch": 1460} {"train_loss": -5.92613410949707, "global_step": 61354, "epoch": 1460} {"train_loss": -5.987185478210449, "global_step": 61355, "epoch": 1460} {"train_loss": -5.976578712463379, "global_step": 61356, "epoch": 1460} {"train_loss": -5.960554122924805, "global_step": 61357, "epoch": 1460} {"train_loss": -5.810874938964844, "global_step": 61358, "epoch": 1460} {"train_loss": -5.886845588684082, "global_step": 61359, "epoch": 1460} {"train_loss": -5.83198356628418, "global_step": 61360, "epoch": 1460} {"train_loss": -5.889034191767375, "global_step": 61361, "epoch": 1460, "val_loss": 75102.40625} {"train_loss": -5.854813575744629, "global_step": 61362, "epoch": 1461} {"train_loss": -5.917239189147949, "global_step": 61363, "epoch": 1461} {"train_loss": -5.831009864807129, "global_step": 61364, "epoch": 1461} {"train_loss": -5.926801681518555, "global_step": 61365, "epoch": 1461} {"train_loss": -5.891387939453125, "global_step": 61366, "epoch": 1461} {"train_loss": -5.9047441482543945, "global_step": 61367, "epoch": 1461} {"train_loss": -5.904626369476318, "global_step": 61368, "epoch": 1461} {"train_loss": -5.7997283935546875, "global_step": 61369, "epoch": 1461} {"train_loss": -6.013656139373779, "global_step": 61370, "epoch": 1461} {"train_loss": -6.007621765136719, "global_step": 61371, "epoch": 1461} {"train_loss": -5.861183166503906, "global_step": 61372, "epoch": 1461} {"train_loss": -5.975070953369141, "global_step": 61373, "epoch": 1461} {"train_loss": -5.9065423011779785, "global_step": 61374, "epoch": 1461} {"train_loss": -5.892176628112793, "global_step": 61375, "epoch": 1461} {"train_loss": -5.998012065887451, "global_step": 61376, "epoch": 1461} {"train_loss": -5.817718029022217, "global_step": 61377, "epoch": 1461} {"train_loss": -5.924019813537598, "global_step": 61378, "epoch": 1461} {"train_loss": -6.03770112991333, "global_step": 61379, "epoch": 1461} {"train_loss": -5.877919673919678, "global_step": 61380, "epoch": 1461} {"train_loss": -5.760000228881836, "global_step": 61381, "epoch": 1461} {"train_loss": -5.904730319976807, "global_step": 61382, "epoch": 1461} {"train_loss": -5.858025550842285, "global_step": 61383, "epoch": 1461} {"train_loss": -5.784089088439941, "global_step": 61384, "epoch": 1461} {"train_loss": -5.82861328125, "global_step": 61385, "epoch": 1461} {"train_loss": -5.8725152015686035, "global_step": 61386, "epoch": 1461} {"train_loss": -5.875338554382324, "global_step": 61387, "epoch": 1461} {"train_loss": -5.946974754333496, "global_step": 61388, "epoch": 1461} {"train_loss": -5.862496376037598, "global_step": 61389, "epoch": 1461} {"train_loss": -5.942212104797363, "global_step": 61390, "epoch": 1461} {"train_loss": -5.853522300720215, "global_step": 61391, "epoch": 1461} {"train_loss": -5.898049831390381, "global_step": 61392, "epoch": 1461} {"train_loss": -5.821611404418945, "global_step": 61393, "epoch": 1461} {"train_loss": -5.9259114265441895, "global_step": 61394, "epoch": 1461} {"train_loss": -5.780665874481201, "global_step": 61395, "epoch": 1461} {"train_loss": -5.860850811004639, "global_step": 61396, "epoch": 1461} {"train_loss": -5.926385402679443, "global_step": 61397, "epoch": 1461} {"train_loss": -5.891328811645508, "global_step": 61398, "epoch": 1461} {"train_loss": -5.814184665679932, "global_step": 61399, "epoch": 1461} {"train_loss": -5.703807830810547, "global_step": 61400, "epoch": 1461} {"train_loss": -5.844688415527344, "global_step": 61401, "epoch": 1461} {"train_loss": -5.863162994384766, "global_step": 61402, "epoch": 1461} {"train_loss": -5.881241298857189, "global_step": 61403, "epoch": 1461, "val_loss": 75288.6875} {"train_loss": -5.935393333435059, "global_step": 61404, "epoch": 1462} {"train_loss": -5.829440116882324, "global_step": 61405, "epoch": 1462} {"train_loss": -6.015875339508057, "global_step": 61406, "epoch": 1462} {"train_loss": -5.891951560974121, "global_step": 61407, "epoch": 1462} {"train_loss": -6.001727104187012, "global_step": 61408, "epoch": 1462} {"train_loss": -5.814672470092773, "global_step": 61409, "epoch": 1462} {"train_loss": -5.836180686950684, "global_step": 61410, "epoch": 1462} {"train_loss": -6.102257251739502, "global_step": 61411, "epoch": 1462} {"train_loss": -5.829934120178223, "global_step": 61412, "epoch": 1462} {"train_loss": -5.951075553894043, "global_step": 61413, "epoch": 1462} {"train_loss": -5.845889091491699, "global_step": 61414, "epoch": 1462} {"train_loss": -5.846550941467285, "global_step": 61415, "epoch": 1462} {"train_loss": -5.715579986572266, "global_step": 61416, "epoch": 1462} {"train_loss": -5.952530384063721, "global_step": 61417, "epoch": 1462} {"train_loss": -5.754907608032227, "global_step": 61418, "epoch": 1462} {"train_loss": -5.811387062072754, "global_step": 61419, "epoch": 1462} {"train_loss": -6.011331081390381, "global_step": 61420, "epoch": 1462} {"train_loss": -5.724394798278809, "global_step": 61421, "epoch": 1462} {"train_loss": -6.002506256103516, "global_step": 61422, "epoch": 1462} {"train_loss": -5.9132819175720215, "global_step": 61423, "epoch": 1462} {"train_loss": -5.774510383605957, "global_step": 61424, "epoch": 1462} {"train_loss": -5.7762451171875, "global_step": 61425, "epoch": 1462} {"train_loss": -5.943436145782471, "global_step": 61426, "epoch": 1462} {"train_loss": -5.729855537414551, "global_step": 61427, "epoch": 1462} {"train_loss": -5.902101993560791, "global_step": 61428, "epoch": 1462} {"train_loss": -5.84101676940918, "global_step": 61429, "epoch": 1462} {"train_loss": -5.86710262298584, "global_step": 61430, "epoch": 1462} {"train_loss": -5.759181499481201, "global_step": 61431, "epoch": 1462} {"train_loss": -5.638971328735352, "global_step": 61432, "epoch": 1462} {"train_loss": -5.8525190353393555, "global_step": 61433, "epoch": 1462} {"train_loss": -5.790911674499512, "global_step": 61434, "epoch": 1462} {"train_loss": -5.858009338378906, "global_step": 61435, "epoch": 1462} {"train_loss": -5.843538284301758, "global_step": 61436, "epoch": 1462} {"train_loss": -5.887800216674805, "global_step": 61437, "epoch": 1462} {"train_loss": -5.724770545959473, "global_step": 61438, "epoch": 1462} {"train_loss": -5.884186744689941, "global_step": 61439, "epoch": 1462} {"train_loss": -5.861871719360352, "global_step": 61440, "epoch": 1462} {"train_loss": -5.848325729370117, "global_step": 61441, "epoch": 1462} {"train_loss": -5.882110595703125, "global_step": 61442, "epoch": 1462} {"train_loss": -5.876654624938965, "global_step": 61443, "epoch": 1462} {"train_loss": -5.861204147338867, "global_step": 61444, "epoch": 1462} {"train_loss": -5.858915726343791, "global_step": 61445, "epoch": 1462, "val_loss": 74503.328125} {"train_loss": -5.898989200592041, "global_step": 61446, "epoch": 1463} {"train_loss": -5.964607238769531, "global_step": 61447, "epoch": 1463} {"train_loss": -5.900297164916992, "global_step": 61448, "epoch": 1463} {"train_loss": -5.897031784057617, "global_step": 61449, "epoch": 1463} {"train_loss": -5.843377113342285, "global_step": 61450, "epoch": 1463} {"train_loss": -6.068902969360352, "global_step": 61451, "epoch": 1463} {"train_loss": -5.892265319824219, "global_step": 61452, "epoch": 1463} {"train_loss": -5.922152519226074, "global_step": 61453, "epoch": 1463} {"train_loss": -5.96100378036499, "global_step": 61454, "epoch": 1463} {"train_loss": -5.9027814865112305, "global_step": 61455, "epoch": 1463} {"train_loss": -5.814992904663086, "global_step": 61456, "epoch": 1463} {"train_loss": -5.896365165710449, "global_step": 61457, "epoch": 1463} {"train_loss": -5.856048107147217, "global_step": 61458, "epoch": 1463} {"train_loss": -5.878516674041748, "global_step": 61459, "epoch": 1463} {"train_loss": -6.003589153289795, "global_step": 61460, "epoch": 1463} {"train_loss": -5.87956428527832, "global_step": 61461, "epoch": 1463} {"train_loss": -5.9846906661987305, "global_step": 61462, "epoch": 1463} {"train_loss": -6.038155555725098, "global_step": 61463, "epoch": 1463} {"train_loss": -5.903285980224609, "global_step": 61464, "epoch": 1463} {"train_loss": -5.895180702209473, "global_step": 61465, "epoch": 1463} {"train_loss": -5.866007328033447, "global_step": 61466, "epoch": 1463} {"train_loss": -5.941183567047119, "global_step": 61467, "epoch": 1463} {"train_loss": -5.8418426513671875, "global_step": 61468, "epoch": 1463} {"train_loss": -5.947359561920166, "global_step": 61469, "epoch": 1463} {"train_loss": -5.979188919067383, "global_step": 61470, "epoch": 1463} {"train_loss": -5.818195343017578, "global_step": 61471, "epoch": 1463} {"train_loss": -5.895892143249512, "global_step": 61472, "epoch": 1463} {"train_loss": -6.0327863693237305, "global_step": 61473, "epoch": 1463} {"train_loss": -5.894847869873047, "global_step": 61474, "epoch": 1463} {"train_loss": -5.991462230682373, "global_step": 61475, "epoch": 1463} {"train_loss": -5.926692962646484, "global_step": 61476, "epoch": 1463} {"train_loss": -5.767642974853516, "global_step": 61477, "epoch": 1463} {"train_loss": -5.903226852416992, "global_step": 61478, "epoch": 1463} {"train_loss": -5.977103233337402, "global_step": 61479, "epoch": 1463} {"train_loss": -6.069230079650879, "global_step": 61480, "epoch": 1463} {"train_loss": -5.831766605377197, "global_step": 61481, "epoch": 1463} {"train_loss": -6.001987457275391, "global_step": 61482, "epoch": 1463} {"train_loss": -5.950503349304199, "global_step": 61483, "epoch": 1463} {"train_loss": -5.94864559173584, "global_step": 61484, "epoch": 1463} {"train_loss": -5.894776821136475, "global_step": 61485, "epoch": 1463} {"train_loss": -6.061277866363525, "global_step": 61486, "epoch": 1463} {"train_loss": -5.926530769893101, "global_step": 61487, "epoch": 1463, "val_loss": 74769.8984375} {"train_loss": -5.871190547943115, "global_step": 61488, "epoch": 1464} {"train_loss": -6.086999893188477, "global_step": 61489, "epoch": 1464} {"train_loss": -5.909271717071533, "global_step": 61490, "epoch": 1464} {"train_loss": -5.999570369720459, "global_step": 61491, "epoch": 1464} {"train_loss": -6.0215253829956055, "global_step": 61492, "epoch": 1464} {"train_loss": -5.908637523651123, "global_step": 61493, "epoch": 1464} {"train_loss": -5.971181869506836, "global_step": 61494, "epoch": 1464} {"train_loss": -5.953747749328613, "global_step": 61495, "epoch": 1464} {"train_loss": -5.6970014572143555, "global_step": 61496, "epoch": 1464} {"train_loss": -5.895637512207031, "global_step": 61497, "epoch": 1464} {"train_loss": -6.012940406799316, "global_step": 61498, "epoch": 1464} {"train_loss": -5.789402961730957, "global_step": 61499, "epoch": 1464} {"train_loss": -5.827328205108643, "global_step": 61500, "epoch": 1464} {"train_loss": -5.90841817855835, "global_step": 61501, "epoch": 1464} {"train_loss": -5.799853801727295, "global_step": 61502, "epoch": 1464} {"train_loss": -5.94361686706543, "global_step": 61503, "epoch": 1464} {"train_loss": -5.935863971710205, "global_step": 61504, "epoch": 1464} {"train_loss": -5.947354316711426, "global_step": 61505, "epoch": 1464} {"train_loss": -5.829333782196045, "global_step": 61506, "epoch": 1464} {"train_loss": -5.847213268280029, "global_step": 61507, "epoch": 1464} {"train_loss": -5.930759906768799, "global_step": 61508, "epoch": 1464} {"train_loss": -5.9959716796875, "global_step": 61509, "epoch": 1464} {"train_loss": -5.7970428466796875, "global_step": 61510, "epoch": 1464} {"train_loss": -6.065613746643066, "global_step": 61511, "epoch": 1464} {"train_loss": -5.734761714935303, "global_step": 61512, "epoch": 1464} {"train_loss": -5.940709590911865, "global_step": 61513, "epoch": 1464} {"train_loss": -5.827097415924072, "global_step": 61514, "epoch": 1464} {"train_loss": -5.806951522827148, "global_step": 61515, "epoch": 1464} {"train_loss": -5.940153121948242, "global_step": 61516, "epoch": 1464} {"train_loss": -5.858048439025879, "global_step": 61517, "epoch": 1464} {"train_loss": -5.8934431076049805, "global_step": 61518, "epoch": 1464} {"train_loss": -5.787456512451172, "global_step": 61519, "epoch": 1464} {"train_loss": -5.9690728187561035, "global_step": 61520, "epoch": 1464} {"train_loss": -5.868105888366699, "global_step": 61521, "epoch": 1464} {"train_loss": -5.950584411621094, "global_step": 61522, "epoch": 1464} {"train_loss": -5.845807075500488, "global_step": 61523, "epoch": 1464} {"train_loss": -5.8573713302612305, "global_step": 61524, "epoch": 1464} {"train_loss": -5.8860650062561035, "global_step": 61525, "epoch": 1464} {"train_loss": -5.923612594604492, "global_step": 61526, "epoch": 1464} {"train_loss": -5.980474472045898, "global_step": 61527, "epoch": 1464} {"train_loss": -5.844511985778809, "global_step": 61528, "epoch": 1464} {"train_loss": -5.897845029830933, "global_step": 61529, "epoch": 1464, "val_loss": 74353.953125} {"train_loss": -5.918971061706543, "global_step": 61530, "epoch": 1465} {"train_loss": -5.9097185134887695, "global_step": 61531, "epoch": 1465} {"train_loss": -5.887823581695557, "global_step": 61532, "epoch": 1465} {"train_loss": -5.886183738708496, "global_step": 61533, "epoch": 1465} {"train_loss": -5.981668472290039, "global_step": 61534, "epoch": 1465} {"train_loss": -5.995923042297363, "global_step": 61535, "epoch": 1465} {"train_loss": -5.878240585327148, "global_step": 61536, "epoch": 1465} {"train_loss": -6.036788463592529, "global_step": 61537, "epoch": 1465} {"train_loss": -5.879011631011963, "global_step": 61538, "epoch": 1465} {"train_loss": -6.013144493103027, "global_step": 61539, "epoch": 1465} {"train_loss": -5.9304304122924805, "global_step": 61540, "epoch": 1465} {"train_loss": -5.901333332061768, "global_step": 61541, "epoch": 1465} {"train_loss": -6.0620503425598145, "global_step": 61542, "epoch": 1465} {"train_loss": -5.985742092132568, "global_step": 61543, "epoch": 1465} {"train_loss": -6.004973411560059, "global_step": 61544, "epoch": 1465} {"train_loss": -5.911255359649658, "global_step": 61545, "epoch": 1465} {"train_loss": -5.941765785217285, "global_step": 61546, "epoch": 1465} {"train_loss": -6.006433486938477, "global_step": 61547, "epoch": 1465} {"train_loss": -5.832493782043457, "global_step": 61548, "epoch": 1465} {"train_loss": -5.898548126220703, "global_step": 61549, "epoch": 1465} {"train_loss": -5.967942714691162, "global_step": 61550, "epoch": 1465} {"train_loss": -5.894964218139648, "global_step": 61551, "epoch": 1465} {"train_loss": -6.0256428718566895, "global_step": 61552, "epoch": 1465} {"train_loss": -5.985997676849365, "global_step": 61553, "epoch": 1465} {"train_loss": -6.0247883796691895, "global_step": 61554, "epoch": 1465} {"train_loss": -5.928210258483887, "global_step": 61555, "epoch": 1465} {"train_loss": -5.84163761138916, "global_step": 61556, "epoch": 1465} {"train_loss": -5.88594913482666, "global_step": 61557, "epoch": 1465} {"train_loss": -5.707701683044434, "global_step": 61558, "epoch": 1465} {"train_loss": -5.966350555419922, "global_step": 61559, "epoch": 1465} {"train_loss": -5.961389541625977, "global_step": 61560, "epoch": 1465} {"train_loss": -5.810580253601074, "global_step": 61561, "epoch": 1465} {"train_loss": -5.912008285522461, "global_step": 61562, "epoch": 1465} {"train_loss": -5.773221015930176, "global_step": 61563, "epoch": 1465} {"train_loss": -5.866028785705566, "global_step": 61564, "epoch": 1465} {"train_loss": -5.792979717254639, "global_step": 61565, "epoch": 1465} {"train_loss": -5.899413108825684, "global_step": 61566, "epoch": 1465} {"train_loss": -5.84168815612793, "global_step": 61567, "epoch": 1465} {"train_loss": -5.942978382110596, "global_step": 61568, "epoch": 1465} {"train_loss": -5.787652492523193, "global_step": 61569, "epoch": 1465} {"train_loss": -5.934839725494385, "global_step": 61570, "epoch": 1465} {"train_loss": -5.9176191829499745, "global_step": 61571, "epoch": 1465, "val_loss": 74357.9453125} {"train_loss": -5.907698154449463, "global_step": 61572, "epoch": 1466} {"train_loss": -5.924877643585205, "global_step": 61573, "epoch": 1466} {"train_loss": -5.881560325622559, "global_step": 61574, "epoch": 1466} {"train_loss": -5.868642330169678, "global_step": 61575, "epoch": 1466} {"train_loss": -5.905502796173096, "global_step": 61576, "epoch": 1466} {"train_loss": -5.963785648345947, "global_step": 61577, "epoch": 1466} {"train_loss": -5.944034099578857, "global_step": 61578, "epoch": 1466} {"train_loss": -5.9740705490112305, "global_step": 61579, "epoch": 1466} {"train_loss": -5.897355079650879, "global_step": 61580, "epoch": 1466} {"train_loss": -5.962277412414551, "global_step": 61581, "epoch": 1466} {"train_loss": -5.945667266845703, "global_step": 61582, "epoch": 1466} {"train_loss": -5.897897720336914, "global_step": 61583, "epoch": 1466} {"train_loss": -5.988513946533203, "global_step": 61584, "epoch": 1466} {"train_loss": -5.89499568939209, "global_step": 61585, "epoch": 1466} {"train_loss": -5.914238452911377, "global_step": 61586, "epoch": 1466} {"train_loss": -5.866378307342529, "global_step": 61587, "epoch": 1466} {"train_loss": -5.935148239135742, "global_step": 61588, "epoch": 1466} {"train_loss": -5.977034568786621, "global_step": 61589, "epoch": 1466} {"train_loss": -5.884425163269043, "global_step": 61590, "epoch": 1466} {"train_loss": -6.0088958740234375, "global_step": 61591, "epoch": 1466} {"train_loss": -5.965577125549316, "global_step": 61592, "epoch": 1466} {"train_loss": -5.840564727783203, "global_step": 61593, "epoch": 1466} {"train_loss": -5.793990612030029, "global_step": 61594, "epoch": 1466} {"train_loss": -5.9712629318237305, "global_step": 61595, "epoch": 1466} {"train_loss": -5.796013832092285, "global_step": 61596, "epoch": 1466} {"train_loss": -5.895078659057617, "global_step": 61597, "epoch": 1466} {"train_loss": -5.990094184875488, "global_step": 61598, "epoch": 1466} {"train_loss": -5.823956489562988, "global_step": 61599, "epoch": 1466} {"train_loss": -5.882567882537842, "global_step": 61600, "epoch": 1466} {"train_loss": -5.956388473510742, "global_step": 61601, "epoch": 1466} {"train_loss": -5.87849235534668, "global_step": 61602, "epoch": 1466} {"train_loss": -5.996638774871826, "global_step": 61603, "epoch": 1466} {"train_loss": -5.838503360748291, "global_step": 61604, "epoch": 1466} {"train_loss": -6.011054992675781, "global_step": 61605, "epoch": 1466} {"train_loss": -5.934993743896484, "global_step": 61606, "epoch": 1466} {"train_loss": -5.9633002281188965, "global_step": 61607, "epoch": 1466} {"train_loss": -5.939148902893066, "global_step": 61608, "epoch": 1466} {"train_loss": -6.096378326416016, "global_step": 61609, "epoch": 1466} {"train_loss": -5.939378261566162, "global_step": 61610, "epoch": 1466} {"train_loss": -5.8704938888549805, "global_step": 61611, "epoch": 1466} {"train_loss": -5.92788028717041, "global_step": 61612, "epoch": 1466} {"train_loss": -5.925206547691708, "global_step": 61613, "epoch": 1466, "val_loss": 74515.390625} {"train_loss": -5.883539199829102, "global_step": 61614, "epoch": 1467} {"train_loss": -5.900256633758545, "global_step": 61615, "epoch": 1467} {"train_loss": -6.068819046020508, "global_step": 61616, "epoch": 1467} {"train_loss": -5.907381057739258, "global_step": 61617, "epoch": 1467} {"train_loss": -5.858309745788574, "global_step": 61618, "epoch": 1467} {"train_loss": -5.925029277801514, "global_step": 61619, "epoch": 1467} {"train_loss": -5.896241664886475, "global_step": 61620, "epoch": 1467} {"train_loss": -5.923619270324707, "global_step": 61621, "epoch": 1467} {"train_loss": -6.082945823669434, "global_step": 61622, "epoch": 1467} {"train_loss": -5.955877304077148, "global_step": 61623, "epoch": 1467} {"train_loss": -5.970022201538086, "global_step": 61624, "epoch": 1467} {"train_loss": -5.7680888175964355, "global_step": 61625, "epoch": 1467} {"train_loss": -6.03948974609375, "global_step": 61626, "epoch": 1467} {"train_loss": -6.028903007507324, "global_step": 61627, "epoch": 1467} {"train_loss": -5.905491828918457, "global_step": 61628, "epoch": 1467} {"train_loss": -5.881341934204102, "global_step": 61629, "epoch": 1467} {"train_loss": -5.978797435760498, "global_step": 61630, "epoch": 1467} {"train_loss": -5.789945602416992, "global_step": 61631, "epoch": 1467} {"train_loss": -5.95210075378418, "global_step": 61632, "epoch": 1467} {"train_loss": -6.017154216766357, "global_step": 61633, "epoch": 1467} {"train_loss": -5.928306579589844, "global_step": 61634, "epoch": 1467} {"train_loss": -5.822053909301758, "global_step": 61635, "epoch": 1467} {"train_loss": -5.954855918884277, "global_step": 61636, "epoch": 1467} {"train_loss": -5.867910861968994, "global_step": 61637, "epoch": 1467} {"train_loss": -5.925266265869141, "global_step": 61638, "epoch": 1467} {"train_loss": -5.973570823669434, "global_step": 61639, "epoch": 1467} {"train_loss": -5.912811279296875, "global_step": 61640, "epoch": 1467} {"train_loss": -5.8633928298950195, "global_step": 61641, "epoch": 1467} {"train_loss": -5.821152210235596, "global_step": 61642, "epoch": 1467} {"train_loss": -6.080981254577637, "global_step": 61643, "epoch": 1467} {"train_loss": -5.911774158477783, "global_step": 61644, "epoch": 1467} {"train_loss": -5.983527660369873, "global_step": 61645, "epoch": 1467} {"train_loss": -5.866940975189209, "global_step": 61646, "epoch": 1467} {"train_loss": -5.898028373718262, "global_step": 61647, "epoch": 1467} {"train_loss": -5.906783103942871, "global_step": 61648, "epoch": 1467} {"train_loss": -5.858140468597412, "global_step": 61649, "epoch": 1467} {"train_loss": -5.930136203765869, "global_step": 61650, "epoch": 1467} {"train_loss": -5.899994850158691, "global_step": 61651, "epoch": 1467} {"train_loss": -5.8789849281311035, "global_step": 61652, "epoch": 1467} {"train_loss": -5.901179313659668, "global_step": 61653, "epoch": 1467} {"train_loss": -5.897168159484863, "global_step": 61654, "epoch": 1467} {"train_loss": -5.921187707356045, "global_step": 61655, "epoch": 1467, "val_loss": 74566.921875} {"train_loss": -5.835852146148682, "global_step": 61656, "epoch": 1468} {"train_loss": -5.872194290161133, "global_step": 61657, "epoch": 1468} {"train_loss": -5.87058162689209, "global_step": 61658, "epoch": 1468} {"train_loss": -5.809484481811523, "global_step": 61659, "epoch": 1468} {"train_loss": -5.926773548126221, "global_step": 61660, "epoch": 1468} {"train_loss": -5.857964515686035, "global_step": 61661, "epoch": 1468} {"train_loss": -5.956852912902832, "global_step": 61662, "epoch": 1468} {"train_loss": -6.0338006019592285, "global_step": 61663, "epoch": 1468} {"train_loss": -5.929964065551758, "global_step": 61664, "epoch": 1468} {"train_loss": -5.931855201721191, "global_step": 61665, "epoch": 1468} {"train_loss": -5.920071125030518, "global_step": 61666, "epoch": 1468} {"train_loss": -5.9816694259643555, "global_step": 61667, "epoch": 1468} {"train_loss": -5.924833297729492, "global_step": 61668, "epoch": 1468} {"train_loss": -6.024993896484375, "global_step": 61669, "epoch": 1468} {"train_loss": -5.913522720336914, "global_step": 61670, "epoch": 1468} {"train_loss": -5.895862102508545, "global_step": 61671, "epoch": 1468} {"train_loss": -5.926585674285889, "global_step": 61672, "epoch": 1468} {"train_loss": -6.019369125366211, "global_step": 61673, "epoch": 1468} {"train_loss": -6.072382926940918, "global_step": 61674, "epoch": 1468} {"train_loss": -5.977489471435547, "global_step": 61675, "epoch": 1468} {"train_loss": -5.960362434387207, "global_step": 61676, "epoch": 1468} {"train_loss": -5.791295051574707, "global_step": 61677, "epoch": 1468} {"train_loss": -5.932936191558838, "global_step": 61678, "epoch": 1468} {"train_loss": -5.969847202301025, "global_step": 61679, "epoch": 1468} {"train_loss": -5.884211540222168, "global_step": 61680, "epoch": 1468} {"train_loss": -5.9075422286987305, "global_step": 61681, "epoch": 1468} {"train_loss": -5.956485748291016, "global_step": 61682, "epoch": 1468} {"train_loss": -6.046230316162109, "global_step": 61683, "epoch": 1468} {"train_loss": -5.961775779724121, "global_step": 61684, "epoch": 1468} {"train_loss": -5.988973617553711, "global_step": 61685, "epoch": 1468} {"train_loss": -5.946813583374023, "global_step": 61686, "epoch": 1468} {"train_loss": -5.920958518981934, "global_step": 61687, "epoch": 1468} {"train_loss": -5.887275695800781, "global_step": 61688, "epoch": 1468} {"train_loss": -5.966826438903809, "global_step": 61689, "epoch": 1468} {"train_loss": -6.013280391693115, "global_step": 61690, "epoch": 1468} {"train_loss": -5.94130277633667, "global_step": 61691, "epoch": 1468} {"train_loss": -5.855506896972656, "global_step": 61692, "epoch": 1468} {"train_loss": -5.921418190002441, "global_step": 61693, "epoch": 1468} {"train_loss": -5.97113037109375, "global_step": 61694, "epoch": 1468} {"train_loss": -5.811453819274902, "global_step": 61695, "epoch": 1468} {"train_loss": -5.817917823791504, "global_step": 61696, "epoch": 1468} {"train_loss": -5.930111351467314, "global_step": 61697, "epoch": 1468, "val_loss": 74651.1484375} {"train_loss": -5.891010284423828, "global_step": 61698, "epoch": 1469} {"train_loss": -5.931076526641846, "global_step": 61699, "epoch": 1469} {"train_loss": -5.923468589782715, "global_step": 61700, "epoch": 1469} {"train_loss": -5.891529083251953, "global_step": 61701, "epoch": 1469} {"train_loss": -5.872504234313965, "global_step": 61702, "epoch": 1469} {"train_loss": -5.868521213531494, "global_step": 61703, "epoch": 1469} {"train_loss": -5.859631538391113, "global_step": 61704, "epoch": 1469} {"train_loss": -5.8917436599731445, "global_step": 61705, "epoch": 1469} {"train_loss": -5.935061931610107, "global_step": 61706, "epoch": 1469} {"train_loss": -6.015357971191406, "global_step": 61707, "epoch": 1469} {"train_loss": -5.934164524078369, "global_step": 61708, "epoch": 1469} {"train_loss": -6.019192695617676, "global_step": 61709, "epoch": 1469} {"train_loss": -5.921026229858398, "global_step": 61710, "epoch": 1469} {"train_loss": -5.993735313415527, "global_step": 61711, "epoch": 1469} {"train_loss": -5.955778121948242, "global_step": 61712, "epoch": 1469} {"train_loss": -5.983844757080078, "global_step": 61713, "epoch": 1469} {"train_loss": -5.973147392272949, "global_step": 61714, "epoch": 1469} {"train_loss": -5.983246803283691, "global_step": 61715, "epoch": 1469} {"train_loss": -5.787611484527588, "global_step": 61716, "epoch": 1469} {"train_loss": -5.960273742675781, "global_step": 61717, "epoch": 1469} {"train_loss": -5.936302661895752, "global_step": 61718, "epoch": 1469} {"train_loss": -5.963233947753906, "global_step": 61719, "epoch": 1469} {"train_loss": -6.011828422546387, "global_step": 61720, "epoch": 1469} {"train_loss": -6.014449596405029, "global_step": 61721, "epoch": 1469} {"train_loss": -5.9351115226745605, "global_step": 61722, "epoch": 1469} {"train_loss": -5.755043029785156, "global_step": 61723, "epoch": 1469} {"train_loss": -5.880828857421875, "global_step": 61724, "epoch": 1469} {"train_loss": -5.90623664855957, "global_step": 61725, "epoch": 1469} {"train_loss": -5.903554916381836, "global_step": 61726, "epoch": 1469} {"train_loss": -5.903984069824219, "global_step": 61727, "epoch": 1469} {"train_loss": -5.903168201446533, "global_step": 61728, "epoch": 1469} {"train_loss": -5.795414447784424, "global_step": 61729, "epoch": 1469} {"train_loss": -5.950573444366455, "global_step": 61730, "epoch": 1469} {"train_loss": -6.036466121673584, "global_step": 61731, "epoch": 1469} {"train_loss": -5.879685401916504, "global_step": 61732, "epoch": 1469} {"train_loss": -5.952124118804932, "global_step": 61733, "epoch": 1469} {"train_loss": -5.856264591217041, "global_step": 61734, "epoch": 1469} {"train_loss": -5.984787940979004, "global_step": 61735, "epoch": 1469} {"train_loss": -5.908222198486328, "global_step": 61736, "epoch": 1469} {"train_loss": -5.8651628494262695, "global_step": 61737, "epoch": 1469} {"train_loss": -5.923347473144531, "global_step": 61738, "epoch": 1469} {"train_loss": -5.924521639233544, "global_step": 61739, "epoch": 1469, "val_loss": 74897.8671875} {"train_loss": -5.939688682556152, "global_step": 61740, "epoch": 1470} {"train_loss": -5.976966381072998, "global_step": 61741, "epoch": 1470} {"train_loss": -5.877073287963867, "global_step": 61742, "epoch": 1470} {"train_loss": -5.929355621337891, "global_step": 61743, "epoch": 1470} {"train_loss": -5.968255043029785, "global_step": 61744, "epoch": 1470} {"train_loss": -5.887167930603027, "global_step": 61745, "epoch": 1470} {"train_loss": -5.9337158203125, "global_step": 61746, "epoch": 1470} {"train_loss": -5.947550296783447, "global_step": 61747, "epoch": 1470} {"train_loss": -5.8197808265686035, "global_step": 61748, "epoch": 1470} {"train_loss": -5.895496368408203, "global_step": 61749, "epoch": 1470} {"train_loss": -5.834837913513184, "global_step": 61750, "epoch": 1470} {"train_loss": -6.044870376586914, "global_step": 61751, "epoch": 1470} {"train_loss": -6.009711265563965, "global_step": 61752, "epoch": 1470} {"train_loss": -5.9284210205078125, "global_step": 61753, "epoch": 1470} {"train_loss": -5.922610282897949, "global_step": 61754, "epoch": 1470} {"train_loss": -5.9156084060668945, "global_step": 61755, "epoch": 1470} {"train_loss": -5.92350959777832, "global_step": 61756, "epoch": 1470} {"train_loss": -5.912806987762451, "global_step": 61757, "epoch": 1470} {"train_loss": -5.952256202697754, "global_step": 61758, "epoch": 1470} {"train_loss": -5.927730560302734, "global_step": 61759, "epoch": 1470} {"train_loss": -5.9331207275390625, "global_step": 61760, "epoch": 1470} {"train_loss": -5.910211563110352, "global_step": 61761, "epoch": 1470} {"train_loss": -5.876630783081055, "global_step": 61762, "epoch": 1470} {"train_loss": -5.922989368438721, "global_step": 61763, "epoch": 1470} {"train_loss": -5.88014030456543, "global_step": 61764, "epoch": 1470} {"train_loss": -5.842428207397461, "global_step": 61765, "epoch": 1470} {"train_loss": -5.891420364379883, "global_step": 61766, "epoch": 1470} {"train_loss": -5.934825897216797, "global_step": 61767, "epoch": 1470} {"train_loss": -5.966475963592529, "global_step": 61768, "epoch": 1470} {"train_loss": -5.969612121582031, "global_step": 61769, "epoch": 1470} {"train_loss": -6.0339579582214355, "global_step": 61770, "epoch": 1470} {"train_loss": -6.013721466064453, "global_step": 61771, "epoch": 1470} {"train_loss": -5.870264530181885, "global_step": 61772, "epoch": 1470} {"train_loss": -5.966078758239746, "global_step": 61773, "epoch": 1470} {"train_loss": -5.861259937286377, "global_step": 61774, "epoch": 1470} {"train_loss": -5.851062774658203, "global_step": 61775, "epoch": 1470} {"train_loss": -5.71791934967041, "global_step": 61776, "epoch": 1470} {"train_loss": -5.862321376800537, "global_step": 61777, "epoch": 1470} {"train_loss": -5.775763988494873, "global_step": 61778, "epoch": 1470} {"train_loss": -5.838563919067383, "global_step": 61779, "epoch": 1470} {"train_loss": -5.970578193664551, "global_step": 61780, "epoch": 1470} {"train_loss": -5.911685489472889, "global_step": 61781, "epoch": 1470, "val_loss": 74744.6640625} {"train_loss": -5.846302032470703, "global_step": 61782, "epoch": 1471} {"train_loss": -5.779358863830566, "global_step": 61783, "epoch": 1471} {"train_loss": -5.780742168426514, "global_step": 61784, "epoch": 1471} {"train_loss": -5.939458847045898, "global_step": 61785, "epoch": 1471} {"train_loss": -5.817703723907471, "global_step": 61786, "epoch": 1471} {"train_loss": -5.99946403503418, "global_step": 61787, "epoch": 1471} {"train_loss": -5.945324897766113, "global_step": 61788, "epoch": 1471} {"train_loss": -5.892488479614258, "global_step": 61789, "epoch": 1471} {"train_loss": -5.931216716766357, "global_step": 61790, "epoch": 1471} {"train_loss": -5.889985084533691, "global_step": 61791, "epoch": 1471} {"train_loss": -5.958843231201172, "global_step": 61792, "epoch": 1471} {"train_loss": -5.794557094573975, "global_step": 61793, "epoch": 1471} {"train_loss": -5.889678955078125, "global_step": 61794, "epoch": 1471} {"train_loss": -5.884902000427246, "global_step": 61795, "epoch": 1471} {"train_loss": -5.902034759521484, "global_step": 61796, "epoch": 1471} {"train_loss": -5.9374566078186035, "global_step": 61797, "epoch": 1471} {"train_loss": -5.957123756408691, "global_step": 61798, "epoch": 1471} {"train_loss": -5.983121871948242, "global_step": 61799, "epoch": 1471} {"train_loss": -5.964035987854004, "global_step": 61800, "epoch": 1471} {"train_loss": -5.852844715118408, "global_step": 61801, "epoch": 1471} {"train_loss": -6.07038688659668, "global_step": 61802, "epoch": 1471} {"train_loss": -5.941007614135742, "global_step": 61803, "epoch": 1471} {"train_loss": -5.83322811126709, "global_step": 61804, "epoch": 1471} {"train_loss": -5.84957218170166, "global_step": 61805, "epoch": 1471} {"train_loss": -5.86033296585083, "global_step": 61806, "epoch": 1471} {"train_loss": -5.978163719177246, "global_step": 61807, "epoch": 1471} {"train_loss": -5.947450160980225, "global_step": 61808, "epoch": 1471} {"train_loss": -5.9341349601745605, "global_step": 61809, "epoch": 1471} {"train_loss": -5.946282386779785, "global_step": 61810, "epoch": 1471} {"train_loss": -5.929232120513916, "global_step": 61811, "epoch": 1471} {"train_loss": -6.024598121643066, "global_step": 61812, "epoch": 1471} {"train_loss": -6.014530181884766, "global_step": 61813, "epoch": 1471} {"train_loss": -5.880821228027344, "global_step": 61814, "epoch": 1471} {"train_loss": -5.996060371398926, "global_step": 61815, "epoch": 1471} {"train_loss": -6.056941986083984, "global_step": 61816, "epoch": 1471} {"train_loss": -5.893217086791992, "global_step": 61817, "epoch": 1471} {"train_loss": -5.843169212341309, "global_step": 61818, "epoch": 1471} {"train_loss": -5.8982391357421875, "global_step": 61819, "epoch": 1471} {"train_loss": -5.850063800811768, "global_step": 61820, "epoch": 1471} {"train_loss": -5.8081955909729, "global_step": 61821, "epoch": 1471} {"train_loss": -5.993701934814453, "global_step": 61822, "epoch": 1471} {"train_loss": -5.913337889171782, "global_step": 61823, "epoch": 1471, "val_loss": 74419.984375} {"train_loss": -6.001702308654785, "global_step": 61824, "epoch": 1472} {"train_loss": -6.0290374755859375, "global_step": 61825, "epoch": 1472} {"train_loss": -6.024532318115234, "global_step": 61826, "epoch": 1472} {"train_loss": -5.888594150543213, "global_step": 61827, "epoch": 1472} {"train_loss": -5.922178268432617, "global_step": 61828, "epoch": 1472} {"train_loss": -6.0840911865234375, "global_step": 61829, "epoch": 1472} {"train_loss": -6.004812240600586, "global_step": 61830, "epoch": 1472} {"train_loss": -6.052133560180664, "global_step": 61831, "epoch": 1472} {"train_loss": -5.890804290771484, "global_step": 61832, "epoch": 1472} {"train_loss": -6.004029750823975, "global_step": 61833, "epoch": 1472} {"train_loss": -5.919733047485352, "global_step": 61834, "epoch": 1472} {"train_loss": -5.925182819366455, "global_step": 61835, "epoch": 1472} {"train_loss": -5.904072284698486, "global_step": 61836, "epoch": 1472} {"train_loss": -5.801959037780762, "global_step": 61837, "epoch": 1472} {"train_loss": -5.8390960693359375, "global_step": 61838, "epoch": 1472} {"train_loss": -5.989197254180908, "global_step": 61839, "epoch": 1472} {"train_loss": -5.913049697875977, "global_step": 61840, "epoch": 1472} {"train_loss": -6.072361946105957, "global_step": 61841, "epoch": 1472} {"train_loss": -5.954557418823242, "global_step": 61842, "epoch": 1472} {"train_loss": -5.93710994720459, "global_step": 61843, "epoch": 1472} {"train_loss": -5.9859771728515625, "global_step": 61844, "epoch": 1472} {"train_loss": -5.942864418029785, "global_step": 61845, "epoch": 1472} {"train_loss": -5.896988868713379, "global_step": 61846, "epoch": 1472} {"train_loss": -5.87672758102417, "global_step": 61847, "epoch": 1472} {"train_loss": -6.042912006378174, "global_step": 61848, "epoch": 1472} {"train_loss": -5.911307334899902, "global_step": 61849, "epoch": 1472} {"train_loss": -5.910942554473877, "global_step": 61850, "epoch": 1472} {"train_loss": -5.893686294555664, "global_step": 61851, "epoch": 1472} {"train_loss": -5.934272766113281, "global_step": 61852, "epoch": 1472} {"train_loss": -5.980148792266846, "global_step": 61853, "epoch": 1472} {"train_loss": -5.878826141357422, "global_step": 61854, "epoch": 1472} {"train_loss": -5.955500602722168, "global_step": 61855, "epoch": 1472} {"train_loss": -5.938865661621094, "global_step": 61856, "epoch": 1472} {"train_loss": -5.870522499084473, "global_step": 61857, "epoch": 1472} {"train_loss": -5.854650974273682, "global_step": 61858, "epoch": 1472} {"train_loss": -5.826043605804443, "global_step": 61859, "epoch": 1472} {"train_loss": -5.840601921081543, "global_step": 61860, "epoch": 1472} {"train_loss": -5.9993133544921875, "global_step": 61861, "epoch": 1472} {"train_loss": -5.830419063568115, "global_step": 61862, "epoch": 1472} {"train_loss": -5.896663665771484, "global_step": 61863, "epoch": 1472} {"train_loss": -5.903406620025635, "global_step": 61864, "epoch": 1472} {"train_loss": -5.93449760618664, "global_step": 61865, "epoch": 1472, "val_loss": 74454.7578125} {"train_loss": -6.063392639160156, "global_step": 61866, "epoch": 1473} {"train_loss": -5.9688920974731445, "global_step": 61867, "epoch": 1473} {"train_loss": -5.939019203186035, "global_step": 61868, "epoch": 1473} {"train_loss": -6.006331443786621, "global_step": 61869, "epoch": 1473} {"train_loss": -5.858981132507324, "global_step": 61870, "epoch": 1473} {"train_loss": -5.899387359619141, "global_step": 61871, "epoch": 1473} {"train_loss": -5.863329887390137, "global_step": 61872, "epoch": 1473} {"train_loss": -6.001688480377197, "global_step": 61873, "epoch": 1473} {"train_loss": -5.874059677124023, "global_step": 61874, "epoch": 1473} {"train_loss": -5.772485256195068, "global_step": 61875, "epoch": 1473} {"train_loss": -5.817514419555664, "global_step": 61876, "epoch": 1473} {"train_loss": -5.830955505371094, "global_step": 61877, "epoch": 1473} {"train_loss": -5.951838493347168, "global_step": 61878, "epoch": 1473} {"train_loss": -5.898044109344482, "global_step": 61879, "epoch": 1473} {"train_loss": -5.815084457397461, "global_step": 61880, "epoch": 1473} {"train_loss": -5.944112777709961, "global_step": 61881, "epoch": 1473} {"train_loss": -5.772738456726074, "global_step": 61882, "epoch": 1473} {"train_loss": -5.960333824157715, "global_step": 61883, "epoch": 1473} {"train_loss": -5.9201459884643555, "global_step": 61884, "epoch": 1473} {"train_loss": -5.823887825012207, "global_step": 61885, "epoch": 1473} {"train_loss": -5.839084148406982, "global_step": 61886, "epoch": 1473} {"train_loss": -6.061636924743652, "global_step": 61887, "epoch": 1473} {"train_loss": -5.868361949920654, "global_step": 61888, "epoch": 1473} {"train_loss": -5.844586372375488, "global_step": 61889, "epoch": 1473} {"train_loss": -5.980179786682129, "global_step": 61890, "epoch": 1473} {"train_loss": -6.062427043914795, "global_step": 61891, "epoch": 1473} {"train_loss": -5.977090835571289, "global_step": 61892, "epoch": 1473} {"train_loss": -5.976258754730225, "global_step": 61893, "epoch": 1473} {"train_loss": -6.03156042098999, "global_step": 61894, "epoch": 1473} {"train_loss": -5.927042484283447, "global_step": 61895, "epoch": 1473} {"train_loss": -5.971540451049805, "global_step": 61896, "epoch": 1473} {"train_loss": -5.883623123168945, "global_step": 61897, "epoch": 1473} {"train_loss": -5.884240627288818, "global_step": 61898, "epoch": 1473} {"train_loss": -5.928011894226074, "global_step": 61899, "epoch": 1473} {"train_loss": -5.887582302093506, "global_step": 61900, "epoch": 1473} {"train_loss": -5.880068778991699, "global_step": 61901, "epoch": 1473} {"train_loss": -5.861826419830322, "global_step": 61902, "epoch": 1473} {"train_loss": -5.712113380432129, "global_step": 61903, "epoch": 1473} {"train_loss": -5.81230354309082, "global_step": 61904, "epoch": 1473} {"train_loss": -5.859495639801025, "global_step": 61905, "epoch": 1473} {"train_loss": -5.859111309051514, "global_step": 61906, "epoch": 1473} {"train_loss": -5.907357295354207, "global_step": 61907, "epoch": 1473, "val_loss": 74538.953125} {"train_loss": -5.722381591796875, "global_step": 61908, "epoch": 1474} {"train_loss": -5.965340614318848, "global_step": 61909, "epoch": 1474} {"train_loss": -5.942038536071777, "global_step": 61910, "epoch": 1474} {"train_loss": -5.898958206176758, "global_step": 61911, "epoch": 1474} {"train_loss": -5.926252365112305, "global_step": 61912, "epoch": 1474} {"train_loss": -5.9948930740356445, "global_step": 61913, "epoch": 1474} {"train_loss": -6.07878303527832, "global_step": 61914, "epoch": 1474} {"train_loss": -5.958171844482422, "global_step": 61915, "epoch": 1474} {"train_loss": -5.854864120483398, "global_step": 61916, "epoch": 1474} {"train_loss": -5.931763648986816, "global_step": 61917, "epoch": 1474} {"train_loss": -5.925454139709473, "global_step": 61918, "epoch": 1474} {"train_loss": -5.829649925231934, "global_step": 61919, "epoch": 1474} {"train_loss": -5.876532554626465, "global_step": 61920, "epoch": 1474} {"train_loss": -5.8984551429748535, "global_step": 61921, "epoch": 1474} {"train_loss": -5.9229230880737305, "global_step": 61922, "epoch": 1474} {"train_loss": -5.943929672241211, "global_step": 61923, "epoch": 1474} {"train_loss": -5.848094940185547, "global_step": 61924, "epoch": 1474} {"train_loss": -5.864032745361328, "global_step": 61925, "epoch": 1474} {"train_loss": -5.760365962982178, "global_step": 61926, "epoch": 1474} {"train_loss": -5.811964511871338, "global_step": 61927, "epoch": 1474} {"train_loss": -5.817490100860596, "global_step": 61928, "epoch": 1474} {"train_loss": -5.91214656829834, "global_step": 61929, "epoch": 1474} {"train_loss": -5.781532287597656, "global_step": 61930, "epoch": 1474} {"train_loss": -5.822113037109375, "global_step": 61931, "epoch": 1474} {"train_loss": -5.873596668243408, "global_step": 61932, "epoch": 1474} {"train_loss": -5.9419121742248535, "global_step": 61933, "epoch": 1474} {"train_loss": -5.666067123413086, "global_step": 61934, "epoch": 1474} {"train_loss": -5.921319484710693, "global_step": 61935, "epoch": 1474} {"train_loss": -5.6974968910217285, "global_step": 61936, "epoch": 1474} {"train_loss": -5.89687967300415, "global_step": 61937, "epoch": 1474} {"train_loss": -5.861688613891602, "global_step": 61938, "epoch": 1474} {"train_loss": -5.76867151260376, "global_step": 61939, "epoch": 1474} {"train_loss": -6.005620002746582, "global_step": 61940, "epoch": 1474} {"train_loss": -5.7967376708984375, "global_step": 61941, "epoch": 1474} {"train_loss": -5.935085296630859, "global_step": 61942, "epoch": 1474} {"train_loss": -5.846162796020508, "global_step": 61943, "epoch": 1474} {"train_loss": -5.849178314208984, "global_step": 61944, "epoch": 1474} {"train_loss": -5.885056018829346, "global_step": 61945, "epoch": 1474} {"train_loss": -5.833362579345703, "global_step": 61946, "epoch": 1474} {"train_loss": -5.890498638153076, "global_step": 61947, "epoch": 1474} {"train_loss": -5.851938247680664, "global_step": 61948, "epoch": 1474} {"train_loss": -5.874643212273007, "global_step": 61949, "epoch": 1474, "val_loss": 74819.78125} {"train_loss": -5.824246883392334, "global_step": 61950, "epoch": 1475} {"train_loss": -5.911725997924805, "global_step": 61951, "epoch": 1475} {"train_loss": -5.865906715393066, "global_step": 61952, "epoch": 1475} {"train_loss": -6.02694034576416, "global_step": 61953, "epoch": 1475} {"train_loss": -5.901679992675781, "global_step": 61954, "epoch": 1475} {"train_loss": -5.959425449371338, "global_step": 61955, "epoch": 1475} {"train_loss": -5.978582382202148, "global_step": 61956, "epoch": 1475} {"train_loss": -6.007864952087402, "global_step": 61957, "epoch": 1475} {"train_loss": -5.978105545043945, "global_step": 61958, "epoch": 1475} {"train_loss": -5.874663829803467, "global_step": 61959, "epoch": 1475} {"train_loss": -6.078843116760254, "global_step": 61960, "epoch": 1475} {"train_loss": -5.95168924331665, "global_step": 61961, "epoch": 1475} {"train_loss": -6.025527000427246, "global_step": 61962, "epoch": 1475} {"train_loss": -5.911657810211182, "global_step": 61963, "epoch": 1475} {"train_loss": -5.948642253875732, "global_step": 61964, "epoch": 1475} {"train_loss": -5.837438583374023, "global_step": 61965, "epoch": 1475} {"train_loss": -5.938343524932861, "global_step": 61966, "epoch": 1475} {"train_loss": -5.952118873596191, "global_step": 61967, "epoch": 1475} {"train_loss": -5.962213039398193, "global_step": 61968, "epoch": 1475} {"train_loss": -5.887763977050781, "global_step": 61969, "epoch": 1475} {"train_loss": -5.906241416931152, "global_step": 61970, "epoch": 1475} {"train_loss": -5.931422710418701, "global_step": 61971, "epoch": 1475} {"train_loss": -5.8283281326293945, "global_step": 61972, "epoch": 1475} {"train_loss": -5.9126973152160645, "global_step": 61973, "epoch": 1475} {"train_loss": -5.997386455535889, "global_step": 61974, "epoch": 1475} {"train_loss": -6.0137104988098145, "global_step": 61975, "epoch": 1475} {"train_loss": -5.917377948760986, "global_step": 61976, "epoch": 1475} {"train_loss": -5.831760406494141, "global_step": 61977, "epoch": 1475} {"train_loss": -5.907014846801758, "global_step": 61978, "epoch": 1475} {"train_loss": -5.95093297958374, "global_step": 61979, "epoch": 1475} {"train_loss": -5.920680999755859, "global_step": 61980, "epoch": 1475} {"train_loss": -5.864762783050537, "global_step": 61981, "epoch": 1475} {"train_loss": -5.889379978179932, "global_step": 61982, "epoch": 1475} {"train_loss": -6.00492000579834, "global_step": 61983, "epoch": 1475} {"train_loss": -6.015214920043945, "global_step": 61984, "epoch": 1475} {"train_loss": -5.881377220153809, "global_step": 61985, "epoch": 1475} {"train_loss": -6.071566581726074, "global_step": 61986, "epoch": 1475} {"train_loss": -5.881114482879639, "global_step": 61987, "epoch": 1475} {"train_loss": -5.959240913391113, "global_step": 61988, "epoch": 1475} {"train_loss": -5.867311954498291, "global_step": 61989, "epoch": 1475} {"train_loss": -5.993385314941406, "global_step": 61990, "epoch": 1475} {"train_loss": -5.93349720182873, "global_step": 61991, "epoch": 1475, "val_loss": 74636.3203125} {"train_loss": -5.763302803039551, "global_step": 61992, "epoch": 1476} {"train_loss": -5.95590353012085, "global_step": 61993, "epoch": 1476} {"train_loss": -5.867099761962891, "global_step": 61994, "epoch": 1476} {"train_loss": -5.82108736038208, "global_step": 61995, "epoch": 1476} {"train_loss": -5.900672912597656, "global_step": 61996, "epoch": 1476} {"train_loss": -5.857627868652344, "global_step": 61997, "epoch": 1476} {"train_loss": -6.0290045738220215, "global_step": 61998, "epoch": 1476} {"train_loss": -5.834713459014893, "global_step": 61999, "epoch": 1476} {"train_loss": -5.931896209716797, "global_step": 62000, "epoch": 1476} {"train_loss": -5.957427978515625, "global_step": 62001, "epoch": 1476} {"train_loss": -5.912180423736572, "global_step": 62002, "epoch": 1476} {"train_loss": -5.859362602233887, "global_step": 62003, "epoch": 1476} {"train_loss": -6.027245044708252, "global_step": 62004, "epoch": 1476} {"train_loss": -5.902399063110352, "global_step": 62005, "epoch": 1476} {"train_loss": -5.9596991539001465, "global_step": 62006, "epoch": 1476} {"train_loss": -5.942269325256348, "global_step": 62007, "epoch": 1476} {"train_loss": -5.999664306640625, "global_step": 62008, "epoch": 1476} {"train_loss": -5.857004165649414, "global_step": 62009, "epoch": 1476} {"train_loss": -5.9759745597839355, "global_step": 62010, "epoch": 1476} {"train_loss": -5.933820724487305, "global_step": 62011, "epoch": 1476} {"train_loss": -5.932375431060791, "global_step": 62012, "epoch": 1476} {"train_loss": -6.120667457580566, "global_step": 62013, "epoch": 1476} {"train_loss": -5.79818058013916, "global_step": 62014, "epoch": 1476} {"train_loss": -5.954187393188477, "global_step": 62015, "epoch": 1476} {"train_loss": -6.014154434204102, "global_step": 62016, "epoch": 1476} {"train_loss": -5.986351490020752, "global_step": 62017, "epoch": 1476} {"train_loss": -6.001820087432861, "global_step": 62018, "epoch": 1476} {"train_loss": -5.8270697593688965, "global_step": 62019, "epoch": 1476} {"train_loss": -5.799156665802002, "global_step": 62020, "epoch": 1476} {"train_loss": -6.04690408706665, "global_step": 62021, "epoch": 1476} {"train_loss": -5.989739894866943, "global_step": 62022, "epoch": 1476} {"train_loss": -5.767881393432617, "global_step": 62023, "epoch": 1476} {"train_loss": -5.96243953704834, "global_step": 62024, "epoch": 1476} {"train_loss": -5.850390434265137, "global_step": 62025, "epoch": 1476} {"train_loss": -5.855966567993164, "global_step": 62026, "epoch": 1476} {"train_loss": -5.949628829956055, "global_step": 62027, "epoch": 1476} {"train_loss": -5.919930458068848, "global_step": 62028, "epoch": 1476} {"train_loss": -5.894957542419434, "global_step": 62029, "epoch": 1476} {"train_loss": -5.9043684005737305, "global_step": 62030, "epoch": 1476} {"train_loss": -5.97836446762085, "global_step": 62031, "epoch": 1476} {"train_loss": -6.041595935821533, "global_step": 62032, "epoch": 1476} {"train_loss": -5.9241128876095726, "global_step": 62033, "epoch": 1476, "val_loss": 74638.765625} {"train_loss": -6.003251075744629, "global_step": 62034, "epoch": 1477} {"train_loss": -6.045113563537598, "global_step": 62035, "epoch": 1477} {"train_loss": -5.864418029785156, "global_step": 62036, "epoch": 1477} {"train_loss": -5.889666557312012, "global_step": 62037, "epoch": 1477} {"train_loss": -5.877314567565918, "global_step": 62038, "epoch": 1477} {"train_loss": -5.644915580749512, "global_step": 62039, "epoch": 1477} {"train_loss": -5.819348335266113, "global_step": 62040, "epoch": 1477} {"train_loss": -5.904849529266357, "global_step": 62041, "epoch": 1477} {"train_loss": -5.662336826324463, "global_step": 62042, "epoch": 1477} {"train_loss": -5.926484107971191, "global_step": 62043, "epoch": 1477} {"train_loss": -5.798389911651611, "global_step": 62044, "epoch": 1477} {"train_loss": -5.781188488006592, "global_step": 62045, "epoch": 1477} {"train_loss": -5.9859113693237305, "global_step": 62046, "epoch": 1477} {"train_loss": -5.78181266784668, "global_step": 62047, "epoch": 1477} {"train_loss": -5.844787120819092, "global_step": 62048, "epoch": 1477} {"train_loss": -5.856234550476074, "global_step": 62049, "epoch": 1477} {"train_loss": -5.808495998382568, "global_step": 62050, "epoch": 1477} {"train_loss": -5.9146504402160645, "global_step": 62051, "epoch": 1477} {"train_loss": -5.8859357833862305, "global_step": 62052, "epoch": 1477} {"train_loss": -5.911781311035156, "global_step": 62053, "epoch": 1477} {"train_loss": -5.858968734741211, "global_step": 62054, "epoch": 1477} {"train_loss": -5.749676704406738, "global_step": 62055, "epoch": 1477} {"train_loss": -5.83710241317749, "global_step": 62056, "epoch": 1477} {"train_loss": -5.846736907958984, "global_step": 62057, "epoch": 1477} {"train_loss": -5.861237525939941, "global_step": 62058, "epoch": 1477} {"train_loss": -5.889351844787598, "global_step": 62059, "epoch": 1477} {"train_loss": -5.783276557922363, "global_step": 62060, "epoch": 1477} {"train_loss": -6.006572723388672, "global_step": 62061, "epoch": 1477} {"train_loss": -5.923825263977051, "global_step": 62062, "epoch": 1477} {"train_loss": -5.870284557342529, "global_step": 62063, "epoch": 1477} {"train_loss": -5.916739463806152, "global_step": 62064, "epoch": 1477} {"train_loss": -5.943144798278809, "global_step": 62065, "epoch": 1477} {"train_loss": -5.979828834533691, "global_step": 62066, "epoch": 1477} {"train_loss": -5.876333236694336, "global_step": 62067, "epoch": 1477} {"train_loss": -6.030360221862793, "global_step": 62068, "epoch": 1477} {"train_loss": -5.976259231567383, "global_step": 62069, "epoch": 1477} {"train_loss": -5.9391326904296875, "global_step": 62070, "epoch": 1477} {"train_loss": -5.860842704772949, "global_step": 62071, "epoch": 1477} {"train_loss": -6.035861968994141, "global_step": 62072, "epoch": 1477} {"train_loss": -5.989573955535889, "global_step": 62073, "epoch": 1477} {"train_loss": -6.012538433074951, "global_step": 62074, "epoch": 1477} {"train_loss": -5.888403654098511, "global_step": 62075, "epoch": 1477, "val_loss": 74752.0546875} {"train_loss": -5.857119560241699, "global_step": 62076, "epoch": 1478} {"train_loss": -5.880980968475342, "global_step": 62077, "epoch": 1478} {"train_loss": -5.880939483642578, "global_step": 62078, "epoch": 1478} {"train_loss": -6.079803466796875, "global_step": 62079, "epoch": 1478} {"train_loss": -5.990836143493652, "global_step": 62080, "epoch": 1478} {"train_loss": -5.929312705993652, "global_step": 62081, "epoch": 1478} {"train_loss": -6.05506706237793, "global_step": 62082, "epoch": 1478} {"train_loss": -6.001819610595703, "global_step": 62083, "epoch": 1478} {"train_loss": -6.0554704666137695, "global_step": 62084, "epoch": 1478} {"train_loss": -5.900491237640381, "global_step": 62085, "epoch": 1478} {"train_loss": -5.816307544708252, "global_step": 62086, "epoch": 1478} {"train_loss": -5.95350456237793, "global_step": 62087, "epoch": 1478} {"train_loss": -5.927889347076416, "global_step": 62088, "epoch": 1478} {"train_loss": -5.751935005187988, "global_step": 62089, "epoch": 1478} {"train_loss": -6.017455101013184, "global_step": 62090, "epoch": 1478} {"train_loss": -5.97796630859375, "global_step": 62091, "epoch": 1478} {"train_loss": -5.764084815979004, "global_step": 62092, "epoch": 1478} {"train_loss": -5.861563682556152, "global_step": 62093, "epoch": 1478} {"train_loss": -5.9042887687683105, "global_step": 62094, "epoch": 1478} {"train_loss": -5.901704788208008, "global_step": 62095, "epoch": 1478} {"train_loss": -5.922691345214844, "global_step": 62096, "epoch": 1478} {"train_loss": -5.834329128265381, "global_step": 62097, "epoch": 1478} {"train_loss": -5.83212947845459, "global_step": 62098, "epoch": 1478} {"train_loss": -5.975775241851807, "global_step": 62099, "epoch": 1478} {"train_loss": -5.8636064529418945, "global_step": 62100, "epoch": 1478} {"train_loss": -5.836772441864014, "global_step": 62101, "epoch": 1478} {"train_loss": -5.7885589599609375, "global_step": 62102, "epoch": 1478} {"train_loss": -5.807265281677246, "global_step": 62103, "epoch": 1478} {"train_loss": -5.994412422180176, "global_step": 62104, "epoch": 1478} {"train_loss": -5.94460391998291, "global_step": 62105, "epoch": 1478} {"train_loss": -5.911347389221191, "global_step": 62106, "epoch": 1478} {"train_loss": -5.924968719482422, "global_step": 62107, "epoch": 1478} {"train_loss": -6.045692443847656, "global_step": 62108, "epoch": 1478} {"train_loss": -5.955528259277344, "global_step": 62109, "epoch": 1478} {"train_loss": -5.893763542175293, "global_step": 62110, "epoch": 1478} {"train_loss": -5.951343059539795, "global_step": 62111, "epoch": 1478} {"train_loss": -6.0400800704956055, "global_step": 62112, "epoch": 1478} {"train_loss": -5.927674293518066, "global_step": 62113, "epoch": 1478} {"train_loss": -5.811448097229004, "global_step": 62114, "epoch": 1478} {"train_loss": -5.962285041809082, "global_step": 62115, "epoch": 1478} {"train_loss": -5.871609687805176, "global_step": 62116, "epoch": 1478} {"train_loss": -5.917319195611136, "global_step": 62117, "epoch": 1478, "val_loss": 74482.125} {"train_loss": -5.940849304199219, "global_step": 62118, "epoch": 1479} {"train_loss": -5.850166320800781, "global_step": 62119, "epoch": 1479} {"train_loss": -5.906162261962891, "global_step": 62120, "epoch": 1479} {"train_loss": -5.947086334228516, "global_step": 62121, "epoch": 1479} {"train_loss": -5.8834052085876465, "global_step": 62122, "epoch": 1479} {"train_loss": -5.952768325805664, "global_step": 62123, "epoch": 1479} {"train_loss": -5.910758972167969, "global_step": 62124, "epoch": 1479} {"train_loss": -5.935445785522461, "global_step": 62125, "epoch": 1479} {"train_loss": -5.842214107513428, "global_step": 62126, "epoch": 1479} {"train_loss": -5.963619232177734, "global_step": 62127, "epoch": 1479} {"train_loss": -5.883512020111084, "global_step": 62128, "epoch": 1479} {"train_loss": -5.856423377990723, "global_step": 62129, "epoch": 1479} {"train_loss": -6.051468849182129, "global_step": 62130, "epoch": 1479} {"train_loss": -5.9389142990112305, "global_step": 62131, "epoch": 1479} {"train_loss": -5.836242198944092, "global_step": 62132, "epoch": 1479} {"train_loss": -5.9029541015625, "global_step": 62133, "epoch": 1479} {"train_loss": -5.899128437042236, "global_step": 62134, "epoch": 1479} {"train_loss": -6.009711742401123, "global_step": 62135, "epoch": 1479} {"train_loss": -5.9188947677612305, "global_step": 62136, "epoch": 1479} {"train_loss": -5.7751665115356445, "global_step": 62137, "epoch": 1479} {"train_loss": -5.918027877807617, "global_step": 62138, "epoch": 1479} {"train_loss": -6.000275611877441, "global_step": 62139, "epoch": 1479} {"train_loss": -5.890576362609863, "global_step": 62140, "epoch": 1479} {"train_loss": -5.970746994018555, "global_step": 62141, "epoch": 1479} {"train_loss": -5.936711311340332, "global_step": 62142, "epoch": 1479} {"train_loss": -5.924661159515381, "global_step": 62143, "epoch": 1479} {"train_loss": -5.953824043273926, "global_step": 62144, "epoch": 1479} {"train_loss": -5.896437644958496, "global_step": 62145, "epoch": 1479} {"train_loss": -5.904915809631348, "global_step": 62146, "epoch": 1479} {"train_loss": -5.8712968826293945, "global_step": 62147, "epoch": 1479} {"train_loss": -5.88170051574707, "global_step": 62148, "epoch": 1479} {"train_loss": -5.72955846786499, "global_step": 62149, "epoch": 1479} {"train_loss": -5.916630268096924, "global_step": 62150, "epoch": 1479} {"train_loss": -5.926023006439209, "global_step": 62151, "epoch": 1479} {"train_loss": -5.852212905883789, "global_step": 62152, "epoch": 1479} {"train_loss": -5.993709564208984, "global_step": 62153, "epoch": 1479} {"train_loss": -5.982278347015381, "global_step": 62154, "epoch": 1479} {"train_loss": -5.954968452453613, "global_step": 62155, "epoch": 1479} {"train_loss": -5.9647955894470215, "global_step": 62156, "epoch": 1479} {"train_loss": -5.901874542236328, "global_step": 62157, "epoch": 1479} {"train_loss": -5.808587551116943, "global_step": 62158, "epoch": 1479} {"train_loss": -5.914779084069388, "global_step": 62159, "epoch": 1479, "val_loss": 74499.71875} {"train_loss": -5.81967830657959, "global_step": 62160, "epoch": 1480} {"train_loss": -5.786667823791504, "global_step": 62161, "epoch": 1480} {"train_loss": -5.933401584625244, "global_step": 62162, "epoch": 1480} {"train_loss": -5.8534135818481445, "global_step": 62163, "epoch": 1480} {"train_loss": -6.001166343688965, "global_step": 62164, "epoch": 1480} {"train_loss": -5.974682807922363, "global_step": 62165, "epoch": 1480} {"train_loss": -5.910796165466309, "global_step": 62166, "epoch": 1480} {"train_loss": -5.907743453979492, "global_step": 62167, "epoch": 1480} {"train_loss": -5.976617813110352, "global_step": 62168, "epoch": 1480} {"train_loss": -5.890175819396973, "global_step": 62169, "epoch": 1480} {"train_loss": -5.869722366333008, "global_step": 62170, "epoch": 1480} {"train_loss": -5.94989013671875, "global_step": 62171, "epoch": 1480} {"train_loss": -5.924209117889404, "global_step": 62172, "epoch": 1480} {"train_loss": -5.965228080749512, "global_step": 62173, "epoch": 1480} {"train_loss": -5.815708637237549, "global_step": 62174, "epoch": 1480} {"train_loss": -5.836645126342773, "global_step": 62175, "epoch": 1480} {"train_loss": -5.964565277099609, "global_step": 62176, "epoch": 1480} {"train_loss": -5.982653617858887, "global_step": 62177, "epoch": 1480} {"train_loss": -5.949350357055664, "global_step": 62178, "epoch": 1480} {"train_loss": -5.931724548339844, "global_step": 62179, "epoch": 1480} {"train_loss": -5.870893478393555, "global_step": 62180, "epoch": 1480} {"train_loss": -5.867880821228027, "global_step": 62181, "epoch": 1480} {"train_loss": -6.0144500732421875, "global_step": 62182, "epoch": 1480} {"train_loss": -5.951010704040527, "global_step": 62183, "epoch": 1480} {"train_loss": -5.924121856689453, "global_step": 62184, "epoch": 1480} {"train_loss": -5.921039581298828, "global_step": 62185, "epoch": 1480} {"train_loss": -5.8778977394104, "global_step": 62186, "epoch": 1480} {"train_loss": -5.905233860015869, "global_step": 62187, "epoch": 1480} {"train_loss": -5.79809045791626, "global_step": 62188, "epoch": 1480} {"train_loss": -5.964654922485352, "global_step": 62189, "epoch": 1480} {"train_loss": -5.984072685241699, "global_step": 62190, "epoch": 1480} {"train_loss": -5.92571496963501, "global_step": 62191, "epoch": 1480} {"train_loss": -6.017223358154297, "global_step": 62192, "epoch": 1480} {"train_loss": -5.791375637054443, "global_step": 62193, "epoch": 1480} {"train_loss": -5.954247951507568, "global_step": 62194, "epoch": 1480} {"train_loss": -5.871463775634766, "global_step": 62195, "epoch": 1480} {"train_loss": -5.914738178253174, "global_step": 62196, "epoch": 1480} {"train_loss": -5.895374774932861, "global_step": 62197, "epoch": 1480} {"train_loss": -5.890865325927734, "global_step": 62198, "epoch": 1480} {"train_loss": -6.01063346862793, "global_step": 62199, "epoch": 1480} {"train_loss": -5.979867935180664, "global_step": 62200, "epoch": 1480} {"train_loss": -5.917486168089367, "global_step": 62201, "epoch": 1480, "val_loss": 74329.4296875} {"train_loss": -5.949398994445801, "global_step": 62202, "epoch": 1481} {"train_loss": -6.086337566375732, "global_step": 62203, "epoch": 1481} {"train_loss": -5.935882568359375, "global_step": 62204, "epoch": 1481} {"train_loss": -5.952686309814453, "global_step": 62205, "epoch": 1481} {"train_loss": -5.939273357391357, "global_step": 62206, "epoch": 1481} {"train_loss": -6.000953674316406, "global_step": 62207, "epoch": 1481} {"train_loss": -5.958974838256836, "global_step": 62208, "epoch": 1481} {"train_loss": -5.869576930999756, "global_step": 62209, "epoch": 1481} {"train_loss": -5.935244560241699, "global_step": 62210, "epoch": 1481} {"train_loss": -5.96711540222168, "global_step": 62211, "epoch": 1481} {"train_loss": -6.019173622131348, "global_step": 62212, "epoch": 1481} {"train_loss": -6.029144287109375, "global_step": 62213, "epoch": 1481} {"train_loss": -6.0095534324646, "global_step": 62214, "epoch": 1481} {"train_loss": -5.896729469299316, "global_step": 62215, "epoch": 1481} {"train_loss": -5.984883785247803, "global_step": 62216, "epoch": 1481} {"train_loss": -5.876107215881348, "global_step": 62217, "epoch": 1481} {"train_loss": -5.882929801940918, "global_step": 62218, "epoch": 1481} {"train_loss": -6.033807754516602, "global_step": 62219, "epoch": 1481} {"train_loss": -5.883995532989502, "global_step": 62220, "epoch": 1481} {"train_loss": -5.873987674713135, "global_step": 62221, "epoch": 1481} {"train_loss": -5.904066562652588, "global_step": 62222, "epoch": 1481} {"train_loss": -5.872539520263672, "global_step": 62223, "epoch": 1481} {"train_loss": -5.986184120178223, "global_step": 62224, "epoch": 1481} {"train_loss": -5.939422607421875, "global_step": 62225, "epoch": 1481} {"train_loss": -5.852215766906738, "global_step": 62226, "epoch": 1481} {"train_loss": -6.083386421203613, "global_step": 62227, "epoch": 1481} {"train_loss": -5.988676071166992, "global_step": 62228, "epoch": 1481} {"train_loss": -5.781224250793457, "global_step": 62229, "epoch": 1481} {"train_loss": -5.865623474121094, "global_step": 62230, "epoch": 1481} {"train_loss": -5.964123725891113, "global_step": 62231, "epoch": 1481} {"train_loss": -5.85692024230957, "global_step": 62232, "epoch": 1481} {"train_loss": -5.956169605255127, "global_step": 62233, "epoch": 1481} {"train_loss": -5.947882652282715, "global_step": 62234, "epoch": 1481} {"train_loss": -5.8800225257873535, "global_step": 62235, "epoch": 1481} {"train_loss": -5.784695625305176, "global_step": 62236, "epoch": 1481} {"train_loss": -5.824881553649902, "global_step": 62237, "epoch": 1481} {"train_loss": -5.897647857666016, "global_step": 62238, "epoch": 1481} {"train_loss": -5.8726606369018555, "global_step": 62239, "epoch": 1481} {"train_loss": -5.795351028442383, "global_step": 62240, "epoch": 1481} {"train_loss": -5.844620704650879, "global_step": 62241, "epoch": 1481} {"train_loss": -5.9954657554626465, "global_step": 62242, "epoch": 1481} {"train_loss": -5.925190573646908, "global_step": 62243, "epoch": 1481, "val_loss": 74646.484375} {"train_loss": -5.886655807495117, "global_step": 62244, "epoch": 1482} {"train_loss": -5.869062423706055, "global_step": 62245, "epoch": 1482} {"train_loss": -5.788847923278809, "global_step": 62246, "epoch": 1482} {"train_loss": -5.913302898406982, "global_step": 62247, "epoch": 1482} {"train_loss": -5.989388942718506, "global_step": 62248, "epoch": 1482} {"train_loss": -5.870079517364502, "global_step": 62249, "epoch": 1482} {"train_loss": -5.8971171379089355, "global_step": 62250, "epoch": 1482} {"train_loss": -5.754730701446533, "global_step": 62251, "epoch": 1482} {"train_loss": -5.9008002281188965, "global_step": 62252, "epoch": 1482} {"train_loss": -5.946047306060791, "global_step": 62253, "epoch": 1482} {"train_loss": -5.916282653808594, "global_step": 62254, "epoch": 1482} {"train_loss": -5.947778701782227, "global_step": 62255, "epoch": 1482} {"train_loss": -5.84531307220459, "global_step": 62256, "epoch": 1482} {"train_loss": -5.94245719909668, "global_step": 62257, "epoch": 1482} {"train_loss": -5.912736892700195, "global_step": 62258, "epoch": 1482} {"train_loss": -5.815842628479004, "global_step": 62259, "epoch": 1482} {"train_loss": -5.896735191345215, "global_step": 62260, "epoch": 1482} {"train_loss": -5.800960540771484, "global_step": 62261, "epoch": 1482} {"train_loss": -5.946233749389648, "global_step": 62262, "epoch": 1482} {"train_loss": -6.029749870300293, "global_step": 62263, "epoch": 1482} {"train_loss": -5.847227096557617, "global_step": 62264, "epoch": 1482} {"train_loss": -6.004901885986328, "global_step": 62265, "epoch": 1482} {"train_loss": -5.801551342010498, "global_step": 62266, "epoch": 1482} {"train_loss": -5.91618537902832, "global_step": 62267, "epoch": 1482} {"train_loss": -5.980159282684326, "global_step": 62268, "epoch": 1482} {"train_loss": -5.888049125671387, "global_step": 62269, "epoch": 1482} {"train_loss": -5.982698440551758, "global_step": 62270, "epoch": 1482} {"train_loss": -6.002017021179199, "global_step": 62271, "epoch": 1482} {"train_loss": -5.960418701171875, "global_step": 62272, "epoch": 1482} {"train_loss": -5.939882755279541, "global_step": 62273, "epoch": 1482} {"train_loss": -5.971294403076172, "global_step": 62274, "epoch": 1482} {"train_loss": -6.0376434326171875, "global_step": 62275, "epoch": 1482} {"train_loss": -6.073601722717285, "global_step": 62276, "epoch": 1482} {"train_loss": -5.926257610321045, "global_step": 62277, "epoch": 1482} {"train_loss": -6.0129876136779785, "global_step": 62278, "epoch": 1482} {"train_loss": -5.942343711853027, "global_step": 62279, "epoch": 1482} {"train_loss": -6.049821376800537, "global_step": 62280, "epoch": 1482} {"train_loss": -6.0348358154296875, "global_step": 62281, "epoch": 1482} {"train_loss": -5.858094215393066, "global_step": 62282, "epoch": 1482} {"train_loss": -5.849043369293213, "global_step": 62283, "epoch": 1482} {"train_loss": -5.995965480804443, "global_step": 62284, "epoch": 1482} {"train_loss": -5.9265139784131735, "global_step": 62285, "epoch": 1482, "val_loss": 74593.84375} {"train_loss": -5.997980117797852, "global_step": 62286, "epoch": 1483} {"train_loss": -5.89224910736084, "global_step": 62287, "epoch": 1483} {"train_loss": -5.890271186828613, "global_step": 62288, "epoch": 1483} {"train_loss": -5.841567516326904, "global_step": 62289, "epoch": 1483} {"train_loss": -5.927223205566406, "global_step": 62290, "epoch": 1483} {"train_loss": -6.017335414886475, "global_step": 62291, "epoch": 1483} {"train_loss": -6.027980804443359, "global_step": 62292, "epoch": 1483} {"train_loss": -5.952834129333496, "global_step": 62293, "epoch": 1483} {"train_loss": -6.061053276062012, "global_step": 62294, "epoch": 1483} {"train_loss": -5.986401557922363, "global_step": 62295, "epoch": 1483} {"train_loss": -5.886285305023193, "global_step": 62296, "epoch": 1483} {"train_loss": -5.91347599029541, "global_step": 62297, "epoch": 1483} {"train_loss": -5.913204193115234, "global_step": 62298, "epoch": 1483} {"train_loss": -5.846746444702148, "global_step": 62299, "epoch": 1483} {"train_loss": -5.9513983726501465, "global_step": 62300, "epoch": 1483} {"train_loss": -5.849108695983887, "global_step": 62301, "epoch": 1483} {"train_loss": -5.935842514038086, "global_step": 62302, "epoch": 1483} {"train_loss": -5.961108207702637, "global_step": 62303, "epoch": 1483} {"train_loss": -5.918097972869873, "global_step": 62304, "epoch": 1483} {"train_loss": -5.845890998840332, "global_step": 62305, "epoch": 1483} {"train_loss": -5.902132987976074, "global_step": 62306, "epoch": 1483} {"train_loss": -5.939121246337891, "global_step": 62307, "epoch": 1483} {"train_loss": -5.956692695617676, "global_step": 62308, "epoch": 1483} {"train_loss": -5.950575828552246, "global_step": 62309, "epoch": 1483} {"train_loss": -5.95124626159668, "global_step": 62310, "epoch": 1483} {"train_loss": -5.96567440032959, "global_step": 62311, "epoch": 1483} {"train_loss": -5.877775192260742, "global_step": 62312, "epoch": 1483} {"train_loss": -5.990385055541992, "global_step": 62313, "epoch": 1483} {"train_loss": -5.980947017669678, "global_step": 62314, "epoch": 1483} {"train_loss": -5.821949005126953, "global_step": 62315, "epoch": 1483} {"train_loss": -5.884483337402344, "global_step": 62316, "epoch": 1483} {"train_loss": -6.0375871658325195, "global_step": 62317, "epoch": 1483} {"train_loss": -5.952739715576172, "global_step": 62318, "epoch": 1483} {"train_loss": -5.830582618713379, "global_step": 62319, "epoch": 1483} {"train_loss": -5.918288230895996, "global_step": 62320, "epoch": 1483} {"train_loss": -5.979557037353516, "global_step": 62321, "epoch": 1483} {"train_loss": -5.744357109069824, "global_step": 62322, "epoch": 1483} {"train_loss": -5.844743728637695, "global_step": 62323, "epoch": 1483} {"train_loss": -5.785502910614014, "global_step": 62324, "epoch": 1483} {"train_loss": -6.008816719055176, "global_step": 62325, "epoch": 1483} {"train_loss": -5.926271438598633, "global_step": 62326, "epoch": 1483} {"train_loss": -5.924034368424189, "global_step": 62327, "epoch": 1483, "val_loss": 74437.328125} {"train_loss": -5.95696496963501, "global_step": 62328, "epoch": 1484} {"train_loss": -5.9863176345825195, "global_step": 62329, "epoch": 1484} {"train_loss": -5.8938798904418945, "global_step": 62330, "epoch": 1484} {"train_loss": -5.910897731781006, "global_step": 62331, "epoch": 1484} {"train_loss": -5.867631912231445, "global_step": 62332, "epoch": 1484} {"train_loss": -5.834153175354004, "global_step": 62333, "epoch": 1484} {"train_loss": -6.04237699508667, "global_step": 62334, "epoch": 1484} {"train_loss": -6.043928146362305, "global_step": 62335, "epoch": 1484} {"train_loss": -6.001195907592773, "global_step": 62336, "epoch": 1484} {"train_loss": -6.078031539916992, "global_step": 62337, "epoch": 1484} {"train_loss": -5.898027420043945, "global_step": 62338, "epoch": 1484} {"train_loss": -5.7768354415893555, "global_step": 62339, "epoch": 1484} {"train_loss": -5.908585071563721, "global_step": 62340, "epoch": 1484} {"train_loss": -5.938584327697754, "global_step": 62341, "epoch": 1484} {"train_loss": -5.942979335784912, "global_step": 62342, "epoch": 1484} {"train_loss": -5.764959335327148, "global_step": 62343, "epoch": 1484} {"train_loss": -6.158063888549805, "global_step": 62344, "epoch": 1484} {"train_loss": -5.884302139282227, "global_step": 62345, "epoch": 1484} {"train_loss": -5.84028434753418, "global_step": 62346, "epoch": 1484} {"train_loss": -5.891409397125244, "global_step": 62347, "epoch": 1484} {"train_loss": -5.991113185882568, "global_step": 62348, "epoch": 1484} {"train_loss": -5.864794731140137, "global_step": 62349, "epoch": 1484} {"train_loss": -6.001325607299805, "global_step": 62350, "epoch": 1484} {"train_loss": -5.960132598876953, "global_step": 62351, "epoch": 1484} {"train_loss": -5.842887878417969, "global_step": 62352, "epoch": 1484} {"train_loss": -5.924498558044434, "global_step": 62353, "epoch": 1484} {"train_loss": -5.938899993896484, "global_step": 62354, "epoch": 1484} {"train_loss": -6.072631359100342, "global_step": 62355, "epoch": 1484} {"train_loss": -5.837601661682129, "global_step": 62356, "epoch": 1484} {"train_loss": -5.8687334060668945, "global_step": 62357, "epoch": 1484} {"train_loss": -6.055421829223633, "global_step": 62358, "epoch": 1484} {"train_loss": -5.945723533630371, "global_step": 62359, "epoch": 1484} {"train_loss": -5.806055068969727, "global_step": 62360, "epoch": 1484} {"train_loss": -5.912060737609863, "global_step": 62361, "epoch": 1484} {"train_loss": -5.896035194396973, "global_step": 62362, "epoch": 1484} {"train_loss": -6.032696723937988, "global_step": 62363, "epoch": 1484} {"train_loss": -5.917532920837402, "global_step": 62364, "epoch": 1484} {"train_loss": -5.9070563316345215, "global_step": 62365, "epoch": 1484} {"train_loss": -5.881424903869629, "global_step": 62366, "epoch": 1484} {"train_loss": -5.9384965896606445, "global_step": 62367, "epoch": 1484} {"train_loss": -5.968050956726074, "global_step": 62368, "epoch": 1484} {"train_loss": -5.932699248904274, "global_step": 62369, "epoch": 1484, "val_loss": 74382.5859375} {"train_loss": -5.884635925292969, "global_step": 62370, "epoch": 1485} {"train_loss": -5.937004089355469, "global_step": 62371, "epoch": 1485} {"train_loss": -5.93575382232666, "global_step": 62372, "epoch": 1485} {"train_loss": -5.913887977600098, "global_step": 62373, "epoch": 1485} {"train_loss": -5.940437316894531, "global_step": 62374, "epoch": 1485} {"train_loss": -5.870845794677734, "global_step": 62375, "epoch": 1485} {"train_loss": -5.912533760070801, "global_step": 62376, "epoch": 1485} {"train_loss": -5.994128704071045, "global_step": 62377, "epoch": 1485} {"train_loss": -5.928093910217285, "global_step": 62378, "epoch": 1485} {"train_loss": -5.9102983474731445, "global_step": 62379, "epoch": 1485} {"train_loss": -6.100243091583252, "global_step": 62380, "epoch": 1485} {"train_loss": -5.968873023986816, "global_step": 62381, "epoch": 1485} {"train_loss": -5.858474254608154, "global_step": 62382, "epoch": 1485} {"train_loss": -5.946836948394775, "global_step": 62383, "epoch": 1485} {"train_loss": -5.893470764160156, "global_step": 62384, "epoch": 1485} {"train_loss": -5.71126651763916, "global_step": 62385, "epoch": 1485} {"train_loss": -5.968866348266602, "global_step": 62386, "epoch": 1485} {"train_loss": -5.843300819396973, "global_step": 62387, "epoch": 1485} {"train_loss": -5.920902252197266, "global_step": 62388, "epoch": 1485} {"train_loss": -5.900604248046875, "global_step": 62389, "epoch": 1485} {"train_loss": -5.939831733703613, "global_step": 62390, "epoch": 1485} {"train_loss": -5.8892822265625, "global_step": 62391, "epoch": 1485} {"train_loss": -5.909793853759766, "global_step": 62392, "epoch": 1485} {"train_loss": -5.9355010986328125, "global_step": 62393, "epoch": 1485} {"train_loss": -5.835062026977539, "global_step": 62394, "epoch": 1485} {"train_loss": -5.735633850097656, "global_step": 62395, "epoch": 1485} {"train_loss": -6.036306858062744, "global_step": 62396, "epoch": 1485} {"train_loss": -5.97925329208374, "global_step": 62397, "epoch": 1485} {"train_loss": -5.975901126861572, "global_step": 62398, "epoch": 1485} {"train_loss": -5.918610572814941, "global_step": 62399, "epoch": 1485} {"train_loss": -5.95695161819458, "global_step": 62400, "epoch": 1485} {"train_loss": -5.953000068664551, "global_step": 62401, "epoch": 1485} {"train_loss": -6.048488616943359, "global_step": 62402, "epoch": 1485} {"train_loss": -5.96435546875, "global_step": 62403, "epoch": 1485} {"train_loss": -5.964903831481934, "global_step": 62404, "epoch": 1485} {"train_loss": -5.90817928314209, "global_step": 62405, "epoch": 1485} {"train_loss": -5.937033653259277, "global_step": 62406, "epoch": 1485} {"train_loss": -5.848913192749023, "global_step": 62407, "epoch": 1485} {"train_loss": -5.958124160766602, "global_step": 62408, "epoch": 1485} {"train_loss": -5.94098424911499, "global_step": 62409, "epoch": 1485} {"train_loss": -5.962469100952148, "global_step": 62410, "epoch": 1485} {"train_loss": -5.927605912798927, "global_step": 62411, "epoch": 1485, "val_loss": 74336.7578125} {"train_loss": -6.013984203338623, "global_step": 62412, "epoch": 1486} {"train_loss": -5.808432579040527, "global_step": 62413, "epoch": 1486} {"train_loss": -6.0119171142578125, "global_step": 62414, "epoch": 1486} {"train_loss": -5.85247802734375, "global_step": 62415, "epoch": 1486} {"train_loss": -5.7987060546875, "global_step": 62416, "epoch": 1486} {"train_loss": -5.955224514007568, "global_step": 62417, "epoch": 1486} {"train_loss": -5.9725236892700195, "global_step": 62418, "epoch": 1486} {"train_loss": -5.797926425933838, "global_step": 62419, "epoch": 1486} {"train_loss": -5.904810428619385, "global_step": 62420, "epoch": 1486} {"train_loss": -5.948733329772949, "global_step": 62421, "epoch": 1486} {"train_loss": -5.939968109130859, "global_step": 62422, "epoch": 1486} {"train_loss": -5.903562068939209, "global_step": 62423, "epoch": 1486} {"train_loss": -5.917271614074707, "global_step": 62424, "epoch": 1486} {"train_loss": -5.957544326782227, "global_step": 62425, "epoch": 1486} {"train_loss": -5.801004409790039, "global_step": 62426, "epoch": 1486} {"train_loss": -5.975837707519531, "global_step": 62427, "epoch": 1486} {"train_loss": -5.838066101074219, "global_step": 62428, "epoch": 1486} {"train_loss": -5.792637825012207, "global_step": 62429, "epoch": 1486} {"train_loss": -5.8828444480896, "global_step": 62430, "epoch": 1486} {"train_loss": -5.830995082855225, "global_step": 62431, "epoch": 1486} {"train_loss": -5.812129020690918, "global_step": 62432, "epoch": 1486} {"train_loss": -5.857487678527832, "global_step": 62433, "epoch": 1486} {"train_loss": -5.7011027336120605, "global_step": 62434, "epoch": 1486} {"train_loss": -5.9134602546691895, "global_step": 62435, "epoch": 1486} {"train_loss": -5.829961776733398, "global_step": 62436, "epoch": 1486} {"train_loss": -5.987449645996094, "global_step": 62437, "epoch": 1486} {"train_loss": -5.832768440246582, "global_step": 62438, "epoch": 1486} {"train_loss": -5.914854049682617, "global_step": 62439, "epoch": 1486} {"train_loss": -5.824919700622559, "global_step": 62440, "epoch": 1486} {"train_loss": -6.062960147857666, "global_step": 62441, "epoch": 1486} {"train_loss": -5.882466793060303, "global_step": 62442, "epoch": 1486} {"train_loss": -5.831090927124023, "global_step": 62443, "epoch": 1486} {"train_loss": -5.975740909576416, "global_step": 62444, "epoch": 1486} {"train_loss": -5.937033653259277, "global_step": 62445, "epoch": 1486} {"train_loss": -5.911681175231934, "global_step": 62446, "epoch": 1486} {"train_loss": -5.891851425170898, "global_step": 62447, "epoch": 1486} {"train_loss": -5.996264934539795, "global_step": 62448, "epoch": 1486} {"train_loss": -5.967320442199707, "global_step": 62449, "epoch": 1486} {"train_loss": -6.022624492645264, "global_step": 62450, "epoch": 1486} {"train_loss": -6.06890869140625, "global_step": 62451, "epoch": 1486} {"train_loss": -5.900136947631836, "global_step": 62452, "epoch": 1486} {"train_loss": -5.904137202671596, "global_step": 62453, "epoch": 1486, "val_loss": 74466.3046875} {"train_loss": -5.918722152709961, "global_step": 62454, "epoch": 1487} {"train_loss": -5.871036529541016, "global_step": 62455, "epoch": 1487} {"train_loss": -5.9388298988342285, "global_step": 62456, "epoch": 1487} {"train_loss": -5.894467353820801, "global_step": 62457, "epoch": 1487} {"train_loss": -5.956600189208984, "global_step": 62458, "epoch": 1487} {"train_loss": -5.626897811889648, "global_step": 62459, "epoch": 1487} {"train_loss": -5.946621417999268, "global_step": 62460, "epoch": 1487} {"train_loss": -5.921013832092285, "global_step": 62461, "epoch": 1487} {"train_loss": -5.93553352355957, "global_step": 62462, "epoch": 1487} {"train_loss": -5.975948333740234, "global_step": 62463, "epoch": 1487} {"train_loss": -5.866163730621338, "global_step": 62464, "epoch": 1487} {"train_loss": -5.756842613220215, "global_step": 62465, "epoch": 1487} {"train_loss": -5.768012046813965, "global_step": 62466, "epoch": 1487} {"train_loss": -5.968263626098633, "global_step": 62467, "epoch": 1487} {"train_loss": -5.941439628601074, "global_step": 62468, "epoch": 1487} {"train_loss": -5.829577445983887, "global_step": 62469, "epoch": 1487} {"train_loss": -5.92704963684082, "global_step": 62470, "epoch": 1487} {"train_loss": -5.835513114929199, "global_step": 62471, "epoch": 1487} {"train_loss": -5.812229633331299, "global_step": 62472, "epoch": 1487} {"train_loss": -5.7966766357421875, "global_step": 62473, "epoch": 1487} {"train_loss": -5.844447135925293, "global_step": 62474, "epoch": 1487} {"train_loss": -5.915812969207764, "global_step": 62475, "epoch": 1487} {"train_loss": -5.987793922424316, "global_step": 62476, "epoch": 1487} {"train_loss": -5.948007106781006, "global_step": 62477, "epoch": 1487} {"train_loss": -5.9302592277526855, "global_step": 62478, "epoch": 1487} {"train_loss": -5.822750091552734, "global_step": 62479, "epoch": 1487} {"train_loss": -5.983263969421387, "global_step": 62480, "epoch": 1487} {"train_loss": -5.914361953735352, "global_step": 62481, "epoch": 1487} {"train_loss": -5.949289798736572, "global_step": 62482, "epoch": 1487} {"train_loss": -5.916067600250244, "global_step": 62483, "epoch": 1487} {"train_loss": -5.780364036560059, "global_step": 62484, "epoch": 1487} {"train_loss": -5.9614577293396, "global_step": 62485, "epoch": 1487} {"train_loss": -5.974900245666504, "global_step": 62486, "epoch": 1487} {"train_loss": -5.821185111999512, "global_step": 62487, "epoch": 1487} {"train_loss": -5.963621139526367, "global_step": 62488, "epoch": 1487} {"train_loss": -5.941959381103516, "global_step": 62489, "epoch": 1487} {"train_loss": -5.950281143188477, "global_step": 62490, "epoch": 1487} {"train_loss": -5.835604190826416, "global_step": 62491, "epoch": 1487} {"train_loss": -6.04347562789917, "global_step": 62492, "epoch": 1487} {"train_loss": -5.822553634643555, "global_step": 62493, "epoch": 1487} {"train_loss": -5.91508674621582, "global_step": 62494, "epoch": 1487} {"train_loss": -5.895672809510004, "global_step": 62495, "epoch": 1487, "val_loss": 74515.65625} {"train_loss": -5.8477911949157715, "global_step": 62496, "epoch": 1488} {"train_loss": -5.983725547790527, "global_step": 62497, "epoch": 1488} {"train_loss": -5.9292755126953125, "global_step": 62498, "epoch": 1488} {"train_loss": -5.878237724304199, "global_step": 62499, "epoch": 1488} {"train_loss": -5.872823715209961, "global_step": 62500, "epoch": 1488} {"train_loss": -5.9067230224609375, "global_step": 62501, "epoch": 1488} {"train_loss": -5.744831085205078, "global_step": 62502, "epoch": 1488} {"train_loss": -6.027342796325684, "global_step": 62503, "epoch": 1488} {"train_loss": -5.9356560707092285, "global_step": 62504, "epoch": 1488} {"train_loss": -6.107025623321533, "global_step": 62505, "epoch": 1488} {"train_loss": -5.958157062530518, "global_step": 62506, "epoch": 1488} {"train_loss": -5.851345062255859, "global_step": 62507, "epoch": 1488} {"train_loss": -5.9980149269104, "global_step": 62508, "epoch": 1488} {"train_loss": -5.918732166290283, "global_step": 62509, "epoch": 1488} {"train_loss": -5.914671897888184, "global_step": 62510, "epoch": 1488} {"train_loss": -5.991592884063721, "global_step": 62511, "epoch": 1488} {"train_loss": -5.923501014709473, "global_step": 62512, "epoch": 1488} {"train_loss": -5.946083068847656, "global_step": 62513, "epoch": 1488} {"train_loss": -5.898080825805664, "global_step": 62514, "epoch": 1488} {"train_loss": -5.976339340209961, "global_step": 62515, "epoch": 1488} {"train_loss": -6.06736946105957, "global_step": 62516, "epoch": 1488} {"train_loss": -5.940279483795166, "global_step": 62517, "epoch": 1488} {"train_loss": -6.044686794281006, "global_step": 62518, "epoch": 1488} {"train_loss": -5.930417060852051, "global_step": 62519, "epoch": 1488} {"train_loss": -5.928082466125488, "global_step": 62520, "epoch": 1488} {"train_loss": -5.995114326477051, "global_step": 62521, "epoch": 1488} {"train_loss": -5.922857284545898, "global_step": 62522, "epoch": 1488} {"train_loss": -5.822021484375, "global_step": 62523, "epoch": 1488} {"train_loss": -5.785406112670898, "global_step": 62524, "epoch": 1488} {"train_loss": -5.911073684692383, "global_step": 62525, "epoch": 1488} {"train_loss": -5.889708042144775, "global_step": 62526, "epoch": 1488} {"train_loss": -5.84305477142334, "global_step": 62527, "epoch": 1488} {"train_loss": -5.8110785484313965, "global_step": 62528, "epoch": 1488} {"train_loss": -5.9487624168396, "global_step": 62529, "epoch": 1488} {"train_loss": -5.863855838775635, "global_step": 62530, "epoch": 1488} {"train_loss": -5.8259501457214355, "global_step": 62531, "epoch": 1488} {"train_loss": -5.929248332977295, "global_step": 62532, "epoch": 1488} {"train_loss": -5.842439651489258, "global_step": 62533, "epoch": 1488} {"train_loss": -5.772956848144531, "global_step": 62534, "epoch": 1488} {"train_loss": -5.9350786209106445, "global_step": 62535, "epoch": 1488} {"train_loss": -5.900918006896973, "global_step": 62536, "epoch": 1488} {"train_loss": -5.916948091416132, "global_step": 62537, "epoch": 1488, "val_loss": 74649.7890625} {"train_loss": -5.956938743591309, "global_step": 62538, "epoch": 1489} {"train_loss": -5.92869758605957, "global_step": 62539, "epoch": 1489} {"train_loss": -5.795376777648926, "global_step": 62540, "epoch": 1489} {"train_loss": -5.94758415222168, "global_step": 62541, "epoch": 1489} {"train_loss": -5.852071762084961, "global_step": 62542, "epoch": 1489} {"train_loss": -6.010465621948242, "global_step": 62543, "epoch": 1489} {"train_loss": -5.9096784591674805, "global_step": 62544, "epoch": 1489} {"train_loss": -5.8429694175720215, "global_step": 62545, "epoch": 1489} {"train_loss": -5.981622219085693, "global_step": 62546, "epoch": 1489} {"train_loss": -5.962794303894043, "global_step": 62547, "epoch": 1489} {"train_loss": -5.974071979522705, "global_step": 62548, "epoch": 1489} {"train_loss": -5.939918518066406, "global_step": 62549, "epoch": 1489} {"train_loss": -6.012201309204102, "global_step": 62550, "epoch": 1489} {"train_loss": -6.003687858581543, "global_step": 62551, "epoch": 1489} {"train_loss": -5.898312091827393, "global_step": 62552, "epoch": 1489} {"train_loss": -5.965105056762695, "global_step": 62553, "epoch": 1489} {"train_loss": -5.864404201507568, "global_step": 62554, "epoch": 1489} {"train_loss": -5.862281799316406, "global_step": 62555, "epoch": 1489} {"train_loss": -6.055968284606934, "global_step": 62556, "epoch": 1489} {"train_loss": -5.959759712219238, "global_step": 62557, "epoch": 1489} {"train_loss": -5.9984354972839355, "global_step": 62558, "epoch": 1489} {"train_loss": -6.044445991516113, "global_step": 62559, "epoch": 1489} {"train_loss": -5.905125141143799, "global_step": 62560, "epoch": 1489} {"train_loss": -5.876079082489014, "global_step": 62561, "epoch": 1489} {"train_loss": -6.047650337219238, "global_step": 62562, "epoch": 1489} {"train_loss": -5.9183454513549805, "global_step": 62563, "epoch": 1489} {"train_loss": -5.9831647872924805, "global_step": 62564, "epoch": 1489} {"train_loss": -5.93950080871582, "global_step": 62565, "epoch": 1489} {"train_loss": -5.953211784362793, "global_step": 62566, "epoch": 1489} {"train_loss": -5.985052108764648, "global_step": 62567, "epoch": 1489} {"train_loss": -6.045975208282471, "global_step": 62568, "epoch": 1489} {"train_loss": -5.876218795776367, "global_step": 62569, "epoch": 1489} {"train_loss": -5.797700881958008, "global_step": 62570, "epoch": 1489} {"train_loss": -5.988130569458008, "global_step": 62571, "epoch": 1489} {"train_loss": -5.9058427810668945, "global_step": 62572, "epoch": 1489} {"train_loss": -5.950445175170898, "global_step": 62573, "epoch": 1489} {"train_loss": -5.905066013336182, "global_step": 62574, "epoch": 1489} {"train_loss": -5.848200798034668, "global_step": 62575, "epoch": 1489} {"train_loss": -6.020546913146973, "global_step": 62576, "epoch": 1489} {"train_loss": -5.865673542022705, "global_step": 62577, "epoch": 1489} {"train_loss": -5.871142387390137, "global_step": 62578, "epoch": 1489} {"train_loss": -5.935902277628581, "global_step": 62579, "epoch": 1489, "val_loss": 74421.9765625} {"train_loss": -6.076293468475342, "global_step": 62580, "epoch": 1490} {"train_loss": -5.990024566650391, "global_step": 62581, "epoch": 1490} {"train_loss": -6.036201477050781, "global_step": 62582, "epoch": 1490} {"train_loss": -5.921295166015625, "global_step": 62583, "epoch": 1490} {"train_loss": -5.971009731292725, "global_step": 62584, "epoch": 1490} {"train_loss": -5.978110313415527, "global_step": 62585, "epoch": 1490} {"train_loss": -5.935531139373779, "global_step": 62586, "epoch": 1490} {"train_loss": -5.923055648803711, "global_step": 62587, "epoch": 1490} {"train_loss": -5.843679428100586, "global_step": 62588, "epoch": 1490} {"train_loss": -5.874948978424072, "global_step": 62589, "epoch": 1490} {"train_loss": -5.952553749084473, "global_step": 62590, "epoch": 1490} {"train_loss": -5.979477882385254, "global_step": 62591, "epoch": 1490} {"train_loss": -5.955435752868652, "global_step": 62592, "epoch": 1490} {"train_loss": -6.011606693267822, "global_step": 62593, "epoch": 1490} {"train_loss": -6.007826328277588, "global_step": 62594, "epoch": 1490} {"train_loss": -5.932464599609375, "global_step": 62595, "epoch": 1490} {"train_loss": -5.8833327293396, "global_step": 62596, "epoch": 1490} {"train_loss": -5.9223809242248535, "global_step": 62597, "epoch": 1490} {"train_loss": -6.015415191650391, "global_step": 62598, "epoch": 1490} {"train_loss": -5.952366352081299, "global_step": 62599, "epoch": 1490} {"train_loss": -5.86827278137207, "global_step": 62600, "epoch": 1490} {"train_loss": -5.932847023010254, "global_step": 62601, "epoch": 1490} {"train_loss": -5.7664079666137695, "global_step": 62602, "epoch": 1490} {"train_loss": -5.943408966064453, "global_step": 62603, "epoch": 1490} {"train_loss": -5.972816467285156, "global_step": 62604, "epoch": 1490} {"train_loss": -5.829888820648193, "global_step": 62605, "epoch": 1490} {"train_loss": -5.972958564758301, "global_step": 62606, "epoch": 1490} {"train_loss": -5.917792797088623, "global_step": 62607, "epoch": 1490} {"train_loss": -5.80436897277832, "global_step": 62608, "epoch": 1490} {"train_loss": -5.887511253356934, "global_step": 62609, "epoch": 1490} {"train_loss": -5.963255405426025, "global_step": 62610, "epoch": 1490} {"train_loss": -5.815408706665039, "global_step": 62611, "epoch": 1490} {"train_loss": -5.953110694885254, "global_step": 62612, "epoch": 1490} {"train_loss": -5.860044956207275, "global_step": 62613, "epoch": 1490} {"train_loss": -5.9366960525512695, "global_step": 62614, "epoch": 1490} {"train_loss": -5.894710063934326, "global_step": 62615, "epoch": 1490} {"train_loss": -5.8631463050842285, "global_step": 62616, "epoch": 1490} {"train_loss": -5.930368900299072, "global_step": 62617, "epoch": 1490} {"train_loss": -5.949893951416016, "global_step": 62618, "epoch": 1490} {"train_loss": -5.9350433349609375, "global_step": 62619, "epoch": 1490} {"train_loss": -5.8846659660339355, "global_step": 62620, "epoch": 1490} {"train_loss": -5.9257980074201315, "global_step": 62621, "epoch": 1490, "val_loss": 74996.953125} {"train_loss": -5.799812316894531, "global_step": 62622, "epoch": 1491} {"train_loss": -5.862334728240967, "global_step": 62623, "epoch": 1491} {"train_loss": -6.064443588256836, "global_step": 62624, "epoch": 1491} {"train_loss": -5.791966438293457, "global_step": 62625, "epoch": 1491} {"train_loss": -5.911740303039551, "global_step": 62626, "epoch": 1491} {"train_loss": -5.9016923904418945, "global_step": 62627, "epoch": 1491} {"train_loss": -5.795197486877441, "global_step": 62628, "epoch": 1491} {"train_loss": -5.954657554626465, "global_step": 62629, "epoch": 1491} {"train_loss": -6.0113420486450195, "global_step": 62630, "epoch": 1491} {"train_loss": -5.938990592956543, "global_step": 62631, "epoch": 1491} {"train_loss": -5.911409854888916, "global_step": 62632, "epoch": 1491} {"train_loss": -5.91923189163208, "global_step": 62633, "epoch": 1491} {"train_loss": -5.993654251098633, "global_step": 62634, "epoch": 1491} {"train_loss": -5.816805839538574, "global_step": 62635, "epoch": 1491} {"train_loss": -5.939121723175049, "global_step": 62636, "epoch": 1491} {"train_loss": -5.957662582397461, "global_step": 62637, "epoch": 1491} {"train_loss": -5.8800201416015625, "global_step": 62638, "epoch": 1491} {"train_loss": -6.047508716583252, "global_step": 62639, "epoch": 1491} {"train_loss": -5.941810607910156, "global_step": 62640, "epoch": 1491} {"train_loss": -5.844783782958984, "global_step": 62641, "epoch": 1491} {"train_loss": -6.063054084777832, "global_step": 62642, "epoch": 1491} {"train_loss": -6.008727073669434, "global_step": 62643, "epoch": 1491} {"train_loss": -5.959486961364746, "global_step": 62644, "epoch": 1491} {"train_loss": -5.995791912078857, "global_step": 62645, "epoch": 1491} {"train_loss": -5.944225311279297, "global_step": 62646, "epoch": 1491} {"train_loss": -6.02018928527832, "global_step": 62647, "epoch": 1491} {"train_loss": -5.946396827697754, "global_step": 62648, "epoch": 1491} {"train_loss": -6.033388137817383, "global_step": 62649, "epoch": 1491} {"train_loss": -5.951791763305664, "global_step": 62650, "epoch": 1491} {"train_loss": -5.951010704040527, "global_step": 62651, "epoch": 1491} {"train_loss": -5.8622212409973145, "global_step": 62652, "epoch": 1491} {"train_loss": -5.9078288078308105, "global_step": 62653, "epoch": 1491} {"train_loss": -5.97775936126709, "global_step": 62654, "epoch": 1491} {"train_loss": -5.921817302703857, "global_step": 62655, "epoch": 1491} {"train_loss": -5.9463372230529785, "global_step": 62656, "epoch": 1491} {"train_loss": -5.8704633712768555, "global_step": 62657, "epoch": 1491} {"train_loss": -5.964450836181641, "global_step": 62658, "epoch": 1491} {"train_loss": -5.918452262878418, "global_step": 62659, "epoch": 1491} {"train_loss": -5.963688850402832, "global_step": 62660, "epoch": 1491} {"train_loss": -5.863530158996582, "global_step": 62661, "epoch": 1491} {"train_loss": -5.905175685882568, "global_step": 62662, "epoch": 1491} {"train_loss": -5.931553511392503, "global_step": 62663, "epoch": 1491, "val_loss": 74552.7265625} {"train_loss": -5.864681720733643, "global_step": 62664, "epoch": 1492} {"train_loss": -5.960057258605957, "global_step": 62665, "epoch": 1492} {"train_loss": -5.863910675048828, "global_step": 62666, "epoch": 1492} {"train_loss": -5.912996292114258, "global_step": 62667, "epoch": 1492} {"train_loss": -5.8559980392456055, "global_step": 62668, "epoch": 1492} {"train_loss": -5.936631202697754, "global_step": 62669, "epoch": 1492} {"train_loss": -5.957973957061768, "global_step": 62670, "epoch": 1492} {"train_loss": -5.898793697357178, "global_step": 62671, "epoch": 1492} {"train_loss": -5.895822048187256, "global_step": 62672, "epoch": 1492} {"train_loss": -5.923972129821777, "global_step": 62673, "epoch": 1492} {"train_loss": -6.139970302581787, "global_step": 62674, "epoch": 1492} {"train_loss": -5.899494171142578, "global_step": 62675, "epoch": 1492} {"train_loss": -5.958808898925781, "global_step": 62676, "epoch": 1492} {"train_loss": -6.0659589767456055, "global_step": 62677, "epoch": 1492} {"train_loss": -6.019606113433838, "global_step": 62678, "epoch": 1492} {"train_loss": -5.956063747406006, "global_step": 62679, "epoch": 1492} {"train_loss": -5.985478401184082, "global_step": 62680, "epoch": 1492} {"train_loss": -5.910150527954102, "global_step": 62681, "epoch": 1492} {"train_loss": -5.864770889282227, "global_step": 62682, "epoch": 1492} {"train_loss": -5.9450297355651855, "global_step": 62683, "epoch": 1492} {"train_loss": -5.8864426612854, "global_step": 62684, "epoch": 1492} {"train_loss": -5.95397424697876, "global_step": 62685, "epoch": 1492} {"train_loss": -6.024194717407227, "global_step": 62686, "epoch": 1492} {"train_loss": -5.903281211853027, "global_step": 62687, "epoch": 1492} {"train_loss": -5.888343811035156, "global_step": 62688, "epoch": 1492} {"train_loss": -5.974977493286133, "global_step": 62689, "epoch": 1492} {"train_loss": -5.876898765563965, "global_step": 62690, "epoch": 1492} {"train_loss": -5.831063270568848, "global_step": 62691, "epoch": 1492} {"train_loss": -5.940938949584961, "global_step": 62692, "epoch": 1492} {"train_loss": -5.939119815826416, "global_step": 62693, "epoch": 1492} {"train_loss": -5.889688491821289, "global_step": 62694, "epoch": 1492} {"train_loss": -5.896522521972656, "global_step": 62695, "epoch": 1492} {"train_loss": -5.823808193206787, "global_step": 62696, "epoch": 1492} {"train_loss": -5.856435298919678, "global_step": 62697, "epoch": 1492} {"train_loss": -5.83258581161499, "global_step": 62698, "epoch": 1492} {"train_loss": -5.9950761795043945, "global_step": 62699, "epoch": 1492} {"train_loss": -5.834465980529785, "global_step": 62700, "epoch": 1492} {"train_loss": -6.026823043823242, "global_step": 62701, "epoch": 1492} {"train_loss": -5.949413776397705, "global_step": 62702, "epoch": 1492} {"train_loss": -5.97420597076416, "global_step": 62703, "epoch": 1492} {"train_loss": -5.809808254241943, "global_step": 62704, "epoch": 1492} {"train_loss": -5.9268284525190085, "global_step": 62705, "epoch": 1492, "val_loss": 74710.984375} {"train_loss": -5.866781234741211, "global_step": 62706, "epoch": 1493} {"train_loss": -5.906767845153809, "global_step": 62707, "epoch": 1493} {"train_loss": -5.9660539627075195, "global_step": 62708, "epoch": 1493} {"train_loss": -5.894479751586914, "global_step": 62709, "epoch": 1493} {"train_loss": -5.920131206512451, "global_step": 62710, "epoch": 1493} {"train_loss": -5.9214677810668945, "global_step": 62711, "epoch": 1493} {"train_loss": -5.943536758422852, "global_step": 62712, "epoch": 1493} {"train_loss": -6.056615829467773, "global_step": 62713, "epoch": 1493} {"train_loss": -5.945946216583252, "global_step": 62714, "epoch": 1493} {"train_loss": -5.950586318969727, "global_step": 62715, "epoch": 1493} {"train_loss": -5.848231315612793, "global_step": 62716, "epoch": 1493} {"train_loss": -5.9652533531188965, "global_step": 62717, "epoch": 1493} {"train_loss": -5.948452949523926, "global_step": 62718, "epoch": 1493} {"train_loss": -5.90753698348999, "global_step": 62719, "epoch": 1493} {"train_loss": -5.887424468994141, "global_step": 62720, "epoch": 1493} {"train_loss": -5.97479248046875, "global_step": 62721, "epoch": 1493} {"train_loss": -5.796504974365234, "global_step": 62722, "epoch": 1493} {"train_loss": -5.933018684387207, "global_step": 62723, "epoch": 1493} {"train_loss": -5.843178749084473, "global_step": 62724, "epoch": 1493} {"train_loss": -5.968824863433838, "global_step": 62725, "epoch": 1493} {"train_loss": -5.840795993804932, "global_step": 62726, "epoch": 1493} {"train_loss": -5.989768028259277, "global_step": 62727, "epoch": 1493} {"train_loss": -5.970565319061279, "global_step": 62728, "epoch": 1493} {"train_loss": -5.9515299797058105, "global_step": 62729, "epoch": 1493} {"train_loss": -6.025442123413086, "global_step": 62730, "epoch": 1493} {"train_loss": -5.8850178718566895, "global_step": 62731, "epoch": 1493} {"train_loss": -5.901518821716309, "global_step": 62732, "epoch": 1493} {"train_loss": -5.877048969268799, "global_step": 62733, "epoch": 1493} {"train_loss": -5.986523151397705, "global_step": 62734, "epoch": 1493} {"train_loss": -5.951890468597412, "global_step": 62735, "epoch": 1493} {"train_loss": -5.880125999450684, "global_step": 62736, "epoch": 1493} {"train_loss": -6.036618232727051, "global_step": 62737, "epoch": 1493} {"train_loss": -5.946077823638916, "global_step": 62738, "epoch": 1493} {"train_loss": -5.943967342376709, "global_step": 62739, "epoch": 1493} {"train_loss": -5.91973876953125, "global_step": 62740, "epoch": 1493} {"train_loss": -5.927896499633789, "global_step": 62741, "epoch": 1493} {"train_loss": -5.833697319030762, "global_step": 62742, "epoch": 1493} {"train_loss": -5.904123306274414, "global_step": 62743, "epoch": 1493} {"train_loss": -5.835803031921387, "global_step": 62744, "epoch": 1493} {"train_loss": -5.911844253540039, "global_step": 62745, "epoch": 1493} {"train_loss": -5.800804615020752, "global_step": 62746, "epoch": 1493} {"train_loss": -5.9189123539697555, "global_step": 62747, "epoch": 1493, "val_loss": 74456.2578125} {"train_loss": -5.928243637084961, "global_step": 62748, "epoch": 1494} {"train_loss": -5.966042518615723, "global_step": 62749, "epoch": 1494} {"train_loss": -5.952425003051758, "global_step": 62750, "epoch": 1494} {"train_loss": -5.842411994934082, "global_step": 62751, "epoch": 1494} {"train_loss": -5.940074920654297, "global_step": 62752, "epoch": 1494} {"train_loss": -5.908083438873291, "global_step": 62753, "epoch": 1494} {"train_loss": -6.023526191711426, "global_step": 62754, "epoch": 1494} {"train_loss": -6.056954383850098, "global_step": 62755, "epoch": 1494} {"train_loss": -5.880489349365234, "global_step": 62756, "epoch": 1494} {"train_loss": -6.013506889343262, "global_step": 62757, "epoch": 1494} {"train_loss": -5.907135963439941, "global_step": 62758, "epoch": 1494} {"train_loss": -6.027490139007568, "global_step": 62759, "epoch": 1494} {"train_loss": -5.99783992767334, "global_step": 62760, "epoch": 1494} {"train_loss": -5.8623366355896, "global_step": 62761, "epoch": 1494} {"train_loss": -5.870879650115967, "global_step": 62762, "epoch": 1494} {"train_loss": -5.907684326171875, "global_step": 62763, "epoch": 1494} {"train_loss": -5.90080451965332, "global_step": 62764, "epoch": 1494} {"train_loss": -5.98783016204834, "global_step": 62765, "epoch": 1494} {"train_loss": -5.9103922843933105, "global_step": 62766, "epoch": 1494} {"train_loss": -5.709927082061768, "global_step": 62767, "epoch": 1494} {"train_loss": -5.867752552032471, "global_step": 62768, "epoch": 1494} {"train_loss": -5.892951011657715, "global_step": 62769, "epoch": 1494} {"train_loss": -5.770909786224365, "global_step": 62770, "epoch": 1494} {"train_loss": -5.7986249923706055, "global_step": 62771, "epoch": 1494} {"train_loss": -5.952930450439453, "global_step": 62772, "epoch": 1494} {"train_loss": -5.899374008178711, "global_step": 62773, "epoch": 1494} {"train_loss": -5.791618347167969, "global_step": 62774, "epoch": 1494} {"train_loss": -5.938529968261719, "global_step": 62775, "epoch": 1494} {"train_loss": -5.936617851257324, "global_step": 62776, "epoch": 1494} {"train_loss": -5.951942443847656, "global_step": 62777, "epoch": 1494} {"train_loss": -5.9219255447387695, "global_step": 62778, "epoch": 1494} {"train_loss": -5.939676284790039, "global_step": 62779, "epoch": 1494} {"train_loss": -5.780150890350342, "global_step": 62780, "epoch": 1494} {"train_loss": -5.896763801574707, "global_step": 62781, "epoch": 1494} {"train_loss": -6.027973175048828, "global_step": 62782, "epoch": 1494} {"train_loss": -5.866230010986328, "global_step": 62783, "epoch": 1494} {"train_loss": -5.901009559631348, "global_step": 62784, "epoch": 1494} {"train_loss": -5.92232608795166, "global_step": 62785, "epoch": 1494} {"train_loss": -6.029752254486084, "global_step": 62786, "epoch": 1494} {"train_loss": -5.839034080505371, "global_step": 62787, "epoch": 1494} {"train_loss": -5.954172134399414, "global_step": 62788, "epoch": 1494} {"train_loss": -5.915358418510074, "global_step": 62789, "epoch": 1494, "val_loss": 74426.5859375} {"train_loss": -5.930501937866211, "global_step": 62790, "epoch": 1495} {"train_loss": -6.006137847900391, "global_step": 62791, "epoch": 1495} {"train_loss": -6.083498477935791, "global_step": 62792, "epoch": 1495} {"train_loss": -5.89933967590332, "global_step": 62793, "epoch": 1495} {"train_loss": -6.014742851257324, "global_step": 62794, "epoch": 1495} {"train_loss": -5.872475624084473, "global_step": 62795, "epoch": 1495} {"train_loss": -5.937483787536621, "global_step": 62796, "epoch": 1495} {"train_loss": -6.04200553894043, "global_step": 62797, "epoch": 1495} {"train_loss": -5.945310592651367, "global_step": 62798, "epoch": 1495} {"train_loss": -5.876588821411133, "global_step": 62799, "epoch": 1495} {"train_loss": -5.957343101501465, "global_step": 62800, "epoch": 1495} {"train_loss": -6.002856731414795, "global_step": 62801, "epoch": 1495} {"train_loss": -5.951169490814209, "global_step": 62802, "epoch": 1495} {"train_loss": -5.923738956451416, "global_step": 62803, "epoch": 1495} {"train_loss": -5.922492027282715, "global_step": 62804, "epoch": 1495} {"train_loss": -5.934998512268066, "global_step": 62805, "epoch": 1495} {"train_loss": -6.03023099899292, "global_step": 62806, "epoch": 1495} {"train_loss": -5.924320220947266, "global_step": 62807, "epoch": 1495} {"train_loss": -5.93826150894165, "global_step": 62808, "epoch": 1495} {"train_loss": -5.829967498779297, "global_step": 62809, "epoch": 1495} {"train_loss": -5.861930847167969, "global_step": 62810, "epoch": 1495} {"train_loss": -5.903534412384033, "global_step": 62811, "epoch": 1495} {"train_loss": -5.893445014953613, "global_step": 62812, "epoch": 1495} {"train_loss": -5.9462456703186035, "global_step": 62813, "epoch": 1495} {"train_loss": -5.883788585662842, "global_step": 62814, "epoch": 1495} {"train_loss": -5.791782379150391, "global_step": 62815, "epoch": 1495} {"train_loss": -5.912076950073242, "global_step": 62816, "epoch": 1495} {"train_loss": -5.861948490142822, "global_step": 62817, "epoch": 1495} {"train_loss": -5.894702434539795, "global_step": 62818, "epoch": 1495} {"train_loss": -5.9083991050720215, "global_step": 62819, "epoch": 1495} {"train_loss": -5.823659896850586, "global_step": 62820, "epoch": 1495} {"train_loss": -5.800016403198242, "global_step": 62821, "epoch": 1495} {"train_loss": -5.863568305969238, "global_step": 62822, "epoch": 1495} {"train_loss": -5.83054256439209, "global_step": 62823, "epoch": 1495} {"train_loss": -5.865989685058594, "global_step": 62824, "epoch": 1495} {"train_loss": -5.885823726654053, "global_step": 62825, "epoch": 1495} {"train_loss": -5.967809677124023, "global_step": 62826, "epoch": 1495} {"train_loss": -5.876015663146973, "global_step": 62827, "epoch": 1495} {"train_loss": -5.880855560302734, "global_step": 62828, "epoch": 1495} {"train_loss": -5.739677429199219, "global_step": 62829, "epoch": 1495} {"train_loss": -6.032014846801758, "global_step": 62830, "epoch": 1495} {"train_loss": -5.911752405620756, "global_step": 62831, "epoch": 1495, "val_loss": 74518.3125} {"train_loss": -6.009927749633789, "global_step": 62832, "epoch": 1496} {"train_loss": -5.916989326477051, "global_step": 62833, "epoch": 1496} {"train_loss": -5.920445442199707, "global_step": 62834, "epoch": 1496} {"train_loss": -5.887402534484863, "global_step": 62835, "epoch": 1496} {"train_loss": -5.847733974456787, "global_step": 62836, "epoch": 1496} {"train_loss": -5.961575508117676, "global_step": 62837, "epoch": 1496} {"train_loss": -5.859805107116699, "global_step": 62838, "epoch": 1496} {"train_loss": -6.018232345581055, "global_step": 62839, "epoch": 1496} {"train_loss": -5.941240310668945, "global_step": 62840, "epoch": 1496} {"train_loss": -6.012377738952637, "global_step": 62841, "epoch": 1496} {"train_loss": -6.023955345153809, "global_step": 62842, "epoch": 1496} {"train_loss": -5.99446964263916, "global_step": 62843, "epoch": 1496} {"train_loss": -5.940575122833252, "global_step": 62844, "epoch": 1496} {"train_loss": -5.914135932922363, "global_step": 62845, "epoch": 1496} {"train_loss": -5.9555511474609375, "global_step": 62846, "epoch": 1496} {"train_loss": -5.963589668273926, "global_step": 62847, "epoch": 1496} {"train_loss": -6.057552814483643, "global_step": 62848, "epoch": 1496} {"train_loss": -6.048971176147461, "global_step": 62849, "epoch": 1496} {"train_loss": -5.941020488739014, "global_step": 62850, "epoch": 1496} {"train_loss": -5.884768486022949, "global_step": 62851, "epoch": 1496} {"train_loss": -5.970997333526611, "global_step": 62852, "epoch": 1496} {"train_loss": -5.79766845703125, "global_step": 62853, "epoch": 1496} {"train_loss": -5.928834438323975, "global_step": 62854, "epoch": 1496} {"train_loss": -6.087302207946777, "global_step": 62855, "epoch": 1496} {"train_loss": -5.8825225830078125, "global_step": 62856, "epoch": 1496} {"train_loss": -5.889244079589844, "global_step": 62857, "epoch": 1496} {"train_loss": -5.876817226409912, "global_step": 62858, "epoch": 1496} {"train_loss": -5.800605297088623, "global_step": 62859, "epoch": 1496} {"train_loss": -6.00715446472168, "global_step": 62860, "epoch": 1496} {"train_loss": -5.85384464263916, "global_step": 62861, "epoch": 1496} {"train_loss": -5.897435665130615, "global_step": 62862, "epoch": 1496} {"train_loss": -5.9742608070373535, "global_step": 62863, "epoch": 1496} {"train_loss": -6.0212297439575195, "global_step": 62864, "epoch": 1496} {"train_loss": -6.021510601043701, "global_step": 62865, "epoch": 1496} {"train_loss": -5.8978424072265625, "global_step": 62866, "epoch": 1496} {"train_loss": -5.851296424865723, "global_step": 62867, "epoch": 1496} {"train_loss": -5.963594436645508, "global_step": 62868, "epoch": 1496} {"train_loss": -5.86449670791626, "global_step": 62869, "epoch": 1496} {"train_loss": -5.900699615478516, "global_step": 62870, "epoch": 1496} {"train_loss": -5.986484527587891, "global_step": 62871, "epoch": 1496} {"train_loss": -6.006555080413818, "global_step": 62872, "epoch": 1496} {"train_loss": -5.940082436516171, "global_step": 62873, "epoch": 1496, "val_loss": 74607.8125} {"train_loss": -5.913140773773193, "global_step": 62874, "epoch": 1497} {"train_loss": -5.9486870765686035, "global_step": 62875, "epoch": 1497} {"train_loss": -5.958863258361816, "global_step": 62876, "epoch": 1497} {"train_loss": -5.8651227951049805, "global_step": 62877, "epoch": 1497} {"train_loss": -5.902595520019531, "global_step": 62878, "epoch": 1497} {"train_loss": -6.002054214477539, "global_step": 62879, "epoch": 1497} {"train_loss": -5.975602149963379, "global_step": 62880, "epoch": 1497} {"train_loss": -5.936773300170898, "global_step": 62881, "epoch": 1497} {"train_loss": -5.972256183624268, "global_step": 62882, "epoch": 1497} {"train_loss": -5.918203353881836, "global_step": 62883, "epoch": 1497} {"train_loss": -5.84102201461792, "global_step": 62884, "epoch": 1497} {"train_loss": -5.975234031677246, "global_step": 62885, "epoch": 1497} {"train_loss": -5.954216480255127, "global_step": 62886, "epoch": 1497} {"train_loss": -5.864108562469482, "global_step": 62887, "epoch": 1497} {"train_loss": -5.900391578674316, "global_step": 62888, "epoch": 1497} {"train_loss": -5.9750566482543945, "global_step": 62889, "epoch": 1497} {"train_loss": -5.975231170654297, "global_step": 62890, "epoch": 1497} {"train_loss": -5.767837047576904, "global_step": 62891, "epoch": 1497} {"train_loss": -5.958240509033203, "global_step": 62892, "epoch": 1497} {"train_loss": -5.966920375823975, "global_step": 62893, "epoch": 1497} {"train_loss": -5.867726802825928, "global_step": 62894, "epoch": 1497} {"train_loss": -5.9949846267700195, "global_step": 62895, "epoch": 1497} {"train_loss": -5.923831939697266, "global_step": 62896, "epoch": 1497} {"train_loss": -5.983396530151367, "global_step": 62897, "epoch": 1497} {"train_loss": -5.917230129241943, "global_step": 62898, "epoch": 1497} {"train_loss": -5.966466426849365, "global_step": 62899, "epoch": 1497} {"train_loss": -5.97777795791626, "global_step": 62900, "epoch": 1497} {"train_loss": -6.02197790145874, "global_step": 62901, "epoch": 1497} {"train_loss": -5.858783721923828, "global_step": 62902, "epoch": 1497} {"train_loss": -5.937885284423828, "global_step": 62903, "epoch": 1497} {"train_loss": -5.913064479827881, "global_step": 62904, "epoch": 1497} {"train_loss": -5.960620880126953, "global_step": 62905, "epoch": 1497} {"train_loss": -5.836690902709961, "global_step": 62906, "epoch": 1497} {"train_loss": -5.803359508514404, "global_step": 62907, "epoch": 1497} {"train_loss": -5.831464767456055, "global_step": 62908, "epoch": 1497} {"train_loss": -6.004678726196289, "global_step": 62909, "epoch": 1497} {"train_loss": -5.908620834350586, "global_step": 62910, "epoch": 1497} {"train_loss": -5.970305442810059, "global_step": 62911, "epoch": 1497} {"train_loss": -5.931134223937988, "global_step": 62912, "epoch": 1497} {"train_loss": -5.94879150390625, "global_step": 62913, "epoch": 1497} {"train_loss": -5.963328838348389, "global_step": 62914, "epoch": 1497} {"train_loss": -5.930129562105451, "global_step": 62915, "epoch": 1497, "val_loss": 74551.0} {"train_loss": -5.971230506896973, "global_step": 62916, "epoch": 1498} {"train_loss": -5.844419956207275, "global_step": 62917, "epoch": 1498} {"train_loss": -5.876339912414551, "global_step": 62918, "epoch": 1498} {"train_loss": -5.852455139160156, "global_step": 62919, "epoch": 1498} {"train_loss": -5.993525505065918, "global_step": 62920, "epoch": 1498} {"train_loss": -5.833332061767578, "global_step": 62921, "epoch": 1498} {"train_loss": -5.940633773803711, "global_step": 62922, "epoch": 1498} {"train_loss": -5.911614894866943, "global_step": 62923, "epoch": 1498} {"train_loss": -5.740041732788086, "global_step": 62924, "epoch": 1498} {"train_loss": -5.864902496337891, "global_step": 62925, "epoch": 1498} {"train_loss": -5.844463348388672, "global_step": 62926, "epoch": 1498} {"train_loss": -6.049862384796143, "global_step": 62927, "epoch": 1498} {"train_loss": -5.850586414337158, "global_step": 62928, "epoch": 1498} {"train_loss": -5.865069389343262, "global_step": 62929, "epoch": 1498} {"train_loss": -5.848143577575684, "global_step": 62930, "epoch": 1498} {"train_loss": -5.915154457092285, "global_step": 62931, "epoch": 1498} {"train_loss": -5.868781566619873, "global_step": 62932, "epoch": 1498} {"train_loss": -5.9920454025268555, "global_step": 62933, "epoch": 1498} {"train_loss": -6.084934234619141, "global_step": 62934, "epoch": 1498} {"train_loss": -6.056963920593262, "global_step": 62935, "epoch": 1498} {"train_loss": -5.980931282043457, "global_step": 62936, "epoch": 1498} {"train_loss": -5.963104248046875, "global_step": 62937, "epoch": 1498} {"train_loss": -5.930170059204102, "global_step": 62938, "epoch": 1498} {"train_loss": -5.988471031188965, "global_step": 62939, "epoch": 1498} {"train_loss": -6.016866683959961, "global_step": 62940, "epoch": 1498} {"train_loss": -5.946345806121826, "global_step": 62941, "epoch": 1498} {"train_loss": -6.067376613616943, "global_step": 62942, "epoch": 1498} {"train_loss": -6.019545555114746, "global_step": 62943, "epoch": 1498} {"train_loss": -6.01633358001709, "global_step": 62944, "epoch": 1498} {"train_loss": -5.925349235534668, "global_step": 62945, "epoch": 1498} {"train_loss": -5.9999566078186035, "global_step": 62946, "epoch": 1498} {"train_loss": -6.027848243713379, "global_step": 62947, "epoch": 1498} {"train_loss": -5.9341607093811035, "global_step": 62948, "epoch": 1498} {"train_loss": -5.802114486694336, "global_step": 62949, "epoch": 1498} {"train_loss": -5.980288982391357, "global_step": 62950, "epoch": 1498} {"train_loss": -5.941802501678467, "global_step": 62951, "epoch": 1498} {"train_loss": -5.826563835144043, "global_step": 62952, "epoch": 1498} {"train_loss": -5.893306732177734, "global_step": 62953, "epoch": 1498} {"train_loss": -5.791715145111084, "global_step": 62954, "epoch": 1498} {"train_loss": -5.943305969238281, "global_step": 62955, "epoch": 1498} {"train_loss": -5.8029656410217285, "global_step": 62956, "epoch": 1498} {"train_loss": -5.924253815696353, "global_step": 62957, "epoch": 1498, "val_loss": 74369.53125} {"train_loss": -5.891976356506348, "global_step": 62958, "epoch": 1499} {"train_loss": -5.874423980712891, "global_step": 62959, "epoch": 1499} {"train_loss": -5.820816993713379, "global_step": 62960, "epoch": 1499} {"train_loss": -5.9229865074157715, "global_step": 62961, "epoch": 1499} {"train_loss": -5.930948257446289, "global_step": 62962, "epoch": 1499} {"train_loss": -5.902756690979004, "global_step": 62963, "epoch": 1499} {"train_loss": -5.802125930786133, "global_step": 62964, "epoch": 1499} {"train_loss": -5.9911956787109375, "global_step": 62965, "epoch": 1499} {"train_loss": -6.03790807723999, "global_step": 62966, "epoch": 1499} {"train_loss": -6.04384708404541, "global_step": 62967, "epoch": 1499} {"train_loss": -5.980650901794434, "global_step": 62968, "epoch": 1499} {"train_loss": -5.964215278625488, "global_step": 62969, "epoch": 1499} {"train_loss": -5.979499340057373, "global_step": 62970, "epoch": 1499} {"train_loss": -5.89939022064209, "global_step": 62971, "epoch": 1499} {"train_loss": -5.993511199951172, "global_step": 62972, "epoch": 1499} {"train_loss": -5.950244903564453, "global_step": 62973, "epoch": 1499} {"train_loss": -5.987062454223633, "global_step": 62974, "epoch": 1499} {"train_loss": -5.9620256423950195, "global_step": 62975, "epoch": 1499} {"train_loss": -5.983694076538086, "global_step": 62976, "epoch": 1499} {"train_loss": -5.848343849182129, "global_step": 62977, "epoch": 1499} {"train_loss": -5.910659313201904, "global_step": 62978, "epoch": 1499} {"train_loss": -6.007721900939941, "global_step": 62979, "epoch": 1499} {"train_loss": -5.96950626373291, "global_step": 62980, "epoch": 1499} {"train_loss": -5.961554527282715, "global_step": 62981, "epoch": 1499} {"train_loss": -5.961769104003906, "global_step": 62982, "epoch": 1499} {"train_loss": -5.871929168701172, "global_step": 62983, "epoch": 1499} {"train_loss": -5.897736549377441, "global_step": 62984, "epoch": 1499} {"train_loss": -5.879316329956055, "global_step": 62985, "epoch": 1499} {"train_loss": -5.861023902893066, "global_step": 62986, "epoch": 1499} {"train_loss": -5.87841272354126, "global_step": 62987, "epoch": 1499} {"train_loss": -5.903280258178711, "global_step": 62988, "epoch": 1499} {"train_loss": -5.932358741760254, "global_step": 62989, "epoch": 1499} {"train_loss": -6.03131628036499, "global_step": 62990, "epoch": 1499} {"train_loss": -6.103274345397949, "global_step": 62991, "epoch": 1499} {"train_loss": -5.886735916137695, "global_step": 62992, "epoch": 1499} {"train_loss": -5.945984363555908, "global_step": 62993, "epoch": 1499} {"train_loss": -5.896692752838135, "global_step": 62994, "epoch": 1499} {"train_loss": -5.991400718688965, "global_step": 62995, "epoch": 1499} {"train_loss": -5.928014278411865, "global_step": 62996, "epoch": 1499} {"train_loss": -6.034860134124756, "global_step": 62997, "epoch": 1499} {"train_loss": -5.94891357421875, "global_step": 62998, "epoch": 1499} {"train_loss": -5.9403550284249445, "global_step": 62999, "epoch": 1499, "val_loss": 74345.28125} {"train_loss": -5.957636833190918, "global_step": 63000, "epoch": 1500} {"train_loss": -5.861898422241211, "global_step": 63001, "epoch": 1500} {"train_loss": -5.917044162750244, "global_step": 63002, "epoch": 1500} {"train_loss": -5.871356010437012, "global_step": 63003, "epoch": 1500} {"train_loss": -5.983373641967773, "global_step": 63004, "epoch": 1500} {"train_loss": -6.045714378356934, "global_step": 63005, "epoch": 1500} {"train_loss": -5.896642684936523, "global_step": 63006, "epoch": 1500} {"train_loss": -5.942592620849609, "global_step": 63007, "epoch": 1500} {"train_loss": -5.963736534118652, "global_step": 63008, "epoch": 1500} {"train_loss": -5.857561111450195, "global_step": 63009, "epoch": 1500} {"train_loss": -6.083467960357666, "global_step": 63010, "epoch": 1500} {"train_loss": -5.880210876464844, "global_step": 63011, "epoch": 1500} {"train_loss": -5.961826801300049, "global_step": 63012, "epoch": 1500} {"train_loss": -6.034392356872559, "global_step": 63013, "epoch": 1500} {"train_loss": -5.938544273376465, "global_step": 63014, "epoch": 1500} {"train_loss": -5.967167854309082, "global_step": 63015, "epoch": 1500} {"train_loss": -6.067932605743408, "global_step": 63016, "epoch": 1500} {"train_loss": -5.957858085632324, "global_step": 63017, "epoch": 1500} {"train_loss": -5.909696578979492, "global_step": 63018, "epoch": 1500} {"train_loss": -5.893404960632324, "global_step": 63019, "epoch": 1500} {"train_loss": -5.887938499450684, "global_step": 63020, "epoch": 1500} {"train_loss": -5.8735246658325195, "global_step": 63021, "epoch": 1500} {"train_loss": -6.060834884643555, "global_step": 63022, "epoch": 1500} {"train_loss": -5.959195137023926, "global_step": 63023, "epoch": 1500} {"train_loss": -5.9286932945251465, "global_step": 63024, "epoch": 1500} {"train_loss": -5.929283142089844, "global_step": 63025, "epoch": 1500} {"train_loss": -5.888291835784912, "global_step": 63026, "epoch": 1500} {"train_loss": -5.781344890594482, "global_step": 63027, "epoch": 1500} {"train_loss": -5.917093276977539, "global_step": 63028, "epoch": 1500} {"train_loss": -5.918325901031494, "global_step": 63029, "epoch": 1500} {"train_loss": -5.892186164855957, "global_step": 63030, "epoch": 1500} {"train_loss": -5.9119720458984375, "global_step": 63031, "epoch": 1500} {"train_loss": -5.885969638824463, "global_step": 63032, "epoch": 1500} {"train_loss": -5.8365797996521, "global_step": 63033, "epoch": 1500} {"train_loss": -5.977734565734863, "global_step": 63034, "epoch": 1500} {"train_loss": -5.844719886779785, "global_step": 63035, "epoch": 1500} {"train_loss": -5.966917037963867, "global_step": 63036, "epoch": 1500} {"train_loss": -5.915378093719482, "global_step": 63037, "epoch": 1500} {"train_loss": -5.875588417053223, "global_step": 63038, "epoch": 1500} {"train_loss": -5.976971626281738, "global_step": 63039, "epoch": 1500} {"train_loss": -5.681040287017822, "global_step": 63040, "epoch": 1500} {"train_loss": -5.921341975529988, "global_step": 63041, "epoch": 1500, "train/sim_max_reward_0": 0.4264540463651546, "train/sim_max_reward_1": 0.9318714808093649, "train/sim_max_reward_2": 0.23899365440684464, "train/sim_max_reward_3": 0.14642320847442292, "train/sim_max_reward_4": 0.7194360836910154, "train/sim_max_reward_5": 0.9802533713161011, "test/sim_max_reward_4500000": 0.816123120479191, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.5292733272101178, "test/sim_max_reward_4500003": 0.7861088255228136, "test/sim_max_reward_4500004": 0.09507896516152717, "test/sim_max_reward_4500005": 0.3767625669926382, "test/sim_max_reward_4500006": 0.8741905482431482, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.1304227672835033, "test/sim_max_reward_4500009": 0.8817371284738568, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.38586949062921677, "test/sim_max_reward_4500012": 0.8818810040074314, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.7794484689775328, "test/sim_max_reward_4500015": 0.8701645263874527, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.013851256221411014, "test/sim_max_reward_4500018": 0.10106401876146544, "test/sim_max_reward_4500019": 0.9248311324277076, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.655961705390254, "test/sim_max_reward_4500022": 0.7117710788838757, "test/sim_max_reward_4500023": 0.812350568670537, "test/sim_max_reward_4500024": 0.8437664858016797, "test/sim_max_reward_4500025": 1.3100103176495102e-06, "test/sim_max_reward_4500026": 0.7519450552898962, "test/sim_max_reward_4500027": 0.8164122673722776, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.2223223226126051, "test/sim_max_reward_4500030": 0.8771370091810342, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.6878954055514529, "test/sim_max_reward_4500033": 0.3642497275229981, "test/sim_max_reward_4500034": 0.8540636074937754, "test/sim_max_reward_4500035": 0.8127229789275024, "test/sim_max_reward_4500036": 0.3564900571533165, "test/sim_max_reward_4500037": 0.589505279014758, "test/sim_max_reward_4500038": 0.7922127302918635, "test/sim_max_reward_4500039": 0.9573879176179019, "test/sim_max_reward_4500040": 0.9440432533483567, "test/sim_max_reward_4500041": 0.36095682053572176, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.21192157402631748, "test/sim_max_reward_4500044": 0.11107349106109592, "test/sim_max_reward_4500045": 0.5056070798089639, "test/sim_max_reward_4500046": 0.5819191258253152, "test/sim_max_reward_4500047": 0.9250755292770005, "test/sim_max_reward_4500048": 0.9977048323169272, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.573905307510484, "test/mean_score": 0.5083893125143221, "val_loss": 74833.078125} {"train_loss": -5.929045677185059, "global_step": 63042, "epoch": 1501} {"train_loss": -5.929529190063477, "global_step": 63043, "epoch": 1501} {"train_loss": -5.851441383361816, "global_step": 63044, "epoch": 1501} {"train_loss": -5.941837310791016, "global_step": 63045, "epoch": 1501} {"train_loss": -5.998538017272949, "global_step": 63046, "epoch": 1501} {"train_loss": -6.057526111602783, "global_step": 63047, "epoch": 1501} {"train_loss": -6.009302616119385, "global_step": 63048, "epoch": 1501} {"train_loss": -5.903343200683594, "global_step": 63049, "epoch": 1501} {"train_loss": -6.056879997253418, "global_step": 63050, "epoch": 1501} {"train_loss": -5.971860885620117, "global_step": 63051, "epoch": 1501} {"train_loss": -5.947918891906738, "global_step": 63052, "epoch": 1501} {"train_loss": -5.841871738433838, "global_step": 63053, "epoch": 1501} {"train_loss": -5.889407157897949, "global_step": 63054, "epoch": 1501} {"train_loss": -5.9417853355407715, "global_step": 63055, "epoch": 1501} {"train_loss": -5.951530933380127, "global_step": 63056, "epoch": 1501} {"train_loss": -5.9912614822387695, "global_step": 63057, "epoch": 1501} {"train_loss": -5.88521671295166, "global_step": 63058, "epoch": 1501} {"train_loss": -5.8799357414245605, "global_step": 63059, "epoch": 1501} {"train_loss": -5.912360668182373, "global_step": 63060, "epoch": 1501} {"train_loss": -5.827556610107422, "global_step": 63061, "epoch": 1501} {"train_loss": -5.920482158660889, "global_step": 63062, "epoch": 1501} {"train_loss": -5.75961446762085, "global_step": 63063, "epoch": 1501} {"train_loss": -5.858708381652832, "global_step": 63064, "epoch": 1501} {"train_loss": -5.948014259338379, "global_step": 63065, "epoch": 1501} {"train_loss": -5.851468563079834, "global_step": 63066, "epoch": 1501} {"train_loss": -5.85806131362915, "global_step": 63067, "epoch": 1501} {"train_loss": -5.866937637329102, "global_step": 63068, "epoch": 1501} {"train_loss": -5.895957946777344, "global_step": 63069, "epoch": 1501} {"train_loss": -5.952253341674805, "global_step": 63070, "epoch": 1501} {"train_loss": -5.8527984619140625, "global_step": 63071, "epoch": 1501} {"train_loss": -6.031894683837891, "global_step": 63072, "epoch": 1501} {"train_loss": -5.920196533203125, "global_step": 63073, "epoch": 1501} {"train_loss": -5.897758483886719, "global_step": 63074, "epoch": 1501} {"train_loss": -5.975273132324219, "global_step": 63075, "epoch": 1501} {"train_loss": -5.924923896789551, "global_step": 63076, "epoch": 1501} {"train_loss": -6.072771072387695, "global_step": 63077, "epoch": 1501} {"train_loss": -5.760220527648926, "global_step": 63078, "epoch": 1501} {"train_loss": -5.944077491760254, "global_step": 63079, "epoch": 1501} {"train_loss": -5.820221424102783, "global_step": 63080, "epoch": 1501} {"train_loss": -5.921659469604492, "global_step": 63081, "epoch": 1501} {"train_loss": -5.95020866394043, "global_step": 63082, "epoch": 1501} {"train_loss": -5.9179831232343405, "global_step": 63083, "epoch": 1501, "val_loss": 74552.9375} {"train_loss": -5.970707893371582, "global_step": 63084, "epoch": 1502} {"train_loss": -5.832424640655518, "global_step": 63085, "epoch": 1502} {"train_loss": -5.769445896148682, "global_step": 63086, "epoch": 1502} {"train_loss": -5.833339691162109, "global_step": 63087, "epoch": 1502} {"train_loss": -5.902322292327881, "global_step": 63088, "epoch": 1502} {"train_loss": -5.982770919799805, "global_step": 63089, "epoch": 1502} {"train_loss": -5.902512550354004, "global_step": 63090, "epoch": 1502} {"train_loss": -5.862951755523682, "global_step": 63091, "epoch": 1502} {"train_loss": -5.682923316955566, "global_step": 63092, "epoch": 1502} {"train_loss": -5.93967866897583, "global_step": 63093, "epoch": 1502} {"train_loss": -5.906223297119141, "global_step": 63094, "epoch": 1502} {"train_loss": -5.940881729125977, "global_step": 63095, "epoch": 1502} {"train_loss": -5.839102268218994, "global_step": 63096, "epoch": 1502} {"train_loss": -5.993133544921875, "global_step": 63097, "epoch": 1502} {"train_loss": -6.007847785949707, "global_step": 63098, "epoch": 1502} {"train_loss": -5.788527965545654, "global_step": 63099, "epoch": 1502} {"train_loss": -5.98293399810791, "global_step": 63100, "epoch": 1502} {"train_loss": -5.809492588043213, "global_step": 63101, "epoch": 1502} {"train_loss": -5.869978427886963, "global_step": 63102, "epoch": 1502} {"train_loss": -5.959774971008301, "global_step": 63103, "epoch": 1502} {"train_loss": -5.84681510925293, "global_step": 63104, "epoch": 1502} {"train_loss": -5.943883895874023, "global_step": 63105, "epoch": 1502} {"train_loss": -5.879617691040039, "global_step": 63106, "epoch": 1502} {"train_loss": -5.800038814544678, "global_step": 63107, "epoch": 1502} {"train_loss": -5.943839073181152, "global_step": 63108, "epoch": 1502} {"train_loss": -5.885631561279297, "global_step": 63109, "epoch": 1502} {"train_loss": -6.037378311157227, "global_step": 63110, "epoch": 1502} {"train_loss": -5.907323837280273, "global_step": 63111, "epoch": 1502} {"train_loss": -5.930208206176758, "global_step": 63112, "epoch": 1502} {"train_loss": -5.951605796813965, "global_step": 63113, "epoch": 1502} {"train_loss": -5.954297065734863, "global_step": 63114, "epoch": 1502} {"train_loss": -5.894534111022949, "global_step": 63115, "epoch": 1502} {"train_loss": -5.910617828369141, "global_step": 63116, "epoch": 1502} {"train_loss": -5.960634231567383, "global_step": 63117, "epoch": 1502} {"train_loss": -5.880776882171631, "global_step": 63118, "epoch": 1502} {"train_loss": -6.017624855041504, "global_step": 63119, "epoch": 1502} {"train_loss": -5.834012985229492, "global_step": 63120, "epoch": 1502} {"train_loss": -6.042733192443848, "global_step": 63121, "epoch": 1502} {"train_loss": -5.965749740600586, "global_step": 63122, "epoch": 1502} {"train_loss": -5.91318941116333, "global_step": 63123, "epoch": 1502} {"train_loss": -6.009654998779297, "global_step": 63124, "epoch": 1502} {"train_loss": -5.907691978272938, "global_step": 63125, "epoch": 1502, "val_loss": 75014.96875} {"train_loss": -6.003488540649414, "global_step": 63126, "epoch": 1503} {"train_loss": -5.890063285827637, "global_step": 63127, "epoch": 1503} {"train_loss": -5.849526405334473, "global_step": 63128, "epoch": 1503} {"train_loss": -5.988018035888672, "global_step": 63129, "epoch": 1503} {"train_loss": -5.688359260559082, "global_step": 63130, "epoch": 1503} {"train_loss": -5.933016777038574, "global_step": 63131, "epoch": 1503} {"train_loss": -5.921239852905273, "global_step": 63132, "epoch": 1503} {"train_loss": -5.844553470611572, "global_step": 63133, "epoch": 1503} {"train_loss": -5.946651458740234, "global_step": 63134, "epoch": 1503} {"train_loss": -5.910292148590088, "global_step": 63135, "epoch": 1503} {"train_loss": -5.79343318939209, "global_step": 63136, "epoch": 1503} {"train_loss": -5.945832252502441, "global_step": 63137, "epoch": 1503} {"train_loss": -5.785488128662109, "global_step": 63138, "epoch": 1503} {"train_loss": -6.011530876159668, "global_step": 63139, "epoch": 1503} {"train_loss": -5.815025329589844, "global_step": 63140, "epoch": 1503} {"train_loss": -5.943584442138672, "global_step": 63141, "epoch": 1503} {"train_loss": -5.924847602844238, "global_step": 63142, "epoch": 1503} {"train_loss": -5.919642448425293, "global_step": 63143, "epoch": 1503} {"train_loss": -5.932974815368652, "global_step": 63144, "epoch": 1503} {"train_loss": -6.014102458953857, "global_step": 63145, "epoch": 1503} {"train_loss": -5.920835971832275, "global_step": 63146, "epoch": 1503} {"train_loss": -5.971676826477051, "global_step": 63147, "epoch": 1503} {"train_loss": -5.983371257781982, "global_step": 63148, "epoch": 1503} {"train_loss": -5.882228851318359, "global_step": 63149, "epoch": 1503} {"train_loss": -5.847544193267822, "global_step": 63150, "epoch": 1503} {"train_loss": -5.912535667419434, "global_step": 63151, "epoch": 1503} {"train_loss": -6.060177803039551, "global_step": 63152, "epoch": 1503} {"train_loss": -5.856081008911133, "global_step": 63153, "epoch": 1503} {"train_loss": -5.973392486572266, "global_step": 63154, "epoch": 1503} {"train_loss": -5.759599208831787, "global_step": 63155, "epoch": 1503} {"train_loss": -6.011935710906982, "global_step": 63156, "epoch": 1503} {"train_loss": -5.929065704345703, "global_step": 63157, "epoch": 1503} {"train_loss": -5.918595314025879, "global_step": 63158, "epoch": 1503} {"train_loss": -5.946419715881348, "global_step": 63159, "epoch": 1503} {"train_loss": -5.888993263244629, "global_step": 63160, "epoch": 1503} {"train_loss": -5.873924255371094, "global_step": 63161, "epoch": 1503} {"train_loss": -5.889245986938477, "global_step": 63162, "epoch": 1503} {"train_loss": -5.956871032714844, "global_step": 63163, "epoch": 1503} {"train_loss": -5.980558395385742, "global_step": 63164, "epoch": 1503} {"train_loss": -5.93665885925293, "global_step": 63165, "epoch": 1503} {"train_loss": -5.880645751953125, "global_step": 63166, "epoch": 1503} {"train_loss": -5.915875820886521, "global_step": 63167, "epoch": 1503, "val_loss": 74990.015625} {"train_loss": -5.895284652709961, "global_step": 63168, "epoch": 1504} {"train_loss": -5.896472930908203, "global_step": 63169, "epoch": 1504} {"train_loss": -5.956954002380371, "global_step": 63170, "epoch": 1504} {"train_loss": -5.906909942626953, "global_step": 63171, "epoch": 1504} {"train_loss": -6.029559135437012, "global_step": 63172, "epoch": 1504} {"train_loss": -5.843631267547607, "global_step": 63173, "epoch": 1504} {"train_loss": -5.956429481506348, "global_step": 63174, "epoch": 1504} {"train_loss": -5.893162727355957, "global_step": 63175, "epoch": 1504} {"train_loss": -6.102158069610596, "global_step": 63176, "epoch": 1504} {"train_loss": -5.857789993286133, "global_step": 63177, "epoch": 1504} {"train_loss": -5.991855621337891, "global_step": 63178, "epoch": 1504} {"train_loss": -5.887356758117676, "global_step": 63179, "epoch": 1504} {"train_loss": -6.018056869506836, "global_step": 63180, "epoch": 1504} {"train_loss": -5.978370666503906, "global_step": 63181, "epoch": 1504} {"train_loss": -5.920352458953857, "global_step": 63182, "epoch": 1504} {"train_loss": -5.992306709289551, "global_step": 63183, "epoch": 1504} {"train_loss": -6.088265895843506, "global_step": 63184, "epoch": 1504} {"train_loss": -5.933911323547363, "global_step": 63185, "epoch": 1504} {"train_loss": -5.967449188232422, "global_step": 63186, "epoch": 1504} {"train_loss": -5.983000755310059, "global_step": 63187, "epoch": 1504} {"train_loss": -5.924226760864258, "global_step": 63188, "epoch": 1504} {"train_loss": -6.022958755493164, "global_step": 63189, "epoch": 1504} {"train_loss": -5.917067527770996, "global_step": 63190, "epoch": 1504} {"train_loss": -6.092744827270508, "global_step": 63191, "epoch": 1504} {"train_loss": -6.030643463134766, "global_step": 63192, "epoch": 1504} {"train_loss": -5.765036582946777, "global_step": 63193, "epoch": 1504} {"train_loss": -6.0000834465026855, "global_step": 63194, "epoch": 1504} {"train_loss": -5.988965034484863, "global_step": 63195, "epoch": 1504} {"train_loss": -5.885159015655518, "global_step": 63196, "epoch": 1504} {"train_loss": -6.013389587402344, "global_step": 63197, "epoch": 1504} {"train_loss": -5.816368579864502, "global_step": 63198, "epoch": 1504} {"train_loss": -5.8190412521362305, "global_step": 63199, "epoch": 1504} {"train_loss": -6.004964828491211, "global_step": 63200, "epoch": 1504} {"train_loss": -5.728048324584961, "global_step": 63201, "epoch": 1504} {"train_loss": -5.996759414672852, "global_step": 63202, "epoch": 1504} {"train_loss": -5.978534698486328, "global_step": 63203, "epoch": 1504} {"train_loss": -5.964675426483154, "global_step": 63204, "epoch": 1504} {"train_loss": -5.919716835021973, "global_step": 63205, "epoch": 1504} {"train_loss": -5.898460388183594, "global_step": 63206, "epoch": 1504} {"train_loss": -5.942287445068359, "global_step": 63207, "epoch": 1504} {"train_loss": -5.753027439117432, "global_step": 63208, "epoch": 1504} {"train_loss": -5.941105433872768, "global_step": 63209, "epoch": 1504, "val_loss": 74681.4765625} {"train_loss": -5.953835964202881, "global_step": 63210, "epoch": 1505} {"train_loss": -5.920875549316406, "global_step": 63211, "epoch": 1505} {"train_loss": -5.861441612243652, "global_step": 63212, "epoch": 1505} {"train_loss": -5.945218086242676, "global_step": 63213, "epoch": 1505} {"train_loss": -5.94264030456543, "global_step": 63214, "epoch": 1505} {"train_loss": -5.853358745574951, "global_step": 63215, "epoch": 1505} {"train_loss": -5.9276885986328125, "global_step": 63216, "epoch": 1505} {"train_loss": -5.999238014221191, "global_step": 63217, "epoch": 1505} {"train_loss": -5.825728416442871, "global_step": 63218, "epoch": 1505} {"train_loss": -6.024606704711914, "global_step": 63219, "epoch": 1505} {"train_loss": -5.963305473327637, "global_step": 63220, "epoch": 1505} {"train_loss": -5.980801105499268, "global_step": 63221, "epoch": 1505} {"train_loss": -5.853692054748535, "global_step": 63222, "epoch": 1505} {"train_loss": -5.818567276000977, "global_step": 63223, "epoch": 1505} {"train_loss": -5.980380535125732, "global_step": 63224, "epoch": 1505} {"train_loss": -5.973093032836914, "global_step": 63225, "epoch": 1505} {"train_loss": -6.049971103668213, "global_step": 63226, "epoch": 1505} {"train_loss": -5.910240173339844, "global_step": 63227, "epoch": 1505} {"train_loss": -5.960040092468262, "global_step": 63228, "epoch": 1505} {"train_loss": -5.85526180267334, "global_step": 63229, "epoch": 1505} {"train_loss": -5.835354804992676, "global_step": 63230, "epoch": 1505} {"train_loss": -5.916171073913574, "global_step": 63231, "epoch": 1505} {"train_loss": -5.911590099334717, "global_step": 63232, "epoch": 1505} {"train_loss": -5.917387008666992, "global_step": 63233, "epoch": 1505} {"train_loss": -6.018848419189453, "global_step": 63234, "epoch": 1505} {"train_loss": -5.902822017669678, "global_step": 63235, "epoch": 1505} {"train_loss": -6.021210193634033, "global_step": 63236, "epoch": 1505} {"train_loss": -5.8123884201049805, "global_step": 63237, "epoch": 1505} {"train_loss": -5.925772666931152, "global_step": 63238, "epoch": 1505} {"train_loss": -6.017184257507324, "global_step": 63239, "epoch": 1505} {"train_loss": -5.9858598709106445, "global_step": 63240, "epoch": 1505} {"train_loss": -5.855112075805664, "global_step": 63241, "epoch": 1505} {"train_loss": -6.028741836547852, "global_step": 63242, "epoch": 1505} {"train_loss": -5.947566032409668, "global_step": 63243, "epoch": 1505} {"train_loss": -5.8777313232421875, "global_step": 63244, "epoch": 1505} {"train_loss": -5.973907470703125, "global_step": 63245, "epoch": 1505} {"train_loss": -5.863447189331055, "global_step": 63246, "epoch": 1505} {"train_loss": -5.964756011962891, "global_step": 63247, "epoch": 1505} {"train_loss": -5.7664947509765625, "global_step": 63248, "epoch": 1505} {"train_loss": -5.824637413024902, "global_step": 63249, "epoch": 1505} {"train_loss": -5.846499443054199, "global_step": 63250, "epoch": 1505} {"train_loss": -5.922048466546195, "global_step": 63251, "epoch": 1505, "val_loss": 74820.734375} {"train_loss": -5.729646682739258, "global_step": 63252, "epoch": 1506} {"train_loss": -5.955712795257568, "global_step": 63253, "epoch": 1506} {"train_loss": -5.912731647491455, "global_step": 63254, "epoch": 1506} {"train_loss": -5.754822731018066, "global_step": 63255, "epoch": 1506} {"train_loss": -5.979650974273682, "global_step": 63256, "epoch": 1506} {"train_loss": -5.841361045837402, "global_step": 63257, "epoch": 1506} {"train_loss": -5.9430155754089355, "global_step": 63258, "epoch": 1506} {"train_loss": -5.798664093017578, "global_step": 63259, "epoch": 1506} {"train_loss": -5.892612934112549, "global_step": 63260, "epoch": 1506} {"train_loss": -5.811827659606934, "global_step": 63261, "epoch": 1506} {"train_loss": -6.042584419250488, "global_step": 63262, "epoch": 1506} {"train_loss": -5.940244197845459, "global_step": 63263, "epoch": 1506} {"train_loss": -5.851276397705078, "global_step": 63264, "epoch": 1506} {"train_loss": -5.891846179962158, "global_step": 63265, "epoch": 1506} {"train_loss": -5.9525909423828125, "global_step": 63266, "epoch": 1506} {"train_loss": -5.892958164215088, "global_step": 63267, "epoch": 1506} {"train_loss": -5.852921962738037, "global_step": 63268, "epoch": 1506} {"train_loss": -5.9059858322143555, "global_step": 63269, "epoch": 1506} {"train_loss": -5.910675048828125, "global_step": 63270, "epoch": 1506} {"train_loss": -5.830091953277588, "global_step": 63271, "epoch": 1506} {"train_loss": -5.8775858879089355, "global_step": 63272, "epoch": 1506} {"train_loss": -5.961080074310303, "global_step": 63273, "epoch": 1506} {"train_loss": -5.746664047241211, "global_step": 63274, "epoch": 1506} {"train_loss": -6.0326385498046875, "global_step": 63275, "epoch": 1506} {"train_loss": -6.027427673339844, "global_step": 63276, "epoch": 1506} {"train_loss": -5.900287628173828, "global_step": 63277, "epoch": 1506} {"train_loss": -5.9193878173828125, "global_step": 63278, "epoch": 1506} {"train_loss": -5.9532952308654785, "global_step": 63279, "epoch": 1506} {"train_loss": -5.818680763244629, "global_step": 63280, "epoch": 1506} {"train_loss": -6.086483001708984, "global_step": 63281, "epoch": 1506} {"train_loss": -5.940153121948242, "global_step": 63282, "epoch": 1506} {"train_loss": -5.996154308319092, "global_step": 63283, "epoch": 1506} {"train_loss": -6.0738525390625, "global_step": 63284, "epoch": 1506} {"train_loss": -6.01715087890625, "global_step": 63285, "epoch": 1506} {"train_loss": -5.929285049438477, "global_step": 63286, "epoch": 1506} {"train_loss": -5.847998142242432, "global_step": 63287, "epoch": 1506} {"train_loss": -5.9363603591918945, "global_step": 63288, "epoch": 1506} {"train_loss": -5.99809455871582, "global_step": 63289, "epoch": 1506} {"train_loss": -5.966424942016602, "global_step": 63290, "epoch": 1506} {"train_loss": -5.89651346206665, "global_step": 63291, "epoch": 1506} {"train_loss": -5.926143646240234, "global_step": 63292, "epoch": 1506} {"train_loss": -5.916777088528588, "global_step": 63293, "epoch": 1506, "val_loss": 74450.7265625} {"train_loss": -5.890185356140137, "global_step": 63294, "epoch": 1507} {"train_loss": -5.96080207824707, "global_step": 63295, "epoch": 1507} {"train_loss": -5.980579376220703, "global_step": 63296, "epoch": 1507} {"train_loss": -5.852402210235596, "global_step": 63297, "epoch": 1507} {"train_loss": -6.075545310974121, "global_step": 63298, "epoch": 1507} {"train_loss": -5.963515281677246, "global_step": 63299, "epoch": 1507} {"train_loss": -5.981198310852051, "global_step": 63300, "epoch": 1507} {"train_loss": -5.959062099456787, "global_step": 63301, "epoch": 1507} {"train_loss": -6.069445610046387, "global_step": 63302, "epoch": 1507} {"train_loss": -5.907397270202637, "global_step": 63303, "epoch": 1507} {"train_loss": -5.833828926086426, "global_step": 63304, "epoch": 1507} {"train_loss": -5.941875457763672, "global_step": 63305, "epoch": 1507} {"train_loss": -5.856081008911133, "global_step": 63306, "epoch": 1507} {"train_loss": -5.961460113525391, "global_step": 63307, "epoch": 1507} {"train_loss": -5.987616539001465, "global_step": 63308, "epoch": 1507} {"train_loss": -5.866415023803711, "global_step": 63309, "epoch": 1507} {"train_loss": -5.8693108558654785, "global_step": 63310, "epoch": 1507} {"train_loss": -6.000112056732178, "global_step": 63311, "epoch": 1507} {"train_loss": -5.971614837646484, "global_step": 63312, "epoch": 1507} {"train_loss": -5.892334938049316, "global_step": 63313, "epoch": 1507} {"train_loss": -5.813881874084473, "global_step": 63314, "epoch": 1507} {"train_loss": -5.916564464569092, "global_step": 63315, "epoch": 1507} {"train_loss": -5.877520561218262, "global_step": 63316, "epoch": 1507} {"train_loss": -5.935549736022949, "global_step": 63317, "epoch": 1507} {"train_loss": -5.849163055419922, "global_step": 63318, "epoch": 1507} {"train_loss": -5.932736396789551, "global_step": 63319, "epoch": 1507} {"train_loss": -6.068848609924316, "global_step": 63320, "epoch": 1507} {"train_loss": -5.974297523498535, "global_step": 63321, "epoch": 1507} {"train_loss": -5.93745231628418, "global_step": 63322, "epoch": 1507} {"train_loss": -5.987070083618164, "global_step": 63323, "epoch": 1507} {"train_loss": -5.9177141189575195, "global_step": 63324, "epoch": 1507} {"train_loss": -5.860418319702148, "global_step": 63325, "epoch": 1507} {"train_loss": -5.942601203918457, "global_step": 63326, "epoch": 1507} {"train_loss": -5.721085548400879, "global_step": 63327, "epoch": 1507} {"train_loss": -5.89256477355957, "global_step": 63328, "epoch": 1507} {"train_loss": -5.858558654785156, "global_step": 63329, "epoch": 1507} {"train_loss": -5.826986312866211, "global_step": 63330, "epoch": 1507} {"train_loss": -5.836082458496094, "global_step": 63331, "epoch": 1507} {"train_loss": -5.864083290100098, "global_step": 63332, "epoch": 1507} {"train_loss": -5.971512794494629, "global_step": 63333, "epoch": 1507} {"train_loss": -5.832488059997559, "global_step": 63334, "epoch": 1507} {"train_loss": -5.917329481669834, "global_step": 63335, "epoch": 1507, "val_loss": 74896.7734375} {"train_loss": -5.768402099609375, "global_step": 63336, "epoch": 1508} {"train_loss": -5.998516082763672, "global_step": 63337, "epoch": 1508} {"train_loss": -5.822737216949463, "global_step": 63338, "epoch": 1508} {"train_loss": -5.938332557678223, "global_step": 63339, "epoch": 1508} {"train_loss": -5.8984527587890625, "global_step": 63340, "epoch": 1508} {"train_loss": -5.909975051879883, "global_step": 63341, "epoch": 1508} {"train_loss": -5.954951286315918, "global_step": 63342, "epoch": 1508} {"train_loss": -5.883915424346924, "global_step": 63343, "epoch": 1508} {"train_loss": -5.868880271911621, "global_step": 63344, "epoch": 1508} {"train_loss": -5.876280307769775, "global_step": 63345, "epoch": 1508} {"train_loss": -6.007800102233887, "global_step": 63346, "epoch": 1508} {"train_loss": -5.902000427246094, "global_step": 63347, "epoch": 1508} {"train_loss": -5.79271125793457, "global_step": 63348, "epoch": 1508} {"train_loss": -5.8293914794921875, "global_step": 63349, "epoch": 1508} {"train_loss": -6.012526512145996, "global_step": 63350, "epoch": 1508} {"train_loss": -5.837615966796875, "global_step": 63351, "epoch": 1508} {"train_loss": -6.140013694763184, "global_step": 63352, "epoch": 1508} {"train_loss": -5.777859687805176, "global_step": 63353, "epoch": 1508} {"train_loss": -5.971485137939453, "global_step": 63354, "epoch": 1508} {"train_loss": -5.9742431640625, "global_step": 63355, "epoch": 1508} {"train_loss": -5.867218017578125, "global_step": 63356, "epoch": 1508} {"train_loss": -5.979174613952637, "global_step": 63357, "epoch": 1508} {"train_loss": -5.817235946655273, "global_step": 63358, "epoch": 1508} {"train_loss": -5.867735862731934, "global_step": 63359, "epoch": 1508} {"train_loss": -5.847877502441406, "global_step": 63360, "epoch": 1508} {"train_loss": -6.057562351226807, "global_step": 63361, "epoch": 1508} {"train_loss": -6.005373954772949, "global_step": 63362, "epoch": 1508} {"train_loss": -5.986485004425049, "global_step": 63363, "epoch": 1508} {"train_loss": -5.944775581359863, "global_step": 63364, "epoch": 1508} {"train_loss": -5.922918319702148, "global_step": 63365, "epoch": 1508} {"train_loss": -5.942164897918701, "global_step": 63366, "epoch": 1508} {"train_loss": -5.938243865966797, "global_step": 63367, "epoch": 1508} {"train_loss": -5.936891555786133, "global_step": 63368, "epoch": 1508} {"train_loss": -6.006131649017334, "global_step": 63369, "epoch": 1508} {"train_loss": -6.002708435058594, "global_step": 63370, "epoch": 1508} {"train_loss": -5.97968864440918, "global_step": 63371, "epoch": 1508} {"train_loss": -5.94520378112793, "global_step": 63372, "epoch": 1508} {"train_loss": -5.987090110778809, "global_step": 63373, "epoch": 1508} {"train_loss": -5.798671722412109, "global_step": 63374, "epoch": 1508} {"train_loss": -5.981058597564697, "global_step": 63375, "epoch": 1508} {"train_loss": -6.033605098724365, "global_step": 63376, "epoch": 1508} {"train_loss": -5.928551730655489, "global_step": 63377, "epoch": 1508, "val_loss": 74701.53125} {"train_loss": -5.795243263244629, "global_step": 63378, "epoch": 1509} {"train_loss": -6.067352294921875, "global_step": 63379, "epoch": 1509} {"train_loss": -6.042736053466797, "global_step": 63380, "epoch": 1509} {"train_loss": -5.926349639892578, "global_step": 63381, "epoch": 1509} {"train_loss": -6.054209232330322, "global_step": 63382, "epoch": 1509} {"train_loss": -5.925112724304199, "global_step": 63383, "epoch": 1509} {"train_loss": -5.898011207580566, "global_step": 63384, "epoch": 1509} {"train_loss": -6.031441688537598, "global_step": 63385, "epoch": 1509} {"train_loss": -5.9083709716796875, "global_step": 63386, "epoch": 1509} {"train_loss": -5.878173828125, "global_step": 63387, "epoch": 1509} {"train_loss": -5.9603986740112305, "global_step": 63388, "epoch": 1509} {"train_loss": -5.967365264892578, "global_step": 63389, "epoch": 1509} {"train_loss": -5.87959098815918, "global_step": 63390, "epoch": 1509} {"train_loss": -5.913470268249512, "global_step": 63391, "epoch": 1509} {"train_loss": -6.078029632568359, "global_step": 63392, "epoch": 1509} {"train_loss": -6.052960395812988, "global_step": 63393, "epoch": 1509} {"train_loss": -5.980110168457031, "global_step": 63394, "epoch": 1509} {"train_loss": -5.96972131729126, "global_step": 63395, "epoch": 1509} {"train_loss": -5.958606719970703, "global_step": 63396, "epoch": 1509} {"train_loss": -5.768118381500244, "global_step": 63397, "epoch": 1509} {"train_loss": -5.851454734802246, "global_step": 63398, "epoch": 1509} {"train_loss": -5.8162946701049805, "global_step": 63399, "epoch": 1509} {"train_loss": -5.948286056518555, "global_step": 63400, "epoch": 1509} {"train_loss": -5.951308250427246, "global_step": 63401, "epoch": 1509} {"train_loss": -5.887192726135254, "global_step": 63402, "epoch": 1509} {"train_loss": -5.841470718383789, "global_step": 63403, "epoch": 1509} {"train_loss": -5.94504451751709, "global_step": 63404, "epoch": 1509} {"train_loss": -5.871175765991211, "global_step": 63405, "epoch": 1509} {"train_loss": -5.768429756164551, "global_step": 63406, "epoch": 1509} {"train_loss": -5.967796802520752, "global_step": 63407, "epoch": 1509} {"train_loss": -6.052702903747559, "global_step": 63408, "epoch": 1509} {"train_loss": -5.826810359954834, "global_step": 63409, "epoch": 1509} {"train_loss": -5.893164157867432, "global_step": 63410, "epoch": 1509} {"train_loss": -6.027698993682861, "global_step": 63411, "epoch": 1509} {"train_loss": -6.053811550140381, "global_step": 63412, "epoch": 1509} {"train_loss": -6.020505905151367, "global_step": 63413, "epoch": 1509} {"train_loss": -5.9206085205078125, "global_step": 63414, "epoch": 1509} {"train_loss": -5.959495544433594, "global_step": 63415, "epoch": 1509} {"train_loss": -5.997200965881348, "global_step": 63416, "epoch": 1509} {"train_loss": -5.955235958099365, "global_step": 63417, "epoch": 1509} {"train_loss": -6.013016700744629, "global_step": 63418, "epoch": 1509} {"train_loss": -5.943460294178554, "global_step": 63419, "epoch": 1509, "val_loss": 74486.6953125} {"train_loss": -5.885831356048584, "global_step": 63420, "epoch": 1510} {"train_loss": -5.925548553466797, "global_step": 63421, "epoch": 1510} {"train_loss": -6.008679389953613, "global_step": 63422, "epoch": 1510} {"train_loss": -5.889993667602539, "global_step": 63423, "epoch": 1510} {"train_loss": -6.026628494262695, "global_step": 63424, "epoch": 1510} {"train_loss": -5.880385398864746, "global_step": 63425, "epoch": 1510} {"train_loss": -5.910530090332031, "global_step": 63426, "epoch": 1510} {"train_loss": -5.916738510131836, "global_step": 63427, "epoch": 1510} {"train_loss": -5.980796813964844, "global_step": 63428, "epoch": 1510} {"train_loss": -5.938686370849609, "global_step": 63429, "epoch": 1510} {"train_loss": -5.977188587188721, "global_step": 63430, "epoch": 1510} {"train_loss": -6.169064521789551, "global_step": 63431, "epoch": 1510} {"train_loss": -6.0617218017578125, "global_step": 63432, "epoch": 1510} {"train_loss": -6.018187046051025, "global_step": 63433, "epoch": 1510} {"train_loss": -5.977295875549316, "global_step": 63434, "epoch": 1510} {"train_loss": -5.92161750793457, "global_step": 63435, "epoch": 1510} {"train_loss": -5.931994438171387, "global_step": 63436, "epoch": 1510} {"train_loss": -5.892239093780518, "global_step": 63437, "epoch": 1510} {"train_loss": -5.890081405639648, "global_step": 63438, "epoch": 1510} {"train_loss": -5.8938798904418945, "global_step": 63439, "epoch": 1510} {"train_loss": -6.027477264404297, "global_step": 63440, "epoch": 1510} {"train_loss": -5.949488639831543, "global_step": 63441, "epoch": 1510} {"train_loss": -5.939839839935303, "global_step": 63442, "epoch": 1510} {"train_loss": -6.031774997711182, "global_step": 63443, "epoch": 1510} {"train_loss": -5.96975040435791, "global_step": 63444, "epoch": 1510} {"train_loss": -6.004504203796387, "global_step": 63445, "epoch": 1510} {"train_loss": -5.880510330200195, "global_step": 63446, "epoch": 1510} {"train_loss": -5.8859052658081055, "global_step": 63447, "epoch": 1510} {"train_loss": -5.882657527923584, "global_step": 63448, "epoch": 1510} {"train_loss": -6.007155895233154, "global_step": 63449, "epoch": 1510} {"train_loss": -5.9341864585876465, "global_step": 63450, "epoch": 1510} {"train_loss": -5.846722602844238, "global_step": 63451, "epoch": 1510} {"train_loss": -5.887146949768066, "global_step": 63452, "epoch": 1510} {"train_loss": -5.8519182205200195, "global_step": 63453, "epoch": 1510} {"train_loss": -5.980462074279785, "global_step": 63454, "epoch": 1510} {"train_loss": -5.860857009887695, "global_step": 63455, "epoch": 1510} {"train_loss": -5.990571022033691, "global_step": 63456, "epoch": 1510} {"train_loss": -6.073511123657227, "global_step": 63457, "epoch": 1510} {"train_loss": -6.050020217895508, "global_step": 63458, "epoch": 1510} {"train_loss": -5.850819110870361, "global_step": 63459, "epoch": 1510} {"train_loss": -5.948087692260742, "global_step": 63460, "epoch": 1510} {"train_loss": -5.951180072057815, "global_step": 63461, "epoch": 1510, "val_loss": 74120.2578125} {"train_loss": -6.017060279846191, "global_step": 63462, "epoch": 1511} {"train_loss": -6.000341892242432, "global_step": 63463, "epoch": 1511} {"train_loss": -5.962972640991211, "global_step": 63464, "epoch": 1511} {"train_loss": -5.930655479431152, "global_step": 63465, "epoch": 1511} {"train_loss": -6.073185920715332, "global_step": 63466, "epoch": 1511} {"train_loss": -5.947074890136719, "global_step": 63467, "epoch": 1511} {"train_loss": -6.048439979553223, "global_step": 63468, "epoch": 1511} {"train_loss": -5.889728546142578, "global_step": 63469, "epoch": 1511} {"train_loss": -5.909328460693359, "global_step": 63470, "epoch": 1511} {"train_loss": -5.86570405960083, "global_step": 63471, "epoch": 1511} {"train_loss": -5.895657539367676, "global_step": 63472, "epoch": 1511} {"train_loss": -5.915689468383789, "global_step": 63473, "epoch": 1511} {"train_loss": -5.866158485412598, "global_step": 63474, "epoch": 1511} {"train_loss": -5.922247409820557, "global_step": 63475, "epoch": 1511} {"train_loss": -5.83750057220459, "global_step": 63476, "epoch": 1511} {"train_loss": -5.848916053771973, "global_step": 63477, "epoch": 1511} {"train_loss": -6.021036148071289, "global_step": 63478, "epoch": 1511} {"train_loss": -5.764734745025635, "global_step": 63479, "epoch": 1511} {"train_loss": -5.980669021606445, "global_step": 63480, "epoch": 1511} {"train_loss": -5.9653425216674805, "global_step": 63481, "epoch": 1511} {"train_loss": -5.874558448791504, "global_step": 63482, "epoch": 1511} {"train_loss": -5.882794380187988, "global_step": 63483, "epoch": 1511} {"train_loss": -5.916714668273926, "global_step": 63484, "epoch": 1511} {"train_loss": -5.970822334289551, "global_step": 63485, "epoch": 1511} {"train_loss": -5.839966773986816, "global_step": 63486, "epoch": 1511} {"train_loss": -5.928612232208252, "global_step": 63487, "epoch": 1511} {"train_loss": -5.9327592849731445, "global_step": 63488, "epoch": 1511} {"train_loss": -5.768927574157715, "global_step": 63489, "epoch": 1511} {"train_loss": -6.052258491516113, "global_step": 63490, "epoch": 1511} {"train_loss": -5.926795959472656, "global_step": 63491, "epoch": 1511} {"train_loss": -5.939243793487549, "global_step": 63492, "epoch": 1511} {"train_loss": -6.02398157119751, "global_step": 63493, "epoch": 1511} {"train_loss": -5.8291473388671875, "global_step": 63494, "epoch": 1511} {"train_loss": -5.8431291580200195, "global_step": 63495, "epoch": 1511} {"train_loss": -5.930915832519531, "global_step": 63496, "epoch": 1511} {"train_loss": -5.948537349700928, "global_step": 63497, "epoch": 1511} {"train_loss": -6.016323089599609, "global_step": 63498, "epoch": 1511} {"train_loss": -5.982599258422852, "global_step": 63499, "epoch": 1511} {"train_loss": -5.98300313949585, "global_step": 63500, "epoch": 1511} {"train_loss": -5.821476936340332, "global_step": 63501, "epoch": 1511} {"train_loss": -5.941131591796875, "global_step": 63502, "epoch": 1511} {"train_loss": -5.927652790432885, "global_step": 63503, "epoch": 1511, "val_loss": 74741.984375} {"train_loss": -6.012740135192871, "global_step": 63504, "epoch": 1512} {"train_loss": -5.810638427734375, "global_step": 63505, "epoch": 1512} {"train_loss": -5.979923725128174, "global_step": 63506, "epoch": 1512} {"train_loss": -5.962579727172852, "global_step": 63507, "epoch": 1512} {"train_loss": -5.763815402984619, "global_step": 63508, "epoch": 1512} {"train_loss": -5.980690002441406, "global_step": 63509, "epoch": 1512} {"train_loss": -5.918832302093506, "global_step": 63510, "epoch": 1512} {"train_loss": -5.905247688293457, "global_step": 63511, "epoch": 1512} {"train_loss": -5.947630882263184, "global_step": 63512, "epoch": 1512} {"train_loss": -5.964488983154297, "global_step": 63513, "epoch": 1512} {"train_loss": -5.864323616027832, "global_step": 63514, "epoch": 1512} {"train_loss": -5.980125427246094, "global_step": 63515, "epoch": 1512} {"train_loss": -5.908289432525635, "global_step": 63516, "epoch": 1512} {"train_loss": -5.9009809494018555, "global_step": 63517, "epoch": 1512} {"train_loss": -5.961084365844727, "global_step": 63518, "epoch": 1512} {"train_loss": -5.906458854675293, "global_step": 63519, "epoch": 1512} {"train_loss": -5.824878692626953, "global_step": 63520, "epoch": 1512} {"train_loss": -6.0308709144592285, "global_step": 63521, "epoch": 1512} {"train_loss": -5.769672393798828, "global_step": 63522, "epoch": 1512} {"train_loss": -5.970206260681152, "global_step": 63523, "epoch": 1512} {"train_loss": -5.951894760131836, "global_step": 63524, "epoch": 1512} {"train_loss": -5.917719841003418, "global_step": 63525, "epoch": 1512} {"train_loss": -6.035932540893555, "global_step": 63526, "epoch": 1512} {"train_loss": -5.905496597290039, "global_step": 63527, "epoch": 1512} {"train_loss": -6.017136573791504, "global_step": 63528, "epoch": 1512} {"train_loss": -5.862889289855957, "global_step": 63529, "epoch": 1512} {"train_loss": -5.971307754516602, "global_step": 63530, "epoch": 1512} {"train_loss": -6.05622673034668, "global_step": 63531, "epoch": 1512} {"train_loss": -5.956017017364502, "global_step": 63532, "epoch": 1512} {"train_loss": -6.006139755249023, "global_step": 63533, "epoch": 1512} {"train_loss": -5.960646629333496, "global_step": 63534, "epoch": 1512} {"train_loss": -5.972620964050293, "global_step": 63535, "epoch": 1512} {"train_loss": -6.0185747146606445, "global_step": 63536, "epoch": 1512} {"train_loss": -5.935385227203369, "global_step": 63537, "epoch": 1512} {"train_loss": -5.974933624267578, "global_step": 63538, "epoch": 1512} {"train_loss": -6.036318302154541, "global_step": 63539, "epoch": 1512} {"train_loss": -5.959721088409424, "global_step": 63540, "epoch": 1512} {"train_loss": -5.9159040451049805, "global_step": 63541, "epoch": 1512} {"train_loss": -5.978951454162598, "global_step": 63542, "epoch": 1512} {"train_loss": -5.943499565124512, "global_step": 63543, "epoch": 1512} {"train_loss": -5.906100273132324, "global_step": 63544, "epoch": 1512} {"train_loss": -5.943799325398037, "global_step": 63545, "epoch": 1512, "val_loss": 74302.03125} {"train_loss": -5.946697235107422, "global_step": 63546, "epoch": 1513} {"train_loss": -5.995871067047119, "global_step": 63547, "epoch": 1513} {"train_loss": -5.967979431152344, "global_step": 63548, "epoch": 1513} {"train_loss": -6.010651588439941, "global_step": 63549, "epoch": 1513} {"train_loss": -5.9741950035095215, "global_step": 63550, "epoch": 1513} {"train_loss": -5.920626163482666, "global_step": 63551, "epoch": 1513} {"train_loss": -5.924572944641113, "global_step": 63552, "epoch": 1513} {"train_loss": -5.96223783493042, "global_step": 63553, "epoch": 1513} {"train_loss": -6.02498197555542, "global_step": 63554, "epoch": 1513} {"train_loss": -5.896828651428223, "global_step": 63555, "epoch": 1513} {"train_loss": -5.874510765075684, "global_step": 63556, "epoch": 1513} {"train_loss": -5.958034515380859, "global_step": 63557, "epoch": 1513} {"train_loss": -5.925576210021973, "global_step": 63558, "epoch": 1513} {"train_loss": -5.958033561706543, "global_step": 63559, "epoch": 1513} {"train_loss": -5.882575035095215, "global_step": 63560, "epoch": 1513} {"train_loss": -5.98776388168335, "global_step": 63561, "epoch": 1513} {"train_loss": -6.033748626708984, "global_step": 63562, "epoch": 1513} {"train_loss": -5.867184638977051, "global_step": 63563, "epoch": 1513} {"train_loss": -5.963938236236572, "global_step": 63564, "epoch": 1513} {"train_loss": -6.013439655303955, "global_step": 63565, "epoch": 1513} {"train_loss": -5.982540130615234, "global_step": 63566, "epoch": 1513} {"train_loss": -5.972006797790527, "global_step": 63567, "epoch": 1513} {"train_loss": -5.911903381347656, "global_step": 63568, "epoch": 1513} {"train_loss": -5.9500322341918945, "global_step": 63569, "epoch": 1513} {"train_loss": -5.945204734802246, "global_step": 63570, "epoch": 1513} {"train_loss": -5.811991214752197, "global_step": 63571, "epoch": 1513} {"train_loss": -5.872979640960693, "global_step": 63572, "epoch": 1513} {"train_loss": -5.829280853271484, "global_step": 63573, "epoch": 1513} {"train_loss": -5.917993068695068, "global_step": 63574, "epoch": 1513} {"train_loss": -5.848341941833496, "global_step": 63575, "epoch": 1513} {"train_loss": -5.973730564117432, "global_step": 63576, "epoch": 1513} {"train_loss": -5.941073894500732, "global_step": 63577, "epoch": 1513} {"train_loss": -5.92331075668335, "global_step": 63578, "epoch": 1513} {"train_loss": -5.937950134277344, "global_step": 63579, "epoch": 1513} {"train_loss": -5.954482078552246, "global_step": 63580, "epoch": 1513} {"train_loss": -5.97369384765625, "global_step": 63581, "epoch": 1513} {"train_loss": -5.883414268493652, "global_step": 63582, "epoch": 1513} {"train_loss": -5.875391006469727, "global_step": 63583, "epoch": 1513} {"train_loss": -5.972115516662598, "global_step": 63584, "epoch": 1513} {"train_loss": -5.9389190673828125, "global_step": 63585, "epoch": 1513} {"train_loss": -5.953853607177734, "global_step": 63586, "epoch": 1513} {"train_loss": -5.938679354531424, "global_step": 63587, "epoch": 1513, "val_loss": 74316.546875} {"train_loss": -6.010404109954834, "global_step": 63588, "epoch": 1514} {"train_loss": -5.95061731338501, "global_step": 63589, "epoch": 1514} {"train_loss": -5.900026798248291, "global_step": 63590, "epoch": 1514} {"train_loss": -5.871744632720947, "global_step": 63591, "epoch": 1514} {"train_loss": -6.009340286254883, "global_step": 63592, "epoch": 1514} {"train_loss": -6.025113582611084, "global_step": 63593, "epoch": 1514} {"train_loss": -5.971427917480469, "global_step": 63594, "epoch": 1514} {"train_loss": -5.998567581176758, "global_step": 63595, "epoch": 1514} {"train_loss": -5.913946151733398, "global_step": 63596, "epoch": 1514} {"train_loss": -6.051191329956055, "global_step": 63597, "epoch": 1514} {"train_loss": -5.953549861907959, "global_step": 63598, "epoch": 1514} {"train_loss": -5.838457107543945, "global_step": 63599, "epoch": 1514} {"train_loss": -6.007833003997803, "global_step": 63600, "epoch": 1514} {"train_loss": -5.897464752197266, "global_step": 63601, "epoch": 1514} {"train_loss": -5.976629257202148, "global_step": 63602, "epoch": 1514} {"train_loss": -6.0830888748168945, "global_step": 63603, "epoch": 1514} {"train_loss": -5.9647040367126465, "global_step": 63604, "epoch": 1514} {"train_loss": -5.950654983520508, "global_step": 63605, "epoch": 1514} {"train_loss": -5.881394386291504, "global_step": 63606, "epoch": 1514} {"train_loss": -5.880165100097656, "global_step": 63607, "epoch": 1514} {"train_loss": -5.847705841064453, "global_step": 63608, "epoch": 1514} {"train_loss": -5.880903244018555, "global_step": 63609, "epoch": 1514} {"train_loss": -6.005073547363281, "global_step": 63610, "epoch": 1514} {"train_loss": -5.975616455078125, "global_step": 63611, "epoch": 1514} {"train_loss": -6.024441719055176, "global_step": 63612, "epoch": 1514} {"train_loss": -5.972600936889648, "global_step": 63613, "epoch": 1514} {"train_loss": -6.034669399261475, "global_step": 63614, "epoch": 1514} {"train_loss": -6.022350311279297, "global_step": 63615, "epoch": 1514} {"train_loss": -6.07180118560791, "global_step": 63616, "epoch": 1514} {"train_loss": -6.0245184898376465, "global_step": 63617, "epoch": 1514} {"train_loss": -6.0166120529174805, "global_step": 63618, "epoch": 1514} {"train_loss": -5.884746074676514, "global_step": 63619, "epoch": 1514} {"train_loss": -5.832190990447998, "global_step": 63620, "epoch": 1514} {"train_loss": -6.0499067306518555, "global_step": 63621, "epoch": 1514} {"train_loss": -5.899925708770752, "global_step": 63622, "epoch": 1514} {"train_loss": -5.98198127746582, "global_step": 63623, "epoch": 1514} {"train_loss": -5.928557395935059, "global_step": 63624, "epoch": 1514} {"train_loss": -5.929896831512451, "global_step": 63625, "epoch": 1514} {"train_loss": -5.954540252685547, "global_step": 63626, "epoch": 1514} {"train_loss": -5.96990966796875, "global_step": 63627, "epoch": 1514} {"train_loss": -5.965277671813965, "global_step": 63628, "epoch": 1514} {"train_loss": -5.960046836308071, "global_step": 63629, "epoch": 1514, "val_loss": 74553.3359375} {"train_loss": -5.838747978210449, "global_step": 63630, "epoch": 1515} {"train_loss": -5.919013977050781, "global_step": 63631, "epoch": 1515} {"train_loss": -5.9499006271362305, "global_step": 63632, "epoch": 1515} {"train_loss": -5.968595504760742, "global_step": 63633, "epoch": 1515} {"train_loss": -5.899146556854248, "global_step": 63634, "epoch": 1515} {"train_loss": -6.023653030395508, "global_step": 63635, "epoch": 1515} {"train_loss": -5.909943580627441, "global_step": 63636, "epoch": 1515} {"train_loss": -6.096502304077148, "global_step": 63637, "epoch": 1515} {"train_loss": -5.924855709075928, "global_step": 63638, "epoch": 1515} {"train_loss": -5.924628257751465, "global_step": 63639, "epoch": 1515} {"train_loss": -5.931352138519287, "global_step": 63640, "epoch": 1515} {"train_loss": -6.00006103515625, "global_step": 63641, "epoch": 1515} {"train_loss": -5.917616844177246, "global_step": 63642, "epoch": 1515} {"train_loss": -5.971643447875977, "global_step": 63643, "epoch": 1515} {"train_loss": -6.041823387145996, "global_step": 63644, "epoch": 1515} {"train_loss": -5.986083030700684, "global_step": 63645, "epoch": 1515} {"train_loss": -5.976524353027344, "global_step": 63646, "epoch": 1515} {"train_loss": -5.876365661621094, "global_step": 63647, "epoch": 1515} {"train_loss": -5.941844463348389, "global_step": 63648, "epoch": 1515} {"train_loss": -5.900465965270996, "global_step": 63649, "epoch": 1515} {"train_loss": -5.887975692749023, "global_step": 63650, "epoch": 1515} {"train_loss": -5.908139228820801, "global_step": 63651, "epoch": 1515} {"train_loss": -5.94819450378418, "global_step": 63652, "epoch": 1515} {"train_loss": -5.924200057983398, "global_step": 63653, "epoch": 1515} {"train_loss": -5.954838752746582, "global_step": 63654, "epoch": 1515} {"train_loss": -5.790717124938965, "global_step": 63655, "epoch": 1515} {"train_loss": -5.880718231201172, "global_step": 63656, "epoch": 1515} {"train_loss": -5.854101181030273, "global_step": 63657, "epoch": 1515} {"train_loss": -5.941357135772705, "global_step": 63658, "epoch": 1515} {"train_loss": -5.985137462615967, "global_step": 63659, "epoch": 1515} {"train_loss": -5.990816116333008, "global_step": 63660, "epoch": 1515} {"train_loss": -5.98923397064209, "global_step": 63661, "epoch": 1515} {"train_loss": -5.9836931228637695, "global_step": 63662, "epoch": 1515} {"train_loss": -5.992818832397461, "global_step": 63663, "epoch": 1515} {"train_loss": -5.9676833152771, "global_step": 63664, "epoch": 1515} {"train_loss": -6.002175331115723, "global_step": 63665, "epoch": 1515} {"train_loss": -6.016574859619141, "global_step": 63666, "epoch": 1515} {"train_loss": -6.021084785461426, "global_step": 63667, "epoch": 1515} {"train_loss": -5.813681602478027, "global_step": 63668, "epoch": 1515} {"train_loss": -5.934839248657227, "global_step": 63669, "epoch": 1515} {"train_loss": -5.887924671173096, "global_step": 63670, "epoch": 1515} {"train_loss": -5.945494765327091, "global_step": 63671, "epoch": 1515, "val_loss": 74721.0625} {"train_loss": -5.966094970703125, "global_step": 63672, "epoch": 1516} {"train_loss": -6.00404167175293, "global_step": 63673, "epoch": 1516} {"train_loss": -6.011753082275391, "global_step": 63674, "epoch": 1516} {"train_loss": -5.912961959838867, "global_step": 63675, "epoch": 1516} {"train_loss": -5.90192985534668, "global_step": 63676, "epoch": 1516} {"train_loss": -5.951866149902344, "global_step": 63677, "epoch": 1516} {"train_loss": -5.779367923736572, "global_step": 63678, "epoch": 1516} {"train_loss": -5.99298620223999, "global_step": 63679, "epoch": 1516} {"train_loss": -6.018512725830078, "global_step": 63680, "epoch": 1516} {"train_loss": -5.826543807983398, "global_step": 63681, "epoch": 1516} {"train_loss": -5.847916603088379, "global_step": 63682, "epoch": 1516} {"train_loss": -5.951996803283691, "global_step": 63683, "epoch": 1516} {"train_loss": -6.050579071044922, "global_step": 63684, "epoch": 1516} {"train_loss": -5.877986907958984, "global_step": 63685, "epoch": 1516} {"train_loss": -5.953395366668701, "global_step": 63686, "epoch": 1516} {"train_loss": -5.979647636413574, "global_step": 63687, "epoch": 1516} {"train_loss": -6.003016471862793, "global_step": 63688, "epoch": 1516} {"train_loss": -5.952846527099609, "global_step": 63689, "epoch": 1516} {"train_loss": -5.915078163146973, "global_step": 63690, "epoch": 1516} {"train_loss": -6.030013084411621, "global_step": 63691, "epoch": 1516} {"train_loss": -5.948902130126953, "global_step": 63692, "epoch": 1516} {"train_loss": -5.893287658691406, "global_step": 63693, "epoch": 1516} {"train_loss": -5.937278747558594, "global_step": 63694, "epoch": 1516} {"train_loss": -5.968762397766113, "global_step": 63695, "epoch": 1516} {"train_loss": -5.975987911224365, "global_step": 63696, "epoch": 1516} {"train_loss": -5.940792083740234, "global_step": 63697, "epoch": 1516} {"train_loss": -5.86467170715332, "global_step": 63698, "epoch": 1516} {"train_loss": -6.061614036560059, "global_step": 63699, "epoch": 1516} {"train_loss": -5.841064453125, "global_step": 63700, "epoch": 1516} {"train_loss": -5.960089206695557, "global_step": 63701, "epoch": 1516} {"train_loss": -6.0011115074157715, "global_step": 63702, "epoch": 1516} {"train_loss": -5.826663017272949, "global_step": 63703, "epoch": 1516} {"train_loss": -5.905790328979492, "global_step": 63704, "epoch": 1516} {"train_loss": -5.933081150054932, "global_step": 63705, "epoch": 1516} {"train_loss": -5.993829727172852, "global_step": 63706, "epoch": 1516} {"train_loss": -5.839986801147461, "global_step": 63707, "epoch": 1516} {"train_loss": -5.946348667144775, "global_step": 63708, "epoch": 1516} {"train_loss": -5.984475135803223, "global_step": 63709, "epoch": 1516} {"train_loss": -5.946741104125977, "global_step": 63710, "epoch": 1516} {"train_loss": -5.99223518371582, "global_step": 63711, "epoch": 1516} {"train_loss": -5.896506309509277, "global_step": 63712, "epoch": 1516} {"train_loss": -5.942681664512271, "global_step": 63713, "epoch": 1516, "val_loss": 74491.8203125} {"train_loss": -6.102866172790527, "global_step": 63714, "epoch": 1517} {"train_loss": -5.931534767150879, "global_step": 63715, "epoch": 1517} {"train_loss": -5.959456443786621, "global_step": 63716, "epoch": 1517} {"train_loss": -6.015765190124512, "global_step": 63717, "epoch": 1517} {"train_loss": -5.890890121459961, "global_step": 63718, "epoch": 1517} {"train_loss": -6.008115768432617, "global_step": 63719, "epoch": 1517} {"train_loss": -6.0365447998046875, "global_step": 63720, "epoch": 1517} {"train_loss": -5.967709541320801, "global_step": 63721, "epoch": 1517} {"train_loss": -5.913926601409912, "global_step": 63722, "epoch": 1517} {"train_loss": -6.0301008224487305, "global_step": 63723, "epoch": 1517} {"train_loss": -5.92514181137085, "global_step": 63724, "epoch": 1517} {"train_loss": -5.899825572967529, "global_step": 63725, "epoch": 1517} {"train_loss": -5.942577838897705, "global_step": 63726, "epoch": 1517} {"train_loss": -5.908388614654541, "global_step": 63727, "epoch": 1517} {"train_loss": -5.999744415283203, "global_step": 63728, "epoch": 1517} {"train_loss": -5.969210624694824, "global_step": 63729, "epoch": 1517} {"train_loss": -5.984111785888672, "global_step": 63730, "epoch": 1517} {"train_loss": -6.085362434387207, "global_step": 63731, "epoch": 1517} {"train_loss": -5.929990291595459, "global_step": 63732, "epoch": 1517} {"train_loss": -5.991785049438477, "global_step": 63733, "epoch": 1517} {"train_loss": -5.938399791717529, "global_step": 63734, "epoch": 1517} {"train_loss": -6.063061714172363, "global_step": 63735, "epoch": 1517} {"train_loss": -5.970975875854492, "global_step": 63736, "epoch": 1517} {"train_loss": -6.015103340148926, "global_step": 63737, "epoch": 1517} {"train_loss": -5.9616193771362305, "global_step": 63738, "epoch": 1517} {"train_loss": -5.992368698120117, "global_step": 63739, "epoch": 1517} {"train_loss": -6.0704193115234375, "global_step": 63740, "epoch": 1517} {"train_loss": -5.96898078918457, "global_step": 63741, "epoch": 1517} {"train_loss": -5.938255310058594, "global_step": 63742, "epoch": 1517} {"train_loss": -6.029667377471924, "global_step": 63743, "epoch": 1517} {"train_loss": -5.903586387634277, "global_step": 63744, "epoch": 1517} {"train_loss": -5.85334587097168, "global_step": 63745, "epoch": 1517} {"train_loss": -5.985918045043945, "global_step": 63746, "epoch": 1517} {"train_loss": -5.889226913452148, "global_step": 63747, "epoch": 1517} {"train_loss": -5.941844940185547, "global_step": 63748, "epoch": 1517} {"train_loss": -5.895259857177734, "global_step": 63749, "epoch": 1517} {"train_loss": -6.012073516845703, "global_step": 63750, "epoch": 1517} {"train_loss": -5.933510780334473, "global_step": 63751, "epoch": 1517} {"train_loss": -5.866361141204834, "global_step": 63752, "epoch": 1517} {"train_loss": -5.9363813400268555, "global_step": 63753, "epoch": 1517} {"train_loss": -5.937704086303711, "global_step": 63754, "epoch": 1517} {"train_loss": -5.9662009080251055, "global_step": 63755, "epoch": 1517, "val_loss": 74701.7109375} {"train_loss": -5.879977226257324, "global_step": 63756, "epoch": 1518} {"train_loss": -5.867184638977051, "global_step": 63757, "epoch": 1518} {"train_loss": -5.979946136474609, "global_step": 63758, "epoch": 1518} {"train_loss": -5.932795524597168, "global_step": 63759, "epoch": 1518} {"train_loss": -5.880336761474609, "global_step": 63760, "epoch": 1518} {"train_loss": -5.944840431213379, "global_step": 63761, "epoch": 1518} {"train_loss": -5.983672142028809, "global_step": 63762, "epoch": 1518} {"train_loss": -6.033760070800781, "global_step": 63763, "epoch": 1518} {"train_loss": -5.969183444976807, "global_step": 63764, "epoch": 1518} {"train_loss": -5.993773460388184, "global_step": 63765, "epoch": 1518} {"train_loss": -5.831507682800293, "global_step": 63766, "epoch": 1518} {"train_loss": -6.02154541015625, "global_step": 63767, "epoch": 1518} {"train_loss": -6.004533767700195, "global_step": 63768, "epoch": 1518} {"train_loss": -5.934915542602539, "global_step": 63769, "epoch": 1518} {"train_loss": -5.899864673614502, "global_step": 63770, "epoch": 1518} {"train_loss": -5.935444355010986, "global_step": 63771, "epoch": 1518} {"train_loss": -5.8088178634643555, "global_step": 63772, "epoch": 1518} {"train_loss": -5.836709499359131, "global_step": 63773, "epoch": 1518} {"train_loss": -6.046817779541016, "global_step": 63774, "epoch": 1518} {"train_loss": -5.808010101318359, "global_step": 63775, "epoch": 1518} {"train_loss": -6.008393287658691, "global_step": 63776, "epoch": 1518} {"train_loss": -5.822094440460205, "global_step": 63777, "epoch": 1518} {"train_loss": -5.811203479766846, "global_step": 63778, "epoch": 1518} {"train_loss": -5.9599504470825195, "global_step": 63779, "epoch": 1518} {"train_loss": -5.967904090881348, "global_step": 63780, "epoch": 1518} {"train_loss": -6.116890907287598, "global_step": 63781, "epoch": 1518} {"train_loss": -5.949618339538574, "global_step": 63782, "epoch": 1518} {"train_loss": -5.938302516937256, "global_step": 63783, "epoch": 1518} {"train_loss": -6.060636043548584, "global_step": 63784, "epoch": 1518} {"train_loss": -5.929793834686279, "global_step": 63785, "epoch": 1518} {"train_loss": -5.999595642089844, "global_step": 63786, "epoch": 1518} {"train_loss": -5.951920986175537, "global_step": 63787, "epoch": 1518} {"train_loss": -5.852358818054199, "global_step": 63788, "epoch": 1518} {"train_loss": -5.991235733032227, "global_step": 63789, "epoch": 1518} {"train_loss": -5.816338539123535, "global_step": 63790, "epoch": 1518} {"train_loss": -5.954569339752197, "global_step": 63791, "epoch": 1518} {"train_loss": -5.937291145324707, "global_step": 63792, "epoch": 1518} {"train_loss": -5.959939479827881, "global_step": 63793, "epoch": 1518} {"train_loss": -5.779747009277344, "global_step": 63794, "epoch": 1518} {"train_loss": -5.897390842437744, "global_step": 63795, "epoch": 1518} {"train_loss": -5.993513107299805, "global_step": 63796, "epoch": 1518} {"train_loss": -5.934759537378947, "global_step": 63797, "epoch": 1518, "val_loss": 74670.6484375} {"train_loss": -5.955430507659912, "global_step": 63798, "epoch": 1519} {"train_loss": -5.8622331619262695, "global_step": 63799, "epoch": 1519} {"train_loss": -6.004031181335449, "global_step": 63800, "epoch": 1519} {"train_loss": -5.882810592651367, "global_step": 63801, "epoch": 1519} {"train_loss": -5.915838241577148, "global_step": 63802, "epoch": 1519} {"train_loss": -6.027933120727539, "global_step": 63803, "epoch": 1519} {"train_loss": -5.92800235748291, "global_step": 63804, "epoch": 1519} {"train_loss": -5.956916332244873, "global_step": 63805, "epoch": 1519} {"train_loss": -5.920635223388672, "global_step": 63806, "epoch": 1519} {"train_loss": -5.986200332641602, "global_step": 63807, "epoch": 1519} {"train_loss": -5.867194175720215, "global_step": 63808, "epoch": 1519} {"train_loss": -6.059603691101074, "global_step": 63809, "epoch": 1519} {"train_loss": -5.822208881378174, "global_step": 63810, "epoch": 1519} {"train_loss": -6.0185370445251465, "global_step": 63811, "epoch": 1519} {"train_loss": -5.909060478210449, "global_step": 63812, "epoch": 1519} {"train_loss": -6.015697956085205, "global_step": 63813, "epoch": 1519} {"train_loss": -5.85439395904541, "global_step": 63814, "epoch": 1519} {"train_loss": -5.931352615356445, "global_step": 63815, "epoch": 1519} {"train_loss": -6.030627250671387, "global_step": 63816, "epoch": 1519} {"train_loss": -5.8011579513549805, "global_step": 63817, "epoch": 1519} {"train_loss": -5.949472427368164, "global_step": 63818, "epoch": 1519} {"train_loss": -5.806000709533691, "global_step": 63819, "epoch": 1519} {"train_loss": -5.855851650238037, "global_step": 63820, "epoch": 1519} {"train_loss": -5.8697309494018555, "global_step": 63821, "epoch": 1519} {"train_loss": -6.077892303466797, "global_step": 63822, "epoch": 1519} {"train_loss": -5.975661277770996, "global_step": 63823, "epoch": 1519} {"train_loss": -5.8208842277526855, "global_step": 63824, "epoch": 1519} {"train_loss": -5.941404342651367, "global_step": 63825, "epoch": 1519} {"train_loss": -6.005084991455078, "global_step": 63826, "epoch": 1519} {"train_loss": -5.976531028747559, "global_step": 63827, "epoch": 1519} {"train_loss": -5.953484535217285, "global_step": 63828, "epoch": 1519} {"train_loss": -5.884394645690918, "global_step": 63829, "epoch": 1519} {"train_loss": -5.975776672363281, "global_step": 63830, "epoch": 1519} {"train_loss": -5.926020622253418, "global_step": 63831, "epoch": 1519} {"train_loss": -5.965522766113281, "global_step": 63832, "epoch": 1519} {"train_loss": -5.970087051391602, "global_step": 63833, "epoch": 1519} {"train_loss": -5.990542888641357, "global_step": 63834, "epoch": 1519} {"train_loss": -5.952080726623535, "global_step": 63835, "epoch": 1519} {"train_loss": -6.020291328430176, "global_step": 63836, "epoch": 1519} {"train_loss": -5.937071323394775, "global_step": 63837, "epoch": 1519} {"train_loss": -5.9818220138549805, "global_step": 63838, "epoch": 1519} {"train_loss": -5.941012711752029, "global_step": 63839, "epoch": 1519, "val_loss": 74848.734375} {"train_loss": -5.982767105102539, "global_step": 63840, "epoch": 1520} {"train_loss": -5.839432239532471, "global_step": 63841, "epoch": 1520} {"train_loss": -5.828652381896973, "global_step": 63842, "epoch": 1520} {"train_loss": -6.067197799682617, "global_step": 63843, "epoch": 1520} {"train_loss": -6.015623092651367, "global_step": 63844, "epoch": 1520} {"train_loss": -6.006336212158203, "global_step": 63845, "epoch": 1520} {"train_loss": -5.983354568481445, "global_step": 63846, "epoch": 1520} {"train_loss": -5.863724231719971, "global_step": 63847, "epoch": 1520} {"train_loss": -5.916942596435547, "global_step": 63848, "epoch": 1520} {"train_loss": -6.016141414642334, "global_step": 63849, "epoch": 1520} {"train_loss": -5.863677024841309, "global_step": 63850, "epoch": 1520} {"train_loss": -5.82485294342041, "global_step": 63851, "epoch": 1520} {"train_loss": -5.8549017906188965, "global_step": 63852, "epoch": 1520} {"train_loss": -5.880486488342285, "global_step": 63853, "epoch": 1520} {"train_loss": -5.889068126678467, "global_step": 63854, "epoch": 1520} {"train_loss": -5.928060531616211, "global_step": 63855, "epoch": 1520} {"train_loss": -5.7934441566467285, "global_step": 63856, "epoch": 1520} {"train_loss": -5.960524082183838, "global_step": 63857, "epoch": 1520} {"train_loss": -5.938286304473877, "global_step": 63858, "epoch": 1520} {"train_loss": -5.8545074462890625, "global_step": 63859, "epoch": 1520} {"train_loss": -6.032414436340332, "global_step": 63860, "epoch": 1520} {"train_loss": -6.009735107421875, "global_step": 63861, "epoch": 1520} {"train_loss": -5.97641658782959, "global_step": 63862, "epoch": 1520} {"train_loss": -5.898825645446777, "global_step": 63863, "epoch": 1520} {"train_loss": -6.049801826477051, "global_step": 63864, "epoch": 1520} {"train_loss": -6.039628982543945, "global_step": 63865, "epoch": 1520} {"train_loss": -5.906782150268555, "global_step": 63866, "epoch": 1520} {"train_loss": -5.963727951049805, "global_step": 63867, "epoch": 1520} {"train_loss": -5.922388076782227, "global_step": 63868, "epoch": 1520} {"train_loss": -6.012974262237549, "global_step": 63869, "epoch": 1520} {"train_loss": -6.010424613952637, "global_step": 63870, "epoch": 1520} {"train_loss": -5.899016380310059, "global_step": 63871, "epoch": 1520} {"train_loss": -5.916168212890625, "global_step": 63872, "epoch": 1520} {"train_loss": -5.934110641479492, "global_step": 63873, "epoch": 1520} {"train_loss": -5.937897682189941, "global_step": 63874, "epoch": 1520} {"train_loss": -5.911520957946777, "global_step": 63875, "epoch": 1520} {"train_loss": -6.038919448852539, "global_step": 63876, "epoch": 1520} {"train_loss": -5.847314834594727, "global_step": 63877, "epoch": 1520} {"train_loss": -5.968658447265625, "global_step": 63878, "epoch": 1520} {"train_loss": -5.901408672332764, "global_step": 63879, "epoch": 1520} {"train_loss": -5.907431125640869, "global_step": 63880, "epoch": 1520} {"train_loss": -5.937639531635103, "global_step": 63881, "epoch": 1520, "val_loss": 74426.609375} {"train_loss": -6.054009437561035, "global_step": 63882, "epoch": 1521} {"train_loss": -5.953491687774658, "global_step": 63883, "epoch": 1521} {"train_loss": -5.95361328125, "global_step": 63884, "epoch": 1521} {"train_loss": -5.979959487915039, "global_step": 63885, "epoch": 1521} {"train_loss": -5.877532005310059, "global_step": 63886, "epoch": 1521} {"train_loss": -5.92960786819458, "global_step": 63887, "epoch": 1521} {"train_loss": -5.892244815826416, "global_step": 63888, "epoch": 1521} {"train_loss": -5.942980766296387, "global_step": 63889, "epoch": 1521} {"train_loss": -5.927276611328125, "global_step": 63890, "epoch": 1521} {"train_loss": -5.949993133544922, "global_step": 63891, "epoch": 1521} {"train_loss": -5.965179920196533, "global_step": 63892, "epoch": 1521} {"train_loss": -5.8373637199401855, "global_step": 63893, "epoch": 1521} {"train_loss": -5.943670272827148, "global_step": 63894, "epoch": 1521} {"train_loss": -5.92778205871582, "global_step": 63895, "epoch": 1521} {"train_loss": -5.911811828613281, "global_step": 63896, "epoch": 1521} {"train_loss": -5.964058876037598, "global_step": 63897, "epoch": 1521} {"train_loss": -6.026952743530273, "global_step": 63898, "epoch": 1521} {"train_loss": -5.888581275939941, "global_step": 63899, "epoch": 1521} {"train_loss": -6.02883768081665, "global_step": 63900, "epoch": 1521} {"train_loss": -6.036781311035156, "global_step": 63901, "epoch": 1521} {"train_loss": -5.86189079284668, "global_step": 63902, "epoch": 1521} {"train_loss": -6.019092082977295, "global_step": 63903, "epoch": 1521} {"train_loss": -5.834293365478516, "global_step": 63904, "epoch": 1521} {"train_loss": -6.01984977722168, "global_step": 63905, "epoch": 1521} {"train_loss": -5.918511867523193, "global_step": 63906, "epoch": 1521} {"train_loss": -5.926090240478516, "global_step": 63907, "epoch": 1521} {"train_loss": -5.890105724334717, "global_step": 63908, "epoch": 1521} {"train_loss": -5.883301734924316, "global_step": 63909, "epoch": 1521} {"train_loss": -5.9085893630981445, "global_step": 63910, "epoch": 1521} {"train_loss": -5.9821624755859375, "global_step": 63911, "epoch": 1521} {"train_loss": -5.997622013092041, "global_step": 63912, "epoch": 1521} {"train_loss": -5.998053550720215, "global_step": 63913, "epoch": 1521} {"train_loss": -6.034389019012451, "global_step": 63914, "epoch": 1521} {"train_loss": -5.9648237228393555, "global_step": 63915, "epoch": 1521} {"train_loss": -5.91761589050293, "global_step": 63916, "epoch": 1521} {"train_loss": -6.041833877563477, "global_step": 63917, "epoch": 1521} {"train_loss": -6.03978157043457, "global_step": 63918, "epoch": 1521} {"train_loss": -5.98685359954834, "global_step": 63919, "epoch": 1521} {"train_loss": -5.955939769744873, "global_step": 63920, "epoch": 1521} {"train_loss": -6.021655559539795, "global_step": 63921, "epoch": 1521} {"train_loss": -6.082057952880859, "global_step": 63922, "epoch": 1521} {"train_loss": -5.958245674769084, "global_step": 63923, "epoch": 1521, "val_loss": 74728.0390625} {"train_loss": -5.963327407836914, "global_step": 63924, "epoch": 1522} {"train_loss": -6.02105712890625, "global_step": 63925, "epoch": 1522} {"train_loss": -6.117650508880615, "global_step": 63926, "epoch": 1522} {"train_loss": -5.91025447845459, "global_step": 63927, "epoch": 1522} {"train_loss": -5.936894416809082, "global_step": 63928, "epoch": 1522} {"train_loss": -5.968682289123535, "global_step": 63929, "epoch": 1522} {"train_loss": -5.978829383850098, "global_step": 63930, "epoch": 1522} {"train_loss": -5.9967498779296875, "global_step": 63931, "epoch": 1522} {"train_loss": -6.00763463973999, "global_step": 63932, "epoch": 1522} {"train_loss": -5.988865852355957, "global_step": 63933, "epoch": 1522} {"train_loss": -6.057929992675781, "global_step": 63934, "epoch": 1522} {"train_loss": -5.910375595092773, "global_step": 63935, "epoch": 1522} {"train_loss": -5.864750385284424, "global_step": 63936, "epoch": 1522} {"train_loss": -5.888741493225098, "global_step": 63937, "epoch": 1522} {"train_loss": -5.954652786254883, "global_step": 63938, "epoch": 1522} {"train_loss": -5.875284671783447, "global_step": 63939, "epoch": 1522} {"train_loss": -5.927430152893066, "global_step": 63940, "epoch": 1522} {"train_loss": -6.10915470123291, "global_step": 63941, "epoch": 1522} {"train_loss": -5.967341423034668, "global_step": 63942, "epoch": 1522} {"train_loss": -5.935656547546387, "global_step": 63943, "epoch": 1522} {"train_loss": -5.953097343444824, "global_step": 63944, "epoch": 1522} {"train_loss": -6.000170707702637, "global_step": 63945, "epoch": 1522} {"train_loss": -5.850444793701172, "global_step": 63946, "epoch": 1522} {"train_loss": -5.965340614318848, "global_step": 63947, "epoch": 1522} {"train_loss": -5.870345115661621, "global_step": 63948, "epoch": 1522} {"train_loss": -5.749369144439697, "global_step": 63949, "epoch": 1522} {"train_loss": -5.987443447113037, "global_step": 63950, "epoch": 1522} {"train_loss": -5.987549781799316, "global_step": 63951, "epoch": 1522} {"train_loss": -6.090662002563477, "global_step": 63952, "epoch": 1522} {"train_loss": -5.9702653884887695, "global_step": 63953, "epoch": 1522} {"train_loss": -5.9183831214904785, "global_step": 63954, "epoch": 1522} {"train_loss": -5.860102653503418, "global_step": 63955, "epoch": 1522} {"train_loss": -5.921049118041992, "global_step": 63956, "epoch": 1522} {"train_loss": -5.879636764526367, "global_step": 63957, "epoch": 1522} {"train_loss": -5.902684211730957, "global_step": 63958, "epoch": 1522} {"train_loss": -5.832700729370117, "global_step": 63959, "epoch": 1522} {"train_loss": -5.973230361938477, "global_step": 63960, "epoch": 1522} {"train_loss": -5.881338119506836, "global_step": 63961, "epoch": 1522} {"train_loss": -5.872300148010254, "global_step": 63962, "epoch": 1522} {"train_loss": -5.783285140991211, "global_step": 63963, "epoch": 1522} {"train_loss": -6.05505895614624, "global_step": 63964, "epoch": 1522} {"train_loss": -5.941901331856137, "global_step": 63965, "epoch": 1522, "val_loss": 74677.5859375} {"train_loss": -6.10140323638916, "global_step": 63966, "epoch": 1523} {"train_loss": -5.861683368682861, "global_step": 63967, "epoch": 1523} {"train_loss": -5.848570823669434, "global_step": 63968, "epoch": 1523} {"train_loss": -5.968050479888916, "global_step": 63969, "epoch": 1523} {"train_loss": -5.90191125869751, "global_step": 63970, "epoch": 1523} {"train_loss": -5.999847412109375, "global_step": 63971, "epoch": 1523} {"train_loss": -5.902011871337891, "global_step": 63972, "epoch": 1523} {"train_loss": -5.96562385559082, "global_step": 63973, "epoch": 1523} {"train_loss": -6.01142692565918, "global_step": 63974, "epoch": 1523} {"train_loss": -5.975305080413818, "global_step": 63975, "epoch": 1523} {"train_loss": -5.88809061050415, "global_step": 63976, "epoch": 1523} {"train_loss": -5.878807067871094, "global_step": 63977, "epoch": 1523} {"train_loss": -5.947591781616211, "global_step": 63978, "epoch": 1523} {"train_loss": -6.006617546081543, "global_step": 63979, "epoch": 1523} {"train_loss": -5.981060028076172, "global_step": 63980, "epoch": 1523} {"train_loss": -5.968941688537598, "global_step": 63981, "epoch": 1523} {"train_loss": -5.895598411560059, "global_step": 63982, "epoch": 1523} {"train_loss": -5.968090057373047, "global_step": 63983, "epoch": 1523} {"train_loss": -6.023440837860107, "global_step": 63984, "epoch": 1523} {"train_loss": -5.943029403686523, "global_step": 63985, "epoch": 1523} {"train_loss": -6.05399751663208, "global_step": 63986, "epoch": 1523} {"train_loss": -5.898587226867676, "global_step": 63987, "epoch": 1523} {"train_loss": -5.917330265045166, "global_step": 63988, "epoch": 1523} {"train_loss": -5.982409954071045, "global_step": 63989, "epoch": 1523} {"train_loss": -5.854303359985352, "global_step": 63990, "epoch": 1523} {"train_loss": -5.930307388305664, "global_step": 63991, "epoch": 1523} {"train_loss": -5.954287528991699, "global_step": 63992, "epoch": 1523} {"train_loss": -5.96419095993042, "global_step": 63993, "epoch": 1523} {"train_loss": -6.04013729095459, "global_step": 63994, "epoch": 1523} {"train_loss": -5.9411091804504395, "global_step": 63995, "epoch": 1523} {"train_loss": -5.997639179229736, "global_step": 63996, "epoch": 1523} {"train_loss": -5.9105305671691895, "global_step": 63997, "epoch": 1523} {"train_loss": -5.9272894859313965, "global_step": 63998, "epoch": 1523} {"train_loss": -5.902174949645996, "global_step": 63999, "epoch": 1523} {"train_loss": -5.986161231994629, "global_step": 64000, "epoch": 1523} {"train_loss": -5.942215919494629, "global_step": 64001, "epoch": 1523} {"train_loss": -5.914458274841309, "global_step": 64002, "epoch": 1523} {"train_loss": -5.878207683563232, "global_step": 64003, "epoch": 1523} {"train_loss": -5.891914367675781, "global_step": 64004, "epoch": 1523} {"train_loss": -5.9362993240356445, "global_step": 64005, "epoch": 1523} {"train_loss": -5.918999671936035, "global_step": 64006, "epoch": 1523} {"train_loss": -5.944113765444074, "global_step": 64007, "epoch": 1523, "val_loss": 75033.421875} {"train_loss": -5.778083801269531, "global_step": 64008, "epoch": 1524} {"train_loss": -5.80642032623291, "global_step": 64009, "epoch": 1524} {"train_loss": -5.919290542602539, "global_step": 64010, "epoch": 1524} {"train_loss": -5.845061302185059, "global_step": 64011, "epoch": 1524} {"train_loss": -5.962050437927246, "global_step": 64012, "epoch": 1524} {"train_loss": -5.849186897277832, "global_step": 64013, "epoch": 1524} {"train_loss": -5.919661521911621, "global_step": 64014, "epoch": 1524} {"train_loss": -5.85334587097168, "global_step": 64015, "epoch": 1524} {"train_loss": -5.922754287719727, "global_step": 64016, "epoch": 1524} {"train_loss": -5.873337745666504, "global_step": 64017, "epoch": 1524} {"train_loss": -5.898955345153809, "global_step": 64018, "epoch": 1524} {"train_loss": -5.913225173950195, "global_step": 64019, "epoch": 1524} {"train_loss": -5.98740291595459, "global_step": 64020, "epoch": 1524} {"train_loss": -5.96485710144043, "global_step": 64021, "epoch": 1524} {"train_loss": -6.022837162017822, "global_step": 64022, "epoch": 1524} {"train_loss": -6.006163597106934, "global_step": 64023, "epoch": 1524} {"train_loss": -5.922154426574707, "global_step": 64024, "epoch": 1524} {"train_loss": -6.068987846374512, "global_step": 64025, "epoch": 1524} {"train_loss": -5.9290666580200195, "global_step": 64026, "epoch": 1524} {"train_loss": -5.88907527923584, "global_step": 64027, "epoch": 1524} {"train_loss": -6.077438831329346, "global_step": 64028, "epoch": 1524} {"train_loss": -5.969168186187744, "global_step": 64029, "epoch": 1524} {"train_loss": -6.11669397354126, "global_step": 64030, "epoch": 1524} {"train_loss": -6.019844055175781, "global_step": 64031, "epoch": 1524} {"train_loss": -5.9811177253723145, "global_step": 64032, "epoch": 1524} {"train_loss": -5.995357036590576, "global_step": 64033, "epoch": 1524} {"train_loss": -5.964428901672363, "global_step": 64034, "epoch": 1524} {"train_loss": -5.857538223266602, "global_step": 64035, "epoch": 1524} {"train_loss": -6.0270490646362305, "global_step": 64036, "epoch": 1524} {"train_loss": -5.906813621520996, "global_step": 64037, "epoch": 1524} {"train_loss": -5.9899091720581055, "global_step": 64038, "epoch": 1524} {"train_loss": -6.059601783752441, "global_step": 64039, "epoch": 1524} {"train_loss": -5.993821144104004, "global_step": 64040, "epoch": 1524} {"train_loss": -5.8248491287231445, "global_step": 64041, "epoch": 1524} {"train_loss": -5.97122049331665, "global_step": 64042, "epoch": 1524} {"train_loss": -6.013882637023926, "global_step": 64043, "epoch": 1524} {"train_loss": -6.020389556884766, "global_step": 64044, "epoch": 1524} {"train_loss": -5.9423065185546875, "global_step": 64045, "epoch": 1524} {"train_loss": -5.859248161315918, "global_step": 64046, "epoch": 1524} {"train_loss": -5.8802809715271, "global_step": 64047, "epoch": 1524} {"train_loss": -5.929442405700684, "global_step": 64048, "epoch": 1524} {"train_loss": -5.9431401661464145, "global_step": 64049, "epoch": 1524, "val_loss": 74574.9921875} {"train_loss": -6.022958755493164, "global_step": 64050, "epoch": 1525} {"train_loss": -5.88603401184082, "global_step": 64051, "epoch": 1525} {"train_loss": -5.913843154907227, "global_step": 64052, "epoch": 1525} {"train_loss": -5.929238319396973, "global_step": 64053, "epoch": 1525} {"train_loss": -5.91618537902832, "global_step": 64054, "epoch": 1525} {"train_loss": -5.995150566101074, "global_step": 64055, "epoch": 1525} {"train_loss": -5.981788158416748, "global_step": 64056, "epoch": 1525} {"train_loss": -5.900530815124512, "global_step": 64057, "epoch": 1525} {"train_loss": -5.920547962188721, "global_step": 64058, "epoch": 1525} {"train_loss": -5.9268364906311035, "global_step": 64059, "epoch": 1525} {"train_loss": -5.9439239501953125, "global_step": 64060, "epoch": 1525} {"train_loss": -5.935922622680664, "global_step": 64061, "epoch": 1525} {"train_loss": -5.842265605926514, "global_step": 64062, "epoch": 1525} {"train_loss": -6.000422954559326, "global_step": 64063, "epoch": 1525} {"train_loss": -5.8578691482543945, "global_step": 64064, "epoch": 1525} {"train_loss": -5.926824569702148, "global_step": 64065, "epoch": 1525} {"train_loss": -5.959375381469727, "global_step": 64066, "epoch": 1525} {"train_loss": -5.82437801361084, "global_step": 64067, "epoch": 1525} {"train_loss": -5.900064945220947, "global_step": 64068, "epoch": 1525} {"train_loss": -5.897639274597168, "global_step": 64069, "epoch": 1525} {"train_loss": -5.956643104553223, "global_step": 64070, "epoch": 1525} {"train_loss": -5.942005157470703, "global_step": 64071, "epoch": 1525} {"train_loss": -5.854971408843994, "global_step": 64072, "epoch": 1525} {"train_loss": -5.772478103637695, "global_step": 64073, "epoch": 1525} {"train_loss": -5.9816083908081055, "global_step": 64074, "epoch": 1525} {"train_loss": -5.856499195098877, "global_step": 64075, "epoch": 1525} {"train_loss": -5.930048942565918, "global_step": 64076, "epoch": 1525} {"train_loss": -6.027091979980469, "global_step": 64077, "epoch": 1525} {"train_loss": -5.766720771789551, "global_step": 64078, "epoch": 1525} {"train_loss": -5.98371696472168, "global_step": 64079, "epoch": 1525} {"train_loss": -5.858906269073486, "global_step": 64080, "epoch": 1525} {"train_loss": -5.967461585998535, "global_step": 64081, "epoch": 1525} {"train_loss": -5.856584548950195, "global_step": 64082, "epoch": 1525} {"train_loss": -5.845810890197754, "global_step": 64083, "epoch": 1525} {"train_loss": -5.857224464416504, "global_step": 64084, "epoch": 1525} {"train_loss": -5.9333367347717285, "global_step": 64085, "epoch": 1525} {"train_loss": -5.9453043937683105, "global_step": 64086, "epoch": 1525} {"train_loss": -5.942864418029785, "global_step": 64087, "epoch": 1525} {"train_loss": -5.937526702880859, "global_step": 64088, "epoch": 1525} {"train_loss": -6.097682952880859, "global_step": 64089, "epoch": 1525} {"train_loss": -5.892693519592285, "global_step": 64090, "epoch": 1525} {"train_loss": -5.919036842527843, "global_step": 64091, "epoch": 1525, "val_loss": 74640.7578125} {"train_loss": -6.052907466888428, "global_step": 64092, "epoch": 1526} {"train_loss": -5.876036167144775, "global_step": 64093, "epoch": 1526} {"train_loss": -5.931530952453613, "global_step": 64094, "epoch": 1526} {"train_loss": -5.865427494049072, "global_step": 64095, "epoch": 1526} {"train_loss": -5.9186506271362305, "global_step": 64096, "epoch": 1526} {"train_loss": -5.906280517578125, "global_step": 64097, "epoch": 1526} {"train_loss": -5.916781425476074, "global_step": 64098, "epoch": 1526} {"train_loss": -5.800447463989258, "global_step": 64099, "epoch": 1526} {"train_loss": -5.955911636352539, "global_step": 64100, "epoch": 1526} {"train_loss": -5.906572341918945, "global_step": 64101, "epoch": 1526} {"train_loss": -5.929262161254883, "global_step": 64102, "epoch": 1526} {"train_loss": -5.932943344116211, "global_step": 64103, "epoch": 1526} {"train_loss": -6.035101890563965, "global_step": 64104, "epoch": 1526} {"train_loss": -5.966038703918457, "global_step": 64105, "epoch": 1526} {"train_loss": -5.879021167755127, "global_step": 64106, "epoch": 1526} {"train_loss": -5.862706184387207, "global_step": 64107, "epoch": 1526} {"train_loss": -5.999529838562012, "global_step": 64108, "epoch": 1526} {"train_loss": -5.835129261016846, "global_step": 64109, "epoch": 1526} {"train_loss": -5.936842441558838, "global_step": 64110, "epoch": 1526} {"train_loss": -5.988438129425049, "global_step": 64111, "epoch": 1526} {"train_loss": -5.878371238708496, "global_step": 64112, "epoch": 1526} {"train_loss": -5.87886905670166, "global_step": 64113, "epoch": 1526} {"train_loss": -5.923089027404785, "global_step": 64114, "epoch": 1526} {"train_loss": -5.929535865783691, "global_step": 64115, "epoch": 1526} {"train_loss": -5.964962959289551, "global_step": 64116, "epoch": 1526} {"train_loss": -6.058745384216309, "global_step": 64117, "epoch": 1526} {"train_loss": -5.870117664337158, "global_step": 64118, "epoch": 1526} {"train_loss": -5.9703474044799805, "global_step": 64119, "epoch": 1526} {"train_loss": -5.866209983825684, "global_step": 64120, "epoch": 1526} {"train_loss": -6.045757293701172, "global_step": 64121, "epoch": 1526} {"train_loss": -5.883111000061035, "global_step": 64122, "epoch": 1526} {"train_loss": -5.975257396697998, "global_step": 64123, "epoch": 1526} {"train_loss": -5.979933738708496, "global_step": 64124, "epoch": 1526} {"train_loss": -6.085453510284424, "global_step": 64125, "epoch": 1526} {"train_loss": -5.98293924331665, "global_step": 64126, "epoch": 1526} {"train_loss": -5.941608428955078, "global_step": 64127, "epoch": 1526} {"train_loss": -5.944452285766602, "global_step": 64128, "epoch": 1526} {"train_loss": -6.015848159790039, "global_step": 64129, "epoch": 1526} {"train_loss": -5.843231201171875, "global_step": 64130, "epoch": 1526} {"train_loss": -5.934940338134766, "global_step": 64131, "epoch": 1526} {"train_loss": -5.971621990203857, "global_step": 64132, "epoch": 1526} {"train_loss": -5.93697882833935, "global_step": 64133, "epoch": 1526, "val_loss": 74613.328125} {"train_loss": -5.8426103591918945, "global_step": 64134, "epoch": 1527} {"train_loss": -6.037056922912598, "global_step": 64135, "epoch": 1527} {"train_loss": -5.937170505523682, "global_step": 64136, "epoch": 1527} {"train_loss": -5.907910346984863, "global_step": 64137, "epoch": 1527} {"train_loss": -5.80600118637085, "global_step": 64138, "epoch": 1527} {"train_loss": -5.993169784545898, "global_step": 64139, "epoch": 1527} {"train_loss": -5.954208850860596, "global_step": 64140, "epoch": 1527} {"train_loss": -5.857825756072998, "global_step": 64141, "epoch": 1527} {"train_loss": -5.924455642700195, "global_step": 64142, "epoch": 1527} {"train_loss": -5.867053985595703, "global_step": 64143, "epoch": 1527} {"train_loss": -5.952360153198242, "global_step": 64144, "epoch": 1527} {"train_loss": -5.900003910064697, "global_step": 64145, "epoch": 1527} {"train_loss": -6.105265140533447, "global_step": 64146, "epoch": 1527} {"train_loss": -5.953908920288086, "global_step": 64147, "epoch": 1527} {"train_loss": -6.008635520935059, "global_step": 64148, "epoch": 1527} {"train_loss": -5.961833953857422, "global_step": 64149, "epoch": 1527} {"train_loss": -5.9128594398498535, "global_step": 64150, "epoch": 1527} {"train_loss": -5.974299430847168, "global_step": 64151, "epoch": 1527} {"train_loss": -5.965538024902344, "global_step": 64152, "epoch": 1527} {"train_loss": -6.009073257446289, "global_step": 64153, "epoch": 1527} {"train_loss": -5.879275321960449, "global_step": 64154, "epoch": 1527} {"train_loss": -5.985802173614502, "global_step": 64155, "epoch": 1527} {"train_loss": -5.900172233581543, "global_step": 64156, "epoch": 1527} {"train_loss": -6.001675128936768, "global_step": 64157, "epoch": 1527} {"train_loss": -5.903629302978516, "global_step": 64158, "epoch": 1527} {"train_loss": -5.912092208862305, "global_step": 64159, "epoch": 1527} {"train_loss": -5.9485764503479, "global_step": 64160, "epoch": 1527} {"train_loss": -5.949125289916992, "global_step": 64161, "epoch": 1527} {"train_loss": -6.007411956787109, "global_step": 64162, "epoch": 1527} {"train_loss": -5.996683120727539, "global_step": 64163, "epoch": 1527} {"train_loss": -5.913134574890137, "global_step": 64164, "epoch": 1527} {"train_loss": -6.084380626678467, "global_step": 64165, "epoch": 1527} {"train_loss": -5.854049205780029, "global_step": 64166, "epoch": 1527} {"train_loss": -5.9526872634887695, "global_step": 64167, "epoch": 1527} {"train_loss": -6.021766662597656, "global_step": 64168, "epoch": 1527} {"train_loss": -5.841224193572998, "global_step": 64169, "epoch": 1527} {"train_loss": -5.974424362182617, "global_step": 64170, "epoch": 1527} {"train_loss": -5.848796844482422, "global_step": 64171, "epoch": 1527} {"train_loss": -5.860099792480469, "global_step": 64172, "epoch": 1527} {"train_loss": -5.947774887084961, "global_step": 64173, "epoch": 1527} {"train_loss": -5.84999942779541, "global_step": 64174, "epoch": 1527} {"train_loss": -5.935480481102353, "global_step": 64175, "epoch": 1527, "val_loss": 74499.0234375} {"train_loss": -5.839912414550781, "global_step": 64176, "epoch": 1528} {"train_loss": -5.9378981590271, "global_step": 64177, "epoch": 1528} {"train_loss": -5.903450012207031, "global_step": 64178, "epoch": 1528} {"train_loss": -5.976175308227539, "global_step": 64179, "epoch": 1528} {"train_loss": -6.0579423904418945, "global_step": 64180, "epoch": 1528} {"train_loss": -5.910582542419434, "global_step": 64181, "epoch": 1528} {"train_loss": -5.823078155517578, "global_step": 64182, "epoch": 1528} {"train_loss": -5.933218479156494, "global_step": 64183, "epoch": 1528} {"train_loss": -5.832376480102539, "global_step": 64184, "epoch": 1528} {"train_loss": -5.886737823486328, "global_step": 64185, "epoch": 1528} {"train_loss": -5.830924987792969, "global_step": 64186, "epoch": 1528} {"train_loss": -6.100551605224609, "global_step": 64187, "epoch": 1528} {"train_loss": -5.872490882873535, "global_step": 64188, "epoch": 1528} {"train_loss": -5.9480133056640625, "global_step": 64189, "epoch": 1528} {"train_loss": -5.959144592285156, "global_step": 64190, "epoch": 1528} {"train_loss": -5.916866779327393, "global_step": 64191, "epoch": 1528} {"train_loss": -5.996782302856445, "global_step": 64192, "epoch": 1528} {"train_loss": -6.005642890930176, "global_step": 64193, "epoch": 1528} {"train_loss": -5.895167350769043, "global_step": 64194, "epoch": 1528} {"train_loss": -5.813146591186523, "global_step": 64195, "epoch": 1528} {"train_loss": -5.988750457763672, "global_step": 64196, "epoch": 1528} {"train_loss": -5.955887794494629, "global_step": 64197, "epoch": 1528} {"train_loss": -5.885463714599609, "global_step": 64198, "epoch": 1528} {"train_loss": -5.903339862823486, "global_step": 64199, "epoch": 1528} {"train_loss": -5.88935661315918, "global_step": 64200, "epoch": 1528} {"train_loss": -5.912535667419434, "global_step": 64201, "epoch": 1528} {"train_loss": -6.022838592529297, "global_step": 64202, "epoch": 1528} {"train_loss": -6.012388229370117, "global_step": 64203, "epoch": 1528} {"train_loss": -5.9288434982299805, "global_step": 64204, "epoch": 1528} {"train_loss": -5.922379493713379, "global_step": 64205, "epoch": 1528} {"train_loss": -5.921648979187012, "global_step": 64206, "epoch": 1528} {"train_loss": -5.970259189605713, "global_step": 64207, "epoch": 1528} {"train_loss": -6.088202476501465, "global_step": 64208, "epoch": 1528} {"train_loss": -5.915215015411377, "global_step": 64209, "epoch": 1528} {"train_loss": -5.926568031311035, "global_step": 64210, "epoch": 1528} {"train_loss": -5.931881904602051, "global_step": 64211, "epoch": 1528} {"train_loss": -5.903341770172119, "global_step": 64212, "epoch": 1528} {"train_loss": -5.97373104095459, "global_step": 64213, "epoch": 1528} {"train_loss": -5.969060897827148, "global_step": 64214, "epoch": 1528} {"train_loss": -5.893847942352295, "global_step": 64215, "epoch": 1528} {"train_loss": -5.976509094238281, "global_step": 64216, "epoch": 1528} {"train_loss": -5.930441572552636, "global_step": 64217, "epoch": 1528, "val_loss": 74965.6875} {"train_loss": -5.962836742401123, "global_step": 64218, "epoch": 1529} {"train_loss": -5.9725341796875, "global_step": 64219, "epoch": 1529} {"train_loss": -5.923394203186035, "global_step": 64220, "epoch": 1529} {"train_loss": -5.960925102233887, "global_step": 64221, "epoch": 1529} {"train_loss": -5.998628616333008, "global_step": 64222, "epoch": 1529} {"train_loss": -5.964775562286377, "global_step": 64223, "epoch": 1529} {"train_loss": -5.9573073387146, "global_step": 64224, "epoch": 1529} {"train_loss": -6.0613813400268555, "global_step": 64225, "epoch": 1529} {"train_loss": -5.943041801452637, "global_step": 64226, "epoch": 1529} {"train_loss": -6.0422821044921875, "global_step": 64227, "epoch": 1529} {"train_loss": -5.849090576171875, "global_step": 64228, "epoch": 1529} {"train_loss": -5.861930847167969, "global_step": 64229, "epoch": 1529} {"train_loss": -5.945318222045898, "global_step": 64230, "epoch": 1529} {"train_loss": -5.921355247497559, "global_step": 64231, "epoch": 1529} {"train_loss": -5.934763431549072, "global_step": 64232, "epoch": 1529} {"train_loss": -6.037261009216309, "global_step": 64233, "epoch": 1529} {"train_loss": -5.904388904571533, "global_step": 64234, "epoch": 1529} {"train_loss": -5.875371932983398, "global_step": 64235, "epoch": 1529} {"train_loss": -5.895549774169922, "global_step": 64236, "epoch": 1529} {"train_loss": -5.9247236251831055, "global_step": 64237, "epoch": 1529} {"train_loss": -5.868587493896484, "global_step": 64238, "epoch": 1529} {"train_loss": -5.9358978271484375, "global_step": 64239, "epoch": 1529} {"train_loss": -5.866459846496582, "global_step": 64240, "epoch": 1529} {"train_loss": -5.931512832641602, "global_step": 64241, "epoch": 1529} {"train_loss": -5.891127109527588, "global_step": 64242, "epoch": 1529} {"train_loss": -5.74747896194458, "global_step": 64243, "epoch": 1529} {"train_loss": -5.918572425842285, "global_step": 64244, "epoch": 1529} {"train_loss": -5.845744609832764, "global_step": 64245, "epoch": 1529} {"train_loss": -5.863737106323242, "global_step": 64246, "epoch": 1529} {"train_loss": -5.83842134475708, "global_step": 64247, "epoch": 1529} {"train_loss": -5.94651985168457, "global_step": 64248, "epoch": 1529} {"train_loss": -6.038059234619141, "global_step": 64249, "epoch": 1529} {"train_loss": -5.903800964355469, "global_step": 64250, "epoch": 1529} {"train_loss": -5.912147045135498, "global_step": 64251, "epoch": 1529} {"train_loss": -5.888182163238525, "global_step": 64252, "epoch": 1529} {"train_loss": -6.038609981536865, "global_step": 64253, "epoch": 1529} {"train_loss": -5.964409828186035, "global_step": 64254, "epoch": 1529} {"train_loss": -5.932457447052002, "global_step": 64255, "epoch": 1529} {"train_loss": -6.171049118041992, "global_step": 64256, "epoch": 1529} {"train_loss": -5.85638427734375, "global_step": 64257, "epoch": 1529} {"train_loss": -5.887973308563232, "global_step": 64258, "epoch": 1529} {"train_loss": -5.932234854925246, "global_step": 64259, "epoch": 1529, "val_loss": 74600.8671875} {"train_loss": -5.8721466064453125, "global_step": 64260, "epoch": 1530} {"train_loss": -5.968890190124512, "global_step": 64261, "epoch": 1530} {"train_loss": -6.002622604370117, "global_step": 64262, "epoch": 1530} {"train_loss": -5.962165355682373, "global_step": 64263, "epoch": 1530} {"train_loss": -5.918205261230469, "global_step": 64264, "epoch": 1530} {"train_loss": -5.859646797180176, "global_step": 64265, "epoch": 1530} {"train_loss": -5.87619161605835, "global_step": 64266, "epoch": 1530} {"train_loss": -5.985806941986084, "global_step": 64267, "epoch": 1530} {"train_loss": -5.9924798011779785, "global_step": 64268, "epoch": 1530} {"train_loss": -5.988201141357422, "global_step": 64269, "epoch": 1530} {"train_loss": -6.057634353637695, "global_step": 64270, "epoch": 1530} {"train_loss": -5.85841178894043, "global_step": 64271, "epoch": 1530} {"train_loss": -5.894754409790039, "global_step": 64272, "epoch": 1530} {"train_loss": -6.002197265625, "global_step": 64273, "epoch": 1530} {"train_loss": -5.924535751342773, "global_step": 64274, "epoch": 1530} {"train_loss": -5.912614822387695, "global_step": 64275, "epoch": 1530} {"train_loss": -5.952954292297363, "global_step": 64276, "epoch": 1530} {"train_loss": -5.883333206176758, "global_step": 64277, "epoch": 1530} {"train_loss": -6.004138469696045, "global_step": 64278, "epoch": 1530} {"train_loss": -5.828465461730957, "global_step": 64279, "epoch": 1530} {"train_loss": -6.102854251861572, "global_step": 64280, "epoch": 1530} {"train_loss": -6.013635635375977, "global_step": 64281, "epoch": 1530} {"train_loss": -6.0154900550842285, "global_step": 64282, "epoch": 1530} {"train_loss": -5.930850982666016, "global_step": 64283, "epoch": 1530} {"train_loss": -5.765627861022949, "global_step": 64284, "epoch": 1530} {"train_loss": -5.866320610046387, "global_step": 64285, "epoch": 1530} {"train_loss": -5.994847774505615, "global_step": 64286, "epoch": 1530} {"train_loss": -6.027290344238281, "global_step": 64287, "epoch": 1530} {"train_loss": -5.908239364624023, "global_step": 64288, "epoch": 1530} {"train_loss": -5.961522102355957, "global_step": 64289, "epoch": 1530} {"train_loss": -5.708253383636475, "global_step": 64290, "epoch": 1530} {"train_loss": -5.775576591491699, "global_step": 64291, "epoch": 1530} {"train_loss": -5.958986759185791, "global_step": 64292, "epoch": 1530} {"train_loss": -5.852315425872803, "global_step": 64293, "epoch": 1530} {"train_loss": -5.958278656005859, "global_step": 64294, "epoch": 1530} {"train_loss": -5.984552383422852, "global_step": 64295, "epoch": 1530} {"train_loss": -5.916285514831543, "global_step": 64296, "epoch": 1530} {"train_loss": -5.969629287719727, "global_step": 64297, "epoch": 1530} {"train_loss": -5.914351463317871, "global_step": 64298, "epoch": 1530} {"train_loss": -5.853855133056641, "global_step": 64299, "epoch": 1530} {"train_loss": -6.063851833343506, "global_step": 64300, "epoch": 1530} {"train_loss": -5.933833383378529, "global_step": 64301, "epoch": 1530, "val_loss": 74557.21875} {"train_loss": -5.82960844039917, "global_step": 64302, "epoch": 1531} {"train_loss": -5.8932695388793945, "global_step": 64303, "epoch": 1531} {"train_loss": -5.98569917678833, "global_step": 64304, "epoch": 1531} {"train_loss": -5.922208786010742, "global_step": 64305, "epoch": 1531} {"train_loss": -5.865551948547363, "global_step": 64306, "epoch": 1531} {"train_loss": -6.054327964782715, "global_step": 64307, "epoch": 1531} {"train_loss": -5.762903213500977, "global_step": 64308, "epoch": 1531} {"train_loss": -6.0426740646362305, "global_step": 64309, "epoch": 1531} {"train_loss": -5.942395210266113, "global_step": 64310, "epoch": 1531} {"train_loss": -5.850354194641113, "global_step": 64311, "epoch": 1531} {"train_loss": -5.878253936767578, "global_step": 64312, "epoch": 1531} {"train_loss": -5.87282133102417, "global_step": 64313, "epoch": 1531} {"train_loss": -6.025759220123291, "global_step": 64314, "epoch": 1531} {"train_loss": -5.951564311981201, "global_step": 64315, "epoch": 1531} {"train_loss": -5.872746467590332, "global_step": 64316, "epoch": 1531} {"train_loss": -5.95544958114624, "global_step": 64317, "epoch": 1531} {"train_loss": -5.997060775756836, "global_step": 64318, "epoch": 1531} {"train_loss": -6.005133628845215, "global_step": 64319, "epoch": 1531} {"train_loss": -6.020810127258301, "global_step": 64320, "epoch": 1531} {"train_loss": -5.956361770629883, "global_step": 64321, "epoch": 1531} {"train_loss": -5.870710849761963, "global_step": 64322, "epoch": 1531} {"train_loss": -5.917707920074463, "global_step": 64323, "epoch": 1531} {"train_loss": -5.9282121658325195, "global_step": 64324, "epoch": 1531} {"train_loss": -6.029852867126465, "global_step": 64325, "epoch": 1531} {"train_loss": -6.050053596496582, "global_step": 64326, "epoch": 1531} {"train_loss": -6.020606994628906, "global_step": 64327, "epoch": 1531} {"train_loss": -5.985710144042969, "global_step": 64328, "epoch": 1531} {"train_loss": -6.045453071594238, "global_step": 64329, "epoch": 1531} {"train_loss": -6.008163928985596, "global_step": 64330, "epoch": 1531} {"train_loss": -5.965226650238037, "global_step": 64331, "epoch": 1531} {"train_loss": -6.026190757751465, "global_step": 64332, "epoch": 1531} {"train_loss": -5.921344757080078, "global_step": 64333, "epoch": 1531} {"train_loss": -6.067686557769775, "global_step": 64334, "epoch": 1531} {"train_loss": -5.999502658843994, "global_step": 64335, "epoch": 1531} {"train_loss": -5.885740280151367, "global_step": 64336, "epoch": 1531} {"train_loss": -5.987674713134766, "global_step": 64337, "epoch": 1531} {"train_loss": -6.071621894836426, "global_step": 64338, "epoch": 1531} {"train_loss": -5.963421821594238, "global_step": 64339, "epoch": 1531} {"train_loss": -5.932613372802734, "global_step": 64340, "epoch": 1531} {"train_loss": -6.01762580871582, "global_step": 64341, "epoch": 1531} {"train_loss": -5.935866832733154, "global_step": 64342, "epoch": 1531} {"train_loss": -5.960072540101551, "global_step": 64343, "epoch": 1531, "val_loss": 74573.96875} {"train_loss": -6.013622283935547, "global_step": 64344, "epoch": 1532} {"train_loss": -5.9844207763671875, "global_step": 64345, "epoch": 1532} {"train_loss": -5.982756614685059, "global_step": 64346, "epoch": 1532} {"train_loss": -5.9982781410217285, "global_step": 64347, "epoch": 1532} {"train_loss": -5.982307434082031, "global_step": 64348, "epoch": 1532} {"train_loss": -5.986756324768066, "global_step": 64349, "epoch": 1532} {"train_loss": -5.895483493804932, "global_step": 64350, "epoch": 1532} {"train_loss": -5.982266902923584, "global_step": 64351, "epoch": 1532} {"train_loss": -6.032759666442871, "global_step": 64352, "epoch": 1532} {"train_loss": -5.913006782531738, "global_step": 64353, "epoch": 1532} {"train_loss": -5.895163536071777, "global_step": 64354, "epoch": 1532} {"train_loss": -5.937239170074463, "global_step": 64355, "epoch": 1532} {"train_loss": -5.906432151794434, "global_step": 64356, "epoch": 1532} {"train_loss": -5.939760684967041, "global_step": 64357, "epoch": 1532} {"train_loss": -5.9814133644104, "global_step": 64358, "epoch": 1532} {"train_loss": -5.816376209259033, "global_step": 64359, "epoch": 1532} {"train_loss": -5.990884780883789, "global_step": 64360, "epoch": 1532} {"train_loss": -5.930111885070801, "global_step": 64361, "epoch": 1532} {"train_loss": -5.888866424560547, "global_step": 64362, "epoch": 1532} {"train_loss": -5.991691589355469, "global_step": 64363, "epoch": 1532} {"train_loss": -5.889397144317627, "global_step": 64364, "epoch": 1532} {"train_loss": -5.912389278411865, "global_step": 64365, "epoch": 1532} {"train_loss": -5.912335395812988, "global_step": 64366, "epoch": 1532} {"train_loss": -5.965287208557129, "global_step": 64367, "epoch": 1532} {"train_loss": -6.07443904876709, "global_step": 64368, "epoch": 1532} {"train_loss": -6.003237724304199, "global_step": 64369, "epoch": 1532} {"train_loss": -5.922421455383301, "global_step": 64370, "epoch": 1532} {"train_loss": -6.013094902038574, "global_step": 64371, "epoch": 1532} {"train_loss": -5.846405029296875, "global_step": 64372, "epoch": 1532} {"train_loss": -5.927937030792236, "global_step": 64373, "epoch": 1532} {"train_loss": -5.8793487548828125, "global_step": 64374, "epoch": 1532} {"train_loss": -5.898092269897461, "global_step": 64375, "epoch": 1532} {"train_loss": -6.0043625831604, "global_step": 64376, "epoch": 1532} {"train_loss": -5.918087005615234, "global_step": 64377, "epoch": 1532} {"train_loss": -6.059203624725342, "global_step": 64378, "epoch": 1532} {"train_loss": -5.944095611572266, "global_step": 64379, "epoch": 1532} {"train_loss": -5.887959003448486, "global_step": 64380, "epoch": 1532} {"train_loss": -6.007652282714844, "global_step": 64381, "epoch": 1532} {"train_loss": -5.9225921630859375, "global_step": 64382, "epoch": 1532} {"train_loss": -5.978245735168457, "global_step": 64383, "epoch": 1532} {"train_loss": -5.954624176025391, "global_step": 64384, "epoch": 1532} {"train_loss": -5.952742917197091, "global_step": 64385, "epoch": 1532, "val_loss": 74859.2578125} {"train_loss": -6.017620086669922, "global_step": 64386, "epoch": 1533} {"train_loss": -6.021021842956543, "global_step": 64387, "epoch": 1533} {"train_loss": -5.99725866317749, "global_step": 64388, "epoch": 1533} {"train_loss": -6.032986640930176, "global_step": 64389, "epoch": 1533} {"train_loss": -5.916057586669922, "global_step": 64390, "epoch": 1533} {"train_loss": -5.965616703033447, "global_step": 64391, "epoch": 1533} {"train_loss": -6.055206298828125, "global_step": 64392, "epoch": 1533} {"train_loss": -5.869701862335205, "global_step": 64393, "epoch": 1533} {"train_loss": -6.013336658477783, "global_step": 64394, "epoch": 1533} {"train_loss": -5.969388961791992, "global_step": 64395, "epoch": 1533} {"train_loss": -6.0083909034729, "global_step": 64396, "epoch": 1533} {"train_loss": -6.053086280822754, "global_step": 64397, "epoch": 1533} {"train_loss": -5.890345573425293, "global_step": 64398, "epoch": 1533} {"train_loss": -6.017536640167236, "global_step": 64399, "epoch": 1533} {"train_loss": -6.062704086303711, "global_step": 64400, "epoch": 1533} {"train_loss": -5.933592319488525, "global_step": 64401, "epoch": 1533} {"train_loss": -5.895883560180664, "global_step": 64402, "epoch": 1533} {"train_loss": -5.921326637268066, "global_step": 64403, "epoch": 1533} {"train_loss": -5.971080780029297, "global_step": 64404, "epoch": 1533} {"train_loss": -5.903326034545898, "global_step": 64405, "epoch": 1533} {"train_loss": -6.042468547821045, "global_step": 64406, "epoch": 1533} {"train_loss": -5.982460021972656, "global_step": 64407, "epoch": 1533} {"train_loss": -6.041513442993164, "global_step": 64408, "epoch": 1533} {"train_loss": -6.016371726989746, "global_step": 64409, "epoch": 1533} {"train_loss": -5.931723594665527, "global_step": 64410, "epoch": 1533} {"train_loss": -5.877472400665283, "global_step": 64411, "epoch": 1533} {"train_loss": -5.893862724304199, "global_step": 64412, "epoch": 1533} {"train_loss": -5.86444091796875, "global_step": 64413, "epoch": 1533} {"train_loss": -5.963886260986328, "global_step": 64414, "epoch": 1533} {"train_loss": -5.929671764373779, "global_step": 64415, "epoch": 1533} {"train_loss": -6.027254104614258, "global_step": 64416, "epoch": 1533} {"train_loss": -6.017468452453613, "global_step": 64417, "epoch": 1533} {"train_loss": -6.02799129486084, "global_step": 64418, "epoch": 1533} {"train_loss": -6.007484436035156, "global_step": 64419, "epoch": 1533} {"train_loss": -5.874702453613281, "global_step": 64420, "epoch": 1533} {"train_loss": -5.985033988952637, "global_step": 64421, "epoch": 1533} {"train_loss": -5.915044784545898, "global_step": 64422, "epoch": 1533} {"train_loss": -5.9689249992370605, "global_step": 64423, "epoch": 1533} {"train_loss": -5.851564407348633, "global_step": 64424, "epoch": 1533} {"train_loss": -6.025239944458008, "global_step": 64425, "epoch": 1533} {"train_loss": -5.977962493896484, "global_step": 64426, "epoch": 1533} {"train_loss": -5.970358269555228, "global_step": 64427, "epoch": 1533, "val_loss": 74679.1953125} {"train_loss": -5.875460624694824, "global_step": 64428, "epoch": 1534} {"train_loss": -5.934973239898682, "global_step": 64429, "epoch": 1534} {"train_loss": -5.995704650878906, "global_step": 64430, "epoch": 1534} {"train_loss": -5.77977180480957, "global_step": 64431, "epoch": 1534} {"train_loss": -6.055400371551514, "global_step": 64432, "epoch": 1534} {"train_loss": -5.864798545837402, "global_step": 64433, "epoch": 1534} {"train_loss": -5.881083965301514, "global_step": 64434, "epoch": 1534} {"train_loss": -5.896700859069824, "global_step": 64435, "epoch": 1534} {"train_loss": -6.026411533355713, "global_step": 64436, "epoch": 1534} {"train_loss": -5.928961753845215, "global_step": 64437, "epoch": 1534} {"train_loss": -6.067532539367676, "global_step": 64438, "epoch": 1534} {"train_loss": -5.901064395904541, "global_step": 64439, "epoch": 1534} {"train_loss": -5.837958812713623, "global_step": 64440, "epoch": 1534} {"train_loss": -5.938339710235596, "global_step": 64441, "epoch": 1534} {"train_loss": -6.024598121643066, "global_step": 64442, "epoch": 1534} {"train_loss": -6.019343376159668, "global_step": 64443, "epoch": 1534} {"train_loss": -6.062806129455566, "global_step": 64444, "epoch": 1534} {"train_loss": -6.006782531738281, "global_step": 64445, "epoch": 1534} {"train_loss": -5.963366508483887, "global_step": 64446, "epoch": 1534} {"train_loss": -5.950888633728027, "global_step": 64447, "epoch": 1534} {"train_loss": -5.972387313842773, "global_step": 64448, "epoch": 1534} {"train_loss": -5.935502529144287, "global_step": 64449, "epoch": 1534} {"train_loss": -6.006474018096924, "global_step": 64450, "epoch": 1534} {"train_loss": -5.945375919342041, "global_step": 64451, "epoch": 1534} {"train_loss": -6.025524139404297, "global_step": 64452, "epoch": 1534} {"train_loss": -5.927483081817627, "global_step": 64453, "epoch": 1534} {"train_loss": -5.943756103515625, "global_step": 64454, "epoch": 1534} {"train_loss": -5.956273078918457, "global_step": 64455, "epoch": 1534} {"train_loss": -5.9102020263671875, "global_step": 64456, "epoch": 1534} {"train_loss": -5.93260383605957, "global_step": 64457, "epoch": 1534} {"train_loss": -5.956315994262695, "global_step": 64458, "epoch": 1534} {"train_loss": -5.881439685821533, "global_step": 64459, "epoch": 1534} {"train_loss": -5.831484794616699, "global_step": 64460, "epoch": 1534} {"train_loss": -5.800175666809082, "global_step": 64461, "epoch": 1534} {"train_loss": -5.938687324523926, "global_step": 64462, "epoch": 1534} {"train_loss": -5.8978424072265625, "global_step": 64463, "epoch": 1534} {"train_loss": -6.078624725341797, "global_step": 64464, "epoch": 1534} {"train_loss": -5.907148838043213, "global_step": 64465, "epoch": 1534} {"train_loss": -5.851357460021973, "global_step": 64466, "epoch": 1534} {"train_loss": -5.971869468688965, "global_step": 64467, "epoch": 1534} {"train_loss": -5.991977691650391, "global_step": 64468, "epoch": 1534} {"train_loss": -5.937976348967779, "global_step": 64469, "epoch": 1534, "val_loss": 74815.1640625} {"train_loss": -5.993382453918457, "global_step": 64470, "epoch": 1535} {"train_loss": -5.890143394470215, "global_step": 64471, "epoch": 1535} {"train_loss": -5.767985820770264, "global_step": 64472, "epoch": 1535} {"train_loss": -5.847282409667969, "global_step": 64473, "epoch": 1535} {"train_loss": -5.7523088455200195, "global_step": 64474, "epoch": 1535} {"train_loss": -5.906054973602295, "global_step": 64475, "epoch": 1535} {"train_loss": -5.924343109130859, "global_step": 64476, "epoch": 1535} {"train_loss": -6.012391090393066, "global_step": 64477, "epoch": 1535} {"train_loss": -5.899089336395264, "global_step": 64478, "epoch": 1535} {"train_loss": -5.990140914916992, "global_step": 64479, "epoch": 1535} {"train_loss": -6.040412902832031, "global_step": 64480, "epoch": 1535} {"train_loss": -5.939384460449219, "global_step": 64481, "epoch": 1535} {"train_loss": -6.0331268310546875, "global_step": 64482, "epoch": 1535} {"train_loss": -5.861618995666504, "global_step": 64483, "epoch": 1535} {"train_loss": -5.953552722930908, "global_step": 64484, "epoch": 1535} {"train_loss": -5.900077819824219, "global_step": 64485, "epoch": 1535} {"train_loss": -6.043723106384277, "global_step": 64486, "epoch": 1535} {"train_loss": -5.867164134979248, "global_step": 64487, "epoch": 1535} {"train_loss": -6.007964134216309, "global_step": 64488, "epoch": 1535} {"train_loss": -5.906516075134277, "global_step": 64489, "epoch": 1535} {"train_loss": -5.92988920211792, "global_step": 64490, "epoch": 1535} {"train_loss": -5.95142936706543, "global_step": 64491, "epoch": 1535} {"train_loss": -5.962808609008789, "global_step": 64492, "epoch": 1535} {"train_loss": -5.848890781402588, "global_step": 64493, "epoch": 1535} {"train_loss": -5.909400939941406, "global_step": 64494, "epoch": 1535} {"train_loss": -5.880414962768555, "global_step": 64495, "epoch": 1535} {"train_loss": -5.893342018127441, "global_step": 64496, "epoch": 1535} {"train_loss": -5.8689422607421875, "global_step": 64497, "epoch": 1535} {"train_loss": -5.8318257331848145, "global_step": 64498, "epoch": 1535} {"train_loss": -5.966939449310303, "global_step": 64499, "epoch": 1535} {"train_loss": -5.929292678833008, "global_step": 64500, "epoch": 1535} {"train_loss": -5.941603660583496, "global_step": 64501, "epoch": 1535} {"train_loss": -5.900673866271973, "global_step": 64502, "epoch": 1535} {"train_loss": -5.821537494659424, "global_step": 64503, "epoch": 1535} {"train_loss": -5.947940826416016, "global_step": 64504, "epoch": 1535} {"train_loss": -5.8566460609436035, "global_step": 64505, "epoch": 1535} {"train_loss": -5.930751323699951, "global_step": 64506, "epoch": 1535} {"train_loss": -6.0311408042907715, "global_step": 64507, "epoch": 1535} {"train_loss": -5.897894859313965, "global_step": 64508, "epoch": 1535} {"train_loss": -5.837088584899902, "global_step": 64509, "epoch": 1535} {"train_loss": -5.8819193840026855, "global_step": 64510, "epoch": 1535} {"train_loss": -5.916511660530453, "global_step": 64511, "epoch": 1535, "val_loss": 74582.109375} {"train_loss": -6.043614387512207, "global_step": 64512, "epoch": 1536} {"train_loss": -5.941620826721191, "global_step": 64513, "epoch": 1536} {"train_loss": -5.955354690551758, "global_step": 64514, "epoch": 1536} {"train_loss": -5.9600443840026855, "global_step": 64515, "epoch": 1536} {"train_loss": -5.995552062988281, "global_step": 64516, "epoch": 1536} {"train_loss": -6.041669845581055, "global_step": 64517, "epoch": 1536} {"train_loss": -6.090641975402832, "global_step": 64518, "epoch": 1536} {"train_loss": -5.9390363693237305, "global_step": 64519, "epoch": 1536} {"train_loss": -5.9670562744140625, "global_step": 64520, "epoch": 1536} {"train_loss": -5.979059219360352, "global_step": 64521, "epoch": 1536} {"train_loss": -6.0355048179626465, "global_step": 64522, "epoch": 1536} {"train_loss": -5.927445888519287, "global_step": 64523, "epoch": 1536} {"train_loss": -5.972826957702637, "global_step": 64524, "epoch": 1536} {"train_loss": -6.012383937835693, "global_step": 64525, "epoch": 1536} {"train_loss": -6.0485124588012695, "global_step": 64526, "epoch": 1536} {"train_loss": -5.97010612487793, "global_step": 64527, "epoch": 1536} {"train_loss": -5.96509313583374, "global_step": 64528, "epoch": 1536} {"train_loss": -6.080699920654297, "global_step": 64529, "epoch": 1536} {"train_loss": -6.05405855178833, "global_step": 64530, "epoch": 1536} {"train_loss": -5.998315334320068, "global_step": 64531, "epoch": 1536} {"train_loss": -6.026910781860352, "global_step": 64532, "epoch": 1536} {"train_loss": -5.963834762573242, "global_step": 64533, "epoch": 1536} {"train_loss": -6.003700256347656, "global_step": 64534, "epoch": 1536} {"train_loss": -6.0167131423950195, "global_step": 64535, "epoch": 1536} {"train_loss": -6.019431114196777, "global_step": 64536, "epoch": 1536} {"train_loss": -6.062973976135254, "global_step": 64537, "epoch": 1536} {"train_loss": -6.017645835876465, "global_step": 64538, "epoch": 1536} {"train_loss": -5.954965591430664, "global_step": 64539, "epoch": 1536} {"train_loss": -5.948469161987305, "global_step": 64540, "epoch": 1536} {"train_loss": -6.088440895080566, "global_step": 64541, "epoch": 1536} {"train_loss": -5.936085224151611, "global_step": 64542, "epoch": 1536} {"train_loss": -6.009777069091797, "global_step": 64543, "epoch": 1536} {"train_loss": -6.008424758911133, "global_step": 64544, "epoch": 1536} {"train_loss": -6.042093753814697, "global_step": 64545, "epoch": 1536} {"train_loss": -5.858667373657227, "global_step": 64546, "epoch": 1536} {"train_loss": -5.896491050720215, "global_step": 64547, "epoch": 1536} {"train_loss": -5.83073616027832, "global_step": 64548, "epoch": 1536} {"train_loss": -5.8571624755859375, "global_step": 64549, "epoch": 1536} {"train_loss": -5.978052139282227, "global_step": 64550, "epoch": 1536} {"train_loss": -5.964275360107422, "global_step": 64551, "epoch": 1536} {"train_loss": -5.908843994140625, "global_step": 64552, "epoch": 1536} {"train_loss": -5.98220960299174, "global_step": 64553, "epoch": 1536, "val_loss": 74873.203125} {"train_loss": -5.896106719970703, "global_step": 64554, "epoch": 1537} {"train_loss": -5.812043190002441, "global_step": 64555, "epoch": 1537} {"train_loss": -5.957308769226074, "global_step": 64556, "epoch": 1537} {"train_loss": -5.841475486755371, "global_step": 64557, "epoch": 1537} {"train_loss": -5.991657257080078, "global_step": 64558, "epoch": 1537} {"train_loss": -5.877817153930664, "global_step": 64559, "epoch": 1537} {"train_loss": -5.871698379516602, "global_step": 64560, "epoch": 1537} {"train_loss": -6.036235332489014, "global_step": 64561, "epoch": 1537} {"train_loss": -5.785192489624023, "global_step": 64562, "epoch": 1537} {"train_loss": -5.892219543457031, "global_step": 64563, "epoch": 1537} {"train_loss": -5.9701337814331055, "global_step": 64564, "epoch": 1537} {"train_loss": -5.748358726501465, "global_step": 64565, "epoch": 1537} {"train_loss": -5.894624710083008, "global_step": 64566, "epoch": 1537} {"train_loss": -5.871520042419434, "global_step": 64567, "epoch": 1537} {"train_loss": -5.900589942932129, "global_step": 64568, "epoch": 1537} {"train_loss": -5.812902450561523, "global_step": 64569, "epoch": 1537} {"train_loss": -5.909126281738281, "global_step": 64570, "epoch": 1537} {"train_loss": -5.9038262367248535, "global_step": 64571, "epoch": 1537} {"train_loss": -5.8578338623046875, "global_step": 64572, "epoch": 1537} {"train_loss": -5.987673759460449, "global_step": 64573, "epoch": 1537} {"train_loss": -5.936128616333008, "global_step": 64574, "epoch": 1537} {"train_loss": -5.9457502365112305, "global_step": 64575, "epoch": 1537} {"train_loss": -5.859491348266602, "global_step": 64576, "epoch": 1537} {"train_loss": -5.827193737030029, "global_step": 64577, "epoch": 1537} {"train_loss": -5.919103622436523, "global_step": 64578, "epoch": 1537} {"train_loss": -5.9789557456970215, "global_step": 64579, "epoch": 1537} {"train_loss": -5.970128059387207, "global_step": 64580, "epoch": 1537} {"train_loss": -5.940007209777832, "global_step": 64581, "epoch": 1537} {"train_loss": -5.908069133758545, "global_step": 64582, "epoch": 1537} {"train_loss": -5.877060890197754, "global_step": 64583, "epoch": 1537} {"train_loss": -5.810001850128174, "global_step": 64584, "epoch": 1537} {"train_loss": -5.921253204345703, "global_step": 64585, "epoch": 1537} {"train_loss": -5.981680870056152, "global_step": 64586, "epoch": 1537} {"train_loss": -5.9029951095581055, "global_step": 64587, "epoch": 1537} {"train_loss": -5.9477739334106445, "global_step": 64588, "epoch": 1537} {"train_loss": -6.018826484680176, "global_step": 64589, "epoch": 1537} {"train_loss": -5.896130084991455, "global_step": 64590, "epoch": 1537} {"train_loss": -5.989177703857422, "global_step": 64591, "epoch": 1537} {"train_loss": -5.974344253540039, "global_step": 64592, "epoch": 1537} {"train_loss": -5.862598419189453, "global_step": 64593, "epoch": 1537} {"train_loss": -5.995029449462891, "global_step": 64594, "epoch": 1537} {"train_loss": -5.911388851347423, "global_step": 64595, "epoch": 1537, "val_loss": 74532.6640625} {"train_loss": -5.991031646728516, "global_step": 64596, "epoch": 1538} {"train_loss": -5.856217384338379, "global_step": 64597, "epoch": 1538} {"train_loss": -6.036325454711914, "global_step": 64598, "epoch": 1538} {"train_loss": -5.974479675292969, "global_step": 64599, "epoch": 1538} {"train_loss": -6.004419326782227, "global_step": 64600, "epoch": 1538} {"train_loss": -5.970767021179199, "global_step": 64601, "epoch": 1538} {"train_loss": -6.008327007293701, "global_step": 64602, "epoch": 1538} {"train_loss": -5.905414581298828, "global_step": 64603, "epoch": 1538} {"train_loss": -5.9377031326293945, "global_step": 64604, "epoch": 1538} {"train_loss": -5.996596336364746, "global_step": 64605, "epoch": 1538} {"train_loss": -5.959172248840332, "global_step": 64606, "epoch": 1538} {"train_loss": -5.944998741149902, "global_step": 64607, "epoch": 1538} {"train_loss": -5.962808132171631, "global_step": 64608, "epoch": 1538} {"train_loss": -5.900446891784668, "global_step": 64609, "epoch": 1538} {"train_loss": -5.974874496459961, "global_step": 64610, "epoch": 1538} {"train_loss": -5.984706401824951, "global_step": 64611, "epoch": 1538} {"train_loss": -5.876788139343262, "global_step": 64612, "epoch": 1538} {"train_loss": -5.916772842407227, "global_step": 64613, "epoch": 1538} {"train_loss": -5.976190567016602, "global_step": 64614, "epoch": 1538} {"train_loss": -5.929229736328125, "global_step": 64615, "epoch": 1538} {"train_loss": -5.885437488555908, "global_step": 64616, "epoch": 1538} {"train_loss": -5.917342185974121, "global_step": 64617, "epoch": 1538} {"train_loss": -5.8927130699157715, "global_step": 64618, "epoch": 1538} {"train_loss": -5.885893821716309, "global_step": 64619, "epoch": 1538} {"train_loss": -5.9996113777160645, "global_step": 64620, "epoch": 1538} {"train_loss": -6.018919944763184, "global_step": 64621, "epoch": 1538} {"train_loss": -5.873144149780273, "global_step": 64622, "epoch": 1538} {"train_loss": -5.807761192321777, "global_step": 64623, "epoch": 1538} {"train_loss": -6.000677108764648, "global_step": 64624, "epoch": 1538} {"train_loss": -5.878776550292969, "global_step": 64625, "epoch": 1538} {"train_loss": -5.854483127593994, "global_step": 64626, "epoch": 1538} {"train_loss": -6.012166500091553, "global_step": 64627, "epoch": 1538} {"train_loss": -5.8608808517456055, "global_step": 64628, "epoch": 1538} {"train_loss": -5.9926910400390625, "global_step": 64629, "epoch": 1538} {"train_loss": -5.956902503967285, "global_step": 64630, "epoch": 1538} {"train_loss": -5.896703243255615, "global_step": 64631, "epoch": 1538} {"train_loss": -6.023320198059082, "global_step": 64632, "epoch": 1538} {"train_loss": -5.8469648361206055, "global_step": 64633, "epoch": 1538} {"train_loss": -5.974190711975098, "global_step": 64634, "epoch": 1538} {"train_loss": -6.039628028869629, "global_step": 64635, "epoch": 1538} {"train_loss": -6.041825294494629, "global_step": 64636, "epoch": 1538} {"train_loss": -5.942935773304531, "global_step": 64637, "epoch": 1538, "val_loss": 74406.265625} {"train_loss": -6.031852722167969, "global_step": 64638, "epoch": 1539} {"train_loss": -6.008001327514648, "global_step": 64639, "epoch": 1539} {"train_loss": -5.861224174499512, "global_step": 64640, "epoch": 1539} {"train_loss": -5.847307205200195, "global_step": 64641, "epoch": 1539} {"train_loss": -6.0442423820495605, "global_step": 64642, "epoch": 1539} {"train_loss": -5.963168144226074, "global_step": 64643, "epoch": 1539} {"train_loss": -5.868516445159912, "global_step": 64644, "epoch": 1539} {"train_loss": -5.804037094116211, "global_step": 64645, "epoch": 1539} {"train_loss": -6.003171920776367, "global_step": 64646, "epoch": 1539} {"train_loss": -5.991978168487549, "global_step": 64647, "epoch": 1539} {"train_loss": -5.980780601501465, "global_step": 64648, "epoch": 1539} {"train_loss": -5.92306661605835, "global_step": 64649, "epoch": 1539} {"train_loss": -5.91539192199707, "global_step": 64650, "epoch": 1539} {"train_loss": -5.879321098327637, "global_step": 64651, "epoch": 1539} {"train_loss": -5.979154109954834, "global_step": 64652, "epoch": 1539} {"train_loss": -5.942278861999512, "global_step": 64653, "epoch": 1539} {"train_loss": -5.988956451416016, "global_step": 64654, "epoch": 1539} {"train_loss": -5.983198642730713, "global_step": 64655, "epoch": 1539} {"train_loss": -5.918114185333252, "global_step": 64656, "epoch": 1539} {"train_loss": -5.95824670791626, "global_step": 64657, "epoch": 1539} {"train_loss": -5.9888458251953125, "global_step": 64658, "epoch": 1539} {"train_loss": -6.051009654998779, "global_step": 64659, "epoch": 1539} {"train_loss": -6.023111343383789, "global_step": 64660, "epoch": 1539} {"train_loss": -5.939289569854736, "global_step": 64661, "epoch": 1539} {"train_loss": -5.913283348083496, "global_step": 64662, "epoch": 1539} {"train_loss": -5.9033203125, "global_step": 64663, "epoch": 1539} {"train_loss": -5.967019081115723, "global_step": 64664, "epoch": 1539} {"train_loss": -6.001075744628906, "global_step": 64665, "epoch": 1539} {"train_loss": -5.864843368530273, "global_step": 64666, "epoch": 1539} {"train_loss": -5.91650915145874, "global_step": 64667, "epoch": 1539} {"train_loss": -6.001162528991699, "global_step": 64668, "epoch": 1539} {"train_loss": -5.936361789703369, "global_step": 64669, "epoch": 1539} {"train_loss": -6.072125434875488, "global_step": 64670, "epoch": 1539} {"train_loss": -5.9802565574646, "global_step": 64671, "epoch": 1539} {"train_loss": -5.90711784362793, "global_step": 64672, "epoch": 1539} {"train_loss": -5.9943342208862305, "global_step": 64673, "epoch": 1539} {"train_loss": -6.058835506439209, "global_step": 64674, "epoch": 1539} {"train_loss": -6.014488220214844, "global_step": 64675, "epoch": 1539} {"train_loss": -5.917357444763184, "global_step": 64676, "epoch": 1539} {"train_loss": -5.941338539123535, "global_step": 64677, "epoch": 1539} {"train_loss": -5.84470796585083, "global_step": 64678, "epoch": 1539} {"train_loss": -5.950633378255935, "global_step": 64679, "epoch": 1539, "val_loss": 75063.3515625} {"train_loss": -5.938780784606934, "global_step": 64680, "epoch": 1540} {"train_loss": -5.946765899658203, "global_step": 64681, "epoch": 1540} {"train_loss": -5.852082252502441, "global_step": 64682, "epoch": 1540} {"train_loss": -5.929289817810059, "global_step": 64683, "epoch": 1540} {"train_loss": -5.8463335037231445, "global_step": 64684, "epoch": 1540} {"train_loss": -5.819870948791504, "global_step": 64685, "epoch": 1540} {"train_loss": -6.0390448570251465, "global_step": 64686, "epoch": 1540} {"train_loss": -5.781018257141113, "global_step": 64687, "epoch": 1540} {"train_loss": -5.975100040435791, "global_step": 64688, "epoch": 1540} {"train_loss": -5.926506996154785, "global_step": 64689, "epoch": 1540} {"train_loss": -5.8253865242004395, "global_step": 64690, "epoch": 1540} {"train_loss": -6.02281379699707, "global_step": 64691, "epoch": 1540} {"train_loss": -5.875050067901611, "global_step": 64692, "epoch": 1540} {"train_loss": -5.924320697784424, "global_step": 64693, "epoch": 1540} {"train_loss": -5.916486740112305, "global_step": 64694, "epoch": 1540} {"train_loss": -5.963479518890381, "global_step": 64695, "epoch": 1540} {"train_loss": -5.918161392211914, "global_step": 64696, "epoch": 1540} {"train_loss": -6.059910774230957, "global_step": 64697, "epoch": 1540} {"train_loss": -6.022148132324219, "global_step": 64698, "epoch": 1540} {"train_loss": -5.924554347991943, "global_step": 64699, "epoch": 1540} {"train_loss": -5.906863212585449, "global_step": 64700, "epoch": 1540} {"train_loss": -6.014390468597412, "global_step": 64701, "epoch": 1540} {"train_loss": -5.968347549438477, "global_step": 64702, "epoch": 1540} {"train_loss": -5.820816993713379, "global_step": 64703, "epoch": 1540} {"train_loss": -6.049430847167969, "global_step": 64704, "epoch": 1540} {"train_loss": -6.043859958648682, "global_step": 64705, "epoch": 1540} {"train_loss": -5.8729705810546875, "global_step": 64706, "epoch": 1540} {"train_loss": -6.083033084869385, "global_step": 64707, "epoch": 1540} {"train_loss": -5.899410247802734, "global_step": 64708, "epoch": 1540} {"train_loss": -5.944733619689941, "global_step": 64709, "epoch": 1540} {"train_loss": -5.942733287811279, "global_step": 64710, "epoch": 1540} {"train_loss": -6.0077595710754395, "global_step": 64711, "epoch": 1540} {"train_loss": -5.971174240112305, "global_step": 64712, "epoch": 1540} {"train_loss": -5.888119697570801, "global_step": 64713, "epoch": 1540} {"train_loss": -5.932478904724121, "global_step": 64714, "epoch": 1540} {"train_loss": -6.086223602294922, "global_step": 64715, "epoch": 1540} {"train_loss": -5.826908588409424, "global_step": 64716, "epoch": 1540} {"train_loss": -5.88917350769043, "global_step": 64717, "epoch": 1540} {"train_loss": -5.970132827758789, "global_step": 64718, "epoch": 1540} {"train_loss": -5.977700233459473, "global_step": 64719, "epoch": 1540} {"train_loss": -5.8443379402160645, "global_step": 64720, "epoch": 1540} {"train_loss": -5.940264270419166, "global_step": 64721, "epoch": 1540, "val_loss": 74462.7421875} {"train_loss": -6.048637866973877, "global_step": 64722, "epoch": 1541} {"train_loss": -5.875006675720215, "global_step": 64723, "epoch": 1541} {"train_loss": -5.924160003662109, "global_step": 64724, "epoch": 1541} {"train_loss": -6.013446807861328, "global_step": 64725, "epoch": 1541} {"train_loss": -5.91133451461792, "global_step": 64726, "epoch": 1541} {"train_loss": -5.993202209472656, "global_step": 64727, "epoch": 1541} {"train_loss": -5.903921127319336, "global_step": 64728, "epoch": 1541} {"train_loss": -5.922073841094971, "global_step": 64729, "epoch": 1541} {"train_loss": -5.97952938079834, "global_step": 64730, "epoch": 1541} {"train_loss": -5.989136695861816, "global_step": 64731, "epoch": 1541} {"train_loss": -5.966991424560547, "global_step": 64732, "epoch": 1541} {"train_loss": -5.923044204711914, "global_step": 64733, "epoch": 1541} {"train_loss": -5.924820899963379, "global_step": 64734, "epoch": 1541} {"train_loss": -5.91136360168457, "global_step": 64735, "epoch": 1541} {"train_loss": -5.782803535461426, "global_step": 64736, "epoch": 1541} {"train_loss": -6.036375045776367, "global_step": 64737, "epoch": 1541} {"train_loss": -5.899347305297852, "global_step": 64738, "epoch": 1541} {"train_loss": -5.908862113952637, "global_step": 64739, "epoch": 1541} {"train_loss": -5.966553688049316, "global_step": 64740, "epoch": 1541} {"train_loss": -5.881892204284668, "global_step": 64741, "epoch": 1541} {"train_loss": -6.10240364074707, "global_step": 64742, "epoch": 1541} {"train_loss": -5.930622100830078, "global_step": 64743, "epoch": 1541} {"train_loss": -6.002590656280518, "global_step": 64744, "epoch": 1541} {"train_loss": -5.91922664642334, "global_step": 64745, "epoch": 1541} {"train_loss": -6.021908283233643, "global_step": 64746, "epoch": 1541} {"train_loss": -6.091205596923828, "global_step": 64747, "epoch": 1541} {"train_loss": -5.93768310546875, "global_step": 64748, "epoch": 1541} {"train_loss": -6.045801162719727, "global_step": 64749, "epoch": 1541} {"train_loss": -6.036339282989502, "global_step": 64750, "epoch": 1541} {"train_loss": -5.9365057945251465, "global_step": 64751, "epoch": 1541} {"train_loss": -6.067248821258545, "global_step": 64752, "epoch": 1541} {"train_loss": -6.091736793518066, "global_step": 64753, "epoch": 1541} {"train_loss": -5.938720703125, "global_step": 64754, "epoch": 1541} {"train_loss": -6.000609874725342, "global_step": 64755, "epoch": 1541} {"train_loss": -5.940702438354492, "global_step": 64756, "epoch": 1541} {"train_loss": -6.1215314865112305, "global_step": 64757, "epoch": 1541} {"train_loss": -5.982544898986816, "global_step": 64758, "epoch": 1541} {"train_loss": -5.878695487976074, "global_step": 64759, "epoch": 1541} {"train_loss": -6.189414024353027, "global_step": 64760, "epoch": 1541} {"train_loss": -5.992187023162842, "global_step": 64761, "epoch": 1541} {"train_loss": -6.062387466430664, "global_step": 64762, "epoch": 1541} {"train_loss": -5.977668205897014, "global_step": 64763, "epoch": 1541, "val_loss": 74648.9296875} {"train_loss": -5.94340705871582, "global_step": 64764, "epoch": 1542} {"train_loss": -5.8872971534729, "global_step": 64765, "epoch": 1542} {"train_loss": -6.063462257385254, "global_step": 64766, "epoch": 1542} {"train_loss": -5.898988723754883, "global_step": 64767, "epoch": 1542} {"train_loss": -5.926181793212891, "global_step": 64768, "epoch": 1542} {"train_loss": -5.86839485168457, "global_step": 64769, "epoch": 1542} {"train_loss": -6.064573287963867, "global_step": 64770, "epoch": 1542} {"train_loss": -5.962594509124756, "global_step": 64771, "epoch": 1542} {"train_loss": -5.870227813720703, "global_step": 64772, "epoch": 1542} {"train_loss": -5.8500566482543945, "global_step": 64773, "epoch": 1542} {"train_loss": -5.929299354553223, "global_step": 64774, "epoch": 1542} {"train_loss": -6.007360458374023, "global_step": 64775, "epoch": 1542} {"train_loss": -6.041879653930664, "global_step": 64776, "epoch": 1542} {"train_loss": -6.014304161071777, "global_step": 64777, "epoch": 1542} {"train_loss": -5.887625694274902, "global_step": 64778, "epoch": 1542} {"train_loss": -5.974002838134766, "global_step": 64779, "epoch": 1542} {"train_loss": -6.018072605133057, "global_step": 64780, "epoch": 1542} {"train_loss": -5.8889007568359375, "global_step": 64781, "epoch": 1542} {"train_loss": -5.953431129455566, "global_step": 64782, "epoch": 1542} {"train_loss": -6.02647590637207, "global_step": 64783, "epoch": 1542} {"train_loss": -5.892096996307373, "global_step": 64784, "epoch": 1542} {"train_loss": -5.946107864379883, "global_step": 64785, "epoch": 1542} {"train_loss": -5.953001499176025, "global_step": 64786, "epoch": 1542} {"train_loss": -5.985931396484375, "global_step": 64787, "epoch": 1542} {"train_loss": -5.894604682922363, "global_step": 64788, "epoch": 1542} {"train_loss": -5.847512245178223, "global_step": 64789, "epoch": 1542} {"train_loss": -5.935345649719238, "global_step": 64790, "epoch": 1542} {"train_loss": -5.9651641845703125, "global_step": 64791, "epoch": 1542} {"train_loss": -5.8768486976623535, "global_step": 64792, "epoch": 1542} {"train_loss": -5.988702774047852, "global_step": 64793, "epoch": 1542} {"train_loss": -5.848012924194336, "global_step": 64794, "epoch": 1542} {"train_loss": -5.749578475952148, "global_step": 64795, "epoch": 1542} {"train_loss": -6.020697593688965, "global_step": 64796, "epoch": 1542} {"train_loss": -5.747274398803711, "global_step": 64797, "epoch": 1542} {"train_loss": -5.93406867980957, "global_step": 64798, "epoch": 1542} {"train_loss": -5.920348167419434, "global_step": 64799, "epoch": 1542} {"train_loss": -5.915194511413574, "global_step": 64800, "epoch": 1542} {"train_loss": -5.964151382446289, "global_step": 64801, "epoch": 1542} {"train_loss": -5.965153217315674, "global_step": 64802, "epoch": 1542} {"train_loss": -5.833773612976074, "global_step": 64803, "epoch": 1542} {"train_loss": -5.937192440032959, "global_step": 64804, "epoch": 1542} {"train_loss": -5.933024826503935, "global_step": 64805, "epoch": 1542, "val_loss": 74704.6015625} {"train_loss": -6.020106315612793, "global_step": 64806, "epoch": 1543} {"train_loss": -5.838593482971191, "global_step": 64807, "epoch": 1543} {"train_loss": -5.912700653076172, "global_step": 64808, "epoch": 1543} {"train_loss": -5.876523971557617, "global_step": 64809, "epoch": 1543} {"train_loss": -5.876640796661377, "global_step": 64810, "epoch": 1543} {"train_loss": -5.977286338806152, "global_step": 64811, "epoch": 1543} {"train_loss": -5.848023414611816, "global_step": 64812, "epoch": 1543} {"train_loss": -5.929088592529297, "global_step": 64813, "epoch": 1543} {"train_loss": -5.914395809173584, "global_step": 64814, "epoch": 1543} {"train_loss": -5.921075344085693, "global_step": 64815, "epoch": 1543} {"train_loss": -5.938077449798584, "global_step": 64816, "epoch": 1543} {"train_loss": -5.87851619720459, "global_step": 64817, "epoch": 1543} {"train_loss": -5.999430179595947, "global_step": 64818, "epoch": 1543} {"train_loss": -5.931760311126709, "global_step": 64819, "epoch": 1543} {"train_loss": -5.947479724884033, "global_step": 64820, "epoch": 1543} {"train_loss": -6.0175557136535645, "global_step": 64821, "epoch": 1543} {"train_loss": -5.95731258392334, "global_step": 64822, "epoch": 1543} {"train_loss": -5.821828842163086, "global_step": 64823, "epoch": 1543} {"train_loss": -6.114900588989258, "global_step": 64824, "epoch": 1543} {"train_loss": -5.94584846496582, "global_step": 64825, "epoch": 1543} {"train_loss": -5.840654373168945, "global_step": 64826, "epoch": 1543} {"train_loss": -5.981684684753418, "global_step": 64827, "epoch": 1543} {"train_loss": -5.893630027770996, "global_step": 64828, "epoch": 1543} {"train_loss": -6.099187850952148, "global_step": 64829, "epoch": 1543} {"train_loss": -5.9542236328125, "global_step": 64830, "epoch": 1543} {"train_loss": -5.900856018066406, "global_step": 64831, "epoch": 1543} {"train_loss": -5.947762489318848, "global_step": 64832, "epoch": 1543} {"train_loss": -5.893857002258301, "global_step": 64833, "epoch": 1543} {"train_loss": -5.83148193359375, "global_step": 64834, "epoch": 1543} {"train_loss": -5.853847026824951, "global_step": 64835, "epoch": 1543} {"train_loss": -6.013904571533203, "global_step": 64836, "epoch": 1543} {"train_loss": -5.945337295532227, "global_step": 64837, "epoch": 1543} {"train_loss": -5.726097583770752, "global_step": 64838, "epoch": 1543} {"train_loss": -5.994076251983643, "global_step": 64839, "epoch": 1543} {"train_loss": -5.978401184082031, "global_step": 64840, "epoch": 1543} {"train_loss": -5.9645795822143555, "global_step": 64841, "epoch": 1543} {"train_loss": -6.002938270568848, "global_step": 64842, "epoch": 1543} {"train_loss": -5.90946102142334, "global_step": 64843, "epoch": 1543} {"train_loss": -5.817594528198242, "global_step": 64844, "epoch": 1543} {"train_loss": -5.834802627563477, "global_step": 64845, "epoch": 1543} {"train_loss": -5.783748626708984, "global_step": 64846, "epoch": 1543} {"train_loss": -5.92476885659354, "global_step": 64847, "epoch": 1543, "val_loss": 75669.5078125} {"train_loss": -5.8557024002075195, "global_step": 64848, "epoch": 1544} {"train_loss": -5.9758195877075195, "global_step": 64849, "epoch": 1544} {"train_loss": -5.961552619934082, "global_step": 64850, "epoch": 1544} {"train_loss": -5.927292823791504, "global_step": 64851, "epoch": 1544} {"train_loss": -5.797918319702148, "global_step": 64852, "epoch": 1544} {"train_loss": -5.900972366333008, "global_step": 64853, "epoch": 1544} {"train_loss": -5.882315635681152, "global_step": 64854, "epoch": 1544} {"train_loss": -5.93661642074585, "global_step": 64855, "epoch": 1544} {"train_loss": -5.995609283447266, "global_step": 64856, "epoch": 1544} {"train_loss": -5.909175872802734, "global_step": 64857, "epoch": 1544} {"train_loss": -5.973388671875, "global_step": 64858, "epoch": 1544} {"train_loss": -6.002635478973389, "global_step": 64859, "epoch": 1544} {"train_loss": -5.92679500579834, "global_step": 64860, "epoch": 1544} {"train_loss": -5.867369651794434, "global_step": 64861, "epoch": 1544} {"train_loss": -5.94288444519043, "global_step": 64862, "epoch": 1544} {"train_loss": -5.886049270629883, "global_step": 64863, "epoch": 1544} {"train_loss": -5.8916215896606445, "global_step": 64864, "epoch": 1544} {"train_loss": -5.972177982330322, "global_step": 64865, "epoch": 1544} {"train_loss": -5.86598539352417, "global_step": 64866, "epoch": 1544} {"train_loss": -6.030065536499023, "global_step": 64867, "epoch": 1544} {"train_loss": -5.957399368286133, "global_step": 64868, "epoch": 1544} {"train_loss": -5.916563034057617, "global_step": 64869, "epoch": 1544} {"train_loss": -6.079408645629883, "global_step": 64870, "epoch": 1544} {"train_loss": -5.755434989929199, "global_step": 64871, "epoch": 1544} {"train_loss": -5.956822395324707, "global_step": 64872, "epoch": 1544} {"train_loss": -5.8732805252075195, "global_step": 64873, "epoch": 1544} {"train_loss": -5.800481796264648, "global_step": 64874, "epoch": 1544} {"train_loss": -5.976448059082031, "global_step": 64875, "epoch": 1544} {"train_loss": -5.858602523803711, "global_step": 64876, "epoch": 1544} {"train_loss": -6.032805442810059, "global_step": 64877, "epoch": 1544} {"train_loss": -5.984498500823975, "global_step": 64878, "epoch": 1544} {"train_loss": -6.074132919311523, "global_step": 64879, "epoch": 1544} {"train_loss": -6.038670063018799, "global_step": 64880, "epoch": 1544} {"train_loss": -5.925654411315918, "global_step": 64881, "epoch": 1544} {"train_loss": -6.043641090393066, "global_step": 64882, "epoch": 1544} {"train_loss": -6.003274440765381, "global_step": 64883, "epoch": 1544} {"train_loss": -6.119899749755859, "global_step": 64884, "epoch": 1544} {"train_loss": -5.9821648597717285, "global_step": 64885, "epoch": 1544} {"train_loss": -6.00687837600708, "global_step": 64886, "epoch": 1544} {"train_loss": -5.95632791519165, "global_step": 64887, "epoch": 1544} {"train_loss": -5.896450519561768, "global_step": 64888, "epoch": 1544} {"train_loss": -5.944665999639602, "global_step": 64889, "epoch": 1544, "val_loss": 74476.515625} {"train_loss": -5.897845268249512, "global_step": 64890, "epoch": 1545} {"train_loss": -6.131533622741699, "global_step": 64891, "epoch": 1545} {"train_loss": -6.046393871307373, "global_step": 64892, "epoch": 1545} {"train_loss": -5.9537577629089355, "global_step": 64893, "epoch": 1545} {"train_loss": -6.03709602355957, "global_step": 64894, "epoch": 1545} {"train_loss": -5.989654541015625, "global_step": 64895, "epoch": 1545} {"train_loss": -5.918331146240234, "global_step": 64896, "epoch": 1545} {"train_loss": -6.094879150390625, "global_step": 64897, "epoch": 1545} {"train_loss": -5.922481536865234, "global_step": 64898, "epoch": 1545} {"train_loss": -5.963435173034668, "global_step": 64899, "epoch": 1545} {"train_loss": -6.066247940063477, "global_step": 64900, "epoch": 1545} {"train_loss": -6.080343723297119, "global_step": 64901, "epoch": 1545} {"train_loss": -6.0506157875061035, "global_step": 64902, "epoch": 1545} {"train_loss": -5.901819229125977, "global_step": 64903, "epoch": 1545} {"train_loss": -6.044610023498535, "global_step": 64904, "epoch": 1545} {"train_loss": -6.01556396484375, "global_step": 64905, "epoch": 1545} {"train_loss": -6.118763446807861, "global_step": 64906, "epoch": 1545} {"train_loss": -5.892426490783691, "global_step": 64907, "epoch": 1545} {"train_loss": -5.863564968109131, "global_step": 64908, "epoch": 1545} {"train_loss": -6.044759750366211, "global_step": 64909, "epoch": 1545} {"train_loss": -6.058958053588867, "global_step": 64910, "epoch": 1545} {"train_loss": -5.96927547454834, "global_step": 64911, "epoch": 1545} {"train_loss": -5.932101249694824, "global_step": 64912, "epoch": 1545} {"train_loss": -5.952136993408203, "global_step": 64913, "epoch": 1545} {"train_loss": -5.920239448547363, "global_step": 64914, "epoch": 1545} {"train_loss": -5.950711250305176, "global_step": 64915, "epoch": 1545} {"train_loss": -5.897911071777344, "global_step": 64916, "epoch": 1545} {"train_loss": -6.008179664611816, "global_step": 64917, "epoch": 1545} {"train_loss": -5.96956205368042, "global_step": 64918, "epoch": 1545} {"train_loss": -5.896897792816162, "global_step": 64919, "epoch": 1545} {"train_loss": -5.907731533050537, "global_step": 64920, "epoch": 1545} {"train_loss": -5.952991485595703, "global_step": 64921, "epoch": 1545} {"train_loss": -6.003812313079834, "global_step": 64922, "epoch": 1545} {"train_loss": -5.9877705574035645, "global_step": 64923, "epoch": 1545} {"train_loss": -5.928954124450684, "global_step": 64924, "epoch": 1545} {"train_loss": -6.02958869934082, "global_step": 64925, "epoch": 1545} {"train_loss": -5.8946051597595215, "global_step": 64926, "epoch": 1545} {"train_loss": -5.989428520202637, "global_step": 64927, "epoch": 1545} {"train_loss": -5.815260887145996, "global_step": 64928, "epoch": 1545} {"train_loss": -5.889092445373535, "global_step": 64929, "epoch": 1545} {"train_loss": -6.056517601013184, "global_step": 64930, "epoch": 1545} {"train_loss": -5.977136509759085, "global_step": 64931, "epoch": 1545, "val_loss": 74529.9921875} {"train_loss": -6.10315465927124, "global_step": 64932, "epoch": 1546} {"train_loss": -5.9037065505981445, "global_step": 64933, "epoch": 1546} {"train_loss": -6.033717632293701, "global_step": 64934, "epoch": 1546} {"train_loss": -6.0440497398376465, "global_step": 64935, "epoch": 1546} {"train_loss": -5.970095634460449, "global_step": 64936, "epoch": 1546} {"train_loss": -5.929460525512695, "global_step": 64937, "epoch": 1546} {"train_loss": -5.878461837768555, "global_step": 64938, "epoch": 1546} {"train_loss": -5.909608840942383, "global_step": 64939, "epoch": 1546} {"train_loss": -5.9843854904174805, "global_step": 64940, "epoch": 1546} {"train_loss": -5.981755256652832, "global_step": 64941, "epoch": 1546} {"train_loss": -5.963465213775635, "global_step": 64942, "epoch": 1546} {"train_loss": -5.882246971130371, "global_step": 64943, "epoch": 1546} {"train_loss": -5.871771812438965, "global_step": 64944, "epoch": 1546} {"train_loss": -5.945193767547607, "global_step": 64945, "epoch": 1546} {"train_loss": -5.898155689239502, "global_step": 64946, "epoch": 1546} {"train_loss": -5.985461235046387, "global_step": 64947, "epoch": 1546} {"train_loss": -5.937614440917969, "global_step": 64948, "epoch": 1546} {"train_loss": -6.080209255218506, "global_step": 64949, "epoch": 1546} {"train_loss": -5.891776084899902, "global_step": 64950, "epoch": 1546} {"train_loss": -5.994531631469727, "global_step": 64951, "epoch": 1546} {"train_loss": -5.948864936828613, "global_step": 64952, "epoch": 1546} {"train_loss": -5.910377025604248, "global_step": 64953, "epoch": 1546} {"train_loss": -5.952973365783691, "global_step": 64954, "epoch": 1546} {"train_loss": -5.921995639801025, "global_step": 64955, "epoch": 1546} {"train_loss": -6.026135444641113, "global_step": 64956, "epoch": 1546} {"train_loss": -5.968591690063477, "global_step": 64957, "epoch": 1546} {"train_loss": -6.07136344909668, "global_step": 64958, "epoch": 1546} {"train_loss": -6.0407609939575195, "global_step": 64959, "epoch": 1546} {"train_loss": -5.898415565490723, "global_step": 64960, "epoch": 1546} {"train_loss": -5.937887191772461, "global_step": 64961, "epoch": 1546} {"train_loss": -5.989131927490234, "global_step": 64962, "epoch": 1546} {"train_loss": -5.99287223815918, "global_step": 64963, "epoch": 1546} {"train_loss": -5.822173118591309, "global_step": 64964, "epoch": 1546} {"train_loss": -6.029876232147217, "global_step": 64965, "epoch": 1546} {"train_loss": -5.834805488586426, "global_step": 64966, "epoch": 1546} {"train_loss": -5.897603511810303, "global_step": 64967, "epoch": 1546} {"train_loss": -5.976271152496338, "global_step": 64968, "epoch": 1546} {"train_loss": -5.919496536254883, "global_step": 64969, "epoch": 1546} {"train_loss": -5.866340637207031, "global_step": 64970, "epoch": 1546} {"train_loss": -5.9333953857421875, "global_step": 64971, "epoch": 1546} {"train_loss": -5.849034786224365, "global_step": 64972, "epoch": 1546} {"train_loss": -5.9509702410016745, "global_step": 64973, "epoch": 1546, "val_loss": 74421.03125} {"train_loss": -5.927654266357422, "global_step": 64974, "epoch": 1547} {"train_loss": -5.95789909362793, "global_step": 64975, "epoch": 1547} {"train_loss": -5.950087547302246, "global_step": 64976, "epoch": 1547} {"train_loss": -5.903489112854004, "global_step": 64977, "epoch": 1547} {"train_loss": -6.014021396636963, "global_step": 64978, "epoch": 1547} {"train_loss": -5.88188362121582, "global_step": 64979, "epoch": 1547} {"train_loss": -5.972285270690918, "global_step": 64980, "epoch": 1547} {"train_loss": -5.987180233001709, "global_step": 64981, "epoch": 1547} {"train_loss": -6.015924453735352, "global_step": 64982, "epoch": 1547} {"train_loss": -5.831281661987305, "global_step": 64983, "epoch": 1547} {"train_loss": -6.002310752868652, "global_step": 64984, "epoch": 1547} {"train_loss": -5.932852745056152, "global_step": 64985, "epoch": 1547} {"train_loss": -5.83446741104126, "global_step": 64986, "epoch": 1547} {"train_loss": -6.027008056640625, "global_step": 64987, "epoch": 1547} {"train_loss": -6.026657581329346, "global_step": 64988, "epoch": 1547} {"train_loss": -5.9119720458984375, "global_step": 64989, "epoch": 1547} {"train_loss": -5.92348575592041, "global_step": 64990, "epoch": 1547} {"train_loss": -5.88314151763916, "global_step": 64991, "epoch": 1547} {"train_loss": -5.977862358093262, "global_step": 64992, "epoch": 1547} {"train_loss": -5.947075843811035, "global_step": 64993, "epoch": 1547} {"train_loss": -5.974685192108154, "global_step": 64994, "epoch": 1547} {"train_loss": -5.994606971740723, "global_step": 64995, "epoch": 1547} {"train_loss": -5.925906181335449, "global_step": 64996, "epoch": 1547} {"train_loss": -5.914346218109131, "global_step": 64997, "epoch": 1547} {"train_loss": -5.842451572418213, "global_step": 64998, "epoch": 1547} {"train_loss": -5.986197471618652, "global_step": 64999, "epoch": 1547} {"train_loss": -6.0346760749816895, "global_step": 65000, "epoch": 1547} {"train_loss": -6.071481704711914, "global_step": 65001, "epoch": 1547} {"train_loss": -5.939087390899658, "global_step": 65002, "epoch": 1547} {"train_loss": -5.966719627380371, "global_step": 65003, "epoch": 1547} {"train_loss": -5.982290267944336, "global_step": 65004, "epoch": 1547} {"train_loss": -5.945403099060059, "global_step": 65005, "epoch": 1547} {"train_loss": -5.9460883140563965, "global_step": 65006, "epoch": 1547} {"train_loss": -6.0437164306640625, "global_step": 65007, "epoch": 1547} {"train_loss": -6.0412468910217285, "global_step": 65008, "epoch": 1547} {"train_loss": -5.9653778076171875, "global_step": 65009, "epoch": 1547} {"train_loss": -5.922504425048828, "global_step": 65010, "epoch": 1547} {"train_loss": -6.0006103515625, "global_step": 65011, "epoch": 1547} {"train_loss": -5.957396507263184, "global_step": 65012, "epoch": 1547} {"train_loss": -5.845067024230957, "global_step": 65013, "epoch": 1547} {"train_loss": -6.030369758605957, "global_step": 65014, "epoch": 1547} {"train_loss": -5.9573219276609874, "global_step": 65015, "epoch": 1547, "val_loss": 74523.7421875} {"train_loss": -5.864605903625488, "global_step": 65016, "epoch": 1548} {"train_loss": -5.993797302246094, "global_step": 65017, "epoch": 1548} {"train_loss": -6.065905570983887, "global_step": 65018, "epoch": 1548} {"train_loss": -5.991049289703369, "global_step": 65019, "epoch": 1548} {"train_loss": -5.974053382873535, "global_step": 65020, "epoch": 1548} {"train_loss": -5.973692893981934, "global_step": 65021, "epoch": 1548} {"train_loss": -6.042340278625488, "global_step": 65022, "epoch": 1548} {"train_loss": -5.982455730438232, "global_step": 65023, "epoch": 1548} {"train_loss": -6.070490837097168, "global_step": 65024, "epoch": 1548} {"train_loss": -5.913007736206055, "global_step": 65025, "epoch": 1548} {"train_loss": -5.894567489624023, "global_step": 65026, "epoch": 1548} {"train_loss": -6.028838157653809, "global_step": 65027, "epoch": 1548} {"train_loss": -5.913423538208008, "global_step": 65028, "epoch": 1548} {"train_loss": -5.9728803634643555, "global_step": 65029, "epoch": 1548} {"train_loss": -6.004676342010498, "global_step": 65030, "epoch": 1548} {"train_loss": -6.0461931228637695, "global_step": 65031, "epoch": 1548} {"train_loss": -5.871112823486328, "global_step": 65032, "epoch": 1548} {"train_loss": -5.916072845458984, "global_step": 65033, "epoch": 1548} {"train_loss": -6.035045146942139, "global_step": 65034, "epoch": 1548} {"train_loss": -5.908050537109375, "global_step": 65035, "epoch": 1548} {"train_loss": -5.898360252380371, "global_step": 65036, "epoch": 1548} {"train_loss": -6.006619453430176, "global_step": 65037, "epoch": 1548} {"train_loss": -5.830695152282715, "global_step": 65038, "epoch": 1548} {"train_loss": -5.789377212524414, "global_step": 65039, "epoch": 1548} {"train_loss": -5.872488975524902, "global_step": 65040, "epoch": 1548} {"train_loss": -5.935943603515625, "global_step": 65041, "epoch": 1548} {"train_loss": -5.951797962188721, "global_step": 65042, "epoch": 1548} {"train_loss": -5.858058452606201, "global_step": 65043, "epoch": 1548} {"train_loss": -5.939593315124512, "global_step": 65044, "epoch": 1548} {"train_loss": -5.858808517456055, "global_step": 65045, "epoch": 1548} {"train_loss": -5.914861679077148, "global_step": 65046, "epoch": 1548} {"train_loss": -5.8393964767456055, "global_step": 65047, "epoch": 1548} {"train_loss": -5.897132873535156, "global_step": 65048, "epoch": 1548} {"train_loss": -5.897128105163574, "global_step": 65049, "epoch": 1548} {"train_loss": -5.958071708679199, "global_step": 65050, "epoch": 1548} {"train_loss": -6.032462120056152, "global_step": 65051, "epoch": 1548} {"train_loss": -5.857721328735352, "global_step": 65052, "epoch": 1548} {"train_loss": -6.056661128997803, "global_step": 65053, "epoch": 1548} {"train_loss": -5.933972358703613, "global_step": 65054, "epoch": 1548} {"train_loss": -5.984370231628418, "global_step": 65055, "epoch": 1548} {"train_loss": -5.98807430267334, "global_step": 65056, "epoch": 1548} {"train_loss": -5.947896401087443, "global_step": 65057, "epoch": 1548, "val_loss": 74461.8203125} {"train_loss": -5.925316333770752, "global_step": 65058, "epoch": 1549} {"train_loss": -5.969022750854492, "global_step": 65059, "epoch": 1549} {"train_loss": -5.934140682220459, "global_step": 65060, "epoch": 1549} {"train_loss": -6.043649196624756, "global_step": 65061, "epoch": 1549} {"train_loss": -5.949139595031738, "global_step": 65062, "epoch": 1549} {"train_loss": -6.049045562744141, "global_step": 65063, "epoch": 1549} {"train_loss": -5.938955307006836, "global_step": 65064, "epoch": 1549} {"train_loss": -5.961078643798828, "global_step": 65065, "epoch": 1549} {"train_loss": -5.9105377197265625, "global_step": 65066, "epoch": 1549} {"train_loss": -5.876351356506348, "global_step": 65067, "epoch": 1549} {"train_loss": -5.8439621925354, "global_step": 65068, "epoch": 1549} {"train_loss": -5.998736381530762, "global_step": 65069, "epoch": 1549} {"train_loss": -5.923255920410156, "global_step": 65070, "epoch": 1549} {"train_loss": -5.968503952026367, "global_step": 65071, "epoch": 1549} {"train_loss": -6.061951160430908, "global_step": 65072, "epoch": 1549} {"train_loss": -6.090037822723389, "global_step": 65073, "epoch": 1549} {"train_loss": -5.949540615081787, "global_step": 65074, "epoch": 1549} {"train_loss": -6.092380523681641, "global_step": 65075, "epoch": 1549} {"train_loss": -5.923857688903809, "global_step": 65076, "epoch": 1549} {"train_loss": -5.882209777832031, "global_step": 65077, "epoch": 1549} {"train_loss": -5.964028358459473, "global_step": 65078, "epoch": 1549} {"train_loss": -6.016523838043213, "global_step": 65079, "epoch": 1549} {"train_loss": -6.066463470458984, "global_step": 65080, "epoch": 1549} {"train_loss": -5.985874176025391, "global_step": 65081, "epoch": 1549} {"train_loss": -6.026303291320801, "global_step": 65082, "epoch": 1549} {"train_loss": -5.881096839904785, "global_step": 65083, "epoch": 1549} {"train_loss": -6.0252885818481445, "global_step": 65084, "epoch": 1549} {"train_loss": -5.962854385375977, "global_step": 65085, "epoch": 1549} {"train_loss": -5.8512115478515625, "global_step": 65086, "epoch": 1549} {"train_loss": -5.936028480529785, "global_step": 65087, "epoch": 1549} {"train_loss": -6.034835338592529, "global_step": 65088, "epoch": 1549} {"train_loss": -5.87143611907959, "global_step": 65089, "epoch": 1549} {"train_loss": -5.909143924713135, "global_step": 65090, "epoch": 1549} {"train_loss": -6.046850681304932, "global_step": 65091, "epoch": 1549} {"train_loss": -5.816231727600098, "global_step": 65092, "epoch": 1549} {"train_loss": -6.0504865646362305, "global_step": 65093, "epoch": 1549} {"train_loss": -5.9374284744262695, "global_step": 65094, "epoch": 1549} {"train_loss": -6.021756172180176, "global_step": 65095, "epoch": 1549} {"train_loss": -6.075379848480225, "global_step": 65096, "epoch": 1549} {"train_loss": -6.049149990081787, "global_step": 65097, "epoch": 1549} {"train_loss": -6.0061750411987305, "global_step": 65098, "epoch": 1549} {"train_loss": -5.971515712283907, "global_step": 65099, "epoch": 1549, "val_loss": 74547.6484375} {"train_loss": -6.026046276092529, "global_step": 65100, "epoch": 1550} {"train_loss": -6.146787166595459, "global_step": 65101, "epoch": 1550} {"train_loss": -6.182170867919922, "global_step": 65102, "epoch": 1550} {"train_loss": -6.051779747009277, "global_step": 65103, "epoch": 1550} {"train_loss": -6.009951591491699, "global_step": 65104, "epoch": 1550} {"train_loss": -5.947714805603027, "global_step": 65105, "epoch": 1550} {"train_loss": -5.932723045349121, "global_step": 65106, "epoch": 1550} {"train_loss": -5.991555213928223, "global_step": 65107, "epoch": 1550} {"train_loss": -5.901641845703125, "global_step": 65108, "epoch": 1550} {"train_loss": -6.002859115600586, "global_step": 65109, "epoch": 1550} {"train_loss": -5.995668411254883, "global_step": 65110, "epoch": 1550} {"train_loss": -5.966945648193359, "global_step": 65111, "epoch": 1550} {"train_loss": -5.981602668762207, "global_step": 65112, "epoch": 1550} {"train_loss": -6.0120439529418945, "global_step": 65113, "epoch": 1550} {"train_loss": -5.883794784545898, "global_step": 65114, "epoch": 1550} {"train_loss": -6.037856578826904, "global_step": 65115, "epoch": 1550} {"train_loss": -5.9943437576293945, "global_step": 65116, "epoch": 1550} {"train_loss": -5.997222423553467, "global_step": 65117, "epoch": 1550} {"train_loss": -5.972848892211914, "global_step": 65118, "epoch": 1550} {"train_loss": -5.990100860595703, "global_step": 65119, "epoch": 1550} {"train_loss": -6.0665388107299805, "global_step": 65120, "epoch": 1550} {"train_loss": -5.901928901672363, "global_step": 65121, "epoch": 1550} {"train_loss": -5.984531402587891, "global_step": 65122, "epoch": 1550} {"train_loss": -5.943233966827393, "global_step": 65123, "epoch": 1550} {"train_loss": -5.997169494628906, "global_step": 65124, "epoch": 1550} {"train_loss": -5.847322463989258, "global_step": 65125, "epoch": 1550} {"train_loss": -5.917534828186035, "global_step": 65126, "epoch": 1550} {"train_loss": -5.886768341064453, "global_step": 65127, "epoch": 1550} {"train_loss": -5.892578125, "global_step": 65128, "epoch": 1550} {"train_loss": -5.924788475036621, "global_step": 65129, "epoch": 1550} {"train_loss": -5.926936149597168, "global_step": 65130, "epoch": 1550} {"train_loss": -5.651201248168945, "global_step": 65131, "epoch": 1550} {"train_loss": -6.017210006713867, "global_step": 65132, "epoch": 1550} {"train_loss": -5.655685901641846, "global_step": 65133, "epoch": 1550} {"train_loss": -5.954793453216553, "global_step": 65134, "epoch": 1550} {"train_loss": -5.78752326965332, "global_step": 65135, "epoch": 1550} {"train_loss": -5.795597076416016, "global_step": 65136, "epoch": 1550} {"train_loss": -5.8998918533325195, "global_step": 65137, "epoch": 1550} {"train_loss": -5.876008033752441, "global_step": 65138, "epoch": 1550} {"train_loss": -5.798880577087402, "global_step": 65139, "epoch": 1550} {"train_loss": -5.907265663146973, "global_step": 65140, "epoch": 1550} {"train_loss": -5.940390348434448, "global_step": 65141, "epoch": 1550, "train/sim_max_reward_0": 0.2070634740745631, "train/sim_max_reward_1": 0.7801795737162068, "train/sim_max_reward_2": 0.0851483056294674, "train/sim_max_reward_3": 0.07683413887993633, "train/sim_max_reward_4": 0.45484654560491494, "train/sim_max_reward_5": 0.5611454220268552, "test/sim_max_reward_4500000": 0.8052853070010538, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.6395540121417752, "test/sim_max_reward_4500003": 0.5888877378364107, "test/sim_max_reward_4500004": 0.11770716342563105, "test/sim_max_reward_4500005": 0.6647783723369501, "test/sim_max_reward_4500006": 0.9322354232851077, "test/sim_max_reward_4500007": 0.3498661173407864, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.3408900761557371, "test/sim_max_reward_4500010": 0.3691746356313472, "test/sim_max_reward_4500011": 0.38215867329254566, "test/sim_max_reward_4500012": 0.6964083661761274, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.9466226305136969, "test/sim_max_reward_4500015": 0.09412738627354411, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.00975969406308383, "test/sim_max_reward_4500018": 0.15961975156252436, "test/sim_max_reward_4500019": 0.7500142475189766, "test/sim_max_reward_4500020": 0.49509132428068, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.8818723732302065, "test/sim_max_reward_4500023": 0.9594811064908301, "test/sim_max_reward_4500024": 0.21112185477825832, "test/sim_max_reward_4500025": 0.0022414015982370993, "test/sim_max_reward_4500026": 0.11737204987101711, "test/sim_max_reward_4500027": 0.732899533819974, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.17404187184695433, "test/sim_max_reward_4500030": 0.9581702884957348, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05003817817516072, "test/sim_max_reward_4500033": 0.8281059038122757, "test/sim_max_reward_4500034": 0.44520547444854336, "test/sim_max_reward_4500035": 0.6078906115232096, "test/sim_max_reward_4500036": 0.7998009009544117, "test/sim_max_reward_4500037": 0.4184329089446811, "test/sim_max_reward_4500038": 0.30142989446636403, "test/sim_max_reward_4500039": 0.0, "test/sim_max_reward_4500040": 0.8987351207587704, "test/sim_max_reward_4500041": 0.6938504220841911, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.7606111205439647, "test/sim_max_reward_4500044": 0.3658611739399299, "test/sim_max_reward_4500045": 0.1201770164700382, "test/sim_max_reward_4500046": 0.7164361423238244, "test/sim_max_reward_4500047": 0.8504738541369907, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.3608695766553239, "test/mean_score": 0.42929182775001784, "val_loss": 74971.9921875} {"train_loss": -5.837063789367676, "global_step": 65142, "epoch": 1551} {"train_loss": -5.830439567565918, "global_step": 65143, "epoch": 1551} {"train_loss": -5.962156295776367, "global_step": 65144, "epoch": 1551} {"train_loss": -5.9151692390441895, "global_step": 65145, "epoch": 1551} {"train_loss": -5.720261573791504, "global_step": 65146, "epoch": 1551} {"train_loss": -6.038205146789551, "global_step": 65147, "epoch": 1551} {"train_loss": -5.881076812744141, "global_step": 65148, "epoch": 1551} {"train_loss": -5.934170722961426, "global_step": 65149, "epoch": 1551} {"train_loss": -5.962320327758789, "global_step": 65150, "epoch": 1551} {"train_loss": -5.930628776550293, "global_step": 65151, "epoch": 1551} {"train_loss": -5.8660502433776855, "global_step": 65152, "epoch": 1551} {"train_loss": -6.02301549911499, "global_step": 65153, "epoch": 1551} {"train_loss": -6.024316787719727, "global_step": 65154, "epoch": 1551} {"train_loss": -5.885001182556152, "global_step": 65155, "epoch": 1551} {"train_loss": -5.889958381652832, "global_step": 65156, "epoch": 1551} {"train_loss": -5.86414909362793, "global_step": 65157, "epoch": 1551} {"train_loss": -5.888952255249023, "global_step": 65158, "epoch": 1551} {"train_loss": -5.948416709899902, "global_step": 65159, "epoch": 1551} {"train_loss": -5.875820159912109, "global_step": 65160, "epoch": 1551} {"train_loss": -5.943513870239258, "global_step": 65161, "epoch": 1551} {"train_loss": -5.8221025466918945, "global_step": 65162, "epoch": 1551} {"train_loss": -6.015595436096191, "global_step": 65163, "epoch": 1551} {"train_loss": -5.8384108543396, "global_step": 65164, "epoch": 1551} {"train_loss": -5.867345333099365, "global_step": 65165, "epoch": 1551} {"train_loss": -5.973238945007324, "global_step": 65166, "epoch": 1551} {"train_loss": -5.809637069702148, "global_step": 65167, "epoch": 1551} {"train_loss": -5.782634735107422, "global_step": 65168, "epoch": 1551} {"train_loss": -5.8742146492004395, "global_step": 65169, "epoch": 1551} {"train_loss": -5.786017417907715, "global_step": 65170, "epoch": 1551} {"train_loss": -6.0643720626831055, "global_step": 65171, "epoch": 1551} {"train_loss": -5.699592590332031, "global_step": 65172, "epoch": 1551} {"train_loss": -5.787839889526367, "global_step": 65173, "epoch": 1551} {"train_loss": -5.941330909729004, "global_step": 65174, "epoch": 1551} {"train_loss": -5.749883651733398, "global_step": 65175, "epoch": 1551} {"train_loss": -5.93501091003418, "global_step": 65176, "epoch": 1551} {"train_loss": -5.89483642578125, "global_step": 65177, "epoch": 1551} {"train_loss": -5.927935600280762, "global_step": 65178, "epoch": 1551} {"train_loss": -5.790433883666992, "global_step": 65179, "epoch": 1551} {"train_loss": -5.8839263916015625, "global_step": 65180, "epoch": 1551} {"train_loss": -5.808597087860107, "global_step": 65181, "epoch": 1551} {"train_loss": -5.933014869689941, "global_step": 65182, "epoch": 1551} {"train_loss": -5.8886454332442515, "global_step": 65183, "epoch": 1551, "val_loss": 74752.890625} {"train_loss": -5.8547868728637695, "global_step": 65184, "epoch": 1552} {"train_loss": -5.847061634063721, "global_step": 65185, "epoch": 1552} {"train_loss": -5.8575639724731445, "global_step": 65186, "epoch": 1552} {"train_loss": -6.065996170043945, "global_step": 65187, "epoch": 1552} {"train_loss": -5.849719047546387, "global_step": 65188, "epoch": 1552} {"train_loss": -6.007716178894043, "global_step": 65189, "epoch": 1552} {"train_loss": -6.054749488830566, "global_step": 65190, "epoch": 1552} {"train_loss": -5.920950412750244, "global_step": 65191, "epoch": 1552} {"train_loss": -5.940798759460449, "global_step": 65192, "epoch": 1552} {"train_loss": -5.911345958709717, "global_step": 65193, "epoch": 1552} {"train_loss": -5.996951103210449, "global_step": 65194, "epoch": 1552} {"train_loss": -5.998470783233643, "global_step": 65195, "epoch": 1552} {"train_loss": -5.91765832901001, "global_step": 65196, "epoch": 1552} {"train_loss": -5.9226226806640625, "global_step": 65197, "epoch": 1552} {"train_loss": -5.836991786956787, "global_step": 65198, "epoch": 1552} {"train_loss": -6.006441116333008, "global_step": 65199, "epoch": 1552} {"train_loss": -5.9747185707092285, "global_step": 65200, "epoch": 1552} {"train_loss": -5.932883262634277, "global_step": 65201, "epoch": 1552} {"train_loss": -5.959969997406006, "global_step": 65202, "epoch": 1552} {"train_loss": -5.8921403884887695, "global_step": 65203, "epoch": 1552} {"train_loss": -5.805709362030029, "global_step": 65204, "epoch": 1552} {"train_loss": -5.826447010040283, "global_step": 65205, "epoch": 1552} {"train_loss": -5.993497848510742, "global_step": 65206, "epoch": 1552} {"train_loss": -5.922943592071533, "global_step": 65207, "epoch": 1552} {"train_loss": -6.049812316894531, "global_step": 65208, "epoch": 1552} {"train_loss": -5.8632307052612305, "global_step": 65209, "epoch": 1552} {"train_loss": -5.916541576385498, "global_step": 65210, "epoch": 1552} {"train_loss": -5.922945022583008, "global_step": 65211, "epoch": 1552} {"train_loss": -6.059244155883789, "global_step": 65212, "epoch": 1552} {"train_loss": -5.9494218826293945, "global_step": 65213, "epoch": 1552} {"train_loss": -5.82190465927124, "global_step": 65214, "epoch": 1552} {"train_loss": -5.984298229217529, "global_step": 65215, "epoch": 1552} {"train_loss": -6.010344505310059, "global_step": 65216, "epoch": 1552} {"train_loss": -5.834959983825684, "global_step": 65217, "epoch": 1552} {"train_loss": -5.970668792724609, "global_step": 65218, "epoch": 1552} {"train_loss": -5.9895782470703125, "global_step": 65219, "epoch": 1552} {"train_loss": -6.072425842285156, "global_step": 65220, "epoch": 1552} {"train_loss": -6.027301788330078, "global_step": 65221, "epoch": 1552} {"train_loss": -5.911923408508301, "global_step": 65222, "epoch": 1552} {"train_loss": -5.985974311828613, "global_step": 65223, "epoch": 1552} {"train_loss": -6.149499893188477, "global_step": 65224, "epoch": 1552} {"train_loss": -5.948200623194377, "global_step": 65225, "epoch": 1552, "val_loss": 74674.421875} {"train_loss": -5.985969543457031, "global_step": 65226, "epoch": 1553} {"train_loss": -6.027959823608398, "global_step": 65227, "epoch": 1553} {"train_loss": -5.953183174133301, "global_step": 65228, "epoch": 1553} {"train_loss": -5.998056888580322, "global_step": 65229, "epoch": 1553} {"train_loss": -5.85646390914917, "global_step": 65230, "epoch": 1553} {"train_loss": -5.990779876708984, "global_step": 65231, "epoch": 1553} {"train_loss": -5.957596778869629, "global_step": 65232, "epoch": 1553} {"train_loss": -5.935763359069824, "global_step": 65233, "epoch": 1553} {"train_loss": -5.893834114074707, "global_step": 65234, "epoch": 1553} {"train_loss": -5.766202926635742, "global_step": 65235, "epoch": 1553} {"train_loss": -5.890193939208984, "global_step": 65236, "epoch": 1553} {"train_loss": -6.0413360595703125, "global_step": 65237, "epoch": 1553} {"train_loss": -5.828230381011963, "global_step": 65238, "epoch": 1553} {"train_loss": -5.858170509338379, "global_step": 65239, "epoch": 1553} {"train_loss": -5.882845401763916, "global_step": 65240, "epoch": 1553} {"train_loss": -5.9257330894470215, "global_step": 65241, "epoch": 1553} {"train_loss": -5.909685134887695, "global_step": 65242, "epoch": 1553} {"train_loss": -5.865617275238037, "global_step": 65243, "epoch": 1553} {"train_loss": -5.835650444030762, "global_step": 65244, "epoch": 1553} {"train_loss": -5.891472816467285, "global_step": 65245, "epoch": 1553} {"train_loss": -5.903563499450684, "global_step": 65246, "epoch": 1553} {"train_loss": -5.928377628326416, "global_step": 65247, "epoch": 1553} {"train_loss": -5.835973739624023, "global_step": 65248, "epoch": 1553} {"train_loss": -5.916012763977051, "global_step": 65249, "epoch": 1553} {"train_loss": -5.95412540435791, "global_step": 65250, "epoch": 1553} {"train_loss": -5.95978307723999, "global_step": 65251, "epoch": 1553} {"train_loss": -5.942709922790527, "global_step": 65252, "epoch": 1553} {"train_loss": -5.882288455963135, "global_step": 65253, "epoch": 1553} {"train_loss": -5.9791717529296875, "global_step": 65254, "epoch": 1553} {"train_loss": -5.858378887176514, "global_step": 65255, "epoch": 1553} {"train_loss": -5.942906379699707, "global_step": 65256, "epoch": 1553} {"train_loss": -5.956836700439453, "global_step": 65257, "epoch": 1553} {"train_loss": -5.824785232543945, "global_step": 65258, "epoch": 1553} {"train_loss": -5.880274772644043, "global_step": 65259, "epoch": 1553} {"train_loss": -5.8365478515625, "global_step": 65260, "epoch": 1553} {"train_loss": -5.880390167236328, "global_step": 65261, "epoch": 1553} {"train_loss": -5.993081092834473, "global_step": 65262, "epoch": 1553} {"train_loss": -6.014524459838867, "global_step": 65263, "epoch": 1553} {"train_loss": -5.9369659423828125, "global_step": 65264, "epoch": 1553} {"train_loss": -6.000833511352539, "global_step": 65265, "epoch": 1553} {"train_loss": -6.007028579711914, "global_step": 65266, "epoch": 1553} {"train_loss": -5.92121300243196, "global_step": 65267, "epoch": 1553, "val_loss": 74762.5703125} {"train_loss": -6.007129669189453, "global_step": 65268, "epoch": 1554} {"train_loss": -5.987762451171875, "global_step": 65269, "epoch": 1554} {"train_loss": -5.86061429977417, "global_step": 65270, "epoch": 1554} {"train_loss": -5.865971565246582, "global_step": 65271, "epoch": 1554} {"train_loss": -5.9399213790893555, "global_step": 65272, "epoch": 1554} {"train_loss": -5.993738174438477, "global_step": 65273, "epoch": 1554} {"train_loss": -5.898394584655762, "global_step": 65274, "epoch": 1554} {"train_loss": -5.963339805603027, "global_step": 65275, "epoch": 1554} {"train_loss": -6.023612976074219, "global_step": 65276, "epoch": 1554} {"train_loss": -6.033154487609863, "global_step": 65277, "epoch": 1554} {"train_loss": -5.837324142456055, "global_step": 65278, "epoch": 1554} {"train_loss": -5.935764312744141, "global_step": 65279, "epoch": 1554} {"train_loss": -6.066776275634766, "global_step": 65280, "epoch": 1554} {"train_loss": -5.987462997436523, "global_step": 65281, "epoch": 1554} {"train_loss": -6.076993942260742, "global_step": 65282, "epoch": 1554} {"train_loss": -6.043650150299072, "global_step": 65283, "epoch": 1554} {"train_loss": -5.883854866027832, "global_step": 65284, "epoch": 1554} {"train_loss": -5.98148250579834, "global_step": 65285, "epoch": 1554} {"train_loss": -5.946043014526367, "global_step": 65286, "epoch": 1554} {"train_loss": -5.890719890594482, "global_step": 65287, "epoch": 1554} {"train_loss": -6.029137134552002, "global_step": 65288, "epoch": 1554} {"train_loss": -6.126632213592529, "global_step": 65289, "epoch": 1554} {"train_loss": -5.835583209991455, "global_step": 65290, "epoch": 1554} {"train_loss": -5.921552658081055, "global_step": 65291, "epoch": 1554} {"train_loss": -5.998007774353027, "global_step": 65292, "epoch": 1554} {"train_loss": -5.820777893066406, "global_step": 65293, "epoch": 1554} {"train_loss": -5.960916519165039, "global_step": 65294, "epoch": 1554} {"train_loss": -5.771886825561523, "global_step": 65295, "epoch": 1554} {"train_loss": -5.967141151428223, "global_step": 65296, "epoch": 1554} {"train_loss": -5.995524883270264, "global_step": 65297, "epoch": 1554} {"train_loss": -5.923812389373779, "global_step": 65298, "epoch": 1554} {"train_loss": -6.071703910827637, "global_step": 65299, "epoch": 1554} {"train_loss": -6.016194820404053, "global_step": 65300, "epoch": 1554} {"train_loss": -5.860637187957764, "global_step": 65301, "epoch": 1554} {"train_loss": -5.999929428100586, "global_step": 65302, "epoch": 1554} {"train_loss": -5.869303226470947, "global_step": 65303, "epoch": 1554} {"train_loss": -5.9484052658081055, "global_step": 65304, "epoch": 1554} {"train_loss": -5.868157386779785, "global_step": 65305, "epoch": 1554} {"train_loss": -5.981325149536133, "global_step": 65306, "epoch": 1554} {"train_loss": -5.961698532104492, "global_step": 65307, "epoch": 1554} {"train_loss": -5.879256248474121, "global_step": 65308, "epoch": 1554} {"train_loss": -5.951446964627221, "global_step": 65309, "epoch": 1554, "val_loss": 74730.15625} {"train_loss": -5.854671001434326, "global_step": 65310, "epoch": 1555} {"train_loss": -5.963475227355957, "global_step": 65311, "epoch": 1555} {"train_loss": -5.775884628295898, "global_step": 65312, "epoch": 1555} {"train_loss": -5.879096031188965, "global_step": 65313, "epoch": 1555} {"train_loss": -5.985968112945557, "global_step": 65314, "epoch": 1555} {"train_loss": -6.023166179656982, "global_step": 65315, "epoch": 1555} {"train_loss": -5.995391845703125, "global_step": 65316, "epoch": 1555} {"train_loss": -6.018847465515137, "global_step": 65317, "epoch": 1555} {"train_loss": -5.932794570922852, "global_step": 65318, "epoch": 1555} {"train_loss": -5.937615871429443, "global_step": 65319, "epoch": 1555} {"train_loss": -5.90505313873291, "global_step": 65320, "epoch": 1555} {"train_loss": -5.946511268615723, "global_step": 65321, "epoch": 1555} {"train_loss": -5.85807466506958, "global_step": 65322, "epoch": 1555} {"train_loss": -5.9456048011779785, "global_step": 65323, "epoch": 1555} {"train_loss": -6.007589340209961, "global_step": 65324, "epoch": 1555} {"train_loss": -5.9502410888671875, "global_step": 65325, "epoch": 1555} {"train_loss": -5.867769718170166, "global_step": 65326, "epoch": 1555} {"train_loss": -5.973920822143555, "global_step": 65327, "epoch": 1555} {"train_loss": -5.9358673095703125, "global_step": 65328, "epoch": 1555} {"train_loss": -5.9760260581970215, "global_step": 65329, "epoch": 1555} {"train_loss": -6.030614376068115, "global_step": 65330, "epoch": 1555} {"train_loss": -5.9542012214660645, "global_step": 65331, "epoch": 1555} {"train_loss": -5.963781356811523, "global_step": 65332, "epoch": 1555} {"train_loss": -6.115464687347412, "global_step": 65333, "epoch": 1555} {"train_loss": -6.1165313720703125, "global_step": 65334, "epoch": 1555} {"train_loss": -5.989524841308594, "global_step": 65335, "epoch": 1555} {"train_loss": -6.048096179962158, "global_step": 65336, "epoch": 1555} {"train_loss": -5.996779441833496, "global_step": 65337, "epoch": 1555} {"train_loss": -5.994014263153076, "global_step": 65338, "epoch": 1555} {"train_loss": -5.995648384094238, "global_step": 65339, "epoch": 1555} {"train_loss": -5.984641075134277, "global_step": 65340, "epoch": 1555} {"train_loss": -5.965153694152832, "global_step": 65341, "epoch": 1555} {"train_loss": -5.965319633483887, "global_step": 65342, "epoch": 1555} {"train_loss": -6.002190113067627, "global_step": 65343, "epoch": 1555} {"train_loss": -6.028921604156494, "global_step": 65344, "epoch": 1555} {"train_loss": -5.963010787963867, "global_step": 65345, "epoch": 1555} {"train_loss": -5.929304122924805, "global_step": 65346, "epoch": 1555} {"train_loss": -5.898344993591309, "global_step": 65347, "epoch": 1555} {"train_loss": -5.956072807312012, "global_step": 65348, "epoch": 1555} {"train_loss": -5.992059230804443, "global_step": 65349, "epoch": 1555} {"train_loss": -5.9700846672058105, "global_step": 65350, "epoch": 1555} {"train_loss": -5.964918182009742, "global_step": 65351, "epoch": 1555, "val_loss": 74931.234375} {"train_loss": -5.934469223022461, "global_step": 65352, "epoch": 1556} {"train_loss": -6.069973945617676, "global_step": 65353, "epoch": 1556} {"train_loss": -6.047346115112305, "global_step": 65354, "epoch": 1556} {"train_loss": -6.041803359985352, "global_step": 65355, "epoch": 1556} {"train_loss": -5.888004779815674, "global_step": 65356, "epoch": 1556} {"train_loss": -5.973127365112305, "global_step": 65357, "epoch": 1556} {"train_loss": -6.016646385192871, "global_step": 65358, "epoch": 1556} {"train_loss": -5.957542419433594, "global_step": 65359, "epoch": 1556} {"train_loss": -5.995523929595947, "global_step": 65360, "epoch": 1556} {"train_loss": -5.905601501464844, "global_step": 65361, "epoch": 1556} {"train_loss": -5.9744462966918945, "global_step": 65362, "epoch": 1556} {"train_loss": -6.004158020019531, "global_step": 65363, "epoch": 1556} {"train_loss": -6.081147193908691, "global_step": 65364, "epoch": 1556} {"train_loss": -5.900012969970703, "global_step": 65365, "epoch": 1556} {"train_loss": -5.924934387207031, "global_step": 65366, "epoch": 1556} {"train_loss": -6.018504619598389, "global_step": 65367, "epoch": 1556} {"train_loss": -6.056329727172852, "global_step": 65368, "epoch": 1556} {"train_loss": -5.879999160766602, "global_step": 65369, "epoch": 1556} {"train_loss": -5.973080635070801, "global_step": 65370, "epoch": 1556} {"train_loss": -5.997464179992676, "global_step": 65371, "epoch": 1556} {"train_loss": -5.975342273712158, "global_step": 65372, "epoch": 1556} {"train_loss": -5.874996185302734, "global_step": 65373, "epoch": 1556} {"train_loss": -5.926913261413574, "global_step": 65374, "epoch": 1556} {"train_loss": -5.996342658996582, "global_step": 65375, "epoch": 1556} {"train_loss": -6.001948356628418, "global_step": 65376, "epoch": 1556} {"train_loss": -5.969844341278076, "global_step": 65377, "epoch": 1556} {"train_loss": -5.978726387023926, "global_step": 65378, "epoch": 1556} {"train_loss": -6.025259494781494, "global_step": 65379, "epoch": 1556} {"train_loss": -5.930026054382324, "global_step": 65380, "epoch": 1556} {"train_loss": -5.972402572631836, "global_step": 65381, "epoch": 1556} {"train_loss": -6.072195053100586, "global_step": 65382, "epoch": 1556} {"train_loss": -5.92302131652832, "global_step": 65383, "epoch": 1556} {"train_loss": -5.988433837890625, "global_step": 65384, "epoch": 1556} {"train_loss": -5.991990089416504, "global_step": 65385, "epoch": 1556} {"train_loss": -5.9179534912109375, "global_step": 65386, "epoch": 1556} {"train_loss": -5.898355007171631, "global_step": 65387, "epoch": 1556} {"train_loss": -5.845410346984863, "global_step": 65388, "epoch": 1556} {"train_loss": -6.024776458740234, "global_step": 65389, "epoch": 1556} {"train_loss": -5.874947547912598, "global_step": 65390, "epoch": 1556} {"train_loss": -6.0074262619018555, "global_step": 65391, "epoch": 1556} {"train_loss": -5.762817859649658, "global_step": 65392, "epoch": 1556} {"train_loss": -5.963179940269107, "global_step": 65393, "epoch": 1556, "val_loss": 74498.8046875} {"train_loss": -6.019819259643555, "global_step": 65394, "epoch": 1557} {"train_loss": -6.042873382568359, "global_step": 65395, "epoch": 1557} {"train_loss": -5.995547294616699, "global_step": 65396, "epoch": 1557} {"train_loss": -5.966287612915039, "global_step": 65397, "epoch": 1557} {"train_loss": -6.0662126541137695, "global_step": 65398, "epoch": 1557} {"train_loss": -5.944203853607178, "global_step": 65399, "epoch": 1557} {"train_loss": -5.916891098022461, "global_step": 65400, "epoch": 1557} {"train_loss": -5.9816741943359375, "global_step": 65401, "epoch": 1557} {"train_loss": -6.00490140914917, "global_step": 65402, "epoch": 1557} {"train_loss": -5.905094146728516, "global_step": 65403, "epoch": 1557} {"train_loss": -5.841031551361084, "global_step": 65404, "epoch": 1557} {"train_loss": -5.932490348815918, "global_step": 65405, "epoch": 1557} {"train_loss": -5.994849681854248, "global_step": 65406, "epoch": 1557} {"train_loss": -5.913517951965332, "global_step": 65407, "epoch": 1557} {"train_loss": -6.028814315795898, "global_step": 65408, "epoch": 1557} {"train_loss": -6.011914253234863, "global_step": 65409, "epoch": 1557} {"train_loss": -5.966948509216309, "global_step": 65410, "epoch": 1557} {"train_loss": -5.905619144439697, "global_step": 65411, "epoch": 1557} {"train_loss": -5.9781599044799805, "global_step": 65412, "epoch": 1557} {"train_loss": -6.05142879486084, "global_step": 65413, "epoch": 1557} {"train_loss": -5.936379909515381, "global_step": 65414, "epoch": 1557} {"train_loss": -5.965665340423584, "global_step": 65415, "epoch": 1557} {"train_loss": -5.973685264587402, "global_step": 65416, "epoch": 1557} {"train_loss": -5.927687168121338, "global_step": 65417, "epoch": 1557} {"train_loss": -5.970440864562988, "global_step": 65418, "epoch": 1557} {"train_loss": -5.855480194091797, "global_step": 65419, "epoch": 1557} {"train_loss": -5.905797481536865, "global_step": 65420, "epoch": 1557} {"train_loss": -5.896245956420898, "global_step": 65421, "epoch": 1557} {"train_loss": -5.947390556335449, "global_step": 65422, "epoch": 1557} {"train_loss": -5.899682998657227, "global_step": 65423, "epoch": 1557} {"train_loss": -6.0178985595703125, "global_step": 65424, "epoch": 1557} {"train_loss": -5.962436676025391, "global_step": 65425, "epoch": 1557} {"train_loss": -5.791088104248047, "global_step": 65426, "epoch": 1557} {"train_loss": -5.987931251525879, "global_step": 65427, "epoch": 1557} {"train_loss": -5.861893653869629, "global_step": 65428, "epoch": 1557} {"train_loss": -5.953647613525391, "global_step": 65429, "epoch": 1557} {"train_loss": -5.855380058288574, "global_step": 65430, "epoch": 1557} {"train_loss": -5.917710781097412, "global_step": 65431, "epoch": 1557} {"train_loss": -6.035745143890381, "global_step": 65432, "epoch": 1557} {"train_loss": -5.873178005218506, "global_step": 65433, "epoch": 1557} {"train_loss": -6.027767181396484, "global_step": 65434, "epoch": 1557} {"train_loss": -5.948790482112339, "global_step": 65435, "epoch": 1557, "val_loss": 74709.09375} {"train_loss": -5.914588928222656, "global_step": 65436, "epoch": 1558} {"train_loss": -6.106814384460449, "global_step": 65437, "epoch": 1558} {"train_loss": -5.777884483337402, "global_step": 65438, "epoch": 1558} {"train_loss": -5.867382526397705, "global_step": 65439, "epoch": 1558} {"train_loss": -5.8054399490356445, "global_step": 65440, "epoch": 1558} {"train_loss": -6.0831804275512695, "global_step": 65441, "epoch": 1558} {"train_loss": -5.9495086669921875, "global_step": 65442, "epoch": 1558} {"train_loss": -5.933565139770508, "global_step": 65443, "epoch": 1558} {"train_loss": -5.919546127319336, "global_step": 65444, "epoch": 1558} {"train_loss": -5.878540515899658, "global_step": 65445, "epoch": 1558} {"train_loss": -5.910396099090576, "global_step": 65446, "epoch": 1558} {"train_loss": -5.8367462158203125, "global_step": 65447, "epoch": 1558} {"train_loss": -5.903876304626465, "global_step": 65448, "epoch": 1558} {"train_loss": -6.01200532913208, "global_step": 65449, "epoch": 1558} {"train_loss": -5.946408271789551, "global_step": 65450, "epoch": 1558} {"train_loss": -5.962616443634033, "global_step": 65451, "epoch": 1558} {"train_loss": -5.980284690856934, "global_step": 65452, "epoch": 1558} {"train_loss": -5.934713840484619, "global_step": 65453, "epoch": 1558} {"train_loss": -5.932415008544922, "global_step": 65454, "epoch": 1558} {"train_loss": -6.083531379699707, "global_step": 65455, "epoch": 1558} {"train_loss": -5.957690238952637, "global_step": 65456, "epoch": 1558} {"train_loss": -5.926297187805176, "global_step": 65457, "epoch": 1558} {"train_loss": -6.018075942993164, "global_step": 65458, "epoch": 1558} {"train_loss": -6.057350158691406, "global_step": 65459, "epoch": 1558} {"train_loss": -5.828082084655762, "global_step": 65460, "epoch": 1558} {"train_loss": -6.047255039215088, "global_step": 65461, "epoch": 1558} {"train_loss": -5.9962544441223145, "global_step": 65462, "epoch": 1558} {"train_loss": -5.966293811798096, "global_step": 65463, "epoch": 1558} {"train_loss": -5.9257612228393555, "global_step": 65464, "epoch": 1558} {"train_loss": -5.946608543395996, "global_step": 65465, "epoch": 1558} {"train_loss": -6.082529067993164, "global_step": 65466, "epoch": 1558} {"train_loss": -6.022894382476807, "global_step": 65467, "epoch": 1558} {"train_loss": -5.897417068481445, "global_step": 65468, "epoch": 1558} {"train_loss": -6.020757675170898, "global_step": 65469, "epoch": 1558} {"train_loss": -6.023929595947266, "global_step": 65470, "epoch": 1558} {"train_loss": -5.997056007385254, "global_step": 65471, "epoch": 1558} {"train_loss": -6.009134292602539, "global_step": 65472, "epoch": 1558} {"train_loss": -5.9278106689453125, "global_step": 65473, "epoch": 1558} {"train_loss": -6.091001033782959, "global_step": 65474, "epoch": 1558} {"train_loss": -5.972285270690918, "global_step": 65475, "epoch": 1558} {"train_loss": -5.932882308959961, "global_step": 65476, "epoch": 1558} {"train_loss": -5.961918694632394, "global_step": 65477, "epoch": 1558, "val_loss": 74374.0390625} {"train_loss": -6.053244590759277, "global_step": 65478, "epoch": 1559} {"train_loss": -5.951968669891357, "global_step": 65479, "epoch": 1559} {"train_loss": -6.056583404541016, "global_step": 65480, "epoch": 1559} {"train_loss": -6.082954406738281, "global_step": 65481, "epoch": 1559} {"train_loss": -5.919582366943359, "global_step": 65482, "epoch": 1559} {"train_loss": -6.020551681518555, "global_step": 65483, "epoch": 1559} {"train_loss": -6.022189140319824, "global_step": 65484, "epoch": 1559} {"train_loss": -6.020509719848633, "global_step": 65485, "epoch": 1559} {"train_loss": -6.019135475158691, "global_step": 65486, "epoch": 1559} {"train_loss": -5.957917213439941, "global_step": 65487, "epoch": 1559} {"train_loss": -6.068080425262451, "global_step": 65488, "epoch": 1559} {"train_loss": -5.866407871246338, "global_step": 65489, "epoch": 1559} {"train_loss": -5.904201507568359, "global_step": 65490, "epoch": 1559} {"train_loss": -5.889192581176758, "global_step": 65491, "epoch": 1559} {"train_loss": -6.083063125610352, "global_step": 65492, "epoch": 1559} {"train_loss": -6.013426780700684, "global_step": 65493, "epoch": 1559} {"train_loss": -5.939006328582764, "global_step": 65494, "epoch": 1559} {"train_loss": -5.92446231842041, "global_step": 65495, "epoch": 1559} {"train_loss": -5.96425199508667, "global_step": 65496, "epoch": 1559} {"train_loss": -5.993203163146973, "global_step": 65497, "epoch": 1559} {"train_loss": -5.951233386993408, "global_step": 65498, "epoch": 1559} {"train_loss": -5.849794864654541, "global_step": 65499, "epoch": 1559} {"train_loss": -5.974957466125488, "global_step": 65500, "epoch": 1559} {"train_loss": -5.935006141662598, "global_step": 65501, "epoch": 1559} {"train_loss": -5.890591621398926, "global_step": 65502, "epoch": 1559} {"train_loss": -5.90028715133667, "global_step": 65503, "epoch": 1559} {"train_loss": -6.041785717010498, "global_step": 65504, "epoch": 1559} {"train_loss": -5.960241794586182, "global_step": 65505, "epoch": 1559} {"train_loss": -5.799240589141846, "global_step": 65506, "epoch": 1559} {"train_loss": -5.960941791534424, "global_step": 65507, "epoch": 1559} {"train_loss": -5.895331859588623, "global_step": 65508, "epoch": 1559} {"train_loss": -5.868252277374268, "global_step": 65509, "epoch": 1559} {"train_loss": -5.882201194763184, "global_step": 65510, "epoch": 1559} {"train_loss": -5.877289772033691, "global_step": 65511, "epoch": 1559} {"train_loss": -5.958731651306152, "global_step": 65512, "epoch": 1559} {"train_loss": -6.02789306640625, "global_step": 65513, "epoch": 1559} {"train_loss": -5.9138946533203125, "global_step": 65514, "epoch": 1559} {"train_loss": -6.018423080444336, "global_step": 65515, "epoch": 1559} {"train_loss": -5.897256851196289, "global_step": 65516, "epoch": 1559} {"train_loss": -5.999804973602295, "global_step": 65517, "epoch": 1559} {"train_loss": -5.838301658630371, "global_step": 65518, "epoch": 1559} {"train_loss": -5.9586106936136884, "global_step": 65519, "epoch": 1559, "val_loss": 74324.9609375} {"train_loss": -5.926994323730469, "global_step": 65520, "epoch": 1560} {"train_loss": -6.0178608894348145, "global_step": 65521, "epoch": 1560} {"train_loss": -6.105419158935547, "global_step": 65522, "epoch": 1560} {"train_loss": -5.982211589813232, "global_step": 65523, "epoch": 1560} {"train_loss": -6.085577964782715, "global_step": 65524, "epoch": 1560} {"train_loss": -5.919235706329346, "global_step": 65525, "epoch": 1560} {"train_loss": -6.028356552124023, "global_step": 65526, "epoch": 1560} {"train_loss": -5.913209915161133, "global_step": 65527, "epoch": 1560} {"train_loss": -6.025027275085449, "global_step": 65528, "epoch": 1560} {"train_loss": -5.946950912475586, "global_step": 65529, "epoch": 1560} {"train_loss": -5.936885833740234, "global_step": 65530, "epoch": 1560} {"train_loss": -6.014000415802002, "global_step": 65531, "epoch": 1560} {"train_loss": -5.966506481170654, "global_step": 65532, "epoch": 1560} {"train_loss": -5.928442478179932, "global_step": 65533, "epoch": 1560} {"train_loss": -5.958320617675781, "global_step": 65534, "epoch": 1560} {"train_loss": -5.838263988494873, "global_step": 65535, "epoch": 1560} {"train_loss": -5.9400315284729, "global_step": 65536, "epoch": 1560} {"train_loss": -5.861790657043457, "global_step": 65537, "epoch": 1560} {"train_loss": -5.965679168701172, "global_step": 65538, "epoch": 1560} {"train_loss": -5.9395294189453125, "global_step": 65539, "epoch": 1560} {"train_loss": -5.892607688903809, "global_step": 65540, "epoch": 1560} {"train_loss": -6.066577911376953, "global_step": 65541, "epoch": 1560} {"train_loss": -6.044175148010254, "global_step": 65542, "epoch": 1560} {"train_loss": -5.971545219421387, "global_step": 65543, "epoch": 1560} {"train_loss": -6.020981311798096, "global_step": 65544, "epoch": 1560} {"train_loss": -5.941497802734375, "global_step": 65545, "epoch": 1560} {"train_loss": -5.945132255554199, "global_step": 65546, "epoch": 1560} {"train_loss": -5.946084976196289, "global_step": 65547, "epoch": 1560} {"train_loss": -5.9735870361328125, "global_step": 65548, "epoch": 1560} {"train_loss": -6.017203330993652, "global_step": 65549, "epoch": 1560} {"train_loss": -5.90471076965332, "global_step": 65550, "epoch": 1560} {"train_loss": -5.813395023345947, "global_step": 65551, "epoch": 1560} {"train_loss": -5.880736351013184, "global_step": 65552, "epoch": 1560} {"train_loss": -5.786383152008057, "global_step": 65553, "epoch": 1560} {"train_loss": -5.977371692657471, "global_step": 65554, "epoch": 1560} {"train_loss": -5.743718147277832, "global_step": 65555, "epoch": 1560} {"train_loss": -5.90363883972168, "global_step": 65556, "epoch": 1560} {"train_loss": -5.797206878662109, "global_step": 65557, "epoch": 1560} {"train_loss": -5.918194770812988, "global_step": 65558, "epoch": 1560} {"train_loss": -5.934445381164551, "global_step": 65559, "epoch": 1560} {"train_loss": -5.927069664001465, "global_step": 65560, "epoch": 1560} {"train_loss": -5.942969208671933, "global_step": 65561, "epoch": 1560, "val_loss": 74904.1875} {"train_loss": -5.920183181762695, "global_step": 65562, "epoch": 1561} {"train_loss": -5.922048568725586, "global_step": 65563, "epoch": 1561} {"train_loss": -5.826563835144043, "global_step": 65564, "epoch": 1561} {"train_loss": -5.920526504516602, "global_step": 65565, "epoch": 1561} {"train_loss": -5.873268127441406, "global_step": 65566, "epoch": 1561} {"train_loss": -5.941298961639404, "global_step": 65567, "epoch": 1561} {"train_loss": -5.965534210205078, "global_step": 65568, "epoch": 1561} {"train_loss": -5.940972328186035, "global_step": 65569, "epoch": 1561} {"train_loss": -5.981589317321777, "global_step": 65570, "epoch": 1561} {"train_loss": -5.990449905395508, "global_step": 65571, "epoch": 1561} {"train_loss": -5.963421821594238, "global_step": 65572, "epoch": 1561} {"train_loss": -5.969688415527344, "global_step": 65573, "epoch": 1561} {"train_loss": -5.8763957023620605, "global_step": 65574, "epoch": 1561} {"train_loss": -6.03464412689209, "global_step": 65575, "epoch": 1561} {"train_loss": -5.991048812866211, "global_step": 65576, "epoch": 1561} {"train_loss": -6.061300277709961, "global_step": 65577, "epoch": 1561} {"train_loss": -6.020097732543945, "global_step": 65578, "epoch": 1561} {"train_loss": -5.972191333770752, "global_step": 65579, "epoch": 1561} {"train_loss": -5.977017879486084, "global_step": 65580, "epoch": 1561} {"train_loss": -6.010069847106934, "global_step": 65581, "epoch": 1561} {"train_loss": -6.029445171356201, "global_step": 65582, "epoch": 1561} {"train_loss": -6.0218729972839355, "global_step": 65583, "epoch": 1561} {"train_loss": -5.864424705505371, "global_step": 65584, "epoch": 1561} {"train_loss": -5.849830627441406, "global_step": 65585, "epoch": 1561} {"train_loss": -6.016593933105469, "global_step": 65586, "epoch": 1561} {"train_loss": -6.0956926345825195, "global_step": 65587, "epoch": 1561} {"train_loss": -5.921145915985107, "global_step": 65588, "epoch": 1561} {"train_loss": -5.926212787628174, "global_step": 65589, "epoch": 1561} {"train_loss": -5.993610382080078, "global_step": 65590, "epoch": 1561} {"train_loss": -5.831205368041992, "global_step": 65591, "epoch": 1561} {"train_loss": -6.072573661804199, "global_step": 65592, "epoch": 1561} {"train_loss": -5.85906982421875, "global_step": 65593, "epoch": 1561} {"train_loss": -5.96912145614624, "global_step": 65594, "epoch": 1561} {"train_loss": -5.842421531677246, "global_step": 65595, "epoch": 1561} {"train_loss": -5.9646430015563965, "global_step": 65596, "epoch": 1561} {"train_loss": -5.87601375579834, "global_step": 65597, "epoch": 1561} {"train_loss": -5.925048828125, "global_step": 65598, "epoch": 1561} {"train_loss": -6.0361433029174805, "global_step": 65599, "epoch": 1561} {"train_loss": -5.896997451782227, "global_step": 65600, "epoch": 1561} {"train_loss": -5.957134246826172, "global_step": 65601, "epoch": 1561} {"train_loss": -5.9675798416137695, "global_step": 65602, "epoch": 1561} {"train_loss": -5.953227247510638, "global_step": 65603, "epoch": 1561, "val_loss": 74862.1953125} {"train_loss": -5.936164855957031, "global_step": 65604, "epoch": 1562} {"train_loss": -6.03558349609375, "global_step": 65605, "epoch": 1562} {"train_loss": -5.951264381408691, "global_step": 65606, "epoch": 1562} {"train_loss": -5.920351505279541, "global_step": 65607, "epoch": 1562} {"train_loss": -5.980596542358398, "global_step": 65608, "epoch": 1562} {"train_loss": -6.005354404449463, "global_step": 65609, "epoch": 1562} {"train_loss": -5.866286277770996, "global_step": 65610, "epoch": 1562} {"train_loss": -6.013696670532227, "global_step": 65611, "epoch": 1562} {"train_loss": -6.061058044433594, "global_step": 65612, "epoch": 1562} {"train_loss": -5.985097408294678, "global_step": 65613, "epoch": 1562} {"train_loss": -5.8875346183776855, "global_step": 65614, "epoch": 1562} {"train_loss": -5.924851417541504, "global_step": 65615, "epoch": 1562} {"train_loss": -5.991172790527344, "global_step": 65616, "epoch": 1562} {"train_loss": -5.829441070556641, "global_step": 65617, "epoch": 1562} {"train_loss": -5.929278373718262, "global_step": 65618, "epoch": 1562} {"train_loss": -5.956151008605957, "global_step": 65619, "epoch": 1562} {"train_loss": -6.007998466491699, "global_step": 65620, "epoch": 1562} {"train_loss": -5.98100471496582, "global_step": 65621, "epoch": 1562} {"train_loss": -5.8187055587768555, "global_step": 65622, "epoch": 1562} {"train_loss": -5.969632148742676, "global_step": 65623, "epoch": 1562} {"train_loss": -5.871360778808594, "global_step": 65624, "epoch": 1562} {"train_loss": -5.895589351654053, "global_step": 65625, "epoch": 1562} {"train_loss": -6.0779571533203125, "global_step": 65626, "epoch": 1562} {"train_loss": -5.899362564086914, "global_step": 65627, "epoch": 1562} {"train_loss": -5.958483695983887, "global_step": 65628, "epoch": 1562} {"train_loss": -5.922943115234375, "global_step": 65629, "epoch": 1562} {"train_loss": -5.940404415130615, "global_step": 65630, "epoch": 1562} {"train_loss": -5.988345146179199, "global_step": 65631, "epoch": 1562} {"train_loss": -5.944659233093262, "global_step": 65632, "epoch": 1562} {"train_loss": -5.921402454376221, "global_step": 65633, "epoch": 1562} {"train_loss": -5.9726762771606445, "global_step": 65634, "epoch": 1562} {"train_loss": -5.919285774230957, "global_step": 65635, "epoch": 1562} {"train_loss": -5.953386306762695, "global_step": 65636, "epoch": 1562} {"train_loss": -5.776379585266113, "global_step": 65637, "epoch": 1562} {"train_loss": -6.001994609832764, "global_step": 65638, "epoch": 1562} {"train_loss": -5.990757465362549, "global_step": 65639, "epoch": 1562} {"train_loss": -5.894532203674316, "global_step": 65640, "epoch": 1562} {"train_loss": -5.979471206665039, "global_step": 65641, "epoch": 1562} {"train_loss": -5.984189987182617, "global_step": 65642, "epoch": 1562} {"train_loss": -6.009759426116943, "global_step": 65643, "epoch": 1562} {"train_loss": -5.9585065841674805, "global_step": 65644, "epoch": 1562} {"train_loss": -5.948195639110747, "global_step": 65645, "epoch": 1562, "val_loss": 74511.03125} {"train_loss": -6.139233112335205, "global_step": 65646, "epoch": 1563} {"train_loss": -6.0079345703125, "global_step": 65647, "epoch": 1563} {"train_loss": -5.9410200119018555, "global_step": 65648, "epoch": 1563} {"train_loss": -6.005086898803711, "global_step": 65649, "epoch": 1563} {"train_loss": -5.927421569824219, "global_step": 65650, "epoch": 1563} {"train_loss": -5.977614402770996, "global_step": 65651, "epoch": 1563} {"train_loss": -6.027661323547363, "global_step": 65652, "epoch": 1563} {"train_loss": -5.905324935913086, "global_step": 65653, "epoch": 1563} {"train_loss": -5.929533958435059, "global_step": 65654, "epoch": 1563} {"train_loss": -5.906979560852051, "global_step": 65655, "epoch": 1563} {"train_loss": -5.838261127471924, "global_step": 65656, "epoch": 1563} {"train_loss": -5.958884239196777, "global_step": 65657, "epoch": 1563} {"train_loss": -5.877889633178711, "global_step": 65658, "epoch": 1563} {"train_loss": -5.955721378326416, "global_step": 65659, "epoch": 1563} {"train_loss": -5.931066989898682, "global_step": 65660, "epoch": 1563} {"train_loss": -5.900391578674316, "global_step": 65661, "epoch": 1563} {"train_loss": -5.9419331550598145, "global_step": 65662, "epoch": 1563} {"train_loss": -6.01218318939209, "global_step": 65663, "epoch": 1563} {"train_loss": -6.00481653213501, "global_step": 65664, "epoch": 1563} {"train_loss": -5.895787239074707, "global_step": 65665, "epoch": 1563} {"train_loss": -5.879778861999512, "global_step": 65666, "epoch": 1563} {"train_loss": -5.905138969421387, "global_step": 65667, "epoch": 1563} {"train_loss": -5.918458461761475, "global_step": 65668, "epoch": 1563} {"train_loss": -5.917679309844971, "global_step": 65669, "epoch": 1563} {"train_loss": -5.885863304138184, "global_step": 65670, "epoch": 1563} {"train_loss": -5.982999801635742, "global_step": 65671, "epoch": 1563} {"train_loss": -5.959099769592285, "global_step": 65672, "epoch": 1563} {"train_loss": -5.878002166748047, "global_step": 65673, "epoch": 1563} {"train_loss": -6.0404744148254395, "global_step": 65674, "epoch": 1563} {"train_loss": -5.8819499015808105, "global_step": 65675, "epoch": 1563} {"train_loss": -6.070457458496094, "global_step": 65676, "epoch": 1563} {"train_loss": -5.998994827270508, "global_step": 65677, "epoch": 1563} {"train_loss": -5.964242935180664, "global_step": 65678, "epoch": 1563} {"train_loss": -5.9544148445129395, "global_step": 65679, "epoch": 1563} {"train_loss": -5.903261184692383, "global_step": 65680, "epoch": 1563} {"train_loss": -5.975038051605225, "global_step": 65681, "epoch": 1563} {"train_loss": -5.919698715209961, "global_step": 65682, "epoch": 1563} {"train_loss": -5.987870693206787, "global_step": 65683, "epoch": 1563} {"train_loss": -6.087566375732422, "global_step": 65684, "epoch": 1563} {"train_loss": -5.867109298706055, "global_step": 65685, "epoch": 1563} {"train_loss": -6.048867702484131, "global_step": 65686, "epoch": 1563} {"train_loss": -5.954391320546468, "global_step": 65687, "epoch": 1563, "val_loss": 74576.6484375} {"train_loss": -6.053345680236816, "global_step": 65688, "epoch": 1564} {"train_loss": -6.01080322265625, "global_step": 65689, "epoch": 1564} {"train_loss": -5.968538761138916, "global_step": 65690, "epoch": 1564} {"train_loss": -5.949549674987793, "global_step": 65691, "epoch": 1564} {"train_loss": -5.8816046714782715, "global_step": 65692, "epoch": 1564} {"train_loss": -5.979760646820068, "global_step": 65693, "epoch": 1564} {"train_loss": -5.961278438568115, "global_step": 65694, "epoch": 1564} {"train_loss": -5.964873790740967, "global_step": 65695, "epoch": 1564} {"train_loss": -5.970917701721191, "global_step": 65696, "epoch": 1564} {"train_loss": -6.0884809494018555, "global_step": 65697, "epoch": 1564} {"train_loss": -5.932244777679443, "global_step": 65698, "epoch": 1564} {"train_loss": -5.940740585327148, "global_step": 65699, "epoch": 1564} {"train_loss": -6.026729106903076, "global_step": 65700, "epoch": 1564} {"train_loss": -6.0325822830200195, "global_step": 65701, "epoch": 1564} {"train_loss": -5.921914100646973, "global_step": 65702, "epoch": 1564} {"train_loss": -5.969621658325195, "global_step": 65703, "epoch": 1564} {"train_loss": -5.921984672546387, "global_step": 65704, "epoch": 1564} {"train_loss": -5.828255653381348, "global_step": 65705, "epoch": 1564} {"train_loss": -5.9703192710876465, "global_step": 65706, "epoch": 1564} {"train_loss": -5.9076313972473145, "global_step": 65707, "epoch": 1564} {"train_loss": -5.953301429748535, "global_step": 65708, "epoch": 1564} {"train_loss": -6.069560527801514, "global_step": 65709, "epoch": 1564} {"train_loss": -5.881738185882568, "global_step": 65710, "epoch": 1564} {"train_loss": -5.951063632965088, "global_step": 65711, "epoch": 1564} {"train_loss": -6.121402740478516, "global_step": 65712, "epoch": 1564} {"train_loss": -5.863282203674316, "global_step": 65713, "epoch": 1564} {"train_loss": -6.045249938964844, "global_step": 65714, "epoch": 1564} {"train_loss": -6.009673595428467, "global_step": 65715, "epoch": 1564} {"train_loss": -5.979537010192871, "global_step": 65716, "epoch": 1564} {"train_loss": -6.043042182922363, "global_step": 65717, "epoch": 1564} {"train_loss": -5.929850101470947, "global_step": 65718, "epoch": 1564} {"train_loss": -5.968967914581299, "global_step": 65719, "epoch": 1564} {"train_loss": -5.960681915283203, "global_step": 65720, "epoch": 1564} {"train_loss": -6.039359092712402, "global_step": 65721, "epoch": 1564} {"train_loss": -6.044493675231934, "global_step": 65722, "epoch": 1564} {"train_loss": -5.94552755355835, "global_step": 65723, "epoch": 1564} {"train_loss": -5.856586456298828, "global_step": 65724, "epoch": 1564} {"train_loss": -6.063934326171875, "global_step": 65725, "epoch": 1564} {"train_loss": -6.026020526885986, "global_step": 65726, "epoch": 1564} {"train_loss": -5.9825544357299805, "global_step": 65727, "epoch": 1564} {"train_loss": -5.979538440704346, "global_step": 65728, "epoch": 1564} {"train_loss": -5.978269304547991, "global_step": 65729, "epoch": 1564, "val_loss": 74967.359375} {"train_loss": -5.910877227783203, "global_step": 65730, "epoch": 1565} {"train_loss": -5.977206230163574, "global_step": 65731, "epoch": 1565} {"train_loss": -6.101028919219971, "global_step": 65732, "epoch": 1565} {"train_loss": -5.861371994018555, "global_step": 65733, "epoch": 1565} {"train_loss": -5.999652862548828, "global_step": 65734, "epoch": 1565} {"train_loss": -5.8621931076049805, "global_step": 65735, "epoch": 1565} {"train_loss": -5.814866542816162, "global_step": 65736, "epoch": 1565} {"train_loss": -5.997431755065918, "global_step": 65737, "epoch": 1565} {"train_loss": -5.764858245849609, "global_step": 65738, "epoch": 1565} {"train_loss": -5.848318576812744, "global_step": 65739, "epoch": 1565} {"train_loss": -5.840106010437012, "global_step": 65740, "epoch": 1565} {"train_loss": -5.826237201690674, "global_step": 65741, "epoch": 1565} {"train_loss": -5.986994743347168, "global_step": 65742, "epoch": 1565} {"train_loss": -5.947724342346191, "global_step": 65743, "epoch": 1565} {"train_loss": -5.939740180969238, "global_step": 65744, "epoch": 1565} {"train_loss": -5.9668989181518555, "global_step": 65745, "epoch": 1565} {"train_loss": -6.013516426086426, "global_step": 65746, "epoch": 1565} {"train_loss": -6.043924808502197, "global_step": 65747, "epoch": 1565} {"train_loss": -5.95076322555542, "global_step": 65748, "epoch": 1565} {"train_loss": -6.004176616668701, "global_step": 65749, "epoch": 1565} {"train_loss": -6.0191450119018555, "global_step": 65750, "epoch": 1565} {"train_loss": -6.021063327789307, "global_step": 65751, "epoch": 1565} {"train_loss": -6.06527042388916, "global_step": 65752, "epoch": 1565} {"train_loss": -5.914071083068848, "global_step": 65753, "epoch": 1565} {"train_loss": -5.939089775085449, "global_step": 65754, "epoch": 1565} {"train_loss": -6.041869640350342, "global_step": 65755, "epoch": 1565} {"train_loss": -5.937524795532227, "global_step": 65756, "epoch": 1565} {"train_loss": -6.029140949249268, "global_step": 65757, "epoch": 1565} {"train_loss": -5.955378532409668, "global_step": 65758, "epoch": 1565} {"train_loss": -6.046854019165039, "global_step": 65759, "epoch": 1565} {"train_loss": -6.100804328918457, "global_step": 65760, "epoch": 1565} {"train_loss": -6.057080268859863, "global_step": 65761, "epoch": 1565} {"train_loss": -5.846723556518555, "global_step": 65762, "epoch": 1565} {"train_loss": -5.9721527099609375, "global_step": 65763, "epoch": 1565} {"train_loss": -6.054126262664795, "global_step": 65764, "epoch": 1565} {"train_loss": -5.961284160614014, "global_step": 65765, "epoch": 1565} {"train_loss": -5.747591018676758, "global_step": 65766, "epoch": 1565} {"train_loss": -5.9304585456848145, "global_step": 65767, "epoch": 1565} {"train_loss": -5.890692710876465, "global_step": 65768, "epoch": 1565} {"train_loss": -5.972036361694336, "global_step": 65769, "epoch": 1565} {"train_loss": -6.001644611358643, "global_step": 65770, "epoch": 1565} {"train_loss": -5.955719334738595, "global_step": 65771, "epoch": 1565, "val_loss": 74533.8359375} {"train_loss": -5.95919132232666, "global_step": 65772, "epoch": 1566} {"train_loss": -5.863195419311523, "global_step": 65773, "epoch": 1566} {"train_loss": -6.010936737060547, "global_step": 65774, "epoch": 1566} {"train_loss": -5.979182243347168, "global_step": 65775, "epoch": 1566} {"train_loss": -5.919012069702148, "global_step": 65776, "epoch": 1566} {"train_loss": -5.870105743408203, "global_step": 65777, "epoch": 1566} {"train_loss": -6.018789291381836, "global_step": 65778, "epoch": 1566} {"train_loss": -6.054959297180176, "global_step": 65779, "epoch": 1566} {"train_loss": -6.016847610473633, "global_step": 65780, "epoch": 1566} {"train_loss": -5.998320579528809, "global_step": 65781, "epoch": 1566} {"train_loss": -6.058146953582764, "global_step": 65782, "epoch": 1566} {"train_loss": -5.9184250831604, "global_step": 65783, "epoch": 1566} {"train_loss": -5.985601425170898, "global_step": 65784, "epoch": 1566} {"train_loss": -5.8965559005737305, "global_step": 65785, "epoch": 1566} {"train_loss": -6.079085350036621, "global_step": 65786, "epoch": 1566} {"train_loss": -5.964184761047363, "global_step": 65787, "epoch": 1566} {"train_loss": -5.923001766204834, "global_step": 65788, "epoch": 1566} {"train_loss": -5.945565223693848, "global_step": 65789, "epoch": 1566} {"train_loss": -5.998472690582275, "global_step": 65790, "epoch": 1566} {"train_loss": -6.0350847244262695, "global_step": 65791, "epoch": 1566} {"train_loss": -5.966352462768555, "global_step": 65792, "epoch": 1566} {"train_loss": -5.922134876251221, "global_step": 65793, "epoch": 1566} {"train_loss": -5.941216468811035, "global_step": 65794, "epoch": 1566} {"train_loss": -6.0477519035339355, "global_step": 65795, "epoch": 1566} {"train_loss": -6.048349857330322, "global_step": 65796, "epoch": 1566} {"train_loss": -5.926429748535156, "global_step": 65797, "epoch": 1566} {"train_loss": -5.8922014236450195, "global_step": 65798, "epoch": 1566} {"train_loss": -6.0226969718933105, "global_step": 65799, "epoch": 1566} {"train_loss": -5.868208885192871, "global_step": 65800, "epoch": 1566} {"train_loss": -5.973538398742676, "global_step": 65801, "epoch": 1566} {"train_loss": -6.030913829803467, "global_step": 65802, "epoch": 1566} {"train_loss": -5.892799377441406, "global_step": 65803, "epoch": 1566} {"train_loss": -5.940757751464844, "global_step": 65804, "epoch": 1566} {"train_loss": -5.960229396820068, "global_step": 65805, "epoch": 1566} {"train_loss": -5.908411026000977, "global_step": 65806, "epoch": 1566} {"train_loss": -6.053224563598633, "global_step": 65807, "epoch": 1566} {"train_loss": -5.837332248687744, "global_step": 65808, "epoch": 1566} {"train_loss": -5.964631080627441, "global_step": 65809, "epoch": 1566} {"train_loss": -5.85569953918457, "global_step": 65810, "epoch": 1566} {"train_loss": -5.951733589172363, "global_step": 65811, "epoch": 1566} {"train_loss": -6.0168561935424805, "global_step": 65812, "epoch": 1566} {"train_loss": -5.963824158623105, "global_step": 65813, "epoch": 1566, "val_loss": 74361.703125} {"train_loss": -6.001349449157715, "global_step": 65814, "epoch": 1567} {"train_loss": -5.855197906494141, "global_step": 65815, "epoch": 1567} {"train_loss": -5.892211437225342, "global_step": 65816, "epoch": 1567} {"train_loss": -5.911243438720703, "global_step": 65817, "epoch": 1567} {"train_loss": -6.02847957611084, "global_step": 65818, "epoch": 1567} {"train_loss": -5.848023891448975, "global_step": 65819, "epoch": 1567} {"train_loss": -6.095389366149902, "global_step": 65820, "epoch": 1567} {"train_loss": -5.946504592895508, "global_step": 65821, "epoch": 1567} {"train_loss": -5.926675796508789, "global_step": 65822, "epoch": 1567} {"train_loss": -5.938416481018066, "global_step": 65823, "epoch": 1567} {"train_loss": -6.066826820373535, "global_step": 65824, "epoch": 1567} {"train_loss": -5.918962478637695, "global_step": 65825, "epoch": 1567} {"train_loss": -5.949950218200684, "global_step": 65826, "epoch": 1567} {"train_loss": -6.0773725509643555, "global_step": 65827, "epoch": 1567} {"train_loss": -5.906167030334473, "global_step": 65828, "epoch": 1567} {"train_loss": -6.031585693359375, "global_step": 65829, "epoch": 1567} {"train_loss": -6.006941795349121, "global_step": 65830, "epoch": 1567} {"train_loss": -6.029804229736328, "global_step": 65831, "epoch": 1567} {"train_loss": -6.037466049194336, "global_step": 65832, "epoch": 1567} {"train_loss": -5.995501518249512, "global_step": 65833, "epoch": 1567} {"train_loss": -5.882709503173828, "global_step": 65834, "epoch": 1567} {"train_loss": -5.963903903961182, "global_step": 65835, "epoch": 1567} {"train_loss": -5.977545738220215, "global_step": 65836, "epoch": 1567} {"train_loss": -6.053483009338379, "global_step": 65837, "epoch": 1567} {"train_loss": -5.970346927642822, "global_step": 65838, "epoch": 1567} {"train_loss": -5.912478923797607, "global_step": 65839, "epoch": 1567} {"train_loss": -5.995995044708252, "global_step": 65840, "epoch": 1567} {"train_loss": -5.981571197509766, "global_step": 65841, "epoch": 1567} {"train_loss": -5.966265678405762, "global_step": 65842, "epoch": 1567} {"train_loss": -6.007631301879883, "global_step": 65843, "epoch": 1567} {"train_loss": -6.064966201782227, "global_step": 65844, "epoch": 1567} {"train_loss": -5.947077751159668, "global_step": 65845, "epoch": 1567} {"train_loss": -5.93276309967041, "global_step": 65846, "epoch": 1567} {"train_loss": -5.793034076690674, "global_step": 65847, "epoch": 1567} {"train_loss": -5.833404064178467, "global_step": 65848, "epoch": 1567} {"train_loss": -6.01969051361084, "global_step": 65849, "epoch": 1567} {"train_loss": -5.869180679321289, "global_step": 65850, "epoch": 1567} {"train_loss": -6.003753662109375, "global_step": 65851, "epoch": 1567} {"train_loss": -5.98836088180542, "global_step": 65852, "epoch": 1567} {"train_loss": -6.080052375793457, "global_step": 65853, "epoch": 1567} {"train_loss": -5.964358329772949, "global_step": 65854, "epoch": 1567} {"train_loss": -5.964173691613333, "global_step": 65855, "epoch": 1567, "val_loss": 74628.046875} {"train_loss": -6.0511555671691895, "global_step": 65856, "epoch": 1568} {"train_loss": -5.889758586883545, "global_step": 65857, "epoch": 1568} {"train_loss": -5.8861284255981445, "global_step": 65858, "epoch": 1568} {"train_loss": -5.871819496154785, "global_step": 65859, "epoch": 1568} {"train_loss": -5.9944000244140625, "global_step": 65860, "epoch": 1568} {"train_loss": -5.900786876678467, "global_step": 65861, "epoch": 1568} {"train_loss": -6.02090311050415, "global_step": 65862, "epoch": 1568} {"train_loss": -5.813194274902344, "global_step": 65863, "epoch": 1568} {"train_loss": -5.8714141845703125, "global_step": 65864, "epoch": 1568} {"train_loss": -5.872018337249756, "global_step": 65865, "epoch": 1568} {"train_loss": -5.772879123687744, "global_step": 65866, "epoch": 1568} {"train_loss": -6.116986274719238, "global_step": 65867, "epoch": 1568} {"train_loss": -5.940530300140381, "global_step": 65868, "epoch": 1568} {"train_loss": -5.994959831237793, "global_step": 65869, "epoch": 1568} {"train_loss": -5.990546226501465, "global_step": 65870, "epoch": 1568} {"train_loss": -5.873584747314453, "global_step": 65871, "epoch": 1568} {"train_loss": -5.904382228851318, "global_step": 65872, "epoch": 1568} {"train_loss": -5.998991012573242, "global_step": 65873, "epoch": 1568} {"train_loss": -5.897438049316406, "global_step": 65874, "epoch": 1568} {"train_loss": -5.932743549346924, "global_step": 65875, "epoch": 1568} {"train_loss": -5.873394012451172, "global_step": 65876, "epoch": 1568} {"train_loss": -5.915972709655762, "global_step": 65877, "epoch": 1568} {"train_loss": -5.902292251586914, "global_step": 65878, "epoch": 1568} {"train_loss": -6.06159782409668, "global_step": 65879, "epoch": 1568} {"train_loss": -5.907188415527344, "global_step": 65880, "epoch": 1568} {"train_loss": -5.9062347412109375, "global_step": 65881, "epoch": 1568} {"train_loss": -6.028049468994141, "global_step": 65882, "epoch": 1568} {"train_loss": -5.97233772277832, "global_step": 65883, "epoch": 1568} {"train_loss": -5.92031717300415, "global_step": 65884, "epoch": 1568} {"train_loss": -5.935873985290527, "global_step": 65885, "epoch": 1568} {"train_loss": -5.852567195892334, "global_step": 65886, "epoch": 1568} {"train_loss": -5.97830057144165, "global_step": 65887, "epoch": 1568} {"train_loss": -5.91878604888916, "global_step": 65888, "epoch": 1568} {"train_loss": -5.900406837463379, "global_step": 65889, "epoch": 1568} {"train_loss": -5.852672100067139, "global_step": 65890, "epoch": 1568} {"train_loss": -5.930832862854004, "global_step": 65891, "epoch": 1568} {"train_loss": -5.958340644836426, "global_step": 65892, "epoch": 1568} {"train_loss": -6.044295787811279, "global_step": 65893, "epoch": 1568} {"train_loss": -5.930819034576416, "global_step": 65894, "epoch": 1568} {"train_loss": -5.942134857177734, "global_step": 65895, "epoch": 1568} {"train_loss": -5.955608367919922, "global_step": 65896, "epoch": 1568} {"train_loss": -5.933632623581659, "global_step": 65897, "epoch": 1568, "val_loss": 74917.6328125} {"train_loss": -5.993274211883545, "global_step": 65898, "epoch": 1569} {"train_loss": -5.83935546875, "global_step": 65899, "epoch": 1569} {"train_loss": -5.971526622772217, "global_step": 65900, "epoch": 1569} {"train_loss": -5.956653594970703, "global_step": 65901, "epoch": 1569} {"train_loss": -5.9025678634643555, "global_step": 65902, "epoch": 1569} {"train_loss": -5.927833080291748, "global_step": 65903, "epoch": 1569} {"train_loss": -5.994801998138428, "global_step": 65904, "epoch": 1569} {"train_loss": -6.0342864990234375, "global_step": 65905, "epoch": 1569} {"train_loss": -5.915907382965088, "global_step": 65906, "epoch": 1569} {"train_loss": -5.834904670715332, "global_step": 65907, "epoch": 1569} {"train_loss": -6.005620956420898, "global_step": 65908, "epoch": 1569} {"train_loss": -5.9359636306762695, "global_step": 65909, "epoch": 1569} {"train_loss": -5.919487953186035, "global_step": 65910, "epoch": 1569} {"train_loss": -5.990114212036133, "global_step": 65911, "epoch": 1569} {"train_loss": -5.884844779968262, "global_step": 65912, "epoch": 1569} {"train_loss": -5.973742961883545, "global_step": 65913, "epoch": 1569} {"train_loss": -6.032657623291016, "global_step": 65914, "epoch": 1569} {"train_loss": -6.006925582885742, "global_step": 65915, "epoch": 1569} {"train_loss": -5.94387674331665, "global_step": 65916, "epoch": 1569} {"train_loss": -5.963220596313477, "global_step": 65917, "epoch": 1569} {"train_loss": -6.112083435058594, "global_step": 65918, "epoch": 1569} {"train_loss": -5.9187912940979, "global_step": 65919, "epoch": 1569} {"train_loss": -5.837353706359863, "global_step": 65920, "epoch": 1569} {"train_loss": -6.008418083190918, "global_step": 65921, "epoch": 1569} {"train_loss": -6.084315776824951, "global_step": 65922, "epoch": 1569} {"train_loss": -6.013306617736816, "global_step": 65923, "epoch": 1569} {"train_loss": -5.885101318359375, "global_step": 65924, "epoch": 1569} {"train_loss": -5.949643611907959, "global_step": 65925, "epoch": 1569} {"train_loss": -6.113463878631592, "global_step": 65926, "epoch": 1569} {"train_loss": -5.904313087463379, "global_step": 65927, "epoch": 1569} {"train_loss": -5.945778846740723, "global_step": 65928, "epoch": 1569} {"train_loss": -5.966385841369629, "global_step": 65929, "epoch": 1569} {"train_loss": -5.993622779846191, "global_step": 65930, "epoch": 1569} {"train_loss": -6.0423994064331055, "global_step": 65931, "epoch": 1569} {"train_loss": -5.965059757232666, "global_step": 65932, "epoch": 1569} {"train_loss": -6.085638999938965, "global_step": 65933, "epoch": 1569} {"train_loss": -5.983974933624268, "global_step": 65934, "epoch": 1569} {"train_loss": -6.073681354522705, "global_step": 65935, "epoch": 1569} {"train_loss": -6.13330602645874, "global_step": 65936, "epoch": 1569} {"train_loss": -5.847939491271973, "global_step": 65937, "epoch": 1569} {"train_loss": -5.872776031494141, "global_step": 65938, "epoch": 1569} {"train_loss": -5.97050944964091, "global_step": 65939, "epoch": 1569, "val_loss": 74729.8984375} {"train_loss": -6.05195426940918, "global_step": 65940, "epoch": 1570} {"train_loss": -5.928539276123047, "global_step": 65941, "epoch": 1570} {"train_loss": -6.006731986999512, "global_step": 65942, "epoch": 1570} {"train_loss": -5.884812355041504, "global_step": 65943, "epoch": 1570} {"train_loss": -5.902161121368408, "global_step": 65944, "epoch": 1570} {"train_loss": -6.012294769287109, "global_step": 65945, "epoch": 1570} {"train_loss": -5.90894889831543, "global_step": 65946, "epoch": 1570} {"train_loss": -5.9677934646606445, "global_step": 65947, "epoch": 1570} {"train_loss": -6.0967254638671875, "global_step": 65948, "epoch": 1570} {"train_loss": -5.992249488830566, "global_step": 65949, "epoch": 1570} {"train_loss": -5.958147048950195, "global_step": 65950, "epoch": 1570} {"train_loss": -5.988772869110107, "global_step": 65951, "epoch": 1570} {"train_loss": -6.0396881103515625, "global_step": 65952, "epoch": 1570} {"train_loss": -5.967508316040039, "global_step": 65953, "epoch": 1570} {"train_loss": -6.0831379890441895, "global_step": 65954, "epoch": 1570} {"train_loss": -5.933246612548828, "global_step": 65955, "epoch": 1570} {"train_loss": -6.082160472869873, "global_step": 65956, "epoch": 1570} {"train_loss": -5.905731201171875, "global_step": 65957, "epoch": 1570} {"train_loss": -6.010300159454346, "global_step": 65958, "epoch": 1570} {"train_loss": -5.973539352416992, "global_step": 65959, "epoch": 1570} {"train_loss": -6.079196929931641, "global_step": 65960, "epoch": 1570} {"train_loss": -5.944210052490234, "global_step": 65961, "epoch": 1570} {"train_loss": -5.912204742431641, "global_step": 65962, "epoch": 1570} {"train_loss": -5.882209777832031, "global_step": 65963, "epoch": 1570} {"train_loss": -5.891460418701172, "global_step": 65964, "epoch": 1570} {"train_loss": -5.91537618637085, "global_step": 65965, "epoch": 1570} {"train_loss": -5.9577813148498535, "global_step": 65966, "epoch": 1570} {"train_loss": -6.014499664306641, "global_step": 65967, "epoch": 1570} {"train_loss": -6.003098487854004, "global_step": 65968, "epoch": 1570} {"train_loss": -5.9492106437683105, "global_step": 65969, "epoch": 1570} {"train_loss": -5.865165710449219, "global_step": 65970, "epoch": 1570} {"train_loss": -6.036620140075684, "global_step": 65971, "epoch": 1570} {"train_loss": -5.985831260681152, "global_step": 65972, "epoch": 1570} {"train_loss": -5.988914489746094, "global_step": 65973, "epoch": 1570} {"train_loss": -6.071640968322754, "global_step": 65974, "epoch": 1570} {"train_loss": -5.9149675369262695, "global_step": 65975, "epoch": 1570} {"train_loss": -5.96003532409668, "global_step": 65976, "epoch": 1570} {"train_loss": -5.995471000671387, "global_step": 65977, "epoch": 1570} {"train_loss": -5.86086368560791, "global_step": 65978, "epoch": 1570} {"train_loss": -5.993022441864014, "global_step": 65979, "epoch": 1570} {"train_loss": -5.946344375610352, "global_step": 65980, "epoch": 1570} {"train_loss": -5.9701430684044245, "global_step": 65981, "epoch": 1570, "val_loss": 74464.2734375} {"train_loss": -5.9491119384765625, "global_step": 65982, "epoch": 1571} {"train_loss": -6.073535442352295, "global_step": 65983, "epoch": 1571} {"train_loss": -5.933588981628418, "global_step": 65984, "epoch": 1571} {"train_loss": -5.979920387268066, "global_step": 65985, "epoch": 1571} {"train_loss": -6.069190979003906, "global_step": 65986, "epoch": 1571} {"train_loss": -5.861236572265625, "global_step": 65987, "epoch": 1571} {"train_loss": -5.968561172485352, "global_step": 65988, "epoch": 1571} {"train_loss": -6.039391040802002, "global_step": 65989, "epoch": 1571} {"train_loss": -5.945174694061279, "global_step": 65990, "epoch": 1571} {"train_loss": -6.03312349319458, "global_step": 65991, "epoch": 1571} {"train_loss": -5.916696548461914, "global_step": 65992, "epoch": 1571} {"train_loss": -6.094254493713379, "global_step": 65993, "epoch": 1571} {"train_loss": -5.953485488891602, "global_step": 65994, "epoch": 1571} {"train_loss": -5.872542381286621, "global_step": 65995, "epoch": 1571} {"train_loss": -6.004220008850098, "global_step": 65996, "epoch": 1571} {"train_loss": -6.001861095428467, "global_step": 65997, "epoch": 1571} {"train_loss": -6.031318664550781, "global_step": 65998, "epoch": 1571} {"train_loss": -5.853660583496094, "global_step": 65999, "epoch": 1571} {"train_loss": -5.90964412689209, "global_step": 66000, "epoch": 1571} {"train_loss": -6.0388383865356445, "global_step": 66001, "epoch": 1571} {"train_loss": -5.934491157531738, "global_step": 66002, "epoch": 1571} {"train_loss": -6.1038737297058105, "global_step": 66003, "epoch": 1571} {"train_loss": -5.934352874755859, "global_step": 66004, "epoch": 1571} {"train_loss": -5.863465309143066, "global_step": 66005, "epoch": 1571} {"train_loss": -5.880476951599121, "global_step": 66006, "epoch": 1571} {"train_loss": -5.954818248748779, "global_step": 66007, "epoch": 1571} {"train_loss": -5.931035995483398, "global_step": 66008, "epoch": 1571} {"train_loss": -5.961631774902344, "global_step": 66009, "epoch": 1571} {"train_loss": -5.967328071594238, "global_step": 66010, "epoch": 1571} {"train_loss": -5.991907119750977, "global_step": 66011, "epoch": 1571} {"train_loss": -5.973711967468262, "global_step": 66012, "epoch": 1571} {"train_loss": -5.953215599060059, "global_step": 66013, "epoch": 1571} {"train_loss": -5.9271931648254395, "global_step": 66014, "epoch": 1571} {"train_loss": -6.025336265563965, "global_step": 66015, "epoch": 1571} {"train_loss": -6.013062953948975, "global_step": 66016, "epoch": 1571} {"train_loss": -5.970414161682129, "global_step": 66017, "epoch": 1571} {"train_loss": -5.996862411499023, "global_step": 66018, "epoch": 1571} {"train_loss": -6.031377792358398, "global_step": 66019, "epoch": 1571} {"train_loss": -5.998072624206543, "global_step": 66020, "epoch": 1571} {"train_loss": -6.01283073425293, "global_step": 66021, "epoch": 1571} {"train_loss": -5.972202301025391, "global_step": 66022, "epoch": 1571} {"train_loss": -5.97119004385812, "global_step": 66023, "epoch": 1571, "val_loss": 75135.625} {"train_loss": -5.741064071655273, "global_step": 66024, "epoch": 1572} {"train_loss": -5.84291934967041, "global_step": 66025, "epoch": 1572} {"train_loss": -5.895103454589844, "global_step": 66026, "epoch": 1572} {"train_loss": -5.871691703796387, "global_step": 66027, "epoch": 1572} {"train_loss": -6.000932216644287, "global_step": 66028, "epoch": 1572} {"train_loss": -5.952166557312012, "global_step": 66029, "epoch": 1572} {"train_loss": -5.873229026794434, "global_step": 66030, "epoch": 1572} {"train_loss": -6.008319854736328, "global_step": 66031, "epoch": 1572} {"train_loss": -6.0434746742248535, "global_step": 66032, "epoch": 1572} {"train_loss": -5.929121494293213, "global_step": 66033, "epoch": 1572} {"train_loss": -6.0187788009643555, "global_step": 66034, "epoch": 1572} {"train_loss": -6.058839797973633, "global_step": 66035, "epoch": 1572} {"train_loss": -5.918030261993408, "global_step": 66036, "epoch": 1572} {"train_loss": -6.039262294769287, "global_step": 66037, "epoch": 1572} {"train_loss": -6.027547836303711, "global_step": 66038, "epoch": 1572} {"train_loss": -6.066025257110596, "global_step": 66039, "epoch": 1572} {"train_loss": -5.942079067230225, "global_step": 66040, "epoch": 1572} {"train_loss": -5.9305195808410645, "global_step": 66041, "epoch": 1572} {"train_loss": -5.954634666442871, "global_step": 66042, "epoch": 1572} {"train_loss": -6.129435062408447, "global_step": 66043, "epoch": 1572} {"train_loss": -6.013925552368164, "global_step": 66044, "epoch": 1572} {"train_loss": -5.928815841674805, "global_step": 66045, "epoch": 1572} {"train_loss": -6.010275840759277, "global_step": 66046, "epoch": 1572} {"train_loss": -6.050229072570801, "global_step": 66047, "epoch": 1572} {"train_loss": -5.954309463500977, "global_step": 66048, "epoch": 1572} {"train_loss": -6.053906440734863, "global_step": 66049, "epoch": 1572} {"train_loss": -6.117844104766846, "global_step": 66050, "epoch": 1572} {"train_loss": -6.066235065460205, "global_step": 66051, "epoch": 1572} {"train_loss": -5.9353532791137695, "global_step": 66052, "epoch": 1572} {"train_loss": -5.978172302246094, "global_step": 66053, "epoch": 1572} {"train_loss": -6.0179009437561035, "global_step": 66054, "epoch": 1572} {"train_loss": -6.0650858879089355, "global_step": 66055, "epoch": 1572} {"train_loss": -5.976102828979492, "global_step": 66056, "epoch": 1572} {"train_loss": -5.964774131774902, "global_step": 66057, "epoch": 1572} {"train_loss": -6.000232696533203, "global_step": 66058, "epoch": 1572} {"train_loss": -5.968453407287598, "global_step": 66059, "epoch": 1572} {"train_loss": -5.971965789794922, "global_step": 66060, "epoch": 1572} {"train_loss": -5.919517993927002, "global_step": 66061, "epoch": 1572} {"train_loss": -5.8753485679626465, "global_step": 66062, "epoch": 1572} {"train_loss": -5.994765758514404, "global_step": 66063, "epoch": 1572} {"train_loss": -6.056398391723633, "global_step": 66064, "epoch": 1572} {"train_loss": -5.9799200012570335, "global_step": 66065, "epoch": 1572, "val_loss": 74457.609375} {"train_loss": -6.0546369552612305, "global_step": 66066, "epoch": 1573} {"train_loss": -6.10513162612915, "global_step": 66067, "epoch": 1573} {"train_loss": -6.02501106262207, "global_step": 66068, "epoch": 1573} {"train_loss": -5.9307074546813965, "global_step": 66069, "epoch": 1573} {"train_loss": -6.067729473114014, "global_step": 66070, "epoch": 1573} {"train_loss": -6.0223236083984375, "global_step": 66071, "epoch": 1573} {"train_loss": -6.0705156326293945, "global_step": 66072, "epoch": 1573} {"train_loss": -6.021827697753906, "global_step": 66073, "epoch": 1573} {"train_loss": -6.006164073944092, "global_step": 66074, "epoch": 1573} {"train_loss": -6.046167850494385, "global_step": 66075, "epoch": 1573} {"train_loss": -6.021562576293945, "global_step": 66076, "epoch": 1573} {"train_loss": -6.058244705200195, "global_step": 66077, "epoch": 1573} {"train_loss": -5.838824272155762, "global_step": 66078, "epoch": 1573} {"train_loss": -6.09423828125, "global_step": 66079, "epoch": 1573} {"train_loss": -6.031744956970215, "global_step": 66080, "epoch": 1573} {"train_loss": -6.02956485748291, "global_step": 66081, "epoch": 1573} {"train_loss": -5.996280670166016, "global_step": 66082, "epoch": 1573} {"train_loss": -6.0409321784973145, "global_step": 66083, "epoch": 1573} {"train_loss": -5.913740158081055, "global_step": 66084, "epoch": 1573} {"train_loss": -5.986519813537598, "global_step": 66085, "epoch": 1573} {"train_loss": -6.012431621551514, "global_step": 66086, "epoch": 1573} {"train_loss": -5.980279445648193, "global_step": 66087, "epoch": 1573} {"train_loss": -6.021627426147461, "global_step": 66088, "epoch": 1573} {"train_loss": -5.985263347625732, "global_step": 66089, "epoch": 1573} {"train_loss": -6.002323150634766, "global_step": 66090, "epoch": 1573} {"train_loss": -5.992956638336182, "global_step": 66091, "epoch": 1573} {"train_loss": -5.88848876953125, "global_step": 66092, "epoch": 1573} {"train_loss": -5.976280212402344, "global_step": 66093, "epoch": 1573} {"train_loss": -6.029936790466309, "global_step": 66094, "epoch": 1573} {"train_loss": -5.910327911376953, "global_step": 66095, "epoch": 1573} {"train_loss": -5.989573001861572, "global_step": 66096, "epoch": 1573} {"train_loss": -6.031194686889648, "global_step": 66097, "epoch": 1573} {"train_loss": -5.895761489868164, "global_step": 66098, "epoch": 1573} {"train_loss": -6.018641471862793, "global_step": 66099, "epoch": 1573} {"train_loss": -5.854952335357666, "global_step": 66100, "epoch": 1573} {"train_loss": -5.937648773193359, "global_step": 66101, "epoch": 1573} {"train_loss": -6.009532928466797, "global_step": 66102, "epoch": 1573} {"train_loss": -6.072390556335449, "global_step": 66103, "epoch": 1573} {"train_loss": -5.776396751403809, "global_step": 66104, "epoch": 1573} {"train_loss": -6.121124267578125, "global_step": 66105, "epoch": 1573} {"train_loss": -6.008548736572266, "global_step": 66106, "epoch": 1573} {"train_loss": -5.997979323069255, "global_step": 66107, "epoch": 1573, "val_loss": 74589.46875} {"train_loss": -5.972343921661377, "global_step": 66108, "epoch": 1574} {"train_loss": -6.020387649536133, "global_step": 66109, "epoch": 1574} {"train_loss": -6.067553520202637, "global_step": 66110, "epoch": 1574} {"train_loss": -5.998434543609619, "global_step": 66111, "epoch": 1574} {"train_loss": -5.962985038757324, "global_step": 66112, "epoch": 1574} {"train_loss": -6.000454902648926, "global_step": 66113, "epoch": 1574} {"train_loss": -6.032658100128174, "global_step": 66114, "epoch": 1574} {"train_loss": -5.887301445007324, "global_step": 66115, "epoch": 1574} {"train_loss": -6.129443168640137, "global_step": 66116, "epoch": 1574} {"train_loss": -6.002469062805176, "global_step": 66117, "epoch": 1574} {"train_loss": -5.9961347579956055, "global_step": 66118, "epoch": 1574} {"train_loss": -6.034034729003906, "global_step": 66119, "epoch": 1574} {"train_loss": -6.045486927032471, "global_step": 66120, "epoch": 1574} {"train_loss": -5.893886566162109, "global_step": 66121, "epoch": 1574} {"train_loss": -5.931401252746582, "global_step": 66122, "epoch": 1574} {"train_loss": -5.994775295257568, "global_step": 66123, "epoch": 1574} {"train_loss": -5.946469306945801, "global_step": 66124, "epoch": 1574} {"train_loss": -5.992031097412109, "global_step": 66125, "epoch": 1574} {"train_loss": -5.899891376495361, "global_step": 66126, "epoch": 1574} {"train_loss": -5.914317607879639, "global_step": 66127, "epoch": 1574} {"train_loss": -5.797257423400879, "global_step": 66128, "epoch": 1574} {"train_loss": -5.881164073944092, "global_step": 66129, "epoch": 1574} {"train_loss": -6.035708904266357, "global_step": 66130, "epoch": 1574} {"train_loss": -5.9290876388549805, "global_step": 66131, "epoch": 1574} {"train_loss": -5.941977500915527, "global_step": 66132, "epoch": 1574} {"train_loss": -5.995903015136719, "global_step": 66133, "epoch": 1574} {"train_loss": -5.978122711181641, "global_step": 66134, "epoch": 1574} {"train_loss": -5.946002960205078, "global_step": 66135, "epoch": 1574} {"train_loss": -5.922358512878418, "global_step": 66136, "epoch": 1574} {"train_loss": -5.921391010284424, "global_step": 66137, "epoch": 1574} {"train_loss": -5.989140510559082, "global_step": 66138, "epoch": 1574} {"train_loss": -6.0742506980896, "global_step": 66139, "epoch": 1574} {"train_loss": -6.012378692626953, "global_step": 66140, "epoch": 1574} {"train_loss": -5.928985595703125, "global_step": 66141, "epoch": 1574} {"train_loss": -6.004332542419434, "global_step": 66142, "epoch": 1574} {"train_loss": -5.834244728088379, "global_step": 66143, "epoch": 1574} {"train_loss": -5.904027462005615, "global_step": 66144, "epoch": 1574} {"train_loss": -5.986931800842285, "global_step": 66145, "epoch": 1574} {"train_loss": -5.931602954864502, "global_step": 66146, "epoch": 1574} {"train_loss": -6.052032947540283, "global_step": 66147, "epoch": 1574} {"train_loss": -6.019846439361572, "global_step": 66148, "epoch": 1574} {"train_loss": -5.970494735808599, "global_step": 66149, "epoch": 1574, "val_loss": 74535.0390625} {"train_loss": -5.914135932922363, "global_step": 66150, "epoch": 1575} {"train_loss": -5.915416717529297, "global_step": 66151, "epoch": 1575} {"train_loss": -6.006401538848877, "global_step": 66152, "epoch": 1575} {"train_loss": -5.9089837074279785, "global_step": 66153, "epoch": 1575} {"train_loss": -5.955914497375488, "global_step": 66154, "epoch": 1575} {"train_loss": -5.906069278717041, "global_step": 66155, "epoch": 1575} {"train_loss": -5.892621040344238, "global_step": 66156, "epoch": 1575} {"train_loss": -5.867864608764648, "global_step": 66157, "epoch": 1575} {"train_loss": -6.095436096191406, "global_step": 66158, "epoch": 1575} {"train_loss": -5.920263767242432, "global_step": 66159, "epoch": 1575} {"train_loss": -5.949272155761719, "global_step": 66160, "epoch": 1575} {"train_loss": -5.859619140625, "global_step": 66161, "epoch": 1575} {"train_loss": -5.89730167388916, "global_step": 66162, "epoch": 1575} {"train_loss": -5.949580192565918, "global_step": 66163, "epoch": 1575} {"train_loss": -5.970841407775879, "global_step": 66164, "epoch": 1575} {"train_loss": -5.931351661682129, "global_step": 66165, "epoch": 1575} {"train_loss": -5.821791648864746, "global_step": 66166, "epoch": 1575} {"train_loss": -5.883528709411621, "global_step": 66167, "epoch": 1575} {"train_loss": -6.038180351257324, "global_step": 66168, "epoch": 1575} {"train_loss": -5.988943576812744, "global_step": 66169, "epoch": 1575} {"train_loss": -5.994754791259766, "global_step": 66170, "epoch": 1575} {"train_loss": -6.031822204589844, "global_step": 66171, "epoch": 1575} {"train_loss": -5.96420431137085, "global_step": 66172, "epoch": 1575} {"train_loss": -6.028870105743408, "global_step": 66173, "epoch": 1575} {"train_loss": -6.044259071350098, "global_step": 66174, "epoch": 1575} {"train_loss": -5.980313301086426, "global_step": 66175, "epoch": 1575} {"train_loss": -6.033237934112549, "global_step": 66176, "epoch": 1575} {"train_loss": -6.018955230712891, "global_step": 66177, "epoch": 1575} {"train_loss": -5.906425476074219, "global_step": 66178, "epoch": 1575} {"train_loss": -5.9176344871521, "global_step": 66179, "epoch": 1575} {"train_loss": -6.017086982727051, "global_step": 66180, "epoch": 1575} {"train_loss": -6.031523704528809, "global_step": 66181, "epoch": 1575} {"train_loss": -5.947872638702393, "global_step": 66182, "epoch": 1575} {"train_loss": -5.9457197189331055, "global_step": 66183, "epoch": 1575} {"train_loss": -5.962493896484375, "global_step": 66184, "epoch": 1575} {"train_loss": -6.056792259216309, "global_step": 66185, "epoch": 1575} {"train_loss": -5.942669868469238, "global_step": 66186, "epoch": 1575} {"train_loss": -5.826794147491455, "global_step": 66187, "epoch": 1575} {"train_loss": -6.053399562835693, "global_step": 66188, "epoch": 1575} {"train_loss": -6.047543525695801, "global_step": 66189, "epoch": 1575} {"train_loss": -5.980988502502441, "global_step": 66190, "epoch": 1575} {"train_loss": -5.962880259468442, "global_step": 66191, "epoch": 1575, "val_loss": 75001.53125} {"train_loss": -5.924895286560059, "global_step": 66192, "epoch": 1576} {"train_loss": -5.956844329833984, "global_step": 66193, "epoch": 1576} {"train_loss": -5.960812568664551, "global_step": 66194, "epoch": 1576} {"train_loss": -6.074717998504639, "global_step": 66195, "epoch": 1576} {"train_loss": -5.992011547088623, "global_step": 66196, "epoch": 1576} {"train_loss": -5.962139129638672, "global_step": 66197, "epoch": 1576} {"train_loss": -5.937243938446045, "global_step": 66198, "epoch": 1576} {"train_loss": -6.030008316040039, "global_step": 66199, "epoch": 1576} {"train_loss": -5.896233558654785, "global_step": 66200, "epoch": 1576} {"train_loss": -5.852748394012451, "global_step": 66201, "epoch": 1576} {"train_loss": -6.002315998077393, "global_step": 66202, "epoch": 1576} {"train_loss": -5.942690849304199, "global_step": 66203, "epoch": 1576} {"train_loss": -5.996673107147217, "global_step": 66204, "epoch": 1576} {"train_loss": -6.0874199867248535, "global_step": 66205, "epoch": 1576} {"train_loss": -5.939023971557617, "global_step": 66206, "epoch": 1576} {"train_loss": -6.110964298248291, "global_step": 66207, "epoch": 1576} {"train_loss": -5.959596633911133, "global_step": 66208, "epoch": 1576} {"train_loss": -6.039414405822754, "global_step": 66209, "epoch": 1576} {"train_loss": -6.040805339813232, "global_step": 66210, "epoch": 1576} {"train_loss": -6.073692321777344, "global_step": 66211, "epoch": 1576} {"train_loss": -5.906865119934082, "global_step": 66212, "epoch": 1576} {"train_loss": -6.02512264251709, "global_step": 66213, "epoch": 1576} {"train_loss": -6.030490875244141, "global_step": 66214, "epoch": 1576} {"train_loss": -5.98296594619751, "global_step": 66215, "epoch": 1576} {"train_loss": -6.007029056549072, "global_step": 66216, "epoch": 1576} {"train_loss": -6.064327239990234, "global_step": 66217, "epoch": 1576} {"train_loss": -5.892901420593262, "global_step": 66218, "epoch": 1576} {"train_loss": -6.045071601867676, "global_step": 66219, "epoch": 1576} {"train_loss": -5.998766899108887, "global_step": 66220, "epoch": 1576} {"train_loss": -5.951133728027344, "global_step": 66221, "epoch": 1576} {"train_loss": -5.934318542480469, "global_step": 66222, "epoch": 1576} {"train_loss": -5.9376630783081055, "global_step": 66223, "epoch": 1576} {"train_loss": -5.916379451751709, "global_step": 66224, "epoch": 1576} {"train_loss": -6.0068230628967285, "global_step": 66225, "epoch": 1576} {"train_loss": -6.0431952476501465, "global_step": 66226, "epoch": 1576} {"train_loss": -6.003297805786133, "global_step": 66227, "epoch": 1576} {"train_loss": -6.054629325866699, "global_step": 66228, "epoch": 1576} {"train_loss": -5.8639655113220215, "global_step": 66229, "epoch": 1576} {"train_loss": -5.933469772338867, "global_step": 66230, "epoch": 1576} {"train_loss": -6.01498556137085, "global_step": 66231, "epoch": 1576} {"train_loss": -6.049455165863037, "global_step": 66232, "epoch": 1576} {"train_loss": -5.985903365271432, "global_step": 66233, "epoch": 1576, "val_loss": 74398.34375} {"train_loss": -5.936753273010254, "global_step": 66234, "epoch": 1577} {"train_loss": -6.07645845413208, "global_step": 66235, "epoch": 1577} {"train_loss": -6.084561347961426, "global_step": 66236, "epoch": 1577} {"train_loss": -5.993690013885498, "global_step": 66237, "epoch": 1577} {"train_loss": -5.98655891418457, "global_step": 66238, "epoch": 1577} {"train_loss": -5.988770008087158, "global_step": 66239, "epoch": 1577} {"train_loss": -5.9826202392578125, "global_step": 66240, "epoch": 1577} {"train_loss": -5.979148864746094, "global_step": 66241, "epoch": 1577} {"train_loss": -5.938007354736328, "global_step": 66242, "epoch": 1577} {"train_loss": -6.028609275817871, "global_step": 66243, "epoch": 1577} {"train_loss": -6.034465789794922, "global_step": 66244, "epoch": 1577} {"train_loss": -5.969318389892578, "global_step": 66245, "epoch": 1577} {"train_loss": -5.905771255493164, "global_step": 66246, "epoch": 1577} {"train_loss": -5.996489524841309, "global_step": 66247, "epoch": 1577} {"train_loss": -5.982929229736328, "global_step": 66248, "epoch": 1577} {"train_loss": -5.93497896194458, "global_step": 66249, "epoch": 1577} {"train_loss": -5.90412712097168, "global_step": 66250, "epoch": 1577} {"train_loss": -5.92624568939209, "global_step": 66251, "epoch": 1577} {"train_loss": -5.970156669616699, "global_step": 66252, "epoch": 1577} {"train_loss": -5.939658164978027, "global_step": 66253, "epoch": 1577} {"train_loss": -5.9372663497924805, "global_step": 66254, "epoch": 1577} {"train_loss": -6.029411792755127, "global_step": 66255, "epoch": 1577} {"train_loss": -5.890627861022949, "global_step": 66256, "epoch": 1577} {"train_loss": -6.016236305236816, "global_step": 66257, "epoch": 1577} {"train_loss": -5.917016983032227, "global_step": 66258, "epoch": 1577} {"train_loss": -5.929889678955078, "global_step": 66259, "epoch": 1577} {"train_loss": -5.991910934448242, "global_step": 66260, "epoch": 1577} {"train_loss": -5.953268051147461, "global_step": 66261, "epoch": 1577} {"train_loss": -5.857544422149658, "global_step": 66262, "epoch": 1577} {"train_loss": -5.964349269866943, "global_step": 66263, "epoch": 1577} {"train_loss": -5.818991661071777, "global_step": 66264, "epoch": 1577} {"train_loss": -5.80864143371582, "global_step": 66265, "epoch": 1577} {"train_loss": -5.814937591552734, "global_step": 66266, "epoch": 1577} {"train_loss": -5.798189163208008, "global_step": 66267, "epoch": 1577} {"train_loss": -5.932463645935059, "global_step": 66268, "epoch": 1577} {"train_loss": -5.9427385330200195, "global_step": 66269, "epoch": 1577} {"train_loss": -5.884036540985107, "global_step": 66270, "epoch": 1577} {"train_loss": -5.838510990142822, "global_step": 66271, "epoch": 1577} {"train_loss": -5.818607807159424, "global_step": 66272, "epoch": 1577} {"train_loss": -5.837587356567383, "global_step": 66273, "epoch": 1577} {"train_loss": -5.890887260437012, "global_step": 66274, "epoch": 1577} {"train_loss": -5.935754265104022, "global_step": 66275, "epoch": 1577, "val_loss": 75095.96875} {"train_loss": -5.865300178527832, "global_step": 66276, "epoch": 1578} {"train_loss": -5.819638252258301, "global_step": 66277, "epoch": 1578} {"train_loss": -5.882297039031982, "global_step": 66278, "epoch": 1578} {"train_loss": -5.9898223876953125, "global_step": 66279, "epoch": 1578} {"train_loss": -5.767284393310547, "global_step": 66280, "epoch": 1578} {"train_loss": -5.969586372375488, "global_step": 66281, "epoch": 1578} {"train_loss": -5.9194183349609375, "global_step": 66282, "epoch": 1578} {"train_loss": -5.99220609664917, "global_step": 66283, "epoch": 1578} {"train_loss": -5.864007949829102, "global_step": 66284, "epoch": 1578} {"train_loss": -5.889058589935303, "global_step": 66285, "epoch": 1578} {"train_loss": -5.925614356994629, "global_step": 66286, "epoch": 1578} {"train_loss": -5.992204666137695, "global_step": 66287, "epoch": 1578} {"train_loss": -6.007516384124756, "global_step": 66288, "epoch": 1578} {"train_loss": -5.936661720275879, "global_step": 66289, "epoch": 1578} {"train_loss": -5.8373637199401855, "global_step": 66290, "epoch": 1578} {"train_loss": -5.959414482116699, "global_step": 66291, "epoch": 1578} {"train_loss": -6.034869194030762, "global_step": 66292, "epoch": 1578} {"train_loss": -6.025352478027344, "global_step": 66293, "epoch": 1578} {"train_loss": -5.876020431518555, "global_step": 66294, "epoch": 1578} {"train_loss": -5.941497802734375, "global_step": 66295, "epoch": 1578} {"train_loss": -5.8773603439331055, "global_step": 66296, "epoch": 1578} {"train_loss": -6.004448413848877, "global_step": 66297, "epoch": 1578} {"train_loss": -5.988602638244629, "global_step": 66298, "epoch": 1578} {"train_loss": -5.93099308013916, "global_step": 66299, "epoch": 1578} {"train_loss": -5.9936442375183105, "global_step": 66300, "epoch": 1578} {"train_loss": -6.052443027496338, "global_step": 66301, "epoch": 1578} {"train_loss": -5.877025604248047, "global_step": 66302, "epoch": 1578} {"train_loss": -5.864752769470215, "global_step": 66303, "epoch": 1578} {"train_loss": -6.041417598724365, "global_step": 66304, "epoch": 1578} {"train_loss": -5.780774116516113, "global_step": 66305, "epoch": 1578} {"train_loss": -5.79879903793335, "global_step": 66306, "epoch": 1578} {"train_loss": -5.761003494262695, "global_step": 66307, "epoch": 1578} {"train_loss": -5.9302215576171875, "global_step": 66308, "epoch": 1578} {"train_loss": -5.857512474060059, "global_step": 66309, "epoch": 1578} {"train_loss": -5.827834606170654, "global_step": 66310, "epoch": 1578} {"train_loss": -5.873440265655518, "global_step": 66311, "epoch": 1578} {"train_loss": -5.793965816497803, "global_step": 66312, "epoch": 1578} {"train_loss": -5.919512748718262, "global_step": 66313, "epoch": 1578} {"train_loss": -5.806222915649414, "global_step": 66314, "epoch": 1578} {"train_loss": -5.954794883728027, "global_step": 66315, "epoch": 1578} {"train_loss": -5.851728439331055, "global_step": 66316, "epoch": 1578} {"train_loss": -5.910398176738194, "global_step": 66317, "epoch": 1578, "val_loss": 75009.9375} {"train_loss": -5.855398178100586, "global_step": 66318, "epoch": 1579} {"train_loss": -6.000432014465332, "global_step": 66319, "epoch": 1579} {"train_loss": -5.832472324371338, "global_step": 66320, "epoch": 1579} {"train_loss": -5.935349464416504, "global_step": 66321, "epoch": 1579} {"train_loss": -5.977292537689209, "global_step": 66322, "epoch": 1579} {"train_loss": -5.967935562133789, "global_step": 66323, "epoch": 1579} {"train_loss": -5.92894983291626, "global_step": 66324, "epoch": 1579} {"train_loss": -5.891106605529785, "global_step": 66325, "epoch": 1579} {"train_loss": -5.833874702453613, "global_step": 66326, "epoch": 1579} {"train_loss": -5.948590278625488, "global_step": 66327, "epoch": 1579} {"train_loss": -5.837034225463867, "global_step": 66328, "epoch": 1579} {"train_loss": -5.956940174102783, "global_step": 66329, "epoch": 1579} {"train_loss": -6.094172954559326, "global_step": 66330, "epoch": 1579} {"train_loss": -5.902375221252441, "global_step": 66331, "epoch": 1579} {"train_loss": -6.014366626739502, "global_step": 66332, "epoch": 1579} {"train_loss": -6.054978847503662, "global_step": 66333, "epoch": 1579} {"train_loss": -5.973758697509766, "global_step": 66334, "epoch": 1579} {"train_loss": -5.911958694458008, "global_step": 66335, "epoch": 1579} {"train_loss": -5.942938327789307, "global_step": 66336, "epoch": 1579} {"train_loss": -5.9744672775268555, "global_step": 66337, "epoch": 1579} {"train_loss": -6.009371757507324, "global_step": 66338, "epoch": 1579} {"train_loss": -6.082540988922119, "global_step": 66339, "epoch": 1579} {"train_loss": -6.0606536865234375, "global_step": 66340, "epoch": 1579} {"train_loss": -5.912672996520996, "global_step": 66341, "epoch": 1579} {"train_loss": -6.018547058105469, "global_step": 66342, "epoch": 1579} {"train_loss": -6.043015003204346, "global_step": 66343, "epoch": 1579} {"train_loss": -5.975703239440918, "global_step": 66344, "epoch": 1579} {"train_loss": -5.972251892089844, "global_step": 66345, "epoch": 1579} {"train_loss": -5.913775444030762, "global_step": 66346, "epoch": 1579} {"train_loss": -5.959842681884766, "global_step": 66347, "epoch": 1579} {"train_loss": -5.839166641235352, "global_step": 66348, "epoch": 1579} {"train_loss": -6.0698041915893555, "global_step": 66349, "epoch": 1579} {"train_loss": -5.980328559875488, "global_step": 66350, "epoch": 1579} {"train_loss": -6.0401201248168945, "global_step": 66351, "epoch": 1579} {"train_loss": -5.919131755828857, "global_step": 66352, "epoch": 1579} {"train_loss": -5.897822380065918, "global_step": 66353, "epoch": 1579} {"train_loss": -5.99620246887207, "global_step": 66354, "epoch": 1579} {"train_loss": -5.923828601837158, "global_step": 66355, "epoch": 1579} {"train_loss": -5.99624490737915, "global_step": 66356, "epoch": 1579} {"train_loss": -5.805668830871582, "global_step": 66357, "epoch": 1579} {"train_loss": -5.988978862762451, "global_step": 66358, "epoch": 1579} {"train_loss": -5.961277666546049, "global_step": 66359, "epoch": 1579, "val_loss": 74641.6015625} {"train_loss": -5.907773971557617, "global_step": 66360, "epoch": 1580} {"train_loss": -6.05983829498291, "global_step": 66361, "epoch": 1580} {"train_loss": -6.0327653884887695, "global_step": 66362, "epoch": 1580} {"train_loss": -6.017385005950928, "global_step": 66363, "epoch": 1580} {"train_loss": -5.985763072967529, "global_step": 66364, "epoch": 1580} {"train_loss": -5.897144317626953, "global_step": 66365, "epoch": 1580} {"train_loss": -6.01805305480957, "global_step": 66366, "epoch": 1580} {"train_loss": -6.077502250671387, "global_step": 66367, "epoch": 1580} {"train_loss": -5.991092681884766, "global_step": 66368, "epoch": 1580} {"train_loss": -6.025232315063477, "global_step": 66369, "epoch": 1580} {"train_loss": -5.84250020980835, "global_step": 66370, "epoch": 1580} {"train_loss": -6.047909736633301, "global_step": 66371, "epoch": 1580} {"train_loss": -6.0474138259887695, "global_step": 66372, "epoch": 1580} {"train_loss": -5.9078593254089355, "global_step": 66373, "epoch": 1580} {"train_loss": -5.959860801696777, "global_step": 66374, "epoch": 1580} {"train_loss": -6.084371566772461, "global_step": 66375, "epoch": 1580} {"train_loss": -5.882001876831055, "global_step": 66376, "epoch": 1580} {"train_loss": -5.899374485015869, "global_step": 66377, "epoch": 1580} {"train_loss": -6.000560283660889, "global_step": 66378, "epoch": 1580} {"train_loss": -5.950677871704102, "global_step": 66379, "epoch": 1580} {"train_loss": -5.914730072021484, "global_step": 66380, "epoch": 1580} {"train_loss": -5.8990888595581055, "global_step": 66381, "epoch": 1580} {"train_loss": -5.934145450592041, "global_step": 66382, "epoch": 1580} {"train_loss": -5.926083564758301, "global_step": 66383, "epoch": 1580} {"train_loss": -5.923742294311523, "global_step": 66384, "epoch": 1580} {"train_loss": -5.961820602416992, "global_step": 66385, "epoch": 1580} {"train_loss": -5.944228172302246, "global_step": 66386, "epoch": 1580} {"train_loss": -6.029088020324707, "global_step": 66387, "epoch": 1580} {"train_loss": -5.912631988525391, "global_step": 66388, "epoch": 1580} {"train_loss": -5.891079902648926, "global_step": 66389, "epoch": 1580} {"train_loss": -5.981719970703125, "global_step": 66390, "epoch": 1580} {"train_loss": -5.882702827453613, "global_step": 66391, "epoch": 1580} {"train_loss": -5.83748722076416, "global_step": 66392, "epoch": 1580} {"train_loss": -5.922502517700195, "global_step": 66393, "epoch": 1580} {"train_loss": -5.807741165161133, "global_step": 66394, "epoch": 1580} {"train_loss": -6.088974475860596, "global_step": 66395, "epoch": 1580} {"train_loss": -5.897732734680176, "global_step": 66396, "epoch": 1580} {"train_loss": -5.86126708984375, "global_step": 66397, "epoch": 1580} {"train_loss": -5.857244968414307, "global_step": 66398, "epoch": 1580} {"train_loss": -5.972270965576172, "global_step": 66399, "epoch": 1580} {"train_loss": -5.868284225463867, "global_step": 66400, "epoch": 1580} {"train_loss": -5.947634004411244, "global_step": 66401, "epoch": 1580, "val_loss": 74837.734375} {"train_loss": -5.943922996520996, "global_step": 66402, "epoch": 1581} {"train_loss": -5.927678108215332, "global_step": 66403, "epoch": 1581} {"train_loss": -5.991957187652588, "global_step": 66404, "epoch": 1581} {"train_loss": -5.9892377853393555, "global_step": 66405, "epoch": 1581} {"train_loss": -5.911535263061523, "global_step": 66406, "epoch": 1581} {"train_loss": -5.833747386932373, "global_step": 66407, "epoch": 1581} {"train_loss": -5.937597274780273, "global_step": 66408, "epoch": 1581} {"train_loss": -5.986751556396484, "global_step": 66409, "epoch": 1581} {"train_loss": -5.918615818023682, "global_step": 66410, "epoch": 1581} {"train_loss": -5.9875288009643555, "global_step": 66411, "epoch": 1581} {"train_loss": -5.9726738929748535, "global_step": 66412, "epoch": 1581} {"train_loss": -5.874301910400391, "global_step": 66413, "epoch": 1581} {"train_loss": -5.947089195251465, "global_step": 66414, "epoch": 1581} {"train_loss": -5.898914813995361, "global_step": 66415, "epoch": 1581} {"train_loss": -5.973717212677002, "global_step": 66416, "epoch": 1581} {"train_loss": -5.997530937194824, "global_step": 66417, "epoch": 1581} {"train_loss": -6.072695732116699, "global_step": 66418, "epoch": 1581} {"train_loss": -6.076105117797852, "global_step": 66419, "epoch": 1581} {"train_loss": -5.978762149810791, "global_step": 66420, "epoch": 1581} {"train_loss": -6.0174970626831055, "global_step": 66421, "epoch": 1581} {"train_loss": -6.029540061950684, "global_step": 66422, "epoch": 1581} {"train_loss": -6.029695510864258, "global_step": 66423, "epoch": 1581} {"train_loss": -5.958052158355713, "global_step": 66424, "epoch": 1581} {"train_loss": -5.961504936218262, "global_step": 66425, "epoch": 1581} {"train_loss": -6.068725109100342, "global_step": 66426, "epoch": 1581} {"train_loss": -5.900626182556152, "global_step": 66427, "epoch": 1581} {"train_loss": -6.022225856781006, "global_step": 66428, "epoch": 1581} {"train_loss": -5.993043899536133, "global_step": 66429, "epoch": 1581} {"train_loss": -6.004319190979004, "global_step": 66430, "epoch": 1581} {"train_loss": -6.0070271492004395, "global_step": 66431, "epoch": 1581} {"train_loss": -5.890415668487549, "global_step": 66432, "epoch": 1581} {"train_loss": -5.968338966369629, "global_step": 66433, "epoch": 1581} {"train_loss": -5.83726167678833, "global_step": 66434, "epoch": 1581} {"train_loss": -5.96431827545166, "global_step": 66435, "epoch": 1581} {"train_loss": -5.947140693664551, "global_step": 66436, "epoch": 1581} {"train_loss": -5.961764335632324, "global_step": 66437, "epoch": 1581} {"train_loss": -6.0356221199035645, "global_step": 66438, "epoch": 1581} {"train_loss": -5.94558048248291, "global_step": 66439, "epoch": 1581} {"train_loss": -6.072550296783447, "global_step": 66440, "epoch": 1581} {"train_loss": -5.8923492431640625, "global_step": 66441, "epoch": 1581} {"train_loss": -5.972539901733398, "global_step": 66442, "epoch": 1581} {"train_loss": -5.967008159274147, "global_step": 66443, "epoch": 1581, "val_loss": 74307.453125} {"train_loss": -5.895725250244141, "global_step": 66444, "epoch": 1582} {"train_loss": -5.948783874511719, "global_step": 66445, "epoch": 1582} {"train_loss": -5.918248176574707, "global_step": 66446, "epoch": 1582} {"train_loss": -5.92042350769043, "global_step": 66447, "epoch": 1582} {"train_loss": -5.97761344909668, "global_step": 66448, "epoch": 1582} {"train_loss": -6.000365257263184, "global_step": 66449, "epoch": 1582} {"train_loss": -6.012134552001953, "global_step": 66450, "epoch": 1582} {"train_loss": -6.0147247314453125, "global_step": 66451, "epoch": 1582} {"train_loss": -6.011651515960693, "global_step": 66452, "epoch": 1582} {"train_loss": -5.9783124923706055, "global_step": 66453, "epoch": 1582} {"train_loss": -5.977994441986084, "global_step": 66454, "epoch": 1582} {"train_loss": -6.066367149353027, "global_step": 66455, "epoch": 1582} {"train_loss": -5.954458713531494, "global_step": 66456, "epoch": 1582} {"train_loss": -6.11873722076416, "global_step": 66457, "epoch": 1582} {"train_loss": -5.952149391174316, "global_step": 66458, "epoch": 1582} {"train_loss": -5.9588727951049805, "global_step": 66459, "epoch": 1582} {"train_loss": -6.135677814483643, "global_step": 66460, "epoch": 1582} {"train_loss": -6.044283866882324, "global_step": 66461, "epoch": 1582} {"train_loss": -6.080190658569336, "global_step": 66462, "epoch": 1582} {"train_loss": -5.984462261199951, "global_step": 66463, "epoch": 1582} {"train_loss": -5.876811504364014, "global_step": 66464, "epoch": 1582} {"train_loss": -6.008806228637695, "global_step": 66465, "epoch": 1582} {"train_loss": -6.105368137359619, "global_step": 66466, "epoch": 1582} {"train_loss": -6.043999671936035, "global_step": 66467, "epoch": 1582} {"train_loss": -5.93579626083374, "global_step": 66468, "epoch": 1582} {"train_loss": -5.970406532287598, "global_step": 66469, "epoch": 1582} {"train_loss": -5.938772678375244, "global_step": 66470, "epoch": 1582} {"train_loss": -5.815790176391602, "global_step": 66471, "epoch": 1582} {"train_loss": -6.077312469482422, "global_step": 66472, "epoch": 1582} {"train_loss": -6.001910209655762, "global_step": 66473, "epoch": 1582} {"train_loss": -5.913766860961914, "global_step": 66474, "epoch": 1582} {"train_loss": -5.949876308441162, "global_step": 66475, "epoch": 1582} {"train_loss": -5.8767409324646, "global_step": 66476, "epoch": 1582} {"train_loss": -5.913463592529297, "global_step": 66477, "epoch": 1582} {"train_loss": -6.010334014892578, "global_step": 66478, "epoch": 1582} {"train_loss": -6.014230251312256, "global_step": 66479, "epoch": 1582} {"train_loss": -5.951608657836914, "global_step": 66480, "epoch": 1582} {"train_loss": -6.090301513671875, "global_step": 66481, "epoch": 1582} {"train_loss": -5.9824700355529785, "global_step": 66482, "epoch": 1582} {"train_loss": -5.991522312164307, "global_step": 66483, "epoch": 1582} {"train_loss": -5.946369171142578, "global_step": 66484, "epoch": 1582} {"train_loss": -5.983719110488892, "global_step": 66485, "epoch": 1582, "val_loss": 74757.375} {"train_loss": -5.909249305725098, "global_step": 66486, "epoch": 1583} {"train_loss": -5.8029704093933105, "global_step": 66487, "epoch": 1583} {"train_loss": -6.07853889465332, "global_step": 66488, "epoch": 1583} {"train_loss": -5.8971991539001465, "global_step": 66489, "epoch": 1583} {"train_loss": -6.085080146789551, "global_step": 66490, "epoch": 1583} {"train_loss": -5.932594299316406, "global_step": 66491, "epoch": 1583} {"train_loss": -5.886087417602539, "global_step": 66492, "epoch": 1583} {"train_loss": -5.907161712646484, "global_step": 66493, "epoch": 1583} {"train_loss": -5.999266624450684, "global_step": 66494, "epoch": 1583} {"train_loss": -5.862677574157715, "global_step": 66495, "epoch": 1583} {"train_loss": -5.957581520080566, "global_step": 66496, "epoch": 1583} {"train_loss": -5.885741233825684, "global_step": 66497, "epoch": 1583} {"train_loss": -5.962451934814453, "global_step": 66498, "epoch": 1583} {"train_loss": -6.076601028442383, "global_step": 66499, "epoch": 1583} {"train_loss": -5.920773506164551, "global_step": 66500, "epoch": 1583} {"train_loss": -5.849466800689697, "global_step": 66501, "epoch": 1583} {"train_loss": -5.897655487060547, "global_step": 66502, "epoch": 1583} {"train_loss": -6.020173072814941, "global_step": 66503, "epoch": 1583} {"train_loss": -5.8653388023376465, "global_step": 66504, "epoch": 1583} {"train_loss": -5.86270809173584, "global_step": 66505, "epoch": 1583} {"train_loss": -5.947157859802246, "global_step": 66506, "epoch": 1583} {"train_loss": -5.9952850341796875, "global_step": 66507, "epoch": 1583} {"train_loss": -5.932662010192871, "global_step": 66508, "epoch": 1583} {"train_loss": -5.931676387786865, "global_step": 66509, "epoch": 1583} {"train_loss": -5.919631004333496, "global_step": 66510, "epoch": 1583} {"train_loss": -6.020105361938477, "global_step": 66511, "epoch": 1583} {"train_loss": -5.956988334655762, "global_step": 66512, "epoch": 1583} {"train_loss": -5.944640636444092, "global_step": 66513, "epoch": 1583} {"train_loss": -5.9594926834106445, "global_step": 66514, "epoch": 1583} {"train_loss": -6.048894882202148, "global_step": 66515, "epoch": 1583} {"train_loss": -5.981231689453125, "global_step": 66516, "epoch": 1583} {"train_loss": -6.013297080993652, "global_step": 66517, "epoch": 1583} {"train_loss": -5.925204277038574, "global_step": 66518, "epoch": 1583} {"train_loss": -5.854744911193848, "global_step": 66519, "epoch": 1583} {"train_loss": -5.9807891845703125, "global_step": 66520, "epoch": 1583} {"train_loss": -5.992463111877441, "global_step": 66521, "epoch": 1583} {"train_loss": -5.892069339752197, "global_step": 66522, "epoch": 1583} {"train_loss": -5.959768772125244, "global_step": 66523, "epoch": 1583} {"train_loss": -6.065496444702148, "global_step": 66524, "epoch": 1583} {"train_loss": -5.955875396728516, "global_step": 66525, "epoch": 1583} {"train_loss": -5.855640411376953, "global_step": 66526, "epoch": 1583} {"train_loss": -5.9492832365490145, "global_step": 66527, "epoch": 1583, "val_loss": 74402.2734375} {"train_loss": -6.067529678344727, "global_step": 66528, "epoch": 1584} {"train_loss": -6.067315578460693, "global_step": 66529, "epoch": 1584} {"train_loss": -6.075721740722656, "global_step": 66530, "epoch": 1584} {"train_loss": -5.874524116516113, "global_step": 66531, "epoch": 1584} {"train_loss": -6.173853874206543, "global_step": 66532, "epoch": 1584} {"train_loss": -5.867773056030273, "global_step": 66533, "epoch": 1584} {"train_loss": -5.986832618713379, "global_step": 66534, "epoch": 1584} {"train_loss": -6.038592338562012, "global_step": 66535, "epoch": 1584} {"train_loss": -6.004512786865234, "global_step": 66536, "epoch": 1584} {"train_loss": -5.903175354003906, "global_step": 66537, "epoch": 1584} {"train_loss": -5.9250593185424805, "global_step": 66538, "epoch": 1584} {"train_loss": -5.892732620239258, "global_step": 66539, "epoch": 1584} {"train_loss": -6.011693954467773, "global_step": 66540, "epoch": 1584} {"train_loss": -6.052034854888916, "global_step": 66541, "epoch": 1584} {"train_loss": -5.9545698165893555, "global_step": 66542, "epoch": 1584} {"train_loss": -6.048006534576416, "global_step": 66543, "epoch": 1584} {"train_loss": -5.958126544952393, "global_step": 66544, "epoch": 1584} {"train_loss": -6.011894226074219, "global_step": 66545, "epoch": 1584} {"train_loss": -5.969230651855469, "global_step": 66546, "epoch": 1584} {"train_loss": -5.934927940368652, "global_step": 66547, "epoch": 1584} {"train_loss": -5.990447998046875, "global_step": 66548, "epoch": 1584} {"train_loss": -5.827127933502197, "global_step": 66549, "epoch": 1584} {"train_loss": -5.8793511390686035, "global_step": 66550, "epoch": 1584} {"train_loss": -5.982378959655762, "global_step": 66551, "epoch": 1584} {"train_loss": -5.9276885986328125, "global_step": 66552, "epoch": 1584} {"train_loss": -5.921658039093018, "global_step": 66553, "epoch": 1584} {"train_loss": -6.123381614685059, "global_step": 66554, "epoch": 1584} {"train_loss": -5.909130573272705, "global_step": 66555, "epoch": 1584} {"train_loss": -5.965363502502441, "global_step": 66556, "epoch": 1584} {"train_loss": -6.047094345092773, "global_step": 66557, "epoch": 1584} {"train_loss": -5.910846710205078, "global_step": 66558, "epoch": 1584} {"train_loss": -6.097348213195801, "global_step": 66559, "epoch": 1584} {"train_loss": -6.016125679016113, "global_step": 66560, "epoch": 1584} {"train_loss": -5.905975818634033, "global_step": 66561, "epoch": 1584} {"train_loss": -6.044302463531494, "global_step": 66562, "epoch": 1584} {"train_loss": -5.996650218963623, "global_step": 66563, "epoch": 1584} {"train_loss": -5.854272842407227, "global_step": 66564, "epoch": 1584} {"train_loss": -5.914021015167236, "global_step": 66565, "epoch": 1584} {"train_loss": -5.983367443084717, "global_step": 66566, "epoch": 1584} {"train_loss": -5.954991817474365, "global_step": 66567, "epoch": 1584} {"train_loss": -6.073452949523926, "global_step": 66568, "epoch": 1584} {"train_loss": -5.980525527681623, "global_step": 66569, "epoch": 1584, "val_loss": 74995.921875} {"train_loss": -5.876673698425293, "global_step": 66570, "epoch": 1585} {"train_loss": -5.954007625579834, "global_step": 66571, "epoch": 1585} {"train_loss": -5.926312446594238, "global_step": 66572, "epoch": 1585} {"train_loss": -5.962071418762207, "global_step": 66573, "epoch": 1585} {"train_loss": -5.967965602874756, "global_step": 66574, "epoch": 1585} {"train_loss": -5.868889808654785, "global_step": 66575, "epoch": 1585} {"train_loss": -5.856762409210205, "global_step": 66576, "epoch": 1585} {"train_loss": -6.033221244812012, "global_step": 66577, "epoch": 1585} {"train_loss": -5.983418941497803, "global_step": 66578, "epoch": 1585} {"train_loss": -6.047613143920898, "global_step": 66579, "epoch": 1585} {"train_loss": -6.036581039428711, "global_step": 66580, "epoch": 1585} {"train_loss": -6.0046610832214355, "global_step": 66581, "epoch": 1585} {"train_loss": -6.0505595207214355, "global_step": 66582, "epoch": 1585} {"train_loss": -6.014998912811279, "global_step": 66583, "epoch": 1585} {"train_loss": -6.088135719299316, "global_step": 66584, "epoch": 1585} {"train_loss": -5.963233470916748, "global_step": 66585, "epoch": 1585} {"train_loss": -6.028338432312012, "global_step": 66586, "epoch": 1585} {"train_loss": -6.027315139770508, "global_step": 66587, "epoch": 1585} {"train_loss": -5.984810829162598, "global_step": 66588, "epoch": 1585} {"train_loss": -5.831566333770752, "global_step": 66589, "epoch": 1585} {"train_loss": -6.00904655456543, "global_step": 66590, "epoch": 1585} {"train_loss": -5.843029022216797, "global_step": 66591, "epoch": 1585} {"train_loss": -5.905442237854004, "global_step": 66592, "epoch": 1585} {"train_loss": -5.841370582580566, "global_step": 66593, "epoch": 1585} {"train_loss": -6.080665111541748, "global_step": 66594, "epoch": 1585} {"train_loss": -6.022062301635742, "global_step": 66595, "epoch": 1585} {"train_loss": -5.880986213684082, "global_step": 66596, "epoch": 1585} {"train_loss": -6.0402727127075195, "global_step": 66597, "epoch": 1585} {"train_loss": -5.942959785461426, "global_step": 66598, "epoch": 1585} {"train_loss": -5.98512077331543, "global_step": 66599, "epoch": 1585} {"train_loss": -5.976980209350586, "global_step": 66600, "epoch": 1585} {"train_loss": -6.221624374389648, "global_step": 66601, "epoch": 1585} {"train_loss": -5.95534610748291, "global_step": 66602, "epoch": 1585} {"train_loss": -5.961543560028076, "global_step": 66603, "epoch": 1585} {"train_loss": -5.963362216949463, "global_step": 66604, "epoch": 1585} {"train_loss": -5.977724075317383, "global_step": 66605, "epoch": 1585} {"train_loss": -5.99711799621582, "global_step": 66606, "epoch": 1585} {"train_loss": -6.042949199676514, "global_step": 66607, "epoch": 1585} {"train_loss": -6.038265228271484, "global_step": 66608, "epoch": 1585} {"train_loss": -5.962180137634277, "global_step": 66609, "epoch": 1585} {"train_loss": -5.960427761077881, "global_step": 66610, "epoch": 1585} {"train_loss": -5.974685214814686, "global_step": 66611, "epoch": 1585, "val_loss": 74692.2265625} {"train_loss": -5.964565753936768, "global_step": 66612, "epoch": 1586} {"train_loss": -5.954459190368652, "global_step": 66613, "epoch": 1586} {"train_loss": -5.937912940979004, "global_step": 66614, "epoch": 1586} {"train_loss": -5.897917747497559, "global_step": 66615, "epoch": 1586} {"train_loss": -6.022480010986328, "global_step": 66616, "epoch": 1586} {"train_loss": -5.99989128112793, "global_step": 66617, "epoch": 1586} {"train_loss": -6.090497016906738, "global_step": 66618, "epoch": 1586} {"train_loss": -5.920042991638184, "global_step": 66619, "epoch": 1586} {"train_loss": -6.025241851806641, "global_step": 66620, "epoch": 1586} {"train_loss": -6.050292491912842, "global_step": 66621, "epoch": 1586} {"train_loss": -5.976899147033691, "global_step": 66622, "epoch": 1586} {"train_loss": -5.984005928039551, "global_step": 66623, "epoch": 1586} {"train_loss": -6.075801849365234, "global_step": 66624, "epoch": 1586} {"train_loss": -6.039244651794434, "global_step": 66625, "epoch": 1586} {"train_loss": -6.0255255699157715, "global_step": 66626, "epoch": 1586} {"train_loss": -5.965555667877197, "global_step": 66627, "epoch": 1586} {"train_loss": -5.941972732543945, "global_step": 66628, "epoch": 1586} {"train_loss": -5.9321112632751465, "global_step": 66629, "epoch": 1586} {"train_loss": -6.033031463623047, "global_step": 66630, "epoch": 1586} {"train_loss": -5.959278583526611, "global_step": 66631, "epoch": 1586} {"train_loss": -5.958148956298828, "global_step": 66632, "epoch": 1586} {"train_loss": -5.8474626541137695, "global_step": 66633, "epoch": 1586} {"train_loss": -6.064526557922363, "global_step": 66634, "epoch": 1586} {"train_loss": -5.907992362976074, "global_step": 66635, "epoch": 1586} {"train_loss": -5.920924186706543, "global_step": 66636, "epoch": 1586} {"train_loss": -6.036441802978516, "global_step": 66637, "epoch": 1586} {"train_loss": -5.940847396850586, "global_step": 66638, "epoch": 1586} {"train_loss": -6.031569004058838, "global_step": 66639, "epoch": 1586} {"train_loss": -6.049905776977539, "global_step": 66640, "epoch": 1586} {"train_loss": -5.955374717712402, "global_step": 66641, "epoch": 1586} {"train_loss": -5.988709926605225, "global_step": 66642, "epoch": 1586} {"train_loss": -6.069097518920898, "global_step": 66643, "epoch": 1586} {"train_loss": -6.03135871887207, "global_step": 66644, "epoch": 1586} {"train_loss": -5.990843772888184, "global_step": 66645, "epoch": 1586} {"train_loss": -5.963839530944824, "global_step": 66646, "epoch": 1586} {"train_loss": -5.921027183532715, "global_step": 66647, "epoch": 1586} {"train_loss": -5.902325630187988, "global_step": 66648, "epoch": 1586} {"train_loss": -5.988773822784424, "global_step": 66649, "epoch": 1586} {"train_loss": -5.983706474304199, "global_step": 66650, "epoch": 1586} {"train_loss": -5.923730850219727, "global_step": 66651, "epoch": 1586} {"train_loss": -5.951560974121094, "global_step": 66652, "epoch": 1586} {"train_loss": -5.984297718320574, "global_step": 66653, "epoch": 1586, "val_loss": 74523.859375} {"train_loss": -5.901952266693115, "global_step": 66654, "epoch": 1587} {"train_loss": -5.994098663330078, "global_step": 66655, "epoch": 1587} {"train_loss": -5.958730697631836, "global_step": 66656, "epoch": 1587} {"train_loss": -6.096194267272949, "global_step": 66657, "epoch": 1587} {"train_loss": -6.122598648071289, "global_step": 66658, "epoch": 1587} {"train_loss": -6.006011486053467, "global_step": 66659, "epoch": 1587} {"train_loss": -5.954586029052734, "global_step": 66660, "epoch": 1587} {"train_loss": -6.018588066101074, "global_step": 66661, "epoch": 1587} {"train_loss": -6.005860328674316, "global_step": 66662, "epoch": 1587} {"train_loss": -6.060145378112793, "global_step": 66663, "epoch": 1587} {"train_loss": -5.978262424468994, "global_step": 66664, "epoch": 1587} {"train_loss": -6.070591926574707, "global_step": 66665, "epoch": 1587} {"train_loss": -6.040042877197266, "global_step": 66666, "epoch": 1587} {"train_loss": -6.054833889007568, "global_step": 66667, "epoch": 1587} {"train_loss": -5.81994104385376, "global_step": 66668, "epoch": 1587} {"train_loss": -5.867096424102783, "global_step": 66669, "epoch": 1587} {"train_loss": -6.000481605529785, "global_step": 66670, "epoch": 1587} {"train_loss": -5.908995628356934, "global_step": 66671, "epoch": 1587} {"train_loss": -5.973166465759277, "global_step": 66672, "epoch": 1587} {"train_loss": -5.990477561950684, "global_step": 66673, "epoch": 1587} {"train_loss": -5.9934468269348145, "global_step": 66674, "epoch": 1587} {"train_loss": -5.94497013092041, "global_step": 66675, "epoch": 1587} {"train_loss": -5.945211410522461, "global_step": 66676, "epoch": 1587} {"train_loss": -6.044907093048096, "global_step": 66677, "epoch": 1587} {"train_loss": -5.942336082458496, "global_step": 66678, "epoch": 1587} {"train_loss": -6.012739181518555, "global_step": 66679, "epoch": 1587} {"train_loss": -6.035584449768066, "global_step": 66680, "epoch": 1587} {"train_loss": -5.938408851623535, "global_step": 66681, "epoch": 1587} {"train_loss": -5.8242387771606445, "global_step": 66682, "epoch": 1587} {"train_loss": -6.0262298583984375, "global_step": 66683, "epoch": 1587} {"train_loss": -5.818817138671875, "global_step": 66684, "epoch": 1587} {"train_loss": -6.098030090332031, "global_step": 66685, "epoch": 1587} {"train_loss": -5.732677459716797, "global_step": 66686, "epoch": 1587} {"train_loss": -5.879772663116455, "global_step": 66687, "epoch": 1587} {"train_loss": -5.953197479248047, "global_step": 66688, "epoch": 1587} {"train_loss": -5.813158988952637, "global_step": 66689, "epoch": 1587} {"train_loss": -5.872613906860352, "global_step": 66690, "epoch": 1587} {"train_loss": -5.946783065795898, "global_step": 66691, "epoch": 1587} {"train_loss": -5.8366804122924805, "global_step": 66692, "epoch": 1587} {"train_loss": -5.927387237548828, "global_step": 66693, "epoch": 1587} {"train_loss": -5.999859809875488, "global_step": 66694, "epoch": 1587} {"train_loss": -5.9583690620604015, "global_step": 66695, "epoch": 1587, "val_loss": 74616.0078125} {"train_loss": -5.9896626472473145, "global_step": 66696, "epoch": 1588} {"train_loss": -5.921918869018555, "global_step": 66697, "epoch": 1588} {"train_loss": -5.953349590301514, "global_step": 66698, "epoch": 1588} {"train_loss": -6.013260364532471, "global_step": 66699, "epoch": 1588} {"train_loss": -5.952288627624512, "global_step": 66700, "epoch": 1588} {"train_loss": -5.906257152557373, "global_step": 66701, "epoch": 1588} {"train_loss": -5.935494422912598, "global_step": 66702, "epoch": 1588} {"train_loss": -6.089548110961914, "global_step": 66703, "epoch": 1588} {"train_loss": -6.014944553375244, "global_step": 66704, "epoch": 1588} {"train_loss": -5.959549427032471, "global_step": 66705, "epoch": 1588} {"train_loss": -5.806251049041748, "global_step": 66706, "epoch": 1588} {"train_loss": -5.838141441345215, "global_step": 66707, "epoch": 1588} {"train_loss": -5.935703754425049, "global_step": 66708, "epoch": 1588} {"train_loss": -5.877876281738281, "global_step": 66709, "epoch": 1588} {"train_loss": -5.913107872009277, "global_step": 66710, "epoch": 1588} {"train_loss": -5.859604835510254, "global_step": 66711, "epoch": 1588} {"train_loss": -5.934078216552734, "global_step": 66712, "epoch": 1588} {"train_loss": -5.988503456115723, "global_step": 66713, "epoch": 1588} {"train_loss": -5.798608779907227, "global_step": 66714, "epoch": 1588} {"train_loss": -6.0908894538879395, "global_step": 66715, "epoch": 1588} {"train_loss": -6.038993835449219, "global_step": 66716, "epoch": 1588} {"train_loss": -6.116721153259277, "global_step": 66717, "epoch": 1588} {"train_loss": -5.998641490936279, "global_step": 66718, "epoch": 1588} {"train_loss": -6.03286075592041, "global_step": 66719, "epoch": 1588} {"train_loss": -5.967972278594971, "global_step": 66720, "epoch": 1588} {"train_loss": -5.9809675216674805, "global_step": 66721, "epoch": 1588} {"train_loss": -6.05609130859375, "global_step": 66722, "epoch": 1588} {"train_loss": -5.927678108215332, "global_step": 66723, "epoch": 1588} {"train_loss": -6.0192790031433105, "global_step": 66724, "epoch": 1588} {"train_loss": -6.005162715911865, "global_step": 66725, "epoch": 1588} {"train_loss": -6.0739545822143555, "global_step": 66726, "epoch": 1588} {"train_loss": -6.013322830200195, "global_step": 66727, "epoch": 1588} {"train_loss": -6.084089279174805, "global_step": 66728, "epoch": 1588} {"train_loss": -6.060655117034912, "global_step": 66729, "epoch": 1588} {"train_loss": -6.001545429229736, "global_step": 66730, "epoch": 1588} {"train_loss": -5.859323501586914, "global_step": 66731, "epoch": 1588} {"train_loss": -5.940797805786133, "global_step": 66732, "epoch": 1588} {"train_loss": -6.098348617553711, "global_step": 66733, "epoch": 1588} {"train_loss": -5.998037338256836, "global_step": 66734, "epoch": 1588} {"train_loss": -5.970484256744385, "global_step": 66735, "epoch": 1588} {"train_loss": -6.0318450927734375, "global_step": 66736, "epoch": 1588} {"train_loss": -5.976986680712018, "global_step": 66737, "epoch": 1588, "val_loss": 74642.78125} {"train_loss": -6.027099609375, "global_step": 66738, "epoch": 1589} {"train_loss": -5.951504707336426, "global_step": 66739, "epoch": 1589} {"train_loss": -5.956679344177246, "global_step": 66740, "epoch": 1589} {"train_loss": -5.8468427658081055, "global_step": 66741, "epoch": 1589} {"train_loss": -5.9005126953125, "global_step": 66742, "epoch": 1589} {"train_loss": -6.08303689956665, "global_step": 66743, "epoch": 1589} {"train_loss": -5.996969223022461, "global_step": 66744, "epoch": 1589} {"train_loss": -5.962514400482178, "global_step": 66745, "epoch": 1589} {"train_loss": -6.022266387939453, "global_step": 66746, "epoch": 1589} {"train_loss": -5.989465713500977, "global_step": 66747, "epoch": 1589} {"train_loss": -5.978938579559326, "global_step": 66748, "epoch": 1589} {"train_loss": -6.046346664428711, "global_step": 66749, "epoch": 1589} {"train_loss": -5.923859596252441, "global_step": 66750, "epoch": 1589} {"train_loss": -6.060711860656738, "global_step": 66751, "epoch": 1589} {"train_loss": -5.941786766052246, "global_step": 66752, "epoch": 1589} {"train_loss": -5.848935127258301, "global_step": 66753, "epoch": 1589} {"train_loss": -5.975668907165527, "global_step": 66754, "epoch": 1589} {"train_loss": -5.932196140289307, "global_step": 66755, "epoch": 1589} {"train_loss": -5.78324031829834, "global_step": 66756, "epoch": 1589} {"train_loss": -5.959395408630371, "global_step": 66757, "epoch": 1589} {"train_loss": -5.964320182800293, "global_step": 66758, "epoch": 1589} {"train_loss": -5.908993721008301, "global_step": 66759, "epoch": 1589} {"train_loss": -5.912405014038086, "global_step": 66760, "epoch": 1589} {"train_loss": -6.034661293029785, "global_step": 66761, "epoch": 1589} {"train_loss": -5.851169109344482, "global_step": 66762, "epoch": 1589} {"train_loss": -5.916836738586426, "global_step": 66763, "epoch": 1589} {"train_loss": -5.985725402832031, "global_step": 66764, "epoch": 1589} {"train_loss": -6.019678115844727, "global_step": 66765, "epoch": 1589} {"train_loss": -5.981281280517578, "global_step": 66766, "epoch": 1589} {"train_loss": -6.00882625579834, "global_step": 66767, "epoch": 1589} {"train_loss": -6.052474021911621, "global_step": 66768, "epoch": 1589} {"train_loss": -5.956606864929199, "global_step": 66769, "epoch": 1589} {"train_loss": -5.981322765350342, "global_step": 66770, "epoch": 1589} {"train_loss": -5.970311164855957, "global_step": 66771, "epoch": 1589} {"train_loss": -6.06937313079834, "global_step": 66772, "epoch": 1589} {"train_loss": -6.055605888366699, "global_step": 66773, "epoch": 1589} {"train_loss": -5.882599353790283, "global_step": 66774, "epoch": 1589} {"train_loss": -5.980681896209717, "global_step": 66775, "epoch": 1589} {"train_loss": -6.043368339538574, "global_step": 66776, "epoch": 1589} {"train_loss": -5.959722995758057, "global_step": 66777, "epoch": 1589} {"train_loss": -6.104097366333008, "global_step": 66778, "epoch": 1589} {"train_loss": -5.969237656820388, "global_step": 66779, "epoch": 1589, "val_loss": 74777.8515625} {"train_loss": -6.097870826721191, "global_step": 66780, "epoch": 1590} {"train_loss": -6.02905797958374, "global_step": 66781, "epoch": 1590} {"train_loss": -6.015019416809082, "global_step": 66782, "epoch": 1590} {"train_loss": -5.97550106048584, "global_step": 66783, "epoch": 1590} {"train_loss": -5.892380714416504, "global_step": 66784, "epoch": 1590} {"train_loss": -6.0153608322143555, "global_step": 66785, "epoch": 1590} {"train_loss": -5.978343963623047, "global_step": 66786, "epoch": 1590} {"train_loss": -5.989920616149902, "global_step": 66787, "epoch": 1590} {"train_loss": -6.071038246154785, "global_step": 66788, "epoch": 1590} {"train_loss": -5.934811115264893, "global_step": 66789, "epoch": 1590} {"train_loss": -5.927326202392578, "global_step": 66790, "epoch": 1590} {"train_loss": -5.98745584487915, "global_step": 66791, "epoch": 1590} {"train_loss": -5.986323356628418, "global_step": 66792, "epoch": 1590} {"train_loss": -5.939605236053467, "global_step": 66793, "epoch": 1590} {"train_loss": -5.931187629699707, "global_step": 66794, "epoch": 1590} {"train_loss": -5.994266986846924, "global_step": 66795, "epoch": 1590} {"train_loss": -5.980019569396973, "global_step": 66796, "epoch": 1590} {"train_loss": -5.960428714752197, "global_step": 66797, "epoch": 1590} {"train_loss": -5.923212051391602, "global_step": 66798, "epoch": 1590} {"train_loss": -5.949259281158447, "global_step": 66799, "epoch": 1590} {"train_loss": -5.932407379150391, "global_step": 66800, "epoch": 1590} {"train_loss": -6.147934913635254, "global_step": 66801, "epoch": 1590} {"train_loss": -5.90287971496582, "global_step": 66802, "epoch": 1590} {"train_loss": -5.995831489562988, "global_step": 66803, "epoch": 1590} {"train_loss": -5.990572452545166, "global_step": 66804, "epoch": 1590} {"train_loss": -5.943630695343018, "global_step": 66805, "epoch": 1590} {"train_loss": -6.002902030944824, "global_step": 66806, "epoch": 1590} {"train_loss": -5.948545455932617, "global_step": 66807, "epoch": 1590} {"train_loss": -5.971632957458496, "global_step": 66808, "epoch": 1590} {"train_loss": -5.833342552185059, "global_step": 66809, "epoch": 1590} {"train_loss": -5.997100830078125, "global_step": 66810, "epoch": 1590} {"train_loss": -6.071722984313965, "global_step": 66811, "epoch": 1590} {"train_loss": -6.033733367919922, "global_step": 66812, "epoch": 1590} {"train_loss": -5.9139628410339355, "global_step": 66813, "epoch": 1590} {"train_loss": -5.991402626037598, "global_step": 66814, "epoch": 1590} {"train_loss": -6.072431564331055, "global_step": 66815, "epoch": 1590} {"train_loss": -6.0301008224487305, "global_step": 66816, "epoch": 1590} {"train_loss": -6.004765510559082, "global_step": 66817, "epoch": 1590} {"train_loss": -6.13896369934082, "global_step": 66818, "epoch": 1590} {"train_loss": -6.013617515563965, "global_step": 66819, "epoch": 1590} {"train_loss": -5.955979347229004, "global_step": 66820, "epoch": 1590} {"train_loss": -5.988625549134754, "global_step": 66821, "epoch": 1590, "val_loss": 74637.2421875} {"train_loss": -6.053218364715576, "global_step": 66822, "epoch": 1591} {"train_loss": -6.107598304748535, "global_step": 66823, "epoch": 1591} {"train_loss": -6.080547332763672, "global_step": 66824, "epoch": 1591} {"train_loss": -5.966698169708252, "global_step": 66825, "epoch": 1591} {"train_loss": -6.09904670715332, "global_step": 66826, "epoch": 1591} {"train_loss": -5.980848789215088, "global_step": 66827, "epoch": 1591} {"train_loss": -5.956657409667969, "global_step": 66828, "epoch": 1591} {"train_loss": -6.028190612792969, "global_step": 66829, "epoch": 1591} {"train_loss": -5.941986083984375, "global_step": 66830, "epoch": 1591} {"train_loss": -6.009507179260254, "global_step": 66831, "epoch": 1591} {"train_loss": -6.055798530578613, "global_step": 66832, "epoch": 1591} {"train_loss": -5.871700286865234, "global_step": 66833, "epoch": 1591} {"train_loss": -5.8564772605896, "global_step": 66834, "epoch": 1591} {"train_loss": -5.9151482582092285, "global_step": 66835, "epoch": 1591} {"train_loss": -5.865198135375977, "global_step": 66836, "epoch": 1591} {"train_loss": -5.868621826171875, "global_step": 66837, "epoch": 1591} {"train_loss": -5.85033655166626, "global_step": 66838, "epoch": 1591} {"train_loss": -5.896451950073242, "global_step": 66839, "epoch": 1591} {"train_loss": -5.899320125579834, "global_step": 66840, "epoch": 1591} {"train_loss": -6.066041469573975, "global_step": 66841, "epoch": 1591} {"train_loss": -6.105940341949463, "global_step": 66842, "epoch": 1591} {"train_loss": -5.923189163208008, "global_step": 66843, "epoch": 1591} {"train_loss": -6.003411293029785, "global_step": 66844, "epoch": 1591} {"train_loss": -5.9464216232299805, "global_step": 66845, "epoch": 1591} {"train_loss": -5.853747367858887, "global_step": 66846, "epoch": 1591} {"train_loss": -5.96558952331543, "global_step": 66847, "epoch": 1591} {"train_loss": -6.008251190185547, "global_step": 66848, "epoch": 1591} {"train_loss": -5.897946834564209, "global_step": 66849, "epoch": 1591} {"train_loss": -5.944549560546875, "global_step": 66850, "epoch": 1591} {"train_loss": -5.975474834442139, "global_step": 66851, "epoch": 1591} {"train_loss": -5.979426860809326, "global_step": 66852, "epoch": 1591} {"train_loss": -6.033888816833496, "global_step": 66853, "epoch": 1591} {"train_loss": -5.988828659057617, "global_step": 66854, "epoch": 1591} {"train_loss": -5.956611156463623, "global_step": 66855, "epoch": 1591} {"train_loss": -6.0660176277160645, "global_step": 66856, "epoch": 1591} {"train_loss": -6.019692420959473, "global_step": 66857, "epoch": 1591} {"train_loss": -6.014355182647705, "global_step": 66858, "epoch": 1591} {"train_loss": -6.0294880867004395, "global_step": 66859, "epoch": 1591} {"train_loss": -6.120648384094238, "global_step": 66860, "epoch": 1591} {"train_loss": -5.956667900085449, "global_step": 66861, "epoch": 1591} {"train_loss": -6.040833950042725, "global_step": 66862, "epoch": 1591} {"train_loss": -5.979335308074951, "global_step": 66863, "epoch": 1591, "val_loss": 74426.46875} {"train_loss": -5.959406852722168, "global_step": 66864, "epoch": 1592} {"train_loss": -5.938946723937988, "global_step": 66865, "epoch": 1592} {"train_loss": -5.8833746910095215, "global_step": 66866, "epoch": 1592} {"train_loss": -5.891110897064209, "global_step": 66867, "epoch": 1592} {"train_loss": -6.038387775421143, "global_step": 66868, "epoch": 1592} {"train_loss": -5.972956657409668, "global_step": 66869, "epoch": 1592} {"train_loss": -5.87427282333374, "global_step": 66870, "epoch": 1592} {"train_loss": -6.016432285308838, "global_step": 66871, "epoch": 1592} {"train_loss": -5.8905863761901855, "global_step": 66872, "epoch": 1592} {"train_loss": -5.983755111694336, "global_step": 66873, "epoch": 1592} {"train_loss": -6.035578727722168, "global_step": 66874, "epoch": 1592} {"train_loss": -6.049088001251221, "global_step": 66875, "epoch": 1592} {"train_loss": -5.9630584716796875, "global_step": 66876, "epoch": 1592} {"train_loss": -6.012168884277344, "global_step": 66877, "epoch": 1592} {"train_loss": -5.9741530418396, "global_step": 66878, "epoch": 1592} {"train_loss": -5.943653583526611, "global_step": 66879, "epoch": 1592} {"train_loss": -5.867985725402832, "global_step": 66880, "epoch": 1592} {"train_loss": -6.031313896179199, "global_step": 66881, "epoch": 1592} {"train_loss": -5.919203758239746, "global_step": 66882, "epoch": 1592} {"train_loss": -5.958269119262695, "global_step": 66883, "epoch": 1592} {"train_loss": -5.915412425994873, "global_step": 66884, "epoch": 1592} {"train_loss": -5.863739490509033, "global_step": 66885, "epoch": 1592} {"train_loss": -5.813770294189453, "global_step": 66886, "epoch": 1592} {"train_loss": -5.97629451751709, "global_step": 66887, "epoch": 1592} {"train_loss": -5.879920482635498, "global_step": 66888, "epoch": 1592} {"train_loss": -5.870823860168457, "global_step": 66889, "epoch": 1592} {"train_loss": -6.052798748016357, "global_step": 66890, "epoch": 1592} {"train_loss": -5.889895439147949, "global_step": 66891, "epoch": 1592} {"train_loss": -5.922967433929443, "global_step": 66892, "epoch": 1592} {"train_loss": -6.016607284545898, "global_step": 66893, "epoch": 1592} {"train_loss": -5.774893760681152, "global_step": 66894, "epoch": 1592} {"train_loss": -6.008359909057617, "global_step": 66895, "epoch": 1592} {"train_loss": -5.895249843597412, "global_step": 66896, "epoch": 1592} {"train_loss": -6.021792411804199, "global_step": 66897, "epoch": 1592} {"train_loss": -5.976639747619629, "global_step": 66898, "epoch": 1592} {"train_loss": -5.892848968505859, "global_step": 66899, "epoch": 1592} {"train_loss": -6.059557914733887, "global_step": 66900, "epoch": 1592} {"train_loss": -5.877389907836914, "global_step": 66901, "epoch": 1592} {"train_loss": -5.919351100921631, "global_step": 66902, "epoch": 1592} {"train_loss": -5.98110294342041, "global_step": 66903, "epoch": 1592} {"train_loss": -5.867422580718994, "global_step": 66904, "epoch": 1592} {"train_loss": -5.9439373924618675, "global_step": 66905, "epoch": 1592, "val_loss": 74906.53125} {"train_loss": -5.831521987915039, "global_step": 66906, "epoch": 1593} {"train_loss": -6.011707782745361, "global_step": 66907, "epoch": 1593} {"train_loss": -5.826596260070801, "global_step": 66908, "epoch": 1593} {"train_loss": -5.900289535522461, "global_step": 66909, "epoch": 1593} {"train_loss": -5.851845741271973, "global_step": 66910, "epoch": 1593} {"train_loss": -6.004080772399902, "global_step": 66911, "epoch": 1593} {"train_loss": -5.97963285446167, "global_step": 66912, "epoch": 1593} {"train_loss": -5.9953932762146, "global_step": 66913, "epoch": 1593} {"train_loss": -5.999113082885742, "global_step": 66914, "epoch": 1593} {"train_loss": -5.9444708824157715, "global_step": 66915, "epoch": 1593} {"train_loss": -6.065860271453857, "global_step": 66916, "epoch": 1593} {"train_loss": -5.939035415649414, "global_step": 66917, "epoch": 1593} {"train_loss": -6.0722198486328125, "global_step": 66918, "epoch": 1593} {"train_loss": -6.0259809494018555, "global_step": 66919, "epoch": 1593} {"train_loss": -6.074237823486328, "global_step": 66920, "epoch": 1593} {"train_loss": -6.002806663513184, "global_step": 66921, "epoch": 1593} {"train_loss": -5.939988136291504, "global_step": 66922, "epoch": 1593} {"train_loss": -6.014970302581787, "global_step": 66923, "epoch": 1593} {"train_loss": -6.06914758682251, "global_step": 66924, "epoch": 1593} {"train_loss": -6.029029369354248, "global_step": 66925, "epoch": 1593} {"train_loss": -6.042497634887695, "global_step": 66926, "epoch": 1593} {"train_loss": -6.032925128936768, "global_step": 66927, "epoch": 1593} {"train_loss": -6.0919904708862305, "global_step": 66928, "epoch": 1593} {"train_loss": -5.944081783294678, "global_step": 66929, "epoch": 1593} {"train_loss": -6.133825302124023, "global_step": 66930, "epoch": 1593} {"train_loss": -5.860550403594971, "global_step": 66931, "epoch": 1593} {"train_loss": -5.908200263977051, "global_step": 66932, "epoch": 1593} {"train_loss": -5.987053871154785, "global_step": 66933, "epoch": 1593} {"train_loss": -6.1218767166137695, "global_step": 66934, "epoch": 1593} {"train_loss": -5.903209209442139, "global_step": 66935, "epoch": 1593} {"train_loss": -6.080047607421875, "global_step": 66936, "epoch": 1593} {"train_loss": -6.049901008605957, "global_step": 66937, "epoch": 1593} {"train_loss": -5.972273826599121, "global_step": 66938, "epoch": 1593} {"train_loss": -5.958644390106201, "global_step": 66939, "epoch": 1593} {"train_loss": -6.013239860534668, "global_step": 66940, "epoch": 1593} {"train_loss": -6.018389701843262, "global_step": 66941, "epoch": 1593} {"train_loss": -5.913163185119629, "global_step": 66942, "epoch": 1593} {"train_loss": -5.836587905883789, "global_step": 66943, "epoch": 1593} {"train_loss": -5.8255767822265625, "global_step": 66944, "epoch": 1593} {"train_loss": -6.073444366455078, "global_step": 66945, "epoch": 1593} {"train_loss": -5.9440789222717285, "global_step": 66946, "epoch": 1593} {"train_loss": -5.983636980965024, "global_step": 66947, "epoch": 1593, "val_loss": 74646.3515625} {"train_loss": -6.067897796630859, "global_step": 66948, "epoch": 1594} {"train_loss": -5.930180549621582, "global_step": 66949, "epoch": 1594} {"train_loss": -6.022927284240723, "global_step": 66950, "epoch": 1594} {"train_loss": -6.049554347991943, "global_step": 66951, "epoch": 1594} {"train_loss": -6.080876350402832, "global_step": 66952, "epoch": 1594} {"train_loss": -5.8645172119140625, "global_step": 66953, "epoch": 1594} {"train_loss": -5.914135932922363, "global_step": 66954, "epoch": 1594} {"train_loss": -6.12993049621582, "global_step": 66955, "epoch": 1594} {"train_loss": -5.930158615112305, "global_step": 66956, "epoch": 1594} {"train_loss": -5.881767272949219, "global_step": 66957, "epoch": 1594} {"train_loss": -6.034090042114258, "global_step": 66958, "epoch": 1594} {"train_loss": -5.961857318878174, "global_step": 66959, "epoch": 1594} {"train_loss": -5.9259233474731445, "global_step": 66960, "epoch": 1594} {"train_loss": -5.807754039764404, "global_step": 66961, "epoch": 1594} {"train_loss": -6.053475856781006, "global_step": 66962, "epoch": 1594} {"train_loss": -6.106075286865234, "global_step": 66963, "epoch": 1594} {"train_loss": -6.056398391723633, "global_step": 66964, "epoch": 1594} {"train_loss": -5.903690814971924, "global_step": 66965, "epoch": 1594} {"train_loss": -6.010365009307861, "global_step": 66966, "epoch": 1594} {"train_loss": -5.851073741912842, "global_step": 66967, "epoch": 1594} {"train_loss": -6.118474960327148, "global_step": 66968, "epoch": 1594} {"train_loss": -5.886037826538086, "global_step": 66969, "epoch": 1594} {"train_loss": -5.942808151245117, "global_step": 66970, "epoch": 1594} {"train_loss": -5.927953720092773, "global_step": 66971, "epoch": 1594} {"train_loss": -5.855564117431641, "global_step": 66972, "epoch": 1594} {"train_loss": -6.010318279266357, "global_step": 66973, "epoch": 1594} {"train_loss": -5.892874717712402, "global_step": 66974, "epoch": 1594} {"train_loss": -6.1046905517578125, "global_step": 66975, "epoch": 1594} {"train_loss": -5.896095275878906, "global_step": 66976, "epoch": 1594} {"train_loss": -5.768935203552246, "global_step": 66977, "epoch": 1594} {"train_loss": -5.961511611938477, "global_step": 66978, "epoch": 1594} {"train_loss": -5.822175979614258, "global_step": 66979, "epoch": 1594} {"train_loss": -5.9657769203186035, "global_step": 66980, "epoch": 1594} {"train_loss": -5.900241851806641, "global_step": 66981, "epoch": 1594} {"train_loss": -6.034364700317383, "global_step": 66982, "epoch": 1594} {"train_loss": -5.941810131072998, "global_step": 66983, "epoch": 1594} {"train_loss": -5.984704971313477, "global_step": 66984, "epoch": 1594} {"train_loss": -6.014011859893799, "global_step": 66985, "epoch": 1594} {"train_loss": -5.992918014526367, "global_step": 66986, "epoch": 1594} {"train_loss": -6.046335220336914, "global_step": 66987, "epoch": 1594} {"train_loss": -5.868641376495361, "global_step": 66988, "epoch": 1594} {"train_loss": -5.961997804187593, "global_step": 66989, "epoch": 1594, "val_loss": 74464.4609375} {"train_loss": -5.940629959106445, "global_step": 66990, "epoch": 1595} {"train_loss": -5.908111572265625, "global_step": 66991, "epoch": 1595} {"train_loss": -6.016234874725342, "global_step": 66992, "epoch": 1595} {"train_loss": -6.090615272521973, "global_step": 66993, "epoch": 1595} {"train_loss": -5.896820068359375, "global_step": 66994, "epoch": 1595} {"train_loss": -5.992762565612793, "global_step": 66995, "epoch": 1595} {"train_loss": -5.978600978851318, "global_step": 66996, "epoch": 1595} {"train_loss": -5.931581020355225, "global_step": 66997, "epoch": 1595} {"train_loss": -5.933579444885254, "global_step": 66998, "epoch": 1595} {"train_loss": -5.925431251525879, "global_step": 66999, "epoch": 1595} {"train_loss": -5.845489501953125, "global_step": 67000, "epoch": 1595} {"train_loss": -5.886811256408691, "global_step": 67001, "epoch": 1595} {"train_loss": -6.025702953338623, "global_step": 67002, "epoch": 1595} {"train_loss": -5.961956977844238, "global_step": 67003, "epoch": 1595} {"train_loss": -5.913361549377441, "global_step": 67004, "epoch": 1595} {"train_loss": -5.916816711425781, "global_step": 67005, "epoch": 1595} {"train_loss": -5.938396453857422, "global_step": 67006, "epoch": 1595} {"train_loss": -5.976248264312744, "global_step": 67007, "epoch": 1595} {"train_loss": -6.012991905212402, "global_step": 67008, "epoch": 1595} {"train_loss": -5.909757614135742, "global_step": 67009, "epoch": 1595} {"train_loss": -6.010741710662842, "global_step": 67010, "epoch": 1595} {"train_loss": -5.9547553062438965, "global_step": 67011, "epoch": 1595} {"train_loss": -5.941706657409668, "global_step": 67012, "epoch": 1595} {"train_loss": -6.054807662963867, "global_step": 67013, "epoch": 1595} {"train_loss": -5.9627766609191895, "global_step": 67014, "epoch": 1595} {"train_loss": -5.983663082122803, "global_step": 67015, "epoch": 1595} {"train_loss": -5.930824279785156, "global_step": 67016, "epoch": 1595} {"train_loss": -6.058618545532227, "global_step": 67017, "epoch": 1595} {"train_loss": -5.935914993286133, "global_step": 67018, "epoch": 1595} {"train_loss": -5.953954696655273, "global_step": 67019, "epoch": 1595} {"train_loss": -6.043774604797363, "global_step": 67020, "epoch": 1595} {"train_loss": -5.906931400299072, "global_step": 67021, "epoch": 1595} {"train_loss": -5.973507404327393, "global_step": 67022, "epoch": 1595} {"train_loss": -5.979996204376221, "global_step": 67023, "epoch": 1595} {"train_loss": -5.970607757568359, "global_step": 67024, "epoch": 1595} {"train_loss": -5.9468913078308105, "global_step": 67025, "epoch": 1595} {"train_loss": -6.0229878425598145, "global_step": 67026, "epoch": 1595} {"train_loss": -5.917850017547607, "global_step": 67027, "epoch": 1595} {"train_loss": -5.9801740646362305, "global_step": 67028, "epoch": 1595} {"train_loss": -5.967010974884033, "global_step": 67029, "epoch": 1595} {"train_loss": -6.056971073150635, "global_step": 67030, "epoch": 1595} {"train_loss": -5.964174123037429, "global_step": 67031, "epoch": 1595, "val_loss": 74642.5078125} {"train_loss": -5.998435020446777, "global_step": 67032, "epoch": 1596} {"train_loss": -5.8712358474731445, "global_step": 67033, "epoch": 1596} {"train_loss": -5.983765602111816, "global_step": 67034, "epoch": 1596} {"train_loss": -5.860795021057129, "global_step": 67035, "epoch": 1596} {"train_loss": -6.110781669616699, "global_step": 67036, "epoch": 1596} {"train_loss": -6.023477554321289, "global_step": 67037, "epoch": 1596} {"train_loss": -6.109691619873047, "global_step": 67038, "epoch": 1596} {"train_loss": -6.0329742431640625, "global_step": 67039, "epoch": 1596} {"train_loss": -5.942380905151367, "global_step": 67040, "epoch": 1596} {"train_loss": -6.078857898712158, "global_step": 67041, "epoch": 1596} {"train_loss": -5.966888427734375, "global_step": 67042, "epoch": 1596} {"train_loss": -6.002481460571289, "global_step": 67043, "epoch": 1596} {"train_loss": -5.955244064331055, "global_step": 67044, "epoch": 1596} {"train_loss": -5.834395408630371, "global_step": 67045, "epoch": 1596} {"train_loss": -5.920706748962402, "global_step": 67046, "epoch": 1596} {"train_loss": -5.998955249786377, "global_step": 67047, "epoch": 1596} {"train_loss": -5.932538032531738, "global_step": 67048, "epoch": 1596} {"train_loss": -5.961727619171143, "global_step": 67049, "epoch": 1596} {"train_loss": -5.993492126464844, "global_step": 67050, "epoch": 1596} {"train_loss": -5.959794998168945, "global_step": 67051, "epoch": 1596} {"train_loss": -5.857911109924316, "global_step": 67052, "epoch": 1596} {"train_loss": -5.9558916091918945, "global_step": 67053, "epoch": 1596} {"train_loss": -5.972700119018555, "global_step": 67054, "epoch": 1596} {"train_loss": -6.041129112243652, "global_step": 67055, "epoch": 1596} {"train_loss": -6.0073747634887695, "global_step": 67056, "epoch": 1596} {"train_loss": -5.888941287994385, "global_step": 67057, "epoch": 1596} {"train_loss": -5.905373573303223, "global_step": 67058, "epoch": 1596} {"train_loss": -6.048040390014648, "global_step": 67059, "epoch": 1596} {"train_loss": -5.931722640991211, "global_step": 67060, "epoch": 1596} {"train_loss": -6.018495559692383, "global_step": 67061, "epoch": 1596} {"train_loss": -6.086498260498047, "global_step": 67062, "epoch": 1596} {"train_loss": -6.007893085479736, "global_step": 67063, "epoch": 1596} {"train_loss": -5.879563808441162, "global_step": 67064, "epoch": 1596} {"train_loss": -6.04553747177124, "global_step": 67065, "epoch": 1596} {"train_loss": -5.8726911544799805, "global_step": 67066, "epoch": 1596} {"train_loss": -6.049961566925049, "global_step": 67067, "epoch": 1596} {"train_loss": -6.107546806335449, "global_step": 67068, "epoch": 1596} {"train_loss": -5.984063148498535, "global_step": 67069, "epoch": 1596} {"train_loss": -5.998215198516846, "global_step": 67070, "epoch": 1596} {"train_loss": -5.942124366760254, "global_step": 67071, "epoch": 1596} {"train_loss": -6.079492092132568, "global_step": 67072, "epoch": 1596} {"train_loss": -5.982219661985125, "global_step": 67073, "epoch": 1596, "val_loss": 74723.5859375} {"train_loss": -5.982413291931152, "global_step": 67074, "epoch": 1597} {"train_loss": -6.016542434692383, "global_step": 67075, "epoch": 1597} {"train_loss": -6.028700828552246, "global_step": 67076, "epoch": 1597} {"train_loss": -6.114985466003418, "global_step": 67077, "epoch": 1597} {"train_loss": -6.045166492462158, "global_step": 67078, "epoch": 1597} {"train_loss": -5.9439496994018555, "global_step": 67079, "epoch": 1597} {"train_loss": -6.026422500610352, "global_step": 67080, "epoch": 1597} {"train_loss": -6.039519786834717, "global_step": 67081, "epoch": 1597} {"train_loss": -5.924248695373535, "global_step": 67082, "epoch": 1597} {"train_loss": -6.0218024253845215, "global_step": 67083, "epoch": 1597} {"train_loss": -6.123724937438965, "global_step": 67084, "epoch": 1597} {"train_loss": -6.046031951904297, "global_step": 67085, "epoch": 1597} {"train_loss": -5.861534118652344, "global_step": 67086, "epoch": 1597} {"train_loss": -5.854394912719727, "global_step": 67087, "epoch": 1597} {"train_loss": -6.006307601928711, "global_step": 67088, "epoch": 1597} {"train_loss": -5.995059490203857, "global_step": 67089, "epoch": 1597} {"train_loss": -5.966639518737793, "global_step": 67090, "epoch": 1597} {"train_loss": -6.0168867111206055, "global_step": 67091, "epoch": 1597} {"train_loss": -5.970808982849121, "global_step": 67092, "epoch": 1597} {"train_loss": -6.012025356292725, "global_step": 67093, "epoch": 1597} {"train_loss": -5.958681106567383, "global_step": 67094, "epoch": 1597} {"train_loss": -5.93807315826416, "global_step": 67095, "epoch": 1597} {"train_loss": -6.016477108001709, "global_step": 67096, "epoch": 1597} {"train_loss": -6.01951789855957, "global_step": 67097, "epoch": 1597} {"train_loss": -6.050208568572998, "global_step": 67098, "epoch": 1597} {"train_loss": -5.848367691040039, "global_step": 67099, "epoch": 1597} {"train_loss": -5.854908466339111, "global_step": 67100, "epoch": 1597} {"train_loss": -6.050800323486328, "global_step": 67101, "epoch": 1597} {"train_loss": -6.033700466156006, "global_step": 67102, "epoch": 1597} {"train_loss": -5.942028999328613, "global_step": 67103, "epoch": 1597} {"train_loss": -6.020291328430176, "global_step": 67104, "epoch": 1597} {"train_loss": -5.964343547821045, "global_step": 67105, "epoch": 1597} {"train_loss": -5.962353706359863, "global_step": 67106, "epoch": 1597} {"train_loss": -5.981551170349121, "global_step": 67107, "epoch": 1597} {"train_loss": -5.937446594238281, "global_step": 67108, "epoch": 1597} {"train_loss": -5.857758522033691, "global_step": 67109, "epoch": 1597} {"train_loss": -5.936676025390625, "global_step": 67110, "epoch": 1597} {"train_loss": -5.945208549499512, "global_step": 67111, "epoch": 1597} {"train_loss": -5.9925312995910645, "global_step": 67112, "epoch": 1597} {"train_loss": -6.084167957305908, "global_step": 67113, "epoch": 1597} {"train_loss": -6.105792045593262, "global_step": 67114, "epoch": 1597} {"train_loss": -5.989422582444691, "global_step": 67115, "epoch": 1597, "val_loss": 75017.59375} {"train_loss": -6.001462459564209, "global_step": 67116, "epoch": 1598} {"train_loss": -5.921270370483398, "global_step": 67117, "epoch": 1598} {"train_loss": -5.945683479309082, "global_step": 67118, "epoch": 1598} {"train_loss": -5.977294445037842, "global_step": 67119, "epoch": 1598} {"train_loss": -6.159948348999023, "global_step": 67120, "epoch": 1598} {"train_loss": -5.993667125701904, "global_step": 67121, "epoch": 1598} {"train_loss": -5.9359846115112305, "global_step": 67122, "epoch": 1598} {"train_loss": -6.044375419616699, "global_step": 67123, "epoch": 1598} {"train_loss": -6.025234222412109, "global_step": 67124, "epoch": 1598} {"train_loss": -6.092935562133789, "global_step": 67125, "epoch": 1598} {"train_loss": -5.99641227722168, "global_step": 67126, "epoch": 1598} {"train_loss": -6.082372188568115, "global_step": 67127, "epoch": 1598} {"train_loss": -5.97405481338501, "global_step": 67128, "epoch": 1598} {"train_loss": -5.972297668457031, "global_step": 67129, "epoch": 1598} {"train_loss": -6.018131256103516, "global_step": 67130, "epoch": 1598} {"train_loss": -5.865124702453613, "global_step": 67131, "epoch": 1598} {"train_loss": -6.0355024337768555, "global_step": 67132, "epoch": 1598} {"train_loss": -6.023355007171631, "global_step": 67133, "epoch": 1598} {"train_loss": -5.9498395919799805, "global_step": 67134, "epoch": 1598} {"train_loss": -5.9481201171875, "global_step": 67135, "epoch": 1598} {"train_loss": -5.97564697265625, "global_step": 67136, "epoch": 1598} {"train_loss": -5.903314590454102, "global_step": 67137, "epoch": 1598} {"train_loss": -6.035904884338379, "global_step": 67138, "epoch": 1598} {"train_loss": -6.070809364318848, "global_step": 67139, "epoch": 1598} {"train_loss": -5.853712558746338, "global_step": 67140, "epoch": 1598} {"train_loss": -5.953446388244629, "global_step": 67141, "epoch": 1598} {"train_loss": -5.967103958129883, "global_step": 67142, "epoch": 1598} {"train_loss": -5.959629058837891, "global_step": 67143, "epoch": 1598} {"train_loss": -5.980295181274414, "global_step": 67144, "epoch": 1598} {"train_loss": -6.020983695983887, "global_step": 67145, "epoch": 1598} {"train_loss": -5.940299034118652, "global_step": 67146, "epoch": 1598} {"train_loss": -6.087420463562012, "global_step": 67147, "epoch": 1598} {"train_loss": -6.001472473144531, "global_step": 67148, "epoch": 1598} {"train_loss": -5.997046947479248, "global_step": 67149, "epoch": 1598} {"train_loss": -6.0421142578125, "global_step": 67150, "epoch": 1598} {"train_loss": -6.1081037521362305, "global_step": 67151, "epoch": 1598} {"train_loss": -5.9423017501831055, "global_step": 67152, "epoch": 1598} {"train_loss": -5.910714626312256, "global_step": 67153, "epoch": 1598} {"train_loss": -6.065528869628906, "global_step": 67154, "epoch": 1598} {"train_loss": -5.974658489227295, "global_step": 67155, "epoch": 1598} {"train_loss": -6.057636260986328, "global_step": 67156, "epoch": 1598} {"train_loss": -5.994041079566593, "global_step": 67157, "epoch": 1598, "val_loss": 74704.578125} {"train_loss": -5.921489238739014, "global_step": 67158, "epoch": 1599} {"train_loss": -6.060853481292725, "global_step": 67159, "epoch": 1599} {"train_loss": -6.091675758361816, "global_step": 67160, "epoch": 1599} {"train_loss": -6.004964351654053, "global_step": 67161, "epoch": 1599} {"train_loss": -6.002811431884766, "global_step": 67162, "epoch": 1599} {"train_loss": -6.038618564605713, "global_step": 67163, "epoch": 1599} {"train_loss": -6.052186965942383, "global_step": 67164, "epoch": 1599} {"train_loss": -5.966879844665527, "global_step": 67165, "epoch": 1599} {"train_loss": -6.008667945861816, "global_step": 67166, "epoch": 1599} {"train_loss": -6.034252166748047, "global_step": 67167, "epoch": 1599} {"train_loss": -6.100068092346191, "global_step": 67168, "epoch": 1599} {"train_loss": -5.947307586669922, "global_step": 67169, "epoch": 1599} {"train_loss": -6.114892959594727, "global_step": 67170, "epoch": 1599} {"train_loss": -5.835784912109375, "global_step": 67171, "epoch": 1599} {"train_loss": -6.031254768371582, "global_step": 67172, "epoch": 1599} {"train_loss": -6.010718822479248, "global_step": 67173, "epoch": 1599} {"train_loss": -6.040637493133545, "global_step": 67174, "epoch": 1599} {"train_loss": -5.916164398193359, "global_step": 67175, "epoch": 1599} {"train_loss": -5.887831687927246, "global_step": 67176, "epoch": 1599} {"train_loss": -6.1300740242004395, "global_step": 67177, "epoch": 1599} {"train_loss": -5.941794395446777, "global_step": 67178, "epoch": 1599} {"train_loss": -5.987975120544434, "global_step": 67179, "epoch": 1599} {"train_loss": -6.1099019050598145, "global_step": 67180, "epoch": 1599} {"train_loss": -5.9893622398376465, "global_step": 67181, "epoch": 1599} {"train_loss": -6.056492328643799, "global_step": 67182, "epoch": 1599} {"train_loss": -5.9804792404174805, "global_step": 67183, "epoch": 1599} {"train_loss": -5.984220504760742, "global_step": 67184, "epoch": 1599} {"train_loss": -5.982300758361816, "global_step": 67185, "epoch": 1599} {"train_loss": -5.9778032302856445, "global_step": 67186, "epoch": 1599} {"train_loss": -6.007981777191162, "global_step": 67187, "epoch": 1599} {"train_loss": -6.027738571166992, "global_step": 67188, "epoch": 1599} {"train_loss": -5.935168743133545, "global_step": 67189, "epoch": 1599} {"train_loss": -5.97462272644043, "global_step": 67190, "epoch": 1599} {"train_loss": -5.979150772094727, "global_step": 67191, "epoch": 1599} {"train_loss": -5.978538513183594, "global_step": 67192, "epoch": 1599} {"train_loss": -5.951432704925537, "global_step": 67193, "epoch": 1599} {"train_loss": -6.098273277282715, "global_step": 67194, "epoch": 1599} {"train_loss": -6.0408735275268555, "global_step": 67195, "epoch": 1599} {"train_loss": -5.994012355804443, "global_step": 67196, "epoch": 1599} {"train_loss": -6.104223251342773, "global_step": 67197, "epoch": 1599} {"train_loss": -6.0731120109558105, "global_step": 67198, "epoch": 1599} {"train_loss": -6.008301712217785, "global_step": 67199, "epoch": 1599, "val_loss": 74566.0078125} {"train_loss": -6.07526969909668, "global_step": 67200, "epoch": 1600} {"train_loss": -6.017928123474121, "global_step": 67201, "epoch": 1600} {"train_loss": -6.094934940338135, "global_step": 67202, "epoch": 1600} {"train_loss": -6.041740417480469, "global_step": 67203, "epoch": 1600} {"train_loss": -6.113070964813232, "global_step": 67204, "epoch": 1600} {"train_loss": -6.025300979614258, "global_step": 67205, "epoch": 1600} {"train_loss": -5.948902606964111, "global_step": 67206, "epoch": 1600} {"train_loss": -6.024565696716309, "global_step": 67207, "epoch": 1600} {"train_loss": -5.999606609344482, "global_step": 67208, "epoch": 1600} {"train_loss": -6.084140777587891, "global_step": 67209, "epoch": 1600} {"train_loss": -5.93636417388916, "global_step": 67210, "epoch": 1600} {"train_loss": -5.99778938293457, "global_step": 67211, "epoch": 1600} {"train_loss": -6.018756866455078, "global_step": 67212, "epoch": 1600} {"train_loss": -5.953212738037109, "global_step": 67213, "epoch": 1600} {"train_loss": -5.878085613250732, "global_step": 67214, "epoch": 1600} {"train_loss": -6.017090797424316, "global_step": 67215, "epoch": 1600} {"train_loss": -5.941148281097412, "global_step": 67216, "epoch": 1600} {"train_loss": -5.805722236633301, "global_step": 67217, "epoch": 1600} {"train_loss": -5.939120292663574, "global_step": 67218, "epoch": 1600} {"train_loss": -5.957731246948242, "global_step": 67219, "epoch": 1600} {"train_loss": -5.940427780151367, "global_step": 67220, "epoch": 1600} {"train_loss": -5.991796016693115, "global_step": 67221, "epoch": 1600} {"train_loss": -5.963257789611816, "global_step": 67222, "epoch": 1600} {"train_loss": -5.945481300354004, "global_step": 67223, "epoch": 1600} {"train_loss": -5.91475248336792, "global_step": 67224, "epoch": 1600} {"train_loss": -5.868725776672363, "global_step": 67225, "epoch": 1600} {"train_loss": -6.042153358459473, "global_step": 67226, "epoch": 1600} {"train_loss": -5.7375168800354, "global_step": 67227, "epoch": 1600} {"train_loss": -5.969616889953613, "global_step": 67228, "epoch": 1600} {"train_loss": -6.000695705413818, "global_step": 67229, "epoch": 1600} {"train_loss": -6.040593147277832, "global_step": 67230, "epoch": 1600} {"train_loss": -5.779860496520996, "global_step": 67231, "epoch": 1600} {"train_loss": -5.906949996948242, "global_step": 67232, "epoch": 1600} {"train_loss": -5.834881782531738, "global_step": 67233, "epoch": 1600} {"train_loss": -5.905416011810303, "global_step": 67234, "epoch": 1600} {"train_loss": -5.933254241943359, "global_step": 67235, "epoch": 1600} {"train_loss": -5.967986106872559, "global_step": 67236, "epoch": 1600} {"train_loss": -6.0200886726379395, "global_step": 67237, "epoch": 1600} {"train_loss": -5.918107032775879, "global_step": 67238, "epoch": 1600} {"train_loss": -5.898507118225098, "global_step": 67239, "epoch": 1600} {"train_loss": -5.718183517456055, "global_step": 67240, "epoch": 1600} {"train_loss": -5.955126944042387, "global_step": 67241, "epoch": 1600, "train/sim_max_reward_0": 0.7303976038774049, "train/sim_max_reward_1": 0.949221362709949, "train/sim_max_reward_2": 0.38874933499781517, "train/sim_max_reward_3": 0.1462148441616843, "train/sim_max_reward_4": 0.5962778344788842, "train/sim_max_reward_5": 0.5459004526630086, "test/sim_max_reward_4500000": 0.3603062338685601, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9120414852323078, "test/sim_max_reward_4500003": 0.8419308550309564, "test/sim_max_reward_4500004": 0.14181438142468167, "test/sim_max_reward_4500005": 0.6329168357679813, "test/sim_max_reward_4500006": 0.43420205547501656, "test/sim_max_reward_4500007": 0.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.35370074840770105, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.8749953892794229, "test/sim_max_reward_4500012": 0.9417185443188051, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.3755479516369133, "test/sim_max_reward_4500015": 0.8885126258772386, "test/sim_max_reward_4500016": 0.16772451109300304, "test/sim_max_reward_4500017": 0.3013994285677881, "test/sim_max_reward_4500018": 0.27752101784821226, "test/sim_max_reward_4500019": 0.6568837966325766, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.5827570938502726, "test/sim_max_reward_4500022": 0.6659449134376092, "test/sim_max_reward_4500023": 0.5343993454044824, "test/sim_max_reward_4500024": 0.7785286683599144, "test/sim_max_reward_4500025": 0.0007914440704560897, "test/sim_max_reward_4500026": 0.8758899937399123, "test/sim_max_reward_4500027": 0.5907794275540267, "test/sim_max_reward_4500028": 0.2365391925523128, "test/sim_max_reward_4500029": 0.11563755257042008, "test/sim_max_reward_4500030": 0.8470068669097469, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05088251923086367, "test/sim_max_reward_4500033": 0.8160775698685215, "test/sim_max_reward_4500034": 0.5097521926948708, "test/sim_max_reward_4500035": 0.8797538719634295, "test/sim_max_reward_4500036": 0.9103060443086857, "test/sim_max_reward_4500037": 0.8743629888027971, "test/sim_max_reward_4500038": 0.6640747985714601, "test/sim_max_reward_4500039": 0.4655402964016708, "test/sim_max_reward_4500040": 0.9808803454387379, "test/sim_max_reward_4500041": 0.9807807509681686, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.1612673708199078, "test/sim_max_reward_4500044": 0.04659223701208032, "test/sim_max_reward_4500045": 0.11979903228074165, "test/sim_max_reward_4500046": 0.7964706777510013, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.8792132680476755, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5594602388147909, "test/mean_score": 0.4509536794316204, "val_loss": 74668.1328125} {"train_loss": -5.8338303565979, "global_step": 67242, "epoch": 1601} {"train_loss": -5.956516265869141, "global_step": 67243, "epoch": 1601} {"train_loss": -5.938512802124023, "global_step": 67244, "epoch": 1601} {"train_loss": -6.026263236999512, "global_step": 67245, "epoch": 1601} {"train_loss": -6.001588821411133, "global_step": 67246, "epoch": 1601} {"train_loss": -5.937798976898193, "global_step": 67247, "epoch": 1601} {"train_loss": -6.006591796875, "global_step": 67248, "epoch": 1601} {"train_loss": -5.907749176025391, "global_step": 67249, "epoch": 1601} {"train_loss": -5.898667335510254, "global_step": 67250, "epoch": 1601} {"train_loss": -5.992021560668945, "global_step": 67251, "epoch": 1601} {"train_loss": -5.848846912384033, "global_step": 67252, "epoch": 1601} {"train_loss": -5.93568229675293, "global_step": 67253, "epoch": 1601} {"train_loss": -6.094186782836914, "global_step": 67254, "epoch": 1601} {"train_loss": -5.8838958740234375, "global_step": 67255, "epoch": 1601} {"train_loss": -5.860077381134033, "global_step": 67256, "epoch": 1601} {"train_loss": -5.887686729431152, "global_step": 67257, "epoch": 1601} {"train_loss": -5.819221019744873, "global_step": 67258, "epoch": 1601} {"train_loss": -5.932806015014648, "global_step": 67259, "epoch": 1601} {"train_loss": -5.950732231140137, "global_step": 67260, "epoch": 1601} {"train_loss": -5.918974876403809, "global_step": 67261, "epoch": 1601} {"train_loss": -5.804026126861572, "global_step": 67262, "epoch": 1601} {"train_loss": -5.902492523193359, "global_step": 67263, "epoch": 1601} {"train_loss": -5.735909938812256, "global_step": 67264, "epoch": 1601} {"train_loss": -5.970985412597656, "global_step": 67265, "epoch": 1601} {"train_loss": -6.007896423339844, "global_step": 67266, "epoch": 1601} {"train_loss": -5.954659461975098, "global_step": 67267, "epoch": 1601} {"train_loss": -6.021149158477783, "global_step": 67268, "epoch": 1601} {"train_loss": -5.936228275299072, "global_step": 67269, "epoch": 1601} {"train_loss": -5.9824604988098145, "global_step": 67270, "epoch": 1601} {"train_loss": -5.802004814147949, "global_step": 67271, "epoch": 1601} {"train_loss": -5.905734539031982, "global_step": 67272, "epoch": 1601} {"train_loss": -5.981534957885742, "global_step": 67273, "epoch": 1601} {"train_loss": -6.026915073394775, "global_step": 67274, "epoch": 1601} {"train_loss": -5.913424491882324, "global_step": 67275, "epoch": 1601} {"train_loss": -6.050554275512695, "global_step": 67276, "epoch": 1601} {"train_loss": -5.953341960906982, "global_step": 67277, "epoch": 1601} {"train_loss": -6.045555591583252, "global_step": 67278, "epoch": 1601} {"train_loss": -5.961762428283691, "global_step": 67279, "epoch": 1601} {"train_loss": -6.055727005004883, "global_step": 67280, "epoch": 1601} {"train_loss": -5.8865966796875, "global_step": 67281, "epoch": 1601} {"train_loss": -5.9096574783325195, "global_step": 67282, "epoch": 1601} {"train_loss": -5.938289540154593, "global_step": 67283, "epoch": 1601, "val_loss": 74545.890625} {"train_loss": -5.973995685577393, "global_step": 67284, "epoch": 1602} {"train_loss": -6.012237548828125, "global_step": 67285, "epoch": 1602} {"train_loss": -6.062528610229492, "global_step": 67286, "epoch": 1602} {"train_loss": -5.920184135437012, "global_step": 67287, "epoch": 1602} {"train_loss": -6.070211410522461, "global_step": 67288, "epoch": 1602} {"train_loss": -6.054582595825195, "global_step": 67289, "epoch": 1602} {"train_loss": -6.1080474853515625, "global_step": 67290, "epoch": 1602} {"train_loss": -5.934660911560059, "global_step": 67291, "epoch": 1602} {"train_loss": -6.0183539390563965, "global_step": 67292, "epoch": 1602} {"train_loss": -5.970294952392578, "global_step": 67293, "epoch": 1602} {"train_loss": -5.9946160316467285, "global_step": 67294, "epoch": 1602} {"train_loss": -5.973559856414795, "global_step": 67295, "epoch": 1602} {"train_loss": -6.032095909118652, "global_step": 67296, "epoch": 1602} {"train_loss": -6.052478313446045, "global_step": 67297, "epoch": 1602} {"train_loss": -5.8964080810546875, "global_step": 67298, "epoch": 1602} {"train_loss": -6.009271144866943, "global_step": 67299, "epoch": 1602} {"train_loss": -5.999922752380371, "global_step": 67300, "epoch": 1602} {"train_loss": -5.919964790344238, "global_step": 67301, "epoch": 1602} {"train_loss": -6.090632438659668, "global_step": 67302, "epoch": 1602} {"train_loss": -5.812161445617676, "global_step": 67303, "epoch": 1602} {"train_loss": -6.029592514038086, "global_step": 67304, "epoch": 1602} {"train_loss": -6.046346664428711, "global_step": 67305, "epoch": 1602} {"train_loss": -5.990654945373535, "global_step": 67306, "epoch": 1602} {"train_loss": -6.024657249450684, "global_step": 67307, "epoch": 1602} {"train_loss": -5.997047424316406, "global_step": 67308, "epoch": 1602} {"train_loss": -5.924431324005127, "global_step": 67309, "epoch": 1602} {"train_loss": -5.963918685913086, "global_step": 67310, "epoch": 1602} {"train_loss": -6.103992938995361, "global_step": 67311, "epoch": 1602} {"train_loss": -6.066774368286133, "global_step": 67312, "epoch": 1602} {"train_loss": -6.021989345550537, "global_step": 67313, "epoch": 1602} {"train_loss": -5.917640209197998, "global_step": 67314, "epoch": 1602} {"train_loss": -5.906158447265625, "global_step": 67315, "epoch": 1602} {"train_loss": -5.92982292175293, "global_step": 67316, "epoch": 1602} {"train_loss": -6.112391948699951, "global_step": 67317, "epoch": 1602} {"train_loss": -5.993810653686523, "global_step": 67318, "epoch": 1602} {"train_loss": -5.960076332092285, "global_step": 67319, "epoch": 1602} {"train_loss": -6.060523986816406, "global_step": 67320, "epoch": 1602} {"train_loss": -5.944018840789795, "global_step": 67321, "epoch": 1602} {"train_loss": -6.021550178527832, "global_step": 67322, "epoch": 1602} {"train_loss": -5.971599578857422, "global_step": 67323, "epoch": 1602} {"train_loss": -6.002252578735352, "global_step": 67324, "epoch": 1602} {"train_loss": -5.997467154548282, "global_step": 67325, "epoch": 1602, "val_loss": 74373.53125} {"train_loss": -5.985147476196289, "global_step": 67326, "epoch": 1603} {"train_loss": -6.054333686828613, "global_step": 67327, "epoch": 1603} {"train_loss": -6.03995418548584, "global_step": 67328, "epoch": 1603} {"train_loss": -6.088873386383057, "global_step": 67329, "epoch": 1603} {"train_loss": -5.929538249969482, "global_step": 67330, "epoch": 1603} {"train_loss": -6.1126508712768555, "global_step": 67331, "epoch": 1603} {"train_loss": -6.049182891845703, "global_step": 67332, "epoch": 1603} {"train_loss": -6.007239818572998, "global_step": 67333, "epoch": 1603} {"train_loss": -5.979039192199707, "global_step": 67334, "epoch": 1603} {"train_loss": -6.164313316345215, "global_step": 67335, "epoch": 1603} {"train_loss": -5.961021423339844, "global_step": 67336, "epoch": 1603} {"train_loss": -5.962679386138916, "global_step": 67337, "epoch": 1603} {"train_loss": -6.068713188171387, "global_step": 67338, "epoch": 1603} {"train_loss": -5.995762825012207, "global_step": 67339, "epoch": 1603} {"train_loss": -5.930318832397461, "global_step": 67340, "epoch": 1603} {"train_loss": -6.1134033203125, "global_step": 67341, "epoch": 1603} {"train_loss": -6.108834266662598, "global_step": 67342, "epoch": 1603} {"train_loss": -6.057247638702393, "global_step": 67343, "epoch": 1603} {"train_loss": -6.027072906494141, "global_step": 67344, "epoch": 1603} {"train_loss": -6.071371078491211, "global_step": 67345, "epoch": 1603} {"train_loss": -6.039384841918945, "global_step": 67346, "epoch": 1603} {"train_loss": -6.100157260894775, "global_step": 67347, "epoch": 1603} {"train_loss": -5.909202575683594, "global_step": 67348, "epoch": 1603} {"train_loss": -5.996537208557129, "global_step": 67349, "epoch": 1603} {"train_loss": -5.933070182800293, "global_step": 67350, "epoch": 1603} {"train_loss": -5.906338691711426, "global_step": 67351, "epoch": 1603} {"train_loss": -6.026797771453857, "global_step": 67352, "epoch": 1603} {"train_loss": -5.989039897918701, "global_step": 67353, "epoch": 1603} {"train_loss": -5.846238613128662, "global_step": 67354, "epoch": 1603} {"train_loss": -6.037910461425781, "global_step": 67355, "epoch": 1603} {"train_loss": -5.91430139541626, "global_step": 67356, "epoch": 1603} {"train_loss": -5.934895992279053, "global_step": 67357, "epoch": 1603} {"train_loss": -6.020059108734131, "global_step": 67358, "epoch": 1603} {"train_loss": -5.930929660797119, "global_step": 67359, "epoch": 1603} {"train_loss": -5.9560346603393555, "global_step": 67360, "epoch": 1603} {"train_loss": -6.143232345581055, "global_step": 67361, "epoch": 1603} {"train_loss": -5.786839008331299, "global_step": 67362, "epoch": 1603} {"train_loss": -6.008671760559082, "global_step": 67363, "epoch": 1603} {"train_loss": -6.138426780700684, "global_step": 67364, "epoch": 1603} {"train_loss": -5.805946350097656, "global_step": 67365, "epoch": 1603} {"train_loss": -6.046222686767578, "global_step": 67366, "epoch": 1603} {"train_loss": -6.00233657019479, "global_step": 67367, "epoch": 1603, "val_loss": 74501.8671875} {"train_loss": -6.004006385803223, "global_step": 67368, "epoch": 1604} {"train_loss": -5.9937214851379395, "global_step": 67369, "epoch": 1604} {"train_loss": -6.015192985534668, "global_step": 67370, "epoch": 1604} {"train_loss": -5.894147872924805, "global_step": 67371, "epoch": 1604} {"train_loss": -5.914909839630127, "global_step": 67372, "epoch": 1604} {"train_loss": -6.097259998321533, "global_step": 67373, "epoch": 1604} {"train_loss": -5.995094299316406, "global_step": 67374, "epoch": 1604} {"train_loss": -5.945013046264648, "global_step": 67375, "epoch": 1604} {"train_loss": -5.941500186920166, "global_step": 67376, "epoch": 1604} {"train_loss": -5.892634391784668, "global_step": 67377, "epoch": 1604} {"train_loss": -6.045650482177734, "global_step": 67378, "epoch": 1604} {"train_loss": -5.93925666809082, "global_step": 67379, "epoch": 1604} {"train_loss": -5.902358055114746, "global_step": 67380, "epoch": 1604} {"train_loss": -5.9790191650390625, "global_step": 67381, "epoch": 1604} {"train_loss": -6.025800704956055, "global_step": 67382, "epoch": 1604} {"train_loss": -5.992537975311279, "global_step": 67383, "epoch": 1604} {"train_loss": -5.991927623748779, "global_step": 67384, "epoch": 1604} {"train_loss": -5.777114391326904, "global_step": 67385, "epoch": 1604} {"train_loss": -5.9116058349609375, "global_step": 67386, "epoch": 1604} {"train_loss": -5.927509307861328, "global_step": 67387, "epoch": 1604} {"train_loss": -5.927323341369629, "global_step": 67388, "epoch": 1604} {"train_loss": -5.93208122253418, "global_step": 67389, "epoch": 1604} {"train_loss": -5.990411281585693, "global_step": 67390, "epoch": 1604} {"train_loss": -5.890691757202148, "global_step": 67391, "epoch": 1604} {"train_loss": -6.025557518005371, "global_step": 67392, "epoch": 1604} {"train_loss": -5.739457130432129, "global_step": 67393, "epoch": 1604} {"train_loss": -5.868628978729248, "global_step": 67394, "epoch": 1604} {"train_loss": -5.888055801391602, "global_step": 67395, "epoch": 1604} {"train_loss": -5.788281440734863, "global_step": 67396, "epoch": 1604} {"train_loss": -5.980242729187012, "global_step": 67397, "epoch": 1604} {"train_loss": -5.861658096313477, "global_step": 67398, "epoch": 1604} {"train_loss": -5.8967485427856445, "global_step": 67399, "epoch": 1604} {"train_loss": -5.862519264221191, "global_step": 67400, "epoch": 1604} {"train_loss": -6.013792037963867, "global_step": 67401, "epoch": 1604} {"train_loss": -5.92368221282959, "global_step": 67402, "epoch": 1604} {"train_loss": -5.931755065917969, "global_step": 67403, "epoch": 1604} {"train_loss": -5.967720985412598, "global_step": 67404, "epoch": 1604} {"train_loss": -6.0033698081970215, "global_step": 67405, "epoch": 1604} {"train_loss": -6.02780818939209, "global_step": 67406, "epoch": 1604} {"train_loss": -5.971167087554932, "global_step": 67407, "epoch": 1604} {"train_loss": -6.046776294708252, "global_step": 67408, "epoch": 1604} {"train_loss": -5.942666598728725, "global_step": 67409, "epoch": 1604, "val_loss": 74642.484375} {"train_loss": -5.987353801727295, "global_step": 67410, "epoch": 1605} {"train_loss": -5.924163818359375, "global_step": 67411, "epoch": 1605} {"train_loss": -6.016952037811279, "global_step": 67412, "epoch": 1605} {"train_loss": -6.008987903594971, "global_step": 67413, "epoch": 1605} {"train_loss": -5.952571392059326, "global_step": 67414, "epoch": 1605} {"train_loss": -6.029718399047852, "global_step": 67415, "epoch": 1605} {"train_loss": -5.808399200439453, "global_step": 67416, "epoch": 1605} {"train_loss": -5.97580623626709, "global_step": 67417, "epoch": 1605} {"train_loss": -6.016937732696533, "global_step": 67418, "epoch": 1605} {"train_loss": -5.890769004821777, "global_step": 67419, "epoch": 1605} {"train_loss": -6.106873512268066, "global_step": 67420, "epoch": 1605} {"train_loss": -5.833039283752441, "global_step": 67421, "epoch": 1605} {"train_loss": -5.98140811920166, "global_step": 67422, "epoch": 1605} {"train_loss": -6.023156642913818, "global_step": 67423, "epoch": 1605} {"train_loss": -5.929558753967285, "global_step": 67424, "epoch": 1605} {"train_loss": -6.003193378448486, "global_step": 67425, "epoch": 1605} {"train_loss": -5.968955039978027, "global_step": 67426, "epoch": 1605} {"train_loss": -5.869414806365967, "global_step": 67427, "epoch": 1605} {"train_loss": -6.039300918579102, "global_step": 67428, "epoch": 1605} {"train_loss": -5.94959020614624, "global_step": 67429, "epoch": 1605} {"train_loss": -6.080827713012695, "global_step": 67430, "epoch": 1605} {"train_loss": -5.975459098815918, "global_step": 67431, "epoch": 1605} {"train_loss": -5.966031551361084, "global_step": 67432, "epoch": 1605} {"train_loss": -5.948114395141602, "global_step": 67433, "epoch": 1605} {"train_loss": -6.174391746520996, "global_step": 67434, "epoch": 1605} {"train_loss": -6.238504409790039, "global_step": 67435, "epoch": 1605} {"train_loss": -6.058448791503906, "global_step": 67436, "epoch": 1605} {"train_loss": -6.098689556121826, "global_step": 67437, "epoch": 1605} {"train_loss": -6.071832656860352, "global_step": 67438, "epoch": 1605} {"train_loss": -5.927971839904785, "global_step": 67439, "epoch": 1605} {"train_loss": -5.96185302734375, "global_step": 67440, "epoch": 1605} {"train_loss": -6.00509786605835, "global_step": 67441, "epoch": 1605} {"train_loss": -5.863847732543945, "global_step": 67442, "epoch": 1605} {"train_loss": -5.934185028076172, "global_step": 67443, "epoch": 1605} {"train_loss": -5.831012725830078, "global_step": 67444, "epoch": 1605} {"train_loss": -6.019253253936768, "global_step": 67445, "epoch": 1605} {"train_loss": -5.88883113861084, "global_step": 67446, "epoch": 1605} {"train_loss": -5.765775203704834, "global_step": 67447, "epoch": 1605} {"train_loss": -5.9542083740234375, "global_step": 67448, "epoch": 1605} {"train_loss": -5.935641288757324, "global_step": 67449, "epoch": 1605} {"train_loss": -6.045042037963867, "global_step": 67450, "epoch": 1605} {"train_loss": -5.975066718601045, "global_step": 67451, "epoch": 1605, "val_loss": 74666.109375} {"train_loss": -5.899476051330566, "global_step": 67452, "epoch": 1606} {"train_loss": -5.912899017333984, "global_step": 67453, "epoch": 1606} {"train_loss": -5.998076915740967, "global_step": 67454, "epoch": 1606} {"train_loss": -5.896977424621582, "global_step": 67455, "epoch": 1606} {"train_loss": -6.02293586730957, "global_step": 67456, "epoch": 1606} {"train_loss": -6.018631935119629, "global_step": 67457, "epoch": 1606} {"train_loss": -6.013920783996582, "global_step": 67458, "epoch": 1606} {"train_loss": -6.008220195770264, "global_step": 67459, "epoch": 1606} {"train_loss": -6.0054826736450195, "global_step": 67460, "epoch": 1606} {"train_loss": -6.027477264404297, "global_step": 67461, "epoch": 1606} {"train_loss": -5.9969282150268555, "global_step": 67462, "epoch": 1606} {"train_loss": -5.938131332397461, "global_step": 67463, "epoch": 1606} {"train_loss": -5.9678802490234375, "global_step": 67464, "epoch": 1606} {"train_loss": -5.860407829284668, "global_step": 67465, "epoch": 1606} {"train_loss": -6.085225582122803, "global_step": 67466, "epoch": 1606} {"train_loss": -5.93550968170166, "global_step": 67467, "epoch": 1606} {"train_loss": -5.852738380432129, "global_step": 67468, "epoch": 1606} {"train_loss": -6.023311138153076, "global_step": 67469, "epoch": 1606} {"train_loss": -5.866205215454102, "global_step": 67470, "epoch": 1606} {"train_loss": -5.966388702392578, "global_step": 67471, "epoch": 1606} {"train_loss": -6.069340229034424, "global_step": 67472, "epoch": 1606} {"train_loss": -5.92039155960083, "global_step": 67473, "epoch": 1606} {"train_loss": -6.008606433868408, "global_step": 67474, "epoch": 1606} {"train_loss": -5.976739883422852, "global_step": 67475, "epoch": 1606} {"train_loss": -5.940672874450684, "global_step": 67476, "epoch": 1606} {"train_loss": -6.030542373657227, "global_step": 67477, "epoch": 1606} {"train_loss": -5.954842567443848, "global_step": 67478, "epoch": 1606} {"train_loss": -5.845763206481934, "global_step": 67479, "epoch": 1606} {"train_loss": -6.036954402923584, "global_step": 67480, "epoch": 1606} {"train_loss": -5.9095892906188965, "global_step": 67481, "epoch": 1606} {"train_loss": -5.978700637817383, "global_step": 67482, "epoch": 1606} {"train_loss": -6.018255233764648, "global_step": 67483, "epoch": 1606} {"train_loss": -5.976110458374023, "global_step": 67484, "epoch": 1606} {"train_loss": -5.971887588500977, "global_step": 67485, "epoch": 1606} {"train_loss": -5.994453430175781, "global_step": 67486, "epoch": 1606} {"train_loss": -6.051109313964844, "global_step": 67487, "epoch": 1606} {"train_loss": -6.080723285675049, "global_step": 67488, "epoch": 1606} {"train_loss": -6.028497219085693, "global_step": 67489, "epoch": 1606} {"train_loss": -5.946993827819824, "global_step": 67490, "epoch": 1606} {"train_loss": -5.820418357849121, "global_step": 67491, "epoch": 1606} {"train_loss": -5.943936824798584, "global_step": 67492, "epoch": 1606} {"train_loss": -5.970328047162011, "global_step": 67493, "epoch": 1606, "val_loss": 75158.1796875} {"train_loss": -5.941497802734375, "global_step": 67494, "epoch": 1607} {"train_loss": -5.948723316192627, "global_step": 67495, "epoch": 1607} {"train_loss": -5.907810211181641, "global_step": 67496, "epoch": 1607} {"train_loss": -5.952447891235352, "global_step": 67497, "epoch": 1607} {"train_loss": -5.939504146575928, "global_step": 67498, "epoch": 1607} {"train_loss": -5.9478936195373535, "global_step": 67499, "epoch": 1607} {"train_loss": -5.9636030197143555, "global_step": 67500, "epoch": 1607} {"train_loss": -5.922748565673828, "global_step": 67501, "epoch": 1607} {"train_loss": -6.046932220458984, "global_step": 67502, "epoch": 1607} {"train_loss": -5.995420932769775, "global_step": 67503, "epoch": 1607} {"train_loss": -6.030133247375488, "global_step": 67504, "epoch": 1607} {"train_loss": -5.941555976867676, "global_step": 67505, "epoch": 1607} {"train_loss": -6.07194709777832, "global_step": 67506, "epoch": 1607} {"train_loss": -5.955641746520996, "global_step": 67507, "epoch": 1607} {"train_loss": -5.946640968322754, "global_step": 67508, "epoch": 1607} {"train_loss": -5.976842880249023, "global_step": 67509, "epoch": 1607} {"train_loss": -5.873106956481934, "global_step": 67510, "epoch": 1607} {"train_loss": -6.086217880249023, "global_step": 67511, "epoch": 1607} {"train_loss": -6.053783416748047, "global_step": 67512, "epoch": 1607} {"train_loss": -5.932135581970215, "global_step": 67513, "epoch": 1607} {"train_loss": -6.090459823608398, "global_step": 67514, "epoch": 1607} {"train_loss": -6.000288963317871, "global_step": 67515, "epoch": 1607} {"train_loss": -5.885219097137451, "global_step": 67516, "epoch": 1607} {"train_loss": -5.962514400482178, "global_step": 67517, "epoch": 1607} {"train_loss": -6.164283752441406, "global_step": 67518, "epoch": 1607} {"train_loss": -6.133497714996338, "global_step": 67519, "epoch": 1607} {"train_loss": -6.061387062072754, "global_step": 67520, "epoch": 1607} {"train_loss": -6.000056266784668, "global_step": 67521, "epoch": 1607} {"train_loss": -5.884563446044922, "global_step": 67522, "epoch": 1607} {"train_loss": -6.178484916687012, "global_step": 67523, "epoch": 1607} {"train_loss": -5.993113040924072, "global_step": 67524, "epoch": 1607} {"train_loss": -5.933716773986816, "global_step": 67525, "epoch": 1607} {"train_loss": -6.066462516784668, "global_step": 67526, "epoch": 1607} {"train_loss": -5.924860954284668, "global_step": 67527, "epoch": 1607} {"train_loss": -5.867269515991211, "global_step": 67528, "epoch": 1607} {"train_loss": -5.939441204071045, "global_step": 67529, "epoch": 1607} {"train_loss": -5.895594596862793, "global_step": 67530, "epoch": 1607} {"train_loss": -5.83308219909668, "global_step": 67531, "epoch": 1607} {"train_loss": -6.008060932159424, "global_step": 67532, "epoch": 1607} {"train_loss": -6.058953285217285, "global_step": 67533, "epoch": 1607} {"train_loss": -5.901872634887695, "global_step": 67534, "epoch": 1607} {"train_loss": -5.981582845960345, "global_step": 67535, "epoch": 1607, "val_loss": 74506.3984375} {"train_loss": -6.062921047210693, "global_step": 67536, "epoch": 1608} {"train_loss": -6.057910919189453, "global_step": 67537, "epoch": 1608} {"train_loss": -5.99848747253418, "global_step": 67538, "epoch": 1608} {"train_loss": -6.086224555969238, "global_step": 67539, "epoch": 1608} {"train_loss": -5.980935096740723, "global_step": 67540, "epoch": 1608} {"train_loss": -6.087099075317383, "global_step": 67541, "epoch": 1608} {"train_loss": -6.01021671295166, "global_step": 67542, "epoch": 1608} {"train_loss": -6.0276899337768555, "global_step": 67543, "epoch": 1608} {"train_loss": -5.984763145446777, "global_step": 67544, "epoch": 1608} {"train_loss": -6.009774684906006, "global_step": 67545, "epoch": 1608} {"train_loss": -5.9622578620910645, "global_step": 67546, "epoch": 1608} {"train_loss": -6.107570648193359, "global_step": 67547, "epoch": 1608} {"train_loss": -6.034265518188477, "global_step": 67548, "epoch": 1608} {"train_loss": -5.965758323669434, "global_step": 67549, "epoch": 1608} {"train_loss": -6.111257553100586, "global_step": 67550, "epoch": 1608} {"train_loss": -6.029025077819824, "global_step": 67551, "epoch": 1608} {"train_loss": -5.959046363830566, "global_step": 67552, "epoch": 1608} {"train_loss": -5.824318885803223, "global_step": 67553, "epoch": 1608} {"train_loss": -6.108202934265137, "global_step": 67554, "epoch": 1608} {"train_loss": -5.967044830322266, "global_step": 67555, "epoch": 1608} {"train_loss": -5.925038814544678, "global_step": 67556, "epoch": 1608} {"train_loss": -5.898857116699219, "global_step": 67557, "epoch": 1608} {"train_loss": -5.927255630493164, "global_step": 67558, "epoch": 1608} {"train_loss": -5.960214614868164, "global_step": 67559, "epoch": 1608} {"train_loss": -6.120035648345947, "global_step": 67560, "epoch": 1608} {"train_loss": -5.944816589355469, "global_step": 67561, "epoch": 1608} {"train_loss": -6.062089920043945, "global_step": 67562, "epoch": 1608} {"train_loss": -5.97088098526001, "global_step": 67563, "epoch": 1608} {"train_loss": -6.0829668045043945, "global_step": 67564, "epoch": 1608} {"train_loss": -6.091658592224121, "global_step": 67565, "epoch": 1608} {"train_loss": -6.034124851226807, "global_step": 67566, "epoch": 1608} {"train_loss": -6.073275566101074, "global_step": 67567, "epoch": 1608} {"train_loss": -6.140340328216553, "global_step": 67568, "epoch": 1608} {"train_loss": -5.879887580871582, "global_step": 67569, "epoch": 1608} {"train_loss": -6.0219292640686035, "global_step": 67570, "epoch": 1608} {"train_loss": -6.107944965362549, "global_step": 67571, "epoch": 1608} {"train_loss": -5.987003803253174, "global_step": 67572, "epoch": 1608} {"train_loss": -5.959465503692627, "global_step": 67573, "epoch": 1608} {"train_loss": -5.944277763366699, "global_step": 67574, "epoch": 1608} {"train_loss": -5.913455963134766, "global_step": 67575, "epoch": 1608} {"train_loss": -5.801945209503174, "global_step": 67576, "epoch": 1608} {"train_loss": -6.007649637403942, "global_step": 67577, "epoch": 1608, "val_loss": 74769.6796875} {"train_loss": -5.907302379608154, "global_step": 67578, "epoch": 1609} {"train_loss": -5.932775497436523, "global_step": 67579, "epoch": 1609} {"train_loss": -6.1677350997924805, "global_step": 67580, "epoch": 1609} {"train_loss": -6.00576639175415, "global_step": 67581, "epoch": 1609} {"train_loss": -5.972795486450195, "global_step": 67582, "epoch": 1609} {"train_loss": -6.106797218322754, "global_step": 67583, "epoch": 1609} {"train_loss": -5.951264381408691, "global_step": 67584, "epoch": 1609} {"train_loss": -6.058820724487305, "global_step": 67585, "epoch": 1609} {"train_loss": -5.843135833740234, "global_step": 67586, "epoch": 1609} {"train_loss": -6.063788890838623, "global_step": 67587, "epoch": 1609} {"train_loss": -6.0126495361328125, "global_step": 67588, "epoch": 1609} {"train_loss": -5.943561553955078, "global_step": 67589, "epoch": 1609} {"train_loss": -6.027239799499512, "global_step": 67590, "epoch": 1609} {"train_loss": -6.077489852905273, "global_step": 67591, "epoch": 1609} {"train_loss": -6.034049987792969, "global_step": 67592, "epoch": 1609} {"train_loss": -5.955381870269775, "global_step": 67593, "epoch": 1609} {"train_loss": -6.067052364349365, "global_step": 67594, "epoch": 1609} {"train_loss": -5.954043388366699, "global_step": 67595, "epoch": 1609} {"train_loss": -5.984021186828613, "global_step": 67596, "epoch": 1609} {"train_loss": -5.998594284057617, "global_step": 67597, "epoch": 1609} {"train_loss": -6.078371524810791, "global_step": 67598, "epoch": 1609} {"train_loss": -6.003030300140381, "global_step": 67599, "epoch": 1609} {"train_loss": -6.054687023162842, "global_step": 67600, "epoch": 1609} {"train_loss": -5.978342056274414, "global_step": 67601, "epoch": 1609} {"train_loss": -5.981996536254883, "global_step": 67602, "epoch": 1609} {"train_loss": -6.068080902099609, "global_step": 67603, "epoch": 1609} {"train_loss": -5.921126842498779, "global_step": 67604, "epoch": 1609} {"train_loss": -5.933538436889648, "global_step": 67605, "epoch": 1609} {"train_loss": -5.863899230957031, "global_step": 67606, "epoch": 1609} {"train_loss": -5.975671291351318, "global_step": 67607, "epoch": 1609} {"train_loss": -5.955689430236816, "global_step": 67608, "epoch": 1609} {"train_loss": -5.9967827796936035, "global_step": 67609, "epoch": 1609} {"train_loss": -6.0426812171936035, "global_step": 67610, "epoch": 1609} {"train_loss": -6.081451416015625, "global_step": 67611, "epoch": 1609} {"train_loss": -5.968198776245117, "global_step": 67612, "epoch": 1609} {"train_loss": -6.005429267883301, "global_step": 67613, "epoch": 1609} {"train_loss": -5.962382793426514, "global_step": 67614, "epoch": 1609} {"train_loss": -6.059726238250732, "global_step": 67615, "epoch": 1609} {"train_loss": -5.884520530700684, "global_step": 67616, "epoch": 1609} {"train_loss": -5.957205772399902, "global_step": 67617, "epoch": 1609} {"train_loss": -5.919630527496338, "global_step": 67618, "epoch": 1609} {"train_loss": -5.993682815915062, "global_step": 67619, "epoch": 1609, "val_loss": 74416.6171875} {"train_loss": -5.92661190032959, "global_step": 67620, "epoch": 1610} {"train_loss": -5.930942058563232, "global_step": 67621, "epoch": 1610} {"train_loss": -5.973480701446533, "global_step": 67622, "epoch": 1610} {"train_loss": -5.933194160461426, "global_step": 67623, "epoch": 1610} {"train_loss": -5.934138774871826, "global_step": 67624, "epoch": 1610} {"train_loss": -6.063880920410156, "global_step": 67625, "epoch": 1610} {"train_loss": -5.954082012176514, "global_step": 67626, "epoch": 1610} {"train_loss": -5.982400894165039, "global_step": 67627, "epoch": 1610} {"train_loss": -5.88071870803833, "global_step": 67628, "epoch": 1610} {"train_loss": -6.008265972137451, "global_step": 67629, "epoch": 1610} {"train_loss": -6.100299835205078, "global_step": 67630, "epoch": 1610} {"train_loss": -5.797033309936523, "global_step": 67631, "epoch": 1610} {"train_loss": -5.984814643859863, "global_step": 67632, "epoch": 1610} {"train_loss": -5.873347759246826, "global_step": 67633, "epoch": 1610} {"train_loss": -5.89464807510376, "global_step": 67634, "epoch": 1610} {"train_loss": -5.9431257247924805, "global_step": 67635, "epoch": 1610} {"train_loss": -5.919442176818848, "global_step": 67636, "epoch": 1610} {"train_loss": -5.846285343170166, "global_step": 67637, "epoch": 1610} {"train_loss": -6.049896717071533, "global_step": 67638, "epoch": 1610} {"train_loss": -6.000985145568848, "global_step": 67639, "epoch": 1610} {"train_loss": -5.836547374725342, "global_step": 67640, "epoch": 1610} {"train_loss": -5.989623546600342, "global_step": 67641, "epoch": 1610} {"train_loss": -5.968313694000244, "global_step": 67642, "epoch": 1610} {"train_loss": -5.963743686676025, "global_step": 67643, "epoch": 1610} {"train_loss": -6.140992641448975, "global_step": 67644, "epoch": 1610} {"train_loss": -6.026124000549316, "global_step": 67645, "epoch": 1610} {"train_loss": -5.833700180053711, "global_step": 67646, "epoch": 1610} {"train_loss": -6.008424758911133, "global_step": 67647, "epoch": 1610} {"train_loss": -5.886174201965332, "global_step": 67648, "epoch": 1610} {"train_loss": -5.895359039306641, "global_step": 67649, "epoch": 1610} {"train_loss": -5.983088493347168, "global_step": 67650, "epoch": 1610} {"train_loss": -5.978867530822754, "global_step": 67651, "epoch": 1610} {"train_loss": -6.071256637573242, "global_step": 67652, "epoch": 1610} {"train_loss": -5.954831123352051, "global_step": 67653, "epoch": 1610} {"train_loss": -6.018259048461914, "global_step": 67654, "epoch": 1610} {"train_loss": -5.974893569946289, "global_step": 67655, "epoch": 1610} {"train_loss": -5.894126892089844, "global_step": 67656, "epoch": 1610} {"train_loss": -6.007246971130371, "global_step": 67657, "epoch": 1610} {"train_loss": -5.957292079925537, "global_step": 67658, "epoch": 1610} {"train_loss": -5.957724094390869, "global_step": 67659, "epoch": 1610} {"train_loss": -5.980666160583496, "global_step": 67660, "epoch": 1610} {"train_loss": -5.961425531478155, "global_step": 67661, "epoch": 1610, "val_loss": 74674.2109375} {"train_loss": -5.936347007751465, "global_step": 67662, "epoch": 1611} {"train_loss": -6.039349555969238, "global_step": 67663, "epoch": 1611} {"train_loss": -5.935752868652344, "global_step": 67664, "epoch": 1611} {"train_loss": -5.962906837463379, "global_step": 67665, "epoch": 1611} {"train_loss": -5.834468841552734, "global_step": 67666, "epoch": 1611} {"train_loss": -5.969725608825684, "global_step": 67667, "epoch": 1611} {"train_loss": -5.95644998550415, "global_step": 67668, "epoch": 1611} {"train_loss": -5.950942516326904, "global_step": 67669, "epoch": 1611} {"train_loss": -6.00826358795166, "global_step": 67670, "epoch": 1611} {"train_loss": -5.961687088012695, "global_step": 67671, "epoch": 1611} {"train_loss": -5.993724346160889, "global_step": 67672, "epoch": 1611} {"train_loss": -5.929354190826416, "global_step": 67673, "epoch": 1611} {"train_loss": -6.17045783996582, "global_step": 67674, "epoch": 1611} {"train_loss": -6.0038371086120605, "global_step": 67675, "epoch": 1611} {"train_loss": -6.051234722137451, "global_step": 67676, "epoch": 1611} {"train_loss": -5.921316146850586, "global_step": 67677, "epoch": 1611} {"train_loss": -5.812585830688477, "global_step": 67678, "epoch": 1611} {"train_loss": -6.111177921295166, "global_step": 67679, "epoch": 1611} {"train_loss": -5.879729270935059, "global_step": 67680, "epoch": 1611} {"train_loss": -5.824028015136719, "global_step": 67681, "epoch": 1611} {"train_loss": -5.817806243896484, "global_step": 67682, "epoch": 1611} {"train_loss": -6.010305881500244, "global_step": 67683, "epoch": 1611} {"train_loss": -5.92804479598999, "global_step": 67684, "epoch": 1611} {"train_loss": -5.9166669845581055, "global_step": 67685, "epoch": 1611} {"train_loss": -6.0029377937316895, "global_step": 67686, "epoch": 1611} {"train_loss": -5.915781497955322, "global_step": 67687, "epoch": 1611} {"train_loss": -5.89448881149292, "global_step": 67688, "epoch": 1611} {"train_loss": -5.913708209991455, "global_step": 67689, "epoch": 1611} {"train_loss": -6.061737537384033, "global_step": 67690, "epoch": 1611} {"train_loss": -6.030026435852051, "global_step": 67691, "epoch": 1611} {"train_loss": -6.071902751922607, "global_step": 67692, "epoch": 1611} {"train_loss": -5.831774711608887, "global_step": 67693, "epoch": 1611} {"train_loss": -5.975202560424805, "global_step": 67694, "epoch": 1611} {"train_loss": -5.918154239654541, "global_step": 67695, "epoch": 1611} {"train_loss": -5.97678279876709, "global_step": 67696, "epoch": 1611} {"train_loss": -5.953814506530762, "global_step": 67697, "epoch": 1611} {"train_loss": -6.058740139007568, "global_step": 67698, "epoch": 1611} {"train_loss": -6.009302139282227, "global_step": 67699, "epoch": 1611} {"train_loss": -5.903361797332764, "global_step": 67700, "epoch": 1611} {"train_loss": -6.012929916381836, "global_step": 67701, "epoch": 1611} {"train_loss": -6.095763683319092, "global_step": 67702, "epoch": 1611} {"train_loss": -5.9656430426098055, "global_step": 67703, "epoch": 1611, "val_loss": 74831.3359375} {"train_loss": -6.094207763671875, "global_step": 67704, "epoch": 1612} {"train_loss": -5.97694730758667, "global_step": 67705, "epoch": 1612} {"train_loss": -5.9463653564453125, "global_step": 67706, "epoch": 1612} {"train_loss": -5.946201801300049, "global_step": 67707, "epoch": 1612} {"train_loss": -6.118839263916016, "global_step": 67708, "epoch": 1612} {"train_loss": -6.089162826538086, "global_step": 67709, "epoch": 1612} {"train_loss": -6.001481056213379, "global_step": 67710, "epoch": 1612} {"train_loss": -5.9632039070129395, "global_step": 67711, "epoch": 1612} {"train_loss": -6.033404350280762, "global_step": 67712, "epoch": 1612} {"train_loss": -5.987100601196289, "global_step": 67713, "epoch": 1612} {"train_loss": -5.9541215896606445, "global_step": 67714, "epoch": 1612} {"train_loss": -5.979007244110107, "global_step": 67715, "epoch": 1612} {"train_loss": -5.887594223022461, "global_step": 67716, "epoch": 1612} {"train_loss": -6.02834939956665, "global_step": 67717, "epoch": 1612} {"train_loss": -6.108026504516602, "global_step": 67718, "epoch": 1612} {"train_loss": -6.008715629577637, "global_step": 67719, "epoch": 1612} {"train_loss": -5.997339248657227, "global_step": 67720, "epoch": 1612} {"train_loss": -5.955582618713379, "global_step": 67721, "epoch": 1612} {"train_loss": -6.133686065673828, "global_step": 67722, "epoch": 1612} {"train_loss": -5.971194267272949, "global_step": 67723, "epoch": 1612} {"train_loss": -6.003491401672363, "global_step": 67724, "epoch": 1612} {"train_loss": -5.998791694641113, "global_step": 67725, "epoch": 1612} {"train_loss": -6.01894474029541, "global_step": 67726, "epoch": 1612} {"train_loss": -6.086365222930908, "global_step": 67727, "epoch": 1612} {"train_loss": -5.959360599517822, "global_step": 67728, "epoch": 1612} {"train_loss": -5.943652629852295, "global_step": 67729, "epoch": 1612} {"train_loss": -5.960337162017822, "global_step": 67730, "epoch": 1612} {"train_loss": -6.00394344329834, "global_step": 67731, "epoch": 1612} {"train_loss": -5.9297590255737305, "global_step": 67732, "epoch": 1612} {"train_loss": -5.882002830505371, "global_step": 67733, "epoch": 1612} {"train_loss": -5.983121395111084, "global_step": 67734, "epoch": 1612} {"train_loss": -5.932016849517822, "global_step": 67735, "epoch": 1612} {"train_loss": -5.9344801902771, "global_step": 67736, "epoch": 1612} {"train_loss": -6.04116153717041, "global_step": 67737, "epoch": 1612} {"train_loss": -6.036692142486572, "global_step": 67738, "epoch": 1612} {"train_loss": -6.001301288604736, "global_step": 67739, "epoch": 1612} {"train_loss": -5.949562072753906, "global_step": 67740, "epoch": 1612} {"train_loss": -6.058274269104004, "global_step": 67741, "epoch": 1612} {"train_loss": -5.943578243255615, "global_step": 67742, "epoch": 1612} {"train_loss": -6.01436710357666, "global_step": 67743, "epoch": 1612} {"train_loss": -6.042175769805908, "global_step": 67744, "epoch": 1612} {"train_loss": -5.996214605513073, "global_step": 67745, "epoch": 1612, "val_loss": 74569.3046875} {"train_loss": -6.034997940063477, "global_step": 67746, "epoch": 1613} {"train_loss": -5.938269138336182, "global_step": 67747, "epoch": 1613} {"train_loss": -5.9733171463012695, "global_step": 67748, "epoch": 1613} {"train_loss": -5.961829662322998, "global_step": 67749, "epoch": 1613} {"train_loss": -5.872247219085693, "global_step": 67750, "epoch": 1613} {"train_loss": -5.968201637268066, "global_step": 67751, "epoch": 1613} {"train_loss": -6.029764175415039, "global_step": 67752, "epoch": 1613} {"train_loss": -6.033934593200684, "global_step": 67753, "epoch": 1613} {"train_loss": -5.982306480407715, "global_step": 67754, "epoch": 1613} {"train_loss": -6.0347113609313965, "global_step": 67755, "epoch": 1613} {"train_loss": -5.865291118621826, "global_step": 67756, "epoch": 1613} {"train_loss": -5.980659484863281, "global_step": 67757, "epoch": 1613} {"train_loss": -5.944831848144531, "global_step": 67758, "epoch": 1613} {"train_loss": -5.961399078369141, "global_step": 67759, "epoch": 1613} {"train_loss": -5.965754508972168, "global_step": 67760, "epoch": 1613} {"train_loss": -6.009700298309326, "global_step": 67761, "epoch": 1613} {"train_loss": -6.080576419830322, "global_step": 67762, "epoch": 1613} {"train_loss": -5.864721775054932, "global_step": 67763, "epoch": 1613} {"train_loss": -5.813443183898926, "global_step": 67764, "epoch": 1613} {"train_loss": -5.900204658508301, "global_step": 67765, "epoch": 1613} {"train_loss": -6.08286714553833, "global_step": 67766, "epoch": 1613} {"train_loss": -5.952328681945801, "global_step": 67767, "epoch": 1613} {"train_loss": -6.004939556121826, "global_step": 67768, "epoch": 1613} {"train_loss": -5.989149570465088, "global_step": 67769, "epoch": 1613} {"train_loss": -5.943829536437988, "global_step": 67770, "epoch": 1613} {"train_loss": -5.971518039703369, "global_step": 67771, "epoch": 1613} {"train_loss": -6.019802093505859, "global_step": 67772, "epoch": 1613} {"train_loss": -6.034111022949219, "global_step": 67773, "epoch": 1613} {"train_loss": -5.9891743659973145, "global_step": 67774, "epoch": 1613} {"train_loss": -6.069427013397217, "global_step": 67775, "epoch": 1613} {"train_loss": -6.058684825897217, "global_step": 67776, "epoch": 1613} {"train_loss": -5.9601898193359375, "global_step": 67777, "epoch": 1613} {"train_loss": -6.001936435699463, "global_step": 67778, "epoch": 1613} {"train_loss": -6.144616603851318, "global_step": 67779, "epoch": 1613} {"train_loss": -6.038656234741211, "global_step": 67780, "epoch": 1613} {"train_loss": -6.094210624694824, "global_step": 67781, "epoch": 1613} {"train_loss": -5.9304609298706055, "global_step": 67782, "epoch": 1613} {"train_loss": -5.949573516845703, "global_step": 67783, "epoch": 1613} {"train_loss": -6.022787570953369, "global_step": 67784, "epoch": 1613} {"train_loss": -6.042226791381836, "global_step": 67785, "epoch": 1613} {"train_loss": -5.813381671905518, "global_step": 67786, "epoch": 1613} {"train_loss": -5.983897538412185, "global_step": 67787, "epoch": 1613, "val_loss": 75135.3984375} {"train_loss": -6.021058082580566, "global_step": 67788, "epoch": 1614} {"train_loss": -6.010128974914551, "global_step": 67789, "epoch": 1614} {"train_loss": -6.013144493103027, "global_step": 67790, "epoch": 1614} {"train_loss": -6.028899192810059, "global_step": 67791, "epoch": 1614} {"train_loss": -6.058910369873047, "global_step": 67792, "epoch": 1614} {"train_loss": -5.9946064949035645, "global_step": 67793, "epoch": 1614} {"train_loss": -6.024651527404785, "global_step": 67794, "epoch": 1614} {"train_loss": -5.976757049560547, "global_step": 67795, "epoch": 1614} {"train_loss": -5.954648971557617, "global_step": 67796, "epoch": 1614} {"train_loss": -6.097871780395508, "global_step": 67797, "epoch": 1614} {"train_loss": -6.052433967590332, "global_step": 67798, "epoch": 1614} {"train_loss": -5.9482102394104, "global_step": 67799, "epoch": 1614} {"train_loss": -5.985339164733887, "global_step": 67800, "epoch": 1614} {"train_loss": -6.124037742614746, "global_step": 67801, "epoch": 1614} {"train_loss": -5.892755031585693, "global_step": 67802, "epoch": 1614} {"train_loss": -5.918464660644531, "global_step": 67803, "epoch": 1614} {"train_loss": -5.86906623840332, "global_step": 67804, "epoch": 1614} {"train_loss": -5.944277763366699, "global_step": 67805, "epoch": 1614} {"train_loss": -5.970617294311523, "global_step": 67806, "epoch": 1614} {"train_loss": -5.929383277893066, "global_step": 67807, "epoch": 1614} {"train_loss": -6.120607376098633, "global_step": 67808, "epoch": 1614} {"train_loss": -5.973010540008545, "global_step": 67809, "epoch": 1614} {"train_loss": -5.933249473571777, "global_step": 67810, "epoch": 1614} {"train_loss": -5.9498748779296875, "global_step": 67811, "epoch": 1614} {"train_loss": -6.0419721603393555, "global_step": 67812, "epoch": 1614} {"train_loss": -6.026308059692383, "global_step": 67813, "epoch": 1614} {"train_loss": -5.893394947052002, "global_step": 67814, "epoch": 1614} {"train_loss": -6.03013277053833, "global_step": 67815, "epoch": 1614} {"train_loss": -5.978292465209961, "global_step": 67816, "epoch": 1614} {"train_loss": -6.008732795715332, "global_step": 67817, "epoch": 1614} {"train_loss": -5.990516662597656, "global_step": 67818, "epoch": 1614} {"train_loss": -5.947827339172363, "global_step": 67819, "epoch": 1614} {"train_loss": -6.058412551879883, "global_step": 67820, "epoch": 1614} {"train_loss": -5.966383934020996, "global_step": 67821, "epoch": 1614} {"train_loss": -6.064786911010742, "global_step": 67822, "epoch": 1614} {"train_loss": -5.9876508712768555, "global_step": 67823, "epoch": 1614} {"train_loss": -6.03029727935791, "global_step": 67824, "epoch": 1614} {"train_loss": -5.95729923248291, "global_step": 67825, "epoch": 1614} {"train_loss": -6.0069990158081055, "global_step": 67826, "epoch": 1614} {"train_loss": -5.912925720214844, "global_step": 67827, "epoch": 1614} {"train_loss": -5.9093403816223145, "global_step": 67828, "epoch": 1614} {"train_loss": -5.9896641458783835, "global_step": 67829, "epoch": 1614, "val_loss": 74596.6484375} {"train_loss": -6.042346000671387, "global_step": 67830, "epoch": 1615} {"train_loss": -5.95750617980957, "global_step": 67831, "epoch": 1615} {"train_loss": -6.055551528930664, "global_step": 67832, "epoch": 1615} {"train_loss": -5.94451379776001, "global_step": 67833, "epoch": 1615} {"train_loss": -5.8891401290893555, "global_step": 67834, "epoch": 1615} {"train_loss": -6.030306816101074, "global_step": 67835, "epoch": 1615} {"train_loss": -5.929853916168213, "global_step": 67836, "epoch": 1615} {"train_loss": -5.84763240814209, "global_step": 67837, "epoch": 1615} {"train_loss": -5.986328125, "global_step": 67838, "epoch": 1615} {"train_loss": -6.044425010681152, "global_step": 67839, "epoch": 1615} {"train_loss": -6.005657196044922, "global_step": 67840, "epoch": 1615} {"train_loss": -6.056684494018555, "global_step": 67841, "epoch": 1615} {"train_loss": -6.127784252166748, "global_step": 67842, "epoch": 1615} {"train_loss": -5.991118431091309, "global_step": 67843, "epoch": 1615} {"train_loss": -6.057419300079346, "global_step": 67844, "epoch": 1615} {"train_loss": -5.954813003540039, "global_step": 67845, "epoch": 1615} {"train_loss": -6.003293991088867, "global_step": 67846, "epoch": 1615} {"train_loss": -5.954816818237305, "global_step": 67847, "epoch": 1615} {"train_loss": -6.005826950073242, "global_step": 67848, "epoch": 1615} {"train_loss": -6.066951274871826, "global_step": 67849, "epoch": 1615} {"train_loss": -6.025883674621582, "global_step": 67850, "epoch": 1615} {"train_loss": -5.92872428894043, "global_step": 67851, "epoch": 1615} {"train_loss": -6.094139099121094, "global_step": 67852, "epoch": 1615} {"train_loss": -5.8846964836120605, "global_step": 67853, "epoch": 1615} {"train_loss": -5.921462535858154, "global_step": 67854, "epoch": 1615} {"train_loss": -5.997920989990234, "global_step": 67855, "epoch": 1615} {"train_loss": -5.819307804107666, "global_step": 67856, "epoch": 1615} {"train_loss": -5.779270172119141, "global_step": 67857, "epoch": 1615} {"train_loss": -6.012042999267578, "global_step": 67858, "epoch": 1615} {"train_loss": -5.871233940124512, "global_step": 67859, "epoch": 1615} {"train_loss": -5.995938777923584, "global_step": 67860, "epoch": 1615} {"train_loss": -5.965911388397217, "global_step": 67861, "epoch": 1615} {"train_loss": -5.933910369873047, "global_step": 67862, "epoch": 1615} {"train_loss": -6.005555152893066, "global_step": 67863, "epoch": 1615} {"train_loss": -5.829349994659424, "global_step": 67864, "epoch": 1615} {"train_loss": -5.918633460998535, "global_step": 67865, "epoch": 1615} {"train_loss": -5.948383331298828, "global_step": 67866, "epoch": 1615} {"train_loss": -5.836336612701416, "global_step": 67867, "epoch": 1615} {"train_loss": -5.962719917297363, "global_step": 67868, "epoch": 1615} {"train_loss": -5.84548282623291, "global_step": 67869, "epoch": 1615} {"train_loss": -5.937607765197754, "global_step": 67870, "epoch": 1615} {"train_loss": -5.961137828372774, "global_step": 67871, "epoch": 1615, "val_loss": 74231.6640625} {"train_loss": -6.034841537475586, "global_step": 67872, "epoch": 1616} {"train_loss": -5.933117389678955, "global_step": 67873, "epoch": 1616} {"train_loss": -5.914283275604248, "global_step": 67874, "epoch": 1616} {"train_loss": -5.934031009674072, "global_step": 67875, "epoch": 1616} {"train_loss": -5.915078639984131, "global_step": 67876, "epoch": 1616} {"train_loss": -5.850240707397461, "global_step": 67877, "epoch": 1616} {"train_loss": -5.815437316894531, "global_step": 67878, "epoch": 1616} {"train_loss": -5.88806676864624, "global_step": 67879, "epoch": 1616} {"train_loss": -6.109415054321289, "global_step": 67880, "epoch": 1616} {"train_loss": -5.980213642120361, "global_step": 67881, "epoch": 1616} {"train_loss": -6.010190010070801, "global_step": 67882, "epoch": 1616} {"train_loss": -5.96527099609375, "global_step": 67883, "epoch": 1616} {"train_loss": -5.9441046714782715, "global_step": 67884, "epoch": 1616} {"train_loss": -5.944230556488037, "global_step": 67885, "epoch": 1616} {"train_loss": -5.930710315704346, "global_step": 67886, "epoch": 1616} {"train_loss": -5.930899620056152, "global_step": 67887, "epoch": 1616} {"train_loss": -6.033581733703613, "global_step": 67888, "epoch": 1616} {"train_loss": -5.99555778503418, "global_step": 67889, "epoch": 1616} {"train_loss": -5.65899133682251, "global_step": 67890, "epoch": 1616} {"train_loss": -5.979962348937988, "global_step": 67891, "epoch": 1616} {"train_loss": -5.884040832519531, "global_step": 67892, "epoch": 1616} {"train_loss": -6.046878814697266, "global_step": 67893, "epoch": 1616} {"train_loss": -6.103123188018799, "global_step": 67894, "epoch": 1616} {"train_loss": -5.838175296783447, "global_step": 67895, "epoch": 1616} {"train_loss": -6.005681991577148, "global_step": 67896, "epoch": 1616} {"train_loss": -5.842741966247559, "global_step": 67897, "epoch": 1616} {"train_loss": -5.803251266479492, "global_step": 67898, "epoch": 1616} {"train_loss": -6.040168762207031, "global_step": 67899, "epoch": 1616} {"train_loss": -5.87661600112915, "global_step": 67900, "epoch": 1616} {"train_loss": -5.966989517211914, "global_step": 67901, "epoch": 1616} {"train_loss": -5.965799331665039, "global_step": 67902, "epoch": 1616} {"train_loss": -6.004605293273926, "global_step": 67903, "epoch": 1616} {"train_loss": -6.099281311035156, "global_step": 67904, "epoch": 1616} {"train_loss": -6.044380187988281, "global_step": 67905, "epoch": 1616} {"train_loss": -5.928611755371094, "global_step": 67906, "epoch": 1616} {"train_loss": -5.949864387512207, "global_step": 67907, "epoch": 1616} {"train_loss": -5.981265068054199, "global_step": 67908, "epoch": 1616} {"train_loss": -6.038067817687988, "global_step": 67909, "epoch": 1616} {"train_loss": -5.972269058227539, "global_step": 67910, "epoch": 1616} {"train_loss": -6.066311836242676, "global_step": 67911, "epoch": 1616} {"train_loss": -6.093546390533447, "global_step": 67912, "epoch": 1616} {"train_loss": -5.960701942443848, "global_step": 67913, "epoch": 1616, "val_loss": 74906.1640625} {"train_loss": -6.016634941101074, "global_step": 67914, "epoch": 1617} {"train_loss": -6.041412830352783, "global_step": 67915, "epoch": 1617} {"train_loss": -5.979269027709961, "global_step": 67916, "epoch": 1617} {"train_loss": -5.983491897583008, "global_step": 67917, "epoch": 1617} {"train_loss": -6.033972263336182, "global_step": 67918, "epoch": 1617} {"train_loss": -6.135470867156982, "global_step": 67919, "epoch": 1617} {"train_loss": -5.999791145324707, "global_step": 67920, "epoch": 1617} {"train_loss": -6.0189924240112305, "global_step": 67921, "epoch": 1617} {"train_loss": -6.1360063552856445, "global_step": 67922, "epoch": 1617} {"train_loss": -6.140233039855957, "global_step": 67923, "epoch": 1617} {"train_loss": -5.986413955688477, "global_step": 67924, "epoch": 1617} {"train_loss": -6.103947639465332, "global_step": 67925, "epoch": 1617} {"train_loss": -5.968575477600098, "global_step": 67926, "epoch": 1617} {"train_loss": -5.9909772872924805, "global_step": 67927, "epoch": 1617} {"train_loss": -6.00853157043457, "global_step": 67928, "epoch": 1617} {"train_loss": -6.093512535095215, "global_step": 67929, "epoch": 1617} {"train_loss": -6.011228561401367, "global_step": 67930, "epoch": 1617} {"train_loss": -5.9735107421875, "global_step": 67931, "epoch": 1617} {"train_loss": -6.109674453735352, "global_step": 67932, "epoch": 1617} {"train_loss": -6.003647804260254, "global_step": 67933, "epoch": 1617} {"train_loss": -6.06478214263916, "global_step": 67934, "epoch": 1617} {"train_loss": -6.070201873779297, "global_step": 67935, "epoch": 1617} {"train_loss": -6.032816410064697, "global_step": 67936, "epoch": 1617} {"train_loss": -5.911360263824463, "global_step": 67937, "epoch": 1617} {"train_loss": -5.983083724975586, "global_step": 67938, "epoch": 1617} {"train_loss": -5.9368896484375, "global_step": 67939, "epoch": 1617} {"train_loss": -6.062664985656738, "global_step": 67940, "epoch": 1617} {"train_loss": -6.0509161949157715, "global_step": 67941, "epoch": 1617} {"train_loss": -5.982297897338867, "global_step": 67942, "epoch": 1617} {"train_loss": -6.117849349975586, "global_step": 67943, "epoch": 1617} {"train_loss": -6.035168647766113, "global_step": 67944, "epoch": 1617} {"train_loss": -6.094260215759277, "global_step": 67945, "epoch": 1617} {"train_loss": -5.928821563720703, "global_step": 67946, "epoch": 1617} {"train_loss": -5.990694999694824, "global_step": 67947, "epoch": 1617} {"train_loss": -6.010963439941406, "global_step": 67948, "epoch": 1617} {"train_loss": -6.023077011108398, "global_step": 67949, "epoch": 1617} {"train_loss": -6.029508113861084, "global_step": 67950, "epoch": 1617} {"train_loss": -6.059549331665039, "global_step": 67951, "epoch": 1617} {"train_loss": -6.098221302032471, "global_step": 67952, "epoch": 1617} {"train_loss": -5.945512771606445, "global_step": 67953, "epoch": 1617} {"train_loss": -5.868635177612305, "global_step": 67954, "epoch": 1617} {"train_loss": -6.027128616968791, "global_step": 67955, "epoch": 1617, "val_loss": 74665.140625} {"train_loss": -5.953861236572266, "global_step": 67956, "epoch": 1618} {"train_loss": -6.004882335662842, "global_step": 67957, "epoch": 1618} {"train_loss": -5.991260528564453, "global_step": 67958, "epoch": 1618} {"train_loss": -6.095401763916016, "global_step": 67959, "epoch": 1618} {"train_loss": -5.9831037521362305, "global_step": 67960, "epoch": 1618} {"train_loss": -6.065590858459473, "global_step": 67961, "epoch": 1618} {"train_loss": -6.088069915771484, "global_step": 67962, "epoch": 1618} {"train_loss": -5.911576747894287, "global_step": 67963, "epoch": 1618} {"train_loss": -5.934715747833252, "global_step": 67964, "epoch": 1618} {"train_loss": -6.144373893737793, "global_step": 67965, "epoch": 1618} {"train_loss": -6.042850494384766, "global_step": 67966, "epoch": 1618} {"train_loss": -6.005403518676758, "global_step": 67967, "epoch": 1618} {"train_loss": -5.99753999710083, "global_step": 67968, "epoch": 1618} {"train_loss": -5.939542770385742, "global_step": 67969, "epoch": 1618} {"train_loss": -6.051743507385254, "global_step": 67970, "epoch": 1618} {"train_loss": -6.111479759216309, "global_step": 67971, "epoch": 1618} {"train_loss": -6.017538547515869, "global_step": 67972, "epoch": 1618} {"train_loss": -6.0236711502075195, "global_step": 67973, "epoch": 1618} {"train_loss": -5.9201507568359375, "global_step": 67974, "epoch": 1618} {"train_loss": -6.023388862609863, "global_step": 67975, "epoch": 1618} {"train_loss": -6.006101131439209, "global_step": 67976, "epoch": 1618} {"train_loss": -5.957455635070801, "global_step": 67977, "epoch": 1618} {"train_loss": -5.911149501800537, "global_step": 67978, "epoch": 1618} {"train_loss": -5.869782447814941, "global_step": 67979, "epoch": 1618} {"train_loss": -6.0326032638549805, "global_step": 67980, "epoch": 1618} {"train_loss": -6.069703102111816, "global_step": 67981, "epoch": 1618} {"train_loss": -5.92549991607666, "global_step": 67982, "epoch": 1618} {"train_loss": -5.971864223480225, "global_step": 67983, "epoch": 1618} {"train_loss": -5.934171676635742, "global_step": 67984, "epoch": 1618} {"train_loss": -6.005499362945557, "global_step": 67985, "epoch": 1618} {"train_loss": -5.865098476409912, "global_step": 67986, "epoch": 1618} {"train_loss": -5.844701766967773, "global_step": 67987, "epoch": 1618} {"train_loss": -5.862174034118652, "global_step": 67988, "epoch": 1618} {"train_loss": -6.020086765289307, "global_step": 67989, "epoch": 1618} {"train_loss": -5.967717170715332, "global_step": 67990, "epoch": 1618} {"train_loss": -6.013943672180176, "global_step": 67991, "epoch": 1618} {"train_loss": -5.938916206359863, "global_step": 67992, "epoch": 1618} {"train_loss": -6.069065093994141, "global_step": 67993, "epoch": 1618} {"train_loss": -6.04448127746582, "global_step": 67994, "epoch": 1618} {"train_loss": -5.919170379638672, "global_step": 67995, "epoch": 1618} {"train_loss": -5.949276924133301, "global_step": 67996, "epoch": 1618} {"train_loss": -5.988326004573277, "global_step": 67997, "epoch": 1618, "val_loss": 74387.109375} {"train_loss": -6.037938117980957, "global_step": 67998, "epoch": 1619} {"train_loss": -6.049693584442139, "global_step": 67999, "epoch": 1619} {"train_loss": -5.93430233001709, "global_step": 68000, "epoch": 1619} {"train_loss": -6.0971574783325195, "global_step": 68001, "epoch": 1619} {"train_loss": -6.0014190673828125, "global_step": 68002, "epoch": 1619} {"train_loss": -5.881709098815918, "global_step": 68003, "epoch": 1619} {"train_loss": -6.0368804931640625, "global_step": 68004, "epoch": 1619} {"train_loss": -5.832783222198486, "global_step": 68005, "epoch": 1619} {"train_loss": -5.958019256591797, "global_step": 68006, "epoch": 1619} {"train_loss": -5.847579479217529, "global_step": 68007, "epoch": 1619} {"train_loss": -5.991860389709473, "global_step": 68008, "epoch": 1619} {"train_loss": -6.00483512878418, "global_step": 68009, "epoch": 1619} {"train_loss": -6.015494346618652, "global_step": 68010, "epoch": 1619} {"train_loss": -6.001836776733398, "global_step": 68011, "epoch": 1619} {"train_loss": -5.953706741333008, "global_step": 68012, "epoch": 1619} {"train_loss": -5.949066162109375, "global_step": 68013, "epoch": 1619} {"train_loss": -5.886239051818848, "global_step": 68014, "epoch": 1619} {"train_loss": -6.050793647766113, "global_step": 68015, "epoch": 1619} {"train_loss": -6.069470405578613, "global_step": 68016, "epoch": 1619} {"train_loss": -6.0416669845581055, "global_step": 68017, "epoch": 1619} {"train_loss": -6.012845993041992, "global_step": 68018, "epoch": 1619} {"train_loss": -5.998970985412598, "global_step": 68019, "epoch": 1619} {"train_loss": -5.939568519592285, "global_step": 68020, "epoch": 1619} {"train_loss": -6.0328264236450195, "global_step": 68021, "epoch": 1619} {"train_loss": -5.8905487060546875, "global_step": 68022, "epoch": 1619} {"train_loss": -6.0183024406433105, "global_step": 68023, "epoch": 1619} {"train_loss": -6.015887260437012, "global_step": 68024, "epoch": 1619} {"train_loss": -6.0850982666015625, "global_step": 68025, "epoch": 1619} {"train_loss": -6.053837776184082, "global_step": 68026, "epoch": 1619} {"train_loss": -6.06316614151001, "global_step": 68027, "epoch": 1619} {"train_loss": -5.975498199462891, "global_step": 68028, "epoch": 1619} {"train_loss": -5.986276626586914, "global_step": 68029, "epoch": 1619} {"train_loss": -5.9888811111450195, "global_step": 68030, "epoch": 1619} {"train_loss": -5.969082355499268, "global_step": 68031, "epoch": 1619} {"train_loss": -5.96390438079834, "global_step": 68032, "epoch": 1619} {"train_loss": -5.919269561767578, "global_step": 68033, "epoch": 1619} {"train_loss": -5.877708435058594, "global_step": 68034, "epoch": 1619} {"train_loss": -5.99059534072876, "global_step": 68035, "epoch": 1619} {"train_loss": -6.051431655883789, "global_step": 68036, "epoch": 1619} {"train_loss": -6.014004230499268, "global_step": 68037, "epoch": 1619} {"train_loss": -6.065676689147949, "global_step": 68038, "epoch": 1619} {"train_loss": -5.986881664821079, "global_step": 68039, "epoch": 1619, "val_loss": 74768.15625} {"train_loss": -6.0410661697387695, "global_step": 68040, "epoch": 1620} {"train_loss": -6.055602073669434, "global_step": 68041, "epoch": 1620} {"train_loss": -5.875838279724121, "global_step": 68042, "epoch": 1620} {"train_loss": -5.962033271789551, "global_step": 68043, "epoch": 1620} {"train_loss": -5.860452175140381, "global_step": 68044, "epoch": 1620} {"train_loss": -6.056985855102539, "global_step": 68045, "epoch": 1620} {"train_loss": -5.87985897064209, "global_step": 68046, "epoch": 1620} {"train_loss": -6.043342113494873, "global_step": 68047, "epoch": 1620} {"train_loss": -5.817448616027832, "global_step": 68048, "epoch": 1620} {"train_loss": -6.132453918457031, "global_step": 68049, "epoch": 1620} {"train_loss": -6.049952507019043, "global_step": 68050, "epoch": 1620} {"train_loss": -6.130466461181641, "global_step": 68051, "epoch": 1620} {"train_loss": -5.958524227142334, "global_step": 68052, "epoch": 1620} {"train_loss": -5.993769645690918, "global_step": 68053, "epoch": 1620} {"train_loss": -6.096713066101074, "global_step": 68054, "epoch": 1620} {"train_loss": -5.973642349243164, "global_step": 68055, "epoch": 1620} {"train_loss": -6.033134460449219, "global_step": 68056, "epoch": 1620} {"train_loss": -6.014945983886719, "global_step": 68057, "epoch": 1620} {"train_loss": -6.071610450744629, "global_step": 68058, "epoch": 1620} {"train_loss": -6.0319037437438965, "global_step": 68059, "epoch": 1620} {"train_loss": -6.013055801391602, "global_step": 68060, "epoch": 1620} {"train_loss": -5.98490047454834, "global_step": 68061, "epoch": 1620} {"train_loss": -6.025018692016602, "global_step": 68062, "epoch": 1620} {"train_loss": -5.934690475463867, "global_step": 68063, "epoch": 1620} {"train_loss": -6.02530574798584, "global_step": 68064, "epoch": 1620} {"train_loss": -6.0195465087890625, "global_step": 68065, "epoch": 1620} {"train_loss": -5.902912616729736, "global_step": 68066, "epoch": 1620} {"train_loss": -5.912541389465332, "global_step": 68067, "epoch": 1620} {"train_loss": -6.058078289031982, "global_step": 68068, "epoch": 1620} {"train_loss": -5.920239448547363, "global_step": 68069, "epoch": 1620} {"train_loss": -5.996890068054199, "global_step": 68070, "epoch": 1620} {"train_loss": -6.110850811004639, "global_step": 68071, "epoch": 1620} {"train_loss": -5.892367839813232, "global_step": 68072, "epoch": 1620} {"train_loss": -5.921789169311523, "global_step": 68073, "epoch": 1620} {"train_loss": -5.870305061340332, "global_step": 68074, "epoch": 1620} {"train_loss": -5.8614606857299805, "global_step": 68075, "epoch": 1620} {"train_loss": -5.867769718170166, "global_step": 68076, "epoch": 1620} {"train_loss": -6.041560173034668, "global_step": 68077, "epoch": 1620} {"train_loss": -5.998051643371582, "global_step": 68078, "epoch": 1620} {"train_loss": -6.0430402755737305, "global_step": 68079, "epoch": 1620} {"train_loss": -5.952145576477051, "global_step": 68080, "epoch": 1620} {"train_loss": -5.979350680396671, "global_step": 68081, "epoch": 1620, "val_loss": 74762.328125} {"train_loss": -6.003232955932617, "global_step": 68082, "epoch": 1621} {"train_loss": -5.959599018096924, "global_step": 68083, "epoch": 1621} {"train_loss": -6.0135498046875, "global_step": 68084, "epoch": 1621} {"train_loss": -6.013370990753174, "global_step": 68085, "epoch": 1621} {"train_loss": -6.06806755065918, "global_step": 68086, "epoch": 1621} {"train_loss": -6.056013107299805, "global_step": 68087, "epoch": 1621} {"train_loss": -6.007320404052734, "global_step": 68088, "epoch": 1621} {"train_loss": -6.041193008422852, "global_step": 68089, "epoch": 1621} {"train_loss": -5.93690299987793, "global_step": 68090, "epoch": 1621} {"train_loss": -6.066802978515625, "global_step": 68091, "epoch": 1621} {"train_loss": -5.941571235656738, "global_step": 68092, "epoch": 1621} {"train_loss": -6.015190124511719, "global_step": 68093, "epoch": 1621} {"train_loss": -6.0096435546875, "global_step": 68094, "epoch": 1621} {"train_loss": -5.994510650634766, "global_step": 68095, "epoch": 1621} {"train_loss": -6.054841041564941, "global_step": 68096, "epoch": 1621} {"train_loss": -5.970324516296387, "global_step": 68097, "epoch": 1621} {"train_loss": -6.019341468811035, "global_step": 68098, "epoch": 1621} {"train_loss": -6.0535383224487305, "global_step": 68099, "epoch": 1621} {"train_loss": -5.873976707458496, "global_step": 68100, "epoch": 1621} {"train_loss": -6.015203952789307, "global_step": 68101, "epoch": 1621} {"train_loss": -6.025467395782471, "global_step": 68102, "epoch": 1621} {"train_loss": -6.014952659606934, "global_step": 68103, "epoch": 1621} {"train_loss": -5.990403175354004, "global_step": 68104, "epoch": 1621} {"train_loss": -6.065097332000732, "global_step": 68105, "epoch": 1621} {"train_loss": -6.022686004638672, "global_step": 68106, "epoch": 1621} {"train_loss": -6.195068359375, "global_step": 68107, "epoch": 1621} {"train_loss": -5.972825050354004, "global_step": 68108, "epoch": 1621} {"train_loss": -5.893169403076172, "global_step": 68109, "epoch": 1621} {"train_loss": -6.015588283538818, "global_step": 68110, "epoch": 1621} {"train_loss": -5.994866847991943, "global_step": 68111, "epoch": 1621} {"train_loss": -5.880732536315918, "global_step": 68112, "epoch": 1621} {"train_loss": -5.947580337524414, "global_step": 68113, "epoch": 1621} {"train_loss": -6.073925018310547, "global_step": 68114, "epoch": 1621} {"train_loss": -6.037964820861816, "global_step": 68115, "epoch": 1621} {"train_loss": -5.989429473876953, "global_step": 68116, "epoch": 1621} {"train_loss": -5.973501205444336, "global_step": 68117, "epoch": 1621} {"train_loss": -5.991552352905273, "global_step": 68118, "epoch": 1621} {"train_loss": -5.9211273193359375, "global_step": 68119, "epoch": 1621} {"train_loss": -5.996980667114258, "global_step": 68120, "epoch": 1621} {"train_loss": -5.891719818115234, "global_step": 68121, "epoch": 1621} {"train_loss": -6.1024017333984375, "global_step": 68122, "epoch": 1621} {"train_loss": -6.001700866790045, "global_step": 68123, "epoch": 1621, "val_loss": 74649.984375} {"train_loss": -5.957235336303711, "global_step": 68124, "epoch": 1622} {"train_loss": -5.902924060821533, "global_step": 68125, "epoch": 1622} {"train_loss": -5.95008659362793, "global_step": 68126, "epoch": 1622} {"train_loss": -5.996826171875, "global_step": 68127, "epoch": 1622} {"train_loss": -6.089023590087891, "global_step": 68128, "epoch": 1622} {"train_loss": -5.96854829788208, "global_step": 68129, "epoch": 1622} {"train_loss": -6.07930850982666, "global_step": 68130, "epoch": 1622} {"train_loss": -5.959481239318848, "global_step": 68131, "epoch": 1622} {"train_loss": -6.048501014709473, "global_step": 68132, "epoch": 1622} {"train_loss": -6.113205909729004, "global_step": 68133, "epoch": 1622} {"train_loss": -5.7881927490234375, "global_step": 68134, "epoch": 1622} {"train_loss": -5.908977508544922, "global_step": 68135, "epoch": 1622} {"train_loss": -5.874616622924805, "global_step": 68136, "epoch": 1622} {"train_loss": -6.110152244567871, "global_step": 68137, "epoch": 1622} {"train_loss": -5.921332836151123, "global_step": 68138, "epoch": 1622} {"train_loss": -6.034196853637695, "global_step": 68139, "epoch": 1622} {"train_loss": -6.036336421966553, "global_step": 68140, "epoch": 1622} {"train_loss": -6.078139305114746, "global_step": 68141, "epoch": 1622} {"train_loss": -6.022953987121582, "global_step": 68142, "epoch": 1622} {"train_loss": -6.0763936042785645, "global_step": 68143, "epoch": 1622} {"train_loss": -6.0217390060424805, "global_step": 68144, "epoch": 1622} {"train_loss": -5.992761611938477, "global_step": 68145, "epoch": 1622} {"train_loss": -5.9567461013793945, "global_step": 68146, "epoch": 1622} {"train_loss": -5.942469120025635, "global_step": 68147, "epoch": 1622} {"train_loss": -5.9103803634643555, "global_step": 68148, "epoch": 1622} {"train_loss": -5.884909152984619, "global_step": 68149, "epoch": 1622} {"train_loss": -6.032200813293457, "global_step": 68150, "epoch": 1622} {"train_loss": -5.9507856369018555, "global_step": 68151, "epoch": 1622} {"train_loss": -5.891594886779785, "global_step": 68152, "epoch": 1622} {"train_loss": -5.931197166442871, "global_step": 68153, "epoch": 1622} {"train_loss": -5.97838020324707, "global_step": 68154, "epoch": 1622} {"train_loss": -5.898632049560547, "global_step": 68155, "epoch": 1622} {"train_loss": -5.910726547241211, "global_step": 68156, "epoch": 1622} {"train_loss": -6.069571495056152, "global_step": 68157, "epoch": 1622} {"train_loss": -5.918023109436035, "global_step": 68158, "epoch": 1622} {"train_loss": -5.950295925140381, "global_step": 68159, "epoch": 1622} {"train_loss": -5.873744964599609, "global_step": 68160, "epoch": 1622} {"train_loss": -5.885965347290039, "global_step": 68161, "epoch": 1622} {"train_loss": -6.03953742980957, "global_step": 68162, "epoch": 1622} {"train_loss": -5.90158224105835, "global_step": 68163, "epoch": 1622} {"train_loss": -5.9450273513793945, "global_step": 68164, "epoch": 1622} {"train_loss": -5.972284646261306, "global_step": 68165, "epoch": 1622, "val_loss": 74607.1796875} {"train_loss": -5.964269638061523, "global_step": 68166, "epoch": 1623} {"train_loss": -6.004709243774414, "global_step": 68167, "epoch": 1623} {"train_loss": -6.019680500030518, "global_step": 68168, "epoch": 1623} {"train_loss": -5.909071922302246, "global_step": 68169, "epoch": 1623} {"train_loss": -6.009220123291016, "global_step": 68170, "epoch": 1623} {"train_loss": -6.033424377441406, "global_step": 68171, "epoch": 1623} {"train_loss": -6.033401012420654, "global_step": 68172, "epoch": 1623} {"train_loss": -5.959146499633789, "global_step": 68173, "epoch": 1623} {"train_loss": -6.041577339172363, "global_step": 68174, "epoch": 1623} {"train_loss": -5.969915866851807, "global_step": 68175, "epoch": 1623} {"train_loss": -6.022930145263672, "global_step": 68176, "epoch": 1623} {"train_loss": -5.9486799240112305, "global_step": 68177, "epoch": 1623} {"train_loss": -5.945740699768066, "global_step": 68178, "epoch": 1623} {"train_loss": -5.904118537902832, "global_step": 68179, "epoch": 1623} {"train_loss": -5.972440242767334, "global_step": 68180, "epoch": 1623} {"train_loss": -5.927702903747559, "global_step": 68181, "epoch": 1623} {"train_loss": -5.968581676483154, "global_step": 68182, "epoch": 1623} {"train_loss": -6.005441188812256, "global_step": 68183, "epoch": 1623} {"train_loss": -6.017742156982422, "global_step": 68184, "epoch": 1623} {"train_loss": -6.064249515533447, "global_step": 68185, "epoch": 1623} {"train_loss": -5.866473197937012, "global_step": 68186, "epoch": 1623} {"train_loss": -5.855483055114746, "global_step": 68187, "epoch": 1623} {"train_loss": -5.980759620666504, "global_step": 68188, "epoch": 1623} {"train_loss": -5.866327285766602, "global_step": 68189, "epoch": 1623} {"train_loss": -5.824527740478516, "global_step": 68190, "epoch": 1623} {"train_loss": -6.1237077713012695, "global_step": 68191, "epoch": 1623} {"train_loss": -5.747334003448486, "global_step": 68192, "epoch": 1623} {"train_loss": -5.9511518478393555, "global_step": 68193, "epoch": 1623} {"train_loss": -5.9433183670043945, "global_step": 68194, "epoch": 1623} {"train_loss": -5.966845989227295, "global_step": 68195, "epoch": 1623} {"train_loss": -5.826225757598877, "global_step": 68196, "epoch": 1623} {"train_loss": -5.988271713256836, "global_step": 68197, "epoch": 1623} {"train_loss": -5.959856986999512, "global_step": 68198, "epoch": 1623} {"train_loss": -5.917103290557861, "global_step": 68199, "epoch": 1623} {"train_loss": -6.039228439331055, "global_step": 68200, "epoch": 1623} {"train_loss": -6.039824485778809, "global_step": 68201, "epoch": 1623} {"train_loss": -5.995419979095459, "global_step": 68202, "epoch": 1623} {"train_loss": -6.08309268951416, "global_step": 68203, "epoch": 1623} {"train_loss": -6.006495475769043, "global_step": 68204, "epoch": 1623} {"train_loss": -5.904269695281982, "global_step": 68205, "epoch": 1623} {"train_loss": -6.04380989074707, "global_step": 68206, "epoch": 1623} {"train_loss": -5.968597650527954, "global_step": 68207, "epoch": 1623, "val_loss": 74487.1484375} {"train_loss": -6.087192535400391, "global_step": 68208, "epoch": 1624} {"train_loss": -5.853967189788818, "global_step": 68209, "epoch": 1624} {"train_loss": -5.83062744140625, "global_step": 68210, "epoch": 1624} {"train_loss": -6.006499290466309, "global_step": 68211, "epoch": 1624} {"train_loss": -5.949819564819336, "global_step": 68212, "epoch": 1624} {"train_loss": -5.877824306488037, "global_step": 68213, "epoch": 1624} {"train_loss": -5.87191915512085, "global_step": 68214, "epoch": 1624} {"train_loss": -5.905109405517578, "global_step": 68215, "epoch": 1624} {"train_loss": -5.983545780181885, "global_step": 68216, "epoch": 1624} {"train_loss": -5.942731857299805, "global_step": 68217, "epoch": 1624} {"train_loss": -5.904272079467773, "global_step": 68218, "epoch": 1624} {"train_loss": -6.073529243469238, "global_step": 68219, "epoch": 1624} {"train_loss": -6.026968002319336, "global_step": 68220, "epoch": 1624} {"train_loss": -6.1355133056640625, "global_step": 68221, "epoch": 1624} {"train_loss": -5.947041988372803, "global_step": 68222, "epoch": 1624} {"train_loss": -5.981934547424316, "global_step": 68223, "epoch": 1624} {"train_loss": -5.9845290184021, "global_step": 68224, "epoch": 1624} {"train_loss": -6.179619312286377, "global_step": 68225, "epoch": 1624} {"train_loss": -6.023576259613037, "global_step": 68226, "epoch": 1624} {"train_loss": -6.116945743560791, "global_step": 68227, "epoch": 1624} {"train_loss": -6.0996809005737305, "global_step": 68228, "epoch": 1624} {"train_loss": -5.971909523010254, "global_step": 68229, "epoch": 1624} {"train_loss": -6.031121730804443, "global_step": 68230, "epoch": 1624} {"train_loss": -6.101187705993652, "global_step": 68231, "epoch": 1624} {"train_loss": -6.05420446395874, "global_step": 68232, "epoch": 1624} {"train_loss": -6.058539390563965, "global_step": 68233, "epoch": 1624} {"train_loss": -6.067781448364258, "global_step": 68234, "epoch": 1624} {"train_loss": -6.146787166595459, "global_step": 68235, "epoch": 1624} {"train_loss": -5.982367515563965, "global_step": 68236, "epoch": 1624} {"train_loss": -5.951125144958496, "global_step": 68237, "epoch": 1624} {"train_loss": -6.078407287597656, "global_step": 68238, "epoch": 1624} {"train_loss": -5.970717430114746, "global_step": 68239, "epoch": 1624} {"train_loss": -5.979386329650879, "global_step": 68240, "epoch": 1624} {"train_loss": -6.145106792449951, "global_step": 68241, "epoch": 1624} {"train_loss": -6.050198554992676, "global_step": 68242, "epoch": 1624} {"train_loss": -6.000861167907715, "global_step": 68243, "epoch": 1624} {"train_loss": -6.047418117523193, "global_step": 68244, "epoch": 1624} {"train_loss": -6.02126407623291, "global_step": 68245, "epoch": 1624} {"train_loss": -6.023080825805664, "global_step": 68246, "epoch": 1624} {"train_loss": -5.993436813354492, "global_step": 68247, "epoch": 1624} {"train_loss": -6.06342887878418, "global_step": 68248, "epoch": 1624} {"train_loss": -6.013114713487171, "global_step": 68249, "epoch": 1624, "val_loss": 74676.6015625} {"train_loss": -5.984748363494873, "global_step": 68250, "epoch": 1625} {"train_loss": -6.129688262939453, "global_step": 68251, "epoch": 1625} {"train_loss": -6.005138397216797, "global_step": 68252, "epoch": 1625} {"train_loss": -6.14996337890625, "global_step": 68253, "epoch": 1625} {"train_loss": -5.861215591430664, "global_step": 68254, "epoch": 1625} {"train_loss": -6.044926166534424, "global_step": 68255, "epoch": 1625} {"train_loss": -5.935024261474609, "global_step": 68256, "epoch": 1625} {"train_loss": -6.062097072601318, "global_step": 68257, "epoch": 1625} {"train_loss": -6.08988094329834, "global_step": 68258, "epoch": 1625} {"train_loss": -5.92168664932251, "global_step": 68259, "epoch": 1625} {"train_loss": -6.138486862182617, "global_step": 68260, "epoch": 1625} {"train_loss": -6.087973594665527, "global_step": 68261, "epoch": 1625} {"train_loss": -6.011687278747559, "global_step": 68262, "epoch": 1625} {"train_loss": -6.097110271453857, "global_step": 68263, "epoch": 1625} {"train_loss": -6.10715389251709, "global_step": 68264, "epoch": 1625} {"train_loss": -6.07773494720459, "global_step": 68265, "epoch": 1625} {"train_loss": -6.047490119934082, "global_step": 68266, "epoch": 1625} {"train_loss": -6.034317970275879, "global_step": 68267, "epoch": 1625} {"train_loss": -5.883415699005127, "global_step": 68268, "epoch": 1625} {"train_loss": -6.090512275695801, "global_step": 68269, "epoch": 1625} {"train_loss": -6.0277018547058105, "global_step": 68270, "epoch": 1625} {"train_loss": -5.962281227111816, "global_step": 68271, "epoch": 1625} {"train_loss": -6.060135841369629, "global_step": 68272, "epoch": 1625} {"train_loss": -6.007663726806641, "global_step": 68273, "epoch": 1625} {"train_loss": -5.8669328689575195, "global_step": 68274, "epoch": 1625} {"train_loss": -6.11672830581665, "global_step": 68275, "epoch": 1625} {"train_loss": -6.116299629211426, "global_step": 68276, "epoch": 1625} {"train_loss": -6.018418788909912, "global_step": 68277, "epoch": 1625} {"train_loss": -6.0011186599731445, "global_step": 68278, "epoch": 1625} {"train_loss": -6.010605812072754, "global_step": 68279, "epoch": 1625} {"train_loss": -5.896331787109375, "global_step": 68280, "epoch": 1625} {"train_loss": -6.024525165557861, "global_step": 68281, "epoch": 1625} {"train_loss": -6.097350597381592, "global_step": 68282, "epoch": 1625} {"train_loss": -6.01283597946167, "global_step": 68283, "epoch": 1625} {"train_loss": -5.980923652648926, "global_step": 68284, "epoch": 1625} {"train_loss": -5.981839179992676, "global_step": 68285, "epoch": 1625} {"train_loss": -5.835153579711914, "global_step": 68286, "epoch": 1625} {"train_loss": -6.074316501617432, "global_step": 68287, "epoch": 1625} {"train_loss": -5.976783275604248, "global_step": 68288, "epoch": 1625} {"train_loss": -6.018820762634277, "global_step": 68289, "epoch": 1625} {"train_loss": -5.9798583984375, "global_step": 68290, "epoch": 1625} {"train_loss": -6.018815880730038, "global_step": 68291, "epoch": 1625, "val_loss": 74856.78125} {"train_loss": -5.98967981338501, "global_step": 68292, "epoch": 1626} {"train_loss": -5.991018295288086, "global_step": 68293, "epoch": 1626} {"train_loss": -5.9851298332214355, "global_step": 68294, "epoch": 1626} {"train_loss": -5.975629806518555, "global_step": 68295, "epoch": 1626} {"train_loss": -6.078039169311523, "global_step": 68296, "epoch": 1626} {"train_loss": -6.102357864379883, "global_step": 68297, "epoch": 1626} {"train_loss": -5.947698593139648, "global_step": 68298, "epoch": 1626} {"train_loss": -6.068727016448975, "global_step": 68299, "epoch": 1626} {"train_loss": -5.970352649688721, "global_step": 68300, "epoch": 1626} {"train_loss": -5.975687503814697, "global_step": 68301, "epoch": 1626} {"train_loss": -6.019050598144531, "global_step": 68302, "epoch": 1626} {"train_loss": -5.93351936340332, "global_step": 68303, "epoch": 1626} {"train_loss": -6.052755832672119, "global_step": 68304, "epoch": 1626} {"train_loss": -6.03300666809082, "global_step": 68305, "epoch": 1626} {"train_loss": -6.0780158042907715, "global_step": 68306, "epoch": 1626} {"train_loss": -6.034635543823242, "global_step": 68307, "epoch": 1626} {"train_loss": -5.954355239868164, "global_step": 68308, "epoch": 1626} {"train_loss": -6.0173492431640625, "global_step": 68309, "epoch": 1626} {"train_loss": -6.103827953338623, "global_step": 68310, "epoch": 1626} {"train_loss": -6.040109634399414, "global_step": 68311, "epoch": 1626} {"train_loss": -6.07047176361084, "global_step": 68312, "epoch": 1626} {"train_loss": -6.014552593231201, "global_step": 68313, "epoch": 1626} {"train_loss": -5.974673271179199, "global_step": 68314, "epoch": 1626} {"train_loss": -6.123412132263184, "global_step": 68315, "epoch": 1626} {"train_loss": -5.9674835205078125, "global_step": 68316, "epoch": 1626} {"train_loss": -5.909763336181641, "global_step": 68317, "epoch": 1626} {"train_loss": -5.953238010406494, "global_step": 68318, "epoch": 1626} {"train_loss": -6.014866828918457, "global_step": 68319, "epoch": 1626} {"train_loss": -6.0390753746032715, "global_step": 68320, "epoch": 1626} {"train_loss": -5.948482990264893, "global_step": 68321, "epoch": 1626} {"train_loss": -6.03702974319458, "global_step": 68322, "epoch": 1626} {"train_loss": -5.981107711791992, "global_step": 68323, "epoch": 1626} {"train_loss": -6.015805721282959, "global_step": 68324, "epoch": 1626} {"train_loss": -5.983978748321533, "global_step": 68325, "epoch": 1626} {"train_loss": -5.947432518005371, "global_step": 68326, "epoch": 1626} {"train_loss": -5.96266508102417, "global_step": 68327, "epoch": 1626} {"train_loss": -5.952813148498535, "global_step": 68328, "epoch": 1626} {"train_loss": -6.011096000671387, "global_step": 68329, "epoch": 1626} {"train_loss": -6.000018119812012, "global_step": 68330, "epoch": 1626} {"train_loss": -5.950769424438477, "global_step": 68331, "epoch": 1626} {"train_loss": -5.961163520812988, "global_step": 68332, "epoch": 1626} {"train_loss": -6.003544103531611, "global_step": 68333, "epoch": 1626, "val_loss": 74481.859375} {"train_loss": -6.067598819732666, "global_step": 68334, "epoch": 1627} {"train_loss": -6.008415222167969, "global_step": 68335, "epoch": 1627} {"train_loss": -5.926426887512207, "global_step": 68336, "epoch": 1627} {"train_loss": -6.049023628234863, "global_step": 68337, "epoch": 1627} {"train_loss": -5.932673454284668, "global_step": 68338, "epoch": 1627} {"train_loss": -5.976946830749512, "global_step": 68339, "epoch": 1627} {"train_loss": -6.054695129394531, "global_step": 68340, "epoch": 1627} {"train_loss": -6.006422996520996, "global_step": 68341, "epoch": 1627} {"train_loss": -6.019586563110352, "global_step": 68342, "epoch": 1627} {"train_loss": -6.0551838874816895, "global_step": 68343, "epoch": 1627} {"train_loss": -6.000042915344238, "global_step": 68344, "epoch": 1627} {"train_loss": -6.070418357849121, "global_step": 68345, "epoch": 1627} {"train_loss": -5.989786148071289, "global_step": 68346, "epoch": 1627} {"train_loss": -6.108359336853027, "global_step": 68347, "epoch": 1627} {"train_loss": -6.060666084289551, "global_step": 68348, "epoch": 1627} {"train_loss": -6.076666355133057, "global_step": 68349, "epoch": 1627} {"train_loss": -6.023438453674316, "global_step": 68350, "epoch": 1627} {"train_loss": -5.98998498916626, "global_step": 68351, "epoch": 1627} {"train_loss": -5.996391296386719, "global_step": 68352, "epoch": 1627} {"train_loss": -5.9319071769714355, "global_step": 68353, "epoch": 1627} {"train_loss": -5.924713134765625, "global_step": 68354, "epoch": 1627} {"train_loss": -6.104808807373047, "global_step": 68355, "epoch": 1627} {"train_loss": -6.116552352905273, "global_step": 68356, "epoch": 1627} {"train_loss": -5.998475074768066, "global_step": 68357, "epoch": 1627} {"train_loss": -6.054039478302002, "global_step": 68358, "epoch": 1627} {"train_loss": -5.918371677398682, "global_step": 68359, "epoch": 1627} {"train_loss": -6.054181098937988, "global_step": 68360, "epoch": 1627} {"train_loss": -6.1680450439453125, "global_step": 68361, "epoch": 1627} {"train_loss": -6.061108112335205, "global_step": 68362, "epoch": 1627} {"train_loss": -6.136594295501709, "global_step": 68363, "epoch": 1627} {"train_loss": -6.026643753051758, "global_step": 68364, "epoch": 1627} {"train_loss": -6.039353847503662, "global_step": 68365, "epoch": 1627} {"train_loss": -6.025694370269775, "global_step": 68366, "epoch": 1627} {"train_loss": -6.0188374519348145, "global_step": 68367, "epoch": 1627} {"train_loss": -6.017760276794434, "global_step": 68368, "epoch": 1627} {"train_loss": -6.097243309020996, "global_step": 68369, "epoch": 1627} {"train_loss": -5.834067344665527, "global_step": 68370, "epoch": 1627} {"train_loss": -5.968520164489746, "global_step": 68371, "epoch": 1627} {"train_loss": -5.874331474304199, "global_step": 68372, "epoch": 1627} {"train_loss": -5.92469596862793, "global_step": 68373, "epoch": 1627} {"train_loss": -5.774242877960205, "global_step": 68374, "epoch": 1627} {"train_loss": -6.009887547720046, "global_step": 68375, "epoch": 1627, "val_loss": 74847.6640625} {"train_loss": -5.977952003479004, "global_step": 68376, "epoch": 1628} {"train_loss": -5.955089569091797, "global_step": 68377, "epoch": 1628} {"train_loss": -6.055050849914551, "global_step": 68378, "epoch": 1628} {"train_loss": -5.935985088348389, "global_step": 68379, "epoch": 1628} {"train_loss": -5.96260929107666, "global_step": 68380, "epoch": 1628} {"train_loss": -5.962752819061279, "global_step": 68381, "epoch": 1628} {"train_loss": -6.039700508117676, "global_step": 68382, "epoch": 1628} {"train_loss": -6.003220558166504, "global_step": 68383, "epoch": 1628} {"train_loss": -5.920182228088379, "global_step": 68384, "epoch": 1628} {"train_loss": -5.903016090393066, "global_step": 68385, "epoch": 1628} {"train_loss": -5.835621356964111, "global_step": 68386, "epoch": 1628} {"train_loss": -6.019999027252197, "global_step": 68387, "epoch": 1628} {"train_loss": -6.059205055236816, "global_step": 68388, "epoch": 1628} {"train_loss": -5.787017345428467, "global_step": 68389, "epoch": 1628} {"train_loss": -6.038320541381836, "global_step": 68390, "epoch": 1628} {"train_loss": -5.816544055938721, "global_step": 68391, "epoch": 1628} {"train_loss": -5.732832908630371, "global_step": 68392, "epoch": 1628} {"train_loss": -6.010410308837891, "global_step": 68393, "epoch": 1628} {"train_loss": -5.837388038635254, "global_step": 68394, "epoch": 1628} {"train_loss": -5.866310119628906, "global_step": 68395, "epoch": 1628} {"train_loss": -5.858602523803711, "global_step": 68396, "epoch": 1628} {"train_loss": -5.829018592834473, "global_step": 68397, "epoch": 1628} {"train_loss": -6.012232780456543, "global_step": 68398, "epoch": 1628} {"train_loss": -5.899045944213867, "global_step": 68399, "epoch": 1628} {"train_loss": -6.002925872802734, "global_step": 68400, "epoch": 1628} {"train_loss": -6.046236991882324, "global_step": 68401, "epoch": 1628} {"train_loss": -6.008772850036621, "global_step": 68402, "epoch": 1628} {"train_loss": -5.890278339385986, "global_step": 68403, "epoch": 1628} {"train_loss": -6.05256462097168, "global_step": 68404, "epoch": 1628} {"train_loss": -5.822271347045898, "global_step": 68405, "epoch": 1628} {"train_loss": -6.040329456329346, "global_step": 68406, "epoch": 1628} {"train_loss": -5.8924560546875, "global_step": 68407, "epoch": 1628} {"train_loss": -6.00652551651001, "global_step": 68408, "epoch": 1628} {"train_loss": -5.998773574829102, "global_step": 68409, "epoch": 1628} {"train_loss": -6.026444435119629, "global_step": 68410, "epoch": 1628} {"train_loss": -5.968498229980469, "global_step": 68411, "epoch": 1628} {"train_loss": -6.00007438659668, "global_step": 68412, "epoch": 1628} {"train_loss": -6.0296630859375, "global_step": 68413, "epoch": 1628} {"train_loss": -5.922106742858887, "global_step": 68414, "epoch": 1628} {"train_loss": -5.928305625915527, "global_step": 68415, "epoch": 1628} {"train_loss": -5.946805953979492, "global_step": 68416, "epoch": 1628} {"train_loss": -5.948611293520246, "global_step": 68417, "epoch": 1628, "val_loss": 74467.7734375} {"train_loss": -6.089531421661377, "global_step": 68418, "epoch": 1629} {"train_loss": -5.988131523132324, "global_step": 68419, "epoch": 1629} {"train_loss": -5.894829750061035, "global_step": 68420, "epoch": 1629} {"train_loss": -5.967113971710205, "global_step": 68421, "epoch": 1629} {"train_loss": -5.88284158706665, "global_step": 68422, "epoch": 1629} {"train_loss": -5.986072540283203, "global_step": 68423, "epoch": 1629} {"train_loss": -6.120656967163086, "global_step": 68424, "epoch": 1629} {"train_loss": -5.881131172180176, "global_step": 68425, "epoch": 1629} {"train_loss": -6.033712387084961, "global_step": 68426, "epoch": 1629} {"train_loss": -6.023019790649414, "global_step": 68427, "epoch": 1629} {"train_loss": -5.930013656616211, "global_step": 68428, "epoch": 1629} {"train_loss": -6.036738872528076, "global_step": 68429, "epoch": 1629} {"train_loss": -5.861988544464111, "global_step": 68430, "epoch": 1629} {"train_loss": -6.000588417053223, "global_step": 68431, "epoch": 1629} {"train_loss": -6.012664794921875, "global_step": 68432, "epoch": 1629} {"train_loss": -5.8587565422058105, "global_step": 68433, "epoch": 1629} {"train_loss": -5.964613437652588, "global_step": 68434, "epoch": 1629} {"train_loss": -5.978555679321289, "global_step": 68435, "epoch": 1629} {"train_loss": -5.966042518615723, "global_step": 68436, "epoch": 1629} {"train_loss": -6.128498077392578, "global_step": 68437, "epoch": 1629} {"train_loss": -6.050134658813477, "global_step": 68438, "epoch": 1629} {"train_loss": -5.994671821594238, "global_step": 68439, "epoch": 1629} {"train_loss": -6.006887435913086, "global_step": 68440, "epoch": 1629} {"train_loss": -6.057446479797363, "global_step": 68441, "epoch": 1629} {"train_loss": -6.038919925689697, "global_step": 68442, "epoch": 1629} {"train_loss": -5.9999518394470215, "global_step": 68443, "epoch": 1629} {"train_loss": -6.004423141479492, "global_step": 68444, "epoch": 1629} {"train_loss": -5.952722072601318, "global_step": 68445, "epoch": 1629} {"train_loss": -5.917799949645996, "global_step": 68446, "epoch": 1629} {"train_loss": -6.085497856140137, "global_step": 68447, "epoch": 1629} {"train_loss": -5.985982894897461, "global_step": 68448, "epoch": 1629} {"train_loss": -5.891602039337158, "global_step": 68449, "epoch": 1629} {"train_loss": -6.0176849365234375, "global_step": 68450, "epoch": 1629} {"train_loss": -5.899019241333008, "global_step": 68451, "epoch": 1629} {"train_loss": -6.031411170959473, "global_step": 68452, "epoch": 1629} {"train_loss": -6.219180107116699, "global_step": 68453, "epoch": 1629} {"train_loss": -6.000115394592285, "global_step": 68454, "epoch": 1629} {"train_loss": -6.029288291931152, "global_step": 68455, "epoch": 1629} {"train_loss": -6.063538074493408, "global_step": 68456, "epoch": 1629} {"train_loss": -6.01897668838501, "global_step": 68457, "epoch": 1629} {"train_loss": -5.926604270935059, "global_step": 68458, "epoch": 1629} {"train_loss": -5.997548114685785, "global_step": 68459, "epoch": 1629, "val_loss": 74761.515625} {"train_loss": -6.169416427612305, "global_step": 68460, "epoch": 1630} {"train_loss": -5.925515651702881, "global_step": 68461, "epoch": 1630} {"train_loss": -6.1061625480651855, "global_step": 68462, "epoch": 1630} {"train_loss": -5.948513031005859, "global_step": 68463, "epoch": 1630} {"train_loss": -5.996787071228027, "global_step": 68464, "epoch": 1630} {"train_loss": -6.001794815063477, "global_step": 68465, "epoch": 1630} {"train_loss": -6.110520362854004, "global_step": 68466, "epoch": 1630} {"train_loss": -5.916645050048828, "global_step": 68467, "epoch": 1630} {"train_loss": -5.9115142822265625, "global_step": 68468, "epoch": 1630} {"train_loss": -6.031491279602051, "global_step": 68469, "epoch": 1630} {"train_loss": -5.9790215492248535, "global_step": 68470, "epoch": 1630} {"train_loss": -5.981417179107666, "global_step": 68471, "epoch": 1630} {"train_loss": -6.015774726867676, "global_step": 68472, "epoch": 1630} {"train_loss": -6.070743083953857, "global_step": 68473, "epoch": 1630} {"train_loss": -5.9974260330200195, "global_step": 68474, "epoch": 1630} {"train_loss": -6.101078987121582, "global_step": 68475, "epoch": 1630} {"train_loss": -5.888736724853516, "global_step": 68476, "epoch": 1630} {"train_loss": -6.047938823699951, "global_step": 68477, "epoch": 1630} {"train_loss": -6.0280351638793945, "global_step": 68478, "epoch": 1630} {"train_loss": -6.041284084320068, "global_step": 68479, "epoch": 1630} {"train_loss": -5.946712017059326, "global_step": 68480, "epoch": 1630} {"train_loss": -6.023054122924805, "global_step": 68481, "epoch": 1630} {"train_loss": -6.009151935577393, "global_step": 68482, "epoch": 1630} {"train_loss": -6.06685733795166, "global_step": 68483, "epoch": 1630} {"train_loss": -5.964210510253906, "global_step": 68484, "epoch": 1630} {"train_loss": -5.935988426208496, "global_step": 68485, "epoch": 1630} {"train_loss": -5.995071887969971, "global_step": 68486, "epoch": 1630} {"train_loss": -5.973333358764648, "global_step": 68487, "epoch": 1630} {"train_loss": -6.0174102783203125, "global_step": 68488, "epoch": 1630} {"train_loss": -5.942914962768555, "global_step": 68489, "epoch": 1630} {"train_loss": -5.9405517578125, "global_step": 68490, "epoch": 1630} {"train_loss": -6.005196571350098, "global_step": 68491, "epoch": 1630} {"train_loss": -6.1024298667907715, "global_step": 68492, "epoch": 1630} {"train_loss": -5.936285495758057, "global_step": 68493, "epoch": 1630} {"train_loss": -5.945643424987793, "global_step": 68494, "epoch": 1630} {"train_loss": -6.043422698974609, "global_step": 68495, "epoch": 1630} {"train_loss": -5.789078712463379, "global_step": 68496, "epoch": 1630} {"train_loss": -6.008631706237793, "global_step": 68497, "epoch": 1630} {"train_loss": -5.915281295776367, "global_step": 68498, "epoch": 1630} {"train_loss": -6.07667350769043, "global_step": 68499, "epoch": 1630} {"train_loss": -5.927056312561035, "global_step": 68500, "epoch": 1630} {"train_loss": -5.992886304855347, "global_step": 68501, "epoch": 1630, "val_loss": 74858.046875} {"train_loss": -5.914978981018066, "global_step": 68502, "epoch": 1631} {"train_loss": -5.896989822387695, "global_step": 68503, "epoch": 1631} {"train_loss": -5.920322418212891, "global_step": 68504, "epoch": 1631} {"train_loss": -5.961782932281494, "global_step": 68505, "epoch": 1631} {"train_loss": -5.9125261306762695, "global_step": 68506, "epoch": 1631} {"train_loss": -5.927715301513672, "global_step": 68507, "epoch": 1631} {"train_loss": -5.926209449768066, "global_step": 68508, "epoch": 1631} {"train_loss": -5.939638137817383, "global_step": 68509, "epoch": 1631} {"train_loss": -6.07326078414917, "global_step": 68510, "epoch": 1631} {"train_loss": -6.024427890777588, "global_step": 68511, "epoch": 1631} {"train_loss": -6.00015926361084, "global_step": 68512, "epoch": 1631} {"train_loss": -6.139204978942871, "global_step": 68513, "epoch": 1631} {"train_loss": -5.903127670288086, "global_step": 68514, "epoch": 1631} {"train_loss": -5.995928764343262, "global_step": 68515, "epoch": 1631} {"train_loss": -5.954228401184082, "global_step": 68516, "epoch": 1631} {"train_loss": -5.992922782897949, "global_step": 68517, "epoch": 1631} {"train_loss": -5.949239730834961, "global_step": 68518, "epoch": 1631} {"train_loss": -5.87833309173584, "global_step": 68519, "epoch": 1631} {"train_loss": -6.00160026550293, "global_step": 68520, "epoch": 1631} {"train_loss": -5.825169563293457, "global_step": 68521, "epoch": 1631} {"train_loss": -5.906942367553711, "global_step": 68522, "epoch": 1631} {"train_loss": -6.018610954284668, "global_step": 68523, "epoch": 1631} {"train_loss": -6.0119829177856445, "global_step": 68524, "epoch": 1631} {"train_loss": -5.980105400085449, "global_step": 68525, "epoch": 1631} {"train_loss": -5.982736587524414, "global_step": 68526, "epoch": 1631} {"train_loss": -5.978344917297363, "global_step": 68527, "epoch": 1631} {"train_loss": -5.964922904968262, "global_step": 68528, "epoch": 1631} {"train_loss": -6.064003944396973, "global_step": 68529, "epoch": 1631} {"train_loss": -5.998246669769287, "global_step": 68530, "epoch": 1631} {"train_loss": -5.865950584411621, "global_step": 68531, "epoch": 1631} {"train_loss": -6.0204925537109375, "global_step": 68532, "epoch": 1631} {"train_loss": -5.980341911315918, "global_step": 68533, "epoch": 1631} {"train_loss": -6.100034236907959, "global_step": 68534, "epoch": 1631} {"train_loss": -6.027382850646973, "global_step": 68535, "epoch": 1631} {"train_loss": -6.079804420471191, "global_step": 68536, "epoch": 1631} {"train_loss": -5.988747596740723, "global_step": 68537, "epoch": 1631} {"train_loss": -6.026029586791992, "global_step": 68538, "epoch": 1631} {"train_loss": -5.827911853790283, "global_step": 68539, "epoch": 1631} {"train_loss": -5.994850158691406, "global_step": 68540, "epoch": 1631} {"train_loss": -6.023125648498535, "global_step": 68541, "epoch": 1631} {"train_loss": -5.9150590896606445, "global_step": 68542, "epoch": 1631} {"train_loss": -5.973729337964739, "global_step": 68543, "epoch": 1631, "val_loss": 74482.0} {"train_loss": -6.0168776512146, "global_step": 68544, "epoch": 1632} {"train_loss": -5.86619758605957, "global_step": 68545, "epoch": 1632} {"train_loss": -6.000086307525635, "global_step": 68546, "epoch": 1632} {"train_loss": -5.881955623626709, "global_step": 68547, "epoch": 1632} {"train_loss": -6.031424522399902, "global_step": 68548, "epoch": 1632} {"train_loss": -5.90895938873291, "global_step": 68549, "epoch": 1632} {"train_loss": -5.933564186096191, "global_step": 68550, "epoch": 1632} {"train_loss": -6.080794334411621, "global_step": 68551, "epoch": 1632} {"train_loss": -5.843364238739014, "global_step": 68552, "epoch": 1632} {"train_loss": -5.945322036743164, "global_step": 68553, "epoch": 1632} {"train_loss": -5.857954502105713, "global_step": 68554, "epoch": 1632} {"train_loss": -6.031466960906982, "global_step": 68555, "epoch": 1632} {"train_loss": -6.050232410430908, "global_step": 68556, "epoch": 1632} {"train_loss": -5.939788818359375, "global_step": 68557, "epoch": 1632} {"train_loss": -5.93538761138916, "global_step": 68558, "epoch": 1632} {"train_loss": -5.901723861694336, "global_step": 68559, "epoch": 1632} {"train_loss": -5.9118452072143555, "global_step": 68560, "epoch": 1632} {"train_loss": -6.050011157989502, "global_step": 68561, "epoch": 1632} {"train_loss": -5.81014347076416, "global_step": 68562, "epoch": 1632} {"train_loss": -5.970491409301758, "global_step": 68563, "epoch": 1632} {"train_loss": -5.9621782302856445, "global_step": 68564, "epoch": 1632} {"train_loss": -5.980373382568359, "global_step": 68565, "epoch": 1632} {"train_loss": -6.080338001251221, "global_step": 68566, "epoch": 1632} {"train_loss": -5.947732925415039, "global_step": 68567, "epoch": 1632} {"train_loss": -6.056031227111816, "global_step": 68568, "epoch": 1632} {"train_loss": -5.947535991668701, "global_step": 68569, "epoch": 1632} {"train_loss": -6.063889503479004, "global_step": 68570, "epoch": 1632} {"train_loss": -6.001838207244873, "global_step": 68571, "epoch": 1632} {"train_loss": -6.036731719970703, "global_step": 68572, "epoch": 1632} {"train_loss": -5.964263439178467, "global_step": 68573, "epoch": 1632} {"train_loss": -6.068798065185547, "global_step": 68574, "epoch": 1632} {"train_loss": -5.9542083740234375, "global_step": 68575, "epoch": 1632} {"train_loss": -6.0560126304626465, "global_step": 68576, "epoch": 1632} {"train_loss": -6.0388641357421875, "global_step": 68577, "epoch": 1632} {"train_loss": -5.921123027801514, "global_step": 68578, "epoch": 1632} {"train_loss": -6.086493492126465, "global_step": 68579, "epoch": 1632} {"train_loss": -6.012280464172363, "global_step": 68580, "epoch": 1632} {"train_loss": -5.948879241943359, "global_step": 68581, "epoch": 1632} {"train_loss": -5.996819496154785, "global_step": 68582, "epoch": 1632} {"train_loss": -6.014896869659424, "global_step": 68583, "epoch": 1632} {"train_loss": -5.95513916015625, "global_step": 68584, "epoch": 1632} {"train_loss": -5.979960668654669, "global_step": 68585, "epoch": 1632, "val_loss": 74879.8984375} {"train_loss": -6.048242568969727, "global_step": 68586, "epoch": 1633} {"train_loss": -6.135753154754639, "global_step": 68587, "epoch": 1633} {"train_loss": -6.086755752563477, "global_step": 68588, "epoch": 1633} {"train_loss": -6.020381450653076, "global_step": 68589, "epoch": 1633} {"train_loss": -6.091133117675781, "global_step": 68590, "epoch": 1633} {"train_loss": -5.976337432861328, "global_step": 68591, "epoch": 1633} {"train_loss": -5.90148401260376, "global_step": 68592, "epoch": 1633} {"train_loss": -6.071732521057129, "global_step": 68593, "epoch": 1633} {"train_loss": -5.922029495239258, "global_step": 68594, "epoch": 1633} {"train_loss": -6.003981590270996, "global_step": 68595, "epoch": 1633} {"train_loss": -6.004590034484863, "global_step": 68596, "epoch": 1633} {"train_loss": -5.98798942565918, "global_step": 68597, "epoch": 1633} {"train_loss": -6.019298553466797, "global_step": 68598, "epoch": 1633} {"train_loss": -6.004545211791992, "global_step": 68599, "epoch": 1633} {"train_loss": -6.057063102722168, "global_step": 68600, "epoch": 1633} {"train_loss": -5.9293084144592285, "global_step": 68601, "epoch": 1633} {"train_loss": -6.036523342132568, "global_step": 68602, "epoch": 1633} {"train_loss": -5.958390235900879, "global_step": 68603, "epoch": 1633} {"train_loss": -6.002544403076172, "global_step": 68604, "epoch": 1633} {"train_loss": -6.114753723144531, "global_step": 68605, "epoch": 1633} {"train_loss": -5.97387170791626, "global_step": 68606, "epoch": 1633} {"train_loss": -6.071218490600586, "global_step": 68607, "epoch": 1633} {"train_loss": -6.025746822357178, "global_step": 68608, "epoch": 1633} {"train_loss": -5.995408535003662, "global_step": 68609, "epoch": 1633} {"train_loss": -6.031830787658691, "global_step": 68610, "epoch": 1633} {"train_loss": -6.056468963623047, "global_step": 68611, "epoch": 1633} {"train_loss": -6.029046535491943, "global_step": 68612, "epoch": 1633} {"train_loss": -5.967648029327393, "global_step": 68613, "epoch": 1633} {"train_loss": -6.0226030349731445, "global_step": 68614, "epoch": 1633} {"train_loss": -5.9693708419799805, "global_step": 68615, "epoch": 1633} {"train_loss": -5.982522010803223, "global_step": 68616, "epoch": 1633} {"train_loss": -6.013963222503662, "global_step": 68617, "epoch": 1633} {"train_loss": -5.950766086578369, "global_step": 68618, "epoch": 1633} {"train_loss": -6.034067153930664, "global_step": 68619, "epoch": 1633} {"train_loss": -6.0167341232299805, "global_step": 68620, "epoch": 1633} {"train_loss": -6.0030059814453125, "global_step": 68621, "epoch": 1633} {"train_loss": -5.985092639923096, "global_step": 68622, "epoch": 1633} {"train_loss": -6.081590175628662, "global_step": 68623, "epoch": 1633} {"train_loss": -6.015926361083984, "global_step": 68624, "epoch": 1633} {"train_loss": -5.999427795410156, "global_step": 68625, "epoch": 1633} {"train_loss": -6.04115104675293, "global_step": 68626, "epoch": 1633} {"train_loss": -6.013606888907296, "global_step": 68627, "epoch": 1633, "val_loss": 74624.46875} {"train_loss": -6.100152015686035, "global_step": 68628, "epoch": 1634} {"train_loss": -6.070890426635742, "global_step": 68629, "epoch": 1634} {"train_loss": -5.916896820068359, "global_step": 68630, "epoch": 1634} {"train_loss": -6.182901859283447, "global_step": 68631, "epoch": 1634} {"train_loss": -6.016244411468506, "global_step": 68632, "epoch": 1634} {"train_loss": -5.904927730560303, "global_step": 68633, "epoch": 1634} {"train_loss": -6.088279724121094, "global_step": 68634, "epoch": 1634} {"train_loss": -5.911373138427734, "global_step": 68635, "epoch": 1634} {"train_loss": -6.011767864227295, "global_step": 68636, "epoch": 1634} {"train_loss": -5.941872596740723, "global_step": 68637, "epoch": 1634} {"train_loss": -6.052913665771484, "global_step": 68638, "epoch": 1634} {"train_loss": -5.9964375495910645, "global_step": 68639, "epoch": 1634} {"train_loss": -6.028768539428711, "global_step": 68640, "epoch": 1634} {"train_loss": -6.069943428039551, "global_step": 68641, "epoch": 1634} {"train_loss": -6.066439628601074, "global_step": 68642, "epoch": 1634} {"train_loss": -5.9684600830078125, "global_step": 68643, "epoch": 1634} {"train_loss": -6.037379264831543, "global_step": 68644, "epoch": 1634} {"train_loss": -5.951171398162842, "global_step": 68645, "epoch": 1634} {"train_loss": -6.058185577392578, "global_step": 68646, "epoch": 1634} {"train_loss": -6.134793281555176, "global_step": 68647, "epoch": 1634} {"train_loss": -6.067872047424316, "global_step": 68648, "epoch": 1634} {"train_loss": -5.9337358474731445, "global_step": 68649, "epoch": 1634} {"train_loss": -6.099002838134766, "global_step": 68650, "epoch": 1634} {"train_loss": -6.018316745758057, "global_step": 68651, "epoch": 1634} {"train_loss": -5.971318244934082, "global_step": 68652, "epoch": 1634} {"train_loss": -5.931748390197754, "global_step": 68653, "epoch": 1634} {"train_loss": -5.977054119110107, "global_step": 68654, "epoch": 1634} {"train_loss": -5.995815753936768, "global_step": 68655, "epoch": 1634} {"train_loss": -5.9375410079956055, "global_step": 68656, "epoch": 1634} {"train_loss": -6.03196907043457, "global_step": 68657, "epoch": 1634} {"train_loss": -6.095353603363037, "global_step": 68658, "epoch": 1634} {"train_loss": -5.965924263000488, "global_step": 68659, "epoch": 1634} {"train_loss": -6.062581539154053, "global_step": 68660, "epoch": 1634} {"train_loss": -6.037232875823975, "global_step": 68661, "epoch": 1634} {"train_loss": -5.972532749176025, "global_step": 68662, "epoch": 1634} {"train_loss": -6.0447821617126465, "global_step": 68663, "epoch": 1634} {"train_loss": -6.021745681762695, "global_step": 68664, "epoch": 1634} {"train_loss": -6.033197402954102, "global_step": 68665, "epoch": 1634} {"train_loss": -6.015800476074219, "global_step": 68666, "epoch": 1634} {"train_loss": -5.870126724243164, "global_step": 68667, "epoch": 1634} {"train_loss": -5.949714660644531, "global_step": 68668, "epoch": 1634} {"train_loss": -6.012553601037888, "global_step": 68669, "epoch": 1634, "val_loss": 74860.875} {"train_loss": -5.909472465515137, "global_step": 68670, "epoch": 1635} {"train_loss": -6.019786834716797, "global_step": 68671, "epoch": 1635} {"train_loss": -6.034451484680176, "global_step": 68672, "epoch": 1635} {"train_loss": -5.936149597167969, "global_step": 68673, "epoch": 1635} {"train_loss": -6.072831153869629, "global_step": 68674, "epoch": 1635} {"train_loss": -6.0400390625, "global_step": 68675, "epoch": 1635} {"train_loss": -6.0275373458862305, "global_step": 68676, "epoch": 1635} {"train_loss": -6.038260459899902, "global_step": 68677, "epoch": 1635} {"train_loss": -6.008678436279297, "global_step": 68678, "epoch": 1635} {"train_loss": -5.990496635437012, "global_step": 68679, "epoch": 1635} {"train_loss": -5.973203659057617, "global_step": 68680, "epoch": 1635} {"train_loss": -5.948821067810059, "global_step": 68681, "epoch": 1635} {"train_loss": -6.1046648025512695, "global_step": 68682, "epoch": 1635} {"train_loss": -5.994925498962402, "global_step": 68683, "epoch": 1635} {"train_loss": -5.965027809143066, "global_step": 68684, "epoch": 1635} {"train_loss": -6.0472941398620605, "global_step": 68685, "epoch": 1635} {"train_loss": -6.033490180969238, "global_step": 68686, "epoch": 1635} {"train_loss": -6.025564670562744, "global_step": 68687, "epoch": 1635} {"train_loss": -6.0943169593811035, "global_step": 68688, "epoch": 1635} {"train_loss": -6.032617092132568, "global_step": 68689, "epoch": 1635} {"train_loss": -5.9156694412231445, "global_step": 68690, "epoch": 1635} {"train_loss": -6.09175968170166, "global_step": 68691, "epoch": 1635} {"train_loss": -6.078668594360352, "global_step": 68692, "epoch": 1635} {"train_loss": -5.939913749694824, "global_step": 68693, "epoch": 1635} {"train_loss": -5.890913009643555, "global_step": 68694, "epoch": 1635} {"train_loss": -5.968216896057129, "global_step": 68695, "epoch": 1635} {"train_loss": -6.0729780197143555, "global_step": 68696, "epoch": 1635} {"train_loss": -5.996745586395264, "global_step": 68697, "epoch": 1635} {"train_loss": -5.968839645385742, "global_step": 68698, "epoch": 1635} {"train_loss": -5.9326887130737305, "global_step": 68699, "epoch": 1635} {"train_loss": -5.952801704406738, "global_step": 68700, "epoch": 1635} {"train_loss": -5.994171619415283, "global_step": 68701, "epoch": 1635} {"train_loss": -5.9378767013549805, "global_step": 68702, "epoch": 1635} {"train_loss": -6.008844375610352, "global_step": 68703, "epoch": 1635} {"train_loss": -6.111569404602051, "global_step": 68704, "epoch": 1635} {"train_loss": -5.903133392333984, "global_step": 68705, "epoch": 1635} {"train_loss": -6.045902252197266, "global_step": 68706, "epoch": 1635} {"train_loss": -6.187026023864746, "global_step": 68707, "epoch": 1635} {"train_loss": -5.981165885925293, "global_step": 68708, "epoch": 1635} {"train_loss": -5.925599098205566, "global_step": 68709, "epoch": 1635} {"train_loss": -5.931931018829346, "global_step": 68710, "epoch": 1635} {"train_loss": -6.003705478849865, "global_step": 68711, "epoch": 1635, "val_loss": 74667.6015625} {"train_loss": -6.069266319274902, "global_step": 68712, "epoch": 1636} {"train_loss": -5.937352180480957, "global_step": 68713, "epoch": 1636} {"train_loss": -5.993980407714844, "global_step": 68714, "epoch": 1636} {"train_loss": -5.895389556884766, "global_step": 68715, "epoch": 1636} {"train_loss": -5.795034408569336, "global_step": 68716, "epoch": 1636} {"train_loss": -5.903106689453125, "global_step": 68717, "epoch": 1636} {"train_loss": -5.949890613555908, "global_step": 68718, "epoch": 1636} {"train_loss": -5.898189067840576, "global_step": 68719, "epoch": 1636} {"train_loss": -5.942984580993652, "global_step": 68720, "epoch": 1636} {"train_loss": -5.994259834289551, "global_step": 68721, "epoch": 1636} {"train_loss": -5.8762006759643555, "global_step": 68722, "epoch": 1636} {"train_loss": -5.860162734985352, "global_step": 68723, "epoch": 1636} {"train_loss": -5.93180513381958, "global_step": 68724, "epoch": 1636} {"train_loss": -5.867253303527832, "global_step": 68725, "epoch": 1636} {"train_loss": -6.005396842956543, "global_step": 68726, "epoch": 1636} {"train_loss": -6.032795429229736, "global_step": 68727, "epoch": 1636} {"train_loss": -5.982481002807617, "global_step": 68728, "epoch": 1636} {"train_loss": -6.046195030212402, "global_step": 68729, "epoch": 1636} {"train_loss": -6.022919178009033, "global_step": 68730, "epoch": 1636} {"train_loss": -5.966330528259277, "global_step": 68731, "epoch": 1636} {"train_loss": -5.985602855682373, "global_step": 68732, "epoch": 1636} {"train_loss": -6.059666633605957, "global_step": 68733, "epoch": 1636} {"train_loss": -5.981757164001465, "global_step": 68734, "epoch": 1636} {"train_loss": -6.049000263214111, "global_step": 68735, "epoch": 1636} {"train_loss": -6.053898811340332, "global_step": 68736, "epoch": 1636} {"train_loss": -6.052055358886719, "global_step": 68737, "epoch": 1636} {"train_loss": -6.0197062492370605, "global_step": 68738, "epoch": 1636} {"train_loss": -6.137740612030029, "global_step": 68739, "epoch": 1636} {"train_loss": -6.000761985778809, "global_step": 68740, "epoch": 1636} {"train_loss": -5.971391677856445, "global_step": 68741, "epoch": 1636} {"train_loss": -6.024974346160889, "global_step": 68742, "epoch": 1636} {"train_loss": -6.068984031677246, "global_step": 68743, "epoch": 1636} {"train_loss": -5.949799537658691, "global_step": 68744, "epoch": 1636} {"train_loss": -5.920196056365967, "global_step": 68745, "epoch": 1636} {"train_loss": -5.93709659576416, "global_step": 68746, "epoch": 1636} {"train_loss": -6.003020286560059, "global_step": 68747, "epoch": 1636} {"train_loss": -6.028204917907715, "global_step": 68748, "epoch": 1636} {"train_loss": -6.03718376159668, "global_step": 68749, "epoch": 1636} {"train_loss": -6.0304484367370605, "global_step": 68750, "epoch": 1636} {"train_loss": -6.023994445800781, "global_step": 68751, "epoch": 1636} {"train_loss": -5.992290496826172, "global_step": 68752, "epoch": 1636} {"train_loss": -5.984546457018171, "global_step": 68753, "epoch": 1636, "val_loss": 74514.0234375} {"train_loss": -6.019826889038086, "global_step": 68754, "epoch": 1637} {"train_loss": -6.032886981964111, "global_step": 68755, "epoch": 1637} {"train_loss": -6.108578205108643, "global_step": 68756, "epoch": 1637} {"train_loss": -6.041105270385742, "global_step": 68757, "epoch": 1637} {"train_loss": -6.053576469421387, "global_step": 68758, "epoch": 1637} {"train_loss": -6.064735412597656, "global_step": 68759, "epoch": 1637} {"train_loss": -6.027963161468506, "global_step": 68760, "epoch": 1637} {"train_loss": -6.059415817260742, "global_step": 68761, "epoch": 1637} {"train_loss": -6.045260906219482, "global_step": 68762, "epoch": 1637} {"train_loss": -6.094450950622559, "global_step": 68763, "epoch": 1637} {"train_loss": -6.024808883666992, "global_step": 68764, "epoch": 1637} {"train_loss": -5.894433498382568, "global_step": 68765, "epoch": 1637} {"train_loss": -6.085411071777344, "global_step": 68766, "epoch": 1637} {"train_loss": -5.969271659851074, "global_step": 68767, "epoch": 1637} {"train_loss": -5.977601528167725, "global_step": 68768, "epoch": 1637} {"train_loss": -6.106236934661865, "global_step": 68769, "epoch": 1637} {"train_loss": -5.909627914428711, "global_step": 68770, "epoch": 1637} {"train_loss": -5.97173547744751, "global_step": 68771, "epoch": 1637} {"train_loss": -5.994732856750488, "global_step": 68772, "epoch": 1637} {"train_loss": -5.942088603973389, "global_step": 68773, "epoch": 1637} {"train_loss": -5.838700294494629, "global_step": 68774, "epoch": 1637} {"train_loss": -5.95327091217041, "global_step": 68775, "epoch": 1637} {"train_loss": -5.837439060211182, "global_step": 68776, "epoch": 1637} {"train_loss": -5.98799991607666, "global_step": 68777, "epoch": 1637} {"train_loss": -5.897939682006836, "global_step": 68778, "epoch": 1637} {"train_loss": -5.872238636016846, "global_step": 68779, "epoch": 1637} {"train_loss": -6.020277976989746, "global_step": 68780, "epoch": 1637} {"train_loss": -5.890031814575195, "global_step": 68781, "epoch": 1637} {"train_loss": -5.911862373352051, "global_step": 68782, "epoch": 1637} {"train_loss": -5.968985080718994, "global_step": 68783, "epoch": 1637} {"train_loss": -5.76820182800293, "global_step": 68784, "epoch": 1637} {"train_loss": -5.831022262573242, "global_step": 68785, "epoch": 1637} {"train_loss": -6.025486946105957, "global_step": 68786, "epoch": 1637} {"train_loss": -5.9858527183532715, "global_step": 68787, "epoch": 1637} {"train_loss": -5.778603553771973, "global_step": 68788, "epoch": 1637} {"train_loss": -5.856939792633057, "global_step": 68789, "epoch": 1637} {"train_loss": -5.939826965332031, "global_step": 68790, "epoch": 1637} {"train_loss": -5.921134948730469, "global_step": 68791, "epoch": 1637} {"train_loss": -5.847489356994629, "global_step": 68792, "epoch": 1637} {"train_loss": -6.010123252868652, "global_step": 68793, "epoch": 1637} {"train_loss": -5.835445404052734, "global_step": 68794, "epoch": 1637} {"train_loss": -5.959768465587071, "global_step": 68795, "epoch": 1637, "val_loss": 74894.7890625} {"train_loss": -5.7494282722473145, "global_step": 68796, "epoch": 1638} {"train_loss": -5.99855899810791, "global_step": 68797, "epoch": 1638} {"train_loss": -5.89456844329834, "global_step": 68798, "epoch": 1638} {"train_loss": -5.992585182189941, "global_step": 68799, "epoch": 1638} {"train_loss": -5.992609977722168, "global_step": 68800, "epoch": 1638} {"train_loss": -6.0298051834106445, "global_step": 68801, "epoch": 1638} {"train_loss": -5.978806018829346, "global_step": 68802, "epoch": 1638} {"train_loss": -6.057943344116211, "global_step": 68803, "epoch": 1638} {"train_loss": -6.009769439697266, "global_step": 68804, "epoch": 1638} {"train_loss": -5.97750997543335, "global_step": 68805, "epoch": 1638} {"train_loss": -6.082906246185303, "global_step": 68806, "epoch": 1638} {"train_loss": -6.047698020935059, "global_step": 68807, "epoch": 1638} {"train_loss": -5.9888129234313965, "global_step": 68808, "epoch": 1638} {"train_loss": -5.995461463928223, "global_step": 68809, "epoch": 1638} {"train_loss": -6.070910453796387, "global_step": 68810, "epoch": 1638} {"train_loss": -5.989652633666992, "global_step": 68811, "epoch": 1638} {"train_loss": -5.997876167297363, "global_step": 68812, "epoch": 1638} {"train_loss": -5.973752975463867, "global_step": 68813, "epoch": 1638} {"train_loss": -5.871632099151611, "global_step": 68814, "epoch": 1638} {"train_loss": -5.925198554992676, "global_step": 68815, "epoch": 1638} {"train_loss": -5.862401962280273, "global_step": 68816, "epoch": 1638} {"train_loss": -5.828169345855713, "global_step": 68817, "epoch": 1638} {"train_loss": -6.0282697677612305, "global_step": 68818, "epoch": 1638} {"train_loss": -6.053595066070557, "global_step": 68819, "epoch": 1638} {"train_loss": -5.955803871154785, "global_step": 68820, "epoch": 1638} {"train_loss": -6.115804672241211, "global_step": 68821, "epoch": 1638} {"train_loss": -5.941493034362793, "global_step": 68822, "epoch": 1638} {"train_loss": -5.919577598571777, "global_step": 68823, "epoch": 1638} {"train_loss": -6.010705947875977, "global_step": 68824, "epoch": 1638} {"train_loss": -6.006712913513184, "global_step": 68825, "epoch": 1638} {"train_loss": -6.064679145812988, "global_step": 68826, "epoch": 1638} {"train_loss": -5.767974853515625, "global_step": 68827, "epoch": 1638} {"train_loss": -6.155759811401367, "global_step": 68828, "epoch": 1638} {"train_loss": -6.0398478507995605, "global_step": 68829, "epoch": 1638} {"train_loss": -5.853708267211914, "global_step": 68830, "epoch": 1638} {"train_loss": -6.000058174133301, "global_step": 68831, "epoch": 1638} {"train_loss": -5.896266460418701, "global_step": 68832, "epoch": 1638} {"train_loss": -5.999508380889893, "global_step": 68833, "epoch": 1638} {"train_loss": -6.013998508453369, "global_step": 68834, "epoch": 1638} {"train_loss": -5.858955383300781, "global_step": 68835, "epoch": 1638} {"train_loss": -5.975618839263916, "global_step": 68836, "epoch": 1638} {"train_loss": -5.976511977967762, "global_step": 68837, "epoch": 1638, "val_loss": 74895.1171875} {"train_loss": -5.940290927886963, "global_step": 68838, "epoch": 1639} {"train_loss": -6.092182159423828, "global_step": 68839, "epoch": 1639} {"train_loss": -6.001062393188477, "global_step": 68840, "epoch": 1639} {"train_loss": -6.031493186950684, "global_step": 68841, "epoch": 1639} {"train_loss": -6.119346618652344, "global_step": 68842, "epoch": 1639} {"train_loss": -6.012913227081299, "global_step": 68843, "epoch": 1639} {"train_loss": -5.915621757507324, "global_step": 68844, "epoch": 1639} {"train_loss": -6.026403427124023, "global_step": 68845, "epoch": 1639} {"train_loss": -5.952518463134766, "global_step": 68846, "epoch": 1639} {"train_loss": -6.058428764343262, "global_step": 68847, "epoch": 1639} {"train_loss": -6.128745079040527, "global_step": 68848, "epoch": 1639} {"train_loss": -5.963557243347168, "global_step": 68849, "epoch": 1639} {"train_loss": -6.032404899597168, "global_step": 68850, "epoch": 1639} {"train_loss": -5.966259002685547, "global_step": 68851, "epoch": 1639} {"train_loss": -6.128790378570557, "global_step": 68852, "epoch": 1639} {"train_loss": -6.018322467803955, "global_step": 68853, "epoch": 1639} {"train_loss": -6.126272201538086, "global_step": 68854, "epoch": 1639} {"train_loss": -5.987469673156738, "global_step": 68855, "epoch": 1639} {"train_loss": -6.107614517211914, "global_step": 68856, "epoch": 1639} {"train_loss": -5.993757247924805, "global_step": 68857, "epoch": 1639} {"train_loss": -6.014403820037842, "global_step": 68858, "epoch": 1639} {"train_loss": -6.075810432434082, "global_step": 68859, "epoch": 1639} {"train_loss": -6.035243988037109, "global_step": 68860, "epoch": 1639} {"train_loss": -6.102317810058594, "global_step": 68861, "epoch": 1639} {"train_loss": -6.036491394042969, "global_step": 68862, "epoch": 1639} {"train_loss": -6.070479393005371, "global_step": 68863, "epoch": 1639} {"train_loss": -5.965511798858643, "global_step": 68864, "epoch": 1639} {"train_loss": -6.033326148986816, "global_step": 68865, "epoch": 1639} {"train_loss": -6.041464805603027, "global_step": 68866, "epoch": 1639} {"train_loss": -5.903871536254883, "global_step": 68867, "epoch": 1639} {"train_loss": -5.953333377838135, "global_step": 68868, "epoch": 1639} {"train_loss": -5.9912238121032715, "global_step": 68869, "epoch": 1639} {"train_loss": -5.90914249420166, "global_step": 68870, "epoch": 1639} {"train_loss": -5.922264575958252, "global_step": 68871, "epoch": 1639} {"train_loss": -5.961175918579102, "global_step": 68872, "epoch": 1639} {"train_loss": -6.0440778732299805, "global_step": 68873, "epoch": 1639} {"train_loss": -5.904509544372559, "global_step": 68874, "epoch": 1639} {"train_loss": -6.062630653381348, "global_step": 68875, "epoch": 1639} {"train_loss": -6.09063196182251, "global_step": 68876, "epoch": 1639} {"train_loss": -6.002320766448975, "global_step": 68877, "epoch": 1639} {"train_loss": -5.9031291007995605, "global_step": 68878, "epoch": 1639} {"train_loss": -6.015321379616147, "global_step": 68879, "epoch": 1639, "val_loss": 74617.3125} {"train_loss": -6.019909381866455, "global_step": 68880, "epoch": 1640} {"train_loss": -5.979191303253174, "global_step": 68881, "epoch": 1640} {"train_loss": -6.12026309967041, "global_step": 68882, "epoch": 1640} {"train_loss": -6.007301330566406, "global_step": 68883, "epoch": 1640} {"train_loss": -5.831930637359619, "global_step": 68884, "epoch": 1640} {"train_loss": -6.005131721496582, "global_step": 68885, "epoch": 1640} {"train_loss": -6.0527448654174805, "global_step": 68886, "epoch": 1640} {"train_loss": -6.005870819091797, "global_step": 68887, "epoch": 1640} {"train_loss": -5.974852085113525, "global_step": 68888, "epoch": 1640} {"train_loss": -6.024965286254883, "global_step": 68889, "epoch": 1640} {"train_loss": -5.919785499572754, "global_step": 68890, "epoch": 1640} {"train_loss": -5.93502950668335, "global_step": 68891, "epoch": 1640} {"train_loss": -5.908198833465576, "global_step": 68892, "epoch": 1640} {"train_loss": -5.953932762145996, "global_step": 68893, "epoch": 1640} {"train_loss": -6.059743404388428, "global_step": 68894, "epoch": 1640} {"train_loss": -5.987128257751465, "global_step": 68895, "epoch": 1640} {"train_loss": -6.055411338806152, "global_step": 68896, "epoch": 1640} {"train_loss": -5.901881217956543, "global_step": 68897, "epoch": 1640} {"train_loss": -6.069841384887695, "global_step": 68898, "epoch": 1640} {"train_loss": -5.9612507820129395, "global_step": 68899, "epoch": 1640} {"train_loss": -6.005894660949707, "global_step": 68900, "epoch": 1640} {"train_loss": -5.997039318084717, "global_step": 68901, "epoch": 1640} {"train_loss": -6.005950450897217, "global_step": 68902, "epoch": 1640} {"train_loss": -5.996370315551758, "global_step": 68903, "epoch": 1640} {"train_loss": -5.931446075439453, "global_step": 68904, "epoch": 1640} {"train_loss": -5.934757232666016, "global_step": 68905, "epoch": 1640} {"train_loss": -6.02166223526001, "global_step": 68906, "epoch": 1640} {"train_loss": -5.972750663757324, "global_step": 68907, "epoch": 1640} {"train_loss": -6.0432915687561035, "global_step": 68908, "epoch": 1640} {"train_loss": -5.913961410522461, "global_step": 68909, "epoch": 1640} {"train_loss": -5.916954040527344, "global_step": 68910, "epoch": 1640} {"train_loss": -6.077407360076904, "global_step": 68911, "epoch": 1640} {"train_loss": -6.064584255218506, "global_step": 68912, "epoch": 1640} {"train_loss": -5.985365867614746, "global_step": 68913, "epoch": 1640} {"train_loss": -5.9436445236206055, "global_step": 68914, "epoch": 1640} {"train_loss": -6.070009231567383, "global_step": 68915, "epoch": 1640} {"train_loss": -5.9943342208862305, "global_step": 68916, "epoch": 1640} {"train_loss": -6.001001358032227, "global_step": 68917, "epoch": 1640} {"train_loss": -6.072945594787598, "global_step": 68918, "epoch": 1640} {"train_loss": -5.996865272521973, "global_step": 68919, "epoch": 1640} {"train_loss": -6.0017008781433105, "global_step": 68920, "epoch": 1640} {"train_loss": -5.995660520735241, "global_step": 68921, "epoch": 1640, "val_loss": 74428.65625} {"train_loss": -5.9449381828308105, "global_step": 68922, "epoch": 1641} {"train_loss": -6.004482746124268, "global_step": 68923, "epoch": 1641} {"train_loss": -5.9044036865234375, "global_step": 68924, "epoch": 1641} {"train_loss": -5.991261005401611, "global_step": 68925, "epoch": 1641} {"train_loss": -6.038203716278076, "global_step": 68926, "epoch": 1641} {"train_loss": -6.0109171867370605, "global_step": 68927, "epoch": 1641} {"train_loss": -6.008602619171143, "global_step": 68928, "epoch": 1641} {"train_loss": -6.010058879852295, "global_step": 68929, "epoch": 1641} {"train_loss": -5.903470516204834, "global_step": 68930, "epoch": 1641} {"train_loss": -6.011867523193359, "global_step": 68931, "epoch": 1641} {"train_loss": -6.097472190856934, "global_step": 68932, "epoch": 1641} {"train_loss": -6.009211540222168, "global_step": 68933, "epoch": 1641} {"train_loss": -6.148777484893799, "global_step": 68934, "epoch": 1641} {"train_loss": -6.073833465576172, "global_step": 68935, "epoch": 1641} {"train_loss": -5.931081771850586, "global_step": 68936, "epoch": 1641} {"train_loss": -5.990065574645996, "global_step": 68937, "epoch": 1641} {"train_loss": -6.0274271965026855, "global_step": 68938, "epoch": 1641} {"train_loss": -5.918718338012695, "global_step": 68939, "epoch": 1641} {"train_loss": -5.949552536010742, "global_step": 68940, "epoch": 1641} {"train_loss": -5.953024864196777, "global_step": 68941, "epoch": 1641} {"train_loss": -6.033383846282959, "global_step": 68942, "epoch": 1641} {"train_loss": -5.9921064376831055, "global_step": 68943, "epoch": 1641} {"train_loss": -5.8046770095825195, "global_step": 68944, "epoch": 1641} {"train_loss": -5.929520606994629, "global_step": 68945, "epoch": 1641} {"train_loss": -6.0026044845581055, "global_step": 68946, "epoch": 1641} {"train_loss": -6.084229469299316, "global_step": 68947, "epoch": 1641} {"train_loss": -6.063078880310059, "global_step": 68948, "epoch": 1641} {"train_loss": -6.112110614776611, "global_step": 68949, "epoch": 1641} {"train_loss": -6.05837345123291, "global_step": 68950, "epoch": 1641} {"train_loss": -6.070932388305664, "global_step": 68951, "epoch": 1641} {"train_loss": -6.1119465827941895, "global_step": 68952, "epoch": 1641} {"train_loss": -6.009773254394531, "global_step": 68953, "epoch": 1641} {"train_loss": -6.013120651245117, "global_step": 68954, "epoch": 1641} {"train_loss": -6.129047393798828, "global_step": 68955, "epoch": 1641} {"train_loss": -6.086773872375488, "global_step": 68956, "epoch": 1641} {"train_loss": -6.005073547363281, "global_step": 68957, "epoch": 1641} {"train_loss": -6.090460300445557, "global_step": 68958, "epoch": 1641} {"train_loss": -5.9553704261779785, "global_step": 68959, "epoch": 1641} {"train_loss": -5.975568771362305, "global_step": 68960, "epoch": 1641} {"train_loss": -6.027071952819824, "global_step": 68961, "epoch": 1641} {"train_loss": -6.028207778930664, "global_step": 68962, "epoch": 1641} {"train_loss": -6.011837380273001, "global_step": 68963, "epoch": 1641, "val_loss": 74781.9375} {"train_loss": -6.0901994705200195, "global_step": 68964, "epoch": 1642} {"train_loss": -5.911776542663574, "global_step": 68965, "epoch": 1642} {"train_loss": -5.910532474517822, "global_step": 68966, "epoch": 1642} {"train_loss": -6.119080543518066, "global_step": 68967, "epoch": 1642} {"train_loss": -5.981048583984375, "global_step": 68968, "epoch": 1642} {"train_loss": -6.088498115539551, "global_step": 68969, "epoch": 1642} {"train_loss": -5.978717803955078, "global_step": 68970, "epoch": 1642} {"train_loss": -5.992142677307129, "global_step": 68971, "epoch": 1642} {"train_loss": -6.066616058349609, "global_step": 68972, "epoch": 1642} {"train_loss": -6.058483123779297, "global_step": 68973, "epoch": 1642} {"train_loss": -6.129135608673096, "global_step": 68974, "epoch": 1642} {"train_loss": -5.986264705657959, "global_step": 68975, "epoch": 1642} {"train_loss": -5.974274635314941, "global_step": 68976, "epoch": 1642} {"train_loss": -6.04618501663208, "global_step": 68977, "epoch": 1642} {"train_loss": -6.022675514221191, "global_step": 68978, "epoch": 1642} {"train_loss": -5.98038387298584, "global_step": 68979, "epoch": 1642} {"train_loss": -6.093706130981445, "global_step": 68980, "epoch": 1642} {"train_loss": -6.048015594482422, "global_step": 68981, "epoch": 1642} {"train_loss": -6.0076189041137695, "global_step": 68982, "epoch": 1642} {"train_loss": -6.013888359069824, "global_step": 68983, "epoch": 1642} {"train_loss": -5.991283416748047, "global_step": 68984, "epoch": 1642} {"train_loss": -5.899623870849609, "global_step": 68985, "epoch": 1642} {"train_loss": -5.880288124084473, "global_step": 68986, "epoch": 1642} {"train_loss": -6.009392738342285, "global_step": 68987, "epoch": 1642} {"train_loss": -5.968149662017822, "global_step": 68988, "epoch": 1642} {"train_loss": -6.029253959655762, "global_step": 68989, "epoch": 1642} {"train_loss": -6.087780952453613, "global_step": 68990, "epoch": 1642} {"train_loss": -5.97744083404541, "global_step": 68991, "epoch": 1642} {"train_loss": -6.044699668884277, "global_step": 68992, "epoch": 1642} {"train_loss": -6.0044050216674805, "global_step": 68993, "epoch": 1642} {"train_loss": -6.0376482009887695, "global_step": 68994, "epoch": 1642} {"train_loss": -6.049630165100098, "global_step": 68995, "epoch": 1642} {"train_loss": -5.964670181274414, "global_step": 68996, "epoch": 1642} {"train_loss": -6.030029296875, "global_step": 68997, "epoch": 1642} {"train_loss": -5.928622722625732, "global_step": 68998, "epoch": 1642} {"train_loss": -5.890553951263428, "global_step": 68999, "epoch": 1642} {"train_loss": -5.981830596923828, "global_step": 69000, "epoch": 1642} {"train_loss": -5.991072654724121, "global_step": 69001, "epoch": 1642} {"train_loss": -5.937962532043457, "global_step": 69002, "epoch": 1642} {"train_loss": -6.0269622802734375, "global_step": 69003, "epoch": 1642} {"train_loss": -6.004375457763672, "global_step": 69004, "epoch": 1642} {"train_loss": -6.008328153973534, "global_step": 69005, "epoch": 1642, "val_loss": 74743.078125} {"train_loss": -6.07857084274292, "global_step": 69006, "epoch": 1643} {"train_loss": -6.0347418785095215, "global_step": 69007, "epoch": 1643} {"train_loss": -6.236859321594238, "global_step": 69008, "epoch": 1643} {"train_loss": -6.0355048179626465, "global_step": 69009, "epoch": 1643} {"train_loss": -6.0571699142456055, "global_step": 69010, "epoch": 1643} {"train_loss": -6.047287940979004, "global_step": 69011, "epoch": 1643} {"train_loss": -5.937859535217285, "global_step": 69012, "epoch": 1643} {"train_loss": -5.909390449523926, "global_step": 69013, "epoch": 1643} {"train_loss": -6.019781589508057, "global_step": 69014, "epoch": 1643} {"train_loss": -6.018482208251953, "global_step": 69015, "epoch": 1643} {"train_loss": -6.0267791748046875, "global_step": 69016, "epoch": 1643} {"train_loss": -6.034451961517334, "global_step": 69017, "epoch": 1643} {"train_loss": -5.970654487609863, "global_step": 69018, "epoch": 1643} {"train_loss": -5.962921619415283, "global_step": 69019, "epoch": 1643} {"train_loss": -5.971747398376465, "global_step": 69020, "epoch": 1643} {"train_loss": -5.928066253662109, "global_step": 69021, "epoch": 1643} {"train_loss": -5.929843902587891, "global_step": 69022, "epoch": 1643} {"train_loss": -6.064009189605713, "global_step": 69023, "epoch": 1643} {"train_loss": -6.0741071701049805, "global_step": 69024, "epoch": 1643} {"train_loss": -5.9850664138793945, "global_step": 69025, "epoch": 1643} {"train_loss": -6.064815044403076, "global_step": 69026, "epoch": 1643} {"train_loss": -5.987295627593994, "global_step": 69027, "epoch": 1643} {"train_loss": -5.842523574829102, "global_step": 69028, "epoch": 1643} {"train_loss": -6.096668243408203, "global_step": 69029, "epoch": 1643} {"train_loss": -5.909346580505371, "global_step": 69030, "epoch": 1643} {"train_loss": -5.907524108886719, "global_step": 69031, "epoch": 1643} {"train_loss": -5.9464616775512695, "global_step": 69032, "epoch": 1643} {"train_loss": -6.053862571716309, "global_step": 69033, "epoch": 1643} {"train_loss": -5.96050500869751, "global_step": 69034, "epoch": 1643} {"train_loss": -5.993330955505371, "global_step": 69035, "epoch": 1643} {"train_loss": -6.022058963775635, "global_step": 69036, "epoch": 1643} {"train_loss": -6.079076290130615, "global_step": 69037, "epoch": 1643} {"train_loss": -6.039746284484863, "global_step": 69038, "epoch": 1643} {"train_loss": -6.039167881011963, "global_step": 69039, "epoch": 1643} {"train_loss": -5.938168525695801, "global_step": 69040, "epoch": 1643} {"train_loss": -5.973545074462891, "global_step": 69041, "epoch": 1643} {"train_loss": -6.076126575469971, "global_step": 69042, "epoch": 1643} {"train_loss": -5.911947727203369, "global_step": 69043, "epoch": 1643} {"train_loss": -6.001162528991699, "global_step": 69044, "epoch": 1643} {"train_loss": -6.04734992980957, "global_step": 69045, "epoch": 1643} {"train_loss": -5.941729545593262, "global_step": 69046, "epoch": 1643} {"train_loss": -6.004781564076741, "global_step": 69047, "epoch": 1643, "val_loss": 74767.125} {"train_loss": -6.082262992858887, "global_step": 69048, "epoch": 1644} {"train_loss": -6.048997402191162, "global_step": 69049, "epoch": 1644} {"train_loss": -6.090564727783203, "global_step": 69050, "epoch": 1644} {"train_loss": -6.042203903198242, "global_step": 69051, "epoch": 1644} {"train_loss": -6.038016319274902, "global_step": 69052, "epoch": 1644} {"train_loss": -5.978031158447266, "global_step": 69053, "epoch": 1644} {"train_loss": -5.925965785980225, "global_step": 69054, "epoch": 1644} {"train_loss": -5.958075523376465, "global_step": 69055, "epoch": 1644} {"train_loss": -6.008612632751465, "global_step": 69056, "epoch": 1644} {"train_loss": -6.041954040527344, "global_step": 69057, "epoch": 1644} {"train_loss": -6.011667251586914, "global_step": 69058, "epoch": 1644} {"train_loss": -6.087266445159912, "global_step": 69059, "epoch": 1644} {"train_loss": -6.018240451812744, "global_step": 69060, "epoch": 1644} {"train_loss": -6.034883499145508, "global_step": 69061, "epoch": 1644} {"train_loss": -6.015566349029541, "global_step": 69062, "epoch": 1644} {"train_loss": -6.004642486572266, "global_step": 69063, "epoch": 1644} {"train_loss": -6.058237552642822, "global_step": 69064, "epoch": 1644} {"train_loss": -5.945810317993164, "global_step": 69065, "epoch": 1644} {"train_loss": -6.077874660491943, "global_step": 69066, "epoch": 1644} {"train_loss": -6.097491264343262, "global_step": 69067, "epoch": 1644} {"train_loss": -6.106064796447754, "global_step": 69068, "epoch": 1644} {"train_loss": -6.028232574462891, "global_step": 69069, "epoch": 1644} {"train_loss": -5.88289213180542, "global_step": 69070, "epoch": 1644} {"train_loss": -5.932722091674805, "global_step": 69071, "epoch": 1644} {"train_loss": -6.086053371429443, "global_step": 69072, "epoch": 1644} {"train_loss": -5.975549221038818, "global_step": 69073, "epoch": 1644} {"train_loss": -5.8958740234375, "global_step": 69074, "epoch": 1644} {"train_loss": -6.042557716369629, "global_step": 69075, "epoch": 1644} {"train_loss": -5.829827308654785, "global_step": 69076, "epoch": 1644} {"train_loss": -5.967623710632324, "global_step": 69077, "epoch": 1644} {"train_loss": -6.0815582275390625, "global_step": 69078, "epoch": 1644} {"train_loss": -6.029426574707031, "global_step": 69079, "epoch": 1644} {"train_loss": -6.128791809082031, "global_step": 69080, "epoch": 1644} {"train_loss": -6.122629642486572, "global_step": 69081, "epoch": 1644} {"train_loss": -6.012602806091309, "global_step": 69082, "epoch": 1644} {"train_loss": -6.056232929229736, "global_step": 69083, "epoch": 1644} {"train_loss": -6.142909049987793, "global_step": 69084, "epoch": 1644} {"train_loss": -5.964951038360596, "global_step": 69085, "epoch": 1644} {"train_loss": -6.0627923011779785, "global_step": 69086, "epoch": 1644} {"train_loss": -6.112552642822266, "global_step": 69087, "epoch": 1644} {"train_loss": -6.096567153930664, "global_step": 69088, "epoch": 1644} {"train_loss": -6.028656028565907, "global_step": 69089, "epoch": 1644, "val_loss": 74669.765625} {"train_loss": -6.001384735107422, "global_step": 69090, "epoch": 1645} {"train_loss": -6.0758209228515625, "global_step": 69091, "epoch": 1645} {"train_loss": -5.958670616149902, "global_step": 69092, "epoch": 1645} {"train_loss": -6.074365139007568, "global_step": 69093, "epoch": 1645} {"train_loss": -6.0684661865234375, "global_step": 69094, "epoch": 1645} {"train_loss": -5.952193260192871, "global_step": 69095, "epoch": 1645} {"train_loss": -5.983811855316162, "global_step": 69096, "epoch": 1645} {"train_loss": -5.917612075805664, "global_step": 69097, "epoch": 1645} {"train_loss": -5.956460952758789, "global_step": 69098, "epoch": 1645} {"train_loss": -6.036552429199219, "global_step": 69099, "epoch": 1645} {"train_loss": -5.750432968139648, "global_step": 69100, "epoch": 1645} {"train_loss": -6.095380783081055, "global_step": 69101, "epoch": 1645} {"train_loss": -5.964244842529297, "global_step": 69102, "epoch": 1645} {"train_loss": -5.8464579582214355, "global_step": 69103, "epoch": 1645} {"train_loss": -5.978029727935791, "global_step": 69104, "epoch": 1645} {"train_loss": -5.924783229827881, "global_step": 69105, "epoch": 1645} {"train_loss": -5.897756099700928, "global_step": 69106, "epoch": 1645} {"train_loss": -5.9989519119262695, "global_step": 69107, "epoch": 1645} {"train_loss": -5.881863594055176, "global_step": 69108, "epoch": 1645} {"train_loss": -5.883382797241211, "global_step": 69109, "epoch": 1645} {"train_loss": -5.957365036010742, "global_step": 69110, "epoch": 1645} {"train_loss": -5.963215351104736, "global_step": 69111, "epoch": 1645} {"train_loss": -5.999293804168701, "global_step": 69112, "epoch": 1645} {"train_loss": -5.978629112243652, "global_step": 69113, "epoch": 1645} {"train_loss": -5.830413341522217, "global_step": 69114, "epoch": 1645} {"train_loss": -5.955784320831299, "global_step": 69115, "epoch": 1645} {"train_loss": -5.849340438842773, "global_step": 69116, "epoch": 1645} {"train_loss": -5.950704574584961, "global_step": 69117, "epoch": 1645} {"train_loss": -5.937628269195557, "global_step": 69118, "epoch": 1645} {"train_loss": -5.97268009185791, "global_step": 69119, "epoch": 1645} {"train_loss": -5.95913553237915, "global_step": 69120, "epoch": 1645} {"train_loss": -6.076458930969238, "global_step": 69121, "epoch": 1645} {"train_loss": -6.052494049072266, "global_step": 69122, "epoch": 1645} {"train_loss": -5.999938488006592, "global_step": 69123, "epoch": 1645} {"train_loss": -5.970100402832031, "global_step": 69124, "epoch": 1645} {"train_loss": -6.015406131744385, "global_step": 69125, "epoch": 1645} {"train_loss": -5.983524322509766, "global_step": 69126, "epoch": 1645} {"train_loss": -6.011233329772949, "global_step": 69127, "epoch": 1645} {"train_loss": -5.968684196472168, "global_step": 69128, "epoch": 1645} {"train_loss": -6.096832275390625, "global_step": 69129, "epoch": 1645} {"train_loss": -5.9593048095703125, "global_step": 69130, "epoch": 1645} {"train_loss": -5.970718781153361, "global_step": 69131, "epoch": 1645, "val_loss": 74962.0078125} {"train_loss": -6.058022499084473, "global_step": 69132, "epoch": 1646} {"train_loss": -6.005597114562988, "global_step": 69133, "epoch": 1646} {"train_loss": -5.919431209564209, "global_step": 69134, "epoch": 1646} {"train_loss": -5.963773727416992, "global_step": 69135, "epoch": 1646} {"train_loss": -6.062182426452637, "global_step": 69136, "epoch": 1646} {"train_loss": -6.094089508056641, "global_step": 69137, "epoch": 1646} {"train_loss": -5.984127521514893, "global_step": 69138, "epoch": 1646} {"train_loss": -6.178743362426758, "global_step": 69139, "epoch": 1646} {"train_loss": -5.935632705688477, "global_step": 69140, "epoch": 1646} {"train_loss": -5.979320526123047, "global_step": 69141, "epoch": 1646} {"train_loss": -6.003780841827393, "global_step": 69142, "epoch": 1646} {"train_loss": -5.913689613342285, "global_step": 69143, "epoch": 1646} {"train_loss": -6.021030426025391, "global_step": 69144, "epoch": 1646} {"train_loss": -5.910004615783691, "global_step": 69145, "epoch": 1646} {"train_loss": -6.010839939117432, "global_step": 69146, "epoch": 1646} {"train_loss": -6.016400337219238, "global_step": 69147, "epoch": 1646} {"train_loss": -5.952914237976074, "global_step": 69148, "epoch": 1646} {"train_loss": -5.959346771240234, "global_step": 69149, "epoch": 1646} {"train_loss": -6.039836406707764, "global_step": 69150, "epoch": 1646} {"train_loss": -6.015786170959473, "global_step": 69151, "epoch": 1646} {"train_loss": -6.072646141052246, "global_step": 69152, "epoch": 1646} {"train_loss": -6.021393299102783, "global_step": 69153, "epoch": 1646} {"train_loss": -6.057039260864258, "global_step": 69154, "epoch": 1646} {"train_loss": -5.98400354385376, "global_step": 69155, "epoch": 1646} {"train_loss": -6.012966156005859, "global_step": 69156, "epoch": 1646} {"train_loss": -6.026389122009277, "global_step": 69157, "epoch": 1646} {"train_loss": -5.999327659606934, "global_step": 69158, "epoch": 1646} {"train_loss": -5.980890274047852, "global_step": 69159, "epoch": 1646} {"train_loss": -6.0296478271484375, "global_step": 69160, "epoch": 1646} {"train_loss": -6.022127628326416, "global_step": 69161, "epoch": 1646} {"train_loss": -5.9585442543029785, "global_step": 69162, "epoch": 1646} {"train_loss": -5.85521936416626, "global_step": 69163, "epoch": 1646} {"train_loss": -6.087953090667725, "global_step": 69164, "epoch": 1646} {"train_loss": -6.019590854644775, "global_step": 69165, "epoch": 1646} {"train_loss": -5.892430305480957, "global_step": 69166, "epoch": 1646} {"train_loss": -5.959184646606445, "global_step": 69167, "epoch": 1646} {"train_loss": -5.969282150268555, "global_step": 69168, "epoch": 1646} {"train_loss": -5.911352634429932, "global_step": 69169, "epoch": 1646} {"train_loss": -6.054285049438477, "global_step": 69170, "epoch": 1646} {"train_loss": -6.030160903930664, "global_step": 69171, "epoch": 1646} {"train_loss": -5.972649574279785, "global_step": 69172, "epoch": 1646} {"train_loss": -6.002908638545445, "global_step": 69173, "epoch": 1646, "val_loss": 74788.8515625} {"train_loss": -6.01570987701416, "global_step": 69174, "epoch": 1647} {"train_loss": -6.100375175476074, "global_step": 69175, "epoch": 1647} {"train_loss": -5.9035515785217285, "global_step": 69176, "epoch": 1647} {"train_loss": -5.901824951171875, "global_step": 69177, "epoch": 1647} {"train_loss": -5.9271039962768555, "global_step": 69178, "epoch": 1647} {"train_loss": -5.955577850341797, "global_step": 69179, "epoch": 1647} {"train_loss": -5.985771179199219, "global_step": 69180, "epoch": 1647} {"train_loss": -6.013899803161621, "global_step": 69181, "epoch": 1647} {"train_loss": -5.944716453552246, "global_step": 69182, "epoch": 1647} {"train_loss": -6.068183898925781, "global_step": 69183, "epoch": 1647} {"train_loss": -5.875113010406494, "global_step": 69184, "epoch": 1647} {"train_loss": -6.053276062011719, "global_step": 69185, "epoch": 1647} {"train_loss": -5.990325927734375, "global_step": 69186, "epoch": 1647} {"train_loss": -6.013306140899658, "global_step": 69187, "epoch": 1647} {"train_loss": -6.010188102722168, "global_step": 69188, "epoch": 1647} {"train_loss": -6.157258033752441, "global_step": 69189, "epoch": 1647} {"train_loss": -5.9520721435546875, "global_step": 69190, "epoch": 1647} {"train_loss": -5.975690841674805, "global_step": 69191, "epoch": 1647} {"train_loss": -5.9934587478637695, "global_step": 69192, "epoch": 1647} {"train_loss": -5.969613075256348, "global_step": 69193, "epoch": 1647} {"train_loss": -5.889756202697754, "global_step": 69194, "epoch": 1647} {"train_loss": -6.000535488128662, "global_step": 69195, "epoch": 1647} {"train_loss": -6.0677618980407715, "global_step": 69196, "epoch": 1647} {"train_loss": -6.058568000793457, "global_step": 69197, "epoch": 1647} {"train_loss": -5.984888076782227, "global_step": 69198, "epoch": 1647} {"train_loss": -5.94074821472168, "global_step": 69199, "epoch": 1647} {"train_loss": -5.9928178787231445, "global_step": 69200, "epoch": 1647} {"train_loss": -5.938718795776367, "global_step": 69201, "epoch": 1647} {"train_loss": -6.172613620758057, "global_step": 69202, "epoch": 1647} {"train_loss": -5.986015319824219, "global_step": 69203, "epoch": 1647} {"train_loss": -6.028700351715088, "global_step": 69204, "epoch": 1647} {"train_loss": -5.9905853271484375, "global_step": 69205, "epoch": 1647} {"train_loss": -5.937087059020996, "global_step": 69206, "epoch": 1647} {"train_loss": -6.118504047393799, "global_step": 69207, "epoch": 1647} {"train_loss": -6.027042388916016, "global_step": 69208, "epoch": 1647} {"train_loss": -5.86997127532959, "global_step": 69209, "epoch": 1647} {"train_loss": -6.053130626678467, "global_step": 69210, "epoch": 1647} {"train_loss": -5.9312639236450195, "global_step": 69211, "epoch": 1647} {"train_loss": -5.966150283813477, "global_step": 69212, "epoch": 1647} {"train_loss": -6.069101333618164, "global_step": 69213, "epoch": 1647} {"train_loss": -5.989380836486816, "global_step": 69214, "epoch": 1647} {"train_loss": -5.999775784356253, "global_step": 69215, "epoch": 1647, "val_loss": 74754.46875} {"train_loss": -6.174960613250732, "global_step": 69216, "epoch": 1648} {"train_loss": -6.0835371017456055, "global_step": 69217, "epoch": 1648} {"train_loss": -6.001267433166504, "global_step": 69218, "epoch": 1648} {"train_loss": -5.962304592132568, "global_step": 69219, "epoch": 1648} {"train_loss": -6.042203426361084, "global_step": 69220, "epoch": 1648} {"train_loss": -6.042013645172119, "global_step": 69221, "epoch": 1648} {"train_loss": -5.957759857177734, "global_step": 69222, "epoch": 1648} {"train_loss": -5.85563850402832, "global_step": 69223, "epoch": 1648} {"train_loss": -5.950253486633301, "global_step": 69224, "epoch": 1648} {"train_loss": -5.937903881072998, "global_step": 69225, "epoch": 1648} {"train_loss": -6.057562828063965, "global_step": 69226, "epoch": 1648} {"train_loss": -6.025596618652344, "global_step": 69227, "epoch": 1648} {"train_loss": -5.982909202575684, "global_step": 69228, "epoch": 1648} {"train_loss": -5.88143253326416, "global_step": 69229, "epoch": 1648} {"train_loss": -5.994774341583252, "global_step": 69230, "epoch": 1648} {"train_loss": -5.97669792175293, "global_step": 69231, "epoch": 1648} {"train_loss": -5.982759952545166, "global_step": 69232, "epoch": 1648} {"train_loss": -6.00856876373291, "global_step": 69233, "epoch": 1648} {"train_loss": -5.950479030609131, "global_step": 69234, "epoch": 1648} {"train_loss": -5.9400787353515625, "global_step": 69235, "epoch": 1648} {"train_loss": -5.867900848388672, "global_step": 69236, "epoch": 1648} {"train_loss": -5.992336273193359, "global_step": 69237, "epoch": 1648} {"train_loss": -6.045183181762695, "global_step": 69238, "epoch": 1648} {"train_loss": -5.957204341888428, "global_step": 69239, "epoch": 1648} {"train_loss": -6.057920455932617, "global_step": 69240, "epoch": 1648} {"train_loss": -5.877686500549316, "global_step": 69241, "epoch": 1648} {"train_loss": -5.974419116973877, "global_step": 69242, "epoch": 1648} {"train_loss": -6.181855201721191, "global_step": 69243, "epoch": 1648} {"train_loss": -5.881216526031494, "global_step": 69244, "epoch": 1648} {"train_loss": -6.011948108673096, "global_step": 69245, "epoch": 1648} {"train_loss": -6.0064167976379395, "global_step": 69246, "epoch": 1648} {"train_loss": -5.978384971618652, "global_step": 69247, "epoch": 1648} {"train_loss": -5.988343715667725, "global_step": 69248, "epoch": 1648} {"train_loss": -5.999423027038574, "global_step": 69249, "epoch": 1648} {"train_loss": -5.9593706130981445, "global_step": 69250, "epoch": 1648} {"train_loss": -5.995987415313721, "global_step": 69251, "epoch": 1648} {"train_loss": -6.021841049194336, "global_step": 69252, "epoch": 1648} {"train_loss": -5.909604549407959, "global_step": 69253, "epoch": 1648} {"train_loss": -5.992551803588867, "global_step": 69254, "epoch": 1648} {"train_loss": -5.923866271972656, "global_step": 69255, "epoch": 1648} {"train_loss": -5.948554515838623, "global_step": 69256, "epoch": 1648} {"train_loss": -5.98318084081014, "global_step": 69257, "epoch": 1648, "val_loss": 74864.8125} {"train_loss": -6.005990505218506, "global_step": 69258, "epoch": 1649} {"train_loss": -5.91209602355957, "global_step": 69259, "epoch": 1649} {"train_loss": -6.113868713378906, "global_step": 69260, "epoch": 1649} {"train_loss": -6.092913627624512, "global_step": 69261, "epoch": 1649} {"train_loss": -6.041959762573242, "global_step": 69262, "epoch": 1649} {"train_loss": -6.016345024108887, "global_step": 69263, "epoch": 1649} {"train_loss": -6.0112104415893555, "global_step": 69264, "epoch": 1649} {"train_loss": -5.921232223510742, "global_step": 69265, "epoch": 1649} {"train_loss": -5.967225074768066, "global_step": 69266, "epoch": 1649} {"train_loss": -5.983499050140381, "global_step": 69267, "epoch": 1649} {"train_loss": -5.944655418395996, "global_step": 69268, "epoch": 1649} {"train_loss": -6.071921348571777, "global_step": 69269, "epoch": 1649} {"train_loss": -5.875042915344238, "global_step": 69270, "epoch": 1649} {"train_loss": -5.962584972381592, "global_step": 69271, "epoch": 1649} {"train_loss": -6.042724609375, "global_step": 69272, "epoch": 1649} {"train_loss": -5.979315757751465, "global_step": 69273, "epoch": 1649} {"train_loss": -6.077481269836426, "global_step": 69274, "epoch": 1649} {"train_loss": -6.030627727508545, "global_step": 69275, "epoch": 1649} {"train_loss": -6.082225799560547, "global_step": 69276, "epoch": 1649} {"train_loss": -6.056268692016602, "global_step": 69277, "epoch": 1649} {"train_loss": -6.006980895996094, "global_step": 69278, "epoch": 1649} {"train_loss": -5.984758377075195, "global_step": 69279, "epoch": 1649} {"train_loss": -5.937167167663574, "global_step": 69280, "epoch": 1649} {"train_loss": -5.947789192199707, "global_step": 69281, "epoch": 1649} {"train_loss": -5.795914649963379, "global_step": 69282, "epoch": 1649} {"train_loss": -6.057605266571045, "global_step": 69283, "epoch": 1649} {"train_loss": -6.011912822723389, "global_step": 69284, "epoch": 1649} {"train_loss": -5.986417770385742, "global_step": 69285, "epoch": 1649} {"train_loss": -6.0694661140441895, "global_step": 69286, "epoch": 1649} {"train_loss": -5.912735939025879, "global_step": 69287, "epoch": 1649} {"train_loss": -6.067911148071289, "global_step": 69288, "epoch": 1649} {"train_loss": -5.967448711395264, "global_step": 69289, "epoch": 1649} {"train_loss": -5.963696479797363, "global_step": 69290, "epoch": 1649} {"train_loss": -6.026984214782715, "global_step": 69291, "epoch": 1649} {"train_loss": -5.926949501037598, "global_step": 69292, "epoch": 1649} {"train_loss": -6.088653564453125, "global_step": 69293, "epoch": 1649} {"train_loss": -5.895226955413818, "global_step": 69294, "epoch": 1649} {"train_loss": -5.933237075805664, "global_step": 69295, "epoch": 1649} {"train_loss": -5.973303318023682, "global_step": 69296, "epoch": 1649} {"train_loss": -5.914039611816406, "global_step": 69297, "epoch": 1649} {"train_loss": -5.978025436401367, "global_step": 69298, "epoch": 1649} {"train_loss": -5.989740655535743, "global_step": 69299, "epoch": 1649, "val_loss": 75241.265625} {"train_loss": -6.017208099365234, "global_step": 69300, "epoch": 1650} {"train_loss": -5.872895240783691, "global_step": 69301, "epoch": 1650} {"train_loss": -5.943488597869873, "global_step": 69302, "epoch": 1650} {"train_loss": -5.983094692230225, "global_step": 69303, "epoch": 1650} {"train_loss": -6.07163143157959, "global_step": 69304, "epoch": 1650} {"train_loss": -5.807775497436523, "global_step": 69305, "epoch": 1650} {"train_loss": -6.0366411209106445, "global_step": 69306, "epoch": 1650} {"train_loss": -6.031351089477539, "global_step": 69307, "epoch": 1650} {"train_loss": -5.949139595031738, "global_step": 69308, "epoch": 1650} {"train_loss": -5.985389232635498, "global_step": 69309, "epoch": 1650} {"train_loss": -5.939355850219727, "global_step": 69310, "epoch": 1650} {"train_loss": -6.131524085998535, "global_step": 69311, "epoch": 1650} {"train_loss": -5.999892234802246, "global_step": 69312, "epoch": 1650} {"train_loss": -5.910477638244629, "global_step": 69313, "epoch": 1650} {"train_loss": -6.130178928375244, "global_step": 69314, "epoch": 1650} {"train_loss": -5.991971969604492, "global_step": 69315, "epoch": 1650} {"train_loss": -5.9466962814331055, "global_step": 69316, "epoch": 1650} {"train_loss": -5.967886924743652, "global_step": 69317, "epoch": 1650} {"train_loss": -6.134151935577393, "global_step": 69318, "epoch": 1650} {"train_loss": -5.991645812988281, "global_step": 69319, "epoch": 1650} {"train_loss": -6.074970722198486, "global_step": 69320, "epoch": 1650} {"train_loss": -6.023556709289551, "global_step": 69321, "epoch": 1650} {"train_loss": -5.95133113861084, "global_step": 69322, "epoch": 1650} {"train_loss": -5.944432258605957, "global_step": 69323, "epoch": 1650} {"train_loss": -6.033674240112305, "global_step": 69324, "epoch": 1650} {"train_loss": -6.017993450164795, "global_step": 69325, "epoch": 1650} {"train_loss": -5.982112884521484, "global_step": 69326, "epoch": 1650} {"train_loss": -6.032808303833008, "global_step": 69327, "epoch": 1650} {"train_loss": -5.940248012542725, "global_step": 69328, "epoch": 1650} {"train_loss": -5.931187629699707, "global_step": 69329, "epoch": 1650} {"train_loss": -6.015349388122559, "global_step": 69330, "epoch": 1650} {"train_loss": -5.879522323608398, "global_step": 69331, "epoch": 1650} {"train_loss": -6.030727386474609, "global_step": 69332, "epoch": 1650} {"train_loss": -6.004498481750488, "global_step": 69333, "epoch": 1650} {"train_loss": -5.968472957611084, "global_step": 69334, "epoch": 1650} {"train_loss": -6.03981876373291, "global_step": 69335, "epoch": 1650} {"train_loss": -5.971993446350098, "global_step": 69336, "epoch": 1650} {"train_loss": -6.105494499206543, "global_step": 69337, "epoch": 1650} {"train_loss": -5.892582416534424, "global_step": 69338, "epoch": 1650} {"train_loss": -5.953590393066406, "global_step": 69339, "epoch": 1650} {"train_loss": -6.085317611694336, "global_step": 69340, "epoch": 1650} {"train_loss": -5.994776612236386, "global_step": 69341, "epoch": 1650, "train/sim_max_reward_0": 0.4057408596569597, "train/sim_max_reward_1": 0.9153161446067546, "train/sim_max_reward_2": 0.30950764590688806, "train/sim_max_reward_3": 0.13775315335200608, "train/sim_max_reward_4": 0.5347261457081744, "train/sim_max_reward_5": 0.6357890864978, "test/sim_max_reward_4500000": 0.8437560268231106, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8614914235024116, "test/sim_max_reward_4500003": 0.003264493362734348, "test/sim_max_reward_4500004": 0.07364195958654578, "test/sim_max_reward_4500005": 0.3439046049578703, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.9488159505341919, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.8483755180455508, "test/sim_max_reward_4500012": 0.10887865547126271, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.9304523852369855, "test/sim_max_reward_4500015": 0.9169609631709182, "test/sim_max_reward_4500016": 0.47496868885129995, "test/sim_max_reward_4500017": 0.007857880067518315, "test/sim_max_reward_4500018": 0.2525983052388117, "test/sim_max_reward_4500019": 0.39496762743265895, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9241839347621684, "test/sim_max_reward_4500022": 0.9684591167516093, "test/sim_max_reward_4500023": 0.8890767126905462, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.0014752519222762297, "test/sim_max_reward_4500026": 0.15591395824731924, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.25063083484290616, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.42323910431543293, "test/sim_max_reward_4500033": 0.18507124660454116, "test/sim_max_reward_4500034": 0.8060479278178688, "test/sim_max_reward_4500035": 0.8657782616959527, "test/sim_max_reward_4500036": 0.37370650605738603, "test/sim_max_reward_4500037": 0.8736658433626531, "test/sim_max_reward_4500038": 0.29279371996866055, "test/sim_max_reward_4500039": 1.0, "test/sim_max_reward_4500040": 0.765344941332842, "test/sim_max_reward_4500041": 0.972438585731041, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.7888528881290554, "test/sim_max_reward_4500044": 0.603074357392442, "test/sim_max_reward_4500045": 0.8339979310064543, "test/sim_max_reward_4500046": 0.7971145467296245, "test/sim_max_reward_4500047": 0.9020002789750872, "test/sim_max_reward_4500048": 0.990279246440439, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.48980550595476374, "test/mean_score": 0.5176739356988987, "val_loss": 74834.359375} {"train_loss": -6.072085380554199, "global_step": 69342, "epoch": 1651} {"train_loss": -6.068924427032471, "global_step": 69343, "epoch": 1651} {"train_loss": -5.947032451629639, "global_step": 69344, "epoch": 1651} {"train_loss": -6.094285011291504, "global_step": 69345, "epoch": 1651} {"train_loss": -5.988299369812012, "global_step": 69346, "epoch": 1651} {"train_loss": -6.041646957397461, "global_step": 69347, "epoch": 1651} {"train_loss": -6.05866813659668, "global_step": 69348, "epoch": 1651} {"train_loss": -6.053533554077148, "global_step": 69349, "epoch": 1651} {"train_loss": -5.987070083618164, "global_step": 69350, "epoch": 1651} {"train_loss": -6.106816291809082, "global_step": 69351, "epoch": 1651} {"train_loss": -6.092852592468262, "global_step": 69352, "epoch": 1651} {"train_loss": -6.01889705657959, "global_step": 69353, "epoch": 1651} {"train_loss": -6.156180381774902, "global_step": 69354, "epoch": 1651} {"train_loss": -6.018817901611328, "global_step": 69355, "epoch": 1651} {"train_loss": -5.990912437438965, "global_step": 69356, "epoch": 1651} {"train_loss": -6.1454973220825195, "global_step": 69357, "epoch": 1651} {"train_loss": -6.119424819946289, "global_step": 69358, "epoch": 1651} {"train_loss": -5.902633190155029, "global_step": 69359, "epoch": 1651} {"train_loss": -6.0350565910339355, "global_step": 69360, "epoch": 1651} {"train_loss": -5.998453140258789, "global_step": 69361, "epoch": 1651} {"train_loss": -6.0867156982421875, "global_step": 69362, "epoch": 1651} {"train_loss": -5.970547676086426, "global_step": 69363, "epoch": 1651} {"train_loss": -5.97946834564209, "global_step": 69364, "epoch": 1651} {"train_loss": -5.831027984619141, "global_step": 69365, "epoch": 1651} {"train_loss": -5.940596580505371, "global_step": 69366, "epoch": 1651} {"train_loss": -5.898836135864258, "global_step": 69367, "epoch": 1651} {"train_loss": -5.9897284507751465, "global_step": 69368, "epoch": 1651} {"train_loss": -5.939504146575928, "global_step": 69369, "epoch": 1651} {"train_loss": -5.944135665893555, "global_step": 69370, "epoch": 1651} {"train_loss": -6.0935444831848145, "global_step": 69371, "epoch": 1651} {"train_loss": -6.093509674072266, "global_step": 69372, "epoch": 1651} {"train_loss": -6.0719099044799805, "global_step": 69373, "epoch": 1651} {"train_loss": -5.950653076171875, "global_step": 69374, "epoch": 1651} {"train_loss": -6.119645118713379, "global_step": 69375, "epoch": 1651} {"train_loss": -5.962227821350098, "global_step": 69376, "epoch": 1651} {"train_loss": -5.856771469116211, "global_step": 69377, "epoch": 1651} {"train_loss": -5.965201377868652, "global_step": 69378, "epoch": 1651} {"train_loss": -5.96921443939209, "global_step": 69379, "epoch": 1651} {"train_loss": -5.995212554931641, "global_step": 69380, "epoch": 1651} {"train_loss": -5.945466041564941, "global_step": 69381, "epoch": 1651} {"train_loss": -5.973666191101074, "global_step": 69382, "epoch": 1651} {"train_loss": -6.009404386792864, "global_step": 69383, "epoch": 1651, "val_loss": 74643.328125} {"train_loss": -5.901973247528076, "global_step": 69384, "epoch": 1652} {"train_loss": -6.089245796203613, "global_step": 69385, "epoch": 1652} {"train_loss": -5.998522758483887, "global_step": 69386, "epoch": 1652} {"train_loss": -6.069379806518555, "global_step": 69387, "epoch": 1652} {"train_loss": -5.993988990783691, "global_step": 69388, "epoch": 1652} {"train_loss": -6.012195587158203, "global_step": 69389, "epoch": 1652} {"train_loss": -6.1377153396606445, "global_step": 69390, "epoch": 1652} {"train_loss": -5.994894504547119, "global_step": 69391, "epoch": 1652} {"train_loss": -6.0817437171936035, "global_step": 69392, "epoch": 1652} {"train_loss": -5.978884220123291, "global_step": 69393, "epoch": 1652} {"train_loss": -6.026472091674805, "global_step": 69394, "epoch": 1652} {"train_loss": -5.939427852630615, "global_step": 69395, "epoch": 1652} {"train_loss": -6.103172302246094, "global_step": 69396, "epoch": 1652} {"train_loss": -6.0364089012146, "global_step": 69397, "epoch": 1652} {"train_loss": -6.110721588134766, "global_step": 69398, "epoch": 1652} {"train_loss": -5.990965843200684, "global_step": 69399, "epoch": 1652} {"train_loss": -5.933467864990234, "global_step": 69400, "epoch": 1652} {"train_loss": -6.081036567687988, "global_step": 69401, "epoch": 1652} {"train_loss": -6.073044776916504, "global_step": 69402, "epoch": 1652} {"train_loss": -6.026283264160156, "global_step": 69403, "epoch": 1652} {"train_loss": -6.014837265014648, "global_step": 69404, "epoch": 1652} {"train_loss": -6.086999893188477, "global_step": 69405, "epoch": 1652} {"train_loss": -6.063257217407227, "global_step": 69406, "epoch": 1652} {"train_loss": -6.059508323669434, "global_step": 69407, "epoch": 1652} {"train_loss": -6.092658042907715, "global_step": 69408, "epoch": 1652} {"train_loss": -6.08408784866333, "global_step": 69409, "epoch": 1652} {"train_loss": -5.917426586151123, "global_step": 69410, "epoch": 1652} {"train_loss": -5.960083961486816, "global_step": 69411, "epoch": 1652} {"train_loss": -5.928136348724365, "global_step": 69412, "epoch": 1652} {"train_loss": -5.996695518493652, "global_step": 69413, "epoch": 1652} {"train_loss": -5.997518539428711, "global_step": 69414, "epoch": 1652} {"train_loss": -6.12838077545166, "global_step": 69415, "epoch": 1652} {"train_loss": -5.871865749359131, "global_step": 69416, "epoch": 1652} {"train_loss": -6.11605978012085, "global_step": 69417, "epoch": 1652} {"train_loss": -6.008942604064941, "global_step": 69418, "epoch": 1652} {"train_loss": -6.0674004554748535, "global_step": 69419, "epoch": 1652} {"train_loss": -6.114260673522949, "global_step": 69420, "epoch": 1652} {"train_loss": -5.948164939880371, "global_step": 69421, "epoch": 1652} {"train_loss": -6.076235294342041, "global_step": 69422, "epoch": 1652} {"train_loss": -5.917421340942383, "global_step": 69423, "epoch": 1652} {"train_loss": -5.96486234664917, "global_step": 69424, "epoch": 1652} {"train_loss": -6.022380658558437, "global_step": 69425, "epoch": 1652, "val_loss": 74792.6796875} {"train_loss": -6.050142288208008, "global_step": 69426, "epoch": 1653} {"train_loss": -6.120245933532715, "global_step": 69427, "epoch": 1653} {"train_loss": -6.050357818603516, "global_step": 69428, "epoch": 1653} {"train_loss": -5.954315185546875, "global_step": 69429, "epoch": 1653} {"train_loss": -5.939043998718262, "global_step": 69430, "epoch": 1653} {"train_loss": -6.084161281585693, "global_step": 69431, "epoch": 1653} {"train_loss": -6.089712619781494, "global_step": 69432, "epoch": 1653} {"train_loss": -6.146847724914551, "global_step": 69433, "epoch": 1653} {"train_loss": -6.044384002685547, "global_step": 69434, "epoch": 1653} {"train_loss": -6.048004150390625, "global_step": 69435, "epoch": 1653} {"train_loss": -5.943583965301514, "global_step": 69436, "epoch": 1653} {"train_loss": -6.102833271026611, "global_step": 69437, "epoch": 1653} {"train_loss": -6.177804946899414, "global_step": 69438, "epoch": 1653} {"train_loss": -5.893783092498779, "global_step": 69439, "epoch": 1653} {"train_loss": -6.0206193923950195, "global_step": 69440, "epoch": 1653} {"train_loss": -6.160211563110352, "global_step": 69441, "epoch": 1653} {"train_loss": -6.107338905334473, "global_step": 69442, "epoch": 1653} {"train_loss": -5.999676704406738, "global_step": 69443, "epoch": 1653} {"train_loss": -6.104731559753418, "global_step": 69444, "epoch": 1653} {"train_loss": -6.073141574859619, "global_step": 69445, "epoch": 1653} {"train_loss": -5.9632978439331055, "global_step": 69446, "epoch": 1653} {"train_loss": -5.948025226593018, "global_step": 69447, "epoch": 1653} {"train_loss": -5.928464889526367, "global_step": 69448, "epoch": 1653} {"train_loss": -6.012486457824707, "global_step": 69449, "epoch": 1653} {"train_loss": -5.982001781463623, "global_step": 69450, "epoch": 1653} {"train_loss": -5.887998580932617, "global_step": 69451, "epoch": 1653} {"train_loss": -6.005206108093262, "global_step": 69452, "epoch": 1653} {"train_loss": -5.995987892150879, "global_step": 69453, "epoch": 1653} {"train_loss": -5.994614601135254, "global_step": 69454, "epoch": 1653} {"train_loss": -6.068386077880859, "global_step": 69455, "epoch": 1653} {"train_loss": -6.0886430740356445, "global_step": 69456, "epoch": 1653} {"train_loss": -6.040362358093262, "global_step": 69457, "epoch": 1653} {"train_loss": -6.065847873687744, "global_step": 69458, "epoch": 1653} {"train_loss": -5.990764617919922, "global_step": 69459, "epoch": 1653} {"train_loss": -6.117501735687256, "global_step": 69460, "epoch": 1653} {"train_loss": -5.97096061706543, "global_step": 69461, "epoch": 1653} {"train_loss": -6.042205333709717, "global_step": 69462, "epoch": 1653} {"train_loss": -5.773903846740723, "global_step": 69463, "epoch": 1653} {"train_loss": -5.984064102172852, "global_step": 69464, "epoch": 1653} {"train_loss": -5.972372055053711, "global_step": 69465, "epoch": 1653} {"train_loss": -6.014198303222656, "global_step": 69466, "epoch": 1653} {"train_loss": -6.020013797850836, "global_step": 69467, "epoch": 1653, "val_loss": 74655.1484375} {"train_loss": -6.043277263641357, "global_step": 69468, "epoch": 1654} {"train_loss": -5.920289993286133, "global_step": 69469, "epoch": 1654} {"train_loss": -5.923557758331299, "global_step": 69470, "epoch": 1654} {"train_loss": -6.097356796264648, "global_step": 69471, "epoch": 1654} {"train_loss": -5.995790481567383, "global_step": 69472, "epoch": 1654} {"train_loss": -6.240571022033691, "global_step": 69473, "epoch": 1654} {"train_loss": -5.997900485992432, "global_step": 69474, "epoch": 1654} {"train_loss": -6.0652875900268555, "global_step": 69475, "epoch": 1654} {"train_loss": -6.055693626403809, "global_step": 69476, "epoch": 1654} {"train_loss": -6.0372419357299805, "global_step": 69477, "epoch": 1654} {"train_loss": -5.9823102951049805, "global_step": 69478, "epoch": 1654} {"train_loss": -6.054865837097168, "global_step": 69479, "epoch": 1654} {"train_loss": -5.99637508392334, "global_step": 69480, "epoch": 1654} {"train_loss": -5.990487098693848, "global_step": 69481, "epoch": 1654} {"train_loss": -5.924463272094727, "global_step": 69482, "epoch": 1654} {"train_loss": -6.000741958618164, "global_step": 69483, "epoch": 1654} {"train_loss": -5.897525787353516, "global_step": 69484, "epoch": 1654} {"train_loss": -5.996420860290527, "global_step": 69485, "epoch": 1654} {"train_loss": -5.960772514343262, "global_step": 69486, "epoch": 1654} {"train_loss": -5.923548698425293, "global_step": 69487, "epoch": 1654} {"train_loss": -5.945668697357178, "global_step": 69488, "epoch": 1654} {"train_loss": -5.795433044433594, "global_step": 69489, "epoch": 1654} {"train_loss": -5.7741851806640625, "global_step": 69490, "epoch": 1654} {"train_loss": -6.007118225097656, "global_step": 69491, "epoch": 1654} {"train_loss": -6.009398460388184, "global_step": 69492, "epoch": 1654} {"train_loss": -5.876482963562012, "global_step": 69493, "epoch": 1654} {"train_loss": -6.036990165710449, "global_step": 69494, "epoch": 1654} {"train_loss": -5.974736213684082, "global_step": 69495, "epoch": 1654} {"train_loss": -5.985633850097656, "global_step": 69496, "epoch": 1654} {"train_loss": -6.088245391845703, "global_step": 69497, "epoch": 1654} {"train_loss": -6.0178728103637695, "global_step": 69498, "epoch": 1654} {"train_loss": -5.976241111755371, "global_step": 69499, "epoch": 1654} {"train_loss": -5.894353866577148, "global_step": 69500, "epoch": 1654} {"train_loss": -6.034895896911621, "global_step": 69501, "epoch": 1654} {"train_loss": -5.938076496124268, "global_step": 69502, "epoch": 1654} {"train_loss": -6.099096298217773, "global_step": 69503, "epoch": 1654} {"train_loss": -5.931763648986816, "global_step": 69504, "epoch": 1654} {"train_loss": -6.0885210037231445, "global_step": 69505, "epoch": 1654} {"train_loss": -5.917133331298828, "global_step": 69506, "epoch": 1654} {"train_loss": -6.025587558746338, "global_step": 69507, "epoch": 1654} {"train_loss": -6.063044548034668, "global_step": 69508, "epoch": 1654} {"train_loss": -5.989112150101435, "global_step": 69509, "epoch": 1654, "val_loss": 74619.0078125} {"train_loss": -6.003807067871094, "global_step": 69510, "epoch": 1655} {"train_loss": -5.896604061126709, "global_step": 69511, "epoch": 1655} {"train_loss": -6.096576690673828, "global_step": 69512, "epoch": 1655} {"train_loss": -6.05014705657959, "global_step": 69513, "epoch": 1655} {"train_loss": -6.028397083282471, "global_step": 69514, "epoch": 1655} {"train_loss": -6.049951553344727, "global_step": 69515, "epoch": 1655} {"train_loss": -5.978818893432617, "global_step": 69516, "epoch": 1655} {"train_loss": -5.982591152191162, "global_step": 69517, "epoch": 1655} {"train_loss": -6.060723304748535, "global_step": 69518, "epoch": 1655} {"train_loss": -6.063163757324219, "global_step": 69519, "epoch": 1655} {"train_loss": -5.928654670715332, "global_step": 69520, "epoch": 1655} {"train_loss": -6.076004981994629, "global_step": 69521, "epoch": 1655} {"train_loss": -5.9839372634887695, "global_step": 69522, "epoch": 1655} {"train_loss": -6.040816307067871, "global_step": 69523, "epoch": 1655} {"train_loss": -5.899808883666992, "global_step": 69524, "epoch": 1655} {"train_loss": -5.924933433532715, "global_step": 69525, "epoch": 1655} {"train_loss": -5.813515663146973, "global_step": 69526, "epoch": 1655} {"train_loss": -6.097028732299805, "global_step": 69527, "epoch": 1655} {"train_loss": -6.0129570960998535, "global_step": 69528, "epoch": 1655} {"train_loss": -5.958199501037598, "global_step": 69529, "epoch": 1655} {"train_loss": -6.089517116546631, "global_step": 69530, "epoch": 1655} {"train_loss": -5.882636070251465, "global_step": 69531, "epoch": 1655} {"train_loss": -6.158510684967041, "global_step": 69532, "epoch": 1655} {"train_loss": -5.975480079650879, "global_step": 69533, "epoch": 1655} {"train_loss": -6.069941520690918, "global_step": 69534, "epoch": 1655} {"train_loss": -5.8910040855407715, "global_step": 69535, "epoch": 1655} {"train_loss": -5.961382865905762, "global_step": 69536, "epoch": 1655} {"train_loss": -5.96241569519043, "global_step": 69537, "epoch": 1655} {"train_loss": -6.058963775634766, "global_step": 69538, "epoch": 1655} {"train_loss": -6.108977794647217, "global_step": 69539, "epoch": 1655} {"train_loss": -5.96085262298584, "global_step": 69540, "epoch": 1655} {"train_loss": -5.940779685974121, "global_step": 69541, "epoch": 1655} {"train_loss": -6.084931373596191, "global_step": 69542, "epoch": 1655} {"train_loss": -6.051872253417969, "global_step": 69543, "epoch": 1655} {"train_loss": -5.955451488494873, "global_step": 69544, "epoch": 1655} {"train_loss": -6.036280155181885, "global_step": 69545, "epoch": 1655} {"train_loss": -6.106095314025879, "global_step": 69546, "epoch": 1655} {"train_loss": -6.094481468200684, "global_step": 69547, "epoch": 1655} {"train_loss": -6.011435031890869, "global_step": 69548, "epoch": 1655} {"train_loss": -5.954432964324951, "global_step": 69549, "epoch": 1655} {"train_loss": -5.965435981750488, "global_step": 69550, "epoch": 1655} {"train_loss": -6.009111461185274, "global_step": 69551, "epoch": 1655, "val_loss": 74648.234375} {"train_loss": -6.094629287719727, "global_step": 69552, "epoch": 1656} {"train_loss": -6.067816257476807, "global_step": 69553, "epoch": 1656} {"train_loss": -6.183913230895996, "global_step": 69554, "epoch": 1656} {"train_loss": -5.96036434173584, "global_step": 69555, "epoch": 1656} {"train_loss": -6.085216522216797, "global_step": 69556, "epoch": 1656} {"train_loss": -5.908276557922363, "global_step": 69557, "epoch": 1656} {"train_loss": -6.060622692108154, "global_step": 69558, "epoch": 1656} {"train_loss": -6.040342330932617, "global_step": 69559, "epoch": 1656} {"train_loss": -6.059226036071777, "global_step": 69560, "epoch": 1656} {"train_loss": -5.959102630615234, "global_step": 69561, "epoch": 1656} {"train_loss": -6.161121368408203, "global_step": 69562, "epoch": 1656} {"train_loss": -5.984152317047119, "global_step": 69563, "epoch": 1656} {"train_loss": -6.109289169311523, "global_step": 69564, "epoch": 1656} {"train_loss": -5.919498920440674, "global_step": 69565, "epoch": 1656} {"train_loss": -6.109869956970215, "global_step": 69566, "epoch": 1656} {"train_loss": -6.070372104644775, "global_step": 69567, "epoch": 1656} {"train_loss": -5.976649284362793, "global_step": 69568, "epoch": 1656} {"train_loss": -5.9146728515625, "global_step": 69569, "epoch": 1656} {"train_loss": -6.016542434692383, "global_step": 69570, "epoch": 1656} {"train_loss": -5.971700191497803, "global_step": 69571, "epoch": 1656} {"train_loss": -6.055926322937012, "global_step": 69572, "epoch": 1656} {"train_loss": -5.945614814758301, "global_step": 69573, "epoch": 1656} {"train_loss": -6.047259330749512, "global_step": 69574, "epoch": 1656} {"train_loss": -5.860418319702148, "global_step": 69575, "epoch": 1656} {"train_loss": -6.126039028167725, "global_step": 69576, "epoch": 1656} {"train_loss": -6.047447204589844, "global_step": 69577, "epoch": 1656} {"train_loss": -5.916921615600586, "global_step": 69578, "epoch": 1656} {"train_loss": -6.011346817016602, "global_step": 69579, "epoch": 1656} {"train_loss": -5.974841117858887, "global_step": 69580, "epoch": 1656} {"train_loss": -5.9762701988220215, "global_step": 69581, "epoch": 1656} {"train_loss": -6.1185526847839355, "global_step": 69582, "epoch": 1656} {"train_loss": -5.760677337646484, "global_step": 69583, "epoch": 1656} {"train_loss": -6.056699752807617, "global_step": 69584, "epoch": 1656} {"train_loss": -5.913787841796875, "global_step": 69585, "epoch": 1656} {"train_loss": -5.9410552978515625, "global_step": 69586, "epoch": 1656} {"train_loss": -6.042393684387207, "global_step": 69587, "epoch": 1656} {"train_loss": -5.832612037658691, "global_step": 69588, "epoch": 1656} {"train_loss": -5.920970916748047, "global_step": 69589, "epoch": 1656} {"train_loss": -5.867242336273193, "global_step": 69590, "epoch": 1656} {"train_loss": -5.94210958480835, "global_step": 69591, "epoch": 1656} {"train_loss": -5.888390064239502, "global_step": 69592, "epoch": 1656} {"train_loss": -5.996688865479969, "global_step": 69593, "epoch": 1656, "val_loss": 74931.796875} {"train_loss": -5.953319549560547, "global_step": 69594, "epoch": 1657} {"train_loss": -6.020802974700928, "global_step": 69595, "epoch": 1657} {"train_loss": -6.025333881378174, "global_step": 69596, "epoch": 1657} {"train_loss": -5.89403772354126, "global_step": 69597, "epoch": 1657} {"train_loss": -5.96507453918457, "global_step": 69598, "epoch": 1657} {"train_loss": -6.04971981048584, "global_step": 69599, "epoch": 1657} {"train_loss": -6.035483360290527, "global_step": 69600, "epoch": 1657} {"train_loss": -6.028151988983154, "global_step": 69601, "epoch": 1657} {"train_loss": -5.982489109039307, "global_step": 69602, "epoch": 1657} {"train_loss": -5.910823345184326, "global_step": 69603, "epoch": 1657} {"train_loss": -6.017470836639404, "global_step": 69604, "epoch": 1657} {"train_loss": -5.955523490905762, "global_step": 69605, "epoch": 1657} {"train_loss": -5.930497169494629, "global_step": 69606, "epoch": 1657} {"train_loss": -5.9720354080200195, "global_step": 69607, "epoch": 1657} {"train_loss": -6.000854015350342, "global_step": 69608, "epoch": 1657} {"train_loss": -6.045984745025635, "global_step": 69609, "epoch": 1657} {"train_loss": -6.022481918334961, "global_step": 69610, "epoch": 1657} {"train_loss": -5.987411022186279, "global_step": 69611, "epoch": 1657} {"train_loss": -5.937068939208984, "global_step": 69612, "epoch": 1657} {"train_loss": -6.079869270324707, "global_step": 69613, "epoch": 1657} {"train_loss": -5.815113067626953, "global_step": 69614, "epoch": 1657} {"train_loss": -5.935721397399902, "global_step": 69615, "epoch": 1657} {"train_loss": -5.962099552154541, "global_step": 69616, "epoch": 1657} {"train_loss": -6.016822814941406, "global_step": 69617, "epoch": 1657} {"train_loss": -6.01333475112915, "global_step": 69618, "epoch": 1657} {"train_loss": -5.789305210113525, "global_step": 69619, "epoch": 1657} {"train_loss": -5.909235000610352, "global_step": 69620, "epoch": 1657} {"train_loss": -5.9443678855896, "global_step": 69621, "epoch": 1657} {"train_loss": -5.801199436187744, "global_step": 69622, "epoch": 1657} {"train_loss": -6.026797771453857, "global_step": 69623, "epoch": 1657} {"train_loss": -5.86066198348999, "global_step": 69624, "epoch": 1657} {"train_loss": -5.880519866943359, "global_step": 69625, "epoch": 1657} {"train_loss": -5.879092216491699, "global_step": 69626, "epoch": 1657} {"train_loss": -5.885305881500244, "global_step": 69627, "epoch": 1657} {"train_loss": -5.9144744873046875, "global_step": 69628, "epoch": 1657} {"train_loss": -5.875558853149414, "global_step": 69629, "epoch": 1657} {"train_loss": -6.044984340667725, "global_step": 69630, "epoch": 1657} {"train_loss": -5.8992838859558105, "global_step": 69631, "epoch": 1657} {"train_loss": -5.881006240844727, "global_step": 69632, "epoch": 1657} {"train_loss": -5.896009922027588, "global_step": 69633, "epoch": 1657} {"train_loss": -5.946824073791504, "global_step": 69634, "epoch": 1657} {"train_loss": -5.9495509919666105, "global_step": 69635, "epoch": 1657, "val_loss": 74565.5} {"train_loss": -6.074300289154053, "global_step": 69636, "epoch": 1658} {"train_loss": -5.961944103240967, "global_step": 69637, "epoch": 1658} {"train_loss": -6.018787860870361, "global_step": 69638, "epoch": 1658} {"train_loss": -6.080410957336426, "global_step": 69639, "epoch": 1658} {"train_loss": -5.843910217285156, "global_step": 69640, "epoch": 1658} {"train_loss": -6.03774356842041, "global_step": 69641, "epoch": 1658} {"train_loss": -5.921492099761963, "global_step": 69642, "epoch": 1658} {"train_loss": -5.999632835388184, "global_step": 69643, "epoch": 1658} {"train_loss": -5.981978416442871, "global_step": 69644, "epoch": 1658} {"train_loss": -5.926871299743652, "global_step": 69645, "epoch": 1658} {"train_loss": -6.053750991821289, "global_step": 69646, "epoch": 1658} {"train_loss": -6.003344535827637, "global_step": 69647, "epoch": 1658} {"train_loss": -5.993768692016602, "global_step": 69648, "epoch": 1658} {"train_loss": -6.071969032287598, "global_step": 69649, "epoch": 1658} {"train_loss": -6.037004470825195, "global_step": 69650, "epoch": 1658} {"train_loss": -5.885936737060547, "global_step": 69651, "epoch": 1658} {"train_loss": -6.119677543640137, "global_step": 69652, "epoch": 1658} {"train_loss": -5.977043628692627, "global_step": 69653, "epoch": 1658} {"train_loss": -6.075441837310791, "global_step": 69654, "epoch": 1658} {"train_loss": -5.99970817565918, "global_step": 69655, "epoch": 1658} {"train_loss": -6.082479476928711, "global_step": 69656, "epoch": 1658} {"train_loss": -6.031985759735107, "global_step": 69657, "epoch": 1658} {"train_loss": -6.080313682556152, "global_step": 69658, "epoch": 1658} {"train_loss": -6.098546504974365, "global_step": 69659, "epoch": 1658} {"train_loss": -5.993104934692383, "global_step": 69660, "epoch": 1658} {"train_loss": -5.936870574951172, "global_step": 69661, "epoch": 1658} {"train_loss": -5.983933925628662, "global_step": 69662, "epoch": 1658} {"train_loss": -6.003757476806641, "global_step": 69663, "epoch": 1658} {"train_loss": -5.940812110900879, "global_step": 69664, "epoch": 1658} {"train_loss": -6.109949111938477, "global_step": 69665, "epoch": 1658} {"train_loss": -5.969145774841309, "global_step": 69666, "epoch": 1658} {"train_loss": -5.960013389587402, "global_step": 69667, "epoch": 1658} {"train_loss": -5.975034236907959, "global_step": 69668, "epoch": 1658} {"train_loss": -5.952125072479248, "global_step": 69669, "epoch": 1658} {"train_loss": -5.98728084564209, "global_step": 69670, "epoch": 1658} {"train_loss": -6.040270805358887, "global_step": 69671, "epoch": 1658} {"train_loss": -6.105172157287598, "global_step": 69672, "epoch": 1658} {"train_loss": -6.0454020500183105, "global_step": 69673, "epoch": 1658} {"train_loss": -6.024022102355957, "global_step": 69674, "epoch": 1658} {"train_loss": -6.108834266662598, "global_step": 69675, "epoch": 1658} {"train_loss": -6.119958877563477, "global_step": 69676, "epoch": 1658} {"train_loss": -6.014841601962135, "global_step": 69677, "epoch": 1658, "val_loss": 74844.5625} {"train_loss": -6.025519371032715, "global_step": 69678, "epoch": 1659} {"train_loss": -5.982540130615234, "global_step": 69679, "epoch": 1659} {"train_loss": -6.039800643920898, "global_step": 69680, "epoch": 1659} {"train_loss": -5.977606773376465, "global_step": 69681, "epoch": 1659} {"train_loss": -6.143922805786133, "global_step": 69682, "epoch": 1659} {"train_loss": -5.9676513671875, "global_step": 69683, "epoch": 1659} {"train_loss": -6.001220703125, "global_step": 69684, "epoch": 1659} {"train_loss": -6.0985846519470215, "global_step": 69685, "epoch": 1659} {"train_loss": -6.127991199493408, "global_step": 69686, "epoch": 1659} {"train_loss": -5.915870666503906, "global_step": 69687, "epoch": 1659} {"train_loss": -6.104990005493164, "global_step": 69688, "epoch": 1659} {"train_loss": -6.0067243576049805, "global_step": 69689, "epoch": 1659} {"train_loss": -5.955010414123535, "global_step": 69690, "epoch": 1659} {"train_loss": -6.005655288696289, "global_step": 69691, "epoch": 1659} {"train_loss": -5.985628128051758, "global_step": 69692, "epoch": 1659} {"train_loss": -6.046262264251709, "global_step": 69693, "epoch": 1659} {"train_loss": -6.035844326019287, "global_step": 69694, "epoch": 1659} {"train_loss": -5.918354511260986, "global_step": 69695, "epoch": 1659} {"train_loss": -6.009969711303711, "global_step": 69696, "epoch": 1659} {"train_loss": -5.976941108703613, "global_step": 69697, "epoch": 1659} {"train_loss": -5.89666748046875, "global_step": 69698, "epoch": 1659} {"train_loss": -6.037271022796631, "global_step": 69699, "epoch": 1659} {"train_loss": -6.0226945877075195, "global_step": 69700, "epoch": 1659} {"train_loss": -5.9600067138671875, "global_step": 69701, "epoch": 1659} {"train_loss": -6.029999732971191, "global_step": 69702, "epoch": 1659} {"train_loss": -5.885301113128662, "global_step": 69703, "epoch": 1659} {"train_loss": -5.968097686767578, "global_step": 69704, "epoch": 1659} {"train_loss": -6.023106575012207, "global_step": 69705, "epoch": 1659} {"train_loss": -5.970193862915039, "global_step": 69706, "epoch": 1659} {"train_loss": -6.0417280197143555, "global_step": 69707, "epoch": 1659} {"train_loss": -6.069756507873535, "global_step": 69708, "epoch": 1659} {"train_loss": -5.8932294845581055, "global_step": 69709, "epoch": 1659} {"train_loss": -6.1362223625183105, "global_step": 69710, "epoch": 1659} {"train_loss": -6.031850337982178, "global_step": 69711, "epoch": 1659} {"train_loss": -6.120421886444092, "global_step": 69712, "epoch": 1659} {"train_loss": -5.97583532333374, "global_step": 69713, "epoch": 1659} {"train_loss": -6.022251129150391, "global_step": 69714, "epoch": 1659} {"train_loss": -6.050619125366211, "global_step": 69715, "epoch": 1659} {"train_loss": -6.04503059387207, "global_step": 69716, "epoch": 1659} {"train_loss": -6.048689365386963, "global_step": 69717, "epoch": 1659} {"train_loss": -5.9746599197387695, "global_step": 69718, "epoch": 1659} {"train_loss": -6.011270057587397, "global_step": 69719, "epoch": 1659, "val_loss": 74856.46875} {"train_loss": -5.923436164855957, "global_step": 69720, "epoch": 1660} {"train_loss": -6.042498588562012, "global_step": 69721, "epoch": 1660} {"train_loss": -6.028295516967773, "global_step": 69722, "epoch": 1660} {"train_loss": -5.9928789138793945, "global_step": 69723, "epoch": 1660} {"train_loss": -6.024353504180908, "global_step": 69724, "epoch": 1660} {"train_loss": -5.998357772827148, "global_step": 69725, "epoch": 1660} {"train_loss": -6.095396995544434, "global_step": 69726, "epoch": 1660} {"train_loss": -6.014399528503418, "global_step": 69727, "epoch": 1660} {"train_loss": -5.980546474456787, "global_step": 69728, "epoch": 1660} {"train_loss": -5.983386039733887, "global_step": 69729, "epoch": 1660} {"train_loss": -5.95609712600708, "global_step": 69730, "epoch": 1660} {"train_loss": -6.020377159118652, "global_step": 69731, "epoch": 1660} {"train_loss": -5.874279022216797, "global_step": 69732, "epoch": 1660} {"train_loss": -5.99348783493042, "global_step": 69733, "epoch": 1660} {"train_loss": -5.925494194030762, "global_step": 69734, "epoch": 1660} {"train_loss": -5.957457542419434, "global_step": 69735, "epoch": 1660} {"train_loss": -6.014739990234375, "global_step": 69736, "epoch": 1660} {"train_loss": -6.008148193359375, "global_step": 69737, "epoch": 1660} {"train_loss": -5.998929977416992, "global_step": 69738, "epoch": 1660} {"train_loss": -6.06833028793335, "global_step": 69739, "epoch": 1660} {"train_loss": -6.109793186187744, "global_step": 69740, "epoch": 1660} {"train_loss": -6.0921478271484375, "global_step": 69741, "epoch": 1660} {"train_loss": -5.978180885314941, "global_step": 69742, "epoch": 1660} {"train_loss": -6.056309700012207, "global_step": 69743, "epoch": 1660} {"train_loss": -6.005737781524658, "global_step": 69744, "epoch": 1660} {"train_loss": -6.100131988525391, "global_step": 69745, "epoch": 1660} {"train_loss": -6.003734111785889, "global_step": 69746, "epoch": 1660} {"train_loss": -5.873910903930664, "global_step": 69747, "epoch": 1660} {"train_loss": -6.050929546356201, "global_step": 69748, "epoch": 1660} {"train_loss": -6.06188440322876, "global_step": 69749, "epoch": 1660} {"train_loss": -5.990609169006348, "global_step": 69750, "epoch": 1660} {"train_loss": -5.985835075378418, "global_step": 69751, "epoch": 1660} {"train_loss": -6.089178085327148, "global_step": 69752, "epoch": 1660} {"train_loss": -6.040753364562988, "global_step": 69753, "epoch": 1660} {"train_loss": -6.024177074432373, "global_step": 69754, "epoch": 1660} {"train_loss": -6.056046485900879, "global_step": 69755, "epoch": 1660} {"train_loss": -6.054896354675293, "global_step": 69756, "epoch": 1660} {"train_loss": -6.007984638214111, "global_step": 69757, "epoch": 1660} {"train_loss": -6.107391357421875, "global_step": 69758, "epoch": 1660} {"train_loss": -5.8311614990234375, "global_step": 69759, "epoch": 1660} {"train_loss": -6.0306782722473145, "global_step": 69760, "epoch": 1660} {"train_loss": -6.010812963758196, "global_step": 69761, "epoch": 1660, "val_loss": 74500.484375} {"train_loss": -5.976774215698242, "global_step": 69762, "epoch": 1661} {"train_loss": -5.8934102058410645, "global_step": 69763, "epoch": 1661} {"train_loss": -6.030917167663574, "global_step": 69764, "epoch": 1661} {"train_loss": -5.992321968078613, "global_step": 69765, "epoch": 1661} {"train_loss": -5.984871864318848, "global_step": 69766, "epoch": 1661} {"train_loss": -5.98569917678833, "global_step": 69767, "epoch": 1661} {"train_loss": -6.074132919311523, "global_step": 69768, "epoch": 1661} {"train_loss": -5.974884986877441, "global_step": 69769, "epoch": 1661} {"train_loss": -6.00898551940918, "global_step": 69770, "epoch": 1661} {"train_loss": -5.969659328460693, "global_step": 69771, "epoch": 1661} {"train_loss": -6.048617362976074, "global_step": 69772, "epoch": 1661} {"train_loss": -6.07463264465332, "global_step": 69773, "epoch": 1661} {"train_loss": -6.06416654586792, "global_step": 69774, "epoch": 1661} {"train_loss": -6.045136451721191, "global_step": 69775, "epoch": 1661} {"train_loss": -6.028027057647705, "global_step": 69776, "epoch": 1661} {"train_loss": -6.038065433502197, "global_step": 69777, "epoch": 1661} {"train_loss": -5.947408676147461, "global_step": 69778, "epoch": 1661} {"train_loss": -6.0805816650390625, "global_step": 69779, "epoch": 1661} {"train_loss": -6.125168800354004, "global_step": 69780, "epoch": 1661} {"train_loss": -6.085385322570801, "global_step": 69781, "epoch": 1661} {"train_loss": -5.966375350952148, "global_step": 69782, "epoch": 1661} {"train_loss": -6.036264419555664, "global_step": 69783, "epoch": 1661} {"train_loss": -6.014801025390625, "global_step": 69784, "epoch": 1661} {"train_loss": -6.0313005447387695, "global_step": 69785, "epoch": 1661} {"train_loss": -6.142856597900391, "global_step": 69786, "epoch": 1661} {"train_loss": -5.933437347412109, "global_step": 69787, "epoch": 1661} {"train_loss": -6.087392807006836, "global_step": 69788, "epoch": 1661} {"train_loss": -5.993307113647461, "global_step": 69789, "epoch": 1661} {"train_loss": -6.067707061767578, "global_step": 69790, "epoch": 1661} {"train_loss": -6.030094146728516, "global_step": 69791, "epoch": 1661} {"train_loss": -6.159482955932617, "global_step": 69792, "epoch": 1661} {"train_loss": -6.073773384094238, "global_step": 69793, "epoch": 1661} {"train_loss": -5.953993320465088, "global_step": 69794, "epoch": 1661} {"train_loss": -6.065194129943848, "global_step": 69795, "epoch": 1661} {"train_loss": -5.973688125610352, "global_step": 69796, "epoch": 1661} {"train_loss": -6.022558212280273, "global_step": 69797, "epoch": 1661} {"train_loss": -6.060171127319336, "global_step": 69798, "epoch": 1661} {"train_loss": -5.978018760681152, "global_step": 69799, "epoch": 1661} {"train_loss": -6.009237289428711, "global_step": 69800, "epoch": 1661} {"train_loss": -5.958745002746582, "global_step": 69801, "epoch": 1661} {"train_loss": -5.894924163818359, "global_step": 69802, "epoch": 1661} {"train_loss": -6.017876295816331, "global_step": 69803, "epoch": 1661, "val_loss": 74908.515625} {"train_loss": -5.90380859375, "global_step": 69804, "epoch": 1662} {"train_loss": -6.046132564544678, "global_step": 69805, "epoch": 1662} {"train_loss": -5.885641098022461, "global_step": 69806, "epoch": 1662} {"train_loss": -6.021206378936768, "global_step": 69807, "epoch": 1662} {"train_loss": -6.051673889160156, "global_step": 69808, "epoch": 1662} {"train_loss": -5.99296760559082, "global_step": 69809, "epoch": 1662} {"train_loss": -5.81942081451416, "global_step": 69810, "epoch": 1662} {"train_loss": -6.061005592346191, "global_step": 69811, "epoch": 1662} {"train_loss": -6.009793281555176, "global_step": 69812, "epoch": 1662} {"train_loss": -6.088143825531006, "global_step": 69813, "epoch": 1662} {"train_loss": -6.059531211853027, "global_step": 69814, "epoch": 1662} {"train_loss": -5.968469619750977, "global_step": 69815, "epoch": 1662} {"train_loss": -5.929042816162109, "global_step": 69816, "epoch": 1662} {"train_loss": -6.005141735076904, "global_step": 69817, "epoch": 1662} {"train_loss": -6.0724897384643555, "global_step": 69818, "epoch": 1662} {"train_loss": -5.889716148376465, "global_step": 69819, "epoch": 1662} {"train_loss": -6.053165435791016, "global_step": 69820, "epoch": 1662} {"train_loss": -6.097357749938965, "global_step": 69821, "epoch": 1662} {"train_loss": -6.086722373962402, "global_step": 69822, "epoch": 1662} {"train_loss": -6.106191635131836, "global_step": 69823, "epoch": 1662} {"train_loss": -5.997171878814697, "global_step": 69824, "epoch": 1662} {"train_loss": -6.0494704246521, "global_step": 69825, "epoch": 1662} {"train_loss": -6.037171363830566, "global_step": 69826, "epoch": 1662} {"train_loss": -5.974221706390381, "global_step": 69827, "epoch": 1662} {"train_loss": -5.990051746368408, "global_step": 69828, "epoch": 1662} {"train_loss": -5.998903751373291, "global_step": 69829, "epoch": 1662} {"train_loss": -6.125736713409424, "global_step": 69830, "epoch": 1662} {"train_loss": -6.052819728851318, "global_step": 69831, "epoch": 1662} {"train_loss": -5.998684883117676, "global_step": 69832, "epoch": 1662} {"train_loss": -5.954056262969971, "global_step": 69833, "epoch": 1662} {"train_loss": -5.986583709716797, "global_step": 69834, "epoch": 1662} {"train_loss": -5.961830139160156, "global_step": 69835, "epoch": 1662} {"train_loss": -5.915006160736084, "global_step": 69836, "epoch": 1662} {"train_loss": -6.078135013580322, "global_step": 69837, "epoch": 1662} {"train_loss": -5.967131614685059, "global_step": 69838, "epoch": 1662} {"train_loss": -5.987300872802734, "global_step": 69839, "epoch": 1662} {"train_loss": -5.997206687927246, "global_step": 69840, "epoch": 1662} {"train_loss": -5.97856330871582, "global_step": 69841, "epoch": 1662} {"train_loss": -5.996551990509033, "global_step": 69842, "epoch": 1662} {"train_loss": -6.004270553588867, "global_step": 69843, "epoch": 1662} {"train_loss": -6.031470775604248, "global_step": 69844, "epoch": 1662} {"train_loss": -6.006407896677653, "global_step": 69845, "epoch": 1662, "val_loss": 74555.78125} {"train_loss": -5.998064041137695, "global_step": 69846, "epoch": 1663} {"train_loss": -6.051183700561523, "global_step": 69847, "epoch": 1663} {"train_loss": -6.155632972717285, "global_step": 69848, "epoch": 1663} {"train_loss": -6.060971260070801, "global_step": 69849, "epoch": 1663} {"train_loss": -5.990623950958252, "global_step": 69850, "epoch": 1663} {"train_loss": -6.041691780090332, "global_step": 69851, "epoch": 1663} {"train_loss": -6.044229030609131, "global_step": 69852, "epoch": 1663} {"train_loss": -6.160487174987793, "global_step": 69853, "epoch": 1663} {"train_loss": -6.112470626831055, "global_step": 69854, "epoch": 1663} {"train_loss": -5.952902793884277, "global_step": 69855, "epoch": 1663} {"train_loss": -6.126172065734863, "global_step": 69856, "epoch": 1663} {"train_loss": -6.024568557739258, "global_step": 69857, "epoch": 1663} {"train_loss": -6.081567764282227, "global_step": 69858, "epoch": 1663} {"train_loss": -5.899492263793945, "global_step": 69859, "epoch": 1663} {"train_loss": -6.038889408111572, "global_step": 69860, "epoch": 1663} {"train_loss": -5.940264701843262, "global_step": 69861, "epoch": 1663} {"train_loss": -6.0326409339904785, "global_step": 69862, "epoch": 1663} {"train_loss": -6.027706623077393, "global_step": 69863, "epoch": 1663} {"train_loss": -6.136612892150879, "global_step": 69864, "epoch": 1663} {"train_loss": -5.9418416023254395, "global_step": 69865, "epoch": 1663} {"train_loss": -5.999571323394775, "global_step": 69866, "epoch": 1663} {"train_loss": -6.061794757843018, "global_step": 69867, "epoch": 1663} {"train_loss": -6.084033012390137, "global_step": 69868, "epoch": 1663} {"train_loss": -5.997637748718262, "global_step": 69869, "epoch": 1663} {"train_loss": -6.023435592651367, "global_step": 69870, "epoch": 1663} {"train_loss": -6.197772026062012, "global_step": 69871, "epoch": 1663} {"train_loss": -6.033888339996338, "global_step": 69872, "epoch": 1663} {"train_loss": -6.050712585449219, "global_step": 69873, "epoch": 1663} {"train_loss": -5.927966117858887, "global_step": 69874, "epoch": 1663} {"train_loss": -6.063725471496582, "global_step": 69875, "epoch": 1663} {"train_loss": -6.009632587432861, "global_step": 69876, "epoch": 1663} {"train_loss": -6.092471122741699, "global_step": 69877, "epoch": 1663} {"train_loss": -6.009963512420654, "global_step": 69878, "epoch": 1663} {"train_loss": -5.871076583862305, "global_step": 69879, "epoch": 1663} {"train_loss": -6.167031288146973, "global_step": 69880, "epoch": 1663} {"train_loss": -5.947641849517822, "global_step": 69881, "epoch": 1663} {"train_loss": -6.0530686378479, "global_step": 69882, "epoch": 1663} {"train_loss": -5.951611518859863, "global_step": 69883, "epoch": 1663} {"train_loss": -6.06960391998291, "global_step": 69884, "epoch": 1663} {"train_loss": -6.041321277618408, "global_step": 69885, "epoch": 1663} {"train_loss": -5.932695388793945, "global_step": 69886, "epoch": 1663} {"train_loss": -6.033473979859125, "global_step": 69887, "epoch": 1663, "val_loss": 74671.0390625} {"train_loss": -6.03616189956665, "global_step": 69888, "epoch": 1664} {"train_loss": -6.201688766479492, "global_step": 69889, "epoch": 1664} {"train_loss": -6.042008399963379, "global_step": 69890, "epoch": 1664} {"train_loss": -6.0645365715026855, "global_step": 69891, "epoch": 1664} {"train_loss": -6.000401020050049, "global_step": 69892, "epoch": 1664} {"train_loss": -5.961342811584473, "global_step": 69893, "epoch": 1664} {"train_loss": -5.99986457824707, "global_step": 69894, "epoch": 1664} {"train_loss": -5.952576637268066, "global_step": 69895, "epoch": 1664} {"train_loss": -5.858586311340332, "global_step": 69896, "epoch": 1664} {"train_loss": -6.020778656005859, "global_step": 69897, "epoch": 1664} {"train_loss": -6.001638889312744, "global_step": 69898, "epoch": 1664} {"train_loss": -5.9554548263549805, "global_step": 69899, "epoch": 1664} {"train_loss": -6.0013346672058105, "global_step": 69900, "epoch": 1664} {"train_loss": -5.903046131134033, "global_step": 69901, "epoch": 1664} {"train_loss": -5.988037586212158, "global_step": 69902, "epoch": 1664} {"train_loss": -6.028017044067383, "global_step": 69903, "epoch": 1664} {"train_loss": -5.896479606628418, "global_step": 69904, "epoch": 1664} {"train_loss": -6.024946212768555, "global_step": 69905, "epoch": 1664} {"train_loss": -5.9459228515625, "global_step": 69906, "epoch": 1664} {"train_loss": -6.0701422691345215, "global_step": 69907, "epoch": 1664} {"train_loss": -5.993622779846191, "global_step": 69908, "epoch": 1664} {"train_loss": -6.056558609008789, "global_step": 69909, "epoch": 1664} {"train_loss": -5.9918999671936035, "global_step": 69910, "epoch": 1664} {"train_loss": -5.990060806274414, "global_step": 69911, "epoch": 1664} {"train_loss": -6.119609832763672, "global_step": 69912, "epoch": 1664} {"train_loss": -6.054369926452637, "global_step": 69913, "epoch": 1664} {"train_loss": -6.021420478820801, "global_step": 69914, "epoch": 1664} {"train_loss": -5.982657432556152, "global_step": 69915, "epoch": 1664} {"train_loss": -6.078718185424805, "global_step": 69916, "epoch": 1664} {"train_loss": -6.021587371826172, "global_step": 69917, "epoch": 1664} {"train_loss": -6.008017539978027, "global_step": 69918, "epoch": 1664} {"train_loss": -5.972464561462402, "global_step": 69919, "epoch": 1664} {"train_loss": -5.886398792266846, "global_step": 69920, "epoch": 1664} {"train_loss": -6.071445941925049, "global_step": 69921, "epoch": 1664} {"train_loss": -6.012439250946045, "global_step": 69922, "epoch": 1664} {"train_loss": -5.977792739868164, "global_step": 69923, "epoch": 1664} {"train_loss": -6.0480451583862305, "global_step": 69924, "epoch": 1664} {"train_loss": -6.027828216552734, "global_step": 69925, "epoch": 1664} {"train_loss": -6.121144771575928, "global_step": 69926, "epoch": 1664} {"train_loss": -5.9987473487854, "global_step": 69927, "epoch": 1664} {"train_loss": -6.089415073394775, "global_step": 69928, "epoch": 1664} {"train_loss": -6.011078039805095, "global_step": 69929, "epoch": 1664, "val_loss": 74905.0859375} {"train_loss": -5.957089424133301, "global_step": 69930, "epoch": 1665} {"train_loss": -6.068883419036865, "global_step": 69931, "epoch": 1665} {"train_loss": -6.152604103088379, "global_step": 69932, "epoch": 1665} {"train_loss": -5.98824405670166, "global_step": 69933, "epoch": 1665} {"train_loss": -6.0442728996276855, "global_step": 69934, "epoch": 1665} {"train_loss": -6.066808700561523, "global_step": 69935, "epoch": 1665} {"train_loss": -6.067061424255371, "global_step": 69936, "epoch": 1665} {"train_loss": -5.939913749694824, "global_step": 69937, "epoch": 1665} {"train_loss": -6.013266563415527, "global_step": 69938, "epoch": 1665} {"train_loss": -6.102740287780762, "global_step": 69939, "epoch": 1665} {"train_loss": -5.994353771209717, "global_step": 69940, "epoch": 1665} {"train_loss": -6.096096038818359, "global_step": 69941, "epoch": 1665} {"train_loss": -5.939967155456543, "global_step": 69942, "epoch": 1665} {"train_loss": -5.9387359619140625, "global_step": 69943, "epoch": 1665} {"train_loss": -6.128659248352051, "global_step": 69944, "epoch": 1665} {"train_loss": -6.005495071411133, "global_step": 69945, "epoch": 1665} {"train_loss": -5.921391010284424, "global_step": 69946, "epoch": 1665} {"train_loss": -6.049008369445801, "global_step": 69947, "epoch": 1665} {"train_loss": -6.0538740158081055, "global_step": 69948, "epoch": 1665} {"train_loss": -6.078686714172363, "global_step": 69949, "epoch": 1665} {"train_loss": -6.0810675621032715, "global_step": 69950, "epoch": 1665} {"train_loss": -6.0724992752075195, "global_step": 69951, "epoch": 1665} {"train_loss": -6.008017539978027, "global_step": 69952, "epoch": 1665} {"train_loss": -5.999969482421875, "global_step": 69953, "epoch": 1665} {"train_loss": -6.015885353088379, "global_step": 69954, "epoch": 1665} {"train_loss": -6.068233489990234, "global_step": 69955, "epoch": 1665} {"train_loss": -6.0594353675842285, "global_step": 69956, "epoch": 1665} {"train_loss": -6.159419059753418, "global_step": 69957, "epoch": 1665} {"train_loss": -5.948625564575195, "global_step": 69958, "epoch": 1665} {"train_loss": -6.100253582000732, "global_step": 69959, "epoch": 1665} {"train_loss": -6.0370378494262695, "global_step": 69960, "epoch": 1665} {"train_loss": -5.987780570983887, "global_step": 69961, "epoch": 1665} {"train_loss": -6.036530017852783, "global_step": 69962, "epoch": 1665} {"train_loss": -6.072346210479736, "global_step": 69963, "epoch": 1665} {"train_loss": -6.009150505065918, "global_step": 69964, "epoch": 1665} {"train_loss": -5.949362754821777, "global_step": 69965, "epoch": 1665} {"train_loss": -6.138004302978516, "global_step": 69966, "epoch": 1665} {"train_loss": -6.015764236450195, "global_step": 69967, "epoch": 1665} {"train_loss": -6.048260688781738, "global_step": 69968, "epoch": 1665} {"train_loss": -6.032781600952148, "global_step": 69969, "epoch": 1665} {"train_loss": -5.918397903442383, "global_step": 69970, "epoch": 1665} {"train_loss": -6.0320033345903665, "global_step": 69971, "epoch": 1665, "val_loss": 74721.5859375} {"train_loss": -6.055748462677002, "global_step": 69972, "epoch": 1666} {"train_loss": -5.946637153625488, "global_step": 69973, "epoch": 1666} {"train_loss": -6.0418701171875, "global_step": 69974, "epoch": 1666} {"train_loss": -6.137689590454102, "global_step": 69975, "epoch": 1666} {"train_loss": -6.01213264465332, "global_step": 69976, "epoch": 1666} {"train_loss": -5.89305305480957, "global_step": 69977, "epoch": 1666} {"train_loss": -5.941144943237305, "global_step": 69978, "epoch": 1666} {"train_loss": -5.941705703735352, "global_step": 69979, "epoch": 1666} {"train_loss": -5.966485977172852, "global_step": 69980, "epoch": 1666} {"train_loss": -5.9802422523498535, "global_step": 69981, "epoch": 1666} {"train_loss": -6.084133148193359, "global_step": 69982, "epoch": 1666} {"train_loss": -5.952932357788086, "global_step": 69983, "epoch": 1666} {"train_loss": -5.934449195861816, "global_step": 69984, "epoch": 1666} {"train_loss": -6.080652713775635, "global_step": 69985, "epoch": 1666} {"train_loss": -5.948240280151367, "global_step": 69986, "epoch": 1666} {"train_loss": -6.009494781494141, "global_step": 69987, "epoch": 1666} {"train_loss": -5.917843818664551, "global_step": 69988, "epoch": 1666} {"train_loss": -5.969123840332031, "global_step": 69989, "epoch": 1666} {"train_loss": -6.081275939941406, "global_step": 69990, "epoch": 1666} {"train_loss": -5.855413913726807, "global_step": 69991, "epoch": 1666} {"train_loss": -5.969099998474121, "global_step": 69992, "epoch": 1666} {"train_loss": -5.9086503982543945, "global_step": 69993, "epoch": 1666} {"train_loss": -5.889621734619141, "global_step": 69994, "epoch": 1666} {"train_loss": -6.015676498413086, "global_step": 69995, "epoch": 1666} {"train_loss": -5.982873439788818, "global_step": 69996, "epoch": 1666} {"train_loss": -5.942531585693359, "global_step": 69997, "epoch": 1666} {"train_loss": -5.984389781951904, "global_step": 69998, "epoch": 1666} {"train_loss": -5.958371639251709, "global_step": 69999, "epoch": 1666} {"train_loss": -6.0303192138671875, "global_step": 70000, "epoch": 1666} {"train_loss": -5.976798057556152, "global_step": 70001, "epoch": 1666} {"train_loss": -5.91961669921875, "global_step": 70002, "epoch": 1666} {"train_loss": -6.066910266876221, "global_step": 70003, "epoch": 1666} {"train_loss": -6.052333831787109, "global_step": 70004, "epoch": 1666} {"train_loss": -5.992284774780273, "global_step": 70005, "epoch": 1666} {"train_loss": -6.100623607635498, "global_step": 70006, "epoch": 1666} {"train_loss": -6.0473809242248535, "global_step": 70007, "epoch": 1666} {"train_loss": -6.009650230407715, "global_step": 70008, "epoch": 1666} {"train_loss": -6.059170246124268, "global_step": 70009, "epoch": 1666} {"train_loss": -6.075730800628662, "global_step": 70010, "epoch": 1666} {"train_loss": -6.090685844421387, "global_step": 70011, "epoch": 1666} {"train_loss": -6.045671463012695, "global_step": 70012, "epoch": 1666} {"train_loss": -5.9930909134092785, "global_step": 70013, "epoch": 1666, "val_loss": 74790.2578125} {"train_loss": -6.113656997680664, "global_step": 70014, "epoch": 1667} {"train_loss": -6.178979873657227, "global_step": 70015, "epoch": 1667} {"train_loss": -6.067480087280273, "global_step": 70016, "epoch": 1667} {"train_loss": -6.055823802947998, "global_step": 70017, "epoch": 1667} {"train_loss": -5.999611854553223, "global_step": 70018, "epoch": 1667} {"train_loss": -6.035153388977051, "global_step": 70019, "epoch": 1667} {"train_loss": -6.0232439041137695, "global_step": 70020, "epoch": 1667} {"train_loss": -6.004990577697754, "global_step": 70021, "epoch": 1667} {"train_loss": -6.1251606941223145, "global_step": 70022, "epoch": 1667} {"train_loss": -5.935530662536621, "global_step": 70023, "epoch": 1667} {"train_loss": -5.902958869934082, "global_step": 70024, "epoch": 1667} {"train_loss": -6.005387306213379, "global_step": 70025, "epoch": 1667} {"train_loss": -5.964681625366211, "global_step": 70026, "epoch": 1667} {"train_loss": -6.000231742858887, "global_step": 70027, "epoch": 1667} {"train_loss": -6.053713798522949, "global_step": 70028, "epoch": 1667} {"train_loss": -6.012843132019043, "global_step": 70029, "epoch": 1667} {"train_loss": -5.971715927124023, "global_step": 70030, "epoch": 1667} {"train_loss": -5.970967769622803, "global_step": 70031, "epoch": 1667} {"train_loss": -6.008253574371338, "global_step": 70032, "epoch": 1667} {"train_loss": -5.98848819732666, "global_step": 70033, "epoch": 1667} {"train_loss": -5.944230079650879, "global_step": 70034, "epoch": 1667} {"train_loss": -5.9327192306518555, "global_step": 70035, "epoch": 1667} {"train_loss": -6.05239200592041, "global_step": 70036, "epoch": 1667} {"train_loss": -5.894033432006836, "global_step": 70037, "epoch": 1667} {"train_loss": -6.030881881713867, "global_step": 70038, "epoch": 1667} {"train_loss": -6.097425937652588, "global_step": 70039, "epoch": 1667} {"train_loss": -6.040775299072266, "global_step": 70040, "epoch": 1667} {"train_loss": -5.942838668823242, "global_step": 70041, "epoch": 1667} {"train_loss": -5.995724678039551, "global_step": 70042, "epoch": 1667} {"train_loss": -5.9805731773376465, "global_step": 70043, "epoch": 1667} {"train_loss": -6.020820140838623, "global_step": 70044, "epoch": 1667} {"train_loss": -6.010361194610596, "global_step": 70045, "epoch": 1667} {"train_loss": -6.052208423614502, "global_step": 70046, "epoch": 1667} {"train_loss": -6.074470043182373, "global_step": 70047, "epoch": 1667} {"train_loss": -6.049104690551758, "global_step": 70048, "epoch": 1667} {"train_loss": -6.046356678009033, "global_step": 70049, "epoch": 1667} {"train_loss": -6.056828498840332, "global_step": 70050, "epoch": 1667} {"train_loss": -6.072664260864258, "global_step": 70051, "epoch": 1667} {"train_loss": -5.879188537597656, "global_step": 70052, "epoch": 1667} {"train_loss": -6.052360534667969, "global_step": 70053, "epoch": 1667} {"train_loss": -5.958572864532471, "global_step": 70054, "epoch": 1667} {"train_loss": -6.0133955251602895, "global_step": 70055, "epoch": 1667, "val_loss": 74923.390625} {"train_loss": -5.86897087097168, "global_step": 70056, "epoch": 1668} {"train_loss": -6.0503973960876465, "global_step": 70057, "epoch": 1668} {"train_loss": -5.90226411819458, "global_step": 70058, "epoch": 1668} {"train_loss": -6.012213706970215, "global_step": 70059, "epoch": 1668} {"train_loss": -5.811751365661621, "global_step": 70060, "epoch": 1668} {"train_loss": -5.953276634216309, "global_step": 70061, "epoch": 1668} {"train_loss": -5.840810775756836, "global_step": 70062, "epoch": 1668} {"train_loss": -6.011247158050537, "global_step": 70063, "epoch": 1668} {"train_loss": -6.068614482879639, "global_step": 70064, "epoch": 1668} {"train_loss": -5.889230728149414, "global_step": 70065, "epoch": 1668} {"train_loss": -5.930880546569824, "global_step": 70066, "epoch": 1668} {"train_loss": -5.962924957275391, "global_step": 70067, "epoch": 1668} {"train_loss": -5.973705768585205, "global_step": 70068, "epoch": 1668} {"train_loss": -5.8312273025512695, "global_step": 70069, "epoch": 1668} {"train_loss": -5.900970458984375, "global_step": 70070, "epoch": 1668} {"train_loss": -5.799970626831055, "global_step": 70071, "epoch": 1668} {"train_loss": -5.931186676025391, "global_step": 70072, "epoch": 1668} {"train_loss": -5.842915058135986, "global_step": 70073, "epoch": 1668} {"train_loss": -5.913418292999268, "global_step": 70074, "epoch": 1668} {"train_loss": -5.906680583953857, "global_step": 70075, "epoch": 1668} {"train_loss": -6.027663230895996, "global_step": 70076, "epoch": 1668} {"train_loss": -6.010122299194336, "global_step": 70077, "epoch": 1668} {"train_loss": -5.879611015319824, "global_step": 70078, "epoch": 1668} {"train_loss": -5.926387786865234, "global_step": 70079, "epoch": 1668} {"train_loss": -5.915350914001465, "global_step": 70080, "epoch": 1668} {"train_loss": -5.937084197998047, "global_step": 70081, "epoch": 1668} {"train_loss": -5.9067583084106445, "global_step": 70082, "epoch": 1668} {"train_loss": -6.061417102813721, "global_step": 70083, "epoch": 1668} {"train_loss": -5.97584342956543, "global_step": 70084, "epoch": 1668} {"train_loss": -5.892787456512451, "global_step": 70085, "epoch": 1668} {"train_loss": -6.03377103805542, "global_step": 70086, "epoch": 1668} {"train_loss": -5.930476188659668, "global_step": 70087, "epoch": 1668} {"train_loss": -6.080843925476074, "global_step": 70088, "epoch": 1668} {"train_loss": -6.045177459716797, "global_step": 70089, "epoch": 1668} {"train_loss": -6.033629894256592, "global_step": 70090, "epoch": 1668} {"train_loss": -6.04664421081543, "global_step": 70091, "epoch": 1668} {"train_loss": -5.999886512756348, "global_step": 70092, "epoch": 1668} {"train_loss": -6.032104969024658, "global_step": 70093, "epoch": 1668} {"train_loss": -5.834430694580078, "global_step": 70094, "epoch": 1668} {"train_loss": -5.981245994567871, "global_step": 70095, "epoch": 1668} {"train_loss": -5.934222221374512, "global_step": 70096, "epoch": 1668} {"train_loss": -5.944617033004761, "global_step": 70097, "epoch": 1668, "val_loss": 74623.15625} {"train_loss": -6.105813026428223, "global_step": 70098, "epoch": 1669} {"train_loss": -5.954782485961914, "global_step": 70099, "epoch": 1669} {"train_loss": -5.886255741119385, "global_step": 70100, "epoch": 1669} {"train_loss": -6.026496410369873, "global_step": 70101, "epoch": 1669} {"train_loss": -5.910987854003906, "global_step": 70102, "epoch": 1669} {"train_loss": -5.967125415802002, "global_step": 70103, "epoch": 1669} {"train_loss": -5.922521591186523, "global_step": 70104, "epoch": 1669} {"train_loss": -5.926784515380859, "global_step": 70105, "epoch": 1669} {"train_loss": -6.086012840270996, "global_step": 70106, "epoch": 1669} {"train_loss": -6.014039993286133, "global_step": 70107, "epoch": 1669} {"train_loss": -6.096073150634766, "global_step": 70108, "epoch": 1669} {"train_loss": -6.044033050537109, "global_step": 70109, "epoch": 1669} {"train_loss": -6.097939491271973, "global_step": 70110, "epoch": 1669} {"train_loss": -5.959926128387451, "global_step": 70111, "epoch": 1669} {"train_loss": -6.014734745025635, "global_step": 70112, "epoch": 1669} {"train_loss": -6.121980667114258, "global_step": 70113, "epoch": 1669} {"train_loss": -6.102975368499756, "global_step": 70114, "epoch": 1669} {"train_loss": -6.076362609863281, "global_step": 70115, "epoch": 1669} {"train_loss": -5.9595255851745605, "global_step": 70116, "epoch": 1669} {"train_loss": -6.044151782989502, "global_step": 70117, "epoch": 1669} {"train_loss": -5.958433151245117, "global_step": 70118, "epoch": 1669} {"train_loss": -6.107724666595459, "global_step": 70119, "epoch": 1669} {"train_loss": -5.955503940582275, "global_step": 70120, "epoch": 1669} {"train_loss": -5.995517730712891, "global_step": 70121, "epoch": 1669} {"train_loss": -6.11543083190918, "global_step": 70122, "epoch": 1669} {"train_loss": -5.969643592834473, "global_step": 70123, "epoch": 1669} {"train_loss": -6.042067527770996, "global_step": 70124, "epoch": 1669} {"train_loss": -6.059199333190918, "global_step": 70125, "epoch": 1669} {"train_loss": -6.027496337890625, "global_step": 70126, "epoch": 1669} {"train_loss": -6.093097686767578, "global_step": 70127, "epoch": 1669} {"train_loss": -6.04137659072876, "global_step": 70128, "epoch": 1669} {"train_loss": -5.974729537963867, "global_step": 70129, "epoch": 1669} {"train_loss": -6.079266548156738, "global_step": 70130, "epoch": 1669} {"train_loss": -5.989625453948975, "global_step": 70131, "epoch": 1669} {"train_loss": -5.9199371337890625, "global_step": 70132, "epoch": 1669} {"train_loss": -5.967989921569824, "global_step": 70133, "epoch": 1669} {"train_loss": -6.071112632751465, "global_step": 70134, "epoch": 1669} {"train_loss": -5.886013984680176, "global_step": 70135, "epoch": 1669} {"train_loss": -5.978425979614258, "global_step": 70136, "epoch": 1669} {"train_loss": -5.97165584564209, "global_step": 70137, "epoch": 1669} {"train_loss": -5.926078796386719, "global_step": 70138, "epoch": 1669} {"train_loss": -6.010208391007923, "global_step": 70139, "epoch": 1669, "val_loss": 74868.90625} {"train_loss": -6.07718563079834, "global_step": 70140, "epoch": 1670} {"train_loss": -5.853046417236328, "global_step": 70141, "epoch": 1670} {"train_loss": -5.8989386558532715, "global_step": 70142, "epoch": 1670} {"train_loss": -6.01099967956543, "global_step": 70143, "epoch": 1670} {"train_loss": -6.11428165435791, "global_step": 70144, "epoch": 1670} {"train_loss": -6.039429664611816, "global_step": 70145, "epoch": 1670} {"train_loss": -5.966259956359863, "global_step": 70146, "epoch": 1670} {"train_loss": -6.061585903167725, "global_step": 70147, "epoch": 1670} {"train_loss": -5.9803009033203125, "global_step": 70148, "epoch": 1670} {"train_loss": -5.957991600036621, "global_step": 70149, "epoch": 1670} {"train_loss": -5.918618202209473, "global_step": 70150, "epoch": 1670} {"train_loss": -6.112274169921875, "global_step": 70151, "epoch": 1670} {"train_loss": -5.996452331542969, "global_step": 70152, "epoch": 1670} {"train_loss": -6.053432941436768, "global_step": 70153, "epoch": 1670} {"train_loss": -6.079001426696777, "global_step": 70154, "epoch": 1670} {"train_loss": -6.037715435028076, "global_step": 70155, "epoch": 1670} {"train_loss": -6.000065803527832, "global_step": 70156, "epoch": 1670} {"train_loss": -5.896961212158203, "global_step": 70157, "epoch": 1670} {"train_loss": -6.011777877807617, "global_step": 70158, "epoch": 1670} {"train_loss": -6.081856727600098, "global_step": 70159, "epoch": 1670} {"train_loss": -6.146091461181641, "global_step": 70160, "epoch": 1670} {"train_loss": -6.031922340393066, "global_step": 70161, "epoch": 1670} {"train_loss": -5.916372299194336, "global_step": 70162, "epoch": 1670} {"train_loss": -6.122947692871094, "global_step": 70163, "epoch": 1670} {"train_loss": -6.145837783813477, "global_step": 70164, "epoch": 1670} {"train_loss": -5.969852924346924, "global_step": 70165, "epoch": 1670} {"train_loss": -5.988142013549805, "global_step": 70166, "epoch": 1670} {"train_loss": -6.068390369415283, "global_step": 70167, "epoch": 1670} {"train_loss": -5.922381401062012, "global_step": 70168, "epoch": 1670} {"train_loss": -6.025345802307129, "global_step": 70169, "epoch": 1670} {"train_loss": -5.9682393074035645, "global_step": 70170, "epoch": 1670} {"train_loss": -5.993401527404785, "global_step": 70171, "epoch": 1670} {"train_loss": -6.050976276397705, "global_step": 70172, "epoch": 1670} {"train_loss": -6.073218822479248, "global_step": 70173, "epoch": 1670} {"train_loss": -5.978793144226074, "global_step": 70174, "epoch": 1670} {"train_loss": -5.964686393737793, "global_step": 70175, "epoch": 1670} {"train_loss": -5.964197158813477, "global_step": 70176, "epoch": 1670} {"train_loss": -5.915699481964111, "global_step": 70177, "epoch": 1670} {"train_loss": -5.960940361022949, "global_step": 70178, "epoch": 1670} {"train_loss": -6.054319381713867, "global_step": 70179, "epoch": 1670} {"train_loss": -6.01982307434082, "global_step": 70180, "epoch": 1670} {"train_loss": -6.0101400670551115, "global_step": 70181, "epoch": 1670, "val_loss": 74963.28125} {"train_loss": -6.018732070922852, "global_step": 70182, "epoch": 1671} {"train_loss": -6.052167892456055, "global_step": 70183, "epoch": 1671} {"train_loss": -5.982488632202148, "global_step": 70184, "epoch": 1671} {"train_loss": -5.864931106567383, "global_step": 70185, "epoch": 1671} {"train_loss": -5.873447418212891, "global_step": 70186, "epoch": 1671} {"train_loss": -5.898315906524658, "global_step": 70187, "epoch": 1671} {"train_loss": -5.885345458984375, "global_step": 70188, "epoch": 1671} {"train_loss": -5.926804065704346, "global_step": 70189, "epoch": 1671} {"train_loss": -5.987037658691406, "global_step": 70190, "epoch": 1671} {"train_loss": -6.041487693786621, "global_step": 70191, "epoch": 1671} {"train_loss": -5.882201194763184, "global_step": 70192, "epoch": 1671} {"train_loss": -6.053689002990723, "global_step": 70193, "epoch": 1671} {"train_loss": -6.028545379638672, "global_step": 70194, "epoch": 1671} {"train_loss": -6.020754814147949, "global_step": 70195, "epoch": 1671} {"train_loss": -5.972127437591553, "global_step": 70196, "epoch": 1671} {"train_loss": -6.045132637023926, "global_step": 70197, "epoch": 1671} {"train_loss": -6.0023956298828125, "global_step": 70198, "epoch": 1671} {"train_loss": -5.8770904541015625, "global_step": 70199, "epoch": 1671} {"train_loss": -6.066040992736816, "global_step": 70200, "epoch": 1671} {"train_loss": -5.944846153259277, "global_step": 70201, "epoch": 1671} {"train_loss": -5.972387790679932, "global_step": 70202, "epoch": 1671} {"train_loss": -5.934597969055176, "global_step": 70203, "epoch": 1671} {"train_loss": -5.947014808654785, "global_step": 70204, "epoch": 1671} {"train_loss": -6.000538349151611, "global_step": 70205, "epoch": 1671} {"train_loss": -5.9527506828308105, "global_step": 70206, "epoch": 1671} {"train_loss": -6.0428242683410645, "global_step": 70207, "epoch": 1671} {"train_loss": -5.923224449157715, "global_step": 70208, "epoch": 1671} {"train_loss": -6.036932945251465, "global_step": 70209, "epoch": 1671} {"train_loss": -5.960714340209961, "global_step": 70210, "epoch": 1671} {"train_loss": -6.002599716186523, "global_step": 70211, "epoch": 1671} {"train_loss": -5.9803466796875, "global_step": 70212, "epoch": 1671} {"train_loss": -6.051095485687256, "global_step": 70213, "epoch": 1671} {"train_loss": -5.990817070007324, "global_step": 70214, "epoch": 1671} {"train_loss": -6.0760345458984375, "global_step": 70215, "epoch": 1671} {"train_loss": -6.111408233642578, "global_step": 70216, "epoch": 1671} {"train_loss": -5.919800758361816, "global_step": 70217, "epoch": 1671} {"train_loss": -6.040149688720703, "global_step": 70218, "epoch": 1671} {"train_loss": -6.076992511749268, "global_step": 70219, "epoch": 1671} {"train_loss": -5.9997429847717285, "global_step": 70220, "epoch": 1671} {"train_loss": -6.059609413146973, "global_step": 70221, "epoch": 1671} {"train_loss": -6.085344314575195, "global_step": 70222, "epoch": 1671} {"train_loss": -5.9895521232060025, "global_step": 70223, "epoch": 1671, "val_loss": 74716.4921875} {"train_loss": -6.073663711547852, "global_step": 70224, "epoch": 1672} {"train_loss": -5.972607612609863, "global_step": 70225, "epoch": 1672} {"train_loss": -6.022411346435547, "global_step": 70226, "epoch": 1672} {"train_loss": -5.940834045410156, "global_step": 70227, "epoch": 1672} {"train_loss": -6.08449649810791, "global_step": 70228, "epoch": 1672} {"train_loss": -6.021762847900391, "global_step": 70229, "epoch": 1672} {"train_loss": -6.090599060058594, "global_step": 70230, "epoch": 1672} {"train_loss": -6.027037620544434, "global_step": 70231, "epoch": 1672} {"train_loss": -6.079204559326172, "global_step": 70232, "epoch": 1672} {"train_loss": -6.038278579711914, "global_step": 70233, "epoch": 1672} {"train_loss": -5.9771318435668945, "global_step": 70234, "epoch": 1672} {"train_loss": -6.0060811042785645, "global_step": 70235, "epoch": 1672} {"train_loss": -6.0745849609375, "global_step": 70236, "epoch": 1672} {"train_loss": -5.953273773193359, "global_step": 70237, "epoch": 1672} {"train_loss": -5.95850133895874, "global_step": 70238, "epoch": 1672} {"train_loss": -6.066155433654785, "global_step": 70239, "epoch": 1672} {"train_loss": -6.014101028442383, "global_step": 70240, "epoch": 1672} {"train_loss": -6.050987720489502, "global_step": 70241, "epoch": 1672} {"train_loss": -5.927244186401367, "global_step": 70242, "epoch": 1672} {"train_loss": -6.00998592376709, "global_step": 70243, "epoch": 1672} {"train_loss": -6.09207820892334, "global_step": 70244, "epoch": 1672} {"train_loss": -6.06160831451416, "global_step": 70245, "epoch": 1672} {"train_loss": -6.043673515319824, "global_step": 70246, "epoch": 1672} {"train_loss": -6.066929817199707, "global_step": 70247, "epoch": 1672} {"train_loss": -5.980067253112793, "global_step": 70248, "epoch": 1672} {"train_loss": -5.928885459899902, "global_step": 70249, "epoch": 1672} {"train_loss": -5.9751739501953125, "global_step": 70250, "epoch": 1672} {"train_loss": -6.000672340393066, "global_step": 70251, "epoch": 1672} {"train_loss": -6.022423267364502, "global_step": 70252, "epoch": 1672} {"train_loss": -6.108979225158691, "global_step": 70253, "epoch": 1672} {"train_loss": -6.062924385070801, "global_step": 70254, "epoch": 1672} {"train_loss": -6.041471481323242, "global_step": 70255, "epoch": 1672} {"train_loss": -6.1073102951049805, "global_step": 70256, "epoch": 1672} {"train_loss": -5.975734710693359, "global_step": 70257, "epoch": 1672} {"train_loss": -6.066558837890625, "global_step": 70258, "epoch": 1672} {"train_loss": -6.0262131690979, "global_step": 70259, "epoch": 1672} {"train_loss": -6.136788368225098, "global_step": 70260, "epoch": 1672} {"train_loss": -6.008622169494629, "global_step": 70261, "epoch": 1672} {"train_loss": -5.963543891906738, "global_step": 70262, "epoch": 1672} {"train_loss": -6.145577430725098, "global_step": 70263, "epoch": 1672} {"train_loss": -6.021142959594727, "global_step": 70264, "epoch": 1672} {"train_loss": -6.0307140577407115, "global_step": 70265, "epoch": 1672, "val_loss": 74914.4765625} {"train_loss": -6.084616661071777, "global_step": 70266, "epoch": 1673} {"train_loss": -6.086951732635498, "global_step": 70267, "epoch": 1673} {"train_loss": -6.052188396453857, "global_step": 70268, "epoch": 1673} {"train_loss": -6.0831170082092285, "global_step": 70269, "epoch": 1673} {"train_loss": -5.937500476837158, "global_step": 70270, "epoch": 1673} {"train_loss": -6.05136251449585, "global_step": 70271, "epoch": 1673} {"train_loss": -5.936235427856445, "global_step": 70272, "epoch": 1673} {"train_loss": -5.81748104095459, "global_step": 70273, "epoch": 1673} {"train_loss": -6.016750335693359, "global_step": 70274, "epoch": 1673} {"train_loss": -5.908989429473877, "global_step": 70275, "epoch": 1673} {"train_loss": -6.07694149017334, "global_step": 70276, "epoch": 1673} {"train_loss": -6.078330039978027, "global_step": 70277, "epoch": 1673} {"train_loss": -6.103302001953125, "global_step": 70278, "epoch": 1673} {"train_loss": -6.081545829772949, "global_step": 70279, "epoch": 1673} {"train_loss": -5.963469505310059, "global_step": 70280, "epoch": 1673} {"train_loss": -6.104609489440918, "global_step": 70281, "epoch": 1673} {"train_loss": -6.089552879333496, "global_step": 70282, "epoch": 1673} {"train_loss": -6.102953910827637, "global_step": 70283, "epoch": 1673} {"train_loss": -6.080936908721924, "global_step": 70284, "epoch": 1673} {"train_loss": -6.075716018676758, "global_step": 70285, "epoch": 1673} {"train_loss": -5.9147491455078125, "global_step": 70286, "epoch": 1673} {"train_loss": -6.025009632110596, "global_step": 70287, "epoch": 1673} {"train_loss": -6.020307540893555, "global_step": 70288, "epoch": 1673} {"train_loss": -6.099255084991455, "global_step": 70289, "epoch": 1673} {"train_loss": -6.052995681762695, "global_step": 70290, "epoch": 1673} {"train_loss": -5.994994163513184, "global_step": 70291, "epoch": 1673} {"train_loss": -6.03835391998291, "global_step": 70292, "epoch": 1673} {"train_loss": -6.028655052185059, "global_step": 70293, "epoch": 1673} {"train_loss": -6.126870155334473, "global_step": 70294, "epoch": 1673} {"train_loss": -6.000933647155762, "global_step": 70295, "epoch": 1673} {"train_loss": -5.989434242248535, "global_step": 70296, "epoch": 1673} {"train_loss": -5.961007118225098, "global_step": 70297, "epoch": 1673} {"train_loss": -6.082148551940918, "global_step": 70298, "epoch": 1673} {"train_loss": -5.988254547119141, "global_step": 70299, "epoch": 1673} {"train_loss": -6.015596866607666, "global_step": 70300, "epoch": 1673} {"train_loss": -6.097400665283203, "global_step": 70301, "epoch": 1673} {"train_loss": -6.0704145431518555, "global_step": 70302, "epoch": 1673} {"train_loss": -6.1145830154418945, "global_step": 70303, "epoch": 1673} {"train_loss": -5.985243797302246, "global_step": 70304, "epoch": 1673} {"train_loss": -6.107515811920166, "global_step": 70305, "epoch": 1673} {"train_loss": -6.067480087280273, "global_step": 70306, "epoch": 1673} {"train_loss": -6.035305681682768, "global_step": 70307, "epoch": 1673, "val_loss": 74686.03125} {"train_loss": -6.124492645263672, "global_step": 70308, "epoch": 1674} {"train_loss": -6.066161155700684, "global_step": 70309, "epoch": 1674} {"train_loss": -6.04146671295166, "global_step": 70310, "epoch": 1674} {"train_loss": -6.064540863037109, "global_step": 70311, "epoch": 1674} {"train_loss": -6.028725624084473, "global_step": 70312, "epoch": 1674} {"train_loss": -6.007828712463379, "global_step": 70313, "epoch": 1674} {"train_loss": -6.068479537963867, "global_step": 70314, "epoch": 1674} {"train_loss": -5.892653465270996, "global_step": 70315, "epoch": 1674} {"train_loss": -5.994080543518066, "global_step": 70316, "epoch": 1674} {"train_loss": -5.9670610427856445, "global_step": 70317, "epoch": 1674} {"train_loss": -6.008327484130859, "global_step": 70318, "epoch": 1674} {"train_loss": -6.0361833572387695, "global_step": 70319, "epoch": 1674} {"train_loss": -6.026615142822266, "global_step": 70320, "epoch": 1674} {"train_loss": -5.978188514709473, "global_step": 70321, "epoch": 1674} {"train_loss": -6.117327690124512, "global_step": 70322, "epoch": 1674} {"train_loss": -5.894661903381348, "global_step": 70323, "epoch": 1674} {"train_loss": -6.092307090759277, "global_step": 70324, "epoch": 1674} {"train_loss": -6.050858974456787, "global_step": 70325, "epoch": 1674} {"train_loss": -6.048737049102783, "global_step": 70326, "epoch": 1674} {"train_loss": -6.028369426727295, "global_step": 70327, "epoch": 1674} {"train_loss": -6.0031633377075195, "global_step": 70328, "epoch": 1674} {"train_loss": -5.973045349121094, "global_step": 70329, "epoch": 1674} {"train_loss": -6.04794454574585, "global_step": 70330, "epoch": 1674} {"train_loss": -5.937949180603027, "global_step": 70331, "epoch": 1674} {"train_loss": -5.927979946136475, "global_step": 70332, "epoch": 1674} {"train_loss": -5.959294319152832, "global_step": 70333, "epoch": 1674} {"train_loss": -6.120805740356445, "global_step": 70334, "epoch": 1674} {"train_loss": -6.059323310852051, "global_step": 70335, "epoch": 1674} {"train_loss": -5.982653617858887, "global_step": 70336, "epoch": 1674} {"train_loss": -5.967824459075928, "global_step": 70337, "epoch": 1674} {"train_loss": -6.010426044464111, "global_step": 70338, "epoch": 1674} {"train_loss": -6.036757469177246, "global_step": 70339, "epoch": 1674} {"train_loss": -5.954982757568359, "global_step": 70340, "epoch": 1674} {"train_loss": -6.120615482330322, "global_step": 70341, "epoch": 1674} {"train_loss": -5.948500156402588, "global_step": 70342, "epoch": 1674} {"train_loss": -6.1839189529418945, "global_step": 70343, "epoch": 1674} {"train_loss": -6.014443874359131, "global_step": 70344, "epoch": 1674} {"train_loss": -6.092755317687988, "global_step": 70345, "epoch": 1674} {"train_loss": -6.068996429443359, "global_step": 70346, "epoch": 1674} {"train_loss": -6.048736572265625, "global_step": 70347, "epoch": 1674} {"train_loss": -6.085735321044922, "global_step": 70348, "epoch": 1674} {"train_loss": -6.025034632001605, "global_step": 70349, "epoch": 1674, "val_loss": 74415.984375} {"train_loss": -5.9874420166015625, "global_step": 70350, "epoch": 1675} {"train_loss": -6.062615394592285, "global_step": 70351, "epoch": 1675} {"train_loss": -5.982906818389893, "global_step": 70352, "epoch": 1675} {"train_loss": -6.193288326263428, "global_step": 70353, "epoch": 1675} {"train_loss": -6.010547637939453, "global_step": 70354, "epoch": 1675} {"train_loss": -6.057442665100098, "global_step": 70355, "epoch": 1675} {"train_loss": -6.038754463195801, "global_step": 70356, "epoch": 1675} {"train_loss": -6.055963039398193, "global_step": 70357, "epoch": 1675} {"train_loss": -6.037235736846924, "global_step": 70358, "epoch": 1675} {"train_loss": -5.986259937286377, "global_step": 70359, "epoch": 1675} {"train_loss": -5.988619804382324, "global_step": 70360, "epoch": 1675} {"train_loss": -6.097899913787842, "global_step": 70361, "epoch": 1675} {"train_loss": -5.944665908813477, "global_step": 70362, "epoch": 1675} {"train_loss": -6.028853416442871, "global_step": 70363, "epoch": 1675} {"train_loss": -6.078210830688477, "global_step": 70364, "epoch": 1675} {"train_loss": -6.069108009338379, "global_step": 70365, "epoch": 1675} {"train_loss": -5.989372253417969, "global_step": 70366, "epoch": 1675} {"train_loss": -6.034693717956543, "global_step": 70367, "epoch": 1675} {"train_loss": -6.04543399810791, "global_step": 70368, "epoch": 1675} {"train_loss": -6.051814556121826, "global_step": 70369, "epoch": 1675} {"train_loss": -6.0494384765625, "global_step": 70370, "epoch": 1675} {"train_loss": -6.031957149505615, "global_step": 70371, "epoch": 1675} {"train_loss": -6.0975189208984375, "global_step": 70372, "epoch": 1675} {"train_loss": -5.870232105255127, "global_step": 70373, "epoch": 1675} {"train_loss": -5.940194129943848, "global_step": 70374, "epoch": 1675} {"train_loss": -6.047489643096924, "global_step": 70375, "epoch": 1675} {"train_loss": -6.064247131347656, "global_step": 70376, "epoch": 1675} {"train_loss": -6.0906901359558105, "global_step": 70377, "epoch": 1675} {"train_loss": -6.062688827514648, "global_step": 70378, "epoch": 1675} {"train_loss": -5.999664306640625, "global_step": 70379, "epoch": 1675} {"train_loss": -5.9664201736450195, "global_step": 70380, "epoch": 1675} {"train_loss": -5.978703498840332, "global_step": 70381, "epoch": 1675} {"train_loss": -6.080512046813965, "global_step": 70382, "epoch": 1675} {"train_loss": -5.88511848449707, "global_step": 70383, "epoch": 1675} {"train_loss": -6.1419501304626465, "global_step": 70384, "epoch": 1675} {"train_loss": -6.0201191902160645, "global_step": 70385, "epoch": 1675} {"train_loss": -5.863470554351807, "global_step": 70386, "epoch": 1675} {"train_loss": -6.041745185852051, "global_step": 70387, "epoch": 1675} {"train_loss": -6.012514114379883, "global_step": 70388, "epoch": 1675} {"train_loss": -5.918457984924316, "global_step": 70389, "epoch": 1675} {"train_loss": -6.088742256164551, "global_step": 70390, "epoch": 1675} {"train_loss": -6.024922563916161, "global_step": 70391, "epoch": 1675, "val_loss": 75011.53125} {"train_loss": -6.027976036071777, "global_step": 70392, "epoch": 1676} {"train_loss": -6.065825939178467, "global_step": 70393, "epoch": 1676} {"train_loss": -6.0674638748168945, "global_step": 70394, "epoch": 1676} {"train_loss": -5.948173999786377, "global_step": 70395, "epoch": 1676} {"train_loss": -6.213954925537109, "global_step": 70396, "epoch": 1676} {"train_loss": -6.0290117263793945, "global_step": 70397, "epoch": 1676} {"train_loss": -5.999577522277832, "global_step": 70398, "epoch": 1676} {"train_loss": -6.082112789154053, "global_step": 70399, "epoch": 1676} {"train_loss": -6.062742710113525, "global_step": 70400, "epoch": 1676} {"train_loss": -6.078228950500488, "global_step": 70401, "epoch": 1676} {"train_loss": -6.096307754516602, "global_step": 70402, "epoch": 1676} {"train_loss": -6.10422420501709, "global_step": 70403, "epoch": 1676} {"train_loss": -6.009773254394531, "global_step": 70404, "epoch": 1676} {"train_loss": -5.933586597442627, "global_step": 70405, "epoch": 1676} {"train_loss": -6.032111167907715, "global_step": 70406, "epoch": 1676} {"train_loss": -6.047525405883789, "global_step": 70407, "epoch": 1676} {"train_loss": -6.0371198654174805, "global_step": 70408, "epoch": 1676} {"train_loss": -6.0603508949279785, "global_step": 70409, "epoch": 1676} {"train_loss": -6.036133766174316, "global_step": 70410, "epoch": 1676} {"train_loss": -6.0551958084106445, "global_step": 70411, "epoch": 1676} {"train_loss": -6.018618583679199, "global_step": 70412, "epoch": 1676} {"train_loss": -6.137212753295898, "global_step": 70413, "epoch": 1676} {"train_loss": -6.0127363204956055, "global_step": 70414, "epoch": 1676} {"train_loss": -6.049829959869385, "global_step": 70415, "epoch": 1676} {"train_loss": -6.102260112762451, "global_step": 70416, "epoch": 1676} {"train_loss": -5.970621109008789, "global_step": 70417, "epoch": 1676} {"train_loss": -6.05455207824707, "global_step": 70418, "epoch": 1676} {"train_loss": -5.91485071182251, "global_step": 70419, "epoch": 1676} {"train_loss": -5.999623775482178, "global_step": 70420, "epoch": 1676} {"train_loss": -6.024895191192627, "global_step": 70421, "epoch": 1676} {"train_loss": -6.052371978759766, "global_step": 70422, "epoch": 1676} {"train_loss": -5.975102424621582, "global_step": 70423, "epoch": 1676} {"train_loss": -6.092772960662842, "global_step": 70424, "epoch": 1676} {"train_loss": -5.988589763641357, "global_step": 70425, "epoch": 1676} {"train_loss": -6.022628307342529, "global_step": 70426, "epoch": 1676} {"train_loss": -6.075692176818848, "global_step": 70427, "epoch": 1676} {"train_loss": -5.976222515106201, "global_step": 70428, "epoch": 1676} {"train_loss": -5.845107555389404, "global_step": 70429, "epoch": 1676} {"train_loss": -6.021368980407715, "global_step": 70430, "epoch": 1676} {"train_loss": -5.897547721862793, "global_step": 70431, "epoch": 1676} {"train_loss": -6.102736473083496, "global_step": 70432, "epoch": 1676} {"train_loss": -6.032069944200062, "global_step": 70433, "epoch": 1676, "val_loss": 74700.1796875} {"train_loss": -6.093693733215332, "global_step": 70434, "epoch": 1677} {"train_loss": -5.970908164978027, "global_step": 70435, "epoch": 1677} {"train_loss": -6.018872261047363, "global_step": 70436, "epoch": 1677} {"train_loss": -6.05303430557251, "global_step": 70437, "epoch": 1677} {"train_loss": -6.044760227203369, "global_step": 70438, "epoch": 1677} {"train_loss": -5.997766494750977, "global_step": 70439, "epoch": 1677} {"train_loss": -6.095368385314941, "global_step": 70440, "epoch": 1677} {"train_loss": -6.001116752624512, "global_step": 70441, "epoch": 1677} {"train_loss": -5.987369060516357, "global_step": 70442, "epoch": 1677} {"train_loss": -6.177969932556152, "global_step": 70443, "epoch": 1677} {"train_loss": -5.941485404968262, "global_step": 70444, "epoch": 1677} {"train_loss": -5.947408676147461, "global_step": 70445, "epoch": 1677} {"train_loss": -6.003911018371582, "global_step": 70446, "epoch": 1677} {"train_loss": -5.856735706329346, "global_step": 70447, "epoch": 1677} {"train_loss": -5.902392387390137, "global_step": 70448, "epoch": 1677} {"train_loss": -5.940378665924072, "global_step": 70449, "epoch": 1677} {"train_loss": -5.9375810623168945, "global_step": 70450, "epoch": 1677} {"train_loss": -5.913612365722656, "global_step": 70451, "epoch": 1677} {"train_loss": -5.985996723175049, "global_step": 70452, "epoch": 1677} {"train_loss": -5.99412727355957, "global_step": 70453, "epoch": 1677} {"train_loss": -5.986907958984375, "global_step": 70454, "epoch": 1677} {"train_loss": -5.913947105407715, "global_step": 70455, "epoch": 1677} {"train_loss": -5.9934797286987305, "global_step": 70456, "epoch": 1677} {"train_loss": -6.019139289855957, "global_step": 70457, "epoch": 1677} {"train_loss": -5.932268142700195, "global_step": 70458, "epoch": 1677} {"train_loss": -5.966066360473633, "global_step": 70459, "epoch": 1677} {"train_loss": -6.07012414932251, "global_step": 70460, "epoch": 1677} {"train_loss": -5.993103981018066, "global_step": 70461, "epoch": 1677} {"train_loss": -5.814305782318115, "global_step": 70462, "epoch": 1677} {"train_loss": -6.0669426918029785, "global_step": 70463, "epoch": 1677} {"train_loss": -5.877824306488037, "global_step": 70464, "epoch": 1677} {"train_loss": -5.888657569885254, "global_step": 70465, "epoch": 1677} {"train_loss": -5.996210098266602, "global_step": 70466, "epoch": 1677} {"train_loss": -5.9175004959106445, "global_step": 70467, "epoch": 1677} {"train_loss": -6.096628189086914, "global_step": 70468, "epoch": 1677} {"train_loss": -6.087793350219727, "global_step": 70469, "epoch": 1677} {"train_loss": -5.97902250289917, "global_step": 70470, "epoch": 1677} {"train_loss": -6.169098854064941, "global_step": 70471, "epoch": 1677} {"train_loss": -6.023347854614258, "global_step": 70472, "epoch": 1677} {"train_loss": -6.12419319152832, "global_step": 70473, "epoch": 1677} {"train_loss": -6.06590461730957, "global_step": 70474, "epoch": 1677} {"train_loss": -5.996416409810384, "global_step": 70475, "epoch": 1677, "val_loss": 74864.3203125} {"train_loss": -5.984399318695068, "global_step": 70476, "epoch": 1678} {"train_loss": -6.000385284423828, "global_step": 70477, "epoch": 1678} {"train_loss": -5.95883846282959, "global_step": 70478, "epoch": 1678} {"train_loss": -6.0520124435424805, "global_step": 70479, "epoch": 1678} {"train_loss": -5.960158824920654, "global_step": 70480, "epoch": 1678} {"train_loss": -6.120261192321777, "global_step": 70481, "epoch": 1678} {"train_loss": -6.144598960876465, "global_step": 70482, "epoch": 1678} {"train_loss": -6.1791510581970215, "global_step": 70483, "epoch": 1678} {"train_loss": -6.056504726409912, "global_step": 70484, "epoch": 1678} {"train_loss": -6.107514381408691, "global_step": 70485, "epoch": 1678} {"train_loss": -6.020124912261963, "global_step": 70486, "epoch": 1678} {"train_loss": -5.834373474121094, "global_step": 70487, "epoch": 1678} {"train_loss": -6.073428153991699, "global_step": 70488, "epoch": 1678} {"train_loss": -6.021341800689697, "global_step": 70489, "epoch": 1678} {"train_loss": -6.101195335388184, "global_step": 70490, "epoch": 1678} {"train_loss": -5.969475269317627, "global_step": 70491, "epoch": 1678} {"train_loss": -6.0193376541137695, "global_step": 70492, "epoch": 1678} {"train_loss": -5.93930196762085, "global_step": 70493, "epoch": 1678} {"train_loss": -6.072141170501709, "global_step": 70494, "epoch": 1678} {"train_loss": -5.959070205688477, "global_step": 70495, "epoch": 1678} {"train_loss": -5.9733781814575195, "global_step": 70496, "epoch": 1678} {"train_loss": -6.04158878326416, "global_step": 70497, "epoch": 1678} {"train_loss": -6.11443567276001, "global_step": 70498, "epoch": 1678} {"train_loss": -5.977081298828125, "global_step": 70499, "epoch": 1678} {"train_loss": -5.988720417022705, "global_step": 70500, "epoch": 1678} {"train_loss": -6.020652770996094, "global_step": 70501, "epoch": 1678} {"train_loss": -6.0670671463012695, "global_step": 70502, "epoch": 1678} {"train_loss": -6.008597373962402, "global_step": 70503, "epoch": 1678} {"train_loss": -5.930341720581055, "global_step": 70504, "epoch": 1678} {"train_loss": -6.071955680847168, "global_step": 70505, "epoch": 1678} {"train_loss": -5.899420738220215, "global_step": 70506, "epoch": 1678} {"train_loss": -6.072042942047119, "global_step": 70507, "epoch": 1678} {"train_loss": -6.137839317321777, "global_step": 70508, "epoch": 1678} {"train_loss": -5.969256401062012, "global_step": 70509, "epoch": 1678} {"train_loss": -6.0648908615112305, "global_step": 70510, "epoch": 1678} {"train_loss": -5.965419292449951, "global_step": 70511, "epoch": 1678} {"train_loss": -6.134300231933594, "global_step": 70512, "epoch": 1678} {"train_loss": -5.943439483642578, "global_step": 70513, "epoch": 1678} {"train_loss": -6.045434951782227, "global_step": 70514, "epoch": 1678} {"train_loss": -6.0000457763671875, "global_step": 70515, "epoch": 1678} {"train_loss": -6.117072582244873, "global_step": 70516, "epoch": 1678} {"train_loss": -6.024553003765288, "global_step": 70517, "epoch": 1678, "val_loss": 74582.5546875} {"train_loss": -5.939786434173584, "global_step": 70518, "epoch": 1679} {"train_loss": -6.086071491241455, "global_step": 70519, "epoch": 1679} {"train_loss": -6.113338470458984, "global_step": 70520, "epoch": 1679} {"train_loss": -6.035099983215332, "global_step": 70521, "epoch": 1679} {"train_loss": -6.063326835632324, "global_step": 70522, "epoch": 1679} {"train_loss": -6.062967300415039, "global_step": 70523, "epoch": 1679} {"train_loss": -6.07021951675415, "global_step": 70524, "epoch": 1679} {"train_loss": -6.048190116882324, "global_step": 70525, "epoch": 1679} {"train_loss": -5.985532760620117, "global_step": 70526, "epoch": 1679} {"train_loss": -5.957414627075195, "global_step": 70527, "epoch": 1679} {"train_loss": -5.77230978012085, "global_step": 70528, "epoch": 1679} {"train_loss": -6.012666702270508, "global_step": 70529, "epoch": 1679} {"train_loss": -5.974409580230713, "global_step": 70530, "epoch": 1679} {"train_loss": -5.982697010040283, "global_step": 70531, "epoch": 1679} {"train_loss": -6.087085723876953, "global_step": 70532, "epoch": 1679} {"train_loss": -5.886514663696289, "global_step": 70533, "epoch": 1679} {"train_loss": -6.043900489807129, "global_step": 70534, "epoch": 1679} {"train_loss": -5.900827407836914, "global_step": 70535, "epoch": 1679} {"train_loss": -5.945566177368164, "global_step": 70536, "epoch": 1679} {"train_loss": -6.091432094573975, "global_step": 70537, "epoch": 1679} {"train_loss": -6.0445475578308105, "global_step": 70538, "epoch": 1679} {"train_loss": -5.939260005950928, "global_step": 70539, "epoch": 1679} {"train_loss": -5.94711971282959, "global_step": 70540, "epoch": 1679} {"train_loss": -5.925230026245117, "global_step": 70541, "epoch": 1679} {"train_loss": -6.000201225280762, "global_step": 70542, "epoch": 1679} {"train_loss": -6.09847354888916, "global_step": 70543, "epoch": 1679} {"train_loss": -6.174349784851074, "global_step": 70544, "epoch": 1679} {"train_loss": -6.099616050720215, "global_step": 70545, "epoch": 1679} {"train_loss": -6.104666233062744, "global_step": 70546, "epoch": 1679} {"train_loss": -6.066664695739746, "global_step": 70547, "epoch": 1679} {"train_loss": -6.073160648345947, "global_step": 70548, "epoch": 1679} {"train_loss": -6.037242889404297, "global_step": 70549, "epoch": 1679} {"train_loss": -6.052096366882324, "global_step": 70550, "epoch": 1679} {"train_loss": -5.967752456665039, "global_step": 70551, "epoch": 1679} {"train_loss": -5.939072608947754, "global_step": 70552, "epoch": 1679} {"train_loss": -5.952434062957764, "global_step": 70553, "epoch": 1679} {"train_loss": -6.069937229156494, "global_step": 70554, "epoch": 1679} {"train_loss": -6.002376556396484, "global_step": 70555, "epoch": 1679} {"train_loss": -6.009237289428711, "global_step": 70556, "epoch": 1679} {"train_loss": -6.03894567489624, "global_step": 70557, "epoch": 1679} {"train_loss": -6.024765968322754, "global_step": 70558, "epoch": 1679} {"train_loss": -6.01646241687593, "global_step": 70559, "epoch": 1679, "val_loss": 74710.5390625} {"train_loss": -6.098567008972168, "global_step": 70560, "epoch": 1680} {"train_loss": -6.0903639793396, "global_step": 70561, "epoch": 1680} {"train_loss": -6.015226364135742, "global_step": 70562, "epoch": 1680} {"train_loss": -5.99782657623291, "global_step": 70563, "epoch": 1680} {"train_loss": -5.928709506988525, "global_step": 70564, "epoch": 1680} {"train_loss": -5.946107864379883, "global_step": 70565, "epoch": 1680} {"train_loss": -5.974608421325684, "global_step": 70566, "epoch": 1680} {"train_loss": -5.926120758056641, "global_step": 70567, "epoch": 1680} {"train_loss": -5.969480514526367, "global_step": 70568, "epoch": 1680} {"train_loss": -6.124919891357422, "global_step": 70569, "epoch": 1680} {"train_loss": -6.062259674072266, "global_step": 70570, "epoch": 1680} {"train_loss": -6.152242660522461, "global_step": 70571, "epoch": 1680} {"train_loss": -6.009730339050293, "global_step": 70572, "epoch": 1680} {"train_loss": -6.124773025512695, "global_step": 70573, "epoch": 1680} {"train_loss": -6.174399375915527, "global_step": 70574, "epoch": 1680} {"train_loss": -6.080276012420654, "global_step": 70575, "epoch": 1680} {"train_loss": -6.085600852966309, "global_step": 70576, "epoch": 1680} {"train_loss": -6.101685523986816, "global_step": 70577, "epoch": 1680} {"train_loss": -5.975732803344727, "global_step": 70578, "epoch": 1680} {"train_loss": -6.01344108581543, "global_step": 70579, "epoch": 1680} {"train_loss": -5.935515403747559, "global_step": 70580, "epoch": 1680} {"train_loss": -6.134731292724609, "global_step": 70581, "epoch": 1680} {"train_loss": -6.0475263595581055, "global_step": 70582, "epoch": 1680} {"train_loss": -6.122535228729248, "global_step": 70583, "epoch": 1680} {"train_loss": -5.998610973358154, "global_step": 70584, "epoch": 1680} {"train_loss": -5.985563278198242, "global_step": 70585, "epoch": 1680} {"train_loss": -5.945602893829346, "global_step": 70586, "epoch": 1680} {"train_loss": -6.099104881286621, "global_step": 70587, "epoch": 1680} {"train_loss": -6.023568153381348, "global_step": 70588, "epoch": 1680} {"train_loss": -6.11870002746582, "global_step": 70589, "epoch": 1680} {"train_loss": -6.0250372886657715, "global_step": 70590, "epoch": 1680} {"train_loss": -6.126336574554443, "global_step": 70591, "epoch": 1680} {"train_loss": -6.043973445892334, "global_step": 70592, "epoch": 1680} {"train_loss": -6.093881607055664, "global_step": 70593, "epoch": 1680} {"train_loss": -6.116095066070557, "global_step": 70594, "epoch": 1680} {"train_loss": -5.919157028198242, "global_step": 70595, "epoch": 1680} {"train_loss": -6.009112358093262, "global_step": 70596, "epoch": 1680} {"train_loss": -6.046290874481201, "global_step": 70597, "epoch": 1680} {"train_loss": -5.984113693237305, "global_step": 70598, "epoch": 1680} {"train_loss": -5.880030155181885, "global_step": 70599, "epoch": 1680} {"train_loss": -5.924866199493408, "global_step": 70600, "epoch": 1680} {"train_loss": -6.035468339920044, "global_step": 70601, "epoch": 1680, "val_loss": 74825.53125} {"train_loss": -5.916788101196289, "global_step": 70602, "epoch": 1681} {"train_loss": -5.983150959014893, "global_step": 70603, "epoch": 1681} {"train_loss": -6.04588508605957, "global_step": 70604, "epoch": 1681} {"train_loss": -6.057149887084961, "global_step": 70605, "epoch": 1681} {"train_loss": -6.055222034454346, "global_step": 70606, "epoch": 1681} {"train_loss": -5.972786903381348, "global_step": 70607, "epoch": 1681} {"train_loss": -6.04878044128418, "global_step": 70608, "epoch": 1681} {"train_loss": -6.073207378387451, "global_step": 70609, "epoch": 1681} {"train_loss": -6.133349418640137, "global_step": 70610, "epoch": 1681} {"train_loss": -6.062143325805664, "global_step": 70611, "epoch": 1681} {"train_loss": -6.03343391418457, "global_step": 70612, "epoch": 1681} {"train_loss": -6.000783920288086, "global_step": 70613, "epoch": 1681} {"train_loss": -6.09332275390625, "global_step": 70614, "epoch": 1681} {"train_loss": -6.025882720947266, "global_step": 70615, "epoch": 1681} {"train_loss": -6.02045202255249, "global_step": 70616, "epoch": 1681} {"train_loss": -6.021537780761719, "global_step": 70617, "epoch": 1681} {"train_loss": -5.947422027587891, "global_step": 70618, "epoch": 1681} {"train_loss": -5.957508087158203, "global_step": 70619, "epoch": 1681} {"train_loss": -6.057705402374268, "global_step": 70620, "epoch": 1681} {"train_loss": -6.144826889038086, "global_step": 70621, "epoch": 1681} {"train_loss": -5.940646171569824, "global_step": 70622, "epoch": 1681} {"train_loss": -6.013015270233154, "global_step": 70623, "epoch": 1681} {"train_loss": -5.838866233825684, "global_step": 70624, "epoch": 1681} {"train_loss": -6.150494575500488, "global_step": 70625, "epoch": 1681} {"train_loss": -5.989163398742676, "global_step": 70626, "epoch": 1681} {"train_loss": -5.982656955718994, "global_step": 70627, "epoch": 1681} {"train_loss": -6.037274360656738, "global_step": 70628, "epoch": 1681} {"train_loss": -6.043152809143066, "global_step": 70629, "epoch": 1681} {"train_loss": -6.03651237487793, "global_step": 70630, "epoch": 1681} {"train_loss": -5.935086250305176, "global_step": 70631, "epoch": 1681} {"train_loss": -5.9236602783203125, "global_step": 70632, "epoch": 1681} {"train_loss": -6.060430526733398, "global_step": 70633, "epoch": 1681} {"train_loss": -5.945302963256836, "global_step": 70634, "epoch": 1681} {"train_loss": -6.042496681213379, "global_step": 70635, "epoch": 1681} {"train_loss": -6.045820236206055, "global_step": 70636, "epoch": 1681} {"train_loss": -5.967366695404053, "global_step": 70637, "epoch": 1681} {"train_loss": -6.0118865966796875, "global_step": 70638, "epoch": 1681} {"train_loss": -6.069949626922607, "global_step": 70639, "epoch": 1681} {"train_loss": -6.082234859466553, "global_step": 70640, "epoch": 1681} {"train_loss": -6.010193347930908, "global_step": 70641, "epoch": 1681} {"train_loss": -5.993363380432129, "global_step": 70642, "epoch": 1681} {"train_loss": -6.021707580203102, "global_step": 70643, "epoch": 1681, "val_loss": 74631.359375} {"train_loss": -6.089303016662598, "global_step": 70644, "epoch": 1682} {"train_loss": -6.044886589050293, "global_step": 70645, "epoch": 1682} {"train_loss": -6.06566858291626, "global_step": 70646, "epoch": 1682} {"train_loss": -5.97623872756958, "global_step": 70647, "epoch": 1682} {"train_loss": -6.008124351501465, "global_step": 70648, "epoch": 1682} {"train_loss": -6.106777191162109, "global_step": 70649, "epoch": 1682} {"train_loss": -6.070273399353027, "global_step": 70650, "epoch": 1682} {"train_loss": -6.014657974243164, "global_step": 70651, "epoch": 1682} {"train_loss": -5.9627299308776855, "global_step": 70652, "epoch": 1682} {"train_loss": -6.024829864501953, "global_step": 70653, "epoch": 1682} {"train_loss": -5.942883014678955, "global_step": 70654, "epoch": 1682} {"train_loss": -5.967033386230469, "global_step": 70655, "epoch": 1682} {"train_loss": -6.004725456237793, "global_step": 70656, "epoch": 1682} {"train_loss": -6.07638692855835, "global_step": 70657, "epoch": 1682} {"train_loss": -6.0119805335998535, "global_step": 70658, "epoch": 1682} {"train_loss": -6.21054744720459, "global_step": 70659, "epoch": 1682} {"train_loss": -5.9580888748168945, "global_step": 70660, "epoch": 1682} {"train_loss": -5.982123374938965, "global_step": 70661, "epoch": 1682} {"train_loss": -6.118190765380859, "global_step": 70662, "epoch": 1682} {"train_loss": -6.12381649017334, "global_step": 70663, "epoch": 1682} {"train_loss": -6.155177116394043, "global_step": 70664, "epoch": 1682} {"train_loss": -5.971423625946045, "global_step": 70665, "epoch": 1682} {"train_loss": -6.137001037597656, "global_step": 70666, "epoch": 1682} {"train_loss": -6.064822673797607, "global_step": 70667, "epoch": 1682} {"train_loss": -6.020137786865234, "global_step": 70668, "epoch": 1682} {"train_loss": -5.972714424133301, "global_step": 70669, "epoch": 1682} {"train_loss": -5.988587379455566, "global_step": 70670, "epoch": 1682} {"train_loss": -6.084164142608643, "global_step": 70671, "epoch": 1682} {"train_loss": -6.150378227233887, "global_step": 70672, "epoch": 1682} {"train_loss": -6.127367973327637, "global_step": 70673, "epoch": 1682} {"train_loss": -6.015003204345703, "global_step": 70674, "epoch": 1682} {"train_loss": -6.061075210571289, "global_step": 70675, "epoch": 1682} {"train_loss": -6.07208776473999, "global_step": 70676, "epoch": 1682} {"train_loss": -5.941607475280762, "global_step": 70677, "epoch": 1682} {"train_loss": -6.013068199157715, "global_step": 70678, "epoch": 1682} {"train_loss": -5.9864702224731445, "global_step": 70679, "epoch": 1682} {"train_loss": -6.06910514831543, "global_step": 70680, "epoch": 1682} {"train_loss": -6.062112808227539, "global_step": 70681, "epoch": 1682} {"train_loss": -6.033000946044922, "global_step": 70682, "epoch": 1682} {"train_loss": -5.964615821838379, "global_step": 70683, "epoch": 1682} {"train_loss": -6.046352386474609, "global_step": 70684, "epoch": 1682} {"train_loss": -6.040176777612595, "global_step": 70685, "epoch": 1682, "val_loss": 74510.875} {"train_loss": -6.0118727684021, "global_step": 70686, "epoch": 1683} {"train_loss": -5.9306745529174805, "global_step": 70687, "epoch": 1683} {"train_loss": -6.117050647735596, "global_step": 70688, "epoch": 1683} {"train_loss": -6.08377742767334, "global_step": 70689, "epoch": 1683} {"train_loss": -5.968418598175049, "global_step": 70690, "epoch": 1683} {"train_loss": -6.050520896911621, "global_step": 70691, "epoch": 1683} {"train_loss": -6.037802696228027, "global_step": 70692, "epoch": 1683} {"train_loss": -6.061478614807129, "global_step": 70693, "epoch": 1683} {"train_loss": -5.951041221618652, "global_step": 70694, "epoch": 1683} {"train_loss": -6.09560489654541, "global_step": 70695, "epoch": 1683} {"train_loss": -5.940699100494385, "global_step": 70696, "epoch": 1683} {"train_loss": -6.0707783699035645, "global_step": 70697, "epoch": 1683} {"train_loss": -6.134549140930176, "global_step": 70698, "epoch": 1683} {"train_loss": -6.009621620178223, "global_step": 70699, "epoch": 1683} {"train_loss": -5.923745632171631, "global_step": 70700, "epoch": 1683} {"train_loss": -6.017514705657959, "global_step": 70701, "epoch": 1683} {"train_loss": -5.998292922973633, "global_step": 70702, "epoch": 1683} {"train_loss": -5.988583087921143, "global_step": 70703, "epoch": 1683} {"train_loss": -6.093924522399902, "global_step": 70704, "epoch": 1683} {"train_loss": -6.0286970138549805, "global_step": 70705, "epoch": 1683} {"train_loss": -5.945639610290527, "global_step": 70706, "epoch": 1683} {"train_loss": -6.038956642150879, "global_step": 70707, "epoch": 1683} {"train_loss": -6.087281227111816, "global_step": 70708, "epoch": 1683} {"train_loss": -6.036018371582031, "global_step": 70709, "epoch": 1683} {"train_loss": -6.191009521484375, "global_step": 70710, "epoch": 1683} {"train_loss": -6.015840530395508, "global_step": 70711, "epoch": 1683} {"train_loss": -6.153685569763184, "global_step": 70712, "epoch": 1683} {"train_loss": -6.025476455688477, "global_step": 70713, "epoch": 1683} {"train_loss": -5.998787879943848, "global_step": 70714, "epoch": 1683} {"train_loss": -6.074411869049072, "global_step": 70715, "epoch": 1683} {"train_loss": -6.076581001281738, "global_step": 70716, "epoch": 1683} {"train_loss": -5.936522483825684, "global_step": 70717, "epoch": 1683} {"train_loss": -6.1832709312438965, "global_step": 70718, "epoch": 1683} {"train_loss": -5.887301445007324, "global_step": 70719, "epoch": 1683} {"train_loss": -5.930188179016113, "global_step": 70720, "epoch": 1683} {"train_loss": -5.894351959228516, "global_step": 70721, "epoch": 1683} {"train_loss": -6.038512706756592, "global_step": 70722, "epoch": 1683} {"train_loss": -6.055915832519531, "global_step": 70723, "epoch": 1683} {"train_loss": -5.940731525421143, "global_step": 70724, "epoch": 1683} {"train_loss": -6.057865619659424, "global_step": 70725, "epoch": 1683} {"train_loss": -6.014426231384277, "global_step": 70726, "epoch": 1683} {"train_loss": -6.026684079851423, "global_step": 70727, "epoch": 1683, "val_loss": 75009.046875} {"train_loss": -6.0020904541015625, "global_step": 70728, "epoch": 1684} {"train_loss": -5.943543434143066, "global_step": 70729, "epoch": 1684} {"train_loss": -5.994955062866211, "global_step": 70730, "epoch": 1684} {"train_loss": -6.042618751525879, "global_step": 70731, "epoch": 1684} {"train_loss": -6.0426025390625, "global_step": 70732, "epoch": 1684} {"train_loss": -6.008264541625977, "global_step": 70733, "epoch": 1684} {"train_loss": -6.053585052490234, "global_step": 70734, "epoch": 1684} {"train_loss": -6.08035945892334, "global_step": 70735, "epoch": 1684} {"train_loss": -5.928837776184082, "global_step": 70736, "epoch": 1684} {"train_loss": -6.011749267578125, "global_step": 70737, "epoch": 1684} {"train_loss": -5.979498863220215, "global_step": 70738, "epoch": 1684} {"train_loss": -6.014743804931641, "global_step": 70739, "epoch": 1684} {"train_loss": -6.053465843200684, "global_step": 70740, "epoch": 1684} {"train_loss": -6.049337387084961, "global_step": 70741, "epoch": 1684} {"train_loss": -6.0779805183410645, "global_step": 70742, "epoch": 1684} {"train_loss": -6.047117233276367, "global_step": 70743, "epoch": 1684} {"train_loss": -6.080816268920898, "global_step": 70744, "epoch": 1684} {"train_loss": -5.926959037780762, "global_step": 70745, "epoch": 1684} {"train_loss": -6.093061447143555, "global_step": 70746, "epoch": 1684} {"train_loss": -5.9720282554626465, "global_step": 70747, "epoch": 1684} {"train_loss": -6.026360034942627, "global_step": 70748, "epoch": 1684} {"train_loss": -6.096364498138428, "global_step": 70749, "epoch": 1684} {"train_loss": -6.0412187576293945, "global_step": 70750, "epoch": 1684} {"train_loss": -5.989408493041992, "global_step": 70751, "epoch": 1684} {"train_loss": -6.057161331176758, "global_step": 70752, "epoch": 1684} {"train_loss": -6.154989242553711, "global_step": 70753, "epoch": 1684} {"train_loss": -5.976027011871338, "global_step": 70754, "epoch": 1684} {"train_loss": -6.047635078430176, "global_step": 70755, "epoch": 1684} {"train_loss": -5.987689018249512, "global_step": 70756, "epoch": 1684} {"train_loss": -5.900132179260254, "global_step": 70757, "epoch": 1684} {"train_loss": -6.097123146057129, "global_step": 70758, "epoch": 1684} {"train_loss": -6.057286262512207, "global_step": 70759, "epoch": 1684} {"train_loss": -6.089741230010986, "global_step": 70760, "epoch": 1684} {"train_loss": -6.07000732421875, "global_step": 70761, "epoch": 1684} {"train_loss": -6.080182075500488, "global_step": 70762, "epoch": 1684} {"train_loss": -5.925108432769775, "global_step": 70763, "epoch": 1684} {"train_loss": -6.04855489730835, "global_step": 70764, "epoch": 1684} {"train_loss": -6.095653057098389, "global_step": 70765, "epoch": 1684} {"train_loss": -6.069249153137207, "global_step": 70766, "epoch": 1684} {"train_loss": -6.131181240081787, "global_step": 70767, "epoch": 1684} {"train_loss": -5.999030113220215, "global_step": 70768, "epoch": 1684} {"train_loss": -6.0345259848095125, "global_step": 70769, "epoch": 1684, "val_loss": 75130.7109375} {"train_loss": -5.926101207733154, "global_step": 70770, "epoch": 1685} {"train_loss": -6.050502777099609, "global_step": 70771, "epoch": 1685} {"train_loss": -5.941018104553223, "global_step": 70772, "epoch": 1685} {"train_loss": -6.023773193359375, "global_step": 70773, "epoch": 1685} {"train_loss": -6.051329612731934, "global_step": 70774, "epoch": 1685} {"train_loss": -6.000063896179199, "global_step": 70775, "epoch": 1685} {"train_loss": -6.082761764526367, "global_step": 70776, "epoch": 1685} {"train_loss": -5.98042106628418, "global_step": 70777, "epoch": 1685} {"train_loss": -5.988533020019531, "global_step": 70778, "epoch": 1685} {"train_loss": -5.961009502410889, "global_step": 70779, "epoch": 1685} {"train_loss": -6.114078998565674, "global_step": 70780, "epoch": 1685} {"train_loss": -5.965194225311279, "global_step": 70781, "epoch": 1685} {"train_loss": -5.997748374938965, "global_step": 70782, "epoch": 1685} {"train_loss": -6.039078235626221, "global_step": 70783, "epoch": 1685} {"train_loss": -6.113321304321289, "global_step": 70784, "epoch": 1685} {"train_loss": -5.996532440185547, "global_step": 70785, "epoch": 1685} {"train_loss": -6.04987907409668, "global_step": 70786, "epoch": 1685} {"train_loss": -5.945242881774902, "global_step": 70787, "epoch": 1685} {"train_loss": -5.950164794921875, "global_step": 70788, "epoch": 1685} {"train_loss": -6.086554527282715, "global_step": 70789, "epoch": 1685} {"train_loss": -6.050487041473389, "global_step": 70790, "epoch": 1685} {"train_loss": -5.978163719177246, "global_step": 70791, "epoch": 1685} {"train_loss": -5.908368110656738, "global_step": 70792, "epoch": 1685} {"train_loss": -5.937355995178223, "global_step": 70793, "epoch": 1685} {"train_loss": -5.9660491943359375, "global_step": 70794, "epoch": 1685} {"train_loss": -5.855137825012207, "global_step": 70795, "epoch": 1685} {"train_loss": -5.904529094696045, "global_step": 70796, "epoch": 1685} {"train_loss": -5.987298965454102, "global_step": 70797, "epoch": 1685} {"train_loss": -5.9981794357299805, "global_step": 70798, "epoch": 1685} {"train_loss": -6.206650733947754, "global_step": 70799, "epoch": 1685} {"train_loss": -5.88992977142334, "global_step": 70800, "epoch": 1685} {"train_loss": -5.982617378234863, "global_step": 70801, "epoch": 1685} {"train_loss": -5.911775588989258, "global_step": 70802, "epoch": 1685} {"train_loss": -6.05015754699707, "global_step": 70803, "epoch": 1685} {"train_loss": -5.9983062744140625, "global_step": 70804, "epoch": 1685} {"train_loss": -5.963275909423828, "global_step": 70805, "epoch": 1685} {"train_loss": -6.068549156188965, "global_step": 70806, "epoch": 1685} {"train_loss": -5.950822830200195, "global_step": 70807, "epoch": 1685} {"train_loss": -6.007744789123535, "global_step": 70808, "epoch": 1685} {"train_loss": -6.085715293884277, "global_step": 70809, "epoch": 1685} {"train_loss": -5.925058364868164, "global_step": 70810, "epoch": 1685} {"train_loss": -6.000331594830468, "global_step": 70811, "epoch": 1685, "val_loss": 74645.7578125} {"train_loss": -5.882803440093994, "global_step": 70812, "epoch": 1686} {"train_loss": -5.938182353973389, "global_step": 70813, "epoch": 1686} {"train_loss": -6.060360908508301, "global_step": 70814, "epoch": 1686} {"train_loss": -5.9465789794921875, "global_step": 70815, "epoch": 1686} {"train_loss": -5.948291778564453, "global_step": 70816, "epoch": 1686} {"train_loss": -5.834613800048828, "global_step": 70817, "epoch": 1686} {"train_loss": -6.051756858825684, "global_step": 70818, "epoch": 1686} {"train_loss": -6.04414701461792, "global_step": 70819, "epoch": 1686} {"train_loss": -5.947083473205566, "global_step": 70820, "epoch": 1686} {"train_loss": -5.9843878746032715, "global_step": 70821, "epoch": 1686} {"train_loss": -6.00600004196167, "global_step": 70822, "epoch": 1686} {"train_loss": -6.134500026702881, "global_step": 70823, "epoch": 1686} {"train_loss": -5.964756965637207, "global_step": 70824, "epoch": 1686} {"train_loss": -5.906798839569092, "global_step": 70825, "epoch": 1686} {"train_loss": -5.976174831390381, "global_step": 70826, "epoch": 1686} {"train_loss": -6.032801151275635, "global_step": 70827, "epoch": 1686} {"train_loss": -5.955922603607178, "global_step": 70828, "epoch": 1686} {"train_loss": -6.0146989822387695, "global_step": 70829, "epoch": 1686} {"train_loss": -5.9885969161987305, "global_step": 70830, "epoch": 1686} {"train_loss": -5.908328533172607, "global_step": 70831, "epoch": 1686} {"train_loss": -5.904259204864502, "global_step": 70832, "epoch": 1686} {"train_loss": -5.983237266540527, "global_step": 70833, "epoch": 1686} {"train_loss": -5.78378438949585, "global_step": 70834, "epoch": 1686} {"train_loss": -5.791738510131836, "global_step": 70835, "epoch": 1686} {"train_loss": -5.932294845581055, "global_step": 70836, "epoch": 1686} {"train_loss": -5.97759485244751, "global_step": 70837, "epoch": 1686} {"train_loss": -6.080131530761719, "global_step": 70838, "epoch": 1686} {"train_loss": -5.976363182067871, "global_step": 70839, "epoch": 1686} {"train_loss": -5.880305767059326, "global_step": 70840, "epoch": 1686} {"train_loss": -5.953592777252197, "global_step": 70841, "epoch": 1686} {"train_loss": -5.981180191040039, "global_step": 70842, "epoch": 1686} {"train_loss": -6.050313949584961, "global_step": 70843, "epoch": 1686} {"train_loss": -5.985005855560303, "global_step": 70844, "epoch": 1686} {"train_loss": -6.002353668212891, "global_step": 70845, "epoch": 1686} {"train_loss": -6.085644721984863, "global_step": 70846, "epoch": 1686} {"train_loss": -6.076003074645996, "global_step": 70847, "epoch": 1686} {"train_loss": -6.022406101226807, "global_step": 70848, "epoch": 1686} {"train_loss": -6.089240074157715, "global_step": 70849, "epoch": 1686} {"train_loss": -6.070753574371338, "global_step": 70850, "epoch": 1686} {"train_loss": -6.055792808532715, "global_step": 70851, "epoch": 1686} {"train_loss": -6.074906826019287, "global_step": 70852, "epoch": 1686} {"train_loss": -5.980331784202939, "global_step": 70853, "epoch": 1686, "val_loss": 74561.2890625} {"train_loss": -6.033514976501465, "global_step": 70854, "epoch": 1687} {"train_loss": -6.123802185058594, "global_step": 70855, "epoch": 1687} {"train_loss": -6.044747829437256, "global_step": 70856, "epoch": 1687} {"train_loss": -6.04808235168457, "global_step": 70857, "epoch": 1687} {"train_loss": -6.02591609954834, "global_step": 70858, "epoch": 1687} {"train_loss": -6.028838634490967, "global_step": 70859, "epoch": 1687} {"train_loss": -6.126841068267822, "global_step": 70860, "epoch": 1687} {"train_loss": -5.995240688323975, "global_step": 70861, "epoch": 1687} {"train_loss": -6.083849906921387, "global_step": 70862, "epoch": 1687} {"train_loss": -6.144083023071289, "global_step": 70863, "epoch": 1687} {"train_loss": -6.068277359008789, "global_step": 70864, "epoch": 1687} {"train_loss": -5.922246932983398, "global_step": 70865, "epoch": 1687} {"train_loss": -6.069218635559082, "global_step": 70866, "epoch": 1687} {"train_loss": -6.092745304107666, "global_step": 70867, "epoch": 1687} {"train_loss": -5.926018714904785, "global_step": 70868, "epoch": 1687} {"train_loss": -5.976505756378174, "global_step": 70869, "epoch": 1687} {"train_loss": -6.030784606933594, "global_step": 70870, "epoch": 1687} {"train_loss": -6.212736129760742, "global_step": 70871, "epoch": 1687} {"train_loss": -6.038432598114014, "global_step": 70872, "epoch": 1687} {"train_loss": -6.017980098724365, "global_step": 70873, "epoch": 1687} {"train_loss": -5.97659969329834, "global_step": 70874, "epoch": 1687} {"train_loss": -6.124061107635498, "global_step": 70875, "epoch": 1687} {"train_loss": -6.013731956481934, "global_step": 70876, "epoch": 1687} {"train_loss": -6.095221519470215, "global_step": 70877, "epoch": 1687} {"train_loss": -6.0427117347717285, "global_step": 70878, "epoch": 1687} {"train_loss": -6.048368453979492, "global_step": 70879, "epoch": 1687} {"train_loss": -5.992378234863281, "global_step": 70880, "epoch": 1687} {"train_loss": -5.958788871765137, "global_step": 70881, "epoch": 1687} {"train_loss": -6.074369430541992, "global_step": 70882, "epoch": 1687} {"train_loss": -5.964753150939941, "global_step": 70883, "epoch": 1687} {"train_loss": -5.957014083862305, "global_step": 70884, "epoch": 1687} {"train_loss": -6.107322692871094, "global_step": 70885, "epoch": 1687} {"train_loss": -6.204422950744629, "global_step": 70886, "epoch": 1687} {"train_loss": -6.000024318695068, "global_step": 70887, "epoch": 1687} {"train_loss": -6.019198417663574, "global_step": 70888, "epoch": 1687} {"train_loss": -6.067432880401611, "global_step": 70889, "epoch": 1687} {"train_loss": -6.1251935958862305, "global_step": 70890, "epoch": 1687} {"train_loss": -5.94169807434082, "global_step": 70891, "epoch": 1687} {"train_loss": -6.033230304718018, "global_step": 70892, "epoch": 1687} {"train_loss": -6.000722885131836, "global_step": 70893, "epoch": 1687} {"train_loss": -6.040863037109375, "global_step": 70894, "epoch": 1687} {"train_loss": -6.04541107586452, "global_step": 70895, "epoch": 1687, "val_loss": 74558.9375} {"train_loss": -6.1431684494018555, "global_step": 70896, "epoch": 1688} {"train_loss": -6.106581211090088, "global_step": 70897, "epoch": 1688} {"train_loss": -6.099800109863281, "global_step": 70898, "epoch": 1688} {"train_loss": -6.017486572265625, "global_step": 70899, "epoch": 1688} {"train_loss": -5.919175148010254, "global_step": 70900, "epoch": 1688} {"train_loss": -6.013340473175049, "global_step": 70901, "epoch": 1688} {"train_loss": -6.028352737426758, "global_step": 70902, "epoch": 1688} {"train_loss": -5.990513801574707, "global_step": 70903, "epoch": 1688} {"train_loss": -5.968605995178223, "global_step": 70904, "epoch": 1688} {"train_loss": -5.8579301834106445, "global_step": 70905, "epoch": 1688} {"train_loss": -5.928437232971191, "global_step": 70906, "epoch": 1688} {"train_loss": -6.125267028808594, "global_step": 70907, "epoch": 1688} {"train_loss": -6.08343505859375, "global_step": 70908, "epoch": 1688} {"train_loss": -6.070775032043457, "global_step": 70909, "epoch": 1688} {"train_loss": -5.976367950439453, "global_step": 70910, "epoch": 1688} {"train_loss": -5.998908519744873, "global_step": 70911, "epoch": 1688} {"train_loss": -6.130334854125977, "global_step": 70912, "epoch": 1688} {"train_loss": -5.93350887298584, "global_step": 70913, "epoch": 1688} {"train_loss": -6.086540222167969, "global_step": 70914, "epoch": 1688} {"train_loss": -6.179698944091797, "global_step": 70915, "epoch": 1688} {"train_loss": -5.9087066650390625, "global_step": 70916, "epoch": 1688} {"train_loss": -6.029539108276367, "global_step": 70917, "epoch": 1688} {"train_loss": -6.019277572631836, "global_step": 70918, "epoch": 1688} {"train_loss": -6.024538040161133, "global_step": 70919, "epoch": 1688} {"train_loss": -5.965519905090332, "global_step": 70920, "epoch": 1688} {"train_loss": -6.184183120727539, "global_step": 70921, "epoch": 1688} {"train_loss": -5.990873336791992, "global_step": 70922, "epoch": 1688} {"train_loss": -5.956949234008789, "global_step": 70923, "epoch": 1688} {"train_loss": -5.942111968994141, "global_step": 70924, "epoch": 1688} {"train_loss": -5.999876976013184, "global_step": 70925, "epoch": 1688} {"train_loss": -5.986697673797607, "global_step": 70926, "epoch": 1688} {"train_loss": -5.899932384490967, "global_step": 70927, "epoch": 1688} {"train_loss": -5.87185525894165, "global_step": 70928, "epoch": 1688} {"train_loss": -5.918661117553711, "global_step": 70929, "epoch": 1688} {"train_loss": -5.925787448883057, "global_step": 70930, "epoch": 1688} {"train_loss": -6.050860404968262, "global_step": 70931, "epoch": 1688} {"train_loss": -5.917325496673584, "global_step": 70932, "epoch": 1688} {"train_loss": -6.040630340576172, "global_step": 70933, "epoch": 1688} {"train_loss": -6.008388996124268, "global_step": 70934, "epoch": 1688} {"train_loss": -6.039427757263184, "global_step": 70935, "epoch": 1688} {"train_loss": -6.125885486602783, "global_step": 70936, "epoch": 1688} {"train_loss": -6.012666270846412, "global_step": 70937, "epoch": 1688, "val_loss": 74727.8671875} {"train_loss": -6.06361198425293, "global_step": 70938, "epoch": 1689} {"train_loss": -6.122021198272705, "global_step": 70939, "epoch": 1689} {"train_loss": -6.143421173095703, "global_step": 70940, "epoch": 1689} {"train_loss": -5.994155406951904, "global_step": 70941, "epoch": 1689} {"train_loss": -6.067356586456299, "global_step": 70942, "epoch": 1689} {"train_loss": -6.004073143005371, "global_step": 70943, "epoch": 1689} {"train_loss": -6.045261859893799, "global_step": 70944, "epoch": 1689} {"train_loss": -6.096014022827148, "global_step": 70945, "epoch": 1689} {"train_loss": -6.049127578735352, "global_step": 70946, "epoch": 1689} {"train_loss": -6.119507312774658, "global_step": 70947, "epoch": 1689} {"train_loss": -6.069800853729248, "global_step": 70948, "epoch": 1689} {"train_loss": -6.168967247009277, "global_step": 70949, "epoch": 1689} {"train_loss": -6.102545738220215, "global_step": 70950, "epoch": 1689} {"train_loss": -5.950425624847412, "global_step": 70951, "epoch": 1689} {"train_loss": -5.996667385101318, "global_step": 70952, "epoch": 1689} {"train_loss": -5.91941499710083, "global_step": 70953, "epoch": 1689} {"train_loss": -6.132862091064453, "global_step": 70954, "epoch": 1689} {"train_loss": -5.967518329620361, "global_step": 70955, "epoch": 1689} {"train_loss": -5.980416774749756, "global_step": 70956, "epoch": 1689} {"train_loss": -6.096654891967773, "global_step": 70957, "epoch": 1689} {"train_loss": -6.007042407989502, "global_step": 70958, "epoch": 1689} {"train_loss": -6.047501564025879, "global_step": 70959, "epoch": 1689} {"train_loss": -5.98311710357666, "global_step": 70960, "epoch": 1689} {"train_loss": -5.987682819366455, "global_step": 70961, "epoch": 1689} {"train_loss": -6.011749744415283, "global_step": 70962, "epoch": 1689} {"train_loss": -6.129490852355957, "global_step": 70963, "epoch": 1689} {"train_loss": -6.16905403137207, "global_step": 70964, "epoch": 1689} {"train_loss": -6.015119552612305, "global_step": 70965, "epoch": 1689} {"train_loss": -5.887306213378906, "global_step": 70966, "epoch": 1689} {"train_loss": -6.15402889251709, "global_step": 70967, "epoch": 1689} {"train_loss": -6.112949371337891, "global_step": 70968, "epoch": 1689} {"train_loss": -5.983425140380859, "global_step": 70969, "epoch": 1689} {"train_loss": -5.988835334777832, "global_step": 70970, "epoch": 1689} {"train_loss": -6.003522872924805, "global_step": 70971, "epoch": 1689} {"train_loss": -5.916717529296875, "global_step": 70972, "epoch": 1689} {"train_loss": -6.009692192077637, "global_step": 70973, "epoch": 1689} {"train_loss": -5.992994785308838, "global_step": 70974, "epoch": 1689} {"train_loss": -5.947733402252197, "global_step": 70975, "epoch": 1689} {"train_loss": -6.130187034606934, "global_step": 70976, "epoch": 1689} {"train_loss": -6.01511287689209, "global_step": 70977, "epoch": 1689} {"train_loss": -5.955303192138672, "global_step": 70978, "epoch": 1689} {"train_loss": -6.035215025856381, "global_step": 70979, "epoch": 1689, "val_loss": 74977.71875} {"train_loss": -5.973441123962402, "global_step": 70980, "epoch": 1690} {"train_loss": -5.995772838592529, "global_step": 70981, "epoch": 1690} {"train_loss": -5.983452320098877, "global_step": 70982, "epoch": 1690} {"train_loss": -6.0364789962768555, "global_step": 70983, "epoch": 1690} {"train_loss": -5.952614784240723, "global_step": 70984, "epoch": 1690} {"train_loss": -5.997075080871582, "global_step": 70985, "epoch": 1690} {"train_loss": -6.049702167510986, "global_step": 70986, "epoch": 1690} {"train_loss": -5.975968360900879, "global_step": 70987, "epoch": 1690} {"train_loss": -6.009672164916992, "global_step": 70988, "epoch": 1690} {"train_loss": -6.031746864318848, "global_step": 70989, "epoch": 1690} {"train_loss": -5.928998947143555, "global_step": 70990, "epoch": 1690} {"train_loss": -6.039695739746094, "global_step": 70991, "epoch": 1690} {"train_loss": -6.010644435882568, "global_step": 70992, "epoch": 1690} {"train_loss": -6.020986557006836, "global_step": 70993, "epoch": 1690} {"train_loss": -6.012961387634277, "global_step": 70994, "epoch": 1690} {"train_loss": -6.117341995239258, "global_step": 70995, "epoch": 1690} {"train_loss": -5.981607437133789, "global_step": 70996, "epoch": 1690} {"train_loss": -6.082737922668457, "global_step": 70997, "epoch": 1690} {"train_loss": -6.035381317138672, "global_step": 70998, "epoch": 1690} {"train_loss": -6.031857490539551, "global_step": 70999, "epoch": 1690} {"train_loss": -5.981355667114258, "global_step": 71000, "epoch": 1690} {"train_loss": -6.126371383666992, "global_step": 71001, "epoch": 1690} {"train_loss": -6.014322280883789, "global_step": 71002, "epoch": 1690} {"train_loss": -6.015786170959473, "global_step": 71003, "epoch": 1690} {"train_loss": -6.028868675231934, "global_step": 71004, "epoch": 1690} {"train_loss": -5.981963634490967, "global_step": 71005, "epoch": 1690} {"train_loss": -6.035144329071045, "global_step": 71006, "epoch": 1690} {"train_loss": -6.043262481689453, "global_step": 71007, "epoch": 1690} {"train_loss": -6.035097122192383, "global_step": 71008, "epoch": 1690} {"train_loss": -6.017563819885254, "global_step": 71009, "epoch": 1690} {"train_loss": -5.9222092628479, "global_step": 71010, "epoch": 1690} {"train_loss": -6.051067352294922, "global_step": 71011, "epoch": 1690} {"train_loss": -6.13658332824707, "global_step": 71012, "epoch": 1690} {"train_loss": -6.008890151977539, "global_step": 71013, "epoch": 1690} {"train_loss": -6.147797107696533, "global_step": 71014, "epoch": 1690} {"train_loss": -6.074522495269775, "global_step": 71015, "epoch": 1690} {"train_loss": -6.069513320922852, "global_step": 71016, "epoch": 1690} {"train_loss": -6.039328575134277, "global_step": 71017, "epoch": 1690} {"train_loss": -6.011685371398926, "global_step": 71018, "epoch": 1690} {"train_loss": -6.109933376312256, "global_step": 71019, "epoch": 1690} {"train_loss": -6.017778396606445, "global_step": 71020, "epoch": 1690} {"train_loss": -6.026269265583584, "global_step": 71021, "epoch": 1690, "val_loss": 74591.765625} {"train_loss": -6.121542930603027, "global_step": 71022, "epoch": 1691} {"train_loss": -6.062570571899414, "global_step": 71023, "epoch": 1691} {"train_loss": -5.969112396240234, "global_step": 71024, "epoch": 1691} {"train_loss": -6.033974647521973, "global_step": 71025, "epoch": 1691} {"train_loss": -6.121824264526367, "global_step": 71026, "epoch": 1691} {"train_loss": -5.975099563598633, "global_step": 71027, "epoch": 1691} {"train_loss": -6.080961227416992, "global_step": 71028, "epoch": 1691} {"train_loss": -6.0884294509887695, "global_step": 71029, "epoch": 1691} {"train_loss": -6.169233322143555, "global_step": 71030, "epoch": 1691} {"train_loss": -6.014508247375488, "global_step": 71031, "epoch": 1691} {"train_loss": -6.011294841766357, "global_step": 71032, "epoch": 1691} {"train_loss": -6.000030517578125, "global_step": 71033, "epoch": 1691} {"train_loss": -6.117358207702637, "global_step": 71034, "epoch": 1691} {"train_loss": -6.121237277984619, "global_step": 71035, "epoch": 1691} {"train_loss": -6.220337390899658, "global_step": 71036, "epoch": 1691} {"train_loss": -6.006957530975342, "global_step": 71037, "epoch": 1691} {"train_loss": -6.141094207763672, "global_step": 71038, "epoch": 1691} {"train_loss": -6.068212032318115, "global_step": 71039, "epoch": 1691} {"train_loss": -6.119237899780273, "global_step": 71040, "epoch": 1691} {"train_loss": -5.952507019042969, "global_step": 71041, "epoch": 1691} {"train_loss": -6.031406402587891, "global_step": 71042, "epoch": 1691} {"train_loss": -5.972921848297119, "global_step": 71043, "epoch": 1691} {"train_loss": -5.99693489074707, "global_step": 71044, "epoch": 1691} {"train_loss": -6.127762317657471, "global_step": 71045, "epoch": 1691} {"train_loss": -5.934226036071777, "global_step": 71046, "epoch": 1691} {"train_loss": -6.11656379699707, "global_step": 71047, "epoch": 1691} {"train_loss": -6.014867782592773, "global_step": 71048, "epoch": 1691} {"train_loss": -6.075736999511719, "global_step": 71049, "epoch": 1691} {"train_loss": -6.023082733154297, "global_step": 71050, "epoch": 1691} {"train_loss": -6.074725151062012, "global_step": 71051, "epoch": 1691} {"train_loss": -6.003798007965088, "global_step": 71052, "epoch": 1691} {"train_loss": -6.079613208770752, "global_step": 71053, "epoch": 1691} {"train_loss": -6.067038059234619, "global_step": 71054, "epoch": 1691} {"train_loss": -6.035778999328613, "global_step": 71055, "epoch": 1691} {"train_loss": -6.109508037567139, "global_step": 71056, "epoch": 1691} {"train_loss": -6.021601676940918, "global_step": 71057, "epoch": 1691} {"train_loss": -6.074481964111328, "global_step": 71058, "epoch": 1691} {"train_loss": -6.020063877105713, "global_step": 71059, "epoch": 1691} {"train_loss": -6.061134338378906, "global_step": 71060, "epoch": 1691} {"train_loss": -6.021461486816406, "global_step": 71061, "epoch": 1691} {"train_loss": -6.1230974197387695, "global_step": 71062, "epoch": 1691} {"train_loss": -6.060212203434536, "global_step": 71063, "epoch": 1691, "val_loss": 74716.6640625} {"train_loss": -6.12300443649292, "global_step": 71064, "epoch": 1692} {"train_loss": -5.960144519805908, "global_step": 71065, "epoch": 1692} {"train_loss": -6.163532257080078, "global_step": 71066, "epoch": 1692} {"train_loss": -6.168445110321045, "global_step": 71067, "epoch": 1692} {"train_loss": -6.108668327331543, "global_step": 71068, "epoch": 1692} {"train_loss": -5.904717445373535, "global_step": 71069, "epoch": 1692} {"train_loss": -6.098503112792969, "global_step": 71070, "epoch": 1692} {"train_loss": -5.961179733276367, "global_step": 71071, "epoch": 1692} {"train_loss": -6.165550231933594, "global_step": 71072, "epoch": 1692} {"train_loss": -6.039425849914551, "global_step": 71073, "epoch": 1692} {"train_loss": -6.1973772048950195, "global_step": 71074, "epoch": 1692} {"train_loss": -6.024125576019287, "global_step": 71075, "epoch": 1692} {"train_loss": -6.026867866516113, "global_step": 71076, "epoch": 1692} {"train_loss": -6.116082668304443, "global_step": 71077, "epoch": 1692} {"train_loss": -5.994495868682861, "global_step": 71078, "epoch": 1692} {"train_loss": -6.100035667419434, "global_step": 71079, "epoch": 1692} {"train_loss": -6.121618747711182, "global_step": 71080, "epoch": 1692} {"train_loss": -6.058472633361816, "global_step": 71081, "epoch": 1692} {"train_loss": -5.932134628295898, "global_step": 71082, "epoch": 1692} {"train_loss": -6.031176567077637, "global_step": 71083, "epoch": 1692} {"train_loss": -5.987843036651611, "global_step": 71084, "epoch": 1692} {"train_loss": -5.92091178894043, "global_step": 71085, "epoch": 1692} {"train_loss": -6.117074966430664, "global_step": 71086, "epoch": 1692} {"train_loss": -5.885948181152344, "global_step": 71087, "epoch": 1692} {"train_loss": -5.828525543212891, "global_step": 71088, "epoch": 1692} {"train_loss": -6.062780380249023, "global_step": 71089, "epoch": 1692} {"train_loss": -5.987854480743408, "global_step": 71090, "epoch": 1692} {"train_loss": -6.0358357429504395, "global_step": 71091, "epoch": 1692} {"train_loss": -6.038088798522949, "global_step": 71092, "epoch": 1692} {"train_loss": -5.978466510772705, "global_step": 71093, "epoch": 1692} {"train_loss": -6.036270618438721, "global_step": 71094, "epoch": 1692} {"train_loss": -6.047203540802002, "global_step": 71095, "epoch": 1692} {"train_loss": -6.050409317016602, "global_step": 71096, "epoch": 1692} {"train_loss": -6.012819290161133, "global_step": 71097, "epoch": 1692} {"train_loss": -5.927048206329346, "global_step": 71098, "epoch": 1692} {"train_loss": -5.886002540588379, "global_step": 71099, "epoch": 1692} {"train_loss": -6.090505123138428, "global_step": 71100, "epoch": 1692} {"train_loss": -5.931285381317139, "global_step": 71101, "epoch": 1692} {"train_loss": -6.027772903442383, "global_step": 71102, "epoch": 1692} {"train_loss": -6.0388898849487305, "global_step": 71103, "epoch": 1692} {"train_loss": -5.967741966247559, "global_step": 71104, "epoch": 1692} {"train_loss": -6.027959880374727, "global_step": 71105, "epoch": 1692, "val_loss": 74935.5625} {"train_loss": -6.0497331619262695, "global_step": 71106, "epoch": 1693} {"train_loss": -6.143216609954834, "global_step": 71107, "epoch": 1693} {"train_loss": -6.080196380615234, "global_step": 71108, "epoch": 1693} {"train_loss": -6.059868335723877, "global_step": 71109, "epoch": 1693} {"train_loss": -6.127280235290527, "global_step": 71110, "epoch": 1693} {"train_loss": -5.9947190284729, "global_step": 71111, "epoch": 1693} {"train_loss": -6.059849739074707, "global_step": 71112, "epoch": 1693} {"train_loss": -5.892620086669922, "global_step": 71113, "epoch": 1693} {"train_loss": -6.142223358154297, "global_step": 71114, "epoch": 1693} {"train_loss": -5.966078758239746, "global_step": 71115, "epoch": 1693} {"train_loss": -6.1448163986206055, "global_step": 71116, "epoch": 1693} {"train_loss": -6.058593273162842, "global_step": 71117, "epoch": 1693} {"train_loss": -5.995173454284668, "global_step": 71118, "epoch": 1693} {"train_loss": -6.13147497177124, "global_step": 71119, "epoch": 1693} {"train_loss": -6.026447296142578, "global_step": 71120, "epoch": 1693} {"train_loss": -5.9076151847839355, "global_step": 71121, "epoch": 1693} {"train_loss": -6.092527866363525, "global_step": 71122, "epoch": 1693} {"train_loss": -6.044696807861328, "global_step": 71123, "epoch": 1693} {"train_loss": -5.977424621582031, "global_step": 71124, "epoch": 1693} {"train_loss": -6.0252227783203125, "global_step": 71125, "epoch": 1693} {"train_loss": -5.991551399230957, "global_step": 71126, "epoch": 1693} {"train_loss": -6.067261695861816, "global_step": 71127, "epoch": 1693} {"train_loss": -5.899084091186523, "global_step": 71128, "epoch": 1693} {"train_loss": -6.034480094909668, "global_step": 71129, "epoch": 1693} {"train_loss": -5.967604637145996, "global_step": 71130, "epoch": 1693} {"train_loss": -5.94801664352417, "global_step": 71131, "epoch": 1693} {"train_loss": -6.0213847160339355, "global_step": 71132, "epoch": 1693} {"train_loss": -5.929087162017822, "global_step": 71133, "epoch": 1693} {"train_loss": -6.052814960479736, "global_step": 71134, "epoch": 1693} {"train_loss": -5.984940528869629, "global_step": 71135, "epoch": 1693} {"train_loss": -5.982577323913574, "global_step": 71136, "epoch": 1693} {"train_loss": -6.010714530944824, "global_step": 71137, "epoch": 1693} {"train_loss": -6.009696960449219, "global_step": 71138, "epoch": 1693} {"train_loss": -6.033287048339844, "global_step": 71139, "epoch": 1693} {"train_loss": -6.022526264190674, "global_step": 71140, "epoch": 1693} {"train_loss": -6.032340049743652, "global_step": 71141, "epoch": 1693} {"train_loss": -5.956589221954346, "global_step": 71142, "epoch": 1693} {"train_loss": -6.107559680938721, "global_step": 71143, "epoch": 1693} {"train_loss": -5.945961952209473, "global_step": 71144, "epoch": 1693} {"train_loss": -6.067413330078125, "global_step": 71145, "epoch": 1693} {"train_loss": -6.109711647033691, "global_step": 71146, "epoch": 1693} {"train_loss": -6.0264944689614435, "global_step": 71147, "epoch": 1693, "val_loss": 74714.90625} {"train_loss": -5.969847679138184, "global_step": 71148, "epoch": 1694} {"train_loss": -6.123283386230469, "global_step": 71149, "epoch": 1694} {"train_loss": -6.074665069580078, "global_step": 71150, "epoch": 1694} {"train_loss": -6.137533187866211, "global_step": 71151, "epoch": 1694} {"train_loss": -5.955015182495117, "global_step": 71152, "epoch": 1694} {"train_loss": -6.045026779174805, "global_step": 71153, "epoch": 1694} {"train_loss": -6.218674182891846, "global_step": 71154, "epoch": 1694} {"train_loss": -5.9742655754089355, "global_step": 71155, "epoch": 1694} {"train_loss": -5.974457740783691, "global_step": 71156, "epoch": 1694} {"train_loss": -6.034692287445068, "global_step": 71157, "epoch": 1694} {"train_loss": -6.067303657531738, "global_step": 71158, "epoch": 1694} {"train_loss": -5.977234840393066, "global_step": 71159, "epoch": 1694} {"train_loss": -6.0114665031433105, "global_step": 71160, "epoch": 1694} {"train_loss": -6.083378791809082, "global_step": 71161, "epoch": 1694} {"train_loss": -5.958384990692139, "global_step": 71162, "epoch": 1694} {"train_loss": -6.028534412384033, "global_step": 71163, "epoch": 1694} {"train_loss": -6.040247440338135, "global_step": 71164, "epoch": 1694} {"train_loss": -6.000543117523193, "global_step": 71165, "epoch": 1694} {"train_loss": -5.990744113922119, "global_step": 71166, "epoch": 1694} {"train_loss": -5.942934989929199, "global_step": 71167, "epoch": 1694} {"train_loss": -5.966402053833008, "global_step": 71168, "epoch": 1694} {"train_loss": -6.00849723815918, "global_step": 71169, "epoch": 1694} {"train_loss": -5.8859543800354, "global_step": 71170, "epoch": 1694} {"train_loss": -6.01468563079834, "global_step": 71171, "epoch": 1694} {"train_loss": -5.968925952911377, "global_step": 71172, "epoch": 1694} {"train_loss": -6.018360137939453, "global_step": 71173, "epoch": 1694} {"train_loss": -5.991033554077148, "global_step": 71174, "epoch": 1694} {"train_loss": -6.037506103515625, "global_step": 71175, "epoch": 1694} {"train_loss": -5.969485282897949, "global_step": 71176, "epoch": 1694} {"train_loss": -6.10001277923584, "global_step": 71177, "epoch": 1694} {"train_loss": -6.002933979034424, "global_step": 71178, "epoch": 1694} {"train_loss": -6.114190101623535, "global_step": 71179, "epoch": 1694} {"train_loss": -6.074912071228027, "global_step": 71180, "epoch": 1694} {"train_loss": -6.09782600402832, "global_step": 71181, "epoch": 1694} {"train_loss": -6.0123114585876465, "global_step": 71182, "epoch": 1694} {"train_loss": -5.959043025970459, "global_step": 71183, "epoch": 1694} {"train_loss": -6.183373928070068, "global_step": 71184, "epoch": 1694} {"train_loss": -6.053524017333984, "global_step": 71185, "epoch": 1694} {"train_loss": -5.840026378631592, "global_step": 71186, "epoch": 1694} {"train_loss": -5.989485740661621, "global_step": 71187, "epoch": 1694} {"train_loss": -5.963174819946289, "global_step": 71188, "epoch": 1694} {"train_loss": -6.019963196345738, "global_step": 71189, "epoch": 1694, "val_loss": 74922.8125} {"train_loss": -5.9763593673706055, "global_step": 71190, "epoch": 1695} {"train_loss": -6.073460578918457, "global_step": 71191, "epoch": 1695} {"train_loss": -5.934218406677246, "global_step": 71192, "epoch": 1695} {"train_loss": -6.157279968261719, "global_step": 71193, "epoch": 1695} {"train_loss": -6.017159938812256, "global_step": 71194, "epoch": 1695} {"train_loss": -5.934059143066406, "global_step": 71195, "epoch": 1695} {"train_loss": -6.018943786621094, "global_step": 71196, "epoch": 1695} {"train_loss": -5.988049507141113, "global_step": 71197, "epoch": 1695} {"train_loss": -6.078953742980957, "global_step": 71198, "epoch": 1695} {"train_loss": -5.939969062805176, "global_step": 71199, "epoch": 1695} {"train_loss": -6.037393569946289, "global_step": 71200, "epoch": 1695} {"train_loss": -6.136897087097168, "global_step": 71201, "epoch": 1695} {"train_loss": -5.956490516662598, "global_step": 71202, "epoch": 1695} {"train_loss": -6.086369514465332, "global_step": 71203, "epoch": 1695} {"train_loss": -5.899703025817871, "global_step": 71204, "epoch": 1695} {"train_loss": -5.973154544830322, "global_step": 71205, "epoch": 1695} {"train_loss": -5.956856727600098, "global_step": 71206, "epoch": 1695} {"train_loss": -5.99874210357666, "global_step": 71207, "epoch": 1695} {"train_loss": -6.06565523147583, "global_step": 71208, "epoch": 1695} {"train_loss": -6.011219501495361, "global_step": 71209, "epoch": 1695} {"train_loss": -6.041147232055664, "global_step": 71210, "epoch": 1695} {"train_loss": -6.104598045349121, "global_step": 71211, "epoch": 1695} {"train_loss": -6.006945610046387, "global_step": 71212, "epoch": 1695} {"train_loss": -6.102761268615723, "global_step": 71213, "epoch": 1695} {"train_loss": -5.963651180267334, "global_step": 71214, "epoch": 1695} {"train_loss": -5.910798072814941, "global_step": 71215, "epoch": 1695} {"train_loss": -5.976520538330078, "global_step": 71216, "epoch": 1695} {"train_loss": -6.138423442840576, "global_step": 71217, "epoch": 1695} {"train_loss": -5.929032802581787, "global_step": 71218, "epoch": 1695} {"train_loss": -5.968217849731445, "global_step": 71219, "epoch": 1695} {"train_loss": -6.121776580810547, "global_step": 71220, "epoch": 1695} {"train_loss": -6.189809799194336, "global_step": 71221, "epoch": 1695} {"train_loss": -5.9755859375, "global_step": 71222, "epoch": 1695} {"train_loss": -6.023581504821777, "global_step": 71223, "epoch": 1695} {"train_loss": -6.142829895019531, "global_step": 71224, "epoch": 1695} {"train_loss": -5.8726277351379395, "global_step": 71225, "epoch": 1695} {"train_loss": -6.022732734680176, "global_step": 71226, "epoch": 1695} {"train_loss": -6.0131354331970215, "global_step": 71227, "epoch": 1695} {"train_loss": -5.884859085083008, "global_step": 71228, "epoch": 1695} {"train_loss": -5.90567684173584, "global_step": 71229, "epoch": 1695} {"train_loss": -5.953507423400879, "global_step": 71230, "epoch": 1695} {"train_loss": -6.010089431490217, "global_step": 71231, "epoch": 1695, "val_loss": 74797.3515625} {"train_loss": -6.043747901916504, "global_step": 71232, "epoch": 1696} {"train_loss": -5.88087272644043, "global_step": 71233, "epoch": 1696} {"train_loss": -5.970822334289551, "global_step": 71234, "epoch": 1696} {"train_loss": -5.853200912475586, "global_step": 71235, "epoch": 1696} {"train_loss": -6.005789756774902, "global_step": 71236, "epoch": 1696} {"train_loss": -5.9903764724731445, "global_step": 71237, "epoch": 1696} {"train_loss": -5.984684944152832, "global_step": 71238, "epoch": 1696} {"train_loss": -6.017541408538818, "global_step": 71239, "epoch": 1696} {"train_loss": -5.939607620239258, "global_step": 71240, "epoch": 1696} {"train_loss": -6.067272663116455, "global_step": 71241, "epoch": 1696} {"train_loss": -6.05721378326416, "global_step": 71242, "epoch": 1696} {"train_loss": -6.088133335113525, "global_step": 71243, "epoch": 1696} {"train_loss": -5.9753499031066895, "global_step": 71244, "epoch": 1696} {"train_loss": -5.807157516479492, "global_step": 71245, "epoch": 1696} {"train_loss": -5.942916393280029, "global_step": 71246, "epoch": 1696} {"train_loss": -6.0357866287231445, "global_step": 71247, "epoch": 1696} {"train_loss": -6.105132579803467, "global_step": 71248, "epoch": 1696} {"train_loss": -5.933782577514648, "global_step": 71249, "epoch": 1696} {"train_loss": -6.024020195007324, "global_step": 71250, "epoch": 1696} {"train_loss": -5.969986438751221, "global_step": 71251, "epoch": 1696} {"train_loss": -5.888688087463379, "global_step": 71252, "epoch": 1696} {"train_loss": -6.0997772216796875, "global_step": 71253, "epoch": 1696} {"train_loss": -5.996180534362793, "global_step": 71254, "epoch": 1696} {"train_loss": -5.973264217376709, "global_step": 71255, "epoch": 1696} {"train_loss": -5.925168037414551, "global_step": 71256, "epoch": 1696} {"train_loss": -5.985285758972168, "global_step": 71257, "epoch": 1696} {"train_loss": -5.889270782470703, "global_step": 71258, "epoch": 1696} {"train_loss": -6.0257158279418945, "global_step": 71259, "epoch": 1696} {"train_loss": -6.0668439865112305, "global_step": 71260, "epoch": 1696} {"train_loss": -5.965530872344971, "global_step": 71261, "epoch": 1696} {"train_loss": -6.105821132659912, "global_step": 71262, "epoch": 1696} {"train_loss": -6.005093574523926, "global_step": 71263, "epoch": 1696} {"train_loss": -6.118179798126221, "global_step": 71264, "epoch": 1696} {"train_loss": -6.062150001525879, "global_step": 71265, "epoch": 1696} {"train_loss": -6.053257465362549, "global_step": 71266, "epoch": 1696} {"train_loss": -5.864405155181885, "global_step": 71267, "epoch": 1696} {"train_loss": -6.050497055053711, "global_step": 71268, "epoch": 1696} {"train_loss": -6.023336887359619, "global_step": 71269, "epoch": 1696} {"train_loss": -5.976633071899414, "global_step": 71270, "epoch": 1696} {"train_loss": -6.138594627380371, "global_step": 71271, "epoch": 1696} {"train_loss": -5.989243507385254, "global_step": 71272, "epoch": 1696} {"train_loss": -5.996764955066499, "global_step": 71273, "epoch": 1696, "val_loss": 74943.03125} {"train_loss": -6.026360511779785, "global_step": 71274, "epoch": 1697} {"train_loss": -5.9520673751831055, "global_step": 71275, "epoch": 1697} {"train_loss": -6.026839256286621, "global_step": 71276, "epoch": 1697} {"train_loss": -6.082521915435791, "global_step": 71277, "epoch": 1697} {"train_loss": -5.960353851318359, "global_step": 71278, "epoch": 1697} {"train_loss": -5.928842067718506, "global_step": 71279, "epoch": 1697} {"train_loss": -6.0902814865112305, "global_step": 71280, "epoch": 1697} {"train_loss": -5.992125034332275, "global_step": 71281, "epoch": 1697} {"train_loss": -6.083034038543701, "global_step": 71282, "epoch": 1697} {"train_loss": -6.116239070892334, "global_step": 71283, "epoch": 1697} {"train_loss": -6.042008399963379, "global_step": 71284, "epoch": 1697} {"train_loss": -6.039117813110352, "global_step": 71285, "epoch": 1697} {"train_loss": -6.047214984893799, "global_step": 71286, "epoch": 1697} {"train_loss": -5.921674728393555, "global_step": 71287, "epoch": 1697} {"train_loss": -5.922684192657471, "global_step": 71288, "epoch": 1697} {"train_loss": -6.0507659912109375, "global_step": 71289, "epoch": 1697} {"train_loss": -5.966054916381836, "global_step": 71290, "epoch": 1697} {"train_loss": -5.910684585571289, "global_step": 71291, "epoch": 1697} {"train_loss": -6.03851318359375, "global_step": 71292, "epoch": 1697} {"train_loss": -5.8234968185424805, "global_step": 71293, "epoch": 1697} {"train_loss": -6.090371131896973, "global_step": 71294, "epoch": 1697} {"train_loss": -6.037832260131836, "global_step": 71295, "epoch": 1697} {"train_loss": -5.818094730377197, "global_step": 71296, "epoch": 1697} {"train_loss": -6.091035842895508, "global_step": 71297, "epoch": 1697} {"train_loss": -5.77851676940918, "global_step": 71298, "epoch": 1697} {"train_loss": -6.091500282287598, "global_step": 71299, "epoch": 1697} {"train_loss": -5.927407741546631, "global_step": 71300, "epoch": 1697} {"train_loss": -5.955615520477295, "global_step": 71301, "epoch": 1697} {"train_loss": -5.912858009338379, "global_step": 71302, "epoch": 1697} {"train_loss": -6.067935943603516, "global_step": 71303, "epoch": 1697} {"train_loss": -5.954366683959961, "global_step": 71304, "epoch": 1697} {"train_loss": -5.998234272003174, "global_step": 71305, "epoch": 1697} {"train_loss": -6.014820575714111, "global_step": 71306, "epoch": 1697} {"train_loss": -5.907522201538086, "global_step": 71307, "epoch": 1697} {"train_loss": -6.026861190795898, "global_step": 71308, "epoch": 1697} {"train_loss": -5.989954948425293, "global_step": 71309, "epoch": 1697} {"train_loss": -6.061923980712891, "global_step": 71310, "epoch": 1697} {"train_loss": -6.021181583404541, "global_step": 71311, "epoch": 1697} {"train_loss": -5.920260429382324, "global_step": 71312, "epoch": 1697} {"train_loss": -6.044630527496338, "global_step": 71313, "epoch": 1697} {"train_loss": -5.898754119873047, "global_step": 71314, "epoch": 1697} {"train_loss": -5.9906173206511, "global_step": 71315, "epoch": 1697, "val_loss": 74804.15625} {"train_loss": -6.039159774780273, "global_step": 71316, "epoch": 1698} {"train_loss": -6.007542610168457, "global_step": 71317, "epoch": 1698} {"train_loss": -6.031144142150879, "global_step": 71318, "epoch": 1698} {"train_loss": -6.015949249267578, "global_step": 71319, "epoch": 1698} {"train_loss": -5.9252543449401855, "global_step": 71320, "epoch": 1698} {"train_loss": -6.010952949523926, "global_step": 71321, "epoch": 1698} {"train_loss": -6.135479927062988, "global_step": 71322, "epoch": 1698} {"train_loss": -5.966475009918213, "global_step": 71323, "epoch": 1698} {"train_loss": -6.0726728439331055, "global_step": 71324, "epoch": 1698} {"train_loss": -6.020331859588623, "global_step": 71325, "epoch": 1698} {"train_loss": -6.046958923339844, "global_step": 71326, "epoch": 1698} {"train_loss": -5.917665004730225, "global_step": 71327, "epoch": 1698} {"train_loss": -6.119688987731934, "global_step": 71328, "epoch": 1698} {"train_loss": -6.065366744995117, "global_step": 71329, "epoch": 1698} {"train_loss": -5.995545387268066, "global_step": 71330, "epoch": 1698} {"train_loss": -6.091188430786133, "global_step": 71331, "epoch": 1698} {"train_loss": -5.966383934020996, "global_step": 71332, "epoch": 1698} {"train_loss": -6.074289321899414, "global_step": 71333, "epoch": 1698} {"train_loss": -5.889886856079102, "global_step": 71334, "epoch": 1698} {"train_loss": -5.990599632263184, "global_step": 71335, "epoch": 1698} {"train_loss": -6.034795761108398, "global_step": 71336, "epoch": 1698} {"train_loss": -6.091094970703125, "global_step": 71337, "epoch": 1698} {"train_loss": -6.0386271476745605, "global_step": 71338, "epoch": 1698} {"train_loss": -5.894493103027344, "global_step": 71339, "epoch": 1698} {"train_loss": -6.083051681518555, "global_step": 71340, "epoch": 1698} {"train_loss": -5.8918962478637695, "global_step": 71341, "epoch": 1698} {"train_loss": -5.9629926681518555, "global_step": 71342, "epoch": 1698} {"train_loss": -6.002744197845459, "global_step": 71343, "epoch": 1698} {"train_loss": -5.958505153656006, "global_step": 71344, "epoch": 1698} {"train_loss": -5.960646152496338, "global_step": 71345, "epoch": 1698} {"train_loss": -5.931836128234863, "global_step": 71346, "epoch": 1698} {"train_loss": -6.048976898193359, "global_step": 71347, "epoch": 1698} {"train_loss": -5.894247531890869, "global_step": 71348, "epoch": 1698} {"train_loss": -5.929049491882324, "global_step": 71349, "epoch": 1698} {"train_loss": -6.046398639678955, "global_step": 71350, "epoch": 1698} {"train_loss": -6.035381317138672, "global_step": 71351, "epoch": 1698} {"train_loss": -5.952788352966309, "global_step": 71352, "epoch": 1698} {"train_loss": -6.088397979736328, "global_step": 71353, "epoch": 1698} {"train_loss": -6.037524223327637, "global_step": 71354, "epoch": 1698} {"train_loss": -6.124175548553467, "global_step": 71355, "epoch": 1698} {"train_loss": -6.026516914367676, "global_step": 71356, "epoch": 1698} {"train_loss": -6.011975753875006, "global_step": 71357, "epoch": 1698, "val_loss": 74729.1484375} {"train_loss": -5.993570804595947, "global_step": 71358, "epoch": 1699} {"train_loss": -5.928062438964844, "global_step": 71359, "epoch": 1699} {"train_loss": -5.955101490020752, "global_step": 71360, "epoch": 1699} {"train_loss": -5.913421630859375, "global_step": 71361, "epoch": 1699} {"train_loss": -5.978063106536865, "global_step": 71362, "epoch": 1699} {"train_loss": -6.040322303771973, "global_step": 71363, "epoch": 1699} {"train_loss": -5.9726457595825195, "global_step": 71364, "epoch": 1699} {"train_loss": -6.063605785369873, "global_step": 71365, "epoch": 1699} {"train_loss": -6.040300369262695, "global_step": 71366, "epoch": 1699} {"train_loss": -5.937978267669678, "global_step": 71367, "epoch": 1699} {"train_loss": -6.0875067710876465, "global_step": 71368, "epoch": 1699} {"train_loss": -5.90739631652832, "global_step": 71369, "epoch": 1699} {"train_loss": -6.004098892211914, "global_step": 71370, "epoch": 1699} {"train_loss": -5.940879821777344, "global_step": 71371, "epoch": 1699} {"train_loss": -5.851151466369629, "global_step": 71372, "epoch": 1699} {"train_loss": -6.108625411987305, "global_step": 71373, "epoch": 1699} {"train_loss": -5.9623260498046875, "global_step": 71374, "epoch": 1699} {"train_loss": -6.01876163482666, "global_step": 71375, "epoch": 1699} {"train_loss": -5.954501152038574, "global_step": 71376, "epoch": 1699} {"train_loss": -6.073770523071289, "global_step": 71377, "epoch": 1699} {"train_loss": -6.051907539367676, "global_step": 71378, "epoch": 1699} {"train_loss": -5.90287971496582, "global_step": 71379, "epoch": 1699} {"train_loss": -5.913949012756348, "global_step": 71380, "epoch": 1699} {"train_loss": -5.956981658935547, "global_step": 71381, "epoch": 1699} {"train_loss": -5.898210048675537, "global_step": 71382, "epoch": 1699} {"train_loss": -6.026047706604004, "global_step": 71383, "epoch": 1699} {"train_loss": -6.023918628692627, "global_step": 71384, "epoch": 1699} {"train_loss": -5.8908371925354, "global_step": 71385, "epoch": 1699} {"train_loss": -6.048519134521484, "global_step": 71386, "epoch": 1699} {"train_loss": -5.991281509399414, "global_step": 71387, "epoch": 1699} {"train_loss": -6.037239074707031, "global_step": 71388, "epoch": 1699} {"train_loss": -6.069575309753418, "global_step": 71389, "epoch": 1699} {"train_loss": -5.882818222045898, "global_step": 71390, "epoch": 1699} {"train_loss": -5.995204925537109, "global_step": 71391, "epoch": 1699} {"train_loss": -6.021178245544434, "global_step": 71392, "epoch": 1699} {"train_loss": -6.136476993560791, "global_step": 71393, "epoch": 1699} {"train_loss": -5.936923980712891, "global_step": 71394, "epoch": 1699} {"train_loss": -6.136687278747559, "global_step": 71395, "epoch": 1699} {"train_loss": -6.0458550453186035, "global_step": 71396, "epoch": 1699} {"train_loss": -6.080893039703369, "global_step": 71397, "epoch": 1699} {"train_loss": -6.067180633544922, "global_step": 71398, "epoch": 1699} {"train_loss": -5.9969334829421275, "global_step": 71399, "epoch": 1699, "val_loss": 74861.7734375} {"train_loss": -6.144039154052734, "global_step": 71400, "epoch": 1700} {"train_loss": -6.048790454864502, "global_step": 71401, "epoch": 1700} {"train_loss": -6.076447486877441, "global_step": 71402, "epoch": 1700} {"train_loss": -6.092372894287109, "global_step": 71403, "epoch": 1700} {"train_loss": -5.998445510864258, "global_step": 71404, "epoch": 1700} {"train_loss": -6.1629533767700195, "global_step": 71405, "epoch": 1700} {"train_loss": -6.088534832000732, "global_step": 71406, "epoch": 1700} {"train_loss": -5.989690780639648, "global_step": 71407, "epoch": 1700} {"train_loss": -5.907154083251953, "global_step": 71408, "epoch": 1700} {"train_loss": -6.109910488128662, "global_step": 71409, "epoch": 1700} {"train_loss": -6.077065467834473, "global_step": 71410, "epoch": 1700} {"train_loss": -6.025346755981445, "global_step": 71411, "epoch": 1700} {"train_loss": -6.072612762451172, "global_step": 71412, "epoch": 1700} {"train_loss": -6.106223106384277, "global_step": 71413, "epoch": 1700} {"train_loss": -5.9339704513549805, "global_step": 71414, "epoch": 1700} {"train_loss": -6.011274337768555, "global_step": 71415, "epoch": 1700} {"train_loss": -6.023812770843506, "global_step": 71416, "epoch": 1700} {"train_loss": -6.193910598754883, "global_step": 71417, "epoch": 1700} {"train_loss": -6.082868576049805, "global_step": 71418, "epoch": 1700} {"train_loss": -5.99839973449707, "global_step": 71419, "epoch": 1700} {"train_loss": -6.144585132598877, "global_step": 71420, "epoch": 1700} {"train_loss": -5.983273506164551, "global_step": 71421, "epoch": 1700} {"train_loss": -6.201994895935059, "global_step": 71422, "epoch": 1700} {"train_loss": -6.061639785766602, "global_step": 71423, "epoch": 1700} {"train_loss": -6.126690864562988, "global_step": 71424, "epoch": 1700} {"train_loss": -6.019773483276367, "global_step": 71425, "epoch": 1700} {"train_loss": -6.0271687507629395, "global_step": 71426, "epoch": 1700} {"train_loss": -5.99777889251709, "global_step": 71427, "epoch": 1700} {"train_loss": -5.954434394836426, "global_step": 71428, "epoch": 1700} {"train_loss": -6.171995162963867, "global_step": 71429, "epoch": 1700} {"train_loss": -6.058413982391357, "global_step": 71430, "epoch": 1700} {"train_loss": -6.104167938232422, "global_step": 71431, "epoch": 1700} {"train_loss": -5.951563358306885, "global_step": 71432, "epoch": 1700} {"train_loss": -5.898133277893066, "global_step": 71433, "epoch": 1700} {"train_loss": -5.942285537719727, "global_step": 71434, "epoch": 1700} {"train_loss": -6.036786079406738, "global_step": 71435, "epoch": 1700} {"train_loss": -5.861939430236816, "global_step": 71436, "epoch": 1700} {"train_loss": -6.170029640197754, "global_step": 71437, "epoch": 1700} {"train_loss": -6.078310966491699, "global_step": 71438, "epoch": 1700} {"train_loss": -6.061872482299805, "global_step": 71439, "epoch": 1700} {"train_loss": -5.973384857177734, "global_step": 71440, "epoch": 1700} {"train_loss": -6.048562855947585, "global_step": 71441, "epoch": 1700, "train/sim_max_reward_0": 0.36420011130853497, "train/sim_max_reward_1": 0.9314995060674124, "train/sim_max_reward_2": 0.2812965594058186, "train/sim_max_reward_3": 0.13484814711600124, "train/sim_max_reward_4": 0.8134670402003334, "train/sim_max_reward_5": 0.8538470296289974, "test/sim_max_reward_4500000": 0.6825207968102367, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8596502496759101, "test/sim_max_reward_4500003": 0.9291497169693532, "test/sim_max_reward_4500004": 0.10991309832895638, "test/sim_max_reward_4500005": 0.8309322575637279, "test/sim_max_reward_4500006": 0.941843934543834, "test/sim_max_reward_4500007": 0.9808365497088156, "test/sim_max_reward_4500008": 0.22515340470678114, "test/sim_max_reward_4500009": 0.8970756791889496, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.4014812079983256, "test/sim_max_reward_4500012": 0.8969543276678846, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.965245889308137, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.11846567385920166, "test/sim_max_reward_4500018": 0.07535742106120681, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.771847600270089, "test/sim_max_reward_4500022": 0.8364667529668564, "test/sim_max_reward_4500023": 0.8153900122371298, "test/sim_max_reward_4500024": 0.9553908684103996, "test/sim_max_reward_4500025": 0.4286959421942725, "test/sim_max_reward_4500026": 0.8515847076832727, "test/sim_max_reward_4500027": 0.9066109170210777, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.17787860151376828, "test/sim_max_reward_4500030": 0.9501576768535074, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05850465727749761, "test/sim_max_reward_4500033": 0.9147582030028398, "test/sim_max_reward_4500034": 0.7627607877979172, "test/sim_max_reward_4500035": 0.852950976783992, "test/sim_max_reward_4500036": 0.4008953164729228, "test/sim_max_reward_4500037": 0.8861254914315253, "test/sim_max_reward_4500038": 0.5343934581342569, "test/sim_max_reward_4500039": 0.9626520888604128, "test/sim_max_reward_4500040": 0.9288004442924196, "test/sim_max_reward_4500041": 0.42709272803763615, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.24708163522986337, "test/sim_max_reward_4500044": 0.6796851272845459, "test/sim_max_reward_4500045": 0.16508512468554398, "test/sim_max_reward_4500046": 0.44699653663579897, "test/sim_max_reward_4500047": 0.9455947042374965, "test/sim_max_reward_4500048": 0.9046173664974072, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.563193065621183, "test/mean_score": 0.5469945365317554, "val_loss": 74631.84375} {"train_loss": -6.066621780395508, "global_step": 71442, "epoch": 1701} {"train_loss": -6.1586737632751465, "global_step": 71443, "epoch": 1701} {"train_loss": -6.095354080200195, "global_step": 71444, "epoch": 1701} {"train_loss": -6.089325904846191, "global_step": 71445, "epoch": 1701} {"train_loss": -6.112150192260742, "global_step": 71446, "epoch": 1701} {"train_loss": -6.041053771972656, "global_step": 71447, "epoch": 1701} {"train_loss": -6.142439365386963, "global_step": 71448, "epoch": 1701} {"train_loss": -6.083188056945801, "global_step": 71449, "epoch": 1701} {"train_loss": -6.128016471862793, "global_step": 71450, "epoch": 1701} {"train_loss": -6.0915727615356445, "global_step": 71451, "epoch": 1701} {"train_loss": -6.033536911010742, "global_step": 71452, "epoch": 1701} {"train_loss": -6.13574743270874, "global_step": 71453, "epoch": 1701} {"train_loss": -6.082455635070801, "global_step": 71454, "epoch": 1701} {"train_loss": -5.9955735206604, "global_step": 71455, "epoch": 1701} {"train_loss": -6.097715854644775, "global_step": 71456, "epoch": 1701} {"train_loss": -6.069004535675049, "global_step": 71457, "epoch": 1701} {"train_loss": -6.046020030975342, "global_step": 71458, "epoch": 1701} {"train_loss": -5.961361885070801, "global_step": 71459, "epoch": 1701} {"train_loss": -5.980334281921387, "global_step": 71460, "epoch": 1701} {"train_loss": -6.065066814422607, "global_step": 71461, "epoch": 1701} {"train_loss": -6.068414688110352, "global_step": 71462, "epoch": 1701} {"train_loss": -6.0110764503479, "global_step": 71463, "epoch": 1701} {"train_loss": -6.014711380004883, "global_step": 71464, "epoch": 1701} {"train_loss": -6.01784610748291, "global_step": 71465, "epoch": 1701} {"train_loss": -5.9554548263549805, "global_step": 71466, "epoch": 1701} {"train_loss": -6.113486289978027, "global_step": 71467, "epoch": 1701} {"train_loss": -6.05640172958374, "global_step": 71468, "epoch": 1701} {"train_loss": -6.0738420486450195, "global_step": 71469, "epoch": 1701} {"train_loss": -5.912561416625977, "global_step": 71470, "epoch": 1701} {"train_loss": -5.983567237854004, "global_step": 71471, "epoch": 1701} {"train_loss": -6.158883094787598, "global_step": 71472, "epoch": 1701} {"train_loss": -6.052165985107422, "global_step": 71473, "epoch": 1701} {"train_loss": -6.149666786193848, "global_step": 71474, "epoch": 1701} {"train_loss": -6.03508186340332, "global_step": 71475, "epoch": 1701} {"train_loss": -6.079108715057373, "global_step": 71476, "epoch": 1701} {"train_loss": -5.952883720397949, "global_step": 71477, "epoch": 1701} {"train_loss": -5.915594577789307, "global_step": 71478, "epoch": 1701} {"train_loss": -6.1231536865234375, "global_step": 71479, "epoch": 1701} {"train_loss": -6.080848693847656, "global_step": 71480, "epoch": 1701} {"train_loss": -6.051506042480469, "global_step": 71481, "epoch": 1701} {"train_loss": -6.137192726135254, "global_step": 71482, "epoch": 1701} {"train_loss": -6.05890501113165, "global_step": 71483, "epoch": 1701, "val_loss": 75061.0234375} {"train_loss": -6.053172588348389, "global_step": 71484, "epoch": 1702} {"train_loss": -5.976102828979492, "global_step": 71485, "epoch": 1702} {"train_loss": -6.025781631469727, "global_step": 71486, "epoch": 1702} {"train_loss": -6.078090190887451, "global_step": 71487, "epoch": 1702} {"train_loss": -6.040994644165039, "global_step": 71488, "epoch": 1702} {"train_loss": -6.009804725646973, "global_step": 71489, "epoch": 1702} {"train_loss": -6.149715423583984, "global_step": 71490, "epoch": 1702} {"train_loss": -6.101973056793213, "global_step": 71491, "epoch": 1702} {"train_loss": -6.0615386962890625, "global_step": 71492, "epoch": 1702} {"train_loss": -6.045431613922119, "global_step": 71493, "epoch": 1702} {"train_loss": -5.803901672363281, "global_step": 71494, "epoch": 1702} {"train_loss": -6.034603595733643, "global_step": 71495, "epoch": 1702} {"train_loss": -5.913837432861328, "global_step": 71496, "epoch": 1702} {"train_loss": -5.993570327758789, "global_step": 71497, "epoch": 1702} {"train_loss": -6.011776924133301, "global_step": 71498, "epoch": 1702} {"train_loss": -5.929247856140137, "global_step": 71499, "epoch": 1702} {"train_loss": -5.921621799468994, "global_step": 71500, "epoch": 1702} {"train_loss": -5.928354263305664, "global_step": 71501, "epoch": 1702} {"train_loss": -6.007486343383789, "global_step": 71502, "epoch": 1702} {"train_loss": -5.961130142211914, "global_step": 71503, "epoch": 1702} {"train_loss": -5.891119003295898, "global_step": 71504, "epoch": 1702} {"train_loss": -5.972944736480713, "global_step": 71505, "epoch": 1702} {"train_loss": -5.853790283203125, "global_step": 71506, "epoch": 1702} {"train_loss": -5.983611583709717, "global_step": 71507, "epoch": 1702} {"train_loss": -5.796822547912598, "global_step": 71508, "epoch": 1702} {"train_loss": -5.9659037590026855, "global_step": 71509, "epoch": 1702} {"train_loss": -5.805692195892334, "global_step": 71510, "epoch": 1702} {"train_loss": -5.987689971923828, "global_step": 71511, "epoch": 1702} {"train_loss": -5.878626823425293, "global_step": 71512, "epoch": 1702} {"train_loss": -6.055906295776367, "global_step": 71513, "epoch": 1702} {"train_loss": -5.920938491821289, "global_step": 71514, "epoch": 1702} {"train_loss": -5.938108444213867, "global_step": 71515, "epoch": 1702} {"train_loss": -5.845685005187988, "global_step": 71516, "epoch": 1702} {"train_loss": -5.879778861999512, "global_step": 71517, "epoch": 1702} {"train_loss": -5.936122417449951, "global_step": 71518, "epoch": 1702} {"train_loss": -5.966610431671143, "global_step": 71519, "epoch": 1702} {"train_loss": -5.919323444366455, "global_step": 71520, "epoch": 1702} {"train_loss": -5.942569732666016, "global_step": 71521, "epoch": 1702} {"train_loss": -5.935614585876465, "global_step": 71522, "epoch": 1702} {"train_loss": -5.997265815734863, "global_step": 71523, "epoch": 1702} {"train_loss": -5.8470025062561035, "global_step": 71524, "epoch": 1702} {"train_loss": -5.961725041979835, "global_step": 71525, "epoch": 1702, "val_loss": 74944.921875} {"train_loss": -6.0520429611206055, "global_step": 71526, "epoch": 1703} {"train_loss": -6.1171369552612305, "global_step": 71527, "epoch": 1703} {"train_loss": -5.996156215667725, "global_step": 71528, "epoch": 1703} {"train_loss": -6.063203811645508, "global_step": 71529, "epoch": 1703} {"train_loss": -5.930208206176758, "global_step": 71530, "epoch": 1703} {"train_loss": -6.0406999588012695, "global_step": 71531, "epoch": 1703} {"train_loss": -6.045743942260742, "global_step": 71532, "epoch": 1703} {"train_loss": -6.049299240112305, "global_step": 71533, "epoch": 1703} {"train_loss": -6.094597339630127, "global_step": 71534, "epoch": 1703} {"train_loss": -6.081131458282471, "global_step": 71535, "epoch": 1703} {"train_loss": -6.108153343200684, "global_step": 71536, "epoch": 1703} {"train_loss": -5.946547508239746, "global_step": 71537, "epoch": 1703} {"train_loss": -5.9704179763793945, "global_step": 71538, "epoch": 1703} {"train_loss": -6.029458522796631, "global_step": 71539, "epoch": 1703} {"train_loss": -5.902035713195801, "global_step": 71540, "epoch": 1703} {"train_loss": -6.028735160827637, "global_step": 71541, "epoch": 1703} {"train_loss": -6.067600727081299, "global_step": 71542, "epoch": 1703} {"train_loss": -5.967535972595215, "global_step": 71543, "epoch": 1703} {"train_loss": -5.973252296447754, "global_step": 71544, "epoch": 1703} {"train_loss": -5.979338645935059, "global_step": 71545, "epoch": 1703} {"train_loss": -6.006884574890137, "global_step": 71546, "epoch": 1703} {"train_loss": -5.979840278625488, "global_step": 71547, "epoch": 1703} {"train_loss": -5.994545936584473, "global_step": 71548, "epoch": 1703} {"train_loss": -6.089605808258057, "global_step": 71549, "epoch": 1703} {"train_loss": -6.160127639770508, "global_step": 71550, "epoch": 1703} {"train_loss": -6.041666030883789, "global_step": 71551, "epoch": 1703} {"train_loss": -5.938232421875, "global_step": 71552, "epoch": 1703} {"train_loss": -5.9674577713012695, "global_step": 71553, "epoch": 1703} {"train_loss": -6.08115816116333, "global_step": 71554, "epoch": 1703} {"train_loss": -6.001267433166504, "global_step": 71555, "epoch": 1703} {"train_loss": -6.018069267272949, "global_step": 71556, "epoch": 1703} {"train_loss": -6.008425712585449, "global_step": 71557, "epoch": 1703} {"train_loss": -5.982061386108398, "global_step": 71558, "epoch": 1703} {"train_loss": -6.120661735534668, "global_step": 71559, "epoch": 1703} {"train_loss": -5.994778156280518, "global_step": 71560, "epoch": 1703} {"train_loss": -5.99382209777832, "global_step": 71561, "epoch": 1703} {"train_loss": -6.0462517738342285, "global_step": 71562, "epoch": 1703} {"train_loss": -6.067387104034424, "global_step": 71563, "epoch": 1703} {"train_loss": -6.077088356018066, "global_step": 71564, "epoch": 1703} {"train_loss": -6.130276203155518, "global_step": 71565, "epoch": 1703} {"train_loss": -6.009357929229736, "global_step": 71566, "epoch": 1703} {"train_loss": -6.026733330317906, "global_step": 71567, "epoch": 1703, "val_loss": 75005.6875} {"train_loss": -6.049047470092773, "global_step": 71568, "epoch": 1704} {"train_loss": -6.099905014038086, "global_step": 71569, "epoch": 1704} {"train_loss": -6.0862860679626465, "global_step": 71570, "epoch": 1704} {"train_loss": -5.996413230895996, "global_step": 71571, "epoch": 1704} {"train_loss": -5.915895462036133, "global_step": 71572, "epoch": 1704} {"train_loss": -6.106213569641113, "global_step": 71573, "epoch": 1704} {"train_loss": -6.104646682739258, "global_step": 71574, "epoch": 1704} {"train_loss": -6.052924156188965, "global_step": 71575, "epoch": 1704} {"train_loss": -6.090857982635498, "global_step": 71576, "epoch": 1704} {"train_loss": -6.004275321960449, "global_step": 71577, "epoch": 1704} {"train_loss": -6.001296520233154, "global_step": 71578, "epoch": 1704} {"train_loss": -5.966158866882324, "global_step": 71579, "epoch": 1704} {"train_loss": -6.019282817840576, "global_step": 71580, "epoch": 1704} {"train_loss": -5.938298225402832, "global_step": 71581, "epoch": 1704} {"train_loss": -6.055660247802734, "global_step": 71582, "epoch": 1704} {"train_loss": -6.005816459655762, "global_step": 71583, "epoch": 1704} {"train_loss": -6.175903797149658, "global_step": 71584, "epoch": 1704} {"train_loss": -5.901684761047363, "global_step": 71585, "epoch": 1704} {"train_loss": -6.005514621734619, "global_step": 71586, "epoch": 1704} {"train_loss": -5.890387535095215, "global_step": 71587, "epoch": 1704} {"train_loss": -6.085463523864746, "global_step": 71588, "epoch": 1704} {"train_loss": -6.05830717086792, "global_step": 71589, "epoch": 1704} {"train_loss": -6.067347049713135, "global_step": 71590, "epoch": 1704} {"train_loss": -5.9989519119262695, "global_step": 71591, "epoch": 1704} {"train_loss": -6.0688347816467285, "global_step": 71592, "epoch": 1704} {"train_loss": -6.057730197906494, "global_step": 71593, "epoch": 1704} {"train_loss": -6.091569423675537, "global_step": 71594, "epoch": 1704} {"train_loss": -6.042115211486816, "global_step": 71595, "epoch": 1704} {"train_loss": -5.914670944213867, "global_step": 71596, "epoch": 1704} {"train_loss": -5.948464393615723, "global_step": 71597, "epoch": 1704} {"train_loss": -5.962480068206787, "global_step": 71598, "epoch": 1704} {"train_loss": -6.005847930908203, "global_step": 71599, "epoch": 1704} {"train_loss": -6.077799320220947, "global_step": 71600, "epoch": 1704} {"train_loss": -5.896507263183594, "global_step": 71601, "epoch": 1704} {"train_loss": -5.907266616821289, "global_step": 71602, "epoch": 1704} {"train_loss": -5.822467803955078, "global_step": 71603, "epoch": 1704} {"train_loss": -5.970627784729004, "global_step": 71604, "epoch": 1704} {"train_loss": -5.953449249267578, "global_step": 71605, "epoch": 1704} {"train_loss": -5.903230667114258, "global_step": 71606, "epoch": 1704} {"train_loss": -5.913089275360107, "global_step": 71607, "epoch": 1704} {"train_loss": -5.965949058532715, "global_step": 71608, "epoch": 1704} {"train_loss": -6.003920078277588, "global_step": 71609, "epoch": 1704, "val_loss": 75100.515625} {"train_loss": -5.960389137268066, "global_step": 71610, "epoch": 1705} {"train_loss": -6.107394218444824, "global_step": 71611, "epoch": 1705} {"train_loss": -5.978578567504883, "global_step": 71612, "epoch": 1705} {"train_loss": -6.0199079513549805, "global_step": 71613, "epoch": 1705} {"train_loss": -6.007155418395996, "global_step": 71614, "epoch": 1705} {"train_loss": -6.060207366943359, "global_step": 71615, "epoch": 1705} {"train_loss": -5.978079795837402, "global_step": 71616, "epoch": 1705} {"train_loss": -6.063672065734863, "global_step": 71617, "epoch": 1705} {"train_loss": -6.072017192840576, "global_step": 71618, "epoch": 1705} {"train_loss": -6.047513484954834, "global_step": 71619, "epoch": 1705} {"train_loss": -6.005155563354492, "global_step": 71620, "epoch": 1705} {"train_loss": -6.097011089324951, "global_step": 71621, "epoch": 1705} {"train_loss": -5.941749572753906, "global_step": 71622, "epoch": 1705} {"train_loss": -5.991730213165283, "global_step": 71623, "epoch": 1705} {"train_loss": -6.101280689239502, "global_step": 71624, "epoch": 1705} {"train_loss": -5.9863362312316895, "global_step": 71625, "epoch": 1705} {"train_loss": -5.885927200317383, "global_step": 71626, "epoch": 1705} {"train_loss": -6.07644510269165, "global_step": 71627, "epoch": 1705} {"train_loss": -5.940446853637695, "global_step": 71628, "epoch": 1705} {"train_loss": -6.00400447845459, "global_step": 71629, "epoch": 1705} {"train_loss": -6.1114277839660645, "global_step": 71630, "epoch": 1705} {"train_loss": -5.949227333068848, "global_step": 71631, "epoch": 1705} {"train_loss": -6.068868637084961, "global_step": 71632, "epoch": 1705} {"train_loss": -5.953925132751465, "global_step": 71633, "epoch": 1705} {"train_loss": -6.035069465637207, "global_step": 71634, "epoch": 1705} {"train_loss": -6.1244096755981445, "global_step": 71635, "epoch": 1705} {"train_loss": -5.9837446212768555, "global_step": 71636, "epoch": 1705} {"train_loss": -5.972759246826172, "global_step": 71637, "epoch": 1705} {"train_loss": -6.035347938537598, "global_step": 71638, "epoch": 1705} {"train_loss": -5.908847808837891, "global_step": 71639, "epoch": 1705} {"train_loss": -6.036234378814697, "global_step": 71640, "epoch": 1705} {"train_loss": -6.126046657562256, "global_step": 71641, "epoch": 1705} {"train_loss": -6.075472354888916, "global_step": 71642, "epoch": 1705} {"train_loss": -6.119243621826172, "global_step": 71643, "epoch": 1705} {"train_loss": -5.898079872131348, "global_step": 71644, "epoch": 1705} {"train_loss": -6.022249698638916, "global_step": 71645, "epoch": 1705} {"train_loss": -5.934980392456055, "global_step": 71646, "epoch": 1705} {"train_loss": -6.126776695251465, "global_step": 71647, "epoch": 1705} {"train_loss": -5.923975467681885, "global_step": 71648, "epoch": 1705} {"train_loss": -6.079399585723877, "global_step": 71649, "epoch": 1705} {"train_loss": -6.0099334716796875, "global_step": 71650, "epoch": 1705} {"train_loss": -6.019793101719448, "global_step": 71651, "epoch": 1705, "val_loss": 74537.21875} {"train_loss": -6.098867416381836, "global_step": 71652, "epoch": 1706} {"train_loss": -6.029902458190918, "global_step": 71653, "epoch": 1706} {"train_loss": -6.12216329574585, "global_step": 71654, "epoch": 1706} {"train_loss": -5.995677471160889, "global_step": 71655, "epoch": 1706} {"train_loss": -5.960544586181641, "global_step": 71656, "epoch": 1706} {"train_loss": -6.026450157165527, "global_step": 71657, "epoch": 1706} {"train_loss": -6.169186592102051, "global_step": 71658, "epoch": 1706} {"train_loss": -6.075634002685547, "global_step": 71659, "epoch": 1706} {"train_loss": -6.032853126525879, "global_step": 71660, "epoch": 1706} {"train_loss": -6.04455041885376, "global_step": 71661, "epoch": 1706} {"train_loss": -5.984009265899658, "global_step": 71662, "epoch": 1706} {"train_loss": -6.005913734436035, "global_step": 71663, "epoch": 1706} {"train_loss": -6.099967002868652, "global_step": 71664, "epoch": 1706} {"train_loss": -6.025778293609619, "global_step": 71665, "epoch": 1706} {"train_loss": -5.998533725738525, "global_step": 71666, "epoch": 1706} {"train_loss": -6.021175384521484, "global_step": 71667, "epoch": 1706} {"train_loss": -6.045400619506836, "global_step": 71668, "epoch": 1706} {"train_loss": -5.962497234344482, "global_step": 71669, "epoch": 1706} {"train_loss": -6.058794021606445, "global_step": 71670, "epoch": 1706} {"train_loss": -6.09425687789917, "global_step": 71671, "epoch": 1706} {"train_loss": -5.951803207397461, "global_step": 71672, "epoch": 1706} {"train_loss": -6.032181739807129, "global_step": 71673, "epoch": 1706} {"train_loss": -6.072342872619629, "global_step": 71674, "epoch": 1706} {"train_loss": -6.051929950714111, "global_step": 71675, "epoch": 1706} {"train_loss": -6.057331562042236, "global_step": 71676, "epoch": 1706} {"train_loss": -6.077171325683594, "global_step": 71677, "epoch": 1706} {"train_loss": -5.905994415283203, "global_step": 71678, "epoch": 1706} {"train_loss": -6.178840637207031, "global_step": 71679, "epoch": 1706} {"train_loss": -6.092225551605225, "global_step": 71680, "epoch": 1706} {"train_loss": -6.097225189208984, "global_step": 71681, "epoch": 1706} {"train_loss": -6.056491374969482, "global_step": 71682, "epoch": 1706} {"train_loss": -5.936464309692383, "global_step": 71683, "epoch": 1706} {"train_loss": -6.007842063903809, "global_step": 71684, "epoch": 1706} {"train_loss": -6.180367469787598, "global_step": 71685, "epoch": 1706} {"train_loss": -6.080301284790039, "global_step": 71686, "epoch": 1706} {"train_loss": -6.0898919105529785, "global_step": 71687, "epoch": 1706} {"train_loss": -5.996748447418213, "global_step": 71688, "epoch": 1706} {"train_loss": -6.08104133605957, "global_step": 71689, "epoch": 1706} {"train_loss": -6.044790744781494, "global_step": 71690, "epoch": 1706} {"train_loss": -6.1688408851623535, "global_step": 71691, "epoch": 1706} {"train_loss": -6.042291641235352, "global_step": 71692, "epoch": 1706} {"train_loss": -6.0474232491992765, "global_step": 71693, "epoch": 1706, "val_loss": 74752.3515625} {"train_loss": -6.044649124145508, "global_step": 71694, "epoch": 1707} {"train_loss": -6.2257561683654785, "global_step": 71695, "epoch": 1707} {"train_loss": -5.867476463317871, "global_step": 71696, "epoch": 1707} {"train_loss": -6.131481170654297, "global_step": 71697, "epoch": 1707} {"train_loss": -6.120153903961182, "global_step": 71698, "epoch": 1707} {"train_loss": -5.996798515319824, "global_step": 71699, "epoch": 1707} {"train_loss": -6.179397106170654, "global_step": 71700, "epoch": 1707} {"train_loss": -6.023964881896973, "global_step": 71701, "epoch": 1707} {"train_loss": -6.047743797302246, "global_step": 71702, "epoch": 1707} {"train_loss": -6.08070182800293, "global_step": 71703, "epoch": 1707} {"train_loss": -6.114720344543457, "global_step": 71704, "epoch": 1707} {"train_loss": -6.097766399383545, "global_step": 71705, "epoch": 1707} {"train_loss": -6.019455909729004, "global_step": 71706, "epoch": 1707} {"train_loss": -5.9993157386779785, "global_step": 71707, "epoch": 1707} {"train_loss": -6.016706466674805, "global_step": 71708, "epoch": 1707} {"train_loss": -6.084759712219238, "global_step": 71709, "epoch": 1707} {"train_loss": -5.819348335266113, "global_step": 71710, "epoch": 1707} {"train_loss": -6.121496200561523, "global_step": 71711, "epoch": 1707} {"train_loss": -6.0565032958984375, "global_step": 71712, "epoch": 1707} {"train_loss": -6.075425148010254, "global_step": 71713, "epoch": 1707} {"train_loss": -6.021604061126709, "global_step": 71714, "epoch": 1707} {"train_loss": -6.027698516845703, "global_step": 71715, "epoch": 1707} {"train_loss": -5.950181007385254, "global_step": 71716, "epoch": 1707} {"train_loss": -6.04536247253418, "global_step": 71717, "epoch": 1707} {"train_loss": -6.1087541580200195, "global_step": 71718, "epoch": 1707} {"train_loss": -6.034887313842773, "global_step": 71719, "epoch": 1707} {"train_loss": -6.169240951538086, "global_step": 71720, "epoch": 1707} {"train_loss": -5.950891017913818, "global_step": 71721, "epoch": 1707} {"train_loss": -6.085121154785156, "global_step": 71722, "epoch": 1707} {"train_loss": -6.091120719909668, "global_step": 71723, "epoch": 1707} {"train_loss": -6.044755458831787, "global_step": 71724, "epoch": 1707} {"train_loss": -6.182806968688965, "global_step": 71725, "epoch": 1707} {"train_loss": -5.988004684448242, "global_step": 71726, "epoch": 1707} {"train_loss": -6.099601745605469, "global_step": 71727, "epoch": 1707} {"train_loss": -6.090203285217285, "global_step": 71728, "epoch": 1707} {"train_loss": -5.930720329284668, "global_step": 71729, "epoch": 1707} {"train_loss": -6.106365203857422, "global_step": 71730, "epoch": 1707} {"train_loss": -5.960149765014648, "global_step": 71731, "epoch": 1707} {"train_loss": -5.986797332763672, "global_step": 71732, "epoch": 1707} {"train_loss": -6.108494281768799, "global_step": 71733, "epoch": 1707} {"train_loss": -6.177495002746582, "global_step": 71734, "epoch": 1707} {"train_loss": -6.055135636102586, "global_step": 71735, "epoch": 1707, "val_loss": 75009.265625} {"train_loss": -6.059816837310791, "global_step": 71736, "epoch": 1708} {"train_loss": -6.005558490753174, "global_step": 71737, "epoch": 1708} {"train_loss": -6.2079925537109375, "global_step": 71738, "epoch": 1708} {"train_loss": -6.171412467956543, "global_step": 71739, "epoch": 1708} {"train_loss": -6.029171943664551, "global_step": 71740, "epoch": 1708} {"train_loss": -5.953825950622559, "global_step": 71741, "epoch": 1708} {"train_loss": -5.976633071899414, "global_step": 71742, "epoch": 1708} {"train_loss": -6.138801574707031, "global_step": 71743, "epoch": 1708} {"train_loss": -6.058509826660156, "global_step": 71744, "epoch": 1708} {"train_loss": -6.160739421844482, "global_step": 71745, "epoch": 1708} {"train_loss": -6.046472549438477, "global_step": 71746, "epoch": 1708} {"train_loss": -6.068170070648193, "global_step": 71747, "epoch": 1708} {"train_loss": -6.029631614685059, "global_step": 71748, "epoch": 1708} {"train_loss": -6.119668006896973, "global_step": 71749, "epoch": 1708} {"train_loss": -6.055269241333008, "global_step": 71750, "epoch": 1708} {"train_loss": -6.030098915100098, "global_step": 71751, "epoch": 1708} {"train_loss": -6.113190174102783, "global_step": 71752, "epoch": 1708} {"train_loss": -6.061817169189453, "global_step": 71753, "epoch": 1708} {"train_loss": -6.015453338623047, "global_step": 71754, "epoch": 1708} {"train_loss": -6.144939422607422, "global_step": 71755, "epoch": 1708} {"train_loss": -6.055862903594971, "global_step": 71756, "epoch": 1708} {"train_loss": -6.077488422393799, "global_step": 71757, "epoch": 1708} {"train_loss": -6.046952247619629, "global_step": 71758, "epoch": 1708} {"train_loss": -6.095033645629883, "global_step": 71759, "epoch": 1708} {"train_loss": -5.9801344871521, "global_step": 71760, "epoch": 1708} {"train_loss": -6.143623352050781, "global_step": 71761, "epoch": 1708} {"train_loss": -5.993529796600342, "global_step": 71762, "epoch": 1708} {"train_loss": -5.983381271362305, "global_step": 71763, "epoch": 1708} {"train_loss": -6.008571624755859, "global_step": 71764, "epoch": 1708} {"train_loss": -6.088123798370361, "global_step": 71765, "epoch": 1708} {"train_loss": -6.055410385131836, "global_step": 71766, "epoch": 1708} {"train_loss": -5.94140100479126, "global_step": 71767, "epoch": 1708} {"train_loss": -5.985385894775391, "global_step": 71768, "epoch": 1708} {"train_loss": -6.052864074707031, "global_step": 71769, "epoch": 1708} {"train_loss": -6.027576446533203, "global_step": 71770, "epoch": 1708} {"train_loss": -6.087682723999023, "global_step": 71771, "epoch": 1708} {"train_loss": -6.0242156982421875, "global_step": 71772, "epoch": 1708} {"train_loss": -5.873861789703369, "global_step": 71773, "epoch": 1708} {"train_loss": -6.021292686462402, "global_step": 71774, "epoch": 1708} {"train_loss": -5.957294940948486, "global_step": 71775, "epoch": 1708} {"train_loss": -5.954483985900879, "global_step": 71776, "epoch": 1708} {"train_loss": -6.046172493980045, "global_step": 71777, "epoch": 1708, "val_loss": 74664.7265625} {"train_loss": -6.052494049072266, "global_step": 71778, "epoch": 1709} {"train_loss": -6.1604838371276855, "global_step": 71779, "epoch": 1709} {"train_loss": -5.993220806121826, "global_step": 71780, "epoch": 1709} {"train_loss": -6.136043071746826, "global_step": 71781, "epoch": 1709} {"train_loss": -6.044751167297363, "global_step": 71782, "epoch": 1709} {"train_loss": -6.04188346862793, "global_step": 71783, "epoch": 1709} {"train_loss": -5.969346523284912, "global_step": 71784, "epoch": 1709} {"train_loss": -6.125744342803955, "global_step": 71785, "epoch": 1709} {"train_loss": -6.154609680175781, "global_step": 71786, "epoch": 1709} {"train_loss": -6.040956974029541, "global_step": 71787, "epoch": 1709} {"train_loss": -6.080910682678223, "global_step": 71788, "epoch": 1709} {"train_loss": -6.005576133728027, "global_step": 71789, "epoch": 1709} {"train_loss": -6.113064765930176, "global_step": 71790, "epoch": 1709} {"train_loss": -6.047599792480469, "global_step": 71791, "epoch": 1709} {"train_loss": -5.911337852478027, "global_step": 71792, "epoch": 1709} {"train_loss": -6.074789524078369, "global_step": 71793, "epoch": 1709} {"train_loss": -6.025516510009766, "global_step": 71794, "epoch": 1709} {"train_loss": -5.97328519821167, "global_step": 71795, "epoch": 1709} {"train_loss": -6.083279609680176, "global_step": 71796, "epoch": 1709} {"train_loss": -5.976617813110352, "global_step": 71797, "epoch": 1709} {"train_loss": -6.085727691650391, "global_step": 71798, "epoch": 1709} {"train_loss": -6.006342887878418, "global_step": 71799, "epoch": 1709} {"train_loss": -6.003171443939209, "global_step": 71800, "epoch": 1709} {"train_loss": -6.048890113830566, "global_step": 71801, "epoch": 1709} {"train_loss": -6.013219833374023, "global_step": 71802, "epoch": 1709} {"train_loss": -6.067636013031006, "global_step": 71803, "epoch": 1709} {"train_loss": -6.151951313018799, "global_step": 71804, "epoch": 1709} {"train_loss": -6.002718925476074, "global_step": 71805, "epoch": 1709} {"train_loss": -6.008057594299316, "global_step": 71806, "epoch": 1709} {"train_loss": -6.025530815124512, "global_step": 71807, "epoch": 1709} {"train_loss": -5.951588153839111, "global_step": 71808, "epoch": 1709} {"train_loss": -5.990181922912598, "global_step": 71809, "epoch": 1709} {"train_loss": -5.973714828491211, "global_step": 71810, "epoch": 1709} {"train_loss": -6.048889636993408, "global_step": 71811, "epoch": 1709} {"train_loss": -5.95466423034668, "global_step": 71812, "epoch": 1709} {"train_loss": -5.952083587646484, "global_step": 71813, "epoch": 1709} {"train_loss": -6.068964004516602, "global_step": 71814, "epoch": 1709} {"train_loss": -6.024449825286865, "global_step": 71815, "epoch": 1709} {"train_loss": -6.028097152709961, "global_step": 71816, "epoch": 1709} {"train_loss": -6.134103775024414, "global_step": 71817, "epoch": 1709} {"train_loss": -5.979248046875, "global_step": 71818, "epoch": 1709} {"train_loss": -6.038068226405552, "global_step": 71819, "epoch": 1709, "val_loss": 74795.7421875} {"train_loss": -6.002106666564941, "global_step": 71820, "epoch": 1710} {"train_loss": -6.086367607116699, "global_step": 71821, "epoch": 1710} {"train_loss": -5.932521820068359, "global_step": 71822, "epoch": 1710} {"train_loss": -5.905278205871582, "global_step": 71823, "epoch": 1710} {"train_loss": -5.947279930114746, "global_step": 71824, "epoch": 1710} {"train_loss": -5.991411209106445, "global_step": 71825, "epoch": 1710} {"train_loss": -6.00716495513916, "global_step": 71826, "epoch": 1710} {"train_loss": -5.91423225402832, "global_step": 71827, "epoch": 1710} {"train_loss": -6.011234283447266, "global_step": 71828, "epoch": 1710} {"train_loss": -5.920881748199463, "global_step": 71829, "epoch": 1710} {"train_loss": -5.884398937225342, "global_step": 71830, "epoch": 1710} {"train_loss": -6.206080913543701, "global_step": 71831, "epoch": 1710} {"train_loss": -6.075840950012207, "global_step": 71832, "epoch": 1710} {"train_loss": -5.919172286987305, "global_step": 71833, "epoch": 1710} {"train_loss": -5.976296901702881, "global_step": 71834, "epoch": 1710} {"train_loss": -6.097282409667969, "global_step": 71835, "epoch": 1710} {"train_loss": -6.0664873123168945, "global_step": 71836, "epoch": 1710} {"train_loss": -6.021180152893066, "global_step": 71837, "epoch": 1710} {"train_loss": -6.059736251831055, "global_step": 71838, "epoch": 1710} {"train_loss": -6.100743293762207, "global_step": 71839, "epoch": 1710} {"train_loss": -6.087316513061523, "global_step": 71840, "epoch": 1710} {"train_loss": -6.071544647216797, "global_step": 71841, "epoch": 1710} {"train_loss": -6.1808905601501465, "global_step": 71842, "epoch": 1710} {"train_loss": -6.0439453125, "global_step": 71843, "epoch": 1710} {"train_loss": -5.936433792114258, "global_step": 71844, "epoch": 1710} {"train_loss": -5.988650798797607, "global_step": 71845, "epoch": 1710} {"train_loss": -6.139413833618164, "global_step": 71846, "epoch": 1710} {"train_loss": -6.185099124908447, "global_step": 71847, "epoch": 1710} {"train_loss": -6.102209091186523, "global_step": 71848, "epoch": 1710} {"train_loss": -6.1615800857543945, "global_step": 71849, "epoch": 1710} {"train_loss": -6.17601203918457, "global_step": 71850, "epoch": 1710} {"train_loss": -5.935684680938721, "global_step": 71851, "epoch": 1710} {"train_loss": -6.065039157867432, "global_step": 71852, "epoch": 1710} {"train_loss": -5.951852798461914, "global_step": 71853, "epoch": 1710} {"train_loss": -6.008887767791748, "global_step": 71854, "epoch": 1710} {"train_loss": -5.936458587646484, "global_step": 71855, "epoch": 1710} {"train_loss": -5.976313591003418, "global_step": 71856, "epoch": 1710} {"train_loss": -6.015689373016357, "global_step": 71857, "epoch": 1710} {"train_loss": -5.857572078704834, "global_step": 71858, "epoch": 1710} {"train_loss": -5.954270362854004, "global_step": 71859, "epoch": 1710} {"train_loss": -5.860289096832275, "global_step": 71860, "epoch": 1710} {"train_loss": -6.02116668791998, "global_step": 71861, "epoch": 1710, "val_loss": 74698.3984375} {"train_loss": -6.0301666259765625, "global_step": 71862, "epoch": 1711} {"train_loss": -6.024420261383057, "global_step": 71863, "epoch": 1711} {"train_loss": -6.10374641418457, "global_step": 71864, "epoch": 1711} {"train_loss": -5.960958480834961, "global_step": 71865, "epoch": 1711} {"train_loss": -6.023015022277832, "global_step": 71866, "epoch": 1711} {"train_loss": -6.108755111694336, "global_step": 71867, "epoch": 1711} {"train_loss": -6.1038618087768555, "global_step": 71868, "epoch": 1711} {"train_loss": -6.1021728515625, "global_step": 71869, "epoch": 1711} {"train_loss": -6.104592323303223, "global_step": 71870, "epoch": 1711} {"train_loss": -6.153327941894531, "global_step": 71871, "epoch": 1711} {"train_loss": -6.125831127166748, "global_step": 71872, "epoch": 1711} {"train_loss": -6.055834770202637, "global_step": 71873, "epoch": 1711} {"train_loss": -5.9961748123168945, "global_step": 71874, "epoch": 1711} {"train_loss": -6.041753768920898, "global_step": 71875, "epoch": 1711} {"train_loss": -5.960163593292236, "global_step": 71876, "epoch": 1711} {"train_loss": -6.021967887878418, "global_step": 71877, "epoch": 1711} {"train_loss": -6.003362655639648, "global_step": 71878, "epoch": 1711} {"train_loss": -5.891412734985352, "global_step": 71879, "epoch": 1711} {"train_loss": -5.98158597946167, "global_step": 71880, "epoch": 1711} {"train_loss": -6.098546981811523, "global_step": 71881, "epoch": 1711} {"train_loss": -5.954488277435303, "global_step": 71882, "epoch": 1711} {"train_loss": -6.164405822753906, "global_step": 71883, "epoch": 1711} {"train_loss": -6.001940727233887, "global_step": 71884, "epoch": 1711} {"train_loss": -5.837348937988281, "global_step": 71885, "epoch": 1711} {"train_loss": -6.018219947814941, "global_step": 71886, "epoch": 1711} {"train_loss": -6.130967140197754, "global_step": 71887, "epoch": 1711} {"train_loss": -6.0274810791015625, "global_step": 71888, "epoch": 1711} {"train_loss": -6.015742301940918, "global_step": 71889, "epoch": 1711} {"train_loss": -6.052744388580322, "global_step": 71890, "epoch": 1711} {"train_loss": -6.065061569213867, "global_step": 71891, "epoch": 1711} {"train_loss": -6.020049095153809, "global_step": 71892, "epoch": 1711} {"train_loss": -6.104336738586426, "global_step": 71893, "epoch": 1711} {"train_loss": -6.056968688964844, "global_step": 71894, "epoch": 1711} {"train_loss": -6.063488006591797, "global_step": 71895, "epoch": 1711} {"train_loss": -5.981710910797119, "global_step": 71896, "epoch": 1711} {"train_loss": -5.99530553817749, "global_step": 71897, "epoch": 1711} {"train_loss": -6.0580010414123535, "global_step": 71898, "epoch": 1711} {"train_loss": -6.030120849609375, "global_step": 71899, "epoch": 1711} {"train_loss": -5.930826187133789, "global_step": 71900, "epoch": 1711} {"train_loss": -6.1026787757873535, "global_step": 71901, "epoch": 1711} {"train_loss": -6.045220375061035, "global_step": 71902, "epoch": 1711} {"train_loss": -6.034954672768002, "global_step": 71903, "epoch": 1711, "val_loss": 75212.6953125} {"train_loss": -5.98328161239624, "global_step": 71904, "epoch": 1712} {"train_loss": -6.173473834991455, "global_step": 71905, "epoch": 1712} {"train_loss": -5.912281513214111, "global_step": 71906, "epoch": 1712} {"train_loss": -5.923212051391602, "global_step": 71907, "epoch": 1712} {"train_loss": -6.067523002624512, "global_step": 71908, "epoch": 1712} {"train_loss": -6.08303165435791, "global_step": 71909, "epoch": 1712} {"train_loss": -6.093480110168457, "global_step": 71910, "epoch": 1712} {"train_loss": -6.03079891204834, "global_step": 71911, "epoch": 1712} {"train_loss": -6.041609764099121, "global_step": 71912, "epoch": 1712} {"train_loss": -5.8850555419921875, "global_step": 71913, "epoch": 1712} {"train_loss": -5.993337631225586, "global_step": 71914, "epoch": 1712} {"train_loss": -6.0509538650512695, "global_step": 71915, "epoch": 1712} {"train_loss": -5.940629005432129, "global_step": 71916, "epoch": 1712} {"train_loss": -6.132602691650391, "global_step": 71917, "epoch": 1712} {"train_loss": -5.895861625671387, "global_step": 71918, "epoch": 1712} {"train_loss": -5.983308792114258, "global_step": 71919, "epoch": 1712} {"train_loss": -5.979973316192627, "global_step": 71920, "epoch": 1712} {"train_loss": -5.996136665344238, "global_step": 71921, "epoch": 1712} {"train_loss": -6.014782905578613, "global_step": 71922, "epoch": 1712} {"train_loss": -5.962560176849365, "global_step": 71923, "epoch": 1712} {"train_loss": -5.9604010581970215, "global_step": 71924, "epoch": 1712} {"train_loss": -5.966383457183838, "global_step": 71925, "epoch": 1712} {"train_loss": -5.885499477386475, "global_step": 71926, "epoch": 1712} {"train_loss": -6.044741630554199, "global_step": 71927, "epoch": 1712} {"train_loss": -6.039853572845459, "global_step": 71928, "epoch": 1712} {"train_loss": -6.026734352111816, "global_step": 71929, "epoch": 1712} {"train_loss": -6.034650802612305, "global_step": 71930, "epoch": 1712} {"train_loss": -6.055802345275879, "global_step": 71931, "epoch": 1712} {"train_loss": -5.9951276779174805, "global_step": 71932, "epoch": 1712} {"train_loss": -6.058221817016602, "global_step": 71933, "epoch": 1712} {"train_loss": -6.005781173706055, "global_step": 71934, "epoch": 1712} {"train_loss": -6.055879592895508, "global_step": 71935, "epoch": 1712} {"train_loss": -5.9384965896606445, "global_step": 71936, "epoch": 1712} {"train_loss": -5.9458160400390625, "global_step": 71937, "epoch": 1712} {"train_loss": -6.1153364181518555, "global_step": 71938, "epoch": 1712} {"train_loss": -5.945743083953857, "global_step": 71939, "epoch": 1712} {"train_loss": -6.063621997833252, "global_step": 71940, "epoch": 1712} {"train_loss": -5.989840030670166, "global_step": 71941, "epoch": 1712} {"train_loss": -5.9808783531188965, "global_step": 71942, "epoch": 1712} {"train_loss": -5.9948410987854, "global_step": 71943, "epoch": 1712} {"train_loss": -6.08083438873291, "global_step": 71944, "epoch": 1712} {"train_loss": -6.004926522572835, "global_step": 71945, "epoch": 1712, "val_loss": 74798.6796875} {"train_loss": -6.020563125610352, "global_step": 71946, "epoch": 1713} {"train_loss": -5.92985725402832, "global_step": 71947, "epoch": 1713} {"train_loss": -5.927155494689941, "global_step": 71948, "epoch": 1713} {"train_loss": -6.069244384765625, "global_step": 71949, "epoch": 1713} {"train_loss": -6.005255222320557, "global_step": 71950, "epoch": 1713} {"train_loss": -6.138304710388184, "global_step": 71951, "epoch": 1713} {"train_loss": -6.055621147155762, "global_step": 71952, "epoch": 1713} {"train_loss": -6.069863319396973, "global_step": 71953, "epoch": 1713} {"train_loss": -6.069334030151367, "global_step": 71954, "epoch": 1713} {"train_loss": -5.994668483734131, "global_step": 71955, "epoch": 1713} {"train_loss": -6.162077903747559, "global_step": 71956, "epoch": 1713} {"train_loss": -5.910183429718018, "global_step": 71957, "epoch": 1713} {"train_loss": -6.133458137512207, "global_step": 71958, "epoch": 1713} {"train_loss": -6.080482482910156, "global_step": 71959, "epoch": 1713} {"train_loss": -6.106569766998291, "global_step": 71960, "epoch": 1713} {"train_loss": -6.001871585845947, "global_step": 71961, "epoch": 1713} {"train_loss": -5.918540954589844, "global_step": 71962, "epoch": 1713} {"train_loss": -6.068510055541992, "global_step": 71963, "epoch": 1713} {"train_loss": -5.865958213806152, "global_step": 71964, "epoch": 1713} {"train_loss": -6.013146877288818, "global_step": 71965, "epoch": 1713} {"train_loss": -5.945032119750977, "global_step": 71966, "epoch": 1713} {"train_loss": -6.0175933837890625, "global_step": 71967, "epoch": 1713} {"train_loss": -5.959068775177002, "global_step": 71968, "epoch": 1713} {"train_loss": -6.134753704071045, "global_step": 71969, "epoch": 1713} {"train_loss": -6.055797576904297, "global_step": 71970, "epoch": 1713} {"train_loss": -6.084496021270752, "global_step": 71971, "epoch": 1713} {"train_loss": -5.917201995849609, "global_step": 71972, "epoch": 1713} {"train_loss": -6.10316276550293, "global_step": 71973, "epoch": 1713} {"train_loss": -6.014265060424805, "global_step": 71974, "epoch": 1713} {"train_loss": -6.039168357849121, "global_step": 71975, "epoch": 1713} {"train_loss": -5.99521541595459, "global_step": 71976, "epoch": 1713} {"train_loss": -5.957765579223633, "global_step": 71977, "epoch": 1713} {"train_loss": -6.059704780578613, "global_step": 71978, "epoch": 1713} {"train_loss": -6.064310073852539, "global_step": 71979, "epoch": 1713} {"train_loss": -5.9966888427734375, "global_step": 71980, "epoch": 1713} {"train_loss": -6.10675573348999, "global_step": 71981, "epoch": 1713} {"train_loss": -6.0952653884887695, "global_step": 71982, "epoch": 1713} {"train_loss": -6.010934829711914, "global_step": 71983, "epoch": 1713} {"train_loss": -6.1027631759643555, "global_step": 71984, "epoch": 1713} {"train_loss": -6.0744829177856445, "global_step": 71985, "epoch": 1713} {"train_loss": -5.859070301055908, "global_step": 71986, "epoch": 1713} {"train_loss": -6.028092452457973, "global_step": 71987, "epoch": 1713, "val_loss": 74736.921875} {"train_loss": -6.024798393249512, "global_step": 71988, "epoch": 1714} {"train_loss": -6.115894794464111, "global_step": 71989, "epoch": 1714} {"train_loss": -5.882606029510498, "global_step": 71990, "epoch": 1714} {"train_loss": -6.018747806549072, "global_step": 71991, "epoch": 1714} {"train_loss": -6.039875507354736, "global_step": 71992, "epoch": 1714} {"train_loss": -5.942808151245117, "global_step": 71993, "epoch": 1714} {"train_loss": -6.012078285217285, "global_step": 71994, "epoch": 1714} {"train_loss": -6.076894760131836, "global_step": 71995, "epoch": 1714} {"train_loss": -5.932660102844238, "global_step": 71996, "epoch": 1714} {"train_loss": -6.021040439605713, "global_step": 71997, "epoch": 1714} {"train_loss": -6.156676292419434, "global_step": 71998, "epoch": 1714} {"train_loss": -5.951389312744141, "global_step": 71999, "epoch": 1714} {"train_loss": -5.991767406463623, "global_step": 72000, "epoch": 1714} {"train_loss": -5.805418968200684, "global_step": 72001, "epoch": 1714} {"train_loss": -5.9606852531433105, "global_step": 72002, "epoch": 1714} {"train_loss": -6.070192337036133, "global_step": 72003, "epoch": 1714} {"train_loss": -5.798020839691162, "global_step": 72004, "epoch": 1714} {"train_loss": -5.949916839599609, "global_step": 72005, "epoch": 1714} {"train_loss": -5.882106781005859, "global_step": 72006, "epoch": 1714} {"train_loss": -6.0518317222595215, "global_step": 72007, "epoch": 1714} {"train_loss": -5.884949684143066, "global_step": 72008, "epoch": 1714} {"train_loss": -5.884593486785889, "global_step": 72009, "epoch": 1714} {"train_loss": -5.944947242736816, "global_step": 72010, "epoch": 1714} {"train_loss": -6.026650905609131, "global_step": 72011, "epoch": 1714} {"train_loss": -5.830406188964844, "global_step": 72012, "epoch": 1714} {"train_loss": -5.927450180053711, "global_step": 72013, "epoch": 1714} {"train_loss": -5.9888482093811035, "global_step": 72014, "epoch": 1714} {"train_loss": -5.9801483154296875, "global_step": 72015, "epoch": 1714} {"train_loss": -5.9951581954956055, "global_step": 72016, "epoch": 1714} {"train_loss": -5.988953590393066, "global_step": 72017, "epoch": 1714} {"train_loss": -5.9238433837890625, "global_step": 72018, "epoch": 1714} {"train_loss": -5.96782112121582, "global_step": 72019, "epoch": 1714} {"train_loss": -5.922628879547119, "global_step": 72020, "epoch": 1714} {"train_loss": -6.032103538513184, "global_step": 72021, "epoch": 1714} {"train_loss": -5.979269981384277, "global_step": 72022, "epoch": 1714} {"train_loss": -6.016901969909668, "global_step": 72023, "epoch": 1714} {"train_loss": -6.0675249099731445, "global_step": 72024, "epoch": 1714} {"train_loss": -6.016410827636719, "global_step": 72025, "epoch": 1714} {"train_loss": -5.969023704528809, "global_step": 72026, "epoch": 1714} {"train_loss": -6.005270004272461, "global_step": 72027, "epoch": 1714} {"train_loss": -6.0192389488220215, "global_step": 72028, "epoch": 1714} {"train_loss": -5.977025520233881, "global_step": 72029, "epoch": 1714, "val_loss": 74496.9921875} {"train_loss": -6.066307067871094, "global_step": 72030, "epoch": 1715} {"train_loss": -6.13887882232666, "global_step": 72031, "epoch": 1715} {"train_loss": -6.032098770141602, "global_step": 72032, "epoch": 1715} {"train_loss": -6.082118034362793, "global_step": 72033, "epoch": 1715} {"train_loss": -6.0203142166137695, "global_step": 72034, "epoch": 1715} {"train_loss": -6.042944431304932, "global_step": 72035, "epoch": 1715} {"train_loss": -5.987990379333496, "global_step": 72036, "epoch": 1715} {"train_loss": -5.9520463943481445, "global_step": 72037, "epoch": 1715} {"train_loss": -6.064256191253662, "global_step": 72038, "epoch": 1715} {"train_loss": -6.083630084991455, "global_step": 72039, "epoch": 1715} {"train_loss": -5.9841814041137695, "global_step": 72040, "epoch": 1715} {"train_loss": -6.046797752380371, "global_step": 72041, "epoch": 1715} {"train_loss": -6.047000885009766, "global_step": 72042, "epoch": 1715} {"train_loss": -6.025057792663574, "global_step": 72043, "epoch": 1715} {"train_loss": -6.048497200012207, "global_step": 72044, "epoch": 1715} {"train_loss": -6.09134578704834, "global_step": 72045, "epoch": 1715} {"train_loss": -6.02517557144165, "global_step": 72046, "epoch": 1715} {"train_loss": -6.030191421508789, "global_step": 72047, "epoch": 1715} {"train_loss": -6.045682907104492, "global_step": 72048, "epoch": 1715} {"train_loss": -6.004505157470703, "global_step": 72049, "epoch": 1715} {"train_loss": -6.061041355133057, "global_step": 72050, "epoch": 1715} {"train_loss": -6.079655647277832, "global_step": 72051, "epoch": 1715} {"train_loss": -6.006993293762207, "global_step": 72052, "epoch": 1715} {"train_loss": -6.018176078796387, "global_step": 72053, "epoch": 1715} {"train_loss": -6.0191802978515625, "global_step": 72054, "epoch": 1715} {"train_loss": -6.061816215515137, "global_step": 72055, "epoch": 1715} {"train_loss": -6.007604598999023, "global_step": 72056, "epoch": 1715} {"train_loss": -5.9104156494140625, "global_step": 72057, "epoch": 1715} {"train_loss": -5.994146347045898, "global_step": 72058, "epoch": 1715} {"train_loss": -6.034152507781982, "global_step": 72059, "epoch": 1715} {"train_loss": -6.078824996948242, "global_step": 72060, "epoch": 1715} {"train_loss": -6.065968036651611, "global_step": 72061, "epoch": 1715} {"train_loss": -6.003744125366211, "global_step": 72062, "epoch": 1715} {"train_loss": -6.1415910720825195, "global_step": 72063, "epoch": 1715} {"train_loss": -6.045251369476318, "global_step": 72064, "epoch": 1715} {"train_loss": -6.140327453613281, "global_step": 72065, "epoch": 1715} {"train_loss": -6.069818496704102, "global_step": 72066, "epoch": 1715} {"train_loss": -6.054072380065918, "global_step": 72067, "epoch": 1715} {"train_loss": -6.035017013549805, "global_step": 72068, "epoch": 1715} {"train_loss": -6.069829940795898, "global_step": 72069, "epoch": 1715} {"train_loss": -6.054135322570801, "global_step": 72070, "epoch": 1715} {"train_loss": -6.040659121104649, "global_step": 72071, "epoch": 1715, "val_loss": 74798.3359375} {"train_loss": -6.178215980529785, "global_step": 72072, "epoch": 1716} {"train_loss": -6.122100830078125, "global_step": 72073, "epoch": 1716} {"train_loss": -6.1642537117004395, "global_step": 72074, "epoch": 1716} {"train_loss": -5.945101737976074, "global_step": 72075, "epoch": 1716} {"train_loss": -6.0863871574401855, "global_step": 72076, "epoch": 1716} {"train_loss": -5.96970272064209, "global_step": 72077, "epoch": 1716} {"train_loss": -5.988889217376709, "global_step": 72078, "epoch": 1716} {"train_loss": -6.043803691864014, "global_step": 72079, "epoch": 1716} {"train_loss": -6.078965187072754, "global_step": 72080, "epoch": 1716} {"train_loss": -6.111266136169434, "global_step": 72081, "epoch": 1716} {"train_loss": -6.055996417999268, "global_step": 72082, "epoch": 1716} {"train_loss": -6.032366752624512, "global_step": 72083, "epoch": 1716} {"train_loss": -5.90588903427124, "global_step": 72084, "epoch": 1716} {"train_loss": -6.054441452026367, "global_step": 72085, "epoch": 1716} {"train_loss": -6.099665641784668, "global_step": 72086, "epoch": 1716} {"train_loss": -5.9988250732421875, "global_step": 72087, "epoch": 1716} {"train_loss": -6.050363540649414, "global_step": 72088, "epoch": 1716} {"train_loss": -6.032321929931641, "global_step": 72089, "epoch": 1716} {"train_loss": -5.985296726226807, "global_step": 72090, "epoch": 1716} {"train_loss": -6.108605861663818, "global_step": 72091, "epoch": 1716} {"train_loss": -6.011866569519043, "global_step": 72092, "epoch": 1716} {"train_loss": -5.860042095184326, "global_step": 72093, "epoch": 1716} {"train_loss": -5.928144931793213, "global_step": 72094, "epoch": 1716} {"train_loss": -6.012816429138184, "global_step": 72095, "epoch": 1716} {"train_loss": -5.935756683349609, "global_step": 72096, "epoch": 1716} {"train_loss": -6.0274434089660645, "global_step": 72097, "epoch": 1716} {"train_loss": -6.036182403564453, "global_step": 72098, "epoch": 1716} {"train_loss": -6.0048065185546875, "global_step": 72099, "epoch": 1716} {"train_loss": -6.016430854797363, "global_step": 72100, "epoch": 1716} {"train_loss": -6.1032280921936035, "global_step": 72101, "epoch": 1716} {"train_loss": -5.954099655151367, "global_step": 72102, "epoch": 1716} {"train_loss": -6.128501892089844, "global_step": 72103, "epoch": 1716} {"train_loss": -6.008613586425781, "global_step": 72104, "epoch": 1716} {"train_loss": -6.1422576904296875, "global_step": 72105, "epoch": 1716} {"train_loss": -6.1112565994262695, "global_step": 72106, "epoch": 1716} {"train_loss": -6.081827640533447, "global_step": 72107, "epoch": 1716} {"train_loss": -6.012834548950195, "global_step": 72108, "epoch": 1716} {"train_loss": -6.074484348297119, "global_step": 72109, "epoch": 1716} {"train_loss": -6.014848709106445, "global_step": 72110, "epoch": 1716} {"train_loss": -6.007710933685303, "global_step": 72111, "epoch": 1716} {"train_loss": -6.023220539093018, "global_step": 72112, "epoch": 1716} {"train_loss": -6.034669478734334, "global_step": 72113, "epoch": 1716, "val_loss": 74749.0078125} {"train_loss": -6.119129180908203, "global_step": 72114, "epoch": 1717} {"train_loss": -5.899610996246338, "global_step": 72115, "epoch": 1717} {"train_loss": -5.877162933349609, "global_step": 72116, "epoch": 1717} {"train_loss": -6.052979469299316, "global_step": 72117, "epoch": 1717} {"train_loss": -5.974586486816406, "global_step": 72118, "epoch": 1717} {"train_loss": -5.901150703430176, "global_step": 72119, "epoch": 1717} {"train_loss": -6.032130241394043, "global_step": 72120, "epoch": 1717} {"train_loss": -6.030341148376465, "global_step": 72121, "epoch": 1717} {"train_loss": -6.126621246337891, "global_step": 72122, "epoch": 1717} {"train_loss": -5.923759937286377, "global_step": 72123, "epoch": 1717} {"train_loss": -6.062189102172852, "global_step": 72124, "epoch": 1717} {"train_loss": -6.002062797546387, "global_step": 72125, "epoch": 1717} {"train_loss": -5.975658893585205, "global_step": 72126, "epoch": 1717} {"train_loss": -6.08514404296875, "global_step": 72127, "epoch": 1717} {"train_loss": -6.0219879150390625, "global_step": 72128, "epoch": 1717} {"train_loss": -6.048698425292969, "global_step": 72129, "epoch": 1717} {"train_loss": -6.114167213439941, "global_step": 72130, "epoch": 1717} {"train_loss": -6.090360641479492, "global_step": 72131, "epoch": 1717} {"train_loss": -5.968281269073486, "global_step": 72132, "epoch": 1717} {"train_loss": -6.010956287384033, "global_step": 72133, "epoch": 1717} {"train_loss": -5.9459428787231445, "global_step": 72134, "epoch": 1717} {"train_loss": -6.038240432739258, "global_step": 72135, "epoch": 1717} {"train_loss": -5.876554489135742, "global_step": 72136, "epoch": 1717} {"train_loss": -6.040168285369873, "global_step": 72137, "epoch": 1717} {"train_loss": -6.151082515716553, "global_step": 72138, "epoch": 1717} {"train_loss": -6.074139595031738, "global_step": 72139, "epoch": 1717} {"train_loss": -6.086530685424805, "global_step": 72140, "epoch": 1717} {"train_loss": -6.136883735656738, "global_step": 72141, "epoch": 1717} {"train_loss": -5.990102767944336, "global_step": 72142, "epoch": 1717} {"train_loss": -5.946110725402832, "global_step": 72143, "epoch": 1717} {"train_loss": -6.112159729003906, "global_step": 72144, "epoch": 1717} {"train_loss": -6.064663410186768, "global_step": 72145, "epoch": 1717} {"train_loss": -6.1587982177734375, "global_step": 72146, "epoch": 1717} {"train_loss": -6.109663963317871, "global_step": 72147, "epoch": 1717} {"train_loss": -5.99374532699585, "global_step": 72148, "epoch": 1717} {"train_loss": -5.979889392852783, "global_step": 72149, "epoch": 1717} {"train_loss": -5.922272682189941, "global_step": 72150, "epoch": 1717} {"train_loss": -6.0447998046875, "global_step": 72151, "epoch": 1717} {"train_loss": -6.021394729614258, "global_step": 72152, "epoch": 1717} {"train_loss": -5.985799312591553, "global_step": 72153, "epoch": 1717} {"train_loss": -6.018633842468262, "global_step": 72154, "epoch": 1717} {"train_loss": -6.022135700498309, "global_step": 72155, "epoch": 1717, "val_loss": 74616.4453125} {"train_loss": -6.072031497955322, "global_step": 72156, "epoch": 1718} {"train_loss": -6.023677349090576, "global_step": 72157, "epoch": 1718} {"train_loss": -6.011197566986084, "global_step": 72158, "epoch": 1718} {"train_loss": -6.0727434158325195, "global_step": 72159, "epoch": 1718} {"train_loss": -6.1104278564453125, "global_step": 72160, "epoch": 1718} {"train_loss": -6.079115867614746, "global_step": 72161, "epoch": 1718} {"train_loss": -5.9232940673828125, "global_step": 72162, "epoch": 1718} {"train_loss": -6.0803303718566895, "global_step": 72163, "epoch": 1718} {"train_loss": -6.06453800201416, "global_step": 72164, "epoch": 1718} {"train_loss": -6.001672267913818, "global_step": 72165, "epoch": 1718} {"train_loss": -5.9346418380737305, "global_step": 72166, "epoch": 1718} {"train_loss": -5.980868339538574, "global_step": 72167, "epoch": 1718} {"train_loss": -6.019765377044678, "global_step": 72168, "epoch": 1718} {"train_loss": -6.030127048492432, "global_step": 72169, "epoch": 1718} {"train_loss": -6.083029747009277, "global_step": 72170, "epoch": 1718} {"train_loss": -6.0179219245910645, "global_step": 72171, "epoch": 1718} {"train_loss": -6.002708435058594, "global_step": 72172, "epoch": 1718} {"train_loss": -6.040078163146973, "global_step": 72173, "epoch": 1718} {"train_loss": -6.140393257141113, "global_step": 72174, "epoch": 1718} {"train_loss": -6.2156829833984375, "global_step": 72175, "epoch": 1718} {"train_loss": -6.009024143218994, "global_step": 72176, "epoch": 1718} {"train_loss": -6.009757041931152, "global_step": 72177, "epoch": 1718} {"train_loss": -6.091495513916016, "global_step": 72178, "epoch": 1718} {"train_loss": -5.987821102142334, "global_step": 72179, "epoch": 1718} {"train_loss": -5.991576194763184, "global_step": 72180, "epoch": 1718} {"train_loss": -6.085527420043945, "global_step": 72181, "epoch": 1718} {"train_loss": -6.106402397155762, "global_step": 72182, "epoch": 1718} {"train_loss": -6.103926658630371, "global_step": 72183, "epoch": 1718} {"train_loss": -6.133575439453125, "global_step": 72184, "epoch": 1718} {"train_loss": -6.094847679138184, "global_step": 72185, "epoch": 1718} {"train_loss": -6.075316429138184, "global_step": 72186, "epoch": 1718} {"train_loss": -6.168063163757324, "global_step": 72187, "epoch": 1718} {"train_loss": -5.945400238037109, "global_step": 72188, "epoch": 1718} {"train_loss": -6.0339531898498535, "global_step": 72189, "epoch": 1718} {"train_loss": -6.066717624664307, "global_step": 72190, "epoch": 1718} {"train_loss": -6.016251564025879, "global_step": 72191, "epoch": 1718} {"train_loss": -6.012665748596191, "global_step": 72192, "epoch": 1718} {"train_loss": -5.921905517578125, "global_step": 72193, "epoch": 1718} {"train_loss": -5.9364914894104, "global_step": 72194, "epoch": 1718} {"train_loss": -6.191967964172363, "global_step": 72195, "epoch": 1718} {"train_loss": -6.017445087432861, "global_step": 72196, "epoch": 1718} {"train_loss": -6.049678200767154, "global_step": 72197, "epoch": 1718, "val_loss": 74794.9296875} {"train_loss": -6.144689559936523, "global_step": 72198, "epoch": 1719} {"train_loss": -5.959588527679443, "global_step": 72199, "epoch": 1719} {"train_loss": -6.160171031951904, "global_step": 72200, "epoch": 1719} {"train_loss": -5.97468900680542, "global_step": 72201, "epoch": 1719} {"train_loss": -6.074931621551514, "global_step": 72202, "epoch": 1719} {"train_loss": -6.090205192565918, "global_step": 72203, "epoch": 1719} {"train_loss": -6.038454055786133, "global_step": 72204, "epoch": 1719} {"train_loss": -6.047284126281738, "global_step": 72205, "epoch": 1719} {"train_loss": -5.994624614715576, "global_step": 72206, "epoch": 1719} {"train_loss": -6.119734764099121, "global_step": 72207, "epoch": 1719} {"train_loss": -6.016754150390625, "global_step": 72208, "epoch": 1719} {"train_loss": -6.104133605957031, "global_step": 72209, "epoch": 1719} {"train_loss": -6.018950462341309, "global_step": 72210, "epoch": 1719} {"train_loss": -5.939929008483887, "global_step": 72211, "epoch": 1719} {"train_loss": -6.04576301574707, "global_step": 72212, "epoch": 1719} {"train_loss": -5.9313859939575195, "global_step": 72213, "epoch": 1719} {"train_loss": -6.084820747375488, "global_step": 72214, "epoch": 1719} {"train_loss": -6.037659645080566, "global_step": 72215, "epoch": 1719} {"train_loss": -6.05374813079834, "global_step": 72216, "epoch": 1719} {"train_loss": -6.060952186584473, "global_step": 72217, "epoch": 1719} {"train_loss": -6.103231430053711, "global_step": 72218, "epoch": 1719} {"train_loss": -5.984166622161865, "global_step": 72219, "epoch": 1719} {"train_loss": -6.007549285888672, "global_step": 72220, "epoch": 1719} {"train_loss": -5.995091915130615, "global_step": 72221, "epoch": 1719} {"train_loss": -6.070515155792236, "global_step": 72222, "epoch": 1719} {"train_loss": -5.999186038970947, "global_step": 72223, "epoch": 1719} {"train_loss": -5.974266052246094, "global_step": 72224, "epoch": 1719} {"train_loss": -6.037099361419678, "global_step": 72225, "epoch": 1719} {"train_loss": -5.952329635620117, "global_step": 72226, "epoch": 1719} {"train_loss": -6.093623161315918, "global_step": 72227, "epoch": 1719} {"train_loss": -6.010709285736084, "global_step": 72228, "epoch": 1719} {"train_loss": -6.034182548522949, "global_step": 72229, "epoch": 1719} {"train_loss": -6.057229042053223, "global_step": 72230, "epoch": 1719} {"train_loss": -6.086073875427246, "global_step": 72231, "epoch": 1719} {"train_loss": -5.979869365692139, "global_step": 72232, "epoch": 1719} {"train_loss": -6.056189060211182, "global_step": 72233, "epoch": 1719} {"train_loss": -6.0891499519348145, "global_step": 72234, "epoch": 1719} {"train_loss": -6.046806335449219, "global_step": 72235, "epoch": 1719} {"train_loss": -6.018220901489258, "global_step": 72236, "epoch": 1719} {"train_loss": -5.955967903137207, "global_step": 72237, "epoch": 1719} {"train_loss": -6.130882263183594, "global_step": 72238, "epoch": 1719} {"train_loss": -6.0397315592992875, "global_step": 72239, "epoch": 1719, "val_loss": 74756.1640625} {"train_loss": -6.0276288986206055, "global_step": 72240, "epoch": 1720} {"train_loss": -6.070495128631592, "global_step": 72241, "epoch": 1720} {"train_loss": -5.981664657592773, "global_step": 72242, "epoch": 1720} {"train_loss": -6.058959007263184, "global_step": 72243, "epoch": 1720} {"train_loss": -5.909789562225342, "global_step": 72244, "epoch": 1720} {"train_loss": -6.022983551025391, "global_step": 72245, "epoch": 1720} {"train_loss": -6.177294731140137, "global_step": 72246, "epoch": 1720} {"train_loss": -6.042388916015625, "global_step": 72247, "epoch": 1720} {"train_loss": -6.064213752746582, "global_step": 72248, "epoch": 1720} {"train_loss": -6.03007173538208, "global_step": 72249, "epoch": 1720} {"train_loss": -5.981945991516113, "global_step": 72250, "epoch": 1720} {"train_loss": -6.01116943359375, "global_step": 72251, "epoch": 1720} {"train_loss": -5.939927577972412, "global_step": 72252, "epoch": 1720} {"train_loss": -5.895601272583008, "global_step": 72253, "epoch": 1720} {"train_loss": -6.066987037658691, "global_step": 72254, "epoch": 1720} {"train_loss": -6.025836944580078, "global_step": 72255, "epoch": 1720} {"train_loss": -6.046525001525879, "global_step": 72256, "epoch": 1720} {"train_loss": -6.03600549697876, "global_step": 72257, "epoch": 1720} {"train_loss": -6.021745681762695, "global_step": 72258, "epoch": 1720} {"train_loss": -6.222867965698242, "global_step": 72259, "epoch": 1720} {"train_loss": -6.000643253326416, "global_step": 72260, "epoch": 1720} {"train_loss": -6.047144889831543, "global_step": 72261, "epoch": 1720} {"train_loss": -6.03438663482666, "global_step": 72262, "epoch": 1720} {"train_loss": -6.024104118347168, "global_step": 72263, "epoch": 1720} {"train_loss": -6.149064064025879, "global_step": 72264, "epoch": 1720} {"train_loss": -6.043417930603027, "global_step": 72265, "epoch": 1720} {"train_loss": -6.066502571105957, "global_step": 72266, "epoch": 1720} {"train_loss": -5.972902297973633, "global_step": 72267, "epoch": 1720} {"train_loss": -6.0747785568237305, "global_step": 72268, "epoch": 1720} {"train_loss": -5.878576278686523, "global_step": 72269, "epoch": 1720} {"train_loss": -5.968731880187988, "global_step": 72270, "epoch": 1720} {"train_loss": -5.917775630950928, "global_step": 72271, "epoch": 1720} {"train_loss": -6.042028427124023, "global_step": 72272, "epoch": 1720} {"train_loss": -6.116820335388184, "global_step": 72273, "epoch": 1720} {"train_loss": -5.992928504943848, "global_step": 72274, "epoch": 1720} {"train_loss": -6.012808799743652, "global_step": 72275, "epoch": 1720} {"train_loss": -6.275118827819824, "global_step": 72276, "epoch": 1720} {"train_loss": -5.950613975524902, "global_step": 72277, "epoch": 1720} {"train_loss": -5.993630409240723, "global_step": 72278, "epoch": 1720} {"train_loss": -5.998732566833496, "global_step": 72279, "epoch": 1720} {"train_loss": -6.145848751068115, "global_step": 72280, "epoch": 1720} {"train_loss": -6.032847699664888, "global_step": 72281, "epoch": 1720, "val_loss": 74600.3515625} {"train_loss": -6.1696882247924805, "global_step": 72282, "epoch": 1721} {"train_loss": -6.04500150680542, "global_step": 72283, "epoch": 1721} {"train_loss": -6.034158706665039, "global_step": 72284, "epoch": 1721} {"train_loss": -6.1386919021606445, "global_step": 72285, "epoch": 1721} {"train_loss": -6.0737504959106445, "global_step": 72286, "epoch": 1721} {"train_loss": -6.130669593811035, "global_step": 72287, "epoch": 1721} {"train_loss": -6.070066452026367, "global_step": 72288, "epoch": 1721} {"train_loss": -5.998111724853516, "global_step": 72289, "epoch": 1721} {"train_loss": -6.079845905303955, "global_step": 72290, "epoch": 1721} {"train_loss": -6.020493984222412, "global_step": 72291, "epoch": 1721} {"train_loss": -6.049299716949463, "global_step": 72292, "epoch": 1721} {"train_loss": -6.103127479553223, "global_step": 72293, "epoch": 1721} {"train_loss": -5.962531089782715, "global_step": 72294, "epoch": 1721} {"train_loss": -6.088061809539795, "global_step": 72295, "epoch": 1721} {"train_loss": -6.0274739265441895, "global_step": 72296, "epoch": 1721} {"train_loss": -6.002184867858887, "global_step": 72297, "epoch": 1721} {"train_loss": -5.991245746612549, "global_step": 72298, "epoch": 1721} {"train_loss": -6.052472114562988, "global_step": 72299, "epoch": 1721} {"train_loss": -6.024403095245361, "global_step": 72300, "epoch": 1721} {"train_loss": -5.879164695739746, "global_step": 72301, "epoch": 1721} {"train_loss": -6.127274990081787, "global_step": 72302, "epoch": 1721} {"train_loss": -6.028015613555908, "global_step": 72303, "epoch": 1721} {"train_loss": -5.964630603790283, "global_step": 72304, "epoch": 1721} {"train_loss": -6.06063175201416, "global_step": 72305, "epoch": 1721} {"train_loss": -6.0027008056640625, "global_step": 72306, "epoch": 1721} {"train_loss": -5.857611179351807, "global_step": 72307, "epoch": 1721} {"train_loss": -6.030235290527344, "global_step": 72308, "epoch": 1721} {"train_loss": -5.97623348236084, "global_step": 72309, "epoch": 1721} {"train_loss": -5.935221195220947, "global_step": 72310, "epoch": 1721} {"train_loss": -6.1026201248168945, "global_step": 72311, "epoch": 1721} {"train_loss": -5.904946327209473, "global_step": 72312, "epoch": 1721} {"train_loss": -5.9785075187683105, "global_step": 72313, "epoch": 1721} {"train_loss": -5.947274684906006, "global_step": 72314, "epoch": 1721} {"train_loss": -6.0183892250061035, "global_step": 72315, "epoch": 1721} {"train_loss": -6.0240888595581055, "global_step": 72316, "epoch": 1721} {"train_loss": -5.938169956207275, "global_step": 72317, "epoch": 1721} {"train_loss": -5.913016319274902, "global_step": 72318, "epoch": 1721} {"train_loss": -5.873348236083984, "global_step": 72319, "epoch": 1721} {"train_loss": -5.906251430511475, "global_step": 72320, "epoch": 1721} {"train_loss": -5.9670634269714355, "global_step": 72321, "epoch": 1721} {"train_loss": -6.029301643371582, "global_step": 72322, "epoch": 1721} {"train_loss": -6.013807739530291, "global_step": 72323, "epoch": 1721, "val_loss": 74903.3828125} {"train_loss": -6.04734468460083, "global_step": 72324, "epoch": 1722} {"train_loss": -5.939235687255859, "global_step": 72325, "epoch": 1722} {"train_loss": -5.995412349700928, "global_step": 72326, "epoch": 1722} {"train_loss": -6.059614658355713, "global_step": 72327, "epoch": 1722} {"train_loss": -6.071125030517578, "global_step": 72328, "epoch": 1722} {"train_loss": -6.0096306800842285, "global_step": 72329, "epoch": 1722} {"train_loss": -6.065362930297852, "global_step": 72330, "epoch": 1722} {"train_loss": -6.078157901763916, "global_step": 72331, "epoch": 1722} {"train_loss": -6.040505886077881, "global_step": 72332, "epoch": 1722} {"train_loss": -5.93543004989624, "global_step": 72333, "epoch": 1722} {"train_loss": -6.07397985458374, "global_step": 72334, "epoch": 1722} {"train_loss": -6.034212112426758, "global_step": 72335, "epoch": 1722} {"train_loss": -5.986297607421875, "global_step": 72336, "epoch": 1722} {"train_loss": -6.029170989990234, "global_step": 72337, "epoch": 1722} {"train_loss": -5.991981029510498, "global_step": 72338, "epoch": 1722} {"train_loss": -6.095719337463379, "global_step": 72339, "epoch": 1722} {"train_loss": -6.110476493835449, "global_step": 72340, "epoch": 1722} {"train_loss": -6.013065338134766, "global_step": 72341, "epoch": 1722} {"train_loss": -6.005762100219727, "global_step": 72342, "epoch": 1722} {"train_loss": -6.083591461181641, "global_step": 72343, "epoch": 1722} {"train_loss": -5.989687919616699, "global_step": 72344, "epoch": 1722} {"train_loss": -6.043495178222656, "global_step": 72345, "epoch": 1722} {"train_loss": -6.199378967285156, "global_step": 72346, "epoch": 1722} {"train_loss": -5.925746917724609, "global_step": 72347, "epoch": 1722} {"train_loss": -6.167654991149902, "global_step": 72348, "epoch": 1722} {"train_loss": -6.063220024108887, "global_step": 72349, "epoch": 1722} {"train_loss": -5.999637603759766, "global_step": 72350, "epoch": 1722} {"train_loss": -6.057711601257324, "global_step": 72351, "epoch": 1722} {"train_loss": -5.829073905944824, "global_step": 72352, "epoch": 1722} {"train_loss": -5.973577976226807, "global_step": 72353, "epoch": 1722} {"train_loss": -5.929600715637207, "global_step": 72354, "epoch": 1722} {"train_loss": -5.898220539093018, "global_step": 72355, "epoch": 1722} {"train_loss": -6.038115501403809, "global_step": 72356, "epoch": 1722} {"train_loss": -5.890895843505859, "global_step": 72357, "epoch": 1722} {"train_loss": -5.9994354248046875, "global_step": 72358, "epoch": 1722} {"train_loss": -5.988434314727783, "global_step": 72359, "epoch": 1722} {"train_loss": -5.932955265045166, "global_step": 72360, "epoch": 1722} {"train_loss": -6.045446395874023, "global_step": 72361, "epoch": 1722} {"train_loss": -5.977618217468262, "global_step": 72362, "epoch": 1722} {"train_loss": -6.065261363983154, "global_step": 72363, "epoch": 1722} {"train_loss": -6.029365062713623, "global_step": 72364, "epoch": 1722} {"train_loss": -6.016872803370158, "global_step": 72365, "epoch": 1722, "val_loss": 74964.4140625} {"train_loss": -5.971641540527344, "global_step": 72366, "epoch": 1723} {"train_loss": -6.0945611000061035, "global_step": 72367, "epoch": 1723} {"train_loss": -5.921134948730469, "global_step": 72368, "epoch": 1723} {"train_loss": -6.026780128479004, "global_step": 72369, "epoch": 1723} {"train_loss": -6.096923828125, "global_step": 72370, "epoch": 1723} {"train_loss": -5.931206703186035, "global_step": 72371, "epoch": 1723} {"train_loss": -5.973621845245361, "global_step": 72372, "epoch": 1723} {"train_loss": -6.078921318054199, "global_step": 72373, "epoch": 1723} {"train_loss": -6.086042404174805, "global_step": 72374, "epoch": 1723} {"train_loss": -6.142704486846924, "global_step": 72375, "epoch": 1723} {"train_loss": -6.107975959777832, "global_step": 72376, "epoch": 1723} {"train_loss": -6.16066837310791, "global_step": 72377, "epoch": 1723} {"train_loss": -6.022781848907471, "global_step": 72378, "epoch": 1723} {"train_loss": -6.154532432556152, "global_step": 72379, "epoch": 1723} {"train_loss": -6.054454803466797, "global_step": 72380, "epoch": 1723} {"train_loss": -5.986061096191406, "global_step": 72381, "epoch": 1723} {"train_loss": -6.0752854347229, "global_step": 72382, "epoch": 1723} {"train_loss": -6.168901443481445, "global_step": 72383, "epoch": 1723} {"train_loss": -6.0381269454956055, "global_step": 72384, "epoch": 1723} {"train_loss": -6.132379531860352, "global_step": 72385, "epoch": 1723} {"train_loss": -6.1455841064453125, "global_step": 72386, "epoch": 1723} {"train_loss": -6.024385452270508, "global_step": 72387, "epoch": 1723} {"train_loss": -6.061619758605957, "global_step": 72388, "epoch": 1723} {"train_loss": -5.998796463012695, "global_step": 72389, "epoch": 1723} {"train_loss": -6.013057708740234, "global_step": 72390, "epoch": 1723} {"train_loss": -6.089456558227539, "global_step": 72391, "epoch": 1723} {"train_loss": -6.057993412017822, "global_step": 72392, "epoch": 1723} {"train_loss": -6.127284049987793, "global_step": 72393, "epoch": 1723} {"train_loss": -5.917013168334961, "global_step": 72394, "epoch": 1723} {"train_loss": -6.018869876861572, "global_step": 72395, "epoch": 1723} {"train_loss": -5.969374656677246, "global_step": 72396, "epoch": 1723} {"train_loss": -6.04210090637207, "global_step": 72397, "epoch": 1723} {"train_loss": -6.087456226348877, "global_step": 72398, "epoch": 1723} {"train_loss": -6.035956859588623, "global_step": 72399, "epoch": 1723} {"train_loss": -6.158371925354004, "global_step": 72400, "epoch": 1723} {"train_loss": -6.004059791564941, "global_step": 72401, "epoch": 1723} {"train_loss": -6.052703857421875, "global_step": 72402, "epoch": 1723} {"train_loss": -6.039663314819336, "global_step": 72403, "epoch": 1723} {"train_loss": -6.226982593536377, "global_step": 72404, "epoch": 1723} {"train_loss": -6.116125106811523, "global_step": 72405, "epoch": 1723} {"train_loss": -6.139235496520996, "global_step": 72406, "epoch": 1723} {"train_loss": -6.0628206843421575, "global_step": 72407, "epoch": 1723, "val_loss": 74750.140625} {"train_loss": -6.145015716552734, "global_step": 72408, "epoch": 1724} {"train_loss": -6.024531841278076, "global_step": 72409, "epoch": 1724} {"train_loss": -5.951883316040039, "global_step": 72410, "epoch": 1724} {"train_loss": -6.1053690910339355, "global_step": 72411, "epoch": 1724} {"train_loss": -6.000082969665527, "global_step": 72412, "epoch": 1724} {"train_loss": -5.886911392211914, "global_step": 72413, "epoch": 1724} {"train_loss": -6.147828578948975, "global_step": 72414, "epoch": 1724} {"train_loss": -6.004776954650879, "global_step": 72415, "epoch": 1724} {"train_loss": -6.075872898101807, "global_step": 72416, "epoch": 1724} {"train_loss": -6.061912536621094, "global_step": 72417, "epoch": 1724} {"train_loss": -5.9730730056762695, "global_step": 72418, "epoch": 1724} {"train_loss": -6.057009220123291, "global_step": 72419, "epoch": 1724} {"train_loss": -6.073971271514893, "global_step": 72420, "epoch": 1724} {"train_loss": -6.104846477508545, "global_step": 72421, "epoch": 1724} {"train_loss": -6.083696365356445, "global_step": 72422, "epoch": 1724} {"train_loss": -6.093517303466797, "global_step": 72423, "epoch": 1724} {"train_loss": -5.974969863891602, "global_step": 72424, "epoch": 1724} {"train_loss": -6.007439613342285, "global_step": 72425, "epoch": 1724} {"train_loss": -6.001943588256836, "global_step": 72426, "epoch": 1724} {"train_loss": -5.910982608795166, "global_step": 72427, "epoch": 1724} {"train_loss": -5.970921993255615, "global_step": 72428, "epoch": 1724} {"train_loss": -6.0032548904418945, "global_step": 72429, "epoch": 1724} {"train_loss": -6.018902778625488, "global_step": 72430, "epoch": 1724} {"train_loss": -6.095100402832031, "global_step": 72431, "epoch": 1724} {"train_loss": -6.18184757232666, "global_step": 72432, "epoch": 1724} {"train_loss": -6.055703639984131, "global_step": 72433, "epoch": 1724} {"train_loss": -6.075334548950195, "global_step": 72434, "epoch": 1724} {"train_loss": -6.011996269226074, "global_step": 72435, "epoch": 1724} {"train_loss": -6.206780910491943, "global_step": 72436, "epoch": 1724} {"train_loss": -5.913847923278809, "global_step": 72437, "epoch": 1724} {"train_loss": -6.044251441955566, "global_step": 72438, "epoch": 1724} {"train_loss": -6.156501770019531, "global_step": 72439, "epoch": 1724} {"train_loss": -6.191529273986816, "global_step": 72440, "epoch": 1724} {"train_loss": -6.0961103439331055, "global_step": 72441, "epoch": 1724} {"train_loss": -6.045040130615234, "global_step": 72442, "epoch": 1724} {"train_loss": -6.170119285583496, "global_step": 72443, "epoch": 1724} {"train_loss": -5.913614273071289, "global_step": 72444, "epoch": 1724} {"train_loss": -6.078214645385742, "global_step": 72445, "epoch": 1724} {"train_loss": -6.049130439758301, "global_step": 72446, "epoch": 1724} {"train_loss": -6.153146743774414, "global_step": 72447, "epoch": 1724} {"train_loss": -6.141450881958008, "global_step": 72448, "epoch": 1724} {"train_loss": -6.056423164549328, "global_step": 72449, "epoch": 1724, "val_loss": 74871.7734375} {"train_loss": -6.041110992431641, "global_step": 72450, "epoch": 1725} {"train_loss": -6.038288593292236, "global_step": 72451, "epoch": 1725} {"train_loss": -6.084514617919922, "global_step": 72452, "epoch": 1725} {"train_loss": -6.127892017364502, "global_step": 72453, "epoch": 1725} {"train_loss": -6.107037544250488, "global_step": 72454, "epoch": 1725} {"train_loss": -6.066432952880859, "global_step": 72455, "epoch": 1725} {"train_loss": -6.144170761108398, "global_step": 72456, "epoch": 1725} {"train_loss": -6.215528964996338, "global_step": 72457, "epoch": 1725} {"train_loss": -5.999112129211426, "global_step": 72458, "epoch": 1725} {"train_loss": -6.063655853271484, "global_step": 72459, "epoch": 1725} {"train_loss": -6.03853702545166, "global_step": 72460, "epoch": 1725} {"train_loss": -6.094147205352783, "global_step": 72461, "epoch": 1725} {"train_loss": -6.001253128051758, "global_step": 72462, "epoch": 1725} {"train_loss": -5.987369060516357, "global_step": 72463, "epoch": 1725} {"train_loss": -5.906903266906738, "global_step": 72464, "epoch": 1725} {"train_loss": -5.911807060241699, "global_step": 72465, "epoch": 1725} {"train_loss": -6.120885372161865, "global_step": 72466, "epoch": 1725} {"train_loss": -5.774466514587402, "global_step": 72467, "epoch": 1725} {"train_loss": -5.941145420074463, "global_step": 72468, "epoch": 1725} {"train_loss": -5.939430236816406, "global_step": 72469, "epoch": 1725} {"train_loss": -5.825099945068359, "global_step": 72470, "epoch": 1725} {"train_loss": -6.1336822509765625, "global_step": 72471, "epoch": 1725} {"train_loss": -5.997518539428711, "global_step": 72472, "epoch": 1725} {"train_loss": -6.060148239135742, "global_step": 72473, "epoch": 1725} {"train_loss": -6.030527114868164, "global_step": 72474, "epoch": 1725} {"train_loss": -6.092565059661865, "global_step": 72475, "epoch": 1725} {"train_loss": -6.08568000793457, "global_step": 72476, "epoch": 1725} {"train_loss": -6.036283493041992, "global_step": 72477, "epoch": 1725} {"train_loss": -5.90377950668335, "global_step": 72478, "epoch": 1725} {"train_loss": -5.953315734863281, "global_step": 72479, "epoch": 1725} {"train_loss": -6.04348611831665, "global_step": 72480, "epoch": 1725} {"train_loss": -5.993057727813721, "global_step": 72481, "epoch": 1725} {"train_loss": -6.108091354370117, "global_step": 72482, "epoch": 1725} {"train_loss": -6.063754081726074, "global_step": 72483, "epoch": 1725} {"train_loss": -6.0212812423706055, "global_step": 72484, "epoch": 1725} {"train_loss": -5.908553123474121, "global_step": 72485, "epoch": 1725} {"train_loss": -6.078466892242432, "global_step": 72486, "epoch": 1725} {"train_loss": -6.020712852478027, "global_step": 72487, "epoch": 1725} {"train_loss": -5.93837308883667, "global_step": 72488, "epoch": 1725} {"train_loss": -6.003814697265625, "global_step": 72489, "epoch": 1725} {"train_loss": -5.995124816894531, "global_step": 72490, "epoch": 1725} {"train_loss": -6.020731721605573, "global_step": 72491, "epoch": 1725, "val_loss": 74976.625} {"train_loss": -6.072434425354004, "global_step": 72492, "epoch": 1726} {"train_loss": -6.021211624145508, "global_step": 72493, "epoch": 1726} {"train_loss": -5.89058780670166, "global_step": 72494, "epoch": 1726} {"train_loss": -6.111845970153809, "global_step": 72495, "epoch": 1726} {"train_loss": -5.981215476989746, "global_step": 72496, "epoch": 1726} {"train_loss": -6.050156593322754, "global_step": 72497, "epoch": 1726} {"train_loss": -6.176837921142578, "global_step": 72498, "epoch": 1726} {"train_loss": -5.954875946044922, "global_step": 72499, "epoch": 1726} {"train_loss": -6.011891841888428, "global_step": 72500, "epoch": 1726} {"train_loss": -6.038928985595703, "global_step": 72501, "epoch": 1726} {"train_loss": -6.01666259765625, "global_step": 72502, "epoch": 1726} {"train_loss": -5.949296951293945, "global_step": 72503, "epoch": 1726} {"train_loss": -6.006847381591797, "global_step": 72504, "epoch": 1726} {"train_loss": -5.977828025817871, "global_step": 72505, "epoch": 1726} {"train_loss": -6.082712173461914, "global_step": 72506, "epoch": 1726} {"train_loss": -6.112326622009277, "global_step": 72507, "epoch": 1726} {"train_loss": -5.934837341308594, "global_step": 72508, "epoch": 1726} {"train_loss": -6.10236930847168, "global_step": 72509, "epoch": 1726} {"train_loss": -6.016298294067383, "global_step": 72510, "epoch": 1726} {"train_loss": -6.195211410522461, "global_step": 72511, "epoch": 1726} {"train_loss": -6.201613426208496, "global_step": 72512, "epoch": 1726} {"train_loss": -6.053876876831055, "global_step": 72513, "epoch": 1726} {"train_loss": -6.135113716125488, "global_step": 72514, "epoch": 1726} {"train_loss": -6.032198905944824, "global_step": 72515, "epoch": 1726} {"train_loss": -6.037512302398682, "global_step": 72516, "epoch": 1726} {"train_loss": -5.998935699462891, "global_step": 72517, "epoch": 1726} {"train_loss": -6.032896041870117, "global_step": 72518, "epoch": 1726} {"train_loss": -6.1414031982421875, "global_step": 72519, "epoch": 1726} {"train_loss": -5.9948835372924805, "global_step": 72520, "epoch": 1726} {"train_loss": -5.971953392028809, "global_step": 72521, "epoch": 1726} {"train_loss": -6.212918281555176, "global_step": 72522, "epoch": 1726} {"train_loss": -6.014939308166504, "global_step": 72523, "epoch": 1726} {"train_loss": -5.943150043487549, "global_step": 72524, "epoch": 1726} {"train_loss": -6.0378875732421875, "global_step": 72525, "epoch": 1726} {"train_loss": -6.091068267822266, "global_step": 72526, "epoch": 1726} {"train_loss": -6.141300201416016, "global_step": 72527, "epoch": 1726} {"train_loss": -6.029784202575684, "global_step": 72528, "epoch": 1726} {"train_loss": -6.045825958251953, "global_step": 72529, "epoch": 1726} {"train_loss": -6.053054332733154, "global_step": 72530, "epoch": 1726} {"train_loss": -5.946283340454102, "global_step": 72531, "epoch": 1726} {"train_loss": -5.9384965896606445, "global_step": 72532, "epoch": 1726} {"train_loss": -6.0413190977913995, "global_step": 72533, "epoch": 1726, "val_loss": 74647.2265625} {"train_loss": -5.911405563354492, "global_step": 72534, "epoch": 1727} {"train_loss": -6.095887184143066, "global_step": 72535, "epoch": 1727} {"train_loss": -5.9052839279174805, "global_step": 72536, "epoch": 1727} {"train_loss": -5.951609134674072, "global_step": 72537, "epoch": 1727} {"train_loss": -5.912096977233887, "global_step": 72538, "epoch": 1727} {"train_loss": -5.987358570098877, "global_step": 72539, "epoch": 1727} {"train_loss": -6.006715774536133, "global_step": 72540, "epoch": 1727} {"train_loss": -5.969085693359375, "global_step": 72541, "epoch": 1727} {"train_loss": -6.151522636413574, "global_step": 72542, "epoch": 1727} {"train_loss": -6.071420669555664, "global_step": 72543, "epoch": 1727} {"train_loss": -6.012534141540527, "global_step": 72544, "epoch": 1727} {"train_loss": -6.025421142578125, "global_step": 72545, "epoch": 1727} {"train_loss": -5.97542667388916, "global_step": 72546, "epoch": 1727} {"train_loss": -6.0468878746032715, "global_step": 72547, "epoch": 1727} {"train_loss": -6.040136337280273, "global_step": 72548, "epoch": 1727} {"train_loss": -6.051246643066406, "global_step": 72549, "epoch": 1727} {"train_loss": -6.202274322509766, "global_step": 72550, "epoch": 1727} {"train_loss": -5.990503787994385, "global_step": 72551, "epoch": 1727} {"train_loss": -5.990396499633789, "global_step": 72552, "epoch": 1727} {"train_loss": -5.992252826690674, "global_step": 72553, "epoch": 1727} {"train_loss": -6.062319278717041, "global_step": 72554, "epoch": 1727} {"train_loss": -6.014814376831055, "global_step": 72555, "epoch": 1727} {"train_loss": -6.055911064147949, "global_step": 72556, "epoch": 1727} {"train_loss": -6.044617176055908, "global_step": 72557, "epoch": 1727} {"train_loss": -6.120223045349121, "global_step": 72558, "epoch": 1727} {"train_loss": -6.05002498626709, "global_step": 72559, "epoch": 1727} {"train_loss": -6.019562721252441, "global_step": 72560, "epoch": 1727} {"train_loss": -6.04364013671875, "global_step": 72561, "epoch": 1727} {"train_loss": -6.070392608642578, "global_step": 72562, "epoch": 1727} {"train_loss": -6.092874050140381, "global_step": 72563, "epoch": 1727} {"train_loss": -6.068750381469727, "global_step": 72564, "epoch": 1727} {"train_loss": -6.125131607055664, "global_step": 72565, "epoch": 1727} {"train_loss": -6.1920166015625, "global_step": 72566, "epoch": 1727} {"train_loss": -6.02441930770874, "global_step": 72567, "epoch": 1727} {"train_loss": -6.087658882141113, "global_step": 72568, "epoch": 1727} {"train_loss": -6.069699287414551, "global_step": 72569, "epoch": 1727} {"train_loss": -6.007862091064453, "global_step": 72570, "epoch": 1727} {"train_loss": -5.986722469329834, "global_step": 72571, "epoch": 1727} {"train_loss": -5.999263763427734, "global_step": 72572, "epoch": 1727} {"train_loss": -5.925439834594727, "global_step": 72573, "epoch": 1727} {"train_loss": -6.1615309715271, "global_step": 72574, "epoch": 1727} {"train_loss": -6.038080817177182, "global_step": 72575, "epoch": 1727, "val_loss": 74959.7578125} {"train_loss": -6.048450469970703, "global_step": 72576, "epoch": 1728} {"train_loss": -6.106377601623535, "global_step": 72577, "epoch": 1728} {"train_loss": -5.845075607299805, "global_step": 72578, "epoch": 1728} {"train_loss": -6.045453071594238, "global_step": 72579, "epoch": 1728} {"train_loss": -5.9658403396606445, "global_step": 72580, "epoch": 1728} {"train_loss": -6.058384418487549, "global_step": 72581, "epoch": 1728} {"train_loss": -6.10460090637207, "global_step": 72582, "epoch": 1728} {"train_loss": -6.1884965896606445, "global_step": 72583, "epoch": 1728} {"train_loss": -6.078255653381348, "global_step": 72584, "epoch": 1728} {"train_loss": -6.068630695343018, "global_step": 72585, "epoch": 1728} {"train_loss": -5.938653945922852, "global_step": 72586, "epoch": 1728} {"train_loss": -6.075477123260498, "global_step": 72587, "epoch": 1728} {"train_loss": -6.006402015686035, "global_step": 72588, "epoch": 1728} {"train_loss": -6.017268180847168, "global_step": 72589, "epoch": 1728} {"train_loss": -6.079768180847168, "global_step": 72590, "epoch": 1728} {"train_loss": -5.984583377838135, "global_step": 72591, "epoch": 1728} {"train_loss": -6.110274314880371, "global_step": 72592, "epoch": 1728} {"train_loss": -6.090549468994141, "global_step": 72593, "epoch": 1728} {"train_loss": -6.067944526672363, "global_step": 72594, "epoch": 1728} {"train_loss": -5.999053478240967, "global_step": 72595, "epoch": 1728} {"train_loss": -6.210392951965332, "global_step": 72596, "epoch": 1728} {"train_loss": -6.076142311096191, "global_step": 72597, "epoch": 1728} {"train_loss": -6.163688659667969, "global_step": 72598, "epoch": 1728} {"train_loss": -6.0508341789245605, "global_step": 72599, "epoch": 1728} {"train_loss": -6.134257793426514, "global_step": 72600, "epoch": 1728} {"train_loss": -6.102731704711914, "global_step": 72601, "epoch": 1728} {"train_loss": -5.960752010345459, "global_step": 72602, "epoch": 1728} {"train_loss": -6.142636299133301, "global_step": 72603, "epoch": 1728} {"train_loss": -6.098318099975586, "global_step": 72604, "epoch": 1728} {"train_loss": -5.9115214347839355, "global_step": 72605, "epoch": 1728} {"train_loss": -6.269222259521484, "global_step": 72606, "epoch": 1728} {"train_loss": -5.90327787399292, "global_step": 72607, "epoch": 1728} {"train_loss": -5.847979545593262, "global_step": 72608, "epoch": 1728} {"train_loss": -6.117134094238281, "global_step": 72609, "epoch": 1728} {"train_loss": -5.972612380981445, "global_step": 72610, "epoch": 1728} {"train_loss": -5.928571701049805, "global_step": 72611, "epoch": 1728} {"train_loss": -6.017258644104004, "global_step": 72612, "epoch": 1728} {"train_loss": -5.899472236633301, "global_step": 72613, "epoch": 1728} {"train_loss": -6.120122909545898, "global_step": 72614, "epoch": 1728} {"train_loss": -6.003778457641602, "global_step": 72615, "epoch": 1728} {"train_loss": -5.935352802276611, "global_step": 72616, "epoch": 1728} {"train_loss": -6.043492816743397, "global_step": 72617, "epoch": 1728, "val_loss": 74967.9453125} {"train_loss": -6.011290550231934, "global_step": 72618, "epoch": 1729} {"train_loss": -6.033788681030273, "global_step": 72619, "epoch": 1729} {"train_loss": -6.056190013885498, "global_step": 72620, "epoch": 1729} {"train_loss": -6.001893997192383, "global_step": 72621, "epoch": 1729} {"train_loss": -6.090825080871582, "global_step": 72622, "epoch": 1729} {"train_loss": -5.979867458343506, "global_step": 72623, "epoch": 1729} {"train_loss": -6.024937629699707, "global_step": 72624, "epoch": 1729} {"train_loss": -6.026906490325928, "global_step": 72625, "epoch": 1729} {"train_loss": -6.104598045349121, "global_step": 72626, "epoch": 1729} {"train_loss": -6.13257360458374, "global_step": 72627, "epoch": 1729} {"train_loss": -6.0548295974731445, "global_step": 72628, "epoch": 1729} {"train_loss": -6.009574890136719, "global_step": 72629, "epoch": 1729} {"train_loss": -6.103482723236084, "global_step": 72630, "epoch": 1729} {"train_loss": -6.0984907150268555, "global_step": 72631, "epoch": 1729} {"train_loss": -5.991456508636475, "global_step": 72632, "epoch": 1729} {"train_loss": -6.094771385192871, "global_step": 72633, "epoch": 1729} {"train_loss": -6.171021938323975, "global_step": 72634, "epoch": 1729} {"train_loss": -6.080390930175781, "global_step": 72635, "epoch": 1729} {"train_loss": -5.947502136230469, "global_step": 72636, "epoch": 1729} {"train_loss": -6.001395225524902, "global_step": 72637, "epoch": 1729} {"train_loss": -6.0061798095703125, "global_step": 72638, "epoch": 1729} {"train_loss": -5.99127197265625, "global_step": 72639, "epoch": 1729} {"train_loss": -6.0279130935668945, "global_step": 72640, "epoch": 1729} {"train_loss": -6.136664867401123, "global_step": 72641, "epoch": 1729} {"train_loss": -6.063520908355713, "global_step": 72642, "epoch": 1729} {"train_loss": -6.147695064544678, "global_step": 72643, "epoch": 1729} {"train_loss": -6.137049674987793, "global_step": 72644, "epoch": 1729} {"train_loss": -6.153478622436523, "global_step": 72645, "epoch": 1729} {"train_loss": -6.068264007568359, "global_step": 72646, "epoch": 1729} {"train_loss": -6.042289733886719, "global_step": 72647, "epoch": 1729} {"train_loss": -6.123348236083984, "global_step": 72648, "epoch": 1729} {"train_loss": -6.122365951538086, "global_step": 72649, "epoch": 1729} {"train_loss": -5.952948093414307, "global_step": 72650, "epoch": 1729} {"train_loss": -6.04733943939209, "global_step": 72651, "epoch": 1729} {"train_loss": -6.042205810546875, "global_step": 72652, "epoch": 1729} {"train_loss": -6.03341007232666, "global_step": 72653, "epoch": 1729} {"train_loss": -6.062661170959473, "global_step": 72654, "epoch": 1729} {"train_loss": -6.185053825378418, "global_step": 72655, "epoch": 1729} {"train_loss": -6.152311325073242, "global_step": 72656, "epoch": 1729} {"train_loss": -5.97998046875, "global_step": 72657, "epoch": 1729} {"train_loss": -6.050298690795898, "global_step": 72658, "epoch": 1729} {"train_loss": -6.060936405545189, "global_step": 72659, "epoch": 1729, "val_loss": 74822.578125} {"train_loss": -5.986828327178955, "global_step": 72660, "epoch": 1730} {"train_loss": -6.130387306213379, "global_step": 72661, "epoch": 1730} {"train_loss": -6.124664306640625, "global_step": 72662, "epoch": 1730} {"train_loss": -5.936821937561035, "global_step": 72663, "epoch": 1730} {"train_loss": -5.949191093444824, "global_step": 72664, "epoch": 1730} {"train_loss": -6.039976596832275, "global_step": 72665, "epoch": 1730} {"train_loss": -6.098657608032227, "global_step": 72666, "epoch": 1730} {"train_loss": -6.09536075592041, "global_step": 72667, "epoch": 1730} {"train_loss": -5.893250465393066, "global_step": 72668, "epoch": 1730} {"train_loss": -5.996506214141846, "global_step": 72669, "epoch": 1730} {"train_loss": -6.091108322143555, "global_step": 72670, "epoch": 1730} {"train_loss": -6.007696628570557, "global_step": 72671, "epoch": 1730} {"train_loss": -6.122982501983643, "global_step": 72672, "epoch": 1730} {"train_loss": -6.104631423950195, "global_step": 72673, "epoch": 1730} {"train_loss": -5.999107360839844, "global_step": 72674, "epoch": 1730} {"train_loss": -6.080575466156006, "global_step": 72675, "epoch": 1730} {"train_loss": -6.036152362823486, "global_step": 72676, "epoch": 1730} {"train_loss": -6.005499362945557, "global_step": 72677, "epoch": 1730} {"train_loss": -5.985622882843018, "global_step": 72678, "epoch": 1730} {"train_loss": -6.033657073974609, "global_step": 72679, "epoch": 1730} {"train_loss": -5.9913740158081055, "global_step": 72680, "epoch": 1730} {"train_loss": -6.126567840576172, "global_step": 72681, "epoch": 1730} {"train_loss": -6.123699188232422, "global_step": 72682, "epoch": 1730} {"train_loss": -6.164676666259766, "global_step": 72683, "epoch": 1730} {"train_loss": -6.034897327423096, "global_step": 72684, "epoch": 1730} {"train_loss": -5.964491844177246, "global_step": 72685, "epoch": 1730} {"train_loss": -6.058456897735596, "global_step": 72686, "epoch": 1730} {"train_loss": -6.108633995056152, "global_step": 72687, "epoch": 1730} {"train_loss": -6.042956829071045, "global_step": 72688, "epoch": 1730} {"train_loss": -6.037485122680664, "global_step": 72689, "epoch": 1730} {"train_loss": -6.123653411865234, "global_step": 72690, "epoch": 1730} {"train_loss": -6.083773612976074, "global_step": 72691, "epoch": 1730} {"train_loss": -5.919751167297363, "global_step": 72692, "epoch": 1730} {"train_loss": -6.01824951171875, "global_step": 72693, "epoch": 1730} {"train_loss": -6.027674674987793, "global_step": 72694, "epoch": 1730} {"train_loss": -6.152436256408691, "global_step": 72695, "epoch": 1730} {"train_loss": -6.01772403717041, "global_step": 72696, "epoch": 1730} {"train_loss": -5.934456825256348, "global_step": 72697, "epoch": 1730} {"train_loss": -6.050254821777344, "global_step": 72698, "epoch": 1730} {"train_loss": -6.09998893737793, "global_step": 72699, "epoch": 1730} {"train_loss": -5.984249114990234, "global_step": 72700, "epoch": 1730} {"train_loss": -6.04546586672465, "global_step": 72701, "epoch": 1730, "val_loss": 74905.96875} {"train_loss": -6.007951736450195, "global_step": 72702, "epoch": 1731} {"train_loss": -6.117342948913574, "global_step": 72703, "epoch": 1731} {"train_loss": -6.05064058303833, "global_step": 72704, "epoch": 1731} {"train_loss": -6.068134307861328, "global_step": 72705, "epoch": 1731} {"train_loss": -6.058789253234863, "global_step": 72706, "epoch": 1731} {"train_loss": -6.081037998199463, "global_step": 72707, "epoch": 1731} {"train_loss": -5.994805335998535, "global_step": 72708, "epoch": 1731} {"train_loss": -6.015778541564941, "global_step": 72709, "epoch": 1731} {"train_loss": -6.140172004699707, "global_step": 72710, "epoch": 1731} {"train_loss": -5.936521530151367, "global_step": 72711, "epoch": 1731} {"train_loss": -6.035889625549316, "global_step": 72712, "epoch": 1731} {"train_loss": -6.041110515594482, "global_step": 72713, "epoch": 1731} {"train_loss": -6.120089054107666, "global_step": 72714, "epoch": 1731} {"train_loss": -5.961028099060059, "global_step": 72715, "epoch": 1731} {"train_loss": -6.097329616546631, "global_step": 72716, "epoch": 1731} {"train_loss": -6.129082679748535, "global_step": 72717, "epoch": 1731} {"train_loss": -6.036897659301758, "global_step": 72718, "epoch": 1731} {"train_loss": -6.02069091796875, "global_step": 72719, "epoch": 1731} {"train_loss": -5.996694087982178, "global_step": 72720, "epoch": 1731} {"train_loss": -5.952776908874512, "global_step": 72721, "epoch": 1731} {"train_loss": -6.087225914001465, "global_step": 72722, "epoch": 1731} {"train_loss": -5.850341320037842, "global_step": 72723, "epoch": 1731} {"train_loss": -6.062958240509033, "global_step": 72724, "epoch": 1731} {"train_loss": -5.876010894775391, "global_step": 72725, "epoch": 1731} {"train_loss": -5.904489517211914, "global_step": 72726, "epoch": 1731} {"train_loss": -6.165083885192871, "global_step": 72727, "epoch": 1731} {"train_loss": -5.722458839416504, "global_step": 72728, "epoch": 1731} {"train_loss": -6.114623546600342, "global_step": 72729, "epoch": 1731} {"train_loss": -5.900109767913818, "global_step": 72730, "epoch": 1731} {"train_loss": -5.987502098083496, "global_step": 72731, "epoch": 1731} {"train_loss": -6.026493072509766, "global_step": 72732, "epoch": 1731} {"train_loss": -5.997032165527344, "global_step": 72733, "epoch": 1731} {"train_loss": -5.995967864990234, "global_step": 72734, "epoch": 1731} {"train_loss": -6.020283222198486, "global_step": 72735, "epoch": 1731} {"train_loss": -5.990670680999756, "global_step": 72736, "epoch": 1731} {"train_loss": -5.920853137969971, "global_step": 72737, "epoch": 1731} {"train_loss": -6.140213966369629, "global_step": 72738, "epoch": 1731} {"train_loss": -5.988373756408691, "global_step": 72739, "epoch": 1731} {"train_loss": -6.075791358947754, "global_step": 72740, "epoch": 1731} {"train_loss": -6.021286964416504, "global_step": 72741, "epoch": 1731} {"train_loss": -5.837348937988281, "global_step": 72742, "epoch": 1731} {"train_loss": -6.0136684122539705, "global_step": 72743, "epoch": 1731, "val_loss": 74891.953125} {"train_loss": -6.169415473937988, "global_step": 72744, "epoch": 1732} {"train_loss": -6.061556339263916, "global_step": 72745, "epoch": 1732} {"train_loss": -5.970743179321289, "global_step": 72746, "epoch": 1732} {"train_loss": -5.904043197631836, "global_step": 72747, "epoch": 1732} {"train_loss": -6.07921838760376, "global_step": 72748, "epoch": 1732} {"train_loss": -6.145188331604004, "global_step": 72749, "epoch": 1732} {"train_loss": -6.058741569519043, "global_step": 72750, "epoch": 1732} {"train_loss": -5.995821952819824, "global_step": 72751, "epoch": 1732} {"train_loss": -6.007498741149902, "global_step": 72752, "epoch": 1732} {"train_loss": -5.979445457458496, "global_step": 72753, "epoch": 1732} {"train_loss": -6.124373435974121, "global_step": 72754, "epoch": 1732} {"train_loss": -6.039538860321045, "global_step": 72755, "epoch": 1732} {"train_loss": -6.1186628341674805, "global_step": 72756, "epoch": 1732} {"train_loss": -5.951028823852539, "global_step": 72757, "epoch": 1732} {"train_loss": -6.045315742492676, "global_step": 72758, "epoch": 1732} {"train_loss": -6.12217903137207, "global_step": 72759, "epoch": 1732} {"train_loss": -5.899644374847412, "global_step": 72760, "epoch": 1732} {"train_loss": -5.965201377868652, "global_step": 72761, "epoch": 1732} {"train_loss": -6.1243438720703125, "global_step": 72762, "epoch": 1732} {"train_loss": -6.057012557983398, "global_step": 72763, "epoch": 1732} {"train_loss": -5.944011688232422, "global_step": 72764, "epoch": 1732} {"train_loss": -5.996045112609863, "global_step": 72765, "epoch": 1732} {"train_loss": -5.860151767730713, "global_step": 72766, "epoch": 1732} {"train_loss": -5.985567569732666, "global_step": 72767, "epoch": 1732} {"train_loss": -5.970380783081055, "global_step": 72768, "epoch": 1732} {"train_loss": -5.873974323272705, "global_step": 72769, "epoch": 1732} {"train_loss": -6.09650993347168, "global_step": 72770, "epoch": 1732} {"train_loss": -6.0082879066467285, "global_step": 72771, "epoch": 1732} {"train_loss": -6.046748161315918, "global_step": 72772, "epoch": 1732} {"train_loss": -6.041347026824951, "global_step": 72773, "epoch": 1732} {"train_loss": -6.0603437423706055, "global_step": 72774, "epoch": 1732} {"train_loss": -5.960850715637207, "global_step": 72775, "epoch": 1732} {"train_loss": -5.976099967956543, "global_step": 72776, "epoch": 1732} {"train_loss": -6.009629249572754, "global_step": 72777, "epoch": 1732} {"train_loss": -6.0289812088012695, "global_step": 72778, "epoch": 1732} {"train_loss": -6.135345458984375, "global_step": 72779, "epoch": 1732} {"train_loss": -5.9807915687561035, "global_step": 72780, "epoch": 1732} {"train_loss": -6.066800117492676, "global_step": 72781, "epoch": 1732} {"train_loss": -6.070900917053223, "global_step": 72782, "epoch": 1732} {"train_loss": -5.947266578674316, "global_step": 72783, "epoch": 1732} {"train_loss": -6.083593368530273, "global_step": 72784, "epoch": 1732} {"train_loss": -6.026867366972423, "global_step": 72785, "epoch": 1732, "val_loss": 74995.359375} {"train_loss": -6.122602462768555, "global_step": 72786, "epoch": 1733} {"train_loss": -6.100678443908691, "global_step": 72787, "epoch": 1733} {"train_loss": -6.059385299682617, "global_step": 72788, "epoch": 1733} {"train_loss": -6.086153984069824, "global_step": 72789, "epoch": 1733} {"train_loss": -6.004196643829346, "global_step": 72790, "epoch": 1733} {"train_loss": -6.144713401794434, "global_step": 72791, "epoch": 1733} {"train_loss": -6.050334453582764, "global_step": 72792, "epoch": 1733} {"train_loss": -6.046648025512695, "global_step": 72793, "epoch": 1733} {"train_loss": -6.122316837310791, "global_step": 72794, "epoch": 1733} {"train_loss": -6.148009300231934, "global_step": 72795, "epoch": 1733} {"train_loss": -6.050383567810059, "global_step": 72796, "epoch": 1733} {"train_loss": -5.95208215713501, "global_step": 72797, "epoch": 1733} {"train_loss": -6.071254730224609, "global_step": 72798, "epoch": 1733} {"train_loss": -6.088807582855225, "global_step": 72799, "epoch": 1733} {"train_loss": -5.996650218963623, "global_step": 72800, "epoch": 1733} {"train_loss": -6.066220760345459, "global_step": 72801, "epoch": 1733} {"train_loss": -6.114131927490234, "global_step": 72802, "epoch": 1733} {"train_loss": -6.009586334228516, "global_step": 72803, "epoch": 1733} {"train_loss": -6.085516452789307, "global_step": 72804, "epoch": 1733} {"train_loss": -6.1267805099487305, "global_step": 72805, "epoch": 1733} {"train_loss": -5.980189323425293, "global_step": 72806, "epoch": 1733} {"train_loss": -6.017937183380127, "global_step": 72807, "epoch": 1733} {"train_loss": -6.015294075012207, "global_step": 72808, "epoch": 1733} {"train_loss": -6.033016204833984, "global_step": 72809, "epoch": 1733} {"train_loss": -5.8948516845703125, "global_step": 72810, "epoch": 1733} {"train_loss": -5.969485282897949, "global_step": 72811, "epoch": 1733} {"train_loss": -6.111812591552734, "global_step": 72812, "epoch": 1733} {"train_loss": -6.019628047943115, "global_step": 72813, "epoch": 1733} {"train_loss": -6.030259132385254, "global_step": 72814, "epoch": 1733} {"train_loss": -6.004637241363525, "global_step": 72815, "epoch": 1733} {"train_loss": -6.086864471435547, "global_step": 72816, "epoch": 1733} {"train_loss": -5.978287220001221, "global_step": 72817, "epoch": 1733} {"train_loss": -6.1504974365234375, "global_step": 72818, "epoch": 1733} {"train_loss": -6.076825141906738, "global_step": 72819, "epoch": 1733} {"train_loss": -6.0389404296875, "global_step": 72820, "epoch": 1733} {"train_loss": -6.027640342712402, "global_step": 72821, "epoch": 1733} {"train_loss": -6.121850967407227, "global_step": 72822, "epoch": 1733} {"train_loss": -5.995771408081055, "global_step": 72823, "epoch": 1733} {"train_loss": -6.1445136070251465, "global_step": 72824, "epoch": 1733} {"train_loss": -6.135759353637695, "global_step": 72825, "epoch": 1733} {"train_loss": -6.081789016723633, "global_step": 72826, "epoch": 1733} {"train_loss": -6.056805565243676, "global_step": 72827, "epoch": 1733, "val_loss": 74925.7109375} {"train_loss": -6.039855003356934, "global_step": 72828, "epoch": 1734} {"train_loss": -6.058964729309082, "global_step": 72829, "epoch": 1734} {"train_loss": -6.006890296936035, "global_step": 72830, "epoch": 1734} {"train_loss": -5.921170234680176, "global_step": 72831, "epoch": 1734} {"train_loss": -6.202674865722656, "global_step": 72832, "epoch": 1734} {"train_loss": -6.173834323883057, "global_step": 72833, "epoch": 1734} {"train_loss": -6.061647891998291, "global_step": 72834, "epoch": 1734} {"train_loss": -6.078712463378906, "global_step": 72835, "epoch": 1734} {"train_loss": -6.054106712341309, "global_step": 72836, "epoch": 1734} {"train_loss": -6.074826240539551, "global_step": 72837, "epoch": 1734} {"train_loss": -6.097355365753174, "global_step": 72838, "epoch": 1734} {"train_loss": -6.115789413452148, "global_step": 72839, "epoch": 1734} {"train_loss": -6.09044885635376, "global_step": 72840, "epoch": 1734} {"train_loss": -6.207805633544922, "global_step": 72841, "epoch": 1734} {"train_loss": -5.991316795349121, "global_step": 72842, "epoch": 1734} {"train_loss": -6.031031608581543, "global_step": 72843, "epoch": 1734} {"train_loss": -6.192025184631348, "global_step": 72844, "epoch": 1734} {"train_loss": -5.9918999671936035, "global_step": 72845, "epoch": 1734} {"train_loss": -6.034427642822266, "global_step": 72846, "epoch": 1734} {"train_loss": -6.030486106872559, "global_step": 72847, "epoch": 1734} {"train_loss": -6.1910014152526855, "global_step": 72848, "epoch": 1734} {"train_loss": -6.046248912811279, "global_step": 72849, "epoch": 1734} {"train_loss": -6.192842483520508, "global_step": 72850, "epoch": 1734} {"train_loss": -6.106749534606934, "global_step": 72851, "epoch": 1734} {"train_loss": -6.168512344360352, "global_step": 72852, "epoch": 1734} {"train_loss": -6.030778884887695, "global_step": 72853, "epoch": 1734} {"train_loss": -5.89085578918457, "global_step": 72854, "epoch": 1734} {"train_loss": -5.964267730712891, "global_step": 72855, "epoch": 1734} {"train_loss": -6.04377555847168, "global_step": 72856, "epoch": 1734} {"train_loss": -6.03150749206543, "global_step": 72857, "epoch": 1734} {"train_loss": -6.105824947357178, "global_step": 72858, "epoch": 1734} {"train_loss": -6.1833882331848145, "global_step": 72859, "epoch": 1734} {"train_loss": -6.0118913650512695, "global_step": 72860, "epoch": 1734} {"train_loss": -6.0869140625, "global_step": 72861, "epoch": 1734} {"train_loss": -6.031452178955078, "global_step": 72862, "epoch": 1734} {"train_loss": -6.034021377563477, "global_step": 72863, "epoch": 1734} {"train_loss": -6.039433479309082, "global_step": 72864, "epoch": 1734} {"train_loss": -6.0374836921691895, "global_step": 72865, "epoch": 1734} {"train_loss": -6.020109176635742, "global_step": 72866, "epoch": 1734} {"train_loss": -6.068992614746094, "global_step": 72867, "epoch": 1734} {"train_loss": -6.015820503234863, "global_step": 72868, "epoch": 1734} {"train_loss": -6.065907217207409, "global_step": 72869, "epoch": 1734, "val_loss": 74913.8046875} {"train_loss": -5.957775592803955, "global_step": 72870, "epoch": 1735} {"train_loss": -6.091992378234863, "global_step": 72871, "epoch": 1735} {"train_loss": -5.930461883544922, "global_step": 72872, "epoch": 1735} {"train_loss": -5.892075538635254, "global_step": 72873, "epoch": 1735} {"train_loss": -6.128778457641602, "global_step": 72874, "epoch": 1735} {"train_loss": -6.039880752563477, "global_step": 72875, "epoch": 1735} {"train_loss": -6.130598068237305, "global_step": 72876, "epoch": 1735} {"train_loss": -5.948481559753418, "global_step": 72877, "epoch": 1735} {"train_loss": -6.086206436157227, "global_step": 72878, "epoch": 1735} {"train_loss": -6.010830402374268, "global_step": 72879, "epoch": 1735} {"train_loss": -6.040224552154541, "global_step": 72880, "epoch": 1735} {"train_loss": -6.042824745178223, "global_step": 72881, "epoch": 1735} {"train_loss": -6.124270915985107, "global_step": 72882, "epoch": 1735} {"train_loss": -6.100839614868164, "global_step": 72883, "epoch": 1735} {"train_loss": -6.122737407684326, "global_step": 72884, "epoch": 1735} {"train_loss": -6.041605472564697, "global_step": 72885, "epoch": 1735} {"train_loss": -6.105170249938965, "global_step": 72886, "epoch": 1735} {"train_loss": -6.107419013977051, "global_step": 72887, "epoch": 1735} {"train_loss": -6.107874870300293, "global_step": 72888, "epoch": 1735} {"train_loss": -6.124084949493408, "global_step": 72889, "epoch": 1735} {"train_loss": -6.108776569366455, "global_step": 72890, "epoch": 1735} {"train_loss": -6.09921932220459, "global_step": 72891, "epoch": 1735} {"train_loss": -6.094582557678223, "global_step": 72892, "epoch": 1735} {"train_loss": -6.053225994110107, "global_step": 72893, "epoch": 1735} {"train_loss": -6.0481672286987305, "global_step": 72894, "epoch": 1735} {"train_loss": -6.06827449798584, "global_step": 72895, "epoch": 1735} {"train_loss": -5.952934265136719, "global_step": 72896, "epoch": 1735} {"train_loss": -6.036768913269043, "global_step": 72897, "epoch": 1735} {"train_loss": -6.158125877380371, "global_step": 72898, "epoch": 1735} {"train_loss": -5.967911720275879, "global_step": 72899, "epoch": 1735} {"train_loss": -6.235272407531738, "global_step": 72900, "epoch": 1735} {"train_loss": -5.955970764160156, "global_step": 72901, "epoch": 1735} {"train_loss": -5.95673942565918, "global_step": 72902, "epoch": 1735} {"train_loss": -6.039886474609375, "global_step": 72903, "epoch": 1735} {"train_loss": -6.052310943603516, "global_step": 72904, "epoch": 1735} {"train_loss": -6.018806457519531, "global_step": 72905, "epoch": 1735} {"train_loss": -5.980741500854492, "global_step": 72906, "epoch": 1735} {"train_loss": -6.084460258483887, "global_step": 72907, "epoch": 1735} {"train_loss": -5.994380950927734, "global_step": 72908, "epoch": 1735} {"train_loss": -5.992918968200684, "global_step": 72909, "epoch": 1735} {"train_loss": -6.01806640625, "global_step": 72910, "epoch": 1735} {"train_loss": -6.052250669116066, "global_step": 72911, "epoch": 1735, "val_loss": 75145.09375} {"train_loss": -6.002141952514648, "global_step": 72912, "epoch": 1736} {"train_loss": -6.053345680236816, "global_step": 72913, "epoch": 1736} {"train_loss": -5.91696834564209, "global_step": 72914, "epoch": 1736} {"train_loss": -6.042055606842041, "global_step": 72915, "epoch": 1736} {"train_loss": -6.080191612243652, "global_step": 72916, "epoch": 1736} {"train_loss": -5.907075881958008, "global_step": 72917, "epoch": 1736} {"train_loss": -6.081625461578369, "global_step": 72918, "epoch": 1736} {"train_loss": -6.177988052368164, "global_step": 72919, "epoch": 1736} {"train_loss": -6.063501358032227, "global_step": 72920, "epoch": 1736} {"train_loss": -6.119290828704834, "global_step": 72921, "epoch": 1736} {"train_loss": -6.114343166351318, "global_step": 72922, "epoch": 1736} {"train_loss": -6.109095573425293, "global_step": 72923, "epoch": 1736} {"train_loss": -5.980645179748535, "global_step": 72924, "epoch": 1736} {"train_loss": -6.012128829956055, "global_step": 72925, "epoch": 1736} {"train_loss": -6.066424369812012, "global_step": 72926, "epoch": 1736} {"train_loss": -6.043319225311279, "global_step": 72927, "epoch": 1736} {"train_loss": -6.211355686187744, "global_step": 72928, "epoch": 1736} {"train_loss": -5.969241142272949, "global_step": 72929, "epoch": 1736} {"train_loss": -6.023679733276367, "global_step": 72930, "epoch": 1736} {"train_loss": -5.9804229736328125, "global_step": 72931, "epoch": 1736} {"train_loss": -6.151846885681152, "global_step": 72932, "epoch": 1736} {"train_loss": -6.1281890869140625, "global_step": 72933, "epoch": 1736} {"train_loss": -6.114766597747803, "global_step": 72934, "epoch": 1736} {"train_loss": -6.063037872314453, "global_step": 72935, "epoch": 1736} {"train_loss": -6.083338737487793, "global_step": 72936, "epoch": 1736} {"train_loss": -6.046653747558594, "global_step": 72937, "epoch": 1736} {"train_loss": -6.019824028015137, "global_step": 72938, "epoch": 1736} {"train_loss": -6.080848217010498, "global_step": 72939, "epoch": 1736} {"train_loss": -6.0576395988464355, "global_step": 72940, "epoch": 1736} {"train_loss": -5.956714630126953, "global_step": 72941, "epoch": 1736} {"train_loss": -5.962305068969727, "global_step": 72942, "epoch": 1736} {"train_loss": -6.0050153732299805, "global_step": 72943, "epoch": 1736} {"train_loss": -6.028135299682617, "global_step": 72944, "epoch": 1736} {"train_loss": -5.995409965515137, "global_step": 72945, "epoch": 1736} {"train_loss": -6.138618469238281, "global_step": 72946, "epoch": 1736} {"train_loss": -6.078969478607178, "global_step": 72947, "epoch": 1736} {"train_loss": -5.967034339904785, "global_step": 72948, "epoch": 1736} {"train_loss": -5.970566749572754, "global_step": 72949, "epoch": 1736} {"train_loss": -6.1809844970703125, "global_step": 72950, "epoch": 1736} {"train_loss": -6.108233451843262, "global_step": 72951, "epoch": 1736} {"train_loss": -6.074450492858887, "global_step": 72952, "epoch": 1736} {"train_loss": -6.055859474908738, "global_step": 72953, "epoch": 1736, "val_loss": 74971.0546875} {"train_loss": -6.130314350128174, "global_step": 72954, "epoch": 1737} {"train_loss": -6.159016132354736, "global_step": 72955, "epoch": 1737} {"train_loss": -6.223196983337402, "global_step": 72956, "epoch": 1737} {"train_loss": -6.043495178222656, "global_step": 72957, "epoch": 1737} {"train_loss": -6.067741870880127, "global_step": 72958, "epoch": 1737} {"train_loss": -6.01451301574707, "global_step": 72959, "epoch": 1737} {"train_loss": -6.087376594543457, "global_step": 72960, "epoch": 1737} {"train_loss": -6.153991222381592, "global_step": 72961, "epoch": 1737} {"train_loss": -6.151254177093506, "global_step": 72962, "epoch": 1737} {"train_loss": -6.025750160217285, "global_step": 72963, "epoch": 1737} {"train_loss": -6.12925910949707, "global_step": 72964, "epoch": 1737} {"train_loss": -6.038482189178467, "global_step": 72965, "epoch": 1737} {"train_loss": -6.032835006713867, "global_step": 72966, "epoch": 1737} {"train_loss": -6.1338276863098145, "global_step": 72967, "epoch": 1737} {"train_loss": -6.080516815185547, "global_step": 72968, "epoch": 1737} {"train_loss": -6.123651504516602, "global_step": 72969, "epoch": 1737} {"train_loss": -6.096251487731934, "global_step": 72970, "epoch": 1737} {"train_loss": -6.039440631866455, "global_step": 72971, "epoch": 1737} {"train_loss": -5.99763298034668, "global_step": 72972, "epoch": 1737} {"train_loss": -5.990774631500244, "global_step": 72973, "epoch": 1737} {"train_loss": -6.058201789855957, "global_step": 72974, "epoch": 1737} {"train_loss": -5.972964286804199, "global_step": 72975, "epoch": 1737} {"train_loss": -5.874843597412109, "global_step": 72976, "epoch": 1737} {"train_loss": -6.143409729003906, "global_step": 72977, "epoch": 1737} {"train_loss": -6.141444206237793, "global_step": 72978, "epoch": 1737} {"train_loss": -6.155679225921631, "global_step": 72979, "epoch": 1737} {"train_loss": -5.925109386444092, "global_step": 72980, "epoch": 1737} {"train_loss": -6.016490936279297, "global_step": 72981, "epoch": 1737} {"train_loss": -5.990616798400879, "global_step": 72982, "epoch": 1737} {"train_loss": -6.011835098266602, "global_step": 72983, "epoch": 1737} {"train_loss": -6.002077102661133, "global_step": 72984, "epoch": 1737} {"train_loss": -6.1451239585876465, "global_step": 72985, "epoch": 1737} {"train_loss": -5.933535575866699, "global_step": 72986, "epoch": 1737} {"train_loss": -6.089702129364014, "global_step": 72987, "epoch": 1737} {"train_loss": -5.879843711853027, "global_step": 72988, "epoch": 1737} {"train_loss": -6.082427024841309, "global_step": 72989, "epoch": 1737} {"train_loss": -6.083440780639648, "global_step": 72990, "epoch": 1737} {"train_loss": -6.1172590255737305, "global_step": 72991, "epoch": 1737} {"train_loss": -6.104800224304199, "global_step": 72992, "epoch": 1737} {"train_loss": -6.124024391174316, "global_step": 72993, "epoch": 1737} {"train_loss": -6.116851329803467, "global_step": 72994, "epoch": 1737} {"train_loss": -6.065010059447515, "global_step": 72995, "epoch": 1737, "val_loss": 75045.921875} {"train_loss": -6.063323020935059, "global_step": 72996, "epoch": 1738} {"train_loss": -6.126638889312744, "global_step": 72997, "epoch": 1738} {"train_loss": -6.027880668640137, "global_step": 72998, "epoch": 1738} {"train_loss": -6.055149078369141, "global_step": 72999, "epoch": 1738} {"train_loss": -6.069526672363281, "global_step": 73000, "epoch": 1738} {"train_loss": -6.158696174621582, "global_step": 73001, "epoch": 1738} {"train_loss": -6.072525501251221, "global_step": 73002, "epoch": 1738} {"train_loss": -6.176016330718994, "global_step": 73003, "epoch": 1738} {"train_loss": -6.022757053375244, "global_step": 73004, "epoch": 1738} {"train_loss": -6.061756134033203, "global_step": 73005, "epoch": 1738} {"train_loss": -6.042487621307373, "global_step": 73006, "epoch": 1738} {"train_loss": -5.993497371673584, "global_step": 73007, "epoch": 1738} {"train_loss": -6.076744079589844, "global_step": 73008, "epoch": 1738} {"train_loss": -5.9060587882995605, "global_step": 73009, "epoch": 1738} {"train_loss": -6.126433849334717, "global_step": 73010, "epoch": 1738} {"train_loss": -6.047740936279297, "global_step": 73011, "epoch": 1738} {"train_loss": -5.974187850952148, "global_step": 73012, "epoch": 1738} {"train_loss": -5.929797172546387, "global_step": 73013, "epoch": 1738} {"train_loss": -6.036005973815918, "global_step": 73014, "epoch": 1738} {"train_loss": -6.073366641998291, "global_step": 73015, "epoch": 1738} {"train_loss": -5.994058132171631, "global_step": 73016, "epoch": 1738} {"train_loss": -6.132637023925781, "global_step": 73017, "epoch": 1738} {"train_loss": -5.92167329788208, "global_step": 73018, "epoch": 1738} {"train_loss": -6.023207664489746, "global_step": 73019, "epoch": 1738} {"train_loss": -6.1110615730285645, "global_step": 73020, "epoch": 1738} {"train_loss": -6.035186290740967, "global_step": 73021, "epoch": 1738} {"train_loss": -6.083252906799316, "global_step": 73022, "epoch": 1738} {"train_loss": -6.034730911254883, "global_step": 73023, "epoch": 1738} {"train_loss": -6.030864715576172, "global_step": 73024, "epoch": 1738} {"train_loss": -6.0897626876831055, "global_step": 73025, "epoch": 1738} {"train_loss": -6.094785690307617, "global_step": 73026, "epoch": 1738} {"train_loss": -6.171255111694336, "global_step": 73027, "epoch": 1738} {"train_loss": -5.969085216522217, "global_step": 73028, "epoch": 1738} {"train_loss": -6.128423690795898, "global_step": 73029, "epoch": 1738} {"train_loss": -6.021101951599121, "global_step": 73030, "epoch": 1738} {"train_loss": -6.111977577209473, "global_step": 73031, "epoch": 1738} {"train_loss": -6.12421178817749, "global_step": 73032, "epoch": 1738} {"train_loss": -5.95284366607666, "global_step": 73033, "epoch": 1738} {"train_loss": -6.002254486083984, "global_step": 73034, "epoch": 1738} {"train_loss": -5.996742248535156, "global_step": 73035, "epoch": 1738} {"train_loss": -6.098450660705566, "global_step": 73036, "epoch": 1738} {"train_loss": -6.053062314078922, "global_step": 73037, "epoch": 1738, "val_loss": 75035.1796875} {"train_loss": -5.968631744384766, "global_step": 73038, "epoch": 1739} {"train_loss": -6.018679618835449, "global_step": 73039, "epoch": 1739} {"train_loss": -6.067734718322754, "global_step": 73040, "epoch": 1739} {"train_loss": -6.097312927246094, "global_step": 73041, "epoch": 1739} {"train_loss": -6.1036200523376465, "global_step": 73042, "epoch": 1739} {"train_loss": -6.123486518859863, "global_step": 73043, "epoch": 1739} {"train_loss": -6.116336822509766, "global_step": 73044, "epoch": 1739} {"train_loss": -5.968785285949707, "global_step": 73045, "epoch": 1739} {"train_loss": -6.177751541137695, "global_step": 73046, "epoch": 1739} {"train_loss": -6.039967060089111, "global_step": 73047, "epoch": 1739} {"train_loss": -6.03998327255249, "global_step": 73048, "epoch": 1739} {"train_loss": -5.985408782958984, "global_step": 73049, "epoch": 1739} {"train_loss": -5.9148149490356445, "global_step": 73050, "epoch": 1739} {"train_loss": -6.088447570800781, "global_step": 73051, "epoch": 1739} {"train_loss": -6.099111557006836, "global_step": 73052, "epoch": 1739} {"train_loss": -6.0032639503479, "global_step": 73053, "epoch": 1739} {"train_loss": -6.030807971954346, "global_step": 73054, "epoch": 1739} {"train_loss": -6.118330001831055, "global_step": 73055, "epoch": 1739} {"train_loss": -5.873045921325684, "global_step": 73056, "epoch": 1739} {"train_loss": -6.116410255432129, "global_step": 73057, "epoch": 1739} {"train_loss": -6.05942440032959, "global_step": 73058, "epoch": 1739} {"train_loss": -5.927070140838623, "global_step": 73059, "epoch": 1739} {"train_loss": -6.0470075607299805, "global_step": 73060, "epoch": 1739} {"train_loss": -6.01586389541626, "global_step": 73061, "epoch": 1739} {"train_loss": -6.053922653198242, "global_step": 73062, "epoch": 1739} {"train_loss": -5.986903190612793, "global_step": 73063, "epoch": 1739} {"train_loss": -6.027624607086182, "global_step": 73064, "epoch": 1739} {"train_loss": -6.074633598327637, "global_step": 73065, "epoch": 1739} {"train_loss": -6.0187482833862305, "global_step": 73066, "epoch": 1739} {"train_loss": -5.9979400634765625, "global_step": 73067, "epoch": 1739} {"train_loss": -6.066464424133301, "global_step": 73068, "epoch": 1739} {"train_loss": -6.022131443023682, "global_step": 73069, "epoch": 1739} {"train_loss": -6.107149124145508, "global_step": 73070, "epoch": 1739} {"train_loss": -6.052209854125977, "global_step": 73071, "epoch": 1739} {"train_loss": -6.107928276062012, "global_step": 73072, "epoch": 1739} {"train_loss": -6.077005386352539, "global_step": 73073, "epoch": 1739} {"train_loss": -6.052595138549805, "global_step": 73074, "epoch": 1739} {"train_loss": -5.990001678466797, "global_step": 73075, "epoch": 1739} {"train_loss": -6.07086181640625, "global_step": 73076, "epoch": 1739} {"train_loss": -5.97957706451416, "global_step": 73077, "epoch": 1739} {"train_loss": -5.949711799621582, "global_step": 73078, "epoch": 1739} {"train_loss": -6.040533667518979, "global_step": 73079, "epoch": 1739, "val_loss": 74924.7578125} {"train_loss": -6.075337886810303, "global_step": 73080, "epoch": 1740} {"train_loss": -5.97491979598999, "global_step": 73081, "epoch": 1740} {"train_loss": -6.222700595855713, "global_step": 73082, "epoch": 1740} {"train_loss": -6.0126776695251465, "global_step": 73083, "epoch": 1740} {"train_loss": -6.0659637451171875, "global_step": 73084, "epoch": 1740} {"train_loss": -5.873441219329834, "global_step": 73085, "epoch": 1740} {"train_loss": -6.0980401039123535, "global_step": 73086, "epoch": 1740} {"train_loss": -5.997500896453857, "global_step": 73087, "epoch": 1740} {"train_loss": -6.072747230529785, "global_step": 73088, "epoch": 1740} {"train_loss": -5.962326526641846, "global_step": 73089, "epoch": 1740} {"train_loss": -5.954318046569824, "global_step": 73090, "epoch": 1740} {"train_loss": -6.090363502502441, "global_step": 73091, "epoch": 1740} {"train_loss": -6.011308670043945, "global_step": 73092, "epoch": 1740} {"train_loss": -6.1204352378845215, "global_step": 73093, "epoch": 1740} {"train_loss": -6.016129016876221, "global_step": 73094, "epoch": 1740} {"train_loss": -6.196390151977539, "global_step": 73095, "epoch": 1740} {"train_loss": -5.986757755279541, "global_step": 73096, "epoch": 1740} {"train_loss": -5.981809616088867, "global_step": 73097, "epoch": 1740} {"train_loss": -6.115997314453125, "global_step": 73098, "epoch": 1740} {"train_loss": -6.043835163116455, "global_step": 73099, "epoch": 1740} {"train_loss": -6.0943498611450195, "global_step": 73100, "epoch": 1740} {"train_loss": -6.110598564147949, "global_step": 73101, "epoch": 1740} {"train_loss": -5.873208045959473, "global_step": 73102, "epoch": 1740} {"train_loss": -6.108928203582764, "global_step": 73103, "epoch": 1740} {"train_loss": -5.943222999572754, "global_step": 73104, "epoch": 1740} {"train_loss": -5.758127212524414, "global_step": 73105, "epoch": 1740} {"train_loss": -5.994020462036133, "global_step": 73106, "epoch": 1740} {"train_loss": -5.835145950317383, "global_step": 73107, "epoch": 1740} {"train_loss": -6.093259334564209, "global_step": 73108, "epoch": 1740} {"train_loss": -5.924073219299316, "global_step": 73109, "epoch": 1740} {"train_loss": -6.026542663574219, "global_step": 73110, "epoch": 1740} {"train_loss": -6.023856163024902, "global_step": 73111, "epoch": 1740} {"train_loss": -5.976743221282959, "global_step": 73112, "epoch": 1740} {"train_loss": -5.910459041595459, "global_step": 73113, "epoch": 1740} {"train_loss": -5.825652122497559, "global_step": 73114, "epoch": 1740} {"train_loss": -5.978822231292725, "global_step": 73115, "epoch": 1740} {"train_loss": -5.892528057098389, "global_step": 73116, "epoch": 1740} {"train_loss": -5.978145599365234, "global_step": 73117, "epoch": 1740} {"train_loss": -6.015032768249512, "global_step": 73118, "epoch": 1740} {"train_loss": -6.007868766784668, "global_step": 73119, "epoch": 1740} {"train_loss": -6.007967948913574, "global_step": 73120, "epoch": 1740} {"train_loss": -6.0029539948418025, "global_step": 73121, "epoch": 1740, "val_loss": 75061.7109375} {"train_loss": -6.001097679138184, "global_step": 73122, "epoch": 1741} {"train_loss": -6.061478137969971, "global_step": 73123, "epoch": 1741} {"train_loss": -5.969444751739502, "global_step": 73124, "epoch": 1741} {"train_loss": -5.939817905426025, "global_step": 73125, "epoch": 1741} {"train_loss": -6.026115894317627, "global_step": 73126, "epoch": 1741} {"train_loss": -6.205706596374512, "global_step": 73127, "epoch": 1741} {"train_loss": -6.058707237243652, "global_step": 73128, "epoch": 1741} {"train_loss": -6.109259605407715, "global_step": 73129, "epoch": 1741} {"train_loss": -6.153450012207031, "global_step": 73130, "epoch": 1741} {"train_loss": -6.031085014343262, "global_step": 73131, "epoch": 1741} {"train_loss": -6.014543056488037, "global_step": 73132, "epoch": 1741} {"train_loss": -5.990489482879639, "global_step": 73133, "epoch": 1741} {"train_loss": -6.0357770919799805, "global_step": 73134, "epoch": 1741} {"train_loss": -6.032613277435303, "global_step": 73135, "epoch": 1741} {"train_loss": -6.071802139282227, "global_step": 73136, "epoch": 1741} {"train_loss": -6.139187812805176, "global_step": 73137, "epoch": 1741} {"train_loss": -5.923674583435059, "global_step": 73138, "epoch": 1741} {"train_loss": -6.115675449371338, "global_step": 73139, "epoch": 1741} {"train_loss": -6.139476776123047, "global_step": 73140, "epoch": 1741} {"train_loss": -5.964006423950195, "global_step": 73141, "epoch": 1741} {"train_loss": -6.113049507141113, "global_step": 73142, "epoch": 1741} {"train_loss": -5.984794616699219, "global_step": 73143, "epoch": 1741} {"train_loss": -6.0111870765686035, "global_step": 73144, "epoch": 1741} {"train_loss": -5.878448009490967, "global_step": 73145, "epoch": 1741} {"train_loss": -5.991953372955322, "global_step": 73146, "epoch": 1741} {"train_loss": -6.008976936340332, "global_step": 73147, "epoch": 1741} {"train_loss": -6.002171516418457, "global_step": 73148, "epoch": 1741} {"train_loss": -5.934342384338379, "global_step": 73149, "epoch": 1741} {"train_loss": -5.819591045379639, "global_step": 73150, "epoch": 1741} {"train_loss": -5.966529369354248, "global_step": 73151, "epoch": 1741} {"train_loss": -6.004409313201904, "global_step": 73152, "epoch": 1741} {"train_loss": -6.024053573608398, "global_step": 73153, "epoch": 1741} {"train_loss": -5.970075607299805, "global_step": 73154, "epoch": 1741} {"train_loss": -5.981112480163574, "global_step": 73155, "epoch": 1741} {"train_loss": -5.9894537925720215, "global_step": 73156, "epoch": 1741} {"train_loss": -6.001265525817871, "global_step": 73157, "epoch": 1741} {"train_loss": -5.907246112823486, "global_step": 73158, "epoch": 1741} {"train_loss": -6.062607288360596, "global_step": 73159, "epoch": 1741} {"train_loss": -6.007948875427246, "global_step": 73160, "epoch": 1741} {"train_loss": -6.0145769119262695, "global_step": 73161, "epoch": 1741} {"train_loss": -6.094564437866211, "global_step": 73162, "epoch": 1741} {"train_loss": -6.017679623195103, "global_step": 73163, "epoch": 1741, "val_loss": 74737.03125} {"train_loss": -6.050629615783691, "global_step": 73164, "epoch": 1742} {"train_loss": -6.035736083984375, "global_step": 73165, "epoch": 1742} {"train_loss": -5.953915596008301, "global_step": 73166, "epoch": 1742} {"train_loss": -6.0563554763793945, "global_step": 73167, "epoch": 1742} {"train_loss": -6.041833877563477, "global_step": 73168, "epoch": 1742} {"train_loss": -5.988704681396484, "global_step": 73169, "epoch": 1742} {"train_loss": -5.989774703979492, "global_step": 73170, "epoch": 1742} {"train_loss": -5.867602348327637, "global_step": 73171, "epoch": 1742} {"train_loss": -6.0775837898254395, "global_step": 73172, "epoch": 1742} {"train_loss": -6.059895992279053, "global_step": 73173, "epoch": 1742} {"train_loss": -6.022939205169678, "global_step": 73174, "epoch": 1742} {"train_loss": -6.061061859130859, "global_step": 73175, "epoch": 1742} {"train_loss": -6.142444133758545, "global_step": 73176, "epoch": 1742} {"train_loss": -6.059958457946777, "global_step": 73177, "epoch": 1742} {"train_loss": -5.945523262023926, "global_step": 73178, "epoch": 1742} {"train_loss": -6.070369243621826, "global_step": 73179, "epoch": 1742} {"train_loss": -6.144148349761963, "global_step": 73180, "epoch": 1742} {"train_loss": -6.111034393310547, "global_step": 73181, "epoch": 1742} {"train_loss": -6.05849552154541, "global_step": 73182, "epoch": 1742} {"train_loss": -6.145985126495361, "global_step": 73183, "epoch": 1742} {"train_loss": -6.143091201782227, "global_step": 73184, "epoch": 1742} {"train_loss": -6.092153549194336, "global_step": 73185, "epoch": 1742} {"train_loss": -6.111200332641602, "global_step": 73186, "epoch": 1742} {"train_loss": -6.055224418640137, "global_step": 73187, "epoch": 1742} {"train_loss": -5.869456768035889, "global_step": 73188, "epoch": 1742} {"train_loss": -6.0399556159973145, "global_step": 73189, "epoch": 1742} {"train_loss": -6.0962066650390625, "global_step": 73190, "epoch": 1742} {"train_loss": -6.147021293640137, "global_step": 73191, "epoch": 1742} {"train_loss": -6.03253173828125, "global_step": 73192, "epoch": 1742} {"train_loss": -6.164940357208252, "global_step": 73193, "epoch": 1742} {"train_loss": -6.110931873321533, "global_step": 73194, "epoch": 1742} {"train_loss": -6.045597076416016, "global_step": 73195, "epoch": 1742} {"train_loss": -6.199069499969482, "global_step": 73196, "epoch": 1742} {"train_loss": -6.057717323303223, "global_step": 73197, "epoch": 1742} {"train_loss": -6.056404113769531, "global_step": 73198, "epoch": 1742} {"train_loss": -6.132023811340332, "global_step": 73199, "epoch": 1742} {"train_loss": -5.946620941162109, "global_step": 73200, "epoch": 1742} {"train_loss": -5.953313827514648, "global_step": 73201, "epoch": 1742} {"train_loss": -5.955409526824951, "global_step": 73202, "epoch": 1742} {"train_loss": -5.927395343780518, "global_step": 73203, "epoch": 1742} {"train_loss": -5.982231140136719, "global_step": 73204, "epoch": 1742} {"train_loss": -6.0460366521562845, "global_step": 73205, "epoch": 1742, "val_loss": 75017.0078125} {"train_loss": -6.017545700073242, "global_step": 73206, "epoch": 1743} {"train_loss": -6.057903289794922, "global_step": 73207, "epoch": 1743} {"train_loss": -6.15540885925293, "global_step": 73208, "epoch": 1743} {"train_loss": -6.000075340270996, "global_step": 73209, "epoch": 1743} {"train_loss": -6.105496883392334, "global_step": 73210, "epoch": 1743} {"train_loss": -6.093961715698242, "global_step": 73211, "epoch": 1743} {"train_loss": -5.936786651611328, "global_step": 73212, "epoch": 1743} {"train_loss": -6.100513458251953, "global_step": 73213, "epoch": 1743} {"train_loss": -6.0303239822387695, "global_step": 73214, "epoch": 1743} {"train_loss": -6.044592380523682, "global_step": 73215, "epoch": 1743} {"train_loss": -6.022554397583008, "global_step": 73216, "epoch": 1743} {"train_loss": -6.001760005950928, "global_step": 73217, "epoch": 1743} {"train_loss": -6.048306941986084, "global_step": 73218, "epoch": 1743} {"train_loss": -5.994766712188721, "global_step": 73219, "epoch": 1743} {"train_loss": -6.010237693786621, "global_step": 73220, "epoch": 1743} {"train_loss": -6.066494941711426, "global_step": 73221, "epoch": 1743} {"train_loss": -6.012804985046387, "global_step": 73222, "epoch": 1743} {"train_loss": -6.0553083419799805, "global_step": 73223, "epoch": 1743} {"train_loss": -6.000726699829102, "global_step": 73224, "epoch": 1743} {"train_loss": -6.130763053894043, "global_step": 73225, "epoch": 1743} {"train_loss": -6.007691383361816, "global_step": 73226, "epoch": 1743} {"train_loss": -6.14530086517334, "global_step": 73227, "epoch": 1743} {"train_loss": -6.074557304382324, "global_step": 73228, "epoch": 1743} {"train_loss": -6.141237258911133, "global_step": 73229, "epoch": 1743} {"train_loss": -5.9194841384887695, "global_step": 73230, "epoch": 1743} {"train_loss": -5.996120929718018, "global_step": 73231, "epoch": 1743} {"train_loss": -6.0194244384765625, "global_step": 73232, "epoch": 1743} {"train_loss": -6.075384140014648, "global_step": 73233, "epoch": 1743} {"train_loss": -6.09329891204834, "global_step": 73234, "epoch": 1743} {"train_loss": -5.915703773498535, "global_step": 73235, "epoch": 1743} {"train_loss": -5.9959821701049805, "global_step": 73236, "epoch": 1743} {"train_loss": -6.059381008148193, "global_step": 73237, "epoch": 1743} {"train_loss": -5.819317817687988, "global_step": 73238, "epoch": 1743} {"train_loss": -5.986175537109375, "global_step": 73239, "epoch": 1743} {"train_loss": -6.189797401428223, "global_step": 73240, "epoch": 1743} {"train_loss": -6.103428840637207, "global_step": 73241, "epoch": 1743} {"train_loss": -6.079754829406738, "global_step": 73242, "epoch": 1743} {"train_loss": -5.907436370849609, "global_step": 73243, "epoch": 1743} {"train_loss": -5.9023637771606445, "global_step": 73244, "epoch": 1743} {"train_loss": -6.0917768478393555, "global_step": 73245, "epoch": 1743} {"train_loss": -6.040597438812256, "global_step": 73246, "epoch": 1743} {"train_loss": -6.03800614674886, "global_step": 73247, "epoch": 1743, "val_loss": 74760.3046875} {"train_loss": -6.082195281982422, "global_step": 73248, "epoch": 1744} {"train_loss": -5.949960708618164, "global_step": 73249, "epoch": 1744} {"train_loss": -6.081056594848633, "global_step": 73250, "epoch": 1744} {"train_loss": -6.071170806884766, "global_step": 73251, "epoch": 1744} {"train_loss": -6.127471923828125, "global_step": 73252, "epoch": 1744} {"train_loss": -6.2092132568359375, "global_step": 73253, "epoch": 1744} {"train_loss": -6.139090538024902, "global_step": 73254, "epoch": 1744} {"train_loss": -6.168991565704346, "global_step": 73255, "epoch": 1744} {"train_loss": -6.091171741485596, "global_step": 73256, "epoch": 1744} {"train_loss": -5.980120658874512, "global_step": 73257, "epoch": 1744} {"train_loss": -6.029229164123535, "global_step": 73258, "epoch": 1744} {"train_loss": -6.013757705688477, "global_step": 73259, "epoch": 1744} {"train_loss": -6.018170356750488, "global_step": 73260, "epoch": 1744} {"train_loss": -5.98631477355957, "global_step": 73261, "epoch": 1744} {"train_loss": -5.996217727661133, "global_step": 73262, "epoch": 1744} {"train_loss": -6.081083297729492, "global_step": 73263, "epoch": 1744} {"train_loss": -5.966686248779297, "global_step": 73264, "epoch": 1744} {"train_loss": -6.037518501281738, "global_step": 73265, "epoch": 1744} {"train_loss": -5.945954322814941, "global_step": 73266, "epoch": 1744} {"train_loss": -6.037853240966797, "global_step": 73267, "epoch": 1744} {"train_loss": -5.99918270111084, "global_step": 73268, "epoch": 1744} {"train_loss": -6.071219444274902, "global_step": 73269, "epoch": 1744} {"train_loss": -6.001058578491211, "global_step": 73270, "epoch": 1744} {"train_loss": -6.0948967933654785, "global_step": 73271, "epoch": 1744} {"train_loss": -6.032613754272461, "global_step": 73272, "epoch": 1744} {"train_loss": -5.9163432121276855, "global_step": 73273, "epoch": 1744} {"train_loss": -5.991318225860596, "global_step": 73274, "epoch": 1744} {"train_loss": -6.042356491088867, "global_step": 73275, "epoch": 1744} {"train_loss": -5.992075443267822, "global_step": 73276, "epoch": 1744} {"train_loss": -6.081766605377197, "global_step": 73277, "epoch": 1744} {"train_loss": -6.01630973815918, "global_step": 73278, "epoch": 1744} {"train_loss": -6.051512718200684, "global_step": 73279, "epoch": 1744} {"train_loss": -5.993913650512695, "global_step": 73280, "epoch": 1744} {"train_loss": -6.066364288330078, "global_step": 73281, "epoch": 1744} {"train_loss": -6.195448875427246, "global_step": 73282, "epoch": 1744} {"train_loss": -6.069876670837402, "global_step": 73283, "epoch": 1744} {"train_loss": -6.10835599899292, "global_step": 73284, "epoch": 1744} {"train_loss": -5.993882179260254, "global_step": 73285, "epoch": 1744} {"train_loss": -6.144054889678955, "global_step": 73286, "epoch": 1744} {"train_loss": -6.154999732971191, "global_step": 73287, "epoch": 1744} {"train_loss": -6.090874195098877, "global_step": 73288, "epoch": 1744} {"train_loss": -6.0506190458933515, "global_step": 73289, "epoch": 1744, "val_loss": 75134.2890625} {"train_loss": -6.067295551300049, "global_step": 73290, "epoch": 1745} {"train_loss": -6.082993507385254, "global_step": 73291, "epoch": 1745} {"train_loss": -6.068535804748535, "global_step": 73292, "epoch": 1745} {"train_loss": -5.995409965515137, "global_step": 73293, "epoch": 1745} {"train_loss": -6.028002738952637, "global_step": 73294, "epoch": 1745} {"train_loss": -6.122721195220947, "global_step": 73295, "epoch": 1745} {"train_loss": -6.0849928855896, "global_step": 73296, "epoch": 1745} {"train_loss": -6.01336669921875, "global_step": 73297, "epoch": 1745} {"train_loss": -6.003176689147949, "global_step": 73298, "epoch": 1745} {"train_loss": -6.04646110534668, "global_step": 73299, "epoch": 1745} {"train_loss": -6.077947616577148, "global_step": 73300, "epoch": 1745} {"train_loss": -6.04025936126709, "global_step": 73301, "epoch": 1745} {"train_loss": -5.905776023864746, "global_step": 73302, "epoch": 1745} {"train_loss": -6.0756425857543945, "global_step": 73303, "epoch": 1745} {"train_loss": -6.08013916015625, "global_step": 73304, "epoch": 1745} {"train_loss": -5.937506675720215, "global_step": 73305, "epoch": 1745} {"train_loss": -5.981302261352539, "global_step": 73306, "epoch": 1745} {"train_loss": -6.030060291290283, "global_step": 73307, "epoch": 1745} {"train_loss": -6.106040954589844, "global_step": 73308, "epoch": 1745} {"train_loss": -6.056430816650391, "global_step": 73309, "epoch": 1745} {"train_loss": -6.087377071380615, "global_step": 73310, "epoch": 1745} {"train_loss": -6.075138092041016, "global_step": 73311, "epoch": 1745} {"train_loss": -6.146504878997803, "global_step": 73312, "epoch": 1745} {"train_loss": -6.177391052246094, "global_step": 73313, "epoch": 1745} {"train_loss": -6.058750152587891, "global_step": 73314, "epoch": 1745} {"train_loss": -5.99172306060791, "global_step": 73315, "epoch": 1745} {"train_loss": -6.018978118896484, "global_step": 73316, "epoch": 1745} {"train_loss": -5.986915588378906, "global_step": 73317, "epoch": 1745} {"train_loss": -6.005151748657227, "global_step": 73318, "epoch": 1745} {"train_loss": -6.149934768676758, "global_step": 73319, "epoch": 1745} {"train_loss": -6.185510635375977, "global_step": 73320, "epoch": 1745} {"train_loss": -5.985970497131348, "global_step": 73321, "epoch": 1745} {"train_loss": -6.130583763122559, "global_step": 73322, "epoch": 1745} {"train_loss": -6.08564567565918, "global_step": 73323, "epoch": 1745} {"train_loss": -6.177329063415527, "global_step": 73324, "epoch": 1745} {"train_loss": -6.026286602020264, "global_step": 73325, "epoch": 1745} {"train_loss": -6.131440162658691, "global_step": 73326, "epoch": 1745} {"train_loss": -6.055079460144043, "global_step": 73327, "epoch": 1745} {"train_loss": -6.076720714569092, "global_step": 73328, "epoch": 1745} {"train_loss": -6.04814338684082, "global_step": 73329, "epoch": 1745} {"train_loss": -5.9831647872924805, "global_step": 73330, "epoch": 1745} {"train_loss": -6.057580402919224, "global_step": 73331, "epoch": 1745, "val_loss": 74662.5078125} {"train_loss": -6.080476760864258, "global_step": 73332, "epoch": 1746} {"train_loss": -6.036195755004883, "global_step": 73333, "epoch": 1746} {"train_loss": -6.067113399505615, "global_step": 73334, "epoch": 1746} {"train_loss": -6.063477516174316, "global_step": 73335, "epoch": 1746} {"train_loss": -6.032162666320801, "global_step": 73336, "epoch": 1746} {"train_loss": -5.99467658996582, "global_step": 73337, "epoch": 1746} {"train_loss": -6.037201881408691, "global_step": 73338, "epoch": 1746} {"train_loss": -6.053845405578613, "global_step": 73339, "epoch": 1746} {"train_loss": -5.971695423126221, "global_step": 73340, "epoch": 1746} {"train_loss": -6.109226703643799, "global_step": 73341, "epoch": 1746} {"train_loss": -5.861639022827148, "global_step": 73342, "epoch": 1746} {"train_loss": -6.03587007522583, "global_step": 73343, "epoch": 1746} {"train_loss": -5.887759685516357, "global_step": 73344, "epoch": 1746} {"train_loss": -5.918767929077148, "global_step": 73345, "epoch": 1746} {"train_loss": -6.096645355224609, "global_step": 73346, "epoch": 1746} {"train_loss": -5.953257083892822, "global_step": 73347, "epoch": 1746} {"train_loss": -6.016278266906738, "global_step": 73348, "epoch": 1746} {"train_loss": -5.799176216125488, "global_step": 73349, "epoch": 1746} {"train_loss": -5.898734092712402, "global_step": 73350, "epoch": 1746} {"train_loss": -5.971148490905762, "global_step": 73351, "epoch": 1746} {"train_loss": -6.004490852355957, "global_step": 73352, "epoch": 1746} {"train_loss": -6.050525665283203, "global_step": 73353, "epoch": 1746} {"train_loss": -5.993095874786377, "global_step": 73354, "epoch": 1746} {"train_loss": -6.082782745361328, "global_step": 73355, "epoch": 1746} {"train_loss": -6.014399528503418, "global_step": 73356, "epoch": 1746} {"train_loss": -6.011545658111572, "global_step": 73357, "epoch": 1746} {"train_loss": -6.010351181030273, "global_step": 73358, "epoch": 1746} {"train_loss": -6.177077293395996, "global_step": 73359, "epoch": 1746} {"train_loss": -6.010345935821533, "global_step": 73360, "epoch": 1746} {"train_loss": -6.009504318237305, "global_step": 73361, "epoch": 1746} {"train_loss": -6.012862205505371, "global_step": 73362, "epoch": 1746} {"train_loss": -6.06687593460083, "global_step": 73363, "epoch": 1746} {"train_loss": -6.090706825256348, "global_step": 73364, "epoch": 1746} {"train_loss": -6.024416446685791, "global_step": 73365, "epoch": 1746} {"train_loss": -6.113149642944336, "global_step": 73366, "epoch": 1746} {"train_loss": -6.059304237365723, "global_step": 73367, "epoch": 1746} {"train_loss": -6.168902397155762, "global_step": 73368, "epoch": 1746} {"train_loss": -6.100153923034668, "global_step": 73369, "epoch": 1746} {"train_loss": -6.096304416656494, "global_step": 73370, "epoch": 1746} {"train_loss": -6.069400787353516, "global_step": 73371, "epoch": 1746} {"train_loss": -5.98890495300293, "global_step": 73372, "epoch": 1746} {"train_loss": -6.025292646317255, "global_step": 73373, "epoch": 1746, "val_loss": 75330.15625} {"train_loss": -6.140227317810059, "global_step": 73374, "epoch": 1747} {"train_loss": -6.1216912269592285, "global_step": 73375, "epoch": 1747} {"train_loss": -6.1744489669799805, "global_step": 73376, "epoch": 1747} {"train_loss": -6.0659990310668945, "global_step": 73377, "epoch": 1747} {"train_loss": -6.074247360229492, "global_step": 73378, "epoch": 1747} {"train_loss": -6.137349605560303, "global_step": 73379, "epoch": 1747} {"train_loss": -6.1462602615356445, "global_step": 73380, "epoch": 1747} {"train_loss": -6.057889938354492, "global_step": 73381, "epoch": 1747} {"train_loss": -6.074213027954102, "global_step": 73382, "epoch": 1747} {"train_loss": -6.057806015014648, "global_step": 73383, "epoch": 1747} {"train_loss": -6.077542781829834, "global_step": 73384, "epoch": 1747} {"train_loss": -6.134882926940918, "global_step": 73385, "epoch": 1747} {"train_loss": -6.142942905426025, "global_step": 73386, "epoch": 1747} {"train_loss": -6.046206474304199, "global_step": 73387, "epoch": 1747} {"train_loss": -6.000455856323242, "global_step": 73388, "epoch": 1747} {"train_loss": -6.120298862457275, "global_step": 73389, "epoch": 1747} {"train_loss": -6.146185874938965, "global_step": 73390, "epoch": 1747} {"train_loss": -5.987735748291016, "global_step": 73391, "epoch": 1747} {"train_loss": -6.005279541015625, "global_step": 73392, "epoch": 1747} {"train_loss": -6.066075325012207, "global_step": 73393, "epoch": 1747} {"train_loss": -6.2150559425354, "global_step": 73394, "epoch": 1747} {"train_loss": -6.060277462005615, "global_step": 73395, "epoch": 1747} {"train_loss": -6.066586494445801, "global_step": 73396, "epoch": 1747} {"train_loss": -6.138350486755371, "global_step": 73397, "epoch": 1747} {"train_loss": -6.154927730560303, "global_step": 73398, "epoch": 1747} {"train_loss": -6.070474624633789, "global_step": 73399, "epoch": 1747} {"train_loss": -6.025945663452148, "global_step": 73400, "epoch": 1747} {"train_loss": -6.165716171264648, "global_step": 73401, "epoch": 1747} {"train_loss": -6.069314002990723, "global_step": 73402, "epoch": 1747} {"train_loss": -6.003625869750977, "global_step": 73403, "epoch": 1747} {"train_loss": -6.0380859375, "global_step": 73404, "epoch": 1747} {"train_loss": -5.963840961456299, "global_step": 73405, "epoch": 1747} {"train_loss": -6.045653820037842, "global_step": 73406, "epoch": 1747} {"train_loss": -5.911314010620117, "global_step": 73407, "epoch": 1747} {"train_loss": -5.906056880950928, "global_step": 73408, "epoch": 1747} {"train_loss": -6.020538806915283, "global_step": 73409, "epoch": 1747} {"train_loss": -6.140293121337891, "global_step": 73410, "epoch": 1747} {"train_loss": -6.090646743774414, "global_step": 73411, "epoch": 1747} {"train_loss": -5.99064826965332, "global_step": 73412, "epoch": 1747} {"train_loss": -6.117164611816406, "global_step": 73413, "epoch": 1747} {"train_loss": -5.999667644500732, "global_step": 73414, "epoch": 1747} {"train_loss": -6.070442154293969, "global_step": 73415, "epoch": 1747, "val_loss": 75126.8203125} {"train_loss": -6.086565017700195, "global_step": 73416, "epoch": 1748} {"train_loss": -6.041666030883789, "global_step": 73417, "epoch": 1748} {"train_loss": -6.052515506744385, "global_step": 73418, "epoch": 1748} {"train_loss": -5.930994033813477, "global_step": 73419, "epoch": 1748} {"train_loss": -6.087811470031738, "global_step": 73420, "epoch": 1748} {"train_loss": -5.958247184753418, "global_step": 73421, "epoch": 1748} {"train_loss": -5.989135265350342, "global_step": 73422, "epoch": 1748} {"train_loss": -5.971973419189453, "global_step": 73423, "epoch": 1748} {"train_loss": -6.148829460144043, "global_step": 73424, "epoch": 1748} {"train_loss": -5.856416702270508, "global_step": 73425, "epoch": 1748} {"train_loss": -6.101236343383789, "global_step": 73426, "epoch": 1748} {"train_loss": -6.032437801361084, "global_step": 73427, "epoch": 1748} {"train_loss": -5.95660400390625, "global_step": 73428, "epoch": 1748} {"train_loss": -6.035845756530762, "global_step": 73429, "epoch": 1748} {"train_loss": -6.108558654785156, "global_step": 73430, "epoch": 1748} {"train_loss": -5.981313705444336, "global_step": 73431, "epoch": 1748} {"train_loss": -6.095393657684326, "global_step": 73432, "epoch": 1748} {"train_loss": -5.99385404586792, "global_step": 73433, "epoch": 1748} {"train_loss": -6.037007808685303, "global_step": 73434, "epoch": 1748} {"train_loss": -6.054269790649414, "global_step": 73435, "epoch": 1748} {"train_loss": -6.0450286865234375, "global_step": 73436, "epoch": 1748} {"train_loss": -6.067592144012451, "global_step": 73437, "epoch": 1748} {"train_loss": -5.958351135253906, "global_step": 73438, "epoch": 1748} {"train_loss": -6.136917591094971, "global_step": 73439, "epoch": 1748} {"train_loss": -5.993653297424316, "global_step": 73440, "epoch": 1748} {"train_loss": -6.030063152313232, "global_step": 73441, "epoch": 1748} {"train_loss": -6.169140338897705, "global_step": 73442, "epoch": 1748} {"train_loss": -6.077797889709473, "global_step": 73443, "epoch": 1748} {"train_loss": -6.020058631896973, "global_step": 73444, "epoch": 1748} {"train_loss": -6.05930233001709, "global_step": 73445, "epoch": 1748} {"train_loss": -6.057952880859375, "global_step": 73446, "epoch": 1748} {"train_loss": -6.109421253204346, "global_step": 73447, "epoch": 1748} {"train_loss": -6.034076690673828, "global_step": 73448, "epoch": 1748} {"train_loss": -6.130536079406738, "global_step": 73449, "epoch": 1748} {"train_loss": -6.184049606323242, "global_step": 73450, "epoch": 1748} {"train_loss": -6.113868713378906, "global_step": 73451, "epoch": 1748} {"train_loss": -6.152942657470703, "global_step": 73452, "epoch": 1748} {"train_loss": -6.236800670623779, "global_step": 73453, "epoch": 1748} {"train_loss": -6.16436767578125, "global_step": 73454, "epoch": 1748} {"train_loss": -6.00615119934082, "global_step": 73455, "epoch": 1748} {"train_loss": -6.059295177459717, "global_step": 73456, "epoch": 1748} {"train_loss": -6.055301484607515, "global_step": 73457, "epoch": 1748, "val_loss": 75018.140625} {"train_loss": -5.956846714019775, "global_step": 73458, "epoch": 1749} {"train_loss": -6.144953727722168, "global_step": 73459, "epoch": 1749} {"train_loss": -5.936514854431152, "global_step": 73460, "epoch": 1749} {"train_loss": -6.060373306274414, "global_step": 73461, "epoch": 1749} {"train_loss": -6.0908002853393555, "global_step": 73462, "epoch": 1749} {"train_loss": -5.9163899421691895, "global_step": 73463, "epoch": 1749} {"train_loss": -5.994792461395264, "global_step": 73464, "epoch": 1749} {"train_loss": -6.026109218597412, "global_step": 73465, "epoch": 1749} {"train_loss": -5.906215667724609, "global_step": 73466, "epoch": 1749} {"train_loss": -6.013355255126953, "global_step": 73467, "epoch": 1749} {"train_loss": -5.996598720550537, "global_step": 73468, "epoch": 1749} {"train_loss": -5.984355926513672, "global_step": 73469, "epoch": 1749} {"train_loss": -6.067776679992676, "global_step": 73470, "epoch": 1749} {"train_loss": -5.933226585388184, "global_step": 73471, "epoch": 1749} {"train_loss": -5.99212646484375, "global_step": 73472, "epoch": 1749} {"train_loss": -6.036099910736084, "global_step": 73473, "epoch": 1749} {"train_loss": -5.975688457489014, "global_step": 73474, "epoch": 1749} {"train_loss": -5.968059539794922, "global_step": 73475, "epoch": 1749} {"train_loss": -5.946329116821289, "global_step": 73476, "epoch": 1749} {"train_loss": -5.920535564422607, "global_step": 73477, "epoch": 1749} {"train_loss": -6.066086769104004, "global_step": 73478, "epoch": 1749} {"train_loss": -5.94585657119751, "global_step": 73479, "epoch": 1749} {"train_loss": -6.132112503051758, "global_step": 73480, "epoch": 1749} {"train_loss": -6.031378269195557, "global_step": 73481, "epoch": 1749} {"train_loss": -5.991684913635254, "global_step": 73482, "epoch": 1749} {"train_loss": -6.127488136291504, "global_step": 73483, "epoch": 1749} {"train_loss": -6.127288341522217, "global_step": 73484, "epoch": 1749} {"train_loss": -6.089269161224365, "global_step": 73485, "epoch": 1749} {"train_loss": -6.217694282531738, "global_step": 73486, "epoch": 1749} {"train_loss": -6.069652557373047, "global_step": 73487, "epoch": 1749} {"train_loss": -6.187787055969238, "global_step": 73488, "epoch": 1749} {"train_loss": -6.169046401977539, "global_step": 73489, "epoch": 1749} {"train_loss": -5.968543529510498, "global_step": 73490, "epoch": 1749} {"train_loss": -6.103248596191406, "global_step": 73491, "epoch": 1749} {"train_loss": -6.012214183807373, "global_step": 73492, "epoch": 1749} {"train_loss": -5.947587966918945, "global_step": 73493, "epoch": 1749} {"train_loss": -6.115194797515869, "global_step": 73494, "epoch": 1749} {"train_loss": -5.98638916015625, "global_step": 73495, "epoch": 1749} {"train_loss": -5.9946489334106445, "global_step": 73496, "epoch": 1749} {"train_loss": -6.250837326049805, "global_step": 73497, "epoch": 1749} {"train_loss": -6.018168926239014, "global_step": 73498, "epoch": 1749} {"train_loss": -6.035334178379604, "global_step": 73499, "epoch": 1749, "val_loss": 74848.515625} {"train_loss": -6.092846393585205, "global_step": 73500, "epoch": 1750} {"train_loss": -6.027287483215332, "global_step": 73501, "epoch": 1750} {"train_loss": -6.11759090423584, "global_step": 73502, "epoch": 1750} {"train_loss": -6.065394401550293, "global_step": 73503, "epoch": 1750} {"train_loss": -6.125812530517578, "global_step": 73504, "epoch": 1750} {"train_loss": -6.082885265350342, "global_step": 73505, "epoch": 1750} {"train_loss": -6.06056022644043, "global_step": 73506, "epoch": 1750} {"train_loss": -6.062453269958496, "global_step": 73507, "epoch": 1750} {"train_loss": -6.168153762817383, "global_step": 73508, "epoch": 1750} {"train_loss": -6.192991256713867, "global_step": 73509, "epoch": 1750} {"train_loss": -6.069019794464111, "global_step": 73510, "epoch": 1750} {"train_loss": -6.022984981536865, "global_step": 73511, "epoch": 1750} {"train_loss": -6.008231163024902, "global_step": 73512, "epoch": 1750} {"train_loss": -6.042919158935547, "global_step": 73513, "epoch": 1750} {"train_loss": -6.05963134765625, "global_step": 73514, "epoch": 1750} {"train_loss": -6.098655700683594, "global_step": 73515, "epoch": 1750} {"train_loss": -6.055834770202637, "global_step": 73516, "epoch": 1750} {"train_loss": -5.985950469970703, "global_step": 73517, "epoch": 1750} {"train_loss": -5.937530994415283, "global_step": 73518, "epoch": 1750} {"train_loss": -6.082365989685059, "global_step": 73519, "epoch": 1750} {"train_loss": -5.884378910064697, "global_step": 73520, "epoch": 1750} {"train_loss": -6.044910907745361, "global_step": 73521, "epoch": 1750} {"train_loss": -6.08583927154541, "global_step": 73522, "epoch": 1750} {"train_loss": -6.032574653625488, "global_step": 73523, "epoch": 1750} {"train_loss": -6.093940734863281, "global_step": 73524, "epoch": 1750} {"train_loss": -6.015458106994629, "global_step": 73525, "epoch": 1750} {"train_loss": -6.114796161651611, "global_step": 73526, "epoch": 1750} {"train_loss": -6.020014762878418, "global_step": 73527, "epoch": 1750} {"train_loss": -6.083629608154297, "global_step": 73528, "epoch": 1750} {"train_loss": -5.97028923034668, "global_step": 73529, "epoch": 1750} {"train_loss": -6.0978827476501465, "global_step": 73530, "epoch": 1750} {"train_loss": -6.024344444274902, "global_step": 73531, "epoch": 1750} {"train_loss": -6.1329498291015625, "global_step": 73532, "epoch": 1750} {"train_loss": -6.081541538238525, "global_step": 73533, "epoch": 1750} {"train_loss": -6.087190628051758, "global_step": 73534, "epoch": 1750} {"train_loss": -6.037315368652344, "global_step": 73535, "epoch": 1750} {"train_loss": -6.021673202514648, "global_step": 73536, "epoch": 1750} {"train_loss": -6.0427985191345215, "global_step": 73537, "epoch": 1750} {"train_loss": -6.057251453399658, "global_step": 73538, "epoch": 1750} {"train_loss": -6.025391578674316, "global_step": 73539, "epoch": 1750} {"train_loss": -6.127311706542969, "global_step": 73540, "epoch": 1750} {"train_loss": -6.0619806335085915, "global_step": 73541, "epoch": 1750, "train/sim_max_reward_0": 0.42105493921352194, "train/sim_max_reward_1": 0.8562293564181156, "train/sim_max_reward_2": 0.6400144683408471, "train/sim_max_reward_3": 0.16534733746693292, "train/sim_max_reward_4": 0.8895383247080343, "train/sim_max_reward_5": 0.8895372992723842, "test/sim_max_reward_4500000": 0.7828618055833798, "test/sim_max_reward_4500001": 0.9370808040044569, "test/sim_max_reward_4500002": 0.9397197270958748, "test/sim_max_reward_4500003": 0.7625604366144498, "test/sim_max_reward_4500004": 0.7964293315790725, "test/sim_max_reward_4500005": 0.4173281341443589, "test/sim_max_reward_4500006": 0.9411068124550028, "test/sim_max_reward_4500007": 0.4181248081366393, "test/sim_max_reward_4500008": 0.30712925833881866, "test/sim_max_reward_4500009": 0.8457338330166022, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.3913012307329689, "test/sim_max_reward_4500012": 0.9642302365629638, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.35907745432252236, "test/sim_max_reward_4500015": 0.7075674685274242, "test/sim_max_reward_4500016": 0.9779062241029147, "test/sim_max_reward_4500017": 0.15801533845190155, "test/sim_max_reward_4500018": 0.061458535893920696, "test/sim_max_reward_4500019": 0.8603433844516207, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.7956753495297718, "test/sim_max_reward_4500023": 0.8806247810918744, "test/sim_max_reward_4500024": 0.9452334863167399, "test/sim_max_reward_4500025": 0.5605043795957984, "test/sim_max_reward_4500026": 0.8430551108625103, "test/sim_max_reward_4500027": 0.5577703183353871, "test/sim_max_reward_4500028": 0.21027889726038357, "test/sim_max_reward_4500029": 0.1982643678411678, "test/sim_max_reward_4500030": 0.971413715971315, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.42152155411762104, "test/sim_max_reward_4500033": 0.03514128038367187, "test/sim_max_reward_4500034": 0.7481333285310723, "test/sim_max_reward_4500035": 0.9491595244810483, "test/sim_max_reward_4500036": 0.36815382181296796, "test/sim_max_reward_4500037": 0.9696313741934238, "test/sim_max_reward_4500038": 0.2949983371752231, "test/sim_max_reward_4500039": 0.9383835648905502, "test/sim_max_reward_4500040": 0.9799786938973405, "test/sim_max_reward_4500041": 0.9203049419002765, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.18665880458868578, "test/sim_max_reward_4500044": 0.14666291236867998, "test/sim_max_reward_4500045": 0.834466373574181, "test/sim_max_reward_4500046": 0.6683599454945033, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6436202875699726, "test/mean_score": 0.5814957867347835, "val_loss": 74927.1015625} {"train_loss": -6.07310676574707, "global_step": 73542, "epoch": 1751} {"train_loss": -6.177906513214111, "global_step": 73543, "epoch": 1751} {"train_loss": -5.99332857131958, "global_step": 73544, "epoch": 1751} {"train_loss": -6.169570446014404, "global_step": 73545, "epoch": 1751} {"train_loss": -6.14996337890625, "global_step": 73546, "epoch": 1751} {"train_loss": -6.053257942199707, "global_step": 73547, "epoch": 1751} {"train_loss": -6.011414527893066, "global_step": 73548, "epoch": 1751} {"train_loss": -6.0719075202941895, "global_step": 73549, "epoch": 1751} {"train_loss": -6.172272682189941, "global_step": 73550, "epoch": 1751} {"train_loss": -6.229666709899902, "global_step": 73551, "epoch": 1751} {"train_loss": -6.100988388061523, "global_step": 73552, "epoch": 1751} {"train_loss": -6.208479881286621, "global_step": 73553, "epoch": 1751} {"train_loss": -6.096460342407227, "global_step": 73554, "epoch": 1751} {"train_loss": -6.137770652770996, "global_step": 73555, "epoch": 1751} {"train_loss": -6.009738445281982, "global_step": 73556, "epoch": 1751} {"train_loss": -6.171717166900635, "global_step": 73557, "epoch": 1751} {"train_loss": -6.153208255767822, "global_step": 73558, "epoch": 1751} {"train_loss": -6.237771987915039, "global_step": 73559, "epoch": 1751} {"train_loss": -6.19144868850708, "global_step": 73560, "epoch": 1751} {"train_loss": -6.138500690460205, "global_step": 73561, "epoch": 1751} {"train_loss": -6.112149238586426, "global_step": 73562, "epoch": 1751} {"train_loss": -6.0799384117126465, "global_step": 73563, "epoch": 1751} {"train_loss": -6.131113529205322, "global_step": 73564, "epoch": 1751} {"train_loss": -6.193143844604492, "global_step": 73565, "epoch": 1751} {"train_loss": -6.0553083419799805, "global_step": 73566, "epoch": 1751} {"train_loss": -6.1003804206848145, "global_step": 73567, "epoch": 1751} {"train_loss": -6.135849952697754, "global_step": 73568, "epoch": 1751} {"train_loss": -6.082276821136475, "global_step": 73569, "epoch": 1751} {"train_loss": -6.13326358795166, "global_step": 73570, "epoch": 1751} {"train_loss": -6.041998863220215, "global_step": 73571, "epoch": 1751} {"train_loss": -5.8989057540893555, "global_step": 73572, "epoch": 1751} {"train_loss": -5.986370086669922, "global_step": 73573, "epoch": 1751} {"train_loss": -6.058690071105957, "global_step": 73574, "epoch": 1751} {"train_loss": -5.906909942626953, "global_step": 73575, "epoch": 1751} {"train_loss": -5.9449462890625, "global_step": 73576, "epoch": 1751} {"train_loss": -6.074649810791016, "global_step": 73577, "epoch": 1751} {"train_loss": -5.868445873260498, "global_step": 73578, "epoch": 1751} {"train_loss": -5.868752956390381, "global_step": 73579, "epoch": 1751} {"train_loss": -6.0381693840026855, "global_step": 73580, "epoch": 1751} {"train_loss": -5.856802940368652, "global_step": 73581, "epoch": 1751} {"train_loss": -6.010612487792969, "global_step": 73582, "epoch": 1751} {"train_loss": -6.0727775891621905, "global_step": 73583, "epoch": 1751, "val_loss": 74980.8984375} {"train_loss": -6.075015068054199, "global_step": 73584, "epoch": 1752} {"train_loss": -6.130739212036133, "global_step": 73585, "epoch": 1752} {"train_loss": -5.905255317687988, "global_step": 73586, "epoch": 1752} {"train_loss": -6.0089311599731445, "global_step": 73587, "epoch": 1752} {"train_loss": -5.924935340881348, "global_step": 73588, "epoch": 1752} {"train_loss": -6.1191277503967285, "global_step": 73589, "epoch": 1752} {"train_loss": -5.97934627532959, "global_step": 73590, "epoch": 1752} {"train_loss": -6.098235130310059, "global_step": 73591, "epoch": 1752} {"train_loss": -6.107968330383301, "global_step": 73592, "epoch": 1752} {"train_loss": -6.1041483879089355, "global_step": 73593, "epoch": 1752} {"train_loss": -5.911717891693115, "global_step": 73594, "epoch": 1752} {"train_loss": -6.0621795654296875, "global_step": 73595, "epoch": 1752} {"train_loss": -5.952479839324951, "global_step": 73596, "epoch": 1752} {"train_loss": -5.956523895263672, "global_step": 73597, "epoch": 1752} {"train_loss": -6.113346099853516, "global_step": 73598, "epoch": 1752} {"train_loss": -5.852845668792725, "global_step": 73599, "epoch": 1752} {"train_loss": -6.040766716003418, "global_step": 73600, "epoch": 1752} {"train_loss": -6.009607315063477, "global_step": 73601, "epoch": 1752} {"train_loss": -6.076336860656738, "global_step": 73602, "epoch": 1752} {"train_loss": -5.9645891189575195, "global_step": 73603, "epoch": 1752} {"train_loss": -6.0491533279418945, "global_step": 73604, "epoch": 1752} {"train_loss": -5.9596943855285645, "global_step": 73605, "epoch": 1752} {"train_loss": -5.941891670227051, "global_step": 73606, "epoch": 1752} {"train_loss": -6.09962272644043, "global_step": 73607, "epoch": 1752} {"train_loss": -6.0054473876953125, "global_step": 73608, "epoch": 1752} {"train_loss": -5.9554619789123535, "global_step": 73609, "epoch": 1752} {"train_loss": -5.987825393676758, "global_step": 73610, "epoch": 1752} {"train_loss": -6.035327911376953, "global_step": 73611, "epoch": 1752} {"train_loss": -6.001404762268066, "global_step": 73612, "epoch": 1752} {"train_loss": -5.885331153869629, "global_step": 73613, "epoch": 1752} {"train_loss": -6.111339569091797, "global_step": 73614, "epoch": 1752} {"train_loss": -5.9179277420043945, "global_step": 73615, "epoch": 1752} {"train_loss": -6.033566951751709, "global_step": 73616, "epoch": 1752} {"train_loss": -6.065969467163086, "global_step": 73617, "epoch": 1752} {"train_loss": -5.995748519897461, "global_step": 73618, "epoch": 1752} {"train_loss": -5.948144435882568, "global_step": 73619, "epoch": 1752} {"train_loss": -6.093982696533203, "global_step": 73620, "epoch": 1752} {"train_loss": -6.097334861755371, "global_step": 73621, "epoch": 1752} {"train_loss": -6.006431579589844, "global_step": 73622, "epoch": 1752} {"train_loss": -5.941738128662109, "global_step": 73623, "epoch": 1752} {"train_loss": -6.099496841430664, "global_step": 73624, "epoch": 1752} {"train_loss": -6.014660596847534, "global_step": 73625, "epoch": 1752, "val_loss": 74782.2109375} {"train_loss": -5.984849452972412, "global_step": 73626, "epoch": 1753} {"train_loss": -6.060770034790039, "global_step": 73627, "epoch": 1753} {"train_loss": -6.12357234954834, "global_step": 73628, "epoch": 1753} {"train_loss": -6.064516067504883, "global_step": 73629, "epoch": 1753} {"train_loss": -6.000771522521973, "global_step": 73630, "epoch": 1753} {"train_loss": -6.076878547668457, "global_step": 73631, "epoch": 1753} {"train_loss": -6.07197380065918, "global_step": 73632, "epoch": 1753} {"train_loss": -6.087082862854004, "global_step": 73633, "epoch": 1753} {"train_loss": -6.002985000610352, "global_step": 73634, "epoch": 1753} {"train_loss": -6.053692817687988, "global_step": 73635, "epoch": 1753} {"train_loss": -6.048503875732422, "global_step": 73636, "epoch": 1753} {"train_loss": -6.073116302490234, "global_step": 73637, "epoch": 1753} {"train_loss": -6.087228298187256, "global_step": 73638, "epoch": 1753} {"train_loss": -6.147003173828125, "global_step": 73639, "epoch": 1753} {"train_loss": -6.117720603942871, "global_step": 73640, "epoch": 1753} {"train_loss": -6.17993688583374, "global_step": 73641, "epoch": 1753} {"train_loss": -6.124391555786133, "global_step": 73642, "epoch": 1753} {"train_loss": -6.132160186767578, "global_step": 73643, "epoch": 1753} {"train_loss": -5.975482940673828, "global_step": 73644, "epoch": 1753} {"train_loss": -6.105505466461182, "global_step": 73645, "epoch": 1753} {"train_loss": -6.007805824279785, "global_step": 73646, "epoch": 1753} {"train_loss": -6.040907859802246, "global_step": 73647, "epoch": 1753} {"train_loss": -6.118975639343262, "global_step": 73648, "epoch": 1753} {"train_loss": -6.078873634338379, "global_step": 73649, "epoch": 1753} {"train_loss": -5.898846626281738, "global_step": 73650, "epoch": 1753} {"train_loss": -5.968679428100586, "global_step": 73651, "epoch": 1753} {"train_loss": -6.073956489562988, "global_step": 73652, "epoch": 1753} {"train_loss": -6.020018577575684, "global_step": 73653, "epoch": 1753} {"train_loss": -6.1049652099609375, "global_step": 73654, "epoch": 1753} {"train_loss": -6.148271560668945, "global_step": 73655, "epoch": 1753} {"train_loss": -6.0700178146362305, "global_step": 73656, "epoch": 1753} {"train_loss": -6.1028289794921875, "global_step": 73657, "epoch": 1753} {"train_loss": -5.941046714782715, "global_step": 73658, "epoch": 1753} {"train_loss": -6.179186820983887, "global_step": 73659, "epoch": 1753} {"train_loss": -6.05772590637207, "global_step": 73660, "epoch": 1753} {"train_loss": -6.064438343048096, "global_step": 73661, "epoch": 1753} {"train_loss": -5.904102325439453, "global_step": 73662, "epoch": 1753} {"train_loss": -6.015948295593262, "global_step": 73663, "epoch": 1753} {"train_loss": -5.861347198486328, "global_step": 73664, "epoch": 1753} {"train_loss": -6.073371410369873, "global_step": 73665, "epoch": 1753} {"train_loss": -6.139704704284668, "global_step": 73666, "epoch": 1753} {"train_loss": -6.058515332994007, "global_step": 73667, "epoch": 1753, "val_loss": 74865.6953125} {"train_loss": -5.960515975952148, "global_step": 73668, "epoch": 1754} {"train_loss": -5.974071025848389, "global_step": 73669, "epoch": 1754} {"train_loss": -6.213949203491211, "global_step": 73670, "epoch": 1754} {"train_loss": -6.0275750160217285, "global_step": 73671, "epoch": 1754} {"train_loss": -5.996166229248047, "global_step": 73672, "epoch": 1754} {"train_loss": -5.914511203765869, "global_step": 73673, "epoch": 1754} {"train_loss": -6.032281875610352, "global_step": 73674, "epoch": 1754} {"train_loss": -6.124996185302734, "global_step": 73675, "epoch": 1754} {"train_loss": -5.975152969360352, "global_step": 73676, "epoch": 1754} {"train_loss": -6.045706748962402, "global_step": 73677, "epoch": 1754} {"train_loss": -5.929596900939941, "global_step": 73678, "epoch": 1754} {"train_loss": -5.997900009155273, "global_step": 73679, "epoch": 1754} {"train_loss": -6.131344795227051, "global_step": 73680, "epoch": 1754} {"train_loss": -5.926137924194336, "global_step": 73681, "epoch": 1754} {"train_loss": -6.060302734375, "global_step": 73682, "epoch": 1754} {"train_loss": -6.046114921569824, "global_step": 73683, "epoch": 1754} {"train_loss": -5.991964340209961, "global_step": 73684, "epoch": 1754} {"train_loss": -6.044689178466797, "global_step": 73685, "epoch": 1754} {"train_loss": -6.053069114685059, "global_step": 73686, "epoch": 1754} {"train_loss": -6.094498634338379, "global_step": 73687, "epoch": 1754} {"train_loss": -6.112110614776611, "global_step": 73688, "epoch": 1754} {"train_loss": -5.944096565246582, "global_step": 73689, "epoch": 1754} {"train_loss": -6.044136047363281, "global_step": 73690, "epoch": 1754} {"train_loss": -6.045199394226074, "global_step": 73691, "epoch": 1754} {"train_loss": -6.103057861328125, "global_step": 73692, "epoch": 1754} {"train_loss": -6.067012786865234, "global_step": 73693, "epoch": 1754} {"train_loss": -6.094020843505859, "global_step": 73694, "epoch": 1754} {"train_loss": -6.062958717346191, "global_step": 73695, "epoch": 1754} {"train_loss": -6.1416521072387695, "global_step": 73696, "epoch": 1754} {"train_loss": -6.238925933837891, "global_step": 73697, "epoch": 1754} {"train_loss": -6.167885780334473, "global_step": 73698, "epoch": 1754} {"train_loss": -6.170260429382324, "global_step": 73699, "epoch": 1754} {"train_loss": -6.057231426239014, "global_step": 73700, "epoch": 1754} {"train_loss": -6.0023088455200195, "global_step": 73701, "epoch": 1754} {"train_loss": -6.0145039558410645, "global_step": 73702, "epoch": 1754} {"train_loss": -6.105609893798828, "global_step": 73703, "epoch": 1754} {"train_loss": -6.10544490814209, "global_step": 73704, "epoch": 1754} {"train_loss": -5.950760841369629, "global_step": 73705, "epoch": 1754} {"train_loss": -6.214272975921631, "global_step": 73706, "epoch": 1754} {"train_loss": -6.112349510192871, "global_step": 73707, "epoch": 1754} {"train_loss": -6.080246925354004, "global_step": 73708, "epoch": 1754} {"train_loss": -6.058932690393357, "global_step": 73709, "epoch": 1754, "val_loss": 75044.421875} {"train_loss": -6.0869011878967285, "global_step": 73710, "epoch": 1755} {"train_loss": -6.054008483886719, "global_step": 73711, "epoch": 1755} {"train_loss": -6.053605079650879, "global_step": 73712, "epoch": 1755} {"train_loss": -6.154252052307129, "global_step": 73713, "epoch": 1755} {"train_loss": -5.999687194824219, "global_step": 73714, "epoch": 1755} {"train_loss": -6.130809783935547, "global_step": 73715, "epoch": 1755} {"train_loss": -6.078461647033691, "global_step": 73716, "epoch": 1755} {"train_loss": -6.084463596343994, "global_step": 73717, "epoch": 1755} {"train_loss": -6.009137153625488, "global_step": 73718, "epoch": 1755} {"train_loss": -6.070103645324707, "global_step": 73719, "epoch": 1755} {"train_loss": -6.055468559265137, "global_step": 73720, "epoch": 1755} {"train_loss": -5.968116760253906, "global_step": 73721, "epoch": 1755} {"train_loss": -6.161162853240967, "global_step": 73722, "epoch": 1755} {"train_loss": -5.84335994720459, "global_step": 73723, "epoch": 1755} {"train_loss": -5.968073844909668, "global_step": 73724, "epoch": 1755} {"train_loss": -6.00483512878418, "global_step": 73725, "epoch": 1755} {"train_loss": -5.9851579666137695, "global_step": 73726, "epoch": 1755} {"train_loss": -5.938521385192871, "global_step": 73727, "epoch": 1755} {"train_loss": -5.995379447937012, "global_step": 73728, "epoch": 1755} {"train_loss": -5.994391918182373, "global_step": 73729, "epoch": 1755} {"train_loss": -6.077425003051758, "global_step": 73730, "epoch": 1755} {"train_loss": -5.990542411804199, "global_step": 73731, "epoch": 1755} {"train_loss": -5.89257287979126, "global_step": 73732, "epoch": 1755} {"train_loss": -6.0153326988220215, "global_step": 73733, "epoch": 1755} {"train_loss": -5.857715606689453, "global_step": 73734, "epoch": 1755} {"train_loss": -5.981391906738281, "global_step": 73735, "epoch": 1755} {"train_loss": -5.941356658935547, "global_step": 73736, "epoch": 1755} {"train_loss": -5.907562255859375, "global_step": 73737, "epoch": 1755} {"train_loss": -5.964780807495117, "global_step": 73738, "epoch": 1755} {"train_loss": -6.029628753662109, "global_step": 73739, "epoch": 1755} {"train_loss": -6.088743209838867, "global_step": 73740, "epoch": 1755} {"train_loss": -5.924124717712402, "global_step": 73741, "epoch": 1755} {"train_loss": -6.047383785247803, "global_step": 73742, "epoch": 1755} {"train_loss": -5.938769340515137, "global_step": 73743, "epoch": 1755} {"train_loss": -5.959319114685059, "global_step": 73744, "epoch": 1755} {"train_loss": -6.1562700271606445, "global_step": 73745, "epoch": 1755} {"train_loss": -5.9162211418151855, "global_step": 73746, "epoch": 1755} {"train_loss": -6.019038200378418, "global_step": 73747, "epoch": 1755} {"train_loss": -6.024224758148193, "global_step": 73748, "epoch": 1755} {"train_loss": -6.094078540802002, "global_step": 73749, "epoch": 1755} {"train_loss": -6.060705184936523, "global_step": 73750, "epoch": 1755} {"train_loss": -6.014344862529209, "global_step": 73751, "epoch": 1755, "val_loss": 74926.2109375} {"train_loss": -6.0973968505859375, "global_step": 73752, "epoch": 1756} {"train_loss": -5.948306083679199, "global_step": 73753, "epoch": 1756} {"train_loss": -5.918013572692871, "global_step": 73754, "epoch": 1756} {"train_loss": -6.073054313659668, "global_step": 73755, "epoch": 1756} {"train_loss": -5.902542591094971, "global_step": 73756, "epoch": 1756} {"train_loss": -6.194753646850586, "global_step": 73757, "epoch": 1756} {"train_loss": -5.978728771209717, "global_step": 73758, "epoch": 1756} {"train_loss": -6.084001064300537, "global_step": 73759, "epoch": 1756} {"train_loss": -5.832489967346191, "global_step": 73760, "epoch": 1756} {"train_loss": -6.034618377685547, "global_step": 73761, "epoch": 1756} {"train_loss": -6.110635757446289, "global_step": 73762, "epoch": 1756} {"train_loss": -6.055471420288086, "global_step": 73763, "epoch": 1756} {"train_loss": -5.986915588378906, "global_step": 73764, "epoch": 1756} {"train_loss": -6.155143737792969, "global_step": 73765, "epoch": 1756} {"train_loss": -6.099187850952148, "global_step": 73766, "epoch": 1756} {"train_loss": -6.09287166595459, "global_step": 73767, "epoch": 1756} {"train_loss": -6.070365905761719, "global_step": 73768, "epoch": 1756} {"train_loss": -6.074224948883057, "global_step": 73769, "epoch": 1756} {"train_loss": -6.127762317657471, "global_step": 73770, "epoch": 1756} {"train_loss": -6.133070945739746, "global_step": 73771, "epoch": 1756} {"train_loss": -6.063576698303223, "global_step": 73772, "epoch": 1756} {"train_loss": -6.035078048706055, "global_step": 73773, "epoch": 1756} {"train_loss": -6.077297210693359, "global_step": 73774, "epoch": 1756} {"train_loss": -6.10988187789917, "global_step": 73775, "epoch": 1756} {"train_loss": -6.149103164672852, "global_step": 73776, "epoch": 1756} {"train_loss": -6.0604472160339355, "global_step": 73777, "epoch": 1756} {"train_loss": -6.148549556732178, "global_step": 73778, "epoch": 1756} {"train_loss": -6.1717939376831055, "global_step": 73779, "epoch": 1756} {"train_loss": -6.10209846496582, "global_step": 73780, "epoch": 1756} {"train_loss": -6.121888160705566, "global_step": 73781, "epoch": 1756} {"train_loss": -6.06113862991333, "global_step": 73782, "epoch": 1756} {"train_loss": -6.0967864990234375, "global_step": 73783, "epoch": 1756} {"train_loss": -6.142425537109375, "global_step": 73784, "epoch": 1756} {"train_loss": -6.055647850036621, "global_step": 73785, "epoch": 1756} {"train_loss": -6.136839389801025, "global_step": 73786, "epoch": 1756} {"train_loss": -6.148802757263184, "global_step": 73787, "epoch": 1756} {"train_loss": -6.049938201904297, "global_step": 73788, "epoch": 1756} {"train_loss": -6.093770980834961, "global_step": 73789, "epoch": 1756} {"train_loss": -6.014060020446777, "global_step": 73790, "epoch": 1756} {"train_loss": -6.039137840270996, "global_step": 73791, "epoch": 1756} {"train_loss": -5.990131378173828, "global_step": 73792, "epoch": 1756} {"train_loss": -6.0680911881583075, "global_step": 73793, "epoch": 1756, "val_loss": 75033.9453125} {"train_loss": -6.0773210525512695, "global_step": 73794, "epoch": 1757} {"train_loss": -6.051939010620117, "global_step": 73795, "epoch": 1757} {"train_loss": -6.1233086585998535, "global_step": 73796, "epoch": 1757} {"train_loss": -6.013111114501953, "global_step": 73797, "epoch": 1757} {"train_loss": -6.083265781402588, "global_step": 73798, "epoch": 1757} {"train_loss": -6.127176761627197, "global_step": 73799, "epoch": 1757} {"train_loss": -6.030939102172852, "global_step": 73800, "epoch": 1757} {"train_loss": -6.1823320388793945, "global_step": 73801, "epoch": 1757} {"train_loss": -6.13740348815918, "global_step": 73802, "epoch": 1757} {"train_loss": -6.030017375946045, "global_step": 73803, "epoch": 1757} {"train_loss": -6.083931922912598, "global_step": 73804, "epoch": 1757} {"train_loss": -5.975778102874756, "global_step": 73805, "epoch": 1757} {"train_loss": -5.967351913452148, "global_step": 73806, "epoch": 1757} {"train_loss": -6.025737762451172, "global_step": 73807, "epoch": 1757} {"train_loss": -5.99052619934082, "global_step": 73808, "epoch": 1757} {"train_loss": -6.091795921325684, "global_step": 73809, "epoch": 1757} {"train_loss": -6.156309604644775, "global_step": 73810, "epoch": 1757} {"train_loss": -6.0993123054504395, "global_step": 73811, "epoch": 1757} {"train_loss": -6.143806457519531, "global_step": 73812, "epoch": 1757} {"train_loss": -5.997477054595947, "global_step": 73813, "epoch": 1757} {"train_loss": -6.070751667022705, "global_step": 73814, "epoch": 1757} {"train_loss": -6.013886451721191, "global_step": 73815, "epoch": 1757} {"train_loss": -6.13870906829834, "global_step": 73816, "epoch": 1757} {"train_loss": -6.000461101531982, "global_step": 73817, "epoch": 1757} {"train_loss": -6.006543159484863, "global_step": 73818, "epoch": 1757} {"train_loss": -5.820474624633789, "global_step": 73819, "epoch": 1757} {"train_loss": -5.877418041229248, "global_step": 73820, "epoch": 1757} {"train_loss": -5.905952453613281, "global_step": 73821, "epoch": 1757} {"train_loss": -5.9876203536987305, "global_step": 73822, "epoch": 1757} {"train_loss": -6.109274864196777, "global_step": 73823, "epoch": 1757} {"train_loss": -5.8986921310424805, "global_step": 73824, "epoch": 1757} {"train_loss": -5.974152565002441, "global_step": 73825, "epoch": 1757} {"train_loss": -6.011824607849121, "global_step": 73826, "epoch": 1757} {"train_loss": -5.968238830566406, "global_step": 73827, "epoch": 1757} {"train_loss": -6.02415132522583, "global_step": 73828, "epoch": 1757} {"train_loss": -6.0372700691223145, "global_step": 73829, "epoch": 1757} {"train_loss": -5.967579364776611, "global_step": 73830, "epoch": 1757} {"train_loss": -6.025048732757568, "global_step": 73831, "epoch": 1757} {"train_loss": -6.129742622375488, "global_step": 73832, "epoch": 1757} {"train_loss": -6.078508377075195, "global_step": 73833, "epoch": 1757} {"train_loss": -5.9936370849609375, "global_step": 73834, "epoch": 1757} {"train_loss": -6.033736921492077, "global_step": 73835, "epoch": 1757, "val_loss": 75086.375} {"train_loss": -6.128771781921387, "global_step": 73836, "epoch": 1758} {"train_loss": -5.987713813781738, "global_step": 73837, "epoch": 1758} {"train_loss": -6.077653884887695, "global_step": 73838, "epoch": 1758} {"train_loss": -6.01806116104126, "global_step": 73839, "epoch": 1758} {"train_loss": -5.942712783813477, "global_step": 73840, "epoch": 1758} {"train_loss": -6.136168479919434, "global_step": 73841, "epoch": 1758} {"train_loss": -5.99713134765625, "global_step": 73842, "epoch": 1758} {"train_loss": -6.106593132019043, "global_step": 73843, "epoch": 1758} {"train_loss": -6.003403663635254, "global_step": 73844, "epoch": 1758} {"train_loss": -5.944092750549316, "global_step": 73845, "epoch": 1758} {"train_loss": -5.926284313201904, "global_step": 73846, "epoch": 1758} {"train_loss": -6.041820526123047, "global_step": 73847, "epoch": 1758} {"train_loss": -5.976641654968262, "global_step": 73848, "epoch": 1758} {"train_loss": -6.100409507751465, "global_step": 73849, "epoch": 1758} {"train_loss": -6.009991645812988, "global_step": 73850, "epoch": 1758} {"train_loss": -6.101463794708252, "global_step": 73851, "epoch": 1758} {"train_loss": -6.124348163604736, "global_step": 73852, "epoch": 1758} {"train_loss": -6.017066478729248, "global_step": 73853, "epoch": 1758} {"train_loss": -6.041652679443359, "global_step": 73854, "epoch": 1758} {"train_loss": -6.066650390625, "global_step": 73855, "epoch": 1758} {"train_loss": -6.04498291015625, "global_step": 73856, "epoch": 1758} {"train_loss": -6.075072288513184, "global_step": 73857, "epoch": 1758} {"train_loss": -6.067723274230957, "global_step": 73858, "epoch": 1758} {"train_loss": -6.203734397888184, "global_step": 73859, "epoch": 1758} {"train_loss": -6.101916313171387, "global_step": 73860, "epoch": 1758} {"train_loss": -6.1348161697387695, "global_step": 73861, "epoch": 1758} {"train_loss": -6.070503234863281, "global_step": 73862, "epoch": 1758} {"train_loss": -6.070003509521484, "global_step": 73863, "epoch": 1758} {"train_loss": -6.088944911956787, "global_step": 73864, "epoch": 1758} {"train_loss": -5.913942337036133, "global_step": 73865, "epoch": 1758} {"train_loss": -6.128968238830566, "global_step": 73866, "epoch": 1758} {"train_loss": -5.975156307220459, "global_step": 73867, "epoch": 1758} {"train_loss": -6.108967304229736, "global_step": 73868, "epoch": 1758} {"train_loss": -6.0687456130981445, "global_step": 73869, "epoch": 1758} {"train_loss": -6.137625217437744, "global_step": 73870, "epoch": 1758} {"train_loss": -6.079835414886475, "global_step": 73871, "epoch": 1758} {"train_loss": -6.144140243530273, "global_step": 73872, "epoch": 1758} {"train_loss": -6.07857084274292, "global_step": 73873, "epoch": 1758} {"train_loss": -5.971996307373047, "global_step": 73874, "epoch": 1758} {"train_loss": -6.073287010192871, "global_step": 73875, "epoch": 1758} {"train_loss": -6.064016819000244, "global_step": 73876, "epoch": 1758} {"train_loss": -6.057781934738159, "global_step": 73877, "epoch": 1758, "val_loss": 74766.0078125} {"train_loss": -5.992560386657715, "global_step": 73878, "epoch": 1759} {"train_loss": -6.1595916748046875, "global_step": 73879, "epoch": 1759} {"train_loss": -6.148246765136719, "global_step": 73880, "epoch": 1759} {"train_loss": -6.18028450012207, "global_step": 73881, "epoch": 1759} {"train_loss": -6.044764041900635, "global_step": 73882, "epoch": 1759} {"train_loss": -5.992773056030273, "global_step": 73883, "epoch": 1759} {"train_loss": -6.118371963500977, "global_step": 73884, "epoch": 1759} {"train_loss": -6.178533554077148, "global_step": 73885, "epoch": 1759} {"train_loss": -6.066221237182617, "global_step": 73886, "epoch": 1759} {"train_loss": -6.189683437347412, "global_step": 73887, "epoch": 1759} {"train_loss": -5.927717208862305, "global_step": 73888, "epoch": 1759} {"train_loss": -6.2201948165893555, "global_step": 73889, "epoch": 1759} {"train_loss": -6.140486717224121, "global_step": 73890, "epoch": 1759} {"train_loss": -6.132111549377441, "global_step": 73891, "epoch": 1759} {"train_loss": -6.11380672454834, "global_step": 73892, "epoch": 1759} {"train_loss": -6.029755592346191, "global_step": 73893, "epoch": 1759} {"train_loss": -6.0283989906311035, "global_step": 73894, "epoch": 1759} {"train_loss": -6.101771354675293, "global_step": 73895, "epoch": 1759} {"train_loss": -6.06226921081543, "global_step": 73896, "epoch": 1759} {"train_loss": -5.991946697235107, "global_step": 73897, "epoch": 1759} {"train_loss": -5.977166652679443, "global_step": 73898, "epoch": 1759} {"train_loss": -6.102844715118408, "global_step": 73899, "epoch": 1759} {"train_loss": -6.104804039001465, "global_step": 73900, "epoch": 1759} {"train_loss": -6.001562118530273, "global_step": 73901, "epoch": 1759} {"train_loss": -6.103005409240723, "global_step": 73902, "epoch": 1759} {"train_loss": -6.043095588684082, "global_step": 73903, "epoch": 1759} {"train_loss": -5.964870452880859, "global_step": 73904, "epoch": 1759} {"train_loss": -6.076617240905762, "global_step": 73905, "epoch": 1759} {"train_loss": -5.990197658538818, "global_step": 73906, "epoch": 1759} {"train_loss": -6.080257415771484, "global_step": 73907, "epoch": 1759} {"train_loss": -6.133198261260986, "global_step": 73908, "epoch": 1759} {"train_loss": -5.904300689697266, "global_step": 73909, "epoch": 1759} {"train_loss": -6.043025970458984, "global_step": 73910, "epoch": 1759} {"train_loss": -6.145265579223633, "global_step": 73911, "epoch": 1759} {"train_loss": -6.050751686096191, "global_step": 73912, "epoch": 1759} {"train_loss": -6.0199480056762695, "global_step": 73913, "epoch": 1759} {"train_loss": -6.189167022705078, "global_step": 73914, "epoch": 1759} {"train_loss": -6.083662033081055, "global_step": 73915, "epoch": 1759} {"train_loss": -6.11476469039917, "global_step": 73916, "epoch": 1759} {"train_loss": -6.08205509185791, "global_step": 73917, "epoch": 1759} {"train_loss": -6.122095108032227, "global_step": 73918, "epoch": 1759} {"train_loss": -6.077548163277762, "global_step": 73919, "epoch": 1759, "val_loss": 74752.0} {"train_loss": -6.227284908294678, "global_step": 73920, "epoch": 1760} {"train_loss": -6.146417140960693, "global_step": 73921, "epoch": 1760} {"train_loss": -5.967314720153809, "global_step": 73922, "epoch": 1760} {"train_loss": -5.977014541625977, "global_step": 73923, "epoch": 1760} {"train_loss": -6.113337516784668, "global_step": 73924, "epoch": 1760} {"train_loss": -6.132000923156738, "global_step": 73925, "epoch": 1760} {"train_loss": -5.997797012329102, "global_step": 73926, "epoch": 1760} {"train_loss": -6.071926116943359, "global_step": 73927, "epoch": 1760} {"train_loss": -6.233548641204834, "global_step": 73928, "epoch": 1760} {"train_loss": -6.068410873413086, "global_step": 73929, "epoch": 1760} {"train_loss": -6.087405204772949, "global_step": 73930, "epoch": 1760} {"train_loss": -5.982486724853516, "global_step": 73931, "epoch": 1760} {"train_loss": -6.058526515960693, "global_step": 73932, "epoch": 1760} {"train_loss": -6.205127239227295, "global_step": 73933, "epoch": 1760} {"train_loss": -5.98799991607666, "global_step": 73934, "epoch": 1760} {"train_loss": -6.1583662033081055, "global_step": 73935, "epoch": 1760} {"train_loss": -6.081499099731445, "global_step": 73936, "epoch": 1760} {"train_loss": -5.936575889587402, "global_step": 73937, "epoch": 1760} {"train_loss": -6.111719131469727, "global_step": 73938, "epoch": 1760} {"train_loss": -6.024656295776367, "global_step": 73939, "epoch": 1760} {"train_loss": -5.9683518409729, "global_step": 73940, "epoch": 1760} {"train_loss": -6.022799491882324, "global_step": 73941, "epoch": 1760} {"train_loss": -6.117369651794434, "global_step": 73942, "epoch": 1760} {"train_loss": -6.108858108520508, "global_step": 73943, "epoch": 1760} {"train_loss": -5.98048210144043, "global_step": 73944, "epoch": 1760} {"train_loss": -5.975415229797363, "global_step": 73945, "epoch": 1760} {"train_loss": -6.006500720977783, "global_step": 73946, "epoch": 1760} {"train_loss": -6.074789524078369, "global_step": 73947, "epoch": 1760} {"train_loss": -6.149188041687012, "global_step": 73948, "epoch": 1760} {"train_loss": -6.028720855712891, "global_step": 73949, "epoch": 1760} {"train_loss": -5.964492321014404, "global_step": 73950, "epoch": 1760} {"train_loss": -6.040469169616699, "global_step": 73951, "epoch": 1760} {"train_loss": -5.905351161956787, "global_step": 73952, "epoch": 1760} {"train_loss": -5.854809761047363, "global_step": 73953, "epoch": 1760} {"train_loss": -5.883260726928711, "global_step": 73954, "epoch": 1760} {"train_loss": -5.928094863891602, "global_step": 73955, "epoch": 1760} {"train_loss": -6.0112504959106445, "global_step": 73956, "epoch": 1760} {"train_loss": -5.8924665451049805, "global_step": 73957, "epoch": 1760} {"train_loss": -5.837015628814697, "global_step": 73958, "epoch": 1760} {"train_loss": -5.918888568878174, "global_step": 73959, "epoch": 1760} {"train_loss": -6.162141799926758, "global_step": 73960, "epoch": 1760} {"train_loss": -6.031975939160302, "global_step": 73961, "epoch": 1760, "val_loss": 75050.3203125} {"train_loss": -6.033533096313477, "global_step": 73962, "epoch": 1761} {"train_loss": -5.9414777755737305, "global_step": 73963, "epoch": 1761} {"train_loss": -6.0391435623168945, "global_step": 73964, "epoch": 1761} {"train_loss": -6.004702568054199, "global_step": 73965, "epoch": 1761} {"train_loss": -6.0010223388671875, "global_step": 73966, "epoch": 1761} {"train_loss": -5.965982437133789, "global_step": 73967, "epoch": 1761} {"train_loss": -6.099665641784668, "global_step": 73968, "epoch": 1761} {"train_loss": -5.978371620178223, "global_step": 73969, "epoch": 1761} {"train_loss": -5.894001007080078, "global_step": 73970, "epoch": 1761} {"train_loss": -5.8819780349731445, "global_step": 73971, "epoch": 1761} {"train_loss": -6.010792255401611, "global_step": 73972, "epoch": 1761} {"train_loss": -6.159530162811279, "global_step": 73973, "epoch": 1761} {"train_loss": -6.023038864135742, "global_step": 73974, "epoch": 1761} {"train_loss": -6.138768196105957, "global_step": 73975, "epoch": 1761} {"train_loss": -6.081921577453613, "global_step": 73976, "epoch": 1761} {"train_loss": -6.151843547821045, "global_step": 73977, "epoch": 1761} {"train_loss": -5.958889484405518, "global_step": 73978, "epoch": 1761} {"train_loss": -5.981051445007324, "global_step": 73979, "epoch": 1761} {"train_loss": -6.082035541534424, "global_step": 73980, "epoch": 1761} {"train_loss": -5.993613243103027, "global_step": 73981, "epoch": 1761} {"train_loss": -6.060563087463379, "global_step": 73982, "epoch": 1761} {"train_loss": -5.909546375274658, "global_step": 73983, "epoch": 1761} {"train_loss": -5.959516525268555, "global_step": 73984, "epoch": 1761} {"train_loss": -6.029224395751953, "global_step": 73985, "epoch": 1761} {"train_loss": -5.998108863830566, "global_step": 73986, "epoch": 1761} {"train_loss": -6.071672439575195, "global_step": 73987, "epoch": 1761} {"train_loss": -6.0543293952941895, "global_step": 73988, "epoch": 1761} {"train_loss": -5.983610153198242, "global_step": 73989, "epoch": 1761} {"train_loss": -5.954500198364258, "global_step": 73990, "epoch": 1761} {"train_loss": -6.027087688446045, "global_step": 73991, "epoch": 1761} {"train_loss": -6.028183460235596, "global_step": 73992, "epoch": 1761} {"train_loss": -6.044745445251465, "global_step": 73993, "epoch": 1761} {"train_loss": -6.096554756164551, "global_step": 73994, "epoch": 1761} {"train_loss": -6.005821228027344, "global_step": 73995, "epoch": 1761} {"train_loss": -6.0692853927612305, "global_step": 73996, "epoch": 1761} {"train_loss": -6.154749870300293, "global_step": 73997, "epoch": 1761} {"train_loss": -6.0406599044799805, "global_step": 73998, "epoch": 1761} {"train_loss": -6.212339878082275, "global_step": 73999, "epoch": 1761} {"train_loss": -5.98178243637085, "global_step": 74000, "epoch": 1761} {"train_loss": -6.052890300750732, "global_step": 74001, "epoch": 1761} {"train_loss": -5.957892417907715, "global_step": 74002, "epoch": 1761} {"train_loss": -6.027883541016352, "global_step": 74003, "epoch": 1761, "val_loss": 74872.5234375} {"train_loss": -6.20878267288208, "global_step": 74004, "epoch": 1762} {"train_loss": -6.07595157623291, "global_step": 74005, "epoch": 1762} {"train_loss": -6.0956950187683105, "global_step": 74006, "epoch": 1762} {"train_loss": -6.162446022033691, "global_step": 74007, "epoch": 1762} {"train_loss": -6.140081405639648, "global_step": 74008, "epoch": 1762} {"train_loss": -6.141650199890137, "global_step": 74009, "epoch": 1762} {"train_loss": -6.048092842102051, "global_step": 74010, "epoch": 1762} {"train_loss": -6.1271491050720215, "global_step": 74011, "epoch": 1762} {"train_loss": -6.060910224914551, "global_step": 74012, "epoch": 1762} {"train_loss": -6.096712589263916, "global_step": 74013, "epoch": 1762} {"train_loss": -6.227128982543945, "global_step": 74014, "epoch": 1762} {"train_loss": -6.126848220825195, "global_step": 74015, "epoch": 1762} {"train_loss": -5.943594455718994, "global_step": 74016, "epoch": 1762} {"train_loss": -6.106658935546875, "global_step": 74017, "epoch": 1762} {"train_loss": -6.0926513671875, "global_step": 74018, "epoch": 1762} {"train_loss": -6.10725212097168, "global_step": 74019, "epoch": 1762} {"train_loss": -5.983544826507568, "global_step": 74020, "epoch": 1762} {"train_loss": -6.156444549560547, "global_step": 74021, "epoch": 1762} {"train_loss": -5.998339653015137, "global_step": 74022, "epoch": 1762} {"train_loss": -6.108977317810059, "global_step": 74023, "epoch": 1762} {"train_loss": -6.128525733947754, "global_step": 74024, "epoch": 1762} {"train_loss": -6.157336235046387, "global_step": 74025, "epoch": 1762} {"train_loss": -6.112692356109619, "global_step": 74026, "epoch": 1762} {"train_loss": -6.12024450302124, "global_step": 74027, "epoch": 1762} {"train_loss": -6.097921848297119, "global_step": 74028, "epoch": 1762} {"train_loss": -6.035404205322266, "global_step": 74029, "epoch": 1762} {"train_loss": -6.234675884246826, "global_step": 74030, "epoch": 1762} {"train_loss": -5.946112632751465, "global_step": 74031, "epoch": 1762} {"train_loss": -6.065529823303223, "global_step": 74032, "epoch": 1762} {"train_loss": -6.093061923980713, "global_step": 74033, "epoch": 1762} {"train_loss": -5.977499008178711, "global_step": 74034, "epoch": 1762} {"train_loss": -6.0512285232543945, "global_step": 74035, "epoch": 1762} {"train_loss": -6.02126407623291, "global_step": 74036, "epoch": 1762} {"train_loss": -6.052585601806641, "global_step": 74037, "epoch": 1762} {"train_loss": -6.024138450622559, "global_step": 74038, "epoch": 1762} {"train_loss": -6.155021667480469, "global_step": 74039, "epoch": 1762} {"train_loss": -6.1385626792907715, "global_step": 74040, "epoch": 1762} {"train_loss": -6.015110492706299, "global_step": 74041, "epoch": 1762} {"train_loss": -6.042688846588135, "global_step": 74042, "epoch": 1762} {"train_loss": -6.036444664001465, "global_step": 74043, "epoch": 1762} {"train_loss": -6.1282196044921875, "global_step": 74044, "epoch": 1762} {"train_loss": -6.08990604536874, "global_step": 74045, "epoch": 1762, "val_loss": 74911.890625} {"train_loss": -6.114421844482422, "global_step": 74046, "epoch": 1763} {"train_loss": -6.1843366622924805, "global_step": 74047, "epoch": 1763} {"train_loss": -6.204110145568848, "global_step": 74048, "epoch": 1763} {"train_loss": -6.101316452026367, "global_step": 74049, "epoch": 1763} {"train_loss": -6.14447021484375, "global_step": 74050, "epoch": 1763} {"train_loss": -6.1446638107299805, "global_step": 74051, "epoch": 1763} {"train_loss": -6.090528964996338, "global_step": 74052, "epoch": 1763} {"train_loss": -6.011170387268066, "global_step": 74053, "epoch": 1763} {"train_loss": -6.05191707611084, "global_step": 74054, "epoch": 1763} {"train_loss": -5.978634357452393, "global_step": 74055, "epoch": 1763} {"train_loss": -6.173739910125732, "global_step": 74056, "epoch": 1763} {"train_loss": -6.008334159851074, "global_step": 74057, "epoch": 1763} {"train_loss": -6.012587070465088, "global_step": 74058, "epoch": 1763} {"train_loss": -6.144395351409912, "global_step": 74059, "epoch": 1763} {"train_loss": -6.197492599487305, "global_step": 74060, "epoch": 1763} {"train_loss": -6.035984039306641, "global_step": 74061, "epoch": 1763} {"train_loss": -6.225088596343994, "global_step": 74062, "epoch": 1763} {"train_loss": -6.000009536743164, "global_step": 74063, "epoch": 1763} {"train_loss": -6.067174911499023, "global_step": 74064, "epoch": 1763} {"train_loss": -6.036447525024414, "global_step": 74065, "epoch": 1763} {"train_loss": -6.1569929122924805, "global_step": 74066, "epoch": 1763} {"train_loss": -6.051719665527344, "global_step": 74067, "epoch": 1763} {"train_loss": -6.078151702880859, "global_step": 74068, "epoch": 1763} {"train_loss": -5.997988700866699, "global_step": 74069, "epoch": 1763} {"train_loss": -6.030066013336182, "global_step": 74070, "epoch": 1763} {"train_loss": -6.028286933898926, "global_step": 74071, "epoch": 1763} {"train_loss": -6.042980194091797, "global_step": 74072, "epoch": 1763} {"train_loss": -6.058162689208984, "global_step": 74073, "epoch": 1763} {"train_loss": -6.112292289733887, "global_step": 74074, "epoch": 1763} {"train_loss": -5.92000675201416, "global_step": 74075, "epoch": 1763} {"train_loss": -6.093531131744385, "global_step": 74076, "epoch": 1763} {"train_loss": -5.901276588439941, "global_step": 74077, "epoch": 1763} {"train_loss": -6.003485679626465, "global_step": 74078, "epoch": 1763} {"train_loss": -5.7613205909729, "global_step": 74079, "epoch": 1763} {"train_loss": -5.945869445800781, "global_step": 74080, "epoch": 1763} {"train_loss": -6.024042129516602, "global_step": 74081, "epoch": 1763} {"train_loss": -5.945986747741699, "global_step": 74082, "epoch": 1763} {"train_loss": -5.955319404602051, "global_step": 74083, "epoch": 1763} {"train_loss": -6.000711917877197, "global_step": 74084, "epoch": 1763} {"train_loss": -6.1362152099609375, "global_step": 74085, "epoch": 1763} {"train_loss": -6.0498480796813965, "global_step": 74086, "epoch": 1763} {"train_loss": -6.0546389647892545, "global_step": 74087, "epoch": 1763, "val_loss": 75564.671875} {"train_loss": -5.896372318267822, "global_step": 74088, "epoch": 1764} {"train_loss": -5.825397491455078, "global_step": 74089, "epoch": 1764} {"train_loss": -5.955759048461914, "global_step": 74090, "epoch": 1764} {"train_loss": -5.85442590713501, "global_step": 74091, "epoch": 1764} {"train_loss": -5.841468334197998, "global_step": 74092, "epoch": 1764} {"train_loss": -5.941330909729004, "global_step": 74093, "epoch": 1764} {"train_loss": -5.817164897918701, "global_step": 74094, "epoch": 1764} {"train_loss": -5.93501091003418, "global_step": 74095, "epoch": 1764} {"train_loss": -5.916845798492432, "global_step": 74096, "epoch": 1764} {"train_loss": -6.039059638977051, "global_step": 74097, "epoch": 1764} {"train_loss": -5.8589982986450195, "global_step": 74098, "epoch": 1764} {"train_loss": -5.8813796043396, "global_step": 74099, "epoch": 1764} {"train_loss": -6.003529071807861, "global_step": 74100, "epoch": 1764} {"train_loss": -6.0408735275268555, "global_step": 74101, "epoch": 1764} {"train_loss": -5.946770668029785, "global_step": 74102, "epoch": 1764} {"train_loss": -6.094691753387451, "global_step": 74103, "epoch": 1764} {"train_loss": -5.983771324157715, "global_step": 74104, "epoch": 1764} {"train_loss": -6.082188606262207, "global_step": 74105, "epoch": 1764} {"train_loss": -6.088757514953613, "global_step": 74106, "epoch": 1764} {"train_loss": -5.939597129821777, "global_step": 74107, "epoch": 1764} {"train_loss": -6.11606502532959, "global_step": 74108, "epoch": 1764} {"train_loss": -5.979313850402832, "global_step": 74109, "epoch": 1764} {"train_loss": -6.0565032958984375, "global_step": 74110, "epoch": 1764} {"train_loss": -6.078083038330078, "global_step": 74111, "epoch": 1764} {"train_loss": -6.055847644805908, "global_step": 74112, "epoch": 1764} {"train_loss": -6.068431377410889, "global_step": 74113, "epoch": 1764} {"train_loss": -6.000957489013672, "global_step": 74114, "epoch": 1764} {"train_loss": -6.018327236175537, "global_step": 74115, "epoch": 1764} {"train_loss": -6.013978958129883, "global_step": 74116, "epoch": 1764} {"train_loss": -6.091364860534668, "global_step": 74117, "epoch": 1764} {"train_loss": -6.085679531097412, "global_step": 74118, "epoch": 1764} {"train_loss": -6.178617000579834, "global_step": 74119, "epoch": 1764} {"train_loss": -6.09412956237793, "global_step": 74120, "epoch": 1764} {"train_loss": -6.13877010345459, "global_step": 74121, "epoch": 1764} {"train_loss": -6.085376262664795, "global_step": 74122, "epoch": 1764} {"train_loss": -6.095369338989258, "global_step": 74123, "epoch": 1764} {"train_loss": -6.1389875411987305, "global_step": 74124, "epoch": 1764} {"train_loss": -6.067184925079346, "global_step": 74125, "epoch": 1764} {"train_loss": -6.0080037117004395, "global_step": 74126, "epoch": 1764} {"train_loss": -5.961143970489502, "global_step": 74127, "epoch": 1764} {"train_loss": -6.076854228973389, "global_step": 74128, "epoch": 1764} {"train_loss": -6.009139163153512, "global_step": 74129, "epoch": 1764, "val_loss": 74995.859375} {"train_loss": -5.923558712005615, "global_step": 74130, "epoch": 1765} {"train_loss": -6.172206878662109, "global_step": 74131, "epoch": 1765} {"train_loss": -5.896684169769287, "global_step": 74132, "epoch": 1765} {"train_loss": -5.9527482986450195, "global_step": 74133, "epoch": 1765} {"train_loss": -5.9333930015563965, "global_step": 74134, "epoch": 1765} {"train_loss": -5.945476531982422, "global_step": 74135, "epoch": 1765} {"train_loss": -5.990336894989014, "global_step": 74136, "epoch": 1765} {"train_loss": -5.94716215133667, "global_step": 74137, "epoch": 1765} {"train_loss": -5.8807244300842285, "global_step": 74138, "epoch": 1765} {"train_loss": -6.086207389831543, "global_step": 74139, "epoch": 1765} {"train_loss": -5.85095739364624, "global_step": 74140, "epoch": 1765} {"train_loss": -6.044190883636475, "global_step": 74141, "epoch": 1765} {"train_loss": -5.9407782554626465, "global_step": 74142, "epoch": 1765} {"train_loss": -5.914931297302246, "global_step": 74143, "epoch": 1765} {"train_loss": -6.181394577026367, "global_step": 74144, "epoch": 1765} {"train_loss": -5.974645614624023, "global_step": 74145, "epoch": 1765} {"train_loss": -6.043521404266357, "global_step": 74146, "epoch": 1765} {"train_loss": -5.9880828857421875, "global_step": 74147, "epoch": 1765} {"train_loss": -6.129493713378906, "global_step": 74148, "epoch": 1765} {"train_loss": -6.066495895385742, "global_step": 74149, "epoch": 1765} {"train_loss": -6.0474700927734375, "global_step": 74150, "epoch": 1765} {"train_loss": -6.070631504058838, "global_step": 74151, "epoch": 1765} {"train_loss": -6.084928035736084, "global_step": 74152, "epoch": 1765} {"train_loss": -6.0920867919921875, "global_step": 74153, "epoch": 1765} {"train_loss": -6.0824737548828125, "global_step": 74154, "epoch": 1765} {"train_loss": -6.077057361602783, "global_step": 74155, "epoch": 1765} {"train_loss": -6.049247741699219, "global_step": 74156, "epoch": 1765} {"train_loss": -5.9994096755981445, "global_step": 74157, "epoch": 1765} {"train_loss": -6.036865234375, "global_step": 74158, "epoch": 1765} {"train_loss": -6.060546875, "global_step": 74159, "epoch": 1765} {"train_loss": -6.154844284057617, "global_step": 74160, "epoch": 1765} {"train_loss": -6.145576477050781, "global_step": 74161, "epoch": 1765} {"train_loss": -6.098428726196289, "global_step": 74162, "epoch": 1765} {"train_loss": -6.082278728485107, "global_step": 74163, "epoch": 1765} {"train_loss": -6.0527448654174805, "global_step": 74164, "epoch": 1765} {"train_loss": -6.175866603851318, "global_step": 74165, "epoch": 1765} {"train_loss": -5.973127365112305, "global_step": 74166, "epoch": 1765} {"train_loss": -6.076869010925293, "global_step": 74167, "epoch": 1765} {"train_loss": -6.045525074005127, "global_step": 74168, "epoch": 1765} {"train_loss": -6.052081108093262, "global_step": 74169, "epoch": 1765} {"train_loss": -6.062448501586914, "global_step": 74170, "epoch": 1765} {"train_loss": -6.035570553370884, "global_step": 74171, "epoch": 1765, "val_loss": 74956.328125} {"train_loss": -6.090930461883545, "global_step": 74172, "epoch": 1766} {"train_loss": -6.12513542175293, "global_step": 74173, "epoch": 1766} {"train_loss": -6.106433868408203, "global_step": 74174, "epoch": 1766} {"train_loss": -6.09529972076416, "global_step": 74175, "epoch": 1766} {"train_loss": -6.111355781555176, "global_step": 74176, "epoch": 1766} {"train_loss": -5.936598777770996, "global_step": 74177, "epoch": 1766} {"train_loss": -5.871504783630371, "global_step": 74178, "epoch": 1766} {"train_loss": -6.151054382324219, "global_step": 74179, "epoch": 1766} {"train_loss": -6.138376235961914, "global_step": 74180, "epoch": 1766} {"train_loss": -6.025523662567139, "global_step": 74181, "epoch": 1766} {"train_loss": -6.191920757293701, "global_step": 74182, "epoch": 1766} {"train_loss": -6.1074700355529785, "global_step": 74183, "epoch": 1766} {"train_loss": -6.091289520263672, "global_step": 74184, "epoch": 1766} {"train_loss": -6.07465934753418, "global_step": 74185, "epoch": 1766} {"train_loss": -6.194726943969727, "global_step": 74186, "epoch": 1766} {"train_loss": -6.10911750793457, "global_step": 74187, "epoch": 1766} {"train_loss": -6.071156024932861, "global_step": 74188, "epoch": 1766} {"train_loss": -6.059727668762207, "global_step": 74189, "epoch": 1766} {"train_loss": -5.9637370109558105, "global_step": 74190, "epoch": 1766} {"train_loss": -6.054385185241699, "global_step": 74191, "epoch": 1766} {"train_loss": -6.044550895690918, "global_step": 74192, "epoch": 1766} {"train_loss": -6.080258369445801, "global_step": 74193, "epoch": 1766} {"train_loss": -5.93472957611084, "global_step": 74194, "epoch": 1766} {"train_loss": -6.0910139083862305, "global_step": 74195, "epoch": 1766} {"train_loss": -6.184187412261963, "global_step": 74196, "epoch": 1766} {"train_loss": -6.125257968902588, "global_step": 74197, "epoch": 1766} {"train_loss": -6.116706848144531, "global_step": 74198, "epoch": 1766} {"train_loss": -6.105068206787109, "global_step": 74199, "epoch": 1766} {"train_loss": -5.977686405181885, "global_step": 74200, "epoch": 1766} {"train_loss": -6.149070739746094, "global_step": 74201, "epoch": 1766} {"train_loss": -6.07227087020874, "global_step": 74202, "epoch": 1766} {"train_loss": -6.1674981117248535, "global_step": 74203, "epoch": 1766} {"train_loss": -6.115009307861328, "global_step": 74204, "epoch": 1766} {"train_loss": -6.089913845062256, "global_step": 74205, "epoch": 1766} {"train_loss": -5.9998779296875, "global_step": 74206, "epoch": 1766} {"train_loss": -6.181635856628418, "global_step": 74207, "epoch": 1766} {"train_loss": -6.026372909545898, "global_step": 74208, "epoch": 1766} {"train_loss": -6.1450910568237305, "global_step": 74209, "epoch": 1766} {"train_loss": -6.092581748962402, "global_step": 74210, "epoch": 1766} {"train_loss": -5.871138095855713, "global_step": 74211, "epoch": 1766} {"train_loss": -6.101130962371826, "global_step": 74212, "epoch": 1766} {"train_loss": -6.080947421845936, "global_step": 74213, "epoch": 1766, "val_loss": 74833.5078125} {"train_loss": -6.059966087341309, "global_step": 74214, "epoch": 1767} {"train_loss": -6.028489589691162, "global_step": 74215, "epoch": 1767} {"train_loss": -5.979286193847656, "global_step": 74216, "epoch": 1767} {"train_loss": -5.977035999298096, "global_step": 74217, "epoch": 1767} {"train_loss": -6.054810523986816, "global_step": 74218, "epoch": 1767} {"train_loss": -5.986089706420898, "global_step": 74219, "epoch": 1767} {"train_loss": -6.043540000915527, "global_step": 74220, "epoch": 1767} {"train_loss": -6.098091125488281, "global_step": 74221, "epoch": 1767} {"train_loss": -6.097493648529053, "global_step": 74222, "epoch": 1767} {"train_loss": -6.336878776550293, "global_step": 74223, "epoch": 1767} {"train_loss": -6.154621601104736, "global_step": 74224, "epoch": 1767} {"train_loss": -6.14249849319458, "global_step": 74225, "epoch": 1767} {"train_loss": -6.090914726257324, "global_step": 74226, "epoch": 1767} {"train_loss": -6.117090225219727, "global_step": 74227, "epoch": 1767} {"train_loss": -6.2369585037231445, "global_step": 74228, "epoch": 1767} {"train_loss": -6.136351108551025, "global_step": 74229, "epoch": 1767} {"train_loss": -6.108096122741699, "global_step": 74230, "epoch": 1767} {"train_loss": -6.280823707580566, "global_step": 74231, "epoch": 1767} {"train_loss": -6.064136505126953, "global_step": 74232, "epoch": 1767} {"train_loss": -6.073911666870117, "global_step": 74233, "epoch": 1767} {"train_loss": -5.920996189117432, "global_step": 74234, "epoch": 1767} {"train_loss": -5.881389617919922, "global_step": 74235, "epoch": 1767} {"train_loss": -6.0536298751831055, "global_step": 74236, "epoch": 1767} {"train_loss": -6.1577558517456055, "global_step": 74237, "epoch": 1767} {"train_loss": -5.994189262390137, "global_step": 74238, "epoch": 1767} {"train_loss": -6.04686164855957, "global_step": 74239, "epoch": 1767} {"train_loss": -6.120064735412598, "global_step": 74240, "epoch": 1767} {"train_loss": -6.073456287384033, "global_step": 74241, "epoch": 1767} {"train_loss": -6.120381832122803, "global_step": 74242, "epoch": 1767} {"train_loss": -6.091433525085449, "global_step": 74243, "epoch": 1767} {"train_loss": -6.106247425079346, "global_step": 74244, "epoch": 1767} {"train_loss": -6.15745735168457, "global_step": 74245, "epoch": 1767} {"train_loss": -6.102594375610352, "global_step": 74246, "epoch": 1767} {"train_loss": -6.090064525604248, "global_step": 74247, "epoch": 1767} {"train_loss": -6.144353866577148, "global_step": 74248, "epoch": 1767} {"train_loss": -6.076231956481934, "global_step": 74249, "epoch": 1767} {"train_loss": -6.079380989074707, "global_step": 74250, "epoch": 1767} {"train_loss": -6.011862277984619, "global_step": 74251, "epoch": 1767} {"train_loss": -6.0224761962890625, "global_step": 74252, "epoch": 1767} {"train_loss": -6.102959632873535, "global_step": 74253, "epoch": 1767} {"train_loss": -6.086012840270996, "global_step": 74254, "epoch": 1767} {"train_loss": -6.083389021101452, "global_step": 74255, "epoch": 1767, "val_loss": 75116.859375} {"train_loss": -6.100582122802734, "global_step": 74256, "epoch": 1768} {"train_loss": -6.032049655914307, "global_step": 74257, "epoch": 1768} {"train_loss": -5.992425918579102, "global_step": 74258, "epoch": 1768} {"train_loss": -6.008378028869629, "global_step": 74259, "epoch": 1768} {"train_loss": -6.123653411865234, "global_step": 74260, "epoch": 1768} {"train_loss": -6.049964427947998, "global_step": 74261, "epoch": 1768} {"train_loss": -6.113860607147217, "global_step": 74262, "epoch": 1768} {"train_loss": -5.961135387420654, "global_step": 74263, "epoch": 1768} {"train_loss": -6.005630016326904, "global_step": 74264, "epoch": 1768} {"train_loss": -5.962826251983643, "global_step": 74265, "epoch": 1768} {"train_loss": -6.012646675109863, "global_step": 74266, "epoch": 1768} {"train_loss": -6.110864162445068, "global_step": 74267, "epoch": 1768} {"train_loss": -6.056257247924805, "global_step": 74268, "epoch": 1768} {"train_loss": -6.071527481079102, "global_step": 74269, "epoch": 1768} {"train_loss": -6.088008403778076, "global_step": 74270, "epoch": 1768} {"train_loss": -6.0752973556518555, "global_step": 74271, "epoch": 1768} {"train_loss": -6.000144958496094, "global_step": 74272, "epoch": 1768} {"train_loss": -5.994043350219727, "global_step": 74273, "epoch": 1768} {"train_loss": -6.163479328155518, "global_step": 74274, "epoch": 1768} {"train_loss": -6.110658645629883, "global_step": 74275, "epoch": 1768} {"train_loss": -6.051836013793945, "global_step": 74276, "epoch": 1768} {"train_loss": -6.070965766906738, "global_step": 74277, "epoch": 1768} {"train_loss": -6.2205376625061035, "global_step": 74278, "epoch": 1768} {"train_loss": -6.168959617614746, "global_step": 74279, "epoch": 1768} {"train_loss": -6.152410507202148, "global_step": 74280, "epoch": 1768} {"train_loss": -6.13565731048584, "global_step": 74281, "epoch": 1768} {"train_loss": -6.111906051635742, "global_step": 74282, "epoch": 1768} {"train_loss": -6.108704090118408, "global_step": 74283, "epoch": 1768} {"train_loss": -6.099147319793701, "global_step": 74284, "epoch": 1768} {"train_loss": -5.988008499145508, "global_step": 74285, "epoch": 1768} {"train_loss": -6.233719825744629, "global_step": 74286, "epoch": 1768} {"train_loss": -6.124249458312988, "global_step": 74287, "epoch": 1768} {"train_loss": -6.113900184631348, "global_step": 74288, "epoch": 1768} {"train_loss": -6.130171775817871, "global_step": 74289, "epoch": 1768} {"train_loss": -6.058135509490967, "global_step": 74290, "epoch": 1768} {"train_loss": -6.154756546020508, "global_step": 74291, "epoch": 1768} {"train_loss": -6.077673435211182, "global_step": 74292, "epoch": 1768} {"train_loss": -6.090580940246582, "global_step": 74293, "epoch": 1768} {"train_loss": -6.093498229980469, "global_step": 74294, "epoch": 1768} {"train_loss": -6.042178153991699, "global_step": 74295, "epoch": 1768} {"train_loss": -6.107062339782715, "global_step": 74296, "epoch": 1768} {"train_loss": -6.084208227339245, "global_step": 74297, "epoch": 1768, "val_loss": 74995.609375} {"train_loss": -6.045371055603027, "global_step": 74298, "epoch": 1769} {"train_loss": -6.128589630126953, "global_step": 74299, "epoch": 1769} {"train_loss": -6.036107063293457, "global_step": 74300, "epoch": 1769} {"train_loss": -6.05471134185791, "global_step": 74301, "epoch": 1769} {"train_loss": -6.027617454528809, "global_step": 74302, "epoch": 1769} {"train_loss": -6.046634674072266, "global_step": 74303, "epoch": 1769} {"train_loss": -6.125507354736328, "global_step": 74304, "epoch": 1769} {"train_loss": -6.089554786682129, "global_step": 74305, "epoch": 1769} {"train_loss": -6.022327423095703, "global_step": 74306, "epoch": 1769} {"train_loss": -6.082953453063965, "global_step": 74307, "epoch": 1769} {"train_loss": -6.107149600982666, "global_step": 74308, "epoch": 1769} {"train_loss": -6.206704139709473, "global_step": 74309, "epoch": 1769} {"train_loss": -6.079571723937988, "global_step": 74310, "epoch": 1769} {"train_loss": -6.04811429977417, "global_step": 74311, "epoch": 1769} {"train_loss": -6.064332008361816, "global_step": 74312, "epoch": 1769} {"train_loss": -6.123442649841309, "global_step": 74313, "epoch": 1769} {"train_loss": -6.101375579833984, "global_step": 74314, "epoch": 1769} {"train_loss": -6.186671257019043, "global_step": 74315, "epoch": 1769} {"train_loss": -6.104981422424316, "global_step": 74316, "epoch": 1769} {"train_loss": -6.258672714233398, "global_step": 74317, "epoch": 1769} {"train_loss": -6.099064826965332, "global_step": 74318, "epoch": 1769} {"train_loss": -6.042187690734863, "global_step": 74319, "epoch": 1769} {"train_loss": -6.097235679626465, "global_step": 74320, "epoch": 1769} {"train_loss": -6.163298606872559, "global_step": 74321, "epoch": 1769} {"train_loss": -6.142419815063477, "global_step": 74322, "epoch": 1769} {"train_loss": -6.153063774108887, "global_step": 74323, "epoch": 1769} {"train_loss": -6.08837890625, "global_step": 74324, "epoch": 1769} {"train_loss": -6.126312255859375, "global_step": 74325, "epoch": 1769} {"train_loss": -6.068603515625, "global_step": 74326, "epoch": 1769} {"train_loss": -5.9146504402160645, "global_step": 74327, "epoch": 1769} {"train_loss": -5.9406514167785645, "global_step": 74328, "epoch": 1769} {"train_loss": -6.06167459487915, "global_step": 74329, "epoch": 1769} {"train_loss": -6.099082946777344, "global_step": 74330, "epoch": 1769} {"train_loss": -6.134079456329346, "global_step": 74331, "epoch": 1769} {"train_loss": -5.982689380645752, "global_step": 74332, "epoch": 1769} {"train_loss": -5.959012985229492, "global_step": 74333, "epoch": 1769} {"train_loss": -6.152060508728027, "global_step": 74334, "epoch": 1769} {"train_loss": -5.983504772186279, "global_step": 74335, "epoch": 1769} {"train_loss": -6.138789653778076, "global_step": 74336, "epoch": 1769} {"train_loss": -6.1220879554748535, "global_step": 74337, "epoch": 1769} {"train_loss": -6.0760111808776855, "global_step": 74338, "epoch": 1769} {"train_loss": -6.0885471275874545, "global_step": 74339, "epoch": 1769, "val_loss": 74603.4609375} {"train_loss": -6.078005790710449, "global_step": 74340, "epoch": 1770} {"train_loss": -6.100778579711914, "global_step": 74341, "epoch": 1770} {"train_loss": -6.037578582763672, "global_step": 74342, "epoch": 1770} {"train_loss": -6.138741493225098, "global_step": 74343, "epoch": 1770} {"train_loss": -6.148399353027344, "global_step": 74344, "epoch": 1770} {"train_loss": -5.982800483703613, "global_step": 74345, "epoch": 1770} {"train_loss": -6.072052001953125, "global_step": 74346, "epoch": 1770} {"train_loss": -5.905537128448486, "global_step": 74347, "epoch": 1770} {"train_loss": -6.086710453033447, "global_step": 74348, "epoch": 1770} {"train_loss": -5.980779647827148, "global_step": 74349, "epoch": 1770} {"train_loss": -6.0916571617126465, "global_step": 74350, "epoch": 1770} {"train_loss": -6.043349266052246, "global_step": 74351, "epoch": 1770} {"train_loss": -6.179909706115723, "global_step": 74352, "epoch": 1770} {"train_loss": -6.062412738800049, "global_step": 74353, "epoch": 1770} {"train_loss": -6.113154411315918, "global_step": 74354, "epoch": 1770} {"train_loss": -6.139793395996094, "global_step": 74355, "epoch": 1770} {"train_loss": -6.1011643409729, "global_step": 74356, "epoch": 1770} {"train_loss": -6.091916084289551, "global_step": 74357, "epoch": 1770} {"train_loss": -5.94108772277832, "global_step": 74358, "epoch": 1770} {"train_loss": -6.065255165100098, "global_step": 74359, "epoch": 1770} {"train_loss": -5.985105514526367, "global_step": 74360, "epoch": 1770} {"train_loss": -6.075356483459473, "global_step": 74361, "epoch": 1770} {"train_loss": -6.130279541015625, "global_step": 74362, "epoch": 1770} {"train_loss": -6.020097732543945, "global_step": 74363, "epoch": 1770} {"train_loss": -6.094333648681641, "global_step": 74364, "epoch": 1770} {"train_loss": -5.9936323165893555, "global_step": 74365, "epoch": 1770} {"train_loss": -5.901376724243164, "global_step": 74366, "epoch": 1770} {"train_loss": -6.083932876586914, "global_step": 74367, "epoch": 1770} {"train_loss": -5.797263145446777, "global_step": 74368, "epoch": 1770} {"train_loss": -6.09000301361084, "global_step": 74369, "epoch": 1770} {"train_loss": -5.835936069488525, "global_step": 74370, "epoch": 1770} {"train_loss": -6.040615081787109, "global_step": 74371, "epoch": 1770} {"train_loss": -5.985918998718262, "global_step": 74372, "epoch": 1770} {"train_loss": -6.015607833862305, "global_step": 74373, "epoch": 1770} {"train_loss": -6.022630214691162, "global_step": 74374, "epoch": 1770} {"train_loss": -6.079397201538086, "global_step": 74375, "epoch": 1770} {"train_loss": -6.030857563018799, "global_step": 74376, "epoch": 1770} {"train_loss": -5.964446067810059, "global_step": 74377, "epoch": 1770} {"train_loss": -5.997182846069336, "global_step": 74378, "epoch": 1770} {"train_loss": -6.058142185211182, "global_step": 74379, "epoch": 1770} {"train_loss": -6.103877067565918, "global_step": 74380, "epoch": 1770} {"train_loss": -6.039831581569853, "global_step": 74381, "epoch": 1770, "val_loss": 75079.78125} {"train_loss": -6.020145416259766, "global_step": 74382, "epoch": 1771} {"train_loss": -5.937133312225342, "global_step": 74383, "epoch": 1771} {"train_loss": -6.131422996520996, "global_step": 74384, "epoch": 1771} {"train_loss": -5.9958295822143555, "global_step": 74385, "epoch": 1771} {"train_loss": -5.983064651489258, "global_step": 74386, "epoch": 1771} {"train_loss": -5.992458820343018, "global_step": 74387, "epoch": 1771} {"train_loss": -6.062002182006836, "global_step": 74388, "epoch": 1771} {"train_loss": -5.973766326904297, "global_step": 74389, "epoch": 1771} {"train_loss": -6.084330081939697, "global_step": 74390, "epoch": 1771} {"train_loss": -5.840998649597168, "global_step": 74391, "epoch": 1771} {"train_loss": -5.995302200317383, "global_step": 74392, "epoch": 1771} {"train_loss": -6.119683265686035, "global_step": 74393, "epoch": 1771} {"train_loss": -6.146183967590332, "global_step": 74394, "epoch": 1771} {"train_loss": -6.091997146606445, "global_step": 74395, "epoch": 1771} {"train_loss": -6.1172776222229, "global_step": 74396, "epoch": 1771} {"train_loss": -6.057391166687012, "global_step": 74397, "epoch": 1771} {"train_loss": -6.058727264404297, "global_step": 74398, "epoch": 1771} {"train_loss": -6.014416694641113, "global_step": 74399, "epoch": 1771} {"train_loss": -5.923334121704102, "global_step": 74400, "epoch": 1771} {"train_loss": -5.928430557250977, "global_step": 74401, "epoch": 1771} {"train_loss": -6.187557220458984, "global_step": 74402, "epoch": 1771} {"train_loss": -5.8318634033203125, "global_step": 74403, "epoch": 1771} {"train_loss": -6.094964981079102, "global_step": 74404, "epoch": 1771} {"train_loss": -6.037257194519043, "global_step": 74405, "epoch": 1771} {"train_loss": -5.949039936065674, "global_step": 74406, "epoch": 1771} {"train_loss": -6.158562660217285, "global_step": 74407, "epoch": 1771} {"train_loss": -5.957058906555176, "global_step": 74408, "epoch": 1771} {"train_loss": -6.012679576873779, "global_step": 74409, "epoch": 1771} {"train_loss": -6.034769535064697, "global_step": 74410, "epoch": 1771} {"train_loss": -6.101956367492676, "global_step": 74411, "epoch": 1771} {"train_loss": -6.043828964233398, "global_step": 74412, "epoch": 1771} {"train_loss": -6.088848114013672, "global_step": 74413, "epoch": 1771} {"train_loss": -6.050743103027344, "global_step": 74414, "epoch": 1771} {"train_loss": -6.111480712890625, "global_step": 74415, "epoch": 1771} {"train_loss": -6.107776641845703, "global_step": 74416, "epoch": 1771} {"train_loss": -6.075667381286621, "global_step": 74417, "epoch": 1771} {"train_loss": -6.057138442993164, "global_step": 74418, "epoch": 1771} {"train_loss": -5.983981132507324, "global_step": 74419, "epoch": 1771} {"train_loss": -6.101865768432617, "global_step": 74420, "epoch": 1771} {"train_loss": -6.0210676193237305, "global_step": 74421, "epoch": 1771} {"train_loss": -6.069253921508789, "global_step": 74422, "epoch": 1771} {"train_loss": -6.037116323198591, "global_step": 74423, "epoch": 1771, "val_loss": 74823.8515625} {"train_loss": -6.14150857925415, "global_step": 74424, "epoch": 1772} {"train_loss": -6.0795817375183105, "global_step": 74425, "epoch": 1772} {"train_loss": -6.131911277770996, "global_step": 74426, "epoch": 1772} {"train_loss": -5.994418621063232, "global_step": 74427, "epoch": 1772} {"train_loss": -6.14698600769043, "global_step": 74428, "epoch": 1772} {"train_loss": -6.1012773513793945, "global_step": 74429, "epoch": 1772} {"train_loss": -6.120486259460449, "global_step": 74430, "epoch": 1772} {"train_loss": -6.058659076690674, "global_step": 74431, "epoch": 1772} {"train_loss": -6.054687023162842, "global_step": 74432, "epoch": 1772} {"train_loss": -6.110223770141602, "global_step": 74433, "epoch": 1772} {"train_loss": -5.941594123840332, "global_step": 74434, "epoch": 1772} {"train_loss": -6.012398719787598, "global_step": 74435, "epoch": 1772} {"train_loss": -6.013848304748535, "global_step": 74436, "epoch": 1772} {"train_loss": -6.046444892883301, "global_step": 74437, "epoch": 1772} {"train_loss": -6.261361122131348, "global_step": 74438, "epoch": 1772} {"train_loss": -6.00427770614624, "global_step": 74439, "epoch": 1772} {"train_loss": -6.078891277313232, "global_step": 74440, "epoch": 1772} {"train_loss": -6.042619705200195, "global_step": 74441, "epoch": 1772} {"train_loss": -6.077678680419922, "global_step": 74442, "epoch": 1772} {"train_loss": -6.050479412078857, "global_step": 74443, "epoch": 1772} {"train_loss": -6.033304691314697, "global_step": 74444, "epoch": 1772} {"train_loss": -6.04308557510376, "global_step": 74445, "epoch": 1772} {"train_loss": -6.089869499206543, "global_step": 74446, "epoch": 1772} {"train_loss": -5.967830657958984, "global_step": 74447, "epoch": 1772} {"train_loss": -6.021594047546387, "global_step": 74448, "epoch": 1772} {"train_loss": -6.006110191345215, "global_step": 74449, "epoch": 1772} {"train_loss": -6.105170726776123, "global_step": 74450, "epoch": 1772} {"train_loss": -5.845371723175049, "global_step": 74451, "epoch": 1772} {"train_loss": -6.110884666442871, "global_step": 74452, "epoch": 1772} {"train_loss": -5.917695045471191, "global_step": 74453, "epoch": 1772} {"train_loss": -6.008967399597168, "global_step": 74454, "epoch": 1772} {"train_loss": -5.917154312133789, "global_step": 74455, "epoch": 1772} {"train_loss": -5.920862197875977, "global_step": 74456, "epoch": 1772} {"train_loss": -5.959068298339844, "global_step": 74457, "epoch": 1772} {"train_loss": -5.933557987213135, "global_step": 74458, "epoch": 1772} {"train_loss": -5.959403038024902, "global_step": 74459, "epoch": 1772} {"train_loss": -5.99807071685791, "global_step": 74460, "epoch": 1772} {"train_loss": -6.171041011810303, "global_step": 74461, "epoch": 1772} {"train_loss": -5.841196060180664, "global_step": 74462, "epoch": 1772} {"train_loss": -5.951278209686279, "global_step": 74463, "epoch": 1772} {"train_loss": -6.027538299560547, "global_step": 74464, "epoch": 1772} {"train_loss": -6.03159118833996, "global_step": 74465, "epoch": 1772, "val_loss": 75233.1171875} {"train_loss": -6.006647109985352, "global_step": 74466, "epoch": 1773} {"train_loss": -6.054965972900391, "global_step": 74467, "epoch": 1773} {"train_loss": -5.973535537719727, "global_step": 74468, "epoch": 1773} {"train_loss": -5.977191925048828, "global_step": 74469, "epoch": 1773} {"train_loss": -5.9802069664001465, "global_step": 74470, "epoch": 1773} {"train_loss": -5.894808292388916, "global_step": 74471, "epoch": 1773} {"train_loss": -6.015469551086426, "global_step": 74472, "epoch": 1773} {"train_loss": -6.1324005126953125, "global_step": 74473, "epoch": 1773} {"train_loss": -5.974928855895996, "global_step": 74474, "epoch": 1773} {"train_loss": -6.143364429473877, "global_step": 74475, "epoch": 1773} {"train_loss": -5.884993076324463, "global_step": 74476, "epoch": 1773} {"train_loss": -5.95871639251709, "global_step": 74477, "epoch": 1773} {"train_loss": -6.0126447677612305, "global_step": 74478, "epoch": 1773} {"train_loss": -5.954853057861328, "global_step": 74479, "epoch": 1773} {"train_loss": -6.008852005004883, "global_step": 74480, "epoch": 1773} {"train_loss": -6.040434837341309, "global_step": 74481, "epoch": 1773} {"train_loss": -5.971722602844238, "global_step": 74482, "epoch": 1773} {"train_loss": -6.114734649658203, "global_step": 74483, "epoch": 1773} {"train_loss": -6.012125015258789, "global_step": 74484, "epoch": 1773} {"train_loss": -6.071462631225586, "global_step": 74485, "epoch": 1773} {"train_loss": -6.129334449768066, "global_step": 74486, "epoch": 1773} {"train_loss": -5.993128776550293, "global_step": 74487, "epoch": 1773} {"train_loss": -6.078460216522217, "global_step": 74488, "epoch": 1773} {"train_loss": -6.0354766845703125, "global_step": 74489, "epoch": 1773} {"train_loss": -6.0357232093811035, "global_step": 74490, "epoch": 1773} {"train_loss": -6.149340629577637, "global_step": 74491, "epoch": 1773} {"train_loss": -6.030984401702881, "global_step": 74492, "epoch": 1773} {"train_loss": -6.043517112731934, "global_step": 74493, "epoch": 1773} {"train_loss": -6.0063581466674805, "global_step": 74494, "epoch": 1773} {"train_loss": -6.15070915222168, "global_step": 74495, "epoch": 1773} {"train_loss": -5.963016510009766, "global_step": 74496, "epoch": 1773} {"train_loss": -6.086592674255371, "global_step": 74497, "epoch": 1773} {"train_loss": -6.158013343811035, "global_step": 74498, "epoch": 1773} {"train_loss": -6.131309509277344, "global_step": 74499, "epoch": 1773} {"train_loss": -6.129050254821777, "global_step": 74500, "epoch": 1773} {"train_loss": -6.115540027618408, "global_step": 74501, "epoch": 1773} {"train_loss": -6.146624565124512, "global_step": 74502, "epoch": 1773} {"train_loss": -5.998200416564941, "global_step": 74503, "epoch": 1773} {"train_loss": -6.069075584411621, "global_step": 74504, "epoch": 1773} {"train_loss": -5.987959861755371, "global_step": 74505, "epoch": 1773} {"train_loss": -6.105027198791504, "global_step": 74506, "epoch": 1773} {"train_loss": -6.041277817317417, "global_step": 74507, "epoch": 1773, "val_loss": 74596.8515625} {"train_loss": -6.059220314025879, "global_step": 74508, "epoch": 1774} {"train_loss": -6.087754726409912, "global_step": 74509, "epoch": 1774} {"train_loss": -6.050968647003174, "global_step": 74510, "epoch": 1774} {"train_loss": -6.0224995613098145, "global_step": 74511, "epoch": 1774} {"train_loss": -6.172657489776611, "global_step": 74512, "epoch": 1774} {"train_loss": -6.112638473510742, "global_step": 74513, "epoch": 1774} {"train_loss": -6.131175518035889, "global_step": 74514, "epoch": 1774} {"train_loss": -6.035279273986816, "global_step": 74515, "epoch": 1774} {"train_loss": -6.056962490081787, "global_step": 74516, "epoch": 1774} {"train_loss": -6.02630615234375, "global_step": 74517, "epoch": 1774} {"train_loss": -5.980995178222656, "global_step": 74518, "epoch": 1774} {"train_loss": -6.130786895751953, "global_step": 74519, "epoch": 1774} {"train_loss": -6.117183208465576, "global_step": 74520, "epoch": 1774} {"train_loss": -5.912871360778809, "global_step": 74521, "epoch": 1774} {"train_loss": -6.204706192016602, "global_step": 74522, "epoch": 1774} {"train_loss": -6.07283353805542, "global_step": 74523, "epoch": 1774} {"train_loss": -6.181510925292969, "global_step": 74524, "epoch": 1774} {"train_loss": -6.0762834548950195, "global_step": 74525, "epoch": 1774} {"train_loss": -6.04807186126709, "global_step": 74526, "epoch": 1774} {"train_loss": -6.0878424644470215, "global_step": 74527, "epoch": 1774} {"train_loss": -6.098321914672852, "global_step": 74528, "epoch": 1774} {"train_loss": -5.915543079376221, "global_step": 74529, "epoch": 1774} {"train_loss": -6.219212532043457, "global_step": 74530, "epoch": 1774} {"train_loss": -5.90703010559082, "global_step": 74531, "epoch": 1774} {"train_loss": -5.92905855178833, "global_step": 74532, "epoch": 1774} {"train_loss": -6.1002678871154785, "global_step": 74533, "epoch": 1774} {"train_loss": -5.926778316497803, "global_step": 74534, "epoch": 1774} {"train_loss": -5.974883079528809, "global_step": 74535, "epoch": 1774} {"train_loss": -5.972007751464844, "global_step": 74536, "epoch": 1774} {"train_loss": -5.988074779510498, "global_step": 74537, "epoch": 1774} {"train_loss": -6.129532814025879, "global_step": 74538, "epoch": 1774} {"train_loss": -6.063492774963379, "global_step": 74539, "epoch": 1774} {"train_loss": -6.105090618133545, "global_step": 74540, "epoch": 1774} {"train_loss": -6.008710861206055, "global_step": 74541, "epoch": 1774} {"train_loss": -6.177290439605713, "global_step": 74542, "epoch": 1774} {"train_loss": -6.1291046142578125, "global_step": 74543, "epoch": 1774} {"train_loss": -6.021689414978027, "global_step": 74544, "epoch": 1774} {"train_loss": -5.9580559730529785, "global_step": 74545, "epoch": 1774} {"train_loss": -6.10414457321167, "global_step": 74546, "epoch": 1774} {"train_loss": -6.11241340637207, "global_step": 74547, "epoch": 1774} {"train_loss": -6.07588529586792, "global_step": 74548, "epoch": 1774} {"train_loss": -6.0572784174056284, "global_step": 74549, "epoch": 1774, "val_loss": 74840.234375} {"train_loss": -6.188140869140625, "global_step": 74550, "epoch": 1775} {"train_loss": -6.106406211853027, "global_step": 74551, "epoch": 1775} {"train_loss": -6.070396423339844, "global_step": 74552, "epoch": 1775} {"train_loss": -6.070713996887207, "global_step": 74553, "epoch": 1775} {"train_loss": -6.125825881958008, "global_step": 74554, "epoch": 1775} {"train_loss": -6.222751140594482, "global_step": 74555, "epoch": 1775} {"train_loss": -6.101943016052246, "global_step": 74556, "epoch": 1775} {"train_loss": -6.000617027282715, "global_step": 74557, "epoch": 1775} {"train_loss": -6.030745506286621, "global_step": 74558, "epoch": 1775} {"train_loss": -5.9919891357421875, "global_step": 74559, "epoch": 1775} {"train_loss": -5.845264434814453, "global_step": 74560, "epoch": 1775} {"train_loss": -5.996375560760498, "global_step": 74561, "epoch": 1775} {"train_loss": -6.066173553466797, "global_step": 74562, "epoch": 1775} {"train_loss": -5.967947959899902, "global_step": 74563, "epoch": 1775} {"train_loss": -6.094854354858398, "global_step": 74564, "epoch": 1775} {"train_loss": -5.9577836990356445, "global_step": 74565, "epoch": 1775} {"train_loss": -6.156055450439453, "global_step": 74566, "epoch": 1775} {"train_loss": -6.0152482986450195, "global_step": 74567, "epoch": 1775} {"train_loss": -6.185873985290527, "global_step": 74568, "epoch": 1775} {"train_loss": -6.183648586273193, "global_step": 74569, "epoch": 1775} {"train_loss": -5.888340950012207, "global_step": 74570, "epoch": 1775} {"train_loss": -6.076321601867676, "global_step": 74571, "epoch": 1775} {"train_loss": -5.952674388885498, "global_step": 74572, "epoch": 1775} {"train_loss": -5.815929889678955, "global_step": 74573, "epoch": 1775} {"train_loss": -6.024371147155762, "global_step": 74574, "epoch": 1775} {"train_loss": -6.009544849395752, "global_step": 74575, "epoch": 1775} {"train_loss": -6.076663970947266, "global_step": 74576, "epoch": 1775} {"train_loss": -6.045404434204102, "global_step": 74577, "epoch": 1775} {"train_loss": -6.081154823303223, "global_step": 74578, "epoch": 1775} {"train_loss": -6.056657791137695, "global_step": 74579, "epoch": 1775} {"train_loss": -5.843240261077881, "global_step": 74580, "epoch": 1775} {"train_loss": -6.133256912231445, "global_step": 74581, "epoch": 1775} {"train_loss": -6.074995040893555, "global_step": 74582, "epoch": 1775} {"train_loss": -6.0598859786987305, "global_step": 74583, "epoch": 1775} {"train_loss": -5.940033912658691, "global_step": 74584, "epoch": 1775} {"train_loss": -5.9664387702941895, "global_step": 74585, "epoch": 1775} {"train_loss": -5.974705696105957, "global_step": 74586, "epoch": 1775} {"train_loss": -6.112797737121582, "global_step": 74587, "epoch": 1775} {"train_loss": -5.9908366203308105, "global_step": 74588, "epoch": 1775} {"train_loss": -6.088531494140625, "global_step": 74589, "epoch": 1775} {"train_loss": -6.020547866821289, "global_step": 74590, "epoch": 1775} {"train_loss": -6.04334214755467, "global_step": 74591, "epoch": 1775, "val_loss": 75147.9921875} {"train_loss": -6.149603366851807, "global_step": 74592, "epoch": 1776} {"train_loss": -6.096744537353516, "global_step": 74593, "epoch": 1776} {"train_loss": -6.059065818786621, "global_step": 74594, "epoch": 1776} {"train_loss": -6.133360862731934, "global_step": 74595, "epoch": 1776} {"train_loss": -6.0348286628723145, "global_step": 74596, "epoch": 1776} {"train_loss": -5.98610782623291, "global_step": 74597, "epoch": 1776} {"train_loss": -6.007609844207764, "global_step": 74598, "epoch": 1776} {"train_loss": -6.185341835021973, "global_step": 74599, "epoch": 1776} {"train_loss": -6.012521266937256, "global_step": 74600, "epoch": 1776} {"train_loss": -5.958366394042969, "global_step": 74601, "epoch": 1776} {"train_loss": -6.035699367523193, "global_step": 74602, "epoch": 1776} {"train_loss": -6.079930782318115, "global_step": 74603, "epoch": 1776} {"train_loss": -6.02886962890625, "global_step": 74604, "epoch": 1776} {"train_loss": -6.05380392074585, "global_step": 74605, "epoch": 1776} {"train_loss": -5.987514495849609, "global_step": 74606, "epoch": 1776} {"train_loss": -6.046940803527832, "global_step": 74607, "epoch": 1776} {"train_loss": -5.89133358001709, "global_step": 74608, "epoch": 1776} {"train_loss": -6.099093914031982, "global_step": 74609, "epoch": 1776} {"train_loss": -6.0340166091918945, "global_step": 74610, "epoch": 1776} {"train_loss": -6.04905366897583, "global_step": 74611, "epoch": 1776} {"train_loss": -6.032351493835449, "global_step": 74612, "epoch": 1776} {"train_loss": -6.0286712646484375, "global_step": 74613, "epoch": 1776} {"train_loss": -6.044314384460449, "global_step": 74614, "epoch": 1776} {"train_loss": -6.247343063354492, "global_step": 74615, "epoch": 1776} {"train_loss": -6.0031208992004395, "global_step": 74616, "epoch": 1776} {"train_loss": -6.153772354125977, "global_step": 74617, "epoch": 1776} {"train_loss": -5.934537887573242, "global_step": 74618, "epoch": 1776} {"train_loss": -6.046548366546631, "global_step": 74619, "epoch": 1776} {"train_loss": -6.157391548156738, "global_step": 74620, "epoch": 1776} {"train_loss": -6.077103137969971, "global_step": 74621, "epoch": 1776} {"train_loss": -6.06825065612793, "global_step": 74622, "epoch": 1776} {"train_loss": -6.098095893859863, "global_step": 74623, "epoch": 1776} {"train_loss": -6.072381973266602, "global_step": 74624, "epoch": 1776} {"train_loss": -6.021929740905762, "global_step": 74625, "epoch": 1776} {"train_loss": -6.059387683868408, "global_step": 74626, "epoch": 1776} {"train_loss": -6.110306739807129, "global_step": 74627, "epoch": 1776} {"train_loss": -6.107923984527588, "global_step": 74628, "epoch": 1776} {"train_loss": -6.209110736846924, "global_step": 74629, "epoch": 1776} {"train_loss": -6.084624290466309, "global_step": 74630, "epoch": 1776} {"train_loss": -6.1208295822143555, "global_step": 74631, "epoch": 1776} {"train_loss": -6.1375274658203125, "global_step": 74632, "epoch": 1776} {"train_loss": -6.064791225251698, "global_step": 74633, "epoch": 1776, "val_loss": 74804.5390625} {"train_loss": -6.068291187286377, "global_step": 74634, "epoch": 1777} {"train_loss": -6.146381378173828, "global_step": 74635, "epoch": 1777} {"train_loss": -6.034554481506348, "global_step": 74636, "epoch": 1777} {"train_loss": -6.108119964599609, "global_step": 74637, "epoch": 1777} {"train_loss": -6.053756237030029, "global_step": 74638, "epoch": 1777} {"train_loss": -6.051041603088379, "global_step": 74639, "epoch": 1777} {"train_loss": -6.216427803039551, "global_step": 74640, "epoch": 1777} {"train_loss": -6.097145080566406, "global_step": 74641, "epoch": 1777} {"train_loss": -6.09737491607666, "global_step": 74642, "epoch": 1777} {"train_loss": -6.155784606933594, "global_step": 74643, "epoch": 1777} {"train_loss": -5.974586486816406, "global_step": 74644, "epoch": 1777} {"train_loss": -5.922207355499268, "global_step": 74645, "epoch": 1777} {"train_loss": -5.913845062255859, "global_step": 74646, "epoch": 1777} {"train_loss": -5.953061103820801, "global_step": 74647, "epoch": 1777} {"train_loss": -6.0057477951049805, "global_step": 74648, "epoch": 1777} {"train_loss": -5.992158889770508, "global_step": 74649, "epoch": 1777} {"train_loss": -6.032983779907227, "global_step": 74650, "epoch": 1777} {"train_loss": -5.903443336486816, "global_step": 74651, "epoch": 1777} {"train_loss": -6.010533809661865, "global_step": 74652, "epoch": 1777} {"train_loss": -6.011710166931152, "global_step": 74653, "epoch": 1777} {"train_loss": -6.023794651031494, "global_step": 74654, "epoch": 1777} {"train_loss": -6.004683494567871, "global_step": 74655, "epoch": 1777} {"train_loss": -6.102669715881348, "global_step": 74656, "epoch": 1777} {"train_loss": -6.016376495361328, "global_step": 74657, "epoch": 1777} {"train_loss": -5.953645706176758, "global_step": 74658, "epoch": 1777} {"train_loss": -5.9739861488342285, "global_step": 74659, "epoch": 1777} {"train_loss": -6.047858238220215, "global_step": 74660, "epoch": 1777} {"train_loss": -5.87437105178833, "global_step": 74661, "epoch": 1777} {"train_loss": -5.970416069030762, "global_step": 74662, "epoch": 1777} {"train_loss": -5.961682319641113, "global_step": 74663, "epoch": 1777} {"train_loss": -6.008505821228027, "global_step": 74664, "epoch": 1777} {"train_loss": -6.025239944458008, "global_step": 74665, "epoch": 1777} {"train_loss": -6.0256500244140625, "global_step": 74666, "epoch": 1777} {"train_loss": -5.988114356994629, "global_step": 74667, "epoch": 1777} {"train_loss": -6.0767436027526855, "global_step": 74668, "epoch": 1777} {"train_loss": -5.884929180145264, "global_step": 74669, "epoch": 1777} {"train_loss": -6.035865783691406, "global_step": 74670, "epoch": 1777} {"train_loss": -5.887242317199707, "global_step": 74671, "epoch": 1777} {"train_loss": -5.895541191101074, "global_step": 74672, "epoch": 1777} {"train_loss": -6.055435657501221, "global_step": 74673, "epoch": 1777} {"train_loss": -6.133634567260742, "global_step": 74674, "epoch": 1777} {"train_loss": -6.018324681690761, "global_step": 74675, "epoch": 1777, "val_loss": 74705.0859375} {"train_loss": -6.010038375854492, "global_step": 74676, "epoch": 1778} {"train_loss": -6.074483871459961, "global_step": 74677, "epoch": 1778} {"train_loss": -6.009640693664551, "global_step": 74678, "epoch": 1778} {"train_loss": -6.030634880065918, "global_step": 74679, "epoch": 1778} {"train_loss": -6.054497718811035, "global_step": 74680, "epoch": 1778} {"train_loss": -6.098718166351318, "global_step": 74681, "epoch": 1778} {"train_loss": -6.2469329833984375, "global_step": 74682, "epoch": 1778} {"train_loss": -5.979147911071777, "global_step": 74683, "epoch": 1778} {"train_loss": -6.091245651245117, "global_step": 74684, "epoch": 1778} {"train_loss": -6.1846771240234375, "global_step": 74685, "epoch": 1778} {"train_loss": -5.886778354644775, "global_step": 74686, "epoch": 1778} {"train_loss": -6.070530891418457, "global_step": 74687, "epoch": 1778} {"train_loss": -6.101743698120117, "global_step": 74688, "epoch": 1778} {"train_loss": -6.045958518981934, "global_step": 74689, "epoch": 1778} {"train_loss": -6.240715026855469, "global_step": 74690, "epoch": 1778} {"train_loss": -6.145620822906494, "global_step": 74691, "epoch": 1778} {"train_loss": -6.105189323425293, "global_step": 74692, "epoch": 1778} {"train_loss": -6.070623397827148, "global_step": 74693, "epoch": 1778} {"train_loss": -6.118645668029785, "global_step": 74694, "epoch": 1778} {"train_loss": -6.010325908660889, "global_step": 74695, "epoch": 1778} {"train_loss": -6.151932716369629, "global_step": 74696, "epoch": 1778} {"train_loss": -6.163856506347656, "global_step": 74697, "epoch": 1778} {"train_loss": -6.198962688446045, "global_step": 74698, "epoch": 1778} {"train_loss": -6.014544486999512, "global_step": 74699, "epoch": 1778} {"train_loss": -6.098110675811768, "global_step": 74700, "epoch": 1778} {"train_loss": -5.986833572387695, "global_step": 74701, "epoch": 1778} {"train_loss": -5.957130432128906, "global_step": 74702, "epoch": 1778} {"train_loss": -6.133963108062744, "global_step": 74703, "epoch": 1778} {"train_loss": -6.105709552764893, "global_step": 74704, "epoch": 1778} {"train_loss": -6.1203460693359375, "global_step": 74705, "epoch": 1778} {"train_loss": -6.018294334411621, "global_step": 74706, "epoch": 1778} {"train_loss": -6.109526634216309, "global_step": 74707, "epoch": 1778} {"train_loss": -6.169902801513672, "global_step": 74708, "epoch": 1778} {"train_loss": -6.11685037612915, "global_step": 74709, "epoch": 1778} {"train_loss": -6.0221099853515625, "global_step": 74710, "epoch": 1778} {"train_loss": -5.9730048179626465, "global_step": 74711, "epoch": 1778} {"train_loss": -6.163738250732422, "global_step": 74712, "epoch": 1778} {"train_loss": -6.128007411956787, "global_step": 74713, "epoch": 1778} {"train_loss": -6.058769226074219, "global_step": 74714, "epoch": 1778} {"train_loss": -6.133674621582031, "global_step": 74715, "epoch": 1778} {"train_loss": -6.191822052001953, "global_step": 74716, "epoch": 1778} {"train_loss": -6.0862952300480435, "global_step": 74717, "epoch": 1778, "val_loss": 74904.328125} {"train_loss": -6.123403549194336, "global_step": 74718, "epoch": 1779} {"train_loss": -6.175046443939209, "global_step": 74719, "epoch": 1779} {"train_loss": -6.08128547668457, "global_step": 74720, "epoch": 1779} {"train_loss": -6.046157360076904, "global_step": 74721, "epoch": 1779} {"train_loss": -6.0298357009887695, "global_step": 74722, "epoch": 1779} {"train_loss": -6.0406174659729, "global_step": 74723, "epoch": 1779} {"train_loss": -6.101004123687744, "global_step": 74724, "epoch": 1779} {"train_loss": -5.9862213134765625, "global_step": 74725, "epoch": 1779} {"train_loss": -5.980141639709473, "global_step": 74726, "epoch": 1779} {"train_loss": -5.997015953063965, "global_step": 74727, "epoch": 1779} {"train_loss": -6.035299777984619, "global_step": 74728, "epoch": 1779} {"train_loss": -6.127220153808594, "global_step": 74729, "epoch": 1779} {"train_loss": -6.029302597045898, "global_step": 74730, "epoch": 1779} {"train_loss": -6.126802444458008, "global_step": 74731, "epoch": 1779} {"train_loss": -6.051383972167969, "global_step": 74732, "epoch": 1779} {"train_loss": -5.974505424499512, "global_step": 74733, "epoch": 1779} {"train_loss": -6.088212966918945, "global_step": 74734, "epoch": 1779} {"train_loss": -6.164996147155762, "global_step": 74735, "epoch": 1779} {"train_loss": -5.957448959350586, "global_step": 74736, "epoch": 1779} {"train_loss": -6.101806640625, "global_step": 74737, "epoch": 1779} {"train_loss": -6.145455360412598, "global_step": 74738, "epoch": 1779} {"train_loss": -6.0124969482421875, "global_step": 74739, "epoch": 1779} {"train_loss": -6.233181476593018, "global_step": 74740, "epoch": 1779} {"train_loss": -5.928844451904297, "global_step": 74741, "epoch": 1779} {"train_loss": -6.02593469619751, "global_step": 74742, "epoch": 1779} {"train_loss": -5.942891597747803, "global_step": 74743, "epoch": 1779} {"train_loss": -6.078495025634766, "global_step": 74744, "epoch": 1779} {"train_loss": -5.961799621582031, "global_step": 74745, "epoch": 1779} {"train_loss": -6.091382026672363, "global_step": 74746, "epoch": 1779} {"train_loss": -5.900440692901611, "global_step": 74747, "epoch": 1779} {"train_loss": -6.108592510223389, "global_step": 74748, "epoch": 1779} {"train_loss": -5.957248687744141, "global_step": 74749, "epoch": 1779} {"train_loss": -5.959444046020508, "global_step": 74750, "epoch": 1779} {"train_loss": -6.007350921630859, "global_step": 74751, "epoch": 1779} {"train_loss": -5.923800468444824, "global_step": 74752, "epoch": 1779} {"train_loss": -6.007515907287598, "global_step": 74753, "epoch": 1779} {"train_loss": -5.9731125831604, "global_step": 74754, "epoch": 1779} {"train_loss": -5.944234848022461, "global_step": 74755, "epoch": 1779} {"train_loss": -6.0428361892700195, "global_step": 74756, "epoch": 1779} {"train_loss": -6.06461763381958, "global_step": 74757, "epoch": 1779} {"train_loss": -6.157546520233154, "global_step": 74758, "epoch": 1779} {"train_loss": -6.043148086184547, "global_step": 74759, "epoch": 1779, "val_loss": 74925.953125} {"train_loss": -6.091762542724609, "global_step": 74760, "epoch": 1780} {"train_loss": -6.04693078994751, "global_step": 74761, "epoch": 1780} {"train_loss": -6.061328887939453, "global_step": 74762, "epoch": 1780} {"train_loss": -6.096540927886963, "global_step": 74763, "epoch": 1780} {"train_loss": -6.05402135848999, "global_step": 74764, "epoch": 1780} {"train_loss": -6.100814342498779, "global_step": 74765, "epoch": 1780} {"train_loss": -6.03946590423584, "global_step": 74766, "epoch": 1780} {"train_loss": -6.09246826171875, "global_step": 74767, "epoch": 1780} {"train_loss": -6.057309150695801, "global_step": 74768, "epoch": 1780} {"train_loss": -6.044417381286621, "global_step": 74769, "epoch": 1780} {"train_loss": -6.048046112060547, "global_step": 74770, "epoch": 1780} {"train_loss": -6.050961494445801, "global_step": 74771, "epoch": 1780} {"train_loss": -6.118672847747803, "global_step": 74772, "epoch": 1780} {"train_loss": -5.97188663482666, "global_step": 74773, "epoch": 1780} {"train_loss": -6.125378131866455, "global_step": 74774, "epoch": 1780} {"train_loss": -6.134769439697266, "global_step": 74775, "epoch": 1780} {"train_loss": -6.09555196762085, "global_step": 74776, "epoch": 1780} {"train_loss": -6.117061614990234, "global_step": 74777, "epoch": 1780} {"train_loss": -6.100107192993164, "global_step": 74778, "epoch": 1780} {"train_loss": -6.20082426071167, "global_step": 74779, "epoch": 1780} {"train_loss": -5.981109619140625, "global_step": 74780, "epoch": 1780} {"train_loss": -6.0657057762146, "global_step": 74781, "epoch": 1780} {"train_loss": -6.126320838928223, "global_step": 74782, "epoch": 1780} {"train_loss": -5.988136291503906, "global_step": 74783, "epoch": 1780} {"train_loss": -6.182013034820557, "global_step": 74784, "epoch": 1780} {"train_loss": -6.18227481842041, "global_step": 74785, "epoch": 1780} {"train_loss": -6.08579683303833, "global_step": 74786, "epoch": 1780} {"train_loss": -6.116553783416748, "global_step": 74787, "epoch": 1780} {"train_loss": -6.066479682922363, "global_step": 74788, "epoch": 1780} {"train_loss": -6.083354949951172, "global_step": 74789, "epoch": 1780} {"train_loss": -6.093153953552246, "global_step": 74790, "epoch": 1780} {"train_loss": -6.113476276397705, "global_step": 74791, "epoch": 1780} {"train_loss": -6.1275835037231445, "global_step": 74792, "epoch": 1780} {"train_loss": -6.191470623016357, "global_step": 74793, "epoch": 1780} {"train_loss": -6.020402908325195, "global_step": 74794, "epoch": 1780} {"train_loss": -6.156432628631592, "global_step": 74795, "epoch": 1780} {"train_loss": -6.1441802978515625, "global_step": 74796, "epoch": 1780} {"train_loss": -5.9924774169921875, "global_step": 74797, "epoch": 1780} {"train_loss": -6.068765640258789, "global_step": 74798, "epoch": 1780} {"train_loss": -5.987344741821289, "global_step": 74799, "epoch": 1780} {"train_loss": -5.999567031860352, "global_step": 74800, "epoch": 1780} {"train_loss": -6.082726013092768, "global_step": 74801, "epoch": 1780, "val_loss": 74871.6953125} {"train_loss": -6.10909366607666, "global_step": 74802, "epoch": 1781} {"train_loss": -6.112514495849609, "global_step": 74803, "epoch": 1781} {"train_loss": -6.1347126960754395, "global_step": 74804, "epoch": 1781} {"train_loss": -6.068409442901611, "global_step": 74805, "epoch": 1781} {"train_loss": -6.039496898651123, "global_step": 74806, "epoch": 1781} {"train_loss": -6.203132629394531, "global_step": 74807, "epoch": 1781} {"train_loss": -6.149510383605957, "global_step": 74808, "epoch": 1781} {"train_loss": -6.073394298553467, "global_step": 74809, "epoch": 1781} {"train_loss": -6.030147552490234, "global_step": 74810, "epoch": 1781} {"train_loss": -6.095066070556641, "global_step": 74811, "epoch": 1781} {"train_loss": -6.04445743560791, "global_step": 74812, "epoch": 1781} {"train_loss": -6.08241081237793, "global_step": 74813, "epoch": 1781} {"train_loss": -6.037854194641113, "global_step": 74814, "epoch": 1781} {"train_loss": -6.177154541015625, "global_step": 74815, "epoch": 1781} {"train_loss": -6.097061634063721, "global_step": 74816, "epoch": 1781} {"train_loss": -6.108870983123779, "global_step": 74817, "epoch": 1781} {"train_loss": -6.116365432739258, "global_step": 74818, "epoch": 1781} {"train_loss": -6.0426130294799805, "global_step": 74819, "epoch": 1781} {"train_loss": -6.103554725646973, "global_step": 74820, "epoch": 1781} {"train_loss": -6.140154838562012, "global_step": 74821, "epoch": 1781} {"train_loss": -6.038866996765137, "global_step": 74822, "epoch": 1781} {"train_loss": -6.004703521728516, "global_step": 74823, "epoch": 1781} {"train_loss": -5.973641872406006, "global_step": 74824, "epoch": 1781} {"train_loss": -5.9988908767700195, "global_step": 74825, "epoch": 1781} {"train_loss": -6.205559253692627, "global_step": 74826, "epoch": 1781} {"train_loss": -6.126145362854004, "global_step": 74827, "epoch": 1781} {"train_loss": -6.058221817016602, "global_step": 74828, "epoch": 1781} {"train_loss": -6.147976398468018, "global_step": 74829, "epoch": 1781} {"train_loss": -6.138740539550781, "global_step": 74830, "epoch": 1781} {"train_loss": -6.067900657653809, "global_step": 74831, "epoch": 1781} {"train_loss": -6.003960609436035, "global_step": 74832, "epoch": 1781} {"train_loss": -6.046953201293945, "global_step": 74833, "epoch": 1781} {"train_loss": -6.099836826324463, "global_step": 74834, "epoch": 1781} {"train_loss": -6.125138282775879, "global_step": 74835, "epoch": 1781} {"train_loss": -6.1306471824646, "global_step": 74836, "epoch": 1781} {"train_loss": -5.998226165771484, "global_step": 74837, "epoch": 1781} {"train_loss": -6.047218322753906, "global_step": 74838, "epoch": 1781} {"train_loss": -5.938099384307861, "global_step": 74839, "epoch": 1781} {"train_loss": -6.186781883239746, "global_step": 74840, "epoch": 1781} {"train_loss": -6.102240562438965, "global_step": 74841, "epoch": 1781} {"train_loss": -6.175102233886719, "global_step": 74842, "epoch": 1781} {"train_loss": -6.083457220168341, "global_step": 74843, "epoch": 1781, "val_loss": 74918.9921875} {"train_loss": -6.0207200050354, "global_step": 74844, "epoch": 1782} {"train_loss": -6.121874809265137, "global_step": 74845, "epoch": 1782} {"train_loss": -6.0295305252075195, "global_step": 74846, "epoch": 1782} {"train_loss": -6.176366806030273, "global_step": 74847, "epoch": 1782} {"train_loss": -6.09674072265625, "global_step": 74848, "epoch": 1782} {"train_loss": -5.980070114135742, "global_step": 74849, "epoch": 1782} {"train_loss": -6.1616973876953125, "global_step": 74850, "epoch": 1782} {"train_loss": -6.2204694747924805, "global_step": 74851, "epoch": 1782} {"train_loss": -6.031177043914795, "global_step": 74852, "epoch": 1782} {"train_loss": -6.162403106689453, "global_step": 74853, "epoch": 1782} {"train_loss": -6.062353610992432, "global_step": 74854, "epoch": 1782} {"train_loss": -6.140408992767334, "global_step": 74855, "epoch": 1782} {"train_loss": -6.093520164489746, "global_step": 74856, "epoch": 1782} {"train_loss": -6.148170471191406, "global_step": 74857, "epoch": 1782} {"train_loss": -6.072049140930176, "global_step": 74858, "epoch": 1782} {"train_loss": -6.098919868469238, "global_step": 74859, "epoch": 1782} {"train_loss": -6.171818733215332, "global_step": 74860, "epoch": 1782} {"train_loss": -6.044350624084473, "global_step": 74861, "epoch": 1782} {"train_loss": -6.0999298095703125, "global_step": 74862, "epoch": 1782} {"train_loss": -6.063033103942871, "global_step": 74863, "epoch": 1782} {"train_loss": -6.0366950035095215, "global_step": 74864, "epoch": 1782} {"train_loss": -6.019621849060059, "global_step": 74865, "epoch": 1782} {"train_loss": -6.00861120223999, "global_step": 74866, "epoch": 1782} {"train_loss": -5.973498344421387, "global_step": 74867, "epoch": 1782} {"train_loss": -6.077444076538086, "global_step": 74868, "epoch": 1782} {"train_loss": -6.12800931930542, "global_step": 74869, "epoch": 1782} {"train_loss": -6.043573379516602, "global_step": 74870, "epoch": 1782} {"train_loss": -6.127718925476074, "global_step": 74871, "epoch": 1782} {"train_loss": -6.120627403259277, "global_step": 74872, "epoch": 1782} {"train_loss": -6.115147590637207, "global_step": 74873, "epoch": 1782} {"train_loss": -6.024889945983887, "global_step": 74874, "epoch": 1782} {"train_loss": -6.113077163696289, "global_step": 74875, "epoch": 1782} {"train_loss": -6.136172771453857, "global_step": 74876, "epoch": 1782} {"train_loss": -6.153839111328125, "global_step": 74877, "epoch": 1782} {"train_loss": -6.031128883361816, "global_step": 74878, "epoch": 1782} {"train_loss": -6.058699131011963, "global_step": 74879, "epoch": 1782} {"train_loss": -6.0952911376953125, "global_step": 74880, "epoch": 1782} {"train_loss": -6.011194229125977, "global_step": 74881, "epoch": 1782} {"train_loss": -6.002668380737305, "global_step": 74882, "epoch": 1782} {"train_loss": -6.051532745361328, "global_step": 74883, "epoch": 1782} {"train_loss": -6.19212532043457, "global_step": 74884, "epoch": 1782} {"train_loss": -6.08547728402274, "global_step": 74885, "epoch": 1782, "val_loss": 74575.8515625} {"train_loss": -6.06495475769043, "global_step": 74886, "epoch": 1783} {"train_loss": -6.07056999206543, "global_step": 74887, "epoch": 1783} {"train_loss": -6.035306453704834, "global_step": 74888, "epoch": 1783} {"train_loss": -6.049873352050781, "global_step": 74889, "epoch": 1783} {"train_loss": -5.956411838531494, "global_step": 74890, "epoch": 1783} {"train_loss": -6.188380241394043, "global_step": 74891, "epoch": 1783} {"train_loss": -5.889049530029297, "global_step": 74892, "epoch": 1783} {"train_loss": -6.055506229400635, "global_step": 74893, "epoch": 1783} {"train_loss": -5.9257307052612305, "global_step": 74894, "epoch": 1783} {"train_loss": -6.100663185119629, "global_step": 74895, "epoch": 1783} {"train_loss": -6.00169563293457, "global_step": 74896, "epoch": 1783} {"train_loss": -6.152723789215088, "global_step": 74897, "epoch": 1783} {"train_loss": -6.021324157714844, "global_step": 74898, "epoch": 1783} {"train_loss": -6.0472941398620605, "global_step": 74899, "epoch": 1783} {"train_loss": -6.106975555419922, "global_step": 74900, "epoch": 1783} {"train_loss": -6.058111190795898, "global_step": 74901, "epoch": 1783} {"train_loss": -6.1035566329956055, "global_step": 74902, "epoch": 1783} {"train_loss": -6.089344501495361, "global_step": 74903, "epoch": 1783} {"train_loss": -6.0799689292907715, "global_step": 74904, "epoch": 1783} {"train_loss": -6.071294784545898, "global_step": 74905, "epoch": 1783} {"train_loss": -6.115176200866699, "global_step": 74906, "epoch": 1783} {"train_loss": -6.086208820343018, "global_step": 74907, "epoch": 1783} {"train_loss": -6.016168594360352, "global_step": 74908, "epoch": 1783} {"train_loss": -6.167693138122559, "global_step": 74909, "epoch": 1783} {"train_loss": -6.111371040344238, "global_step": 74910, "epoch": 1783} {"train_loss": -6.049254894256592, "global_step": 74911, "epoch": 1783} {"train_loss": -6.190422058105469, "global_step": 74912, "epoch": 1783} {"train_loss": -6.141962051391602, "global_step": 74913, "epoch": 1783} {"train_loss": -6.167662620544434, "global_step": 74914, "epoch": 1783} {"train_loss": -6.091596603393555, "global_step": 74915, "epoch": 1783} {"train_loss": -6.204033851623535, "global_step": 74916, "epoch": 1783} {"train_loss": -5.968463897705078, "global_step": 74917, "epoch": 1783} {"train_loss": -6.0641326904296875, "global_step": 74918, "epoch": 1783} {"train_loss": -6.01137638092041, "global_step": 74919, "epoch": 1783} {"train_loss": -6.0046916007995605, "global_step": 74920, "epoch": 1783} {"train_loss": -5.9300689697265625, "global_step": 74921, "epoch": 1783} {"train_loss": -5.936570644378662, "global_step": 74922, "epoch": 1783} {"train_loss": -5.90706205368042, "global_step": 74923, "epoch": 1783} {"train_loss": -6.0459113121032715, "global_step": 74924, "epoch": 1783} {"train_loss": -5.943052291870117, "global_step": 74925, "epoch": 1783} {"train_loss": -6.041785717010498, "global_step": 74926, "epoch": 1783} {"train_loss": -6.054811568487258, "global_step": 74927, "epoch": 1783, "val_loss": 74958.5078125} {"train_loss": -5.942935943603516, "global_step": 74928, "epoch": 1784} {"train_loss": -6.079032897949219, "global_step": 74929, "epoch": 1784} {"train_loss": -6.051272392272949, "global_step": 74930, "epoch": 1784} {"train_loss": -6.115731239318848, "global_step": 74931, "epoch": 1784} {"train_loss": -5.965619087219238, "global_step": 74932, "epoch": 1784} {"train_loss": -6.015891075134277, "global_step": 74933, "epoch": 1784} {"train_loss": -6.0874786376953125, "global_step": 74934, "epoch": 1784} {"train_loss": -5.949267387390137, "global_step": 74935, "epoch": 1784} {"train_loss": -5.906923294067383, "global_step": 74936, "epoch": 1784} {"train_loss": -6.081942558288574, "global_step": 74937, "epoch": 1784} {"train_loss": -6.0059895515441895, "global_step": 74938, "epoch": 1784} {"train_loss": -6.015551567077637, "global_step": 74939, "epoch": 1784} {"train_loss": -5.838150978088379, "global_step": 74940, "epoch": 1784} {"train_loss": -5.8938398361206055, "global_step": 74941, "epoch": 1784} {"train_loss": -6.006422996520996, "global_step": 74942, "epoch": 1784} {"train_loss": -6.063372611999512, "global_step": 74943, "epoch": 1784} {"train_loss": -6.109912872314453, "global_step": 74944, "epoch": 1784} {"train_loss": -6.026120185852051, "global_step": 74945, "epoch": 1784} {"train_loss": -6.008553981781006, "global_step": 74946, "epoch": 1784} {"train_loss": -5.989302635192871, "global_step": 74947, "epoch": 1784} {"train_loss": -6.034575462341309, "global_step": 74948, "epoch": 1784} {"train_loss": -6.089542865753174, "global_step": 74949, "epoch": 1784} {"train_loss": -5.982529640197754, "global_step": 74950, "epoch": 1784} {"train_loss": -5.938602447509766, "global_step": 74951, "epoch": 1784} {"train_loss": -6.134357929229736, "global_step": 74952, "epoch": 1784} {"train_loss": -5.951290130615234, "global_step": 74953, "epoch": 1784} {"train_loss": -6.116314888000488, "global_step": 74954, "epoch": 1784} {"train_loss": -5.969244956970215, "global_step": 74955, "epoch": 1784} {"train_loss": -6.046499252319336, "global_step": 74956, "epoch": 1784} {"train_loss": -5.98000431060791, "global_step": 74957, "epoch": 1784} {"train_loss": -6.007864952087402, "global_step": 74958, "epoch": 1784} {"train_loss": -5.871400833129883, "global_step": 74959, "epoch": 1784} {"train_loss": -5.994930267333984, "global_step": 74960, "epoch": 1784} {"train_loss": -6.202824592590332, "global_step": 74961, "epoch": 1784} {"train_loss": -5.856870174407959, "global_step": 74962, "epoch": 1784} {"train_loss": -6.115675926208496, "global_step": 74963, "epoch": 1784} {"train_loss": -6.038565635681152, "global_step": 74964, "epoch": 1784} {"train_loss": -6.124771595001221, "global_step": 74965, "epoch": 1784} {"train_loss": -6.065548896789551, "global_step": 74966, "epoch": 1784} {"train_loss": -6.027083873748779, "global_step": 74967, "epoch": 1784} {"train_loss": -6.125091552734375, "global_step": 74968, "epoch": 1784} {"train_loss": -6.01659833817255, "global_step": 74969, "epoch": 1784, "val_loss": 74731.3125} {"train_loss": -6.120209693908691, "global_step": 74970, "epoch": 1785} {"train_loss": -6.067481994628906, "global_step": 74971, "epoch": 1785} {"train_loss": -6.197473526000977, "global_step": 74972, "epoch": 1785} {"train_loss": -6.012126445770264, "global_step": 74973, "epoch": 1785} {"train_loss": -5.970800399780273, "global_step": 74974, "epoch": 1785} {"train_loss": -6.102808952331543, "global_step": 74975, "epoch": 1785} {"train_loss": -6.035486221313477, "global_step": 74976, "epoch": 1785} {"train_loss": -5.958104133605957, "global_step": 74977, "epoch": 1785} {"train_loss": -6.0632781982421875, "global_step": 74978, "epoch": 1785} {"train_loss": -6.03598690032959, "global_step": 74979, "epoch": 1785} {"train_loss": -5.947990417480469, "global_step": 74980, "epoch": 1785} {"train_loss": -6.076732635498047, "global_step": 74981, "epoch": 1785} {"train_loss": -6.090651035308838, "global_step": 74982, "epoch": 1785} {"train_loss": -5.979837894439697, "global_step": 74983, "epoch": 1785} {"train_loss": -6.134177207946777, "global_step": 74984, "epoch": 1785} {"train_loss": -6.101152420043945, "global_step": 74985, "epoch": 1785} {"train_loss": -6.050114154815674, "global_step": 74986, "epoch": 1785} {"train_loss": -6.071928977966309, "global_step": 74987, "epoch": 1785} {"train_loss": -6.1472554206848145, "global_step": 74988, "epoch": 1785} {"train_loss": -6.1216583251953125, "global_step": 74989, "epoch": 1785} {"train_loss": -6.014224529266357, "global_step": 74990, "epoch": 1785} {"train_loss": -5.9877777099609375, "global_step": 74991, "epoch": 1785} {"train_loss": -5.93611478805542, "global_step": 74992, "epoch": 1785} {"train_loss": -6.0540547370910645, "global_step": 74993, "epoch": 1785} {"train_loss": -6.117501258850098, "global_step": 74994, "epoch": 1785} {"train_loss": -6.113283634185791, "global_step": 74995, "epoch": 1785} {"train_loss": -6.140712738037109, "global_step": 74996, "epoch": 1785} {"train_loss": -6.188406944274902, "global_step": 74997, "epoch": 1785} {"train_loss": -6.026005268096924, "global_step": 74998, "epoch": 1785} {"train_loss": -6.15972375869751, "global_step": 74999, "epoch": 1785} {"train_loss": -6.038672924041748, "global_step": 75000, "epoch": 1785} {"train_loss": -6.149645805358887, "global_step": 75001, "epoch": 1785} {"train_loss": -6.101921558380127, "global_step": 75002, "epoch": 1785} {"train_loss": -6.093073844909668, "global_step": 75003, "epoch": 1785} {"train_loss": -6.03947639465332, "global_step": 75004, "epoch": 1785} {"train_loss": -6.11910343170166, "global_step": 75005, "epoch": 1785} {"train_loss": -6.134720802307129, "global_step": 75006, "epoch": 1785} {"train_loss": -6.112757682800293, "global_step": 75007, "epoch": 1785} {"train_loss": -6.141334533691406, "global_step": 75008, "epoch": 1785} {"train_loss": -6.004061698913574, "global_step": 75009, "epoch": 1785} {"train_loss": -6.0735578536987305, "global_step": 75010, "epoch": 1785} {"train_loss": -6.075517972310384, "global_step": 75011, "epoch": 1785, "val_loss": 74871.625} {"train_loss": -6.169954299926758, "global_step": 75012, "epoch": 1786} {"train_loss": -6.112845420837402, "global_step": 75013, "epoch": 1786} {"train_loss": -6.205609321594238, "global_step": 75014, "epoch": 1786} {"train_loss": -5.9987897872924805, "global_step": 75015, "epoch": 1786} {"train_loss": -6.123575687408447, "global_step": 75016, "epoch": 1786} {"train_loss": -6.263520240783691, "global_step": 75017, "epoch": 1786} {"train_loss": -6.144474506378174, "global_step": 75018, "epoch": 1786} {"train_loss": -6.1428632736206055, "global_step": 75019, "epoch": 1786} {"train_loss": -6.03621244430542, "global_step": 75020, "epoch": 1786} {"train_loss": -5.966235160827637, "global_step": 75021, "epoch": 1786} {"train_loss": -6.179446220397949, "global_step": 75022, "epoch": 1786} {"train_loss": -6.0530290603637695, "global_step": 75023, "epoch": 1786} {"train_loss": -6.196185111999512, "global_step": 75024, "epoch": 1786} {"train_loss": -6.015639305114746, "global_step": 75025, "epoch": 1786} {"train_loss": -6.020328521728516, "global_step": 75026, "epoch": 1786} {"train_loss": -6.119842529296875, "global_step": 75027, "epoch": 1786} {"train_loss": -6.144391059875488, "global_step": 75028, "epoch": 1786} {"train_loss": -6.038273811340332, "global_step": 75029, "epoch": 1786} {"train_loss": -6.2073750495910645, "global_step": 75030, "epoch": 1786} {"train_loss": -6.044281005859375, "global_step": 75031, "epoch": 1786} {"train_loss": -6.116274833679199, "global_step": 75032, "epoch": 1786} {"train_loss": -6.0982208251953125, "global_step": 75033, "epoch": 1786} {"train_loss": -6.196396827697754, "global_step": 75034, "epoch": 1786} {"train_loss": -6.040256977081299, "global_step": 75035, "epoch": 1786} {"train_loss": -6.192716598510742, "global_step": 75036, "epoch": 1786} {"train_loss": -6.016989707946777, "global_step": 75037, "epoch": 1786} {"train_loss": -5.8943915367126465, "global_step": 75038, "epoch": 1786} {"train_loss": -6.099490642547607, "global_step": 75039, "epoch": 1786} {"train_loss": -6.11767578125, "global_step": 75040, "epoch": 1786} {"train_loss": -6.0231428146362305, "global_step": 75041, "epoch": 1786} {"train_loss": -6.035771369934082, "global_step": 75042, "epoch": 1786} {"train_loss": -6.038566589355469, "global_step": 75043, "epoch": 1786} {"train_loss": -5.986107349395752, "global_step": 75044, "epoch": 1786} {"train_loss": -6.181934356689453, "global_step": 75045, "epoch": 1786} {"train_loss": -6.069563388824463, "global_step": 75046, "epoch": 1786} {"train_loss": -6.031922340393066, "global_step": 75047, "epoch": 1786} {"train_loss": -6.024993896484375, "global_step": 75048, "epoch": 1786} {"train_loss": -5.914898872375488, "global_step": 75049, "epoch": 1786} {"train_loss": -6.058437824249268, "global_step": 75050, "epoch": 1786} {"train_loss": -5.996079444885254, "global_step": 75051, "epoch": 1786} {"train_loss": -5.920205116271973, "global_step": 75052, "epoch": 1786} {"train_loss": -6.079275630769276, "global_step": 75053, "epoch": 1786, "val_loss": 74964.828125} {"train_loss": -6.11724853515625, "global_step": 75054, "epoch": 1787} {"train_loss": -5.931975364685059, "global_step": 75055, "epoch": 1787} {"train_loss": -6.075926303863525, "global_step": 75056, "epoch": 1787} {"train_loss": -6.021109104156494, "global_step": 75057, "epoch": 1787} {"train_loss": -6.091249465942383, "global_step": 75058, "epoch": 1787} {"train_loss": -6.04866361618042, "global_step": 75059, "epoch": 1787} {"train_loss": -6.041141510009766, "global_step": 75060, "epoch": 1787} {"train_loss": -6.031754970550537, "global_step": 75061, "epoch": 1787} {"train_loss": -6.095931053161621, "global_step": 75062, "epoch": 1787} {"train_loss": -6.065579891204834, "global_step": 75063, "epoch": 1787} {"train_loss": -5.955343246459961, "global_step": 75064, "epoch": 1787} {"train_loss": -6.019354343414307, "global_step": 75065, "epoch": 1787} {"train_loss": -5.974437713623047, "global_step": 75066, "epoch": 1787} {"train_loss": -6.049444198608398, "global_step": 75067, "epoch": 1787} {"train_loss": -6.0605387687683105, "global_step": 75068, "epoch": 1787} {"train_loss": -6.033239364624023, "global_step": 75069, "epoch": 1787} {"train_loss": -6.1059489250183105, "global_step": 75070, "epoch": 1787} {"train_loss": -6.092771530151367, "global_step": 75071, "epoch": 1787} {"train_loss": -6.065974235534668, "global_step": 75072, "epoch": 1787} {"train_loss": -6.098282337188721, "global_step": 75073, "epoch": 1787} {"train_loss": -5.976250171661377, "global_step": 75074, "epoch": 1787} {"train_loss": -5.946500778198242, "global_step": 75075, "epoch": 1787} {"train_loss": -5.967459678649902, "global_step": 75076, "epoch": 1787} {"train_loss": -5.96350622177124, "global_step": 75077, "epoch": 1787} {"train_loss": -5.9983086585998535, "global_step": 75078, "epoch": 1787} {"train_loss": -6.082071781158447, "global_step": 75079, "epoch": 1787} {"train_loss": -6.103837966918945, "global_step": 75080, "epoch": 1787} {"train_loss": -6.085760116577148, "global_step": 75081, "epoch": 1787} {"train_loss": -6.014735221862793, "global_step": 75082, "epoch": 1787} {"train_loss": -6.0987443923950195, "global_step": 75083, "epoch": 1787} {"train_loss": -6.006101131439209, "global_step": 75084, "epoch": 1787} {"train_loss": -6.147735595703125, "global_step": 75085, "epoch": 1787} {"train_loss": -6.074525356292725, "global_step": 75086, "epoch": 1787} {"train_loss": -6.133262634277344, "global_step": 75087, "epoch": 1787} {"train_loss": -6.063542366027832, "global_step": 75088, "epoch": 1787} {"train_loss": -6.089389801025391, "global_step": 75089, "epoch": 1787} {"train_loss": -6.217477798461914, "global_step": 75090, "epoch": 1787} {"train_loss": -6.164547443389893, "global_step": 75091, "epoch": 1787} {"train_loss": -5.971286296844482, "global_step": 75092, "epoch": 1787} {"train_loss": -5.942282676696777, "global_step": 75093, "epoch": 1787} {"train_loss": -6.088677406311035, "global_step": 75094, "epoch": 1787} {"train_loss": -6.049455143156505, "global_step": 75095, "epoch": 1787, "val_loss": 74903.5390625} {"train_loss": -6.062121391296387, "global_step": 75096, "epoch": 1788} {"train_loss": -6.049370765686035, "global_step": 75097, "epoch": 1788} {"train_loss": -5.996500015258789, "global_step": 75098, "epoch": 1788} {"train_loss": -6.059460639953613, "global_step": 75099, "epoch": 1788} {"train_loss": -6.0761613845825195, "global_step": 75100, "epoch": 1788} {"train_loss": -6.0700764656066895, "global_step": 75101, "epoch": 1788} {"train_loss": -5.96710205078125, "global_step": 75102, "epoch": 1788} {"train_loss": -6.108338356018066, "global_step": 75103, "epoch": 1788} {"train_loss": -5.900205612182617, "global_step": 75104, "epoch": 1788} {"train_loss": -6.021450996398926, "global_step": 75105, "epoch": 1788} {"train_loss": -5.9862589836120605, "global_step": 75106, "epoch": 1788} {"train_loss": -6.099783897399902, "global_step": 75107, "epoch": 1788} {"train_loss": -5.996213436126709, "global_step": 75108, "epoch": 1788} {"train_loss": -6.036400318145752, "global_step": 75109, "epoch": 1788} {"train_loss": -6.054819107055664, "global_step": 75110, "epoch": 1788} {"train_loss": -6.061985969543457, "global_step": 75111, "epoch": 1788} {"train_loss": -6.065743923187256, "global_step": 75112, "epoch": 1788} {"train_loss": -6.0634846687316895, "global_step": 75113, "epoch": 1788} {"train_loss": -6.154173374176025, "global_step": 75114, "epoch": 1788} {"train_loss": -5.961968421936035, "global_step": 75115, "epoch": 1788} {"train_loss": -5.9864983558654785, "global_step": 75116, "epoch": 1788} {"train_loss": -6.12743616104126, "global_step": 75117, "epoch": 1788} {"train_loss": -5.941939353942871, "global_step": 75118, "epoch": 1788} {"train_loss": -6.110321998596191, "global_step": 75119, "epoch": 1788} {"train_loss": -6.071515083312988, "global_step": 75120, "epoch": 1788} {"train_loss": -6.0431647300720215, "global_step": 75121, "epoch": 1788} {"train_loss": -6.0751729011535645, "global_step": 75122, "epoch": 1788} {"train_loss": -6.007634162902832, "global_step": 75123, "epoch": 1788} {"train_loss": -6.258155822753906, "global_step": 75124, "epoch": 1788} {"train_loss": -6.197035789489746, "global_step": 75125, "epoch": 1788} {"train_loss": -6.155634880065918, "global_step": 75126, "epoch": 1788} {"train_loss": -6.014297962188721, "global_step": 75127, "epoch": 1788} {"train_loss": -6.119780540466309, "global_step": 75128, "epoch": 1788} {"train_loss": -6.052951335906982, "global_step": 75129, "epoch": 1788} {"train_loss": -6.085784435272217, "global_step": 75130, "epoch": 1788} {"train_loss": -6.079208850860596, "global_step": 75131, "epoch": 1788} {"train_loss": -5.974316120147705, "global_step": 75132, "epoch": 1788} {"train_loss": -5.9520463943481445, "global_step": 75133, "epoch": 1788} {"train_loss": -6.011205673217773, "global_step": 75134, "epoch": 1788} {"train_loss": -6.093895435333252, "global_step": 75135, "epoch": 1788} {"train_loss": -5.959001064300537, "global_step": 75136, "epoch": 1788} {"train_loss": -6.048988523937407, "global_step": 75137, "epoch": 1788, "val_loss": 74814.234375} {"train_loss": -5.86695671081543, "global_step": 75138, "epoch": 1789} {"train_loss": -6.118961334228516, "global_step": 75139, "epoch": 1789} {"train_loss": -5.942503929138184, "global_step": 75140, "epoch": 1789} {"train_loss": -6.068552017211914, "global_step": 75141, "epoch": 1789} {"train_loss": -5.907418727874756, "global_step": 75142, "epoch": 1789} {"train_loss": -5.887528419494629, "global_step": 75143, "epoch": 1789} {"train_loss": -6.041691780090332, "global_step": 75144, "epoch": 1789} {"train_loss": -5.9976301193237305, "global_step": 75145, "epoch": 1789} {"train_loss": -6.103572368621826, "global_step": 75146, "epoch": 1789} {"train_loss": -6.061709403991699, "global_step": 75147, "epoch": 1789} {"train_loss": -6.046287536621094, "global_step": 75148, "epoch": 1789} {"train_loss": -6.0632429122924805, "global_step": 75149, "epoch": 1789} {"train_loss": -5.829315662384033, "global_step": 75150, "epoch": 1789} {"train_loss": -6.05070686340332, "global_step": 75151, "epoch": 1789} {"train_loss": -6.045627593994141, "global_step": 75152, "epoch": 1789} {"train_loss": -5.9884185791015625, "global_step": 75153, "epoch": 1789} {"train_loss": -6.08884334564209, "global_step": 75154, "epoch": 1789} {"train_loss": -6.081326961517334, "global_step": 75155, "epoch": 1789} {"train_loss": -6.073948383331299, "global_step": 75156, "epoch": 1789} {"train_loss": -6.066173076629639, "global_step": 75157, "epoch": 1789} {"train_loss": -6.085952281951904, "global_step": 75158, "epoch": 1789} {"train_loss": -6.077445030212402, "global_step": 75159, "epoch": 1789} {"train_loss": -6.073912620544434, "global_step": 75160, "epoch": 1789} {"train_loss": -6.096127510070801, "global_step": 75161, "epoch": 1789} {"train_loss": -6.030223369598389, "global_step": 75162, "epoch": 1789} {"train_loss": -5.948707580566406, "global_step": 75163, "epoch": 1789} {"train_loss": -6.055600166320801, "global_step": 75164, "epoch": 1789} {"train_loss": -5.94243049621582, "global_step": 75165, "epoch": 1789} {"train_loss": -6.025522232055664, "global_step": 75166, "epoch": 1789} {"train_loss": -6.03429651260376, "global_step": 75167, "epoch": 1789} {"train_loss": -5.973359107971191, "global_step": 75168, "epoch": 1789} {"train_loss": -5.9086761474609375, "global_step": 75169, "epoch": 1789} {"train_loss": -6.140447616577148, "global_step": 75170, "epoch": 1789} {"train_loss": -5.937508583068848, "global_step": 75171, "epoch": 1789} {"train_loss": -6.034802436828613, "global_step": 75172, "epoch": 1789} {"train_loss": -5.920898914337158, "global_step": 75173, "epoch": 1789} {"train_loss": -6.106996536254883, "global_step": 75174, "epoch": 1789} {"train_loss": -5.9633002281188965, "global_step": 75175, "epoch": 1789} {"train_loss": -6.020646095275879, "global_step": 75176, "epoch": 1789} {"train_loss": -6.036338806152344, "global_step": 75177, "epoch": 1789} {"train_loss": -6.0291008949279785, "global_step": 75178, "epoch": 1789} {"train_loss": -6.020203760692051, "global_step": 75179, "epoch": 1789, "val_loss": 74972.859375} {"train_loss": -5.933322429656982, "global_step": 75180, "epoch": 1790} {"train_loss": -6.030747413635254, "global_step": 75181, "epoch": 1790} {"train_loss": -6.020157337188721, "global_step": 75182, "epoch": 1790} {"train_loss": -5.988559722900391, "global_step": 75183, "epoch": 1790} {"train_loss": -6.0600152015686035, "global_step": 75184, "epoch": 1790} {"train_loss": -6.061864852905273, "global_step": 75185, "epoch": 1790} {"train_loss": -5.954585075378418, "global_step": 75186, "epoch": 1790} {"train_loss": -6.102194786071777, "global_step": 75187, "epoch": 1790} {"train_loss": -6.072048664093018, "global_step": 75188, "epoch": 1790} {"train_loss": -6.100998878479004, "global_step": 75189, "epoch": 1790} {"train_loss": -6.116851806640625, "global_step": 75190, "epoch": 1790} {"train_loss": -6.146895408630371, "global_step": 75191, "epoch": 1790} {"train_loss": -6.138585090637207, "global_step": 75192, "epoch": 1790} {"train_loss": -5.918554306030273, "global_step": 75193, "epoch": 1790} {"train_loss": -5.938568115234375, "global_step": 75194, "epoch": 1790} {"train_loss": -6.071717739105225, "global_step": 75195, "epoch": 1790} {"train_loss": -6.022612571716309, "global_step": 75196, "epoch": 1790} {"train_loss": -6.071524620056152, "global_step": 75197, "epoch": 1790} {"train_loss": -6.0847320556640625, "global_step": 75198, "epoch": 1790} {"train_loss": -6.042446136474609, "global_step": 75199, "epoch": 1790} {"train_loss": -6.163265228271484, "global_step": 75200, "epoch": 1790} {"train_loss": -6.071507930755615, "global_step": 75201, "epoch": 1790} {"train_loss": -6.018575668334961, "global_step": 75202, "epoch": 1790} {"train_loss": -6.1271491050720215, "global_step": 75203, "epoch": 1790} {"train_loss": -6.18556547164917, "global_step": 75204, "epoch": 1790} {"train_loss": -6.162080764770508, "global_step": 75205, "epoch": 1790} {"train_loss": -5.986310005187988, "global_step": 75206, "epoch": 1790} {"train_loss": -5.978455543518066, "global_step": 75207, "epoch": 1790} {"train_loss": -6.147302627563477, "global_step": 75208, "epoch": 1790} {"train_loss": -6.189486980438232, "global_step": 75209, "epoch": 1790} {"train_loss": -6.164346694946289, "global_step": 75210, "epoch": 1790} {"train_loss": -5.9557952880859375, "global_step": 75211, "epoch": 1790} {"train_loss": -6.152597427368164, "global_step": 75212, "epoch": 1790} {"train_loss": -6.032848834991455, "global_step": 75213, "epoch": 1790} {"train_loss": -6.19551944732666, "global_step": 75214, "epoch": 1790} {"train_loss": -6.094799041748047, "global_step": 75215, "epoch": 1790} {"train_loss": -6.189361095428467, "global_step": 75216, "epoch": 1790} {"train_loss": -6.136658668518066, "global_step": 75217, "epoch": 1790} {"train_loss": -6.091436386108398, "global_step": 75218, "epoch": 1790} {"train_loss": -6.1226806640625, "global_step": 75219, "epoch": 1790} {"train_loss": -6.104434967041016, "global_step": 75220, "epoch": 1790} {"train_loss": -6.079966499691918, "global_step": 75221, "epoch": 1790, "val_loss": 74816.328125} {"train_loss": -6.138547897338867, "global_step": 75222, "epoch": 1791} {"train_loss": -6.073657989501953, "global_step": 75223, "epoch": 1791} {"train_loss": -6.17664909362793, "global_step": 75224, "epoch": 1791} {"train_loss": -5.986234664916992, "global_step": 75225, "epoch": 1791} {"train_loss": -6.088740348815918, "global_step": 75226, "epoch": 1791} {"train_loss": -6.218341827392578, "global_step": 75227, "epoch": 1791} {"train_loss": -6.135818004608154, "global_step": 75228, "epoch": 1791} {"train_loss": -6.05487060546875, "global_step": 75229, "epoch": 1791} {"train_loss": -6.085826873779297, "global_step": 75230, "epoch": 1791} {"train_loss": -6.076378345489502, "global_step": 75231, "epoch": 1791} {"train_loss": -6.098044395446777, "global_step": 75232, "epoch": 1791} {"train_loss": -6.202023983001709, "global_step": 75233, "epoch": 1791} {"train_loss": -6.221558094024658, "global_step": 75234, "epoch": 1791} {"train_loss": -6.088659286499023, "global_step": 75235, "epoch": 1791} {"train_loss": -6.1982526779174805, "global_step": 75236, "epoch": 1791} {"train_loss": -6.032321453094482, "global_step": 75237, "epoch": 1791} {"train_loss": -6.103215217590332, "global_step": 75238, "epoch": 1791} {"train_loss": -6.037761688232422, "global_step": 75239, "epoch": 1791} {"train_loss": -6.070138931274414, "global_step": 75240, "epoch": 1791} {"train_loss": -6.055147171020508, "global_step": 75241, "epoch": 1791} {"train_loss": -6.2029218673706055, "global_step": 75242, "epoch": 1791} {"train_loss": -6.08277702331543, "global_step": 75243, "epoch": 1791} {"train_loss": -6.07442569732666, "global_step": 75244, "epoch": 1791} {"train_loss": -6.149178504943848, "global_step": 75245, "epoch": 1791} {"train_loss": -6.132806777954102, "global_step": 75246, "epoch": 1791} {"train_loss": -6.037442207336426, "global_step": 75247, "epoch": 1791} {"train_loss": -6.09393310546875, "global_step": 75248, "epoch": 1791} {"train_loss": -6.087594509124756, "global_step": 75249, "epoch": 1791} {"train_loss": -6.104318141937256, "global_step": 75250, "epoch": 1791} {"train_loss": -5.991048812866211, "global_step": 75251, "epoch": 1791} {"train_loss": -6.071597576141357, "global_step": 75252, "epoch": 1791} {"train_loss": -6.091670513153076, "global_step": 75253, "epoch": 1791} {"train_loss": -6.110579490661621, "global_step": 75254, "epoch": 1791} {"train_loss": -6.107773780822754, "global_step": 75255, "epoch": 1791} {"train_loss": -6.111239433288574, "global_step": 75256, "epoch": 1791} {"train_loss": -6.069102764129639, "global_step": 75257, "epoch": 1791} {"train_loss": -6.021799087524414, "global_step": 75258, "epoch": 1791} {"train_loss": -6.110817909240723, "global_step": 75259, "epoch": 1791} {"train_loss": -6.044266700744629, "global_step": 75260, "epoch": 1791} {"train_loss": -6.088953018188477, "global_step": 75261, "epoch": 1791} {"train_loss": -5.982204437255859, "global_step": 75262, "epoch": 1791} {"train_loss": -6.097219932646978, "global_step": 75263, "epoch": 1791, "val_loss": 74647.2890625} {"train_loss": -6.123195648193359, "global_step": 75264, "epoch": 1792} {"train_loss": -6.047785758972168, "global_step": 75265, "epoch": 1792} {"train_loss": -6.121186256408691, "global_step": 75266, "epoch": 1792} {"train_loss": -6.176674842834473, "global_step": 75267, "epoch": 1792} {"train_loss": -6.0899739265441895, "global_step": 75268, "epoch": 1792} {"train_loss": -6.031624794006348, "global_step": 75269, "epoch": 1792} {"train_loss": -6.073387145996094, "global_step": 75270, "epoch": 1792} {"train_loss": -6.032541275024414, "global_step": 75271, "epoch": 1792} {"train_loss": -6.148712158203125, "global_step": 75272, "epoch": 1792} {"train_loss": -5.917384624481201, "global_step": 75273, "epoch": 1792} {"train_loss": -6.194296360015869, "global_step": 75274, "epoch": 1792} {"train_loss": -5.898375511169434, "global_step": 75275, "epoch": 1792} {"train_loss": -5.912170886993408, "global_step": 75276, "epoch": 1792} {"train_loss": -5.915573596954346, "global_step": 75277, "epoch": 1792} {"train_loss": -6.0125555992126465, "global_step": 75278, "epoch": 1792} {"train_loss": -6.010028839111328, "global_step": 75279, "epoch": 1792} {"train_loss": -6.150236129760742, "global_step": 75280, "epoch": 1792} {"train_loss": -6.119597434997559, "global_step": 75281, "epoch": 1792} {"train_loss": -5.946634292602539, "global_step": 75282, "epoch": 1792} {"train_loss": -6.049411773681641, "global_step": 75283, "epoch": 1792} {"train_loss": -6.196444511413574, "global_step": 75284, "epoch": 1792} {"train_loss": -5.997436046600342, "global_step": 75285, "epoch": 1792} {"train_loss": -6.007855415344238, "global_step": 75286, "epoch": 1792} {"train_loss": -6.0645036697387695, "global_step": 75287, "epoch": 1792} {"train_loss": -6.006068706512451, "global_step": 75288, "epoch": 1792} {"train_loss": -6.079557418823242, "global_step": 75289, "epoch": 1792} {"train_loss": -6.062143325805664, "global_step": 75290, "epoch": 1792} {"train_loss": -6.049267768859863, "global_step": 75291, "epoch": 1792} {"train_loss": -6.139997482299805, "global_step": 75292, "epoch": 1792} {"train_loss": -6.095658779144287, "global_step": 75293, "epoch": 1792} {"train_loss": -6.058346271514893, "global_step": 75294, "epoch": 1792} {"train_loss": -6.03702449798584, "global_step": 75295, "epoch": 1792} {"train_loss": -6.146819591522217, "global_step": 75296, "epoch": 1792} {"train_loss": -6.009112358093262, "global_step": 75297, "epoch": 1792} {"train_loss": -6.0027618408203125, "global_step": 75298, "epoch": 1792} {"train_loss": -6.143684387207031, "global_step": 75299, "epoch": 1792} {"train_loss": -6.075070381164551, "global_step": 75300, "epoch": 1792} {"train_loss": -6.020665168762207, "global_step": 75301, "epoch": 1792} {"train_loss": -6.047728538513184, "global_step": 75302, "epoch": 1792} {"train_loss": -6.097909927368164, "global_step": 75303, "epoch": 1792} {"train_loss": -6.106508255004883, "global_step": 75304, "epoch": 1792} {"train_loss": -6.058947313399542, "global_step": 75305, "epoch": 1792, "val_loss": 75025.9453125} {"train_loss": -6.085660934448242, "global_step": 75306, "epoch": 1793} {"train_loss": -6.148509979248047, "global_step": 75307, "epoch": 1793} {"train_loss": -5.982738494873047, "global_step": 75308, "epoch": 1793} {"train_loss": -6.093006610870361, "global_step": 75309, "epoch": 1793} {"train_loss": -6.0394978523254395, "global_step": 75310, "epoch": 1793} {"train_loss": -6.168737888336182, "global_step": 75311, "epoch": 1793} {"train_loss": -6.0904645919799805, "global_step": 75312, "epoch": 1793} {"train_loss": -6.048730373382568, "global_step": 75313, "epoch": 1793} {"train_loss": -6.037991523742676, "global_step": 75314, "epoch": 1793} {"train_loss": -6.044877052307129, "global_step": 75315, "epoch": 1793} {"train_loss": -6.065028190612793, "global_step": 75316, "epoch": 1793} {"train_loss": -6.09457540512085, "global_step": 75317, "epoch": 1793} {"train_loss": -6.151823997497559, "global_step": 75318, "epoch": 1793} {"train_loss": -5.9881911277771, "global_step": 75319, "epoch": 1793} {"train_loss": -6.044833183288574, "global_step": 75320, "epoch": 1793} {"train_loss": -6.056797027587891, "global_step": 75321, "epoch": 1793} {"train_loss": -5.970395565032959, "global_step": 75322, "epoch": 1793} {"train_loss": -6.097933769226074, "global_step": 75323, "epoch": 1793} {"train_loss": -6.094901084899902, "global_step": 75324, "epoch": 1793} {"train_loss": -6.006922721862793, "global_step": 75325, "epoch": 1793} {"train_loss": -6.006182670593262, "global_step": 75326, "epoch": 1793} {"train_loss": -6.129429817199707, "global_step": 75327, "epoch": 1793} {"train_loss": -5.934652328491211, "global_step": 75328, "epoch": 1793} {"train_loss": -6.092922210693359, "global_step": 75329, "epoch": 1793} {"train_loss": -6.014292240142822, "global_step": 75330, "epoch": 1793} {"train_loss": -6.133718013763428, "global_step": 75331, "epoch": 1793} {"train_loss": -6.079710960388184, "global_step": 75332, "epoch": 1793} {"train_loss": -6.024658203125, "global_step": 75333, "epoch": 1793} {"train_loss": -6.167292594909668, "global_step": 75334, "epoch": 1793} {"train_loss": -6.11342716217041, "global_step": 75335, "epoch": 1793} {"train_loss": -6.11407995223999, "global_step": 75336, "epoch": 1793} {"train_loss": -6.041720390319824, "global_step": 75337, "epoch": 1793} {"train_loss": -6.149227619171143, "global_step": 75338, "epoch": 1793} {"train_loss": -6.072812557220459, "global_step": 75339, "epoch": 1793} {"train_loss": -6.102341651916504, "global_step": 75340, "epoch": 1793} {"train_loss": -6.0811614990234375, "global_step": 75341, "epoch": 1793} {"train_loss": -6.159797191619873, "global_step": 75342, "epoch": 1793} {"train_loss": -5.966342449188232, "global_step": 75343, "epoch": 1793} {"train_loss": -6.11762809753418, "global_step": 75344, "epoch": 1793} {"train_loss": -6.2111310958862305, "global_step": 75345, "epoch": 1793} {"train_loss": -5.94125509262085, "global_step": 75346, "epoch": 1793} {"train_loss": -6.074062131700062, "global_step": 75347, "epoch": 1793, "val_loss": 75095.3125} {"train_loss": -6.03492546081543, "global_step": 75348, "epoch": 1794} {"train_loss": -6.00489616394043, "global_step": 75349, "epoch": 1794} {"train_loss": -6.126189708709717, "global_step": 75350, "epoch": 1794} {"train_loss": -6.040815830230713, "global_step": 75351, "epoch": 1794} {"train_loss": -6.19670295715332, "global_step": 75352, "epoch": 1794} {"train_loss": -6.174002170562744, "global_step": 75353, "epoch": 1794} {"train_loss": -6.158257007598877, "global_step": 75354, "epoch": 1794} {"train_loss": -6.112020492553711, "global_step": 75355, "epoch": 1794} {"train_loss": -6.076346397399902, "global_step": 75356, "epoch": 1794} {"train_loss": -6.146397590637207, "global_step": 75357, "epoch": 1794} {"train_loss": -6.111269950866699, "global_step": 75358, "epoch": 1794} {"train_loss": -6.096489906311035, "global_step": 75359, "epoch": 1794} {"train_loss": -6.090033531188965, "global_step": 75360, "epoch": 1794} {"train_loss": -6.053322792053223, "global_step": 75361, "epoch": 1794} {"train_loss": -6.025633335113525, "global_step": 75362, "epoch": 1794} {"train_loss": -6.071348190307617, "global_step": 75363, "epoch": 1794} {"train_loss": -6.101729393005371, "global_step": 75364, "epoch": 1794} {"train_loss": -6.0836968421936035, "global_step": 75365, "epoch": 1794} {"train_loss": -6.1405029296875, "global_step": 75366, "epoch": 1794} {"train_loss": -6.100719451904297, "global_step": 75367, "epoch": 1794} {"train_loss": -6.183515548706055, "global_step": 75368, "epoch": 1794} {"train_loss": -5.946852684020996, "global_step": 75369, "epoch": 1794} {"train_loss": -6.09244441986084, "global_step": 75370, "epoch": 1794} {"train_loss": -6.0571699142456055, "global_step": 75371, "epoch": 1794} {"train_loss": -6.141819477081299, "global_step": 75372, "epoch": 1794} {"train_loss": -6.080541610717773, "global_step": 75373, "epoch": 1794} {"train_loss": -6.079366683959961, "global_step": 75374, "epoch": 1794} {"train_loss": -6.097352981567383, "global_step": 75375, "epoch": 1794} {"train_loss": -6.02524995803833, "global_step": 75376, "epoch": 1794} {"train_loss": -6.103673458099365, "global_step": 75377, "epoch": 1794} {"train_loss": -6.146576881408691, "global_step": 75378, "epoch": 1794} {"train_loss": -6.066113471984863, "global_step": 75379, "epoch": 1794} {"train_loss": -6.097302436828613, "global_step": 75380, "epoch": 1794} {"train_loss": -6.068355560302734, "global_step": 75381, "epoch": 1794} {"train_loss": -6.099429130554199, "global_step": 75382, "epoch": 1794} {"train_loss": -6.151430130004883, "global_step": 75383, "epoch": 1794} {"train_loss": -6.135245323181152, "global_step": 75384, "epoch": 1794} {"train_loss": -6.057833671569824, "global_step": 75385, "epoch": 1794} {"train_loss": -6.091433525085449, "global_step": 75386, "epoch": 1794} {"train_loss": -6.064596176147461, "global_step": 75387, "epoch": 1794} {"train_loss": -5.994600296020508, "global_step": 75388, "epoch": 1794} {"train_loss": -6.091350623539516, "global_step": 75389, "epoch": 1794, "val_loss": 74873.625} {"train_loss": -6.090358257293701, "global_step": 75390, "epoch": 1795} {"train_loss": -6.061778545379639, "global_step": 75391, "epoch": 1795} {"train_loss": -6.015836715698242, "global_step": 75392, "epoch": 1795} {"train_loss": -6.131495475769043, "global_step": 75393, "epoch": 1795} {"train_loss": -6.069789409637451, "global_step": 75394, "epoch": 1795} {"train_loss": -6.0186686515808105, "global_step": 75395, "epoch": 1795} {"train_loss": -6.101372241973877, "global_step": 75396, "epoch": 1795} {"train_loss": -6.142697811126709, "global_step": 75397, "epoch": 1795} {"train_loss": -6.097912788391113, "global_step": 75398, "epoch": 1795} {"train_loss": -6.105244159698486, "global_step": 75399, "epoch": 1795} {"train_loss": -6.082607269287109, "global_step": 75400, "epoch": 1795} {"train_loss": -6.04959774017334, "global_step": 75401, "epoch": 1795} {"train_loss": -6.22251558303833, "global_step": 75402, "epoch": 1795} {"train_loss": -6.111043930053711, "global_step": 75403, "epoch": 1795} {"train_loss": -6.134629249572754, "global_step": 75404, "epoch": 1795} {"train_loss": -6.077800750732422, "global_step": 75405, "epoch": 1795} {"train_loss": -6.15730094909668, "global_step": 75406, "epoch": 1795} {"train_loss": -6.062786102294922, "global_step": 75407, "epoch": 1795} {"train_loss": -6.112077713012695, "global_step": 75408, "epoch": 1795} {"train_loss": -5.986297607421875, "global_step": 75409, "epoch": 1795} {"train_loss": -6.1940107345581055, "global_step": 75410, "epoch": 1795} {"train_loss": -6.112224578857422, "global_step": 75411, "epoch": 1795} {"train_loss": -6.094160079956055, "global_step": 75412, "epoch": 1795} {"train_loss": -6.246348857879639, "global_step": 75413, "epoch": 1795} {"train_loss": -5.9716291427612305, "global_step": 75414, "epoch": 1795} {"train_loss": -6.036598205566406, "global_step": 75415, "epoch": 1795} {"train_loss": -6.020956993103027, "global_step": 75416, "epoch": 1795} {"train_loss": -6.105721950531006, "global_step": 75417, "epoch": 1795} {"train_loss": -6.073859214782715, "global_step": 75418, "epoch": 1795} {"train_loss": -6.08203649520874, "global_step": 75419, "epoch": 1795} {"train_loss": -6.126089572906494, "global_step": 75420, "epoch": 1795} {"train_loss": -6.259263038635254, "global_step": 75421, "epoch": 1795} {"train_loss": -6.1085052490234375, "global_step": 75422, "epoch": 1795} {"train_loss": -6.054512023925781, "global_step": 75423, "epoch": 1795} {"train_loss": -6.216209411621094, "global_step": 75424, "epoch": 1795} {"train_loss": -6.156881809234619, "global_step": 75425, "epoch": 1795} {"train_loss": -6.0531721115112305, "global_step": 75426, "epoch": 1795} {"train_loss": -6.09804630279541, "global_step": 75427, "epoch": 1795} {"train_loss": -6.101640701293945, "global_step": 75428, "epoch": 1795} {"train_loss": -6.151230812072754, "global_step": 75429, "epoch": 1795} {"train_loss": -6.14518404006958, "global_step": 75430, "epoch": 1795} {"train_loss": -6.104235410690308, "global_step": 75431, "epoch": 1795, "val_loss": 74965.171875} {"train_loss": -6.035947799682617, "global_step": 75432, "epoch": 1796} {"train_loss": -6.155375957489014, "global_step": 75433, "epoch": 1796} {"train_loss": -6.1268463134765625, "global_step": 75434, "epoch": 1796} {"train_loss": -6.026642799377441, "global_step": 75435, "epoch": 1796} {"train_loss": -6.1056928634643555, "global_step": 75436, "epoch": 1796} {"train_loss": -6.144284725189209, "global_step": 75437, "epoch": 1796} {"train_loss": -6.038799285888672, "global_step": 75438, "epoch": 1796} {"train_loss": -6.025934219360352, "global_step": 75439, "epoch": 1796} {"train_loss": -6.035494327545166, "global_step": 75440, "epoch": 1796} {"train_loss": -6.095147132873535, "global_step": 75441, "epoch": 1796} {"train_loss": -5.975022315979004, "global_step": 75442, "epoch": 1796} {"train_loss": -6.1279706954956055, "global_step": 75443, "epoch": 1796} {"train_loss": -6.032668113708496, "global_step": 75444, "epoch": 1796} {"train_loss": -6.152778625488281, "global_step": 75445, "epoch": 1796} {"train_loss": -6.143497943878174, "global_step": 75446, "epoch": 1796} {"train_loss": -5.997683525085449, "global_step": 75447, "epoch": 1796} {"train_loss": -6.091827392578125, "global_step": 75448, "epoch": 1796} {"train_loss": -6.149080276489258, "global_step": 75449, "epoch": 1796} {"train_loss": -6.035434722900391, "global_step": 75450, "epoch": 1796} {"train_loss": -6.193100929260254, "global_step": 75451, "epoch": 1796} {"train_loss": -6.172912120819092, "global_step": 75452, "epoch": 1796} {"train_loss": -6.189390182495117, "global_step": 75453, "epoch": 1796} {"train_loss": -6.080193042755127, "global_step": 75454, "epoch": 1796} {"train_loss": -6.1869330406188965, "global_step": 75455, "epoch": 1796} {"train_loss": -6.065784931182861, "global_step": 75456, "epoch": 1796} {"train_loss": -6.136061668395996, "global_step": 75457, "epoch": 1796} {"train_loss": -6.075098037719727, "global_step": 75458, "epoch": 1796} {"train_loss": -6.176031589508057, "global_step": 75459, "epoch": 1796} {"train_loss": -6.0062785148620605, "global_step": 75460, "epoch": 1796} {"train_loss": -6.068415641784668, "global_step": 75461, "epoch": 1796} {"train_loss": -6.059023857116699, "global_step": 75462, "epoch": 1796} {"train_loss": -6.029152870178223, "global_step": 75463, "epoch": 1796} {"train_loss": -6.11253547668457, "global_step": 75464, "epoch": 1796} {"train_loss": -6.092349052429199, "global_step": 75465, "epoch": 1796} {"train_loss": -5.951772212982178, "global_step": 75466, "epoch": 1796} {"train_loss": -5.982478618621826, "global_step": 75467, "epoch": 1796} {"train_loss": -6.095372200012207, "global_step": 75468, "epoch": 1796} {"train_loss": -6.047449111938477, "global_step": 75469, "epoch": 1796} {"train_loss": -6.041380882263184, "global_step": 75470, "epoch": 1796} {"train_loss": -6.035499572753906, "global_step": 75471, "epoch": 1796} {"train_loss": -6.125455379486084, "global_step": 75472, "epoch": 1796} {"train_loss": -6.0834401335035055, "global_step": 75473, "epoch": 1796, "val_loss": 75080.359375} {"train_loss": -6.099188804626465, "global_step": 75474, "epoch": 1797} {"train_loss": -6.0480194091796875, "global_step": 75475, "epoch": 1797} {"train_loss": -5.9850172996521, "global_step": 75476, "epoch": 1797} {"train_loss": -6.07380485534668, "global_step": 75477, "epoch": 1797} {"train_loss": -6.0735297203063965, "global_step": 75478, "epoch": 1797} {"train_loss": -6.018481731414795, "global_step": 75479, "epoch": 1797} {"train_loss": -6.077528953552246, "global_step": 75480, "epoch": 1797} {"train_loss": -5.979966163635254, "global_step": 75481, "epoch": 1797} {"train_loss": -6.109657287597656, "global_step": 75482, "epoch": 1797} {"train_loss": -5.985664367675781, "global_step": 75483, "epoch": 1797} {"train_loss": -6.038851261138916, "global_step": 75484, "epoch": 1797} {"train_loss": -6.035757064819336, "global_step": 75485, "epoch": 1797} {"train_loss": -5.992230415344238, "global_step": 75486, "epoch": 1797} {"train_loss": -6.119872570037842, "global_step": 75487, "epoch": 1797} {"train_loss": -6.115354537963867, "global_step": 75488, "epoch": 1797} {"train_loss": -6.079089164733887, "global_step": 75489, "epoch": 1797} {"train_loss": -5.992763042449951, "global_step": 75490, "epoch": 1797} {"train_loss": -6.067354679107666, "global_step": 75491, "epoch": 1797} {"train_loss": -6.103361129760742, "global_step": 75492, "epoch": 1797} {"train_loss": -5.981778621673584, "global_step": 75493, "epoch": 1797} {"train_loss": -6.199946880340576, "global_step": 75494, "epoch": 1797} {"train_loss": -6.087341785430908, "global_step": 75495, "epoch": 1797} {"train_loss": -6.053802967071533, "global_step": 75496, "epoch": 1797} {"train_loss": -6.110537528991699, "global_step": 75497, "epoch": 1797} {"train_loss": -6.106298446655273, "global_step": 75498, "epoch": 1797} {"train_loss": -6.189200401306152, "global_step": 75499, "epoch": 1797} {"train_loss": -6.054460525512695, "global_step": 75500, "epoch": 1797} {"train_loss": -6.062396049499512, "global_step": 75501, "epoch": 1797} {"train_loss": -6.092779636383057, "global_step": 75502, "epoch": 1797} {"train_loss": -6.144253253936768, "global_step": 75503, "epoch": 1797} {"train_loss": -6.015603542327881, "global_step": 75504, "epoch": 1797} {"train_loss": -6.078447341918945, "global_step": 75505, "epoch": 1797} {"train_loss": -6.03593635559082, "global_step": 75506, "epoch": 1797} {"train_loss": -6.163051605224609, "global_step": 75507, "epoch": 1797} {"train_loss": -6.076347351074219, "global_step": 75508, "epoch": 1797} {"train_loss": -6.181946754455566, "global_step": 75509, "epoch": 1797} {"train_loss": -6.037957191467285, "global_step": 75510, "epoch": 1797} {"train_loss": -6.18898868560791, "global_step": 75511, "epoch": 1797} {"train_loss": -5.946660041809082, "global_step": 75512, "epoch": 1797} {"train_loss": -5.982593536376953, "global_step": 75513, "epoch": 1797} {"train_loss": -6.032156944274902, "global_step": 75514, "epoch": 1797} {"train_loss": -6.071849834351313, "global_step": 75515, "epoch": 1797, "val_loss": 74850.9453125} {"train_loss": -6.153207778930664, "global_step": 75516, "epoch": 1798} {"train_loss": -6.132390975952148, "global_step": 75517, "epoch": 1798} {"train_loss": -6.160180568695068, "global_step": 75518, "epoch": 1798} {"train_loss": -6.100582122802734, "global_step": 75519, "epoch": 1798} {"train_loss": -6.043704986572266, "global_step": 75520, "epoch": 1798} {"train_loss": -6.006431579589844, "global_step": 75521, "epoch": 1798} {"train_loss": -6.075397968292236, "global_step": 75522, "epoch": 1798} {"train_loss": -6.024038791656494, "global_step": 75523, "epoch": 1798} {"train_loss": -6.017239570617676, "global_step": 75524, "epoch": 1798} {"train_loss": -5.807857990264893, "global_step": 75525, "epoch": 1798} {"train_loss": -6.1046037673950195, "global_step": 75526, "epoch": 1798} {"train_loss": -5.922125816345215, "global_step": 75527, "epoch": 1798} {"train_loss": -5.945450305938721, "global_step": 75528, "epoch": 1798} {"train_loss": -6.134910583496094, "global_step": 75529, "epoch": 1798} {"train_loss": -6.010509967803955, "global_step": 75530, "epoch": 1798} {"train_loss": -5.960472106933594, "global_step": 75531, "epoch": 1798} {"train_loss": -6.018226146697998, "global_step": 75532, "epoch": 1798} {"train_loss": -5.94766902923584, "global_step": 75533, "epoch": 1798} {"train_loss": -5.921314239501953, "global_step": 75534, "epoch": 1798} {"train_loss": -6.074778079986572, "global_step": 75535, "epoch": 1798} {"train_loss": -6.004452228546143, "global_step": 75536, "epoch": 1798} {"train_loss": -5.968235492706299, "global_step": 75537, "epoch": 1798} {"train_loss": -6.135736465454102, "global_step": 75538, "epoch": 1798} {"train_loss": -5.939976215362549, "global_step": 75539, "epoch": 1798} {"train_loss": -6.191690444946289, "global_step": 75540, "epoch": 1798} {"train_loss": -6.0711140632629395, "global_step": 75541, "epoch": 1798} {"train_loss": -5.93448543548584, "global_step": 75542, "epoch": 1798} {"train_loss": -6.167726516723633, "global_step": 75543, "epoch": 1798} {"train_loss": -6.079732894897461, "global_step": 75544, "epoch": 1798} {"train_loss": -5.991593360900879, "global_step": 75545, "epoch": 1798} {"train_loss": -6.071538925170898, "global_step": 75546, "epoch": 1798} {"train_loss": -5.945159912109375, "global_step": 75547, "epoch": 1798} {"train_loss": -6.138365745544434, "global_step": 75548, "epoch": 1798} {"train_loss": -6.023449897766113, "global_step": 75549, "epoch": 1798} {"train_loss": -6.11091423034668, "global_step": 75550, "epoch": 1798} {"train_loss": -6.035737991333008, "global_step": 75551, "epoch": 1798} {"train_loss": -6.058904647827148, "global_step": 75552, "epoch": 1798} {"train_loss": -6.000339508056641, "global_step": 75553, "epoch": 1798} {"train_loss": -6.042733192443848, "global_step": 75554, "epoch": 1798} {"train_loss": -5.995831489562988, "global_step": 75555, "epoch": 1798} {"train_loss": -6.126458644866943, "global_step": 75556, "epoch": 1798} {"train_loss": -6.0428498813084195, "global_step": 75557, "epoch": 1798, "val_loss": 75242.0625} {"train_loss": -6.001501560211182, "global_step": 75558, "epoch": 1799} {"train_loss": -6.1624908447265625, "global_step": 75559, "epoch": 1799} {"train_loss": -6.114773273468018, "global_step": 75560, "epoch": 1799} {"train_loss": -6.100589752197266, "global_step": 75561, "epoch": 1799} {"train_loss": -6.270016193389893, "global_step": 75562, "epoch": 1799} {"train_loss": -6.117639064788818, "global_step": 75563, "epoch": 1799} {"train_loss": -6.109076499938965, "global_step": 75564, "epoch": 1799} {"train_loss": -6.1754374504089355, "global_step": 75565, "epoch": 1799} {"train_loss": -6.127922534942627, "global_step": 75566, "epoch": 1799} {"train_loss": -6.1421356201171875, "global_step": 75567, "epoch": 1799} {"train_loss": -5.950107574462891, "global_step": 75568, "epoch": 1799} {"train_loss": -6.104825973510742, "global_step": 75569, "epoch": 1799} {"train_loss": -6.075220584869385, "global_step": 75570, "epoch": 1799} {"train_loss": -6.044313907623291, "global_step": 75571, "epoch": 1799} {"train_loss": -6.081058979034424, "global_step": 75572, "epoch": 1799} {"train_loss": -6.013616561889648, "global_step": 75573, "epoch": 1799} {"train_loss": -6.090391635894775, "global_step": 75574, "epoch": 1799} {"train_loss": -6.058348178863525, "global_step": 75575, "epoch": 1799} {"train_loss": -6.055006980895996, "global_step": 75576, "epoch": 1799} {"train_loss": -6.063871383666992, "global_step": 75577, "epoch": 1799} {"train_loss": -5.996706485748291, "global_step": 75578, "epoch": 1799} {"train_loss": -6.09666109085083, "global_step": 75579, "epoch": 1799} {"train_loss": -5.954307556152344, "global_step": 75580, "epoch": 1799} {"train_loss": -6.058193206787109, "global_step": 75581, "epoch": 1799} {"train_loss": -5.941976547241211, "global_step": 75582, "epoch": 1799} {"train_loss": -6.010707855224609, "global_step": 75583, "epoch": 1799} {"train_loss": -6.019651412963867, "global_step": 75584, "epoch": 1799} {"train_loss": -6.089469909667969, "global_step": 75585, "epoch": 1799} {"train_loss": -6.013124942779541, "global_step": 75586, "epoch": 1799} {"train_loss": -6.183699607849121, "global_step": 75587, "epoch": 1799} {"train_loss": -6.08467960357666, "global_step": 75588, "epoch": 1799} {"train_loss": -5.909937858581543, "global_step": 75589, "epoch": 1799} {"train_loss": -6.049592971801758, "global_step": 75590, "epoch": 1799} {"train_loss": -6.04502010345459, "global_step": 75591, "epoch": 1799} {"train_loss": -5.985706329345703, "global_step": 75592, "epoch": 1799} {"train_loss": -6.17603874206543, "global_step": 75593, "epoch": 1799} {"train_loss": -6.170348167419434, "global_step": 75594, "epoch": 1799} {"train_loss": -6.046733856201172, "global_step": 75595, "epoch": 1799} {"train_loss": -6.046124458312988, "global_step": 75596, "epoch": 1799} {"train_loss": -6.0509233474731445, "global_step": 75597, "epoch": 1799} {"train_loss": -6.1776556968688965, "global_step": 75598, "epoch": 1799} {"train_loss": -6.0726438249860495, "global_step": 75599, "epoch": 1799, "val_loss": 74700.6953125} {"train_loss": -6.21858549118042, "global_step": 75600, "epoch": 1800} {"train_loss": -6.12175178527832, "global_step": 75601, "epoch": 1800} {"train_loss": -6.088179588317871, "global_step": 75602, "epoch": 1800} {"train_loss": -6.103575706481934, "global_step": 75603, "epoch": 1800} {"train_loss": -6.06828498840332, "global_step": 75604, "epoch": 1800} {"train_loss": -5.982353210449219, "global_step": 75605, "epoch": 1800} {"train_loss": -5.986748695373535, "global_step": 75606, "epoch": 1800} {"train_loss": -6.1617751121521, "global_step": 75607, "epoch": 1800} {"train_loss": -5.947381019592285, "global_step": 75608, "epoch": 1800} {"train_loss": -5.968293190002441, "global_step": 75609, "epoch": 1800} {"train_loss": -5.962344646453857, "global_step": 75610, "epoch": 1800} {"train_loss": -6.0131330490112305, "global_step": 75611, "epoch": 1800} {"train_loss": -6.123037815093994, "global_step": 75612, "epoch": 1800} {"train_loss": -6.0063252449035645, "global_step": 75613, "epoch": 1800} {"train_loss": -6.0938615798950195, "global_step": 75614, "epoch": 1800} {"train_loss": -6.213230609893799, "global_step": 75615, "epoch": 1800} {"train_loss": -6.1175737380981445, "global_step": 75616, "epoch": 1800} {"train_loss": -6.099833965301514, "global_step": 75617, "epoch": 1800} {"train_loss": -6.043057441711426, "global_step": 75618, "epoch": 1800} {"train_loss": -6.057951927185059, "global_step": 75619, "epoch": 1800} {"train_loss": -6.0387163162231445, "global_step": 75620, "epoch": 1800} {"train_loss": -6.0534586906433105, "global_step": 75621, "epoch": 1800} {"train_loss": -6.0996503829956055, "global_step": 75622, "epoch": 1800} {"train_loss": -6.035011291503906, "global_step": 75623, "epoch": 1800} {"train_loss": -6.063223361968994, "global_step": 75624, "epoch": 1800} {"train_loss": -6.058660984039307, "global_step": 75625, "epoch": 1800} {"train_loss": -5.9626264572143555, "global_step": 75626, "epoch": 1800} {"train_loss": -6.161470890045166, "global_step": 75627, "epoch": 1800} {"train_loss": -6.15333366394043, "global_step": 75628, "epoch": 1800} {"train_loss": -6.125582218170166, "global_step": 75629, "epoch": 1800} {"train_loss": -5.982189178466797, "global_step": 75630, "epoch": 1800} {"train_loss": -6.0445051193237305, "global_step": 75631, "epoch": 1800} {"train_loss": -6.079807281494141, "global_step": 75632, "epoch": 1800} {"train_loss": -6.065221309661865, "global_step": 75633, "epoch": 1800} {"train_loss": -6.125816822052002, "global_step": 75634, "epoch": 1800} {"train_loss": -6.082200527191162, "global_step": 75635, "epoch": 1800} {"train_loss": -6.023482322692871, "global_step": 75636, "epoch": 1800} {"train_loss": -5.951987266540527, "global_step": 75637, "epoch": 1800} {"train_loss": -6.005952835083008, "global_step": 75638, "epoch": 1800} {"train_loss": -6.1515302658081055, "global_step": 75639, "epoch": 1800} {"train_loss": -6.157138347625732, "global_step": 75640, "epoch": 1800} {"train_loss": -6.069114775884719, "global_step": 75641, "epoch": 1800, "train/sim_max_reward_0": 0.4593659396208935, "train/sim_max_reward_1": 0.3709111247902654, "train/sim_max_reward_2": 0.47498770840599025, "train/sim_max_reward_3": 0.14380523019027294, "train/sim_max_reward_4": 0.9039169157594789, "train/sim_max_reward_5": 0.5923380125291872, "test/sim_max_reward_4500000": 0.34831421585560635, "test/sim_max_reward_4500001": 0.7294476369252463, "test/sim_max_reward_4500002": 0.8135792754344102, "test/sim_max_reward_4500003": 0.7549149167859376, "test/sim_max_reward_4500004": 0.11327834851304927, "test/sim_max_reward_4500005": 0.8875909285094006, "test/sim_max_reward_4500006": 0.9979010160247086, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.2822517715445442, "test/sim_max_reward_4500009": 0.8180222509792444, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.8545937062609825, "test/sim_max_reward_4500012": 0.9416705452941392, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.9202490197773522, "test/sim_max_reward_4500015": 0.8518198657083266, "test/sim_max_reward_4500016": 0.6480740989775816, "test/sim_max_reward_4500017": 0.038854750893526954, "test/sim_max_reward_4500018": 0.033846908444458916, "test/sim_max_reward_4500019": 0.8889710186167161, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.5671352148641613, "test/sim_max_reward_4500022": 0.4313497669250719, "test/sim_max_reward_4500023": 0.5620651051963672, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.0429797523996541, "test/sim_max_reward_4500026": 0.9807766673103488, "test/sim_max_reward_4500027": 0.5427219634414308, "test/sim_max_reward_4500028": 0.18854199966061133, "test/sim_max_reward_4500029": 0.1684625160821273, "test/sim_max_reward_4500030": 0.8821785659458865, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.10571549018252703, "test/sim_max_reward_4500033": 0.8504802775574993, "test/sim_max_reward_4500034": 0.8456358555608973, "test/sim_max_reward_4500035": 0.9251122096002797, "test/sim_max_reward_4500036": 0.9536133131194694, "test/sim_max_reward_4500037": 0.48537135036701917, "test/sim_max_reward_4500038": 1.0, "test/sim_max_reward_4500039": 0.8350016767788959, "test/sim_max_reward_4500040": 0.8199462113718496, "test/sim_max_reward_4500041": 0.9068403312723524, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.18767635831491963, "test/sim_max_reward_4500044": 0.9288630885482623, "test/sim_max_reward_4500045": 0.4821389084573613, "test/sim_max_reward_4500046": 0.9405407444236291, "test/sim_max_reward_4500047": 0.8319740002987529, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.4908874885493481, "test/mean_score": 0.5482188258146938, "val_loss": 74982.28125} {"train_loss": -6.0106706619262695, "global_step": 75642, "epoch": 1801} {"train_loss": -6.004673004150391, "global_step": 75643, "epoch": 1801} {"train_loss": -6.25616455078125, "global_step": 75644, "epoch": 1801} {"train_loss": -6.085341453552246, "global_step": 75645, "epoch": 1801} {"train_loss": -6.0456438064575195, "global_step": 75646, "epoch": 1801} {"train_loss": -6.114285469055176, "global_step": 75647, "epoch": 1801} {"train_loss": -6.078320503234863, "global_step": 75648, "epoch": 1801} {"train_loss": -6.213860511779785, "global_step": 75649, "epoch": 1801} {"train_loss": -6.062854290008545, "global_step": 75650, "epoch": 1801} {"train_loss": -6.1342973709106445, "global_step": 75651, "epoch": 1801} {"train_loss": -6.114428520202637, "global_step": 75652, "epoch": 1801} {"train_loss": -5.986643314361572, "global_step": 75653, "epoch": 1801} {"train_loss": -6.019111633300781, "global_step": 75654, "epoch": 1801} {"train_loss": -5.9715166091918945, "global_step": 75655, "epoch": 1801} {"train_loss": -6.1058349609375, "global_step": 75656, "epoch": 1801} {"train_loss": -6.133803367614746, "global_step": 75657, "epoch": 1801} {"train_loss": -6.119051456451416, "global_step": 75658, "epoch": 1801} {"train_loss": -6.115608215332031, "global_step": 75659, "epoch": 1801} {"train_loss": -6.060905933380127, "global_step": 75660, "epoch": 1801} {"train_loss": -6.09930419921875, "global_step": 75661, "epoch": 1801} {"train_loss": -6.026538848876953, "global_step": 75662, "epoch": 1801} {"train_loss": -6.138907432556152, "global_step": 75663, "epoch": 1801} {"train_loss": -6.0985260009765625, "global_step": 75664, "epoch": 1801} {"train_loss": -6.036861419677734, "global_step": 75665, "epoch": 1801} {"train_loss": -6.187971115112305, "global_step": 75666, "epoch": 1801} {"train_loss": -6.129014015197754, "global_step": 75667, "epoch": 1801} {"train_loss": -5.926210403442383, "global_step": 75668, "epoch": 1801} {"train_loss": -6.080913066864014, "global_step": 75669, "epoch": 1801} {"train_loss": -6.137975692749023, "global_step": 75670, "epoch": 1801} {"train_loss": -6.093093395233154, "global_step": 75671, "epoch": 1801} {"train_loss": -6.090960502624512, "global_step": 75672, "epoch": 1801} {"train_loss": -6.133528232574463, "global_step": 75673, "epoch": 1801} {"train_loss": -6.099538803100586, "global_step": 75674, "epoch": 1801} {"train_loss": -6.193154811859131, "global_step": 75675, "epoch": 1801} {"train_loss": -6.1456122398376465, "global_step": 75676, "epoch": 1801} {"train_loss": -6.140613555908203, "global_step": 75677, "epoch": 1801} {"train_loss": -6.063385009765625, "global_step": 75678, "epoch": 1801} {"train_loss": -6.135105133056641, "global_step": 75679, "epoch": 1801} {"train_loss": -6.166851997375488, "global_step": 75680, "epoch": 1801} {"train_loss": -6.053324222564697, "global_step": 75681, "epoch": 1801} {"train_loss": -6.1060967445373535, "global_step": 75682, "epoch": 1801} {"train_loss": -6.0943862143017, "global_step": 75683, "epoch": 1801, "val_loss": 74806.9921875} {"train_loss": -6.164525985717773, "global_step": 75684, "epoch": 1802} {"train_loss": -6.203702926635742, "global_step": 75685, "epoch": 1802} {"train_loss": -6.200159072875977, "global_step": 75686, "epoch": 1802} {"train_loss": -6.073564529418945, "global_step": 75687, "epoch": 1802} {"train_loss": -6.020959854125977, "global_step": 75688, "epoch": 1802} {"train_loss": -6.091466903686523, "global_step": 75689, "epoch": 1802} {"train_loss": -6.140766143798828, "global_step": 75690, "epoch": 1802} {"train_loss": -6.046278953552246, "global_step": 75691, "epoch": 1802} {"train_loss": -6.0573883056640625, "global_step": 75692, "epoch": 1802} {"train_loss": -6.1104254722595215, "global_step": 75693, "epoch": 1802} {"train_loss": -6.032121181488037, "global_step": 75694, "epoch": 1802} {"train_loss": -6.080450057983398, "global_step": 75695, "epoch": 1802} {"train_loss": -5.998538970947266, "global_step": 75696, "epoch": 1802} {"train_loss": -5.976579189300537, "global_step": 75697, "epoch": 1802} {"train_loss": -6.056924819946289, "global_step": 75698, "epoch": 1802} {"train_loss": -6.042710304260254, "global_step": 75699, "epoch": 1802} {"train_loss": -6.100520133972168, "global_step": 75700, "epoch": 1802} {"train_loss": -5.8717041015625, "global_step": 75701, "epoch": 1802} {"train_loss": -6.039934158325195, "global_step": 75702, "epoch": 1802} {"train_loss": -6.076661109924316, "global_step": 75703, "epoch": 1802} {"train_loss": -5.997953414916992, "global_step": 75704, "epoch": 1802} {"train_loss": -6.088961601257324, "global_step": 75705, "epoch": 1802} {"train_loss": -6.059504508972168, "global_step": 75706, "epoch": 1802} {"train_loss": -5.992002487182617, "global_step": 75707, "epoch": 1802} {"train_loss": -6.052951812744141, "global_step": 75708, "epoch": 1802} {"train_loss": -6.082076072692871, "global_step": 75709, "epoch": 1802} {"train_loss": -5.971897125244141, "global_step": 75710, "epoch": 1802} {"train_loss": -5.968445777893066, "global_step": 75711, "epoch": 1802} {"train_loss": -5.996452331542969, "global_step": 75712, "epoch": 1802} {"train_loss": -6.115560531616211, "global_step": 75713, "epoch": 1802} {"train_loss": -6.051227569580078, "global_step": 75714, "epoch": 1802} {"train_loss": -6.090092658996582, "global_step": 75715, "epoch": 1802} {"train_loss": -6.054286003112793, "global_step": 75716, "epoch": 1802} {"train_loss": -6.2621917724609375, "global_step": 75717, "epoch": 1802} {"train_loss": -5.971060752868652, "global_step": 75718, "epoch": 1802} {"train_loss": -6.074254989624023, "global_step": 75719, "epoch": 1802} {"train_loss": -6.21712589263916, "global_step": 75720, "epoch": 1802} {"train_loss": -6.1289777755737305, "global_step": 75721, "epoch": 1802} {"train_loss": -6.01067590713501, "global_step": 75722, "epoch": 1802} {"train_loss": -6.155261039733887, "global_step": 75723, "epoch": 1802} {"train_loss": -5.984508514404297, "global_step": 75724, "epoch": 1802} {"train_loss": -6.068474826358614, "global_step": 75725, "epoch": 1802, "val_loss": 75073.28125} {"train_loss": -6.043641567230225, "global_step": 75726, "epoch": 1803} {"train_loss": -6.008184432983398, "global_step": 75727, "epoch": 1803} {"train_loss": -6.2351393699646, "global_step": 75728, "epoch": 1803} {"train_loss": -6.05081033706665, "global_step": 75729, "epoch": 1803} {"train_loss": -5.8733696937561035, "global_step": 75730, "epoch": 1803} {"train_loss": -6.171078681945801, "global_step": 75731, "epoch": 1803} {"train_loss": -5.95199728012085, "global_step": 75732, "epoch": 1803} {"train_loss": -5.986391067504883, "global_step": 75733, "epoch": 1803} {"train_loss": -6.047059535980225, "global_step": 75734, "epoch": 1803} {"train_loss": -6.025195598602295, "global_step": 75735, "epoch": 1803} {"train_loss": -6.067144393920898, "global_step": 75736, "epoch": 1803} {"train_loss": -6.0033135414123535, "global_step": 75737, "epoch": 1803} {"train_loss": -6.089596748352051, "global_step": 75738, "epoch": 1803} {"train_loss": -6.069952964782715, "global_step": 75739, "epoch": 1803} {"train_loss": -6.0623979568481445, "global_step": 75740, "epoch": 1803} {"train_loss": -6.091743469238281, "global_step": 75741, "epoch": 1803} {"train_loss": -6.091482162475586, "global_step": 75742, "epoch": 1803} {"train_loss": -6.082637786865234, "global_step": 75743, "epoch": 1803} {"train_loss": -6.010839462280273, "global_step": 75744, "epoch": 1803} {"train_loss": -6.120194435119629, "global_step": 75745, "epoch": 1803} {"train_loss": -6.210520267486572, "global_step": 75746, "epoch": 1803} {"train_loss": -6.137726783752441, "global_step": 75747, "epoch": 1803} {"train_loss": -5.976248741149902, "global_step": 75748, "epoch": 1803} {"train_loss": -6.000794887542725, "global_step": 75749, "epoch": 1803} {"train_loss": -6.180968284606934, "global_step": 75750, "epoch": 1803} {"train_loss": -6.0159196853637695, "global_step": 75751, "epoch": 1803} {"train_loss": -5.802751541137695, "global_step": 75752, "epoch": 1803} {"train_loss": -6.023370265960693, "global_step": 75753, "epoch": 1803} {"train_loss": -5.950917720794678, "global_step": 75754, "epoch": 1803} {"train_loss": -5.958928108215332, "global_step": 75755, "epoch": 1803} {"train_loss": -6.033769607543945, "global_step": 75756, "epoch": 1803} {"train_loss": -5.975688934326172, "global_step": 75757, "epoch": 1803} {"train_loss": -5.979959487915039, "global_step": 75758, "epoch": 1803} {"train_loss": -6.024133205413818, "global_step": 75759, "epoch": 1803} {"train_loss": -5.922726631164551, "global_step": 75760, "epoch": 1803} {"train_loss": -5.9795403480529785, "global_step": 75761, "epoch": 1803} {"train_loss": -6.095207691192627, "global_step": 75762, "epoch": 1803} {"train_loss": -5.982504367828369, "global_step": 75763, "epoch": 1803} {"train_loss": -5.811147212982178, "global_step": 75764, "epoch": 1803} {"train_loss": -6.045384407043457, "global_step": 75765, "epoch": 1803} {"train_loss": -5.934089660644531, "global_step": 75766, "epoch": 1803} {"train_loss": -6.0280929065886, "global_step": 75767, "epoch": 1803, "val_loss": 75010.0078125} {"train_loss": -6.103853225708008, "global_step": 75768, "epoch": 1804} {"train_loss": -5.948792457580566, "global_step": 75769, "epoch": 1804} {"train_loss": -6.0216875076293945, "global_step": 75770, "epoch": 1804} {"train_loss": -5.988035202026367, "global_step": 75771, "epoch": 1804} {"train_loss": -6.0198822021484375, "global_step": 75772, "epoch": 1804} {"train_loss": -6.005496978759766, "global_step": 75773, "epoch": 1804} {"train_loss": -6.0503644943237305, "global_step": 75774, "epoch": 1804} {"train_loss": -6.031874179840088, "global_step": 75775, "epoch": 1804} {"train_loss": -5.996985912322998, "global_step": 75776, "epoch": 1804} {"train_loss": -6.070706844329834, "global_step": 75777, "epoch": 1804} {"train_loss": -5.954620361328125, "global_step": 75778, "epoch": 1804} {"train_loss": -6.090732097625732, "global_step": 75779, "epoch": 1804} {"train_loss": -6.2001190185546875, "global_step": 75780, "epoch": 1804} {"train_loss": -6.125348091125488, "global_step": 75781, "epoch": 1804} {"train_loss": -6.0809807777404785, "global_step": 75782, "epoch": 1804} {"train_loss": -6.038509368896484, "global_step": 75783, "epoch": 1804} {"train_loss": -6.051125526428223, "global_step": 75784, "epoch": 1804} {"train_loss": -6.010754585266113, "global_step": 75785, "epoch": 1804} {"train_loss": -6.096820831298828, "global_step": 75786, "epoch": 1804} {"train_loss": -6.140063285827637, "global_step": 75787, "epoch": 1804} {"train_loss": -6.044491767883301, "global_step": 75788, "epoch": 1804} {"train_loss": -6.042372703552246, "global_step": 75789, "epoch": 1804} {"train_loss": -6.122867584228516, "global_step": 75790, "epoch": 1804} {"train_loss": -6.085356712341309, "global_step": 75791, "epoch": 1804} {"train_loss": -6.089341163635254, "global_step": 75792, "epoch": 1804} {"train_loss": -6.10697078704834, "global_step": 75793, "epoch": 1804} {"train_loss": -6.0845561027526855, "global_step": 75794, "epoch": 1804} {"train_loss": -6.089977264404297, "global_step": 75795, "epoch": 1804} {"train_loss": -6.163524627685547, "global_step": 75796, "epoch": 1804} {"train_loss": -6.167055130004883, "global_step": 75797, "epoch": 1804} {"train_loss": -6.191634178161621, "global_step": 75798, "epoch": 1804} {"train_loss": -6.127753257751465, "global_step": 75799, "epoch": 1804} {"train_loss": -5.992354393005371, "global_step": 75800, "epoch": 1804} {"train_loss": -6.177584648132324, "global_step": 75801, "epoch": 1804} {"train_loss": -6.076217174530029, "global_step": 75802, "epoch": 1804} {"train_loss": -6.086399078369141, "global_step": 75803, "epoch": 1804} {"train_loss": -6.129726886749268, "global_step": 75804, "epoch": 1804} {"train_loss": -6.110817909240723, "global_step": 75805, "epoch": 1804} {"train_loss": -6.1883039474487305, "global_step": 75806, "epoch": 1804} {"train_loss": -6.074449062347412, "global_step": 75807, "epoch": 1804} {"train_loss": -6.069222450256348, "global_step": 75808, "epoch": 1804} {"train_loss": -6.080704552786691, "global_step": 75809, "epoch": 1804, "val_loss": 74893.296875} {"train_loss": -6.072458267211914, "global_step": 75810, "epoch": 1805} {"train_loss": -6.061888694763184, "global_step": 75811, "epoch": 1805} {"train_loss": -6.058909893035889, "global_step": 75812, "epoch": 1805} {"train_loss": -6.101468086242676, "global_step": 75813, "epoch": 1805} {"train_loss": -6.071104526519775, "global_step": 75814, "epoch": 1805} {"train_loss": -6.3047099113464355, "global_step": 75815, "epoch": 1805} {"train_loss": -6.030816078186035, "global_step": 75816, "epoch": 1805} {"train_loss": -6.157290935516357, "global_step": 75817, "epoch": 1805} {"train_loss": -6.008683681488037, "global_step": 75818, "epoch": 1805} {"train_loss": -6.2443928718566895, "global_step": 75819, "epoch": 1805} {"train_loss": -5.980888366699219, "global_step": 75820, "epoch": 1805} {"train_loss": -6.042657852172852, "global_step": 75821, "epoch": 1805} {"train_loss": -6.0456767082214355, "global_step": 75822, "epoch": 1805} {"train_loss": -6.120002746582031, "global_step": 75823, "epoch": 1805} {"train_loss": -6.033329010009766, "global_step": 75824, "epoch": 1805} {"train_loss": -6.079336166381836, "global_step": 75825, "epoch": 1805} {"train_loss": -6.02345609664917, "global_step": 75826, "epoch": 1805} {"train_loss": -6.181194305419922, "global_step": 75827, "epoch": 1805} {"train_loss": -5.993748664855957, "global_step": 75828, "epoch": 1805} {"train_loss": -6.072541236877441, "global_step": 75829, "epoch": 1805} {"train_loss": -6.053940773010254, "global_step": 75830, "epoch": 1805} {"train_loss": -6.057892799377441, "global_step": 75831, "epoch": 1805} {"train_loss": -6.071933269500732, "global_step": 75832, "epoch": 1805} {"train_loss": -6.073858737945557, "global_step": 75833, "epoch": 1805} {"train_loss": -6.11387300491333, "global_step": 75834, "epoch": 1805} {"train_loss": -6.084756851196289, "global_step": 75835, "epoch": 1805} {"train_loss": -6.189640522003174, "global_step": 75836, "epoch": 1805} {"train_loss": -6.159193992614746, "global_step": 75837, "epoch": 1805} {"train_loss": -6.127283096313477, "global_step": 75838, "epoch": 1805} {"train_loss": -6.205595970153809, "global_step": 75839, "epoch": 1805} {"train_loss": -6.158598899841309, "global_step": 75840, "epoch": 1805} {"train_loss": -6.165600776672363, "global_step": 75841, "epoch": 1805} {"train_loss": -6.2163496017456055, "global_step": 75842, "epoch": 1805} {"train_loss": -6.108992099761963, "global_step": 75843, "epoch": 1805} {"train_loss": -6.214625358581543, "global_step": 75844, "epoch": 1805} {"train_loss": -6.137473106384277, "global_step": 75845, "epoch": 1805} {"train_loss": -6.056910514831543, "global_step": 75846, "epoch": 1805} {"train_loss": -6.149763584136963, "global_step": 75847, "epoch": 1805} {"train_loss": -6.1437177658081055, "global_step": 75848, "epoch": 1805} {"train_loss": -6.210904121398926, "global_step": 75849, "epoch": 1805} {"train_loss": -6.048050880432129, "global_step": 75850, "epoch": 1805} {"train_loss": -6.109733672369094, "global_step": 75851, "epoch": 1805, "val_loss": 75037.734375} {"train_loss": -6.07423210144043, "global_step": 75852, "epoch": 1806} {"train_loss": -6.072470664978027, "global_step": 75853, "epoch": 1806} {"train_loss": -6.133762359619141, "global_step": 75854, "epoch": 1806} {"train_loss": -5.992797374725342, "global_step": 75855, "epoch": 1806} {"train_loss": -6.096101760864258, "global_step": 75856, "epoch": 1806} {"train_loss": -5.962697982788086, "global_step": 75857, "epoch": 1806} {"train_loss": -6.04154109954834, "global_step": 75858, "epoch": 1806} {"train_loss": -6.074284553527832, "global_step": 75859, "epoch": 1806} {"train_loss": -6.180719375610352, "global_step": 75860, "epoch": 1806} {"train_loss": -6.048013687133789, "global_step": 75861, "epoch": 1806} {"train_loss": -6.1800642013549805, "global_step": 75862, "epoch": 1806} {"train_loss": -6.143955707550049, "global_step": 75863, "epoch": 1806} {"train_loss": -6.0576252937316895, "global_step": 75864, "epoch": 1806} {"train_loss": -5.911118984222412, "global_step": 75865, "epoch": 1806} {"train_loss": -6.045041561126709, "global_step": 75866, "epoch": 1806} {"train_loss": -6.123447418212891, "global_step": 75867, "epoch": 1806} {"train_loss": -6.129063129425049, "global_step": 75868, "epoch": 1806} {"train_loss": -6.144743919372559, "global_step": 75869, "epoch": 1806} {"train_loss": -6.068718433380127, "global_step": 75870, "epoch": 1806} {"train_loss": -6.143219470977783, "global_step": 75871, "epoch": 1806} {"train_loss": -6.1364030838012695, "global_step": 75872, "epoch": 1806} {"train_loss": -6.1433820724487305, "global_step": 75873, "epoch": 1806} {"train_loss": -6.1562275886535645, "global_step": 75874, "epoch": 1806} {"train_loss": -6.083845138549805, "global_step": 75875, "epoch": 1806} {"train_loss": -6.105339050292969, "global_step": 75876, "epoch": 1806} {"train_loss": -6.207630157470703, "global_step": 75877, "epoch": 1806} {"train_loss": -6.146305561065674, "global_step": 75878, "epoch": 1806} {"train_loss": -6.085705757141113, "global_step": 75879, "epoch": 1806} {"train_loss": -6.118221282958984, "global_step": 75880, "epoch": 1806} {"train_loss": -6.094101428985596, "global_step": 75881, "epoch": 1806} {"train_loss": -6.060164451599121, "global_step": 75882, "epoch": 1806} {"train_loss": -6.116069793701172, "global_step": 75883, "epoch": 1806} {"train_loss": -6.097182273864746, "global_step": 75884, "epoch": 1806} {"train_loss": -6.200630187988281, "global_step": 75885, "epoch": 1806} {"train_loss": -6.144646644592285, "global_step": 75886, "epoch": 1806} {"train_loss": -6.09538459777832, "global_step": 75887, "epoch": 1806} {"train_loss": -6.126621246337891, "global_step": 75888, "epoch": 1806} {"train_loss": -6.104517936706543, "global_step": 75889, "epoch": 1806} {"train_loss": -6.103860378265381, "global_step": 75890, "epoch": 1806} {"train_loss": -6.060085296630859, "global_step": 75891, "epoch": 1806} {"train_loss": -6.275036811828613, "global_step": 75892, "epoch": 1806} {"train_loss": -6.102530661083403, "global_step": 75893, "epoch": 1806, "val_loss": 75037.78125} {"train_loss": -6.216271877288818, "global_step": 75894, "epoch": 1807} {"train_loss": -6.127804279327393, "global_step": 75895, "epoch": 1807} {"train_loss": -6.048992156982422, "global_step": 75896, "epoch": 1807} {"train_loss": -6.071846961975098, "global_step": 75897, "epoch": 1807} {"train_loss": -6.133143424987793, "global_step": 75898, "epoch": 1807} {"train_loss": -6.016327381134033, "global_step": 75899, "epoch": 1807} {"train_loss": -6.163699626922607, "global_step": 75900, "epoch": 1807} {"train_loss": -6.156826019287109, "global_step": 75901, "epoch": 1807} {"train_loss": -6.022810935974121, "global_step": 75902, "epoch": 1807} {"train_loss": -6.067399978637695, "global_step": 75903, "epoch": 1807} {"train_loss": -6.0459723472595215, "global_step": 75904, "epoch": 1807} {"train_loss": -6.100508689880371, "global_step": 75905, "epoch": 1807} {"train_loss": -6.103278636932373, "global_step": 75906, "epoch": 1807} {"train_loss": -6.024580955505371, "global_step": 75907, "epoch": 1807} {"train_loss": -6.138193130493164, "global_step": 75908, "epoch": 1807} {"train_loss": -5.958192825317383, "global_step": 75909, "epoch": 1807} {"train_loss": -5.9822998046875, "global_step": 75910, "epoch": 1807} {"train_loss": -6.101553916931152, "global_step": 75911, "epoch": 1807} {"train_loss": -6.09067440032959, "global_step": 75912, "epoch": 1807} {"train_loss": -6.0741777420043945, "global_step": 75913, "epoch": 1807} {"train_loss": -6.163070201873779, "global_step": 75914, "epoch": 1807} {"train_loss": -5.890480041503906, "global_step": 75915, "epoch": 1807} {"train_loss": -6.078187942504883, "global_step": 75916, "epoch": 1807} {"train_loss": -6.009853363037109, "global_step": 75917, "epoch": 1807} {"train_loss": -5.993337154388428, "global_step": 75918, "epoch": 1807} {"train_loss": -6.0913310050964355, "global_step": 75919, "epoch": 1807} {"train_loss": -5.975142478942871, "global_step": 75920, "epoch": 1807} {"train_loss": -6.134818077087402, "global_step": 75921, "epoch": 1807} {"train_loss": -6.05351448059082, "global_step": 75922, "epoch": 1807} {"train_loss": -5.937506675720215, "global_step": 75923, "epoch": 1807} {"train_loss": -6.127948760986328, "global_step": 75924, "epoch": 1807} {"train_loss": -6.1078081130981445, "global_step": 75925, "epoch": 1807} {"train_loss": -6.070130825042725, "global_step": 75926, "epoch": 1807} {"train_loss": -6.057420253753662, "global_step": 75927, "epoch": 1807} {"train_loss": -6.093893051147461, "global_step": 75928, "epoch": 1807} {"train_loss": -6.083682537078857, "global_step": 75929, "epoch": 1807} {"train_loss": -6.16986083984375, "global_step": 75930, "epoch": 1807} {"train_loss": -6.182640075683594, "global_step": 75931, "epoch": 1807} {"train_loss": -6.1484904289245605, "global_step": 75932, "epoch": 1807} {"train_loss": -6.182126998901367, "global_step": 75933, "epoch": 1807} {"train_loss": -6.001752853393555, "global_step": 75934, "epoch": 1807} {"train_loss": -6.077450218654814, "global_step": 75935, "epoch": 1807, "val_loss": 74990.7265625} {"train_loss": -6.22231388092041, "global_step": 75936, "epoch": 1808} {"train_loss": -5.9427690505981445, "global_step": 75937, "epoch": 1808} {"train_loss": -5.968944072723389, "global_step": 75938, "epoch": 1808} {"train_loss": -5.995692729949951, "global_step": 75939, "epoch": 1808} {"train_loss": -6.126272201538086, "global_step": 75940, "epoch": 1808} {"train_loss": -6.139129638671875, "global_step": 75941, "epoch": 1808} {"train_loss": -6.106492042541504, "global_step": 75942, "epoch": 1808} {"train_loss": -5.993041038513184, "global_step": 75943, "epoch": 1808} {"train_loss": -6.0753607749938965, "global_step": 75944, "epoch": 1808} {"train_loss": -6.079826354980469, "global_step": 75945, "epoch": 1808} {"train_loss": -6.154754638671875, "global_step": 75946, "epoch": 1808} {"train_loss": -6.052927017211914, "global_step": 75947, "epoch": 1808} {"train_loss": -6.232797622680664, "global_step": 75948, "epoch": 1808} {"train_loss": -6.094494342803955, "global_step": 75949, "epoch": 1808} {"train_loss": -6.086785316467285, "global_step": 75950, "epoch": 1808} {"train_loss": -6.12917423248291, "global_step": 75951, "epoch": 1808} {"train_loss": -6.0542402267456055, "global_step": 75952, "epoch": 1808} {"train_loss": -6.1509904861450195, "global_step": 75953, "epoch": 1808} {"train_loss": -6.056624412536621, "global_step": 75954, "epoch": 1808} {"train_loss": -6.206151008605957, "global_step": 75955, "epoch": 1808} {"train_loss": -6.074877738952637, "global_step": 75956, "epoch": 1808} {"train_loss": -6.045594215393066, "global_step": 75957, "epoch": 1808} {"train_loss": -6.194457054138184, "global_step": 75958, "epoch": 1808} {"train_loss": -6.046943664550781, "global_step": 75959, "epoch": 1808} {"train_loss": -6.122167587280273, "global_step": 75960, "epoch": 1808} {"train_loss": -6.142417907714844, "global_step": 75961, "epoch": 1808} {"train_loss": -6.106108665466309, "global_step": 75962, "epoch": 1808} {"train_loss": -5.985166549682617, "global_step": 75963, "epoch": 1808} {"train_loss": -6.009523868560791, "global_step": 75964, "epoch": 1808} {"train_loss": -5.976137161254883, "global_step": 75965, "epoch": 1808} {"train_loss": -6.139867782592773, "global_step": 75966, "epoch": 1808} {"train_loss": -6.156144618988037, "global_step": 75967, "epoch": 1808} {"train_loss": -5.9630279541015625, "global_step": 75968, "epoch": 1808} {"train_loss": -5.98222541809082, "global_step": 75969, "epoch": 1808} {"train_loss": -6.159636497497559, "global_step": 75970, "epoch": 1808} {"train_loss": -5.904350757598877, "global_step": 75971, "epoch": 1808} {"train_loss": -6.0733866691589355, "global_step": 75972, "epoch": 1808} {"train_loss": -6.097142219543457, "global_step": 75973, "epoch": 1808} {"train_loss": -6.105079174041748, "global_step": 75974, "epoch": 1808} {"train_loss": -6.147190093994141, "global_step": 75975, "epoch": 1808} {"train_loss": -6.037965297698975, "global_step": 75976, "epoch": 1808} {"train_loss": -6.08128065154666, "global_step": 75977, "epoch": 1808, "val_loss": 75213.6875} {"train_loss": -6.050693511962891, "global_step": 75978, "epoch": 1809} {"train_loss": -6.192575931549072, "global_step": 75979, "epoch": 1809} {"train_loss": -6.141576766967773, "global_step": 75980, "epoch": 1809} {"train_loss": -6.082130432128906, "global_step": 75981, "epoch": 1809} {"train_loss": -5.865208625793457, "global_step": 75982, "epoch": 1809} {"train_loss": -6.129265785217285, "global_step": 75983, "epoch": 1809} {"train_loss": -6.011838436126709, "global_step": 75984, "epoch": 1809} {"train_loss": -6.106612205505371, "global_step": 75985, "epoch": 1809} {"train_loss": -6.093799591064453, "global_step": 75986, "epoch": 1809} {"train_loss": -6.143401145935059, "global_step": 75987, "epoch": 1809} {"train_loss": -6.002007961273193, "global_step": 75988, "epoch": 1809} {"train_loss": -6.110992431640625, "global_step": 75989, "epoch": 1809} {"train_loss": -6.08823823928833, "global_step": 75990, "epoch": 1809} {"train_loss": -6.232933044433594, "global_step": 75991, "epoch": 1809} {"train_loss": -6.155950546264648, "global_step": 75992, "epoch": 1809} {"train_loss": -6.204009532928467, "global_step": 75993, "epoch": 1809} {"train_loss": -6.1515398025512695, "global_step": 75994, "epoch": 1809} {"train_loss": -6.062102317810059, "global_step": 75995, "epoch": 1809} {"train_loss": -6.017299652099609, "global_step": 75996, "epoch": 1809} {"train_loss": -6.012301445007324, "global_step": 75997, "epoch": 1809} {"train_loss": -6.138309955596924, "global_step": 75998, "epoch": 1809} {"train_loss": -6.0039777755737305, "global_step": 75999, "epoch": 1809} {"train_loss": -6.063762187957764, "global_step": 76000, "epoch": 1809} {"train_loss": -6.078124046325684, "global_step": 76001, "epoch": 1809} {"train_loss": -5.932435035705566, "global_step": 76002, "epoch": 1809} {"train_loss": -6.114380836486816, "global_step": 76003, "epoch": 1809} {"train_loss": -5.937464237213135, "global_step": 76004, "epoch": 1809} {"train_loss": -5.906003952026367, "global_step": 76005, "epoch": 1809} {"train_loss": -6.062080383300781, "global_step": 76006, "epoch": 1809} {"train_loss": -6.141143321990967, "global_step": 76007, "epoch": 1809} {"train_loss": -5.964685916900635, "global_step": 76008, "epoch": 1809} {"train_loss": -6.166050910949707, "global_step": 76009, "epoch": 1809} {"train_loss": -5.976773262023926, "global_step": 76010, "epoch": 1809} {"train_loss": -6.1438446044921875, "global_step": 76011, "epoch": 1809} {"train_loss": -6.008747100830078, "global_step": 76012, "epoch": 1809} {"train_loss": -6.03511381149292, "global_step": 76013, "epoch": 1809} {"train_loss": -6.092235088348389, "global_step": 76014, "epoch": 1809} {"train_loss": -6.093898773193359, "global_step": 76015, "epoch": 1809} {"train_loss": -5.992861747741699, "global_step": 76016, "epoch": 1809} {"train_loss": -5.979533672332764, "global_step": 76017, "epoch": 1809} {"train_loss": -6.018221855163574, "global_step": 76018, "epoch": 1809} {"train_loss": -6.066800060726347, "global_step": 76019, "epoch": 1809, "val_loss": 74856.875} {"train_loss": -6.011233329772949, "global_step": 76020, "epoch": 1810} {"train_loss": -5.986172676086426, "global_step": 76021, "epoch": 1810} {"train_loss": -6.074209213256836, "global_step": 76022, "epoch": 1810} {"train_loss": -6.060234069824219, "global_step": 76023, "epoch": 1810} {"train_loss": -5.953271865844727, "global_step": 76024, "epoch": 1810} {"train_loss": -5.982316970825195, "global_step": 76025, "epoch": 1810} {"train_loss": -6.098663330078125, "global_step": 76026, "epoch": 1810} {"train_loss": -6.184529781341553, "global_step": 76027, "epoch": 1810} {"train_loss": -6.171791076660156, "global_step": 76028, "epoch": 1810} {"train_loss": -6.131966590881348, "global_step": 76029, "epoch": 1810} {"train_loss": -6.043034553527832, "global_step": 76030, "epoch": 1810} {"train_loss": -5.957825660705566, "global_step": 76031, "epoch": 1810} {"train_loss": -6.064168453216553, "global_step": 76032, "epoch": 1810} {"train_loss": -5.953861236572266, "global_step": 76033, "epoch": 1810} {"train_loss": -6.125782012939453, "global_step": 76034, "epoch": 1810} {"train_loss": -5.955751419067383, "global_step": 76035, "epoch": 1810} {"train_loss": -6.035438060760498, "global_step": 76036, "epoch": 1810} {"train_loss": -6.18803596496582, "global_step": 76037, "epoch": 1810} {"train_loss": -6.064364433288574, "global_step": 76038, "epoch": 1810} {"train_loss": -6.181479454040527, "global_step": 76039, "epoch": 1810} {"train_loss": -6.075603485107422, "global_step": 76040, "epoch": 1810} {"train_loss": -6.045832633972168, "global_step": 76041, "epoch": 1810} {"train_loss": -6.1575822830200195, "global_step": 76042, "epoch": 1810} {"train_loss": -6.210848331451416, "global_step": 76043, "epoch": 1810} {"train_loss": -6.0971903800964355, "global_step": 76044, "epoch": 1810} {"train_loss": -6.070345878601074, "global_step": 76045, "epoch": 1810} {"train_loss": -6.116670608520508, "global_step": 76046, "epoch": 1810} {"train_loss": -6.114259719848633, "global_step": 76047, "epoch": 1810} {"train_loss": -6.117212772369385, "global_step": 76048, "epoch": 1810} {"train_loss": -6.168516159057617, "global_step": 76049, "epoch": 1810} {"train_loss": -6.092859268188477, "global_step": 76050, "epoch": 1810} {"train_loss": -6.117794990539551, "global_step": 76051, "epoch": 1810} {"train_loss": -6.157517910003662, "global_step": 76052, "epoch": 1810} {"train_loss": -6.187875747680664, "global_step": 76053, "epoch": 1810} {"train_loss": -6.094768524169922, "global_step": 76054, "epoch": 1810} {"train_loss": -6.063286304473877, "global_step": 76055, "epoch": 1810} {"train_loss": -6.236087799072266, "global_step": 76056, "epoch": 1810} {"train_loss": -6.057334899902344, "global_step": 76057, "epoch": 1810} {"train_loss": -6.056957244873047, "global_step": 76058, "epoch": 1810} {"train_loss": -6.147756576538086, "global_step": 76059, "epoch": 1810} {"train_loss": -6.023077011108398, "global_step": 76060, "epoch": 1810} {"train_loss": -6.0868702956608365, "global_step": 76061, "epoch": 1810, "val_loss": 74644.484375} {"train_loss": -6.050933361053467, "global_step": 76062, "epoch": 1811} {"train_loss": -6.1709794998168945, "global_step": 76063, "epoch": 1811} {"train_loss": -6.167840003967285, "global_step": 76064, "epoch": 1811} {"train_loss": -5.972749710083008, "global_step": 76065, "epoch": 1811} {"train_loss": -6.17176628112793, "global_step": 76066, "epoch": 1811} {"train_loss": -6.018117904663086, "global_step": 76067, "epoch": 1811} {"train_loss": -6.268770217895508, "global_step": 76068, "epoch": 1811} {"train_loss": -6.1536054611206055, "global_step": 76069, "epoch": 1811} {"train_loss": -6.140613555908203, "global_step": 76070, "epoch": 1811} {"train_loss": -6.020400047302246, "global_step": 76071, "epoch": 1811} {"train_loss": -6.195239543914795, "global_step": 76072, "epoch": 1811} {"train_loss": -6.058844089508057, "global_step": 76073, "epoch": 1811} {"train_loss": -6.270763397216797, "global_step": 76074, "epoch": 1811} {"train_loss": -6.1230149269104, "global_step": 76075, "epoch": 1811} {"train_loss": -6.0927886962890625, "global_step": 76076, "epoch": 1811} {"train_loss": -6.202570915222168, "global_step": 76077, "epoch": 1811} {"train_loss": -6.058687210083008, "global_step": 76078, "epoch": 1811} {"train_loss": -6.156003475189209, "global_step": 76079, "epoch": 1811} {"train_loss": -6.033833026885986, "global_step": 76080, "epoch": 1811} {"train_loss": -6.089447021484375, "global_step": 76081, "epoch": 1811} {"train_loss": -6.121236801147461, "global_step": 76082, "epoch": 1811} {"train_loss": -6.097832202911377, "global_step": 76083, "epoch": 1811} {"train_loss": -6.2028303146362305, "global_step": 76084, "epoch": 1811} {"train_loss": -6.1308698654174805, "global_step": 76085, "epoch": 1811} {"train_loss": -6.254727363586426, "global_step": 76086, "epoch": 1811} {"train_loss": -6.021100997924805, "global_step": 76087, "epoch": 1811} {"train_loss": -6.17997407913208, "global_step": 76088, "epoch": 1811} {"train_loss": -6.1305694580078125, "global_step": 76089, "epoch": 1811} {"train_loss": -6.063956260681152, "global_step": 76090, "epoch": 1811} {"train_loss": -6.105558395385742, "global_step": 76091, "epoch": 1811} {"train_loss": -5.999267578125, "global_step": 76092, "epoch": 1811} {"train_loss": -6.145689487457275, "global_step": 76093, "epoch": 1811} {"train_loss": -6.078083038330078, "global_step": 76094, "epoch": 1811} {"train_loss": -6.093244552612305, "global_step": 76095, "epoch": 1811} {"train_loss": -6.119274139404297, "global_step": 76096, "epoch": 1811} {"train_loss": -6.094935894012451, "global_step": 76097, "epoch": 1811} {"train_loss": -6.22645378112793, "global_step": 76098, "epoch": 1811} {"train_loss": -6.164752960205078, "global_step": 76099, "epoch": 1811} {"train_loss": -6.159079551696777, "global_step": 76100, "epoch": 1811} {"train_loss": -6.050850868225098, "global_step": 76101, "epoch": 1811} {"train_loss": -6.10683536529541, "global_step": 76102, "epoch": 1811} {"train_loss": -6.121953657695225, "global_step": 76103, "epoch": 1811, "val_loss": 74826.609375} {"train_loss": -5.970987796783447, "global_step": 76104, "epoch": 1812} {"train_loss": -6.049428939819336, "global_step": 76105, "epoch": 1812} {"train_loss": -6.124892234802246, "global_step": 76106, "epoch": 1812} {"train_loss": -6.056890964508057, "global_step": 76107, "epoch": 1812} {"train_loss": -5.952958583831787, "global_step": 76108, "epoch": 1812} {"train_loss": -6.041707992553711, "global_step": 76109, "epoch": 1812} {"train_loss": -6.096905708312988, "global_step": 76110, "epoch": 1812} {"train_loss": -5.972663879394531, "global_step": 76111, "epoch": 1812} {"train_loss": -6.035707473754883, "global_step": 76112, "epoch": 1812} {"train_loss": -6.017152309417725, "global_step": 76113, "epoch": 1812} {"train_loss": -6.049141883850098, "global_step": 76114, "epoch": 1812} {"train_loss": -6.002035617828369, "global_step": 76115, "epoch": 1812} {"train_loss": -6.148399829864502, "global_step": 76116, "epoch": 1812} {"train_loss": -6.068253517150879, "global_step": 76117, "epoch": 1812} {"train_loss": -6.031015396118164, "global_step": 76118, "epoch": 1812} {"train_loss": -6.103795051574707, "global_step": 76119, "epoch": 1812} {"train_loss": -6.057620048522949, "global_step": 76120, "epoch": 1812} {"train_loss": -6.198507785797119, "global_step": 76121, "epoch": 1812} {"train_loss": -6.014434814453125, "global_step": 76122, "epoch": 1812} {"train_loss": -6.053745269775391, "global_step": 76123, "epoch": 1812} {"train_loss": -6.145286560058594, "global_step": 76124, "epoch": 1812} {"train_loss": -6.091103553771973, "global_step": 76125, "epoch": 1812} {"train_loss": -6.082953453063965, "global_step": 76126, "epoch": 1812} {"train_loss": -6.134270668029785, "global_step": 76127, "epoch": 1812} {"train_loss": -6.1624627113342285, "global_step": 76128, "epoch": 1812} {"train_loss": -6.116304874420166, "global_step": 76129, "epoch": 1812} {"train_loss": -6.113193988800049, "global_step": 76130, "epoch": 1812} {"train_loss": -6.030076026916504, "global_step": 76131, "epoch": 1812} {"train_loss": -6.138799667358398, "global_step": 76132, "epoch": 1812} {"train_loss": -6.04787015914917, "global_step": 76133, "epoch": 1812} {"train_loss": -6.039766311645508, "global_step": 76134, "epoch": 1812} {"train_loss": -6.121325492858887, "global_step": 76135, "epoch": 1812} {"train_loss": -6.072636127471924, "global_step": 76136, "epoch": 1812} {"train_loss": -6.127127647399902, "global_step": 76137, "epoch": 1812} {"train_loss": -6.096358776092529, "global_step": 76138, "epoch": 1812} {"train_loss": -6.088138103485107, "global_step": 76139, "epoch": 1812} {"train_loss": -6.138551712036133, "global_step": 76140, "epoch": 1812} {"train_loss": -6.073732376098633, "global_step": 76141, "epoch": 1812} {"train_loss": -6.083122253417969, "global_step": 76142, "epoch": 1812} {"train_loss": -5.89987850189209, "global_step": 76143, "epoch": 1812} {"train_loss": -6.115322589874268, "global_step": 76144, "epoch": 1812} {"train_loss": -6.073845057260423, "global_step": 76145, "epoch": 1812, "val_loss": 74854.28125} {"train_loss": -6.123689651489258, "global_step": 76146, "epoch": 1813} {"train_loss": -6.09232234954834, "global_step": 76147, "epoch": 1813} {"train_loss": -6.026411056518555, "global_step": 76148, "epoch": 1813} {"train_loss": -6.087625503540039, "global_step": 76149, "epoch": 1813} {"train_loss": -6.226376533508301, "global_step": 76150, "epoch": 1813} {"train_loss": -6.265315532684326, "global_step": 76151, "epoch": 1813} {"train_loss": -6.015842437744141, "global_step": 76152, "epoch": 1813} {"train_loss": -6.074501991271973, "global_step": 76153, "epoch": 1813} {"train_loss": -6.024005889892578, "global_step": 76154, "epoch": 1813} {"train_loss": -6.0982136726379395, "global_step": 76155, "epoch": 1813} {"train_loss": -6.150723934173584, "global_step": 76156, "epoch": 1813} {"train_loss": -5.865572929382324, "global_step": 76157, "epoch": 1813} {"train_loss": -6.1334028244018555, "global_step": 76158, "epoch": 1813} {"train_loss": -6.144344329833984, "global_step": 76159, "epoch": 1813} {"train_loss": -6.094744682312012, "global_step": 76160, "epoch": 1813} {"train_loss": -6.122733116149902, "global_step": 76161, "epoch": 1813} {"train_loss": -6.119503974914551, "global_step": 76162, "epoch": 1813} {"train_loss": -6.012419700622559, "global_step": 76163, "epoch": 1813} {"train_loss": -6.1033220291137695, "global_step": 76164, "epoch": 1813} {"train_loss": -6.0214080810546875, "global_step": 76165, "epoch": 1813} {"train_loss": -6.075168609619141, "global_step": 76166, "epoch": 1813} {"train_loss": -6.0625410079956055, "global_step": 76167, "epoch": 1813} {"train_loss": -6.029813766479492, "global_step": 76168, "epoch": 1813} {"train_loss": -6.13315486907959, "global_step": 76169, "epoch": 1813} {"train_loss": -6.059554100036621, "global_step": 76170, "epoch": 1813} {"train_loss": -6.150160789489746, "global_step": 76171, "epoch": 1813} {"train_loss": -5.982542037963867, "global_step": 76172, "epoch": 1813} {"train_loss": -6.065152645111084, "global_step": 76173, "epoch": 1813} {"train_loss": -6.132654666900635, "global_step": 76174, "epoch": 1813} {"train_loss": -6.069422245025635, "global_step": 76175, "epoch": 1813} {"train_loss": -6.141849517822266, "global_step": 76176, "epoch": 1813} {"train_loss": -6.004274368286133, "global_step": 76177, "epoch": 1813} {"train_loss": -6.0821943283081055, "global_step": 76178, "epoch": 1813} {"train_loss": -6.115891933441162, "global_step": 76179, "epoch": 1813} {"train_loss": -6.134160041809082, "global_step": 76180, "epoch": 1813} {"train_loss": -6.0555500984191895, "global_step": 76181, "epoch": 1813} {"train_loss": -6.1532721519470215, "global_step": 76182, "epoch": 1813} {"train_loss": -6.057093620300293, "global_step": 76183, "epoch": 1813} {"train_loss": -6.006982803344727, "global_step": 76184, "epoch": 1813} {"train_loss": -5.997341632843018, "global_step": 76185, "epoch": 1813} {"train_loss": -6.004584312438965, "global_step": 76186, "epoch": 1813} {"train_loss": -6.081737609136672, "global_step": 76187, "epoch": 1813, "val_loss": 74647.4375} {"train_loss": -6.092430114746094, "global_step": 76188, "epoch": 1814} {"train_loss": -5.941938877105713, "global_step": 76189, "epoch": 1814} {"train_loss": -6.074278354644775, "global_step": 76190, "epoch": 1814} {"train_loss": -6.061405658721924, "global_step": 76191, "epoch": 1814} {"train_loss": -6.0410661697387695, "global_step": 76192, "epoch": 1814} {"train_loss": -6.071575164794922, "global_step": 76193, "epoch": 1814} {"train_loss": -5.97384786605835, "global_step": 76194, "epoch": 1814} {"train_loss": -5.991365432739258, "global_step": 76195, "epoch": 1814} {"train_loss": -6.074702262878418, "global_step": 76196, "epoch": 1814} {"train_loss": -5.893748760223389, "global_step": 76197, "epoch": 1814} {"train_loss": -6.094366073608398, "global_step": 76198, "epoch": 1814} {"train_loss": -5.990664482116699, "global_step": 76199, "epoch": 1814} {"train_loss": -6.010383129119873, "global_step": 76200, "epoch": 1814} {"train_loss": -6.138360023498535, "global_step": 76201, "epoch": 1814} {"train_loss": -6.059874057769775, "global_step": 76202, "epoch": 1814} {"train_loss": -5.938453674316406, "global_step": 76203, "epoch": 1814} {"train_loss": -6.06119966506958, "global_step": 76204, "epoch": 1814} {"train_loss": -6.028831481933594, "global_step": 76205, "epoch": 1814} {"train_loss": -6.133340835571289, "global_step": 76206, "epoch": 1814} {"train_loss": -5.918482303619385, "global_step": 76207, "epoch": 1814} {"train_loss": -6.086604118347168, "global_step": 76208, "epoch": 1814} {"train_loss": -6.043827056884766, "global_step": 76209, "epoch": 1814} {"train_loss": -6.0412092208862305, "global_step": 76210, "epoch": 1814} {"train_loss": -6.050441741943359, "global_step": 76211, "epoch": 1814} {"train_loss": -6.033215522766113, "global_step": 76212, "epoch": 1814} {"train_loss": -6.12862491607666, "global_step": 76213, "epoch": 1814} {"train_loss": -6.017585754394531, "global_step": 76214, "epoch": 1814} {"train_loss": -6.007637023925781, "global_step": 76215, "epoch": 1814} {"train_loss": -6.062044143676758, "global_step": 76216, "epoch": 1814} {"train_loss": -6.05043888092041, "global_step": 76217, "epoch": 1814} {"train_loss": -6.191363334655762, "global_step": 76218, "epoch": 1814} {"train_loss": -5.969588279724121, "global_step": 76219, "epoch": 1814} {"train_loss": -6.007946014404297, "global_step": 76220, "epoch": 1814} {"train_loss": -5.929096221923828, "global_step": 76221, "epoch": 1814} {"train_loss": -6.169682025909424, "global_step": 76222, "epoch": 1814} {"train_loss": -6.110076427459717, "global_step": 76223, "epoch": 1814} {"train_loss": -6.078232765197754, "global_step": 76224, "epoch": 1814} {"train_loss": -6.1032915115356445, "global_step": 76225, "epoch": 1814} {"train_loss": -6.024568557739258, "global_step": 76226, "epoch": 1814} {"train_loss": -5.89202356338501, "global_step": 76227, "epoch": 1814} {"train_loss": -6.086547374725342, "global_step": 76228, "epoch": 1814} {"train_loss": -6.036155995868501, "global_step": 76229, "epoch": 1814, "val_loss": 75075.109375} {"train_loss": -6.0841064453125, "global_step": 76230, "epoch": 1815} {"train_loss": -5.979586601257324, "global_step": 76231, "epoch": 1815} {"train_loss": -6.060368061065674, "global_step": 76232, "epoch": 1815} {"train_loss": -6.088659763336182, "global_step": 76233, "epoch": 1815} {"train_loss": -5.963479042053223, "global_step": 76234, "epoch": 1815} {"train_loss": -6.09261417388916, "global_step": 76235, "epoch": 1815} {"train_loss": -6.048583030700684, "global_step": 76236, "epoch": 1815} {"train_loss": -6.080038070678711, "global_step": 76237, "epoch": 1815} {"train_loss": -5.927694797515869, "global_step": 76238, "epoch": 1815} {"train_loss": -6.102195739746094, "global_step": 76239, "epoch": 1815} {"train_loss": -6.064488410949707, "global_step": 76240, "epoch": 1815} {"train_loss": -6.143338203430176, "global_step": 76241, "epoch": 1815} {"train_loss": -6.042567729949951, "global_step": 76242, "epoch": 1815} {"train_loss": -6.076862812042236, "global_step": 76243, "epoch": 1815} {"train_loss": -6.1180877685546875, "global_step": 76244, "epoch": 1815} {"train_loss": -6.03802490234375, "global_step": 76245, "epoch": 1815} {"train_loss": -6.25199556350708, "global_step": 76246, "epoch": 1815} {"train_loss": -5.975081443786621, "global_step": 76247, "epoch": 1815} {"train_loss": -6.022939682006836, "global_step": 76248, "epoch": 1815} {"train_loss": -6.113280296325684, "global_step": 76249, "epoch": 1815} {"train_loss": -6.2184271812438965, "global_step": 76250, "epoch": 1815} {"train_loss": -6.067270278930664, "global_step": 76251, "epoch": 1815} {"train_loss": -6.136662483215332, "global_step": 76252, "epoch": 1815} {"train_loss": -5.990787506103516, "global_step": 76253, "epoch": 1815} {"train_loss": -6.099780082702637, "global_step": 76254, "epoch": 1815} {"train_loss": -6.07758092880249, "global_step": 76255, "epoch": 1815} {"train_loss": -6.093654632568359, "global_step": 76256, "epoch": 1815} {"train_loss": -6.074951171875, "global_step": 76257, "epoch": 1815} {"train_loss": -6.1385016441345215, "global_step": 76258, "epoch": 1815} {"train_loss": -6.077548980712891, "global_step": 76259, "epoch": 1815} {"train_loss": -6.185145378112793, "global_step": 76260, "epoch": 1815} {"train_loss": -6.170413017272949, "global_step": 76261, "epoch": 1815} {"train_loss": -6.091059684753418, "global_step": 76262, "epoch": 1815} {"train_loss": -6.0849080085754395, "global_step": 76263, "epoch": 1815} {"train_loss": -6.131007194519043, "global_step": 76264, "epoch": 1815} {"train_loss": -6.167300224304199, "global_step": 76265, "epoch": 1815} {"train_loss": -6.08045768737793, "global_step": 76266, "epoch": 1815} {"train_loss": -6.036835670471191, "global_step": 76267, "epoch": 1815} {"train_loss": -6.0884809494018555, "global_step": 76268, "epoch": 1815} {"train_loss": -6.1341776847839355, "global_step": 76269, "epoch": 1815} {"train_loss": -6.1840667724609375, "global_step": 76270, "epoch": 1815} {"train_loss": -6.08779780069987, "global_step": 76271, "epoch": 1815, "val_loss": 74889.96875} {"train_loss": -6.096960067749023, "global_step": 76272, "epoch": 1816} {"train_loss": -6.174262046813965, "global_step": 76273, "epoch": 1816} {"train_loss": -6.157196998596191, "global_step": 76274, "epoch": 1816} {"train_loss": -6.168745994567871, "global_step": 76275, "epoch": 1816} {"train_loss": -6.113880157470703, "global_step": 76276, "epoch": 1816} {"train_loss": -6.049193382263184, "global_step": 76277, "epoch": 1816} {"train_loss": -6.120703220367432, "global_step": 76278, "epoch": 1816} {"train_loss": -6.095907211303711, "global_step": 76279, "epoch": 1816} {"train_loss": -6.089437484741211, "global_step": 76280, "epoch": 1816} {"train_loss": -6.184101104736328, "global_step": 76281, "epoch": 1816} {"train_loss": -6.162829399108887, "global_step": 76282, "epoch": 1816} {"train_loss": -6.141480922698975, "global_step": 76283, "epoch": 1816} {"train_loss": -6.115233421325684, "global_step": 76284, "epoch": 1816} {"train_loss": -6.1053571701049805, "global_step": 76285, "epoch": 1816} {"train_loss": -5.983930587768555, "global_step": 76286, "epoch": 1816} {"train_loss": -6.080690383911133, "global_step": 76287, "epoch": 1816} {"train_loss": -6.097031593322754, "global_step": 76288, "epoch": 1816} {"train_loss": -5.996460914611816, "global_step": 76289, "epoch": 1816} {"train_loss": -6.0329999923706055, "global_step": 76290, "epoch": 1816} {"train_loss": -6.020325183868408, "global_step": 76291, "epoch": 1816} {"train_loss": -6.083020210266113, "global_step": 76292, "epoch": 1816} {"train_loss": -6.059029579162598, "global_step": 76293, "epoch": 1816} {"train_loss": -6.131195068359375, "global_step": 76294, "epoch": 1816} {"train_loss": -6.179222583770752, "global_step": 76295, "epoch": 1816} {"train_loss": -6.043412208557129, "global_step": 76296, "epoch": 1816} {"train_loss": -5.947668075561523, "global_step": 76297, "epoch": 1816} {"train_loss": -6.0743255615234375, "global_step": 76298, "epoch": 1816} {"train_loss": -6.050124168395996, "global_step": 76299, "epoch": 1816} {"train_loss": -6.060177803039551, "global_step": 76300, "epoch": 1816} {"train_loss": -6.074418544769287, "global_step": 76301, "epoch": 1816} {"train_loss": -6.049120903015137, "global_step": 76302, "epoch": 1816} {"train_loss": -6.102306365966797, "global_step": 76303, "epoch": 1816} {"train_loss": -5.985005855560303, "global_step": 76304, "epoch": 1816} {"train_loss": -6.0654497146606445, "global_step": 76305, "epoch": 1816} {"train_loss": -6.139492988586426, "global_step": 76306, "epoch": 1816} {"train_loss": -6.077870845794678, "global_step": 76307, "epoch": 1816} {"train_loss": -5.967413425445557, "global_step": 76308, "epoch": 1816} {"train_loss": -5.9785919189453125, "global_step": 76309, "epoch": 1816} {"train_loss": -6.03528356552124, "global_step": 76310, "epoch": 1816} {"train_loss": -6.058879852294922, "global_step": 76311, "epoch": 1816} {"train_loss": -6.173853874206543, "global_step": 76312, "epoch": 1816} {"train_loss": -6.080199480056763, "global_step": 76313, "epoch": 1816, "val_loss": 74752.8046875} {"train_loss": -6.138053894042969, "global_step": 76314, "epoch": 1817} {"train_loss": -6.000065326690674, "global_step": 76315, "epoch": 1817} {"train_loss": -6.16488790512085, "global_step": 76316, "epoch": 1817} {"train_loss": -6.2605156898498535, "global_step": 76317, "epoch": 1817} {"train_loss": -6.081830978393555, "global_step": 76318, "epoch": 1817} {"train_loss": -6.065077304840088, "global_step": 76319, "epoch": 1817} {"train_loss": -6.126025199890137, "global_step": 76320, "epoch": 1817} {"train_loss": -6.022075653076172, "global_step": 76321, "epoch": 1817} {"train_loss": -6.135196208953857, "global_step": 76322, "epoch": 1817} {"train_loss": -6.175272464752197, "global_step": 76323, "epoch": 1817} {"train_loss": -6.096719264984131, "global_step": 76324, "epoch": 1817} {"train_loss": -6.138833999633789, "global_step": 76325, "epoch": 1817} {"train_loss": -6.112512588500977, "global_step": 76326, "epoch": 1817} {"train_loss": -6.054709434509277, "global_step": 76327, "epoch": 1817} {"train_loss": -5.978115081787109, "global_step": 76328, "epoch": 1817} {"train_loss": -6.144796371459961, "global_step": 76329, "epoch": 1817} {"train_loss": -6.044153213500977, "global_step": 76330, "epoch": 1817} {"train_loss": -5.987173080444336, "global_step": 76331, "epoch": 1817} {"train_loss": -6.204591751098633, "global_step": 76332, "epoch": 1817} {"train_loss": -6.108929634094238, "global_step": 76333, "epoch": 1817} {"train_loss": -6.057676315307617, "global_step": 76334, "epoch": 1817} {"train_loss": -6.182865142822266, "global_step": 76335, "epoch": 1817} {"train_loss": -6.1422810554504395, "global_step": 76336, "epoch": 1817} {"train_loss": -6.254520893096924, "global_step": 76337, "epoch": 1817} {"train_loss": -5.914391994476318, "global_step": 76338, "epoch": 1817} {"train_loss": -6.0760698318481445, "global_step": 76339, "epoch": 1817} {"train_loss": -5.9995951652526855, "global_step": 76340, "epoch": 1817} {"train_loss": -5.9728851318359375, "global_step": 76341, "epoch": 1817} {"train_loss": -6.222621440887451, "global_step": 76342, "epoch": 1817} {"train_loss": -6.056541442871094, "global_step": 76343, "epoch": 1817} {"train_loss": -6.0757856369018555, "global_step": 76344, "epoch": 1817} {"train_loss": -6.156495094299316, "global_step": 76345, "epoch": 1817} {"train_loss": -6.1214399337768555, "global_step": 76346, "epoch": 1817} {"train_loss": -6.15303897857666, "global_step": 76347, "epoch": 1817} {"train_loss": -6.191264629364014, "global_step": 76348, "epoch": 1817} {"train_loss": -6.030087471008301, "global_step": 76349, "epoch": 1817} {"train_loss": -6.015737533569336, "global_step": 76350, "epoch": 1817} {"train_loss": -6.143442630767822, "global_step": 76351, "epoch": 1817} {"train_loss": -6.1753435134887695, "global_step": 76352, "epoch": 1817} {"train_loss": -6.106369972229004, "global_step": 76353, "epoch": 1817} {"train_loss": -6.0927019119262695, "global_step": 76354, "epoch": 1817} {"train_loss": -6.101824578784761, "global_step": 76355, "epoch": 1817, "val_loss": 75172.109375} {"train_loss": -6.0993499755859375, "global_step": 76356, "epoch": 1818} {"train_loss": -6.140095233917236, "global_step": 76357, "epoch": 1818} {"train_loss": -6.054193019866943, "global_step": 76358, "epoch": 1818} {"train_loss": -6.047293186187744, "global_step": 76359, "epoch": 1818} {"train_loss": -5.8646650314331055, "global_step": 76360, "epoch": 1818} {"train_loss": -6.143407821655273, "global_step": 76361, "epoch": 1818} {"train_loss": -6.009739875793457, "global_step": 76362, "epoch": 1818} {"train_loss": -5.996874809265137, "global_step": 76363, "epoch": 1818} {"train_loss": -6.139750003814697, "global_step": 76364, "epoch": 1818} {"train_loss": -5.970659255981445, "global_step": 76365, "epoch": 1818} {"train_loss": -6.030641555786133, "global_step": 76366, "epoch": 1818} {"train_loss": -6.002753257751465, "global_step": 76367, "epoch": 1818} {"train_loss": -6.011109352111816, "global_step": 76368, "epoch": 1818} {"train_loss": -6.003918647766113, "global_step": 76369, "epoch": 1818} {"train_loss": -6.019281387329102, "global_step": 76370, "epoch": 1818} {"train_loss": -6.037555694580078, "global_step": 76371, "epoch": 1818} {"train_loss": -5.913402557373047, "global_step": 76372, "epoch": 1818} {"train_loss": -6.087665557861328, "global_step": 76373, "epoch": 1818} {"train_loss": -5.945338249206543, "global_step": 76374, "epoch": 1818} {"train_loss": -6.076282024383545, "global_step": 76375, "epoch": 1818} {"train_loss": -6.040591239929199, "global_step": 76376, "epoch": 1818} {"train_loss": -6.066866874694824, "global_step": 76377, "epoch": 1818} {"train_loss": -6.163610935211182, "global_step": 76378, "epoch": 1818} {"train_loss": -6.078851222991943, "global_step": 76379, "epoch": 1818} {"train_loss": -6.088979721069336, "global_step": 76380, "epoch": 1818} {"train_loss": -6.086268901824951, "global_step": 76381, "epoch": 1818} {"train_loss": -6.131537437438965, "global_step": 76382, "epoch": 1818} {"train_loss": -6.1520586013793945, "global_step": 76383, "epoch": 1818} {"train_loss": -6.0999345779418945, "global_step": 76384, "epoch": 1818} {"train_loss": -5.988076210021973, "global_step": 76385, "epoch": 1818} {"train_loss": -6.175714492797852, "global_step": 76386, "epoch": 1818} {"train_loss": -5.983304500579834, "global_step": 76387, "epoch": 1818} {"train_loss": -6.1030731201171875, "global_step": 76388, "epoch": 1818} {"train_loss": -6.086820602416992, "global_step": 76389, "epoch": 1818} {"train_loss": -6.035362243652344, "global_step": 76390, "epoch": 1818} {"train_loss": -6.146697521209717, "global_step": 76391, "epoch": 1818} {"train_loss": -5.989506721496582, "global_step": 76392, "epoch": 1818} {"train_loss": -6.046745300292969, "global_step": 76393, "epoch": 1818} {"train_loss": -6.172663688659668, "global_step": 76394, "epoch": 1818} {"train_loss": -6.144258499145508, "global_step": 76395, "epoch": 1818} {"train_loss": -6.118041515350342, "global_step": 76396, "epoch": 1818} {"train_loss": -6.064177445002964, "global_step": 76397, "epoch": 1818, "val_loss": 74766.5} {"train_loss": -6.096405029296875, "global_step": 76398, "epoch": 1819} {"train_loss": -6.092106342315674, "global_step": 76399, "epoch": 1819} {"train_loss": -6.24107551574707, "global_step": 76400, "epoch": 1819} {"train_loss": -6.063728332519531, "global_step": 76401, "epoch": 1819} {"train_loss": -6.112425327301025, "global_step": 76402, "epoch": 1819} {"train_loss": -6.154755592346191, "global_step": 76403, "epoch": 1819} {"train_loss": -6.2130937576293945, "global_step": 76404, "epoch": 1819} {"train_loss": -6.093283176422119, "global_step": 76405, "epoch": 1819} {"train_loss": -6.19500732421875, "global_step": 76406, "epoch": 1819} {"train_loss": -6.091625213623047, "global_step": 76407, "epoch": 1819} {"train_loss": -6.011936664581299, "global_step": 76408, "epoch": 1819} {"train_loss": -6.13942289352417, "global_step": 76409, "epoch": 1819} {"train_loss": -6.1979875564575195, "global_step": 76410, "epoch": 1819} {"train_loss": -6.096951007843018, "global_step": 76411, "epoch": 1819} {"train_loss": -6.272654056549072, "global_step": 76412, "epoch": 1819} {"train_loss": -6.109419822692871, "global_step": 76413, "epoch": 1819} {"train_loss": -6.034727573394775, "global_step": 76414, "epoch": 1819} {"train_loss": -5.993518829345703, "global_step": 76415, "epoch": 1819} {"train_loss": -6.058290481567383, "global_step": 76416, "epoch": 1819} {"train_loss": -6.171961784362793, "global_step": 76417, "epoch": 1819} {"train_loss": -6.064360618591309, "global_step": 76418, "epoch": 1819} {"train_loss": -6.094961166381836, "global_step": 76419, "epoch": 1819} {"train_loss": -6.137563228607178, "global_step": 76420, "epoch": 1819} {"train_loss": -6.018953800201416, "global_step": 76421, "epoch": 1819} {"train_loss": -6.001823902130127, "global_step": 76422, "epoch": 1819} {"train_loss": -6.142303466796875, "global_step": 76423, "epoch": 1819} {"train_loss": -6.12763786315918, "global_step": 76424, "epoch": 1819} {"train_loss": -6.104286193847656, "global_step": 76425, "epoch": 1819} {"train_loss": -5.951417446136475, "global_step": 76426, "epoch": 1819} {"train_loss": -6.032092094421387, "global_step": 76427, "epoch": 1819} {"train_loss": -6.209132194519043, "global_step": 76428, "epoch": 1819} {"train_loss": -6.049488067626953, "global_step": 76429, "epoch": 1819} {"train_loss": -6.09470272064209, "global_step": 76430, "epoch": 1819} {"train_loss": -6.080507278442383, "global_step": 76431, "epoch": 1819} {"train_loss": -6.128902912139893, "global_step": 76432, "epoch": 1819} {"train_loss": -6.050729751586914, "global_step": 76433, "epoch": 1819} {"train_loss": -6.077994346618652, "global_step": 76434, "epoch": 1819} {"train_loss": -6.150411128997803, "global_step": 76435, "epoch": 1819} {"train_loss": -6.217833518981934, "global_step": 76436, "epoch": 1819} {"train_loss": -6.096494674682617, "global_step": 76437, "epoch": 1819} {"train_loss": -6.12906551361084, "global_step": 76438, "epoch": 1819} {"train_loss": -6.10317385764349, "global_step": 76439, "epoch": 1819, "val_loss": 74744.8046875} {"train_loss": -6.038440227508545, "global_step": 76440, "epoch": 1820} {"train_loss": -6.002531051635742, "global_step": 76441, "epoch": 1820} {"train_loss": -6.117692470550537, "global_step": 76442, "epoch": 1820} {"train_loss": -6.128793716430664, "global_step": 76443, "epoch": 1820} {"train_loss": -6.1790313720703125, "global_step": 76444, "epoch": 1820} {"train_loss": -6.012779235839844, "global_step": 76445, "epoch": 1820} {"train_loss": -6.0976128578186035, "global_step": 76446, "epoch": 1820} {"train_loss": -6.190741539001465, "global_step": 76447, "epoch": 1820} {"train_loss": -6.250123977661133, "global_step": 76448, "epoch": 1820} {"train_loss": -6.151841163635254, "global_step": 76449, "epoch": 1820} {"train_loss": -6.124973297119141, "global_step": 76450, "epoch": 1820} {"train_loss": -6.167360782623291, "global_step": 76451, "epoch": 1820} {"train_loss": -6.20235538482666, "global_step": 76452, "epoch": 1820} {"train_loss": -6.060466289520264, "global_step": 76453, "epoch": 1820} {"train_loss": -6.068655014038086, "global_step": 76454, "epoch": 1820} {"train_loss": -6.2577362060546875, "global_step": 76455, "epoch": 1820} {"train_loss": -6.151460647583008, "global_step": 76456, "epoch": 1820} {"train_loss": -6.138839244842529, "global_step": 76457, "epoch": 1820} {"train_loss": -6.124030113220215, "global_step": 76458, "epoch": 1820} {"train_loss": -6.054385662078857, "global_step": 76459, "epoch": 1820} {"train_loss": -6.0898261070251465, "global_step": 76460, "epoch": 1820} {"train_loss": -6.168370246887207, "global_step": 76461, "epoch": 1820} {"train_loss": -6.109104156494141, "global_step": 76462, "epoch": 1820} {"train_loss": -6.078144073486328, "global_step": 76463, "epoch": 1820} {"train_loss": -6.105857849121094, "global_step": 76464, "epoch": 1820} {"train_loss": -6.076202392578125, "global_step": 76465, "epoch": 1820} {"train_loss": -6.030597686767578, "global_step": 76466, "epoch": 1820} {"train_loss": -6.103732585906982, "global_step": 76467, "epoch": 1820} {"train_loss": -5.980290412902832, "global_step": 76468, "epoch": 1820} {"train_loss": -5.961172103881836, "global_step": 76469, "epoch": 1820} {"train_loss": -6.138912200927734, "global_step": 76470, "epoch": 1820} {"train_loss": -6.077070236206055, "global_step": 76471, "epoch": 1820} {"train_loss": -5.905574798583984, "global_step": 76472, "epoch": 1820} {"train_loss": -6.18512487411499, "global_step": 76473, "epoch": 1820} {"train_loss": -6.237163543701172, "global_step": 76474, "epoch": 1820} {"train_loss": -5.984360694885254, "global_step": 76475, "epoch": 1820} {"train_loss": -6.077329158782959, "global_step": 76476, "epoch": 1820} {"train_loss": -6.0206217765808105, "global_step": 76477, "epoch": 1820} {"train_loss": -6.046328544616699, "global_step": 76478, "epoch": 1820} {"train_loss": -6.130720138549805, "global_step": 76479, "epoch": 1820} {"train_loss": -5.962344646453857, "global_step": 76480, "epoch": 1820} {"train_loss": -6.099409228279477, "global_step": 76481, "epoch": 1820, "val_loss": 74806.4921875} {"train_loss": -6.157907962799072, "global_step": 76482, "epoch": 1821} {"train_loss": -6.116429328918457, "global_step": 76483, "epoch": 1821} {"train_loss": -6.148136138916016, "global_step": 76484, "epoch": 1821} {"train_loss": -6.164118766784668, "global_step": 76485, "epoch": 1821} {"train_loss": -6.0775146484375, "global_step": 76486, "epoch": 1821} {"train_loss": -6.103711128234863, "global_step": 76487, "epoch": 1821} {"train_loss": -6.167351722717285, "global_step": 76488, "epoch": 1821} {"train_loss": -6.053874969482422, "global_step": 76489, "epoch": 1821} {"train_loss": -6.141543388366699, "global_step": 76490, "epoch": 1821} {"train_loss": -6.12054443359375, "global_step": 76491, "epoch": 1821} {"train_loss": -6.084444999694824, "global_step": 76492, "epoch": 1821} {"train_loss": -5.966803073883057, "global_step": 76493, "epoch": 1821} {"train_loss": -6.156002044677734, "global_step": 76494, "epoch": 1821} {"train_loss": -5.986215591430664, "global_step": 76495, "epoch": 1821} {"train_loss": -6.028908729553223, "global_step": 76496, "epoch": 1821} {"train_loss": -6.0790205001831055, "global_step": 76497, "epoch": 1821} {"train_loss": -6.030370235443115, "global_step": 76498, "epoch": 1821} {"train_loss": -6.0807390213012695, "global_step": 76499, "epoch": 1821} {"train_loss": -6.168376922607422, "global_step": 76500, "epoch": 1821} {"train_loss": -6.101409912109375, "global_step": 76501, "epoch": 1821} {"train_loss": -6.058714389801025, "global_step": 76502, "epoch": 1821} {"train_loss": -6.141666412353516, "global_step": 76503, "epoch": 1821} {"train_loss": -6.106925964355469, "global_step": 76504, "epoch": 1821} {"train_loss": -6.097376823425293, "global_step": 76505, "epoch": 1821} {"train_loss": -6.151049613952637, "global_step": 76506, "epoch": 1821} {"train_loss": -6.033703327178955, "global_step": 76507, "epoch": 1821} {"train_loss": -6.154512882232666, "global_step": 76508, "epoch": 1821} {"train_loss": -6.2374091148376465, "global_step": 76509, "epoch": 1821} {"train_loss": -6.08077335357666, "global_step": 76510, "epoch": 1821} {"train_loss": -5.9756669998168945, "global_step": 76511, "epoch": 1821} {"train_loss": -6.248717784881592, "global_step": 76512, "epoch": 1821} {"train_loss": -6.118078708648682, "global_step": 76513, "epoch": 1821} {"train_loss": -6.124971389770508, "global_step": 76514, "epoch": 1821} {"train_loss": -6.068887710571289, "global_step": 76515, "epoch": 1821} {"train_loss": -6.0098371505737305, "global_step": 76516, "epoch": 1821} {"train_loss": -6.127720832824707, "global_step": 76517, "epoch": 1821} {"train_loss": -6.065055847167969, "global_step": 76518, "epoch": 1821} {"train_loss": -6.038590908050537, "global_step": 76519, "epoch": 1821} {"train_loss": -5.966488838195801, "global_step": 76520, "epoch": 1821} {"train_loss": -6.024564743041992, "global_step": 76521, "epoch": 1821} {"train_loss": -5.988807678222656, "global_step": 76522, "epoch": 1821} {"train_loss": -6.094016790390015, "global_step": 76523, "epoch": 1821, "val_loss": 75307.703125} {"train_loss": -6.140893936157227, "global_step": 76524, "epoch": 1822} {"train_loss": -5.993598937988281, "global_step": 76525, "epoch": 1822} {"train_loss": -6.068723678588867, "global_step": 76526, "epoch": 1822} {"train_loss": -5.9981207847595215, "global_step": 76527, "epoch": 1822} {"train_loss": -6.045411109924316, "global_step": 76528, "epoch": 1822} {"train_loss": -6.069062232971191, "global_step": 76529, "epoch": 1822} {"train_loss": -6.009897232055664, "global_step": 76530, "epoch": 1822} {"train_loss": -6.075308799743652, "global_step": 76531, "epoch": 1822} {"train_loss": -6.086511135101318, "global_step": 76532, "epoch": 1822} {"train_loss": -6.127578258514404, "global_step": 76533, "epoch": 1822} {"train_loss": -6.097779750823975, "global_step": 76534, "epoch": 1822} {"train_loss": -5.998841285705566, "global_step": 76535, "epoch": 1822} {"train_loss": -6.042635917663574, "global_step": 76536, "epoch": 1822} {"train_loss": -6.103497505187988, "global_step": 76537, "epoch": 1822} {"train_loss": -6.098465919494629, "global_step": 76538, "epoch": 1822} {"train_loss": -6.055600166320801, "global_step": 76539, "epoch": 1822} {"train_loss": -6.066811561584473, "global_step": 76540, "epoch": 1822} {"train_loss": -6.080232620239258, "global_step": 76541, "epoch": 1822} {"train_loss": -6.090696334838867, "global_step": 76542, "epoch": 1822} {"train_loss": -5.8804192543029785, "global_step": 76543, "epoch": 1822} {"train_loss": -6.0416107177734375, "global_step": 76544, "epoch": 1822} {"train_loss": -5.954623699188232, "global_step": 76545, "epoch": 1822} {"train_loss": -6.038717269897461, "global_step": 76546, "epoch": 1822} {"train_loss": -6.136684894561768, "global_step": 76547, "epoch": 1822} {"train_loss": -5.968546390533447, "global_step": 76548, "epoch": 1822} {"train_loss": -6.096867084503174, "global_step": 76549, "epoch": 1822} {"train_loss": -6.070345878601074, "global_step": 76550, "epoch": 1822} {"train_loss": -6.071738243103027, "global_step": 76551, "epoch": 1822} {"train_loss": -6.136620998382568, "global_step": 76552, "epoch": 1822} {"train_loss": -6.045220851898193, "global_step": 76553, "epoch": 1822} {"train_loss": -6.038664817810059, "global_step": 76554, "epoch": 1822} {"train_loss": -6.03489875793457, "global_step": 76555, "epoch": 1822} {"train_loss": -6.063343048095703, "global_step": 76556, "epoch": 1822} {"train_loss": -6.079611778259277, "global_step": 76557, "epoch": 1822} {"train_loss": -6.125921249389648, "global_step": 76558, "epoch": 1822} {"train_loss": -6.068752288818359, "global_step": 76559, "epoch": 1822} {"train_loss": -6.050294399261475, "global_step": 76560, "epoch": 1822} {"train_loss": -6.162372589111328, "global_step": 76561, "epoch": 1822} {"train_loss": -6.071174621582031, "global_step": 76562, "epoch": 1822} {"train_loss": -6.124579429626465, "global_step": 76563, "epoch": 1822} {"train_loss": -6.005701541900635, "global_step": 76564, "epoch": 1822} {"train_loss": -6.058274655115037, "global_step": 76565, "epoch": 1822, "val_loss": 74962.890625} {"train_loss": -6.070051670074463, "global_step": 76566, "epoch": 1823} {"train_loss": -5.967987060546875, "global_step": 76567, "epoch": 1823} {"train_loss": -6.151378631591797, "global_step": 76568, "epoch": 1823} {"train_loss": -5.967853546142578, "global_step": 76569, "epoch": 1823} {"train_loss": -6.099056720733643, "global_step": 76570, "epoch": 1823} {"train_loss": -6.193160057067871, "global_step": 76571, "epoch": 1823} {"train_loss": -6.136471748352051, "global_step": 76572, "epoch": 1823} {"train_loss": -6.180870056152344, "global_step": 76573, "epoch": 1823} {"train_loss": -5.844845294952393, "global_step": 76574, "epoch": 1823} {"train_loss": -6.1208930015563965, "global_step": 76575, "epoch": 1823} {"train_loss": -6.052712440490723, "global_step": 76576, "epoch": 1823} {"train_loss": -6.087635517120361, "global_step": 76577, "epoch": 1823} {"train_loss": -5.9655961990356445, "global_step": 76578, "epoch": 1823} {"train_loss": -6.003872394561768, "global_step": 76579, "epoch": 1823} {"train_loss": -6.006539344787598, "global_step": 76580, "epoch": 1823} {"train_loss": -6.010303497314453, "global_step": 76581, "epoch": 1823} {"train_loss": -6.1099653244018555, "global_step": 76582, "epoch": 1823} {"train_loss": -6.1596856117248535, "global_step": 76583, "epoch": 1823} {"train_loss": -6.082258224487305, "global_step": 76584, "epoch": 1823} {"train_loss": -6.194615364074707, "global_step": 76585, "epoch": 1823} {"train_loss": -6.116062164306641, "global_step": 76586, "epoch": 1823} {"train_loss": -5.965547561645508, "global_step": 76587, "epoch": 1823} {"train_loss": -6.128723621368408, "global_step": 76588, "epoch": 1823} {"train_loss": -6.146789073944092, "global_step": 76589, "epoch": 1823} {"train_loss": -6.0157928466796875, "global_step": 76590, "epoch": 1823} {"train_loss": -6.074453830718994, "global_step": 76591, "epoch": 1823} {"train_loss": -6.199883937835693, "global_step": 76592, "epoch": 1823} {"train_loss": -6.072260856628418, "global_step": 76593, "epoch": 1823} {"train_loss": -6.295985221862793, "global_step": 76594, "epoch": 1823} {"train_loss": -6.089963912963867, "global_step": 76595, "epoch": 1823} {"train_loss": -6.111169338226318, "global_step": 76596, "epoch": 1823} {"train_loss": -6.136195182800293, "global_step": 76597, "epoch": 1823} {"train_loss": -6.101770877838135, "global_step": 76598, "epoch": 1823} {"train_loss": -6.067290782928467, "global_step": 76599, "epoch": 1823} {"train_loss": -6.122857093811035, "global_step": 76600, "epoch": 1823} {"train_loss": -6.030804634094238, "global_step": 76601, "epoch": 1823} {"train_loss": -6.015636920928955, "global_step": 76602, "epoch": 1823} {"train_loss": -6.075614929199219, "global_step": 76603, "epoch": 1823} {"train_loss": -6.069201469421387, "global_step": 76604, "epoch": 1823} {"train_loss": -6.1634297370910645, "global_step": 76605, "epoch": 1823} {"train_loss": -6.113762855529785, "global_step": 76606, "epoch": 1823} {"train_loss": -6.08525139944894, "global_step": 76607, "epoch": 1823, "val_loss": 75096.0546875} {"train_loss": -6.107476234436035, "global_step": 76608, "epoch": 1824} {"train_loss": -6.090055465698242, "global_step": 76609, "epoch": 1824} {"train_loss": -5.9602813720703125, "global_step": 76610, "epoch": 1824} {"train_loss": -6.205429553985596, "global_step": 76611, "epoch": 1824} {"train_loss": -5.981114864349365, "global_step": 76612, "epoch": 1824} {"train_loss": -6.118155479431152, "global_step": 76613, "epoch": 1824} {"train_loss": -6.116408348083496, "global_step": 76614, "epoch": 1824} {"train_loss": -5.998385906219482, "global_step": 76615, "epoch": 1824} {"train_loss": -6.125417232513428, "global_step": 76616, "epoch": 1824} {"train_loss": -6.006901264190674, "global_step": 76617, "epoch": 1824} {"train_loss": -6.090169429779053, "global_step": 76618, "epoch": 1824} {"train_loss": -6.0265727043151855, "global_step": 76619, "epoch": 1824} {"train_loss": -6.072882652282715, "global_step": 76620, "epoch": 1824} {"train_loss": -6.173195838928223, "global_step": 76621, "epoch": 1824} {"train_loss": -5.95445442199707, "global_step": 76622, "epoch": 1824} {"train_loss": -6.090479850769043, "global_step": 76623, "epoch": 1824} {"train_loss": -6.026698589324951, "global_step": 76624, "epoch": 1824} {"train_loss": -6.0211992263793945, "global_step": 76625, "epoch": 1824} {"train_loss": -5.976906776428223, "global_step": 76626, "epoch": 1824} {"train_loss": -6.047794342041016, "global_step": 76627, "epoch": 1824} {"train_loss": -6.092951774597168, "global_step": 76628, "epoch": 1824} {"train_loss": -6.0886616706848145, "global_step": 76629, "epoch": 1824} {"train_loss": -6.115321159362793, "global_step": 76630, "epoch": 1824} {"train_loss": -6.1426496505737305, "global_step": 76631, "epoch": 1824} {"train_loss": -6.00628137588501, "global_step": 76632, "epoch": 1824} {"train_loss": -6.136719226837158, "global_step": 76633, "epoch": 1824} {"train_loss": -6.0908355712890625, "global_step": 76634, "epoch": 1824} {"train_loss": -6.113565444946289, "global_step": 76635, "epoch": 1824} {"train_loss": -6.110169410705566, "global_step": 76636, "epoch": 1824} {"train_loss": -6.113062381744385, "global_step": 76637, "epoch": 1824} {"train_loss": -6.135993480682373, "global_step": 76638, "epoch": 1824} {"train_loss": -6.033574104309082, "global_step": 76639, "epoch": 1824} {"train_loss": -6.087202072143555, "global_step": 76640, "epoch": 1824} {"train_loss": -6.191474437713623, "global_step": 76641, "epoch": 1824} {"train_loss": -6.226813316345215, "global_step": 76642, "epoch": 1824} {"train_loss": -6.216036796569824, "global_step": 76643, "epoch": 1824} {"train_loss": -6.0567827224731445, "global_step": 76644, "epoch": 1824} {"train_loss": -6.161744117736816, "global_step": 76645, "epoch": 1824} {"train_loss": -6.1084723472595215, "global_step": 76646, "epoch": 1824} {"train_loss": -6.126323699951172, "global_step": 76647, "epoch": 1824} {"train_loss": -6.20525598526001, "global_step": 76648, "epoch": 1824} {"train_loss": -6.092173871539888, "global_step": 76649, "epoch": 1824, "val_loss": 75153.5390625} {"train_loss": -6.104556560516357, "global_step": 76650, "epoch": 1825} {"train_loss": -6.098283767700195, "global_step": 76651, "epoch": 1825} {"train_loss": -6.112591743469238, "global_step": 76652, "epoch": 1825} {"train_loss": -6.127472877502441, "global_step": 76653, "epoch": 1825} {"train_loss": -6.063777446746826, "global_step": 76654, "epoch": 1825} {"train_loss": -6.124045372009277, "global_step": 76655, "epoch": 1825} {"train_loss": -6.056636810302734, "global_step": 76656, "epoch": 1825} {"train_loss": -6.101155757904053, "global_step": 76657, "epoch": 1825} {"train_loss": -6.020881652832031, "global_step": 76658, "epoch": 1825} {"train_loss": -6.101749420166016, "global_step": 76659, "epoch": 1825} {"train_loss": -6.053098678588867, "global_step": 76660, "epoch": 1825} {"train_loss": -6.262588977813721, "global_step": 76661, "epoch": 1825} {"train_loss": -6.0286054611206055, "global_step": 76662, "epoch": 1825} {"train_loss": -6.076068878173828, "global_step": 76663, "epoch": 1825} {"train_loss": -6.003523826599121, "global_step": 76664, "epoch": 1825} {"train_loss": -6.041750907897949, "global_step": 76665, "epoch": 1825} {"train_loss": -6.213991165161133, "global_step": 76666, "epoch": 1825} {"train_loss": -6.199801445007324, "global_step": 76667, "epoch": 1825} {"train_loss": -6.077611923217773, "global_step": 76668, "epoch": 1825} {"train_loss": -6.134615421295166, "global_step": 76669, "epoch": 1825} {"train_loss": -6.167639255523682, "global_step": 76670, "epoch": 1825} {"train_loss": -6.110257148742676, "global_step": 76671, "epoch": 1825} {"train_loss": -5.987148284912109, "global_step": 76672, "epoch": 1825} {"train_loss": -6.107278823852539, "global_step": 76673, "epoch": 1825} {"train_loss": -6.122262954711914, "global_step": 76674, "epoch": 1825} {"train_loss": -6.0314154624938965, "global_step": 76675, "epoch": 1825} {"train_loss": -6.14607048034668, "global_step": 76676, "epoch": 1825} {"train_loss": -6.073265552520752, "global_step": 76677, "epoch": 1825} {"train_loss": -6.0335373878479, "global_step": 76678, "epoch": 1825} {"train_loss": -6.186407566070557, "global_step": 76679, "epoch": 1825} {"train_loss": -6.018138885498047, "global_step": 76680, "epoch": 1825} {"train_loss": -6.065812587738037, "global_step": 76681, "epoch": 1825} {"train_loss": -6.140969753265381, "global_step": 76682, "epoch": 1825} {"train_loss": -6.095491886138916, "global_step": 76683, "epoch": 1825} {"train_loss": -6.114007949829102, "global_step": 76684, "epoch": 1825} {"train_loss": -6.078874588012695, "global_step": 76685, "epoch": 1825} {"train_loss": -5.9288554191589355, "global_step": 76686, "epoch": 1825} {"train_loss": -6.052206516265869, "global_step": 76687, "epoch": 1825} {"train_loss": -6.038606643676758, "global_step": 76688, "epoch": 1825} {"train_loss": -6.07646369934082, "global_step": 76689, "epoch": 1825} {"train_loss": -6.011431694030762, "global_step": 76690, "epoch": 1825} {"train_loss": -6.08642670086452, "global_step": 76691, "epoch": 1825, "val_loss": 75079.6640625} {"train_loss": -6.112558364868164, "global_step": 76692, "epoch": 1826} {"train_loss": -6.171091079711914, "global_step": 76693, "epoch": 1826} {"train_loss": -6.088139533996582, "global_step": 76694, "epoch": 1826} {"train_loss": -6.207951545715332, "global_step": 76695, "epoch": 1826} {"train_loss": -6.083059310913086, "global_step": 76696, "epoch": 1826} {"train_loss": -6.152649879455566, "global_step": 76697, "epoch": 1826} {"train_loss": -6.065792083740234, "global_step": 76698, "epoch": 1826} {"train_loss": -6.123558044433594, "global_step": 76699, "epoch": 1826} {"train_loss": -6.078940391540527, "global_step": 76700, "epoch": 1826} {"train_loss": -5.966808319091797, "global_step": 76701, "epoch": 1826} {"train_loss": -6.291670799255371, "global_step": 76702, "epoch": 1826} {"train_loss": -6.0319390296936035, "global_step": 76703, "epoch": 1826} {"train_loss": -6.005880355834961, "global_step": 76704, "epoch": 1826} {"train_loss": -5.97309684753418, "global_step": 76705, "epoch": 1826} {"train_loss": -5.925302028656006, "global_step": 76706, "epoch": 1826} {"train_loss": -6.03972053527832, "global_step": 76707, "epoch": 1826} {"train_loss": -6.061501502990723, "global_step": 76708, "epoch": 1826} {"train_loss": -5.968189239501953, "global_step": 76709, "epoch": 1826} {"train_loss": -6.035711288452148, "global_step": 76710, "epoch": 1826} {"train_loss": -6.030918121337891, "global_step": 76711, "epoch": 1826} {"train_loss": -6.205531597137451, "global_step": 76712, "epoch": 1826} {"train_loss": -6.126676559448242, "global_step": 76713, "epoch": 1826} {"train_loss": -5.931772708892822, "global_step": 76714, "epoch": 1826} {"train_loss": -6.17694091796875, "global_step": 76715, "epoch": 1826} {"train_loss": -6.0975341796875, "global_step": 76716, "epoch": 1826} {"train_loss": -6.084395885467529, "global_step": 76717, "epoch": 1826} {"train_loss": -5.964255332946777, "global_step": 76718, "epoch": 1826} {"train_loss": -6.075570106506348, "global_step": 76719, "epoch": 1826} {"train_loss": -6.057360649108887, "global_step": 76720, "epoch": 1826} {"train_loss": -6.024094581604004, "global_step": 76721, "epoch": 1826} {"train_loss": -6.013241291046143, "global_step": 76722, "epoch": 1826} {"train_loss": -5.939462661743164, "global_step": 76723, "epoch": 1826} {"train_loss": -6.095871925354004, "global_step": 76724, "epoch": 1826} {"train_loss": -6.050528049468994, "global_step": 76725, "epoch": 1826} {"train_loss": -6.051591873168945, "global_step": 76726, "epoch": 1826} {"train_loss": -6.07896614074707, "global_step": 76727, "epoch": 1826} {"train_loss": -6.01308536529541, "global_step": 76728, "epoch": 1826} {"train_loss": -5.999512672424316, "global_step": 76729, "epoch": 1826} {"train_loss": -6.054152488708496, "global_step": 76730, "epoch": 1826} {"train_loss": -6.18726921081543, "global_step": 76731, "epoch": 1826} {"train_loss": -6.1819305419921875, "global_step": 76732, "epoch": 1826} {"train_loss": -6.070630834216163, "global_step": 76733, "epoch": 1826, "val_loss": 74952.734375} {"train_loss": -6.038710594177246, "global_step": 76734, "epoch": 1827} {"train_loss": -6.093143463134766, "global_step": 76735, "epoch": 1827} {"train_loss": -6.1938796043396, "global_step": 76736, "epoch": 1827} {"train_loss": -6.1623454093933105, "global_step": 76737, "epoch": 1827} {"train_loss": -5.968646049499512, "global_step": 76738, "epoch": 1827} {"train_loss": -6.319025993347168, "global_step": 76739, "epoch": 1827} {"train_loss": -6.165439605712891, "global_step": 76740, "epoch": 1827} {"train_loss": -6.147189140319824, "global_step": 76741, "epoch": 1827} {"train_loss": -6.115659236907959, "global_step": 76742, "epoch": 1827} {"train_loss": -6.079623222351074, "global_step": 76743, "epoch": 1827} {"train_loss": -5.929327011108398, "global_step": 76744, "epoch": 1827} {"train_loss": -6.197649002075195, "global_step": 76745, "epoch": 1827} {"train_loss": -6.0721635818481445, "global_step": 76746, "epoch": 1827} {"train_loss": -6.091814041137695, "global_step": 76747, "epoch": 1827} {"train_loss": -6.078279972076416, "global_step": 76748, "epoch": 1827} {"train_loss": -6.132142066955566, "global_step": 76749, "epoch": 1827} {"train_loss": -6.028292179107666, "global_step": 76750, "epoch": 1827} {"train_loss": -6.072122097015381, "global_step": 76751, "epoch": 1827} {"train_loss": -6.109114170074463, "global_step": 76752, "epoch": 1827} {"train_loss": -6.039285659790039, "global_step": 76753, "epoch": 1827} {"train_loss": -6.100354194641113, "global_step": 76754, "epoch": 1827} {"train_loss": -6.193233966827393, "global_step": 76755, "epoch": 1827} {"train_loss": -6.095625400543213, "global_step": 76756, "epoch": 1827} {"train_loss": -6.093842029571533, "global_step": 76757, "epoch": 1827} {"train_loss": -6.000768661499023, "global_step": 76758, "epoch": 1827} {"train_loss": -6.210816383361816, "global_step": 76759, "epoch": 1827} {"train_loss": -6.0427656173706055, "global_step": 76760, "epoch": 1827} {"train_loss": -6.049064636230469, "global_step": 76761, "epoch": 1827} {"train_loss": -6.138824462890625, "global_step": 76762, "epoch": 1827} {"train_loss": -6.07773494720459, "global_step": 76763, "epoch": 1827} {"train_loss": -6.071995735168457, "global_step": 76764, "epoch": 1827} {"train_loss": -6.015847206115723, "global_step": 76765, "epoch": 1827} {"train_loss": -6.0851898193359375, "global_step": 76766, "epoch": 1827} {"train_loss": -6.0566253662109375, "global_step": 76767, "epoch": 1827} {"train_loss": -6.0048627853393555, "global_step": 76768, "epoch": 1827} {"train_loss": -6.065973281860352, "global_step": 76769, "epoch": 1827} {"train_loss": -6.1222615242004395, "global_step": 76770, "epoch": 1827} {"train_loss": -6.131297588348389, "global_step": 76771, "epoch": 1827} {"train_loss": -6.106846332550049, "global_step": 76772, "epoch": 1827} {"train_loss": -6.142548561096191, "global_step": 76773, "epoch": 1827} {"train_loss": -6.115018844604492, "global_step": 76774, "epoch": 1827} {"train_loss": -6.094017392113095, "global_step": 76775, "epoch": 1827, "val_loss": 74980.6015625} {"train_loss": -6.132500648498535, "global_step": 76776, "epoch": 1828} {"train_loss": -6.105393886566162, "global_step": 76777, "epoch": 1828} {"train_loss": -6.04360294342041, "global_step": 76778, "epoch": 1828} {"train_loss": -6.118438720703125, "global_step": 76779, "epoch": 1828} {"train_loss": -6.145464897155762, "global_step": 76780, "epoch": 1828} {"train_loss": -5.997803211212158, "global_step": 76781, "epoch": 1828} {"train_loss": -6.115857124328613, "global_step": 76782, "epoch": 1828} {"train_loss": -5.945314884185791, "global_step": 76783, "epoch": 1828} {"train_loss": -6.082406044006348, "global_step": 76784, "epoch": 1828} {"train_loss": -6.0114827156066895, "global_step": 76785, "epoch": 1828} {"train_loss": -5.982613563537598, "global_step": 76786, "epoch": 1828} {"train_loss": -5.9879608154296875, "global_step": 76787, "epoch": 1828} {"train_loss": -6.015350341796875, "global_step": 76788, "epoch": 1828} {"train_loss": -6.050539970397949, "global_step": 76789, "epoch": 1828} {"train_loss": -6.043027400970459, "global_step": 76790, "epoch": 1828} {"train_loss": -6.093294143676758, "global_step": 76791, "epoch": 1828} {"train_loss": -6.078563690185547, "global_step": 76792, "epoch": 1828} {"train_loss": -5.9462480545043945, "global_step": 76793, "epoch": 1828} {"train_loss": -5.996833801269531, "global_step": 76794, "epoch": 1828} {"train_loss": -5.934951305389404, "global_step": 76795, "epoch": 1828} {"train_loss": -6.095198631286621, "global_step": 76796, "epoch": 1828} {"train_loss": -6.039853096008301, "global_step": 76797, "epoch": 1828} {"train_loss": -5.969862937927246, "global_step": 76798, "epoch": 1828} {"train_loss": -6.045444488525391, "global_step": 76799, "epoch": 1828} {"train_loss": -6.131822109222412, "global_step": 76800, "epoch": 1828} {"train_loss": -5.9513444900512695, "global_step": 76801, "epoch": 1828} {"train_loss": -6.080399513244629, "global_step": 76802, "epoch": 1828} {"train_loss": -6.009280204772949, "global_step": 76803, "epoch": 1828} {"train_loss": -6.022249221801758, "global_step": 76804, "epoch": 1828} {"train_loss": -6.067702293395996, "global_step": 76805, "epoch": 1828} {"train_loss": -5.990226745605469, "global_step": 76806, "epoch": 1828} {"train_loss": -6.0642805099487305, "global_step": 76807, "epoch": 1828} {"train_loss": -6.025577545166016, "global_step": 76808, "epoch": 1828} {"train_loss": -6.0792741775512695, "global_step": 76809, "epoch": 1828} {"train_loss": -6.102064609527588, "global_step": 76810, "epoch": 1828} {"train_loss": -6.07246732711792, "global_step": 76811, "epoch": 1828} {"train_loss": -6.128762722015381, "global_step": 76812, "epoch": 1828} {"train_loss": -6.143179893493652, "global_step": 76813, "epoch": 1828} {"train_loss": -5.971261501312256, "global_step": 76814, "epoch": 1828} {"train_loss": -6.130509376525879, "global_step": 76815, "epoch": 1828} {"train_loss": -6.089177131652832, "global_step": 76816, "epoch": 1828} {"train_loss": -6.051754837944394, "global_step": 76817, "epoch": 1828, "val_loss": 74718.2890625} {"train_loss": -6.049254417419434, "global_step": 76818, "epoch": 1829} {"train_loss": -6.022384166717529, "global_step": 76819, "epoch": 1829} {"train_loss": -5.956384181976318, "global_step": 76820, "epoch": 1829} {"train_loss": -6.10275411605835, "global_step": 76821, "epoch": 1829} {"train_loss": -6.0074310302734375, "global_step": 76822, "epoch": 1829} {"train_loss": -6.02449893951416, "global_step": 76823, "epoch": 1829} {"train_loss": -6.068508148193359, "global_step": 76824, "epoch": 1829} {"train_loss": -5.982387542724609, "global_step": 76825, "epoch": 1829} {"train_loss": -6.047201633453369, "global_step": 76826, "epoch": 1829} {"train_loss": -5.985669136047363, "global_step": 76827, "epoch": 1829} {"train_loss": -5.902012825012207, "global_step": 76828, "epoch": 1829} {"train_loss": -6.0901641845703125, "global_step": 76829, "epoch": 1829} {"train_loss": -6.078226089477539, "global_step": 76830, "epoch": 1829} {"train_loss": -6.001321792602539, "global_step": 76831, "epoch": 1829} {"train_loss": -6.0659990310668945, "global_step": 76832, "epoch": 1829} {"train_loss": -6.082986831665039, "global_step": 76833, "epoch": 1829} {"train_loss": -6.225502014160156, "global_step": 76834, "epoch": 1829} {"train_loss": -5.969724655151367, "global_step": 76835, "epoch": 1829} {"train_loss": -6.1332478523254395, "global_step": 76836, "epoch": 1829} {"train_loss": -6.078725814819336, "global_step": 76837, "epoch": 1829} {"train_loss": -5.955732822418213, "global_step": 76838, "epoch": 1829} {"train_loss": -6.094631195068359, "global_step": 76839, "epoch": 1829} {"train_loss": -6.087795734405518, "global_step": 76840, "epoch": 1829} {"train_loss": -6.0800676345825195, "global_step": 76841, "epoch": 1829} {"train_loss": -6.042605400085449, "global_step": 76842, "epoch": 1829} {"train_loss": -6.000395774841309, "global_step": 76843, "epoch": 1829} {"train_loss": -6.060430526733398, "global_step": 76844, "epoch": 1829} {"train_loss": -5.995571136474609, "global_step": 76845, "epoch": 1829} {"train_loss": -5.971498012542725, "global_step": 76846, "epoch": 1829} {"train_loss": -6.073182106018066, "global_step": 76847, "epoch": 1829} {"train_loss": -6.083016395568848, "global_step": 76848, "epoch": 1829} {"train_loss": -5.9606428146362305, "global_step": 76849, "epoch": 1829} {"train_loss": -5.965502738952637, "global_step": 76850, "epoch": 1829} {"train_loss": -6.099768161773682, "global_step": 76851, "epoch": 1829} {"train_loss": -6.123233795166016, "global_step": 76852, "epoch": 1829} {"train_loss": -5.890474796295166, "global_step": 76853, "epoch": 1829} {"train_loss": -6.190503120422363, "global_step": 76854, "epoch": 1829} {"train_loss": -6.114293098449707, "global_step": 76855, "epoch": 1829} {"train_loss": -6.072661876678467, "global_step": 76856, "epoch": 1829} {"train_loss": -6.16508150100708, "global_step": 76857, "epoch": 1829} {"train_loss": -6.110825061798096, "global_step": 76858, "epoch": 1829} {"train_loss": -6.050829717091152, "global_step": 76859, "epoch": 1829, "val_loss": 75477.1328125} {"train_loss": -6.092914581298828, "global_step": 76860, "epoch": 1830} {"train_loss": -6.065939426422119, "global_step": 76861, "epoch": 1830} {"train_loss": -6.043926239013672, "global_step": 76862, "epoch": 1830} {"train_loss": -6.124881744384766, "global_step": 76863, "epoch": 1830} {"train_loss": -6.097511291503906, "global_step": 76864, "epoch": 1830} {"train_loss": -6.06318998336792, "global_step": 76865, "epoch": 1830} {"train_loss": -6.168778896331787, "global_step": 76866, "epoch": 1830} {"train_loss": -6.118109226226807, "global_step": 76867, "epoch": 1830} {"train_loss": -5.994635581970215, "global_step": 76868, "epoch": 1830} {"train_loss": -6.1646728515625, "global_step": 76869, "epoch": 1830} {"train_loss": -6.177011013031006, "global_step": 76870, "epoch": 1830} {"train_loss": -6.109689712524414, "global_step": 76871, "epoch": 1830} {"train_loss": -6.095947265625, "global_step": 76872, "epoch": 1830} {"train_loss": -6.006170272827148, "global_step": 76873, "epoch": 1830} {"train_loss": -6.053464412689209, "global_step": 76874, "epoch": 1830} {"train_loss": -6.018962383270264, "global_step": 76875, "epoch": 1830} {"train_loss": -5.986850738525391, "global_step": 76876, "epoch": 1830} {"train_loss": -6.078878402709961, "global_step": 76877, "epoch": 1830} {"train_loss": -6.072966575622559, "global_step": 76878, "epoch": 1830} {"train_loss": -6.046214580535889, "global_step": 76879, "epoch": 1830} {"train_loss": -6.138909816741943, "global_step": 76880, "epoch": 1830} {"train_loss": -6.064151763916016, "global_step": 76881, "epoch": 1830} {"train_loss": -6.1117119789123535, "global_step": 76882, "epoch": 1830} {"train_loss": -6.094549179077148, "global_step": 76883, "epoch": 1830} {"train_loss": -5.969655990600586, "global_step": 76884, "epoch": 1830} {"train_loss": -6.0474958419799805, "global_step": 76885, "epoch": 1830} {"train_loss": -6.118841171264648, "global_step": 76886, "epoch": 1830} {"train_loss": -5.921051979064941, "global_step": 76887, "epoch": 1830} {"train_loss": -6.063979625701904, "global_step": 76888, "epoch": 1830} {"train_loss": -6.092791557312012, "global_step": 76889, "epoch": 1830} {"train_loss": -6.073774814605713, "global_step": 76890, "epoch": 1830} {"train_loss": -6.060324192047119, "global_step": 76891, "epoch": 1830} {"train_loss": -6.147036552429199, "global_step": 76892, "epoch": 1830} {"train_loss": -6.095737457275391, "global_step": 76893, "epoch": 1830} {"train_loss": -6.158342361450195, "global_step": 76894, "epoch": 1830} {"train_loss": -5.992303371429443, "global_step": 76895, "epoch": 1830} {"train_loss": -6.16483211517334, "global_step": 76896, "epoch": 1830} {"train_loss": -6.067210674285889, "global_step": 76897, "epoch": 1830} {"train_loss": -6.106851577758789, "global_step": 76898, "epoch": 1830} {"train_loss": -6.1442975997924805, "global_step": 76899, "epoch": 1830} {"train_loss": -6.044897079467773, "global_step": 76900, "epoch": 1830} {"train_loss": -6.082108770098005, "global_step": 76901, "epoch": 1830, "val_loss": 74811.4453125} {"train_loss": -6.176071643829346, "global_step": 76902, "epoch": 1831} {"train_loss": -6.123707294464111, "global_step": 76903, "epoch": 1831} {"train_loss": -6.103683948516846, "global_step": 76904, "epoch": 1831} {"train_loss": -6.160755634307861, "global_step": 76905, "epoch": 1831} {"train_loss": -6.127004623413086, "global_step": 76906, "epoch": 1831} {"train_loss": -6.106354713439941, "global_step": 76907, "epoch": 1831} {"train_loss": -6.066728591918945, "global_step": 76908, "epoch": 1831} {"train_loss": -6.118434906005859, "global_step": 76909, "epoch": 1831} {"train_loss": -6.124179840087891, "global_step": 76910, "epoch": 1831} {"train_loss": -6.146366119384766, "global_step": 76911, "epoch": 1831} {"train_loss": -6.161707878112793, "global_step": 76912, "epoch": 1831} {"train_loss": -5.977972984313965, "global_step": 76913, "epoch": 1831} {"train_loss": -6.070918083190918, "global_step": 76914, "epoch": 1831} {"train_loss": -6.215771198272705, "global_step": 76915, "epoch": 1831} {"train_loss": -6.169826507568359, "global_step": 76916, "epoch": 1831} {"train_loss": -6.1210479736328125, "global_step": 76917, "epoch": 1831} {"train_loss": -6.0497517585754395, "global_step": 76918, "epoch": 1831} {"train_loss": -6.078009128570557, "global_step": 76919, "epoch": 1831} {"train_loss": -6.150423049926758, "global_step": 76920, "epoch": 1831} {"train_loss": -6.145057201385498, "global_step": 76921, "epoch": 1831} {"train_loss": -6.062786102294922, "global_step": 76922, "epoch": 1831} {"train_loss": -6.045836448669434, "global_step": 76923, "epoch": 1831} {"train_loss": -5.9297261238098145, "global_step": 76924, "epoch": 1831} {"train_loss": -6.091615676879883, "global_step": 76925, "epoch": 1831} {"train_loss": -6.102814674377441, "global_step": 76926, "epoch": 1831} {"train_loss": -6.168663024902344, "global_step": 76927, "epoch": 1831} {"train_loss": -6.103979110717773, "global_step": 76928, "epoch": 1831} {"train_loss": -6.040891647338867, "global_step": 76929, "epoch": 1831} {"train_loss": -6.201421737670898, "global_step": 76930, "epoch": 1831} {"train_loss": -6.126615047454834, "global_step": 76931, "epoch": 1831} {"train_loss": -6.150265693664551, "global_step": 76932, "epoch": 1831} {"train_loss": -5.956148147583008, "global_step": 76933, "epoch": 1831} {"train_loss": -6.044096946716309, "global_step": 76934, "epoch": 1831} {"train_loss": -6.070175647735596, "global_step": 76935, "epoch": 1831} {"train_loss": -6.046374320983887, "global_step": 76936, "epoch": 1831} {"train_loss": -6.036102294921875, "global_step": 76937, "epoch": 1831} {"train_loss": -6.0861616134643555, "global_step": 76938, "epoch": 1831} {"train_loss": -6.05185604095459, "global_step": 76939, "epoch": 1831} {"train_loss": -6.095766067504883, "global_step": 76940, "epoch": 1831} {"train_loss": -6.10076904296875, "global_step": 76941, "epoch": 1831} {"train_loss": -6.079291343688965, "global_step": 76942, "epoch": 1831} {"train_loss": -6.0938285532451815, "global_step": 76943, "epoch": 1831, "val_loss": 75027.03125} {"train_loss": -6.009496688842773, "global_step": 76944, "epoch": 1832} {"train_loss": -6.208580017089844, "global_step": 76945, "epoch": 1832} {"train_loss": -6.029636859893799, "global_step": 76946, "epoch": 1832} {"train_loss": -6.114472389221191, "global_step": 76947, "epoch": 1832} {"train_loss": -6.130231857299805, "global_step": 76948, "epoch": 1832} {"train_loss": -6.169647693634033, "global_step": 76949, "epoch": 1832} {"train_loss": -5.999211311340332, "global_step": 76950, "epoch": 1832} {"train_loss": -6.058835029602051, "global_step": 76951, "epoch": 1832} {"train_loss": -6.144227027893066, "global_step": 76952, "epoch": 1832} {"train_loss": -6.02459716796875, "global_step": 76953, "epoch": 1832} {"train_loss": -6.186892032623291, "global_step": 76954, "epoch": 1832} {"train_loss": -5.981781482696533, "global_step": 76955, "epoch": 1832} {"train_loss": -6.056668281555176, "global_step": 76956, "epoch": 1832} {"train_loss": -6.158572196960449, "global_step": 76957, "epoch": 1832} {"train_loss": -6.1065168380737305, "global_step": 76958, "epoch": 1832} {"train_loss": -6.105121612548828, "global_step": 76959, "epoch": 1832} {"train_loss": -5.993264198303223, "global_step": 76960, "epoch": 1832} {"train_loss": -6.113672256469727, "global_step": 76961, "epoch": 1832} {"train_loss": -6.1686248779296875, "global_step": 76962, "epoch": 1832} {"train_loss": -6.135868072509766, "global_step": 76963, "epoch": 1832} {"train_loss": -6.067719459533691, "global_step": 76964, "epoch": 1832} {"train_loss": -6.163595199584961, "global_step": 76965, "epoch": 1832} {"train_loss": -6.135619163513184, "global_step": 76966, "epoch": 1832} {"train_loss": -6.121150016784668, "global_step": 76967, "epoch": 1832} {"train_loss": -6.129078388214111, "global_step": 76968, "epoch": 1832} {"train_loss": -6.063430309295654, "global_step": 76969, "epoch": 1832} {"train_loss": -6.153077125549316, "global_step": 76970, "epoch": 1832} {"train_loss": -6.132006645202637, "global_step": 76971, "epoch": 1832} {"train_loss": -6.1537933349609375, "global_step": 76972, "epoch": 1832} {"train_loss": -6.0607829093933105, "global_step": 76973, "epoch": 1832} {"train_loss": -5.98423957824707, "global_step": 76974, "epoch": 1832} {"train_loss": -6.019365310668945, "global_step": 76975, "epoch": 1832} {"train_loss": -5.989511013031006, "global_step": 76976, "epoch": 1832} {"train_loss": -6.101798057556152, "global_step": 76977, "epoch": 1832} {"train_loss": -6.056096076965332, "global_step": 76978, "epoch": 1832} {"train_loss": -6.092489719390869, "global_step": 76979, "epoch": 1832} {"train_loss": -6.147518634796143, "global_step": 76980, "epoch": 1832} {"train_loss": -6.125122547149658, "global_step": 76981, "epoch": 1832} {"train_loss": -6.109965801239014, "global_step": 76982, "epoch": 1832} {"train_loss": -6.0796003341674805, "global_step": 76983, "epoch": 1832} {"train_loss": -6.112839698791504, "global_step": 76984, "epoch": 1832} {"train_loss": -6.095943269275484, "global_step": 76985, "epoch": 1832, "val_loss": 75325.6015625} {"train_loss": -5.980250835418701, "global_step": 76986, "epoch": 1833} {"train_loss": -6.092365264892578, "global_step": 76987, "epoch": 1833} {"train_loss": -6.087662696838379, "global_step": 76988, "epoch": 1833} {"train_loss": -6.115231037139893, "global_step": 76989, "epoch": 1833} {"train_loss": -6.170602321624756, "global_step": 76990, "epoch": 1833} {"train_loss": -6.174905300140381, "global_step": 76991, "epoch": 1833} {"train_loss": -6.0084052085876465, "global_step": 76992, "epoch": 1833} {"train_loss": -6.13460636138916, "global_step": 76993, "epoch": 1833} {"train_loss": -6.008697986602783, "global_step": 76994, "epoch": 1833} {"train_loss": -6.045580863952637, "global_step": 76995, "epoch": 1833} {"train_loss": -6.113692283630371, "global_step": 76996, "epoch": 1833} {"train_loss": -6.099925518035889, "global_step": 76997, "epoch": 1833} {"train_loss": -5.988369941711426, "global_step": 76998, "epoch": 1833} {"train_loss": -5.979778289794922, "global_step": 76999, "epoch": 1833} {"train_loss": -6.209882736206055, "global_step": 77000, "epoch": 1833} {"train_loss": -5.978600025177002, "global_step": 77001, "epoch": 1833} {"train_loss": -6.197842597961426, "global_step": 77002, "epoch": 1833} {"train_loss": -6.162239074707031, "global_step": 77003, "epoch": 1833} {"train_loss": -6.200780868530273, "global_step": 77004, "epoch": 1833} {"train_loss": -6.057589530944824, "global_step": 77005, "epoch": 1833} {"train_loss": -6.124472618103027, "global_step": 77006, "epoch": 1833} {"train_loss": -6.117654800415039, "global_step": 77007, "epoch": 1833} {"train_loss": -6.079143047332764, "global_step": 77008, "epoch": 1833} {"train_loss": -6.045316696166992, "global_step": 77009, "epoch": 1833} {"train_loss": -6.107019424438477, "global_step": 77010, "epoch": 1833} {"train_loss": -6.078032493591309, "global_step": 77011, "epoch": 1833} {"train_loss": -5.964663505554199, "global_step": 77012, "epoch": 1833} {"train_loss": -6.037693023681641, "global_step": 77013, "epoch": 1833} {"train_loss": -6.0148468017578125, "global_step": 77014, "epoch": 1833} {"train_loss": -6.063952445983887, "global_step": 77015, "epoch": 1833} {"train_loss": -6.050373554229736, "global_step": 77016, "epoch": 1833} {"train_loss": -6.053800582885742, "global_step": 77017, "epoch": 1833} {"train_loss": -5.962859630584717, "global_step": 77018, "epoch": 1833} {"train_loss": -6.090597152709961, "global_step": 77019, "epoch": 1833} {"train_loss": -5.856640338897705, "global_step": 77020, "epoch": 1833} {"train_loss": -6.095165252685547, "global_step": 77021, "epoch": 1833} {"train_loss": -6.056454658508301, "global_step": 77022, "epoch": 1833} {"train_loss": -6.026309967041016, "global_step": 77023, "epoch": 1833} {"train_loss": -6.13724422454834, "global_step": 77024, "epoch": 1833} {"train_loss": -5.985262393951416, "global_step": 77025, "epoch": 1833} {"train_loss": -6.153092384338379, "global_step": 77026, "epoch": 1833} {"train_loss": -6.070584115527925, "global_step": 77027, "epoch": 1833, "val_loss": 74982.5625} {"train_loss": -6.030295372009277, "global_step": 77028, "epoch": 1834} {"train_loss": -5.964896202087402, "global_step": 77029, "epoch": 1834} {"train_loss": -6.101571083068848, "global_step": 77030, "epoch": 1834} {"train_loss": -6.038105010986328, "global_step": 77031, "epoch": 1834} {"train_loss": -6.122162818908691, "global_step": 77032, "epoch": 1834} {"train_loss": -6.197983741760254, "global_step": 77033, "epoch": 1834} {"train_loss": -6.189640998840332, "global_step": 77034, "epoch": 1834} {"train_loss": -6.110038757324219, "global_step": 77035, "epoch": 1834} {"train_loss": -6.146256446838379, "global_step": 77036, "epoch": 1834} {"train_loss": -6.119085311889648, "global_step": 77037, "epoch": 1834} {"train_loss": -6.09249210357666, "global_step": 77038, "epoch": 1834} {"train_loss": -6.099420547485352, "global_step": 77039, "epoch": 1834} {"train_loss": -6.082043647766113, "global_step": 77040, "epoch": 1834} {"train_loss": -6.081070899963379, "global_step": 77041, "epoch": 1834} {"train_loss": -5.919408798217773, "global_step": 77042, "epoch": 1834} {"train_loss": -6.044291019439697, "global_step": 77043, "epoch": 1834} {"train_loss": -5.945891380310059, "global_step": 77044, "epoch": 1834} {"train_loss": -5.978691577911377, "global_step": 77045, "epoch": 1834} {"train_loss": -6.168620586395264, "global_step": 77046, "epoch": 1834} {"train_loss": -6.038076400756836, "global_step": 77047, "epoch": 1834} {"train_loss": -5.968628883361816, "global_step": 77048, "epoch": 1834} {"train_loss": -6.125339508056641, "global_step": 77049, "epoch": 1834} {"train_loss": -6.000321865081787, "global_step": 77050, "epoch": 1834} {"train_loss": -5.8587236404418945, "global_step": 77051, "epoch": 1834} {"train_loss": -6.12724494934082, "global_step": 77052, "epoch": 1834} {"train_loss": -6.112619400024414, "global_step": 77053, "epoch": 1834} {"train_loss": -6.095309257507324, "global_step": 77054, "epoch": 1834} {"train_loss": -6.032386779785156, "global_step": 77055, "epoch": 1834} {"train_loss": -5.964799880981445, "global_step": 77056, "epoch": 1834} {"train_loss": -6.167367935180664, "global_step": 77057, "epoch": 1834} {"train_loss": -6.087217330932617, "global_step": 77058, "epoch": 1834} {"train_loss": -6.092437744140625, "global_step": 77059, "epoch": 1834} {"train_loss": -6.176803112030029, "global_step": 77060, "epoch": 1834} {"train_loss": -5.974322319030762, "global_step": 77061, "epoch": 1834} {"train_loss": -6.13885498046875, "global_step": 77062, "epoch": 1834} {"train_loss": -6.1051411628723145, "global_step": 77063, "epoch": 1834} {"train_loss": -5.958834648132324, "global_step": 77064, "epoch": 1834} {"train_loss": -6.013652324676514, "global_step": 77065, "epoch": 1834} {"train_loss": -6.091454982757568, "global_step": 77066, "epoch": 1834} {"train_loss": -6.102790355682373, "global_step": 77067, "epoch": 1834} {"train_loss": -6.080242156982422, "global_step": 77068, "epoch": 1834} {"train_loss": -6.066477117084322, "global_step": 77069, "epoch": 1834, "val_loss": 74774.71875} {"train_loss": -6.146240234375, "global_step": 77070, "epoch": 1835} {"train_loss": -6.095134735107422, "global_step": 77071, "epoch": 1835} {"train_loss": -6.041008949279785, "global_step": 77072, "epoch": 1835} {"train_loss": -6.060846328735352, "global_step": 77073, "epoch": 1835} {"train_loss": -6.045815467834473, "global_step": 77074, "epoch": 1835} {"train_loss": -6.0052032470703125, "global_step": 77075, "epoch": 1835} {"train_loss": -6.057360649108887, "global_step": 77076, "epoch": 1835} {"train_loss": -6.29341983795166, "global_step": 77077, "epoch": 1835} {"train_loss": -6.084693908691406, "global_step": 77078, "epoch": 1835} {"train_loss": -5.999181747436523, "global_step": 77079, "epoch": 1835} {"train_loss": -5.993016242980957, "global_step": 77080, "epoch": 1835} {"train_loss": -6.157708168029785, "global_step": 77081, "epoch": 1835} {"train_loss": -6.1033453941345215, "global_step": 77082, "epoch": 1835} {"train_loss": -6.074974536895752, "global_step": 77083, "epoch": 1835} {"train_loss": -6.087191104888916, "global_step": 77084, "epoch": 1835} {"train_loss": -6.035763263702393, "global_step": 77085, "epoch": 1835} {"train_loss": -5.996155261993408, "global_step": 77086, "epoch": 1835} {"train_loss": -6.084368705749512, "global_step": 77087, "epoch": 1835} {"train_loss": -6.050292015075684, "global_step": 77088, "epoch": 1835} {"train_loss": -6.121116638183594, "global_step": 77089, "epoch": 1835} {"train_loss": -6.181164741516113, "global_step": 77090, "epoch": 1835} {"train_loss": -6.031907081604004, "global_step": 77091, "epoch": 1835} {"train_loss": -6.080971717834473, "global_step": 77092, "epoch": 1835} {"train_loss": -6.035802841186523, "global_step": 77093, "epoch": 1835} {"train_loss": -6.054384231567383, "global_step": 77094, "epoch": 1835} {"train_loss": -6.156403064727783, "global_step": 77095, "epoch": 1835} {"train_loss": -6.062687873840332, "global_step": 77096, "epoch": 1835} {"train_loss": -6.196689605712891, "global_step": 77097, "epoch": 1835} {"train_loss": -6.140684127807617, "global_step": 77098, "epoch": 1835} {"train_loss": -6.063389778137207, "global_step": 77099, "epoch": 1835} {"train_loss": -6.024634838104248, "global_step": 77100, "epoch": 1835} {"train_loss": -6.003506660461426, "global_step": 77101, "epoch": 1835} {"train_loss": -6.095155715942383, "global_step": 77102, "epoch": 1835} {"train_loss": -6.104012966156006, "global_step": 77103, "epoch": 1835} {"train_loss": -6.118365287780762, "global_step": 77104, "epoch": 1835} {"train_loss": -6.178474426269531, "global_step": 77105, "epoch": 1835} {"train_loss": -6.072179794311523, "global_step": 77106, "epoch": 1835} {"train_loss": -6.227660655975342, "global_step": 77107, "epoch": 1835} {"train_loss": -5.977319240570068, "global_step": 77108, "epoch": 1835} {"train_loss": -5.920919418334961, "global_step": 77109, "epoch": 1835} {"train_loss": -6.177114963531494, "global_step": 77110, "epoch": 1835} {"train_loss": -6.086560987290882, "global_step": 77111, "epoch": 1835, "val_loss": 75461.0546875} {"train_loss": -6.033370494842529, "global_step": 77112, "epoch": 1836} {"train_loss": -6.159425735473633, "global_step": 77113, "epoch": 1836} {"train_loss": -5.980829238891602, "global_step": 77114, "epoch": 1836} {"train_loss": -6.034193992614746, "global_step": 77115, "epoch": 1836} {"train_loss": -6.161323547363281, "global_step": 77116, "epoch": 1836} {"train_loss": -5.946828842163086, "global_step": 77117, "epoch": 1836} {"train_loss": -6.023922443389893, "global_step": 77118, "epoch": 1836} {"train_loss": -6.1799702644348145, "global_step": 77119, "epoch": 1836} {"train_loss": -5.977862358093262, "global_step": 77120, "epoch": 1836} {"train_loss": -6.115765571594238, "global_step": 77121, "epoch": 1836} {"train_loss": -6.016952037811279, "global_step": 77122, "epoch": 1836} {"train_loss": -6.176664352416992, "global_step": 77123, "epoch": 1836} {"train_loss": -6.039763927459717, "global_step": 77124, "epoch": 1836} {"train_loss": -6.014049053192139, "global_step": 77125, "epoch": 1836} {"train_loss": -6.072274208068848, "global_step": 77126, "epoch": 1836} {"train_loss": -5.912362098693848, "global_step": 77127, "epoch": 1836} {"train_loss": -6.137218952178955, "global_step": 77128, "epoch": 1836} {"train_loss": -6.0822343826293945, "global_step": 77129, "epoch": 1836} {"train_loss": -6.15949821472168, "global_step": 77130, "epoch": 1836} {"train_loss": -6.0065717697143555, "global_step": 77131, "epoch": 1836} {"train_loss": -6.118219375610352, "global_step": 77132, "epoch": 1836} {"train_loss": -6.068210124969482, "global_step": 77133, "epoch": 1836} {"train_loss": -5.999839782714844, "global_step": 77134, "epoch": 1836} {"train_loss": -6.03306245803833, "global_step": 77135, "epoch": 1836} {"train_loss": -6.117085933685303, "global_step": 77136, "epoch": 1836} {"train_loss": -6.175331115722656, "global_step": 77137, "epoch": 1836} {"train_loss": -6.089291572570801, "global_step": 77138, "epoch": 1836} {"train_loss": -6.303765296936035, "global_step": 77139, "epoch": 1836} {"train_loss": -6.102235794067383, "global_step": 77140, "epoch": 1836} {"train_loss": -6.237815856933594, "global_step": 77141, "epoch": 1836} {"train_loss": -6.095545768737793, "global_step": 77142, "epoch": 1836} {"train_loss": -6.1615447998046875, "global_step": 77143, "epoch": 1836} {"train_loss": -6.079291343688965, "global_step": 77144, "epoch": 1836} {"train_loss": -6.091283321380615, "global_step": 77145, "epoch": 1836} {"train_loss": -6.055865287780762, "global_step": 77146, "epoch": 1836} {"train_loss": -6.241330146789551, "global_step": 77147, "epoch": 1836} {"train_loss": -6.018959999084473, "global_step": 77148, "epoch": 1836} {"train_loss": -6.042516231536865, "global_step": 77149, "epoch": 1836} {"train_loss": -6.1268181800842285, "global_step": 77150, "epoch": 1836} {"train_loss": -6.201021671295166, "global_step": 77151, "epoch": 1836} {"train_loss": -6.130043983459473, "global_step": 77152, "epoch": 1836} {"train_loss": -6.089035374777658, "global_step": 77153, "epoch": 1836, "val_loss": 75162.828125} {"train_loss": -6.0615363121032715, "global_step": 77154, "epoch": 1837} {"train_loss": -6.234611511230469, "global_step": 77155, "epoch": 1837} {"train_loss": -6.057182788848877, "global_step": 77156, "epoch": 1837} {"train_loss": -6.126034736633301, "global_step": 77157, "epoch": 1837} {"train_loss": -6.0816264152526855, "global_step": 77158, "epoch": 1837} {"train_loss": -6.134532451629639, "global_step": 77159, "epoch": 1837} {"train_loss": -6.117165565490723, "global_step": 77160, "epoch": 1837} {"train_loss": -6.1112565994262695, "global_step": 77161, "epoch": 1837} {"train_loss": -6.238088130950928, "global_step": 77162, "epoch": 1837} {"train_loss": -6.164659023284912, "global_step": 77163, "epoch": 1837} {"train_loss": -6.168609619140625, "global_step": 77164, "epoch": 1837} {"train_loss": -6.040219306945801, "global_step": 77165, "epoch": 1837} {"train_loss": -6.1079230308532715, "global_step": 77166, "epoch": 1837} {"train_loss": -6.16534423828125, "global_step": 77167, "epoch": 1837} {"train_loss": -6.081469535827637, "global_step": 77168, "epoch": 1837} {"train_loss": -6.1773858070373535, "global_step": 77169, "epoch": 1837} {"train_loss": -6.176713943481445, "global_step": 77170, "epoch": 1837} {"train_loss": -6.111020088195801, "global_step": 77171, "epoch": 1837} {"train_loss": -6.095993518829346, "global_step": 77172, "epoch": 1837} {"train_loss": -6.146127223968506, "global_step": 77173, "epoch": 1837} {"train_loss": -6.021027565002441, "global_step": 77174, "epoch": 1837} {"train_loss": -6.103496551513672, "global_step": 77175, "epoch": 1837} {"train_loss": -5.960241317749023, "global_step": 77176, "epoch": 1837} {"train_loss": -6.039609909057617, "global_step": 77177, "epoch": 1837} {"train_loss": -6.162240028381348, "global_step": 77178, "epoch": 1837} {"train_loss": -6.082304000854492, "global_step": 77179, "epoch": 1837} {"train_loss": -6.06738805770874, "global_step": 77180, "epoch": 1837} {"train_loss": -6.049510955810547, "global_step": 77181, "epoch": 1837} {"train_loss": -6.1213788986206055, "global_step": 77182, "epoch": 1837} {"train_loss": -5.977603912353516, "global_step": 77183, "epoch": 1837} {"train_loss": -6.120846748352051, "global_step": 77184, "epoch": 1837} {"train_loss": -6.221890449523926, "global_step": 77185, "epoch": 1837} {"train_loss": -6.0510358810424805, "global_step": 77186, "epoch": 1837} {"train_loss": -6.193093776702881, "global_step": 77187, "epoch": 1837} {"train_loss": -6.132071495056152, "global_step": 77188, "epoch": 1837} {"train_loss": -6.067097187042236, "global_step": 77189, "epoch": 1837} {"train_loss": -6.118526935577393, "global_step": 77190, "epoch": 1837} {"train_loss": -6.083565711975098, "global_step": 77191, "epoch": 1837} {"train_loss": -6.124448299407959, "global_step": 77192, "epoch": 1837} {"train_loss": -6.031479835510254, "global_step": 77193, "epoch": 1837} {"train_loss": -6.099776268005371, "global_step": 77194, "epoch": 1837} {"train_loss": -6.109239952904837, "global_step": 77195, "epoch": 1837, "val_loss": 74900.375} {"train_loss": -6.214808464050293, "global_step": 77196, "epoch": 1838} {"train_loss": -6.156583786010742, "global_step": 77197, "epoch": 1838} {"train_loss": -6.289233207702637, "global_step": 77198, "epoch": 1838} {"train_loss": -6.121736526489258, "global_step": 77199, "epoch": 1838} {"train_loss": -6.111148834228516, "global_step": 77200, "epoch": 1838} {"train_loss": -6.121362686157227, "global_step": 77201, "epoch": 1838} {"train_loss": -6.170156478881836, "global_step": 77202, "epoch": 1838} {"train_loss": -6.201777935028076, "global_step": 77203, "epoch": 1838} {"train_loss": -6.144256591796875, "global_step": 77204, "epoch": 1838} {"train_loss": -6.159786701202393, "global_step": 77205, "epoch": 1838} {"train_loss": -6.127842426300049, "global_step": 77206, "epoch": 1838} {"train_loss": -6.12652587890625, "global_step": 77207, "epoch": 1838} {"train_loss": -6.149849891662598, "global_step": 77208, "epoch": 1838} {"train_loss": -6.1447343826293945, "global_step": 77209, "epoch": 1838} {"train_loss": -6.012357711791992, "global_step": 77210, "epoch": 1838} {"train_loss": -6.196664810180664, "global_step": 77211, "epoch": 1838} {"train_loss": -6.1203813552856445, "global_step": 77212, "epoch": 1838} {"train_loss": -6.15083122253418, "global_step": 77213, "epoch": 1838} {"train_loss": -6.145632743835449, "global_step": 77214, "epoch": 1838} {"train_loss": -6.097939491271973, "global_step": 77215, "epoch": 1838} {"train_loss": -6.009995460510254, "global_step": 77216, "epoch": 1838} {"train_loss": -6.028769493103027, "global_step": 77217, "epoch": 1838} {"train_loss": -6.146518230438232, "global_step": 77218, "epoch": 1838} {"train_loss": -6.098196029663086, "global_step": 77219, "epoch": 1838} {"train_loss": -6.128854751586914, "global_step": 77220, "epoch": 1838} {"train_loss": -6.00126838684082, "global_step": 77221, "epoch": 1838} {"train_loss": -6.13397741317749, "global_step": 77222, "epoch": 1838} {"train_loss": -6.13514518737793, "global_step": 77223, "epoch": 1838} {"train_loss": -6.0572004318237305, "global_step": 77224, "epoch": 1838} {"train_loss": -6.003684043884277, "global_step": 77225, "epoch": 1838} {"train_loss": -6.006734848022461, "global_step": 77226, "epoch": 1838} {"train_loss": -6.111759185791016, "global_step": 77227, "epoch": 1838} {"train_loss": -6.179311752319336, "global_step": 77228, "epoch": 1838} {"train_loss": -6.123812198638916, "global_step": 77229, "epoch": 1838} {"train_loss": -5.960062026977539, "global_step": 77230, "epoch": 1838} {"train_loss": -6.015439033508301, "global_step": 77231, "epoch": 1838} {"train_loss": -5.976321220397949, "global_step": 77232, "epoch": 1838} {"train_loss": -6.034998893737793, "global_step": 77233, "epoch": 1838} {"train_loss": -6.132805824279785, "global_step": 77234, "epoch": 1838} {"train_loss": -6.04798698425293, "global_step": 77235, "epoch": 1838} {"train_loss": -6.060493469238281, "global_step": 77236, "epoch": 1838} {"train_loss": -6.103000550043015, "global_step": 77237, "epoch": 1838, "val_loss": 74711.4375} {"train_loss": -6.187383651733398, "global_step": 77238, "epoch": 1839} {"train_loss": -6.083270072937012, "global_step": 77239, "epoch": 1839} {"train_loss": -6.173089981079102, "global_step": 77240, "epoch": 1839} {"train_loss": -6.143674373626709, "global_step": 77241, "epoch": 1839} {"train_loss": -5.987928867340088, "global_step": 77242, "epoch": 1839} {"train_loss": -5.946657657623291, "global_step": 77243, "epoch": 1839} {"train_loss": -6.009200572967529, "global_step": 77244, "epoch": 1839} {"train_loss": -6.171463489532471, "global_step": 77245, "epoch": 1839} {"train_loss": -6.149998664855957, "global_step": 77246, "epoch": 1839} {"train_loss": -6.109989166259766, "global_step": 77247, "epoch": 1839} {"train_loss": -6.059434413909912, "global_step": 77248, "epoch": 1839} {"train_loss": -6.195917129516602, "global_step": 77249, "epoch": 1839} {"train_loss": -6.109151363372803, "global_step": 77250, "epoch": 1839} {"train_loss": -6.157513618469238, "global_step": 77251, "epoch": 1839} {"train_loss": -6.00093412399292, "global_step": 77252, "epoch": 1839} {"train_loss": -6.143317222595215, "global_step": 77253, "epoch": 1839} {"train_loss": -6.128063678741455, "global_step": 77254, "epoch": 1839} {"train_loss": -6.012768745422363, "global_step": 77255, "epoch": 1839} {"train_loss": -6.257875442504883, "global_step": 77256, "epoch": 1839} {"train_loss": -6.332920074462891, "global_step": 77257, "epoch": 1839} {"train_loss": -6.201785087585449, "global_step": 77258, "epoch": 1839} {"train_loss": -6.068112373352051, "global_step": 77259, "epoch": 1839} {"train_loss": -6.169844150543213, "global_step": 77260, "epoch": 1839} {"train_loss": -6.098110198974609, "global_step": 77261, "epoch": 1839} {"train_loss": -6.119103908538818, "global_step": 77262, "epoch": 1839} {"train_loss": -6.0867462158203125, "global_step": 77263, "epoch": 1839} {"train_loss": -6.039811134338379, "global_step": 77264, "epoch": 1839} {"train_loss": -6.140143394470215, "global_step": 77265, "epoch": 1839} {"train_loss": -6.037964344024658, "global_step": 77266, "epoch": 1839} {"train_loss": -6.014713764190674, "global_step": 77267, "epoch": 1839} {"train_loss": -6.094856262207031, "global_step": 77268, "epoch": 1839} {"train_loss": -6.179086685180664, "global_step": 77269, "epoch": 1839} {"train_loss": -6.077732086181641, "global_step": 77270, "epoch": 1839} {"train_loss": -6.038066387176514, "global_step": 77271, "epoch": 1839} {"train_loss": -6.1261491775512695, "global_step": 77272, "epoch": 1839} {"train_loss": -6.035768508911133, "global_step": 77273, "epoch": 1839} {"train_loss": -6.016110420227051, "global_step": 77274, "epoch": 1839} {"train_loss": -6.127760887145996, "global_step": 77275, "epoch": 1839} {"train_loss": -6.02284049987793, "global_step": 77276, "epoch": 1839} {"train_loss": -6.158360004425049, "global_step": 77277, "epoch": 1839} {"train_loss": -6.115828514099121, "global_step": 77278, "epoch": 1839} {"train_loss": -6.105832451865787, "global_step": 77279, "epoch": 1839, "val_loss": 74955.2109375} {"train_loss": -6.115077972412109, "global_step": 77280, "epoch": 1840} {"train_loss": -6.006358623504639, "global_step": 77281, "epoch": 1840} {"train_loss": -6.155783176422119, "global_step": 77282, "epoch": 1840} {"train_loss": -6.11332893371582, "global_step": 77283, "epoch": 1840} {"train_loss": -6.1529154777526855, "global_step": 77284, "epoch": 1840} {"train_loss": -6.07735538482666, "global_step": 77285, "epoch": 1840} {"train_loss": -6.067102909088135, "global_step": 77286, "epoch": 1840} {"train_loss": -6.10734748840332, "global_step": 77287, "epoch": 1840} {"train_loss": -6.121501922607422, "global_step": 77288, "epoch": 1840} {"train_loss": -6.075725555419922, "global_step": 77289, "epoch": 1840} {"train_loss": -6.003635406494141, "global_step": 77290, "epoch": 1840} {"train_loss": -6.06712532043457, "global_step": 77291, "epoch": 1840} {"train_loss": -6.157305717468262, "global_step": 77292, "epoch": 1840} {"train_loss": -6.049821376800537, "global_step": 77293, "epoch": 1840} {"train_loss": -6.111142158508301, "global_step": 77294, "epoch": 1840} {"train_loss": -6.182912826538086, "global_step": 77295, "epoch": 1840} {"train_loss": -6.079297065734863, "global_step": 77296, "epoch": 1840} {"train_loss": -6.106390476226807, "global_step": 77297, "epoch": 1840} {"train_loss": -6.017423629760742, "global_step": 77298, "epoch": 1840} {"train_loss": -5.9487624168396, "global_step": 77299, "epoch": 1840} {"train_loss": -6.064155578613281, "global_step": 77300, "epoch": 1840} {"train_loss": -6.022010803222656, "global_step": 77301, "epoch": 1840} {"train_loss": -6.074395179748535, "global_step": 77302, "epoch": 1840} {"train_loss": -6.147855281829834, "global_step": 77303, "epoch": 1840} {"train_loss": -6.1924896240234375, "global_step": 77304, "epoch": 1840} {"train_loss": -6.041468620300293, "global_step": 77305, "epoch": 1840} {"train_loss": -6.134953498840332, "global_step": 77306, "epoch": 1840} {"train_loss": -6.042013645172119, "global_step": 77307, "epoch": 1840} {"train_loss": -6.21501350402832, "global_step": 77308, "epoch": 1840} {"train_loss": -6.130751609802246, "global_step": 77309, "epoch": 1840} {"train_loss": -6.055074691772461, "global_step": 77310, "epoch": 1840} {"train_loss": -6.071839809417725, "global_step": 77311, "epoch": 1840} {"train_loss": -6.234838008880615, "global_step": 77312, "epoch": 1840} {"train_loss": -6.05259895324707, "global_step": 77313, "epoch": 1840} {"train_loss": -6.081759452819824, "global_step": 77314, "epoch": 1840} {"train_loss": -6.146293640136719, "global_step": 77315, "epoch": 1840} {"train_loss": -6.08952522277832, "global_step": 77316, "epoch": 1840} {"train_loss": -6.134925842285156, "global_step": 77317, "epoch": 1840} {"train_loss": -6.103150367736816, "global_step": 77318, "epoch": 1840} {"train_loss": -6.155548572540283, "global_step": 77319, "epoch": 1840} {"train_loss": -6.100596904754639, "global_step": 77320, "epoch": 1840} {"train_loss": -6.10020433153425, "global_step": 77321, "epoch": 1840, "val_loss": 75096.8984375} {"train_loss": -6.1296539306640625, "global_step": 77322, "epoch": 1841} {"train_loss": -6.060094833374023, "global_step": 77323, "epoch": 1841} {"train_loss": -6.1338653564453125, "global_step": 77324, "epoch": 1841} {"train_loss": -6.109689235687256, "global_step": 77325, "epoch": 1841} {"train_loss": -6.1174516677856445, "global_step": 77326, "epoch": 1841} {"train_loss": -6.098706245422363, "global_step": 77327, "epoch": 1841} {"train_loss": -6.271622657775879, "global_step": 77328, "epoch": 1841} {"train_loss": -6.015774726867676, "global_step": 77329, "epoch": 1841} {"train_loss": -6.020969867706299, "global_step": 77330, "epoch": 1841} {"train_loss": -6.211214065551758, "global_step": 77331, "epoch": 1841} {"train_loss": -6.134737968444824, "global_step": 77332, "epoch": 1841} {"train_loss": -6.149326324462891, "global_step": 77333, "epoch": 1841} {"train_loss": -6.007341384887695, "global_step": 77334, "epoch": 1841} {"train_loss": -6.235813140869141, "global_step": 77335, "epoch": 1841} {"train_loss": -6.084338665008545, "global_step": 77336, "epoch": 1841} {"train_loss": -5.992624759674072, "global_step": 77337, "epoch": 1841} {"train_loss": -6.093367576599121, "global_step": 77338, "epoch": 1841} {"train_loss": -6.082036018371582, "global_step": 77339, "epoch": 1841} {"train_loss": -6.094132423400879, "global_step": 77340, "epoch": 1841} {"train_loss": -6.145978927612305, "global_step": 77341, "epoch": 1841} {"train_loss": -6.015957355499268, "global_step": 77342, "epoch": 1841} {"train_loss": -6.126019477844238, "global_step": 77343, "epoch": 1841} {"train_loss": -6.14984130859375, "global_step": 77344, "epoch": 1841} {"train_loss": -6.175110816955566, "global_step": 77345, "epoch": 1841} {"train_loss": -6.150207996368408, "global_step": 77346, "epoch": 1841} {"train_loss": -6.055814743041992, "global_step": 77347, "epoch": 1841} {"train_loss": -6.039215087890625, "global_step": 77348, "epoch": 1841} {"train_loss": -6.145157814025879, "global_step": 77349, "epoch": 1841} {"train_loss": -6.086815357208252, "global_step": 77350, "epoch": 1841} {"train_loss": -6.1666388511657715, "global_step": 77351, "epoch": 1841} {"train_loss": -6.101574420928955, "global_step": 77352, "epoch": 1841} {"train_loss": -5.909743309020996, "global_step": 77353, "epoch": 1841} {"train_loss": -6.0701985359191895, "global_step": 77354, "epoch": 1841} {"train_loss": -6.162235260009766, "global_step": 77355, "epoch": 1841} {"train_loss": -6.176760673522949, "global_step": 77356, "epoch": 1841} {"train_loss": -6.074649333953857, "global_step": 77357, "epoch": 1841} {"train_loss": -6.101533889770508, "global_step": 77358, "epoch": 1841} {"train_loss": -6.042421340942383, "global_step": 77359, "epoch": 1841} {"train_loss": -6.148519515991211, "global_step": 77360, "epoch": 1841} {"train_loss": -6.072719573974609, "global_step": 77361, "epoch": 1841} {"train_loss": -6.1090826988220215, "global_step": 77362, "epoch": 1841} {"train_loss": -6.106095189139957, "global_step": 77363, "epoch": 1841, "val_loss": 75122.484375} {"train_loss": -6.155574798583984, "global_step": 77364, "epoch": 1842} {"train_loss": -6.1128973960876465, "global_step": 77365, "epoch": 1842} {"train_loss": -6.072633743286133, "global_step": 77366, "epoch": 1842} {"train_loss": -6.127405166625977, "global_step": 77367, "epoch": 1842} {"train_loss": -6.112459659576416, "global_step": 77368, "epoch": 1842} {"train_loss": -6.042557239532471, "global_step": 77369, "epoch": 1842} {"train_loss": -6.164732933044434, "global_step": 77370, "epoch": 1842} {"train_loss": -6.242739677429199, "global_step": 77371, "epoch": 1842} {"train_loss": -6.084627151489258, "global_step": 77372, "epoch": 1842} {"train_loss": -6.106267929077148, "global_step": 77373, "epoch": 1842} {"train_loss": -6.247281074523926, "global_step": 77374, "epoch": 1842} {"train_loss": -6.1444549560546875, "global_step": 77375, "epoch": 1842} {"train_loss": -6.100949287414551, "global_step": 77376, "epoch": 1842} {"train_loss": -6.209485054016113, "global_step": 77377, "epoch": 1842} {"train_loss": -6.127222061157227, "global_step": 77378, "epoch": 1842} {"train_loss": -6.0193190574646, "global_step": 77379, "epoch": 1842} {"train_loss": -6.119861125946045, "global_step": 77380, "epoch": 1842} {"train_loss": -6.093074798583984, "global_step": 77381, "epoch": 1842} {"train_loss": -6.059453964233398, "global_step": 77382, "epoch": 1842} {"train_loss": -6.080783843994141, "global_step": 77383, "epoch": 1842} {"train_loss": -6.081050872802734, "global_step": 77384, "epoch": 1842} {"train_loss": -6.133622169494629, "global_step": 77385, "epoch": 1842} {"train_loss": -6.090176582336426, "global_step": 77386, "epoch": 1842} {"train_loss": -5.990942001342773, "global_step": 77387, "epoch": 1842} {"train_loss": -6.108498573303223, "global_step": 77388, "epoch": 1842} {"train_loss": -6.080527305603027, "global_step": 77389, "epoch": 1842} {"train_loss": -6.136574745178223, "global_step": 77390, "epoch": 1842} {"train_loss": -6.2059431076049805, "global_step": 77391, "epoch": 1842} {"train_loss": -6.085494041442871, "global_step": 77392, "epoch": 1842} {"train_loss": -6.236454486846924, "global_step": 77393, "epoch": 1842} {"train_loss": -6.111362457275391, "global_step": 77394, "epoch": 1842} {"train_loss": -6.0148749351501465, "global_step": 77395, "epoch": 1842} {"train_loss": -6.20751428604126, "global_step": 77396, "epoch": 1842} {"train_loss": -6.008769989013672, "global_step": 77397, "epoch": 1842} {"train_loss": -6.099788188934326, "global_step": 77398, "epoch": 1842} {"train_loss": -6.081529140472412, "global_step": 77399, "epoch": 1842} {"train_loss": -6.079833984375, "global_step": 77400, "epoch": 1842} {"train_loss": -6.225156307220459, "global_step": 77401, "epoch": 1842} {"train_loss": -6.094468116760254, "global_step": 77402, "epoch": 1842} {"train_loss": -6.10572624206543, "global_step": 77403, "epoch": 1842} {"train_loss": -6.034947872161865, "global_step": 77404, "epoch": 1842} {"train_loss": -6.116413854417347, "global_step": 77405, "epoch": 1842, "val_loss": 74760.125} {"train_loss": -6.108363151550293, "global_step": 77406, "epoch": 1843} {"train_loss": -6.023612976074219, "global_step": 77407, "epoch": 1843} {"train_loss": -6.142813682556152, "global_step": 77408, "epoch": 1843} {"train_loss": -6.113175868988037, "global_step": 77409, "epoch": 1843} {"train_loss": -6.193815231323242, "global_step": 77410, "epoch": 1843} {"train_loss": -6.18170166015625, "global_step": 77411, "epoch": 1843} {"train_loss": -6.191832065582275, "global_step": 77412, "epoch": 1843} {"train_loss": -6.17751407623291, "global_step": 77413, "epoch": 1843} {"train_loss": -6.072988033294678, "global_step": 77414, "epoch": 1843} {"train_loss": -6.095898628234863, "global_step": 77415, "epoch": 1843} {"train_loss": -6.072003364562988, "global_step": 77416, "epoch": 1843} {"train_loss": -6.034096717834473, "global_step": 77417, "epoch": 1843} {"train_loss": -6.165478706359863, "global_step": 77418, "epoch": 1843} {"train_loss": -6.086483001708984, "global_step": 77419, "epoch": 1843} {"train_loss": -6.081794738769531, "global_step": 77420, "epoch": 1843} {"train_loss": -6.039885520935059, "global_step": 77421, "epoch": 1843} {"train_loss": -6.076220512390137, "global_step": 77422, "epoch": 1843} {"train_loss": -6.060980796813965, "global_step": 77423, "epoch": 1843} {"train_loss": -6.210726737976074, "global_step": 77424, "epoch": 1843} {"train_loss": -6.136166572570801, "global_step": 77425, "epoch": 1843} {"train_loss": -6.106398582458496, "global_step": 77426, "epoch": 1843} {"train_loss": -6.031464576721191, "global_step": 77427, "epoch": 1843} {"train_loss": -6.103171348571777, "global_step": 77428, "epoch": 1843} {"train_loss": -6.131082057952881, "global_step": 77429, "epoch": 1843} {"train_loss": -6.148217678070068, "global_step": 77430, "epoch": 1843} {"train_loss": -6.219005584716797, "global_step": 77431, "epoch": 1843} {"train_loss": -6.140210151672363, "global_step": 77432, "epoch": 1843} {"train_loss": -6.19217586517334, "global_step": 77433, "epoch": 1843} {"train_loss": -6.0402679443359375, "global_step": 77434, "epoch": 1843} {"train_loss": -6.175619125366211, "global_step": 77435, "epoch": 1843} {"train_loss": -6.235321998596191, "global_step": 77436, "epoch": 1843} {"train_loss": -6.020319938659668, "global_step": 77437, "epoch": 1843} {"train_loss": -6.048282623291016, "global_step": 77438, "epoch": 1843} {"train_loss": -6.074132442474365, "global_step": 77439, "epoch": 1843} {"train_loss": -6.124556541442871, "global_step": 77440, "epoch": 1843} {"train_loss": -6.110705375671387, "global_step": 77441, "epoch": 1843} {"train_loss": -6.131497859954834, "global_step": 77442, "epoch": 1843} {"train_loss": -6.090967178344727, "global_step": 77443, "epoch": 1843} {"train_loss": -6.184270858764648, "global_step": 77444, "epoch": 1843} {"train_loss": -6.059940814971924, "global_step": 77445, "epoch": 1843} {"train_loss": -6.186936855316162, "global_step": 77446, "epoch": 1843} {"train_loss": -6.120429402305966, "global_step": 77447, "epoch": 1843, "val_loss": 74869.6015625} {"train_loss": -6.259934425354004, "global_step": 77448, "epoch": 1844} {"train_loss": -6.238123893737793, "global_step": 77449, "epoch": 1844} {"train_loss": -6.076597213745117, "global_step": 77450, "epoch": 1844} {"train_loss": -6.179128170013428, "global_step": 77451, "epoch": 1844} {"train_loss": -6.115556240081787, "global_step": 77452, "epoch": 1844} {"train_loss": -6.262214660644531, "global_step": 77453, "epoch": 1844} {"train_loss": -6.009227275848389, "global_step": 77454, "epoch": 1844} {"train_loss": -6.226802825927734, "global_step": 77455, "epoch": 1844} {"train_loss": -6.170955657958984, "global_step": 77456, "epoch": 1844} {"train_loss": -6.2118072509765625, "global_step": 77457, "epoch": 1844} {"train_loss": -6.058502197265625, "global_step": 77458, "epoch": 1844} {"train_loss": -6.176882743835449, "global_step": 77459, "epoch": 1844} {"train_loss": -6.069996356964111, "global_step": 77460, "epoch": 1844} {"train_loss": -5.9856367111206055, "global_step": 77461, "epoch": 1844} {"train_loss": -6.048923492431641, "global_step": 77462, "epoch": 1844} {"train_loss": -6.121129989624023, "global_step": 77463, "epoch": 1844} {"train_loss": -6.138009071350098, "global_step": 77464, "epoch": 1844} {"train_loss": -6.200839996337891, "global_step": 77465, "epoch": 1844} {"train_loss": -6.117674827575684, "global_step": 77466, "epoch": 1844} {"train_loss": -6.064470291137695, "global_step": 77467, "epoch": 1844} {"train_loss": -6.096975803375244, "global_step": 77468, "epoch": 1844} {"train_loss": -6.15270471572876, "global_step": 77469, "epoch": 1844} {"train_loss": -6.090468406677246, "global_step": 77470, "epoch": 1844} {"train_loss": -6.117311954498291, "global_step": 77471, "epoch": 1844} {"train_loss": -6.148796558380127, "global_step": 77472, "epoch": 1844} {"train_loss": -6.155917167663574, "global_step": 77473, "epoch": 1844} {"train_loss": -5.998495101928711, "global_step": 77474, "epoch": 1844} {"train_loss": -6.227817535400391, "global_step": 77475, "epoch": 1844} {"train_loss": -6.160189628601074, "global_step": 77476, "epoch": 1844} {"train_loss": -6.010654926300049, "global_step": 77477, "epoch": 1844} {"train_loss": -6.232415199279785, "global_step": 77478, "epoch": 1844} {"train_loss": -6.149382591247559, "global_step": 77479, "epoch": 1844} {"train_loss": -5.998403549194336, "global_step": 77480, "epoch": 1844} {"train_loss": -6.160857677459717, "global_step": 77481, "epoch": 1844} {"train_loss": -6.137419700622559, "global_step": 77482, "epoch": 1844} {"train_loss": -6.090226650238037, "global_step": 77483, "epoch": 1844} {"train_loss": -6.151503086090088, "global_step": 77484, "epoch": 1844} {"train_loss": -6.08404541015625, "global_step": 77485, "epoch": 1844} {"train_loss": -6.098003387451172, "global_step": 77486, "epoch": 1844} {"train_loss": -6.1527252197265625, "global_step": 77487, "epoch": 1844} {"train_loss": -5.885644912719727, "global_step": 77488, "epoch": 1844} {"train_loss": -6.119889236631847, "global_step": 77489, "epoch": 1844, "val_loss": 74972.125} {"train_loss": -6.026886463165283, "global_step": 77490, "epoch": 1845} {"train_loss": -5.990798473358154, "global_step": 77491, "epoch": 1845} {"train_loss": -6.0930867195129395, "global_step": 77492, "epoch": 1845} {"train_loss": -6.16159725189209, "global_step": 77493, "epoch": 1845} {"train_loss": -6.039279460906982, "global_step": 77494, "epoch": 1845} {"train_loss": -6.053024768829346, "global_step": 77495, "epoch": 1845} {"train_loss": -6.007575511932373, "global_step": 77496, "epoch": 1845} {"train_loss": -6.1058759689331055, "global_step": 77497, "epoch": 1845} {"train_loss": -6.05360746383667, "global_step": 77498, "epoch": 1845} {"train_loss": -6.1189799308776855, "global_step": 77499, "epoch": 1845} {"train_loss": -6.044501304626465, "global_step": 77500, "epoch": 1845} {"train_loss": -6.0730814933776855, "global_step": 77501, "epoch": 1845} {"train_loss": -6.049476623535156, "global_step": 77502, "epoch": 1845} {"train_loss": -5.992145538330078, "global_step": 77503, "epoch": 1845} {"train_loss": -6.110661506652832, "global_step": 77504, "epoch": 1845} {"train_loss": -6.1192803382873535, "global_step": 77505, "epoch": 1845} {"train_loss": -6.166420936584473, "global_step": 77506, "epoch": 1845} {"train_loss": -6.170445442199707, "global_step": 77507, "epoch": 1845} {"train_loss": -6.188167572021484, "global_step": 77508, "epoch": 1845} {"train_loss": -6.088430404663086, "global_step": 77509, "epoch": 1845} {"train_loss": -6.12347412109375, "global_step": 77510, "epoch": 1845} {"train_loss": -6.136763095855713, "global_step": 77511, "epoch": 1845} {"train_loss": -6.024455547332764, "global_step": 77512, "epoch": 1845} {"train_loss": -6.174679279327393, "global_step": 77513, "epoch": 1845} {"train_loss": -6.015332221984863, "global_step": 77514, "epoch": 1845} {"train_loss": -6.023079872131348, "global_step": 77515, "epoch": 1845} {"train_loss": -6.106253623962402, "global_step": 77516, "epoch": 1845} {"train_loss": -6.2047271728515625, "global_step": 77517, "epoch": 1845} {"train_loss": -5.9932451248168945, "global_step": 77518, "epoch": 1845} {"train_loss": -6.10049295425415, "global_step": 77519, "epoch": 1845} {"train_loss": -6.115663528442383, "global_step": 77520, "epoch": 1845} {"train_loss": -6.1233086585998535, "global_step": 77521, "epoch": 1845} {"train_loss": -6.125775337219238, "global_step": 77522, "epoch": 1845} {"train_loss": -6.024199962615967, "global_step": 77523, "epoch": 1845} {"train_loss": -6.218048095703125, "global_step": 77524, "epoch": 1845} {"train_loss": -6.129611015319824, "global_step": 77525, "epoch": 1845} {"train_loss": -6.089484214782715, "global_step": 77526, "epoch": 1845} {"train_loss": -5.95021915435791, "global_step": 77527, "epoch": 1845} {"train_loss": -6.017565727233887, "global_step": 77528, "epoch": 1845} {"train_loss": -6.162955284118652, "global_step": 77529, "epoch": 1845} {"train_loss": -6.043292045593262, "global_step": 77530, "epoch": 1845} {"train_loss": -6.0851925781794955, "global_step": 77531, "epoch": 1845, "val_loss": 74721.203125} {"train_loss": -5.994467735290527, "global_step": 77532, "epoch": 1846} {"train_loss": -6.138803482055664, "global_step": 77533, "epoch": 1846} {"train_loss": -6.190228462219238, "global_step": 77534, "epoch": 1846} {"train_loss": -6.247757911682129, "global_step": 77535, "epoch": 1846} {"train_loss": -6.124546051025391, "global_step": 77536, "epoch": 1846} {"train_loss": -6.080230712890625, "global_step": 77537, "epoch": 1846} {"train_loss": -6.078321933746338, "global_step": 77538, "epoch": 1846} {"train_loss": -6.233855247497559, "global_step": 77539, "epoch": 1846} {"train_loss": -6.112984657287598, "global_step": 77540, "epoch": 1846} {"train_loss": -6.091111183166504, "global_step": 77541, "epoch": 1846} {"train_loss": -6.096033096313477, "global_step": 77542, "epoch": 1846} {"train_loss": -6.010288238525391, "global_step": 77543, "epoch": 1846} {"train_loss": -6.143557548522949, "global_step": 77544, "epoch": 1846} {"train_loss": -6.008474826812744, "global_step": 77545, "epoch": 1846} {"train_loss": -6.157238960266113, "global_step": 77546, "epoch": 1846} {"train_loss": -6.1039719581604, "global_step": 77547, "epoch": 1846} {"train_loss": -6.173083305358887, "global_step": 77548, "epoch": 1846} {"train_loss": -5.975017547607422, "global_step": 77549, "epoch": 1846} {"train_loss": -5.977888107299805, "global_step": 77550, "epoch": 1846} {"train_loss": -6.125668525695801, "global_step": 77551, "epoch": 1846} {"train_loss": -6.102014064788818, "global_step": 77552, "epoch": 1846} {"train_loss": -6.157289505004883, "global_step": 77553, "epoch": 1846} {"train_loss": -6.136754035949707, "global_step": 77554, "epoch": 1846} {"train_loss": -6.115573883056641, "global_step": 77555, "epoch": 1846} {"train_loss": -6.13105583190918, "global_step": 77556, "epoch": 1846} {"train_loss": -6.074948787689209, "global_step": 77557, "epoch": 1846} {"train_loss": -6.184858322143555, "global_step": 77558, "epoch": 1846} {"train_loss": -6.134836196899414, "global_step": 77559, "epoch": 1846} {"train_loss": -6.083286762237549, "global_step": 77560, "epoch": 1846} {"train_loss": -6.082683086395264, "global_step": 77561, "epoch": 1846} {"train_loss": -6.074753761291504, "global_step": 77562, "epoch": 1846} {"train_loss": -5.992276191711426, "global_step": 77563, "epoch": 1846} {"train_loss": -6.076606750488281, "global_step": 77564, "epoch": 1846} {"train_loss": -5.997506141662598, "global_step": 77565, "epoch": 1846} {"train_loss": -6.035907745361328, "global_step": 77566, "epoch": 1846} {"train_loss": -6.058377265930176, "global_step": 77567, "epoch": 1846} {"train_loss": -6.160472869873047, "global_step": 77568, "epoch": 1846} {"train_loss": -6.108340740203857, "global_step": 77569, "epoch": 1846} {"train_loss": -6.080550193786621, "global_step": 77570, "epoch": 1846} {"train_loss": -5.92064905166626, "global_step": 77571, "epoch": 1846} {"train_loss": -6.117428779602051, "global_step": 77572, "epoch": 1846} {"train_loss": -6.09631822222755, "global_step": 77573, "epoch": 1846, "val_loss": 75157.53125} {"train_loss": -6.112316131591797, "global_step": 77574, "epoch": 1847} {"train_loss": -6.124646186828613, "global_step": 77575, "epoch": 1847} {"train_loss": -6.117462635040283, "global_step": 77576, "epoch": 1847} {"train_loss": -6.16069221496582, "global_step": 77577, "epoch": 1847} {"train_loss": -6.097452640533447, "global_step": 77578, "epoch": 1847} {"train_loss": -6.0649261474609375, "global_step": 77579, "epoch": 1847} {"train_loss": -6.271333694458008, "global_step": 77580, "epoch": 1847} {"train_loss": -6.15479850769043, "global_step": 77581, "epoch": 1847} {"train_loss": -6.046533107757568, "global_step": 77582, "epoch": 1847} {"train_loss": -6.089692115783691, "global_step": 77583, "epoch": 1847} {"train_loss": -6.17406702041626, "global_step": 77584, "epoch": 1847} {"train_loss": -6.159444332122803, "global_step": 77585, "epoch": 1847} {"train_loss": -6.193052291870117, "global_step": 77586, "epoch": 1847} {"train_loss": -6.188162803649902, "global_step": 77587, "epoch": 1847} {"train_loss": -6.1610002517700195, "global_step": 77588, "epoch": 1847} {"train_loss": -6.046974182128906, "global_step": 77589, "epoch": 1847} {"train_loss": -6.117405414581299, "global_step": 77590, "epoch": 1847} {"train_loss": -5.996256351470947, "global_step": 77591, "epoch": 1847} {"train_loss": -6.072971820831299, "global_step": 77592, "epoch": 1847} {"train_loss": -6.0361738204956055, "global_step": 77593, "epoch": 1847} {"train_loss": -6.1256914138793945, "global_step": 77594, "epoch": 1847} {"train_loss": -6.138415336608887, "global_step": 77595, "epoch": 1847} {"train_loss": -5.921688556671143, "global_step": 77596, "epoch": 1847} {"train_loss": -6.048233985900879, "global_step": 77597, "epoch": 1847} {"train_loss": -6.097790718078613, "global_step": 77598, "epoch": 1847} {"train_loss": -6.0539445877075195, "global_step": 77599, "epoch": 1847} {"train_loss": -6.014252185821533, "global_step": 77600, "epoch": 1847} {"train_loss": -5.890722751617432, "global_step": 77601, "epoch": 1847} {"train_loss": -5.83974552154541, "global_step": 77602, "epoch": 1847} {"train_loss": -6.074469566345215, "global_step": 77603, "epoch": 1847} {"train_loss": -6.039464950561523, "global_step": 77604, "epoch": 1847} {"train_loss": -6.02174186706543, "global_step": 77605, "epoch": 1847} {"train_loss": -6.090850830078125, "global_step": 77606, "epoch": 1847} {"train_loss": -5.944864273071289, "global_step": 77607, "epoch": 1847} {"train_loss": -6.040168762207031, "global_step": 77608, "epoch": 1847} {"train_loss": -5.92889928817749, "global_step": 77609, "epoch": 1847} {"train_loss": -5.9434590339660645, "global_step": 77610, "epoch": 1847} {"train_loss": -6.08017635345459, "global_step": 77611, "epoch": 1847} {"train_loss": -5.918222904205322, "global_step": 77612, "epoch": 1847} {"train_loss": -6.066300868988037, "global_step": 77613, "epoch": 1847} {"train_loss": -5.932100296020508, "global_step": 77614, "epoch": 1847} {"train_loss": -6.0639640263148715, "global_step": 77615, "epoch": 1847, "val_loss": 75171.546875} {"train_loss": -6.0023698806762695, "global_step": 77616, "epoch": 1848} {"train_loss": -6.036478519439697, "global_step": 77617, "epoch": 1848} {"train_loss": -6.018842697143555, "global_step": 77618, "epoch": 1848} {"train_loss": -6.14570426940918, "global_step": 77619, "epoch": 1848} {"train_loss": -6.026920318603516, "global_step": 77620, "epoch": 1848} {"train_loss": -5.989189624786377, "global_step": 77621, "epoch": 1848} {"train_loss": -6.167909145355225, "global_step": 77622, "epoch": 1848} {"train_loss": -6.004793167114258, "global_step": 77623, "epoch": 1848} {"train_loss": -6.0581583976745605, "global_step": 77624, "epoch": 1848} {"train_loss": -6.17758846282959, "global_step": 77625, "epoch": 1848} {"train_loss": -6.07259464263916, "global_step": 77626, "epoch": 1848} {"train_loss": -6.106257438659668, "global_step": 77627, "epoch": 1848} {"train_loss": -6.092612266540527, "global_step": 77628, "epoch": 1848} {"train_loss": -6.095612525939941, "global_step": 77629, "epoch": 1848} {"train_loss": -6.10228157043457, "global_step": 77630, "epoch": 1848} {"train_loss": -6.175042629241943, "global_step": 77631, "epoch": 1848} {"train_loss": -6.208110809326172, "global_step": 77632, "epoch": 1848} {"train_loss": -6.214014530181885, "global_step": 77633, "epoch": 1848} {"train_loss": -6.058582305908203, "global_step": 77634, "epoch": 1848} {"train_loss": -6.060019493103027, "global_step": 77635, "epoch": 1848} {"train_loss": -6.016839027404785, "global_step": 77636, "epoch": 1848} {"train_loss": -6.145185947418213, "global_step": 77637, "epoch": 1848} {"train_loss": -6.225873947143555, "global_step": 77638, "epoch": 1848} {"train_loss": -6.0608601570129395, "global_step": 77639, "epoch": 1848} {"train_loss": -6.123964309692383, "global_step": 77640, "epoch": 1848} {"train_loss": -6.029329776763916, "global_step": 77641, "epoch": 1848} {"train_loss": -6.005544185638428, "global_step": 77642, "epoch": 1848} {"train_loss": -5.969599723815918, "global_step": 77643, "epoch": 1848} {"train_loss": -6.165848731994629, "global_step": 77644, "epoch": 1848} {"train_loss": -6.006019592285156, "global_step": 77645, "epoch": 1848} {"train_loss": -6.099345684051514, "global_step": 77646, "epoch": 1848} {"train_loss": -6.03573751449585, "global_step": 77647, "epoch": 1848} {"train_loss": -6.042149543762207, "global_step": 77648, "epoch": 1848} {"train_loss": -6.054257869720459, "global_step": 77649, "epoch": 1848} {"train_loss": -6.033520221710205, "global_step": 77650, "epoch": 1848} {"train_loss": -6.125037670135498, "global_step": 77651, "epoch": 1848} {"train_loss": -6.062724590301514, "global_step": 77652, "epoch": 1848} {"train_loss": -6.126786231994629, "global_step": 77653, "epoch": 1848} {"train_loss": -6.138016700744629, "global_step": 77654, "epoch": 1848} {"train_loss": -5.986461639404297, "global_step": 77655, "epoch": 1848} {"train_loss": -6.040354251861572, "global_step": 77656, "epoch": 1848} {"train_loss": -6.082020577930269, "global_step": 77657, "epoch": 1848, "val_loss": 74661.78125} {"train_loss": -6.093502044677734, "global_step": 77658, "epoch": 1849} {"train_loss": -6.000103950500488, "global_step": 77659, "epoch": 1849} {"train_loss": -6.029098033905029, "global_step": 77660, "epoch": 1849} {"train_loss": -6.0695271492004395, "global_step": 77661, "epoch": 1849} {"train_loss": -6.154356002807617, "global_step": 77662, "epoch": 1849} {"train_loss": -5.9609055519104, "global_step": 77663, "epoch": 1849} {"train_loss": -6.0607218742370605, "global_step": 77664, "epoch": 1849} {"train_loss": -6.115800857543945, "global_step": 77665, "epoch": 1849} {"train_loss": -6.14108943939209, "global_step": 77666, "epoch": 1849} {"train_loss": -6.064810752868652, "global_step": 77667, "epoch": 1849} {"train_loss": -6.1856489181518555, "global_step": 77668, "epoch": 1849} {"train_loss": -6.154496192932129, "global_step": 77669, "epoch": 1849} {"train_loss": -6.154463768005371, "global_step": 77670, "epoch": 1849} {"train_loss": -6.042232513427734, "global_step": 77671, "epoch": 1849} {"train_loss": -6.148890495300293, "global_step": 77672, "epoch": 1849} {"train_loss": -6.123772621154785, "global_step": 77673, "epoch": 1849} {"train_loss": -6.172402381896973, "global_step": 77674, "epoch": 1849} {"train_loss": -6.195962905883789, "global_step": 77675, "epoch": 1849} {"train_loss": -6.042242050170898, "global_step": 77676, "epoch": 1849} {"train_loss": -6.1591949462890625, "global_step": 77677, "epoch": 1849} {"train_loss": -6.101235389709473, "global_step": 77678, "epoch": 1849} {"train_loss": -6.1231608390808105, "global_step": 77679, "epoch": 1849} {"train_loss": -6.103606224060059, "global_step": 77680, "epoch": 1849} {"train_loss": -6.133946418762207, "global_step": 77681, "epoch": 1849} {"train_loss": -6.019118309020996, "global_step": 77682, "epoch": 1849} {"train_loss": -6.142102241516113, "global_step": 77683, "epoch": 1849} {"train_loss": -5.996604919433594, "global_step": 77684, "epoch": 1849} {"train_loss": -6.066983222961426, "global_step": 77685, "epoch": 1849} {"train_loss": -6.046669960021973, "global_step": 77686, "epoch": 1849} {"train_loss": -6.10154914855957, "global_step": 77687, "epoch": 1849} {"train_loss": -6.275888919830322, "global_step": 77688, "epoch": 1849} {"train_loss": -6.013218879699707, "global_step": 77689, "epoch": 1849} {"train_loss": -6.105197906494141, "global_step": 77690, "epoch": 1849} {"train_loss": -6.0558905601501465, "global_step": 77691, "epoch": 1849} {"train_loss": -6.087693214416504, "global_step": 77692, "epoch": 1849} {"train_loss": -6.006183624267578, "global_step": 77693, "epoch": 1849} {"train_loss": -6.115633010864258, "global_step": 77694, "epoch": 1849} {"train_loss": -6.106385231018066, "global_step": 77695, "epoch": 1849} {"train_loss": -6.090597629547119, "global_step": 77696, "epoch": 1849} {"train_loss": -6.104034423828125, "global_step": 77697, "epoch": 1849} {"train_loss": -6.1283159255981445, "global_step": 77698, "epoch": 1849} {"train_loss": -6.096511761347453, "global_step": 77699, "epoch": 1849, "val_loss": 74803.265625} {"train_loss": -6.151224136352539, "global_step": 77700, "epoch": 1850} {"train_loss": -6.108433246612549, "global_step": 77701, "epoch": 1850} {"train_loss": -6.078466415405273, "global_step": 77702, "epoch": 1850} {"train_loss": -6.052824974060059, "global_step": 77703, "epoch": 1850} {"train_loss": -5.939783573150635, "global_step": 77704, "epoch": 1850} {"train_loss": -6.151848793029785, "global_step": 77705, "epoch": 1850} {"train_loss": -6.059014320373535, "global_step": 77706, "epoch": 1850} {"train_loss": -6.011211395263672, "global_step": 77707, "epoch": 1850} {"train_loss": -6.212197303771973, "global_step": 77708, "epoch": 1850} {"train_loss": -5.925966262817383, "global_step": 77709, "epoch": 1850} {"train_loss": -6.129115104675293, "global_step": 77710, "epoch": 1850} {"train_loss": -6.0171356201171875, "global_step": 77711, "epoch": 1850} {"train_loss": -6.11867618560791, "global_step": 77712, "epoch": 1850} {"train_loss": -6.0917158126831055, "global_step": 77713, "epoch": 1850} {"train_loss": -5.985658168792725, "global_step": 77714, "epoch": 1850} {"train_loss": -6.022346496582031, "global_step": 77715, "epoch": 1850} {"train_loss": -5.970347881317139, "global_step": 77716, "epoch": 1850} {"train_loss": -6.232757568359375, "global_step": 77717, "epoch": 1850} {"train_loss": -6.0162248611450195, "global_step": 77718, "epoch": 1850} {"train_loss": -6.093608379364014, "global_step": 77719, "epoch": 1850} {"train_loss": -6.029963970184326, "global_step": 77720, "epoch": 1850} {"train_loss": -6.162376403808594, "global_step": 77721, "epoch": 1850} {"train_loss": -6.109614849090576, "global_step": 77722, "epoch": 1850} {"train_loss": -6.201457977294922, "global_step": 77723, "epoch": 1850} {"train_loss": -6.046712875366211, "global_step": 77724, "epoch": 1850} {"train_loss": -6.180970191955566, "global_step": 77725, "epoch": 1850} {"train_loss": -6.170273780822754, "global_step": 77726, "epoch": 1850} {"train_loss": -6.200337886810303, "global_step": 77727, "epoch": 1850} {"train_loss": -6.166360378265381, "global_step": 77728, "epoch": 1850} {"train_loss": -6.001243591308594, "global_step": 77729, "epoch": 1850} {"train_loss": -6.135018348693848, "global_step": 77730, "epoch": 1850} {"train_loss": -6.265051364898682, "global_step": 77731, "epoch": 1850} {"train_loss": -6.106518268585205, "global_step": 77732, "epoch": 1850} {"train_loss": -6.1744384765625, "global_step": 77733, "epoch": 1850} {"train_loss": -6.113278388977051, "global_step": 77734, "epoch": 1850} {"train_loss": -6.064087867736816, "global_step": 77735, "epoch": 1850} {"train_loss": -6.1293416023254395, "global_step": 77736, "epoch": 1850} {"train_loss": -6.115701675415039, "global_step": 77737, "epoch": 1850} {"train_loss": -6.1498942375183105, "global_step": 77738, "epoch": 1850} {"train_loss": -6.206136226654053, "global_step": 77739, "epoch": 1850} {"train_loss": -6.073064804077148, "global_step": 77740, "epoch": 1850} {"train_loss": -6.10065948395502, "global_step": 77741, "epoch": 1850, "train/sim_max_reward_0": 0.6590008770813806, "train/sim_max_reward_1": 0.9124048024040071, "train/sim_max_reward_2": 0.21333627762245921, "train/sim_max_reward_3": 0.1408660111174851, "train/sim_max_reward_4": 0.9003318690189084, "train/sim_max_reward_5": 0.8371794966706914, "test/sim_max_reward_4500000": 0.42992449281993456, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.786635389678195, "test/sim_max_reward_4500003": 0.8067069096971409, "test/sim_max_reward_4500004": 0.4473065366337754, "test/sim_max_reward_4500005": 0.3951342575961945, "test/sim_max_reward_4500006": 0.9461165920415215, "test/sim_max_reward_4500007": 0.40343072676702085, "test/sim_max_reward_4500008": 0.15712365284072222, "test/sim_max_reward_4500009": 0.9934459453804014, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.384361283952074, "test/sim_max_reward_4500012": 0.05952748138904909, "test/sim_max_reward_4500013": 0.001667619704353123, "test/sim_max_reward_4500014": 0.3745324060243907, "test/sim_max_reward_4500015": 0.04781148072562116, "test/sim_max_reward_4500016": 0.9165864535851858, "test/sim_max_reward_4500017": 0.05063104588308876, "test/sim_max_reward_4500018": 0.3243083032898816, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.8381755143142581, "test/sim_max_reward_4500021": 0.9600703447183809, "test/sim_max_reward_4500022": 0.9021660016197305, "test/sim_max_reward_4500023": 0.8452407670106256, "test/sim_max_reward_4500024": 0.8567456401380059, "test/sim_max_reward_4500025": 9.587102314505429e-05, "test/sim_max_reward_4500026": 0.9238042883606338, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.0484743654483636, "test/sim_max_reward_4500030": 0.9583484159745486, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05274732172940062, "test/sim_max_reward_4500033": 0.9091953385938951, "test/sim_max_reward_4500034": 1.0, "test/sim_max_reward_4500035": 0.732372933319549, "test/sim_max_reward_4500036": 0.3624109961058175, "test/sim_max_reward_4500037": 0.8020636983881936, "test/sim_max_reward_4500038": 0.8570703219198625, "test/sim_max_reward_4500039": 0.9633622924383787, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.2952074920521712, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.2148123190629423, "test/sim_max_reward_4500044": 0.9258845219091761, "test/sim_max_reward_4500045": 0.7673220612204742, "test/sim_max_reward_4500046": 0.7698081132381168, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9643051550762091, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6105198889858219, "test/mean_score": 0.5216103817397969, "val_loss": 75012.6015625} {"train_loss": -6.18870735168457, "global_step": 77742, "epoch": 1851} {"train_loss": -6.22442626953125, "global_step": 77743, "epoch": 1851} {"train_loss": -6.069429874420166, "global_step": 77744, "epoch": 1851} {"train_loss": -6.070757865905762, "global_step": 77745, "epoch": 1851} {"train_loss": -6.072995185852051, "global_step": 77746, "epoch": 1851} {"train_loss": -6.221271514892578, "global_step": 77747, "epoch": 1851} {"train_loss": -6.083510398864746, "global_step": 77748, "epoch": 1851} {"train_loss": -5.997772693634033, "global_step": 77749, "epoch": 1851} {"train_loss": -6.159656524658203, "global_step": 77750, "epoch": 1851} {"train_loss": -6.091396331787109, "global_step": 77751, "epoch": 1851} {"train_loss": -6.125987529754639, "global_step": 77752, "epoch": 1851} {"train_loss": -6.152606010437012, "global_step": 77753, "epoch": 1851} {"train_loss": -6.045950889587402, "global_step": 77754, "epoch": 1851} {"train_loss": -6.152036666870117, "global_step": 77755, "epoch": 1851} {"train_loss": -6.133944511413574, "global_step": 77756, "epoch": 1851} {"train_loss": -6.221266746520996, "global_step": 77757, "epoch": 1851} {"train_loss": -6.178285598754883, "global_step": 77758, "epoch": 1851} {"train_loss": -6.231402397155762, "global_step": 77759, "epoch": 1851} {"train_loss": -6.173108100891113, "global_step": 77760, "epoch": 1851} {"train_loss": -6.224773406982422, "global_step": 77761, "epoch": 1851} {"train_loss": -6.040509223937988, "global_step": 77762, "epoch": 1851} {"train_loss": -6.139601707458496, "global_step": 77763, "epoch": 1851} {"train_loss": -6.1574387550354, "global_step": 77764, "epoch": 1851} {"train_loss": -6.0868096351623535, "global_step": 77765, "epoch": 1851} {"train_loss": -6.125657081604004, "global_step": 77766, "epoch": 1851} {"train_loss": -6.123499870300293, "global_step": 77767, "epoch": 1851} {"train_loss": -6.202781677246094, "global_step": 77768, "epoch": 1851} {"train_loss": -6.2331085205078125, "global_step": 77769, "epoch": 1851} {"train_loss": -6.188207149505615, "global_step": 77770, "epoch": 1851} {"train_loss": -6.031152725219727, "global_step": 77771, "epoch": 1851} {"train_loss": -6.023101806640625, "global_step": 77772, "epoch": 1851} {"train_loss": -6.100625514984131, "global_step": 77773, "epoch": 1851} {"train_loss": -6.2062249183654785, "global_step": 77774, "epoch": 1851} {"train_loss": -6.12428092956543, "global_step": 77775, "epoch": 1851} {"train_loss": -5.988730430603027, "global_step": 77776, "epoch": 1851} {"train_loss": -6.096490859985352, "global_step": 77777, "epoch": 1851} {"train_loss": -6.187871932983398, "global_step": 77778, "epoch": 1851} {"train_loss": -6.008240222930908, "global_step": 77779, "epoch": 1851} {"train_loss": -6.17830753326416, "global_step": 77780, "epoch": 1851} {"train_loss": -6.298770427703857, "global_step": 77781, "epoch": 1851} {"train_loss": -6.051792144775391, "global_step": 77782, "epoch": 1851} {"train_loss": -6.131300835382371, "global_step": 77783, "epoch": 1851, "val_loss": 74926.1484375} {"train_loss": -6.087480068206787, "global_step": 77784, "epoch": 1852} {"train_loss": -6.057122230529785, "global_step": 77785, "epoch": 1852} {"train_loss": -6.1204118728637695, "global_step": 77786, "epoch": 1852} {"train_loss": -6.0820207595825195, "global_step": 77787, "epoch": 1852} {"train_loss": -6.137324333190918, "global_step": 77788, "epoch": 1852} {"train_loss": -6.1504130363464355, "global_step": 77789, "epoch": 1852} {"train_loss": -6.212940692901611, "global_step": 77790, "epoch": 1852} {"train_loss": -6.012676239013672, "global_step": 77791, "epoch": 1852} {"train_loss": -6.210537433624268, "global_step": 77792, "epoch": 1852} {"train_loss": -6.146037578582764, "global_step": 77793, "epoch": 1852} {"train_loss": -6.0917744636535645, "global_step": 77794, "epoch": 1852} {"train_loss": -6.0880231857299805, "global_step": 77795, "epoch": 1852} {"train_loss": -6.028033256530762, "global_step": 77796, "epoch": 1852} {"train_loss": -6.054973602294922, "global_step": 77797, "epoch": 1852} {"train_loss": -6.035591125488281, "global_step": 77798, "epoch": 1852} {"train_loss": -6.018877983093262, "global_step": 77799, "epoch": 1852} {"train_loss": -6.092031478881836, "global_step": 77800, "epoch": 1852} {"train_loss": -6.073239803314209, "global_step": 77801, "epoch": 1852} {"train_loss": -5.97674560546875, "global_step": 77802, "epoch": 1852} {"train_loss": -6.053797721862793, "global_step": 77803, "epoch": 1852} {"train_loss": -6.04930305480957, "global_step": 77804, "epoch": 1852} {"train_loss": -6.036518096923828, "global_step": 77805, "epoch": 1852} {"train_loss": -6.059211730957031, "global_step": 77806, "epoch": 1852} {"train_loss": -6.012218475341797, "global_step": 77807, "epoch": 1852} {"train_loss": -6.102594375610352, "global_step": 77808, "epoch": 1852} {"train_loss": -6.037010192871094, "global_step": 77809, "epoch": 1852} {"train_loss": -6.083893299102783, "global_step": 77810, "epoch": 1852} {"train_loss": -6.026352882385254, "global_step": 77811, "epoch": 1852} {"train_loss": -6.062074184417725, "global_step": 77812, "epoch": 1852} {"train_loss": -6.096319198608398, "global_step": 77813, "epoch": 1852} {"train_loss": -5.933155059814453, "global_step": 77814, "epoch": 1852} {"train_loss": -6.057774066925049, "global_step": 77815, "epoch": 1852} {"train_loss": -5.9090576171875, "global_step": 77816, "epoch": 1852} {"train_loss": -6.147802829742432, "global_step": 77817, "epoch": 1852} {"train_loss": -6.0173234939575195, "global_step": 77818, "epoch": 1852} {"train_loss": -6.1175713539123535, "global_step": 77819, "epoch": 1852} {"train_loss": -6.069544792175293, "global_step": 77820, "epoch": 1852} {"train_loss": -6.085577011108398, "global_step": 77821, "epoch": 1852} {"train_loss": -5.934910297393799, "global_step": 77822, "epoch": 1852} {"train_loss": -5.986630439758301, "global_step": 77823, "epoch": 1852} {"train_loss": -6.040284156799316, "global_step": 77824, "epoch": 1852} {"train_loss": -6.0630640756516225, "global_step": 77825, "epoch": 1852, "val_loss": 74985.3515625} {"train_loss": -6.025245666503906, "global_step": 77826, "epoch": 1853} {"train_loss": -6.069192409515381, "global_step": 77827, "epoch": 1853} {"train_loss": -5.943583011627197, "global_step": 77828, "epoch": 1853} {"train_loss": -6.058258056640625, "global_step": 77829, "epoch": 1853} {"train_loss": -6.066720008850098, "global_step": 77830, "epoch": 1853} {"train_loss": -6.048225402832031, "global_step": 77831, "epoch": 1853} {"train_loss": -6.118600845336914, "global_step": 77832, "epoch": 1853} {"train_loss": -6.087434768676758, "global_step": 77833, "epoch": 1853} {"train_loss": -6.105670928955078, "global_step": 77834, "epoch": 1853} {"train_loss": -6.062598705291748, "global_step": 77835, "epoch": 1853} {"train_loss": -6.084096431732178, "global_step": 77836, "epoch": 1853} {"train_loss": -6.073185920715332, "global_step": 77837, "epoch": 1853} {"train_loss": -6.059269905090332, "global_step": 77838, "epoch": 1853} {"train_loss": -6.031782150268555, "global_step": 77839, "epoch": 1853} {"train_loss": -6.117154121398926, "global_step": 77840, "epoch": 1853} {"train_loss": -6.112433433532715, "global_step": 77841, "epoch": 1853} {"train_loss": -6.158656120300293, "global_step": 77842, "epoch": 1853} {"train_loss": -6.042116165161133, "global_step": 77843, "epoch": 1853} {"train_loss": -6.211893081665039, "global_step": 77844, "epoch": 1853} {"train_loss": -6.075077533721924, "global_step": 77845, "epoch": 1853} {"train_loss": -6.145659446716309, "global_step": 77846, "epoch": 1853} {"train_loss": -6.05006742477417, "global_step": 77847, "epoch": 1853} {"train_loss": -6.169726371765137, "global_step": 77848, "epoch": 1853} {"train_loss": -6.170544624328613, "global_step": 77849, "epoch": 1853} {"train_loss": -6.049280643463135, "global_step": 77850, "epoch": 1853} {"train_loss": -6.133447647094727, "global_step": 77851, "epoch": 1853} {"train_loss": -6.121659278869629, "global_step": 77852, "epoch": 1853} {"train_loss": -6.121390342712402, "global_step": 77853, "epoch": 1853} {"train_loss": -6.185477256774902, "global_step": 77854, "epoch": 1853} {"train_loss": -6.162170886993408, "global_step": 77855, "epoch": 1853} {"train_loss": -6.030099868774414, "global_step": 77856, "epoch": 1853} {"train_loss": -6.1504716873168945, "global_step": 77857, "epoch": 1853} {"train_loss": -6.315126419067383, "global_step": 77858, "epoch": 1853} {"train_loss": -6.090326309204102, "global_step": 77859, "epoch": 1853} {"train_loss": -6.196355819702148, "global_step": 77860, "epoch": 1853} {"train_loss": -6.214267730712891, "global_step": 77861, "epoch": 1853} {"train_loss": -6.154944896697998, "global_step": 77862, "epoch": 1853} {"train_loss": -6.120735168457031, "global_step": 77863, "epoch": 1853} {"train_loss": -6.162197589874268, "global_step": 77864, "epoch": 1853} {"train_loss": -6.136814117431641, "global_step": 77865, "epoch": 1853} {"train_loss": -6.012316703796387, "global_step": 77866, "epoch": 1853} {"train_loss": -6.108274834496634, "global_step": 77867, "epoch": 1853, "val_loss": 75018.9453125} {"train_loss": -5.964992523193359, "global_step": 77868, "epoch": 1854} {"train_loss": -6.07360315322876, "global_step": 77869, "epoch": 1854} {"train_loss": -6.152449607849121, "global_step": 77870, "epoch": 1854} {"train_loss": -5.980344295501709, "global_step": 77871, "epoch": 1854} {"train_loss": -6.130215644836426, "global_step": 77872, "epoch": 1854} {"train_loss": -6.078010559082031, "global_step": 77873, "epoch": 1854} {"train_loss": -6.253026008605957, "global_step": 77874, "epoch": 1854} {"train_loss": -6.1159162521362305, "global_step": 77875, "epoch": 1854} {"train_loss": -6.100552082061768, "global_step": 77876, "epoch": 1854} {"train_loss": -6.111698627471924, "global_step": 77877, "epoch": 1854} {"train_loss": -6.091386795043945, "global_step": 77878, "epoch": 1854} {"train_loss": -6.1194167137146, "global_step": 77879, "epoch": 1854} {"train_loss": -5.986547470092773, "global_step": 77880, "epoch": 1854} {"train_loss": -6.125678539276123, "global_step": 77881, "epoch": 1854} {"train_loss": -6.124938488006592, "global_step": 77882, "epoch": 1854} {"train_loss": -6.2225236892700195, "global_step": 77883, "epoch": 1854} {"train_loss": -6.177091121673584, "global_step": 77884, "epoch": 1854} {"train_loss": -5.981868743896484, "global_step": 77885, "epoch": 1854} {"train_loss": -6.182538986206055, "global_step": 77886, "epoch": 1854} {"train_loss": -6.181295871734619, "global_step": 77887, "epoch": 1854} {"train_loss": -6.162643909454346, "global_step": 77888, "epoch": 1854} {"train_loss": -6.175541400909424, "global_step": 77889, "epoch": 1854} {"train_loss": -6.048813819885254, "global_step": 77890, "epoch": 1854} {"train_loss": -6.063921928405762, "global_step": 77891, "epoch": 1854} {"train_loss": -6.108708381652832, "global_step": 77892, "epoch": 1854} {"train_loss": -6.014553070068359, "global_step": 77893, "epoch": 1854} {"train_loss": -6.049559116363525, "global_step": 77894, "epoch": 1854} {"train_loss": -5.942156791687012, "global_step": 77895, "epoch": 1854} {"train_loss": -6.016100883483887, "global_step": 77896, "epoch": 1854} {"train_loss": -6.020603179931641, "global_step": 77897, "epoch": 1854} {"train_loss": -6.088706970214844, "global_step": 77898, "epoch": 1854} {"train_loss": -6.1365227699279785, "global_step": 77899, "epoch": 1854} {"train_loss": -6.099846839904785, "global_step": 77900, "epoch": 1854} {"train_loss": -6.107295036315918, "global_step": 77901, "epoch": 1854} {"train_loss": -6.035000801086426, "global_step": 77902, "epoch": 1854} {"train_loss": -6.0508270263671875, "global_step": 77903, "epoch": 1854} {"train_loss": -6.128546237945557, "global_step": 77904, "epoch": 1854} {"train_loss": -6.073060989379883, "global_step": 77905, "epoch": 1854} {"train_loss": -6.215639114379883, "global_step": 77906, "epoch": 1854} {"train_loss": -6.1486029624938965, "global_step": 77907, "epoch": 1854} {"train_loss": -6.111837863922119, "global_step": 77908, "epoch": 1854} {"train_loss": -6.094492106210618, "global_step": 77909, "epoch": 1854, "val_loss": 75112.2890625} {"train_loss": -6.1478071212768555, "global_step": 77910, "epoch": 1855} {"train_loss": -6.122960090637207, "global_step": 77911, "epoch": 1855} {"train_loss": -6.15595817565918, "global_step": 77912, "epoch": 1855} {"train_loss": -6.131713390350342, "global_step": 77913, "epoch": 1855} {"train_loss": -6.120239734649658, "global_step": 77914, "epoch": 1855} {"train_loss": -6.073259353637695, "global_step": 77915, "epoch": 1855} {"train_loss": -6.3043622970581055, "global_step": 77916, "epoch": 1855} {"train_loss": -6.1328020095825195, "global_step": 77917, "epoch": 1855} {"train_loss": -6.247715950012207, "global_step": 77918, "epoch": 1855} {"train_loss": -6.147199630737305, "global_step": 77919, "epoch": 1855} {"train_loss": -6.030759811401367, "global_step": 77920, "epoch": 1855} {"train_loss": -6.115620136260986, "global_step": 77921, "epoch": 1855} {"train_loss": -6.238802909851074, "global_step": 77922, "epoch": 1855} {"train_loss": -5.99138879776001, "global_step": 77923, "epoch": 1855} {"train_loss": -6.138670921325684, "global_step": 77924, "epoch": 1855} {"train_loss": -6.088027477264404, "global_step": 77925, "epoch": 1855} {"train_loss": -6.119695663452148, "global_step": 77926, "epoch": 1855} {"train_loss": -6.1440749168396, "global_step": 77927, "epoch": 1855} {"train_loss": -6.051128387451172, "global_step": 77928, "epoch": 1855} {"train_loss": -6.101562023162842, "global_step": 77929, "epoch": 1855} {"train_loss": -6.0557026863098145, "global_step": 77930, "epoch": 1855} {"train_loss": -6.176950931549072, "global_step": 77931, "epoch": 1855} {"train_loss": -6.166213035583496, "global_step": 77932, "epoch": 1855} {"train_loss": -6.059147834777832, "global_step": 77933, "epoch": 1855} {"train_loss": -6.03162956237793, "global_step": 77934, "epoch": 1855} {"train_loss": -6.139340400695801, "global_step": 77935, "epoch": 1855} {"train_loss": -6.113478183746338, "global_step": 77936, "epoch": 1855} {"train_loss": -6.159279823303223, "global_step": 77937, "epoch": 1855} {"train_loss": -6.116392135620117, "global_step": 77938, "epoch": 1855} {"train_loss": -6.213417053222656, "global_step": 77939, "epoch": 1855} {"train_loss": -6.108860015869141, "global_step": 77940, "epoch": 1855} {"train_loss": -6.035225868225098, "global_step": 77941, "epoch": 1855} {"train_loss": -6.153648376464844, "global_step": 77942, "epoch": 1855} {"train_loss": -6.083857536315918, "global_step": 77943, "epoch": 1855} {"train_loss": -6.128936767578125, "global_step": 77944, "epoch": 1855} {"train_loss": -6.145402908325195, "global_step": 77945, "epoch": 1855} {"train_loss": -6.151928424835205, "global_step": 77946, "epoch": 1855} {"train_loss": -6.096683502197266, "global_step": 77947, "epoch": 1855} {"train_loss": -6.181027412414551, "global_step": 77948, "epoch": 1855} {"train_loss": -6.086615562438965, "global_step": 77949, "epoch": 1855} {"train_loss": -6.0025129318237305, "global_step": 77950, "epoch": 1855} {"train_loss": -6.122552111035302, "global_step": 77951, "epoch": 1855, "val_loss": 74938.640625} {"train_loss": -6.086686134338379, "global_step": 77952, "epoch": 1856} {"train_loss": -6.07200813293457, "global_step": 77953, "epoch": 1856} {"train_loss": -6.026202201843262, "global_step": 77954, "epoch": 1856} {"train_loss": -6.088940620422363, "global_step": 77955, "epoch": 1856} {"train_loss": -5.9995927810668945, "global_step": 77956, "epoch": 1856} {"train_loss": -6.072007656097412, "global_step": 77957, "epoch": 1856} {"train_loss": -6.209040641784668, "global_step": 77958, "epoch": 1856} {"train_loss": -6.053956031799316, "global_step": 77959, "epoch": 1856} {"train_loss": -6.105407238006592, "global_step": 77960, "epoch": 1856} {"train_loss": -6.200223922729492, "global_step": 77961, "epoch": 1856} {"train_loss": -6.002843856811523, "global_step": 77962, "epoch": 1856} {"train_loss": -6.034145355224609, "global_step": 77963, "epoch": 1856} {"train_loss": -6.085195064544678, "global_step": 77964, "epoch": 1856} {"train_loss": -6.151120662689209, "global_step": 77965, "epoch": 1856} {"train_loss": -6.130721569061279, "global_step": 77966, "epoch": 1856} {"train_loss": -6.066675186157227, "global_step": 77967, "epoch": 1856} {"train_loss": -6.138460159301758, "global_step": 77968, "epoch": 1856} {"train_loss": -6.141729831695557, "global_step": 77969, "epoch": 1856} {"train_loss": -6.161717414855957, "global_step": 77970, "epoch": 1856} {"train_loss": -6.125308513641357, "global_step": 77971, "epoch": 1856} {"train_loss": -6.128851890563965, "global_step": 77972, "epoch": 1856} {"train_loss": -6.039441108703613, "global_step": 77973, "epoch": 1856} {"train_loss": -6.174946308135986, "global_step": 77974, "epoch": 1856} {"train_loss": -6.104926109313965, "global_step": 77975, "epoch": 1856} {"train_loss": -6.038965225219727, "global_step": 77976, "epoch": 1856} {"train_loss": -6.2846360206604, "global_step": 77977, "epoch": 1856} {"train_loss": -6.180075645446777, "global_step": 77978, "epoch": 1856} {"train_loss": -6.187854766845703, "global_step": 77979, "epoch": 1856} {"train_loss": -6.0436530113220215, "global_step": 77980, "epoch": 1856} {"train_loss": -6.148381233215332, "global_step": 77981, "epoch": 1856} {"train_loss": -6.106171131134033, "global_step": 77982, "epoch": 1856} {"train_loss": -6.125080108642578, "global_step": 77983, "epoch": 1856} {"train_loss": -6.133716583251953, "global_step": 77984, "epoch": 1856} {"train_loss": -6.06369686126709, "global_step": 77985, "epoch": 1856} {"train_loss": -6.132192611694336, "global_step": 77986, "epoch": 1856} {"train_loss": -6.156115531921387, "global_step": 77987, "epoch": 1856} {"train_loss": -6.1435394287109375, "global_step": 77988, "epoch": 1856} {"train_loss": -6.133443832397461, "global_step": 77989, "epoch": 1856} {"train_loss": -5.999940395355225, "global_step": 77990, "epoch": 1856} {"train_loss": -6.087224006652832, "global_step": 77991, "epoch": 1856} {"train_loss": -6.083843231201172, "global_step": 77992, "epoch": 1856} {"train_loss": -6.110563698269072, "global_step": 77993, "epoch": 1856, "val_loss": 75013.0390625} {"train_loss": -5.9815497398376465, "global_step": 77994, "epoch": 1857} {"train_loss": -6.094998836517334, "global_step": 77995, "epoch": 1857} {"train_loss": -6.140071868896484, "global_step": 77996, "epoch": 1857} {"train_loss": -6.09623908996582, "global_step": 77997, "epoch": 1857} {"train_loss": -6.130247116088867, "global_step": 77998, "epoch": 1857} {"train_loss": -6.006814956665039, "global_step": 77999, "epoch": 1857} {"train_loss": -6.1126604080200195, "global_step": 78000, "epoch": 1857} {"train_loss": -6.2084808349609375, "global_step": 78001, "epoch": 1857} {"train_loss": -6.1208014488220215, "global_step": 78002, "epoch": 1857} {"train_loss": -6.1401166915893555, "global_step": 78003, "epoch": 1857} {"train_loss": -6.150899887084961, "global_step": 78004, "epoch": 1857} {"train_loss": -6.228248119354248, "global_step": 78005, "epoch": 1857} {"train_loss": -6.078021049499512, "global_step": 78006, "epoch": 1857} {"train_loss": -6.149563312530518, "global_step": 78007, "epoch": 1857} {"train_loss": -6.006418704986572, "global_step": 78008, "epoch": 1857} {"train_loss": -6.079840660095215, "global_step": 78009, "epoch": 1857} {"train_loss": -6.217633247375488, "global_step": 78010, "epoch": 1857} {"train_loss": -6.077146530151367, "global_step": 78011, "epoch": 1857} {"train_loss": -6.139813423156738, "global_step": 78012, "epoch": 1857} {"train_loss": -6.081098556518555, "global_step": 78013, "epoch": 1857} {"train_loss": -6.15699577331543, "global_step": 78014, "epoch": 1857} {"train_loss": -6.088104248046875, "global_step": 78015, "epoch": 1857} {"train_loss": -6.052523136138916, "global_step": 78016, "epoch": 1857} {"train_loss": -6.140480041503906, "global_step": 78017, "epoch": 1857} {"train_loss": -6.104781627655029, "global_step": 78018, "epoch": 1857} {"train_loss": -6.054961204528809, "global_step": 78019, "epoch": 1857} {"train_loss": -6.006017684936523, "global_step": 78020, "epoch": 1857} {"train_loss": -6.090366363525391, "global_step": 78021, "epoch": 1857} {"train_loss": -6.041333198547363, "global_step": 78022, "epoch": 1857} {"train_loss": -6.081635475158691, "global_step": 78023, "epoch": 1857} {"train_loss": -6.1449737548828125, "global_step": 78024, "epoch": 1857} {"train_loss": -6.084390640258789, "global_step": 78025, "epoch": 1857} {"train_loss": -6.096966743469238, "global_step": 78026, "epoch": 1857} {"train_loss": -6.028412818908691, "global_step": 78027, "epoch": 1857} {"train_loss": -6.076338291168213, "global_step": 78028, "epoch": 1857} {"train_loss": -6.131749153137207, "global_step": 78029, "epoch": 1857} {"train_loss": -6.126041412353516, "global_step": 78030, "epoch": 1857} {"train_loss": -5.979753017425537, "global_step": 78031, "epoch": 1857} {"train_loss": -6.011877059936523, "global_step": 78032, "epoch": 1857} {"train_loss": -5.91715145111084, "global_step": 78033, "epoch": 1857} {"train_loss": -6.006073951721191, "global_step": 78034, "epoch": 1857} {"train_loss": -6.087510994502476, "global_step": 78035, "epoch": 1857, "val_loss": 74725.265625} {"train_loss": -6.166572093963623, "global_step": 78036, "epoch": 1858} {"train_loss": -6.087137222290039, "global_step": 78037, "epoch": 1858} {"train_loss": -6.076234340667725, "global_step": 78038, "epoch": 1858} {"train_loss": -6.201058864593506, "global_step": 78039, "epoch": 1858} {"train_loss": -6.024167060852051, "global_step": 78040, "epoch": 1858} {"train_loss": -6.094986915588379, "global_step": 78041, "epoch": 1858} {"train_loss": -6.198658466339111, "global_step": 78042, "epoch": 1858} {"train_loss": -6.023556232452393, "global_step": 78043, "epoch": 1858} {"train_loss": -6.13483190536499, "global_step": 78044, "epoch": 1858} {"train_loss": -6.101602554321289, "global_step": 78045, "epoch": 1858} {"train_loss": -6.099504470825195, "global_step": 78046, "epoch": 1858} {"train_loss": -6.003651142120361, "global_step": 78047, "epoch": 1858} {"train_loss": -6.032014846801758, "global_step": 78048, "epoch": 1858} {"train_loss": -6.168724536895752, "global_step": 78049, "epoch": 1858} {"train_loss": -5.98213005065918, "global_step": 78050, "epoch": 1858} {"train_loss": -6.061155319213867, "global_step": 78051, "epoch": 1858} {"train_loss": -6.084310531616211, "global_step": 78052, "epoch": 1858} {"train_loss": -6.037546157836914, "global_step": 78053, "epoch": 1858} {"train_loss": -6.145543098449707, "global_step": 78054, "epoch": 1858} {"train_loss": -6.0046162605285645, "global_step": 78055, "epoch": 1858} {"train_loss": -6.051168918609619, "global_step": 78056, "epoch": 1858} {"train_loss": -6.133561134338379, "global_step": 78057, "epoch": 1858} {"train_loss": -6.103042125701904, "global_step": 78058, "epoch": 1858} {"train_loss": -6.046067237854004, "global_step": 78059, "epoch": 1858} {"train_loss": -6.158698081970215, "global_step": 78060, "epoch": 1858} {"train_loss": -5.9471516609191895, "global_step": 78061, "epoch": 1858} {"train_loss": -6.157500267028809, "global_step": 78062, "epoch": 1858} {"train_loss": -6.13104248046875, "global_step": 78063, "epoch": 1858} {"train_loss": -6.127772331237793, "global_step": 78064, "epoch": 1858} {"train_loss": -6.035007476806641, "global_step": 78065, "epoch": 1858} {"train_loss": -6.188692092895508, "global_step": 78066, "epoch": 1858} {"train_loss": -5.913808822631836, "global_step": 78067, "epoch": 1858} {"train_loss": -6.101546287536621, "global_step": 78068, "epoch": 1858} {"train_loss": -6.163087368011475, "global_step": 78069, "epoch": 1858} {"train_loss": -6.035741329193115, "global_step": 78070, "epoch": 1858} {"train_loss": -6.153810977935791, "global_step": 78071, "epoch": 1858} {"train_loss": -6.1049909591674805, "global_step": 78072, "epoch": 1858} {"train_loss": -6.173117637634277, "global_step": 78073, "epoch": 1858} {"train_loss": -6.215604782104492, "global_step": 78074, "epoch": 1858} {"train_loss": -6.246849060058594, "global_step": 78075, "epoch": 1858} {"train_loss": -6.091108798980713, "global_step": 78076, "epoch": 1858} {"train_loss": -6.100273858933222, "global_step": 78077, "epoch": 1858, "val_loss": 74931.078125} {"train_loss": -5.986124038696289, "global_step": 78078, "epoch": 1859} {"train_loss": -6.159958362579346, "global_step": 78079, "epoch": 1859} {"train_loss": -6.057724952697754, "global_step": 78080, "epoch": 1859} {"train_loss": -6.163508415222168, "global_step": 78081, "epoch": 1859} {"train_loss": -6.083654403686523, "global_step": 78082, "epoch": 1859} {"train_loss": -6.0178327560424805, "global_step": 78083, "epoch": 1859} {"train_loss": -6.064882278442383, "global_step": 78084, "epoch": 1859} {"train_loss": -6.121841907501221, "global_step": 78085, "epoch": 1859} {"train_loss": -6.214582443237305, "global_step": 78086, "epoch": 1859} {"train_loss": -6.280742168426514, "global_step": 78087, "epoch": 1859} {"train_loss": -6.098990440368652, "global_step": 78088, "epoch": 1859} {"train_loss": -6.230247497558594, "global_step": 78089, "epoch": 1859} {"train_loss": -6.155302047729492, "global_step": 78090, "epoch": 1859} {"train_loss": -6.026366710662842, "global_step": 78091, "epoch": 1859} {"train_loss": -6.220096588134766, "global_step": 78092, "epoch": 1859} {"train_loss": -6.175266265869141, "global_step": 78093, "epoch": 1859} {"train_loss": -6.144521713256836, "global_step": 78094, "epoch": 1859} {"train_loss": -6.053644180297852, "global_step": 78095, "epoch": 1859} {"train_loss": -6.044252395629883, "global_step": 78096, "epoch": 1859} {"train_loss": -6.185832977294922, "global_step": 78097, "epoch": 1859} {"train_loss": -6.123879432678223, "global_step": 78098, "epoch": 1859} {"train_loss": -5.995509147644043, "global_step": 78099, "epoch": 1859} {"train_loss": -6.179908275604248, "global_step": 78100, "epoch": 1859} {"train_loss": -6.1320881843566895, "global_step": 78101, "epoch": 1859} {"train_loss": -6.024366855621338, "global_step": 78102, "epoch": 1859} {"train_loss": -6.265083312988281, "global_step": 78103, "epoch": 1859} {"train_loss": -6.0904951095581055, "global_step": 78104, "epoch": 1859} {"train_loss": -6.007061004638672, "global_step": 78105, "epoch": 1859} {"train_loss": -6.077632904052734, "global_step": 78106, "epoch": 1859} {"train_loss": -5.929898262023926, "global_step": 78107, "epoch": 1859} {"train_loss": -6.116372108459473, "global_step": 78108, "epoch": 1859} {"train_loss": -6.156317710876465, "global_step": 78109, "epoch": 1859} {"train_loss": -6.093459129333496, "global_step": 78110, "epoch": 1859} {"train_loss": -6.122411727905273, "global_step": 78111, "epoch": 1859} {"train_loss": -6.134548187255859, "global_step": 78112, "epoch": 1859} {"train_loss": -6.213284492492676, "global_step": 78113, "epoch": 1859} {"train_loss": -5.996696472167969, "global_step": 78114, "epoch": 1859} {"train_loss": -6.155918598175049, "global_step": 78115, "epoch": 1859} {"train_loss": -6.114323139190674, "global_step": 78116, "epoch": 1859} {"train_loss": -6.033059120178223, "global_step": 78117, "epoch": 1859} {"train_loss": -6.1429924964904785, "global_step": 78118, "epoch": 1859} {"train_loss": -6.110838572184245, "global_step": 78119, "epoch": 1859, "val_loss": 74668.0859375} {"train_loss": -6.072532653808594, "global_step": 78120, "epoch": 1860} {"train_loss": -6.052870750427246, "global_step": 78121, "epoch": 1860} {"train_loss": -6.13763427734375, "global_step": 78122, "epoch": 1860} {"train_loss": -6.15766716003418, "global_step": 78123, "epoch": 1860} {"train_loss": -6.205206871032715, "global_step": 78124, "epoch": 1860} {"train_loss": -6.136314392089844, "global_step": 78125, "epoch": 1860} {"train_loss": -6.106467247009277, "global_step": 78126, "epoch": 1860} {"train_loss": -6.156558036804199, "global_step": 78127, "epoch": 1860} {"train_loss": -6.146197319030762, "global_step": 78128, "epoch": 1860} {"train_loss": -6.1217145919799805, "global_step": 78129, "epoch": 1860} {"train_loss": -6.135865211486816, "global_step": 78130, "epoch": 1860} {"train_loss": -6.044666290283203, "global_step": 78131, "epoch": 1860} {"train_loss": -6.106382369995117, "global_step": 78132, "epoch": 1860} {"train_loss": -6.091573715209961, "global_step": 78133, "epoch": 1860} {"train_loss": -6.013659477233887, "global_step": 78134, "epoch": 1860} {"train_loss": -6.128951549530029, "global_step": 78135, "epoch": 1860} {"train_loss": -6.018945693969727, "global_step": 78136, "epoch": 1860} {"train_loss": -6.113688945770264, "global_step": 78137, "epoch": 1860} {"train_loss": -6.009252548217773, "global_step": 78138, "epoch": 1860} {"train_loss": -6.111751556396484, "global_step": 78139, "epoch": 1860} {"train_loss": -6.096994400024414, "global_step": 78140, "epoch": 1860} {"train_loss": -6.110344886779785, "global_step": 78141, "epoch": 1860} {"train_loss": -6.0999274253845215, "global_step": 78142, "epoch": 1860} {"train_loss": -6.080912113189697, "global_step": 78143, "epoch": 1860} {"train_loss": -6.042698860168457, "global_step": 78144, "epoch": 1860} {"train_loss": -6.098571300506592, "global_step": 78145, "epoch": 1860} {"train_loss": -6.175968170166016, "global_step": 78146, "epoch": 1860} {"train_loss": -6.06282901763916, "global_step": 78147, "epoch": 1860} {"train_loss": -6.121540546417236, "global_step": 78148, "epoch": 1860} {"train_loss": -6.214876174926758, "global_step": 78149, "epoch": 1860} {"train_loss": -6.175136566162109, "global_step": 78150, "epoch": 1860} {"train_loss": -6.049746513366699, "global_step": 78151, "epoch": 1860} {"train_loss": -6.065422534942627, "global_step": 78152, "epoch": 1860} {"train_loss": -6.070956230163574, "global_step": 78153, "epoch": 1860} {"train_loss": -6.189857006072998, "global_step": 78154, "epoch": 1860} {"train_loss": -6.144378662109375, "global_step": 78155, "epoch": 1860} {"train_loss": -6.009152412414551, "global_step": 78156, "epoch": 1860} {"train_loss": -6.169639587402344, "global_step": 78157, "epoch": 1860} {"train_loss": -6.0241498947143555, "global_step": 78158, "epoch": 1860} {"train_loss": -6.121929168701172, "global_step": 78159, "epoch": 1860} {"train_loss": -6.024130821228027, "global_step": 78160, "epoch": 1860} {"train_loss": -6.103277138301304, "global_step": 78161, "epoch": 1860, "val_loss": 75031.4453125} {"train_loss": -6.105565071105957, "global_step": 78162, "epoch": 1861} {"train_loss": -5.978396415710449, "global_step": 78163, "epoch": 1861} {"train_loss": -6.088847637176514, "global_step": 78164, "epoch": 1861} {"train_loss": -6.109335899353027, "global_step": 78165, "epoch": 1861} {"train_loss": -6.01426887512207, "global_step": 78166, "epoch": 1861} {"train_loss": -6.095343589782715, "global_step": 78167, "epoch": 1861} {"train_loss": -6.092917442321777, "global_step": 78168, "epoch": 1861} {"train_loss": -6.120818614959717, "global_step": 78169, "epoch": 1861} {"train_loss": -6.1188812255859375, "global_step": 78170, "epoch": 1861} {"train_loss": -6.0978288650512695, "global_step": 78171, "epoch": 1861} {"train_loss": -6.257548809051514, "global_step": 78172, "epoch": 1861} {"train_loss": -6.215752124786377, "global_step": 78173, "epoch": 1861} {"train_loss": -6.043240547180176, "global_step": 78174, "epoch": 1861} {"train_loss": -6.061931610107422, "global_step": 78175, "epoch": 1861} {"train_loss": -6.153489112854004, "global_step": 78176, "epoch": 1861} {"train_loss": -6.113096237182617, "global_step": 78177, "epoch": 1861} {"train_loss": -6.23291015625, "global_step": 78178, "epoch": 1861} {"train_loss": -6.108332633972168, "global_step": 78179, "epoch": 1861} {"train_loss": -6.048388957977295, "global_step": 78180, "epoch": 1861} {"train_loss": -6.040544509887695, "global_step": 78181, "epoch": 1861} {"train_loss": -6.043977737426758, "global_step": 78182, "epoch": 1861} {"train_loss": -6.159682273864746, "global_step": 78183, "epoch": 1861} {"train_loss": -6.146651744842529, "global_step": 78184, "epoch": 1861} {"train_loss": -6.012679576873779, "global_step": 78185, "epoch": 1861} {"train_loss": -5.92308235168457, "global_step": 78186, "epoch": 1861} {"train_loss": -5.969173431396484, "global_step": 78187, "epoch": 1861} {"train_loss": -6.024265289306641, "global_step": 78188, "epoch": 1861} {"train_loss": -5.912911415100098, "global_step": 78189, "epoch": 1861} {"train_loss": -6.100414276123047, "global_step": 78190, "epoch": 1861} {"train_loss": -5.978393077850342, "global_step": 78191, "epoch": 1861} {"train_loss": -6.0528435707092285, "global_step": 78192, "epoch": 1861} {"train_loss": -5.854305267333984, "global_step": 78193, "epoch": 1861} {"train_loss": -6.092248439788818, "global_step": 78194, "epoch": 1861} {"train_loss": -5.967655181884766, "global_step": 78195, "epoch": 1861} {"train_loss": -6.081730842590332, "global_step": 78196, "epoch": 1861} {"train_loss": -5.95914888381958, "global_step": 78197, "epoch": 1861} {"train_loss": -6.0825958251953125, "global_step": 78198, "epoch": 1861} {"train_loss": -6.066055774688721, "global_step": 78199, "epoch": 1861} {"train_loss": -6.0118818283081055, "global_step": 78200, "epoch": 1861} {"train_loss": -6.07657527923584, "global_step": 78201, "epoch": 1861} {"train_loss": -6.0235419273376465, "global_step": 78202, "epoch": 1861} {"train_loss": -6.064343963350568, "global_step": 78203, "epoch": 1861, "val_loss": 74933.7109375} {"train_loss": -6.025433540344238, "global_step": 78204, "epoch": 1862} {"train_loss": -5.999227046966553, "global_step": 78205, "epoch": 1862} {"train_loss": -5.980833053588867, "global_step": 78206, "epoch": 1862} {"train_loss": -6.089473724365234, "global_step": 78207, "epoch": 1862} {"train_loss": -6.092083930969238, "global_step": 78208, "epoch": 1862} {"train_loss": -5.9993462562561035, "global_step": 78209, "epoch": 1862} {"train_loss": -6.027741432189941, "global_step": 78210, "epoch": 1862} {"train_loss": -6.171767234802246, "global_step": 78211, "epoch": 1862} {"train_loss": -6.143623352050781, "global_step": 78212, "epoch": 1862} {"train_loss": -5.999151706695557, "global_step": 78213, "epoch": 1862} {"train_loss": -6.055474281311035, "global_step": 78214, "epoch": 1862} {"train_loss": -5.990644454956055, "global_step": 78215, "epoch": 1862} {"train_loss": -6.035216808319092, "global_step": 78216, "epoch": 1862} {"train_loss": -6.023787021636963, "global_step": 78217, "epoch": 1862} {"train_loss": -5.956104278564453, "global_step": 78218, "epoch": 1862} {"train_loss": -5.988691329956055, "global_step": 78219, "epoch": 1862} {"train_loss": -6.065487861633301, "global_step": 78220, "epoch": 1862} {"train_loss": -6.042861461639404, "global_step": 78221, "epoch": 1862} {"train_loss": -5.916146278381348, "global_step": 78222, "epoch": 1862} {"train_loss": -6.058178901672363, "global_step": 78223, "epoch": 1862} {"train_loss": -5.959079742431641, "global_step": 78224, "epoch": 1862} {"train_loss": -6.1073455810546875, "global_step": 78225, "epoch": 1862} {"train_loss": -6.056585788726807, "global_step": 78226, "epoch": 1862} {"train_loss": -6.093767166137695, "global_step": 78227, "epoch": 1862} {"train_loss": -5.958346366882324, "global_step": 78228, "epoch": 1862} {"train_loss": -6.00991678237915, "global_step": 78229, "epoch": 1862} {"train_loss": -5.889633655548096, "global_step": 78230, "epoch": 1862} {"train_loss": -5.951428413391113, "global_step": 78231, "epoch": 1862} {"train_loss": -5.941032409667969, "global_step": 78232, "epoch": 1862} {"train_loss": -6.086285591125488, "global_step": 78233, "epoch": 1862} {"train_loss": -6.114997386932373, "global_step": 78234, "epoch": 1862} {"train_loss": -6.108046531677246, "global_step": 78235, "epoch": 1862} {"train_loss": -6.184143543243408, "global_step": 78236, "epoch": 1862} {"train_loss": -5.916615962982178, "global_step": 78237, "epoch": 1862} {"train_loss": -6.038928031921387, "global_step": 78238, "epoch": 1862} {"train_loss": -6.011320114135742, "global_step": 78239, "epoch": 1862} {"train_loss": -6.121364116668701, "global_step": 78240, "epoch": 1862} {"train_loss": -6.137938499450684, "global_step": 78241, "epoch": 1862} {"train_loss": -6.086601257324219, "global_step": 78242, "epoch": 1862} {"train_loss": -6.048725128173828, "global_step": 78243, "epoch": 1862} {"train_loss": -6.084284782409668, "global_step": 78244, "epoch": 1862} {"train_loss": -6.03978233110337, "global_step": 78245, "epoch": 1862, "val_loss": 75157.0546875} {"train_loss": -6.0508012771606445, "global_step": 78246, "epoch": 1863} {"train_loss": -6.195694923400879, "global_step": 78247, "epoch": 1863} {"train_loss": -5.963719844818115, "global_step": 78248, "epoch": 1863} {"train_loss": -6.133365154266357, "global_step": 78249, "epoch": 1863} {"train_loss": -6.111926555633545, "global_step": 78250, "epoch": 1863} {"train_loss": -6.043632507324219, "global_step": 78251, "epoch": 1863} {"train_loss": -6.017586708068848, "global_step": 78252, "epoch": 1863} {"train_loss": -5.942935943603516, "global_step": 78253, "epoch": 1863} {"train_loss": -6.0599260330200195, "global_step": 78254, "epoch": 1863} {"train_loss": -6.167350769042969, "global_step": 78255, "epoch": 1863} {"train_loss": -6.205624580383301, "global_step": 78256, "epoch": 1863} {"train_loss": -6.11769962310791, "global_step": 78257, "epoch": 1863} {"train_loss": -6.047486782073975, "global_step": 78258, "epoch": 1863} {"train_loss": -5.987569808959961, "global_step": 78259, "epoch": 1863} {"train_loss": -6.039133071899414, "global_step": 78260, "epoch": 1863} {"train_loss": -6.103209495544434, "global_step": 78261, "epoch": 1863} {"train_loss": -6.072649002075195, "global_step": 78262, "epoch": 1863} {"train_loss": -6.208039283752441, "global_step": 78263, "epoch": 1863} {"train_loss": -6.109972953796387, "global_step": 78264, "epoch": 1863} {"train_loss": -6.103211402893066, "global_step": 78265, "epoch": 1863} {"train_loss": -6.103686332702637, "global_step": 78266, "epoch": 1863} {"train_loss": -6.026541233062744, "global_step": 78267, "epoch": 1863} {"train_loss": -6.0457587242126465, "global_step": 78268, "epoch": 1863} {"train_loss": -6.142990589141846, "global_step": 78269, "epoch": 1863} {"train_loss": -6.08762788772583, "global_step": 78270, "epoch": 1863} {"train_loss": -5.964422702789307, "global_step": 78271, "epoch": 1863} {"train_loss": -6.101382255554199, "global_step": 78272, "epoch": 1863} {"train_loss": -6.135648727416992, "global_step": 78273, "epoch": 1863} {"train_loss": -6.10308837890625, "global_step": 78274, "epoch": 1863} {"train_loss": -6.153380393981934, "global_step": 78275, "epoch": 1863} {"train_loss": -6.117652893066406, "global_step": 78276, "epoch": 1863} {"train_loss": -6.151985168457031, "global_step": 78277, "epoch": 1863} {"train_loss": -6.127397537231445, "global_step": 78278, "epoch": 1863} {"train_loss": -5.990225791931152, "global_step": 78279, "epoch": 1863} {"train_loss": -6.046879768371582, "global_step": 78280, "epoch": 1863} {"train_loss": -6.035719871520996, "global_step": 78281, "epoch": 1863} {"train_loss": -5.956615447998047, "global_step": 78282, "epoch": 1863} {"train_loss": -6.149423599243164, "global_step": 78283, "epoch": 1863} {"train_loss": -6.2184953689575195, "global_step": 78284, "epoch": 1863} {"train_loss": -6.146847724914551, "global_step": 78285, "epoch": 1863} {"train_loss": -5.973566055297852, "global_step": 78286, "epoch": 1863} {"train_loss": -6.087642170134044, "global_step": 78287, "epoch": 1863, "val_loss": 75362.015625} {"train_loss": -5.840268135070801, "global_step": 78288, "epoch": 1864} {"train_loss": -6.054193496704102, "global_step": 78289, "epoch": 1864} {"train_loss": -6.08742618560791, "global_step": 78290, "epoch": 1864} {"train_loss": -6.0244855880737305, "global_step": 78291, "epoch": 1864} {"train_loss": -6.031832695007324, "global_step": 78292, "epoch": 1864} {"train_loss": -6.029354095458984, "global_step": 78293, "epoch": 1864} {"train_loss": -6.0897908210754395, "global_step": 78294, "epoch": 1864} {"train_loss": -6.098611831665039, "global_step": 78295, "epoch": 1864} {"train_loss": -6.158177852630615, "global_step": 78296, "epoch": 1864} {"train_loss": -6.1714372634887695, "global_step": 78297, "epoch": 1864} {"train_loss": -6.038534164428711, "global_step": 78298, "epoch": 1864} {"train_loss": -6.095556259155273, "global_step": 78299, "epoch": 1864} {"train_loss": -6.091694355010986, "global_step": 78300, "epoch": 1864} {"train_loss": -6.13535213470459, "global_step": 78301, "epoch": 1864} {"train_loss": -6.089199066162109, "global_step": 78302, "epoch": 1864} {"train_loss": -6.065210342407227, "global_step": 78303, "epoch": 1864} {"train_loss": -6.02182674407959, "global_step": 78304, "epoch": 1864} {"train_loss": -6.095273494720459, "global_step": 78305, "epoch": 1864} {"train_loss": -6.108279228210449, "global_step": 78306, "epoch": 1864} {"train_loss": -6.074193000793457, "global_step": 78307, "epoch": 1864} {"train_loss": -6.152910232543945, "global_step": 78308, "epoch": 1864} {"train_loss": -6.0711283683776855, "global_step": 78309, "epoch": 1864} {"train_loss": -6.154289245605469, "global_step": 78310, "epoch": 1864} {"train_loss": -6.021700382232666, "global_step": 78311, "epoch": 1864} {"train_loss": -6.132603645324707, "global_step": 78312, "epoch": 1864} {"train_loss": -6.125222206115723, "global_step": 78313, "epoch": 1864} {"train_loss": -6.08467960357666, "global_step": 78314, "epoch": 1864} {"train_loss": -6.125832557678223, "global_step": 78315, "epoch": 1864} {"train_loss": -6.053932189941406, "global_step": 78316, "epoch": 1864} {"train_loss": -6.071532249450684, "global_step": 78317, "epoch": 1864} {"train_loss": -6.111016273498535, "global_step": 78318, "epoch": 1864} {"train_loss": -6.109576225280762, "global_step": 78319, "epoch": 1864} {"train_loss": -6.135929584503174, "global_step": 78320, "epoch": 1864} {"train_loss": -6.19509220123291, "global_step": 78321, "epoch": 1864} {"train_loss": -6.118244647979736, "global_step": 78322, "epoch": 1864} {"train_loss": -6.260932922363281, "global_step": 78323, "epoch": 1864} {"train_loss": -6.184111595153809, "global_step": 78324, "epoch": 1864} {"train_loss": -6.1534013748168945, "global_step": 78325, "epoch": 1864} {"train_loss": -6.096997261047363, "global_step": 78326, "epoch": 1864} {"train_loss": -6.142969131469727, "global_step": 78327, "epoch": 1864} {"train_loss": -6.179476261138916, "global_step": 78328, "epoch": 1864} {"train_loss": -6.098615635009039, "global_step": 78329, "epoch": 1864, "val_loss": 74818.1484375} {"train_loss": -6.149982452392578, "global_step": 78330, "epoch": 1865} {"train_loss": -6.122424602508545, "global_step": 78331, "epoch": 1865} {"train_loss": -6.171627044677734, "global_step": 78332, "epoch": 1865} {"train_loss": -6.0707807540893555, "global_step": 78333, "epoch": 1865} {"train_loss": -6.161258220672607, "global_step": 78334, "epoch": 1865} {"train_loss": -6.064598083496094, "global_step": 78335, "epoch": 1865} {"train_loss": -5.985696792602539, "global_step": 78336, "epoch": 1865} {"train_loss": -6.197943687438965, "global_step": 78337, "epoch": 1865} {"train_loss": -6.142061710357666, "global_step": 78338, "epoch": 1865} {"train_loss": -6.125730514526367, "global_step": 78339, "epoch": 1865} {"train_loss": -6.195827484130859, "global_step": 78340, "epoch": 1865} {"train_loss": -6.222695827484131, "global_step": 78341, "epoch": 1865} {"train_loss": -6.16551399230957, "global_step": 78342, "epoch": 1865} {"train_loss": -6.0584306716918945, "global_step": 78343, "epoch": 1865} {"train_loss": -6.149303436279297, "global_step": 78344, "epoch": 1865} {"train_loss": -6.197182655334473, "global_step": 78345, "epoch": 1865} {"train_loss": -6.152822971343994, "global_step": 78346, "epoch": 1865} {"train_loss": -6.134357452392578, "global_step": 78347, "epoch": 1865} {"train_loss": -6.121642112731934, "global_step": 78348, "epoch": 1865} {"train_loss": -6.093080520629883, "global_step": 78349, "epoch": 1865} {"train_loss": -6.058854579925537, "global_step": 78350, "epoch": 1865} {"train_loss": -6.217170715332031, "global_step": 78351, "epoch": 1865} {"train_loss": -6.091728210449219, "global_step": 78352, "epoch": 1865} {"train_loss": -6.144370079040527, "global_step": 78353, "epoch": 1865} {"train_loss": -6.085519313812256, "global_step": 78354, "epoch": 1865} {"train_loss": -6.210792064666748, "global_step": 78355, "epoch": 1865} {"train_loss": -6.12652587890625, "global_step": 78356, "epoch": 1865} {"train_loss": -6.063179969787598, "global_step": 78357, "epoch": 1865} {"train_loss": -6.143878936767578, "global_step": 78358, "epoch": 1865} {"train_loss": -6.187829494476318, "global_step": 78359, "epoch": 1865} {"train_loss": -6.233508110046387, "global_step": 78360, "epoch": 1865} {"train_loss": -6.11317253112793, "global_step": 78361, "epoch": 1865} {"train_loss": -6.183233737945557, "global_step": 78362, "epoch": 1865} {"train_loss": -6.11646842956543, "global_step": 78363, "epoch": 1865} {"train_loss": -6.031468868255615, "global_step": 78364, "epoch": 1865} {"train_loss": -6.04647159576416, "global_step": 78365, "epoch": 1865} {"train_loss": -6.12483549118042, "global_step": 78366, "epoch": 1865} {"train_loss": -6.034175872802734, "global_step": 78367, "epoch": 1865} {"train_loss": -6.108935832977295, "global_step": 78368, "epoch": 1865} {"train_loss": -6.144690036773682, "global_step": 78369, "epoch": 1865} {"train_loss": -6.116472244262695, "global_step": 78370, "epoch": 1865} {"train_loss": -6.128274429412115, "global_step": 78371, "epoch": 1865, "val_loss": 75252.6640625} {"train_loss": -6.046994209289551, "global_step": 78372, "epoch": 1866} {"train_loss": -6.044627666473389, "global_step": 78373, "epoch": 1866} {"train_loss": -6.072862148284912, "global_step": 78374, "epoch": 1866} {"train_loss": -5.992464065551758, "global_step": 78375, "epoch": 1866} {"train_loss": -6.06955623626709, "global_step": 78376, "epoch": 1866} {"train_loss": -6.101877689361572, "global_step": 78377, "epoch": 1866} {"train_loss": -6.050443649291992, "global_step": 78378, "epoch": 1866} {"train_loss": -6.069129467010498, "global_step": 78379, "epoch": 1866} {"train_loss": -6.197720527648926, "global_step": 78380, "epoch": 1866} {"train_loss": -6.168892860412598, "global_step": 78381, "epoch": 1866} {"train_loss": -6.180272102355957, "global_step": 78382, "epoch": 1866} {"train_loss": -6.2336106300354, "global_step": 78383, "epoch": 1866} {"train_loss": -6.24819278717041, "global_step": 78384, "epoch": 1866} {"train_loss": -6.202930450439453, "global_step": 78385, "epoch": 1866} {"train_loss": -6.211572647094727, "global_step": 78386, "epoch": 1866} {"train_loss": -6.247637748718262, "global_step": 78387, "epoch": 1866} {"train_loss": -6.235381126403809, "global_step": 78388, "epoch": 1866} {"train_loss": -6.1915812492370605, "global_step": 78389, "epoch": 1866} {"train_loss": -6.080711364746094, "global_step": 78390, "epoch": 1866} {"train_loss": -6.2265706062316895, "global_step": 78391, "epoch": 1866} {"train_loss": -6.1572041511535645, "global_step": 78392, "epoch": 1866} {"train_loss": -6.078312397003174, "global_step": 78393, "epoch": 1866} {"train_loss": -6.180459976196289, "global_step": 78394, "epoch": 1866} {"train_loss": -6.186712265014648, "global_step": 78395, "epoch": 1866} {"train_loss": -6.135038375854492, "global_step": 78396, "epoch": 1866} {"train_loss": -6.191695690155029, "global_step": 78397, "epoch": 1866} {"train_loss": -6.181412220001221, "global_step": 78398, "epoch": 1866} {"train_loss": -6.100805282592773, "global_step": 78399, "epoch": 1866} {"train_loss": -6.097881317138672, "global_step": 78400, "epoch": 1866} {"train_loss": -5.955408573150635, "global_step": 78401, "epoch": 1866} {"train_loss": -6.011186599731445, "global_step": 78402, "epoch": 1866} {"train_loss": -6.0338029861450195, "global_step": 78403, "epoch": 1866} {"train_loss": -6.019504070281982, "global_step": 78404, "epoch": 1866} {"train_loss": -6.102010726928711, "global_step": 78405, "epoch": 1866} {"train_loss": -6.1053056716918945, "global_step": 78406, "epoch": 1866} {"train_loss": -6.043715476989746, "global_step": 78407, "epoch": 1866} {"train_loss": -6.088197231292725, "global_step": 78408, "epoch": 1866} {"train_loss": -5.990170478820801, "global_step": 78409, "epoch": 1866} {"train_loss": -6.102993011474609, "global_step": 78410, "epoch": 1866} {"train_loss": -6.167636871337891, "global_step": 78411, "epoch": 1866} {"train_loss": -6.016510963439941, "global_step": 78412, "epoch": 1866} {"train_loss": -6.115392139979771, "global_step": 78413, "epoch": 1866, "val_loss": 74867.7578125} {"train_loss": -6.122447967529297, "global_step": 78414, "epoch": 1867} {"train_loss": -6.038503646850586, "global_step": 78415, "epoch": 1867} {"train_loss": -6.099493980407715, "global_step": 78416, "epoch": 1867} {"train_loss": -6.140673637390137, "global_step": 78417, "epoch": 1867} {"train_loss": -6.144421577453613, "global_step": 78418, "epoch": 1867} {"train_loss": -6.201934337615967, "global_step": 78419, "epoch": 1867} {"train_loss": -6.173640251159668, "global_step": 78420, "epoch": 1867} {"train_loss": -6.121466636657715, "global_step": 78421, "epoch": 1867} {"train_loss": -6.152897834777832, "global_step": 78422, "epoch": 1867} {"train_loss": -6.080883979797363, "global_step": 78423, "epoch": 1867} {"train_loss": -6.182533264160156, "global_step": 78424, "epoch": 1867} {"train_loss": -6.1601762771606445, "global_step": 78425, "epoch": 1867} {"train_loss": -6.051933288574219, "global_step": 78426, "epoch": 1867} {"train_loss": -6.266345024108887, "global_step": 78427, "epoch": 1867} {"train_loss": -6.073349952697754, "global_step": 78428, "epoch": 1867} {"train_loss": -6.085394382476807, "global_step": 78429, "epoch": 1867} {"train_loss": -6.21431827545166, "global_step": 78430, "epoch": 1867} {"train_loss": -6.242262840270996, "global_step": 78431, "epoch": 1867} {"train_loss": -6.1284685134887695, "global_step": 78432, "epoch": 1867} {"train_loss": -6.116026878356934, "global_step": 78433, "epoch": 1867} {"train_loss": -6.075949192047119, "global_step": 78434, "epoch": 1867} {"train_loss": -6.142728805541992, "global_step": 78435, "epoch": 1867} {"train_loss": -6.116586685180664, "global_step": 78436, "epoch": 1867} {"train_loss": -6.280905723571777, "global_step": 78437, "epoch": 1867} {"train_loss": -6.157298564910889, "global_step": 78438, "epoch": 1867} {"train_loss": -6.11475944519043, "global_step": 78439, "epoch": 1867} {"train_loss": -6.106143951416016, "global_step": 78440, "epoch": 1867} {"train_loss": -5.880552768707275, "global_step": 78441, "epoch": 1867} {"train_loss": -6.080024719238281, "global_step": 78442, "epoch": 1867} {"train_loss": -5.999406814575195, "global_step": 78443, "epoch": 1867} {"train_loss": -6.1354875564575195, "global_step": 78444, "epoch": 1867} {"train_loss": -6.154587268829346, "global_step": 78445, "epoch": 1867} {"train_loss": -6.173388481140137, "global_step": 78446, "epoch": 1867} {"train_loss": -6.137083053588867, "global_step": 78447, "epoch": 1867} {"train_loss": -6.081024169921875, "global_step": 78448, "epoch": 1867} {"train_loss": -6.009646415710449, "global_step": 78449, "epoch": 1867} {"train_loss": -6.089424133300781, "global_step": 78450, "epoch": 1867} {"train_loss": -6.1671142578125, "global_step": 78451, "epoch": 1867} {"train_loss": -6.089600563049316, "global_step": 78452, "epoch": 1867} {"train_loss": -6.171969413757324, "global_step": 78453, "epoch": 1867} {"train_loss": -6.095771789550781, "global_step": 78454, "epoch": 1867} {"train_loss": -6.118988014402843, "global_step": 78455, "epoch": 1867, "val_loss": 75002.109375} {"train_loss": -6.125649452209473, "global_step": 78456, "epoch": 1868} {"train_loss": -5.981119632720947, "global_step": 78457, "epoch": 1868} {"train_loss": -6.025580406188965, "global_step": 78458, "epoch": 1868} {"train_loss": -6.1474432945251465, "global_step": 78459, "epoch": 1868} {"train_loss": -6.084339141845703, "global_step": 78460, "epoch": 1868} {"train_loss": -6.190608501434326, "global_step": 78461, "epoch": 1868} {"train_loss": -6.051514148712158, "global_step": 78462, "epoch": 1868} {"train_loss": -6.139939785003662, "global_step": 78463, "epoch": 1868} {"train_loss": -6.218147277832031, "global_step": 78464, "epoch": 1868} {"train_loss": -6.1239776611328125, "global_step": 78465, "epoch": 1868} {"train_loss": -6.065667152404785, "global_step": 78466, "epoch": 1868} {"train_loss": -5.944196701049805, "global_step": 78467, "epoch": 1868} {"train_loss": -6.061232566833496, "global_step": 78468, "epoch": 1868} {"train_loss": -6.201339244842529, "global_step": 78469, "epoch": 1868} {"train_loss": -6.029140949249268, "global_step": 78470, "epoch": 1868} {"train_loss": -6.0947675704956055, "global_step": 78471, "epoch": 1868} {"train_loss": -6.131144046783447, "global_step": 78472, "epoch": 1868} {"train_loss": -5.9941205978393555, "global_step": 78473, "epoch": 1868} {"train_loss": -6.091294288635254, "global_step": 78474, "epoch": 1868} {"train_loss": -6.205549716949463, "global_step": 78475, "epoch": 1868} {"train_loss": -6.051713466644287, "global_step": 78476, "epoch": 1868} {"train_loss": -6.088663101196289, "global_step": 78477, "epoch": 1868} {"train_loss": -6.184442043304443, "global_step": 78478, "epoch": 1868} {"train_loss": -6.12734842300415, "global_step": 78479, "epoch": 1868} {"train_loss": -6.049334526062012, "global_step": 78480, "epoch": 1868} {"train_loss": -6.052761077880859, "global_step": 78481, "epoch": 1868} {"train_loss": -6.1985626220703125, "global_step": 78482, "epoch": 1868} {"train_loss": -6.138821601867676, "global_step": 78483, "epoch": 1868} {"train_loss": -6.007378578186035, "global_step": 78484, "epoch": 1868} {"train_loss": -6.162405967712402, "global_step": 78485, "epoch": 1868} {"train_loss": -6.134160041809082, "global_step": 78486, "epoch": 1868} {"train_loss": -6.181124687194824, "global_step": 78487, "epoch": 1868} {"train_loss": -6.255607604980469, "global_step": 78488, "epoch": 1868} {"train_loss": -6.161827564239502, "global_step": 78489, "epoch": 1868} {"train_loss": -6.119931697845459, "global_step": 78490, "epoch": 1868} {"train_loss": -5.926244735717773, "global_step": 78491, "epoch": 1868} {"train_loss": -6.144383430480957, "global_step": 78492, "epoch": 1868} {"train_loss": -6.117974758148193, "global_step": 78493, "epoch": 1868} {"train_loss": -6.151124954223633, "global_step": 78494, "epoch": 1868} {"train_loss": -6.134554862976074, "global_step": 78495, "epoch": 1868} {"train_loss": -6.145827293395996, "global_step": 78496, "epoch": 1868} {"train_loss": -6.107649496623448, "global_step": 78497, "epoch": 1868, "val_loss": 74993.1796875} {"train_loss": -6.212353706359863, "global_step": 78498, "epoch": 1869} {"train_loss": -6.0434675216674805, "global_step": 78499, "epoch": 1869} {"train_loss": -6.047821998596191, "global_step": 78500, "epoch": 1869} {"train_loss": -6.009035110473633, "global_step": 78501, "epoch": 1869} {"train_loss": -6.1548380851745605, "global_step": 78502, "epoch": 1869} {"train_loss": -6.172277450561523, "global_step": 78503, "epoch": 1869} {"train_loss": -6.07401704788208, "global_step": 78504, "epoch": 1869} {"train_loss": -6.136029243469238, "global_step": 78505, "epoch": 1869} {"train_loss": -6.133693695068359, "global_step": 78506, "epoch": 1869} {"train_loss": -6.1365861892700195, "global_step": 78507, "epoch": 1869} {"train_loss": -6.21239709854126, "global_step": 78508, "epoch": 1869} {"train_loss": -6.1728644371032715, "global_step": 78509, "epoch": 1869} {"train_loss": -6.088086128234863, "global_step": 78510, "epoch": 1869} {"train_loss": -6.153125286102295, "global_step": 78511, "epoch": 1869} {"train_loss": -6.17728328704834, "global_step": 78512, "epoch": 1869} {"train_loss": -6.10474157333374, "global_step": 78513, "epoch": 1869} {"train_loss": -6.136453628540039, "global_step": 78514, "epoch": 1869} {"train_loss": -6.196037292480469, "global_step": 78515, "epoch": 1869} {"train_loss": -5.999006271362305, "global_step": 78516, "epoch": 1869} {"train_loss": -6.011103630065918, "global_step": 78517, "epoch": 1869} {"train_loss": -6.18812370300293, "global_step": 78518, "epoch": 1869} {"train_loss": -6.139280319213867, "global_step": 78519, "epoch": 1869} {"train_loss": -6.141626358032227, "global_step": 78520, "epoch": 1869} {"train_loss": -6.058950424194336, "global_step": 78521, "epoch": 1869} {"train_loss": -6.11311149597168, "global_step": 78522, "epoch": 1869} {"train_loss": -6.1902923583984375, "global_step": 78523, "epoch": 1869} {"train_loss": -6.144660949707031, "global_step": 78524, "epoch": 1869} {"train_loss": -6.230268478393555, "global_step": 78525, "epoch": 1869} {"train_loss": -6.050379753112793, "global_step": 78526, "epoch": 1869} {"train_loss": -6.230890274047852, "global_step": 78527, "epoch": 1869} {"train_loss": -6.232033729553223, "global_step": 78528, "epoch": 1869} {"train_loss": -6.198932647705078, "global_step": 78529, "epoch": 1869} {"train_loss": -6.047233581542969, "global_step": 78530, "epoch": 1869} {"train_loss": -6.160877227783203, "global_step": 78531, "epoch": 1869} {"train_loss": -6.137693881988525, "global_step": 78532, "epoch": 1869} {"train_loss": -6.076336860656738, "global_step": 78533, "epoch": 1869} {"train_loss": -6.214482307434082, "global_step": 78534, "epoch": 1869} {"train_loss": -6.158560752868652, "global_step": 78535, "epoch": 1869} {"train_loss": -6.318124771118164, "global_step": 78536, "epoch": 1869} {"train_loss": -6.114290237426758, "global_step": 78537, "epoch": 1869} {"train_loss": -5.986322402954102, "global_step": 78538, "epoch": 1869} {"train_loss": -6.133982760565622, "global_step": 78539, "epoch": 1869, "val_loss": 75085.96875} {"train_loss": -6.0496063232421875, "global_step": 78540, "epoch": 1870} {"train_loss": -6.073643684387207, "global_step": 78541, "epoch": 1870} {"train_loss": -6.069965362548828, "global_step": 78542, "epoch": 1870} {"train_loss": -6.126195907592773, "global_step": 78543, "epoch": 1870} {"train_loss": -6.058254241943359, "global_step": 78544, "epoch": 1870} {"train_loss": -6.051684379577637, "global_step": 78545, "epoch": 1870} {"train_loss": -6.149504661560059, "global_step": 78546, "epoch": 1870} {"train_loss": -6.124345779418945, "global_step": 78547, "epoch": 1870} {"train_loss": -6.154168128967285, "global_step": 78548, "epoch": 1870} {"train_loss": -6.135616302490234, "global_step": 78549, "epoch": 1870} {"train_loss": -6.074517726898193, "global_step": 78550, "epoch": 1870} {"train_loss": -6.082271099090576, "global_step": 78551, "epoch": 1870} {"train_loss": -6.201949596405029, "global_step": 78552, "epoch": 1870} {"train_loss": -6.142707347869873, "global_step": 78553, "epoch": 1870} {"train_loss": -6.048929691314697, "global_step": 78554, "epoch": 1870} {"train_loss": -6.122859477996826, "global_step": 78555, "epoch": 1870} {"train_loss": -6.140401363372803, "global_step": 78556, "epoch": 1870} {"train_loss": -6.1959381103515625, "global_step": 78557, "epoch": 1870} {"train_loss": -6.095278739929199, "global_step": 78558, "epoch": 1870} {"train_loss": -6.100967884063721, "global_step": 78559, "epoch": 1870} {"train_loss": -6.142158508300781, "global_step": 78560, "epoch": 1870} {"train_loss": -6.206844806671143, "global_step": 78561, "epoch": 1870} {"train_loss": -6.030806541442871, "global_step": 78562, "epoch": 1870} {"train_loss": -6.1461567878723145, "global_step": 78563, "epoch": 1870} {"train_loss": -6.081056594848633, "global_step": 78564, "epoch": 1870} {"train_loss": -6.201575756072998, "global_step": 78565, "epoch": 1870} {"train_loss": -6.263245582580566, "global_step": 78566, "epoch": 1870} {"train_loss": -6.112256050109863, "global_step": 78567, "epoch": 1870} {"train_loss": -6.258664608001709, "global_step": 78568, "epoch": 1870} {"train_loss": -6.145822525024414, "global_step": 78569, "epoch": 1870} {"train_loss": -6.185580253601074, "global_step": 78570, "epoch": 1870} {"train_loss": -6.086714267730713, "global_step": 78571, "epoch": 1870} {"train_loss": -6.221559524536133, "global_step": 78572, "epoch": 1870} {"train_loss": -6.131089210510254, "global_step": 78573, "epoch": 1870} {"train_loss": -6.141359329223633, "global_step": 78574, "epoch": 1870} {"train_loss": -6.064338207244873, "global_step": 78575, "epoch": 1870} {"train_loss": -6.263579368591309, "global_step": 78576, "epoch": 1870} {"train_loss": -6.108131408691406, "global_step": 78577, "epoch": 1870} {"train_loss": -6.102001667022705, "global_step": 78578, "epoch": 1870} {"train_loss": -6.019937515258789, "global_step": 78579, "epoch": 1870} {"train_loss": -6.130122661590576, "global_step": 78580, "epoch": 1870} {"train_loss": -6.127089682079497, "global_step": 78581, "epoch": 1870, "val_loss": 75025.859375} {"train_loss": -6.190786361694336, "global_step": 78582, "epoch": 1871} {"train_loss": -6.114806652069092, "global_step": 78583, "epoch": 1871} {"train_loss": -6.162857532501221, "global_step": 78584, "epoch": 1871} {"train_loss": -6.122734546661377, "global_step": 78585, "epoch": 1871} {"train_loss": -6.005049705505371, "global_step": 78586, "epoch": 1871} {"train_loss": -6.108404159545898, "global_step": 78587, "epoch": 1871} {"train_loss": -6.137338638305664, "global_step": 78588, "epoch": 1871} {"train_loss": -6.121416091918945, "global_step": 78589, "epoch": 1871} {"train_loss": -6.239028453826904, "global_step": 78590, "epoch": 1871} {"train_loss": -6.055004119873047, "global_step": 78591, "epoch": 1871} {"train_loss": -6.143522262573242, "global_step": 78592, "epoch": 1871} {"train_loss": -6.033686637878418, "global_step": 78593, "epoch": 1871} {"train_loss": -6.2019147872924805, "global_step": 78594, "epoch": 1871} {"train_loss": -6.196371555328369, "global_step": 78595, "epoch": 1871} {"train_loss": -6.05872917175293, "global_step": 78596, "epoch": 1871} {"train_loss": -6.0908203125, "global_step": 78597, "epoch": 1871} {"train_loss": -6.042848587036133, "global_step": 78598, "epoch": 1871} {"train_loss": -6.060060977935791, "global_step": 78599, "epoch": 1871} {"train_loss": -6.21306037902832, "global_step": 78600, "epoch": 1871} {"train_loss": -6.153753280639648, "global_step": 78601, "epoch": 1871} {"train_loss": -6.122220039367676, "global_step": 78602, "epoch": 1871} {"train_loss": -6.147124290466309, "global_step": 78603, "epoch": 1871} {"train_loss": -6.106083869934082, "global_step": 78604, "epoch": 1871} {"train_loss": -6.20262336730957, "global_step": 78605, "epoch": 1871} {"train_loss": -6.1597185134887695, "global_step": 78606, "epoch": 1871} {"train_loss": -5.953855991363525, "global_step": 78607, "epoch": 1871} {"train_loss": -5.937379837036133, "global_step": 78608, "epoch": 1871} {"train_loss": -6.1279096603393555, "global_step": 78609, "epoch": 1871} {"train_loss": -6.000679016113281, "global_step": 78610, "epoch": 1871} {"train_loss": -6.037086009979248, "global_step": 78611, "epoch": 1871} {"train_loss": -6.12841796875, "global_step": 78612, "epoch": 1871} {"train_loss": -6.032716751098633, "global_step": 78613, "epoch": 1871} {"train_loss": -6.167213439941406, "global_step": 78614, "epoch": 1871} {"train_loss": -5.9993391036987305, "global_step": 78615, "epoch": 1871} {"train_loss": -6.102663993835449, "global_step": 78616, "epoch": 1871} {"train_loss": -6.076777458190918, "global_step": 78617, "epoch": 1871} {"train_loss": -6.089886665344238, "global_step": 78618, "epoch": 1871} {"train_loss": -6.128406047821045, "global_step": 78619, "epoch": 1871} {"train_loss": -6.222657203674316, "global_step": 78620, "epoch": 1871} {"train_loss": -6.111879825592041, "global_step": 78621, "epoch": 1871} {"train_loss": -6.1093902587890625, "global_step": 78622, "epoch": 1871} {"train_loss": -6.106268439974103, "global_step": 78623, "epoch": 1871, "val_loss": 75089.0546875} {"train_loss": -6.146942138671875, "global_step": 78624, "epoch": 1872} {"train_loss": -6.156767845153809, "global_step": 78625, "epoch": 1872} {"train_loss": -6.119959831237793, "global_step": 78626, "epoch": 1872} {"train_loss": -6.158026695251465, "global_step": 78627, "epoch": 1872} {"train_loss": -6.070950984954834, "global_step": 78628, "epoch": 1872} {"train_loss": -6.117587089538574, "global_step": 78629, "epoch": 1872} {"train_loss": -6.137202262878418, "global_step": 78630, "epoch": 1872} {"train_loss": -6.045267105102539, "global_step": 78631, "epoch": 1872} {"train_loss": -6.162006378173828, "global_step": 78632, "epoch": 1872} {"train_loss": -6.191473960876465, "global_step": 78633, "epoch": 1872} {"train_loss": -6.104278087615967, "global_step": 78634, "epoch": 1872} {"train_loss": -6.103174209594727, "global_step": 78635, "epoch": 1872} {"train_loss": -6.195566177368164, "global_step": 78636, "epoch": 1872} {"train_loss": -6.082089424133301, "global_step": 78637, "epoch": 1872} {"train_loss": -5.964585304260254, "global_step": 78638, "epoch": 1872} {"train_loss": -6.097936630249023, "global_step": 78639, "epoch": 1872} {"train_loss": -6.073554992675781, "global_step": 78640, "epoch": 1872} {"train_loss": -6.1005377769470215, "global_step": 78641, "epoch": 1872} {"train_loss": -5.9776225090026855, "global_step": 78642, "epoch": 1872} {"train_loss": -5.98020076751709, "global_step": 78643, "epoch": 1872} {"train_loss": -6.114152908325195, "global_step": 78644, "epoch": 1872} {"train_loss": -5.897265434265137, "global_step": 78645, "epoch": 1872} {"train_loss": -5.99377965927124, "global_step": 78646, "epoch": 1872} {"train_loss": -6.084872245788574, "global_step": 78647, "epoch": 1872} {"train_loss": -6.0110063552856445, "global_step": 78648, "epoch": 1872} {"train_loss": -6.067623138427734, "global_step": 78649, "epoch": 1872} {"train_loss": -5.968200206756592, "global_step": 78650, "epoch": 1872} {"train_loss": -6.198387145996094, "global_step": 78651, "epoch": 1872} {"train_loss": -5.964970588684082, "global_step": 78652, "epoch": 1872} {"train_loss": -6.066343784332275, "global_step": 78653, "epoch": 1872} {"train_loss": -6.019026756286621, "global_step": 78654, "epoch": 1872} {"train_loss": -6.188004016876221, "global_step": 78655, "epoch": 1872} {"train_loss": -6.176906585693359, "global_step": 78656, "epoch": 1872} {"train_loss": -5.996919631958008, "global_step": 78657, "epoch": 1872} {"train_loss": -6.109783172607422, "global_step": 78658, "epoch": 1872} {"train_loss": -5.977265357971191, "global_step": 78659, "epoch": 1872} {"train_loss": -6.1417131423950195, "global_step": 78660, "epoch": 1872} {"train_loss": -5.9857354164123535, "global_step": 78661, "epoch": 1872} {"train_loss": -6.173715114593506, "global_step": 78662, "epoch": 1872} {"train_loss": -6.246260643005371, "global_step": 78663, "epoch": 1872} {"train_loss": -6.124232292175293, "global_step": 78664, "epoch": 1872} {"train_loss": -6.084687414623442, "global_step": 78665, "epoch": 1872, "val_loss": 74544.0390625} {"train_loss": -6.031878471374512, "global_step": 78666, "epoch": 1873} {"train_loss": -6.056840419769287, "global_step": 78667, "epoch": 1873} {"train_loss": -6.1635003089904785, "global_step": 78668, "epoch": 1873} {"train_loss": -6.181382179260254, "global_step": 78669, "epoch": 1873} {"train_loss": -6.209042549133301, "global_step": 78670, "epoch": 1873} {"train_loss": -6.152417182922363, "global_step": 78671, "epoch": 1873} {"train_loss": -6.103691101074219, "global_step": 78672, "epoch": 1873} {"train_loss": -6.189406394958496, "global_step": 78673, "epoch": 1873} {"train_loss": -6.140545845031738, "global_step": 78674, "epoch": 1873} {"train_loss": -6.218362808227539, "global_step": 78675, "epoch": 1873} {"train_loss": -6.155364990234375, "global_step": 78676, "epoch": 1873} {"train_loss": -6.165101051330566, "global_step": 78677, "epoch": 1873} {"train_loss": -6.179815769195557, "global_step": 78678, "epoch": 1873} {"train_loss": -6.130731582641602, "global_step": 78679, "epoch": 1873} {"train_loss": -6.127484321594238, "global_step": 78680, "epoch": 1873} {"train_loss": -6.054556846618652, "global_step": 78681, "epoch": 1873} {"train_loss": -6.110806465148926, "global_step": 78682, "epoch": 1873} {"train_loss": -6.1314802169799805, "global_step": 78683, "epoch": 1873} {"train_loss": -6.268975257873535, "global_step": 78684, "epoch": 1873} {"train_loss": -6.137598514556885, "global_step": 78685, "epoch": 1873} {"train_loss": -6.030573844909668, "global_step": 78686, "epoch": 1873} {"train_loss": -5.992751121520996, "global_step": 78687, "epoch": 1873} {"train_loss": -6.160085201263428, "global_step": 78688, "epoch": 1873} {"train_loss": -6.207576751708984, "global_step": 78689, "epoch": 1873} {"train_loss": -5.94105339050293, "global_step": 78690, "epoch": 1873} {"train_loss": -6.080757141113281, "global_step": 78691, "epoch": 1873} {"train_loss": -6.124691486358643, "global_step": 78692, "epoch": 1873} {"train_loss": -6.093209266662598, "global_step": 78693, "epoch": 1873} {"train_loss": -6.101853370666504, "global_step": 78694, "epoch": 1873} {"train_loss": -6.194311141967773, "global_step": 78695, "epoch": 1873} {"train_loss": -6.128626823425293, "global_step": 78696, "epoch": 1873} {"train_loss": -6.178960800170898, "global_step": 78697, "epoch": 1873} {"train_loss": -6.173704147338867, "global_step": 78698, "epoch": 1873} {"train_loss": -6.132676601409912, "global_step": 78699, "epoch": 1873} {"train_loss": -5.964987277984619, "global_step": 78700, "epoch": 1873} {"train_loss": -6.1625871658325195, "global_step": 78701, "epoch": 1873} {"train_loss": -6.142157077789307, "global_step": 78702, "epoch": 1873} {"train_loss": -6.068497657775879, "global_step": 78703, "epoch": 1873} {"train_loss": -6.1319684982299805, "global_step": 78704, "epoch": 1873} {"train_loss": -6.164454460144043, "global_step": 78705, "epoch": 1873} {"train_loss": -6.1598801612854, "global_step": 78706, "epoch": 1873} {"train_loss": -6.128689436685471, "global_step": 78707, "epoch": 1873, "val_loss": 74985.3125} {"train_loss": -6.152757167816162, "global_step": 78708, "epoch": 1874} {"train_loss": -6.182614803314209, "global_step": 78709, "epoch": 1874} {"train_loss": -6.111124038696289, "global_step": 78710, "epoch": 1874} {"train_loss": -6.050511360168457, "global_step": 78711, "epoch": 1874} {"train_loss": -6.050982475280762, "global_step": 78712, "epoch": 1874} {"train_loss": -6.1094770431518555, "global_step": 78713, "epoch": 1874} {"train_loss": -6.086905479431152, "global_step": 78714, "epoch": 1874} {"train_loss": -6.221318244934082, "global_step": 78715, "epoch": 1874} {"train_loss": -6.043826103210449, "global_step": 78716, "epoch": 1874} {"train_loss": -6.0233917236328125, "global_step": 78717, "epoch": 1874} {"train_loss": -6.21435022354126, "global_step": 78718, "epoch": 1874} {"train_loss": -6.175383567810059, "global_step": 78719, "epoch": 1874} {"train_loss": -6.176002502441406, "global_step": 78720, "epoch": 1874} {"train_loss": -6.221869468688965, "global_step": 78721, "epoch": 1874} {"train_loss": -6.064651012420654, "global_step": 78722, "epoch": 1874} {"train_loss": -6.11318302154541, "global_step": 78723, "epoch": 1874} {"train_loss": -6.153388023376465, "global_step": 78724, "epoch": 1874} {"train_loss": -6.103391170501709, "global_step": 78725, "epoch": 1874} {"train_loss": -6.1551666259765625, "global_step": 78726, "epoch": 1874} {"train_loss": -6.085769176483154, "global_step": 78727, "epoch": 1874} {"train_loss": -6.149369239807129, "global_step": 78728, "epoch": 1874} {"train_loss": -6.104470252990723, "global_step": 78729, "epoch": 1874} {"train_loss": -6.121443271636963, "global_step": 78730, "epoch": 1874} {"train_loss": -6.2143707275390625, "global_step": 78731, "epoch": 1874} {"train_loss": -6.1084394454956055, "global_step": 78732, "epoch": 1874} {"train_loss": -6.031984806060791, "global_step": 78733, "epoch": 1874} {"train_loss": -6.012045860290527, "global_step": 78734, "epoch": 1874} {"train_loss": -6.172151565551758, "global_step": 78735, "epoch": 1874} {"train_loss": -6.134025573730469, "global_step": 78736, "epoch": 1874} {"train_loss": -6.234781265258789, "global_step": 78737, "epoch": 1874} {"train_loss": -6.184568405151367, "global_step": 78738, "epoch": 1874} {"train_loss": -6.151121616363525, "global_step": 78739, "epoch": 1874} {"train_loss": -6.07590389251709, "global_step": 78740, "epoch": 1874} {"train_loss": -6.124027252197266, "global_step": 78741, "epoch": 1874} {"train_loss": -6.2183990478515625, "global_step": 78742, "epoch": 1874} {"train_loss": -6.094627857208252, "global_step": 78743, "epoch": 1874} {"train_loss": -6.1454057693481445, "global_step": 78744, "epoch": 1874} {"train_loss": -6.2584075927734375, "global_step": 78745, "epoch": 1874} {"train_loss": -6.1745147705078125, "global_step": 78746, "epoch": 1874} {"train_loss": -6.075265884399414, "global_step": 78747, "epoch": 1874} {"train_loss": -6.023775577545166, "global_step": 78748, "epoch": 1874} {"train_loss": -6.132246505646479, "global_step": 78749, "epoch": 1874, "val_loss": 75090.5703125} {"train_loss": -6.195611953735352, "global_step": 78750, "epoch": 1875} {"train_loss": -6.213299751281738, "global_step": 78751, "epoch": 1875} {"train_loss": -6.178300857543945, "global_step": 78752, "epoch": 1875} {"train_loss": -6.193938255310059, "global_step": 78753, "epoch": 1875} {"train_loss": -6.122084140777588, "global_step": 78754, "epoch": 1875} {"train_loss": -6.127647399902344, "global_step": 78755, "epoch": 1875} {"train_loss": -6.1727094650268555, "global_step": 78756, "epoch": 1875} {"train_loss": -5.955232620239258, "global_step": 78757, "epoch": 1875} {"train_loss": -6.166101455688477, "global_step": 78758, "epoch": 1875} {"train_loss": -6.178501605987549, "global_step": 78759, "epoch": 1875} {"train_loss": -6.233119487762451, "global_step": 78760, "epoch": 1875} {"train_loss": -6.166177749633789, "global_step": 78761, "epoch": 1875} {"train_loss": -6.229076385498047, "global_step": 78762, "epoch": 1875} {"train_loss": -6.086508274078369, "global_step": 78763, "epoch": 1875} {"train_loss": -6.153717517852783, "global_step": 78764, "epoch": 1875} {"train_loss": -6.0688629150390625, "global_step": 78765, "epoch": 1875} {"train_loss": -6.151456832885742, "global_step": 78766, "epoch": 1875} {"train_loss": -6.034010410308838, "global_step": 78767, "epoch": 1875} {"train_loss": -6.275931358337402, "global_step": 78768, "epoch": 1875} {"train_loss": -5.944858551025391, "global_step": 78769, "epoch": 1875} {"train_loss": -6.122057914733887, "global_step": 78770, "epoch": 1875} {"train_loss": -6.059456825256348, "global_step": 78771, "epoch": 1875} {"train_loss": -6.139493465423584, "global_step": 78772, "epoch": 1875} {"train_loss": -6.172398567199707, "global_step": 78773, "epoch": 1875} {"train_loss": -6.081289291381836, "global_step": 78774, "epoch": 1875} {"train_loss": -6.157346725463867, "global_step": 78775, "epoch": 1875} {"train_loss": -6.02951717376709, "global_step": 78776, "epoch": 1875} {"train_loss": -6.251989364624023, "global_step": 78777, "epoch": 1875} {"train_loss": -6.0525102615356445, "global_step": 78778, "epoch": 1875} {"train_loss": -6.075213432312012, "global_step": 78779, "epoch": 1875} {"train_loss": -6.149725437164307, "global_step": 78780, "epoch": 1875} {"train_loss": -6.07214879989624, "global_step": 78781, "epoch": 1875} {"train_loss": -6.1349287033081055, "global_step": 78782, "epoch": 1875} {"train_loss": -5.951963424682617, "global_step": 78783, "epoch": 1875} {"train_loss": -6.082569599151611, "global_step": 78784, "epoch": 1875} {"train_loss": -6.111852645874023, "global_step": 78785, "epoch": 1875} {"train_loss": -6.124899864196777, "global_step": 78786, "epoch": 1875} {"train_loss": -6.09849739074707, "global_step": 78787, "epoch": 1875} {"train_loss": -6.049595832824707, "global_step": 78788, "epoch": 1875} {"train_loss": -5.969916343688965, "global_step": 78789, "epoch": 1875} {"train_loss": -6.204920291900635, "global_step": 78790, "epoch": 1875} {"train_loss": -6.122888860248384, "global_step": 78791, "epoch": 1875, "val_loss": 74876.9765625} {"train_loss": -6.101081848144531, "global_step": 78792, "epoch": 1876} {"train_loss": -6.127350807189941, "global_step": 78793, "epoch": 1876} {"train_loss": -6.12312650680542, "global_step": 78794, "epoch": 1876} {"train_loss": -6.140086650848389, "global_step": 78795, "epoch": 1876} {"train_loss": -6.270204544067383, "global_step": 78796, "epoch": 1876} {"train_loss": -6.038741111755371, "global_step": 78797, "epoch": 1876} {"train_loss": -6.181766033172607, "global_step": 78798, "epoch": 1876} {"train_loss": -6.183990001678467, "global_step": 78799, "epoch": 1876} {"train_loss": -6.170945167541504, "global_step": 78800, "epoch": 1876} {"train_loss": -6.130728721618652, "global_step": 78801, "epoch": 1876} {"train_loss": -6.2240495681762695, "global_step": 78802, "epoch": 1876} {"train_loss": -6.001830577850342, "global_step": 78803, "epoch": 1876} {"train_loss": -6.146862983703613, "global_step": 78804, "epoch": 1876} {"train_loss": -6.131429672241211, "global_step": 78805, "epoch": 1876} {"train_loss": -6.051795959472656, "global_step": 78806, "epoch": 1876} {"train_loss": -6.036272048950195, "global_step": 78807, "epoch": 1876} {"train_loss": -6.093130588531494, "global_step": 78808, "epoch": 1876} {"train_loss": -6.090080261230469, "global_step": 78809, "epoch": 1876} {"train_loss": -6.144265174865723, "global_step": 78810, "epoch": 1876} {"train_loss": -5.986026763916016, "global_step": 78811, "epoch": 1876} {"train_loss": -6.200811386108398, "global_step": 78812, "epoch": 1876} {"train_loss": -6.075016498565674, "global_step": 78813, "epoch": 1876} {"train_loss": -5.979846000671387, "global_step": 78814, "epoch": 1876} {"train_loss": -6.062009334564209, "global_step": 78815, "epoch": 1876} {"train_loss": -6.047552108764648, "global_step": 78816, "epoch": 1876} {"train_loss": -5.995205402374268, "global_step": 78817, "epoch": 1876} {"train_loss": -6.269852638244629, "global_step": 78818, "epoch": 1876} {"train_loss": -6.149312496185303, "global_step": 78819, "epoch": 1876} {"train_loss": -6.137031555175781, "global_step": 78820, "epoch": 1876} {"train_loss": -6.042473316192627, "global_step": 78821, "epoch": 1876} {"train_loss": -5.998933792114258, "global_step": 78822, "epoch": 1876} {"train_loss": -6.149996757507324, "global_step": 78823, "epoch": 1876} {"train_loss": -5.981710433959961, "global_step": 78824, "epoch": 1876} {"train_loss": -5.886041641235352, "global_step": 78825, "epoch": 1876} {"train_loss": -5.9375505447387695, "global_step": 78826, "epoch": 1876} {"train_loss": -5.971744060516357, "global_step": 78827, "epoch": 1876} {"train_loss": -6.039330959320068, "global_step": 78828, "epoch": 1876} {"train_loss": -5.988325119018555, "global_step": 78829, "epoch": 1876} {"train_loss": -6.073446750640869, "global_step": 78830, "epoch": 1876} {"train_loss": -6.147432327270508, "global_step": 78831, "epoch": 1876} {"train_loss": -6.081429481506348, "global_step": 78832, "epoch": 1876} {"train_loss": -6.085271472022647, "global_step": 78833, "epoch": 1876, "val_loss": 75414.0390625} {"train_loss": -6.007635116577148, "global_step": 78834, "epoch": 1877} {"train_loss": -6.056558132171631, "global_step": 78835, "epoch": 1877} {"train_loss": -6.0983076095581055, "global_step": 78836, "epoch": 1877} {"train_loss": -6.026224136352539, "global_step": 78837, "epoch": 1877} {"train_loss": -6.017024993896484, "global_step": 78838, "epoch": 1877} {"train_loss": -6.057426929473877, "global_step": 78839, "epoch": 1877} {"train_loss": -5.909303665161133, "global_step": 78840, "epoch": 1877} {"train_loss": -6.18385124206543, "global_step": 78841, "epoch": 1877} {"train_loss": -6.07418155670166, "global_step": 78842, "epoch": 1877} {"train_loss": -6.053563594818115, "global_step": 78843, "epoch": 1877} {"train_loss": -6.051407814025879, "global_step": 78844, "epoch": 1877} {"train_loss": -6.098369598388672, "global_step": 78845, "epoch": 1877} {"train_loss": -6.109438419342041, "global_step": 78846, "epoch": 1877} {"train_loss": -6.0640130043029785, "global_step": 78847, "epoch": 1877} {"train_loss": -6.047693252563477, "global_step": 78848, "epoch": 1877} {"train_loss": -6.157188892364502, "global_step": 78849, "epoch": 1877} {"train_loss": -6.1442060470581055, "global_step": 78850, "epoch": 1877} {"train_loss": -6.179827690124512, "global_step": 78851, "epoch": 1877} {"train_loss": -6.14694881439209, "global_step": 78852, "epoch": 1877} {"train_loss": -6.129917144775391, "global_step": 78853, "epoch": 1877} {"train_loss": -6.224564075469971, "global_step": 78854, "epoch": 1877} {"train_loss": -6.020050048828125, "global_step": 78855, "epoch": 1877} {"train_loss": -6.119600772857666, "global_step": 78856, "epoch": 1877} {"train_loss": -6.0982184410095215, "global_step": 78857, "epoch": 1877} {"train_loss": -6.138724327087402, "global_step": 78858, "epoch": 1877} {"train_loss": -6.3081889152526855, "global_step": 78859, "epoch": 1877} {"train_loss": -6.005679607391357, "global_step": 78860, "epoch": 1877} {"train_loss": -6.127782821655273, "global_step": 78861, "epoch": 1877} {"train_loss": -6.228784561157227, "global_step": 78862, "epoch": 1877} {"train_loss": -6.267817497253418, "global_step": 78863, "epoch": 1877} {"train_loss": -6.133106231689453, "global_step": 78864, "epoch": 1877} {"train_loss": -6.149043560028076, "global_step": 78865, "epoch": 1877} {"train_loss": -6.11181640625, "global_step": 78866, "epoch": 1877} {"train_loss": -6.190361022949219, "global_step": 78867, "epoch": 1877} {"train_loss": -6.169459342956543, "global_step": 78868, "epoch": 1877} {"train_loss": -6.186884880065918, "global_step": 78869, "epoch": 1877} {"train_loss": -6.032839298248291, "global_step": 78870, "epoch": 1877} {"train_loss": -5.907285690307617, "global_step": 78871, "epoch": 1877} {"train_loss": -6.12928581237793, "global_step": 78872, "epoch": 1877} {"train_loss": -6.136928081512451, "global_step": 78873, "epoch": 1877} {"train_loss": -6.185737133026123, "global_step": 78874, "epoch": 1877} {"train_loss": -6.1084695770626976, "global_step": 78875, "epoch": 1877, "val_loss": 75178.2421875} {"train_loss": -6.186458110809326, "global_step": 78876, "epoch": 1878} {"train_loss": -6.131860733032227, "global_step": 78877, "epoch": 1878} {"train_loss": -6.1766557693481445, "global_step": 78878, "epoch": 1878} {"train_loss": -6.061419486999512, "global_step": 78879, "epoch": 1878} {"train_loss": -6.04046106338501, "global_step": 78880, "epoch": 1878} {"train_loss": -6.113290786743164, "global_step": 78881, "epoch": 1878} {"train_loss": -5.937077522277832, "global_step": 78882, "epoch": 1878} {"train_loss": -6.086019515991211, "global_step": 78883, "epoch": 1878} {"train_loss": -6.13910436630249, "global_step": 78884, "epoch": 1878} {"train_loss": -6.01161003112793, "global_step": 78885, "epoch": 1878} {"train_loss": -6.167635917663574, "global_step": 78886, "epoch": 1878} {"train_loss": -6.035393714904785, "global_step": 78887, "epoch": 1878} {"train_loss": -6.039129257202148, "global_step": 78888, "epoch": 1878} {"train_loss": -6.063307285308838, "global_step": 78889, "epoch": 1878} {"train_loss": -6.0404486656188965, "global_step": 78890, "epoch": 1878} {"train_loss": -6.120067596435547, "global_step": 78891, "epoch": 1878} {"train_loss": -6.0884294509887695, "global_step": 78892, "epoch": 1878} {"train_loss": -6.050485610961914, "global_step": 78893, "epoch": 1878} {"train_loss": -6.062263488769531, "global_step": 78894, "epoch": 1878} {"train_loss": -6.148088455200195, "global_step": 78895, "epoch": 1878} {"train_loss": -6.051265716552734, "global_step": 78896, "epoch": 1878} {"train_loss": -6.080095291137695, "global_step": 78897, "epoch": 1878} {"train_loss": -6.079952716827393, "global_step": 78898, "epoch": 1878} {"train_loss": -6.055054664611816, "global_step": 78899, "epoch": 1878} {"train_loss": -6.047733306884766, "global_step": 78900, "epoch": 1878} {"train_loss": -6.038693428039551, "global_step": 78901, "epoch": 1878} {"train_loss": -6.091869354248047, "global_step": 78902, "epoch": 1878} {"train_loss": -6.027676582336426, "global_step": 78903, "epoch": 1878} {"train_loss": -5.979296684265137, "global_step": 78904, "epoch": 1878} {"train_loss": -6.1012372970581055, "global_step": 78905, "epoch": 1878} {"train_loss": -6.1025543212890625, "global_step": 78906, "epoch": 1878} {"train_loss": -6.159420967102051, "global_step": 78907, "epoch": 1878} {"train_loss": -6.079018592834473, "global_step": 78908, "epoch": 1878} {"train_loss": -6.009346008300781, "global_step": 78909, "epoch": 1878} {"train_loss": -6.1573166847229, "global_step": 78910, "epoch": 1878} {"train_loss": -6.040823936462402, "global_step": 78911, "epoch": 1878} {"train_loss": -6.094046592712402, "global_step": 78912, "epoch": 1878} {"train_loss": -6.079391956329346, "global_step": 78913, "epoch": 1878} {"train_loss": -5.977290153503418, "global_step": 78914, "epoch": 1878} {"train_loss": -5.975485324859619, "global_step": 78915, "epoch": 1878} {"train_loss": -6.062804222106934, "global_step": 78916, "epoch": 1878} {"train_loss": -6.074742646444411, "global_step": 78917, "epoch": 1878, "val_loss": 75085.234375} {"train_loss": -6.147336959838867, "global_step": 78918, "epoch": 1879} {"train_loss": -6.056906700134277, "global_step": 78919, "epoch": 1879} {"train_loss": -6.133265972137451, "global_step": 78920, "epoch": 1879} {"train_loss": -6.2222065925598145, "global_step": 78921, "epoch": 1879} {"train_loss": -6.163069248199463, "global_step": 78922, "epoch": 1879} {"train_loss": -6.233043670654297, "global_step": 78923, "epoch": 1879} {"train_loss": -6.168861389160156, "global_step": 78924, "epoch": 1879} {"train_loss": -6.032477855682373, "global_step": 78925, "epoch": 1879} {"train_loss": -6.226030349731445, "global_step": 78926, "epoch": 1879} {"train_loss": -6.130006313323975, "global_step": 78927, "epoch": 1879} {"train_loss": -6.100380897521973, "global_step": 78928, "epoch": 1879} {"train_loss": -5.892807483673096, "global_step": 78929, "epoch": 1879} {"train_loss": -6.141292572021484, "global_step": 78930, "epoch": 1879} {"train_loss": -6.169300079345703, "global_step": 78931, "epoch": 1879} {"train_loss": -6.119076728820801, "global_step": 78932, "epoch": 1879} {"train_loss": -6.140767574310303, "global_step": 78933, "epoch": 1879} {"train_loss": -6.22471809387207, "global_step": 78934, "epoch": 1879} {"train_loss": -6.090000629425049, "global_step": 78935, "epoch": 1879} {"train_loss": -6.15579080581665, "global_step": 78936, "epoch": 1879} {"train_loss": -6.128175258636475, "global_step": 78937, "epoch": 1879} {"train_loss": -6.065001010894775, "global_step": 78938, "epoch": 1879} {"train_loss": -6.066143989562988, "global_step": 78939, "epoch": 1879} {"train_loss": -6.1852569580078125, "global_step": 78940, "epoch": 1879} {"train_loss": -6.20747184753418, "global_step": 78941, "epoch": 1879} {"train_loss": -6.16485595703125, "global_step": 78942, "epoch": 1879} {"train_loss": -5.976922988891602, "global_step": 78943, "epoch": 1879} {"train_loss": -6.1858673095703125, "global_step": 78944, "epoch": 1879} {"train_loss": -6.210134029388428, "global_step": 78945, "epoch": 1879} {"train_loss": -6.063192367553711, "global_step": 78946, "epoch": 1879} {"train_loss": -6.178830146789551, "global_step": 78947, "epoch": 1879} {"train_loss": -6.208542823791504, "global_step": 78948, "epoch": 1879} {"train_loss": -6.017301559448242, "global_step": 78949, "epoch": 1879} {"train_loss": -6.089541435241699, "global_step": 78950, "epoch": 1879} {"train_loss": -6.140697479248047, "global_step": 78951, "epoch": 1879} {"train_loss": -6.117964744567871, "global_step": 78952, "epoch": 1879} {"train_loss": -6.143657684326172, "global_step": 78953, "epoch": 1879} {"train_loss": -6.1373114585876465, "global_step": 78954, "epoch": 1879} {"train_loss": -6.108369827270508, "global_step": 78955, "epoch": 1879} {"train_loss": -6.216802597045898, "global_step": 78956, "epoch": 1879} {"train_loss": -6.016351222991943, "global_step": 78957, "epoch": 1879} {"train_loss": -6.102682590484619, "global_step": 78958, "epoch": 1879} {"train_loss": -6.129011097408476, "global_step": 78959, "epoch": 1879, "val_loss": 74884.125} {"train_loss": -6.154888153076172, "global_step": 78960, "epoch": 1880} {"train_loss": -6.165428638458252, "global_step": 78961, "epoch": 1880} {"train_loss": -6.056118965148926, "global_step": 78962, "epoch": 1880} {"train_loss": -6.188933372497559, "global_step": 78963, "epoch": 1880} {"train_loss": -6.098984241485596, "global_step": 78964, "epoch": 1880} {"train_loss": -6.04360294342041, "global_step": 78965, "epoch": 1880} {"train_loss": -6.149280071258545, "global_step": 78966, "epoch": 1880} {"train_loss": -6.201010704040527, "global_step": 78967, "epoch": 1880} {"train_loss": -6.122324466705322, "global_step": 78968, "epoch": 1880} {"train_loss": -6.205775260925293, "global_step": 78969, "epoch": 1880} {"train_loss": -6.168912887573242, "global_step": 78970, "epoch": 1880} {"train_loss": -6.192930698394775, "global_step": 78971, "epoch": 1880} {"train_loss": -6.052176475524902, "global_step": 78972, "epoch": 1880} {"train_loss": -6.1681084632873535, "global_step": 78973, "epoch": 1880} {"train_loss": -6.112408638000488, "global_step": 78974, "epoch": 1880} {"train_loss": -6.092606544494629, "global_step": 78975, "epoch": 1880} {"train_loss": -6.040014266967773, "global_step": 78976, "epoch": 1880} {"train_loss": -6.0636444091796875, "global_step": 78977, "epoch": 1880} {"train_loss": -5.9950714111328125, "global_step": 78978, "epoch": 1880} {"train_loss": -6.070645332336426, "global_step": 78979, "epoch": 1880} {"train_loss": -6.180535316467285, "global_step": 78980, "epoch": 1880} {"train_loss": -6.073338508605957, "global_step": 78981, "epoch": 1880} {"train_loss": -6.297362327575684, "global_step": 78982, "epoch": 1880} {"train_loss": -6.191059589385986, "global_step": 78983, "epoch": 1880} {"train_loss": -6.2132487297058105, "global_step": 78984, "epoch": 1880} {"train_loss": -6.090915203094482, "global_step": 78985, "epoch": 1880} {"train_loss": -6.185883522033691, "global_step": 78986, "epoch": 1880} {"train_loss": -6.013463020324707, "global_step": 78987, "epoch": 1880} {"train_loss": -6.105828285217285, "global_step": 78988, "epoch": 1880} {"train_loss": -6.177568435668945, "global_step": 78989, "epoch": 1880} {"train_loss": -6.270359039306641, "global_step": 78990, "epoch": 1880} {"train_loss": -6.207110404968262, "global_step": 78991, "epoch": 1880} {"train_loss": -6.141852855682373, "global_step": 78992, "epoch": 1880} {"train_loss": -6.092634201049805, "global_step": 78993, "epoch": 1880} {"train_loss": -6.034079074859619, "global_step": 78994, "epoch": 1880} {"train_loss": -6.182872772216797, "global_step": 78995, "epoch": 1880} {"train_loss": -6.095476150512695, "global_step": 78996, "epoch": 1880} {"train_loss": -6.12905740737915, "global_step": 78997, "epoch": 1880} {"train_loss": -6.057033538818359, "global_step": 78998, "epoch": 1880} {"train_loss": -6.147496700286865, "global_step": 78999, "epoch": 1880} {"train_loss": -6.178612232208252, "global_step": 79000, "epoch": 1880} {"train_loss": -6.130370435260591, "global_step": 79001, "epoch": 1880, "val_loss": 75027.921875} {"train_loss": -6.02711296081543, "global_step": 79002, "epoch": 1881} {"train_loss": -6.063514709472656, "global_step": 79003, "epoch": 1881} {"train_loss": -5.929671287536621, "global_step": 79004, "epoch": 1881} {"train_loss": -6.085119724273682, "global_step": 79005, "epoch": 1881} {"train_loss": -5.94544792175293, "global_step": 79006, "epoch": 1881} {"train_loss": -6.1780548095703125, "global_step": 79007, "epoch": 1881} {"train_loss": -6.015301704406738, "global_step": 79008, "epoch": 1881} {"train_loss": -6.174616813659668, "global_step": 79009, "epoch": 1881} {"train_loss": -6.021883964538574, "global_step": 79010, "epoch": 1881} {"train_loss": -6.007326126098633, "global_step": 79011, "epoch": 1881} {"train_loss": -6.051321506500244, "global_step": 79012, "epoch": 1881} {"train_loss": -6.077474117279053, "global_step": 79013, "epoch": 1881} {"train_loss": -5.967634201049805, "global_step": 79014, "epoch": 1881} {"train_loss": -6.006555557250977, "global_step": 79015, "epoch": 1881} {"train_loss": -6.118990898132324, "global_step": 79016, "epoch": 1881} {"train_loss": -5.9439191818237305, "global_step": 79017, "epoch": 1881} {"train_loss": -5.95509672164917, "global_step": 79018, "epoch": 1881} {"train_loss": -6.081575870513916, "global_step": 79019, "epoch": 1881} {"train_loss": -5.97396183013916, "global_step": 79020, "epoch": 1881} {"train_loss": -6.167245864868164, "global_step": 79021, "epoch": 1881} {"train_loss": -6.054798603057861, "global_step": 79022, "epoch": 1881} {"train_loss": -6.093921661376953, "global_step": 79023, "epoch": 1881} {"train_loss": -5.966962814331055, "global_step": 79024, "epoch": 1881} {"train_loss": -6.129687309265137, "global_step": 79025, "epoch": 1881} {"train_loss": -6.089216709136963, "global_step": 79026, "epoch": 1881} {"train_loss": -6.117947578430176, "global_step": 79027, "epoch": 1881} {"train_loss": -6.204964637756348, "global_step": 79028, "epoch": 1881} {"train_loss": -6.07466983795166, "global_step": 79029, "epoch": 1881} {"train_loss": -6.190979957580566, "global_step": 79030, "epoch": 1881} {"train_loss": -6.087618350982666, "global_step": 79031, "epoch": 1881} {"train_loss": -5.996798992156982, "global_step": 79032, "epoch": 1881} {"train_loss": -6.137377738952637, "global_step": 79033, "epoch": 1881} {"train_loss": -6.1371355056762695, "global_step": 79034, "epoch": 1881} {"train_loss": -6.174473762512207, "global_step": 79035, "epoch": 1881} {"train_loss": -6.112899303436279, "global_step": 79036, "epoch": 1881} {"train_loss": -5.963378429412842, "global_step": 79037, "epoch": 1881} {"train_loss": -6.216201305389404, "global_step": 79038, "epoch": 1881} {"train_loss": -6.103377342224121, "global_step": 79039, "epoch": 1881} {"train_loss": -5.960997581481934, "global_step": 79040, "epoch": 1881} {"train_loss": -6.144824981689453, "global_step": 79041, "epoch": 1881} {"train_loss": -5.907516002655029, "global_step": 79042, "epoch": 1881} {"train_loss": -6.065393618174961, "global_step": 79043, "epoch": 1881, "val_loss": 75418.5859375} {"train_loss": -6.088444232940674, "global_step": 79044, "epoch": 1882} {"train_loss": -5.966489791870117, "global_step": 79045, "epoch": 1882} {"train_loss": -6.19895076751709, "global_step": 79046, "epoch": 1882} {"train_loss": -6.066227912902832, "global_step": 79047, "epoch": 1882} {"train_loss": -6.193339824676514, "global_step": 79048, "epoch": 1882} {"train_loss": -6.135563373565674, "global_step": 79049, "epoch": 1882} {"train_loss": -6.08935546875, "global_step": 79050, "epoch": 1882} {"train_loss": -6.038713455200195, "global_step": 79051, "epoch": 1882} {"train_loss": -6.099902153015137, "global_step": 79052, "epoch": 1882} {"train_loss": -6.064414024353027, "global_step": 79053, "epoch": 1882} {"train_loss": -6.176912784576416, "global_step": 79054, "epoch": 1882} {"train_loss": -6.026484489440918, "global_step": 79055, "epoch": 1882} {"train_loss": -6.148584365844727, "global_step": 79056, "epoch": 1882} {"train_loss": -5.980427265167236, "global_step": 79057, "epoch": 1882} {"train_loss": -6.052530765533447, "global_step": 79058, "epoch": 1882} {"train_loss": -6.163003921508789, "global_step": 79059, "epoch": 1882} {"train_loss": -6.05536413192749, "global_step": 79060, "epoch": 1882} {"train_loss": -6.107540130615234, "global_step": 79061, "epoch": 1882} {"train_loss": -5.971417427062988, "global_step": 79062, "epoch": 1882} {"train_loss": -6.086440086364746, "global_step": 79063, "epoch": 1882} {"train_loss": -6.101239204406738, "global_step": 79064, "epoch": 1882} {"train_loss": -6.088018417358398, "global_step": 79065, "epoch": 1882} {"train_loss": -6.148709297180176, "global_step": 79066, "epoch": 1882} {"train_loss": -5.943173885345459, "global_step": 79067, "epoch": 1882} {"train_loss": -6.041635513305664, "global_step": 79068, "epoch": 1882} {"train_loss": -6.027868747711182, "global_step": 79069, "epoch": 1882} {"train_loss": -6.168753623962402, "global_step": 79070, "epoch": 1882} {"train_loss": -5.930905342102051, "global_step": 79071, "epoch": 1882} {"train_loss": -5.931623458862305, "global_step": 79072, "epoch": 1882} {"train_loss": -6.071917533874512, "global_step": 79073, "epoch": 1882} {"train_loss": -6.083216667175293, "global_step": 79074, "epoch": 1882} {"train_loss": -6.0728254318237305, "global_step": 79075, "epoch": 1882} {"train_loss": -6.0088958740234375, "global_step": 79076, "epoch": 1882} {"train_loss": -6.149720191955566, "global_step": 79077, "epoch": 1882} {"train_loss": -5.9259490966796875, "global_step": 79078, "epoch": 1882} {"train_loss": -6.040364742279053, "global_step": 79079, "epoch": 1882} {"train_loss": -5.9047346115112305, "global_step": 79080, "epoch": 1882} {"train_loss": -6.205881595611572, "global_step": 79081, "epoch": 1882} {"train_loss": -5.812002182006836, "global_step": 79082, "epoch": 1882} {"train_loss": -5.9840826988220215, "global_step": 79083, "epoch": 1882} {"train_loss": -5.9947309494018555, "global_step": 79084, "epoch": 1882} {"train_loss": -6.060225248336792, "global_step": 79085, "epoch": 1882, "val_loss": 75257.640625} {"train_loss": -5.94689416885376, "global_step": 79086, "epoch": 1883} {"train_loss": -5.974099636077881, "global_step": 79087, "epoch": 1883} {"train_loss": -5.970423221588135, "global_step": 79088, "epoch": 1883} {"train_loss": -6.0025739669799805, "global_step": 79089, "epoch": 1883} {"train_loss": -5.979398727416992, "global_step": 79090, "epoch": 1883} {"train_loss": -6.158972263336182, "global_step": 79091, "epoch": 1883} {"train_loss": -6.011948585510254, "global_step": 79092, "epoch": 1883} {"train_loss": -6.163853645324707, "global_step": 79093, "epoch": 1883} {"train_loss": -6.059561252593994, "global_step": 79094, "epoch": 1883} {"train_loss": -6.053339958190918, "global_step": 79095, "epoch": 1883} {"train_loss": -6.1670026779174805, "global_step": 79096, "epoch": 1883} {"train_loss": -6.184299468994141, "global_step": 79097, "epoch": 1883} {"train_loss": -6.177750587463379, "global_step": 79098, "epoch": 1883} {"train_loss": -6.119518280029297, "global_step": 79099, "epoch": 1883} {"train_loss": -6.145455360412598, "global_step": 79100, "epoch": 1883} {"train_loss": -6.165736675262451, "global_step": 79101, "epoch": 1883} {"train_loss": -6.145217418670654, "global_step": 79102, "epoch": 1883} {"train_loss": -6.199431896209717, "global_step": 79103, "epoch": 1883} {"train_loss": -6.220863342285156, "global_step": 79104, "epoch": 1883} {"train_loss": -6.131293773651123, "global_step": 79105, "epoch": 1883} {"train_loss": -6.119117736816406, "global_step": 79106, "epoch": 1883} {"train_loss": -6.129095554351807, "global_step": 79107, "epoch": 1883} {"train_loss": -6.218274116516113, "global_step": 79108, "epoch": 1883} {"train_loss": -6.180315971374512, "global_step": 79109, "epoch": 1883} {"train_loss": -6.182010650634766, "global_step": 79110, "epoch": 1883} {"train_loss": -6.053664684295654, "global_step": 79111, "epoch": 1883} {"train_loss": -6.040611267089844, "global_step": 79112, "epoch": 1883} {"train_loss": -6.087216854095459, "global_step": 79113, "epoch": 1883} {"train_loss": -6.0634660720825195, "global_step": 79114, "epoch": 1883} {"train_loss": -6.131331443786621, "global_step": 79115, "epoch": 1883} {"train_loss": -6.120375633239746, "global_step": 79116, "epoch": 1883} {"train_loss": -6.07262659072876, "global_step": 79117, "epoch": 1883} {"train_loss": -6.1165056228637695, "global_step": 79118, "epoch": 1883} {"train_loss": -6.039281845092773, "global_step": 79119, "epoch": 1883} {"train_loss": -6.064122200012207, "global_step": 79120, "epoch": 1883} {"train_loss": -6.025564193725586, "global_step": 79121, "epoch": 1883} {"train_loss": -6.209763526916504, "global_step": 79122, "epoch": 1883} {"train_loss": -6.16611385345459, "global_step": 79123, "epoch": 1883} {"train_loss": -6.038583755493164, "global_step": 79124, "epoch": 1883} {"train_loss": -6.097840309143066, "global_step": 79125, "epoch": 1883} {"train_loss": -6.200833320617676, "global_step": 79126, "epoch": 1883} {"train_loss": -6.106486672446842, "global_step": 79127, "epoch": 1883, "val_loss": 74751.1015625} {"train_loss": -6.107368469238281, "global_step": 79128, "epoch": 1884} {"train_loss": -6.1662797927856445, "global_step": 79129, "epoch": 1884} {"train_loss": -6.0934929847717285, "global_step": 79130, "epoch": 1884} {"train_loss": -6.200271129608154, "global_step": 79131, "epoch": 1884} {"train_loss": -6.173570156097412, "global_step": 79132, "epoch": 1884} {"train_loss": -6.045101165771484, "global_step": 79133, "epoch": 1884} {"train_loss": -6.124022960662842, "global_step": 79134, "epoch": 1884} {"train_loss": -6.055839538574219, "global_step": 79135, "epoch": 1884} {"train_loss": -6.11710786819458, "global_step": 79136, "epoch": 1884} {"train_loss": -6.1689348220825195, "global_step": 79137, "epoch": 1884} {"train_loss": -6.1843390464782715, "global_step": 79138, "epoch": 1884} {"train_loss": -6.137329578399658, "global_step": 79139, "epoch": 1884} {"train_loss": -6.109566688537598, "global_step": 79140, "epoch": 1884} {"train_loss": -6.23298454284668, "global_step": 79141, "epoch": 1884} {"train_loss": -6.201948165893555, "global_step": 79142, "epoch": 1884} {"train_loss": -6.135422706604004, "global_step": 79143, "epoch": 1884} {"train_loss": -6.08236837387085, "global_step": 79144, "epoch": 1884} {"train_loss": -6.116593837738037, "global_step": 79145, "epoch": 1884} {"train_loss": -6.140984535217285, "global_step": 79146, "epoch": 1884} {"train_loss": -6.192476272583008, "global_step": 79147, "epoch": 1884} {"train_loss": -6.06477165222168, "global_step": 79148, "epoch": 1884} {"train_loss": -6.082921981811523, "global_step": 79149, "epoch": 1884} {"train_loss": -6.171494483947754, "global_step": 79150, "epoch": 1884} {"train_loss": -6.236146450042725, "global_step": 79151, "epoch": 1884} {"train_loss": -6.156163215637207, "global_step": 79152, "epoch": 1884} {"train_loss": -6.165701866149902, "global_step": 79153, "epoch": 1884} {"train_loss": -6.160861968994141, "global_step": 79154, "epoch": 1884} {"train_loss": -6.141814231872559, "global_step": 79155, "epoch": 1884} {"train_loss": -6.105589866638184, "global_step": 79156, "epoch": 1884} {"train_loss": -6.171904563903809, "global_step": 79157, "epoch": 1884} {"train_loss": -6.019073486328125, "global_step": 79158, "epoch": 1884} {"train_loss": -6.123934745788574, "global_step": 79159, "epoch": 1884} {"train_loss": -6.044830322265625, "global_step": 79160, "epoch": 1884} {"train_loss": -6.125637531280518, "global_step": 79161, "epoch": 1884} {"train_loss": -6.335776329040527, "global_step": 79162, "epoch": 1884} {"train_loss": -6.06799840927124, "global_step": 79163, "epoch": 1884} {"train_loss": -6.159327507019043, "global_step": 79164, "epoch": 1884} {"train_loss": -6.1261701583862305, "global_step": 79165, "epoch": 1884} {"train_loss": -6.1252946853637695, "global_step": 79166, "epoch": 1884} {"train_loss": -6.253793716430664, "global_step": 79167, "epoch": 1884} {"train_loss": -6.056617736816406, "global_step": 79168, "epoch": 1884} {"train_loss": -6.136948290325346, "global_step": 79169, "epoch": 1884, "val_loss": 74893.28125} {"train_loss": -6.119889259338379, "global_step": 79170, "epoch": 1885} {"train_loss": -6.0458269119262695, "global_step": 79171, "epoch": 1885} {"train_loss": -6.28459358215332, "global_step": 79172, "epoch": 1885} {"train_loss": -6.21923303604126, "global_step": 79173, "epoch": 1885} {"train_loss": -6.142889976501465, "global_step": 79174, "epoch": 1885} {"train_loss": -6.280613899230957, "global_step": 79175, "epoch": 1885} {"train_loss": -6.1756062507629395, "global_step": 79176, "epoch": 1885} {"train_loss": -5.97898006439209, "global_step": 79177, "epoch": 1885} {"train_loss": -6.161298751831055, "global_step": 79178, "epoch": 1885} {"train_loss": -6.118903160095215, "global_step": 79179, "epoch": 1885} {"train_loss": -6.1542158126831055, "global_step": 79180, "epoch": 1885} {"train_loss": -6.102156639099121, "global_step": 79181, "epoch": 1885} {"train_loss": -6.109686851501465, "global_step": 79182, "epoch": 1885} {"train_loss": -6.191630840301514, "global_step": 79183, "epoch": 1885} {"train_loss": -6.077537536621094, "global_step": 79184, "epoch": 1885} {"train_loss": -6.094115257263184, "global_step": 79185, "epoch": 1885} {"train_loss": -5.989821910858154, "global_step": 79186, "epoch": 1885} {"train_loss": -6.037053108215332, "global_step": 79187, "epoch": 1885} {"train_loss": -6.102077007293701, "global_step": 79188, "epoch": 1885} {"train_loss": -6.146254539489746, "global_step": 79189, "epoch": 1885} {"train_loss": -6.184133052825928, "global_step": 79190, "epoch": 1885} {"train_loss": -6.1149797439575195, "global_step": 79191, "epoch": 1885} {"train_loss": -6.182050704956055, "global_step": 79192, "epoch": 1885} {"train_loss": -6.046386241912842, "global_step": 79193, "epoch": 1885} {"train_loss": -6.05219841003418, "global_step": 79194, "epoch": 1885} {"train_loss": -6.145792007446289, "global_step": 79195, "epoch": 1885} {"train_loss": -6.2345757484436035, "global_step": 79196, "epoch": 1885} {"train_loss": -6.2073469161987305, "global_step": 79197, "epoch": 1885} {"train_loss": -6.149158954620361, "global_step": 79198, "epoch": 1885} {"train_loss": -6.262213706970215, "global_step": 79199, "epoch": 1885} {"train_loss": -6.137618064880371, "global_step": 79200, "epoch": 1885} {"train_loss": -6.179351806640625, "global_step": 79201, "epoch": 1885} {"train_loss": -6.070224761962891, "global_step": 79202, "epoch": 1885} {"train_loss": -6.1096882820129395, "global_step": 79203, "epoch": 1885} {"train_loss": -6.035118103027344, "global_step": 79204, "epoch": 1885} {"train_loss": -6.132143497467041, "global_step": 79205, "epoch": 1885} {"train_loss": -6.154374122619629, "global_step": 79206, "epoch": 1885} {"train_loss": -6.2130537033081055, "global_step": 79207, "epoch": 1885} {"train_loss": -6.077923774719238, "global_step": 79208, "epoch": 1885} {"train_loss": -6.048421859741211, "global_step": 79209, "epoch": 1885} {"train_loss": -6.044764995574951, "global_step": 79210, "epoch": 1885} {"train_loss": -6.129124016988845, "global_step": 79211, "epoch": 1885, "val_loss": 75593.078125} {"train_loss": -5.957664489746094, "global_step": 79212, "epoch": 1886} {"train_loss": -6.124284744262695, "global_step": 79213, "epoch": 1886} {"train_loss": -6.172616958618164, "global_step": 79214, "epoch": 1886} {"train_loss": -6.010825157165527, "global_step": 79215, "epoch": 1886} {"train_loss": -6.218102931976318, "global_step": 79216, "epoch": 1886} {"train_loss": -6.00545597076416, "global_step": 79217, "epoch": 1886} {"train_loss": -6.0280985832214355, "global_step": 79218, "epoch": 1886} {"train_loss": -6.126194953918457, "global_step": 79219, "epoch": 1886} {"train_loss": -6.0411577224731445, "global_step": 79220, "epoch": 1886} {"train_loss": -5.897873401641846, "global_step": 79221, "epoch": 1886} {"train_loss": -6.087141990661621, "global_step": 79222, "epoch": 1886} {"train_loss": -6.0321173667907715, "global_step": 79223, "epoch": 1886} {"train_loss": -6.100541591644287, "global_step": 79224, "epoch": 1886} {"train_loss": -6.071471691131592, "global_step": 79225, "epoch": 1886} {"train_loss": -6.207919120788574, "global_step": 79226, "epoch": 1886} {"train_loss": -6.1559929847717285, "global_step": 79227, "epoch": 1886} {"train_loss": -6.112480163574219, "global_step": 79228, "epoch": 1886} {"train_loss": -6.103087425231934, "global_step": 79229, "epoch": 1886} {"train_loss": -6.179423809051514, "global_step": 79230, "epoch": 1886} {"train_loss": -6.105995178222656, "global_step": 79231, "epoch": 1886} {"train_loss": -6.162266254425049, "global_step": 79232, "epoch": 1886} {"train_loss": -6.123542785644531, "global_step": 79233, "epoch": 1886} {"train_loss": -5.9956254959106445, "global_step": 79234, "epoch": 1886} {"train_loss": -6.043034553527832, "global_step": 79235, "epoch": 1886} {"train_loss": -6.207377910614014, "global_step": 79236, "epoch": 1886} {"train_loss": -6.0954132080078125, "global_step": 79237, "epoch": 1886} {"train_loss": -6.111106872558594, "global_step": 79238, "epoch": 1886} {"train_loss": -6.125832557678223, "global_step": 79239, "epoch": 1886} {"train_loss": -6.1667890548706055, "global_step": 79240, "epoch": 1886} {"train_loss": -6.118398189544678, "global_step": 79241, "epoch": 1886} {"train_loss": -6.209948539733887, "global_step": 79242, "epoch": 1886} {"train_loss": -6.061833381652832, "global_step": 79243, "epoch": 1886} {"train_loss": -6.117086887359619, "global_step": 79244, "epoch": 1886} {"train_loss": -6.035167694091797, "global_step": 79245, "epoch": 1886} {"train_loss": -5.991166114807129, "global_step": 79246, "epoch": 1886} {"train_loss": -6.082085609436035, "global_step": 79247, "epoch": 1886} {"train_loss": -6.09332275390625, "global_step": 79248, "epoch": 1886} {"train_loss": -6.079379081726074, "global_step": 79249, "epoch": 1886} {"train_loss": -6.124454021453857, "global_step": 79250, "epoch": 1886} {"train_loss": -6.080019474029541, "global_step": 79251, "epoch": 1886} {"train_loss": -6.123676300048828, "global_step": 79252, "epoch": 1886} {"train_loss": -6.096232505071731, "global_step": 79253, "epoch": 1886, "val_loss": 74681.8046875} {"train_loss": -6.261534214019775, "global_step": 79254, "epoch": 1887} {"train_loss": -6.075810432434082, "global_step": 79255, "epoch": 1887} {"train_loss": -6.17464542388916, "global_step": 79256, "epoch": 1887} {"train_loss": -6.174246311187744, "global_step": 79257, "epoch": 1887} {"train_loss": -6.164684772491455, "global_step": 79258, "epoch": 1887} {"train_loss": -6.159944534301758, "global_step": 79259, "epoch": 1887} {"train_loss": -6.16632080078125, "global_step": 79260, "epoch": 1887} {"train_loss": -6.099542140960693, "global_step": 79261, "epoch": 1887} {"train_loss": -6.142858028411865, "global_step": 79262, "epoch": 1887} {"train_loss": -6.146213531494141, "global_step": 79263, "epoch": 1887} {"train_loss": -6.04561710357666, "global_step": 79264, "epoch": 1887} {"train_loss": -6.082241058349609, "global_step": 79265, "epoch": 1887} {"train_loss": -5.994755268096924, "global_step": 79266, "epoch": 1887} {"train_loss": -6.141387939453125, "global_step": 79267, "epoch": 1887} {"train_loss": -6.172656536102295, "global_step": 79268, "epoch": 1887} {"train_loss": -6.1096625328063965, "global_step": 79269, "epoch": 1887} {"train_loss": -6.179969787597656, "global_step": 79270, "epoch": 1887} {"train_loss": -6.148290634155273, "global_step": 79271, "epoch": 1887} {"train_loss": -6.19575309753418, "global_step": 79272, "epoch": 1887} {"train_loss": -6.245285987854004, "global_step": 79273, "epoch": 1887} {"train_loss": -6.060065269470215, "global_step": 79274, "epoch": 1887} {"train_loss": -6.237567901611328, "global_step": 79275, "epoch": 1887} {"train_loss": -6.123989105224609, "global_step": 79276, "epoch": 1887} {"train_loss": -5.993614196777344, "global_step": 79277, "epoch": 1887} {"train_loss": -6.041272163391113, "global_step": 79278, "epoch": 1887} {"train_loss": -5.947025299072266, "global_step": 79279, "epoch": 1887} {"train_loss": -6.131308555603027, "global_step": 79280, "epoch": 1887} {"train_loss": -6.072007179260254, "global_step": 79281, "epoch": 1887} {"train_loss": -5.913125991821289, "global_step": 79282, "epoch": 1887} {"train_loss": -6.104788780212402, "global_step": 79283, "epoch": 1887} {"train_loss": -6.113239288330078, "global_step": 79284, "epoch": 1887} {"train_loss": -5.98936653137207, "global_step": 79285, "epoch": 1887} {"train_loss": -6.118076324462891, "global_step": 79286, "epoch": 1887} {"train_loss": -6.184657096862793, "global_step": 79287, "epoch": 1887} {"train_loss": -6.162755012512207, "global_step": 79288, "epoch": 1887} {"train_loss": -5.944143295288086, "global_step": 79289, "epoch": 1887} {"train_loss": -6.1814470291137695, "global_step": 79290, "epoch": 1887} {"train_loss": -6.088837146759033, "global_step": 79291, "epoch": 1887} {"train_loss": -6.050820827484131, "global_step": 79292, "epoch": 1887} {"train_loss": -6.089024066925049, "global_step": 79293, "epoch": 1887} {"train_loss": -6.079721450805664, "global_step": 79294, "epoch": 1887} {"train_loss": -6.108592510223389, "global_step": 79295, "epoch": 1887, "val_loss": 75203.78125} {"train_loss": -6.105809211730957, "global_step": 79296, "epoch": 1888} {"train_loss": -6.086538314819336, "global_step": 79297, "epoch": 1888} {"train_loss": -6.13068962097168, "global_step": 79298, "epoch": 1888} {"train_loss": -6.0621161460876465, "global_step": 79299, "epoch": 1888} {"train_loss": -6.115879058837891, "global_step": 79300, "epoch": 1888} {"train_loss": -6.104294776916504, "global_step": 79301, "epoch": 1888} {"train_loss": -6.062142848968506, "global_step": 79302, "epoch": 1888} {"train_loss": -6.136220932006836, "global_step": 79303, "epoch": 1888} {"train_loss": -6.167820930480957, "global_step": 79304, "epoch": 1888} {"train_loss": -6.1566877365112305, "global_step": 79305, "epoch": 1888} {"train_loss": -6.129870891571045, "global_step": 79306, "epoch": 1888} {"train_loss": -6.145847320556641, "global_step": 79307, "epoch": 1888} {"train_loss": -6.217629432678223, "global_step": 79308, "epoch": 1888} {"train_loss": -6.163840293884277, "global_step": 79309, "epoch": 1888} {"train_loss": -6.173134803771973, "global_step": 79310, "epoch": 1888} {"train_loss": -6.2285003662109375, "global_step": 79311, "epoch": 1888} {"train_loss": -6.104750633239746, "global_step": 79312, "epoch": 1888} {"train_loss": -6.063541412353516, "global_step": 79313, "epoch": 1888} {"train_loss": -6.248834609985352, "global_step": 79314, "epoch": 1888} {"train_loss": -6.147507667541504, "global_step": 79315, "epoch": 1888} {"train_loss": -6.111428737640381, "global_step": 79316, "epoch": 1888} {"train_loss": -6.11956787109375, "global_step": 79317, "epoch": 1888} {"train_loss": -6.221688270568848, "global_step": 79318, "epoch": 1888} {"train_loss": -6.280591011047363, "global_step": 79319, "epoch": 1888} {"train_loss": -6.092724800109863, "global_step": 79320, "epoch": 1888} {"train_loss": -6.026639938354492, "global_step": 79321, "epoch": 1888} {"train_loss": -6.162810325622559, "global_step": 79322, "epoch": 1888} {"train_loss": -6.094219207763672, "global_step": 79323, "epoch": 1888} {"train_loss": -6.106541633605957, "global_step": 79324, "epoch": 1888} {"train_loss": -6.185606002807617, "global_step": 79325, "epoch": 1888} {"train_loss": -6.164068222045898, "global_step": 79326, "epoch": 1888} {"train_loss": -6.259397506713867, "global_step": 79327, "epoch": 1888} {"train_loss": -6.110353946685791, "global_step": 79328, "epoch": 1888} {"train_loss": -5.920310020446777, "global_step": 79329, "epoch": 1888} {"train_loss": -6.083835124969482, "global_step": 79330, "epoch": 1888} {"train_loss": -6.187443733215332, "global_step": 79331, "epoch": 1888} {"train_loss": -6.067692756652832, "global_step": 79332, "epoch": 1888} {"train_loss": -6.172102928161621, "global_step": 79333, "epoch": 1888} {"train_loss": -6.0947265625, "global_step": 79334, "epoch": 1888} {"train_loss": -6.199031829833984, "global_step": 79335, "epoch": 1888} {"train_loss": -6.113219738006592, "global_step": 79336, "epoch": 1888} {"train_loss": -6.136057796932402, "global_step": 79337, "epoch": 1888, "val_loss": 74937.1875} {"train_loss": -6.2034807205200195, "global_step": 79338, "epoch": 1889} {"train_loss": -6.143241882324219, "global_step": 79339, "epoch": 1889} {"train_loss": -6.1466827392578125, "global_step": 79340, "epoch": 1889} {"train_loss": -6.185232639312744, "global_step": 79341, "epoch": 1889} {"train_loss": -6.092632293701172, "global_step": 79342, "epoch": 1889} {"train_loss": -6.278294563293457, "global_step": 79343, "epoch": 1889} {"train_loss": -6.173426151275635, "global_step": 79344, "epoch": 1889} {"train_loss": -6.157754898071289, "global_step": 79345, "epoch": 1889} {"train_loss": -6.220851421356201, "global_step": 79346, "epoch": 1889} {"train_loss": -6.20200777053833, "global_step": 79347, "epoch": 1889} {"train_loss": -6.276803493499756, "global_step": 79348, "epoch": 1889} {"train_loss": -6.182487487792969, "global_step": 79349, "epoch": 1889} {"train_loss": -6.237628936767578, "global_step": 79350, "epoch": 1889} {"train_loss": -6.166032791137695, "global_step": 79351, "epoch": 1889} {"train_loss": -5.963445663452148, "global_step": 79352, "epoch": 1889} {"train_loss": -6.139739036560059, "global_step": 79353, "epoch": 1889} {"train_loss": -6.101997375488281, "global_step": 79354, "epoch": 1889} {"train_loss": -6.120321273803711, "global_step": 79355, "epoch": 1889} {"train_loss": -6.053279399871826, "global_step": 79356, "epoch": 1889} {"train_loss": -6.134942054748535, "global_step": 79357, "epoch": 1889} {"train_loss": -5.996292591094971, "global_step": 79358, "epoch": 1889} {"train_loss": -6.216907978057861, "global_step": 79359, "epoch": 1889} {"train_loss": -6.088784217834473, "global_step": 79360, "epoch": 1889} {"train_loss": -6.161406517028809, "global_step": 79361, "epoch": 1889} {"train_loss": -6.192559242248535, "global_step": 79362, "epoch": 1889} {"train_loss": -6.06235408782959, "global_step": 79363, "epoch": 1889} {"train_loss": -6.182573318481445, "global_step": 79364, "epoch": 1889} {"train_loss": -6.091041564941406, "global_step": 79365, "epoch": 1889} {"train_loss": -6.006527900695801, "global_step": 79366, "epoch": 1889} {"train_loss": -6.147494316101074, "global_step": 79367, "epoch": 1889} {"train_loss": -6.1042633056640625, "global_step": 79368, "epoch": 1889} {"train_loss": -6.020169258117676, "global_step": 79369, "epoch": 1889} {"train_loss": -5.971673965454102, "global_step": 79370, "epoch": 1889} {"train_loss": -6.119413375854492, "global_step": 79371, "epoch": 1889} {"train_loss": -6.130377292633057, "global_step": 79372, "epoch": 1889} {"train_loss": -6.068770408630371, "global_step": 79373, "epoch": 1889} {"train_loss": -5.976205825805664, "global_step": 79374, "epoch": 1889} {"train_loss": -6.205305576324463, "global_step": 79375, "epoch": 1889} {"train_loss": -6.1855292320251465, "global_step": 79376, "epoch": 1889} {"train_loss": -6.110008716583252, "global_step": 79377, "epoch": 1889} {"train_loss": -6.1775007247924805, "global_step": 79378, "epoch": 1889} {"train_loss": -6.130163521993728, "global_step": 79379, "epoch": 1889, "val_loss": 74986.9375} {"train_loss": -6.1344451904296875, "global_step": 79380, "epoch": 1890} {"train_loss": -6.125555038452148, "global_step": 79381, "epoch": 1890} {"train_loss": -6.180017471313477, "global_step": 79382, "epoch": 1890} {"train_loss": -6.169022083282471, "global_step": 79383, "epoch": 1890} {"train_loss": -6.039634704589844, "global_step": 79384, "epoch": 1890} {"train_loss": -6.140280246734619, "global_step": 79385, "epoch": 1890} {"train_loss": -6.091997146606445, "global_step": 79386, "epoch": 1890} {"train_loss": -6.2464823722839355, "global_step": 79387, "epoch": 1890} {"train_loss": -6.072820663452148, "global_step": 79388, "epoch": 1890} {"train_loss": -6.120241641998291, "global_step": 79389, "epoch": 1890} {"train_loss": -6.016643524169922, "global_step": 79390, "epoch": 1890} {"train_loss": -6.008975028991699, "global_step": 79391, "epoch": 1890} {"train_loss": -6.2467427253723145, "global_step": 79392, "epoch": 1890} {"train_loss": -5.946999549865723, "global_step": 79393, "epoch": 1890} {"train_loss": -6.161343574523926, "global_step": 79394, "epoch": 1890} {"train_loss": -6.090712547302246, "global_step": 79395, "epoch": 1890} {"train_loss": -6.130576133728027, "global_step": 79396, "epoch": 1890} {"train_loss": -6.190303802490234, "global_step": 79397, "epoch": 1890} {"train_loss": -6.162836074829102, "global_step": 79398, "epoch": 1890} {"train_loss": -6.155550956726074, "global_step": 79399, "epoch": 1890} {"train_loss": -6.23858642578125, "global_step": 79400, "epoch": 1890} {"train_loss": -6.131763458251953, "global_step": 79401, "epoch": 1890} {"train_loss": -6.015763282775879, "global_step": 79402, "epoch": 1890} {"train_loss": -6.12753963470459, "global_step": 79403, "epoch": 1890} {"train_loss": -6.145981788635254, "global_step": 79404, "epoch": 1890} {"train_loss": -6.157271862030029, "global_step": 79405, "epoch": 1890} {"train_loss": -6.145261764526367, "global_step": 79406, "epoch": 1890} {"train_loss": -6.0740556716918945, "global_step": 79407, "epoch": 1890} {"train_loss": -6.1030073165893555, "global_step": 79408, "epoch": 1890} {"train_loss": -5.950479507446289, "global_step": 79409, "epoch": 1890} {"train_loss": -6.083212852478027, "global_step": 79410, "epoch": 1890} {"train_loss": -6.001867294311523, "global_step": 79411, "epoch": 1890} {"train_loss": -6.044073104858398, "global_step": 79412, "epoch": 1890} {"train_loss": -5.9638800621032715, "global_step": 79413, "epoch": 1890} {"train_loss": -5.9547834396362305, "global_step": 79414, "epoch": 1890} {"train_loss": -5.993104934692383, "global_step": 79415, "epoch": 1890} {"train_loss": -6.152317523956299, "global_step": 79416, "epoch": 1890} {"train_loss": -6.089541435241699, "global_step": 79417, "epoch": 1890} {"train_loss": -6.033806800842285, "global_step": 79418, "epoch": 1890} {"train_loss": -6.264659881591797, "global_step": 79419, "epoch": 1890} {"train_loss": -6.101654529571533, "global_step": 79420, "epoch": 1890} {"train_loss": -6.102524223781767, "global_step": 79421, "epoch": 1890, "val_loss": 75283.921875} {"train_loss": -6.085297107696533, "global_step": 79422, "epoch": 1891} {"train_loss": -6.08236026763916, "global_step": 79423, "epoch": 1891} {"train_loss": -6.039896011352539, "global_step": 79424, "epoch": 1891} {"train_loss": -6.10194206237793, "global_step": 79425, "epoch": 1891} {"train_loss": -6.0612993240356445, "global_step": 79426, "epoch": 1891} {"train_loss": -6.0992279052734375, "global_step": 79427, "epoch": 1891} {"train_loss": -6.19331169128418, "global_step": 79428, "epoch": 1891} {"train_loss": -6.078970909118652, "global_step": 79429, "epoch": 1891} {"train_loss": -6.178299903869629, "global_step": 79430, "epoch": 1891} {"train_loss": -6.161690711975098, "global_step": 79431, "epoch": 1891} {"train_loss": -6.11088752746582, "global_step": 79432, "epoch": 1891} {"train_loss": -6.038984298706055, "global_step": 79433, "epoch": 1891} {"train_loss": -6.195169448852539, "global_step": 79434, "epoch": 1891} {"train_loss": -6.23539400100708, "global_step": 79435, "epoch": 1891} {"train_loss": -6.141341686248779, "global_step": 79436, "epoch": 1891} {"train_loss": -6.1562700271606445, "global_step": 79437, "epoch": 1891} {"train_loss": -6.185678958892822, "global_step": 79438, "epoch": 1891} {"train_loss": -6.124458312988281, "global_step": 79439, "epoch": 1891} {"train_loss": -6.1851019859313965, "global_step": 79440, "epoch": 1891} {"train_loss": -6.137903213500977, "global_step": 79441, "epoch": 1891} {"train_loss": -5.987494468688965, "global_step": 79442, "epoch": 1891} {"train_loss": -6.102836608886719, "global_step": 79443, "epoch": 1891} {"train_loss": -6.219823837280273, "global_step": 79444, "epoch": 1891} {"train_loss": -6.265352249145508, "global_step": 79445, "epoch": 1891} {"train_loss": -6.075328826904297, "global_step": 79446, "epoch": 1891} {"train_loss": -6.14068603515625, "global_step": 79447, "epoch": 1891} {"train_loss": -6.142297744750977, "global_step": 79448, "epoch": 1891} {"train_loss": -6.002498626708984, "global_step": 79449, "epoch": 1891} {"train_loss": -6.14422607421875, "global_step": 79450, "epoch": 1891} {"train_loss": -6.1379899978637695, "global_step": 79451, "epoch": 1891} {"train_loss": -6.127111434936523, "global_step": 79452, "epoch": 1891} {"train_loss": -6.151065826416016, "global_step": 79453, "epoch": 1891} {"train_loss": -6.133947849273682, "global_step": 79454, "epoch": 1891} {"train_loss": -6.122231483459473, "global_step": 79455, "epoch": 1891} {"train_loss": -6.1117448806762695, "global_step": 79456, "epoch": 1891} {"train_loss": -6.22462272644043, "global_step": 79457, "epoch": 1891} {"train_loss": -6.159821033477783, "global_step": 79458, "epoch": 1891} {"train_loss": -6.01666784286499, "global_step": 79459, "epoch": 1891} {"train_loss": -6.077919006347656, "global_step": 79460, "epoch": 1891} {"train_loss": -5.979644775390625, "global_step": 79461, "epoch": 1891} {"train_loss": -5.993280410766602, "global_step": 79462, "epoch": 1891} {"train_loss": -6.119334504717872, "global_step": 79463, "epoch": 1891, "val_loss": 74829.375} {"train_loss": -6.10011100769043, "global_step": 79464, "epoch": 1892} {"train_loss": -6.070693492889404, "global_step": 79465, "epoch": 1892} {"train_loss": -6.065708160400391, "global_step": 79466, "epoch": 1892} {"train_loss": -6.089221477508545, "global_step": 79467, "epoch": 1892} {"train_loss": -6.113913059234619, "global_step": 79468, "epoch": 1892} {"train_loss": -6.039724826812744, "global_step": 79469, "epoch": 1892} {"train_loss": -6.119629859924316, "global_step": 79470, "epoch": 1892} {"train_loss": -6.122224807739258, "global_step": 79471, "epoch": 1892} {"train_loss": -6.0417585372924805, "global_step": 79472, "epoch": 1892} {"train_loss": -6.2618303298950195, "global_step": 79473, "epoch": 1892} {"train_loss": -6.170995712280273, "global_step": 79474, "epoch": 1892} {"train_loss": -6.042807102203369, "global_step": 79475, "epoch": 1892} {"train_loss": -6.121533393859863, "global_step": 79476, "epoch": 1892} {"train_loss": -6.1014628410339355, "global_step": 79477, "epoch": 1892} {"train_loss": -6.053839206695557, "global_step": 79478, "epoch": 1892} {"train_loss": -6.0644025802612305, "global_step": 79479, "epoch": 1892} {"train_loss": -6.08350944519043, "global_step": 79480, "epoch": 1892} {"train_loss": -6.105206489562988, "global_step": 79481, "epoch": 1892} {"train_loss": -5.971492767333984, "global_step": 79482, "epoch": 1892} {"train_loss": -5.999168395996094, "global_step": 79483, "epoch": 1892} {"train_loss": -6.136446952819824, "global_step": 79484, "epoch": 1892} {"train_loss": -6.047046661376953, "global_step": 79485, "epoch": 1892} {"train_loss": -6.1641998291015625, "global_step": 79486, "epoch": 1892} {"train_loss": -6.0540452003479, "global_step": 79487, "epoch": 1892} {"train_loss": -6.105234146118164, "global_step": 79488, "epoch": 1892} {"train_loss": -6.248115539550781, "global_step": 79489, "epoch": 1892} {"train_loss": -6.154783248901367, "global_step": 79490, "epoch": 1892} {"train_loss": -6.115530967712402, "global_step": 79491, "epoch": 1892} {"train_loss": -6.217336177825928, "global_step": 79492, "epoch": 1892} {"train_loss": -6.124117374420166, "global_step": 79493, "epoch": 1892} {"train_loss": -6.240776062011719, "global_step": 79494, "epoch": 1892} {"train_loss": -6.146458625793457, "global_step": 79495, "epoch": 1892} {"train_loss": -6.115333557128906, "global_step": 79496, "epoch": 1892} {"train_loss": -6.213216781616211, "global_step": 79497, "epoch": 1892} {"train_loss": -6.186762809753418, "global_step": 79498, "epoch": 1892} {"train_loss": -6.116340637207031, "global_step": 79499, "epoch": 1892} {"train_loss": -6.110782623291016, "global_step": 79500, "epoch": 1892} {"train_loss": -6.103890419006348, "global_step": 79501, "epoch": 1892} {"train_loss": -6.215273380279541, "global_step": 79502, "epoch": 1892} {"train_loss": -6.147555351257324, "global_step": 79503, "epoch": 1892} {"train_loss": -6.143684387207031, "global_step": 79504, "epoch": 1892} {"train_loss": -6.118849084490821, "global_step": 79505, "epoch": 1892, "val_loss": 75144.7578125} {"train_loss": -6.190577507019043, "global_step": 79506, "epoch": 1893} {"train_loss": -6.135160446166992, "global_step": 79507, "epoch": 1893} {"train_loss": -6.156578063964844, "global_step": 79508, "epoch": 1893} {"train_loss": -6.289647579193115, "global_step": 79509, "epoch": 1893} {"train_loss": -6.07687520980835, "global_step": 79510, "epoch": 1893} {"train_loss": -6.227385520935059, "global_step": 79511, "epoch": 1893} {"train_loss": -6.071491241455078, "global_step": 79512, "epoch": 1893} {"train_loss": -6.21713399887085, "global_step": 79513, "epoch": 1893} {"train_loss": -6.083107948303223, "global_step": 79514, "epoch": 1893} {"train_loss": -6.263771057128906, "global_step": 79515, "epoch": 1893} {"train_loss": -6.141999244689941, "global_step": 79516, "epoch": 1893} {"train_loss": -6.132077693939209, "global_step": 79517, "epoch": 1893} {"train_loss": -6.01548957824707, "global_step": 79518, "epoch": 1893} {"train_loss": -6.1908488273620605, "global_step": 79519, "epoch": 1893} {"train_loss": -6.125396728515625, "global_step": 79520, "epoch": 1893} {"train_loss": -6.0912275314331055, "global_step": 79521, "epoch": 1893} {"train_loss": -6.020124435424805, "global_step": 79522, "epoch": 1893} {"train_loss": -6.138457298278809, "global_step": 79523, "epoch": 1893} {"train_loss": -6.025067329406738, "global_step": 79524, "epoch": 1893} {"train_loss": -6.18533992767334, "global_step": 79525, "epoch": 1893} {"train_loss": -6.017744064331055, "global_step": 79526, "epoch": 1893} {"train_loss": -6.05828857421875, "global_step": 79527, "epoch": 1893} {"train_loss": -6.093912124633789, "global_step": 79528, "epoch": 1893} {"train_loss": -6.141052722930908, "global_step": 79529, "epoch": 1893} {"train_loss": -6.149635314941406, "global_step": 79530, "epoch": 1893} {"train_loss": -6.0842413902282715, "global_step": 79531, "epoch": 1893} {"train_loss": -6.087238311767578, "global_step": 79532, "epoch": 1893} {"train_loss": -6.109198093414307, "global_step": 79533, "epoch": 1893} {"train_loss": -6.164012908935547, "global_step": 79534, "epoch": 1893} {"train_loss": -6.042086124420166, "global_step": 79535, "epoch": 1893} {"train_loss": -6.1991071701049805, "global_step": 79536, "epoch": 1893} {"train_loss": -6.092389106750488, "global_step": 79537, "epoch": 1893} {"train_loss": -6.220168590545654, "global_step": 79538, "epoch": 1893} {"train_loss": -6.115948677062988, "global_step": 79539, "epoch": 1893} {"train_loss": -6.06833028793335, "global_step": 79540, "epoch": 1893} {"train_loss": -6.279195785522461, "global_step": 79541, "epoch": 1893} {"train_loss": -6.061573028564453, "global_step": 79542, "epoch": 1893} {"train_loss": -6.040439128875732, "global_step": 79543, "epoch": 1893} {"train_loss": -5.9957966804504395, "global_step": 79544, "epoch": 1893} {"train_loss": -6.168783187866211, "global_step": 79545, "epoch": 1893} {"train_loss": -6.169081687927246, "global_step": 79546, "epoch": 1893} {"train_loss": -6.126340355191912, "global_step": 79547, "epoch": 1893, "val_loss": 74913.65625} {"train_loss": -6.114377975463867, "global_step": 79548, "epoch": 1894} {"train_loss": -6.143872261047363, "global_step": 79549, "epoch": 1894} {"train_loss": -6.081997871398926, "global_step": 79550, "epoch": 1894} {"train_loss": -6.222507476806641, "global_step": 79551, "epoch": 1894} {"train_loss": -6.1357316970825195, "global_step": 79552, "epoch": 1894} {"train_loss": -6.31204080581665, "global_step": 79553, "epoch": 1894} {"train_loss": -6.141012191772461, "global_step": 79554, "epoch": 1894} {"train_loss": -6.160200119018555, "global_step": 79555, "epoch": 1894} {"train_loss": -6.071767807006836, "global_step": 79556, "epoch": 1894} {"train_loss": -6.195883274078369, "global_step": 79557, "epoch": 1894} {"train_loss": -6.159891128540039, "global_step": 79558, "epoch": 1894} {"train_loss": -6.044010162353516, "global_step": 79559, "epoch": 1894} {"train_loss": -6.13871955871582, "global_step": 79560, "epoch": 1894} {"train_loss": -6.12446403503418, "global_step": 79561, "epoch": 1894} {"train_loss": -6.036418914794922, "global_step": 79562, "epoch": 1894} {"train_loss": -6.217262268066406, "global_step": 79563, "epoch": 1894} {"train_loss": -6.098505973815918, "global_step": 79564, "epoch": 1894} {"train_loss": -6.09738826751709, "global_step": 79565, "epoch": 1894} {"train_loss": -6.086625099182129, "global_step": 79566, "epoch": 1894} {"train_loss": -6.187720775604248, "global_step": 79567, "epoch": 1894} {"train_loss": -6.0584540367126465, "global_step": 79568, "epoch": 1894} {"train_loss": -6.067224502563477, "global_step": 79569, "epoch": 1894} {"train_loss": -6.111814975738525, "global_step": 79570, "epoch": 1894} {"train_loss": -6.089747428894043, "global_step": 79571, "epoch": 1894} {"train_loss": -6.162360191345215, "global_step": 79572, "epoch": 1894} {"train_loss": -5.968192100524902, "global_step": 79573, "epoch": 1894} {"train_loss": -6.178681373596191, "global_step": 79574, "epoch": 1894} {"train_loss": -5.977011680603027, "global_step": 79575, "epoch": 1894} {"train_loss": -6.075469017028809, "global_step": 79576, "epoch": 1894} {"train_loss": -6.120868682861328, "global_step": 79577, "epoch": 1894} {"train_loss": -6.0286407470703125, "global_step": 79578, "epoch": 1894} {"train_loss": -6.1056108474731445, "global_step": 79579, "epoch": 1894} {"train_loss": -6.014950275421143, "global_step": 79580, "epoch": 1894} {"train_loss": -6.086179256439209, "global_step": 79581, "epoch": 1894} {"train_loss": -6.154958724975586, "global_step": 79582, "epoch": 1894} {"train_loss": -6.134065628051758, "global_step": 79583, "epoch": 1894} {"train_loss": -6.171832084655762, "global_step": 79584, "epoch": 1894} {"train_loss": -6.029397010803223, "global_step": 79585, "epoch": 1894} {"train_loss": -6.122491836547852, "global_step": 79586, "epoch": 1894} {"train_loss": -6.190783500671387, "global_step": 79587, "epoch": 1894} {"train_loss": -6.090732574462891, "global_step": 79588, "epoch": 1894} {"train_loss": -6.115958611170451, "global_step": 79589, "epoch": 1894, "val_loss": 75087.375} {"train_loss": -5.96021842956543, "global_step": 79590, "epoch": 1895} {"train_loss": -6.097684383392334, "global_step": 79591, "epoch": 1895} {"train_loss": -6.210012435913086, "global_step": 79592, "epoch": 1895} {"train_loss": -6.093792915344238, "global_step": 79593, "epoch": 1895} {"train_loss": -6.132373809814453, "global_step": 79594, "epoch": 1895} {"train_loss": -6.036135673522949, "global_step": 79595, "epoch": 1895} {"train_loss": -6.1803364753723145, "global_step": 79596, "epoch": 1895} {"train_loss": -6.1880974769592285, "global_step": 79597, "epoch": 1895} {"train_loss": -6.131031036376953, "global_step": 79598, "epoch": 1895} {"train_loss": -6.17185640335083, "global_step": 79599, "epoch": 1895} {"train_loss": -6.181112289428711, "global_step": 79600, "epoch": 1895} {"train_loss": -6.0375657081604, "global_step": 79601, "epoch": 1895} {"train_loss": -6.196259498596191, "global_step": 79602, "epoch": 1895} {"train_loss": -6.077356815338135, "global_step": 79603, "epoch": 1895} {"train_loss": -6.05025577545166, "global_step": 79604, "epoch": 1895} {"train_loss": -6.157917499542236, "global_step": 79605, "epoch": 1895} {"train_loss": -6.0705060958862305, "global_step": 79606, "epoch": 1895} {"train_loss": -6.056096076965332, "global_step": 79607, "epoch": 1895} {"train_loss": -6.165853023529053, "global_step": 79608, "epoch": 1895} {"train_loss": -6.099481582641602, "global_step": 79609, "epoch": 1895} {"train_loss": -6.114702224731445, "global_step": 79610, "epoch": 1895} {"train_loss": -6.162105083465576, "global_step": 79611, "epoch": 1895} {"train_loss": -6.210928440093994, "global_step": 79612, "epoch": 1895} {"train_loss": -6.178864002227783, "global_step": 79613, "epoch": 1895} {"train_loss": -6.201164245605469, "global_step": 79614, "epoch": 1895} {"train_loss": -6.138813018798828, "global_step": 79615, "epoch": 1895} {"train_loss": -6.152092933654785, "global_step": 79616, "epoch": 1895} {"train_loss": -6.031222343444824, "global_step": 79617, "epoch": 1895} {"train_loss": -6.205892562866211, "global_step": 79618, "epoch": 1895} {"train_loss": -6.249967575073242, "global_step": 79619, "epoch": 1895} {"train_loss": -6.004088401794434, "global_step": 79620, "epoch": 1895} {"train_loss": -6.139401435852051, "global_step": 79621, "epoch": 1895} {"train_loss": -6.1745524406433105, "global_step": 79622, "epoch": 1895} {"train_loss": -6.217095375061035, "global_step": 79623, "epoch": 1895} {"train_loss": -6.112955093383789, "global_step": 79624, "epoch": 1895} {"train_loss": -6.031014442443848, "global_step": 79625, "epoch": 1895} {"train_loss": -6.2189412117004395, "global_step": 79626, "epoch": 1895} {"train_loss": -5.9588518142700195, "global_step": 79627, "epoch": 1895} {"train_loss": -6.070621490478516, "global_step": 79628, "epoch": 1895} {"train_loss": -6.070214748382568, "global_step": 79629, "epoch": 1895} {"train_loss": -6.017469882965088, "global_step": 79630, "epoch": 1895} {"train_loss": -6.122084515435355, "global_step": 79631, "epoch": 1895, "val_loss": 75391.7421875} {"train_loss": -5.96175479888916, "global_step": 79632, "epoch": 1896} {"train_loss": -6.105186462402344, "global_step": 79633, "epoch": 1896} {"train_loss": -6.115627288818359, "global_step": 79634, "epoch": 1896} {"train_loss": -6.136055946350098, "global_step": 79635, "epoch": 1896} {"train_loss": -6.11163330078125, "global_step": 79636, "epoch": 1896} {"train_loss": -6.101421356201172, "global_step": 79637, "epoch": 1896} {"train_loss": -6.0011162757873535, "global_step": 79638, "epoch": 1896} {"train_loss": -6.0463361740112305, "global_step": 79639, "epoch": 1896} {"train_loss": -6.115066051483154, "global_step": 79640, "epoch": 1896} {"train_loss": -6.11030387878418, "global_step": 79641, "epoch": 1896} {"train_loss": -6.202596664428711, "global_step": 79642, "epoch": 1896} {"train_loss": -6.1760406494140625, "global_step": 79643, "epoch": 1896} {"train_loss": -6.181196689605713, "global_step": 79644, "epoch": 1896} {"train_loss": -6.184193134307861, "global_step": 79645, "epoch": 1896} {"train_loss": -6.071386814117432, "global_step": 79646, "epoch": 1896} {"train_loss": -6.027955532073975, "global_step": 79647, "epoch": 1896} {"train_loss": -6.223966598510742, "global_step": 79648, "epoch": 1896} {"train_loss": -6.129091262817383, "global_step": 79649, "epoch": 1896} {"train_loss": -6.104269027709961, "global_step": 79650, "epoch": 1896} {"train_loss": -6.023426055908203, "global_step": 79651, "epoch": 1896} {"train_loss": -6.111286163330078, "global_step": 79652, "epoch": 1896} {"train_loss": -5.918711185455322, "global_step": 79653, "epoch": 1896} {"train_loss": -6.076314926147461, "global_step": 79654, "epoch": 1896} {"train_loss": -6.11129093170166, "global_step": 79655, "epoch": 1896} {"train_loss": -6.1817426681518555, "global_step": 79656, "epoch": 1896} {"train_loss": -6.1681694984436035, "global_step": 79657, "epoch": 1896} {"train_loss": -6.132619857788086, "global_step": 79658, "epoch": 1896} {"train_loss": -6.091853141784668, "global_step": 79659, "epoch": 1896} {"train_loss": -6.078350067138672, "global_step": 79660, "epoch": 1896} {"train_loss": -6.163703441619873, "global_step": 79661, "epoch": 1896} {"train_loss": -6.250219345092773, "global_step": 79662, "epoch": 1896} {"train_loss": -6.182405471801758, "global_step": 79663, "epoch": 1896} {"train_loss": -6.035009384155273, "global_step": 79664, "epoch": 1896} {"train_loss": -6.145747184753418, "global_step": 79665, "epoch": 1896} {"train_loss": -6.059947490692139, "global_step": 79666, "epoch": 1896} {"train_loss": -6.218044281005859, "global_step": 79667, "epoch": 1896} {"train_loss": -6.17266321182251, "global_step": 79668, "epoch": 1896} {"train_loss": -6.053234577178955, "global_step": 79669, "epoch": 1896} {"train_loss": -6.082326889038086, "global_step": 79670, "epoch": 1896} {"train_loss": -6.200863838195801, "global_step": 79671, "epoch": 1896} {"train_loss": -6.130349159240723, "global_step": 79672, "epoch": 1896} {"train_loss": -6.114122197741554, "global_step": 79673, "epoch": 1896, "val_loss": 75241.7421875} {"train_loss": -6.139707565307617, "global_step": 79674, "epoch": 1897} {"train_loss": -6.061805725097656, "global_step": 79675, "epoch": 1897} {"train_loss": -6.05718469619751, "global_step": 79676, "epoch": 1897} {"train_loss": -5.972520351409912, "global_step": 79677, "epoch": 1897} {"train_loss": -6.230925559997559, "global_step": 79678, "epoch": 1897} {"train_loss": -5.957497596740723, "global_step": 79679, "epoch": 1897} {"train_loss": -6.1027021408081055, "global_step": 79680, "epoch": 1897} {"train_loss": -6.173436164855957, "global_step": 79681, "epoch": 1897} {"train_loss": -5.967693328857422, "global_step": 79682, "epoch": 1897} {"train_loss": -6.272834300994873, "global_step": 79683, "epoch": 1897} {"train_loss": -6.174430847167969, "global_step": 79684, "epoch": 1897} {"train_loss": -6.076805591583252, "global_step": 79685, "epoch": 1897} {"train_loss": -6.168977737426758, "global_step": 79686, "epoch": 1897} {"train_loss": -6.101410865783691, "global_step": 79687, "epoch": 1897} {"train_loss": -6.121129989624023, "global_step": 79688, "epoch": 1897} {"train_loss": -6.308762073516846, "global_step": 79689, "epoch": 1897} {"train_loss": -6.049812316894531, "global_step": 79690, "epoch": 1897} {"train_loss": -6.131063461303711, "global_step": 79691, "epoch": 1897} {"train_loss": -6.226408958435059, "global_step": 79692, "epoch": 1897} {"train_loss": -6.0849809646606445, "global_step": 79693, "epoch": 1897} {"train_loss": -6.215816020965576, "global_step": 79694, "epoch": 1897} {"train_loss": -6.188377380371094, "global_step": 79695, "epoch": 1897} {"train_loss": -6.13783597946167, "global_step": 79696, "epoch": 1897} {"train_loss": -6.145965576171875, "global_step": 79697, "epoch": 1897} {"train_loss": -6.166584014892578, "global_step": 79698, "epoch": 1897} {"train_loss": -6.121151924133301, "global_step": 79699, "epoch": 1897} {"train_loss": -6.142014503479004, "global_step": 79700, "epoch": 1897} {"train_loss": -6.048102378845215, "global_step": 79701, "epoch": 1897} {"train_loss": -6.178515911102295, "global_step": 79702, "epoch": 1897} {"train_loss": -6.228137016296387, "global_step": 79703, "epoch": 1897} {"train_loss": -6.202077388763428, "global_step": 79704, "epoch": 1897} {"train_loss": -6.149740219116211, "global_step": 79705, "epoch": 1897} {"train_loss": -6.027339458465576, "global_step": 79706, "epoch": 1897} {"train_loss": -6.202714920043945, "global_step": 79707, "epoch": 1897} {"train_loss": -6.086177349090576, "global_step": 79708, "epoch": 1897} {"train_loss": -6.166640281677246, "global_step": 79709, "epoch": 1897} {"train_loss": -6.197583198547363, "global_step": 79710, "epoch": 1897} {"train_loss": -6.130091667175293, "global_step": 79711, "epoch": 1897} {"train_loss": -6.098091125488281, "global_step": 79712, "epoch": 1897} {"train_loss": -6.053926467895508, "global_step": 79713, "epoch": 1897} {"train_loss": -6.161227226257324, "global_step": 79714, "epoch": 1897} {"train_loss": -6.13305003302438, "global_step": 79715, "epoch": 1897, "val_loss": 74819.4296875} {"train_loss": -6.219324111938477, "global_step": 79716, "epoch": 1898} {"train_loss": -6.130460739135742, "global_step": 79717, "epoch": 1898} {"train_loss": -6.065703392028809, "global_step": 79718, "epoch": 1898} {"train_loss": -6.040065288543701, "global_step": 79719, "epoch": 1898} {"train_loss": -6.073502540588379, "global_step": 79720, "epoch": 1898} {"train_loss": -6.0842437744140625, "global_step": 79721, "epoch": 1898} {"train_loss": -6.091936111450195, "global_step": 79722, "epoch": 1898} {"train_loss": -6.164812088012695, "global_step": 79723, "epoch": 1898} {"train_loss": -6.119049072265625, "global_step": 79724, "epoch": 1898} {"train_loss": -6.2461748123168945, "global_step": 79725, "epoch": 1898} {"train_loss": -6.155518531799316, "global_step": 79726, "epoch": 1898} {"train_loss": -6.087324142456055, "global_step": 79727, "epoch": 1898} {"train_loss": -6.141621112823486, "global_step": 79728, "epoch": 1898} {"train_loss": -6.189508438110352, "global_step": 79729, "epoch": 1898} {"train_loss": -6.102214813232422, "global_step": 79730, "epoch": 1898} {"train_loss": -6.1405029296875, "global_step": 79731, "epoch": 1898} {"train_loss": -6.02925968170166, "global_step": 79732, "epoch": 1898} {"train_loss": -6.160582542419434, "global_step": 79733, "epoch": 1898} {"train_loss": -6.076180458068848, "global_step": 79734, "epoch": 1898} {"train_loss": -6.172122955322266, "global_step": 79735, "epoch": 1898} {"train_loss": -6.181035041809082, "global_step": 79736, "epoch": 1898} {"train_loss": -6.310389518737793, "global_step": 79737, "epoch": 1898} {"train_loss": -6.009490966796875, "global_step": 79738, "epoch": 1898} {"train_loss": -6.1834259033203125, "global_step": 79739, "epoch": 1898} {"train_loss": -6.102141380310059, "global_step": 79740, "epoch": 1898} {"train_loss": -6.013741493225098, "global_step": 79741, "epoch": 1898} {"train_loss": -5.985440254211426, "global_step": 79742, "epoch": 1898} {"train_loss": -6.094621658325195, "global_step": 79743, "epoch": 1898} {"train_loss": -6.0792741775512695, "global_step": 79744, "epoch": 1898} {"train_loss": -6.1047539710998535, "global_step": 79745, "epoch": 1898} {"train_loss": -6.108574390411377, "global_step": 79746, "epoch": 1898} {"train_loss": -5.989328384399414, "global_step": 79747, "epoch": 1898} {"train_loss": -5.961784362792969, "global_step": 79748, "epoch": 1898} {"train_loss": -6.2472686767578125, "global_step": 79749, "epoch": 1898} {"train_loss": -6.190425872802734, "global_step": 79750, "epoch": 1898} {"train_loss": -6.13676118850708, "global_step": 79751, "epoch": 1898} {"train_loss": -6.091740131378174, "global_step": 79752, "epoch": 1898} {"train_loss": -6.098721981048584, "global_step": 79753, "epoch": 1898} {"train_loss": -6.016110420227051, "global_step": 79754, "epoch": 1898} {"train_loss": -6.160898685455322, "global_step": 79755, "epoch": 1898} {"train_loss": -6.129997253417969, "global_step": 79756, "epoch": 1898} {"train_loss": -6.112065179007394, "global_step": 79757, "epoch": 1898, "val_loss": 74828.84375} {"train_loss": -6.08450984954834, "global_step": 79758, "epoch": 1899} {"train_loss": -5.985992908477783, "global_step": 79759, "epoch": 1899} {"train_loss": -6.199462890625, "global_step": 79760, "epoch": 1899} {"train_loss": -6.124964237213135, "global_step": 79761, "epoch": 1899} {"train_loss": -6.002354621887207, "global_step": 79762, "epoch": 1899} {"train_loss": -6.127331256866455, "global_step": 79763, "epoch": 1899} {"train_loss": -6.198650360107422, "global_step": 79764, "epoch": 1899} {"train_loss": -6.116779804229736, "global_step": 79765, "epoch": 1899} {"train_loss": -6.046152114868164, "global_step": 79766, "epoch": 1899} {"train_loss": -6.097321510314941, "global_step": 79767, "epoch": 1899} {"train_loss": -6.227128982543945, "global_step": 79768, "epoch": 1899} {"train_loss": -5.942967891693115, "global_step": 79769, "epoch": 1899} {"train_loss": -6.016491413116455, "global_step": 79770, "epoch": 1899} {"train_loss": -6.142117500305176, "global_step": 79771, "epoch": 1899} {"train_loss": -6.1273345947265625, "global_step": 79772, "epoch": 1899} {"train_loss": -6.160730361938477, "global_step": 79773, "epoch": 1899} {"train_loss": -6.147557258605957, "global_step": 79774, "epoch": 1899} {"train_loss": -6.085693836212158, "global_step": 79775, "epoch": 1899} {"train_loss": -6.228795051574707, "global_step": 79776, "epoch": 1899} {"train_loss": -6.223905563354492, "global_step": 79777, "epoch": 1899} {"train_loss": -6.169565677642822, "global_step": 79778, "epoch": 1899} {"train_loss": -6.003987789154053, "global_step": 79779, "epoch": 1899} {"train_loss": -6.077868461608887, "global_step": 79780, "epoch": 1899} {"train_loss": -6.195309638977051, "global_step": 79781, "epoch": 1899} {"train_loss": -6.009626388549805, "global_step": 79782, "epoch": 1899} {"train_loss": -6.096689224243164, "global_step": 79783, "epoch": 1899} {"train_loss": -6.134676933288574, "global_step": 79784, "epoch": 1899} {"train_loss": -6.171544551849365, "global_step": 79785, "epoch": 1899} {"train_loss": -6.04701566696167, "global_step": 79786, "epoch": 1899} {"train_loss": -6.049376010894775, "global_step": 79787, "epoch": 1899} {"train_loss": -6.029204368591309, "global_step": 79788, "epoch": 1899} {"train_loss": -6.233753204345703, "global_step": 79789, "epoch": 1899} {"train_loss": -6.008557319641113, "global_step": 79790, "epoch": 1899} {"train_loss": -6.047219276428223, "global_step": 79791, "epoch": 1899} {"train_loss": -6.060460090637207, "global_step": 79792, "epoch": 1899} {"train_loss": -5.892267227172852, "global_step": 79793, "epoch": 1899} {"train_loss": -6.170544624328613, "global_step": 79794, "epoch": 1899} {"train_loss": -6.110681533813477, "global_step": 79795, "epoch": 1899} {"train_loss": -6.101383209228516, "global_step": 79796, "epoch": 1899} {"train_loss": -6.013095855712891, "global_step": 79797, "epoch": 1899} {"train_loss": -5.975698947906494, "global_step": 79798, "epoch": 1899} {"train_loss": -6.093651340121315, "global_step": 79799, "epoch": 1899, "val_loss": 75291.671875} {"train_loss": -6.006215572357178, "global_step": 79800, "epoch": 1900} {"train_loss": -6.1243696212768555, "global_step": 79801, "epoch": 1900} {"train_loss": -6.091057300567627, "global_step": 79802, "epoch": 1900} {"train_loss": -6.067873477935791, "global_step": 79803, "epoch": 1900} {"train_loss": -6.152308940887451, "global_step": 79804, "epoch": 1900} {"train_loss": -6.118707656860352, "global_step": 79805, "epoch": 1900} {"train_loss": -6.145860195159912, "global_step": 79806, "epoch": 1900} {"train_loss": -6.236185550689697, "global_step": 79807, "epoch": 1900} {"train_loss": -6.182281017303467, "global_step": 79808, "epoch": 1900} {"train_loss": -5.870274066925049, "global_step": 79809, "epoch": 1900} {"train_loss": -6.142728805541992, "global_step": 79810, "epoch": 1900} {"train_loss": -6.094013690948486, "global_step": 79811, "epoch": 1900} {"train_loss": -6.146496295928955, "global_step": 79812, "epoch": 1900} {"train_loss": -6.1152777671813965, "global_step": 79813, "epoch": 1900} {"train_loss": -6.03704309463501, "global_step": 79814, "epoch": 1900} {"train_loss": -6.076075553894043, "global_step": 79815, "epoch": 1900} {"train_loss": -6.096818923950195, "global_step": 79816, "epoch": 1900} {"train_loss": -6.173305988311768, "global_step": 79817, "epoch": 1900} {"train_loss": -6.1289896965026855, "global_step": 79818, "epoch": 1900} {"train_loss": -6.0591278076171875, "global_step": 79819, "epoch": 1900} {"train_loss": -6.125820159912109, "global_step": 79820, "epoch": 1900} {"train_loss": -6.021885871887207, "global_step": 79821, "epoch": 1900} {"train_loss": -6.113952159881592, "global_step": 79822, "epoch": 1900} {"train_loss": -5.907680988311768, "global_step": 79823, "epoch": 1900} {"train_loss": -5.946755886077881, "global_step": 79824, "epoch": 1900} {"train_loss": -6.1247663497924805, "global_step": 79825, "epoch": 1900} {"train_loss": -6.0381951332092285, "global_step": 79826, "epoch": 1900} {"train_loss": -6.047334671020508, "global_step": 79827, "epoch": 1900} {"train_loss": -6.082211494445801, "global_step": 79828, "epoch": 1900} {"train_loss": -6.285878658294678, "global_step": 79829, "epoch": 1900} {"train_loss": -6.066884517669678, "global_step": 79830, "epoch": 1900} {"train_loss": -6.114694595336914, "global_step": 79831, "epoch": 1900} {"train_loss": -6.035595893859863, "global_step": 79832, "epoch": 1900} {"train_loss": -6.046230792999268, "global_step": 79833, "epoch": 1900} {"train_loss": -6.037353992462158, "global_step": 79834, "epoch": 1900} {"train_loss": -6.240472793579102, "global_step": 79835, "epoch": 1900} {"train_loss": -6.022342681884766, "global_step": 79836, "epoch": 1900} {"train_loss": -6.047850608825684, "global_step": 79837, "epoch": 1900} {"train_loss": -6.027650833129883, "global_step": 79838, "epoch": 1900} {"train_loss": -6.132120132446289, "global_step": 79839, "epoch": 1900} {"train_loss": -6.085373878479004, "global_step": 79840, "epoch": 1900} {"train_loss": -6.088856810615177, "global_step": 79841, "epoch": 1900, "train/sim_max_reward_0": 0.7386763085821803, "train/sim_max_reward_1": 0.9008359822803058, "train/sim_max_reward_2": 0.5586807172308371, "train/sim_max_reward_3": 0.06888168639912233, "train/sim_max_reward_4": 0.5208663476067374, "train/sim_max_reward_5": 0.9034304296728203, "test/sim_max_reward_4500000": 0.701020827906196, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9930307049046797, "test/sim_max_reward_4500003": 0.8722001086803719, "test/sim_max_reward_4500004": 0.14397396419227426, "test/sim_max_reward_4500005": 0.9655100782734781, "test/sim_max_reward_4500006": 0.8228642657313552, "test/sim_max_reward_4500007": 0.3708673803044842, "test/sim_max_reward_4500008": 0.1684462801972122, "test/sim_max_reward_4500009": 0.9831655683619899, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.6006806313365007, "test/sim_max_reward_4500012": 0.4986558570517973, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.3754338845898334, "test/sim_max_reward_4500015": 0.4984371548123794, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.05644667640597634, "test/sim_max_reward_4500018": 0.3970216612052077, "test/sim_max_reward_4500019": 0.9259478026368271, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.7362720259249987, "test/sim_max_reward_4500023": 0.990933988596786, "test/sim_max_reward_4500024": 0.9601692965413623, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.8451562845160958, "test/sim_max_reward_4500027": 0.9944037191342366, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.1479323640917061, "test/sim_max_reward_4500030": 0.8531321404640893, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05976030547703129, "test/sim_max_reward_4500033": 0.9717319351937601, "test/sim_max_reward_4500034": 0.786861392776976, "test/sim_max_reward_4500035": 0.9405087862427013, "test/sim_max_reward_4500036": 0.3871372426674964, "test/sim_max_reward_4500037": 0.9958124678484173, "test/sim_max_reward_4500038": 0.30078029762105896, "test/sim_max_reward_4500039": 0.7372748638504222, "test/sim_max_reward_4500040": 0.8991953156179018, "test/sim_max_reward_4500041": 0.8428261301015677, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.8868779794066933, "test/sim_max_reward_4500044": 0.8447874448321436, "test/sim_max_reward_4500045": 0.5039249751724656, "test/sim_max_reward_4500046": 0.8058897683326256, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9240882197337236, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6152285786286672, "test/mean_score": 0.5403464211337233, "val_loss": 74861.78125} {"train_loss": -6.1602091789245605, "global_step": 79842, "epoch": 1901} {"train_loss": -6.127051830291748, "global_step": 79843, "epoch": 1901} {"train_loss": -6.238343238830566, "global_step": 79844, "epoch": 1901} {"train_loss": -6.205695629119873, "global_step": 79845, "epoch": 1901} {"train_loss": -6.049044609069824, "global_step": 79846, "epoch": 1901} {"train_loss": -6.010777473449707, "global_step": 79847, "epoch": 1901} {"train_loss": -6.086134910583496, "global_step": 79848, "epoch": 1901} {"train_loss": -6.008169651031494, "global_step": 79849, "epoch": 1901} {"train_loss": -6.110279560089111, "global_step": 79850, "epoch": 1901} {"train_loss": -6.156931400299072, "global_step": 79851, "epoch": 1901} {"train_loss": -6.091350555419922, "global_step": 79852, "epoch": 1901} {"train_loss": -6.07308292388916, "global_step": 79853, "epoch": 1901} {"train_loss": -6.049830913543701, "global_step": 79854, "epoch": 1901} {"train_loss": -6.121760368347168, "global_step": 79855, "epoch": 1901} {"train_loss": -6.023138999938965, "global_step": 79856, "epoch": 1901} {"train_loss": -6.154439926147461, "global_step": 79857, "epoch": 1901} {"train_loss": -6.132298946380615, "global_step": 79858, "epoch": 1901} {"train_loss": -6.061429977416992, "global_step": 79859, "epoch": 1901} {"train_loss": -6.061826229095459, "global_step": 79860, "epoch": 1901} {"train_loss": -6.099041938781738, "global_step": 79861, "epoch": 1901} {"train_loss": -6.180832386016846, "global_step": 79862, "epoch": 1901} {"train_loss": -6.154972076416016, "global_step": 79863, "epoch": 1901} {"train_loss": -6.039162635803223, "global_step": 79864, "epoch": 1901} {"train_loss": -6.062575817108154, "global_step": 79865, "epoch": 1901} {"train_loss": -6.086210250854492, "global_step": 79866, "epoch": 1901} {"train_loss": -6.021236896514893, "global_step": 79867, "epoch": 1901} {"train_loss": -6.0992913246154785, "global_step": 79868, "epoch": 1901} {"train_loss": -6.200551986694336, "global_step": 79869, "epoch": 1901} {"train_loss": -6.124597549438477, "global_step": 79870, "epoch": 1901} {"train_loss": -6.160120010375977, "global_step": 79871, "epoch": 1901} {"train_loss": -6.0244035720825195, "global_step": 79872, "epoch": 1901} {"train_loss": -5.969513893127441, "global_step": 79873, "epoch": 1901} {"train_loss": -5.985013008117676, "global_step": 79874, "epoch": 1901} {"train_loss": -6.131687164306641, "global_step": 79875, "epoch": 1901} {"train_loss": -6.249786376953125, "global_step": 79876, "epoch": 1901} {"train_loss": -6.082935333251953, "global_step": 79877, "epoch": 1901} {"train_loss": -6.222886085510254, "global_step": 79878, "epoch": 1901} {"train_loss": -6.035882949829102, "global_step": 79879, "epoch": 1901} {"train_loss": -6.08945894241333, "global_step": 79880, "epoch": 1901} {"train_loss": -6.0989203453063965, "global_step": 79881, "epoch": 1901} {"train_loss": -6.2065253257751465, "global_step": 79882, "epoch": 1901} {"train_loss": -6.105118762879145, "global_step": 79883, "epoch": 1901, "val_loss": 74913.28125} {"train_loss": -6.095355987548828, "global_step": 79884, "epoch": 1902} {"train_loss": -6.149724960327148, "global_step": 79885, "epoch": 1902} {"train_loss": -6.188480377197266, "global_step": 79886, "epoch": 1902} {"train_loss": -6.173379898071289, "global_step": 79887, "epoch": 1902} {"train_loss": -6.183553695678711, "global_step": 79888, "epoch": 1902} {"train_loss": -6.124565124511719, "global_step": 79889, "epoch": 1902} {"train_loss": -6.211297512054443, "global_step": 79890, "epoch": 1902} {"train_loss": -6.244682312011719, "global_step": 79891, "epoch": 1902} {"train_loss": -6.140323638916016, "global_step": 79892, "epoch": 1902} {"train_loss": -6.201075553894043, "global_step": 79893, "epoch": 1902} {"train_loss": -6.10611629486084, "global_step": 79894, "epoch": 1902} {"train_loss": -6.258786201477051, "global_step": 79895, "epoch": 1902} {"train_loss": -6.168227195739746, "global_step": 79896, "epoch": 1902} {"train_loss": -6.218420028686523, "global_step": 79897, "epoch": 1902} {"train_loss": -6.245230674743652, "global_step": 79898, "epoch": 1902} {"train_loss": -5.966423988342285, "global_step": 79899, "epoch": 1902} {"train_loss": -6.27935791015625, "global_step": 79900, "epoch": 1902} {"train_loss": -6.21270227432251, "global_step": 79901, "epoch": 1902} {"train_loss": -6.174659729003906, "global_step": 79902, "epoch": 1902} {"train_loss": -6.132359504699707, "global_step": 79903, "epoch": 1902} {"train_loss": -6.213012218475342, "global_step": 79904, "epoch": 1902} {"train_loss": -6.131680488586426, "global_step": 79905, "epoch": 1902} {"train_loss": -6.136589527130127, "global_step": 79906, "epoch": 1902} {"train_loss": -6.056990146636963, "global_step": 79907, "epoch": 1902} {"train_loss": -6.235109806060791, "global_step": 79908, "epoch": 1902} {"train_loss": -6.045820236206055, "global_step": 79909, "epoch": 1902} {"train_loss": -6.099842071533203, "global_step": 79910, "epoch": 1902} {"train_loss": -6.085131645202637, "global_step": 79911, "epoch": 1902} {"train_loss": -6.106385707855225, "global_step": 79912, "epoch": 1902} {"train_loss": -6.1862969398498535, "global_step": 79913, "epoch": 1902} {"train_loss": -6.086357116699219, "global_step": 79914, "epoch": 1902} {"train_loss": -6.264259338378906, "global_step": 79915, "epoch": 1902} {"train_loss": -6.11492919921875, "global_step": 79916, "epoch": 1902} {"train_loss": -6.072298526763916, "global_step": 79917, "epoch": 1902} {"train_loss": -6.065563201904297, "global_step": 79918, "epoch": 1902} {"train_loss": -6.124150276184082, "global_step": 79919, "epoch": 1902} {"train_loss": -6.053679466247559, "global_step": 79920, "epoch": 1902} {"train_loss": -6.044110298156738, "global_step": 79921, "epoch": 1902} {"train_loss": -6.097496032714844, "global_step": 79922, "epoch": 1902} {"train_loss": -6.096457481384277, "global_step": 79923, "epoch": 1902} {"train_loss": -6.021683692932129, "global_step": 79924, "epoch": 1902} {"train_loss": -6.140081223987398, "global_step": 79925, "epoch": 1902, "val_loss": 74959.109375} {"train_loss": -6.2565016746521, "global_step": 79926, "epoch": 1903} {"train_loss": -6.07840633392334, "global_step": 79927, "epoch": 1903} {"train_loss": -6.143909454345703, "global_step": 79928, "epoch": 1903} {"train_loss": -6.143545150756836, "global_step": 79929, "epoch": 1903} {"train_loss": -6.223529815673828, "global_step": 79930, "epoch": 1903} {"train_loss": -6.03972053527832, "global_step": 79931, "epoch": 1903} {"train_loss": -6.035383224487305, "global_step": 79932, "epoch": 1903} {"train_loss": -6.033750534057617, "global_step": 79933, "epoch": 1903} {"train_loss": -6.230063438415527, "global_step": 79934, "epoch": 1903} {"train_loss": -6.049378395080566, "global_step": 79935, "epoch": 1903} {"train_loss": -6.079751968383789, "global_step": 79936, "epoch": 1903} {"train_loss": -6.105742454528809, "global_step": 79937, "epoch": 1903} {"train_loss": -6.09149169921875, "global_step": 79938, "epoch": 1903} {"train_loss": -6.040545463562012, "global_step": 79939, "epoch": 1903} {"train_loss": -6.162164211273193, "global_step": 79940, "epoch": 1903} {"train_loss": -6.052739143371582, "global_step": 79941, "epoch": 1903} {"train_loss": -6.132570266723633, "global_step": 79942, "epoch": 1903} {"train_loss": -6.189507484436035, "global_step": 79943, "epoch": 1903} {"train_loss": -6.152036666870117, "global_step": 79944, "epoch": 1903} {"train_loss": -6.23206090927124, "global_step": 79945, "epoch": 1903} {"train_loss": -6.065707206726074, "global_step": 79946, "epoch": 1903} {"train_loss": -6.149441242218018, "global_step": 79947, "epoch": 1903} {"train_loss": -6.115460395812988, "global_step": 79948, "epoch": 1903} {"train_loss": -6.197085857391357, "global_step": 79949, "epoch": 1903} {"train_loss": -6.126082897186279, "global_step": 79950, "epoch": 1903} {"train_loss": -6.022458076477051, "global_step": 79951, "epoch": 1903} {"train_loss": -6.201938629150391, "global_step": 79952, "epoch": 1903} {"train_loss": -6.160051345825195, "global_step": 79953, "epoch": 1903} {"train_loss": -6.014754295349121, "global_step": 79954, "epoch": 1903} {"train_loss": -6.139847755432129, "global_step": 79955, "epoch": 1903} {"train_loss": -6.1092329025268555, "global_step": 79956, "epoch": 1903} {"train_loss": -6.143102645874023, "global_step": 79957, "epoch": 1903} {"train_loss": -5.99207878112793, "global_step": 79958, "epoch": 1903} {"train_loss": -6.08225154876709, "global_step": 79959, "epoch": 1903} {"train_loss": -6.111310005187988, "global_step": 79960, "epoch": 1903} {"train_loss": -6.059741020202637, "global_step": 79961, "epoch": 1903} {"train_loss": -6.0145721435546875, "global_step": 79962, "epoch": 1903} {"train_loss": -6.197971343994141, "global_step": 79963, "epoch": 1903} {"train_loss": -6.06174373626709, "global_step": 79964, "epoch": 1903} {"train_loss": -6.114900588989258, "global_step": 79965, "epoch": 1903} {"train_loss": -6.18502140045166, "global_step": 79966, "epoch": 1903} {"train_loss": -6.1154417878105525, "global_step": 79967, "epoch": 1903, "val_loss": 74845.484375} {"train_loss": -6.148001194000244, "global_step": 79968, "epoch": 1904} {"train_loss": -6.223085403442383, "global_step": 79969, "epoch": 1904} {"train_loss": -6.072229385375977, "global_step": 79970, "epoch": 1904} {"train_loss": -6.108896732330322, "global_step": 79971, "epoch": 1904} {"train_loss": -6.306787490844727, "global_step": 79972, "epoch": 1904} {"train_loss": -6.142671585083008, "global_step": 79973, "epoch": 1904} {"train_loss": -6.2652387619018555, "global_step": 79974, "epoch": 1904} {"train_loss": -6.129955768585205, "global_step": 79975, "epoch": 1904} {"train_loss": -6.161328315734863, "global_step": 79976, "epoch": 1904} {"train_loss": -6.2043046951293945, "global_step": 79977, "epoch": 1904} {"train_loss": -6.088474273681641, "global_step": 79978, "epoch": 1904} {"train_loss": -6.164624214172363, "global_step": 79979, "epoch": 1904} {"train_loss": -6.214544773101807, "global_step": 79980, "epoch": 1904} {"train_loss": -6.112756729125977, "global_step": 79981, "epoch": 1904} {"train_loss": -6.161497116088867, "global_step": 79982, "epoch": 1904} {"train_loss": -6.137821197509766, "global_step": 79983, "epoch": 1904} {"train_loss": -6.136207580566406, "global_step": 79984, "epoch": 1904} {"train_loss": -6.073578357696533, "global_step": 79985, "epoch": 1904} {"train_loss": -6.135459899902344, "global_step": 79986, "epoch": 1904} {"train_loss": -6.1504411697387695, "global_step": 79987, "epoch": 1904} {"train_loss": -6.166259765625, "global_step": 79988, "epoch": 1904} {"train_loss": -6.136181831359863, "global_step": 79989, "epoch": 1904} {"train_loss": -6.103504180908203, "global_step": 79990, "epoch": 1904} {"train_loss": -6.215507507324219, "global_step": 79991, "epoch": 1904} {"train_loss": -6.079977989196777, "global_step": 79992, "epoch": 1904} {"train_loss": -6.1403398513793945, "global_step": 79993, "epoch": 1904} {"train_loss": -6.047090530395508, "global_step": 79994, "epoch": 1904} {"train_loss": -6.128910064697266, "global_step": 79995, "epoch": 1904} {"train_loss": -6.082111835479736, "global_step": 79996, "epoch": 1904} {"train_loss": -6.224574089050293, "global_step": 79997, "epoch": 1904} {"train_loss": -6.106454372406006, "global_step": 79998, "epoch": 1904} {"train_loss": -6.070411682128906, "global_step": 79999, "epoch": 1904} {"train_loss": -6.10793399810791, "global_step": 80000, "epoch": 1904} {"train_loss": -6.140833377838135, "global_step": 80001, "epoch": 1904} {"train_loss": -6.183132171630859, "global_step": 80002, "epoch": 1904} {"train_loss": -6.171174049377441, "global_step": 80003, "epoch": 1904} {"train_loss": -6.109768867492676, "global_step": 80004, "epoch": 1904} {"train_loss": -6.181258201599121, "global_step": 80005, "epoch": 1904} {"train_loss": -6.315393447875977, "global_step": 80006, "epoch": 1904} {"train_loss": -6.113697528839111, "global_step": 80007, "epoch": 1904} {"train_loss": -6.191694736480713, "global_step": 80008, "epoch": 1904} {"train_loss": -6.150886910302298, "global_step": 80009, "epoch": 1904, "val_loss": 75426.6953125} {"train_loss": -6.297290802001953, "global_step": 80010, "epoch": 1905} {"train_loss": -6.184094429016113, "global_step": 80011, "epoch": 1905} {"train_loss": -6.141884803771973, "global_step": 80012, "epoch": 1905} {"train_loss": -6.110328674316406, "global_step": 80013, "epoch": 1905} {"train_loss": -6.183969020843506, "global_step": 80014, "epoch": 1905} {"train_loss": -6.1103105545043945, "global_step": 80015, "epoch": 1905} {"train_loss": -6.1413798332214355, "global_step": 80016, "epoch": 1905} {"train_loss": -6.164039611816406, "global_step": 80017, "epoch": 1905} {"train_loss": -6.18131160736084, "global_step": 80018, "epoch": 1905} {"train_loss": -6.146644592285156, "global_step": 80019, "epoch": 1905} {"train_loss": -6.211078643798828, "global_step": 80020, "epoch": 1905} {"train_loss": -6.07322883605957, "global_step": 80021, "epoch": 1905} {"train_loss": -6.242430686950684, "global_step": 80022, "epoch": 1905} {"train_loss": -6.1901350021362305, "global_step": 80023, "epoch": 1905} {"train_loss": -6.127441883087158, "global_step": 80024, "epoch": 1905} {"train_loss": -6.134486198425293, "global_step": 80025, "epoch": 1905} {"train_loss": -6.165782928466797, "global_step": 80026, "epoch": 1905} {"train_loss": -6.162508010864258, "global_step": 80027, "epoch": 1905} {"train_loss": -6.175099849700928, "global_step": 80028, "epoch": 1905} {"train_loss": -6.1787919998168945, "global_step": 80029, "epoch": 1905} {"train_loss": -6.01111364364624, "global_step": 80030, "epoch": 1905} {"train_loss": -6.122320175170898, "global_step": 80031, "epoch": 1905} {"train_loss": -5.934244155883789, "global_step": 80032, "epoch": 1905} {"train_loss": -5.915308952331543, "global_step": 80033, "epoch": 1905} {"train_loss": -6.2726826667785645, "global_step": 80034, "epoch": 1905} {"train_loss": -5.98974084854126, "global_step": 80035, "epoch": 1905} {"train_loss": -6.163549900054932, "global_step": 80036, "epoch": 1905} {"train_loss": -6.0910797119140625, "global_step": 80037, "epoch": 1905} {"train_loss": -6.000884532928467, "global_step": 80038, "epoch": 1905} {"train_loss": -6.072589874267578, "global_step": 80039, "epoch": 1905} {"train_loss": -6.1422810554504395, "global_step": 80040, "epoch": 1905} {"train_loss": -6.100491523742676, "global_step": 80041, "epoch": 1905} {"train_loss": -6.159491062164307, "global_step": 80042, "epoch": 1905} {"train_loss": -6.109261512756348, "global_step": 80043, "epoch": 1905} {"train_loss": -6.23695707321167, "global_step": 80044, "epoch": 1905} {"train_loss": -6.15958309173584, "global_step": 80045, "epoch": 1905} {"train_loss": -6.111016273498535, "global_step": 80046, "epoch": 1905} {"train_loss": -6.272526741027832, "global_step": 80047, "epoch": 1905} {"train_loss": -6.065235137939453, "global_step": 80048, "epoch": 1905} {"train_loss": -6.121706962585449, "global_step": 80049, "epoch": 1905} {"train_loss": -6.116589546203613, "global_step": 80050, "epoch": 1905} {"train_loss": -6.130613099961054, "global_step": 80051, "epoch": 1905, "val_loss": 74970.5} {"train_loss": -6.301595687866211, "global_step": 80052, "epoch": 1906} {"train_loss": -5.908735275268555, "global_step": 80053, "epoch": 1906} {"train_loss": -6.066248416900635, "global_step": 80054, "epoch": 1906} {"train_loss": -6.128523349761963, "global_step": 80055, "epoch": 1906} {"train_loss": -6.123477458953857, "global_step": 80056, "epoch": 1906} {"train_loss": -6.1299567222595215, "global_step": 80057, "epoch": 1906} {"train_loss": -6.2559614181518555, "global_step": 80058, "epoch": 1906} {"train_loss": -6.10568904876709, "global_step": 80059, "epoch": 1906} {"train_loss": -6.182183265686035, "global_step": 80060, "epoch": 1906} {"train_loss": -6.106191635131836, "global_step": 80061, "epoch": 1906} {"train_loss": -6.130108833312988, "global_step": 80062, "epoch": 1906} {"train_loss": -6.15332555770874, "global_step": 80063, "epoch": 1906} {"train_loss": -6.0597991943359375, "global_step": 80064, "epoch": 1906} {"train_loss": -6.182380199432373, "global_step": 80065, "epoch": 1906} {"train_loss": -6.114151954650879, "global_step": 80066, "epoch": 1906} {"train_loss": -6.165633201599121, "global_step": 80067, "epoch": 1906} {"train_loss": -6.241371154785156, "global_step": 80068, "epoch": 1906} {"train_loss": -6.131458759307861, "global_step": 80069, "epoch": 1906} {"train_loss": -6.134113311767578, "global_step": 80070, "epoch": 1906} {"train_loss": -6.249885082244873, "global_step": 80071, "epoch": 1906} {"train_loss": -6.215524673461914, "global_step": 80072, "epoch": 1906} {"train_loss": -6.169255256652832, "global_step": 80073, "epoch": 1906} {"train_loss": -6.192342758178711, "global_step": 80074, "epoch": 1906} {"train_loss": -6.2205119132995605, "global_step": 80075, "epoch": 1906} {"train_loss": -6.2307353019714355, "global_step": 80076, "epoch": 1906} {"train_loss": -6.161999702453613, "global_step": 80077, "epoch": 1906} {"train_loss": -6.224935054779053, "global_step": 80078, "epoch": 1906} {"train_loss": -6.139654159545898, "global_step": 80079, "epoch": 1906} {"train_loss": -6.080760478973389, "global_step": 80080, "epoch": 1906} {"train_loss": -6.126178741455078, "global_step": 80081, "epoch": 1906} {"train_loss": -6.147839546203613, "global_step": 80082, "epoch": 1906} {"train_loss": -6.115009307861328, "global_step": 80083, "epoch": 1906} {"train_loss": -6.253844738006592, "global_step": 80084, "epoch": 1906} {"train_loss": -6.022812843322754, "global_step": 80085, "epoch": 1906} {"train_loss": -6.134751319885254, "global_step": 80086, "epoch": 1906} {"train_loss": -6.19823694229126, "global_step": 80087, "epoch": 1906} {"train_loss": -6.098052978515625, "global_step": 80088, "epoch": 1906} {"train_loss": -6.173476219177246, "global_step": 80089, "epoch": 1906} {"train_loss": -6.185095310211182, "global_step": 80090, "epoch": 1906} {"train_loss": -6.149340629577637, "global_step": 80091, "epoch": 1906} {"train_loss": -6.02860689163208, "global_step": 80092, "epoch": 1906} {"train_loss": -6.148920059204102, "global_step": 80093, "epoch": 1906, "val_loss": 75141.7890625} {"train_loss": -6.118670463562012, "global_step": 80094, "epoch": 1907} {"train_loss": -6.209355354309082, "global_step": 80095, "epoch": 1907} {"train_loss": -6.077422142028809, "global_step": 80096, "epoch": 1907} {"train_loss": -6.062511444091797, "global_step": 80097, "epoch": 1907} {"train_loss": -6.187981605529785, "global_step": 80098, "epoch": 1907} {"train_loss": -6.058650970458984, "global_step": 80099, "epoch": 1907} {"train_loss": -6.0527729988098145, "global_step": 80100, "epoch": 1907} {"train_loss": -6.147310256958008, "global_step": 80101, "epoch": 1907} {"train_loss": -6.18367862701416, "global_step": 80102, "epoch": 1907} {"train_loss": -6.1511640548706055, "global_step": 80103, "epoch": 1907} {"train_loss": -6.183650016784668, "global_step": 80104, "epoch": 1907} {"train_loss": -6.0535502433776855, "global_step": 80105, "epoch": 1907} {"train_loss": -6.202600479125977, "global_step": 80106, "epoch": 1907} {"train_loss": -6.232291221618652, "global_step": 80107, "epoch": 1907} {"train_loss": -6.160271644592285, "global_step": 80108, "epoch": 1907} {"train_loss": -6.185146808624268, "global_step": 80109, "epoch": 1907} {"train_loss": -6.162970542907715, "global_step": 80110, "epoch": 1907} {"train_loss": -6.111655235290527, "global_step": 80111, "epoch": 1907} {"train_loss": -6.18532657623291, "global_step": 80112, "epoch": 1907} {"train_loss": -6.1916608810424805, "global_step": 80113, "epoch": 1907} {"train_loss": -6.121627330780029, "global_step": 80114, "epoch": 1907} {"train_loss": -6.2576189041137695, "global_step": 80115, "epoch": 1907} {"train_loss": -6.133327484130859, "global_step": 80116, "epoch": 1907} {"train_loss": -6.107609272003174, "global_step": 80117, "epoch": 1907} {"train_loss": -6.018863677978516, "global_step": 80118, "epoch": 1907} {"train_loss": -6.0165510177612305, "global_step": 80119, "epoch": 1907} {"train_loss": -6.111218452453613, "global_step": 80120, "epoch": 1907} {"train_loss": -6.185976982116699, "global_step": 80121, "epoch": 1907} {"train_loss": -6.195463180541992, "global_step": 80122, "epoch": 1907} {"train_loss": -6.167068958282471, "global_step": 80123, "epoch": 1907} {"train_loss": -6.0701494216918945, "global_step": 80124, "epoch": 1907} {"train_loss": -6.009278297424316, "global_step": 80125, "epoch": 1907} {"train_loss": -6.099112510681152, "global_step": 80126, "epoch": 1907} {"train_loss": -6.047018051147461, "global_step": 80127, "epoch": 1907} {"train_loss": -6.052038669586182, "global_step": 80128, "epoch": 1907} {"train_loss": -6.033331871032715, "global_step": 80129, "epoch": 1907} {"train_loss": -6.132079601287842, "global_step": 80130, "epoch": 1907} {"train_loss": -6.0704121589660645, "global_step": 80131, "epoch": 1907} {"train_loss": -5.983867168426514, "global_step": 80132, "epoch": 1907} {"train_loss": -6.120527267456055, "global_step": 80133, "epoch": 1907} {"train_loss": -6.135560989379883, "global_step": 80134, "epoch": 1907} {"train_loss": -6.123127483186268, "global_step": 80135, "epoch": 1907, "val_loss": 75259.96875} {"train_loss": -6.141579627990723, "global_step": 80136, "epoch": 1908} {"train_loss": -6.1240057945251465, "global_step": 80137, "epoch": 1908} {"train_loss": -6.109778881072998, "global_step": 80138, "epoch": 1908} {"train_loss": -6.154605865478516, "global_step": 80139, "epoch": 1908} {"train_loss": -6.061825752258301, "global_step": 80140, "epoch": 1908} {"train_loss": -6.157238960266113, "global_step": 80141, "epoch": 1908} {"train_loss": -6.120564937591553, "global_step": 80142, "epoch": 1908} {"train_loss": -6.081899642944336, "global_step": 80143, "epoch": 1908} {"train_loss": -6.000012397766113, "global_step": 80144, "epoch": 1908} {"train_loss": -6.0943498611450195, "global_step": 80145, "epoch": 1908} {"train_loss": -6.238954544067383, "global_step": 80146, "epoch": 1908} {"train_loss": -6.129655838012695, "global_step": 80147, "epoch": 1908} {"train_loss": -6.102632999420166, "global_step": 80148, "epoch": 1908} {"train_loss": -5.972615718841553, "global_step": 80149, "epoch": 1908} {"train_loss": -6.2056403160095215, "global_step": 80150, "epoch": 1908} {"train_loss": -6.049642086029053, "global_step": 80151, "epoch": 1908} {"train_loss": -6.146424293518066, "global_step": 80152, "epoch": 1908} {"train_loss": -6.143038749694824, "global_step": 80153, "epoch": 1908} {"train_loss": -6.373246669769287, "global_step": 80154, "epoch": 1908} {"train_loss": -6.066381454467773, "global_step": 80155, "epoch": 1908} {"train_loss": -6.017322540283203, "global_step": 80156, "epoch": 1908} {"train_loss": -6.1898698806762695, "global_step": 80157, "epoch": 1908} {"train_loss": -6.138086318969727, "global_step": 80158, "epoch": 1908} {"train_loss": -6.216439723968506, "global_step": 80159, "epoch": 1908} {"train_loss": -5.995170593261719, "global_step": 80160, "epoch": 1908} {"train_loss": -6.174175262451172, "global_step": 80161, "epoch": 1908} {"train_loss": -6.238832950592041, "global_step": 80162, "epoch": 1908} {"train_loss": -6.027612209320068, "global_step": 80163, "epoch": 1908} {"train_loss": -6.204460144042969, "global_step": 80164, "epoch": 1908} {"train_loss": -6.057342052459717, "global_step": 80165, "epoch": 1908} {"train_loss": -6.152338981628418, "global_step": 80166, "epoch": 1908} {"train_loss": -6.262829780578613, "global_step": 80167, "epoch": 1908} {"train_loss": -6.2323455810546875, "global_step": 80168, "epoch": 1908} {"train_loss": -6.158252239227295, "global_step": 80169, "epoch": 1908} {"train_loss": -6.142219066619873, "global_step": 80170, "epoch": 1908} {"train_loss": -6.125292778015137, "global_step": 80171, "epoch": 1908} {"train_loss": -6.275076866149902, "global_step": 80172, "epoch": 1908} {"train_loss": -6.115696907043457, "global_step": 80173, "epoch": 1908} {"train_loss": -6.192451477050781, "global_step": 80174, "epoch": 1908} {"train_loss": -6.246854782104492, "global_step": 80175, "epoch": 1908} {"train_loss": -6.107417583465576, "global_step": 80176, "epoch": 1908} {"train_loss": -6.140654552550543, "global_step": 80177, "epoch": 1908, "val_loss": 75051.7734375} {"train_loss": -6.272133827209473, "global_step": 80178, "epoch": 1909} {"train_loss": -6.189343452453613, "global_step": 80179, "epoch": 1909} {"train_loss": -6.221680641174316, "global_step": 80180, "epoch": 1909} {"train_loss": -6.158702850341797, "global_step": 80181, "epoch": 1909} {"train_loss": -6.228814601898193, "global_step": 80182, "epoch": 1909} {"train_loss": -6.169841289520264, "global_step": 80183, "epoch": 1909} {"train_loss": -6.124228000640869, "global_step": 80184, "epoch": 1909} {"train_loss": -6.076462745666504, "global_step": 80185, "epoch": 1909} {"train_loss": -6.032566070556641, "global_step": 80186, "epoch": 1909} {"train_loss": -6.20536994934082, "global_step": 80187, "epoch": 1909} {"train_loss": -6.137060165405273, "global_step": 80188, "epoch": 1909} {"train_loss": -6.067517280578613, "global_step": 80189, "epoch": 1909} {"train_loss": -6.015636444091797, "global_step": 80190, "epoch": 1909} {"train_loss": -6.157750129699707, "global_step": 80191, "epoch": 1909} {"train_loss": -6.153243541717529, "global_step": 80192, "epoch": 1909} {"train_loss": -6.168444633483887, "global_step": 80193, "epoch": 1909} {"train_loss": -6.120543003082275, "global_step": 80194, "epoch": 1909} {"train_loss": -6.139341354370117, "global_step": 80195, "epoch": 1909} {"train_loss": -6.031380653381348, "global_step": 80196, "epoch": 1909} {"train_loss": -6.292244911193848, "global_step": 80197, "epoch": 1909} {"train_loss": -6.066640853881836, "global_step": 80198, "epoch": 1909} {"train_loss": -6.2495927810668945, "global_step": 80199, "epoch": 1909} {"train_loss": -6.139218330383301, "global_step": 80200, "epoch": 1909} {"train_loss": -6.084753036499023, "global_step": 80201, "epoch": 1909} {"train_loss": -6.196641445159912, "global_step": 80202, "epoch": 1909} {"train_loss": -6.099762916564941, "global_step": 80203, "epoch": 1909} {"train_loss": -6.097789764404297, "global_step": 80204, "epoch": 1909} {"train_loss": -6.0743794441223145, "global_step": 80205, "epoch": 1909} {"train_loss": -6.190332412719727, "global_step": 80206, "epoch": 1909} {"train_loss": -6.1945881843566895, "global_step": 80207, "epoch": 1909} {"train_loss": -6.062598705291748, "global_step": 80208, "epoch": 1909} {"train_loss": -6.064939498901367, "global_step": 80209, "epoch": 1909} {"train_loss": -6.162310600280762, "global_step": 80210, "epoch": 1909} {"train_loss": -6.160931587219238, "global_step": 80211, "epoch": 1909} {"train_loss": -5.999385356903076, "global_step": 80212, "epoch": 1909} {"train_loss": -6.230677127838135, "global_step": 80213, "epoch": 1909} {"train_loss": -6.0279083251953125, "global_step": 80214, "epoch": 1909} {"train_loss": -6.051137924194336, "global_step": 80215, "epoch": 1909} {"train_loss": -6.00908088684082, "global_step": 80216, "epoch": 1909} {"train_loss": -6.132937908172607, "global_step": 80217, "epoch": 1909} {"train_loss": -6.1932759284973145, "global_step": 80218, "epoch": 1909} {"train_loss": -6.129914056687128, "global_step": 80219, "epoch": 1909, "val_loss": 75256.265625} {"train_loss": -6.101444721221924, "global_step": 80220, "epoch": 1910} {"train_loss": -6.146795272827148, "global_step": 80221, "epoch": 1910} {"train_loss": -6.016061782836914, "global_step": 80222, "epoch": 1910} {"train_loss": -6.15023136138916, "global_step": 80223, "epoch": 1910} {"train_loss": -5.963723182678223, "global_step": 80224, "epoch": 1910} {"train_loss": -6.141707420349121, "global_step": 80225, "epoch": 1910} {"train_loss": -6.188272476196289, "global_step": 80226, "epoch": 1910} {"train_loss": -6.133805274963379, "global_step": 80227, "epoch": 1910} {"train_loss": -5.997277736663818, "global_step": 80228, "epoch": 1910} {"train_loss": -6.146671772003174, "global_step": 80229, "epoch": 1910} {"train_loss": -6.103470802307129, "global_step": 80230, "epoch": 1910} {"train_loss": -6.147857666015625, "global_step": 80231, "epoch": 1910} {"train_loss": -6.023678302764893, "global_step": 80232, "epoch": 1910} {"train_loss": -6.124909400939941, "global_step": 80233, "epoch": 1910} {"train_loss": -6.0570573806762695, "global_step": 80234, "epoch": 1910} {"train_loss": -6.04191780090332, "global_step": 80235, "epoch": 1910} {"train_loss": -6.077726364135742, "global_step": 80236, "epoch": 1910} {"train_loss": -6.06117582321167, "global_step": 80237, "epoch": 1910} {"train_loss": -6.095149993896484, "global_step": 80238, "epoch": 1910} {"train_loss": -6.0625715255737305, "global_step": 80239, "epoch": 1910} {"train_loss": -5.9879255294799805, "global_step": 80240, "epoch": 1910} {"train_loss": -6.1044769287109375, "global_step": 80241, "epoch": 1910} {"train_loss": -6.144230842590332, "global_step": 80242, "epoch": 1910} {"train_loss": -6.216166973114014, "global_step": 80243, "epoch": 1910} {"train_loss": -5.995811462402344, "global_step": 80244, "epoch": 1910} {"train_loss": -6.098576068878174, "global_step": 80245, "epoch": 1910} {"train_loss": -6.144477844238281, "global_step": 80246, "epoch": 1910} {"train_loss": -6.052080154418945, "global_step": 80247, "epoch": 1910} {"train_loss": -6.204276084899902, "global_step": 80248, "epoch": 1910} {"train_loss": -6.096396446228027, "global_step": 80249, "epoch": 1910} {"train_loss": -6.119897842407227, "global_step": 80250, "epoch": 1910} {"train_loss": -6.2093963623046875, "global_step": 80251, "epoch": 1910} {"train_loss": -6.08547306060791, "global_step": 80252, "epoch": 1910} {"train_loss": -6.119643211364746, "global_step": 80253, "epoch": 1910} {"train_loss": -6.235678672790527, "global_step": 80254, "epoch": 1910} {"train_loss": -6.1446075439453125, "global_step": 80255, "epoch": 1910} {"train_loss": -6.112354278564453, "global_step": 80256, "epoch": 1910} {"train_loss": -6.16340446472168, "global_step": 80257, "epoch": 1910} {"train_loss": -6.099386215209961, "global_step": 80258, "epoch": 1910} {"train_loss": -6.028268814086914, "global_step": 80259, "epoch": 1910} {"train_loss": -6.192889213562012, "global_step": 80260, "epoch": 1910} {"train_loss": -6.105694645927066, "global_step": 80261, "epoch": 1910, "val_loss": 75092.2734375} {"train_loss": -6.0589118003845215, "global_step": 80262, "epoch": 1911} {"train_loss": -6.045666694641113, "global_step": 80263, "epoch": 1911} {"train_loss": -6.116160869598389, "global_step": 80264, "epoch": 1911} {"train_loss": -6.137282371520996, "global_step": 80265, "epoch": 1911} {"train_loss": -6.121816635131836, "global_step": 80266, "epoch": 1911} {"train_loss": -6.006967067718506, "global_step": 80267, "epoch": 1911} {"train_loss": -6.210875511169434, "global_step": 80268, "epoch": 1911} {"train_loss": -6.177638053894043, "global_step": 80269, "epoch": 1911} {"train_loss": -6.153261661529541, "global_step": 80270, "epoch": 1911} {"train_loss": -6.20637321472168, "global_step": 80271, "epoch": 1911} {"train_loss": -6.136457443237305, "global_step": 80272, "epoch": 1911} {"train_loss": -6.218499183654785, "global_step": 80273, "epoch": 1911} {"train_loss": -6.25535774230957, "global_step": 80274, "epoch": 1911} {"train_loss": -6.144982814788818, "global_step": 80275, "epoch": 1911} {"train_loss": -6.083256721496582, "global_step": 80276, "epoch": 1911} {"train_loss": -6.139529228210449, "global_step": 80277, "epoch": 1911} {"train_loss": -6.167309284210205, "global_step": 80278, "epoch": 1911} {"train_loss": -6.1127519607543945, "global_step": 80279, "epoch": 1911} {"train_loss": -6.191125869750977, "global_step": 80280, "epoch": 1911} {"train_loss": -6.145042419433594, "global_step": 80281, "epoch": 1911} {"train_loss": -6.220393180847168, "global_step": 80282, "epoch": 1911} {"train_loss": -6.130423069000244, "global_step": 80283, "epoch": 1911} {"train_loss": -6.167594909667969, "global_step": 80284, "epoch": 1911} {"train_loss": -6.245194435119629, "global_step": 80285, "epoch": 1911} {"train_loss": -6.218118667602539, "global_step": 80286, "epoch": 1911} {"train_loss": -6.066974639892578, "global_step": 80287, "epoch": 1911} {"train_loss": -6.128330230712891, "global_step": 80288, "epoch": 1911} {"train_loss": -6.186539173126221, "global_step": 80289, "epoch": 1911} {"train_loss": -6.1715593338012695, "global_step": 80290, "epoch": 1911} {"train_loss": -6.187618255615234, "global_step": 80291, "epoch": 1911} {"train_loss": -6.166934490203857, "global_step": 80292, "epoch": 1911} {"train_loss": -6.158967018127441, "global_step": 80293, "epoch": 1911} {"train_loss": -6.141067981719971, "global_step": 80294, "epoch": 1911} {"train_loss": -6.078876495361328, "global_step": 80295, "epoch": 1911} {"train_loss": -6.26458740234375, "global_step": 80296, "epoch": 1911} {"train_loss": -6.07053804397583, "global_step": 80297, "epoch": 1911} {"train_loss": -6.0169267654418945, "global_step": 80298, "epoch": 1911} {"train_loss": -6.128023147583008, "global_step": 80299, "epoch": 1911} {"train_loss": -6.166803359985352, "global_step": 80300, "epoch": 1911} {"train_loss": -6.107084274291992, "global_step": 80301, "epoch": 1911} {"train_loss": -6.09096622467041, "global_step": 80302, "epoch": 1911} {"train_loss": -6.143127770650954, "global_step": 80303, "epoch": 1911, "val_loss": 75169.0} {"train_loss": -6.018685817718506, "global_step": 80304, "epoch": 1912} {"train_loss": -6.108872413635254, "global_step": 80305, "epoch": 1912} {"train_loss": -6.102782726287842, "global_step": 80306, "epoch": 1912} {"train_loss": -6.178443908691406, "global_step": 80307, "epoch": 1912} {"train_loss": -6.101455211639404, "global_step": 80308, "epoch": 1912} {"train_loss": -6.190167427062988, "global_step": 80309, "epoch": 1912} {"train_loss": -6.09112024307251, "global_step": 80310, "epoch": 1912} {"train_loss": -6.151865005493164, "global_step": 80311, "epoch": 1912} {"train_loss": -6.098316192626953, "global_step": 80312, "epoch": 1912} {"train_loss": -6.0912933349609375, "global_step": 80313, "epoch": 1912} {"train_loss": -6.131098747253418, "global_step": 80314, "epoch": 1912} {"train_loss": -6.097965240478516, "global_step": 80315, "epoch": 1912} {"train_loss": -6.09042501449585, "global_step": 80316, "epoch": 1912} {"train_loss": -6.18129825592041, "global_step": 80317, "epoch": 1912} {"train_loss": -6.044090747833252, "global_step": 80318, "epoch": 1912} {"train_loss": -6.123360633850098, "global_step": 80319, "epoch": 1912} {"train_loss": -6.122437477111816, "global_step": 80320, "epoch": 1912} {"train_loss": -6.1060614585876465, "global_step": 80321, "epoch": 1912} {"train_loss": -6.149003028869629, "global_step": 80322, "epoch": 1912} {"train_loss": -6.091753959655762, "global_step": 80323, "epoch": 1912} {"train_loss": -6.1300153732299805, "global_step": 80324, "epoch": 1912} {"train_loss": -6.104195594787598, "global_step": 80325, "epoch": 1912} {"train_loss": -6.1633477210998535, "global_step": 80326, "epoch": 1912} {"train_loss": -6.058003902435303, "global_step": 80327, "epoch": 1912} {"train_loss": -6.031253814697266, "global_step": 80328, "epoch": 1912} {"train_loss": -6.002089500427246, "global_step": 80329, "epoch": 1912} {"train_loss": -6.13309383392334, "global_step": 80330, "epoch": 1912} {"train_loss": -6.065810203552246, "global_step": 80331, "epoch": 1912} {"train_loss": -5.971477508544922, "global_step": 80332, "epoch": 1912} {"train_loss": -6.167091369628906, "global_step": 80333, "epoch": 1912} {"train_loss": -6.044621467590332, "global_step": 80334, "epoch": 1912} {"train_loss": -6.1582841873168945, "global_step": 80335, "epoch": 1912} {"train_loss": -6.109962463378906, "global_step": 80336, "epoch": 1912} {"train_loss": -6.005586624145508, "global_step": 80337, "epoch": 1912} {"train_loss": -6.1690673828125, "global_step": 80338, "epoch": 1912} {"train_loss": -6.095418930053711, "global_step": 80339, "epoch": 1912} {"train_loss": -6.2388505935668945, "global_step": 80340, "epoch": 1912} {"train_loss": -6.133785247802734, "global_step": 80341, "epoch": 1912} {"train_loss": -6.170515060424805, "global_step": 80342, "epoch": 1912} {"train_loss": -6.107377052307129, "global_step": 80343, "epoch": 1912} {"train_loss": -6.243904113769531, "global_step": 80344, "epoch": 1912} {"train_loss": -6.109686238425119, "global_step": 80345, "epoch": 1912, "val_loss": 74870.53125} {"train_loss": -6.158180236816406, "global_step": 80346, "epoch": 1913} {"train_loss": -6.203642845153809, "global_step": 80347, "epoch": 1913} {"train_loss": -6.065624713897705, "global_step": 80348, "epoch": 1913} {"train_loss": -6.168056488037109, "global_step": 80349, "epoch": 1913} {"train_loss": -6.236342430114746, "global_step": 80350, "epoch": 1913} {"train_loss": -6.123123645782471, "global_step": 80351, "epoch": 1913} {"train_loss": -6.131719589233398, "global_step": 80352, "epoch": 1913} {"train_loss": -6.07198429107666, "global_step": 80353, "epoch": 1913} {"train_loss": -6.155900478363037, "global_step": 80354, "epoch": 1913} {"train_loss": -6.0660529136657715, "global_step": 80355, "epoch": 1913} {"train_loss": -6.054459095001221, "global_step": 80356, "epoch": 1913} {"train_loss": -6.138324737548828, "global_step": 80357, "epoch": 1913} {"train_loss": -6.07846736907959, "global_step": 80358, "epoch": 1913} {"train_loss": -6.080281734466553, "global_step": 80359, "epoch": 1913} {"train_loss": -6.085765838623047, "global_step": 80360, "epoch": 1913} {"train_loss": -6.139825820922852, "global_step": 80361, "epoch": 1913} {"train_loss": -6.161273002624512, "global_step": 80362, "epoch": 1913} {"train_loss": -6.0822343826293945, "global_step": 80363, "epoch": 1913} {"train_loss": -6.250239849090576, "global_step": 80364, "epoch": 1913} {"train_loss": -6.09003210067749, "global_step": 80365, "epoch": 1913} {"train_loss": -6.171324729919434, "global_step": 80366, "epoch": 1913} {"train_loss": -6.068266868591309, "global_step": 80367, "epoch": 1913} {"train_loss": -6.190629005432129, "global_step": 80368, "epoch": 1913} {"train_loss": -6.1271796226501465, "global_step": 80369, "epoch": 1913} {"train_loss": -6.236976623535156, "global_step": 80370, "epoch": 1913} {"train_loss": -6.248217582702637, "global_step": 80371, "epoch": 1913} {"train_loss": -6.195696830749512, "global_step": 80372, "epoch": 1913} {"train_loss": -6.070927619934082, "global_step": 80373, "epoch": 1913} {"train_loss": -6.139275550842285, "global_step": 80374, "epoch": 1913} {"train_loss": -6.10107421875, "global_step": 80375, "epoch": 1913} {"train_loss": -6.203307628631592, "global_step": 80376, "epoch": 1913} {"train_loss": -6.087615013122559, "global_step": 80377, "epoch": 1913} {"train_loss": -6.0462446212768555, "global_step": 80378, "epoch": 1913} {"train_loss": -6.311459541320801, "global_step": 80379, "epoch": 1913} {"train_loss": -6.1012749671936035, "global_step": 80380, "epoch": 1913} {"train_loss": -6.087834358215332, "global_step": 80381, "epoch": 1913} {"train_loss": -6.102645397186279, "global_step": 80382, "epoch": 1913} {"train_loss": -5.9777679443359375, "global_step": 80383, "epoch": 1913} {"train_loss": -6.0138092041015625, "global_step": 80384, "epoch": 1913} {"train_loss": -6.058345794677734, "global_step": 80385, "epoch": 1913} {"train_loss": -6.045867919921875, "global_step": 80386, "epoch": 1913} {"train_loss": -6.125715936933245, "global_step": 80387, "epoch": 1913, "val_loss": 75178.984375} {"train_loss": -6.08812141418457, "global_step": 80388, "epoch": 1914} {"train_loss": -5.993618011474609, "global_step": 80389, "epoch": 1914} {"train_loss": -6.002107620239258, "global_step": 80390, "epoch": 1914} {"train_loss": -6.124276638031006, "global_step": 80391, "epoch": 1914} {"train_loss": -6.156561851501465, "global_step": 80392, "epoch": 1914} {"train_loss": -6.1003594398498535, "global_step": 80393, "epoch": 1914} {"train_loss": -6.1767473220825195, "global_step": 80394, "epoch": 1914} {"train_loss": -6.048883438110352, "global_step": 80395, "epoch": 1914} {"train_loss": -6.084099769592285, "global_step": 80396, "epoch": 1914} {"train_loss": -6.0514068603515625, "global_step": 80397, "epoch": 1914} {"train_loss": -6.1263427734375, "global_step": 80398, "epoch": 1914} {"train_loss": -5.999441146850586, "global_step": 80399, "epoch": 1914} {"train_loss": -6.094196319580078, "global_step": 80400, "epoch": 1914} {"train_loss": -6.096578598022461, "global_step": 80401, "epoch": 1914} {"train_loss": -6.235804080963135, "global_step": 80402, "epoch": 1914} {"train_loss": -6.123274803161621, "global_step": 80403, "epoch": 1914} {"train_loss": -6.146697044372559, "global_step": 80404, "epoch": 1914} {"train_loss": -6.141969203948975, "global_step": 80405, "epoch": 1914} {"train_loss": -6.123431205749512, "global_step": 80406, "epoch": 1914} {"train_loss": -6.236348628997803, "global_step": 80407, "epoch": 1914} {"train_loss": -6.115820407867432, "global_step": 80408, "epoch": 1914} {"train_loss": -6.166706562042236, "global_step": 80409, "epoch": 1914} {"train_loss": -6.113528251647949, "global_step": 80410, "epoch": 1914} {"train_loss": -6.207951068878174, "global_step": 80411, "epoch": 1914} {"train_loss": -6.139408111572266, "global_step": 80412, "epoch": 1914} {"train_loss": -6.272683143615723, "global_step": 80413, "epoch": 1914} {"train_loss": -6.166258811950684, "global_step": 80414, "epoch": 1914} {"train_loss": -6.232638359069824, "global_step": 80415, "epoch": 1914} {"train_loss": -6.097848892211914, "global_step": 80416, "epoch": 1914} {"train_loss": -6.162040710449219, "global_step": 80417, "epoch": 1914} {"train_loss": -6.181624889373779, "global_step": 80418, "epoch": 1914} {"train_loss": -6.236322402954102, "global_step": 80419, "epoch": 1914} {"train_loss": -6.2493085861206055, "global_step": 80420, "epoch": 1914} {"train_loss": -6.23537540435791, "global_step": 80421, "epoch": 1914} {"train_loss": -6.170207977294922, "global_step": 80422, "epoch": 1914} {"train_loss": -5.997780799865723, "global_step": 80423, "epoch": 1914} {"train_loss": -6.13485860824585, "global_step": 80424, "epoch": 1914} {"train_loss": -6.205417156219482, "global_step": 80425, "epoch": 1914} {"train_loss": -6.058342933654785, "global_step": 80426, "epoch": 1914} {"train_loss": -6.000487327575684, "global_step": 80427, "epoch": 1914} {"train_loss": -6.121435165405273, "global_step": 80428, "epoch": 1914} {"train_loss": -6.133140779676891, "global_step": 80429, "epoch": 1914, "val_loss": 75071.8359375} {"train_loss": -6.121026039123535, "global_step": 80430, "epoch": 1915} {"train_loss": -6.119402885437012, "global_step": 80431, "epoch": 1915} {"train_loss": -6.160677909851074, "global_step": 80432, "epoch": 1915} {"train_loss": -6.05922794342041, "global_step": 80433, "epoch": 1915} {"train_loss": -6.079106330871582, "global_step": 80434, "epoch": 1915} {"train_loss": -6.151951789855957, "global_step": 80435, "epoch": 1915} {"train_loss": -6.155314922332764, "global_step": 80436, "epoch": 1915} {"train_loss": -6.280886650085449, "global_step": 80437, "epoch": 1915} {"train_loss": -6.101472854614258, "global_step": 80438, "epoch": 1915} {"train_loss": -6.116707801818848, "global_step": 80439, "epoch": 1915} {"train_loss": -6.101056098937988, "global_step": 80440, "epoch": 1915} {"train_loss": -6.078027725219727, "global_step": 80441, "epoch": 1915} {"train_loss": -6.091216087341309, "global_step": 80442, "epoch": 1915} {"train_loss": -6.2015838623046875, "global_step": 80443, "epoch": 1915} {"train_loss": -6.123174667358398, "global_step": 80444, "epoch": 1915} {"train_loss": -6.262779235839844, "global_step": 80445, "epoch": 1915} {"train_loss": -6.214582443237305, "global_step": 80446, "epoch": 1915} {"train_loss": -6.192673683166504, "global_step": 80447, "epoch": 1915} {"train_loss": -6.216604232788086, "global_step": 80448, "epoch": 1915} {"train_loss": -6.226279258728027, "global_step": 80449, "epoch": 1915} {"train_loss": -6.210238456726074, "global_step": 80450, "epoch": 1915} {"train_loss": -6.137144088745117, "global_step": 80451, "epoch": 1915} {"train_loss": -6.074029922485352, "global_step": 80452, "epoch": 1915} {"train_loss": -6.173699378967285, "global_step": 80453, "epoch": 1915} {"train_loss": -6.047662258148193, "global_step": 80454, "epoch": 1915} {"train_loss": -6.0938005447387695, "global_step": 80455, "epoch": 1915} {"train_loss": -6.203228950500488, "global_step": 80456, "epoch": 1915} {"train_loss": -6.1103081703186035, "global_step": 80457, "epoch": 1915} {"train_loss": -6.11649751663208, "global_step": 80458, "epoch": 1915} {"train_loss": -6.028914451599121, "global_step": 80459, "epoch": 1915} {"train_loss": -6.038638114929199, "global_step": 80460, "epoch": 1915} {"train_loss": -6.123826026916504, "global_step": 80461, "epoch": 1915} {"train_loss": -6.011965274810791, "global_step": 80462, "epoch": 1915} {"train_loss": -6.150579929351807, "global_step": 80463, "epoch": 1915} {"train_loss": -6.05444860458374, "global_step": 80464, "epoch": 1915} {"train_loss": -5.973935127258301, "global_step": 80465, "epoch": 1915} {"train_loss": -6.024598121643066, "global_step": 80466, "epoch": 1915} {"train_loss": -6.060613632202148, "global_step": 80467, "epoch": 1915} {"train_loss": -6.0693488121032715, "global_step": 80468, "epoch": 1915} {"train_loss": -6.032804489135742, "global_step": 80469, "epoch": 1915} {"train_loss": -6.119278907775879, "global_step": 80470, "epoch": 1915} {"train_loss": -6.118048622494652, "global_step": 80471, "epoch": 1915, "val_loss": 75060.953125} {"train_loss": -6.165650367736816, "global_step": 80472, "epoch": 1916} {"train_loss": -6.118609428405762, "global_step": 80473, "epoch": 1916} {"train_loss": -6.113612174987793, "global_step": 80474, "epoch": 1916} {"train_loss": -6.087545871734619, "global_step": 80475, "epoch": 1916} {"train_loss": -6.151668548583984, "global_step": 80476, "epoch": 1916} {"train_loss": -6.144105911254883, "global_step": 80477, "epoch": 1916} {"train_loss": -6.060063362121582, "global_step": 80478, "epoch": 1916} {"train_loss": -6.170366287231445, "global_step": 80479, "epoch": 1916} {"train_loss": -6.200937271118164, "global_step": 80480, "epoch": 1916} {"train_loss": -6.234298229217529, "global_step": 80481, "epoch": 1916} {"train_loss": -6.173186302185059, "global_step": 80482, "epoch": 1916} {"train_loss": -6.142637252807617, "global_step": 80483, "epoch": 1916} {"train_loss": -6.267358303070068, "global_step": 80484, "epoch": 1916} {"train_loss": -6.17851448059082, "global_step": 80485, "epoch": 1916} {"train_loss": -6.108905792236328, "global_step": 80486, "epoch": 1916} {"train_loss": -6.131086349487305, "global_step": 80487, "epoch": 1916} {"train_loss": -6.114182472229004, "global_step": 80488, "epoch": 1916} {"train_loss": -6.183267593383789, "global_step": 80489, "epoch": 1916} {"train_loss": -6.1860880851745605, "global_step": 80490, "epoch": 1916} {"train_loss": -6.24845027923584, "global_step": 80491, "epoch": 1916} {"train_loss": -6.099004745483398, "global_step": 80492, "epoch": 1916} {"train_loss": -6.1523261070251465, "global_step": 80493, "epoch": 1916} {"train_loss": -6.121264457702637, "global_step": 80494, "epoch": 1916} {"train_loss": -6.0897932052612305, "global_step": 80495, "epoch": 1916} {"train_loss": -6.094030857086182, "global_step": 80496, "epoch": 1916} {"train_loss": -6.165122032165527, "global_step": 80497, "epoch": 1916} {"train_loss": -6.210152626037598, "global_step": 80498, "epoch": 1916} {"train_loss": -6.083883285522461, "global_step": 80499, "epoch": 1916} {"train_loss": -6.149574279785156, "global_step": 80500, "epoch": 1916} {"train_loss": -6.271198272705078, "global_step": 80501, "epoch": 1916} {"train_loss": -6.07912015914917, "global_step": 80502, "epoch": 1916} {"train_loss": -6.056710720062256, "global_step": 80503, "epoch": 1916} {"train_loss": -6.186514854431152, "global_step": 80504, "epoch": 1916} {"train_loss": -6.14671516418457, "global_step": 80505, "epoch": 1916} {"train_loss": -6.136186122894287, "global_step": 80506, "epoch": 1916} {"train_loss": -6.129436492919922, "global_step": 80507, "epoch": 1916} {"train_loss": -6.176184177398682, "global_step": 80508, "epoch": 1916} {"train_loss": -6.277944087982178, "global_step": 80509, "epoch": 1916} {"train_loss": -6.101856708526611, "global_step": 80510, "epoch": 1916} {"train_loss": -6.043283939361572, "global_step": 80511, "epoch": 1916} {"train_loss": -6.161210060119629, "global_step": 80512, "epoch": 1916} {"train_loss": -6.148974600292387, "global_step": 80513, "epoch": 1916, "val_loss": 74875.40625} {"train_loss": -6.050347805023193, "global_step": 80514, "epoch": 1917} {"train_loss": -6.167333602905273, "global_step": 80515, "epoch": 1917} {"train_loss": -6.219521522521973, "global_step": 80516, "epoch": 1917} {"train_loss": -6.042858123779297, "global_step": 80517, "epoch": 1917} {"train_loss": -6.198822021484375, "global_step": 80518, "epoch": 1917} {"train_loss": -6.114860534667969, "global_step": 80519, "epoch": 1917} {"train_loss": -6.085146903991699, "global_step": 80520, "epoch": 1917} {"train_loss": -6.131443023681641, "global_step": 80521, "epoch": 1917} {"train_loss": -5.905704498291016, "global_step": 80522, "epoch": 1917} {"train_loss": -6.133966445922852, "global_step": 80523, "epoch": 1917} {"train_loss": -6.2465033531188965, "global_step": 80524, "epoch": 1917} {"train_loss": -6.169598579406738, "global_step": 80525, "epoch": 1917} {"train_loss": -6.106377601623535, "global_step": 80526, "epoch": 1917} {"train_loss": -6.10611629486084, "global_step": 80527, "epoch": 1917} {"train_loss": -6.162364482879639, "global_step": 80528, "epoch": 1917} {"train_loss": -6.236865043640137, "global_step": 80529, "epoch": 1917} {"train_loss": -6.204798698425293, "global_step": 80530, "epoch": 1917} {"train_loss": -6.221651077270508, "global_step": 80531, "epoch": 1917} {"train_loss": -6.135859489440918, "global_step": 80532, "epoch": 1917} {"train_loss": -6.168997764587402, "global_step": 80533, "epoch": 1917} {"train_loss": -6.162784576416016, "global_step": 80534, "epoch": 1917} {"train_loss": -6.178910255432129, "global_step": 80535, "epoch": 1917} {"train_loss": -6.0386810302734375, "global_step": 80536, "epoch": 1917} {"train_loss": -6.196659088134766, "global_step": 80537, "epoch": 1917} {"train_loss": -6.187521934509277, "global_step": 80538, "epoch": 1917} {"train_loss": -6.232619762420654, "global_step": 80539, "epoch": 1917} {"train_loss": -6.098039150238037, "global_step": 80540, "epoch": 1917} {"train_loss": -6.161290645599365, "global_step": 80541, "epoch": 1917} {"train_loss": -6.199739456176758, "global_step": 80542, "epoch": 1917} {"train_loss": -6.1535563468933105, "global_step": 80543, "epoch": 1917} {"train_loss": -6.0081787109375, "global_step": 80544, "epoch": 1917} {"train_loss": -6.140691757202148, "global_step": 80545, "epoch": 1917} {"train_loss": -6.123848915100098, "global_step": 80546, "epoch": 1917} {"train_loss": -6.227540969848633, "global_step": 80547, "epoch": 1917} {"train_loss": -6.127384185791016, "global_step": 80548, "epoch": 1917} {"train_loss": -6.091275215148926, "global_step": 80549, "epoch": 1917} {"train_loss": -6.2649688720703125, "global_step": 80550, "epoch": 1917} {"train_loss": -6.146442890167236, "global_step": 80551, "epoch": 1917} {"train_loss": -6.053913116455078, "global_step": 80552, "epoch": 1917} {"train_loss": -6.185447692871094, "global_step": 80553, "epoch": 1917} {"train_loss": -6.193539619445801, "global_step": 80554, "epoch": 1917} {"train_loss": -6.143542584918794, "global_step": 80555, "epoch": 1917, "val_loss": 74969.1484375} {"train_loss": -6.066584587097168, "global_step": 80556, "epoch": 1918} {"train_loss": -6.205089569091797, "global_step": 80557, "epoch": 1918} {"train_loss": -6.127568244934082, "global_step": 80558, "epoch": 1918} {"train_loss": -6.058459758758545, "global_step": 80559, "epoch": 1918} {"train_loss": -6.134661674499512, "global_step": 80560, "epoch": 1918} {"train_loss": -6.061535835266113, "global_step": 80561, "epoch": 1918} {"train_loss": -6.170657157897949, "global_step": 80562, "epoch": 1918} {"train_loss": -6.108928680419922, "global_step": 80563, "epoch": 1918} {"train_loss": -6.13389253616333, "global_step": 80564, "epoch": 1918} {"train_loss": -6.2738542556762695, "global_step": 80565, "epoch": 1918} {"train_loss": -6.046019554138184, "global_step": 80566, "epoch": 1918} {"train_loss": -5.989536285400391, "global_step": 80567, "epoch": 1918} {"train_loss": -6.175840377807617, "global_step": 80568, "epoch": 1918} {"train_loss": -6.02182674407959, "global_step": 80569, "epoch": 1918} {"train_loss": -6.018784523010254, "global_step": 80570, "epoch": 1918} {"train_loss": -6.023448944091797, "global_step": 80571, "epoch": 1918} {"train_loss": -6.036322593688965, "global_step": 80572, "epoch": 1918} {"train_loss": -6.169118881225586, "global_step": 80573, "epoch": 1918} {"train_loss": -5.99730920791626, "global_step": 80574, "epoch": 1918} {"train_loss": -6.091654300689697, "global_step": 80575, "epoch": 1918} {"train_loss": -6.102411270141602, "global_step": 80576, "epoch": 1918} {"train_loss": -5.9110846519470215, "global_step": 80577, "epoch": 1918} {"train_loss": -5.983111381530762, "global_step": 80578, "epoch": 1918} {"train_loss": -6.010006904602051, "global_step": 80579, "epoch": 1918} {"train_loss": -6.168971538543701, "global_step": 80580, "epoch": 1918} {"train_loss": -5.9695234298706055, "global_step": 80581, "epoch": 1918} {"train_loss": -6.234634876251221, "global_step": 80582, "epoch": 1918} {"train_loss": -6.014614105224609, "global_step": 80583, "epoch": 1918} {"train_loss": -6.147152900695801, "global_step": 80584, "epoch": 1918} {"train_loss": -6.094165802001953, "global_step": 80585, "epoch": 1918} {"train_loss": -6.213350296020508, "global_step": 80586, "epoch": 1918} {"train_loss": -6.020197868347168, "global_step": 80587, "epoch": 1918} {"train_loss": -6.159255504608154, "global_step": 80588, "epoch": 1918} {"train_loss": -6.055059432983398, "global_step": 80589, "epoch": 1918} {"train_loss": -6.2297210693359375, "global_step": 80590, "epoch": 1918} {"train_loss": -6.101663112640381, "global_step": 80591, "epoch": 1918} {"train_loss": -6.13498067855835, "global_step": 80592, "epoch": 1918} {"train_loss": -6.119874954223633, "global_step": 80593, "epoch": 1918} {"train_loss": -6.039238929748535, "global_step": 80594, "epoch": 1918} {"train_loss": -6.20149040222168, "global_step": 80595, "epoch": 1918} {"train_loss": -6.162113189697266, "global_step": 80596, "epoch": 1918} {"train_loss": -6.098500229063488, "global_step": 80597, "epoch": 1918, "val_loss": 74724.46875} {"train_loss": -6.107988357543945, "global_step": 80598, "epoch": 1919} {"train_loss": -6.202391624450684, "global_step": 80599, "epoch": 1919} {"train_loss": -6.08848762512207, "global_step": 80600, "epoch": 1919} {"train_loss": -6.147525787353516, "global_step": 80601, "epoch": 1919} {"train_loss": -6.126913070678711, "global_step": 80602, "epoch": 1919} {"train_loss": -6.1960344314575195, "global_step": 80603, "epoch": 1919} {"train_loss": -6.182003021240234, "global_step": 80604, "epoch": 1919} {"train_loss": -6.282183647155762, "global_step": 80605, "epoch": 1919} {"train_loss": -6.17439079284668, "global_step": 80606, "epoch": 1919} {"train_loss": -6.207759857177734, "global_step": 80607, "epoch": 1919} {"train_loss": -6.175965309143066, "global_step": 80608, "epoch": 1919} {"train_loss": -6.1819963455200195, "global_step": 80609, "epoch": 1919} {"train_loss": -6.234724521636963, "global_step": 80610, "epoch": 1919} {"train_loss": -6.234559059143066, "global_step": 80611, "epoch": 1919} {"train_loss": -6.188225746154785, "global_step": 80612, "epoch": 1919} {"train_loss": -6.036293983459473, "global_step": 80613, "epoch": 1919} {"train_loss": -6.167839050292969, "global_step": 80614, "epoch": 1919} {"train_loss": -6.175139904022217, "global_step": 80615, "epoch": 1919} {"train_loss": -6.201169490814209, "global_step": 80616, "epoch": 1919} {"train_loss": -6.2024688720703125, "global_step": 80617, "epoch": 1919} {"train_loss": -6.200183868408203, "global_step": 80618, "epoch": 1919} {"train_loss": -5.98248291015625, "global_step": 80619, "epoch": 1919} {"train_loss": -6.036249160766602, "global_step": 80620, "epoch": 1919} {"train_loss": -6.1020612716674805, "global_step": 80621, "epoch": 1919} {"train_loss": -6.199879169464111, "global_step": 80622, "epoch": 1919} {"train_loss": -6.095733642578125, "global_step": 80623, "epoch": 1919} {"train_loss": -6.157965660095215, "global_step": 80624, "epoch": 1919} {"train_loss": -6.278014659881592, "global_step": 80625, "epoch": 1919} {"train_loss": -6.037858486175537, "global_step": 80626, "epoch": 1919} {"train_loss": -6.204190254211426, "global_step": 80627, "epoch": 1919} {"train_loss": -6.212543964385986, "global_step": 80628, "epoch": 1919} {"train_loss": -6.252027988433838, "global_step": 80629, "epoch": 1919} {"train_loss": -6.144246578216553, "global_step": 80630, "epoch": 1919} {"train_loss": -6.19468355178833, "global_step": 80631, "epoch": 1919} {"train_loss": -6.200832366943359, "global_step": 80632, "epoch": 1919} {"train_loss": -6.036391735076904, "global_step": 80633, "epoch": 1919} {"train_loss": -6.172163963317871, "global_step": 80634, "epoch": 1919} {"train_loss": -6.074234962463379, "global_step": 80635, "epoch": 1919} {"train_loss": -6.189000606536865, "global_step": 80636, "epoch": 1919} {"train_loss": -6.189376354217529, "global_step": 80637, "epoch": 1919} {"train_loss": -6.151465892791748, "global_step": 80638, "epoch": 1919} {"train_loss": -6.160196508680071, "global_step": 80639, "epoch": 1919, "val_loss": 75190.3125} {"train_loss": -5.996936798095703, "global_step": 80640, "epoch": 1920} {"train_loss": -6.136404991149902, "global_step": 80641, "epoch": 1920} {"train_loss": -6.126490592956543, "global_step": 80642, "epoch": 1920} {"train_loss": -6.121711254119873, "global_step": 80643, "epoch": 1920} {"train_loss": -5.914737224578857, "global_step": 80644, "epoch": 1920} {"train_loss": -6.0519561767578125, "global_step": 80645, "epoch": 1920} {"train_loss": -6.087935447692871, "global_step": 80646, "epoch": 1920} {"train_loss": -6.092630863189697, "global_step": 80647, "epoch": 1920} {"train_loss": -5.968868255615234, "global_step": 80648, "epoch": 1920} {"train_loss": -6.227515697479248, "global_step": 80649, "epoch": 1920} {"train_loss": -6.061423301696777, "global_step": 80650, "epoch": 1920} {"train_loss": -6.149256706237793, "global_step": 80651, "epoch": 1920} {"train_loss": -6.076471328735352, "global_step": 80652, "epoch": 1920} {"train_loss": -6.0379109382629395, "global_step": 80653, "epoch": 1920} {"train_loss": -6.129955291748047, "global_step": 80654, "epoch": 1920} {"train_loss": -5.996011734008789, "global_step": 80655, "epoch": 1920} {"train_loss": -6.184398174285889, "global_step": 80656, "epoch": 1920} {"train_loss": -6.121187210083008, "global_step": 80657, "epoch": 1920} {"train_loss": -6.166914939880371, "global_step": 80658, "epoch": 1920} {"train_loss": -6.120273590087891, "global_step": 80659, "epoch": 1920} {"train_loss": -6.134174823760986, "global_step": 80660, "epoch": 1920} {"train_loss": -6.160219192504883, "global_step": 80661, "epoch": 1920} {"train_loss": -6.160811424255371, "global_step": 80662, "epoch": 1920} {"train_loss": -6.212165355682373, "global_step": 80663, "epoch": 1920} {"train_loss": -6.19191312789917, "global_step": 80664, "epoch": 1920} {"train_loss": -6.0484619140625, "global_step": 80665, "epoch": 1920} {"train_loss": -6.046217441558838, "global_step": 80666, "epoch": 1920} {"train_loss": -5.987476348876953, "global_step": 80667, "epoch": 1920} {"train_loss": -6.186986923217773, "global_step": 80668, "epoch": 1920} {"train_loss": -6.199185371398926, "global_step": 80669, "epoch": 1920} {"train_loss": -5.949291229248047, "global_step": 80670, "epoch": 1920} {"train_loss": -6.229072570800781, "global_step": 80671, "epoch": 1920} {"train_loss": -6.1497626304626465, "global_step": 80672, "epoch": 1920} {"train_loss": -6.090588569641113, "global_step": 80673, "epoch": 1920} {"train_loss": -6.134766578674316, "global_step": 80674, "epoch": 1920} {"train_loss": -6.111911296844482, "global_step": 80675, "epoch": 1920} {"train_loss": -6.207295894622803, "global_step": 80676, "epoch": 1920} {"train_loss": -6.209777355194092, "global_step": 80677, "epoch": 1920} {"train_loss": -6.014830589294434, "global_step": 80678, "epoch": 1920} {"train_loss": -6.277254104614258, "global_step": 80679, "epoch": 1920} {"train_loss": -6.117737770080566, "global_step": 80680, "epoch": 1920} {"train_loss": -6.116285051618304, "global_step": 80681, "epoch": 1920, "val_loss": 75117.6484375} {"train_loss": -6.1761474609375, "global_step": 80682, "epoch": 1921} {"train_loss": -6.173826217651367, "global_step": 80683, "epoch": 1921} {"train_loss": -6.198183059692383, "global_step": 80684, "epoch": 1921} {"train_loss": -6.182941436767578, "global_step": 80685, "epoch": 1921} {"train_loss": -6.242402076721191, "global_step": 80686, "epoch": 1921} {"train_loss": -6.141941070556641, "global_step": 80687, "epoch": 1921} {"train_loss": -6.178290367126465, "global_step": 80688, "epoch": 1921} {"train_loss": -6.241591453552246, "global_step": 80689, "epoch": 1921} {"train_loss": -6.122427940368652, "global_step": 80690, "epoch": 1921} {"train_loss": -6.145017147064209, "global_step": 80691, "epoch": 1921} {"train_loss": -6.154380798339844, "global_step": 80692, "epoch": 1921} {"train_loss": -6.061155319213867, "global_step": 80693, "epoch": 1921} {"train_loss": -6.129542827606201, "global_step": 80694, "epoch": 1921} {"train_loss": -6.042834281921387, "global_step": 80695, "epoch": 1921} {"train_loss": -6.201796531677246, "global_step": 80696, "epoch": 1921} {"train_loss": -6.0315985679626465, "global_step": 80697, "epoch": 1921} {"train_loss": -6.201694965362549, "global_step": 80698, "epoch": 1921} {"train_loss": -6.148148536682129, "global_step": 80699, "epoch": 1921} {"train_loss": -6.150386810302734, "global_step": 80700, "epoch": 1921} {"train_loss": -6.049463272094727, "global_step": 80701, "epoch": 1921} {"train_loss": -6.217119216918945, "global_step": 80702, "epoch": 1921} {"train_loss": -6.106562614440918, "global_step": 80703, "epoch": 1921} {"train_loss": -6.044593811035156, "global_step": 80704, "epoch": 1921} {"train_loss": -6.240694046020508, "global_step": 80705, "epoch": 1921} {"train_loss": -6.072224140167236, "global_step": 80706, "epoch": 1921} {"train_loss": -6.027065277099609, "global_step": 80707, "epoch": 1921} {"train_loss": -6.158301830291748, "global_step": 80708, "epoch": 1921} {"train_loss": -6.0917463302612305, "global_step": 80709, "epoch": 1921} {"train_loss": -6.039297103881836, "global_step": 80710, "epoch": 1921} {"train_loss": -6.121150970458984, "global_step": 80711, "epoch": 1921} {"train_loss": -6.074963569641113, "global_step": 80712, "epoch": 1921} {"train_loss": -6.085005760192871, "global_step": 80713, "epoch": 1921} {"train_loss": -5.987118244171143, "global_step": 80714, "epoch": 1921} {"train_loss": -6.1147003173828125, "global_step": 80715, "epoch": 1921} {"train_loss": -6.202090263366699, "global_step": 80716, "epoch": 1921} {"train_loss": -6.110738754272461, "global_step": 80717, "epoch": 1921} {"train_loss": -6.108755111694336, "global_step": 80718, "epoch": 1921} {"train_loss": -6.045045375823975, "global_step": 80719, "epoch": 1921} {"train_loss": -6.008255481719971, "global_step": 80720, "epoch": 1921} {"train_loss": -6.104819297790527, "global_step": 80721, "epoch": 1921} {"train_loss": -6.037164688110352, "global_step": 80722, "epoch": 1921} {"train_loss": -6.122677575974238, "global_step": 80723, "epoch": 1921, "val_loss": 74830.8984375} {"train_loss": -6.220502853393555, "global_step": 80724, "epoch": 1922} {"train_loss": -6.183119773864746, "global_step": 80725, "epoch": 1922} {"train_loss": -6.025786399841309, "global_step": 80726, "epoch": 1922} {"train_loss": -6.114884853363037, "global_step": 80727, "epoch": 1922} {"train_loss": -6.201108932495117, "global_step": 80728, "epoch": 1922} {"train_loss": -6.2083282470703125, "global_step": 80729, "epoch": 1922} {"train_loss": -6.122583389282227, "global_step": 80730, "epoch": 1922} {"train_loss": -6.15321159362793, "global_step": 80731, "epoch": 1922} {"train_loss": -6.1981916427612305, "global_step": 80732, "epoch": 1922} {"train_loss": -6.1631059646606445, "global_step": 80733, "epoch": 1922} {"train_loss": -6.158011436462402, "global_step": 80734, "epoch": 1922} {"train_loss": -6.235651969909668, "global_step": 80735, "epoch": 1922} {"train_loss": -6.068811416625977, "global_step": 80736, "epoch": 1922} {"train_loss": -6.03785514831543, "global_step": 80737, "epoch": 1922} {"train_loss": -6.16064977645874, "global_step": 80738, "epoch": 1922} {"train_loss": -6.076770782470703, "global_step": 80739, "epoch": 1922} {"train_loss": -6.124143600463867, "global_step": 80740, "epoch": 1922} {"train_loss": -6.251010894775391, "global_step": 80741, "epoch": 1922} {"train_loss": -6.065023422241211, "global_step": 80742, "epoch": 1922} {"train_loss": -5.998913288116455, "global_step": 80743, "epoch": 1922} {"train_loss": -6.052350997924805, "global_step": 80744, "epoch": 1922} {"train_loss": -5.847064971923828, "global_step": 80745, "epoch": 1922} {"train_loss": -6.125482559204102, "global_step": 80746, "epoch": 1922} {"train_loss": -6.062641143798828, "global_step": 80747, "epoch": 1922} {"train_loss": -6.097324371337891, "global_step": 80748, "epoch": 1922} {"train_loss": -6.163532257080078, "global_step": 80749, "epoch": 1922} {"train_loss": -5.987779140472412, "global_step": 80750, "epoch": 1922} {"train_loss": -6.170056343078613, "global_step": 80751, "epoch": 1922} {"train_loss": -6.067574501037598, "global_step": 80752, "epoch": 1922} {"train_loss": -6.137162685394287, "global_step": 80753, "epoch": 1922} {"train_loss": -6.205717086791992, "global_step": 80754, "epoch": 1922} {"train_loss": -6.087162017822266, "global_step": 80755, "epoch": 1922} {"train_loss": -6.2134013175964355, "global_step": 80756, "epoch": 1922} {"train_loss": -6.199044227600098, "global_step": 80757, "epoch": 1922} {"train_loss": -6.274451732635498, "global_step": 80758, "epoch": 1922} {"train_loss": -6.239188194274902, "global_step": 80759, "epoch": 1922} {"train_loss": -6.094625473022461, "global_step": 80760, "epoch": 1922} {"train_loss": -6.100886344909668, "global_step": 80761, "epoch": 1922} {"train_loss": -6.073230743408203, "global_step": 80762, "epoch": 1922} {"train_loss": -5.993719577789307, "global_step": 80763, "epoch": 1922} {"train_loss": -6.228727340698242, "global_step": 80764, "epoch": 1922} {"train_loss": -6.128845703034174, "global_step": 80765, "epoch": 1922, "val_loss": 74955.34375} {"train_loss": -6.200141429901123, "global_step": 80766, "epoch": 1923} {"train_loss": -6.0637898445129395, "global_step": 80767, "epoch": 1923} {"train_loss": -6.068017959594727, "global_step": 80768, "epoch": 1923} {"train_loss": -6.138426303863525, "global_step": 80769, "epoch": 1923} {"train_loss": -6.160008430480957, "global_step": 80770, "epoch": 1923} {"train_loss": -6.24589729309082, "global_step": 80771, "epoch": 1923} {"train_loss": -6.073655128479004, "global_step": 80772, "epoch": 1923} {"train_loss": -5.998412609100342, "global_step": 80773, "epoch": 1923} {"train_loss": -6.070713996887207, "global_step": 80774, "epoch": 1923} {"train_loss": -6.092139720916748, "global_step": 80775, "epoch": 1923} {"train_loss": -6.196659088134766, "global_step": 80776, "epoch": 1923} {"train_loss": -6.094971656799316, "global_step": 80777, "epoch": 1923} {"train_loss": -6.0236334800720215, "global_step": 80778, "epoch": 1923} {"train_loss": -6.173863410949707, "global_step": 80779, "epoch": 1923} {"train_loss": -5.975943565368652, "global_step": 80780, "epoch": 1923} {"train_loss": -6.282768249511719, "global_step": 80781, "epoch": 1923} {"train_loss": -6.118193626403809, "global_step": 80782, "epoch": 1923} {"train_loss": -6.036618709564209, "global_step": 80783, "epoch": 1923} {"train_loss": -6.1183695793151855, "global_step": 80784, "epoch": 1923} {"train_loss": -6.02752685546875, "global_step": 80785, "epoch": 1923} {"train_loss": -6.149378776550293, "global_step": 80786, "epoch": 1923} {"train_loss": -5.993000507354736, "global_step": 80787, "epoch": 1923} {"train_loss": -6.091867446899414, "global_step": 80788, "epoch": 1923} {"train_loss": -6.095918655395508, "global_step": 80789, "epoch": 1923} {"train_loss": -6.08674430847168, "global_step": 80790, "epoch": 1923} {"train_loss": -6.15947151184082, "global_step": 80791, "epoch": 1923} {"train_loss": -6.240588665008545, "global_step": 80792, "epoch": 1923} {"train_loss": -6.145471572875977, "global_step": 80793, "epoch": 1923} {"train_loss": -6.199521541595459, "global_step": 80794, "epoch": 1923} {"train_loss": -6.294750213623047, "global_step": 80795, "epoch": 1923} {"train_loss": -6.1273698806762695, "global_step": 80796, "epoch": 1923} {"train_loss": -6.2926530838012695, "global_step": 80797, "epoch": 1923} {"train_loss": -6.139188289642334, "global_step": 80798, "epoch": 1923} {"train_loss": -6.062178134918213, "global_step": 80799, "epoch": 1923} {"train_loss": -6.148854732513428, "global_step": 80800, "epoch": 1923} {"train_loss": -6.198631286621094, "global_step": 80801, "epoch": 1923} {"train_loss": -6.200916290283203, "global_step": 80802, "epoch": 1923} {"train_loss": -6.201388835906982, "global_step": 80803, "epoch": 1923} {"train_loss": -6.074563026428223, "global_step": 80804, "epoch": 1923} {"train_loss": -6.069343090057373, "global_step": 80805, "epoch": 1923} {"train_loss": -6.1447954177856445, "global_step": 80806, "epoch": 1923} {"train_loss": -6.129564217158726, "global_step": 80807, "epoch": 1923, "val_loss": 75105.4765625} {"train_loss": -6.0027666091918945, "global_step": 80808, "epoch": 1924} {"train_loss": -6.172319412231445, "global_step": 80809, "epoch": 1924} {"train_loss": -6.039357662200928, "global_step": 80810, "epoch": 1924} {"train_loss": -6.070661544799805, "global_step": 80811, "epoch": 1924} {"train_loss": -6.001821517944336, "global_step": 80812, "epoch": 1924} {"train_loss": -6.060336112976074, "global_step": 80813, "epoch": 1924} {"train_loss": -6.089394569396973, "global_step": 80814, "epoch": 1924} {"train_loss": -6.028938293457031, "global_step": 80815, "epoch": 1924} {"train_loss": -6.168481826782227, "global_step": 80816, "epoch": 1924} {"train_loss": -6.034151077270508, "global_step": 80817, "epoch": 1924} {"train_loss": -6.147921562194824, "global_step": 80818, "epoch": 1924} {"train_loss": -6.076509475708008, "global_step": 80819, "epoch": 1924} {"train_loss": -6.144828796386719, "global_step": 80820, "epoch": 1924} {"train_loss": -6.083556175231934, "global_step": 80821, "epoch": 1924} {"train_loss": -6.026913166046143, "global_step": 80822, "epoch": 1924} {"train_loss": -6.102302551269531, "global_step": 80823, "epoch": 1924} {"train_loss": -6.204575061798096, "global_step": 80824, "epoch": 1924} {"train_loss": -6.2126784324646, "global_step": 80825, "epoch": 1924} {"train_loss": -6.006714820861816, "global_step": 80826, "epoch": 1924} {"train_loss": -6.1142964363098145, "global_step": 80827, "epoch": 1924} {"train_loss": -6.082190036773682, "global_step": 80828, "epoch": 1924} {"train_loss": -6.201047420501709, "global_step": 80829, "epoch": 1924} {"train_loss": -6.211945533752441, "global_step": 80830, "epoch": 1924} {"train_loss": -5.985505104064941, "global_step": 80831, "epoch": 1924} {"train_loss": -6.073446273803711, "global_step": 80832, "epoch": 1924} {"train_loss": -6.1250901222229, "global_step": 80833, "epoch": 1924} {"train_loss": -6.173190116882324, "global_step": 80834, "epoch": 1924} {"train_loss": -6.187652111053467, "global_step": 80835, "epoch": 1924} {"train_loss": -6.131805896759033, "global_step": 80836, "epoch": 1924} {"train_loss": -6.215750694274902, "global_step": 80837, "epoch": 1924} {"train_loss": -6.144340515136719, "global_step": 80838, "epoch": 1924} {"train_loss": -6.011199951171875, "global_step": 80839, "epoch": 1924} {"train_loss": -6.1197357177734375, "global_step": 80840, "epoch": 1924} {"train_loss": -6.19057559967041, "global_step": 80841, "epoch": 1924} {"train_loss": -6.050089359283447, "global_step": 80842, "epoch": 1924} {"train_loss": -6.064023971557617, "global_step": 80843, "epoch": 1924} {"train_loss": -6.1506757736206055, "global_step": 80844, "epoch": 1924} {"train_loss": -5.959832668304443, "global_step": 80845, "epoch": 1924} {"train_loss": -6.082029342651367, "global_step": 80846, "epoch": 1924} {"train_loss": -6.088381767272949, "global_step": 80847, "epoch": 1924} {"train_loss": -6.1335062980651855, "global_step": 80848, "epoch": 1924} {"train_loss": -6.101314578737531, "global_step": 80849, "epoch": 1924, "val_loss": 75232.28125} {"train_loss": -6.231775283813477, "global_step": 80850, "epoch": 1925} {"train_loss": -6.087663173675537, "global_step": 80851, "epoch": 1925} {"train_loss": -6.143400192260742, "global_step": 80852, "epoch": 1925} {"train_loss": -6.0505757331848145, "global_step": 80853, "epoch": 1925} {"train_loss": -6.020804405212402, "global_step": 80854, "epoch": 1925} {"train_loss": -5.985630989074707, "global_step": 80855, "epoch": 1925} {"train_loss": -6.161635875701904, "global_step": 80856, "epoch": 1925} {"train_loss": -6.222126007080078, "global_step": 80857, "epoch": 1925} {"train_loss": -6.2791314125061035, "global_step": 80858, "epoch": 1925} {"train_loss": -6.145211219787598, "global_step": 80859, "epoch": 1925} {"train_loss": -6.215450286865234, "global_step": 80860, "epoch": 1925} {"train_loss": -6.169368743896484, "global_step": 80861, "epoch": 1925} {"train_loss": -5.998193740844727, "global_step": 80862, "epoch": 1925} {"train_loss": -6.075007438659668, "global_step": 80863, "epoch": 1925} {"train_loss": -6.0924072265625, "global_step": 80864, "epoch": 1925} {"train_loss": -6.068556785583496, "global_step": 80865, "epoch": 1925} {"train_loss": -6.158297061920166, "global_step": 80866, "epoch": 1925} {"train_loss": -6.168557167053223, "global_step": 80867, "epoch": 1925} {"train_loss": -6.051403045654297, "global_step": 80868, "epoch": 1925} {"train_loss": -6.18985652923584, "global_step": 80869, "epoch": 1925} {"train_loss": -6.137446403503418, "global_step": 80870, "epoch": 1925} {"train_loss": -6.073861122131348, "global_step": 80871, "epoch": 1925} {"train_loss": -6.122081279754639, "global_step": 80872, "epoch": 1925} {"train_loss": -6.120222091674805, "global_step": 80873, "epoch": 1925} {"train_loss": -6.157168865203857, "global_step": 80874, "epoch": 1925} {"train_loss": -6.147885799407959, "global_step": 80875, "epoch": 1925} {"train_loss": -6.104055404663086, "global_step": 80876, "epoch": 1925} {"train_loss": -6.045949459075928, "global_step": 80877, "epoch": 1925} {"train_loss": -6.155773162841797, "global_step": 80878, "epoch": 1925} {"train_loss": -6.1437788009643555, "global_step": 80879, "epoch": 1925} {"train_loss": -6.053996562957764, "global_step": 80880, "epoch": 1925} {"train_loss": -6.1887335777282715, "global_step": 80881, "epoch": 1925} {"train_loss": -6.192790985107422, "global_step": 80882, "epoch": 1925} {"train_loss": -6.047067642211914, "global_step": 80883, "epoch": 1925} {"train_loss": -6.215387344360352, "global_step": 80884, "epoch": 1925} {"train_loss": -6.113234043121338, "global_step": 80885, "epoch": 1925} {"train_loss": -6.130683898925781, "global_step": 80886, "epoch": 1925} {"train_loss": -6.182553291320801, "global_step": 80887, "epoch": 1925} {"train_loss": -6.120708465576172, "global_step": 80888, "epoch": 1925} {"train_loss": -6.15386962890625, "global_step": 80889, "epoch": 1925} {"train_loss": -6.070324897766113, "global_step": 80890, "epoch": 1925} {"train_loss": -6.127158392043341, "global_step": 80891, "epoch": 1925, "val_loss": 74922.640625} {"train_loss": -6.102079391479492, "global_step": 80892, "epoch": 1926} {"train_loss": -6.129757881164551, "global_step": 80893, "epoch": 1926} {"train_loss": -6.191201686859131, "global_step": 80894, "epoch": 1926} {"train_loss": -5.9803948402404785, "global_step": 80895, "epoch": 1926} {"train_loss": -6.126808166503906, "global_step": 80896, "epoch": 1926} {"train_loss": -6.109136581420898, "global_step": 80897, "epoch": 1926} {"train_loss": -6.190836429595947, "global_step": 80898, "epoch": 1926} {"train_loss": -6.210038185119629, "global_step": 80899, "epoch": 1926} {"train_loss": -6.047426223754883, "global_step": 80900, "epoch": 1926} {"train_loss": -6.132193088531494, "global_step": 80901, "epoch": 1926} {"train_loss": -6.054935455322266, "global_step": 80902, "epoch": 1926} {"train_loss": -6.014255523681641, "global_step": 80903, "epoch": 1926} {"train_loss": -6.249329566955566, "global_step": 80904, "epoch": 1926} {"train_loss": -6.223183631896973, "global_step": 80905, "epoch": 1926} {"train_loss": -5.999111175537109, "global_step": 80906, "epoch": 1926} {"train_loss": -6.073225498199463, "global_step": 80907, "epoch": 1926} {"train_loss": -6.204946994781494, "global_step": 80908, "epoch": 1926} {"train_loss": -6.157188415527344, "global_step": 80909, "epoch": 1926} {"train_loss": -6.294519424438477, "global_step": 80910, "epoch": 1926} {"train_loss": -6.167386531829834, "global_step": 80911, "epoch": 1926} {"train_loss": -6.2218475341796875, "global_step": 80912, "epoch": 1926} {"train_loss": -6.1226887702941895, "global_step": 80913, "epoch": 1926} {"train_loss": -6.239130020141602, "global_step": 80914, "epoch": 1926} {"train_loss": -6.169816017150879, "global_step": 80915, "epoch": 1926} {"train_loss": -6.22209358215332, "global_step": 80916, "epoch": 1926} {"train_loss": -6.177929878234863, "global_step": 80917, "epoch": 1926} {"train_loss": -6.083913803100586, "global_step": 80918, "epoch": 1926} {"train_loss": -6.1851677894592285, "global_step": 80919, "epoch": 1926} {"train_loss": -6.187257766723633, "global_step": 80920, "epoch": 1926} {"train_loss": -5.991016864776611, "global_step": 80921, "epoch": 1926} {"train_loss": -6.210698127746582, "global_step": 80922, "epoch": 1926} {"train_loss": -6.118015289306641, "global_step": 80923, "epoch": 1926} {"train_loss": -6.071974277496338, "global_step": 80924, "epoch": 1926} {"train_loss": -6.133011341094971, "global_step": 80925, "epoch": 1926} {"train_loss": -6.146366119384766, "global_step": 80926, "epoch": 1926} {"train_loss": -6.237682342529297, "global_step": 80927, "epoch": 1926} {"train_loss": -6.194455146789551, "global_step": 80928, "epoch": 1926} {"train_loss": -6.155040740966797, "global_step": 80929, "epoch": 1926} {"train_loss": -6.088632583618164, "global_step": 80930, "epoch": 1926} {"train_loss": -6.094130992889404, "global_step": 80931, "epoch": 1926} {"train_loss": -6.149781227111816, "global_step": 80932, "epoch": 1926} {"train_loss": -6.1459613754635765, "global_step": 80933, "epoch": 1926, "val_loss": 75135.3984375} {"train_loss": -6.127497673034668, "global_step": 80934, "epoch": 1927} {"train_loss": -6.1109938621521, "global_step": 80935, "epoch": 1927} {"train_loss": -6.243567943572998, "global_step": 80936, "epoch": 1927} {"train_loss": -6.136568069458008, "global_step": 80937, "epoch": 1927} {"train_loss": -6.246881484985352, "global_step": 80938, "epoch": 1927} {"train_loss": -6.247344493865967, "global_step": 80939, "epoch": 1927} {"train_loss": -6.061244010925293, "global_step": 80940, "epoch": 1927} {"train_loss": -6.162830829620361, "global_step": 80941, "epoch": 1927} {"train_loss": -6.137110233306885, "global_step": 80942, "epoch": 1927} {"train_loss": -5.978253364562988, "global_step": 80943, "epoch": 1927} {"train_loss": -6.123781204223633, "global_step": 80944, "epoch": 1927} {"train_loss": -6.138369560241699, "global_step": 80945, "epoch": 1927} {"train_loss": -6.12922477722168, "global_step": 80946, "epoch": 1927} {"train_loss": -6.127253532409668, "global_step": 80947, "epoch": 1927} {"train_loss": -6.035495281219482, "global_step": 80948, "epoch": 1927} {"train_loss": -5.992247581481934, "global_step": 80949, "epoch": 1927} {"train_loss": -6.054794788360596, "global_step": 80950, "epoch": 1927} {"train_loss": -6.034065246582031, "global_step": 80951, "epoch": 1927} {"train_loss": -6.214481353759766, "global_step": 80952, "epoch": 1927} {"train_loss": -6.125042915344238, "global_step": 80953, "epoch": 1927} {"train_loss": -6.157015800476074, "global_step": 80954, "epoch": 1927} {"train_loss": -5.975022315979004, "global_step": 80955, "epoch": 1927} {"train_loss": -6.197288513183594, "global_step": 80956, "epoch": 1927} {"train_loss": -6.156154632568359, "global_step": 80957, "epoch": 1927} {"train_loss": -6.096587181091309, "global_step": 80958, "epoch": 1927} {"train_loss": -6.1448822021484375, "global_step": 80959, "epoch": 1927} {"train_loss": -6.258463382720947, "global_step": 80960, "epoch": 1927} {"train_loss": -6.166803359985352, "global_step": 80961, "epoch": 1927} {"train_loss": -6.129604339599609, "global_step": 80962, "epoch": 1927} {"train_loss": -6.0247416496276855, "global_step": 80963, "epoch": 1927} {"train_loss": -6.077109336853027, "global_step": 80964, "epoch": 1927} {"train_loss": -6.056180953979492, "global_step": 80965, "epoch": 1927} {"train_loss": -6.166626930236816, "global_step": 80966, "epoch": 1927} {"train_loss": -6.142624855041504, "global_step": 80967, "epoch": 1927} {"train_loss": -6.202694892883301, "global_step": 80968, "epoch": 1927} {"train_loss": -6.222985744476318, "global_step": 80969, "epoch": 1927} {"train_loss": -6.144009590148926, "global_step": 80970, "epoch": 1927} {"train_loss": -6.10463809967041, "global_step": 80971, "epoch": 1927} {"train_loss": -6.143074989318848, "global_step": 80972, "epoch": 1927} {"train_loss": -6.178150177001953, "global_step": 80973, "epoch": 1927} {"train_loss": -6.14961051940918, "global_step": 80974, "epoch": 1927} {"train_loss": -6.13227965718224, "global_step": 80975, "epoch": 1927, "val_loss": 74653.90625} {"train_loss": -6.187382698059082, "global_step": 80976, "epoch": 1928} {"train_loss": -6.138594627380371, "global_step": 80977, "epoch": 1928} {"train_loss": -6.110827922821045, "global_step": 80978, "epoch": 1928} {"train_loss": -6.180775165557861, "global_step": 80979, "epoch": 1928} {"train_loss": -6.266005516052246, "global_step": 80980, "epoch": 1928} {"train_loss": -6.28464412689209, "global_step": 80981, "epoch": 1928} {"train_loss": -6.186642646789551, "global_step": 80982, "epoch": 1928} {"train_loss": -6.294273853302002, "global_step": 80983, "epoch": 1928} {"train_loss": -6.097630500793457, "global_step": 80984, "epoch": 1928} {"train_loss": -6.252302169799805, "global_step": 80985, "epoch": 1928} {"train_loss": -6.302455902099609, "global_step": 80986, "epoch": 1928} {"train_loss": -6.018728256225586, "global_step": 80987, "epoch": 1928} {"train_loss": -6.276524066925049, "global_step": 80988, "epoch": 1928} {"train_loss": -6.191250801086426, "global_step": 80989, "epoch": 1928} {"train_loss": -6.046073913574219, "global_step": 80990, "epoch": 1928} {"train_loss": -6.074930191040039, "global_step": 80991, "epoch": 1928} {"train_loss": -6.206871509552002, "global_step": 80992, "epoch": 1928} {"train_loss": -6.100456714630127, "global_step": 80993, "epoch": 1928} {"train_loss": -6.051006317138672, "global_step": 80994, "epoch": 1928} {"train_loss": -6.206372261047363, "global_step": 80995, "epoch": 1928} {"train_loss": -6.042177200317383, "global_step": 80996, "epoch": 1928} {"train_loss": -6.067649841308594, "global_step": 80997, "epoch": 1928} {"train_loss": -6.037680625915527, "global_step": 80998, "epoch": 1928} {"train_loss": -6.058594226837158, "global_step": 80999, "epoch": 1928} {"train_loss": -6.0696868896484375, "global_step": 81000, "epoch": 1928} {"train_loss": -6.137569904327393, "global_step": 81001, "epoch": 1928} {"train_loss": -6.329274654388428, "global_step": 81002, "epoch": 1928} {"train_loss": -6.1475396156311035, "global_step": 81003, "epoch": 1928} {"train_loss": -6.204744338989258, "global_step": 81004, "epoch": 1928} {"train_loss": -6.266811370849609, "global_step": 81005, "epoch": 1928} {"train_loss": -6.088488578796387, "global_step": 81006, "epoch": 1928} {"train_loss": -6.05978536605835, "global_step": 81007, "epoch": 1928} {"train_loss": -6.112807273864746, "global_step": 81008, "epoch": 1928} {"train_loss": -5.968570232391357, "global_step": 81009, "epoch": 1928} {"train_loss": -6.1122331619262695, "global_step": 81010, "epoch": 1928} {"train_loss": -6.1246113777160645, "global_step": 81011, "epoch": 1928} {"train_loss": -6.140669822692871, "global_step": 81012, "epoch": 1928} {"train_loss": -6.058332443237305, "global_step": 81013, "epoch": 1928} {"train_loss": -6.212953090667725, "global_step": 81014, "epoch": 1928} {"train_loss": -6.105886459350586, "global_step": 81015, "epoch": 1928} {"train_loss": -6.057491302490234, "global_step": 81016, "epoch": 1928} {"train_loss": -6.146669376464117, "global_step": 81017, "epoch": 1928, "val_loss": 75095.34375} {"train_loss": -6.082272529602051, "global_step": 81018, "epoch": 1929} {"train_loss": -6.032207489013672, "global_step": 81019, "epoch": 1929} {"train_loss": -6.165590286254883, "global_step": 81020, "epoch": 1929} {"train_loss": -6.162735462188721, "global_step": 81021, "epoch": 1929} {"train_loss": -6.209521293640137, "global_step": 81022, "epoch": 1929} {"train_loss": -6.176458358764648, "global_step": 81023, "epoch": 1929} {"train_loss": -6.079697132110596, "global_step": 81024, "epoch": 1929} {"train_loss": -6.110475540161133, "global_step": 81025, "epoch": 1929} {"train_loss": -6.239654541015625, "global_step": 81026, "epoch": 1929} {"train_loss": -6.041818618774414, "global_step": 81027, "epoch": 1929} {"train_loss": -6.0695648193359375, "global_step": 81028, "epoch": 1929} {"train_loss": -6.047986030578613, "global_step": 81029, "epoch": 1929} {"train_loss": -6.199090003967285, "global_step": 81030, "epoch": 1929} {"train_loss": -6.146542072296143, "global_step": 81031, "epoch": 1929} {"train_loss": -6.135549068450928, "global_step": 81032, "epoch": 1929} {"train_loss": -6.044466972351074, "global_step": 81033, "epoch": 1929} {"train_loss": -6.13074254989624, "global_step": 81034, "epoch": 1929} {"train_loss": -6.081202507019043, "global_step": 81035, "epoch": 1929} {"train_loss": -6.206327438354492, "global_step": 81036, "epoch": 1929} {"train_loss": -6.017653942108154, "global_step": 81037, "epoch": 1929} {"train_loss": -6.203634738922119, "global_step": 81038, "epoch": 1929} {"train_loss": -6.187061309814453, "global_step": 81039, "epoch": 1929} {"train_loss": -6.15822696685791, "global_step": 81040, "epoch": 1929} {"train_loss": -6.035330772399902, "global_step": 81041, "epoch": 1929} {"train_loss": -6.157380104064941, "global_step": 81042, "epoch": 1929} {"train_loss": -6.21512508392334, "global_step": 81043, "epoch": 1929} {"train_loss": -6.192798614501953, "global_step": 81044, "epoch": 1929} {"train_loss": -6.197453498840332, "global_step": 81045, "epoch": 1929} {"train_loss": -6.029952526092529, "global_step": 81046, "epoch": 1929} {"train_loss": -6.292330741882324, "global_step": 81047, "epoch": 1929} {"train_loss": -6.2421159744262695, "global_step": 81048, "epoch": 1929} {"train_loss": -6.096227645874023, "global_step": 81049, "epoch": 1929} {"train_loss": -6.082884788513184, "global_step": 81050, "epoch": 1929} {"train_loss": -6.262018203735352, "global_step": 81051, "epoch": 1929} {"train_loss": -6.250847816467285, "global_step": 81052, "epoch": 1929} {"train_loss": -6.176431655883789, "global_step": 81053, "epoch": 1929} {"train_loss": -6.169735908508301, "global_step": 81054, "epoch": 1929} {"train_loss": -6.261853218078613, "global_step": 81055, "epoch": 1929} {"train_loss": -6.232372760772705, "global_step": 81056, "epoch": 1929} {"train_loss": -6.09397554397583, "global_step": 81057, "epoch": 1929} {"train_loss": -6.207401752471924, "global_step": 81058, "epoch": 1929} {"train_loss": -6.150374162764776, "global_step": 81059, "epoch": 1929, "val_loss": 74931.7421875} {"train_loss": -6.166572570800781, "global_step": 81060, "epoch": 1930} {"train_loss": -6.252752304077148, "global_step": 81061, "epoch": 1930} {"train_loss": -6.072270393371582, "global_step": 81062, "epoch": 1930} {"train_loss": -6.1305437088012695, "global_step": 81063, "epoch": 1930} {"train_loss": -6.212754249572754, "global_step": 81064, "epoch": 1930} {"train_loss": -6.016025543212891, "global_step": 81065, "epoch": 1930} {"train_loss": -6.03464937210083, "global_step": 81066, "epoch": 1930} {"train_loss": -6.2031941413879395, "global_step": 81067, "epoch": 1930} {"train_loss": -6.205700874328613, "global_step": 81068, "epoch": 1930} {"train_loss": -6.117635726928711, "global_step": 81069, "epoch": 1930} {"train_loss": -6.177584648132324, "global_step": 81070, "epoch": 1930} {"train_loss": -6.1433868408203125, "global_step": 81071, "epoch": 1930} {"train_loss": -6.149839401245117, "global_step": 81072, "epoch": 1930} {"train_loss": -6.129964351654053, "global_step": 81073, "epoch": 1930} {"train_loss": -6.29671573638916, "global_step": 81074, "epoch": 1930} {"train_loss": -6.142369270324707, "global_step": 81075, "epoch": 1930} {"train_loss": -6.089731216430664, "global_step": 81076, "epoch": 1930} {"train_loss": -6.1739068031311035, "global_step": 81077, "epoch": 1930} {"train_loss": -6.088207244873047, "global_step": 81078, "epoch": 1930} {"train_loss": -6.141089916229248, "global_step": 81079, "epoch": 1930} {"train_loss": -6.154688835144043, "global_step": 81080, "epoch": 1930} {"train_loss": -6.110349178314209, "global_step": 81081, "epoch": 1930} {"train_loss": -6.210938453674316, "global_step": 81082, "epoch": 1930} {"train_loss": -6.05232048034668, "global_step": 81083, "epoch": 1930} {"train_loss": -6.190390586853027, "global_step": 81084, "epoch": 1930} {"train_loss": -6.180413246154785, "global_step": 81085, "epoch": 1930} {"train_loss": -6.074640274047852, "global_step": 81086, "epoch": 1930} {"train_loss": -6.213695526123047, "global_step": 81087, "epoch": 1930} {"train_loss": -6.048844337463379, "global_step": 81088, "epoch": 1930} {"train_loss": -6.160930156707764, "global_step": 81089, "epoch": 1930} {"train_loss": -6.164442539215088, "global_step": 81090, "epoch": 1930} {"train_loss": -6.045732498168945, "global_step": 81091, "epoch": 1930} {"train_loss": -6.161147117614746, "global_step": 81092, "epoch": 1930} {"train_loss": -6.08078145980835, "global_step": 81093, "epoch": 1930} {"train_loss": -6.122437477111816, "global_step": 81094, "epoch": 1930} {"train_loss": -5.988683700561523, "global_step": 81095, "epoch": 1930} {"train_loss": -6.016812324523926, "global_step": 81096, "epoch": 1930} {"train_loss": -6.048724174499512, "global_step": 81097, "epoch": 1930} {"train_loss": -6.164862155914307, "global_step": 81098, "epoch": 1930} {"train_loss": -6.14061164855957, "global_step": 81099, "epoch": 1930} {"train_loss": -5.949959754943848, "global_step": 81100, "epoch": 1930} {"train_loss": -6.128162168321156, "global_step": 81101, "epoch": 1930, "val_loss": 74835.046875} {"train_loss": -6.149954795837402, "global_step": 81102, "epoch": 1931} {"train_loss": -6.199808120727539, "global_step": 81103, "epoch": 1931} {"train_loss": -6.274903774261475, "global_step": 81104, "epoch": 1931} {"train_loss": -6.136478424072266, "global_step": 81105, "epoch": 1931} {"train_loss": -6.186222553253174, "global_step": 81106, "epoch": 1931} {"train_loss": -6.311197280883789, "global_step": 81107, "epoch": 1931} {"train_loss": -6.220356464385986, "global_step": 81108, "epoch": 1931} {"train_loss": -6.180578231811523, "global_step": 81109, "epoch": 1931} {"train_loss": -6.24110746383667, "global_step": 81110, "epoch": 1931} {"train_loss": -6.302267074584961, "global_step": 81111, "epoch": 1931} {"train_loss": -6.109177589416504, "global_step": 81112, "epoch": 1931} {"train_loss": -6.179469108581543, "global_step": 81113, "epoch": 1931} {"train_loss": -6.221138954162598, "global_step": 81114, "epoch": 1931} {"train_loss": -6.056148529052734, "global_step": 81115, "epoch": 1931} {"train_loss": -6.155582427978516, "global_step": 81116, "epoch": 1931} {"train_loss": -6.247343063354492, "global_step": 81117, "epoch": 1931} {"train_loss": -6.074406623840332, "global_step": 81118, "epoch": 1931} {"train_loss": -6.185343265533447, "global_step": 81119, "epoch": 1931} {"train_loss": -6.18507719039917, "global_step": 81120, "epoch": 1931} {"train_loss": -6.221550941467285, "global_step": 81121, "epoch": 1931} {"train_loss": -6.130648612976074, "global_step": 81122, "epoch": 1931} {"train_loss": -6.172258377075195, "global_step": 81123, "epoch": 1931} {"train_loss": -6.151054382324219, "global_step": 81124, "epoch": 1931} {"train_loss": -6.149774551391602, "global_step": 81125, "epoch": 1931} {"train_loss": -6.116503715515137, "global_step": 81126, "epoch": 1931} {"train_loss": -6.10823917388916, "global_step": 81127, "epoch": 1931} {"train_loss": -6.102625370025635, "global_step": 81128, "epoch": 1931} {"train_loss": -6.143065452575684, "global_step": 81129, "epoch": 1931} {"train_loss": -6.174589157104492, "global_step": 81130, "epoch": 1931} {"train_loss": -6.130866527557373, "global_step": 81131, "epoch": 1931} {"train_loss": -6.155215263366699, "global_step": 81132, "epoch": 1931} {"train_loss": -6.0955810546875, "global_step": 81133, "epoch": 1931} {"train_loss": -6.162405014038086, "global_step": 81134, "epoch": 1931} {"train_loss": -6.247263431549072, "global_step": 81135, "epoch": 1931} {"train_loss": -6.124742031097412, "global_step": 81136, "epoch": 1931} {"train_loss": -6.089086532592773, "global_step": 81137, "epoch": 1931} {"train_loss": -6.185427188873291, "global_step": 81138, "epoch": 1931} {"train_loss": -6.163119792938232, "global_step": 81139, "epoch": 1931} {"train_loss": -6.151420593261719, "global_step": 81140, "epoch": 1931} {"train_loss": -6.234419822692871, "global_step": 81141, "epoch": 1931} {"train_loss": -5.946035861968994, "global_step": 81142, "epoch": 1931} {"train_loss": -6.163613387516567, "global_step": 81143, "epoch": 1931, "val_loss": 75162.1484375} {"train_loss": -6.214142322540283, "global_step": 81144, "epoch": 1932} {"train_loss": -6.162668704986572, "global_step": 81145, "epoch": 1932} {"train_loss": -6.169931411743164, "global_step": 81146, "epoch": 1932} {"train_loss": -6.167514801025391, "global_step": 81147, "epoch": 1932} {"train_loss": -6.119271755218506, "global_step": 81148, "epoch": 1932} {"train_loss": -6.141602516174316, "global_step": 81149, "epoch": 1932} {"train_loss": -6.0245513916015625, "global_step": 81150, "epoch": 1932} {"train_loss": -6.105457305908203, "global_step": 81151, "epoch": 1932} {"train_loss": -6.1964921951293945, "global_step": 81152, "epoch": 1932} {"train_loss": -6.095649719238281, "global_step": 81153, "epoch": 1932} {"train_loss": -6.046289920806885, "global_step": 81154, "epoch": 1932} {"train_loss": -6.172691345214844, "global_step": 81155, "epoch": 1932} {"train_loss": -6.058724403381348, "global_step": 81156, "epoch": 1932} {"train_loss": -6.13161563873291, "global_step": 81157, "epoch": 1932} {"train_loss": -6.199516296386719, "global_step": 81158, "epoch": 1932} {"train_loss": -6.206457138061523, "global_step": 81159, "epoch": 1932} {"train_loss": -6.105477333068848, "global_step": 81160, "epoch": 1932} {"train_loss": -6.126371383666992, "global_step": 81161, "epoch": 1932} {"train_loss": -6.0429840087890625, "global_step": 81162, "epoch": 1932} {"train_loss": -6.155345916748047, "global_step": 81163, "epoch": 1932} {"train_loss": -6.091485023498535, "global_step": 81164, "epoch": 1932} {"train_loss": -6.130898475646973, "global_step": 81165, "epoch": 1932} {"train_loss": -6.1829094886779785, "global_step": 81166, "epoch": 1932} {"train_loss": -6.17462682723999, "global_step": 81167, "epoch": 1932} {"train_loss": -6.1689558029174805, "global_step": 81168, "epoch": 1932} {"train_loss": -6.141961574554443, "global_step": 81169, "epoch": 1932} {"train_loss": -6.150075912475586, "global_step": 81170, "epoch": 1932} {"train_loss": -6.151374340057373, "global_step": 81171, "epoch": 1932} {"train_loss": -6.244932174682617, "global_step": 81172, "epoch": 1932} {"train_loss": -6.192430019378662, "global_step": 81173, "epoch": 1932} {"train_loss": -6.125223159790039, "global_step": 81174, "epoch": 1932} {"train_loss": -6.159790515899658, "global_step": 81175, "epoch": 1932} {"train_loss": -6.258623123168945, "global_step": 81176, "epoch": 1932} {"train_loss": -6.0881218910217285, "global_step": 81177, "epoch": 1932} {"train_loss": -6.0943803787231445, "global_step": 81178, "epoch": 1932} {"train_loss": -6.112030506134033, "global_step": 81179, "epoch": 1932} {"train_loss": -6.180111408233643, "global_step": 81180, "epoch": 1932} {"train_loss": -6.074029445648193, "global_step": 81181, "epoch": 1932} {"train_loss": -6.0569939613342285, "global_step": 81182, "epoch": 1932} {"train_loss": -5.979311466217041, "global_step": 81183, "epoch": 1932} {"train_loss": -6.105360984802246, "global_step": 81184, "epoch": 1932} {"train_loss": -6.133059319995699, "global_step": 81185, "epoch": 1932, "val_loss": 75195.421875} {"train_loss": -6.069657325744629, "global_step": 81186, "epoch": 1933} {"train_loss": -6.140931129455566, "global_step": 81187, "epoch": 1933} {"train_loss": -6.084307670593262, "global_step": 81188, "epoch": 1933} {"train_loss": -6.128718376159668, "global_step": 81189, "epoch": 1933} {"train_loss": -6.270022392272949, "global_step": 81190, "epoch": 1933} {"train_loss": -6.267238616943359, "global_step": 81191, "epoch": 1933} {"train_loss": -6.178353786468506, "global_step": 81192, "epoch": 1933} {"train_loss": -6.168650150299072, "global_step": 81193, "epoch": 1933} {"train_loss": -6.0905070304870605, "global_step": 81194, "epoch": 1933} {"train_loss": -6.150946617126465, "global_step": 81195, "epoch": 1933} {"train_loss": -6.126748561859131, "global_step": 81196, "epoch": 1933} {"train_loss": -6.223699569702148, "global_step": 81197, "epoch": 1933} {"train_loss": -6.207489967346191, "global_step": 81198, "epoch": 1933} {"train_loss": -6.127250671386719, "global_step": 81199, "epoch": 1933} {"train_loss": -6.145870685577393, "global_step": 81200, "epoch": 1933} {"train_loss": -6.04676628112793, "global_step": 81201, "epoch": 1933} {"train_loss": -6.199359893798828, "global_step": 81202, "epoch": 1933} {"train_loss": -6.158329010009766, "global_step": 81203, "epoch": 1933} {"train_loss": -6.035962104797363, "global_step": 81204, "epoch": 1933} {"train_loss": -6.090327739715576, "global_step": 81205, "epoch": 1933} {"train_loss": -6.063279151916504, "global_step": 81206, "epoch": 1933} {"train_loss": -6.152895927429199, "global_step": 81207, "epoch": 1933} {"train_loss": -5.994931697845459, "global_step": 81208, "epoch": 1933} {"train_loss": -5.9788103103637695, "global_step": 81209, "epoch": 1933} {"train_loss": -6.121466636657715, "global_step": 81210, "epoch": 1933} {"train_loss": -6.240598678588867, "global_step": 81211, "epoch": 1933} {"train_loss": -6.142279148101807, "global_step": 81212, "epoch": 1933} {"train_loss": -6.089272499084473, "global_step": 81213, "epoch": 1933} {"train_loss": -6.286211013793945, "global_step": 81214, "epoch": 1933} {"train_loss": -6.140959739685059, "global_step": 81215, "epoch": 1933} {"train_loss": -6.108431816101074, "global_step": 81216, "epoch": 1933} {"train_loss": -5.928252220153809, "global_step": 81217, "epoch": 1933} {"train_loss": -6.0078630447387695, "global_step": 81218, "epoch": 1933} {"train_loss": -6.163846969604492, "global_step": 81219, "epoch": 1933} {"train_loss": -6.1077117919921875, "global_step": 81220, "epoch": 1933} {"train_loss": -6.155316352844238, "global_step": 81221, "epoch": 1933} {"train_loss": -6.012944221496582, "global_step": 81222, "epoch": 1933} {"train_loss": -6.1266326904296875, "global_step": 81223, "epoch": 1933} {"train_loss": -6.130796432495117, "global_step": 81224, "epoch": 1933} {"train_loss": -6.193864345550537, "global_step": 81225, "epoch": 1933} {"train_loss": -6.174568176269531, "global_step": 81226, "epoch": 1933} {"train_loss": -6.128651482718332, "global_step": 81227, "epoch": 1933, "val_loss": 75083.21875} {"train_loss": -6.148520469665527, "global_step": 81228, "epoch": 1934} {"train_loss": -6.178624153137207, "global_step": 81229, "epoch": 1934} {"train_loss": -6.12799072265625, "global_step": 81230, "epoch": 1934} {"train_loss": -6.132175445556641, "global_step": 81231, "epoch": 1934} {"train_loss": -6.05436897277832, "global_step": 81232, "epoch": 1934} {"train_loss": -6.248148441314697, "global_step": 81233, "epoch": 1934} {"train_loss": -6.291295051574707, "global_step": 81234, "epoch": 1934} {"train_loss": -6.085389137268066, "global_step": 81235, "epoch": 1934} {"train_loss": -6.178447246551514, "global_step": 81236, "epoch": 1934} {"train_loss": -6.28265380859375, "global_step": 81237, "epoch": 1934} {"train_loss": -6.233415126800537, "global_step": 81238, "epoch": 1934} {"train_loss": -6.25213623046875, "global_step": 81239, "epoch": 1934} {"train_loss": -6.186483383178711, "global_step": 81240, "epoch": 1934} {"train_loss": -6.16495418548584, "global_step": 81241, "epoch": 1934} {"train_loss": -6.174161911010742, "global_step": 81242, "epoch": 1934} {"train_loss": -6.272510051727295, "global_step": 81243, "epoch": 1934} {"train_loss": -6.199100494384766, "global_step": 81244, "epoch": 1934} {"train_loss": -6.229420185089111, "global_step": 81245, "epoch": 1934} {"train_loss": -6.134051322937012, "global_step": 81246, "epoch": 1934} {"train_loss": -6.252631187438965, "global_step": 81247, "epoch": 1934} {"train_loss": -6.122637748718262, "global_step": 81248, "epoch": 1934} {"train_loss": -6.201566696166992, "global_step": 81249, "epoch": 1934} {"train_loss": -6.1210856437683105, "global_step": 81250, "epoch": 1934} {"train_loss": -6.090705871582031, "global_step": 81251, "epoch": 1934} {"train_loss": -6.269461631774902, "global_step": 81252, "epoch": 1934} {"train_loss": -6.179925918579102, "global_step": 81253, "epoch": 1934} {"train_loss": -6.105989933013916, "global_step": 81254, "epoch": 1934} {"train_loss": -6.246266841888428, "global_step": 81255, "epoch": 1934} {"train_loss": -6.166386127471924, "global_step": 81256, "epoch": 1934} {"train_loss": -6.171535491943359, "global_step": 81257, "epoch": 1934} {"train_loss": -6.173131942749023, "global_step": 81258, "epoch": 1934} {"train_loss": -6.125699520111084, "global_step": 81259, "epoch": 1934} {"train_loss": -6.139249801635742, "global_step": 81260, "epoch": 1934} {"train_loss": -6.130208969116211, "global_step": 81261, "epoch": 1934} {"train_loss": -6.065190315246582, "global_step": 81262, "epoch": 1934} {"train_loss": -6.131649971008301, "global_step": 81263, "epoch": 1934} {"train_loss": -6.229898452758789, "global_step": 81264, "epoch": 1934} {"train_loss": -6.161809921264648, "global_step": 81265, "epoch": 1934} {"train_loss": -6.055141448974609, "global_step": 81266, "epoch": 1934} {"train_loss": -6.17767333984375, "global_step": 81267, "epoch": 1934} {"train_loss": -6.290889263153076, "global_step": 81268, "epoch": 1934} {"train_loss": -6.172572976066952, "global_step": 81269, "epoch": 1934, "val_loss": 74997.8984375} {"train_loss": -6.272409915924072, "global_step": 81270, "epoch": 1935} {"train_loss": -6.330687046051025, "global_step": 81271, "epoch": 1935} {"train_loss": -6.209537029266357, "global_step": 81272, "epoch": 1935} {"train_loss": -6.103326320648193, "global_step": 81273, "epoch": 1935} {"train_loss": -6.165828704833984, "global_step": 81274, "epoch": 1935} {"train_loss": -6.148229598999023, "global_step": 81275, "epoch": 1935} {"train_loss": -6.1441850662231445, "global_step": 81276, "epoch": 1935} {"train_loss": -6.173412799835205, "global_step": 81277, "epoch": 1935} {"train_loss": -6.0816240310668945, "global_step": 81278, "epoch": 1935} {"train_loss": -6.191091060638428, "global_step": 81279, "epoch": 1935} {"train_loss": -6.155600547790527, "global_step": 81280, "epoch": 1935} {"train_loss": -6.174497604370117, "global_step": 81281, "epoch": 1935} {"train_loss": -6.1302690505981445, "global_step": 81282, "epoch": 1935} {"train_loss": -6.196987152099609, "global_step": 81283, "epoch": 1935} {"train_loss": -6.157144069671631, "global_step": 81284, "epoch": 1935} {"train_loss": -6.188693523406982, "global_step": 81285, "epoch": 1935} {"train_loss": -6.0454325675964355, "global_step": 81286, "epoch": 1935} {"train_loss": -6.16117000579834, "global_step": 81287, "epoch": 1935} {"train_loss": -6.107621192932129, "global_step": 81288, "epoch": 1935} {"train_loss": -6.139230728149414, "global_step": 81289, "epoch": 1935} {"train_loss": -6.161028861999512, "global_step": 81290, "epoch": 1935} {"train_loss": -6.1430134773254395, "global_step": 81291, "epoch": 1935} {"train_loss": -6.218830108642578, "global_step": 81292, "epoch": 1935} {"train_loss": -6.133084297180176, "global_step": 81293, "epoch": 1935} {"train_loss": -6.049297332763672, "global_step": 81294, "epoch": 1935} {"train_loss": -6.148561477661133, "global_step": 81295, "epoch": 1935} {"train_loss": -6.134766101837158, "global_step": 81296, "epoch": 1935} {"train_loss": -6.078406810760498, "global_step": 81297, "epoch": 1935} {"train_loss": -6.217238426208496, "global_step": 81298, "epoch": 1935} {"train_loss": -6.121695518493652, "global_step": 81299, "epoch": 1935} {"train_loss": -6.172870635986328, "global_step": 81300, "epoch": 1935} {"train_loss": -6.068417072296143, "global_step": 81301, "epoch": 1935} {"train_loss": -6.13969612121582, "global_step": 81302, "epoch": 1935} {"train_loss": -6.180840492248535, "global_step": 81303, "epoch": 1935} {"train_loss": -6.244063854217529, "global_step": 81304, "epoch": 1935} {"train_loss": -6.1230058670043945, "global_step": 81305, "epoch": 1935} {"train_loss": -6.177845001220703, "global_step": 81306, "epoch": 1935} {"train_loss": -6.020816326141357, "global_step": 81307, "epoch": 1935} {"train_loss": -6.181699275970459, "global_step": 81308, "epoch": 1935} {"train_loss": -6.070773124694824, "global_step": 81309, "epoch": 1935} {"train_loss": -6.151370525360107, "global_step": 81310, "epoch": 1935} {"train_loss": -6.148614247639974, "global_step": 81311, "epoch": 1935, "val_loss": 75078.71875} {"train_loss": -6.088583469390869, "global_step": 81312, "epoch": 1936} {"train_loss": -6.140566825866699, "global_step": 81313, "epoch": 1936} {"train_loss": -6.099944591522217, "global_step": 81314, "epoch": 1936} {"train_loss": -6.019989013671875, "global_step": 81315, "epoch": 1936} {"train_loss": -6.150485992431641, "global_step": 81316, "epoch": 1936} {"train_loss": -6.024411678314209, "global_step": 81317, "epoch": 1936} {"train_loss": -6.086524963378906, "global_step": 81318, "epoch": 1936} {"train_loss": -6.117639064788818, "global_step": 81319, "epoch": 1936} {"train_loss": -6.186189651489258, "global_step": 81320, "epoch": 1936} {"train_loss": -6.209453105926514, "global_step": 81321, "epoch": 1936} {"train_loss": -6.058536529541016, "global_step": 81322, "epoch": 1936} {"train_loss": -6.224864482879639, "global_step": 81323, "epoch": 1936} {"train_loss": -6.1386518478393555, "global_step": 81324, "epoch": 1936} {"train_loss": -6.182943344116211, "global_step": 81325, "epoch": 1936} {"train_loss": -6.118999004364014, "global_step": 81326, "epoch": 1936} {"train_loss": -6.182660102844238, "global_step": 81327, "epoch": 1936} {"train_loss": -6.229083061218262, "global_step": 81328, "epoch": 1936} {"train_loss": -6.178535461425781, "global_step": 81329, "epoch": 1936} {"train_loss": -6.170896530151367, "global_step": 81330, "epoch": 1936} {"train_loss": -6.171194076538086, "global_step": 81331, "epoch": 1936} {"train_loss": -6.199428558349609, "global_step": 81332, "epoch": 1936} {"train_loss": -6.131705284118652, "global_step": 81333, "epoch": 1936} {"train_loss": -6.108155250549316, "global_step": 81334, "epoch": 1936} {"train_loss": -6.2973198890686035, "global_step": 81335, "epoch": 1936} {"train_loss": -6.1338911056518555, "global_step": 81336, "epoch": 1936} {"train_loss": -6.203774929046631, "global_step": 81337, "epoch": 1936} {"train_loss": -6.276324272155762, "global_step": 81338, "epoch": 1936} {"train_loss": -6.04154109954834, "global_step": 81339, "epoch": 1936} {"train_loss": -6.254745006561279, "global_step": 81340, "epoch": 1936} {"train_loss": -6.186363697052002, "global_step": 81341, "epoch": 1936} {"train_loss": -6.0767974853515625, "global_step": 81342, "epoch": 1936} {"train_loss": -6.205852508544922, "global_step": 81343, "epoch": 1936} {"train_loss": -6.292108535766602, "global_step": 81344, "epoch": 1936} {"train_loss": -6.129452228546143, "global_step": 81345, "epoch": 1936} {"train_loss": -6.1113409996032715, "global_step": 81346, "epoch": 1936} {"train_loss": -6.207690238952637, "global_step": 81347, "epoch": 1936} {"train_loss": -6.157140731811523, "global_step": 81348, "epoch": 1936} {"train_loss": -6.142404556274414, "global_step": 81349, "epoch": 1936} {"train_loss": -6.088639259338379, "global_step": 81350, "epoch": 1936} {"train_loss": -6.208529472351074, "global_step": 81351, "epoch": 1936} {"train_loss": -6.16174840927124, "global_step": 81352, "epoch": 1936} {"train_loss": -6.156468981788272, "global_step": 81353, "epoch": 1936, "val_loss": 74958.8125} {"train_loss": -6.066402912139893, "global_step": 81354, "epoch": 1937} {"train_loss": -6.106237411499023, "global_step": 81355, "epoch": 1937} {"train_loss": -6.079073905944824, "global_step": 81356, "epoch": 1937} {"train_loss": -6.100215911865234, "global_step": 81357, "epoch": 1937} {"train_loss": -6.009820938110352, "global_step": 81358, "epoch": 1937} {"train_loss": -6.148266315460205, "global_step": 81359, "epoch": 1937} {"train_loss": -6.156191825866699, "global_step": 81360, "epoch": 1937} {"train_loss": -6.219965934753418, "global_step": 81361, "epoch": 1937} {"train_loss": -6.103042125701904, "global_step": 81362, "epoch": 1937} {"train_loss": -6.190868377685547, "global_step": 81363, "epoch": 1937} {"train_loss": -6.149868011474609, "global_step": 81364, "epoch": 1937} {"train_loss": -6.030345916748047, "global_step": 81365, "epoch": 1937} {"train_loss": -6.137552261352539, "global_step": 81366, "epoch": 1937} {"train_loss": -6.0649566650390625, "global_step": 81367, "epoch": 1937} {"train_loss": -6.163026809692383, "global_step": 81368, "epoch": 1937} {"train_loss": -6.182957172393799, "global_step": 81369, "epoch": 1937} {"train_loss": -6.181062698364258, "global_step": 81370, "epoch": 1937} {"train_loss": -6.124228477478027, "global_step": 81371, "epoch": 1937} {"train_loss": -6.080332279205322, "global_step": 81372, "epoch": 1937} {"train_loss": -6.116748809814453, "global_step": 81373, "epoch": 1937} {"train_loss": -6.2190446853637695, "global_step": 81374, "epoch": 1937} {"train_loss": -6.122559070587158, "global_step": 81375, "epoch": 1937} {"train_loss": -6.181549072265625, "global_step": 81376, "epoch": 1937} {"train_loss": -6.097413063049316, "global_step": 81377, "epoch": 1937} {"train_loss": -6.0900983810424805, "global_step": 81378, "epoch": 1937} {"train_loss": -6.149250507354736, "global_step": 81379, "epoch": 1937} {"train_loss": -6.227062225341797, "global_step": 81380, "epoch": 1937} {"train_loss": -6.23225736618042, "global_step": 81381, "epoch": 1937} {"train_loss": -6.162325382232666, "global_step": 81382, "epoch": 1937} {"train_loss": -6.121910095214844, "global_step": 81383, "epoch": 1937} {"train_loss": -6.057494163513184, "global_step": 81384, "epoch": 1937} {"train_loss": -6.140089988708496, "global_step": 81385, "epoch": 1937} {"train_loss": -6.200735092163086, "global_step": 81386, "epoch": 1937} {"train_loss": -6.159938812255859, "global_step": 81387, "epoch": 1937} {"train_loss": -6.196743011474609, "global_step": 81388, "epoch": 1937} {"train_loss": -6.129769325256348, "global_step": 81389, "epoch": 1937} {"train_loss": -6.210027694702148, "global_step": 81390, "epoch": 1937} {"train_loss": -6.142861366271973, "global_step": 81391, "epoch": 1937} {"train_loss": -6.176631927490234, "global_step": 81392, "epoch": 1937} {"train_loss": -6.194772720336914, "global_step": 81393, "epoch": 1937} {"train_loss": -6.1135663986206055, "global_step": 81394, "epoch": 1937} {"train_loss": -6.143100965590704, "global_step": 81395, "epoch": 1937, "val_loss": 74920.5625} {"train_loss": -6.113222599029541, "global_step": 81396, "epoch": 1938} {"train_loss": -6.148591995239258, "global_step": 81397, "epoch": 1938} {"train_loss": -6.106507301330566, "global_step": 81398, "epoch": 1938} {"train_loss": -6.269374847412109, "global_step": 81399, "epoch": 1938} {"train_loss": -6.115970611572266, "global_step": 81400, "epoch": 1938} {"train_loss": -6.15889310836792, "global_step": 81401, "epoch": 1938} {"train_loss": -6.161496162414551, "global_step": 81402, "epoch": 1938} {"train_loss": -6.124678134918213, "global_step": 81403, "epoch": 1938} {"train_loss": -6.163081645965576, "global_step": 81404, "epoch": 1938} {"train_loss": -6.046553611755371, "global_step": 81405, "epoch": 1938} {"train_loss": -6.060589790344238, "global_step": 81406, "epoch": 1938} {"train_loss": -6.203461647033691, "global_step": 81407, "epoch": 1938} {"train_loss": -6.1426544189453125, "global_step": 81408, "epoch": 1938} {"train_loss": -6.1620306968688965, "global_step": 81409, "epoch": 1938} {"train_loss": -6.175961971282959, "global_step": 81410, "epoch": 1938} {"train_loss": -6.172310829162598, "global_step": 81411, "epoch": 1938} {"train_loss": -6.173251628875732, "global_step": 81412, "epoch": 1938} {"train_loss": -6.1575608253479, "global_step": 81413, "epoch": 1938} {"train_loss": -6.148112773895264, "global_step": 81414, "epoch": 1938} {"train_loss": -6.154417037963867, "global_step": 81415, "epoch": 1938} {"train_loss": -5.9814453125, "global_step": 81416, "epoch": 1938} {"train_loss": -6.086682319641113, "global_step": 81417, "epoch": 1938} {"train_loss": -6.114121437072754, "global_step": 81418, "epoch": 1938} {"train_loss": -6.127318382263184, "global_step": 81419, "epoch": 1938} {"train_loss": -6.162111282348633, "global_step": 81420, "epoch": 1938} {"train_loss": -6.198823928833008, "global_step": 81421, "epoch": 1938} {"train_loss": -6.140748977661133, "global_step": 81422, "epoch": 1938} {"train_loss": -6.107905387878418, "global_step": 81423, "epoch": 1938} {"train_loss": -6.259613037109375, "global_step": 81424, "epoch": 1938} {"train_loss": -6.149544715881348, "global_step": 81425, "epoch": 1938} {"train_loss": -6.189674377441406, "global_step": 81426, "epoch": 1938} {"train_loss": -6.1173295974731445, "global_step": 81427, "epoch": 1938} {"train_loss": -6.188176155090332, "global_step": 81428, "epoch": 1938} {"train_loss": -6.2321929931640625, "global_step": 81429, "epoch": 1938} {"train_loss": -6.104592800140381, "global_step": 81430, "epoch": 1938} {"train_loss": -6.227709770202637, "global_step": 81431, "epoch": 1938} {"train_loss": -6.1139092445373535, "global_step": 81432, "epoch": 1938} {"train_loss": -6.045415878295898, "global_step": 81433, "epoch": 1938} {"train_loss": -6.11067533493042, "global_step": 81434, "epoch": 1938} {"train_loss": -6.165333271026611, "global_step": 81435, "epoch": 1938} {"train_loss": -6.084025859832764, "global_step": 81436, "epoch": 1938} {"train_loss": -6.144699051266625, "global_step": 81437, "epoch": 1938, "val_loss": 74951.78125} {"train_loss": -6.139427661895752, "global_step": 81438, "epoch": 1939} {"train_loss": -6.066926002502441, "global_step": 81439, "epoch": 1939} {"train_loss": -6.22159481048584, "global_step": 81440, "epoch": 1939} {"train_loss": -6.1926493644714355, "global_step": 81441, "epoch": 1939} {"train_loss": -6.065342903137207, "global_step": 81442, "epoch": 1939} {"train_loss": -6.055782794952393, "global_step": 81443, "epoch": 1939} {"train_loss": -5.927568435668945, "global_step": 81444, "epoch": 1939} {"train_loss": -6.15920877456665, "global_step": 81445, "epoch": 1939} {"train_loss": -6.164404392242432, "global_step": 81446, "epoch": 1939} {"train_loss": -6.232024669647217, "global_step": 81447, "epoch": 1939} {"train_loss": -6.121635437011719, "global_step": 81448, "epoch": 1939} {"train_loss": -6.200479984283447, "global_step": 81449, "epoch": 1939} {"train_loss": -6.077165126800537, "global_step": 81450, "epoch": 1939} {"train_loss": -6.167304039001465, "global_step": 81451, "epoch": 1939} {"train_loss": -6.08509635925293, "global_step": 81452, "epoch": 1939} {"train_loss": -6.130261421203613, "global_step": 81453, "epoch": 1939} {"train_loss": -6.111337184906006, "global_step": 81454, "epoch": 1939} {"train_loss": -6.158339023590088, "global_step": 81455, "epoch": 1939} {"train_loss": -6.076967239379883, "global_step": 81456, "epoch": 1939} {"train_loss": -6.100250244140625, "global_step": 81457, "epoch": 1939} {"train_loss": -6.166641712188721, "global_step": 81458, "epoch": 1939} {"train_loss": -6.111042022705078, "global_step": 81459, "epoch": 1939} {"train_loss": -6.094185829162598, "global_step": 81460, "epoch": 1939} {"train_loss": -6.089573383331299, "global_step": 81461, "epoch": 1939} {"train_loss": -6.166069030761719, "global_step": 81462, "epoch": 1939} {"train_loss": -6.102383613586426, "global_step": 81463, "epoch": 1939} {"train_loss": -6.164693355560303, "global_step": 81464, "epoch": 1939} {"train_loss": -6.129295825958252, "global_step": 81465, "epoch": 1939} {"train_loss": -6.298255920410156, "global_step": 81466, "epoch": 1939} {"train_loss": -6.006137847900391, "global_step": 81467, "epoch": 1939} {"train_loss": -6.074469566345215, "global_step": 81468, "epoch": 1939} {"train_loss": -6.284237861633301, "global_step": 81469, "epoch": 1939} {"train_loss": -6.123193740844727, "global_step": 81470, "epoch": 1939} {"train_loss": -6.17447566986084, "global_step": 81471, "epoch": 1939} {"train_loss": -6.144644737243652, "global_step": 81472, "epoch": 1939} {"train_loss": -6.149682998657227, "global_step": 81473, "epoch": 1939} {"train_loss": -6.196773052215576, "global_step": 81474, "epoch": 1939} {"train_loss": -6.203536510467529, "global_step": 81475, "epoch": 1939} {"train_loss": -6.267475128173828, "global_step": 81476, "epoch": 1939} {"train_loss": -6.2060227394104, "global_step": 81477, "epoch": 1939} {"train_loss": -6.213968276977539, "global_step": 81478, "epoch": 1939} {"train_loss": -6.141146273840041, "global_step": 81479, "epoch": 1939, "val_loss": 75427.0546875} {"train_loss": -6.131940841674805, "global_step": 81480, "epoch": 1940} {"train_loss": -6.144347190856934, "global_step": 81481, "epoch": 1940} {"train_loss": -6.150463581085205, "global_step": 81482, "epoch": 1940} {"train_loss": -6.184537887573242, "global_step": 81483, "epoch": 1940} {"train_loss": -6.1502227783203125, "global_step": 81484, "epoch": 1940} {"train_loss": -6.074888706207275, "global_step": 81485, "epoch": 1940} {"train_loss": -6.118645668029785, "global_step": 81486, "epoch": 1940} {"train_loss": -6.190171718597412, "global_step": 81487, "epoch": 1940} {"train_loss": -6.133082866668701, "global_step": 81488, "epoch": 1940} {"train_loss": -6.066764831542969, "global_step": 81489, "epoch": 1940} {"train_loss": -5.995080947875977, "global_step": 81490, "epoch": 1940} {"train_loss": -6.070276737213135, "global_step": 81491, "epoch": 1940} {"train_loss": -6.208239555358887, "global_step": 81492, "epoch": 1940} {"train_loss": -6.1063079833984375, "global_step": 81493, "epoch": 1940} {"train_loss": -6.197267055511475, "global_step": 81494, "epoch": 1940} {"train_loss": -6.07911491394043, "global_step": 81495, "epoch": 1940} {"train_loss": -6.079134464263916, "global_step": 81496, "epoch": 1940} {"train_loss": -6.1512956619262695, "global_step": 81497, "epoch": 1940} {"train_loss": -6.136768817901611, "global_step": 81498, "epoch": 1940} {"train_loss": -6.075953483581543, "global_step": 81499, "epoch": 1940} {"train_loss": -6.182212829589844, "global_step": 81500, "epoch": 1940} {"train_loss": -6.13346004486084, "global_step": 81501, "epoch": 1940} {"train_loss": -6.1482086181640625, "global_step": 81502, "epoch": 1940} {"train_loss": -6.160697937011719, "global_step": 81503, "epoch": 1940} {"train_loss": -6.063043594360352, "global_step": 81504, "epoch": 1940} {"train_loss": -6.150421619415283, "global_step": 81505, "epoch": 1940} {"train_loss": -6.020705699920654, "global_step": 81506, "epoch": 1940} {"train_loss": -6.030617713928223, "global_step": 81507, "epoch": 1940} {"train_loss": -6.273219108581543, "global_step": 81508, "epoch": 1940} {"train_loss": -6.026409149169922, "global_step": 81509, "epoch": 1940} {"train_loss": -6.092350959777832, "global_step": 81510, "epoch": 1940} {"train_loss": -6.227998733520508, "global_step": 81511, "epoch": 1940} {"train_loss": -5.975496292114258, "global_step": 81512, "epoch": 1940} {"train_loss": -6.011076927185059, "global_step": 81513, "epoch": 1940} {"train_loss": -6.085235595703125, "global_step": 81514, "epoch": 1940} {"train_loss": -6.146705627441406, "global_step": 81515, "epoch": 1940} {"train_loss": -5.924980163574219, "global_step": 81516, "epoch": 1940} {"train_loss": -6.10997200012207, "global_step": 81517, "epoch": 1940} {"train_loss": -6.101302623748779, "global_step": 81518, "epoch": 1940} {"train_loss": -6.077126502990723, "global_step": 81519, "epoch": 1940} {"train_loss": -6.138738632202148, "global_step": 81520, "epoch": 1940} {"train_loss": -6.110320772443499, "global_step": 81521, "epoch": 1940, "val_loss": 75632.421875} {"train_loss": -6.030318737030029, "global_step": 81522, "epoch": 1941} {"train_loss": -6.061672210693359, "global_step": 81523, "epoch": 1941} {"train_loss": -5.930448532104492, "global_step": 81524, "epoch": 1941} {"train_loss": -6.049871921539307, "global_step": 81525, "epoch": 1941} {"train_loss": -6.198379039764404, "global_step": 81526, "epoch": 1941} {"train_loss": -5.954414367675781, "global_step": 81527, "epoch": 1941} {"train_loss": -6.121756076812744, "global_step": 81528, "epoch": 1941} {"train_loss": -6.093649864196777, "global_step": 81529, "epoch": 1941} {"train_loss": -6.1974663734436035, "global_step": 81530, "epoch": 1941} {"train_loss": -6.181870460510254, "global_step": 81531, "epoch": 1941} {"train_loss": -6.208075523376465, "global_step": 81532, "epoch": 1941} {"train_loss": -6.182839870452881, "global_step": 81533, "epoch": 1941} {"train_loss": -5.995490074157715, "global_step": 81534, "epoch": 1941} {"train_loss": -6.213406085968018, "global_step": 81535, "epoch": 1941} {"train_loss": -6.1464715003967285, "global_step": 81536, "epoch": 1941} {"train_loss": -6.222268104553223, "global_step": 81537, "epoch": 1941} {"train_loss": -6.119246959686279, "global_step": 81538, "epoch": 1941} {"train_loss": -6.332531929016113, "global_step": 81539, "epoch": 1941} {"train_loss": -6.176707744598389, "global_step": 81540, "epoch": 1941} {"train_loss": -6.222228050231934, "global_step": 81541, "epoch": 1941} {"train_loss": -6.138359069824219, "global_step": 81542, "epoch": 1941} {"train_loss": -6.203055381774902, "global_step": 81543, "epoch": 1941} {"train_loss": -6.167392730712891, "global_step": 81544, "epoch": 1941} {"train_loss": -6.248592376708984, "global_step": 81545, "epoch": 1941} {"train_loss": -6.237834453582764, "global_step": 81546, "epoch": 1941} {"train_loss": -6.074824333190918, "global_step": 81547, "epoch": 1941} {"train_loss": -6.181567668914795, "global_step": 81548, "epoch": 1941} {"train_loss": -6.2152557373046875, "global_step": 81549, "epoch": 1941} {"train_loss": -6.224270820617676, "global_step": 81550, "epoch": 1941} {"train_loss": -6.167217254638672, "global_step": 81551, "epoch": 1941} {"train_loss": -6.179871559143066, "global_step": 81552, "epoch": 1941} {"train_loss": -6.016957759857178, "global_step": 81553, "epoch": 1941} {"train_loss": -6.279848098754883, "global_step": 81554, "epoch": 1941} {"train_loss": -6.14140510559082, "global_step": 81555, "epoch": 1941} {"train_loss": -6.202322959899902, "global_step": 81556, "epoch": 1941} {"train_loss": -6.049491882324219, "global_step": 81557, "epoch": 1941} {"train_loss": -6.179864406585693, "global_step": 81558, "epoch": 1941} {"train_loss": -6.133210182189941, "global_step": 81559, "epoch": 1941} {"train_loss": -6.060744285583496, "global_step": 81560, "epoch": 1941} {"train_loss": -6.024759292602539, "global_step": 81561, "epoch": 1941} {"train_loss": -6.13853645324707, "global_step": 81562, "epoch": 1941} {"train_loss": -6.141362780616397, "global_step": 81563, "epoch": 1941, "val_loss": 75544.171875} {"train_loss": -6.102327346801758, "global_step": 81564, "epoch": 1942} {"train_loss": -6.0905632972717285, "global_step": 81565, "epoch": 1942} {"train_loss": -6.196108341217041, "global_step": 81566, "epoch": 1942} {"train_loss": -6.1384124755859375, "global_step": 81567, "epoch": 1942} {"train_loss": -6.2209062576293945, "global_step": 81568, "epoch": 1942} {"train_loss": -6.203595161437988, "global_step": 81569, "epoch": 1942} {"train_loss": -6.038969039916992, "global_step": 81570, "epoch": 1942} {"train_loss": -6.210938453674316, "global_step": 81571, "epoch": 1942} {"train_loss": -6.194340705871582, "global_step": 81572, "epoch": 1942} {"train_loss": -6.152612686157227, "global_step": 81573, "epoch": 1942} {"train_loss": -6.208189964294434, "global_step": 81574, "epoch": 1942} {"train_loss": -6.0359954833984375, "global_step": 81575, "epoch": 1942} {"train_loss": -6.202309608459473, "global_step": 81576, "epoch": 1942} {"train_loss": -6.339189529418945, "global_step": 81577, "epoch": 1942} {"train_loss": -6.150121688842773, "global_step": 81578, "epoch": 1942} {"train_loss": -6.198885917663574, "global_step": 81579, "epoch": 1942} {"train_loss": -6.250456809997559, "global_step": 81580, "epoch": 1942} {"train_loss": -6.286823272705078, "global_step": 81581, "epoch": 1942} {"train_loss": -6.078343391418457, "global_step": 81582, "epoch": 1942} {"train_loss": -6.285196304321289, "global_step": 81583, "epoch": 1942} {"train_loss": -6.06771183013916, "global_step": 81584, "epoch": 1942} {"train_loss": -6.138298034667969, "global_step": 81585, "epoch": 1942} {"train_loss": -6.076787948608398, "global_step": 81586, "epoch": 1942} {"train_loss": -6.038888931274414, "global_step": 81587, "epoch": 1942} {"train_loss": -6.1737799644470215, "global_step": 81588, "epoch": 1942} {"train_loss": -6.137160778045654, "global_step": 81589, "epoch": 1942} {"train_loss": -6.139962196350098, "global_step": 81590, "epoch": 1942} {"train_loss": -6.042047500610352, "global_step": 81591, "epoch": 1942} {"train_loss": -6.144115924835205, "global_step": 81592, "epoch": 1942} {"train_loss": -6.0270490646362305, "global_step": 81593, "epoch": 1942} {"train_loss": -6.196163654327393, "global_step": 81594, "epoch": 1942} {"train_loss": -6.164728164672852, "global_step": 81595, "epoch": 1942} {"train_loss": -6.15949010848999, "global_step": 81596, "epoch": 1942} {"train_loss": -6.153965950012207, "global_step": 81597, "epoch": 1942} {"train_loss": -6.2212419509887695, "global_step": 81598, "epoch": 1942} {"train_loss": -6.235973358154297, "global_step": 81599, "epoch": 1942} {"train_loss": -6.147231578826904, "global_step": 81600, "epoch": 1942} {"train_loss": -6.150906562805176, "global_step": 81601, "epoch": 1942} {"train_loss": -6.172048568725586, "global_step": 81602, "epoch": 1942} {"train_loss": -6.142415523529053, "global_step": 81603, "epoch": 1942} {"train_loss": -6.286759376525879, "global_step": 81604, "epoch": 1942} {"train_loss": -6.163012981414795, "global_step": 81605, "epoch": 1942, "val_loss": 75279.1953125} {"train_loss": -6.068889617919922, "global_step": 81606, "epoch": 1943} {"train_loss": -6.183680534362793, "global_step": 81607, "epoch": 1943} {"train_loss": -6.134858131408691, "global_step": 81608, "epoch": 1943} {"train_loss": -6.143986701965332, "global_step": 81609, "epoch": 1943} {"train_loss": -6.190427303314209, "global_step": 81610, "epoch": 1943} {"train_loss": -6.1464033126831055, "global_step": 81611, "epoch": 1943} {"train_loss": -6.113961219787598, "global_step": 81612, "epoch": 1943} {"train_loss": -6.217198371887207, "global_step": 81613, "epoch": 1943} {"train_loss": -6.0486297607421875, "global_step": 81614, "epoch": 1943} {"train_loss": -6.164514064788818, "global_step": 81615, "epoch": 1943} {"train_loss": -6.16337776184082, "global_step": 81616, "epoch": 1943} {"train_loss": -6.157585144042969, "global_step": 81617, "epoch": 1943} {"train_loss": -6.185169219970703, "global_step": 81618, "epoch": 1943} {"train_loss": -6.155624866485596, "global_step": 81619, "epoch": 1943} {"train_loss": -6.131879806518555, "global_step": 81620, "epoch": 1943} {"train_loss": -6.161149501800537, "global_step": 81621, "epoch": 1943} {"train_loss": -6.030572891235352, "global_step": 81622, "epoch": 1943} {"train_loss": -6.127321243286133, "global_step": 81623, "epoch": 1943} {"train_loss": -6.076572895050049, "global_step": 81624, "epoch": 1943} {"train_loss": -6.050923824310303, "global_step": 81625, "epoch": 1943} {"train_loss": -6.178930759429932, "global_step": 81626, "epoch": 1943} {"train_loss": -6.027219772338867, "global_step": 81627, "epoch": 1943} {"train_loss": -5.9258503913879395, "global_step": 81628, "epoch": 1943} {"train_loss": -6.158998489379883, "global_step": 81629, "epoch": 1943} {"train_loss": -6.118769645690918, "global_step": 81630, "epoch": 1943} {"train_loss": -5.957508087158203, "global_step": 81631, "epoch": 1943} {"train_loss": -6.093074798583984, "global_step": 81632, "epoch": 1943} {"train_loss": -6.102819442749023, "global_step": 81633, "epoch": 1943} {"train_loss": -6.015078544616699, "global_step": 81634, "epoch": 1943} {"train_loss": -6.22074556350708, "global_step": 81635, "epoch": 1943} {"train_loss": -6.049437999725342, "global_step": 81636, "epoch": 1943} {"train_loss": -6.162908554077148, "global_step": 81637, "epoch": 1943} {"train_loss": -6.157224655151367, "global_step": 81638, "epoch": 1943} {"train_loss": -5.969429016113281, "global_step": 81639, "epoch": 1943} {"train_loss": -6.209496974945068, "global_step": 81640, "epoch": 1943} {"train_loss": -6.14164924621582, "global_step": 81641, "epoch": 1943} {"train_loss": -6.262742042541504, "global_step": 81642, "epoch": 1943} {"train_loss": -6.050859451293945, "global_step": 81643, "epoch": 1943} {"train_loss": -6.059038162231445, "global_step": 81644, "epoch": 1943} {"train_loss": -6.245934009552002, "global_step": 81645, "epoch": 1943} {"train_loss": -6.119699478149414, "global_step": 81646, "epoch": 1943} {"train_loss": -6.118763537633987, "global_step": 81647, "epoch": 1943, "val_loss": 74981.1953125} {"train_loss": -6.021884918212891, "global_step": 81648, "epoch": 1944} {"train_loss": -6.265644550323486, "global_step": 81649, "epoch": 1944} {"train_loss": -6.227715492248535, "global_step": 81650, "epoch": 1944} {"train_loss": -6.096665382385254, "global_step": 81651, "epoch": 1944} {"train_loss": -6.047358512878418, "global_step": 81652, "epoch": 1944} {"train_loss": -6.168585777282715, "global_step": 81653, "epoch": 1944} {"train_loss": -6.222962856292725, "global_step": 81654, "epoch": 1944} {"train_loss": -6.253964424133301, "global_step": 81655, "epoch": 1944} {"train_loss": -6.1692657470703125, "global_step": 81656, "epoch": 1944} {"train_loss": -6.167171955108643, "global_step": 81657, "epoch": 1944} {"train_loss": -6.160042762756348, "global_step": 81658, "epoch": 1944} {"train_loss": -6.143756866455078, "global_step": 81659, "epoch": 1944} {"train_loss": -6.110762119293213, "global_step": 81660, "epoch": 1944} {"train_loss": -6.099203586578369, "global_step": 81661, "epoch": 1944} {"train_loss": -6.208009719848633, "global_step": 81662, "epoch": 1944} {"train_loss": -6.063934803009033, "global_step": 81663, "epoch": 1944} {"train_loss": -6.259302616119385, "global_step": 81664, "epoch": 1944} {"train_loss": -6.212047100067139, "global_step": 81665, "epoch": 1944} {"train_loss": -6.148003578186035, "global_step": 81666, "epoch": 1944} {"train_loss": -6.083191394805908, "global_step": 81667, "epoch": 1944} {"train_loss": -6.093302249908447, "global_step": 81668, "epoch": 1944} {"train_loss": -6.1323065757751465, "global_step": 81669, "epoch": 1944} {"train_loss": -6.185244560241699, "global_step": 81670, "epoch": 1944} {"train_loss": -6.155695915222168, "global_step": 81671, "epoch": 1944} {"train_loss": -6.102020263671875, "global_step": 81672, "epoch": 1944} {"train_loss": -6.1868438720703125, "global_step": 81673, "epoch": 1944} {"train_loss": -6.0882744789123535, "global_step": 81674, "epoch": 1944} {"train_loss": -6.1295905113220215, "global_step": 81675, "epoch": 1944} {"train_loss": -6.134544372558594, "global_step": 81676, "epoch": 1944} {"train_loss": -6.2274861335754395, "global_step": 81677, "epoch": 1944} {"train_loss": -6.132903099060059, "global_step": 81678, "epoch": 1944} {"train_loss": -6.200404167175293, "global_step": 81679, "epoch": 1944} {"train_loss": -6.2114973068237305, "global_step": 81680, "epoch": 1944} {"train_loss": -6.250253677368164, "global_step": 81681, "epoch": 1944} {"train_loss": -6.239800453186035, "global_step": 81682, "epoch": 1944} {"train_loss": -6.1016011238098145, "global_step": 81683, "epoch": 1944} {"train_loss": -6.140974044799805, "global_step": 81684, "epoch": 1944} {"train_loss": -6.17816686630249, "global_step": 81685, "epoch": 1944} {"train_loss": -6.155296802520752, "global_step": 81686, "epoch": 1944} {"train_loss": -6.22499418258667, "global_step": 81687, "epoch": 1944} {"train_loss": -6.304871082305908, "global_step": 81688, "epoch": 1944} {"train_loss": -6.161349183037167, "global_step": 81689, "epoch": 1944, "val_loss": 74931.53125} {"train_loss": -6.215089797973633, "global_step": 81690, "epoch": 1945} {"train_loss": -6.136709213256836, "global_step": 81691, "epoch": 1945} {"train_loss": -6.245097637176514, "global_step": 81692, "epoch": 1945} {"train_loss": -6.143678665161133, "global_step": 81693, "epoch": 1945} {"train_loss": -6.202038764953613, "global_step": 81694, "epoch": 1945} {"train_loss": -6.058891773223877, "global_step": 81695, "epoch": 1945} {"train_loss": -6.125152587890625, "global_step": 81696, "epoch": 1945} {"train_loss": -6.128745079040527, "global_step": 81697, "epoch": 1945} {"train_loss": -6.099220275878906, "global_step": 81698, "epoch": 1945} {"train_loss": -6.046132564544678, "global_step": 81699, "epoch": 1945} {"train_loss": -6.216317176818848, "global_step": 81700, "epoch": 1945} {"train_loss": -5.9944610595703125, "global_step": 81701, "epoch": 1945} {"train_loss": -6.157052040100098, "global_step": 81702, "epoch": 1945} {"train_loss": -6.200692176818848, "global_step": 81703, "epoch": 1945} {"train_loss": -6.226388454437256, "global_step": 81704, "epoch": 1945} {"train_loss": -6.231431007385254, "global_step": 81705, "epoch": 1945} {"train_loss": -6.202600479125977, "global_step": 81706, "epoch": 1945} {"train_loss": -6.049549579620361, "global_step": 81707, "epoch": 1945} {"train_loss": -6.054953575134277, "global_step": 81708, "epoch": 1945} {"train_loss": -6.0174407958984375, "global_step": 81709, "epoch": 1945} {"train_loss": -6.134456634521484, "global_step": 81710, "epoch": 1945} {"train_loss": -6.084041595458984, "global_step": 81711, "epoch": 1945} {"train_loss": -6.0422844886779785, "global_step": 81712, "epoch": 1945} {"train_loss": -6.269906997680664, "global_step": 81713, "epoch": 1945} {"train_loss": -6.237604141235352, "global_step": 81714, "epoch": 1945} {"train_loss": -6.069417953491211, "global_step": 81715, "epoch": 1945} {"train_loss": -6.230722427368164, "global_step": 81716, "epoch": 1945} {"train_loss": -6.095520973205566, "global_step": 81717, "epoch": 1945} {"train_loss": -6.173439979553223, "global_step": 81718, "epoch": 1945} {"train_loss": -6.201423645019531, "global_step": 81719, "epoch": 1945} {"train_loss": -6.192115306854248, "global_step": 81720, "epoch": 1945} {"train_loss": -6.164813041687012, "global_step": 81721, "epoch": 1945} {"train_loss": -6.16335391998291, "global_step": 81722, "epoch": 1945} {"train_loss": -6.160926342010498, "global_step": 81723, "epoch": 1945} {"train_loss": -6.106689453125, "global_step": 81724, "epoch": 1945} {"train_loss": -6.227158069610596, "global_step": 81725, "epoch": 1945} {"train_loss": -6.249142646789551, "global_step": 81726, "epoch": 1945} {"train_loss": -6.0019636154174805, "global_step": 81727, "epoch": 1945} {"train_loss": -6.093947410583496, "global_step": 81728, "epoch": 1945} {"train_loss": -6.189578056335449, "global_step": 81729, "epoch": 1945} {"train_loss": -5.997073173522949, "global_step": 81730, "epoch": 1945} {"train_loss": -6.141757658549717, "global_step": 81731, "epoch": 1945, "val_loss": 75077.5859375} {"train_loss": -6.125002384185791, "global_step": 81732, "epoch": 1946} {"train_loss": -6.142868995666504, "global_step": 81733, "epoch": 1946} {"train_loss": -6.119596481323242, "global_step": 81734, "epoch": 1946} {"train_loss": -6.019972801208496, "global_step": 81735, "epoch": 1946} {"train_loss": -6.0913496017456055, "global_step": 81736, "epoch": 1946} {"train_loss": -6.089418411254883, "global_step": 81737, "epoch": 1946} {"train_loss": -6.147784233093262, "global_step": 81738, "epoch": 1946} {"train_loss": -6.161176681518555, "global_step": 81739, "epoch": 1946} {"train_loss": -6.153290271759033, "global_step": 81740, "epoch": 1946} {"train_loss": -6.052013397216797, "global_step": 81741, "epoch": 1946} {"train_loss": -6.000497341156006, "global_step": 81742, "epoch": 1946} {"train_loss": -6.068645477294922, "global_step": 81743, "epoch": 1946} {"train_loss": -6.144367218017578, "global_step": 81744, "epoch": 1946} {"train_loss": -6.128635883331299, "global_step": 81745, "epoch": 1946} {"train_loss": -6.1585235595703125, "global_step": 81746, "epoch": 1946} {"train_loss": -6.1379313468933105, "global_step": 81747, "epoch": 1946} {"train_loss": -6.160426616668701, "global_step": 81748, "epoch": 1946} {"train_loss": -6.239350318908691, "global_step": 81749, "epoch": 1946} {"train_loss": -6.175497055053711, "global_step": 81750, "epoch": 1946} {"train_loss": -6.2234320640563965, "global_step": 81751, "epoch": 1946} {"train_loss": -6.082390785217285, "global_step": 81752, "epoch": 1946} {"train_loss": -6.217571258544922, "global_step": 81753, "epoch": 1946} {"train_loss": -6.209758758544922, "global_step": 81754, "epoch": 1946} {"train_loss": -6.194849014282227, "global_step": 81755, "epoch": 1946} {"train_loss": -6.020850658416748, "global_step": 81756, "epoch": 1946} {"train_loss": -6.3065314292907715, "global_step": 81757, "epoch": 1946} {"train_loss": -6.232682228088379, "global_step": 81758, "epoch": 1946} {"train_loss": -6.0847578048706055, "global_step": 81759, "epoch": 1946} {"train_loss": -6.160799980163574, "global_step": 81760, "epoch": 1946} {"train_loss": -6.138352394104004, "global_step": 81761, "epoch": 1946} {"train_loss": -6.236009120941162, "global_step": 81762, "epoch": 1946} {"train_loss": -6.133855819702148, "global_step": 81763, "epoch": 1946} {"train_loss": -6.136154651641846, "global_step": 81764, "epoch": 1946} {"train_loss": -6.262813568115234, "global_step": 81765, "epoch": 1946} {"train_loss": -6.112146854400635, "global_step": 81766, "epoch": 1946} {"train_loss": -6.177798271179199, "global_step": 81767, "epoch": 1946} {"train_loss": -6.202166557312012, "global_step": 81768, "epoch": 1946} {"train_loss": -6.117929458618164, "global_step": 81769, "epoch": 1946} {"train_loss": -6.257876396179199, "global_step": 81770, "epoch": 1946} {"train_loss": -6.066262245178223, "global_step": 81771, "epoch": 1946} {"train_loss": -6.220198631286621, "global_step": 81772, "epoch": 1946} {"train_loss": -6.151186375390916, "global_step": 81773, "epoch": 1946, "val_loss": 75123.859375} {"train_loss": -6.105930805206299, "global_step": 81774, "epoch": 1947} {"train_loss": -6.209308624267578, "global_step": 81775, "epoch": 1947} {"train_loss": -6.125520706176758, "global_step": 81776, "epoch": 1947} {"train_loss": -6.125774383544922, "global_step": 81777, "epoch": 1947} {"train_loss": -6.215239524841309, "global_step": 81778, "epoch": 1947} {"train_loss": -6.225500583648682, "global_step": 81779, "epoch": 1947} {"train_loss": -6.256068706512451, "global_step": 81780, "epoch": 1947} {"train_loss": -6.115046501159668, "global_step": 81781, "epoch": 1947} {"train_loss": -6.059587478637695, "global_step": 81782, "epoch": 1947} {"train_loss": -6.127241611480713, "global_step": 81783, "epoch": 1947} {"train_loss": -6.1905741691589355, "global_step": 81784, "epoch": 1947} {"train_loss": -6.154266834259033, "global_step": 81785, "epoch": 1947} {"train_loss": -6.223565578460693, "global_step": 81786, "epoch": 1947} {"train_loss": -6.114681243896484, "global_step": 81787, "epoch": 1947} {"train_loss": -6.231107711791992, "global_step": 81788, "epoch": 1947} {"train_loss": -6.208917617797852, "global_step": 81789, "epoch": 1947} {"train_loss": -6.1712212562561035, "global_step": 81790, "epoch": 1947} {"train_loss": -6.096549034118652, "global_step": 81791, "epoch": 1947} {"train_loss": -6.095602035522461, "global_step": 81792, "epoch": 1947} {"train_loss": -6.201692581176758, "global_step": 81793, "epoch": 1947} {"train_loss": -6.124615669250488, "global_step": 81794, "epoch": 1947} {"train_loss": -6.1421661376953125, "global_step": 81795, "epoch": 1947} {"train_loss": -6.08795166015625, "global_step": 81796, "epoch": 1947} {"train_loss": -6.002744674682617, "global_step": 81797, "epoch": 1947} {"train_loss": -6.1042633056640625, "global_step": 81798, "epoch": 1947} {"train_loss": -6.136035919189453, "global_step": 81799, "epoch": 1947} {"train_loss": -5.990907669067383, "global_step": 81800, "epoch": 1947} {"train_loss": -6.159404754638672, "global_step": 81801, "epoch": 1947} {"train_loss": -6.185689926147461, "global_step": 81802, "epoch": 1947} {"train_loss": -6.1724934577941895, "global_step": 81803, "epoch": 1947} {"train_loss": -6.053773880004883, "global_step": 81804, "epoch": 1947} {"train_loss": -6.154047012329102, "global_step": 81805, "epoch": 1947} {"train_loss": -6.101675033569336, "global_step": 81806, "epoch": 1947} {"train_loss": -6.105898857116699, "global_step": 81807, "epoch": 1947} {"train_loss": -6.221499443054199, "global_step": 81808, "epoch": 1947} {"train_loss": -6.045236587524414, "global_step": 81809, "epoch": 1947} {"train_loss": -6.101018905639648, "global_step": 81810, "epoch": 1947} {"train_loss": -6.069958209991455, "global_step": 81811, "epoch": 1947} {"train_loss": -6.183710098266602, "global_step": 81812, "epoch": 1947} {"train_loss": -6.093750953674316, "global_step": 81813, "epoch": 1947} {"train_loss": -6.07936954498291, "global_step": 81814, "epoch": 1947} {"train_loss": -6.136633396148682, "global_step": 81815, "epoch": 1947, "val_loss": 75157.2890625} {"train_loss": -6.052774429321289, "global_step": 81816, "epoch": 1948} {"train_loss": -6.079896926879883, "global_step": 81817, "epoch": 1948} {"train_loss": -6.1613640785217285, "global_step": 81818, "epoch": 1948} {"train_loss": -6.182869911193848, "global_step": 81819, "epoch": 1948} {"train_loss": -6.226941108703613, "global_step": 81820, "epoch": 1948} {"train_loss": -6.198247909545898, "global_step": 81821, "epoch": 1948} {"train_loss": -6.119594097137451, "global_step": 81822, "epoch": 1948} {"train_loss": -6.162548065185547, "global_step": 81823, "epoch": 1948} {"train_loss": -6.191179275512695, "global_step": 81824, "epoch": 1948} {"train_loss": -6.165117263793945, "global_step": 81825, "epoch": 1948} {"train_loss": -6.157386779785156, "global_step": 81826, "epoch": 1948} {"train_loss": -6.191726207733154, "global_step": 81827, "epoch": 1948} {"train_loss": -6.2883100509643555, "global_step": 81828, "epoch": 1948} {"train_loss": -6.156167984008789, "global_step": 81829, "epoch": 1948} {"train_loss": -6.215970039367676, "global_step": 81830, "epoch": 1948} {"train_loss": -6.150992393493652, "global_step": 81831, "epoch": 1948} {"train_loss": -6.177170753479004, "global_step": 81832, "epoch": 1948} {"train_loss": -6.179792404174805, "global_step": 81833, "epoch": 1948} {"train_loss": -6.209693908691406, "global_step": 81834, "epoch": 1948} {"train_loss": -6.060792446136475, "global_step": 81835, "epoch": 1948} {"train_loss": -6.049001693725586, "global_step": 81836, "epoch": 1948} {"train_loss": -6.1452531814575195, "global_step": 81837, "epoch": 1948} {"train_loss": -6.0987443923950195, "global_step": 81838, "epoch": 1948} {"train_loss": -6.1486687660217285, "global_step": 81839, "epoch": 1948} {"train_loss": -6.109745979309082, "global_step": 81840, "epoch": 1948} {"train_loss": -6.178641319274902, "global_step": 81841, "epoch": 1948} {"train_loss": -5.997244358062744, "global_step": 81842, "epoch": 1948} {"train_loss": -6.216464042663574, "global_step": 81843, "epoch": 1948} {"train_loss": -6.079617023468018, "global_step": 81844, "epoch": 1948} {"train_loss": -6.036529064178467, "global_step": 81845, "epoch": 1948} {"train_loss": -6.238093376159668, "global_step": 81846, "epoch": 1948} {"train_loss": -6.150933742523193, "global_step": 81847, "epoch": 1948} {"train_loss": -6.067929267883301, "global_step": 81848, "epoch": 1948} {"train_loss": -5.991347312927246, "global_step": 81849, "epoch": 1948} {"train_loss": -6.232295989990234, "global_step": 81850, "epoch": 1948} {"train_loss": -6.22487735748291, "global_step": 81851, "epoch": 1948} {"train_loss": -6.156167030334473, "global_step": 81852, "epoch": 1948} {"train_loss": -6.171523094177246, "global_step": 81853, "epoch": 1948} {"train_loss": -6.107308387756348, "global_step": 81854, "epoch": 1948} {"train_loss": -6.142889976501465, "global_step": 81855, "epoch": 1948} {"train_loss": -6.0630693435668945, "global_step": 81856, "epoch": 1948} {"train_loss": -6.144648404348464, "global_step": 81857, "epoch": 1948, "val_loss": 74953.875} {"train_loss": -6.114656448364258, "global_step": 81858, "epoch": 1949} {"train_loss": -6.218937397003174, "global_step": 81859, "epoch": 1949} {"train_loss": -6.2835588455200195, "global_step": 81860, "epoch": 1949} {"train_loss": -6.200933456420898, "global_step": 81861, "epoch": 1949} {"train_loss": -6.2653703689575195, "global_step": 81862, "epoch": 1949} {"train_loss": -6.17487096786499, "global_step": 81863, "epoch": 1949} {"train_loss": -6.143411636352539, "global_step": 81864, "epoch": 1949} {"train_loss": -6.1517333984375, "global_step": 81865, "epoch": 1949} {"train_loss": -6.282861709594727, "global_step": 81866, "epoch": 1949} {"train_loss": -6.305788993835449, "global_step": 81867, "epoch": 1949} {"train_loss": -6.273882865905762, "global_step": 81868, "epoch": 1949} {"train_loss": -6.107154369354248, "global_step": 81869, "epoch": 1949} {"train_loss": -6.217340469360352, "global_step": 81870, "epoch": 1949} {"train_loss": -6.137428283691406, "global_step": 81871, "epoch": 1949} {"train_loss": -6.206821441650391, "global_step": 81872, "epoch": 1949} {"train_loss": -6.257777690887451, "global_step": 81873, "epoch": 1949} {"train_loss": -6.080416679382324, "global_step": 81874, "epoch": 1949} {"train_loss": -6.049750328063965, "global_step": 81875, "epoch": 1949} {"train_loss": -6.119387149810791, "global_step": 81876, "epoch": 1949} {"train_loss": -6.2671732902526855, "global_step": 81877, "epoch": 1949} {"train_loss": -6.030004501342773, "global_step": 81878, "epoch": 1949} {"train_loss": -6.1288676261901855, "global_step": 81879, "epoch": 1949} {"train_loss": -6.1913838386535645, "global_step": 81880, "epoch": 1949} {"train_loss": -6.148507118225098, "global_step": 81881, "epoch": 1949} {"train_loss": -6.19642972946167, "global_step": 81882, "epoch": 1949} {"train_loss": -5.957734107971191, "global_step": 81883, "epoch": 1949} {"train_loss": -6.106525897979736, "global_step": 81884, "epoch": 1949} {"train_loss": -6.134792327880859, "global_step": 81885, "epoch": 1949} {"train_loss": -6.271723747253418, "global_step": 81886, "epoch": 1949} {"train_loss": -6.1678996086120605, "global_step": 81887, "epoch": 1949} {"train_loss": -6.127436637878418, "global_step": 81888, "epoch": 1949} {"train_loss": -6.0949482917785645, "global_step": 81889, "epoch": 1949} {"train_loss": -6.189714431762695, "global_step": 81890, "epoch": 1949} {"train_loss": -6.0351362228393555, "global_step": 81891, "epoch": 1949} {"train_loss": -6.108931064605713, "global_step": 81892, "epoch": 1949} {"train_loss": -6.081007957458496, "global_step": 81893, "epoch": 1949} {"train_loss": -6.189977645874023, "global_step": 81894, "epoch": 1949} {"train_loss": -6.031219482421875, "global_step": 81895, "epoch": 1949} {"train_loss": -6.0496134757995605, "global_step": 81896, "epoch": 1949} {"train_loss": -6.11712121963501, "global_step": 81897, "epoch": 1949} {"train_loss": -6.151815414428711, "global_step": 81898, "epoch": 1949} {"train_loss": -6.154900868733724, "global_step": 81899, "epoch": 1949, "val_loss": 75050.5546875} {"train_loss": -6.0950026512146, "global_step": 81900, "epoch": 1950} {"train_loss": -6.154602527618408, "global_step": 81901, "epoch": 1950} {"train_loss": -6.186027526855469, "global_step": 81902, "epoch": 1950} {"train_loss": -6.190128326416016, "global_step": 81903, "epoch": 1950} {"train_loss": -6.189248085021973, "global_step": 81904, "epoch": 1950} {"train_loss": -6.095717430114746, "global_step": 81905, "epoch": 1950} {"train_loss": -6.05806303024292, "global_step": 81906, "epoch": 1950} {"train_loss": -6.106536865234375, "global_step": 81907, "epoch": 1950} {"train_loss": -6.184597015380859, "global_step": 81908, "epoch": 1950} {"train_loss": -6.094128608703613, "global_step": 81909, "epoch": 1950} {"train_loss": -6.165580749511719, "global_step": 81910, "epoch": 1950} {"train_loss": -6.169726371765137, "global_step": 81911, "epoch": 1950} {"train_loss": -6.221595764160156, "global_step": 81912, "epoch": 1950} {"train_loss": -6.084394454956055, "global_step": 81913, "epoch": 1950} {"train_loss": -6.144579887390137, "global_step": 81914, "epoch": 1950} {"train_loss": -6.197732925415039, "global_step": 81915, "epoch": 1950} {"train_loss": -6.073773384094238, "global_step": 81916, "epoch": 1950} {"train_loss": -6.221783638000488, "global_step": 81917, "epoch": 1950} {"train_loss": -6.191884994506836, "global_step": 81918, "epoch": 1950} {"train_loss": -6.077695846557617, "global_step": 81919, "epoch": 1950} {"train_loss": -6.312709808349609, "global_step": 81920, "epoch": 1950} {"train_loss": -6.202704429626465, "global_step": 81921, "epoch": 1950} {"train_loss": -6.158927917480469, "global_step": 81922, "epoch": 1950} {"train_loss": -6.164202690124512, "global_step": 81923, "epoch": 1950} {"train_loss": -6.136676788330078, "global_step": 81924, "epoch": 1950} {"train_loss": -6.1405205726623535, "global_step": 81925, "epoch": 1950} {"train_loss": -6.259366035461426, "global_step": 81926, "epoch": 1950} {"train_loss": -6.1718034744262695, "global_step": 81927, "epoch": 1950} {"train_loss": -6.060647964477539, "global_step": 81928, "epoch": 1950} {"train_loss": -6.203271865844727, "global_step": 81929, "epoch": 1950} {"train_loss": -6.1891069412231445, "global_step": 81930, "epoch": 1950} {"train_loss": -6.133683204650879, "global_step": 81931, "epoch": 1950} {"train_loss": -6.186664581298828, "global_step": 81932, "epoch": 1950} {"train_loss": -6.04893684387207, "global_step": 81933, "epoch": 1950} {"train_loss": -6.289119243621826, "global_step": 81934, "epoch": 1950} {"train_loss": -6.174385070800781, "global_step": 81935, "epoch": 1950} {"train_loss": -5.993645668029785, "global_step": 81936, "epoch": 1950} {"train_loss": -6.136504173278809, "global_step": 81937, "epoch": 1950} {"train_loss": -6.108615875244141, "global_step": 81938, "epoch": 1950} {"train_loss": -6.071910858154297, "global_step": 81939, "epoch": 1950} {"train_loss": -6.174555778503418, "global_step": 81940, "epoch": 1950} {"train_loss": -6.150707460585094, "global_step": 81941, "epoch": 1950, "train/sim_max_reward_0": 0.23708319432352065, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.701755139382145, "train/sim_max_reward_3": 0.15504492247314744, "train/sim_max_reward_4": 0.9594273730230753, "train/sim_max_reward_5": 0.7870168744919361, "test/sim_max_reward_4500000": 0.31951024937066624, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9007074302661295, "test/sim_max_reward_4500003": 0.9920136625396518, "test/sim_max_reward_4500004": 0.7726908316898141, "test/sim_max_reward_4500005": 0.3686983641533242, "test/sim_max_reward_4500006": 0.9373207863906912, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.61686717645858, "test/sim_max_reward_4500009": 0.9855228814325496, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.6282497451188891, "test/sim_max_reward_4500012": 0.9752407751308491, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.38301539879191887, "test/sim_max_reward_4500015": 0.8951990397294408, "test/sim_max_reward_4500016": 0.4585662961216456, "test/sim_max_reward_4500017": 0.08864741993971527, "test/sim_max_reward_4500018": 0.40922930703562715, "test/sim_max_reward_4500019": 0.47054652694852483, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8472551521483838, "test/sim_max_reward_4500022": 0.9752086009636006, "test/sim_max_reward_4500023": 0.9990560914495309, "test/sim_max_reward_4500024": 0.8795607427490135, "test/sim_max_reward_4500025": 0.5218006734474679, "test/sim_max_reward_4500026": 0.8575143862617035, "test/sim_max_reward_4500027": 0.9786005080142338, "test/sim_max_reward_4500028": 0.18993199263220123, "test/sim_max_reward_4500029": 0.13052630248911623, "test/sim_max_reward_4500030": 0.9856763819586919, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.9330473765699523, "test/sim_max_reward_4500033": 0.851348275739229, "test/sim_max_reward_4500034": 0.773604730999154, "test/sim_max_reward_4500035": 0.8427001806535296, "test/sim_max_reward_4500036": 0.9052473015558996, "test/sim_max_reward_4500037": 0.942038646847312, "test/sim_max_reward_4500038": 0.9561020048395545, "test/sim_max_reward_4500039": 0.9737123638516676, "test/sim_max_reward_4500040": 0.9963747309061807, "test/sim_max_reward_4500041": 0.3883932253428649, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.13672292294140145, "test/sim_max_reward_4500044": 0.7804092525592063, "test/sim_max_reward_4500045": 0.38850837522061016, "test/sim_max_reward_4500046": 0.7967981002223757, "test/sim_max_reward_4500047": 0.9332650556011306, "test/sim_max_reward_4500048": 0.0064131436247492745, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6400545839489707, "test/mean_score": 0.6038856411843373, "val_loss": 75116.59375} {"train_loss": -6.168207168579102, "global_step": 81942, "epoch": 1951} {"train_loss": -6.128171920776367, "global_step": 81943, "epoch": 1951} {"train_loss": -6.098118782043457, "global_step": 81944, "epoch": 1951} {"train_loss": -6.161198616027832, "global_step": 81945, "epoch": 1951} {"train_loss": -6.139374256134033, "global_step": 81946, "epoch": 1951} {"train_loss": -6.159093856811523, "global_step": 81947, "epoch": 1951} {"train_loss": -6.18312931060791, "global_step": 81948, "epoch": 1951} {"train_loss": -6.130145072937012, "global_step": 81949, "epoch": 1951} {"train_loss": -6.153532981872559, "global_step": 81950, "epoch": 1951} {"train_loss": -6.242703437805176, "global_step": 81951, "epoch": 1951} {"train_loss": -6.1286420822143555, "global_step": 81952, "epoch": 1951} {"train_loss": -6.160703182220459, "global_step": 81953, "epoch": 1951} {"train_loss": -6.121979713439941, "global_step": 81954, "epoch": 1951} {"train_loss": -6.213427543640137, "global_step": 81955, "epoch": 1951} {"train_loss": -6.15387487411499, "global_step": 81956, "epoch": 1951} {"train_loss": -6.141182899475098, "global_step": 81957, "epoch": 1951} {"train_loss": -6.226245403289795, "global_step": 81958, "epoch": 1951} {"train_loss": -6.108555793762207, "global_step": 81959, "epoch": 1951} {"train_loss": -6.199975490570068, "global_step": 81960, "epoch": 1951} {"train_loss": -6.168396949768066, "global_step": 81961, "epoch": 1951} {"train_loss": -6.264737129211426, "global_step": 81962, "epoch": 1951} {"train_loss": -6.04615592956543, "global_step": 81963, "epoch": 1951} {"train_loss": -6.0992937088012695, "global_step": 81964, "epoch": 1951} {"train_loss": -6.170644760131836, "global_step": 81965, "epoch": 1951} {"train_loss": -6.117805480957031, "global_step": 81966, "epoch": 1951} {"train_loss": -6.265091419219971, "global_step": 81967, "epoch": 1951} {"train_loss": -6.234488010406494, "global_step": 81968, "epoch": 1951} {"train_loss": -6.281911373138428, "global_step": 81969, "epoch": 1951} {"train_loss": -6.259105205535889, "global_step": 81970, "epoch": 1951} {"train_loss": -6.140486717224121, "global_step": 81971, "epoch": 1951} {"train_loss": -6.261227130889893, "global_step": 81972, "epoch": 1951} {"train_loss": -6.087034225463867, "global_step": 81973, "epoch": 1951} {"train_loss": -6.170404434204102, "global_step": 81974, "epoch": 1951} {"train_loss": -6.216030120849609, "global_step": 81975, "epoch": 1951} {"train_loss": -6.222949028015137, "global_step": 81976, "epoch": 1951} {"train_loss": -6.05682897567749, "global_step": 81977, "epoch": 1951} {"train_loss": -6.302881240844727, "global_step": 81978, "epoch": 1951} {"train_loss": -6.175436973571777, "global_step": 81979, "epoch": 1951} {"train_loss": -6.185675144195557, "global_step": 81980, "epoch": 1951} {"train_loss": -6.251482963562012, "global_step": 81981, "epoch": 1951} {"train_loss": -5.983654022216797, "global_step": 81982, "epoch": 1951} {"train_loss": -6.168343112582252, "global_step": 81983, "epoch": 1951, "val_loss": 75046.5} {"train_loss": -6.119797706604004, "global_step": 81984, "epoch": 1952} {"train_loss": -6.152215003967285, "global_step": 81985, "epoch": 1952} {"train_loss": -6.371591567993164, "global_step": 81986, "epoch": 1952} {"train_loss": -6.148558616638184, "global_step": 81987, "epoch": 1952} {"train_loss": -6.198930740356445, "global_step": 81988, "epoch": 1952} {"train_loss": -6.199224472045898, "global_step": 81989, "epoch": 1952} {"train_loss": -6.143312454223633, "global_step": 81990, "epoch": 1952} {"train_loss": -6.195473670959473, "global_step": 81991, "epoch": 1952} {"train_loss": -6.146572589874268, "global_step": 81992, "epoch": 1952} {"train_loss": -6.21888542175293, "global_step": 81993, "epoch": 1952} {"train_loss": -6.209425926208496, "global_step": 81994, "epoch": 1952} {"train_loss": -6.1472272872924805, "global_step": 81995, "epoch": 1952} {"train_loss": -6.1298017501831055, "global_step": 81996, "epoch": 1952} {"train_loss": -6.086931228637695, "global_step": 81997, "epoch": 1952} {"train_loss": -6.1335906982421875, "global_step": 81998, "epoch": 1952} {"train_loss": -6.130864143371582, "global_step": 81999, "epoch": 1952} {"train_loss": -6.039365768432617, "global_step": 82000, "epoch": 1952} {"train_loss": -6.208356857299805, "global_step": 82001, "epoch": 1952} {"train_loss": -6.249392032623291, "global_step": 82002, "epoch": 1952} {"train_loss": -6.1145195960998535, "global_step": 82003, "epoch": 1952} {"train_loss": -6.230140686035156, "global_step": 82004, "epoch": 1952} {"train_loss": -6.194883346557617, "global_step": 82005, "epoch": 1952} {"train_loss": -6.029125213623047, "global_step": 82006, "epoch": 1952} {"train_loss": -6.091619968414307, "global_step": 82007, "epoch": 1952} {"train_loss": -6.084747314453125, "global_step": 82008, "epoch": 1952} {"train_loss": -6.010290622711182, "global_step": 82009, "epoch": 1952} {"train_loss": -6.062121391296387, "global_step": 82010, "epoch": 1952} {"train_loss": -6.108619689941406, "global_step": 82011, "epoch": 1952} {"train_loss": -6.063981056213379, "global_step": 82012, "epoch": 1952} {"train_loss": -6.08512020111084, "global_step": 82013, "epoch": 1952} {"train_loss": -6.1527628898620605, "global_step": 82014, "epoch": 1952} {"train_loss": -6.237796306610107, "global_step": 82015, "epoch": 1952} {"train_loss": -6.113286018371582, "global_step": 82016, "epoch": 1952} {"train_loss": -6.254427909851074, "global_step": 82017, "epoch": 1952} {"train_loss": -6.323164939880371, "global_step": 82018, "epoch": 1952} {"train_loss": -6.188455581665039, "global_step": 82019, "epoch": 1952} {"train_loss": -6.292703628540039, "global_step": 82020, "epoch": 1952} {"train_loss": -6.113645553588867, "global_step": 82021, "epoch": 1952} {"train_loss": -6.087276458740234, "global_step": 82022, "epoch": 1952} {"train_loss": -6.191647052764893, "global_step": 82023, "epoch": 1952} {"train_loss": -6.1526336669921875, "global_step": 82024, "epoch": 1952} {"train_loss": -6.157709927785964, "global_step": 82025, "epoch": 1952, "val_loss": 74892.7734375} {"train_loss": -6.1242995262146, "global_step": 82026, "epoch": 1953} {"train_loss": -6.264589309692383, "global_step": 82027, "epoch": 1953} {"train_loss": -6.165604591369629, "global_step": 82028, "epoch": 1953} {"train_loss": -6.154545783996582, "global_step": 82029, "epoch": 1953} {"train_loss": -6.168431282043457, "global_step": 82030, "epoch": 1953} {"train_loss": -6.244246482849121, "global_step": 82031, "epoch": 1953} {"train_loss": -6.279026985168457, "global_step": 82032, "epoch": 1953} {"train_loss": -6.1141743659973145, "global_step": 82033, "epoch": 1953} {"train_loss": -6.185877799987793, "global_step": 82034, "epoch": 1953} {"train_loss": -6.2267303466796875, "global_step": 82035, "epoch": 1953} {"train_loss": -6.206349849700928, "global_step": 82036, "epoch": 1953} {"train_loss": -6.215171813964844, "global_step": 82037, "epoch": 1953} {"train_loss": -6.0820441246032715, "global_step": 82038, "epoch": 1953} {"train_loss": -6.125460624694824, "global_step": 82039, "epoch": 1953} {"train_loss": -6.247471332550049, "global_step": 82040, "epoch": 1953} {"train_loss": -6.16937255859375, "global_step": 82041, "epoch": 1953} {"train_loss": -6.137417316436768, "global_step": 82042, "epoch": 1953} {"train_loss": -6.025883197784424, "global_step": 82043, "epoch": 1953} {"train_loss": -6.034453392028809, "global_step": 82044, "epoch": 1953} {"train_loss": -6.085193634033203, "global_step": 82045, "epoch": 1953} {"train_loss": -6.07087516784668, "global_step": 82046, "epoch": 1953} {"train_loss": -5.989371299743652, "global_step": 82047, "epoch": 1953} {"train_loss": -6.078801155090332, "global_step": 82048, "epoch": 1953} {"train_loss": -6.186337947845459, "global_step": 82049, "epoch": 1953} {"train_loss": -6.116020679473877, "global_step": 82050, "epoch": 1953} {"train_loss": -6.033312797546387, "global_step": 82051, "epoch": 1953} {"train_loss": -6.191653251647949, "global_step": 82052, "epoch": 1953} {"train_loss": -6.195529937744141, "global_step": 82053, "epoch": 1953} {"train_loss": -6.209511756896973, "global_step": 82054, "epoch": 1953} {"train_loss": -6.085916996002197, "global_step": 82055, "epoch": 1953} {"train_loss": -6.144486427307129, "global_step": 82056, "epoch": 1953} {"train_loss": -6.1206817626953125, "global_step": 82057, "epoch": 1953} {"train_loss": -6.046073913574219, "global_step": 82058, "epoch": 1953} {"train_loss": -6.110119819641113, "global_step": 82059, "epoch": 1953} {"train_loss": -6.1879072189331055, "global_step": 82060, "epoch": 1953} {"train_loss": -6.296834945678711, "global_step": 82061, "epoch": 1953} {"train_loss": -6.150256156921387, "global_step": 82062, "epoch": 1953} {"train_loss": -6.104479789733887, "global_step": 82063, "epoch": 1953} {"train_loss": -6.155057907104492, "global_step": 82064, "epoch": 1953} {"train_loss": -6.237714767456055, "global_step": 82065, "epoch": 1953} {"train_loss": -6.203489303588867, "global_step": 82066, "epoch": 1953} {"train_loss": -6.152358214060466, "global_step": 82067, "epoch": 1953, "val_loss": 74749.8984375} {"train_loss": -6.025360107421875, "global_step": 82068, "epoch": 1954} {"train_loss": -6.143375396728516, "global_step": 82069, "epoch": 1954} {"train_loss": -6.262462615966797, "global_step": 82070, "epoch": 1954} {"train_loss": -6.147504806518555, "global_step": 82071, "epoch": 1954} {"train_loss": -6.292906761169434, "global_step": 82072, "epoch": 1954} {"train_loss": -6.124508857727051, "global_step": 82073, "epoch": 1954} {"train_loss": -6.237298011779785, "global_step": 82074, "epoch": 1954} {"train_loss": -6.207330703735352, "global_step": 82075, "epoch": 1954} {"train_loss": -6.000485420227051, "global_step": 82076, "epoch": 1954} {"train_loss": -6.14707612991333, "global_step": 82077, "epoch": 1954} {"train_loss": -6.173563480377197, "global_step": 82078, "epoch": 1954} {"train_loss": -6.092179775238037, "global_step": 82079, "epoch": 1954} {"train_loss": -6.232423782348633, "global_step": 82080, "epoch": 1954} {"train_loss": -6.05509090423584, "global_step": 82081, "epoch": 1954} {"train_loss": -6.104928016662598, "global_step": 82082, "epoch": 1954} {"train_loss": -6.230785846710205, "global_step": 82083, "epoch": 1954} {"train_loss": -6.109687328338623, "global_step": 82084, "epoch": 1954} {"train_loss": -6.189962387084961, "global_step": 82085, "epoch": 1954} {"train_loss": -6.216435432434082, "global_step": 82086, "epoch": 1954} {"train_loss": -6.096494197845459, "global_step": 82087, "epoch": 1954} {"train_loss": -6.122984886169434, "global_step": 82088, "epoch": 1954} {"train_loss": -6.131534576416016, "global_step": 82089, "epoch": 1954} {"train_loss": -6.290156364440918, "global_step": 82090, "epoch": 1954} {"train_loss": -6.1338396072387695, "global_step": 82091, "epoch": 1954} {"train_loss": -6.14134407043457, "global_step": 82092, "epoch": 1954} {"train_loss": -6.119140625, "global_step": 82093, "epoch": 1954} {"train_loss": -6.1297383308410645, "global_step": 82094, "epoch": 1954} {"train_loss": -6.2086591720581055, "global_step": 82095, "epoch": 1954} {"train_loss": -6.2403059005737305, "global_step": 82096, "epoch": 1954} {"train_loss": -6.030421733856201, "global_step": 82097, "epoch": 1954} {"train_loss": -6.1795148849487305, "global_step": 82098, "epoch": 1954} {"train_loss": -6.236732482910156, "global_step": 82099, "epoch": 1954} {"train_loss": -6.1039628982543945, "global_step": 82100, "epoch": 1954} {"train_loss": -6.190390586853027, "global_step": 82101, "epoch": 1954} {"train_loss": -6.131040573120117, "global_step": 82102, "epoch": 1954} {"train_loss": -6.093357563018799, "global_step": 82103, "epoch": 1954} {"train_loss": -6.126775741577148, "global_step": 82104, "epoch": 1954} {"train_loss": -6.102121353149414, "global_step": 82105, "epoch": 1954} {"train_loss": -6.2165608406066895, "global_step": 82106, "epoch": 1954} {"train_loss": -6.074950218200684, "global_step": 82107, "epoch": 1954} {"train_loss": -6.223416328430176, "global_step": 82108, "epoch": 1954} {"train_loss": -6.155048109236217, "global_step": 82109, "epoch": 1954, "val_loss": 75053.359375} {"train_loss": -6.087162017822266, "global_step": 82110, "epoch": 1955} {"train_loss": -6.131426811218262, "global_step": 82111, "epoch": 1955} {"train_loss": -6.172370910644531, "global_step": 82112, "epoch": 1955} {"train_loss": -6.0689287185668945, "global_step": 82113, "epoch": 1955} {"train_loss": -6.159467697143555, "global_step": 82114, "epoch": 1955} {"train_loss": -6.048801422119141, "global_step": 82115, "epoch": 1955} {"train_loss": -6.0438618659973145, "global_step": 82116, "epoch": 1955} {"train_loss": -6.118607521057129, "global_step": 82117, "epoch": 1955} {"train_loss": -6.109521865844727, "global_step": 82118, "epoch": 1955} {"train_loss": -6.101949691772461, "global_step": 82119, "epoch": 1955} {"train_loss": -6.150350570678711, "global_step": 82120, "epoch": 1955} {"train_loss": -6.186881065368652, "global_step": 82121, "epoch": 1955} {"train_loss": -6.250790119171143, "global_step": 82122, "epoch": 1955} {"train_loss": -6.261833667755127, "global_step": 82123, "epoch": 1955} {"train_loss": -6.051366329193115, "global_step": 82124, "epoch": 1955} {"train_loss": -6.2526373863220215, "global_step": 82125, "epoch": 1955} {"train_loss": -6.216103553771973, "global_step": 82126, "epoch": 1955} {"train_loss": -6.091813087463379, "global_step": 82127, "epoch": 1955} {"train_loss": -6.242056846618652, "global_step": 82128, "epoch": 1955} {"train_loss": -6.032581806182861, "global_step": 82129, "epoch": 1955} {"train_loss": -6.098695755004883, "global_step": 82130, "epoch": 1955} {"train_loss": -6.145298480987549, "global_step": 82131, "epoch": 1955} {"train_loss": -6.194587707519531, "global_step": 82132, "epoch": 1955} {"train_loss": -6.257949352264404, "global_step": 82133, "epoch": 1955} {"train_loss": -6.118591785430908, "global_step": 82134, "epoch": 1955} {"train_loss": -6.268191337585449, "global_step": 82135, "epoch": 1955} {"train_loss": -6.019521713256836, "global_step": 82136, "epoch": 1955} {"train_loss": -6.056787014007568, "global_step": 82137, "epoch": 1955} {"train_loss": -6.092578887939453, "global_step": 82138, "epoch": 1955} {"train_loss": -6.046228885650635, "global_step": 82139, "epoch": 1955} {"train_loss": -6.05710506439209, "global_step": 82140, "epoch": 1955} {"train_loss": -6.11783504486084, "global_step": 82141, "epoch": 1955} {"train_loss": -6.226746082305908, "global_step": 82142, "epoch": 1955} {"train_loss": -6.160378456115723, "global_step": 82143, "epoch": 1955} {"train_loss": -6.252601146697998, "global_step": 82144, "epoch": 1955} {"train_loss": -6.198038101196289, "global_step": 82145, "epoch": 1955} {"train_loss": -6.151918411254883, "global_step": 82146, "epoch": 1955} {"train_loss": -6.02978515625, "global_step": 82147, "epoch": 1955} {"train_loss": -6.150146484375, "global_step": 82148, "epoch": 1955} {"train_loss": -6.113368988037109, "global_step": 82149, "epoch": 1955} {"train_loss": -6.043998718261719, "global_step": 82150, "epoch": 1955} {"train_loss": -6.136313268116543, "global_step": 82151, "epoch": 1955, "val_loss": 75190.6796875} {"train_loss": -6.032777786254883, "global_step": 82152, "epoch": 1956} {"train_loss": -6.10809326171875, "global_step": 82153, "epoch": 1956} {"train_loss": -6.224107265472412, "global_step": 82154, "epoch": 1956} {"train_loss": -6.138258934020996, "global_step": 82155, "epoch": 1956} {"train_loss": -6.169586658477783, "global_step": 82156, "epoch": 1956} {"train_loss": -6.093395233154297, "global_step": 82157, "epoch": 1956} {"train_loss": -6.165250301361084, "global_step": 82158, "epoch": 1956} {"train_loss": -6.1958489418029785, "global_step": 82159, "epoch": 1956} {"train_loss": -6.1368408203125, "global_step": 82160, "epoch": 1956} {"train_loss": -6.172053813934326, "global_step": 82161, "epoch": 1956} {"train_loss": -6.159669876098633, "global_step": 82162, "epoch": 1956} {"train_loss": -6.160231590270996, "global_step": 82163, "epoch": 1956} {"train_loss": -6.091769218444824, "global_step": 82164, "epoch": 1956} {"train_loss": -6.137556552886963, "global_step": 82165, "epoch": 1956} {"train_loss": -6.252720832824707, "global_step": 82166, "epoch": 1956} {"train_loss": -6.0838165283203125, "global_step": 82167, "epoch": 1956} {"train_loss": -6.19997501373291, "global_step": 82168, "epoch": 1956} {"train_loss": -6.177236557006836, "global_step": 82169, "epoch": 1956} {"train_loss": -6.128787517547607, "global_step": 82170, "epoch": 1956} {"train_loss": -6.254914283752441, "global_step": 82171, "epoch": 1956} {"train_loss": -6.022390365600586, "global_step": 82172, "epoch": 1956} {"train_loss": -6.105045318603516, "global_step": 82173, "epoch": 1956} {"train_loss": -5.999748706817627, "global_step": 82174, "epoch": 1956} {"train_loss": -6.211708068847656, "global_step": 82175, "epoch": 1956} {"train_loss": -6.117886543273926, "global_step": 82176, "epoch": 1956} {"train_loss": -5.987212181091309, "global_step": 82177, "epoch": 1956} {"train_loss": -6.173212051391602, "global_step": 82178, "epoch": 1956} {"train_loss": -6.047910690307617, "global_step": 82179, "epoch": 1956} {"train_loss": -6.086047172546387, "global_step": 82180, "epoch": 1956} {"train_loss": -6.032013893127441, "global_step": 82181, "epoch": 1956} {"train_loss": -6.06776762008667, "global_step": 82182, "epoch": 1956} {"train_loss": -6.147006988525391, "global_step": 82183, "epoch": 1956} {"train_loss": -6.157052993774414, "global_step": 82184, "epoch": 1956} {"train_loss": -6.15223503112793, "global_step": 82185, "epoch": 1956} {"train_loss": -6.245922088623047, "global_step": 82186, "epoch": 1956} {"train_loss": -6.201127052307129, "global_step": 82187, "epoch": 1956} {"train_loss": -6.177195072174072, "global_step": 82188, "epoch": 1956} {"train_loss": -6.166202545166016, "global_step": 82189, "epoch": 1956} {"train_loss": -6.100143909454346, "global_step": 82190, "epoch": 1956} {"train_loss": -6.052246570587158, "global_step": 82191, "epoch": 1956} {"train_loss": -6.156919479370117, "global_step": 82192, "epoch": 1956} {"train_loss": -6.133824246270316, "global_step": 82193, "epoch": 1956, "val_loss": 75072.328125} {"train_loss": -6.164690017700195, "global_step": 82194, "epoch": 1957} {"train_loss": -6.084824562072754, "global_step": 82195, "epoch": 1957} {"train_loss": -6.121363162994385, "global_step": 82196, "epoch": 1957} {"train_loss": -6.063329219818115, "global_step": 82197, "epoch": 1957} {"train_loss": -6.082793235778809, "global_step": 82198, "epoch": 1957} {"train_loss": -6.197836399078369, "global_step": 82199, "epoch": 1957} {"train_loss": -6.147392272949219, "global_step": 82200, "epoch": 1957} {"train_loss": -6.214895248413086, "global_step": 82201, "epoch": 1957} {"train_loss": -6.091129302978516, "global_step": 82202, "epoch": 1957} {"train_loss": -6.098876953125, "global_step": 82203, "epoch": 1957} {"train_loss": -6.146245002746582, "global_step": 82204, "epoch": 1957} {"train_loss": -6.193276882171631, "global_step": 82205, "epoch": 1957} {"train_loss": -6.02641487121582, "global_step": 82206, "epoch": 1957} {"train_loss": -6.137240886688232, "global_step": 82207, "epoch": 1957} {"train_loss": -6.1045379638671875, "global_step": 82208, "epoch": 1957} {"train_loss": -6.098978042602539, "global_step": 82209, "epoch": 1957} {"train_loss": -6.278936386108398, "global_step": 82210, "epoch": 1957} {"train_loss": -6.087025165557861, "global_step": 82211, "epoch": 1957} {"train_loss": -6.0668840408325195, "global_step": 82212, "epoch": 1957} {"train_loss": -6.175221920013428, "global_step": 82213, "epoch": 1957} {"train_loss": -6.214930534362793, "global_step": 82214, "epoch": 1957} {"train_loss": -6.142560958862305, "global_step": 82215, "epoch": 1957} {"train_loss": -6.081881046295166, "global_step": 82216, "epoch": 1957} {"train_loss": -6.2487921714782715, "global_step": 82217, "epoch": 1957} {"train_loss": -6.246410846710205, "global_step": 82218, "epoch": 1957} {"train_loss": -6.180768966674805, "global_step": 82219, "epoch": 1957} {"train_loss": -6.208576202392578, "global_step": 82220, "epoch": 1957} {"train_loss": -6.1263532638549805, "global_step": 82221, "epoch": 1957} {"train_loss": -6.201539993286133, "global_step": 82222, "epoch": 1957} {"train_loss": -6.118748664855957, "global_step": 82223, "epoch": 1957} {"train_loss": -6.180540561676025, "global_step": 82224, "epoch": 1957} {"train_loss": -6.259093761444092, "global_step": 82225, "epoch": 1957} {"train_loss": -6.15408992767334, "global_step": 82226, "epoch": 1957} {"train_loss": -6.165027141571045, "global_step": 82227, "epoch": 1957} {"train_loss": -6.118380069732666, "global_step": 82228, "epoch": 1957} {"train_loss": -6.276349067687988, "global_step": 82229, "epoch": 1957} {"train_loss": -6.046392917633057, "global_step": 82230, "epoch": 1957} {"train_loss": -6.032339572906494, "global_step": 82231, "epoch": 1957} {"train_loss": -6.118105888366699, "global_step": 82232, "epoch": 1957} {"train_loss": -6.24202299118042, "global_step": 82233, "epoch": 1957} {"train_loss": -6.2042365074157715, "global_step": 82234, "epoch": 1957} {"train_loss": -6.151219731285458, "global_step": 82235, "epoch": 1957, "val_loss": 74941.328125} {"train_loss": -6.254238605499268, "global_step": 82236, "epoch": 1958} {"train_loss": -6.316420078277588, "global_step": 82237, "epoch": 1958} {"train_loss": -6.079756736755371, "global_step": 82238, "epoch": 1958} {"train_loss": -6.0769195556640625, "global_step": 82239, "epoch": 1958} {"train_loss": -6.24498176574707, "global_step": 82240, "epoch": 1958} {"train_loss": -6.345526218414307, "global_step": 82241, "epoch": 1958} {"train_loss": -6.255248069763184, "global_step": 82242, "epoch": 1958} {"train_loss": -6.1809539794921875, "global_step": 82243, "epoch": 1958} {"train_loss": -6.143656253814697, "global_step": 82244, "epoch": 1958} {"train_loss": -6.161157131195068, "global_step": 82245, "epoch": 1958} {"train_loss": -6.207590103149414, "global_step": 82246, "epoch": 1958} {"train_loss": -6.085206985473633, "global_step": 82247, "epoch": 1958} {"train_loss": -6.268239498138428, "global_step": 82248, "epoch": 1958} {"train_loss": -6.097019195556641, "global_step": 82249, "epoch": 1958} {"train_loss": -6.264604091644287, "global_step": 82250, "epoch": 1958} {"train_loss": -6.2013397216796875, "global_step": 82251, "epoch": 1958} {"train_loss": -6.161864280700684, "global_step": 82252, "epoch": 1958} {"train_loss": -6.165809154510498, "global_step": 82253, "epoch": 1958} {"train_loss": -6.132336616516113, "global_step": 82254, "epoch": 1958} {"train_loss": -6.191400527954102, "global_step": 82255, "epoch": 1958} {"train_loss": -5.954755783081055, "global_step": 82256, "epoch": 1958} {"train_loss": -6.136040687561035, "global_step": 82257, "epoch": 1958} {"train_loss": -6.133710861206055, "global_step": 82258, "epoch": 1958} {"train_loss": -6.234005928039551, "global_step": 82259, "epoch": 1958} {"train_loss": -6.239872932434082, "global_step": 82260, "epoch": 1958} {"train_loss": -6.214181900024414, "global_step": 82261, "epoch": 1958} {"train_loss": -6.141669750213623, "global_step": 82262, "epoch": 1958} {"train_loss": -6.181227684020996, "global_step": 82263, "epoch": 1958} {"train_loss": -6.135092735290527, "global_step": 82264, "epoch": 1958} {"train_loss": -6.246490001678467, "global_step": 82265, "epoch": 1958} {"train_loss": -6.0737385749816895, "global_step": 82266, "epoch": 1958} {"train_loss": -6.1687912940979, "global_step": 82267, "epoch": 1958} {"train_loss": -6.183935165405273, "global_step": 82268, "epoch": 1958} {"train_loss": -6.170557022094727, "global_step": 82269, "epoch": 1958} {"train_loss": -6.098990440368652, "global_step": 82270, "epoch": 1958} {"train_loss": -6.296584606170654, "global_step": 82271, "epoch": 1958} {"train_loss": -6.1780571937561035, "global_step": 82272, "epoch": 1958} {"train_loss": -6.188631057739258, "global_step": 82273, "epoch": 1958} {"train_loss": -6.219066619873047, "global_step": 82274, "epoch": 1958} {"train_loss": -6.196812629699707, "global_step": 82275, "epoch": 1958} {"train_loss": -6.052126884460449, "global_step": 82276, "epoch": 1958} {"train_loss": -6.175274201801845, "global_step": 82277, "epoch": 1958, "val_loss": 74872.6875} {"train_loss": -6.080434799194336, "global_step": 82278, "epoch": 1959} {"train_loss": -6.144749641418457, "global_step": 82279, "epoch": 1959} {"train_loss": -6.158471584320068, "global_step": 82280, "epoch": 1959} {"train_loss": -6.253579139709473, "global_step": 82281, "epoch": 1959} {"train_loss": -6.133175373077393, "global_step": 82282, "epoch": 1959} {"train_loss": -6.096404075622559, "global_step": 82283, "epoch": 1959} {"train_loss": -6.119917392730713, "global_step": 82284, "epoch": 1959} {"train_loss": -6.026324272155762, "global_step": 82285, "epoch": 1959} {"train_loss": -6.080053329467773, "global_step": 82286, "epoch": 1959} {"train_loss": -6.135712623596191, "global_step": 82287, "epoch": 1959} {"train_loss": -6.066774845123291, "global_step": 82288, "epoch": 1959} {"train_loss": -6.132898807525635, "global_step": 82289, "epoch": 1959} {"train_loss": -6.179296970367432, "global_step": 82290, "epoch": 1959} {"train_loss": -6.123693466186523, "global_step": 82291, "epoch": 1959} {"train_loss": -6.173137664794922, "global_step": 82292, "epoch": 1959} {"train_loss": -6.242508888244629, "global_step": 82293, "epoch": 1959} {"train_loss": -6.289587020874023, "global_step": 82294, "epoch": 1959} {"train_loss": -5.999578475952148, "global_step": 82295, "epoch": 1959} {"train_loss": -6.214507102966309, "global_step": 82296, "epoch": 1959} {"train_loss": -6.052036762237549, "global_step": 82297, "epoch": 1959} {"train_loss": -6.106407165527344, "global_step": 82298, "epoch": 1959} {"train_loss": -6.10886287689209, "global_step": 82299, "epoch": 1959} {"train_loss": -6.249495029449463, "global_step": 82300, "epoch": 1959} {"train_loss": -6.071101188659668, "global_step": 82301, "epoch": 1959} {"train_loss": -6.154264450073242, "global_step": 82302, "epoch": 1959} {"train_loss": -6.176652908325195, "global_step": 82303, "epoch": 1959} {"train_loss": -6.090860366821289, "global_step": 82304, "epoch": 1959} {"train_loss": -6.087886810302734, "global_step": 82305, "epoch": 1959} {"train_loss": -6.034873962402344, "global_step": 82306, "epoch": 1959} {"train_loss": -6.0477190017700195, "global_step": 82307, "epoch": 1959} {"train_loss": -5.900238990783691, "global_step": 82308, "epoch": 1959} {"train_loss": -6.115980625152588, "global_step": 82309, "epoch": 1959} {"train_loss": -6.057788848876953, "global_step": 82310, "epoch": 1959} {"train_loss": -5.989065170288086, "global_step": 82311, "epoch": 1959} {"train_loss": -6.086758136749268, "global_step": 82312, "epoch": 1959} {"train_loss": -6.026259899139404, "global_step": 82313, "epoch": 1959} {"train_loss": -6.091628074645996, "global_step": 82314, "epoch": 1959} {"train_loss": -6.056498050689697, "global_step": 82315, "epoch": 1959} {"train_loss": -6.123466491699219, "global_step": 82316, "epoch": 1959} {"train_loss": -5.958861827850342, "global_step": 82317, "epoch": 1959} {"train_loss": -6.135601043701172, "global_step": 82318, "epoch": 1959} {"train_loss": -6.1086426348913285, "global_step": 82319, "epoch": 1959, "val_loss": 74792.8828125} {"train_loss": -6.0591630935668945, "global_step": 82320, "epoch": 1960} {"train_loss": -6.064417839050293, "global_step": 82321, "epoch": 1960} {"train_loss": -6.063152313232422, "global_step": 82322, "epoch": 1960} {"train_loss": -5.997602939605713, "global_step": 82323, "epoch": 1960} {"train_loss": -6.104524612426758, "global_step": 82324, "epoch": 1960} {"train_loss": -6.133564472198486, "global_step": 82325, "epoch": 1960} {"train_loss": -5.9913530349731445, "global_step": 82326, "epoch": 1960} {"train_loss": -6.159414291381836, "global_step": 82327, "epoch": 1960} {"train_loss": -6.05112361907959, "global_step": 82328, "epoch": 1960} {"train_loss": -6.087578773498535, "global_step": 82329, "epoch": 1960} {"train_loss": -6.117066383361816, "global_step": 82330, "epoch": 1960} {"train_loss": -6.175535202026367, "global_step": 82331, "epoch": 1960} {"train_loss": -6.1863508224487305, "global_step": 82332, "epoch": 1960} {"train_loss": -6.114239692687988, "global_step": 82333, "epoch": 1960} {"train_loss": -6.186028480529785, "global_step": 82334, "epoch": 1960} {"train_loss": -6.0802001953125, "global_step": 82335, "epoch": 1960} {"train_loss": -6.139047622680664, "global_step": 82336, "epoch": 1960} {"train_loss": -6.114243984222412, "global_step": 82337, "epoch": 1960} {"train_loss": -6.142991542816162, "global_step": 82338, "epoch": 1960} {"train_loss": -6.27537727355957, "global_step": 82339, "epoch": 1960} {"train_loss": -6.094471454620361, "global_step": 82340, "epoch": 1960} {"train_loss": -6.099761962890625, "global_step": 82341, "epoch": 1960} {"train_loss": -6.236505031585693, "global_step": 82342, "epoch": 1960} {"train_loss": -6.170753002166748, "global_step": 82343, "epoch": 1960} {"train_loss": -6.1230010986328125, "global_step": 82344, "epoch": 1960} {"train_loss": -6.142878532409668, "global_step": 82345, "epoch": 1960} {"train_loss": -6.111321449279785, "global_step": 82346, "epoch": 1960} {"train_loss": -6.255537509918213, "global_step": 82347, "epoch": 1960} {"train_loss": -6.218860149383545, "global_step": 82348, "epoch": 1960} {"train_loss": -6.071880340576172, "global_step": 82349, "epoch": 1960} {"train_loss": -6.057289123535156, "global_step": 82350, "epoch": 1960} {"train_loss": -6.200642108917236, "global_step": 82351, "epoch": 1960} {"train_loss": -6.216399192810059, "global_step": 82352, "epoch": 1960} {"train_loss": -6.086143493652344, "global_step": 82353, "epoch": 1960} {"train_loss": -6.156866073608398, "global_step": 82354, "epoch": 1960} {"train_loss": -6.138127326965332, "global_step": 82355, "epoch": 1960} {"train_loss": -6.066672325134277, "global_step": 82356, "epoch": 1960} {"train_loss": -6.146506309509277, "global_step": 82357, "epoch": 1960} {"train_loss": -6.1141676902771, "global_step": 82358, "epoch": 1960} {"train_loss": -6.312738418579102, "global_step": 82359, "epoch": 1960} {"train_loss": -6.099318504333496, "global_step": 82360, "epoch": 1960} {"train_loss": -6.130961157026745, "global_step": 82361, "epoch": 1960, "val_loss": 74823.28125} {"train_loss": -6.121742248535156, "global_step": 82362, "epoch": 1961} {"train_loss": -6.112387657165527, "global_step": 82363, "epoch": 1961} {"train_loss": -6.115118026733398, "global_step": 82364, "epoch": 1961} {"train_loss": -6.229544639587402, "global_step": 82365, "epoch": 1961} {"train_loss": -6.075340270996094, "global_step": 82366, "epoch": 1961} {"train_loss": -6.1719770431518555, "global_step": 82367, "epoch": 1961} {"train_loss": -6.234057426452637, "global_step": 82368, "epoch": 1961} {"train_loss": -6.253753185272217, "global_step": 82369, "epoch": 1961} {"train_loss": -6.2790656089782715, "global_step": 82370, "epoch": 1961} {"train_loss": -6.256739616394043, "global_step": 82371, "epoch": 1961} {"train_loss": -6.129644393920898, "global_step": 82372, "epoch": 1961} {"train_loss": -6.319436073303223, "global_step": 82373, "epoch": 1961} {"train_loss": -6.228621482849121, "global_step": 82374, "epoch": 1961} {"train_loss": -6.063060760498047, "global_step": 82375, "epoch": 1961} {"train_loss": -6.205460548400879, "global_step": 82376, "epoch": 1961} {"train_loss": -6.204671382904053, "global_step": 82377, "epoch": 1961} {"train_loss": -6.258444786071777, "global_step": 82378, "epoch": 1961} {"train_loss": -6.026161193847656, "global_step": 82379, "epoch": 1961} {"train_loss": -6.197364807128906, "global_step": 82380, "epoch": 1961} {"train_loss": -6.077924728393555, "global_step": 82381, "epoch": 1961} {"train_loss": -6.102067947387695, "global_step": 82382, "epoch": 1961} {"train_loss": -6.170391082763672, "global_step": 82383, "epoch": 1961} {"train_loss": -6.183137893676758, "global_step": 82384, "epoch": 1961} {"train_loss": -6.148940086364746, "global_step": 82385, "epoch": 1961} {"train_loss": -6.121025562286377, "global_step": 82386, "epoch": 1961} {"train_loss": -6.128000736236572, "global_step": 82387, "epoch": 1961} {"train_loss": -6.283017158508301, "global_step": 82388, "epoch": 1961} {"train_loss": -6.237933158874512, "global_step": 82389, "epoch": 1961} {"train_loss": -6.1394243240356445, "global_step": 82390, "epoch": 1961} {"train_loss": -6.188061714172363, "global_step": 82391, "epoch": 1961} {"train_loss": -6.1801371574401855, "global_step": 82392, "epoch": 1961} {"train_loss": -6.1029510498046875, "global_step": 82393, "epoch": 1961} {"train_loss": -6.22398567199707, "global_step": 82394, "epoch": 1961} {"train_loss": -6.166075706481934, "global_step": 82395, "epoch": 1961} {"train_loss": -6.214136123657227, "global_step": 82396, "epoch": 1961} {"train_loss": -6.06432580947876, "global_step": 82397, "epoch": 1961} {"train_loss": -6.111712455749512, "global_step": 82398, "epoch": 1961} {"train_loss": -6.19428825378418, "global_step": 82399, "epoch": 1961} {"train_loss": -6.118138313293457, "global_step": 82400, "epoch": 1961} {"train_loss": -6.161678314208984, "global_step": 82401, "epoch": 1961} {"train_loss": -6.141420841217041, "global_step": 82402, "epoch": 1961} {"train_loss": -6.170082035518828, "global_step": 82403, "epoch": 1961, "val_loss": 74963.53125} {"train_loss": -6.3200364112854, "global_step": 82404, "epoch": 1962} {"train_loss": -6.152956962585449, "global_step": 82405, "epoch": 1962} {"train_loss": -6.269432544708252, "global_step": 82406, "epoch": 1962} {"train_loss": -6.082799434661865, "global_step": 82407, "epoch": 1962} {"train_loss": -6.220394134521484, "global_step": 82408, "epoch": 1962} {"train_loss": -6.20451545715332, "global_step": 82409, "epoch": 1962} {"train_loss": -6.237401962280273, "global_step": 82410, "epoch": 1962} {"train_loss": -6.237465858459473, "global_step": 82411, "epoch": 1962} {"train_loss": -6.201295852661133, "global_step": 82412, "epoch": 1962} {"train_loss": -6.119117736816406, "global_step": 82413, "epoch": 1962} {"train_loss": -6.265105724334717, "global_step": 82414, "epoch": 1962} {"train_loss": -6.163045406341553, "global_step": 82415, "epoch": 1962} {"train_loss": -6.197085380554199, "global_step": 82416, "epoch": 1962} {"train_loss": -6.183736801147461, "global_step": 82417, "epoch": 1962} {"train_loss": -6.213335037231445, "global_step": 82418, "epoch": 1962} {"train_loss": -6.152386665344238, "global_step": 82419, "epoch": 1962} {"train_loss": -6.177127838134766, "global_step": 82420, "epoch": 1962} {"train_loss": -6.161488056182861, "global_step": 82421, "epoch": 1962} {"train_loss": -6.148601055145264, "global_step": 82422, "epoch": 1962} {"train_loss": -6.175476551055908, "global_step": 82423, "epoch": 1962} {"train_loss": -6.102258682250977, "global_step": 82424, "epoch": 1962} {"train_loss": -6.1619791984558105, "global_step": 82425, "epoch": 1962} {"train_loss": -6.248905181884766, "global_step": 82426, "epoch": 1962} {"train_loss": -6.232778072357178, "global_step": 82427, "epoch": 1962} {"train_loss": -6.183903694152832, "global_step": 82428, "epoch": 1962} {"train_loss": -6.0852251052856445, "global_step": 82429, "epoch": 1962} {"train_loss": -6.18147087097168, "global_step": 82430, "epoch": 1962} {"train_loss": -6.219247817993164, "global_step": 82431, "epoch": 1962} {"train_loss": -6.28807258605957, "global_step": 82432, "epoch": 1962} {"train_loss": -6.18829345703125, "global_step": 82433, "epoch": 1962} {"train_loss": -6.159242630004883, "global_step": 82434, "epoch": 1962} {"train_loss": -6.183376312255859, "global_step": 82435, "epoch": 1962} {"train_loss": -6.146407127380371, "global_step": 82436, "epoch": 1962} {"train_loss": -6.190884590148926, "global_step": 82437, "epoch": 1962} {"train_loss": -6.193293571472168, "global_step": 82438, "epoch": 1962} {"train_loss": -6.168045997619629, "global_step": 82439, "epoch": 1962} {"train_loss": -6.114765167236328, "global_step": 82440, "epoch": 1962} {"train_loss": -6.122643947601318, "global_step": 82441, "epoch": 1962} {"train_loss": -6.219818115234375, "global_step": 82442, "epoch": 1962} {"train_loss": -6.236908435821533, "global_step": 82443, "epoch": 1962} {"train_loss": -6.1453423500061035, "global_step": 82444, "epoch": 1962} {"train_loss": -6.1858647891453336, "global_step": 82445, "epoch": 1962, "val_loss": 74921.4609375} {"train_loss": -6.202515602111816, "global_step": 82446, "epoch": 1963} {"train_loss": -6.192809104919434, "global_step": 82447, "epoch": 1963} {"train_loss": -6.212194442749023, "global_step": 82448, "epoch": 1963} {"train_loss": -6.167913913726807, "global_step": 82449, "epoch": 1963} {"train_loss": -6.221680641174316, "global_step": 82450, "epoch": 1963} {"train_loss": -6.152701377868652, "global_step": 82451, "epoch": 1963} {"train_loss": -6.07474422454834, "global_step": 82452, "epoch": 1963} {"train_loss": -6.019957065582275, "global_step": 82453, "epoch": 1963} {"train_loss": -6.306095600128174, "global_step": 82454, "epoch": 1963} {"train_loss": -6.163236141204834, "global_step": 82455, "epoch": 1963} {"train_loss": -6.2196478843688965, "global_step": 82456, "epoch": 1963} {"train_loss": -6.0635881423950195, "global_step": 82457, "epoch": 1963} {"train_loss": -6.086932182312012, "global_step": 82458, "epoch": 1963} {"train_loss": -6.223172187805176, "global_step": 82459, "epoch": 1963} {"train_loss": -6.036807060241699, "global_step": 82460, "epoch": 1963} {"train_loss": -6.100587844848633, "global_step": 82461, "epoch": 1963} {"train_loss": -6.161133766174316, "global_step": 82462, "epoch": 1963} {"train_loss": -6.077954292297363, "global_step": 82463, "epoch": 1963} {"train_loss": -6.113160133361816, "global_step": 82464, "epoch": 1963} {"train_loss": -5.962745666503906, "global_step": 82465, "epoch": 1963} {"train_loss": -6.099123954772949, "global_step": 82466, "epoch": 1963} {"train_loss": -6.223847389221191, "global_step": 82467, "epoch": 1963} {"train_loss": -5.994531631469727, "global_step": 82468, "epoch": 1963} {"train_loss": -6.389314651489258, "global_step": 82469, "epoch": 1963} {"train_loss": -6.094304084777832, "global_step": 82470, "epoch": 1963} {"train_loss": -6.074265480041504, "global_step": 82471, "epoch": 1963} {"train_loss": -6.153809547424316, "global_step": 82472, "epoch": 1963} {"train_loss": -6.136051177978516, "global_step": 82473, "epoch": 1963} {"train_loss": -6.141704082489014, "global_step": 82474, "epoch": 1963} {"train_loss": -6.124316215515137, "global_step": 82475, "epoch": 1963} {"train_loss": -6.125889778137207, "global_step": 82476, "epoch": 1963} {"train_loss": -6.200986862182617, "global_step": 82477, "epoch": 1963} {"train_loss": -6.16085958480835, "global_step": 82478, "epoch": 1963} {"train_loss": -6.151679992675781, "global_step": 82479, "epoch": 1963} {"train_loss": -6.0823869705200195, "global_step": 82480, "epoch": 1963} {"train_loss": -6.090509414672852, "global_step": 82481, "epoch": 1963} {"train_loss": -6.195826530456543, "global_step": 82482, "epoch": 1963} {"train_loss": -6.088674545288086, "global_step": 82483, "epoch": 1963} {"train_loss": -6.117692947387695, "global_step": 82484, "epoch": 1963} {"train_loss": -6.079115867614746, "global_step": 82485, "epoch": 1963} {"train_loss": -6.152225494384766, "global_step": 82486, "epoch": 1963} {"train_loss": -6.137656745456514, "global_step": 82487, "epoch": 1963, "val_loss": 75012.9921875} {"train_loss": -6.184194087982178, "global_step": 82488, "epoch": 1964} {"train_loss": -6.106327056884766, "global_step": 82489, "epoch": 1964} {"train_loss": -6.236620903015137, "global_step": 82490, "epoch": 1964} {"train_loss": -6.205498695373535, "global_step": 82491, "epoch": 1964} {"train_loss": -6.07431697845459, "global_step": 82492, "epoch": 1964} {"train_loss": -6.218106269836426, "global_step": 82493, "epoch": 1964} {"train_loss": -6.074982643127441, "global_step": 82494, "epoch": 1964} {"train_loss": -6.222814083099365, "global_step": 82495, "epoch": 1964} {"train_loss": -6.174932956695557, "global_step": 82496, "epoch": 1964} {"train_loss": -6.228298187255859, "global_step": 82497, "epoch": 1964} {"train_loss": -6.114794731140137, "global_step": 82498, "epoch": 1964} {"train_loss": -6.207061767578125, "global_step": 82499, "epoch": 1964} {"train_loss": -6.114982604980469, "global_step": 82500, "epoch": 1964} {"train_loss": -6.042683124542236, "global_step": 82501, "epoch": 1964} {"train_loss": -6.10477352142334, "global_step": 82502, "epoch": 1964} {"train_loss": -6.16396427154541, "global_step": 82503, "epoch": 1964} {"train_loss": -6.129655838012695, "global_step": 82504, "epoch": 1964} {"train_loss": -6.255133152008057, "global_step": 82505, "epoch": 1964} {"train_loss": -6.08349609375, "global_step": 82506, "epoch": 1964} {"train_loss": -6.2382307052612305, "global_step": 82507, "epoch": 1964} {"train_loss": -6.04550838470459, "global_step": 82508, "epoch": 1964} {"train_loss": -6.126676559448242, "global_step": 82509, "epoch": 1964} {"train_loss": -6.06815242767334, "global_step": 82510, "epoch": 1964} {"train_loss": -6.060191631317139, "global_step": 82511, "epoch": 1964} {"train_loss": -6.183930397033691, "global_step": 82512, "epoch": 1964} {"train_loss": -6.206665992736816, "global_step": 82513, "epoch": 1964} {"train_loss": -6.209340572357178, "global_step": 82514, "epoch": 1964} {"train_loss": -6.05121374130249, "global_step": 82515, "epoch": 1964} {"train_loss": -6.185218811035156, "global_step": 82516, "epoch": 1964} {"train_loss": -6.06116247177124, "global_step": 82517, "epoch": 1964} {"train_loss": -6.175835609436035, "global_step": 82518, "epoch": 1964} {"train_loss": -6.124419212341309, "global_step": 82519, "epoch": 1964} {"train_loss": -6.182658672332764, "global_step": 82520, "epoch": 1964} {"train_loss": -6.158174514770508, "global_step": 82521, "epoch": 1964} {"train_loss": -6.117188930511475, "global_step": 82522, "epoch": 1964} {"train_loss": -6.110385417938232, "global_step": 82523, "epoch": 1964} {"train_loss": -6.127838134765625, "global_step": 82524, "epoch": 1964} {"train_loss": -6.122112274169922, "global_step": 82525, "epoch": 1964} {"train_loss": -6.122900485992432, "global_step": 82526, "epoch": 1964} {"train_loss": -6.122513771057129, "global_step": 82527, "epoch": 1964} {"train_loss": -6.195926189422607, "global_step": 82528, "epoch": 1964} {"train_loss": -6.145253033865066, "global_step": 82529, "epoch": 1964, "val_loss": 75349.8671875} {"train_loss": -6.151987075805664, "global_step": 82530, "epoch": 1965} {"train_loss": -6.198952674865723, "global_step": 82531, "epoch": 1965} {"train_loss": -6.16085147857666, "global_step": 82532, "epoch": 1965} {"train_loss": -6.059678077697754, "global_step": 82533, "epoch": 1965} {"train_loss": -6.217072486877441, "global_step": 82534, "epoch": 1965} {"train_loss": -6.1635589599609375, "global_step": 82535, "epoch": 1965} {"train_loss": -6.024129867553711, "global_step": 82536, "epoch": 1965} {"train_loss": -6.062110900878906, "global_step": 82537, "epoch": 1965} {"train_loss": -6.11706018447876, "global_step": 82538, "epoch": 1965} {"train_loss": -6.1295390129089355, "global_step": 82539, "epoch": 1965} {"train_loss": -5.963354110717773, "global_step": 82540, "epoch": 1965} {"train_loss": -6.150080680847168, "global_step": 82541, "epoch": 1965} {"train_loss": -6.0981125831604, "global_step": 82542, "epoch": 1965} {"train_loss": -6.025591850280762, "global_step": 82543, "epoch": 1965} {"train_loss": -6.1626434326171875, "global_step": 82544, "epoch": 1965} {"train_loss": -6.05607795715332, "global_step": 82545, "epoch": 1965} {"train_loss": -6.077043056488037, "global_step": 82546, "epoch": 1965} {"train_loss": -6.158535957336426, "global_step": 82547, "epoch": 1965} {"train_loss": -6.01079797744751, "global_step": 82548, "epoch": 1965} {"train_loss": -6.151561260223389, "global_step": 82549, "epoch": 1965} {"train_loss": -6.344785690307617, "global_step": 82550, "epoch": 1965} {"train_loss": -6.003665924072266, "global_step": 82551, "epoch": 1965} {"train_loss": -6.228985786437988, "global_step": 82552, "epoch": 1965} {"train_loss": -6.146899223327637, "global_step": 82553, "epoch": 1965} {"train_loss": -6.106122016906738, "global_step": 82554, "epoch": 1965} {"train_loss": -6.235077857971191, "global_step": 82555, "epoch": 1965} {"train_loss": -6.137423515319824, "global_step": 82556, "epoch": 1965} {"train_loss": -6.153590679168701, "global_step": 82557, "epoch": 1965} {"train_loss": -6.0921735763549805, "global_step": 82558, "epoch": 1965} {"train_loss": -6.177845001220703, "global_step": 82559, "epoch": 1965} {"train_loss": -6.189580917358398, "global_step": 82560, "epoch": 1965} {"train_loss": -6.079582214355469, "global_step": 82561, "epoch": 1965} {"train_loss": -6.24384880065918, "global_step": 82562, "epoch": 1965} {"train_loss": -6.237680435180664, "global_step": 82563, "epoch": 1965} {"train_loss": -6.20943021774292, "global_step": 82564, "epoch": 1965} {"train_loss": -6.071385383605957, "global_step": 82565, "epoch": 1965} {"train_loss": -6.164322853088379, "global_step": 82566, "epoch": 1965} {"train_loss": -6.200308799743652, "global_step": 82567, "epoch": 1965} {"train_loss": -6.238371849060059, "global_step": 82568, "epoch": 1965} {"train_loss": -6.264450550079346, "global_step": 82569, "epoch": 1965} {"train_loss": -6.284454822540283, "global_step": 82570, "epoch": 1965} {"train_loss": -6.145319132577805, "global_step": 82571, "epoch": 1965, "val_loss": 75207.578125} {"train_loss": -6.175849914550781, "global_step": 82572, "epoch": 1966} {"train_loss": -6.170995712280273, "global_step": 82573, "epoch": 1966} {"train_loss": -6.155660629272461, "global_step": 82574, "epoch": 1966} {"train_loss": -6.170743465423584, "global_step": 82575, "epoch": 1966} {"train_loss": -6.171348571777344, "global_step": 82576, "epoch": 1966} {"train_loss": -6.180347442626953, "global_step": 82577, "epoch": 1966} {"train_loss": -6.116888046264648, "global_step": 82578, "epoch": 1966} {"train_loss": -6.093968391418457, "global_step": 82579, "epoch": 1966} {"train_loss": -6.212547779083252, "global_step": 82580, "epoch": 1966} {"train_loss": -6.154974937438965, "global_step": 82581, "epoch": 1966} {"train_loss": -6.227594375610352, "global_step": 82582, "epoch": 1966} {"train_loss": -6.193474292755127, "global_step": 82583, "epoch": 1966} {"train_loss": -6.282824516296387, "global_step": 82584, "epoch": 1966} {"train_loss": -6.087066173553467, "global_step": 82585, "epoch": 1966} {"train_loss": -6.299633979797363, "global_step": 82586, "epoch": 1966} {"train_loss": -6.218292236328125, "global_step": 82587, "epoch": 1966} {"train_loss": -6.151700496673584, "global_step": 82588, "epoch": 1966} {"train_loss": -6.0745954513549805, "global_step": 82589, "epoch": 1966} {"train_loss": -6.1763458251953125, "global_step": 82590, "epoch": 1966} {"train_loss": -6.355706214904785, "global_step": 82591, "epoch": 1966} {"train_loss": -6.054984092712402, "global_step": 82592, "epoch": 1966} {"train_loss": -6.1087799072265625, "global_step": 82593, "epoch": 1966} {"train_loss": -6.143037796020508, "global_step": 82594, "epoch": 1966} {"train_loss": -6.297329902648926, "global_step": 82595, "epoch": 1966} {"train_loss": -6.148833274841309, "global_step": 82596, "epoch": 1966} {"train_loss": -6.099281311035156, "global_step": 82597, "epoch": 1966} {"train_loss": -6.114782333374023, "global_step": 82598, "epoch": 1966} {"train_loss": -6.165191650390625, "global_step": 82599, "epoch": 1966} {"train_loss": -6.185962677001953, "global_step": 82600, "epoch": 1966} {"train_loss": -6.063562393188477, "global_step": 82601, "epoch": 1966} {"train_loss": -6.192634582519531, "global_step": 82602, "epoch": 1966} {"train_loss": -6.009310245513916, "global_step": 82603, "epoch": 1966} {"train_loss": -5.993765830993652, "global_step": 82604, "epoch": 1966} {"train_loss": -6.114714622497559, "global_step": 82605, "epoch": 1966} {"train_loss": -6.152454376220703, "global_step": 82606, "epoch": 1966} {"train_loss": -6.053167343139648, "global_step": 82607, "epoch": 1966} {"train_loss": -6.143687725067139, "global_step": 82608, "epoch": 1966} {"train_loss": -6.122064590454102, "global_step": 82609, "epoch": 1966} {"train_loss": -6.0692243576049805, "global_step": 82610, "epoch": 1966} {"train_loss": -6.120062828063965, "global_step": 82611, "epoch": 1966} {"train_loss": -6.099198818206787, "global_step": 82612, "epoch": 1966} {"train_loss": -6.150199594951811, "global_step": 82613, "epoch": 1966, "val_loss": 75311.328125} {"train_loss": -6.193225860595703, "global_step": 82614, "epoch": 1967} {"train_loss": -6.1430253982543945, "global_step": 82615, "epoch": 1967} {"train_loss": -6.060059547424316, "global_step": 82616, "epoch": 1967} {"train_loss": -6.028934478759766, "global_step": 82617, "epoch": 1967} {"train_loss": -6.002945423126221, "global_step": 82618, "epoch": 1967} {"train_loss": -6.152651309967041, "global_step": 82619, "epoch": 1967} {"train_loss": -6.046541213989258, "global_step": 82620, "epoch": 1967} {"train_loss": -6.061678886413574, "global_step": 82621, "epoch": 1967} {"train_loss": -6.199999809265137, "global_step": 82622, "epoch": 1967} {"train_loss": -6.204410552978516, "global_step": 82623, "epoch": 1967} {"train_loss": -6.151558876037598, "global_step": 82624, "epoch": 1967} {"train_loss": -6.179443359375, "global_step": 82625, "epoch": 1967} {"train_loss": -6.151856899261475, "global_step": 82626, "epoch": 1967} {"train_loss": -6.058404922485352, "global_step": 82627, "epoch": 1967} {"train_loss": -6.193840026855469, "global_step": 82628, "epoch": 1967} {"train_loss": -6.18021297454834, "global_step": 82629, "epoch": 1967} {"train_loss": -6.209845542907715, "global_step": 82630, "epoch": 1967} {"train_loss": -6.068115234375, "global_step": 82631, "epoch": 1967} {"train_loss": -6.188937187194824, "global_step": 82632, "epoch": 1967} {"train_loss": -6.060817718505859, "global_step": 82633, "epoch": 1967} {"train_loss": -6.127137184143066, "global_step": 82634, "epoch": 1967} {"train_loss": -6.09588623046875, "global_step": 82635, "epoch": 1967} {"train_loss": -6.097652435302734, "global_step": 82636, "epoch": 1967} {"train_loss": -6.141149044036865, "global_step": 82637, "epoch": 1967} {"train_loss": -6.147619247436523, "global_step": 82638, "epoch": 1967} {"train_loss": -6.166960716247559, "global_step": 82639, "epoch": 1967} {"train_loss": -6.077555179595947, "global_step": 82640, "epoch": 1967} {"train_loss": -6.149542808532715, "global_step": 82641, "epoch": 1967} {"train_loss": -6.245084762573242, "global_step": 82642, "epoch": 1967} {"train_loss": -6.211666107177734, "global_step": 82643, "epoch": 1967} {"train_loss": -6.09827995300293, "global_step": 82644, "epoch": 1967} {"train_loss": -6.025383949279785, "global_step": 82645, "epoch": 1967} {"train_loss": -6.042016506195068, "global_step": 82646, "epoch": 1967} {"train_loss": -6.088052749633789, "global_step": 82647, "epoch": 1967} {"train_loss": -6.136887550354004, "global_step": 82648, "epoch": 1967} {"train_loss": -6.086660385131836, "global_step": 82649, "epoch": 1967} {"train_loss": -6.165555000305176, "global_step": 82650, "epoch": 1967} {"train_loss": -6.159811019897461, "global_step": 82651, "epoch": 1967} {"train_loss": -6.206151962280273, "global_step": 82652, "epoch": 1967} {"train_loss": -6.108678817749023, "global_step": 82653, "epoch": 1967} {"train_loss": -6.069256782531738, "global_step": 82654, "epoch": 1967} {"train_loss": -6.1270786580585295, "global_step": 82655, "epoch": 1967, "val_loss": 74918.5} {"train_loss": -6.205853462219238, "global_step": 82656, "epoch": 1968} {"train_loss": -6.0794782638549805, "global_step": 82657, "epoch": 1968} {"train_loss": -6.3132219314575195, "global_step": 82658, "epoch": 1968} {"train_loss": -6.088680267333984, "global_step": 82659, "epoch": 1968} {"train_loss": -6.103839874267578, "global_step": 82660, "epoch": 1968} {"train_loss": -6.151506423950195, "global_step": 82661, "epoch": 1968} {"train_loss": -6.057518482208252, "global_step": 82662, "epoch": 1968} {"train_loss": -6.162712097167969, "global_step": 82663, "epoch": 1968} {"train_loss": -6.1648945808410645, "global_step": 82664, "epoch": 1968} {"train_loss": -6.314605712890625, "global_step": 82665, "epoch": 1968} {"train_loss": -6.056941032409668, "global_step": 82666, "epoch": 1968} {"train_loss": -6.078681945800781, "global_step": 82667, "epoch": 1968} {"train_loss": -6.0659332275390625, "global_step": 82668, "epoch": 1968} {"train_loss": -6.022022724151611, "global_step": 82669, "epoch": 1968} {"train_loss": -6.095168590545654, "global_step": 82670, "epoch": 1968} {"train_loss": -5.8633904457092285, "global_step": 82671, "epoch": 1968} {"train_loss": -5.995782852172852, "global_step": 82672, "epoch": 1968} {"train_loss": -5.999868392944336, "global_step": 82673, "epoch": 1968} {"train_loss": -6.006823539733887, "global_step": 82674, "epoch": 1968} {"train_loss": -6.105961799621582, "global_step": 82675, "epoch": 1968} {"train_loss": -6.08559513092041, "global_step": 82676, "epoch": 1968} {"train_loss": -6.160772323608398, "global_step": 82677, "epoch": 1968} {"train_loss": -6.177403926849365, "global_step": 82678, "epoch": 1968} {"train_loss": -6.249128341674805, "global_step": 82679, "epoch": 1968} {"train_loss": -5.971467971801758, "global_step": 82680, "epoch": 1968} {"train_loss": -6.0679521560668945, "global_step": 82681, "epoch": 1968} {"train_loss": -6.132729530334473, "global_step": 82682, "epoch": 1968} {"train_loss": -6.0317792892456055, "global_step": 82683, "epoch": 1968} {"train_loss": -6.075679302215576, "global_step": 82684, "epoch": 1968} {"train_loss": -6.029996871948242, "global_step": 82685, "epoch": 1968} {"train_loss": -6.098836898803711, "global_step": 82686, "epoch": 1968} {"train_loss": -6.030771255493164, "global_step": 82687, "epoch": 1968} {"train_loss": -6.146473407745361, "global_step": 82688, "epoch": 1968} {"train_loss": -6.034361839294434, "global_step": 82689, "epoch": 1968} {"train_loss": -6.231634616851807, "global_step": 82690, "epoch": 1968} {"train_loss": -6.103045463562012, "global_step": 82691, "epoch": 1968} {"train_loss": -6.1525468826293945, "global_step": 82692, "epoch": 1968} {"train_loss": -6.133079528808594, "global_step": 82693, "epoch": 1968} {"train_loss": -6.17007303237915, "global_step": 82694, "epoch": 1968} {"train_loss": -6.248412132263184, "global_step": 82695, "epoch": 1968} {"train_loss": -6.1847124099731445, "global_step": 82696, "epoch": 1968} {"train_loss": -6.11098803792681, "global_step": 82697, "epoch": 1968, "val_loss": 74810.828125} {"train_loss": -6.1640801429748535, "global_step": 82698, "epoch": 1969} {"train_loss": -6.099390506744385, "global_step": 82699, "epoch": 1969} {"train_loss": -6.112051963806152, "global_step": 82700, "epoch": 1969} {"train_loss": -6.242537498474121, "global_step": 82701, "epoch": 1969} {"train_loss": -6.1506733894348145, "global_step": 82702, "epoch": 1969} {"train_loss": -6.031963348388672, "global_step": 82703, "epoch": 1969} {"train_loss": -6.1561408042907715, "global_step": 82704, "epoch": 1969} {"train_loss": -6.073321342468262, "global_step": 82705, "epoch": 1969} {"train_loss": -6.220877647399902, "global_step": 82706, "epoch": 1969} {"train_loss": -6.221211910247803, "global_step": 82707, "epoch": 1969} {"train_loss": -6.299426555633545, "global_step": 82708, "epoch": 1969} {"train_loss": -6.23673152923584, "global_step": 82709, "epoch": 1969} {"train_loss": -6.190404891967773, "global_step": 82710, "epoch": 1969} {"train_loss": -6.200717926025391, "global_step": 82711, "epoch": 1969} {"train_loss": -6.264091491699219, "global_step": 82712, "epoch": 1969} {"train_loss": -6.285475730895996, "global_step": 82713, "epoch": 1969} {"train_loss": -6.232174873352051, "global_step": 82714, "epoch": 1969} {"train_loss": -6.220582962036133, "global_step": 82715, "epoch": 1969} {"train_loss": -6.193906307220459, "global_step": 82716, "epoch": 1969} {"train_loss": -6.220333099365234, "global_step": 82717, "epoch": 1969} {"train_loss": -6.143359184265137, "global_step": 82718, "epoch": 1969} {"train_loss": -6.175341606140137, "global_step": 82719, "epoch": 1969} {"train_loss": -6.227415561676025, "global_step": 82720, "epoch": 1969} {"train_loss": -6.261936187744141, "global_step": 82721, "epoch": 1969} {"train_loss": -6.114882946014404, "global_step": 82722, "epoch": 1969} {"train_loss": -6.065876007080078, "global_step": 82723, "epoch": 1969} {"train_loss": -6.212658882141113, "global_step": 82724, "epoch": 1969} {"train_loss": -6.31908655166626, "global_step": 82725, "epoch": 1969} {"train_loss": -6.143904685974121, "global_step": 82726, "epoch": 1969} {"train_loss": -6.12177848815918, "global_step": 82727, "epoch": 1969} {"train_loss": -6.277491092681885, "global_step": 82728, "epoch": 1969} {"train_loss": -6.2152419090271, "global_step": 82729, "epoch": 1969} {"train_loss": -6.261804580688477, "global_step": 82730, "epoch": 1969} {"train_loss": -6.257234573364258, "global_step": 82731, "epoch": 1969} {"train_loss": -6.136880874633789, "global_step": 82732, "epoch": 1969} {"train_loss": -6.1833038330078125, "global_step": 82733, "epoch": 1969} {"train_loss": -6.220499515533447, "global_step": 82734, "epoch": 1969} {"train_loss": -6.151298999786377, "global_step": 82735, "epoch": 1969} {"train_loss": -6.215965270996094, "global_step": 82736, "epoch": 1969} {"train_loss": -6.222318649291992, "global_step": 82737, "epoch": 1969} {"train_loss": -6.070819854736328, "global_step": 82738, "epoch": 1969} {"train_loss": -6.191993577139718, "global_step": 82739, "epoch": 1969, "val_loss": 75005.2109375} {"train_loss": -6.2513298988342285, "global_step": 82740, "epoch": 1970} {"train_loss": -6.293267250061035, "global_step": 82741, "epoch": 1970} {"train_loss": -6.133275032043457, "global_step": 82742, "epoch": 1970} {"train_loss": -6.297204971313477, "global_step": 82743, "epoch": 1970} {"train_loss": -6.26669454574585, "global_step": 82744, "epoch": 1970} {"train_loss": -6.261081695556641, "global_step": 82745, "epoch": 1970} {"train_loss": -6.276390075683594, "global_step": 82746, "epoch": 1970} {"train_loss": -6.042859077453613, "global_step": 82747, "epoch": 1970} {"train_loss": -6.265839576721191, "global_step": 82748, "epoch": 1970} {"train_loss": -6.200416564941406, "global_step": 82749, "epoch": 1970} {"train_loss": -6.172066688537598, "global_step": 82750, "epoch": 1970} {"train_loss": -6.147178649902344, "global_step": 82751, "epoch": 1970} {"train_loss": -6.253720283508301, "global_step": 82752, "epoch": 1970} {"train_loss": -6.210292339324951, "global_step": 82753, "epoch": 1970} {"train_loss": -6.2575883865356445, "global_step": 82754, "epoch": 1970} {"train_loss": -6.201727867126465, "global_step": 82755, "epoch": 1970} {"train_loss": -6.0875139236450195, "global_step": 82756, "epoch": 1970} {"train_loss": -6.31899356842041, "global_step": 82757, "epoch": 1970} {"train_loss": -6.211574554443359, "global_step": 82758, "epoch": 1970} {"train_loss": -6.365830421447754, "global_step": 82759, "epoch": 1970} {"train_loss": -6.165874481201172, "global_step": 82760, "epoch": 1970} {"train_loss": -6.295592308044434, "global_step": 82761, "epoch": 1970} {"train_loss": -6.158562660217285, "global_step": 82762, "epoch": 1970} {"train_loss": -6.209123611450195, "global_step": 82763, "epoch": 1970} {"train_loss": -6.088171005249023, "global_step": 82764, "epoch": 1970} {"train_loss": -6.152325630187988, "global_step": 82765, "epoch": 1970} {"train_loss": -6.193840026855469, "global_step": 82766, "epoch": 1970} {"train_loss": -6.244179725646973, "global_step": 82767, "epoch": 1970} {"train_loss": -6.162413597106934, "global_step": 82768, "epoch": 1970} {"train_loss": -6.157434940338135, "global_step": 82769, "epoch": 1970} {"train_loss": -6.162923812866211, "global_step": 82770, "epoch": 1970} {"train_loss": -6.208380222320557, "global_step": 82771, "epoch": 1970} {"train_loss": -6.167965412139893, "global_step": 82772, "epoch": 1970} {"train_loss": -6.148465156555176, "global_step": 82773, "epoch": 1970} {"train_loss": -6.232712745666504, "global_step": 82774, "epoch": 1970} {"train_loss": -6.264494895935059, "global_step": 82775, "epoch": 1970} {"train_loss": -6.180419921875, "global_step": 82776, "epoch": 1970} {"train_loss": -6.222268104553223, "global_step": 82777, "epoch": 1970} {"train_loss": -6.201149940490723, "global_step": 82778, "epoch": 1970} {"train_loss": -6.1109395027160645, "global_step": 82779, "epoch": 1970} {"train_loss": -6.078689098358154, "global_step": 82780, "epoch": 1970} {"train_loss": -6.20223365511213, "global_step": 82781, "epoch": 1970, "val_loss": 75224.8515625} {"train_loss": -6.1790571212768555, "global_step": 82782, "epoch": 1971} {"train_loss": -6.224915981292725, "global_step": 82783, "epoch": 1971} {"train_loss": -6.271792411804199, "global_step": 82784, "epoch": 1971} {"train_loss": -6.212912082672119, "global_step": 82785, "epoch": 1971} {"train_loss": -6.228318214416504, "global_step": 82786, "epoch": 1971} {"train_loss": -6.212342262268066, "global_step": 82787, "epoch": 1971} {"train_loss": -6.235263347625732, "global_step": 82788, "epoch": 1971} {"train_loss": -6.208896636962891, "global_step": 82789, "epoch": 1971} {"train_loss": -6.133949279785156, "global_step": 82790, "epoch": 1971} {"train_loss": -6.013676643371582, "global_step": 82791, "epoch": 1971} {"train_loss": -6.1479878425598145, "global_step": 82792, "epoch": 1971} {"train_loss": -6.139801025390625, "global_step": 82793, "epoch": 1971} {"train_loss": -5.973340034484863, "global_step": 82794, "epoch": 1971} {"train_loss": -6.206906318664551, "global_step": 82795, "epoch": 1971} {"train_loss": -6.100371360778809, "global_step": 82796, "epoch": 1971} {"train_loss": -6.138583183288574, "global_step": 82797, "epoch": 1971} {"train_loss": -6.044540882110596, "global_step": 82798, "epoch": 1971} {"train_loss": -6.2199273109436035, "global_step": 82799, "epoch": 1971} {"train_loss": -6.167112827301025, "global_step": 82800, "epoch": 1971} {"train_loss": -6.145071506500244, "global_step": 82801, "epoch": 1971} {"train_loss": -6.185662746429443, "global_step": 82802, "epoch": 1971} {"train_loss": -6.280178070068359, "global_step": 82803, "epoch": 1971} {"train_loss": -6.067231178283691, "global_step": 82804, "epoch": 1971} {"train_loss": -6.107975482940674, "global_step": 82805, "epoch": 1971} {"train_loss": -6.120779037475586, "global_step": 82806, "epoch": 1971} {"train_loss": -6.125842094421387, "global_step": 82807, "epoch": 1971} {"train_loss": -6.347332954406738, "global_step": 82808, "epoch": 1971} {"train_loss": -6.229707717895508, "global_step": 82809, "epoch": 1971} {"train_loss": -6.195147514343262, "global_step": 82810, "epoch": 1971} {"train_loss": -6.187345504760742, "global_step": 82811, "epoch": 1971} {"train_loss": -6.335658550262451, "global_step": 82812, "epoch": 1971} {"train_loss": -6.226617336273193, "global_step": 82813, "epoch": 1971} {"train_loss": -6.126534461975098, "global_step": 82814, "epoch": 1971} {"train_loss": -6.099375247955322, "global_step": 82815, "epoch": 1971} {"train_loss": -6.161562919616699, "global_step": 82816, "epoch": 1971} {"train_loss": -6.199262619018555, "global_step": 82817, "epoch": 1971} {"train_loss": -6.174461364746094, "global_step": 82818, "epoch": 1971} {"train_loss": -6.0881171226501465, "global_step": 82819, "epoch": 1971} {"train_loss": -6.236189842224121, "global_step": 82820, "epoch": 1971} {"train_loss": -6.177303314208984, "global_step": 82821, "epoch": 1971} {"train_loss": -6.189408779144287, "global_step": 82822, "epoch": 1971} {"train_loss": -6.171681801478068, "global_step": 82823, "epoch": 1971, "val_loss": 75040.75} {"train_loss": -6.183608055114746, "global_step": 82824, "epoch": 1972} {"train_loss": -6.168829917907715, "global_step": 82825, "epoch": 1972} {"train_loss": -6.186506271362305, "global_step": 82826, "epoch": 1972} {"train_loss": -6.021971225738525, "global_step": 82827, "epoch": 1972} {"train_loss": -6.168633937835693, "global_step": 82828, "epoch": 1972} {"train_loss": -6.130486488342285, "global_step": 82829, "epoch": 1972} {"train_loss": -6.046737194061279, "global_step": 82830, "epoch": 1972} {"train_loss": -6.324104309082031, "global_step": 82831, "epoch": 1972} {"train_loss": -6.196468830108643, "global_step": 82832, "epoch": 1972} {"train_loss": -6.088297367095947, "global_step": 82833, "epoch": 1972} {"train_loss": -6.082108497619629, "global_step": 82834, "epoch": 1972} {"train_loss": -6.159358501434326, "global_step": 82835, "epoch": 1972} {"train_loss": -6.060837268829346, "global_step": 82836, "epoch": 1972} {"train_loss": -6.224986553192139, "global_step": 82837, "epoch": 1972} {"train_loss": -6.044229507446289, "global_step": 82838, "epoch": 1972} {"train_loss": -6.167411804199219, "global_step": 82839, "epoch": 1972} {"train_loss": -6.208763122558594, "global_step": 82840, "epoch": 1972} {"train_loss": -6.122316360473633, "global_step": 82841, "epoch": 1972} {"train_loss": -6.12424898147583, "global_step": 82842, "epoch": 1972} {"train_loss": -6.185368537902832, "global_step": 82843, "epoch": 1972} {"train_loss": -6.122786998748779, "global_step": 82844, "epoch": 1972} {"train_loss": -6.168684005737305, "global_step": 82845, "epoch": 1972} {"train_loss": -6.17750883102417, "global_step": 82846, "epoch": 1972} {"train_loss": -6.136940002441406, "global_step": 82847, "epoch": 1972} {"train_loss": -6.07364559173584, "global_step": 82848, "epoch": 1972} {"train_loss": -6.0970048904418945, "global_step": 82849, "epoch": 1972} {"train_loss": -6.164587020874023, "global_step": 82850, "epoch": 1972} {"train_loss": -6.242249488830566, "global_step": 82851, "epoch": 1972} {"train_loss": -6.128079414367676, "global_step": 82852, "epoch": 1972} {"train_loss": -6.04811954498291, "global_step": 82853, "epoch": 1972} {"train_loss": -6.196958541870117, "global_step": 82854, "epoch": 1972} {"train_loss": -6.116864204406738, "global_step": 82855, "epoch": 1972} {"train_loss": -6.15402364730835, "global_step": 82856, "epoch": 1972} {"train_loss": -6.132155418395996, "global_step": 82857, "epoch": 1972} {"train_loss": -6.218310356140137, "global_step": 82858, "epoch": 1972} {"train_loss": -6.168387413024902, "global_step": 82859, "epoch": 1972} {"train_loss": -6.192107200622559, "global_step": 82860, "epoch": 1972} {"train_loss": -6.201892852783203, "global_step": 82861, "epoch": 1972} {"train_loss": -6.22050666809082, "global_step": 82862, "epoch": 1972} {"train_loss": -6.126834869384766, "global_step": 82863, "epoch": 1972} {"train_loss": -6.327573299407959, "global_step": 82864, "epoch": 1972} {"train_loss": -6.155761798222859, "global_step": 82865, "epoch": 1972, "val_loss": 75088.03125} {"train_loss": -6.100870132446289, "global_step": 82866, "epoch": 1973} {"train_loss": -6.068719863891602, "global_step": 82867, "epoch": 1973} {"train_loss": -6.187410831451416, "global_step": 82868, "epoch": 1973} {"train_loss": -6.259776592254639, "global_step": 82869, "epoch": 1973} {"train_loss": -6.186705589294434, "global_step": 82870, "epoch": 1973} {"train_loss": -6.179279804229736, "global_step": 82871, "epoch": 1973} {"train_loss": -6.015718460083008, "global_step": 82872, "epoch": 1973} {"train_loss": -6.08290958404541, "global_step": 82873, "epoch": 1973} {"train_loss": -6.015188217163086, "global_step": 82874, "epoch": 1973} {"train_loss": -6.121888160705566, "global_step": 82875, "epoch": 1973} {"train_loss": -6.0580339431762695, "global_step": 82876, "epoch": 1973} {"train_loss": -6.166470527648926, "global_step": 82877, "epoch": 1973} {"train_loss": -6.173458099365234, "global_step": 82878, "epoch": 1973} {"train_loss": -5.937924385070801, "global_step": 82879, "epoch": 1973} {"train_loss": -6.146181106567383, "global_step": 82880, "epoch": 1973} {"train_loss": -6.239800930023193, "global_step": 82881, "epoch": 1973} {"train_loss": -6.117403984069824, "global_step": 82882, "epoch": 1973} {"train_loss": -6.135987758636475, "global_step": 82883, "epoch": 1973} {"train_loss": -6.040440559387207, "global_step": 82884, "epoch": 1973} {"train_loss": -6.090679168701172, "global_step": 82885, "epoch": 1973} {"train_loss": -6.045102119445801, "global_step": 82886, "epoch": 1973} {"train_loss": -6.1343793869018555, "global_step": 82887, "epoch": 1973} {"train_loss": -6.178403854370117, "global_step": 82888, "epoch": 1973} {"train_loss": -6.192187309265137, "global_step": 82889, "epoch": 1973} {"train_loss": -6.122476577758789, "global_step": 82890, "epoch": 1973} {"train_loss": -6.163952827453613, "global_step": 82891, "epoch": 1973} {"train_loss": -6.211005210876465, "global_step": 82892, "epoch": 1973} {"train_loss": -6.263607025146484, "global_step": 82893, "epoch": 1973} {"train_loss": -6.310214519500732, "global_step": 82894, "epoch": 1973} {"train_loss": -6.078702449798584, "global_step": 82895, "epoch": 1973} {"train_loss": -6.1912736892700195, "global_step": 82896, "epoch": 1973} {"train_loss": -6.090262413024902, "global_step": 82897, "epoch": 1973} {"train_loss": -6.173188209533691, "global_step": 82898, "epoch": 1973} {"train_loss": -6.213400840759277, "global_step": 82899, "epoch": 1973} {"train_loss": -6.207986831665039, "global_step": 82900, "epoch": 1973} {"train_loss": -6.25455379486084, "global_step": 82901, "epoch": 1973} {"train_loss": -6.244685173034668, "global_step": 82902, "epoch": 1973} {"train_loss": -6.019562721252441, "global_step": 82903, "epoch": 1973} {"train_loss": -6.199568748474121, "global_step": 82904, "epoch": 1973} {"train_loss": -6.149510383605957, "global_step": 82905, "epoch": 1973} {"train_loss": -6.363140106201172, "global_step": 82906, "epoch": 1973} {"train_loss": -6.149552367982411, "global_step": 82907, "epoch": 1973, "val_loss": 75232.3046875} {"train_loss": -6.226893424987793, "global_step": 82908, "epoch": 1974} {"train_loss": -6.1959638595581055, "global_step": 82909, "epoch": 1974} {"train_loss": -6.18550968170166, "global_step": 82910, "epoch": 1974} {"train_loss": -6.169219970703125, "global_step": 82911, "epoch": 1974} {"train_loss": -6.15514612197876, "global_step": 82912, "epoch": 1974} {"train_loss": -6.315347194671631, "global_step": 82913, "epoch": 1974} {"train_loss": -6.225685119628906, "global_step": 82914, "epoch": 1974} {"train_loss": -6.140815734863281, "global_step": 82915, "epoch": 1974} {"train_loss": -6.018461227416992, "global_step": 82916, "epoch": 1974} {"train_loss": -6.146623134613037, "global_step": 82917, "epoch": 1974} {"train_loss": -6.200259208679199, "global_step": 82918, "epoch": 1974} {"train_loss": -6.016580581665039, "global_step": 82919, "epoch": 1974} {"train_loss": -6.095620632171631, "global_step": 82920, "epoch": 1974} {"train_loss": -6.114279270172119, "global_step": 82921, "epoch": 1974} {"train_loss": -6.126972198486328, "global_step": 82922, "epoch": 1974} {"train_loss": -6.190984725952148, "global_step": 82923, "epoch": 1974} {"train_loss": -6.225447654724121, "global_step": 82924, "epoch": 1974} {"train_loss": -6.150921821594238, "global_step": 82925, "epoch": 1974} {"train_loss": -6.321336269378662, "global_step": 82926, "epoch": 1974} {"train_loss": -6.177430629730225, "global_step": 82927, "epoch": 1974} {"train_loss": -6.190060615539551, "global_step": 82928, "epoch": 1974} {"train_loss": -6.1724042892456055, "global_step": 82929, "epoch": 1974} {"train_loss": -6.219329833984375, "global_step": 82930, "epoch": 1974} {"train_loss": -6.140353202819824, "global_step": 82931, "epoch": 1974} {"train_loss": -6.096596717834473, "global_step": 82932, "epoch": 1974} {"train_loss": -6.208453178405762, "global_step": 82933, "epoch": 1974} {"train_loss": -6.011655807495117, "global_step": 82934, "epoch": 1974} {"train_loss": -6.114355087280273, "global_step": 82935, "epoch": 1974} {"train_loss": -6.175436019897461, "global_step": 82936, "epoch": 1974} {"train_loss": -6.2037458419799805, "global_step": 82937, "epoch": 1974} {"train_loss": -6.073399066925049, "global_step": 82938, "epoch": 1974} {"train_loss": -6.089522361755371, "global_step": 82939, "epoch": 1974} {"train_loss": -6.124459266662598, "global_step": 82940, "epoch": 1974} {"train_loss": -6.163766860961914, "global_step": 82941, "epoch": 1974} {"train_loss": -6.169736862182617, "global_step": 82942, "epoch": 1974} {"train_loss": -6.164783000946045, "global_step": 82943, "epoch": 1974} {"train_loss": -6.13626766204834, "global_step": 82944, "epoch": 1974} {"train_loss": -6.176504611968994, "global_step": 82945, "epoch": 1974} {"train_loss": -6.172307968139648, "global_step": 82946, "epoch": 1974} {"train_loss": -6.170010566711426, "global_step": 82947, "epoch": 1974} {"train_loss": -6.157339096069336, "global_step": 82948, "epoch": 1974} {"train_loss": -6.160860300064087, "global_step": 82949, "epoch": 1974, "val_loss": 75483.015625} {"train_loss": -6.105255126953125, "global_step": 82950, "epoch": 1975} {"train_loss": -6.169754505157471, "global_step": 82951, "epoch": 1975} {"train_loss": -6.177736282348633, "global_step": 82952, "epoch": 1975} {"train_loss": -6.176705360412598, "global_step": 82953, "epoch": 1975} {"train_loss": -6.279693603515625, "global_step": 82954, "epoch": 1975} {"train_loss": -6.215993881225586, "global_step": 82955, "epoch": 1975} {"train_loss": -6.076791763305664, "global_step": 82956, "epoch": 1975} {"train_loss": -6.322278022766113, "global_step": 82957, "epoch": 1975} {"train_loss": -6.189078330993652, "global_step": 82958, "epoch": 1975} {"train_loss": -6.2092790603637695, "global_step": 82959, "epoch": 1975} {"train_loss": -6.184958457946777, "global_step": 82960, "epoch": 1975} {"train_loss": -6.064810752868652, "global_step": 82961, "epoch": 1975} {"train_loss": -6.2749481201171875, "global_step": 82962, "epoch": 1975} {"train_loss": -6.1259541511535645, "global_step": 82963, "epoch": 1975} {"train_loss": -6.259310722351074, "global_step": 82964, "epoch": 1975} {"train_loss": -6.085789203643799, "global_step": 82965, "epoch": 1975} {"train_loss": -6.1276326179504395, "global_step": 82966, "epoch": 1975} {"train_loss": -6.147190093994141, "global_step": 82967, "epoch": 1975} {"train_loss": -6.073309421539307, "global_step": 82968, "epoch": 1975} {"train_loss": -6.169251918792725, "global_step": 82969, "epoch": 1975} {"train_loss": -6.192048072814941, "global_step": 82970, "epoch": 1975} {"train_loss": -6.2869157791137695, "global_step": 82971, "epoch": 1975} {"train_loss": -6.17791748046875, "global_step": 82972, "epoch": 1975} {"train_loss": -6.1054277420043945, "global_step": 82973, "epoch": 1975} {"train_loss": -6.129344940185547, "global_step": 82974, "epoch": 1975} {"train_loss": -6.11558723449707, "global_step": 82975, "epoch": 1975} {"train_loss": -6.204470634460449, "global_step": 82976, "epoch": 1975} {"train_loss": -6.273213863372803, "global_step": 82977, "epoch": 1975} {"train_loss": -6.159063339233398, "global_step": 82978, "epoch": 1975} {"train_loss": -6.177616119384766, "global_step": 82979, "epoch": 1975} {"train_loss": -6.142386436462402, "global_step": 82980, "epoch": 1975} {"train_loss": -6.214143753051758, "global_step": 82981, "epoch": 1975} {"train_loss": -6.145474433898926, "global_step": 82982, "epoch": 1975} {"train_loss": -6.010931968688965, "global_step": 82983, "epoch": 1975} {"train_loss": -6.166535377502441, "global_step": 82984, "epoch": 1975} {"train_loss": -6.151002883911133, "global_step": 82985, "epoch": 1975} {"train_loss": -6.1529388427734375, "global_step": 82986, "epoch": 1975} {"train_loss": -6.134681701660156, "global_step": 82987, "epoch": 1975} {"train_loss": -6.216062068939209, "global_step": 82988, "epoch": 1975} {"train_loss": -6.2769012451171875, "global_step": 82989, "epoch": 1975} {"train_loss": -6.229677200317383, "global_step": 82990, "epoch": 1975} {"train_loss": -6.17555046081543, "global_step": 82991, "epoch": 1975, "val_loss": 75000.5703125} {"train_loss": -6.197819232940674, "global_step": 82992, "epoch": 1976} {"train_loss": -6.132166385650635, "global_step": 82993, "epoch": 1976} {"train_loss": -6.146957874298096, "global_step": 82994, "epoch": 1976} {"train_loss": -6.1050333976745605, "global_step": 82995, "epoch": 1976} {"train_loss": -6.174541473388672, "global_step": 82996, "epoch": 1976} {"train_loss": -6.092748641967773, "global_step": 82997, "epoch": 1976} {"train_loss": -6.004792213439941, "global_step": 82998, "epoch": 1976} {"train_loss": -6.051018714904785, "global_step": 82999, "epoch": 1976} {"train_loss": -5.982047080993652, "global_step": 83000, "epoch": 1976} {"train_loss": -6.008184432983398, "global_step": 83001, "epoch": 1976} {"train_loss": -6.103141784667969, "global_step": 83002, "epoch": 1976} {"train_loss": -6.067412376403809, "global_step": 83003, "epoch": 1976} {"train_loss": -5.991729736328125, "global_step": 83004, "epoch": 1976} {"train_loss": -5.977484703063965, "global_step": 83005, "epoch": 1976} {"train_loss": -6.158810615539551, "global_step": 83006, "epoch": 1976} {"train_loss": -6.139671325683594, "global_step": 83007, "epoch": 1976} {"train_loss": -6.091238021850586, "global_step": 83008, "epoch": 1976} {"train_loss": -6.081366539001465, "global_step": 83009, "epoch": 1976} {"train_loss": -6.174674034118652, "global_step": 83010, "epoch": 1976} {"train_loss": -6.17317008972168, "global_step": 83011, "epoch": 1976} {"train_loss": -6.142095565795898, "global_step": 83012, "epoch": 1976} {"train_loss": -6.055285930633545, "global_step": 83013, "epoch": 1976} {"train_loss": -6.100646018981934, "global_step": 83014, "epoch": 1976} {"train_loss": -6.014338970184326, "global_step": 83015, "epoch": 1976} {"train_loss": -6.163193702697754, "global_step": 83016, "epoch": 1976} {"train_loss": -6.060749053955078, "global_step": 83017, "epoch": 1976} {"train_loss": -6.179182529449463, "global_step": 83018, "epoch": 1976} {"train_loss": -6.146892547607422, "global_step": 83019, "epoch": 1976} {"train_loss": -6.255096912384033, "global_step": 83020, "epoch": 1976} {"train_loss": -6.324982166290283, "global_step": 83021, "epoch": 1976} {"train_loss": -6.213238716125488, "global_step": 83022, "epoch": 1976} {"train_loss": -6.075483798980713, "global_step": 83023, "epoch": 1976} {"train_loss": -6.175207138061523, "global_step": 83024, "epoch": 1976} {"train_loss": -6.181905746459961, "global_step": 83025, "epoch": 1976} {"train_loss": -6.379133224487305, "global_step": 83026, "epoch": 1976} {"train_loss": -6.1330413818359375, "global_step": 83027, "epoch": 1976} {"train_loss": -6.106391906738281, "global_step": 83028, "epoch": 1976} {"train_loss": -6.162187576293945, "global_step": 83029, "epoch": 1976} {"train_loss": -6.220228672027588, "global_step": 83030, "epoch": 1976} {"train_loss": -6.21804666519165, "global_step": 83031, "epoch": 1976} {"train_loss": -6.113550186157227, "global_step": 83032, "epoch": 1976} {"train_loss": -6.130115259261358, "global_step": 83033, "epoch": 1976, "val_loss": 75040.4140625} {"train_loss": -6.233096599578857, "global_step": 83034, "epoch": 1977} {"train_loss": -6.13628625869751, "global_step": 83035, "epoch": 1977} {"train_loss": -6.2247724533081055, "global_step": 83036, "epoch": 1977} {"train_loss": -6.189546585083008, "global_step": 83037, "epoch": 1977} {"train_loss": -6.2594099044799805, "global_step": 83038, "epoch": 1977} {"train_loss": -6.149200916290283, "global_step": 83039, "epoch": 1977} {"train_loss": -6.165835857391357, "global_step": 83040, "epoch": 1977} {"train_loss": -6.140983581542969, "global_step": 83041, "epoch": 1977} {"train_loss": -6.1793012619018555, "global_step": 83042, "epoch": 1977} {"train_loss": -6.195399761199951, "global_step": 83043, "epoch": 1977} {"train_loss": -6.156768798828125, "global_step": 83044, "epoch": 1977} {"train_loss": -6.232253074645996, "global_step": 83045, "epoch": 1977} {"train_loss": -6.2242021560668945, "global_step": 83046, "epoch": 1977} {"train_loss": -6.248648643493652, "global_step": 83047, "epoch": 1977} {"train_loss": -6.128862380981445, "global_step": 83048, "epoch": 1977} {"train_loss": -6.207422733306885, "global_step": 83049, "epoch": 1977} {"train_loss": -6.221836090087891, "global_step": 83050, "epoch": 1977} {"train_loss": -6.195523262023926, "global_step": 83051, "epoch": 1977} {"train_loss": -6.317358016967773, "global_step": 83052, "epoch": 1977} {"train_loss": -6.299241065979004, "global_step": 83053, "epoch": 1977} {"train_loss": -6.220981597900391, "global_step": 83054, "epoch": 1977} {"train_loss": -6.201421737670898, "global_step": 83055, "epoch": 1977} {"train_loss": -6.259162425994873, "global_step": 83056, "epoch": 1977} {"train_loss": -6.155750274658203, "global_step": 83057, "epoch": 1977} {"train_loss": -6.201269149780273, "global_step": 83058, "epoch": 1977} {"train_loss": -6.24946403503418, "global_step": 83059, "epoch": 1977} {"train_loss": -6.178400039672852, "global_step": 83060, "epoch": 1977} {"train_loss": -6.133430004119873, "global_step": 83061, "epoch": 1977} {"train_loss": -6.226937294006348, "global_step": 83062, "epoch": 1977} {"train_loss": -6.0822367668151855, "global_step": 83063, "epoch": 1977} {"train_loss": -6.230541229248047, "global_step": 83064, "epoch": 1977} {"train_loss": -6.2212724685668945, "global_step": 83065, "epoch": 1977} {"train_loss": -6.064013481140137, "global_step": 83066, "epoch": 1977} {"train_loss": -6.198734283447266, "global_step": 83067, "epoch": 1977} {"train_loss": -6.081755638122559, "global_step": 83068, "epoch": 1977} {"train_loss": -6.116827964782715, "global_step": 83069, "epoch": 1977} {"train_loss": -6.156459808349609, "global_step": 83070, "epoch": 1977} {"train_loss": -6.199782848358154, "global_step": 83071, "epoch": 1977} {"train_loss": -6.1466264724731445, "global_step": 83072, "epoch": 1977} {"train_loss": -6.1057209968566895, "global_step": 83073, "epoch": 1977} {"train_loss": -6.1762495040893555, "global_step": 83074, "epoch": 1977} {"train_loss": -6.189097847257342, "global_step": 83075, "epoch": 1977, "val_loss": 75259.8515625} {"train_loss": -6.134737014770508, "global_step": 83076, "epoch": 1978} {"train_loss": -6.1612043380737305, "global_step": 83077, "epoch": 1978} {"train_loss": -6.2207183837890625, "global_step": 83078, "epoch": 1978} {"train_loss": -6.153520107269287, "global_step": 83079, "epoch": 1978} {"train_loss": -6.190523147583008, "global_step": 83080, "epoch": 1978} {"train_loss": -6.183004379272461, "global_step": 83081, "epoch": 1978} {"train_loss": -6.01710844039917, "global_step": 83082, "epoch": 1978} {"train_loss": -6.19959020614624, "global_step": 83083, "epoch": 1978} {"train_loss": -6.1608500480651855, "global_step": 83084, "epoch": 1978} {"train_loss": -5.987726211547852, "global_step": 83085, "epoch": 1978} {"train_loss": -6.219059467315674, "global_step": 83086, "epoch": 1978} {"train_loss": -6.16568660736084, "global_step": 83087, "epoch": 1978} {"train_loss": -6.154335021972656, "global_step": 83088, "epoch": 1978} {"train_loss": -6.122043609619141, "global_step": 83089, "epoch": 1978} {"train_loss": -6.172359943389893, "global_step": 83090, "epoch": 1978} {"train_loss": -6.135488033294678, "global_step": 83091, "epoch": 1978} {"train_loss": -5.936196804046631, "global_step": 83092, "epoch": 1978} {"train_loss": -6.098598480224609, "global_step": 83093, "epoch": 1978} {"train_loss": -6.133995532989502, "global_step": 83094, "epoch": 1978} {"train_loss": -5.941875457763672, "global_step": 83095, "epoch": 1978} {"train_loss": -6.161489009857178, "global_step": 83096, "epoch": 1978} {"train_loss": -6.015663146972656, "global_step": 83097, "epoch": 1978} {"train_loss": -6.198086738586426, "global_step": 83098, "epoch": 1978} {"train_loss": -6.060245990753174, "global_step": 83099, "epoch": 1978} {"train_loss": -6.1383748054504395, "global_step": 83100, "epoch": 1978} {"train_loss": -6.162842273712158, "global_step": 83101, "epoch": 1978} {"train_loss": -6.132840156555176, "global_step": 83102, "epoch": 1978} {"train_loss": -6.155974388122559, "global_step": 83103, "epoch": 1978} {"train_loss": -6.1108012199401855, "global_step": 83104, "epoch": 1978} {"train_loss": -6.214664459228516, "global_step": 83105, "epoch": 1978} {"train_loss": -6.172778129577637, "global_step": 83106, "epoch": 1978} {"train_loss": -6.2158403396606445, "global_step": 83107, "epoch": 1978} {"train_loss": -6.13120174407959, "global_step": 83108, "epoch": 1978} {"train_loss": -6.1478681564331055, "global_step": 83109, "epoch": 1978} {"train_loss": -6.148339748382568, "global_step": 83110, "epoch": 1978} {"train_loss": -6.11412239074707, "global_step": 83111, "epoch": 1978} {"train_loss": -6.210272789001465, "global_step": 83112, "epoch": 1978} {"train_loss": -6.112461090087891, "global_step": 83113, "epoch": 1978} {"train_loss": -6.119856357574463, "global_step": 83114, "epoch": 1978} {"train_loss": -6.262024879455566, "global_step": 83115, "epoch": 1978} {"train_loss": -6.1699323654174805, "global_step": 83116, "epoch": 1978} {"train_loss": -6.140102329708281, "global_step": 83117, "epoch": 1978, "val_loss": 75105.7421875} {"train_loss": -6.111093521118164, "global_step": 83118, "epoch": 1979} {"train_loss": -6.130336761474609, "global_step": 83119, "epoch": 1979} {"train_loss": -6.129286289215088, "global_step": 83120, "epoch": 1979} {"train_loss": -6.197016716003418, "global_step": 83121, "epoch": 1979} {"train_loss": -6.256790637969971, "global_step": 83122, "epoch": 1979} {"train_loss": -6.185657501220703, "global_step": 83123, "epoch": 1979} {"train_loss": -6.191981315612793, "global_step": 83124, "epoch": 1979} {"train_loss": -6.231424331665039, "global_step": 83125, "epoch": 1979} {"train_loss": -6.183774471282959, "global_step": 83126, "epoch": 1979} {"train_loss": -6.3028130531311035, "global_step": 83127, "epoch": 1979} {"train_loss": -6.202821731567383, "global_step": 83128, "epoch": 1979} {"train_loss": -6.182345867156982, "global_step": 83129, "epoch": 1979} {"train_loss": -6.21845817565918, "global_step": 83130, "epoch": 1979} {"train_loss": -6.161656379699707, "global_step": 83131, "epoch": 1979} {"train_loss": -6.143077850341797, "global_step": 83132, "epoch": 1979} {"train_loss": -6.116097450256348, "global_step": 83133, "epoch": 1979} {"train_loss": -6.155299186706543, "global_step": 83134, "epoch": 1979} {"train_loss": -6.030447959899902, "global_step": 83135, "epoch": 1979} {"train_loss": -6.098222732543945, "global_step": 83136, "epoch": 1979} {"train_loss": -6.291486740112305, "global_step": 83137, "epoch": 1979} {"train_loss": -5.99639892578125, "global_step": 83138, "epoch": 1979} {"train_loss": -6.04396915435791, "global_step": 83139, "epoch": 1979} {"train_loss": -6.204545974731445, "global_step": 83140, "epoch": 1979} {"train_loss": -6.017468452453613, "global_step": 83141, "epoch": 1979} {"train_loss": -6.060432434082031, "global_step": 83142, "epoch": 1979} {"train_loss": -6.039429664611816, "global_step": 83143, "epoch": 1979} {"train_loss": -6.073843955993652, "global_step": 83144, "epoch": 1979} {"train_loss": -6.060080528259277, "global_step": 83145, "epoch": 1979} {"train_loss": -6.20290994644165, "global_step": 83146, "epoch": 1979} {"train_loss": -6.026791572570801, "global_step": 83147, "epoch": 1979} {"train_loss": -6.094540596008301, "global_step": 83148, "epoch": 1979} {"train_loss": -6.160942077636719, "global_step": 83149, "epoch": 1979} {"train_loss": -6.106393814086914, "global_step": 83150, "epoch": 1979} {"train_loss": -6.106551170349121, "global_step": 83151, "epoch": 1979} {"train_loss": -6.173674583435059, "global_step": 83152, "epoch": 1979} {"train_loss": -6.127839088439941, "global_step": 83153, "epoch": 1979} {"train_loss": -6.1952362060546875, "global_step": 83154, "epoch": 1979} {"train_loss": -6.267089366912842, "global_step": 83155, "epoch": 1979} {"train_loss": -6.295462608337402, "global_step": 83156, "epoch": 1979} {"train_loss": -6.125149726867676, "global_step": 83157, "epoch": 1979} {"train_loss": -6.2083563804626465, "global_step": 83158, "epoch": 1979} {"train_loss": -6.1500364144643145, "global_step": 83159, "epoch": 1979, "val_loss": 75132.3046875} {"train_loss": -6.209412574768066, "global_step": 83160, "epoch": 1980} {"train_loss": -6.178736686706543, "global_step": 83161, "epoch": 1980} {"train_loss": -6.190291881561279, "global_step": 83162, "epoch": 1980} {"train_loss": -6.187786102294922, "global_step": 83163, "epoch": 1980} {"train_loss": -6.208640098571777, "global_step": 83164, "epoch": 1980} {"train_loss": -6.139168739318848, "global_step": 83165, "epoch": 1980} {"train_loss": -6.235168933868408, "global_step": 83166, "epoch": 1980} {"train_loss": -6.144306182861328, "global_step": 83167, "epoch": 1980} {"train_loss": -6.212409973144531, "global_step": 83168, "epoch": 1980} {"train_loss": -6.281858921051025, "global_step": 83169, "epoch": 1980} {"train_loss": -6.320731163024902, "global_step": 83170, "epoch": 1980} {"train_loss": -6.24024772644043, "global_step": 83171, "epoch": 1980} {"train_loss": -6.229306221008301, "global_step": 83172, "epoch": 1980} {"train_loss": -6.07931661605835, "global_step": 83173, "epoch": 1980} {"train_loss": -6.2282280921936035, "global_step": 83174, "epoch": 1980} {"train_loss": -6.046600341796875, "global_step": 83175, "epoch": 1980} {"train_loss": -6.143050670623779, "global_step": 83176, "epoch": 1980} {"train_loss": -6.121644020080566, "global_step": 83177, "epoch": 1980} {"train_loss": -6.078100204467773, "global_step": 83178, "epoch": 1980} {"train_loss": -6.047797679901123, "global_step": 83179, "epoch": 1980} {"train_loss": -6.172829627990723, "global_step": 83180, "epoch": 1980} {"train_loss": -6.044808387756348, "global_step": 83181, "epoch": 1980} {"train_loss": -5.8686065673828125, "global_step": 83182, "epoch": 1980} {"train_loss": -6.079181671142578, "global_step": 83183, "epoch": 1980} {"train_loss": -5.98143196105957, "global_step": 83184, "epoch": 1980} {"train_loss": -6.116559028625488, "global_step": 83185, "epoch": 1980} {"train_loss": -6.252830982208252, "global_step": 83186, "epoch": 1980} {"train_loss": -6.054859638214111, "global_step": 83187, "epoch": 1980} {"train_loss": -6.120466709136963, "global_step": 83188, "epoch": 1980} {"train_loss": -6.110330104827881, "global_step": 83189, "epoch": 1980} {"train_loss": -6.1957550048828125, "global_step": 83190, "epoch": 1980} {"train_loss": -5.889822959899902, "global_step": 83191, "epoch": 1980} {"train_loss": -6.164266586303711, "global_step": 83192, "epoch": 1980} {"train_loss": -6.165788650512695, "global_step": 83193, "epoch": 1980} {"train_loss": -6.102259159088135, "global_step": 83194, "epoch": 1980} {"train_loss": -6.058252334594727, "global_step": 83195, "epoch": 1980} {"train_loss": -6.162006378173828, "global_step": 83196, "epoch": 1980} {"train_loss": -6.011059761047363, "global_step": 83197, "epoch": 1980} {"train_loss": -6.176398277282715, "global_step": 83198, "epoch": 1980} {"train_loss": -6.124629020690918, "global_step": 83199, "epoch": 1980} {"train_loss": -6.169309616088867, "global_step": 83200, "epoch": 1980} {"train_loss": -6.135334162485032, "global_step": 83201, "epoch": 1980, "val_loss": 75040.140625} {"train_loss": -6.045003414154053, "global_step": 83202, "epoch": 1981} {"train_loss": -6.102731704711914, "global_step": 83203, "epoch": 1981} {"train_loss": -6.191669464111328, "global_step": 83204, "epoch": 1981} {"train_loss": -6.003432750701904, "global_step": 83205, "epoch": 1981} {"train_loss": -6.028582572937012, "global_step": 83206, "epoch": 1981} {"train_loss": -6.206104278564453, "global_step": 83207, "epoch": 1981} {"train_loss": -6.060763359069824, "global_step": 83208, "epoch": 1981} {"train_loss": -6.134097099304199, "global_step": 83209, "epoch": 1981} {"train_loss": -6.060934543609619, "global_step": 83210, "epoch": 1981} {"train_loss": -6.178705215454102, "global_step": 83211, "epoch": 1981} {"train_loss": -6.203234672546387, "global_step": 83212, "epoch": 1981} {"train_loss": -6.275379180908203, "global_step": 83213, "epoch": 1981} {"train_loss": -6.110952377319336, "global_step": 83214, "epoch": 1981} {"train_loss": -6.200782775878906, "global_step": 83215, "epoch": 1981} {"train_loss": -6.131476402282715, "global_step": 83216, "epoch": 1981} {"train_loss": -6.200723171234131, "global_step": 83217, "epoch": 1981} {"train_loss": -6.199460506439209, "global_step": 83218, "epoch": 1981} {"train_loss": -6.1069769859313965, "global_step": 83219, "epoch": 1981} {"train_loss": -6.2440056800842285, "global_step": 83220, "epoch": 1981} {"train_loss": -6.168996810913086, "global_step": 83221, "epoch": 1981} {"train_loss": -6.204158782958984, "global_step": 83222, "epoch": 1981} {"train_loss": -6.084257125854492, "global_step": 83223, "epoch": 1981} {"train_loss": -6.141243934631348, "global_step": 83224, "epoch": 1981} {"train_loss": -6.272395133972168, "global_step": 83225, "epoch": 1981} {"train_loss": -6.143211364746094, "global_step": 83226, "epoch": 1981} {"train_loss": -6.148477077484131, "global_step": 83227, "epoch": 1981} {"train_loss": -6.202203750610352, "global_step": 83228, "epoch": 1981} {"train_loss": -6.1748046875, "global_step": 83229, "epoch": 1981} {"train_loss": -6.188970565795898, "global_step": 83230, "epoch": 1981} {"train_loss": -6.129727363586426, "global_step": 83231, "epoch": 1981} {"train_loss": -6.21158504486084, "global_step": 83232, "epoch": 1981} {"train_loss": -6.172235488891602, "global_step": 83233, "epoch": 1981} {"train_loss": -6.232820510864258, "global_step": 83234, "epoch": 1981} {"train_loss": -6.197808265686035, "global_step": 83235, "epoch": 1981} {"train_loss": -6.1539506912231445, "global_step": 83236, "epoch": 1981} {"train_loss": -6.194220542907715, "global_step": 83237, "epoch": 1981} {"train_loss": -6.159337997436523, "global_step": 83238, "epoch": 1981} {"train_loss": -6.206398963928223, "global_step": 83239, "epoch": 1981} {"train_loss": -6.069976806640625, "global_step": 83240, "epoch": 1981} {"train_loss": -6.201935768127441, "global_step": 83241, "epoch": 1981} {"train_loss": -6.153188705444336, "global_step": 83242, "epoch": 1981} {"train_loss": -6.159497624351864, "global_step": 83243, "epoch": 1981, "val_loss": 75042.546875} {"train_loss": -6.142230033874512, "global_step": 83244, "epoch": 1982} {"train_loss": -6.145963191986084, "global_step": 83245, "epoch": 1982} {"train_loss": -6.2019944190979, "global_step": 83246, "epoch": 1982} {"train_loss": -6.1802544593811035, "global_step": 83247, "epoch": 1982} {"train_loss": -6.135345458984375, "global_step": 83248, "epoch": 1982} {"train_loss": -6.279885292053223, "global_step": 83249, "epoch": 1982} {"train_loss": -6.192956924438477, "global_step": 83250, "epoch": 1982} {"train_loss": -6.013033866882324, "global_step": 83251, "epoch": 1982} {"train_loss": -6.142065525054932, "global_step": 83252, "epoch": 1982} {"train_loss": -6.154308795928955, "global_step": 83253, "epoch": 1982} {"train_loss": -6.216671943664551, "global_step": 83254, "epoch": 1982} {"train_loss": -6.116631507873535, "global_step": 83255, "epoch": 1982} {"train_loss": -6.192596912384033, "global_step": 83256, "epoch": 1982} {"train_loss": -6.1435089111328125, "global_step": 83257, "epoch": 1982} {"train_loss": -6.176831245422363, "global_step": 83258, "epoch": 1982} {"train_loss": -6.164113998413086, "global_step": 83259, "epoch": 1982} {"train_loss": -6.207996845245361, "global_step": 83260, "epoch": 1982} {"train_loss": -6.092738628387451, "global_step": 83261, "epoch": 1982} {"train_loss": -6.1691813468933105, "global_step": 83262, "epoch": 1982} {"train_loss": -6.075711250305176, "global_step": 83263, "epoch": 1982} {"train_loss": -6.127610683441162, "global_step": 83264, "epoch": 1982} {"train_loss": -6.233681678771973, "global_step": 83265, "epoch": 1982} {"train_loss": -6.147589206695557, "global_step": 83266, "epoch": 1982} {"train_loss": -6.219555854797363, "global_step": 83267, "epoch": 1982} {"train_loss": -6.23093318939209, "global_step": 83268, "epoch": 1982} {"train_loss": -6.145964622497559, "global_step": 83269, "epoch": 1982} {"train_loss": -6.279191493988037, "global_step": 83270, "epoch": 1982} {"train_loss": -6.309791088104248, "global_step": 83271, "epoch": 1982} {"train_loss": -6.284078121185303, "global_step": 83272, "epoch": 1982} {"train_loss": -6.248051643371582, "global_step": 83273, "epoch": 1982} {"train_loss": -6.0569539070129395, "global_step": 83274, "epoch": 1982} {"train_loss": -6.179965019226074, "global_step": 83275, "epoch": 1982} {"train_loss": -6.214788436889648, "global_step": 83276, "epoch": 1982} {"train_loss": -6.089447975158691, "global_step": 83277, "epoch": 1982} {"train_loss": -6.215513229370117, "global_step": 83278, "epoch": 1982} {"train_loss": -6.140463829040527, "global_step": 83279, "epoch": 1982} {"train_loss": -6.108473777770996, "global_step": 83280, "epoch": 1982} {"train_loss": -6.129000186920166, "global_step": 83281, "epoch": 1982} {"train_loss": -6.139735221862793, "global_step": 83282, "epoch": 1982} {"train_loss": -6.186310768127441, "global_step": 83283, "epoch": 1982} {"train_loss": -6.2668867111206055, "global_step": 83284, "epoch": 1982} {"train_loss": -6.174469130379813, "global_step": 83285, "epoch": 1982, "val_loss": 75041.921875} {"train_loss": -6.289299011230469, "global_step": 83286, "epoch": 1983} {"train_loss": -6.253717422485352, "global_step": 83287, "epoch": 1983} {"train_loss": -6.2754716873168945, "global_step": 83288, "epoch": 1983} {"train_loss": -6.217177391052246, "global_step": 83289, "epoch": 1983} {"train_loss": -6.178009986877441, "global_step": 83290, "epoch": 1983} {"train_loss": -6.217161178588867, "global_step": 83291, "epoch": 1983} {"train_loss": -5.96243953704834, "global_step": 83292, "epoch": 1983} {"train_loss": -6.144612789154053, "global_step": 83293, "epoch": 1983} {"train_loss": -6.27362585067749, "global_step": 83294, "epoch": 1983} {"train_loss": -6.135972499847412, "global_step": 83295, "epoch": 1983} {"train_loss": -6.181374549865723, "global_step": 83296, "epoch": 1983} {"train_loss": -6.141812324523926, "global_step": 83297, "epoch": 1983} {"train_loss": -6.1197099685668945, "global_step": 83298, "epoch": 1983} {"train_loss": -6.251938343048096, "global_step": 83299, "epoch": 1983} {"train_loss": -6.249021530151367, "global_step": 83300, "epoch": 1983} {"train_loss": -6.165688514709473, "global_step": 83301, "epoch": 1983} {"train_loss": -6.036464691162109, "global_step": 83302, "epoch": 1983} {"train_loss": -6.129556655883789, "global_step": 83303, "epoch": 1983} {"train_loss": -6.0668134689331055, "global_step": 83304, "epoch": 1983} {"train_loss": -6.017100811004639, "global_step": 83305, "epoch": 1983} {"train_loss": -6.081675052642822, "global_step": 83306, "epoch": 1983} {"train_loss": -6.164098739624023, "global_step": 83307, "epoch": 1983} {"train_loss": -6.069161891937256, "global_step": 83308, "epoch": 1983} {"train_loss": -6.139603137969971, "global_step": 83309, "epoch": 1983} {"train_loss": -6.144872665405273, "global_step": 83310, "epoch": 1983} {"train_loss": -6.139006614685059, "global_step": 83311, "epoch": 1983} {"train_loss": -6.083459377288818, "global_step": 83312, "epoch": 1983} {"train_loss": -6.121367454528809, "global_step": 83313, "epoch": 1983} {"train_loss": -6.159937858581543, "global_step": 83314, "epoch": 1983} {"train_loss": -6.141214847564697, "global_step": 83315, "epoch": 1983} {"train_loss": -6.1832475662231445, "global_step": 83316, "epoch": 1983} {"train_loss": -6.168258190155029, "global_step": 83317, "epoch": 1983} {"train_loss": -6.092848777770996, "global_step": 83318, "epoch": 1983} {"train_loss": -6.154665946960449, "global_step": 83319, "epoch": 1983} {"train_loss": -6.331960678100586, "global_step": 83320, "epoch": 1983} {"train_loss": -6.087074279785156, "global_step": 83321, "epoch": 1983} {"train_loss": -6.3021159172058105, "global_step": 83322, "epoch": 1983} {"train_loss": -6.184351444244385, "global_step": 83323, "epoch": 1983} {"train_loss": -6.259615421295166, "global_step": 83324, "epoch": 1983} {"train_loss": -6.022635459899902, "global_step": 83325, "epoch": 1983} {"train_loss": -6.119771480560303, "global_step": 83326, "epoch": 1983} {"train_loss": -6.157964558828445, "global_step": 83327, "epoch": 1983, "val_loss": 75409.3984375} {"train_loss": -6.080305576324463, "global_step": 83328, "epoch": 1984} {"train_loss": -6.18730354309082, "global_step": 83329, "epoch": 1984} {"train_loss": -6.301824569702148, "global_step": 83330, "epoch": 1984} {"train_loss": -6.124547004699707, "global_step": 83331, "epoch": 1984} {"train_loss": -6.126123905181885, "global_step": 83332, "epoch": 1984} {"train_loss": -6.171307563781738, "global_step": 83333, "epoch": 1984} {"train_loss": -6.191584587097168, "global_step": 83334, "epoch": 1984} {"train_loss": -6.366493225097656, "global_step": 83335, "epoch": 1984} {"train_loss": -6.258618354797363, "global_step": 83336, "epoch": 1984} {"train_loss": -6.256153106689453, "global_step": 83337, "epoch": 1984} {"train_loss": -6.211314678192139, "global_step": 83338, "epoch": 1984} {"train_loss": -6.142152786254883, "global_step": 83339, "epoch": 1984} {"train_loss": -6.22049617767334, "global_step": 83340, "epoch": 1984} {"train_loss": -6.16305685043335, "global_step": 83341, "epoch": 1984} {"train_loss": -6.2658209800720215, "global_step": 83342, "epoch": 1984} {"train_loss": -6.180939674377441, "global_step": 83343, "epoch": 1984} {"train_loss": -6.205528736114502, "global_step": 83344, "epoch": 1984} {"train_loss": -6.31483268737793, "global_step": 83345, "epoch": 1984} {"train_loss": -6.127742290496826, "global_step": 83346, "epoch": 1984} {"train_loss": -6.193925857543945, "global_step": 83347, "epoch": 1984} {"train_loss": -6.154289245605469, "global_step": 83348, "epoch": 1984} {"train_loss": -6.159056663513184, "global_step": 83349, "epoch": 1984} {"train_loss": -6.219402313232422, "global_step": 83350, "epoch": 1984} {"train_loss": -6.201730728149414, "global_step": 83351, "epoch": 1984} {"train_loss": -6.130228042602539, "global_step": 83352, "epoch": 1984} {"train_loss": -6.298266410827637, "global_step": 83353, "epoch": 1984} {"train_loss": -6.218245983123779, "global_step": 83354, "epoch": 1984} {"train_loss": -6.042216777801514, "global_step": 83355, "epoch": 1984} {"train_loss": -6.136398792266846, "global_step": 83356, "epoch": 1984} {"train_loss": -6.096426010131836, "global_step": 83357, "epoch": 1984} {"train_loss": -6.089181423187256, "global_step": 83358, "epoch": 1984} {"train_loss": -6.224301338195801, "global_step": 83359, "epoch": 1984} {"train_loss": -6.111630916595459, "global_step": 83360, "epoch": 1984} {"train_loss": -6.147361755371094, "global_step": 83361, "epoch": 1984} {"train_loss": -6.15895938873291, "global_step": 83362, "epoch": 1984} {"train_loss": -6.115200996398926, "global_step": 83363, "epoch": 1984} {"train_loss": -6.178664207458496, "global_step": 83364, "epoch": 1984} {"train_loss": -6.176024436950684, "global_step": 83365, "epoch": 1984} {"train_loss": -6.102056503295898, "global_step": 83366, "epoch": 1984} {"train_loss": -6.178420066833496, "global_step": 83367, "epoch": 1984} {"train_loss": -6.102176666259766, "global_step": 83368, "epoch": 1984} {"train_loss": -6.1753310816628595, "global_step": 83369, "epoch": 1984, "val_loss": 75344.7421875} {"train_loss": -6.168468475341797, "global_step": 83370, "epoch": 1985} {"train_loss": -6.141502380371094, "global_step": 83371, "epoch": 1985} {"train_loss": -6.234254360198975, "global_step": 83372, "epoch": 1985} {"train_loss": -6.080245018005371, "global_step": 83373, "epoch": 1985} {"train_loss": -6.204064846038818, "global_step": 83374, "epoch": 1985} {"train_loss": -6.1296539306640625, "global_step": 83375, "epoch": 1985} {"train_loss": -6.1809539794921875, "global_step": 83376, "epoch": 1985} {"train_loss": -6.182504177093506, "global_step": 83377, "epoch": 1985} {"train_loss": -6.161998748779297, "global_step": 83378, "epoch": 1985} {"train_loss": -6.172764778137207, "global_step": 83379, "epoch": 1985} {"train_loss": -6.169353008270264, "global_step": 83380, "epoch": 1985} {"train_loss": -6.229520320892334, "global_step": 83381, "epoch": 1985} {"train_loss": -6.134574890136719, "global_step": 83382, "epoch": 1985} {"train_loss": -6.295398235321045, "global_step": 83383, "epoch": 1985} {"train_loss": -6.300370693206787, "global_step": 83384, "epoch": 1985} {"train_loss": -6.2236008644104, "global_step": 83385, "epoch": 1985} {"train_loss": -6.191412925720215, "global_step": 83386, "epoch": 1985} {"train_loss": -6.400524616241455, "global_step": 83387, "epoch": 1985} {"train_loss": -6.251832008361816, "global_step": 83388, "epoch": 1985} {"train_loss": -6.14140510559082, "global_step": 83389, "epoch": 1985} {"train_loss": -6.2522478103637695, "global_step": 83390, "epoch": 1985} {"train_loss": -6.236499786376953, "global_step": 83391, "epoch": 1985} {"train_loss": -6.131158828735352, "global_step": 83392, "epoch": 1985} {"train_loss": -6.2161126136779785, "global_step": 83393, "epoch": 1985} {"train_loss": -6.137852668762207, "global_step": 83394, "epoch": 1985} {"train_loss": -6.170758247375488, "global_step": 83395, "epoch": 1985} {"train_loss": -6.148163795471191, "global_step": 83396, "epoch": 1985} {"train_loss": -6.187186241149902, "global_step": 83397, "epoch": 1985} {"train_loss": -6.246165752410889, "global_step": 83398, "epoch": 1985} {"train_loss": -6.210880279541016, "global_step": 83399, "epoch": 1985} {"train_loss": -6.195364952087402, "global_step": 83400, "epoch": 1985} {"train_loss": -6.155486106872559, "global_step": 83401, "epoch": 1985} {"train_loss": -6.320859909057617, "global_step": 83402, "epoch": 1985} {"train_loss": -6.1825666427612305, "global_step": 83403, "epoch": 1985} {"train_loss": -6.241134166717529, "global_step": 83404, "epoch": 1985} {"train_loss": -6.164703369140625, "global_step": 83405, "epoch": 1985} {"train_loss": -6.115090370178223, "global_step": 83406, "epoch": 1985} {"train_loss": -6.251770496368408, "global_step": 83407, "epoch": 1985} {"train_loss": -6.245051383972168, "global_step": 83408, "epoch": 1985} {"train_loss": -6.17824125289917, "global_step": 83409, "epoch": 1985} {"train_loss": -6.151042938232422, "global_step": 83410, "epoch": 1985} {"train_loss": -6.1962324891771585, "global_step": 83411, "epoch": 1985, "val_loss": 75012.984375} {"train_loss": -6.205469608306885, "global_step": 83412, "epoch": 1986} {"train_loss": -6.248546600341797, "global_step": 83413, "epoch": 1986} {"train_loss": -6.322256088256836, "global_step": 83414, "epoch": 1986} {"train_loss": -6.220157146453857, "global_step": 83415, "epoch": 1986} {"train_loss": -6.065627098083496, "global_step": 83416, "epoch": 1986} {"train_loss": -6.140578746795654, "global_step": 83417, "epoch": 1986} {"train_loss": -6.134734630584717, "global_step": 83418, "epoch": 1986} {"train_loss": -6.1241559982299805, "global_step": 83419, "epoch": 1986} {"train_loss": -6.077782154083252, "global_step": 83420, "epoch": 1986} {"train_loss": -6.12923526763916, "global_step": 83421, "epoch": 1986} {"train_loss": -6.243149280548096, "global_step": 83422, "epoch": 1986} {"train_loss": -6.157444000244141, "global_step": 83423, "epoch": 1986} {"train_loss": -6.292450904846191, "global_step": 83424, "epoch": 1986} {"train_loss": -6.244558334350586, "global_step": 83425, "epoch": 1986} {"train_loss": -6.113497734069824, "global_step": 83426, "epoch": 1986} {"train_loss": -6.083410739898682, "global_step": 83427, "epoch": 1986} {"train_loss": -6.2271528244018555, "global_step": 83428, "epoch": 1986} {"train_loss": -6.140954494476318, "global_step": 83429, "epoch": 1986} {"train_loss": -6.174063205718994, "global_step": 83430, "epoch": 1986} {"train_loss": -6.194553375244141, "global_step": 83431, "epoch": 1986} {"train_loss": -6.193713188171387, "global_step": 83432, "epoch": 1986} {"train_loss": -6.097957611083984, "global_step": 83433, "epoch": 1986} {"train_loss": -6.243805885314941, "global_step": 83434, "epoch": 1986} {"train_loss": -6.239918231964111, "global_step": 83435, "epoch": 1986} {"train_loss": -6.1701483726501465, "global_step": 83436, "epoch": 1986} {"train_loss": -6.107445240020752, "global_step": 83437, "epoch": 1986} {"train_loss": -6.128523826599121, "global_step": 83438, "epoch": 1986} {"train_loss": -6.175871849060059, "global_step": 83439, "epoch": 1986} {"train_loss": -6.197285175323486, "global_step": 83440, "epoch": 1986} {"train_loss": -6.296483516693115, "global_step": 83441, "epoch": 1986} {"train_loss": -6.227929592132568, "global_step": 83442, "epoch": 1986} {"train_loss": -6.179689407348633, "global_step": 83443, "epoch": 1986} {"train_loss": -6.122644424438477, "global_step": 83444, "epoch": 1986} {"train_loss": -6.251428127288818, "global_step": 83445, "epoch": 1986} {"train_loss": -6.216897964477539, "global_step": 83446, "epoch": 1986} {"train_loss": -6.149772644042969, "global_step": 83447, "epoch": 1986} {"train_loss": -6.189682960510254, "global_step": 83448, "epoch": 1986} {"train_loss": -6.219078063964844, "global_step": 83449, "epoch": 1986} {"train_loss": -6.094764232635498, "global_step": 83450, "epoch": 1986} {"train_loss": -6.174306869506836, "global_step": 83451, "epoch": 1986} {"train_loss": -6.320322513580322, "global_step": 83452, "epoch": 1986} {"train_loss": -6.184203261420841, "global_step": 83453, "epoch": 1986, "val_loss": 75255.78125} {"train_loss": -6.190296173095703, "global_step": 83454, "epoch": 1987} {"train_loss": -6.2139739990234375, "global_step": 83455, "epoch": 1987} {"train_loss": -6.118746757507324, "global_step": 83456, "epoch": 1987} {"train_loss": -6.215257167816162, "global_step": 83457, "epoch": 1987} {"train_loss": -6.177173614501953, "global_step": 83458, "epoch": 1987} {"train_loss": -6.074544906616211, "global_step": 83459, "epoch": 1987} {"train_loss": -6.204776763916016, "global_step": 83460, "epoch": 1987} {"train_loss": -6.140775680541992, "global_step": 83461, "epoch": 1987} {"train_loss": -6.183445453643799, "global_step": 83462, "epoch": 1987} {"train_loss": -6.175743103027344, "global_step": 83463, "epoch": 1987} {"train_loss": -6.311318397521973, "global_step": 83464, "epoch": 1987} {"train_loss": -6.151917457580566, "global_step": 83465, "epoch": 1987} {"train_loss": -6.158880233764648, "global_step": 83466, "epoch": 1987} {"train_loss": -6.230605602264404, "global_step": 83467, "epoch": 1987} {"train_loss": -6.144708156585693, "global_step": 83468, "epoch": 1987} {"train_loss": -6.227849960327148, "global_step": 83469, "epoch": 1987} {"train_loss": -6.233259677886963, "global_step": 83470, "epoch": 1987} {"train_loss": -6.148375988006592, "global_step": 83471, "epoch": 1987} {"train_loss": -6.214889049530029, "global_step": 83472, "epoch": 1987} {"train_loss": -6.244595527648926, "global_step": 83473, "epoch": 1987} {"train_loss": -6.2143120765686035, "global_step": 83474, "epoch": 1987} {"train_loss": -6.210346221923828, "global_step": 83475, "epoch": 1987} {"train_loss": -6.138429641723633, "global_step": 83476, "epoch": 1987} {"train_loss": -6.178811073303223, "global_step": 83477, "epoch": 1987} {"train_loss": -6.106176376342773, "global_step": 83478, "epoch": 1987} {"train_loss": -6.164435863494873, "global_step": 83479, "epoch": 1987} {"train_loss": -6.260789394378662, "global_step": 83480, "epoch": 1987} {"train_loss": -6.157932281494141, "global_step": 83481, "epoch": 1987} {"train_loss": -6.172236919403076, "global_step": 83482, "epoch": 1987} {"train_loss": -6.128979206085205, "global_step": 83483, "epoch": 1987} {"train_loss": -6.17596435546875, "global_step": 83484, "epoch": 1987} {"train_loss": -6.253742694854736, "global_step": 83485, "epoch": 1987} {"train_loss": -6.154436111450195, "global_step": 83486, "epoch": 1987} {"train_loss": -6.022995471954346, "global_step": 83487, "epoch": 1987} {"train_loss": -6.088964462280273, "global_step": 83488, "epoch": 1987} {"train_loss": -6.1593194007873535, "global_step": 83489, "epoch": 1987} {"train_loss": -6.200088977813721, "global_step": 83490, "epoch": 1987} {"train_loss": -6.113382339477539, "global_step": 83491, "epoch": 1987} {"train_loss": -6.148106575012207, "global_step": 83492, "epoch": 1987} {"train_loss": -6.018345832824707, "global_step": 83493, "epoch": 1987} {"train_loss": -6.116815567016602, "global_step": 83494, "epoch": 1987} {"train_loss": -6.169664178575788, "global_step": 83495, "epoch": 1987, "val_loss": 75299.2421875} {"train_loss": -6.098537445068359, "global_step": 83496, "epoch": 1988} {"train_loss": -6.1054229736328125, "global_step": 83497, "epoch": 1988} {"train_loss": -6.109076499938965, "global_step": 83498, "epoch": 1988} {"train_loss": -6.125394821166992, "global_step": 83499, "epoch": 1988} {"train_loss": -6.074172496795654, "global_step": 83500, "epoch": 1988} {"train_loss": -6.115078926086426, "global_step": 83501, "epoch": 1988} {"train_loss": -6.104776859283447, "global_step": 83502, "epoch": 1988} {"train_loss": -6.1044230461120605, "global_step": 83503, "epoch": 1988} {"train_loss": -6.148853302001953, "global_step": 83504, "epoch": 1988} {"train_loss": -6.086939811706543, "global_step": 83505, "epoch": 1988} {"train_loss": -6.032332420349121, "global_step": 83506, "epoch": 1988} {"train_loss": -6.017952919006348, "global_step": 83507, "epoch": 1988} {"train_loss": -5.951984405517578, "global_step": 83508, "epoch": 1988} {"train_loss": -6.087869167327881, "global_step": 83509, "epoch": 1988} {"train_loss": -5.9475250244140625, "global_step": 83510, "epoch": 1988} {"train_loss": -6.215721607208252, "global_step": 83511, "epoch": 1988} {"train_loss": -6.109720706939697, "global_step": 83512, "epoch": 1988} {"train_loss": -6.2853922843933105, "global_step": 83513, "epoch": 1988} {"train_loss": -6.259305000305176, "global_step": 83514, "epoch": 1988} {"train_loss": -6.0782318115234375, "global_step": 83515, "epoch": 1988} {"train_loss": -6.128578186035156, "global_step": 83516, "epoch": 1988} {"train_loss": -6.0190229415893555, "global_step": 83517, "epoch": 1988} {"train_loss": -6.048603534698486, "global_step": 83518, "epoch": 1988} {"train_loss": -6.160060882568359, "global_step": 83519, "epoch": 1988} {"train_loss": -6.168454647064209, "global_step": 83520, "epoch": 1988} {"train_loss": -6.089423179626465, "global_step": 83521, "epoch": 1988} {"train_loss": -6.231595993041992, "global_step": 83522, "epoch": 1988} {"train_loss": -6.270529270172119, "global_step": 83523, "epoch": 1988} {"train_loss": -6.265931606292725, "global_step": 83524, "epoch": 1988} {"train_loss": -6.220808029174805, "global_step": 83525, "epoch": 1988} {"train_loss": -6.167564392089844, "global_step": 83526, "epoch": 1988} {"train_loss": -6.238061904907227, "global_step": 83527, "epoch": 1988} {"train_loss": -6.121634483337402, "global_step": 83528, "epoch": 1988} {"train_loss": -6.153217315673828, "global_step": 83529, "epoch": 1988} {"train_loss": -6.140251636505127, "global_step": 83530, "epoch": 1988} {"train_loss": -6.125635623931885, "global_step": 83531, "epoch": 1988} {"train_loss": -6.187747001647949, "global_step": 83532, "epoch": 1988} {"train_loss": -6.129105567932129, "global_step": 83533, "epoch": 1988} {"train_loss": -6.131772994995117, "global_step": 83534, "epoch": 1988} {"train_loss": -6.081088066101074, "global_step": 83535, "epoch": 1988} {"train_loss": -6.107568740844727, "global_step": 83536, "epoch": 1988} {"train_loss": -6.1270393416995095, "global_step": 83537, "epoch": 1988, "val_loss": 75030.75} {"train_loss": -6.121767044067383, "global_step": 83538, "epoch": 1989} {"train_loss": -6.158093452453613, "global_step": 83539, "epoch": 1989} {"train_loss": -6.039480209350586, "global_step": 83540, "epoch": 1989} {"train_loss": -6.235244274139404, "global_step": 83541, "epoch": 1989} {"train_loss": -6.009145736694336, "global_step": 83542, "epoch": 1989} {"train_loss": -6.150124549865723, "global_step": 83543, "epoch": 1989} {"train_loss": -6.173027038574219, "global_step": 83544, "epoch": 1989} {"train_loss": -6.223691940307617, "global_step": 83545, "epoch": 1989} {"train_loss": -6.196428298950195, "global_step": 83546, "epoch": 1989} {"train_loss": -6.1275739669799805, "global_step": 83547, "epoch": 1989} {"train_loss": -6.147669792175293, "global_step": 83548, "epoch": 1989} {"train_loss": -6.256956100463867, "global_step": 83549, "epoch": 1989} {"train_loss": -6.1727776527404785, "global_step": 83550, "epoch": 1989} {"train_loss": -6.267060279846191, "global_step": 83551, "epoch": 1989} {"train_loss": -6.175441741943359, "global_step": 83552, "epoch": 1989} {"train_loss": -6.1444621086120605, "global_step": 83553, "epoch": 1989} {"train_loss": -6.064233779907227, "global_step": 83554, "epoch": 1989} {"train_loss": -6.194535255432129, "global_step": 83555, "epoch": 1989} {"train_loss": -6.162402153015137, "global_step": 83556, "epoch": 1989} {"train_loss": -6.215583324432373, "global_step": 83557, "epoch": 1989} {"train_loss": -6.227377891540527, "global_step": 83558, "epoch": 1989} {"train_loss": -6.275796890258789, "global_step": 83559, "epoch": 1989} {"train_loss": -6.177867889404297, "global_step": 83560, "epoch": 1989} {"train_loss": -6.292140960693359, "global_step": 83561, "epoch": 1989} {"train_loss": -6.102365970611572, "global_step": 83562, "epoch": 1989} {"train_loss": -6.1961188316345215, "global_step": 83563, "epoch": 1989} {"train_loss": -6.374032497406006, "global_step": 83564, "epoch": 1989} {"train_loss": -6.2183003425598145, "global_step": 83565, "epoch": 1989} {"train_loss": -6.214030742645264, "global_step": 83566, "epoch": 1989} {"train_loss": -6.224259853363037, "global_step": 83567, "epoch": 1989} {"train_loss": -6.060644149780273, "global_step": 83568, "epoch": 1989} {"train_loss": -6.051702499389648, "global_step": 83569, "epoch": 1989} {"train_loss": -6.172738552093506, "global_step": 83570, "epoch": 1989} {"train_loss": -6.186222076416016, "global_step": 83571, "epoch": 1989} {"train_loss": -6.014679908752441, "global_step": 83572, "epoch": 1989} {"train_loss": -6.132458686828613, "global_step": 83573, "epoch": 1989} {"train_loss": -6.229936122894287, "global_step": 83574, "epoch": 1989} {"train_loss": -6.173708915710449, "global_step": 83575, "epoch": 1989} {"train_loss": -6.182989120483398, "global_step": 83576, "epoch": 1989} {"train_loss": -6.217175483703613, "global_step": 83577, "epoch": 1989} {"train_loss": -6.0826311111450195, "global_step": 83578, "epoch": 1989} {"train_loss": -6.168288140069871, "global_step": 83579, "epoch": 1989, "val_loss": 75202.5703125} {"train_loss": -6.243766784667969, "global_step": 83580, "epoch": 1990} {"train_loss": -6.20838737487793, "global_step": 83581, "epoch": 1990} {"train_loss": -6.083450794219971, "global_step": 83582, "epoch": 1990} {"train_loss": -6.161616325378418, "global_step": 83583, "epoch": 1990} {"train_loss": -6.201409816741943, "global_step": 83584, "epoch": 1990} {"train_loss": -6.03021240234375, "global_step": 83585, "epoch": 1990} {"train_loss": -6.193836212158203, "global_step": 83586, "epoch": 1990} {"train_loss": -6.191392421722412, "global_step": 83587, "epoch": 1990} {"train_loss": -6.00721549987793, "global_step": 83588, "epoch": 1990} {"train_loss": -6.142416954040527, "global_step": 83589, "epoch": 1990} {"train_loss": -6.089828968048096, "global_step": 83590, "epoch": 1990} {"train_loss": -6.0485124588012695, "global_step": 83591, "epoch": 1990} {"train_loss": -6.085393905639648, "global_step": 83592, "epoch": 1990} {"train_loss": -5.980807304382324, "global_step": 83593, "epoch": 1990} {"train_loss": -6.229686737060547, "global_step": 83594, "epoch": 1990} {"train_loss": -5.897664546966553, "global_step": 83595, "epoch": 1990} {"train_loss": -6.0587639808654785, "global_step": 83596, "epoch": 1990} {"train_loss": -6.08259916305542, "global_step": 83597, "epoch": 1990} {"train_loss": -5.924381256103516, "global_step": 83598, "epoch": 1990} {"train_loss": -6.024767875671387, "global_step": 83599, "epoch": 1990} {"train_loss": -6.187634468078613, "global_step": 83600, "epoch": 1990} {"train_loss": -6.1463422775268555, "global_step": 83601, "epoch": 1990} {"train_loss": -6.042050361633301, "global_step": 83602, "epoch": 1990} {"train_loss": -6.183824062347412, "global_step": 83603, "epoch": 1990} {"train_loss": -6.042363166809082, "global_step": 83604, "epoch": 1990} {"train_loss": -6.074974060058594, "global_step": 83605, "epoch": 1990} {"train_loss": -6.132724761962891, "global_step": 83606, "epoch": 1990} {"train_loss": -6.144176006317139, "global_step": 83607, "epoch": 1990} {"train_loss": -6.066155433654785, "global_step": 83608, "epoch": 1990} {"train_loss": -6.106109142303467, "global_step": 83609, "epoch": 1990} {"train_loss": -6.036805152893066, "global_step": 83610, "epoch": 1990} {"train_loss": -6.218821048736572, "global_step": 83611, "epoch": 1990} {"train_loss": -6.187319755554199, "global_step": 83612, "epoch": 1990} {"train_loss": -6.019449710845947, "global_step": 83613, "epoch": 1990} {"train_loss": -6.151304244995117, "global_step": 83614, "epoch": 1990} {"train_loss": -6.168814659118652, "global_step": 83615, "epoch": 1990} {"train_loss": -6.060144424438477, "global_step": 83616, "epoch": 1990} {"train_loss": -6.1159772872924805, "global_step": 83617, "epoch": 1990} {"train_loss": -6.288917064666748, "global_step": 83618, "epoch": 1990} {"train_loss": -6.2565765380859375, "global_step": 83619, "epoch": 1990} {"train_loss": -6.1393585205078125, "global_step": 83620, "epoch": 1990} {"train_loss": -6.117972873506092, "global_step": 83621, "epoch": 1990, "val_loss": 75274.78125} {"train_loss": -6.169749736785889, "global_step": 83622, "epoch": 1991} {"train_loss": -6.2166643142700195, "global_step": 83623, "epoch": 1991} {"train_loss": -6.155887603759766, "global_step": 83624, "epoch": 1991} {"train_loss": -6.170934677124023, "global_step": 83625, "epoch": 1991} {"train_loss": -6.118494033813477, "global_step": 83626, "epoch": 1991} {"train_loss": -6.263692855834961, "global_step": 83627, "epoch": 1991} {"train_loss": -6.1673583984375, "global_step": 83628, "epoch": 1991} {"train_loss": -6.330312728881836, "global_step": 83629, "epoch": 1991} {"train_loss": -6.056114196777344, "global_step": 83630, "epoch": 1991} {"train_loss": -6.1272735595703125, "global_step": 83631, "epoch": 1991} {"train_loss": -6.051994323730469, "global_step": 83632, "epoch": 1991} {"train_loss": -6.204914569854736, "global_step": 83633, "epoch": 1991} {"train_loss": -6.081288814544678, "global_step": 83634, "epoch": 1991} {"train_loss": -6.205290794372559, "global_step": 83635, "epoch": 1991} {"train_loss": -6.160492897033691, "global_step": 83636, "epoch": 1991} {"train_loss": -6.32476282119751, "global_step": 83637, "epoch": 1991} {"train_loss": -6.2046308517456055, "global_step": 83638, "epoch": 1991} {"train_loss": -6.1587233543396, "global_step": 83639, "epoch": 1991} {"train_loss": -6.119753837585449, "global_step": 83640, "epoch": 1991} {"train_loss": -6.30933952331543, "global_step": 83641, "epoch": 1991} {"train_loss": -6.136486053466797, "global_step": 83642, "epoch": 1991} {"train_loss": -6.245418548583984, "global_step": 83643, "epoch": 1991} {"train_loss": -6.305689811706543, "global_step": 83644, "epoch": 1991} {"train_loss": -6.138127326965332, "global_step": 83645, "epoch": 1991} {"train_loss": -6.184242248535156, "global_step": 83646, "epoch": 1991} {"train_loss": -6.197347164154053, "global_step": 83647, "epoch": 1991} {"train_loss": -6.192789077758789, "global_step": 83648, "epoch": 1991} {"train_loss": -6.21311092376709, "global_step": 83649, "epoch": 1991} {"train_loss": -6.258274078369141, "global_step": 83650, "epoch": 1991} {"train_loss": -6.260929107666016, "global_step": 83651, "epoch": 1991} {"train_loss": -6.120391368865967, "global_step": 83652, "epoch": 1991} {"train_loss": -6.225754261016846, "global_step": 83653, "epoch": 1991} {"train_loss": -6.223521709442139, "global_step": 83654, "epoch": 1991} {"train_loss": -6.100150108337402, "global_step": 83655, "epoch": 1991} {"train_loss": -6.159960746765137, "global_step": 83656, "epoch": 1991} {"train_loss": -6.167706489562988, "global_step": 83657, "epoch": 1991} {"train_loss": -6.03184700012207, "global_step": 83658, "epoch": 1991} {"train_loss": -6.216670513153076, "global_step": 83659, "epoch": 1991} {"train_loss": -6.071942329406738, "global_step": 83660, "epoch": 1991} {"train_loss": -6.082692623138428, "global_step": 83661, "epoch": 1991} {"train_loss": -6.208966255187988, "global_step": 83662, "epoch": 1991} {"train_loss": -6.17848937852042, "global_step": 83663, "epoch": 1991, "val_loss": 75309.6953125} {"train_loss": -6.146047592163086, "global_step": 83664, "epoch": 1992} {"train_loss": -6.039996147155762, "global_step": 83665, "epoch": 1992} {"train_loss": -6.127730369567871, "global_step": 83666, "epoch": 1992} {"train_loss": -6.245243072509766, "global_step": 83667, "epoch": 1992} {"train_loss": -6.063498020172119, "global_step": 83668, "epoch": 1992} {"train_loss": -6.198076248168945, "global_step": 83669, "epoch": 1992} {"train_loss": -6.204715728759766, "global_step": 83670, "epoch": 1992} {"train_loss": -6.220331192016602, "global_step": 83671, "epoch": 1992} {"train_loss": -6.117730617523193, "global_step": 83672, "epoch": 1992} {"train_loss": -6.151989459991455, "global_step": 83673, "epoch": 1992} {"train_loss": -6.085817813873291, "global_step": 83674, "epoch": 1992} {"train_loss": -6.162447929382324, "global_step": 83675, "epoch": 1992} {"train_loss": -6.176535606384277, "global_step": 83676, "epoch": 1992} {"train_loss": -6.140018463134766, "global_step": 83677, "epoch": 1992} {"train_loss": -6.189507484436035, "global_step": 83678, "epoch": 1992} {"train_loss": -6.136268138885498, "global_step": 83679, "epoch": 1992} {"train_loss": -6.136685848236084, "global_step": 83680, "epoch": 1992} {"train_loss": -6.270662784576416, "global_step": 83681, "epoch": 1992} {"train_loss": -6.121692657470703, "global_step": 83682, "epoch": 1992} {"train_loss": -6.1576385498046875, "global_step": 83683, "epoch": 1992} {"train_loss": -6.189340591430664, "global_step": 83684, "epoch": 1992} {"train_loss": -6.227484703063965, "global_step": 83685, "epoch": 1992} {"train_loss": -6.078316688537598, "global_step": 83686, "epoch": 1992} {"train_loss": -6.227332592010498, "global_step": 83687, "epoch": 1992} {"train_loss": -6.059085369110107, "global_step": 83688, "epoch": 1992} {"train_loss": -6.144353866577148, "global_step": 83689, "epoch": 1992} {"train_loss": -6.179430961608887, "global_step": 83690, "epoch": 1992} {"train_loss": -6.179924964904785, "global_step": 83691, "epoch": 1992} {"train_loss": -6.137503623962402, "global_step": 83692, "epoch": 1992} {"train_loss": -6.25545072555542, "global_step": 83693, "epoch": 1992} {"train_loss": -6.205849647521973, "global_step": 83694, "epoch": 1992} {"train_loss": -6.16409969329834, "global_step": 83695, "epoch": 1992} {"train_loss": -6.280228137969971, "global_step": 83696, "epoch": 1992} {"train_loss": -6.132784843444824, "global_step": 83697, "epoch": 1992} {"train_loss": -6.26002311706543, "global_step": 83698, "epoch": 1992} {"train_loss": -6.223982810974121, "global_step": 83699, "epoch": 1992} {"train_loss": -6.164936065673828, "global_step": 83700, "epoch": 1992} {"train_loss": -6.134407997131348, "global_step": 83701, "epoch": 1992} {"train_loss": -6.193426132202148, "global_step": 83702, "epoch": 1992} {"train_loss": -6.1415839195251465, "global_step": 83703, "epoch": 1992} {"train_loss": -6.176118850708008, "global_step": 83704, "epoch": 1992} {"train_loss": -6.167649530229115, "global_step": 83705, "epoch": 1992, "val_loss": 74788.4375} {"train_loss": -6.210638046264648, "global_step": 83706, "epoch": 1993} {"train_loss": -6.062356948852539, "global_step": 83707, "epoch": 1993} {"train_loss": -6.209017753601074, "global_step": 83708, "epoch": 1993} {"train_loss": -6.135550498962402, "global_step": 83709, "epoch": 1993} {"train_loss": -6.046596050262451, "global_step": 83710, "epoch": 1993} {"train_loss": -6.103668212890625, "global_step": 83711, "epoch": 1993} {"train_loss": -6.1986894607543945, "global_step": 83712, "epoch": 1993} {"train_loss": -6.126845359802246, "global_step": 83713, "epoch": 1993} {"train_loss": -6.162838935852051, "global_step": 83714, "epoch": 1993} {"train_loss": -6.186408996582031, "global_step": 83715, "epoch": 1993} {"train_loss": -6.190011978149414, "global_step": 83716, "epoch": 1993} {"train_loss": -6.209829807281494, "global_step": 83717, "epoch": 1993} {"train_loss": -6.104565620422363, "global_step": 83718, "epoch": 1993} {"train_loss": -6.246998310089111, "global_step": 83719, "epoch": 1993} {"train_loss": -6.216299057006836, "global_step": 83720, "epoch": 1993} {"train_loss": -6.178097724914551, "global_step": 83721, "epoch": 1993} {"train_loss": -6.159513473510742, "global_step": 83722, "epoch": 1993} {"train_loss": -6.3084821701049805, "global_step": 83723, "epoch": 1993} {"train_loss": -6.239977836608887, "global_step": 83724, "epoch": 1993} {"train_loss": -6.065431594848633, "global_step": 83725, "epoch": 1993} {"train_loss": -6.282987594604492, "global_step": 83726, "epoch": 1993} {"train_loss": -6.0587005615234375, "global_step": 83727, "epoch": 1993} {"train_loss": -6.1093316078186035, "global_step": 83728, "epoch": 1993} {"train_loss": -6.263136863708496, "global_step": 83729, "epoch": 1993} {"train_loss": -6.144867420196533, "global_step": 83730, "epoch": 1993} {"train_loss": -6.243927955627441, "global_step": 83731, "epoch": 1993} {"train_loss": -6.17222785949707, "global_step": 83732, "epoch": 1993} {"train_loss": -6.1378607749938965, "global_step": 83733, "epoch": 1993} {"train_loss": -6.072126865386963, "global_step": 83734, "epoch": 1993} {"train_loss": -6.1838483810424805, "global_step": 83735, "epoch": 1993} {"train_loss": -6.141632556915283, "global_step": 83736, "epoch": 1993} {"train_loss": -6.271969795227051, "global_step": 83737, "epoch": 1993} {"train_loss": -6.130193710327148, "global_step": 83738, "epoch": 1993} {"train_loss": -6.153592109680176, "global_step": 83739, "epoch": 1993} {"train_loss": -6.193130970001221, "global_step": 83740, "epoch": 1993} {"train_loss": -6.059510707855225, "global_step": 83741, "epoch": 1993} {"train_loss": -6.245414733886719, "global_step": 83742, "epoch": 1993} {"train_loss": -6.22266960144043, "global_step": 83743, "epoch": 1993} {"train_loss": -6.169658660888672, "global_step": 83744, "epoch": 1993} {"train_loss": -6.06429386138916, "global_step": 83745, "epoch": 1993} {"train_loss": -6.128311634063721, "global_step": 83746, "epoch": 1993} {"train_loss": -6.167705388296218, "global_step": 83747, "epoch": 1993, "val_loss": 75234.671875} {"train_loss": -6.147525787353516, "global_step": 83748, "epoch": 1994} {"train_loss": -6.241504192352295, "global_step": 83749, "epoch": 1994} {"train_loss": -6.189968109130859, "global_step": 83750, "epoch": 1994} {"train_loss": -6.16834831237793, "global_step": 83751, "epoch": 1994} {"train_loss": -6.149049758911133, "global_step": 83752, "epoch": 1994} {"train_loss": -6.133265495300293, "global_step": 83753, "epoch": 1994} {"train_loss": -6.2245774269104, "global_step": 83754, "epoch": 1994} {"train_loss": -6.117090702056885, "global_step": 83755, "epoch": 1994} {"train_loss": -6.13746976852417, "global_step": 83756, "epoch": 1994} {"train_loss": -6.165620803833008, "global_step": 83757, "epoch": 1994} {"train_loss": -6.171881198883057, "global_step": 83758, "epoch": 1994} {"train_loss": -6.215489387512207, "global_step": 83759, "epoch": 1994} {"train_loss": -6.216266632080078, "global_step": 83760, "epoch": 1994} {"train_loss": -6.092329025268555, "global_step": 83761, "epoch": 1994} {"train_loss": -6.199359893798828, "global_step": 83762, "epoch": 1994} {"train_loss": -6.19326114654541, "global_step": 83763, "epoch": 1994} {"train_loss": -6.172876834869385, "global_step": 83764, "epoch": 1994} {"train_loss": -6.157076835632324, "global_step": 83765, "epoch": 1994} {"train_loss": -6.168682098388672, "global_step": 83766, "epoch": 1994} {"train_loss": -6.025021553039551, "global_step": 83767, "epoch": 1994} {"train_loss": -6.167996406555176, "global_step": 83768, "epoch": 1994} {"train_loss": -6.241086959838867, "global_step": 83769, "epoch": 1994} {"train_loss": -6.195318698883057, "global_step": 83770, "epoch": 1994} {"train_loss": -6.307442665100098, "global_step": 83771, "epoch": 1994} {"train_loss": -6.196115493774414, "global_step": 83772, "epoch": 1994} {"train_loss": -6.130676746368408, "global_step": 83773, "epoch": 1994} {"train_loss": -6.1454644203186035, "global_step": 83774, "epoch": 1994} {"train_loss": -6.210735321044922, "global_step": 83775, "epoch": 1994} {"train_loss": -6.296998977661133, "global_step": 83776, "epoch": 1994} {"train_loss": -6.094611167907715, "global_step": 83777, "epoch": 1994} {"train_loss": -6.201208591461182, "global_step": 83778, "epoch": 1994} {"train_loss": -6.169839859008789, "global_step": 83779, "epoch": 1994} {"train_loss": -6.2522501945495605, "global_step": 83780, "epoch": 1994} {"train_loss": -6.207887649536133, "global_step": 83781, "epoch": 1994} {"train_loss": -6.101980209350586, "global_step": 83782, "epoch": 1994} {"train_loss": -6.326563835144043, "global_step": 83783, "epoch": 1994} {"train_loss": -6.276227951049805, "global_step": 83784, "epoch": 1994} {"train_loss": -6.134906768798828, "global_step": 83785, "epoch": 1994} {"train_loss": -6.200571060180664, "global_step": 83786, "epoch": 1994} {"train_loss": -6.249118804931641, "global_step": 83787, "epoch": 1994} {"train_loss": -6.1964616775512695, "global_step": 83788, "epoch": 1994} {"train_loss": -6.184325138727824, "global_step": 83789, "epoch": 1994, "val_loss": 74922.359375} {"train_loss": -6.259577751159668, "global_step": 83790, "epoch": 1995} {"train_loss": -6.2981719970703125, "global_step": 83791, "epoch": 1995} {"train_loss": -6.1112060546875, "global_step": 83792, "epoch": 1995} {"train_loss": -6.218216896057129, "global_step": 83793, "epoch": 1995} {"train_loss": -6.267952919006348, "global_step": 83794, "epoch": 1995} {"train_loss": -6.192576885223389, "global_step": 83795, "epoch": 1995} {"train_loss": -6.168648719787598, "global_step": 83796, "epoch": 1995} {"train_loss": -6.1041669845581055, "global_step": 83797, "epoch": 1995} {"train_loss": -6.231504917144775, "global_step": 83798, "epoch": 1995} {"train_loss": -6.17405891418457, "global_step": 83799, "epoch": 1995} {"train_loss": -6.182515621185303, "global_step": 83800, "epoch": 1995} {"train_loss": -6.2046074867248535, "global_step": 83801, "epoch": 1995} {"train_loss": -6.243782043457031, "global_step": 83802, "epoch": 1995} {"train_loss": -6.1419572830200195, "global_step": 83803, "epoch": 1995} {"train_loss": -6.263745307922363, "global_step": 83804, "epoch": 1995} {"train_loss": -6.161322116851807, "global_step": 83805, "epoch": 1995} {"train_loss": -6.131706237792969, "global_step": 83806, "epoch": 1995} {"train_loss": -6.18463659286499, "global_step": 83807, "epoch": 1995} {"train_loss": -6.158965110778809, "global_step": 83808, "epoch": 1995} {"train_loss": -6.377418518066406, "global_step": 83809, "epoch": 1995} {"train_loss": -6.161995887756348, "global_step": 83810, "epoch": 1995} {"train_loss": -6.280156135559082, "global_step": 83811, "epoch": 1995} {"train_loss": -6.210931301116943, "global_step": 83812, "epoch": 1995} {"train_loss": -6.286029815673828, "global_step": 83813, "epoch": 1995} {"train_loss": -6.240289688110352, "global_step": 83814, "epoch": 1995} {"train_loss": -6.204836845397949, "global_step": 83815, "epoch": 1995} {"train_loss": -6.1344804763793945, "global_step": 83816, "epoch": 1995} {"train_loss": -6.212118625640869, "global_step": 83817, "epoch": 1995} {"train_loss": -6.245151519775391, "global_step": 83818, "epoch": 1995} {"train_loss": -6.1738457679748535, "global_step": 83819, "epoch": 1995} {"train_loss": -6.074759006500244, "global_step": 83820, "epoch": 1995} {"train_loss": -6.175877094268799, "global_step": 83821, "epoch": 1995} {"train_loss": -6.200521469116211, "global_step": 83822, "epoch": 1995} {"train_loss": -6.14168643951416, "global_step": 83823, "epoch": 1995} {"train_loss": -6.170100212097168, "global_step": 83824, "epoch": 1995} {"train_loss": -6.1336469650268555, "global_step": 83825, "epoch": 1995} {"train_loss": -6.158696174621582, "global_step": 83826, "epoch": 1995} {"train_loss": -6.146556854248047, "global_step": 83827, "epoch": 1995} {"train_loss": -6.154840469360352, "global_step": 83828, "epoch": 1995} {"train_loss": -6.198215484619141, "global_step": 83829, "epoch": 1995} {"train_loss": -6.032628059387207, "global_step": 83830, "epoch": 1995} {"train_loss": -6.191237472352528, "global_step": 83831, "epoch": 1995, "val_loss": 75043.109375} {"train_loss": -6.235063076019287, "global_step": 83832, "epoch": 1996} {"train_loss": -6.187760353088379, "global_step": 83833, "epoch": 1996} {"train_loss": -6.156897068023682, "global_step": 83834, "epoch": 1996} {"train_loss": -6.127803325653076, "global_step": 83835, "epoch": 1996} {"train_loss": -6.159328460693359, "global_step": 83836, "epoch": 1996} {"train_loss": -6.120607852935791, "global_step": 83837, "epoch": 1996} {"train_loss": -6.15192985534668, "global_step": 83838, "epoch": 1996} {"train_loss": -6.218127250671387, "global_step": 83839, "epoch": 1996} {"train_loss": -6.1234893798828125, "global_step": 83840, "epoch": 1996} {"train_loss": -6.102837085723877, "global_step": 83841, "epoch": 1996} {"train_loss": -6.184947490692139, "global_step": 83842, "epoch": 1996} {"train_loss": -6.164280891418457, "global_step": 83843, "epoch": 1996} {"train_loss": -6.133458137512207, "global_step": 83844, "epoch": 1996} {"train_loss": -6.170173645019531, "global_step": 83845, "epoch": 1996} {"train_loss": -6.239107131958008, "global_step": 83846, "epoch": 1996} {"train_loss": -6.117942810058594, "global_step": 83847, "epoch": 1996} {"train_loss": -6.19147253036499, "global_step": 83848, "epoch": 1996} {"train_loss": -6.2230987548828125, "global_step": 83849, "epoch": 1996} {"train_loss": -6.215000152587891, "global_step": 83850, "epoch": 1996} {"train_loss": -6.216732978820801, "global_step": 83851, "epoch": 1996} {"train_loss": -6.200605392456055, "global_step": 83852, "epoch": 1996} {"train_loss": -6.279028415679932, "global_step": 83853, "epoch": 1996} {"train_loss": -6.246247291564941, "global_step": 83854, "epoch": 1996} {"train_loss": -6.168156623840332, "global_step": 83855, "epoch": 1996} {"train_loss": -6.1602678298950195, "global_step": 83856, "epoch": 1996} {"train_loss": -6.270473957061768, "global_step": 83857, "epoch": 1996} {"train_loss": -6.121288299560547, "global_step": 83858, "epoch": 1996} {"train_loss": -6.11568546295166, "global_step": 83859, "epoch": 1996} {"train_loss": -6.231771469116211, "global_step": 83860, "epoch": 1996} {"train_loss": -6.131082534790039, "global_step": 83861, "epoch": 1996} {"train_loss": -6.176501750946045, "global_step": 83862, "epoch": 1996} {"train_loss": -6.19671630859375, "global_step": 83863, "epoch": 1996} {"train_loss": -6.190361976623535, "global_step": 83864, "epoch": 1996} {"train_loss": -6.22226619720459, "global_step": 83865, "epoch": 1996} {"train_loss": -6.1708173751831055, "global_step": 83866, "epoch": 1996} {"train_loss": -6.150300025939941, "global_step": 83867, "epoch": 1996} {"train_loss": -6.11232852935791, "global_step": 83868, "epoch": 1996} {"train_loss": -6.092545509338379, "global_step": 83869, "epoch": 1996} {"train_loss": -6.136762619018555, "global_step": 83870, "epoch": 1996} {"train_loss": -6.069925308227539, "global_step": 83871, "epoch": 1996} {"train_loss": -6.142436981201172, "global_step": 83872, "epoch": 1996} {"train_loss": -6.168753317424229, "global_step": 83873, "epoch": 1996, "val_loss": 75559.7578125} {"train_loss": -5.926818370819092, "global_step": 83874, "epoch": 1997} {"train_loss": -6.194948673248291, "global_step": 83875, "epoch": 1997} {"train_loss": -6.075068473815918, "global_step": 83876, "epoch": 1997} {"train_loss": -6.192519664764404, "global_step": 83877, "epoch": 1997} {"train_loss": -6.11756706237793, "global_step": 83878, "epoch": 1997} {"train_loss": -6.2367095947265625, "global_step": 83879, "epoch": 1997} {"train_loss": -6.099851608276367, "global_step": 83880, "epoch": 1997} {"train_loss": -6.206966400146484, "global_step": 83881, "epoch": 1997} {"train_loss": -6.199319839477539, "global_step": 83882, "epoch": 1997} {"train_loss": -6.119623184204102, "global_step": 83883, "epoch": 1997} {"train_loss": -6.210953712463379, "global_step": 83884, "epoch": 1997} {"train_loss": -6.24606466293335, "global_step": 83885, "epoch": 1997} {"train_loss": -6.128814697265625, "global_step": 83886, "epoch": 1997} {"train_loss": -6.177088737487793, "global_step": 83887, "epoch": 1997} {"train_loss": -6.1678290367126465, "global_step": 83888, "epoch": 1997} {"train_loss": -6.135724067687988, "global_step": 83889, "epoch": 1997} {"train_loss": -6.25015926361084, "global_step": 83890, "epoch": 1997} {"train_loss": -6.090246200561523, "global_step": 83891, "epoch": 1997} {"train_loss": -6.271228790283203, "global_step": 83892, "epoch": 1997} {"train_loss": -6.145875930786133, "global_step": 83893, "epoch": 1997} {"train_loss": -6.257124900817871, "global_step": 83894, "epoch": 1997} {"train_loss": -6.225530624389648, "global_step": 83895, "epoch": 1997} {"train_loss": -6.232178688049316, "global_step": 83896, "epoch": 1997} {"train_loss": -6.213335037231445, "global_step": 83897, "epoch": 1997} {"train_loss": -6.247627258300781, "global_step": 83898, "epoch": 1997} {"train_loss": -6.159846782684326, "global_step": 83899, "epoch": 1997} {"train_loss": -6.367201805114746, "global_step": 83900, "epoch": 1997} {"train_loss": -6.178129196166992, "global_step": 83901, "epoch": 1997} {"train_loss": -6.212802886962891, "global_step": 83902, "epoch": 1997} {"train_loss": -6.1955976486206055, "global_step": 83903, "epoch": 1997} {"train_loss": -6.161723613739014, "global_step": 83904, "epoch": 1997} {"train_loss": -6.120913505554199, "global_step": 83905, "epoch": 1997} {"train_loss": -6.1084489822387695, "global_step": 83906, "epoch": 1997} {"train_loss": -6.084141731262207, "global_step": 83907, "epoch": 1997} {"train_loss": -6.1122822761535645, "global_step": 83908, "epoch": 1997} {"train_loss": -6.126911163330078, "global_step": 83909, "epoch": 1997} {"train_loss": -6.3114519119262695, "global_step": 83910, "epoch": 1997} {"train_loss": -6.156972885131836, "global_step": 83911, "epoch": 1997} {"train_loss": -6.034200668334961, "global_step": 83912, "epoch": 1997} {"train_loss": -6.145876884460449, "global_step": 83913, "epoch": 1997} {"train_loss": -6.291017532348633, "global_step": 83914, "epoch": 1997} {"train_loss": -6.1741750580923895, "global_step": 83915, "epoch": 1997, "val_loss": 75082.5390625} {"train_loss": -6.140791893005371, "global_step": 83916, "epoch": 1998} {"train_loss": -6.266587257385254, "global_step": 83917, "epoch": 1998} {"train_loss": -6.122453689575195, "global_step": 83918, "epoch": 1998} {"train_loss": -6.2358903884887695, "global_step": 83919, "epoch": 1998} {"train_loss": -6.1523237228393555, "global_step": 83920, "epoch": 1998} {"train_loss": -6.082695007324219, "global_step": 83921, "epoch": 1998} {"train_loss": -6.1486358642578125, "global_step": 83922, "epoch": 1998} {"train_loss": -6.068780899047852, "global_step": 83923, "epoch": 1998} {"train_loss": -6.230798721313477, "global_step": 83924, "epoch": 1998} {"train_loss": -6.1172637939453125, "global_step": 83925, "epoch": 1998} {"train_loss": -6.169582366943359, "global_step": 83926, "epoch": 1998} {"train_loss": -6.248955726623535, "global_step": 83927, "epoch": 1998} {"train_loss": -6.181146621704102, "global_step": 83928, "epoch": 1998} {"train_loss": -6.094226837158203, "global_step": 83929, "epoch": 1998} {"train_loss": -6.09716272354126, "global_step": 83930, "epoch": 1998} {"train_loss": -6.078113555908203, "global_step": 83931, "epoch": 1998} {"train_loss": -6.177819728851318, "global_step": 83932, "epoch": 1998} {"train_loss": -6.142467021942139, "global_step": 83933, "epoch": 1998} {"train_loss": -6.251228332519531, "global_step": 83934, "epoch": 1998} {"train_loss": -6.1708455085754395, "global_step": 83935, "epoch": 1998} {"train_loss": -6.015722751617432, "global_step": 83936, "epoch": 1998} {"train_loss": -6.067277431488037, "global_step": 83937, "epoch": 1998} {"train_loss": -6.217865943908691, "global_step": 83938, "epoch": 1998} {"train_loss": -6.187958717346191, "global_step": 83939, "epoch": 1998} {"train_loss": -6.053670406341553, "global_step": 83940, "epoch": 1998} {"train_loss": -6.050245761871338, "global_step": 83941, "epoch": 1998} {"train_loss": -6.268586158752441, "global_step": 83942, "epoch": 1998} {"train_loss": -6.087125778198242, "global_step": 83943, "epoch": 1998} {"train_loss": -6.170490264892578, "global_step": 83944, "epoch": 1998} {"train_loss": -6.21579647064209, "global_step": 83945, "epoch": 1998} {"train_loss": -6.09332275390625, "global_step": 83946, "epoch": 1998} {"train_loss": -6.103662490844727, "global_step": 83947, "epoch": 1998} {"train_loss": -6.238308429718018, "global_step": 83948, "epoch": 1998} {"train_loss": -6.153903007507324, "global_step": 83949, "epoch": 1998} {"train_loss": -6.168002128601074, "global_step": 83950, "epoch": 1998} {"train_loss": -6.181840896606445, "global_step": 83951, "epoch": 1998} {"train_loss": -6.238472938537598, "global_step": 83952, "epoch": 1998} {"train_loss": -6.197315216064453, "global_step": 83953, "epoch": 1998} {"train_loss": -6.249914646148682, "global_step": 83954, "epoch": 1998} {"train_loss": -6.166507720947266, "global_step": 83955, "epoch": 1998} {"train_loss": -6.279490947723389, "global_step": 83956, "epoch": 1998} {"train_loss": -6.16480142729623, "global_step": 83957, "epoch": 1998, "val_loss": 75371.7109375} {"train_loss": -6.275718688964844, "global_step": 83958, "epoch": 1999} {"train_loss": -6.054000377655029, "global_step": 83959, "epoch": 1999} {"train_loss": -6.12404727935791, "global_step": 83960, "epoch": 1999} {"train_loss": -6.1847453117370605, "global_step": 83961, "epoch": 1999} {"train_loss": -6.033918857574463, "global_step": 83962, "epoch": 1999} {"train_loss": -6.232662677764893, "global_step": 83963, "epoch": 1999} {"train_loss": -6.240907192230225, "global_step": 83964, "epoch": 1999} {"train_loss": -6.020805358886719, "global_step": 83965, "epoch": 1999} {"train_loss": -6.089683532714844, "global_step": 83966, "epoch": 1999} {"train_loss": -6.100509166717529, "global_step": 83967, "epoch": 1999} {"train_loss": -6.1874895095825195, "global_step": 83968, "epoch": 1999} {"train_loss": -6.229750633239746, "global_step": 83969, "epoch": 1999} {"train_loss": -6.239782333374023, "global_step": 83970, "epoch": 1999} {"train_loss": -6.1289591789245605, "global_step": 83971, "epoch": 1999} {"train_loss": -6.180659294128418, "global_step": 83972, "epoch": 1999} {"train_loss": -6.143234729766846, "global_step": 83973, "epoch": 1999} {"train_loss": -6.207932949066162, "global_step": 83974, "epoch": 1999} {"train_loss": -6.105646133422852, "global_step": 83975, "epoch": 1999} {"train_loss": -6.2203192710876465, "global_step": 83976, "epoch": 1999} {"train_loss": -6.199080467224121, "global_step": 83977, "epoch": 1999} {"train_loss": -6.100822448730469, "global_step": 83978, "epoch": 1999} {"train_loss": -6.170658111572266, "global_step": 83979, "epoch": 1999} {"train_loss": -6.173340797424316, "global_step": 83980, "epoch": 1999} {"train_loss": -6.124820709228516, "global_step": 83981, "epoch": 1999} {"train_loss": -6.294259548187256, "global_step": 83982, "epoch": 1999} {"train_loss": -6.173325538635254, "global_step": 83983, "epoch": 1999} {"train_loss": -6.174022674560547, "global_step": 83984, "epoch": 1999} {"train_loss": -6.236083507537842, "global_step": 83985, "epoch": 1999} {"train_loss": -6.128407955169678, "global_step": 83986, "epoch": 1999} {"train_loss": -6.219345569610596, "global_step": 83987, "epoch": 1999} {"train_loss": -6.164402961730957, "global_step": 83988, "epoch": 1999} {"train_loss": -6.218690872192383, "global_step": 83989, "epoch": 1999} {"train_loss": -6.241067886352539, "global_step": 83990, "epoch": 1999} {"train_loss": -6.280901908874512, "global_step": 83991, "epoch": 1999} {"train_loss": -6.126270294189453, "global_step": 83992, "epoch": 1999} {"train_loss": -6.12429666519165, "global_step": 83993, "epoch": 1999} {"train_loss": -6.13778829574585, "global_step": 83994, "epoch": 1999} {"train_loss": -6.180974960327148, "global_step": 83995, "epoch": 1999} {"train_loss": -6.057345390319824, "global_step": 83996, "epoch": 1999} {"train_loss": -6.217672348022461, "global_step": 83997, "epoch": 1999} {"train_loss": -6.233657360076904, "global_step": 83998, "epoch": 1999} {"train_loss": -6.170049338113694, "global_step": 83999, "epoch": 1999, "val_loss": 75005.46875} {"train_loss": -6.167606830596924, "global_step": 84000, "epoch": 2000} {"train_loss": -6.2660627365112305, "global_step": 84001, "epoch": 2000} {"train_loss": -6.177395820617676, "global_step": 84002, "epoch": 2000} {"train_loss": -6.2390923500061035, "global_step": 84003, "epoch": 2000} {"train_loss": -6.112804889678955, "global_step": 84004, "epoch": 2000} {"train_loss": -6.18394660949707, "global_step": 84005, "epoch": 2000} {"train_loss": -6.169212818145752, "global_step": 84006, "epoch": 2000} {"train_loss": -6.127790451049805, "global_step": 84007, "epoch": 2000} {"train_loss": -6.234147071838379, "global_step": 84008, "epoch": 2000} {"train_loss": -6.190312385559082, "global_step": 84009, "epoch": 2000} {"train_loss": -6.104001045227051, "global_step": 84010, "epoch": 2000} {"train_loss": -6.116443157196045, "global_step": 84011, "epoch": 2000} {"train_loss": -6.1204071044921875, "global_step": 84012, "epoch": 2000} {"train_loss": -6.178224563598633, "global_step": 84013, "epoch": 2000} {"train_loss": -6.158414840698242, "global_step": 84014, "epoch": 2000} {"train_loss": -6.176089763641357, "global_step": 84015, "epoch": 2000} {"train_loss": -6.218448638916016, "global_step": 84016, "epoch": 2000} {"train_loss": -6.232834815979004, "global_step": 84017, "epoch": 2000} {"train_loss": -6.151459217071533, "global_step": 84018, "epoch": 2000} {"train_loss": -6.278348922729492, "global_step": 84019, "epoch": 2000} {"train_loss": -6.2116923332214355, "global_step": 84020, "epoch": 2000} {"train_loss": -6.304347038269043, "global_step": 84021, "epoch": 2000} {"train_loss": -6.175094127655029, "global_step": 84022, "epoch": 2000} {"train_loss": -6.2184600830078125, "global_step": 84023, "epoch": 2000} {"train_loss": -6.226256370544434, "global_step": 84024, "epoch": 2000} {"train_loss": -6.194052696228027, "global_step": 84025, "epoch": 2000} {"train_loss": -6.11472749710083, "global_step": 84026, "epoch": 2000} {"train_loss": -6.2612433433532715, "global_step": 84027, "epoch": 2000} {"train_loss": -6.271848678588867, "global_step": 84028, "epoch": 2000} {"train_loss": -6.20472526550293, "global_step": 84029, "epoch": 2000} {"train_loss": -6.145800590515137, "global_step": 84030, "epoch": 2000} {"train_loss": -6.110506057739258, "global_step": 84031, "epoch": 2000} {"train_loss": -6.178283214569092, "global_step": 84032, "epoch": 2000} {"train_loss": -6.223424911499023, "global_step": 84033, "epoch": 2000} {"train_loss": -6.128852844238281, "global_step": 84034, "epoch": 2000} {"train_loss": -6.308524131774902, "global_step": 84035, "epoch": 2000} {"train_loss": -6.226580619812012, "global_step": 84036, "epoch": 2000} {"train_loss": -6.232985496520996, "global_step": 84037, "epoch": 2000} {"train_loss": -6.112320899963379, "global_step": 84038, "epoch": 2000} {"train_loss": -6.150177001953125, "global_step": 84039, "epoch": 2000} {"train_loss": -6.220612049102783, "global_step": 84040, "epoch": 2000} {"train_loss": -6.191892930439541, "global_step": 84041, "epoch": 2000, "train/sim_max_reward_0": 0.6521044650969328, "train/sim_max_reward_1": 0.6582398359471862, "train/sim_max_reward_2": 0.5563016168861807, "train/sim_max_reward_3": 0.14872255286270988, "train/sim_max_reward_4": 0.6541251163201505, "train/sim_max_reward_5": 0.9804467605587772, "test/sim_max_reward_4500000": 0.3250776170251892, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9192845192517006, "test/sim_max_reward_4500003": 0.7482551836054759, "test/sim_max_reward_4500004": 0.6189387672649593, "test/sim_max_reward_4500005": 0.23015284625442092, "test/sim_max_reward_4500006": 0.9289518619643329, "test/sim_max_reward_4500007": 0.8901549579918031, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.9407327960064444, "test/sim_max_reward_4500010": 0.9239876778589103, "test/sim_max_reward_4500011": 0.34042976898190175, "test/sim_max_reward_4500012": 0.8885168574429249, "test/sim_max_reward_4500013": 0.0003211241517190338, "test/sim_max_reward_4500014": 0.3809570775798933, "test/sim_max_reward_4500015": 0.9174555809896083, "test/sim_max_reward_4500016": 0.43804114316692994, "test/sim_max_reward_4500017": 0.04436094859612656, "test/sim_max_reward_4500018": 0.40256054067259617, "test/sim_max_reward_4500019": 0.8605725546465963, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9026899478200981, "test/sim_max_reward_4500022": 0.8313242699016856, "test/sim_max_reward_4500023": 0.7490889285850819, "test/sim_max_reward_4500024": 1.0, "test/sim_max_reward_4500025": 0.6058668467998312, "test/sim_max_reward_4500026": 0.9784676965893466, "test/sim_max_reward_4500027": 0.6428304063857896, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.10458975399139035, "test/sim_max_reward_4500030": 0.9113295100381219, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.41843683698091955, "test/sim_max_reward_4500033": 0.9968096309160549, "test/sim_max_reward_4500034": 0.7833745348134449, "test/sim_max_reward_4500035": 0.6642219126938335, "test/sim_max_reward_4500036": 0.9001146893228876, "test/sim_max_reward_4500037": 0.927165596120162, "test/sim_max_reward_4500038": 0.29785196181419693, "test/sim_max_reward_4500039": 0.0, "test/sim_max_reward_4500040": 0.606464932011878, "test/sim_max_reward_4500041": 0.9417830038819924, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.015169172486534595, "test/sim_max_reward_4500045": 0.39363584089160847, "test/sim_max_reward_4500046": 0.700571510654767, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6083233912786562, "test/mean_score": 0.5276231182807583, "val_loss": 75205.8515625} {"train_loss": -6.227611541748047, "global_step": 84042, "epoch": 2001} {"train_loss": -6.336517333984375, "global_step": 84043, "epoch": 2001} {"train_loss": -6.1727294921875, "global_step": 84044, "epoch": 2001} {"train_loss": -6.168837547302246, "global_step": 84045, "epoch": 2001} {"train_loss": -6.268378734588623, "global_step": 84046, "epoch": 2001} {"train_loss": -6.247272491455078, "global_step": 84047, "epoch": 2001} {"train_loss": -6.183600425720215, "global_step": 84048, "epoch": 2001} {"train_loss": -6.160619735717773, "global_step": 84049, "epoch": 2001} {"train_loss": -6.189492702484131, "global_step": 84050, "epoch": 2001} {"train_loss": -6.133967399597168, "global_step": 84051, "epoch": 2001} {"train_loss": -6.297388553619385, "global_step": 84052, "epoch": 2001} {"train_loss": -6.253927707672119, "global_step": 84053, "epoch": 2001} {"train_loss": -6.3181281089782715, "global_step": 84054, "epoch": 2001} {"train_loss": -6.129038333892822, "global_step": 84055, "epoch": 2001} {"train_loss": -6.236187934875488, "global_step": 84056, "epoch": 2001} {"train_loss": -6.212270259857178, "global_step": 84057, "epoch": 2001} {"train_loss": -6.2401533126831055, "global_step": 84058, "epoch": 2001} {"train_loss": -6.148858070373535, "global_step": 84059, "epoch": 2001} {"train_loss": -6.146306037902832, "global_step": 84060, "epoch": 2001} {"train_loss": -6.201111316680908, "global_step": 84061, "epoch": 2001} {"train_loss": -6.19935417175293, "global_step": 84062, "epoch": 2001} {"train_loss": -6.142210006713867, "global_step": 84063, "epoch": 2001} {"train_loss": -6.123842239379883, "global_step": 84064, "epoch": 2001} {"train_loss": -6.177979469299316, "global_step": 84065, "epoch": 2001} {"train_loss": -6.208683013916016, "global_step": 84066, "epoch": 2001} {"train_loss": -6.187127113342285, "global_step": 84067, "epoch": 2001} {"train_loss": -6.187112808227539, "global_step": 84068, "epoch": 2001} {"train_loss": -6.225370407104492, "global_step": 84069, "epoch": 2001} {"train_loss": -6.152629852294922, "global_step": 84070, "epoch": 2001} {"train_loss": -6.232258319854736, "global_step": 84071, "epoch": 2001} {"train_loss": -6.264200210571289, "global_step": 84072, "epoch": 2001} {"train_loss": -6.199770927429199, "global_step": 84073, "epoch": 2001} {"train_loss": -6.331934928894043, "global_step": 84074, "epoch": 2001} {"train_loss": -6.143352031707764, "global_step": 84075, "epoch": 2001} {"train_loss": -6.110257625579834, "global_step": 84076, "epoch": 2001} {"train_loss": -6.3353376388549805, "global_step": 84077, "epoch": 2001} {"train_loss": -6.096168518066406, "global_step": 84078, "epoch": 2001} {"train_loss": -6.0702009201049805, "global_step": 84079, "epoch": 2001} {"train_loss": -6.179924964904785, "global_step": 84080, "epoch": 2001} {"train_loss": -6.198267936706543, "global_step": 84081, "epoch": 2001} {"train_loss": -6.232117652893066, "global_step": 84082, "epoch": 2001} {"train_loss": -6.201107785815284, "global_step": 84083, "epoch": 2001, "val_loss": 75171.7578125} {"train_loss": -6.18842077255249, "global_step": 84084, "epoch": 2002} {"train_loss": -6.192975044250488, "global_step": 84085, "epoch": 2002} {"train_loss": -6.27644157409668, "global_step": 84086, "epoch": 2002} {"train_loss": -6.072448253631592, "global_step": 84087, "epoch": 2002} {"train_loss": -6.216065406799316, "global_step": 84088, "epoch": 2002} {"train_loss": -6.192715644836426, "global_step": 84089, "epoch": 2002} {"train_loss": -6.131850242614746, "global_step": 84090, "epoch": 2002} {"train_loss": -6.236788749694824, "global_step": 84091, "epoch": 2002} {"train_loss": -6.196658134460449, "global_step": 84092, "epoch": 2002} {"train_loss": -6.085407257080078, "global_step": 84093, "epoch": 2002} {"train_loss": -6.150312900543213, "global_step": 84094, "epoch": 2002} {"train_loss": -6.136147975921631, "global_step": 84095, "epoch": 2002} {"train_loss": -6.223177909851074, "global_step": 84096, "epoch": 2002} {"train_loss": -6.224762916564941, "global_step": 84097, "epoch": 2002} {"train_loss": -6.1563801765441895, "global_step": 84098, "epoch": 2002} {"train_loss": -6.001311302185059, "global_step": 84099, "epoch": 2002} {"train_loss": -6.180691719055176, "global_step": 84100, "epoch": 2002} {"train_loss": -6.177799701690674, "global_step": 84101, "epoch": 2002} {"train_loss": -6.245645523071289, "global_step": 84102, "epoch": 2002} {"train_loss": -6.141355991363525, "global_step": 84103, "epoch": 2002} {"train_loss": -6.046300411224365, "global_step": 84104, "epoch": 2002} {"train_loss": -6.1967668533325195, "global_step": 84105, "epoch": 2002} {"train_loss": -6.179627895355225, "global_step": 84106, "epoch": 2002} {"train_loss": -6.245229244232178, "global_step": 84107, "epoch": 2002} {"train_loss": -6.188812255859375, "global_step": 84108, "epoch": 2002} {"train_loss": -6.16952657699585, "global_step": 84109, "epoch": 2002} {"train_loss": -6.185795783996582, "global_step": 84110, "epoch": 2002} {"train_loss": -6.164097309112549, "global_step": 84111, "epoch": 2002} {"train_loss": -6.206248760223389, "global_step": 84112, "epoch": 2002} {"train_loss": -6.170639991760254, "global_step": 84113, "epoch": 2002} {"train_loss": -6.144968032836914, "global_step": 84114, "epoch": 2002} {"train_loss": -6.120176315307617, "global_step": 84115, "epoch": 2002} {"train_loss": -6.109246730804443, "global_step": 84116, "epoch": 2002} {"train_loss": -6.128603935241699, "global_step": 84117, "epoch": 2002} {"train_loss": -6.187779426574707, "global_step": 84118, "epoch": 2002} {"train_loss": -6.086984634399414, "global_step": 84119, "epoch": 2002} {"train_loss": -6.1074347496032715, "global_step": 84120, "epoch": 2002} {"train_loss": -6.184523105621338, "global_step": 84121, "epoch": 2002} {"train_loss": -6.194386005401611, "global_step": 84122, "epoch": 2002} {"train_loss": -6.223877906799316, "global_step": 84123, "epoch": 2002} {"train_loss": -6.065866470336914, "global_step": 84124, "epoch": 2002} {"train_loss": -6.16468528338841, "global_step": 84125, "epoch": 2002, "val_loss": 74967.2578125} {"train_loss": -6.241018295288086, "global_step": 84126, "epoch": 2003} {"train_loss": -6.185434341430664, "global_step": 84127, "epoch": 2003} {"train_loss": -6.326467514038086, "global_step": 84128, "epoch": 2003} {"train_loss": -6.284603118896484, "global_step": 84129, "epoch": 2003} {"train_loss": -6.298615455627441, "global_step": 84130, "epoch": 2003} {"train_loss": -6.205897808074951, "global_step": 84131, "epoch": 2003} {"train_loss": -6.1589484214782715, "global_step": 84132, "epoch": 2003} {"train_loss": -6.138637065887451, "global_step": 84133, "epoch": 2003} {"train_loss": -6.099935054779053, "global_step": 84134, "epoch": 2003} {"train_loss": -6.161543846130371, "global_step": 84135, "epoch": 2003} {"train_loss": -6.110074996948242, "global_step": 84136, "epoch": 2003} {"train_loss": -6.208325386047363, "global_step": 84137, "epoch": 2003} {"train_loss": -6.097247123718262, "global_step": 84138, "epoch": 2003} {"train_loss": -6.174311637878418, "global_step": 84139, "epoch": 2003} {"train_loss": -6.011322975158691, "global_step": 84140, "epoch": 2003} {"train_loss": -6.2599639892578125, "global_step": 84141, "epoch": 2003} {"train_loss": -6.124423027038574, "global_step": 84142, "epoch": 2003} {"train_loss": -6.1696577072143555, "global_step": 84143, "epoch": 2003} {"train_loss": -6.17386531829834, "global_step": 84144, "epoch": 2003} {"train_loss": -6.192148685455322, "global_step": 84145, "epoch": 2003} {"train_loss": -6.179084300994873, "global_step": 84146, "epoch": 2003} {"train_loss": -6.158962249755859, "global_step": 84147, "epoch": 2003} {"train_loss": -6.04893684387207, "global_step": 84148, "epoch": 2003} {"train_loss": -6.237096309661865, "global_step": 84149, "epoch": 2003} {"train_loss": -6.281095027923584, "global_step": 84150, "epoch": 2003} {"train_loss": -6.094429969787598, "global_step": 84151, "epoch": 2003} {"train_loss": -6.278432846069336, "global_step": 84152, "epoch": 2003} {"train_loss": -6.1108503341674805, "global_step": 84153, "epoch": 2003} {"train_loss": -6.129665374755859, "global_step": 84154, "epoch": 2003} {"train_loss": -6.093504905700684, "global_step": 84155, "epoch": 2003} {"train_loss": -6.199362277984619, "global_step": 84156, "epoch": 2003} {"train_loss": -6.161299705505371, "global_step": 84157, "epoch": 2003} {"train_loss": -6.1787919998168945, "global_step": 84158, "epoch": 2003} {"train_loss": -6.118204116821289, "global_step": 84159, "epoch": 2003} {"train_loss": -6.074310302734375, "global_step": 84160, "epoch": 2003} {"train_loss": -6.196717262268066, "global_step": 84161, "epoch": 2003} {"train_loss": -6.231060981750488, "global_step": 84162, "epoch": 2003} {"train_loss": -6.127047061920166, "global_step": 84163, "epoch": 2003} {"train_loss": -6.216297149658203, "global_step": 84164, "epoch": 2003} {"train_loss": -6.219069480895996, "global_step": 84165, "epoch": 2003} {"train_loss": -6.208813667297363, "global_step": 84166, "epoch": 2003} {"train_loss": -6.175160816737583, "global_step": 84167, "epoch": 2003, "val_loss": 75212.3515625} {"train_loss": -6.28482723236084, "global_step": 84168, "epoch": 2004} {"train_loss": -6.291688442230225, "global_step": 84169, "epoch": 2004} {"train_loss": -6.3085737228393555, "global_step": 84170, "epoch": 2004} {"train_loss": -6.251547813415527, "global_step": 84171, "epoch": 2004} {"train_loss": -6.176459312438965, "global_step": 84172, "epoch": 2004} {"train_loss": -6.21928071975708, "global_step": 84173, "epoch": 2004} {"train_loss": -6.098174095153809, "global_step": 84174, "epoch": 2004} {"train_loss": -6.054989337921143, "global_step": 84175, "epoch": 2004} {"train_loss": -6.138397693634033, "global_step": 84176, "epoch": 2004} {"train_loss": -6.123113632202148, "global_step": 84177, "epoch": 2004} {"train_loss": -6.16472053527832, "global_step": 84178, "epoch": 2004} {"train_loss": -6.235239028930664, "global_step": 84179, "epoch": 2004} {"train_loss": -6.139611721038818, "global_step": 84180, "epoch": 2004} {"train_loss": -6.377663612365723, "global_step": 84181, "epoch": 2004} {"train_loss": -6.294672012329102, "global_step": 84182, "epoch": 2004} {"train_loss": -6.234663009643555, "global_step": 84183, "epoch": 2004} {"train_loss": -6.099325656890869, "global_step": 84184, "epoch": 2004} {"train_loss": -6.196034908294678, "global_step": 84185, "epoch": 2004} {"train_loss": -6.031735897064209, "global_step": 84186, "epoch": 2004} {"train_loss": -6.104221343994141, "global_step": 84187, "epoch": 2004} {"train_loss": -6.30784797668457, "global_step": 84188, "epoch": 2004} {"train_loss": -6.125019073486328, "global_step": 84189, "epoch": 2004} {"train_loss": -6.105518817901611, "global_step": 84190, "epoch": 2004} {"train_loss": -6.161123275756836, "global_step": 84191, "epoch": 2004} {"train_loss": -6.132819175720215, "global_step": 84192, "epoch": 2004} {"train_loss": -6.144776821136475, "global_step": 84193, "epoch": 2004} {"train_loss": -6.279491424560547, "global_step": 84194, "epoch": 2004} {"train_loss": -6.187380313873291, "global_step": 84195, "epoch": 2004} {"train_loss": -6.174117565155029, "global_step": 84196, "epoch": 2004} {"train_loss": -6.171054363250732, "global_step": 84197, "epoch": 2004} {"train_loss": -6.245128631591797, "global_step": 84198, "epoch": 2004} {"train_loss": -6.181452751159668, "global_step": 84199, "epoch": 2004} {"train_loss": -6.098459243774414, "global_step": 84200, "epoch": 2004} {"train_loss": -6.17054557800293, "global_step": 84201, "epoch": 2004} {"train_loss": -6.167033672332764, "global_step": 84202, "epoch": 2004} {"train_loss": -6.181062698364258, "global_step": 84203, "epoch": 2004} {"train_loss": -6.314724922180176, "global_step": 84204, "epoch": 2004} {"train_loss": -6.259772300720215, "global_step": 84205, "epoch": 2004} {"train_loss": -6.084802627563477, "global_step": 84206, "epoch": 2004} {"train_loss": -6.143938064575195, "global_step": 84207, "epoch": 2004} {"train_loss": -6.26405143737793, "global_step": 84208, "epoch": 2004} {"train_loss": -6.1877017588842484, "global_step": 84209, "epoch": 2004, "val_loss": 75042.0546875} {"train_loss": -6.094918727874756, "global_step": 84210, "epoch": 2005} {"train_loss": -6.23917293548584, "global_step": 84211, "epoch": 2005} {"train_loss": -6.232497215270996, "global_step": 84212, "epoch": 2005} {"train_loss": -6.122230529785156, "global_step": 84213, "epoch": 2005} {"train_loss": -6.053092956542969, "global_step": 84214, "epoch": 2005} {"train_loss": -6.104524612426758, "global_step": 84215, "epoch": 2005} {"train_loss": -6.173493385314941, "global_step": 84216, "epoch": 2005} {"train_loss": -6.338051795959473, "global_step": 84217, "epoch": 2005} {"train_loss": -6.192005157470703, "global_step": 84218, "epoch": 2005} {"train_loss": -6.252197265625, "global_step": 84219, "epoch": 2005} {"train_loss": -6.190771102905273, "global_step": 84220, "epoch": 2005} {"train_loss": -6.2264251708984375, "global_step": 84221, "epoch": 2005} {"train_loss": -6.277299880981445, "global_step": 84222, "epoch": 2005} {"train_loss": -6.181883335113525, "global_step": 84223, "epoch": 2005} {"train_loss": -6.190848350524902, "global_step": 84224, "epoch": 2005} {"train_loss": -6.2484354972839355, "global_step": 84225, "epoch": 2005} {"train_loss": -6.237922668457031, "global_step": 84226, "epoch": 2005} {"train_loss": -6.107357025146484, "global_step": 84227, "epoch": 2005} {"train_loss": -6.226022243499756, "global_step": 84228, "epoch": 2005} {"train_loss": -6.106790542602539, "global_step": 84229, "epoch": 2005} {"train_loss": -6.183572292327881, "global_step": 84230, "epoch": 2005} {"train_loss": -6.254859924316406, "global_step": 84231, "epoch": 2005} {"train_loss": -6.130111217498779, "global_step": 84232, "epoch": 2005} {"train_loss": -6.1974287033081055, "global_step": 84233, "epoch": 2005} {"train_loss": -6.09267520904541, "global_step": 84234, "epoch": 2005} {"train_loss": -6.02320671081543, "global_step": 84235, "epoch": 2005} {"train_loss": -6.155294418334961, "global_step": 84236, "epoch": 2005} {"train_loss": -6.066330909729004, "global_step": 84237, "epoch": 2005} {"train_loss": -6.1703200340271, "global_step": 84238, "epoch": 2005} {"train_loss": -6.074261665344238, "global_step": 84239, "epoch": 2005} {"train_loss": -6.054654121398926, "global_step": 84240, "epoch": 2005} {"train_loss": -6.188180446624756, "global_step": 84241, "epoch": 2005} {"train_loss": -6.143978118896484, "global_step": 84242, "epoch": 2005} {"train_loss": -6.106297492980957, "global_step": 84243, "epoch": 2005} {"train_loss": -6.081618785858154, "global_step": 84244, "epoch": 2005} {"train_loss": -6.138207912445068, "global_step": 84245, "epoch": 2005} {"train_loss": -6.162757873535156, "global_step": 84246, "epoch": 2005} {"train_loss": -6.126157760620117, "global_step": 84247, "epoch": 2005} {"train_loss": -6.018842697143555, "global_step": 84248, "epoch": 2005} {"train_loss": -6.200058937072754, "global_step": 84249, "epoch": 2005} {"train_loss": -6.204281806945801, "global_step": 84250, "epoch": 2005} {"train_loss": -6.160098552703857, "global_step": 84251, "epoch": 2005, "val_loss": 75305.171875} {"train_loss": -6.232309341430664, "global_step": 84252, "epoch": 2006} {"train_loss": -6.155914306640625, "global_step": 84253, "epoch": 2006} {"train_loss": -6.204510688781738, "global_step": 84254, "epoch": 2006} {"train_loss": -6.099729537963867, "global_step": 84255, "epoch": 2006} {"train_loss": -6.211612701416016, "global_step": 84256, "epoch": 2006} {"train_loss": -6.318476676940918, "global_step": 84257, "epoch": 2006} {"train_loss": -6.192659854888916, "global_step": 84258, "epoch": 2006} {"train_loss": -6.144528865814209, "global_step": 84259, "epoch": 2006} {"train_loss": -6.240139961242676, "global_step": 84260, "epoch": 2006} {"train_loss": -6.147819519042969, "global_step": 84261, "epoch": 2006} {"train_loss": -6.318517684936523, "global_step": 84262, "epoch": 2006} {"train_loss": -6.033327579498291, "global_step": 84263, "epoch": 2006} {"train_loss": -6.128101825714111, "global_step": 84264, "epoch": 2006} {"train_loss": -6.068551540374756, "global_step": 84265, "epoch": 2006} {"train_loss": -6.194160461425781, "global_step": 84266, "epoch": 2006} {"train_loss": -6.2309160232543945, "global_step": 84267, "epoch": 2006} {"train_loss": -6.117328643798828, "global_step": 84268, "epoch": 2006} {"train_loss": -6.201621055603027, "global_step": 84269, "epoch": 2006} {"train_loss": -6.127134323120117, "global_step": 84270, "epoch": 2006} {"train_loss": -6.120414733886719, "global_step": 84271, "epoch": 2006} {"train_loss": -6.07280158996582, "global_step": 84272, "epoch": 2006} {"train_loss": -6.316303253173828, "global_step": 84273, "epoch": 2006} {"train_loss": -6.197131156921387, "global_step": 84274, "epoch": 2006} {"train_loss": -6.035553932189941, "global_step": 84275, "epoch": 2006} {"train_loss": -6.124883651733398, "global_step": 84276, "epoch": 2006} {"train_loss": -6.1165947914123535, "global_step": 84277, "epoch": 2006} {"train_loss": -6.066830158233643, "global_step": 84278, "epoch": 2006} {"train_loss": -6.262213706970215, "global_step": 84279, "epoch": 2006} {"train_loss": -6.053228378295898, "global_step": 84280, "epoch": 2006} {"train_loss": -6.089012622833252, "global_step": 84281, "epoch": 2006} {"train_loss": -6.214752674102783, "global_step": 84282, "epoch": 2006} {"train_loss": -6.054170608520508, "global_step": 84283, "epoch": 2006} {"train_loss": -6.207386016845703, "global_step": 84284, "epoch": 2006} {"train_loss": -6.076992034912109, "global_step": 84285, "epoch": 2006} {"train_loss": -6.172189712524414, "global_step": 84286, "epoch": 2006} {"train_loss": -6.0059404373168945, "global_step": 84287, "epoch": 2006} {"train_loss": -6.131592750549316, "global_step": 84288, "epoch": 2006} {"train_loss": -6.126661777496338, "global_step": 84289, "epoch": 2006} {"train_loss": -6.180226802825928, "global_step": 84290, "epoch": 2006} {"train_loss": -6.119817733764648, "global_step": 84291, "epoch": 2006} {"train_loss": -6.204748153686523, "global_step": 84292, "epoch": 2006} {"train_loss": -6.15197703951881, "global_step": 84293, "epoch": 2006, "val_loss": 75132.921875} {"train_loss": -6.219074249267578, "global_step": 84294, "epoch": 2007} {"train_loss": -6.130049705505371, "global_step": 84295, "epoch": 2007} {"train_loss": -6.123693466186523, "global_step": 84296, "epoch": 2007} {"train_loss": -6.18397331237793, "global_step": 84297, "epoch": 2007} {"train_loss": -6.16779899597168, "global_step": 84298, "epoch": 2007} {"train_loss": -6.164496421813965, "global_step": 84299, "epoch": 2007} {"train_loss": -6.206175804138184, "global_step": 84300, "epoch": 2007} {"train_loss": -6.262438774108887, "global_step": 84301, "epoch": 2007} {"train_loss": -6.233918190002441, "global_step": 84302, "epoch": 2007} {"train_loss": -6.24855899810791, "global_step": 84303, "epoch": 2007} {"train_loss": -6.298055648803711, "global_step": 84304, "epoch": 2007} {"train_loss": -6.112109184265137, "global_step": 84305, "epoch": 2007} {"train_loss": -6.166049957275391, "global_step": 84306, "epoch": 2007} {"train_loss": -6.066188812255859, "global_step": 84307, "epoch": 2007} {"train_loss": -6.178975582122803, "global_step": 84308, "epoch": 2007} {"train_loss": -6.24120569229126, "global_step": 84309, "epoch": 2007} {"train_loss": -6.246799468994141, "global_step": 84310, "epoch": 2007} {"train_loss": -6.250332355499268, "global_step": 84311, "epoch": 2007} {"train_loss": -6.296412467956543, "global_step": 84312, "epoch": 2007} {"train_loss": -6.175986289978027, "global_step": 84313, "epoch": 2007} {"train_loss": -6.275381088256836, "global_step": 84314, "epoch": 2007} {"train_loss": -6.1930131912231445, "global_step": 84315, "epoch": 2007} {"train_loss": -6.172757625579834, "global_step": 84316, "epoch": 2007} {"train_loss": -6.123303413391113, "global_step": 84317, "epoch": 2007} {"train_loss": -6.186574935913086, "global_step": 84318, "epoch": 2007} {"train_loss": -6.070558071136475, "global_step": 84319, "epoch": 2007} {"train_loss": -6.170718669891357, "global_step": 84320, "epoch": 2007} {"train_loss": -6.180292129516602, "global_step": 84321, "epoch": 2007} {"train_loss": -6.135383605957031, "global_step": 84322, "epoch": 2007} {"train_loss": -6.124815940856934, "global_step": 84323, "epoch": 2007} {"train_loss": -6.348273277282715, "global_step": 84324, "epoch": 2007} {"train_loss": -6.188699722290039, "global_step": 84325, "epoch": 2007} {"train_loss": -6.089531898498535, "global_step": 84326, "epoch": 2007} {"train_loss": -6.251151084899902, "global_step": 84327, "epoch": 2007} {"train_loss": -6.078497886657715, "global_step": 84328, "epoch": 2007} {"train_loss": -6.231841564178467, "global_step": 84329, "epoch": 2007} {"train_loss": -6.285495758056641, "global_step": 84330, "epoch": 2007} {"train_loss": -6.108200550079346, "global_step": 84331, "epoch": 2007} {"train_loss": -6.243345260620117, "global_step": 84332, "epoch": 2007} {"train_loss": -6.181677341461182, "global_step": 84333, "epoch": 2007} {"train_loss": -6.079987525939941, "global_step": 84334, "epoch": 2007} {"train_loss": -6.187601475488572, "global_step": 84335, "epoch": 2007, "val_loss": 74956.375} {"train_loss": -6.243581295013428, "global_step": 84336, "epoch": 2008} {"train_loss": -6.256913185119629, "global_step": 84337, "epoch": 2008} {"train_loss": -6.240936279296875, "global_step": 84338, "epoch": 2008} {"train_loss": -6.21511173248291, "global_step": 84339, "epoch": 2008} {"train_loss": -6.213876247406006, "global_step": 84340, "epoch": 2008} {"train_loss": -6.155605316162109, "global_step": 84341, "epoch": 2008} {"train_loss": -6.279886245727539, "global_step": 84342, "epoch": 2008} {"train_loss": -6.063655376434326, "global_step": 84343, "epoch": 2008} {"train_loss": -6.011568069458008, "global_step": 84344, "epoch": 2008} {"train_loss": -6.161217212677002, "global_step": 84345, "epoch": 2008} {"train_loss": -6.176891326904297, "global_step": 84346, "epoch": 2008} {"train_loss": -6.039944648742676, "global_step": 84347, "epoch": 2008} {"train_loss": -6.170997619628906, "global_step": 84348, "epoch": 2008} {"train_loss": -6.271716117858887, "global_step": 84349, "epoch": 2008} {"train_loss": -6.263611793518066, "global_step": 84350, "epoch": 2008} {"train_loss": -6.07627010345459, "global_step": 84351, "epoch": 2008} {"train_loss": -6.248873233795166, "global_step": 84352, "epoch": 2008} {"train_loss": -6.136631011962891, "global_step": 84353, "epoch": 2008} {"train_loss": -6.0803303718566895, "global_step": 84354, "epoch": 2008} {"train_loss": -6.145752429962158, "global_step": 84355, "epoch": 2008} {"train_loss": -6.211020469665527, "global_step": 84356, "epoch": 2008} {"train_loss": -6.199001312255859, "global_step": 84357, "epoch": 2008} {"train_loss": -6.154200553894043, "global_step": 84358, "epoch": 2008} {"train_loss": -6.223298072814941, "global_step": 84359, "epoch": 2008} {"train_loss": -6.231523513793945, "global_step": 84360, "epoch": 2008} {"train_loss": -6.195367813110352, "global_step": 84361, "epoch": 2008} {"train_loss": -6.283615589141846, "global_step": 84362, "epoch": 2008} {"train_loss": -6.167196273803711, "global_step": 84363, "epoch": 2008} {"train_loss": -6.074749946594238, "global_step": 84364, "epoch": 2008} {"train_loss": -6.239286422729492, "global_step": 84365, "epoch": 2008} {"train_loss": -6.150629997253418, "global_step": 84366, "epoch": 2008} {"train_loss": -6.212409496307373, "global_step": 84367, "epoch": 2008} {"train_loss": -6.151042461395264, "global_step": 84368, "epoch": 2008} {"train_loss": -6.233928680419922, "global_step": 84369, "epoch": 2008} {"train_loss": -6.110878944396973, "global_step": 84370, "epoch": 2008} {"train_loss": -6.111532688140869, "global_step": 84371, "epoch": 2008} {"train_loss": -6.168704032897949, "global_step": 84372, "epoch": 2008} {"train_loss": -6.3554792404174805, "global_step": 84373, "epoch": 2008} {"train_loss": -6.263818740844727, "global_step": 84374, "epoch": 2008} {"train_loss": -6.204129219055176, "global_step": 84375, "epoch": 2008} {"train_loss": -6.2207536697387695, "global_step": 84376, "epoch": 2008} {"train_loss": -6.184439999716623, "global_step": 84377, "epoch": 2008, "val_loss": 74981.265625} {"train_loss": -6.339564323425293, "global_step": 84378, "epoch": 2009} {"train_loss": -6.098162651062012, "global_step": 84379, "epoch": 2009} {"train_loss": -6.184004306793213, "global_step": 84380, "epoch": 2009} {"train_loss": -6.252272129058838, "global_step": 84381, "epoch": 2009} {"train_loss": -6.178641319274902, "global_step": 84382, "epoch": 2009} {"train_loss": -6.216968059539795, "global_step": 84383, "epoch": 2009} {"train_loss": -6.144367218017578, "global_step": 84384, "epoch": 2009} {"train_loss": -6.255653381347656, "global_step": 84385, "epoch": 2009} {"train_loss": -6.324891090393066, "global_step": 84386, "epoch": 2009} {"train_loss": -6.100615501403809, "global_step": 84387, "epoch": 2009} {"train_loss": -6.300542831420898, "global_step": 84388, "epoch": 2009} {"train_loss": -6.225749492645264, "global_step": 84389, "epoch": 2009} {"train_loss": -6.169699668884277, "global_step": 84390, "epoch": 2009} {"train_loss": -6.233049392700195, "global_step": 84391, "epoch": 2009} {"train_loss": -6.031818389892578, "global_step": 84392, "epoch": 2009} {"train_loss": -6.2295918464660645, "global_step": 84393, "epoch": 2009} {"train_loss": -6.056593894958496, "global_step": 84394, "epoch": 2009} {"train_loss": -6.178762912750244, "global_step": 84395, "epoch": 2009} {"train_loss": -6.191178798675537, "global_step": 84396, "epoch": 2009} {"train_loss": -6.052371978759766, "global_step": 84397, "epoch": 2009} {"train_loss": -6.1675567626953125, "global_step": 84398, "epoch": 2009} {"train_loss": -6.172906398773193, "global_step": 84399, "epoch": 2009} {"train_loss": -6.062971115112305, "global_step": 84400, "epoch": 2009} {"train_loss": -6.220926284790039, "global_step": 84401, "epoch": 2009} {"train_loss": -6.140752792358398, "global_step": 84402, "epoch": 2009} {"train_loss": -6.121258735656738, "global_step": 84403, "epoch": 2009} {"train_loss": -6.145583629608154, "global_step": 84404, "epoch": 2009} {"train_loss": -5.988290786743164, "global_step": 84405, "epoch": 2009} {"train_loss": -6.1004638671875, "global_step": 84406, "epoch": 2009} {"train_loss": -6.168846130371094, "global_step": 84407, "epoch": 2009} {"train_loss": -6.021113872528076, "global_step": 84408, "epoch": 2009} {"train_loss": -6.1171555519104, "global_step": 84409, "epoch": 2009} {"train_loss": -6.134855270385742, "global_step": 84410, "epoch": 2009} {"train_loss": -6.185715198516846, "global_step": 84411, "epoch": 2009} {"train_loss": -6.1597700119018555, "global_step": 84412, "epoch": 2009} {"train_loss": -6.031872749328613, "global_step": 84413, "epoch": 2009} {"train_loss": -6.208624839782715, "global_step": 84414, "epoch": 2009} {"train_loss": -6.1720805168151855, "global_step": 84415, "epoch": 2009} {"train_loss": -6.246915817260742, "global_step": 84416, "epoch": 2009} {"train_loss": -6.168610572814941, "global_step": 84417, "epoch": 2009} {"train_loss": -6.129111289978027, "global_step": 84418, "epoch": 2009} {"train_loss": -6.159768831162226, "global_step": 84419, "epoch": 2009, "val_loss": 75476.4375} {"train_loss": -6.01951789855957, "global_step": 84420, "epoch": 2010} {"train_loss": -6.1037116050720215, "global_step": 84421, "epoch": 2010} {"train_loss": -6.064348220825195, "global_step": 84422, "epoch": 2010} {"train_loss": -6.124292373657227, "global_step": 84423, "epoch": 2010} {"train_loss": -6.027441024780273, "global_step": 84424, "epoch": 2010} {"train_loss": -6.245820999145508, "global_step": 84425, "epoch": 2010} {"train_loss": -6.042253494262695, "global_step": 84426, "epoch": 2010} {"train_loss": -5.954399108886719, "global_step": 84427, "epoch": 2010} {"train_loss": -6.255127906799316, "global_step": 84428, "epoch": 2010} {"train_loss": -5.979853630065918, "global_step": 84429, "epoch": 2010} {"train_loss": -6.1896071434021, "global_step": 84430, "epoch": 2010} {"train_loss": -6.043397903442383, "global_step": 84431, "epoch": 2010} {"train_loss": -6.059444427490234, "global_step": 84432, "epoch": 2010} {"train_loss": -6.116060256958008, "global_step": 84433, "epoch": 2010} {"train_loss": -6.146991729736328, "global_step": 84434, "epoch": 2010} {"train_loss": -6.157303333282471, "global_step": 84435, "epoch": 2010} {"train_loss": -6.179783344268799, "global_step": 84436, "epoch": 2010} {"train_loss": -6.09676456451416, "global_step": 84437, "epoch": 2010} {"train_loss": -6.197908401489258, "global_step": 84438, "epoch": 2010} {"train_loss": -6.05952787399292, "global_step": 84439, "epoch": 2010} {"train_loss": -6.1512017250061035, "global_step": 84440, "epoch": 2010} {"train_loss": -6.187901496887207, "global_step": 84441, "epoch": 2010} {"train_loss": -6.109241485595703, "global_step": 84442, "epoch": 2010} {"train_loss": -6.203839302062988, "global_step": 84443, "epoch": 2010} {"train_loss": -6.098919868469238, "global_step": 84444, "epoch": 2010} {"train_loss": -6.019615173339844, "global_step": 84445, "epoch": 2010} {"train_loss": -6.274222373962402, "global_step": 84446, "epoch": 2010} {"train_loss": -6.119356155395508, "global_step": 84447, "epoch": 2010} {"train_loss": -6.113580703735352, "global_step": 84448, "epoch": 2010} {"train_loss": -6.110255241394043, "global_step": 84449, "epoch": 2010} {"train_loss": -6.17842960357666, "global_step": 84450, "epoch": 2010} {"train_loss": -6.196481704711914, "global_step": 84451, "epoch": 2010} {"train_loss": -6.001343727111816, "global_step": 84452, "epoch": 2010} {"train_loss": -6.227418899536133, "global_step": 84453, "epoch": 2010} {"train_loss": -6.194916725158691, "global_step": 84454, "epoch": 2010} {"train_loss": -6.030073165893555, "global_step": 84455, "epoch": 2010} {"train_loss": -6.204901695251465, "global_step": 84456, "epoch": 2010} {"train_loss": -6.108345985412598, "global_step": 84457, "epoch": 2010} {"train_loss": -6.267274856567383, "global_step": 84458, "epoch": 2010} {"train_loss": -6.1657023429870605, "global_step": 84459, "epoch": 2010} {"train_loss": -6.2070112228393555, "global_step": 84460, "epoch": 2010} {"train_loss": -6.130279643195016, "global_step": 84461, "epoch": 2010, "val_loss": 75003.96875} {"train_loss": -6.05180025100708, "global_step": 84462, "epoch": 2011} {"train_loss": -6.2383880615234375, "global_step": 84463, "epoch": 2011} {"train_loss": -6.16689920425415, "global_step": 84464, "epoch": 2011} {"train_loss": -6.121170997619629, "global_step": 84465, "epoch": 2011} {"train_loss": -6.23529052734375, "global_step": 84466, "epoch": 2011} {"train_loss": -6.178938388824463, "global_step": 84467, "epoch": 2011} {"train_loss": -6.196237564086914, "global_step": 84468, "epoch": 2011} {"train_loss": -6.174315452575684, "global_step": 84469, "epoch": 2011} {"train_loss": -6.1800856590271, "global_step": 84470, "epoch": 2011} {"train_loss": -6.145817756652832, "global_step": 84471, "epoch": 2011} {"train_loss": -6.141422748565674, "global_step": 84472, "epoch": 2011} {"train_loss": -6.2028913497924805, "global_step": 84473, "epoch": 2011} {"train_loss": -6.21623420715332, "global_step": 84474, "epoch": 2011} {"train_loss": -6.13006591796875, "global_step": 84475, "epoch": 2011} {"train_loss": -6.273670673370361, "global_step": 84476, "epoch": 2011} {"train_loss": -6.181234359741211, "global_step": 84477, "epoch": 2011} {"train_loss": -6.267921447753906, "global_step": 84478, "epoch": 2011} {"train_loss": -6.137260437011719, "global_step": 84479, "epoch": 2011} {"train_loss": -6.083648204803467, "global_step": 84480, "epoch": 2011} {"train_loss": -6.106847763061523, "global_step": 84481, "epoch": 2011} {"train_loss": -6.2531023025512695, "global_step": 84482, "epoch": 2011} {"train_loss": -6.056946754455566, "global_step": 84483, "epoch": 2011} {"train_loss": -6.207252025604248, "global_step": 84484, "epoch": 2011} {"train_loss": -6.172870635986328, "global_step": 84485, "epoch": 2011} {"train_loss": -6.071813583374023, "global_step": 84486, "epoch": 2011} {"train_loss": -6.189330577850342, "global_step": 84487, "epoch": 2011} {"train_loss": -6.020665645599365, "global_step": 84488, "epoch": 2011} {"train_loss": -6.215586185455322, "global_step": 84489, "epoch": 2011} {"train_loss": -6.143204212188721, "global_step": 84490, "epoch": 2011} {"train_loss": -6.257854461669922, "global_step": 84491, "epoch": 2011} {"train_loss": -6.132233142852783, "global_step": 84492, "epoch": 2011} {"train_loss": -6.124970436096191, "global_step": 84493, "epoch": 2011} {"train_loss": -6.170411586761475, "global_step": 84494, "epoch": 2011} {"train_loss": -6.132885932922363, "global_step": 84495, "epoch": 2011} {"train_loss": -6.015410900115967, "global_step": 84496, "epoch": 2011} {"train_loss": -6.132945537567139, "global_step": 84497, "epoch": 2011} {"train_loss": -6.219513416290283, "global_step": 84498, "epoch": 2011} {"train_loss": -6.248280048370361, "global_step": 84499, "epoch": 2011} {"train_loss": -6.257861137390137, "global_step": 84500, "epoch": 2011} {"train_loss": -6.180936813354492, "global_step": 84501, "epoch": 2011} {"train_loss": -6.247724533081055, "global_step": 84502, "epoch": 2011} {"train_loss": -6.169485569000244, "global_step": 84503, "epoch": 2011, "val_loss": 75143.4453125} {"train_loss": -6.1845245361328125, "global_step": 84504, "epoch": 2012} {"train_loss": -6.174867153167725, "global_step": 84505, "epoch": 2012} {"train_loss": -6.302597999572754, "global_step": 84506, "epoch": 2012} {"train_loss": -6.296568870544434, "global_step": 84507, "epoch": 2012} {"train_loss": -6.113121509552002, "global_step": 84508, "epoch": 2012} {"train_loss": -6.100733757019043, "global_step": 84509, "epoch": 2012} {"train_loss": -6.20084285736084, "global_step": 84510, "epoch": 2012} {"train_loss": -6.2565412521362305, "global_step": 84511, "epoch": 2012} {"train_loss": -6.165220260620117, "global_step": 84512, "epoch": 2012} {"train_loss": -6.2181525230407715, "global_step": 84513, "epoch": 2012} {"train_loss": -6.155450820922852, "global_step": 84514, "epoch": 2012} {"train_loss": -6.161150932312012, "global_step": 84515, "epoch": 2012} {"train_loss": -6.205572128295898, "global_step": 84516, "epoch": 2012} {"train_loss": -6.139087677001953, "global_step": 84517, "epoch": 2012} {"train_loss": -6.213033199310303, "global_step": 84518, "epoch": 2012} {"train_loss": -6.226569175720215, "global_step": 84519, "epoch": 2012} {"train_loss": -6.135004043579102, "global_step": 84520, "epoch": 2012} {"train_loss": -6.255381107330322, "global_step": 84521, "epoch": 2012} {"train_loss": -6.238870620727539, "global_step": 84522, "epoch": 2012} {"train_loss": -6.201800346374512, "global_step": 84523, "epoch": 2012} {"train_loss": -6.143554210662842, "global_step": 84524, "epoch": 2012} {"train_loss": -6.022256851196289, "global_step": 84525, "epoch": 2012} {"train_loss": -6.115297317504883, "global_step": 84526, "epoch": 2012} {"train_loss": -6.224075794219971, "global_step": 84527, "epoch": 2012} {"train_loss": -6.08383846282959, "global_step": 84528, "epoch": 2012} {"train_loss": -6.098670959472656, "global_step": 84529, "epoch": 2012} {"train_loss": -6.197231769561768, "global_step": 84530, "epoch": 2012} {"train_loss": -5.9932684898376465, "global_step": 84531, "epoch": 2012} {"train_loss": -6.109552383422852, "global_step": 84532, "epoch": 2012} {"train_loss": -6.1653056144714355, "global_step": 84533, "epoch": 2012} {"train_loss": -6.129826545715332, "global_step": 84534, "epoch": 2012} {"train_loss": -6.144692897796631, "global_step": 84535, "epoch": 2012} {"train_loss": -6.12394905090332, "global_step": 84536, "epoch": 2012} {"train_loss": -6.10987663269043, "global_step": 84537, "epoch": 2012} {"train_loss": -6.0459136962890625, "global_step": 84538, "epoch": 2012} {"train_loss": -6.092825889587402, "global_step": 84539, "epoch": 2012} {"train_loss": -6.232001304626465, "global_step": 84540, "epoch": 2012} {"train_loss": -6.180927753448486, "global_step": 84541, "epoch": 2012} {"train_loss": -6.225713729858398, "global_step": 84542, "epoch": 2012} {"train_loss": -6.231757164001465, "global_step": 84543, "epoch": 2012} {"train_loss": -6.150835037231445, "global_step": 84544, "epoch": 2012} {"train_loss": -6.167198158445812, "global_step": 84545, "epoch": 2012, "val_loss": 74788.3359375} {"train_loss": -6.262790679931641, "global_step": 84546, "epoch": 2013} {"train_loss": -6.162497520446777, "global_step": 84547, "epoch": 2013} {"train_loss": -6.237814903259277, "global_step": 84548, "epoch": 2013} {"train_loss": -6.1090497970581055, "global_step": 84549, "epoch": 2013} {"train_loss": -6.217766761779785, "global_step": 84550, "epoch": 2013} {"train_loss": -6.112951755523682, "global_step": 84551, "epoch": 2013} {"train_loss": -5.92813777923584, "global_step": 84552, "epoch": 2013} {"train_loss": -6.276902198791504, "global_step": 84553, "epoch": 2013} {"train_loss": -6.132053852081299, "global_step": 84554, "epoch": 2013} {"train_loss": -6.121192932128906, "global_step": 84555, "epoch": 2013} {"train_loss": -6.208983898162842, "global_step": 84556, "epoch": 2013} {"train_loss": -6.188185691833496, "global_step": 84557, "epoch": 2013} {"train_loss": -6.2530927658081055, "global_step": 84558, "epoch": 2013} {"train_loss": -6.237931251525879, "global_step": 84559, "epoch": 2013} {"train_loss": -6.031566619873047, "global_step": 84560, "epoch": 2013} {"train_loss": -6.17971134185791, "global_step": 84561, "epoch": 2013} {"train_loss": -6.168347358703613, "global_step": 84562, "epoch": 2013} {"train_loss": -6.1040873527526855, "global_step": 84563, "epoch": 2013} {"train_loss": -6.219461441040039, "global_step": 84564, "epoch": 2013} {"train_loss": -6.071120738983154, "global_step": 84565, "epoch": 2013} {"train_loss": -6.209590435028076, "global_step": 84566, "epoch": 2013} {"train_loss": -6.300244331359863, "global_step": 84567, "epoch": 2013} {"train_loss": -6.05849027633667, "global_step": 84568, "epoch": 2013} {"train_loss": -6.167161464691162, "global_step": 84569, "epoch": 2013} {"train_loss": -6.22828483581543, "global_step": 84570, "epoch": 2013} {"train_loss": -6.157478332519531, "global_step": 84571, "epoch": 2013} {"train_loss": -6.2130231857299805, "global_step": 84572, "epoch": 2013} {"train_loss": -6.011362075805664, "global_step": 84573, "epoch": 2013} {"train_loss": -6.134255409240723, "global_step": 84574, "epoch": 2013} {"train_loss": -6.107616424560547, "global_step": 84575, "epoch": 2013} {"train_loss": -6.119159698486328, "global_step": 84576, "epoch": 2013} {"train_loss": -6.279299736022949, "global_step": 84577, "epoch": 2013} {"train_loss": -6.153879165649414, "global_step": 84578, "epoch": 2013} {"train_loss": -6.139585494995117, "global_step": 84579, "epoch": 2013} {"train_loss": -6.156508445739746, "global_step": 84580, "epoch": 2013} {"train_loss": -6.166411399841309, "global_step": 84581, "epoch": 2013} {"train_loss": -6.268719673156738, "global_step": 84582, "epoch": 2013} {"train_loss": -6.212897777557373, "global_step": 84583, "epoch": 2013} {"train_loss": -6.210297107696533, "global_step": 84584, "epoch": 2013} {"train_loss": -6.2050042152404785, "global_step": 84585, "epoch": 2013} {"train_loss": -6.220067024230957, "global_step": 84586, "epoch": 2013} {"train_loss": -6.16666655313401, "global_step": 84587, "epoch": 2013, "val_loss": 74974.96875} {"train_loss": -6.2381792068481445, "global_step": 84588, "epoch": 2014} {"train_loss": -6.302855491638184, "global_step": 84589, "epoch": 2014} {"train_loss": -6.280947685241699, "global_step": 84590, "epoch": 2014} {"train_loss": -6.117175102233887, "global_step": 84591, "epoch": 2014} {"train_loss": -6.261943817138672, "global_step": 84592, "epoch": 2014} {"train_loss": -6.323238372802734, "global_step": 84593, "epoch": 2014} {"train_loss": -6.159886360168457, "global_step": 84594, "epoch": 2014} {"train_loss": -6.193125247955322, "global_step": 84595, "epoch": 2014} {"train_loss": -6.181545257568359, "global_step": 84596, "epoch": 2014} {"train_loss": -6.193817138671875, "global_step": 84597, "epoch": 2014} {"train_loss": -6.155856132507324, "global_step": 84598, "epoch": 2014} {"train_loss": -6.129971504211426, "global_step": 84599, "epoch": 2014} {"train_loss": -6.153229713439941, "global_step": 84600, "epoch": 2014} {"train_loss": -6.250755310058594, "global_step": 84601, "epoch": 2014} {"train_loss": -6.225724220275879, "global_step": 84602, "epoch": 2014} {"train_loss": -6.236299514770508, "global_step": 84603, "epoch": 2014} {"train_loss": -6.2255096435546875, "global_step": 84604, "epoch": 2014} {"train_loss": -6.112923622131348, "global_step": 84605, "epoch": 2014} {"train_loss": -6.256302833557129, "global_step": 84606, "epoch": 2014} {"train_loss": -6.144658088684082, "global_step": 84607, "epoch": 2014} {"train_loss": -6.171849727630615, "global_step": 84608, "epoch": 2014} {"train_loss": -6.320326805114746, "global_step": 84609, "epoch": 2014} {"train_loss": -6.145368576049805, "global_step": 84610, "epoch": 2014} {"train_loss": -6.294692039489746, "global_step": 84611, "epoch": 2014} {"train_loss": -6.134793281555176, "global_step": 84612, "epoch": 2014} {"train_loss": -6.119232177734375, "global_step": 84613, "epoch": 2014} {"train_loss": -6.242400169372559, "global_step": 84614, "epoch": 2014} {"train_loss": -6.153289794921875, "global_step": 84615, "epoch": 2014} {"train_loss": -6.116146564483643, "global_step": 84616, "epoch": 2014} {"train_loss": -6.201498985290527, "global_step": 84617, "epoch": 2014} {"train_loss": -6.151946067810059, "global_step": 84618, "epoch": 2014} {"train_loss": -6.272368907928467, "global_step": 84619, "epoch": 2014} {"train_loss": -6.179989814758301, "global_step": 84620, "epoch": 2014} {"train_loss": -6.171698570251465, "global_step": 84621, "epoch": 2014} {"train_loss": -6.146777153015137, "global_step": 84622, "epoch": 2014} {"train_loss": -6.023862838745117, "global_step": 84623, "epoch": 2014} {"train_loss": -6.082151889801025, "global_step": 84624, "epoch": 2014} {"train_loss": -6.139887809753418, "global_step": 84625, "epoch": 2014} {"train_loss": -6.226818084716797, "global_step": 84626, "epoch": 2014} {"train_loss": -6.18135404586792, "global_step": 84627, "epoch": 2014} {"train_loss": -6.085005760192871, "global_step": 84628, "epoch": 2014} {"train_loss": -6.185422148023333, "global_step": 84629, "epoch": 2014, "val_loss": 75113.28125} {"train_loss": -6.091315746307373, "global_step": 84630, "epoch": 2015} {"train_loss": -6.188638687133789, "global_step": 84631, "epoch": 2015} {"train_loss": -6.1982316970825195, "global_step": 84632, "epoch": 2015} {"train_loss": -6.043942928314209, "global_step": 84633, "epoch": 2015} {"train_loss": -6.138677597045898, "global_step": 84634, "epoch": 2015} {"train_loss": -6.097585201263428, "global_step": 84635, "epoch": 2015} {"train_loss": -6.110285758972168, "global_step": 84636, "epoch": 2015} {"train_loss": -6.059052467346191, "global_step": 84637, "epoch": 2015} {"train_loss": -6.0978007316589355, "global_step": 84638, "epoch": 2015} {"train_loss": -6.1536970138549805, "global_step": 84639, "epoch": 2015} {"train_loss": -6.151060104370117, "global_step": 84640, "epoch": 2015} {"train_loss": -6.167525768280029, "global_step": 84641, "epoch": 2015} {"train_loss": -6.124759674072266, "global_step": 84642, "epoch": 2015} {"train_loss": -6.086999893188477, "global_step": 84643, "epoch": 2015} {"train_loss": -6.152831554412842, "global_step": 84644, "epoch": 2015} {"train_loss": -6.224360466003418, "global_step": 84645, "epoch": 2015} {"train_loss": -6.1840667724609375, "global_step": 84646, "epoch": 2015} {"train_loss": -6.294173240661621, "global_step": 84647, "epoch": 2015} {"train_loss": -6.203736782073975, "global_step": 84648, "epoch": 2015} {"train_loss": -6.057095527648926, "global_step": 84649, "epoch": 2015} {"train_loss": -6.195069313049316, "global_step": 84650, "epoch": 2015} {"train_loss": -6.152113914489746, "global_step": 84651, "epoch": 2015} {"train_loss": -6.266822814941406, "global_step": 84652, "epoch": 2015} {"train_loss": -6.136782169342041, "global_step": 84653, "epoch": 2015} {"train_loss": -6.2193779945373535, "global_step": 84654, "epoch": 2015} {"train_loss": -6.297980785369873, "global_step": 84655, "epoch": 2015} {"train_loss": -6.280696868896484, "global_step": 84656, "epoch": 2015} {"train_loss": -6.1912055015563965, "global_step": 84657, "epoch": 2015} {"train_loss": -6.281826972961426, "global_step": 84658, "epoch": 2015} {"train_loss": -6.089768409729004, "global_step": 84659, "epoch": 2015} {"train_loss": -6.20217227935791, "global_step": 84660, "epoch": 2015} {"train_loss": -6.071872711181641, "global_step": 84661, "epoch": 2015} {"train_loss": -6.11787223815918, "global_step": 84662, "epoch": 2015} {"train_loss": -6.278416156768799, "global_step": 84663, "epoch": 2015} {"train_loss": -6.126774311065674, "global_step": 84664, "epoch": 2015} {"train_loss": -6.112886428833008, "global_step": 84665, "epoch": 2015} {"train_loss": -6.222628593444824, "global_step": 84666, "epoch": 2015} {"train_loss": -6.19932746887207, "global_step": 84667, "epoch": 2015} {"train_loss": -6.1132965087890625, "global_step": 84668, "epoch": 2015} {"train_loss": -6.220086097717285, "global_step": 84669, "epoch": 2015} {"train_loss": -6.213930130004883, "global_step": 84670, "epoch": 2015} {"train_loss": -6.165274381637573, "global_step": 84671, "epoch": 2015, "val_loss": 75201.671875} {"train_loss": -6.181329727172852, "global_step": 84672, "epoch": 2016} {"train_loss": -6.232877731323242, "global_step": 84673, "epoch": 2016} {"train_loss": -6.173533916473389, "global_step": 84674, "epoch": 2016} {"train_loss": -6.2463459968566895, "global_step": 84675, "epoch": 2016} {"train_loss": -6.263083457946777, "global_step": 84676, "epoch": 2016} {"train_loss": -6.197853088378906, "global_step": 84677, "epoch": 2016} {"train_loss": -6.1733808517456055, "global_step": 84678, "epoch": 2016} {"train_loss": -6.180873870849609, "global_step": 84679, "epoch": 2016} {"train_loss": -6.183498382568359, "global_step": 84680, "epoch": 2016} {"train_loss": -6.271517753601074, "global_step": 84681, "epoch": 2016} {"train_loss": -6.161541938781738, "global_step": 84682, "epoch": 2016} {"train_loss": -6.273379325866699, "global_step": 84683, "epoch": 2016} {"train_loss": -6.2298383712768555, "global_step": 84684, "epoch": 2016} {"train_loss": -6.132966995239258, "global_step": 84685, "epoch": 2016} {"train_loss": -6.256505966186523, "global_step": 84686, "epoch": 2016} {"train_loss": -6.221784591674805, "global_step": 84687, "epoch": 2016} {"train_loss": -6.180274486541748, "global_step": 84688, "epoch": 2016} {"train_loss": -6.244056701660156, "global_step": 84689, "epoch": 2016} {"train_loss": -6.304770469665527, "global_step": 84690, "epoch": 2016} {"train_loss": -6.219196319580078, "global_step": 84691, "epoch": 2016} {"train_loss": -6.2980852127075195, "global_step": 84692, "epoch": 2016} {"train_loss": -6.080489158630371, "global_step": 84693, "epoch": 2016} {"train_loss": -6.27900505065918, "global_step": 84694, "epoch": 2016} {"train_loss": -6.213770866394043, "global_step": 84695, "epoch": 2016} {"train_loss": -6.1446733474731445, "global_step": 84696, "epoch": 2016} {"train_loss": -6.163874626159668, "global_step": 84697, "epoch": 2016} {"train_loss": -6.252738952636719, "global_step": 84698, "epoch": 2016} {"train_loss": -6.307107925415039, "global_step": 84699, "epoch": 2016} {"train_loss": -6.161773681640625, "global_step": 84700, "epoch": 2016} {"train_loss": -6.19782829284668, "global_step": 84701, "epoch": 2016} {"train_loss": -6.2971720695495605, "global_step": 84702, "epoch": 2016} {"train_loss": -6.210829734802246, "global_step": 84703, "epoch": 2016} {"train_loss": -6.214677810668945, "global_step": 84704, "epoch": 2016} {"train_loss": -6.149401664733887, "global_step": 84705, "epoch": 2016} {"train_loss": -6.205667018890381, "global_step": 84706, "epoch": 2016} {"train_loss": -6.181397914886475, "global_step": 84707, "epoch": 2016} {"train_loss": -6.193669319152832, "global_step": 84708, "epoch": 2016} {"train_loss": -6.197227954864502, "global_step": 84709, "epoch": 2016} {"train_loss": -6.09730339050293, "global_step": 84710, "epoch": 2016} {"train_loss": -6.260498046875, "global_step": 84711, "epoch": 2016} {"train_loss": -6.100421905517578, "global_step": 84712, "epoch": 2016} {"train_loss": -6.211875154858544, "global_step": 84713, "epoch": 2016, "val_loss": 75328.0} {"train_loss": -6.261557579040527, "global_step": 84714, "epoch": 2017} {"train_loss": -6.228412628173828, "global_step": 84715, "epoch": 2017} {"train_loss": -6.240471839904785, "global_step": 84716, "epoch": 2017} {"train_loss": -6.162478446960449, "global_step": 84717, "epoch": 2017} {"train_loss": -6.220458507537842, "global_step": 84718, "epoch": 2017} {"train_loss": -6.298245429992676, "global_step": 84719, "epoch": 2017} {"train_loss": -6.205918312072754, "global_step": 84720, "epoch": 2017} {"train_loss": -6.17653751373291, "global_step": 84721, "epoch": 2017} {"train_loss": -6.137313365936279, "global_step": 84722, "epoch": 2017} {"train_loss": -6.1033477783203125, "global_step": 84723, "epoch": 2017} {"train_loss": -6.159670829772949, "global_step": 84724, "epoch": 2017} {"train_loss": -6.15144157409668, "global_step": 84725, "epoch": 2017} {"train_loss": -6.19440221786499, "global_step": 84726, "epoch": 2017} {"train_loss": -6.107108116149902, "global_step": 84727, "epoch": 2017} {"train_loss": -6.226921081542969, "global_step": 84728, "epoch": 2017} {"train_loss": -6.171971321105957, "global_step": 84729, "epoch": 2017} {"train_loss": -6.294709205627441, "global_step": 84730, "epoch": 2017} {"train_loss": -6.3215436935424805, "global_step": 84731, "epoch": 2017} {"train_loss": -6.231212615966797, "global_step": 84732, "epoch": 2017} {"train_loss": -6.231773376464844, "global_step": 84733, "epoch": 2017} {"train_loss": -6.127891540527344, "global_step": 84734, "epoch": 2017} {"train_loss": -6.21865177154541, "global_step": 84735, "epoch": 2017} {"train_loss": -6.105633735656738, "global_step": 84736, "epoch": 2017} {"train_loss": -6.2229413986206055, "global_step": 84737, "epoch": 2017} {"train_loss": -6.190506935119629, "global_step": 84738, "epoch": 2017} {"train_loss": -6.258412837982178, "global_step": 84739, "epoch": 2017} {"train_loss": -6.114309787750244, "global_step": 84740, "epoch": 2017} {"train_loss": -6.244091033935547, "global_step": 84741, "epoch": 2017} {"train_loss": -6.1341962814331055, "global_step": 84742, "epoch": 2017} {"train_loss": -6.204671859741211, "global_step": 84743, "epoch": 2017} {"train_loss": -6.281769752502441, "global_step": 84744, "epoch": 2017} {"train_loss": -6.252087593078613, "global_step": 84745, "epoch": 2017} {"train_loss": -6.177417755126953, "global_step": 84746, "epoch": 2017} {"train_loss": -6.193102836608887, "global_step": 84747, "epoch": 2017} {"train_loss": -6.320659637451172, "global_step": 84748, "epoch": 2017} {"train_loss": -6.186485767364502, "global_step": 84749, "epoch": 2017} {"train_loss": -6.172901153564453, "global_step": 84750, "epoch": 2017} {"train_loss": -6.193632125854492, "global_step": 84751, "epoch": 2017} {"train_loss": -6.195768356323242, "global_step": 84752, "epoch": 2017} {"train_loss": -6.1212310791015625, "global_step": 84753, "epoch": 2017} {"train_loss": -6.159665107727051, "global_step": 84754, "epoch": 2017} {"train_loss": -6.199891226632254, "global_step": 84755, "epoch": 2017, "val_loss": 75227.5546875} {"train_loss": -6.2939581871032715, "global_step": 84756, "epoch": 2018} {"train_loss": -6.076870918273926, "global_step": 84757, "epoch": 2018} {"train_loss": -6.086897373199463, "global_step": 84758, "epoch": 2018} {"train_loss": -6.26849365234375, "global_step": 84759, "epoch": 2018} {"train_loss": -6.202012062072754, "global_step": 84760, "epoch": 2018} {"train_loss": -6.137687683105469, "global_step": 84761, "epoch": 2018} {"train_loss": -6.073692798614502, "global_step": 84762, "epoch": 2018} {"train_loss": -6.238531112670898, "global_step": 84763, "epoch": 2018} {"train_loss": -6.064101219177246, "global_step": 84764, "epoch": 2018} {"train_loss": -6.079748153686523, "global_step": 84765, "epoch": 2018} {"train_loss": -6.045212745666504, "global_step": 84766, "epoch": 2018} {"train_loss": -6.046903610229492, "global_step": 84767, "epoch": 2018} {"train_loss": -6.151801586151123, "global_step": 84768, "epoch": 2018} {"train_loss": -6.072558403015137, "global_step": 84769, "epoch": 2018} {"train_loss": -6.110395431518555, "global_step": 84770, "epoch": 2018} {"train_loss": -6.077250003814697, "global_step": 84771, "epoch": 2018} {"train_loss": -6.038837432861328, "global_step": 84772, "epoch": 2018} {"train_loss": -6.107570648193359, "global_step": 84773, "epoch": 2018} {"train_loss": -6.054897308349609, "global_step": 84774, "epoch": 2018} {"train_loss": -6.053761005401611, "global_step": 84775, "epoch": 2018} {"train_loss": -6.055567741394043, "global_step": 84776, "epoch": 2018} {"train_loss": -6.22232723236084, "global_step": 84777, "epoch": 2018} {"train_loss": -6.069771766662598, "global_step": 84778, "epoch": 2018} {"train_loss": -6.129389762878418, "global_step": 84779, "epoch": 2018} {"train_loss": -6.133955955505371, "global_step": 84780, "epoch": 2018} {"train_loss": -6.1094865798950195, "global_step": 84781, "epoch": 2018} {"train_loss": -6.250448226928711, "global_step": 84782, "epoch": 2018} {"train_loss": -6.049826145172119, "global_step": 84783, "epoch": 2018} {"train_loss": -6.079739570617676, "global_step": 84784, "epoch": 2018} {"train_loss": -6.164224624633789, "global_step": 84785, "epoch": 2018} {"train_loss": -6.18820858001709, "global_step": 84786, "epoch": 2018} {"train_loss": -6.186469078063965, "global_step": 84787, "epoch": 2018} {"train_loss": -6.107684135437012, "global_step": 84788, "epoch": 2018} {"train_loss": -6.128966808319092, "global_step": 84789, "epoch": 2018} {"train_loss": -6.187233924865723, "global_step": 84790, "epoch": 2018} {"train_loss": -6.102566719055176, "global_step": 84791, "epoch": 2018} {"train_loss": -6.244072914123535, "global_step": 84792, "epoch": 2018} {"train_loss": -6.028456687927246, "global_step": 84793, "epoch": 2018} {"train_loss": -6.036712646484375, "global_step": 84794, "epoch": 2018} {"train_loss": -6.094017028808594, "global_step": 84795, "epoch": 2018} {"train_loss": -6.167844772338867, "global_step": 84796, "epoch": 2018} {"train_loss": -6.124039116359892, "global_step": 84797, "epoch": 2018, "val_loss": 75197.4765625} {"train_loss": -6.148195266723633, "global_step": 84798, "epoch": 2019} {"train_loss": -6.123763561248779, "global_step": 84799, "epoch": 2019} {"train_loss": -6.122051239013672, "global_step": 84800, "epoch": 2019} {"train_loss": -6.136956214904785, "global_step": 84801, "epoch": 2019} {"train_loss": -6.160120487213135, "global_step": 84802, "epoch": 2019} {"train_loss": -6.1737446784973145, "global_step": 84803, "epoch": 2019} {"train_loss": -6.092101097106934, "global_step": 84804, "epoch": 2019} {"train_loss": -6.143683433532715, "global_step": 84805, "epoch": 2019} {"train_loss": -6.161516189575195, "global_step": 84806, "epoch": 2019} {"train_loss": -6.2228240966796875, "global_step": 84807, "epoch": 2019} {"train_loss": -5.932073593139648, "global_step": 84808, "epoch": 2019} {"train_loss": -6.224762916564941, "global_step": 84809, "epoch": 2019} {"train_loss": -5.8969855308532715, "global_step": 84810, "epoch": 2019} {"train_loss": -6.1838226318359375, "global_step": 84811, "epoch": 2019} {"train_loss": -5.919886112213135, "global_step": 84812, "epoch": 2019} {"train_loss": -6.10704231262207, "global_step": 84813, "epoch": 2019} {"train_loss": -6.050838470458984, "global_step": 84814, "epoch": 2019} {"train_loss": -6.216577529907227, "global_step": 84815, "epoch": 2019} {"train_loss": -5.966534614562988, "global_step": 84816, "epoch": 2019} {"train_loss": -6.179825782775879, "global_step": 84817, "epoch": 2019} {"train_loss": -6.131736755371094, "global_step": 84818, "epoch": 2019} {"train_loss": -6.179242134094238, "global_step": 84819, "epoch": 2019} {"train_loss": -6.256866455078125, "global_step": 84820, "epoch": 2019} {"train_loss": -6.00825309753418, "global_step": 84821, "epoch": 2019} {"train_loss": -6.117898464202881, "global_step": 84822, "epoch": 2019} {"train_loss": -6.120017051696777, "global_step": 84823, "epoch": 2019} {"train_loss": -6.134491920471191, "global_step": 84824, "epoch": 2019} {"train_loss": -6.164356231689453, "global_step": 84825, "epoch": 2019} {"train_loss": -6.135303497314453, "global_step": 84826, "epoch": 2019} {"train_loss": -6.1969709396362305, "global_step": 84827, "epoch": 2019} {"train_loss": -6.198371887207031, "global_step": 84828, "epoch": 2019} {"train_loss": -6.134689807891846, "global_step": 84829, "epoch": 2019} {"train_loss": -6.211012840270996, "global_step": 84830, "epoch": 2019} {"train_loss": -6.173182487487793, "global_step": 84831, "epoch": 2019} {"train_loss": -6.239266395568848, "global_step": 84832, "epoch": 2019} {"train_loss": -6.269514083862305, "global_step": 84833, "epoch": 2019} {"train_loss": -6.064962863922119, "global_step": 84834, "epoch": 2019} {"train_loss": -6.087456703186035, "global_step": 84835, "epoch": 2019} {"train_loss": -6.199576377868652, "global_step": 84836, "epoch": 2019} {"train_loss": -6.126105785369873, "global_step": 84837, "epoch": 2019} {"train_loss": -6.107990741729736, "global_step": 84838, "epoch": 2019} {"train_loss": -6.132406280154274, "global_step": 84839, "epoch": 2019, "val_loss": 75015.8515625} {"train_loss": -6.294182777404785, "global_step": 84840, "epoch": 2020} {"train_loss": -6.304724216461182, "global_step": 84841, "epoch": 2020} {"train_loss": -6.2266082763671875, "global_step": 84842, "epoch": 2020} {"train_loss": -6.209636688232422, "global_step": 84843, "epoch": 2020} {"train_loss": -6.1122517585754395, "global_step": 84844, "epoch": 2020} {"train_loss": -6.237356662750244, "global_step": 84845, "epoch": 2020} {"train_loss": -6.390987873077393, "global_step": 84846, "epoch": 2020} {"train_loss": -6.217310905456543, "global_step": 84847, "epoch": 2020} {"train_loss": -6.239994049072266, "global_step": 84848, "epoch": 2020} {"train_loss": -6.312535285949707, "global_step": 84849, "epoch": 2020} {"train_loss": -6.200684547424316, "global_step": 84850, "epoch": 2020} {"train_loss": -6.141406536102295, "global_step": 84851, "epoch": 2020} {"train_loss": -6.2107343673706055, "global_step": 84852, "epoch": 2020} {"train_loss": -6.250633239746094, "global_step": 84853, "epoch": 2020} {"train_loss": -6.187712669372559, "global_step": 84854, "epoch": 2020} {"train_loss": -6.193480014801025, "global_step": 84855, "epoch": 2020} {"train_loss": -6.257664680480957, "global_step": 84856, "epoch": 2020} {"train_loss": -6.2709126472473145, "global_step": 84857, "epoch": 2020} {"train_loss": -6.096980094909668, "global_step": 84858, "epoch": 2020} {"train_loss": -6.308361053466797, "global_step": 84859, "epoch": 2020} {"train_loss": -6.263503074645996, "global_step": 84860, "epoch": 2020} {"train_loss": -6.150991916656494, "global_step": 84861, "epoch": 2020} {"train_loss": -6.289103031158447, "global_step": 84862, "epoch": 2020} {"train_loss": -6.134698390960693, "global_step": 84863, "epoch": 2020} {"train_loss": -6.030331611633301, "global_step": 84864, "epoch": 2020} {"train_loss": -6.327719211578369, "global_step": 84865, "epoch": 2020} {"train_loss": -5.967155456542969, "global_step": 84866, "epoch": 2020} {"train_loss": -6.251338005065918, "global_step": 84867, "epoch": 2020} {"train_loss": -6.225917816162109, "global_step": 84868, "epoch": 2020} {"train_loss": -6.270760536193848, "global_step": 84869, "epoch": 2020} {"train_loss": -6.285060882568359, "global_step": 84870, "epoch": 2020} {"train_loss": -6.154424667358398, "global_step": 84871, "epoch": 2020} {"train_loss": -6.201003074645996, "global_step": 84872, "epoch": 2020} {"train_loss": -6.19288444519043, "global_step": 84873, "epoch": 2020} {"train_loss": -6.181199550628662, "global_step": 84874, "epoch": 2020} {"train_loss": -6.164030075073242, "global_step": 84875, "epoch": 2020} {"train_loss": -6.140885829925537, "global_step": 84876, "epoch": 2020} {"train_loss": -6.195640563964844, "global_step": 84877, "epoch": 2020} {"train_loss": -6.186931610107422, "global_step": 84878, "epoch": 2020} {"train_loss": -6.088031768798828, "global_step": 84879, "epoch": 2020} {"train_loss": -6.142543315887451, "global_step": 84880, "epoch": 2020} {"train_loss": -6.2065159139179045, "global_step": 84881, "epoch": 2020, "val_loss": 75356.90625} {"train_loss": -6.269935131072998, "global_step": 84882, "epoch": 2021} {"train_loss": -6.241211414337158, "global_step": 84883, "epoch": 2021} {"train_loss": -6.223176956176758, "global_step": 84884, "epoch": 2021} {"train_loss": -6.078201770782471, "global_step": 84885, "epoch": 2021} {"train_loss": -6.24074649810791, "global_step": 84886, "epoch": 2021} {"train_loss": -6.200461387634277, "global_step": 84887, "epoch": 2021} {"train_loss": -6.216310501098633, "global_step": 84888, "epoch": 2021} {"train_loss": -6.196384429931641, "global_step": 84889, "epoch": 2021} {"train_loss": -6.245460033416748, "global_step": 84890, "epoch": 2021} {"train_loss": -6.285560607910156, "global_step": 84891, "epoch": 2021} {"train_loss": -6.33695125579834, "global_step": 84892, "epoch": 2021} {"train_loss": -6.09205961227417, "global_step": 84893, "epoch": 2021} {"train_loss": -6.118466377258301, "global_step": 84894, "epoch": 2021} {"train_loss": -6.275078296661377, "global_step": 84895, "epoch": 2021} {"train_loss": -6.231651306152344, "global_step": 84896, "epoch": 2021} {"train_loss": -6.136943817138672, "global_step": 84897, "epoch": 2021} {"train_loss": -6.229877948760986, "global_step": 84898, "epoch": 2021} {"train_loss": -6.2116498947143555, "global_step": 84899, "epoch": 2021} {"train_loss": -6.372679233551025, "global_step": 84900, "epoch": 2021} {"train_loss": -6.1620869636535645, "global_step": 84901, "epoch": 2021} {"train_loss": -6.132743835449219, "global_step": 84902, "epoch": 2021} {"train_loss": -6.116642951965332, "global_step": 84903, "epoch": 2021} {"train_loss": -6.263206958770752, "global_step": 84904, "epoch": 2021} {"train_loss": -6.0899763107299805, "global_step": 84905, "epoch": 2021} {"train_loss": -6.21064567565918, "global_step": 84906, "epoch": 2021} {"train_loss": -6.035362720489502, "global_step": 84907, "epoch": 2021} {"train_loss": -6.214489459991455, "global_step": 84908, "epoch": 2021} {"train_loss": -6.251869201660156, "global_step": 84909, "epoch": 2021} {"train_loss": -6.310976982116699, "global_step": 84910, "epoch": 2021} {"train_loss": -6.174862384796143, "global_step": 84911, "epoch": 2021} {"train_loss": -6.325294017791748, "global_step": 84912, "epoch": 2021} {"train_loss": -6.153125762939453, "global_step": 84913, "epoch": 2021} {"train_loss": -6.1530232429504395, "global_step": 84914, "epoch": 2021} {"train_loss": -6.200984954833984, "global_step": 84915, "epoch": 2021} {"train_loss": -6.126405239105225, "global_step": 84916, "epoch": 2021} {"train_loss": -6.138828277587891, "global_step": 84917, "epoch": 2021} {"train_loss": -6.169750213623047, "global_step": 84918, "epoch": 2021} {"train_loss": -6.148350715637207, "global_step": 84919, "epoch": 2021} {"train_loss": -6.239198684692383, "global_step": 84920, "epoch": 2021} {"train_loss": -6.060647010803223, "global_step": 84921, "epoch": 2021} {"train_loss": -6.234715461730957, "global_step": 84922, "epoch": 2021} {"train_loss": -6.197054590497698, "global_step": 84923, "epoch": 2021, "val_loss": 75603.109375} {"train_loss": -6.01901912689209, "global_step": 84924, "epoch": 2022} {"train_loss": -6.077973365783691, "global_step": 84925, "epoch": 2022} {"train_loss": -6.185993671417236, "global_step": 84926, "epoch": 2022} {"train_loss": -6.108191013336182, "global_step": 84927, "epoch": 2022} {"train_loss": -6.2367072105407715, "global_step": 84928, "epoch": 2022} {"train_loss": -6.1738972663879395, "global_step": 84929, "epoch": 2022} {"train_loss": -6.158115386962891, "global_step": 84930, "epoch": 2022} {"train_loss": -6.161829948425293, "global_step": 84931, "epoch": 2022} {"train_loss": -6.258326530456543, "global_step": 84932, "epoch": 2022} {"train_loss": -6.108182907104492, "global_step": 84933, "epoch": 2022} {"train_loss": -6.190127849578857, "global_step": 84934, "epoch": 2022} {"train_loss": -6.0346879959106445, "global_step": 84935, "epoch": 2022} {"train_loss": -6.26768684387207, "global_step": 84936, "epoch": 2022} {"train_loss": -6.1825385093688965, "global_step": 84937, "epoch": 2022} {"train_loss": -6.154415607452393, "global_step": 84938, "epoch": 2022} {"train_loss": -6.248702049255371, "global_step": 84939, "epoch": 2022} {"train_loss": -6.095090866088867, "global_step": 84940, "epoch": 2022} {"train_loss": -6.269055366516113, "global_step": 84941, "epoch": 2022} {"train_loss": -6.195136547088623, "global_step": 84942, "epoch": 2022} {"train_loss": -6.179664611816406, "global_step": 84943, "epoch": 2022} {"train_loss": -6.361449241638184, "global_step": 84944, "epoch": 2022} {"train_loss": -6.281989574432373, "global_step": 84945, "epoch": 2022} {"train_loss": -6.154797077178955, "global_step": 84946, "epoch": 2022} {"train_loss": -6.192218780517578, "global_step": 84947, "epoch": 2022} {"train_loss": -6.078180313110352, "global_step": 84948, "epoch": 2022} {"train_loss": -6.169217586517334, "global_step": 84949, "epoch": 2022} {"train_loss": -6.188357353210449, "global_step": 84950, "epoch": 2022} {"train_loss": -6.285698890686035, "global_step": 84951, "epoch": 2022} {"train_loss": -6.326699256896973, "global_step": 84952, "epoch": 2022} {"train_loss": -6.234203338623047, "global_step": 84953, "epoch": 2022} {"train_loss": -6.325664520263672, "global_step": 84954, "epoch": 2022} {"train_loss": -6.179281234741211, "global_step": 84955, "epoch": 2022} {"train_loss": -6.262923717498779, "global_step": 84956, "epoch": 2022} {"train_loss": -6.148347854614258, "global_step": 84957, "epoch": 2022} {"train_loss": -6.102840900421143, "global_step": 84958, "epoch": 2022} {"train_loss": -6.163224220275879, "global_step": 84959, "epoch": 2022} {"train_loss": -6.228426456451416, "global_step": 84960, "epoch": 2022} {"train_loss": -6.365200996398926, "global_step": 84961, "epoch": 2022} {"train_loss": -6.174349784851074, "global_step": 84962, "epoch": 2022} {"train_loss": -6.230108737945557, "global_step": 84963, "epoch": 2022} {"train_loss": -6.256402969360352, "global_step": 84964, "epoch": 2022} {"train_loss": -6.195347661063785, "global_step": 84965, "epoch": 2022, "val_loss": 74643.640625} {"train_loss": -6.137587547302246, "global_step": 84966, "epoch": 2023} {"train_loss": -6.277800559997559, "global_step": 84967, "epoch": 2023} {"train_loss": -6.2410807609558105, "global_step": 84968, "epoch": 2023} {"train_loss": -6.311169624328613, "global_step": 84969, "epoch": 2023} {"train_loss": -6.178260803222656, "global_step": 84970, "epoch": 2023} {"train_loss": -6.260935306549072, "global_step": 84971, "epoch": 2023} {"train_loss": -6.21809196472168, "global_step": 84972, "epoch": 2023} {"train_loss": -6.277392387390137, "global_step": 84973, "epoch": 2023} {"train_loss": -6.135765075683594, "global_step": 84974, "epoch": 2023} {"train_loss": -6.206534385681152, "global_step": 84975, "epoch": 2023} {"train_loss": -6.2404584884643555, "global_step": 84976, "epoch": 2023} {"train_loss": -6.0645647048950195, "global_step": 84977, "epoch": 2023} {"train_loss": -6.09581995010376, "global_step": 84978, "epoch": 2023} {"train_loss": -6.190037250518799, "global_step": 84979, "epoch": 2023} {"train_loss": -6.044811725616455, "global_step": 84980, "epoch": 2023} {"train_loss": -6.1230010986328125, "global_step": 84981, "epoch": 2023} {"train_loss": -6.097507953643799, "global_step": 84982, "epoch": 2023} {"train_loss": -6.304138660430908, "global_step": 84983, "epoch": 2023} {"train_loss": -6.250399589538574, "global_step": 84984, "epoch": 2023} {"train_loss": -6.329376220703125, "global_step": 84985, "epoch": 2023} {"train_loss": -6.197274208068848, "global_step": 84986, "epoch": 2023} {"train_loss": -6.064084053039551, "global_step": 84987, "epoch": 2023} {"train_loss": -6.136844635009766, "global_step": 84988, "epoch": 2023} {"train_loss": -6.168515205383301, "global_step": 84989, "epoch": 2023} {"train_loss": -6.185959339141846, "global_step": 84990, "epoch": 2023} {"train_loss": -6.274441719055176, "global_step": 84991, "epoch": 2023} {"train_loss": -6.194581985473633, "global_step": 84992, "epoch": 2023} {"train_loss": -5.985595703125, "global_step": 84993, "epoch": 2023} {"train_loss": -6.2420196533203125, "global_step": 84994, "epoch": 2023} {"train_loss": -6.225549697875977, "global_step": 84995, "epoch": 2023} {"train_loss": -6.126377582550049, "global_step": 84996, "epoch": 2023} {"train_loss": -6.266915321350098, "global_step": 84997, "epoch": 2023} {"train_loss": -6.209802627563477, "global_step": 84998, "epoch": 2023} {"train_loss": -6.2426605224609375, "global_step": 84999, "epoch": 2023} {"train_loss": -6.207366943359375, "global_step": 85000, "epoch": 2023} {"train_loss": -6.135893821716309, "global_step": 85001, "epoch": 2023} {"train_loss": -6.105971336364746, "global_step": 85002, "epoch": 2023} {"train_loss": -6.218985080718994, "global_step": 85003, "epoch": 2023} {"train_loss": -6.196507453918457, "global_step": 85004, "epoch": 2023} {"train_loss": -6.2507171630859375, "global_step": 85005, "epoch": 2023} {"train_loss": -6.146652698516846, "global_step": 85006, "epoch": 2023} {"train_loss": -6.190360489345732, "global_step": 85007, "epoch": 2023, "val_loss": 75227.1640625} {"train_loss": -6.105044364929199, "global_step": 85008, "epoch": 2024} {"train_loss": -6.218061447143555, "global_step": 85009, "epoch": 2024} {"train_loss": -6.175784587860107, "global_step": 85010, "epoch": 2024} {"train_loss": -6.217940807342529, "global_step": 85011, "epoch": 2024} {"train_loss": -6.248945713043213, "global_step": 85012, "epoch": 2024} {"train_loss": -6.13715124130249, "global_step": 85013, "epoch": 2024} {"train_loss": -6.250360488891602, "global_step": 85014, "epoch": 2024} {"train_loss": -6.182828903198242, "global_step": 85015, "epoch": 2024} {"train_loss": -6.105267524719238, "global_step": 85016, "epoch": 2024} {"train_loss": -6.229795455932617, "global_step": 85017, "epoch": 2024} {"train_loss": -6.109570503234863, "global_step": 85018, "epoch": 2024} {"train_loss": -6.159173965454102, "global_step": 85019, "epoch": 2024} {"train_loss": -6.128877639770508, "global_step": 85020, "epoch": 2024} {"train_loss": -6.11446475982666, "global_step": 85021, "epoch": 2024} {"train_loss": -6.059436798095703, "global_step": 85022, "epoch": 2024} {"train_loss": -6.051772594451904, "global_step": 85023, "epoch": 2024} {"train_loss": -6.173803806304932, "global_step": 85024, "epoch": 2024} {"train_loss": -6.1443891525268555, "global_step": 85025, "epoch": 2024} {"train_loss": -5.996194362640381, "global_step": 85026, "epoch": 2024} {"train_loss": -6.306222915649414, "global_step": 85027, "epoch": 2024} {"train_loss": -6.078544616699219, "global_step": 85028, "epoch": 2024} {"train_loss": -6.281313419342041, "global_step": 85029, "epoch": 2024} {"train_loss": -6.1591057777404785, "global_step": 85030, "epoch": 2024} {"train_loss": -6.213774681091309, "global_step": 85031, "epoch": 2024} {"train_loss": -6.297044277191162, "global_step": 85032, "epoch": 2024} {"train_loss": -6.153205871582031, "global_step": 85033, "epoch": 2024} {"train_loss": -6.214454650878906, "global_step": 85034, "epoch": 2024} {"train_loss": -6.223568916320801, "global_step": 85035, "epoch": 2024} {"train_loss": -6.130062103271484, "global_step": 85036, "epoch": 2024} {"train_loss": -6.139317989349365, "global_step": 85037, "epoch": 2024} {"train_loss": -6.1682891845703125, "global_step": 85038, "epoch": 2024} {"train_loss": -6.158201217651367, "global_step": 85039, "epoch": 2024} {"train_loss": -6.236237525939941, "global_step": 85040, "epoch": 2024} {"train_loss": -6.17458963394165, "global_step": 85041, "epoch": 2024} {"train_loss": -6.070765018463135, "global_step": 85042, "epoch": 2024} {"train_loss": -6.204799175262451, "global_step": 85043, "epoch": 2024} {"train_loss": -6.152254104614258, "global_step": 85044, "epoch": 2024} {"train_loss": -6.213395118713379, "global_step": 85045, "epoch": 2024} {"train_loss": -6.306663513183594, "global_step": 85046, "epoch": 2024} {"train_loss": -6.120009422302246, "global_step": 85047, "epoch": 2024} {"train_loss": -6.08866024017334, "global_step": 85048, "epoch": 2024} {"train_loss": -6.170211814698719, "global_step": 85049, "epoch": 2024, "val_loss": 75251.6328125} {"train_loss": -6.153830528259277, "global_step": 85050, "epoch": 2025} {"train_loss": -6.182894229888916, "global_step": 85051, "epoch": 2025} {"train_loss": -6.0236077308654785, "global_step": 85052, "epoch": 2025} {"train_loss": -6.046987056732178, "global_step": 85053, "epoch": 2025} {"train_loss": -6.193902969360352, "global_step": 85054, "epoch": 2025} {"train_loss": -6.013904571533203, "global_step": 85055, "epoch": 2025} {"train_loss": -6.09628963470459, "global_step": 85056, "epoch": 2025} {"train_loss": -6.063543319702148, "global_step": 85057, "epoch": 2025} {"train_loss": -6.04844331741333, "global_step": 85058, "epoch": 2025} {"train_loss": -6.0426154136657715, "global_step": 85059, "epoch": 2025} {"train_loss": -6.146816253662109, "global_step": 85060, "epoch": 2025} {"train_loss": -6.12733268737793, "global_step": 85061, "epoch": 2025} {"train_loss": -6.231250762939453, "global_step": 85062, "epoch": 2025} {"train_loss": -6.033690452575684, "global_step": 85063, "epoch": 2025} {"train_loss": -6.176815032958984, "global_step": 85064, "epoch": 2025} {"train_loss": -6.07183837890625, "global_step": 85065, "epoch": 2025} {"train_loss": -6.1733880043029785, "global_step": 85066, "epoch": 2025} {"train_loss": -6.066089153289795, "global_step": 85067, "epoch": 2025} {"train_loss": -6.1801347732543945, "global_step": 85068, "epoch": 2025} {"train_loss": -6.045507431030273, "global_step": 85069, "epoch": 2025} {"train_loss": -6.338840961456299, "global_step": 85070, "epoch": 2025} {"train_loss": -6.084021091461182, "global_step": 85071, "epoch": 2025} {"train_loss": -6.11687707901001, "global_step": 85072, "epoch": 2025} {"train_loss": -6.084815502166748, "global_step": 85073, "epoch": 2025} {"train_loss": -6.115223407745361, "global_step": 85074, "epoch": 2025} {"train_loss": -6.096642017364502, "global_step": 85075, "epoch": 2025} {"train_loss": -6.163103103637695, "global_step": 85076, "epoch": 2025} {"train_loss": -6.131484031677246, "global_step": 85077, "epoch": 2025} {"train_loss": -6.0913238525390625, "global_step": 85078, "epoch": 2025} {"train_loss": -6.132615089416504, "global_step": 85079, "epoch": 2025} {"train_loss": -6.245859146118164, "global_step": 85080, "epoch": 2025} {"train_loss": -6.1541900634765625, "global_step": 85081, "epoch": 2025} {"train_loss": -6.238061428070068, "global_step": 85082, "epoch": 2025} {"train_loss": -6.225622653961182, "global_step": 85083, "epoch": 2025} {"train_loss": -5.915174961090088, "global_step": 85084, "epoch": 2025} {"train_loss": -6.215223789215088, "global_step": 85085, "epoch": 2025} {"train_loss": -6.125682830810547, "global_step": 85086, "epoch": 2025} {"train_loss": -6.169585227966309, "global_step": 85087, "epoch": 2025} {"train_loss": -6.076372146606445, "global_step": 85088, "epoch": 2025} {"train_loss": -6.346506118774414, "global_step": 85089, "epoch": 2025} {"train_loss": -6.180795192718506, "global_step": 85090, "epoch": 2025} {"train_loss": -6.133618434270223, "global_step": 85091, "epoch": 2025, "val_loss": 75020.671875} {"train_loss": -6.278999328613281, "global_step": 85092, "epoch": 2026} {"train_loss": -6.086834907531738, "global_step": 85093, "epoch": 2026} {"train_loss": -6.113123416900635, "global_step": 85094, "epoch": 2026} {"train_loss": -6.118356704711914, "global_step": 85095, "epoch": 2026} {"train_loss": -6.219025135040283, "global_step": 85096, "epoch": 2026} {"train_loss": -6.300567150115967, "global_step": 85097, "epoch": 2026} {"train_loss": -6.157991409301758, "global_step": 85098, "epoch": 2026} {"train_loss": -6.2630510330200195, "global_step": 85099, "epoch": 2026} {"train_loss": -6.158912658691406, "global_step": 85100, "epoch": 2026} {"train_loss": -6.057303428649902, "global_step": 85101, "epoch": 2026} {"train_loss": -6.191438674926758, "global_step": 85102, "epoch": 2026} {"train_loss": -6.233388423919678, "global_step": 85103, "epoch": 2026} {"train_loss": -6.292697906494141, "global_step": 85104, "epoch": 2026} {"train_loss": -6.178842544555664, "global_step": 85105, "epoch": 2026} {"train_loss": -6.300017833709717, "global_step": 85106, "epoch": 2026} {"train_loss": -6.2323408126831055, "global_step": 85107, "epoch": 2026} {"train_loss": -6.245899677276611, "global_step": 85108, "epoch": 2026} {"train_loss": -6.276468276977539, "global_step": 85109, "epoch": 2026} {"train_loss": -6.195799827575684, "global_step": 85110, "epoch": 2026} {"train_loss": -6.257903099060059, "global_step": 85111, "epoch": 2026} {"train_loss": -6.145461559295654, "global_step": 85112, "epoch": 2026} {"train_loss": -6.265810966491699, "global_step": 85113, "epoch": 2026} {"train_loss": -6.303524971008301, "global_step": 85114, "epoch": 2026} {"train_loss": -6.180686950683594, "global_step": 85115, "epoch": 2026} {"train_loss": -6.210715293884277, "global_step": 85116, "epoch": 2026} {"train_loss": -6.249181747436523, "global_step": 85117, "epoch": 2026} {"train_loss": -6.2075958251953125, "global_step": 85118, "epoch": 2026} {"train_loss": -6.14095401763916, "global_step": 85119, "epoch": 2026} {"train_loss": -6.0824971199035645, "global_step": 85120, "epoch": 2026} {"train_loss": -6.119575500488281, "global_step": 85121, "epoch": 2026} {"train_loss": -6.106019020080566, "global_step": 85122, "epoch": 2026} {"train_loss": -6.19258975982666, "global_step": 85123, "epoch": 2026} {"train_loss": -6.153210163116455, "global_step": 85124, "epoch": 2026} {"train_loss": -6.234602928161621, "global_step": 85125, "epoch": 2026} {"train_loss": -6.12030029296875, "global_step": 85126, "epoch": 2026} {"train_loss": -6.068767070770264, "global_step": 85127, "epoch": 2026} {"train_loss": -6.1040143966674805, "global_step": 85128, "epoch": 2026} {"train_loss": -6.238364219665527, "global_step": 85129, "epoch": 2026} {"train_loss": -6.171664237976074, "global_step": 85130, "epoch": 2026} {"train_loss": -6.120650291442871, "global_step": 85131, "epoch": 2026} {"train_loss": -6.255760192871094, "global_step": 85132, "epoch": 2026} {"train_loss": -6.18952404885065, "global_step": 85133, "epoch": 2026, "val_loss": 75016.0625} {"train_loss": -6.04168701171875, "global_step": 85134, "epoch": 2027} {"train_loss": -6.265774250030518, "global_step": 85135, "epoch": 2027} {"train_loss": -6.14484977722168, "global_step": 85136, "epoch": 2027} {"train_loss": -6.169812202453613, "global_step": 85137, "epoch": 2027} {"train_loss": -6.202703475952148, "global_step": 85138, "epoch": 2027} {"train_loss": -6.097294807434082, "global_step": 85139, "epoch": 2027} {"train_loss": -6.281460762023926, "global_step": 85140, "epoch": 2027} {"train_loss": -6.152937889099121, "global_step": 85141, "epoch": 2027} {"train_loss": -6.172458648681641, "global_step": 85142, "epoch": 2027} {"train_loss": -6.222148895263672, "global_step": 85143, "epoch": 2027} {"train_loss": -6.174871444702148, "global_step": 85144, "epoch": 2027} {"train_loss": -6.230990409851074, "global_step": 85145, "epoch": 2027} {"train_loss": -6.262700080871582, "global_step": 85146, "epoch": 2027} {"train_loss": -6.096839904785156, "global_step": 85147, "epoch": 2027} {"train_loss": -6.27573299407959, "global_step": 85148, "epoch": 2027} {"train_loss": -6.235391616821289, "global_step": 85149, "epoch": 2027} {"train_loss": -6.164103031158447, "global_step": 85150, "epoch": 2027} {"train_loss": -6.224831581115723, "global_step": 85151, "epoch": 2027} {"train_loss": -6.246131896972656, "global_step": 85152, "epoch": 2027} {"train_loss": -6.1350507736206055, "global_step": 85153, "epoch": 2027} {"train_loss": -6.278274059295654, "global_step": 85154, "epoch": 2027} {"train_loss": -6.230243682861328, "global_step": 85155, "epoch": 2027} {"train_loss": -6.091230392456055, "global_step": 85156, "epoch": 2027} {"train_loss": -6.057033538818359, "global_step": 85157, "epoch": 2027} {"train_loss": -6.283978462219238, "global_step": 85158, "epoch": 2027} {"train_loss": -6.287338733673096, "global_step": 85159, "epoch": 2027} {"train_loss": -6.253652572631836, "global_step": 85160, "epoch": 2027} {"train_loss": -6.188312530517578, "global_step": 85161, "epoch": 2027} {"train_loss": -6.25594425201416, "global_step": 85162, "epoch": 2027} {"train_loss": -6.158718109130859, "global_step": 85163, "epoch": 2027} {"train_loss": -6.216208457946777, "global_step": 85164, "epoch": 2027} {"train_loss": -6.179055213928223, "global_step": 85165, "epoch": 2027} {"train_loss": -6.275003910064697, "global_step": 85166, "epoch": 2027} {"train_loss": -6.100412845611572, "global_step": 85167, "epoch": 2027} {"train_loss": -6.157384872436523, "global_step": 85168, "epoch": 2027} {"train_loss": -6.146419525146484, "global_step": 85169, "epoch": 2027} {"train_loss": -6.1839599609375, "global_step": 85170, "epoch": 2027} {"train_loss": -6.201617240905762, "global_step": 85171, "epoch": 2027} {"train_loss": -6.282172203063965, "global_step": 85172, "epoch": 2027} {"train_loss": -6.140829086303711, "global_step": 85173, "epoch": 2027} {"train_loss": -6.179318428039551, "global_step": 85174, "epoch": 2027} {"train_loss": -6.194486992699759, "global_step": 85175, "epoch": 2027, "val_loss": 75111.265625} {"train_loss": -6.347250461578369, "global_step": 85176, "epoch": 2028} {"train_loss": -6.246757507324219, "global_step": 85177, "epoch": 2028} {"train_loss": -6.229524612426758, "global_step": 85178, "epoch": 2028} {"train_loss": -6.179384231567383, "global_step": 85179, "epoch": 2028} {"train_loss": -6.112822532653809, "global_step": 85180, "epoch": 2028} {"train_loss": -6.197360515594482, "global_step": 85181, "epoch": 2028} {"train_loss": -6.225034713745117, "global_step": 85182, "epoch": 2028} {"train_loss": -6.186347961425781, "global_step": 85183, "epoch": 2028} {"train_loss": -6.2806830406188965, "global_step": 85184, "epoch": 2028} {"train_loss": -6.186978340148926, "global_step": 85185, "epoch": 2028} {"train_loss": -6.1794610023498535, "global_step": 85186, "epoch": 2028} {"train_loss": -6.041076183319092, "global_step": 85187, "epoch": 2028} {"train_loss": -6.2097487449646, "global_step": 85188, "epoch": 2028} {"train_loss": -6.125068664550781, "global_step": 85189, "epoch": 2028} {"train_loss": -6.214738368988037, "global_step": 85190, "epoch": 2028} {"train_loss": -6.2038774490356445, "global_step": 85191, "epoch": 2028} {"train_loss": -6.135774612426758, "global_step": 85192, "epoch": 2028} {"train_loss": -6.185214519500732, "global_step": 85193, "epoch": 2028} {"train_loss": -6.2839226722717285, "global_step": 85194, "epoch": 2028} {"train_loss": -6.29093074798584, "global_step": 85195, "epoch": 2028} {"train_loss": -6.152944564819336, "global_step": 85196, "epoch": 2028} {"train_loss": -6.183484077453613, "global_step": 85197, "epoch": 2028} {"train_loss": -6.247955322265625, "global_step": 85198, "epoch": 2028} {"train_loss": -6.078760147094727, "global_step": 85199, "epoch": 2028} {"train_loss": -6.247459411621094, "global_step": 85200, "epoch": 2028} {"train_loss": -6.2444305419921875, "global_step": 85201, "epoch": 2028} {"train_loss": -6.185471534729004, "global_step": 85202, "epoch": 2028} {"train_loss": -6.322040557861328, "global_step": 85203, "epoch": 2028} {"train_loss": -6.286642074584961, "global_step": 85204, "epoch": 2028} {"train_loss": -6.193868160247803, "global_step": 85205, "epoch": 2028} {"train_loss": -6.252438068389893, "global_step": 85206, "epoch": 2028} {"train_loss": -6.20830774307251, "global_step": 85207, "epoch": 2028} {"train_loss": -6.2224202156066895, "global_step": 85208, "epoch": 2028} {"train_loss": -6.273824691772461, "global_step": 85209, "epoch": 2028} {"train_loss": -6.1167449951171875, "global_step": 85210, "epoch": 2028} {"train_loss": -6.28068733215332, "global_step": 85211, "epoch": 2028} {"train_loss": -6.216272830963135, "global_step": 85212, "epoch": 2028} {"train_loss": -6.260704040527344, "global_step": 85213, "epoch": 2028} {"train_loss": -6.258142948150635, "global_step": 85214, "epoch": 2028} {"train_loss": -6.085041046142578, "global_step": 85215, "epoch": 2028} {"train_loss": -6.210747718811035, "global_step": 85216, "epoch": 2028} {"train_loss": -6.210782675516038, "global_step": 85217, "epoch": 2028, "val_loss": 75161.390625} {"train_loss": -6.206975936889648, "global_step": 85218, "epoch": 2029} {"train_loss": -6.283427715301514, "global_step": 85219, "epoch": 2029} {"train_loss": -6.216037273406982, "global_step": 85220, "epoch": 2029} {"train_loss": -6.250239372253418, "global_step": 85221, "epoch": 2029} {"train_loss": -6.270425319671631, "global_step": 85222, "epoch": 2029} {"train_loss": -6.118522644042969, "global_step": 85223, "epoch": 2029} {"train_loss": -6.219399929046631, "global_step": 85224, "epoch": 2029} {"train_loss": -6.199221611022949, "global_step": 85225, "epoch": 2029} {"train_loss": -6.3767242431640625, "global_step": 85226, "epoch": 2029} {"train_loss": -6.242297649383545, "global_step": 85227, "epoch": 2029} {"train_loss": -6.274228096008301, "global_step": 85228, "epoch": 2029} {"train_loss": -6.259937286376953, "global_step": 85229, "epoch": 2029} {"train_loss": -6.2350592613220215, "global_step": 85230, "epoch": 2029} {"train_loss": -6.229704856872559, "global_step": 85231, "epoch": 2029} {"train_loss": -6.278835773468018, "global_step": 85232, "epoch": 2029} {"train_loss": -6.21048641204834, "global_step": 85233, "epoch": 2029} {"train_loss": -6.289668083190918, "global_step": 85234, "epoch": 2029} {"train_loss": -6.164431571960449, "global_step": 85235, "epoch": 2029} {"train_loss": -6.278141498565674, "global_step": 85236, "epoch": 2029} {"train_loss": -6.256033897399902, "global_step": 85237, "epoch": 2029} {"train_loss": -6.249351501464844, "global_step": 85238, "epoch": 2029} {"train_loss": -6.173399925231934, "global_step": 85239, "epoch": 2029} {"train_loss": -6.250513553619385, "global_step": 85240, "epoch": 2029} {"train_loss": -6.10915470123291, "global_step": 85241, "epoch": 2029} {"train_loss": -6.184236526489258, "global_step": 85242, "epoch": 2029} {"train_loss": -6.233659744262695, "global_step": 85243, "epoch": 2029} {"train_loss": -6.107027053833008, "global_step": 85244, "epoch": 2029} {"train_loss": -6.141796112060547, "global_step": 85245, "epoch": 2029} {"train_loss": -6.130173683166504, "global_step": 85246, "epoch": 2029} {"train_loss": -6.0567097663879395, "global_step": 85247, "epoch": 2029} {"train_loss": -6.154214859008789, "global_step": 85248, "epoch": 2029} {"train_loss": -6.188113212585449, "global_step": 85249, "epoch": 2029} {"train_loss": -6.153378009796143, "global_step": 85250, "epoch": 2029} {"train_loss": -6.112573623657227, "global_step": 85251, "epoch": 2029} {"train_loss": -6.038782119750977, "global_step": 85252, "epoch": 2029} {"train_loss": -6.193925857543945, "global_step": 85253, "epoch": 2029} {"train_loss": -6.111220836639404, "global_step": 85254, "epoch": 2029} {"train_loss": -6.236396789550781, "global_step": 85255, "epoch": 2029} {"train_loss": -6.204824924468994, "global_step": 85256, "epoch": 2029} {"train_loss": -6.177519798278809, "global_step": 85257, "epoch": 2029} {"train_loss": -6.098172187805176, "global_step": 85258, "epoch": 2029} {"train_loss": -6.2004037243979315, "global_step": 85259, "epoch": 2029, "val_loss": 74846.8046875} {"train_loss": -6.253879070281982, "global_step": 85260, "epoch": 2030} {"train_loss": -6.188802242279053, "global_step": 85261, "epoch": 2030} {"train_loss": -6.17415714263916, "global_step": 85262, "epoch": 2030} {"train_loss": -6.22623348236084, "global_step": 85263, "epoch": 2030} {"train_loss": -6.163962364196777, "global_step": 85264, "epoch": 2030} {"train_loss": -6.150658130645752, "global_step": 85265, "epoch": 2030} {"train_loss": -6.2404632568359375, "global_step": 85266, "epoch": 2030} {"train_loss": -6.049960136413574, "global_step": 85267, "epoch": 2030} {"train_loss": -6.114923477172852, "global_step": 85268, "epoch": 2030} {"train_loss": -6.15206241607666, "global_step": 85269, "epoch": 2030} {"train_loss": -6.231337547302246, "global_step": 85270, "epoch": 2030} {"train_loss": -6.1272807121276855, "global_step": 85271, "epoch": 2030} {"train_loss": -6.190463542938232, "global_step": 85272, "epoch": 2030} {"train_loss": -6.038679122924805, "global_step": 85273, "epoch": 2030} {"train_loss": -6.0990753173828125, "global_step": 85274, "epoch": 2030} {"train_loss": -6.1693549156188965, "global_step": 85275, "epoch": 2030} {"train_loss": -6.116022109985352, "global_step": 85276, "epoch": 2030} {"train_loss": -6.189426422119141, "global_step": 85277, "epoch": 2030} {"train_loss": -6.164359092712402, "global_step": 85278, "epoch": 2030} {"train_loss": -6.228004455566406, "global_step": 85279, "epoch": 2030} {"train_loss": -5.9729509353637695, "global_step": 85280, "epoch": 2030} {"train_loss": -6.075519561767578, "global_step": 85281, "epoch": 2030} {"train_loss": -6.19553279876709, "global_step": 85282, "epoch": 2030} {"train_loss": -6.195324897766113, "global_step": 85283, "epoch": 2030} {"train_loss": -6.161044120788574, "global_step": 85284, "epoch": 2030} {"train_loss": -6.167050361633301, "global_step": 85285, "epoch": 2030} {"train_loss": -6.161714553833008, "global_step": 85286, "epoch": 2030} {"train_loss": -6.201687812805176, "global_step": 85287, "epoch": 2030} {"train_loss": -6.081047058105469, "global_step": 85288, "epoch": 2030} {"train_loss": -6.219721794128418, "global_step": 85289, "epoch": 2030} {"train_loss": -6.245754241943359, "global_step": 85290, "epoch": 2030} {"train_loss": -6.21419620513916, "global_step": 85291, "epoch": 2030} {"train_loss": -6.175045967102051, "global_step": 85292, "epoch": 2030} {"train_loss": -6.2026543617248535, "global_step": 85293, "epoch": 2030} {"train_loss": -6.174942493438721, "global_step": 85294, "epoch": 2030} {"train_loss": -6.201303482055664, "global_step": 85295, "epoch": 2030} {"train_loss": -6.249475479125977, "global_step": 85296, "epoch": 2030} {"train_loss": -6.318737983703613, "global_step": 85297, "epoch": 2030} {"train_loss": -6.10944938659668, "global_step": 85298, "epoch": 2030} {"train_loss": -6.223296165466309, "global_step": 85299, "epoch": 2030} {"train_loss": -6.159546852111816, "global_step": 85300, "epoch": 2030} {"train_loss": -6.170309134892055, "global_step": 85301, "epoch": 2030, "val_loss": 74970.84375} {"train_loss": -6.261387348175049, "global_step": 85302, "epoch": 2031} {"train_loss": -6.248330593109131, "global_step": 85303, "epoch": 2031} {"train_loss": -6.252511978149414, "global_step": 85304, "epoch": 2031} {"train_loss": -6.234978675842285, "global_step": 85305, "epoch": 2031} {"train_loss": -6.161408424377441, "global_step": 85306, "epoch": 2031} {"train_loss": -6.170098781585693, "global_step": 85307, "epoch": 2031} {"train_loss": -6.175436019897461, "global_step": 85308, "epoch": 2031} {"train_loss": -6.172680854797363, "global_step": 85309, "epoch": 2031} {"train_loss": -6.243248462677002, "global_step": 85310, "epoch": 2031} {"train_loss": -6.258455276489258, "global_step": 85311, "epoch": 2031} {"train_loss": -6.2593994140625, "global_step": 85312, "epoch": 2031} {"train_loss": -5.996126651763916, "global_step": 85313, "epoch": 2031} {"train_loss": -6.208683490753174, "global_step": 85314, "epoch": 2031} {"train_loss": -6.253454208374023, "global_step": 85315, "epoch": 2031} {"train_loss": -6.147095680236816, "global_step": 85316, "epoch": 2031} {"train_loss": -6.179244518280029, "global_step": 85317, "epoch": 2031} {"train_loss": -6.215474605560303, "global_step": 85318, "epoch": 2031} {"train_loss": -6.096590995788574, "global_step": 85319, "epoch": 2031} {"train_loss": -6.163675785064697, "global_step": 85320, "epoch": 2031} {"train_loss": -6.286721229553223, "global_step": 85321, "epoch": 2031} {"train_loss": -6.200322151184082, "global_step": 85322, "epoch": 2031} {"train_loss": -6.30892276763916, "global_step": 85323, "epoch": 2031} {"train_loss": -6.232664108276367, "global_step": 85324, "epoch": 2031} {"train_loss": -6.183844566345215, "global_step": 85325, "epoch": 2031} {"train_loss": -6.202713966369629, "global_step": 85326, "epoch": 2031} {"train_loss": -6.122171401977539, "global_step": 85327, "epoch": 2031} {"train_loss": -6.233817100524902, "global_step": 85328, "epoch": 2031} {"train_loss": -6.232362270355225, "global_step": 85329, "epoch": 2031} {"train_loss": -6.148481369018555, "global_step": 85330, "epoch": 2031} {"train_loss": -6.145902633666992, "global_step": 85331, "epoch": 2031} {"train_loss": -6.135059833526611, "global_step": 85332, "epoch": 2031} {"train_loss": -6.19693660736084, "global_step": 85333, "epoch": 2031} {"train_loss": -6.226109504699707, "global_step": 85334, "epoch": 2031} {"train_loss": -6.078318119049072, "global_step": 85335, "epoch": 2031} {"train_loss": -6.150216579437256, "global_step": 85336, "epoch": 2031} {"train_loss": -6.1236772537231445, "global_step": 85337, "epoch": 2031} {"train_loss": -6.28262996673584, "global_step": 85338, "epoch": 2031} {"train_loss": -6.137965202331543, "global_step": 85339, "epoch": 2031} {"train_loss": -6.187422752380371, "global_step": 85340, "epoch": 2031} {"train_loss": -6.190859794616699, "global_step": 85341, "epoch": 2031} {"train_loss": -6.1534271240234375, "global_step": 85342, "epoch": 2031} {"train_loss": -6.1937978494734995, "global_step": 85343, "epoch": 2031, "val_loss": 75219.125} {"train_loss": -6.312905311584473, "global_step": 85344, "epoch": 2032} {"train_loss": -6.267690181732178, "global_step": 85345, "epoch": 2032} {"train_loss": -6.17330265045166, "global_step": 85346, "epoch": 2032} {"train_loss": -6.1883673667907715, "global_step": 85347, "epoch": 2032} {"train_loss": -6.205977916717529, "global_step": 85348, "epoch": 2032} {"train_loss": -6.163765907287598, "global_step": 85349, "epoch": 2032} {"train_loss": -6.173943042755127, "global_step": 85350, "epoch": 2032} {"train_loss": -6.136284828186035, "global_step": 85351, "epoch": 2032} {"train_loss": -6.305948257446289, "global_step": 85352, "epoch": 2032} {"train_loss": -6.250935077667236, "global_step": 85353, "epoch": 2032} {"train_loss": -6.293937683105469, "global_step": 85354, "epoch": 2032} {"train_loss": -6.094933986663818, "global_step": 85355, "epoch": 2032} {"train_loss": -6.109736442565918, "global_step": 85356, "epoch": 2032} {"train_loss": -6.242404937744141, "global_step": 85357, "epoch": 2032} {"train_loss": -6.072439193725586, "global_step": 85358, "epoch": 2032} {"train_loss": -6.203675746917725, "global_step": 85359, "epoch": 2032} {"train_loss": -6.112310409545898, "global_step": 85360, "epoch": 2032} {"train_loss": -6.251099586486816, "global_step": 85361, "epoch": 2032} {"train_loss": -6.182797908782959, "global_step": 85362, "epoch": 2032} {"train_loss": -6.1179304122924805, "global_step": 85363, "epoch": 2032} {"train_loss": -6.214686393737793, "global_step": 85364, "epoch": 2032} {"train_loss": -6.1809844970703125, "global_step": 85365, "epoch": 2032} {"train_loss": -6.075784206390381, "global_step": 85366, "epoch": 2032} {"train_loss": -6.225503921508789, "global_step": 85367, "epoch": 2032} {"train_loss": -6.150280475616455, "global_step": 85368, "epoch": 2032} {"train_loss": -6.104811668395996, "global_step": 85369, "epoch": 2032} {"train_loss": -6.255898952484131, "global_step": 85370, "epoch": 2032} {"train_loss": -6.108294486999512, "global_step": 85371, "epoch": 2032} {"train_loss": -6.138282299041748, "global_step": 85372, "epoch": 2032} {"train_loss": -6.202426910400391, "global_step": 85373, "epoch": 2032} {"train_loss": -6.186431407928467, "global_step": 85374, "epoch": 2032} {"train_loss": -6.220202445983887, "global_step": 85375, "epoch": 2032} {"train_loss": -6.199448585510254, "global_step": 85376, "epoch": 2032} {"train_loss": -6.235865592956543, "global_step": 85377, "epoch": 2032} {"train_loss": -6.229099273681641, "global_step": 85378, "epoch": 2032} {"train_loss": -6.25752067565918, "global_step": 85379, "epoch": 2032} {"train_loss": -6.169439792633057, "global_step": 85380, "epoch": 2032} {"train_loss": -6.196089744567871, "global_step": 85381, "epoch": 2032} {"train_loss": -6.237833023071289, "global_step": 85382, "epoch": 2032} {"train_loss": -6.286356449127197, "global_step": 85383, "epoch": 2032} {"train_loss": -6.249370574951172, "global_step": 85384, "epoch": 2032} {"train_loss": -6.194467851093838, "global_step": 85385, "epoch": 2032, "val_loss": 75189.265625} {"train_loss": -6.148234844207764, "global_step": 85386, "epoch": 2033} {"train_loss": -6.331906795501709, "global_step": 85387, "epoch": 2033} {"train_loss": -6.123010635375977, "global_step": 85388, "epoch": 2033} {"train_loss": -6.201502323150635, "global_step": 85389, "epoch": 2033} {"train_loss": -6.199650764465332, "global_step": 85390, "epoch": 2033} {"train_loss": -6.151762962341309, "global_step": 85391, "epoch": 2033} {"train_loss": -6.070775985717773, "global_step": 85392, "epoch": 2033} {"train_loss": -6.30684757232666, "global_step": 85393, "epoch": 2033} {"train_loss": -6.1811628341674805, "global_step": 85394, "epoch": 2033} {"train_loss": -6.261775016784668, "global_step": 85395, "epoch": 2033} {"train_loss": -6.128068923950195, "global_step": 85396, "epoch": 2033} {"train_loss": -6.219107627868652, "global_step": 85397, "epoch": 2033} {"train_loss": -6.1163434982299805, "global_step": 85398, "epoch": 2033} {"train_loss": -6.170036792755127, "global_step": 85399, "epoch": 2033} {"train_loss": -6.162594318389893, "global_step": 85400, "epoch": 2033} {"train_loss": -6.103300094604492, "global_step": 85401, "epoch": 2033} {"train_loss": -6.063969135284424, "global_step": 85402, "epoch": 2033} {"train_loss": -6.251468658447266, "global_step": 85403, "epoch": 2033} {"train_loss": -6.075604438781738, "global_step": 85404, "epoch": 2033} {"train_loss": -6.174452781677246, "global_step": 85405, "epoch": 2033} {"train_loss": -6.164633750915527, "global_step": 85406, "epoch": 2033} {"train_loss": -6.033261775970459, "global_step": 85407, "epoch": 2033} {"train_loss": -6.242450714111328, "global_step": 85408, "epoch": 2033} {"train_loss": -6.139997482299805, "global_step": 85409, "epoch": 2033} {"train_loss": -6.150358200073242, "global_step": 85410, "epoch": 2033} {"train_loss": -6.173409461975098, "global_step": 85411, "epoch": 2033} {"train_loss": -6.156428337097168, "global_step": 85412, "epoch": 2033} {"train_loss": -6.211814880371094, "global_step": 85413, "epoch": 2033} {"train_loss": -6.143487930297852, "global_step": 85414, "epoch": 2033} {"train_loss": -6.106296539306641, "global_step": 85415, "epoch": 2033} {"train_loss": -6.2468109130859375, "global_step": 85416, "epoch": 2033} {"train_loss": -6.120400905609131, "global_step": 85417, "epoch": 2033} {"train_loss": -6.2219038009643555, "global_step": 85418, "epoch": 2033} {"train_loss": -6.1971306800842285, "global_step": 85419, "epoch": 2033} {"train_loss": -6.269367218017578, "global_step": 85420, "epoch": 2033} {"train_loss": -6.234980583190918, "global_step": 85421, "epoch": 2033} {"train_loss": -6.155529975891113, "global_step": 85422, "epoch": 2033} {"train_loss": -6.041896820068359, "global_step": 85423, "epoch": 2033} {"train_loss": -6.0393781661987305, "global_step": 85424, "epoch": 2033} {"train_loss": -6.156118392944336, "global_step": 85425, "epoch": 2033} {"train_loss": -6.246421813964844, "global_step": 85426, "epoch": 2033} {"train_loss": -6.16601730528332, "global_step": 85427, "epoch": 2033, "val_loss": 75309.453125} {"train_loss": -6.247971534729004, "global_step": 85428, "epoch": 2034} {"train_loss": -6.1017889976501465, "global_step": 85429, "epoch": 2034} {"train_loss": -6.09475040435791, "global_step": 85430, "epoch": 2034} {"train_loss": -6.320955276489258, "global_step": 85431, "epoch": 2034} {"train_loss": -6.086271286010742, "global_step": 85432, "epoch": 2034} {"train_loss": -6.168893814086914, "global_step": 85433, "epoch": 2034} {"train_loss": -6.108525276184082, "global_step": 85434, "epoch": 2034} {"train_loss": -6.232477188110352, "global_step": 85435, "epoch": 2034} {"train_loss": -6.2414374351501465, "global_step": 85436, "epoch": 2034} {"train_loss": -6.214025974273682, "global_step": 85437, "epoch": 2034} {"train_loss": -6.128465175628662, "global_step": 85438, "epoch": 2034} {"train_loss": -6.269504547119141, "global_step": 85439, "epoch": 2034} {"train_loss": -6.176361560821533, "global_step": 85440, "epoch": 2034} {"train_loss": -6.1140851974487305, "global_step": 85441, "epoch": 2034} {"train_loss": -6.224262237548828, "global_step": 85442, "epoch": 2034} {"train_loss": -6.152478218078613, "global_step": 85443, "epoch": 2034} {"train_loss": -6.0387067794799805, "global_step": 85444, "epoch": 2034} {"train_loss": -6.149433135986328, "global_step": 85445, "epoch": 2034} {"train_loss": -6.249171257019043, "global_step": 85446, "epoch": 2034} {"train_loss": -6.157695770263672, "global_step": 85447, "epoch": 2034} {"train_loss": -6.225432395935059, "global_step": 85448, "epoch": 2034} {"train_loss": -6.171813011169434, "global_step": 85449, "epoch": 2034} {"train_loss": -6.221088409423828, "global_step": 85450, "epoch": 2034} {"train_loss": -6.118445873260498, "global_step": 85451, "epoch": 2034} {"train_loss": -6.107641696929932, "global_step": 85452, "epoch": 2034} {"train_loss": -6.209107398986816, "global_step": 85453, "epoch": 2034} {"train_loss": -6.086214542388916, "global_step": 85454, "epoch": 2034} {"train_loss": -6.069365501403809, "global_step": 85455, "epoch": 2034} {"train_loss": -6.137454032897949, "global_step": 85456, "epoch": 2034} {"train_loss": -6.1574811935424805, "global_step": 85457, "epoch": 2034} {"train_loss": -6.142239570617676, "global_step": 85458, "epoch": 2034} {"train_loss": -6.296407222747803, "global_step": 85459, "epoch": 2034} {"train_loss": -6.165740013122559, "global_step": 85460, "epoch": 2034} {"train_loss": -6.173340797424316, "global_step": 85461, "epoch": 2034} {"train_loss": -6.226248264312744, "global_step": 85462, "epoch": 2034} {"train_loss": -6.181214332580566, "global_step": 85463, "epoch": 2034} {"train_loss": -6.341396808624268, "global_step": 85464, "epoch": 2034} {"train_loss": -6.26326847076416, "global_step": 85465, "epoch": 2034} {"train_loss": -6.140677452087402, "global_step": 85466, "epoch": 2034} {"train_loss": -6.125391960144043, "global_step": 85467, "epoch": 2034} {"train_loss": -6.151554107666016, "global_step": 85468, "epoch": 2034} {"train_loss": -6.175092538197835, "global_step": 85469, "epoch": 2034, "val_loss": 75374.4453125} {"train_loss": -6.06577205657959, "global_step": 85470, "epoch": 2035} {"train_loss": -6.195155143737793, "global_step": 85471, "epoch": 2035} {"train_loss": -6.1277666091918945, "global_step": 85472, "epoch": 2035} {"train_loss": -6.002940654754639, "global_step": 85473, "epoch": 2035} {"train_loss": -6.135636329650879, "global_step": 85474, "epoch": 2035} {"train_loss": -6.090600967407227, "global_step": 85475, "epoch": 2035} {"train_loss": -6.218895435333252, "global_step": 85476, "epoch": 2035} {"train_loss": -6.265923500061035, "global_step": 85477, "epoch": 2035} {"train_loss": -6.100691318511963, "global_step": 85478, "epoch": 2035} {"train_loss": -6.047806739807129, "global_step": 85479, "epoch": 2035} {"train_loss": -6.118946075439453, "global_step": 85480, "epoch": 2035} {"train_loss": -6.0469889640808105, "global_step": 85481, "epoch": 2035} {"train_loss": -6.065194129943848, "global_step": 85482, "epoch": 2035} {"train_loss": -6.268618583679199, "global_step": 85483, "epoch": 2035} {"train_loss": -6.078545570373535, "global_step": 85484, "epoch": 2035} {"train_loss": -6.231431007385254, "global_step": 85485, "epoch": 2035} {"train_loss": -6.157115936279297, "global_step": 85486, "epoch": 2035} {"train_loss": -6.177572250366211, "global_step": 85487, "epoch": 2035} {"train_loss": -6.216983795166016, "global_step": 85488, "epoch": 2035} {"train_loss": -6.280370712280273, "global_step": 85489, "epoch": 2035} {"train_loss": -6.085943222045898, "global_step": 85490, "epoch": 2035} {"train_loss": -6.18039608001709, "global_step": 85491, "epoch": 2035} {"train_loss": -6.1076250076293945, "global_step": 85492, "epoch": 2035} {"train_loss": -6.165720462799072, "global_step": 85493, "epoch": 2035} {"train_loss": -6.143581390380859, "global_step": 85494, "epoch": 2035} {"train_loss": -6.191740036010742, "global_step": 85495, "epoch": 2035} {"train_loss": -6.096690654754639, "global_step": 85496, "epoch": 2035} {"train_loss": -6.2349114418029785, "global_step": 85497, "epoch": 2035} {"train_loss": -6.260982990264893, "global_step": 85498, "epoch": 2035} {"train_loss": -6.2491455078125, "global_step": 85499, "epoch": 2035} {"train_loss": -6.252099990844727, "global_step": 85500, "epoch": 2035} {"train_loss": -6.248941421508789, "global_step": 85501, "epoch": 2035} {"train_loss": -6.208740711212158, "global_step": 85502, "epoch": 2035} {"train_loss": -6.249767303466797, "global_step": 85503, "epoch": 2035} {"train_loss": -6.26098108291626, "global_step": 85504, "epoch": 2035} {"train_loss": -6.300810813903809, "global_step": 85505, "epoch": 2035} {"train_loss": -6.1850786209106445, "global_step": 85506, "epoch": 2035} {"train_loss": -6.097711086273193, "global_step": 85507, "epoch": 2035} {"train_loss": -6.245153427124023, "global_step": 85508, "epoch": 2035} {"train_loss": -6.202554702758789, "global_step": 85509, "epoch": 2035} {"train_loss": -6.146627902984619, "global_step": 85510, "epoch": 2035} {"train_loss": -6.171938283102853, "global_step": 85511, "epoch": 2035, "val_loss": 75043.5625} {"train_loss": -6.13959264755249, "global_step": 85512, "epoch": 2036} {"train_loss": -6.175449371337891, "global_step": 85513, "epoch": 2036} {"train_loss": -6.159205436706543, "global_step": 85514, "epoch": 2036} {"train_loss": -6.20062255859375, "global_step": 85515, "epoch": 2036} {"train_loss": -6.1721649169921875, "global_step": 85516, "epoch": 2036} {"train_loss": -6.233890533447266, "global_step": 85517, "epoch": 2036} {"train_loss": -6.077653884887695, "global_step": 85518, "epoch": 2036} {"train_loss": -6.078402042388916, "global_step": 85519, "epoch": 2036} {"train_loss": -6.182626247406006, "global_step": 85520, "epoch": 2036} {"train_loss": -6.112271308898926, "global_step": 85521, "epoch": 2036} {"train_loss": -6.155148029327393, "global_step": 85522, "epoch": 2036} {"train_loss": -6.164039611816406, "global_step": 85523, "epoch": 2036} {"train_loss": -6.220686435699463, "global_step": 85524, "epoch": 2036} {"train_loss": -6.254148006439209, "global_step": 85525, "epoch": 2036} {"train_loss": -6.157644271850586, "global_step": 85526, "epoch": 2036} {"train_loss": -6.211802005767822, "global_step": 85527, "epoch": 2036} {"train_loss": -6.347421169281006, "global_step": 85528, "epoch": 2036} {"train_loss": -6.097976207733154, "global_step": 85529, "epoch": 2036} {"train_loss": -6.1511125564575195, "global_step": 85530, "epoch": 2036} {"train_loss": -6.190334796905518, "global_step": 85531, "epoch": 2036} {"train_loss": -6.195032596588135, "global_step": 85532, "epoch": 2036} {"train_loss": -6.202337265014648, "global_step": 85533, "epoch": 2036} {"train_loss": -6.277904033660889, "global_step": 85534, "epoch": 2036} {"train_loss": -6.159578323364258, "global_step": 85535, "epoch": 2036} {"train_loss": -6.21619176864624, "global_step": 85536, "epoch": 2036} {"train_loss": -6.221949100494385, "global_step": 85537, "epoch": 2036} {"train_loss": -6.095912933349609, "global_step": 85538, "epoch": 2036} {"train_loss": -6.298177719116211, "global_step": 85539, "epoch": 2036} {"train_loss": -6.236677169799805, "global_step": 85540, "epoch": 2036} {"train_loss": -6.214088439941406, "global_step": 85541, "epoch": 2036} {"train_loss": -6.204214096069336, "global_step": 85542, "epoch": 2036} {"train_loss": -6.254074573516846, "global_step": 85543, "epoch": 2036} {"train_loss": -6.230051040649414, "global_step": 85544, "epoch": 2036} {"train_loss": -6.121927738189697, "global_step": 85545, "epoch": 2036} {"train_loss": -6.19366455078125, "global_step": 85546, "epoch": 2036} {"train_loss": -6.11540412902832, "global_step": 85547, "epoch": 2036} {"train_loss": -6.237908840179443, "global_step": 85548, "epoch": 2036} {"train_loss": -6.2241082191467285, "global_step": 85549, "epoch": 2036} {"train_loss": -6.101600646972656, "global_step": 85550, "epoch": 2036} {"train_loss": -6.2535529136657715, "global_step": 85551, "epoch": 2036} {"train_loss": -6.089324474334717, "global_step": 85552, "epoch": 2036} {"train_loss": -6.184104669661749, "global_step": 85553, "epoch": 2036, "val_loss": 75166.890625} {"train_loss": -6.151036739349365, "global_step": 85554, "epoch": 2037} {"train_loss": -6.142647743225098, "global_step": 85555, "epoch": 2037} {"train_loss": -6.235167503356934, "global_step": 85556, "epoch": 2037} {"train_loss": -6.09615421295166, "global_step": 85557, "epoch": 2037} {"train_loss": -6.072597980499268, "global_step": 85558, "epoch": 2037} {"train_loss": -6.187832832336426, "global_step": 85559, "epoch": 2037} {"train_loss": -6.164853096008301, "global_step": 85560, "epoch": 2037} {"train_loss": -6.229030132293701, "global_step": 85561, "epoch": 2037} {"train_loss": -6.336526870727539, "global_step": 85562, "epoch": 2037} {"train_loss": -6.231678009033203, "global_step": 85563, "epoch": 2037} {"train_loss": -6.252187728881836, "global_step": 85564, "epoch": 2037} {"train_loss": -6.327702522277832, "global_step": 85565, "epoch": 2037} {"train_loss": -6.119840145111084, "global_step": 85566, "epoch": 2037} {"train_loss": -6.220451354980469, "global_step": 85567, "epoch": 2037} {"train_loss": -6.197395324707031, "global_step": 85568, "epoch": 2037} {"train_loss": -6.120510101318359, "global_step": 85569, "epoch": 2037} {"train_loss": -6.291277885437012, "global_step": 85570, "epoch": 2037} {"train_loss": -6.1546196937561035, "global_step": 85571, "epoch": 2037} {"train_loss": -6.163763999938965, "global_step": 85572, "epoch": 2037} {"train_loss": -6.090371131896973, "global_step": 85573, "epoch": 2037} {"train_loss": -6.086809158325195, "global_step": 85574, "epoch": 2037} {"train_loss": -6.125025749206543, "global_step": 85575, "epoch": 2037} {"train_loss": -6.0632734298706055, "global_step": 85576, "epoch": 2037} {"train_loss": -6.200468063354492, "global_step": 85577, "epoch": 2037} {"train_loss": -6.069003105163574, "global_step": 85578, "epoch": 2037} {"train_loss": -6.1171464920043945, "global_step": 85579, "epoch": 2037} {"train_loss": -6.125438690185547, "global_step": 85580, "epoch": 2037} {"train_loss": -6.118538856506348, "global_step": 85581, "epoch": 2037} {"train_loss": -6.211137294769287, "global_step": 85582, "epoch": 2037} {"train_loss": -6.1851420402526855, "global_step": 85583, "epoch": 2037} {"train_loss": -6.07159423828125, "global_step": 85584, "epoch": 2037} {"train_loss": -6.258666038513184, "global_step": 85585, "epoch": 2037} {"train_loss": -6.189479827880859, "global_step": 85586, "epoch": 2037} {"train_loss": -6.23840856552124, "global_step": 85587, "epoch": 2037} {"train_loss": -6.174500942230225, "global_step": 85588, "epoch": 2037} {"train_loss": -6.024422645568848, "global_step": 85589, "epoch": 2037} {"train_loss": -6.223600387573242, "global_step": 85590, "epoch": 2037} {"train_loss": -6.102023124694824, "global_step": 85591, "epoch": 2037} {"train_loss": -6.198798179626465, "global_step": 85592, "epoch": 2037} {"train_loss": -6.180120468139648, "global_step": 85593, "epoch": 2037} {"train_loss": -6.175010681152344, "global_step": 85594, "epoch": 2037} {"train_loss": -6.169548000608172, "global_step": 85595, "epoch": 2037, "val_loss": 74889.5} {"train_loss": -6.148408889770508, "global_step": 85596, "epoch": 2038} {"train_loss": -6.161612033843994, "global_step": 85597, "epoch": 2038} {"train_loss": -6.144249439239502, "global_step": 85598, "epoch": 2038} {"train_loss": -6.102438449859619, "global_step": 85599, "epoch": 2038} {"train_loss": -6.248325824737549, "global_step": 85600, "epoch": 2038} {"train_loss": -6.239194869995117, "global_step": 85601, "epoch": 2038} {"train_loss": -6.163507461547852, "global_step": 85602, "epoch": 2038} {"train_loss": -6.160908222198486, "global_step": 85603, "epoch": 2038} {"train_loss": -6.264782905578613, "global_step": 85604, "epoch": 2038} {"train_loss": -6.361354827880859, "global_step": 85605, "epoch": 2038} {"train_loss": -6.228287696838379, "global_step": 85606, "epoch": 2038} {"train_loss": -6.253750801086426, "global_step": 85607, "epoch": 2038} {"train_loss": -6.314377307891846, "global_step": 85608, "epoch": 2038} {"train_loss": -6.182727336883545, "global_step": 85609, "epoch": 2038} {"train_loss": -6.308876991271973, "global_step": 85610, "epoch": 2038} {"train_loss": -6.27933406829834, "global_step": 85611, "epoch": 2038} {"train_loss": -6.127295017242432, "global_step": 85612, "epoch": 2038} {"train_loss": -6.112462043762207, "global_step": 85613, "epoch": 2038} {"train_loss": -6.087291717529297, "global_step": 85614, "epoch": 2038} {"train_loss": -6.276556968688965, "global_step": 85615, "epoch": 2038} {"train_loss": -6.187492370605469, "global_step": 85616, "epoch": 2038} {"train_loss": -6.234141826629639, "global_step": 85617, "epoch": 2038} {"train_loss": -6.193451881408691, "global_step": 85618, "epoch": 2038} {"train_loss": -6.217225074768066, "global_step": 85619, "epoch": 2038} {"train_loss": -6.279224395751953, "global_step": 85620, "epoch": 2038} {"train_loss": -6.185464859008789, "global_step": 85621, "epoch": 2038} {"train_loss": -6.148130416870117, "global_step": 85622, "epoch": 2038} {"train_loss": -6.092994689941406, "global_step": 85623, "epoch": 2038} {"train_loss": -6.167250633239746, "global_step": 85624, "epoch": 2038} {"train_loss": -6.160319805145264, "global_step": 85625, "epoch": 2038} {"train_loss": -6.108774185180664, "global_step": 85626, "epoch": 2038} {"train_loss": -6.039585590362549, "global_step": 85627, "epoch": 2038} {"train_loss": -6.283137798309326, "global_step": 85628, "epoch": 2038} {"train_loss": -6.133413314819336, "global_step": 85629, "epoch": 2038} {"train_loss": -6.10739803314209, "global_step": 85630, "epoch": 2038} {"train_loss": -6.12191915512085, "global_step": 85631, "epoch": 2038} {"train_loss": -6.202981948852539, "global_step": 85632, "epoch": 2038} {"train_loss": -6.167392730712891, "global_step": 85633, "epoch": 2038} {"train_loss": -6.226353645324707, "global_step": 85634, "epoch": 2038} {"train_loss": -6.224937438964844, "global_step": 85635, "epoch": 2038} {"train_loss": -6.139773368835449, "global_step": 85636, "epoch": 2038} {"train_loss": -6.191927977970669, "global_step": 85637, "epoch": 2038, "val_loss": 75466.7734375} {"train_loss": -6.104841232299805, "global_step": 85638, "epoch": 2039} {"train_loss": -6.2272844314575195, "global_step": 85639, "epoch": 2039} {"train_loss": -6.090069770812988, "global_step": 85640, "epoch": 2039} {"train_loss": -6.261061668395996, "global_step": 85641, "epoch": 2039} {"train_loss": -6.137758255004883, "global_step": 85642, "epoch": 2039} {"train_loss": -6.200990676879883, "global_step": 85643, "epoch": 2039} {"train_loss": -6.108133792877197, "global_step": 85644, "epoch": 2039} {"train_loss": -6.105809688568115, "global_step": 85645, "epoch": 2039} {"train_loss": -6.133800506591797, "global_step": 85646, "epoch": 2039} {"train_loss": -6.2351179122924805, "global_step": 85647, "epoch": 2039} {"train_loss": -6.272090435028076, "global_step": 85648, "epoch": 2039} {"train_loss": -6.088754653930664, "global_step": 85649, "epoch": 2039} {"train_loss": -6.185877799987793, "global_step": 85650, "epoch": 2039} {"train_loss": -6.18382453918457, "global_step": 85651, "epoch": 2039} {"train_loss": -6.196878433227539, "global_step": 85652, "epoch": 2039} {"train_loss": -6.225893020629883, "global_step": 85653, "epoch": 2039} {"train_loss": -6.193753242492676, "global_step": 85654, "epoch": 2039} {"train_loss": -6.119932174682617, "global_step": 85655, "epoch": 2039} {"train_loss": -6.180027008056641, "global_step": 85656, "epoch": 2039} {"train_loss": -6.168464183807373, "global_step": 85657, "epoch": 2039} {"train_loss": -6.1539154052734375, "global_step": 85658, "epoch": 2039} {"train_loss": -6.277894020080566, "global_step": 85659, "epoch": 2039} {"train_loss": -6.150014400482178, "global_step": 85660, "epoch": 2039} {"train_loss": -6.206205368041992, "global_step": 85661, "epoch": 2039} {"train_loss": -6.323639392852783, "global_step": 85662, "epoch": 2039} {"train_loss": -6.2197442054748535, "global_step": 85663, "epoch": 2039} {"train_loss": -6.065752029418945, "global_step": 85664, "epoch": 2039} {"train_loss": -6.121272087097168, "global_step": 85665, "epoch": 2039} {"train_loss": -6.233358383178711, "global_step": 85666, "epoch": 2039} {"train_loss": -6.081320285797119, "global_step": 85667, "epoch": 2039} {"train_loss": -6.083527088165283, "global_step": 85668, "epoch": 2039} {"train_loss": -6.158855438232422, "global_step": 85669, "epoch": 2039} {"train_loss": -6.1902971267700195, "global_step": 85670, "epoch": 2039} {"train_loss": -6.206058502197266, "global_step": 85671, "epoch": 2039} {"train_loss": -6.119659423828125, "global_step": 85672, "epoch": 2039} {"train_loss": -6.109617233276367, "global_step": 85673, "epoch": 2039} {"train_loss": -6.303601264953613, "global_step": 85674, "epoch": 2039} {"train_loss": -6.184590816497803, "global_step": 85675, "epoch": 2039} {"train_loss": -6.242063522338867, "global_step": 85676, "epoch": 2039} {"train_loss": -6.214942455291748, "global_step": 85677, "epoch": 2039} {"train_loss": -6.122012138366699, "global_step": 85678, "epoch": 2039} {"train_loss": -6.176778202965146, "global_step": 85679, "epoch": 2039, "val_loss": 75221.421875} {"train_loss": -6.08329439163208, "global_step": 85680, "epoch": 2040} {"train_loss": -6.24241828918457, "global_step": 85681, "epoch": 2040} {"train_loss": -6.198136329650879, "global_step": 85682, "epoch": 2040} {"train_loss": -6.212184906005859, "global_step": 85683, "epoch": 2040} {"train_loss": -6.24940299987793, "global_step": 85684, "epoch": 2040} {"train_loss": -6.276780128479004, "global_step": 85685, "epoch": 2040} {"train_loss": -6.2641401290893555, "global_step": 85686, "epoch": 2040} {"train_loss": -6.23809814453125, "global_step": 85687, "epoch": 2040} {"train_loss": -6.2474846839904785, "global_step": 85688, "epoch": 2040} {"train_loss": -6.328207015991211, "global_step": 85689, "epoch": 2040} {"train_loss": -6.144674301147461, "global_step": 85690, "epoch": 2040} {"train_loss": -6.214153289794922, "global_step": 85691, "epoch": 2040} {"train_loss": -6.112419128417969, "global_step": 85692, "epoch": 2040} {"train_loss": -6.211735725402832, "global_step": 85693, "epoch": 2040} {"train_loss": -6.226256847381592, "global_step": 85694, "epoch": 2040} {"train_loss": -6.121208667755127, "global_step": 85695, "epoch": 2040} {"train_loss": -6.194557189941406, "global_step": 85696, "epoch": 2040} {"train_loss": -6.097203731536865, "global_step": 85697, "epoch": 2040} {"train_loss": -6.28413724899292, "global_step": 85698, "epoch": 2040} {"train_loss": -6.1833343505859375, "global_step": 85699, "epoch": 2040} {"train_loss": -6.139490127563477, "global_step": 85700, "epoch": 2040} {"train_loss": -6.245485305786133, "global_step": 85701, "epoch": 2040} {"train_loss": -6.229044437408447, "global_step": 85702, "epoch": 2040} {"train_loss": -6.227921485900879, "global_step": 85703, "epoch": 2040} {"train_loss": -6.209688186645508, "global_step": 85704, "epoch": 2040} {"train_loss": -6.207749366760254, "global_step": 85705, "epoch": 2040} {"train_loss": -6.276632308959961, "global_step": 85706, "epoch": 2040} {"train_loss": -6.024014472961426, "global_step": 85707, "epoch": 2040} {"train_loss": -6.258370876312256, "global_step": 85708, "epoch": 2040} {"train_loss": -6.189698696136475, "global_step": 85709, "epoch": 2040} {"train_loss": -6.285490989685059, "global_step": 85710, "epoch": 2040} {"train_loss": -6.24868106842041, "global_step": 85711, "epoch": 2040} {"train_loss": -6.155956268310547, "global_step": 85712, "epoch": 2040} {"train_loss": -6.164953231811523, "global_step": 85713, "epoch": 2040} {"train_loss": -6.2612762451171875, "global_step": 85714, "epoch": 2040} {"train_loss": -6.185009002685547, "global_step": 85715, "epoch": 2040} {"train_loss": -6.306589126586914, "global_step": 85716, "epoch": 2040} {"train_loss": -6.139979839324951, "global_step": 85717, "epoch": 2040} {"train_loss": -6.241084098815918, "global_step": 85718, "epoch": 2040} {"train_loss": -6.343711853027344, "global_step": 85719, "epoch": 2040} {"train_loss": -6.108180999755859, "global_step": 85720, "epoch": 2040} {"train_loss": -6.209175598053705, "global_step": 85721, "epoch": 2040, "val_loss": 75190.578125} {"train_loss": -6.148810386657715, "global_step": 85722, "epoch": 2041} {"train_loss": -6.224782943725586, "global_step": 85723, "epoch": 2041} {"train_loss": -6.1826395988464355, "global_step": 85724, "epoch": 2041} {"train_loss": -6.127355575561523, "global_step": 85725, "epoch": 2041} {"train_loss": -6.253829002380371, "global_step": 85726, "epoch": 2041} {"train_loss": -6.145029067993164, "global_step": 85727, "epoch": 2041} {"train_loss": -6.2286057472229, "global_step": 85728, "epoch": 2041} {"train_loss": -6.185647964477539, "global_step": 85729, "epoch": 2041} {"train_loss": -6.125262260437012, "global_step": 85730, "epoch": 2041} {"train_loss": -6.195379257202148, "global_step": 85731, "epoch": 2041} {"train_loss": -6.123067855834961, "global_step": 85732, "epoch": 2041} {"train_loss": -6.185148239135742, "global_step": 85733, "epoch": 2041} {"train_loss": -6.24483585357666, "global_step": 85734, "epoch": 2041} {"train_loss": -6.270564079284668, "global_step": 85735, "epoch": 2041} {"train_loss": -6.234890937805176, "global_step": 85736, "epoch": 2041} {"train_loss": -6.186357021331787, "global_step": 85737, "epoch": 2041} {"train_loss": -6.185526371002197, "global_step": 85738, "epoch": 2041} {"train_loss": -6.225278854370117, "global_step": 85739, "epoch": 2041} {"train_loss": -6.218160629272461, "global_step": 85740, "epoch": 2041} {"train_loss": -6.237583160400391, "global_step": 85741, "epoch": 2041} {"train_loss": -6.155378341674805, "global_step": 85742, "epoch": 2041} {"train_loss": -6.224037170410156, "global_step": 85743, "epoch": 2041} {"train_loss": -6.115156173706055, "global_step": 85744, "epoch": 2041} {"train_loss": -6.121905326843262, "global_step": 85745, "epoch": 2041} {"train_loss": -6.213094711303711, "global_step": 85746, "epoch": 2041} {"train_loss": -6.1889519691467285, "global_step": 85747, "epoch": 2041} {"train_loss": -6.062161445617676, "global_step": 85748, "epoch": 2041} {"train_loss": -6.155589580535889, "global_step": 85749, "epoch": 2041} {"train_loss": -6.224238872528076, "global_step": 85750, "epoch": 2041} {"train_loss": -6.126847267150879, "global_step": 85751, "epoch": 2041} {"train_loss": -6.2032084465026855, "global_step": 85752, "epoch": 2041} {"train_loss": -6.245907783508301, "global_step": 85753, "epoch": 2041} {"train_loss": -6.036001205444336, "global_step": 85754, "epoch": 2041} {"train_loss": -6.222985744476318, "global_step": 85755, "epoch": 2041} {"train_loss": -6.108922004699707, "global_step": 85756, "epoch": 2041} {"train_loss": -6.214110374450684, "global_step": 85757, "epoch": 2041} {"train_loss": -6.24920654296875, "global_step": 85758, "epoch": 2041} {"train_loss": -6.147290229797363, "global_step": 85759, "epoch": 2041} {"train_loss": -6.241004943847656, "global_step": 85760, "epoch": 2041} {"train_loss": -6.262604713439941, "global_step": 85761, "epoch": 2041} {"train_loss": -6.17926025390625, "global_step": 85762, "epoch": 2041} {"train_loss": -6.185763063884917, "global_step": 85763, "epoch": 2041, "val_loss": 75990.6640625} {"train_loss": -6.043183326721191, "global_step": 85764, "epoch": 2042} {"train_loss": -6.205727577209473, "global_step": 85765, "epoch": 2042} {"train_loss": -6.193819046020508, "global_step": 85766, "epoch": 2042} {"train_loss": -6.158560276031494, "global_step": 85767, "epoch": 2042} {"train_loss": -6.148092269897461, "global_step": 85768, "epoch": 2042} {"train_loss": -6.254914283752441, "global_step": 85769, "epoch": 2042} {"train_loss": -6.20694637298584, "global_step": 85770, "epoch": 2042} {"train_loss": -6.09676456451416, "global_step": 85771, "epoch": 2042} {"train_loss": -6.141200065612793, "global_step": 85772, "epoch": 2042} {"train_loss": -6.1503801345825195, "global_step": 85773, "epoch": 2042} {"train_loss": -6.116878509521484, "global_step": 85774, "epoch": 2042} {"train_loss": -6.111718654632568, "global_step": 85775, "epoch": 2042} {"train_loss": -6.183018684387207, "global_step": 85776, "epoch": 2042} {"train_loss": -6.140194892883301, "global_step": 85777, "epoch": 2042} {"train_loss": -6.205026626586914, "global_step": 85778, "epoch": 2042} {"train_loss": -6.275676250457764, "global_step": 85779, "epoch": 2042} {"train_loss": -6.105775356292725, "global_step": 85780, "epoch": 2042} {"train_loss": -6.167274475097656, "global_step": 85781, "epoch": 2042} {"train_loss": -6.196903228759766, "global_step": 85782, "epoch": 2042} {"train_loss": -6.192806243896484, "global_step": 85783, "epoch": 2042} {"train_loss": -6.215963363647461, "global_step": 85784, "epoch": 2042} {"train_loss": -6.161502838134766, "global_step": 85785, "epoch": 2042} {"train_loss": -6.268448829650879, "global_step": 85786, "epoch": 2042} {"train_loss": -6.189871788024902, "global_step": 85787, "epoch": 2042} {"train_loss": -6.113773345947266, "global_step": 85788, "epoch": 2042} {"train_loss": -6.104816436767578, "global_step": 85789, "epoch": 2042} {"train_loss": -6.2061076164245605, "global_step": 85790, "epoch": 2042} {"train_loss": -6.063692092895508, "global_step": 85791, "epoch": 2042} {"train_loss": -6.133694648742676, "global_step": 85792, "epoch": 2042} {"train_loss": -6.189154624938965, "global_step": 85793, "epoch": 2042} {"train_loss": -6.077821731567383, "global_step": 85794, "epoch": 2042} {"train_loss": -6.137687683105469, "global_step": 85795, "epoch": 2042} {"train_loss": -6.182476043701172, "global_step": 85796, "epoch": 2042} {"train_loss": -6.039741516113281, "global_step": 85797, "epoch": 2042} {"train_loss": -6.2433905601501465, "global_step": 85798, "epoch": 2042} {"train_loss": -6.201898574829102, "global_step": 85799, "epoch": 2042} {"train_loss": -6.224330425262451, "global_step": 85800, "epoch": 2042} {"train_loss": -6.213426113128662, "global_step": 85801, "epoch": 2042} {"train_loss": -6.083117485046387, "global_step": 85802, "epoch": 2042} {"train_loss": -6.175177574157715, "global_step": 85803, "epoch": 2042} {"train_loss": -6.094969749450684, "global_step": 85804, "epoch": 2042} {"train_loss": -6.163633142198835, "global_step": 85805, "epoch": 2042, "val_loss": 75030.8046875} {"train_loss": -6.124199867248535, "global_step": 85806, "epoch": 2043} {"train_loss": -6.137947082519531, "global_step": 85807, "epoch": 2043} {"train_loss": -6.195285797119141, "global_step": 85808, "epoch": 2043} {"train_loss": -6.170206069946289, "global_step": 85809, "epoch": 2043} {"train_loss": -6.130386829376221, "global_step": 85810, "epoch": 2043} {"train_loss": -6.244548797607422, "global_step": 85811, "epoch": 2043} {"train_loss": -6.274110317230225, "global_step": 85812, "epoch": 2043} {"train_loss": -6.238913536071777, "global_step": 85813, "epoch": 2043} {"train_loss": -6.3607587814331055, "global_step": 85814, "epoch": 2043} {"train_loss": -6.144049644470215, "global_step": 85815, "epoch": 2043} {"train_loss": -6.127123832702637, "global_step": 85816, "epoch": 2043} {"train_loss": -6.3398942947387695, "global_step": 85817, "epoch": 2043} {"train_loss": -6.146039009094238, "global_step": 85818, "epoch": 2043} {"train_loss": -6.3465657234191895, "global_step": 85819, "epoch": 2043} {"train_loss": -6.133908271789551, "global_step": 85820, "epoch": 2043} {"train_loss": -6.136641979217529, "global_step": 85821, "epoch": 2043} {"train_loss": -6.31397008895874, "global_step": 85822, "epoch": 2043} {"train_loss": -6.154702663421631, "global_step": 85823, "epoch": 2043} {"train_loss": -6.212249279022217, "global_step": 85824, "epoch": 2043} {"train_loss": -6.350218772888184, "global_step": 85825, "epoch": 2043} {"train_loss": -6.254368305206299, "global_step": 85826, "epoch": 2043} {"train_loss": -6.198428630828857, "global_step": 85827, "epoch": 2043} {"train_loss": -6.259545803070068, "global_step": 85828, "epoch": 2043} {"train_loss": -6.233538627624512, "global_step": 85829, "epoch": 2043} {"train_loss": -6.0865912437438965, "global_step": 85830, "epoch": 2043} {"train_loss": -6.170679092407227, "global_step": 85831, "epoch": 2043} {"train_loss": -6.06450891494751, "global_step": 85832, "epoch": 2043} {"train_loss": -6.405640602111816, "global_step": 85833, "epoch": 2043} {"train_loss": -6.237846374511719, "global_step": 85834, "epoch": 2043} {"train_loss": -6.219666481018066, "global_step": 85835, "epoch": 2043} {"train_loss": -6.228823184967041, "global_step": 85836, "epoch": 2043} {"train_loss": -6.221768379211426, "global_step": 85837, "epoch": 2043} {"train_loss": -6.268512725830078, "global_step": 85838, "epoch": 2043} {"train_loss": -6.232544898986816, "global_step": 85839, "epoch": 2043} {"train_loss": -6.300712585449219, "global_step": 85840, "epoch": 2043} {"train_loss": -6.150711536407471, "global_step": 85841, "epoch": 2043} {"train_loss": -6.1905436515808105, "global_step": 85842, "epoch": 2043} {"train_loss": -6.298654556274414, "global_step": 85843, "epoch": 2043} {"train_loss": -6.163938045501709, "global_step": 85844, "epoch": 2043} {"train_loss": -6.175554275512695, "global_step": 85845, "epoch": 2043} {"train_loss": -6.069118499755859, "global_step": 85846, "epoch": 2043} {"train_loss": -6.213789792287917, "global_step": 85847, "epoch": 2043, "val_loss": 75398.84375} {"train_loss": -6.093604564666748, "global_step": 85848, "epoch": 2044} {"train_loss": -6.268873691558838, "global_step": 85849, "epoch": 2044} {"train_loss": -6.240530014038086, "global_step": 85850, "epoch": 2044} {"train_loss": -6.093565940856934, "global_step": 85851, "epoch": 2044} {"train_loss": -6.195234298706055, "global_step": 85852, "epoch": 2044} {"train_loss": -6.090584754943848, "global_step": 85853, "epoch": 2044} {"train_loss": -6.20925235748291, "global_step": 85854, "epoch": 2044} {"train_loss": -6.283679008483887, "global_step": 85855, "epoch": 2044} {"train_loss": -6.184205532073975, "global_step": 85856, "epoch": 2044} {"train_loss": -6.129611492156982, "global_step": 85857, "epoch": 2044} {"train_loss": -6.221324920654297, "global_step": 85858, "epoch": 2044} {"train_loss": -6.147279739379883, "global_step": 85859, "epoch": 2044} {"train_loss": -6.196967601776123, "global_step": 85860, "epoch": 2044} {"train_loss": -6.160765647888184, "global_step": 85861, "epoch": 2044} {"train_loss": -6.165389060974121, "global_step": 85862, "epoch": 2044} {"train_loss": -6.275049209594727, "global_step": 85863, "epoch": 2044} {"train_loss": -6.264613151550293, "global_step": 85864, "epoch": 2044} {"train_loss": -6.093116760253906, "global_step": 85865, "epoch": 2044} {"train_loss": -6.197683334350586, "global_step": 85866, "epoch": 2044} {"train_loss": -6.181881904602051, "global_step": 85867, "epoch": 2044} {"train_loss": -6.170231342315674, "global_step": 85868, "epoch": 2044} {"train_loss": -6.228899955749512, "global_step": 85869, "epoch": 2044} {"train_loss": -6.194141387939453, "global_step": 85870, "epoch": 2044} {"train_loss": -6.215420722961426, "global_step": 85871, "epoch": 2044} {"train_loss": -6.237238883972168, "global_step": 85872, "epoch": 2044} {"train_loss": -6.136420249938965, "global_step": 85873, "epoch": 2044} {"train_loss": -6.307521343231201, "global_step": 85874, "epoch": 2044} {"train_loss": -6.139416694641113, "global_step": 85875, "epoch": 2044} {"train_loss": -6.254509449005127, "global_step": 85876, "epoch": 2044} {"train_loss": -6.282580852508545, "global_step": 85877, "epoch": 2044} {"train_loss": -6.307014465332031, "global_step": 85878, "epoch": 2044} {"train_loss": -6.42213249206543, "global_step": 85879, "epoch": 2044} {"train_loss": -6.220898628234863, "global_step": 85880, "epoch": 2044} {"train_loss": -6.276128768920898, "global_step": 85881, "epoch": 2044} {"train_loss": -6.172389984130859, "global_step": 85882, "epoch": 2044} {"train_loss": -6.143346786499023, "global_step": 85883, "epoch": 2044} {"train_loss": -6.243643760681152, "global_step": 85884, "epoch": 2044} {"train_loss": -6.252260208129883, "global_step": 85885, "epoch": 2044} {"train_loss": -6.238300800323486, "global_step": 85886, "epoch": 2044} {"train_loss": -6.147643089294434, "global_step": 85887, "epoch": 2044} {"train_loss": -6.265525817871094, "global_step": 85888, "epoch": 2044} {"train_loss": -6.210301104046049, "global_step": 85889, "epoch": 2044, "val_loss": 75195.78125} {"train_loss": -6.149279594421387, "global_step": 85890, "epoch": 2045} {"train_loss": -6.173434734344482, "global_step": 85891, "epoch": 2045} {"train_loss": -6.242263317108154, "global_step": 85892, "epoch": 2045} {"train_loss": -6.213007926940918, "global_step": 85893, "epoch": 2045} {"train_loss": -6.259325981140137, "global_step": 85894, "epoch": 2045} {"train_loss": -6.197932720184326, "global_step": 85895, "epoch": 2045} {"train_loss": -6.210237503051758, "global_step": 85896, "epoch": 2045} {"train_loss": -6.179498672485352, "global_step": 85897, "epoch": 2045} {"train_loss": -6.130511283874512, "global_step": 85898, "epoch": 2045} {"train_loss": -6.14143180847168, "global_step": 85899, "epoch": 2045} {"train_loss": -6.102053642272949, "global_step": 85900, "epoch": 2045} {"train_loss": -6.211454391479492, "global_step": 85901, "epoch": 2045} {"train_loss": -6.075355529785156, "global_step": 85902, "epoch": 2045} {"train_loss": -6.235634803771973, "global_step": 85903, "epoch": 2045} {"train_loss": -6.170321464538574, "global_step": 85904, "epoch": 2045} {"train_loss": -6.157922744750977, "global_step": 85905, "epoch": 2045} {"train_loss": -6.21987771987915, "global_step": 85906, "epoch": 2045} {"train_loss": -6.119490623474121, "global_step": 85907, "epoch": 2045} {"train_loss": -6.0957136154174805, "global_step": 85908, "epoch": 2045} {"train_loss": -6.215099334716797, "global_step": 85909, "epoch": 2045} {"train_loss": -6.253352642059326, "global_step": 85910, "epoch": 2045} {"train_loss": -6.209078311920166, "global_step": 85911, "epoch": 2045} {"train_loss": -6.265318870544434, "global_step": 85912, "epoch": 2045} {"train_loss": -6.131566047668457, "global_step": 85913, "epoch": 2045} {"train_loss": -6.225564956665039, "global_step": 85914, "epoch": 2045} {"train_loss": -6.228664875030518, "global_step": 85915, "epoch": 2045} {"train_loss": -6.130887985229492, "global_step": 85916, "epoch": 2045} {"train_loss": -6.1441650390625, "global_step": 85917, "epoch": 2045} {"train_loss": -6.1420745849609375, "global_step": 85918, "epoch": 2045} {"train_loss": -6.163545608520508, "global_step": 85919, "epoch": 2045} {"train_loss": -6.159922122955322, "global_step": 85920, "epoch": 2045} {"train_loss": -6.279848575592041, "global_step": 85921, "epoch": 2045} {"train_loss": -6.127007484436035, "global_step": 85922, "epoch": 2045} {"train_loss": -6.35172176361084, "global_step": 85923, "epoch": 2045} {"train_loss": -6.170738220214844, "global_step": 85924, "epoch": 2045} {"train_loss": -6.238556861877441, "global_step": 85925, "epoch": 2045} {"train_loss": -6.281464099884033, "global_step": 85926, "epoch": 2045} {"train_loss": -6.166029453277588, "global_step": 85927, "epoch": 2045} {"train_loss": -6.250580787658691, "global_step": 85928, "epoch": 2045} {"train_loss": -6.086642265319824, "global_step": 85929, "epoch": 2045} {"train_loss": -6.271177768707275, "global_step": 85930, "epoch": 2045} {"train_loss": -6.190338622956049, "global_step": 85931, "epoch": 2045, "val_loss": 75195.8125} {"train_loss": -6.209476470947266, "global_step": 85932, "epoch": 2046} {"train_loss": -6.186610698699951, "global_step": 85933, "epoch": 2046} {"train_loss": -6.346014976501465, "global_step": 85934, "epoch": 2046} {"train_loss": -6.271462440490723, "global_step": 85935, "epoch": 2046} {"train_loss": -6.157597064971924, "global_step": 85936, "epoch": 2046} {"train_loss": -6.258479118347168, "global_step": 85937, "epoch": 2046} {"train_loss": -6.2647705078125, "global_step": 85938, "epoch": 2046} {"train_loss": -6.221786975860596, "global_step": 85939, "epoch": 2046} {"train_loss": -6.191247463226318, "global_step": 85940, "epoch": 2046} {"train_loss": -6.275447845458984, "global_step": 85941, "epoch": 2046} {"train_loss": -6.252671718597412, "global_step": 85942, "epoch": 2046} {"train_loss": -6.185649871826172, "global_step": 85943, "epoch": 2046} {"train_loss": -6.205162048339844, "global_step": 85944, "epoch": 2046} {"train_loss": -6.183358669281006, "global_step": 85945, "epoch": 2046} {"train_loss": -6.259632110595703, "global_step": 85946, "epoch": 2046} {"train_loss": -6.233890533447266, "global_step": 85947, "epoch": 2046} {"train_loss": -6.141300201416016, "global_step": 85948, "epoch": 2046} {"train_loss": -6.33514404296875, "global_step": 85949, "epoch": 2046} {"train_loss": -6.2397260665893555, "global_step": 85950, "epoch": 2046} {"train_loss": -6.162313461303711, "global_step": 85951, "epoch": 2046} {"train_loss": -6.25447416305542, "global_step": 85952, "epoch": 2046} {"train_loss": -6.199554443359375, "global_step": 85953, "epoch": 2046} {"train_loss": -6.2346601486206055, "global_step": 85954, "epoch": 2046} {"train_loss": -6.183030605316162, "global_step": 85955, "epoch": 2046} {"train_loss": -6.132851600646973, "global_step": 85956, "epoch": 2046} {"train_loss": -6.073577880859375, "global_step": 85957, "epoch": 2046} {"train_loss": -6.191883087158203, "global_step": 85958, "epoch": 2046} {"train_loss": -6.308306694030762, "global_step": 85959, "epoch": 2046} {"train_loss": -6.2030930519104, "global_step": 85960, "epoch": 2046} {"train_loss": -6.156838893890381, "global_step": 85961, "epoch": 2046} {"train_loss": -6.227407932281494, "global_step": 85962, "epoch": 2046} {"train_loss": -6.152118682861328, "global_step": 85963, "epoch": 2046} {"train_loss": -6.280176162719727, "global_step": 85964, "epoch": 2046} {"train_loss": -6.166398048400879, "global_step": 85965, "epoch": 2046} {"train_loss": -6.186631202697754, "global_step": 85966, "epoch": 2046} {"train_loss": -6.174339771270752, "global_step": 85967, "epoch": 2046} {"train_loss": -6.214973449707031, "global_step": 85968, "epoch": 2046} {"train_loss": -6.166855812072754, "global_step": 85969, "epoch": 2046} {"train_loss": -6.197739124298096, "global_step": 85970, "epoch": 2046} {"train_loss": -6.100996494293213, "global_step": 85971, "epoch": 2046} {"train_loss": -5.999544143676758, "global_step": 85972, "epoch": 2046} {"train_loss": -6.205500852494013, "global_step": 85973, "epoch": 2046, "val_loss": 75226.28125} {"train_loss": -6.232030391693115, "global_step": 85974, "epoch": 2047} {"train_loss": -6.194910049438477, "global_step": 85975, "epoch": 2047} {"train_loss": -6.20552396774292, "global_step": 85976, "epoch": 2047} {"train_loss": -6.097998142242432, "global_step": 85977, "epoch": 2047} {"train_loss": -6.2238922119140625, "global_step": 85978, "epoch": 2047} {"train_loss": -6.162396430969238, "global_step": 85979, "epoch": 2047} {"train_loss": -6.146394729614258, "global_step": 85980, "epoch": 2047} {"train_loss": -6.249185562133789, "global_step": 85981, "epoch": 2047} {"train_loss": -6.23854923248291, "global_step": 85982, "epoch": 2047} {"train_loss": -6.222286701202393, "global_step": 85983, "epoch": 2047} {"train_loss": -6.27506685256958, "global_step": 85984, "epoch": 2047} {"train_loss": -6.162465572357178, "global_step": 85985, "epoch": 2047} {"train_loss": -6.249162673950195, "global_step": 85986, "epoch": 2047} {"train_loss": -6.298327445983887, "global_step": 85987, "epoch": 2047} {"train_loss": -6.159751892089844, "global_step": 85988, "epoch": 2047} {"train_loss": -6.161634922027588, "global_step": 85989, "epoch": 2047} {"train_loss": -6.0692901611328125, "global_step": 85990, "epoch": 2047} {"train_loss": -6.0637006759643555, "global_step": 85991, "epoch": 2047} {"train_loss": -6.199553489685059, "global_step": 85992, "epoch": 2047} {"train_loss": -6.139469146728516, "global_step": 85993, "epoch": 2047} {"train_loss": -6.0079755783081055, "global_step": 85994, "epoch": 2047} {"train_loss": -6.123016834259033, "global_step": 85995, "epoch": 2047} {"train_loss": -6.157628059387207, "global_step": 85996, "epoch": 2047} {"train_loss": -6.102883338928223, "global_step": 85997, "epoch": 2047} {"train_loss": -6.070990085601807, "global_step": 85998, "epoch": 2047} {"train_loss": -6.06117057800293, "global_step": 85999, "epoch": 2047} {"train_loss": -6.197053909301758, "global_step": 86000, "epoch": 2047} {"train_loss": -6.065051555633545, "global_step": 86001, "epoch": 2047} {"train_loss": -6.102603435516357, "global_step": 86002, "epoch": 2047} {"train_loss": -6.186654090881348, "global_step": 86003, "epoch": 2047} {"train_loss": -6.179043292999268, "global_step": 86004, "epoch": 2047} {"train_loss": -6.147843360900879, "global_step": 86005, "epoch": 2047} {"train_loss": -6.211057662963867, "global_step": 86006, "epoch": 2047} {"train_loss": -6.178962707519531, "global_step": 86007, "epoch": 2047} {"train_loss": -6.12330436706543, "global_step": 86008, "epoch": 2047} {"train_loss": -6.257421493530273, "global_step": 86009, "epoch": 2047} {"train_loss": -6.199763774871826, "global_step": 86010, "epoch": 2047} {"train_loss": -6.269198894500732, "global_step": 86011, "epoch": 2047} {"train_loss": -6.24640417098999, "global_step": 86012, "epoch": 2047} {"train_loss": -6.092293739318848, "global_step": 86013, "epoch": 2047} {"train_loss": -6.112309455871582, "global_step": 86014, "epoch": 2047} {"train_loss": -6.164541585104806, "global_step": 86015, "epoch": 2047, "val_loss": 75357.171875} {"train_loss": -5.992142200469971, "global_step": 86016, "epoch": 2048} {"train_loss": -6.2137346267700195, "global_step": 86017, "epoch": 2048} {"train_loss": -6.116466045379639, "global_step": 86018, "epoch": 2048} {"train_loss": -6.206809043884277, "global_step": 86019, "epoch": 2048} {"train_loss": -6.269679069519043, "global_step": 86020, "epoch": 2048} {"train_loss": -6.062492370605469, "global_step": 86021, "epoch": 2048} {"train_loss": -6.249711036682129, "global_step": 86022, "epoch": 2048} {"train_loss": -6.143551826477051, "global_step": 86023, "epoch": 2048} {"train_loss": -6.253117561340332, "global_step": 86024, "epoch": 2048} {"train_loss": -6.133406639099121, "global_step": 86025, "epoch": 2048} {"train_loss": -6.174630165100098, "global_step": 86026, "epoch": 2048} {"train_loss": -6.192083358764648, "global_step": 86027, "epoch": 2048} {"train_loss": -6.103864669799805, "global_step": 86028, "epoch": 2048} {"train_loss": -6.0383100509643555, "global_step": 86029, "epoch": 2048} {"train_loss": -6.176677227020264, "global_step": 86030, "epoch": 2048} {"train_loss": -6.082773208618164, "global_step": 86031, "epoch": 2048} {"train_loss": -6.16981315612793, "global_step": 86032, "epoch": 2048} {"train_loss": -6.086853981018066, "global_step": 86033, "epoch": 2048} {"train_loss": -6.136945724487305, "global_step": 86034, "epoch": 2048} {"train_loss": -6.093796253204346, "global_step": 86035, "epoch": 2048} {"train_loss": -6.271650314331055, "global_step": 86036, "epoch": 2048} {"train_loss": -6.150027275085449, "global_step": 86037, "epoch": 2048} {"train_loss": -6.236741065979004, "global_step": 86038, "epoch": 2048} {"train_loss": -6.194063663482666, "global_step": 86039, "epoch": 2048} {"train_loss": -6.108144283294678, "global_step": 86040, "epoch": 2048} {"train_loss": -6.208373069763184, "global_step": 86041, "epoch": 2048} {"train_loss": -6.2911224365234375, "global_step": 86042, "epoch": 2048} {"train_loss": -6.270386695861816, "global_step": 86043, "epoch": 2048} {"train_loss": -6.072909355163574, "global_step": 86044, "epoch": 2048} {"train_loss": -6.263404369354248, "global_step": 86045, "epoch": 2048} {"train_loss": -6.235087871551514, "global_step": 86046, "epoch": 2048} {"train_loss": -6.160492897033691, "global_step": 86047, "epoch": 2048} {"train_loss": -6.202730655670166, "global_step": 86048, "epoch": 2048} {"train_loss": -6.182198524475098, "global_step": 86049, "epoch": 2048} {"train_loss": -6.140193939208984, "global_step": 86050, "epoch": 2048} {"train_loss": -6.13897705078125, "global_step": 86051, "epoch": 2048} {"train_loss": -6.260151386260986, "global_step": 86052, "epoch": 2048} {"train_loss": -6.177016258239746, "global_step": 86053, "epoch": 2048} {"train_loss": -6.190179824829102, "global_step": 86054, "epoch": 2048} {"train_loss": -6.224852561950684, "global_step": 86055, "epoch": 2048} {"train_loss": -6.367624282836914, "global_step": 86056, "epoch": 2048} {"train_loss": -6.1778700578780406, "global_step": 86057, "epoch": 2048, "val_loss": 75526.859375} {"train_loss": -6.148930549621582, "global_step": 86058, "epoch": 2049} {"train_loss": -6.140843391418457, "global_step": 86059, "epoch": 2049} {"train_loss": -6.099191665649414, "global_step": 86060, "epoch": 2049} {"train_loss": -6.23132848739624, "global_step": 86061, "epoch": 2049} {"train_loss": -6.193449974060059, "global_step": 86062, "epoch": 2049} {"train_loss": -6.153398513793945, "global_step": 86063, "epoch": 2049} {"train_loss": -6.231023788452148, "global_step": 86064, "epoch": 2049} {"train_loss": -6.227995872497559, "global_step": 86065, "epoch": 2049} {"train_loss": -6.215319633483887, "global_step": 86066, "epoch": 2049} {"train_loss": -6.19182014465332, "global_step": 86067, "epoch": 2049} {"train_loss": -6.098795413970947, "global_step": 86068, "epoch": 2049} {"train_loss": -6.146520614624023, "global_step": 86069, "epoch": 2049} {"train_loss": -6.016059875488281, "global_step": 86070, "epoch": 2049} {"train_loss": -6.251824378967285, "global_step": 86071, "epoch": 2049} {"train_loss": -6.1527509689331055, "global_step": 86072, "epoch": 2049} {"train_loss": -6.196803092956543, "global_step": 86073, "epoch": 2049} {"train_loss": -6.223525047302246, "global_step": 86074, "epoch": 2049} {"train_loss": -6.260227203369141, "global_step": 86075, "epoch": 2049} {"train_loss": -6.102082252502441, "global_step": 86076, "epoch": 2049} {"train_loss": -6.105838775634766, "global_step": 86077, "epoch": 2049} {"train_loss": -6.2242231369018555, "global_step": 86078, "epoch": 2049} {"train_loss": -6.27315616607666, "global_step": 86079, "epoch": 2049} {"train_loss": -6.139684677124023, "global_step": 86080, "epoch": 2049} {"train_loss": -6.169384002685547, "global_step": 86081, "epoch": 2049} {"train_loss": -6.206000804901123, "global_step": 86082, "epoch": 2049} {"train_loss": -6.171221733093262, "global_step": 86083, "epoch": 2049} {"train_loss": -6.1641082763671875, "global_step": 86084, "epoch": 2049} {"train_loss": -6.285262584686279, "global_step": 86085, "epoch": 2049} {"train_loss": -6.324256896972656, "global_step": 86086, "epoch": 2049} {"train_loss": -6.270205497741699, "global_step": 86087, "epoch": 2049} {"train_loss": -6.22791862487793, "global_step": 86088, "epoch": 2049} {"train_loss": -6.184452056884766, "global_step": 86089, "epoch": 2049} {"train_loss": -6.272305965423584, "global_step": 86090, "epoch": 2049} {"train_loss": -6.204063415527344, "global_step": 86091, "epoch": 2049} {"train_loss": -6.24608850479126, "global_step": 86092, "epoch": 2049} {"train_loss": -6.1355671882629395, "global_step": 86093, "epoch": 2049} {"train_loss": -6.242227554321289, "global_step": 86094, "epoch": 2049} {"train_loss": -6.15634822845459, "global_step": 86095, "epoch": 2049} {"train_loss": -6.355258464813232, "global_step": 86096, "epoch": 2049} {"train_loss": -6.309922218322754, "global_step": 86097, "epoch": 2049} {"train_loss": -6.239073753356934, "global_step": 86098, "epoch": 2049} {"train_loss": -6.198514722642445, "global_step": 86099, "epoch": 2049, "val_loss": 75421.1328125} {"train_loss": -6.250344753265381, "global_step": 86100, "epoch": 2050} {"train_loss": -6.136241436004639, "global_step": 86101, "epoch": 2050} {"train_loss": -6.222589015960693, "global_step": 86102, "epoch": 2050} {"train_loss": -6.275444984436035, "global_step": 86103, "epoch": 2050} {"train_loss": -6.245940685272217, "global_step": 86104, "epoch": 2050} {"train_loss": -6.204043388366699, "global_step": 86105, "epoch": 2050} {"train_loss": -6.081920146942139, "global_step": 86106, "epoch": 2050} {"train_loss": -6.068617343902588, "global_step": 86107, "epoch": 2050} {"train_loss": -6.261564254760742, "global_step": 86108, "epoch": 2050} {"train_loss": -6.3426666259765625, "global_step": 86109, "epoch": 2050} {"train_loss": -6.112214088439941, "global_step": 86110, "epoch": 2050} {"train_loss": -6.1797332763671875, "global_step": 86111, "epoch": 2050} {"train_loss": -6.056151390075684, "global_step": 86112, "epoch": 2050} {"train_loss": -6.114203453063965, "global_step": 86113, "epoch": 2050} {"train_loss": -6.1376543045043945, "global_step": 86114, "epoch": 2050} {"train_loss": -6.028127670288086, "global_step": 86115, "epoch": 2050} {"train_loss": -6.144006252288818, "global_step": 86116, "epoch": 2050} {"train_loss": -6.189641952514648, "global_step": 86117, "epoch": 2050} {"train_loss": -6.15327262878418, "global_step": 86118, "epoch": 2050} {"train_loss": -6.177300453186035, "global_step": 86119, "epoch": 2050} {"train_loss": -6.223598480224609, "global_step": 86120, "epoch": 2050} {"train_loss": -6.141704559326172, "global_step": 86121, "epoch": 2050} {"train_loss": -6.151634216308594, "global_step": 86122, "epoch": 2050} {"train_loss": -6.236771583557129, "global_step": 86123, "epoch": 2050} {"train_loss": -6.165763854980469, "global_step": 86124, "epoch": 2050} {"train_loss": -6.107454299926758, "global_step": 86125, "epoch": 2050} {"train_loss": -6.194409370422363, "global_step": 86126, "epoch": 2050} {"train_loss": -6.112971305847168, "global_step": 86127, "epoch": 2050} {"train_loss": -6.323483467102051, "global_step": 86128, "epoch": 2050} {"train_loss": -6.202777862548828, "global_step": 86129, "epoch": 2050} {"train_loss": -6.213912010192871, "global_step": 86130, "epoch": 2050} {"train_loss": -6.092041015625, "global_step": 86131, "epoch": 2050} {"train_loss": -6.148265838623047, "global_step": 86132, "epoch": 2050} {"train_loss": -6.137998104095459, "global_step": 86133, "epoch": 2050} {"train_loss": -6.114088535308838, "global_step": 86134, "epoch": 2050} {"train_loss": -6.256263732910156, "global_step": 86135, "epoch": 2050} {"train_loss": -6.191733360290527, "global_step": 86136, "epoch": 2050} {"train_loss": -6.188344955444336, "global_step": 86137, "epoch": 2050} {"train_loss": -6.185016632080078, "global_step": 86138, "epoch": 2050} {"train_loss": -6.10022497177124, "global_step": 86139, "epoch": 2050} {"train_loss": -6.2335004806518555, "global_step": 86140, "epoch": 2050} {"train_loss": -6.173810811269851, "global_step": 86141, "epoch": 2050, "train/sim_max_reward_0": 0.3813509491822814, "train/sim_max_reward_1": 0.9308675549540314, "train/sim_max_reward_2": 0.6531456967827661, "train/sim_max_reward_3": 0.17402624483688756, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.7723855489500951, "test/sim_max_reward_4500000": 0.36502842914426714, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.5746167699392857, "test/sim_max_reward_4500003": 0.6847989826408128, "test/sim_max_reward_4500004": 0.8690109179122791, "test/sim_max_reward_4500005": 0.7177994570346472, "test/sim_max_reward_4500006": 0.880341381715876, "test/sim_max_reward_4500007": 0.9516265111881914, "test/sim_max_reward_4500008": 0.015477791191894151, "test/sim_max_reward_4500009": 0.2784458404306932, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.059829530371475606, "test/sim_max_reward_4500012": 0.018801599546271332, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.383233962322474, "test/sim_max_reward_4500015": 0.841322197934052, "test/sim_max_reward_4500016": 0.16371231711448184, "test/sim_max_reward_4500017": 0.16268765278655337, "test/sim_max_reward_4500018": 0.4036435764590088, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9609652429767435, "test/sim_max_reward_4500022": 1.0, "test/sim_max_reward_4500023": 0.9228170048106673, "test/sim_max_reward_4500024": 0.7734546037435989, "test/sim_max_reward_4500025": 0.0013672706443585165, "test/sim_max_reward_4500026": 0.9351251952560222, "test/sim_max_reward_4500027": 0.392558852275729, "test/sim_max_reward_4500028": 0.21876731629040275, "test/sim_max_reward_4500029": 0.11838383263571223, "test/sim_max_reward_4500030": 0.9490785275432273, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.15430069971016153, "test/sim_max_reward_4500033": 0.8258041333556804, "test/sim_max_reward_4500034": 0.8141230506195124, "test/sim_max_reward_4500035": 0.5267364768552345, "test/sim_max_reward_4500036": 0.44942947659464894, "test/sim_max_reward_4500037": 0.41575004540015753, "test/sim_max_reward_4500038": 0.8232266674790136, "test/sim_max_reward_4500039": 0.8541435718234394, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.927413727587491, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.1813366633525196, "test/sim_max_reward_4500044": 0.014048297186302326, "test/sim_max_reward_4500045": 0.4004825141630353, "test/sim_max_reward_4500046": 1.0, "test/sim_max_reward_4500047": 0.943976696127312, "test/sim_max_reward_4500048": 0.9558836543474556, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6519626657843436, "test/mean_score": 0.48693915428906875, "val_loss": 75159.9921875} {"train_loss": -6.174949645996094, "global_step": 86142, "epoch": 2051} {"train_loss": -6.264789581298828, "global_step": 86143, "epoch": 2051} {"train_loss": -6.166924953460693, "global_step": 86144, "epoch": 2051} {"train_loss": -6.216142654418945, "global_step": 86145, "epoch": 2051} {"train_loss": -6.2056403160095215, "global_step": 86146, "epoch": 2051} {"train_loss": -6.110105514526367, "global_step": 86147, "epoch": 2051} {"train_loss": -6.190212249755859, "global_step": 86148, "epoch": 2051} {"train_loss": -6.151594161987305, "global_step": 86149, "epoch": 2051} {"train_loss": -6.139911651611328, "global_step": 86150, "epoch": 2051} {"train_loss": -6.160033226013184, "global_step": 86151, "epoch": 2051} {"train_loss": -6.267689228057861, "global_step": 86152, "epoch": 2051} {"train_loss": -6.189709663391113, "global_step": 86153, "epoch": 2051} {"train_loss": -6.206568241119385, "global_step": 86154, "epoch": 2051} {"train_loss": -6.270700931549072, "global_step": 86155, "epoch": 2051} {"train_loss": -6.138994216918945, "global_step": 86156, "epoch": 2051} {"train_loss": -6.2019877433776855, "global_step": 86157, "epoch": 2051} {"train_loss": -6.230393409729004, "global_step": 86158, "epoch": 2051} {"train_loss": -6.110015869140625, "global_step": 86159, "epoch": 2051} {"train_loss": -6.241071701049805, "global_step": 86160, "epoch": 2051} {"train_loss": -6.200451850891113, "global_step": 86161, "epoch": 2051} {"train_loss": -6.265772819519043, "global_step": 86162, "epoch": 2051} {"train_loss": -6.18995475769043, "global_step": 86163, "epoch": 2051} {"train_loss": -6.220936298370361, "global_step": 86164, "epoch": 2051} {"train_loss": -6.269312858581543, "global_step": 86165, "epoch": 2051} {"train_loss": -6.216785430908203, "global_step": 86166, "epoch": 2051} {"train_loss": -6.186043739318848, "global_step": 86167, "epoch": 2051} {"train_loss": -6.108223915100098, "global_step": 86168, "epoch": 2051} {"train_loss": -6.127934455871582, "global_step": 86169, "epoch": 2051} {"train_loss": -6.167072296142578, "global_step": 86170, "epoch": 2051} {"train_loss": -6.161970138549805, "global_step": 86171, "epoch": 2051} {"train_loss": -6.121591091156006, "global_step": 86172, "epoch": 2051} {"train_loss": -6.231290817260742, "global_step": 86173, "epoch": 2051} {"train_loss": -6.167387008666992, "global_step": 86174, "epoch": 2051} {"train_loss": -6.120635986328125, "global_step": 86175, "epoch": 2051} {"train_loss": -6.27022647857666, "global_step": 86176, "epoch": 2051} {"train_loss": -6.216382026672363, "global_step": 86177, "epoch": 2051} {"train_loss": -6.150409698486328, "global_step": 86178, "epoch": 2051} {"train_loss": -6.146620750427246, "global_step": 86179, "epoch": 2051} {"train_loss": -6.195947647094727, "global_step": 86180, "epoch": 2051} {"train_loss": -6.212059020996094, "global_step": 86181, "epoch": 2051} {"train_loss": -6.231240272521973, "global_step": 86182, "epoch": 2051} {"train_loss": -6.191708632877895, "global_step": 86183, "epoch": 2051, "val_loss": 75411.125} {"train_loss": -6.105226516723633, "global_step": 86184, "epoch": 2052} {"train_loss": -6.144518852233887, "global_step": 86185, "epoch": 2052} {"train_loss": -6.173956871032715, "global_step": 86186, "epoch": 2052} {"train_loss": -6.221958160400391, "global_step": 86187, "epoch": 2052} {"train_loss": -6.152743816375732, "global_step": 86188, "epoch": 2052} {"train_loss": -6.152745246887207, "global_step": 86189, "epoch": 2052} {"train_loss": -6.165000915527344, "global_step": 86190, "epoch": 2052} {"train_loss": -6.155977249145508, "global_step": 86191, "epoch": 2052} {"train_loss": -6.194787979125977, "global_step": 86192, "epoch": 2052} {"train_loss": -6.267412185668945, "global_step": 86193, "epoch": 2052} {"train_loss": -6.115175247192383, "global_step": 86194, "epoch": 2052} {"train_loss": -6.132070064544678, "global_step": 86195, "epoch": 2052} {"train_loss": -6.106584548950195, "global_step": 86196, "epoch": 2052} {"train_loss": -6.0533223152160645, "global_step": 86197, "epoch": 2052} {"train_loss": -6.0749382972717285, "global_step": 86198, "epoch": 2052} {"train_loss": -6.036563873291016, "global_step": 86199, "epoch": 2052} {"train_loss": -6.163847923278809, "global_step": 86200, "epoch": 2052} {"train_loss": -6.25396728515625, "global_step": 86201, "epoch": 2052} {"train_loss": -6.129052639007568, "global_step": 86202, "epoch": 2052} {"train_loss": -6.06015682220459, "global_step": 86203, "epoch": 2052} {"train_loss": -6.146374702453613, "global_step": 86204, "epoch": 2052} {"train_loss": -6.123849868774414, "global_step": 86205, "epoch": 2052} {"train_loss": -6.143902778625488, "global_step": 86206, "epoch": 2052} {"train_loss": -6.304163932800293, "global_step": 86207, "epoch": 2052} {"train_loss": -6.200128078460693, "global_step": 86208, "epoch": 2052} {"train_loss": -5.978912830352783, "global_step": 86209, "epoch": 2052} {"train_loss": -6.235160827636719, "global_step": 86210, "epoch": 2052} {"train_loss": -6.154359340667725, "global_step": 86211, "epoch": 2052} {"train_loss": -6.1631083488464355, "global_step": 86212, "epoch": 2052} {"train_loss": -6.164185047149658, "global_step": 86213, "epoch": 2052} {"train_loss": -6.189896106719971, "global_step": 86214, "epoch": 2052} {"train_loss": -6.295110702514648, "global_step": 86215, "epoch": 2052} {"train_loss": -6.235011100769043, "global_step": 86216, "epoch": 2052} {"train_loss": -6.0720720291137695, "global_step": 86217, "epoch": 2052} {"train_loss": -6.266014575958252, "global_step": 86218, "epoch": 2052} {"train_loss": -6.244756698608398, "global_step": 86219, "epoch": 2052} {"train_loss": -6.232778072357178, "global_step": 86220, "epoch": 2052} {"train_loss": -6.356875419616699, "global_step": 86221, "epoch": 2052} {"train_loss": -6.170144557952881, "global_step": 86222, "epoch": 2052} {"train_loss": -6.22905969619751, "global_step": 86223, "epoch": 2052} {"train_loss": -6.243205547332764, "global_step": 86224, "epoch": 2052} {"train_loss": -6.171820538384574, "global_step": 86225, "epoch": 2052, "val_loss": 75129.3359375} {"train_loss": -6.191152572631836, "global_step": 86226, "epoch": 2053} {"train_loss": -6.257054328918457, "global_step": 86227, "epoch": 2053} {"train_loss": -6.2340898513793945, "global_step": 86228, "epoch": 2053} {"train_loss": -6.238397598266602, "global_step": 86229, "epoch": 2053} {"train_loss": -6.282979965209961, "global_step": 86230, "epoch": 2053} {"train_loss": -6.199395656585693, "global_step": 86231, "epoch": 2053} {"train_loss": -6.335140228271484, "global_step": 86232, "epoch": 2053} {"train_loss": -6.245889663696289, "global_step": 86233, "epoch": 2053} {"train_loss": -6.295884609222412, "global_step": 86234, "epoch": 2053} {"train_loss": -6.2661333084106445, "global_step": 86235, "epoch": 2053} {"train_loss": -6.261514186859131, "global_step": 86236, "epoch": 2053} {"train_loss": -6.152132034301758, "global_step": 86237, "epoch": 2053} {"train_loss": -6.13267707824707, "global_step": 86238, "epoch": 2053} {"train_loss": -6.199075698852539, "global_step": 86239, "epoch": 2053} {"train_loss": -6.132955074310303, "global_step": 86240, "epoch": 2053} {"train_loss": -6.276907920837402, "global_step": 86241, "epoch": 2053} {"train_loss": -6.2681450843811035, "global_step": 86242, "epoch": 2053} {"train_loss": -6.084867477416992, "global_step": 86243, "epoch": 2053} {"train_loss": -6.262275695800781, "global_step": 86244, "epoch": 2053} {"train_loss": -6.155455589294434, "global_step": 86245, "epoch": 2053} {"train_loss": -6.252989768981934, "global_step": 86246, "epoch": 2053} {"train_loss": -6.256020545959473, "global_step": 86247, "epoch": 2053} {"train_loss": -6.158441066741943, "global_step": 86248, "epoch": 2053} {"train_loss": -6.283151149749756, "global_step": 86249, "epoch": 2053} {"train_loss": -6.077535152435303, "global_step": 86250, "epoch": 2053} {"train_loss": -6.193880081176758, "global_step": 86251, "epoch": 2053} {"train_loss": -6.177126884460449, "global_step": 86252, "epoch": 2053} {"train_loss": -6.168583869934082, "global_step": 86253, "epoch": 2053} {"train_loss": -6.067965507507324, "global_step": 86254, "epoch": 2053} {"train_loss": -6.151320457458496, "global_step": 86255, "epoch": 2053} {"train_loss": -6.197669506072998, "global_step": 86256, "epoch": 2053} {"train_loss": -6.034435272216797, "global_step": 86257, "epoch": 2053} {"train_loss": -6.130152702331543, "global_step": 86258, "epoch": 2053} {"train_loss": -6.170238018035889, "global_step": 86259, "epoch": 2053} {"train_loss": -6.176848411560059, "global_step": 86260, "epoch": 2053} {"train_loss": -6.216568946838379, "global_step": 86261, "epoch": 2053} {"train_loss": -6.153112411499023, "global_step": 86262, "epoch": 2053} {"train_loss": -6.342576503753662, "global_step": 86263, "epoch": 2053} {"train_loss": -6.238003253936768, "global_step": 86264, "epoch": 2053} {"train_loss": -6.18149471282959, "global_step": 86265, "epoch": 2053} {"train_loss": -6.220178127288818, "global_step": 86266, "epoch": 2053} {"train_loss": -6.202607711156209, "global_step": 86267, "epoch": 2053, "val_loss": 75146.4453125} {"train_loss": -6.220602035522461, "global_step": 86268, "epoch": 2054} {"train_loss": -6.295641899108887, "global_step": 86269, "epoch": 2054} {"train_loss": -6.193285942077637, "global_step": 86270, "epoch": 2054} {"train_loss": -6.199058532714844, "global_step": 86271, "epoch": 2054} {"train_loss": -6.166093826293945, "global_step": 86272, "epoch": 2054} {"train_loss": -6.3546462059021, "global_step": 86273, "epoch": 2054} {"train_loss": -6.132758617401123, "global_step": 86274, "epoch": 2054} {"train_loss": -6.2821364402771, "global_step": 86275, "epoch": 2054} {"train_loss": -6.196049690246582, "global_step": 86276, "epoch": 2054} {"train_loss": -6.356564521789551, "global_step": 86277, "epoch": 2054} {"train_loss": -6.20067024230957, "global_step": 86278, "epoch": 2054} {"train_loss": -6.118162155151367, "global_step": 86279, "epoch": 2054} {"train_loss": -6.275352478027344, "global_step": 86280, "epoch": 2054} {"train_loss": -6.273778915405273, "global_step": 86281, "epoch": 2054} {"train_loss": -6.319632053375244, "global_step": 86282, "epoch": 2054} {"train_loss": -6.245916366577148, "global_step": 86283, "epoch": 2054} {"train_loss": -6.224452018737793, "global_step": 86284, "epoch": 2054} {"train_loss": -6.198094367980957, "global_step": 86285, "epoch": 2054} {"train_loss": -6.185597896575928, "global_step": 86286, "epoch": 2054} {"train_loss": -6.145378112792969, "global_step": 86287, "epoch": 2054} {"train_loss": -6.144942760467529, "global_step": 86288, "epoch": 2054} {"train_loss": -6.209388732910156, "global_step": 86289, "epoch": 2054} {"train_loss": -6.177984237670898, "global_step": 86290, "epoch": 2054} {"train_loss": -6.285213470458984, "global_step": 86291, "epoch": 2054} {"train_loss": -6.258228302001953, "global_step": 86292, "epoch": 2054} {"train_loss": -6.1523027420043945, "global_step": 86293, "epoch": 2054} {"train_loss": -6.113825798034668, "global_step": 86294, "epoch": 2054} {"train_loss": -6.232009410858154, "global_step": 86295, "epoch": 2054} {"train_loss": -6.13178014755249, "global_step": 86296, "epoch": 2054} {"train_loss": -6.089786529541016, "global_step": 86297, "epoch": 2054} {"train_loss": -6.246803283691406, "global_step": 86298, "epoch": 2054} {"train_loss": -6.209200382232666, "global_step": 86299, "epoch": 2054} {"train_loss": -6.154698848724365, "global_step": 86300, "epoch": 2054} {"train_loss": -6.138021469116211, "global_step": 86301, "epoch": 2054} {"train_loss": -6.037424087524414, "global_step": 86302, "epoch": 2054} {"train_loss": -6.227621078491211, "global_step": 86303, "epoch": 2054} {"train_loss": -5.987645149230957, "global_step": 86304, "epoch": 2054} {"train_loss": -6.069240093231201, "global_step": 86305, "epoch": 2054} {"train_loss": -6.18236780166626, "global_step": 86306, "epoch": 2054} {"train_loss": -6.000001907348633, "global_step": 86307, "epoch": 2054} {"train_loss": -6.1294145584106445, "global_step": 86308, "epoch": 2054} {"train_loss": -6.1909495535350985, "global_step": 86309, "epoch": 2054, "val_loss": 75375.8125} {"train_loss": -6.046498775482178, "global_step": 86310, "epoch": 2055} {"train_loss": -6.053253650665283, "global_step": 86311, "epoch": 2055} {"train_loss": -6.18010139465332, "global_step": 86312, "epoch": 2055} {"train_loss": -6.283604621887207, "global_step": 86313, "epoch": 2055} {"train_loss": -6.077258586883545, "global_step": 86314, "epoch": 2055} {"train_loss": -6.157420635223389, "global_step": 86315, "epoch": 2055} {"train_loss": -6.239890098571777, "global_step": 86316, "epoch": 2055} {"train_loss": -6.026157379150391, "global_step": 86317, "epoch": 2055} {"train_loss": -6.2454023361206055, "global_step": 86318, "epoch": 2055} {"train_loss": -6.140616416931152, "global_step": 86319, "epoch": 2055} {"train_loss": -6.259514331817627, "global_step": 86320, "epoch": 2055} {"train_loss": -6.194201946258545, "global_step": 86321, "epoch": 2055} {"train_loss": -6.050811767578125, "global_step": 86322, "epoch": 2055} {"train_loss": -6.091626167297363, "global_step": 86323, "epoch": 2055} {"train_loss": -6.136042594909668, "global_step": 86324, "epoch": 2055} {"train_loss": -6.036458969116211, "global_step": 86325, "epoch": 2055} {"train_loss": -6.079858303070068, "global_step": 86326, "epoch": 2055} {"train_loss": -6.10685396194458, "global_step": 86327, "epoch": 2055} {"train_loss": -6.188825607299805, "global_step": 86328, "epoch": 2055} {"train_loss": -6.181103706359863, "global_step": 86329, "epoch": 2055} {"train_loss": -6.319352149963379, "global_step": 86330, "epoch": 2055} {"train_loss": -6.02622652053833, "global_step": 86331, "epoch": 2055} {"train_loss": -6.128061294555664, "global_step": 86332, "epoch": 2055} {"train_loss": -6.2482757568359375, "global_step": 86333, "epoch": 2055} {"train_loss": -6.135279655456543, "global_step": 86334, "epoch": 2055} {"train_loss": -6.246025085449219, "global_step": 86335, "epoch": 2055} {"train_loss": -6.178694725036621, "global_step": 86336, "epoch": 2055} {"train_loss": -6.196588039398193, "global_step": 86337, "epoch": 2055} {"train_loss": -6.260773181915283, "global_step": 86338, "epoch": 2055} {"train_loss": -6.128695964813232, "global_step": 86339, "epoch": 2055} {"train_loss": -6.282303810119629, "global_step": 86340, "epoch": 2055} {"train_loss": -6.18327522277832, "global_step": 86341, "epoch": 2055} {"train_loss": -6.163735389709473, "global_step": 86342, "epoch": 2055} {"train_loss": -6.221919536590576, "global_step": 86343, "epoch": 2055} {"train_loss": -6.138251304626465, "global_step": 86344, "epoch": 2055} {"train_loss": -6.227505683898926, "global_step": 86345, "epoch": 2055} {"train_loss": -6.120832443237305, "global_step": 86346, "epoch": 2055} {"train_loss": -6.128499984741211, "global_step": 86347, "epoch": 2055} {"train_loss": -6.184206962585449, "global_step": 86348, "epoch": 2055} {"train_loss": -6.188206195831299, "global_step": 86349, "epoch": 2055} {"train_loss": -6.225522041320801, "global_step": 86350, "epoch": 2055} {"train_loss": -6.16505301566351, "global_step": 86351, "epoch": 2055, "val_loss": 75334.0234375} {"train_loss": -6.2325215339660645, "global_step": 86352, "epoch": 2056} {"train_loss": -6.112125396728516, "global_step": 86353, "epoch": 2056} {"train_loss": -6.184082508087158, "global_step": 86354, "epoch": 2056} {"train_loss": -6.247290134429932, "global_step": 86355, "epoch": 2056} {"train_loss": -6.1407470703125, "global_step": 86356, "epoch": 2056} {"train_loss": -6.212663650512695, "global_step": 86357, "epoch": 2056} {"train_loss": -6.309202194213867, "global_step": 86358, "epoch": 2056} {"train_loss": -6.200295448303223, "global_step": 86359, "epoch": 2056} {"train_loss": -6.17025089263916, "global_step": 86360, "epoch": 2056} {"train_loss": -6.1873674392700195, "global_step": 86361, "epoch": 2056} {"train_loss": -6.241212844848633, "global_step": 86362, "epoch": 2056} {"train_loss": -6.200349807739258, "global_step": 86363, "epoch": 2056} {"train_loss": -6.099405288696289, "global_step": 86364, "epoch": 2056} {"train_loss": -6.153288841247559, "global_step": 86365, "epoch": 2056} {"train_loss": -6.050958633422852, "global_step": 86366, "epoch": 2056} {"train_loss": -6.275823593139648, "global_step": 86367, "epoch": 2056} {"train_loss": -6.185486316680908, "global_step": 86368, "epoch": 2056} {"train_loss": -6.067044258117676, "global_step": 86369, "epoch": 2056} {"train_loss": -6.218791484832764, "global_step": 86370, "epoch": 2056} {"train_loss": -6.065540790557861, "global_step": 86371, "epoch": 2056} {"train_loss": -6.242444038391113, "global_step": 86372, "epoch": 2056} {"train_loss": -6.148900032043457, "global_step": 86373, "epoch": 2056} {"train_loss": -6.261689186096191, "global_step": 86374, "epoch": 2056} {"train_loss": -6.093079566955566, "global_step": 86375, "epoch": 2056} {"train_loss": -6.035500526428223, "global_step": 86376, "epoch": 2056} {"train_loss": -6.192484378814697, "global_step": 86377, "epoch": 2056} {"train_loss": -6.143891334533691, "global_step": 86378, "epoch": 2056} {"train_loss": -6.171775817871094, "global_step": 86379, "epoch": 2056} {"train_loss": -6.14599609375, "global_step": 86380, "epoch": 2056} {"train_loss": -6.227351188659668, "global_step": 86381, "epoch": 2056} {"train_loss": -6.1702446937561035, "global_step": 86382, "epoch": 2056} {"train_loss": -6.212559223175049, "global_step": 86383, "epoch": 2056} {"train_loss": -6.074261665344238, "global_step": 86384, "epoch": 2056} {"train_loss": -6.253884315490723, "global_step": 86385, "epoch": 2056} {"train_loss": -6.236448287963867, "global_step": 86386, "epoch": 2056} {"train_loss": -6.084888458251953, "global_step": 86387, "epoch": 2056} {"train_loss": -6.18259334564209, "global_step": 86388, "epoch": 2056} {"train_loss": -6.1824116706848145, "global_step": 86389, "epoch": 2056} {"train_loss": -6.2817792892456055, "global_step": 86390, "epoch": 2056} {"train_loss": -6.20970344543457, "global_step": 86391, "epoch": 2056} {"train_loss": -6.159919738769531, "global_step": 86392, "epoch": 2056} {"train_loss": -6.178954215276809, "global_step": 86393, "epoch": 2056, "val_loss": 75192.8203125} {"train_loss": -6.210681438446045, "global_step": 86394, "epoch": 2057} {"train_loss": -6.273532867431641, "global_step": 86395, "epoch": 2057} {"train_loss": -6.211615085601807, "global_step": 86396, "epoch": 2057} {"train_loss": -6.303218364715576, "global_step": 86397, "epoch": 2057} {"train_loss": -6.214344024658203, "global_step": 86398, "epoch": 2057} {"train_loss": -6.3097124099731445, "global_step": 86399, "epoch": 2057} {"train_loss": -6.147027492523193, "global_step": 86400, "epoch": 2057} {"train_loss": -6.255873203277588, "global_step": 86401, "epoch": 2057} {"train_loss": -6.298437118530273, "global_step": 86402, "epoch": 2057} {"train_loss": -6.2223968505859375, "global_step": 86403, "epoch": 2057} {"train_loss": -6.133981704711914, "global_step": 86404, "epoch": 2057} {"train_loss": -6.1790008544921875, "global_step": 86405, "epoch": 2057} {"train_loss": -6.265745162963867, "global_step": 86406, "epoch": 2057} {"train_loss": -6.2288498878479, "global_step": 86407, "epoch": 2057} {"train_loss": -6.134030342102051, "global_step": 86408, "epoch": 2057} {"train_loss": -6.250664234161377, "global_step": 86409, "epoch": 2057} {"train_loss": -6.299280166625977, "global_step": 86410, "epoch": 2057} {"train_loss": -6.301792621612549, "global_step": 86411, "epoch": 2057} {"train_loss": -6.157434463500977, "global_step": 86412, "epoch": 2057} {"train_loss": -6.308511734008789, "global_step": 86413, "epoch": 2057} {"train_loss": -6.342865467071533, "global_step": 86414, "epoch": 2057} {"train_loss": -6.358468532562256, "global_step": 86415, "epoch": 2057} {"train_loss": -6.246593952178955, "global_step": 86416, "epoch": 2057} {"train_loss": -6.218929290771484, "global_step": 86417, "epoch": 2057} {"train_loss": -6.150944709777832, "global_step": 86418, "epoch": 2057} {"train_loss": -6.330809116363525, "global_step": 86419, "epoch": 2057} {"train_loss": -6.187743186950684, "global_step": 86420, "epoch": 2057} {"train_loss": -6.272728443145752, "global_step": 86421, "epoch": 2057} {"train_loss": -6.1823577880859375, "global_step": 86422, "epoch": 2057} {"train_loss": -6.1037750244140625, "global_step": 86423, "epoch": 2057} {"train_loss": -6.173271179199219, "global_step": 86424, "epoch": 2057} {"train_loss": -6.244632720947266, "global_step": 86425, "epoch": 2057} {"train_loss": -6.094528675079346, "global_step": 86426, "epoch": 2057} {"train_loss": -6.220953464508057, "global_step": 86427, "epoch": 2057} {"train_loss": -6.1514692306518555, "global_step": 86428, "epoch": 2057} {"train_loss": -6.157780647277832, "global_step": 86429, "epoch": 2057} {"train_loss": -6.195321559906006, "global_step": 86430, "epoch": 2057} {"train_loss": -6.1298322677612305, "global_step": 86431, "epoch": 2057} {"train_loss": -6.244319915771484, "global_step": 86432, "epoch": 2057} {"train_loss": -6.298340797424316, "global_step": 86433, "epoch": 2057} {"train_loss": -6.21126651763916, "global_step": 86434, "epoch": 2057} {"train_loss": -6.223724138169062, "global_step": 86435, "epoch": 2057, "val_loss": 75085.671875} {"train_loss": -6.150611877441406, "global_step": 86436, "epoch": 2058} {"train_loss": -6.312047958374023, "global_step": 86437, "epoch": 2058} {"train_loss": -6.200944900512695, "global_step": 86438, "epoch": 2058} {"train_loss": -6.225093364715576, "global_step": 86439, "epoch": 2058} {"train_loss": -6.204845428466797, "global_step": 86440, "epoch": 2058} {"train_loss": -6.222834587097168, "global_step": 86441, "epoch": 2058} {"train_loss": -6.187488079071045, "global_step": 86442, "epoch": 2058} {"train_loss": -6.154585361480713, "global_step": 86443, "epoch": 2058} {"train_loss": -6.277402877807617, "global_step": 86444, "epoch": 2058} {"train_loss": -6.204745292663574, "global_step": 86445, "epoch": 2058} {"train_loss": -6.141721248626709, "global_step": 86446, "epoch": 2058} {"train_loss": -6.1635661125183105, "global_step": 86447, "epoch": 2058} {"train_loss": -6.195441246032715, "global_step": 86448, "epoch": 2058} {"train_loss": -6.261500358581543, "global_step": 86449, "epoch": 2058} {"train_loss": -6.238880634307861, "global_step": 86450, "epoch": 2058} {"train_loss": -6.243742942810059, "global_step": 86451, "epoch": 2058} {"train_loss": -6.188486576080322, "global_step": 86452, "epoch": 2058} {"train_loss": -6.160294532775879, "global_step": 86453, "epoch": 2058} {"train_loss": -6.286836624145508, "global_step": 86454, "epoch": 2058} {"train_loss": -6.270134925842285, "global_step": 86455, "epoch": 2058} {"train_loss": -6.151131629943848, "global_step": 86456, "epoch": 2058} {"train_loss": -6.161344528198242, "global_step": 86457, "epoch": 2058} {"train_loss": -6.228758335113525, "global_step": 86458, "epoch": 2058} {"train_loss": -6.1973466873168945, "global_step": 86459, "epoch": 2058} {"train_loss": -6.247086524963379, "global_step": 86460, "epoch": 2058} {"train_loss": -6.234600067138672, "global_step": 86461, "epoch": 2058} {"train_loss": -6.108007431030273, "global_step": 86462, "epoch": 2058} {"train_loss": -6.103199005126953, "global_step": 86463, "epoch": 2058} {"train_loss": -6.182217597961426, "global_step": 86464, "epoch": 2058} {"train_loss": -6.215664863586426, "global_step": 86465, "epoch": 2058} {"train_loss": -6.187382221221924, "global_step": 86466, "epoch": 2058} {"train_loss": -6.3138275146484375, "global_step": 86467, "epoch": 2058} {"train_loss": -6.136615753173828, "global_step": 86468, "epoch": 2058} {"train_loss": -6.0628838539123535, "global_step": 86469, "epoch": 2058} {"train_loss": -6.170748710632324, "global_step": 86470, "epoch": 2058} {"train_loss": -6.129866123199463, "global_step": 86471, "epoch": 2058} {"train_loss": -6.201702117919922, "global_step": 86472, "epoch": 2058} {"train_loss": -6.25533390045166, "global_step": 86473, "epoch": 2058} {"train_loss": -6.176060676574707, "global_step": 86474, "epoch": 2058} {"train_loss": -6.172926902770996, "global_step": 86475, "epoch": 2058} {"train_loss": -6.260319709777832, "global_step": 86476, "epoch": 2058} {"train_loss": -6.201889639809018, "global_step": 86477, "epoch": 2058, "val_loss": 74841.71875} {"train_loss": -6.198064804077148, "global_step": 86478, "epoch": 2059} {"train_loss": -6.291494369506836, "global_step": 86479, "epoch": 2059} {"train_loss": -6.186514377593994, "global_step": 86480, "epoch": 2059} {"train_loss": -6.206101894378662, "global_step": 86481, "epoch": 2059} {"train_loss": -6.226922988891602, "global_step": 86482, "epoch": 2059} {"train_loss": -6.24809455871582, "global_step": 86483, "epoch": 2059} {"train_loss": -6.257863998413086, "global_step": 86484, "epoch": 2059} {"train_loss": -6.1690216064453125, "global_step": 86485, "epoch": 2059} {"train_loss": -6.147652626037598, "global_step": 86486, "epoch": 2059} {"train_loss": -6.158687591552734, "global_step": 86487, "epoch": 2059} {"train_loss": -6.245100975036621, "global_step": 86488, "epoch": 2059} {"train_loss": -6.133289337158203, "global_step": 86489, "epoch": 2059} {"train_loss": -5.924947738647461, "global_step": 86490, "epoch": 2059} {"train_loss": -6.160988807678223, "global_step": 86491, "epoch": 2059} {"train_loss": -6.072334289550781, "global_step": 86492, "epoch": 2059} {"train_loss": -6.098392486572266, "global_step": 86493, "epoch": 2059} {"train_loss": -6.1280975341796875, "global_step": 86494, "epoch": 2059} {"train_loss": -5.974684238433838, "global_step": 86495, "epoch": 2059} {"train_loss": -6.106381416320801, "global_step": 86496, "epoch": 2059} {"train_loss": -5.957197189331055, "global_step": 86497, "epoch": 2059} {"train_loss": -6.24826717376709, "global_step": 86498, "epoch": 2059} {"train_loss": -5.9747209548950195, "global_step": 86499, "epoch": 2059} {"train_loss": -6.189325332641602, "global_step": 86500, "epoch": 2059} {"train_loss": -6.2305169105529785, "global_step": 86501, "epoch": 2059} {"train_loss": -6.150010108947754, "global_step": 86502, "epoch": 2059} {"train_loss": -6.238438606262207, "global_step": 86503, "epoch": 2059} {"train_loss": -6.222810745239258, "global_step": 86504, "epoch": 2059} {"train_loss": -6.1042985916137695, "global_step": 86505, "epoch": 2059} {"train_loss": -6.2845458984375, "global_step": 86506, "epoch": 2059} {"train_loss": -6.239798545837402, "global_step": 86507, "epoch": 2059} {"train_loss": -6.211362838745117, "global_step": 86508, "epoch": 2059} {"train_loss": -6.199190616607666, "global_step": 86509, "epoch": 2059} {"train_loss": -6.186699867248535, "global_step": 86510, "epoch": 2059} {"train_loss": -6.06417179107666, "global_step": 86511, "epoch": 2059} {"train_loss": -6.176497459411621, "global_step": 86512, "epoch": 2059} {"train_loss": -6.141923904418945, "global_step": 86513, "epoch": 2059} {"train_loss": -6.264972686767578, "global_step": 86514, "epoch": 2059} {"train_loss": -6.274372100830078, "global_step": 86515, "epoch": 2059} {"train_loss": -6.215730667114258, "global_step": 86516, "epoch": 2059} {"train_loss": -6.245794296264648, "global_step": 86517, "epoch": 2059} {"train_loss": -6.218526840209961, "global_step": 86518, "epoch": 2059} {"train_loss": -6.171728497459775, "global_step": 86519, "epoch": 2059, "val_loss": 75260.4453125} {"train_loss": -6.053330421447754, "global_step": 86520, "epoch": 2060} {"train_loss": -6.227914810180664, "global_step": 86521, "epoch": 2060} {"train_loss": -6.228458404541016, "global_step": 86522, "epoch": 2060} {"train_loss": -6.31266975402832, "global_step": 86523, "epoch": 2060} {"train_loss": -6.250853538513184, "global_step": 86524, "epoch": 2060} {"train_loss": -6.030289173126221, "global_step": 86525, "epoch": 2060} {"train_loss": -6.281200885772705, "global_step": 86526, "epoch": 2060} {"train_loss": -6.266399383544922, "global_step": 86527, "epoch": 2060} {"train_loss": -6.090002059936523, "global_step": 86528, "epoch": 2060} {"train_loss": -6.186574935913086, "global_step": 86529, "epoch": 2060} {"train_loss": -6.18984842300415, "global_step": 86530, "epoch": 2060} {"train_loss": -6.161388397216797, "global_step": 86531, "epoch": 2060} {"train_loss": -6.11208963394165, "global_step": 86532, "epoch": 2060} {"train_loss": -6.122045516967773, "global_step": 86533, "epoch": 2060} {"train_loss": -6.271455764770508, "global_step": 86534, "epoch": 2060} {"train_loss": -6.149764060974121, "global_step": 86535, "epoch": 2060} {"train_loss": -6.115622043609619, "global_step": 86536, "epoch": 2060} {"train_loss": -6.195425033569336, "global_step": 86537, "epoch": 2060} {"train_loss": -6.119671821594238, "global_step": 86538, "epoch": 2060} {"train_loss": -6.16575813293457, "global_step": 86539, "epoch": 2060} {"train_loss": -6.304457664489746, "global_step": 86540, "epoch": 2060} {"train_loss": -6.117501735687256, "global_step": 86541, "epoch": 2060} {"train_loss": -6.252783298492432, "global_step": 86542, "epoch": 2060} {"train_loss": -6.2081522941589355, "global_step": 86543, "epoch": 2060} {"train_loss": -6.223987579345703, "global_step": 86544, "epoch": 2060} {"train_loss": -6.213189125061035, "global_step": 86545, "epoch": 2060} {"train_loss": -6.155281066894531, "global_step": 86546, "epoch": 2060} {"train_loss": -6.308557510375977, "global_step": 86547, "epoch": 2060} {"train_loss": -6.130385398864746, "global_step": 86548, "epoch": 2060} {"train_loss": -6.216418266296387, "global_step": 86549, "epoch": 2060} {"train_loss": -6.164119720458984, "global_step": 86550, "epoch": 2060} {"train_loss": -6.206938743591309, "global_step": 86551, "epoch": 2060} {"train_loss": -6.35858154296875, "global_step": 86552, "epoch": 2060} {"train_loss": -6.179409027099609, "global_step": 86553, "epoch": 2060} {"train_loss": -6.196922302246094, "global_step": 86554, "epoch": 2060} {"train_loss": -6.3310394287109375, "global_step": 86555, "epoch": 2060} {"train_loss": -6.143969535827637, "global_step": 86556, "epoch": 2060} {"train_loss": -6.183037757873535, "global_step": 86557, "epoch": 2060} {"train_loss": -6.336860179901123, "global_step": 86558, "epoch": 2060} {"train_loss": -6.1343183517456055, "global_step": 86559, "epoch": 2060} {"train_loss": -6.164024353027344, "global_step": 86560, "epoch": 2060} {"train_loss": -6.19862041019258, "global_step": 86561, "epoch": 2060, "val_loss": 75138.5625} {"train_loss": -6.229892730712891, "global_step": 86562, "epoch": 2061} {"train_loss": -6.247026443481445, "global_step": 86563, "epoch": 2061} {"train_loss": -6.269054889678955, "global_step": 86564, "epoch": 2061} {"train_loss": -6.252903461456299, "global_step": 86565, "epoch": 2061} {"train_loss": -6.256564140319824, "global_step": 86566, "epoch": 2061} {"train_loss": -6.1346845626831055, "global_step": 86567, "epoch": 2061} {"train_loss": -6.1701860427856445, "global_step": 86568, "epoch": 2061} {"train_loss": -6.19425106048584, "global_step": 86569, "epoch": 2061} {"train_loss": -6.1537275314331055, "global_step": 86570, "epoch": 2061} {"train_loss": -6.168438911437988, "global_step": 86571, "epoch": 2061} {"train_loss": -6.235121250152588, "global_step": 86572, "epoch": 2061} {"train_loss": -6.160154342651367, "global_step": 86573, "epoch": 2061} {"train_loss": -6.15238094329834, "global_step": 86574, "epoch": 2061} {"train_loss": -6.226596832275391, "global_step": 86575, "epoch": 2061} {"train_loss": -6.247981548309326, "global_step": 86576, "epoch": 2061} {"train_loss": -6.208670616149902, "global_step": 86577, "epoch": 2061} {"train_loss": -6.274127006530762, "global_step": 86578, "epoch": 2061} {"train_loss": -6.199164390563965, "global_step": 86579, "epoch": 2061} {"train_loss": -6.16326379776001, "global_step": 86580, "epoch": 2061} {"train_loss": -6.191711902618408, "global_step": 86581, "epoch": 2061} {"train_loss": -6.273775100708008, "global_step": 86582, "epoch": 2061} {"train_loss": -6.28857421875, "global_step": 86583, "epoch": 2061} {"train_loss": -6.2381391525268555, "global_step": 86584, "epoch": 2061} {"train_loss": -6.149488925933838, "global_step": 86585, "epoch": 2061} {"train_loss": -6.1590399742126465, "global_step": 86586, "epoch": 2061} {"train_loss": -6.084225654602051, "global_step": 86587, "epoch": 2061} {"train_loss": -6.121855735778809, "global_step": 86588, "epoch": 2061} {"train_loss": -6.242938995361328, "global_step": 86589, "epoch": 2061} {"train_loss": -6.32369327545166, "global_step": 86590, "epoch": 2061} {"train_loss": -6.308944225311279, "global_step": 86591, "epoch": 2061} {"train_loss": -6.1162109375, "global_step": 86592, "epoch": 2061} {"train_loss": -6.193389892578125, "global_step": 86593, "epoch": 2061} {"train_loss": -6.166738986968994, "global_step": 86594, "epoch": 2061} {"train_loss": -6.260924339294434, "global_step": 86595, "epoch": 2061} {"train_loss": -6.181995391845703, "global_step": 86596, "epoch": 2061} {"train_loss": -6.250702381134033, "global_step": 86597, "epoch": 2061} {"train_loss": -6.185201644897461, "global_step": 86598, "epoch": 2061} {"train_loss": -6.31650447845459, "global_step": 86599, "epoch": 2061} {"train_loss": -6.249073505401611, "global_step": 86600, "epoch": 2061} {"train_loss": -6.127470016479492, "global_step": 86601, "epoch": 2061} {"train_loss": -6.178448677062988, "global_step": 86602, "epoch": 2061} {"train_loss": -6.206244491395497, "global_step": 86603, "epoch": 2061, "val_loss": 75465.234375} {"train_loss": -6.1673054695129395, "global_step": 86604, "epoch": 2062} {"train_loss": -6.133401870727539, "global_step": 86605, "epoch": 2062} {"train_loss": -6.209958076477051, "global_step": 86606, "epoch": 2062} {"train_loss": -6.270943641662598, "global_step": 86607, "epoch": 2062} {"train_loss": -6.193879127502441, "global_step": 86608, "epoch": 2062} {"train_loss": -6.32852029800415, "global_step": 86609, "epoch": 2062} {"train_loss": -6.096954345703125, "global_step": 86610, "epoch": 2062} {"train_loss": -6.2747297286987305, "global_step": 86611, "epoch": 2062} {"train_loss": -6.068992614746094, "global_step": 86612, "epoch": 2062} {"train_loss": -6.191450119018555, "global_step": 86613, "epoch": 2062} {"train_loss": -6.262872219085693, "global_step": 86614, "epoch": 2062} {"train_loss": -6.2607197761535645, "global_step": 86615, "epoch": 2062} {"train_loss": -6.243646621704102, "global_step": 86616, "epoch": 2062} {"train_loss": -6.240046977996826, "global_step": 86617, "epoch": 2062} {"train_loss": -6.3514299392700195, "global_step": 86618, "epoch": 2062} {"train_loss": -6.139795303344727, "global_step": 86619, "epoch": 2062} {"train_loss": -6.2709479331970215, "global_step": 86620, "epoch": 2062} {"train_loss": -6.313640594482422, "global_step": 86621, "epoch": 2062} {"train_loss": -6.231266975402832, "global_step": 86622, "epoch": 2062} {"train_loss": -6.214680194854736, "global_step": 86623, "epoch": 2062} {"train_loss": -6.281243324279785, "global_step": 86624, "epoch": 2062} {"train_loss": -6.172381401062012, "global_step": 86625, "epoch": 2062} {"train_loss": -6.193597793579102, "global_step": 86626, "epoch": 2062} {"train_loss": -6.187722682952881, "global_step": 86627, "epoch": 2062} {"train_loss": -6.221998691558838, "global_step": 86628, "epoch": 2062} {"train_loss": -6.119653701782227, "global_step": 86629, "epoch": 2062} {"train_loss": -6.20964241027832, "global_step": 86630, "epoch": 2062} {"train_loss": -6.333010673522949, "global_step": 86631, "epoch": 2062} {"train_loss": -6.26455545425415, "global_step": 86632, "epoch": 2062} {"train_loss": -6.283275604248047, "global_step": 86633, "epoch": 2062} {"train_loss": -6.198875427246094, "global_step": 86634, "epoch": 2062} {"train_loss": -6.21472692489624, "global_step": 86635, "epoch": 2062} {"train_loss": -6.13974666595459, "global_step": 86636, "epoch": 2062} {"train_loss": -6.210562229156494, "global_step": 86637, "epoch": 2062} {"train_loss": -6.0422563552856445, "global_step": 86638, "epoch": 2062} {"train_loss": -6.116939544677734, "global_step": 86639, "epoch": 2062} {"train_loss": -6.239645957946777, "global_step": 86640, "epoch": 2062} {"train_loss": -6.288844108581543, "global_step": 86641, "epoch": 2062} {"train_loss": -6.34730339050293, "global_step": 86642, "epoch": 2062} {"train_loss": -6.090944766998291, "global_step": 86643, "epoch": 2062} {"train_loss": -6.261160850524902, "global_step": 86644, "epoch": 2062} {"train_loss": -6.2168589887164885, "global_step": 86645, "epoch": 2062, "val_loss": 75021.4140625} {"train_loss": -6.216183185577393, "global_step": 86646, "epoch": 2063} {"train_loss": -6.090055465698242, "global_step": 86647, "epoch": 2063} {"train_loss": -6.247737884521484, "global_step": 86648, "epoch": 2063} {"train_loss": -6.223808765411377, "global_step": 86649, "epoch": 2063} {"train_loss": -6.198470592498779, "global_step": 86650, "epoch": 2063} {"train_loss": -6.2227888107299805, "global_step": 86651, "epoch": 2063} {"train_loss": -6.269676685333252, "global_step": 86652, "epoch": 2063} {"train_loss": -6.171957492828369, "global_step": 86653, "epoch": 2063} {"train_loss": -6.302313327789307, "global_step": 86654, "epoch": 2063} {"train_loss": -6.201681613922119, "global_step": 86655, "epoch": 2063} {"train_loss": -6.228020191192627, "global_step": 86656, "epoch": 2063} {"train_loss": -6.157453536987305, "global_step": 86657, "epoch": 2063} {"train_loss": -6.264150619506836, "global_step": 86658, "epoch": 2063} {"train_loss": -6.267484188079834, "global_step": 86659, "epoch": 2063} {"train_loss": -6.237668991088867, "global_step": 86660, "epoch": 2063} {"train_loss": -6.20601749420166, "global_step": 86661, "epoch": 2063} {"train_loss": -6.256539344787598, "global_step": 86662, "epoch": 2063} {"train_loss": -6.147899627685547, "global_step": 86663, "epoch": 2063} {"train_loss": -6.148514747619629, "global_step": 86664, "epoch": 2063} {"train_loss": -6.250994682312012, "global_step": 86665, "epoch": 2063} {"train_loss": -6.148264408111572, "global_step": 86666, "epoch": 2063} {"train_loss": -6.15479850769043, "global_step": 86667, "epoch": 2063} {"train_loss": -6.221268177032471, "global_step": 86668, "epoch": 2063} {"train_loss": -6.219632148742676, "global_step": 86669, "epoch": 2063} {"train_loss": -6.041271686553955, "global_step": 86670, "epoch": 2063} {"train_loss": -6.087143898010254, "global_step": 86671, "epoch": 2063} {"train_loss": -6.2654314041137695, "global_step": 86672, "epoch": 2063} {"train_loss": -6.114649772644043, "global_step": 86673, "epoch": 2063} {"train_loss": -6.03665828704834, "global_step": 86674, "epoch": 2063} {"train_loss": -6.21446418762207, "global_step": 86675, "epoch": 2063} {"train_loss": -6.18657112121582, "global_step": 86676, "epoch": 2063} {"train_loss": -6.155586242675781, "global_step": 86677, "epoch": 2063} {"train_loss": -6.15179967880249, "global_step": 86678, "epoch": 2063} {"train_loss": -6.065186500549316, "global_step": 86679, "epoch": 2063} {"train_loss": -6.229308128356934, "global_step": 86680, "epoch": 2063} {"train_loss": -6.1254048347473145, "global_step": 86681, "epoch": 2063} {"train_loss": -6.191356658935547, "global_step": 86682, "epoch": 2063} {"train_loss": -6.1821136474609375, "global_step": 86683, "epoch": 2063} {"train_loss": -6.150404453277588, "global_step": 86684, "epoch": 2063} {"train_loss": -6.0557708740234375, "global_step": 86685, "epoch": 2063} {"train_loss": -6.280484199523926, "global_step": 86686, "epoch": 2063} {"train_loss": -6.185449963524228, "global_step": 86687, "epoch": 2063, "val_loss": 75334.53125} {"train_loss": -6.173898696899414, "global_step": 86688, "epoch": 2064} {"train_loss": -6.115766525268555, "global_step": 86689, "epoch": 2064} {"train_loss": -6.161831855773926, "global_step": 86690, "epoch": 2064} {"train_loss": -6.139254570007324, "global_step": 86691, "epoch": 2064} {"train_loss": -6.254584312438965, "global_step": 86692, "epoch": 2064} {"train_loss": -6.18881893157959, "global_step": 86693, "epoch": 2064} {"train_loss": -6.078120708465576, "global_step": 86694, "epoch": 2064} {"train_loss": -6.194797515869141, "global_step": 86695, "epoch": 2064} {"train_loss": -6.135775566101074, "global_step": 86696, "epoch": 2064} {"train_loss": -6.145651817321777, "global_step": 86697, "epoch": 2064} {"train_loss": -6.233064651489258, "global_step": 86698, "epoch": 2064} {"train_loss": -6.367646217346191, "global_step": 86699, "epoch": 2064} {"train_loss": -6.262426376342773, "global_step": 86700, "epoch": 2064} {"train_loss": -6.342902183532715, "global_step": 86701, "epoch": 2064} {"train_loss": -6.298009872436523, "global_step": 86702, "epoch": 2064} {"train_loss": -6.218910217285156, "global_step": 86703, "epoch": 2064} {"train_loss": -6.210421562194824, "global_step": 86704, "epoch": 2064} {"train_loss": -6.139338493347168, "global_step": 86705, "epoch": 2064} {"train_loss": -6.284510135650635, "global_step": 86706, "epoch": 2064} {"train_loss": -6.213090896606445, "global_step": 86707, "epoch": 2064} {"train_loss": -6.277251243591309, "global_step": 86708, "epoch": 2064} {"train_loss": -6.261469841003418, "global_step": 86709, "epoch": 2064} {"train_loss": -6.149893760681152, "global_step": 86710, "epoch": 2064} {"train_loss": -6.18149471282959, "global_step": 86711, "epoch": 2064} {"train_loss": -6.038361549377441, "global_step": 86712, "epoch": 2064} {"train_loss": -6.177219867706299, "global_step": 86713, "epoch": 2064} {"train_loss": -6.219054698944092, "global_step": 86714, "epoch": 2064} {"train_loss": -6.111051082611084, "global_step": 86715, "epoch": 2064} {"train_loss": -6.070769786834717, "global_step": 86716, "epoch": 2064} {"train_loss": -6.216101169586182, "global_step": 86717, "epoch": 2064} {"train_loss": -6.160049915313721, "global_step": 86718, "epoch": 2064} {"train_loss": -6.153755187988281, "global_step": 86719, "epoch": 2064} {"train_loss": -6.205521583557129, "global_step": 86720, "epoch": 2064} {"train_loss": -6.256728172302246, "global_step": 86721, "epoch": 2064} {"train_loss": -6.116683006286621, "global_step": 86722, "epoch": 2064} {"train_loss": -6.212856292724609, "global_step": 86723, "epoch": 2064} {"train_loss": -6.185574054718018, "global_step": 86724, "epoch": 2064} {"train_loss": -6.199969291687012, "global_step": 86725, "epoch": 2064} {"train_loss": -6.179903030395508, "global_step": 86726, "epoch": 2064} {"train_loss": -6.206164360046387, "global_step": 86727, "epoch": 2064} {"train_loss": -6.299920082092285, "global_step": 86728, "epoch": 2064} {"train_loss": -6.195417313348679, "global_step": 86729, "epoch": 2064, "val_loss": 75113.9609375} {"train_loss": -6.336341857910156, "global_step": 86730, "epoch": 2065} {"train_loss": -6.1360368728637695, "global_step": 86731, "epoch": 2065} {"train_loss": -6.20359992980957, "global_step": 86732, "epoch": 2065} {"train_loss": -6.329127311706543, "global_step": 86733, "epoch": 2065} {"train_loss": -6.139289379119873, "global_step": 86734, "epoch": 2065} {"train_loss": -6.225798606872559, "global_step": 86735, "epoch": 2065} {"train_loss": -6.206864356994629, "global_step": 86736, "epoch": 2065} {"train_loss": -6.3232741355896, "global_step": 86737, "epoch": 2065} {"train_loss": -6.234376907348633, "global_step": 86738, "epoch": 2065} {"train_loss": -6.198655128479004, "global_step": 86739, "epoch": 2065} {"train_loss": -6.253569602966309, "global_step": 86740, "epoch": 2065} {"train_loss": -6.284000873565674, "global_step": 86741, "epoch": 2065} {"train_loss": -6.152880668640137, "global_step": 86742, "epoch": 2065} {"train_loss": -6.205654621124268, "global_step": 86743, "epoch": 2065} {"train_loss": -6.340221405029297, "global_step": 86744, "epoch": 2065} {"train_loss": -6.352395534515381, "global_step": 86745, "epoch": 2065} {"train_loss": -6.270619869232178, "global_step": 86746, "epoch": 2065} {"train_loss": -6.300379753112793, "global_step": 86747, "epoch": 2065} {"train_loss": -6.349923133850098, "global_step": 86748, "epoch": 2065} {"train_loss": -6.3805928230285645, "global_step": 86749, "epoch": 2065} {"train_loss": -6.35094690322876, "global_step": 86750, "epoch": 2065} {"train_loss": -6.145806312561035, "global_step": 86751, "epoch": 2065} {"train_loss": -6.2728424072265625, "global_step": 86752, "epoch": 2065} {"train_loss": -6.223187446594238, "global_step": 86753, "epoch": 2065} {"train_loss": -6.1819257736206055, "global_step": 86754, "epoch": 2065} {"train_loss": -6.100248336791992, "global_step": 86755, "epoch": 2065} {"train_loss": -6.160607814788818, "global_step": 86756, "epoch": 2065} {"train_loss": -6.161344528198242, "global_step": 86757, "epoch": 2065} {"train_loss": -6.153912544250488, "global_step": 86758, "epoch": 2065} {"train_loss": -6.061445713043213, "global_step": 86759, "epoch": 2065} {"train_loss": -6.213419437408447, "global_step": 86760, "epoch": 2065} {"train_loss": -6.249144554138184, "global_step": 86761, "epoch": 2065} {"train_loss": -6.130458354949951, "global_step": 86762, "epoch": 2065} {"train_loss": -6.220839500427246, "global_step": 86763, "epoch": 2065} {"train_loss": -6.212660789489746, "global_step": 86764, "epoch": 2065} {"train_loss": -6.214932441711426, "global_step": 86765, "epoch": 2065} {"train_loss": -6.170846939086914, "global_step": 86766, "epoch": 2065} {"train_loss": -6.249119758605957, "global_step": 86767, "epoch": 2065} {"train_loss": -6.238520622253418, "global_step": 86768, "epoch": 2065} {"train_loss": -6.327998638153076, "global_step": 86769, "epoch": 2065} {"train_loss": -6.260017395019531, "global_step": 86770, "epoch": 2065} {"train_loss": -6.231648763020833, "global_step": 86771, "epoch": 2065, "val_loss": 75482.953125} {"train_loss": -6.2369256019592285, "global_step": 86772, "epoch": 2066} {"train_loss": -6.281234264373779, "global_step": 86773, "epoch": 2066} {"train_loss": -6.257389068603516, "global_step": 86774, "epoch": 2066} {"train_loss": -6.294170379638672, "global_step": 86775, "epoch": 2066} {"train_loss": -6.174701690673828, "global_step": 86776, "epoch": 2066} {"train_loss": -6.243585586547852, "global_step": 86777, "epoch": 2066} {"train_loss": -6.203592300415039, "global_step": 86778, "epoch": 2066} {"train_loss": -6.309903144836426, "global_step": 86779, "epoch": 2066} {"train_loss": -6.1497392654418945, "global_step": 86780, "epoch": 2066} {"train_loss": -6.271330833435059, "global_step": 86781, "epoch": 2066} {"train_loss": -6.371155738830566, "global_step": 86782, "epoch": 2066} {"train_loss": -6.195401191711426, "global_step": 86783, "epoch": 2066} {"train_loss": -6.251855850219727, "global_step": 86784, "epoch": 2066} {"train_loss": -6.225318908691406, "global_step": 86785, "epoch": 2066} {"train_loss": -6.188138961791992, "global_step": 86786, "epoch": 2066} {"train_loss": -6.26300573348999, "global_step": 86787, "epoch": 2066} {"train_loss": -6.185611248016357, "global_step": 86788, "epoch": 2066} {"train_loss": -6.1531877517700195, "global_step": 86789, "epoch": 2066} {"train_loss": -6.06562614440918, "global_step": 86790, "epoch": 2066} {"train_loss": -6.132876396179199, "global_step": 86791, "epoch": 2066} {"train_loss": -6.21433687210083, "global_step": 86792, "epoch": 2066} {"train_loss": -6.246495723724365, "global_step": 86793, "epoch": 2066} {"train_loss": -6.250642776489258, "global_step": 86794, "epoch": 2066} {"train_loss": -6.228837013244629, "global_step": 86795, "epoch": 2066} {"train_loss": -6.149863243103027, "global_step": 86796, "epoch": 2066} {"train_loss": -6.084103584289551, "global_step": 86797, "epoch": 2066} {"train_loss": -6.146108627319336, "global_step": 86798, "epoch": 2066} {"train_loss": -6.160098552703857, "global_step": 86799, "epoch": 2066} {"train_loss": -6.166118621826172, "global_step": 86800, "epoch": 2066} {"train_loss": -6.187033653259277, "global_step": 86801, "epoch": 2066} {"train_loss": -6.134496212005615, "global_step": 86802, "epoch": 2066} {"train_loss": -6.21995210647583, "global_step": 86803, "epoch": 2066} {"train_loss": -6.3263654708862305, "global_step": 86804, "epoch": 2066} {"train_loss": -6.253002166748047, "global_step": 86805, "epoch": 2066} {"train_loss": -6.141083717346191, "global_step": 86806, "epoch": 2066} {"train_loss": -6.2789764404296875, "global_step": 86807, "epoch": 2066} {"train_loss": -6.187737464904785, "global_step": 86808, "epoch": 2066} {"train_loss": -6.1150922775268555, "global_step": 86809, "epoch": 2066} {"train_loss": -6.183477401733398, "global_step": 86810, "epoch": 2066} {"train_loss": -6.134235382080078, "global_step": 86811, "epoch": 2066} {"train_loss": -6.168370246887207, "global_step": 86812, "epoch": 2066} {"train_loss": -6.20364465032305, "global_step": 86813, "epoch": 2066, "val_loss": 75614.6484375} {"train_loss": -6.072577953338623, "global_step": 86814, "epoch": 2067} {"train_loss": -6.030668258666992, "global_step": 86815, "epoch": 2067} {"train_loss": -6.291668891906738, "global_step": 86816, "epoch": 2067} {"train_loss": -6.133700370788574, "global_step": 86817, "epoch": 2067} {"train_loss": -6.219263076782227, "global_step": 86818, "epoch": 2067} {"train_loss": -6.126288414001465, "global_step": 86819, "epoch": 2067} {"train_loss": -6.180288314819336, "global_step": 86820, "epoch": 2067} {"train_loss": -6.198328971862793, "global_step": 86821, "epoch": 2067} {"train_loss": -6.223133563995361, "global_step": 86822, "epoch": 2067} {"train_loss": -6.132930755615234, "global_step": 86823, "epoch": 2067} {"train_loss": -6.168301582336426, "global_step": 86824, "epoch": 2067} {"train_loss": -6.271694183349609, "global_step": 86825, "epoch": 2067} {"train_loss": -6.214832305908203, "global_step": 86826, "epoch": 2067} {"train_loss": -6.247025489807129, "global_step": 86827, "epoch": 2067} {"train_loss": -6.173750877380371, "global_step": 86828, "epoch": 2067} {"train_loss": -6.3000054359436035, "global_step": 86829, "epoch": 2067} {"train_loss": -6.1457905769348145, "global_step": 86830, "epoch": 2067} {"train_loss": -6.116006851196289, "global_step": 86831, "epoch": 2067} {"train_loss": -6.2071990966796875, "global_step": 86832, "epoch": 2067} {"train_loss": -6.287968635559082, "global_step": 86833, "epoch": 2067} {"train_loss": -6.256045341491699, "global_step": 86834, "epoch": 2067} {"train_loss": -6.289706230163574, "global_step": 86835, "epoch": 2067} {"train_loss": -6.247664451599121, "global_step": 86836, "epoch": 2067} {"train_loss": -6.12557315826416, "global_step": 86837, "epoch": 2067} {"train_loss": -6.199796199798584, "global_step": 86838, "epoch": 2067} {"train_loss": -6.158960819244385, "global_step": 86839, "epoch": 2067} {"train_loss": -6.223570823669434, "global_step": 86840, "epoch": 2067} {"train_loss": -6.340374946594238, "global_step": 86841, "epoch": 2067} {"train_loss": -6.206433296203613, "global_step": 86842, "epoch": 2067} {"train_loss": -6.355670928955078, "global_step": 86843, "epoch": 2067} {"train_loss": -6.094595909118652, "global_step": 86844, "epoch": 2067} {"train_loss": -6.23473596572876, "global_step": 86845, "epoch": 2067} {"train_loss": -6.264589309692383, "global_step": 86846, "epoch": 2067} {"train_loss": -6.149757385253906, "global_step": 86847, "epoch": 2067} {"train_loss": -6.152586460113525, "global_step": 86848, "epoch": 2067} {"train_loss": -6.23154354095459, "global_step": 86849, "epoch": 2067} {"train_loss": -6.257361888885498, "global_step": 86850, "epoch": 2067} {"train_loss": -6.252593994140625, "global_step": 86851, "epoch": 2067} {"train_loss": -6.276843070983887, "global_step": 86852, "epoch": 2067} {"train_loss": -6.216083526611328, "global_step": 86853, "epoch": 2067} {"train_loss": -6.2151594161987305, "global_step": 86854, "epoch": 2067} {"train_loss": -6.206763097218105, "global_step": 86855, "epoch": 2067, "val_loss": 75347.046875} {"train_loss": -6.157441139221191, "global_step": 86856, "epoch": 2068} {"train_loss": -6.299765586853027, "global_step": 86857, "epoch": 2068} {"train_loss": -6.218852996826172, "global_step": 86858, "epoch": 2068} {"train_loss": -6.26131010055542, "global_step": 86859, "epoch": 2068} {"train_loss": -6.252693176269531, "global_step": 86860, "epoch": 2068} {"train_loss": -6.1839680671691895, "global_step": 86861, "epoch": 2068} {"train_loss": -6.312081813812256, "global_step": 86862, "epoch": 2068} {"train_loss": -6.12553596496582, "global_step": 86863, "epoch": 2068} {"train_loss": -6.252384185791016, "global_step": 86864, "epoch": 2068} {"train_loss": -6.326455593109131, "global_step": 86865, "epoch": 2068} {"train_loss": -6.191648960113525, "global_step": 86866, "epoch": 2068} {"train_loss": -6.2396392822265625, "global_step": 86867, "epoch": 2068} {"train_loss": -6.2849273681640625, "global_step": 86868, "epoch": 2068} {"train_loss": -6.112858772277832, "global_step": 86869, "epoch": 2068} {"train_loss": -6.2365522384643555, "global_step": 86870, "epoch": 2068} {"train_loss": -6.261143684387207, "global_step": 86871, "epoch": 2068} {"train_loss": -6.150217533111572, "global_step": 86872, "epoch": 2068} {"train_loss": -6.1967949867248535, "global_step": 86873, "epoch": 2068} {"train_loss": -6.060919284820557, "global_step": 86874, "epoch": 2068} {"train_loss": -6.164920330047607, "global_step": 86875, "epoch": 2068} {"train_loss": -6.233123779296875, "global_step": 86876, "epoch": 2068} {"train_loss": -6.154496669769287, "global_step": 86877, "epoch": 2068} {"train_loss": -6.093510627746582, "global_step": 86878, "epoch": 2068} {"train_loss": -6.160427570343018, "global_step": 86879, "epoch": 2068} {"train_loss": -6.233124732971191, "global_step": 86880, "epoch": 2068} {"train_loss": -6.117473602294922, "global_step": 86881, "epoch": 2068} {"train_loss": -6.17335319519043, "global_step": 86882, "epoch": 2068} {"train_loss": -6.132945537567139, "global_step": 86883, "epoch": 2068} {"train_loss": -6.126562118530273, "global_step": 86884, "epoch": 2068} {"train_loss": -6.1972198486328125, "global_step": 86885, "epoch": 2068} {"train_loss": -6.076066017150879, "global_step": 86886, "epoch": 2068} {"train_loss": -6.1365156173706055, "global_step": 86887, "epoch": 2068} {"train_loss": -6.224156856536865, "global_step": 86888, "epoch": 2068} {"train_loss": -6.204662322998047, "global_step": 86889, "epoch": 2068} {"train_loss": -6.184538841247559, "global_step": 86890, "epoch": 2068} {"train_loss": -6.117691993713379, "global_step": 86891, "epoch": 2068} {"train_loss": -6.264966011047363, "global_step": 86892, "epoch": 2068} {"train_loss": -6.159614562988281, "global_step": 86893, "epoch": 2068} {"train_loss": -6.227002143859863, "global_step": 86894, "epoch": 2068} {"train_loss": -6.063684463500977, "global_step": 86895, "epoch": 2068} {"train_loss": -6.134716987609863, "global_step": 86896, "epoch": 2068} {"train_loss": -6.191805748712449, "global_step": 86897, "epoch": 2068, "val_loss": 75238.78125} {"train_loss": -6.103711128234863, "global_step": 86898, "epoch": 2069} {"train_loss": -6.302001953125, "global_step": 86899, "epoch": 2069} {"train_loss": -6.2665791511535645, "global_step": 86900, "epoch": 2069} {"train_loss": -6.0719733238220215, "global_step": 86901, "epoch": 2069} {"train_loss": -6.122446060180664, "global_step": 86902, "epoch": 2069} {"train_loss": -6.142526149749756, "global_step": 86903, "epoch": 2069} {"train_loss": -6.26834774017334, "global_step": 86904, "epoch": 2069} {"train_loss": -6.125054836273193, "global_step": 86905, "epoch": 2069} {"train_loss": -6.205085754394531, "global_step": 86906, "epoch": 2069} {"train_loss": -6.269928455352783, "global_step": 86907, "epoch": 2069} {"train_loss": -6.2092695236206055, "global_step": 86908, "epoch": 2069} {"train_loss": -6.203067779541016, "global_step": 86909, "epoch": 2069} {"train_loss": -6.17289924621582, "global_step": 86910, "epoch": 2069} {"train_loss": -6.198517799377441, "global_step": 86911, "epoch": 2069} {"train_loss": -6.1867265701293945, "global_step": 86912, "epoch": 2069} {"train_loss": -6.165507793426514, "global_step": 86913, "epoch": 2069} {"train_loss": -6.202889442443848, "global_step": 86914, "epoch": 2069} {"train_loss": -6.265872955322266, "global_step": 86915, "epoch": 2069} {"train_loss": -6.137197971343994, "global_step": 86916, "epoch": 2069} {"train_loss": -6.183842658996582, "global_step": 86917, "epoch": 2069} {"train_loss": -6.250761032104492, "global_step": 86918, "epoch": 2069} {"train_loss": -6.153592109680176, "global_step": 86919, "epoch": 2069} {"train_loss": -6.145948886871338, "global_step": 86920, "epoch": 2069} {"train_loss": -6.176069259643555, "global_step": 86921, "epoch": 2069} {"train_loss": -6.176580429077148, "global_step": 86922, "epoch": 2069} {"train_loss": -6.279667854309082, "global_step": 86923, "epoch": 2069} {"train_loss": -6.226289749145508, "global_step": 86924, "epoch": 2069} {"train_loss": -6.137114524841309, "global_step": 86925, "epoch": 2069} {"train_loss": -6.226778984069824, "global_step": 86926, "epoch": 2069} {"train_loss": -6.079567909240723, "global_step": 86927, "epoch": 2069} {"train_loss": -6.249238967895508, "global_step": 86928, "epoch": 2069} {"train_loss": -6.163496971130371, "global_step": 86929, "epoch": 2069} {"train_loss": -6.174663543701172, "global_step": 86930, "epoch": 2069} {"train_loss": -6.23942756652832, "global_step": 86931, "epoch": 2069} {"train_loss": -6.111100673675537, "global_step": 86932, "epoch": 2069} {"train_loss": -6.307180404663086, "global_step": 86933, "epoch": 2069} {"train_loss": -6.272647857666016, "global_step": 86934, "epoch": 2069} {"train_loss": -6.013959884643555, "global_step": 86935, "epoch": 2069} {"train_loss": -6.158067226409912, "global_step": 86936, "epoch": 2069} {"train_loss": -6.254278182983398, "global_step": 86937, "epoch": 2069} {"train_loss": -6.31892204284668, "global_step": 86938, "epoch": 2069} {"train_loss": -6.196361598514375, "global_step": 86939, "epoch": 2069, "val_loss": 75289.9375} {"train_loss": -6.186845779418945, "global_step": 86940, "epoch": 2070} {"train_loss": -6.2422308921813965, "global_step": 86941, "epoch": 2070} {"train_loss": -6.396218299865723, "global_step": 86942, "epoch": 2070} {"train_loss": -6.247549533843994, "global_step": 86943, "epoch": 2070} {"train_loss": -6.280588626861572, "global_step": 86944, "epoch": 2070} {"train_loss": -6.326235771179199, "global_step": 86945, "epoch": 2070} {"train_loss": -6.107966899871826, "global_step": 86946, "epoch": 2070} {"train_loss": -6.272263050079346, "global_step": 86947, "epoch": 2070} {"train_loss": -6.311495780944824, "global_step": 86948, "epoch": 2070} {"train_loss": -6.317660808563232, "global_step": 86949, "epoch": 2070} {"train_loss": -6.158838272094727, "global_step": 86950, "epoch": 2070} {"train_loss": -6.302788734436035, "global_step": 86951, "epoch": 2070} {"train_loss": -6.3552141189575195, "global_step": 86952, "epoch": 2070} {"train_loss": -6.278048038482666, "global_step": 86953, "epoch": 2070} {"train_loss": -6.248490333557129, "global_step": 86954, "epoch": 2070} {"train_loss": -6.270663261413574, "global_step": 86955, "epoch": 2070} {"train_loss": -6.148284912109375, "global_step": 86956, "epoch": 2070} {"train_loss": -6.178103923797607, "global_step": 86957, "epoch": 2070} {"train_loss": -6.195544242858887, "global_step": 86958, "epoch": 2070} {"train_loss": -6.1290483474731445, "global_step": 86959, "epoch": 2070} {"train_loss": -6.211082935333252, "global_step": 86960, "epoch": 2070} {"train_loss": -6.27136754989624, "global_step": 86961, "epoch": 2070} {"train_loss": -6.292614936828613, "global_step": 86962, "epoch": 2070} {"train_loss": -6.16661262512207, "global_step": 86963, "epoch": 2070} {"train_loss": -6.292901039123535, "global_step": 86964, "epoch": 2070} {"train_loss": -6.317799091339111, "global_step": 86965, "epoch": 2070} {"train_loss": -6.1297454833984375, "global_step": 86966, "epoch": 2070} {"train_loss": -6.1954026222229, "global_step": 86967, "epoch": 2070} {"train_loss": -6.2168474197387695, "global_step": 86968, "epoch": 2070} {"train_loss": -6.248874664306641, "global_step": 86969, "epoch": 2070} {"train_loss": -6.288603782653809, "global_step": 86970, "epoch": 2070} {"train_loss": -6.365326881408691, "global_step": 86971, "epoch": 2070} {"train_loss": -6.172231674194336, "global_step": 86972, "epoch": 2070} {"train_loss": -6.16359806060791, "global_step": 86973, "epoch": 2070} {"train_loss": -6.0523247718811035, "global_step": 86974, "epoch": 2070} {"train_loss": -6.221718788146973, "global_step": 86975, "epoch": 2070} {"train_loss": -6.127405166625977, "global_step": 86976, "epoch": 2070} {"train_loss": -6.027739524841309, "global_step": 86977, "epoch": 2070} {"train_loss": -6.2895827293396, "global_step": 86978, "epoch": 2070} {"train_loss": -5.983462810516357, "global_step": 86979, "epoch": 2070} {"train_loss": -6.13514518737793, "global_step": 86980, "epoch": 2070} {"train_loss": -6.22015076591855, "global_step": 86981, "epoch": 2070, "val_loss": 75194.453125} {"train_loss": -6.1651692390441895, "global_step": 86982, "epoch": 2071} {"train_loss": -6.1648430824279785, "global_step": 86983, "epoch": 2071} {"train_loss": -6.126895904541016, "global_step": 86984, "epoch": 2071} {"train_loss": -6.201239585876465, "global_step": 86985, "epoch": 2071} {"train_loss": -6.136284828186035, "global_step": 86986, "epoch": 2071} {"train_loss": -6.112361907958984, "global_step": 86987, "epoch": 2071} {"train_loss": -6.151802062988281, "global_step": 86988, "epoch": 2071} {"train_loss": -6.2119550704956055, "global_step": 86989, "epoch": 2071} {"train_loss": -6.102653503417969, "global_step": 86990, "epoch": 2071} {"train_loss": -6.072812557220459, "global_step": 86991, "epoch": 2071} {"train_loss": -6.185492038726807, "global_step": 86992, "epoch": 2071} {"train_loss": -6.264114856719971, "global_step": 86993, "epoch": 2071} {"train_loss": -6.149319171905518, "global_step": 86994, "epoch": 2071} {"train_loss": -6.269772052764893, "global_step": 86995, "epoch": 2071} {"train_loss": -6.131546974182129, "global_step": 86996, "epoch": 2071} {"train_loss": -6.187820911407471, "global_step": 86997, "epoch": 2071} {"train_loss": -6.200594902038574, "global_step": 86998, "epoch": 2071} {"train_loss": -6.087221145629883, "global_step": 86999, "epoch": 2071} {"train_loss": -6.221374034881592, "global_step": 87000, "epoch": 2071} {"train_loss": -6.30588436126709, "global_step": 87001, "epoch": 2071} {"train_loss": -6.091546058654785, "global_step": 87002, "epoch": 2071} {"train_loss": -6.008950710296631, "global_step": 87003, "epoch": 2071} {"train_loss": -6.168532371520996, "global_step": 87004, "epoch": 2071} {"train_loss": -6.092741012573242, "global_step": 87005, "epoch": 2071} {"train_loss": -6.079898357391357, "global_step": 87006, "epoch": 2071} {"train_loss": -6.2631754875183105, "global_step": 87007, "epoch": 2071} {"train_loss": -6.093575477600098, "global_step": 87008, "epoch": 2071} {"train_loss": -6.164660453796387, "global_step": 87009, "epoch": 2071} {"train_loss": -6.187135696411133, "global_step": 87010, "epoch": 2071} {"train_loss": -6.156460285186768, "global_step": 87011, "epoch": 2071} {"train_loss": -6.187258720397949, "global_step": 87012, "epoch": 2071} {"train_loss": -6.0758376121521, "global_step": 87013, "epoch": 2071} {"train_loss": -6.2788591384887695, "global_step": 87014, "epoch": 2071} {"train_loss": -6.1851701736450195, "global_step": 87015, "epoch": 2071} {"train_loss": -6.167032241821289, "global_step": 87016, "epoch": 2071} {"train_loss": -6.119485855102539, "global_step": 87017, "epoch": 2071} {"train_loss": -6.119508266448975, "global_step": 87018, "epoch": 2071} {"train_loss": -6.16037654876709, "global_step": 87019, "epoch": 2071} {"train_loss": -6.198909282684326, "global_step": 87020, "epoch": 2071} {"train_loss": -6.121531963348389, "global_step": 87021, "epoch": 2071} {"train_loss": -6.200072765350342, "global_step": 87022, "epoch": 2071} {"train_loss": -6.164041451045445, "global_step": 87023, "epoch": 2071, "val_loss": 75504.5390625} {"train_loss": -6.17466926574707, "global_step": 87024, "epoch": 2072} {"train_loss": -6.304854393005371, "global_step": 87025, "epoch": 2072} {"train_loss": -6.121763706207275, "global_step": 87026, "epoch": 2072} {"train_loss": -6.233731269836426, "global_step": 87027, "epoch": 2072} {"train_loss": -6.359354019165039, "global_step": 87028, "epoch": 2072} {"train_loss": -6.250729560852051, "global_step": 87029, "epoch": 2072} {"train_loss": -6.1852641105651855, "global_step": 87030, "epoch": 2072} {"train_loss": -6.126680374145508, "global_step": 87031, "epoch": 2072} {"train_loss": -6.253061771392822, "global_step": 87032, "epoch": 2072} {"train_loss": -6.2802276611328125, "global_step": 87033, "epoch": 2072} {"train_loss": -6.3735246658325195, "global_step": 87034, "epoch": 2072} {"train_loss": -6.192899703979492, "global_step": 87035, "epoch": 2072} {"train_loss": -6.303056716918945, "global_step": 87036, "epoch": 2072} {"train_loss": -6.21878719329834, "global_step": 87037, "epoch": 2072} {"train_loss": -6.123823642730713, "global_step": 87038, "epoch": 2072} {"train_loss": -6.20643949508667, "global_step": 87039, "epoch": 2072} {"train_loss": -6.291872501373291, "global_step": 87040, "epoch": 2072} {"train_loss": -6.222012996673584, "global_step": 87041, "epoch": 2072} {"train_loss": -6.137932300567627, "global_step": 87042, "epoch": 2072} {"train_loss": -6.203230381011963, "global_step": 87043, "epoch": 2072} {"train_loss": -6.230185508728027, "global_step": 87044, "epoch": 2072} {"train_loss": -6.165739059448242, "global_step": 87045, "epoch": 2072} {"train_loss": -6.26704216003418, "global_step": 87046, "epoch": 2072} {"train_loss": -6.154614448547363, "global_step": 87047, "epoch": 2072} {"train_loss": -6.264497756958008, "global_step": 87048, "epoch": 2072} {"train_loss": -6.354988098144531, "global_step": 87049, "epoch": 2072} {"train_loss": -6.112856864929199, "global_step": 87050, "epoch": 2072} {"train_loss": -6.203212738037109, "global_step": 87051, "epoch": 2072} {"train_loss": -6.199451446533203, "global_step": 87052, "epoch": 2072} {"train_loss": -6.262872695922852, "global_step": 87053, "epoch": 2072} {"train_loss": -6.07784366607666, "global_step": 87054, "epoch": 2072} {"train_loss": -6.12922477722168, "global_step": 87055, "epoch": 2072} {"train_loss": -6.215521812438965, "global_step": 87056, "epoch": 2072} {"train_loss": -6.207397937774658, "global_step": 87057, "epoch": 2072} {"train_loss": -6.268335342407227, "global_step": 87058, "epoch": 2072} {"train_loss": -6.196000099182129, "global_step": 87059, "epoch": 2072} {"train_loss": -6.175508499145508, "global_step": 87060, "epoch": 2072} {"train_loss": -6.350467205047607, "global_step": 87061, "epoch": 2072} {"train_loss": -6.203084945678711, "global_step": 87062, "epoch": 2072} {"train_loss": -6.227394104003906, "global_step": 87063, "epoch": 2072} {"train_loss": -6.290727615356445, "global_step": 87064, "epoch": 2072} {"train_loss": -6.22401609874907, "global_step": 87065, "epoch": 2072, "val_loss": 75060.6796875} {"train_loss": -6.251626968383789, "global_step": 87066, "epoch": 2073} {"train_loss": -6.390407562255859, "global_step": 87067, "epoch": 2073} {"train_loss": -6.31389045715332, "global_step": 87068, "epoch": 2073} {"train_loss": -6.200555801391602, "global_step": 87069, "epoch": 2073} {"train_loss": -6.274258136749268, "global_step": 87070, "epoch": 2073} {"train_loss": -6.057395935058594, "global_step": 87071, "epoch": 2073} {"train_loss": -6.0674543380737305, "global_step": 87072, "epoch": 2073} {"train_loss": -6.260093688964844, "global_step": 87073, "epoch": 2073} {"train_loss": -6.162415504455566, "global_step": 87074, "epoch": 2073} {"train_loss": -6.1265339851379395, "global_step": 87075, "epoch": 2073} {"train_loss": -6.188298225402832, "global_step": 87076, "epoch": 2073} {"train_loss": -6.019062042236328, "global_step": 87077, "epoch": 2073} {"train_loss": -6.212296485900879, "global_step": 87078, "epoch": 2073} {"train_loss": -6.149245262145996, "global_step": 87079, "epoch": 2073} {"train_loss": -6.2050981521606445, "global_step": 87080, "epoch": 2073} {"train_loss": -6.185359001159668, "global_step": 87081, "epoch": 2073} {"train_loss": -6.00294303894043, "global_step": 87082, "epoch": 2073} {"train_loss": -6.15256929397583, "global_step": 87083, "epoch": 2073} {"train_loss": -6.194023132324219, "global_step": 87084, "epoch": 2073} {"train_loss": -6.13166618347168, "global_step": 87085, "epoch": 2073} {"train_loss": -6.192795753479004, "global_step": 87086, "epoch": 2073} {"train_loss": -6.262343406677246, "global_step": 87087, "epoch": 2073} {"train_loss": -6.092061519622803, "global_step": 87088, "epoch": 2073} {"train_loss": -6.226722717285156, "global_step": 87089, "epoch": 2073} {"train_loss": -6.17078971862793, "global_step": 87090, "epoch": 2073} {"train_loss": -6.150093078613281, "global_step": 87091, "epoch": 2073} {"train_loss": -6.291984558105469, "global_step": 87092, "epoch": 2073} {"train_loss": -6.197830677032471, "global_step": 87093, "epoch": 2073} {"train_loss": -6.200997352600098, "global_step": 87094, "epoch": 2073} {"train_loss": -6.096243858337402, "global_step": 87095, "epoch": 2073} {"train_loss": -6.242268085479736, "global_step": 87096, "epoch": 2073} {"train_loss": -6.303676128387451, "global_step": 87097, "epoch": 2073} {"train_loss": -6.238777160644531, "global_step": 87098, "epoch": 2073} {"train_loss": -6.02229642868042, "global_step": 87099, "epoch": 2073} {"train_loss": -6.264308929443359, "global_step": 87100, "epoch": 2073} {"train_loss": -6.024717330932617, "global_step": 87101, "epoch": 2073} {"train_loss": -6.225886344909668, "global_step": 87102, "epoch": 2073} {"train_loss": -6.148416996002197, "global_step": 87103, "epoch": 2073} {"train_loss": -6.16523551940918, "global_step": 87104, "epoch": 2073} {"train_loss": -6.221027374267578, "global_step": 87105, "epoch": 2073} {"train_loss": -6.19376277923584, "global_step": 87106, "epoch": 2073} {"train_loss": -6.183895576567877, "global_step": 87107, "epoch": 2073, "val_loss": 75010.734375} {"train_loss": -6.181244373321533, "global_step": 87108, "epoch": 2074} {"train_loss": -6.123291015625, "global_step": 87109, "epoch": 2074} {"train_loss": -6.331588268280029, "global_step": 87110, "epoch": 2074} {"train_loss": -6.195910453796387, "global_step": 87111, "epoch": 2074} {"train_loss": -6.333271026611328, "global_step": 87112, "epoch": 2074} {"train_loss": -6.265014171600342, "global_step": 87113, "epoch": 2074} {"train_loss": -6.203088283538818, "global_step": 87114, "epoch": 2074} {"train_loss": -6.181044101715088, "global_step": 87115, "epoch": 2074} {"train_loss": -6.169057846069336, "global_step": 87116, "epoch": 2074} {"train_loss": -6.171945571899414, "global_step": 87117, "epoch": 2074} {"train_loss": -6.173227787017822, "global_step": 87118, "epoch": 2074} {"train_loss": -6.181561470031738, "global_step": 87119, "epoch": 2074} {"train_loss": -6.248814105987549, "global_step": 87120, "epoch": 2074} {"train_loss": -6.2613205909729, "global_step": 87121, "epoch": 2074} {"train_loss": -6.116555690765381, "global_step": 87122, "epoch": 2074} {"train_loss": -6.140681266784668, "global_step": 87123, "epoch": 2074} {"train_loss": -6.185833930969238, "global_step": 87124, "epoch": 2074} {"train_loss": -6.288174152374268, "global_step": 87125, "epoch": 2074} {"train_loss": -6.105152130126953, "global_step": 87126, "epoch": 2074} {"train_loss": -6.106779098510742, "global_step": 87127, "epoch": 2074} {"train_loss": -6.2259039878845215, "global_step": 87128, "epoch": 2074} {"train_loss": -6.132040977478027, "global_step": 87129, "epoch": 2074} {"train_loss": -6.234058380126953, "global_step": 87130, "epoch": 2074} {"train_loss": -6.280611991882324, "global_step": 87131, "epoch": 2074} {"train_loss": -6.262791633605957, "global_step": 87132, "epoch": 2074} {"train_loss": -6.217989921569824, "global_step": 87133, "epoch": 2074} {"train_loss": -6.214363098144531, "global_step": 87134, "epoch": 2074} {"train_loss": -6.2191877365112305, "global_step": 87135, "epoch": 2074} {"train_loss": -6.182685852050781, "global_step": 87136, "epoch": 2074} {"train_loss": -6.289758682250977, "global_step": 87137, "epoch": 2074} {"train_loss": -6.299630165100098, "global_step": 87138, "epoch": 2074} {"train_loss": -6.186474800109863, "global_step": 87139, "epoch": 2074} {"train_loss": -6.193145751953125, "global_step": 87140, "epoch": 2074} {"train_loss": -6.257008075714111, "global_step": 87141, "epoch": 2074} {"train_loss": -6.270625591278076, "global_step": 87142, "epoch": 2074} {"train_loss": -6.295127868652344, "global_step": 87143, "epoch": 2074} {"train_loss": -6.108793258666992, "global_step": 87144, "epoch": 2074} {"train_loss": -6.197244167327881, "global_step": 87145, "epoch": 2074} {"train_loss": -6.24788236618042, "global_step": 87146, "epoch": 2074} {"train_loss": -6.222780704498291, "global_step": 87147, "epoch": 2074} {"train_loss": -6.263680934906006, "global_step": 87148, "epoch": 2074} {"train_loss": -6.214763300759452, "global_step": 87149, "epoch": 2074, "val_loss": 75422.3125} {"train_loss": -6.165693283081055, "global_step": 87150, "epoch": 2075} {"train_loss": -6.175105094909668, "global_step": 87151, "epoch": 2075} {"train_loss": -6.222100734710693, "global_step": 87152, "epoch": 2075} {"train_loss": -6.25411319732666, "global_step": 87153, "epoch": 2075} {"train_loss": -6.241919994354248, "global_step": 87154, "epoch": 2075} {"train_loss": -6.274318218231201, "global_step": 87155, "epoch": 2075} {"train_loss": -6.193105697631836, "global_step": 87156, "epoch": 2075} {"train_loss": -6.237669944763184, "global_step": 87157, "epoch": 2075} {"train_loss": -6.202045917510986, "global_step": 87158, "epoch": 2075} {"train_loss": -6.263025283813477, "global_step": 87159, "epoch": 2075} {"train_loss": -6.165290355682373, "global_step": 87160, "epoch": 2075} {"train_loss": -6.187143802642822, "global_step": 87161, "epoch": 2075} {"train_loss": -6.230608940124512, "global_step": 87162, "epoch": 2075} {"train_loss": -6.1247944831848145, "global_step": 87163, "epoch": 2075} {"train_loss": -6.125652313232422, "global_step": 87164, "epoch": 2075} {"train_loss": -6.186763286590576, "global_step": 87165, "epoch": 2075} {"train_loss": -6.244837284088135, "global_step": 87166, "epoch": 2075} {"train_loss": -6.2725443840026855, "global_step": 87167, "epoch": 2075} {"train_loss": -6.127211570739746, "global_step": 87168, "epoch": 2075} {"train_loss": -6.132477760314941, "global_step": 87169, "epoch": 2075} {"train_loss": -6.18357515335083, "global_step": 87170, "epoch": 2075} {"train_loss": -5.995404243469238, "global_step": 87171, "epoch": 2075} {"train_loss": -6.2048540115356445, "global_step": 87172, "epoch": 2075} {"train_loss": -6.110824108123779, "global_step": 87173, "epoch": 2075} {"train_loss": -6.315279960632324, "global_step": 87174, "epoch": 2075} {"train_loss": -6.132360458374023, "global_step": 87175, "epoch": 2075} {"train_loss": -6.243936538696289, "global_step": 87176, "epoch": 2075} {"train_loss": -6.185323715209961, "global_step": 87177, "epoch": 2075} {"train_loss": -6.141345977783203, "global_step": 87178, "epoch": 2075} {"train_loss": -6.173634052276611, "global_step": 87179, "epoch": 2075} {"train_loss": -6.185565948486328, "global_step": 87180, "epoch": 2075} {"train_loss": -6.2492852210998535, "global_step": 87181, "epoch": 2075} {"train_loss": -6.327583312988281, "global_step": 87182, "epoch": 2075} {"train_loss": -6.151459693908691, "global_step": 87183, "epoch": 2075} {"train_loss": -6.223293304443359, "global_step": 87184, "epoch": 2075} {"train_loss": -6.309426307678223, "global_step": 87185, "epoch": 2075} {"train_loss": -6.308367729187012, "global_step": 87186, "epoch": 2075} {"train_loss": -6.330716609954834, "global_step": 87187, "epoch": 2075} {"train_loss": -6.174167633056641, "global_step": 87188, "epoch": 2075} {"train_loss": -6.204320907592773, "global_step": 87189, "epoch": 2075} {"train_loss": -6.175406455993652, "global_step": 87190, "epoch": 2075} {"train_loss": -6.202984469277518, "global_step": 87191, "epoch": 2075, "val_loss": 75302.234375} {"train_loss": -6.2642822265625, "global_step": 87192, "epoch": 2076} {"train_loss": -6.266231536865234, "global_step": 87193, "epoch": 2076} {"train_loss": -6.24681282043457, "global_step": 87194, "epoch": 2076} {"train_loss": -6.272384166717529, "global_step": 87195, "epoch": 2076} {"train_loss": -6.221074104309082, "global_step": 87196, "epoch": 2076} {"train_loss": -6.22096061706543, "global_step": 87197, "epoch": 2076} {"train_loss": -6.330027103424072, "global_step": 87198, "epoch": 2076} {"train_loss": -6.220001220703125, "global_step": 87199, "epoch": 2076} {"train_loss": -6.205780029296875, "global_step": 87200, "epoch": 2076} {"train_loss": -6.246225357055664, "global_step": 87201, "epoch": 2076} {"train_loss": -6.219322681427002, "global_step": 87202, "epoch": 2076} {"train_loss": -6.2021026611328125, "global_step": 87203, "epoch": 2076} {"train_loss": -6.222064971923828, "global_step": 87204, "epoch": 2076} {"train_loss": -6.2700605392456055, "global_step": 87205, "epoch": 2076} {"train_loss": -6.257184982299805, "global_step": 87206, "epoch": 2076} {"train_loss": -6.292388916015625, "global_step": 87207, "epoch": 2076} {"train_loss": -6.178772926330566, "global_step": 87208, "epoch": 2076} {"train_loss": -6.146796226501465, "global_step": 87209, "epoch": 2076} {"train_loss": -6.316343307495117, "global_step": 87210, "epoch": 2076} {"train_loss": -6.161269187927246, "global_step": 87211, "epoch": 2076} {"train_loss": -6.157737731933594, "global_step": 87212, "epoch": 2076} {"train_loss": -6.14640998840332, "global_step": 87213, "epoch": 2076} {"train_loss": -6.099926471710205, "global_step": 87214, "epoch": 2076} {"train_loss": -6.20818567276001, "global_step": 87215, "epoch": 2076} {"train_loss": -6.141474723815918, "global_step": 87216, "epoch": 2076} {"train_loss": -6.3324480056762695, "global_step": 87217, "epoch": 2076} {"train_loss": -6.067456245422363, "global_step": 87218, "epoch": 2076} {"train_loss": -6.1788787841796875, "global_step": 87219, "epoch": 2076} {"train_loss": -6.130059719085693, "global_step": 87220, "epoch": 2076} {"train_loss": -6.111616134643555, "global_step": 87221, "epoch": 2076} {"train_loss": -6.1666579246521, "global_step": 87222, "epoch": 2076} {"train_loss": -6.188546180725098, "global_step": 87223, "epoch": 2076} {"train_loss": -6.212069511413574, "global_step": 87224, "epoch": 2076} {"train_loss": -6.129811763763428, "global_step": 87225, "epoch": 2076} {"train_loss": -6.2003254890441895, "global_step": 87226, "epoch": 2076} {"train_loss": -6.199427127838135, "global_step": 87227, "epoch": 2076} {"train_loss": -6.171664237976074, "global_step": 87228, "epoch": 2076} {"train_loss": -6.283035755157471, "global_step": 87229, "epoch": 2076} {"train_loss": -6.228665351867676, "global_step": 87230, "epoch": 2076} {"train_loss": -6.1079607009887695, "global_step": 87231, "epoch": 2076} {"train_loss": -6.224212646484375, "global_step": 87232, "epoch": 2076} {"train_loss": -6.207325254167829, "global_step": 87233, "epoch": 2076, "val_loss": 75105.8046875} {"train_loss": -6.262162208557129, "global_step": 87234, "epoch": 2077} {"train_loss": -6.220232009887695, "global_step": 87235, "epoch": 2077} {"train_loss": -6.256360054016113, "global_step": 87236, "epoch": 2077} {"train_loss": -6.2247090339660645, "global_step": 87237, "epoch": 2077} {"train_loss": -6.217380523681641, "global_step": 87238, "epoch": 2077} {"train_loss": -6.25167179107666, "global_step": 87239, "epoch": 2077} {"train_loss": -6.209174156188965, "global_step": 87240, "epoch": 2077} {"train_loss": -6.273347854614258, "global_step": 87241, "epoch": 2077} {"train_loss": -6.174592018127441, "global_step": 87242, "epoch": 2077} {"train_loss": -6.192051887512207, "global_step": 87243, "epoch": 2077} {"train_loss": -6.2394208908081055, "global_step": 87244, "epoch": 2077} {"train_loss": -6.098130226135254, "global_step": 87245, "epoch": 2077} {"train_loss": -6.209008693695068, "global_step": 87246, "epoch": 2077} {"train_loss": -6.1484880447387695, "global_step": 87247, "epoch": 2077} {"train_loss": -6.111532211303711, "global_step": 87248, "epoch": 2077} {"train_loss": -6.122706413269043, "global_step": 87249, "epoch": 2077} {"train_loss": -6.254820823669434, "global_step": 87250, "epoch": 2077} {"train_loss": -6.186666488647461, "global_step": 87251, "epoch": 2077} {"train_loss": -6.140803337097168, "global_step": 87252, "epoch": 2077} {"train_loss": -6.228010654449463, "global_step": 87253, "epoch": 2077} {"train_loss": -6.086893558502197, "global_step": 87254, "epoch": 2077} {"train_loss": -6.061605453491211, "global_step": 87255, "epoch": 2077} {"train_loss": -6.10234260559082, "global_step": 87256, "epoch": 2077} {"train_loss": -6.1119489669799805, "global_step": 87257, "epoch": 2077} {"train_loss": -6.19759464263916, "global_step": 87258, "epoch": 2077} {"train_loss": -6.271300315856934, "global_step": 87259, "epoch": 2077} {"train_loss": -6.21069860458374, "global_step": 87260, "epoch": 2077} {"train_loss": -6.227652072906494, "global_step": 87261, "epoch": 2077} {"train_loss": -6.1762919425964355, "global_step": 87262, "epoch": 2077} {"train_loss": -6.183849811553955, "global_step": 87263, "epoch": 2077} {"train_loss": -6.017026901245117, "global_step": 87264, "epoch": 2077} {"train_loss": -6.1218366622924805, "global_step": 87265, "epoch": 2077} {"train_loss": -6.27519416809082, "global_step": 87266, "epoch": 2077} {"train_loss": -6.152299880981445, "global_step": 87267, "epoch": 2077} {"train_loss": -6.17392110824585, "global_step": 87268, "epoch": 2077} {"train_loss": -6.1465325355529785, "global_step": 87269, "epoch": 2077} {"train_loss": -6.237359046936035, "global_step": 87270, "epoch": 2077} {"train_loss": -6.26113224029541, "global_step": 87271, "epoch": 2077} {"train_loss": -6.117615699768066, "global_step": 87272, "epoch": 2077} {"train_loss": -6.115466117858887, "global_step": 87273, "epoch": 2077} {"train_loss": -6.2280049324035645, "global_step": 87274, "epoch": 2077} {"train_loss": -6.184830143338158, "global_step": 87275, "epoch": 2077, "val_loss": 75256.9375} {"train_loss": -6.184722423553467, "global_step": 87276, "epoch": 2078} {"train_loss": -6.296015739440918, "global_step": 87277, "epoch": 2078} {"train_loss": -6.210155963897705, "global_step": 87278, "epoch": 2078} {"train_loss": -6.374819755554199, "global_step": 87279, "epoch": 2078} {"train_loss": -6.311793327331543, "global_step": 87280, "epoch": 2078} {"train_loss": -6.195103645324707, "global_step": 87281, "epoch": 2078} {"train_loss": -6.1967949867248535, "global_step": 87282, "epoch": 2078} {"train_loss": -6.194456100463867, "global_step": 87283, "epoch": 2078} {"train_loss": -6.272430419921875, "global_step": 87284, "epoch": 2078} {"train_loss": -6.350585460662842, "global_step": 87285, "epoch": 2078} {"train_loss": -6.208934783935547, "global_step": 87286, "epoch": 2078} {"train_loss": -6.161450386047363, "global_step": 87287, "epoch": 2078} {"train_loss": -6.172845840454102, "global_step": 87288, "epoch": 2078} {"train_loss": -6.147337436676025, "global_step": 87289, "epoch": 2078} {"train_loss": -6.168299674987793, "global_step": 87290, "epoch": 2078} {"train_loss": -6.278188705444336, "global_step": 87291, "epoch": 2078} {"train_loss": -6.194742202758789, "global_step": 87292, "epoch": 2078} {"train_loss": -6.347958564758301, "global_step": 87293, "epoch": 2078} {"train_loss": -6.26829195022583, "global_step": 87294, "epoch": 2078} {"train_loss": -6.138166427612305, "global_step": 87295, "epoch": 2078} {"train_loss": -6.2395477294921875, "global_step": 87296, "epoch": 2078} {"train_loss": -6.205050945281982, "global_step": 87297, "epoch": 2078} {"train_loss": -6.27348518371582, "global_step": 87298, "epoch": 2078} {"train_loss": -6.195072174072266, "global_step": 87299, "epoch": 2078} {"train_loss": -6.181617259979248, "global_step": 87300, "epoch": 2078} {"train_loss": -6.315667152404785, "global_step": 87301, "epoch": 2078} {"train_loss": -6.175915718078613, "global_step": 87302, "epoch": 2078} {"train_loss": -6.182137489318848, "global_step": 87303, "epoch": 2078} {"train_loss": -6.3413519859313965, "global_step": 87304, "epoch": 2078} {"train_loss": -6.156744956970215, "global_step": 87305, "epoch": 2078} {"train_loss": -6.113077163696289, "global_step": 87306, "epoch": 2078} {"train_loss": -6.266830921173096, "global_step": 87307, "epoch": 2078} {"train_loss": -6.233222961425781, "global_step": 87308, "epoch": 2078} {"train_loss": -6.135058403015137, "global_step": 87309, "epoch": 2078} {"train_loss": -6.269554138183594, "global_step": 87310, "epoch": 2078} {"train_loss": -6.161877155303955, "global_step": 87311, "epoch": 2078} {"train_loss": -6.1811933517456055, "global_step": 87312, "epoch": 2078} {"train_loss": -6.149168491363525, "global_step": 87313, "epoch": 2078} {"train_loss": -6.110274314880371, "global_step": 87314, "epoch": 2078} {"train_loss": -6.204032897949219, "global_step": 87315, "epoch": 2078} {"train_loss": -6.22274923324585, "global_step": 87316, "epoch": 2078} {"train_loss": -6.217366286686489, "global_step": 87317, "epoch": 2078, "val_loss": 75161.6484375} {"train_loss": -6.282183647155762, "global_step": 87318, "epoch": 2079} {"train_loss": -6.149827003479004, "global_step": 87319, "epoch": 2079} {"train_loss": -6.244698524475098, "global_step": 87320, "epoch": 2079} {"train_loss": -6.227846145629883, "global_step": 87321, "epoch": 2079} {"train_loss": -6.164292335510254, "global_step": 87322, "epoch": 2079} {"train_loss": -6.261814117431641, "global_step": 87323, "epoch": 2079} {"train_loss": -6.170559406280518, "global_step": 87324, "epoch": 2079} {"train_loss": -6.127280235290527, "global_step": 87325, "epoch": 2079} {"train_loss": -6.29136323928833, "global_step": 87326, "epoch": 2079} {"train_loss": -6.226465702056885, "global_step": 87327, "epoch": 2079} {"train_loss": -6.3633928298950195, "global_step": 87328, "epoch": 2079} {"train_loss": -6.315981388092041, "global_step": 87329, "epoch": 2079} {"train_loss": -6.164064407348633, "global_step": 87330, "epoch": 2079} {"train_loss": -6.140219211578369, "global_step": 87331, "epoch": 2079} {"train_loss": -6.155810356140137, "global_step": 87332, "epoch": 2079} {"train_loss": -6.266688823699951, "global_step": 87333, "epoch": 2079} {"train_loss": -6.130695343017578, "global_step": 87334, "epoch": 2079} {"train_loss": -6.240240097045898, "global_step": 87335, "epoch": 2079} {"train_loss": -6.1757330894470215, "global_step": 87336, "epoch": 2079} {"train_loss": -6.266960144042969, "global_step": 87337, "epoch": 2079} {"train_loss": -6.127139568328857, "global_step": 87338, "epoch": 2079} {"train_loss": -6.242885589599609, "global_step": 87339, "epoch": 2079} {"train_loss": -6.188066482543945, "global_step": 87340, "epoch": 2079} {"train_loss": -6.1108245849609375, "global_step": 87341, "epoch": 2079} {"train_loss": -6.160153388977051, "global_step": 87342, "epoch": 2079} {"train_loss": -6.190001487731934, "global_step": 87343, "epoch": 2079} {"train_loss": -6.2383527755737305, "global_step": 87344, "epoch": 2079} {"train_loss": -6.271206855773926, "global_step": 87345, "epoch": 2079} {"train_loss": -6.032227993011475, "global_step": 87346, "epoch": 2079} {"train_loss": -6.1779937744140625, "global_step": 87347, "epoch": 2079} {"train_loss": -6.080378532409668, "global_step": 87348, "epoch": 2079} {"train_loss": -6.142331123352051, "global_step": 87349, "epoch": 2079} {"train_loss": -6.153977394104004, "global_step": 87350, "epoch": 2079} {"train_loss": -6.200843334197998, "global_step": 87351, "epoch": 2079} {"train_loss": -6.184358596801758, "global_step": 87352, "epoch": 2079} {"train_loss": -6.242071628570557, "global_step": 87353, "epoch": 2079} {"train_loss": -6.355160713195801, "global_step": 87354, "epoch": 2079} {"train_loss": -6.140203475952148, "global_step": 87355, "epoch": 2079} {"train_loss": -6.076155662536621, "global_step": 87356, "epoch": 2079} {"train_loss": -6.170121192932129, "global_step": 87357, "epoch": 2079} {"train_loss": -6.096534729003906, "global_step": 87358, "epoch": 2079} {"train_loss": -6.19604366166251, "global_step": 87359, "epoch": 2079, "val_loss": 75740.2734375} {"train_loss": -6.0866522789001465, "global_step": 87360, "epoch": 2080} {"train_loss": -6.209451675415039, "global_step": 87361, "epoch": 2080} {"train_loss": -6.185325622558594, "global_step": 87362, "epoch": 2080} {"train_loss": -5.987675666809082, "global_step": 87363, "epoch": 2080} {"train_loss": -6.1627068519592285, "global_step": 87364, "epoch": 2080} {"train_loss": -6.096010208129883, "global_step": 87365, "epoch": 2080} {"train_loss": -6.1246256828308105, "global_step": 87366, "epoch": 2080} {"train_loss": -6.228976726531982, "global_step": 87367, "epoch": 2080} {"train_loss": -6.148684024810791, "global_step": 87368, "epoch": 2080} {"train_loss": -6.215297698974609, "global_step": 87369, "epoch": 2080} {"train_loss": -6.1586408615112305, "global_step": 87370, "epoch": 2080} {"train_loss": -6.254888534545898, "global_step": 87371, "epoch": 2080} {"train_loss": -6.179457664489746, "global_step": 87372, "epoch": 2080} {"train_loss": -6.094178199768066, "global_step": 87373, "epoch": 2080} {"train_loss": -6.268257141113281, "global_step": 87374, "epoch": 2080} {"train_loss": -6.165524482727051, "global_step": 87375, "epoch": 2080} {"train_loss": -6.314917087554932, "global_step": 87376, "epoch": 2080} {"train_loss": -6.256016731262207, "global_step": 87377, "epoch": 2080} {"train_loss": -6.233279228210449, "global_step": 87378, "epoch": 2080} {"train_loss": -6.339712619781494, "global_step": 87379, "epoch": 2080} {"train_loss": -6.202951431274414, "global_step": 87380, "epoch": 2080} {"train_loss": -6.27323055267334, "global_step": 87381, "epoch": 2080} {"train_loss": -6.21475076675415, "global_step": 87382, "epoch": 2080} {"train_loss": -6.343387603759766, "global_step": 87383, "epoch": 2080} {"train_loss": -6.272426128387451, "global_step": 87384, "epoch": 2080} {"train_loss": -6.3226776123046875, "global_step": 87385, "epoch": 2080} {"train_loss": -6.197014808654785, "global_step": 87386, "epoch": 2080} {"train_loss": -6.236080646514893, "global_step": 87387, "epoch": 2080} {"train_loss": -6.2395219802856445, "global_step": 87388, "epoch": 2080} {"train_loss": -6.200139999389648, "global_step": 87389, "epoch": 2080} {"train_loss": -6.083288192749023, "global_step": 87390, "epoch": 2080} {"train_loss": -6.195728302001953, "global_step": 87391, "epoch": 2080} {"train_loss": -6.200827121734619, "global_step": 87392, "epoch": 2080} {"train_loss": -6.287126541137695, "global_step": 87393, "epoch": 2080} {"train_loss": -6.073663234710693, "global_step": 87394, "epoch": 2080} {"train_loss": -6.141388893127441, "global_step": 87395, "epoch": 2080} {"train_loss": -6.128203392028809, "global_step": 87396, "epoch": 2080} {"train_loss": -6.166292190551758, "global_step": 87397, "epoch": 2080} {"train_loss": -6.14351749420166, "global_step": 87398, "epoch": 2080} {"train_loss": -6.239696025848389, "global_step": 87399, "epoch": 2080} {"train_loss": -6.182293891906738, "global_step": 87400, "epoch": 2080} {"train_loss": -6.195924134481521, "global_step": 87401, "epoch": 2080, "val_loss": 75306.0390625} {"train_loss": -6.2528862953186035, "global_step": 87402, "epoch": 2081} {"train_loss": -6.221268653869629, "global_step": 87403, "epoch": 2081} {"train_loss": -6.074006080627441, "global_step": 87404, "epoch": 2081} {"train_loss": -6.277519226074219, "global_step": 87405, "epoch": 2081} {"train_loss": -6.175868511199951, "global_step": 87406, "epoch": 2081} {"train_loss": -6.191023826599121, "global_step": 87407, "epoch": 2081} {"train_loss": -6.349769115447998, "global_step": 87408, "epoch": 2081} {"train_loss": -6.050676345825195, "global_step": 87409, "epoch": 2081} {"train_loss": -6.230694770812988, "global_step": 87410, "epoch": 2081} {"train_loss": -6.126758575439453, "global_step": 87411, "epoch": 2081} {"train_loss": -6.202406883239746, "global_step": 87412, "epoch": 2081} {"train_loss": -6.347841262817383, "global_step": 87413, "epoch": 2081} {"train_loss": -6.184151649475098, "global_step": 87414, "epoch": 2081} {"train_loss": -6.352561950683594, "global_step": 87415, "epoch": 2081} {"train_loss": -6.0823564529418945, "global_step": 87416, "epoch": 2081} {"train_loss": -6.197042465209961, "global_step": 87417, "epoch": 2081} {"train_loss": -6.093083381652832, "global_step": 87418, "epoch": 2081} {"train_loss": -6.212346076965332, "global_step": 87419, "epoch": 2081} {"train_loss": -6.294559478759766, "global_step": 87420, "epoch": 2081} {"train_loss": -6.156556606292725, "global_step": 87421, "epoch": 2081} {"train_loss": -6.096220970153809, "global_step": 87422, "epoch": 2081} {"train_loss": -6.248722553253174, "global_step": 87423, "epoch": 2081} {"train_loss": -6.173672676086426, "global_step": 87424, "epoch": 2081} {"train_loss": -6.142126083374023, "global_step": 87425, "epoch": 2081} {"train_loss": -6.323368549346924, "global_step": 87426, "epoch": 2081} {"train_loss": -6.0794453620910645, "global_step": 87427, "epoch": 2081} {"train_loss": -6.242267608642578, "global_step": 87428, "epoch": 2081} {"train_loss": -6.246125221252441, "global_step": 87429, "epoch": 2081} {"train_loss": -6.076652526855469, "global_step": 87430, "epoch": 2081} {"train_loss": -6.155773639678955, "global_step": 87431, "epoch": 2081} {"train_loss": -6.172889709472656, "global_step": 87432, "epoch": 2081} {"train_loss": -6.088996887207031, "global_step": 87433, "epoch": 2081} {"train_loss": -6.160703659057617, "global_step": 87434, "epoch": 2081} {"train_loss": -6.194034576416016, "global_step": 87435, "epoch": 2081} {"train_loss": -6.1306352615356445, "global_step": 87436, "epoch": 2081} {"train_loss": -5.9725141525268555, "global_step": 87437, "epoch": 2081} {"train_loss": -6.215192794799805, "global_step": 87438, "epoch": 2081} {"train_loss": -6.053988456726074, "global_step": 87439, "epoch": 2081} {"train_loss": -6.052966117858887, "global_step": 87440, "epoch": 2081} {"train_loss": -6.108842849731445, "global_step": 87441, "epoch": 2081} {"train_loss": -6.147006034851074, "global_step": 87442, "epoch": 2081} {"train_loss": -6.174988837469192, "global_step": 87443, "epoch": 2081, "val_loss": 75109.5078125} {"train_loss": -6.139219760894775, "global_step": 87444, "epoch": 2082} {"train_loss": -6.260857582092285, "global_step": 87445, "epoch": 2082} {"train_loss": -6.135697364807129, "global_step": 87446, "epoch": 2082} {"train_loss": -6.241172790527344, "global_step": 87447, "epoch": 2082} {"train_loss": -6.244682312011719, "global_step": 87448, "epoch": 2082} {"train_loss": -6.028741836547852, "global_step": 87449, "epoch": 2082} {"train_loss": -6.098140716552734, "global_step": 87450, "epoch": 2082} {"train_loss": -6.191503524780273, "global_step": 87451, "epoch": 2082} {"train_loss": -6.190489292144775, "global_step": 87452, "epoch": 2082} {"train_loss": -6.228843688964844, "global_step": 87453, "epoch": 2082} {"train_loss": -6.16792106628418, "global_step": 87454, "epoch": 2082} {"train_loss": -6.254255294799805, "global_step": 87455, "epoch": 2082} {"train_loss": -6.196742057800293, "global_step": 87456, "epoch": 2082} {"train_loss": -6.279772758483887, "global_step": 87457, "epoch": 2082} {"train_loss": -6.342044830322266, "global_step": 87458, "epoch": 2082} {"train_loss": -6.107087135314941, "global_step": 87459, "epoch": 2082} {"train_loss": -6.198805332183838, "global_step": 87460, "epoch": 2082} {"train_loss": -6.369260787963867, "global_step": 87461, "epoch": 2082} {"train_loss": -6.294575214385986, "global_step": 87462, "epoch": 2082} {"train_loss": -6.217436790466309, "global_step": 87463, "epoch": 2082} {"train_loss": -6.146280288696289, "global_step": 87464, "epoch": 2082} {"train_loss": -6.219431400299072, "global_step": 87465, "epoch": 2082} {"train_loss": -6.370143890380859, "global_step": 87466, "epoch": 2082} {"train_loss": -6.298867225646973, "global_step": 87467, "epoch": 2082} {"train_loss": -6.027245998382568, "global_step": 87468, "epoch": 2082} {"train_loss": -6.228953838348389, "global_step": 87469, "epoch": 2082} {"train_loss": -6.219028949737549, "global_step": 87470, "epoch": 2082} {"train_loss": -6.1507978439331055, "global_step": 87471, "epoch": 2082} {"train_loss": -6.202777862548828, "global_step": 87472, "epoch": 2082} {"train_loss": -6.3124566078186035, "global_step": 87473, "epoch": 2082} {"train_loss": -6.066471576690674, "global_step": 87474, "epoch": 2082} {"train_loss": -6.2448577880859375, "global_step": 87475, "epoch": 2082} {"train_loss": -6.162235260009766, "global_step": 87476, "epoch": 2082} {"train_loss": -6.138659954071045, "global_step": 87477, "epoch": 2082} {"train_loss": -6.16325569152832, "global_step": 87478, "epoch": 2082} {"train_loss": -6.199835777282715, "global_step": 87479, "epoch": 2082} {"train_loss": -6.217791557312012, "global_step": 87480, "epoch": 2082} {"train_loss": -6.147207736968994, "global_step": 87481, "epoch": 2082} {"train_loss": -6.111554145812988, "global_step": 87482, "epoch": 2082} {"train_loss": -6.220183849334717, "global_step": 87483, "epoch": 2082} {"train_loss": -6.2774434089660645, "global_step": 87484, "epoch": 2082} {"train_loss": -6.2046594733283635, "global_step": 87485, "epoch": 2082, "val_loss": 75089.734375} {"train_loss": -6.219210624694824, "global_step": 87486, "epoch": 2083} {"train_loss": -6.273312091827393, "global_step": 87487, "epoch": 2083} {"train_loss": -6.199991703033447, "global_step": 87488, "epoch": 2083} {"train_loss": -6.242806434631348, "global_step": 87489, "epoch": 2083} {"train_loss": -6.229270935058594, "global_step": 87490, "epoch": 2083} {"train_loss": -6.1797685623168945, "global_step": 87491, "epoch": 2083} {"train_loss": -6.333243370056152, "global_step": 87492, "epoch": 2083} {"train_loss": -6.097893238067627, "global_step": 87493, "epoch": 2083} {"train_loss": -6.118086814880371, "global_step": 87494, "epoch": 2083} {"train_loss": -6.225914001464844, "global_step": 87495, "epoch": 2083} {"train_loss": -6.100316047668457, "global_step": 87496, "epoch": 2083} {"train_loss": -6.289076328277588, "global_step": 87497, "epoch": 2083} {"train_loss": -6.242905616760254, "global_step": 87498, "epoch": 2083} {"train_loss": -6.07021951675415, "global_step": 87499, "epoch": 2083} {"train_loss": -6.307873725891113, "global_step": 87500, "epoch": 2083} {"train_loss": -6.1857757568359375, "global_step": 87501, "epoch": 2083} {"train_loss": -6.147272109985352, "global_step": 87502, "epoch": 2083} {"train_loss": -6.303916931152344, "global_step": 87503, "epoch": 2083} {"train_loss": -6.1129889488220215, "global_step": 87504, "epoch": 2083} {"train_loss": -6.2679338455200195, "global_step": 87505, "epoch": 2083} {"train_loss": -6.289818286895752, "global_step": 87506, "epoch": 2083} {"train_loss": -6.242371559143066, "global_step": 87507, "epoch": 2083} {"train_loss": -6.113005638122559, "global_step": 87508, "epoch": 2083} {"train_loss": -6.218014717102051, "global_step": 87509, "epoch": 2083} {"train_loss": -6.207392692565918, "global_step": 87510, "epoch": 2083} {"train_loss": -6.218949317932129, "global_step": 87511, "epoch": 2083} {"train_loss": -6.186083793640137, "global_step": 87512, "epoch": 2083} {"train_loss": -6.201127052307129, "global_step": 87513, "epoch": 2083} {"train_loss": -6.148260116577148, "global_step": 87514, "epoch": 2083} {"train_loss": -6.19520378112793, "global_step": 87515, "epoch": 2083} {"train_loss": -6.193671226501465, "global_step": 87516, "epoch": 2083} {"train_loss": -6.261582374572754, "global_step": 87517, "epoch": 2083} {"train_loss": -6.16616678237915, "global_step": 87518, "epoch": 2083} {"train_loss": -6.148045539855957, "global_step": 87519, "epoch": 2083} {"train_loss": -6.184317588806152, "global_step": 87520, "epoch": 2083} {"train_loss": -6.206014633178711, "global_step": 87521, "epoch": 2083} {"train_loss": -6.270205497741699, "global_step": 87522, "epoch": 2083} {"train_loss": -6.191636085510254, "global_step": 87523, "epoch": 2083} {"train_loss": -6.331762313842773, "global_step": 87524, "epoch": 2083} {"train_loss": -6.234798908233643, "global_step": 87525, "epoch": 2083} {"train_loss": -6.124730110168457, "global_step": 87526, "epoch": 2083} {"train_loss": -6.204886141277495, "global_step": 87527, "epoch": 2083, "val_loss": 75206.6015625} {"train_loss": -6.141061782836914, "global_step": 87528, "epoch": 2084} {"train_loss": -6.277244567871094, "global_step": 87529, "epoch": 2084} {"train_loss": -6.195113182067871, "global_step": 87530, "epoch": 2084} {"train_loss": -6.27928352355957, "global_step": 87531, "epoch": 2084} {"train_loss": -6.151687145233154, "global_step": 87532, "epoch": 2084} {"train_loss": -6.2678937911987305, "global_step": 87533, "epoch": 2084} {"train_loss": -6.244421005249023, "global_step": 87534, "epoch": 2084} {"train_loss": -6.117154121398926, "global_step": 87535, "epoch": 2084} {"train_loss": -6.197072982788086, "global_step": 87536, "epoch": 2084} {"train_loss": -6.300070285797119, "global_step": 87537, "epoch": 2084} {"train_loss": -6.298964977264404, "global_step": 87538, "epoch": 2084} {"train_loss": -6.29482364654541, "global_step": 87539, "epoch": 2084} {"train_loss": -6.169851303100586, "global_step": 87540, "epoch": 2084} {"train_loss": -6.297128200531006, "global_step": 87541, "epoch": 2084} {"train_loss": -6.283642292022705, "global_step": 87542, "epoch": 2084} {"train_loss": -6.234394073486328, "global_step": 87543, "epoch": 2084} {"train_loss": -6.274653911590576, "global_step": 87544, "epoch": 2084} {"train_loss": -6.244598388671875, "global_step": 87545, "epoch": 2084} {"train_loss": -6.195487022399902, "global_step": 87546, "epoch": 2084} {"train_loss": -6.073841571807861, "global_step": 87547, "epoch": 2084} {"train_loss": -6.127253532409668, "global_step": 87548, "epoch": 2084} {"train_loss": -6.080045700073242, "global_step": 87549, "epoch": 2084} {"train_loss": -6.318298816680908, "global_step": 87550, "epoch": 2084} {"train_loss": -6.192761421203613, "global_step": 87551, "epoch": 2084} {"train_loss": -6.2040300369262695, "global_step": 87552, "epoch": 2084} {"train_loss": -6.172991752624512, "global_step": 87553, "epoch": 2084} {"train_loss": -6.263982772827148, "global_step": 87554, "epoch": 2084} {"train_loss": -6.25246524810791, "global_step": 87555, "epoch": 2084} {"train_loss": -6.252595901489258, "global_step": 87556, "epoch": 2084} {"train_loss": -6.359412670135498, "global_step": 87557, "epoch": 2084} {"train_loss": -6.260818958282471, "global_step": 87558, "epoch": 2084} {"train_loss": -6.217583656311035, "global_step": 87559, "epoch": 2084} {"train_loss": -6.2412872314453125, "global_step": 87560, "epoch": 2084} {"train_loss": -6.285028457641602, "global_step": 87561, "epoch": 2084} {"train_loss": -6.310757637023926, "global_step": 87562, "epoch": 2084} {"train_loss": -6.225959300994873, "global_step": 87563, "epoch": 2084} {"train_loss": -6.05820369720459, "global_step": 87564, "epoch": 2084} {"train_loss": -6.351885795593262, "global_step": 87565, "epoch": 2084} {"train_loss": -6.27680778503418, "global_step": 87566, "epoch": 2084} {"train_loss": -6.142805099487305, "global_step": 87567, "epoch": 2084} {"train_loss": -6.217512130737305, "global_step": 87568, "epoch": 2084} {"train_loss": -6.226622206824167, "global_step": 87569, "epoch": 2084, "val_loss": 75349.6171875} {"train_loss": -6.157558917999268, "global_step": 87570, "epoch": 2085} {"train_loss": -6.29860782623291, "global_step": 87571, "epoch": 2085} {"train_loss": -6.216518402099609, "global_step": 87572, "epoch": 2085} {"train_loss": -6.332899570465088, "global_step": 87573, "epoch": 2085} {"train_loss": -6.211175441741943, "global_step": 87574, "epoch": 2085} {"train_loss": -6.22477388381958, "global_step": 87575, "epoch": 2085} {"train_loss": -6.211711883544922, "global_step": 87576, "epoch": 2085} {"train_loss": -6.244570255279541, "global_step": 87577, "epoch": 2085} {"train_loss": -6.276480674743652, "global_step": 87578, "epoch": 2085} {"train_loss": -6.135025978088379, "global_step": 87579, "epoch": 2085} {"train_loss": -6.184426307678223, "global_step": 87580, "epoch": 2085} {"train_loss": -6.214376449584961, "global_step": 87581, "epoch": 2085} {"train_loss": -6.161843299865723, "global_step": 87582, "epoch": 2085} {"train_loss": -6.139575958251953, "global_step": 87583, "epoch": 2085} {"train_loss": -6.145749092102051, "global_step": 87584, "epoch": 2085} {"train_loss": -6.133040904998779, "global_step": 87585, "epoch": 2085} {"train_loss": -6.2565813064575195, "global_step": 87586, "epoch": 2085} {"train_loss": -6.258850574493408, "global_step": 87587, "epoch": 2085} {"train_loss": -6.137738227844238, "global_step": 87588, "epoch": 2085} {"train_loss": -6.21062707901001, "global_step": 87589, "epoch": 2085} {"train_loss": -6.293943405151367, "global_step": 87590, "epoch": 2085} {"train_loss": -6.26819372177124, "global_step": 87591, "epoch": 2085} {"train_loss": -6.315772533416748, "global_step": 87592, "epoch": 2085} {"train_loss": -6.278599262237549, "global_step": 87593, "epoch": 2085} {"train_loss": -6.176208019256592, "global_step": 87594, "epoch": 2085} {"train_loss": -6.202441215515137, "global_step": 87595, "epoch": 2085} {"train_loss": -6.195921897888184, "global_step": 87596, "epoch": 2085} {"train_loss": -6.295340538024902, "global_step": 87597, "epoch": 2085} {"train_loss": -6.269708633422852, "global_step": 87598, "epoch": 2085} {"train_loss": -6.2011003494262695, "global_step": 87599, "epoch": 2085} {"train_loss": -6.111325740814209, "global_step": 87600, "epoch": 2085} {"train_loss": -6.296701431274414, "global_step": 87601, "epoch": 2085} {"train_loss": -6.301982879638672, "global_step": 87602, "epoch": 2085} {"train_loss": -6.275087356567383, "global_step": 87603, "epoch": 2085} {"train_loss": -6.079024314880371, "global_step": 87604, "epoch": 2085} {"train_loss": -6.20941162109375, "global_step": 87605, "epoch": 2085} {"train_loss": -6.185506820678711, "global_step": 87606, "epoch": 2085} {"train_loss": -6.232460021972656, "global_step": 87607, "epoch": 2085} {"train_loss": -6.179523468017578, "global_step": 87608, "epoch": 2085} {"train_loss": -6.155776500701904, "global_step": 87609, "epoch": 2085} {"train_loss": -6.189182758331299, "global_step": 87610, "epoch": 2085} {"train_loss": -6.214994861966088, "global_step": 87611, "epoch": 2085, "val_loss": 75317.53125} {"train_loss": -6.154716491699219, "global_step": 87612, "epoch": 2086} {"train_loss": -6.254116535186768, "global_step": 87613, "epoch": 2086} {"train_loss": -6.1280412673950195, "global_step": 87614, "epoch": 2086} {"train_loss": -6.255388259887695, "global_step": 87615, "epoch": 2086} {"train_loss": -6.0189924240112305, "global_step": 87616, "epoch": 2086} {"train_loss": -6.231781005859375, "global_step": 87617, "epoch": 2086} {"train_loss": -6.0202155113220215, "global_step": 87618, "epoch": 2086} {"train_loss": -6.230221271514893, "global_step": 87619, "epoch": 2086} {"train_loss": -6.208423614501953, "global_step": 87620, "epoch": 2086} {"train_loss": -6.052520751953125, "global_step": 87621, "epoch": 2086} {"train_loss": -6.394186019897461, "global_step": 87622, "epoch": 2086} {"train_loss": -6.132854461669922, "global_step": 87623, "epoch": 2086} {"train_loss": -5.941275119781494, "global_step": 87624, "epoch": 2086} {"train_loss": -6.275476455688477, "global_step": 87625, "epoch": 2086} {"train_loss": -5.961358070373535, "global_step": 87626, "epoch": 2086} {"train_loss": -6.130695343017578, "global_step": 87627, "epoch": 2086} {"train_loss": -6.052174091339111, "global_step": 87628, "epoch": 2086} {"train_loss": -6.065694808959961, "global_step": 87629, "epoch": 2086} {"train_loss": -6.200836181640625, "global_step": 87630, "epoch": 2086} {"train_loss": -6.161009788513184, "global_step": 87631, "epoch": 2086} {"train_loss": -6.096723556518555, "global_step": 87632, "epoch": 2086} {"train_loss": -6.097431182861328, "global_step": 87633, "epoch": 2086} {"train_loss": -6.12135124206543, "global_step": 87634, "epoch": 2086} {"train_loss": -6.096979141235352, "global_step": 87635, "epoch": 2086} {"train_loss": -5.96588659286499, "global_step": 87636, "epoch": 2086} {"train_loss": -6.118719100952148, "global_step": 87637, "epoch": 2086} {"train_loss": -6.1096649169921875, "global_step": 87638, "epoch": 2086} {"train_loss": -6.20115852355957, "global_step": 87639, "epoch": 2086} {"train_loss": -6.1024885177612305, "global_step": 87640, "epoch": 2086} {"train_loss": -6.2490739822387695, "global_step": 87641, "epoch": 2086} {"train_loss": -6.189800262451172, "global_step": 87642, "epoch": 2086} {"train_loss": -6.208942890167236, "global_step": 87643, "epoch": 2086} {"train_loss": -6.258327484130859, "global_step": 87644, "epoch": 2086} {"train_loss": -6.210393905639648, "global_step": 87645, "epoch": 2086} {"train_loss": -6.112754821777344, "global_step": 87646, "epoch": 2086} {"train_loss": -6.100867748260498, "global_step": 87647, "epoch": 2086} {"train_loss": -6.303112030029297, "global_step": 87648, "epoch": 2086} {"train_loss": -6.143681049346924, "global_step": 87649, "epoch": 2086} {"train_loss": -6.272207260131836, "global_step": 87650, "epoch": 2086} {"train_loss": -6.249715805053711, "global_step": 87651, "epoch": 2086} {"train_loss": -6.205097198486328, "global_step": 87652, "epoch": 2086} {"train_loss": -6.153872353690011, "global_step": 87653, "epoch": 2086, "val_loss": 75066.5546875} {"train_loss": -6.233251094818115, "global_step": 87654, "epoch": 2087} {"train_loss": -6.190010070800781, "global_step": 87655, "epoch": 2087} {"train_loss": -6.171292304992676, "global_step": 87656, "epoch": 2087} {"train_loss": -6.210050582885742, "global_step": 87657, "epoch": 2087} {"train_loss": -6.1897687911987305, "global_step": 87658, "epoch": 2087} {"train_loss": -6.285366058349609, "global_step": 87659, "epoch": 2087} {"train_loss": -6.31092643737793, "global_step": 87660, "epoch": 2087} {"train_loss": -6.311835289001465, "global_step": 87661, "epoch": 2087} {"train_loss": -6.201776504516602, "global_step": 87662, "epoch": 2087} {"train_loss": -6.321072578430176, "global_step": 87663, "epoch": 2087} {"train_loss": -6.157990455627441, "global_step": 87664, "epoch": 2087} {"train_loss": -6.310550689697266, "global_step": 87665, "epoch": 2087} {"train_loss": -6.282304763793945, "global_step": 87666, "epoch": 2087} {"train_loss": -6.221729278564453, "global_step": 87667, "epoch": 2087} {"train_loss": -6.283537864685059, "global_step": 87668, "epoch": 2087} {"train_loss": -6.260327339172363, "global_step": 87669, "epoch": 2087} {"train_loss": -6.0980119705200195, "global_step": 87670, "epoch": 2087} {"train_loss": -6.134165287017822, "global_step": 87671, "epoch": 2087} {"train_loss": -6.271511554718018, "global_step": 87672, "epoch": 2087} {"train_loss": -6.162481784820557, "global_step": 87673, "epoch": 2087} {"train_loss": -6.235185623168945, "global_step": 87674, "epoch": 2087} {"train_loss": -6.247697353363037, "global_step": 87675, "epoch": 2087} {"train_loss": -6.0848917961120605, "global_step": 87676, "epoch": 2087} {"train_loss": -6.223568916320801, "global_step": 87677, "epoch": 2087} {"train_loss": -6.241241931915283, "global_step": 87678, "epoch": 2087} {"train_loss": -6.067552089691162, "global_step": 87679, "epoch": 2087} {"train_loss": -6.231252670288086, "global_step": 87680, "epoch": 2087} {"train_loss": -6.300829887390137, "global_step": 87681, "epoch": 2087} {"train_loss": -6.145087718963623, "global_step": 87682, "epoch": 2087} {"train_loss": -6.202749729156494, "global_step": 87683, "epoch": 2087} {"train_loss": -6.247757434844971, "global_step": 87684, "epoch": 2087} {"train_loss": -6.172945976257324, "global_step": 87685, "epoch": 2087} {"train_loss": -6.146552085876465, "global_step": 87686, "epoch": 2087} {"train_loss": -6.234045028686523, "global_step": 87687, "epoch": 2087} {"train_loss": -6.294888973236084, "global_step": 87688, "epoch": 2087} {"train_loss": -6.074450492858887, "global_step": 87689, "epoch": 2087} {"train_loss": -6.284132480621338, "global_step": 87690, "epoch": 2087} {"train_loss": -6.064922332763672, "global_step": 87691, "epoch": 2087} {"train_loss": -6.280096054077148, "global_step": 87692, "epoch": 2087} {"train_loss": -6.208015441894531, "global_step": 87693, "epoch": 2087} {"train_loss": -6.368963241577148, "global_step": 87694, "epoch": 2087} {"train_loss": -6.217337982995169, "global_step": 87695, "epoch": 2087, "val_loss": 75448.9140625} {"train_loss": -6.308526515960693, "global_step": 87696, "epoch": 2088} {"train_loss": -6.271234512329102, "global_step": 87697, "epoch": 2088} {"train_loss": -6.311717987060547, "global_step": 87698, "epoch": 2088} {"train_loss": -6.231330871582031, "global_step": 87699, "epoch": 2088} {"train_loss": -6.136189937591553, "global_step": 87700, "epoch": 2088} {"train_loss": -6.2357177734375, "global_step": 87701, "epoch": 2088} {"train_loss": -6.113441467285156, "global_step": 87702, "epoch": 2088} {"train_loss": -6.114048004150391, "global_step": 87703, "epoch": 2088} {"train_loss": -6.293605327606201, "global_step": 87704, "epoch": 2088} {"train_loss": -6.274614334106445, "global_step": 87705, "epoch": 2088} {"train_loss": -6.3010077476501465, "global_step": 87706, "epoch": 2088} {"train_loss": -6.270897388458252, "global_step": 87707, "epoch": 2088} {"train_loss": -6.135595798492432, "global_step": 87708, "epoch": 2088} {"train_loss": -6.241451263427734, "global_step": 87709, "epoch": 2088} {"train_loss": -6.255041599273682, "global_step": 87710, "epoch": 2088} {"train_loss": -6.309065818786621, "global_step": 87711, "epoch": 2088} {"train_loss": -6.266206741333008, "global_step": 87712, "epoch": 2088} {"train_loss": -6.238537788391113, "global_step": 87713, "epoch": 2088} {"train_loss": -6.19687557220459, "global_step": 87714, "epoch": 2088} {"train_loss": -6.280102729797363, "global_step": 87715, "epoch": 2088} {"train_loss": -6.336398124694824, "global_step": 87716, "epoch": 2088} {"train_loss": -6.254807949066162, "global_step": 87717, "epoch": 2088} {"train_loss": -6.182247161865234, "global_step": 87718, "epoch": 2088} {"train_loss": -6.356701850891113, "global_step": 87719, "epoch": 2088} {"train_loss": -6.299806594848633, "global_step": 87720, "epoch": 2088} {"train_loss": -6.094122886657715, "global_step": 87721, "epoch": 2088} {"train_loss": -6.254079818725586, "global_step": 87722, "epoch": 2088} {"train_loss": -6.268991947174072, "global_step": 87723, "epoch": 2088} {"train_loss": -6.180884838104248, "global_step": 87724, "epoch": 2088} {"train_loss": -6.281386375427246, "global_step": 87725, "epoch": 2088} {"train_loss": -6.207743167877197, "global_step": 87726, "epoch": 2088} {"train_loss": -6.23356819152832, "global_step": 87727, "epoch": 2088} {"train_loss": -6.370089054107666, "global_step": 87728, "epoch": 2088} {"train_loss": -6.165388107299805, "global_step": 87729, "epoch": 2088} {"train_loss": -6.327725410461426, "global_step": 87730, "epoch": 2088} {"train_loss": -6.337477684020996, "global_step": 87731, "epoch": 2088} {"train_loss": -6.161036968231201, "global_step": 87732, "epoch": 2088} {"train_loss": -6.233721733093262, "global_step": 87733, "epoch": 2088} {"train_loss": -6.216250896453857, "global_step": 87734, "epoch": 2088} {"train_loss": -6.38211727142334, "global_step": 87735, "epoch": 2088} {"train_loss": -6.293116569519043, "global_step": 87736, "epoch": 2088} {"train_loss": -6.247659172330584, "global_step": 87737, "epoch": 2088, "val_loss": 75398.203125} {"train_loss": -6.190939426422119, "global_step": 87738, "epoch": 2089} {"train_loss": -6.287750244140625, "global_step": 87739, "epoch": 2089} {"train_loss": -6.181224822998047, "global_step": 87740, "epoch": 2089} {"train_loss": -6.236847877502441, "global_step": 87741, "epoch": 2089} {"train_loss": -6.258114814758301, "global_step": 87742, "epoch": 2089} {"train_loss": -6.124234199523926, "global_step": 87743, "epoch": 2089} {"train_loss": -6.354988098144531, "global_step": 87744, "epoch": 2089} {"train_loss": -6.196188926696777, "global_step": 87745, "epoch": 2089} {"train_loss": -6.274608612060547, "global_step": 87746, "epoch": 2089} {"train_loss": -6.168341159820557, "global_step": 87747, "epoch": 2089} {"train_loss": -6.142011642456055, "global_step": 87748, "epoch": 2089} {"train_loss": -6.2272820472717285, "global_step": 87749, "epoch": 2089} {"train_loss": -6.351360321044922, "global_step": 87750, "epoch": 2089} {"train_loss": -6.114011287689209, "global_step": 87751, "epoch": 2089} {"train_loss": -6.204292297363281, "global_step": 87752, "epoch": 2089} {"train_loss": -6.144076347351074, "global_step": 87753, "epoch": 2089} {"train_loss": -6.277950286865234, "global_step": 87754, "epoch": 2089} {"train_loss": -6.255547523498535, "global_step": 87755, "epoch": 2089} {"train_loss": -6.172863006591797, "global_step": 87756, "epoch": 2089} {"train_loss": -6.24339485168457, "global_step": 87757, "epoch": 2089} {"train_loss": -6.157826900482178, "global_step": 87758, "epoch": 2089} {"train_loss": -6.277702331542969, "global_step": 87759, "epoch": 2089} {"train_loss": -6.164999008178711, "global_step": 87760, "epoch": 2089} {"train_loss": -6.236453056335449, "global_step": 87761, "epoch": 2089} {"train_loss": -6.228888034820557, "global_step": 87762, "epoch": 2089} {"train_loss": -6.177765846252441, "global_step": 87763, "epoch": 2089} {"train_loss": -6.327793121337891, "global_step": 87764, "epoch": 2089} {"train_loss": -6.202167987823486, "global_step": 87765, "epoch": 2089} {"train_loss": -6.085343837738037, "global_step": 87766, "epoch": 2089} {"train_loss": -6.274501800537109, "global_step": 87767, "epoch": 2089} {"train_loss": -6.160549163818359, "global_step": 87768, "epoch": 2089} {"train_loss": -6.092179298400879, "global_step": 87769, "epoch": 2089} {"train_loss": -6.121819496154785, "global_step": 87770, "epoch": 2089} {"train_loss": -6.130797386169434, "global_step": 87771, "epoch": 2089} {"train_loss": -6.124778747558594, "global_step": 87772, "epoch": 2089} {"train_loss": -6.134253978729248, "global_step": 87773, "epoch": 2089} {"train_loss": -6.274664878845215, "global_step": 87774, "epoch": 2089} {"train_loss": -6.147131443023682, "global_step": 87775, "epoch": 2089} {"train_loss": -6.306161880493164, "global_step": 87776, "epoch": 2089} {"train_loss": -6.151885986328125, "global_step": 87777, "epoch": 2089} {"train_loss": -6.31730318069458, "global_step": 87778, "epoch": 2089} {"train_loss": -6.2085019406818205, "global_step": 87779, "epoch": 2089, "val_loss": 75012.6484375} {"train_loss": -6.132773399353027, "global_step": 87780, "epoch": 2090} {"train_loss": -6.175952434539795, "global_step": 87781, "epoch": 2090} {"train_loss": -6.141786098480225, "global_step": 87782, "epoch": 2090} {"train_loss": -6.235865116119385, "global_step": 87783, "epoch": 2090} {"train_loss": -6.238248825073242, "global_step": 87784, "epoch": 2090} {"train_loss": -6.227947235107422, "global_step": 87785, "epoch": 2090} {"train_loss": -6.178687572479248, "global_step": 87786, "epoch": 2090} {"train_loss": -6.266380310058594, "global_step": 87787, "epoch": 2090} {"train_loss": -6.250730514526367, "global_step": 87788, "epoch": 2090} {"train_loss": -6.353802680969238, "global_step": 87789, "epoch": 2090} {"train_loss": -6.236331462860107, "global_step": 87790, "epoch": 2090} {"train_loss": -6.179903984069824, "global_step": 87791, "epoch": 2090} {"train_loss": -6.264720439910889, "global_step": 87792, "epoch": 2090} {"train_loss": -6.160113334655762, "global_step": 87793, "epoch": 2090} {"train_loss": -6.140507698059082, "global_step": 87794, "epoch": 2090} {"train_loss": -6.1986284255981445, "global_step": 87795, "epoch": 2090} {"train_loss": -6.231657028198242, "global_step": 87796, "epoch": 2090} {"train_loss": -6.270451545715332, "global_step": 87797, "epoch": 2090} {"train_loss": -6.215968132019043, "global_step": 87798, "epoch": 2090} {"train_loss": -6.140264511108398, "global_step": 87799, "epoch": 2090} {"train_loss": -6.203151226043701, "global_step": 87800, "epoch": 2090} {"train_loss": -6.191072463989258, "global_step": 87801, "epoch": 2090} {"train_loss": -6.277382850646973, "global_step": 87802, "epoch": 2090} {"train_loss": -6.236849308013916, "global_step": 87803, "epoch": 2090} {"train_loss": -6.152523994445801, "global_step": 87804, "epoch": 2090} {"train_loss": -6.271188735961914, "global_step": 87805, "epoch": 2090} {"train_loss": -6.1433868408203125, "global_step": 87806, "epoch": 2090} {"train_loss": -6.101911544799805, "global_step": 87807, "epoch": 2090} {"train_loss": -6.163023948669434, "global_step": 87808, "epoch": 2090} {"train_loss": -6.160839557647705, "global_step": 87809, "epoch": 2090} {"train_loss": -6.1220598220825195, "global_step": 87810, "epoch": 2090} {"train_loss": -6.177184104919434, "global_step": 87811, "epoch": 2090} {"train_loss": -6.252443313598633, "global_step": 87812, "epoch": 2090} {"train_loss": -6.211043834686279, "global_step": 87813, "epoch": 2090} {"train_loss": -6.232893943786621, "global_step": 87814, "epoch": 2090} {"train_loss": -6.239579200744629, "global_step": 87815, "epoch": 2090} {"train_loss": -6.204486846923828, "global_step": 87816, "epoch": 2090} {"train_loss": -6.189787864685059, "global_step": 87817, "epoch": 2090} {"train_loss": -6.178627967834473, "global_step": 87818, "epoch": 2090} {"train_loss": -6.285073757171631, "global_step": 87819, "epoch": 2090} {"train_loss": -6.171597480773926, "global_step": 87820, "epoch": 2090} {"train_loss": -6.206686190196446, "global_step": 87821, "epoch": 2090, "val_loss": 75376.0625} {"train_loss": -6.260651588439941, "global_step": 87822, "epoch": 2091} {"train_loss": -6.208182334899902, "global_step": 87823, "epoch": 2091} {"train_loss": -6.201286315917969, "global_step": 87824, "epoch": 2091} {"train_loss": -6.236703872680664, "global_step": 87825, "epoch": 2091} {"train_loss": -6.258856773376465, "global_step": 87826, "epoch": 2091} {"train_loss": -6.256854057312012, "global_step": 87827, "epoch": 2091} {"train_loss": -6.274181842803955, "global_step": 87828, "epoch": 2091} {"train_loss": -6.283952713012695, "global_step": 87829, "epoch": 2091} {"train_loss": -6.285123825073242, "global_step": 87830, "epoch": 2091} {"train_loss": -6.298523902893066, "global_step": 87831, "epoch": 2091} {"train_loss": -6.211972236633301, "global_step": 87832, "epoch": 2091} {"train_loss": -6.119054794311523, "global_step": 87833, "epoch": 2091} {"train_loss": -6.187924385070801, "global_step": 87834, "epoch": 2091} {"train_loss": -6.217020034790039, "global_step": 87835, "epoch": 2091} {"train_loss": -6.0491251945495605, "global_step": 87836, "epoch": 2091} {"train_loss": -6.171848297119141, "global_step": 87837, "epoch": 2091} {"train_loss": -6.1231489181518555, "global_step": 87838, "epoch": 2091} {"train_loss": -6.193734645843506, "global_step": 87839, "epoch": 2091} {"train_loss": -6.140939235687256, "global_step": 87840, "epoch": 2091} {"train_loss": -6.251850605010986, "global_step": 87841, "epoch": 2091} {"train_loss": -6.201789855957031, "global_step": 87842, "epoch": 2091} {"train_loss": -6.153116226196289, "global_step": 87843, "epoch": 2091} {"train_loss": -6.0880513191223145, "global_step": 87844, "epoch": 2091} {"train_loss": -6.273393154144287, "global_step": 87845, "epoch": 2091} {"train_loss": -6.1608195304870605, "global_step": 87846, "epoch": 2091} {"train_loss": -6.164088249206543, "global_step": 87847, "epoch": 2091} {"train_loss": -6.1957244873046875, "global_step": 87848, "epoch": 2091} {"train_loss": -6.157973289489746, "global_step": 87849, "epoch": 2091} {"train_loss": -6.18580436706543, "global_step": 87850, "epoch": 2091} {"train_loss": -6.044286251068115, "global_step": 87851, "epoch": 2091} {"train_loss": -6.275681495666504, "global_step": 87852, "epoch": 2091} {"train_loss": -6.1382293701171875, "global_step": 87853, "epoch": 2091} {"train_loss": -6.193353176116943, "global_step": 87854, "epoch": 2091} {"train_loss": -6.10307502746582, "global_step": 87855, "epoch": 2091} {"train_loss": -6.156298637390137, "global_step": 87856, "epoch": 2091} {"train_loss": -6.247228622436523, "global_step": 87857, "epoch": 2091} {"train_loss": -6.272398948669434, "global_step": 87858, "epoch": 2091} {"train_loss": -6.165942192077637, "global_step": 87859, "epoch": 2091} {"train_loss": -6.1164631843566895, "global_step": 87860, "epoch": 2091} {"train_loss": -6.1165900230407715, "global_step": 87861, "epoch": 2091} {"train_loss": -6.207418441772461, "global_step": 87862, "epoch": 2091} {"train_loss": -6.191621610096523, "global_step": 87863, "epoch": 2091, "val_loss": 75166.3046875} {"train_loss": -6.045662879943848, "global_step": 87864, "epoch": 2092} {"train_loss": -6.198812484741211, "global_step": 87865, "epoch": 2092} {"train_loss": -6.260893821716309, "global_step": 87866, "epoch": 2092} {"train_loss": -6.275794982910156, "global_step": 87867, "epoch": 2092} {"train_loss": -6.260891914367676, "global_step": 87868, "epoch": 2092} {"train_loss": -6.268506050109863, "global_step": 87869, "epoch": 2092} {"train_loss": -6.1610870361328125, "global_step": 87870, "epoch": 2092} {"train_loss": -6.220760822296143, "global_step": 87871, "epoch": 2092} {"train_loss": -6.323935508728027, "global_step": 87872, "epoch": 2092} {"train_loss": -6.1925225257873535, "global_step": 87873, "epoch": 2092} {"train_loss": -6.194431781768799, "global_step": 87874, "epoch": 2092} {"train_loss": -6.175933837890625, "global_step": 87875, "epoch": 2092} {"train_loss": -6.163323879241943, "global_step": 87876, "epoch": 2092} {"train_loss": -6.089880466461182, "global_step": 87877, "epoch": 2092} {"train_loss": -6.284180641174316, "global_step": 87878, "epoch": 2092} {"train_loss": -6.317030906677246, "global_step": 87879, "epoch": 2092} {"train_loss": -6.06960391998291, "global_step": 87880, "epoch": 2092} {"train_loss": -6.130401134490967, "global_step": 87881, "epoch": 2092} {"train_loss": -6.297253608703613, "global_step": 87882, "epoch": 2092} {"train_loss": -6.249266624450684, "global_step": 87883, "epoch": 2092} {"train_loss": -6.172952175140381, "global_step": 87884, "epoch": 2092} {"train_loss": -6.257330894470215, "global_step": 87885, "epoch": 2092} {"train_loss": -6.215724468231201, "global_step": 87886, "epoch": 2092} {"train_loss": -6.4050140380859375, "global_step": 87887, "epoch": 2092} {"train_loss": -6.173779010772705, "global_step": 87888, "epoch": 2092} {"train_loss": -6.1947526931762695, "global_step": 87889, "epoch": 2092} {"train_loss": -6.342035293579102, "global_step": 87890, "epoch": 2092} {"train_loss": -6.149712562561035, "global_step": 87891, "epoch": 2092} {"train_loss": -6.136842250823975, "global_step": 87892, "epoch": 2092} {"train_loss": -6.279951095581055, "global_step": 87893, "epoch": 2092} {"train_loss": -6.33363151550293, "global_step": 87894, "epoch": 2092} {"train_loss": -6.260112762451172, "global_step": 87895, "epoch": 2092} {"train_loss": -6.160199165344238, "global_step": 87896, "epoch": 2092} {"train_loss": -6.230819225311279, "global_step": 87897, "epoch": 2092} {"train_loss": -6.281944274902344, "global_step": 87898, "epoch": 2092} {"train_loss": -6.286751747131348, "global_step": 87899, "epoch": 2092} {"train_loss": -6.3069562911987305, "global_step": 87900, "epoch": 2092} {"train_loss": -6.240891456604004, "global_step": 87901, "epoch": 2092} {"train_loss": -6.265300273895264, "global_step": 87902, "epoch": 2092} {"train_loss": -6.239871025085449, "global_step": 87903, "epoch": 2092} {"train_loss": -6.241876125335693, "global_step": 87904, "epoch": 2092} {"train_loss": -6.228977907271612, "global_step": 87905, "epoch": 2092, "val_loss": 75286.5390625} {"train_loss": -6.199426651000977, "global_step": 87906, "epoch": 2093} {"train_loss": -6.374859809875488, "global_step": 87907, "epoch": 2093} {"train_loss": -6.305085182189941, "global_step": 87908, "epoch": 2093} {"train_loss": -6.313390254974365, "global_step": 87909, "epoch": 2093} {"train_loss": -6.346289157867432, "global_step": 87910, "epoch": 2093} {"train_loss": -6.296724319458008, "global_step": 87911, "epoch": 2093} {"train_loss": -6.209508895874023, "global_step": 87912, "epoch": 2093} {"train_loss": -6.285871982574463, "global_step": 87913, "epoch": 2093} {"train_loss": -6.298300266265869, "global_step": 87914, "epoch": 2093} {"train_loss": -6.2693376541137695, "global_step": 87915, "epoch": 2093} {"train_loss": -6.188506126403809, "global_step": 87916, "epoch": 2093} {"train_loss": -6.237981796264648, "global_step": 87917, "epoch": 2093} {"train_loss": -6.2906951904296875, "global_step": 87918, "epoch": 2093} {"train_loss": -6.2390875816345215, "global_step": 87919, "epoch": 2093} {"train_loss": -6.196528434753418, "global_step": 87920, "epoch": 2093} {"train_loss": -6.325323104858398, "global_step": 87921, "epoch": 2093} {"train_loss": -6.370795249938965, "global_step": 87922, "epoch": 2093} {"train_loss": -6.291839599609375, "global_step": 87923, "epoch": 2093} {"train_loss": -6.260015487670898, "global_step": 87924, "epoch": 2093} {"train_loss": -6.283802032470703, "global_step": 87925, "epoch": 2093} {"train_loss": -6.17436408996582, "global_step": 87926, "epoch": 2093} {"train_loss": -6.351207733154297, "global_step": 87927, "epoch": 2093} {"train_loss": -6.209677219390869, "global_step": 87928, "epoch": 2093} {"train_loss": -6.23403263092041, "global_step": 87929, "epoch": 2093} {"train_loss": -6.2486419677734375, "global_step": 87930, "epoch": 2093} {"train_loss": -6.143418312072754, "global_step": 87931, "epoch": 2093} {"train_loss": -6.187197685241699, "global_step": 87932, "epoch": 2093} {"train_loss": -6.233860492706299, "global_step": 87933, "epoch": 2093} {"train_loss": -6.178192615509033, "global_step": 87934, "epoch": 2093} {"train_loss": -6.091320037841797, "global_step": 87935, "epoch": 2093} {"train_loss": -6.137265205383301, "global_step": 87936, "epoch": 2093} {"train_loss": -5.9932403564453125, "global_step": 87937, "epoch": 2093} {"train_loss": -5.982300758361816, "global_step": 87938, "epoch": 2093} {"train_loss": -6.036038398742676, "global_step": 87939, "epoch": 2093} {"train_loss": -6.2246294021606445, "global_step": 87940, "epoch": 2093} {"train_loss": -6.242493629455566, "global_step": 87941, "epoch": 2093} {"train_loss": -6.1278862953186035, "global_step": 87942, "epoch": 2093} {"train_loss": -6.304821491241455, "global_step": 87943, "epoch": 2093} {"train_loss": -6.143871307373047, "global_step": 87944, "epoch": 2093} {"train_loss": -6.110783100128174, "global_step": 87945, "epoch": 2093} {"train_loss": -6.205787181854248, "global_step": 87946, "epoch": 2093} {"train_loss": -6.221843889781407, "global_step": 87947, "epoch": 2093, "val_loss": 75387.5546875} {"train_loss": -6.110724449157715, "global_step": 87948, "epoch": 2094} {"train_loss": -6.2178802490234375, "global_step": 87949, "epoch": 2094} {"train_loss": -6.128171920776367, "global_step": 87950, "epoch": 2094} {"train_loss": -6.089161396026611, "global_step": 87951, "epoch": 2094} {"train_loss": -6.276082515716553, "global_step": 87952, "epoch": 2094} {"train_loss": -6.108516693115234, "global_step": 87953, "epoch": 2094} {"train_loss": -6.207876205444336, "global_step": 87954, "epoch": 2094} {"train_loss": -6.17628812789917, "global_step": 87955, "epoch": 2094} {"train_loss": -6.264992713928223, "global_step": 87956, "epoch": 2094} {"train_loss": -6.1101250648498535, "global_step": 87957, "epoch": 2094} {"train_loss": -6.147242546081543, "global_step": 87958, "epoch": 2094} {"train_loss": -6.118141174316406, "global_step": 87959, "epoch": 2094} {"train_loss": -6.142758369445801, "global_step": 87960, "epoch": 2094} {"train_loss": -6.236818790435791, "global_step": 87961, "epoch": 2094} {"train_loss": -6.27241325378418, "global_step": 87962, "epoch": 2094} {"train_loss": -6.192017555236816, "global_step": 87963, "epoch": 2094} {"train_loss": -6.166360378265381, "global_step": 87964, "epoch": 2094} {"train_loss": -6.234926700592041, "global_step": 87965, "epoch": 2094} {"train_loss": -6.176436424255371, "global_step": 87966, "epoch": 2094} {"train_loss": -6.176877975463867, "global_step": 87967, "epoch": 2094} {"train_loss": -6.218293190002441, "global_step": 87968, "epoch": 2094} {"train_loss": -6.121466636657715, "global_step": 87969, "epoch": 2094} {"train_loss": -6.1968231201171875, "global_step": 87970, "epoch": 2094} {"train_loss": -6.106064796447754, "global_step": 87971, "epoch": 2094} {"train_loss": -6.158689498901367, "global_step": 87972, "epoch": 2094} {"train_loss": -6.291139125823975, "global_step": 87973, "epoch": 2094} {"train_loss": -6.123350143432617, "global_step": 87974, "epoch": 2094} {"train_loss": -6.235647201538086, "global_step": 87975, "epoch": 2094} {"train_loss": -6.113818168640137, "global_step": 87976, "epoch": 2094} {"train_loss": -6.149626731872559, "global_step": 87977, "epoch": 2094} {"train_loss": -6.277085304260254, "global_step": 87978, "epoch": 2094} {"train_loss": -6.264581203460693, "global_step": 87979, "epoch": 2094} {"train_loss": -6.199075698852539, "global_step": 87980, "epoch": 2094} {"train_loss": -6.254260063171387, "global_step": 87981, "epoch": 2094} {"train_loss": -6.163273811340332, "global_step": 87982, "epoch": 2094} {"train_loss": -6.252301216125488, "global_step": 87983, "epoch": 2094} {"train_loss": -6.02706241607666, "global_step": 87984, "epoch": 2094} {"train_loss": -6.1561737060546875, "global_step": 87985, "epoch": 2094} {"train_loss": -6.1331353187561035, "global_step": 87986, "epoch": 2094} {"train_loss": -6.284749507904053, "global_step": 87987, "epoch": 2094} {"train_loss": -6.148524761199951, "global_step": 87988, "epoch": 2094} {"train_loss": -6.18186971119472, "global_step": 87989, "epoch": 2094, "val_loss": 75349.921875} {"train_loss": -6.100170135498047, "global_step": 87990, "epoch": 2095} {"train_loss": -6.1351823806762695, "global_step": 87991, "epoch": 2095} {"train_loss": -6.235910415649414, "global_step": 87992, "epoch": 2095} {"train_loss": -6.220854759216309, "global_step": 87993, "epoch": 2095} {"train_loss": -6.312857627868652, "global_step": 87994, "epoch": 2095} {"train_loss": -6.143023490905762, "global_step": 87995, "epoch": 2095} {"train_loss": -6.237921237945557, "global_step": 87996, "epoch": 2095} {"train_loss": -6.1493377685546875, "global_step": 87997, "epoch": 2095} {"train_loss": -6.129790306091309, "global_step": 87998, "epoch": 2095} {"train_loss": -6.251887321472168, "global_step": 87999, "epoch": 2095} {"train_loss": -6.241495132446289, "global_step": 88000, "epoch": 2095} {"train_loss": -6.287186145782471, "global_step": 88001, "epoch": 2095} {"train_loss": -6.249406814575195, "global_step": 88002, "epoch": 2095} {"train_loss": -6.307160377502441, "global_step": 88003, "epoch": 2095} {"train_loss": -6.138422966003418, "global_step": 88004, "epoch": 2095} {"train_loss": -6.251794815063477, "global_step": 88005, "epoch": 2095} {"train_loss": -6.163976669311523, "global_step": 88006, "epoch": 2095} {"train_loss": -6.223407745361328, "global_step": 88007, "epoch": 2095} {"train_loss": -6.233359336853027, "global_step": 88008, "epoch": 2095} {"train_loss": -6.226089954376221, "global_step": 88009, "epoch": 2095} {"train_loss": -6.178019046783447, "global_step": 88010, "epoch": 2095} {"train_loss": -6.191281795501709, "global_step": 88011, "epoch": 2095} {"train_loss": -6.186838150024414, "global_step": 88012, "epoch": 2095} {"train_loss": -6.187339782714844, "global_step": 88013, "epoch": 2095} {"train_loss": -6.185938835144043, "global_step": 88014, "epoch": 2095} {"train_loss": -6.214443206787109, "global_step": 88015, "epoch": 2095} {"train_loss": -6.138273239135742, "global_step": 88016, "epoch": 2095} {"train_loss": -6.231712818145752, "global_step": 88017, "epoch": 2095} {"train_loss": -6.35116720199585, "global_step": 88018, "epoch": 2095} {"train_loss": -6.263824462890625, "global_step": 88019, "epoch": 2095} {"train_loss": -6.254377365112305, "global_step": 88020, "epoch": 2095} {"train_loss": -6.191398620605469, "global_step": 88021, "epoch": 2095} {"train_loss": -6.304342746734619, "global_step": 88022, "epoch": 2095} {"train_loss": -6.330201148986816, "global_step": 88023, "epoch": 2095} {"train_loss": -6.200380325317383, "global_step": 88024, "epoch": 2095} {"train_loss": -6.1197614669799805, "global_step": 88025, "epoch": 2095} {"train_loss": -6.309566974639893, "global_step": 88026, "epoch": 2095} {"train_loss": -6.2359209060668945, "global_step": 88027, "epoch": 2095} {"train_loss": -6.348058700561523, "global_step": 88028, "epoch": 2095} {"train_loss": -6.235212326049805, "global_step": 88029, "epoch": 2095} {"train_loss": -6.314393043518066, "global_step": 88030, "epoch": 2095} {"train_loss": -6.222558759507679, "global_step": 88031, "epoch": 2095, "val_loss": 75386.7578125} {"train_loss": -6.263246536254883, "global_step": 88032, "epoch": 2096} {"train_loss": -6.244178771972656, "global_step": 88033, "epoch": 2096} {"train_loss": -6.24201774597168, "global_step": 88034, "epoch": 2096} {"train_loss": -6.266278266906738, "global_step": 88035, "epoch": 2096} {"train_loss": -6.205801010131836, "global_step": 88036, "epoch": 2096} {"train_loss": -6.301340103149414, "global_step": 88037, "epoch": 2096} {"train_loss": -6.244166374206543, "global_step": 88038, "epoch": 2096} {"train_loss": -6.269369125366211, "global_step": 88039, "epoch": 2096} {"train_loss": -6.255981922149658, "global_step": 88040, "epoch": 2096} {"train_loss": -6.312375068664551, "global_step": 88041, "epoch": 2096} {"train_loss": -6.470019340515137, "global_step": 88042, "epoch": 2096} {"train_loss": -6.223901748657227, "global_step": 88043, "epoch": 2096} {"train_loss": -6.295202732086182, "global_step": 88044, "epoch": 2096} {"train_loss": -6.275213241577148, "global_step": 88045, "epoch": 2096} {"train_loss": -6.228656768798828, "global_step": 88046, "epoch": 2096} {"train_loss": -6.223771095275879, "global_step": 88047, "epoch": 2096} {"train_loss": -6.087256908416748, "global_step": 88048, "epoch": 2096} {"train_loss": -6.312163352966309, "global_step": 88049, "epoch": 2096} {"train_loss": -6.294110298156738, "global_step": 88050, "epoch": 2096} {"train_loss": -6.18798828125, "global_step": 88051, "epoch": 2096} {"train_loss": -6.307433605194092, "global_step": 88052, "epoch": 2096} {"train_loss": -6.235268592834473, "global_step": 88053, "epoch": 2096} {"train_loss": -6.326693534851074, "global_step": 88054, "epoch": 2096} {"train_loss": -6.320940971374512, "global_step": 88055, "epoch": 2096} {"train_loss": -6.226437568664551, "global_step": 88056, "epoch": 2096} {"train_loss": -6.136612415313721, "global_step": 88057, "epoch": 2096} {"train_loss": -6.348079681396484, "global_step": 88058, "epoch": 2096} {"train_loss": -6.371114253997803, "global_step": 88059, "epoch": 2096} {"train_loss": -6.188360214233398, "global_step": 88060, "epoch": 2096} {"train_loss": -6.145115852355957, "global_step": 88061, "epoch": 2096} {"train_loss": -6.3413166999816895, "global_step": 88062, "epoch": 2096} {"train_loss": -6.217799663543701, "global_step": 88063, "epoch": 2096} {"train_loss": -6.266018390655518, "global_step": 88064, "epoch": 2096} {"train_loss": -6.255302906036377, "global_step": 88065, "epoch": 2096} {"train_loss": -6.21433162689209, "global_step": 88066, "epoch": 2096} {"train_loss": -6.293553829193115, "global_step": 88067, "epoch": 2096} {"train_loss": -6.206941604614258, "global_step": 88068, "epoch": 2096} {"train_loss": -6.274736404418945, "global_step": 88069, "epoch": 2096} {"train_loss": -6.178271770477295, "global_step": 88070, "epoch": 2096} {"train_loss": -6.3302178382873535, "global_step": 88071, "epoch": 2096} {"train_loss": -6.191113471984863, "global_step": 88072, "epoch": 2096} {"train_loss": -6.256768203917003, "global_step": 88073, "epoch": 2096, "val_loss": 75157.6015625} {"train_loss": -6.346657752990723, "global_step": 88074, "epoch": 2097} {"train_loss": -6.232485771179199, "global_step": 88075, "epoch": 2097} {"train_loss": -6.252632141113281, "global_step": 88076, "epoch": 2097} {"train_loss": -6.2987260818481445, "global_step": 88077, "epoch": 2097} {"train_loss": -6.13728141784668, "global_step": 88078, "epoch": 2097} {"train_loss": -6.1284074783325195, "global_step": 88079, "epoch": 2097} {"train_loss": -6.166194438934326, "global_step": 88080, "epoch": 2097} {"train_loss": -6.245596885681152, "global_step": 88081, "epoch": 2097} {"train_loss": -6.215470314025879, "global_step": 88082, "epoch": 2097} {"train_loss": -6.2432379722595215, "global_step": 88083, "epoch": 2097} {"train_loss": -6.271817207336426, "global_step": 88084, "epoch": 2097} {"train_loss": -6.168641090393066, "global_step": 88085, "epoch": 2097} {"train_loss": -6.242647171020508, "global_step": 88086, "epoch": 2097} {"train_loss": -6.214364051818848, "global_step": 88087, "epoch": 2097} {"train_loss": -6.092442989349365, "global_step": 88088, "epoch": 2097} {"train_loss": -6.124632835388184, "global_step": 88089, "epoch": 2097} {"train_loss": -5.949141502380371, "global_step": 88090, "epoch": 2097} {"train_loss": -6.154601097106934, "global_step": 88091, "epoch": 2097} {"train_loss": -6.160984992980957, "global_step": 88092, "epoch": 2097} {"train_loss": -6.159026145935059, "global_step": 88093, "epoch": 2097} {"train_loss": -6.165593147277832, "global_step": 88094, "epoch": 2097} {"train_loss": -6.277621269226074, "global_step": 88095, "epoch": 2097} {"train_loss": -6.25857400894165, "global_step": 88096, "epoch": 2097} {"train_loss": -6.066607475280762, "global_step": 88097, "epoch": 2097} {"train_loss": -6.321554183959961, "global_step": 88098, "epoch": 2097} {"train_loss": -6.193456649780273, "global_step": 88099, "epoch": 2097} {"train_loss": -6.240924835205078, "global_step": 88100, "epoch": 2097} {"train_loss": -6.361559867858887, "global_step": 88101, "epoch": 2097} {"train_loss": -6.059259414672852, "global_step": 88102, "epoch": 2097} {"train_loss": -6.219883918762207, "global_step": 88103, "epoch": 2097} {"train_loss": -6.1764326095581055, "global_step": 88104, "epoch": 2097} {"train_loss": -6.2913079261779785, "global_step": 88105, "epoch": 2097} {"train_loss": -6.184929847717285, "global_step": 88106, "epoch": 2097} {"train_loss": -6.192668437957764, "global_step": 88107, "epoch": 2097} {"train_loss": -6.33535623550415, "global_step": 88108, "epoch": 2097} {"train_loss": -6.167228698730469, "global_step": 88109, "epoch": 2097} {"train_loss": -6.159252166748047, "global_step": 88110, "epoch": 2097} {"train_loss": -6.163785934448242, "global_step": 88111, "epoch": 2097} {"train_loss": -6.090423583984375, "global_step": 88112, "epoch": 2097} {"train_loss": -6.2578582763671875, "global_step": 88113, "epoch": 2097} {"train_loss": -6.239356994628906, "global_step": 88114, "epoch": 2097} {"train_loss": -6.200071845735822, "global_step": 88115, "epoch": 2097, "val_loss": 75219.109375} {"train_loss": -6.187658786773682, "global_step": 88116, "epoch": 2098} {"train_loss": -6.150932312011719, "global_step": 88117, "epoch": 2098} {"train_loss": -6.292619705200195, "global_step": 88118, "epoch": 2098} {"train_loss": -6.159523010253906, "global_step": 88119, "epoch": 2098} {"train_loss": -6.358127593994141, "global_step": 88120, "epoch": 2098} {"train_loss": -6.287934303283691, "global_step": 88121, "epoch": 2098} {"train_loss": -6.321128845214844, "global_step": 88122, "epoch": 2098} {"train_loss": -6.26235294342041, "global_step": 88123, "epoch": 2098} {"train_loss": -6.182052135467529, "global_step": 88124, "epoch": 2098} {"train_loss": -6.311148643493652, "global_step": 88125, "epoch": 2098} {"train_loss": -6.196991920471191, "global_step": 88126, "epoch": 2098} {"train_loss": -6.172405242919922, "global_step": 88127, "epoch": 2098} {"train_loss": -6.187263488769531, "global_step": 88128, "epoch": 2098} {"train_loss": -6.215177536010742, "global_step": 88129, "epoch": 2098} {"train_loss": -6.342101573944092, "global_step": 88130, "epoch": 2098} {"train_loss": -6.184488773345947, "global_step": 88131, "epoch": 2098} {"train_loss": -6.287942409515381, "global_step": 88132, "epoch": 2098} {"train_loss": -6.208162307739258, "global_step": 88133, "epoch": 2098} {"train_loss": -6.209053039550781, "global_step": 88134, "epoch": 2098} {"train_loss": -6.3029961585998535, "global_step": 88135, "epoch": 2098} {"train_loss": -6.184328556060791, "global_step": 88136, "epoch": 2098} {"train_loss": -6.270810127258301, "global_step": 88137, "epoch": 2098} {"train_loss": -6.218048095703125, "global_step": 88138, "epoch": 2098} {"train_loss": -6.162813186645508, "global_step": 88139, "epoch": 2098} {"train_loss": -6.2200751304626465, "global_step": 88140, "epoch": 2098} {"train_loss": -6.270845413208008, "global_step": 88141, "epoch": 2098} {"train_loss": -6.200184345245361, "global_step": 88142, "epoch": 2098} {"train_loss": -6.254358291625977, "global_step": 88143, "epoch": 2098} {"train_loss": -6.087979316711426, "global_step": 88144, "epoch": 2098} {"train_loss": -6.1376495361328125, "global_step": 88145, "epoch": 2098} {"train_loss": -6.07999849319458, "global_step": 88146, "epoch": 2098} {"train_loss": -6.324128150939941, "global_step": 88147, "epoch": 2098} {"train_loss": -6.157318115234375, "global_step": 88148, "epoch": 2098} {"train_loss": -6.141400337219238, "global_step": 88149, "epoch": 2098} {"train_loss": -6.233741760253906, "global_step": 88150, "epoch": 2098} {"train_loss": -6.178815841674805, "global_step": 88151, "epoch": 2098} {"train_loss": -6.113469123840332, "global_step": 88152, "epoch": 2098} {"train_loss": -6.191906452178955, "global_step": 88153, "epoch": 2098} {"train_loss": -6.244871139526367, "global_step": 88154, "epoch": 2098} {"train_loss": -6.2547149658203125, "global_step": 88155, "epoch": 2098} {"train_loss": -6.228055000305176, "global_step": 88156, "epoch": 2098} {"train_loss": -6.21604645819891, "global_step": 88157, "epoch": 2098, "val_loss": 75494.3671875} {"train_loss": -6.14811897277832, "global_step": 88158, "epoch": 2099} {"train_loss": -6.16938591003418, "global_step": 88159, "epoch": 2099} {"train_loss": -6.180468559265137, "global_step": 88160, "epoch": 2099} {"train_loss": -6.229253768920898, "global_step": 88161, "epoch": 2099} {"train_loss": -6.173140525817871, "global_step": 88162, "epoch": 2099} {"train_loss": -6.284159183502197, "global_step": 88163, "epoch": 2099} {"train_loss": -6.2488694190979, "global_step": 88164, "epoch": 2099} {"train_loss": -6.272675514221191, "global_step": 88165, "epoch": 2099} {"train_loss": -6.244444847106934, "global_step": 88166, "epoch": 2099} {"train_loss": -6.189671993255615, "global_step": 88167, "epoch": 2099} {"train_loss": -6.23405647277832, "global_step": 88168, "epoch": 2099} {"train_loss": -6.154448986053467, "global_step": 88169, "epoch": 2099} {"train_loss": -6.316414833068848, "global_step": 88170, "epoch": 2099} {"train_loss": -6.1170196533203125, "global_step": 88171, "epoch": 2099} {"train_loss": -6.255997657775879, "global_step": 88172, "epoch": 2099} {"train_loss": -6.308786869049072, "global_step": 88173, "epoch": 2099} {"train_loss": -6.0902299880981445, "global_step": 88174, "epoch": 2099} {"train_loss": -6.340625762939453, "global_step": 88175, "epoch": 2099} {"train_loss": -6.242667198181152, "global_step": 88176, "epoch": 2099} {"train_loss": -6.268163681030273, "global_step": 88177, "epoch": 2099} {"train_loss": -6.108618259429932, "global_step": 88178, "epoch": 2099} {"train_loss": -6.264472961425781, "global_step": 88179, "epoch": 2099} {"train_loss": -6.16776180267334, "global_step": 88180, "epoch": 2099} {"train_loss": -6.2017412185668945, "global_step": 88181, "epoch": 2099} {"train_loss": -6.154998302459717, "global_step": 88182, "epoch": 2099} {"train_loss": -6.240224838256836, "global_step": 88183, "epoch": 2099} {"train_loss": -6.216197967529297, "global_step": 88184, "epoch": 2099} {"train_loss": -6.248777389526367, "global_step": 88185, "epoch": 2099} {"train_loss": -6.24833869934082, "global_step": 88186, "epoch": 2099} {"train_loss": -6.283613681793213, "global_step": 88187, "epoch": 2099} {"train_loss": -6.256187915802002, "global_step": 88188, "epoch": 2099} {"train_loss": -6.081670761108398, "global_step": 88189, "epoch": 2099} {"train_loss": -6.267999172210693, "global_step": 88190, "epoch": 2099} {"train_loss": -6.343900203704834, "global_step": 88191, "epoch": 2099} {"train_loss": -6.248620986938477, "global_step": 88192, "epoch": 2099} {"train_loss": -6.294319152832031, "global_step": 88193, "epoch": 2099} {"train_loss": -6.197915554046631, "global_step": 88194, "epoch": 2099} {"train_loss": -6.172780513763428, "global_step": 88195, "epoch": 2099} {"train_loss": -6.147274971008301, "global_step": 88196, "epoch": 2099} {"train_loss": -6.201437950134277, "global_step": 88197, "epoch": 2099} {"train_loss": -6.3023681640625, "global_step": 88198, "epoch": 2099} {"train_loss": -6.222424177896409, "global_step": 88199, "epoch": 2099, "val_loss": 75148.640625} {"train_loss": -6.280043125152588, "global_step": 88200, "epoch": 2100} {"train_loss": -6.212589263916016, "global_step": 88201, "epoch": 2100} {"train_loss": -6.3115715980529785, "global_step": 88202, "epoch": 2100} {"train_loss": -6.229659557342529, "global_step": 88203, "epoch": 2100} {"train_loss": -6.379036903381348, "global_step": 88204, "epoch": 2100} {"train_loss": -6.222552299499512, "global_step": 88205, "epoch": 2100} {"train_loss": -6.19534969329834, "global_step": 88206, "epoch": 2100} {"train_loss": -6.206007957458496, "global_step": 88207, "epoch": 2100} {"train_loss": -6.163741111755371, "global_step": 88208, "epoch": 2100} {"train_loss": -6.2508225440979, "global_step": 88209, "epoch": 2100} {"train_loss": -6.246722221374512, "global_step": 88210, "epoch": 2100} {"train_loss": -6.183734893798828, "global_step": 88211, "epoch": 2100} {"train_loss": -6.230727195739746, "global_step": 88212, "epoch": 2100} {"train_loss": -6.3109660148620605, "global_step": 88213, "epoch": 2100} {"train_loss": -6.273843765258789, "global_step": 88214, "epoch": 2100} {"train_loss": -6.170456886291504, "global_step": 88215, "epoch": 2100} {"train_loss": -6.283941268920898, "global_step": 88216, "epoch": 2100} {"train_loss": -6.248799800872803, "global_step": 88217, "epoch": 2100} {"train_loss": -6.199639320373535, "global_step": 88218, "epoch": 2100} {"train_loss": -6.158420562744141, "global_step": 88219, "epoch": 2100} {"train_loss": -6.306832313537598, "global_step": 88220, "epoch": 2100} {"train_loss": -6.153653144836426, "global_step": 88221, "epoch": 2100} {"train_loss": -6.297532558441162, "global_step": 88222, "epoch": 2100} {"train_loss": -6.321926593780518, "global_step": 88223, "epoch": 2100} {"train_loss": -6.270245552062988, "global_step": 88224, "epoch": 2100} {"train_loss": -6.252492904663086, "global_step": 88225, "epoch": 2100} {"train_loss": -6.296927452087402, "global_step": 88226, "epoch": 2100} {"train_loss": -6.141435623168945, "global_step": 88227, "epoch": 2100} {"train_loss": -6.230868339538574, "global_step": 88228, "epoch": 2100} {"train_loss": -6.154542446136475, "global_step": 88229, "epoch": 2100} {"train_loss": -6.211923599243164, "global_step": 88230, "epoch": 2100} {"train_loss": -6.196529388427734, "global_step": 88231, "epoch": 2100} {"train_loss": -6.279910087585449, "global_step": 88232, "epoch": 2100} {"train_loss": -6.288045883178711, "global_step": 88233, "epoch": 2100} {"train_loss": -6.185019493103027, "global_step": 88234, "epoch": 2100} {"train_loss": -6.216538429260254, "global_step": 88235, "epoch": 2100} {"train_loss": -6.223379135131836, "global_step": 88236, "epoch": 2100} {"train_loss": -6.210104465484619, "global_step": 88237, "epoch": 2100} {"train_loss": -6.187919616699219, "global_step": 88238, "epoch": 2100} {"train_loss": -6.189302444458008, "global_step": 88239, "epoch": 2100} {"train_loss": -6.297591209411621, "global_step": 88240, "epoch": 2100} {"train_loss": -6.234243358884539, "global_step": 88241, "epoch": 2100, "train/sim_max_reward_0": 0.9788336964564671, "train/sim_max_reward_1": 0.9211018894846951, "train/sim_max_reward_2": 0.3446031518573926, "train/sim_max_reward_3": 0.17148870869512256, "train/sim_max_reward_4": 0.7840427244368371, "train/sim_max_reward_5": 0.7850108205625359, "test/sim_max_reward_4500000": 0.46994802274595004, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8999434146124325, "test/sim_max_reward_4500003": 0.9843697161024155, "test/sim_max_reward_4500004": 0.6863753157860157, "test/sim_max_reward_4500005": 0.8269667693026646, "test/sim_max_reward_4500006": 0.9985865808105009, "test/sim_max_reward_4500007": 0.8863132038146083, "test/sim_max_reward_4500008": 0.9789012744717902, "test/sim_max_reward_4500009": 0.9398966224682149, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.883010349350077, "test/sim_max_reward_4500012": 0.936780222109371, "test/sim_max_reward_4500013": 0.014619352810507488, "test/sim_max_reward_4500014": 0.4635791365479204, "test/sim_max_reward_4500015": 0.6281371262013864, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.036842596073563126, "test/sim_max_reward_4500018": 0.8273871878282969, "test/sim_max_reward_4500019": 0.9011335079005837, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8072527901200262, "test/sim_max_reward_4500022": 0.9751376038858974, "test/sim_max_reward_4500023": 0.9990416606876895, "test/sim_max_reward_4500024": 0.9651067429655383, "test/sim_max_reward_4500025": 0.5057073741684802, "test/sim_max_reward_4500026": 0.9546672602718064, "test/sim_max_reward_4500027": 0.9232451357830543, "test/sim_max_reward_4500028": 0.21811988790204176, "test/sim_max_reward_4500029": 0.08415772814752749, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.2086672730435356, "test/sim_max_reward_4500033": 0.9595170044849816, "test/sim_max_reward_4500034": 0.8282029997938154, "test/sim_max_reward_4500035": 0.9018872975952705, "test/sim_max_reward_4500036": 0.3923560683152688, "test/sim_max_reward_4500037": 0.7580228423455225, "test/sim_max_reward_4500038": 0.6768400742376138, "test/sim_max_reward_4500039": 0.8857806790246858, "test/sim_max_reward_4500040": 0.9683566025703294, "test/sim_max_reward_4500041": 0.9335521043509698, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.06814234302634363, "test/sim_max_reward_4500044": 0.30323673126960865, "test/sim_max_reward_4500045": 0.9360513852741232, "test/sim_max_reward_4500046": 0.846726730099092, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.06405224406467919, "train/mean_score": 0.6641801652488417, "test/mean_score": 0.6108832624085757, "val_loss": 75319.6484375} {"train_loss": -6.2759480476379395, "global_step": 88242, "epoch": 2101} {"train_loss": -6.242691516876221, "global_step": 88243, "epoch": 2101} {"train_loss": -6.287370681762695, "global_step": 88244, "epoch": 2101} {"train_loss": -6.2657575607299805, "global_step": 88245, "epoch": 2101} {"train_loss": -6.201158046722412, "global_step": 88246, "epoch": 2101} {"train_loss": -6.245491981506348, "global_step": 88247, "epoch": 2101} {"train_loss": -6.3023481369018555, "global_step": 88248, "epoch": 2101} {"train_loss": -6.220017910003662, "global_step": 88249, "epoch": 2101} {"train_loss": -6.253719806671143, "global_step": 88250, "epoch": 2101} {"train_loss": -6.370086193084717, "global_step": 88251, "epoch": 2101} {"train_loss": -6.181429862976074, "global_step": 88252, "epoch": 2101} {"train_loss": -6.2072296142578125, "global_step": 88253, "epoch": 2101} {"train_loss": -6.268984317779541, "global_step": 88254, "epoch": 2101} {"train_loss": -6.301137924194336, "global_step": 88255, "epoch": 2101} {"train_loss": -6.046843528747559, "global_step": 88256, "epoch": 2101} {"train_loss": -6.135908126831055, "global_step": 88257, "epoch": 2101} {"train_loss": -6.246020317077637, "global_step": 88258, "epoch": 2101} {"train_loss": -6.208614826202393, "global_step": 88259, "epoch": 2101} {"train_loss": -6.272231578826904, "global_step": 88260, "epoch": 2101} {"train_loss": -6.225378036499023, "global_step": 88261, "epoch": 2101} {"train_loss": -6.1771745681762695, "global_step": 88262, "epoch": 2101} {"train_loss": -6.19087553024292, "global_step": 88263, "epoch": 2101} {"train_loss": -6.329105377197266, "global_step": 88264, "epoch": 2101} {"train_loss": -6.129024505615234, "global_step": 88265, "epoch": 2101} {"train_loss": -6.269890308380127, "global_step": 88266, "epoch": 2101} {"train_loss": -6.296599388122559, "global_step": 88267, "epoch": 2101} {"train_loss": -6.2467498779296875, "global_step": 88268, "epoch": 2101} {"train_loss": -6.159605979919434, "global_step": 88269, "epoch": 2101} {"train_loss": -6.224411964416504, "global_step": 88270, "epoch": 2101} {"train_loss": -6.135807037353516, "global_step": 88271, "epoch": 2101} {"train_loss": -6.142874717712402, "global_step": 88272, "epoch": 2101} {"train_loss": -6.15605354309082, "global_step": 88273, "epoch": 2101} {"train_loss": -6.2140278816223145, "global_step": 88274, "epoch": 2101} {"train_loss": -6.2115254402160645, "global_step": 88275, "epoch": 2101} {"train_loss": -6.2949066162109375, "global_step": 88276, "epoch": 2101} {"train_loss": -6.114112854003906, "global_step": 88277, "epoch": 2101} {"train_loss": -6.267660140991211, "global_step": 88278, "epoch": 2101} {"train_loss": -6.092179298400879, "global_step": 88279, "epoch": 2101} {"train_loss": -6.318872451782227, "global_step": 88280, "epoch": 2101} {"train_loss": -6.147002220153809, "global_step": 88281, "epoch": 2101} {"train_loss": -6.171622276306152, "global_step": 88282, "epoch": 2101} {"train_loss": -6.220013754708426, "global_step": 88283, "epoch": 2101, "val_loss": 75346.6015625} {"train_loss": -6.087455749511719, "global_step": 88284, "epoch": 2102} {"train_loss": -6.189055442810059, "global_step": 88285, "epoch": 2102} {"train_loss": -6.184083938598633, "global_step": 88286, "epoch": 2102} {"train_loss": -6.229565143585205, "global_step": 88287, "epoch": 2102} {"train_loss": -6.203907489776611, "global_step": 88288, "epoch": 2102} {"train_loss": -6.277637004852295, "global_step": 88289, "epoch": 2102} {"train_loss": -6.287272930145264, "global_step": 88290, "epoch": 2102} {"train_loss": -6.168064594268799, "global_step": 88291, "epoch": 2102} {"train_loss": -6.163053512573242, "global_step": 88292, "epoch": 2102} {"train_loss": -6.265308380126953, "global_step": 88293, "epoch": 2102} {"train_loss": -6.231658935546875, "global_step": 88294, "epoch": 2102} {"train_loss": -6.098828315734863, "global_step": 88295, "epoch": 2102} {"train_loss": -6.223048210144043, "global_step": 88296, "epoch": 2102} {"train_loss": -6.201030731201172, "global_step": 88297, "epoch": 2102} {"train_loss": -6.142209053039551, "global_step": 88298, "epoch": 2102} {"train_loss": -6.150373458862305, "global_step": 88299, "epoch": 2102} {"train_loss": -6.198112487792969, "global_step": 88300, "epoch": 2102} {"train_loss": -6.273270130157471, "global_step": 88301, "epoch": 2102} {"train_loss": -6.151384353637695, "global_step": 88302, "epoch": 2102} {"train_loss": -6.260933876037598, "global_step": 88303, "epoch": 2102} {"train_loss": -6.348465919494629, "global_step": 88304, "epoch": 2102} {"train_loss": -6.208953857421875, "global_step": 88305, "epoch": 2102} {"train_loss": -6.2798004150390625, "global_step": 88306, "epoch": 2102} {"train_loss": -6.271998882293701, "global_step": 88307, "epoch": 2102} {"train_loss": -6.2818779945373535, "global_step": 88308, "epoch": 2102} {"train_loss": -6.232816696166992, "global_step": 88309, "epoch": 2102} {"train_loss": -6.184403419494629, "global_step": 88310, "epoch": 2102} {"train_loss": -6.229366302490234, "global_step": 88311, "epoch": 2102} {"train_loss": -6.228396415710449, "global_step": 88312, "epoch": 2102} {"train_loss": -6.219104766845703, "global_step": 88313, "epoch": 2102} {"train_loss": -6.348045349121094, "global_step": 88314, "epoch": 2102} {"train_loss": -6.286334037780762, "global_step": 88315, "epoch": 2102} {"train_loss": -6.19185209274292, "global_step": 88316, "epoch": 2102} {"train_loss": -6.181207656860352, "global_step": 88317, "epoch": 2102} {"train_loss": -6.196505546569824, "global_step": 88318, "epoch": 2102} {"train_loss": -6.26606559753418, "global_step": 88319, "epoch": 2102} {"train_loss": -6.319003105163574, "global_step": 88320, "epoch": 2102} {"train_loss": -6.238140106201172, "global_step": 88321, "epoch": 2102} {"train_loss": -6.277588844299316, "global_step": 88322, "epoch": 2102} {"train_loss": -6.224809169769287, "global_step": 88323, "epoch": 2102} {"train_loss": -6.128703594207764, "global_step": 88324, "epoch": 2102} {"train_loss": -6.224375679379418, "global_step": 88325, "epoch": 2102, "val_loss": 75254.7421875} {"train_loss": -6.257932662963867, "global_step": 88326, "epoch": 2103} {"train_loss": -6.358570098876953, "global_step": 88327, "epoch": 2103} {"train_loss": -6.455165863037109, "global_step": 88328, "epoch": 2103} {"train_loss": -6.228588104248047, "global_step": 88329, "epoch": 2103} {"train_loss": -6.216909408569336, "global_step": 88330, "epoch": 2103} {"train_loss": -6.278560638427734, "global_step": 88331, "epoch": 2103} {"train_loss": -6.1701202392578125, "global_step": 88332, "epoch": 2103} {"train_loss": -6.247814178466797, "global_step": 88333, "epoch": 2103} {"train_loss": -6.273159027099609, "global_step": 88334, "epoch": 2103} {"train_loss": -6.300811290740967, "global_step": 88335, "epoch": 2103} {"train_loss": -6.250881671905518, "global_step": 88336, "epoch": 2103} {"train_loss": -6.256381034851074, "global_step": 88337, "epoch": 2103} {"train_loss": -6.315041542053223, "global_step": 88338, "epoch": 2103} {"train_loss": -6.1864333152771, "global_step": 88339, "epoch": 2103} {"train_loss": -6.252345561981201, "global_step": 88340, "epoch": 2103} {"train_loss": -6.266192436218262, "global_step": 88341, "epoch": 2103} {"train_loss": -6.194602966308594, "global_step": 88342, "epoch": 2103} {"train_loss": -6.152197360992432, "global_step": 88343, "epoch": 2103} {"train_loss": -6.136753082275391, "global_step": 88344, "epoch": 2103} {"train_loss": -6.166499137878418, "global_step": 88345, "epoch": 2103} {"train_loss": -6.24377965927124, "global_step": 88346, "epoch": 2103} {"train_loss": -6.100752353668213, "global_step": 88347, "epoch": 2103} {"train_loss": -6.263529300689697, "global_step": 88348, "epoch": 2103} {"train_loss": -6.163804054260254, "global_step": 88349, "epoch": 2103} {"train_loss": -6.105344772338867, "global_step": 88350, "epoch": 2103} {"train_loss": -6.341352462768555, "global_step": 88351, "epoch": 2103} {"train_loss": -6.144078254699707, "global_step": 88352, "epoch": 2103} {"train_loss": -6.305663108825684, "global_step": 88353, "epoch": 2103} {"train_loss": -6.338620185852051, "global_step": 88354, "epoch": 2103} {"train_loss": -6.239583969116211, "global_step": 88355, "epoch": 2103} {"train_loss": -6.280702590942383, "global_step": 88356, "epoch": 2103} {"train_loss": -6.293530464172363, "global_step": 88357, "epoch": 2103} {"train_loss": -6.205580711364746, "global_step": 88358, "epoch": 2103} {"train_loss": -6.405559062957764, "global_step": 88359, "epoch": 2103} {"train_loss": -6.329565048217773, "global_step": 88360, "epoch": 2103} {"train_loss": -6.2762250900268555, "global_step": 88361, "epoch": 2103} {"train_loss": -6.214408874511719, "global_step": 88362, "epoch": 2103} {"train_loss": -6.290212631225586, "global_step": 88363, "epoch": 2103} {"train_loss": -6.299867153167725, "global_step": 88364, "epoch": 2103} {"train_loss": -6.299416542053223, "global_step": 88365, "epoch": 2103} {"train_loss": -6.285397529602051, "global_step": 88366, "epoch": 2103} {"train_loss": -6.252461535590036, "global_step": 88367, "epoch": 2103, "val_loss": 75272.765625} {"train_loss": -6.289489269256592, "global_step": 88368, "epoch": 2104} {"train_loss": -6.215260982513428, "global_step": 88369, "epoch": 2104} {"train_loss": -6.3233561515808105, "global_step": 88370, "epoch": 2104} {"train_loss": -6.2960309982299805, "global_step": 88371, "epoch": 2104} {"train_loss": -6.244162559509277, "global_step": 88372, "epoch": 2104} {"train_loss": -6.3572797775268555, "global_step": 88373, "epoch": 2104} {"train_loss": -6.078193664550781, "global_step": 88374, "epoch": 2104} {"train_loss": -6.175322532653809, "global_step": 88375, "epoch": 2104} {"train_loss": -6.267012596130371, "global_step": 88376, "epoch": 2104} {"train_loss": -6.182891845703125, "global_step": 88377, "epoch": 2104} {"train_loss": -6.220037460327148, "global_step": 88378, "epoch": 2104} {"train_loss": -6.259978294372559, "global_step": 88379, "epoch": 2104} {"train_loss": -6.275784015655518, "global_step": 88380, "epoch": 2104} {"train_loss": -6.2227325439453125, "global_step": 88381, "epoch": 2104} {"train_loss": -6.379950046539307, "global_step": 88382, "epoch": 2104} {"train_loss": -6.193693161010742, "global_step": 88383, "epoch": 2104} {"train_loss": -6.293493747711182, "global_step": 88384, "epoch": 2104} {"train_loss": -6.2069478034973145, "global_step": 88385, "epoch": 2104} {"train_loss": -6.302854537963867, "global_step": 88386, "epoch": 2104} {"train_loss": -6.204402446746826, "global_step": 88387, "epoch": 2104} {"train_loss": -6.289114952087402, "global_step": 88388, "epoch": 2104} {"train_loss": -6.353430271148682, "global_step": 88389, "epoch": 2104} {"train_loss": -6.217104911804199, "global_step": 88390, "epoch": 2104} {"train_loss": -6.197394371032715, "global_step": 88391, "epoch": 2104} {"train_loss": -6.252498626708984, "global_step": 88392, "epoch": 2104} {"train_loss": -6.1967878341674805, "global_step": 88393, "epoch": 2104} {"train_loss": -6.15041446685791, "global_step": 88394, "epoch": 2104} {"train_loss": -6.144308090209961, "global_step": 88395, "epoch": 2104} {"train_loss": -6.216320514678955, "global_step": 88396, "epoch": 2104} {"train_loss": -6.243267059326172, "global_step": 88397, "epoch": 2104} {"train_loss": -6.325259208679199, "global_step": 88398, "epoch": 2104} {"train_loss": -6.247530937194824, "global_step": 88399, "epoch": 2104} {"train_loss": -6.206116199493408, "global_step": 88400, "epoch": 2104} {"train_loss": -6.256317615509033, "global_step": 88401, "epoch": 2104} {"train_loss": -6.225939750671387, "global_step": 88402, "epoch": 2104} {"train_loss": -6.250502109527588, "global_step": 88403, "epoch": 2104} {"train_loss": -6.332149982452393, "global_step": 88404, "epoch": 2104} {"train_loss": -6.199995040893555, "global_step": 88405, "epoch": 2104} {"train_loss": -6.15555477142334, "global_step": 88406, "epoch": 2104} {"train_loss": -6.322032928466797, "global_step": 88407, "epoch": 2104} {"train_loss": -6.270333290100098, "global_step": 88408, "epoch": 2104} {"train_loss": -6.244433947971889, "global_step": 88409, "epoch": 2104, "val_loss": 75424.140625} {"train_loss": -6.29313325881958, "global_step": 88410, "epoch": 2105} {"train_loss": -6.310532569885254, "global_step": 88411, "epoch": 2105} {"train_loss": -6.287630081176758, "global_step": 88412, "epoch": 2105} {"train_loss": -6.299682140350342, "global_step": 88413, "epoch": 2105} {"train_loss": -6.172740936279297, "global_step": 88414, "epoch": 2105} {"train_loss": -6.236428260803223, "global_step": 88415, "epoch": 2105} {"train_loss": -6.286684036254883, "global_step": 88416, "epoch": 2105} {"train_loss": -6.228538513183594, "global_step": 88417, "epoch": 2105} {"train_loss": -6.299496650695801, "global_step": 88418, "epoch": 2105} {"train_loss": -6.341299533843994, "global_step": 88419, "epoch": 2105} {"train_loss": -6.190366268157959, "global_step": 88420, "epoch": 2105} {"train_loss": -6.271306991577148, "global_step": 88421, "epoch": 2105} {"train_loss": -6.234257221221924, "global_step": 88422, "epoch": 2105} {"train_loss": -6.261702060699463, "global_step": 88423, "epoch": 2105} {"train_loss": -6.31156063079834, "global_step": 88424, "epoch": 2105} {"train_loss": -6.235010147094727, "global_step": 88425, "epoch": 2105} {"train_loss": -6.256915092468262, "global_step": 88426, "epoch": 2105} {"train_loss": -6.1932268142700195, "global_step": 88427, "epoch": 2105} {"train_loss": -6.293880939483643, "global_step": 88428, "epoch": 2105} {"train_loss": -6.286980628967285, "global_step": 88429, "epoch": 2105} {"train_loss": -6.134096622467041, "global_step": 88430, "epoch": 2105} {"train_loss": -6.261143684387207, "global_step": 88431, "epoch": 2105} {"train_loss": -6.245391845703125, "global_step": 88432, "epoch": 2105} {"train_loss": -6.2457380294799805, "global_step": 88433, "epoch": 2105} {"train_loss": -6.1663408279418945, "global_step": 88434, "epoch": 2105} {"train_loss": -6.240550994873047, "global_step": 88435, "epoch": 2105} {"train_loss": -6.14843225479126, "global_step": 88436, "epoch": 2105} {"train_loss": -6.184501647949219, "global_step": 88437, "epoch": 2105} {"train_loss": -6.250587463378906, "global_step": 88438, "epoch": 2105} {"train_loss": -6.215124607086182, "global_step": 88439, "epoch": 2105} {"train_loss": -6.228616237640381, "global_step": 88440, "epoch": 2105} {"train_loss": -6.226052761077881, "global_step": 88441, "epoch": 2105} {"train_loss": -6.188150405883789, "global_step": 88442, "epoch": 2105} {"train_loss": -6.1109161376953125, "global_step": 88443, "epoch": 2105} {"train_loss": -6.246088981628418, "global_step": 88444, "epoch": 2105} {"train_loss": -6.1495466232299805, "global_step": 88445, "epoch": 2105} {"train_loss": -6.074978828430176, "global_step": 88446, "epoch": 2105} {"train_loss": -6.274921417236328, "global_step": 88447, "epoch": 2105} {"train_loss": -6.261381149291992, "global_step": 88448, "epoch": 2105} {"train_loss": -6.1153693199157715, "global_step": 88449, "epoch": 2105} {"train_loss": -6.130786895751953, "global_step": 88450, "epoch": 2105} {"train_loss": -6.228129262015933, "global_step": 88451, "epoch": 2105, "val_loss": 75166.1328125} {"train_loss": -6.104595184326172, "global_step": 88452, "epoch": 2106} {"train_loss": -6.187267780303955, "global_step": 88453, "epoch": 2106} {"train_loss": -6.12030553817749, "global_step": 88454, "epoch": 2106} {"train_loss": -6.139378547668457, "global_step": 88455, "epoch": 2106} {"train_loss": -6.277926445007324, "global_step": 88456, "epoch": 2106} {"train_loss": -6.101954936981201, "global_step": 88457, "epoch": 2106} {"train_loss": -6.077554702758789, "global_step": 88458, "epoch": 2106} {"train_loss": -6.218362808227539, "global_step": 88459, "epoch": 2106} {"train_loss": -6.339029312133789, "global_step": 88460, "epoch": 2106} {"train_loss": -6.139017105102539, "global_step": 88461, "epoch": 2106} {"train_loss": -6.03635311126709, "global_step": 88462, "epoch": 2106} {"train_loss": -6.144577980041504, "global_step": 88463, "epoch": 2106} {"train_loss": -6.144586563110352, "global_step": 88464, "epoch": 2106} {"train_loss": -6.08402156829834, "global_step": 88465, "epoch": 2106} {"train_loss": -6.180080890655518, "global_step": 88466, "epoch": 2106} {"train_loss": -6.110445499420166, "global_step": 88467, "epoch": 2106} {"train_loss": -6.062831878662109, "global_step": 88468, "epoch": 2106} {"train_loss": -6.2314372062683105, "global_step": 88469, "epoch": 2106} {"train_loss": -6.167015075683594, "global_step": 88470, "epoch": 2106} {"train_loss": -6.299877166748047, "global_step": 88471, "epoch": 2106} {"train_loss": -6.168074607849121, "global_step": 88472, "epoch": 2106} {"train_loss": -6.139279365539551, "global_step": 88473, "epoch": 2106} {"train_loss": -6.296504020690918, "global_step": 88474, "epoch": 2106} {"train_loss": -6.250774383544922, "global_step": 88475, "epoch": 2106} {"train_loss": -6.130043029785156, "global_step": 88476, "epoch": 2106} {"train_loss": -6.316657543182373, "global_step": 88477, "epoch": 2106} {"train_loss": -6.352568626403809, "global_step": 88478, "epoch": 2106} {"train_loss": -6.1485490798950195, "global_step": 88479, "epoch": 2106} {"train_loss": -6.219365119934082, "global_step": 88480, "epoch": 2106} {"train_loss": -6.254586219787598, "global_step": 88481, "epoch": 2106} {"train_loss": -6.210577964782715, "global_step": 88482, "epoch": 2106} {"train_loss": -6.173258304595947, "global_step": 88483, "epoch": 2106} {"train_loss": -6.108593940734863, "global_step": 88484, "epoch": 2106} {"train_loss": -6.217428207397461, "global_step": 88485, "epoch": 2106} {"train_loss": -6.199878692626953, "global_step": 88486, "epoch": 2106} {"train_loss": -6.174125671386719, "global_step": 88487, "epoch": 2106} {"train_loss": -6.182799339294434, "global_step": 88488, "epoch": 2106} {"train_loss": -6.298704147338867, "global_step": 88489, "epoch": 2106} {"train_loss": -6.256261348724365, "global_step": 88490, "epoch": 2106} {"train_loss": -6.115267753601074, "global_step": 88491, "epoch": 2106} {"train_loss": -6.204200744628906, "global_step": 88492, "epoch": 2106} {"train_loss": -6.185580196834746, "global_step": 88493, "epoch": 2106, "val_loss": 75190.546875} {"train_loss": -6.263643264770508, "global_step": 88494, "epoch": 2107} {"train_loss": -6.362581729888916, "global_step": 88495, "epoch": 2107} {"train_loss": -6.260222911834717, "global_step": 88496, "epoch": 2107} {"train_loss": -6.142576217651367, "global_step": 88497, "epoch": 2107} {"train_loss": -6.147481918334961, "global_step": 88498, "epoch": 2107} {"train_loss": -6.107841491699219, "global_step": 88499, "epoch": 2107} {"train_loss": -6.2863383293151855, "global_step": 88500, "epoch": 2107} {"train_loss": -6.174990177154541, "global_step": 88501, "epoch": 2107} {"train_loss": -6.199857711791992, "global_step": 88502, "epoch": 2107} {"train_loss": -6.256528854370117, "global_step": 88503, "epoch": 2107} {"train_loss": -6.151798248291016, "global_step": 88504, "epoch": 2107} {"train_loss": -6.226975440979004, "global_step": 88505, "epoch": 2107} {"train_loss": -6.15761661529541, "global_step": 88506, "epoch": 2107} {"train_loss": -6.212754726409912, "global_step": 88507, "epoch": 2107} {"train_loss": -6.224724769592285, "global_step": 88508, "epoch": 2107} {"train_loss": -6.122937202453613, "global_step": 88509, "epoch": 2107} {"train_loss": -6.202897071838379, "global_step": 88510, "epoch": 2107} {"train_loss": -6.173821449279785, "global_step": 88511, "epoch": 2107} {"train_loss": -6.203063488006592, "global_step": 88512, "epoch": 2107} {"train_loss": -6.166118144989014, "global_step": 88513, "epoch": 2107} {"train_loss": -6.2088189125061035, "global_step": 88514, "epoch": 2107} {"train_loss": -6.235827445983887, "global_step": 88515, "epoch": 2107} {"train_loss": -6.166881084442139, "global_step": 88516, "epoch": 2107} {"train_loss": -6.319077014923096, "global_step": 88517, "epoch": 2107} {"train_loss": -6.295167922973633, "global_step": 88518, "epoch": 2107} {"train_loss": -6.174026966094971, "global_step": 88519, "epoch": 2107} {"train_loss": -6.22554349899292, "global_step": 88520, "epoch": 2107} {"train_loss": -6.127399444580078, "global_step": 88521, "epoch": 2107} {"train_loss": -6.144962787628174, "global_step": 88522, "epoch": 2107} {"train_loss": -6.277219772338867, "global_step": 88523, "epoch": 2107} {"train_loss": -6.109993934631348, "global_step": 88524, "epoch": 2107} {"train_loss": -6.247115135192871, "global_step": 88525, "epoch": 2107} {"train_loss": -6.222485542297363, "global_step": 88526, "epoch": 2107} {"train_loss": -6.12614107131958, "global_step": 88527, "epoch": 2107} {"train_loss": -6.2220377922058105, "global_step": 88528, "epoch": 2107} {"train_loss": -6.204285144805908, "global_step": 88529, "epoch": 2107} {"train_loss": -6.2048187255859375, "global_step": 88530, "epoch": 2107} {"train_loss": -6.284722328186035, "global_step": 88531, "epoch": 2107} {"train_loss": -6.217888832092285, "global_step": 88532, "epoch": 2107} {"train_loss": -6.028652191162109, "global_step": 88533, "epoch": 2107} {"train_loss": -6.298713684082031, "global_step": 88534, "epoch": 2107} {"train_loss": -6.204450391587757, "global_step": 88535, "epoch": 2107, "val_loss": 75314.4609375} {"train_loss": -6.194762706756592, "global_step": 88536, "epoch": 2108} {"train_loss": -6.274410247802734, "global_step": 88537, "epoch": 2108} {"train_loss": -6.426479339599609, "global_step": 88538, "epoch": 2108} {"train_loss": -6.1746015548706055, "global_step": 88539, "epoch": 2108} {"train_loss": -6.167666435241699, "global_step": 88540, "epoch": 2108} {"train_loss": -6.133092403411865, "global_step": 88541, "epoch": 2108} {"train_loss": -6.178311347961426, "global_step": 88542, "epoch": 2108} {"train_loss": -6.143436908721924, "global_step": 88543, "epoch": 2108} {"train_loss": -6.290559768676758, "global_step": 88544, "epoch": 2108} {"train_loss": -6.253201007843018, "global_step": 88545, "epoch": 2108} {"train_loss": -6.106653690338135, "global_step": 88546, "epoch": 2108} {"train_loss": -6.268848896026611, "global_step": 88547, "epoch": 2108} {"train_loss": -6.088408470153809, "global_step": 88548, "epoch": 2108} {"train_loss": -6.11314582824707, "global_step": 88549, "epoch": 2108} {"train_loss": -6.18949031829834, "global_step": 88550, "epoch": 2108} {"train_loss": -6.180281162261963, "global_step": 88551, "epoch": 2108} {"train_loss": -6.190194606781006, "global_step": 88552, "epoch": 2108} {"train_loss": -6.2371907234191895, "global_step": 88553, "epoch": 2108} {"train_loss": -6.25364875793457, "global_step": 88554, "epoch": 2108} {"train_loss": -6.332592010498047, "global_step": 88555, "epoch": 2108} {"train_loss": -6.186763763427734, "global_step": 88556, "epoch": 2108} {"train_loss": -6.2197675704956055, "global_step": 88557, "epoch": 2108} {"train_loss": -6.248233795166016, "global_step": 88558, "epoch": 2108} {"train_loss": -6.09561824798584, "global_step": 88559, "epoch": 2108} {"train_loss": -6.0154314041137695, "global_step": 88560, "epoch": 2108} {"train_loss": -6.198853492736816, "global_step": 88561, "epoch": 2108} {"train_loss": -6.32890510559082, "global_step": 88562, "epoch": 2108} {"train_loss": -6.189526557922363, "global_step": 88563, "epoch": 2108} {"train_loss": -6.1570892333984375, "global_step": 88564, "epoch": 2108} {"train_loss": -6.227528095245361, "global_step": 88565, "epoch": 2108} {"train_loss": -6.280525207519531, "global_step": 88566, "epoch": 2108} {"train_loss": -6.260002136230469, "global_step": 88567, "epoch": 2108} {"train_loss": -6.203161239624023, "global_step": 88568, "epoch": 2108} {"train_loss": -6.146732330322266, "global_step": 88569, "epoch": 2108} {"train_loss": -6.236777305603027, "global_step": 88570, "epoch": 2108} {"train_loss": -6.3048095703125, "global_step": 88571, "epoch": 2108} {"train_loss": -6.130072593688965, "global_step": 88572, "epoch": 2108} {"train_loss": -6.238731384277344, "global_step": 88573, "epoch": 2108} {"train_loss": -6.1921281814575195, "global_step": 88574, "epoch": 2108} {"train_loss": -6.224915504455566, "global_step": 88575, "epoch": 2108} {"train_loss": -6.220389366149902, "global_step": 88576, "epoch": 2108} {"train_loss": -6.20636180468968, "global_step": 88577, "epoch": 2108, "val_loss": 75418.3984375} {"train_loss": -6.352262496948242, "global_step": 88578, "epoch": 2109} {"train_loss": -6.137758255004883, "global_step": 88579, "epoch": 2109} {"train_loss": -6.303681373596191, "global_step": 88580, "epoch": 2109} {"train_loss": -6.2698140144348145, "global_step": 88581, "epoch": 2109} {"train_loss": -6.211017608642578, "global_step": 88582, "epoch": 2109} {"train_loss": -6.238691329956055, "global_step": 88583, "epoch": 2109} {"train_loss": -6.260759353637695, "global_step": 88584, "epoch": 2109} {"train_loss": -6.2234673500061035, "global_step": 88585, "epoch": 2109} {"train_loss": -6.26081657409668, "global_step": 88586, "epoch": 2109} {"train_loss": -6.293592929840088, "global_step": 88587, "epoch": 2109} {"train_loss": -6.2817792892456055, "global_step": 88588, "epoch": 2109} {"train_loss": -6.079780578613281, "global_step": 88589, "epoch": 2109} {"train_loss": -6.257865905761719, "global_step": 88590, "epoch": 2109} {"train_loss": -6.142572402954102, "global_step": 88591, "epoch": 2109} {"train_loss": -6.206420421600342, "global_step": 88592, "epoch": 2109} {"train_loss": -6.295575141906738, "global_step": 88593, "epoch": 2109} {"train_loss": -6.270499229431152, "global_step": 88594, "epoch": 2109} {"train_loss": -6.29127311706543, "global_step": 88595, "epoch": 2109} {"train_loss": -6.253671646118164, "global_step": 88596, "epoch": 2109} {"train_loss": -6.365663528442383, "global_step": 88597, "epoch": 2109} {"train_loss": -6.321051120758057, "global_step": 88598, "epoch": 2109} {"train_loss": -6.214056015014648, "global_step": 88599, "epoch": 2109} {"train_loss": -6.237037658691406, "global_step": 88600, "epoch": 2109} {"train_loss": -6.246017932891846, "global_step": 88601, "epoch": 2109} {"train_loss": -6.288381099700928, "global_step": 88602, "epoch": 2109} {"train_loss": -6.299073696136475, "global_step": 88603, "epoch": 2109} {"train_loss": -6.22499418258667, "global_step": 88604, "epoch": 2109} {"train_loss": -6.163693428039551, "global_step": 88605, "epoch": 2109} {"train_loss": -6.164126396179199, "global_step": 88606, "epoch": 2109} {"train_loss": -6.206451892852783, "global_step": 88607, "epoch": 2109} {"train_loss": -6.170479774475098, "global_step": 88608, "epoch": 2109} {"train_loss": -6.369519233703613, "global_step": 88609, "epoch": 2109} {"train_loss": -6.157834053039551, "global_step": 88610, "epoch": 2109} {"train_loss": -6.19807243347168, "global_step": 88611, "epoch": 2109} {"train_loss": -6.246757507324219, "global_step": 88612, "epoch": 2109} {"train_loss": -6.213923454284668, "global_step": 88613, "epoch": 2109} {"train_loss": -6.3115410804748535, "global_step": 88614, "epoch": 2109} {"train_loss": -6.3271026611328125, "global_step": 88615, "epoch": 2109} {"train_loss": -6.257450103759766, "global_step": 88616, "epoch": 2109} {"train_loss": -6.251132965087891, "global_step": 88617, "epoch": 2109} {"train_loss": -6.339073181152344, "global_step": 88618, "epoch": 2109} {"train_loss": -6.247916085379464, "global_step": 88619, "epoch": 2109, "val_loss": 75010.28125} {"train_loss": -6.309744358062744, "global_step": 88620, "epoch": 2110} {"train_loss": -6.285116195678711, "global_step": 88621, "epoch": 2110} {"train_loss": -6.283294677734375, "global_step": 88622, "epoch": 2110} {"train_loss": -6.22283411026001, "global_step": 88623, "epoch": 2110} {"train_loss": -6.294384956359863, "global_step": 88624, "epoch": 2110} {"train_loss": -6.276820659637451, "global_step": 88625, "epoch": 2110} {"train_loss": -6.277892112731934, "global_step": 88626, "epoch": 2110} {"train_loss": -6.338979721069336, "global_step": 88627, "epoch": 2110} {"train_loss": -6.187369346618652, "global_step": 88628, "epoch": 2110} {"train_loss": -6.202258110046387, "global_step": 88629, "epoch": 2110} {"train_loss": -6.228909015655518, "global_step": 88630, "epoch": 2110} {"train_loss": -6.259037971496582, "global_step": 88631, "epoch": 2110} {"train_loss": -6.245807647705078, "global_step": 88632, "epoch": 2110} {"train_loss": -6.140007019042969, "global_step": 88633, "epoch": 2110} {"train_loss": -6.294806480407715, "global_step": 88634, "epoch": 2110} {"train_loss": -6.249454498291016, "global_step": 88635, "epoch": 2110} {"train_loss": -6.1258544921875, "global_step": 88636, "epoch": 2110} {"train_loss": -6.168006420135498, "global_step": 88637, "epoch": 2110} {"train_loss": -6.160346984863281, "global_step": 88638, "epoch": 2110} {"train_loss": -6.178291320800781, "global_step": 88639, "epoch": 2110} {"train_loss": -6.2304582595825195, "global_step": 88640, "epoch": 2110} {"train_loss": -6.255190849304199, "global_step": 88641, "epoch": 2110} {"train_loss": -6.13655424118042, "global_step": 88642, "epoch": 2110} {"train_loss": -6.199907302856445, "global_step": 88643, "epoch": 2110} {"train_loss": -6.070948123931885, "global_step": 88644, "epoch": 2110} {"train_loss": -6.229709148406982, "global_step": 88645, "epoch": 2110} {"train_loss": -6.38847541809082, "global_step": 88646, "epoch": 2110} {"train_loss": -6.126350402832031, "global_step": 88647, "epoch": 2110} {"train_loss": -6.239983081817627, "global_step": 88648, "epoch": 2110} {"train_loss": -6.21420955657959, "global_step": 88649, "epoch": 2110} {"train_loss": -6.193525314331055, "global_step": 88650, "epoch": 2110} {"train_loss": -6.211647033691406, "global_step": 88651, "epoch": 2110} {"train_loss": -6.216187477111816, "global_step": 88652, "epoch": 2110} {"train_loss": -6.178908348083496, "global_step": 88653, "epoch": 2110} {"train_loss": -6.172043800354004, "global_step": 88654, "epoch": 2110} {"train_loss": -6.244353294372559, "global_step": 88655, "epoch": 2110} {"train_loss": -6.192208290100098, "global_step": 88656, "epoch": 2110} {"train_loss": -6.20328950881958, "global_step": 88657, "epoch": 2110} {"train_loss": -6.122212886810303, "global_step": 88658, "epoch": 2110} {"train_loss": -6.09855842590332, "global_step": 88659, "epoch": 2110} {"train_loss": -6.211842060089111, "global_step": 88660, "epoch": 2110} {"train_loss": -6.2203185104188465, "global_step": 88661, "epoch": 2110, "val_loss": 75351.140625} {"train_loss": -6.266561508178711, "global_step": 88662, "epoch": 2111} {"train_loss": -6.396872043609619, "global_step": 88663, "epoch": 2111} {"train_loss": -6.186420440673828, "global_step": 88664, "epoch": 2111} {"train_loss": -6.099292755126953, "global_step": 88665, "epoch": 2111} {"train_loss": -6.246387481689453, "global_step": 88666, "epoch": 2111} {"train_loss": -6.169290542602539, "global_step": 88667, "epoch": 2111} {"train_loss": -6.266160488128662, "global_step": 88668, "epoch": 2111} {"train_loss": -6.278387069702148, "global_step": 88669, "epoch": 2111} {"train_loss": -6.137942314147949, "global_step": 88670, "epoch": 2111} {"train_loss": -6.106912136077881, "global_step": 88671, "epoch": 2111} {"train_loss": -6.241582870483398, "global_step": 88672, "epoch": 2111} {"train_loss": -6.272403717041016, "global_step": 88673, "epoch": 2111} {"train_loss": -6.258172035217285, "global_step": 88674, "epoch": 2111} {"train_loss": -6.285964012145996, "global_step": 88675, "epoch": 2111} {"train_loss": -6.236255645751953, "global_step": 88676, "epoch": 2111} {"train_loss": -6.361937522888184, "global_step": 88677, "epoch": 2111} {"train_loss": -6.333674430847168, "global_step": 88678, "epoch": 2111} {"train_loss": -6.2636284828186035, "global_step": 88679, "epoch": 2111} {"train_loss": -6.248260974884033, "global_step": 88680, "epoch": 2111} {"train_loss": -6.212794303894043, "global_step": 88681, "epoch": 2111} {"train_loss": -6.227583885192871, "global_step": 88682, "epoch": 2111} {"train_loss": -6.168137550354004, "global_step": 88683, "epoch": 2111} {"train_loss": -6.239809036254883, "global_step": 88684, "epoch": 2111} {"train_loss": -6.252378940582275, "global_step": 88685, "epoch": 2111} {"train_loss": -6.286713123321533, "global_step": 88686, "epoch": 2111} {"train_loss": -6.354361534118652, "global_step": 88687, "epoch": 2111} {"train_loss": -6.269964694976807, "global_step": 88688, "epoch": 2111} {"train_loss": -6.139183044433594, "global_step": 88689, "epoch": 2111} {"train_loss": -6.294494152069092, "global_step": 88690, "epoch": 2111} {"train_loss": -6.290538787841797, "global_step": 88691, "epoch": 2111} {"train_loss": -6.146297454833984, "global_step": 88692, "epoch": 2111} {"train_loss": -6.144280910491943, "global_step": 88693, "epoch": 2111} {"train_loss": -6.208528518676758, "global_step": 88694, "epoch": 2111} {"train_loss": -6.264475345611572, "global_step": 88695, "epoch": 2111} {"train_loss": -6.201691627502441, "global_step": 88696, "epoch": 2111} {"train_loss": -6.190126419067383, "global_step": 88697, "epoch": 2111} {"train_loss": -6.2369160652160645, "global_step": 88698, "epoch": 2111} {"train_loss": -6.1701531410217285, "global_step": 88699, "epoch": 2111} {"train_loss": -6.24139928817749, "global_step": 88700, "epoch": 2111} {"train_loss": -6.242217540740967, "global_step": 88701, "epoch": 2111} {"train_loss": -6.2483673095703125, "global_step": 88702, "epoch": 2111} {"train_loss": -6.236113094148182, "global_step": 88703, "epoch": 2111, "val_loss": 75450.3359375} {"train_loss": -6.191549301147461, "global_step": 88704, "epoch": 2112} {"train_loss": -6.2037811279296875, "global_step": 88705, "epoch": 2112} {"train_loss": -6.385610580444336, "global_step": 88706, "epoch": 2112} {"train_loss": -6.1612868309021, "global_step": 88707, "epoch": 2112} {"train_loss": -6.2835187911987305, "global_step": 88708, "epoch": 2112} {"train_loss": -6.3087310791015625, "global_step": 88709, "epoch": 2112} {"train_loss": -6.265026092529297, "global_step": 88710, "epoch": 2112} {"train_loss": -6.2632317543029785, "global_step": 88711, "epoch": 2112} {"train_loss": -6.333189010620117, "global_step": 88712, "epoch": 2112} {"train_loss": -6.346382141113281, "global_step": 88713, "epoch": 2112} {"train_loss": -6.204563617706299, "global_step": 88714, "epoch": 2112} {"train_loss": -6.21669864654541, "global_step": 88715, "epoch": 2112} {"train_loss": -6.215432167053223, "global_step": 88716, "epoch": 2112} {"train_loss": -6.355350017547607, "global_step": 88717, "epoch": 2112} {"train_loss": -6.122330665588379, "global_step": 88718, "epoch": 2112} {"train_loss": -6.121372699737549, "global_step": 88719, "epoch": 2112} {"train_loss": -6.235986709594727, "global_step": 88720, "epoch": 2112} {"train_loss": -6.07182502746582, "global_step": 88721, "epoch": 2112} {"train_loss": -5.987333297729492, "global_step": 88722, "epoch": 2112} {"train_loss": -6.237833023071289, "global_step": 88723, "epoch": 2112} {"train_loss": -5.997803688049316, "global_step": 88724, "epoch": 2112} {"train_loss": -5.965175628662109, "global_step": 88725, "epoch": 2112} {"train_loss": -6.253172397613525, "global_step": 88726, "epoch": 2112} {"train_loss": -6.04587459564209, "global_step": 88727, "epoch": 2112} {"train_loss": -6.087187767028809, "global_step": 88728, "epoch": 2112} {"train_loss": -6.083471298217773, "global_step": 88729, "epoch": 2112} {"train_loss": -6.1494903564453125, "global_step": 88730, "epoch": 2112} {"train_loss": -6.135069847106934, "global_step": 88731, "epoch": 2112} {"train_loss": -6.196868896484375, "global_step": 88732, "epoch": 2112} {"train_loss": -6.204929828643799, "global_step": 88733, "epoch": 2112} {"train_loss": -6.206570625305176, "global_step": 88734, "epoch": 2112} {"train_loss": -6.152565956115723, "global_step": 88735, "epoch": 2112} {"train_loss": -6.1859130859375, "global_step": 88736, "epoch": 2112} {"train_loss": -6.195852279663086, "global_step": 88737, "epoch": 2112} {"train_loss": -6.188607215881348, "global_step": 88738, "epoch": 2112} {"train_loss": -6.172605514526367, "global_step": 88739, "epoch": 2112} {"train_loss": -6.1918230056762695, "global_step": 88740, "epoch": 2112} {"train_loss": -6.323607444763184, "global_step": 88741, "epoch": 2112} {"train_loss": -6.173188209533691, "global_step": 88742, "epoch": 2112} {"train_loss": -6.2053375244140625, "global_step": 88743, "epoch": 2112} {"train_loss": -6.185787677764893, "global_step": 88744, "epoch": 2112} {"train_loss": -6.189322108314151, "global_step": 88745, "epoch": 2112, "val_loss": 75053.8515625} {"train_loss": -6.204212188720703, "global_step": 88746, "epoch": 2113} {"train_loss": -6.191583156585693, "global_step": 88747, "epoch": 2113} {"train_loss": -6.307431221008301, "global_step": 88748, "epoch": 2113} {"train_loss": -6.329842567443848, "global_step": 88749, "epoch": 2113} {"train_loss": -6.217679023742676, "global_step": 88750, "epoch": 2113} {"train_loss": -6.191714286804199, "global_step": 88751, "epoch": 2113} {"train_loss": -6.320975303649902, "global_step": 88752, "epoch": 2113} {"train_loss": -6.2259521484375, "global_step": 88753, "epoch": 2113} {"train_loss": -6.1869916915893555, "global_step": 88754, "epoch": 2113} {"train_loss": -6.258519649505615, "global_step": 88755, "epoch": 2113} {"train_loss": -6.149105548858643, "global_step": 88756, "epoch": 2113} {"train_loss": -6.4381184577941895, "global_step": 88757, "epoch": 2113} {"train_loss": -6.247344017028809, "global_step": 88758, "epoch": 2113} {"train_loss": -6.394248008728027, "global_step": 88759, "epoch": 2113} {"train_loss": -6.300065040588379, "global_step": 88760, "epoch": 2113} {"train_loss": -6.177095890045166, "global_step": 88761, "epoch": 2113} {"train_loss": -6.245143890380859, "global_step": 88762, "epoch": 2113} {"train_loss": -6.0904107093811035, "global_step": 88763, "epoch": 2113} {"train_loss": -6.156959533691406, "global_step": 88764, "epoch": 2113} {"train_loss": -6.237177848815918, "global_step": 88765, "epoch": 2113} {"train_loss": -6.233732223510742, "global_step": 88766, "epoch": 2113} {"train_loss": -6.214749336242676, "global_step": 88767, "epoch": 2113} {"train_loss": -6.266678333282471, "global_step": 88768, "epoch": 2113} {"train_loss": -6.156784534454346, "global_step": 88769, "epoch": 2113} {"train_loss": -6.116391181945801, "global_step": 88770, "epoch": 2113} {"train_loss": -6.275265693664551, "global_step": 88771, "epoch": 2113} {"train_loss": -6.249261379241943, "global_step": 88772, "epoch": 2113} {"train_loss": -6.183158874511719, "global_step": 88773, "epoch": 2113} {"train_loss": -6.345885276794434, "global_step": 88774, "epoch": 2113} {"train_loss": -6.2271342277526855, "global_step": 88775, "epoch": 2113} {"train_loss": -6.198444366455078, "global_step": 88776, "epoch": 2113} {"train_loss": -6.152905464172363, "global_step": 88777, "epoch": 2113} {"train_loss": -6.225352764129639, "global_step": 88778, "epoch": 2113} {"train_loss": -6.141392707824707, "global_step": 88779, "epoch": 2113} {"train_loss": -6.137265205383301, "global_step": 88780, "epoch": 2113} {"train_loss": -6.33126163482666, "global_step": 88781, "epoch": 2113} {"train_loss": -6.175126075744629, "global_step": 88782, "epoch": 2113} {"train_loss": -6.213318824768066, "global_step": 88783, "epoch": 2113} {"train_loss": -6.1856770515441895, "global_step": 88784, "epoch": 2113} {"train_loss": -6.286576271057129, "global_step": 88785, "epoch": 2113} {"train_loss": -6.158616542816162, "global_step": 88786, "epoch": 2113} {"train_loss": -6.228447073981876, "global_step": 88787, "epoch": 2113, "val_loss": 75138.9609375} {"train_loss": -6.15582275390625, "global_step": 88788, "epoch": 2114} {"train_loss": -6.242178440093994, "global_step": 88789, "epoch": 2114} {"train_loss": -6.161614418029785, "global_step": 88790, "epoch": 2114} {"train_loss": -6.171086311340332, "global_step": 88791, "epoch": 2114} {"train_loss": -6.169179916381836, "global_step": 88792, "epoch": 2114} {"train_loss": -6.123172283172607, "global_step": 88793, "epoch": 2114} {"train_loss": -6.277438640594482, "global_step": 88794, "epoch": 2114} {"train_loss": -6.147278785705566, "global_step": 88795, "epoch": 2114} {"train_loss": -6.252242088317871, "global_step": 88796, "epoch": 2114} {"train_loss": -6.116809844970703, "global_step": 88797, "epoch": 2114} {"train_loss": -6.332267761230469, "global_step": 88798, "epoch": 2114} {"train_loss": -6.033530235290527, "global_step": 88799, "epoch": 2114} {"train_loss": -6.137247085571289, "global_step": 88800, "epoch": 2114} {"train_loss": -6.216319561004639, "global_step": 88801, "epoch": 2114} {"train_loss": -6.106313705444336, "global_step": 88802, "epoch": 2114} {"train_loss": -6.264944076538086, "global_step": 88803, "epoch": 2114} {"train_loss": -6.270510673522949, "global_step": 88804, "epoch": 2114} {"train_loss": -6.285233974456787, "global_step": 88805, "epoch": 2114} {"train_loss": -6.295695781707764, "global_step": 88806, "epoch": 2114} {"train_loss": -6.164800643920898, "global_step": 88807, "epoch": 2114} {"train_loss": -6.2537841796875, "global_step": 88808, "epoch": 2114} {"train_loss": -6.260532379150391, "global_step": 88809, "epoch": 2114} {"train_loss": -6.240256309509277, "global_step": 88810, "epoch": 2114} {"train_loss": -6.187971115112305, "global_step": 88811, "epoch": 2114} {"train_loss": -6.272765636444092, "global_step": 88812, "epoch": 2114} {"train_loss": -6.28986930847168, "global_step": 88813, "epoch": 2114} {"train_loss": -6.276622295379639, "global_step": 88814, "epoch": 2114} {"train_loss": -6.302611351013184, "global_step": 88815, "epoch": 2114} {"train_loss": -6.209441184997559, "global_step": 88816, "epoch": 2114} {"train_loss": -6.347848415374756, "global_step": 88817, "epoch": 2114} {"train_loss": -6.076064109802246, "global_step": 88818, "epoch": 2114} {"train_loss": -6.2091779708862305, "global_step": 88819, "epoch": 2114} {"train_loss": -6.268003463745117, "global_step": 88820, "epoch": 2114} {"train_loss": -6.33244514465332, "global_step": 88821, "epoch": 2114} {"train_loss": -6.309895038604736, "global_step": 88822, "epoch": 2114} {"train_loss": -6.28429651260376, "global_step": 88823, "epoch": 2114} {"train_loss": -6.275762557983398, "global_step": 88824, "epoch": 2114} {"train_loss": -6.253606796264648, "global_step": 88825, "epoch": 2114} {"train_loss": -6.2076568603515625, "global_step": 88826, "epoch": 2114} {"train_loss": -6.299589157104492, "global_step": 88827, "epoch": 2114} {"train_loss": -6.280083179473877, "global_step": 88828, "epoch": 2114} {"train_loss": -6.228290648687453, "global_step": 88829, "epoch": 2114, "val_loss": 75611.7421875} {"train_loss": -6.185946464538574, "global_step": 88830, "epoch": 2115} {"train_loss": -6.31870174407959, "global_step": 88831, "epoch": 2115} {"train_loss": -6.126778602600098, "global_step": 88832, "epoch": 2115} {"train_loss": -6.101380825042725, "global_step": 88833, "epoch": 2115} {"train_loss": -6.338412284851074, "global_step": 88834, "epoch": 2115} {"train_loss": -6.166734218597412, "global_step": 88835, "epoch": 2115} {"train_loss": -6.267287254333496, "global_step": 88836, "epoch": 2115} {"train_loss": -6.290102958679199, "global_step": 88837, "epoch": 2115} {"train_loss": -6.152205467224121, "global_step": 88838, "epoch": 2115} {"train_loss": -6.2907843589782715, "global_step": 88839, "epoch": 2115} {"train_loss": -6.239205837249756, "global_step": 88840, "epoch": 2115} {"train_loss": -6.338141918182373, "global_step": 88841, "epoch": 2115} {"train_loss": -6.206096172332764, "global_step": 88842, "epoch": 2115} {"train_loss": -6.247142791748047, "global_step": 88843, "epoch": 2115} {"train_loss": -6.27423620223999, "global_step": 88844, "epoch": 2115} {"train_loss": -6.234858512878418, "global_step": 88845, "epoch": 2115} {"train_loss": -6.207210063934326, "global_step": 88846, "epoch": 2115} {"train_loss": -6.243669509887695, "global_step": 88847, "epoch": 2115} {"train_loss": -6.174017906188965, "global_step": 88848, "epoch": 2115} {"train_loss": -6.169409275054932, "global_step": 88849, "epoch": 2115} {"train_loss": -6.223413467407227, "global_step": 88850, "epoch": 2115} {"train_loss": -6.224161148071289, "global_step": 88851, "epoch": 2115} {"train_loss": -6.22580623626709, "global_step": 88852, "epoch": 2115} {"train_loss": -6.2476396560668945, "global_step": 88853, "epoch": 2115} {"train_loss": -6.2527241706848145, "global_step": 88854, "epoch": 2115} {"train_loss": -6.230517387390137, "global_step": 88855, "epoch": 2115} {"train_loss": -6.324258804321289, "global_step": 88856, "epoch": 2115} {"train_loss": -6.248851776123047, "global_step": 88857, "epoch": 2115} {"train_loss": -6.223142623901367, "global_step": 88858, "epoch": 2115} {"train_loss": -6.263476371765137, "global_step": 88859, "epoch": 2115} {"train_loss": -6.33880090713501, "global_step": 88860, "epoch": 2115} {"train_loss": -6.225872993469238, "global_step": 88861, "epoch": 2115} {"train_loss": -6.265336036682129, "global_step": 88862, "epoch": 2115} {"train_loss": -6.329840660095215, "global_step": 88863, "epoch": 2115} {"train_loss": -6.309723854064941, "global_step": 88864, "epoch": 2115} {"train_loss": -6.199449062347412, "global_step": 88865, "epoch": 2115} {"train_loss": -6.299178123474121, "global_step": 88866, "epoch": 2115} {"train_loss": -6.108387470245361, "global_step": 88867, "epoch": 2115} {"train_loss": -6.241997718811035, "global_step": 88868, "epoch": 2115} {"train_loss": -6.25611686706543, "global_step": 88869, "epoch": 2115} {"train_loss": -6.20860481262207, "global_step": 88870, "epoch": 2115} {"train_loss": -6.239934024356661, "global_step": 88871, "epoch": 2115, "val_loss": 75359.9453125} {"train_loss": -6.255033493041992, "global_step": 88872, "epoch": 2116} {"train_loss": -6.203460693359375, "global_step": 88873, "epoch": 2116} {"train_loss": -6.10988187789917, "global_step": 88874, "epoch": 2116} {"train_loss": -6.1240763664245605, "global_step": 88875, "epoch": 2116} {"train_loss": -6.2616353034973145, "global_step": 88876, "epoch": 2116} {"train_loss": -6.173342227935791, "global_step": 88877, "epoch": 2116} {"train_loss": -6.089804649353027, "global_step": 88878, "epoch": 2116} {"train_loss": -6.332961082458496, "global_step": 88879, "epoch": 2116} {"train_loss": -6.201269149780273, "global_step": 88880, "epoch": 2116} {"train_loss": -6.235286235809326, "global_step": 88881, "epoch": 2116} {"train_loss": -6.262209415435791, "global_step": 88882, "epoch": 2116} {"train_loss": -6.280381202697754, "global_step": 88883, "epoch": 2116} {"train_loss": -6.093698501586914, "global_step": 88884, "epoch": 2116} {"train_loss": -6.194467544555664, "global_step": 88885, "epoch": 2116} {"train_loss": -6.127686977386475, "global_step": 88886, "epoch": 2116} {"train_loss": -6.194375991821289, "global_step": 88887, "epoch": 2116} {"train_loss": -6.275280475616455, "global_step": 88888, "epoch": 2116} {"train_loss": -6.131718635559082, "global_step": 88889, "epoch": 2116} {"train_loss": -6.240720748901367, "global_step": 88890, "epoch": 2116} {"train_loss": -6.2378082275390625, "global_step": 88891, "epoch": 2116} {"train_loss": -6.275125980377197, "global_step": 88892, "epoch": 2116} {"train_loss": -6.214084625244141, "global_step": 88893, "epoch": 2116} {"train_loss": -6.239002227783203, "global_step": 88894, "epoch": 2116} {"train_loss": -6.198002338409424, "global_step": 88895, "epoch": 2116} {"train_loss": -6.23869514465332, "global_step": 88896, "epoch": 2116} {"train_loss": -6.18153190612793, "global_step": 88897, "epoch": 2116} {"train_loss": -6.149669170379639, "global_step": 88898, "epoch": 2116} {"train_loss": -6.303269386291504, "global_step": 88899, "epoch": 2116} {"train_loss": -6.167870998382568, "global_step": 88900, "epoch": 2116} {"train_loss": -6.244762420654297, "global_step": 88901, "epoch": 2116} {"train_loss": -6.2319746017456055, "global_step": 88902, "epoch": 2116} {"train_loss": -6.316494941711426, "global_step": 88903, "epoch": 2116} {"train_loss": -6.313854217529297, "global_step": 88904, "epoch": 2116} {"train_loss": -6.1138458251953125, "global_step": 88905, "epoch": 2116} {"train_loss": -6.238139629364014, "global_step": 88906, "epoch": 2116} {"train_loss": -6.372540473937988, "global_step": 88907, "epoch": 2116} {"train_loss": -6.271063327789307, "global_step": 88908, "epoch": 2116} {"train_loss": -6.154746055603027, "global_step": 88909, "epoch": 2116} {"train_loss": -6.173932075500488, "global_step": 88910, "epoch": 2116} {"train_loss": -6.332488059997559, "global_step": 88911, "epoch": 2116} {"train_loss": -6.268125534057617, "global_step": 88912, "epoch": 2116} {"train_loss": -6.219553595497494, "global_step": 88913, "epoch": 2116, "val_loss": 75085.7109375} {"train_loss": -6.243975639343262, "global_step": 88914, "epoch": 2117} {"train_loss": -6.271557331085205, "global_step": 88915, "epoch": 2117} {"train_loss": -6.243960857391357, "global_step": 88916, "epoch": 2117} {"train_loss": -6.310500621795654, "global_step": 88917, "epoch": 2117} {"train_loss": -6.219409942626953, "global_step": 88918, "epoch": 2117} {"train_loss": -6.2678728103637695, "global_step": 88919, "epoch": 2117} {"train_loss": -6.257668495178223, "global_step": 88920, "epoch": 2117} {"train_loss": -6.424692153930664, "global_step": 88921, "epoch": 2117} {"train_loss": -6.1203742027282715, "global_step": 88922, "epoch": 2117} {"train_loss": -6.311797142028809, "global_step": 88923, "epoch": 2117} {"train_loss": -6.34161901473999, "global_step": 88924, "epoch": 2117} {"train_loss": -6.141513824462891, "global_step": 88925, "epoch": 2117} {"train_loss": -6.213136196136475, "global_step": 88926, "epoch": 2117} {"train_loss": -6.244875907897949, "global_step": 88927, "epoch": 2117} {"train_loss": -6.2758989334106445, "global_step": 88928, "epoch": 2117} {"train_loss": -6.16808557510376, "global_step": 88929, "epoch": 2117} {"train_loss": -6.262073516845703, "global_step": 88930, "epoch": 2117} {"train_loss": -6.174129486083984, "global_step": 88931, "epoch": 2117} {"train_loss": -6.252191066741943, "global_step": 88932, "epoch": 2117} {"train_loss": -6.2502946853637695, "global_step": 88933, "epoch": 2117} {"train_loss": -6.263555526733398, "global_step": 88934, "epoch": 2117} {"train_loss": -6.335521697998047, "global_step": 88935, "epoch": 2117} {"train_loss": -6.2848286628723145, "global_step": 88936, "epoch": 2117} {"train_loss": -6.35105562210083, "global_step": 88937, "epoch": 2117} {"train_loss": -6.28916072845459, "global_step": 88938, "epoch": 2117} {"train_loss": -6.211462497711182, "global_step": 88939, "epoch": 2117} {"train_loss": -6.264157295227051, "global_step": 88940, "epoch": 2117} {"train_loss": -6.266417503356934, "global_step": 88941, "epoch": 2117} {"train_loss": -6.1922430992126465, "global_step": 88942, "epoch": 2117} {"train_loss": -6.175621032714844, "global_step": 88943, "epoch": 2117} {"train_loss": -6.165987968444824, "global_step": 88944, "epoch": 2117} {"train_loss": -6.1588897705078125, "global_step": 88945, "epoch": 2117} {"train_loss": -6.227988243103027, "global_step": 88946, "epoch": 2117} {"train_loss": -6.193026542663574, "global_step": 88947, "epoch": 2117} {"train_loss": -6.35075569152832, "global_step": 88948, "epoch": 2117} {"train_loss": -6.274992942810059, "global_step": 88949, "epoch": 2117} {"train_loss": -6.202510356903076, "global_step": 88950, "epoch": 2117} {"train_loss": -6.309404373168945, "global_step": 88951, "epoch": 2117} {"train_loss": -6.254674911499023, "global_step": 88952, "epoch": 2117} {"train_loss": -6.083727836608887, "global_step": 88953, "epoch": 2117} {"train_loss": -6.201213359832764, "global_step": 88954, "epoch": 2117} {"train_loss": -6.244983411970592, "global_step": 88955, "epoch": 2117, "val_loss": 75118.828125} {"train_loss": -6.196913242340088, "global_step": 88956, "epoch": 2118} {"train_loss": -6.32299280166626, "global_step": 88957, "epoch": 2118} {"train_loss": -6.27137565612793, "global_step": 88958, "epoch": 2118} {"train_loss": -6.271988868713379, "global_step": 88959, "epoch": 2118} {"train_loss": -6.183595657348633, "global_step": 88960, "epoch": 2118} {"train_loss": -6.184370994567871, "global_step": 88961, "epoch": 2118} {"train_loss": -6.239738464355469, "global_step": 88962, "epoch": 2118} {"train_loss": -6.07675838470459, "global_step": 88963, "epoch": 2118} {"train_loss": -6.261198043823242, "global_step": 88964, "epoch": 2118} {"train_loss": -6.159806251525879, "global_step": 88965, "epoch": 2118} {"train_loss": -6.175066947937012, "global_step": 88966, "epoch": 2118} {"train_loss": -6.155155181884766, "global_step": 88967, "epoch": 2118} {"train_loss": -5.979622840881348, "global_step": 88968, "epoch": 2118} {"train_loss": -6.276794910430908, "global_step": 88969, "epoch": 2118} {"train_loss": -6.225285530090332, "global_step": 88970, "epoch": 2118} {"train_loss": -6.104428291320801, "global_step": 88971, "epoch": 2118} {"train_loss": -6.217019081115723, "global_step": 88972, "epoch": 2118} {"train_loss": -6.069982051849365, "global_step": 88973, "epoch": 2118} {"train_loss": -6.171450614929199, "global_step": 88974, "epoch": 2118} {"train_loss": -6.294864654541016, "global_step": 88975, "epoch": 2118} {"train_loss": -6.0902252197265625, "global_step": 88976, "epoch": 2118} {"train_loss": -6.2015380859375, "global_step": 88977, "epoch": 2118} {"train_loss": -6.093162536621094, "global_step": 88978, "epoch": 2118} {"train_loss": -6.323196887969971, "global_step": 88979, "epoch": 2118} {"train_loss": -6.181035995483398, "global_step": 88980, "epoch": 2118} {"train_loss": -6.152846813201904, "global_step": 88981, "epoch": 2118} {"train_loss": -6.316115379333496, "global_step": 88982, "epoch": 2118} {"train_loss": -6.20698881149292, "global_step": 88983, "epoch": 2118} {"train_loss": -6.2081403732299805, "global_step": 88984, "epoch": 2118} {"train_loss": -6.3853349685668945, "global_step": 88985, "epoch": 2118} {"train_loss": -6.143869400024414, "global_step": 88986, "epoch": 2118} {"train_loss": -6.314957618713379, "global_step": 88987, "epoch": 2118} {"train_loss": -6.198852062225342, "global_step": 88988, "epoch": 2118} {"train_loss": -6.220221519470215, "global_step": 88989, "epoch": 2118} {"train_loss": -6.164800643920898, "global_step": 88990, "epoch": 2118} {"train_loss": -6.188565254211426, "global_step": 88991, "epoch": 2118} {"train_loss": -6.223943710327148, "global_step": 88992, "epoch": 2118} {"train_loss": -6.247732639312744, "global_step": 88993, "epoch": 2118} {"train_loss": -6.25742244720459, "global_step": 88994, "epoch": 2118} {"train_loss": -6.187188148498535, "global_step": 88995, "epoch": 2118} {"train_loss": -6.199717044830322, "global_step": 88996, "epoch": 2118} {"train_loss": -6.20545760790507, "global_step": 88997, "epoch": 2118, "val_loss": 75332.1015625} {"train_loss": -6.213735580444336, "global_step": 88998, "epoch": 2119} {"train_loss": -6.2844438552856445, "global_step": 88999, "epoch": 2119} {"train_loss": -6.326037406921387, "global_step": 89000, "epoch": 2119} {"train_loss": -6.250267028808594, "global_step": 89001, "epoch": 2119} {"train_loss": -6.232275009155273, "global_step": 89002, "epoch": 2119} {"train_loss": -6.258631706237793, "global_step": 89003, "epoch": 2119} {"train_loss": -6.301133155822754, "global_step": 89004, "epoch": 2119} {"train_loss": -6.278280258178711, "global_step": 89005, "epoch": 2119} {"train_loss": -6.193007469177246, "global_step": 89006, "epoch": 2119} {"train_loss": -6.181407928466797, "global_step": 89007, "epoch": 2119} {"train_loss": -6.238176345825195, "global_step": 89008, "epoch": 2119} {"train_loss": -6.258271217346191, "global_step": 89009, "epoch": 2119} {"train_loss": -6.28621768951416, "global_step": 89010, "epoch": 2119} {"train_loss": -6.366648197174072, "global_step": 89011, "epoch": 2119} {"train_loss": -6.333308219909668, "global_step": 89012, "epoch": 2119} {"train_loss": -6.304867267608643, "global_step": 89013, "epoch": 2119} {"train_loss": -6.2557373046875, "global_step": 89014, "epoch": 2119} {"train_loss": -6.2138872146606445, "global_step": 89015, "epoch": 2119} {"train_loss": -6.2908172607421875, "global_step": 89016, "epoch": 2119} {"train_loss": -6.278070449829102, "global_step": 89017, "epoch": 2119} {"train_loss": -6.270293235778809, "global_step": 89018, "epoch": 2119} {"train_loss": -6.145033836364746, "global_step": 89019, "epoch": 2119} {"train_loss": -6.200064659118652, "global_step": 89020, "epoch": 2119} {"train_loss": -6.263774394989014, "global_step": 89021, "epoch": 2119} {"train_loss": -6.1870646476745605, "global_step": 89022, "epoch": 2119} {"train_loss": -6.307343482971191, "global_step": 89023, "epoch": 2119} {"train_loss": -6.263435363769531, "global_step": 89024, "epoch": 2119} {"train_loss": -6.393145561218262, "global_step": 89025, "epoch": 2119} {"train_loss": -6.148689270019531, "global_step": 89026, "epoch": 2119} {"train_loss": -6.185461044311523, "global_step": 89027, "epoch": 2119} {"train_loss": -6.209201812744141, "global_step": 89028, "epoch": 2119} {"train_loss": -6.2859392166137695, "global_step": 89029, "epoch": 2119} {"train_loss": -6.070450305938721, "global_step": 89030, "epoch": 2119} {"train_loss": -6.258487224578857, "global_step": 89031, "epoch": 2119} {"train_loss": -6.028951644897461, "global_step": 89032, "epoch": 2119} {"train_loss": -6.082818508148193, "global_step": 89033, "epoch": 2119} {"train_loss": -6.027307033538818, "global_step": 89034, "epoch": 2119} {"train_loss": -6.184345245361328, "global_step": 89035, "epoch": 2119} {"train_loss": -6.21873140335083, "global_step": 89036, "epoch": 2119} {"train_loss": -6.068228721618652, "global_step": 89037, "epoch": 2119} {"train_loss": -6.268572807312012, "global_step": 89038, "epoch": 2119} {"train_loss": -6.223085051491147, "global_step": 89039, "epoch": 2119, "val_loss": 75651.625} {"train_loss": -6.194379806518555, "global_step": 89040, "epoch": 2120} {"train_loss": -6.184514999389648, "global_step": 89041, "epoch": 2120} {"train_loss": -6.242319583892822, "global_step": 89042, "epoch": 2120} {"train_loss": -6.244348526000977, "global_step": 89043, "epoch": 2120} {"train_loss": -6.143774509429932, "global_step": 89044, "epoch": 2120} {"train_loss": -6.169122695922852, "global_step": 89045, "epoch": 2120} {"train_loss": -6.222624778747559, "global_step": 89046, "epoch": 2120} {"train_loss": -6.197642803192139, "global_step": 89047, "epoch": 2120} {"train_loss": -6.203851222991943, "global_step": 89048, "epoch": 2120} {"train_loss": -6.221827507019043, "global_step": 89049, "epoch": 2120} {"train_loss": -6.174111366271973, "global_step": 89050, "epoch": 2120} {"train_loss": -6.271475791931152, "global_step": 89051, "epoch": 2120} {"train_loss": -6.2499589920043945, "global_step": 89052, "epoch": 2120} {"train_loss": -6.214406967163086, "global_step": 89053, "epoch": 2120} {"train_loss": -6.2582688331604, "global_step": 89054, "epoch": 2120} {"train_loss": -6.2179694175720215, "global_step": 89055, "epoch": 2120} {"train_loss": -6.210407257080078, "global_step": 89056, "epoch": 2120} {"train_loss": -6.114771842956543, "global_step": 89057, "epoch": 2120} {"train_loss": -6.250558376312256, "global_step": 89058, "epoch": 2120} {"train_loss": -6.182184219360352, "global_step": 89059, "epoch": 2120} {"train_loss": -6.0401835441589355, "global_step": 89060, "epoch": 2120} {"train_loss": -6.198174476623535, "global_step": 89061, "epoch": 2120} {"train_loss": -6.239153861999512, "global_step": 89062, "epoch": 2120} {"train_loss": -6.1093034744262695, "global_step": 89063, "epoch": 2120} {"train_loss": -6.276456356048584, "global_step": 89064, "epoch": 2120} {"train_loss": -6.104073524475098, "global_step": 89065, "epoch": 2120} {"train_loss": -6.162139892578125, "global_step": 89066, "epoch": 2120} {"train_loss": -6.282820701599121, "global_step": 89067, "epoch": 2120} {"train_loss": -6.127820014953613, "global_step": 89068, "epoch": 2120} {"train_loss": -6.239091873168945, "global_step": 89069, "epoch": 2120} {"train_loss": -6.337746620178223, "global_step": 89070, "epoch": 2120} {"train_loss": -6.173719882965088, "global_step": 89071, "epoch": 2120} {"train_loss": -6.229432582855225, "global_step": 89072, "epoch": 2120} {"train_loss": -6.304460525512695, "global_step": 89073, "epoch": 2120} {"train_loss": -6.24484920501709, "global_step": 89074, "epoch": 2120} {"train_loss": -6.250796794891357, "global_step": 89075, "epoch": 2120} {"train_loss": -6.152458667755127, "global_step": 89076, "epoch": 2120} {"train_loss": -6.221837997436523, "global_step": 89077, "epoch": 2120} {"train_loss": -6.314306259155273, "global_step": 89078, "epoch": 2120} {"train_loss": -6.231912612915039, "global_step": 89079, "epoch": 2120} {"train_loss": -6.133451461791992, "global_step": 89080, "epoch": 2120} {"train_loss": -6.209410406294323, "global_step": 89081, "epoch": 2120, "val_loss": 75354.109375} {"train_loss": -6.246840476989746, "global_step": 89082, "epoch": 2121} {"train_loss": -6.1711273193359375, "global_step": 89083, "epoch": 2121} {"train_loss": -6.265454292297363, "global_step": 89084, "epoch": 2121} {"train_loss": -6.1900715827941895, "global_step": 89085, "epoch": 2121} {"train_loss": -6.260954856872559, "global_step": 89086, "epoch": 2121} {"train_loss": -6.187230110168457, "global_step": 89087, "epoch": 2121} {"train_loss": -6.189615249633789, "global_step": 89088, "epoch": 2121} {"train_loss": -6.217108726501465, "global_step": 89089, "epoch": 2121} {"train_loss": -6.160357475280762, "global_step": 89090, "epoch": 2121} {"train_loss": -6.325626373291016, "global_step": 89091, "epoch": 2121} {"train_loss": -6.134667873382568, "global_step": 89092, "epoch": 2121} {"train_loss": -6.123796463012695, "global_step": 89093, "epoch": 2121} {"train_loss": -6.224679470062256, "global_step": 89094, "epoch": 2121} {"train_loss": -6.218069076538086, "global_step": 89095, "epoch": 2121} {"train_loss": -6.141240119934082, "global_step": 89096, "epoch": 2121} {"train_loss": -6.2418131828308105, "global_step": 89097, "epoch": 2121} {"train_loss": -6.183709144592285, "global_step": 89098, "epoch": 2121} {"train_loss": -6.311287879943848, "global_step": 89099, "epoch": 2121} {"train_loss": -6.162644386291504, "global_step": 89100, "epoch": 2121} {"train_loss": -6.226712226867676, "global_step": 89101, "epoch": 2121} {"train_loss": -6.217013359069824, "global_step": 89102, "epoch": 2121} {"train_loss": -6.10107946395874, "global_step": 89103, "epoch": 2121} {"train_loss": -6.155487060546875, "global_step": 89104, "epoch": 2121} {"train_loss": -6.304596424102783, "global_step": 89105, "epoch": 2121} {"train_loss": -6.074402809143066, "global_step": 89106, "epoch": 2121} {"train_loss": -6.207046985626221, "global_step": 89107, "epoch": 2121} {"train_loss": -6.097489356994629, "global_step": 89108, "epoch": 2121} {"train_loss": -6.190672874450684, "global_step": 89109, "epoch": 2121} {"train_loss": -6.313347816467285, "global_step": 89110, "epoch": 2121} {"train_loss": -6.2663187980651855, "global_step": 89111, "epoch": 2121} {"train_loss": -6.229386329650879, "global_step": 89112, "epoch": 2121} {"train_loss": -6.216212272644043, "global_step": 89113, "epoch": 2121} {"train_loss": -6.076115608215332, "global_step": 89114, "epoch": 2121} {"train_loss": -6.2423176765441895, "global_step": 89115, "epoch": 2121} {"train_loss": -6.25588846206665, "global_step": 89116, "epoch": 2121} {"train_loss": -6.216386795043945, "global_step": 89117, "epoch": 2121} {"train_loss": -6.232785224914551, "global_step": 89118, "epoch": 2121} {"train_loss": -6.397087574005127, "global_step": 89119, "epoch": 2121} {"train_loss": -6.181303024291992, "global_step": 89120, "epoch": 2121} {"train_loss": -6.305887222290039, "global_step": 89121, "epoch": 2121} {"train_loss": -6.209532737731934, "global_step": 89122, "epoch": 2121} {"train_loss": -6.2119298208327525, "global_step": 89123, "epoch": 2121, "val_loss": 75174.359375} {"train_loss": -6.232813835144043, "global_step": 89124, "epoch": 2122} {"train_loss": -6.26183557510376, "global_step": 89125, "epoch": 2122} {"train_loss": -6.072787761688232, "global_step": 89126, "epoch": 2122} {"train_loss": -6.215048789978027, "global_step": 89127, "epoch": 2122} {"train_loss": -6.2833452224731445, "global_step": 89128, "epoch": 2122} {"train_loss": -6.272351264953613, "global_step": 89129, "epoch": 2122} {"train_loss": -6.291533470153809, "global_step": 89130, "epoch": 2122} {"train_loss": -6.228896141052246, "global_step": 89131, "epoch": 2122} {"train_loss": -6.304648399353027, "global_step": 89132, "epoch": 2122} {"train_loss": -6.332663059234619, "global_step": 89133, "epoch": 2122} {"train_loss": -6.263874530792236, "global_step": 89134, "epoch": 2122} {"train_loss": -6.199941635131836, "global_step": 89135, "epoch": 2122} {"train_loss": -6.247791290283203, "global_step": 89136, "epoch": 2122} {"train_loss": -6.2432475090026855, "global_step": 89137, "epoch": 2122} {"train_loss": -6.2851715087890625, "global_step": 89138, "epoch": 2122} {"train_loss": -6.188179969787598, "global_step": 89139, "epoch": 2122} {"train_loss": -6.242961883544922, "global_step": 89140, "epoch": 2122} {"train_loss": -6.188626289367676, "global_step": 89141, "epoch": 2122} {"train_loss": -6.185019016265869, "global_step": 89142, "epoch": 2122} {"train_loss": -6.30747127532959, "global_step": 89143, "epoch": 2122} {"train_loss": -6.157918930053711, "global_step": 89144, "epoch": 2122} {"train_loss": -6.343701362609863, "global_step": 89145, "epoch": 2122} {"train_loss": -6.304680824279785, "global_step": 89146, "epoch": 2122} {"train_loss": -6.165902137756348, "global_step": 89147, "epoch": 2122} {"train_loss": -6.256412506103516, "global_step": 89148, "epoch": 2122} {"train_loss": -6.193877696990967, "global_step": 89149, "epoch": 2122} {"train_loss": -6.309487342834473, "global_step": 89150, "epoch": 2122} {"train_loss": -6.242734432220459, "global_step": 89151, "epoch": 2122} {"train_loss": -6.217076301574707, "global_step": 89152, "epoch": 2122} {"train_loss": -6.26133918762207, "global_step": 89153, "epoch": 2122} {"train_loss": -6.203145980834961, "global_step": 89154, "epoch": 2122} {"train_loss": -6.186432838439941, "global_step": 89155, "epoch": 2122} {"train_loss": -6.1670451164245605, "global_step": 89156, "epoch": 2122} {"train_loss": -6.153206825256348, "global_step": 89157, "epoch": 2122} {"train_loss": -6.070582389831543, "global_step": 89158, "epoch": 2122} {"train_loss": -6.285099983215332, "global_step": 89159, "epoch": 2122} {"train_loss": -6.260719299316406, "global_step": 89160, "epoch": 2122} {"train_loss": -6.225815773010254, "global_step": 89161, "epoch": 2122} {"train_loss": -6.301796913146973, "global_step": 89162, "epoch": 2122} {"train_loss": -6.272443771362305, "global_step": 89163, "epoch": 2122} {"train_loss": -6.178520202636719, "global_step": 89164, "epoch": 2122} {"train_loss": -6.234470810209002, "global_step": 89165, "epoch": 2122, "val_loss": 75318.671875} {"train_loss": -6.282133102416992, "global_step": 89166, "epoch": 2123} {"train_loss": -6.065509796142578, "global_step": 89167, "epoch": 2123} {"train_loss": -6.175935745239258, "global_step": 89168, "epoch": 2123} {"train_loss": -6.110707759857178, "global_step": 89169, "epoch": 2123} {"train_loss": -6.212441921234131, "global_step": 89170, "epoch": 2123} {"train_loss": -6.313161849975586, "global_step": 89171, "epoch": 2123} {"train_loss": -6.139621734619141, "global_step": 89172, "epoch": 2123} {"train_loss": -6.195072174072266, "global_step": 89173, "epoch": 2123} {"train_loss": -6.269083023071289, "global_step": 89174, "epoch": 2123} {"train_loss": -6.253353118896484, "global_step": 89175, "epoch": 2123} {"train_loss": -6.245662689208984, "global_step": 89176, "epoch": 2123} {"train_loss": -6.283675670623779, "global_step": 89177, "epoch": 2123} {"train_loss": -6.27193546295166, "global_step": 89178, "epoch": 2123} {"train_loss": -6.13460636138916, "global_step": 89179, "epoch": 2123} {"train_loss": -6.2367939949035645, "global_step": 89180, "epoch": 2123} {"train_loss": -6.34157657623291, "global_step": 89181, "epoch": 2123} {"train_loss": -6.276727676391602, "global_step": 89182, "epoch": 2123} {"train_loss": -6.179383277893066, "global_step": 89183, "epoch": 2123} {"train_loss": -6.141789436340332, "global_step": 89184, "epoch": 2123} {"train_loss": -6.268446922302246, "global_step": 89185, "epoch": 2123} {"train_loss": -6.286041259765625, "global_step": 89186, "epoch": 2123} {"train_loss": -6.286937713623047, "global_step": 89187, "epoch": 2123} {"train_loss": -6.319350242614746, "global_step": 89188, "epoch": 2123} {"train_loss": -6.337479591369629, "global_step": 89189, "epoch": 2123} {"train_loss": -6.380701065063477, "global_step": 89190, "epoch": 2123} {"train_loss": -6.236444473266602, "global_step": 89191, "epoch": 2123} {"train_loss": -6.211948394775391, "global_step": 89192, "epoch": 2123} {"train_loss": -6.315862655639648, "global_step": 89193, "epoch": 2123} {"train_loss": -6.249457836151123, "global_step": 89194, "epoch": 2123} {"train_loss": -6.280149936676025, "global_step": 89195, "epoch": 2123} {"train_loss": -6.247012138366699, "global_step": 89196, "epoch": 2123} {"train_loss": -6.270432472229004, "global_step": 89197, "epoch": 2123} {"train_loss": -6.221691608428955, "global_step": 89198, "epoch": 2123} {"train_loss": -6.3090057373046875, "global_step": 89199, "epoch": 2123} {"train_loss": -6.23852014541626, "global_step": 89200, "epoch": 2123} {"train_loss": -6.322897434234619, "global_step": 89201, "epoch": 2123} {"train_loss": -6.177005290985107, "global_step": 89202, "epoch": 2123} {"train_loss": -6.229527473449707, "global_step": 89203, "epoch": 2123} {"train_loss": -6.263637542724609, "global_step": 89204, "epoch": 2123} {"train_loss": -6.219520568847656, "global_step": 89205, "epoch": 2123} {"train_loss": -6.247565269470215, "global_step": 89206, "epoch": 2123} {"train_loss": -6.2442726748330255, "global_step": 89207, "epoch": 2123, "val_loss": 75173.375} {"train_loss": -6.2864203453063965, "global_step": 89208, "epoch": 2124} {"train_loss": -6.237349033355713, "global_step": 89209, "epoch": 2124} {"train_loss": -6.169340133666992, "global_step": 89210, "epoch": 2124} {"train_loss": -6.248867034912109, "global_step": 89211, "epoch": 2124} {"train_loss": -6.227836608886719, "global_step": 89212, "epoch": 2124} {"train_loss": -6.2676100730896, "global_step": 89213, "epoch": 2124} {"train_loss": -6.361835479736328, "global_step": 89214, "epoch": 2124} {"train_loss": -6.329356670379639, "global_step": 89215, "epoch": 2124} {"train_loss": -6.2112226486206055, "global_step": 89216, "epoch": 2124} {"train_loss": -6.126071453094482, "global_step": 89217, "epoch": 2124} {"train_loss": -6.169186115264893, "global_step": 89218, "epoch": 2124} {"train_loss": -6.151253700256348, "global_step": 89219, "epoch": 2124} {"train_loss": -6.229876518249512, "global_step": 89220, "epoch": 2124} {"train_loss": -6.210714817047119, "global_step": 89221, "epoch": 2124} {"train_loss": -6.230775833129883, "global_step": 89222, "epoch": 2124} {"train_loss": -6.077482223510742, "global_step": 89223, "epoch": 2124} {"train_loss": -6.126569747924805, "global_step": 89224, "epoch": 2124} {"train_loss": -6.262253284454346, "global_step": 89225, "epoch": 2124} {"train_loss": -6.290346145629883, "global_step": 89226, "epoch": 2124} {"train_loss": -6.311025619506836, "global_step": 89227, "epoch": 2124} {"train_loss": -6.241154670715332, "global_step": 89228, "epoch": 2124} {"train_loss": -6.137896537780762, "global_step": 89229, "epoch": 2124} {"train_loss": -6.237875938415527, "global_step": 89230, "epoch": 2124} {"train_loss": -6.1505351066589355, "global_step": 89231, "epoch": 2124} {"train_loss": -6.252536296844482, "global_step": 89232, "epoch": 2124} {"train_loss": -6.291103839874268, "global_step": 89233, "epoch": 2124} {"train_loss": -6.213601112365723, "global_step": 89234, "epoch": 2124} {"train_loss": -6.342034339904785, "global_step": 89235, "epoch": 2124} {"train_loss": -6.205469131469727, "global_step": 89236, "epoch": 2124} {"train_loss": -6.220915794372559, "global_step": 89237, "epoch": 2124} {"train_loss": -6.220166206359863, "global_step": 89238, "epoch": 2124} {"train_loss": -6.252827167510986, "global_step": 89239, "epoch": 2124} {"train_loss": -6.184848785400391, "global_step": 89240, "epoch": 2124} {"train_loss": -6.3208909034729, "global_step": 89241, "epoch": 2124} {"train_loss": -6.175093650817871, "global_step": 89242, "epoch": 2124} {"train_loss": -6.191717147827148, "global_step": 89243, "epoch": 2124} {"train_loss": -6.307465553283691, "global_step": 89244, "epoch": 2124} {"train_loss": -6.108268737792969, "global_step": 89245, "epoch": 2124} {"train_loss": -6.27595329284668, "global_step": 89246, "epoch": 2124} {"train_loss": -6.252444267272949, "global_step": 89247, "epoch": 2124} {"train_loss": -6.217337131500244, "global_step": 89248, "epoch": 2124} {"train_loss": -6.229536669594901, "global_step": 89249, "epoch": 2124, "val_loss": 75317.46875} {"train_loss": -6.161913871765137, "global_step": 89250, "epoch": 2125} {"train_loss": -6.251767158508301, "global_step": 89251, "epoch": 2125} {"train_loss": -6.184216499328613, "global_step": 89252, "epoch": 2125} {"train_loss": -6.21210241317749, "global_step": 89253, "epoch": 2125} {"train_loss": -6.2744035720825195, "global_step": 89254, "epoch": 2125} {"train_loss": -6.203178882598877, "global_step": 89255, "epoch": 2125} {"train_loss": -6.255892276763916, "global_step": 89256, "epoch": 2125} {"train_loss": -6.199797630310059, "global_step": 89257, "epoch": 2125} {"train_loss": -6.320303916931152, "global_step": 89258, "epoch": 2125} {"train_loss": -6.191446304321289, "global_step": 89259, "epoch": 2125} {"train_loss": -6.27518367767334, "global_step": 89260, "epoch": 2125} {"train_loss": -6.177656650543213, "global_step": 89261, "epoch": 2125} {"train_loss": -6.245654106140137, "global_step": 89262, "epoch": 2125} {"train_loss": -6.26591682434082, "global_step": 89263, "epoch": 2125} {"train_loss": -6.269491672515869, "global_step": 89264, "epoch": 2125} {"train_loss": -6.234700679779053, "global_step": 89265, "epoch": 2125} {"train_loss": -6.235182762145996, "global_step": 89266, "epoch": 2125} {"train_loss": -6.370636940002441, "global_step": 89267, "epoch": 2125} {"train_loss": -6.291437149047852, "global_step": 89268, "epoch": 2125} {"train_loss": -6.273041725158691, "global_step": 89269, "epoch": 2125} {"train_loss": -6.1696624755859375, "global_step": 89270, "epoch": 2125} {"train_loss": -6.243319511413574, "global_step": 89271, "epoch": 2125} {"train_loss": -6.329432487487793, "global_step": 89272, "epoch": 2125} {"train_loss": -6.2585859298706055, "global_step": 89273, "epoch": 2125} {"train_loss": -6.264162063598633, "global_step": 89274, "epoch": 2125} {"train_loss": -6.1851348876953125, "global_step": 89275, "epoch": 2125} {"train_loss": -6.2563652992248535, "global_step": 89276, "epoch": 2125} {"train_loss": -6.314698219299316, "global_step": 89277, "epoch": 2125} {"train_loss": -6.312509536743164, "global_step": 89278, "epoch": 2125} {"train_loss": -6.184578895568848, "global_step": 89279, "epoch": 2125} {"train_loss": -6.286961555480957, "global_step": 89280, "epoch": 2125} {"train_loss": -6.109755516052246, "global_step": 89281, "epoch": 2125} {"train_loss": -6.246070861816406, "global_step": 89282, "epoch": 2125} {"train_loss": -6.348966598510742, "global_step": 89283, "epoch": 2125} {"train_loss": -6.311863899230957, "global_step": 89284, "epoch": 2125} {"train_loss": -6.232614994049072, "global_step": 89285, "epoch": 2125} {"train_loss": -6.275740623474121, "global_step": 89286, "epoch": 2125} {"train_loss": -6.259390354156494, "global_step": 89287, "epoch": 2125} {"train_loss": -6.206640243530273, "global_step": 89288, "epoch": 2125} {"train_loss": -6.226803302764893, "global_step": 89289, "epoch": 2125} {"train_loss": -6.2419047355651855, "global_step": 89290, "epoch": 2125} {"train_loss": -6.244484470004127, "global_step": 89291, "epoch": 2125, "val_loss": 75475.6328125} {"train_loss": -6.193902969360352, "global_step": 89292, "epoch": 2126} {"train_loss": -6.222303867340088, "global_step": 89293, "epoch": 2126} {"train_loss": -6.260119438171387, "global_step": 89294, "epoch": 2126} {"train_loss": -6.209344863891602, "global_step": 89295, "epoch": 2126} {"train_loss": -6.159588813781738, "global_step": 89296, "epoch": 2126} {"train_loss": -6.074282646179199, "global_step": 89297, "epoch": 2126} {"train_loss": -6.186053276062012, "global_step": 89298, "epoch": 2126} {"train_loss": -6.094130992889404, "global_step": 89299, "epoch": 2126} {"train_loss": -6.2683424949646, "global_step": 89300, "epoch": 2126} {"train_loss": -6.224262714385986, "global_step": 89301, "epoch": 2126} {"train_loss": -6.223163604736328, "global_step": 89302, "epoch": 2126} {"train_loss": -6.19488525390625, "global_step": 89303, "epoch": 2126} {"train_loss": -6.168875217437744, "global_step": 89304, "epoch": 2126} {"train_loss": -6.093320846557617, "global_step": 89305, "epoch": 2126} {"train_loss": -6.197565078735352, "global_step": 89306, "epoch": 2126} {"train_loss": -6.1453022956848145, "global_step": 89307, "epoch": 2126} {"train_loss": -6.256204605102539, "global_step": 89308, "epoch": 2126} {"train_loss": -6.282540798187256, "global_step": 89309, "epoch": 2126} {"train_loss": -6.208103179931641, "global_step": 89310, "epoch": 2126} {"train_loss": -6.084292888641357, "global_step": 89311, "epoch": 2126} {"train_loss": -6.215590000152588, "global_step": 89312, "epoch": 2126} {"train_loss": -6.220177173614502, "global_step": 89313, "epoch": 2126} {"train_loss": -6.170208930969238, "global_step": 89314, "epoch": 2126} {"train_loss": -6.154427528381348, "global_step": 89315, "epoch": 2126} {"train_loss": -6.275415420532227, "global_step": 89316, "epoch": 2126} {"train_loss": -6.279783248901367, "global_step": 89317, "epoch": 2126} {"train_loss": -6.143458366394043, "global_step": 89318, "epoch": 2126} {"train_loss": -6.257942199707031, "global_step": 89319, "epoch": 2126} {"train_loss": -6.202748775482178, "global_step": 89320, "epoch": 2126} {"train_loss": -6.271169662475586, "global_step": 89321, "epoch": 2126} {"train_loss": -6.316720008850098, "global_step": 89322, "epoch": 2126} {"train_loss": -6.145583629608154, "global_step": 89323, "epoch": 2126} {"train_loss": -6.316305637359619, "global_step": 89324, "epoch": 2126} {"train_loss": -6.152477264404297, "global_step": 89325, "epoch": 2126} {"train_loss": -6.066178321838379, "global_step": 89326, "epoch": 2126} {"train_loss": -6.13897705078125, "global_step": 89327, "epoch": 2126} {"train_loss": -6.210529327392578, "global_step": 89328, "epoch": 2126} {"train_loss": -6.1417741775512695, "global_step": 89329, "epoch": 2126} {"train_loss": -6.140696048736572, "global_step": 89330, "epoch": 2126} {"train_loss": -6.124248504638672, "global_step": 89331, "epoch": 2126} {"train_loss": -6.113266944885254, "global_step": 89332, "epoch": 2126} {"train_loss": -6.1894800662994385, "global_step": 89333, "epoch": 2126, "val_loss": 75336.5703125} {"train_loss": -6.174516677856445, "global_step": 89334, "epoch": 2127} {"train_loss": -6.251046180725098, "global_step": 89335, "epoch": 2127} {"train_loss": -6.263064384460449, "global_step": 89336, "epoch": 2127} {"train_loss": -6.0972580909729, "global_step": 89337, "epoch": 2127} {"train_loss": -6.268247127532959, "global_step": 89338, "epoch": 2127} {"train_loss": -6.236541748046875, "global_step": 89339, "epoch": 2127} {"train_loss": -6.305758476257324, "global_step": 89340, "epoch": 2127} {"train_loss": -6.08924674987793, "global_step": 89341, "epoch": 2127} {"train_loss": -6.166808128356934, "global_step": 89342, "epoch": 2127} {"train_loss": -6.241780757904053, "global_step": 89343, "epoch": 2127} {"train_loss": -6.143838405609131, "global_step": 89344, "epoch": 2127} {"train_loss": -6.263978958129883, "global_step": 89345, "epoch": 2127} {"train_loss": -6.173589706420898, "global_step": 89346, "epoch": 2127} {"train_loss": -5.956513404846191, "global_step": 89347, "epoch": 2127} {"train_loss": -6.045784950256348, "global_step": 89348, "epoch": 2127} {"train_loss": -6.027328014373779, "global_step": 89349, "epoch": 2127} {"train_loss": -6.214119911193848, "global_step": 89350, "epoch": 2127} {"train_loss": -5.906362533569336, "global_step": 89351, "epoch": 2127} {"train_loss": -6.2859086990356445, "global_step": 89352, "epoch": 2127} {"train_loss": -6.150001049041748, "global_step": 89353, "epoch": 2127} {"train_loss": -6.124349117279053, "global_step": 89354, "epoch": 2127} {"train_loss": -6.21723747253418, "global_step": 89355, "epoch": 2127} {"train_loss": -6.234553337097168, "global_step": 89356, "epoch": 2127} {"train_loss": -6.076984882354736, "global_step": 89357, "epoch": 2127} {"train_loss": -6.211264610290527, "global_step": 89358, "epoch": 2127} {"train_loss": -6.270328521728516, "global_step": 89359, "epoch": 2127} {"train_loss": -6.154172420501709, "global_step": 89360, "epoch": 2127} {"train_loss": -6.292882442474365, "global_step": 89361, "epoch": 2127} {"train_loss": -6.227715969085693, "global_step": 89362, "epoch": 2127} {"train_loss": -6.1989006996154785, "global_step": 89363, "epoch": 2127} {"train_loss": -6.199092388153076, "global_step": 89364, "epoch": 2127} {"train_loss": -6.2212677001953125, "global_step": 89365, "epoch": 2127} {"train_loss": -6.277285575866699, "global_step": 89366, "epoch": 2127} {"train_loss": -6.227313995361328, "global_step": 89367, "epoch": 2127} {"train_loss": -6.1961259841918945, "global_step": 89368, "epoch": 2127} {"train_loss": -6.084786891937256, "global_step": 89369, "epoch": 2127} {"train_loss": -6.192668914794922, "global_step": 89370, "epoch": 2127} {"train_loss": -6.178287982940674, "global_step": 89371, "epoch": 2127} {"train_loss": -6.279473781585693, "global_step": 89372, "epoch": 2127} {"train_loss": -6.296259880065918, "global_step": 89373, "epoch": 2127} {"train_loss": -6.21608829498291, "global_step": 89374, "epoch": 2127} {"train_loss": -6.1922079267955965, "global_step": 89375, "epoch": 2127, "val_loss": 75293.3984375} {"train_loss": -6.335563659667969, "global_step": 89376, "epoch": 2128} {"train_loss": -6.309365749359131, "global_step": 89377, "epoch": 2128} {"train_loss": -6.31748104095459, "global_step": 89378, "epoch": 2128} {"train_loss": -6.206554412841797, "global_step": 89379, "epoch": 2128} {"train_loss": -6.2501115798950195, "global_step": 89380, "epoch": 2128} {"train_loss": -6.2445292472839355, "global_step": 89381, "epoch": 2128} {"train_loss": -6.242684841156006, "global_step": 89382, "epoch": 2128} {"train_loss": -6.1669921875, "global_step": 89383, "epoch": 2128} {"train_loss": -6.259871959686279, "global_step": 89384, "epoch": 2128} {"train_loss": -6.177446365356445, "global_step": 89385, "epoch": 2128} {"train_loss": -6.263410568237305, "global_step": 89386, "epoch": 2128} {"train_loss": -6.2487568855285645, "global_step": 89387, "epoch": 2128} {"train_loss": -6.30842924118042, "global_step": 89388, "epoch": 2128} {"train_loss": -6.203415393829346, "global_step": 89389, "epoch": 2128} {"train_loss": -6.339905261993408, "global_step": 89390, "epoch": 2128} {"train_loss": -6.0973052978515625, "global_step": 89391, "epoch": 2128} {"train_loss": -6.2594780921936035, "global_step": 89392, "epoch": 2128} {"train_loss": -6.1471052169799805, "global_step": 89393, "epoch": 2128} {"train_loss": -6.266368865966797, "global_step": 89394, "epoch": 2128} {"train_loss": -6.199989318847656, "global_step": 89395, "epoch": 2128} {"train_loss": -6.286384582519531, "global_step": 89396, "epoch": 2128} {"train_loss": -6.272172451019287, "global_step": 89397, "epoch": 2128} {"train_loss": -6.166806221008301, "global_step": 89398, "epoch": 2128} {"train_loss": -6.1678147315979, "global_step": 89399, "epoch": 2128} {"train_loss": -6.324790954589844, "global_step": 89400, "epoch": 2128} {"train_loss": -6.254863739013672, "global_step": 89401, "epoch": 2128} {"train_loss": -6.163421630859375, "global_step": 89402, "epoch": 2128} {"train_loss": -6.199948310852051, "global_step": 89403, "epoch": 2128} {"train_loss": -6.231868743896484, "global_step": 89404, "epoch": 2128} {"train_loss": -6.140166759490967, "global_step": 89405, "epoch": 2128} {"train_loss": -6.281709671020508, "global_step": 89406, "epoch": 2128} {"train_loss": -6.239103317260742, "global_step": 89407, "epoch": 2128} {"train_loss": -6.275093078613281, "global_step": 89408, "epoch": 2128} {"train_loss": -6.274830341339111, "global_step": 89409, "epoch": 2128} {"train_loss": -6.243593215942383, "global_step": 89410, "epoch": 2128} {"train_loss": -6.120139122009277, "global_step": 89411, "epoch": 2128} {"train_loss": -6.2091875076293945, "global_step": 89412, "epoch": 2128} {"train_loss": -6.2484893798828125, "global_step": 89413, "epoch": 2128} {"train_loss": -6.223967552185059, "global_step": 89414, "epoch": 2128} {"train_loss": -6.229128360748291, "global_step": 89415, "epoch": 2128} {"train_loss": -6.242807388305664, "global_step": 89416, "epoch": 2128} {"train_loss": -6.232602085386004, "global_step": 89417, "epoch": 2128, "val_loss": 75468.625} {"train_loss": -6.243476867675781, "global_step": 89418, "epoch": 2129} {"train_loss": -6.262627601623535, "global_step": 89419, "epoch": 2129} {"train_loss": -6.289421081542969, "global_step": 89420, "epoch": 2129} {"train_loss": -6.141531944274902, "global_step": 89421, "epoch": 2129} {"train_loss": -6.307589530944824, "global_step": 89422, "epoch": 2129} {"train_loss": -6.254973411560059, "global_step": 89423, "epoch": 2129} {"train_loss": -6.17674446105957, "global_step": 89424, "epoch": 2129} {"train_loss": -6.203646659851074, "global_step": 89425, "epoch": 2129} {"train_loss": -6.219470977783203, "global_step": 89426, "epoch": 2129} {"train_loss": -6.243992805480957, "global_step": 89427, "epoch": 2129} {"train_loss": -6.2535786628723145, "global_step": 89428, "epoch": 2129} {"train_loss": -6.179880619049072, "global_step": 89429, "epoch": 2129} {"train_loss": -6.3793487548828125, "global_step": 89430, "epoch": 2129} {"train_loss": -6.297556400299072, "global_step": 89431, "epoch": 2129} {"train_loss": -6.137063026428223, "global_step": 89432, "epoch": 2129} {"train_loss": -6.231316566467285, "global_step": 89433, "epoch": 2129} {"train_loss": -6.217470169067383, "global_step": 89434, "epoch": 2129} {"train_loss": -6.014869689941406, "global_step": 89435, "epoch": 2129} {"train_loss": -6.212704658508301, "global_step": 89436, "epoch": 2129} {"train_loss": -6.147459506988525, "global_step": 89437, "epoch": 2129} {"train_loss": -6.142346382141113, "global_step": 89438, "epoch": 2129} {"train_loss": -6.182503700256348, "global_step": 89439, "epoch": 2129} {"train_loss": -6.053521156311035, "global_step": 89440, "epoch": 2129} {"train_loss": -6.21361780166626, "global_step": 89441, "epoch": 2129} {"train_loss": -6.238356113433838, "global_step": 89442, "epoch": 2129} {"train_loss": -6.1590576171875, "global_step": 89443, "epoch": 2129} {"train_loss": -6.240705966949463, "global_step": 89444, "epoch": 2129} {"train_loss": -6.246410369873047, "global_step": 89445, "epoch": 2129} {"train_loss": -6.192266464233398, "global_step": 89446, "epoch": 2129} {"train_loss": -6.274800777435303, "global_step": 89447, "epoch": 2129} {"train_loss": -6.281337261199951, "global_step": 89448, "epoch": 2129} {"train_loss": -6.067593097686768, "global_step": 89449, "epoch": 2129} {"train_loss": -6.1516432762146, "global_step": 89450, "epoch": 2129} {"train_loss": -6.258692741394043, "global_step": 89451, "epoch": 2129} {"train_loss": -6.222835540771484, "global_step": 89452, "epoch": 2129} {"train_loss": -6.168667793273926, "global_step": 89453, "epoch": 2129} {"train_loss": -6.3097825050354, "global_step": 89454, "epoch": 2129} {"train_loss": -6.236034393310547, "global_step": 89455, "epoch": 2129} {"train_loss": -6.226729393005371, "global_step": 89456, "epoch": 2129} {"train_loss": -6.212924957275391, "global_step": 89457, "epoch": 2129} {"train_loss": -6.283392906188965, "global_step": 89458, "epoch": 2129} {"train_loss": -6.213284685498192, "global_step": 89459, "epoch": 2129, "val_loss": 75176.3515625} {"train_loss": -6.250320911407471, "global_step": 89460, "epoch": 2130} {"train_loss": -6.252886772155762, "global_step": 89461, "epoch": 2130} {"train_loss": -6.161375999450684, "global_step": 89462, "epoch": 2130} {"train_loss": -6.318833827972412, "global_step": 89463, "epoch": 2130} {"train_loss": -6.422741413116455, "global_step": 89464, "epoch": 2130} {"train_loss": -6.124082088470459, "global_step": 89465, "epoch": 2130} {"train_loss": -6.245431423187256, "global_step": 89466, "epoch": 2130} {"train_loss": -6.290393829345703, "global_step": 89467, "epoch": 2130} {"train_loss": -6.250977039337158, "global_step": 89468, "epoch": 2130} {"train_loss": -6.307718276977539, "global_step": 89469, "epoch": 2130} {"train_loss": -6.273116111755371, "global_step": 89470, "epoch": 2130} {"train_loss": -6.381616115570068, "global_step": 89471, "epoch": 2130} {"train_loss": -6.117778778076172, "global_step": 89472, "epoch": 2130} {"train_loss": -6.2429304122924805, "global_step": 89473, "epoch": 2130} {"train_loss": -6.058932781219482, "global_step": 89474, "epoch": 2130} {"train_loss": -6.287720680236816, "global_step": 89475, "epoch": 2130} {"train_loss": -6.114267826080322, "global_step": 89476, "epoch": 2130} {"train_loss": -6.0866379737854, "global_step": 89477, "epoch": 2130} {"train_loss": -6.281233310699463, "global_step": 89478, "epoch": 2130} {"train_loss": -6.071946620941162, "global_step": 89479, "epoch": 2130} {"train_loss": -6.029549598693848, "global_step": 89480, "epoch": 2130} {"train_loss": -6.28046178817749, "global_step": 89481, "epoch": 2130} {"train_loss": -6.159362316131592, "global_step": 89482, "epoch": 2130} {"train_loss": -6.233836650848389, "global_step": 89483, "epoch": 2130} {"train_loss": -6.15878963470459, "global_step": 89484, "epoch": 2130} {"train_loss": -6.150884628295898, "global_step": 89485, "epoch": 2130} {"train_loss": -6.217073440551758, "global_step": 89486, "epoch": 2130} {"train_loss": -6.1144304275512695, "global_step": 89487, "epoch": 2130} {"train_loss": -6.179283618927002, "global_step": 89488, "epoch": 2130} {"train_loss": -6.161630630493164, "global_step": 89489, "epoch": 2130} {"train_loss": -6.184843063354492, "global_step": 89490, "epoch": 2130} {"train_loss": -6.134418487548828, "global_step": 89491, "epoch": 2130} {"train_loss": -6.141909599304199, "global_step": 89492, "epoch": 2130} {"train_loss": -6.238380432128906, "global_step": 89493, "epoch": 2130} {"train_loss": -6.227894306182861, "global_step": 89494, "epoch": 2130} {"train_loss": -6.206042766571045, "global_step": 89495, "epoch": 2130} {"train_loss": -6.144798278808594, "global_step": 89496, "epoch": 2130} {"train_loss": -6.274852752685547, "global_step": 89497, "epoch": 2130} {"train_loss": -6.131522178649902, "global_step": 89498, "epoch": 2130} {"train_loss": -6.213812828063965, "global_step": 89499, "epoch": 2130} {"train_loss": -6.180312156677246, "global_step": 89500, "epoch": 2130} {"train_loss": -6.202721232459659, "global_step": 89501, "epoch": 2130, "val_loss": 75407.625} {"train_loss": -6.220485210418701, "global_step": 89502, "epoch": 2131} {"train_loss": -6.294513702392578, "global_step": 89503, "epoch": 2131} {"train_loss": -6.221491813659668, "global_step": 89504, "epoch": 2131} {"train_loss": -6.201459884643555, "global_step": 89505, "epoch": 2131} {"train_loss": -6.09722900390625, "global_step": 89506, "epoch": 2131} {"train_loss": -6.222670555114746, "global_step": 89507, "epoch": 2131} {"train_loss": -6.233817100524902, "global_step": 89508, "epoch": 2131} {"train_loss": -6.2183074951171875, "global_step": 89509, "epoch": 2131} {"train_loss": -6.131999969482422, "global_step": 89510, "epoch": 2131} {"train_loss": -6.235411643981934, "global_step": 89511, "epoch": 2131} {"train_loss": -6.187023639678955, "global_step": 89512, "epoch": 2131} {"train_loss": -6.196933746337891, "global_step": 89513, "epoch": 2131} {"train_loss": -6.257530689239502, "global_step": 89514, "epoch": 2131} {"train_loss": -6.202395439147949, "global_step": 89515, "epoch": 2131} {"train_loss": -6.147169589996338, "global_step": 89516, "epoch": 2131} {"train_loss": -6.084353446960449, "global_step": 89517, "epoch": 2131} {"train_loss": -6.3248982429504395, "global_step": 89518, "epoch": 2131} {"train_loss": -6.105682373046875, "global_step": 89519, "epoch": 2131} {"train_loss": -6.1883320808410645, "global_step": 89520, "epoch": 2131} {"train_loss": -6.440329551696777, "global_step": 89521, "epoch": 2131} {"train_loss": -6.030343055725098, "global_step": 89522, "epoch": 2131} {"train_loss": -6.24654483795166, "global_step": 89523, "epoch": 2131} {"train_loss": -6.173305511474609, "global_step": 89524, "epoch": 2131} {"train_loss": -6.230003356933594, "global_step": 89525, "epoch": 2131} {"train_loss": -6.108266353607178, "global_step": 89526, "epoch": 2131} {"train_loss": -6.245029926300049, "global_step": 89527, "epoch": 2131} {"train_loss": -6.2621588706970215, "global_step": 89528, "epoch": 2131} {"train_loss": -6.226433277130127, "global_step": 89529, "epoch": 2131} {"train_loss": -6.327217102050781, "global_step": 89530, "epoch": 2131} {"train_loss": -6.219006538391113, "global_step": 89531, "epoch": 2131} {"train_loss": -6.338953495025635, "global_step": 89532, "epoch": 2131} {"train_loss": -6.297978401184082, "global_step": 89533, "epoch": 2131} {"train_loss": -6.215137481689453, "global_step": 89534, "epoch": 2131} {"train_loss": -6.165355205535889, "global_step": 89535, "epoch": 2131} {"train_loss": -6.263716220855713, "global_step": 89536, "epoch": 2131} {"train_loss": -6.280747413635254, "global_step": 89537, "epoch": 2131} {"train_loss": -6.204301834106445, "global_step": 89538, "epoch": 2131} {"train_loss": -6.308732986450195, "global_step": 89539, "epoch": 2131} {"train_loss": -6.149165153503418, "global_step": 89540, "epoch": 2131} {"train_loss": -6.219942092895508, "global_step": 89541, "epoch": 2131} {"train_loss": -6.286684989929199, "global_step": 89542, "epoch": 2131} {"train_loss": -6.216474090303693, "global_step": 89543, "epoch": 2131, "val_loss": 75720.234375} {"train_loss": -6.166828155517578, "global_step": 89544, "epoch": 2132} {"train_loss": -6.2729926109313965, "global_step": 89545, "epoch": 2132} {"train_loss": -6.076535224914551, "global_step": 89546, "epoch": 2132} {"train_loss": -6.263936996459961, "global_step": 89547, "epoch": 2132} {"train_loss": -6.156371116638184, "global_step": 89548, "epoch": 2132} {"train_loss": -6.0947265625, "global_step": 89549, "epoch": 2132} {"train_loss": -6.22381591796875, "global_step": 89550, "epoch": 2132} {"train_loss": -6.1616950035095215, "global_step": 89551, "epoch": 2132} {"train_loss": -6.14764404296875, "global_step": 89552, "epoch": 2132} {"train_loss": -6.171972274780273, "global_step": 89553, "epoch": 2132} {"train_loss": -6.1056132316589355, "global_step": 89554, "epoch": 2132} {"train_loss": -6.1844024658203125, "global_step": 89555, "epoch": 2132} {"train_loss": -6.094411849975586, "global_step": 89556, "epoch": 2132} {"train_loss": -6.175117492675781, "global_step": 89557, "epoch": 2132} {"train_loss": -6.222527503967285, "global_step": 89558, "epoch": 2132} {"train_loss": -6.0280232429504395, "global_step": 89559, "epoch": 2132} {"train_loss": -6.040881156921387, "global_step": 89560, "epoch": 2132} {"train_loss": -6.081151008605957, "global_step": 89561, "epoch": 2132} {"train_loss": -6.208329677581787, "global_step": 89562, "epoch": 2132} {"train_loss": -6.093246936798096, "global_step": 89563, "epoch": 2132} {"train_loss": -6.158700942993164, "global_step": 89564, "epoch": 2132} {"train_loss": -6.230102062225342, "global_step": 89565, "epoch": 2132} {"train_loss": -6.131984710693359, "global_step": 89566, "epoch": 2132} {"train_loss": -6.235964775085449, "global_step": 89567, "epoch": 2132} {"train_loss": -6.235527038574219, "global_step": 89568, "epoch": 2132} {"train_loss": -6.241783142089844, "global_step": 89569, "epoch": 2132} {"train_loss": -6.142581939697266, "global_step": 89570, "epoch": 2132} {"train_loss": -6.275056838989258, "global_step": 89571, "epoch": 2132} {"train_loss": -6.231105327606201, "global_step": 89572, "epoch": 2132} {"train_loss": -6.285874843597412, "global_step": 89573, "epoch": 2132} {"train_loss": -6.199425220489502, "global_step": 89574, "epoch": 2132} {"train_loss": -6.288134574890137, "global_step": 89575, "epoch": 2132} {"train_loss": -6.260467052459717, "global_step": 89576, "epoch": 2132} {"train_loss": -6.245384216308594, "global_step": 89577, "epoch": 2132} {"train_loss": -6.223111152648926, "global_step": 89578, "epoch": 2132} {"train_loss": -6.189818382263184, "global_step": 89579, "epoch": 2132} {"train_loss": -6.092508316040039, "global_step": 89580, "epoch": 2132} {"train_loss": -6.257749557495117, "global_step": 89581, "epoch": 2132} {"train_loss": -6.2592878341674805, "global_step": 89582, "epoch": 2132} {"train_loss": -6.187991142272949, "global_step": 89583, "epoch": 2132} {"train_loss": -6.160891532897949, "global_step": 89584, "epoch": 2132} {"train_loss": -6.1847444375356035, "global_step": 89585, "epoch": 2132, "val_loss": 75382.3671875} {"train_loss": -6.247766494750977, "global_step": 89586, "epoch": 2133} {"train_loss": -6.200258255004883, "global_step": 89587, "epoch": 2133} {"train_loss": -6.2456159591674805, "global_step": 89588, "epoch": 2133} {"train_loss": -6.2367448806762695, "global_step": 89589, "epoch": 2133} {"train_loss": -6.125794887542725, "global_step": 89590, "epoch": 2133} {"train_loss": -6.079558849334717, "global_step": 89591, "epoch": 2133} {"train_loss": -6.087571144104004, "global_step": 89592, "epoch": 2133} {"train_loss": -6.2141499519348145, "global_step": 89593, "epoch": 2133} {"train_loss": -6.187738418579102, "global_step": 89594, "epoch": 2133} {"train_loss": -6.188932418823242, "global_step": 89595, "epoch": 2133} {"train_loss": -6.110539436340332, "global_step": 89596, "epoch": 2133} {"train_loss": -6.18772554397583, "global_step": 89597, "epoch": 2133} {"train_loss": -6.012990951538086, "global_step": 89598, "epoch": 2133} {"train_loss": -6.0015950202941895, "global_step": 89599, "epoch": 2133} {"train_loss": -6.182242393493652, "global_step": 89600, "epoch": 2133} {"train_loss": -6.172351360321045, "global_step": 89601, "epoch": 2133} {"train_loss": -6.23651123046875, "global_step": 89602, "epoch": 2133} {"train_loss": -6.2883758544921875, "global_step": 89603, "epoch": 2133} {"train_loss": -6.191982269287109, "global_step": 89604, "epoch": 2133} {"train_loss": -6.10554313659668, "global_step": 89605, "epoch": 2133} {"train_loss": -6.256425380706787, "global_step": 89606, "epoch": 2133} {"train_loss": -6.196856498718262, "global_step": 89607, "epoch": 2133} {"train_loss": -6.133448123931885, "global_step": 89608, "epoch": 2133} {"train_loss": -6.129545211791992, "global_step": 89609, "epoch": 2133} {"train_loss": -6.26173210144043, "global_step": 89610, "epoch": 2133} {"train_loss": -6.180157661437988, "global_step": 89611, "epoch": 2133} {"train_loss": -6.307538986206055, "global_step": 89612, "epoch": 2133} {"train_loss": -6.225006580352783, "global_step": 89613, "epoch": 2133} {"train_loss": -6.330552101135254, "global_step": 89614, "epoch": 2133} {"train_loss": -6.247165679931641, "global_step": 89615, "epoch": 2133} {"train_loss": -6.187743186950684, "global_step": 89616, "epoch": 2133} {"train_loss": -6.287373065948486, "global_step": 89617, "epoch": 2133} {"train_loss": -6.337162971496582, "global_step": 89618, "epoch": 2133} {"train_loss": -6.153413772583008, "global_step": 89619, "epoch": 2133} {"train_loss": -6.17301082611084, "global_step": 89620, "epoch": 2133} {"train_loss": -6.2848615646362305, "global_step": 89621, "epoch": 2133} {"train_loss": -6.165165901184082, "global_step": 89622, "epoch": 2133} {"train_loss": -6.341302871704102, "global_step": 89623, "epoch": 2133} {"train_loss": -6.344387531280518, "global_step": 89624, "epoch": 2133} {"train_loss": -6.248829364776611, "global_step": 89625, "epoch": 2133} {"train_loss": -6.317697525024414, "global_step": 89626, "epoch": 2133} {"train_loss": -6.20701881817409, "global_step": 89627, "epoch": 2133, "val_loss": 75005.8984375} {"train_loss": -6.360299110412598, "global_step": 89628, "epoch": 2134} {"train_loss": -6.408355712890625, "global_step": 89629, "epoch": 2134} {"train_loss": -6.377819061279297, "global_step": 89630, "epoch": 2134} {"train_loss": -6.252266883850098, "global_step": 89631, "epoch": 2134} {"train_loss": -6.357964515686035, "global_step": 89632, "epoch": 2134} {"train_loss": -6.207669258117676, "global_step": 89633, "epoch": 2134} {"train_loss": -6.22587251663208, "global_step": 89634, "epoch": 2134} {"train_loss": -6.242713928222656, "global_step": 89635, "epoch": 2134} {"train_loss": -6.301664352416992, "global_step": 89636, "epoch": 2134} {"train_loss": -6.210228443145752, "global_step": 89637, "epoch": 2134} {"train_loss": -6.1717119216918945, "global_step": 89638, "epoch": 2134} {"train_loss": -6.244650840759277, "global_step": 89639, "epoch": 2134} {"train_loss": -6.056614398956299, "global_step": 89640, "epoch": 2134} {"train_loss": -6.2185516357421875, "global_step": 89641, "epoch": 2134} {"train_loss": -6.319056510925293, "global_step": 89642, "epoch": 2134} {"train_loss": -6.153824806213379, "global_step": 89643, "epoch": 2134} {"train_loss": -6.257742404937744, "global_step": 89644, "epoch": 2134} {"train_loss": -6.313472747802734, "global_step": 89645, "epoch": 2134} {"train_loss": -6.355582237243652, "global_step": 89646, "epoch": 2134} {"train_loss": -6.305249214172363, "global_step": 89647, "epoch": 2134} {"train_loss": -6.1919965744018555, "global_step": 89648, "epoch": 2134} {"train_loss": -6.2568840980529785, "global_step": 89649, "epoch": 2134} {"train_loss": -6.178237438201904, "global_step": 89650, "epoch": 2134} {"train_loss": -6.205401420593262, "global_step": 89651, "epoch": 2134} {"train_loss": -6.152130603790283, "global_step": 89652, "epoch": 2134} {"train_loss": -6.2871994972229, "global_step": 89653, "epoch": 2134} {"train_loss": -6.139700889587402, "global_step": 89654, "epoch": 2134} {"train_loss": -6.286796569824219, "global_step": 89655, "epoch": 2134} {"train_loss": -6.26210355758667, "global_step": 89656, "epoch": 2134} {"train_loss": -6.179230690002441, "global_step": 89657, "epoch": 2134} {"train_loss": -6.282792091369629, "global_step": 89658, "epoch": 2134} {"train_loss": -6.318174362182617, "global_step": 89659, "epoch": 2134} {"train_loss": -6.246498107910156, "global_step": 89660, "epoch": 2134} {"train_loss": -6.226858615875244, "global_step": 89661, "epoch": 2134} {"train_loss": -6.346523284912109, "global_step": 89662, "epoch": 2134} {"train_loss": -6.206264495849609, "global_step": 89663, "epoch": 2134} {"train_loss": -6.208304405212402, "global_step": 89664, "epoch": 2134} {"train_loss": -6.306517124176025, "global_step": 89665, "epoch": 2134} {"train_loss": -6.260110855102539, "global_step": 89666, "epoch": 2134} {"train_loss": -6.238062858581543, "global_step": 89667, "epoch": 2134} {"train_loss": -6.175211429595947, "global_step": 89668, "epoch": 2134} {"train_loss": -6.24767678124564, "global_step": 89669, "epoch": 2134, "val_loss": 75100.2734375} {"train_loss": -6.312045097351074, "global_step": 89670, "epoch": 2135} {"train_loss": -6.236855506896973, "global_step": 89671, "epoch": 2135} {"train_loss": -6.0821003913879395, "global_step": 89672, "epoch": 2135} {"train_loss": -6.31315803527832, "global_step": 89673, "epoch": 2135} {"train_loss": -6.271792411804199, "global_step": 89674, "epoch": 2135} {"train_loss": -6.212561130523682, "global_step": 89675, "epoch": 2135} {"train_loss": -6.162322521209717, "global_step": 89676, "epoch": 2135} {"train_loss": -6.346177101135254, "global_step": 89677, "epoch": 2135} {"train_loss": -6.240936756134033, "global_step": 89678, "epoch": 2135} {"train_loss": -6.143960475921631, "global_step": 89679, "epoch": 2135} {"train_loss": -6.247217655181885, "global_step": 89680, "epoch": 2135} {"train_loss": -6.139161109924316, "global_step": 89681, "epoch": 2135} {"train_loss": -6.281810283660889, "global_step": 89682, "epoch": 2135} {"train_loss": -6.263147354125977, "global_step": 89683, "epoch": 2135} {"train_loss": -6.157522678375244, "global_step": 89684, "epoch": 2135} {"train_loss": -6.265503883361816, "global_step": 89685, "epoch": 2135} {"train_loss": -6.048951148986816, "global_step": 89686, "epoch": 2135} {"train_loss": -6.216216087341309, "global_step": 89687, "epoch": 2135} {"train_loss": -6.195652961730957, "global_step": 89688, "epoch": 2135} {"train_loss": -6.213742256164551, "global_step": 89689, "epoch": 2135} {"train_loss": -6.150289535522461, "global_step": 89690, "epoch": 2135} {"train_loss": -6.229065895080566, "global_step": 89691, "epoch": 2135} {"train_loss": -6.235831260681152, "global_step": 89692, "epoch": 2135} {"train_loss": -6.308812618255615, "global_step": 89693, "epoch": 2135} {"train_loss": -6.234062194824219, "global_step": 89694, "epoch": 2135} {"train_loss": -6.296249866485596, "global_step": 89695, "epoch": 2135} {"train_loss": -6.265731334686279, "global_step": 89696, "epoch": 2135} {"train_loss": -6.232950687408447, "global_step": 89697, "epoch": 2135} {"train_loss": -6.32176399230957, "global_step": 89698, "epoch": 2135} {"train_loss": -6.1927080154418945, "global_step": 89699, "epoch": 2135} {"train_loss": -6.3173370361328125, "global_step": 89700, "epoch": 2135} {"train_loss": -6.234844207763672, "global_step": 89701, "epoch": 2135} {"train_loss": -6.25311803817749, "global_step": 89702, "epoch": 2135} {"train_loss": -6.259984970092773, "global_step": 89703, "epoch": 2135} {"train_loss": -6.164897918701172, "global_step": 89704, "epoch": 2135} {"train_loss": -6.265794277191162, "global_step": 89705, "epoch": 2135} {"train_loss": -6.339604377746582, "global_step": 89706, "epoch": 2135} {"train_loss": -6.167451858520508, "global_step": 89707, "epoch": 2135} {"train_loss": -6.2846574783325195, "global_step": 89708, "epoch": 2135} {"train_loss": -6.165936470031738, "global_step": 89709, "epoch": 2135} {"train_loss": -6.317716121673584, "global_step": 89710, "epoch": 2135} {"train_loss": -6.235648461750576, "global_step": 89711, "epoch": 2135, "val_loss": 75376.1640625} {"train_loss": -6.2493367195129395, "global_step": 89712, "epoch": 2136} {"train_loss": -6.298445701599121, "global_step": 89713, "epoch": 2136} {"train_loss": -6.268425941467285, "global_step": 89714, "epoch": 2136} {"train_loss": -6.273158073425293, "global_step": 89715, "epoch": 2136} {"train_loss": -6.279109001159668, "global_step": 89716, "epoch": 2136} {"train_loss": -6.25225305557251, "global_step": 89717, "epoch": 2136} {"train_loss": -6.2148518562316895, "global_step": 89718, "epoch": 2136} {"train_loss": -6.221598148345947, "global_step": 89719, "epoch": 2136} {"train_loss": -6.306569576263428, "global_step": 89720, "epoch": 2136} {"train_loss": -6.167109489440918, "global_step": 89721, "epoch": 2136} {"train_loss": -6.206502914428711, "global_step": 89722, "epoch": 2136} {"train_loss": -6.258057594299316, "global_step": 89723, "epoch": 2136} {"train_loss": -6.326940536499023, "global_step": 89724, "epoch": 2136} {"train_loss": -6.142324924468994, "global_step": 89725, "epoch": 2136} {"train_loss": -6.276849746704102, "global_step": 89726, "epoch": 2136} {"train_loss": -6.268218994140625, "global_step": 89727, "epoch": 2136} {"train_loss": -6.262750625610352, "global_step": 89728, "epoch": 2136} {"train_loss": -6.2694292068481445, "global_step": 89729, "epoch": 2136} {"train_loss": -6.286778450012207, "global_step": 89730, "epoch": 2136} {"train_loss": -6.226009845733643, "global_step": 89731, "epoch": 2136} {"train_loss": -6.174439430236816, "global_step": 89732, "epoch": 2136} {"train_loss": -6.301270484924316, "global_step": 89733, "epoch": 2136} {"train_loss": -6.386056900024414, "global_step": 89734, "epoch": 2136} {"train_loss": -6.304062366485596, "global_step": 89735, "epoch": 2136} {"train_loss": -6.379230499267578, "global_step": 89736, "epoch": 2136} {"train_loss": -6.244419097900391, "global_step": 89737, "epoch": 2136} {"train_loss": -6.208095550537109, "global_step": 89738, "epoch": 2136} {"train_loss": -6.30302619934082, "global_step": 89739, "epoch": 2136} {"train_loss": -6.251164436340332, "global_step": 89740, "epoch": 2136} {"train_loss": -6.276147365570068, "global_step": 89741, "epoch": 2136} {"train_loss": -6.296121597290039, "global_step": 89742, "epoch": 2136} {"train_loss": -6.343900203704834, "global_step": 89743, "epoch": 2136} {"train_loss": -6.3770599365234375, "global_step": 89744, "epoch": 2136} {"train_loss": -6.097141742706299, "global_step": 89745, "epoch": 2136} {"train_loss": -6.342986106872559, "global_step": 89746, "epoch": 2136} {"train_loss": -6.298022270202637, "global_step": 89747, "epoch": 2136} {"train_loss": -6.184417247772217, "global_step": 89748, "epoch": 2136} {"train_loss": -6.2441534996032715, "global_step": 89749, "epoch": 2136} {"train_loss": -6.294206619262695, "global_step": 89750, "epoch": 2136} {"train_loss": -6.377423286437988, "global_step": 89751, "epoch": 2136} {"train_loss": -6.1962785720825195, "global_step": 89752, "epoch": 2136} {"train_loss": -6.269863196781704, "global_step": 89753, "epoch": 2136, "val_loss": 75351.375} {"train_loss": -6.367891788482666, "global_step": 89754, "epoch": 2137} {"train_loss": -6.150464057922363, "global_step": 89755, "epoch": 2137} {"train_loss": -6.214663505554199, "global_step": 89756, "epoch": 2137} {"train_loss": -6.27803897857666, "global_step": 89757, "epoch": 2137} {"train_loss": -6.202045917510986, "global_step": 89758, "epoch": 2137} {"train_loss": -6.21830940246582, "global_step": 89759, "epoch": 2137} {"train_loss": -6.350667953491211, "global_step": 89760, "epoch": 2137} {"train_loss": -6.271089553833008, "global_step": 89761, "epoch": 2137} {"train_loss": -6.162546634674072, "global_step": 89762, "epoch": 2137} {"train_loss": -6.2255659103393555, "global_step": 89763, "epoch": 2137} {"train_loss": -6.205913543701172, "global_step": 89764, "epoch": 2137} {"train_loss": -6.2490997314453125, "global_step": 89765, "epoch": 2137} {"train_loss": -6.364609718322754, "global_step": 89766, "epoch": 2137} {"train_loss": -6.077969551086426, "global_step": 89767, "epoch": 2137} {"train_loss": -6.268951416015625, "global_step": 89768, "epoch": 2137} {"train_loss": -6.126840591430664, "global_step": 89769, "epoch": 2137} {"train_loss": -6.253955841064453, "global_step": 89770, "epoch": 2137} {"train_loss": -6.2541961669921875, "global_step": 89771, "epoch": 2137} {"train_loss": -6.152746200561523, "global_step": 89772, "epoch": 2137} {"train_loss": -6.16480016708374, "global_step": 89773, "epoch": 2137} {"train_loss": -6.135354995727539, "global_step": 89774, "epoch": 2137} {"train_loss": -6.249758720397949, "global_step": 89775, "epoch": 2137} {"train_loss": -6.159468173980713, "global_step": 89776, "epoch": 2137} {"train_loss": -6.097497940063477, "global_step": 89777, "epoch": 2137} {"train_loss": -6.218012809753418, "global_step": 89778, "epoch": 2137} {"train_loss": -6.127858638763428, "global_step": 89779, "epoch": 2137} {"train_loss": -6.251871109008789, "global_step": 89780, "epoch": 2137} {"train_loss": -6.220342636108398, "global_step": 89781, "epoch": 2137} {"train_loss": -6.295980453491211, "global_step": 89782, "epoch": 2137} {"train_loss": -6.099582672119141, "global_step": 89783, "epoch": 2137} {"train_loss": -6.361597061157227, "global_step": 89784, "epoch": 2137} {"train_loss": -6.258427143096924, "global_step": 89785, "epoch": 2137} {"train_loss": -6.314852714538574, "global_step": 89786, "epoch": 2137} {"train_loss": -6.287390232086182, "global_step": 89787, "epoch": 2137} {"train_loss": -6.105992317199707, "global_step": 89788, "epoch": 2137} {"train_loss": -6.26901912689209, "global_step": 89789, "epoch": 2137} {"train_loss": -6.269145965576172, "global_step": 89790, "epoch": 2137} {"train_loss": -6.300600051879883, "global_step": 89791, "epoch": 2137} {"train_loss": -6.175860404968262, "global_step": 89792, "epoch": 2137} {"train_loss": -6.2433881759643555, "global_step": 89793, "epoch": 2137} {"train_loss": -6.169168472290039, "global_step": 89794, "epoch": 2137} {"train_loss": -6.224197353635516, "global_step": 89795, "epoch": 2137, "val_loss": 75231.21875} {"train_loss": -6.349127292633057, "global_step": 89796, "epoch": 2138} {"train_loss": -6.314437389373779, "global_step": 89797, "epoch": 2138} {"train_loss": -6.157525539398193, "global_step": 89798, "epoch": 2138} {"train_loss": -6.299263954162598, "global_step": 89799, "epoch": 2138} {"train_loss": -6.226217269897461, "global_step": 89800, "epoch": 2138} {"train_loss": -6.254812240600586, "global_step": 89801, "epoch": 2138} {"train_loss": -6.264691352844238, "global_step": 89802, "epoch": 2138} {"train_loss": -6.14992618560791, "global_step": 89803, "epoch": 2138} {"train_loss": -6.158843040466309, "global_step": 89804, "epoch": 2138} {"train_loss": -6.13161563873291, "global_step": 89805, "epoch": 2138} {"train_loss": -6.331686019897461, "global_step": 89806, "epoch": 2138} {"train_loss": -6.207353591918945, "global_step": 89807, "epoch": 2138} {"train_loss": -6.368491172790527, "global_step": 89808, "epoch": 2138} {"train_loss": -6.266764163970947, "global_step": 89809, "epoch": 2138} {"train_loss": -6.1558074951171875, "global_step": 89810, "epoch": 2138} {"train_loss": -6.201046466827393, "global_step": 89811, "epoch": 2138} {"train_loss": -6.150184631347656, "global_step": 89812, "epoch": 2138} {"train_loss": -6.179635047912598, "global_step": 89813, "epoch": 2138} {"train_loss": -6.179943084716797, "global_step": 89814, "epoch": 2138} {"train_loss": -6.16901969909668, "global_step": 89815, "epoch": 2138} {"train_loss": -6.375065326690674, "global_step": 89816, "epoch": 2138} {"train_loss": -6.333999156951904, "global_step": 89817, "epoch": 2138} {"train_loss": -6.133198261260986, "global_step": 89818, "epoch": 2138} {"train_loss": -6.275198459625244, "global_step": 89819, "epoch": 2138} {"train_loss": -6.242709159851074, "global_step": 89820, "epoch": 2138} {"train_loss": -6.181760311126709, "global_step": 89821, "epoch": 2138} {"train_loss": -6.11210298538208, "global_step": 89822, "epoch": 2138} {"train_loss": -6.197216987609863, "global_step": 89823, "epoch": 2138} {"train_loss": -6.194124221801758, "global_step": 89824, "epoch": 2138} {"train_loss": -6.244090557098389, "global_step": 89825, "epoch": 2138} {"train_loss": -6.184757232666016, "global_step": 89826, "epoch": 2138} {"train_loss": -6.186519622802734, "global_step": 89827, "epoch": 2138} {"train_loss": -6.243735313415527, "global_step": 89828, "epoch": 2138} {"train_loss": -6.152797698974609, "global_step": 89829, "epoch": 2138} {"train_loss": -6.268367767333984, "global_step": 89830, "epoch": 2138} {"train_loss": -6.221802711486816, "global_step": 89831, "epoch": 2138} {"train_loss": -6.2115559577941895, "global_step": 89832, "epoch": 2138} {"train_loss": -6.138453483581543, "global_step": 89833, "epoch": 2138} {"train_loss": -6.085852146148682, "global_step": 89834, "epoch": 2138} {"train_loss": -6.140823841094971, "global_step": 89835, "epoch": 2138} {"train_loss": -6.174228668212891, "global_step": 89836, "epoch": 2138} {"train_loss": -6.211579845065162, "global_step": 89837, "epoch": 2138, "val_loss": 75355.25} {"train_loss": -6.168834686279297, "global_step": 89838, "epoch": 2139} {"train_loss": -6.170008659362793, "global_step": 89839, "epoch": 2139} {"train_loss": -6.271875381469727, "global_step": 89840, "epoch": 2139} {"train_loss": -6.138079643249512, "global_step": 89841, "epoch": 2139} {"train_loss": -6.156362533569336, "global_step": 89842, "epoch": 2139} {"train_loss": -6.285391807556152, "global_step": 89843, "epoch": 2139} {"train_loss": -6.174685001373291, "global_step": 89844, "epoch": 2139} {"train_loss": -6.207144737243652, "global_step": 89845, "epoch": 2139} {"train_loss": -6.158108234405518, "global_step": 89846, "epoch": 2139} {"train_loss": -6.2401533126831055, "global_step": 89847, "epoch": 2139} {"train_loss": -6.053859710693359, "global_step": 89848, "epoch": 2139} {"train_loss": -6.309840202331543, "global_step": 89849, "epoch": 2139} {"train_loss": -6.2917327880859375, "global_step": 89850, "epoch": 2139} {"train_loss": -6.206347465515137, "global_step": 89851, "epoch": 2139} {"train_loss": -6.252274990081787, "global_step": 89852, "epoch": 2139} {"train_loss": -6.241184234619141, "global_step": 89853, "epoch": 2139} {"train_loss": -6.247383117675781, "global_step": 89854, "epoch": 2139} {"train_loss": -6.131284236907959, "global_step": 89855, "epoch": 2139} {"train_loss": -6.243921756744385, "global_step": 89856, "epoch": 2139} {"train_loss": -6.097772598266602, "global_step": 89857, "epoch": 2139} {"train_loss": -6.229917526245117, "global_step": 89858, "epoch": 2139} {"train_loss": -6.157683849334717, "global_step": 89859, "epoch": 2139} {"train_loss": -6.1925764083862305, "global_step": 89860, "epoch": 2139} {"train_loss": -6.364649772644043, "global_step": 89861, "epoch": 2139} {"train_loss": -6.187795639038086, "global_step": 89862, "epoch": 2139} {"train_loss": -6.183137893676758, "global_step": 89863, "epoch": 2139} {"train_loss": -6.3254289627075195, "global_step": 89864, "epoch": 2139} {"train_loss": -6.289207458496094, "global_step": 89865, "epoch": 2139} {"train_loss": -6.175078392028809, "global_step": 89866, "epoch": 2139} {"train_loss": -6.2669148445129395, "global_step": 89867, "epoch": 2139} {"train_loss": -6.286462783813477, "global_step": 89868, "epoch": 2139} {"train_loss": -6.297828674316406, "global_step": 89869, "epoch": 2139} {"train_loss": -6.280832290649414, "global_step": 89870, "epoch": 2139} {"train_loss": -6.246380805969238, "global_step": 89871, "epoch": 2139} {"train_loss": -6.328946113586426, "global_step": 89872, "epoch": 2139} {"train_loss": -6.122230052947998, "global_step": 89873, "epoch": 2139} {"train_loss": -6.131354331970215, "global_step": 89874, "epoch": 2139} {"train_loss": -6.117018699645996, "global_step": 89875, "epoch": 2139} {"train_loss": -6.226759910583496, "global_step": 89876, "epoch": 2139} {"train_loss": -6.186175346374512, "global_step": 89877, "epoch": 2139} {"train_loss": -6.135684013366699, "global_step": 89878, "epoch": 2139} {"train_loss": -6.212397234780448, "global_step": 89879, "epoch": 2139, "val_loss": 75257.171875} {"train_loss": -6.282271385192871, "global_step": 89880, "epoch": 2140} {"train_loss": -6.280829429626465, "global_step": 89881, "epoch": 2140} {"train_loss": -6.266134262084961, "global_step": 89882, "epoch": 2140} {"train_loss": -6.2013840675354, "global_step": 89883, "epoch": 2140} {"train_loss": -6.1520819664001465, "global_step": 89884, "epoch": 2140} {"train_loss": -6.236418724060059, "global_step": 89885, "epoch": 2140} {"train_loss": -6.2505340576171875, "global_step": 89886, "epoch": 2140} {"train_loss": -6.109310626983643, "global_step": 89887, "epoch": 2140} {"train_loss": -6.275026321411133, "global_step": 89888, "epoch": 2140} {"train_loss": -6.195664882659912, "global_step": 89889, "epoch": 2140} {"train_loss": -6.1712446212768555, "global_step": 89890, "epoch": 2140} {"train_loss": -6.28439998626709, "global_step": 89891, "epoch": 2140} {"train_loss": -6.215303421020508, "global_step": 89892, "epoch": 2140} {"train_loss": -6.261806488037109, "global_step": 89893, "epoch": 2140} {"train_loss": -6.1776041984558105, "global_step": 89894, "epoch": 2140} {"train_loss": -6.258063316345215, "global_step": 89895, "epoch": 2140} {"train_loss": -6.305910587310791, "global_step": 89896, "epoch": 2140} {"train_loss": -6.035174369812012, "global_step": 89897, "epoch": 2140} {"train_loss": -6.306933403015137, "global_step": 89898, "epoch": 2140} {"train_loss": -6.256818771362305, "global_step": 89899, "epoch": 2140} {"train_loss": -6.0201416015625, "global_step": 89900, "epoch": 2140} {"train_loss": -6.281733989715576, "global_step": 89901, "epoch": 2140} {"train_loss": -6.214581489562988, "global_step": 89902, "epoch": 2140} {"train_loss": -6.1560187339782715, "global_step": 89903, "epoch": 2140} {"train_loss": -6.270760536193848, "global_step": 89904, "epoch": 2140} {"train_loss": -6.144693374633789, "global_step": 89905, "epoch": 2140} {"train_loss": -6.210126876831055, "global_step": 89906, "epoch": 2140} {"train_loss": -6.090867519378662, "global_step": 89907, "epoch": 2140} {"train_loss": -6.206562042236328, "global_step": 89908, "epoch": 2140} {"train_loss": -6.159665584564209, "global_step": 89909, "epoch": 2140} {"train_loss": -6.3402581214904785, "global_step": 89910, "epoch": 2140} {"train_loss": -6.185280799865723, "global_step": 89911, "epoch": 2140} {"train_loss": -6.225641250610352, "global_step": 89912, "epoch": 2140} {"train_loss": -6.325888156890869, "global_step": 89913, "epoch": 2140} {"train_loss": -6.181830883026123, "global_step": 89914, "epoch": 2140} {"train_loss": -6.2343034744262695, "global_step": 89915, "epoch": 2140} {"train_loss": -6.239954948425293, "global_step": 89916, "epoch": 2140} {"train_loss": -6.225167274475098, "global_step": 89917, "epoch": 2140} {"train_loss": -6.248810768127441, "global_step": 89918, "epoch": 2140} {"train_loss": -6.229840278625488, "global_step": 89919, "epoch": 2140} {"train_loss": -6.199517726898193, "global_step": 89920, "epoch": 2140} {"train_loss": -6.215132134301322, "global_step": 89921, "epoch": 2140, "val_loss": 75461.4375} {"train_loss": -6.231633186340332, "global_step": 89922, "epoch": 2141} {"train_loss": -6.167879104614258, "global_step": 89923, "epoch": 2141} {"train_loss": -6.25400972366333, "global_step": 89924, "epoch": 2141} {"train_loss": -6.26987361907959, "global_step": 89925, "epoch": 2141} {"train_loss": -6.218488693237305, "global_step": 89926, "epoch": 2141} {"train_loss": -6.297670841217041, "global_step": 89927, "epoch": 2141} {"train_loss": -6.269106864929199, "global_step": 89928, "epoch": 2141} {"train_loss": -6.271692276000977, "global_step": 89929, "epoch": 2141} {"train_loss": -6.231133460998535, "global_step": 89930, "epoch": 2141} {"train_loss": -6.260725498199463, "global_step": 89931, "epoch": 2141} {"train_loss": -6.27488899230957, "global_step": 89932, "epoch": 2141} {"train_loss": -6.225645542144775, "global_step": 89933, "epoch": 2141} {"train_loss": -6.220771789550781, "global_step": 89934, "epoch": 2141} {"train_loss": -6.267571449279785, "global_step": 89935, "epoch": 2141} {"train_loss": -6.266063690185547, "global_step": 89936, "epoch": 2141} {"train_loss": -6.249530792236328, "global_step": 89937, "epoch": 2141} {"train_loss": -6.27714729309082, "global_step": 89938, "epoch": 2141} {"train_loss": -6.173723220825195, "global_step": 89939, "epoch": 2141} {"train_loss": -6.413761138916016, "global_step": 89940, "epoch": 2141} {"train_loss": -6.140801429748535, "global_step": 89941, "epoch": 2141} {"train_loss": -6.301797866821289, "global_step": 89942, "epoch": 2141} {"train_loss": -6.306180477142334, "global_step": 89943, "epoch": 2141} {"train_loss": -6.386742115020752, "global_step": 89944, "epoch": 2141} {"train_loss": -6.401259899139404, "global_step": 89945, "epoch": 2141} {"train_loss": -6.179405212402344, "global_step": 89946, "epoch": 2141} {"train_loss": -6.2504658699035645, "global_step": 89947, "epoch": 2141} {"train_loss": -6.250300407409668, "global_step": 89948, "epoch": 2141} {"train_loss": -6.283013343811035, "global_step": 89949, "epoch": 2141} {"train_loss": -6.160038948059082, "global_step": 89950, "epoch": 2141} {"train_loss": -6.160642147064209, "global_step": 89951, "epoch": 2141} {"train_loss": -6.283432960510254, "global_step": 89952, "epoch": 2141} {"train_loss": -6.2641096115112305, "global_step": 89953, "epoch": 2141} {"train_loss": -6.082502365112305, "global_step": 89954, "epoch": 2141} {"train_loss": -6.263514518737793, "global_step": 89955, "epoch": 2141} {"train_loss": -6.077099800109863, "global_step": 89956, "epoch": 2141} {"train_loss": -6.218250274658203, "global_step": 89957, "epoch": 2141} {"train_loss": -6.196746826171875, "global_step": 89958, "epoch": 2141} {"train_loss": -6.1740312576293945, "global_step": 89959, "epoch": 2141} {"train_loss": -6.3256683349609375, "global_step": 89960, "epoch": 2141} {"train_loss": -6.274312496185303, "global_step": 89961, "epoch": 2141} {"train_loss": -6.317910671234131, "global_step": 89962, "epoch": 2141} {"train_loss": -6.24640028817313, "global_step": 89963, "epoch": 2141, "val_loss": 75355.046875} {"train_loss": -6.391160011291504, "global_step": 89964, "epoch": 2142} {"train_loss": -6.247177600860596, "global_step": 89965, "epoch": 2142} {"train_loss": -6.233565330505371, "global_step": 89966, "epoch": 2142} {"train_loss": -6.223372459411621, "global_step": 89967, "epoch": 2142} {"train_loss": -6.108142375946045, "global_step": 89968, "epoch": 2142} {"train_loss": -6.211893558502197, "global_step": 89969, "epoch": 2142} {"train_loss": -6.167603969573975, "global_step": 89970, "epoch": 2142} {"train_loss": -6.220356464385986, "global_step": 89971, "epoch": 2142} {"train_loss": -6.350246906280518, "global_step": 89972, "epoch": 2142} {"train_loss": -6.173557281494141, "global_step": 89973, "epoch": 2142} {"train_loss": -6.215086936950684, "global_step": 89974, "epoch": 2142} {"train_loss": -6.291959762573242, "global_step": 89975, "epoch": 2142} {"train_loss": -6.187560081481934, "global_step": 89976, "epoch": 2142} {"train_loss": -6.246338367462158, "global_step": 89977, "epoch": 2142} {"train_loss": -6.240139007568359, "global_step": 89978, "epoch": 2142} {"train_loss": -6.273069381713867, "global_step": 89979, "epoch": 2142} {"train_loss": -6.35299015045166, "global_step": 89980, "epoch": 2142} {"train_loss": -6.21258020401001, "global_step": 89981, "epoch": 2142} {"train_loss": -6.30396032333374, "global_step": 89982, "epoch": 2142} {"train_loss": -6.249286651611328, "global_step": 89983, "epoch": 2142} {"train_loss": -6.3178300857543945, "global_step": 89984, "epoch": 2142} {"train_loss": -6.192054271697998, "global_step": 89985, "epoch": 2142} {"train_loss": -6.326130390167236, "global_step": 89986, "epoch": 2142} {"train_loss": -6.22760009765625, "global_step": 89987, "epoch": 2142} {"train_loss": -6.146234035491943, "global_step": 89988, "epoch": 2142} {"train_loss": -6.318836212158203, "global_step": 89989, "epoch": 2142} {"train_loss": -6.144404411315918, "global_step": 89990, "epoch": 2142} {"train_loss": -6.229297161102295, "global_step": 89991, "epoch": 2142} {"train_loss": -6.304917335510254, "global_step": 89992, "epoch": 2142} {"train_loss": -6.341573238372803, "global_step": 89993, "epoch": 2142} {"train_loss": -6.2740912437438965, "global_step": 89994, "epoch": 2142} {"train_loss": -6.3863067626953125, "global_step": 89995, "epoch": 2142} {"train_loss": -6.212991237640381, "global_step": 89996, "epoch": 2142} {"train_loss": -6.243833065032959, "global_step": 89997, "epoch": 2142} {"train_loss": -6.3156585693359375, "global_step": 89998, "epoch": 2142} {"train_loss": -6.266777038574219, "global_step": 89999, "epoch": 2142} {"train_loss": -6.271384239196777, "global_step": 90000, "epoch": 2142} {"train_loss": -6.152983665466309, "global_step": 90001, "epoch": 2142} {"train_loss": -6.243001461029053, "global_step": 90002, "epoch": 2142} {"train_loss": -6.224449157714844, "global_step": 90003, "epoch": 2142} {"train_loss": -6.314939498901367, "global_step": 90004, "epoch": 2142} {"train_loss": -6.253124838783627, "global_step": 90005, "epoch": 2142, "val_loss": 75440.6953125} {"train_loss": -6.108346939086914, "global_step": 90006, "epoch": 2143} {"train_loss": -6.270231246948242, "global_step": 90007, "epoch": 2143} {"train_loss": -6.240888595581055, "global_step": 90008, "epoch": 2143} {"train_loss": -6.292939186096191, "global_step": 90009, "epoch": 2143} {"train_loss": -6.3944315910339355, "global_step": 90010, "epoch": 2143} {"train_loss": -6.279629707336426, "global_step": 90011, "epoch": 2143} {"train_loss": -6.1782684326171875, "global_step": 90012, "epoch": 2143} {"train_loss": -6.3402252197265625, "global_step": 90013, "epoch": 2143} {"train_loss": -6.268611431121826, "global_step": 90014, "epoch": 2143} {"train_loss": -6.247891426086426, "global_step": 90015, "epoch": 2143} {"train_loss": -6.305509567260742, "global_step": 90016, "epoch": 2143} {"train_loss": -6.157066345214844, "global_step": 90017, "epoch": 2143} {"train_loss": -6.264880180358887, "global_step": 90018, "epoch": 2143} {"train_loss": -6.217889785766602, "global_step": 90019, "epoch": 2143} {"train_loss": -6.217555999755859, "global_step": 90020, "epoch": 2143} {"train_loss": -6.287593841552734, "global_step": 90021, "epoch": 2143} {"train_loss": -6.120697021484375, "global_step": 90022, "epoch": 2143} {"train_loss": -6.311492919921875, "global_step": 90023, "epoch": 2143} {"train_loss": -6.304193496704102, "global_step": 90024, "epoch": 2143} {"train_loss": -6.258256912231445, "global_step": 90025, "epoch": 2143} {"train_loss": -6.299128532409668, "global_step": 90026, "epoch": 2143} {"train_loss": -6.265108108520508, "global_step": 90027, "epoch": 2143} {"train_loss": -6.159956932067871, "global_step": 90028, "epoch": 2143} {"train_loss": -6.3325605392456055, "global_step": 90029, "epoch": 2143} {"train_loss": -6.30940055847168, "global_step": 90030, "epoch": 2143} {"train_loss": -6.261202812194824, "global_step": 90031, "epoch": 2143} {"train_loss": -6.253087520599365, "global_step": 90032, "epoch": 2143} {"train_loss": -6.245984077453613, "global_step": 90033, "epoch": 2143} {"train_loss": -6.24616813659668, "global_step": 90034, "epoch": 2143} {"train_loss": -6.280612468719482, "global_step": 90035, "epoch": 2143} {"train_loss": -6.211430549621582, "global_step": 90036, "epoch": 2143} {"train_loss": -6.20828914642334, "global_step": 90037, "epoch": 2143} {"train_loss": -6.207064628601074, "global_step": 90038, "epoch": 2143} {"train_loss": -6.2559380531311035, "global_step": 90039, "epoch": 2143} {"train_loss": -6.249935150146484, "global_step": 90040, "epoch": 2143} {"train_loss": -6.308553218841553, "global_step": 90041, "epoch": 2143} {"train_loss": -6.2317280769348145, "global_step": 90042, "epoch": 2143} {"train_loss": -6.160787582397461, "global_step": 90043, "epoch": 2143} {"train_loss": -6.2252092361450195, "global_step": 90044, "epoch": 2143} {"train_loss": -6.216526508331299, "global_step": 90045, "epoch": 2143} {"train_loss": -6.21334171295166, "global_step": 90046, "epoch": 2143} {"train_loss": -6.247629721959432, "global_step": 90047, "epoch": 2143, "val_loss": 75591.765625} {"train_loss": -6.208126068115234, "global_step": 90048, "epoch": 2144} {"train_loss": -6.199721813201904, "global_step": 90049, "epoch": 2144} {"train_loss": -6.231959819793701, "global_step": 90050, "epoch": 2144} {"train_loss": -6.353692054748535, "global_step": 90051, "epoch": 2144} {"train_loss": -6.318341255187988, "global_step": 90052, "epoch": 2144} {"train_loss": -6.353353023529053, "global_step": 90053, "epoch": 2144} {"train_loss": -6.299164772033691, "global_step": 90054, "epoch": 2144} {"train_loss": -6.304894924163818, "global_step": 90055, "epoch": 2144} {"train_loss": -6.240607261657715, "global_step": 90056, "epoch": 2144} {"train_loss": -6.204476356506348, "global_step": 90057, "epoch": 2144} {"train_loss": -6.251703262329102, "global_step": 90058, "epoch": 2144} {"train_loss": -6.255077838897705, "global_step": 90059, "epoch": 2144} {"train_loss": -6.018267631530762, "global_step": 90060, "epoch": 2144} {"train_loss": -6.3020806312561035, "global_step": 90061, "epoch": 2144} {"train_loss": -6.083924770355225, "global_step": 90062, "epoch": 2144} {"train_loss": -6.162423610687256, "global_step": 90063, "epoch": 2144} {"train_loss": -6.216741561889648, "global_step": 90064, "epoch": 2144} {"train_loss": -6.062289237976074, "global_step": 90065, "epoch": 2144} {"train_loss": -6.2313055992126465, "global_step": 90066, "epoch": 2144} {"train_loss": -6.242156982421875, "global_step": 90067, "epoch": 2144} {"train_loss": -6.104585647583008, "global_step": 90068, "epoch": 2144} {"train_loss": -6.218539714813232, "global_step": 90069, "epoch": 2144} {"train_loss": -6.143232345581055, "global_step": 90070, "epoch": 2144} {"train_loss": -6.1903839111328125, "global_step": 90071, "epoch": 2144} {"train_loss": -6.2749342918396, "global_step": 90072, "epoch": 2144} {"train_loss": -6.121299743652344, "global_step": 90073, "epoch": 2144} {"train_loss": -6.296021461486816, "global_step": 90074, "epoch": 2144} {"train_loss": -6.31998872756958, "global_step": 90075, "epoch": 2144} {"train_loss": -6.301183700561523, "global_step": 90076, "epoch": 2144} {"train_loss": -6.339630603790283, "global_step": 90077, "epoch": 2144} {"train_loss": -6.305206298828125, "global_step": 90078, "epoch": 2144} {"train_loss": -6.186065673828125, "global_step": 90079, "epoch": 2144} {"train_loss": -6.15071439743042, "global_step": 90080, "epoch": 2144} {"train_loss": -6.262162685394287, "global_step": 90081, "epoch": 2144} {"train_loss": -6.2260026931762695, "global_step": 90082, "epoch": 2144} {"train_loss": -6.229569911956787, "global_step": 90083, "epoch": 2144} {"train_loss": -6.221147537231445, "global_step": 90084, "epoch": 2144} {"train_loss": -6.358611106872559, "global_step": 90085, "epoch": 2144} {"train_loss": -6.166131019592285, "global_step": 90086, "epoch": 2144} {"train_loss": -6.203097820281982, "global_step": 90087, "epoch": 2144} {"train_loss": -6.302432537078857, "global_step": 90088, "epoch": 2144} {"train_loss": -6.230894747234526, "global_step": 90089, "epoch": 2144, "val_loss": 75254.3828125} {"train_loss": -6.218689918518066, "global_step": 90090, "epoch": 2145} {"train_loss": -6.274553298950195, "global_step": 90091, "epoch": 2145} {"train_loss": -6.245664596557617, "global_step": 90092, "epoch": 2145} {"train_loss": -6.314541339874268, "global_step": 90093, "epoch": 2145} {"train_loss": -6.279184341430664, "global_step": 90094, "epoch": 2145} {"train_loss": -6.302298545837402, "global_step": 90095, "epoch": 2145} {"train_loss": -6.159912586212158, "global_step": 90096, "epoch": 2145} {"train_loss": -6.190130233764648, "global_step": 90097, "epoch": 2145} {"train_loss": -6.276178359985352, "global_step": 90098, "epoch": 2145} {"train_loss": -6.274714469909668, "global_step": 90099, "epoch": 2145} {"train_loss": -6.186501502990723, "global_step": 90100, "epoch": 2145} {"train_loss": -6.321704864501953, "global_step": 90101, "epoch": 2145} {"train_loss": -6.167959690093994, "global_step": 90102, "epoch": 2145} {"train_loss": -6.229820251464844, "global_step": 90103, "epoch": 2145} {"train_loss": -6.1653289794921875, "global_step": 90104, "epoch": 2145} {"train_loss": -6.245353698730469, "global_step": 90105, "epoch": 2145} {"train_loss": -6.154435157775879, "global_step": 90106, "epoch": 2145} {"train_loss": -6.257621765136719, "global_step": 90107, "epoch": 2145} {"train_loss": -6.055115699768066, "global_step": 90108, "epoch": 2145} {"train_loss": -6.1237897872924805, "global_step": 90109, "epoch": 2145} {"train_loss": -6.155320644378662, "global_step": 90110, "epoch": 2145} {"train_loss": -6.244002342224121, "global_step": 90111, "epoch": 2145} {"train_loss": -6.2622270584106445, "global_step": 90112, "epoch": 2145} {"train_loss": -6.124818801879883, "global_step": 90113, "epoch": 2145} {"train_loss": -6.291881561279297, "global_step": 90114, "epoch": 2145} {"train_loss": -6.123659610748291, "global_step": 90115, "epoch": 2145} {"train_loss": -6.21259069442749, "global_step": 90116, "epoch": 2145} {"train_loss": -6.182753086090088, "global_step": 90117, "epoch": 2145} {"train_loss": -6.300188064575195, "global_step": 90118, "epoch": 2145} {"train_loss": -6.166003704071045, "global_step": 90119, "epoch": 2145} {"train_loss": -6.181299209594727, "global_step": 90120, "epoch": 2145} {"train_loss": -6.252610206604004, "global_step": 90121, "epoch": 2145} {"train_loss": -6.408946514129639, "global_step": 90122, "epoch": 2145} {"train_loss": -6.271689414978027, "global_step": 90123, "epoch": 2145} {"train_loss": -6.306460857391357, "global_step": 90124, "epoch": 2145} {"train_loss": -6.234490394592285, "global_step": 90125, "epoch": 2145} {"train_loss": -6.221177101135254, "global_step": 90126, "epoch": 2145} {"train_loss": -6.2646989822387695, "global_step": 90127, "epoch": 2145} {"train_loss": -6.248469829559326, "global_step": 90128, "epoch": 2145} {"train_loss": -6.25527286529541, "global_step": 90129, "epoch": 2145} {"train_loss": -6.044201850891113, "global_step": 90130, "epoch": 2145} {"train_loss": -6.225285053253174, "global_step": 90131, "epoch": 2145, "val_loss": 75439.5} {"train_loss": -6.243568420410156, "global_step": 90132, "epoch": 2146} {"train_loss": -6.192625999450684, "global_step": 90133, "epoch": 2146} {"train_loss": -6.15418815612793, "global_step": 90134, "epoch": 2146} {"train_loss": -6.243888854980469, "global_step": 90135, "epoch": 2146} {"train_loss": -6.117426872253418, "global_step": 90136, "epoch": 2146} {"train_loss": -6.305973052978516, "global_step": 90137, "epoch": 2146} {"train_loss": -6.171352386474609, "global_step": 90138, "epoch": 2146} {"train_loss": -6.1637163162231445, "global_step": 90139, "epoch": 2146} {"train_loss": -6.265378952026367, "global_step": 90140, "epoch": 2146} {"train_loss": -6.095476150512695, "global_step": 90141, "epoch": 2146} {"train_loss": -6.320459365844727, "global_step": 90142, "epoch": 2146} {"train_loss": -6.212839603424072, "global_step": 90143, "epoch": 2146} {"train_loss": -6.181128025054932, "global_step": 90144, "epoch": 2146} {"train_loss": -6.2457966804504395, "global_step": 90145, "epoch": 2146} {"train_loss": -6.282597541809082, "global_step": 90146, "epoch": 2146} {"train_loss": -6.218019485473633, "global_step": 90147, "epoch": 2146} {"train_loss": -6.247086524963379, "global_step": 90148, "epoch": 2146} {"train_loss": -6.192625045776367, "global_step": 90149, "epoch": 2146} {"train_loss": -6.160523414611816, "global_step": 90150, "epoch": 2146} {"train_loss": -6.169498443603516, "global_step": 90151, "epoch": 2146} {"train_loss": -6.208802700042725, "global_step": 90152, "epoch": 2146} {"train_loss": -6.075412273406982, "global_step": 90153, "epoch": 2146} {"train_loss": -6.234888553619385, "global_step": 90154, "epoch": 2146} {"train_loss": -6.185403823852539, "global_step": 90155, "epoch": 2146} {"train_loss": -6.213179111480713, "global_step": 90156, "epoch": 2146} {"train_loss": -6.1398115158081055, "global_step": 90157, "epoch": 2146} {"train_loss": -6.057760238647461, "global_step": 90158, "epoch": 2146} {"train_loss": -6.223126411437988, "global_step": 90159, "epoch": 2146} {"train_loss": -6.307408809661865, "global_step": 90160, "epoch": 2146} {"train_loss": -6.2361249923706055, "global_step": 90161, "epoch": 2146} {"train_loss": -6.215388774871826, "global_step": 90162, "epoch": 2146} {"train_loss": -6.195981025695801, "global_step": 90163, "epoch": 2146} {"train_loss": -6.151150703430176, "global_step": 90164, "epoch": 2146} {"train_loss": -6.19410514831543, "global_step": 90165, "epoch": 2146} {"train_loss": -6.17669677734375, "global_step": 90166, "epoch": 2146} {"train_loss": -6.112318992614746, "global_step": 90167, "epoch": 2146} {"train_loss": -6.194618225097656, "global_step": 90168, "epoch": 2146} {"train_loss": -6.216719627380371, "global_step": 90169, "epoch": 2146} {"train_loss": -6.236449241638184, "global_step": 90170, "epoch": 2146} {"train_loss": -6.361940383911133, "global_step": 90171, "epoch": 2146} {"train_loss": -6.1673479080200195, "global_step": 90172, "epoch": 2146} {"train_loss": -6.202566907519386, "global_step": 90173, "epoch": 2146, "val_loss": 75572.6328125} {"train_loss": -6.193082809448242, "global_step": 90174, "epoch": 2147} {"train_loss": -6.241817474365234, "global_step": 90175, "epoch": 2147} {"train_loss": -6.17070198059082, "global_step": 90176, "epoch": 2147} {"train_loss": -6.151959419250488, "global_step": 90177, "epoch": 2147} {"train_loss": -6.233375549316406, "global_step": 90178, "epoch": 2147} {"train_loss": -6.255978107452393, "global_step": 90179, "epoch": 2147} {"train_loss": -6.245530128479004, "global_step": 90180, "epoch": 2147} {"train_loss": -6.236860752105713, "global_step": 90181, "epoch": 2147} {"train_loss": -6.094043731689453, "global_step": 90182, "epoch": 2147} {"train_loss": -6.145968437194824, "global_step": 90183, "epoch": 2147} {"train_loss": -6.182534217834473, "global_step": 90184, "epoch": 2147} {"train_loss": -6.283244609832764, "global_step": 90185, "epoch": 2147} {"train_loss": -6.174863338470459, "global_step": 90186, "epoch": 2147} {"train_loss": -6.290416717529297, "global_step": 90187, "epoch": 2147} {"train_loss": -6.335561275482178, "global_step": 90188, "epoch": 2147} {"train_loss": -6.237380027770996, "global_step": 90189, "epoch": 2147} {"train_loss": -6.160252571105957, "global_step": 90190, "epoch": 2147} {"train_loss": -6.310932636260986, "global_step": 90191, "epoch": 2147} {"train_loss": -6.1594061851501465, "global_step": 90192, "epoch": 2147} {"train_loss": -6.198309421539307, "global_step": 90193, "epoch": 2147} {"train_loss": -6.238602638244629, "global_step": 90194, "epoch": 2147} {"train_loss": -6.312854766845703, "global_step": 90195, "epoch": 2147} {"train_loss": -6.278654098510742, "global_step": 90196, "epoch": 2147} {"train_loss": -6.23878812789917, "global_step": 90197, "epoch": 2147} {"train_loss": -6.126979827880859, "global_step": 90198, "epoch": 2147} {"train_loss": -6.388766288757324, "global_step": 90199, "epoch": 2147} {"train_loss": -6.386826038360596, "global_step": 90200, "epoch": 2147} {"train_loss": -6.366942405700684, "global_step": 90201, "epoch": 2147} {"train_loss": -6.252483367919922, "global_step": 90202, "epoch": 2147} {"train_loss": -6.314886569976807, "global_step": 90203, "epoch": 2147} {"train_loss": -6.318515300750732, "global_step": 90204, "epoch": 2147} {"train_loss": -6.253615379333496, "global_step": 90205, "epoch": 2147} {"train_loss": -6.157476425170898, "global_step": 90206, "epoch": 2147} {"train_loss": -6.2239885330200195, "global_step": 90207, "epoch": 2147} {"train_loss": -6.371364593505859, "global_step": 90208, "epoch": 2147} {"train_loss": -6.2928266525268555, "global_step": 90209, "epoch": 2147} {"train_loss": -6.246823310852051, "global_step": 90210, "epoch": 2147} {"train_loss": -6.233163833618164, "global_step": 90211, "epoch": 2147} {"train_loss": -6.287957191467285, "global_step": 90212, "epoch": 2147} {"train_loss": -6.247224807739258, "global_step": 90213, "epoch": 2147} {"train_loss": -6.340570449829102, "global_step": 90214, "epoch": 2147} {"train_loss": -6.251139720280965, "global_step": 90215, "epoch": 2147, "val_loss": 75510.828125} {"train_loss": -6.337141036987305, "global_step": 90216, "epoch": 2148} {"train_loss": -6.337472438812256, "global_step": 90217, "epoch": 2148} {"train_loss": -6.282438278198242, "global_step": 90218, "epoch": 2148} {"train_loss": -6.3134918212890625, "global_step": 90219, "epoch": 2148} {"train_loss": -6.307655334472656, "global_step": 90220, "epoch": 2148} {"train_loss": -6.294565200805664, "global_step": 90221, "epoch": 2148} {"train_loss": -6.1888957023620605, "global_step": 90222, "epoch": 2148} {"train_loss": -6.176936149597168, "global_step": 90223, "epoch": 2148} {"train_loss": -6.266266345977783, "global_step": 90224, "epoch": 2148} {"train_loss": -6.335411071777344, "global_step": 90225, "epoch": 2148} {"train_loss": -6.320280075073242, "global_step": 90226, "epoch": 2148} {"train_loss": -6.259727954864502, "global_step": 90227, "epoch": 2148} {"train_loss": -6.245779991149902, "global_step": 90228, "epoch": 2148} {"train_loss": -6.217050075531006, "global_step": 90229, "epoch": 2148} {"train_loss": -6.077980041503906, "global_step": 90230, "epoch": 2148} {"train_loss": -6.1508965492248535, "global_step": 90231, "epoch": 2148} {"train_loss": -6.188138961791992, "global_step": 90232, "epoch": 2148} {"train_loss": -6.066526412963867, "global_step": 90233, "epoch": 2148} {"train_loss": -6.2190842628479, "global_step": 90234, "epoch": 2148} {"train_loss": -6.229933261871338, "global_step": 90235, "epoch": 2148} {"train_loss": -6.183712959289551, "global_step": 90236, "epoch": 2148} {"train_loss": -6.197977066040039, "global_step": 90237, "epoch": 2148} {"train_loss": -6.246756553649902, "global_step": 90238, "epoch": 2148} {"train_loss": -6.2116804122924805, "global_step": 90239, "epoch": 2148} {"train_loss": -6.12974739074707, "global_step": 90240, "epoch": 2148} {"train_loss": -6.119402885437012, "global_step": 90241, "epoch": 2148} {"train_loss": -6.1886305809021, "global_step": 90242, "epoch": 2148} {"train_loss": -6.153460502624512, "global_step": 90243, "epoch": 2148} {"train_loss": -6.190255165100098, "global_step": 90244, "epoch": 2148} {"train_loss": -6.131170272827148, "global_step": 90245, "epoch": 2148} {"train_loss": -6.186195373535156, "global_step": 90246, "epoch": 2148} {"train_loss": -6.222404479980469, "global_step": 90247, "epoch": 2148} {"train_loss": -6.283067226409912, "global_step": 90248, "epoch": 2148} {"train_loss": -6.228699207305908, "global_step": 90249, "epoch": 2148} {"train_loss": -6.156233787536621, "global_step": 90250, "epoch": 2148} {"train_loss": -6.222766876220703, "global_step": 90251, "epoch": 2148} {"train_loss": -6.190258979797363, "global_step": 90252, "epoch": 2148} {"train_loss": -6.1773200035095215, "global_step": 90253, "epoch": 2148} {"train_loss": -6.200927734375, "global_step": 90254, "epoch": 2148} {"train_loss": -6.217997074127197, "global_step": 90255, "epoch": 2148} {"train_loss": -6.170266151428223, "global_step": 90256, "epoch": 2148} {"train_loss": -6.214054391497657, "global_step": 90257, "epoch": 2148, "val_loss": 75347.7421875} {"train_loss": -6.181617736816406, "global_step": 90258, "epoch": 2149} {"train_loss": -6.144067764282227, "global_step": 90259, "epoch": 2149} {"train_loss": -6.208135604858398, "global_step": 90260, "epoch": 2149} {"train_loss": -6.25296688079834, "global_step": 90261, "epoch": 2149} {"train_loss": -6.162020683288574, "global_step": 90262, "epoch": 2149} {"train_loss": -6.160005569458008, "global_step": 90263, "epoch": 2149} {"train_loss": -6.177117347717285, "global_step": 90264, "epoch": 2149} {"train_loss": -6.2554473876953125, "global_step": 90265, "epoch": 2149} {"train_loss": -6.191439628601074, "global_step": 90266, "epoch": 2149} {"train_loss": -6.264309883117676, "global_step": 90267, "epoch": 2149} {"train_loss": -6.360214710235596, "global_step": 90268, "epoch": 2149} {"train_loss": -6.229619026184082, "global_step": 90269, "epoch": 2149} {"train_loss": -6.281776428222656, "global_step": 90270, "epoch": 2149} {"train_loss": -6.247151851654053, "global_step": 90271, "epoch": 2149} {"train_loss": -6.1421990394592285, "global_step": 90272, "epoch": 2149} {"train_loss": -6.2327117919921875, "global_step": 90273, "epoch": 2149} {"train_loss": -6.175813674926758, "global_step": 90274, "epoch": 2149} {"train_loss": -6.2624101638793945, "global_step": 90275, "epoch": 2149} {"train_loss": -6.311131477355957, "global_step": 90276, "epoch": 2149} {"train_loss": -6.119540214538574, "global_step": 90277, "epoch": 2149} {"train_loss": -6.374738693237305, "global_step": 90278, "epoch": 2149} {"train_loss": -6.243528366088867, "global_step": 90279, "epoch": 2149} {"train_loss": -6.249391555786133, "global_step": 90280, "epoch": 2149} {"train_loss": -6.3834004402160645, "global_step": 90281, "epoch": 2149} {"train_loss": -6.252869606018066, "global_step": 90282, "epoch": 2149} {"train_loss": -6.206385612487793, "global_step": 90283, "epoch": 2149} {"train_loss": -6.3231048583984375, "global_step": 90284, "epoch": 2149} {"train_loss": -6.185312271118164, "global_step": 90285, "epoch": 2149} {"train_loss": -6.266391754150391, "global_step": 90286, "epoch": 2149} {"train_loss": -6.177697658538818, "global_step": 90287, "epoch": 2149} {"train_loss": -6.126433372497559, "global_step": 90288, "epoch": 2149} {"train_loss": -6.244853973388672, "global_step": 90289, "epoch": 2149} {"train_loss": -6.073159694671631, "global_step": 90290, "epoch": 2149} {"train_loss": -6.2338457107543945, "global_step": 90291, "epoch": 2149} {"train_loss": -6.195049285888672, "global_step": 90292, "epoch": 2149} {"train_loss": -6.248926162719727, "global_step": 90293, "epoch": 2149} {"train_loss": -6.212562561035156, "global_step": 90294, "epoch": 2149} {"train_loss": -6.31326150894165, "global_step": 90295, "epoch": 2149} {"train_loss": -6.272432327270508, "global_step": 90296, "epoch": 2149} {"train_loss": -6.402602672576904, "global_step": 90297, "epoch": 2149} {"train_loss": -6.309453010559082, "global_step": 90298, "epoch": 2149} {"train_loss": -6.236075775963919, "global_step": 90299, "epoch": 2149, "val_loss": 75501.5234375} {"train_loss": -6.332126617431641, "global_step": 90300, "epoch": 2150} {"train_loss": -6.268610000610352, "global_step": 90301, "epoch": 2150} {"train_loss": -6.279910087585449, "global_step": 90302, "epoch": 2150} {"train_loss": -6.1836161613464355, "global_step": 90303, "epoch": 2150} {"train_loss": -6.165162086486816, "global_step": 90304, "epoch": 2150} {"train_loss": -6.156640529632568, "global_step": 90305, "epoch": 2150} {"train_loss": -6.263679504394531, "global_step": 90306, "epoch": 2150} {"train_loss": -6.216446876525879, "global_step": 90307, "epoch": 2150} {"train_loss": -6.240376949310303, "global_step": 90308, "epoch": 2150} {"train_loss": -6.317317485809326, "global_step": 90309, "epoch": 2150} {"train_loss": -6.220569133758545, "global_step": 90310, "epoch": 2150} {"train_loss": -6.2585296630859375, "global_step": 90311, "epoch": 2150} {"train_loss": -6.322066307067871, "global_step": 90312, "epoch": 2150} {"train_loss": -6.261963844299316, "global_step": 90313, "epoch": 2150} {"train_loss": -6.13553524017334, "global_step": 90314, "epoch": 2150} {"train_loss": -6.113027095794678, "global_step": 90315, "epoch": 2150} {"train_loss": -6.113254547119141, "global_step": 90316, "epoch": 2150} {"train_loss": -6.192488670349121, "global_step": 90317, "epoch": 2150} {"train_loss": -6.37558126449585, "global_step": 90318, "epoch": 2150} {"train_loss": -6.125177383422852, "global_step": 90319, "epoch": 2150} {"train_loss": -6.305401802062988, "global_step": 90320, "epoch": 2150} {"train_loss": -6.2903289794921875, "global_step": 90321, "epoch": 2150} {"train_loss": -6.247123718261719, "global_step": 90322, "epoch": 2150} {"train_loss": -6.150599479675293, "global_step": 90323, "epoch": 2150} {"train_loss": -6.186186790466309, "global_step": 90324, "epoch": 2150} {"train_loss": -6.2714362144470215, "global_step": 90325, "epoch": 2150} {"train_loss": -6.199775695800781, "global_step": 90326, "epoch": 2150} {"train_loss": -6.171041965484619, "global_step": 90327, "epoch": 2150} {"train_loss": -6.308041572570801, "global_step": 90328, "epoch": 2150} {"train_loss": -6.215812683105469, "global_step": 90329, "epoch": 2150} {"train_loss": -6.182762145996094, "global_step": 90330, "epoch": 2150} {"train_loss": -6.072315216064453, "global_step": 90331, "epoch": 2150} {"train_loss": -6.2135539054870605, "global_step": 90332, "epoch": 2150} {"train_loss": -6.239436626434326, "global_step": 90333, "epoch": 2150} {"train_loss": -6.200224876403809, "global_step": 90334, "epoch": 2150} {"train_loss": -6.343849182128906, "global_step": 90335, "epoch": 2150} {"train_loss": -6.198611259460449, "global_step": 90336, "epoch": 2150} {"train_loss": -6.1762895584106445, "global_step": 90337, "epoch": 2150} {"train_loss": -6.268697261810303, "global_step": 90338, "epoch": 2150} {"train_loss": -6.268276214599609, "global_step": 90339, "epoch": 2150} {"train_loss": -6.136270523071289, "global_step": 90340, "epoch": 2150} {"train_loss": -6.2232794761657715, "global_step": 90341, "epoch": 2150, "train/sim_max_reward_0": 0.9519551389392485, "train/sim_max_reward_1": 0.2535966296921336, "train/sim_max_reward_2": 0.3304183890941186, "train/sim_max_reward_3": 0.13344365801102212, "train/sim_max_reward_4": 0.8997235640454689, "train/sim_max_reward_5": 0.9911188939497274, "test/sim_max_reward_4500000": 0.3429771368440797, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.491737460840886, "test/sim_max_reward_4500003": 0.45121476362810464, "test/sim_max_reward_4500004": 0.9162142468815456, "test/sim_max_reward_4500005": 0.15143552314323233, "test/sim_max_reward_4500006": 0.9370710758968079, "test/sim_max_reward_4500007": 0.9467511333415183, "test/sim_max_reward_4500008": 0.848433008185379, "test/sim_max_reward_4500009": 0.05351037025338449, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 0.8280701908680808, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.15483997160136176, "test/sim_max_reward_4500016": 0.5507631720545619, "test/sim_max_reward_4500017": 0.08918330249815111, "test/sim_max_reward_4500018": 0.38504243343730993, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.9271296769678822, "test/sim_max_reward_4500023": 0.9173886834216978, "test/sim_max_reward_4500024": 0.7647747311646808, "test/sim_max_reward_4500025": 0.5094966340755197, "test/sim_max_reward_4500026": 0.9770311842797501, "test/sim_max_reward_4500027": 0.9403030557187111, "test/sim_max_reward_4500028": 0.19089954956358196, "test/sim_max_reward_4500029": 0.11297178454048235, "test/sim_max_reward_4500030": 0.30494278312951933, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.08499882852362987, "test/sim_max_reward_4500033": 0.831454903892124, "test/sim_max_reward_4500034": 0.6549928208612167, "test/sim_max_reward_4500035": 0.606675035782118, "test/sim_max_reward_4500036": 0.7866518086670148, "test/sim_max_reward_4500037": 0.6870094923390739, "test/sim_max_reward_4500038": 0.2888243502622983, "test/sim_max_reward_4500039": 0.9851803459108913, "test/sim_max_reward_4500040": 0.9069554935168385, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.15603901020222563, "test/sim_max_reward_4500044": 0.37936902393406097, "test/sim_max_reward_4500045": 0.16284261214676857, "test/sim_max_reward_4500046": 0.8630252758033297, "test/sim_max_reward_4500047": 0.9370876970298625, "test/sim_max_reward_4500048": 0.9304988497246895, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5933760456219531, "test/mean_score": 0.5415245413888492, "val_loss": 75252.171875} {"train_loss": -6.230390548706055, "global_step": 90342, "epoch": 2151} {"train_loss": -6.263184547424316, "global_step": 90343, "epoch": 2151} {"train_loss": -6.2202677726745605, "global_step": 90344, "epoch": 2151} {"train_loss": -6.1211442947387695, "global_step": 90345, "epoch": 2151} {"train_loss": -6.21867561340332, "global_step": 90346, "epoch": 2151} {"train_loss": -6.22902774810791, "global_step": 90347, "epoch": 2151} {"train_loss": -6.280963897705078, "global_step": 90348, "epoch": 2151} {"train_loss": -6.2104692459106445, "global_step": 90349, "epoch": 2151} {"train_loss": -6.294271945953369, "global_step": 90350, "epoch": 2151} {"train_loss": -6.3340654373168945, "global_step": 90351, "epoch": 2151} {"train_loss": -6.220381736755371, "global_step": 90352, "epoch": 2151} {"train_loss": -6.182765007019043, "global_step": 90353, "epoch": 2151} {"train_loss": -6.355620384216309, "global_step": 90354, "epoch": 2151} {"train_loss": -6.130486011505127, "global_step": 90355, "epoch": 2151} {"train_loss": -6.1194868087768555, "global_step": 90356, "epoch": 2151} {"train_loss": -6.124387264251709, "global_step": 90357, "epoch": 2151} {"train_loss": -6.1979522705078125, "global_step": 90358, "epoch": 2151} {"train_loss": -6.174688339233398, "global_step": 90359, "epoch": 2151} {"train_loss": -6.201393127441406, "global_step": 90360, "epoch": 2151} {"train_loss": -6.10728645324707, "global_step": 90361, "epoch": 2151} {"train_loss": -6.095198631286621, "global_step": 90362, "epoch": 2151} {"train_loss": -6.310491561889648, "global_step": 90363, "epoch": 2151} {"train_loss": -6.086009502410889, "global_step": 90364, "epoch": 2151} {"train_loss": -6.162711143493652, "global_step": 90365, "epoch": 2151} {"train_loss": -6.147337913513184, "global_step": 90366, "epoch": 2151} {"train_loss": -6.097177505493164, "global_step": 90367, "epoch": 2151} {"train_loss": -6.238368034362793, "global_step": 90368, "epoch": 2151} {"train_loss": -6.338397026062012, "global_step": 90369, "epoch": 2151} {"train_loss": -6.189282417297363, "global_step": 90370, "epoch": 2151} {"train_loss": -6.141446590423584, "global_step": 90371, "epoch": 2151} {"train_loss": -6.360259056091309, "global_step": 90372, "epoch": 2151} {"train_loss": -6.237237930297852, "global_step": 90373, "epoch": 2151} {"train_loss": -6.317390441894531, "global_step": 90374, "epoch": 2151} {"train_loss": -6.3577070236206055, "global_step": 90375, "epoch": 2151} {"train_loss": -6.251501083374023, "global_step": 90376, "epoch": 2151} {"train_loss": -6.303903579711914, "global_step": 90377, "epoch": 2151} {"train_loss": -6.3608293533325195, "global_step": 90378, "epoch": 2151} {"train_loss": -6.220821380615234, "global_step": 90379, "epoch": 2151} {"train_loss": -6.339092254638672, "global_step": 90380, "epoch": 2151} {"train_loss": -6.217262268066406, "global_step": 90381, "epoch": 2151} {"train_loss": -6.185139179229736, "global_step": 90382, "epoch": 2151} {"train_loss": -6.224325032461257, "global_step": 90383, "epoch": 2151, "val_loss": 75420.21875} {"train_loss": -6.20658016204834, "global_step": 90384, "epoch": 2152} {"train_loss": -6.228887557983398, "global_step": 90385, "epoch": 2152} {"train_loss": -6.208898067474365, "global_step": 90386, "epoch": 2152} {"train_loss": -6.287049293518066, "global_step": 90387, "epoch": 2152} {"train_loss": -6.263556003570557, "global_step": 90388, "epoch": 2152} {"train_loss": -6.276298522949219, "global_step": 90389, "epoch": 2152} {"train_loss": -6.2008056640625, "global_step": 90390, "epoch": 2152} {"train_loss": -6.321935176849365, "global_step": 90391, "epoch": 2152} {"train_loss": -6.242509841918945, "global_step": 90392, "epoch": 2152} {"train_loss": -6.312684535980225, "global_step": 90393, "epoch": 2152} {"train_loss": -6.249904632568359, "global_step": 90394, "epoch": 2152} {"train_loss": -6.229702949523926, "global_step": 90395, "epoch": 2152} {"train_loss": -6.333681106567383, "global_step": 90396, "epoch": 2152} {"train_loss": -6.4014739990234375, "global_step": 90397, "epoch": 2152} {"train_loss": -6.292704105377197, "global_step": 90398, "epoch": 2152} {"train_loss": -6.341007232666016, "global_step": 90399, "epoch": 2152} {"train_loss": -6.2354631423950195, "global_step": 90400, "epoch": 2152} {"train_loss": -6.283792495727539, "global_step": 90401, "epoch": 2152} {"train_loss": -6.303347587585449, "global_step": 90402, "epoch": 2152} {"train_loss": -6.301231384277344, "global_step": 90403, "epoch": 2152} {"train_loss": -6.310731887817383, "global_step": 90404, "epoch": 2152} {"train_loss": -6.2229509353637695, "global_step": 90405, "epoch": 2152} {"train_loss": -6.206930160522461, "global_step": 90406, "epoch": 2152} {"train_loss": -6.231340408325195, "global_step": 90407, "epoch": 2152} {"train_loss": -6.227365016937256, "global_step": 90408, "epoch": 2152} {"train_loss": -6.1663031578063965, "global_step": 90409, "epoch": 2152} {"train_loss": -6.2544050216674805, "global_step": 90410, "epoch": 2152} {"train_loss": -6.202417850494385, "global_step": 90411, "epoch": 2152} {"train_loss": -6.079638481140137, "global_step": 90412, "epoch": 2152} {"train_loss": -6.223968029022217, "global_step": 90413, "epoch": 2152} {"train_loss": -6.164332389831543, "global_step": 90414, "epoch": 2152} {"train_loss": -6.16197395324707, "global_step": 90415, "epoch": 2152} {"train_loss": -6.1850266456604, "global_step": 90416, "epoch": 2152} {"train_loss": -6.316391944885254, "global_step": 90417, "epoch": 2152} {"train_loss": -6.252254486083984, "global_step": 90418, "epoch": 2152} {"train_loss": -6.218411922454834, "global_step": 90419, "epoch": 2152} {"train_loss": -6.209156513214111, "global_step": 90420, "epoch": 2152} {"train_loss": -6.247615814208984, "global_step": 90421, "epoch": 2152} {"train_loss": -6.213953971862793, "global_step": 90422, "epoch": 2152} {"train_loss": -6.128931045532227, "global_step": 90423, "epoch": 2152} {"train_loss": -6.103292942047119, "global_step": 90424, "epoch": 2152} {"train_loss": -6.2437354155949185, "global_step": 90425, "epoch": 2152, "val_loss": 75520.34375} {"train_loss": -6.033592224121094, "global_step": 90426, "epoch": 2153} {"train_loss": -6.199082374572754, "global_step": 90427, "epoch": 2153} {"train_loss": -6.203665733337402, "global_step": 90428, "epoch": 2153} {"train_loss": -6.1654863357543945, "global_step": 90429, "epoch": 2153} {"train_loss": -6.300721168518066, "global_step": 90430, "epoch": 2153} {"train_loss": -6.265734672546387, "global_step": 90431, "epoch": 2153} {"train_loss": -6.335393905639648, "global_step": 90432, "epoch": 2153} {"train_loss": -6.307384014129639, "global_step": 90433, "epoch": 2153} {"train_loss": -6.297693252563477, "global_step": 90434, "epoch": 2153} {"train_loss": -6.250795841217041, "global_step": 90435, "epoch": 2153} {"train_loss": -6.180042266845703, "global_step": 90436, "epoch": 2153} {"train_loss": -6.19704532623291, "global_step": 90437, "epoch": 2153} {"train_loss": -6.197959899902344, "global_step": 90438, "epoch": 2153} {"train_loss": -6.261219501495361, "global_step": 90439, "epoch": 2153} {"train_loss": -6.280172348022461, "global_step": 90440, "epoch": 2153} {"train_loss": -6.117822170257568, "global_step": 90441, "epoch": 2153} {"train_loss": -6.215378761291504, "global_step": 90442, "epoch": 2153} {"train_loss": -6.240111827850342, "global_step": 90443, "epoch": 2153} {"train_loss": -6.141515731811523, "global_step": 90444, "epoch": 2153} {"train_loss": -6.141847133636475, "global_step": 90445, "epoch": 2153} {"train_loss": -6.2029829025268555, "global_step": 90446, "epoch": 2153} {"train_loss": -6.247772216796875, "global_step": 90447, "epoch": 2153} {"train_loss": -6.237756729125977, "global_step": 90448, "epoch": 2153} {"train_loss": -6.194314956665039, "global_step": 90449, "epoch": 2153} {"train_loss": -6.174933433532715, "global_step": 90450, "epoch": 2153} {"train_loss": -6.237028121948242, "global_step": 90451, "epoch": 2153} {"train_loss": -6.251443862915039, "global_step": 90452, "epoch": 2153} {"train_loss": -6.187198638916016, "global_step": 90453, "epoch": 2153} {"train_loss": -6.212454319000244, "global_step": 90454, "epoch": 2153} {"train_loss": -6.135546684265137, "global_step": 90455, "epoch": 2153} {"train_loss": -6.127728462219238, "global_step": 90456, "epoch": 2153} {"train_loss": -6.278201103210449, "global_step": 90457, "epoch": 2153} {"train_loss": -5.969548225402832, "global_step": 90458, "epoch": 2153} {"train_loss": -6.11436653137207, "global_step": 90459, "epoch": 2153} {"train_loss": -6.311924934387207, "global_step": 90460, "epoch": 2153} {"train_loss": -6.151330947875977, "global_step": 90461, "epoch": 2153} {"train_loss": -6.179240703582764, "global_step": 90462, "epoch": 2153} {"train_loss": -6.016067981719971, "global_step": 90463, "epoch": 2153} {"train_loss": -6.2807512283325195, "global_step": 90464, "epoch": 2153} {"train_loss": -6.222202301025391, "global_step": 90465, "epoch": 2153} {"train_loss": -6.340002059936523, "global_step": 90466, "epoch": 2153} {"train_loss": -6.204006058829171, "global_step": 90467, "epoch": 2153, "val_loss": 75446.1875} {"train_loss": -6.229542255401611, "global_step": 90468, "epoch": 2154} {"train_loss": -6.154603958129883, "global_step": 90469, "epoch": 2154} {"train_loss": -6.262020111083984, "global_step": 90470, "epoch": 2154} {"train_loss": -6.265141487121582, "global_step": 90471, "epoch": 2154} {"train_loss": -6.282073020935059, "global_step": 90472, "epoch": 2154} {"train_loss": -6.341890811920166, "global_step": 90473, "epoch": 2154} {"train_loss": -6.2868804931640625, "global_step": 90474, "epoch": 2154} {"train_loss": -6.25068473815918, "global_step": 90475, "epoch": 2154} {"train_loss": -6.198934555053711, "global_step": 90476, "epoch": 2154} {"train_loss": -6.236349105834961, "global_step": 90477, "epoch": 2154} {"train_loss": -6.3804731369018555, "global_step": 90478, "epoch": 2154} {"train_loss": -6.223015308380127, "global_step": 90479, "epoch": 2154} {"train_loss": -6.355856418609619, "global_step": 90480, "epoch": 2154} {"train_loss": -6.305769920349121, "global_step": 90481, "epoch": 2154} {"train_loss": -6.216066837310791, "global_step": 90482, "epoch": 2154} {"train_loss": -6.285769462585449, "global_step": 90483, "epoch": 2154} {"train_loss": -6.3046722412109375, "global_step": 90484, "epoch": 2154} {"train_loss": -6.181175708770752, "global_step": 90485, "epoch": 2154} {"train_loss": -6.233226776123047, "global_step": 90486, "epoch": 2154} {"train_loss": -6.23818302154541, "global_step": 90487, "epoch": 2154} {"train_loss": -6.287436485290527, "global_step": 90488, "epoch": 2154} {"train_loss": -6.205455780029297, "global_step": 90489, "epoch": 2154} {"train_loss": -6.340984344482422, "global_step": 90490, "epoch": 2154} {"train_loss": -6.225512504577637, "global_step": 90491, "epoch": 2154} {"train_loss": -6.175189971923828, "global_step": 90492, "epoch": 2154} {"train_loss": -6.319437503814697, "global_step": 90493, "epoch": 2154} {"train_loss": -6.241004467010498, "global_step": 90494, "epoch": 2154} {"train_loss": -6.219440460205078, "global_step": 90495, "epoch": 2154} {"train_loss": -6.172120571136475, "global_step": 90496, "epoch": 2154} {"train_loss": -6.275813579559326, "global_step": 90497, "epoch": 2154} {"train_loss": -6.24748420715332, "global_step": 90498, "epoch": 2154} {"train_loss": -6.146770477294922, "global_step": 90499, "epoch": 2154} {"train_loss": -6.274301528930664, "global_step": 90500, "epoch": 2154} {"train_loss": -6.146167755126953, "global_step": 90501, "epoch": 2154} {"train_loss": -6.255853652954102, "global_step": 90502, "epoch": 2154} {"train_loss": -6.249702453613281, "global_step": 90503, "epoch": 2154} {"train_loss": -6.1479387283325195, "global_step": 90504, "epoch": 2154} {"train_loss": -6.274914741516113, "global_step": 90505, "epoch": 2154} {"train_loss": -6.167688846588135, "global_step": 90506, "epoch": 2154} {"train_loss": -6.229318618774414, "global_step": 90507, "epoch": 2154} {"train_loss": -6.306179046630859, "global_step": 90508, "epoch": 2154} {"train_loss": -6.247534116109212, "global_step": 90509, "epoch": 2154, "val_loss": 75538.734375} {"train_loss": -6.347817420959473, "global_step": 90510, "epoch": 2155} {"train_loss": -6.224210739135742, "global_step": 90511, "epoch": 2155} {"train_loss": -6.321455955505371, "global_step": 90512, "epoch": 2155} {"train_loss": -6.3037309646606445, "global_step": 90513, "epoch": 2155} {"train_loss": -6.211366176605225, "global_step": 90514, "epoch": 2155} {"train_loss": -6.2689313888549805, "global_step": 90515, "epoch": 2155} {"train_loss": -6.300147533416748, "global_step": 90516, "epoch": 2155} {"train_loss": -6.206584930419922, "global_step": 90517, "epoch": 2155} {"train_loss": -6.201292037963867, "global_step": 90518, "epoch": 2155} {"train_loss": -6.32102108001709, "global_step": 90519, "epoch": 2155} {"train_loss": -6.226181983947754, "global_step": 90520, "epoch": 2155} {"train_loss": -6.285759925842285, "global_step": 90521, "epoch": 2155} {"train_loss": -6.290304660797119, "global_step": 90522, "epoch": 2155} {"train_loss": -6.231890678405762, "global_step": 90523, "epoch": 2155} {"train_loss": -6.338463306427002, "global_step": 90524, "epoch": 2155} {"train_loss": -6.245931625366211, "global_step": 90525, "epoch": 2155} {"train_loss": -6.164831638336182, "global_step": 90526, "epoch": 2155} {"train_loss": -6.209774971008301, "global_step": 90527, "epoch": 2155} {"train_loss": -6.236602783203125, "global_step": 90528, "epoch": 2155} {"train_loss": -6.244114398956299, "global_step": 90529, "epoch": 2155} {"train_loss": -6.289802551269531, "global_step": 90530, "epoch": 2155} {"train_loss": -6.327747344970703, "global_step": 90531, "epoch": 2155} {"train_loss": -6.237430572509766, "global_step": 90532, "epoch": 2155} {"train_loss": -6.14597749710083, "global_step": 90533, "epoch": 2155} {"train_loss": -6.32075309753418, "global_step": 90534, "epoch": 2155} {"train_loss": -6.259261131286621, "global_step": 90535, "epoch": 2155} {"train_loss": -6.1356401443481445, "global_step": 90536, "epoch": 2155} {"train_loss": -6.198334217071533, "global_step": 90537, "epoch": 2155} {"train_loss": -6.342353820800781, "global_step": 90538, "epoch": 2155} {"train_loss": -6.235419750213623, "global_step": 90539, "epoch": 2155} {"train_loss": -6.15512228012085, "global_step": 90540, "epoch": 2155} {"train_loss": -6.305696487426758, "global_step": 90541, "epoch": 2155} {"train_loss": -6.148677825927734, "global_step": 90542, "epoch": 2155} {"train_loss": -6.265260696411133, "global_step": 90543, "epoch": 2155} {"train_loss": -6.250863075256348, "global_step": 90544, "epoch": 2155} {"train_loss": -6.07828426361084, "global_step": 90545, "epoch": 2155} {"train_loss": -6.244972229003906, "global_step": 90546, "epoch": 2155} {"train_loss": -6.255213737487793, "global_step": 90547, "epoch": 2155} {"train_loss": -6.220221519470215, "global_step": 90548, "epoch": 2155} {"train_loss": -6.178650856018066, "global_step": 90549, "epoch": 2155} {"train_loss": -6.2626190185546875, "global_step": 90550, "epoch": 2155} {"train_loss": -6.242657320840018, "global_step": 90551, "epoch": 2155, "val_loss": 75345.828125} {"train_loss": -6.252066135406494, "global_step": 90552, "epoch": 2156} {"train_loss": -6.200420379638672, "global_step": 90553, "epoch": 2156} {"train_loss": -6.291736125946045, "global_step": 90554, "epoch": 2156} {"train_loss": -6.223957061767578, "global_step": 90555, "epoch": 2156} {"train_loss": -6.317775726318359, "global_step": 90556, "epoch": 2156} {"train_loss": -6.295351028442383, "global_step": 90557, "epoch": 2156} {"train_loss": -6.205061912536621, "global_step": 90558, "epoch": 2156} {"train_loss": -6.214845657348633, "global_step": 90559, "epoch": 2156} {"train_loss": -6.284579753875732, "global_step": 90560, "epoch": 2156} {"train_loss": -6.274600982666016, "global_step": 90561, "epoch": 2156} {"train_loss": -6.21480655670166, "global_step": 90562, "epoch": 2156} {"train_loss": -6.244715690612793, "global_step": 90563, "epoch": 2156} {"train_loss": -6.157084941864014, "global_step": 90564, "epoch": 2156} {"train_loss": -6.147737979888916, "global_step": 90565, "epoch": 2156} {"train_loss": -6.288613796234131, "global_step": 90566, "epoch": 2156} {"train_loss": -6.123344421386719, "global_step": 90567, "epoch": 2156} {"train_loss": -6.39743709564209, "global_step": 90568, "epoch": 2156} {"train_loss": -6.331635475158691, "global_step": 90569, "epoch": 2156} {"train_loss": -6.283520698547363, "global_step": 90570, "epoch": 2156} {"train_loss": -6.259349822998047, "global_step": 90571, "epoch": 2156} {"train_loss": -6.264596939086914, "global_step": 90572, "epoch": 2156} {"train_loss": -6.134329795837402, "global_step": 90573, "epoch": 2156} {"train_loss": -6.298370361328125, "global_step": 90574, "epoch": 2156} {"train_loss": -6.162905693054199, "global_step": 90575, "epoch": 2156} {"train_loss": -6.2746710777282715, "global_step": 90576, "epoch": 2156} {"train_loss": -6.260280132293701, "global_step": 90577, "epoch": 2156} {"train_loss": -6.146737098693848, "global_step": 90578, "epoch": 2156} {"train_loss": -6.374521255493164, "global_step": 90579, "epoch": 2156} {"train_loss": -6.241092681884766, "global_step": 90580, "epoch": 2156} {"train_loss": -6.107473373413086, "global_step": 90581, "epoch": 2156} {"train_loss": -6.429988861083984, "global_step": 90582, "epoch": 2156} {"train_loss": -6.135831832885742, "global_step": 90583, "epoch": 2156} {"train_loss": -6.305418014526367, "global_step": 90584, "epoch": 2156} {"train_loss": -6.2236328125, "global_step": 90585, "epoch": 2156} {"train_loss": -6.149471282958984, "global_step": 90586, "epoch": 2156} {"train_loss": -6.183993339538574, "global_step": 90587, "epoch": 2156} {"train_loss": -6.293086051940918, "global_step": 90588, "epoch": 2156} {"train_loss": -6.313055515289307, "global_step": 90589, "epoch": 2156} {"train_loss": -6.279740333557129, "global_step": 90590, "epoch": 2156} {"train_loss": -6.333548545837402, "global_step": 90591, "epoch": 2156} {"train_loss": -6.30683708190918, "global_step": 90592, "epoch": 2156} {"train_loss": -6.250570592426119, "global_step": 90593, "epoch": 2156, "val_loss": 75613.6796875} {"train_loss": -6.131893157958984, "global_step": 90594, "epoch": 2157} {"train_loss": -6.278280258178711, "global_step": 90595, "epoch": 2157} {"train_loss": -6.295287132263184, "global_step": 90596, "epoch": 2157} {"train_loss": -6.225573539733887, "global_step": 90597, "epoch": 2157} {"train_loss": -6.349043846130371, "global_step": 90598, "epoch": 2157} {"train_loss": -6.348575592041016, "global_step": 90599, "epoch": 2157} {"train_loss": -6.283487319946289, "global_step": 90600, "epoch": 2157} {"train_loss": -6.312002658843994, "global_step": 90601, "epoch": 2157} {"train_loss": -6.286863327026367, "global_step": 90602, "epoch": 2157} {"train_loss": -6.3016252517700195, "global_step": 90603, "epoch": 2157} {"train_loss": -6.2371320724487305, "global_step": 90604, "epoch": 2157} {"train_loss": -6.2517008781433105, "global_step": 90605, "epoch": 2157} {"train_loss": -6.283815383911133, "global_step": 90606, "epoch": 2157} {"train_loss": -6.259860038757324, "global_step": 90607, "epoch": 2157} {"train_loss": -6.331676483154297, "global_step": 90608, "epoch": 2157} {"train_loss": -6.161969184875488, "global_step": 90609, "epoch": 2157} {"train_loss": -6.250317096710205, "global_step": 90610, "epoch": 2157} {"train_loss": -6.325444221496582, "global_step": 90611, "epoch": 2157} {"train_loss": -6.248813629150391, "global_step": 90612, "epoch": 2157} {"train_loss": -6.2386627197265625, "global_step": 90613, "epoch": 2157} {"train_loss": -6.219642162322998, "global_step": 90614, "epoch": 2157} {"train_loss": -6.229021072387695, "global_step": 90615, "epoch": 2157} {"train_loss": -6.3137407302856445, "global_step": 90616, "epoch": 2157} {"train_loss": -6.292355537414551, "global_step": 90617, "epoch": 2157} {"train_loss": -6.200595855712891, "global_step": 90618, "epoch": 2157} {"train_loss": -6.283438682556152, "global_step": 90619, "epoch": 2157} {"train_loss": -6.232489585876465, "global_step": 90620, "epoch": 2157} {"train_loss": -6.206487655639648, "global_step": 90621, "epoch": 2157} {"train_loss": -6.276840686798096, "global_step": 90622, "epoch": 2157} {"train_loss": -6.323758125305176, "global_step": 90623, "epoch": 2157} {"train_loss": -6.239871978759766, "global_step": 90624, "epoch": 2157} {"train_loss": -6.290234565734863, "global_step": 90625, "epoch": 2157} {"train_loss": -6.215576171875, "global_step": 90626, "epoch": 2157} {"train_loss": -6.430595397949219, "global_step": 90627, "epoch": 2157} {"train_loss": -6.295650482177734, "global_step": 90628, "epoch": 2157} {"train_loss": -6.268406867980957, "global_step": 90629, "epoch": 2157} {"train_loss": -6.239362716674805, "global_step": 90630, "epoch": 2157} {"train_loss": -6.2799506187438965, "global_step": 90631, "epoch": 2157} {"train_loss": -6.23964786529541, "global_step": 90632, "epoch": 2157} {"train_loss": -6.420137882232666, "global_step": 90633, "epoch": 2157} {"train_loss": -6.2252326011657715, "global_step": 90634, "epoch": 2157} {"train_loss": -6.270351273672921, "global_step": 90635, "epoch": 2157, "val_loss": 75261.671875} {"train_loss": -6.213303565979004, "global_step": 90636, "epoch": 2158} {"train_loss": -6.300431251525879, "global_step": 90637, "epoch": 2158} {"train_loss": -6.324542045593262, "global_step": 90638, "epoch": 2158} {"train_loss": -6.243121147155762, "global_step": 90639, "epoch": 2158} {"train_loss": -6.3520379066467285, "global_step": 90640, "epoch": 2158} {"train_loss": -6.273371696472168, "global_step": 90641, "epoch": 2158} {"train_loss": -6.367362022399902, "global_step": 90642, "epoch": 2158} {"train_loss": -6.2043256759643555, "global_step": 90643, "epoch": 2158} {"train_loss": -6.276106834411621, "global_step": 90644, "epoch": 2158} {"train_loss": -6.197668552398682, "global_step": 90645, "epoch": 2158} {"train_loss": -6.364099502563477, "global_step": 90646, "epoch": 2158} {"train_loss": -6.296205997467041, "global_step": 90647, "epoch": 2158} {"train_loss": -6.22360372543335, "global_step": 90648, "epoch": 2158} {"train_loss": -6.249658584594727, "global_step": 90649, "epoch": 2158} {"train_loss": -6.310784339904785, "global_step": 90650, "epoch": 2158} {"train_loss": -6.334510326385498, "global_step": 90651, "epoch": 2158} {"train_loss": -6.312706470489502, "global_step": 90652, "epoch": 2158} {"train_loss": -6.266185760498047, "global_step": 90653, "epoch": 2158} {"train_loss": -6.226117134094238, "global_step": 90654, "epoch": 2158} {"train_loss": -6.256111145019531, "global_step": 90655, "epoch": 2158} {"train_loss": -6.292853355407715, "global_step": 90656, "epoch": 2158} {"train_loss": -6.325111389160156, "global_step": 90657, "epoch": 2158} {"train_loss": -6.3289361000061035, "global_step": 90658, "epoch": 2158} {"train_loss": -6.238387107849121, "global_step": 90659, "epoch": 2158} {"train_loss": -6.22266960144043, "global_step": 90660, "epoch": 2158} {"train_loss": -6.345369338989258, "global_step": 90661, "epoch": 2158} {"train_loss": -6.307244300842285, "global_step": 90662, "epoch": 2158} {"train_loss": -6.155697822570801, "global_step": 90663, "epoch": 2158} {"train_loss": -6.182024955749512, "global_step": 90664, "epoch": 2158} {"train_loss": -6.2433295249938965, "global_step": 90665, "epoch": 2158} {"train_loss": -6.211904525756836, "global_step": 90666, "epoch": 2158} {"train_loss": -6.180515766143799, "global_step": 90667, "epoch": 2158} {"train_loss": -6.123958587646484, "global_step": 90668, "epoch": 2158} {"train_loss": -6.221920490264893, "global_step": 90669, "epoch": 2158} {"train_loss": -6.282303333282471, "global_step": 90670, "epoch": 2158} {"train_loss": -6.172242164611816, "global_step": 90671, "epoch": 2158} {"train_loss": -6.269255638122559, "global_step": 90672, "epoch": 2158} {"train_loss": -6.379499435424805, "global_step": 90673, "epoch": 2158} {"train_loss": -6.201366901397705, "global_step": 90674, "epoch": 2158} {"train_loss": -6.283205032348633, "global_step": 90675, "epoch": 2158} {"train_loss": -6.165058135986328, "global_step": 90676, "epoch": 2158} {"train_loss": -6.259375322432745, "global_step": 90677, "epoch": 2158, "val_loss": 75559.4140625} {"train_loss": -6.2853851318359375, "global_step": 90678, "epoch": 2159} {"train_loss": -6.24307918548584, "global_step": 90679, "epoch": 2159} {"train_loss": -6.270441055297852, "global_step": 90680, "epoch": 2159} {"train_loss": -6.167877197265625, "global_step": 90681, "epoch": 2159} {"train_loss": -6.279809951782227, "global_step": 90682, "epoch": 2159} {"train_loss": -6.278980255126953, "global_step": 90683, "epoch": 2159} {"train_loss": -6.360409736633301, "global_step": 90684, "epoch": 2159} {"train_loss": -6.410145282745361, "global_step": 90685, "epoch": 2159} {"train_loss": -6.240856170654297, "global_step": 90686, "epoch": 2159} {"train_loss": -6.220686435699463, "global_step": 90687, "epoch": 2159} {"train_loss": -6.166237831115723, "global_step": 90688, "epoch": 2159} {"train_loss": -6.3845014572143555, "global_step": 90689, "epoch": 2159} {"train_loss": -6.142823219299316, "global_step": 90690, "epoch": 2159} {"train_loss": -6.274460315704346, "global_step": 90691, "epoch": 2159} {"train_loss": -6.22690486907959, "global_step": 90692, "epoch": 2159} {"train_loss": -6.342792987823486, "global_step": 90693, "epoch": 2159} {"train_loss": -6.234963417053223, "global_step": 90694, "epoch": 2159} {"train_loss": -6.253996849060059, "global_step": 90695, "epoch": 2159} {"train_loss": -6.187089443206787, "global_step": 90696, "epoch": 2159} {"train_loss": -6.225571632385254, "global_step": 90697, "epoch": 2159} {"train_loss": -6.403697967529297, "global_step": 90698, "epoch": 2159} {"train_loss": -6.26011848449707, "global_step": 90699, "epoch": 2159} {"train_loss": -6.332764625549316, "global_step": 90700, "epoch": 2159} {"train_loss": -6.187708854675293, "global_step": 90701, "epoch": 2159} {"train_loss": -6.235204696655273, "global_step": 90702, "epoch": 2159} {"train_loss": -6.287149429321289, "global_step": 90703, "epoch": 2159} {"train_loss": -6.297507286071777, "global_step": 90704, "epoch": 2159} {"train_loss": -6.301146984100342, "global_step": 90705, "epoch": 2159} {"train_loss": -6.3654327392578125, "global_step": 90706, "epoch": 2159} {"train_loss": -6.129998207092285, "global_step": 90707, "epoch": 2159} {"train_loss": -6.166177272796631, "global_step": 90708, "epoch": 2159} {"train_loss": -6.217008590698242, "global_step": 90709, "epoch": 2159} {"train_loss": -6.083930015563965, "global_step": 90710, "epoch": 2159} {"train_loss": -6.326106071472168, "global_step": 90711, "epoch": 2159} {"train_loss": -6.186014175415039, "global_step": 90712, "epoch": 2159} {"train_loss": -6.081754684448242, "global_step": 90713, "epoch": 2159} {"train_loss": -6.269850730895996, "global_step": 90714, "epoch": 2159} {"train_loss": -6.18904447555542, "global_step": 90715, "epoch": 2159} {"train_loss": -6.226351737976074, "global_step": 90716, "epoch": 2159} {"train_loss": -6.110056400299072, "global_step": 90717, "epoch": 2159} {"train_loss": -6.263094902038574, "global_step": 90718, "epoch": 2159} {"train_loss": -6.244481109437489, "global_step": 90719, "epoch": 2159, "val_loss": 75480.4140625} {"train_loss": -6.321925163269043, "global_step": 90720, "epoch": 2160} {"train_loss": -6.187458038330078, "global_step": 90721, "epoch": 2160} {"train_loss": -6.154346942901611, "global_step": 90722, "epoch": 2160} {"train_loss": -6.256843090057373, "global_step": 90723, "epoch": 2160} {"train_loss": -6.304849624633789, "global_step": 90724, "epoch": 2160} {"train_loss": -6.289087295532227, "global_step": 90725, "epoch": 2160} {"train_loss": -6.30773401260376, "global_step": 90726, "epoch": 2160} {"train_loss": -6.0851545333862305, "global_step": 90727, "epoch": 2160} {"train_loss": -6.367640972137451, "global_step": 90728, "epoch": 2160} {"train_loss": -6.282130241394043, "global_step": 90729, "epoch": 2160} {"train_loss": -6.174908638000488, "global_step": 90730, "epoch": 2160} {"train_loss": -6.285134315490723, "global_step": 90731, "epoch": 2160} {"train_loss": -6.068813800811768, "global_step": 90732, "epoch": 2160} {"train_loss": -6.217411041259766, "global_step": 90733, "epoch": 2160} {"train_loss": -6.223169326782227, "global_step": 90734, "epoch": 2160} {"train_loss": -6.2487897872924805, "global_step": 90735, "epoch": 2160} {"train_loss": -6.255115509033203, "global_step": 90736, "epoch": 2160} {"train_loss": -6.340280532836914, "global_step": 90737, "epoch": 2160} {"train_loss": -6.276671409606934, "global_step": 90738, "epoch": 2160} {"train_loss": -6.147130012512207, "global_step": 90739, "epoch": 2160} {"train_loss": -6.249354362487793, "global_step": 90740, "epoch": 2160} {"train_loss": -6.295557022094727, "global_step": 90741, "epoch": 2160} {"train_loss": -6.318869590759277, "global_step": 90742, "epoch": 2160} {"train_loss": -6.319976806640625, "global_step": 90743, "epoch": 2160} {"train_loss": -6.24061393737793, "global_step": 90744, "epoch": 2160} {"train_loss": -6.256525993347168, "global_step": 90745, "epoch": 2160} {"train_loss": -6.360140800476074, "global_step": 90746, "epoch": 2160} {"train_loss": -6.3105573654174805, "global_step": 90747, "epoch": 2160} {"train_loss": -6.190720558166504, "global_step": 90748, "epoch": 2160} {"train_loss": -6.14597749710083, "global_step": 90749, "epoch": 2160} {"train_loss": -6.2426371574401855, "global_step": 90750, "epoch": 2160} {"train_loss": -6.384390830993652, "global_step": 90751, "epoch": 2160} {"train_loss": -6.238697052001953, "global_step": 90752, "epoch": 2160} {"train_loss": -6.216178894042969, "global_step": 90753, "epoch": 2160} {"train_loss": -6.226123332977295, "global_step": 90754, "epoch": 2160} {"train_loss": -6.344520092010498, "global_step": 90755, "epoch": 2160} {"train_loss": -6.240237712860107, "global_step": 90756, "epoch": 2160} {"train_loss": -6.2323899269104, "global_step": 90757, "epoch": 2160} {"train_loss": -6.229189872741699, "global_step": 90758, "epoch": 2160} {"train_loss": -6.13129997253418, "global_step": 90759, "epoch": 2160} {"train_loss": -6.190047740936279, "global_step": 90760, "epoch": 2160} {"train_loss": -6.244705132075718, "global_step": 90761, "epoch": 2160, "val_loss": 75165.59375} {"train_loss": -6.366466999053955, "global_step": 90762, "epoch": 2161} {"train_loss": -6.220477104187012, "global_step": 90763, "epoch": 2161} {"train_loss": -6.2132954597473145, "global_step": 90764, "epoch": 2161} {"train_loss": -6.2706990242004395, "global_step": 90765, "epoch": 2161} {"train_loss": -6.198145389556885, "global_step": 90766, "epoch": 2161} {"train_loss": -6.239556789398193, "global_step": 90767, "epoch": 2161} {"train_loss": -6.249153137207031, "global_step": 90768, "epoch": 2161} {"train_loss": -6.242550849914551, "global_step": 90769, "epoch": 2161} {"train_loss": -6.190729141235352, "global_step": 90770, "epoch": 2161} {"train_loss": -6.256850242614746, "global_step": 90771, "epoch": 2161} {"train_loss": -6.3050618171691895, "global_step": 90772, "epoch": 2161} {"train_loss": -6.279066562652588, "global_step": 90773, "epoch": 2161} {"train_loss": -6.357504367828369, "global_step": 90774, "epoch": 2161} {"train_loss": -6.394439697265625, "global_step": 90775, "epoch": 2161} {"train_loss": -6.198904991149902, "global_step": 90776, "epoch": 2161} {"train_loss": -6.2576375007629395, "global_step": 90777, "epoch": 2161} {"train_loss": -6.1715216636657715, "global_step": 90778, "epoch": 2161} {"train_loss": -6.293929576873779, "global_step": 90779, "epoch": 2161} {"train_loss": -6.2539448738098145, "global_step": 90780, "epoch": 2161} {"train_loss": -6.1275129318237305, "global_step": 90781, "epoch": 2161} {"train_loss": -6.278007507324219, "global_step": 90782, "epoch": 2161} {"train_loss": -6.2811760902404785, "global_step": 90783, "epoch": 2161} {"train_loss": -6.294076919555664, "global_step": 90784, "epoch": 2161} {"train_loss": -6.387073516845703, "global_step": 90785, "epoch": 2161} {"train_loss": -6.168837547302246, "global_step": 90786, "epoch": 2161} {"train_loss": -6.269732475280762, "global_step": 90787, "epoch": 2161} {"train_loss": -6.183967590332031, "global_step": 90788, "epoch": 2161} {"train_loss": -6.227517604827881, "global_step": 90789, "epoch": 2161} {"train_loss": -6.295468330383301, "global_step": 90790, "epoch": 2161} {"train_loss": -6.248552322387695, "global_step": 90791, "epoch": 2161} {"train_loss": -6.4121904373168945, "global_step": 90792, "epoch": 2161} {"train_loss": -6.230863571166992, "global_step": 90793, "epoch": 2161} {"train_loss": -6.337960243225098, "global_step": 90794, "epoch": 2161} {"train_loss": -6.210048675537109, "global_step": 90795, "epoch": 2161} {"train_loss": -6.282868385314941, "global_step": 90796, "epoch": 2161} {"train_loss": -6.345816135406494, "global_step": 90797, "epoch": 2161} {"train_loss": -6.257189750671387, "global_step": 90798, "epoch": 2161} {"train_loss": -6.273077011108398, "global_step": 90799, "epoch": 2161} {"train_loss": -6.183938026428223, "global_step": 90800, "epoch": 2161} {"train_loss": -6.252955436706543, "global_step": 90801, "epoch": 2161} {"train_loss": -6.219809532165527, "global_step": 90802, "epoch": 2161} {"train_loss": -6.261527810777936, "global_step": 90803, "epoch": 2161, "val_loss": 75290.921875} {"train_loss": -6.298293113708496, "global_step": 90804, "epoch": 2162} {"train_loss": -6.279857158660889, "global_step": 90805, "epoch": 2162} {"train_loss": -6.2799458503723145, "global_step": 90806, "epoch": 2162} {"train_loss": -6.240792274475098, "global_step": 90807, "epoch": 2162} {"train_loss": -6.280700206756592, "global_step": 90808, "epoch": 2162} {"train_loss": -6.2551164627075195, "global_step": 90809, "epoch": 2162} {"train_loss": -6.193648815155029, "global_step": 90810, "epoch": 2162} {"train_loss": -6.180957317352295, "global_step": 90811, "epoch": 2162} {"train_loss": -6.193953514099121, "global_step": 90812, "epoch": 2162} {"train_loss": -6.329339981079102, "global_step": 90813, "epoch": 2162} {"train_loss": -6.200194358825684, "global_step": 90814, "epoch": 2162} {"train_loss": -6.2852020263671875, "global_step": 90815, "epoch": 2162} {"train_loss": -6.307161331176758, "global_step": 90816, "epoch": 2162} {"train_loss": -6.153944969177246, "global_step": 90817, "epoch": 2162} {"train_loss": -6.210620880126953, "global_step": 90818, "epoch": 2162} {"train_loss": -6.267299175262451, "global_step": 90819, "epoch": 2162} {"train_loss": -6.367525100708008, "global_step": 90820, "epoch": 2162} {"train_loss": -6.347369194030762, "global_step": 90821, "epoch": 2162} {"train_loss": -6.23070764541626, "global_step": 90822, "epoch": 2162} {"train_loss": -6.377404689788818, "global_step": 90823, "epoch": 2162} {"train_loss": -6.371503829956055, "global_step": 90824, "epoch": 2162} {"train_loss": -6.19194221496582, "global_step": 90825, "epoch": 2162} {"train_loss": -6.281895637512207, "global_step": 90826, "epoch": 2162} {"train_loss": -6.253046035766602, "global_step": 90827, "epoch": 2162} {"train_loss": -6.340569496154785, "global_step": 90828, "epoch": 2162} {"train_loss": -6.300210952758789, "global_step": 90829, "epoch": 2162} {"train_loss": -6.348421096801758, "global_step": 90830, "epoch": 2162} {"train_loss": -6.329494476318359, "global_step": 90831, "epoch": 2162} {"train_loss": -6.2542524337768555, "global_step": 90832, "epoch": 2162} {"train_loss": -6.291288375854492, "global_step": 90833, "epoch": 2162} {"train_loss": -6.3406171798706055, "global_step": 90834, "epoch": 2162} {"train_loss": -6.326524257659912, "global_step": 90835, "epoch": 2162} {"train_loss": -6.223324775695801, "global_step": 90836, "epoch": 2162} {"train_loss": -6.230639457702637, "global_step": 90837, "epoch": 2162} {"train_loss": -6.331586837768555, "global_step": 90838, "epoch": 2162} {"train_loss": -6.265398025512695, "global_step": 90839, "epoch": 2162} {"train_loss": -6.252025127410889, "global_step": 90840, "epoch": 2162} {"train_loss": -6.291009902954102, "global_step": 90841, "epoch": 2162} {"train_loss": -6.208460330963135, "global_step": 90842, "epoch": 2162} {"train_loss": -6.346230506896973, "global_step": 90843, "epoch": 2162} {"train_loss": -6.298098087310791, "global_step": 90844, "epoch": 2162} {"train_loss": -6.274511745997837, "global_step": 90845, "epoch": 2162, "val_loss": 75589.5859375} {"train_loss": -6.33432674407959, "global_step": 90846, "epoch": 2163} {"train_loss": -6.1897430419921875, "global_step": 90847, "epoch": 2163} {"train_loss": -6.166661739349365, "global_step": 90848, "epoch": 2163} {"train_loss": -6.229531288146973, "global_step": 90849, "epoch": 2163} {"train_loss": -6.174250602722168, "global_step": 90850, "epoch": 2163} {"train_loss": -6.273010730743408, "global_step": 90851, "epoch": 2163} {"train_loss": -6.267916679382324, "global_step": 90852, "epoch": 2163} {"train_loss": -6.29088020324707, "global_step": 90853, "epoch": 2163} {"train_loss": -6.177369117736816, "global_step": 90854, "epoch": 2163} {"train_loss": -6.181315898895264, "global_step": 90855, "epoch": 2163} {"train_loss": -6.303835868835449, "global_step": 90856, "epoch": 2163} {"train_loss": -6.135239124298096, "global_step": 90857, "epoch": 2163} {"train_loss": -6.277557373046875, "global_step": 90858, "epoch": 2163} {"train_loss": -6.1857805252075195, "global_step": 90859, "epoch": 2163} {"train_loss": -6.31004524230957, "global_step": 90860, "epoch": 2163} {"train_loss": -6.188411235809326, "global_step": 90861, "epoch": 2163} {"train_loss": -6.312394142150879, "global_step": 90862, "epoch": 2163} {"train_loss": -6.207162857055664, "global_step": 90863, "epoch": 2163} {"train_loss": -6.34184455871582, "global_step": 90864, "epoch": 2163} {"train_loss": -6.257834434509277, "global_step": 90865, "epoch": 2163} {"train_loss": -6.09754753112793, "global_step": 90866, "epoch": 2163} {"train_loss": -6.264503002166748, "global_step": 90867, "epoch": 2163} {"train_loss": -6.276822090148926, "global_step": 90868, "epoch": 2163} {"train_loss": -6.146684646606445, "global_step": 90869, "epoch": 2163} {"train_loss": -6.142568588256836, "global_step": 90870, "epoch": 2163} {"train_loss": -6.292297840118408, "global_step": 90871, "epoch": 2163} {"train_loss": -6.196810722351074, "global_step": 90872, "epoch": 2163} {"train_loss": -6.2515997886657715, "global_step": 90873, "epoch": 2163} {"train_loss": -6.249780654907227, "global_step": 90874, "epoch": 2163} {"train_loss": -6.173954963684082, "global_step": 90875, "epoch": 2163} {"train_loss": -6.282313346862793, "global_step": 90876, "epoch": 2163} {"train_loss": -6.149631500244141, "global_step": 90877, "epoch": 2163} {"train_loss": -6.153345108032227, "global_step": 90878, "epoch": 2163} {"train_loss": -6.293854713439941, "global_step": 90879, "epoch": 2163} {"train_loss": -6.216404438018799, "global_step": 90880, "epoch": 2163} {"train_loss": -6.352872848510742, "global_step": 90881, "epoch": 2163} {"train_loss": -6.214461326599121, "global_step": 90882, "epoch": 2163} {"train_loss": -6.2238287925720215, "global_step": 90883, "epoch": 2163} {"train_loss": -6.350069999694824, "global_step": 90884, "epoch": 2163} {"train_loss": -6.265328407287598, "global_step": 90885, "epoch": 2163} {"train_loss": -6.229076385498047, "global_step": 90886, "epoch": 2163} {"train_loss": -6.2336824507940385, "global_step": 90887, "epoch": 2163, "val_loss": 75505.390625} {"train_loss": -6.2686767578125, "global_step": 90888, "epoch": 2164} {"train_loss": -6.254840850830078, "global_step": 90889, "epoch": 2164} {"train_loss": -6.265959739685059, "global_step": 90890, "epoch": 2164} {"train_loss": -6.173086643218994, "global_step": 90891, "epoch": 2164} {"train_loss": -6.265559196472168, "global_step": 90892, "epoch": 2164} {"train_loss": -6.302370548248291, "global_step": 90893, "epoch": 2164} {"train_loss": -6.226901054382324, "global_step": 90894, "epoch": 2164} {"train_loss": -6.239663124084473, "global_step": 90895, "epoch": 2164} {"train_loss": -6.243110179901123, "global_step": 90896, "epoch": 2164} {"train_loss": -6.257397651672363, "global_step": 90897, "epoch": 2164} {"train_loss": -6.185359954833984, "global_step": 90898, "epoch": 2164} {"train_loss": -6.267265319824219, "global_step": 90899, "epoch": 2164} {"train_loss": -6.185915946960449, "global_step": 90900, "epoch": 2164} {"train_loss": -6.195113182067871, "global_step": 90901, "epoch": 2164} {"train_loss": -6.214838981628418, "global_step": 90902, "epoch": 2164} {"train_loss": -6.28313684463501, "global_step": 90903, "epoch": 2164} {"train_loss": -6.253970146179199, "global_step": 90904, "epoch": 2164} {"train_loss": -6.332723617553711, "global_step": 90905, "epoch": 2164} {"train_loss": -6.355318069458008, "global_step": 90906, "epoch": 2164} {"train_loss": -6.267666816711426, "global_step": 90907, "epoch": 2164} {"train_loss": -6.275637149810791, "global_step": 90908, "epoch": 2164} {"train_loss": -6.257116794586182, "global_step": 90909, "epoch": 2164} {"train_loss": -6.3277764320373535, "global_step": 90910, "epoch": 2164} {"train_loss": -6.333331108093262, "global_step": 90911, "epoch": 2164} {"train_loss": -6.2478814125061035, "global_step": 90912, "epoch": 2164} {"train_loss": -6.424006462097168, "global_step": 90913, "epoch": 2164} {"train_loss": -6.390856742858887, "global_step": 90914, "epoch": 2164} {"train_loss": -6.266341209411621, "global_step": 90915, "epoch": 2164} {"train_loss": -6.3477020263671875, "global_step": 90916, "epoch": 2164} {"train_loss": -6.1601338386535645, "global_step": 90917, "epoch": 2164} {"train_loss": -6.113186836242676, "global_step": 90918, "epoch": 2164} {"train_loss": -6.192858695983887, "global_step": 90919, "epoch": 2164} {"train_loss": -6.368139266967773, "global_step": 90920, "epoch": 2164} {"train_loss": -6.1541876792907715, "global_step": 90921, "epoch": 2164} {"train_loss": -6.176360130310059, "global_step": 90922, "epoch": 2164} {"train_loss": -6.213102340698242, "global_step": 90923, "epoch": 2164} {"train_loss": -6.139039993286133, "global_step": 90924, "epoch": 2164} {"train_loss": -6.394852638244629, "global_step": 90925, "epoch": 2164} {"train_loss": -6.273079872131348, "global_step": 90926, "epoch": 2164} {"train_loss": -6.166062831878662, "global_step": 90927, "epoch": 2164} {"train_loss": -6.286396503448486, "global_step": 90928, "epoch": 2164} {"train_loss": -6.257374740782238, "global_step": 90929, "epoch": 2164, "val_loss": 75540.921875} {"train_loss": -6.26965856552124, "global_step": 90930, "epoch": 2165} {"train_loss": -6.290129661560059, "global_step": 90931, "epoch": 2165} {"train_loss": -6.331745147705078, "global_step": 90932, "epoch": 2165} {"train_loss": -6.269695281982422, "global_step": 90933, "epoch": 2165} {"train_loss": -6.3337016105651855, "global_step": 90934, "epoch": 2165} {"train_loss": -6.342257499694824, "global_step": 90935, "epoch": 2165} {"train_loss": -6.138849258422852, "global_step": 90936, "epoch": 2165} {"train_loss": -6.273608207702637, "global_step": 90937, "epoch": 2165} {"train_loss": -6.292541027069092, "global_step": 90938, "epoch": 2165} {"train_loss": -6.225364685058594, "global_step": 90939, "epoch": 2165} {"train_loss": -6.2634687423706055, "global_step": 90940, "epoch": 2165} {"train_loss": -6.11322546005249, "global_step": 90941, "epoch": 2165} {"train_loss": -6.330170631408691, "global_step": 90942, "epoch": 2165} {"train_loss": -6.248061180114746, "global_step": 90943, "epoch": 2165} {"train_loss": -6.263432502746582, "global_step": 90944, "epoch": 2165} {"train_loss": -6.255127906799316, "global_step": 90945, "epoch": 2165} {"train_loss": -6.252716541290283, "global_step": 90946, "epoch": 2165} {"train_loss": -6.140003204345703, "global_step": 90947, "epoch": 2165} {"train_loss": -6.348339080810547, "global_step": 90948, "epoch": 2165} {"train_loss": -6.318663597106934, "global_step": 90949, "epoch": 2165} {"train_loss": -6.261518478393555, "global_step": 90950, "epoch": 2165} {"train_loss": -6.264279365539551, "global_step": 90951, "epoch": 2165} {"train_loss": -6.26814079284668, "global_step": 90952, "epoch": 2165} {"train_loss": -6.197460651397705, "global_step": 90953, "epoch": 2165} {"train_loss": -6.129194736480713, "global_step": 90954, "epoch": 2165} {"train_loss": -6.205699920654297, "global_step": 90955, "epoch": 2165} {"train_loss": -6.206458568572998, "global_step": 90956, "epoch": 2165} {"train_loss": -6.171205043792725, "global_step": 90957, "epoch": 2165} {"train_loss": -6.289126396179199, "global_step": 90958, "epoch": 2165} {"train_loss": -6.090915679931641, "global_step": 90959, "epoch": 2165} {"train_loss": -6.087222576141357, "global_step": 90960, "epoch": 2165} {"train_loss": -6.205741882324219, "global_step": 90961, "epoch": 2165} {"train_loss": -6.202954292297363, "global_step": 90962, "epoch": 2165} {"train_loss": -6.270994186401367, "global_step": 90963, "epoch": 2165} {"train_loss": -6.23682975769043, "global_step": 90964, "epoch": 2165} {"train_loss": -6.214473724365234, "global_step": 90965, "epoch": 2165} {"train_loss": -6.085320472717285, "global_step": 90966, "epoch": 2165} {"train_loss": -6.329799652099609, "global_step": 90967, "epoch": 2165} {"train_loss": -6.265542984008789, "global_step": 90968, "epoch": 2165} {"train_loss": -6.278064727783203, "global_step": 90969, "epoch": 2165} {"train_loss": -6.282858848571777, "global_step": 90970, "epoch": 2165} {"train_loss": -6.242518390927996, "global_step": 90971, "epoch": 2165, "val_loss": 75207.5859375} {"train_loss": -6.218832015991211, "global_step": 90972, "epoch": 2166} {"train_loss": -6.177862167358398, "global_step": 90973, "epoch": 2166} {"train_loss": -6.31071138381958, "global_step": 90974, "epoch": 2166} {"train_loss": -6.193265914916992, "global_step": 90975, "epoch": 2166} {"train_loss": -6.359679222106934, "global_step": 90976, "epoch": 2166} {"train_loss": -6.275712966918945, "global_step": 90977, "epoch": 2166} {"train_loss": -6.403380393981934, "global_step": 90978, "epoch": 2166} {"train_loss": -6.451873779296875, "global_step": 90979, "epoch": 2166} {"train_loss": -6.188706398010254, "global_step": 90980, "epoch": 2166} {"train_loss": -6.260434627532959, "global_step": 90981, "epoch": 2166} {"train_loss": -6.27998161315918, "global_step": 90982, "epoch": 2166} {"train_loss": -6.231481075286865, "global_step": 90983, "epoch": 2166} {"train_loss": -6.166414737701416, "global_step": 90984, "epoch": 2166} {"train_loss": -6.237403869628906, "global_step": 90985, "epoch": 2166} {"train_loss": -6.358882904052734, "global_step": 90986, "epoch": 2166} {"train_loss": -6.262444019317627, "global_step": 90987, "epoch": 2166} {"train_loss": -6.372251987457275, "global_step": 90988, "epoch": 2166} {"train_loss": -6.294106483459473, "global_step": 90989, "epoch": 2166} {"train_loss": -6.107082366943359, "global_step": 90990, "epoch": 2166} {"train_loss": -6.180957794189453, "global_step": 90991, "epoch": 2166} {"train_loss": -6.3120927810668945, "global_step": 90992, "epoch": 2166} {"train_loss": -6.3266191482543945, "global_step": 90993, "epoch": 2166} {"train_loss": -6.197623252868652, "global_step": 90994, "epoch": 2166} {"train_loss": -6.180196762084961, "global_step": 90995, "epoch": 2166} {"train_loss": -6.317899703979492, "global_step": 90996, "epoch": 2166} {"train_loss": -6.23163366317749, "global_step": 90997, "epoch": 2166} {"train_loss": -6.204257965087891, "global_step": 90998, "epoch": 2166} {"train_loss": -6.358734130859375, "global_step": 90999, "epoch": 2166} {"train_loss": -6.255640029907227, "global_step": 91000, "epoch": 2166} {"train_loss": -6.090211868286133, "global_step": 91001, "epoch": 2166} {"train_loss": -6.397181510925293, "global_step": 91002, "epoch": 2166} {"train_loss": -6.178887367248535, "global_step": 91003, "epoch": 2166} {"train_loss": -6.225706577301025, "global_step": 91004, "epoch": 2166} {"train_loss": -6.302978515625, "global_step": 91005, "epoch": 2166} {"train_loss": -6.133989334106445, "global_step": 91006, "epoch": 2166} {"train_loss": -6.2498040199279785, "global_step": 91007, "epoch": 2166} {"train_loss": -6.275527000427246, "global_step": 91008, "epoch": 2166} {"train_loss": -6.210351467132568, "global_step": 91009, "epoch": 2166} {"train_loss": -6.362287998199463, "global_step": 91010, "epoch": 2166} {"train_loss": -6.2462921142578125, "global_step": 91011, "epoch": 2166} {"train_loss": -6.295304298400879, "global_step": 91012, "epoch": 2166} {"train_loss": -6.258931398391724, "global_step": 91013, "epoch": 2166, "val_loss": 75491.8046875} {"train_loss": -6.325834274291992, "global_step": 91014, "epoch": 2167} {"train_loss": -6.143996238708496, "global_step": 91015, "epoch": 2167} {"train_loss": -6.306910514831543, "global_step": 91016, "epoch": 2167} {"train_loss": -6.2273359298706055, "global_step": 91017, "epoch": 2167} {"train_loss": -6.276336669921875, "global_step": 91018, "epoch": 2167} {"train_loss": -6.1866865158081055, "global_step": 91019, "epoch": 2167} {"train_loss": -6.222087860107422, "global_step": 91020, "epoch": 2167} {"train_loss": -6.254124641418457, "global_step": 91021, "epoch": 2167} {"train_loss": -6.153334617614746, "global_step": 91022, "epoch": 2167} {"train_loss": -6.320080280303955, "global_step": 91023, "epoch": 2167} {"train_loss": -6.290242671966553, "global_step": 91024, "epoch": 2167} {"train_loss": -6.219567775726318, "global_step": 91025, "epoch": 2167} {"train_loss": -6.2160234451293945, "global_step": 91026, "epoch": 2167} {"train_loss": -6.313935279846191, "global_step": 91027, "epoch": 2167} {"train_loss": -6.199254035949707, "global_step": 91028, "epoch": 2167} {"train_loss": -6.275424957275391, "global_step": 91029, "epoch": 2167} {"train_loss": -6.152206897735596, "global_step": 91030, "epoch": 2167} {"train_loss": -6.331930160522461, "global_step": 91031, "epoch": 2167} {"train_loss": -6.276838779449463, "global_step": 91032, "epoch": 2167} {"train_loss": -6.22810697555542, "global_step": 91033, "epoch": 2167} {"train_loss": -6.270161151885986, "global_step": 91034, "epoch": 2167} {"train_loss": -6.3154706954956055, "global_step": 91035, "epoch": 2167} {"train_loss": -6.25274658203125, "global_step": 91036, "epoch": 2167} {"train_loss": -6.184756755828857, "global_step": 91037, "epoch": 2167} {"train_loss": -6.271604061126709, "global_step": 91038, "epoch": 2167} {"train_loss": -6.342683792114258, "global_step": 91039, "epoch": 2167} {"train_loss": -6.224765777587891, "global_step": 91040, "epoch": 2167} {"train_loss": -6.312150478363037, "global_step": 91041, "epoch": 2167} {"train_loss": -6.196949481964111, "global_step": 91042, "epoch": 2167} {"train_loss": -6.26190185546875, "global_step": 91043, "epoch": 2167} {"train_loss": -6.258106231689453, "global_step": 91044, "epoch": 2167} {"train_loss": -6.294098854064941, "global_step": 91045, "epoch": 2167} {"train_loss": -6.218740463256836, "global_step": 91046, "epoch": 2167} {"train_loss": -6.144109725952148, "global_step": 91047, "epoch": 2167} {"train_loss": -6.265687942504883, "global_step": 91048, "epoch": 2167} {"train_loss": -6.446201324462891, "global_step": 91049, "epoch": 2167} {"train_loss": -6.3539862632751465, "global_step": 91050, "epoch": 2167} {"train_loss": -6.308314323425293, "global_step": 91051, "epoch": 2167} {"train_loss": -6.403583526611328, "global_step": 91052, "epoch": 2167} {"train_loss": -6.376155376434326, "global_step": 91053, "epoch": 2167} {"train_loss": -6.180959701538086, "global_step": 91054, "epoch": 2167} {"train_loss": -6.265173719042823, "global_step": 91055, "epoch": 2167, "val_loss": 75542.71875} {"train_loss": -6.190088272094727, "global_step": 91056, "epoch": 2168} {"train_loss": -6.320810794830322, "global_step": 91057, "epoch": 2168} {"train_loss": -6.289409637451172, "global_step": 91058, "epoch": 2168} {"train_loss": -6.379645824432373, "global_step": 91059, "epoch": 2168} {"train_loss": -6.341694355010986, "global_step": 91060, "epoch": 2168} {"train_loss": -6.315971374511719, "global_step": 91061, "epoch": 2168} {"train_loss": -6.289052963256836, "global_step": 91062, "epoch": 2168} {"train_loss": -6.323533535003662, "global_step": 91063, "epoch": 2168} {"train_loss": -6.246068954467773, "global_step": 91064, "epoch": 2168} {"train_loss": -6.391124248504639, "global_step": 91065, "epoch": 2168} {"train_loss": -6.301905632019043, "global_step": 91066, "epoch": 2168} {"train_loss": -6.181680202484131, "global_step": 91067, "epoch": 2168} {"train_loss": -6.316056251525879, "global_step": 91068, "epoch": 2168} {"train_loss": -6.313162803649902, "global_step": 91069, "epoch": 2168} {"train_loss": -6.317404747009277, "global_step": 91070, "epoch": 2168} {"train_loss": -6.3556084632873535, "global_step": 91071, "epoch": 2168} {"train_loss": -6.35890007019043, "global_step": 91072, "epoch": 2168} {"train_loss": -6.281294822692871, "global_step": 91073, "epoch": 2168} {"train_loss": -6.223184585571289, "global_step": 91074, "epoch": 2168} {"train_loss": -6.31729793548584, "global_step": 91075, "epoch": 2168} {"train_loss": -6.340167999267578, "global_step": 91076, "epoch": 2168} {"train_loss": -6.265254020690918, "global_step": 91077, "epoch": 2168} {"train_loss": -6.285205841064453, "global_step": 91078, "epoch": 2168} {"train_loss": -6.34483528137207, "global_step": 91079, "epoch": 2168} {"train_loss": -6.235162258148193, "global_step": 91080, "epoch": 2168} {"train_loss": -6.262408256530762, "global_step": 91081, "epoch": 2168} {"train_loss": -6.345405101776123, "global_step": 91082, "epoch": 2168} {"train_loss": -6.378106117248535, "global_step": 91083, "epoch": 2168} {"train_loss": -6.324899673461914, "global_step": 91084, "epoch": 2168} {"train_loss": -6.2812652587890625, "global_step": 91085, "epoch": 2168} {"train_loss": -6.23881721496582, "global_step": 91086, "epoch": 2168} {"train_loss": -6.311645030975342, "global_step": 91087, "epoch": 2168} {"train_loss": -6.207815170288086, "global_step": 91088, "epoch": 2168} {"train_loss": -6.208297252655029, "global_step": 91089, "epoch": 2168} {"train_loss": -6.345155715942383, "global_step": 91090, "epoch": 2168} {"train_loss": -6.289763450622559, "global_step": 91091, "epoch": 2168} {"train_loss": -6.3745622634887695, "global_step": 91092, "epoch": 2168} {"train_loss": -6.281394004821777, "global_step": 91093, "epoch": 2168} {"train_loss": -6.183888912200928, "global_step": 91094, "epoch": 2168} {"train_loss": -6.18753719329834, "global_step": 91095, "epoch": 2168} {"train_loss": -6.240321636199951, "global_step": 91096, "epoch": 2168} {"train_loss": -6.293330113093059, "global_step": 91097, "epoch": 2168, "val_loss": 75525.1015625} {"train_loss": -6.236745357513428, "global_step": 91098, "epoch": 2169} {"train_loss": -6.211659908294678, "global_step": 91099, "epoch": 2169} {"train_loss": -6.248502731323242, "global_step": 91100, "epoch": 2169} {"train_loss": -6.228395938873291, "global_step": 91101, "epoch": 2169} {"train_loss": -6.257848739624023, "global_step": 91102, "epoch": 2169} {"train_loss": -6.308002471923828, "global_step": 91103, "epoch": 2169} {"train_loss": -6.311748504638672, "global_step": 91104, "epoch": 2169} {"train_loss": -6.304391860961914, "global_step": 91105, "epoch": 2169} {"train_loss": -6.355857849121094, "global_step": 91106, "epoch": 2169} {"train_loss": -6.272005558013916, "global_step": 91107, "epoch": 2169} {"train_loss": -6.246249198913574, "global_step": 91108, "epoch": 2169} {"train_loss": -6.235735893249512, "global_step": 91109, "epoch": 2169} {"train_loss": -6.322410583496094, "global_step": 91110, "epoch": 2169} {"train_loss": -6.397371292114258, "global_step": 91111, "epoch": 2169} {"train_loss": -6.2605977058410645, "global_step": 91112, "epoch": 2169} {"train_loss": -6.225069522857666, "global_step": 91113, "epoch": 2169} {"train_loss": -6.244112968444824, "global_step": 91114, "epoch": 2169} {"train_loss": -6.288270950317383, "global_step": 91115, "epoch": 2169} {"train_loss": -6.15839958190918, "global_step": 91116, "epoch": 2169} {"train_loss": -6.3241472244262695, "global_step": 91117, "epoch": 2169} {"train_loss": -6.289851665496826, "global_step": 91118, "epoch": 2169} {"train_loss": -6.207834243774414, "global_step": 91119, "epoch": 2169} {"train_loss": -6.302845001220703, "global_step": 91120, "epoch": 2169} {"train_loss": -6.222769737243652, "global_step": 91121, "epoch": 2169} {"train_loss": -6.347500801086426, "global_step": 91122, "epoch": 2169} {"train_loss": -6.259607315063477, "global_step": 91123, "epoch": 2169} {"train_loss": -6.213924407958984, "global_step": 91124, "epoch": 2169} {"train_loss": -6.282411575317383, "global_step": 91125, "epoch": 2169} {"train_loss": -6.323107719421387, "global_step": 91126, "epoch": 2169} {"train_loss": -6.326459884643555, "global_step": 91127, "epoch": 2169} {"train_loss": -6.250036239624023, "global_step": 91128, "epoch": 2169} {"train_loss": -6.238086700439453, "global_step": 91129, "epoch": 2169} {"train_loss": -6.269093036651611, "global_step": 91130, "epoch": 2169} {"train_loss": -6.1830549240112305, "global_step": 91131, "epoch": 2169} {"train_loss": -6.27695369720459, "global_step": 91132, "epoch": 2169} {"train_loss": -6.341933250427246, "global_step": 91133, "epoch": 2169} {"train_loss": -6.273191452026367, "global_step": 91134, "epoch": 2169} {"train_loss": -6.2344183921813965, "global_step": 91135, "epoch": 2169} {"train_loss": -6.24080228805542, "global_step": 91136, "epoch": 2169} {"train_loss": -6.249931812286377, "global_step": 91137, "epoch": 2169} {"train_loss": -6.292028903961182, "global_step": 91138, "epoch": 2169} {"train_loss": -6.271125214440482, "global_step": 91139, "epoch": 2169, "val_loss": 75389.4921875} {"train_loss": -6.360143661499023, "global_step": 91140, "epoch": 2170} {"train_loss": -6.28063440322876, "global_step": 91141, "epoch": 2170} {"train_loss": -6.41732120513916, "global_step": 91142, "epoch": 2170} {"train_loss": -6.284330368041992, "global_step": 91143, "epoch": 2170} {"train_loss": -6.277041435241699, "global_step": 91144, "epoch": 2170} {"train_loss": -6.126360893249512, "global_step": 91145, "epoch": 2170} {"train_loss": -6.255699157714844, "global_step": 91146, "epoch": 2170} {"train_loss": -6.225472450256348, "global_step": 91147, "epoch": 2170} {"train_loss": -6.129766464233398, "global_step": 91148, "epoch": 2170} {"train_loss": -6.184779644012451, "global_step": 91149, "epoch": 2170} {"train_loss": -6.230082035064697, "global_step": 91150, "epoch": 2170} {"train_loss": -6.227943420410156, "global_step": 91151, "epoch": 2170} {"train_loss": -6.257926940917969, "global_step": 91152, "epoch": 2170} {"train_loss": -6.270203113555908, "global_step": 91153, "epoch": 2170} {"train_loss": -6.23984432220459, "global_step": 91154, "epoch": 2170} {"train_loss": -6.344036102294922, "global_step": 91155, "epoch": 2170} {"train_loss": -6.349832057952881, "global_step": 91156, "epoch": 2170} {"train_loss": -6.161762237548828, "global_step": 91157, "epoch": 2170} {"train_loss": -6.215370178222656, "global_step": 91158, "epoch": 2170} {"train_loss": -6.307584285736084, "global_step": 91159, "epoch": 2170} {"train_loss": -6.249001979827881, "global_step": 91160, "epoch": 2170} {"train_loss": -6.295110702514648, "global_step": 91161, "epoch": 2170} {"train_loss": -6.284451484680176, "global_step": 91162, "epoch": 2170} {"train_loss": -6.215005874633789, "global_step": 91163, "epoch": 2170} {"train_loss": -6.216434478759766, "global_step": 91164, "epoch": 2170} {"train_loss": -6.188360691070557, "global_step": 91165, "epoch": 2170} {"train_loss": -6.2580461502075195, "global_step": 91166, "epoch": 2170} {"train_loss": -6.1630659103393555, "global_step": 91167, "epoch": 2170} {"train_loss": -6.315422058105469, "global_step": 91168, "epoch": 2170} {"train_loss": -6.234072685241699, "global_step": 91169, "epoch": 2170} {"train_loss": -6.281167030334473, "global_step": 91170, "epoch": 2170} {"train_loss": -6.299886703491211, "global_step": 91171, "epoch": 2170} {"train_loss": -6.282721519470215, "global_step": 91172, "epoch": 2170} {"train_loss": -6.284327030181885, "global_step": 91173, "epoch": 2170} {"train_loss": -6.2763824462890625, "global_step": 91174, "epoch": 2170} {"train_loss": -6.291504383087158, "global_step": 91175, "epoch": 2170} {"train_loss": -6.197472095489502, "global_step": 91176, "epoch": 2170} {"train_loss": -6.1209917068481445, "global_step": 91177, "epoch": 2170} {"train_loss": -6.250274658203125, "global_step": 91178, "epoch": 2170} {"train_loss": -6.141313552856445, "global_step": 91179, "epoch": 2170} {"train_loss": -6.233654022216797, "global_step": 91180, "epoch": 2170} {"train_loss": -6.246631406602406, "global_step": 91181, "epoch": 2170, "val_loss": 75465.109375} {"train_loss": -6.230297088623047, "global_step": 91182, "epoch": 2171} {"train_loss": -6.198386192321777, "global_step": 91183, "epoch": 2171} {"train_loss": -6.2953596115112305, "global_step": 91184, "epoch": 2171} {"train_loss": -6.340910911560059, "global_step": 91185, "epoch": 2171} {"train_loss": -6.262729644775391, "global_step": 91186, "epoch": 2171} {"train_loss": -6.285456657409668, "global_step": 91187, "epoch": 2171} {"train_loss": -6.202449798583984, "global_step": 91188, "epoch": 2171} {"train_loss": -6.284090042114258, "global_step": 91189, "epoch": 2171} {"train_loss": -6.242277145385742, "global_step": 91190, "epoch": 2171} {"train_loss": -6.3495378494262695, "global_step": 91191, "epoch": 2171} {"train_loss": -6.339652061462402, "global_step": 91192, "epoch": 2171} {"train_loss": -6.296638488769531, "global_step": 91193, "epoch": 2171} {"train_loss": -6.27492618560791, "global_step": 91194, "epoch": 2171} {"train_loss": -6.256136894226074, "global_step": 91195, "epoch": 2171} {"train_loss": -6.2217512130737305, "global_step": 91196, "epoch": 2171} {"train_loss": -6.304487228393555, "global_step": 91197, "epoch": 2171} {"train_loss": -6.354369640350342, "global_step": 91198, "epoch": 2171} {"train_loss": -6.264039039611816, "global_step": 91199, "epoch": 2171} {"train_loss": -6.199019908905029, "global_step": 91200, "epoch": 2171} {"train_loss": -6.226616859436035, "global_step": 91201, "epoch": 2171} {"train_loss": -6.265941619873047, "global_step": 91202, "epoch": 2171} {"train_loss": -6.400308609008789, "global_step": 91203, "epoch": 2171} {"train_loss": -6.180639743804932, "global_step": 91204, "epoch": 2171} {"train_loss": -6.252523422241211, "global_step": 91205, "epoch": 2171} {"train_loss": -6.252340316772461, "global_step": 91206, "epoch": 2171} {"train_loss": -6.294028282165527, "global_step": 91207, "epoch": 2171} {"train_loss": -6.270411968231201, "global_step": 91208, "epoch": 2171} {"train_loss": -6.198041915893555, "global_step": 91209, "epoch": 2171} {"train_loss": -6.157875061035156, "global_step": 91210, "epoch": 2171} {"train_loss": -6.23401403427124, "global_step": 91211, "epoch": 2171} {"train_loss": -6.283298492431641, "global_step": 91212, "epoch": 2171} {"train_loss": -6.3178582191467285, "global_step": 91213, "epoch": 2171} {"train_loss": -6.10202693939209, "global_step": 91214, "epoch": 2171} {"train_loss": -6.267517566680908, "global_step": 91215, "epoch": 2171} {"train_loss": -6.209724426269531, "global_step": 91216, "epoch": 2171} {"train_loss": -6.1405792236328125, "global_step": 91217, "epoch": 2171} {"train_loss": -6.285094261169434, "global_step": 91218, "epoch": 2171} {"train_loss": -6.146102428436279, "global_step": 91219, "epoch": 2171} {"train_loss": -6.029875755310059, "global_step": 91220, "epoch": 2171} {"train_loss": -6.156590461730957, "global_step": 91221, "epoch": 2171} {"train_loss": -6.157902240753174, "global_step": 91222, "epoch": 2171} {"train_loss": -6.2449969337100075, "global_step": 91223, "epoch": 2171, "val_loss": 75598.921875} {"train_loss": -6.109804153442383, "global_step": 91224, "epoch": 2172} {"train_loss": -6.1383514404296875, "global_step": 91225, "epoch": 2172} {"train_loss": -6.295072555541992, "global_step": 91226, "epoch": 2172} {"train_loss": -6.090024948120117, "global_step": 91227, "epoch": 2172} {"train_loss": -6.225368022918701, "global_step": 91228, "epoch": 2172} {"train_loss": -6.266465187072754, "global_step": 91229, "epoch": 2172} {"train_loss": -6.227754592895508, "global_step": 91230, "epoch": 2172} {"train_loss": -6.260650634765625, "global_step": 91231, "epoch": 2172} {"train_loss": -6.297170639038086, "global_step": 91232, "epoch": 2172} {"train_loss": -6.171247959136963, "global_step": 91233, "epoch": 2172} {"train_loss": -6.211240291595459, "global_step": 91234, "epoch": 2172} {"train_loss": -6.22331428527832, "global_step": 91235, "epoch": 2172} {"train_loss": -6.252305507659912, "global_step": 91236, "epoch": 2172} {"train_loss": -6.266257286071777, "global_step": 91237, "epoch": 2172} {"train_loss": -6.22975492477417, "global_step": 91238, "epoch": 2172} {"train_loss": -6.180324554443359, "global_step": 91239, "epoch": 2172} {"train_loss": -6.277242183685303, "global_step": 91240, "epoch": 2172} {"train_loss": -6.211794853210449, "global_step": 91241, "epoch": 2172} {"train_loss": -6.2019572257995605, "global_step": 91242, "epoch": 2172} {"train_loss": -6.380956649780273, "global_step": 91243, "epoch": 2172} {"train_loss": -6.327231407165527, "global_step": 91244, "epoch": 2172} {"train_loss": -6.198814868927002, "global_step": 91245, "epoch": 2172} {"train_loss": -6.256770133972168, "global_step": 91246, "epoch": 2172} {"train_loss": -6.384618759155273, "global_step": 91247, "epoch": 2172} {"train_loss": -6.123753070831299, "global_step": 91248, "epoch": 2172} {"train_loss": -6.33888053894043, "global_step": 91249, "epoch": 2172} {"train_loss": -6.269293785095215, "global_step": 91250, "epoch": 2172} {"train_loss": -6.2348527908325195, "global_step": 91251, "epoch": 2172} {"train_loss": -6.252223014831543, "global_step": 91252, "epoch": 2172} {"train_loss": -6.347663879394531, "global_step": 91253, "epoch": 2172} {"train_loss": -6.105655670166016, "global_step": 91254, "epoch": 2172} {"train_loss": -6.317946434020996, "global_step": 91255, "epoch": 2172} {"train_loss": -6.287450313568115, "global_step": 91256, "epoch": 2172} {"train_loss": -6.308967590332031, "global_step": 91257, "epoch": 2172} {"train_loss": -6.191248416900635, "global_step": 91258, "epoch": 2172} {"train_loss": -6.227595329284668, "global_step": 91259, "epoch": 2172} {"train_loss": -6.324243545532227, "global_step": 91260, "epoch": 2172} {"train_loss": -6.355090618133545, "global_step": 91261, "epoch": 2172} {"train_loss": -6.205498695373535, "global_step": 91262, "epoch": 2172} {"train_loss": -6.1773834228515625, "global_step": 91263, "epoch": 2172} {"train_loss": -6.188753128051758, "global_step": 91264, "epoch": 2172} {"train_loss": -6.24490077154977, "global_step": 91265, "epoch": 2172, "val_loss": 75481.6328125} {"train_loss": -6.236047744750977, "global_step": 91266, "epoch": 2173} {"train_loss": -6.312861919403076, "global_step": 91267, "epoch": 2173} {"train_loss": -6.3417229652404785, "global_step": 91268, "epoch": 2173} {"train_loss": -6.197127342224121, "global_step": 91269, "epoch": 2173} {"train_loss": -6.215730667114258, "global_step": 91270, "epoch": 2173} {"train_loss": -6.241698265075684, "global_step": 91271, "epoch": 2173} {"train_loss": -6.183243751525879, "global_step": 91272, "epoch": 2173} {"train_loss": -6.361641883850098, "global_step": 91273, "epoch": 2173} {"train_loss": -6.253219127655029, "global_step": 91274, "epoch": 2173} {"train_loss": -6.176515579223633, "global_step": 91275, "epoch": 2173} {"train_loss": -6.288365364074707, "global_step": 91276, "epoch": 2173} {"train_loss": -6.362103462219238, "global_step": 91277, "epoch": 2173} {"train_loss": -6.245126247406006, "global_step": 91278, "epoch": 2173} {"train_loss": -6.219429969787598, "global_step": 91279, "epoch": 2173} {"train_loss": -6.285280227661133, "global_step": 91280, "epoch": 2173} {"train_loss": -6.327299118041992, "global_step": 91281, "epoch": 2173} {"train_loss": -6.2913641929626465, "global_step": 91282, "epoch": 2173} {"train_loss": -6.240375518798828, "global_step": 91283, "epoch": 2173} {"train_loss": -6.300324440002441, "global_step": 91284, "epoch": 2173} {"train_loss": -6.198437690734863, "global_step": 91285, "epoch": 2173} {"train_loss": -6.264347076416016, "global_step": 91286, "epoch": 2173} {"train_loss": -6.145084857940674, "global_step": 91287, "epoch": 2173} {"train_loss": -6.244068622589111, "global_step": 91288, "epoch": 2173} {"train_loss": -6.209734916687012, "global_step": 91289, "epoch": 2173} {"train_loss": -6.179139137268066, "global_step": 91290, "epoch": 2173} {"train_loss": -6.231529712677002, "global_step": 91291, "epoch": 2173} {"train_loss": -6.335915565490723, "global_step": 91292, "epoch": 2173} {"train_loss": -6.156418323516846, "global_step": 91293, "epoch": 2173} {"train_loss": -6.162942886352539, "global_step": 91294, "epoch": 2173} {"train_loss": -6.1425628662109375, "global_step": 91295, "epoch": 2173} {"train_loss": -6.31953763961792, "global_step": 91296, "epoch": 2173} {"train_loss": -6.199929237365723, "global_step": 91297, "epoch": 2173} {"train_loss": -6.187227249145508, "global_step": 91298, "epoch": 2173} {"train_loss": -6.212467670440674, "global_step": 91299, "epoch": 2173} {"train_loss": -6.219486236572266, "global_step": 91300, "epoch": 2173} {"train_loss": -6.2306718826293945, "global_step": 91301, "epoch": 2173} {"train_loss": -6.185830116271973, "global_step": 91302, "epoch": 2173} {"train_loss": -6.265214920043945, "global_step": 91303, "epoch": 2173} {"train_loss": -6.303912162780762, "global_step": 91304, "epoch": 2173} {"train_loss": -6.2171196937561035, "global_step": 91305, "epoch": 2173} {"train_loss": -6.197673797607422, "global_step": 91306, "epoch": 2173} {"train_loss": -6.242399283817837, "global_step": 91307, "epoch": 2173, "val_loss": 75216.2421875} {"train_loss": -6.266798973083496, "global_step": 91308, "epoch": 2174} {"train_loss": -6.210131645202637, "global_step": 91309, "epoch": 2174} {"train_loss": -6.242839813232422, "global_step": 91310, "epoch": 2174} {"train_loss": -6.257002830505371, "global_step": 91311, "epoch": 2174} {"train_loss": -6.240138530731201, "global_step": 91312, "epoch": 2174} {"train_loss": -6.251053810119629, "global_step": 91313, "epoch": 2174} {"train_loss": -6.363563537597656, "global_step": 91314, "epoch": 2174} {"train_loss": -6.293551445007324, "global_step": 91315, "epoch": 2174} {"train_loss": -6.289783477783203, "global_step": 91316, "epoch": 2174} {"train_loss": -6.233709812164307, "global_step": 91317, "epoch": 2174} {"train_loss": -6.362757682800293, "global_step": 91318, "epoch": 2174} {"train_loss": -6.29322624206543, "global_step": 91319, "epoch": 2174} {"train_loss": -6.3326640129089355, "global_step": 91320, "epoch": 2174} {"train_loss": -6.266169548034668, "global_step": 91321, "epoch": 2174} {"train_loss": -6.307394027709961, "global_step": 91322, "epoch": 2174} {"train_loss": -6.219801902770996, "global_step": 91323, "epoch": 2174} {"train_loss": -6.4275617599487305, "global_step": 91324, "epoch": 2174} {"train_loss": -6.272758960723877, "global_step": 91325, "epoch": 2174} {"train_loss": -6.207163333892822, "global_step": 91326, "epoch": 2174} {"train_loss": -6.233790397644043, "global_step": 91327, "epoch": 2174} {"train_loss": -6.1980133056640625, "global_step": 91328, "epoch": 2174} {"train_loss": -6.195650100708008, "global_step": 91329, "epoch": 2174} {"train_loss": -6.191421031951904, "global_step": 91330, "epoch": 2174} {"train_loss": -6.236525535583496, "global_step": 91331, "epoch": 2174} {"train_loss": -6.3021392822265625, "global_step": 91332, "epoch": 2174} {"train_loss": -6.344548225402832, "global_step": 91333, "epoch": 2174} {"train_loss": -6.251204490661621, "global_step": 91334, "epoch": 2174} {"train_loss": -6.250125885009766, "global_step": 91335, "epoch": 2174} {"train_loss": -6.222775936126709, "global_step": 91336, "epoch": 2174} {"train_loss": -6.35968542098999, "global_step": 91337, "epoch": 2174} {"train_loss": -6.28106689453125, "global_step": 91338, "epoch": 2174} {"train_loss": -6.225049018859863, "global_step": 91339, "epoch": 2174} {"train_loss": -6.29840612411499, "global_step": 91340, "epoch": 2174} {"train_loss": -6.2306365966796875, "global_step": 91341, "epoch": 2174} {"train_loss": -6.2502617835998535, "global_step": 91342, "epoch": 2174} {"train_loss": -6.301051616668701, "global_step": 91343, "epoch": 2174} {"train_loss": -6.257092475891113, "global_step": 91344, "epoch": 2174} {"train_loss": -6.336014270782471, "global_step": 91345, "epoch": 2174} {"train_loss": -6.316082954406738, "global_step": 91346, "epoch": 2174} {"train_loss": -6.2773942947387695, "global_step": 91347, "epoch": 2174} {"train_loss": -6.3853559494018555, "global_step": 91348, "epoch": 2174} {"train_loss": -6.277187676656814, "global_step": 91349, "epoch": 2174, "val_loss": 75394.875} {"train_loss": -6.336981773376465, "global_step": 91350, "epoch": 2175} {"train_loss": -6.209730625152588, "global_step": 91351, "epoch": 2175} {"train_loss": -6.286538124084473, "global_step": 91352, "epoch": 2175} {"train_loss": -6.341047286987305, "global_step": 91353, "epoch": 2175} {"train_loss": -6.283318519592285, "global_step": 91354, "epoch": 2175} {"train_loss": -6.2897772789001465, "global_step": 91355, "epoch": 2175} {"train_loss": -6.256913185119629, "global_step": 91356, "epoch": 2175} {"train_loss": -6.251526832580566, "global_step": 91357, "epoch": 2175} {"train_loss": -6.359161376953125, "global_step": 91358, "epoch": 2175} {"train_loss": -6.178489685058594, "global_step": 91359, "epoch": 2175} {"train_loss": -6.37140417098999, "global_step": 91360, "epoch": 2175} {"train_loss": -6.135379791259766, "global_step": 91361, "epoch": 2175} {"train_loss": -6.252795219421387, "global_step": 91362, "epoch": 2175} {"train_loss": -6.162641525268555, "global_step": 91363, "epoch": 2175} {"train_loss": -6.1809868812561035, "global_step": 91364, "epoch": 2175} {"train_loss": -6.286558151245117, "global_step": 91365, "epoch": 2175} {"train_loss": -6.217765808105469, "global_step": 91366, "epoch": 2175} {"train_loss": -6.035910129547119, "global_step": 91367, "epoch": 2175} {"train_loss": -6.0918684005737305, "global_step": 91368, "epoch": 2175} {"train_loss": -6.127032279968262, "global_step": 91369, "epoch": 2175} {"train_loss": -6.145451545715332, "global_step": 91370, "epoch": 2175} {"train_loss": -6.249560356140137, "global_step": 91371, "epoch": 2175} {"train_loss": -6.314301490783691, "global_step": 91372, "epoch": 2175} {"train_loss": -6.1722283363342285, "global_step": 91373, "epoch": 2175} {"train_loss": -6.135311603546143, "global_step": 91374, "epoch": 2175} {"train_loss": -6.184115409851074, "global_step": 91375, "epoch": 2175} {"train_loss": -6.11745548248291, "global_step": 91376, "epoch": 2175} {"train_loss": -6.218393325805664, "global_step": 91377, "epoch": 2175} {"train_loss": -6.195926189422607, "global_step": 91378, "epoch": 2175} {"train_loss": -6.025500774383545, "global_step": 91379, "epoch": 2175} {"train_loss": -6.277228355407715, "global_step": 91380, "epoch": 2175} {"train_loss": -6.153862476348877, "global_step": 91381, "epoch": 2175} {"train_loss": -6.339835166931152, "global_step": 91382, "epoch": 2175} {"train_loss": -6.206426620483398, "global_step": 91383, "epoch": 2175} {"train_loss": -6.230738162994385, "global_step": 91384, "epoch": 2175} {"train_loss": -6.237688064575195, "global_step": 91385, "epoch": 2175} {"train_loss": -6.080852031707764, "global_step": 91386, "epoch": 2175} {"train_loss": -6.202588081359863, "global_step": 91387, "epoch": 2175} {"train_loss": -6.08342981338501, "global_step": 91388, "epoch": 2175} {"train_loss": -6.333244323730469, "global_step": 91389, "epoch": 2175} {"train_loss": -6.16370964050293, "global_step": 91390, "epoch": 2175} {"train_loss": -6.211435533705211, "global_step": 91391, "epoch": 2175, "val_loss": 75426.3671875} {"train_loss": -6.22305965423584, "global_step": 91392, "epoch": 2176} {"train_loss": -6.297778129577637, "global_step": 91393, "epoch": 2176} {"train_loss": -6.213332653045654, "global_step": 91394, "epoch": 2176} {"train_loss": -6.127279281616211, "global_step": 91395, "epoch": 2176} {"train_loss": -6.237220764160156, "global_step": 91396, "epoch": 2176} {"train_loss": -6.228179931640625, "global_step": 91397, "epoch": 2176} {"train_loss": -6.221602439880371, "global_step": 91398, "epoch": 2176} {"train_loss": -6.244732856750488, "global_step": 91399, "epoch": 2176} {"train_loss": -6.335432052612305, "global_step": 91400, "epoch": 2176} {"train_loss": -6.3328046798706055, "global_step": 91401, "epoch": 2176} {"train_loss": -6.294632911682129, "global_step": 91402, "epoch": 2176} {"train_loss": -6.206024169921875, "global_step": 91403, "epoch": 2176} {"train_loss": -6.27862548828125, "global_step": 91404, "epoch": 2176} {"train_loss": -6.287435531616211, "global_step": 91405, "epoch": 2176} {"train_loss": -6.250047206878662, "global_step": 91406, "epoch": 2176} {"train_loss": -6.338274955749512, "global_step": 91407, "epoch": 2176} {"train_loss": -6.167753219604492, "global_step": 91408, "epoch": 2176} {"train_loss": -6.239690780639648, "global_step": 91409, "epoch": 2176} {"train_loss": -6.262876033782959, "global_step": 91410, "epoch": 2176} {"train_loss": -6.220844268798828, "global_step": 91411, "epoch": 2176} {"train_loss": -6.267764091491699, "global_step": 91412, "epoch": 2176} {"train_loss": -6.284538269042969, "global_step": 91413, "epoch": 2176} {"train_loss": -6.173210144042969, "global_step": 91414, "epoch": 2176} {"train_loss": -6.1740288734436035, "global_step": 91415, "epoch": 2176} {"train_loss": -6.239026069641113, "global_step": 91416, "epoch": 2176} {"train_loss": -6.177298545837402, "global_step": 91417, "epoch": 2176} {"train_loss": -6.240016937255859, "global_step": 91418, "epoch": 2176} {"train_loss": -6.214698314666748, "global_step": 91419, "epoch": 2176} {"train_loss": -6.104591369628906, "global_step": 91420, "epoch": 2176} {"train_loss": -6.272183418273926, "global_step": 91421, "epoch": 2176} {"train_loss": -6.312573432922363, "global_step": 91422, "epoch": 2176} {"train_loss": -6.256452560424805, "global_step": 91423, "epoch": 2176} {"train_loss": -6.212410926818848, "global_step": 91424, "epoch": 2176} {"train_loss": -6.141201972961426, "global_step": 91425, "epoch": 2176} {"train_loss": -6.296152114868164, "global_step": 91426, "epoch": 2176} {"train_loss": -6.2658843994140625, "global_step": 91427, "epoch": 2176} {"train_loss": -6.231100559234619, "global_step": 91428, "epoch": 2176} {"train_loss": -6.2536420822143555, "global_step": 91429, "epoch": 2176} {"train_loss": -6.168084621429443, "global_step": 91430, "epoch": 2176} {"train_loss": -6.250434875488281, "global_step": 91431, "epoch": 2176} {"train_loss": -6.204812049865723, "global_step": 91432, "epoch": 2176} {"train_loss": -6.237394026347569, "global_step": 91433, "epoch": 2176, "val_loss": 75562.328125} {"train_loss": -6.276533126831055, "global_step": 91434, "epoch": 2177} {"train_loss": -6.234760284423828, "global_step": 91435, "epoch": 2177} {"train_loss": -6.023348808288574, "global_step": 91436, "epoch": 2177} {"train_loss": -6.345553398132324, "global_step": 91437, "epoch": 2177} {"train_loss": -6.2102885246276855, "global_step": 91438, "epoch": 2177} {"train_loss": -6.1999921798706055, "global_step": 91439, "epoch": 2177} {"train_loss": -6.158506393432617, "global_step": 91440, "epoch": 2177} {"train_loss": -6.261776924133301, "global_step": 91441, "epoch": 2177} {"train_loss": -6.176600933074951, "global_step": 91442, "epoch": 2177} {"train_loss": -6.277921676635742, "global_step": 91443, "epoch": 2177} {"train_loss": -6.344964981079102, "global_step": 91444, "epoch": 2177} {"train_loss": -6.154574394226074, "global_step": 91445, "epoch": 2177} {"train_loss": -6.230410575866699, "global_step": 91446, "epoch": 2177} {"train_loss": -6.286210060119629, "global_step": 91447, "epoch": 2177} {"train_loss": -6.2847394943237305, "global_step": 91448, "epoch": 2177} {"train_loss": -6.257134437561035, "global_step": 91449, "epoch": 2177} {"train_loss": -6.321043014526367, "global_step": 91450, "epoch": 2177} {"train_loss": -6.253498077392578, "global_step": 91451, "epoch": 2177} {"train_loss": -6.314034461975098, "global_step": 91452, "epoch": 2177} {"train_loss": -6.288397789001465, "global_step": 91453, "epoch": 2177} {"train_loss": -6.24832010269165, "global_step": 91454, "epoch": 2177} {"train_loss": -6.204415321350098, "global_step": 91455, "epoch": 2177} {"train_loss": -6.286710739135742, "global_step": 91456, "epoch": 2177} {"train_loss": -6.244305610656738, "global_step": 91457, "epoch": 2177} {"train_loss": -6.32123327255249, "global_step": 91458, "epoch": 2177} {"train_loss": -6.3033671379089355, "global_step": 91459, "epoch": 2177} {"train_loss": -6.316944122314453, "global_step": 91460, "epoch": 2177} {"train_loss": -6.395058631896973, "global_step": 91461, "epoch": 2177} {"train_loss": -6.34809684753418, "global_step": 91462, "epoch": 2177} {"train_loss": -6.320705413818359, "global_step": 91463, "epoch": 2177} {"train_loss": -6.280946254730225, "global_step": 91464, "epoch": 2177} {"train_loss": -6.397973537445068, "global_step": 91465, "epoch": 2177} {"train_loss": -6.319633483886719, "global_step": 91466, "epoch": 2177} {"train_loss": -6.354636192321777, "global_step": 91467, "epoch": 2177} {"train_loss": -6.2632951736450195, "global_step": 91468, "epoch": 2177} {"train_loss": -6.3292765617370605, "global_step": 91469, "epoch": 2177} {"train_loss": -6.293252944946289, "global_step": 91470, "epoch": 2177} {"train_loss": -6.22237491607666, "global_step": 91471, "epoch": 2177} {"train_loss": -6.3614888191223145, "global_step": 91472, "epoch": 2177} {"train_loss": -6.27303409576416, "global_step": 91473, "epoch": 2177} {"train_loss": -6.235049724578857, "global_step": 91474, "epoch": 2177} {"train_loss": -6.271023364294143, "global_step": 91475, "epoch": 2177, "val_loss": 75345.953125} {"train_loss": -6.254762172698975, "global_step": 91476, "epoch": 2178} {"train_loss": -6.267719745635986, "global_step": 91477, "epoch": 2178} {"train_loss": -6.170771598815918, "global_step": 91478, "epoch": 2178} {"train_loss": -6.293111801147461, "global_step": 91479, "epoch": 2178} {"train_loss": -6.321710586547852, "global_step": 91480, "epoch": 2178} {"train_loss": -6.2507476806640625, "global_step": 91481, "epoch": 2178} {"train_loss": -6.207371234893799, "global_step": 91482, "epoch": 2178} {"train_loss": -6.049927711486816, "global_step": 91483, "epoch": 2178} {"train_loss": -6.247095584869385, "global_step": 91484, "epoch": 2178} {"train_loss": -6.081976890563965, "global_step": 91485, "epoch": 2178} {"train_loss": -6.188858985900879, "global_step": 91486, "epoch": 2178} {"train_loss": -6.169623851776123, "global_step": 91487, "epoch": 2178} {"train_loss": -6.118376731872559, "global_step": 91488, "epoch": 2178} {"train_loss": -6.209102153778076, "global_step": 91489, "epoch": 2178} {"train_loss": -6.101007461547852, "global_step": 91490, "epoch": 2178} {"train_loss": -6.24680233001709, "global_step": 91491, "epoch": 2178} {"train_loss": -6.310447692871094, "global_step": 91492, "epoch": 2178} {"train_loss": -6.176902770996094, "global_step": 91493, "epoch": 2178} {"train_loss": -6.367245197296143, "global_step": 91494, "epoch": 2178} {"train_loss": -6.229283809661865, "global_step": 91495, "epoch": 2178} {"train_loss": -6.1698126792907715, "global_step": 91496, "epoch": 2178} {"train_loss": -6.100257873535156, "global_step": 91497, "epoch": 2178} {"train_loss": -6.2916789054870605, "global_step": 91498, "epoch": 2178} {"train_loss": -6.327916622161865, "global_step": 91499, "epoch": 2178} {"train_loss": -6.303122520446777, "global_step": 91500, "epoch": 2178} {"train_loss": -6.114377021789551, "global_step": 91501, "epoch": 2178} {"train_loss": -6.221800804138184, "global_step": 91502, "epoch": 2178} {"train_loss": -6.17067813873291, "global_step": 91503, "epoch": 2178} {"train_loss": -6.354280948638916, "global_step": 91504, "epoch": 2178} {"train_loss": -6.296749114990234, "global_step": 91505, "epoch": 2178} {"train_loss": -6.2292633056640625, "global_step": 91506, "epoch": 2178} {"train_loss": -6.288692474365234, "global_step": 91507, "epoch": 2178} {"train_loss": -6.194789409637451, "global_step": 91508, "epoch": 2178} {"train_loss": -6.269186973571777, "global_step": 91509, "epoch": 2178} {"train_loss": -6.211186408996582, "global_step": 91510, "epoch": 2178} {"train_loss": -6.277390480041504, "global_step": 91511, "epoch": 2178} {"train_loss": -6.305768966674805, "global_step": 91512, "epoch": 2178} {"train_loss": -6.313000679016113, "global_step": 91513, "epoch": 2178} {"train_loss": -6.410327434539795, "global_step": 91514, "epoch": 2178} {"train_loss": -6.352948188781738, "global_step": 91515, "epoch": 2178} {"train_loss": -6.260751724243164, "global_step": 91516, "epoch": 2178} {"train_loss": -6.236254816963559, "global_step": 91517, "epoch": 2178, "val_loss": 75384.4296875} {"train_loss": -6.197948932647705, "global_step": 91518, "epoch": 2179} {"train_loss": -6.312758445739746, "global_step": 91519, "epoch": 2179} {"train_loss": -6.234362602233887, "global_step": 91520, "epoch": 2179} {"train_loss": -6.1904096603393555, "global_step": 91521, "epoch": 2179} {"train_loss": -6.384957313537598, "global_step": 91522, "epoch": 2179} {"train_loss": -6.282198429107666, "global_step": 91523, "epoch": 2179} {"train_loss": -6.144750118255615, "global_step": 91524, "epoch": 2179} {"train_loss": -6.3983283042907715, "global_step": 91525, "epoch": 2179} {"train_loss": -6.375179767608643, "global_step": 91526, "epoch": 2179} {"train_loss": -6.214831829071045, "global_step": 91527, "epoch": 2179} {"train_loss": -6.209397792816162, "global_step": 91528, "epoch": 2179} {"train_loss": -6.307921409606934, "global_step": 91529, "epoch": 2179} {"train_loss": -6.286068916320801, "global_step": 91530, "epoch": 2179} {"train_loss": -6.404892921447754, "global_step": 91531, "epoch": 2179} {"train_loss": -6.299464225769043, "global_step": 91532, "epoch": 2179} {"train_loss": -6.350874423980713, "global_step": 91533, "epoch": 2179} {"train_loss": -6.310681343078613, "global_step": 91534, "epoch": 2179} {"train_loss": -6.245254039764404, "global_step": 91535, "epoch": 2179} {"train_loss": -6.174376487731934, "global_step": 91536, "epoch": 2179} {"train_loss": -6.289597988128662, "global_step": 91537, "epoch": 2179} {"train_loss": -6.331680774688721, "global_step": 91538, "epoch": 2179} {"train_loss": -6.239874839782715, "global_step": 91539, "epoch": 2179} {"train_loss": -6.185147285461426, "global_step": 91540, "epoch": 2179} {"train_loss": -6.310924530029297, "global_step": 91541, "epoch": 2179} {"train_loss": -6.351131439208984, "global_step": 91542, "epoch": 2179} {"train_loss": -6.329654693603516, "global_step": 91543, "epoch": 2179} {"train_loss": -6.239713668823242, "global_step": 91544, "epoch": 2179} {"train_loss": -6.207452774047852, "global_step": 91545, "epoch": 2179} {"train_loss": -6.19024658203125, "global_step": 91546, "epoch": 2179} {"train_loss": -6.386229515075684, "global_step": 91547, "epoch": 2179} {"train_loss": -6.276329040527344, "global_step": 91548, "epoch": 2179} {"train_loss": -6.257402420043945, "global_step": 91549, "epoch": 2179} {"train_loss": -6.335597991943359, "global_step": 91550, "epoch": 2179} {"train_loss": -6.216635704040527, "global_step": 91551, "epoch": 2179} {"train_loss": -6.119325160980225, "global_step": 91552, "epoch": 2179} {"train_loss": -6.292645454406738, "global_step": 91553, "epoch": 2179} {"train_loss": -6.248011112213135, "global_step": 91554, "epoch": 2179} {"train_loss": -6.229825973510742, "global_step": 91555, "epoch": 2179} {"train_loss": -6.378907203674316, "global_step": 91556, "epoch": 2179} {"train_loss": -6.27191162109375, "global_step": 91557, "epoch": 2179} {"train_loss": -6.304442405700684, "global_step": 91558, "epoch": 2179} {"train_loss": -6.276327224004836, "global_step": 91559, "epoch": 2179, "val_loss": 75411.3515625} {"train_loss": -6.258298873901367, "global_step": 91560, "epoch": 2180} {"train_loss": -6.293839454650879, "global_step": 91561, "epoch": 2180} {"train_loss": -6.1627397537231445, "global_step": 91562, "epoch": 2180} {"train_loss": -6.224239826202393, "global_step": 91563, "epoch": 2180} {"train_loss": -6.207145690917969, "global_step": 91564, "epoch": 2180} {"train_loss": -6.304213523864746, "global_step": 91565, "epoch": 2180} {"train_loss": -6.289191246032715, "global_step": 91566, "epoch": 2180} {"train_loss": -6.186634063720703, "global_step": 91567, "epoch": 2180} {"train_loss": -6.363530158996582, "global_step": 91568, "epoch": 2180} {"train_loss": -6.263615131378174, "global_step": 91569, "epoch": 2180} {"train_loss": -6.270259857177734, "global_step": 91570, "epoch": 2180} {"train_loss": -6.225057601928711, "global_step": 91571, "epoch": 2180} {"train_loss": -6.236094951629639, "global_step": 91572, "epoch": 2180} {"train_loss": -6.1663103103637695, "global_step": 91573, "epoch": 2180} {"train_loss": -6.243091583251953, "global_step": 91574, "epoch": 2180} {"train_loss": -6.236579418182373, "global_step": 91575, "epoch": 2180} {"train_loss": -6.291032791137695, "global_step": 91576, "epoch": 2180} {"train_loss": -6.358838081359863, "global_step": 91577, "epoch": 2180} {"train_loss": -6.2725982666015625, "global_step": 91578, "epoch": 2180} {"train_loss": -6.281661033630371, "global_step": 91579, "epoch": 2180} {"train_loss": -6.292826175689697, "global_step": 91580, "epoch": 2180} {"train_loss": -6.228043556213379, "global_step": 91581, "epoch": 2180} {"train_loss": -6.14968204498291, "global_step": 91582, "epoch": 2180} {"train_loss": -6.278727054595947, "global_step": 91583, "epoch": 2180} {"train_loss": -6.231066703796387, "global_step": 91584, "epoch": 2180} {"train_loss": -6.292430877685547, "global_step": 91585, "epoch": 2180} {"train_loss": -6.3376994132995605, "global_step": 91586, "epoch": 2180} {"train_loss": -6.242651462554932, "global_step": 91587, "epoch": 2180} {"train_loss": -6.109995365142822, "global_step": 91588, "epoch": 2180} {"train_loss": -6.294973373413086, "global_step": 91589, "epoch": 2180} {"train_loss": -6.245736598968506, "global_step": 91590, "epoch": 2180} {"train_loss": -6.259689807891846, "global_step": 91591, "epoch": 2180} {"train_loss": -6.293148040771484, "global_step": 91592, "epoch": 2180} {"train_loss": -6.411118507385254, "global_step": 91593, "epoch": 2180} {"train_loss": -6.273698806762695, "global_step": 91594, "epoch": 2180} {"train_loss": -6.253944396972656, "global_step": 91595, "epoch": 2180} {"train_loss": -6.23549222946167, "global_step": 91596, "epoch": 2180} {"train_loss": -6.286409854888916, "global_step": 91597, "epoch": 2180} {"train_loss": -6.211690902709961, "global_step": 91598, "epoch": 2180} {"train_loss": -6.2865705490112305, "global_step": 91599, "epoch": 2180} {"train_loss": -6.2246904373168945, "global_step": 91600, "epoch": 2180} {"train_loss": -6.258814414342244, "global_step": 91601, "epoch": 2180, "val_loss": 75158.6484375} {"train_loss": -6.300709247589111, "global_step": 91602, "epoch": 2181} {"train_loss": -6.3139238357543945, "global_step": 91603, "epoch": 2181} {"train_loss": -6.280528545379639, "global_step": 91604, "epoch": 2181} {"train_loss": -6.282023906707764, "global_step": 91605, "epoch": 2181} {"train_loss": -6.234565258026123, "global_step": 91606, "epoch": 2181} {"train_loss": -6.233597278594971, "global_step": 91607, "epoch": 2181} {"train_loss": -6.113290309906006, "global_step": 91608, "epoch": 2181} {"train_loss": -6.293355464935303, "global_step": 91609, "epoch": 2181} {"train_loss": -6.232256889343262, "global_step": 91610, "epoch": 2181} {"train_loss": -6.314984321594238, "global_step": 91611, "epoch": 2181} {"train_loss": -6.376847267150879, "global_step": 91612, "epoch": 2181} {"train_loss": -6.270936012268066, "global_step": 91613, "epoch": 2181} {"train_loss": -6.265132904052734, "global_step": 91614, "epoch": 2181} {"train_loss": -6.300793170928955, "global_step": 91615, "epoch": 2181} {"train_loss": -6.34568977355957, "global_step": 91616, "epoch": 2181} {"train_loss": -6.134744644165039, "global_step": 91617, "epoch": 2181} {"train_loss": -6.245972156524658, "global_step": 91618, "epoch": 2181} {"train_loss": -6.222651481628418, "global_step": 91619, "epoch": 2181} {"train_loss": -6.184844970703125, "global_step": 91620, "epoch": 2181} {"train_loss": -6.228920936584473, "global_step": 91621, "epoch": 2181} {"train_loss": -6.180380821228027, "global_step": 91622, "epoch": 2181} {"train_loss": -6.407155513763428, "global_step": 91623, "epoch": 2181} {"train_loss": -6.304703712463379, "global_step": 91624, "epoch": 2181} {"train_loss": -6.183282852172852, "global_step": 91625, "epoch": 2181} {"train_loss": -6.266072750091553, "global_step": 91626, "epoch": 2181} {"train_loss": -6.194982051849365, "global_step": 91627, "epoch": 2181} {"train_loss": -6.199603080749512, "global_step": 91628, "epoch": 2181} {"train_loss": -6.283012390136719, "global_step": 91629, "epoch": 2181} {"train_loss": -6.0674567222595215, "global_step": 91630, "epoch": 2181} {"train_loss": -6.140789031982422, "global_step": 91631, "epoch": 2181} {"train_loss": -6.132473468780518, "global_step": 91632, "epoch": 2181} {"train_loss": -6.183960437774658, "global_step": 91633, "epoch": 2181} {"train_loss": -6.295311450958252, "global_step": 91634, "epoch": 2181} {"train_loss": -6.223089694976807, "global_step": 91635, "epoch": 2181} {"train_loss": -6.287715911865234, "global_step": 91636, "epoch": 2181} {"train_loss": -6.223198890686035, "global_step": 91637, "epoch": 2181} {"train_loss": -6.340790748596191, "global_step": 91638, "epoch": 2181} {"train_loss": -6.17495059967041, "global_step": 91639, "epoch": 2181} {"train_loss": -6.166957855224609, "global_step": 91640, "epoch": 2181} {"train_loss": -6.247808456420898, "global_step": 91641, "epoch": 2181} {"train_loss": -6.23388671875, "global_step": 91642, "epoch": 2181} {"train_loss": -6.243983155205136, "global_step": 91643, "epoch": 2181, "val_loss": 75210.375} {"train_loss": -6.150988578796387, "global_step": 91644, "epoch": 2182} {"train_loss": -6.27675724029541, "global_step": 91645, "epoch": 2182} {"train_loss": -6.286062240600586, "global_step": 91646, "epoch": 2182} {"train_loss": -6.327770709991455, "global_step": 91647, "epoch": 2182} {"train_loss": -6.344874858856201, "global_step": 91648, "epoch": 2182} {"train_loss": -6.186050891876221, "global_step": 91649, "epoch": 2182} {"train_loss": -6.293972969055176, "global_step": 91650, "epoch": 2182} {"train_loss": -6.214888095855713, "global_step": 91651, "epoch": 2182} {"train_loss": -6.423033237457275, "global_step": 91652, "epoch": 2182} {"train_loss": -6.365839958190918, "global_step": 91653, "epoch": 2182} {"train_loss": -6.273500919342041, "global_step": 91654, "epoch": 2182} {"train_loss": -6.266423225402832, "global_step": 91655, "epoch": 2182} {"train_loss": -6.141199111938477, "global_step": 91656, "epoch": 2182} {"train_loss": -6.232105255126953, "global_step": 91657, "epoch": 2182} {"train_loss": -6.155943393707275, "global_step": 91658, "epoch": 2182} {"train_loss": -6.191352367401123, "global_step": 91659, "epoch": 2182} {"train_loss": -6.29012393951416, "global_step": 91660, "epoch": 2182} {"train_loss": -6.355669021606445, "global_step": 91661, "epoch": 2182} {"train_loss": -6.266668319702148, "global_step": 91662, "epoch": 2182} {"train_loss": -6.351296424865723, "global_step": 91663, "epoch": 2182} {"train_loss": -6.255576133728027, "global_step": 91664, "epoch": 2182} {"train_loss": -6.189282417297363, "global_step": 91665, "epoch": 2182} {"train_loss": -6.199358940124512, "global_step": 91666, "epoch": 2182} {"train_loss": -6.27685546875, "global_step": 91667, "epoch": 2182} {"train_loss": -6.21420955657959, "global_step": 91668, "epoch": 2182} {"train_loss": -6.165881633758545, "global_step": 91669, "epoch": 2182} {"train_loss": -6.334672927856445, "global_step": 91670, "epoch": 2182} {"train_loss": -6.254206657409668, "global_step": 91671, "epoch": 2182} {"train_loss": -6.32271671295166, "global_step": 91672, "epoch": 2182} {"train_loss": -6.258330821990967, "global_step": 91673, "epoch": 2182} {"train_loss": -6.373908042907715, "global_step": 91674, "epoch": 2182} {"train_loss": -6.113127708435059, "global_step": 91675, "epoch": 2182} {"train_loss": -6.284448146820068, "global_step": 91676, "epoch": 2182} {"train_loss": -6.209810256958008, "global_step": 91677, "epoch": 2182} {"train_loss": -6.290832042694092, "global_step": 91678, "epoch": 2182} {"train_loss": -6.307352542877197, "global_step": 91679, "epoch": 2182} {"train_loss": -6.286263942718506, "global_step": 91680, "epoch": 2182} {"train_loss": -6.237826347351074, "global_step": 91681, "epoch": 2182} {"train_loss": -6.173798084259033, "global_step": 91682, "epoch": 2182} {"train_loss": -6.304865837097168, "global_step": 91683, "epoch": 2182} {"train_loss": -6.2156572341918945, "global_step": 91684, "epoch": 2182} {"train_loss": -6.261024236679077, "global_step": 91685, "epoch": 2182, "val_loss": 75544.265625} {"train_loss": -6.238173961639404, "global_step": 91686, "epoch": 2183} {"train_loss": -6.206478118896484, "global_step": 91687, "epoch": 2183} {"train_loss": -6.265630722045898, "global_step": 91688, "epoch": 2183} {"train_loss": -6.247322082519531, "global_step": 91689, "epoch": 2183} {"train_loss": -6.3556013107299805, "global_step": 91690, "epoch": 2183} {"train_loss": -6.262434959411621, "global_step": 91691, "epoch": 2183} {"train_loss": -6.407995700836182, "global_step": 91692, "epoch": 2183} {"train_loss": -6.265785217285156, "global_step": 91693, "epoch": 2183} {"train_loss": -6.372740268707275, "global_step": 91694, "epoch": 2183} {"train_loss": -6.387028694152832, "global_step": 91695, "epoch": 2183} {"train_loss": -6.293517112731934, "global_step": 91696, "epoch": 2183} {"train_loss": -6.344867706298828, "global_step": 91697, "epoch": 2183} {"train_loss": -6.328858375549316, "global_step": 91698, "epoch": 2183} {"train_loss": -6.367776870727539, "global_step": 91699, "epoch": 2183} {"train_loss": -6.199126720428467, "global_step": 91700, "epoch": 2183} {"train_loss": -6.264603614807129, "global_step": 91701, "epoch": 2183} {"train_loss": -6.343294143676758, "global_step": 91702, "epoch": 2183} {"train_loss": -6.295494079589844, "global_step": 91703, "epoch": 2183} {"train_loss": -6.281411647796631, "global_step": 91704, "epoch": 2183} {"train_loss": -6.326623439788818, "global_step": 91705, "epoch": 2183} {"train_loss": -6.369663238525391, "global_step": 91706, "epoch": 2183} {"train_loss": -6.229377746582031, "global_step": 91707, "epoch": 2183} {"train_loss": -6.155032157897949, "global_step": 91708, "epoch": 2183} {"train_loss": -6.247718334197998, "global_step": 91709, "epoch": 2183} {"train_loss": -6.362287521362305, "global_step": 91710, "epoch": 2183} {"train_loss": -6.277409553527832, "global_step": 91711, "epoch": 2183} {"train_loss": -6.245972633361816, "global_step": 91712, "epoch": 2183} {"train_loss": -6.3388285636901855, "global_step": 91713, "epoch": 2183} {"train_loss": -6.398481369018555, "global_step": 91714, "epoch": 2183} {"train_loss": -6.251365661621094, "global_step": 91715, "epoch": 2183} {"train_loss": -6.311724662780762, "global_step": 91716, "epoch": 2183} {"train_loss": -6.243738174438477, "global_step": 91717, "epoch": 2183} {"train_loss": -6.262460708618164, "global_step": 91718, "epoch": 2183} {"train_loss": -6.3113203048706055, "global_step": 91719, "epoch": 2183} {"train_loss": -6.261239051818848, "global_step": 91720, "epoch": 2183} {"train_loss": -6.351351737976074, "global_step": 91721, "epoch": 2183} {"train_loss": -6.330765724182129, "global_step": 91722, "epoch": 2183} {"train_loss": -6.232190132141113, "global_step": 91723, "epoch": 2183} {"train_loss": -6.243539810180664, "global_step": 91724, "epoch": 2183} {"train_loss": -6.334317207336426, "global_step": 91725, "epoch": 2183} {"train_loss": -6.240818023681641, "global_step": 91726, "epoch": 2183} {"train_loss": -6.292445784523373, "global_step": 91727, "epoch": 2183, "val_loss": 75319.4375} {"train_loss": -6.3971638679504395, "global_step": 91728, "epoch": 2184} {"train_loss": -6.1983323097229, "global_step": 91729, "epoch": 2184} {"train_loss": -6.269412040710449, "global_step": 91730, "epoch": 2184} {"train_loss": -6.346905708312988, "global_step": 91731, "epoch": 2184} {"train_loss": -6.2605085372924805, "global_step": 91732, "epoch": 2184} {"train_loss": -6.253625869750977, "global_step": 91733, "epoch": 2184} {"train_loss": -6.066715240478516, "global_step": 91734, "epoch": 2184} {"train_loss": -6.292057037353516, "global_step": 91735, "epoch": 2184} {"train_loss": -6.268324851989746, "global_step": 91736, "epoch": 2184} {"train_loss": -6.201773643493652, "global_step": 91737, "epoch": 2184} {"train_loss": -6.283860206604004, "global_step": 91738, "epoch": 2184} {"train_loss": -6.285589218139648, "global_step": 91739, "epoch": 2184} {"train_loss": -6.149349212646484, "global_step": 91740, "epoch": 2184} {"train_loss": -6.300430774688721, "global_step": 91741, "epoch": 2184} {"train_loss": -6.126560211181641, "global_step": 91742, "epoch": 2184} {"train_loss": -6.318937301635742, "global_step": 91743, "epoch": 2184} {"train_loss": -6.15479850769043, "global_step": 91744, "epoch": 2184} {"train_loss": -6.317288398742676, "global_step": 91745, "epoch": 2184} {"train_loss": -6.257615089416504, "global_step": 91746, "epoch": 2184} {"train_loss": -6.110817909240723, "global_step": 91747, "epoch": 2184} {"train_loss": -6.361570358276367, "global_step": 91748, "epoch": 2184} {"train_loss": -6.231406211853027, "global_step": 91749, "epoch": 2184} {"train_loss": -6.141991138458252, "global_step": 91750, "epoch": 2184} {"train_loss": -6.252189636230469, "global_step": 91751, "epoch": 2184} {"train_loss": -6.174178123474121, "global_step": 91752, "epoch": 2184} {"train_loss": -6.2056660652160645, "global_step": 91753, "epoch": 2184} {"train_loss": -6.372230529785156, "global_step": 91754, "epoch": 2184} {"train_loss": -6.267505168914795, "global_step": 91755, "epoch": 2184} {"train_loss": -6.236385345458984, "global_step": 91756, "epoch": 2184} {"train_loss": -6.243730545043945, "global_step": 91757, "epoch": 2184} {"train_loss": -6.245471954345703, "global_step": 91758, "epoch": 2184} {"train_loss": -6.223525047302246, "global_step": 91759, "epoch": 2184} {"train_loss": -6.02626895904541, "global_step": 91760, "epoch": 2184} {"train_loss": -6.252358913421631, "global_step": 91761, "epoch": 2184} {"train_loss": -6.120642185211182, "global_step": 91762, "epoch": 2184} {"train_loss": -6.148365497589111, "global_step": 91763, "epoch": 2184} {"train_loss": -6.1983137130737305, "global_step": 91764, "epoch": 2184} {"train_loss": -6.289737701416016, "global_step": 91765, "epoch": 2184} {"train_loss": -6.274381160736084, "global_step": 91766, "epoch": 2184} {"train_loss": -6.237417221069336, "global_step": 91767, "epoch": 2184} {"train_loss": -6.270096778869629, "global_step": 91768, "epoch": 2184} {"train_loss": -6.233544747034709, "global_step": 91769, "epoch": 2184, "val_loss": 75396.4921875} {"train_loss": -6.3451008796691895, "global_step": 91770, "epoch": 2185} {"train_loss": -6.274008750915527, "global_step": 91771, "epoch": 2185} {"train_loss": -6.270820140838623, "global_step": 91772, "epoch": 2185} {"train_loss": -6.348820209503174, "global_step": 91773, "epoch": 2185} {"train_loss": -6.292933940887451, "global_step": 91774, "epoch": 2185} {"train_loss": -6.244253635406494, "global_step": 91775, "epoch": 2185} {"train_loss": -6.281394004821777, "global_step": 91776, "epoch": 2185} {"train_loss": -6.225564002990723, "global_step": 91777, "epoch": 2185} {"train_loss": -6.196208953857422, "global_step": 91778, "epoch": 2185} {"train_loss": -6.200662612915039, "global_step": 91779, "epoch": 2185} {"train_loss": -6.182790756225586, "global_step": 91780, "epoch": 2185} {"train_loss": -6.205783843994141, "global_step": 91781, "epoch": 2185} {"train_loss": -6.255726337432861, "global_step": 91782, "epoch": 2185} {"train_loss": -6.28695011138916, "global_step": 91783, "epoch": 2185} {"train_loss": -6.222696304321289, "global_step": 91784, "epoch": 2185} {"train_loss": -6.165301322937012, "global_step": 91785, "epoch": 2185} {"train_loss": -6.117432594299316, "global_step": 91786, "epoch": 2185} {"train_loss": -6.173446178436279, "global_step": 91787, "epoch": 2185} {"train_loss": -6.108675003051758, "global_step": 91788, "epoch": 2185} {"train_loss": -6.178081035614014, "global_step": 91789, "epoch": 2185} {"train_loss": -6.268301010131836, "global_step": 91790, "epoch": 2185} {"train_loss": -6.060929298400879, "global_step": 91791, "epoch": 2185} {"train_loss": -6.1273722648620605, "global_step": 91792, "epoch": 2185} {"train_loss": -6.020449638366699, "global_step": 91793, "epoch": 2185} {"train_loss": -6.138431549072266, "global_step": 91794, "epoch": 2185} {"train_loss": -6.097503662109375, "global_step": 91795, "epoch": 2185} {"train_loss": -6.048064708709717, "global_step": 91796, "epoch": 2185} {"train_loss": -6.192047119140625, "global_step": 91797, "epoch": 2185} {"train_loss": -6.17678165435791, "global_step": 91798, "epoch": 2185} {"train_loss": -6.105314254760742, "global_step": 91799, "epoch": 2185} {"train_loss": -6.202308654785156, "global_step": 91800, "epoch": 2185} {"train_loss": -6.154707908630371, "global_step": 91801, "epoch": 2185} {"train_loss": -6.211509704589844, "global_step": 91802, "epoch": 2185} {"train_loss": -6.2438249588012695, "global_step": 91803, "epoch": 2185} {"train_loss": -6.237253189086914, "global_step": 91804, "epoch": 2185} {"train_loss": -6.242565631866455, "global_step": 91805, "epoch": 2185} {"train_loss": -6.251502990722656, "global_step": 91806, "epoch": 2185} {"train_loss": -6.337507247924805, "global_step": 91807, "epoch": 2185} {"train_loss": -6.141210556030273, "global_step": 91808, "epoch": 2185} {"train_loss": -6.354006767272949, "global_step": 91809, "epoch": 2185} {"train_loss": -6.203143119812012, "global_step": 91810, "epoch": 2185} {"train_loss": -6.205020075752621, "global_step": 91811, "epoch": 2185, "val_loss": 75409.21875} {"train_loss": -6.281439304351807, "global_step": 91812, "epoch": 2186} {"train_loss": -6.2352094650268555, "global_step": 91813, "epoch": 2186} {"train_loss": -6.19081974029541, "global_step": 91814, "epoch": 2186} {"train_loss": -6.328437805175781, "global_step": 91815, "epoch": 2186} {"train_loss": -6.299571514129639, "global_step": 91816, "epoch": 2186} {"train_loss": -6.340566635131836, "global_step": 91817, "epoch": 2186} {"train_loss": -6.341824531555176, "global_step": 91818, "epoch": 2186} {"train_loss": -6.316831588745117, "global_step": 91819, "epoch": 2186} {"train_loss": -6.335699081420898, "global_step": 91820, "epoch": 2186} {"train_loss": -6.274082183837891, "global_step": 91821, "epoch": 2186} {"train_loss": -6.331259727478027, "global_step": 91822, "epoch": 2186} {"train_loss": -6.27924108505249, "global_step": 91823, "epoch": 2186} {"train_loss": -6.247591495513916, "global_step": 91824, "epoch": 2186} {"train_loss": -6.269595146179199, "global_step": 91825, "epoch": 2186} {"train_loss": -6.2776031494140625, "global_step": 91826, "epoch": 2186} {"train_loss": -6.2486467361450195, "global_step": 91827, "epoch": 2186} {"train_loss": -6.173950672149658, "global_step": 91828, "epoch": 2186} {"train_loss": -6.36967658996582, "global_step": 91829, "epoch": 2186} {"train_loss": -6.203198432922363, "global_step": 91830, "epoch": 2186} {"train_loss": -6.176530361175537, "global_step": 91831, "epoch": 2186} {"train_loss": -6.3014984130859375, "global_step": 91832, "epoch": 2186} {"train_loss": -6.2015910148620605, "global_step": 91833, "epoch": 2186} {"train_loss": -6.197072982788086, "global_step": 91834, "epoch": 2186} {"train_loss": -6.312417984008789, "global_step": 91835, "epoch": 2186} {"train_loss": -6.244058609008789, "global_step": 91836, "epoch": 2186} {"train_loss": -6.275843143463135, "global_step": 91837, "epoch": 2186} {"train_loss": -6.180413246154785, "global_step": 91838, "epoch": 2186} {"train_loss": -6.314334869384766, "global_step": 91839, "epoch": 2186} {"train_loss": -6.267852783203125, "global_step": 91840, "epoch": 2186} {"train_loss": -6.16880464553833, "global_step": 91841, "epoch": 2186} {"train_loss": -6.251815319061279, "global_step": 91842, "epoch": 2186} {"train_loss": -6.169777870178223, "global_step": 91843, "epoch": 2186} {"train_loss": -6.347783088684082, "global_step": 91844, "epoch": 2186} {"train_loss": -6.309322834014893, "global_step": 91845, "epoch": 2186} {"train_loss": -6.289172172546387, "global_step": 91846, "epoch": 2186} {"train_loss": -6.247627258300781, "global_step": 91847, "epoch": 2186} {"train_loss": -6.336812973022461, "global_step": 91848, "epoch": 2186} {"train_loss": -6.168366432189941, "global_step": 91849, "epoch": 2186} {"train_loss": -6.269228935241699, "global_step": 91850, "epoch": 2186} {"train_loss": -6.261912822723389, "global_step": 91851, "epoch": 2186} {"train_loss": -6.134088516235352, "global_step": 91852, "epoch": 2186} {"train_loss": -6.265064421154204, "global_step": 91853, "epoch": 2186, "val_loss": 75463.8203125} {"train_loss": -6.256823539733887, "global_step": 91854, "epoch": 2187} {"train_loss": -6.223021030426025, "global_step": 91855, "epoch": 2187} {"train_loss": -6.2408366203308105, "global_step": 91856, "epoch": 2187} {"train_loss": -6.188497066497803, "global_step": 91857, "epoch": 2187} {"train_loss": -6.278255462646484, "global_step": 91858, "epoch": 2187} {"train_loss": -6.155705451965332, "global_step": 91859, "epoch": 2187} {"train_loss": -6.195591926574707, "global_step": 91860, "epoch": 2187} {"train_loss": -6.310691833496094, "global_step": 91861, "epoch": 2187} {"train_loss": -6.130557537078857, "global_step": 91862, "epoch": 2187} {"train_loss": -6.151262283325195, "global_step": 91863, "epoch": 2187} {"train_loss": -6.249927520751953, "global_step": 91864, "epoch": 2187} {"train_loss": -6.195887565612793, "global_step": 91865, "epoch": 2187} {"train_loss": -6.252381324768066, "global_step": 91866, "epoch": 2187} {"train_loss": -6.299183368682861, "global_step": 91867, "epoch": 2187} {"train_loss": -6.257767677307129, "global_step": 91868, "epoch": 2187} {"train_loss": -6.33115816116333, "global_step": 91869, "epoch": 2187} {"train_loss": -6.135584354400635, "global_step": 91870, "epoch": 2187} {"train_loss": -6.244527816772461, "global_step": 91871, "epoch": 2187} {"train_loss": -6.351676940917969, "global_step": 91872, "epoch": 2187} {"train_loss": -6.372282981872559, "global_step": 91873, "epoch": 2187} {"train_loss": -6.376444339752197, "global_step": 91874, "epoch": 2187} {"train_loss": -6.226972579956055, "global_step": 91875, "epoch": 2187} {"train_loss": -6.224847316741943, "global_step": 91876, "epoch": 2187} {"train_loss": -6.176910400390625, "global_step": 91877, "epoch": 2187} {"train_loss": -6.327986717224121, "global_step": 91878, "epoch": 2187} {"train_loss": -6.287919998168945, "global_step": 91879, "epoch": 2187} {"train_loss": -6.225925445556641, "global_step": 91880, "epoch": 2187} {"train_loss": -6.262340545654297, "global_step": 91881, "epoch": 2187} {"train_loss": -6.28489351272583, "global_step": 91882, "epoch": 2187} {"train_loss": -6.275346279144287, "global_step": 91883, "epoch": 2187} {"train_loss": -6.049098491668701, "global_step": 91884, "epoch": 2187} {"train_loss": -6.213809967041016, "global_step": 91885, "epoch": 2187} {"train_loss": -6.2777419090271, "global_step": 91886, "epoch": 2187} {"train_loss": -6.261061668395996, "global_step": 91887, "epoch": 2187} {"train_loss": -6.298539161682129, "global_step": 91888, "epoch": 2187} {"train_loss": -6.04558801651001, "global_step": 91889, "epoch": 2187} {"train_loss": -6.261062145233154, "global_step": 91890, "epoch": 2187} {"train_loss": -6.212600231170654, "global_step": 91891, "epoch": 2187} {"train_loss": -6.203082084655762, "global_step": 91892, "epoch": 2187} {"train_loss": -6.199635028839111, "global_step": 91893, "epoch": 2187} {"train_loss": -6.320310115814209, "global_step": 91894, "epoch": 2187} {"train_loss": -6.240423509052822, "global_step": 91895, "epoch": 2187, "val_loss": 75322.2734375} {"train_loss": -6.2677459716796875, "global_step": 91896, "epoch": 2188} {"train_loss": -6.233536243438721, "global_step": 91897, "epoch": 2188} {"train_loss": -6.221042633056641, "global_step": 91898, "epoch": 2188} {"train_loss": -6.283020973205566, "global_step": 91899, "epoch": 2188} {"train_loss": -6.260810852050781, "global_step": 91900, "epoch": 2188} {"train_loss": -6.283606052398682, "global_step": 91901, "epoch": 2188} {"train_loss": -6.283140182495117, "global_step": 91902, "epoch": 2188} {"train_loss": -6.292873382568359, "global_step": 91903, "epoch": 2188} {"train_loss": -6.329980850219727, "global_step": 91904, "epoch": 2188} {"train_loss": -6.404058933258057, "global_step": 91905, "epoch": 2188} {"train_loss": -6.225071907043457, "global_step": 91906, "epoch": 2188} {"train_loss": -6.2182769775390625, "global_step": 91907, "epoch": 2188} {"train_loss": -6.164970874786377, "global_step": 91908, "epoch": 2188} {"train_loss": -6.302557945251465, "global_step": 91909, "epoch": 2188} {"train_loss": -6.139542579650879, "global_step": 91910, "epoch": 2188} {"train_loss": -6.290847301483154, "global_step": 91911, "epoch": 2188} {"train_loss": -6.310970306396484, "global_step": 91912, "epoch": 2188} {"train_loss": -6.2072319984436035, "global_step": 91913, "epoch": 2188} {"train_loss": -6.427772521972656, "global_step": 91914, "epoch": 2188} {"train_loss": -6.313354015350342, "global_step": 91915, "epoch": 2188} {"train_loss": -6.318563461303711, "global_step": 91916, "epoch": 2188} {"train_loss": -6.313266754150391, "global_step": 91917, "epoch": 2188} {"train_loss": -6.209024906158447, "global_step": 91918, "epoch": 2188} {"train_loss": -6.347607612609863, "global_step": 91919, "epoch": 2188} {"train_loss": -6.209900856018066, "global_step": 91920, "epoch": 2188} {"train_loss": -6.263769626617432, "global_step": 91921, "epoch": 2188} {"train_loss": -6.356544494628906, "global_step": 91922, "epoch": 2188} {"train_loss": -6.2714033126831055, "global_step": 91923, "epoch": 2188} {"train_loss": -6.172548294067383, "global_step": 91924, "epoch": 2188} {"train_loss": -6.300137042999268, "global_step": 91925, "epoch": 2188} {"train_loss": -6.317516326904297, "global_step": 91926, "epoch": 2188} {"train_loss": -6.299467086791992, "global_step": 91927, "epoch": 2188} {"train_loss": -6.24969482421875, "global_step": 91928, "epoch": 2188} {"train_loss": -6.292845726013184, "global_step": 91929, "epoch": 2188} {"train_loss": -6.299029350280762, "global_step": 91930, "epoch": 2188} {"train_loss": -6.328153133392334, "global_step": 91931, "epoch": 2188} {"train_loss": -6.225836753845215, "global_step": 91932, "epoch": 2188} {"train_loss": -6.352858543395996, "global_step": 91933, "epoch": 2188} {"train_loss": -6.343150615692139, "global_step": 91934, "epoch": 2188} {"train_loss": -6.184514045715332, "global_step": 91935, "epoch": 2188} {"train_loss": -6.2623467445373535, "global_step": 91936, "epoch": 2188} {"train_loss": -6.27871831258138, "global_step": 91937, "epoch": 2188, "val_loss": 75448.03125} {"train_loss": -6.3882951736450195, "global_step": 91938, "epoch": 2189} {"train_loss": -6.405055522918701, "global_step": 91939, "epoch": 2189} {"train_loss": -6.273241996765137, "global_step": 91940, "epoch": 2189} {"train_loss": -6.428646087646484, "global_step": 91941, "epoch": 2189} {"train_loss": -6.188945293426514, "global_step": 91942, "epoch": 2189} {"train_loss": -6.346088409423828, "global_step": 91943, "epoch": 2189} {"train_loss": -6.243104934692383, "global_step": 91944, "epoch": 2189} {"train_loss": -6.29404354095459, "global_step": 91945, "epoch": 2189} {"train_loss": -6.1998701095581055, "global_step": 91946, "epoch": 2189} {"train_loss": -6.31851053237915, "global_step": 91947, "epoch": 2189} {"train_loss": -6.296344757080078, "global_step": 91948, "epoch": 2189} {"train_loss": -6.328366279602051, "global_step": 91949, "epoch": 2189} {"train_loss": -6.4613189697265625, "global_step": 91950, "epoch": 2189} {"train_loss": -6.291090965270996, "global_step": 91951, "epoch": 2189} {"train_loss": -6.348620414733887, "global_step": 91952, "epoch": 2189} {"train_loss": -6.3649001121521, "global_step": 91953, "epoch": 2189} {"train_loss": -6.4288482666015625, "global_step": 91954, "epoch": 2189} {"train_loss": -6.299866676330566, "global_step": 91955, "epoch": 2189} {"train_loss": -6.330014705657959, "global_step": 91956, "epoch": 2189} {"train_loss": -6.282979488372803, "global_step": 91957, "epoch": 2189} {"train_loss": -6.244050025939941, "global_step": 91958, "epoch": 2189} {"train_loss": -6.286841869354248, "global_step": 91959, "epoch": 2189} {"train_loss": -6.305644989013672, "global_step": 91960, "epoch": 2189} {"train_loss": -6.243037223815918, "global_step": 91961, "epoch": 2189} {"train_loss": -6.336507320404053, "global_step": 91962, "epoch": 2189} {"train_loss": -6.317551612854004, "global_step": 91963, "epoch": 2189} {"train_loss": -6.325183391571045, "global_step": 91964, "epoch": 2189} {"train_loss": -6.316287994384766, "global_step": 91965, "epoch": 2189} {"train_loss": -6.337075710296631, "global_step": 91966, "epoch": 2189} {"train_loss": -6.427643775939941, "global_step": 91967, "epoch": 2189} {"train_loss": -6.319739818572998, "global_step": 91968, "epoch": 2189} {"train_loss": -6.262713432312012, "global_step": 91969, "epoch": 2189} {"train_loss": -6.191666603088379, "global_step": 91970, "epoch": 2189} {"train_loss": -6.200743198394775, "global_step": 91971, "epoch": 2189} {"train_loss": -6.37062406539917, "global_step": 91972, "epoch": 2189} {"train_loss": -6.307236671447754, "global_step": 91973, "epoch": 2189} {"train_loss": -6.369451999664307, "global_step": 91974, "epoch": 2189} {"train_loss": -6.191059589385986, "global_step": 91975, "epoch": 2189} {"train_loss": -6.262876033782959, "global_step": 91976, "epoch": 2189} {"train_loss": -6.395168304443359, "global_step": 91977, "epoch": 2189} {"train_loss": -6.194621562957764, "global_step": 91978, "epoch": 2189} {"train_loss": -6.309122596468244, "global_step": 91979, "epoch": 2189, "val_loss": 75477.953125} {"train_loss": -6.210082054138184, "global_step": 91980, "epoch": 2190} {"train_loss": -6.2651166915893555, "global_step": 91981, "epoch": 2190} {"train_loss": -6.330255508422852, "global_step": 91982, "epoch": 2190} {"train_loss": -6.301305770874023, "global_step": 91983, "epoch": 2190} {"train_loss": -6.2550859451293945, "global_step": 91984, "epoch": 2190} {"train_loss": -6.200170993804932, "global_step": 91985, "epoch": 2190} {"train_loss": -6.3117523193359375, "global_step": 91986, "epoch": 2190} {"train_loss": -6.308441638946533, "global_step": 91987, "epoch": 2190} {"train_loss": -6.194986343383789, "global_step": 91988, "epoch": 2190} {"train_loss": -6.230500221252441, "global_step": 91989, "epoch": 2190} {"train_loss": -6.14164924621582, "global_step": 91990, "epoch": 2190} {"train_loss": -6.241560935974121, "global_step": 91991, "epoch": 2190} {"train_loss": -6.2440338134765625, "global_step": 91992, "epoch": 2190} {"train_loss": -6.3651123046875, "global_step": 91993, "epoch": 2190} {"train_loss": -6.269880294799805, "global_step": 91994, "epoch": 2190} {"train_loss": -6.334281921386719, "global_step": 91995, "epoch": 2190} {"train_loss": -6.346715927124023, "global_step": 91996, "epoch": 2190} {"train_loss": -6.239209175109863, "global_step": 91997, "epoch": 2190} {"train_loss": -6.290849208831787, "global_step": 91998, "epoch": 2190} {"train_loss": -6.229578495025635, "global_step": 91999, "epoch": 2190} {"train_loss": -6.160361289978027, "global_step": 92000, "epoch": 2190} {"train_loss": -6.158857345581055, "global_step": 92001, "epoch": 2190} {"train_loss": -6.256610870361328, "global_step": 92002, "epoch": 2190} {"train_loss": -6.256964206695557, "global_step": 92003, "epoch": 2190} {"train_loss": -6.023716926574707, "global_step": 92004, "epoch": 2190} {"train_loss": -6.23842716217041, "global_step": 92005, "epoch": 2190} {"train_loss": -6.167369842529297, "global_step": 92006, "epoch": 2190} {"train_loss": -6.173999786376953, "global_step": 92007, "epoch": 2190} {"train_loss": -6.173017501831055, "global_step": 92008, "epoch": 2190} {"train_loss": -6.173943519592285, "global_step": 92009, "epoch": 2190} {"train_loss": -6.229086875915527, "global_step": 92010, "epoch": 2190} {"train_loss": -6.271358966827393, "global_step": 92011, "epoch": 2190} {"train_loss": -6.271860122680664, "global_step": 92012, "epoch": 2190} {"train_loss": -6.279305458068848, "global_step": 92013, "epoch": 2190} {"train_loss": -6.202398777008057, "global_step": 92014, "epoch": 2190} {"train_loss": -6.318410873413086, "global_step": 92015, "epoch": 2190} {"train_loss": -6.204991340637207, "global_step": 92016, "epoch": 2190} {"train_loss": -6.210156440734863, "global_step": 92017, "epoch": 2190} {"train_loss": -6.2503862380981445, "global_step": 92018, "epoch": 2190} {"train_loss": -6.456049919128418, "global_step": 92019, "epoch": 2190} {"train_loss": -6.206023693084717, "global_step": 92020, "epoch": 2190} {"train_loss": -6.2448736145382835, "global_step": 92021, "epoch": 2190, "val_loss": 75290.890625} {"train_loss": -6.350677013397217, "global_step": 92022, "epoch": 2191} {"train_loss": -6.28283166885376, "global_step": 92023, "epoch": 2191} {"train_loss": -6.309815406799316, "global_step": 92024, "epoch": 2191} {"train_loss": -6.251386642456055, "global_step": 92025, "epoch": 2191} {"train_loss": -6.201800346374512, "global_step": 92026, "epoch": 2191} {"train_loss": -6.368343353271484, "global_step": 92027, "epoch": 2191} {"train_loss": -6.199946403503418, "global_step": 92028, "epoch": 2191} {"train_loss": -6.4342193603515625, "global_step": 92029, "epoch": 2191} {"train_loss": -6.294434547424316, "global_step": 92030, "epoch": 2191} {"train_loss": -6.253363609313965, "global_step": 92031, "epoch": 2191} {"train_loss": -6.18248176574707, "global_step": 92032, "epoch": 2191} {"train_loss": -6.239604949951172, "global_step": 92033, "epoch": 2191} {"train_loss": -6.279081344604492, "global_step": 92034, "epoch": 2191} {"train_loss": -6.09603214263916, "global_step": 92035, "epoch": 2191} {"train_loss": -6.233546257019043, "global_step": 92036, "epoch": 2191} {"train_loss": -6.19820499420166, "global_step": 92037, "epoch": 2191} {"train_loss": -6.239073276519775, "global_step": 92038, "epoch": 2191} {"train_loss": -6.238246917724609, "global_step": 92039, "epoch": 2191} {"train_loss": -6.151273727416992, "global_step": 92040, "epoch": 2191} {"train_loss": -6.168651580810547, "global_step": 92041, "epoch": 2191} {"train_loss": -6.2293806076049805, "global_step": 92042, "epoch": 2191} {"train_loss": -6.3711018562316895, "global_step": 92043, "epoch": 2191} {"train_loss": -6.194011688232422, "global_step": 92044, "epoch": 2191} {"train_loss": -6.194565773010254, "global_step": 92045, "epoch": 2191} {"train_loss": -6.193876266479492, "global_step": 92046, "epoch": 2191} {"train_loss": -6.344782829284668, "global_step": 92047, "epoch": 2191} {"train_loss": -6.256349563598633, "global_step": 92048, "epoch": 2191} {"train_loss": -6.172712802886963, "global_step": 92049, "epoch": 2191} {"train_loss": -6.2242231369018555, "global_step": 92050, "epoch": 2191} {"train_loss": -6.252912521362305, "global_step": 92051, "epoch": 2191} {"train_loss": -6.1430344581604, "global_step": 92052, "epoch": 2191} {"train_loss": -6.30958366394043, "global_step": 92053, "epoch": 2191} {"train_loss": -6.3137898445129395, "global_step": 92054, "epoch": 2191} {"train_loss": -6.222658634185791, "global_step": 92055, "epoch": 2191} {"train_loss": -6.231800079345703, "global_step": 92056, "epoch": 2191} {"train_loss": -6.242744445800781, "global_step": 92057, "epoch": 2191} {"train_loss": -6.305891990661621, "global_step": 92058, "epoch": 2191} {"train_loss": -6.300820827484131, "global_step": 92059, "epoch": 2191} {"train_loss": -6.222052097320557, "global_step": 92060, "epoch": 2191} {"train_loss": -6.1931915283203125, "global_step": 92061, "epoch": 2191} {"train_loss": -6.304905891418457, "global_step": 92062, "epoch": 2191} {"train_loss": -6.252797694433303, "global_step": 92063, "epoch": 2191, "val_loss": 75391.8515625} {"train_loss": -6.354803085327148, "global_step": 92064, "epoch": 2192} {"train_loss": -6.318055152893066, "global_step": 92065, "epoch": 2192} {"train_loss": -6.362744331359863, "global_step": 92066, "epoch": 2192} {"train_loss": -6.343524932861328, "global_step": 92067, "epoch": 2192} {"train_loss": -6.1900529861450195, "global_step": 92068, "epoch": 2192} {"train_loss": -6.253190994262695, "global_step": 92069, "epoch": 2192} {"train_loss": -6.203539848327637, "global_step": 92070, "epoch": 2192} {"train_loss": -6.331843376159668, "global_step": 92071, "epoch": 2192} {"train_loss": -6.312221527099609, "global_step": 92072, "epoch": 2192} {"train_loss": -6.30621337890625, "global_step": 92073, "epoch": 2192} {"train_loss": -6.303433895111084, "global_step": 92074, "epoch": 2192} {"train_loss": -6.208081245422363, "global_step": 92075, "epoch": 2192} {"train_loss": -6.284290313720703, "global_step": 92076, "epoch": 2192} {"train_loss": -6.30193567276001, "global_step": 92077, "epoch": 2192} {"train_loss": -6.217837333679199, "global_step": 92078, "epoch": 2192} {"train_loss": -6.236396312713623, "global_step": 92079, "epoch": 2192} {"train_loss": -6.247552871704102, "global_step": 92080, "epoch": 2192} {"train_loss": -6.310202598571777, "global_step": 92081, "epoch": 2192} {"train_loss": -6.305940628051758, "global_step": 92082, "epoch": 2192} {"train_loss": -6.309406280517578, "global_step": 92083, "epoch": 2192} {"train_loss": -6.281253814697266, "global_step": 92084, "epoch": 2192} {"train_loss": -6.210063457489014, "global_step": 92085, "epoch": 2192} {"train_loss": -6.218827247619629, "global_step": 92086, "epoch": 2192} {"train_loss": -6.208235740661621, "global_step": 92087, "epoch": 2192} {"train_loss": -6.284551620483398, "global_step": 92088, "epoch": 2192} {"train_loss": -6.2483696937561035, "global_step": 92089, "epoch": 2192} {"train_loss": -6.37217378616333, "global_step": 92090, "epoch": 2192} {"train_loss": -6.2989397048950195, "global_step": 92091, "epoch": 2192} {"train_loss": -6.218348503112793, "global_step": 92092, "epoch": 2192} {"train_loss": -6.271555423736572, "global_step": 92093, "epoch": 2192} {"train_loss": -6.198406219482422, "global_step": 92094, "epoch": 2192} {"train_loss": -6.308703899383545, "global_step": 92095, "epoch": 2192} {"train_loss": -6.170519828796387, "global_step": 92096, "epoch": 2192} {"train_loss": -6.044824123382568, "global_step": 92097, "epoch": 2192} {"train_loss": -6.255207061767578, "global_step": 92098, "epoch": 2192} {"train_loss": -6.244568824768066, "global_step": 92099, "epoch": 2192} {"train_loss": -6.286805152893066, "global_step": 92100, "epoch": 2192} {"train_loss": -6.221588134765625, "global_step": 92101, "epoch": 2192} {"train_loss": -6.173347473144531, "global_step": 92102, "epoch": 2192} {"train_loss": -6.219786643981934, "global_step": 92103, "epoch": 2192} {"train_loss": -6.107135772705078, "global_step": 92104, "epoch": 2192} {"train_loss": -6.257250002452305, "global_step": 92105, "epoch": 2192, "val_loss": 75624.5234375} {"train_loss": -6.198592185974121, "global_step": 92106, "epoch": 2193} {"train_loss": -6.366290092468262, "global_step": 92107, "epoch": 2193} {"train_loss": -6.259316921234131, "global_step": 92108, "epoch": 2193} {"train_loss": -6.28553581237793, "global_step": 92109, "epoch": 2193} {"train_loss": -6.317482948303223, "global_step": 92110, "epoch": 2193} {"train_loss": -6.222321510314941, "global_step": 92111, "epoch": 2193} {"train_loss": -6.269059181213379, "global_step": 92112, "epoch": 2193} {"train_loss": -6.298649787902832, "global_step": 92113, "epoch": 2193} {"train_loss": -6.255316734313965, "global_step": 92114, "epoch": 2193} {"train_loss": -6.363715648651123, "global_step": 92115, "epoch": 2193} {"train_loss": -6.300981521606445, "global_step": 92116, "epoch": 2193} {"train_loss": -6.181706428527832, "global_step": 92117, "epoch": 2193} {"train_loss": -6.323901653289795, "global_step": 92118, "epoch": 2193} {"train_loss": -6.454183578491211, "global_step": 92119, "epoch": 2193} {"train_loss": -6.191315650939941, "global_step": 92120, "epoch": 2193} {"train_loss": -6.3413286209106445, "global_step": 92121, "epoch": 2193} {"train_loss": -6.208238124847412, "global_step": 92122, "epoch": 2193} {"train_loss": -6.260097503662109, "global_step": 92123, "epoch": 2193} {"train_loss": -6.351128101348877, "global_step": 92124, "epoch": 2193} {"train_loss": -6.291688919067383, "global_step": 92125, "epoch": 2193} {"train_loss": -6.27241325378418, "global_step": 92126, "epoch": 2193} {"train_loss": -6.168769359588623, "global_step": 92127, "epoch": 2193} {"train_loss": -6.209604263305664, "global_step": 92128, "epoch": 2193} {"train_loss": -6.089841365814209, "global_step": 92129, "epoch": 2193} {"train_loss": -6.232158660888672, "global_step": 92130, "epoch": 2193} {"train_loss": -6.267437934875488, "global_step": 92131, "epoch": 2193} {"train_loss": -6.252532482147217, "global_step": 92132, "epoch": 2193} {"train_loss": -6.215313911437988, "global_step": 92133, "epoch": 2193} {"train_loss": -6.118514537811279, "global_step": 92134, "epoch": 2193} {"train_loss": -6.2490081787109375, "global_step": 92135, "epoch": 2193} {"train_loss": -6.263369083404541, "global_step": 92136, "epoch": 2193} {"train_loss": -6.2658185958862305, "global_step": 92137, "epoch": 2193} {"train_loss": -6.3329758644104, "global_step": 92138, "epoch": 2193} {"train_loss": -6.304502964019775, "global_step": 92139, "epoch": 2193} {"train_loss": -6.302595138549805, "global_step": 92140, "epoch": 2193} {"train_loss": -6.262831687927246, "global_step": 92141, "epoch": 2193} {"train_loss": -6.1684746742248535, "global_step": 92142, "epoch": 2193} {"train_loss": -6.278939247131348, "global_step": 92143, "epoch": 2193} {"train_loss": -6.283761978149414, "global_step": 92144, "epoch": 2193} {"train_loss": -6.311821460723877, "global_step": 92145, "epoch": 2193} {"train_loss": -6.206874847412109, "global_step": 92146, "epoch": 2193} {"train_loss": -6.262492827006748, "global_step": 92147, "epoch": 2193, "val_loss": 75436.6875} {"train_loss": -6.15977144241333, "global_step": 92148, "epoch": 2194} {"train_loss": -6.227842330932617, "global_step": 92149, "epoch": 2194} {"train_loss": -6.232566833496094, "global_step": 92150, "epoch": 2194} {"train_loss": -6.321292877197266, "global_step": 92151, "epoch": 2194} {"train_loss": -6.2607221603393555, "global_step": 92152, "epoch": 2194} {"train_loss": -6.33387565612793, "global_step": 92153, "epoch": 2194} {"train_loss": -6.253116607666016, "global_step": 92154, "epoch": 2194} {"train_loss": -6.322447299957275, "global_step": 92155, "epoch": 2194} {"train_loss": -6.192405700683594, "global_step": 92156, "epoch": 2194} {"train_loss": -6.322643280029297, "global_step": 92157, "epoch": 2194} {"train_loss": -6.340363502502441, "global_step": 92158, "epoch": 2194} {"train_loss": -6.1653828620910645, "global_step": 92159, "epoch": 2194} {"train_loss": -6.341670989990234, "global_step": 92160, "epoch": 2194} {"train_loss": -6.191727638244629, "global_step": 92161, "epoch": 2194} {"train_loss": -6.2978315353393555, "global_step": 92162, "epoch": 2194} {"train_loss": -6.317111015319824, "global_step": 92163, "epoch": 2194} {"train_loss": -6.222961902618408, "global_step": 92164, "epoch": 2194} {"train_loss": -6.462953567504883, "global_step": 92165, "epoch": 2194} {"train_loss": -6.285294055938721, "global_step": 92166, "epoch": 2194} {"train_loss": -6.31390380859375, "global_step": 92167, "epoch": 2194} {"train_loss": -6.310057640075684, "global_step": 92168, "epoch": 2194} {"train_loss": -6.339861869812012, "global_step": 92169, "epoch": 2194} {"train_loss": -6.328371047973633, "global_step": 92170, "epoch": 2194} {"train_loss": -6.3118791580200195, "global_step": 92171, "epoch": 2194} {"train_loss": -6.278358459472656, "global_step": 92172, "epoch": 2194} {"train_loss": -6.228552341461182, "global_step": 92173, "epoch": 2194} {"train_loss": -6.260105133056641, "global_step": 92174, "epoch": 2194} {"train_loss": -6.237546443939209, "global_step": 92175, "epoch": 2194} {"train_loss": -6.2783522605896, "global_step": 92176, "epoch": 2194} {"train_loss": -6.302356719970703, "global_step": 92177, "epoch": 2194} {"train_loss": -6.272797584533691, "global_step": 92178, "epoch": 2194} {"train_loss": -6.173594951629639, "global_step": 92179, "epoch": 2194} {"train_loss": -6.262487411499023, "global_step": 92180, "epoch": 2194} {"train_loss": -6.311802387237549, "global_step": 92181, "epoch": 2194} {"train_loss": -6.314053535461426, "global_step": 92182, "epoch": 2194} {"train_loss": -6.36440896987915, "global_step": 92183, "epoch": 2194} {"train_loss": -6.3188276290893555, "global_step": 92184, "epoch": 2194} {"train_loss": -6.327704429626465, "global_step": 92185, "epoch": 2194} {"train_loss": -6.334515571594238, "global_step": 92186, "epoch": 2194} {"train_loss": -6.316084861755371, "global_step": 92187, "epoch": 2194} {"train_loss": -6.358936309814453, "global_step": 92188, "epoch": 2194} {"train_loss": -6.287556228183565, "global_step": 92189, "epoch": 2194, "val_loss": 75362.4921875} {"train_loss": -6.2895097732543945, "global_step": 92190, "epoch": 2195} {"train_loss": -6.380954742431641, "global_step": 92191, "epoch": 2195} {"train_loss": -6.397483825683594, "global_step": 92192, "epoch": 2195} {"train_loss": -6.3782877922058105, "global_step": 92193, "epoch": 2195} {"train_loss": -6.28016471862793, "global_step": 92194, "epoch": 2195} {"train_loss": -6.326962947845459, "global_step": 92195, "epoch": 2195} {"train_loss": -6.269145965576172, "global_step": 92196, "epoch": 2195} {"train_loss": -6.1737823486328125, "global_step": 92197, "epoch": 2195} {"train_loss": -6.274327754974365, "global_step": 92198, "epoch": 2195} {"train_loss": -6.325376510620117, "global_step": 92199, "epoch": 2195} {"train_loss": -6.236977577209473, "global_step": 92200, "epoch": 2195} {"train_loss": -6.246928691864014, "global_step": 92201, "epoch": 2195} {"train_loss": -6.322503566741943, "global_step": 92202, "epoch": 2195} {"train_loss": -6.304042339324951, "global_step": 92203, "epoch": 2195} {"train_loss": -6.257702827453613, "global_step": 92204, "epoch": 2195} {"train_loss": -6.227507591247559, "global_step": 92205, "epoch": 2195} {"train_loss": -6.304393291473389, "global_step": 92206, "epoch": 2195} {"train_loss": -6.032852649688721, "global_step": 92207, "epoch": 2195} {"train_loss": -6.236515045166016, "global_step": 92208, "epoch": 2195} {"train_loss": -6.212628364562988, "global_step": 92209, "epoch": 2195} {"train_loss": -6.082088947296143, "global_step": 92210, "epoch": 2195} {"train_loss": -6.24390983581543, "global_step": 92211, "epoch": 2195} {"train_loss": -6.034306526184082, "global_step": 92212, "epoch": 2195} {"train_loss": -6.192260265350342, "global_step": 92213, "epoch": 2195} {"train_loss": -6.2293500900268555, "global_step": 92214, "epoch": 2195} {"train_loss": -6.239914894104004, "global_step": 92215, "epoch": 2195} {"train_loss": -6.110971927642822, "global_step": 92216, "epoch": 2195} {"train_loss": -6.150505065917969, "global_step": 92217, "epoch": 2195} {"train_loss": -6.318196773529053, "global_step": 92218, "epoch": 2195} {"train_loss": -6.219517230987549, "global_step": 92219, "epoch": 2195} {"train_loss": -6.262365341186523, "global_step": 92220, "epoch": 2195} {"train_loss": -6.0765790939331055, "global_step": 92221, "epoch": 2195} {"train_loss": -6.246816635131836, "global_step": 92222, "epoch": 2195} {"train_loss": -6.237195014953613, "global_step": 92223, "epoch": 2195} {"train_loss": -6.181702613830566, "global_step": 92224, "epoch": 2195} {"train_loss": -6.083100318908691, "global_step": 92225, "epoch": 2195} {"train_loss": -6.313378810882568, "global_step": 92226, "epoch": 2195} {"train_loss": -6.199936866760254, "global_step": 92227, "epoch": 2195} {"train_loss": -6.2197418212890625, "global_step": 92228, "epoch": 2195} {"train_loss": -6.193367958068848, "global_step": 92229, "epoch": 2195} {"train_loss": -6.229987144470215, "global_step": 92230, "epoch": 2195} {"train_loss": -6.234828846795218, "global_step": 92231, "epoch": 2195, "val_loss": 75330.28125} {"train_loss": -6.286579132080078, "global_step": 92232, "epoch": 2196} {"train_loss": -6.338001728057861, "global_step": 92233, "epoch": 2196} {"train_loss": -6.287684440612793, "global_step": 92234, "epoch": 2196} {"train_loss": -6.200774669647217, "global_step": 92235, "epoch": 2196} {"train_loss": -6.180058479309082, "global_step": 92236, "epoch": 2196} {"train_loss": -6.200506210327148, "global_step": 92237, "epoch": 2196} {"train_loss": -6.226325035095215, "global_step": 92238, "epoch": 2196} {"train_loss": -6.336175918579102, "global_step": 92239, "epoch": 2196} {"train_loss": -6.270658016204834, "global_step": 92240, "epoch": 2196} {"train_loss": -6.267066478729248, "global_step": 92241, "epoch": 2196} {"train_loss": -6.293080806732178, "global_step": 92242, "epoch": 2196} {"train_loss": -6.158613204956055, "global_step": 92243, "epoch": 2196} {"train_loss": -6.195886135101318, "global_step": 92244, "epoch": 2196} {"train_loss": -6.270810127258301, "global_step": 92245, "epoch": 2196} {"train_loss": -6.142889022827148, "global_step": 92246, "epoch": 2196} {"train_loss": -6.3738627433776855, "global_step": 92247, "epoch": 2196} {"train_loss": -6.287762641906738, "global_step": 92248, "epoch": 2196} {"train_loss": -6.355166912078857, "global_step": 92249, "epoch": 2196} {"train_loss": -6.249194145202637, "global_step": 92250, "epoch": 2196} {"train_loss": -6.270798206329346, "global_step": 92251, "epoch": 2196} {"train_loss": -6.2696533203125, "global_step": 92252, "epoch": 2196} {"train_loss": -6.371721267700195, "global_step": 92253, "epoch": 2196} {"train_loss": -6.219226837158203, "global_step": 92254, "epoch": 2196} {"train_loss": -6.347739219665527, "global_step": 92255, "epoch": 2196} {"train_loss": -6.125324726104736, "global_step": 92256, "epoch": 2196} {"train_loss": -6.230151176452637, "global_step": 92257, "epoch": 2196} {"train_loss": -6.302425384521484, "global_step": 92258, "epoch": 2196} {"train_loss": -6.314469337463379, "global_step": 92259, "epoch": 2196} {"train_loss": -6.407066345214844, "global_step": 92260, "epoch": 2196} {"train_loss": -6.340540885925293, "global_step": 92261, "epoch": 2196} {"train_loss": -6.397331237792969, "global_step": 92262, "epoch": 2196} {"train_loss": -6.39432954788208, "global_step": 92263, "epoch": 2196} {"train_loss": -6.335452079772949, "global_step": 92264, "epoch": 2196} {"train_loss": -6.294108867645264, "global_step": 92265, "epoch": 2196} {"train_loss": -6.274537086486816, "global_step": 92266, "epoch": 2196} {"train_loss": -6.3121256828308105, "global_step": 92267, "epoch": 2196} {"train_loss": -6.207955837249756, "global_step": 92268, "epoch": 2196} {"train_loss": -6.179711818695068, "global_step": 92269, "epoch": 2196} {"train_loss": -6.303757667541504, "global_step": 92270, "epoch": 2196} {"train_loss": -6.270134925842285, "global_step": 92271, "epoch": 2196} {"train_loss": -6.219844818115234, "global_step": 92272, "epoch": 2196} {"train_loss": -6.275022222882225, "global_step": 92273, "epoch": 2196, "val_loss": 75288.765625} {"train_loss": -6.2973480224609375, "global_step": 92274, "epoch": 2197} {"train_loss": -6.276549816131592, "global_step": 92275, "epoch": 2197} {"train_loss": -6.297080039978027, "global_step": 92276, "epoch": 2197} {"train_loss": -6.245101451873779, "global_step": 92277, "epoch": 2197} {"train_loss": -6.3175458908081055, "global_step": 92278, "epoch": 2197} {"train_loss": -6.261115550994873, "global_step": 92279, "epoch": 2197} {"train_loss": -6.1672043800354, "global_step": 92280, "epoch": 2197} {"train_loss": -6.213792324066162, "global_step": 92281, "epoch": 2197} {"train_loss": -6.264623641967773, "global_step": 92282, "epoch": 2197} {"train_loss": -6.270785331726074, "global_step": 92283, "epoch": 2197} {"train_loss": -6.235088348388672, "global_step": 92284, "epoch": 2197} {"train_loss": -6.292952537536621, "global_step": 92285, "epoch": 2197} {"train_loss": -6.262889385223389, "global_step": 92286, "epoch": 2197} {"train_loss": -6.245142459869385, "global_step": 92287, "epoch": 2197} {"train_loss": -6.213474273681641, "global_step": 92288, "epoch": 2197} {"train_loss": -6.268001556396484, "global_step": 92289, "epoch": 2197} {"train_loss": -6.264806270599365, "global_step": 92290, "epoch": 2197} {"train_loss": -6.241870880126953, "global_step": 92291, "epoch": 2197} {"train_loss": -6.139998912811279, "global_step": 92292, "epoch": 2197} {"train_loss": -6.153503894805908, "global_step": 92293, "epoch": 2197} {"train_loss": -6.237866401672363, "global_step": 92294, "epoch": 2197} {"train_loss": -6.237615585327148, "global_step": 92295, "epoch": 2197} {"train_loss": -6.164722919464111, "global_step": 92296, "epoch": 2197} {"train_loss": -6.194173812866211, "global_step": 92297, "epoch": 2197} {"train_loss": -6.261741638183594, "global_step": 92298, "epoch": 2197} {"train_loss": -6.248477458953857, "global_step": 92299, "epoch": 2197} {"train_loss": -6.379403114318848, "global_step": 92300, "epoch": 2197} {"train_loss": -6.252213954925537, "global_step": 92301, "epoch": 2197} {"train_loss": -6.27457332611084, "global_step": 92302, "epoch": 2197} {"train_loss": -6.3412933349609375, "global_step": 92303, "epoch": 2197} {"train_loss": -6.183809757232666, "global_step": 92304, "epoch": 2197} {"train_loss": -6.284111499786377, "global_step": 92305, "epoch": 2197} {"train_loss": -6.266303062438965, "global_step": 92306, "epoch": 2197} {"train_loss": -6.250219821929932, "global_step": 92307, "epoch": 2197} {"train_loss": -6.334927558898926, "global_step": 92308, "epoch": 2197} {"train_loss": -6.354034423828125, "global_step": 92309, "epoch": 2197} {"train_loss": -6.284541130065918, "global_step": 92310, "epoch": 2197} {"train_loss": -6.21858024597168, "global_step": 92311, "epoch": 2197} {"train_loss": -6.281675338745117, "global_step": 92312, "epoch": 2197} {"train_loss": -6.274359703063965, "global_step": 92313, "epoch": 2197} {"train_loss": -6.2334089279174805, "global_step": 92314, "epoch": 2197} {"train_loss": -6.2550638403211325, "global_step": 92315, "epoch": 2197, "val_loss": 75377.8984375} {"train_loss": -6.227479934692383, "global_step": 92316, "epoch": 2198} {"train_loss": -6.212488651275635, "global_step": 92317, "epoch": 2198} {"train_loss": -6.1967973709106445, "global_step": 92318, "epoch": 2198} {"train_loss": -6.26142692565918, "global_step": 92319, "epoch": 2198} {"train_loss": -6.185460090637207, "global_step": 92320, "epoch": 2198} {"train_loss": -6.220893383026123, "global_step": 92321, "epoch": 2198} {"train_loss": -6.297800064086914, "global_step": 92322, "epoch": 2198} {"train_loss": -6.202310562133789, "global_step": 92323, "epoch": 2198} {"train_loss": -6.299144744873047, "global_step": 92324, "epoch": 2198} {"train_loss": -6.353996753692627, "global_step": 92325, "epoch": 2198} {"train_loss": -6.205133438110352, "global_step": 92326, "epoch": 2198} {"train_loss": -6.21568489074707, "global_step": 92327, "epoch": 2198} {"train_loss": -6.263933181762695, "global_step": 92328, "epoch": 2198} {"train_loss": -6.217103004455566, "global_step": 92329, "epoch": 2198} {"train_loss": -6.278059959411621, "global_step": 92330, "epoch": 2198} {"train_loss": -6.273492813110352, "global_step": 92331, "epoch": 2198} {"train_loss": -6.2842559814453125, "global_step": 92332, "epoch": 2198} {"train_loss": -6.281189441680908, "global_step": 92333, "epoch": 2198} {"train_loss": -6.2206525802612305, "global_step": 92334, "epoch": 2198} {"train_loss": -6.3621931076049805, "global_step": 92335, "epoch": 2198} {"train_loss": -6.097768783569336, "global_step": 92336, "epoch": 2198} {"train_loss": -6.281052589416504, "global_step": 92337, "epoch": 2198} {"train_loss": -6.249345302581787, "global_step": 92338, "epoch": 2198} {"train_loss": -6.202933311462402, "global_step": 92339, "epoch": 2198} {"train_loss": -6.223651885986328, "global_step": 92340, "epoch": 2198} {"train_loss": -6.2743072509765625, "global_step": 92341, "epoch": 2198} {"train_loss": -6.303439140319824, "global_step": 92342, "epoch": 2198} {"train_loss": -6.192190170288086, "global_step": 92343, "epoch": 2198} {"train_loss": -6.379184246063232, "global_step": 92344, "epoch": 2198} {"train_loss": -6.350088596343994, "global_step": 92345, "epoch": 2198} {"train_loss": -6.298160552978516, "global_step": 92346, "epoch": 2198} {"train_loss": -6.2685065269470215, "global_step": 92347, "epoch": 2198} {"train_loss": -6.289721488952637, "global_step": 92348, "epoch": 2198} {"train_loss": -6.256731033325195, "global_step": 92349, "epoch": 2198} {"train_loss": -6.267472743988037, "global_step": 92350, "epoch": 2198} {"train_loss": -6.335142135620117, "global_step": 92351, "epoch": 2198} {"train_loss": -6.326727390289307, "global_step": 92352, "epoch": 2198} {"train_loss": -6.253744125366211, "global_step": 92353, "epoch": 2198} {"train_loss": -6.282234191894531, "global_step": 92354, "epoch": 2198} {"train_loss": -6.130282878875732, "global_step": 92355, "epoch": 2198} {"train_loss": -6.087085723876953, "global_step": 92356, "epoch": 2198} {"train_loss": -6.252985795338948, "global_step": 92357, "epoch": 2198, "val_loss": 75531.890625} {"train_loss": -6.194005489349365, "global_step": 92358, "epoch": 2199} {"train_loss": -6.2505388259887695, "global_step": 92359, "epoch": 2199} {"train_loss": -6.3665571212768555, "global_step": 92360, "epoch": 2199} {"train_loss": -6.238315582275391, "global_step": 92361, "epoch": 2199} {"train_loss": -6.1184234619140625, "global_step": 92362, "epoch": 2199} {"train_loss": -6.211263656616211, "global_step": 92363, "epoch": 2199} {"train_loss": -6.221887588500977, "global_step": 92364, "epoch": 2199} {"train_loss": -6.1675519943237305, "global_step": 92365, "epoch": 2199} {"train_loss": -6.290889739990234, "global_step": 92366, "epoch": 2199} {"train_loss": -6.274383068084717, "global_step": 92367, "epoch": 2199} {"train_loss": -6.162147521972656, "global_step": 92368, "epoch": 2199} {"train_loss": -6.378000259399414, "global_step": 92369, "epoch": 2199} {"train_loss": -6.231662750244141, "global_step": 92370, "epoch": 2199} {"train_loss": -6.314231872558594, "global_step": 92371, "epoch": 2199} {"train_loss": -6.228696346282959, "global_step": 92372, "epoch": 2199} {"train_loss": -6.183256149291992, "global_step": 92373, "epoch": 2199} {"train_loss": -6.3155436515808105, "global_step": 92374, "epoch": 2199} {"train_loss": -6.253647804260254, "global_step": 92375, "epoch": 2199} {"train_loss": -6.2844743728637695, "global_step": 92376, "epoch": 2199} {"train_loss": -6.2155585289001465, "global_step": 92377, "epoch": 2199} {"train_loss": -6.194913864135742, "global_step": 92378, "epoch": 2199} {"train_loss": -6.2126145362854, "global_step": 92379, "epoch": 2199} {"train_loss": -6.214271545410156, "global_step": 92380, "epoch": 2199} {"train_loss": -6.219437599182129, "global_step": 92381, "epoch": 2199} {"train_loss": -6.270815849304199, "global_step": 92382, "epoch": 2199} {"train_loss": -6.244483470916748, "global_step": 92383, "epoch": 2199} {"train_loss": -6.349152565002441, "global_step": 92384, "epoch": 2199} {"train_loss": -6.122174263000488, "global_step": 92385, "epoch": 2199} {"train_loss": -6.1182403564453125, "global_step": 92386, "epoch": 2199} {"train_loss": -6.224712371826172, "global_step": 92387, "epoch": 2199} {"train_loss": -6.118359565734863, "global_step": 92388, "epoch": 2199} {"train_loss": -6.179740905761719, "global_step": 92389, "epoch": 2199} {"train_loss": -6.267793655395508, "global_step": 92390, "epoch": 2199} {"train_loss": -6.2203288078308105, "global_step": 92391, "epoch": 2199} {"train_loss": -6.146569728851318, "global_step": 92392, "epoch": 2199} {"train_loss": -6.1843366622924805, "global_step": 92393, "epoch": 2199} {"train_loss": -6.217557907104492, "global_step": 92394, "epoch": 2199} {"train_loss": -6.163957118988037, "global_step": 92395, "epoch": 2199} {"train_loss": -6.246335029602051, "global_step": 92396, "epoch": 2199} {"train_loss": -6.182743549346924, "global_step": 92397, "epoch": 2199} {"train_loss": -6.29187536239624, "global_step": 92398, "epoch": 2199} {"train_loss": -6.22720928419204, "global_step": 92399, "epoch": 2199, "val_loss": 75424.1640625} {"train_loss": -6.275049209594727, "global_step": 92400, "epoch": 2200} {"train_loss": -6.177928447723389, "global_step": 92401, "epoch": 2200} {"train_loss": -6.291161060333252, "global_step": 92402, "epoch": 2200} {"train_loss": -6.257612228393555, "global_step": 92403, "epoch": 2200} {"train_loss": -6.118668556213379, "global_step": 92404, "epoch": 2200} {"train_loss": -6.2437744140625, "global_step": 92405, "epoch": 2200} {"train_loss": -6.3688859939575195, "global_step": 92406, "epoch": 2200} {"train_loss": -6.277981758117676, "global_step": 92407, "epoch": 2200} {"train_loss": -6.286655426025391, "global_step": 92408, "epoch": 2200} {"train_loss": -6.191719055175781, "global_step": 92409, "epoch": 2200} {"train_loss": -6.22329044342041, "global_step": 92410, "epoch": 2200} {"train_loss": -6.285485744476318, "global_step": 92411, "epoch": 2200} {"train_loss": -6.372029781341553, "global_step": 92412, "epoch": 2200} {"train_loss": -6.182616233825684, "global_step": 92413, "epoch": 2200} {"train_loss": -6.159528732299805, "global_step": 92414, "epoch": 2200} {"train_loss": -6.326878547668457, "global_step": 92415, "epoch": 2200} {"train_loss": -6.296721935272217, "global_step": 92416, "epoch": 2200} {"train_loss": -6.339023113250732, "global_step": 92417, "epoch": 2200} {"train_loss": -6.166857719421387, "global_step": 92418, "epoch": 2200} {"train_loss": -6.241915702819824, "global_step": 92419, "epoch": 2200} {"train_loss": -6.181463241577148, "global_step": 92420, "epoch": 2200} {"train_loss": -6.161083221435547, "global_step": 92421, "epoch": 2200} {"train_loss": -6.171743869781494, "global_step": 92422, "epoch": 2200} {"train_loss": -6.351213455200195, "global_step": 92423, "epoch": 2200} {"train_loss": -6.306869029998779, "global_step": 92424, "epoch": 2200} {"train_loss": -6.335403919219971, "global_step": 92425, "epoch": 2200} {"train_loss": -6.336676597595215, "global_step": 92426, "epoch": 2200} {"train_loss": -6.3199262619018555, "global_step": 92427, "epoch": 2200} {"train_loss": -6.238225936889648, "global_step": 92428, "epoch": 2200} {"train_loss": -6.163558483123779, "global_step": 92429, "epoch": 2200} {"train_loss": -6.308534622192383, "global_step": 92430, "epoch": 2200} {"train_loss": -6.259120464324951, "global_step": 92431, "epoch": 2200} {"train_loss": -6.226198196411133, "global_step": 92432, "epoch": 2200} {"train_loss": -6.300378799438477, "global_step": 92433, "epoch": 2200} {"train_loss": -6.2161478996276855, "global_step": 92434, "epoch": 2200} {"train_loss": -6.307745456695557, "global_step": 92435, "epoch": 2200} {"train_loss": -6.2160186767578125, "global_step": 92436, "epoch": 2200} {"train_loss": -6.250414848327637, "global_step": 92437, "epoch": 2200} {"train_loss": -6.266843795776367, "global_step": 92438, "epoch": 2200} {"train_loss": -6.272921562194824, "global_step": 92439, "epoch": 2200} {"train_loss": -6.353481292724609, "global_step": 92440, "epoch": 2200} {"train_loss": -6.260287704921904, "global_step": 92441, "epoch": 2200, "train/sim_max_reward_0": 0.37560619932230854, "train/sim_max_reward_1": 0.9884108296786931, "train/sim_max_reward_2": 0.3294940940997978, "train/sim_max_reward_3": 0.4816115320413703, "train/sim_max_reward_4": 0.7111714852275156, "train/sim_max_reward_5": 0.7804948889874259, "test/sim_max_reward_4500000": 0.5184242461760452, "test/sim_max_reward_4500001": 0.9748004297674127, "test/sim_max_reward_4500002": 0.8876382988123496, "test/sim_max_reward_4500003": 0.9782651206179606, "test/sim_max_reward_4500004": 0.9257188438916495, "test/sim_max_reward_4500005": 0.9740753080977833, "test/sim_max_reward_4500006": 0.8082555613641318, "test/sim_max_reward_4500007": 0.8186139833574511, "test/sim_max_reward_4500008": 0.1283198362009869, "test/sim_max_reward_4500009": 0.04609475595638818, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.5448262074795077, "test/sim_max_reward_4500012": 0.94857320540147, "test/sim_max_reward_4500013": 0.011862230415725952, "test/sim_max_reward_4500014": 0.8014126138351789, "test/sim_max_reward_4500015": 0.748236131819755, "test/sim_max_reward_4500016": 0.18071985991109896, "test/sim_max_reward_4500017": 0.06238500791500672, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.9052388583818016, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9506909360552759, "test/sim_max_reward_4500022": 0.9485358161394033, "test/sim_max_reward_4500023": 0.9327967926960647, "test/sim_max_reward_4500024": 0.9867611250052961, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.7956752668593072, "test/sim_max_reward_4500027": 0.8926748548696868, "test/sim_max_reward_4500028": 0.18885804052782837, "test/sim_max_reward_4500029": 0.0416602759311165, "test/sim_max_reward_4500030": 0.9451039706770563, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9875884423806918, "test/sim_max_reward_4500034": 0.9570178530287736, "test/sim_max_reward_4500035": 0.7774987765754736, "test/sim_max_reward_4500036": 0.39656523287321127, "test/sim_max_reward_4500037": 0.40391686120780995, "test/sim_max_reward_4500038": 0.3126196067314641, "test/sim_max_reward_4500039": 0.9219257428807419, "test/sim_max_reward_4500040": 0.9405985051923145, "test/sim_max_reward_4500041": 0.529287333657752, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.28060030208296627, "test/sim_max_reward_4500044": 0.9620429063088092, "test/sim_max_reward_4500045": 0.8970277071818762, "test/sim_max_reward_4500046": 0.8292607287206921, "test/sim_max_reward_4500047": 0.029554474705588554, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.611131504892852, "test/mean_score": 0.5848134238269831, "val_loss": 75374.7578125} {"train_loss": -6.267862796783447, "global_step": 92442, "epoch": 2201} {"train_loss": -6.275359153747559, "global_step": 92443, "epoch": 2201} {"train_loss": -6.367781162261963, "global_step": 92444, "epoch": 2201} {"train_loss": -6.273728370666504, "global_step": 92445, "epoch": 2201} {"train_loss": -6.242537975311279, "global_step": 92446, "epoch": 2201} {"train_loss": -6.210938453674316, "global_step": 92447, "epoch": 2201} {"train_loss": -6.270997047424316, "global_step": 92448, "epoch": 2201} {"train_loss": -6.280996322631836, "global_step": 92449, "epoch": 2201} {"train_loss": -6.324080467224121, "global_step": 92450, "epoch": 2201} {"train_loss": -6.3365702629089355, "global_step": 92451, "epoch": 2201} {"train_loss": -6.237993240356445, "global_step": 92452, "epoch": 2201} {"train_loss": -6.336662292480469, "global_step": 92453, "epoch": 2201} {"train_loss": -6.393147945404053, "global_step": 92454, "epoch": 2201} {"train_loss": -6.2795023918151855, "global_step": 92455, "epoch": 2201} {"train_loss": -6.286457061767578, "global_step": 92456, "epoch": 2201} {"train_loss": -6.362555503845215, "global_step": 92457, "epoch": 2201} {"train_loss": -6.272857666015625, "global_step": 92458, "epoch": 2201} {"train_loss": -6.330693244934082, "global_step": 92459, "epoch": 2201} {"train_loss": -6.307891845703125, "global_step": 92460, "epoch": 2201} {"train_loss": -6.334849834442139, "global_step": 92461, "epoch": 2201} {"train_loss": -6.294405937194824, "global_step": 92462, "epoch": 2201} {"train_loss": -6.2514448165893555, "global_step": 92463, "epoch": 2201} {"train_loss": -6.3188605308532715, "global_step": 92464, "epoch": 2201} {"train_loss": -6.150077819824219, "global_step": 92465, "epoch": 2201} {"train_loss": -6.178094863891602, "global_step": 92466, "epoch": 2201} {"train_loss": -6.094061851501465, "global_step": 92467, "epoch": 2201} {"train_loss": -6.2139081954956055, "global_step": 92468, "epoch": 2201} {"train_loss": -6.225102424621582, "global_step": 92469, "epoch": 2201} {"train_loss": -6.190519332885742, "global_step": 92470, "epoch": 2201} {"train_loss": -6.308192253112793, "global_step": 92471, "epoch": 2201} {"train_loss": -6.248723983764648, "global_step": 92472, "epoch": 2201} {"train_loss": -6.376341819763184, "global_step": 92473, "epoch": 2201} {"train_loss": -6.281660079956055, "global_step": 92474, "epoch": 2201} {"train_loss": -6.219852924346924, "global_step": 92475, "epoch": 2201} {"train_loss": -6.286225318908691, "global_step": 92476, "epoch": 2201} {"train_loss": -6.079525947570801, "global_step": 92477, "epoch": 2201} {"train_loss": -6.230039596557617, "global_step": 92478, "epoch": 2201} {"train_loss": -6.110040664672852, "global_step": 92479, "epoch": 2201} {"train_loss": -6.194431304931641, "global_step": 92480, "epoch": 2201} {"train_loss": -6.2766313552856445, "global_step": 92481, "epoch": 2201} {"train_loss": -6.248139381408691, "global_step": 92482, "epoch": 2201} {"train_loss": -6.263366869517735, "global_step": 92483, "epoch": 2201, "val_loss": 75360.6953125} {"train_loss": -6.188718795776367, "global_step": 92484, "epoch": 2202} {"train_loss": -6.195279121398926, "global_step": 92485, "epoch": 2202} {"train_loss": -6.2716217041015625, "global_step": 92486, "epoch": 2202} {"train_loss": -6.170419216156006, "global_step": 92487, "epoch": 2202} {"train_loss": -6.12551212310791, "global_step": 92488, "epoch": 2202} {"train_loss": -6.268946647644043, "global_step": 92489, "epoch": 2202} {"train_loss": -6.150352478027344, "global_step": 92490, "epoch": 2202} {"train_loss": -6.2976884841918945, "global_step": 92491, "epoch": 2202} {"train_loss": -6.261556625366211, "global_step": 92492, "epoch": 2202} {"train_loss": -6.182040214538574, "global_step": 92493, "epoch": 2202} {"train_loss": -6.292853832244873, "global_step": 92494, "epoch": 2202} {"train_loss": -6.2865142822265625, "global_step": 92495, "epoch": 2202} {"train_loss": -6.104239463806152, "global_step": 92496, "epoch": 2202} {"train_loss": -6.296669006347656, "global_step": 92497, "epoch": 2202} {"train_loss": -6.26188850402832, "global_step": 92498, "epoch": 2202} {"train_loss": -6.244716644287109, "global_step": 92499, "epoch": 2202} {"train_loss": -6.3193864822387695, "global_step": 92500, "epoch": 2202} {"train_loss": -6.206231117248535, "global_step": 92501, "epoch": 2202} {"train_loss": -6.295285701751709, "global_step": 92502, "epoch": 2202} {"train_loss": -6.292759895324707, "global_step": 92503, "epoch": 2202} {"train_loss": -6.276570796966553, "global_step": 92504, "epoch": 2202} {"train_loss": -6.286707401275635, "global_step": 92505, "epoch": 2202} {"train_loss": -6.25928258895874, "global_step": 92506, "epoch": 2202} {"train_loss": -6.367105484008789, "global_step": 92507, "epoch": 2202} {"train_loss": -6.217920780181885, "global_step": 92508, "epoch": 2202} {"train_loss": -6.2463483810424805, "global_step": 92509, "epoch": 2202} {"train_loss": -6.298219203948975, "global_step": 92510, "epoch": 2202} {"train_loss": -6.207277297973633, "global_step": 92511, "epoch": 2202} {"train_loss": -6.363602161407471, "global_step": 92512, "epoch": 2202} {"train_loss": -6.314325332641602, "global_step": 92513, "epoch": 2202} {"train_loss": -6.300706386566162, "global_step": 92514, "epoch": 2202} {"train_loss": -6.329641342163086, "global_step": 92515, "epoch": 2202} {"train_loss": -6.344313621520996, "global_step": 92516, "epoch": 2202} {"train_loss": -6.329097747802734, "global_step": 92517, "epoch": 2202} {"train_loss": -6.339022636413574, "global_step": 92518, "epoch": 2202} {"train_loss": -6.270591735839844, "global_step": 92519, "epoch": 2202} {"train_loss": -6.24368953704834, "global_step": 92520, "epoch": 2202} {"train_loss": -6.353171348571777, "global_step": 92521, "epoch": 2202} {"train_loss": -6.399178981781006, "global_step": 92522, "epoch": 2202} {"train_loss": -6.297177791595459, "global_step": 92523, "epoch": 2202} {"train_loss": -6.365206718444824, "global_step": 92524, "epoch": 2202} {"train_loss": -6.271601608821324, "global_step": 92525, "epoch": 2202, "val_loss": 75359.9375} {"train_loss": -6.302400588989258, "global_step": 92526, "epoch": 2203} {"train_loss": -6.348649978637695, "global_step": 92527, "epoch": 2203} {"train_loss": -6.25755500793457, "global_step": 92528, "epoch": 2203} {"train_loss": -6.265344142913818, "global_step": 92529, "epoch": 2203} {"train_loss": -6.184055805206299, "global_step": 92530, "epoch": 2203} {"train_loss": -6.207974433898926, "global_step": 92531, "epoch": 2203} {"train_loss": -6.284250259399414, "global_step": 92532, "epoch": 2203} {"train_loss": -6.2755842208862305, "global_step": 92533, "epoch": 2203} {"train_loss": -6.227014541625977, "global_step": 92534, "epoch": 2203} {"train_loss": -6.263757705688477, "global_step": 92535, "epoch": 2203} {"train_loss": -6.295738220214844, "global_step": 92536, "epoch": 2203} {"train_loss": -6.300018310546875, "global_step": 92537, "epoch": 2203} {"train_loss": -6.172074317932129, "global_step": 92538, "epoch": 2203} {"train_loss": -6.202416896820068, "global_step": 92539, "epoch": 2203} {"train_loss": -6.465256690979004, "global_step": 92540, "epoch": 2203} {"train_loss": -6.24791145324707, "global_step": 92541, "epoch": 2203} {"train_loss": -6.21217679977417, "global_step": 92542, "epoch": 2203} {"train_loss": -6.300003528594971, "global_step": 92543, "epoch": 2203} {"train_loss": -6.3127593994140625, "global_step": 92544, "epoch": 2203} {"train_loss": -6.190810203552246, "global_step": 92545, "epoch": 2203} {"train_loss": -6.306936264038086, "global_step": 92546, "epoch": 2203} {"train_loss": -6.245779037475586, "global_step": 92547, "epoch": 2203} {"train_loss": -6.282264709472656, "global_step": 92548, "epoch": 2203} {"train_loss": -6.246542930603027, "global_step": 92549, "epoch": 2203} {"train_loss": -6.173008441925049, "global_step": 92550, "epoch": 2203} {"train_loss": -6.275540351867676, "global_step": 92551, "epoch": 2203} {"train_loss": -6.253785610198975, "global_step": 92552, "epoch": 2203} {"train_loss": -6.280539512634277, "global_step": 92553, "epoch": 2203} {"train_loss": -6.272125244140625, "global_step": 92554, "epoch": 2203} {"train_loss": -6.212057113647461, "global_step": 92555, "epoch": 2203} {"train_loss": -6.253666877746582, "global_step": 92556, "epoch": 2203} {"train_loss": -6.258664131164551, "global_step": 92557, "epoch": 2203} {"train_loss": -6.240687370300293, "global_step": 92558, "epoch": 2203} {"train_loss": -6.213733673095703, "global_step": 92559, "epoch": 2203} {"train_loss": -6.354172706604004, "global_step": 92560, "epoch": 2203} {"train_loss": -6.1716532707214355, "global_step": 92561, "epoch": 2203} {"train_loss": -6.303006649017334, "global_step": 92562, "epoch": 2203} {"train_loss": -6.208412170410156, "global_step": 92563, "epoch": 2203} {"train_loss": -6.278229713439941, "global_step": 92564, "epoch": 2203} {"train_loss": -6.2940826416015625, "global_step": 92565, "epoch": 2203} {"train_loss": -6.2384514808654785, "global_step": 92566, "epoch": 2203} {"train_loss": -6.261229991912842, "global_step": 92567, "epoch": 2203, "val_loss": 75553.484375} {"train_loss": -6.229844093322754, "global_step": 92568, "epoch": 2204} {"train_loss": -6.361170768737793, "global_step": 92569, "epoch": 2204} {"train_loss": -6.271879196166992, "global_step": 92570, "epoch": 2204} {"train_loss": -6.3238067626953125, "global_step": 92571, "epoch": 2204} {"train_loss": -6.317499160766602, "global_step": 92572, "epoch": 2204} {"train_loss": -6.299704551696777, "global_step": 92573, "epoch": 2204} {"train_loss": -6.31101131439209, "global_step": 92574, "epoch": 2204} {"train_loss": -6.389633655548096, "global_step": 92575, "epoch": 2204} {"train_loss": -6.336612701416016, "global_step": 92576, "epoch": 2204} {"train_loss": -6.246243476867676, "global_step": 92577, "epoch": 2204} {"train_loss": -6.398079872131348, "global_step": 92578, "epoch": 2204} {"train_loss": -6.210630893707275, "global_step": 92579, "epoch": 2204} {"train_loss": -6.326015472412109, "global_step": 92580, "epoch": 2204} {"train_loss": -6.26307487487793, "global_step": 92581, "epoch": 2204} {"train_loss": -6.244331359863281, "global_step": 92582, "epoch": 2204} {"train_loss": -6.1821675300598145, "global_step": 92583, "epoch": 2204} {"train_loss": -6.194766044616699, "global_step": 92584, "epoch": 2204} {"train_loss": -6.299612045288086, "global_step": 92585, "epoch": 2204} {"train_loss": -6.2841973304748535, "global_step": 92586, "epoch": 2204} {"train_loss": -6.1461687088012695, "global_step": 92587, "epoch": 2204} {"train_loss": -6.191517353057861, "global_step": 92588, "epoch": 2204} {"train_loss": -6.269498348236084, "global_step": 92589, "epoch": 2204} {"train_loss": -6.215237617492676, "global_step": 92590, "epoch": 2204} {"train_loss": -6.193186283111572, "global_step": 92591, "epoch": 2204} {"train_loss": -6.214872360229492, "global_step": 92592, "epoch": 2204} {"train_loss": -6.20682430267334, "global_step": 92593, "epoch": 2204} {"train_loss": -6.248784065246582, "global_step": 92594, "epoch": 2204} {"train_loss": -6.332798004150391, "global_step": 92595, "epoch": 2204} {"train_loss": -6.363777160644531, "global_step": 92596, "epoch": 2204} {"train_loss": -6.243857383728027, "global_step": 92597, "epoch": 2204} {"train_loss": -6.342994689941406, "global_step": 92598, "epoch": 2204} {"train_loss": -6.319367408752441, "global_step": 92599, "epoch": 2204} {"train_loss": -6.226290702819824, "global_step": 92600, "epoch": 2204} {"train_loss": -6.298003673553467, "global_step": 92601, "epoch": 2204} {"train_loss": -6.332973480224609, "global_step": 92602, "epoch": 2204} {"train_loss": -6.258040428161621, "global_step": 92603, "epoch": 2204} {"train_loss": -6.1870551109313965, "global_step": 92604, "epoch": 2204} {"train_loss": -6.285099029541016, "global_step": 92605, "epoch": 2204} {"train_loss": -6.286693096160889, "global_step": 92606, "epoch": 2204} {"train_loss": -6.388437271118164, "global_step": 92607, "epoch": 2204} {"train_loss": -6.332150459289551, "global_step": 92608, "epoch": 2204} {"train_loss": -6.277493726639521, "global_step": 92609, "epoch": 2204, "val_loss": 75178.4609375} {"train_loss": -6.208833694458008, "global_step": 92610, "epoch": 2205} {"train_loss": -6.250070095062256, "global_step": 92611, "epoch": 2205} {"train_loss": -6.262304782867432, "global_step": 92612, "epoch": 2205} {"train_loss": -6.344285011291504, "global_step": 92613, "epoch": 2205} {"train_loss": -6.260417938232422, "global_step": 92614, "epoch": 2205} {"train_loss": -6.216447830200195, "global_step": 92615, "epoch": 2205} {"train_loss": -6.252493381500244, "global_step": 92616, "epoch": 2205} {"train_loss": -6.188966751098633, "global_step": 92617, "epoch": 2205} {"train_loss": -6.341804504394531, "global_step": 92618, "epoch": 2205} {"train_loss": -6.406203269958496, "global_step": 92619, "epoch": 2205} {"train_loss": -6.318076133728027, "global_step": 92620, "epoch": 2205} {"train_loss": -6.303792953491211, "global_step": 92621, "epoch": 2205} {"train_loss": -6.255379676818848, "global_step": 92622, "epoch": 2205} {"train_loss": -6.231825828552246, "global_step": 92623, "epoch": 2205} {"train_loss": -6.373034954071045, "global_step": 92624, "epoch": 2205} {"train_loss": -6.201754570007324, "global_step": 92625, "epoch": 2205} {"train_loss": -6.246675968170166, "global_step": 92626, "epoch": 2205} {"train_loss": -6.37727165222168, "global_step": 92627, "epoch": 2205} {"train_loss": -6.331418991088867, "global_step": 92628, "epoch": 2205} {"train_loss": -6.269254207611084, "global_step": 92629, "epoch": 2205} {"train_loss": -6.352301597595215, "global_step": 92630, "epoch": 2205} {"train_loss": -6.318917274475098, "global_step": 92631, "epoch": 2205} {"train_loss": -6.351072311401367, "global_step": 92632, "epoch": 2205} {"train_loss": -6.391116142272949, "global_step": 92633, "epoch": 2205} {"train_loss": -6.202701568603516, "global_step": 92634, "epoch": 2205} {"train_loss": -6.379988193511963, "global_step": 92635, "epoch": 2205} {"train_loss": -6.278729438781738, "global_step": 92636, "epoch": 2205} {"train_loss": -6.184197902679443, "global_step": 92637, "epoch": 2205} {"train_loss": -6.2905378341674805, "global_step": 92638, "epoch": 2205} {"train_loss": -6.223991394042969, "global_step": 92639, "epoch": 2205} {"train_loss": -6.310746669769287, "global_step": 92640, "epoch": 2205} {"train_loss": -6.300961017608643, "global_step": 92641, "epoch": 2205} {"train_loss": -6.283750057220459, "global_step": 92642, "epoch": 2205} {"train_loss": -6.280830383300781, "global_step": 92643, "epoch": 2205} {"train_loss": -6.203788757324219, "global_step": 92644, "epoch": 2205} {"train_loss": -6.299837112426758, "global_step": 92645, "epoch": 2205} {"train_loss": -6.268874168395996, "global_step": 92646, "epoch": 2205} {"train_loss": -6.189547538757324, "global_step": 92647, "epoch": 2205} {"train_loss": -6.300724983215332, "global_step": 92648, "epoch": 2205} {"train_loss": -6.260002136230469, "global_step": 92649, "epoch": 2205} {"train_loss": -6.302605152130127, "global_step": 92650, "epoch": 2205} {"train_loss": -6.280961070741926, "global_step": 92651, "epoch": 2205, "val_loss": 75658.921875} {"train_loss": -6.31212043762207, "global_step": 92652, "epoch": 2206} {"train_loss": -6.336078643798828, "global_step": 92653, "epoch": 2206} {"train_loss": -6.218540191650391, "global_step": 92654, "epoch": 2206} {"train_loss": -6.285791397094727, "global_step": 92655, "epoch": 2206} {"train_loss": -6.283858776092529, "global_step": 92656, "epoch": 2206} {"train_loss": -6.147642135620117, "global_step": 92657, "epoch": 2206} {"train_loss": -6.0935516357421875, "global_step": 92658, "epoch": 2206} {"train_loss": -6.156681060791016, "global_step": 92659, "epoch": 2206} {"train_loss": -6.227202415466309, "global_step": 92660, "epoch": 2206} {"train_loss": -6.2735795974731445, "global_step": 92661, "epoch": 2206} {"train_loss": -6.26792573928833, "global_step": 92662, "epoch": 2206} {"train_loss": -6.167980670928955, "global_step": 92663, "epoch": 2206} {"train_loss": -6.210352897644043, "global_step": 92664, "epoch": 2206} {"train_loss": -6.2325310707092285, "global_step": 92665, "epoch": 2206} {"train_loss": -6.169578552246094, "global_step": 92666, "epoch": 2206} {"train_loss": -6.28755521774292, "global_step": 92667, "epoch": 2206} {"train_loss": -6.368978977203369, "global_step": 92668, "epoch": 2206} {"train_loss": -6.286576271057129, "global_step": 92669, "epoch": 2206} {"train_loss": -6.337228775024414, "global_step": 92670, "epoch": 2206} {"train_loss": -6.190654277801514, "global_step": 92671, "epoch": 2206} {"train_loss": -6.279293060302734, "global_step": 92672, "epoch": 2206} {"train_loss": -6.2828288078308105, "global_step": 92673, "epoch": 2206} {"train_loss": -6.332185745239258, "global_step": 92674, "epoch": 2206} {"train_loss": -6.171169757843018, "global_step": 92675, "epoch": 2206} {"train_loss": -6.260303020477295, "global_step": 92676, "epoch": 2206} {"train_loss": -6.0523457527160645, "global_step": 92677, "epoch": 2206} {"train_loss": -6.175575256347656, "global_step": 92678, "epoch": 2206} {"train_loss": -6.196080207824707, "global_step": 92679, "epoch": 2206} {"train_loss": -6.235626220703125, "global_step": 92680, "epoch": 2206} {"train_loss": -6.237682342529297, "global_step": 92681, "epoch": 2206} {"train_loss": -6.189456462860107, "global_step": 92682, "epoch": 2206} {"train_loss": -6.286189079284668, "global_step": 92683, "epoch": 2206} {"train_loss": -6.290544509887695, "global_step": 92684, "epoch": 2206} {"train_loss": -6.343910217285156, "global_step": 92685, "epoch": 2206} {"train_loss": -6.239927291870117, "global_step": 92686, "epoch": 2206} {"train_loss": -6.312279224395752, "global_step": 92687, "epoch": 2206} {"train_loss": -6.32420015335083, "global_step": 92688, "epoch": 2206} {"train_loss": -6.250341415405273, "global_step": 92689, "epoch": 2206} {"train_loss": -6.345985412597656, "global_step": 92690, "epoch": 2206} {"train_loss": -6.030440330505371, "global_step": 92691, "epoch": 2206} {"train_loss": -6.205105781555176, "global_step": 92692, "epoch": 2206} {"train_loss": -6.2444147155398415, "global_step": 92693, "epoch": 2206, "val_loss": 75365.734375} {"train_loss": -6.229486465454102, "global_step": 92694, "epoch": 2207} {"train_loss": -6.300782680511475, "global_step": 92695, "epoch": 2207} {"train_loss": -6.384727478027344, "global_step": 92696, "epoch": 2207} {"train_loss": -6.168362617492676, "global_step": 92697, "epoch": 2207} {"train_loss": -6.296188831329346, "global_step": 92698, "epoch": 2207} {"train_loss": -6.234347820281982, "global_step": 92699, "epoch": 2207} {"train_loss": -6.289692401885986, "global_step": 92700, "epoch": 2207} {"train_loss": -6.117751121520996, "global_step": 92701, "epoch": 2207} {"train_loss": -6.068906784057617, "global_step": 92702, "epoch": 2207} {"train_loss": -6.223952770233154, "global_step": 92703, "epoch": 2207} {"train_loss": -6.209622383117676, "global_step": 92704, "epoch": 2207} {"train_loss": -6.23520565032959, "global_step": 92705, "epoch": 2207} {"train_loss": -6.2286505699157715, "global_step": 92706, "epoch": 2207} {"train_loss": -6.313510417938232, "global_step": 92707, "epoch": 2207} {"train_loss": -6.227504730224609, "global_step": 92708, "epoch": 2207} {"train_loss": -6.353708267211914, "global_step": 92709, "epoch": 2207} {"train_loss": -6.241215705871582, "global_step": 92710, "epoch": 2207} {"train_loss": -6.183719635009766, "global_step": 92711, "epoch": 2207} {"train_loss": -6.247650623321533, "global_step": 92712, "epoch": 2207} {"train_loss": -6.293025016784668, "global_step": 92713, "epoch": 2207} {"train_loss": -6.259588718414307, "global_step": 92714, "epoch": 2207} {"train_loss": -6.336449146270752, "global_step": 92715, "epoch": 2207} {"train_loss": -6.111606597900391, "global_step": 92716, "epoch": 2207} {"train_loss": -6.219303607940674, "global_step": 92717, "epoch": 2207} {"train_loss": -6.268185615539551, "global_step": 92718, "epoch": 2207} {"train_loss": -6.271875381469727, "global_step": 92719, "epoch": 2207} {"train_loss": -6.332911968231201, "global_step": 92720, "epoch": 2207} {"train_loss": -6.283824443817139, "global_step": 92721, "epoch": 2207} {"train_loss": -6.360280513763428, "global_step": 92722, "epoch": 2207} {"train_loss": -6.224396705627441, "global_step": 92723, "epoch": 2207} {"train_loss": -6.257177352905273, "global_step": 92724, "epoch": 2207} {"train_loss": -6.328290939331055, "global_step": 92725, "epoch": 2207} {"train_loss": -6.383858680725098, "global_step": 92726, "epoch": 2207} {"train_loss": -6.319440841674805, "global_step": 92727, "epoch": 2207} {"train_loss": -6.249197483062744, "global_step": 92728, "epoch": 2207} {"train_loss": -6.2387800216674805, "global_step": 92729, "epoch": 2207} {"train_loss": -6.212707042694092, "global_step": 92730, "epoch": 2207} {"train_loss": -6.297284126281738, "global_step": 92731, "epoch": 2207} {"train_loss": -6.2344865798950195, "global_step": 92732, "epoch": 2207} {"train_loss": -6.335793972015381, "global_step": 92733, "epoch": 2207} {"train_loss": -6.287918567657471, "global_step": 92734, "epoch": 2207} {"train_loss": -6.26140756834121, "global_step": 92735, "epoch": 2207, "val_loss": 75605.234375} {"train_loss": -6.158809185028076, "global_step": 92736, "epoch": 2208} {"train_loss": -6.265128135681152, "global_step": 92737, "epoch": 2208} {"train_loss": -6.287356853485107, "global_step": 92738, "epoch": 2208} {"train_loss": -6.223596572875977, "global_step": 92739, "epoch": 2208} {"train_loss": -6.405967712402344, "global_step": 92740, "epoch": 2208} {"train_loss": -6.047607421875, "global_step": 92741, "epoch": 2208} {"train_loss": -6.196423530578613, "global_step": 92742, "epoch": 2208} {"train_loss": -6.376495361328125, "global_step": 92743, "epoch": 2208} {"train_loss": -6.239142417907715, "global_step": 92744, "epoch": 2208} {"train_loss": -6.400876045227051, "global_step": 92745, "epoch": 2208} {"train_loss": -6.34638786315918, "global_step": 92746, "epoch": 2208} {"train_loss": -6.276157379150391, "global_step": 92747, "epoch": 2208} {"train_loss": -6.141740322113037, "global_step": 92748, "epoch": 2208} {"train_loss": -6.2158637046813965, "global_step": 92749, "epoch": 2208} {"train_loss": -6.136397838592529, "global_step": 92750, "epoch": 2208} {"train_loss": -6.2424798011779785, "global_step": 92751, "epoch": 2208} {"train_loss": -6.263864517211914, "global_step": 92752, "epoch": 2208} {"train_loss": -6.1724419593811035, "global_step": 92753, "epoch": 2208} {"train_loss": -6.2225141525268555, "global_step": 92754, "epoch": 2208} {"train_loss": -6.319318771362305, "global_step": 92755, "epoch": 2208} {"train_loss": -6.189609527587891, "global_step": 92756, "epoch": 2208} {"train_loss": -6.198171615600586, "global_step": 92757, "epoch": 2208} {"train_loss": -6.248957633972168, "global_step": 92758, "epoch": 2208} {"train_loss": -6.316159725189209, "global_step": 92759, "epoch": 2208} {"train_loss": -6.24433708190918, "global_step": 92760, "epoch": 2208} {"train_loss": -6.370383262634277, "global_step": 92761, "epoch": 2208} {"train_loss": -6.321892738342285, "global_step": 92762, "epoch": 2208} {"train_loss": -6.313722610473633, "global_step": 92763, "epoch": 2208} {"train_loss": -6.148263454437256, "global_step": 92764, "epoch": 2208} {"train_loss": -6.285335063934326, "global_step": 92765, "epoch": 2208} {"train_loss": -6.224806785583496, "global_step": 92766, "epoch": 2208} {"train_loss": -6.274533271789551, "global_step": 92767, "epoch": 2208} {"train_loss": -6.274143695831299, "global_step": 92768, "epoch": 2208} {"train_loss": -6.197722434997559, "global_step": 92769, "epoch": 2208} {"train_loss": -6.274198532104492, "global_step": 92770, "epoch": 2208} {"train_loss": -6.345424175262451, "global_step": 92771, "epoch": 2208} {"train_loss": -6.231348514556885, "global_step": 92772, "epoch": 2208} {"train_loss": -6.408144474029541, "global_step": 92773, "epoch": 2208} {"train_loss": -6.277223587036133, "global_step": 92774, "epoch": 2208} {"train_loss": -6.261087417602539, "global_step": 92775, "epoch": 2208} {"train_loss": -6.282732009887695, "global_step": 92776, "epoch": 2208} {"train_loss": -6.25635195913769, "global_step": 92777, "epoch": 2208, "val_loss": 75442.6875} {"train_loss": -6.317069053649902, "global_step": 92778, "epoch": 2209} {"train_loss": -6.271275997161865, "global_step": 92779, "epoch": 2209} {"train_loss": -6.332782745361328, "global_step": 92780, "epoch": 2209} {"train_loss": -6.340701580047607, "global_step": 92781, "epoch": 2209} {"train_loss": -6.199929714202881, "global_step": 92782, "epoch": 2209} {"train_loss": -6.118646621704102, "global_step": 92783, "epoch": 2209} {"train_loss": -6.367500305175781, "global_step": 92784, "epoch": 2209} {"train_loss": -6.193359375, "global_step": 92785, "epoch": 2209} {"train_loss": -6.146260738372803, "global_step": 92786, "epoch": 2209} {"train_loss": -6.280551910400391, "global_step": 92787, "epoch": 2209} {"train_loss": -6.263014316558838, "global_step": 92788, "epoch": 2209} {"train_loss": -6.231179237365723, "global_step": 92789, "epoch": 2209} {"train_loss": -6.218348026275635, "global_step": 92790, "epoch": 2209} {"train_loss": -6.21748161315918, "global_step": 92791, "epoch": 2209} {"train_loss": -6.293069362640381, "global_step": 92792, "epoch": 2209} {"train_loss": -6.217127323150635, "global_step": 92793, "epoch": 2209} {"train_loss": -6.35342264175415, "global_step": 92794, "epoch": 2209} {"train_loss": -6.089602470397949, "global_step": 92795, "epoch": 2209} {"train_loss": -6.298862457275391, "global_step": 92796, "epoch": 2209} {"train_loss": -6.262871265411377, "global_step": 92797, "epoch": 2209} {"train_loss": -6.148705959320068, "global_step": 92798, "epoch": 2209} {"train_loss": -6.249733924865723, "global_step": 92799, "epoch": 2209} {"train_loss": -6.19611930847168, "global_step": 92800, "epoch": 2209} {"train_loss": -6.323081016540527, "global_step": 92801, "epoch": 2209} {"train_loss": -6.1650285720825195, "global_step": 92802, "epoch": 2209} {"train_loss": -6.237886428833008, "global_step": 92803, "epoch": 2209} {"train_loss": -6.285806179046631, "global_step": 92804, "epoch": 2209} {"train_loss": -6.3636016845703125, "global_step": 92805, "epoch": 2209} {"train_loss": -6.243712425231934, "global_step": 92806, "epoch": 2209} {"train_loss": -6.321789741516113, "global_step": 92807, "epoch": 2209} {"train_loss": -6.305523872375488, "global_step": 92808, "epoch": 2209} {"train_loss": -6.3553080558776855, "global_step": 92809, "epoch": 2209} {"train_loss": -6.300567626953125, "global_step": 92810, "epoch": 2209} {"train_loss": -6.123013019561768, "global_step": 92811, "epoch": 2209} {"train_loss": -6.277919292449951, "global_step": 92812, "epoch": 2209} {"train_loss": -6.334949970245361, "global_step": 92813, "epoch": 2209} {"train_loss": -6.330560684204102, "global_step": 92814, "epoch": 2209} {"train_loss": -6.368447303771973, "global_step": 92815, "epoch": 2209} {"train_loss": -6.266988277435303, "global_step": 92816, "epoch": 2209} {"train_loss": -6.29834508895874, "global_step": 92817, "epoch": 2209} {"train_loss": -6.097770690917969, "global_step": 92818, "epoch": 2209} {"train_loss": -6.25715446472168, "global_step": 92819, "epoch": 2209, "val_loss": 75322.515625} {"train_loss": -6.2328081130981445, "global_step": 92820, "epoch": 2210} {"train_loss": -6.329165458679199, "global_step": 92821, "epoch": 2210} {"train_loss": -6.267887115478516, "global_step": 92822, "epoch": 2210} {"train_loss": -6.256358623504639, "global_step": 92823, "epoch": 2210} {"train_loss": -6.131684303283691, "global_step": 92824, "epoch": 2210} {"train_loss": -6.269399642944336, "global_step": 92825, "epoch": 2210} {"train_loss": -6.278348922729492, "global_step": 92826, "epoch": 2210} {"train_loss": -6.265279769897461, "global_step": 92827, "epoch": 2210} {"train_loss": -6.340503692626953, "global_step": 92828, "epoch": 2210} {"train_loss": -6.367049217224121, "global_step": 92829, "epoch": 2210} {"train_loss": -6.3164167404174805, "global_step": 92830, "epoch": 2210} {"train_loss": -6.259681701660156, "global_step": 92831, "epoch": 2210} {"train_loss": -6.2955780029296875, "global_step": 92832, "epoch": 2210} {"train_loss": -6.345587253570557, "global_step": 92833, "epoch": 2210} {"train_loss": -6.307172775268555, "global_step": 92834, "epoch": 2210} {"train_loss": -6.318362236022949, "global_step": 92835, "epoch": 2210} {"train_loss": -6.363132953643799, "global_step": 92836, "epoch": 2210} {"train_loss": -6.3762359619140625, "global_step": 92837, "epoch": 2210} {"train_loss": -6.334156036376953, "global_step": 92838, "epoch": 2210} {"train_loss": -6.2302045822143555, "global_step": 92839, "epoch": 2210} {"train_loss": -6.2433953285217285, "global_step": 92840, "epoch": 2210} {"train_loss": -6.292368412017822, "global_step": 92841, "epoch": 2210} {"train_loss": -6.216510772705078, "global_step": 92842, "epoch": 2210} {"train_loss": -6.218287467956543, "global_step": 92843, "epoch": 2210} {"train_loss": -6.304294586181641, "global_step": 92844, "epoch": 2210} {"train_loss": -6.312562465667725, "global_step": 92845, "epoch": 2210} {"train_loss": -6.203103065490723, "global_step": 92846, "epoch": 2210} {"train_loss": -6.249975204467773, "global_step": 92847, "epoch": 2210} {"train_loss": -6.3017778396606445, "global_step": 92848, "epoch": 2210} {"train_loss": -6.331046104431152, "global_step": 92849, "epoch": 2210} {"train_loss": -6.274744033813477, "global_step": 92850, "epoch": 2210} {"train_loss": -6.197980880737305, "global_step": 92851, "epoch": 2210} {"train_loss": -6.316072463989258, "global_step": 92852, "epoch": 2210} {"train_loss": -6.259976863861084, "global_step": 92853, "epoch": 2210} {"train_loss": -6.196779727935791, "global_step": 92854, "epoch": 2210} {"train_loss": -6.304837226867676, "global_step": 92855, "epoch": 2210} {"train_loss": -6.244746208190918, "global_step": 92856, "epoch": 2210} {"train_loss": -6.365438461303711, "global_step": 92857, "epoch": 2210} {"train_loss": -6.297091960906982, "global_step": 92858, "epoch": 2210} {"train_loss": -6.186225891113281, "global_step": 92859, "epoch": 2210} {"train_loss": -6.321892738342285, "global_step": 92860, "epoch": 2210} {"train_loss": -6.280494689941406, "global_step": 92861, "epoch": 2210, "val_loss": 75593.375} {"train_loss": -6.253216743469238, "global_step": 92862, "epoch": 2211} {"train_loss": -6.256716728210449, "global_step": 92863, "epoch": 2211} {"train_loss": -6.345664024353027, "global_step": 92864, "epoch": 2211} {"train_loss": -6.358096122741699, "global_step": 92865, "epoch": 2211} {"train_loss": -6.356238842010498, "global_step": 92866, "epoch": 2211} {"train_loss": -6.454007148742676, "global_step": 92867, "epoch": 2211} {"train_loss": -6.224374771118164, "global_step": 92868, "epoch": 2211} {"train_loss": -6.243921279907227, "global_step": 92869, "epoch": 2211} {"train_loss": -6.195095062255859, "global_step": 92870, "epoch": 2211} {"train_loss": -6.2990522384643555, "global_step": 92871, "epoch": 2211} {"train_loss": -6.248394012451172, "global_step": 92872, "epoch": 2211} {"train_loss": -6.342732906341553, "global_step": 92873, "epoch": 2211} {"train_loss": -6.361031532287598, "global_step": 92874, "epoch": 2211} {"train_loss": -6.160600185394287, "global_step": 92875, "epoch": 2211} {"train_loss": -6.293384552001953, "global_step": 92876, "epoch": 2211} {"train_loss": -6.238284111022949, "global_step": 92877, "epoch": 2211} {"train_loss": -6.3059234619140625, "global_step": 92878, "epoch": 2211} {"train_loss": -6.3900837898254395, "global_step": 92879, "epoch": 2211} {"train_loss": -6.325514316558838, "global_step": 92880, "epoch": 2211} {"train_loss": -6.197661876678467, "global_step": 92881, "epoch": 2211} {"train_loss": -6.331296443939209, "global_step": 92882, "epoch": 2211} {"train_loss": -6.3741607666015625, "global_step": 92883, "epoch": 2211} {"train_loss": -6.203981876373291, "global_step": 92884, "epoch": 2211} {"train_loss": -6.35175895690918, "global_step": 92885, "epoch": 2211} {"train_loss": -6.208683013916016, "global_step": 92886, "epoch": 2211} {"train_loss": -6.30075740814209, "global_step": 92887, "epoch": 2211} {"train_loss": -6.197132110595703, "global_step": 92888, "epoch": 2211} {"train_loss": -6.164563179016113, "global_step": 92889, "epoch": 2211} {"train_loss": -6.275520324707031, "global_step": 92890, "epoch": 2211} {"train_loss": -6.155641078948975, "global_step": 92891, "epoch": 2211} {"train_loss": -6.336928844451904, "global_step": 92892, "epoch": 2211} {"train_loss": -6.317069053649902, "global_step": 92893, "epoch": 2211} {"train_loss": -6.219672203063965, "global_step": 92894, "epoch": 2211} {"train_loss": -6.294827461242676, "global_step": 92895, "epoch": 2211} {"train_loss": -6.174373626708984, "global_step": 92896, "epoch": 2211} {"train_loss": -6.129713535308838, "global_step": 92897, "epoch": 2211} {"train_loss": -6.266053199768066, "global_step": 92898, "epoch": 2211} {"train_loss": -6.276060104370117, "global_step": 92899, "epoch": 2211} {"train_loss": -6.227505683898926, "global_step": 92900, "epoch": 2211} {"train_loss": -6.289240837097168, "global_step": 92901, "epoch": 2211} {"train_loss": -6.283712387084961, "global_step": 92902, "epoch": 2211} {"train_loss": -6.272523017156692, "global_step": 92903, "epoch": 2211, "val_loss": 75628.4375} {"train_loss": -6.231078624725342, "global_step": 92904, "epoch": 2212} {"train_loss": -6.245326042175293, "global_step": 92905, "epoch": 2212} {"train_loss": -6.308291435241699, "global_step": 92906, "epoch": 2212} {"train_loss": -6.303940773010254, "global_step": 92907, "epoch": 2212} {"train_loss": -6.40092658996582, "global_step": 92908, "epoch": 2212} {"train_loss": -6.314376354217529, "global_step": 92909, "epoch": 2212} {"train_loss": -6.249664306640625, "global_step": 92910, "epoch": 2212} {"train_loss": -6.196019172668457, "global_step": 92911, "epoch": 2212} {"train_loss": -6.31614875793457, "global_step": 92912, "epoch": 2212} {"train_loss": -6.248571872711182, "global_step": 92913, "epoch": 2212} {"train_loss": -6.227596759796143, "global_step": 92914, "epoch": 2212} {"train_loss": -6.215554714202881, "global_step": 92915, "epoch": 2212} {"train_loss": -6.247084617614746, "global_step": 92916, "epoch": 2212} {"train_loss": -6.40001106262207, "global_step": 92917, "epoch": 2212} {"train_loss": -6.338283538818359, "global_step": 92918, "epoch": 2212} {"train_loss": -6.163995742797852, "global_step": 92919, "epoch": 2212} {"train_loss": -6.311011791229248, "global_step": 92920, "epoch": 2212} {"train_loss": -6.331572532653809, "global_step": 92921, "epoch": 2212} {"train_loss": -6.287710666656494, "global_step": 92922, "epoch": 2212} {"train_loss": -6.326111316680908, "global_step": 92923, "epoch": 2212} {"train_loss": -6.177544116973877, "global_step": 92924, "epoch": 2212} {"train_loss": -6.321674346923828, "global_step": 92925, "epoch": 2212} {"train_loss": -6.180717945098877, "global_step": 92926, "epoch": 2212} {"train_loss": -6.287238121032715, "global_step": 92927, "epoch": 2212} {"train_loss": -6.298584938049316, "global_step": 92928, "epoch": 2212} {"train_loss": -6.234622955322266, "global_step": 92929, "epoch": 2212} {"train_loss": -6.148894309997559, "global_step": 92930, "epoch": 2212} {"train_loss": -6.40823221206665, "global_step": 92931, "epoch": 2212} {"train_loss": -6.330617427825928, "global_step": 92932, "epoch": 2212} {"train_loss": -6.341597557067871, "global_step": 92933, "epoch": 2212} {"train_loss": -6.281030178070068, "global_step": 92934, "epoch": 2212} {"train_loss": -6.234519004821777, "global_step": 92935, "epoch": 2212} {"train_loss": -6.393721580505371, "global_step": 92936, "epoch": 2212} {"train_loss": -6.331271171569824, "global_step": 92937, "epoch": 2212} {"train_loss": -6.183424949645996, "global_step": 92938, "epoch": 2212} {"train_loss": -6.119180679321289, "global_step": 92939, "epoch": 2212} {"train_loss": -6.304276943206787, "global_step": 92940, "epoch": 2212} {"train_loss": -6.160366058349609, "global_step": 92941, "epoch": 2212} {"train_loss": -6.13078498840332, "global_step": 92942, "epoch": 2212} {"train_loss": -6.371374130249023, "global_step": 92943, "epoch": 2212} {"train_loss": -6.165528297424316, "global_step": 92944, "epoch": 2212} {"train_loss": -6.271787212008522, "global_step": 92945, "epoch": 2212, "val_loss": 75288.234375} {"train_loss": -6.209661483764648, "global_step": 92946, "epoch": 2213} {"train_loss": -6.357850074768066, "global_step": 92947, "epoch": 2213} {"train_loss": -6.351563930511475, "global_step": 92948, "epoch": 2213} {"train_loss": -6.325159072875977, "global_step": 92949, "epoch": 2213} {"train_loss": -6.240515232086182, "global_step": 92950, "epoch": 2213} {"train_loss": -6.308614730834961, "global_step": 92951, "epoch": 2213} {"train_loss": -6.3129801750183105, "global_step": 92952, "epoch": 2213} {"train_loss": -6.205836296081543, "global_step": 92953, "epoch": 2213} {"train_loss": -6.391406059265137, "global_step": 92954, "epoch": 2213} {"train_loss": -6.291430473327637, "global_step": 92955, "epoch": 2213} {"train_loss": -6.390035152435303, "global_step": 92956, "epoch": 2213} {"train_loss": -6.315863609313965, "global_step": 92957, "epoch": 2213} {"train_loss": -6.192133903503418, "global_step": 92958, "epoch": 2213} {"train_loss": -6.338538646697998, "global_step": 92959, "epoch": 2213} {"train_loss": -6.405683517456055, "global_step": 92960, "epoch": 2213} {"train_loss": -6.308359146118164, "global_step": 92961, "epoch": 2213} {"train_loss": -6.18919563293457, "global_step": 92962, "epoch": 2213} {"train_loss": -6.238211631774902, "global_step": 92963, "epoch": 2213} {"train_loss": -6.365558624267578, "global_step": 92964, "epoch": 2213} {"train_loss": -6.201465606689453, "global_step": 92965, "epoch": 2213} {"train_loss": -6.280184745788574, "global_step": 92966, "epoch": 2213} {"train_loss": -6.257246971130371, "global_step": 92967, "epoch": 2213} {"train_loss": -6.042051792144775, "global_step": 92968, "epoch": 2213} {"train_loss": -6.371612548828125, "global_step": 92969, "epoch": 2213} {"train_loss": -6.22066593170166, "global_step": 92970, "epoch": 2213} {"train_loss": -6.145000457763672, "global_step": 92971, "epoch": 2213} {"train_loss": -6.261324405670166, "global_step": 92972, "epoch": 2213} {"train_loss": -6.3172101974487305, "global_step": 92973, "epoch": 2213} {"train_loss": -6.307503700256348, "global_step": 92974, "epoch": 2213} {"train_loss": -6.265630722045898, "global_step": 92975, "epoch": 2213} {"train_loss": -6.2603349685668945, "global_step": 92976, "epoch": 2213} {"train_loss": -6.267194747924805, "global_step": 92977, "epoch": 2213} {"train_loss": -6.2462310791015625, "global_step": 92978, "epoch": 2213} {"train_loss": -6.247138500213623, "global_step": 92979, "epoch": 2213} {"train_loss": -6.379703521728516, "global_step": 92980, "epoch": 2213} {"train_loss": -6.289648056030273, "global_step": 92981, "epoch": 2213} {"train_loss": -6.321078300476074, "global_step": 92982, "epoch": 2213} {"train_loss": -6.367201805114746, "global_step": 92983, "epoch": 2213} {"train_loss": -6.354523658752441, "global_step": 92984, "epoch": 2213} {"train_loss": -6.3306498527526855, "global_step": 92985, "epoch": 2213} {"train_loss": -6.329567909240723, "global_step": 92986, "epoch": 2213} {"train_loss": -6.285585414795649, "global_step": 92987, "epoch": 2213, "val_loss": 75470.328125} {"train_loss": -6.273108005523682, "global_step": 92988, "epoch": 2214} {"train_loss": -6.306506156921387, "global_step": 92989, "epoch": 2214} {"train_loss": -6.402329921722412, "global_step": 92990, "epoch": 2214} {"train_loss": -6.2641706466674805, "global_step": 92991, "epoch": 2214} {"train_loss": -6.323441982269287, "global_step": 92992, "epoch": 2214} {"train_loss": -6.213318824768066, "global_step": 92993, "epoch": 2214} {"train_loss": -6.151939392089844, "global_step": 92994, "epoch": 2214} {"train_loss": -6.327192783355713, "global_step": 92995, "epoch": 2214} {"train_loss": -6.2321014404296875, "global_step": 92996, "epoch": 2214} {"train_loss": -6.457586765289307, "global_step": 92997, "epoch": 2214} {"train_loss": -6.19338846206665, "global_step": 92998, "epoch": 2214} {"train_loss": -6.364284515380859, "global_step": 92999, "epoch": 2214} {"train_loss": -6.349194526672363, "global_step": 93000, "epoch": 2214} {"train_loss": -6.389081954956055, "global_step": 93001, "epoch": 2214} {"train_loss": -6.334029197692871, "global_step": 93002, "epoch": 2214} {"train_loss": -6.305524826049805, "global_step": 93003, "epoch": 2214} {"train_loss": -6.351565361022949, "global_step": 93004, "epoch": 2214} {"train_loss": -6.359314918518066, "global_step": 93005, "epoch": 2214} {"train_loss": -6.2542524337768555, "global_step": 93006, "epoch": 2214} {"train_loss": -6.28558349609375, "global_step": 93007, "epoch": 2214} {"train_loss": -6.1742706298828125, "global_step": 93008, "epoch": 2214} {"train_loss": -6.292252063751221, "global_step": 93009, "epoch": 2214} {"train_loss": -6.473155975341797, "global_step": 93010, "epoch": 2214} {"train_loss": -6.4522600173950195, "global_step": 93011, "epoch": 2214} {"train_loss": -6.337632179260254, "global_step": 93012, "epoch": 2214} {"train_loss": -6.330536842346191, "global_step": 93013, "epoch": 2214} {"train_loss": -6.300157070159912, "global_step": 93014, "epoch": 2214} {"train_loss": -6.219949722290039, "global_step": 93015, "epoch": 2214} {"train_loss": -6.243854522705078, "global_step": 93016, "epoch": 2214} {"train_loss": -6.222847938537598, "global_step": 93017, "epoch": 2214} {"train_loss": -6.241372585296631, "global_step": 93018, "epoch": 2214} {"train_loss": -6.121238708496094, "global_step": 93019, "epoch": 2214} {"train_loss": -6.364562034606934, "global_step": 93020, "epoch": 2214} {"train_loss": -6.234287261962891, "global_step": 93021, "epoch": 2214} {"train_loss": -6.186883926391602, "global_step": 93022, "epoch": 2214} {"train_loss": -6.35636568069458, "global_step": 93023, "epoch": 2214} {"train_loss": -6.3010969161987305, "global_step": 93024, "epoch": 2214} {"train_loss": -6.274445056915283, "global_step": 93025, "epoch": 2214} {"train_loss": -6.194986820220947, "global_step": 93026, "epoch": 2214} {"train_loss": -6.281255722045898, "global_step": 93027, "epoch": 2214} {"train_loss": -6.275444984436035, "global_step": 93028, "epoch": 2214} {"train_loss": -6.292564392089844, "global_step": 93029, "epoch": 2214, "val_loss": 75535.6015625} {"train_loss": -6.28737211227417, "global_step": 93030, "epoch": 2215} {"train_loss": -6.265024185180664, "global_step": 93031, "epoch": 2215} {"train_loss": -6.250399589538574, "global_step": 93032, "epoch": 2215} {"train_loss": -6.266077995300293, "global_step": 93033, "epoch": 2215} {"train_loss": -6.261788368225098, "global_step": 93034, "epoch": 2215} {"train_loss": -6.302657127380371, "global_step": 93035, "epoch": 2215} {"train_loss": -6.271038055419922, "global_step": 93036, "epoch": 2215} {"train_loss": -6.360557556152344, "global_step": 93037, "epoch": 2215} {"train_loss": -6.280788421630859, "global_step": 93038, "epoch": 2215} {"train_loss": -6.284026145935059, "global_step": 93039, "epoch": 2215} {"train_loss": -6.328643321990967, "global_step": 93040, "epoch": 2215} {"train_loss": -6.17012357711792, "global_step": 93041, "epoch": 2215} {"train_loss": -6.270771026611328, "global_step": 93042, "epoch": 2215} {"train_loss": -6.3155927658081055, "global_step": 93043, "epoch": 2215} {"train_loss": -6.146903038024902, "global_step": 93044, "epoch": 2215} {"train_loss": -6.368351936340332, "global_step": 93045, "epoch": 2215} {"train_loss": -6.308809757232666, "global_step": 93046, "epoch": 2215} {"train_loss": -6.273406982421875, "global_step": 93047, "epoch": 2215} {"train_loss": -6.22895622253418, "global_step": 93048, "epoch": 2215} {"train_loss": -6.2368574142456055, "global_step": 93049, "epoch": 2215} {"train_loss": -6.179623126983643, "global_step": 93050, "epoch": 2215} {"train_loss": -6.291489601135254, "global_step": 93051, "epoch": 2215} {"train_loss": -6.316915512084961, "global_step": 93052, "epoch": 2215} {"train_loss": -6.300770282745361, "global_step": 93053, "epoch": 2215} {"train_loss": -6.30139684677124, "global_step": 93054, "epoch": 2215} {"train_loss": -6.1919708251953125, "global_step": 93055, "epoch": 2215} {"train_loss": -6.43967342376709, "global_step": 93056, "epoch": 2215} {"train_loss": -6.309382438659668, "global_step": 93057, "epoch": 2215} {"train_loss": -6.241271018981934, "global_step": 93058, "epoch": 2215} {"train_loss": -6.338671684265137, "global_step": 93059, "epoch": 2215} {"train_loss": -6.314762592315674, "global_step": 93060, "epoch": 2215} {"train_loss": -6.267512798309326, "global_step": 93061, "epoch": 2215} {"train_loss": -6.225536823272705, "global_step": 93062, "epoch": 2215} {"train_loss": -6.410518646240234, "global_step": 93063, "epoch": 2215} {"train_loss": -6.2235870361328125, "global_step": 93064, "epoch": 2215} {"train_loss": -6.322127342224121, "global_step": 93065, "epoch": 2215} {"train_loss": -6.215390682220459, "global_step": 93066, "epoch": 2215} {"train_loss": -6.273647308349609, "global_step": 93067, "epoch": 2215} {"train_loss": -6.317435264587402, "global_step": 93068, "epoch": 2215} {"train_loss": -6.231337070465088, "global_step": 93069, "epoch": 2215} {"train_loss": -6.3388495445251465, "global_step": 93070, "epoch": 2215} {"train_loss": -6.284277938661122, "global_step": 93071, "epoch": 2215, "val_loss": 75670.703125} {"train_loss": -6.2878193855285645, "global_step": 93072, "epoch": 2216} {"train_loss": -6.421080112457275, "global_step": 93073, "epoch": 2216} {"train_loss": -6.425823211669922, "global_step": 93074, "epoch": 2216} {"train_loss": -6.338224411010742, "global_step": 93075, "epoch": 2216} {"train_loss": -6.312314033508301, "global_step": 93076, "epoch": 2216} {"train_loss": -6.254636764526367, "global_step": 93077, "epoch": 2216} {"train_loss": -6.196779251098633, "global_step": 93078, "epoch": 2216} {"train_loss": -6.211991310119629, "global_step": 93079, "epoch": 2216} {"train_loss": -6.3075408935546875, "global_step": 93080, "epoch": 2216} {"train_loss": -6.247726917266846, "global_step": 93081, "epoch": 2216} {"train_loss": -6.12386417388916, "global_step": 93082, "epoch": 2216} {"train_loss": -6.206364631652832, "global_step": 93083, "epoch": 2216} {"train_loss": -6.358279705047607, "global_step": 93084, "epoch": 2216} {"train_loss": -6.207557678222656, "global_step": 93085, "epoch": 2216} {"train_loss": -6.283945083618164, "global_step": 93086, "epoch": 2216} {"train_loss": -6.335708141326904, "global_step": 93087, "epoch": 2216} {"train_loss": -6.162413597106934, "global_step": 93088, "epoch": 2216} {"train_loss": -6.360803127288818, "global_step": 93089, "epoch": 2216} {"train_loss": -6.250720024108887, "global_step": 93090, "epoch": 2216} {"train_loss": -6.167154788970947, "global_step": 93091, "epoch": 2216} {"train_loss": -6.323065757751465, "global_step": 93092, "epoch": 2216} {"train_loss": -6.192200183868408, "global_step": 93093, "epoch": 2216} {"train_loss": -6.180545330047607, "global_step": 93094, "epoch": 2216} {"train_loss": -6.307562351226807, "global_step": 93095, "epoch": 2216} {"train_loss": -6.1331377029418945, "global_step": 93096, "epoch": 2216} {"train_loss": -6.162238121032715, "global_step": 93097, "epoch": 2216} {"train_loss": -6.411933898925781, "global_step": 93098, "epoch": 2216} {"train_loss": -6.268653392791748, "global_step": 93099, "epoch": 2216} {"train_loss": -6.451474189758301, "global_step": 93100, "epoch": 2216} {"train_loss": -6.146940231323242, "global_step": 93101, "epoch": 2216} {"train_loss": -6.175384044647217, "global_step": 93102, "epoch": 2216} {"train_loss": -6.19217586517334, "global_step": 93103, "epoch": 2216} {"train_loss": -6.235878944396973, "global_step": 93104, "epoch": 2216} {"train_loss": -6.236566543579102, "global_step": 93105, "epoch": 2216} {"train_loss": -6.345499038696289, "global_step": 93106, "epoch": 2216} {"train_loss": -6.18063497543335, "global_step": 93107, "epoch": 2216} {"train_loss": -6.253663539886475, "global_step": 93108, "epoch": 2216} {"train_loss": -6.303109645843506, "global_step": 93109, "epoch": 2216} {"train_loss": -6.401594161987305, "global_step": 93110, "epoch": 2216} {"train_loss": -6.3288750648498535, "global_step": 93111, "epoch": 2216} {"train_loss": -6.263618469238281, "global_step": 93112, "epoch": 2216} {"train_loss": -6.268668265569778, "global_step": 93113, "epoch": 2216, "val_loss": 75363.6015625} {"train_loss": -6.285826683044434, "global_step": 93114, "epoch": 2217} {"train_loss": -6.232870101928711, "global_step": 93115, "epoch": 2217} {"train_loss": -6.372145175933838, "global_step": 93116, "epoch": 2217} {"train_loss": -6.222805023193359, "global_step": 93117, "epoch": 2217} {"train_loss": -6.237311363220215, "global_step": 93118, "epoch": 2217} {"train_loss": -6.17672061920166, "global_step": 93119, "epoch": 2217} {"train_loss": -6.278661727905273, "global_step": 93120, "epoch": 2217} {"train_loss": -6.31174373626709, "global_step": 93121, "epoch": 2217} {"train_loss": -6.168530464172363, "global_step": 93122, "epoch": 2217} {"train_loss": -6.1619672775268555, "global_step": 93123, "epoch": 2217} {"train_loss": -6.345247268676758, "global_step": 93124, "epoch": 2217} {"train_loss": -6.212843894958496, "global_step": 93125, "epoch": 2217} {"train_loss": -6.278779029846191, "global_step": 93126, "epoch": 2217} {"train_loss": -6.296794891357422, "global_step": 93127, "epoch": 2217} {"train_loss": -6.262047290802002, "global_step": 93128, "epoch": 2217} {"train_loss": -6.297517776489258, "global_step": 93129, "epoch": 2217} {"train_loss": -6.274328708648682, "global_step": 93130, "epoch": 2217} {"train_loss": -6.270251274108887, "global_step": 93131, "epoch": 2217} {"train_loss": -6.3756103515625, "global_step": 93132, "epoch": 2217} {"train_loss": -6.308784008026123, "global_step": 93133, "epoch": 2217} {"train_loss": -6.281623840332031, "global_step": 93134, "epoch": 2217} {"train_loss": -6.208385467529297, "global_step": 93135, "epoch": 2217} {"train_loss": -6.329469680786133, "global_step": 93136, "epoch": 2217} {"train_loss": -6.197835922241211, "global_step": 93137, "epoch": 2217} {"train_loss": -6.30714225769043, "global_step": 93138, "epoch": 2217} {"train_loss": -6.278688907623291, "global_step": 93139, "epoch": 2217} {"train_loss": -6.337075710296631, "global_step": 93140, "epoch": 2217} {"train_loss": -6.340984344482422, "global_step": 93141, "epoch": 2217} {"train_loss": -6.318632125854492, "global_step": 93142, "epoch": 2217} {"train_loss": -6.365728378295898, "global_step": 93143, "epoch": 2217} {"train_loss": -6.286392688751221, "global_step": 93144, "epoch": 2217} {"train_loss": -6.311817646026611, "global_step": 93145, "epoch": 2217} {"train_loss": -6.208881378173828, "global_step": 93146, "epoch": 2217} {"train_loss": -6.263465881347656, "global_step": 93147, "epoch": 2217} {"train_loss": -6.20589017868042, "global_step": 93148, "epoch": 2217} {"train_loss": -6.374711990356445, "global_step": 93149, "epoch": 2217} {"train_loss": -6.254141807556152, "global_step": 93150, "epoch": 2217} {"train_loss": -6.304968357086182, "global_step": 93151, "epoch": 2217} {"train_loss": -6.279439926147461, "global_step": 93152, "epoch": 2217} {"train_loss": -6.293048858642578, "global_step": 93153, "epoch": 2217} {"train_loss": -6.181361198425293, "global_step": 93154, "epoch": 2217} {"train_loss": -6.276884044919695, "global_step": 93155, "epoch": 2217, "val_loss": 75557.578125} {"train_loss": -6.128925323486328, "global_step": 93156, "epoch": 2218} {"train_loss": -6.201262950897217, "global_step": 93157, "epoch": 2218} {"train_loss": -6.387209415435791, "global_step": 93158, "epoch": 2218} {"train_loss": -6.243058204650879, "global_step": 93159, "epoch": 2218} {"train_loss": -6.259681224822998, "global_step": 93160, "epoch": 2218} {"train_loss": -6.258358955383301, "global_step": 93161, "epoch": 2218} {"train_loss": -6.2171149253845215, "global_step": 93162, "epoch": 2218} {"train_loss": -6.243939399719238, "global_step": 93163, "epoch": 2218} {"train_loss": -6.2400054931640625, "global_step": 93164, "epoch": 2218} {"train_loss": -6.246396541595459, "global_step": 93165, "epoch": 2218} {"train_loss": -6.3949689865112305, "global_step": 93166, "epoch": 2218} {"train_loss": -6.458911418914795, "global_step": 93167, "epoch": 2218} {"train_loss": -6.288878917694092, "global_step": 93168, "epoch": 2218} {"train_loss": -6.319231033325195, "global_step": 93169, "epoch": 2218} {"train_loss": -6.405301094055176, "global_step": 93170, "epoch": 2218} {"train_loss": -6.188547134399414, "global_step": 93171, "epoch": 2218} {"train_loss": -6.4474639892578125, "global_step": 93172, "epoch": 2218} {"train_loss": -6.141382217407227, "global_step": 93173, "epoch": 2218} {"train_loss": -6.264218330383301, "global_step": 93174, "epoch": 2218} {"train_loss": -6.340297222137451, "global_step": 93175, "epoch": 2218} {"train_loss": -6.270498275756836, "global_step": 93176, "epoch": 2218} {"train_loss": -6.2884111404418945, "global_step": 93177, "epoch": 2218} {"train_loss": -6.326225757598877, "global_step": 93178, "epoch": 2218} {"train_loss": -6.314974308013916, "global_step": 93179, "epoch": 2218} {"train_loss": -6.365386009216309, "global_step": 93180, "epoch": 2218} {"train_loss": -6.288162708282471, "global_step": 93181, "epoch": 2218} {"train_loss": -6.256302833557129, "global_step": 93182, "epoch": 2218} {"train_loss": -6.284767150878906, "global_step": 93183, "epoch": 2218} {"train_loss": -6.107793807983398, "global_step": 93184, "epoch": 2218} {"train_loss": -6.205991744995117, "global_step": 93185, "epoch": 2218} {"train_loss": -6.207735061645508, "global_step": 93186, "epoch": 2218} {"train_loss": -6.197277069091797, "global_step": 93187, "epoch": 2218} {"train_loss": -6.220974922180176, "global_step": 93188, "epoch": 2218} {"train_loss": -6.166245937347412, "global_step": 93189, "epoch": 2218} {"train_loss": -6.3557000160217285, "global_step": 93190, "epoch": 2218} {"train_loss": -6.272260665893555, "global_step": 93191, "epoch": 2218} {"train_loss": -6.281771659851074, "global_step": 93192, "epoch": 2218} {"train_loss": -6.4145050048828125, "global_step": 93193, "epoch": 2218} {"train_loss": -6.274332046508789, "global_step": 93194, "epoch": 2218} {"train_loss": -6.134131908416748, "global_step": 93195, "epoch": 2218} {"train_loss": -6.275193691253662, "global_step": 93196, "epoch": 2218} {"train_loss": -6.272999740782238, "global_step": 93197, "epoch": 2218, "val_loss": 75633.9375} {"train_loss": -6.271109104156494, "global_step": 93198, "epoch": 2219} {"train_loss": -6.1711273193359375, "global_step": 93199, "epoch": 2219} {"train_loss": -6.240032196044922, "global_step": 93200, "epoch": 2219} {"train_loss": -6.3289384841918945, "global_step": 93201, "epoch": 2219} {"train_loss": -6.245935440063477, "global_step": 93202, "epoch": 2219} {"train_loss": -6.234967231750488, "global_step": 93203, "epoch": 2219} {"train_loss": -6.075758934020996, "global_step": 93204, "epoch": 2219} {"train_loss": -6.323117256164551, "global_step": 93205, "epoch": 2219} {"train_loss": -6.2208051681518555, "global_step": 93206, "epoch": 2219} {"train_loss": -6.30101203918457, "global_step": 93207, "epoch": 2219} {"train_loss": -6.31034517288208, "global_step": 93208, "epoch": 2219} {"train_loss": -6.193071365356445, "global_step": 93209, "epoch": 2219} {"train_loss": -6.28780460357666, "global_step": 93210, "epoch": 2219} {"train_loss": -6.145783424377441, "global_step": 93211, "epoch": 2219} {"train_loss": -6.212677955627441, "global_step": 93212, "epoch": 2219} {"train_loss": -6.205146789550781, "global_step": 93213, "epoch": 2219} {"train_loss": -6.156270980834961, "global_step": 93214, "epoch": 2219} {"train_loss": -6.039182662963867, "global_step": 93215, "epoch": 2219} {"train_loss": -6.211040019989014, "global_step": 93216, "epoch": 2219} {"train_loss": -6.1642165184021, "global_step": 93217, "epoch": 2219} {"train_loss": -6.134299278259277, "global_step": 93218, "epoch": 2219} {"train_loss": -6.203913688659668, "global_step": 93219, "epoch": 2219} {"train_loss": -6.2440900802612305, "global_step": 93220, "epoch": 2219} {"train_loss": -6.222792625427246, "global_step": 93221, "epoch": 2219} {"train_loss": -6.148797035217285, "global_step": 93222, "epoch": 2219} {"train_loss": -6.206268310546875, "global_step": 93223, "epoch": 2219} {"train_loss": -6.191146373748779, "global_step": 93224, "epoch": 2219} {"train_loss": -6.1847920417785645, "global_step": 93225, "epoch": 2219} {"train_loss": -6.313492774963379, "global_step": 93226, "epoch": 2219} {"train_loss": -6.179043769836426, "global_step": 93227, "epoch": 2219} {"train_loss": -6.170243263244629, "global_step": 93228, "epoch": 2219} {"train_loss": -6.236225605010986, "global_step": 93229, "epoch": 2219} {"train_loss": -6.2875189781188965, "global_step": 93230, "epoch": 2219} {"train_loss": -6.332858562469482, "global_step": 93231, "epoch": 2219} {"train_loss": -6.298425674438477, "global_step": 93232, "epoch": 2219} {"train_loss": -6.0877885818481445, "global_step": 93233, "epoch": 2219} {"train_loss": -6.2226972579956055, "global_step": 93234, "epoch": 2219} {"train_loss": -6.211644649505615, "global_step": 93235, "epoch": 2219} {"train_loss": -6.338467597961426, "global_step": 93236, "epoch": 2219} {"train_loss": -6.318763732910156, "global_step": 93237, "epoch": 2219} {"train_loss": -6.234137535095215, "global_step": 93238, "epoch": 2219} {"train_loss": -6.223558630262103, "global_step": 93239, "epoch": 2219, "val_loss": 75380.5625} {"train_loss": -6.251731872558594, "global_step": 93240, "epoch": 2220} {"train_loss": -6.308220863342285, "global_step": 93241, "epoch": 2220} {"train_loss": -6.378296375274658, "global_step": 93242, "epoch": 2220} {"train_loss": -6.328539848327637, "global_step": 93243, "epoch": 2220} {"train_loss": -6.282567977905273, "global_step": 93244, "epoch": 2220} {"train_loss": -6.364429950714111, "global_step": 93245, "epoch": 2220} {"train_loss": -6.296680450439453, "global_step": 93246, "epoch": 2220} {"train_loss": -6.3148345947265625, "global_step": 93247, "epoch": 2220} {"train_loss": -6.340415000915527, "global_step": 93248, "epoch": 2220} {"train_loss": -6.224908828735352, "global_step": 93249, "epoch": 2220} {"train_loss": -6.354361534118652, "global_step": 93250, "epoch": 2220} {"train_loss": -6.281881332397461, "global_step": 93251, "epoch": 2220} {"train_loss": -6.339297294616699, "global_step": 93252, "epoch": 2220} {"train_loss": -6.301572799682617, "global_step": 93253, "epoch": 2220} {"train_loss": -6.298947334289551, "global_step": 93254, "epoch": 2220} {"train_loss": -6.32985782623291, "global_step": 93255, "epoch": 2220} {"train_loss": -6.385025978088379, "global_step": 93256, "epoch": 2220} {"train_loss": -6.241637229919434, "global_step": 93257, "epoch": 2220} {"train_loss": -6.266760349273682, "global_step": 93258, "epoch": 2220} {"train_loss": -6.414344787597656, "global_step": 93259, "epoch": 2220} {"train_loss": -6.243898868560791, "global_step": 93260, "epoch": 2220} {"train_loss": -6.201742172241211, "global_step": 93261, "epoch": 2220} {"train_loss": -6.29135799407959, "global_step": 93262, "epoch": 2220} {"train_loss": -6.343866348266602, "global_step": 93263, "epoch": 2220} {"train_loss": -6.147793769836426, "global_step": 93264, "epoch": 2220} {"train_loss": -6.382549285888672, "global_step": 93265, "epoch": 2220} {"train_loss": -6.214658737182617, "global_step": 93266, "epoch": 2220} {"train_loss": -6.1442975997924805, "global_step": 93267, "epoch": 2220} {"train_loss": -6.219427585601807, "global_step": 93268, "epoch": 2220} {"train_loss": -6.186240196228027, "global_step": 93269, "epoch": 2220} {"train_loss": -6.25752067565918, "global_step": 93270, "epoch": 2220} {"train_loss": -6.351918697357178, "global_step": 93271, "epoch": 2220} {"train_loss": -6.218111991882324, "global_step": 93272, "epoch": 2220} {"train_loss": -6.20033073425293, "global_step": 93273, "epoch": 2220} {"train_loss": -6.277416706085205, "global_step": 93274, "epoch": 2220} {"train_loss": -6.232494831085205, "global_step": 93275, "epoch": 2220} {"train_loss": -6.297898292541504, "global_step": 93276, "epoch": 2220} {"train_loss": -6.2636213302612305, "global_step": 93277, "epoch": 2220} {"train_loss": -6.239960670471191, "global_step": 93278, "epoch": 2220} {"train_loss": -6.23801851272583, "global_step": 93279, "epoch": 2220} {"train_loss": -6.253307819366455, "global_step": 93280, "epoch": 2220} {"train_loss": -6.279780285699027, "global_step": 93281, "epoch": 2220, "val_loss": 75181.125} {"train_loss": -6.290806770324707, "global_step": 93282, "epoch": 2221} {"train_loss": -6.308448791503906, "global_step": 93283, "epoch": 2221} {"train_loss": -6.265476703643799, "global_step": 93284, "epoch": 2221} {"train_loss": -6.3720293045043945, "global_step": 93285, "epoch": 2221} {"train_loss": -6.351873397827148, "global_step": 93286, "epoch": 2221} {"train_loss": -6.368791103363037, "global_step": 93287, "epoch": 2221} {"train_loss": -6.2181854248046875, "global_step": 93288, "epoch": 2221} {"train_loss": -6.267730712890625, "global_step": 93289, "epoch": 2221} {"train_loss": -6.3399786949157715, "global_step": 93290, "epoch": 2221} {"train_loss": -6.305313587188721, "global_step": 93291, "epoch": 2221} {"train_loss": -6.308736801147461, "global_step": 93292, "epoch": 2221} {"train_loss": -6.176231384277344, "global_step": 93293, "epoch": 2221} {"train_loss": -6.2541375160217285, "global_step": 93294, "epoch": 2221} {"train_loss": -6.199433326721191, "global_step": 93295, "epoch": 2221} {"train_loss": -6.105250358581543, "global_step": 93296, "epoch": 2221} {"train_loss": -6.157840728759766, "global_step": 93297, "epoch": 2221} {"train_loss": -6.240358829498291, "global_step": 93298, "epoch": 2221} {"train_loss": -6.225002288818359, "global_step": 93299, "epoch": 2221} {"train_loss": -6.313264846801758, "global_step": 93300, "epoch": 2221} {"train_loss": -6.121611595153809, "global_step": 93301, "epoch": 2221} {"train_loss": -6.157741069793701, "global_step": 93302, "epoch": 2221} {"train_loss": -6.183230400085449, "global_step": 93303, "epoch": 2221} {"train_loss": -6.303797245025635, "global_step": 93304, "epoch": 2221} {"train_loss": -6.128541946411133, "global_step": 93305, "epoch": 2221} {"train_loss": -6.235161781311035, "global_step": 93306, "epoch": 2221} {"train_loss": -6.306026458740234, "global_step": 93307, "epoch": 2221} {"train_loss": -6.193314075469971, "global_step": 93308, "epoch": 2221} {"train_loss": -6.157661437988281, "global_step": 93309, "epoch": 2221} {"train_loss": -6.249431610107422, "global_step": 93310, "epoch": 2221} {"train_loss": -6.14910364151001, "global_step": 93311, "epoch": 2221} {"train_loss": -6.252620697021484, "global_step": 93312, "epoch": 2221} {"train_loss": -6.276149272918701, "global_step": 93313, "epoch": 2221} {"train_loss": -6.407998085021973, "global_step": 93314, "epoch": 2221} {"train_loss": -6.253583908081055, "global_step": 93315, "epoch": 2221} {"train_loss": -6.2149200439453125, "global_step": 93316, "epoch": 2221} {"train_loss": -6.2471160888671875, "global_step": 93317, "epoch": 2221} {"train_loss": -6.238142967224121, "global_step": 93318, "epoch": 2221} {"train_loss": -6.216840744018555, "global_step": 93319, "epoch": 2221} {"train_loss": -6.194344520568848, "global_step": 93320, "epoch": 2221} {"train_loss": -6.208824157714844, "global_step": 93321, "epoch": 2221} {"train_loss": -6.268715858459473, "global_step": 93322, "epoch": 2221} {"train_loss": -6.247546048391433, "global_step": 93323, "epoch": 2221, "val_loss": 75483.6640625} {"train_loss": -6.3454999923706055, "global_step": 93324, "epoch": 2222} {"train_loss": -6.272841453552246, "global_step": 93325, "epoch": 2222} {"train_loss": -6.258450508117676, "global_step": 93326, "epoch": 2222} {"train_loss": -6.293999671936035, "global_step": 93327, "epoch": 2222} {"train_loss": -6.308992862701416, "global_step": 93328, "epoch": 2222} {"train_loss": -6.235598564147949, "global_step": 93329, "epoch": 2222} {"train_loss": -6.26163387298584, "global_step": 93330, "epoch": 2222} {"train_loss": -6.176444053649902, "global_step": 93331, "epoch": 2222} {"train_loss": -6.220762252807617, "global_step": 93332, "epoch": 2222} {"train_loss": -6.347362518310547, "global_step": 93333, "epoch": 2222} {"train_loss": -6.115615367889404, "global_step": 93334, "epoch": 2222} {"train_loss": -6.349059104919434, "global_step": 93335, "epoch": 2222} {"train_loss": -6.211589813232422, "global_step": 93336, "epoch": 2222} {"train_loss": -6.303656101226807, "global_step": 93337, "epoch": 2222} {"train_loss": -6.181796073913574, "global_step": 93338, "epoch": 2222} {"train_loss": -6.246744155883789, "global_step": 93339, "epoch": 2222} {"train_loss": -6.207314491271973, "global_step": 93340, "epoch": 2222} {"train_loss": -6.155628204345703, "global_step": 93341, "epoch": 2222} {"train_loss": -6.359730243682861, "global_step": 93342, "epoch": 2222} {"train_loss": -6.359746932983398, "global_step": 93343, "epoch": 2222} {"train_loss": -6.32730770111084, "global_step": 93344, "epoch": 2222} {"train_loss": -6.273138046264648, "global_step": 93345, "epoch": 2222} {"train_loss": -6.326091289520264, "global_step": 93346, "epoch": 2222} {"train_loss": -6.329231262207031, "global_step": 93347, "epoch": 2222} {"train_loss": -6.229122638702393, "global_step": 93348, "epoch": 2222} {"train_loss": -6.295536994934082, "global_step": 93349, "epoch": 2222} {"train_loss": -6.291524887084961, "global_step": 93350, "epoch": 2222} {"train_loss": -6.142603874206543, "global_step": 93351, "epoch": 2222} {"train_loss": -6.254754066467285, "global_step": 93352, "epoch": 2222} {"train_loss": -6.3173699378967285, "global_step": 93353, "epoch": 2222} {"train_loss": -6.2814531326293945, "global_step": 93354, "epoch": 2222} {"train_loss": -6.184727668762207, "global_step": 93355, "epoch": 2222} {"train_loss": -6.249263763427734, "global_step": 93356, "epoch": 2222} {"train_loss": -6.237060070037842, "global_step": 93357, "epoch": 2222} {"train_loss": -6.394855499267578, "global_step": 93358, "epoch": 2222} {"train_loss": -6.25851583480835, "global_step": 93359, "epoch": 2222} {"train_loss": -6.319944858551025, "global_step": 93360, "epoch": 2222} {"train_loss": -6.3437323570251465, "global_step": 93361, "epoch": 2222} {"train_loss": -6.335341453552246, "global_step": 93362, "epoch": 2222} {"train_loss": -6.220130920410156, "global_step": 93363, "epoch": 2222} {"train_loss": -6.2677154541015625, "global_step": 93364, "epoch": 2222} {"train_loss": -6.2712367829822355, "global_step": 93365, "epoch": 2222, "val_loss": 75304.921875} {"train_loss": -6.31614351272583, "global_step": 93366, "epoch": 2223} {"train_loss": -6.3296942710876465, "global_step": 93367, "epoch": 2223} {"train_loss": -6.241311073303223, "global_step": 93368, "epoch": 2223} {"train_loss": -6.4309163093566895, "global_step": 93369, "epoch": 2223} {"train_loss": -6.243795394897461, "global_step": 93370, "epoch": 2223} {"train_loss": -6.40318489074707, "global_step": 93371, "epoch": 2223} {"train_loss": -6.257521629333496, "global_step": 93372, "epoch": 2223} {"train_loss": -6.276195526123047, "global_step": 93373, "epoch": 2223} {"train_loss": -6.298226833343506, "global_step": 93374, "epoch": 2223} {"train_loss": -6.1909685134887695, "global_step": 93375, "epoch": 2223} {"train_loss": -6.333795070648193, "global_step": 93376, "epoch": 2223} {"train_loss": -6.130727767944336, "global_step": 93377, "epoch": 2223} {"train_loss": -6.330869197845459, "global_step": 93378, "epoch": 2223} {"train_loss": -6.290973663330078, "global_step": 93379, "epoch": 2223} {"train_loss": -6.3352460861206055, "global_step": 93380, "epoch": 2223} {"train_loss": -6.302677154541016, "global_step": 93381, "epoch": 2223} {"train_loss": -6.31632137298584, "global_step": 93382, "epoch": 2223} {"train_loss": -6.298953533172607, "global_step": 93383, "epoch": 2223} {"train_loss": -6.334763050079346, "global_step": 93384, "epoch": 2223} {"train_loss": -6.401086807250977, "global_step": 93385, "epoch": 2223} {"train_loss": -6.276126861572266, "global_step": 93386, "epoch": 2223} {"train_loss": -6.348006725311279, "global_step": 93387, "epoch": 2223} {"train_loss": -6.205741882324219, "global_step": 93388, "epoch": 2223} {"train_loss": -6.3037109375, "global_step": 93389, "epoch": 2223} {"train_loss": -6.401638507843018, "global_step": 93390, "epoch": 2223} {"train_loss": -6.299452781677246, "global_step": 93391, "epoch": 2223} {"train_loss": -6.4132795333862305, "global_step": 93392, "epoch": 2223} {"train_loss": -6.421070575714111, "global_step": 93393, "epoch": 2223} {"train_loss": -6.351178169250488, "global_step": 93394, "epoch": 2223} {"train_loss": -6.429475784301758, "global_step": 93395, "epoch": 2223} {"train_loss": -6.292010307312012, "global_step": 93396, "epoch": 2223} {"train_loss": -6.297496795654297, "global_step": 93397, "epoch": 2223} {"train_loss": -6.351375579833984, "global_step": 93398, "epoch": 2223} {"train_loss": -6.2497735023498535, "global_step": 93399, "epoch": 2223} {"train_loss": -6.291790962219238, "global_step": 93400, "epoch": 2223} {"train_loss": -6.270200252532959, "global_step": 93401, "epoch": 2223} {"train_loss": -6.310821533203125, "global_step": 93402, "epoch": 2223} {"train_loss": -6.1988067626953125, "global_step": 93403, "epoch": 2223} {"train_loss": -6.314080238342285, "global_step": 93404, "epoch": 2223} {"train_loss": -6.225379943847656, "global_step": 93405, "epoch": 2223} {"train_loss": -6.307010650634766, "global_step": 93406, "epoch": 2223} {"train_loss": -6.303596167337327, "global_step": 93407, "epoch": 2223, "val_loss": 75649.859375} {"train_loss": -6.20297908782959, "global_step": 93408, "epoch": 2224} {"train_loss": -6.350898742675781, "global_step": 93409, "epoch": 2224} {"train_loss": -6.333313941955566, "global_step": 93410, "epoch": 2224} {"train_loss": -6.249524116516113, "global_step": 93411, "epoch": 2224} {"train_loss": -6.267344951629639, "global_step": 93412, "epoch": 2224} {"train_loss": -6.279354572296143, "global_step": 93413, "epoch": 2224} {"train_loss": -6.190925121307373, "global_step": 93414, "epoch": 2224} {"train_loss": -6.343132019042969, "global_step": 93415, "epoch": 2224} {"train_loss": -6.204998016357422, "global_step": 93416, "epoch": 2224} {"train_loss": -6.313532829284668, "global_step": 93417, "epoch": 2224} {"train_loss": -6.20839262008667, "global_step": 93418, "epoch": 2224} {"train_loss": -6.23043155670166, "global_step": 93419, "epoch": 2224} {"train_loss": -6.290575981140137, "global_step": 93420, "epoch": 2224} {"train_loss": -6.20464563369751, "global_step": 93421, "epoch": 2224} {"train_loss": -6.239775657653809, "global_step": 93422, "epoch": 2224} {"train_loss": -6.032721042633057, "global_step": 93423, "epoch": 2224} {"train_loss": -6.227206230163574, "global_step": 93424, "epoch": 2224} {"train_loss": -6.253158092498779, "global_step": 93425, "epoch": 2224} {"train_loss": -6.1707587242126465, "global_step": 93426, "epoch": 2224} {"train_loss": -6.213027000427246, "global_step": 93427, "epoch": 2224} {"train_loss": -6.239253520965576, "global_step": 93428, "epoch": 2224} {"train_loss": -6.24834680557251, "global_step": 93429, "epoch": 2224} {"train_loss": -6.175685882568359, "global_step": 93430, "epoch": 2224} {"train_loss": -6.264021873474121, "global_step": 93431, "epoch": 2224} {"train_loss": -6.251539707183838, "global_step": 93432, "epoch": 2224} {"train_loss": -6.217288017272949, "global_step": 93433, "epoch": 2224} {"train_loss": -6.195598125457764, "global_step": 93434, "epoch": 2224} {"train_loss": -6.271247863769531, "global_step": 93435, "epoch": 2224} {"train_loss": -6.304002285003662, "global_step": 93436, "epoch": 2224} {"train_loss": -6.1573357582092285, "global_step": 93437, "epoch": 2224} {"train_loss": -6.195284366607666, "global_step": 93438, "epoch": 2224} {"train_loss": -6.179919242858887, "global_step": 93439, "epoch": 2224} {"train_loss": -6.116127014160156, "global_step": 93440, "epoch": 2224} {"train_loss": -6.365413665771484, "global_step": 93441, "epoch": 2224} {"train_loss": -6.28202486038208, "global_step": 93442, "epoch": 2224} {"train_loss": -6.2418694496154785, "global_step": 93443, "epoch": 2224} {"train_loss": -6.30405330657959, "global_step": 93444, "epoch": 2224} {"train_loss": -6.33810567855835, "global_step": 93445, "epoch": 2224} {"train_loss": -6.255189895629883, "global_step": 93446, "epoch": 2224} {"train_loss": -6.208773612976074, "global_step": 93447, "epoch": 2224} {"train_loss": -6.259063720703125, "global_step": 93448, "epoch": 2224} {"train_loss": -6.2421672230675105, "global_step": 93449, "epoch": 2224, "val_loss": 75608.6484375} {"train_loss": -6.266016006469727, "global_step": 93450, "epoch": 2225} {"train_loss": -6.281398296356201, "global_step": 93451, "epoch": 2225} {"train_loss": -6.295466423034668, "global_step": 93452, "epoch": 2225} {"train_loss": -6.3019843101501465, "global_step": 93453, "epoch": 2225} {"train_loss": -6.3794379234313965, "global_step": 93454, "epoch": 2225} {"train_loss": -6.25297737121582, "global_step": 93455, "epoch": 2225} {"train_loss": -6.290482521057129, "global_step": 93456, "epoch": 2225} {"train_loss": -6.446933746337891, "global_step": 93457, "epoch": 2225} {"train_loss": -6.285015106201172, "global_step": 93458, "epoch": 2225} {"train_loss": -6.406765937805176, "global_step": 93459, "epoch": 2225} {"train_loss": -6.310834884643555, "global_step": 93460, "epoch": 2225} {"train_loss": -6.280082702636719, "global_step": 93461, "epoch": 2225} {"train_loss": -6.210434913635254, "global_step": 93462, "epoch": 2225} {"train_loss": -6.385466575622559, "global_step": 93463, "epoch": 2225} {"train_loss": -6.220529079437256, "global_step": 93464, "epoch": 2225} {"train_loss": -6.372282028198242, "global_step": 93465, "epoch": 2225} {"train_loss": -6.366850852966309, "global_step": 93466, "epoch": 2225} {"train_loss": -6.344045639038086, "global_step": 93467, "epoch": 2225} {"train_loss": -6.466081142425537, "global_step": 93468, "epoch": 2225} {"train_loss": -6.159134864807129, "global_step": 93469, "epoch": 2225} {"train_loss": -6.348423957824707, "global_step": 93470, "epoch": 2225} {"train_loss": -6.2981672286987305, "global_step": 93471, "epoch": 2225} {"train_loss": -6.243007183074951, "global_step": 93472, "epoch": 2225} {"train_loss": -6.124938011169434, "global_step": 93473, "epoch": 2225} {"train_loss": -6.26325798034668, "global_step": 93474, "epoch": 2225} {"train_loss": -6.391463279724121, "global_step": 93475, "epoch": 2225} {"train_loss": -6.326315879821777, "global_step": 93476, "epoch": 2225} {"train_loss": -6.247537136077881, "global_step": 93477, "epoch": 2225} {"train_loss": -6.204901695251465, "global_step": 93478, "epoch": 2225} {"train_loss": -6.279328346252441, "global_step": 93479, "epoch": 2225} {"train_loss": -6.286764621734619, "global_step": 93480, "epoch": 2225} {"train_loss": -6.330352783203125, "global_step": 93481, "epoch": 2225} {"train_loss": -6.3531174659729, "global_step": 93482, "epoch": 2225} {"train_loss": -6.253800392150879, "global_step": 93483, "epoch": 2225} {"train_loss": -6.391903400421143, "global_step": 93484, "epoch": 2225} {"train_loss": -6.3336687088012695, "global_step": 93485, "epoch": 2225} {"train_loss": -6.297191619873047, "global_step": 93486, "epoch": 2225} {"train_loss": -6.3720808029174805, "global_step": 93487, "epoch": 2225} {"train_loss": -6.29417085647583, "global_step": 93488, "epoch": 2225} {"train_loss": -6.293668270111084, "global_step": 93489, "epoch": 2225} {"train_loss": -6.311654090881348, "global_step": 93490, "epoch": 2225} {"train_loss": -6.307382504145305, "global_step": 93491, "epoch": 2225, "val_loss": 75267.3125} {"train_loss": -6.265303611755371, "global_step": 93492, "epoch": 2226} {"train_loss": -6.252463340759277, "global_step": 93493, "epoch": 2226} {"train_loss": -6.456739902496338, "global_step": 93494, "epoch": 2226} {"train_loss": -6.445852279663086, "global_step": 93495, "epoch": 2226} {"train_loss": -6.235393524169922, "global_step": 93496, "epoch": 2226} {"train_loss": -6.282827377319336, "global_step": 93497, "epoch": 2226} {"train_loss": -6.327766418457031, "global_step": 93498, "epoch": 2226} {"train_loss": -6.3594069480896, "global_step": 93499, "epoch": 2226} {"train_loss": -6.323619842529297, "global_step": 93500, "epoch": 2226} {"train_loss": -6.30003547668457, "global_step": 93501, "epoch": 2226} {"train_loss": -6.310749530792236, "global_step": 93502, "epoch": 2226} {"train_loss": -6.282800197601318, "global_step": 93503, "epoch": 2226} {"train_loss": -6.265560150146484, "global_step": 93504, "epoch": 2226} {"train_loss": -6.226792335510254, "global_step": 93505, "epoch": 2226} {"train_loss": -6.2528228759765625, "global_step": 93506, "epoch": 2226} {"train_loss": -6.1680989265441895, "global_step": 93507, "epoch": 2226} {"train_loss": -6.27921199798584, "global_step": 93508, "epoch": 2226} {"train_loss": -6.335740089416504, "global_step": 93509, "epoch": 2226} {"train_loss": -6.288707733154297, "global_step": 93510, "epoch": 2226} {"train_loss": -6.329906940460205, "global_step": 93511, "epoch": 2226} {"train_loss": -6.31451416015625, "global_step": 93512, "epoch": 2226} {"train_loss": -6.332151889801025, "global_step": 93513, "epoch": 2226} {"train_loss": -6.226465702056885, "global_step": 93514, "epoch": 2226} {"train_loss": -6.4166154861450195, "global_step": 93515, "epoch": 2226} {"train_loss": -6.243317127227783, "global_step": 93516, "epoch": 2226} {"train_loss": -6.128334045410156, "global_step": 93517, "epoch": 2226} {"train_loss": -6.351111888885498, "global_step": 93518, "epoch": 2226} {"train_loss": -6.387367248535156, "global_step": 93519, "epoch": 2226} {"train_loss": -6.262022018432617, "global_step": 93520, "epoch": 2226} {"train_loss": -6.189162254333496, "global_step": 93521, "epoch": 2226} {"train_loss": -6.2081990242004395, "global_step": 93522, "epoch": 2226} {"train_loss": -6.307502746582031, "global_step": 93523, "epoch": 2226} {"train_loss": -6.179237365722656, "global_step": 93524, "epoch": 2226} {"train_loss": -6.287631988525391, "global_step": 93525, "epoch": 2226} {"train_loss": -6.310242652893066, "global_step": 93526, "epoch": 2226} {"train_loss": -6.286970615386963, "global_step": 93527, "epoch": 2226} {"train_loss": -6.272355079650879, "global_step": 93528, "epoch": 2226} {"train_loss": -6.27668571472168, "global_step": 93529, "epoch": 2226} {"train_loss": -6.320253372192383, "global_step": 93530, "epoch": 2226} {"train_loss": -6.281441688537598, "global_step": 93531, "epoch": 2226} {"train_loss": -6.295363426208496, "global_step": 93532, "epoch": 2226} {"train_loss": -6.290689627329509, "global_step": 93533, "epoch": 2226, "val_loss": 75831.1640625} {"train_loss": -6.364171981811523, "global_step": 93534, "epoch": 2227} {"train_loss": -6.224637985229492, "global_step": 93535, "epoch": 2227} {"train_loss": -6.2107672691345215, "global_step": 93536, "epoch": 2227} {"train_loss": -6.157137870788574, "global_step": 93537, "epoch": 2227} {"train_loss": -6.211003303527832, "global_step": 93538, "epoch": 2227} {"train_loss": -6.221055030822754, "global_step": 93539, "epoch": 2227} {"train_loss": -6.343601703643799, "global_step": 93540, "epoch": 2227} {"train_loss": -6.2739458084106445, "global_step": 93541, "epoch": 2227} {"train_loss": -6.230191707611084, "global_step": 93542, "epoch": 2227} {"train_loss": -6.226336479187012, "global_step": 93543, "epoch": 2227} {"train_loss": -6.273926734924316, "global_step": 93544, "epoch": 2227} {"train_loss": -6.20242977142334, "global_step": 93545, "epoch": 2227} {"train_loss": -6.3272705078125, "global_step": 93546, "epoch": 2227} {"train_loss": -6.216660499572754, "global_step": 93547, "epoch": 2227} {"train_loss": -6.33373498916626, "global_step": 93548, "epoch": 2227} {"train_loss": -6.365788459777832, "global_step": 93549, "epoch": 2227} {"train_loss": -6.248448848724365, "global_step": 93550, "epoch": 2227} {"train_loss": -6.318284034729004, "global_step": 93551, "epoch": 2227} {"train_loss": -6.258561134338379, "global_step": 93552, "epoch": 2227} {"train_loss": -6.131033420562744, "global_step": 93553, "epoch": 2227} {"train_loss": -6.247748374938965, "global_step": 93554, "epoch": 2227} {"train_loss": -6.274021148681641, "global_step": 93555, "epoch": 2227} {"train_loss": -6.2883124351501465, "global_step": 93556, "epoch": 2227} {"train_loss": -6.244424819946289, "global_step": 93557, "epoch": 2227} {"train_loss": -6.2009077072143555, "global_step": 93558, "epoch": 2227} {"train_loss": -6.216472625732422, "global_step": 93559, "epoch": 2227} {"train_loss": -6.3041887283325195, "global_step": 93560, "epoch": 2227} {"train_loss": -6.2621049880981445, "global_step": 93561, "epoch": 2227} {"train_loss": -6.191225051879883, "global_step": 93562, "epoch": 2227} {"train_loss": -6.289163589477539, "global_step": 93563, "epoch": 2227} {"train_loss": -6.291902542114258, "global_step": 93564, "epoch": 2227} {"train_loss": -6.2671003341674805, "global_step": 93565, "epoch": 2227} {"train_loss": -6.257722854614258, "global_step": 93566, "epoch": 2227} {"train_loss": -6.31387996673584, "global_step": 93567, "epoch": 2227} {"train_loss": -6.334485054016113, "global_step": 93568, "epoch": 2227} {"train_loss": -6.325356483459473, "global_step": 93569, "epoch": 2227} {"train_loss": -6.325313568115234, "global_step": 93570, "epoch": 2227} {"train_loss": -6.284439563751221, "global_step": 93571, "epoch": 2227} {"train_loss": -6.354501247406006, "global_step": 93572, "epoch": 2227} {"train_loss": -6.208512306213379, "global_step": 93573, "epoch": 2227} {"train_loss": -6.1034626960754395, "global_step": 93574, "epoch": 2227} {"train_loss": -6.261181388582502, "global_step": 93575, "epoch": 2227, "val_loss": 75618.6171875} {"train_loss": -6.152371406555176, "global_step": 93576, "epoch": 2228} {"train_loss": -6.236203193664551, "global_step": 93577, "epoch": 2228} {"train_loss": -6.415170669555664, "global_step": 93578, "epoch": 2228} {"train_loss": -6.265957832336426, "global_step": 93579, "epoch": 2228} {"train_loss": -6.292982578277588, "global_step": 93580, "epoch": 2228} {"train_loss": -6.2592620849609375, "global_step": 93581, "epoch": 2228} {"train_loss": -6.187604904174805, "global_step": 93582, "epoch": 2228} {"train_loss": -6.194458961486816, "global_step": 93583, "epoch": 2228} {"train_loss": -6.107362270355225, "global_step": 93584, "epoch": 2228} {"train_loss": -6.172604084014893, "global_step": 93585, "epoch": 2228} {"train_loss": -6.27114200592041, "global_step": 93586, "epoch": 2228} {"train_loss": -6.193758010864258, "global_step": 93587, "epoch": 2228} {"train_loss": -6.303247451782227, "global_step": 93588, "epoch": 2228} {"train_loss": -6.165863037109375, "global_step": 93589, "epoch": 2228} {"train_loss": -6.27316951751709, "global_step": 93590, "epoch": 2228} {"train_loss": -6.378458023071289, "global_step": 93591, "epoch": 2228} {"train_loss": -6.205188751220703, "global_step": 93592, "epoch": 2228} {"train_loss": -6.260319232940674, "global_step": 93593, "epoch": 2228} {"train_loss": -6.370260238647461, "global_step": 93594, "epoch": 2228} {"train_loss": -6.223015785217285, "global_step": 93595, "epoch": 2228} {"train_loss": -6.005845069885254, "global_step": 93596, "epoch": 2228} {"train_loss": -6.244793891906738, "global_step": 93597, "epoch": 2228} {"train_loss": -6.3173747062683105, "global_step": 93598, "epoch": 2228} {"train_loss": -6.205322742462158, "global_step": 93599, "epoch": 2228} {"train_loss": -6.336477756500244, "global_step": 93600, "epoch": 2228} {"train_loss": -6.158219337463379, "global_step": 93601, "epoch": 2228} {"train_loss": -6.218481063842773, "global_step": 93602, "epoch": 2228} {"train_loss": -6.139667510986328, "global_step": 93603, "epoch": 2228} {"train_loss": -6.326663017272949, "global_step": 93604, "epoch": 2228} {"train_loss": -6.167436122894287, "global_step": 93605, "epoch": 2228} {"train_loss": -6.233184337615967, "global_step": 93606, "epoch": 2228} {"train_loss": -6.119811058044434, "global_step": 93607, "epoch": 2228} {"train_loss": -6.294846057891846, "global_step": 93608, "epoch": 2228} {"train_loss": -6.263186931610107, "global_step": 93609, "epoch": 2228} {"train_loss": -6.230939865112305, "global_step": 93610, "epoch": 2228} {"train_loss": -6.149228572845459, "global_step": 93611, "epoch": 2228} {"train_loss": -6.286312103271484, "global_step": 93612, "epoch": 2228} {"train_loss": -6.308066368103027, "global_step": 93613, "epoch": 2228} {"train_loss": -6.283895492553711, "global_step": 93614, "epoch": 2228} {"train_loss": -6.031289577484131, "global_step": 93615, "epoch": 2228} {"train_loss": -6.286225318908691, "global_step": 93616, "epoch": 2228} {"train_loss": -6.2355128810519265, "global_step": 93617, "epoch": 2228, "val_loss": 75393.0703125} {"train_loss": -6.271803379058838, "global_step": 93618, "epoch": 2229} {"train_loss": -6.362171173095703, "global_step": 93619, "epoch": 2229} {"train_loss": -6.381868362426758, "global_step": 93620, "epoch": 2229} {"train_loss": -6.225298881530762, "global_step": 93621, "epoch": 2229} {"train_loss": -6.315006256103516, "global_step": 93622, "epoch": 2229} {"train_loss": -6.324129581451416, "global_step": 93623, "epoch": 2229} {"train_loss": -6.305715560913086, "global_step": 93624, "epoch": 2229} {"train_loss": -6.281185626983643, "global_step": 93625, "epoch": 2229} {"train_loss": -6.403566837310791, "global_step": 93626, "epoch": 2229} {"train_loss": -6.146738529205322, "global_step": 93627, "epoch": 2229} {"train_loss": -6.41741418838501, "global_step": 93628, "epoch": 2229} {"train_loss": -6.408500671386719, "global_step": 93629, "epoch": 2229} {"train_loss": -6.334394454956055, "global_step": 93630, "epoch": 2229} {"train_loss": -6.297749042510986, "global_step": 93631, "epoch": 2229} {"train_loss": -6.354767322540283, "global_step": 93632, "epoch": 2229} {"train_loss": -6.353337287902832, "global_step": 93633, "epoch": 2229} {"train_loss": -6.344852447509766, "global_step": 93634, "epoch": 2229} {"train_loss": -6.33286190032959, "global_step": 93635, "epoch": 2229} {"train_loss": -6.346238136291504, "global_step": 93636, "epoch": 2229} {"train_loss": -6.281710624694824, "global_step": 93637, "epoch": 2229} {"train_loss": -6.182670593261719, "global_step": 93638, "epoch": 2229} {"train_loss": -6.346523284912109, "global_step": 93639, "epoch": 2229} {"train_loss": -6.163656711578369, "global_step": 93640, "epoch": 2229} {"train_loss": -6.191393852233887, "global_step": 93641, "epoch": 2229} {"train_loss": -6.322721481323242, "global_step": 93642, "epoch": 2229} {"train_loss": -6.306487083435059, "global_step": 93643, "epoch": 2229} {"train_loss": -6.306351661682129, "global_step": 93644, "epoch": 2229} {"train_loss": -6.301311492919922, "global_step": 93645, "epoch": 2229} {"train_loss": -6.224209785461426, "global_step": 93646, "epoch": 2229} {"train_loss": -6.328588008880615, "global_step": 93647, "epoch": 2229} {"train_loss": -6.329980373382568, "global_step": 93648, "epoch": 2229} {"train_loss": -6.284427642822266, "global_step": 93649, "epoch": 2229} {"train_loss": -6.280223846435547, "global_step": 93650, "epoch": 2229} {"train_loss": -6.339831829071045, "global_step": 93651, "epoch": 2229} {"train_loss": -6.175000190734863, "global_step": 93652, "epoch": 2229} {"train_loss": -6.287015914916992, "global_step": 93653, "epoch": 2229} {"train_loss": -6.33815336227417, "global_step": 93654, "epoch": 2229} {"train_loss": -6.29433536529541, "global_step": 93655, "epoch": 2229} {"train_loss": -6.226539134979248, "global_step": 93656, "epoch": 2229} {"train_loss": -6.327244758605957, "global_step": 93657, "epoch": 2229} {"train_loss": -6.213270664215088, "global_step": 93658, "epoch": 2229} {"train_loss": -6.300232807795207, "global_step": 93659, "epoch": 2229, "val_loss": 75457.2890625} {"train_loss": -6.323664665222168, "global_step": 93660, "epoch": 2230} {"train_loss": -6.227337837219238, "global_step": 93661, "epoch": 2230} {"train_loss": -6.463422775268555, "global_step": 93662, "epoch": 2230} {"train_loss": -6.340034484863281, "global_step": 93663, "epoch": 2230} {"train_loss": -6.35325288772583, "global_step": 93664, "epoch": 2230} {"train_loss": -6.318244457244873, "global_step": 93665, "epoch": 2230} {"train_loss": -6.323510646820068, "global_step": 93666, "epoch": 2230} {"train_loss": -6.281959533691406, "global_step": 93667, "epoch": 2230} {"train_loss": -6.335492134094238, "global_step": 93668, "epoch": 2230} {"train_loss": -6.3037109375, "global_step": 93669, "epoch": 2230} {"train_loss": -6.267965316772461, "global_step": 93670, "epoch": 2230} {"train_loss": -6.289779186248779, "global_step": 93671, "epoch": 2230} {"train_loss": -6.23317813873291, "global_step": 93672, "epoch": 2230} {"train_loss": -6.259152412414551, "global_step": 93673, "epoch": 2230} {"train_loss": -6.280879020690918, "global_step": 93674, "epoch": 2230} {"train_loss": -6.428626537322998, "global_step": 93675, "epoch": 2230} {"train_loss": -6.281518936157227, "global_step": 93676, "epoch": 2230} {"train_loss": -6.192084312438965, "global_step": 93677, "epoch": 2230} {"train_loss": -6.1736931800842285, "global_step": 93678, "epoch": 2230} {"train_loss": -6.168062210083008, "global_step": 93679, "epoch": 2230} {"train_loss": -6.309854507446289, "global_step": 93680, "epoch": 2230} {"train_loss": -6.229443550109863, "global_step": 93681, "epoch": 2230} {"train_loss": -6.25428581237793, "global_step": 93682, "epoch": 2230} {"train_loss": -6.223796844482422, "global_step": 93683, "epoch": 2230} {"train_loss": -6.356085777282715, "global_step": 93684, "epoch": 2230} {"train_loss": -6.29897928237915, "global_step": 93685, "epoch": 2230} {"train_loss": -6.141050338745117, "global_step": 93686, "epoch": 2230} {"train_loss": -6.316169738769531, "global_step": 93687, "epoch": 2230} {"train_loss": -6.245517253875732, "global_step": 93688, "epoch": 2230} {"train_loss": -6.2712578773498535, "global_step": 93689, "epoch": 2230} {"train_loss": -6.288472652435303, "global_step": 93690, "epoch": 2230} {"train_loss": -6.2599334716796875, "global_step": 93691, "epoch": 2230} {"train_loss": -6.189205169677734, "global_step": 93692, "epoch": 2230} {"train_loss": -6.248147010803223, "global_step": 93693, "epoch": 2230} {"train_loss": -6.255651950836182, "global_step": 93694, "epoch": 2230} {"train_loss": -6.2563629150390625, "global_step": 93695, "epoch": 2230} {"train_loss": -6.112575531005859, "global_step": 93696, "epoch": 2230} {"train_loss": -6.263749599456787, "global_step": 93697, "epoch": 2230} {"train_loss": -6.307582855224609, "global_step": 93698, "epoch": 2230} {"train_loss": -6.26677942276001, "global_step": 93699, "epoch": 2230} {"train_loss": -6.442142486572266, "global_step": 93700, "epoch": 2230} {"train_loss": -6.278355144319081, "global_step": 93701, "epoch": 2230, "val_loss": 75431.7421875} {"train_loss": -6.290999412536621, "global_step": 93702, "epoch": 2231} {"train_loss": -6.360881328582764, "global_step": 93703, "epoch": 2231} {"train_loss": -6.341062545776367, "global_step": 93704, "epoch": 2231} {"train_loss": -6.213134765625, "global_step": 93705, "epoch": 2231} {"train_loss": -6.402000904083252, "global_step": 93706, "epoch": 2231} {"train_loss": -6.321135520935059, "global_step": 93707, "epoch": 2231} {"train_loss": -6.429963111877441, "global_step": 93708, "epoch": 2231} {"train_loss": -6.325217247009277, "global_step": 93709, "epoch": 2231} {"train_loss": -6.334576606750488, "global_step": 93710, "epoch": 2231} {"train_loss": -6.377301216125488, "global_step": 93711, "epoch": 2231} {"train_loss": -6.287495136260986, "global_step": 93712, "epoch": 2231} {"train_loss": -6.317854881286621, "global_step": 93713, "epoch": 2231} {"train_loss": -6.414388656616211, "global_step": 93714, "epoch": 2231} {"train_loss": -6.400915145874023, "global_step": 93715, "epoch": 2231} {"train_loss": -6.210252285003662, "global_step": 93716, "epoch": 2231} {"train_loss": -6.302588939666748, "global_step": 93717, "epoch": 2231} {"train_loss": -6.117290496826172, "global_step": 93718, "epoch": 2231} {"train_loss": -6.248159408569336, "global_step": 93719, "epoch": 2231} {"train_loss": -6.285584926605225, "global_step": 93720, "epoch": 2231} {"train_loss": -6.189121246337891, "global_step": 93721, "epoch": 2231} {"train_loss": -6.380636692047119, "global_step": 93722, "epoch": 2231} {"train_loss": -6.328211784362793, "global_step": 93723, "epoch": 2231} {"train_loss": -6.301666736602783, "global_step": 93724, "epoch": 2231} {"train_loss": -6.133494853973389, "global_step": 93725, "epoch": 2231} {"train_loss": -6.169075012207031, "global_step": 93726, "epoch": 2231} {"train_loss": -6.203778266906738, "global_step": 93727, "epoch": 2231} {"train_loss": -6.142168998718262, "global_step": 93728, "epoch": 2231} {"train_loss": -6.231637001037598, "global_step": 93729, "epoch": 2231} {"train_loss": -6.2458295822143555, "global_step": 93730, "epoch": 2231} {"train_loss": -6.123664855957031, "global_step": 93731, "epoch": 2231} {"train_loss": -6.210427284240723, "global_step": 93732, "epoch": 2231} {"train_loss": -6.188385963439941, "global_step": 93733, "epoch": 2231} {"train_loss": -6.231506824493408, "global_step": 93734, "epoch": 2231} {"train_loss": -6.165692329406738, "global_step": 93735, "epoch": 2231} {"train_loss": -6.119239807128906, "global_step": 93736, "epoch": 2231} {"train_loss": -6.315543174743652, "global_step": 93737, "epoch": 2231} {"train_loss": -6.271886825561523, "global_step": 93738, "epoch": 2231} {"train_loss": -6.300595760345459, "global_step": 93739, "epoch": 2231} {"train_loss": -6.268516540527344, "global_step": 93740, "epoch": 2231} {"train_loss": -6.215137958526611, "global_step": 93741, "epoch": 2231} {"train_loss": -6.352361679077148, "global_step": 93742, "epoch": 2231} {"train_loss": -6.2675605955578035, "global_step": 93743, "epoch": 2231, "val_loss": 75228.46875} {"train_loss": -6.289844512939453, "global_step": 93744, "epoch": 2232} {"train_loss": -6.1736578941345215, "global_step": 93745, "epoch": 2232} {"train_loss": -6.109206199645996, "global_step": 93746, "epoch": 2232} {"train_loss": -6.2451863288879395, "global_step": 93747, "epoch": 2232} {"train_loss": -6.149735450744629, "global_step": 93748, "epoch": 2232} {"train_loss": -6.366469383239746, "global_step": 93749, "epoch": 2232} {"train_loss": -6.292300224304199, "global_step": 93750, "epoch": 2232} {"train_loss": -6.308977127075195, "global_step": 93751, "epoch": 2232} {"train_loss": -6.209931373596191, "global_step": 93752, "epoch": 2232} {"train_loss": -6.361256122589111, "global_step": 93753, "epoch": 2232} {"train_loss": -6.243628025054932, "global_step": 93754, "epoch": 2232} {"train_loss": -6.242630481719971, "global_step": 93755, "epoch": 2232} {"train_loss": -6.32643985748291, "global_step": 93756, "epoch": 2232} {"train_loss": -6.22235631942749, "global_step": 93757, "epoch": 2232} {"train_loss": -6.163264274597168, "global_step": 93758, "epoch": 2232} {"train_loss": -6.351751327514648, "global_step": 93759, "epoch": 2232} {"train_loss": -6.155307769775391, "global_step": 93760, "epoch": 2232} {"train_loss": -6.320356369018555, "global_step": 93761, "epoch": 2232} {"train_loss": -6.181879043579102, "global_step": 93762, "epoch": 2232} {"train_loss": -6.188087463378906, "global_step": 93763, "epoch": 2232} {"train_loss": -6.278478622436523, "global_step": 93764, "epoch": 2232} {"train_loss": -6.350241661071777, "global_step": 93765, "epoch": 2232} {"train_loss": -6.266092300415039, "global_step": 93766, "epoch": 2232} {"train_loss": -6.352784633636475, "global_step": 93767, "epoch": 2232} {"train_loss": -6.324479103088379, "global_step": 93768, "epoch": 2232} {"train_loss": -6.219623565673828, "global_step": 93769, "epoch": 2232} {"train_loss": -6.358002662658691, "global_step": 93770, "epoch": 2232} {"train_loss": -6.24241828918457, "global_step": 93771, "epoch": 2232} {"train_loss": -6.23732852935791, "global_step": 93772, "epoch": 2232} {"train_loss": -6.263063430786133, "global_step": 93773, "epoch": 2232} {"train_loss": -6.252536773681641, "global_step": 93774, "epoch": 2232} {"train_loss": -6.297048091888428, "global_step": 93775, "epoch": 2232} {"train_loss": -6.251894950866699, "global_step": 93776, "epoch": 2232} {"train_loss": -6.314227104187012, "global_step": 93777, "epoch": 2232} {"train_loss": -6.404546737670898, "global_step": 93778, "epoch": 2232} {"train_loss": -6.2126688957214355, "global_step": 93779, "epoch": 2232} {"train_loss": -6.375903129577637, "global_step": 93780, "epoch": 2232} {"train_loss": -6.337960243225098, "global_step": 93781, "epoch": 2232} {"train_loss": -6.214630126953125, "global_step": 93782, "epoch": 2232} {"train_loss": -6.257561683654785, "global_step": 93783, "epoch": 2232} {"train_loss": -6.154665946960449, "global_step": 93784, "epoch": 2232} {"train_loss": -6.267330987112863, "global_step": 93785, "epoch": 2232, "val_loss": 75655.390625} {"train_loss": -6.211220741271973, "global_step": 93786, "epoch": 2233} {"train_loss": -6.273836135864258, "global_step": 93787, "epoch": 2233} {"train_loss": -6.233700752258301, "global_step": 93788, "epoch": 2233} {"train_loss": -6.304433822631836, "global_step": 93789, "epoch": 2233} {"train_loss": -6.251626968383789, "global_step": 93790, "epoch": 2233} {"train_loss": -6.257791996002197, "global_step": 93791, "epoch": 2233} {"train_loss": -6.398015975952148, "global_step": 93792, "epoch": 2233} {"train_loss": -6.24396276473999, "global_step": 93793, "epoch": 2233} {"train_loss": -6.323966979980469, "global_step": 93794, "epoch": 2233} {"train_loss": -6.366360664367676, "global_step": 93795, "epoch": 2233} {"train_loss": -6.2660813331604, "global_step": 93796, "epoch": 2233} {"train_loss": -6.314383506774902, "global_step": 93797, "epoch": 2233} {"train_loss": -6.243587493896484, "global_step": 93798, "epoch": 2233} {"train_loss": -6.253365993499756, "global_step": 93799, "epoch": 2233} {"train_loss": -6.249671936035156, "global_step": 93800, "epoch": 2233} {"train_loss": -6.229989051818848, "global_step": 93801, "epoch": 2233} {"train_loss": -6.287664413452148, "global_step": 93802, "epoch": 2233} {"train_loss": -6.234035968780518, "global_step": 93803, "epoch": 2233} {"train_loss": -6.2229533195495605, "global_step": 93804, "epoch": 2233} {"train_loss": -6.315180778503418, "global_step": 93805, "epoch": 2233} {"train_loss": -6.221460819244385, "global_step": 93806, "epoch": 2233} {"train_loss": -6.204119682312012, "global_step": 93807, "epoch": 2233} {"train_loss": -6.344286918640137, "global_step": 93808, "epoch": 2233} {"train_loss": -6.160686016082764, "global_step": 93809, "epoch": 2233} {"train_loss": -6.208555698394775, "global_step": 93810, "epoch": 2233} {"train_loss": -6.276568412780762, "global_step": 93811, "epoch": 2233} {"train_loss": -6.178735733032227, "global_step": 93812, "epoch": 2233} {"train_loss": -6.346797466278076, "global_step": 93813, "epoch": 2233} {"train_loss": -6.234561920166016, "global_step": 93814, "epoch": 2233} {"train_loss": -6.321227073669434, "global_step": 93815, "epoch": 2233} {"train_loss": -6.254532814025879, "global_step": 93816, "epoch": 2233} {"train_loss": -6.264934539794922, "global_step": 93817, "epoch": 2233} {"train_loss": -6.257934093475342, "global_step": 93818, "epoch": 2233} {"train_loss": -6.265168190002441, "global_step": 93819, "epoch": 2233} {"train_loss": -6.313805103302002, "global_step": 93820, "epoch": 2233} {"train_loss": -6.386665344238281, "global_step": 93821, "epoch": 2233} {"train_loss": -6.315209865570068, "global_step": 93822, "epoch": 2233} {"train_loss": -6.297111988067627, "global_step": 93823, "epoch": 2233} {"train_loss": -6.294863700866699, "global_step": 93824, "epoch": 2233} {"train_loss": -6.246560096740723, "global_step": 93825, "epoch": 2233} {"train_loss": -6.34352970123291, "global_step": 93826, "epoch": 2233} {"train_loss": -6.277161087308611, "global_step": 93827, "epoch": 2233, "val_loss": 75515.1953125} {"train_loss": -6.196732521057129, "global_step": 93828, "epoch": 2234} {"train_loss": -6.335479736328125, "global_step": 93829, "epoch": 2234} {"train_loss": -6.252284049987793, "global_step": 93830, "epoch": 2234} {"train_loss": -6.3317341804504395, "global_step": 93831, "epoch": 2234} {"train_loss": -6.363586902618408, "global_step": 93832, "epoch": 2234} {"train_loss": -6.34348726272583, "global_step": 93833, "epoch": 2234} {"train_loss": -6.352879047393799, "global_step": 93834, "epoch": 2234} {"train_loss": -6.265096187591553, "global_step": 93835, "epoch": 2234} {"train_loss": -6.3116912841796875, "global_step": 93836, "epoch": 2234} {"train_loss": -6.305323123931885, "global_step": 93837, "epoch": 2234} {"train_loss": -6.354923725128174, "global_step": 93838, "epoch": 2234} {"train_loss": -6.170042991638184, "global_step": 93839, "epoch": 2234} {"train_loss": -6.288725852966309, "global_step": 93840, "epoch": 2234} {"train_loss": -6.347886562347412, "global_step": 93841, "epoch": 2234} {"train_loss": -6.221985816955566, "global_step": 93842, "epoch": 2234} {"train_loss": -6.379813194274902, "global_step": 93843, "epoch": 2234} {"train_loss": -6.29358434677124, "global_step": 93844, "epoch": 2234} {"train_loss": -6.295955181121826, "global_step": 93845, "epoch": 2234} {"train_loss": -6.3215227127075195, "global_step": 93846, "epoch": 2234} {"train_loss": -6.3331708908081055, "global_step": 93847, "epoch": 2234} {"train_loss": -6.248039245605469, "global_step": 93848, "epoch": 2234} {"train_loss": -6.332569122314453, "global_step": 93849, "epoch": 2234} {"train_loss": -6.367934226989746, "global_step": 93850, "epoch": 2234} {"train_loss": -6.383444786071777, "global_step": 93851, "epoch": 2234} {"train_loss": -6.28676700592041, "global_step": 93852, "epoch": 2234} {"train_loss": -6.368039131164551, "global_step": 93853, "epoch": 2234} {"train_loss": -6.3263397216796875, "global_step": 93854, "epoch": 2234} {"train_loss": -6.289646148681641, "global_step": 93855, "epoch": 2234} {"train_loss": -6.363269805908203, "global_step": 93856, "epoch": 2234} {"train_loss": -6.294849395751953, "global_step": 93857, "epoch": 2234} {"train_loss": -6.272150039672852, "global_step": 93858, "epoch": 2234} {"train_loss": -6.255773544311523, "global_step": 93859, "epoch": 2234} {"train_loss": -6.351813316345215, "global_step": 93860, "epoch": 2234} {"train_loss": -6.390683650970459, "global_step": 93861, "epoch": 2234} {"train_loss": -6.390020370483398, "global_step": 93862, "epoch": 2234} {"train_loss": -6.249940872192383, "global_step": 93863, "epoch": 2234} {"train_loss": -6.2432379722595215, "global_step": 93864, "epoch": 2234} {"train_loss": -6.254831314086914, "global_step": 93865, "epoch": 2234} {"train_loss": -6.274184703826904, "global_step": 93866, "epoch": 2234} {"train_loss": -6.371335029602051, "global_step": 93867, "epoch": 2234} {"train_loss": -6.24822473526001, "global_step": 93868, "epoch": 2234} {"train_loss": -6.307239248639061, "global_step": 93869, "epoch": 2234, "val_loss": 75316.5546875} {"train_loss": -6.395060062408447, "global_step": 93870, "epoch": 2235} {"train_loss": -6.388795375823975, "global_step": 93871, "epoch": 2235} {"train_loss": -6.268621444702148, "global_step": 93872, "epoch": 2235} {"train_loss": -6.324566841125488, "global_step": 93873, "epoch": 2235} {"train_loss": -6.243763446807861, "global_step": 93874, "epoch": 2235} {"train_loss": -6.409842014312744, "global_step": 93875, "epoch": 2235} {"train_loss": -6.144614219665527, "global_step": 93876, "epoch": 2235} {"train_loss": -6.2887187004089355, "global_step": 93877, "epoch": 2235} {"train_loss": -6.262241840362549, "global_step": 93878, "epoch": 2235} {"train_loss": -6.399731159210205, "global_step": 93879, "epoch": 2235} {"train_loss": -6.401670455932617, "global_step": 93880, "epoch": 2235} {"train_loss": -6.351755142211914, "global_step": 93881, "epoch": 2235} {"train_loss": -6.364889144897461, "global_step": 93882, "epoch": 2235} {"train_loss": -6.227541446685791, "global_step": 93883, "epoch": 2235} {"train_loss": -6.292621612548828, "global_step": 93884, "epoch": 2235} {"train_loss": -6.294182300567627, "global_step": 93885, "epoch": 2235} {"train_loss": -6.346392631530762, "global_step": 93886, "epoch": 2235} {"train_loss": -6.245749473571777, "global_step": 93887, "epoch": 2235} {"train_loss": -6.4486212730407715, "global_step": 93888, "epoch": 2235} {"train_loss": -6.242159366607666, "global_step": 93889, "epoch": 2235} {"train_loss": -6.253267288208008, "global_step": 93890, "epoch": 2235} {"train_loss": -6.358517646789551, "global_step": 93891, "epoch": 2235} {"train_loss": -6.261794090270996, "global_step": 93892, "epoch": 2235} {"train_loss": -6.127603530883789, "global_step": 93893, "epoch": 2235} {"train_loss": -6.2339348793029785, "global_step": 93894, "epoch": 2235} {"train_loss": -6.283417224884033, "global_step": 93895, "epoch": 2235} {"train_loss": -6.043417930603027, "global_step": 93896, "epoch": 2235} {"train_loss": -6.13642692565918, "global_step": 93897, "epoch": 2235} {"train_loss": -6.14832878112793, "global_step": 93898, "epoch": 2235} {"train_loss": -6.131352424621582, "global_step": 93899, "epoch": 2235} {"train_loss": -6.226868629455566, "global_step": 93900, "epoch": 2235} {"train_loss": -6.281897068023682, "global_step": 93901, "epoch": 2235} {"train_loss": -6.212754249572754, "global_step": 93902, "epoch": 2235} {"train_loss": -6.219328880310059, "global_step": 93903, "epoch": 2235} {"train_loss": -6.229302883148193, "global_step": 93904, "epoch": 2235} {"train_loss": -6.178259372711182, "global_step": 93905, "epoch": 2235} {"train_loss": -6.207368850708008, "global_step": 93906, "epoch": 2235} {"train_loss": -6.168259620666504, "global_step": 93907, "epoch": 2235} {"train_loss": -6.408201694488525, "global_step": 93908, "epoch": 2235} {"train_loss": -6.311652183532715, "global_step": 93909, "epoch": 2235} {"train_loss": -6.2064337730407715, "global_step": 93910, "epoch": 2235} {"train_loss": -6.2693327608562655, "global_step": 93911, "epoch": 2235, "val_loss": 75587.3046875} {"train_loss": -6.372738361358643, "global_step": 93912, "epoch": 2236} {"train_loss": -6.338366508483887, "global_step": 93913, "epoch": 2236} {"train_loss": -6.3097734451293945, "global_step": 93914, "epoch": 2236} {"train_loss": -6.2492289543151855, "global_step": 93915, "epoch": 2236} {"train_loss": -6.191216945648193, "global_step": 93916, "epoch": 2236} {"train_loss": -6.218176364898682, "global_step": 93917, "epoch": 2236} {"train_loss": -6.401595115661621, "global_step": 93918, "epoch": 2236} {"train_loss": -6.277184009552002, "global_step": 93919, "epoch": 2236} {"train_loss": -6.346261024475098, "global_step": 93920, "epoch": 2236} {"train_loss": -6.264090538024902, "global_step": 93921, "epoch": 2236} {"train_loss": -6.342413902282715, "global_step": 93922, "epoch": 2236} {"train_loss": -6.377189636230469, "global_step": 93923, "epoch": 2236} {"train_loss": -6.306483745574951, "global_step": 93924, "epoch": 2236} {"train_loss": -6.302490711212158, "global_step": 93925, "epoch": 2236} {"train_loss": -6.326753616333008, "global_step": 93926, "epoch": 2236} {"train_loss": -6.410642623901367, "global_step": 93927, "epoch": 2236} {"train_loss": -6.288093566894531, "global_step": 93928, "epoch": 2236} {"train_loss": -6.397107124328613, "global_step": 93929, "epoch": 2236} {"train_loss": -6.384949684143066, "global_step": 93930, "epoch": 2236} {"train_loss": -6.4629974365234375, "global_step": 93931, "epoch": 2236} {"train_loss": -6.28987979888916, "global_step": 93932, "epoch": 2236} {"train_loss": -6.183653831481934, "global_step": 93933, "epoch": 2236} {"train_loss": -6.302829742431641, "global_step": 93934, "epoch": 2236} {"train_loss": -6.3121209144592285, "global_step": 93935, "epoch": 2236} {"train_loss": -6.205053329467773, "global_step": 93936, "epoch": 2236} {"train_loss": -6.303049087524414, "global_step": 93937, "epoch": 2236} {"train_loss": -6.38338565826416, "global_step": 93938, "epoch": 2236} {"train_loss": -6.277665138244629, "global_step": 93939, "epoch": 2236} {"train_loss": -6.2118377685546875, "global_step": 93940, "epoch": 2236} {"train_loss": -6.216545104980469, "global_step": 93941, "epoch": 2236} {"train_loss": -6.247954368591309, "global_step": 93942, "epoch": 2236} {"train_loss": -6.18125581741333, "global_step": 93943, "epoch": 2236} {"train_loss": -6.203576564788818, "global_step": 93944, "epoch": 2236} {"train_loss": -6.187505722045898, "global_step": 93945, "epoch": 2236} {"train_loss": -6.276662826538086, "global_step": 93946, "epoch": 2236} {"train_loss": -6.3195648193359375, "global_step": 93947, "epoch": 2236} {"train_loss": -6.284788131713867, "global_step": 93948, "epoch": 2236} {"train_loss": -6.167008399963379, "global_step": 93949, "epoch": 2236} {"train_loss": -6.317012310028076, "global_step": 93950, "epoch": 2236} {"train_loss": -6.211589336395264, "global_step": 93951, "epoch": 2236} {"train_loss": -6.278822422027588, "global_step": 93952, "epoch": 2236} {"train_loss": -6.291280326389131, "global_step": 93953, "epoch": 2236, "val_loss": 75566.75} {"train_loss": -6.276150226593018, "global_step": 93954, "epoch": 2237} {"train_loss": -6.245694160461426, "global_step": 93955, "epoch": 2237} {"train_loss": -6.258512496948242, "global_step": 93956, "epoch": 2237} {"train_loss": -6.1993207931518555, "global_step": 93957, "epoch": 2237} {"train_loss": -6.400503158569336, "global_step": 93958, "epoch": 2237} {"train_loss": -6.3428144454956055, "global_step": 93959, "epoch": 2237} {"train_loss": -6.307194709777832, "global_step": 93960, "epoch": 2237} {"train_loss": -6.421112060546875, "global_step": 93961, "epoch": 2237} {"train_loss": -6.338028907775879, "global_step": 93962, "epoch": 2237} {"train_loss": -6.312177658081055, "global_step": 93963, "epoch": 2237} {"train_loss": -6.300081253051758, "global_step": 93964, "epoch": 2237} {"train_loss": -6.374687194824219, "global_step": 93965, "epoch": 2237} {"train_loss": -6.249762535095215, "global_step": 93966, "epoch": 2237} {"train_loss": -6.281584739685059, "global_step": 93967, "epoch": 2237} {"train_loss": -6.194120407104492, "global_step": 93968, "epoch": 2237} {"train_loss": -6.207121849060059, "global_step": 93969, "epoch": 2237} {"train_loss": -6.203845024108887, "global_step": 93970, "epoch": 2237} {"train_loss": -6.360373497009277, "global_step": 93971, "epoch": 2237} {"train_loss": -6.239534378051758, "global_step": 93972, "epoch": 2237} {"train_loss": -6.2617268562316895, "global_step": 93973, "epoch": 2237} {"train_loss": -6.232909202575684, "global_step": 93974, "epoch": 2237} {"train_loss": -6.143441200256348, "global_step": 93975, "epoch": 2237} {"train_loss": -6.311751365661621, "global_step": 93976, "epoch": 2237} {"train_loss": -6.2665815353393555, "global_step": 93977, "epoch": 2237} {"train_loss": -6.235054969787598, "global_step": 93978, "epoch": 2237} {"train_loss": -6.30674409866333, "global_step": 93979, "epoch": 2237} {"train_loss": -6.316141128540039, "global_step": 93980, "epoch": 2237} {"train_loss": -6.2854108810424805, "global_step": 93981, "epoch": 2237} {"train_loss": -6.191075325012207, "global_step": 93982, "epoch": 2237} {"train_loss": -6.330001354217529, "global_step": 93983, "epoch": 2237} {"train_loss": -6.250434398651123, "global_step": 93984, "epoch": 2237} {"train_loss": -6.246263027191162, "global_step": 93985, "epoch": 2237} {"train_loss": -6.2498273849487305, "global_step": 93986, "epoch": 2237} {"train_loss": -6.074973106384277, "global_step": 93987, "epoch": 2237} {"train_loss": -6.335942268371582, "global_step": 93988, "epoch": 2237} {"train_loss": -6.226311683654785, "global_step": 93989, "epoch": 2237} {"train_loss": -6.257664680480957, "global_step": 93990, "epoch": 2237} {"train_loss": -6.287208080291748, "global_step": 93991, "epoch": 2237} {"train_loss": -6.308656692504883, "global_step": 93992, "epoch": 2237} {"train_loss": -6.322858810424805, "global_step": 93993, "epoch": 2237} {"train_loss": -6.342572212219238, "global_step": 93994, "epoch": 2237} {"train_loss": -6.27509643917992, "global_step": 93995, "epoch": 2237, "val_loss": 75499.625} {"train_loss": -6.371129989624023, "global_step": 93996, "epoch": 2238} {"train_loss": -6.300367832183838, "global_step": 93997, "epoch": 2238} {"train_loss": -6.275003433227539, "global_step": 93998, "epoch": 2238} {"train_loss": -6.350526332855225, "global_step": 93999, "epoch": 2238} {"train_loss": -6.282818794250488, "global_step": 94000, "epoch": 2238} {"train_loss": -6.294332504272461, "global_step": 94001, "epoch": 2238} {"train_loss": -6.334860324859619, "global_step": 94002, "epoch": 2238} {"train_loss": -6.241397857666016, "global_step": 94003, "epoch": 2238} {"train_loss": -6.225305557250977, "global_step": 94004, "epoch": 2238} {"train_loss": -6.249079704284668, "global_step": 94005, "epoch": 2238} {"train_loss": -6.3226847648620605, "global_step": 94006, "epoch": 2238} {"train_loss": -6.389691352844238, "global_step": 94007, "epoch": 2238} {"train_loss": -6.322032928466797, "global_step": 94008, "epoch": 2238} {"train_loss": -6.3926310539245605, "global_step": 94009, "epoch": 2238} {"train_loss": -6.313672065734863, "global_step": 94010, "epoch": 2238} {"train_loss": -6.341787338256836, "global_step": 94011, "epoch": 2238} {"train_loss": -6.3160810470581055, "global_step": 94012, "epoch": 2238} {"train_loss": -6.213166236877441, "global_step": 94013, "epoch": 2238} {"train_loss": -6.226672172546387, "global_step": 94014, "epoch": 2238} {"train_loss": -6.3911004066467285, "global_step": 94015, "epoch": 2238} {"train_loss": -6.268524169921875, "global_step": 94016, "epoch": 2238} {"train_loss": -6.380231857299805, "global_step": 94017, "epoch": 2238} {"train_loss": -6.2111616134643555, "global_step": 94018, "epoch": 2238} {"train_loss": -6.343037128448486, "global_step": 94019, "epoch": 2238} {"train_loss": -6.397397994995117, "global_step": 94020, "epoch": 2238} {"train_loss": -6.294337272644043, "global_step": 94021, "epoch": 2238} {"train_loss": -6.370528221130371, "global_step": 94022, "epoch": 2238} {"train_loss": -6.2474846839904785, "global_step": 94023, "epoch": 2238} {"train_loss": -6.309825420379639, "global_step": 94024, "epoch": 2238} {"train_loss": -6.380629539489746, "global_step": 94025, "epoch": 2238} {"train_loss": -6.273336410522461, "global_step": 94026, "epoch": 2238} {"train_loss": -6.182901859283447, "global_step": 94027, "epoch": 2238} {"train_loss": -6.196090221405029, "global_step": 94028, "epoch": 2238} {"train_loss": -6.131431579589844, "global_step": 94029, "epoch": 2238} {"train_loss": -6.294528007507324, "global_step": 94030, "epoch": 2238} {"train_loss": -6.342215538024902, "global_step": 94031, "epoch": 2238} {"train_loss": -6.2195820808410645, "global_step": 94032, "epoch": 2238} {"train_loss": -6.2695698738098145, "global_step": 94033, "epoch": 2238} {"train_loss": -6.2054338455200195, "global_step": 94034, "epoch": 2238} {"train_loss": -6.263132095336914, "global_step": 94035, "epoch": 2238} {"train_loss": -6.1745524406433105, "global_step": 94036, "epoch": 2238} {"train_loss": -6.293405214945476, "global_step": 94037, "epoch": 2238, "val_loss": 75555.6875} {"train_loss": -6.180865287780762, "global_step": 94038, "epoch": 2239} {"train_loss": -6.198713779449463, "global_step": 94039, "epoch": 2239} {"train_loss": -6.182883262634277, "global_step": 94040, "epoch": 2239} {"train_loss": -6.343299865722656, "global_step": 94041, "epoch": 2239} {"train_loss": -6.26291561126709, "global_step": 94042, "epoch": 2239} {"train_loss": -6.3062944412231445, "global_step": 94043, "epoch": 2239} {"train_loss": -6.187644958496094, "global_step": 94044, "epoch": 2239} {"train_loss": -6.379250526428223, "global_step": 94045, "epoch": 2239} {"train_loss": -6.320322036743164, "global_step": 94046, "epoch": 2239} {"train_loss": -6.237307548522949, "global_step": 94047, "epoch": 2239} {"train_loss": -6.305131435394287, "global_step": 94048, "epoch": 2239} {"train_loss": -6.4373779296875, "global_step": 94049, "epoch": 2239} {"train_loss": -6.282393455505371, "global_step": 94050, "epoch": 2239} {"train_loss": -6.352978706359863, "global_step": 94051, "epoch": 2239} {"train_loss": -6.165743350982666, "global_step": 94052, "epoch": 2239} {"train_loss": -6.3362274169921875, "global_step": 94053, "epoch": 2239} {"train_loss": -6.246527671813965, "global_step": 94054, "epoch": 2239} {"train_loss": -6.222371578216553, "global_step": 94055, "epoch": 2239} {"train_loss": -6.364669322967529, "global_step": 94056, "epoch": 2239} {"train_loss": -6.3363037109375, "global_step": 94057, "epoch": 2239} {"train_loss": -6.289660453796387, "global_step": 94058, "epoch": 2239} {"train_loss": -6.340934753417969, "global_step": 94059, "epoch": 2239} {"train_loss": -6.294447898864746, "global_step": 94060, "epoch": 2239} {"train_loss": -6.2122802734375, "global_step": 94061, "epoch": 2239} {"train_loss": -6.289172172546387, "global_step": 94062, "epoch": 2239} {"train_loss": -6.359193801879883, "global_step": 94063, "epoch": 2239} {"train_loss": -6.234999656677246, "global_step": 94064, "epoch": 2239} {"train_loss": -6.1872053146362305, "global_step": 94065, "epoch": 2239} {"train_loss": -6.395484924316406, "global_step": 94066, "epoch": 2239} {"train_loss": -6.237595558166504, "global_step": 94067, "epoch": 2239} {"train_loss": -6.336065769195557, "global_step": 94068, "epoch": 2239} {"train_loss": -6.237492561340332, "global_step": 94069, "epoch": 2239} {"train_loss": -6.2713518142700195, "global_step": 94070, "epoch": 2239} {"train_loss": -6.4367170333862305, "global_step": 94071, "epoch": 2239} {"train_loss": -6.2542619705200195, "global_step": 94072, "epoch": 2239} {"train_loss": -6.210638046264648, "global_step": 94073, "epoch": 2239} {"train_loss": -6.265958309173584, "global_step": 94074, "epoch": 2239} {"train_loss": -6.183979034423828, "global_step": 94075, "epoch": 2239} {"train_loss": -6.398731708526611, "global_step": 94076, "epoch": 2239} {"train_loss": -6.2810845375061035, "global_step": 94077, "epoch": 2239} {"train_loss": -6.17111873626709, "global_step": 94078, "epoch": 2239} {"train_loss": -6.278596480687459, "global_step": 94079, "epoch": 2239, "val_loss": 75550.4140625} {"train_loss": -6.222659111022949, "global_step": 94080, "epoch": 2240} {"train_loss": -6.3660054206848145, "global_step": 94081, "epoch": 2240} {"train_loss": -6.275543212890625, "global_step": 94082, "epoch": 2240} {"train_loss": -6.145058631896973, "global_step": 94083, "epoch": 2240} {"train_loss": -6.26810359954834, "global_step": 94084, "epoch": 2240} {"train_loss": -6.290462970733643, "global_step": 94085, "epoch": 2240} {"train_loss": -6.283223628997803, "global_step": 94086, "epoch": 2240} {"train_loss": -6.287215232849121, "global_step": 94087, "epoch": 2240} {"train_loss": -6.215582370758057, "global_step": 94088, "epoch": 2240} {"train_loss": -6.194705963134766, "global_step": 94089, "epoch": 2240} {"train_loss": -6.295709609985352, "global_step": 94090, "epoch": 2240} {"train_loss": -6.229499816894531, "global_step": 94091, "epoch": 2240} {"train_loss": -6.327445030212402, "global_step": 94092, "epoch": 2240} {"train_loss": -6.25053596496582, "global_step": 94093, "epoch": 2240} {"train_loss": -6.280865669250488, "global_step": 94094, "epoch": 2240} {"train_loss": -6.292160511016846, "global_step": 94095, "epoch": 2240} {"train_loss": -6.220080852508545, "global_step": 94096, "epoch": 2240} {"train_loss": -6.333400726318359, "global_step": 94097, "epoch": 2240} {"train_loss": -6.272678375244141, "global_step": 94098, "epoch": 2240} {"train_loss": -6.3754353523254395, "global_step": 94099, "epoch": 2240} {"train_loss": -6.32875919342041, "global_step": 94100, "epoch": 2240} {"train_loss": -6.348804473876953, "global_step": 94101, "epoch": 2240} {"train_loss": -6.184754848480225, "global_step": 94102, "epoch": 2240} {"train_loss": -6.30246639251709, "global_step": 94103, "epoch": 2240} {"train_loss": -6.314252853393555, "global_step": 94104, "epoch": 2240} {"train_loss": -6.448347091674805, "global_step": 94105, "epoch": 2240} {"train_loss": -6.339087963104248, "global_step": 94106, "epoch": 2240} {"train_loss": -6.290383338928223, "global_step": 94107, "epoch": 2240} {"train_loss": -6.289619445800781, "global_step": 94108, "epoch": 2240} {"train_loss": -6.2244110107421875, "global_step": 94109, "epoch": 2240} {"train_loss": -6.289974212646484, "global_step": 94110, "epoch": 2240} {"train_loss": -6.169852256774902, "global_step": 94111, "epoch": 2240} {"train_loss": -6.254422187805176, "global_step": 94112, "epoch": 2240} {"train_loss": -6.325736045837402, "global_step": 94113, "epoch": 2240} {"train_loss": -6.184377670288086, "global_step": 94114, "epoch": 2240} {"train_loss": -6.2341203689575195, "global_step": 94115, "epoch": 2240} {"train_loss": -6.244260787963867, "global_step": 94116, "epoch": 2240} {"train_loss": -6.201932907104492, "global_step": 94117, "epoch": 2240} {"train_loss": -6.153080463409424, "global_step": 94118, "epoch": 2240} {"train_loss": -6.202030181884766, "global_step": 94119, "epoch": 2240} {"train_loss": -6.340076923370361, "global_step": 94120, "epoch": 2240} {"train_loss": -6.265462114697411, "global_step": 94121, "epoch": 2240, "val_loss": 75506.25} {"train_loss": -6.284582138061523, "global_step": 94122, "epoch": 2241} {"train_loss": -6.198088645935059, "global_step": 94123, "epoch": 2241} {"train_loss": -6.216174125671387, "global_step": 94124, "epoch": 2241} {"train_loss": -6.260068416595459, "global_step": 94125, "epoch": 2241} {"train_loss": -6.300548076629639, "global_step": 94126, "epoch": 2241} {"train_loss": -6.2008376121521, "global_step": 94127, "epoch": 2241} {"train_loss": -6.279890537261963, "global_step": 94128, "epoch": 2241} {"train_loss": -6.32783317565918, "global_step": 94129, "epoch": 2241} {"train_loss": -6.22458553314209, "global_step": 94130, "epoch": 2241} {"train_loss": -6.4307756423950195, "global_step": 94131, "epoch": 2241} {"train_loss": -6.374026298522949, "global_step": 94132, "epoch": 2241} {"train_loss": -6.355236053466797, "global_step": 94133, "epoch": 2241} {"train_loss": -6.244470119476318, "global_step": 94134, "epoch": 2241} {"train_loss": -6.206371307373047, "global_step": 94135, "epoch": 2241} {"train_loss": -6.283008575439453, "global_step": 94136, "epoch": 2241} {"train_loss": -6.3614912033081055, "global_step": 94137, "epoch": 2241} {"train_loss": -6.259815216064453, "global_step": 94138, "epoch": 2241} {"train_loss": -6.1264753341674805, "global_step": 94139, "epoch": 2241} {"train_loss": -6.177377700805664, "global_step": 94140, "epoch": 2241} {"train_loss": -6.303431510925293, "global_step": 94141, "epoch": 2241} {"train_loss": -6.34073543548584, "global_step": 94142, "epoch": 2241} {"train_loss": -6.296985626220703, "global_step": 94143, "epoch": 2241} {"train_loss": -6.194567680358887, "global_step": 94144, "epoch": 2241} {"train_loss": -6.2809295654296875, "global_step": 94145, "epoch": 2241} {"train_loss": -6.354794979095459, "global_step": 94146, "epoch": 2241} {"train_loss": -6.33737850189209, "global_step": 94147, "epoch": 2241} {"train_loss": -6.25542688369751, "global_step": 94148, "epoch": 2241} {"train_loss": -6.337102890014648, "global_step": 94149, "epoch": 2241} {"train_loss": -6.345450401306152, "global_step": 94150, "epoch": 2241} {"train_loss": -6.2489471435546875, "global_step": 94151, "epoch": 2241} {"train_loss": -6.317758560180664, "global_step": 94152, "epoch": 2241} {"train_loss": -6.36652135848999, "global_step": 94153, "epoch": 2241} {"train_loss": -6.329145908355713, "global_step": 94154, "epoch": 2241} {"train_loss": -6.362345218658447, "global_step": 94155, "epoch": 2241} {"train_loss": -6.348381042480469, "global_step": 94156, "epoch": 2241} {"train_loss": -6.275346755981445, "global_step": 94157, "epoch": 2241} {"train_loss": -6.332175254821777, "global_step": 94158, "epoch": 2241} {"train_loss": -6.307075500488281, "global_step": 94159, "epoch": 2241} {"train_loss": -6.324023246765137, "global_step": 94160, "epoch": 2241} {"train_loss": -6.315974712371826, "global_step": 94161, "epoch": 2241} {"train_loss": -6.228926658630371, "global_step": 94162, "epoch": 2241} {"train_loss": -6.290856168383644, "global_step": 94163, "epoch": 2241, "val_loss": 75756.125} {"train_loss": -6.361886024475098, "global_step": 94164, "epoch": 2242} {"train_loss": -6.26020622253418, "global_step": 94165, "epoch": 2242} {"train_loss": -6.359318256378174, "global_step": 94166, "epoch": 2242} {"train_loss": -6.225420951843262, "global_step": 94167, "epoch": 2242} {"train_loss": -6.258536338806152, "global_step": 94168, "epoch": 2242} {"train_loss": -6.187114238739014, "global_step": 94169, "epoch": 2242} {"train_loss": -6.1101484298706055, "global_step": 94170, "epoch": 2242} {"train_loss": -6.231344223022461, "global_step": 94171, "epoch": 2242} {"train_loss": -6.140650272369385, "global_step": 94172, "epoch": 2242} {"train_loss": -6.098670482635498, "global_step": 94173, "epoch": 2242} {"train_loss": -6.312830924987793, "global_step": 94174, "epoch": 2242} {"train_loss": -6.15447998046875, "global_step": 94175, "epoch": 2242} {"train_loss": -6.274458885192871, "global_step": 94176, "epoch": 2242} {"train_loss": -6.232608795166016, "global_step": 94177, "epoch": 2242} {"train_loss": -6.21107816696167, "global_step": 94178, "epoch": 2242} {"train_loss": -6.282487869262695, "global_step": 94179, "epoch": 2242} {"train_loss": -6.364166259765625, "global_step": 94180, "epoch": 2242} {"train_loss": -6.17799186706543, "global_step": 94181, "epoch": 2242} {"train_loss": -6.175729751586914, "global_step": 94182, "epoch": 2242} {"train_loss": -6.399251461029053, "global_step": 94183, "epoch": 2242} {"train_loss": -6.215662956237793, "global_step": 94184, "epoch": 2242} {"train_loss": -6.24342155456543, "global_step": 94185, "epoch": 2242} {"train_loss": -6.191657066345215, "global_step": 94186, "epoch": 2242} {"train_loss": -6.280175685882568, "global_step": 94187, "epoch": 2242} {"train_loss": -6.304139137268066, "global_step": 94188, "epoch": 2242} {"train_loss": -6.234011173248291, "global_step": 94189, "epoch": 2242} {"train_loss": -6.283215522766113, "global_step": 94190, "epoch": 2242} {"train_loss": -6.320995807647705, "global_step": 94191, "epoch": 2242} {"train_loss": -6.301648139953613, "global_step": 94192, "epoch": 2242} {"train_loss": -6.347437858581543, "global_step": 94193, "epoch": 2242} {"train_loss": -6.17181396484375, "global_step": 94194, "epoch": 2242} {"train_loss": -6.289825439453125, "global_step": 94195, "epoch": 2242} {"train_loss": -6.332821846008301, "global_step": 94196, "epoch": 2242} {"train_loss": -6.321802139282227, "global_step": 94197, "epoch": 2242} {"train_loss": -6.200376510620117, "global_step": 94198, "epoch": 2242} {"train_loss": -6.32372522354126, "global_step": 94199, "epoch": 2242} {"train_loss": -6.234594345092773, "global_step": 94200, "epoch": 2242} {"train_loss": -6.255384922027588, "global_step": 94201, "epoch": 2242} {"train_loss": -6.09991455078125, "global_step": 94202, "epoch": 2242} {"train_loss": -6.335077285766602, "global_step": 94203, "epoch": 2242} {"train_loss": -6.390171051025391, "global_step": 94204, "epoch": 2242} {"train_loss": -6.254873014631725, "global_step": 94205, "epoch": 2242, "val_loss": 75501.9453125} {"train_loss": -6.300023555755615, "global_step": 94206, "epoch": 2243} {"train_loss": -6.316166400909424, "global_step": 94207, "epoch": 2243} {"train_loss": -6.319202899932861, "global_step": 94208, "epoch": 2243} {"train_loss": -6.163824558258057, "global_step": 94209, "epoch": 2243} {"train_loss": -6.238740921020508, "global_step": 94210, "epoch": 2243} {"train_loss": -6.345481872558594, "global_step": 94211, "epoch": 2243} {"train_loss": -6.281881332397461, "global_step": 94212, "epoch": 2243} {"train_loss": -6.294528961181641, "global_step": 94213, "epoch": 2243} {"train_loss": -6.334599494934082, "global_step": 94214, "epoch": 2243} {"train_loss": -6.344261169433594, "global_step": 94215, "epoch": 2243} {"train_loss": -6.22209358215332, "global_step": 94216, "epoch": 2243} {"train_loss": -6.289926052093506, "global_step": 94217, "epoch": 2243} {"train_loss": -6.32157039642334, "global_step": 94218, "epoch": 2243} {"train_loss": -6.384008407592773, "global_step": 94219, "epoch": 2243} {"train_loss": -6.234441757202148, "global_step": 94220, "epoch": 2243} {"train_loss": -6.22084903717041, "global_step": 94221, "epoch": 2243} {"train_loss": -6.370983600616455, "global_step": 94222, "epoch": 2243} {"train_loss": -6.271636962890625, "global_step": 94223, "epoch": 2243} {"train_loss": -6.12961483001709, "global_step": 94224, "epoch": 2243} {"train_loss": -6.340409755706787, "global_step": 94225, "epoch": 2243} {"train_loss": -6.276810646057129, "global_step": 94226, "epoch": 2243} {"train_loss": -6.1311845779418945, "global_step": 94227, "epoch": 2243} {"train_loss": -6.303536415100098, "global_step": 94228, "epoch": 2243} {"train_loss": -6.232850551605225, "global_step": 94229, "epoch": 2243} {"train_loss": -6.276165962219238, "global_step": 94230, "epoch": 2243} {"train_loss": -6.346966743469238, "global_step": 94231, "epoch": 2243} {"train_loss": -6.105201721191406, "global_step": 94232, "epoch": 2243} {"train_loss": -6.318674087524414, "global_step": 94233, "epoch": 2243} {"train_loss": -6.390974998474121, "global_step": 94234, "epoch": 2243} {"train_loss": -6.20626163482666, "global_step": 94235, "epoch": 2243} {"train_loss": -6.262773513793945, "global_step": 94236, "epoch": 2243} {"train_loss": -6.24704647064209, "global_step": 94237, "epoch": 2243} {"train_loss": -6.284436225891113, "global_step": 94238, "epoch": 2243} {"train_loss": -6.1453752517700195, "global_step": 94239, "epoch": 2243} {"train_loss": -6.204837799072266, "global_step": 94240, "epoch": 2243} {"train_loss": -6.32858943939209, "global_step": 94241, "epoch": 2243} {"train_loss": -6.180327892303467, "global_step": 94242, "epoch": 2243} {"train_loss": -6.322042465209961, "global_step": 94243, "epoch": 2243} {"train_loss": -6.422943115234375, "global_step": 94244, "epoch": 2243} {"train_loss": -6.193856239318848, "global_step": 94245, "epoch": 2243} {"train_loss": -6.135527610778809, "global_step": 94246, "epoch": 2243} {"train_loss": -6.273258992603847, "global_step": 94247, "epoch": 2243, "val_loss": 75490.5859375} {"train_loss": -6.266584873199463, "global_step": 94248, "epoch": 2244} {"train_loss": -6.381747245788574, "global_step": 94249, "epoch": 2244} {"train_loss": -6.2506866455078125, "global_step": 94250, "epoch": 2244} {"train_loss": -6.418990612030029, "global_step": 94251, "epoch": 2244} {"train_loss": -6.169801712036133, "global_step": 94252, "epoch": 2244} {"train_loss": -6.202922821044922, "global_step": 94253, "epoch": 2244} {"train_loss": -6.260623931884766, "global_step": 94254, "epoch": 2244} {"train_loss": -6.13771390914917, "global_step": 94255, "epoch": 2244} {"train_loss": -6.237727165222168, "global_step": 94256, "epoch": 2244} {"train_loss": -6.033302307128906, "global_step": 94257, "epoch": 2244} {"train_loss": -6.208184719085693, "global_step": 94258, "epoch": 2244} {"train_loss": -6.362194061279297, "global_step": 94259, "epoch": 2244} {"train_loss": -6.258488178253174, "global_step": 94260, "epoch": 2244} {"train_loss": -6.234589576721191, "global_step": 94261, "epoch": 2244} {"train_loss": -6.234942436218262, "global_step": 94262, "epoch": 2244} {"train_loss": -6.17717170715332, "global_step": 94263, "epoch": 2244} {"train_loss": -6.133655548095703, "global_step": 94264, "epoch": 2244} {"train_loss": -6.317025184631348, "global_step": 94265, "epoch": 2244} {"train_loss": -6.227813720703125, "global_step": 94266, "epoch": 2244} {"train_loss": -6.0836663246154785, "global_step": 94267, "epoch": 2244} {"train_loss": -6.242015838623047, "global_step": 94268, "epoch": 2244} {"train_loss": -6.204440116882324, "global_step": 94269, "epoch": 2244} {"train_loss": -6.318299293518066, "global_step": 94270, "epoch": 2244} {"train_loss": -6.282553195953369, "global_step": 94271, "epoch": 2244} {"train_loss": -6.221160888671875, "global_step": 94272, "epoch": 2244} {"train_loss": -6.243011474609375, "global_step": 94273, "epoch": 2244} {"train_loss": -6.242420196533203, "global_step": 94274, "epoch": 2244} {"train_loss": -6.202485084533691, "global_step": 94275, "epoch": 2244} {"train_loss": -6.359487056732178, "global_step": 94276, "epoch": 2244} {"train_loss": -6.228766441345215, "global_step": 94277, "epoch": 2244} {"train_loss": -6.221323013305664, "global_step": 94278, "epoch": 2244} {"train_loss": -6.204625129699707, "global_step": 94279, "epoch": 2244} {"train_loss": -6.332008361816406, "global_step": 94280, "epoch": 2244} {"train_loss": -6.299388885498047, "global_step": 94281, "epoch": 2244} {"train_loss": -6.375530242919922, "global_step": 94282, "epoch": 2244} {"train_loss": -6.150786876678467, "global_step": 94283, "epoch": 2244} {"train_loss": -6.228328704833984, "global_step": 94284, "epoch": 2244} {"train_loss": -6.195127487182617, "global_step": 94285, "epoch": 2244} {"train_loss": -6.1847028732299805, "global_step": 94286, "epoch": 2244} {"train_loss": -6.178140163421631, "global_step": 94287, "epoch": 2244} {"train_loss": -6.282707214355469, "global_step": 94288, "epoch": 2244} {"train_loss": -6.238355761482602, "global_step": 94289, "epoch": 2244, "val_loss": 75266.21875} {"train_loss": -6.259546279907227, "global_step": 94290, "epoch": 2245} {"train_loss": -6.15898323059082, "global_step": 94291, "epoch": 2245} {"train_loss": -6.3129167556762695, "global_step": 94292, "epoch": 2245} {"train_loss": -6.3192830085754395, "global_step": 94293, "epoch": 2245} {"train_loss": -6.231354713439941, "global_step": 94294, "epoch": 2245} {"train_loss": -6.251528739929199, "global_step": 94295, "epoch": 2245} {"train_loss": -6.212841510772705, "global_step": 94296, "epoch": 2245} {"train_loss": -6.273001194000244, "global_step": 94297, "epoch": 2245} {"train_loss": -6.3116960525512695, "global_step": 94298, "epoch": 2245} {"train_loss": -6.298275947570801, "global_step": 94299, "epoch": 2245} {"train_loss": -6.106043815612793, "global_step": 94300, "epoch": 2245} {"train_loss": -6.168815612792969, "global_step": 94301, "epoch": 2245} {"train_loss": -6.308795928955078, "global_step": 94302, "epoch": 2245} {"train_loss": -6.335838317871094, "global_step": 94303, "epoch": 2245} {"train_loss": -6.290560245513916, "global_step": 94304, "epoch": 2245} {"train_loss": -6.230197906494141, "global_step": 94305, "epoch": 2245} {"train_loss": -6.3215742111206055, "global_step": 94306, "epoch": 2245} {"train_loss": -6.256478309631348, "global_step": 94307, "epoch": 2245} {"train_loss": -6.258648872375488, "global_step": 94308, "epoch": 2245} {"train_loss": -6.297677040100098, "global_step": 94309, "epoch": 2245} {"train_loss": -6.237936973571777, "global_step": 94310, "epoch": 2245} {"train_loss": -6.3827619552612305, "global_step": 94311, "epoch": 2245} {"train_loss": -6.380767822265625, "global_step": 94312, "epoch": 2245} {"train_loss": -6.340677738189697, "global_step": 94313, "epoch": 2245} {"train_loss": -6.339420795440674, "global_step": 94314, "epoch": 2245} {"train_loss": -6.308454990386963, "global_step": 94315, "epoch": 2245} {"train_loss": -6.240453243255615, "global_step": 94316, "epoch": 2245} {"train_loss": -6.396300315856934, "global_step": 94317, "epoch": 2245} {"train_loss": -6.254727363586426, "global_step": 94318, "epoch": 2245} {"train_loss": -6.234832286834717, "global_step": 94319, "epoch": 2245} {"train_loss": -6.36752462387085, "global_step": 94320, "epoch": 2245} {"train_loss": -6.291613578796387, "global_step": 94321, "epoch": 2245} {"train_loss": -6.259378433227539, "global_step": 94322, "epoch": 2245} {"train_loss": -6.405067443847656, "global_step": 94323, "epoch": 2245} {"train_loss": -6.429732799530029, "global_step": 94324, "epoch": 2245} {"train_loss": -6.330267906188965, "global_step": 94325, "epoch": 2245} {"train_loss": -6.341404914855957, "global_step": 94326, "epoch": 2245} {"train_loss": -6.360965728759766, "global_step": 94327, "epoch": 2245} {"train_loss": -6.356684684753418, "global_step": 94328, "epoch": 2245} {"train_loss": -6.273547649383545, "global_step": 94329, "epoch": 2245} {"train_loss": -6.274632453918457, "global_step": 94330, "epoch": 2245} {"train_loss": -6.294408627918789, "global_step": 94331, "epoch": 2245, "val_loss": 75147.9921875} {"train_loss": -6.351601600646973, "global_step": 94332, "epoch": 2246} {"train_loss": -6.425033092498779, "global_step": 94333, "epoch": 2246} {"train_loss": -6.277235507965088, "global_step": 94334, "epoch": 2246} {"train_loss": -6.257724285125732, "global_step": 94335, "epoch": 2246} {"train_loss": -6.356276035308838, "global_step": 94336, "epoch": 2246} {"train_loss": -6.255568504333496, "global_step": 94337, "epoch": 2246} {"train_loss": -6.482551574707031, "global_step": 94338, "epoch": 2246} {"train_loss": -6.301363945007324, "global_step": 94339, "epoch": 2246} {"train_loss": -6.275145530700684, "global_step": 94340, "epoch": 2246} {"train_loss": -6.258640289306641, "global_step": 94341, "epoch": 2246} {"train_loss": -6.3151960372924805, "global_step": 94342, "epoch": 2246} {"train_loss": -6.376402854919434, "global_step": 94343, "epoch": 2246} {"train_loss": -6.423316955566406, "global_step": 94344, "epoch": 2246} {"train_loss": -6.32028341293335, "global_step": 94345, "epoch": 2246} {"train_loss": -6.399200439453125, "global_step": 94346, "epoch": 2246} {"train_loss": -6.290290355682373, "global_step": 94347, "epoch": 2246} {"train_loss": -6.320009231567383, "global_step": 94348, "epoch": 2246} {"train_loss": -6.307513236999512, "global_step": 94349, "epoch": 2246} {"train_loss": -6.301061630249023, "global_step": 94350, "epoch": 2246} {"train_loss": -6.375682353973389, "global_step": 94351, "epoch": 2246} {"train_loss": -6.411021709442139, "global_step": 94352, "epoch": 2246} {"train_loss": -6.273758888244629, "global_step": 94353, "epoch": 2246} {"train_loss": -6.331510543823242, "global_step": 94354, "epoch": 2246} {"train_loss": -6.298744201660156, "global_step": 94355, "epoch": 2246} {"train_loss": -6.337406158447266, "global_step": 94356, "epoch": 2246} {"train_loss": -6.379400253295898, "global_step": 94357, "epoch": 2246} {"train_loss": -6.297807693481445, "global_step": 94358, "epoch": 2246} {"train_loss": -6.473581314086914, "global_step": 94359, "epoch": 2246} {"train_loss": -6.3086748123168945, "global_step": 94360, "epoch": 2246} {"train_loss": -6.266895294189453, "global_step": 94361, "epoch": 2246} {"train_loss": -6.363421440124512, "global_step": 94362, "epoch": 2246} {"train_loss": -6.340033054351807, "global_step": 94363, "epoch": 2246} {"train_loss": -6.348721504211426, "global_step": 94364, "epoch": 2246} {"train_loss": -6.231636047363281, "global_step": 94365, "epoch": 2246} {"train_loss": -6.304271221160889, "global_step": 94366, "epoch": 2246} {"train_loss": -6.359389305114746, "global_step": 94367, "epoch": 2246} {"train_loss": -6.172698497772217, "global_step": 94368, "epoch": 2246} {"train_loss": -6.440077781677246, "global_step": 94369, "epoch": 2246} {"train_loss": -6.326890468597412, "global_step": 94370, "epoch": 2246} {"train_loss": -6.279789924621582, "global_step": 94371, "epoch": 2246} {"train_loss": -6.312132835388184, "global_step": 94372, "epoch": 2246} {"train_loss": -6.326210544222877, "global_step": 94373, "epoch": 2246, "val_loss": 75431.984375} {"train_loss": -6.414251804351807, "global_step": 94374, "epoch": 2247} {"train_loss": -6.256153583526611, "global_step": 94375, "epoch": 2247} {"train_loss": -6.310781478881836, "global_step": 94376, "epoch": 2247} {"train_loss": -6.303015232086182, "global_step": 94377, "epoch": 2247} {"train_loss": -6.269940376281738, "global_step": 94378, "epoch": 2247} {"train_loss": -6.283916473388672, "global_step": 94379, "epoch": 2247} {"train_loss": -6.251228332519531, "global_step": 94380, "epoch": 2247} {"train_loss": -6.281330108642578, "global_step": 94381, "epoch": 2247} {"train_loss": -6.319037437438965, "global_step": 94382, "epoch": 2247} {"train_loss": -6.285912036895752, "global_step": 94383, "epoch": 2247} {"train_loss": -6.292370319366455, "global_step": 94384, "epoch": 2247} {"train_loss": -6.314424514770508, "global_step": 94385, "epoch": 2247} {"train_loss": -6.31948184967041, "global_step": 94386, "epoch": 2247} {"train_loss": -6.270119667053223, "global_step": 94387, "epoch": 2247} {"train_loss": -6.323408126831055, "global_step": 94388, "epoch": 2247} {"train_loss": -6.246833324432373, "global_step": 94389, "epoch": 2247} {"train_loss": -6.304270267486572, "global_step": 94390, "epoch": 2247} {"train_loss": -6.2925615310668945, "global_step": 94391, "epoch": 2247} {"train_loss": -6.231642723083496, "global_step": 94392, "epoch": 2247} {"train_loss": -6.351254463195801, "global_step": 94393, "epoch": 2247} {"train_loss": -6.40802001953125, "global_step": 94394, "epoch": 2247} {"train_loss": -6.407243728637695, "global_step": 94395, "epoch": 2247} {"train_loss": -6.286221981048584, "global_step": 94396, "epoch": 2247} {"train_loss": -6.309689521789551, "global_step": 94397, "epoch": 2247} {"train_loss": -6.351324081420898, "global_step": 94398, "epoch": 2247} {"train_loss": -6.31564474105835, "global_step": 94399, "epoch": 2247} {"train_loss": -6.317943572998047, "global_step": 94400, "epoch": 2247} {"train_loss": -6.330939292907715, "global_step": 94401, "epoch": 2247} {"train_loss": -6.258833408355713, "global_step": 94402, "epoch": 2247} {"train_loss": -6.211127281188965, "global_step": 94403, "epoch": 2247} {"train_loss": -6.263642311096191, "global_step": 94404, "epoch": 2247} {"train_loss": -6.407567977905273, "global_step": 94405, "epoch": 2247} {"train_loss": -6.39669942855835, "global_step": 94406, "epoch": 2247} {"train_loss": -6.273535251617432, "global_step": 94407, "epoch": 2247} {"train_loss": -6.258257865905762, "global_step": 94408, "epoch": 2247} {"train_loss": -6.372396469116211, "global_step": 94409, "epoch": 2247} {"train_loss": -6.2524003982543945, "global_step": 94410, "epoch": 2247} {"train_loss": -6.290443420410156, "global_step": 94411, "epoch": 2247} {"train_loss": -6.37314510345459, "global_step": 94412, "epoch": 2247} {"train_loss": -6.216118335723877, "global_step": 94413, "epoch": 2247} {"train_loss": -6.274803161621094, "global_step": 94414, "epoch": 2247} {"train_loss": -6.302385262080601, "global_step": 94415, "epoch": 2247, "val_loss": 75805.921875} {"train_loss": -6.313234329223633, "global_step": 94416, "epoch": 2248} {"train_loss": -6.284584045410156, "global_step": 94417, "epoch": 2248} {"train_loss": -6.187868118286133, "global_step": 94418, "epoch": 2248} {"train_loss": -6.25540828704834, "global_step": 94419, "epoch": 2248} {"train_loss": -6.241120338439941, "global_step": 94420, "epoch": 2248} {"train_loss": -6.205771446228027, "global_step": 94421, "epoch": 2248} {"train_loss": -6.2801618576049805, "global_step": 94422, "epoch": 2248} {"train_loss": -6.180347442626953, "global_step": 94423, "epoch": 2248} {"train_loss": -6.385507583618164, "global_step": 94424, "epoch": 2248} {"train_loss": -6.356182098388672, "global_step": 94425, "epoch": 2248} {"train_loss": -6.341845512390137, "global_step": 94426, "epoch": 2248} {"train_loss": -6.3329033851623535, "global_step": 94427, "epoch": 2248} {"train_loss": -6.136455535888672, "global_step": 94428, "epoch": 2248} {"train_loss": -6.36004638671875, "global_step": 94429, "epoch": 2248} {"train_loss": -6.308642864227295, "global_step": 94430, "epoch": 2248} {"train_loss": -6.337035179138184, "global_step": 94431, "epoch": 2248} {"train_loss": -6.336635589599609, "global_step": 94432, "epoch": 2248} {"train_loss": -6.44444465637207, "global_step": 94433, "epoch": 2248} {"train_loss": -6.37992000579834, "global_step": 94434, "epoch": 2248} {"train_loss": -6.39437198638916, "global_step": 94435, "epoch": 2248} {"train_loss": -6.326072692871094, "global_step": 94436, "epoch": 2248} {"train_loss": -6.260950565338135, "global_step": 94437, "epoch": 2248} {"train_loss": -6.412154674530029, "global_step": 94438, "epoch": 2248} {"train_loss": -6.349580764770508, "global_step": 94439, "epoch": 2248} {"train_loss": -6.275759696960449, "global_step": 94440, "epoch": 2248} {"train_loss": -6.290493011474609, "global_step": 94441, "epoch": 2248} {"train_loss": -6.277530670166016, "global_step": 94442, "epoch": 2248} {"train_loss": -6.382264614105225, "global_step": 94443, "epoch": 2248} {"train_loss": -6.390517234802246, "global_step": 94444, "epoch": 2248} {"train_loss": -6.465723037719727, "global_step": 94445, "epoch": 2248} {"train_loss": -6.280327796936035, "global_step": 94446, "epoch": 2248} {"train_loss": -6.398981094360352, "global_step": 94447, "epoch": 2248} {"train_loss": -6.253705978393555, "global_step": 94448, "epoch": 2248} {"train_loss": -6.290241718292236, "global_step": 94449, "epoch": 2248} {"train_loss": -6.3698320388793945, "global_step": 94450, "epoch": 2248} {"train_loss": -6.320440769195557, "global_step": 94451, "epoch": 2248} {"train_loss": -6.3270039558410645, "global_step": 94452, "epoch": 2248} {"train_loss": -6.256890296936035, "global_step": 94453, "epoch": 2248} {"train_loss": -6.325842380523682, "global_step": 94454, "epoch": 2248} {"train_loss": -6.28809928894043, "global_step": 94455, "epoch": 2248} {"train_loss": -6.287440299987793, "global_step": 94456, "epoch": 2248} {"train_loss": -6.313506977898734, "global_step": 94457, "epoch": 2248, "val_loss": 75580.6953125} {"train_loss": -6.363661766052246, "global_step": 94458, "epoch": 2249} {"train_loss": -6.337677001953125, "global_step": 94459, "epoch": 2249} {"train_loss": -6.346061706542969, "global_step": 94460, "epoch": 2249} {"train_loss": -6.311648845672607, "global_step": 94461, "epoch": 2249} {"train_loss": -6.298742294311523, "global_step": 94462, "epoch": 2249} {"train_loss": -6.351964473724365, "global_step": 94463, "epoch": 2249} {"train_loss": -6.3930816650390625, "global_step": 94464, "epoch": 2249} {"train_loss": -6.387957572937012, "global_step": 94465, "epoch": 2249} {"train_loss": -6.280766010284424, "global_step": 94466, "epoch": 2249} {"train_loss": -6.316059112548828, "global_step": 94467, "epoch": 2249} {"train_loss": -6.39089822769165, "global_step": 94468, "epoch": 2249} {"train_loss": -6.33701753616333, "global_step": 94469, "epoch": 2249} {"train_loss": -6.285736083984375, "global_step": 94470, "epoch": 2249} {"train_loss": -6.266044616699219, "global_step": 94471, "epoch": 2249} {"train_loss": -6.427883148193359, "global_step": 94472, "epoch": 2249} {"train_loss": -6.347517013549805, "global_step": 94473, "epoch": 2249} {"train_loss": -6.276392936706543, "global_step": 94474, "epoch": 2249} {"train_loss": -6.285618782043457, "global_step": 94475, "epoch": 2249} {"train_loss": -6.336319446563721, "global_step": 94476, "epoch": 2249} {"train_loss": -6.172428607940674, "global_step": 94477, "epoch": 2249} {"train_loss": -6.286334991455078, "global_step": 94478, "epoch": 2249} {"train_loss": -6.255826473236084, "global_step": 94479, "epoch": 2249} {"train_loss": -6.24909782409668, "global_step": 94480, "epoch": 2249} {"train_loss": -6.40806770324707, "global_step": 94481, "epoch": 2249} {"train_loss": -6.277743339538574, "global_step": 94482, "epoch": 2249} {"train_loss": -6.297198295593262, "global_step": 94483, "epoch": 2249} {"train_loss": -6.249725341796875, "global_step": 94484, "epoch": 2249} {"train_loss": -6.3608784675598145, "global_step": 94485, "epoch": 2249} {"train_loss": -6.36373233795166, "global_step": 94486, "epoch": 2249} {"train_loss": -6.34434700012207, "global_step": 94487, "epoch": 2249} {"train_loss": -6.284053802490234, "global_step": 94488, "epoch": 2249} {"train_loss": -6.388861656188965, "global_step": 94489, "epoch": 2249} {"train_loss": -6.420255661010742, "global_step": 94490, "epoch": 2249} {"train_loss": -6.201806545257568, "global_step": 94491, "epoch": 2249} {"train_loss": -6.344675064086914, "global_step": 94492, "epoch": 2249} {"train_loss": -6.225085735321045, "global_step": 94493, "epoch": 2249} {"train_loss": -6.206316947937012, "global_step": 94494, "epoch": 2249} {"train_loss": -6.398204803466797, "global_step": 94495, "epoch": 2249} {"train_loss": -6.239779949188232, "global_step": 94496, "epoch": 2249} {"train_loss": -6.317452430725098, "global_step": 94497, "epoch": 2249} {"train_loss": -6.301714897155762, "global_step": 94498, "epoch": 2249} {"train_loss": -6.314204988025484, "global_step": 94499, "epoch": 2249, "val_loss": 75390.640625} {"train_loss": -6.310542583465576, "global_step": 94500, "epoch": 2250} {"train_loss": -6.307113170623779, "global_step": 94501, "epoch": 2250} {"train_loss": -6.252913475036621, "global_step": 94502, "epoch": 2250} {"train_loss": -6.371143817901611, "global_step": 94503, "epoch": 2250} {"train_loss": -6.413299083709717, "global_step": 94504, "epoch": 2250} {"train_loss": -6.269725799560547, "global_step": 94505, "epoch": 2250} {"train_loss": -6.355474472045898, "global_step": 94506, "epoch": 2250} {"train_loss": -6.287649154663086, "global_step": 94507, "epoch": 2250} {"train_loss": -6.224490165710449, "global_step": 94508, "epoch": 2250} {"train_loss": -6.189344882965088, "global_step": 94509, "epoch": 2250} {"train_loss": -6.322341442108154, "global_step": 94510, "epoch": 2250} {"train_loss": -6.32536506652832, "global_step": 94511, "epoch": 2250} {"train_loss": -6.284857749938965, "global_step": 94512, "epoch": 2250} {"train_loss": -6.289610862731934, "global_step": 94513, "epoch": 2250} {"train_loss": -6.341793060302734, "global_step": 94514, "epoch": 2250} {"train_loss": -6.254094123840332, "global_step": 94515, "epoch": 2250} {"train_loss": -6.292877197265625, "global_step": 94516, "epoch": 2250} {"train_loss": -6.174301624298096, "global_step": 94517, "epoch": 2250} {"train_loss": -6.254538059234619, "global_step": 94518, "epoch": 2250} {"train_loss": -6.336505889892578, "global_step": 94519, "epoch": 2250} {"train_loss": -6.183704376220703, "global_step": 94520, "epoch": 2250} {"train_loss": -6.338377952575684, "global_step": 94521, "epoch": 2250} {"train_loss": -6.353233337402344, "global_step": 94522, "epoch": 2250} {"train_loss": -6.214117050170898, "global_step": 94523, "epoch": 2250} {"train_loss": -6.347031593322754, "global_step": 94524, "epoch": 2250} {"train_loss": -6.380556106567383, "global_step": 94525, "epoch": 2250} {"train_loss": -6.259577751159668, "global_step": 94526, "epoch": 2250} {"train_loss": -6.333366870880127, "global_step": 94527, "epoch": 2250} {"train_loss": -6.352770805358887, "global_step": 94528, "epoch": 2250} {"train_loss": -6.2767653465271, "global_step": 94529, "epoch": 2250} {"train_loss": -6.38446044921875, "global_step": 94530, "epoch": 2250} {"train_loss": -6.3169121742248535, "global_step": 94531, "epoch": 2250} {"train_loss": -6.439756393432617, "global_step": 94532, "epoch": 2250} {"train_loss": -6.316924095153809, "global_step": 94533, "epoch": 2250} {"train_loss": -6.206430435180664, "global_step": 94534, "epoch": 2250} {"train_loss": -6.241330146789551, "global_step": 94535, "epoch": 2250} {"train_loss": -6.303356647491455, "global_step": 94536, "epoch": 2250} {"train_loss": -6.3251190185546875, "global_step": 94537, "epoch": 2250} {"train_loss": -6.262618064880371, "global_step": 94538, "epoch": 2250} {"train_loss": -6.309269428253174, "global_step": 94539, "epoch": 2250} {"train_loss": -6.2393646240234375, "global_step": 94540, "epoch": 2250} {"train_loss": -6.297072535469418, "global_step": 94541, "epoch": 2250, "train/sim_max_reward_0": 0.3962173295366464, "train/sim_max_reward_1": 0.6702661144591038, "train/sim_max_reward_2": 0.4914833962282126, "train/sim_max_reward_3": 0.1389962229586898, "train/sim_max_reward_4": 0.9835450367579419, "train/sim_max_reward_5": 1.0, "test/sim_max_reward_4500000": 0.48032342350453705, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.4633800689322785, "test/sim_max_reward_4500005": 0.9457972416470011, "test/sim_max_reward_4500006": 0.9508101952094697, "test/sim_max_reward_4500007": 0.9027935632819295, "test/sim_max_reward_4500008": 0.1778536544110381, "test/sim_max_reward_4500009": 0.9363861761752365, "test/sim_max_reward_4500010": 0.9389008005939723, "test/sim_max_reward_4500011": 0.39041409427516055, "test/sim_max_reward_4500012": 0.8884604463717987, "test/sim_max_reward_4500013": 0.0, "test/sim_max_reward_4500014": 0.37818455266573775, "test/sim_max_reward_4500015": 0.9094769538691201, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.2521745589399837, "test/sim_max_reward_4500018": 0.16073176218105734, "test/sim_max_reward_4500019": 0.7763729755808241, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.6250636022803994, "test/sim_max_reward_4500022": 0.9034132238189478, "test/sim_max_reward_4500023": 0.5279045202000835, "test/sim_max_reward_4500024": 0.7684389325177111, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.8998155690899496, "test/sim_max_reward_4500027": 0.42711062701129016, "test/sim_max_reward_4500028": 0.2005416771303583, "test/sim_max_reward_4500029": 0.22164174582774568, "test/sim_max_reward_4500030": 0.8215631155807086, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05374881488993434, "test/sim_max_reward_4500033": 0.953308515870041, "test/sim_max_reward_4500034": 1.0, "test/sim_max_reward_4500035": 0.8263577732564601, "test/sim_max_reward_4500036": 0.36063732975281737, "test/sim_max_reward_4500037": 0.826683548261979, "test/sim_max_reward_4500038": 0.3410758709134456, "test/sim_max_reward_4500039": 0.897263282416362, "test/sim_max_reward_4500040": 0.9016095802784757, "test/sim_max_reward_4500041": 0.9428832098506106, "test/sim_max_reward_4500042": 0.3115510671366396, "test/sim_max_reward_4500043": 0.5423736240388268, "test/sim_max_reward_4500044": 0.036642901876102314, "test/sim_max_reward_4500045": 0.15206356688731204, "test/sim_max_reward_4500046": 0.7295959101743623, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.02447067561458527, "train/mean_score": 0.6134180166567658, "test/mean_score": 0.5373072662075775, "val_loss": 75747.3515625} {"train_loss": -6.279278755187988, "global_step": 94542, "epoch": 2251} {"train_loss": -6.214319229125977, "global_step": 94543, "epoch": 2251} {"train_loss": -6.3009443283081055, "global_step": 94544, "epoch": 2251} {"train_loss": -6.278916835784912, "global_step": 94545, "epoch": 2251} {"train_loss": -6.269447326660156, "global_step": 94546, "epoch": 2251} {"train_loss": -6.327020645141602, "global_step": 94547, "epoch": 2251} {"train_loss": -6.288681983947754, "global_step": 94548, "epoch": 2251} {"train_loss": -6.1512298583984375, "global_step": 94549, "epoch": 2251} {"train_loss": -6.296586036682129, "global_step": 94550, "epoch": 2251} {"train_loss": -6.194953918457031, "global_step": 94551, "epoch": 2251} {"train_loss": -6.380709171295166, "global_step": 94552, "epoch": 2251} {"train_loss": -6.368525505065918, "global_step": 94553, "epoch": 2251} {"train_loss": -6.1879963874816895, "global_step": 94554, "epoch": 2251} {"train_loss": -6.310368537902832, "global_step": 94555, "epoch": 2251} {"train_loss": -6.247651100158691, "global_step": 94556, "epoch": 2251} {"train_loss": -6.292804718017578, "global_step": 94557, "epoch": 2251} {"train_loss": -6.327025890350342, "global_step": 94558, "epoch": 2251} {"train_loss": -6.249009132385254, "global_step": 94559, "epoch": 2251} {"train_loss": -6.323838710784912, "global_step": 94560, "epoch": 2251} {"train_loss": -6.237092018127441, "global_step": 94561, "epoch": 2251} {"train_loss": -6.246652126312256, "global_step": 94562, "epoch": 2251} {"train_loss": -6.235464572906494, "global_step": 94563, "epoch": 2251} {"train_loss": -6.29916524887085, "global_step": 94564, "epoch": 2251} {"train_loss": -6.142773151397705, "global_step": 94565, "epoch": 2251} {"train_loss": -6.196233749389648, "global_step": 94566, "epoch": 2251} {"train_loss": -6.258430480957031, "global_step": 94567, "epoch": 2251} {"train_loss": -6.117249011993408, "global_step": 94568, "epoch": 2251} {"train_loss": -6.262491703033447, "global_step": 94569, "epoch": 2251} {"train_loss": -6.218470096588135, "global_step": 94570, "epoch": 2251} {"train_loss": -6.18079948425293, "global_step": 94571, "epoch": 2251} {"train_loss": -6.242424011230469, "global_step": 94572, "epoch": 2251} {"train_loss": -6.223396301269531, "global_step": 94573, "epoch": 2251} {"train_loss": -6.259991645812988, "global_step": 94574, "epoch": 2251} {"train_loss": -6.19346284866333, "global_step": 94575, "epoch": 2251} {"train_loss": -6.14066743850708, "global_step": 94576, "epoch": 2251} {"train_loss": -6.1987810134887695, "global_step": 94577, "epoch": 2251} {"train_loss": -6.121413230895996, "global_step": 94578, "epoch": 2251} {"train_loss": -6.2575178146362305, "global_step": 94579, "epoch": 2251} {"train_loss": -6.370944976806641, "global_step": 94580, "epoch": 2251} {"train_loss": -6.274443626403809, "global_step": 94581, "epoch": 2251} {"train_loss": -6.2409515380859375, "global_step": 94582, "epoch": 2251} {"train_loss": -6.249073255629766, "global_step": 94583, "epoch": 2251, "val_loss": 75357.140625} {"train_loss": -6.314984321594238, "global_step": 94584, "epoch": 2252} {"train_loss": -6.229776859283447, "global_step": 94585, "epoch": 2252} {"train_loss": -6.352922439575195, "global_step": 94586, "epoch": 2252} {"train_loss": -6.385312557220459, "global_step": 94587, "epoch": 2252} {"train_loss": -6.362330913543701, "global_step": 94588, "epoch": 2252} {"train_loss": -6.1289167404174805, "global_step": 94589, "epoch": 2252} {"train_loss": -6.512754917144775, "global_step": 94590, "epoch": 2252} {"train_loss": -6.217423439025879, "global_step": 94591, "epoch": 2252} {"train_loss": -6.280010223388672, "global_step": 94592, "epoch": 2252} {"train_loss": -6.304839611053467, "global_step": 94593, "epoch": 2252} {"train_loss": -6.201487064361572, "global_step": 94594, "epoch": 2252} {"train_loss": -6.344213962554932, "global_step": 94595, "epoch": 2252} {"train_loss": -6.189393043518066, "global_step": 94596, "epoch": 2252} {"train_loss": -6.3274760246276855, "global_step": 94597, "epoch": 2252} {"train_loss": -6.267555236816406, "global_step": 94598, "epoch": 2252} {"train_loss": -6.279669761657715, "global_step": 94599, "epoch": 2252} {"train_loss": -6.24220085144043, "global_step": 94600, "epoch": 2252} {"train_loss": -6.128192901611328, "global_step": 94601, "epoch": 2252} {"train_loss": -6.34299898147583, "global_step": 94602, "epoch": 2252} {"train_loss": -6.191889762878418, "global_step": 94603, "epoch": 2252} {"train_loss": -6.296282768249512, "global_step": 94604, "epoch": 2252} {"train_loss": -6.258482456207275, "global_step": 94605, "epoch": 2252} {"train_loss": -6.326216697692871, "global_step": 94606, "epoch": 2252} {"train_loss": -6.262709140777588, "global_step": 94607, "epoch": 2252} {"train_loss": -6.380558967590332, "global_step": 94608, "epoch": 2252} {"train_loss": -6.311057090759277, "global_step": 94609, "epoch": 2252} {"train_loss": -6.44423246383667, "global_step": 94610, "epoch": 2252} {"train_loss": -6.238694667816162, "global_step": 94611, "epoch": 2252} {"train_loss": -6.233187675476074, "global_step": 94612, "epoch": 2252} {"train_loss": -6.3144636154174805, "global_step": 94613, "epoch": 2252} {"train_loss": -6.233604431152344, "global_step": 94614, "epoch": 2252} {"train_loss": -6.320874214172363, "global_step": 94615, "epoch": 2252} {"train_loss": -6.241884231567383, "global_step": 94616, "epoch": 2252} {"train_loss": -6.235379219055176, "global_step": 94617, "epoch": 2252} {"train_loss": -6.312226295471191, "global_step": 94618, "epoch": 2252} {"train_loss": -6.303131580352783, "global_step": 94619, "epoch": 2252} {"train_loss": -6.2889814376831055, "global_step": 94620, "epoch": 2252} {"train_loss": -6.473948955535889, "global_step": 94621, "epoch": 2252} {"train_loss": -6.332308769226074, "global_step": 94622, "epoch": 2252} {"train_loss": -6.278049945831299, "global_step": 94623, "epoch": 2252} {"train_loss": -6.231764793395996, "global_step": 94624, "epoch": 2252} {"train_loss": -6.289980536415463, "global_step": 94625, "epoch": 2252, "val_loss": 75237.296875} {"train_loss": -6.407341480255127, "global_step": 94626, "epoch": 2253} {"train_loss": -6.369500160217285, "global_step": 94627, "epoch": 2253} {"train_loss": -6.3611860275268555, "global_step": 94628, "epoch": 2253} {"train_loss": -6.377505779266357, "global_step": 94629, "epoch": 2253} {"train_loss": -6.238381385803223, "global_step": 94630, "epoch": 2253} {"train_loss": -6.3482561111450195, "global_step": 94631, "epoch": 2253} {"train_loss": -6.287485122680664, "global_step": 94632, "epoch": 2253} {"train_loss": -6.286647319793701, "global_step": 94633, "epoch": 2253} {"train_loss": -6.297842979431152, "global_step": 94634, "epoch": 2253} {"train_loss": -6.295427322387695, "global_step": 94635, "epoch": 2253} {"train_loss": -6.230353355407715, "global_step": 94636, "epoch": 2253} {"train_loss": -6.242986679077148, "global_step": 94637, "epoch": 2253} {"train_loss": -6.273482322692871, "global_step": 94638, "epoch": 2253} {"train_loss": -6.271113395690918, "global_step": 94639, "epoch": 2253} {"train_loss": -6.383213043212891, "global_step": 94640, "epoch": 2253} {"train_loss": -6.348447799682617, "global_step": 94641, "epoch": 2253} {"train_loss": -6.3307905197143555, "global_step": 94642, "epoch": 2253} {"train_loss": -6.305137634277344, "global_step": 94643, "epoch": 2253} {"train_loss": -6.384191989898682, "global_step": 94644, "epoch": 2253} {"train_loss": -6.330239295959473, "global_step": 94645, "epoch": 2253} {"train_loss": -6.298246383666992, "global_step": 94646, "epoch": 2253} {"train_loss": -6.230523586273193, "global_step": 94647, "epoch": 2253} {"train_loss": -6.449069499969482, "global_step": 94648, "epoch": 2253} {"train_loss": -6.315056800842285, "global_step": 94649, "epoch": 2253} {"train_loss": -6.301383018493652, "global_step": 94650, "epoch": 2253} {"train_loss": -6.297934532165527, "global_step": 94651, "epoch": 2253} {"train_loss": -6.169441223144531, "global_step": 94652, "epoch": 2253} {"train_loss": -6.327994346618652, "global_step": 94653, "epoch": 2253} {"train_loss": -6.32033109664917, "global_step": 94654, "epoch": 2253} {"train_loss": -6.240103244781494, "global_step": 94655, "epoch": 2253} {"train_loss": -6.28389835357666, "global_step": 94656, "epoch": 2253} {"train_loss": -6.233898162841797, "global_step": 94657, "epoch": 2253} {"train_loss": -6.3127336502075195, "global_step": 94658, "epoch": 2253} {"train_loss": -6.158568382263184, "global_step": 94659, "epoch": 2253} {"train_loss": -6.161273002624512, "global_step": 94660, "epoch": 2253} {"train_loss": -6.293534755706787, "global_step": 94661, "epoch": 2253} {"train_loss": -6.23015022277832, "global_step": 94662, "epoch": 2253} {"train_loss": -6.168643474578857, "global_step": 94663, "epoch": 2253} {"train_loss": -6.274068832397461, "global_step": 94664, "epoch": 2253} {"train_loss": -6.31697940826416, "global_step": 94665, "epoch": 2253} {"train_loss": -6.174359321594238, "global_step": 94666, "epoch": 2253} {"train_loss": -6.28816430909293, "global_step": 94667, "epoch": 2253, "val_loss": 75953.2265625} {"train_loss": -6.366059303283691, "global_step": 94668, "epoch": 2254} {"train_loss": -6.08226203918457, "global_step": 94669, "epoch": 2254} {"train_loss": -6.282657623291016, "global_step": 94670, "epoch": 2254} {"train_loss": -6.372792720794678, "global_step": 94671, "epoch": 2254} {"train_loss": -6.169346809387207, "global_step": 94672, "epoch": 2254} {"train_loss": -6.240813255310059, "global_step": 94673, "epoch": 2254} {"train_loss": -6.352870941162109, "global_step": 94674, "epoch": 2254} {"train_loss": -6.250336170196533, "global_step": 94675, "epoch": 2254} {"train_loss": -6.243354797363281, "global_step": 94676, "epoch": 2254} {"train_loss": -6.273284435272217, "global_step": 94677, "epoch": 2254} {"train_loss": -6.221330642700195, "global_step": 94678, "epoch": 2254} {"train_loss": -6.217235565185547, "global_step": 94679, "epoch": 2254} {"train_loss": -6.2695207595825195, "global_step": 94680, "epoch": 2254} {"train_loss": -6.296239852905273, "global_step": 94681, "epoch": 2254} {"train_loss": -6.295449256896973, "global_step": 94682, "epoch": 2254} {"train_loss": -6.303708553314209, "global_step": 94683, "epoch": 2254} {"train_loss": -6.274327754974365, "global_step": 94684, "epoch": 2254} {"train_loss": -6.282964706420898, "global_step": 94685, "epoch": 2254} {"train_loss": -6.258285045623779, "global_step": 94686, "epoch": 2254} {"train_loss": -6.227797985076904, "global_step": 94687, "epoch": 2254} {"train_loss": -6.265364646911621, "global_step": 94688, "epoch": 2254} {"train_loss": -6.321186065673828, "global_step": 94689, "epoch": 2254} {"train_loss": -6.38718843460083, "global_step": 94690, "epoch": 2254} {"train_loss": -6.313162803649902, "global_step": 94691, "epoch": 2254} {"train_loss": -6.230719566345215, "global_step": 94692, "epoch": 2254} {"train_loss": -6.206076622009277, "global_step": 94693, "epoch": 2254} {"train_loss": -6.283374786376953, "global_step": 94694, "epoch": 2254} {"train_loss": -6.303073883056641, "global_step": 94695, "epoch": 2254} {"train_loss": -6.274530410766602, "global_step": 94696, "epoch": 2254} {"train_loss": -6.340263843536377, "global_step": 94697, "epoch": 2254} {"train_loss": -6.362208366394043, "global_step": 94698, "epoch": 2254} {"train_loss": -6.253298759460449, "global_step": 94699, "epoch": 2254} {"train_loss": -6.319916725158691, "global_step": 94700, "epoch": 2254} {"train_loss": -6.3281025886535645, "global_step": 94701, "epoch": 2254} {"train_loss": -6.374074935913086, "global_step": 94702, "epoch": 2254} {"train_loss": -6.330721855163574, "global_step": 94703, "epoch": 2254} {"train_loss": -6.3346052169799805, "global_step": 94704, "epoch": 2254} {"train_loss": -6.310111999511719, "global_step": 94705, "epoch": 2254} {"train_loss": -6.319577693939209, "global_step": 94706, "epoch": 2254} {"train_loss": -6.339324951171875, "global_step": 94707, "epoch": 2254} {"train_loss": -6.236042022705078, "global_step": 94708, "epoch": 2254} {"train_loss": -6.28246419770377, "global_step": 94709, "epoch": 2254, "val_loss": 75435.203125} {"train_loss": -6.3208441734313965, "global_step": 94710, "epoch": 2255} {"train_loss": -6.222043991088867, "global_step": 94711, "epoch": 2255} {"train_loss": -6.2260870933532715, "global_step": 94712, "epoch": 2255} {"train_loss": -6.256653308868408, "global_step": 94713, "epoch": 2255} {"train_loss": -6.193297386169434, "global_step": 94714, "epoch": 2255} {"train_loss": -6.330080032348633, "global_step": 94715, "epoch": 2255} {"train_loss": -6.285734176635742, "global_step": 94716, "epoch": 2255} {"train_loss": -6.403873443603516, "global_step": 94717, "epoch": 2255} {"train_loss": -6.2673444747924805, "global_step": 94718, "epoch": 2255} {"train_loss": -6.170670986175537, "global_step": 94719, "epoch": 2255} {"train_loss": -6.302574157714844, "global_step": 94720, "epoch": 2255} {"train_loss": -6.409758567810059, "global_step": 94721, "epoch": 2255} {"train_loss": -6.331904411315918, "global_step": 94722, "epoch": 2255} {"train_loss": -6.311115264892578, "global_step": 94723, "epoch": 2255} {"train_loss": -6.270209789276123, "global_step": 94724, "epoch": 2255} {"train_loss": -6.3430399894714355, "global_step": 94725, "epoch": 2255} {"train_loss": -6.17681884765625, "global_step": 94726, "epoch": 2255} {"train_loss": -6.23326301574707, "global_step": 94727, "epoch": 2255} {"train_loss": -6.295955657958984, "global_step": 94728, "epoch": 2255} {"train_loss": -6.235896587371826, "global_step": 94729, "epoch": 2255} {"train_loss": -6.278408527374268, "global_step": 94730, "epoch": 2255} {"train_loss": -6.33322811126709, "global_step": 94731, "epoch": 2255} {"train_loss": -6.311656951904297, "global_step": 94732, "epoch": 2255} {"train_loss": -6.235202789306641, "global_step": 94733, "epoch": 2255} {"train_loss": -6.331942558288574, "global_step": 94734, "epoch": 2255} {"train_loss": -6.39103889465332, "global_step": 94735, "epoch": 2255} {"train_loss": -6.232301235198975, "global_step": 94736, "epoch": 2255} {"train_loss": -6.21461296081543, "global_step": 94737, "epoch": 2255} {"train_loss": -6.466330528259277, "global_step": 94738, "epoch": 2255} {"train_loss": -6.305591583251953, "global_step": 94739, "epoch": 2255} {"train_loss": -6.277410507202148, "global_step": 94740, "epoch": 2255} {"train_loss": -6.293023109436035, "global_step": 94741, "epoch": 2255} {"train_loss": -6.249293327331543, "global_step": 94742, "epoch": 2255} {"train_loss": -6.368461608886719, "global_step": 94743, "epoch": 2255} {"train_loss": -6.313874244689941, "global_step": 94744, "epoch": 2255} {"train_loss": -6.258936405181885, "global_step": 94745, "epoch": 2255} {"train_loss": -6.356891632080078, "global_step": 94746, "epoch": 2255} {"train_loss": -6.21470308303833, "global_step": 94747, "epoch": 2255} {"train_loss": -6.226379871368408, "global_step": 94748, "epoch": 2255} {"train_loss": -6.325451374053955, "global_step": 94749, "epoch": 2255} {"train_loss": -6.279914379119873, "global_step": 94750, "epoch": 2255} {"train_loss": -6.289048035939534, "global_step": 94751, "epoch": 2255, "val_loss": 75517.0625} {"train_loss": -6.224396705627441, "global_step": 94752, "epoch": 2256} {"train_loss": -6.282317161560059, "global_step": 94753, "epoch": 2256} {"train_loss": -6.294524669647217, "global_step": 94754, "epoch": 2256} {"train_loss": -6.291021823883057, "global_step": 94755, "epoch": 2256} {"train_loss": -6.357358932495117, "global_step": 94756, "epoch": 2256} {"train_loss": -6.222932815551758, "global_step": 94757, "epoch": 2256} {"train_loss": -6.370595932006836, "global_step": 94758, "epoch": 2256} {"train_loss": -6.234785079956055, "global_step": 94759, "epoch": 2256} {"train_loss": -6.229741096496582, "global_step": 94760, "epoch": 2256} {"train_loss": -6.337441921234131, "global_step": 94761, "epoch": 2256} {"train_loss": -6.376675128936768, "global_step": 94762, "epoch": 2256} {"train_loss": -6.324985504150391, "global_step": 94763, "epoch": 2256} {"train_loss": -6.395155429840088, "global_step": 94764, "epoch": 2256} {"train_loss": -6.321881294250488, "global_step": 94765, "epoch": 2256} {"train_loss": -6.3659539222717285, "global_step": 94766, "epoch": 2256} {"train_loss": -6.337179183959961, "global_step": 94767, "epoch": 2256} {"train_loss": -6.392521858215332, "global_step": 94768, "epoch": 2256} {"train_loss": -6.312300682067871, "global_step": 94769, "epoch": 2256} {"train_loss": -6.365073204040527, "global_step": 94770, "epoch": 2256} {"train_loss": -6.300954341888428, "global_step": 94771, "epoch": 2256} {"train_loss": -6.24687385559082, "global_step": 94772, "epoch": 2256} {"train_loss": -6.286288738250732, "global_step": 94773, "epoch": 2256} {"train_loss": -6.385532855987549, "global_step": 94774, "epoch": 2256} {"train_loss": -6.384244918823242, "global_step": 94775, "epoch": 2256} {"train_loss": -6.3690643310546875, "global_step": 94776, "epoch": 2256} {"train_loss": -6.3215765953063965, "global_step": 94777, "epoch": 2256} {"train_loss": -6.336540222167969, "global_step": 94778, "epoch": 2256} {"train_loss": -6.312186241149902, "global_step": 94779, "epoch": 2256} {"train_loss": -6.31728458404541, "global_step": 94780, "epoch": 2256} {"train_loss": -6.210832595825195, "global_step": 94781, "epoch": 2256} {"train_loss": -6.234166145324707, "global_step": 94782, "epoch": 2256} {"train_loss": -6.296084403991699, "global_step": 94783, "epoch": 2256} {"train_loss": -6.3482513427734375, "global_step": 94784, "epoch": 2256} {"train_loss": -6.325646877288818, "global_step": 94785, "epoch": 2256} {"train_loss": -6.463027000427246, "global_step": 94786, "epoch": 2256} {"train_loss": -6.3417253494262695, "global_step": 94787, "epoch": 2256} {"train_loss": -6.395544528961182, "global_step": 94788, "epoch": 2256} {"train_loss": -6.317282676696777, "global_step": 94789, "epoch": 2256} {"train_loss": -6.373244285583496, "global_step": 94790, "epoch": 2256} {"train_loss": -6.121219158172607, "global_step": 94791, "epoch": 2256} {"train_loss": -6.187557220458984, "global_step": 94792, "epoch": 2256} {"train_loss": -6.312788940611339, "global_step": 94793, "epoch": 2256, "val_loss": 75540.109375} {"train_loss": -6.297274589538574, "global_step": 94794, "epoch": 2257} {"train_loss": -6.25150728225708, "global_step": 94795, "epoch": 2257} {"train_loss": -6.312517166137695, "global_step": 94796, "epoch": 2257} {"train_loss": -6.200142860412598, "global_step": 94797, "epoch": 2257} {"train_loss": -6.3049235343933105, "global_step": 94798, "epoch": 2257} {"train_loss": -6.22695255279541, "global_step": 94799, "epoch": 2257} {"train_loss": -6.258270263671875, "global_step": 94800, "epoch": 2257} {"train_loss": -6.310531139373779, "global_step": 94801, "epoch": 2257} {"train_loss": -6.274332046508789, "global_step": 94802, "epoch": 2257} {"train_loss": -6.359973907470703, "global_step": 94803, "epoch": 2257} {"train_loss": -6.308219909667969, "global_step": 94804, "epoch": 2257} {"train_loss": -6.266961097717285, "global_step": 94805, "epoch": 2257} {"train_loss": -6.298931121826172, "global_step": 94806, "epoch": 2257} {"train_loss": -6.157015323638916, "global_step": 94807, "epoch": 2257} {"train_loss": -6.302032470703125, "global_step": 94808, "epoch": 2257} {"train_loss": -6.249640464782715, "global_step": 94809, "epoch": 2257} {"train_loss": -6.236924171447754, "global_step": 94810, "epoch": 2257} {"train_loss": -6.337855339050293, "global_step": 94811, "epoch": 2257} {"train_loss": -6.226925849914551, "global_step": 94812, "epoch": 2257} {"train_loss": -6.223697662353516, "global_step": 94813, "epoch": 2257} {"train_loss": -6.223371982574463, "global_step": 94814, "epoch": 2257} {"train_loss": -6.249538421630859, "global_step": 94815, "epoch": 2257} {"train_loss": -6.349491119384766, "global_step": 94816, "epoch": 2257} {"train_loss": -6.227983474731445, "global_step": 94817, "epoch": 2257} {"train_loss": -6.238907337188721, "global_step": 94818, "epoch": 2257} {"train_loss": -6.300234317779541, "global_step": 94819, "epoch": 2257} {"train_loss": -6.215234279632568, "global_step": 94820, "epoch": 2257} {"train_loss": -6.434149265289307, "global_step": 94821, "epoch": 2257} {"train_loss": -6.232569694519043, "global_step": 94822, "epoch": 2257} {"train_loss": -6.302115440368652, "global_step": 94823, "epoch": 2257} {"train_loss": -6.409217834472656, "global_step": 94824, "epoch": 2257} {"train_loss": -6.203830242156982, "global_step": 94825, "epoch": 2257} {"train_loss": -6.2812395095825195, "global_step": 94826, "epoch": 2257} {"train_loss": -6.280174732208252, "global_step": 94827, "epoch": 2257} {"train_loss": -6.336523056030273, "global_step": 94828, "epoch": 2257} {"train_loss": -6.383663177490234, "global_step": 94829, "epoch": 2257} {"train_loss": -6.3344926834106445, "global_step": 94830, "epoch": 2257} {"train_loss": -6.3192901611328125, "global_step": 94831, "epoch": 2257} {"train_loss": -6.261946201324463, "global_step": 94832, "epoch": 2257} {"train_loss": -6.365488529205322, "global_step": 94833, "epoch": 2257} {"train_loss": -6.322233200073242, "global_step": 94834, "epoch": 2257} {"train_loss": -6.284235443387713, "global_step": 94835, "epoch": 2257, "val_loss": 75307.0078125} {"train_loss": -6.321471691131592, "global_step": 94836, "epoch": 2258} {"train_loss": -6.19550085067749, "global_step": 94837, "epoch": 2258} {"train_loss": -6.331109046936035, "global_step": 94838, "epoch": 2258} {"train_loss": -6.356800079345703, "global_step": 94839, "epoch": 2258} {"train_loss": -6.314542770385742, "global_step": 94840, "epoch": 2258} {"train_loss": -6.436598777770996, "global_step": 94841, "epoch": 2258} {"train_loss": -6.27459716796875, "global_step": 94842, "epoch": 2258} {"train_loss": -6.291589736938477, "global_step": 94843, "epoch": 2258} {"train_loss": -6.389308452606201, "global_step": 94844, "epoch": 2258} {"train_loss": -6.275832653045654, "global_step": 94845, "epoch": 2258} {"train_loss": -6.332091331481934, "global_step": 94846, "epoch": 2258} {"train_loss": -6.292632579803467, "global_step": 94847, "epoch": 2258} {"train_loss": -6.219668388366699, "global_step": 94848, "epoch": 2258} {"train_loss": -6.190032005310059, "global_step": 94849, "epoch": 2258} {"train_loss": -6.232656002044678, "global_step": 94850, "epoch": 2258} {"train_loss": -6.354631423950195, "global_step": 94851, "epoch": 2258} {"train_loss": -6.35079288482666, "global_step": 94852, "epoch": 2258} {"train_loss": -6.330601692199707, "global_step": 94853, "epoch": 2258} {"train_loss": -6.367976665496826, "global_step": 94854, "epoch": 2258} {"train_loss": -6.15333366394043, "global_step": 94855, "epoch": 2258} {"train_loss": -6.371101379394531, "global_step": 94856, "epoch": 2258} {"train_loss": -6.3382248878479, "global_step": 94857, "epoch": 2258} {"train_loss": -6.308977127075195, "global_step": 94858, "epoch": 2258} {"train_loss": -6.205825328826904, "global_step": 94859, "epoch": 2258} {"train_loss": -6.29149055480957, "global_step": 94860, "epoch": 2258} {"train_loss": -6.259174346923828, "global_step": 94861, "epoch": 2258} {"train_loss": -6.251567363739014, "global_step": 94862, "epoch": 2258} {"train_loss": -6.475479602813721, "global_step": 94863, "epoch": 2258} {"train_loss": -6.2908477783203125, "global_step": 94864, "epoch": 2258} {"train_loss": -6.297926425933838, "global_step": 94865, "epoch": 2258} {"train_loss": -6.3257880210876465, "global_step": 94866, "epoch": 2258} {"train_loss": -6.365002632141113, "global_step": 94867, "epoch": 2258} {"train_loss": -6.391087055206299, "global_step": 94868, "epoch": 2258} {"train_loss": -6.391842842102051, "global_step": 94869, "epoch": 2258} {"train_loss": -6.368321418762207, "global_step": 94870, "epoch": 2258} {"train_loss": -6.313761234283447, "global_step": 94871, "epoch": 2258} {"train_loss": -6.247276782989502, "global_step": 94872, "epoch": 2258} {"train_loss": -6.176293849945068, "global_step": 94873, "epoch": 2258} {"train_loss": -6.195316791534424, "global_step": 94874, "epoch": 2258} {"train_loss": -6.2208476066589355, "global_step": 94875, "epoch": 2258} {"train_loss": -6.208183288574219, "global_step": 94876, "epoch": 2258} {"train_loss": -6.296262139365787, "global_step": 94877, "epoch": 2258, "val_loss": 75638.484375} {"train_loss": -6.282761573791504, "global_step": 94878, "epoch": 2259} {"train_loss": -6.198076248168945, "global_step": 94879, "epoch": 2259} {"train_loss": -6.287924289703369, "global_step": 94880, "epoch": 2259} {"train_loss": -6.372735023498535, "global_step": 94881, "epoch": 2259} {"train_loss": -6.289113998413086, "global_step": 94882, "epoch": 2259} {"train_loss": -6.305757999420166, "global_step": 94883, "epoch": 2259} {"train_loss": -6.346447944641113, "global_step": 94884, "epoch": 2259} {"train_loss": -6.3361496925354, "global_step": 94885, "epoch": 2259} {"train_loss": -6.196649551391602, "global_step": 94886, "epoch": 2259} {"train_loss": -6.437037467956543, "global_step": 94887, "epoch": 2259} {"train_loss": -6.31670618057251, "global_step": 94888, "epoch": 2259} {"train_loss": -6.3011298179626465, "global_step": 94889, "epoch": 2259} {"train_loss": -6.320539474487305, "global_step": 94890, "epoch": 2259} {"train_loss": -6.435976982116699, "global_step": 94891, "epoch": 2259} {"train_loss": -6.322607040405273, "global_step": 94892, "epoch": 2259} {"train_loss": -6.244007110595703, "global_step": 94893, "epoch": 2259} {"train_loss": -6.315299034118652, "global_step": 94894, "epoch": 2259} {"train_loss": -6.2630720138549805, "global_step": 94895, "epoch": 2259} {"train_loss": -6.272926330566406, "global_step": 94896, "epoch": 2259} {"train_loss": -6.269781112670898, "global_step": 94897, "epoch": 2259} {"train_loss": -6.215817451477051, "global_step": 94898, "epoch": 2259} {"train_loss": -6.259866714477539, "global_step": 94899, "epoch": 2259} {"train_loss": -6.293061256408691, "global_step": 94900, "epoch": 2259} {"train_loss": -6.211963653564453, "global_step": 94901, "epoch": 2259} {"train_loss": -6.15118408203125, "global_step": 94902, "epoch": 2259} {"train_loss": -6.164239406585693, "global_step": 94903, "epoch": 2259} {"train_loss": -6.276559352874756, "global_step": 94904, "epoch": 2259} {"train_loss": -6.251764297485352, "global_step": 94905, "epoch": 2259} {"train_loss": -6.188904762268066, "global_step": 94906, "epoch": 2259} {"train_loss": -6.200531959533691, "global_step": 94907, "epoch": 2259} {"train_loss": -6.269783020019531, "global_step": 94908, "epoch": 2259} {"train_loss": -6.412371635437012, "global_step": 94909, "epoch": 2259} {"train_loss": -6.254486560821533, "global_step": 94910, "epoch": 2259} {"train_loss": -6.231768608093262, "global_step": 94911, "epoch": 2259} {"train_loss": -6.188362121582031, "global_step": 94912, "epoch": 2259} {"train_loss": -6.1418070793151855, "global_step": 94913, "epoch": 2259} {"train_loss": -6.309019088745117, "global_step": 94914, "epoch": 2259} {"train_loss": -6.2802534103393555, "global_step": 94915, "epoch": 2259} {"train_loss": -6.263047218322754, "global_step": 94916, "epoch": 2259} {"train_loss": -6.3052754402160645, "global_step": 94917, "epoch": 2259} {"train_loss": -6.266424179077148, "global_step": 94918, "epoch": 2259} {"train_loss": -6.27740098181225, "global_step": 94919, "epoch": 2259, "val_loss": 75584.6640625} {"train_loss": -6.245645046234131, "global_step": 94920, "epoch": 2260} {"train_loss": -6.439578056335449, "global_step": 94921, "epoch": 2260} {"train_loss": -6.223433494567871, "global_step": 94922, "epoch": 2260} {"train_loss": -6.232296943664551, "global_step": 94923, "epoch": 2260} {"train_loss": -6.362628936767578, "global_step": 94924, "epoch": 2260} {"train_loss": -6.196267127990723, "global_step": 94925, "epoch": 2260} {"train_loss": -6.347039222717285, "global_step": 94926, "epoch": 2260} {"train_loss": -6.28842830657959, "global_step": 94927, "epoch": 2260} {"train_loss": -6.19462776184082, "global_step": 94928, "epoch": 2260} {"train_loss": -6.386649131774902, "global_step": 94929, "epoch": 2260} {"train_loss": -6.214476585388184, "global_step": 94930, "epoch": 2260} {"train_loss": -6.299961090087891, "global_step": 94931, "epoch": 2260} {"train_loss": -6.3105268478393555, "global_step": 94932, "epoch": 2260} {"train_loss": -6.240090370178223, "global_step": 94933, "epoch": 2260} {"train_loss": -6.397721290588379, "global_step": 94934, "epoch": 2260} {"train_loss": -6.330649375915527, "global_step": 94935, "epoch": 2260} {"train_loss": -6.177577972412109, "global_step": 94936, "epoch": 2260} {"train_loss": -6.309457302093506, "global_step": 94937, "epoch": 2260} {"train_loss": -6.197425842285156, "global_step": 94938, "epoch": 2260} {"train_loss": -6.363971710205078, "global_step": 94939, "epoch": 2260} {"train_loss": -6.284511566162109, "global_step": 94940, "epoch": 2260} {"train_loss": -6.131237506866455, "global_step": 94941, "epoch": 2260} {"train_loss": -6.211164474487305, "global_step": 94942, "epoch": 2260} {"train_loss": -6.175457954406738, "global_step": 94943, "epoch": 2260} {"train_loss": -6.36980676651001, "global_step": 94944, "epoch": 2260} {"train_loss": -6.159728527069092, "global_step": 94945, "epoch": 2260} {"train_loss": -6.252099990844727, "global_step": 94946, "epoch": 2260} {"train_loss": -6.27512788772583, "global_step": 94947, "epoch": 2260} {"train_loss": -6.295440196990967, "global_step": 94948, "epoch": 2260} {"train_loss": -6.238185405731201, "global_step": 94949, "epoch": 2260} {"train_loss": -6.438315391540527, "global_step": 94950, "epoch": 2260} {"train_loss": -6.217791557312012, "global_step": 94951, "epoch": 2260} {"train_loss": -6.347867012023926, "global_step": 94952, "epoch": 2260} {"train_loss": -6.291173934936523, "global_step": 94953, "epoch": 2260} {"train_loss": -6.383094787597656, "global_step": 94954, "epoch": 2260} {"train_loss": -6.205873489379883, "global_step": 94955, "epoch": 2260} {"train_loss": -6.234386444091797, "global_step": 94956, "epoch": 2260} {"train_loss": -6.275659561157227, "global_step": 94957, "epoch": 2260} {"train_loss": -6.257913589477539, "global_step": 94958, "epoch": 2260} {"train_loss": -6.148616790771484, "global_step": 94959, "epoch": 2260} {"train_loss": -6.2936201095581055, "global_step": 94960, "epoch": 2260} {"train_loss": -6.277095544905889, "global_step": 94961, "epoch": 2260, "val_loss": 75415.9921875} {"train_loss": -6.238125801086426, "global_step": 94962, "epoch": 2261} {"train_loss": -6.163264751434326, "global_step": 94963, "epoch": 2261} {"train_loss": -6.221386432647705, "global_step": 94964, "epoch": 2261} {"train_loss": -6.309723377227783, "global_step": 94965, "epoch": 2261} {"train_loss": -6.167095184326172, "global_step": 94966, "epoch": 2261} {"train_loss": -6.198403835296631, "global_step": 94967, "epoch": 2261} {"train_loss": -6.196698188781738, "global_step": 94968, "epoch": 2261} {"train_loss": -6.208546161651611, "global_step": 94969, "epoch": 2261} {"train_loss": -6.175987720489502, "global_step": 94970, "epoch": 2261} {"train_loss": -6.086562156677246, "global_step": 94971, "epoch": 2261} {"train_loss": -6.145407676696777, "global_step": 94972, "epoch": 2261} {"train_loss": -6.334342002868652, "global_step": 94973, "epoch": 2261} {"train_loss": -6.155266761779785, "global_step": 94974, "epoch": 2261} {"train_loss": -6.1858978271484375, "global_step": 94975, "epoch": 2261} {"train_loss": -6.089788436889648, "global_step": 94976, "epoch": 2261} {"train_loss": -6.212754249572754, "global_step": 94977, "epoch": 2261} {"train_loss": -6.206562042236328, "global_step": 94978, "epoch": 2261} {"train_loss": -6.254434585571289, "global_step": 94979, "epoch": 2261} {"train_loss": -6.159981727600098, "global_step": 94980, "epoch": 2261} {"train_loss": -6.3786540031433105, "global_step": 94981, "epoch": 2261} {"train_loss": -6.093742847442627, "global_step": 94982, "epoch": 2261} {"train_loss": -6.271987438201904, "global_step": 94983, "epoch": 2261} {"train_loss": -6.229267120361328, "global_step": 94984, "epoch": 2261} {"train_loss": -6.314424514770508, "global_step": 94985, "epoch": 2261} {"train_loss": -6.156347274780273, "global_step": 94986, "epoch": 2261} {"train_loss": -6.220841884613037, "global_step": 94987, "epoch": 2261} {"train_loss": -6.233454704284668, "global_step": 94988, "epoch": 2261} {"train_loss": -6.319500923156738, "global_step": 94989, "epoch": 2261} {"train_loss": -6.304780006408691, "global_step": 94990, "epoch": 2261} {"train_loss": -6.363930702209473, "global_step": 94991, "epoch": 2261} {"train_loss": -6.324426174163818, "global_step": 94992, "epoch": 2261} {"train_loss": -6.345494270324707, "global_step": 94993, "epoch": 2261} {"train_loss": -6.391986846923828, "global_step": 94994, "epoch": 2261} {"train_loss": -6.229486465454102, "global_step": 94995, "epoch": 2261} {"train_loss": -6.12152624130249, "global_step": 94996, "epoch": 2261} {"train_loss": -6.306379318237305, "global_step": 94997, "epoch": 2261} {"train_loss": -6.369180679321289, "global_step": 94998, "epoch": 2261} {"train_loss": -6.235538482666016, "global_step": 94999, "epoch": 2261} {"train_loss": -6.311740875244141, "global_step": 95000, "epoch": 2261} {"train_loss": -6.2198052406311035, "global_step": 95001, "epoch": 2261} {"train_loss": -6.443753242492676, "global_step": 95002, "epoch": 2261} {"train_loss": -6.242297535850888, "global_step": 95003, "epoch": 2261, "val_loss": 75613.8515625} {"train_loss": -6.420523643493652, "global_step": 95004, "epoch": 2262} {"train_loss": -6.216950416564941, "global_step": 95005, "epoch": 2262} {"train_loss": -6.35869836807251, "global_step": 95006, "epoch": 2262} {"train_loss": -6.313447952270508, "global_step": 95007, "epoch": 2262} {"train_loss": -6.274395942687988, "global_step": 95008, "epoch": 2262} {"train_loss": -6.292997360229492, "global_step": 95009, "epoch": 2262} {"train_loss": -6.3087873458862305, "global_step": 95010, "epoch": 2262} {"train_loss": -6.277308464050293, "global_step": 95011, "epoch": 2262} {"train_loss": -6.3148193359375, "global_step": 95012, "epoch": 2262} {"train_loss": -6.245815277099609, "global_step": 95013, "epoch": 2262} {"train_loss": -6.420142650604248, "global_step": 95014, "epoch": 2262} {"train_loss": -6.320186614990234, "global_step": 95015, "epoch": 2262} {"train_loss": -6.344759941101074, "global_step": 95016, "epoch": 2262} {"train_loss": -6.381468296051025, "global_step": 95017, "epoch": 2262} {"train_loss": -6.350654602050781, "global_step": 95018, "epoch": 2262} {"train_loss": -6.171085357666016, "global_step": 95019, "epoch": 2262} {"train_loss": -6.351802349090576, "global_step": 95020, "epoch": 2262} {"train_loss": -6.324531555175781, "global_step": 95021, "epoch": 2262} {"train_loss": -6.207719802856445, "global_step": 95022, "epoch": 2262} {"train_loss": -6.286959648132324, "global_step": 95023, "epoch": 2262} {"train_loss": -6.347868919372559, "global_step": 95024, "epoch": 2262} {"train_loss": -6.178330421447754, "global_step": 95025, "epoch": 2262} {"train_loss": -6.273773193359375, "global_step": 95026, "epoch": 2262} {"train_loss": -6.378322601318359, "global_step": 95027, "epoch": 2262} {"train_loss": -6.44773006439209, "global_step": 95028, "epoch": 2262} {"train_loss": -6.2044196128845215, "global_step": 95029, "epoch": 2262} {"train_loss": -6.338429927825928, "global_step": 95030, "epoch": 2262} {"train_loss": -6.289045810699463, "global_step": 95031, "epoch": 2262} {"train_loss": -6.2310471534729, "global_step": 95032, "epoch": 2262} {"train_loss": -6.354285717010498, "global_step": 95033, "epoch": 2262} {"train_loss": -6.280002593994141, "global_step": 95034, "epoch": 2262} {"train_loss": -6.24694299697876, "global_step": 95035, "epoch": 2262} {"train_loss": -6.246267318725586, "global_step": 95036, "epoch": 2262} {"train_loss": -6.212414264678955, "global_step": 95037, "epoch": 2262} {"train_loss": -6.188206672668457, "global_step": 95038, "epoch": 2262} {"train_loss": -6.371325492858887, "global_step": 95039, "epoch": 2262} {"train_loss": -6.289527893066406, "global_step": 95040, "epoch": 2262} {"train_loss": -6.26755952835083, "global_step": 95041, "epoch": 2262} {"train_loss": -6.2649030685424805, "global_step": 95042, "epoch": 2262} {"train_loss": -6.191954612731934, "global_step": 95043, "epoch": 2262} {"train_loss": -6.23008918762207, "global_step": 95044, "epoch": 2262} {"train_loss": -6.292399747031076, "global_step": 95045, "epoch": 2262, "val_loss": 75619.5703125} {"train_loss": -6.3812479972839355, "global_step": 95046, "epoch": 2263} {"train_loss": -6.287337303161621, "global_step": 95047, "epoch": 2263} {"train_loss": -6.371588706970215, "global_step": 95048, "epoch": 2263} {"train_loss": -6.414918899536133, "global_step": 95049, "epoch": 2263} {"train_loss": -6.358188152313232, "global_step": 95050, "epoch": 2263} {"train_loss": -6.357271194458008, "global_step": 95051, "epoch": 2263} {"train_loss": -6.318475723266602, "global_step": 95052, "epoch": 2263} {"train_loss": -6.198742866516113, "global_step": 95053, "epoch": 2263} {"train_loss": -6.311627388000488, "global_step": 95054, "epoch": 2263} {"train_loss": -6.339908123016357, "global_step": 95055, "epoch": 2263} {"train_loss": -6.223962306976318, "global_step": 95056, "epoch": 2263} {"train_loss": -6.29367733001709, "global_step": 95057, "epoch": 2263} {"train_loss": -6.213775157928467, "global_step": 95058, "epoch": 2263} {"train_loss": -6.270064830780029, "global_step": 95059, "epoch": 2263} {"train_loss": -6.343482971191406, "global_step": 95060, "epoch": 2263} {"train_loss": -6.222537040710449, "global_step": 95061, "epoch": 2263} {"train_loss": -6.311249732971191, "global_step": 95062, "epoch": 2263} {"train_loss": -6.215963840484619, "global_step": 95063, "epoch": 2263} {"train_loss": -6.217293739318848, "global_step": 95064, "epoch": 2263} {"train_loss": -6.32938814163208, "global_step": 95065, "epoch": 2263} {"train_loss": -6.242796421051025, "global_step": 95066, "epoch": 2263} {"train_loss": -6.209071636199951, "global_step": 95067, "epoch": 2263} {"train_loss": -6.1707258224487305, "global_step": 95068, "epoch": 2263} {"train_loss": -6.340433597564697, "global_step": 95069, "epoch": 2263} {"train_loss": -6.117804050445557, "global_step": 95070, "epoch": 2263} {"train_loss": -6.297900676727295, "global_step": 95071, "epoch": 2263} {"train_loss": -6.131102561950684, "global_step": 95072, "epoch": 2263} {"train_loss": -6.1918416023254395, "global_step": 95073, "epoch": 2263} {"train_loss": -6.370113849639893, "global_step": 95074, "epoch": 2263} {"train_loss": -6.232936859130859, "global_step": 95075, "epoch": 2263} {"train_loss": -6.430011749267578, "global_step": 95076, "epoch": 2263} {"train_loss": -6.172508716583252, "global_step": 95077, "epoch": 2263} {"train_loss": -6.32167387008667, "global_step": 95078, "epoch": 2263} {"train_loss": -6.342705726623535, "global_step": 95079, "epoch": 2263} {"train_loss": -6.279379844665527, "global_step": 95080, "epoch": 2263} {"train_loss": -6.279318809509277, "global_step": 95081, "epoch": 2263} {"train_loss": -6.231545448303223, "global_step": 95082, "epoch": 2263} {"train_loss": -6.129437446594238, "global_step": 95083, "epoch": 2263} {"train_loss": -6.238966464996338, "global_step": 95084, "epoch": 2263} {"train_loss": -6.337076663970947, "global_step": 95085, "epoch": 2263} {"train_loss": -6.222597122192383, "global_step": 95086, "epoch": 2263} {"train_loss": -6.2765174025581, "global_step": 95087, "epoch": 2263, "val_loss": 75582.6640625} {"train_loss": -6.355066299438477, "global_step": 95088, "epoch": 2264} {"train_loss": -6.314937591552734, "global_step": 95089, "epoch": 2264} {"train_loss": -6.340259552001953, "global_step": 95090, "epoch": 2264} {"train_loss": -6.34226655960083, "global_step": 95091, "epoch": 2264} {"train_loss": -6.2257866859436035, "global_step": 95092, "epoch": 2264} {"train_loss": -6.398123741149902, "global_step": 95093, "epoch": 2264} {"train_loss": -6.48403263092041, "global_step": 95094, "epoch": 2264} {"train_loss": -6.445040702819824, "global_step": 95095, "epoch": 2264} {"train_loss": -6.3982696533203125, "global_step": 95096, "epoch": 2264} {"train_loss": -6.390505790710449, "global_step": 95097, "epoch": 2264} {"train_loss": -6.2892560958862305, "global_step": 95098, "epoch": 2264} {"train_loss": -6.202284812927246, "global_step": 95099, "epoch": 2264} {"train_loss": -6.301249980926514, "global_step": 95100, "epoch": 2264} {"train_loss": -6.290184020996094, "global_step": 95101, "epoch": 2264} {"train_loss": -6.220702171325684, "global_step": 95102, "epoch": 2264} {"train_loss": -6.2696428298950195, "global_step": 95103, "epoch": 2264} {"train_loss": -6.26052188873291, "global_step": 95104, "epoch": 2264} {"train_loss": -6.319748878479004, "global_step": 95105, "epoch": 2264} {"train_loss": -6.196317195892334, "global_step": 95106, "epoch": 2264} {"train_loss": -6.274470806121826, "global_step": 95107, "epoch": 2264} {"train_loss": -6.214254856109619, "global_step": 95108, "epoch": 2264} {"train_loss": -6.234655380249023, "global_step": 95109, "epoch": 2264} {"train_loss": -6.3224897384643555, "global_step": 95110, "epoch": 2264} {"train_loss": -6.422693252563477, "global_step": 95111, "epoch": 2264} {"train_loss": -6.27410888671875, "global_step": 95112, "epoch": 2264} {"train_loss": -6.374125003814697, "global_step": 95113, "epoch": 2264} {"train_loss": -6.325682163238525, "global_step": 95114, "epoch": 2264} {"train_loss": -6.324922561645508, "global_step": 95115, "epoch": 2264} {"train_loss": -6.344621181488037, "global_step": 95116, "epoch": 2264} {"train_loss": -6.262094497680664, "global_step": 95117, "epoch": 2264} {"train_loss": -6.23320198059082, "global_step": 95118, "epoch": 2264} {"train_loss": -6.42483377456665, "global_step": 95119, "epoch": 2264} {"train_loss": -6.346155643463135, "global_step": 95120, "epoch": 2264} {"train_loss": -6.374163627624512, "global_step": 95121, "epoch": 2264} {"train_loss": -6.229680061340332, "global_step": 95122, "epoch": 2264} {"train_loss": -6.324244022369385, "global_step": 95123, "epoch": 2264} {"train_loss": -6.311832904815674, "global_step": 95124, "epoch": 2264} {"train_loss": -6.310553550720215, "global_step": 95125, "epoch": 2264} {"train_loss": -6.23978853225708, "global_step": 95126, "epoch": 2264} {"train_loss": -6.299572467803955, "global_step": 95127, "epoch": 2264} {"train_loss": -6.253612518310547, "global_step": 95128, "epoch": 2264} {"train_loss": -6.309216158730643, "global_step": 95129, "epoch": 2264, "val_loss": 75522.6484375} {"train_loss": -6.379525184631348, "global_step": 95130, "epoch": 2265} {"train_loss": -6.291872978210449, "global_step": 95131, "epoch": 2265} {"train_loss": -6.294527530670166, "global_step": 95132, "epoch": 2265} {"train_loss": -6.23826265335083, "global_step": 95133, "epoch": 2265} {"train_loss": -6.3079423904418945, "global_step": 95134, "epoch": 2265} {"train_loss": -6.213432788848877, "global_step": 95135, "epoch": 2265} {"train_loss": -6.280965805053711, "global_step": 95136, "epoch": 2265} {"train_loss": -6.409380912780762, "global_step": 95137, "epoch": 2265} {"train_loss": -6.230532169342041, "global_step": 95138, "epoch": 2265} {"train_loss": -6.286771774291992, "global_step": 95139, "epoch": 2265} {"train_loss": -6.349834442138672, "global_step": 95140, "epoch": 2265} {"train_loss": -6.3869476318359375, "global_step": 95141, "epoch": 2265} {"train_loss": -6.270875930786133, "global_step": 95142, "epoch": 2265} {"train_loss": -6.333812713623047, "global_step": 95143, "epoch": 2265} {"train_loss": -6.288230895996094, "global_step": 95144, "epoch": 2265} {"train_loss": -6.3676981925964355, "global_step": 95145, "epoch": 2265} {"train_loss": -6.221805095672607, "global_step": 95146, "epoch": 2265} {"train_loss": -6.307570457458496, "global_step": 95147, "epoch": 2265} {"train_loss": -6.376354694366455, "global_step": 95148, "epoch": 2265} {"train_loss": -6.311889171600342, "global_step": 95149, "epoch": 2265} {"train_loss": -6.333978176116943, "global_step": 95150, "epoch": 2265} {"train_loss": -6.3580121994018555, "global_step": 95151, "epoch": 2265} {"train_loss": -6.235400199890137, "global_step": 95152, "epoch": 2265} {"train_loss": -6.246681213378906, "global_step": 95153, "epoch": 2265} {"train_loss": -6.324247360229492, "global_step": 95154, "epoch": 2265} {"train_loss": -6.257508277893066, "global_step": 95155, "epoch": 2265} {"train_loss": -6.321045875549316, "global_step": 95156, "epoch": 2265} {"train_loss": -6.437493801116943, "global_step": 95157, "epoch": 2265} {"train_loss": -6.311284065246582, "global_step": 95158, "epoch": 2265} {"train_loss": -6.352644443511963, "global_step": 95159, "epoch": 2265} {"train_loss": -6.427513122558594, "global_step": 95160, "epoch": 2265} {"train_loss": -6.330263614654541, "global_step": 95161, "epoch": 2265} {"train_loss": -6.186454772949219, "global_step": 95162, "epoch": 2265} {"train_loss": -6.341779708862305, "global_step": 95163, "epoch": 2265} {"train_loss": -6.2456135749816895, "global_step": 95164, "epoch": 2265} {"train_loss": -6.404216766357422, "global_step": 95165, "epoch": 2265} {"train_loss": -6.362502574920654, "global_step": 95166, "epoch": 2265} {"train_loss": -6.404826641082764, "global_step": 95167, "epoch": 2265} {"train_loss": -6.294119834899902, "global_step": 95168, "epoch": 2265} {"train_loss": -6.234346866607666, "global_step": 95169, "epoch": 2265} {"train_loss": -6.307299613952637, "global_step": 95170, "epoch": 2265} {"train_loss": -6.3155479317619685, "global_step": 95171, "epoch": 2265, "val_loss": 75700.171875} {"train_loss": -6.272617340087891, "global_step": 95172, "epoch": 2266} {"train_loss": -6.283055782318115, "global_step": 95173, "epoch": 2266} {"train_loss": -6.331219673156738, "global_step": 95174, "epoch": 2266} {"train_loss": -6.267551898956299, "global_step": 95175, "epoch": 2266} {"train_loss": -6.392917633056641, "global_step": 95176, "epoch": 2266} {"train_loss": -6.264131546020508, "global_step": 95177, "epoch": 2266} {"train_loss": -6.278462886810303, "global_step": 95178, "epoch": 2266} {"train_loss": -6.349782466888428, "global_step": 95179, "epoch": 2266} {"train_loss": -6.403420448303223, "global_step": 95180, "epoch": 2266} {"train_loss": -6.260442733764648, "global_step": 95181, "epoch": 2266} {"train_loss": -6.24465799331665, "global_step": 95182, "epoch": 2266} {"train_loss": -6.151725769042969, "global_step": 95183, "epoch": 2266} {"train_loss": -6.287590026855469, "global_step": 95184, "epoch": 2266} {"train_loss": -6.394073486328125, "global_step": 95185, "epoch": 2266} {"train_loss": -6.281073570251465, "global_step": 95186, "epoch": 2266} {"train_loss": -6.281055450439453, "global_step": 95187, "epoch": 2266} {"train_loss": -6.323461532592773, "global_step": 95188, "epoch": 2266} {"train_loss": -6.337905406951904, "global_step": 95189, "epoch": 2266} {"train_loss": -6.233086109161377, "global_step": 95190, "epoch": 2266} {"train_loss": -6.193185806274414, "global_step": 95191, "epoch": 2266} {"train_loss": -6.348799705505371, "global_step": 95192, "epoch": 2266} {"train_loss": -6.296521186828613, "global_step": 95193, "epoch": 2266} {"train_loss": -6.118736267089844, "global_step": 95194, "epoch": 2266} {"train_loss": -6.360787391662598, "global_step": 95195, "epoch": 2266} {"train_loss": -6.1920671463012695, "global_step": 95196, "epoch": 2266} {"train_loss": -6.345244407653809, "global_step": 95197, "epoch": 2266} {"train_loss": -6.207782745361328, "global_step": 95198, "epoch": 2266} {"train_loss": -6.2436723709106445, "global_step": 95199, "epoch": 2266} {"train_loss": -6.374361038208008, "global_step": 95200, "epoch": 2266} {"train_loss": -6.317532539367676, "global_step": 95201, "epoch": 2266} {"train_loss": -6.252447128295898, "global_step": 95202, "epoch": 2266} {"train_loss": -6.245546340942383, "global_step": 95203, "epoch": 2266} {"train_loss": -6.3505754470825195, "global_step": 95204, "epoch": 2266} {"train_loss": -6.394122123718262, "global_step": 95205, "epoch": 2266} {"train_loss": -6.284658908843994, "global_step": 95206, "epoch": 2266} {"train_loss": -6.231781005859375, "global_step": 95207, "epoch": 2266} {"train_loss": -6.260441303253174, "global_step": 95208, "epoch": 2266} {"train_loss": -6.295293807983398, "global_step": 95209, "epoch": 2266} {"train_loss": -6.157660961151123, "global_step": 95210, "epoch": 2266} {"train_loss": -6.213803291320801, "global_step": 95211, "epoch": 2266} {"train_loss": -6.263635635375977, "global_step": 95212, "epoch": 2266} {"train_loss": -6.284739766802106, "global_step": 95213, "epoch": 2266, "val_loss": 75355.59375} {"train_loss": -6.26866340637207, "global_step": 95214, "epoch": 2267} {"train_loss": -6.281130313873291, "global_step": 95215, "epoch": 2267} {"train_loss": -6.250622749328613, "global_step": 95216, "epoch": 2267} {"train_loss": -6.266633987426758, "global_step": 95217, "epoch": 2267} {"train_loss": -6.245065212249756, "global_step": 95218, "epoch": 2267} {"train_loss": -6.310052871704102, "global_step": 95219, "epoch": 2267} {"train_loss": -6.403590202331543, "global_step": 95220, "epoch": 2267} {"train_loss": -6.396223068237305, "global_step": 95221, "epoch": 2267} {"train_loss": -6.326416015625, "global_step": 95222, "epoch": 2267} {"train_loss": -6.323329925537109, "global_step": 95223, "epoch": 2267} {"train_loss": -6.255373954772949, "global_step": 95224, "epoch": 2267} {"train_loss": -6.385998725891113, "global_step": 95225, "epoch": 2267} {"train_loss": -6.347347736358643, "global_step": 95226, "epoch": 2267} {"train_loss": -6.336298942565918, "global_step": 95227, "epoch": 2267} {"train_loss": -6.35821533203125, "global_step": 95228, "epoch": 2267} {"train_loss": -6.404759407043457, "global_step": 95229, "epoch": 2267} {"train_loss": -6.31674337387085, "global_step": 95230, "epoch": 2267} {"train_loss": -6.317513465881348, "global_step": 95231, "epoch": 2267} {"train_loss": -6.384361267089844, "global_step": 95232, "epoch": 2267} {"train_loss": -6.37291955947876, "global_step": 95233, "epoch": 2267} {"train_loss": -6.266953468322754, "global_step": 95234, "epoch": 2267} {"train_loss": -6.427148818969727, "global_step": 95235, "epoch": 2267} {"train_loss": -6.411087989807129, "global_step": 95236, "epoch": 2267} {"train_loss": -6.301695823669434, "global_step": 95237, "epoch": 2267} {"train_loss": -6.368155479431152, "global_step": 95238, "epoch": 2267} {"train_loss": -6.326957702636719, "global_step": 95239, "epoch": 2267} {"train_loss": -6.271791458129883, "global_step": 95240, "epoch": 2267} {"train_loss": -6.233380317687988, "global_step": 95241, "epoch": 2267} {"train_loss": -6.257503032684326, "global_step": 95242, "epoch": 2267} {"train_loss": -6.247384548187256, "global_step": 95243, "epoch": 2267} {"train_loss": -6.400833606719971, "global_step": 95244, "epoch": 2267} {"train_loss": -6.28859806060791, "global_step": 95245, "epoch": 2267} {"train_loss": -6.216858863830566, "global_step": 95246, "epoch": 2267} {"train_loss": -6.389332294464111, "global_step": 95247, "epoch": 2267} {"train_loss": -6.227641582489014, "global_step": 95248, "epoch": 2267} {"train_loss": -6.260231018066406, "global_step": 95249, "epoch": 2267} {"train_loss": -6.323971748352051, "global_step": 95250, "epoch": 2267} {"train_loss": -6.212308406829834, "global_step": 95251, "epoch": 2267} {"train_loss": -6.275623798370361, "global_step": 95252, "epoch": 2267} {"train_loss": -6.28469181060791, "global_step": 95253, "epoch": 2267} {"train_loss": -6.238654613494873, "global_step": 95254, "epoch": 2267} {"train_loss": -6.311685528073992, "global_step": 95255, "epoch": 2267, "val_loss": 75779.2734375} {"train_loss": -6.188591957092285, "global_step": 95256, "epoch": 2268} {"train_loss": -6.344391822814941, "global_step": 95257, "epoch": 2268} {"train_loss": -6.20123291015625, "global_step": 95258, "epoch": 2268} {"train_loss": -6.347992420196533, "global_step": 95259, "epoch": 2268} {"train_loss": -6.362377166748047, "global_step": 95260, "epoch": 2268} {"train_loss": -6.26115083694458, "global_step": 95261, "epoch": 2268} {"train_loss": -6.353936195373535, "global_step": 95262, "epoch": 2268} {"train_loss": -6.295604705810547, "global_step": 95263, "epoch": 2268} {"train_loss": -6.21013069152832, "global_step": 95264, "epoch": 2268} {"train_loss": -6.365983486175537, "global_step": 95265, "epoch": 2268} {"train_loss": -6.252917289733887, "global_step": 95266, "epoch": 2268} {"train_loss": -6.337871551513672, "global_step": 95267, "epoch": 2268} {"train_loss": -6.251494884490967, "global_step": 95268, "epoch": 2268} {"train_loss": -6.36700963973999, "global_step": 95269, "epoch": 2268} {"train_loss": -6.20283842086792, "global_step": 95270, "epoch": 2268} {"train_loss": -6.260628700256348, "global_step": 95271, "epoch": 2268} {"train_loss": -6.373729228973389, "global_step": 95272, "epoch": 2268} {"train_loss": -6.26576042175293, "global_step": 95273, "epoch": 2268} {"train_loss": -6.2717180252075195, "global_step": 95274, "epoch": 2268} {"train_loss": -6.304052829742432, "global_step": 95275, "epoch": 2268} {"train_loss": -6.251584053039551, "global_step": 95276, "epoch": 2268} {"train_loss": -6.348038673400879, "global_step": 95277, "epoch": 2268} {"train_loss": -6.30091667175293, "global_step": 95278, "epoch": 2268} {"train_loss": -6.3263959884643555, "global_step": 95279, "epoch": 2268} {"train_loss": -6.221149444580078, "global_step": 95280, "epoch": 2268} {"train_loss": -6.226568222045898, "global_step": 95281, "epoch": 2268} {"train_loss": -6.185931205749512, "global_step": 95282, "epoch": 2268} {"train_loss": -6.299918174743652, "global_step": 95283, "epoch": 2268} {"train_loss": -6.204230308532715, "global_step": 95284, "epoch": 2268} {"train_loss": -6.354717254638672, "global_step": 95285, "epoch": 2268} {"train_loss": -6.291898727416992, "global_step": 95286, "epoch": 2268} {"train_loss": -6.1952619552612305, "global_step": 95287, "epoch": 2268} {"train_loss": -6.209319591522217, "global_step": 95288, "epoch": 2268} {"train_loss": -6.146843910217285, "global_step": 95289, "epoch": 2268} {"train_loss": -6.312038421630859, "global_step": 95290, "epoch": 2268} {"train_loss": -6.249317169189453, "global_step": 95291, "epoch": 2268} {"train_loss": -6.216431617736816, "global_step": 95292, "epoch": 2268} {"train_loss": -6.186587333679199, "global_step": 95293, "epoch": 2268} {"train_loss": -6.172410011291504, "global_step": 95294, "epoch": 2268} {"train_loss": -6.262676239013672, "global_step": 95295, "epoch": 2268} {"train_loss": -6.15776252746582, "global_step": 95296, "epoch": 2268} {"train_loss": -6.26535279410226, "global_step": 95297, "epoch": 2268, "val_loss": 75974.1640625} {"train_loss": -6.063920021057129, "global_step": 95298, "epoch": 2269} {"train_loss": -6.161890983581543, "global_step": 95299, "epoch": 2269} {"train_loss": -6.297402381896973, "global_step": 95300, "epoch": 2269} {"train_loss": -6.323367118835449, "global_step": 95301, "epoch": 2269} {"train_loss": -6.298648357391357, "global_step": 95302, "epoch": 2269} {"train_loss": -6.33533239364624, "global_step": 95303, "epoch": 2269} {"train_loss": -6.213491916656494, "global_step": 95304, "epoch": 2269} {"train_loss": -6.422584056854248, "global_step": 95305, "epoch": 2269} {"train_loss": -6.390159606933594, "global_step": 95306, "epoch": 2269} {"train_loss": -6.380451202392578, "global_step": 95307, "epoch": 2269} {"train_loss": -6.31517219543457, "global_step": 95308, "epoch": 2269} {"train_loss": -6.271191596984863, "global_step": 95309, "epoch": 2269} {"train_loss": -6.158076763153076, "global_step": 95310, "epoch": 2269} {"train_loss": -6.245640754699707, "global_step": 95311, "epoch": 2269} {"train_loss": -6.287322998046875, "global_step": 95312, "epoch": 2269} {"train_loss": -6.307951927185059, "global_step": 95313, "epoch": 2269} {"train_loss": -6.325551986694336, "global_step": 95314, "epoch": 2269} {"train_loss": -6.28189754486084, "global_step": 95315, "epoch": 2269} {"train_loss": -6.378783226013184, "global_step": 95316, "epoch": 2269} {"train_loss": -6.376936912536621, "global_step": 95317, "epoch": 2269} {"train_loss": -6.214269161224365, "global_step": 95318, "epoch": 2269} {"train_loss": -6.439126968383789, "global_step": 95319, "epoch": 2269} {"train_loss": -6.382302284240723, "global_step": 95320, "epoch": 2269} {"train_loss": -6.304583549499512, "global_step": 95321, "epoch": 2269} {"train_loss": -6.317055702209473, "global_step": 95322, "epoch": 2269} {"train_loss": -6.315927505493164, "global_step": 95323, "epoch": 2269} {"train_loss": -6.323770046234131, "global_step": 95324, "epoch": 2269} {"train_loss": -6.240781784057617, "global_step": 95325, "epoch": 2269} {"train_loss": -6.206570625305176, "global_step": 95326, "epoch": 2269} {"train_loss": -6.286415100097656, "global_step": 95327, "epoch": 2269} {"train_loss": -6.331433296203613, "global_step": 95328, "epoch": 2269} {"train_loss": -6.312721252441406, "global_step": 95329, "epoch": 2269} {"train_loss": -6.284557819366455, "global_step": 95330, "epoch": 2269} {"train_loss": -6.366839408874512, "global_step": 95331, "epoch": 2269} {"train_loss": -6.3083577156066895, "global_step": 95332, "epoch": 2269} {"train_loss": -6.413753509521484, "global_step": 95333, "epoch": 2269} {"train_loss": -6.315949440002441, "global_step": 95334, "epoch": 2269} {"train_loss": -6.276602745056152, "global_step": 95335, "epoch": 2269} {"train_loss": -6.27398681640625, "global_step": 95336, "epoch": 2269} {"train_loss": -6.2702484130859375, "global_step": 95337, "epoch": 2269} {"train_loss": -6.225150108337402, "global_step": 95338, "epoch": 2269} {"train_loss": -6.299508844103132, "global_step": 95339, "epoch": 2269, "val_loss": 75766.046875} {"train_loss": -6.498003005981445, "global_step": 95340, "epoch": 2270} {"train_loss": -6.285544395446777, "global_step": 95341, "epoch": 2270} {"train_loss": -6.3010969161987305, "global_step": 95342, "epoch": 2270} {"train_loss": -6.387686729431152, "global_step": 95343, "epoch": 2270} {"train_loss": -6.349130630493164, "global_step": 95344, "epoch": 2270} {"train_loss": -6.342853546142578, "global_step": 95345, "epoch": 2270} {"train_loss": -6.272171974182129, "global_step": 95346, "epoch": 2270} {"train_loss": -6.448511600494385, "global_step": 95347, "epoch": 2270} {"train_loss": -6.396172523498535, "global_step": 95348, "epoch": 2270} {"train_loss": -6.218599319458008, "global_step": 95349, "epoch": 2270} {"train_loss": -6.278104305267334, "global_step": 95350, "epoch": 2270} {"train_loss": -6.283535957336426, "global_step": 95351, "epoch": 2270} {"train_loss": -6.428586006164551, "global_step": 95352, "epoch": 2270} {"train_loss": -6.304818153381348, "global_step": 95353, "epoch": 2270} {"train_loss": -6.28201150894165, "global_step": 95354, "epoch": 2270} {"train_loss": -6.2021589279174805, "global_step": 95355, "epoch": 2270} {"train_loss": -6.277523040771484, "global_step": 95356, "epoch": 2270} {"train_loss": -6.276392936706543, "global_step": 95357, "epoch": 2270} {"train_loss": -6.351925373077393, "global_step": 95358, "epoch": 2270} {"train_loss": -6.334282875061035, "global_step": 95359, "epoch": 2270} {"train_loss": -6.276034355163574, "global_step": 95360, "epoch": 2270} {"train_loss": -6.302363395690918, "global_step": 95361, "epoch": 2270} {"train_loss": -6.330865859985352, "global_step": 95362, "epoch": 2270} {"train_loss": -6.3804168701171875, "global_step": 95363, "epoch": 2270} {"train_loss": -6.371515274047852, "global_step": 95364, "epoch": 2270} {"train_loss": -6.375767230987549, "global_step": 95365, "epoch": 2270} {"train_loss": -6.237429618835449, "global_step": 95366, "epoch": 2270} {"train_loss": -6.3667402267456055, "global_step": 95367, "epoch": 2270} {"train_loss": -6.185529708862305, "global_step": 95368, "epoch": 2270} {"train_loss": -6.2612199783325195, "global_step": 95369, "epoch": 2270} {"train_loss": -6.336125373840332, "global_step": 95370, "epoch": 2270} {"train_loss": -6.242814064025879, "global_step": 95371, "epoch": 2270} {"train_loss": -6.337075233459473, "global_step": 95372, "epoch": 2270} {"train_loss": -6.332839012145996, "global_step": 95373, "epoch": 2270} {"train_loss": -6.253697872161865, "global_step": 95374, "epoch": 2270} {"train_loss": -6.284030914306641, "global_step": 95375, "epoch": 2270} {"train_loss": -6.295988082885742, "global_step": 95376, "epoch": 2270} {"train_loss": -6.347378730773926, "global_step": 95377, "epoch": 2270} {"train_loss": -6.363863945007324, "global_step": 95378, "epoch": 2270} {"train_loss": -6.284533500671387, "global_step": 95379, "epoch": 2270} {"train_loss": -6.315314292907715, "global_step": 95380, "epoch": 2270} {"train_loss": -6.315068358466739, "global_step": 95381, "epoch": 2270, "val_loss": 75721.25} {"train_loss": -6.407042503356934, "global_step": 95382, "epoch": 2271} {"train_loss": -6.396677494049072, "global_step": 95383, "epoch": 2271} {"train_loss": -6.327675819396973, "global_step": 95384, "epoch": 2271} {"train_loss": -6.300497055053711, "global_step": 95385, "epoch": 2271} {"train_loss": -6.215828895568848, "global_step": 95386, "epoch": 2271} {"train_loss": -6.374812602996826, "global_step": 95387, "epoch": 2271} {"train_loss": -6.283504962921143, "global_step": 95388, "epoch": 2271} {"train_loss": -6.479002952575684, "global_step": 95389, "epoch": 2271} {"train_loss": -6.310927391052246, "global_step": 95390, "epoch": 2271} {"train_loss": -6.320496559143066, "global_step": 95391, "epoch": 2271} {"train_loss": -6.35211706161499, "global_step": 95392, "epoch": 2271} {"train_loss": -6.319683074951172, "global_step": 95393, "epoch": 2271} {"train_loss": -6.276182174682617, "global_step": 95394, "epoch": 2271} {"train_loss": -6.322477340698242, "global_step": 95395, "epoch": 2271} {"train_loss": -6.296753883361816, "global_step": 95396, "epoch": 2271} {"train_loss": -6.275638580322266, "global_step": 95397, "epoch": 2271} {"train_loss": -6.264782905578613, "global_step": 95398, "epoch": 2271} {"train_loss": -6.305129051208496, "global_step": 95399, "epoch": 2271} {"train_loss": -6.331840515136719, "global_step": 95400, "epoch": 2271} {"train_loss": -6.300631523132324, "global_step": 95401, "epoch": 2271} {"train_loss": -6.361792087554932, "global_step": 95402, "epoch": 2271} {"train_loss": -6.291027545928955, "global_step": 95403, "epoch": 2271} {"train_loss": -6.346921920776367, "global_step": 95404, "epoch": 2271} {"train_loss": -6.318599700927734, "global_step": 95405, "epoch": 2271} {"train_loss": -6.291171550750732, "global_step": 95406, "epoch": 2271} {"train_loss": -6.510199546813965, "global_step": 95407, "epoch": 2271} {"train_loss": -6.288366317749023, "global_step": 95408, "epoch": 2271} {"train_loss": -6.338314056396484, "global_step": 95409, "epoch": 2271} {"train_loss": -6.404650688171387, "global_step": 95410, "epoch": 2271} {"train_loss": -6.371264457702637, "global_step": 95411, "epoch": 2271} {"train_loss": -6.352384567260742, "global_step": 95412, "epoch": 2271} {"train_loss": -6.422569751739502, "global_step": 95413, "epoch": 2271} {"train_loss": -6.313073635101318, "global_step": 95414, "epoch": 2271} {"train_loss": -6.342341899871826, "global_step": 95415, "epoch": 2271} {"train_loss": -6.326137542724609, "global_step": 95416, "epoch": 2271} {"train_loss": -6.29141092300415, "global_step": 95417, "epoch": 2271} {"train_loss": -6.372714996337891, "global_step": 95418, "epoch": 2271} {"train_loss": -6.35866641998291, "global_step": 95419, "epoch": 2271} {"train_loss": -6.384248733520508, "global_step": 95420, "epoch": 2271} {"train_loss": -6.3282599449157715, "global_step": 95421, "epoch": 2271} {"train_loss": -6.350547790527344, "global_step": 95422, "epoch": 2271} {"train_loss": -6.336998349144345, "global_step": 95423, "epoch": 2271, "val_loss": 75695.140625} {"train_loss": -6.277636528015137, "global_step": 95424, "epoch": 2272} {"train_loss": -6.507323265075684, "global_step": 95425, "epoch": 2272} {"train_loss": -6.351670742034912, "global_step": 95426, "epoch": 2272} {"train_loss": -6.303329944610596, "global_step": 95427, "epoch": 2272} {"train_loss": -6.412976264953613, "global_step": 95428, "epoch": 2272} {"train_loss": -6.376676559448242, "global_step": 95429, "epoch": 2272} {"train_loss": -6.28269100189209, "global_step": 95430, "epoch": 2272} {"train_loss": -6.411936283111572, "global_step": 95431, "epoch": 2272} {"train_loss": -6.289338111877441, "global_step": 95432, "epoch": 2272} {"train_loss": -6.269227981567383, "global_step": 95433, "epoch": 2272} {"train_loss": -6.366366863250732, "global_step": 95434, "epoch": 2272} {"train_loss": -6.3055267333984375, "global_step": 95435, "epoch": 2272} {"train_loss": -6.286638259887695, "global_step": 95436, "epoch": 2272} {"train_loss": -6.206007957458496, "global_step": 95437, "epoch": 2272} {"train_loss": -6.282901763916016, "global_step": 95438, "epoch": 2272} {"train_loss": -6.38018798828125, "global_step": 95439, "epoch": 2272} {"train_loss": -6.214282989501953, "global_step": 95440, "epoch": 2272} {"train_loss": -6.3318305015563965, "global_step": 95441, "epoch": 2272} {"train_loss": -6.193297386169434, "global_step": 95442, "epoch": 2272} {"train_loss": -6.227989196777344, "global_step": 95443, "epoch": 2272} {"train_loss": -6.223641395568848, "global_step": 95444, "epoch": 2272} {"train_loss": -6.147377967834473, "global_step": 95445, "epoch": 2272} {"train_loss": -6.170193195343018, "global_step": 95446, "epoch": 2272} {"train_loss": -6.241686820983887, "global_step": 95447, "epoch": 2272} {"train_loss": -6.306984901428223, "global_step": 95448, "epoch": 2272} {"train_loss": -6.174776077270508, "global_step": 95449, "epoch": 2272} {"train_loss": -6.268792152404785, "global_step": 95450, "epoch": 2272} {"train_loss": -6.175412178039551, "global_step": 95451, "epoch": 2272} {"train_loss": -6.288829803466797, "global_step": 95452, "epoch": 2272} {"train_loss": -6.271860122680664, "global_step": 95453, "epoch": 2272} {"train_loss": -6.200374603271484, "global_step": 95454, "epoch": 2272} {"train_loss": -6.35307502746582, "global_step": 95455, "epoch": 2272} {"train_loss": -6.309600830078125, "global_step": 95456, "epoch": 2272} {"train_loss": -6.263077735900879, "global_step": 95457, "epoch": 2272} {"train_loss": -6.314167022705078, "global_step": 95458, "epoch": 2272} {"train_loss": -6.240452766418457, "global_step": 95459, "epoch": 2272} {"train_loss": -6.312029838562012, "global_step": 95460, "epoch": 2272} {"train_loss": -6.287524700164795, "global_step": 95461, "epoch": 2272} {"train_loss": -6.23664665222168, "global_step": 95462, "epoch": 2272} {"train_loss": -6.336755752563477, "global_step": 95463, "epoch": 2272} {"train_loss": -6.295618057250977, "global_step": 95464, "epoch": 2272} {"train_loss": -6.286159742446173, "global_step": 95465, "epoch": 2272, "val_loss": 75908.7578125} {"train_loss": -6.23127555847168, "global_step": 95466, "epoch": 2273} {"train_loss": -6.282533645629883, "global_step": 95467, "epoch": 2273} {"train_loss": -6.409116744995117, "global_step": 95468, "epoch": 2273} {"train_loss": -6.3104658126831055, "global_step": 95469, "epoch": 2273} {"train_loss": -6.261414527893066, "global_step": 95470, "epoch": 2273} {"train_loss": -6.203708648681641, "global_step": 95471, "epoch": 2273} {"train_loss": -6.340181350708008, "global_step": 95472, "epoch": 2273} {"train_loss": -6.293723106384277, "global_step": 95473, "epoch": 2273} {"train_loss": -6.252346038818359, "global_step": 95474, "epoch": 2273} {"train_loss": -6.311359405517578, "global_step": 95475, "epoch": 2273} {"train_loss": -6.3459649085998535, "global_step": 95476, "epoch": 2273} {"train_loss": -6.439676761627197, "global_step": 95477, "epoch": 2273} {"train_loss": -6.333194732666016, "global_step": 95478, "epoch": 2273} {"train_loss": -6.301568031311035, "global_step": 95479, "epoch": 2273} {"train_loss": -6.332426071166992, "global_step": 95480, "epoch": 2273} {"train_loss": -6.295663833618164, "global_step": 95481, "epoch": 2273} {"train_loss": -6.256095886230469, "global_step": 95482, "epoch": 2273} {"train_loss": -6.250101566314697, "global_step": 95483, "epoch": 2273} {"train_loss": -6.375528812408447, "global_step": 95484, "epoch": 2273} {"train_loss": -6.3565216064453125, "global_step": 95485, "epoch": 2273} {"train_loss": -6.347233295440674, "global_step": 95486, "epoch": 2273} {"train_loss": -6.432081699371338, "global_step": 95487, "epoch": 2273} {"train_loss": -6.2802581787109375, "global_step": 95488, "epoch": 2273} {"train_loss": -6.2329325675964355, "global_step": 95489, "epoch": 2273} {"train_loss": -6.061001300811768, "global_step": 95490, "epoch": 2273} {"train_loss": -6.307721138000488, "global_step": 95491, "epoch": 2273} {"train_loss": -6.213589668273926, "global_step": 95492, "epoch": 2273} {"train_loss": -6.345270156860352, "global_step": 95493, "epoch": 2273} {"train_loss": -6.246860027313232, "global_step": 95494, "epoch": 2273} {"train_loss": -6.2801923751831055, "global_step": 95495, "epoch": 2273} {"train_loss": -6.311199188232422, "global_step": 95496, "epoch": 2273} {"train_loss": -6.42044734954834, "global_step": 95497, "epoch": 2273} {"train_loss": -6.345498085021973, "global_step": 95498, "epoch": 2273} {"train_loss": -6.311798095703125, "global_step": 95499, "epoch": 2273} {"train_loss": -6.340656280517578, "global_step": 95500, "epoch": 2273} {"train_loss": -6.306878089904785, "global_step": 95501, "epoch": 2273} {"train_loss": -6.3159027099609375, "global_step": 95502, "epoch": 2273} {"train_loss": -6.462226867675781, "global_step": 95503, "epoch": 2273} {"train_loss": -6.508678436279297, "global_step": 95504, "epoch": 2273} {"train_loss": -6.280746936798096, "global_step": 95505, "epoch": 2273} {"train_loss": -6.472632884979248, "global_step": 95506, "epoch": 2273} {"train_loss": -6.318381581987653, "global_step": 95507, "epoch": 2273, "val_loss": 75574.3984375} {"train_loss": -6.329296588897705, "global_step": 95508, "epoch": 2274} {"train_loss": -6.422759056091309, "global_step": 95509, "epoch": 2274} {"train_loss": -6.283511638641357, "global_step": 95510, "epoch": 2274} {"train_loss": -6.224413871765137, "global_step": 95511, "epoch": 2274} {"train_loss": -6.4232177734375, "global_step": 95512, "epoch": 2274} {"train_loss": -6.274044990539551, "global_step": 95513, "epoch": 2274} {"train_loss": -6.363104343414307, "global_step": 95514, "epoch": 2274} {"train_loss": -6.243494510650635, "global_step": 95515, "epoch": 2274} {"train_loss": -6.262242317199707, "global_step": 95516, "epoch": 2274} {"train_loss": -6.3394293785095215, "global_step": 95517, "epoch": 2274} {"train_loss": -6.395871162414551, "global_step": 95518, "epoch": 2274} {"train_loss": -6.263680458068848, "global_step": 95519, "epoch": 2274} {"train_loss": -6.304474830627441, "global_step": 95520, "epoch": 2274} {"train_loss": -6.338913917541504, "global_step": 95521, "epoch": 2274} {"train_loss": -6.2378249168396, "global_step": 95522, "epoch": 2274} {"train_loss": -6.296420574188232, "global_step": 95523, "epoch": 2274} {"train_loss": -6.299890041351318, "global_step": 95524, "epoch": 2274} {"train_loss": -6.397426128387451, "global_step": 95525, "epoch": 2274} {"train_loss": -6.215913772583008, "global_step": 95526, "epoch": 2274} {"train_loss": -6.364313125610352, "global_step": 95527, "epoch": 2274} {"train_loss": -6.26861572265625, "global_step": 95528, "epoch": 2274} {"train_loss": -6.2606658935546875, "global_step": 95529, "epoch": 2274} {"train_loss": -6.252140045166016, "global_step": 95530, "epoch": 2274} {"train_loss": -6.192988872528076, "global_step": 95531, "epoch": 2274} {"train_loss": -6.310422897338867, "global_step": 95532, "epoch": 2274} {"train_loss": -6.27347469329834, "global_step": 95533, "epoch": 2274} {"train_loss": -6.219090938568115, "global_step": 95534, "epoch": 2274} {"train_loss": -6.307561874389648, "global_step": 95535, "epoch": 2274} {"train_loss": -6.265920639038086, "global_step": 95536, "epoch": 2274} {"train_loss": -6.383806228637695, "global_step": 95537, "epoch": 2274} {"train_loss": -6.192285537719727, "global_step": 95538, "epoch": 2274} {"train_loss": -6.214153289794922, "global_step": 95539, "epoch": 2274} {"train_loss": -6.247096538543701, "global_step": 95540, "epoch": 2274} {"train_loss": -6.298645973205566, "global_step": 95541, "epoch": 2274} {"train_loss": -6.2740478515625, "global_step": 95542, "epoch": 2274} {"train_loss": -6.273474216461182, "global_step": 95543, "epoch": 2274} {"train_loss": -6.223952293395996, "global_step": 95544, "epoch": 2274} {"train_loss": -6.336249351501465, "global_step": 95545, "epoch": 2274} {"train_loss": -6.352989196777344, "global_step": 95546, "epoch": 2274} {"train_loss": -6.228266716003418, "global_step": 95547, "epoch": 2274} {"train_loss": -6.385805130004883, "global_step": 95548, "epoch": 2274} {"train_loss": -6.292285851069859, "global_step": 95549, "epoch": 2274, "val_loss": 75355.3125} {"train_loss": -6.294922828674316, "global_step": 95550, "epoch": 2275} {"train_loss": -6.321968078613281, "global_step": 95551, "epoch": 2275} {"train_loss": -6.266809463500977, "global_step": 95552, "epoch": 2275} {"train_loss": -6.3052191734313965, "global_step": 95553, "epoch": 2275} {"train_loss": -6.207852840423584, "global_step": 95554, "epoch": 2275} {"train_loss": -6.311641693115234, "global_step": 95555, "epoch": 2275} {"train_loss": -6.223814487457275, "global_step": 95556, "epoch": 2275} {"train_loss": -6.344731330871582, "global_step": 95557, "epoch": 2275} {"train_loss": -6.170355796813965, "global_step": 95558, "epoch": 2275} {"train_loss": -6.254697799682617, "global_step": 95559, "epoch": 2275} {"train_loss": -6.095486640930176, "global_step": 95560, "epoch": 2275} {"train_loss": -6.230686187744141, "global_step": 95561, "epoch": 2275} {"train_loss": -6.296082496643066, "global_step": 95562, "epoch": 2275} {"train_loss": -6.080647945404053, "global_step": 95563, "epoch": 2275} {"train_loss": -6.2188005447387695, "global_step": 95564, "epoch": 2275} {"train_loss": -6.214651107788086, "global_step": 95565, "epoch": 2275} {"train_loss": -6.2241668701171875, "global_step": 95566, "epoch": 2275} {"train_loss": -6.229233741760254, "global_step": 95567, "epoch": 2275} {"train_loss": -6.255585670471191, "global_step": 95568, "epoch": 2275} {"train_loss": -6.2779316902160645, "global_step": 95569, "epoch": 2275} {"train_loss": -6.27742862701416, "global_step": 95570, "epoch": 2275} {"train_loss": -6.230957508087158, "global_step": 95571, "epoch": 2275} {"train_loss": -6.276117324829102, "global_step": 95572, "epoch": 2275} {"train_loss": -6.320741176605225, "global_step": 95573, "epoch": 2275} {"train_loss": -6.264660358428955, "global_step": 95574, "epoch": 2275} {"train_loss": -6.270122528076172, "global_step": 95575, "epoch": 2275} {"train_loss": -6.298864364624023, "global_step": 95576, "epoch": 2275} {"train_loss": -6.491833686828613, "global_step": 95577, "epoch": 2275} {"train_loss": -6.317056179046631, "global_step": 95578, "epoch": 2275} {"train_loss": -6.401033401489258, "global_step": 95579, "epoch": 2275} {"train_loss": -6.2923502922058105, "global_step": 95580, "epoch": 2275} {"train_loss": -6.26375675201416, "global_step": 95581, "epoch": 2275} {"train_loss": -6.248100280761719, "global_step": 95582, "epoch": 2275} {"train_loss": -6.25993013381958, "global_step": 95583, "epoch": 2275} {"train_loss": -6.443783760070801, "global_step": 95584, "epoch": 2275} {"train_loss": -6.244089603424072, "global_step": 95585, "epoch": 2275} {"train_loss": -6.2177863121032715, "global_step": 95586, "epoch": 2275} {"train_loss": -6.164754390716553, "global_step": 95587, "epoch": 2275} {"train_loss": -6.211615562438965, "global_step": 95588, "epoch": 2275} {"train_loss": -6.372702121734619, "global_step": 95589, "epoch": 2275} {"train_loss": -6.293058395385742, "global_step": 95590, "epoch": 2275} {"train_loss": -6.268683649244762, "global_step": 95591, "epoch": 2275, "val_loss": 75829.484375} {"train_loss": -6.223553657531738, "global_step": 95592, "epoch": 2276} {"train_loss": -6.36376428604126, "global_step": 95593, "epoch": 2276} {"train_loss": -6.239776134490967, "global_step": 95594, "epoch": 2276} {"train_loss": -6.2625627517700195, "global_step": 95595, "epoch": 2276} {"train_loss": -6.36473274230957, "global_step": 95596, "epoch": 2276} {"train_loss": -6.338559150695801, "global_step": 95597, "epoch": 2276} {"train_loss": -6.3639984130859375, "global_step": 95598, "epoch": 2276} {"train_loss": -6.318033218383789, "global_step": 95599, "epoch": 2276} {"train_loss": -6.2447967529296875, "global_step": 95600, "epoch": 2276} {"train_loss": -6.306546211242676, "global_step": 95601, "epoch": 2276} {"train_loss": -6.367819786071777, "global_step": 95602, "epoch": 2276} {"train_loss": -6.33463716506958, "global_step": 95603, "epoch": 2276} {"train_loss": -6.323955535888672, "global_step": 95604, "epoch": 2276} {"train_loss": -6.317117214202881, "global_step": 95605, "epoch": 2276} {"train_loss": -6.169355392456055, "global_step": 95606, "epoch": 2276} {"train_loss": -6.2975616455078125, "global_step": 95607, "epoch": 2276} {"train_loss": -6.292705059051514, "global_step": 95608, "epoch": 2276} {"train_loss": -6.190204620361328, "global_step": 95609, "epoch": 2276} {"train_loss": -6.49439001083374, "global_step": 95610, "epoch": 2276} {"train_loss": -6.175217628479004, "global_step": 95611, "epoch": 2276} {"train_loss": -6.335690975189209, "global_step": 95612, "epoch": 2276} {"train_loss": -6.315281867980957, "global_step": 95613, "epoch": 2276} {"train_loss": -6.299874305725098, "global_step": 95614, "epoch": 2276} {"train_loss": -6.312042713165283, "global_step": 95615, "epoch": 2276} {"train_loss": -6.243662357330322, "global_step": 95616, "epoch": 2276} {"train_loss": -6.364500999450684, "global_step": 95617, "epoch": 2276} {"train_loss": -6.366092681884766, "global_step": 95618, "epoch": 2276} {"train_loss": -6.330395698547363, "global_step": 95619, "epoch": 2276} {"train_loss": -6.332736968994141, "global_step": 95620, "epoch": 2276} {"train_loss": -6.338953018188477, "global_step": 95621, "epoch": 2276} {"train_loss": -6.3679094314575195, "global_step": 95622, "epoch": 2276} {"train_loss": -6.313427925109863, "global_step": 95623, "epoch": 2276} {"train_loss": -6.388665676116943, "global_step": 95624, "epoch": 2276} {"train_loss": -6.340858459472656, "global_step": 95625, "epoch": 2276} {"train_loss": -6.216601371765137, "global_step": 95626, "epoch": 2276} {"train_loss": -6.403428077697754, "global_step": 95627, "epoch": 2276} {"train_loss": -6.259594917297363, "global_step": 95628, "epoch": 2276} {"train_loss": -6.326637268066406, "global_step": 95629, "epoch": 2276} {"train_loss": -6.214835166931152, "global_step": 95630, "epoch": 2276} {"train_loss": -6.249253273010254, "global_step": 95631, "epoch": 2276} {"train_loss": -6.3474016189575195, "global_step": 95632, "epoch": 2276} {"train_loss": -6.30819761185419, "global_step": 95633, "epoch": 2276, "val_loss": 75537.421875} {"train_loss": -6.32914400100708, "global_step": 95634, "epoch": 2277} {"train_loss": -6.3576860427856445, "global_step": 95635, "epoch": 2277} {"train_loss": -6.2775750160217285, "global_step": 95636, "epoch": 2277} {"train_loss": -6.3672404289245605, "global_step": 95637, "epoch": 2277} {"train_loss": -6.263509750366211, "global_step": 95638, "epoch": 2277} {"train_loss": -6.181906700134277, "global_step": 95639, "epoch": 2277} {"train_loss": -6.33983850479126, "global_step": 95640, "epoch": 2277} {"train_loss": -6.326177597045898, "global_step": 95641, "epoch": 2277} {"train_loss": -6.356025695800781, "global_step": 95642, "epoch": 2277} {"train_loss": -6.301619052886963, "global_step": 95643, "epoch": 2277} {"train_loss": -6.3699445724487305, "global_step": 95644, "epoch": 2277} {"train_loss": -6.362542629241943, "global_step": 95645, "epoch": 2277} {"train_loss": -6.365169525146484, "global_step": 95646, "epoch": 2277} {"train_loss": -6.239997863769531, "global_step": 95647, "epoch": 2277} {"train_loss": -6.282905101776123, "global_step": 95648, "epoch": 2277} {"train_loss": -6.411876678466797, "global_step": 95649, "epoch": 2277} {"train_loss": -6.308266639709473, "global_step": 95650, "epoch": 2277} {"train_loss": -6.195055961608887, "global_step": 95651, "epoch": 2277} {"train_loss": -6.172147274017334, "global_step": 95652, "epoch": 2277} {"train_loss": -6.343014717102051, "global_step": 95653, "epoch": 2277} {"train_loss": -6.254871368408203, "global_step": 95654, "epoch": 2277} {"train_loss": -6.346275806427002, "global_step": 95655, "epoch": 2277} {"train_loss": -6.2785515785217285, "global_step": 95656, "epoch": 2277} {"train_loss": -6.3941450119018555, "global_step": 95657, "epoch": 2277} {"train_loss": -6.4350481033325195, "global_step": 95658, "epoch": 2277} {"train_loss": -6.315989971160889, "global_step": 95659, "epoch": 2277} {"train_loss": -6.246430397033691, "global_step": 95660, "epoch": 2277} {"train_loss": -6.388837814331055, "global_step": 95661, "epoch": 2277} {"train_loss": -6.347768783569336, "global_step": 95662, "epoch": 2277} {"train_loss": -6.418323516845703, "global_step": 95663, "epoch": 2277} {"train_loss": -6.40003776550293, "global_step": 95664, "epoch": 2277} {"train_loss": -6.300332069396973, "global_step": 95665, "epoch": 2277} {"train_loss": -6.322597026824951, "global_step": 95666, "epoch": 2277} {"train_loss": -6.180510520935059, "global_step": 95667, "epoch": 2277} {"train_loss": -6.343812942504883, "global_step": 95668, "epoch": 2277} {"train_loss": -6.403367042541504, "global_step": 95669, "epoch": 2277} {"train_loss": -6.311875343322754, "global_step": 95670, "epoch": 2277} {"train_loss": -6.439474105834961, "global_step": 95671, "epoch": 2277} {"train_loss": -6.234416961669922, "global_step": 95672, "epoch": 2277} {"train_loss": -6.2793779373168945, "global_step": 95673, "epoch": 2277} {"train_loss": -6.37554931640625, "global_step": 95674, "epoch": 2277} {"train_loss": -6.320672988891602, "global_step": 95675, "epoch": 2277, "val_loss": 75612.7109375} {"train_loss": -6.362148284912109, "global_step": 95676, "epoch": 2278} {"train_loss": -6.248592376708984, "global_step": 95677, "epoch": 2278} {"train_loss": -6.285394191741943, "global_step": 95678, "epoch": 2278} {"train_loss": -6.3693671226501465, "global_step": 95679, "epoch": 2278} {"train_loss": -6.255921840667725, "global_step": 95680, "epoch": 2278} {"train_loss": -6.33365535736084, "global_step": 95681, "epoch": 2278} {"train_loss": -6.322955131530762, "global_step": 95682, "epoch": 2278} {"train_loss": -6.1976752281188965, "global_step": 95683, "epoch": 2278} {"train_loss": -6.247280597686768, "global_step": 95684, "epoch": 2278} {"train_loss": -6.243541717529297, "global_step": 95685, "epoch": 2278} {"train_loss": -6.40403413772583, "global_step": 95686, "epoch": 2278} {"train_loss": -6.327925682067871, "global_step": 95687, "epoch": 2278} {"train_loss": -6.420402526855469, "global_step": 95688, "epoch": 2278} {"train_loss": -6.283714294433594, "global_step": 95689, "epoch": 2278} {"train_loss": -6.328958988189697, "global_step": 95690, "epoch": 2278} {"train_loss": -6.1655378341674805, "global_step": 95691, "epoch": 2278} {"train_loss": -6.227649211883545, "global_step": 95692, "epoch": 2278} {"train_loss": -6.391358852386475, "global_step": 95693, "epoch": 2278} {"train_loss": -6.196263313293457, "global_step": 95694, "epoch": 2278} {"train_loss": -6.204196929931641, "global_step": 95695, "epoch": 2278} {"train_loss": -6.254403114318848, "global_step": 95696, "epoch": 2278} {"train_loss": -6.33409309387207, "global_step": 95697, "epoch": 2278} {"train_loss": -6.193828582763672, "global_step": 95698, "epoch": 2278} {"train_loss": -6.303466796875, "global_step": 95699, "epoch": 2278} {"train_loss": -6.257020950317383, "global_step": 95700, "epoch": 2278} {"train_loss": -6.217437267303467, "global_step": 95701, "epoch": 2278} {"train_loss": -6.174049377441406, "global_step": 95702, "epoch": 2278} {"train_loss": -6.233648300170898, "global_step": 95703, "epoch": 2278} {"train_loss": -6.227080345153809, "global_step": 95704, "epoch": 2278} {"train_loss": -6.228071689605713, "global_step": 95705, "epoch": 2278} {"train_loss": -6.260978698730469, "global_step": 95706, "epoch": 2278} {"train_loss": -6.149726867675781, "global_step": 95707, "epoch": 2278} {"train_loss": -6.147554397583008, "global_step": 95708, "epoch": 2278} {"train_loss": -6.219472885131836, "global_step": 95709, "epoch": 2278} {"train_loss": -6.386473655700684, "global_step": 95710, "epoch": 2278} {"train_loss": -6.320220947265625, "global_step": 95711, "epoch": 2278} {"train_loss": -6.212685585021973, "global_step": 95712, "epoch": 2278} {"train_loss": -6.232370376586914, "global_step": 95713, "epoch": 2278} {"train_loss": -6.2164506912231445, "global_step": 95714, "epoch": 2278} {"train_loss": -6.419997215270996, "global_step": 95715, "epoch": 2278} {"train_loss": -6.226495265960693, "global_step": 95716, "epoch": 2278} {"train_loss": -6.267692872456142, "global_step": 95717, "epoch": 2278, "val_loss": 75470.2890625} {"train_loss": -6.207816123962402, "global_step": 95718, "epoch": 2279} {"train_loss": -6.304300785064697, "global_step": 95719, "epoch": 2279} {"train_loss": -6.308063507080078, "global_step": 95720, "epoch": 2279} {"train_loss": -6.254335403442383, "global_step": 95721, "epoch": 2279} {"train_loss": -6.272916793823242, "global_step": 95722, "epoch": 2279} {"train_loss": -6.2681732177734375, "global_step": 95723, "epoch": 2279} {"train_loss": -6.39483642578125, "global_step": 95724, "epoch": 2279} {"train_loss": -6.400579929351807, "global_step": 95725, "epoch": 2279} {"train_loss": -6.274536609649658, "global_step": 95726, "epoch": 2279} {"train_loss": -6.252891540527344, "global_step": 95727, "epoch": 2279} {"train_loss": -6.262113571166992, "global_step": 95728, "epoch": 2279} {"train_loss": -6.276609897613525, "global_step": 95729, "epoch": 2279} {"train_loss": -6.340662956237793, "global_step": 95730, "epoch": 2279} {"train_loss": -6.185634136199951, "global_step": 95731, "epoch": 2279} {"train_loss": -6.292867660522461, "global_step": 95732, "epoch": 2279} {"train_loss": -6.290006637573242, "global_step": 95733, "epoch": 2279} {"train_loss": -6.325121879577637, "global_step": 95734, "epoch": 2279} {"train_loss": -6.331552505493164, "global_step": 95735, "epoch": 2279} {"train_loss": -6.323202133178711, "global_step": 95736, "epoch": 2279} {"train_loss": -6.3486647605896, "global_step": 95737, "epoch": 2279} {"train_loss": -6.332747459411621, "global_step": 95738, "epoch": 2279} {"train_loss": -6.270421028137207, "global_step": 95739, "epoch": 2279} {"train_loss": -6.317735195159912, "global_step": 95740, "epoch": 2279} {"train_loss": -6.383534908294678, "global_step": 95741, "epoch": 2279} {"train_loss": -6.277280330657959, "global_step": 95742, "epoch": 2279} {"train_loss": -6.301345348358154, "global_step": 95743, "epoch": 2279} {"train_loss": -6.350116729736328, "global_step": 95744, "epoch": 2279} {"train_loss": -6.275137424468994, "global_step": 95745, "epoch": 2279} {"train_loss": -6.394098281860352, "global_step": 95746, "epoch": 2279} {"train_loss": -6.263456344604492, "global_step": 95747, "epoch": 2279} {"train_loss": -6.367947101593018, "global_step": 95748, "epoch": 2279} {"train_loss": -6.272608757019043, "global_step": 95749, "epoch": 2279} {"train_loss": -6.344775199890137, "global_step": 95750, "epoch": 2279} {"train_loss": -6.296236038208008, "global_step": 95751, "epoch": 2279} {"train_loss": -6.315476894378662, "global_step": 95752, "epoch": 2279} {"train_loss": -6.308937072753906, "global_step": 95753, "epoch": 2279} {"train_loss": -6.327816963195801, "global_step": 95754, "epoch": 2279} {"train_loss": -6.291162490844727, "global_step": 95755, "epoch": 2279} {"train_loss": -6.315038681030273, "global_step": 95756, "epoch": 2279} {"train_loss": -6.22987174987793, "global_step": 95757, "epoch": 2279} {"train_loss": -6.287252426147461, "global_step": 95758, "epoch": 2279} {"train_loss": -6.304422401246571, "global_step": 95759, "epoch": 2279, "val_loss": 75687.0234375} {"train_loss": -6.275581359863281, "global_step": 95760, "epoch": 2280} {"train_loss": -6.309002876281738, "global_step": 95761, "epoch": 2280} {"train_loss": -6.391530513763428, "global_step": 95762, "epoch": 2280} {"train_loss": -6.27485990524292, "global_step": 95763, "epoch": 2280} {"train_loss": -6.313647270202637, "global_step": 95764, "epoch": 2280} {"train_loss": -6.278770923614502, "global_step": 95765, "epoch": 2280} {"train_loss": -6.322162628173828, "global_step": 95766, "epoch": 2280} {"train_loss": -6.347939491271973, "global_step": 95767, "epoch": 2280} {"train_loss": -6.284432888031006, "global_step": 95768, "epoch": 2280} {"train_loss": -6.276353359222412, "global_step": 95769, "epoch": 2280} {"train_loss": -6.236145973205566, "global_step": 95770, "epoch": 2280} {"train_loss": -6.218707084655762, "global_step": 95771, "epoch": 2280} {"train_loss": -6.31861686706543, "global_step": 95772, "epoch": 2280} {"train_loss": -6.38333797454834, "global_step": 95773, "epoch": 2280} {"train_loss": -6.329068183898926, "global_step": 95774, "epoch": 2280} {"train_loss": -6.386023044586182, "global_step": 95775, "epoch": 2280} {"train_loss": -6.304292678833008, "global_step": 95776, "epoch": 2280} {"train_loss": -6.223188877105713, "global_step": 95777, "epoch": 2280} {"train_loss": -6.1903157234191895, "global_step": 95778, "epoch": 2280} {"train_loss": -6.215936660766602, "global_step": 95779, "epoch": 2280} {"train_loss": -6.215542793273926, "global_step": 95780, "epoch": 2280} {"train_loss": -6.261505603790283, "global_step": 95781, "epoch": 2280} {"train_loss": -6.333833694458008, "global_step": 95782, "epoch": 2280} {"train_loss": -6.330465316772461, "global_step": 95783, "epoch": 2280} {"train_loss": -6.325445175170898, "global_step": 95784, "epoch": 2280} {"train_loss": -6.286006450653076, "global_step": 95785, "epoch": 2280} {"train_loss": -6.293301582336426, "global_step": 95786, "epoch": 2280} {"train_loss": -6.338343620300293, "global_step": 95787, "epoch": 2280} {"train_loss": -6.42002010345459, "global_step": 95788, "epoch": 2280} {"train_loss": -6.321084499359131, "global_step": 95789, "epoch": 2280} {"train_loss": -6.355246543884277, "global_step": 95790, "epoch": 2280} {"train_loss": -6.165375709533691, "global_step": 95791, "epoch": 2280} {"train_loss": -6.34587287902832, "global_step": 95792, "epoch": 2280} {"train_loss": -6.340445518493652, "global_step": 95793, "epoch": 2280} {"train_loss": -6.322680473327637, "global_step": 95794, "epoch": 2280} {"train_loss": -6.356400489807129, "global_step": 95795, "epoch": 2280} {"train_loss": -6.305837154388428, "global_step": 95796, "epoch": 2280} {"train_loss": -6.288437366485596, "global_step": 95797, "epoch": 2280} {"train_loss": -6.260053634643555, "global_step": 95798, "epoch": 2280} {"train_loss": -6.330828666687012, "global_step": 95799, "epoch": 2280} {"train_loss": -6.205452919006348, "global_step": 95800, "epoch": 2280} {"train_loss": -6.298642851057506, "global_step": 95801, "epoch": 2280, "val_loss": 75732.46875} {"train_loss": -6.269618988037109, "global_step": 95802, "epoch": 2281} {"train_loss": -6.165613174438477, "global_step": 95803, "epoch": 2281} {"train_loss": -6.17222785949707, "global_step": 95804, "epoch": 2281} {"train_loss": -6.318466663360596, "global_step": 95805, "epoch": 2281} {"train_loss": -6.290475845336914, "global_step": 95806, "epoch": 2281} {"train_loss": -6.325044631958008, "global_step": 95807, "epoch": 2281} {"train_loss": -6.259713649749756, "global_step": 95808, "epoch": 2281} {"train_loss": -6.271684169769287, "global_step": 95809, "epoch": 2281} {"train_loss": -6.212643623352051, "global_step": 95810, "epoch": 2281} {"train_loss": -6.309118270874023, "global_step": 95811, "epoch": 2281} {"train_loss": -6.2769880294799805, "global_step": 95812, "epoch": 2281} {"train_loss": -6.360545635223389, "global_step": 95813, "epoch": 2281} {"train_loss": -6.350000381469727, "global_step": 95814, "epoch": 2281} {"train_loss": -6.295792579650879, "global_step": 95815, "epoch": 2281} {"train_loss": -6.34934139251709, "global_step": 95816, "epoch": 2281} {"train_loss": -6.207586765289307, "global_step": 95817, "epoch": 2281} {"train_loss": -6.3306403160095215, "global_step": 95818, "epoch": 2281} {"train_loss": -6.3045654296875, "global_step": 95819, "epoch": 2281} {"train_loss": -6.2430925369262695, "global_step": 95820, "epoch": 2281} {"train_loss": -6.22625732421875, "global_step": 95821, "epoch": 2281} {"train_loss": -6.268253326416016, "global_step": 95822, "epoch": 2281} {"train_loss": -6.381613731384277, "global_step": 95823, "epoch": 2281} {"train_loss": -6.348934173583984, "global_step": 95824, "epoch": 2281} {"train_loss": -6.420585632324219, "global_step": 95825, "epoch": 2281} {"train_loss": -6.3385138511657715, "global_step": 95826, "epoch": 2281} {"train_loss": -6.453853130340576, "global_step": 95827, "epoch": 2281} {"train_loss": -6.244264125823975, "global_step": 95828, "epoch": 2281} {"train_loss": -6.28957462310791, "global_step": 95829, "epoch": 2281} {"train_loss": -6.47035026550293, "global_step": 95830, "epoch": 2281} {"train_loss": -6.322935104370117, "global_step": 95831, "epoch": 2281} {"train_loss": -6.203151702880859, "global_step": 95832, "epoch": 2281} {"train_loss": -6.407196998596191, "global_step": 95833, "epoch": 2281} {"train_loss": -6.4365739822387695, "global_step": 95834, "epoch": 2281} {"train_loss": -6.305995464324951, "global_step": 95835, "epoch": 2281} {"train_loss": -6.398167610168457, "global_step": 95836, "epoch": 2281} {"train_loss": -6.331445693969727, "global_step": 95837, "epoch": 2281} {"train_loss": -6.33077335357666, "global_step": 95838, "epoch": 2281} {"train_loss": -6.450617790222168, "global_step": 95839, "epoch": 2281} {"train_loss": -6.444234848022461, "global_step": 95840, "epoch": 2281} {"train_loss": -6.283679962158203, "global_step": 95841, "epoch": 2281} {"train_loss": -6.392972946166992, "global_step": 95842, "epoch": 2281} {"train_loss": -6.315530288787115, "global_step": 95843, "epoch": 2281, "val_loss": 75435.734375} {"train_loss": -6.375338554382324, "global_step": 95844, "epoch": 2282} {"train_loss": -6.40587043762207, "global_step": 95845, "epoch": 2282} {"train_loss": -6.247140884399414, "global_step": 95846, "epoch": 2282} {"train_loss": -6.448241233825684, "global_step": 95847, "epoch": 2282} {"train_loss": -6.368291854858398, "global_step": 95848, "epoch": 2282} {"train_loss": -6.39583158493042, "global_step": 95849, "epoch": 2282} {"train_loss": -6.3536376953125, "global_step": 95850, "epoch": 2282} {"train_loss": -6.375086784362793, "global_step": 95851, "epoch": 2282} {"train_loss": -6.344315528869629, "global_step": 95852, "epoch": 2282} {"train_loss": -6.443048477172852, "global_step": 95853, "epoch": 2282} {"train_loss": -6.340583801269531, "global_step": 95854, "epoch": 2282} {"train_loss": -6.359005451202393, "global_step": 95855, "epoch": 2282} {"train_loss": -6.391239643096924, "global_step": 95856, "epoch": 2282} {"train_loss": -6.434378147125244, "global_step": 95857, "epoch": 2282} {"train_loss": -6.333849906921387, "global_step": 95858, "epoch": 2282} {"train_loss": -6.433494567871094, "global_step": 95859, "epoch": 2282} {"train_loss": -6.377590179443359, "global_step": 95860, "epoch": 2282} {"train_loss": -6.317819595336914, "global_step": 95861, "epoch": 2282} {"train_loss": -6.38386869430542, "global_step": 95862, "epoch": 2282} {"train_loss": -6.3590850830078125, "global_step": 95863, "epoch": 2282} {"train_loss": -6.267274856567383, "global_step": 95864, "epoch": 2282} {"train_loss": -6.309882640838623, "global_step": 95865, "epoch": 2282} {"train_loss": -6.306183815002441, "global_step": 95866, "epoch": 2282} {"train_loss": -6.380634307861328, "global_step": 95867, "epoch": 2282} {"train_loss": -6.213076591491699, "global_step": 95868, "epoch": 2282} {"train_loss": -6.337873935699463, "global_step": 95869, "epoch": 2282} {"train_loss": -6.433123588562012, "global_step": 95870, "epoch": 2282} {"train_loss": -6.203830718994141, "global_step": 95871, "epoch": 2282} {"train_loss": -6.3262434005737305, "global_step": 95872, "epoch": 2282} {"train_loss": -6.277172088623047, "global_step": 95873, "epoch": 2282} {"train_loss": -6.267522811889648, "global_step": 95874, "epoch": 2282} {"train_loss": -6.2124104499816895, "global_step": 95875, "epoch": 2282} {"train_loss": -6.261600494384766, "global_step": 95876, "epoch": 2282} {"train_loss": -6.139618873596191, "global_step": 95877, "epoch": 2282} {"train_loss": -6.378233432769775, "global_step": 95878, "epoch": 2282} {"train_loss": -6.383745193481445, "global_step": 95879, "epoch": 2282} {"train_loss": -6.222341060638428, "global_step": 95880, "epoch": 2282} {"train_loss": -6.194591522216797, "global_step": 95881, "epoch": 2282} {"train_loss": -6.183306694030762, "global_step": 95882, "epoch": 2282} {"train_loss": -6.264603137969971, "global_step": 95883, "epoch": 2282} {"train_loss": -6.387761116027832, "global_step": 95884, "epoch": 2282} {"train_loss": -6.3256808916727705, "global_step": 95885, "epoch": 2282, "val_loss": 75578.2578125} {"train_loss": -6.332391262054443, "global_step": 95886, "epoch": 2283} {"train_loss": -6.294953346252441, "global_step": 95887, "epoch": 2283} {"train_loss": -6.234663963317871, "global_step": 95888, "epoch": 2283} {"train_loss": -6.436749458312988, "global_step": 95889, "epoch": 2283} {"train_loss": -6.332401275634766, "global_step": 95890, "epoch": 2283} {"train_loss": -6.365874290466309, "global_step": 95891, "epoch": 2283} {"train_loss": -6.252932548522949, "global_step": 95892, "epoch": 2283} {"train_loss": -6.463540077209473, "global_step": 95893, "epoch": 2283} {"train_loss": -6.389438152313232, "global_step": 95894, "epoch": 2283} {"train_loss": -6.321575164794922, "global_step": 95895, "epoch": 2283} {"train_loss": -6.338477611541748, "global_step": 95896, "epoch": 2283} {"train_loss": -6.2721734046936035, "global_step": 95897, "epoch": 2283} {"train_loss": -6.362150192260742, "global_step": 95898, "epoch": 2283} {"train_loss": -6.299879550933838, "global_step": 95899, "epoch": 2283} {"train_loss": -6.23760986328125, "global_step": 95900, "epoch": 2283} {"train_loss": -6.3756818771362305, "global_step": 95901, "epoch": 2283} {"train_loss": -6.343244552612305, "global_step": 95902, "epoch": 2283} {"train_loss": -6.446242332458496, "global_step": 95903, "epoch": 2283} {"train_loss": -6.374479293823242, "global_step": 95904, "epoch": 2283} {"train_loss": -6.432913780212402, "global_step": 95905, "epoch": 2283} {"train_loss": -6.146429061889648, "global_step": 95906, "epoch": 2283} {"train_loss": -6.406519412994385, "global_step": 95907, "epoch": 2283} {"train_loss": -6.405486583709717, "global_step": 95908, "epoch": 2283} {"train_loss": -6.331399917602539, "global_step": 95909, "epoch": 2283} {"train_loss": -6.373223781585693, "global_step": 95910, "epoch": 2283} {"train_loss": -6.237445831298828, "global_step": 95911, "epoch": 2283} {"train_loss": -6.2925920486450195, "global_step": 95912, "epoch": 2283} {"train_loss": -6.295844078063965, "global_step": 95913, "epoch": 2283} {"train_loss": -6.364318370819092, "global_step": 95914, "epoch": 2283} {"train_loss": -6.3630852699279785, "global_step": 95915, "epoch": 2283} {"train_loss": -6.341727256774902, "global_step": 95916, "epoch": 2283} {"train_loss": -6.2761077880859375, "global_step": 95917, "epoch": 2283} {"train_loss": -6.342972278594971, "global_step": 95918, "epoch": 2283} {"train_loss": -6.263273239135742, "global_step": 95919, "epoch": 2283} {"train_loss": -6.395453453063965, "global_step": 95920, "epoch": 2283} {"train_loss": -6.355688095092773, "global_step": 95921, "epoch": 2283} {"train_loss": -6.394046306610107, "global_step": 95922, "epoch": 2283} {"train_loss": -6.404664993286133, "global_step": 95923, "epoch": 2283} {"train_loss": -6.337327003479004, "global_step": 95924, "epoch": 2283} {"train_loss": -6.309351921081543, "global_step": 95925, "epoch": 2283} {"train_loss": -6.3818039894104, "global_step": 95926, "epoch": 2283} {"train_loss": -6.336352336974371, "global_step": 95927, "epoch": 2283, "val_loss": 75765.15625} {"train_loss": -6.213964939117432, "global_step": 95928, "epoch": 2284} {"train_loss": -6.274139404296875, "global_step": 95929, "epoch": 2284} {"train_loss": -6.286746978759766, "global_step": 95930, "epoch": 2284} {"train_loss": -6.123112678527832, "global_step": 95931, "epoch": 2284} {"train_loss": -6.392287731170654, "global_step": 95932, "epoch": 2284} {"train_loss": -6.189701557159424, "global_step": 95933, "epoch": 2284} {"train_loss": -6.243378639221191, "global_step": 95934, "epoch": 2284} {"train_loss": -6.250888347625732, "global_step": 95935, "epoch": 2284} {"train_loss": -6.185313701629639, "global_step": 95936, "epoch": 2284} {"train_loss": -6.365481376647949, "global_step": 95937, "epoch": 2284} {"train_loss": -6.200150966644287, "global_step": 95938, "epoch": 2284} {"train_loss": -6.269301414489746, "global_step": 95939, "epoch": 2284} {"train_loss": -6.449013710021973, "global_step": 95940, "epoch": 2284} {"train_loss": -6.139039516448975, "global_step": 95941, "epoch": 2284} {"train_loss": -6.306246280670166, "global_step": 95942, "epoch": 2284} {"train_loss": -6.146503448486328, "global_step": 95943, "epoch": 2284} {"train_loss": -6.307271957397461, "global_step": 95944, "epoch": 2284} {"train_loss": -6.144493579864502, "global_step": 95945, "epoch": 2284} {"train_loss": -6.409565448760986, "global_step": 95946, "epoch": 2284} {"train_loss": -6.154510974884033, "global_step": 95947, "epoch": 2284} {"train_loss": -6.267734527587891, "global_step": 95948, "epoch": 2284} {"train_loss": -6.253363132476807, "global_step": 95949, "epoch": 2284} {"train_loss": -6.200502395629883, "global_step": 95950, "epoch": 2284} {"train_loss": -6.521491527557373, "global_step": 95951, "epoch": 2284} {"train_loss": -6.2401885986328125, "global_step": 95952, "epoch": 2284} {"train_loss": -6.358176231384277, "global_step": 95953, "epoch": 2284} {"train_loss": -6.3522138595581055, "global_step": 95954, "epoch": 2284} {"train_loss": -6.3878092765808105, "global_step": 95955, "epoch": 2284} {"train_loss": -6.269157886505127, "global_step": 95956, "epoch": 2284} {"train_loss": -6.414703845977783, "global_step": 95957, "epoch": 2284} {"train_loss": -6.393092155456543, "global_step": 95958, "epoch": 2284} {"train_loss": -6.298052787780762, "global_step": 95959, "epoch": 2284} {"train_loss": -6.376491546630859, "global_step": 95960, "epoch": 2284} {"train_loss": -6.3809685707092285, "global_step": 95961, "epoch": 2284} {"train_loss": -6.423186302185059, "global_step": 95962, "epoch": 2284} {"train_loss": -6.275252819061279, "global_step": 95963, "epoch": 2284} {"train_loss": -6.425119876861572, "global_step": 95964, "epoch": 2284} {"train_loss": -6.309123992919922, "global_step": 95965, "epoch": 2284} {"train_loss": -6.256069183349609, "global_step": 95966, "epoch": 2284} {"train_loss": -6.458553314208984, "global_step": 95967, "epoch": 2284} {"train_loss": -6.33464241027832, "global_step": 95968, "epoch": 2284} {"train_loss": -6.3013107890174505, "global_step": 95969, "epoch": 2284, "val_loss": 75849.8359375} {"train_loss": -6.342673301696777, "global_step": 95970, "epoch": 2285} {"train_loss": -6.153687477111816, "global_step": 95971, "epoch": 2285} {"train_loss": -6.401012420654297, "global_step": 95972, "epoch": 2285} {"train_loss": -6.242338180541992, "global_step": 95973, "epoch": 2285} {"train_loss": -6.220292091369629, "global_step": 95974, "epoch": 2285} {"train_loss": -6.349555015563965, "global_step": 95975, "epoch": 2285} {"train_loss": -6.332047462463379, "global_step": 95976, "epoch": 2285} {"train_loss": -6.298978805541992, "global_step": 95977, "epoch": 2285} {"train_loss": -6.327375411987305, "global_step": 95978, "epoch": 2285} {"train_loss": -6.260370254516602, "global_step": 95979, "epoch": 2285} {"train_loss": -6.291046142578125, "global_step": 95980, "epoch": 2285} {"train_loss": -6.275589466094971, "global_step": 95981, "epoch": 2285} {"train_loss": -6.295294761657715, "global_step": 95982, "epoch": 2285} {"train_loss": -6.291102886199951, "global_step": 95983, "epoch": 2285} {"train_loss": -6.276203155517578, "global_step": 95984, "epoch": 2285} {"train_loss": -6.287714004516602, "global_step": 95985, "epoch": 2285} {"train_loss": -6.293473243713379, "global_step": 95986, "epoch": 2285} {"train_loss": -6.325486660003662, "global_step": 95987, "epoch": 2285} {"train_loss": -6.310491561889648, "global_step": 95988, "epoch": 2285} {"train_loss": -6.3589935302734375, "global_step": 95989, "epoch": 2285} {"train_loss": -6.214872360229492, "global_step": 95990, "epoch": 2285} {"train_loss": -6.2814836502075195, "global_step": 95991, "epoch": 2285} {"train_loss": -6.335360527038574, "global_step": 95992, "epoch": 2285} {"train_loss": -6.249455451965332, "global_step": 95993, "epoch": 2285} {"train_loss": -6.230452537536621, "global_step": 95994, "epoch": 2285} {"train_loss": -6.422235488891602, "global_step": 95995, "epoch": 2285} {"train_loss": -6.271814346313477, "global_step": 95996, "epoch": 2285} {"train_loss": -6.2319464683532715, "global_step": 95997, "epoch": 2285} {"train_loss": -6.331305503845215, "global_step": 95998, "epoch": 2285} {"train_loss": -6.423288822174072, "global_step": 95999, "epoch": 2285} {"train_loss": -6.2435526847839355, "global_step": 96000, "epoch": 2285} {"train_loss": -6.250368595123291, "global_step": 96001, "epoch": 2285} {"train_loss": -6.313077449798584, "global_step": 96002, "epoch": 2285} {"train_loss": -6.296008110046387, "global_step": 96003, "epoch": 2285} {"train_loss": -6.3356122970581055, "global_step": 96004, "epoch": 2285} {"train_loss": -6.194973945617676, "global_step": 96005, "epoch": 2285} {"train_loss": -6.200674533843994, "global_step": 96006, "epoch": 2285} {"train_loss": -6.223471641540527, "global_step": 96007, "epoch": 2285} {"train_loss": -6.273263931274414, "global_step": 96008, "epoch": 2285} {"train_loss": -6.227703094482422, "global_step": 96009, "epoch": 2285} {"train_loss": -6.411883354187012, "global_step": 96010, "epoch": 2285} {"train_loss": -6.287822189785185, "global_step": 96011, "epoch": 2285, "val_loss": 75492.3046875} {"train_loss": -6.252490043640137, "global_step": 96012, "epoch": 2286} {"train_loss": -6.360490798950195, "global_step": 96013, "epoch": 2286} {"train_loss": -6.259731769561768, "global_step": 96014, "epoch": 2286} {"train_loss": -6.405726909637451, "global_step": 96015, "epoch": 2286} {"train_loss": -6.332806587219238, "global_step": 96016, "epoch": 2286} {"train_loss": -6.270315170288086, "global_step": 96017, "epoch": 2286} {"train_loss": -6.3210768699646, "global_step": 96018, "epoch": 2286} {"train_loss": -6.258681297302246, "global_step": 96019, "epoch": 2286} {"train_loss": -6.411835193634033, "global_step": 96020, "epoch": 2286} {"train_loss": -6.362692356109619, "global_step": 96021, "epoch": 2286} {"train_loss": -6.252042293548584, "global_step": 96022, "epoch": 2286} {"train_loss": -6.3304948806762695, "global_step": 96023, "epoch": 2286} {"train_loss": -6.289755344390869, "global_step": 96024, "epoch": 2286} {"train_loss": -6.200986862182617, "global_step": 96025, "epoch": 2286} {"train_loss": -6.336341857910156, "global_step": 96026, "epoch": 2286} {"train_loss": -6.356612205505371, "global_step": 96027, "epoch": 2286} {"train_loss": -6.331231117248535, "global_step": 96028, "epoch": 2286} {"train_loss": -6.318862438201904, "global_step": 96029, "epoch": 2286} {"train_loss": -6.276332378387451, "global_step": 96030, "epoch": 2286} {"train_loss": -6.353209495544434, "global_step": 96031, "epoch": 2286} {"train_loss": -6.495399475097656, "global_step": 96032, "epoch": 2286} {"train_loss": -6.307580947875977, "global_step": 96033, "epoch": 2286} {"train_loss": -6.317025184631348, "global_step": 96034, "epoch": 2286} {"train_loss": -6.402109146118164, "global_step": 96035, "epoch": 2286} {"train_loss": -6.279445648193359, "global_step": 96036, "epoch": 2286} {"train_loss": -6.301201820373535, "global_step": 96037, "epoch": 2286} {"train_loss": -6.3255486488342285, "global_step": 96038, "epoch": 2286} {"train_loss": -6.299065589904785, "global_step": 96039, "epoch": 2286} {"train_loss": -6.2893829345703125, "global_step": 96040, "epoch": 2286} {"train_loss": -6.374495506286621, "global_step": 96041, "epoch": 2286} {"train_loss": -6.405844688415527, "global_step": 96042, "epoch": 2286} {"train_loss": -6.347126483917236, "global_step": 96043, "epoch": 2286} {"train_loss": -6.296487808227539, "global_step": 96044, "epoch": 2286} {"train_loss": -6.185528755187988, "global_step": 96045, "epoch": 2286} {"train_loss": -6.290822505950928, "global_step": 96046, "epoch": 2286} {"train_loss": -6.285847187042236, "global_step": 96047, "epoch": 2286} {"train_loss": -6.249307632446289, "global_step": 96048, "epoch": 2286} {"train_loss": -6.187503814697266, "global_step": 96049, "epoch": 2286} {"train_loss": -6.4184160232543945, "global_step": 96050, "epoch": 2286} {"train_loss": -6.262305736541748, "global_step": 96051, "epoch": 2286} {"train_loss": -6.215395927429199, "global_step": 96052, "epoch": 2286} {"train_loss": -6.313291402090163, "global_step": 96053, "epoch": 2286, "val_loss": 75376.9140625} {"train_loss": -6.361963272094727, "global_step": 96054, "epoch": 2287} {"train_loss": -6.333709716796875, "global_step": 96055, "epoch": 2287} {"train_loss": -6.260093688964844, "global_step": 96056, "epoch": 2287} {"train_loss": -6.240841865539551, "global_step": 96057, "epoch": 2287} {"train_loss": -6.1511993408203125, "global_step": 96058, "epoch": 2287} {"train_loss": -6.267398357391357, "global_step": 96059, "epoch": 2287} {"train_loss": -6.219336032867432, "global_step": 96060, "epoch": 2287} {"train_loss": -6.258169174194336, "global_step": 96061, "epoch": 2287} {"train_loss": -6.364541530609131, "global_step": 96062, "epoch": 2287} {"train_loss": -6.24669075012207, "global_step": 96063, "epoch": 2287} {"train_loss": -6.252594947814941, "global_step": 96064, "epoch": 2287} {"train_loss": -6.2351837158203125, "global_step": 96065, "epoch": 2287} {"train_loss": -6.19297981262207, "global_step": 96066, "epoch": 2287} {"train_loss": -6.287239074707031, "global_step": 96067, "epoch": 2287} {"train_loss": -6.251361846923828, "global_step": 96068, "epoch": 2287} {"train_loss": -6.236905097961426, "global_step": 96069, "epoch": 2287} {"train_loss": -6.272734642028809, "global_step": 96070, "epoch": 2287} {"train_loss": -5.960163116455078, "global_step": 96071, "epoch": 2287} {"train_loss": -6.223553657531738, "global_step": 96072, "epoch": 2287} {"train_loss": -6.173727035522461, "global_step": 96073, "epoch": 2287} {"train_loss": -6.214332580566406, "global_step": 96074, "epoch": 2287} {"train_loss": -6.255466938018799, "global_step": 96075, "epoch": 2287} {"train_loss": -6.29469633102417, "global_step": 96076, "epoch": 2287} {"train_loss": -6.262928485870361, "global_step": 96077, "epoch": 2287} {"train_loss": -6.238608360290527, "global_step": 96078, "epoch": 2287} {"train_loss": -6.343387603759766, "global_step": 96079, "epoch": 2287} {"train_loss": -6.440789222717285, "global_step": 96080, "epoch": 2287} {"train_loss": -6.249841690063477, "global_step": 96081, "epoch": 2287} {"train_loss": -6.345267295837402, "global_step": 96082, "epoch": 2287} {"train_loss": -6.289451599121094, "global_step": 96083, "epoch": 2287} {"train_loss": -6.348125457763672, "global_step": 96084, "epoch": 2287} {"train_loss": -6.383980751037598, "global_step": 96085, "epoch": 2287} {"train_loss": -6.36112117767334, "global_step": 96086, "epoch": 2287} {"train_loss": -6.393947124481201, "global_step": 96087, "epoch": 2287} {"train_loss": -6.286791801452637, "global_step": 96088, "epoch": 2287} {"train_loss": -6.342069625854492, "global_step": 96089, "epoch": 2287} {"train_loss": -6.353250980377197, "global_step": 96090, "epoch": 2287} {"train_loss": -6.403169631958008, "global_step": 96091, "epoch": 2287} {"train_loss": -6.314211845397949, "global_step": 96092, "epoch": 2287} {"train_loss": -6.351753234863281, "global_step": 96093, "epoch": 2287} {"train_loss": -6.482036590576172, "global_step": 96094, "epoch": 2287} {"train_loss": -6.287384839284988, "global_step": 96095, "epoch": 2287, "val_loss": 75544.6875} {"train_loss": -6.357314586639404, "global_step": 96096, "epoch": 2288} {"train_loss": -6.368651390075684, "global_step": 96097, "epoch": 2288} {"train_loss": -6.401287078857422, "global_step": 96098, "epoch": 2288} {"train_loss": -6.395610809326172, "global_step": 96099, "epoch": 2288} {"train_loss": -6.359260082244873, "global_step": 96100, "epoch": 2288} {"train_loss": -6.435325622558594, "global_step": 96101, "epoch": 2288} {"train_loss": -6.338942527770996, "global_step": 96102, "epoch": 2288} {"train_loss": -6.333499908447266, "global_step": 96103, "epoch": 2288} {"train_loss": -6.382895469665527, "global_step": 96104, "epoch": 2288} {"train_loss": -6.369856834411621, "global_step": 96105, "epoch": 2288} {"train_loss": -6.316185474395752, "global_step": 96106, "epoch": 2288} {"train_loss": -6.353001594543457, "global_step": 96107, "epoch": 2288} {"train_loss": -6.3752760887146, "global_step": 96108, "epoch": 2288} {"train_loss": -6.311654567718506, "global_step": 96109, "epoch": 2288} {"train_loss": -6.389276504516602, "global_step": 96110, "epoch": 2288} {"train_loss": -6.286980628967285, "global_step": 96111, "epoch": 2288} {"train_loss": -6.395756721496582, "global_step": 96112, "epoch": 2288} {"train_loss": -6.400705337524414, "global_step": 96113, "epoch": 2288} {"train_loss": -6.312005043029785, "global_step": 96114, "epoch": 2288} {"train_loss": -6.2653608322143555, "global_step": 96115, "epoch": 2288} {"train_loss": -6.22095251083374, "global_step": 96116, "epoch": 2288} {"train_loss": -6.289929389953613, "global_step": 96117, "epoch": 2288} {"train_loss": -6.236092567443848, "global_step": 96118, "epoch": 2288} {"train_loss": -6.320262908935547, "global_step": 96119, "epoch": 2288} {"train_loss": -6.277240753173828, "global_step": 96120, "epoch": 2288} {"train_loss": -6.395511627197266, "global_step": 96121, "epoch": 2288} {"train_loss": -6.263411045074463, "global_step": 96122, "epoch": 2288} {"train_loss": -6.272688388824463, "global_step": 96123, "epoch": 2288} {"train_loss": -6.319955825805664, "global_step": 96124, "epoch": 2288} {"train_loss": -6.29530668258667, "global_step": 96125, "epoch": 2288} {"train_loss": -6.3045148849487305, "global_step": 96126, "epoch": 2288} {"train_loss": -6.280911445617676, "global_step": 96127, "epoch": 2288} {"train_loss": -6.288267612457275, "global_step": 96128, "epoch": 2288} {"train_loss": -6.16960334777832, "global_step": 96129, "epoch": 2288} {"train_loss": -6.286816596984863, "global_step": 96130, "epoch": 2288} {"train_loss": -6.447563171386719, "global_step": 96131, "epoch": 2288} {"train_loss": -6.068025588989258, "global_step": 96132, "epoch": 2288} {"train_loss": -6.190967082977295, "global_step": 96133, "epoch": 2288} {"train_loss": -6.234440326690674, "global_step": 96134, "epoch": 2288} {"train_loss": -6.10943603515625, "global_step": 96135, "epoch": 2288} {"train_loss": -6.166642189025879, "global_step": 96136, "epoch": 2288} {"train_loss": -6.303626162665231, "global_step": 96137, "epoch": 2288, "val_loss": 75769.9609375} {"train_loss": -6.282866477966309, "global_step": 96138, "epoch": 2289} {"train_loss": -6.2393693923950195, "global_step": 96139, "epoch": 2289} {"train_loss": -6.109654426574707, "global_step": 96140, "epoch": 2289} {"train_loss": -6.290334701538086, "global_step": 96141, "epoch": 2289} {"train_loss": -6.291889190673828, "global_step": 96142, "epoch": 2289} {"train_loss": -6.212042808532715, "global_step": 96143, "epoch": 2289} {"train_loss": -6.241827964782715, "global_step": 96144, "epoch": 2289} {"train_loss": -6.367356300354004, "global_step": 96145, "epoch": 2289} {"train_loss": -6.33750057220459, "global_step": 96146, "epoch": 2289} {"train_loss": -6.236713886260986, "global_step": 96147, "epoch": 2289} {"train_loss": -6.254620552062988, "global_step": 96148, "epoch": 2289} {"train_loss": -6.347771644592285, "global_step": 96149, "epoch": 2289} {"train_loss": -6.145816802978516, "global_step": 96150, "epoch": 2289} {"train_loss": -6.391043186187744, "global_step": 96151, "epoch": 2289} {"train_loss": -6.396653652191162, "global_step": 96152, "epoch": 2289} {"train_loss": -6.338748931884766, "global_step": 96153, "epoch": 2289} {"train_loss": -6.39739990234375, "global_step": 96154, "epoch": 2289} {"train_loss": -6.30230188369751, "global_step": 96155, "epoch": 2289} {"train_loss": -6.33284854888916, "global_step": 96156, "epoch": 2289} {"train_loss": -6.307083606719971, "global_step": 96157, "epoch": 2289} {"train_loss": -6.459924697875977, "global_step": 96158, "epoch": 2289} {"train_loss": -6.202828407287598, "global_step": 96159, "epoch": 2289} {"train_loss": -6.289608001708984, "global_step": 96160, "epoch": 2289} {"train_loss": -6.269770622253418, "global_step": 96161, "epoch": 2289} {"train_loss": -6.190829277038574, "global_step": 96162, "epoch": 2289} {"train_loss": -6.293512344360352, "global_step": 96163, "epoch": 2289} {"train_loss": -6.3912353515625, "global_step": 96164, "epoch": 2289} {"train_loss": -6.22055721282959, "global_step": 96165, "epoch": 2289} {"train_loss": -6.29737663269043, "global_step": 96166, "epoch": 2289} {"train_loss": -6.459319114685059, "global_step": 96167, "epoch": 2289} {"train_loss": -6.323368549346924, "global_step": 96168, "epoch": 2289} {"train_loss": -6.308760643005371, "global_step": 96169, "epoch": 2289} {"train_loss": -6.334667205810547, "global_step": 96170, "epoch": 2289} {"train_loss": -6.339633941650391, "global_step": 96171, "epoch": 2289} {"train_loss": -6.391810894012451, "global_step": 96172, "epoch": 2289} {"train_loss": -6.249532699584961, "global_step": 96173, "epoch": 2289} {"train_loss": -6.274369239807129, "global_step": 96174, "epoch": 2289} {"train_loss": -6.408414363861084, "global_step": 96175, "epoch": 2289} {"train_loss": -6.385641574859619, "global_step": 96176, "epoch": 2289} {"train_loss": -6.292993068695068, "global_step": 96177, "epoch": 2289} {"train_loss": -6.243565559387207, "global_step": 96178, "epoch": 2289} {"train_loss": -6.3053102266220815, "global_step": 96179, "epoch": 2289, "val_loss": 75667.4375} {"train_loss": -6.320716381072998, "global_step": 96180, "epoch": 2290} {"train_loss": -6.352276802062988, "global_step": 96181, "epoch": 2290} {"train_loss": -6.305438995361328, "global_step": 96182, "epoch": 2290} {"train_loss": -6.276278495788574, "global_step": 96183, "epoch": 2290} {"train_loss": -6.345534324645996, "global_step": 96184, "epoch": 2290} {"train_loss": -6.315081596374512, "global_step": 96185, "epoch": 2290} {"train_loss": -6.4716596603393555, "global_step": 96186, "epoch": 2290} {"train_loss": -6.373538970947266, "global_step": 96187, "epoch": 2290} {"train_loss": -6.281948089599609, "global_step": 96188, "epoch": 2290} {"train_loss": -6.409322738647461, "global_step": 96189, "epoch": 2290} {"train_loss": -6.309125900268555, "global_step": 96190, "epoch": 2290} {"train_loss": -6.328805446624756, "global_step": 96191, "epoch": 2290} {"train_loss": -6.2407941818237305, "global_step": 96192, "epoch": 2290} {"train_loss": -6.391277313232422, "global_step": 96193, "epoch": 2290} {"train_loss": -6.3793134689331055, "global_step": 96194, "epoch": 2290} {"train_loss": -6.446023941040039, "global_step": 96195, "epoch": 2290} {"train_loss": -6.305580139160156, "global_step": 96196, "epoch": 2290} {"train_loss": -6.364869594573975, "global_step": 96197, "epoch": 2290} {"train_loss": -6.38926887512207, "global_step": 96198, "epoch": 2290} {"train_loss": -6.337014198303223, "global_step": 96199, "epoch": 2290} {"train_loss": -6.329851150512695, "global_step": 96200, "epoch": 2290} {"train_loss": -6.325555801391602, "global_step": 96201, "epoch": 2290} {"train_loss": -6.323241233825684, "global_step": 96202, "epoch": 2290} {"train_loss": -6.336671829223633, "global_step": 96203, "epoch": 2290} {"train_loss": -6.394183158874512, "global_step": 96204, "epoch": 2290} {"train_loss": -6.327666282653809, "global_step": 96205, "epoch": 2290} {"train_loss": -6.408270835876465, "global_step": 96206, "epoch": 2290} {"train_loss": -6.362335205078125, "global_step": 96207, "epoch": 2290} {"train_loss": -6.364132881164551, "global_step": 96208, "epoch": 2290} {"train_loss": -6.317938804626465, "global_step": 96209, "epoch": 2290} {"train_loss": -6.391811847686768, "global_step": 96210, "epoch": 2290} {"train_loss": -6.268196105957031, "global_step": 96211, "epoch": 2290} {"train_loss": -6.2977294921875, "global_step": 96212, "epoch": 2290} {"train_loss": -6.361300945281982, "global_step": 96213, "epoch": 2290} {"train_loss": -6.288480758666992, "global_step": 96214, "epoch": 2290} {"train_loss": -6.3998799324035645, "global_step": 96215, "epoch": 2290} {"train_loss": -6.325553894042969, "global_step": 96216, "epoch": 2290} {"train_loss": -6.20113468170166, "global_step": 96217, "epoch": 2290} {"train_loss": -6.361966609954834, "global_step": 96218, "epoch": 2290} {"train_loss": -6.41438102722168, "global_step": 96219, "epoch": 2290} {"train_loss": -6.26304292678833, "global_step": 96220, "epoch": 2290} {"train_loss": -6.3390217281523205, "global_step": 96221, "epoch": 2290, "val_loss": 75847.765625} {"train_loss": -6.236090660095215, "global_step": 96222, "epoch": 2291} {"train_loss": -6.263030052185059, "global_step": 96223, "epoch": 2291} {"train_loss": -6.24832010269165, "global_step": 96224, "epoch": 2291} {"train_loss": -6.206782341003418, "global_step": 96225, "epoch": 2291} {"train_loss": -6.278566360473633, "global_step": 96226, "epoch": 2291} {"train_loss": -6.236096382141113, "global_step": 96227, "epoch": 2291} {"train_loss": -6.266524314880371, "global_step": 96228, "epoch": 2291} {"train_loss": -6.283925533294678, "global_step": 96229, "epoch": 2291} {"train_loss": -6.310325622558594, "global_step": 96230, "epoch": 2291} {"train_loss": -5.997702121734619, "global_step": 96231, "epoch": 2291} {"train_loss": -6.243095397949219, "global_step": 96232, "epoch": 2291} {"train_loss": -6.014237403869629, "global_step": 96233, "epoch": 2291} {"train_loss": -6.129798889160156, "global_step": 96234, "epoch": 2291} {"train_loss": -6.136381149291992, "global_step": 96235, "epoch": 2291} {"train_loss": -6.036872386932373, "global_step": 96236, "epoch": 2291} {"train_loss": -6.2646379470825195, "global_step": 96237, "epoch": 2291} {"train_loss": -6.068086624145508, "global_step": 96238, "epoch": 2291} {"train_loss": -6.212110996246338, "global_step": 96239, "epoch": 2291} {"train_loss": -6.066937446594238, "global_step": 96240, "epoch": 2291} {"train_loss": -6.29710054397583, "global_step": 96241, "epoch": 2291} {"train_loss": -6.13649845123291, "global_step": 96242, "epoch": 2291} {"train_loss": -6.193028450012207, "global_step": 96243, "epoch": 2291} {"train_loss": -6.29469108581543, "global_step": 96244, "epoch": 2291} {"train_loss": -6.16790771484375, "global_step": 96245, "epoch": 2291} {"train_loss": -6.276302814483643, "global_step": 96246, "epoch": 2291} {"train_loss": -6.284672260284424, "global_step": 96247, "epoch": 2291} {"train_loss": -6.239556789398193, "global_step": 96248, "epoch": 2291} {"train_loss": -6.352636814117432, "global_step": 96249, "epoch": 2291} {"train_loss": -6.183776378631592, "global_step": 96250, "epoch": 2291} {"train_loss": -6.36988639831543, "global_step": 96251, "epoch": 2291} {"train_loss": -6.154495716094971, "global_step": 96252, "epoch": 2291} {"train_loss": -6.296267509460449, "global_step": 96253, "epoch": 2291} {"train_loss": -6.1094441413879395, "global_step": 96254, "epoch": 2291} {"train_loss": -6.2428765296936035, "global_step": 96255, "epoch": 2291} {"train_loss": -6.331687927246094, "global_step": 96256, "epoch": 2291} {"train_loss": -6.388790130615234, "global_step": 96257, "epoch": 2291} {"train_loss": -6.2016754150390625, "global_step": 96258, "epoch": 2291} {"train_loss": -6.3223161697387695, "global_step": 96259, "epoch": 2291} {"train_loss": -6.375811576843262, "global_step": 96260, "epoch": 2291} {"train_loss": -6.231393337249756, "global_step": 96261, "epoch": 2291} {"train_loss": -6.315025329589844, "global_step": 96262, "epoch": 2291} {"train_loss": -6.227313904535203, "global_step": 96263, "epoch": 2291, "val_loss": 75642.6484375} {"train_loss": -6.356233596801758, "global_step": 96264, "epoch": 2292} {"train_loss": -6.291841506958008, "global_step": 96265, "epoch": 2292} {"train_loss": -6.174310207366943, "global_step": 96266, "epoch": 2292} {"train_loss": -6.26082181930542, "global_step": 96267, "epoch": 2292} {"train_loss": -6.187485218048096, "global_step": 96268, "epoch": 2292} {"train_loss": -6.369817733764648, "global_step": 96269, "epoch": 2292} {"train_loss": -6.261868476867676, "global_step": 96270, "epoch": 2292} {"train_loss": -6.1268157958984375, "global_step": 96271, "epoch": 2292} {"train_loss": -6.156024932861328, "global_step": 96272, "epoch": 2292} {"train_loss": -6.235080718994141, "global_step": 96273, "epoch": 2292} {"train_loss": -6.293849945068359, "global_step": 96274, "epoch": 2292} {"train_loss": -5.95240592956543, "global_step": 96275, "epoch": 2292} {"train_loss": -6.295070648193359, "global_step": 96276, "epoch": 2292} {"train_loss": -6.117631912231445, "global_step": 96277, "epoch": 2292} {"train_loss": -6.185775279998779, "global_step": 96278, "epoch": 2292} {"train_loss": -6.304006576538086, "global_step": 96279, "epoch": 2292} {"train_loss": -6.124936103820801, "global_step": 96280, "epoch": 2292} {"train_loss": -6.340493202209473, "global_step": 96281, "epoch": 2292} {"train_loss": -6.021668434143066, "global_step": 96282, "epoch": 2292} {"train_loss": -6.297427654266357, "global_step": 96283, "epoch": 2292} {"train_loss": -6.193441390991211, "global_step": 96284, "epoch": 2292} {"train_loss": -6.328424453735352, "global_step": 96285, "epoch": 2292} {"train_loss": -6.156323432922363, "global_step": 96286, "epoch": 2292} {"train_loss": -6.292091369628906, "global_step": 96287, "epoch": 2292} {"train_loss": -6.09884786605835, "global_step": 96288, "epoch": 2292} {"train_loss": -6.148226737976074, "global_step": 96289, "epoch": 2292} {"train_loss": -6.271602630615234, "global_step": 96290, "epoch": 2292} {"train_loss": -6.255969047546387, "global_step": 96291, "epoch": 2292} {"train_loss": -6.263333797454834, "global_step": 96292, "epoch": 2292} {"train_loss": -6.133166313171387, "global_step": 96293, "epoch": 2292} {"train_loss": -6.215793609619141, "global_step": 96294, "epoch": 2292} {"train_loss": -6.21534538269043, "global_step": 96295, "epoch": 2292} {"train_loss": -6.322277545928955, "global_step": 96296, "epoch": 2292} {"train_loss": -6.293951034545898, "global_step": 96297, "epoch": 2292} {"train_loss": -6.24439811706543, "global_step": 96298, "epoch": 2292} {"train_loss": -6.245234489440918, "global_step": 96299, "epoch": 2292} {"train_loss": -6.332045555114746, "global_step": 96300, "epoch": 2292} {"train_loss": -6.198328018188477, "global_step": 96301, "epoch": 2292} {"train_loss": -6.234259128570557, "global_step": 96302, "epoch": 2292} {"train_loss": -6.378845691680908, "global_step": 96303, "epoch": 2292} {"train_loss": -6.2363128662109375, "global_step": 96304, "epoch": 2292} {"train_loss": -6.228998331796555, "global_step": 96305, "epoch": 2292, "val_loss": 76044.078125} {"train_loss": -6.37367582321167, "global_step": 96306, "epoch": 2293} {"train_loss": -6.189969062805176, "global_step": 96307, "epoch": 2293} {"train_loss": -6.2598490715026855, "global_step": 96308, "epoch": 2293} {"train_loss": -6.3359694480896, "global_step": 96309, "epoch": 2293} {"train_loss": -6.358948230743408, "global_step": 96310, "epoch": 2293} {"train_loss": -6.252282619476318, "global_step": 96311, "epoch": 2293} {"train_loss": -6.323302745819092, "global_step": 96312, "epoch": 2293} {"train_loss": -6.304577827453613, "global_step": 96313, "epoch": 2293} {"train_loss": -6.154368877410889, "global_step": 96314, "epoch": 2293} {"train_loss": -6.325217247009277, "global_step": 96315, "epoch": 2293} {"train_loss": -6.276841163635254, "global_step": 96316, "epoch": 2293} {"train_loss": -6.2264909744262695, "global_step": 96317, "epoch": 2293} {"train_loss": -6.316884994506836, "global_step": 96318, "epoch": 2293} {"train_loss": -6.261183261871338, "global_step": 96319, "epoch": 2293} {"train_loss": -6.397701740264893, "global_step": 96320, "epoch": 2293} {"train_loss": -6.29847526550293, "global_step": 96321, "epoch": 2293} {"train_loss": -6.25699520111084, "global_step": 96322, "epoch": 2293} {"train_loss": -6.288548469543457, "global_step": 96323, "epoch": 2293} {"train_loss": -6.2395830154418945, "global_step": 96324, "epoch": 2293} {"train_loss": -6.357119083404541, "global_step": 96325, "epoch": 2293} {"train_loss": -6.309413433074951, "global_step": 96326, "epoch": 2293} {"train_loss": -6.351728439331055, "global_step": 96327, "epoch": 2293} {"train_loss": -6.380056381225586, "global_step": 96328, "epoch": 2293} {"train_loss": -6.2920756340026855, "global_step": 96329, "epoch": 2293} {"train_loss": -6.49141788482666, "global_step": 96330, "epoch": 2293} {"train_loss": -6.416075706481934, "global_step": 96331, "epoch": 2293} {"train_loss": -6.306790351867676, "global_step": 96332, "epoch": 2293} {"train_loss": -6.327864646911621, "global_step": 96333, "epoch": 2293} {"train_loss": -6.273346424102783, "global_step": 96334, "epoch": 2293} {"train_loss": -6.582005023956299, "global_step": 96335, "epoch": 2293} {"train_loss": -6.437121391296387, "global_step": 96336, "epoch": 2293} {"train_loss": -6.400725364685059, "global_step": 96337, "epoch": 2293} {"train_loss": -6.248382568359375, "global_step": 96338, "epoch": 2293} {"train_loss": -6.290947914123535, "global_step": 96339, "epoch": 2293} {"train_loss": -6.368546485900879, "global_step": 96340, "epoch": 2293} {"train_loss": -6.411599636077881, "global_step": 96341, "epoch": 2293} {"train_loss": -6.384956359863281, "global_step": 96342, "epoch": 2293} {"train_loss": -6.324702739715576, "global_step": 96343, "epoch": 2293} {"train_loss": -6.231675148010254, "global_step": 96344, "epoch": 2293} {"train_loss": -6.342493057250977, "global_step": 96345, "epoch": 2293} {"train_loss": -6.312834739685059, "global_step": 96346, "epoch": 2293} {"train_loss": -6.325521253404164, "global_step": 96347, "epoch": 2293, "val_loss": 75552.8515625} {"train_loss": -6.2643890380859375, "global_step": 96348, "epoch": 2294} {"train_loss": -6.2177324295043945, "global_step": 96349, "epoch": 2294} {"train_loss": -6.347393035888672, "global_step": 96350, "epoch": 2294} {"train_loss": -6.4833784103393555, "global_step": 96351, "epoch": 2294} {"train_loss": -6.377099990844727, "global_step": 96352, "epoch": 2294} {"train_loss": -6.398011684417725, "global_step": 96353, "epoch": 2294} {"train_loss": -6.3114399909973145, "global_step": 96354, "epoch": 2294} {"train_loss": -6.358739852905273, "global_step": 96355, "epoch": 2294} {"train_loss": -6.2677531242370605, "global_step": 96356, "epoch": 2294} {"train_loss": -6.304701805114746, "global_step": 96357, "epoch": 2294} {"train_loss": -6.297677040100098, "global_step": 96358, "epoch": 2294} {"train_loss": -6.323668479919434, "global_step": 96359, "epoch": 2294} {"train_loss": -6.283365249633789, "global_step": 96360, "epoch": 2294} {"train_loss": -6.241939544677734, "global_step": 96361, "epoch": 2294} {"train_loss": -6.365868091583252, "global_step": 96362, "epoch": 2294} {"train_loss": -6.262033462524414, "global_step": 96363, "epoch": 2294} {"train_loss": -6.395756721496582, "global_step": 96364, "epoch": 2294} {"train_loss": -6.3040924072265625, "global_step": 96365, "epoch": 2294} {"train_loss": -6.308592319488525, "global_step": 96366, "epoch": 2294} {"train_loss": -6.371983051300049, "global_step": 96367, "epoch": 2294} {"train_loss": -6.294090270996094, "global_step": 96368, "epoch": 2294} {"train_loss": -6.312676429748535, "global_step": 96369, "epoch": 2294} {"train_loss": -6.321512222290039, "global_step": 96370, "epoch": 2294} {"train_loss": -6.403135776519775, "global_step": 96371, "epoch": 2294} {"train_loss": -6.281952857971191, "global_step": 96372, "epoch": 2294} {"train_loss": -6.342626094818115, "global_step": 96373, "epoch": 2294} {"train_loss": -6.3413472175598145, "global_step": 96374, "epoch": 2294} {"train_loss": -6.245692729949951, "global_step": 96375, "epoch": 2294} {"train_loss": -6.353443145751953, "global_step": 96376, "epoch": 2294} {"train_loss": -6.40507173538208, "global_step": 96377, "epoch": 2294} {"train_loss": -6.37027645111084, "global_step": 96378, "epoch": 2294} {"train_loss": -6.440910816192627, "global_step": 96379, "epoch": 2294} {"train_loss": -6.309913635253906, "global_step": 96380, "epoch": 2294} {"train_loss": -6.324782371520996, "global_step": 96381, "epoch": 2294} {"train_loss": -6.247610092163086, "global_step": 96382, "epoch": 2294} {"train_loss": -6.396387100219727, "global_step": 96383, "epoch": 2294} {"train_loss": -6.323026180267334, "global_step": 96384, "epoch": 2294} {"train_loss": -6.376579284667969, "global_step": 96385, "epoch": 2294} {"train_loss": -6.302301406860352, "global_step": 96386, "epoch": 2294} {"train_loss": -6.232505798339844, "global_step": 96387, "epoch": 2294} {"train_loss": -6.320964813232422, "global_step": 96388, "epoch": 2294} {"train_loss": -6.328102282115391, "global_step": 96389, "epoch": 2294, "val_loss": 75890.5625} {"train_loss": -6.3028693199157715, "global_step": 96390, "epoch": 2295} {"train_loss": -6.328412055969238, "global_step": 96391, "epoch": 2295} {"train_loss": -6.320079803466797, "global_step": 96392, "epoch": 2295} {"train_loss": -6.238825798034668, "global_step": 96393, "epoch": 2295} {"train_loss": -6.325244903564453, "global_step": 96394, "epoch": 2295} {"train_loss": -6.3317437171936035, "global_step": 96395, "epoch": 2295} {"train_loss": -6.280486583709717, "global_step": 96396, "epoch": 2295} {"train_loss": -6.424500465393066, "global_step": 96397, "epoch": 2295} {"train_loss": -6.3725690841674805, "global_step": 96398, "epoch": 2295} {"train_loss": -6.319446563720703, "global_step": 96399, "epoch": 2295} {"train_loss": -6.284379005432129, "global_step": 96400, "epoch": 2295} {"train_loss": -6.292104721069336, "global_step": 96401, "epoch": 2295} {"train_loss": -6.398083686828613, "global_step": 96402, "epoch": 2295} {"train_loss": -6.319579124450684, "global_step": 96403, "epoch": 2295} {"train_loss": -6.369389057159424, "global_step": 96404, "epoch": 2295} {"train_loss": -6.423231601715088, "global_step": 96405, "epoch": 2295} {"train_loss": -6.25766658782959, "global_step": 96406, "epoch": 2295} {"train_loss": -6.31766414642334, "global_step": 96407, "epoch": 2295} {"train_loss": -6.298090934753418, "global_step": 96408, "epoch": 2295} {"train_loss": -6.379827499389648, "global_step": 96409, "epoch": 2295} {"train_loss": -6.352911949157715, "global_step": 96410, "epoch": 2295} {"train_loss": -6.267805099487305, "global_step": 96411, "epoch": 2295} {"train_loss": -6.3480544090271, "global_step": 96412, "epoch": 2295} {"train_loss": -6.212299346923828, "global_step": 96413, "epoch": 2295} {"train_loss": -6.416678428649902, "global_step": 96414, "epoch": 2295} {"train_loss": -6.302947998046875, "global_step": 96415, "epoch": 2295} {"train_loss": -6.335697174072266, "global_step": 96416, "epoch": 2295} {"train_loss": -6.357309818267822, "global_step": 96417, "epoch": 2295} {"train_loss": -6.370350360870361, "global_step": 96418, "epoch": 2295} {"train_loss": -6.254127025604248, "global_step": 96419, "epoch": 2295} {"train_loss": -6.322756767272949, "global_step": 96420, "epoch": 2295} {"train_loss": -6.394192695617676, "global_step": 96421, "epoch": 2295} {"train_loss": -6.419678688049316, "global_step": 96422, "epoch": 2295} {"train_loss": -6.255121231079102, "global_step": 96423, "epoch": 2295} {"train_loss": -6.303033828735352, "global_step": 96424, "epoch": 2295} {"train_loss": -6.266541957855225, "global_step": 96425, "epoch": 2295} {"train_loss": -6.291302680969238, "global_step": 96426, "epoch": 2295} {"train_loss": -6.321943283081055, "global_step": 96427, "epoch": 2295} {"train_loss": -6.169658660888672, "global_step": 96428, "epoch": 2295} {"train_loss": -6.40008544921875, "global_step": 96429, "epoch": 2295} {"train_loss": -6.341383934020996, "global_step": 96430, "epoch": 2295} {"train_loss": -6.319918666567121, "global_step": 96431, "epoch": 2295, "val_loss": 75461.015625} {"train_loss": -6.1815900802612305, "global_step": 96432, "epoch": 2296} {"train_loss": -6.219508647918701, "global_step": 96433, "epoch": 2296} {"train_loss": -6.2420196533203125, "global_step": 96434, "epoch": 2296} {"train_loss": -6.415122985839844, "global_step": 96435, "epoch": 2296} {"train_loss": -6.16825532913208, "global_step": 96436, "epoch": 2296} {"train_loss": -6.347601890563965, "global_step": 96437, "epoch": 2296} {"train_loss": -6.2424492835998535, "global_step": 96438, "epoch": 2296} {"train_loss": -6.223845481872559, "global_step": 96439, "epoch": 2296} {"train_loss": -6.192987442016602, "global_step": 96440, "epoch": 2296} {"train_loss": -6.255496501922607, "global_step": 96441, "epoch": 2296} {"train_loss": -6.266695976257324, "global_step": 96442, "epoch": 2296} {"train_loss": -6.21585750579834, "global_step": 96443, "epoch": 2296} {"train_loss": -6.100984573364258, "global_step": 96444, "epoch": 2296} {"train_loss": -6.311611175537109, "global_step": 96445, "epoch": 2296} {"train_loss": -6.213191032409668, "global_step": 96446, "epoch": 2296} {"train_loss": -6.2353010177612305, "global_step": 96447, "epoch": 2296} {"train_loss": -6.269340991973877, "global_step": 96448, "epoch": 2296} {"train_loss": -6.290422439575195, "global_step": 96449, "epoch": 2296} {"train_loss": -6.334037780761719, "global_step": 96450, "epoch": 2296} {"train_loss": -6.351200103759766, "global_step": 96451, "epoch": 2296} {"train_loss": -6.256657600402832, "global_step": 96452, "epoch": 2296} {"train_loss": -6.419768333435059, "global_step": 96453, "epoch": 2296} {"train_loss": -6.363580226898193, "global_step": 96454, "epoch": 2296} {"train_loss": -6.329502105712891, "global_step": 96455, "epoch": 2296} {"train_loss": -6.221505165100098, "global_step": 96456, "epoch": 2296} {"train_loss": -6.335443496704102, "global_step": 96457, "epoch": 2296} {"train_loss": -6.3015875816345215, "global_step": 96458, "epoch": 2296} {"train_loss": -6.355709075927734, "global_step": 96459, "epoch": 2296} {"train_loss": -6.310478210449219, "global_step": 96460, "epoch": 2296} {"train_loss": -6.309680461883545, "global_step": 96461, "epoch": 2296} {"train_loss": -6.352568626403809, "global_step": 96462, "epoch": 2296} {"train_loss": -6.28800106048584, "global_step": 96463, "epoch": 2296} {"train_loss": -6.316549777984619, "global_step": 96464, "epoch": 2296} {"train_loss": -6.410928726196289, "global_step": 96465, "epoch": 2296} {"train_loss": -6.185639381408691, "global_step": 96466, "epoch": 2296} {"train_loss": -6.2198686599731445, "global_step": 96467, "epoch": 2296} {"train_loss": -6.318031311035156, "global_step": 96468, "epoch": 2296} {"train_loss": -6.462164878845215, "global_step": 96469, "epoch": 2296} {"train_loss": -6.315887451171875, "global_step": 96470, "epoch": 2296} {"train_loss": -6.30719518661499, "global_step": 96471, "epoch": 2296} {"train_loss": -6.342405319213867, "global_step": 96472, "epoch": 2296} {"train_loss": -6.287100712458293, "global_step": 96473, "epoch": 2296, "val_loss": 75687.96875} {"train_loss": -6.401784896850586, "global_step": 96474, "epoch": 2297} {"train_loss": -6.225622177124023, "global_step": 96475, "epoch": 2297} {"train_loss": -6.28353214263916, "global_step": 96476, "epoch": 2297} {"train_loss": -6.360955715179443, "global_step": 96477, "epoch": 2297} {"train_loss": -6.335333824157715, "global_step": 96478, "epoch": 2297} {"train_loss": -6.340889930725098, "global_step": 96479, "epoch": 2297} {"train_loss": -6.33817195892334, "global_step": 96480, "epoch": 2297} {"train_loss": -6.288211822509766, "global_step": 96481, "epoch": 2297} {"train_loss": -6.392670631408691, "global_step": 96482, "epoch": 2297} {"train_loss": -6.304592609405518, "global_step": 96483, "epoch": 2297} {"train_loss": -6.3813886642456055, "global_step": 96484, "epoch": 2297} {"train_loss": -6.321647644042969, "global_step": 96485, "epoch": 2297} {"train_loss": -6.357456684112549, "global_step": 96486, "epoch": 2297} {"train_loss": -6.308321475982666, "global_step": 96487, "epoch": 2297} {"train_loss": -6.228201866149902, "global_step": 96488, "epoch": 2297} {"train_loss": -6.334021091461182, "global_step": 96489, "epoch": 2297} {"train_loss": -6.406681060791016, "global_step": 96490, "epoch": 2297} {"train_loss": -6.213901996612549, "global_step": 96491, "epoch": 2297} {"train_loss": -6.424830913543701, "global_step": 96492, "epoch": 2297} {"train_loss": -6.29399299621582, "global_step": 96493, "epoch": 2297} {"train_loss": -6.300045013427734, "global_step": 96494, "epoch": 2297} {"train_loss": -6.243070125579834, "global_step": 96495, "epoch": 2297} {"train_loss": -6.270532608032227, "global_step": 96496, "epoch": 2297} {"train_loss": -6.2494425773620605, "global_step": 96497, "epoch": 2297} {"train_loss": -6.242043495178223, "global_step": 96498, "epoch": 2297} {"train_loss": -6.205327033996582, "global_step": 96499, "epoch": 2297} {"train_loss": -6.130887031555176, "global_step": 96500, "epoch": 2297} {"train_loss": -6.2590012550354, "global_step": 96501, "epoch": 2297} {"train_loss": -6.191562175750732, "global_step": 96502, "epoch": 2297} {"train_loss": -6.327359676361084, "global_step": 96503, "epoch": 2297} {"train_loss": -6.395705699920654, "global_step": 96504, "epoch": 2297} {"train_loss": -6.1892805099487305, "global_step": 96505, "epoch": 2297} {"train_loss": -6.329773902893066, "global_step": 96506, "epoch": 2297} {"train_loss": -6.3798441886901855, "global_step": 96507, "epoch": 2297} {"train_loss": -6.322052955627441, "global_step": 96508, "epoch": 2297} {"train_loss": -6.313455581665039, "global_step": 96509, "epoch": 2297} {"train_loss": -6.20540189743042, "global_step": 96510, "epoch": 2297} {"train_loss": -6.349699974060059, "global_step": 96511, "epoch": 2297} {"train_loss": -6.296242713928223, "global_step": 96512, "epoch": 2297} {"train_loss": -6.302483558654785, "global_step": 96513, "epoch": 2297} {"train_loss": -6.244924545288086, "global_step": 96514, "epoch": 2297} {"train_loss": -6.297494945071993, "global_step": 96515, "epoch": 2297, "val_loss": 75700.3203125} {"train_loss": -6.248897552490234, "global_step": 96516, "epoch": 2298} {"train_loss": -6.254719257354736, "global_step": 96517, "epoch": 2298} {"train_loss": -6.389528274536133, "global_step": 96518, "epoch": 2298} {"train_loss": -6.392942905426025, "global_step": 96519, "epoch": 2298} {"train_loss": -6.229608058929443, "global_step": 96520, "epoch": 2298} {"train_loss": -6.317280292510986, "global_step": 96521, "epoch": 2298} {"train_loss": -6.255270004272461, "global_step": 96522, "epoch": 2298} {"train_loss": -6.397378921508789, "global_step": 96523, "epoch": 2298} {"train_loss": -6.406442642211914, "global_step": 96524, "epoch": 2298} {"train_loss": -6.332986831665039, "global_step": 96525, "epoch": 2298} {"train_loss": -6.4804463386535645, "global_step": 96526, "epoch": 2298} {"train_loss": -6.297882556915283, "global_step": 96527, "epoch": 2298} {"train_loss": -6.308619499206543, "global_step": 96528, "epoch": 2298} {"train_loss": -6.36156702041626, "global_step": 96529, "epoch": 2298} {"train_loss": -6.332050323486328, "global_step": 96530, "epoch": 2298} {"train_loss": -6.305240631103516, "global_step": 96531, "epoch": 2298} {"train_loss": -6.446011543273926, "global_step": 96532, "epoch": 2298} {"train_loss": -6.326169013977051, "global_step": 96533, "epoch": 2298} {"train_loss": -6.424766540527344, "global_step": 96534, "epoch": 2298} {"train_loss": -6.338474273681641, "global_step": 96535, "epoch": 2298} {"train_loss": -6.374274253845215, "global_step": 96536, "epoch": 2298} {"train_loss": -6.466151237487793, "global_step": 96537, "epoch": 2298} {"train_loss": -6.371938705444336, "global_step": 96538, "epoch": 2298} {"train_loss": -6.333148956298828, "global_step": 96539, "epoch": 2298} {"train_loss": -6.37908411026001, "global_step": 96540, "epoch": 2298} {"train_loss": -6.35222053527832, "global_step": 96541, "epoch": 2298} {"train_loss": -6.387284278869629, "global_step": 96542, "epoch": 2298} {"train_loss": -6.315957069396973, "global_step": 96543, "epoch": 2298} {"train_loss": -6.36055326461792, "global_step": 96544, "epoch": 2298} {"train_loss": -6.159930229187012, "global_step": 96545, "epoch": 2298} {"train_loss": -6.311044692993164, "global_step": 96546, "epoch": 2298} {"train_loss": -6.283015251159668, "global_step": 96547, "epoch": 2298} {"train_loss": -5.9736762046813965, "global_step": 96548, "epoch": 2298} {"train_loss": -6.214024543762207, "global_step": 96549, "epoch": 2298} {"train_loss": -6.362274169921875, "global_step": 96550, "epoch": 2298} {"train_loss": -6.213202476501465, "global_step": 96551, "epoch": 2298} {"train_loss": -6.35803747177124, "global_step": 96552, "epoch": 2298} {"train_loss": -6.1776580810546875, "global_step": 96553, "epoch": 2298} {"train_loss": -6.322980880737305, "global_step": 96554, "epoch": 2298} {"train_loss": -6.209877967834473, "global_step": 96555, "epoch": 2298} {"train_loss": -6.088809967041016, "global_step": 96556, "epoch": 2298} {"train_loss": -6.313528832935152, "global_step": 96557, "epoch": 2298, "val_loss": 76053.3046875} {"train_loss": -6.185174942016602, "global_step": 96558, "epoch": 2299} {"train_loss": -6.268612384796143, "global_step": 96559, "epoch": 2299} {"train_loss": -6.248531341552734, "global_step": 96560, "epoch": 2299} {"train_loss": -6.212716579437256, "global_step": 96561, "epoch": 2299} {"train_loss": -6.366298675537109, "global_step": 96562, "epoch": 2299} {"train_loss": -6.165921211242676, "global_step": 96563, "epoch": 2299} {"train_loss": -6.197658061981201, "global_step": 96564, "epoch": 2299} {"train_loss": -6.1395063400268555, "global_step": 96565, "epoch": 2299} {"train_loss": -6.354808807373047, "global_step": 96566, "epoch": 2299} {"train_loss": -6.291805744171143, "global_step": 96567, "epoch": 2299} {"train_loss": -6.286243915557861, "global_step": 96568, "epoch": 2299} {"train_loss": -6.232043266296387, "global_step": 96569, "epoch": 2299} {"train_loss": -6.38374137878418, "global_step": 96570, "epoch": 2299} {"train_loss": -6.229736804962158, "global_step": 96571, "epoch": 2299} {"train_loss": -6.192305088043213, "global_step": 96572, "epoch": 2299} {"train_loss": -6.172459602355957, "global_step": 96573, "epoch": 2299} {"train_loss": -6.343966484069824, "global_step": 96574, "epoch": 2299} {"train_loss": -6.278214454650879, "global_step": 96575, "epoch": 2299} {"train_loss": -6.263943672180176, "global_step": 96576, "epoch": 2299} {"train_loss": -6.219203948974609, "global_step": 96577, "epoch": 2299} {"train_loss": -6.199072360992432, "global_step": 96578, "epoch": 2299} {"train_loss": -6.265358924865723, "global_step": 96579, "epoch": 2299} {"train_loss": -6.348638534545898, "global_step": 96580, "epoch": 2299} {"train_loss": -6.290959358215332, "global_step": 96581, "epoch": 2299} {"train_loss": -6.176813125610352, "global_step": 96582, "epoch": 2299} {"train_loss": -6.282942771911621, "global_step": 96583, "epoch": 2299} {"train_loss": -6.2150163650512695, "global_step": 96584, "epoch": 2299} {"train_loss": -6.116158485412598, "global_step": 96585, "epoch": 2299} {"train_loss": -6.153271198272705, "global_step": 96586, "epoch": 2299} {"train_loss": -6.206365585327148, "global_step": 96587, "epoch": 2299} {"train_loss": -6.214786052703857, "global_step": 96588, "epoch": 2299} {"train_loss": -6.107971668243408, "global_step": 96589, "epoch": 2299} {"train_loss": -6.218485355377197, "global_step": 96590, "epoch": 2299} {"train_loss": -6.116086483001709, "global_step": 96591, "epoch": 2299} {"train_loss": -6.168924331665039, "global_step": 96592, "epoch": 2299} {"train_loss": -6.132876396179199, "global_step": 96593, "epoch": 2299} {"train_loss": -6.167219161987305, "global_step": 96594, "epoch": 2299} {"train_loss": -5.919253826141357, "global_step": 96595, "epoch": 2299} {"train_loss": -6.215566635131836, "global_step": 96596, "epoch": 2299} {"train_loss": -6.147041320800781, "global_step": 96597, "epoch": 2299} {"train_loss": -6.299056053161621, "global_step": 96598, "epoch": 2299} {"train_loss": -6.219741242272513, "global_step": 96599, "epoch": 2299, "val_loss": 75624.3125} {"train_loss": -6.294245719909668, "global_step": 96600, "epoch": 2300} {"train_loss": -6.299029350280762, "global_step": 96601, "epoch": 2300} {"train_loss": -6.177393436431885, "global_step": 96602, "epoch": 2300} {"train_loss": -6.229591369628906, "global_step": 96603, "epoch": 2300} {"train_loss": -6.269611358642578, "global_step": 96604, "epoch": 2300} {"train_loss": -6.216799736022949, "global_step": 96605, "epoch": 2300} {"train_loss": -6.255363464355469, "global_step": 96606, "epoch": 2300} {"train_loss": -6.296875953674316, "global_step": 96607, "epoch": 2300} {"train_loss": -6.333327293395996, "global_step": 96608, "epoch": 2300} {"train_loss": -6.224352836608887, "global_step": 96609, "epoch": 2300} {"train_loss": -6.301759719848633, "global_step": 96610, "epoch": 2300} {"train_loss": -6.259333610534668, "global_step": 96611, "epoch": 2300} {"train_loss": -6.314337730407715, "global_step": 96612, "epoch": 2300} {"train_loss": -6.256564140319824, "global_step": 96613, "epoch": 2300} {"train_loss": -6.378777503967285, "global_step": 96614, "epoch": 2300} {"train_loss": -6.240538597106934, "global_step": 96615, "epoch": 2300} {"train_loss": -6.20613956451416, "global_step": 96616, "epoch": 2300} {"train_loss": -6.3251142501831055, "global_step": 96617, "epoch": 2300} {"train_loss": -6.301178932189941, "global_step": 96618, "epoch": 2300} {"train_loss": -6.340771198272705, "global_step": 96619, "epoch": 2300} {"train_loss": -6.299323558807373, "global_step": 96620, "epoch": 2300} {"train_loss": -6.309271812438965, "global_step": 96621, "epoch": 2300} {"train_loss": -6.3445844650268555, "global_step": 96622, "epoch": 2300} {"train_loss": -6.43051815032959, "global_step": 96623, "epoch": 2300} {"train_loss": -6.361104965209961, "global_step": 96624, "epoch": 2300} {"train_loss": -6.327486515045166, "global_step": 96625, "epoch": 2300} {"train_loss": -6.332161903381348, "global_step": 96626, "epoch": 2300} {"train_loss": -6.360873222351074, "global_step": 96627, "epoch": 2300} {"train_loss": -6.3050103187561035, "global_step": 96628, "epoch": 2300} {"train_loss": -6.325823783874512, "global_step": 96629, "epoch": 2300} {"train_loss": -6.279210090637207, "global_step": 96630, "epoch": 2300} {"train_loss": -6.323706150054932, "global_step": 96631, "epoch": 2300} {"train_loss": -6.415218830108643, "global_step": 96632, "epoch": 2300} {"train_loss": -6.278448104858398, "global_step": 96633, "epoch": 2300} {"train_loss": -6.3889055252075195, "global_step": 96634, "epoch": 2300} {"train_loss": -6.28541374206543, "global_step": 96635, "epoch": 2300} {"train_loss": -6.309825420379639, "global_step": 96636, "epoch": 2300} {"train_loss": -6.365571975708008, "global_step": 96637, "epoch": 2300} {"train_loss": -6.3248677253723145, "global_step": 96638, "epoch": 2300} {"train_loss": -6.342063903808594, "global_step": 96639, "epoch": 2300} {"train_loss": -6.1512017250061035, "global_step": 96640, "epoch": 2300} {"train_loss": -6.304908445903233, "global_step": 96641, "epoch": 2300, "train/sim_max_reward_0": 0.9125097886544818, "train/sim_max_reward_1": 0.8333318483706509, "train/sim_max_reward_2": 0.32442534752117175, "train/sim_max_reward_3": 0.8599783197058315, "train/sim_max_reward_4": 0.3176431889572424, "train/sim_max_reward_5": 0.8849646869582182, "test/sim_max_reward_4500000": 0.8476156489231087, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9680742480722836, "test/sim_max_reward_4500004": 0.18656544055348395, "test/sim_max_reward_4500005": 0.8073512956530589, "test/sim_max_reward_4500006": 0.9876678091688389, "test/sim_max_reward_4500007": 0.9845763737982668, "test/sim_max_reward_4500008": 0.30438960929982656, "test/sim_max_reward_4500009": 0.05353374066283431, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.8383040663936585, "test/sim_max_reward_4500012": 0.9725360770198006, "test/sim_max_reward_4500013": 0.02009269256700699, "test/sim_max_reward_4500014": 0.37773716570850724, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.026003035567297106, "test/sim_max_reward_4500018": 0.9796070748232483, "test/sim_max_reward_4500019": 0.9613394144569445, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9383180935229581, "test/sim_max_reward_4500022": 0.9558589526417597, "test/sim_max_reward_4500023": 0.9392031770894999, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9468022470712184, "test/sim_max_reward_4500026": 0.9863162540581037, "test/sim_max_reward_4500027": 0.8782667377642627, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.07037686006036144, "test/sim_max_reward_4500030": 0.9505133783760732, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0641120893556327, "test/sim_max_reward_4500033": 0.38466663323885325, "test/sim_max_reward_4500034": 0.8596480130059215, "test/sim_max_reward_4500035": 0.9863249831475104, "test/sim_max_reward_4500036": 0.4449282695116453, "test/sim_max_reward_4500037": 0.9526522474454789, "test/sim_max_reward_4500038": 0.984618054102326, "test/sim_max_reward_4500039": 0.9673459635924461, "test/sim_max_reward_4500040": 0.8750605589991471, "test/sim_max_reward_4500041": 0.9952003791815104, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.15224275556350286, "test/sim_max_reward_4500044": 0.3653931407285698, "test/sim_max_reward_4500045": 0.7729370579170834, "test/sim_max_reward_4500046": 0.8954759451946338, "test/sim_max_reward_4500047": 0.8995473891344057, "test/sim_max_reward_4500048": 0.9654345623996904, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.688808863361266, "test/mean_score": 0.5954959740344421, "val_loss": 75714.1484375} {"train_loss": -6.367247104644775, "global_step": 96642, "epoch": 2301} {"train_loss": -6.433650970458984, "global_step": 96643, "epoch": 2301} {"train_loss": -6.239617824554443, "global_step": 96644, "epoch": 2301} {"train_loss": -6.436140537261963, "global_step": 96645, "epoch": 2301} {"train_loss": -6.281982421875, "global_step": 96646, "epoch": 2301} {"train_loss": -6.326284408569336, "global_step": 96647, "epoch": 2301} {"train_loss": -6.331046104431152, "global_step": 96648, "epoch": 2301} {"train_loss": -6.379034519195557, "global_step": 96649, "epoch": 2301} {"train_loss": -6.344015598297119, "global_step": 96650, "epoch": 2301} {"train_loss": -6.234701156616211, "global_step": 96651, "epoch": 2301} {"train_loss": -6.27301025390625, "global_step": 96652, "epoch": 2301} {"train_loss": -6.255984306335449, "global_step": 96653, "epoch": 2301} {"train_loss": -6.295666694641113, "global_step": 96654, "epoch": 2301} {"train_loss": -6.277215957641602, "global_step": 96655, "epoch": 2301} {"train_loss": -6.267620086669922, "global_step": 96656, "epoch": 2301} {"train_loss": -6.296133995056152, "global_step": 96657, "epoch": 2301} {"train_loss": -6.305925369262695, "global_step": 96658, "epoch": 2301} {"train_loss": -6.288030624389648, "global_step": 96659, "epoch": 2301} {"train_loss": -6.483979225158691, "global_step": 96660, "epoch": 2301} {"train_loss": -6.342411041259766, "global_step": 96661, "epoch": 2301} {"train_loss": -6.355609893798828, "global_step": 96662, "epoch": 2301} {"train_loss": -6.295953273773193, "global_step": 96663, "epoch": 2301} {"train_loss": -6.414935111999512, "global_step": 96664, "epoch": 2301} {"train_loss": -6.300581932067871, "global_step": 96665, "epoch": 2301} {"train_loss": -6.313137054443359, "global_step": 96666, "epoch": 2301} {"train_loss": -6.326286792755127, "global_step": 96667, "epoch": 2301} {"train_loss": -6.379934310913086, "global_step": 96668, "epoch": 2301} {"train_loss": -6.321928977966309, "global_step": 96669, "epoch": 2301} {"train_loss": -6.3592448234558105, "global_step": 96670, "epoch": 2301} {"train_loss": -6.266148090362549, "global_step": 96671, "epoch": 2301} {"train_loss": -6.320955753326416, "global_step": 96672, "epoch": 2301} {"train_loss": -6.314813613891602, "global_step": 96673, "epoch": 2301} {"train_loss": -6.3107075691223145, "global_step": 96674, "epoch": 2301} {"train_loss": -6.360265254974365, "global_step": 96675, "epoch": 2301} {"train_loss": -6.39518928527832, "global_step": 96676, "epoch": 2301} {"train_loss": -6.395178318023682, "global_step": 96677, "epoch": 2301} {"train_loss": -6.34736442565918, "global_step": 96678, "epoch": 2301} {"train_loss": -6.242124557495117, "global_step": 96679, "epoch": 2301} {"train_loss": -6.311406135559082, "global_step": 96680, "epoch": 2301} {"train_loss": -6.36966609954834, "global_step": 96681, "epoch": 2301} {"train_loss": -6.268174648284912, "global_step": 96682, "epoch": 2301} {"train_loss": -6.329173076720465, "global_step": 96683, "epoch": 2301, "val_loss": 75504.25} {"train_loss": -6.369644641876221, "global_step": 96684, "epoch": 2302} {"train_loss": -6.4195356369018555, "global_step": 96685, "epoch": 2302} {"train_loss": -6.302811622619629, "global_step": 96686, "epoch": 2302} {"train_loss": -6.3424530029296875, "global_step": 96687, "epoch": 2302} {"train_loss": -6.357001304626465, "global_step": 96688, "epoch": 2302} {"train_loss": -6.384530067443848, "global_step": 96689, "epoch": 2302} {"train_loss": -6.390103340148926, "global_step": 96690, "epoch": 2302} {"train_loss": -6.401188850402832, "global_step": 96691, "epoch": 2302} {"train_loss": -6.302328109741211, "global_step": 96692, "epoch": 2302} {"train_loss": -6.2831244468688965, "global_step": 96693, "epoch": 2302} {"train_loss": -6.389678955078125, "global_step": 96694, "epoch": 2302} {"train_loss": -6.414422512054443, "global_step": 96695, "epoch": 2302} {"train_loss": -6.428473472595215, "global_step": 96696, "epoch": 2302} {"train_loss": -6.260984420776367, "global_step": 96697, "epoch": 2302} {"train_loss": -6.378291130065918, "global_step": 96698, "epoch": 2302} {"train_loss": -6.200545310974121, "global_step": 96699, "epoch": 2302} {"train_loss": -6.233316898345947, "global_step": 96700, "epoch": 2302} {"train_loss": -6.321887016296387, "global_step": 96701, "epoch": 2302} {"train_loss": -6.2009477615356445, "global_step": 96702, "epoch": 2302} {"train_loss": -6.286659240722656, "global_step": 96703, "epoch": 2302} {"train_loss": -6.1653547286987305, "global_step": 96704, "epoch": 2302} {"train_loss": -6.340308666229248, "global_step": 96705, "epoch": 2302} {"train_loss": -6.2829484939575195, "global_step": 96706, "epoch": 2302} {"train_loss": -6.289043426513672, "global_step": 96707, "epoch": 2302} {"train_loss": -6.289695739746094, "global_step": 96708, "epoch": 2302} {"train_loss": -6.333933353424072, "global_step": 96709, "epoch": 2302} {"train_loss": -6.288444519042969, "global_step": 96710, "epoch": 2302} {"train_loss": -6.1646013259887695, "global_step": 96711, "epoch": 2302} {"train_loss": -6.244159698486328, "global_step": 96712, "epoch": 2302} {"train_loss": -6.2693562507629395, "global_step": 96713, "epoch": 2302} {"train_loss": -6.331287860870361, "global_step": 96714, "epoch": 2302} {"train_loss": -6.338508129119873, "global_step": 96715, "epoch": 2302} {"train_loss": -6.394516468048096, "global_step": 96716, "epoch": 2302} {"train_loss": -6.381922245025635, "global_step": 96717, "epoch": 2302} {"train_loss": -6.304426670074463, "global_step": 96718, "epoch": 2302} {"train_loss": -6.371118068695068, "global_step": 96719, "epoch": 2302} {"train_loss": -6.372369766235352, "global_step": 96720, "epoch": 2302} {"train_loss": -6.114256381988525, "global_step": 96721, "epoch": 2302} {"train_loss": -6.2845258712768555, "global_step": 96722, "epoch": 2302} {"train_loss": -6.2915449142456055, "global_step": 96723, "epoch": 2302} {"train_loss": -6.366399765014648, "global_step": 96724, "epoch": 2302} {"train_loss": -6.314163877850487, "global_step": 96725, "epoch": 2302, "val_loss": 75682.8828125} {"train_loss": -6.281800746917725, "global_step": 96726, "epoch": 2303} {"train_loss": -6.264766693115234, "global_step": 96727, "epoch": 2303} {"train_loss": -6.263485431671143, "global_step": 96728, "epoch": 2303} {"train_loss": -6.270015716552734, "global_step": 96729, "epoch": 2303} {"train_loss": -6.294554233551025, "global_step": 96730, "epoch": 2303} {"train_loss": -6.271814823150635, "global_step": 96731, "epoch": 2303} {"train_loss": -6.324565410614014, "global_step": 96732, "epoch": 2303} {"train_loss": -6.187726974487305, "global_step": 96733, "epoch": 2303} {"train_loss": -6.194453239440918, "global_step": 96734, "epoch": 2303} {"train_loss": -6.2518110275268555, "global_step": 96735, "epoch": 2303} {"train_loss": -6.257894992828369, "global_step": 96736, "epoch": 2303} {"train_loss": -6.337821006774902, "global_step": 96737, "epoch": 2303} {"train_loss": -6.337233066558838, "global_step": 96738, "epoch": 2303} {"train_loss": -6.4834747314453125, "global_step": 96739, "epoch": 2303} {"train_loss": -6.262253761291504, "global_step": 96740, "epoch": 2303} {"train_loss": -6.349063873291016, "global_step": 96741, "epoch": 2303} {"train_loss": -6.345850944519043, "global_step": 96742, "epoch": 2303} {"train_loss": -6.369073867797852, "global_step": 96743, "epoch": 2303} {"train_loss": -6.314708709716797, "global_step": 96744, "epoch": 2303} {"train_loss": -6.328463554382324, "global_step": 96745, "epoch": 2303} {"train_loss": -6.295382499694824, "global_step": 96746, "epoch": 2303} {"train_loss": -6.287930488586426, "global_step": 96747, "epoch": 2303} {"train_loss": -6.400798797607422, "global_step": 96748, "epoch": 2303} {"train_loss": -6.261691570281982, "global_step": 96749, "epoch": 2303} {"train_loss": -6.273159980773926, "global_step": 96750, "epoch": 2303} {"train_loss": -6.353965759277344, "global_step": 96751, "epoch": 2303} {"train_loss": -6.284173965454102, "global_step": 96752, "epoch": 2303} {"train_loss": -6.377750396728516, "global_step": 96753, "epoch": 2303} {"train_loss": -6.282556533813477, "global_step": 96754, "epoch": 2303} {"train_loss": -6.3421478271484375, "global_step": 96755, "epoch": 2303} {"train_loss": -6.383457183837891, "global_step": 96756, "epoch": 2303} {"train_loss": -6.448672294616699, "global_step": 96757, "epoch": 2303} {"train_loss": -6.397366523742676, "global_step": 96758, "epoch": 2303} {"train_loss": -6.357841491699219, "global_step": 96759, "epoch": 2303} {"train_loss": -6.288514137268066, "global_step": 96760, "epoch": 2303} {"train_loss": -6.34920597076416, "global_step": 96761, "epoch": 2303} {"train_loss": -6.520047664642334, "global_step": 96762, "epoch": 2303} {"train_loss": -6.415216445922852, "global_step": 96763, "epoch": 2303} {"train_loss": -6.319326400756836, "global_step": 96764, "epoch": 2303} {"train_loss": -6.345280647277832, "global_step": 96765, "epoch": 2303} {"train_loss": -6.257070064544678, "global_step": 96766, "epoch": 2303} {"train_loss": -6.323582796823411, "global_step": 96767, "epoch": 2303, "val_loss": 75710.984375} {"train_loss": -6.414447784423828, "global_step": 96768, "epoch": 2304} {"train_loss": -6.387972354888916, "global_step": 96769, "epoch": 2304} {"train_loss": -6.3669610023498535, "global_step": 96770, "epoch": 2304} {"train_loss": -6.333410739898682, "global_step": 96771, "epoch": 2304} {"train_loss": -6.236318588256836, "global_step": 96772, "epoch": 2304} {"train_loss": -6.276016712188721, "global_step": 96773, "epoch": 2304} {"train_loss": -6.332468032836914, "global_step": 96774, "epoch": 2304} {"train_loss": -6.434426307678223, "global_step": 96775, "epoch": 2304} {"train_loss": -6.332614421844482, "global_step": 96776, "epoch": 2304} {"train_loss": -6.372563362121582, "global_step": 96777, "epoch": 2304} {"train_loss": -6.20731258392334, "global_step": 96778, "epoch": 2304} {"train_loss": -6.308518409729004, "global_step": 96779, "epoch": 2304} {"train_loss": -6.361436367034912, "global_step": 96780, "epoch": 2304} {"train_loss": -6.473660469055176, "global_step": 96781, "epoch": 2304} {"train_loss": -6.374255657196045, "global_step": 96782, "epoch": 2304} {"train_loss": -6.3076372146606445, "global_step": 96783, "epoch": 2304} {"train_loss": -6.294057846069336, "global_step": 96784, "epoch": 2304} {"train_loss": -6.330479145050049, "global_step": 96785, "epoch": 2304} {"train_loss": -6.374609470367432, "global_step": 96786, "epoch": 2304} {"train_loss": -6.365214824676514, "global_step": 96787, "epoch": 2304} {"train_loss": -6.225900650024414, "global_step": 96788, "epoch": 2304} {"train_loss": -6.229425430297852, "global_step": 96789, "epoch": 2304} {"train_loss": -6.274779796600342, "global_step": 96790, "epoch": 2304} {"train_loss": -6.386100769042969, "global_step": 96791, "epoch": 2304} {"train_loss": -6.28391170501709, "global_step": 96792, "epoch": 2304} {"train_loss": -6.365586757659912, "global_step": 96793, "epoch": 2304} {"train_loss": -6.426684379577637, "global_step": 96794, "epoch": 2304} {"train_loss": -6.294994354248047, "global_step": 96795, "epoch": 2304} {"train_loss": -6.470272064208984, "global_step": 96796, "epoch": 2304} {"train_loss": -6.386474609375, "global_step": 96797, "epoch": 2304} {"train_loss": -6.325362205505371, "global_step": 96798, "epoch": 2304} {"train_loss": -6.410473823547363, "global_step": 96799, "epoch": 2304} {"train_loss": -6.274755954742432, "global_step": 96800, "epoch": 2304} {"train_loss": -6.3661651611328125, "global_step": 96801, "epoch": 2304} {"train_loss": -6.43408727645874, "global_step": 96802, "epoch": 2304} {"train_loss": -6.2916364669799805, "global_step": 96803, "epoch": 2304} {"train_loss": -6.318001747131348, "global_step": 96804, "epoch": 2304} {"train_loss": -6.435480117797852, "global_step": 96805, "epoch": 2304} {"train_loss": -6.383716583251953, "global_step": 96806, "epoch": 2304} {"train_loss": -6.3600382804870605, "global_step": 96807, "epoch": 2304} {"train_loss": -6.266898155212402, "global_step": 96808, "epoch": 2304} {"train_loss": -6.343909695034935, "global_step": 96809, "epoch": 2304, "val_loss": 75762.3046875} {"train_loss": -6.193552017211914, "global_step": 96810, "epoch": 2305} {"train_loss": -6.28023624420166, "global_step": 96811, "epoch": 2305} {"train_loss": -6.388895511627197, "global_step": 96812, "epoch": 2305} {"train_loss": -6.287314414978027, "global_step": 96813, "epoch": 2305} {"train_loss": -6.339791297912598, "global_step": 96814, "epoch": 2305} {"train_loss": -6.226988315582275, "global_step": 96815, "epoch": 2305} {"train_loss": -6.205728530883789, "global_step": 96816, "epoch": 2305} {"train_loss": -6.209720134735107, "global_step": 96817, "epoch": 2305} {"train_loss": -6.2851409912109375, "global_step": 96818, "epoch": 2305} {"train_loss": -6.252327919006348, "global_step": 96819, "epoch": 2305} {"train_loss": -6.272324085235596, "global_step": 96820, "epoch": 2305} {"train_loss": -6.274882793426514, "global_step": 96821, "epoch": 2305} {"train_loss": -6.25277042388916, "global_step": 96822, "epoch": 2305} {"train_loss": -6.246331691741943, "global_step": 96823, "epoch": 2305} {"train_loss": -6.306524276733398, "global_step": 96824, "epoch": 2305} {"train_loss": -6.238626956939697, "global_step": 96825, "epoch": 2305} {"train_loss": -6.2886834144592285, "global_step": 96826, "epoch": 2305} {"train_loss": -6.2965497970581055, "global_step": 96827, "epoch": 2305} {"train_loss": -6.2620697021484375, "global_step": 96828, "epoch": 2305} {"train_loss": -6.323661804199219, "global_step": 96829, "epoch": 2305} {"train_loss": -6.393618583679199, "global_step": 96830, "epoch": 2305} {"train_loss": -6.240744590759277, "global_step": 96831, "epoch": 2305} {"train_loss": -6.272624492645264, "global_step": 96832, "epoch": 2305} {"train_loss": -6.135097503662109, "global_step": 96833, "epoch": 2305} {"train_loss": -6.322563171386719, "global_step": 96834, "epoch": 2305} {"train_loss": -6.408029556274414, "global_step": 96835, "epoch": 2305} {"train_loss": -6.382264614105225, "global_step": 96836, "epoch": 2305} {"train_loss": -6.424455642700195, "global_step": 96837, "epoch": 2305} {"train_loss": -6.258077144622803, "global_step": 96838, "epoch": 2305} {"train_loss": -6.2886505126953125, "global_step": 96839, "epoch": 2305} {"train_loss": -6.294641494750977, "global_step": 96840, "epoch": 2305} {"train_loss": -6.404046058654785, "global_step": 96841, "epoch": 2305} {"train_loss": -6.390733242034912, "global_step": 96842, "epoch": 2305} {"train_loss": -6.43107795715332, "global_step": 96843, "epoch": 2305} {"train_loss": -6.307011604309082, "global_step": 96844, "epoch": 2305} {"train_loss": -6.37082576751709, "global_step": 96845, "epoch": 2305} {"train_loss": -6.3105573654174805, "global_step": 96846, "epoch": 2305} {"train_loss": -6.354547500610352, "global_step": 96847, "epoch": 2305} {"train_loss": -6.411764144897461, "global_step": 96848, "epoch": 2305} {"train_loss": -6.345043182373047, "global_step": 96849, "epoch": 2305} {"train_loss": -6.262096405029297, "global_step": 96850, "epoch": 2305} {"train_loss": -6.306705293201265, "global_step": 96851, "epoch": 2305, "val_loss": 75681.0625} {"train_loss": -6.285407543182373, "global_step": 96852, "epoch": 2306} {"train_loss": -6.243804454803467, "global_step": 96853, "epoch": 2306} {"train_loss": -6.346033096313477, "global_step": 96854, "epoch": 2306} {"train_loss": -6.272771835327148, "global_step": 96855, "epoch": 2306} {"train_loss": -6.310496807098389, "global_step": 96856, "epoch": 2306} {"train_loss": -6.329301834106445, "global_step": 96857, "epoch": 2306} {"train_loss": -6.161797523498535, "global_step": 96858, "epoch": 2306} {"train_loss": -6.301443099975586, "global_step": 96859, "epoch": 2306} {"train_loss": -6.303295135498047, "global_step": 96860, "epoch": 2306} {"train_loss": -6.252185344696045, "global_step": 96861, "epoch": 2306} {"train_loss": -6.266657829284668, "global_step": 96862, "epoch": 2306} {"train_loss": -6.274112701416016, "global_step": 96863, "epoch": 2306} {"train_loss": -6.190746307373047, "global_step": 96864, "epoch": 2306} {"train_loss": -6.23277473449707, "global_step": 96865, "epoch": 2306} {"train_loss": -6.1919145584106445, "global_step": 96866, "epoch": 2306} {"train_loss": -6.156996726989746, "global_step": 96867, "epoch": 2306} {"train_loss": -6.265967845916748, "global_step": 96868, "epoch": 2306} {"train_loss": -6.251776695251465, "global_step": 96869, "epoch": 2306} {"train_loss": -6.275364875793457, "global_step": 96870, "epoch": 2306} {"train_loss": -6.254178047180176, "global_step": 96871, "epoch": 2306} {"train_loss": -6.183070182800293, "global_step": 96872, "epoch": 2306} {"train_loss": -6.286770343780518, "global_step": 96873, "epoch": 2306} {"train_loss": -6.263650894165039, "global_step": 96874, "epoch": 2306} {"train_loss": -6.289775371551514, "global_step": 96875, "epoch": 2306} {"train_loss": -6.253154754638672, "global_step": 96876, "epoch": 2306} {"train_loss": -6.233676910400391, "global_step": 96877, "epoch": 2306} {"train_loss": -6.2708892822265625, "global_step": 96878, "epoch": 2306} {"train_loss": -6.3593292236328125, "global_step": 96879, "epoch": 2306} {"train_loss": -6.401740074157715, "global_step": 96880, "epoch": 2306} {"train_loss": -6.2216691970825195, "global_step": 96881, "epoch": 2306} {"train_loss": -6.331366539001465, "global_step": 96882, "epoch": 2306} {"train_loss": -6.282800197601318, "global_step": 96883, "epoch": 2306} {"train_loss": -6.299821376800537, "global_step": 96884, "epoch": 2306} {"train_loss": -6.378515720367432, "global_step": 96885, "epoch": 2306} {"train_loss": -6.314835548400879, "global_step": 96886, "epoch": 2306} {"train_loss": -6.313276290893555, "global_step": 96887, "epoch": 2306} {"train_loss": -6.378586292266846, "global_step": 96888, "epoch": 2306} {"train_loss": -6.278491973876953, "global_step": 96889, "epoch": 2306} {"train_loss": -6.302811622619629, "global_step": 96890, "epoch": 2306} {"train_loss": -6.276798248291016, "global_step": 96891, "epoch": 2306} {"train_loss": -6.353851318359375, "global_step": 96892, "epoch": 2306} {"train_loss": -6.2802785237630205, "global_step": 96893, "epoch": 2306, "val_loss": 75666.4453125} {"train_loss": -6.337920188903809, "global_step": 96894, "epoch": 2307} {"train_loss": -6.30891752243042, "global_step": 96895, "epoch": 2307} {"train_loss": -6.345625400543213, "global_step": 96896, "epoch": 2307} {"train_loss": -6.2630157470703125, "global_step": 96897, "epoch": 2307} {"train_loss": -6.474846363067627, "global_step": 96898, "epoch": 2307} {"train_loss": -6.300737380981445, "global_step": 96899, "epoch": 2307} {"train_loss": -6.348502159118652, "global_step": 96900, "epoch": 2307} {"train_loss": -6.368130683898926, "global_step": 96901, "epoch": 2307} {"train_loss": -6.2867231369018555, "global_step": 96902, "epoch": 2307} {"train_loss": -6.346033096313477, "global_step": 96903, "epoch": 2307} {"train_loss": -6.324581146240234, "global_step": 96904, "epoch": 2307} {"train_loss": -6.365310192108154, "global_step": 96905, "epoch": 2307} {"train_loss": -6.333274841308594, "global_step": 96906, "epoch": 2307} {"train_loss": -6.310110092163086, "global_step": 96907, "epoch": 2307} {"train_loss": -6.429007530212402, "global_step": 96908, "epoch": 2307} {"train_loss": -6.2319746017456055, "global_step": 96909, "epoch": 2307} {"train_loss": -6.308786869049072, "global_step": 96910, "epoch": 2307} {"train_loss": -6.414249420166016, "global_step": 96911, "epoch": 2307} {"train_loss": -6.308834075927734, "global_step": 96912, "epoch": 2307} {"train_loss": -6.39463472366333, "global_step": 96913, "epoch": 2307} {"train_loss": -6.278573989868164, "global_step": 96914, "epoch": 2307} {"train_loss": -6.289441108703613, "global_step": 96915, "epoch": 2307} {"train_loss": -6.365540504455566, "global_step": 96916, "epoch": 2307} {"train_loss": -6.247071743011475, "global_step": 96917, "epoch": 2307} {"train_loss": -6.330112457275391, "global_step": 96918, "epoch": 2307} {"train_loss": -6.312342643737793, "global_step": 96919, "epoch": 2307} {"train_loss": -6.401308059692383, "global_step": 96920, "epoch": 2307} {"train_loss": -6.323878288269043, "global_step": 96921, "epoch": 2307} {"train_loss": -6.352967739105225, "global_step": 96922, "epoch": 2307} {"train_loss": -6.305544853210449, "global_step": 96923, "epoch": 2307} {"train_loss": -6.271015644073486, "global_step": 96924, "epoch": 2307} {"train_loss": -6.325615882873535, "global_step": 96925, "epoch": 2307} {"train_loss": -6.190442085266113, "global_step": 96926, "epoch": 2307} {"train_loss": -6.242457866668701, "global_step": 96927, "epoch": 2307} {"train_loss": -6.31941556930542, "global_step": 96928, "epoch": 2307} {"train_loss": -6.286956787109375, "global_step": 96929, "epoch": 2307} {"train_loss": -6.297442436218262, "global_step": 96930, "epoch": 2307} {"train_loss": -6.280269622802734, "global_step": 96931, "epoch": 2307} {"train_loss": -6.209720611572266, "global_step": 96932, "epoch": 2307} {"train_loss": -6.305131912231445, "global_step": 96933, "epoch": 2307} {"train_loss": -6.323731899261475, "global_step": 96934, "epoch": 2307} {"train_loss": -6.3159233047848655, "global_step": 96935, "epoch": 2307, "val_loss": 75510.9453125} {"train_loss": -6.274661064147949, "global_step": 96936, "epoch": 2308} {"train_loss": -6.217256546020508, "global_step": 96937, "epoch": 2308} {"train_loss": -6.331845760345459, "global_step": 96938, "epoch": 2308} {"train_loss": -6.34294319152832, "global_step": 96939, "epoch": 2308} {"train_loss": -6.192648410797119, "global_step": 96940, "epoch": 2308} {"train_loss": -6.194422721862793, "global_step": 96941, "epoch": 2308} {"train_loss": -6.281366348266602, "global_step": 96942, "epoch": 2308} {"train_loss": -6.162545680999756, "global_step": 96943, "epoch": 2308} {"train_loss": -6.286935806274414, "global_step": 96944, "epoch": 2308} {"train_loss": -6.117337226867676, "global_step": 96945, "epoch": 2308} {"train_loss": -6.215073585510254, "global_step": 96946, "epoch": 2308} {"train_loss": -6.018522262573242, "global_step": 96947, "epoch": 2308} {"train_loss": -6.2176103591918945, "global_step": 96948, "epoch": 2308} {"train_loss": -6.300048351287842, "global_step": 96949, "epoch": 2308} {"train_loss": -6.065749645233154, "global_step": 96950, "epoch": 2308} {"train_loss": -6.226709842681885, "global_step": 96951, "epoch": 2308} {"train_loss": -6.065734386444092, "global_step": 96952, "epoch": 2308} {"train_loss": -6.277278900146484, "global_step": 96953, "epoch": 2308} {"train_loss": -6.218717098236084, "global_step": 96954, "epoch": 2308} {"train_loss": -6.22421932220459, "global_step": 96955, "epoch": 2308} {"train_loss": -6.217019081115723, "global_step": 96956, "epoch": 2308} {"train_loss": -6.198061943054199, "global_step": 96957, "epoch": 2308} {"train_loss": -6.2229743003845215, "global_step": 96958, "epoch": 2308} {"train_loss": -6.374829292297363, "global_step": 96959, "epoch": 2308} {"train_loss": -6.1226348876953125, "global_step": 96960, "epoch": 2308} {"train_loss": -6.31056022644043, "global_step": 96961, "epoch": 2308} {"train_loss": -6.2671380043029785, "global_step": 96962, "epoch": 2308} {"train_loss": -6.348369121551514, "global_step": 96963, "epoch": 2308} {"train_loss": -6.176175117492676, "global_step": 96964, "epoch": 2308} {"train_loss": -6.322268486022949, "global_step": 96965, "epoch": 2308} {"train_loss": -6.298430442810059, "global_step": 96966, "epoch": 2308} {"train_loss": -6.33290433883667, "global_step": 96967, "epoch": 2308} {"train_loss": -6.226339340209961, "global_step": 96968, "epoch": 2308} {"train_loss": -6.207456111907959, "global_step": 96969, "epoch": 2308} {"train_loss": -6.443162441253662, "global_step": 96970, "epoch": 2308} {"train_loss": -6.162345886230469, "global_step": 96971, "epoch": 2308} {"train_loss": -6.272201061248779, "global_step": 96972, "epoch": 2308} {"train_loss": -6.237567901611328, "global_step": 96973, "epoch": 2308} {"train_loss": -6.3038740158081055, "global_step": 96974, "epoch": 2308} {"train_loss": -6.404661178588867, "global_step": 96975, "epoch": 2308} {"train_loss": -6.271791458129883, "global_step": 96976, "epoch": 2308} {"train_loss": -6.246243669873192, "global_step": 96977, "epoch": 2308, "val_loss": 75595.8984375} {"train_loss": -6.357476711273193, "global_step": 96978, "epoch": 2309} {"train_loss": -6.2956085205078125, "global_step": 96979, "epoch": 2309} {"train_loss": -6.417596817016602, "global_step": 96980, "epoch": 2309} {"train_loss": -6.284911632537842, "global_step": 96981, "epoch": 2309} {"train_loss": -6.331429481506348, "global_step": 96982, "epoch": 2309} {"train_loss": -6.458503246307373, "global_step": 96983, "epoch": 2309} {"train_loss": -6.301111698150635, "global_step": 96984, "epoch": 2309} {"train_loss": -6.326380729675293, "global_step": 96985, "epoch": 2309} {"train_loss": -6.377397537231445, "global_step": 96986, "epoch": 2309} {"train_loss": -6.402758598327637, "global_step": 96987, "epoch": 2309} {"train_loss": -6.394023895263672, "global_step": 96988, "epoch": 2309} {"train_loss": -6.345337867736816, "global_step": 96989, "epoch": 2309} {"train_loss": -6.329611778259277, "global_step": 96990, "epoch": 2309} {"train_loss": -6.425779342651367, "global_step": 96991, "epoch": 2309} {"train_loss": -6.37516450881958, "global_step": 96992, "epoch": 2309} {"train_loss": -6.44046688079834, "global_step": 96993, "epoch": 2309} {"train_loss": -6.306184768676758, "global_step": 96994, "epoch": 2309} {"train_loss": -6.359687328338623, "global_step": 96995, "epoch": 2309} {"train_loss": -6.374629974365234, "global_step": 96996, "epoch": 2309} {"train_loss": -6.324127197265625, "global_step": 96997, "epoch": 2309} {"train_loss": -6.329643249511719, "global_step": 96998, "epoch": 2309} {"train_loss": -6.439462184906006, "global_step": 96999, "epoch": 2309} {"train_loss": -6.385078430175781, "global_step": 97000, "epoch": 2309} {"train_loss": -6.38378381729126, "global_step": 97001, "epoch": 2309} {"train_loss": -6.352926254272461, "global_step": 97002, "epoch": 2309} {"train_loss": -6.259696960449219, "global_step": 97003, "epoch": 2309} {"train_loss": -6.238125801086426, "global_step": 97004, "epoch": 2309} {"train_loss": -6.352962493896484, "global_step": 97005, "epoch": 2309} {"train_loss": -6.332114219665527, "global_step": 97006, "epoch": 2309} {"train_loss": -6.375864028930664, "global_step": 97007, "epoch": 2309} {"train_loss": -6.270053863525391, "global_step": 97008, "epoch": 2309} {"train_loss": -6.36500358581543, "global_step": 97009, "epoch": 2309} {"train_loss": -6.283775806427002, "global_step": 97010, "epoch": 2309} {"train_loss": -6.263382911682129, "global_step": 97011, "epoch": 2309} {"train_loss": -6.318721771240234, "global_step": 97012, "epoch": 2309} {"train_loss": -6.314321517944336, "global_step": 97013, "epoch": 2309} {"train_loss": -6.352386474609375, "global_step": 97014, "epoch": 2309} {"train_loss": -6.1289963722229, "global_step": 97015, "epoch": 2309} {"train_loss": -6.375657558441162, "global_step": 97016, "epoch": 2309} {"train_loss": -6.393592834472656, "global_step": 97017, "epoch": 2309} {"train_loss": -6.32414436340332, "global_step": 97018, "epoch": 2309} {"train_loss": -6.343789577484131, "global_step": 97019, "epoch": 2309, "val_loss": 75810.546875} {"train_loss": -6.234631538391113, "global_step": 97020, "epoch": 2310} {"train_loss": -6.132687091827393, "global_step": 97021, "epoch": 2310} {"train_loss": -6.30404806137085, "global_step": 97022, "epoch": 2310} {"train_loss": -6.397480010986328, "global_step": 97023, "epoch": 2310} {"train_loss": -6.414841651916504, "global_step": 97024, "epoch": 2310} {"train_loss": -6.213228225708008, "global_step": 97025, "epoch": 2310} {"train_loss": -6.18772029876709, "global_step": 97026, "epoch": 2310} {"train_loss": -6.312467575073242, "global_step": 97027, "epoch": 2310} {"train_loss": -6.368444442749023, "global_step": 97028, "epoch": 2310} {"train_loss": -6.382282257080078, "global_step": 97029, "epoch": 2310} {"train_loss": -6.331987380981445, "global_step": 97030, "epoch": 2310} {"train_loss": -6.390128135681152, "global_step": 97031, "epoch": 2310} {"train_loss": -6.41847038269043, "global_step": 97032, "epoch": 2310} {"train_loss": -6.390167713165283, "global_step": 97033, "epoch": 2310} {"train_loss": -6.356484889984131, "global_step": 97034, "epoch": 2310} {"train_loss": -6.425213813781738, "global_step": 97035, "epoch": 2310} {"train_loss": -6.364246845245361, "global_step": 97036, "epoch": 2310} {"train_loss": -6.430331230163574, "global_step": 97037, "epoch": 2310} {"train_loss": -6.346795082092285, "global_step": 97038, "epoch": 2310} {"train_loss": -6.341141223907471, "global_step": 97039, "epoch": 2310} {"train_loss": -6.341573715209961, "global_step": 97040, "epoch": 2310} {"train_loss": -6.320780277252197, "global_step": 97041, "epoch": 2310} {"train_loss": -6.276084899902344, "global_step": 97042, "epoch": 2310} {"train_loss": -6.257255554199219, "global_step": 97043, "epoch": 2310} {"train_loss": -6.358150959014893, "global_step": 97044, "epoch": 2310} {"train_loss": -6.4128007888793945, "global_step": 97045, "epoch": 2310} {"train_loss": -6.27261209487915, "global_step": 97046, "epoch": 2310} {"train_loss": -6.359111785888672, "global_step": 97047, "epoch": 2310} {"train_loss": -6.355934143066406, "global_step": 97048, "epoch": 2310} {"train_loss": -6.283084392547607, "global_step": 97049, "epoch": 2310} {"train_loss": -6.274419784545898, "global_step": 97050, "epoch": 2310} {"train_loss": -6.340036392211914, "global_step": 97051, "epoch": 2310} {"train_loss": -6.204601764678955, "global_step": 97052, "epoch": 2310} {"train_loss": -6.325503349304199, "global_step": 97053, "epoch": 2310} {"train_loss": -6.310769081115723, "global_step": 97054, "epoch": 2310} {"train_loss": -6.34214973449707, "global_step": 97055, "epoch": 2310} {"train_loss": -6.400188446044922, "global_step": 97056, "epoch": 2310} {"train_loss": -6.336119651794434, "global_step": 97057, "epoch": 2310} {"train_loss": -6.331286430358887, "global_step": 97058, "epoch": 2310} {"train_loss": -6.403538227081299, "global_step": 97059, "epoch": 2310} {"train_loss": -6.2788543701171875, "global_step": 97060, "epoch": 2310} {"train_loss": -6.332747107460385, "global_step": 97061, "epoch": 2310, "val_loss": 75594.4140625} {"train_loss": -6.365884780883789, "global_step": 97062, "epoch": 2311} {"train_loss": -6.429863929748535, "global_step": 97063, "epoch": 2311} {"train_loss": -6.298912048339844, "global_step": 97064, "epoch": 2311} {"train_loss": -6.406241416931152, "global_step": 97065, "epoch": 2311} {"train_loss": -6.297550678253174, "global_step": 97066, "epoch": 2311} {"train_loss": -6.4186224937438965, "global_step": 97067, "epoch": 2311} {"train_loss": -6.4613447189331055, "global_step": 97068, "epoch": 2311} {"train_loss": -6.142640590667725, "global_step": 97069, "epoch": 2311} {"train_loss": -6.365522861480713, "global_step": 97070, "epoch": 2311} {"train_loss": -6.298550128936768, "global_step": 97071, "epoch": 2311} {"train_loss": -6.405851364135742, "global_step": 97072, "epoch": 2311} {"train_loss": -6.268649101257324, "global_step": 97073, "epoch": 2311} {"train_loss": -6.289638042449951, "global_step": 97074, "epoch": 2311} {"train_loss": -6.420775890350342, "global_step": 97075, "epoch": 2311} {"train_loss": -6.309858322143555, "global_step": 97076, "epoch": 2311} {"train_loss": -6.284661769866943, "global_step": 97077, "epoch": 2311} {"train_loss": -6.340579032897949, "global_step": 97078, "epoch": 2311} {"train_loss": -6.418468475341797, "global_step": 97079, "epoch": 2311} {"train_loss": -6.28120231628418, "global_step": 97080, "epoch": 2311} {"train_loss": -6.3967204093933105, "global_step": 97081, "epoch": 2311} {"train_loss": -6.361510753631592, "global_step": 97082, "epoch": 2311} {"train_loss": -6.305696487426758, "global_step": 97083, "epoch": 2311} {"train_loss": -6.403136730194092, "global_step": 97084, "epoch": 2311} {"train_loss": -6.331182479858398, "global_step": 97085, "epoch": 2311} {"train_loss": -6.337888717651367, "global_step": 97086, "epoch": 2311} {"train_loss": -6.293850898742676, "global_step": 97087, "epoch": 2311} {"train_loss": -6.280991554260254, "global_step": 97088, "epoch": 2311} {"train_loss": -6.377522945404053, "global_step": 97089, "epoch": 2311} {"train_loss": -6.248303413391113, "global_step": 97090, "epoch": 2311} {"train_loss": -6.283647537231445, "global_step": 97091, "epoch": 2311} {"train_loss": -6.3965911865234375, "global_step": 97092, "epoch": 2311} {"train_loss": -6.363280296325684, "global_step": 97093, "epoch": 2311} {"train_loss": -6.415319442749023, "global_step": 97094, "epoch": 2311} {"train_loss": -6.339911937713623, "global_step": 97095, "epoch": 2311} {"train_loss": -6.261412620544434, "global_step": 97096, "epoch": 2311} {"train_loss": -6.252880573272705, "global_step": 97097, "epoch": 2311} {"train_loss": -6.165390491485596, "global_step": 97098, "epoch": 2311} {"train_loss": -6.460634231567383, "global_step": 97099, "epoch": 2311} {"train_loss": -6.2371649742126465, "global_step": 97100, "epoch": 2311} {"train_loss": -6.2096710205078125, "global_step": 97101, "epoch": 2311} {"train_loss": -6.253269672393799, "global_step": 97102, "epoch": 2311} {"train_loss": -6.329131921132405, "global_step": 97103, "epoch": 2311, "val_loss": 75665.4765625} {"train_loss": -6.295365333557129, "global_step": 97104, "epoch": 2312} {"train_loss": -6.253350257873535, "global_step": 97105, "epoch": 2312} {"train_loss": -6.340458869934082, "global_step": 97106, "epoch": 2312} {"train_loss": -6.248255729675293, "global_step": 97107, "epoch": 2312} {"train_loss": -6.335808753967285, "global_step": 97108, "epoch": 2312} {"train_loss": -6.173295021057129, "global_step": 97109, "epoch": 2312} {"train_loss": -6.026801109313965, "global_step": 97110, "epoch": 2312} {"train_loss": -6.2563676834106445, "global_step": 97111, "epoch": 2312} {"train_loss": -6.158625602722168, "global_step": 97112, "epoch": 2312} {"train_loss": -6.1442551612854, "global_step": 97113, "epoch": 2312} {"train_loss": -6.1907477378845215, "global_step": 97114, "epoch": 2312} {"train_loss": -6.283047676086426, "global_step": 97115, "epoch": 2312} {"train_loss": -6.344862461090088, "global_step": 97116, "epoch": 2312} {"train_loss": -6.276601314544678, "global_step": 97117, "epoch": 2312} {"train_loss": -6.184417724609375, "global_step": 97118, "epoch": 2312} {"train_loss": -6.209986686706543, "global_step": 97119, "epoch": 2312} {"train_loss": -6.161870956420898, "global_step": 97120, "epoch": 2312} {"train_loss": -6.097001075744629, "global_step": 97121, "epoch": 2312} {"train_loss": -6.18868350982666, "global_step": 97122, "epoch": 2312} {"train_loss": -6.254560470581055, "global_step": 97123, "epoch": 2312} {"train_loss": -6.202127456665039, "global_step": 97124, "epoch": 2312} {"train_loss": -6.273677825927734, "global_step": 97125, "epoch": 2312} {"train_loss": -6.09274959564209, "global_step": 97126, "epoch": 2312} {"train_loss": -6.2292866706848145, "global_step": 97127, "epoch": 2312} {"train_loss": -6.330142498016357, "global_step": 97128, "epoch": 2312} {"train_loss": -6.362392425537109, "global_step": 97129, "epoch": 2312} {"train_loss": -6.259284019470215, "global_step": 97130, "epoch": 2312} {"train_loss": -6.207355976104736, "global_step": 97131, "epoch": 2312} {"train_loss": -6.230588912963867, "global_step": 97132, "epoch": 2312} {"train_loss": -6.339781761169434, "global_step": 97133, "epoch": 2312} {"train_loss": -6.185807704925537, "global_step": 97134, "epoch": 2312} {"train_loss": -6.301365852355957, "global_step": 97135, "epoch": 2312} {"train_loss": -6.266083717346191, "global_step": 97136, "epoch": 2312} {"train_loss": -6.275819778442383, "global_step": 97137, "epoch": 2312} {"train_loss": -6.25900936126709, "global_step": 97138, "epoch": 2312} {"train_loss": -6.370580673217773, "global_step": 97139, "epoch": 2312} {"train_loss": -6.256299018859863, "global_step": 97140, "epoch": 2312} {"train_loss": -6.244941234588623, "global_step": 97141, "epoch": 2312} {"train_loss": -6.2793426513671875, "global_step": 97142, "epoch": 2312} {"train_loss": -6.333795070648193, "global_step": 97143, "epoch": 2312} {"train_loss": -6.3393964767456055, "global_step": 97144, "epoch": 2312} {"train_loss": -6.248549813315982, "global_step": 97145, "epoch": 2312, "val_loss": 75440.0078125} {"train_loss": -6.2622222900390625, "global_step": 97146, "epoch": 2313} {"train_loss": -6.280793190002441, "global_step": 97147, "epoch": 2313} {"train_loss": -6.399479866027832, "global_step": 97148, "epoch": 2313} {"train_loss": -6.38715124130249, "global_step": 97149, "epoch": 2313} {"train_loss": -6.430737495422363, "global_step": 97150, "epoch": 2313} {"train_loss": -6.274444580078125, "global_step": 97151, "epoch": 2313} {"train_loss": -6.367814064025879, "global_step": 97152, "epoch": 2313} {"train_loss": -6.317516803741455, "global_step": 97153, "epoch": 2313} {"train_loss": -6.374469757080078, "global_step": 97154, "epoch": 2313} {"train_loss": -6.325603008270264, "global_step": 97155, "epoch": 2313} {"train_loss": -6.283121109008789, "global_step": 97156, "epoch": 2313} {"train_loss": -6.3345842361450195, "global_step": 97157, "epoch": 2313} {"train_loss": -6.232325553894043, "global_step": 97158, "epoch": 2313} {"train_loss": -6.37253475189209, "global_step": 97159, "epoch": 2313} {"train_loss": -6.29323148727417, "global_step": 97160, "epoch": 2313} {"train_loss": -6.3237690925598145, "global_step": 97161, "epoch": 2313} {"train_loss": -6.306945323944092, "global_step": 97162, "epoch": 2313} {"train_loss": -6.43351936340332, "global_step": 97163, "epoch": 2313} {"train_loss": -6.362439155578613, "global_step": 97164, "epoch": 2313} {"train_loss": -6.3526930809021, "global_step": 97165, "epoch": 2313} {"train_loss": -6.246611595153809, "global_step": 97166, "epoch": 2313} {"train_loss": -6.389438629150391, "global_step": 97167, "epoch": 2313} {"train_loss": -6.309042453765869, "global_step": 97168, "epoch": 2313} {"train_loss": -6.321569442749023, "global_step": 97169, "epoch": 2313} {"train_loss": -6.297552108764648, "global_step": 97170, "epoch": 2313} {"train_loss": -6.2991461753845215, "global_step": 97171, "epoch": 2313} {"train_loss": -6.34990930557251, "global_step": 97172, "epoch": 2313} {"train_loss": -6.321796417236328, "global_step": 97173, "epoch": 2313} {"train_loss": -6.3213934898376465, "global_step": 97174, "epoch": 2313} {"train_loss": -6.398288726806641, "global_step": 97175, "epoch": 2313} {"train_loss": -6.354518413543701, "global_step": 97176, "epoch": 2313} {"train_loss": -6.442076683044434, "global_step": 97177, "epoch": 2313} {"train_loss": -6.316549301147461, "global_step": 97178, "epoch": 2313} {"train_loss": -6.2900543212890625, "global_step": 97179, "epoch": 2313} {"train_loss": -6.327439785003662, "global_step": 97180, "epoch": 2313} {"train_loss": -6.376681327819824, "global_step": 97181, "epoch": 2313} {"train_loss": -6.380685329437256, "global_step": 97182, "epoch": 2313} {"train_loss": -6.321788787841797, "global_step": 97183, "epoch": 2313} {"train_loss": -6.2614545822143555, "global_step": 97184, "epoch": 2313} {"train_loss": -6.41028356552124, "global_step": 97185, "epoch": 2313} {"train_loss": -6.455287933349609, "global_step": 97186, "epoch": 2313} {"train_loss": -6.342623778751919, "global_step": 97187, "epoch": 2313, "val_loss": 75764.7578125} {"train_loss": -6.385536193847656, "global_step": 97188, "epoch": 2314} {"train_loss": -6.372535705566406, "global_step": 97189, "epoch": 2314} {"train_loss": -6.340977668762207, "global_step": 97190, "epoch": 2314} {"train_loss": -6.3316216468811035, "global_step": 97191, "epoch": 2314} {"train_loss": -6.2686076164245605, "global_step": 97192, "epoch": 2314} {"train_loss": -6.203177452087402, "global_step": 97193, "epoch": 2314} {"train_loss": -6.311715602874756, "global_step": 97194, "epoch": 2314} {"train_loss": -6.298196792602539, "global_step": 97195, "epoch": 2314} {"train_loss": -6.07240104675293, "global_step": 97196, "epoch": 2314} {"train_loss": -6.282759666442871, "global_step": 97197, "epoch": 2314} {"train_loss": -6.311796188354492, "global_step": 97198, "epoch": 2314} {"train_loss": -6.220402717590332, "global_step": 97199, "epoch": 2314} {"train_loss": -6.250063896179199, "global_step": 97200, "epoch": 2314} {"train_loss": -6.325213432312012, "global_step": 97201, "epoch": 2314} {"train_loss": -6.29449462890625, "global_step": 97202, "epoch": 2314} {"train_loss": -6.36112117767334, "global_step": 97203, "epoch": 2314} {"train_loss": -6.238858222961426, "global_step": 97204, "epoch": 2314} {"train_loss": -6.3344292640686035, "global_step": 97205, "epoch": 2314} {"train_loss": -6.227705955505371, "global_step": 97206, "epoch": 2314} {"train_loss": -6.294820785522461, "global_step": 97207, "epoch": 2314} {"train_loss": -6.3151679039001465, "global_step": 97208, "epoch": 2314} {"train_loss": -6.274483680725098, "global_step": 97209, "epoch": 2314} {"train_loss": -6.368817329406738, "global_step": 97210, "epoch": 2314} {"train_loss": -6.4122209548950195, "global_step": 97211, "epoch": 2314} {"train_loss": -6.367143154144287, "global_step": 97212, "epoch": 2314} {"train_loss": -6.181512355804443, "global_step": 97213, "epoch": 2314} {"train_loss": -6.22175407409668, "global_step": 97214, "epoch": 2314} {"train_loss": -6.317197322845459, "global_step": 97215, "epoch": 2314} {"train_loss": -6.214166164398193, "global_step": 97216, "epoch": 2314} {"train_loss": -6.232918739318848, "global_step": 97217, "epoch": 2314} {"train_loss": -6.241795539855957, "global_step": 97218, "epoch": 2314} {"train_loss": -6.22747802734375, "global_step": 97219, "epoch": 2314} {"train_loss": -6.316641807556152, "global_step": 97220, "epoch": 2314} {"train_loss": -6.214297771453857, "global_step": 97221, "epoch": 2314} {"train_loss": -6.31357479095459, "global_step": 97222, "epoch": 2314} {"train_loss": -6.214728355407715, "global_step": 97223, "epoch": 2314} {"train_loss": -6.228512763977051, "global_step": 97224, "epoch": 2314} {"train_loss": -6.283553123474121, "global_step": 97225, "epoch": 2314} {"train_loss": -6.395176887512207, "global_step": 97226, "epoch": 2314} {"train_loss": -6.336469650268555, "global_step": 97227, "epoch": 2314} {"train_loss": -6.351836681365967, "global_step": 97228, "epoch": 2314} {"train_loss": -6.287873358953567, "global_step": 97229, "epoch": 2314, "val_loss": 75725.3515625} {"train_loss": -6.29559326171875, "global_step": 97230, "epoch": 2315} {"train_loss": -6.391726493835449, "global_step": 97231, "epoch": 2315} {"train_loss": -6.262346267700195, "global_step": 97232, "epoch": 2315} {"train_loss": -6.37343692779541, "global_step": 97233, "epoch": 2315} {"train_loss": -6.29515266418457, "global_step": 97234, "epoch": 2315} {"train_loss": -6.264257907867432, "global_step": 97235, "epoch": 2315} {"train_loss": -6.3692097663879395, "global_step": 97236, "epoch": 2315} {"train_loss": -6.311712265014648, "global_step": 97237, "epoch": 2315} {"train_loss": -6.420440673828125, "global_step": 97238, "epoch": 2315} {"train_loss": -6.268771171569824, "global_step": 97239, "epoch": 2315} {"train_loss": -6.362860679626465, "global_step": 97240, "epoch": 2315} {"train_loss": -6.312582492828369, "global_step": 97241, "epoch": 2315} {"train_loss": -6.441964149475098, "global_step": 97242, "epoch": 2315} {"train_loss": -6.378053665161133, "global_step": 97243, "epoch": 2315} {"train_loss": -6.3114013671875, "global_step": 97244, "epoch": 2315} {"train_loss": -6.190659046173096, "global_step": 97245, "epoch": 2315} {"train_loss": -6.341498851776123, "global_step": 97246, "epoch": 2315} {"train_loss": -6.343500137329102, "global_step": 97247, "epoch": 2315} {"train_loss": -6.380167007446289, "global_step": 97248, "epoch": 2315} {"train_loss": -6.3044114112854, "global_step": 97249, "epoch": 2315} {"train_loss": -6.447516441345215, "global_step": 97250, "epoch": 2315} {"train_loss": -6.286629676818848, "global_step": 97251, "epoch": 2315} {"train_loss": -6.329941749572754, "global_step": 97252, "epoch": 2315} {"train_loss": -6.21412992477417, "global_step": 97253, "epoch": 2315} {"train_loss": -6.334557056427002, "global_step": 97254, "epoch": 2315} {"train_loss": -6.283692836761475, "global_step": 97255, "epoch": 2315} {"train_loss": -6.349245548248291, "global_step": 97256, "epoch": 2315} {"train_loss": -6.464582443237305, "global_step": 97257, "epoch": 2315} {"train_loss": -6.2646965980529785, "global_step": 97258, "epoch": 2315} {"train_loss": -6.360588550567627, "global_step": 97259, "epoch": 2315} {"train_loss": -6.293818950653076, "global_step": 97260, "epoch": 2315} {"train_loss": -6.294776916503906, "global_step": 97261, "epoch": 2315} {"train_loss": -6.3671135902404785, "global_step": 97262, "epoch": 2315} {"train_loss": -6.315942764282227, "global_step": 97263, "epoch": 2315} {"train_loss": -6.3323750495910645, "global_step": 97264, "epoch": 2315} {"train_loss": -6.248262405395508, "global_step": 97265, "epoch": 2315} {"train_loss": -6.212704658508301, "global_step": 97266, "epoch": 2315} {"train_loss": -6.278090000152588, "global_step": 97267, "epoch": 2315} {"train_loss": -6.116451740264893, "global_step": 97268, "epoch": 2315} {"train_loss": -6.3351640701293945, "global_step": 97269, "epoch": 2315} {"train_loss": -6.200649261474609, "global_step": 97270, "epoch": 2315} {"train_loss": -6.315655901318505, "global_step": 97271, "epoch": 2315, "val_loss": 76012.109375} {"train_loss": -6.273777008056641, "global_step": 97272, "epoch": 2316} {"train_loss": -6.37291145324707, "global_step": 97273, "epoch": 2316} {"train_loss": -6.271377086639404, "global_step": 97274, "epoch": 2316} {"train_loss": -6.236108303070068, "global_step": 97275, "epoch": 2316} {"train_loss": -6.379072189331055, "global_step": 97276, "epoch": 2316} {"train_loss": -6.283795356750488, "global_step": 97277, "epoch": 2316} {"train_loss": -6.305013179779053, "global_step": 97278, "epoch": 2316} {"train_loss": -6.319416046142578, "global_step": 97279, "epoch": 2316} {"train_loss": -6.287264823913574, "global_step": 97280, "epoch": 2316} {"train_loss": -6.390028476715088, "global_step": 97281, "epoch": 2316} {"train_loss": -6.278010368347168, "global_step": 97282, "epoch": 2316} {"train_loss": -6.409000396728516, "global_step": 97283, "epoch": 2316} {"train_loss": -6.291594505310059, "global_step": 97284, "epoch": 2316} {"train_loss": -6.255616188049316, "global_step": 97285, "epoch": 2316} {"train_loss": -6.372811317443848, "global_step": 97286, "epoch": 2316} {"train_loss": -6.250462532043457, "global_step": 97287, "epoch": 2316} {"train_loss": -6.228189468383789, "global_step": 97288, "epoch": 2316} {"train_loss": -6.2000837326049805, "global_step": 97289, "epoch": 2316} {"train_loss": -6.328035831451416, "global_step": 97290, "epoch": 2316} {"train_loss": -6.337854385375977, "global_step": 97291, "epoch": 2316} {"train_loss": -6.292953968048096, "global_step": 97292, "epoch": 2316} {"train_loss": -6.4147186279296875, "global_step": 97293, "epoch": 2316} {"train_loss": -6.3410139083862305, "global_step": 97294, "epoch": 2316} {"train_loss": -6.353379726409912, "global_step": 97295, "epoch": 2316} {"train_loss": -6.227932929992676, "global_step": 97296, "epoch": 2316} {"train_loss": -6.321009635925293, "global_step": 97297, "epoch": 2316} {"train_loss": -6.440832138061523, "global_step": 97298, "epoch": 2316} {"train_loss": -6.2632222175598145, "global_step": 97299, "epoch": 2316} {"train_loss": -6.3284759521484375, "global_step": 97300, "epoch": 2316} {"train_loss": -6.4341583251953125, "global_step": 97301, "epoch": 2316} {"train_loss": -6.30631685256958, "global_step": 97302, "epoch": 2316} {"train_loss": -6.325442314147949, "global_step": 97303, "epoch": 2316} {"train_loss": -6.344134330749512, "global_step": 97304, "epoch": 2316} {"train_loss": -6.35349178314209, "global_step": 97305, "epoch": 2316} {"train_loss": -6.398327827453613, "global_step": 97306, "epoch": 2316} {"train_loss": -6.3594160079956055, "global_step": 97307, "epoch": 2316} {"train_loss": -6.4000654220581055, "global_step": 97308, "epoch": 2316} {"train_loss": -6.2837982177734375, "global_step": 97309, "epoch": 2316} {"train_loss": -6.3813276290893555, "global_step": 97310, "epoch": 2316} {"train_loss": -6.280673980712891, "global_step": 97311, "epoch": 2316} {"train_loss": -6.437094688415527, "global_step": 97312, "epoch": 2316} {"train_loss": -6.32788101832072, "global_step": 97313, "epoch": 2316, "val_loss": 75586.1953125} {"train_loss": -6.321864128112793, "global_step": 97314, "epoch": 2317} {"train_loss": -6.355459213256836, "global_step": 97315, "epoch": 2317} {"train_loss": -6.323934555053711, "global_step": 97316, "epoch": 2317} {"train_loss": -6.335204124450684, "global_step": 97317, "epoch": 2317} {"train_loss": -6.366674423217773, "global_step": 97318, "epoch": 2317} {"train_loss": -6.262676239013672, "global_step": 97319, "epoch": 2317} {"train_loss": -6.236437797546387, "global_step": 97320, "epoch": 2317} {"train_loss": -6.226629257202148, "global_step": 97321, "epoch": 2317} {"train_loss": -6.385521411895752, "global_step": 97322, "epoch": 2317} {"train_loss": -6.413203239440918, "global_step": 97323, "epoch": 2317} {"train_loss": -6.386425018310547, "global_step": 97324, "epoch": 2317} {"train_loss": -6.449139595031738, "global_step": 97325, "epoch": 2317} {"train_loss": -6.331021308898926, "global_step": 97326, "epoch": 2317} {"train_loss": -6.361588001251221, "global_step": 97327, "epoch": 2317} {"train_loss": -6.3963212966918945, "global_step": 97328, "epoch": 2317} {"train_loss": -6.427013874053955, "global_step": 97329, "epoch": 2317} {"train_loss": -6.375235557556152, "global_step": 97330, "epoch": 2317} {"train_loss": -6.354353904724121, "global_step": 97331, "epoch": 2317} {"train_loss": -6.405956268310547, "global_step": 97332, "epoch": 2317} {"train_loss": -6.417402267456055, "global_step": 97333, "epoch": 2317} {"train_loss": -6.449568748474121, "global_step": 97334, "epoch": 2317} {"train_loss": -6.302948951721191, "global_step": 97335, "epoch": 2317} {"train_loss": -6.402560234069824, "global_step": 97336, "epoch": 2317} {"train_loss": -6.386922836303711, "global_step": 97337, "epoch": 2317} {"train_loss": -6.340407371520996, "global_step": 97338, "epoch": 2317} {"train_loss": -6.265655517578125, "global_step": 97339, "epoch": 2317} {"train_loss": -6.254029273986816, "global_step": 97340, "epoch": 2317} {"train_loss": -6.390084266662598, "global_step": 97341, "epoch": 2317} {"train_loss": -6.230881690979004, "global_step": 97342, "epoch": 2317} {"train_loss": -6.138789176940918, "global_step": 97343, "epoch": 2317} {"train_loss": -6.419025421142578, "global_step": 97344, "epoch": 2317} {"train_loss": -6.255270004272461, "global_step": 97345, "epoch": 2317} {"train_loss": -6.334286212921143, "global_step": 97346, "epoch": 2317} {"train_loss": -6.376694679260254, "global_step": 97347, "epoch": 2317} {"train_loss": -6.416588306427002, "global_step": 97348, "epoch": 2317} {"train_loss": -6.337794303894043, "global_step": 97349, "epoch": 2317} {"train_loss": -6.368351936340332, "global_step": 97350, "epoch": 2317} {"train_loss": -6.364099502563477, "global_step": 97351, "epoch": 2317} {"train_loss": -6.313111305236816, "global_step": 97352, "epoch": 2317} {"train_loss": -6.2778425216674805, "global_step": 97353, "epoch": 2317} {"train_loss": -6.343720436096191, "global_step": 97354, "epoch": 2317} {"train_loss": -6.344491947264898, "global_step": 97355, "epoch": 2317, "val_loss": 75654.03125} {"train_loss": -6.319714546203613, "global_step": 97356, "epoch": 2318} {"train_loss": -6.357456207275391, "global_step": 97357, "epoch": 2318} {"train_loss": -6.36475944519043, "global_step": 97358, "epoch": 2318} {"train_loss": -6.280534744262695, "global_step": 97359, "epoch": 2318} {"train_loss": -6.376308917999268, "global_step": 97360, "epoch": 2318} {"train_loss": -6.3893537521362305, "global_step": 97361, "epoch": 2318} {"train_loss": -6.35294246673584, "global_step": 97362, "epoch": 2318} {"train_loss": -6.305140495300293, "global_step": 97363, "epoch": 2318} {"train_loss": -6.301023483276367, "global_step": 97364, "epoch": 2318} {"train_loss": -6.308612823486328, "global_step": 97365, "epoch": 2318} {"train_loss": -6.286397933959961, "global_step": 97366, "epoch": 2318} {"train_loss": -6.444690704345703, "global_step": 97367, "epoch": 2318} {"train_loss": -6.302330017089844, "global_step": 97368, "epoch": 2318} {"train_loss": -6.296953201293945, "global_step": 97369, "epoch": 2318} {"train_loss": -6.2918548583984375, "global_step": 97370, "epoch": 2318} {"train_loss": -6.301680088043213, "global_step": 97371, "epoch": 2318} {"train_loss": -6.328567981719971, "global_step": 97372, "epoch": 2318} {"train_loss": -6.066434860229492, "global_step": 97373, "epoch": 2318} {"train_loss": -6.332900524139404, "global_step": 97374, "epoch": 2318} {"train_loss": -6.185798645019531, "global_step": 97375, "epoch": 2318} {"train_loss": -6.260817527770996, "global_step": 97376, "epoch": 2318} {"train_loss": -6.261261940002441, "global_step": 97377, "epoch": 2318} {"train_loss": -6.231479167938232, "global_step": 97378, "epoch": 2318} {"train_loss": -6.271396636962891, "global_step": 97379, "epoch": 2318} {"train_loss": -6.252202987670898, "global_step": 97380, "epoch": 2318} {"train_loss": -6.2931904792785645, "global_step": 97381, "epoch": 2318} {"train_loss": -6.214980125427246, "global_step": 97382, "epoch": 2318} {"train_loss": -6.264165878295898, "global_step": 97383, "epoch": 2318} {"train_loss": -6.460683822631836, "global_step": 97384, "epoch": 2318} {"train_loss": -6.170666694641113, "global_step": 97385, "epoch": 2318} {"train_loss": -6.357771396636963, "global_step": 97386, "epoch": 2318} {"train_loss": -6.299820423126221, "global_step": 97387, "epoch": 2318} {"train_loss": -6.303699493408203, "global_step": 97388, "epoch": 2318} {"train_loss": -6.3782501220703125, "global_step": 97389, "epoch": 2318} {"train_loss": -6.22782039642334, "global_step": 97390, "epoch": 2318} {"train_loss": -6.413665771484375, "global_step": 97391, "epoch": 2318} {"train_loss": -6.281394958496094, "global_step": 97392, "epoch": 2318} {"train_loss": -6.3159942626953125, "global_step": 97393, "epoch": 2318} {"train_loss": -6.325691223144531, "global_step": 97394, "epoch": 2318} {"train_loss": -6.273983478546143, "global_step": 97395, "epoch": 2318} {"train_loss": -6.378912925720215, "global_step": 97396, "epoch": 2318} {"train_loss": -6.304230088279361, "global_step": 97397, "epoch": 2318, "val_loss": 75868.46875} {"train_loss": -6.334913730621338, "global_step": 97398, "epoch": 2319} {"train_loss": -6.351556777954102, "global_step": 97399, "epoch": 2319} {"train_loss": -6.3746418952941895, "global_step": 97400, "epoch": 2319} {"train_loss": -6.33570671081543, "global_step": 97401, "epoch": 2319} {"train_loss": -6.292704105377197, "global_step": 97402, "epoch": 2319} {"train_loss": -6.476884841918945, "global_step": 97403, "epoch": 2319} {"train_loss": -6.289669990539551, "global_step": 97404, "epoch": 2319} {"train_loss": -6.356359481811523, "global_step": 97405, "epoch": 2319} {"train_loss": -6.260904312133789, "global_step": 97406, "epoch": 2319} {"train_loss": -6.288710117340088, "global_step": 97407, "epoch": 2319} {"train_loss": -6.300032615661621, "global_step": 97408, "epoch": 2319} {"train_loss": -6.383012771606445, "global_step": 97409, "epoch": 2319} {"train_loss": -6.245692253112793, "global_step": 97410, "epoch": 2319} {"train_loss": -6.422255992889404, "global_step": 97411, "epoch": 2319} {"train_loss": -6.266884803771973, "global_step": 97412, "epoch": 2319} {"train_loss": -6.3408308029174805, "global_step": 97413, "epoch": 2319} {"train_loss": -6.3012800216674805, "global_step": 97414, "epoch": 2319} {"train_loss": -6.227254867553711, "global_step": 97415, "epoch": 2319} {"train_loss": -6.314579010009766, "global_step": 97416, "epoch": 2319} {"train_loss": -6.330360412597656, "global_step": 97417, "epoch": 2319} {"train_loss": -6.236791133880615, "global_step": 97418, "epoch": 2319} {"train_loss": -6.466310501098633, "global_step": 97419, "epoch": 2319} {"train_loss": -6.338912010192871, "global_step": 97420, "epoch": 2319} {"train_loss": -6.314180850982666, "global_step": 97421, "epoch": 2319} {"train_loss": -6.351824760437012, "global_step": 97422, "epoch": 2319} {"train_loss": -6.280637264251709, "global_step": 97423, "epoch": 2319} {"train_loss": -6.307574272155762, "global_step": 97424, "epoch": 2319} {"train_loss": -6.337070465087891, "global_step": 97425, "epoch": 2319} {"train_loss": -6.414868354797363, "global_step": 97426, "epoch": 2319} {"train_loss": -6.223287105560303, "global_step": 97427, "epoch": 2319} {"train_loss": -6.3466010093688965, "global_step": 97428, "epoch": 2319} {"train_loss": -6.302765846252441, "global_step": 97429, "epoch": 2319} {"train_loss": -6.341119766235352, "global_step": 97430, "epoch": 2319} {"train_loss": -6.448218822479248, "global_step": 97431, "epoch": 2319} {"train_loss": -6.330955982208252, "global_step": 97432, "epoch": 2319} {"train_loss": -6.357198238372803, "global_step": 97433, "epoch": 2319} {"train_loss": -6.359760284423828, "global_step": 97434, "epoch": 2319} {"train_loss": -6.358433723449707, "global_step": 97435, "epoch": 2319} {"train_loss": -6.192833423614502, "global_step": 97436, "epoch": 2319} {"train_loss": -6.280669212341309, "global_step": 97437, "epoch": 2319} {"train_loss": -6.421748161315918, "global_step": 97438, "epoch": 2319} {"train_loss": -6.328989573887417, "global_step": 97439, "epoch": 2319, "val_loss": 75680.7890625} {"train_loss": -6.305126190185547, "global_step": 97440, "epoch": 2320} {"train_loss": -6.356550216674805, "global_step": 97441, "epoch": 2320} {"train_loss": -6.293527126312256, "global_step": 97442, "epoch": 2320} {"train_loss": -6.252309322357178, "global_step": 97443, "epoch": 2320} {"train_loss": -6.322356224060059, "global_step": 97444, "epoch": 2320} {"train_loss": -6.176628589630127, "global_step": 97445, "epoch": 2320} {"train_loss": -6.497757911682129, "global_step": 97446, "epoch": 2320} {"train_loss": -6.389513969421387, "global_step": 97447, "epoch": 2320} {"train_loss": -6.319120407104492, "global_step": 97448, "epoch": 2320} {"train_loss": -6.324831008911133, "global_step": 97449, "epoch": 2320} {"train_loss": -6.451498508453369, "global_step": 97450, "epoch": 2320} {"train_loss": -6.454974174499512, "global_step": 97451, "epoch": 2320} {"train_loss": -6.320407390594482, "global_step": 97452, "epoch": 2320} {"train_loss": -6.281651496887207, "global_step": 97453, "epoch": 2320} {"train_loss": -6.3238420486450195, "global_step": 97454, "epoch": 2320} {"train_loss": -6.309536933898926, "global_step": 97455, "epoch": 2320} {"train_loss": -6.270155429840088, "global_step": 97456, "epoch": 2320} {"train_loss": -6.267022132873535, "global_step": 97457, "epoch": 2320} {"train_loss": -6.2100019454956055, "global_step": 97458, "epoch": 2320} {"train_loss": -6.296848773956299, "global_step": 97459, "epoch": 2320} {"train_loss": -6.303366661071777, "global_step": 97460, "epoch": 2320} {"train_loss": -6.271629333496094, "global_step": 97461, "epoch": 2320} {"train_loss": -6.3916425704956055, "global_step": 97462, "epoch": 2320} {"train_loss": -6.409852981567383, "global_step": 97463, "epoch": 2320} {"train_loss": -6.313117027282715, "global_step": 97464, "epoch": 2320} {"train_loss": -6.42533016204834, "global_step": 97465, "epoch": 2320} {"train_loss": -6.392382621765137, "global_step": 97466, "epoch": 2320} {"train_loss": -6.38082218170166, "global_step": 97467, "epoch": 2320} {"train_loss": -6.310229778289795, "global_step": 97468, "epoch": 2320} {"train_loss": -6.370376110076904, "global_step": 97469, "epoch": 2320} {"train_loss": -6.332641124725342, "global_step": 97470, "epoch": 2320} {"train_loss": -6.283001899719238, "global_step": 97471, "epoch": 2320} {"train_loss": -6.32564640045166, "global_step": 97472, "epoch": 2320} {"train_loss": -6.316391944885254, "global_step": 97473, "epoch": 2320} {"train_loss": -6.225114822387695, "global_step": 97474, "epoch": 2320} {"train_loss": -6.324224948883057, "global_step": 97475, "epoch": 2320} {"train_loss": -6.286859035491943, "global_step": 97476, "epoch": 2320} {"train_loss": -6.295206546783447, "global_step": 97477, "epoch": 2320} {"train_loss": -6.233007431030273, "global_step": 97478, "epoch": 2320} {"train_loss": -6.346412658691406, "global_step": 97479, "epoch": 2320} {"train_loss": -6.238836288452148, "global_step": 97480, "epoch": 2320} {"train_loss": -6.322041534242176, "global_step": 97481, "epoch": 2320, "val_loss": 75608.6953125} {"train_loss": -6.263983249664307, "global_step": 97482, "epoch": 2321} {"train_loss": -6.254485607147217, "global_step": 97483, "epoch": 2321} {"train_loss": -6.304433822631836, "global_step": 97484, "epoch": 2321} {"train_loss": -6.265052795410156, "global_step": 97485, "epoch": 2321} {"train_loss": -6.234851837158203, "global_step": 97486, "epoch": 2321} {"train_loss": -6.356241226196289, "global_step": 97487, "epoch": 2321} {"train_loss": -6.299314022064209, "global_step": 97488, "epoch": 2321} {"train_loss": -6.250922203063965, "global_step": 97489, "epoch": 2321} {"train_loss": -6.474170684814453, "global_step": 97490, "epoch": 2321} {"train_loss": -6.184964656829834, "global_step": 97491, "epoch": 2321} {"train_loss": -6.270599842071533, "global_step": 97492, "epoch": 2321} {"train_loss": -6.329102039337158, "global_step": 97493, "epoch": 2321} {"train_loss": -6.218606472015381, "global_step": 97494, "epoch": 2321} {"train_loss": -6.3265252113342285, "global_step": 97495, "epoch": 2321} {"train_loss": -6.423548698425293, "global_step": 97496, "epoch": 2321} {"train_loss": -6.273104667663574, "global_step": 97497, "epoch": 2321} {"train_loss": -6.285031318664551, "global_step": 97498, "epoch": 2321} {"train_loss": -6.280578136444092, "global_step": 97499, "epoch": 2321} {"train_loss": -6.30793571472168, "global_step": 97500, "epoch": 2321} {"train_loss": -6.3008198738098145, "global_step": 97501, "epoch": 2321} {"train_loss": -6.24062442779541, "global_step": 97502, "epoch": 2321} {"train_loss": -6.307375431060791, "global_step": 97503, "epoch": 2321} {"train_loss": -6.413731098175049, "global_step": 97504, "epoch": 2321} {"train_loss": -6.278712749481201, "global_step": 97505, "epoch": 2321} {"train_loss": -6.397852897644043, "global_step": 97506, "epoch": 2321} {"train_loss": -6.202925205230713, "global_step": 97507, "epoch": 2321} {"train_loss": -6.308585166931152, "global_step": 97508, "epoch": 2321} {"train_loss": -6.29257869720459, "global_step": 97509, "epoch": 2321} {"train_loss": -6.241964817047119, "global_step": 97510, "epoch": 2321} {"train_loss": -6.303089141845703, "global_step": 97511, "epoch": 2321} {"train_loss": -6.322370529174805, "global_step": 97512, "epoch": 2321} {"train_loss": -6.344450950622559, "global_step": 97513, "epoch": 2321} {"train_loss": -6.298551559448242, "global_step": 97514, "epoch": 2321} {"train_loss": -6.312702655792236, "global_step": 97515, "epoch": 2321} {"train_loss": -6.325984001159668, "global_step": 97516, "epoch": 2321} {"train_loss": -6.226647853851318, "global_step": 97517, "epoch": 2321} {"train_loss": -6.361389636993408, "global_step": 97518, "epoch": 2321} {"train_loss": -6.291299343109131, "global_step": 97519, "epoch": 2321} {"train_loss": -6.1618852615356445, "global_step": 97520, "epoch": 2321} {"train_loss": -6.2070512771606445, "global_step": 97521, "epoch": 2321} {"train_loss": -6.275463104248047, "global_step": 97522, "epoch": 2321} {"train_loss": -6.289319855826242, "global_step": 97523, "epoch": 2321, "val_loss": 75899.515625} {"train_loss": -6.416646480560303, "global_step": 97524, "epoch": 2322} {"train_loss": -6.3217692375183105, "global_step": 97525, "epoch": 2322} {"train_loss": -6.2657623291015625, "global_step": 97526, "epoch": 2322} {"train_loss": -6.278112411499023, "global_step": 97527, "epoch": 2322} {"train_loss": -6.281402587890625, "global_step": 97528, "epoch": 2322} {"train_loss": -6.240633487701416, "global_step": 97529, "epoch": 2322} {"train_loss": -6.048977851867676, "global_step": 97530, "epoch": 2322} {"train_loss": -6.2569379806518555, "global_step": 97531, "epoch": 2322} {"train_loss": -6.103705883026123, "global_step": 97532, "epoch": 2322} {"train_loss": -6.370308876037598, "global_step": 97533, "epoch": 2322} {"train_loss": -6.139880180358887, "global_step": 97534, "epoch": 2322} {"train_loss": -6.284579277038574, "global_step": 97535, "epoch": 2322} {"train_loss": -6.138909339904785, "global_step": 97536, "epoch": 2322} {"train_loss": -6.229341506958008, "global_step": 97537, "epoch": 2322} {"train_loss": -6.237096309661865, "global_step": 97538, "epoch": 2322} {"train_loss": -6.156937599182129, "global_step": 97539, "epoch": 2322} {"train_loss": -6.296394348144531, "global_step": 97540, "epoch": 2322} {"train_loss": -6.2423014640808105, "global_step": 97541, "epoch": 2322} {"train_loss": -6.295448303222656, "global_step": 97542, "epoch": 2322} {"train_loss": -6.1535773277282715, "global_step": 97543, "epoch": 2322} {"train_loss": -6.247230529785156, "global_step": 97544, "epoch": 2322} {"train_loss": -6.411712646484375, "global_step": 97545, "epoch": 2322} {"train_loss": -6.256167411804199, "global_step": 97546, "epoch": 2322} {"train_loss": -6.321633338928223, "global_step": 97547, "epoch": 2322} {"train_loss": -6.194066047668457, "global_step": 97548, "epoch": 2322} {"train_loss": -6.3061017990112305, "global_step": 97549, "epoch": 2322} {"train_loss": -6.283829689025879, "global_step": 97550, "epoch": 2322} {"train_loss": -6.352292060852051, "global_step": 97551, "epoch": 2322} {"train_loss": -6.268307209014893, "global_step": 97552, "epoch": 2322} {"train_loss": -6.428695201873779, "global_step": 97553, "epoch": 2322} {"train_loss": -6.265105247497559, "global_step": 97554, "epoch": 2322} {"train_loss": -6.300154685974121, "global_step": 97555, "epoch": 2322} {"train_loss": -6.235482215881348, "global_step": 97556, "epoch": 2322} {"train_loss": -6.363356590270996, "global_step": 97557, "epoch": 2322} {"train_loss": -6.3043107986450195, "global_step": 97558, "epoch": 2322} {"train_loss": -6.254463195800781, "global_step": 97559, "epoch": 2322} {"train_loss": -6.3437910079956055, "global_step": 97560, "epoch": 2322} {"train_loss": -6.455133438110352, "global_step": 97561, "epoch": 2322} {"train_loss": -6.234012126922607, "global_step": 97562, "epoch": 2322} {"train_loss": -6.266275882720947, "global_step": 97563, "epoch": 2322} {"train_loss": -6.24649715423584, "global_step": 97564, "epoch": 2322} {"train_loss": -6.274124111448016, "global_step": 97565, "epoch": 2322, "val_loss": 75827.890625} {"train_loss": -6.221845626831055, "global_step": 97566, "epoch": 2323} {"train_loss": -6.423480987548828, "global_step": 97567, "epoch": 2323} {"train_loss": -6.346928596496582, "global_step": 97568, "epoch": 2323} {"train_loss": -6.345846176147461, "global_step": 97569, "epoch": 2323} {"train_loss": -6.382509231567383, "global_step": 97570, "epoch": 2323} {"train_loss": -6.256959915161133, "global_step": 97571, "epoch": 2323} {"train_loss": -6.260919094085693, "global_step": 97572, "epoch": 2323} {"train_loss": -6.4228105545043945, "global_step": 97573, "epoch": 2323} {"train_loss": -6.379975318908691, "global_step": 97574, "epoch": 2323} {"train_loss": -6.234496116638184, "global_step": 97575, "epoch": 2323} {"train_loss": -6.373134613037109, "global_step": 97576, "epoch": 2323} {"train_loss": -6.3319220542907715, "global_step": 97577, "epoch": 2323} {"train_loss": -6.321709632873535, "global_step": 97578, "epoch": 2323} {"train_loss": -6.283756256103516, "global_step": 97579, "epoch": 2323} {"train_loss": -6.324348449707031, "global_step": 97580, "epoch": 2323} {"train_loss": -6.278043746948242, "global_step": 97581, "epoch": 2323} {"train_loss": -6.363408088684082, "global_step": 97582, "epoch": 2323} {"train_loss": -6.30586576461792, "global_step": 97583, "epoch": 2323} {"train_loss": -6.2351579666137695, "global_step": 97584, "epoch": 2323} {"train_loss": -6.217252731323242, "global_step": 97585, "epoch": 2323} {"train_loss": -6.312037467956543, "global_step": 97586, "epoch": 2323} {"train_loss": -6.218692302703857, "global_step": 97587, "epoch": 2323} {"train_loss": -6.153019428253174, "global_step": 97588, "epoch": 2323} {"train_loss": -6.293283462524414, "global_step": 97589, "epoch": 2323} {"train_loss": -6.407593727111816, "global_step": 97590, "epoch": 2323} {"train_loss": -6.41396427154541, "global_step": 97591, "epoch": 2323} {"train_loss": -6.329653739929199, "global_step": 97592, "epoch": 2323} {"train_loss": -6.361825466156006, "global_step": 97593, "epoch": 2323} {"train_loss": -6.289103984832764, "global_step": 97594, "epoch": 2323} {"train_loss": -6.265939712524414, "global_step": 97595, "epoch": 2323} {"train_loss": -6.285527229309082, "global_step": 97596, "epoch": 2323} {"train_loss": -6.31614351272583, "global_step": 97597, "epoch": 2323} {"train_loss": -6.291358947753906, "global_step": 97598, "epoch": 2323} {"train_loss": -6.361729621887207, "global_step": 97599, "epoch": 2323} {"train_loss": -6.361845970153809, "global_step": 97600, "epoch": 2323} {"train_loss": -6.275363922119141, "global_step": 97601, "epoch": 2323} {"train_loss": -6.317850589752197, "global_step": 97602, "epoch": 2323} {"train_loss": -6.341771602630615, "global_step": 97603, "epoch": 2323} {"train_loss": -6.403135299682617, "global_step": 97604, "epoch": 2323} {"train_loss": -6.436731815338135, "global_step": 97605, "epoch": 2323} {"train_loss": -6.430801868438721, "global_step": 97606, "epoch": 2323} {"train_loss": -6.3204314935775034, "global_step": 97607, "epoch": 2323, "val_loss": 75805.21875} {"train_loss": -6.268832683563232, "global_step": 97608, "epoch": 2324} {"train_loss": -6.33293342590332, "global_step": 97609, "epoch": 2324} {"train_loss": -6.264927387237549, "global_step": 97610, "epoch": 2324} {"train_loss": -6.291323661804199, "global_step": 97611, "epoch": 2324} {"train_loss": -6.35045051574707, "global_step": 97612, "epoch": 2324} {"train_loss": -6.282125473022461, "global_step": 97613, "epoch": 2324} {"train_loss": -6.4091644287109375, "global_step": 97614, "epoch": 2324} {"train_loss": -6.459034442901611, "global_step": 97615, "epoch": 2324} {"train_loss": -6.288219451904297, "global_step": 97616, "epoch": 2324} {"train_loss": -6.267261505126953, "global_step": 97617, "epoch": 2324} {"train_loss": -6.196048259735107, "global_step": 97618, "epoch": 2324} {"train_loss": -6.347511291503906, "global_step": 97619, "epoch": 2324} {"train_loss": -6.406562805175781, "global_step": 97620, "epoch": 2324} {"train_loss": -6.329308986663818, "global_step": 97621, "epoch": 2324} {"train_loss": -6.334139823913574, "global_step": 97622, "epoch": 2324} {"train_loss": -6.242247104644775, "global_step": 97623, "epoch": 2324} {"train_loss": -6.38461971282959, "global_step": 97624, "epoch": 2324} {"train_loss": -6.398257255554199, "global_step": 97625, "epoch": 2324} {"train_loss": -6.259145736694336, "global_step": 97626, "epoch": 2324} {"train_loss": -6.39797306060791, "global_step": 97627, "epoch": 2324} {"train_loss": -6.342343330383301, "global_step": 97628, "epoch": 2324} {"train_loss": -6.302602767944336, "global_step": 97629, "epoch": 2324} {"train_loss": -6.382676124572754, "global_step": 97630, "epoch": 2324} {"train_loss": -6.39420223236084, "global_step": 97631, "epoch": 2324} {"train_loss": -6.353032112121582, "global_step": 97632, "epoch": 2324} {"train_loss": -6.279312610626221, "global_step": 97633, "epoch": 2324} {"train_loss": -6.265570640563965, "global_step": 97634, "epoch": 2324} {"train_loss": -6.375613212585449, "global_step": 97635, "epoch": 2324} {"train_loss": -6.360461235046387, "global_step": 97636, "epoch": 2324} {"train_loss": -6.392971992492676, "global_step": 97637, "epoch": 2324} {"train_loss": -6.397658348083496, "global_step": 97638, "epoch": 2324} {"train_loss": -6.246274948120117, "global_step": 97639, "epoch": 2324} {"train_loss": -6.348310947418213, "global_step": 97640, "epoch": 2324} {"train_loss": -6.21644926071167, "global_step": 97641, "epoch": 2324} {"train_loss": -6.38783073425293, "global_step": 97642, "epoch": 2324} {"train_loss": -6.241559982299805, "global_step": 97643, "epoch": 2324} {"train_loss": -6.3539886474609375, "global_step": 97644, "epoch": 2324} {"train_loss": -6.330158233642578, "global_step": 97645, "epoch": 2324} {"train_loss": -6.376341342926025, "global_step": 97646, "epoch": 2324} {"train_loss": -6.358437538146973, "global_step": 97647, "epoch": 2324} {"train_loss": -6.277707576751709, "global_step": 97648, "epoch": 2324} {"train_loss": -6.330799863452003, "global_step": 97649, "epoch": 2324, "val_loss": 75788.28125} {"train_loss": -6.442811012268066, "global_step": 97650, "epoch": 2325} {"train_loss": -6.263969421386719, "global_step": 97651, "epoch": 2325} {"train_loss": -6.293116569519043, "global_step": 97652, "epoch": 2325} {"train_loss": -6.323764801025391, "global_step": 97653, "epoch": 2325} {"train_loss": -6.245809555053711, "global_step": 97654, "epoch": 2325} {"train_loss": -6.264704704284668, "global_step": 97655, "epoch": 2325} {"train_loss": -6.264499664306641, "global_step": 97656, "epoch": 2325} {"train_loss": -6.316289901733398, "global_step": 97657, "epoch": 2325} {"train_loss": -6.311885833740234, "global_step": 97658, "epoch": 2325} {"train_loss": -6.431508541107178, "global_step": 97659, "epoch": 2325} {"train_loss": -6.258822441101074, "global_step": 97660, "epoch": 2325} {"train_loss": -6.303586006164551, "global_step": 97661, "epoch": 2325} {"train_loss": -6.293649673461914, "global_step": 97662, "epoch": 2325} {"train_loss": -6.328985214233398, "global_step": 97663, "epoch": 2325} {"train_loss": -6.386356353759766, "global_step": 97664, "epoch": 2325} {"train_loss": -6.38480806350708, "global_step": 97665, "epoch": 2325} {"train_loss": -6.254825592041016, "global_step": 97666, "epoch": 2325} {"train_loss": -6.4056172370910645, "global_step": 97667, "epoch": 2325} {"train_loss": -6.268167495727539, "global_step": 97668, "epoch": 2325} {"train_loss": -6.2855353355407715, "global_step": 97669, "epoch": 2325} {"train_loss": -6.18705940246582, "global_step": 97670, "epoch": 2325} {"train_loss": -6.292806625366211, "global_step": 97671, "epoch": 2325} {"train_loss": -6.424826622009277, "global_step": 97672, "epoch": 2325} {"train_loss": -6.335698127746582, "global_step": 97673, "epoch": 2325} {"train_loss": -6.426052570343018, "global_step": 97674, "epoch": 2325} {"train_loss": -6.319030284881592, "global_step": 97675, "epoch": 2325} {"train_loss": -6.390237331390381, "global_step": 97676, "epoch": 2325} {"train_loss": -6.291900634765625, "global_step": 97677, "epoch": 2325} {"train_loss": -6.3362226486206055, "global_step": 97678, "epoch": 2325} {"train_loss": -6.40625, "global_step": 97679, "epoch": 2325} {"train_loss": -6.236957550048828, "global_step": 97680, "epoch": 2325} {"train_loss": -6.300943851470947, "global_step": 97681, "epoch": 2325} {"train_loss": -6.412073135375977, "global_step": 97682, "epoch": 2325} {"train_loss": -6.283373832702637, "global_step": 97683, "epoch": 2325} {"train_loss": -6.203089714050293, "global_step": 97684, "epoch": 2325} {"train_loss": -6.262537956237793, "global_step": 97685, "epoch": 2325} {"train_loss": -6.3275909423828125, "global_step": 97686, "epoch": 2325} {"train_loss": -6.275643825531006, "global_step": 97687, "epoch": 2325} {"train_loss": -6.392134666442871, "global_step": 97688, "epoch": 2325} {"train_loss": -6.4056396484375, "global_step": 97689, "epoch": 2325} {"train_loss": -6.333287715911865, "global_step": 97690, "epoch": 2325} {"train_loss": -6.320730742954073, "global_step": 97691, "epoch": 2325, "val_loss": 75471.4765625} {"train_loss": -6.3146443367004395, "global_step": 97692, "epoch": 2326} {"train_loss": -6.256829261779785, "global_step": 97693, "epoch": 2326} {"train_loss": -6.415463447570801, "global_step": 97694, "epoch": 2326} {"train_loss": -6.28420352935791, "global_step": 97695, "epoch": 2326} {"train_loss": -6.428094863891602, "global_step": 97696, "epoch": 2326} {"train_loss": -6.344338893890381, "global_step": 97697, "epoch": 2326} {"train_loss": -6.3000168800354, "global_step": 97698, "epoch": 2326} {"train_loss": -6.371925354003906, "global_step": 97699, "epoch": 2326} {"train_loss": -6.44156551361084, "global_step": 97700, "epoch": 2326} {"train_loss": -6.379044532775879, "global_step": 97701, "epoch": 2326} {"train_loss": -6.228791236877441, "global_step": 97702, "epoch": 2326} {"train_loss": -6.326082706451416, "global_step": 97703, "epoch": 2326} {"train_loss": -6.232202529907227, "global_step": 97704, "epoch": 2326} {"train_loss": -6.417502403259277, "global_step": 97705, "epoch": 2326} {"train_loss": -6.457455635070801, "global_step": 97706, "epoch": 2326} {"train_loss": -6.394339561462402, "global_step": 97707, "epoch": 2326} {"train_loss": -6.457038879394531, "global_step": 97708, "epoch": 2326} {"train_loss": -6.2632598876953125, "global_step": 97709, "epoch": 2326} {"train_loss": -6.364802837371826, "global_step": 97710, "epoch": 2326} {"train_loss": -6.366148948669434, "global_step": 97711, "epoch": 2326} {"train_loss": -6.374007225036621, "global_step": 97712, "epoch": 2326} {"train_loss": -6.421125411987305, "global_step": 97713, "epoch": 2326} {"train_loss": -6.448301315307617, "global_step": 97714, "epoch": 2326} {"train_loss": -6.248668670654297, "global_step": 97715, "epoch": 2326} {"train_loss": -6.3907151222229, "global_step": 97716, "epoch": 2326} {"train_loss": -6.271454811096191, "global_step": 97717, "epoch": 2326} {"train_loss": -6.245088577270508, "global_step": 97718, "epoch": 2326} {"train_loss": -6.221840858459473, "global_step": 97719, "epoch": 2326} {"train_loss": -6.391241073608398, "global_step": 97720, "epoch": 2326} {"train_loss": -6.319007873535156, "global_step": 97721, "epoch": 2326} {"train_loss": -6.397357940673828, "global_step": 97722, "epoch": 2326} {"train_loss": -6.358616352081299, "global_step": 97723, "epoch": 2326} {"train_loss": -6.352155685424805, "global_step": 97724, "epoch": 2326} {"train_loss": -6.344974517822266, "global_step": 97725, "epoch": 2326} {"train_loss": -6.208538055419922, "global_step": 97726, "epoch": 2326} {"train_loss": -6.438412189483643, "global_step": 97727, "epoch": 2326} {"train_loss": -6.391408920288086, "global_step": 97728, "epoch": 2326} {"train_loss": -6.378287315368652, "global_step": 97729, "epoch": 2326} {"train_loss": -6.301542282104492, "global_step": 97730, "epoch": 2326} {"train_loss": -6.233726978302002, "global_step": 97731, "epoch": 2326} {"train_loss": -6.4638519287109375, "global_step": 97732, "epoch": 2326} {"train_loss": -6.345864931742351, "global_step": 97733, "epoch": 2326, "val_loss": 76073.4375} {"train_loss": -6.278173446655273, "global_step": 97734, "epoch": 2327} {"train_loss": -6.3891921043396, "global_step": 97735, "epoch": 2327} {"train_loss": -6.33513879776001, "global_step": 97736, "epoch": 2327} {"train_loss": -6.293553352355957, "global_step": 97737, "epoch": 2327} {"train_loss": -6.335783958435059, "global_step": 97738, "epoch": 2327} {"train_loss": -6.198768615722656, "global_step": 97739, "epoch": 2327} {"train_loss": -6.291476726531982, "global_step": 97740, "epoch": 2327} {"train_loss": -6.283147811889648, "global_step": 97741, "epoch": 2327} {"train_loss": -6.255703926086426, "global_step": 97742, "epoch": 2327} {"train_loss": -6.322366714477539, "global_step": 97743, "epoch": 2327} {"train_loss": -6.296048164367676, "global_step": 97744, "epoch": 2327} {"train_loss": -6.254515647888184, "global_step": 97745, "epoch": 2327} {"train_loss": -6.254685401916504, "global_step": 97746, "epoch": 2327} {"train_loss": -6.277595520019531, "global_step": 97747, "epoch": 2327} {"train_loss": -6.141024589538574, "global_step": 97748, "epoch": 2327} {"train_loss": -6.333477020263672, "global_step": 97749, "epoch": 2327} {"train_loss": -6.367705821990967, "global_step": 97750, "epoch": 2327} {"train_loss": -6.290459632873535, "global_step": 97751, "epoch": 2327} {"train_loss": -6.2626848220825195, "global_step": 97752, "epoch": 2327} {"train_loss": -6.377776145935059, "global_step": 97753, "epoch": 2327} {"train_loss": -6.215388774871826, "global_step": 97754, "epoch": 2327} {"train_loss": -6.3222503662109375, "global_step": 97755, "epoch": 2327} {"train_loss": -6.385498046875, "global_step": 97756, "epoch": 2327} {"train_loss": -6.290704727172852, "global_step": 97757, "epoch": 2327} {"train_loss": -6.283293724060059, "global_step": 97758, "epoch": 2327} {"train_loss": -6.3243818283081055, "global_step": 97759, "epoch": 2327} {"train_loss": -6.399308681488037, "global_step": 97760, "epoch": 2327} {"train_loss": -6.344374656677246, "global_step": 97761, "epoch": 2327} {"train_loss": -6.396450996398926, "global_step": 97762, "epoch": 2327} {"train_loss": -6.272019386291504, "global_step": 97763, "epoch": 2327} {"train_loss": -6.350704193115234, "global_step": 97764, "epoch": 2327} {"train_loss": -6.388386249542236, "global_step": 97765, "epoch": 2327} {"train_loss": -6.2225260734558105, "global_step": 97766, "epoch": 2327} {"train_loss": -6.347378730773926, "global_step": 97767, "epoch": 2327} {"train_loss": -6.44181489944458, "global_step": 97768, "epoch": 2327} {"train_loss": -6.380331039428711, "global_step": 97769, "epoch": 2327} {"train_loss": -6.244668006896973, "global_step": 97770, "epoch": 2327} {"train_loss": -6.295479774475098, "global_step": 97771, "epoch": 2327} {"train_loss": -6.326353073120117, "global_step": 97772, "epoch": 2327} {"train_loss": -6.282908916473389, "global_step": 97773, "epoch": 2327} {"train_loss": -6.345088005065918, "global_step": 97774, "epoch": 2327} {"train_loss": -6.309289977664039, "global_step": 97775, "epoch": 2327, "val_loss": 75756.734375} {"train_loss": -6.253664016723633, "global_step": 97776, "epoch": 2328} {"train_loss": -6.3556013107299805, "global_step": 97777, "epoch": 2328} {"train_loss": -6.343851089477539, "global_step": 97778, "epoch": 2328} {"train_loss": -6.312203407287598, "global_step": 97779, "epoch": 2328} {"train_loss": -6.377985954284668, "global_step": 97780, "epoch": 2328} {"train_loss": -6.379040241241455, "global_step": 97781, "epoch": 2328} {"train_loss": -6.277306079864502, "global_step": 97782, "epoch": 2328} {"train_loss": -6.333930015563965, "global_step": 97783, "epoch": 2328} {"train_loss": -6.241026878356934, "global_step": 97784, "epoch": 2328} {"train_loss": -6.406409740447998, "global_step": 97785, "epoch": 2328} {"train_loss": -6.314609527587891, "global_step": 97786, "epoch": 2328} {"train_loss": -6.310869216918945, "global_step": 97787, "epoch": 2328} {"train_loss": -6.244819641113281, "global_step": 97788, "epoch": 2328} {"train_loss": -6.33739709854126, "global_step": 97789, "epoch": 2328} {"train_loss": -6.260959625244141, "global_step": 97790, "epoch": 2328} {"train_loss": -6.242094993591309, "global_step": 97791, "epoch": 2328} {"train_loss": -6.453060626983643, "global_step": 97792, "epoch": 2328} {"train_loss": -6.302831649780273, "global_step": 97793, "epoch": 2328} {"train_loss": -6.265552520751953, "global_step": 97794, "epoch": 2328} {"train_loss": -6.362804412841797, "global_step": 97795, "epoch": 2328} {"train_loss": -6.324046611785889, "global_step": 97796, "epoch": 2328} {"train_loss": -6.307217597961426, "global_step": 97797, "epoch": 2328} {"train_loss": -6.316740036010742, "global_step": 97798, "epoch": 2328} {"train_loss": -6.227632999420166, "global_step": 97799, "epoch": 2328} {"train_loss": -6.258090972900391, "global_step": 97800, "epoch": 2328} {"train_loss": -6.347269058227539, "global_step": 97801, "epoch": 2328} {"train_loss": -6.3022308349609375, "global_step": 97802, "epoch": 2328} {"train_loss": -6.34521484375, "global_step": 97803, "epoch": 2328} {"train_loss": -6.250739097595215, "global_step": 97804, "epoch": 2328} {"train_loss": -6.300805568695068, "global_step": 97805, "epoch": 2328} {"train_loss": -6.317117691040039, "global_step": 97806, "epoch": 2328} {"train_loss": -6.355449676513672, "global_step": 97807, "epoch": 2328} {"train_loss": -6.232306957244873, "global_step": 97808, "epoch": 2328} {"train_loss": -6.28031063079834, "global_step": 97809, "epoch": 2328} {"train_loss": -6.31966495513916, "global_step": 97810, "epoch": 2328} {"train_loss": -6.330742835998535, "global_step": 97811, "epoch": 2328} {"train_loss": -6.44034481048584, "global_step": 97812, "epoch": 2328} {"train_loss": -6.307414531707764, "global_step": 97813, "epoch": 2328} {"train_loss": -6.31757926940918, "global_step": 97814, "epoch": 2328} {"train_loss": -6.247315406799316, "global_step": 97815, "epoch": 2328} {"train_loss": -6.38450813293457, "global_step": 97816, "epoch": 2328} {"train_loss": -6.314271892820086, "global_step": 97817, "epoch": 2328, "val_loss": 75872.8359375} {"train_loss": -6.390923976898193, "global_step": 97818, "epoch": 2329} {"train_loss": -6.324450492858887, "global_step": 97819, "epoch": 2329} {"train_loss": -6.292109966278076, "global_step": 97820, "epoch": 2329} {"train_loss": -6.252588272094727, "global_step": 97821, "epoch": 2329} {"train_loss": -6.167632102966309, "global_step": 97822, "epoch": 2329} {"train_loss": -6.337371826171875, "global_step": 97823, "epoch": 2329} {"train_loss": -6.327009677886963, "global_step": 97824, "epoch": 2329} {"train_loss": -6.379446029663086, "global_step": 97825, "epoch": 2329} {"train_loss": -6.421540260314941, "global_step": 97826, "epoch": 2329} {"train_loss": -6.38949728012085, "global_step": 97827, "epoch": 2329} {"train_loss": -6.346030235290527, "global_step": 97828, "epoch": 2329} {"train_loss": -6.332874298095703, "global_step": 97829, "epoch": 2329} {"train_loss": -6.332980155944824, "global_step": 97830, "epoch": 2329} {"train_loss": -6.351131916046143, "global_step": 97831, "epoch": 2329} {"train_loss": -6.472780227661133, "global_step": 97832, "epoch": 2329} {"train_loss": -6.361521244049072, "global_step": 97833, "epoch": 2329} {"train_loss": -6.269301414489746, "global_step": 97834, "epoch": 2329} {"train_loss": -6.441976547241211, "global_step": 97835, "epoch": 2329} {"train_loss": -6.384753227233887, "global_step": 97836, "epoch": 2329} {"train_loss": -6.363125801086426, "global_step": 97837, "epoch": 2329} {"train_loss": -6.280743598937988, "global_step": 97838, "epoch": 2329} {"train_loss": -6.340296745300293, "global_step": 97839, "epoch": 2329} {"train_loss": -6.455685138702393, "global_step": 97840, "epoch": 2329} {"train_loss": -6.3563995361328125, "global_step": 97841, "epoch": 2329} {"train_loss": -6.271875858306885, "global_step": 97842, "epoch": 2329} {"train_loss": -6.44779634475708, "global_step": 97843, "epoch": 2329} {"train_loss": -6.2689948081970215, "global_step": 97844, "epoch": 2329} {"train_loss": -6.309103965759277, "global_step": 97845, "epoch": 2329} {"train_loss": -6.311525821685791, "global_step": 97846, "epoch": 2329} {"train_loss": -6.17523193359375, "global_step": 97847, "epoch": 2329} {"train_loss": -6.39806604385376, "global_step": 97848, "epoch": 2329} {"train_loss": -6.17911434173584, "global_step": 97849, "epoch": 2329} {"train_loss": -6.1798624992370605, "global_step": 97850, "epoch": 2329} {"train_loss": -6.470841407775879, "global_step": 97851, "epoch": 2329} {"train_loss": -6.276374816894531, "global_step": 97852, "epoch": 2329} {"train_loss": -6.066997528076172, "global_step": 97853, "epoch": 2329} {"train_loss": -6.302350044250488, "global_step": 97854, "epoch": 2329} {"train_loss": -6.294562339782715, "global_step": 97855, "epoch": 2329} {"train_loss": -6.402216911315918, "global_step": 97856, "epoch": 2329} {"train_loss": -6.19335412979126, "global_step": 97857, "epoch": 2329} {"train_loss": -6.3163838386535645, "global_step": 97858, "epoch": 2329} {"train_loss": -6.322244916643415, "global_step": 97859, "epoch": 2329, "val_loss": 76013.1015625} {"train_loss": -6.260834693908691, "global_step": 97860, "epoch": 2330} {"train_loss": -6.263242244720459, "global_step": 97861, "epoch": 2330} {"train_loss": -6.121431350708008, "global_step": 97862, "epoch": 2330} {"train_loss": -6.205781936645508, "global_step": 97863, "epoch": 2330} {"train_loss": -6.296268463134766, "global_step": 97864, "epoch": 2330} {"train_loss": -6.2516889572143555, "global_step": 97865, "epoch": 2330} {"train_loss": -6.34346866607666, "global_step": 97866, "epoch": 2330} {"train_loss": -6.34013032913208, "global_step": 97867, "epoch": 2330} {"train_loss": -6.297595500946045, "global_step": 97868, "epoch": 2330} {"train_loss": -6.26397705078125, "global_step": 97869, "epoch": 2330} {"train_loss": -6.339535236358643, "global_step": 97870, "epoch": 2330} {"train_loss": -6.306118965148926, "global_step": 97871, "epoch": 2330} {"train_loss": -6.318160057067871, "global_step": 97872, "epoch": 2330} {"train_loss": -6.237948894500732, "global_step": 97873, "epoch": 2330} {"train_loss": -6.356205940246582, "global_step": 97874, "epoch": 2330} {"train_loss": -6.302986145019531, "global_step": 97875, "epoch": 2330} {"train_loss": -6.2337493896484375, "global_step": 97876, "epoch": 2330} {"train_loss": -6.36226749420166, "global_step": 97877, "epoch": 2330} {"train_loss": -6.379614353179932, "global_step": 97878, "epoch": 2330} {"train_loss": -6.31459903717041, "global_step": 97879, "epoch": 2330} {"train_loss": -6.313916206359863, "global_step": 97880, "epoch": 2330} {"train_loss": -6.3249969482421875, "global_step": 97881, "epoch": 2330} {"train_loss": -6.372611045837402, "global_step": 97882, "epoch": 2330} {"train_loss": -6.207520484924316, "global_step": 97883, "epoch": 2330} {"train_loss": -6.341931343078613, "global_step": 97884, "epoch": 2330} {"train_loss": -6.196170806884766, "global_step": 97885, "epoch": 2330} {"train_loss": -6.390590667724609, "global_step": 97886, "epoch": 2330} {"train_loss": -6.189823150634766, "global_step": 97887, "epoch": 2330} {"train_loss": -6.249904632568359, "global_step": 97888, "epoch": 2330} {"train_loss": -6.323705673217773, "global_step": 97889, "epoch": 2330} {"train_loss": -6.329453468322754, "global_step": 97890, "epoch": 2330} {"train_loss": -6.388113021850586, "global_step": 97891, "epoch": 2330} {"train_loss": -6.316948413848877, "global_step": 97892, "epoch": 2330} {"train_loss": -6.316039085388184, "global_step": 97893, "epoch": 2330} {"train_loss": -6.279637336730957, "global_step": 97894, "epoch": 2330} {"train_loss": -6.329634666442871, "global_step": 97895, "epoch": 2330} {"train_loss": -6.348729610443115, "global_step": 97896, "epoch": 2330} {"train_loss": -6.303088188171387, "global_step": 97897, "epoch": 2330} {"train_loss": -6.2623610496521, "global_step": 97898, "epoch": 2330} {"train_loss": -6.153966903686523, "global_step": 97899, "epoch": 2330} {"train_loss": -6.3495683670043945, "global_step": 97900, "epoch": 2330} {"train_loss": -6.29704745610555, "global_step": 97901, "epoch": 2330, "val_loss": 75611.484375} {"train_loss": -6.259821891784668, "global_step": 97902, "epoch": 2331} {"train_loss": -6.339090824127197, "global_step": 97903, "epoch": 2331} {"train_loss": -6.432351112365723, "global_step": 97904, "epoch": 2331} {"train_loss": -6.436649322509766, "global_step": 97905, "epoch": 2331} {"train_loss": -6.444968223571777, "global_step": 97906, "epoch": 2331} {"train_loss": -6.268111228942871, "global_step": 97907, "epoch": 2331} {"train_loss": -6.409832000732422, "global_step": 97908, "epoch": 2331} {"train_loss": -6.301572799682617, "global_step": 97909, "epoch": 2331} {"train_loss": -6.313469886779785, "global_step": 97910, "epoch": 2331} {"train_loss": -6.411667823791504, "global_step": 97911, "epoch": 2331} {"train_loss": -6.324543476104736, "global_step": 97912, "epoch": 2331} {"train_loss": -6.426596641540527, "global_step": 97913, "epoch": 2331} {"train_loss": -6.398022174835205, "global_step": 97914, "epoch": 2331} {"train_loss": -6.4083452224731445, "global_step": 97915, "epoch": 2331} {"train_loss": -6.341618061065674, "global_step": 97916, "epoch": 2331} {"train_loss": -6.26867151260376, "global_step": 97917, "epoch": 2331} {"train_loss": -6.326229572296143, "global_step": 97918, "epoch": 2331} {"train_loss": -6.427097320556641, "global_step": 97919, "epoch": 2331} {"train_loss": -6.376316070556641, "global_step": 97920, "epoch": 2331} {"train_loss": -6.321401119232178, "global_step": 97921, "epoch": 2331} {"train_loss": -6.444363594055176, "global_step": 97922, "epoch": 2331} {"train_loss": -6.26479434967041, "global_step": 97923, "epoch": 2331} {"train_loss": -6.274529457092285, "global_step": 97924, "epoch": 2331} {"train_loss": -6.369186878204346, "global_step": 97925, "epoch": 2331} {"train_loss": -6.285226821899414, "global_step": 97926, "epoch": 2331} {"train_loss": -6.335592269897461, "global_step": 97927, "epoch": 2331} {"train_loss": -6.3013105392456055, "global_step": 97928, "epoch": 2331} {"train_loss": -6.375765800476074, "global_step": 97929, "epoch": 2331} {"train_loss": -6.402314186096191, "global_step": 97930, "epoch": 2331} {"train_loss": -6.414422988891602, "global_step": 97931, "epoch": 2331} {"train_loss": -6.3778181076049805, "global_step": 97932, "epoch": 2331} {"train_loss": -6.367029190063477, "global_step": 97933, "epoch": 2331} {"train_loss": -6.2703986167907715, "global_step": 97934, "epoch": 2331} {"train_loss": -6.381208419799805, "global_step": 97935, "epoch": 2331} {"train_loss": -6.342482089996338, "global_step": 97936, "epoch": 2331} {"train_loss": -6.354813575744629, "global_step": 97937, "epoch": 2331} {"train_loss": -6.23093843460083, "global_step": 97938, "epoch": 2331} {"train_loss": -6.305136680603027, "global_step": 97939, "epoch": 2331} {"train_loss": -6.354208946228027, "global_step": 97940, "epoch": 2331} {"train_loss": -6.326615333557129, "global_step": 97941, "epoch": 2331} {"train_loss": -6.390589237213135, "global_step": 97942, "epoch": 2331} {"train_loss": -6.351405121031261, "global_step": 97943, "epoch": 2331, "val_loss": 75788.8984375} {"train_loss": -6.33979606628418, "global_step": 97944, "epoch": 2332} {"train_loss": -6.2997260093688965, "global_step": 97945, "epoch": 2332} {"train_loss": -6.387997627258301, "global_step": 97946, "epoch": 2332} {"train_loss": -6.321063041687012, "global_step": 97947, "epoch": 2332} {"train_loss": -6.333409786224365, "global_step": 97948, "epoch": 2332} {"train_loss": -6.265064239501953, "global_step": 97949, "epoch": 2332} {"train_loss": -6.435267448425293, "global_step": 97950, "epoch": 2332} {"train_loss": -6.374404430389404, "global_step": 97951, "epoch": 2332} {"train_loss": -6.413268089294434, "global_step": 97952, "epoch": 2332} {"train_loss": -6.411012649536133, "global_step": 97953, "epoch": 2332} {"train_loss": -6.432258129119873, "global_step": 97954, "epoch": 2332} {"train_loss": -6.325735092163086, "global_step": 97955, "epoch": 2332} {"train_loss": -6.399132251739502, "global_step": 97956, "epoch": 2332} {"train_loss": -6.299395561218262, "global_step": 97957, "epoch": 2332} {"train_loss": -6.380032062530518, "global_step": 97958, "epoch": 2332} {"train_loss": -6.392945766448975, "global_step": 97959, "epoch": 2332} {"train_loss": -6.330178737640381, "global_step": 97960, "epoch": 2332} {"train_loss": -6.486515998840332, "global_step": 97961, "epoch": 2332} {"train_loss": -6.382687568664551, "global_step": 97962, "epoch": 2332} {"train_loss": -6.3488569259643555, "global_step": 97963, "epoch": 2332} {"train_loss": -6.301555633544922, "global_step": 97964, "epoch": 2332} {"train_loss": -6.362527847290039, "global_step": 97965, "epoch": 2332} {"train_loss": -6.381589889526367, "global_step": 97966, "epoch": 2332} {"train_loss": -6.34295654296875, "global_step": 97967, "epoch": 2332} {"train_loss": -6.176066875457764, "global_step": 97968, "epoch": 2332} {"train_loss": -6.392640113830566, "global_step": 97969, "epoch": 2332} {"train_loss": -6.1550750732421875, "global_step": 97970, "epoch": 2332} {"train_loss": -6.230159759521484, "global_step": 97971, "epoch": 2332} {"train_loss": -6.336699485778809, "global_step": 97972, "epoch": 2332} {"train_loss": -6.1651201248168945, "global_step": 97973, "epoch": 2332} {"train_loss": -6.27432918548584, "global_step": 97974, "epoch": 2332} {"train_loss": -6.326337814331055, "global_step": 97975, "epoch": 2332} {"train_loss": -6.211580276489258, "global_step": 97976, "epoch": 2332} {"train_loss": -6.291240692138672, "global_step": 97977, "epoch": 2332} {"train_loss": -6.313758850097656, "global_step": 97978, "epoch": 2332} {"train_loss": -6.234432220458984, "global_step": 97979, "epoch": 2332} {"train_loss": -6.262469291687012, "global_step": 97980, "epoch": 2332} {"train_loss": -6.208589553833008, "global_step": 97981, "epoch": 2332} {"train_loss": -6.334206581115723, "global_step": 97982, "epoch": 2332} {"train_loss": -6.287892818450928, "global_step": 97983, "epoch": 2332} {"train_loss": -6.301984786987305, "global_step": 97984, "epoch": 2332} {"train_loss": -6.321828013374692, "global_step": 97985, "epoch": 2332, "val_loss": 75837.3984375} {"train_loss": -6.141450881958008, "global_step": 97986, "epoch": 2333} {"train_loss": -6.294790267944336, "global_step": 97987, "epoch": 2333} {"train_loss": -6.323392868041992, "global_step": 97988, "epoch": 2333} {"train_loss": -6.316177845001221, "global_step": 97989, "epoch": 2333} {"train_loss": -6.414806365966797, "global_step": 97990, "epoch": 2333} {"train_loss": -6.227633476257324, "global_step": 97991, "epoch": 2333} {"train_loss": -6.277064323425293, "global_step": 97992, "epoch": 2333} {"train_loss": -6.433176517486572, "global_step": 97993, "epoch": 2333} {"train_loss": -6.379870414733887, "global_step": 97994, "epoch": 2333} {"train_loss": -6.400835037231445, "global_step": 97995, "epoch": 2333} {"train_loss": -6.354455947875977, "global_step": 97996, "epoch": 2333} {"train_loss": -6.443699836730957, "global_step": 97997, "epoch": 2333} {"train_loss": -6.213596343994141, "global_step": 97998, "epoch": 2333} {"train_loss": -6.337810516357422, "global_step": 97999, "epoch": 2333} {"train_loss": -6.289702892303467, "global_step": 98000, "epoch": 2333} {"train_loss": -6.243040084838867, "global_step": 98001, "epoch": 2333} {"train_loss": -6.378655433654785, "global_step": 98002, "epoch": 2333} {"train_loss": -6.338073253631592, "global_step": 98003, "epoch": 2333} {"train_loss": -6.277668476104736, "global_step": 98004, "epoch": 2333} {"train_loss": -6.264319896697998, "global_step": 98005, "epoch": 2333} {"train_loss": -6.3627214431762695, "global_step": 98006, "epoch": 2333} {"train_loss": -6.271651268005371, "global_step": 98007, "epoch": 2333} {"train_loss": -6.3510847091674805, "global_step": 98008, "epoch": 2333} {"train_loss": -6.237208843231201, "global_step": 98009, "epoch": 2333} {"train_loss": -6.327549934387207, "global_step": 98010, "epoch": 2333} {"train_loss": -6.342990875244141, "global_step": 98011, "epoch": 2333} {"train_loss": -6.314691543579102, "global_step": 98012, "epoch": 2333} {"train_loss": -6.439256191253662, "global_step": 98013, "epoch": 2333} {"train_loss": -6.327735900878906, "global_step": 98014, "epoch": 2333} {"train_loss": -6.233762741088867, "global_step": 98015, "epoch": 2333} {"train_loss": -6.4195661544799805, "global_step": 98016, "epoch": 2333} {"train_loss": -6.24513053894043, "global_step": 98017, "epoch": 2333} {"train_loss": -6.383233070373535, "global_step": 98018, "epoch": 2333} {"train_loss": -6.342920303344727, "global_step": 98019, "epoch": 2333} {"train_loss": -6.279751300811768, "global_step": 98020, "epoch": 2333} {"train_loss": -6.4075212478637695, "global_step": 98021, "epoch": 2333} {"train_loss": -6.326979637145996, "global_step": 98022, "epoch": 2333} {"train_loss": -6.389335632324219, "global_step": 98023, "epoch": 2333} {"train_loss": -6.421333312988281, "global_step": 98024, "epoch": 2333} {"train_loss": -6.391488075256348, "global_step": 98025, "epoch": 2333} {"train_loss": -6.318894386291504, "global_step": 98026, "epoch": 2333} {"train_loss": -6.332714410055251, "global_step": 98027, "epoch": 2333, "val_loss": 75843.9453125} {"train_loss": -6.319777965545654, "global_step": 98028, "epoch": 2334} {"train_loss": -6.398458957672119, "global_step": 98029, "epoch": 2334} {"train_loss": -6.382369041442871, "global_step": 98030, "epoch": 2334} {"train_loss": -6.364439964294434, "global_step": 98031, "epoch": 2334} {"train_loss": -6.385366439819336, "global_step": 98032, "epoch": 2334} {"train_loss": -6.307425498962402, "global_step": 98033, "epoch": 2334} {"train_loss": -6.304100036621094, "global_step": 98034, "epoch": 2334} {"train_loss": -6.460323333740234, "global_step": 98035, "epoch": 2334} {"train_loss": -6.3824543952941895, "global_step": 98036, "epoch": 2334} {"train_loss": -6.522890090942383, "global_step": 98037, "epoch": 2334} {"train_loss": -6.330859184265137, "global_step": 98038, "epoch": 2334} {"train_loss": -6.251114845275879, "global_step": 98039, "epoch": 2334} {"train_loss": -6.384391784667969, "global_step": 98040, "epoch": 2334} {"train_loss": -6.3188796043396, "global_step": 98041, "epoch": 2334} {"train_loss": -6.401234149932861, "global_step": 98042, "epoch": 2334} {"train_loss": -6.216287136077881, "global_step": 98043, "epoch": 2334} {"train_loss": -6.37578821182251, "global_step": 98044, "epoch": 2334} {"train_loss": -6.392366409301758, "global_step": 98045, "epoch": 2334} {"train_loss": -6.2960968017578125, "global_step": 98046, "epoch": 2334} {"train_loss": -6.334423542022705, "global_step": 98047, "epoch": 2334} {"train_loss": -6.316200256347656, "global_step": 98048, "epoch": 2334} {"train_loss": -6.301007270812988, "global_step": 98049, "epoch": 2334} {"train_loss": -6.399463653564453, "global_step": 98050, "epoch": 2334} {"train_loss": -6.371971130371094, "global_step": 98051, "epoch": 2334} {"train_loss": -6.362128257751465, "global_step": 98052, "epoch": 2334} {"train_loss": -6.366053581237793, "global_step": 98053, "epoch": 2334} {"train_loss": -6.394444942474365, "global_step": 98054, "epoch": 2334} {"train_loss": -6.314939975738525, "global_step": 98055, "epoch": 2334} {"train_loss": -6.421886444091797, "global_step": 98056, "epoch": 2334} {"train_loss": -6.337708473205566, "global_step": 98057, "epoch": 2334} {"train_loss": -6.358956813812256, "global_step": 98058, "epoch": 2334} {"train_loss": -6.377132892608643, "global_step": 98059, "epoch": 2334} {"train_loss": -6.331951141357422, "global_step": 98060, "epoch": 2334} {"train_loss": -6.378225326538086, "global_step": 98061, "epoch": 2334} {"train_loss": -6.340387344360352, "global_step": 98062, "epoch": 2334} {"train_loss": -6.398351669311523, "global_step": 98063, "epoch": 2334} {"train_loss": -6.257065773010254, "global_step": 98064, "epoch": 2334} {"train_loss": -6.40237283706665, "global_step": 98065, "epoch": 2334} {"train_loss": -6.240798473358154, "global_step": 98066, "epoch": 2334} {"train_loss": -6.37332820892334, "global_step": 98067, "epoch": 2334} {"train_loss": -6.3545732498168945, "global_step": 98068, "epoch": 2334} {"train_loss": -6.353865419115339, "global_step": 98069, "epoch": 2334, "val_loss": 75661.2890625} {"train_loss": -6.296233177185059, "global_step": 98070, "epoch": 2335} {"train_loss": -6.331751823425293, "global_step": 98071, "epoch": 2335} {"train_loss": -6.4344611167907715, "global_step": 98072, "epoch": 2335} {"train_loss": -6.3833770751953125, "global_step": 98073, "epoch": 2335} {"train_loss": -6.3430094718933105, "global_step": 98074, "epoch": 2335} {"train_loss": -6.457982063293457, "global_step": 98075, "epoch": 2335} {"train_loss": -6.325277328491211, "global_step": 98076, "epoch": 2335} {"train_loss": -6.359194755554199, "global_step": 98077, "epoch": 2335} {"train_loss": -6.4087724685668945, "global_step": 98078, "epoch": 2335} {"train_loss": -6.445000171661377, "global_step": 98079, "epoch": 2335} {"train_loss": -6.454936981201172, "global_step": 98080, "epoch": 2335} {"train_loss": -6.399725437164307, "global_step": 98081, "epoch": 2335} {"train_loss": -6.342432022094727, "global_step": 98082, "epoch": 2335} {"train_loss": -6.373815059661865, "global_step": 98083, "epoch": 2335} {"train_loss": -6.506901741027832, "global_step": 98084, "epoch": 2335} {"train_loss": -6.409389019012451, "global_step": 98085, "epoch": 2335} {"train_loss": -6.4986443519592285, "global_step": 98086, "epoch": 2335} {"train_loss": -6.466076850891113, "global_step": 98087, "epoch": 2335} {"train_loss": -6.3238654136657715, "global_step": 98088, "epoch": 2335} {"train_loss": -6.281332015991211, "global_step": 98089, "epoch": 2335} {"train_loss": -6.3617377281188965, "global_step": 98090, "epoch": 2335} {"train_loss": -6.3156046867370605, "global_step": 98091, "epoch": 2335} {"train_loss": -6.2890520095825195, "global_step": 98092, "epoch": 2335} {"train_loss": -6.436887264251709, "global_step": 98093, "epoch": 2335} {"train_loss": -6.368844032287598, "global_step": 98094, "epoch": 2335} {"train_loss": -6.306257724761963, "global_step": 98095, "epoch": 2335} {"train_loss": -6.3585968017578125, "global_step": 98096, "epoch": 2335} {"train_loss": -6.3491926193237305, "global_step": 98097, "epoch": 2335} {"train_loss": -6.321172714233398, "global_step": 98098, "epoch": 2335} {"train_loss": -6.428153991699219, "global_step": 98099, "epoch": 2335} {"train_loss": -6.342916965484619, "global_step": 98100, "epoch": 2335} {"train_loss": -6.276318550109863, "global_step": 98101, "epoch": 2335} {"train_loss": -6.423779010772705, "global_step": 98102, "epoch": 2335} {"train_loss": -6.20971155166626, "global_step": 98103, "epoch": 2335} {"train_loss": -6.179029941558838, "global_step": 98104, "epoch": 2335} {"train_loss": -6.379136562347412, "global_step": 98105, "epoch": 2335} {"train_loss": -6.218079566955566, "global_step": 98106, "epoch": 2335} {"train_loss": -6.370483875274658, "global_step": 98107, "epoch": 2335} {"train_loss": -6.378329753875732, "global_step": 98108, "epoch": 2335} {"train_loss": -6.271951198577881, "global_step": 98109, "epoch": 2335} {"train_loss": -6.283551216125488, "global_step": 98110, "epoch": 2335} {"train_loss": -6.359679210753668, "global_step": 98111, "epoch": 2335, "val_loss": 75690.1640625} {"train_loss": -6.387999057769775, "global_step": 98112, "epoch": 2336} {"train_loss": -6.383171081542969, "global_step": 98113, "epoch": 2336} {"train_loss": -6.330845832824707, "global_step": 98114, "epoch": 2336} {"train_loss": -6.184259414672852, "global_step": 98115, "epoch": 2336} {"train_loss": -6.320890426635742, "global_step": 98116, "epoch": 2336} {"train_loss": -6.472146034240723, "global_step": 98117, "epoch": 2336} {"train_loss": -6.407917022705078, "global_step": 98118, "epoch": 2336} {"train_loss": -6.352132320404053, "global_step": 98119, "epoch": 2336} {"train_loss": -6.355513095855713, "global_step": 98120, "epoch": 2336} {"train_loss": -6.33567476272583, "global_step": 98121, "epoch": 2336} {"train_loss": -6.4072675704956055, "global_step": 98122, "epoch": 2336} {"train_loss": -6.409782886505127, "global_step": 98123, "epoch": 2336} {"train_loss": -6.43924617767334, "global_step": 98124, "epoch": 2336} {"train_loss": -6.426938533782959, "global_step": 98125, "epoch": 2336} {"train_loss": -6.312524795532227, "global_step": 98126, "epoch": 2336} {"train_loss": -6.377708911895752, "global_step": 98127, "epoch": 2336} {"train_loss": -6.326092720031738, "global_step": 98128, "epoch": 2336} {"train_loss": -6.371938228607178, "global_step": 98129, "epoch": 2336} {"train_loss": -6.4244537353515625, "global_step": 98130, "epoch": 2336} {"train_loss": -6.401803970336914, "global_step": 98131, "epoch": 2336} {"train_loss": -6.431397438049316, "global_step": 98132, "epoch": 2336} {"train_loss": -6.48209285736084, "global_step": 98133, "epoch": 2336} {"train_loss": -6.223738670349121, "global_step": 98134, "epoch": 2336} {"train_loss": -6.306976318359375, "global_step": 98135, "epoch": 2336} {"train_loss": -6.489476680755615, "global_step": 98136, "epoch": 2336} {"train_loss": -6.400093078613281, "global_step": 98137, "epoch": 2336} {"train_loss": -6.265756130218506, "global_step": 98138, "epoch": 2336} {"train_loss": -6.368535995483398, "global_step": 98139, "epoch": 2336} {"train_loss": -6.4280686378479, "global_step": 98140, "epoch": 2336} {"train_loss": -6.291945934295654, "global_step": 98141, "epoch": 2336} {"train_loss": -6.342442989349365, "global_step": 98142, "epoch": 2336} {"train_loss": -6.270174026489258, "global_step": 98143, "epoch": 2336} {"train_loss": -6.397110939025879, "global_step": 98144, "epoch": 2336} {"train_loss": -6.324507713317871, "global_step": 98145, "epoch": 2336} {"train_loss": -6.4063334465026855, "global_step": 98146, "epoch": 2336} {"train_loss": -6.315512180328369, "global_step": 98147, "epoch": 2336} {"train_loss": -6.401433944702148, "global_step": 98148, "epoch": 2336} {"train_loss": -6.338356018066406, "global_step": 98149, "epoch": 2336} {"train_loss": -6.323360919952393, "global_step": 98150, "epoch": 2336} {"train_loss": -6.257004737854004, "global_step": 98151, "epoch": 2336} {"train_loss": -6.216432571411133, "global_step": 98152, "epoch": 2336} {"train_loss": -6.355985380354381, "global_step": 98153, "epoch": 2336, "val_loss": 75726.3046875} {"train_loss": -6.227288246154785, "global_step": 98154, "epoch": 2337} {"train_loss": -6.298232555389404, "global_step": 98155, "epoch": 2337} {"train_loss": -6.281060218811035, "global_step": 98156, "epoch": 2337} {"train_loss": -6.389443874359131, "global_step": 98157, "epoch": 2337} {"train_loss": -6.366611003875732, "global_step": 98158, "epoch": 2337} {"train_loss": -6.279970169067383, "global_step": 98159, "epoch": 2337} {"train_loss": -6.314322471618652, "global_step": 98160, "epoch": 2337} {"train_loss": -6.286070823669434, "global_step": 98161, "epoch": 2337} {"train_loss": -6.340734958648682, "global_step": 98162, "epoch": 2337} {"train_loss": -6.372112274169922, "global_step": 98163, "epoch": 2337} {"train_loss": -6.344869613647461, "global_step": 98164, "epoch": 2337} {"train_loss": -6.394028663635254, "global_step": 98165, "epoch": 2337} {"train_loss": -6.228641510009766, "global_step": 98166, "epoch": 2337} {"train_loss": -6.296574115753174, "global_step": 98167, "epoch": 2337} {"train_loss": -6.335506439208984, "global_step": 98168, "epoch": 2337} {"train_loss": -6.3744425773620605, "global_step": 98169, "epoch": 2337} {"train_loss": -6.324153900146484, "global_step": 98170, "epoch": 2337} {"train_loss": -6.365650177001953, "global_step": 98171, "epoch": 2337} {"train_loss": -6.4031195640563965, "global_step": 98172, "epoch": 2337} {"train_loss": -6.323780059814453, "global_step": 98173, "epoch": 2337} {"train_loss": -6.365853786468506, "global_step": 98174, "epoch": 2337} {"train_loss": -6.309683322906494, "global_step": 98175, "epoch": 2337} {"train_loss": -6.418140411376953, "global_step": 98176, "epoch": 2337} {"train_loss": -6.287432670593262, "global_step": 98177, "epoch": 2337} {"train_loss": -6.283596038818359, "global_step": 98178, "epoch": 2337} {"train_loss": -6.374781608581543, "global_step": 98179, "epoch": 2337} {"train_loss": -6.464573860168457, "global_step": 98180, "epoch": 2337} {"train_loss": -6.257473945617676, "global_step": 98181, "epoch": 2337} {"train_loss": -6.294625282287598, "global_step": 98182, "epoch": 2337} {"train_loss": -6.337419509887695, "global_step": 98183, "epoch": 2337} {"train_loss": -6.235819339752197, "global_step": 98184, "epoch": 2337} {"train_loss": -6.354531288146973, "global_step": 98185, "epoch": 2337} {"train_loss": -6.334676742553711, "global_step": 98186, "epoch": 2337} {"train_loss": -6.37108039855957, "global_step": 98187, "epoch": 2337} {"train_loss": -6.2896904945373535, "global_step": 98188, "epoch": 2337} {"train_loss": -6.384883403778076, "global_step": 98189, "epoch": 2337} {"train_loss": -6.402839660644531, "global_step": 98190, "epoch": 2337} {"train_loss": -6.327997207641602, "global_step": 98191, "epoch": 2337} {"train_loss": -6.48880672454834, "global_step": 98192, "epoch": 2337} {"train_loss": -6.278522491455078, "global_step": 98193, "epoch": 2337} {"train_loss": -6.438817977905273, "global_step": 98194, "epoch": 2337} {"train_loss": -6.336990299678984, "global_step": 98195, "epoch": 2337, "val_loss": 75551.578125} {"train_loss": -6.313190937042236, "global_step": 98196, "epoch": 2338} {"train_loss": -6.395427703857422, "global_step": 98197, "epoch": 2338} {"train_loss": -6.3272600173950195, "global_step": 98198, "epoch": 2338} {"train_loss": -6.329293251037598, "global_step": 98199, "epoch": 2338} {"train_loss": -6.299955368041992, "global_step": 98200, "epoch": 2338} {"train_loss": -6.275519371032715, "global_step": 98201, "epoch": 2338} {"train_loss": -6.3102922439575195, "global_step": 98202, "epoch": 2338} {"train_loss": -6.269209861755371, "global_step": 98203, "epoch": 2338} {"train_loss": -6.393813610076904, "global_step": 98204, "epoch": 2338} {"train_loss": -6.374801158905029, "global_step": 98205, "epoch": 2338} {"train_loss": -6.312298774719238, "global_step": 98206, "epoch": 2338} {"train_loss": -6.35157585144043, "global_step": 98207, "epoch": 2338} {"train_loss": -6.392786979675293, "global_step": 98208, "epoch": 2338} {"train_loss": -6.278913497924805, "global_step": 98209, "epoch": 2338} {"train_loss": -6.378878593444824, "global_step": 98210, "epoch": 2338} {"train_loss": -6.343223571777344, "global_step": 98211, "epoch": 2338} {"train_loss": -6.248723983764648, "global_step": 98212, "epoch": 2338} {"train_loss": -6.361757278442383, "global_step": 98213, "epoch": 2338} {"train_loss": -6.377834320068359, "global_step": 98214, "epoch": 2338} {"train_loss": -6.324586868286133, "global_step": 98215, "epoch": 2338} {"train_loss": -6.2106781005859375, "global_step": 98216, "epoch": 2338} {"train_loss": -6.48964262008667, "global_step": 98217, "epoch": 2338} {"train_loss": -6.331997394561768, "global_step": 98218, "epoch": 2338} {"train_loss": -6.2446184158325195, "global_step": 98219, "epoch": 2338} {"train_loss": -6.312314033508301, "global_step": 98220, "epoch": 2338} {"train_loss": -6.227412223815918, "global_step": 98221, "epoch": 2338} {"train_loss": -6.292032241821289, "global_step": 98222, "epoch": 2338} {"train_loss": -6.259214401245117, "global_step": 98223, "epoch": 2338} {"train_loss": -6.3108320236206055, "global_step": 98224, "epoch": 2338} {"train_loss": -6.368094444274902, "global_step": 98225, "epoch": 2338} {"train_loss": -6.1716508865356445, "global_step": 98226, "epoch": 2338} {"train_loss": -6.3359785079956055, "global_step": 98227, "epoch": 2338} {"train_loss": -6.336789608001709, "global_step": 98228, "epoch": 2338} {"train_loss": -6.2583513259887695, "global_step": 98229, "epoch": 2338} {"train_loss": -6.317398548126221, "global_step": 98230, "epoch": 2338} {"train_loss": -6.341542720794678, "global_step": 98231, "epoch": 2338} {"train_loss": -6.270562648773193, "global_step": 98232, "epoch": 2338} {"train_loss": -6.382019519805908, "global_step": 98233, "epoch": 2338} {"train_loss": -6.450875282287598, "global_step": 98234, "epoch": 2338} {"train_loss": -6.317533493041992, "global_step": 98235, "epoch": 2338} {"train_loss": -6.351499557495117, "global_step": 98236, "epoch": 2338} {"train_loss": -6.322873070126488, "global_step": 98237, "epoch": 2338, "val_loss": 75842.4140625} {"train_loss": -6.315494060516357, "global_step": 98238, "epoch": 2339} {"train_loss": -6.363155841827393, "global_step": 98239, "epoch": 2339} {"train_loss": -6.227667808532715, "global_step": 98240, "epoch": 2339} {"train_loss": -6.393964767456055, "global_step": 98241, "epoch": 2339} {"train_loss": -6.4006266593933105, "global_step": 98242, "epoch": 2339} {"train_loss": -6.313385009765625, "global_step": 98243, "epoch": 2339} {"train_loss": -6.316555500030518, "global_step": 98244, "epoch": 2339} {"train_loss": -6.376265525817871, "global_step": 98245, "epoch": 2339} {"train_loss": -6.343863010406494, "global_step": 98246, "epoch": 2339} {"train_loss": -6.364287853240967, "global_step": 98247, "epoch": 2339} {"train_loss": -6.311829566955566, "global_step": 98248, "epoch": 2339} {"train_loss": -6.326859474182129, "global_step": 98249, "epoch": 2339} {"train_loss": -6.35362434387207, "global_step": 98250, "epoch": 2339} {"train_loss": -6.386865139007568, "global_step": 98251, "epoch": 2339} {"train_loss": -6.286751747131348, "global_step": 98252, "epoch": 2339} {"train_loss": -6.375, "global_step": 98253, "epoch": 2339} {"train_loss": -6.30767297744751, "global_step": 98254, "epoch": 2339} {"train_loss": -6.399869918823242, "global_step": 98255, "epoch": 2339} {"train_loss": -6.299679756164551, "global_step": 98256, "epoch": 2339} {"train_loss": -6.314433574676514, "global_step": 98257, "epoch": 2339} {"train_loss": -6.326663970947266, "global_step": 98258, "epoch": 2339} {"train_loss": -6.323105335235596, "global_step": 98259, "epoch": 2339} {"train_loss": -6.375171184539795, "global_step": 98260, "epoch": 2339} {"train_loss": -6.30857515335083, "global_step": 98261, "epoch": 2339} {"train_loss": -6.363112449645996, "global_step": 98262, "epoch": 2339} {"train_loss": -6.417935371398926, "global_step": 98263, "epoch": 2339} {"train_loss": -6.266356945037842, "global_step": 98264, "epoch": 2339} {"train_loss": -6.342061996459961, "global_step": 98265, "epoch": 2339} {"train_loss": -6.468626976013184, "global_step": 98266, "epoch": 2339} {"train_loss": -6.337207794189453, "global_step": 98267, "epoch": 2339} {"train_loss": -6.365710735321045, "global_step": 98268, "epoch": 2339} {"train_loss": -6.4110822677612305, "global_step": 98269, "epoch": 2339} {"train_loss": -6.300475120544434, "global_step": 98270, "epoch": 2339} {"train_loss": -6.38090705871582, "global_step": 98271, "epoch": 2339} {"train_loss": -6.351382255554199, "global_step": 98272, "epoch": 2339} {"train_loss": -6.348846435546875, "global_step": 98273, "epoch": 2339} {"train_loss": -6.276784896850586, "global_step": 98274, "epoch": 2339} {"train_loss": -6.364593505859375, "global_step": 98275, "epoch": 2339} {"train_loss": -6.281764984130859, "global_step": 98276, "epoch": 2339} {"train_loss": -6.2998433113098145, "global_step": 98277, "epoch": 2339} {"train_loss": -6.281883716583252, "global_step": 98278, "epoch": 2339} {"train_loss": -6.342419011252267, "global_step": 98279, "epoch": 2339, "val_loss": 75628.5703125} {"train_loss": -6.308830261230469, "global_step": 98280, "epoch": 2340} {"train_loss": -6.3573832511901855, "global_step": 98281, "epoch": 2340} {"train_loss": -6.394713401794434, "global_step": 98282, "epoch": 2340} {"train_loss": -6.263466835021973, "global_step": 98283, "epoch": 2340} {"train_loss": -6.3424072265625, "global_step": 98284, "epoch": 2340} {"train_loss": -6.4258928298950195, "global_step": 98285, "epoch": 2340} {"train_loss": -6.274209022521973, "global_step": 98286, "epoch": 2340} {"train_loss": -6.281083583831787, "global_step": 98287, "epoch": 2340} {"train_loss": -6.3831377029418945, "global_step": 98288, "epoch": 2340} {"train_loss": -6.3131890296936035, "global_step": 98289, "epoch": 2340} {"train_loss": -6.44892692565918, "global_step": 98290, "epoch": 2340} {"train_loss": -6.389699935913086, "global_step": 98291, "epoch": 2340} {"train_loss": -6.4009809494018555, "global_step": 98292, "epoch": 2340} {"train_loss": -6.300863742828369, "global_step": 98293, "epoch": 2340} {"train_loss": -6.343931674957275, "global_step": 98294, "epoch": 2340} {"train_loss": -6.257765769958496, "global_step": 98295, "epoch": 2340} {"train_loss": -6.385639190673828, "global_step": 98296, "epoch": 2340} {"train_loss": -6.34544038772583, "global_step": 98297, "epoch": 2340} {"train_loss": -6.419109344482422, "global_step": 98298, "epoch": 2340} {"train_loss": -6.359771728515625, "global_step": 98299, "epoch": 2340} {"train_loss": -6.350039958953857, "global_step": 98300, "epoch": 2340} {"train_loss": -6.278356552124023, "global_step": 98301, "epoch": 2340} {"train_loss": -6.319540023803711, "global_step": 98302, "epoch": 2340} {"train_loss": -6.277512073516846, "global_step": 98303, "epoch": 2340} {"train_loss": -6.401011943817139, "global_step": 98304, "epoch": 2340} {"train_loss": -6.321140766143799, "global_step": 98305, "epoch": 2340} {"train_loss": -6.392753601074219, "global_step": 98306, "epoch": 2340} {"train_loss": -6.406764507293701, "global_step": 98307, "epoch": 2340} {"train_loss": -6.370349884033203, "global_step": 98308, "epoch": 2340} {"train_loss": -6.182822227478027, "global_step": 98309, "epoch": 2340} {"train_loss": -6.430550575256348, "global_step": 98310, "epoch": 2340} {"train_loss": -6.358666896820068, "global_step": 98311, "epoch": 2340} {"train_loss": -6.266158103942871, "global_step": 98312, "epoch": 2340} {"train_loss": -6.260200500488281, "global_step": 98313, "epoch": 2340} {"train_loss": -6.3282060623168945, "global_step": 98314, "epoch": 2340} {"train_loss": -6.310628890991211, "global_step": 98315, "epoch": 2340} {"train_loss": -6.334649085998535, "global_step": 98316, "epoch": 2340} {"train_loss": -6.334175109863281, "global_step": 98317, "epoch": 2340} {"train_loss": -6.3420000076293945, "global_step": 98318, "epoch": 2340} {"train_loss": -6.167209625244141, "global_step": 98319, "epoch": 2340} {"train_loss": -6.230686664581299, "global_step": 98320, "epoch": 2340} {"train_loss": -6.330777872176397, "global_step": 98321, "epoch": 2340, "val_loss": 75442.796875} {"train_loss": -6.239284515380859, "global_step": 98322, "epoch": 2341} {"train_loss": -6.307474136352539, "global_step": 98323, "epoch": 2341} {"train_loss": -6.29612922668457, "global_step": 98324, "epoch": 2341} {"train_loss": -6.27714729309082, "global_step": 98325, "epoch": 2341} {"train_loss": -6.3262715339660645, "global_step": 98326, "epoch": 2341} {"train_loss": -6.302823066711426, "global_step": 98327, "epoch": 2341} {"train_loss": -6.22331428527832, "global_step": 98328, "epoch": 2341} {"train_loss": -6.339047431945801, "global_step": 98329, "epoch": 2341} {"train_loss": -6.386131763458252, "global_step": 98330, "epoch": 2341} {"train_loss": -6.327763557434082, "global_step": 98331, "epoch": 2341} {"train_loss": -6.164304733276367, "global_step": 98332, "epoch": 2341} {"train_loss": -6.279654502868652, "global_step": 98333, "epoch": 2341} {"train_loss": -6.302179336547852, "global_step": 98334, "epoch": 2341} {"train_loss": -6.265413284301758, "global_step": 98335, "epoch": 2341} {"train_loss": -6.232836723327637, "global_step": 98336, "epoch": 2341} {"train_loss": -6.22836971282959, "global_step": 98337, "epoch": 2341} {"train_loss": -6.363560676574707, "global_step": 98338, "epoch": 2341} {"train_loss": -6.20928430557251, "global_step": 98339, "epoch": 2341} {"train_loss": -6.288909912109375, "global_step": 98340, "epoch": 2341} {"train_loss": -6.237107276916504, "global_step": 98341, "epoch": 2341} {"train_loss": -6.306612968444824, "global_step": 98342, "epoch": 2341} {"train_loss": -6.351688385009766, "global_step": 98343, "epoch": 2341} {"train_loss": -6.285024642944336, "global_step": 98344, "epoch": 2341} {"train_loss": -6.364187717437744, "global_step": 98345, "epoch": 2341} {"train_loss": -6.302469730377197, "global_step": 98346, "epoch": 2341} {"train_loss": -6.269899845123291, "global_step": 98347, "epoch": 2341} {"train_loss": -6.277173042297363, "global_step": 98348, "epoch": 2341} {"train_loss": -6.3975934982299805, "global_step": 98349, "epoch": 2341} {"train_loss": -6.229548454284668, "global_step": 98350, "epoch": 2341} {"train_loss": -6.4090399742126465, "global_step": 98351, "epoch": 2341} {"train_loss": -6.445047378540039, "global_step": 98352, "epoch": 2341} {"train_loss": -6.361908912658691, "global_step": 98353, "epoch": 2341} {"train_loss": -6.4444260597229, "global_step": 98354, "epoch": 2341} {"train_loss": -6.275688171386719, "global_step": 98355, "epoch": 2341} {"train_loss": -6.285562515258789, "global_step": 98356, "epoch": 2341} {"train_loss": -6.360558986663818, "global_step": 98357, "epoch": 2341} {"train_loss": -6.41108512878418, "global_step": 98358, "epoch": 2341} {"train_loss": -6.387517929077148, "global_step": 98359, "epoch": 2341} {"train_loss": -6.380455017089844, "global_step": 98360, "epoch": 2341} {"train_loss": -6.275032997131348, "global_step": 98361, "epoch": 2341} {"train_loss": -6.309512138366699, "global_step": 98362, "epoch": 2341} {"train_loss": -6.311750173568726, "global_step": 98363, "epoch": 2341, "val_loss": 75621.515625} {"train_loss": -6.318739891052246, "global_step": 98364, "epoch": 2342} {"train_loss": -6.384696006774902, "global_step": 98365, "epoch": 2342} {"train_loss": -6.398522853851318, "global_step": 98366, "epoch": 2342} {"train_loss": -6.407951354980469, "global_step": 98367, "epoch": 2342} {"train_loss": -6.27495002746582, "global_step": 98368, "epoch": 2342} {"train_loss": -6.181716442108154, "global_step": 98369, "epoch": 2342} {"train_loss": -6.3362016677856445, "global_step": 98370, "epoch": 2342} {"train_loss": -6.1983842849731445, "global_step": 98371, "epoch": 2342} {"train_loss": -6.38092041015625, "global_step": 98372, "epoch": 2342} {"train_loss": -6.316096782684326, "global_step": 98373, "epoch": 2342} {"train_loss": -6.2248005867004395, "global_step": 98374, "epoch": 2342} {"train_loss": -6.426359176635742, "global_step": 98375, "epoch": 2342} {"train_loss": -6.3775482177734375, "global_step": 98376, "epoch": 2342} {"train_loss": -6.320652961730957, "global_step": 98377, "epoch": 2342} {"train_loss": -6.234626770019531, "global_step": 98378, "epoch": 2342} {"train_loss": -6.219831943511963, "global_step": 98379, "epoch": 2342} {"train_loss": -6.24442195892334, "global_step": 98380, "epoch": 2342} {"train_loss": -6.321516990661621, "global_step": 98381, "epoch": 2342} {"train_loss": -6.374950408935547, "global_step": 98382, "epoch": 2342} {"train_loss": -6.434041976928711, "global_step": 98383, "epoch": 2342} {"train_loss": -6.265891075134277, "global_step": 98384, "epoch": 2342} {"train_loss": -6.4068403244018555, "global_step": 98385, "epoch": 2342} {"train_loss": -6.383121490478516, "global_step": 98386, "epoch": 2342} {"train_loss": -6.449261665344238, "global_step": 98387, "epoch": 2342} {"train_loss": -6.397299766540527, "global_step": 98388, "epoch": 2342} {"train_loss": -6.2660746574401855, "global_step": 98389, "epoch": 2342} {"train_loss": -6.298933029174805, "global_step": 98390, "epoch": 2342} {"train_loss": -6.291940689086914, "global_step": 98391, "epoch": 2342} {"train_loss": -6.3546953201293945, "global_step": 98392, "epoch": 2342} {"train_loss": -6.339082717895508, "global_step": 98393, "epoch": 2342} {"train_loss": -6.342180252075195, "global_step": 98394, "epoch": 2342} {"train_loss": -6.303952693939209, "global_step": 98395, "epoch": 2342} {"train_loss": -6.369657516479492, "global_step": 98396, "epoch": 2342} {"train_loss": -6.318421363830566, "global_step": 98397, "epoch": 2342} {"train_loss": -6.348891258239746, "global_step": 98398, "epoch": 2342} {"train_loss": -6.347663879394531, "global_step": 98399, "epoch": 2342} {"train_loss": -6.540515422821045, "global_step": 98400, "epoch": 2342} {"train_loss": -6.436192512512207, "global_step": 98401, "epoch": 2342} {"train_loss": -6.385558128356934, "global_step": 98402, "epoch": 2342} {"train_loss": -6.277467727661133, "global_step": 98403, "epoch": 2342} {"train_loss": -6.331451892852783, "global_step": 98404, "epoch": 2342} {"train_loss": -6.336741776693435, "global_step": 98405, "epoch": 2342, "val_loss": 75832.734375} {"train_loss": -6.49234676361084, "global_step": 98406, "epoch": 2343} {"train_loss": -6.331695079803467, "global_step": 98407, "epoch": 2343} {"train_loss": -6.376049995422363, "global_step": 98408, "epoch": 2343} {"train_loss": -6.313698768615723, "global_step": 98409, "epoch": 2343} {"train_loss": -6.289902687072754, "global_step": 98410, "epoch": 2343} {"train_loss": -6.363581657409668, "global_step": 98411, "epoch": 2343} {"train_loss": -6.368401527404785, "global_step": 98412, "epoch": 2343} {"train_loss": -6.38978385925293, "global_step": 98413, "epoch": 2343} {"train_loss": -6.381150245666504, "global_step": 98414, "epoch": 2343} {"train_loss": -6.264871597290039, "global_step": 98415, "epoch": 2343} {"train_loss": -6.303502082824707, "global_step": 98416, "epoch": 2343} {"train_loss": -6.291585922241211, "global_step": 98417, "epoch": 2343} {"train_loss": -6.33618688583374, "global_step": 98418, "epoch": 2343} {"train_loss": -6.49418830871582, "global_step": 98419, "epoch": 2343} {"train_loss": -6.25340461730957, "global_step": 98420, "epoch": 2343} {"train_loss": -6.347068786621094, "global_step": 98421, "epoch": 2343} {"train_loss": -6.38079309463501, "global_step": 98422, "epoch": 2343} {"train_loss": -6.302132606506348, "global_step": 98423, "epoch": 2343} {"train_loss": -6.335420608520508, "global_step": 98424, "epoch": 2343} {"train_loss": -6.337950229644775, "global_step": 98425, "epoch": 2343} {"train_loss": -6.327789306640625, "global_step": 98426, "epoch": 2343} {"train_loss": -6.360805511474609, "global_step": 98427, "epoch": 2343} {"train_loss": -6.331442356109619, "global_step": 98428, "epoch": 2343} {"train_loss": -6.367684364318848, "global_step": 98429, "epoch": 2343} {"train_loss": -6.292860507965088, "global_step": 98430, "epoch": 2343} {"train_loss": -6.408830642700195, "global_step": 98431, "epoch": 2343} {"train_loss": -6.402792930603027, "global_step": 98432, "epoch": 2343} {"train_loss": -6.444193363189697, "global_step": 98433, "epoch": 2343} {"train_loss": -6.344884872436523, "global_step": 98434, "epoch": 2343} {"train_loss": -6.297776699066162, "global_step": 98435, "epoch": 2343} {"train_loss": -6.270230770111084, "global_step": 98436, "epoch": 2343} {"train_loss": -6.326605319976807, "global_step": 98437, "epoch": 2343} {"train_loss": -6.315160751342773, "global_step": 98438, "epoch": 2343} {"train_loss": -6.409161567687988, "global_step": 98439, "epoch": 2343} {"train_loss": -6.346226215362549, "global_step": 98440, "epoch": 2343} {"train_loss": -6.461824417114258, "global_step": 98441, "epoch": 2343} {"train_loss": -6.245901107788086, "global_step": 98442, "epoch": 2343} {"train_loss": -6.312552452087402, "global_step": 98443, "epoch": 2343} {"train_loss": -6.3760528564453125, "global_step": 98444, "epoch": 2343} {"train_loss": -6.404209136962891, "global_step": 98445, "epoch": 2343} {"train_loss": -6.294387340545654, "global_step": 98446, "epoch": 2343} {"train_loss": -6.348655337379093, "global_step": 98447, "epoch": 2343, "val_loss": 75614.640625} {"train_loss": -6.30840539932251, "global_step": 98448, "epoch": 2344} {"train_loss": -6.235883712768555, "global_step": 98449, "epoch": 2344} {"train_loss": -6.3099846839904785, "global_step": 98450, "epoch": 2344} {"train_loss": -6.423586368560791, "global_step": 98451, "epoch": 2344} {"train_loss": -6.367213249206543, "global_step": 98452, "epoch": 2344} {"train_loss": -6.362452030181885, "global_step": 98453, "epoch": 2344} {"train_loss": -6.302252769470215, "global_step": 98454, "epoch": 2344} {"train_loss": -6.406225204467773, "global_step": 98455, "epoch": 2344} {"train_loss": -6.32840633392334, "global_step": 98456, "epoch": 2344} {"train_loss": -6.540082931518555, "global_step": 98457, "epoch": 2344} {"train_loss": -6.3160014152526855, "global_step": 98458, "epoch": 2344} {"train_loss": -6.348775863647461, "global_step": 98459, "epoch": 2344} {"train_loss": -6.534861087799072, "global_step": 98460, "epoch": 2344} {"train_loss": -6.465041160583496, "global_step": 98461, "epoch": 2344} {"train_loss": -6.316784858703613, "global_step": 98462, "epoch": 2344} {"train_loss": -6.475074768066406, "global_step": 98463, "epoch": 2344} {"train_loss": -6.42362117767334, "global_step": 98464, "epoch": 2344} {"train_loss": -6.400310516357422, "global_step": 98465, "epoch": 2344} {"train_loss": -6.348970413208008, "global_step": 98466, "epoch": 2344} {"train_loss": -6.294933319091797, "global_step": 98467, "epoch": 2344} {"train_loss": -6.262703895568848, "global_step": 98468, "epoch": 2344} {"train_loss": -6.452253818511963, "global_step": 98469, "epoch": 2344} {"train_loss": -6.421910762786865, "global_step": 98470, "epoch": 2344} {"train_loss": -6.294827461242676, "global_step": 98471, "epoch": 2344} {"train_loss": -6.390657901763916, "global_step": 98472, "epoch": 2344} {"train_loss": -6.450699806213379, "global_step": 98473, "epoch": 2344} {"train_loss": -6.397966384887695, "global_step": 98474, "epoch": 2344} {"train_loss": -6.3273210525512695, "global_step": 98475, "epoch": 2344} {"train_loss": -6.426345348358154, "global_step": 98476, "epoch": 2344} {"train_loss": -6.282119274139404, "global_step": 98477, "epoch": 2344} {"train_loss": -6.246279239654541, "global_step": 98478, "epoch": 2344} {"train_loss": -6.333898544311523, "global_step": 98479, "epoch": 2344} {"train_loss": -6.223072528839111, "global_step": 98480, "epoch": 2344} {"train_loss": -6.1645188331604, "global_step": 98481, "epoch": 2344} {"train_loss": -6.318397521972656, "global_step": 98482, "epoch": 2344} {"train_loss": -6.249814033508301, "global_step": 98483, "epoch": 2344} {"train_loss": -6.235250473022461, "global_step": 98484, "epoch": 2344} {"train_loss": -6.317352294921875, "global_step": 98485, "epoch": 2344} {"train_loss": -6.441556453704834, "global_step": 98486, "epoch": 2344} {"train_loss": -6.2248711585998535, "global_step": 98487, "epoch": 2344} {"train_loss": -6.365604400634766, "global_step": 98488, "epoch": 2344} {"train_loss": -6.348301603680565, "global_step": 98489, "epoch": 2344, "val_loss": 75705.2734375} {"train_loss": -6.339728832244873, "global_step": 98490, "epoch": 2345} {"train_loss": -6.302316188812256, "global_step": 98491, "epoch": 2345} {"train_loss": -6.312648773193359, "global_step": 98492, "epoch": 2345} {"train_loss": -6.322476387023926, "global_step": 98493, "epoch": 2345} {"train_loss": -6.219785690307617, "global_step": 98494, "epoch": 2345} {"train_loss": -6.390646457672119, "global_step": 98495, "epoch": 2345} {"train_loss": -6.292767524719238, "global_step": 98496, "epoch": 2345} {"train_loss": -6.537250518798828, "global_step": 98497, "epoch": 2345} {"train_loss": -6.321666717529297, "global_step": 98498, "epoch": 2345} {"train_loss": -6.286849021911621, "global_step": 98499, "epoch": 2345} {"train_loss": -6.489309310913086, "global_step": 98500, "epoch": 2345} {"train_loss": -6.450071334838867, "global_step": 98501, "epoch": 2345} {"train_loss": -6.392106056213379, "global_step": 98502, "epoch": 2345} {"train_loss": -6.3528642654418945, "global_step": 98503, "epoch": 2345} {"train_loss": -6.354256629943848, "global_step": 98504, "epoch": 2345} {"train_loss": -6.361921310424805, "global_step": 98505, "epoch": 2345} {"train_loss": -6.445451736450195, "global_step": 98506, "epoch": 2345} {"train_loss": -6.28178596496582, "global_step": 98507, "epoch": 2345} {"train_loss": -6.239877700805664, "global_step": 98508, "epoch": 2345} {"train_loss": -6.347844123840332, "global_step": 98509, "epoch": 2345} {"train_loss": -6.258313179016113, "global_step": 98510, "epoch": 2345} {"train_loss": -6.2309041023254395, "global_step": 98511, "epoch": 2345} {"train_loss": -6.432909965515137, "global_step": 98512, "epoch": 2345} {"train_loss": -6.2156805992126465, "global_step": 98513, "epoch": 2345} {"train_loss": -6.327216625213623, "global_step": 98514, "epoch": 2345} {"train_loss": -6.363243103027344, "global_step": 98515, "epoch": 2345} {"train_loss": -6.261617183685303, "global_step": 98516, "epoch": 2345} {"train_loss": -6.321494102478027, "global_step": 98517, "epoch": 2345} {"train_loss": -6.3468828201293945, "global_step": 98518, "epoch": 2345} {"train_loss": -6.327444076538086, "global_step": 98519, "epoch": 2345} {"train_loss": -6.1572394371032715, "global_step": 98520, "epoch": 2345} {"train_loss": -6.269988059997559, "global_step": 98521, "epoch": 2345} {"train_loss": -6.290717124938965, "global_step": 98522, "epoch": 2345} {"train_loss": -6.39047908782959, "global_step": 98523, "epoch": 2345} {"train_loss": -6.392644882202148, "global_step": 98524, "epoch": 2345} {"train_loss": -6.287789344787598, "global_step": 98525, "epoch": 2345} {"train_loss": -6.339736461639404, "global_step": 98526, "epoch": 2345} {"train_loss": -6.277896881103516, "global_step": 98527, "epoch": 2345} {"train_loss": -6.402939319610596, "global_step": 98528, "epoch": 2345} {"train_loss": -6.3028082847595215, "global_step": 98529, "epoch": 2345} {"train_loss": -6.2494893074035645, "global_step": 98530, "epoch": 2345} {"train_loss": -6.330533879143851, "global_step": 98531, "epoch": 2345, "val_loss": 75799.8125} {"train_loss": -6.302518844604492, "global_step": 98532, "epoch": 2346} {"train_loss": -6.301449775695801, "global_step": 98533, "epoch": 2346} {"train_loss": -6.374349117279053, "global_step": 98534, "epoch": 2346} {"train_loss": -6.327025413513184, "global_step": 98535, "epoch": 2346} {"train_loss": -6.298636436462402, "global_step": 98536, "epoch": 2346} {"train_loss": -6.367830276489258, "global_step": 98537, "epoch": 2346} {"train_loss": -6.186091423034668, "global_step": 98538, "epoch": 2346} {"train_loss": -6.394842147827148, "global_step": 98539, "epoch": 2346} {"train_loss": -6.397647857666016, "global_step": 98540, "epoch": 2346} {"train_loss": -6.2689313888549805, "global_step": 98541, "epoch": 2346} {"train_loss": -6.361900329589844, "global_step": 98542, "epoch": 2346} {"train_loss": -6.381714820861816, "global_step": 98543, "epoch": 2346} {"train_loss": -6.337207317352295, "global_step": 98544, "epoch": 2346} {"train_loss": -6.356986999511719, "global_step": 98545, "epoch": 2346} {"train_loss": -6.3404130935668945, "global_step": 98546, "epoch": 2346} {"train_loss": -6.270626068115234, "global_step": 98547, "epoch": 2346} {"train_loss": -6.321809768676758, "global_step": 98548, "epoch": 2346} {"train_loss": -6.280648231506348, "global_step": 98549, "epoch": 2346} {"train_loss": -6.338963508605957, "global_step": 98550, "epoch": 2346} {"train_loss": -6.290918827056885, "global_step": 98551, "epoch": 2346} {"train_loss": -6.285697937011719, "global_step": 98552, "epoch": 2346} {"train_loss": -6.388404369354248, "global_step": 98553, "epoch": 2346} {"train_loss": -6.198617935180664, "global_step": 98554, "epoch": 2346} {"train_loss": -6.356936454772949, "global_step": 98555, "epoch": 2346} {"train_loss": -6.348653316497803, "global_step": 98556, "epoch": 2346} {"train_loss": -6.3409743309021, "global_step": 98557, "epoch": 2346} {"train_loss": -6.2502546310424805, "global_step": 98558, "epoch": 2346} {"train_loss": -6.305245399475098, "global_step": 98559, "epoch": 2346} {"train_loss": -6.339428901672363, "global_step": 98560, "epoch": 2346} {"train_loss": -6.308643341064453, "global_step": 98561, "epoch": 2346} {"train_loss": -6.311610221862793, "global_step": 98562, "epoch": 2346} {"train_loss": -6.382370471954346, "global_step": 98563, "epoch": 2346} {"train_loss": -6.410516738891602, "global_step": 98564, "epoch": 2346} {"train_loss": -6.181726932525635, "global_step": 98565, "epoch": 2346} {"train_loss": -6.172513961791992, "global_step": 98566, "epoch": 2346} {"train_loss": -6.318864822387695, "global_step": 98567, "epoch": 2346} {"train_loss": -6.326235294342041, "global_step": 98568, "epoch": 2346} {"train_loss": -6.390292167663574, "global_step": 98569, "epoch": 2346} {"train_loss": -6.442538738250732, "global_step": 98570, "epoch": 2346} {"train_loss": -6.384573936462402, "global_step": 98571, "epoch": 2346} {"train_loss": -6.281932353973389, "global_step": 98572, "epoch": 2346} {"train_loss": -6.322921446391514, "global_step": 98573, "epoch": 2346, "val_loss": 75890.8984375} {"train_loss": -6.219486236572266, "global_step": 98574, "epoch": 2347} {"train_loss": -6.286516189575195, "global_step": 98575, "epoch": 2347} {"train_loss": -6.430171012878418, "global_step": 98576, "epoch": 2347} {"train_loss": -6.356334686279297, "global_step": 98577, "epoch": 2347} {"train_loss": -6.313501358032227, "global_step": 98578, "epoch": 2347} {"train_loss": -6.337675094604492, "global_step": 98579, "epoch": 2347} {"train_loss": -6.2668843269348145, "global_step": 98580, "epoch": 2347} {"train_loss": -6.33376407623291, "global_step": 98581, "epoch": 2347} {"train_loss": -6.3933796882629395, "global_step": 98582, "epoch": 2347} {"train_loss": -6.3240861892700195, "global_step": 98583, "epoch": 2347} {"train_loss": -6.435445785522461, "global_step": 98584, "epoch": 2347} {"train_loss": -6.341681480407715, "global_step": 98585, "epoch": 2347} {"train_loss": -6.357261657714844, "global_step": 98586, "epoch": 2347} {"train_loss": -6.36696720123291, "global_step": 98587, "epoch": 2347} {"train_loss": -6.3140082359313965, "global_step": 98588, "epoch": 2347} {"train_loss": -6.411872863769531, "global_step": 98589, "epoch": 2347} {"train_loss": -6.394171714782715, "global_step": 98590, "epoch": 2347} {"train_loss": -6.273746490478516, "global_step": 98591, "epoch": 2347} {"train_loss": -6.16063117980957, "global_step": 98592, "epoch": 2347} {"train_loss": -6.251842498779297, "global_step": 98593, "epoch": 2347} {"train_loss": -6.336578369140625, "global_step": 98594, "epoch": 2347} {"train_loss": -6.303801536560059, "global_step": 98595, "epoch": 2347} {"train_loss": -6.31426477432251, "global_step": 98596, "epoch": 2347} {"train_loss": -6.297385215759277, "global_step": 98597, "epoch": 2347} {"train_loss": -6.2573747634887695, "global_step": 98598, "epoch": 2347} {"train_loss": -6.339160442352295, "global_step": 98599, "epoch": 2347} {"train_loss": -6.331350803375244, "global_step": 98600, "epoch": 2347} {"train_loss": -6.441123962402344, "global_step": 98601, "epoch": 2347} {"train_loss": -6.362013816833496, "global_step": 98602, "epoch": 2347} {"train_loss": -6.2901201248168945, "global_step": 98603, "epoch": 2347} {"train_loss": -6.348060131072998, "global_step": 98604, "epoch": 2347} {"train_loss": -6.415020942687988, "global_step": 98605, "epoch": 2347} {"train_loss": -6.31690788269043, "global_step": 98606, "epoch": 2347} {"train_loss": -6.3501081466674805, "global_step": 98607, "epoch": 2347} {"train_loss": -6.489231109619141, "global_step": 98608, "epoch": 2347} {"train_loss": -6.340862274169922, "global_step": 98609, "epoch": 2347} {"train_loss": -6.339128494262695, "global_step": 98610, "epoch": 2347} {"train_loss": -6.4500532150268555, "global_step": 98611, "epoch": 2347} {"train_loss": -6.417539596557617, "global_step": 98612, "epoch": 2347} {"train_loss": -6.214450836181641, "global_step": 98613, "epoch": 2347} {"train_loss": -6.221001148223877, "global_step": 98614, "epoch": 2347} {"train_loss": -6.337920370556059, "global_step": 98615, "epoch": 2347, "val_loss": 75936.34375} {"train_loss": -6.450123310089111, "global_step": 98616, "epoch": 2348} {"train_loss": -6.323474884033203, "global_step": 98617, "epoch": 2348} {"train_loss": -6.342235565185547, "global_step": 98618, "epoch": 2348} {"train_loss": -6.410609722137451, "global_step": 98619, "epoch": 2348} {"train_loss": -6.343405246734619, "global_step": 98620, "epoch": 2348} {"train_loss": -6.415355205535889, "global_step": 98621, "epoch": 2348} {"train_loss": -6.400305271148682, "global_step": 98622, "epoch": 2348} {"train_loss": -6.506442546844482, "global_step": 98623, "epoch": 2348} {"train_loss": -6.406137466430664, "global_step": 98624, "epoch": 2348} {"train_loss": -6.405355930328369, "global_step": 98625, "epoch": 2348} {"train_loss": -6.422034740447998, "global_step": 98626, "epoch": 2348} {"train_loss": -6.443296432495117, "global_step": 98627, "epoch": 2348} {"train_loss": -6.44871711730957, "global_step": 98628, "epoch": 2348} {"train_loss": -6.27964973449707, "global_step": 98629, "epoch": 2348} {"train_loss": -6.377179145812988, "global_step": 98630, "epoch": 2348} {"train_loss": -6.324034214019775, "global_step": 98631, "epoch": 2348} {"train_loss": -6.486136436462402, "global_step": 98632, "epoch": 2348} {"train_loss": -6.292108535766602, "global_step": 98633, "epoch": 2348} {"train_loss": -6.418567180633545, "global_step": 98634, "epoch": 2348} {"train_loss": -6.292065143585205, "global_step": 98635, "epoch": 2348} {"train_loss": -6.413480281829834, "global_step": 98636, "epoch": 2348} {"train_loss": -6.365056037902832, "global_step": 98637, "epoch": 2348} {"train_loss": -6.408207893371582, "global_step": 98638, "epoch": 2348} {"train_loss": -6.302637577056885, "global_step": 98639, "epoch": 2348} {"train_loss": -6.258800506591797, "global_step": 98640, "epoch": 2348} {"train_loss": -6.239421367645264, "global_step": 98641, "epoch": 2348} {"train_loss": -6.334871292114258, "global_step": 98642, "epoch": 2348} {"train_loss": -6.413204669952393, "global_step": 98643, "epoch": 2348} {"train_loss": -6.421669006347656, "global_step": 98644, "epoch": 2348} {"train_loss": -6.507734298706055, "global_step": 98645, "epoch": 2348} {"train_loss": -6.376809120178223, "global_step": 98646, "epoch": 2348} {"train_loss": -6.346985340118408, "global_step": 98647, "epoch": 2348} {"train_loss": -6.416354179382324, "global_step": 98648, "epoch": 2348} {"train_loss": -6.3035736083984375, "global_step": 98649, "epoch": 2348} {"train_loss": -6.247066497802734, "global_step": 98650, "epoch": 2348} {"train_loss": -6.453682899475098, "global_step": 98651, "epoch": 2348} {"train_loss": -6.4703216552734375, "global_step": 98652, "epoch": 2348} {"train_loss": -6.233827590942383, "global_step": 98653, "epoch": 2348} {"train_loss": -6.241388320922852, "global_step": 98654, "epoch": 2348} {"train_loss": -6.473508834838867, "global_step": 98655, "epoch": 2348} {"train_loss": -6.25861930847168, "global_step": 98656, "epoch": 2348} {"train_loss": -6.372213068462553, "global_step": 98657, "epoch": 2348, "val_loss": 75926.53125} {"train_loss": -6.368420124053955, "global_step": 98658, "epoch": 2349} {"train_loss": -6.438076019287109, "global_step": 98659, "epoch": 2349} {"train_loss": -6.238410949707031, "global_step": 98660, "epoch": 2349} {"train_loss": -6.341046333312988, "global_step": 98661, "epoch": 2349} {"train_loss": -6.551702976226807, "global_step": 98662, "epoch": 2349} {"train_loss": -6.421089172363281, "global_step": 98663, "epoch": 2349} {"train_loss": -6.350515365600586, "global_step": 98664, "epoch": 2349} {"train_loss": -6.435142993927002, "global_step": 98665, "epoch": 2349} {"train_loss": -6.431358337402344, "global_step": 98666, "epoch": 2349} {"train_loss": -6.363131046295166, "global_step": 98667, "epoch": 2349} {"train_loss": -6.362456321716309, "global_step": 98668, "epoch": 2349} {"train_loss": -6.396575450897217, "global_step": 98669, "epoch": 2349} {"train_loss": -6.360722064971924, "global_step": 98670, "epoch": 2349} {"train_loss": -6.281905174255371, "global_step": 98671, "epoch": 2349} {"train_loss": -6.388283729553223, "global_step": 98672, "epoch": 2349} {"train_loss": -6.2909650802612305, "global_step": 98673, "epoch": 2349} {"train_loss": -6.326016426086426, "global_step": 98674, "epoch": 2349} {"train_loss": -6.443720817565918, "global_step": 98675, "epoch": 2349} {"train_loss": -6.391973495483398, "global_step": 98676, "epoch": 2349} {"train_loss": -6.351133823394775, "global_step": 98677, "epoch": 2349} {"train_loss": -6.391032695770264, "global_step": 98678, "epoch": 2349} {"train_loss": -6.3818039894104, "global_step": 98679, "epoch": 2349} {"train_loss": -6.318264961242676, "global_step": 98680, "epoch": 2349} {"train_loss": -6.365366458892822, "global_step": 98681, "epoch": 2349} {"train_loss": -6.317520618438721, "global_step": 98682, "epoch": 2349} {"train_loss": -6.186545372009277, "global_step": 98683, "epoch": 2349} {"train_loss": -6.361347198486328, "global_step": 98684, "epoch": 2349} {"train_loss": -6.164239406585693, "global_step": 98685, "epoch": 2349} {"train_loss": -6.373785018920898, "global_step": 98686, "epoch": 2349} {"train_loss": -6.34018611907959, "global_step": 98687, "epoch": 2349} {"train_loss": -6.33460807800293, "global_step": 98688, "epoch": 2349} {"train_loss": -6.401076316833496, "global_step": 98689, "epoch": 2349} {"train_loss": -6.435999870300293, "global_step": 98690, "epoch": 2349} {"train_loss": -6.291978359222412, "global_step": 98691, "epoch": 2349} {"train_loss": -6.367610454559326, "global_step": 98692, "epoch": 2349} {"train_loss": -6.257059097290039, "global_step": 98693, "epoch": 2349} {"train_loss": -6.271603584289551, "global_step": 98694, "epoch": 2349} {"train_loss": -6.346164703369141, "global_step": 98695, "epoch": 2349} {"train_loss": -6.295750141143799, "global_step": 98696, "epoch": 2349} {"train_loss": -6.2821455001831055, "global_step": 98697, "epoch": 2349} {"train_loss": -6.456672668457031, "global_step": 98698, "epoch": 2349} {"train_loss": -6.352916955947876, "global_step": 98699, "epoch": 2349, "val_loss": 75865.9140625} {"train_loss": -6.374032020568848, "global_step": 98700, "epoch": 2350} {"train_loss": -6.402811527252197, "global_step": 98701, "epoch": 2350} {"train_loss": -6.255743980407715, "global_step": 98702, "epoch": 2350} {"train_loss": -6.3873372077941895, "global_step": 98703, "epoch": 2350} {"train_loss": -6.336225509643555, "global_step": 98704, "epoch": 2350} {"train_loss": -6.411688804626465, "global_step": 98705, "epoch": 2350} {"train_loss": -6.3450775146484375, "global_step": 98706, "epoch": 2350} {"train_loss": -6.376840591430664, "global_step": 98707, "epoch": 2350} {"train_loss": -6.430887699127197, "global_step": 98708, "epoch": 2350} {"train_loss": -6.361510753631592, "global_step": 98709, "epoch": 2350} {"train_loss": -6.3368940353393555, "global_step": 98710, "epoch": 2350} {"train_loss": -6.32356595993042, "global_step": 98711, "epoch": 2350} {"train_loss": -6.479975700378418, "global_step": 98712, "epoch": 2350} {"train_loss": -6.379167079925537, "global_step": 98713, "epoch": 2350} {"train_loss": -6.26288366317749, "global_step": 98714, "epoch": 2350} {"train_loss": -6.490448951721191, "global_step": 98715, "epoch": 2350} {"train_loss": -6.317660331726074, "global_step": 98716, "epoch": 2350} {"train_loss": -6.304919719696045, "global_step": 98717, "epoch": 2350} {"train_loss": -6.345171928405762, "global_step": 98718, "epoch": 2350} {"train_loss": -6.3566484451293945, "global_step": 98719, "epoch": 2350} {"train_loss": -6.309390068054199, "global_step": 98720, "epoch": 2350} {"train_loss": -6.290549278259277, "global_step": 98721, "epoch": 2350} {"train_loss": -6.290838241577148, "global_step": 98722, "epoch": 2350} {"train_loss": -6.231461048126221, "global_step": 98723, "epoch": 2350} {"train_loss": -6.283067226409912, "global_step": 98724, "epoch": 2350} {"train_loss": -6.402379035949707, "global_step": 98725, "epoch": 2350} {"train_loss": -6.296144485473633, "global_step": 98726, "epoch": 2350} {"train_loss": -6.348156929016113, "global_step": 98727, "epoch": 2350} {"train_loss": -6.45842981338501, "global_step": 98728, "epoch": 2350} {"train_loss": -6.280294418334961, "global_step": 98729, "epoch": 2350} {"train_loss": -6.184294700622559, "global_step": 98730, "epoch": 2350} {"train_loss": -6.188981056213379, "global_step": 98731, "epoch": 2350} {"train_loss": -6.341272830963135, "global_step": 98732, "epoch": 2350} {"train_loss": -6.325236797332764, "global_step": 98733, "epoch": 2350} {"train_loss": -6.398275375366211, "global_step": 98734, "epoch": 2350} {"train_loss": -6.370076656341553, "global_step": 98735, "epoch": 2350} {"train_loss": -6.372613906860352, "global_step": 98736, "epoch": 2350} {"train_loss": -6.36626672744751, "global_step": 98737, "epoch": 2350} {"train_loss": -6.337956428527832, "global_step": 98738, "epoch": 2350} {"train_loss": -6.369919776916504, "global_step": 98739, "epoch": 2350} {"train_loss": -6.3554887771606445, "global_step": 98740, "epoch": 2350} {"train_loss": -6.345195804323469, "global_step": 98741, "epoch": 2350, "train/sim_max_reward_0": 0.38077346925059535, "train/sim_max_reward_1": 0.8553859378695648, "train/sim_max_reward_2": 0.7246896042254584, "train/sim_max_reward_3": 0.1419980833323313, "train/sim_max_reward_4": 0.5991911924076118, "train/sim_max_reward_5": 0.8986676929916626, "test/sim_max_reward_4500000": 0.416690260394965, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.844975609396907, "test/sim_max_reward_4500003": 0.8162466590228178, "test/sim_max_reward_4500004": 0.9007077371243973, "test/sim_max_reward_4500005": 0.2508589178303062, "test/sim_max_reward_4500006": 0.9912362882961435, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.026632034137578975, "test/sim_max_reward_4500009": 1.0, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.43263676856205024, "test/sim_max_reward_4500012": 0.46910201883334407, "test/sim_max_reward_4500013": 0.007982554656023464, "test/sim_max_reward_4500014": 0.36814755013804595, "test/sim_max_reward_4500015": 0.9142031777534897, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.1445661133751209, "test/sim_max_reward_4500018": 0.3747931028213412, "test/sim_max_reward_4500019": 0.9274487585303572, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.7552023529719106, "test/sim_max_reward_4500022": 0.9068332258407336, "test/sim_max_reward_4500023": 0.8958205714047303, "test/sim_max_reward_4500024": 0.8689721276219889, "test/sim_max_reward_4500025": 0.0, "test/sim_max_reward_4500026": 0.9670003466093854, "test/sim_max_reward_4500027": 0.9869710446142897, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.08501373130601003, "test/sim_max_reward_4500030": 0.9716481512321917, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04715408503781925, "test/sim_max_reward_4500033": 0.7806560950738334, "test/sim_max_reward_4500034": 0.7153626129736587, "test/sim_max_reward_4500035": 0.871687245213416, "test/sim_max_reward_4500036": 0.4703745606184018, "test/sim_max_reward_4500037": 0.8591890344845211, "test/sim_max_reward_4500038": 0.9400673949444132, "test/sim_max_reward_4500039": 0.9290843130217797, "test/sim_max_reward_4500040": 0.903189942444498, "test/sim_max_reward_4500041": 0.9915547117828732, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.14679493680575217, "test/sim_max_reward_4500044": 0.8348240515414271, "test/sim_max_reward_4500045": 0.6717171294194036, "test/sim_max_reward_4500046": 0.5267778358339161, "test/sim_max_reward_4500047": 0.9276776158947619, "test/sim_max_reward_4500048": 0.9390633994523595, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6001176633462041, "test/mean_score": 0.5621405066593662, "val_loss": 75679.515625} {"train_loss": -6.347686767578125, "global_step": 98742, "epoch": 2351} {"train_loss": -6.38053035736084, "global_step": 98743, "epoch": 2351} {"train_loss": -6.406973838806152, "global_step": 98744, "epoch": 2351} {"train_loss": -6.295686721801758, "global_step": 98745, "epoch": 2351} {"train_loss": -6.449368476867676, "global_step": 98746, "epoch": 2351} {"train_loss": -6.377498626708984, "global_step": 98747, "epoch": 2351} {"train_loss": -6.454690933227539, "global_step": 98748, "epoch": 2351} {"train_loss": -6.362977027893066, "global_step": 98749, "epoch": 2351} {"train_loss": -6.367922782897949, "global_step": 98750, "epoch": 2351} {"train_loss": -6.418092727661133, "global_step": 98751, "epoch": 2351} {"train_loss": -6.3128662109375, "global_step": 98752, "epoch": 2351} {"train_loss": -6.423417568206787, "global_step": 98753, "epoch": 2351} {"train_loss": -6.445504665374756, "global_step": 98754, "epoch": 2351} {"train_loss": -6.271186828613281, "global_step": 98755, "epoch": 2351} {"train_loss": -6.336363315582275, "global_step": 98756, "epoch": 2351} {"train_loss": -6.275212287902832, "global_step": 98757, "epoch": 2351} {"train_loss": -6.408236503601074, "global_step": 98758, "epoch": 2351} {"train_loss": -6.431535720825195, "global_step": 98759, "epoch": 2351} {"train_loss": -6.309178352355957, "global_step": 98760, "epoch": 2351} {"train_loss": -6.396055698394775, "global_step": 98761, "epoch": 2351} {"train_loss": -6.291295528411865, "global_step": 98762, "epoch": 2351} {"train_loss": -6.224474906921387, "global_step": 98763, "epoch": 2351} {"train_loss": -6.30001974105835, "global_step": 98764, "epoch": 2351} {"train_loss": -6.379243850708008, "global_step": 98765, "epoch": 2351} {"train_loss": -6.2148590087890625, "global_step": 98766, "epoch": 2351} {"train_loss": -6.231523513793945, "global_step": 98767, "epoch": 2351} {"train_loss": -6.241503715515137, "global_step": 98768, "epoch": 2351} {"train_loss": -6.215555191040039, "global_step": 98769, "epoch": 2351} {"train_loss": -6.305820465087891, "global_step": 98770, "epoch": 2351} {"train_loss": -6.201977729797363, "global_step": 98771, "epoch": 2351} {"train_loss": -6.2659502029418945, "global_step": 98772, "epoch": 2351} {"train_loss": -6.358974933624268, "global_step": 98773, "epoch": 2351} {"train_loss": -6.261381149291992, "global_step": 98774, "epoch": 2351} {"train_loss": -6.342571258544922, "global_step": 98775, "epoch": 2351} {"train_loss": -6.233715534210205, "global_step": 98776, "epoch": 2351} {"train_loss": -6.218031883239746, "global_step": 98777, "epoch": 2351} {"train_loss": -6.215398788452148, "global_step": 98778, "epoch": 2351} {"train_loss": -6.220877647399902, "global_step": 98779, "epoch": 2351} {"train_loss": -6.338630676269531, "global_step": 98780, "epoch": 2351} {"train_loss": -6.264171600341797, "global_step": 98781, "epoch": 2351} {"train_loss": -6.261146068572998, "global_step": 98782, "epoch": 2351} {"train_loss": -6.31692301659357, "global_step": 98783, "epoch": 2351, "val_loss": 75766.875} {"train_loss": -6.4531660079956055, "global_step": 98784, "epoch": 2352} {"train_loss": -6.172030925750732, "global_step": 98785, "epoch": 2352} {"train_loss": -6.385327339172363, "global_step": 98786, "epoch": 2352} {"train_loss": -6.16596794128418, "global_step": 98787, "epoch": 2352} {"train_loss": -6.283404350280762, "global_step": 98788, "epoch": 2352} {"train_loss": -6.303219795227051, "global_step": 98789, "epoch": 2352} {"train_loss": -6.230218887329102, "global_step": 98790, "epoch": 2352} {"train_loss": -6.357274055480957, "global_step": 98791, "epoch": 2352} {"train_loss": -6.316481113433838, "global_step": 98792, "epoch": 2352} {"train_loss": -6.273947238922119, "global_step": 98793, "epoch": 2352} {"train_loss": -6.411569595336914, "global_step": 98794, "epoch": 2352} {"train_loss": -6.360198974609375, "global_step": 98795, "epoch": 2352} {"train_loss": -6.321214199066162, "global_step": 98796, "epoch": 2352} {"train_loss": -6.417842864990234, "global_step": 98797, "epoch": 2352} {"train_loss": -6.305793285369873, "global_step": 98798, "epoch": 2352} {"train_loss": -6.340843200683594, "global_step": 98799, "epoch": 2352} {"train_loss": -6.33447265625, "global_step": 98800, "epoch": 2352} {"train_loss": -6.363305568695068, "global_step": 98801, "epoch": 2352} {"train_loss": -6.397452354431152, "global_step": 98802, "epoch": 2352} {"train_loss": -6.416112422943115, "global_step": 98803, "epoch": 2352} {"train_loss": -6.362838268280029, "global_step": 98804, "epoch": 2352} {"train_loss": -6.358611106872559, "global_step": 98805, "epoch": 2352} {"train_loss": -6.276450157165527, "global_step": 98806, "epoch": 2352} {"train_loss": -6.3595428466796875, "global_step": 98807, "epoch": 2352} {"train_loss": -6.403195381164551, "global_step": 98808, "epoch": 2352} {"train_loss": -6.340828895568848, "global_step": 98809, "epoch": 2352} {"train_loss": -6.310469150543213, "global_step": 98810, "epoch": 2352} {"train_loss": -6.377565383911133, "global_step": 98811, "epoch": 2352} {"train_loss": -6.349265098571777, "global_step": 98812, "epoch": 2352} {"train_loss": -6.367140769958496, "global_step": 98813, "epoch": 2352} {"train_loss": -6.407384872436523, "global_step": 98814, "epoch": 2352} {"train_loss": -6.345073699951172, "global_step": 98815, "epoch": 2352} {"train_loss": -6.306028366088867, "global_step": 98816, "epoch": 2352} {"train_loss": -6.296682357788086, "global_step": 98817, "epoch": 2352} {"train_loss": -6.142224311828613, "global_step": 98818, "epoch": 2352} {"train_loss": -6.253117561340332, "global_step": 98819, "epoch": 2352} {"train_loss": -6.418007850646973, "global_step": 98820, "epoch": 2352} {"train_loss": -6.333220481872559, "global_step": 98821, "epoch": 2352} {"train_loss": -6.173982620239258, "global_step": 98822, "epoch": 2352} {"train_loss": -6.282379150390625, "global_step": 98823, "epoch": 2352} {"train_loss": -6.334536552429199, "global_step": 98824, "epoch": 2352} {"train_loss": -6.326551380611601, "global_step": 98825, "epoch": 2352, "val_loss": 76021.0625} {"train_loss": -6.330009937286377, "global_step": 98826, "epoch": 2353} {"train_loss": -6.403153419494629, "global_step": 98827, "epoch": 2353} {"train_loss": -6.299721717834473, "global_step": 98828, "epoch": 2353} {"train_loss": -6.373300075531006, "global_step": 98829, "epoch": 2353} {"train_loss": -6.402303695678711, "global_step": 98830, "epoch": 2353} {"train_loss": -6.367367744445801, "global_step": 98831, "epoch": 2353} {"train_loss": -6.365814685821533, "global_step": 98832, "epoch": 2353} {"train_loss": -6.335899829864502, "global_step": 98833, "epoch": 2353} {"train_loss": -6.527647972106934, "global_step": 98834, "epoch": 2353} {"train_loss": -6.464306354522705, "global_step": 98835, "epoch": 2353} {"train_loss": -6.335991859436035, "global_step": 98836, "epoch": 2353} {"train_loss": -6.385209083557129, "global_step": 98837, "epoch": 2353} {"train_loss": -6.340830326080322, "global_step": 98838, "epoch": 2353} {"train_loss": -6.372887134552002, "global_step": 98839, "epoch": 2353} {"train_loss": -6.304742813110352, "global_step": 98840, "epoch": 2353} {"train_loss": -6.370708465576172, "global_step": 98841, "epoch": 2353} {"train_loss": -6.399277687072754, "global_step": 98842, "epoch": 2353} {"train_loss": -6.307886123657227, "global_step": 98843, "epoch": 2353} {"train_loss": -6.409479141235352, "global_step": 98844, "epoch": 2353} {"train_loss": -6.36212682723999, "global_step": 98845, "epoch": 2353} {"train_loss": -6.385682582855225, "global_step": 98846, "epoch": 2353} {"train_loss": -6.323085784912109, "global_step": 98847, "epoch": 2353} {"train_loss": -6.406644821166992, "global_step": 98848, "epoch": 2353} {"train_loss": -6.340914726257324, "global_step": 98849, "epoch": 2353} {"train_loss": -6.273982048034668, "global_step": 98850, "epoch": 2353} {"train_loss": -6.3469319343566895, "global_step": 98851, "epoch": 2353} {"train_loss": -6.349294662475586, "global_step": 98852, "epoch": 2353} {"train_loss": -6.28265380859375, "global_step": 98853, "epoch": 2353} {"train_loss": -6.402188301086426, "global_step": 98854, "epoch": 2353} {"train_loss": -6.464695930480957, "global_step": 98855, "epoch": 2353} {"train_loss": -6.31229305267334, "global_step": 98856, "epoch": 2353} {"train_loss": -6.331404209136963, "global_step": 98857, "epoch": 2353} {"train_loss": -6.269070148468018, "global_step": 98858, "epoch": 2353} {"train_loss": -6.364879608154297, "global_step": 98859, "epoch": 2353} {"train_loss": -6.3360114097595215, "global_step": 98860, "epoch": 2353} {"train_loss": -6.392806053161621, "global_step": 98861, "epoch": 2353} {"train_loss": -6.32503080368042, "global_step": 98862, "epoch": 2353} {"train_loss": -6.376298427581787, "global_step": 98863, "epoch": 2353} {"train_loss": -6.378996849060059, "global_step": 98864, "epoch": 2353} {"train_loss": -6.349893569946289, "global_step": 98865, "epoch": 2353} {"train_loss": -6.2931928634643555, "global_step": 98866, "epoch": 2353} {"train_loss": -6.360526925041562, "global_step": 98867, "epoch": 2353, "val_loss": 75798.9453125} {"train_loss": -6.29981803894043, "global_step": 98868, "epoch": 2354} {"train_loss": -6.298584938049316, "global_step": 98869, "epoch": 2354} {"train_loss": -6.35833740234375, "global_step": 98870, "epoch": 2354} {"train_loss": -6.325479507446289, "global_step": 98871, "epoch": 2354} {"train_loss": -6.422858238220215, "global_step": 98872, "epoch": 2354} {"train_loss": -6.438230514526367, "global_step": 98873, "epoch": 2354} {"train_loss": -6.386064529418945, "global_step": 98874, "epoch": 2354} {"train_loss": -6.312854766845703, "global_step": 98875, "epoch": 2354} {"train_loss": -6.451042175292969, "global_step": 98876, "epoch": 2354} {"train_loss": -6.434430122375488, "global_step": 98877, "epoch": 2354} {"train_loss": -6.344262599945068, "global_step": 98878, "epoch": 2354} {"train_loss": -6.3695807456970215, "global_step": 98879, "epoch": 2354} {"train_loss": -6.398049354553223, "global_step": 98880, "epoch": 2354} {"train_loss": -6.377518653869629, "global_step": 98881, "epoch": 2354} {"train_loss": -6.370631217956543, "global_step": 98882, "epoch": 2354} {"train_loss": -6.3198418617248535, "global_step": 98883, "epoch": 2354} {"train_loss": -6.320647239685059, "global_step": 98884, "epoch": 2354} {"train_loss": -6.269980430603027, "global_step": 98885, "epoch": 2354} {"train_loss": -6.341826438903809, "global_step": 98886, "epoch": 2354} {"train_loss": -6.352645397186279, "global_step": 98887, "epoch": 2354} {"train_loss": -6.389321327209473, "global_step": 98888, "epoch": 2354} {"train_loss": -6.354916572570801, "global_step": 98889, "epoch": 2354} {"train_loss": -6.402640342712402, "global_step": 98890, "epoch": 2354} {"train_loss": -6.343405723571777, "global_step": 98891, "epoch": 2354} {"train_loss": -6.347230911254883, "global_step": 98892, "epoch": 2354} {"train_loss": -6.192870140075684, "global_step": 98893, "epoch": 2354} {"train_loss": -6.234619140625, "global_step": 98894, "epoch": 2354} {"train_loss": -6.345202922821045, "global_step": 98895, "epoch": 2354} {"train_loss": -6.321063041687012, "global_step": 98896, "epoch": 2354} {"train_loss": -6.214620590209961, "global_step": 98897, "epoch": 2354} {"train_loss": -6.392613410949707, "global_step": 98898, "epoch": 2354} {"train_loss": -6.260509490966797, "global_step": 98899, "epoch": 2354} {"train_loss": -6.364595413208008, "global_step": 98900, "epoch": 2354} {"train_loss": -6.353335380554199, "global_step": 98901, "epoch": 2354} {"train_loss": -6.301971435546875, "global_step": 98902, "epoch": 2354} {"train_loss": -6.420179843902588, "global_step": 98903, "epoch": 2354} {"train_loss": -6.224303722381592, "global_step": 98904, "epoch": 2354} {"train_loss": -6.33579683303833, "global_step": 98905, "epoch": 2354} {"train_loss": -6.331292152404785, "global_step": 98906, "epoch": 2354} {"train_loss": -6.350065231323242, "global_step": 98907, "epoch": 2354} {"train_loss": -6.3104987144470215, "global_step": 98908, "epoch": 2354} {"train_loss": -6.341717901683989, "global_step": 98909, "epoch": 2354, "val_loss": 75613.4453125} {"train_loss": -6.357883930206299, "global_step": 98910, "epoch": 2355} {"train_loss": -6.433144569396973, "global_step": 98911, "epoch": 2355} {"train_loss": -6.235011577606201, "global_step": 98912, "epoch": 2355} {"train_loss": -6.342108249664307, "global_step": 98913, "epoch": 2355} {"train_loss": -6.407047271728516, "global_step": 98914, "epoch": 2355} {"train_loss": -6.312812805175781, "global_step": 98915, "epoch": 2355} {"train_loss": -6.325711727142334, "global_step": 98916, "epoch": 2355} {"train_loss": -6.285131454467773, "global_step": 98917, "epoch": 2355} {"train_loss": -6.327640056610107, "global_step": 98918, "epoch": 2355} {"train_loss": -6.414355754852295, "global_step": 98919, "epoch": 2355} {"train_loss": -6.376236915588379, "global_step": 98920, "epoch": 2355} {"train_loss": -6.453542709350586, "global_step": 98921, "epoch": 2355} {"train_loss": -6.2760515213012695, "global_step": 98922, "epoch": 2355} {"train_loss": -6.357793807983398, "global_step": 98923, "epoch": 2355} {"train_loss": -6.396785736083984, "global_step": 98924, "epoch": 2355} {"train_loss": -6.35703182220459, "global_step": 98925, "epoch": 2355} {"train_loss": -6.279342174530029, "global_step": 98926, "epoch": 2355} {"train_loss": -6.372156143188477, "global_step": 98927, "epoch": 2355} {"train_loss": -6.3231706619262695, "global_step": 98928, "epoch": 2355} {"train_loss": -6.332209587097168, "global_step": 98929, "epoch": 2355} {"train_loss": -6.397307395935059, "global_step": 98930, "epoch": 2355} {"train_loss": -6.265810966491699, "global_step": 98931, "epoch": 2355} {"train_loss": -6.348115921020508, "global_step": 98932, "epoch": 2355} {"train_loss": -6.280043125152588, "global_step": 98933, "epoch": 2355} {"train_loss": -6.24210786819458, "global_step": 98934, "epoch": 2355} {"train_loss": -6.382376670837402, "global_step": 98935, "epoch": 2355} {"train_loss": -6.322851657867432, "global_step": 98936, "epoch": 2355} {"train_loss": -6.261409759521484, "global_step": 98937, "epoch": 2355} {"train_loss": -6.2503981590271, "global_step": 98938, "epoch": 2355} {"train_loss": -6.367518901824951, "global_step": 98939, "epoch": 2355} {"train_loss": -6.427093505859375, "global_step": 98940, "epoch": 2355} {"train_loss": -6.454715728759766, "global_step": 98941, "epoch": 2355} {"train_loss": -6.464907646179199, "global_step": 98942, "epoch": 2355} {"train_loss": -6.2898359298706055, "global_step": 98943, "epoch": 2355} {"train_loss": -6.467503547668457, "global_step": 98944, "epoch": 2355} {"train_loss": -6.347878456115723, "global_step": 98945, "epoch": 2355} {"train_loss": -6.383063793182373, "global_step": 98946, "epoch": 2355} {"train_loss": -6.356291770935059, "global_step": 98947, "epoch": 2355} {"train_loss": -6.3540191650390625, "global_step": 98948, "epoch": 2355} {"train_loss": -6.393894672393799, "global_step": 98949, "epoch": 2355} {"train_loss": -6.354024887084961, "global_step": 98950, "epoch": 2355} {"train_loss": -6.350491898400443, "global_step": 98951, "epoch": 2355, "val_loss": 75780.0} {"train_loss": -6.341561317443848, "global_step": 98952, "epoch": 2356} {"train_loss": -6.37443733215332, "global_step": 98953, "epoch": 2356} {"train_loss": -6.341253757476807, "global_step": 98954, "epoch": 2356} {"train_loss": -6.16940975189209, "global_step": 98955, "epoch": 2356} {"train_loss": -6.292163848876953, "global_step": 98956, "epoch": 2356} {"train_loss": -6.450592041015625, "global_step": 98957, "epoch": 2356} {"train_loss": -6.397115707397461, "global_step": 98958, "epoch": 2356} {"train_loss": -6.420523643493652, "global_step": 98959, "epoch": 2356} {"train_loss": -6.334590911865234, "global_step": 98960, "epoch": 2356} {"train_loss": -6.329341888427734, "global_step": 98961, "epoch": 2356} {"train_loss": -6.225156784057617, "global_step": 98962, "epoch": 2356} {"train_loss": -6.3326520919799805, "global_step": 98963, "epoch": 2356} {"train_loss": -6.352148056030273, "global_step": 98964, "epoch": 2356} {"train_loss": -6.414363861083984, "global_step": 98965, "epoch": 2356} {"train_loss": -6.449224472045898, "global_step": 98966, "epoch": 2356} {"train_loss": -6.360019683837891, "global_step": 98967, "epoch": 2356} {"train_loss": -6.314922332763672, "global_step": 98968, "epoch": 2356} {"train_loss": -6.344369888305664, "global_step": 98969, "epoch": 2356} {"train_loss": -6.142396926879883, "global_step": 98970, "epoch": 2356} {"train_loss": -6.172210693359375, "global_step": 98971, "epoch": 2356} {"train_loss": -6.377486228942871, "global_step": 98972, "epoch": 2356} {"train_loss": -6.2619781494140625, "global_step": 98973, "epoch": 2356} {"train_loss": -6.393803119659424, "global_step": 98974, "epoch": 2356} {"train_loss": -6.3409271240234375, "global_step": 98975, "epoch": 2356} {"train_loss": -6.141526222229004, "global_step": 98976, "epoch": 2356} {"train_loss": -6.367390155792236, "global_step": 98977, "epoch": 2356} {"train_loss": -6.227128982543945, "global_step": 98978, "epoch": 2356} {"train_loss": -6.375675201416016, "global_step": 98979, "epoch": 2356} {"train_loss": -6.328670978546143, "global_step": 98980, "epoch": 2356} {"train_loss": -6.282584190368652, "global_step": 98981, "epoch": 2356} {"train_loss": -6.350722312927246, "global_step": 98982, "epoch": 2356} {"train_loss": -6.206609725952148, "global_step": 98983, "epoch": 2356} {"train_loss": -6.286170959472656, "global_step": 98984, "epoch": 2356} {"train_loss": -6.251827239990234, "global_step": 98985, "epoch": 2356} {"train_loss": -6.329285621643066, "global_step": 98986, "epoch": 2356} {"train_loss": -6.1768479347229, "global_step": 98987, "epoch": 2356} {"train_loss": -6.149234771728516, "global_step": 98988, "epoch": 2356} {"train_loss": -6.270990371704102, "global_step": 98989, "epoch": 2356} {"train_loss": -6.116554260253906, "global_step": 98990, "epoch": 2356} {"train_loss": -6.298325061798096, "global_step": 98991, "epoch": 2356} {"train_loss": -6.337560653686523, "global_step": 98992, "epoch": 2356} {"train_loss": -6.300626573108492, "global_step": 98993, "epoch": 2356, "val_loss": 75793.2265625} {"train_loss": -6.287420272827148, "global_step": 98994, "epoch": 2357} {"train_loss": -6.329313278198242, "global_step": 98995, "epoch": 2357} {"train_loss": -6.257180213928223, "global_step": 98996, "epoch": 2357} {"train_loss": -6.161364555358887, "global_step": 98997, "epoch": 2357} {"train_loss": -6.188028335571289, "global_step": 98998, "epoch": 2357} {"train_loss": -6.272748947143555, "global_step": 98999, "epoch": 2357} {"train_loss": -6.184409141540527, "global_step": 99000, "epoch": 2357} {"train_loss": -6.376289367675781, "global_step": 99001, "epoch": 2357} {"train_loss": -6.202463150024414, "global_step": 99002, "epoch": 2357} {"train_loss": -6.411509990692139, "global_step": 99003, "epoch": 2357} {"train_loss": -6.1925458908081055, "global_step": 99004, "epoch": 2357} {"train_loss": -6.210713863372803, "global_step": 99005, "epoch": 2357} {"train_loss": -6.223776340484619, "global_step": 99006, "epoch": 2357} {"train_loss": -6.046479225158691, "global_step": 99007, "epoch": 2357} {"train_loss": -6.373615264892578, "global_step": 99008, "epoch": 2357} {"train_loss": -6.208752632141113, "global_step": 99009, "epoch": 2357} {"train_loss": -6.264970302581787, "global_step": 99010, "epoch": 2357} {"train_loss": -6.026808261871338, "global_step": 99011, "epoch": 2357} {"train_loss": -6.346764087677002, "global_step": 99012, "epoch": 2357} {"train_loss": -6.108933925628662, "global_step": 99013, "epoch": 2357} {"train_loss": -6.423614501953125, "global_step": 99014, "epoch": 2357} {"train_loss": -6.115643501281738, "global_step": 99015, "epoch": 2357} {"train_loss": -6.205802917480469, "global_step": 99016, "epoch": 2357} {"train_loss": -6.189624786376953, "global_step": 99017, "epoch": 2357} {"train_loss": -6.2172064781188965, "global_step": 99018, "epoch": 2357} {"train_loss": -6.305375099182129, "global_step": 99019, "epoch": 2357} {"train_loss": -6.32312536239624, "global_step": 99020, "epoch": 2357} {"train_loss": -6.238785266876221, "global_step": 99021, "epoch": 2357} {"train_loss": -6.258610248565674, "global_step": 99022, "epoch": 2357} {"train_loss": -6.303132057189941, "global_step": 99023, "epoch": 2357} {"train_loss": -6.217684268951416, "global_step": 99024, "epoch": 2357} {"train_loss": -6.308717727661133, "global_step": 99025, "epoch": 2357} {"train_loss": -6.302999973297119, "global_step": 99026, "epoch": 2357} {"train_loss": -6.268923759460449, "global_step": 99027, "epoch": 2357} {"train_loss": -6.22117805480957, "global_step": 99028, "epoch": 2357} {"train_loss": -6.370002269744873, "global_step": 99029, "epoch": 2357} {"train_loss": -6.2816853523254395, "global_step": 99030, "epoch": 2357} {"train_loss": -6.27898645401001, "global_step": 99031, "epoch": 2357} {"train_loss": -6.247891426086426, "global_step": 99032, "epoch": 2357} {"train_loss": -6.31480598449707, "global_step": 99033, "epoch": 2357} {"train_loss": -6.301631927490234, "global_step": 99034, "epoch": 2357} {"train_loss": -6.2537552288600375, "global_step": 99035, "epoch": 2357, "val_loss": 76154.9453125} {"train_loss": -6.223426342010498, "global_step": 99036, "epoch": 2358} {"train_loss": -6.236362457275391, "global_step": 99037, "epoch": 2358} {"train_loss": -6.321026802062988, "global_step": 99038, "epoch": 2358} {"train_loss": -6.332496166229248, "global_step": 99039, "epoch": 2358} {"train_loss": -6.298307418823242, "global_step": 99040, "epoch": 2358} {"train_loss": -6.340215682983398, "global_step": 99041, "epoch": 2358} {"train_loss": -6.284134864807129, "global_step": 99042, "epoch": 2358} {"train_loss": -6.295651435852051, "global_step": 99043, "epoch": 2358} {"train_loss": -6.2637481689453125, "global_step": 99044, "epoch": 2358} {"train_loss": -6.377850532531738, "global_step": 99045, "epoch": 2358} {"train_loss": -6.378745079040527, "global_step": 99046, "epoch": 2358} {"train_loss": -6.163538932800293, "global_step": 99047, "epoch": 2358} {"train_loss": -6.252570152282715, "global_step": 99048, "epoch": 2358} {"train_loss": -6.33317756652832, "global_step": 99049, "epoch": 2358} {"train_loss": -6.246192455291748, "global_step": 99050, "epoch": 2358} {"train_loss": -6.255102157592773, "global_step": 99051, "epoch": 2358} {"train_loss": -6.28070592880249, "global_step": 99052, "epoch": 2358} {"train_loss": -6.419336318969727, "global_step": 99053, "epoch": 2358} {"train_loss": -6.3100996017456055, "global_step": 99054, "epoch": 2358} {"train_loss": -6.367778778076172, "global_step": 99055, "epoch": 2358} {"train_loss": -6.246433734893799, "global_step": 99056, "epoch": 2358} {"train_loss": -6.446268081665039, "global_step": 99057, "epoch": 2358} {"train_loss": -6.321650981903076, "global_step": 99058, "epoch": 2358} {"train_loss": -6.255199909210205, "global_step": 99059, "epoch": 2358} {"train_loss": -6.236220359802246, "global_step": 99060, "epoch": 2358} {"train_loss": -6.301999092102051, "global_step": 99061, "epoch": 2358} {"train_loss": -6.299125671386719, "global_step": 99062, "epoch": 2358} {"train_loss": -6.307197093963623, "global_step": 99063, "epoch": 2358} {"train_loss": -6.3789143562316895, "global_step": 99064, "epoch": 2358} {"train_loss": -6.321802139282227, "global_step": 99065, "epoch": 2358} {"train_loss": -6.109426498413086, "global_step": 99066, "epoch": 2358} {"train_loss": -6.2967529296875, "global_step": 99067, "epoch": 2358} {"train_loss": -6.2437334060668945, "global_step": 99068, "epoch": 2358} {"train_loss": -6.394063949584961, "global_step": 99069, "epoch": 2358} {"train_loss": -6.349283218383789, "global_step": 99070, "epoch": 2358} {"train_loss": -6.448572158813477, "global_step": 99071, "epoch": 2358} {"train_loss": -6.29698371887207, "global_step": 99072, "epoch": 2358} {"train_loss": -6.426546573638916, "global_step": 99073, "epoch": 2358} {"train_loss": -6.294429302215576, "global_step": 99074, "epoch": 2358} {"train_loss": -6.211009979248047, "global_step": 99075, "epoch": 2358} {"train_loss": -6.3421196937561035, "global_step": 99076, "epoch": 2358} {"train_loss": -6.30931492078872, "global_step": 99077, "epoch": 2358, "val_loss": 75794.578125} {"train_loss": -6.429254531860352, "global_step": 99078, "epoch": 2359} {"train_loss": -6.269705772399902, "global_step": 99079, "epoch": 2359} {"train_loss": -6.299515724182129, "global_step": 99080, "epoch": 2359} {"train_loss": -6.279537677764893, "global_step": 99081, "epoch": 2359} {"train_loss": -6.2280097007751465, "global_step": 99082, "epoch": 2359} {"train_loss": -6.222506523132324, "global_step": 99083, "epoch": 2359} {"train_loss": -6.353907585144043, "global_step": 99084, "epoch": 2359} {"train_loss": -6.397745132446289, "global_step": 99085, "epoch": 2359} {"train_loss": -6.454657554626465, "global_step": 99086, "epoch": 2359} {"train_loss": -6.321843147277832, "global_step": 99087, "epoch": 2359} {"train_loss": -6.342148780822754, "global_step": 99088, "epoch": 2359} {"train_loss": -6.266347408294678, "global_step": 99089, "epoch": 2359} {"train_loss": -6.306452751159668, "global_step": 99090, "epoch": 2359} {"train_loss": -6.300443172454834, "global_step": 99091, "epoch": 2359} {"train_loss": -6.346220970153809, "global_step": 99092, "epoch": 2359} {"train_loss": -6.272729396820068, "global_step": 99093, "epoch": 2359} {"train_loss": -6.205504417419434, "global_step": 99094, "epoch": 2359} {"train_loss": -6.396186828613281, "global_step": 99095, "epoch": 2359} {"train_loss": -6.282977104187012, "global_step": 99096, "epoch": 2359} {"train_loss": -6.178463459014893, "global_step": 99097, "epoch": 2359} {"train_loss": -6.292689800262451, "global_step": 99098, "epoch": 2359} {"train_loss": -6.386581897735596, "global_step": 99099, "epoch": 2359} {"train_loss": -6.2644805908203125, "global_step": 99100, "epoch": 2359} {"train_loss": -6.3148193359375, "global_step": 99101, "epoch": 2359} {"train_loss": -6.335713863372803, "global_step": 99102, "epoch": 2359} {"train_loss": -6.351741790771484, "global_step": 99103, "epoch": 2359} {"train_loss": -6.351596355438232, "global_step": 99104, "epoch": 2359} {"train_loss": -6.39915132522583, "global_step": 99105, "epoch": 2359} {"train_loss": -6.356113910675049, "global_step": 99106, "epoch": 2359} {"train_loss": -6.438681125640869, "global_step": 99107, "epoch": 2359} {"train_loss": -6.328343391418457, "global_step": 99108, "epoch": 2359} {"train_loss": -6.43220329284668, "global_step": 99109, "epoch": 2359} {"train_loss": -6.332945823669434, "global_step": 99110, "epoch": 2359} {"train_loss": -6.266813278198242, "global_step": 99111, "epoch": 2359} {"train_loss": -6.345608234405518, "global_step": 99112, "epoch": 2359} {"train_loss": -6.523914337158203, "global_step": 99113, "epoch": 2359} {"train_loss": -6.253925323486328, "global_step": 99114, "epoch": 2359} {"train_loss": -6.3625898361206055, "global_step": 99115, "epoch": 2359} {"train_loss": -6.277217864990234, "global_step": 99116, "epoch": 2359} {"train_loss": -6.400027275085449, "global_step": 99117, "epoch": 2359} {"train_loss": -6.326854705810547, "global_step": 99118, "epoch": 2359} {"train_loss": -6.3313463642483665, "global_step": 99119, "epoch": 2359, "val_loss": 75859.0859375} {"train_loss": -6.3025803565979, "global_step": 99120, "epoch": 2360} {"train_loss": -6.2209577560424805, "global_step": 99121, "epoch": 2360} {"train_loss": -6.376613616943359, "global_step": 99122, "epoch": 2360} {"train_loss": -6.282772064208984, "global_step": 99123, "epoch": 2360} {"train_loss": -6.245816230773926, "global_step": 99124, "epoch": 2360} {"train_loss": -6.447659492492676, "global_step": 99125, "epoch": 2360} {"train_loss": -6.326645851135254, "global_step": 99126, "epoch": 2360} {"train_loss": -6.353195667266846, "global_step": 99127, "epoch": 2360} {"train_loss": -6.324752330780029, "global_step": 99128, "epoch": 2360} {"train_loss": -6.3354291915893555, "global_step": 99129, "epoch": 2360} {"train_loss": -6.292015075683594, "global_step": 99130, "epoch": 2360} {"train_loss": -6.2835187911987305, "global_step": 99131, "epoch": 2360} {"train_loss": -6.370640754699707, "global_step": 99132, "epoch": 2360} {"train_loss": -6.386049270629883, "global_step": 99133, "epoch": 2360} {"train_loss": -6.16895055770874, "global_step": 99134, "epoch": 2360} {"train_loss": -6.3432722091674805, "global_step": 99135, "epoch": 2360} {"train_loss": -6.2306413650512695, "global_step": 99136, "epoch": 2360} {"train_loss": -6.217643737792969, "global_step": 99137, "epoch": 2360} {"train_loss": -6.356237411499023, "global_step": 99138, "epoch": 2360} {"train_loss": -6.275300979614258, "global_step": 99139, "epoch": 2360} {"train_loss": -6.3825788497924805, "global_step": 99140, "epoch": 2360} {"train_loss": -6.248840808868408, "global_step": 99141, "epoch": 2360} {"train_loss": -6.328014373779297, "global_step": 99142, "epoch": 2360} {"train_loss": -6.319754123687744, "global_step": 99143, "epoch": 2360} {"train_loss": -6.329590797424316, "global_step": 99144, "epoch": 2360} {"train_loss": -6.318016529083252, "global_step": 99145, "epoch": 2360} {"train_loss": -6.28507137298584, "global_step": 99146, "epoch": 2360} {"train_loss": -6.281127452850342, "global_step": 99147, "epoch": 2360} {"train_loss": -6.371367931365967, "global_step": 99148, "epoch": 2360} {"train_loss": -6.237790107727051, "global_step": 99149, "epoch": 2360} {"train_loss": -6.314307689666748, "global_step": 99150, "epoch": 2360} {"train_loss": -6.135231971740723, "global_step": 99151, "epoch": 2360} {"train_loss": -6.141005039215088, "global_step": 99152, "epoch": 2360} {"train_loss": -6.285683631896973, "global_step": 99153, "epoch": 2360} {"train_loss": -6.300373077392578, "global_step": 99154, "epoch": 2360} {"train_loss": -6.174659729003906, "global_step": 99155, "epoch": 2360} {"train_loss": -6.282144546508789, "global_step": 99156, "epoch": 2360} {"train_loss": -6.043618202209473, "global_step": 99157, "epoch": 2360} {"train_loss": -6.138882637023926, "global_step": 99158, "epoch": 2360} {"train_loss": -6.185300827026367, "global_step": 99159, "epoch": 2360} {"train_loss": -6.16619873046875, "global_step": 99160, "epoch": 2360} {"train_loss": -6.2814896901448565, "global_step": 99161, "epoch": 2360, "val_loss": 76011.6015625} {"train_loss": -6.117821216583252, "global_step": 99162, "epoch": 2361} {"train_loss": -6.45115852355957, "global_step": 99163, "epoch": 2361} {"train_loss": -6.147345542907715, "global_step": 99164, "epoch": 2361} {"train_loss": -6.378778457641602, "global_step": 99165, "epoch": 2361} {"train_loss": -6.178531646728516, "global_step": 99166, "epoch": 2361} {"train_loss": -6.248199462890625, "global_step": 99167, "epoch": 2361} {"train_loss": -6.354809761047363, "global_step": 99168, "epoch": 2361} {"train_loss": -6.385546684265137, "global_step": 99169, "epoch": 2361} {"train_loss": -6.358526229858398, "global_step": 99170, "epoch": 2361} {"train_loss": -6.310116291046143, "global_step": 99171, "epoch": 2361} {"train_loss": -6.184842109680176, "global_step": 99172, "epoch": 2361} {"train_loss": -6.2460784912109375, "global_step": 99173, "epoch": 2361} {"train_loss": -6.278573036193848, "global_step": 99174, "epoch": 2361} {"train_loss": -6.335465431213379, "global_step": 99175, "epoch": 2361} {"train_loss": -6.4166998863220215, "global_step": 99176, "epoch": 2361} {"train_loss": -6.3835320472717285, "global_step": 99177, "epoch": 2361} {"train_loss": -6.3365607261657715, "global_step": 99178, "epoch": 2361} {"train_loss": -6.362090587615967, "global_step": 99179, "epoch": 2361} {"train_loss": -6.211138725280762, "global_step": 99180, "epoch": 2361} {"train_loss": -6.379870891571045, "global_step": 99181, "epoch": 2361} {"train_loss": -6.431550025939941, "global_step": 99182, "epoch": 2361} {"train_loss": -6.3980488777160645, "global_step": 99183, "epoch": 2361} {"train_loss": -6.491659164428711, "global_step": 99184, "epoch": 2361} {"train_loss": -6.459336280822754, "global_step": 99185, "epoch": 2361} {"train_loss": -6.458371639251709, "global_step": 99186, "epoch": 2361} {"train_loss": -6.352239608764648, "global_step": 99187, "epoch": 2361} {"train_loss": -6.3400163650512695, "global_step": 99188, "epoch": 2361} {"train_loss": -6.452030181884766, "global_step": 99189, "epoch": 2361} {"train_loss": -6.220541477203369, "global_step": 99190, "epoch": 2361} {"train_loss": -6.342670440673828, "global_step": 99191, "epoch": 2361} {"train_loss": -6.3834228515625, "global_step": 99192, "epoch": 2361} {"train_loss": -6.36760139465332, "global_step": 99193, "epoch": 2361} {"train_loss": -6.204387187957764, "global_step": 99194, "epoch": 2361} {"train_loss": -6.367761135101318, "global_step": 99195, "epoch": 2361} {"train_loss": -6.364340782165527, "global_step": 99196, "epoch": 2361} {"train_loss": -6.392799377441406, "global_step": 99197, "epoch": 2361} {"train_loss": -6.302109241485596, "global_step": 99198, "epoch": 2361} {"train_loss": -6.252009868621826, "global_step": 99199, "epoch": 2361} {"train_loss": -6.2222442626953125, "global_step": 99200, "epoch": 2361} {"train_loss": -6.390297889709473, "global_step": 99201, "epoch": 2361} {"train_loss": -6.292301177978516, "global_step": 99202, "epoch": 2361} {"train_loss": -6.328098512831188, "global_step": 99203, "epoch": 2361, "val_loss": 75731.1015625} {"train_loss": -6.44210147857666, "global_step": 99204, "epoch": 2362} {"train_loss": -6.371151447296143, "global_step": 99205, "epoch": 2362} {"train_loss": -6.311472415924072, "global_step": 99206, "epoch": 2362} {"train_loss": -6.292633533477783, "global_step": 99207, "epoch": 2362} {"train_loss": -6.335968494415283, "global_step": 99208, "epoch": 2362} {"train_loss": -6.3719635009765625, "global_step": 99209, "epoch": 2362} {"train_loss": -6.418490409851074, "global_step": 99210, "epoch": 2362} {"train_loss": -6.270932197570801, "global_step": 99211, "epoch": 2362} {"train_loss": -6.421665191650391, "global_step": 99212, "epoch": 2362} {"train_loss": -6.315184593200684, "global_step": 99213, "epoch": 2362} {"train_loss": -6.368163108825684, "global_step": 99214, "epoch": 2362} {"train_loss": -6.363433361053467, "global_step": 99215, "epoch": 2362} {"train_loss": -6.392214775085449, "global_step": 99216, "epoch": 2362} {"train_loss": -6.391993522644043, "global_step": 99217, "epoch": 2362} {"train_loss": -6.44397497177124, "global_step": 99218, "epoch": 2362} {"train_loss": -6.482354164123535, "global_step": 99219, "epoch": 2362} {"train_loss": -6.311139106750488, "global_step": 99220, "epoch": 2362} {"train_loss": -6.414381980895996, "global_step": 99221, "epoch": 2362} {"train_loss": -6.351079940795898, "global_step": 99222, "epoch": 2362} {"train_loss": -6.356125354766846, "global_step": 99223, "epoch": 2362} {"train_loss": -6.366397857666016, "global_step": 99224, "epoch": 2362} {"train_loss": -6.321752071380615, "global_step": 99225, "epoch": 2362} {"train_loss": -6.388261795043945, "global_step": 99226, "epoch": 2362} {"train_loss": -6.414979934692383, "global_step": 99227, "epoch": 2362} {"train_loss": -6.454085350036621, "global_step": 99228, "epoch": 2362} {"train_loss": -6.376787185668945, "global_step": 99229, "epoch": 2362} {"train_loss": -6.399452209472656, "global_step": 99230, "epoch": 2362} {"train_loss": -6.3605194091796875, "global_step": 99231, "epoch": 2362} {"train_loss": -6.379603862762451, "global_step": 99232, "epoch": 2362} {"train_loss": -6.364592552185059, "global_step": 99233, "epoch": 2362} {"train_loss": -6.339072227478027, "global_step": 99234, "epoch": 2362} {"train_loss": -6.4609174728393555, "global_step": 99235, "epoch": 2362} {"train_loss": -6.259150505065918, "global_step": 99236, "epoch": 2362} {"train_loss": -6.370091438293457, "global_step": 99237, "epoch": 2362} {"train_loss": -6.421406269073486, "global_step": 99238, "epoch": 2362} {"train_loss": -6.276409149169922, "global_step": 99239, "epoch": 2362} {"train_loss": -6.444572448730469, "global_step": 99240, "epoch": 2362} {"train_loss": -6.386068344116211, "global_step": 99241, "epoch": 2362} {"train_loss": -6.405098915100098, "global_step": 99242, "epoch": 2362} {"train_loss": -6.322694778442383, "global_step": 99243, "epoch": 2362} {"train_loss": -6.444548606872559, "global_step": 99244, "epoch": 2362} {"train_loss": -6.375028780528477, "global_step": 99245, "epoch": 2362, "val_loss": 75740.234375} {"train_loss": -6.4009785652160645, "global_step": 99246, "epoch": 2363} {"train_loss": -6.341319561004639, "global_step": 99247, "epoch": 2363} {"train_loss": -6.416470050811768, "global_step": 99248, "epoch": 2363} {"train_loss": -6.357539176940918, "global_step": 99249, "epoch": 2363} {"train_loss": -6.368680953979492, "global_step": 99250, "epoch": 2363} {"train_loss": -6.339723587036133, "global_step": 99251, "epoch": 2363} {"train_loss": -6.196255683898926, "global_step": 99252, "epoch": 2363} {"train_loss": -6.284815311431885, "global_step": 99253, "epoch": 2363} {"train_loss": -6.197648525238037, "global_step": 99254, "epoch": 2363} {"train_loss": -6.205541133880615, "global_step": 99255, "epoch": 2363} {"train_loss": -6.36103630065918, "global_step": 99256, "epoch": 2363} {"train_loss": -6.214687347412109, "global_step": 99257, "epoch": 2363} {"train_loss": -6.318286895751953, "global_step": 99258, "epoch": 2363} {"train_loss": -6.283810615539551, "global_step": 99259, "epoch": 2363} {"train_loss": -6.233400821685791, "global_step": 99260, "epoch": 2363} {"train_loss": -6.405081748962402, "global_step": 99261, "epoch": 2363} {"train_loss": -6.298800468444824, "global_step": 99262, "epoch": 2363} {"train_loss": -6.416728973388672, "global_step": 99263, "epoch": 2363} {"train_loss": -6.43483829498291, "global_step": 99264, "epoch": 2363} {"train_loss": -6.2737956047058105, "global_step": 99265, "epoch": 2363} {"train_loss": -6.3094482421875, "global_step": 99266, "epoch": 2363} {"train_loss": -6.413453102111816, "global_step": 99267, "epoch": 2363} {"train_loss": -6.2369585037231445, "global_step": 99268, "epoch": 2363} {"train_loss": -6.268177032470703, "global_step": 99269, "epoch": 2363} {"train_loss": -6.316553115844727, "global_step": 99270, "epoch": 2363} {"train_loss": -6.433835506439209, "global_step": 99271, "epoch": 2363} {"train_loss": -6.435027122497559, "global_step": 99272, "epoch": 2363} {"train_loss": -6.2253193855285645, "global_step": 99273, "epoch": 2363} {"train_loss": -6.372343063354492, "global_step": 99274, "epoch": 2363} {"train_loss": -6.248984336853027, "global_step": 99275, "epoch": 2363} {"train_loss": -6.479485988616943, "global_step": 99276, "epoch": 2363} {"train_loss": -6.350770950317383, "global_step": 99277, "epoch": 2363} {"train_loss": -6.321089744567871, "global_step": 99278, "epoch": 2363} {"train_loss": -6.229894161224365, "global_step": 99279, "epoch": 2363} {"train_loss": -6.369235038757324, "global_step": 99280, "epoch": 2363} {"train_loss": -6.336933612823486, "global_step": 99281, "epoch": 2363} {"train_loss": -6.311502456665039, "global_step": 99282, "epoch": 2363} {"train_loss": -6.362791061401367, "global_step": 99283, "epoch": 2363} {"train_loss": -6.26692533493042, "global_step": 99284, "epoch": 2363} {"train_loss": -6.334500789642334, "global_step": 99285, "epoch": 2363} {"train_loss": -6.389907360076904, "global_step": 99286, "epoch": 2363} {"train_loss": -6.325648637044997, "global_step": 99287, "epoch": 2363, "val_loss": 75634.6875} {"train_loss": -6.403509140014648, "global_step": 99288, "epoch": 2364} {"train_loss": -6.2873992919921875, "global_step": 99289, "epoch": 2364} {"train_loss": -6.399999141693115, "global_step": 99290, "epoch": 2364} {"train_loss": -6.316322326660156, "global_step": 99291, "epoch": 2364} {"train_loss": -6.357697486877441, "global_step": 99292, "epoch": 2364} {"train_loss": -6.481678009033203, "global_step": 99293, "epoch": 2364} {"train_loss": -6.40364933013916, "global_step": 99294, "epoch": 2364} {"train_loss": -6.450378894805908, "global_step": 99295, "epoch": 2364} {"train_loss": -6.264826774597168, "global_step": 99296, "epoch": 2364} {"train_loss": -6.345141410827637, "global_step": 99297, "epoch": 2364} {"train_loss": -6.360273361206055, "global_step": 99298, "epoch": 2364} {"train_loss": -6.242191314697266, "global_step": 99299, "epoch": 2364} {"train_loss": -6.360991477966309, "global_step": 99300, "epoch": 2364} {"train_loss": -6.36356258392334, "global_step": 99301, "epoch": 2364} {"train_loss": -6.4006476402282715, "global_step": 99302, "epoch": 2364} {"train_loss": -6.330131530761719, "global_step": 99303, "epoch": 2364} {"train_loss": -6.383703231811523, "global_step": 99304, "epoch": 2364} {"train_loss": -6.374454021453857, "global_step": 99305, "epoch": 2364} {"train_loss": -6.284289360046387, "global_step": 99306, "epoch": 2364} {"train_loss": -6.388542175292969, "global_step": 99307, "epoch": 2364} {"train_loss": -6.2782087326049805, "global_step": 99308, "epoch": 2364} {"train_loss": -6.325207710266113, "global_step": 99309, "epoch": 2364} {"train_loss": -6.294218063354492, "global_step": 99310, "epoch": 2364} {"train_loss": -6.410543441772461, "global_step": 99311, "epoch": 2364} {"train_loss": -6.4735260009765625, "global_step": 99312, "epoch": 2364} {"train_loss": -6.335920810699463, "global_step": 99313, "epoch": 2364} {"train_loss": -6.348916530609131, "global_step": 99314, "epoch": 2364} {"train_loss": -6.337540149688721, "global_step": 99315, "epoch": 2364} {"train_loss": -6.432079315185547, "global_step": 99316, "epoch": 2364} {"train_loss": -6.483557224273682, "global_step": 99317, "epoch": 2364} {"train_loss": -6.3596906661987305, "global_step": 99318, "epoch": 2364} {"train_loss": -6.336217880249023, "global_step": 99319, "epoch": 2364} {"train_loss": -6.360191345214844, "global_step": 99320, "epoch": 2364} {"train_loss": -6.438915252685547, "global_step": 99321, "epoch": 2364} {"train_loss": -6.429508209228516, "global_step": 99322, "epoch": 2364} {"train_loss": -6.406398296356201, "global_step": 99323, "epoch": 2364} {"train_loss": -6.403233528137207, "global_step": 99324, "epoch": 2364} {"train_loss": -6.336390972137451, "global_step": 99325, "epoch": 2364} {"train_loss": -6.435130596160889, "global_step": 99326, "epoch": 2364} {"train_loss": -6.2851481437683105, "global_step": 99327, "epoch": 2364} {"train_loss": -6.344891548156738, "global_step": 99328, "epoch": 2364} {"train_loss": -6.370845249720982, "global_step": 99329, "epoch": 2364, "val_loss": 75740.1796875} {"train_loss": -6.282764911651611, "global_step": 99330, "epoch": 2365} {"train_loss": -6.345276832580566, "global_step": 99331, "epoch": 2365} {"train_loss": -6.370772361755371, "global_step": 99332, "epoch": 2365} {"train_loss": -6.292304039001465, "global_step": 99333, "epoch": 2365} {"train_loss": -6.344038963317871, "global_step": 99334, "epoch": 2365} {"train_loss": -6.438424110412598, "global_step": 99335, "epoch": 2365} {"train_loss": -6.393009662628174, "global_step": 99336, "epoch": 2365} {"train_loss": -6.439800262451172, "global_step": 99337, "epoch": 2365} {"train_loss": -6.287161827087402, "global_step": 99338, "epoch": 2365} {"train_loss": -6.372106552124023, "global_step": 99339, "epoch": 2365} {"train_loss": -6.341167449951172, "global_step": 99340, "epoch": 2365} {"train_loss": -6.303012847900391, "global_step": 99341, "epoch": 2365} {"train_loss": -6.4898834228515625, "global_step": 99342, "epoch": 2365} {"train_loss": -6.3491692543029785, "global_step": 99343, "epoch": 2365} {"train_loss": -6.366863250732422, "global_step": 99344, "epoch": 2365} {"train_loss": -6.374617576599121, "global_step": 99345, "epoch": 2365} {"train_loss": -6.322721004486084, "global_step": 99346, "epoch": 2365} {"train_loss": -6.305681228637695, "global_step": 99347, "epoch": 2365} {"train_loss": -6.328702926635742, "global_step": 99348, "epoch": 2365} {"train_loss": -6.382791042327881, "global_step": 99349, "epoch": 2365} {"train_loss": -6.417679786682129, "global_step": 99350, "epoch": 2365} {"train_loss": -6.338736534118652, "global_step": 99351, "epoch": 2365} {"train_loss": -6.3692522048950195, "global_step": 99352, "epoch": 2365} {"train_loss": -6.349064826965332, "global_step": 99353, "epoch": 2365} {"train_loss": -6.317902565002441, "global_step": 99354, "epoch": 2365} {"train_loss": -6.3852057456970215, "global_step": 99355, "epoch": 2365} {"train_loss": -6.45867919921875, "global_step": 99356, "epoch": 2365} {"train_loss": -6.308394908905029, "global_step": 99357, "epoch": 2365} {"train_loss": -6.366913318634033, "global_step": 99358, "epoch": 2365} {"train_loss": -6.329878807067871, "global_step": 99359, "epoch": 2365} {"train_loss": -6.293234825134277, "global_step": 99360, "epoch": 2365} {"train_loss": -6.276171684265137, "global_step": 99361, "epoch": 2365} {"train_loss": -6.295594215393066, "global_step": 99362, "epoch": 2365} {"train_loss": -6.193330764770508, "global_step": 99363, "epoch": 2365} {"train_loss": -6.37955379486084, "global_step": 99364, "epoch": 2365} {"train_loss": -6.293148994445801, "global_step": 99365, "epoch": 2365} {"train_loss": -6.37803316116333, "global_step": 99366, "epoch": 2365} {"train_loss": -6.445562362670898, "global_step": 99367, "epoch": 2365} {"train_loss": -6.253761291503906, "global_step": 99368, "epoch": 2365} {"train_loss": -6.455507278442383, "global_step": 99369, "epoch": 2365} {"train_loss": -6.286184310913086, "global_step": 99370, "epoch": 2365} {"train_loss": -6.345565364474342, "global_step": 99371, "epoch": 2365, "val_loss": 75795.1484375} {"train_loss": -6.322542667388916, "global_step": 99372, "epoch": 2366} {"train_loss": -6.349932670593262, "global_step": 99373, "epoch": 2366} {"train_loss": -6.162527084350586, "global_step": 99374, "epoch": 2366} {"train_loss": -6.311685562133789, "global_step": 99375, "epoch": 2366} {"train_loss": -6.3290934562683105, "global_step": 99376, "epoch": 2366} {"train_loss": -6.4046406745910645, "global_step": 99377, "epoch": 2366} {"train_loss": -6.336493492126465, "global_step": 99378, "epoch": 2366} {"train_loss": -6.2767438888549805, "global_step": 99379, "epoch": 2366} {"train_loss": -6.350297451019287, "global_step": 99380, "epoch": 2366} {"train_loss": -6.275697231292725, "global_step": 99381, "epoch": 2366} {"train_loss": -6.387208938598633, "global_step": 99382, "epoch": 2366} {"train_loss": -6.315378189086914, "global_step": 99383, "epoch": 2366} {"train_loss": -6.426059722900391, "global_step": 99384, "epoch": 2366} {"train_loss": -6.341041564941406, "global_step": 99385, "epoch": 2366} {"train_loss": -6.454549789428711, "global_step": 99386, "epoch": 2366} {"train_loss": -6.317683696746826, "global_step": 99387, "epoch": 2366} {"train_loss": -6.288568019866943, "global_step": 99388, "epoch": 2366} {"train_loss": -6.4055986404418945, "global_step": 99389, "epoch": 2366} {"train_loss": -6.443014144897461, "global_step": 99390, "epoch": 2366} {"train_loss": -6.379031181335449, "global_step": 99391, "epoch": 2366} {"train_loss": -6.300140380859375, "global_step": 99392, "epoch": 2366} {"train_loss": -6.285850524902344, "global_step": 99393, "epoch": 2366} {"train_loss": -6.205243110656738, "global_step": 99394, "epoch": 2366} {"train_loss": -6.2840704917907715, "global_step": 99395, "epoch": 2366} {"train_loss": -6.408738136291504, "global_step": 99396, "epoch": 2366} {"train_loss": -6.347472190856934, "global_step": 99397, "epoch": 2366} {"train_loss": -6.302459716796875, "global_step": 99398, "epoch": 2366} {"train_loss": -6.367164611816406, "global_step": 99399, "epoch": 2366} {"train_loss": -6.437904357910156, "global_step": 99400, "epoch": 2366} {"train_loss": -6.347774505615234, "global_step": 99401, "epoch": 2366} {"train_loss": -6.409852027893066, "global_step": 99402, "epoch": 2366} {"train_loss": -6.249770164489746, "global_step": 99403, "epoch": 2366} {"train_loss": -6.353365898132324, "global_step": 99404, "epoch": 2366} {"train_loss": -6.293933391571045, "global_step": 99405, "epoch": 2366} {"train_loss": -6.256651878356934, "global_step": 99406, "epoch": 2366} {"train_loss": -6.345183372497559, "global_step": 99407, "epoch": 2366} {"train_loss": -6.285120964050293, "global_step": 99408, "epoch": 2366} {"train_loss": -6.452579498291016, "global_step": 99409, "epoch": 2366} {"train_loss": -6.36615514755249, "global_step": 99410, "epoch": 2366} {"train_loss": -6.348727226257324, "global_step": 99411, "epoch": 2366} {"train_loss": -6.412473678588867, "global_step": 99412, "epoch": 2366} {"train_loss": -6.340854008992513, "global_step": 99413, "epoch": 2366, "val_loss": 75900.8359375} {"train_loss": -6.3659987449646, "global_step": 99414, "epoch": 2367} {"train_loss": -6.368587493896484, "global_step": 99415, "epoch": 2367} {"train_loss": -6.3819122314453125, "global_step": 99416, "epoch": 2367} {"train_loss": -6.407196998596191, "global_step": 99417, "epoch": 2367} {"train_loss": -6.336127758026123, "global_step": 99418, "epoch": 2367} {"train_loss": -6.40844202041626, "global_step": 99419, "epoch": 2367} {"train_loss": -6.290248394012451, "global_step": 99420, "epoch": 2367} {"train_loss": -6.356232166290283, "global_step": 99421, "epoch": 2367} {"train_loss": -6.5125579833984375, "global_step": 99422, "epoch": 2367} {"train_loss": -6.352201461791992, "global_step": 99423, "epoch": 2367} {"train_loss": -6.338682174682617, "global_step": 99424, "epoch": 2367} {"train_loss": -6.350411415100098, "global_step": 99425, "epoch": 2367} {"train_loss": -6.455314636230469, "global_step": 99426, "epoch": 2367} {"train_loss": -6.455486297607422, "global_step": 99427, "epoch": 2367} {"train_loss": -6.370669841766357, "global_step": 99428, "epoch": 2367} {"train_loss": -6.243416786193848, "global_step": 99429, "epoch": 2367} {"train_loss": -6.456879615783691, "global_step": 99430, "epoch": 2367} {"train_loss": -6.359076023101807, "global_step": 99431, "epoch": 2367} {"train_loss": -6.457079887390137, "global_step": 99432, "epoch": 2367} {"train_loss": -6.387622356414795, "global_step": 99433, "epoch": 2367} {"train_loss": -6.360342502593994, "global_step": 99434, "epoch": 2367} {"train_loss": -6.37269401550293, "global_step": 99435, "epoch": 2367} {"train_loss": -6.361310005187988, "global_step": 99436, "epoch": 2367} {"train_loss": -6.2209625244140625, "global_step": 99437, "epoch": 2367} {"train_loss": -6.409195899963379, "global_step": 99438, "epoch": 2367} {"train_loss": -6.284377098083496, "global_step": 99439, "epoch": 2367} {"train_loss": -6.4027886390686035, "global_step": 99440, "epoch": 2367} {"train_loss": -6.370922088623047, "global_step": 99441, "epoch": 2367} {"train_loss": -6.461041450500488, "global_step": 99442, "epoch": 2367} {"train_loss": -6.328240871429443, "global_step": 99443, "epoch": 2367} {"train_loss": -6.335925102233887, "global_step": 99444, "epoch": 2367} {"train_loss": -6.401819229125977, "global_step": 99445, "epoch": 2367} {"train_loss": -6.200046539306641, "global_step": 99446, "epoch": 2367} {"train_loss": -6.395928859710693, "global_step": 99447, "epoch": 2367} {"train_loss": -6.384152889251709, "global_step": 99448, "epoch": 2367} {"train_loss": -6.401371955871582, "global_step": 99449, "epoch": 2367} {"train_loss": -6.434983253479004, "global_step": 99450, "epoch": 2367} {"train_loss": -6.346523284912109, "global_step": 99451, "epoch": 2367} {"train_loss": -6.4914469718933105, "global_step": 99452, "epoch": 2367} {"train_loss": -6.479853630065918, "global_step": 99453, "epoch": 2367} {"train_loss": -6.393555641174316, "global_step": 99454, "epoch": 2367} {"train_loss": -6.3760183084578745, "global_step": 99455, "epoch": 2367, "val_loss": 75868.5546875} {"train_loss": -6.408830642700195, "global_step": 99456, "epoch": 2368} {"train_loss": -6.454689979553223, "global_step": 99457, "epoch": 2368} {"train_loss": -6.526513576507568, "global_step": 99458, "epoch": 2368} {"train_loss": -6.420529365539551, "global_step": 99459, "epoch": 2368} {"train_loss": -6.355743408203125, "global_step": 99460, "epoch": 2368} {"train_loss": -6.323015213012695, "global_step": 99461, "epoch": 2368} {"train_loss": -6.291886329650879, "global_step": 99462, "epoch": 2368} {"train_loss": -6.323329925537109, "global_step": 99463, "epoch": 2368} {"train_loss": -6.291363716125488, "global_step": 99464, "epoch": 2368} {"train_loss": -6.211884498596191, "global_step": 99465, "epoch": 2368} {"train_loss": -6.264830589294434, "global_step": 99466, "epoch": 2368} {"train_loss": -6.340925216674805, "global_step": 99467, "epoch": 2368} {"train_loss": -6.401684761047363, "global_step": 99468, "epoch": 2368} {"train_loss": -6.272760391235352, "global_step": 99469, "epoch": 2368} {"train_loss": -6.200732231140137, "global_step": 99470, "epoch": 2368} {"train_loss": -6.335179328918457, "global_step": 99471, "epoch": 2368} {"train_loss": -6.218494415283203, "global_step": 99472, "epoch": 2368} {"train_loss": -6.199982166290283, "global_step": 99473, "epoch": 2368} {"train_loss": -6.2504472732543945, "global_step": 99474, "epoch": 2368} {"train_loss": -6.255441665649414, "global_step": 99475, "epoch": 2368} {"train_loss": -6.267123222351074, "global_step": 99476, "epoch": 2368} {"train_loss": -6.200629234313965, "global_step": 99477, "epoch": 2368} {"train_loss": -6.246947765350342, "global_step": 99478, "epoch": 2368} {"train_loss": -6.29762077331543, "global_step": 99479, "epoch": 2368} {"train_loss": -6.304104804992676, "global_step": 99480, "epoch": 2368} {"train_loss": -6.252135276794434, "global_step": 99481, "epoch": 2368} {"train_loss": -6.313397407531738, "global_step": 99482, "epoch": 2368} {"train_loss": -6.346050262451172, "global_step": 99483, "epoch": 2368} {"train_loss": -6.362577438354492, "global_step": 99484, "epoch": 2368} {"train_loss": -6.214877128601074, "global_step": 99485, "epoch": 2368} {"train_loss": -6.290963172912598, "global_step": 99486, "epoch": 2368} {"train_loss": -6.160966873168945, "global_step": 99487, "epoch": 2368} {"train_loss": -6.320974349975586, "global_step": 99488, "epoch": 2368} {"train_loss": -6.218897819519043, "global_step": 99489, "epoch": 2368} {"train_loss": -6.362881660461426, "global_step": 99490, "epoch": 2368} {"train_loss": -6.329105854034424, "global_step": 99491, "epoch": 2368} {"train_loss": -6.164882659912109, "global_step": 99492, "epoch": 2368} {"train_loss": -6.315547466278076, "global_step": 99493, "epoch": 2368} {"train_loss": -6.343077659606934, "global_step": 99494, "epoch": 2368} {"train_loss": -6.262979984283447, "global_step": 99495, "epoch": 2368} {"train_loss": -6.3175950050354, "global_step": 99496, "epoch": 2368} {"train_loss": -6.299312057949248, "global_step": 99497, "epoch": 2368, "val_loss": 75681.4765625} {"train_loss": -6.360245704650879, "global_step": 99498, "epoch": 2369} {"train_loss": -6.281512260437012, "global_step": 99499, "epoch": 2369} {"train_loss": -6.280655860900879, "global_step": 99500, "epoch": 2369} {"train_loss": -6.238881587982178, "global_step": 99501, "epoch": 2369} {"train_loss": -6.317372798919678, "global_step": 99502, "epoch": 2369} {"train_loss": -6.340736389160156, "global_step": 99503, "epoch": 2369} {"train_loss": -6.222500801086426, "global_step": 99504, "epoch": 2369} {"train_loss": -6.332761764526367, "global_step": 99505, "epoch": 2369} {"train_loss": -6.25112247467041, "global_step": 99506, "epoch": 2369} {"train_loss": -6.247326850891113, "global_step": 99507, "epoch": 2369} {"train_loss": -6.34943151473999, "global_step": 99508, "epoch": 2369} {"train_loss": -6.387775897979736, "global_step": 99509, "epoch": 2369} {"train_loss": -6.15609073638916, "global_step": 99510, "epoch": 2369} {"train_loss": -6.416141510009766, "global_step": 99511, "epoch": 2369} {"train_loss": -6.311174392700195, "global_step": 99512, "epoch": 2369} {"train_loss": -6.284502983093262, "global_step": 99513, "epoch": 2369} {"train_loss": -6.317173957824707, "global_step": 99514, "epoch": 2369} {"train_loss": -6.276284694671631, "global_step": 99515, "epoch": 2369} {"train_loss": -6.284555912017822, "global_step": 99516, "epoch": 2369} {"train_loss": -6.415070533752441, "global_step": 99517, "epoch": 2369} {"train_loss": -6.372396469116211, "global_step": 99518, "epoch": 2369} {"train_loss": -6.331040382385254, "global_step": 99519, "epoch": 2369} {"train_loss": -6.370511054992676, "global_step": 99520, "epoch": 2369} {"train_loss": -6.307417869567871, "global_step": 99521, "epoch": 2369} {"train_loss": -6.380944728851318, "global_step": 99522, "epoch": 2369} {"train_loss": -6.304157257080078, "global_step": 99523, "epoch": 2369} {"train_loss": -6.41084098815918, "global_step": 99524, "epoch": 2369} {"train_loss": -6.309389591217041, "global_step": 99525, "epoch": 2369} {"train_loss": -6.368063926696777, "global_step": 99526, "epoch": 2369} {"train_loss": -6.263432502746582, "global_step": 99527, "epoch": 2369} {"train_loss": -6.237349033355713, "global_step": 99528, "epoch": 2369} {"train_loss": -6.260778427124023, "global_step": 99529, "epoch": 2369} {"train_loss": -6.396028518676758, "global_step": 99530, "epoch": 2369} {"train_loss": -6.252891540527344, "global_step": 99531, "epoch": 2369} {"train_loss": -6.456748008728027, "global_step": 99532, "epoch": 2369} {"train_loss": -6.313117980957031, "global_step": 99533, "epoch": 2369} {"train_loss": -6.240111351013184, "global_step": 99534, "epoch": 2369} {"train_loss": -6.368791580200195, "global_step": 99535, "epoch": 2369} {"train_loss": -6.206262588500977, "global_step": 99536, "epoch": 2369} {"train_loss": -6.287680149078369, "global_step": 99537, "epoch": 2369} {"train_loss": -6.218878746032715, "global_step": 99538, "epoch": 2369} {"train_loss": -6.309554633640108, "global_step": 99539, "epoch": 2369, "val_loss": 76284.1640625} {"train_loss": -6.276430130004883, "global_step": 99540, "epoch": 2370} {"train_loss": -6.468953609466553, "global_step": 99541, "epoch": 2370} {"train_loss": -6.218064308166504, "global_step": 99542, "epoch": 2370} {"train_loss": -6.251898765563965, "global_step": 99543, "epoch": 2370} {"train_loss": -6.209727764129639, "global_step": 99544, "epoch": 2370} {"train_loss": -6.165928840637207, "global_step": 99545, "epoch": 2370} {"train_loss": -6.36475944519043, "global_step": 99546, "epoch": 2370} {"train_loss": -6.323287487030029, "global_step": 99547, "epoch": 2370} {"train_loss": -6.318078994750977, "global_step": 99548, "epoch": 2370} {"train_loss": -6.310004711151123, "global_step": 99549, "epoch": 2370} {"train_loss": -6.355770587921143, "global_step": 99550, "epoch": 2370} {"train_loss": -6.339822769165039, "global_step": 99551, "epoch": 2370} {"train_loss": -6.361048698425293, "global_step": 99552, "epoch": 2370} {"train_loss": -6.3409199714660645, "global_step": 99553, "epoch": 2370} {"train_loss": -6.16760778427124, "global_step": 99554, "epoch": 2370} {"train_loss": -6.4075775146484375, "global_step": 99555, "epoch": 2370} {"train_loss": -6.394521713256836, "global_step": 99556, "epoch": 2370} {"train_loss": -6.295403957366943, "global_step": 99557, "epoch": 2370} {"train_loss": -6.242927551269531, "global_step": 99558, "epoch": 2370} {"train_loss": -6.375555992126465, "global_step": 99559, "epoch": 2370} {"train_loss": -6.191613674163818, "global_step": 99560, "epoch": 2370} {"train_loss": -6.369582176208496, "global_step": 99561, "epoch": 2370} {"train_loss": -6.219123840332031, "global_step": 99562, "epoch": 2370} {"train_loss": -6.081581115722656, "global_step": 99563, "epoch": 2370} {"train_loss": -6.253857612609863, "global_step": 99564, "epoch": 2370} {"train_loss": -6.30154275894165, "global_step": 99565, "epoch": 2370} {"train_loss": -6.1876630783081055, "global_step": 99566, "epoch": 2370} {"train_loss": -6.343581676483154, "global_step": 99567, "epoch": 2370} {"train_loss": -6.381099700927734, "global_step": 99568, "epoch": 2370} {"train_loss": -6.262985706329346, "global_step": 99569, "epoch": 2370} {"train_loss": -6.3244781494140625, "global_step": 99570, "epoch": 2370} {"train_loss": -6.334516525268555, "global_step": 99571, "epoch": 2370} {"train_loss": -6.310013771057129, "global_step": 99572, "epoch": 2370} {"train_loss": -6.202744007110596, "global_step": 99573, "epoch": 2370} {"train_loss": -6.264616012573242, "global_step": 99574, "epoch": 2370} {"train_loss": -6.258526802062988, "global_step": 99575, "epoch": 2370} {"train_loss": -6.3631815910339355, "global_step": 99576, "epoch": 2370} {"train_loss": -6.403304576873779, "global_step": 99577, "epoch": 2370} {"train_loss": -6.298689365386963, "global_step": 99578, "epoch": 2370} {"train_loss": -6.2671308517456055, "global_step": 99579, "epoch": 2370} {"train_loss": -6.355477809906006, "global_step": 99580, "epoch": 2370} {"train_loss": -6.297460714975993, "global_step": 99581, "epoch": 2370, "val_loss": 75606.5546875} {"train_loss": -6.320126533508301, "global_step": 99582, "epoch": 2371} {"train_loss": -6.390496253967285, "global_step": 99583, "epoch": 2371} {"train_loss": -6.4188232421875, "global_step": 99584, "epoch": 2371} {"train_loss": -6.257365703582764, "global_step": 99585, "epoch": 2371} {"train_loss": -6.229257106781006, "global_step": 99586, "epoch": 2371} {"train_loss": -6.325799942016602, "global_step": 99587, "epoch": 2371} {"train_loss": -6.265261650085449, "global_step": 99588, "epoch": 2371} {"train_loss": -6.476317882537842, "global_step": 99589, "epoch": 2371} {"train_loss": -6.275324821472168, "global_step": 99590, "epoch": 2371} {"train_loss": -6.334178447723389, "global_step": 99591, "epoch": 2371} {"train_loss": -6.469466686248779, "global_step": 99592, "epoch": 2371} {"train_loss": -6.4075446128845215, "global_step": 99593, "epoch": 2371} {"train_loss": -6.300166130065918, "global_step": 99594, "epoch": 2371} {"train_loss": -6.310921669006348, "global_step": 99595, "epoch": 2371} {"train_loss": -6.306347846984863, "global_step": 99596, "epoch": 2371} {"train_loss": -6.352376937866211, "global_step": 99597, "epoch": 2371} {"train_loss": -6.294111251831055, "global_step": 99598, "epoch": 2371} {"train_loss": -6.446958065032959, "global_step": 99599, "epoch": 2371} {"train_loss": -6.341139793395996, "global_step": 99600, "epoch": 2371} {"train_loss": -6.394408226013184, "global_step": 99601, "epoch": 2371} {"train_loss": -6.417161464691162, "global_step": 99602, "epoch": 2371} {"train_loss": -6.329036235809326, "global_step": 99603, "epoch": 2371} {"train_loss": -6.252078533172607, "global_step": 99604, "epoch": 2371} {"train_loss": -6.438418865203857, "global_step": 99605, "epoch": 2371} {"train_loss": -6.366017818450928, "global_step": 99606, "epoch": 2371} {"train_loss": -6.431088447570801, "global_step": 99607, "epoch": 2371} {"train_loss": -6.38754940032959, "global_step": 99608, "epoch": 2371} {"train_loss": -6.444222450256348, "global_step": 99609, "epoch": 2371} {"train_loss": -6.508571624755859, "global_step": 99610, "epoch": 2371} {"train_loss": -6.285454750061035, "global_step": 99611, "epoch": 2371} {"train_loss": -6.408505916595459, "global_step": 99612, "epoch": 2371} {"train_loss": -6.386476516723633, "global_step": 99613, "epoch": 2371} {"train_loss": -6.34835147857666, "global_step": 99614, "epoch": 2371} {"train_loss": -6.370594024658203, "global_step": 99615, "epoch": 2371} {"train_loss": -6.264330863952637, "global_step": 99616, "epoch": 2371} {"train_loss": -6.379611968994141, "global_step": 99617, "epoch": 2371} {"train_loss": -6.369184494018555, "global_step": 99618, "epoch": 2371} {"train_loss": -6.282892227172852, "global_step": 99619, "epoch": 2371} {"train_loss": -6.215575695037842, "global_step": 99620, "epoch": 2371} {"train_loss": -6.457300186157227, "global_step": 99621, "epoch": 2371} {"train_loss": -6.413131237030029, "global_step": 99622, "epoch": 2371} {"train_loss": -6.359696706136067, "global_step": 99623, "epoch": 2371, "val_loss": 75675.546875} {"train_loss": -6.359109878540039, "global_step": 99624, "epoch": 2372} {"train_loss": -6.394129753112793, "global_step": 99625, "epoch": 2372} {"train_loss": -6.434878349304199, "global_step": 99626, "epoch": 2372} {"train_loss": -6.348513603210449, "global_step": 99627, "epoch": 2372} {"train_loss": -6.4365339279174805, "global_step": 99628, "epoch": 2372} {"train_loss": -6.400968551635742, "global_step": 99629, "epoch": 2372} {"train_loss": -6.391285419464111, "global_step": 99630, "epoch": 2372} {"train_loss": -6.387970924377441, "global_step": 99631, "epoch": 2372} {"train_loss": -6.380242347717285, "global_step": 99632, "epoch": 2372} {"train_loss": -6.379796981811523, "global_step": 99633, "epoch": 2372} {"train_loss": -6.335780143737793, "global_step": 99634, "epoch": 2372} {"train_loss": -6.506875514984131, "global_step": 99635, "epoch": 2372} {"train_loss": -6.3224897384643555, "global_step": 99636, "epoch": 2372} {"train_loss": -6.360227584838867, "global_step": 99637, "epoch": 2372} {"train_loss": -6.464489459991455, "global_step": 99638, "epoch": 2372} {"train_loss": -6.293058395385742, "global_step": 99639, "epoch": 2372} {"train_loss": -6.354086875915527, "global_step": 99640, "epoch": 2372} {"train_loss": -6.312375545501709, "global_step": 99641, "epoch": 2372} {"train_loss": -6.29207706451416, "global_step": 99642, "epoch": 2372} {"train_loss": -6.3636980056762695, "global_step": 99643, "epoch": 2372} {"train_loss": -6.275183200836182, "global_step": 99644, "epoch": 2372} {"train_loss": -6.247506141662598, "global_step": 99645, "epoch": 2372} {"train_loss": -6.256712436676025, "global_step": 99646, "epoch": 2372} {"train_loss": -6.443459510803223, "global_step": 99647, "epoch": 2372} {"train_loss": -6.348880767822266, "global_step": 99648, "epoch": 2372} {"train_loss": -6.377679824829102, "global_step": 99649, "epoch": 2372} {"train_loss": -6.3903961181640625, "global_step": 99650, "epoch": 2372} {"train_loss": -6.41114616394043, "global_step": 99651, "epoch": 2372} {"train_loss": -6.38179349899292, "global_step": 99652, "epoch": 2372} {"train_loss": -6.31121301651001, "global_step": 99653, "epoch": 2372} {"train_loss": -6.343329429626465, "global_step": 99654, "epoch": 2372} {"train_loss": -6.368238925933838, "global_step": 99655, "epoch": 2372} {"train_loss": -6.418521404266357, "global_step": 99656, "epoch": 2372} {"train_loss": -6.442859649658203, "global_step": 99657, "epoch": 2372} {"train_loss": -6.302145004272461, "global_step": 99658, "epoch": 2372} {"train_loss": -6.4075446128845215, "global_step": 99659, "epoch": 2372} {"train_loss": -6.438187122344971, "global_step": 99660, "epoch": 2372} {"train_loss": -6.3477983474731445, "global_step": 99661, "epoch": 2372} {"train_loss": -6.368509769439697, "global_step": 99662, "epoch": 2372} {"train_loss": -6.308874130249023, "global_step": 99663, "epoch": 2372} {"train_loss": -6.476411819458008, "global_step": 99664, "epoch": 2372} {"train_loss": -6.371245213917324, "global_step": 99665, "epoch": 2372, "val_loss": 75793.359375} {"train_loss": -6.418083190917969, "global_step": 99666, "epoch": 2373} {"train_loss": -6.319476127624512, "global_step": 99667, "epoch": 2373} {"train_loss": -6.342865943908691, "global_step": 99668, "epoch": 2373} {"train_loss": -6.418238639831543, "global_step": 99669, "epoch": 2373} {"train_loss": -6.347092151641846, "global_step": 99670, "epoch": 2373} {"train_loss": -6.318976402282715, "global_step": 99671, "epoch": 2373} {"train_loss": -6.505743503570557, "global_step": 99672, "epoch": 2373} {"train_loss": -6.423460483551025, "global_step": 99673, "epoch": 2373} {"train_loss": -6.4401140213012695, "global_step": 99674, "epoch": 2373} {"train_loss": -6.437459945678711, "global_step": 99675, "epoch": 2373} {"train_loss": -6.329466819763184, "global_step": 99676, "epoch": 2373} {"train_loss": -6.519218444824219, "global_step": 99677, "epoch": 2373} {"train_loss": -6.2698493003845215, "global_step": 99678, "epoch": 2373} {"train_loss": -6.285600185394287, "global_step": 99679, "epoch": 2373} {"train_loss": -6.454266548156738, "global_step": 99680, "epoch": 2373} {"train_loss": -6.300836563110352, "global_step": 99681, "epoch": 2373} {"train_loss": -6.352663993835449, "global_step": 99682, "epoch": 2373} {"train_loss": -6.44810152053833, "global_step": 99683, "epoch": 2373} {"train_loss": -6.334214210510254, "global_step": 99684, "epoch": 2373} {"train_loss": -6.326011657714844, "global_step": 99685, "epoch": 2373} {"train_loss": -6.395575523376465, "global_step": 99686, "epoch": 2373} {"train_loss": -6.216622352600098, "global_step": 99687, "epoch": 2373} {"train_loss": -6.2579345703125, "global_step": 99688, "epoch": 2373} {"train_loss": -6.362434387207031, "global_step": 99689, "epoch": 2373} {"train_loss": -6.407487392425537, "global_step": 99690, "epoch": 2373} {"train_loss": -6.331573486328125, "global_step": 99691, "epoch": 2373} {"train_loss": -6.290254592895508, "global_step": 99692, "epoch": 2373} {"train_loss": -6.393885612487793, "global_step": 99693, "epoch": 2373} {"train_loss": -6.358657360076904, "global_step": 99694, "epoch": 2373} {"train_loss": -6.3005475997924805, "global_step": 99695, "epoch": 2373} {"train_loss": -6.267065048217773, "global_step": 99696, "epoch": 2373} {"train_loss": -6.282632350921631, "global_step": 99697, "epoch": 2373} {"train_loss": -6.435437202453613, "global_step": 99698, "epoch": 2373} {"train_loss": -6.421172142028809, "global_step": 99699, "epoch": 2373} {"train_loss": -6.309287071228027, "global_step": 99700, "epoch": 2373} {"train_loss": -6.365184307098389, "global_step": 99701, "epoch": 2373} {"train_loss": -6.265785217285156, "global_step": 99702, "epoch": 2373} {"train_loss": -6.321619987487793, "global_step": 99703, "epoch": 2373} {"train_loss": -6.399110794067383, "global_step": 99704, "epoch": 2373} {"train_loss": -6.342801094055176, "global_step": 99705, "epoch": 2373} {"train_loss": -6.436600685119629, "global_step": 99706, "epoch": 2373} {"train_loss": -6.3585272289457775, "global_step": 99707, "epoch": 2373, "val_loss": 75996.8359375} {"train_loss": -6.401425361633301, "global_step": 99708, "epoch": 2374} {"train_loss": -6.36566686630249, "global_step": 99709, "epoch": 2374} {"train_loss": -6.3074188232421875, "global_step": 99710, "epoch": 2374} {"train_loss": -6.193215370178223, "global_step": 99711, "epoch": 2374} {"train_loss": -6.301178455352783, "global_step": 99712, "epoch": 2374} {"train_loss": -6.363465309143066, "global_step": 99713, "epoch": 2374} {"train_loss": -6.349000930786133, "global_step": 99714, "epoch": 2374} {"train_loss": -6.352636337280273, "global_step": 99715, "epoch": 2374} {"train_loss": -6.3700079917907715, "global_step": 99716, "epoch": 2374} {"train_loss": -6.390995025634766, "global_step": 99717, "epoch": 2374} {"train_loss": -6.3918304443359375, "global_step": 99718, "epoch": 2374} {"train_loss": -6.3176751136779785, "global_step": 99719, "epoch": 2374} {"train_loss": -6.408583641052246, "global_step": 99720, "epoch": 2374} {"train_loss": -6.252295970916748, "global_step": 99721, "epoch": 2374} {"train_loss": -6.3715901374816895, "global_step": 99722, "epoch": 2374} {"train_loss": -6.326547622680664, "global_step": 99723, "epoch": 2374} {"train_loss": -6.318124294281006, "global_step": 99724, "epoch": 2374} {"train_loss": -6.437763214111328, "global_step": 99725, "epoch": 2374} {"train_loss": -6.338731288909912, "global_step": 99726, "epoch": 2374} {"train_loss": -6.289492607116699, "global_step": 99727, "epoch": 2374} {"train_loss": -6.482851028442383, "global_step": 99728, "epoch": 2374} {"train_loss": -6.250576972961426, "global_step": 99729, "epoch": 2374} {"train_loss": -6.364361763000488, "global_step": 99730, "epoch": 2374} {"train_loss": -6.364612102508545, "global_step": 99731, "epoch": 2374} {"train_loss": -6.3674116134643555, "global_step": 99732, "epoch": 2374} {"train_loss": -6.4369797706604, "global_step": 99733, "epoch": 2374} {"train_loss": -6.265212059020996, "global_step": 99734, "epoch": 2374} {"train_loss": -6.303544521331787, "global_step": 99735, "epoch": 2374} {"train_loss": -6.353158950805664, "global_step": 99736, "epoch": 2374} {"train_loss": -6.384182453155518, "global_step": 99737, "epoch": 2374} {"train_loss": -6.3788604736328125, "global_step": 99738, "epoch": 2374} {"train_loss": -6.354801177978516, "global_step": 99739, "epoch": 2374} {"train_loss": -6.417346000671387, "global_step": 99740, "epoch": 2374} {"train_loss": -6.242629051208496, "global_step": 99741, "epoch": 2374} {"train_loss": -6.363931655883789, "global_step": 99742, "epoch": 2374} {"train_loss": -6.505609512329102, "global_step": 99743, "epoch": 2374} {"train_loss": -6.421119213104248, "global_step": 99744, "epoch": 2374} {"train_loss": -6.368081569671631, "global_step": 99745, "epoch": 2374} {"train_loss": -6.442027568817139, "global_step": 99746, "epoch": 2374} {"train_loss": -6.188716888427734, "global_step": 99747, "epoch": 2374} {"train_loss": -6.249579429626465, "global_step": 99748, "epoch": 2374} {"train_loss": -6.348810150509789, "global_step": 99749, "epoch": 2374, "val_loss": 75875.3984375} {"train_loss": -6.290548324584961, "global_step": 99750, "epoch": 2375} {"train_loss": -6.443227767944336, "global_step": 99751, "epoch": 2375} {"train_loss": -6.391908645629883, "global_step": 99752, "epoch": 2375} {"train_loss": -6.405478000640869, "global_step": 99753, "epoch": 2375} {"train_loss": -6.264917850494385, "global_step": 99754, "epoch": 2375} {"train_loss": -6.4067840576171875, "global_step": 99755, "epoch": 2375} {"train_loss": -6.377662658691406, "global_step": 99756, "epoch": 2375} {"train_loss": -6.465071678161621, "global_step": 99757, "epoch": 2375} {"train_loss": -6.361886024475098, "global_step": 99758, "epoch": 2375} {"train_loss": -6.267691612243652, "global_step": 99759, "epoch": 2375} {"train_loss": -6.228854179382324, "global_step": 99760, "epoch": 2375} {"train_loss": -6.3646626472473145, "global_step": 99761, "epoch": 2375} {"train_loss": -6.251128196716309, "global_step": 99762, "epoch": 2375} {"train_loss": -6.229710102081299, "global_step": 99763, "epoch": 2375} {"train_loss": -6.300599575042725, "global_step": 99764, "epoch": 2375} {"train_loss": -6.216542720794678, "global_step": 99765, "epoch": 2375} {"train_loss": -6.305581092834473, "global_step": 99766, "epoch": 2375} {"train_loss": -6.417292594909668, "global_step": 99767, "epoch": 2375} {"train_loss": -6.332228183746338, "global_step": 99768, "epoch": 2375} {"train_loss": -6.281285762786865, "global_step": 99769, "epoch": 2375} {"train_loss": -6.353842258453369, "global_step": 99770, "epoch": 2375} {"train_loss": -6.333909034729004, "global_step": 99771, "epoch": 2375} {"train_loss": -6.2909464836120605, "global_step": 99772, "epoch": 2375} {"train_loss": -6.290001392364502, "global_step": 99773, "epoch": 2375} {"train_loss": -6.2366485595703125, "global_step": 99774, "epoch": 2375} {"train_loss": -6.417809963226318, "global_step": 99775, "epoch": 2375} {"train_loss": -6.385801315307617, "global_step": 99776, "epoch": 2375} {"train_loss": -6.439857482910156, "global_step": 99777, "epoch": 2375} {"train_loss": -6.261795520782471, "global_step": 99778, "epoch": 2375} {"train_loss": -6.340432643890381, "global_step": 99779, "epoch": 2375} {"train_loss": -6.325325012207031, "global_step": 99780, "epoch": 2375} {"train_loss": -6.338884353637695, "global_step": 99781, "epoch": 2375} {"train_loss": -6.255348205566406, "global_step": 99782, "epoch": 2375} {"train_loss": -6.461661338806152, "global_step": 99783, "epoch": 2375} {"train_loss": -6.357391357421875, "global_step": 99784, "epoch": 2375} {"train_loss": -6.283648490905762, "global_step": 99785, "epoch": 2375} {"train_loss": -6.471656322479248, "global_step": 99786, "epoch": 2375} {"train_loss": -6.280045509338379, "global_step": 99787, "epoch": 2375} {"train_loss": -6.302394866943359, "global_step": 99788, "epoch": 2375} {"train_loss": -6.331350803375244, "global_step": 99789, "epoch": 2375} {"train_loss": -6.317929267883301, "global_step": 99790, "epoch": 2375} {"train_loss": -6.336367357344854, "global_step": 99791, "epoch": 2375, "val_loss": 76186.609375} {"train_loss": -6.380211353302002, "global_step": 99792, "epoch": 2376} {"train_loss": -6.276553153991699, "global_step": 99793, "epoch": 2376} {"train_loss": -6.4486494064331055, "global_step": 99794, "epoch": 2376} {"train_loss": -6.392270088195801, "global_step": 99795, "epoch": 2376} {"train_loss": -6.338661193847656, "global_step": 99796, "epoch": 2376} {"train_loss": -6.339745998382568, "global_step": 99797, "epoch": 2376} {"train_loss": -6.357524871826172, "global_step": 99798, "epoch": 2376} {"train_loss": -6.448192596435547, "global_step": 99799, "epoch": 2376} {"train_loss": -6.381323337554932, "global_step": 99800, "epoch": 2376} {"train_loss": -6.312358856201172, "global_step": 99801, "epoch": 2376} {"train_loss": -6.318099021911621, "global_step": 99802, "epoch": 2376} {"train_loss": -6.334405899047852, "global_step": 99803, "epoch": 2376} {"train_loss": -6.32308292388916, "global_step": 99804, "epoch": 2376} {"train_loss": -6.211855411529541, "global_step": 99805, "epoch": 2376} {"train_loss": -6.255954265594482, "global_step": 99806, "epoch": 2376} {"train_loss": -6.379490852355957, "global_step": 99807, "epoch": 2376} {"train_loss": -6.2710723876953125, "global_step": 99808, "epoch": 2376} {"train_loss": -6.376589775085449, "global_step": 99809, "epoch": 2376} {"train_loss": -6.274075508117676, "global_step": 99810, "epoch": 2376} {"train_loss": -6.222001552581787, "global_step": 99811, "epoch": 2376} {"train_loss": -6.39703369140625, "global_step": 99812, "epoch": 2376} {"train_loss": -6.238222122192383, "global_step": 99813, "epoch": 2376} {"train_loss": -6.36750602722168, "global_step": 99814, "epoch": 2376} {"train_loss": -6.405587196350098, "global_step": 99815, "epoch": 2376} {"train_loss": -6.349560737609863, "global_step": 99816, "epoch": 2376} {"train_loss": -6.414216995239258, "global_step": 99817, "epoch": 2376} {"train_loss": -6.457283973693848, "global_step": 99818, "epoch": 2376} {"train_loss": -6.353692054748535, "global_step": 99819, "epoch": 2376} {"train_loss": -6.351672172546387, "global_step": 99820, "epoch": 2376} {"train_loss": -6.24311637878418, "global_step": 99821, "epoch": 2376} {"train_loss": -6.314669609069824, "global_step": 99822, "epoch": 2376} {"train_loss": -6.332779884338379, "global_step": 99823, "epoch": 2376} {"train_loss": -6.315860748291016, "global_step": 99824, "epoch": 2376} {"train_loss": -6.345699310302734, "global_step": 99825, "epoch": 2376} {"train_loss": -6.232638359069824, "global_step": 99826, "epoch": 2376} {"train_loss": -6.3180341720581055, "global_step": 99827, "epoch": 2376} {"train_loss": -6.395224094390869, "global_step": 99828, "epoch": 2376} {"train_loss": -6.2601728439331055, "global_step": 99829, "epoch": 2376} {"train_loss": -6.362272262573242, "global_step": 99830, "epoch": 2376} {"train_loss": -6.335314750671387, "global_step": 99831, "epoch": 2376} {"train_loss": -6.349088191986084, "global_step": 99832, "epoch": 2376} {"train_loss": -6.335757403146653, "global_step": 99833, "epoch": 2376, "val_loss": 75821.09375} {"train_loss": -6.317720413208008, "global_step": 99834, "epoch": 2377} {"train_loss": -6.392022132873535, "global_step": 99835, "epoch": 2377} {"train_loss": -6.360979080200195, "global_step": 99836, "epoch": 2377} {"train_loss": -6.42364501953125, "global_step": 99837, "epoch": 2377} {"train_loss": -6.317817687988281, "global_step": 99838, "epoch": 2377} {"train_loss": -6.319428443908691, "global_step": 99839, "epoch": 2377} {"train_loss": -6.361441612243652, "global_step": 99840, "epoch": 2377} {"train_loss": -6.296992778778076, "global_step": 99841, "epoch": 2377} {"train_loss": -6.411419868469238, "global_step": 99842, "epoch": 2377} {"train_loss": -6.356317520141602, "global_step": 99843, "epoch": 2377} {"train_loss": -6.312901020050049, "global_step": 99844, "epoch": 2377} {"train_loss": -6.329739570617676, "global_step": 99845, "epoch": 2377} {"train_loss": -6.253128528594971, "global_step": 99846, "epoch": 2377} {"train_loss": -6.469607830047607, "global_step": 99847, "epoch": 2377} {"train_loss": -6.33203125, "global_step": 99848, "epoch": 2377} {"train_loss": -6.405350685119629, "global_step": 99849, "epoch": 2377} {"train_loss": -6.378448009490967, "global_step": 99850, "epoch": 2377} {"train_loss": -6.245316505432129, "global_step": 99851, "epoch": 2377} {"train_loss": -6.525419235229492, "global_step": 99852, "epoch": 2377} {"train_loss": -6.372829914093018, "global_step": 99853, "epoch": 2377} {"train_loss": -6.299317359924316, "global_step": 99854, "epoch": 2377} {"train_loss": -6.321536064147949, "global_step": 99855, "epoch": 2377} {"train_loss": -6.4435858726501465, "global_step": 99856, "epoch": 2377} {"train_loss": -6.263456344604492, "global_step": 99857, "epoch": 2377} {"train_loss": -6.4332661628723145, "global_step": 99858, "epoch": 2377} {"train_loss": -6.360324859619141, "global_step": 99859, "epoch": 2377} {"train_loss": -6.408515930175781, "global_step": 99860, "epoch": 2377} {"train_loss": -6.404440879821777, "global_step": 99861, "epoch": 2377} {"train_loss": -6.367198944091797, "global_step": 99862, "epoch": 2377} {"train_loss": -6.401061058044434, "global_step": 99863, "epoch": 2377} {"train_loss": -6.32735013961792, "global_step": 99864, "epoch": 2377} {"train_loss": -6.277166366577148, "global_step": 99865, "epoch": 2377} {"train_loss": -6.310103416442871, "global_step": 99866, "epoch": 2377} {"train_loss": -6.325412750244141, "global_step": 99867, "epoch": 2377} {"train_loss": -6.33176326751709, "global_step": 99868, "epoch": 2377} {"train_loss": -6.375465393066406, "global_step": 99869, "epoch": 2377} {"train_loss": -6.228614807128906, "global_step": 99870, "epoch": 2377} {"train_loss": -6.2651824951171875, "global_step": 99871, "epoch": 2377} {"train_loss": -6.270262718200684, "global_step": 99872, "epoch": 2377} {"train_loss": -6.3436384201049805, "global_step": 99873, "epoch": 2377} {"train_loss": -6.3790059089660645, "global_step": 99874, "epoch": 2377} {"train_loss": -6.347528287342617, "global_step": 99875, "epoch": 2377, "val_loss": 75954.5234375} {"train_loss": -6.470853805541992, "global_step": 99876, "epoch": 2378} {"train_loss": -6.28088903427124, "global_step": 99877, "epoch": 2378} {"train_loss": -6.3754801750183105, "global_step": 99878, "epoch": 2378} {"train_loss": -6.420069694519043, "global_step": 99879, "epoch": 2378} {"train_loss": -6.351585388183594, "global_step": 99880, "epoch": 2378} {"train_loss": -6.323923587799072, "global_step": 99881, "epoch": 2378} {"train_loss": -6.311686992645264, "global_step": 99882, "epoch": 2378} {"train_loss": -6.419473648071289, "global_step": 99883, "epoch": 2378} {"train_loss": -6.3951311111450195, "global_step": 99884, "epoch": 2378} {"train_loss": -6.408717632293701, "global_step": 99885, "epoch": 2378} {"train_loss": -6.3888654708862305, "global_step": 99886, "epoch": 2378} {"train_loss": -6.347522258758545, "global_step": 99887, "epoch": 2378} {"train_loss": -6.391963481903076, "global_step": 99888, "epoch": 2378} {"train_loss": -6.316066741943359, "global_step": 99889, "epoch": 2378} {"train_loss": -6.437136650085449, "global_step": 99890, "epoch": 2378} {"train_loss": -6.390942573547363, "global_step": 99891, "epoch": 2378} {"train_loss": -6.289573669433594, "global_step": 99892, "epoch": 2378} {"train_loss": -6.424533367156982, "global_step": 99893, "epoch": 2378} {"train_loss": -6.300367832183838, "global_step": 99894, "epoch": 2378} {"train_loss": -6.454408168792725, "global_step": 99895, "epoch": 2378} {"train_loss": -6.323833465576172, "global_step": 99896, "epoch": 2378} {"train_loss": -6.223121643066406, "global_step": 99897, "epoch": 2378} {"train_loss": -6.360457420349121, "global_step": 99898, "epoch": 2378} {"train_loss": -6.284929275512695, "global_step": 99899, "epoch": 2378} {"train_loss": -6.215427398681641, "global_step": 99900, "epoch": 2378} {"train_loss": -6.387248992919922, "global_step": 99901, "epoch": 2378} {"train_loss": -6.397310256958008, "global_step": 99902, "epoch": 2378} {"train_loss": -6.370461463928223, "global_step": 99903, "epoch": 2378} {"train_loss": -6.5036468505859375, "global_step": 99904, "epoch": 2378} {"train_loss": -6.2996368408203125, "global_step": 99905, "epoch": 2378} {"train_loss": -6.402520179748535, "global_step": 99906, "epoch": 2378} {"train_loss": -6.3470869064331055, "global_step": 99907, "epoch": 2378} {"train_loss": -6.4113240242004395, "global_step": 99908, "epoch": 2378} {"train_loss": -6.355583190917969, "global_step": 99909, "epoch": 2378} {"train_loss": -6.380396842956543, "global_step": 99910, "epoch": 2378} {"train_loss": -6.265952110290527, "global_step": 99911, "epoch": 2378} {"train_loss": -6.331492900848389, "global_step": 99912, "epoch": 2378} {"train_loss": -6.373559951782227, "global_step": 99913, "epoch": 2378} {"train_loss": -6.440368175506592, "global_step": 99914, "epoch": 2378} {"train_loss": -6.3528289794921875, "global_step": 99915, "epoch": 2378} {"train_loss": -6.440710067749023, "global_step": 99916, "epoch": 2378} {"train_loss": -6.365607999619984, "global_step": 99917, "epoch": 2378, "val_loss": 75691.7890625} {"train_loss": -6.396950721740723, "global_step": 99918, "epoch": 2379} {"train_loss": -6.303005695343018, "global_step": 99919, "epoch": 2379} {"train_loss": -6.358223915100098, "global_step": 99920, "epoch": 2379} {"train_loss": -6.443782329559326, "global_step": 99921, "epoch": 2379} {"train_loss": -6.419170379638672, "global_step": 99922, "epoch": 2379} {"train_loss": -6.3195576667785645, "global_step": 99923, "epoch": 2379} {"train_loss": -6.37980842590332, "global_step": 99924, "epoch": 2379} {"train_loss": -6.279415607452393, "global_step": 99925, "epoch": 2379} {"train_loss": -6.483852386474609, "global_step": 99926, "epoch": 2379} {"train_loss": -6.395957946777344, "global_step": 99927, "epoch": 2379} {"train_loss": -6.390363693237305, "global_step": 99928, "epoch": 2379} {"train_loss": -6.267521381378174, "global_step": 99929, "epoch": 2379} {"train_loss": -6.441077709197998, "global_step": 99930, "epoch": 2379} {"train_loss": -6.453125953674316, "global_step": 99931, "epoch": 2379} {"train_loss": -6.369101524353027, "global_step": 99932, "epoch": 2379} {"train_loss": -6.389919281005859, "global_step": 99933, "epoch": 2379} {"train_loss": -6.281313896179199, "global_step": 99934, "epoch": 2379} {"train_loss": -6.474827766418457, "global_step": 99935, "epoch": 2379} {"train_loss": -6.419707298278809, "global_step": 99936, "epoch": 2379} {"train_loss": -6.223967552185059, "global_step": 99937, "epoch": 2379} {"train_loss": -6.428866386413574, "global_step": 99938, "epoch": 2379} {"train_loss": -6.353982925415039, "global_step": 99939, "epoch": 2379} {"train_loss": -6.424406051635742, "global_step": 99940, "epoch": 2379} {"train_loss": -6.3364057540893555, "global_step": 99941, "epoch": 2379} {"train_loss": -6.492888450622559, "global_step": 99942, "epoch": 2379} {"train_loss": -6.3923845291137695, "global_step": 99943, "epoch": 2379} {"train_loss": -6.410710334777832, "global_step": 99944, "epoch": 2379} {"train_loss": -6.383810997009277, "global_step": 99945, "epoch": 2379} {"train_loss": -6.268204689025879, "global_step": 99946, "epoch": 2379} {"train_loss": -6.205473899841309, "global_step": 99947, "epoch": 2379} {"train_loss": -6.434982776641846, "global_step": 99948, "epoch": 2379} {"train_loss": -6.175188064575195, "global_step": 99949, "epoch": 2379} {"train_loss": -6.1191253662109375, "global_step": 99950, "epoch": 2379} {"train_loss": -6.247457504272461, "global_step": 99951, "epoch": 2379} {"train_loss": -6.366457462310791, "global_step": 99952, "epoch": 2379} {"train_loss": -6.26128625869751, "global_step": 99953, "epoch": 2379} {"train_loss": -6.297784805297852, "global_step": 99954, "epoch": 2379} {"train_loss": -6.319275856018066, "global_step": 99955, "epoch": 2379} {"train_loss": -6.3794989585876465, "global_step": 99956, "epoch": 2379} {"train_loss": -6.232207298278809, "global_step": 99957, "epoch": 2379} {"train_loss": -6.274370193481445, "global_step": 99958, "epoch": 2379} {"train_loss": -6.346137285232544, "global_step": 99959, "epoch": 2379, "val_loss": 75945.3203125} {"train_loss": -6.251140117645264, "global_step": 99960, "epoch": 2380} {"train_loss": -6.428383827209473, "global_step": 99961, "epoch": 2380} {"train_loss": -6.305276870727539, "global_step": 99962, "epoch": 2380} {"train_loss": -6.295229434967041, "global_step": 99963, "epoch": 2380} {"train_loss": -6.328672885894775, "global_step": 99964, "epoch": 2380} {"train_loss": -6.365420818328857, "global_step": 99965, "epoch": 2380} {"train_loss": -6.177582740783691, "global_step": 99966, "epoch": 2380} {"train_loss": -6.383339881896973, "global_step": 99967, "epoch": 2380} {"train_loss": -6.2863054275512695, "global_step": 99968, "epoch": 2380} {"train_loss": -6.256510257720947, "global_step": 99969, "epoch": 2380} {"train_loss": -6.3172430992126465, "global_step": 99970, "epoch": 2380} {"train_loss": -6.291356563568115, "global_step": 99971, "epoch": 2380} {"train_loss": -6.501811504364014, "global_step": 99972, "epoch": 2380} {"train_loss": -6.213067054748535, "global_step": 99973, "epoch": 2380} {"train_loss": -6.257223129272461, "global_step": 99974, "epoch": 2380} {"train_loss": -6.389913558959961, "global_step": 99975, "epoch": 2380} {"train_loss": -6.303928375244141, "global_step": 99976, "epoch": 2380} {"train_loss": -6.396961212158203, "global_step": 99977, "epoch": 2380} {"train_loss": -6.223536491394043, "global_step": 99978, "epoch": 2380} {"train_loss": -6.291357040405273, "global_step": 99979, "epoch": 2380} {"train_loss": -6.363417625427246, "global_step": 99980, "epoch": 2380} {"train_loss": -6.317681312561035, "global_step": 99981, "epoch": 2380} {"train_loss": -6.351482391357422, "global_step": 99982, "epoch": 2380} {"train_loss": -6.226254463195801, "global_step": 99983, "epoch": 2380} {"train_loss": -6.23576021194458, "global_step": 99984, "epoch": 2380} {"train_loss": -6.3736090660095215, "global_step": 99985, "epoch": 2380} {"train_loss": -6.270551681518555, "global_step": 99986, "epoch": 2380} {"train_loss": -6.292905807495117, "global_step": 99987, "epoch": 2380} {"train_loss": -6.319649696350098, "global_step": 99988, "epoch": 2380} {"train_loss": -6.425894737243652, "global_step": 99989, "epoch": 2380} {"train_loss": -6.354065895080566, "global_step": 99990, "epoch": 2380} {"train_loss": -6.420804023742676, "global_step": 99991, "epoch": 2380} {"train_loss": -6.403199672698975, "global_step": 99992, "epoch": 2380} {"train_loss": -6.437091827392578, "global_step": 99993, "epoch": 2380} {"train_loss": -6.353248596191406, "global_step": 99994, "epoch": 2380} {"train_loss": -6.330305099487305, "global_step": 99995, "epoch": 2380} {"train_loss": -6.362632751464844, "global_step": 99996, "epoch": 2380} {"train_loss": -6.3024983406066895, "global_step": 99997, "epoch": 2380} {"train_loss": -6.336416721343994, "global_step": 99998, "epoch": 2380} {"train_loss": -6.285482406616211, "global_step": 99999, "epoch": 2380} {"train_loss": -6.407985687255859, "global_step": 100000, "epoch": 2380} {"train_loss": -6.328548283804031, "global_step": 100001, "epoch": 2380, "val_loss": 76303.5546875} {"train_loss": -6.286101818084717, "global_step": 100002, "epoch": 2381} {"train_loss": -6.448460578918457, "global_step": 100003, "epoch": 2381} {"train_loss": -6.388257026672363, "global_step": 100004, "epoch": 2381} {"train_loss": -6.278462886810303, "global_step": 100005, "epoch": 2381} {"train_loss": -6.420387268066406, "global_step": 100006, "epoch": 2381} {"train_loss": -6.222098350524902, "global_step": 100007, "epoch": 2381} {"train_loss": -6.415210723876953, "global_step": 100008, "epoch": 2381} {"train_loss": -6.242755889892578, "global_step": 100009, "epoch": 2381} {"train_loss": -6.403050422668457, "global_step": 100010, "epoch": 2381} {"train_loss": -6.304924964904785, "global_step": 100011, "epoch": 2381} {"train_loss": -6.140900611877441, "global_step": 100012, "epoch": 2381} {"train_loss": -6.438050270080566, "global_step": 100013, "epoch": 2381} {"train_loss": -6.369919776916504, "global_step": 100014, "epoch": 2381} {"train_loss": -6.329302787780762, "global_step": 100015, "epoch": 2381} {"train_loss": -6.27044677734375, "global_step": 100016, "epoch": 2381} {"train_loss": -6.301597595214844, "global_step": 100017, "epoch": 2381} {"train_loss": -6.304879665374756, "global_step": 100018, "epoch": 2381} {"train_loss": -6.283669471740723, "global_step": 100019, "epoch": 2381} {"train_loss": -6.454497337341309, "global_step": 100020, "epoch": 2381} {"train_loss": -6.303848743438721, "global_step": 100021, "epoch": 2381} {"train_loss": -6.41342306137085, "global_step": 100022, "epoch": 2381} {"train_loss": -6.3528361320495605, "global_step": 100023, "epoch": 2381} {"train_loss": -6.353498935699463, "global_step": 100024, "epoch": 2381} {"train_loss": -6.3989129066467285, "global_step": 100025, "epoch": 2381} {"train_loss": -6.357638359069824, "global_step": 100026, "epoch": 2381} {"train_loss": -6.324484348297119, "global_step": 100027, "epoch": 2381} {"train_loss": -6.227649211883545, "global_step": 100028, "epoch": 2381} {"train_loss": -6.289254665374756, "global_step": 100029, "epoch": 2381} {"train_loss": -6.186296463012695, "global_step": 100030, "epoch": 2381} {"train_loss": -6.269782066345215, "global_step": 100031, "epoch": 2381} {"train_loss": -6.303004264831543, "global_step": 100032, "epoch": 2381} {"train_loss": -6.356873989105225, "global_step": 100033, "epoch": 2381} {"train_loss": -6.287851333618164, "global_step": 100034, "epoch": 2381} {"train_loss": -6.318634510040283, "global_step": 100035, "epoch": 2381} {"train_loss": -6.2928547859191895, "global_step": 100036, "epoch": 2381} {"train_loss": -6.312742233276367, "global_step": 100037, "epoch": 2381} {"train_loss": -6.412525653839111, "global_step": 100038, "epoch": 2381} {"train_loss": -6.32810640335083, "global_step": 100039, "epoch": 2381} {"train_loss": -6.4075517654418945, "global_step": 100040, "epoch": 2381} {"train_loss": -6.339715480804443, "global_step": 100041, "epoch": 2381} {"train_loss": -6.339666366577148, "global_step": 100042, "epoch": 2381} {"train_loss": -6.331197943006243, "global_step": 100043, "epoch": 2381, "val_loss": 76027.3671875} {"train_loss": -6.276628017425537, "global_step": 100044, "epoch": 2382} {"train_loss": -6.410308361053467, "global_step": 100045, "epoch": 2382} {"train_loss": -6.269536018371582, "global_step": 100046, "epoch": 2382} {"train_loss": -6.421475410461426, "global_step": 100047, "epoch": 2382} {"train_loss": -6.305773735046387, "global_step": 100048, "epoch": 2382} {"train_loss": -6.275136470794678, "global_step": 100049, "epoch": 2382} {"train_loss": -6.312291145324707, "global_step": 100050, "epoch": 2382} {"train_loss": -6.376969337463379, "global_step": 100051, "epoch": 2382} {"train_loss": -6.456943511962891, "global_step": 100052, "epoch": 2382} {"train_loss": -6.356395721435547, "global_step": 100053, "epoch": 2382} {"train_loss": -6.336050033569336, "global_step": 100054, "epoch": 2382} {"train_loss": -6.414157390594482, "global_step": 100055, "epoch": 2382} {"train_loss": -6.329017162322998, "global_step": 100056, "epoch": 2382} {"train_loss": -6.344560623168945, "global_step": 100057, "epoch": 2382} {"train_loss": -6.349905490875244, "global_step": 100058, "epoch": 2382} {"train_loss": -6.4833478927612305, "global_step": 100059, "epoch": 2382} {"train_loss": -6.388496398925781, "global_step": 100060, "epoch": 2382} {"train_loss": -6.263317108154297, "global_step": 100061, "epoch": 2382} {"train_loss": -6.464263916015625, "global_step": 100062, "epoch": 2382} {"train_loss": -6.499814510345459, "global_step": 100063, "epoch": 2382} {"train_loss": -6.338137626647949, "global_step": 100064, "epoch": 2382} {"train_loss": -6.379692077636719, "global_step": 100065, "epoch": 2382} {"train_loss": -6.406615257263184, "global_step": 100066, "epoch": 2382} {"train_loss": -6.300130844116211, "global_step": 100067, "epoch": 2382} {"train_loss": -6.457535743713379, "global_step": 100068, "epoch": 2382} {"train_loss": -6.411404609680176, "global_step": 100069, "epoch": 2382} {"train_loss": -6.373045921325684, "global_step": 100070, "epoch": 2382} {"train_loss": -6.397167205810547, "global_step": 100071, "epoch": 2382} {"train_loss": -6.3778886795043945, "global_step": 100072, "epoch": 2382} {"train_loss": -6.416808605194092, "global_step": 100073, "epoch": 2382} {"train_loss": -6.42372465133667, "global_step": 100074, "epoch": 2382} {"train_loss": -6.257635116577148, "global_step": 100075, "epoch": 2382} {"train_loss": -6.351913928985596, "global_step": 100076, "epoch": 2382} {"train_loss": -6.294349193572998, "global_step": 100077, "epoch": 2382} {"train_loss": -6.262707710266113, "global_step": 100078, "epoch": 2382} {"train_loss": -6.297128200531006, "global_step": 100079, "epoch": 2382} {"train_loss": -6.260390281677246, "global_step": 100080, "epoch": 2382} {"train_loss": -6.308313369750977, "global_step": 100081, "epoch": 2382} {"train_loss": -6.394437789916992, "global_step": 100082, "epoch": 2382} {"train_loss": -6.387267112731934, "global_step": 100083, "epoch": 2382} {"train_loss": -6.355703830718994, "global_step": 100084, "epoch": 2382} {"train_loss": -6.361122892016456, "global_step": 100085, "epoch": 2382, "val_loss": 75656.578125} {"train_loss": -6.361551284790039, "global_step": 100086, "epoch": 2383} {"train_loss": -6.463054180145264, "global_step": 100087, "epoch": 2383} {"train_loss": -6.381821632385254, "global_step": 100088, "epoch": 2383} {"train_loss": -6.33051061630249, "global_step": 100089, "epoch": 2383} {"train_loss": -6.31884765625, "global_step": 100090, "epoch": 2383} {"train_loss": -6.383639335632324, "global_step": 100091, "epoch": 2383} {"train_loss": -6.337625980377197, "global_step": 100092, "epoch": 2383} {"train_loss": -6.263811111450195, "global_step": 100093, "epoch": 2383} {"train_loss": -6.408295154571533, "global_step": 100094, "epoch": 2383} {"train_loss": -6.210333824157715, "global_step": 100095, "epoch": 2383} {"train_loss": -6.435962677001953, "global_step": 100096, "epoch": 2383} {"train_loss": -6.464733123779297, "global_step": 100097, "epoch": 2383} {"train_loss": -6.42219352722168, "global_step": 100098, "epoch": 2383} {"train_loss": -6.460692405700684, "global_step": 100099, "epoch": 2383} {"train_loss": -6.380422592163086, "global_step": 100100, "epoch": 2383} {"train_loss": -6.274201393127441, "global_step": 100101, "epoch": 2383} {"train_loss": -6.365687370300293, "global_step": 100102, "epoch": 2383} {"train_loss": -6.359095096588135, "global_step": 100103, "epoch": 2383} {"train_loss": -6.392868995666504, "global_step": 100104, "epoch": 2383} {"train_loss": -6.404087066650391, "global_step": 100105, "epoch": 2383} {"train_loss": -6.386258125305176, "global_step": 100106, "epoch": 2383} {"train_loss": -6.336164474487305, "global_step": 100107, "epoch": 2383} {"train_loss": -6.331109523773193, "global_step": 100108, "epoch": 2383} {"train_loss": -6.4351606369018555, "global_step": 100109, "epoch": 2383} {"train_loss": -6.418562889099121, "global_step": 100110, "epoch": 2383} {"train_loss": -6.289255619049072, "global_step": 100111, "epoch": 2383} {"train_loss": -6.407305717468262, "global_step": 100112, "epoch": 2383} {"train_loss": -6.266324520111084, "global_step": 100113, "epoch": 2383} {"train_loss": -6.342669486999512, "global_step": 100114, "epoch": 2383} {"train_loss": -6.478970527648926, "global_step": 100115, "epoch": 2383} {"train_loss": -6.172706127166748, "global_step": 100116, "epoch": 2383} {"train_loss": -6.307068824768066, "global_step": 100117, "epoch": 2383} {"train_loss": -6.360206604003906, "global_step": 100118, "epoch": 2383} {"train_loss": -6.309389114379883, "global_step": 100119, "epoch": 2383} {"train_loss": -6.33528995513916, "global_step": 100120, "epoch": 2383} {"train_loss": -6.345831871032715, "global_step": 100121, "epoch": 2383} {"train_loss": -6.373930931091309, "global_step": 100122, "epoch": 2383} {"train_loss": -6.293454170227051, "global_step": 100123, "epoch": 2383} {"train_loss": -6.4015960693359375, "global_step": 100124, "epoch": 2383} {"train_loss": -6.2365851402282715, "global_step": 100125, "epoch": 2383} {"train_loss": -6.348637580871582, "global_step": 100126, "epoch": 2383} {"train_loss": -6.356478350503104, "global_step": 100127, "epoch": 2383, "val_loss": 75791.6328125} {"train_loss": -6.281335830688477, "global_step": 100128, "epoch": 2384} {"train_loss": -6.431291580200195, "global_step": 100129, "epoch": 2384} {"train_loss": -6.368444442749023, "global_step": 100130, "epoch": 2384} {"train_loss": -6.461343288421631, "global_step": 100131, "epoch": 2384} {"train_loss": -6.257018566131592, "global_step": 100132, "epoch": 2384} {"train_loss": -6.326117038726807, "global_step": 100133, "epoch": 2384} {"train_loss": -6.3464789390563965, "global_step": 100134, "epoch": 2384} {"train_loss": -6.474193572998047, "global_step": 100135, "epoch": 2384} {"train_loss": -6.411210536956787, "global_step": 100136, "epoch": 2384} {"train_loss": -6.324836730957031, "global_step": 100137, "epoch": 2384} {"train_loss": -6.428269386291504, "global_step": 100138, "epoch": 2384} {"train_loss": -6.3810319900512695, "global_step": 100139, "epoch": 2384} {"train_loss": -6.489573001861572, "global_step": 100140, "epoch": 2384} {"train_loss": -6.388850212097168, "global_step": 100141, "epoch": 2384} {"train_loss": -6.397652626037598, "global_step": 100142, "epoch": 2384} {"train_loss": -6.347232818603516, "global_step": 100143, "epoch": 2384} {"train_loss": -6.299069404602051, "global_step": 100144, "epoch": 2384} {"train_loss": -6.427648544311523, "global_step": 100145, "epoch": 2384} {"train_loss": -6.404541969299316, "global_step": 100146, "epoch": 2384} {"train_loss": -6.309060096740723, "global_step": 100147, "epoch": 2384} {"train_loss": -6.387134552001953, "global_step": 100148, "epoch": 2384} {"train_loss": -6.3846635818481445, "global_step": 100149, "epoch": 2384} {"train_loss": -6.347711563110352, "global_step": 100150, "epoch": 2384} {"train_loss": -6.219298839569092, "global_step": 100151, "epoch": 2384} {"train_loss": -6.326967716217041, "global_step": 100152, "epoch": 2384} {"train_loss": -6.421271324157715, "global_step": 100153, "epoch": 2384} {"train_loss": -6.310030937194824, "global_step": 100154, "epoch": 2384} {"train_loss": -6.410162448883057, "global_step": 100155, "epoch": 2384} {"train_loss": -6.223564624786377, "global_step": 100156, "epoch": 2384} {"train_loss": -6.3342180252075195, "global_step": 100157, "epoch": 2384} {"train_loss": -6.3209123611450195, "global_step": 100158, "epoch": 2384} {"train_loss": -6.335840702056885, "global_step": 100159, "epoch": 2384} {"train_loss": -6.2974114418029785, "global_step": 100160, "epoch": 2384} {"train_loss": -6.349038600921631, "global_step": 100161, "epoch": 2384} {"train_loss": -6.38485050201416, "global_step": 100162, "epoch": 2384} {"train_loss": -6.401659965515137, "global_step": 100163, "epoch": 2384} {"train_loss": -6.375141143798828, "global_step": 100164, "epoch": 2384} {"train_loss": -6.4349565505981445, "global_step": 100165, "epoch": 2384} {"train_loss": -6.35743522644043, "global_step": 100166, "epoch": 2384} {"train_loss": -6.325283527374268, "global_step": 100167, "epoch": 2384} {"train_loss": -6.273393154144287, "global_step": 100168, "epoch": 2384} {"train_loss": -6.35985423269726, "global_step": 100169, "epoch": 2384, "val_loss": 75822.8359375} {"train_loss": -6.3284173011779785, "global_step": 100170, "epoch": 2385} {"train_loss": -6.37985897064209, "global_step": 100171, "epoch": 2385} {"train_loss": -6.442277908325195, "global_step": 100172, "epoch": 2385} {"train_loss": -6.384033203125, "global_step": 100173, "epoch": 2385} {"train_loss": -6.426718235015869, "global_step": 100174, "epoch": 2385} {"train_loss": -6.306602478027344, "global_step": 100175, "epoch": 2385} {"train_loss": -6.483634948730469, "global_step": 100176, "epoch": 2385} {"train_loss": -6.397940635681152, "global_step": 100177, "epoch": 2385} {"train_loss": -6.370654106140137, "global_step": 100178, "epoch": 2385} {"train_loss": -6.313948154449463, "global_step": 100179, "epoch": 2385} {"train_loss": -6.346926689147949, "global_step": 100180, "epoch": 2385} {"train_loss": -6.354988098144531, "global_step": 100181, "epoch": 2385} {"train_loss": -6.46772575378418, "global_step": 100182, "epoch": 2385} {"train_loss": -6.1986284255981445, "global_step": 100183, "epoch": 2385} {"train_loss": -6.472599029541016, "global_step": 100184, "epoch": 2385} {"train_loss": -6.6134843826293945, "global_step": 100185, "epoch": 2385} {"train_loss": -6.455000877380371, "global_step": 100186, "epoch": 2385} {"train_loss": -6.372158050537109, "global_step": 100187, "epoch": 2385} {"train_loss": -6.343776226043701, "global_step": 100188, "epoch": 2385} {"train_loss": -6.366326332092285, "global_step": 100189, "epoch": 2385} {"train_loss": -6.302082061767578, "global_step": 100190, "epoch": 2385} {"train_loss": -6.211966037750244, "global_step": 100191, "epoch": 2385} {"train_loss": -6.257258892059326, "global_step": 100192, "epoch": 2385} {"train_loss": -6.364580154418945, "global_step": 100193, "epoch": 2385} {"train_loss": -6.331799030303955, "global_step": 100194, "epoch": 2385} {"train_loss": -6.456444263458252, "global_step": 100195, "epoch": 2385} {"train_loss": -6.316246032714844, "global_step": 100196, "epoch": 2385} {"train_loss": -6.324950218200684, "global_step": 100197, "epoch": 2385} {"train_loss": -6.419750213623047, "global_step": 100198, "epoch": 2385} {"train_loss": -6.457995414733887, "global_step": 100199, "epoch": 2385} {"train_loss": -6.307556629180908, "global_step": 100200, "epoch": 2385} {"train_loss": -6.243132591247559, "global_step": 100201, "epoch": 2385} {"train_loss": -6.212357521057129, "global_step": 100202, "epoch": 2385} {"train_loss": -6.303676605224609, "global_step": 100203, "epoch": 2385} {"train_loss": -6.385447978973389, "global_step": 100204, "epoch": 2385} {"train_loss": -6.337584972381592, "global_step": 100205, "epoch": 2385} {"train_loss": -6.3423566818237305, "global_step": 100206, "epoch": 2385} {"train_loss": -6.351252555847168, "global_step": 100207, "epoch": 2385} {"train_loss": -6.386637210845947, "global_step": 100208, "epoch": 2385} {"train_loss": -6.416620254516602, "global_step": 100209, "epoch": 2385} {"train_loss": -6.291780471801758, "global_step": 100210, "epoch": 2385} {"train_loss": -6.3587556566510886, "global_step": 100211, "epoch": 2385, "val_loss": 75965.015625} {"train_loss": -6.281925201416016, "global_step": 100212, "epoch": 2386} {"train_loss": -6.3177571296691895, "global_step": 100213, "epoch": 2386} {"train_loss": -6.393938064575195, "global_step": 100214, "epoch": 2386} {"train_loss": -6.33386754989624, "global_step": 100215, "epoch": 2386} {"train_loss": -6.222664833068848, "global_step": 100216, "epoch": 2386} {"train_loss": -6.353489875793457, "global_step": 100217, "epoch": 2386} {"train_loss": -6.286088943481445, "global_step": 100218, "epoch": 2386} {"train_loss": -6.195084571838379, "global_step": 100219, "epoch": 2386} {"train_loss": -6.31220817565918, "global_step": 100220, "epoch": 2386} {"train_loss": -6.309227466583252, "global_step": 100221, "epoch": 2386} {"train_loss": -6.3806257247924805, "global_step": 100222, "epoch": 2386} {"train_loss": -6.367001533508301, "global_step": 100223, "epoch": 2386} {"train_loss": -6.297187805175781, "global_step": 100224, "epoch": 2386} {"train_loss": -6.414261817932129, "global_step": 100225, "epoch": 2386} {"train_loss": -6.425379753112793, "global_step": 100226, "epoch": 2386} {"train_loss": -6.336907386779785, "global_step": 100227, "epoch": 2386} {"train_loss": -6.467921733856201, "global_step": 100228, "epoch": 2386} {"train_loss": -6.265379428863525, "global_step": 100229, "epoch": 2386} {"train_loss": -6.368850231170654, "global_step": 100230, "epoch": 2386} {"train_loss": -6.200262546539307, "global_step": 100231, "epoch": 2386} {"train_loss": -6.458940029144287, "global_step": 100232, "epoch": 2386} {"train_loss": -6.308810234069824, "global_step": 100233, "epoch": 2386} {"train_loss": -6.362773895263672, "global_step": 100234, "epoch": 2386} {"train_loss": -6.338766098022461, "global_step": 100235, "epoch": 2386} {"train_loss": -6.287675380706787, "global_step": 100236, "epoch": 2386} {"train_loss": -6.3584394454956055, "global_step": 100237, "epoch": 2386} {"train_loss": -6.328049659729004, "global_step": 100238, "epoch": 2386} {"train_loss": -6.444634437561035, "global_step": 100239, "epoch": 2386} {"train_loss": -6.382371425628662, "global_step": 100240, "epoch": 2386} {"train_loss": -6.392565727233887, "global_step": 100241, "epoch": 2386} {"train_loss": -6.258317947387695, "global_step": 100242, "epoch": 2386} {"train_loss": -6.382731914520264, "global_step": 100243, "epoch": 2386} {"train_loss": -6.4049482345581055, "global_step": 100244, "epoch": 2386} {"train_loss": -6.273989200592041, "global_step": 100245, "epoch": 2386} {"train_loss": -6.337265491485596, "global_step": 100246, "epoch": 2386} {"train_loss": -6.388728618621826, "global_step": 100247, "epoch": 2386} {"train_loss": -6.290468692779541, "global_step": 100248, "epoch": 2386} {"train_loss": -6.348334312438965, "global_step": 100249, "epoch": 2386} {"train_loss": -6.274099826812744, "global_step": 100250, "epoch": 2386} {"train_loss": -6.185642719268799, "global_step": 100251, "epoch": 2386} {"train_loss": -6.304181098937988, "global_step": 100252, "epoch": 2386} {"train_loss": -6.330347140630086, "global_step": 100253, "epoch": 2386, "val_loss": 75886.7578125} {"train_loss": -6.455379009246826, "global_step": 100254, "epoch": 2387} {"train_loss": -6.341371536254883, "global_step": 100255, "epoch": 2387} {"train_loss": -6.407296657562256, "global_step": 100256, "epoch": 2387} {"train_loss": -6.409149169921875, "global_step": 100257, "epoch": 2387} {"train_loss": -6.440535545349121, "global_step": 100258, "epoch": 2387} {"train_loss": -6.336539268493652, "global_step": 100259, "epoch": 2387} {"train_loss": -6.363803863525391, "global_step": 100260, "epoch": 2387} {"train_loss": -6.3288068771362305, "global_step": 100261, "epoch": 2387} {"train_loss": -6.367671012878418, "global_step": 100262, "epoch": 2387} {"train_loss": -6.440946578979492, "global_step": 100263, "epoch": 2387} {"train_loss": -6.375120639801025, "global_step": 100264, "epoch": 2387} {"train_loss": -6.3810319900512695, "global_step": 100265, "epoch": 2387} {"train_loss": -6.4033613204956055, "global_step": 100266, "epoch": 2387} {"train_loss": -6.45627498626709, "global_step": 100267, "epoch": 2387} {"train_loss": -6.460499286651611, "global_step": 100268, "epoch": 2387} {"train_loss": -6.331780910491943, "global_step": 100269, "epoch": 2387} {"train_loss": -6.373383045196533, "global_step": 100270, "epoch": 2387} {"train_loss": -6.360763072967529, "global_step": 100271, "epoch": 2387} {"train_loss": -6.264491081237793, "global_step": 100272, "epoch": 2387} {"train_loss": -6.304976463317871, "global_step": 100273, "epoch": 2387} {"train_loss": -6.303208351135254, "global_step": 100274, "epoch": 2387} {"train_loss": -6.284627437591553, "global_step": 100275, "epoch": 2387} {"train_loss": -6.261328220367432, "global_step": 100276, "epoch": 2387} {"train_loss": -6.389723300933838, "global_step": 100277, "epoch": 2387} {"train_loss": -6.21640682220459, "global_step": 100278, "epoch": 2387} {"train_loss": -6.28846549987793, "global_step": 100279, "epoch": 2387} {"train_loss": -6.3289337158203125, "global_step": 100280, "epoch": 2387} {"train_loss": -6.158395290374756, "global_step": 100281, "epoch": 2387} {"train_loss": -6.416666507720947, "global_step": 100282, "epoch": 2387} {"train_loss": -6.408900260925293, "global_step": 100283, "epoch": 2387} {"train_loss": -6.1785712242126465, "global_step": 100284, "epoch": 2387} {"train_loss": -6.398193836212158, "global_step": 100285, "epoch": 2387} {"train_loss": -6.31866455078125, "global_step": 100286, "epoch": 2387} {"train_loss": -6.3187785148620605, "global_step": 100287, "epoch": 2387} {"train_loss": -6.2857561111450195, "global_step": 100288, "epoch": 2387} {"train_loss": -6.349187850952148, "global_step": 100289, "epoch": 2387} {"train_loss": -6.351553440093994, "global_step": 100290, "epoch": 2387} {"train_loss": -6.443748474121094, "global_step": 100291, "epoch": 2387} {"train_loss": -6.414487838745117, "global_step": 100292, "epoch": 2387} {"train_loss": -6.255456447601318, "global_step": 100293, "epoch": 2387} {"train_loss": -6.319490432739258, "global_step": 100294, "epoch": 2387} {"train_loss": -6.348972751980736, "global_step": 100295, "epoch": 2387, "val_loss": 75522.9140625} {"train_loss": -6.217613220214844, "global_step": 100296, "epoch": 2388} {"train_loss": -6.3684892654418945, "global_step": 100297, "epoch": 2388} {"train_loss": -6.326167583465576, "global_step": 100298, "epoch": 2388} {"train_loss": -6.360306739807129, "global_step": 100299, "epoch": 2388} {"train_loss": -6.4638495445251465, "global_step": 100300, "epoch": 2388} {"train_loss": -6.276120185852051, "global_step": 100301, "epoch": 2388} {"train_loss": -6.393612384796143, "global_step": 100302, "epoch": 2388} {"train_loss": -6.290324687957764, "global_step": 100303, "epoch": 2388} {"train_loss": -6.3067708015441895, "global_step": 100304, "epoch": 2388} {"train_loss": -6.417330265045166, "global_step": 100305, "epoch": 2388} {"train_loss": -6.346957206726074, "global_step": 100306, "epoch": 2388} {"train_loss": -6.394020080566406, "global_step": 100307, "epoch": 2388} {"train_loss": -6.297918319702148, "global_step": 100308, "epoch": 2388} {"train_loss": -6.349713325500488, "global_step": 100309, "epoch": 2388} {"train_loss": -6.441896438598633, "global_step": 100310, "epoch": 2388} {"train_loss": -6.353127479553223, "global_step": 100311, "epoch": 2388} {"train_loss": -6.278548717498779, "global_step": 100312, "epoch": 2388} {"train_loss": -6.4095587730407715, "global_step": 100313, "epoch": 2388} {"train_loss": -6.3888349533081055, "global_step": 100314, "epoch": 2388} {"train_loss": -6.374771595001221, "global_step": 100315, "epoch": 2388} {"train_loss": -6.254207134246826, "global_step": 100316, "epoch": 2388} {"train_loss": -6.3340373039245605, "global_step": 100317, "epoch": 2388} {"train_loss": -6.454730033874512, "global_step": 100318, "epoch": 2388} {"train_loss": -6.2685136795043945, "global_step": 100319, "epoch": 2388} {"train_loss": -6.445976734161377, "global_step": 100320, "epoch": 2388} {"train_loss": -6.233879089355469, "global_step": 100321, "epoch": 2388} {"train_loss": -6.221303939819336, "global_step": 100322, "epoch": 2388} {"train_loss": -6.427919387817383, "global_step": 100323, "epoch": 2388} {"train_loss": -6.302748203277588, "global_step": 100324, "epoch": 2388} {"train_loss": -6.308852195739746, "global_step": 100325, "epoch": 2388} {"train_loss": -6.229118824005127, "global_step": 100326, "epoch": 2388} {"train_loss": -6.311100959777832, "global_step": 100327, "epoch": 2388} {"train_loss": -6.2724480628967285, "global_step": 100328, "epoch": 2388} {"train_loss": -6.344040870666504, "global_step": 100329, "epoch": 2388} {"train_loss": -6.136173725128174, "global_step": 100330, "epoch": 2388} {"train_loss": -6.258140563964844, "global_step": 100331, "epoch": 2388} {"train_loss": -6.2210798263549805, "global_step": 100332, "epoch": 2388} {"train_loss": -6.2091264724731445, "global_step": 100333, "epoch": 2388} {"train_loss": -6.3525238037109375, "global_step": 100334, "epoch": 2388} {"train_loss": -6.282589912414551, "global_step": 100335, "epoch": 2388} {"train_loss": -6.243729114532471, "global_step": 100336, "epoch": 2388} {"train_loss": -6.321256819225493, "global_step": 100337, "epoch": 2388, "val_loss": 75752.03125} {"train_loss": -6.367772579193115, "global_step": 100338, "epoch": 2389} {"train_loss": -6.269637584686279, "global_step": 100339, "epoch": 2389} {"train_loss": -6.401066303253174, "global_step": 100340, "epoch": 2389} {"train_loss": -6.342467308044434, "global_step": 100341, "epoch": 2389} {"train_loss": -6.349283695220947, "global_step": 100342, "epoch": 2389} {"train_loss": -6.332675933837891, "global_step": 100343, "epoch": 2389} {"train_loss": -6.3618550300598145, "global_step": 100344, "epoch": 2389} {"train_loss": -6.405541896820068, "global_step": 100345, "epoch": 2389} {"train_loss": -6.368391036987305, "global_step": 100346, "epoch": 2389} {"train_loss": -6.38809061050415, "global_step": 100347, "epoch": 2389} {"train_loss": -6.347068786621094, "global_step": 100348, "epoch": 2389} {"train_loss": -6.420989990234375, "global_step": 100349, "epoch": 2389} {"train_loss": -6.486444473266602, "global_step": 100350, "epoch": 2389} {"train_loss": -6.482443809509277, "global_step": 100351, "epoch": 2389} {"train_loss": -6.364536762237549, "global_step": 100352, "epoch": 2389} {"train_loss": -6.404975891113281, "global_step": 100353, "epoch": 2389} {"train_loss": -6.495217800140381, "global_step": 100354, "epoch": 2389} {"train_loss": -6.347938060760498, "global_step": 100355, "epoch": 2389} {"train_loss": -6.353730201721191, "global_step": 100356, "epoch": 2389} {"train_loss": -6.401613235473633, "global_step": 100357, "epoch": 2389} {"train_loss": -6.35819673538208, "global_step": 100358, "epoch": 2389} {"train_loss": -6.367425441741943, "global_step": 100359, "epoch": 2389} {"train_loss": -6.323516845703125, "global_step": 100360, "epoch": 2389} {"train_loss": -6.442600250244141, "global_step": 100361, "epoch": 2389} {"train_loss": -6.336636066436768, "global_step": 100362, "epoch": 2389} {"train_loss": -6.330473899841309, "global_step": 100363, "epoch": 2389} {"train_loss": -6.191790580749512, "global_step": 100364, "epoch": 2389} {"train_loss": -6.439016342163086, "global_step": 100365, "epoch": 2389} {"train_loss": -6.254795551300049, "global_step": 100366, "epoch": 2389} {"train_loss": -6.344366073608398, "global_step": 100367, "epoch": 2389} {"train_loss": -6.486075401306152, "global_step": 100368, "epoch": 2389} {"train_loss": -6.194084644317627, "global_step": 100369, "epoch": 2389} {"train_loss": -6.300498962402344, "global_step": 100370, "epoch": 2389} {"train_loss": -6.351625442504883, "global_step": 100371, "epoch": 2389} {"train_loss": -6.2794599533081055, "global_step": 100372, "epoch": 2389} {"train_loss": -6.148433685302734, "global_step": 100373, "epoch": 2389} {"train_loss": -6.26630973815918, "global_step": 100374, "epoch": 2389} {"train_loss": -6.37855863571167, "global_step": 100375, "epoch": 2389} {"train_loss": -6.251029014587402, "global_step": 100376, "epoch": 2389} {"train_loss": -6.2456512451171875, "global_step": 100377, "epoch": 2389} {"train_loss": -6.274447441101074, "global_step": 100378, "epoch": 2389} {"train_loss": -6.345268930707659, "global_step": 100379, "epoch": 2389, "val_loss": 75845.7421875} {"train_loss": -6.335250377655029, "global_step": 100380, "epoch": 2390} {"train_loss": -6.360921859741211, "global_step": 100381, "epoch": 2390} {"train_loss": -6.265802383422852, "global_step": 100382, "epoch": 2390} {"train_loss": -6.3485918045043945, "global_step": 100383, "epoch": 2390} {"train_loss": -6.355803966522217, "global_step": 100384, "epoch": 2390} {"train_loss": -6.4434123039245605, "global_step": 100385, "epoch": 2390} {"train_loss": -6.356146335601807, "global_step": 100386, "epoch": 2390} {"train_loss": -6.412858009338379, "global_step": 100387, "epoch": 2390} {"train_loss": -6.308014869689941, "global_step": 100388, "epoch": 2390} {"train_loss": -6.341028690338135, "global_step": 100389, "epoch": 2390} {"train_loss": -6.39104700088501, "global_step": 100390, "epoch": 2390} {"train_loss": -6.279277324676514, "global_step": 100391, "epoch": 2390} {"train_loss": -6.192358016967773, "global_step": 100392, "epoch": 2390} {"train_loss": -6.400454521179199, "global_step": 100393, "epoch": 2390} {"train_loss": -6.310320854187012, "global_step": 100394, "epoch": 2390} {"train_loss": -6.171148777008057, "global_step": 100395, "epoch": 2390} {"train_loss": -6.305240631103516, "global_step": 100396, "epoch": 2390} {"train_loss": -6.345582962036133, "global_step": 100397, "epoch": 2390} {"train_loss": -6.380392074584961, "global_step": 100398, "epoch": 2390} {"train_loss": -6.386519432067871, "global_step": 100399, "epoch": 2390} {"train_loss": -6.323065757751465, "global_step": 100400, "epoch": 2390} {"train_loss": -6.393134117126465, "global_step": 100401, "epoch": 2390} {"train_loss": -6.301215648651123, "global_step": 100402, "epoch": 2390} {"train_loss": -6.327670097351074, "global_step": 100403, "epoch": 2390} {"train_loss": -6.328770637512207, "global_step": 100404, "epoch": 2390} {"train_loss": -6.359764099121094, "global_step": 100405, "epoch": 2390} {"train_loss": -6.282379627227783, "global_step": 100406, "epoch": 2390} {"train_loss": -6.397454261779785, "global_step": 100407, "epoch": 2390} {"train_loss": -6.366538047790527, "global_step": 100408, "epoch": 2390} {"train_loss": -6.284445762634277, "global_step": 100409, "epoch": 2390} {"train_loss": -6.4075541496276855, "global_step": 100410, "epoch": 2390} {"train_loss": -6.332354545593262, "global_step": 100411, "epoch": 2390} {"train_loss": -6.455633163452148, "global_step": 100412, "epoch": 2390} {"train_loss": -6.314226150512695, "global_step": 100413, "epoch": 2390} {"train_loss": -6.3902740478515625, "global_step": 100414, "epoch": 2390} {"train_loss": -6.191653251647949, "global_step": 100415, "epoch": 2390} {"train_loss": -6.303702354431152, "global_step": 100416, "epoch": 2390} {"train_loss": -6.322441101074219, "global_step": 100417, "epoch": 2390} {"train_loss": -6.41432523727417, "global_step": 100418, "epoch": 2390} {"train_loss": -6.356868743896484, "global_step": 100419, "epoch": 2390} {"train_loss": -6.492977142333984, "global_step": 100420, "epoch": 2390} {"train_loss": -6.342952909923735, "global_step": 100421, "epoch": 2390, "val_loss": 76064.0078125} {"train_loss": -6.345624923706055, "global_step": 100422, "epoch": 2391} {"train_loss": -6.442830562591553, "global_step": 100423, "epoch": 2391} {"train_loss": -6.486883163452148, "global_step": 100424, "epoch": 2391} {"train_loss": -6.427459716796875, "global_step": 100425, "epoch": 2391} {"train_loss": -6.426668167114258, "global_step": 100426, "epoch": 2391} {"train_loss": -6.301727771759033, "global_step": 100427, "epoch": 2391} {"train_loss": -6.47878885269165, "global_step": 100428, "epoch": 2391} {"train_loss": -6.351401329040527, "global_step": 100429, "epoch": 2391} {"train_loss": -6.41957950592041, "global_step": 100430, "epoch": 2391} {"train_loss": -6.4863481521606445, "global_step": 100431, "epoch": 2391} {"train_loss": -6.286432266235352, "global_step": 100432, "epoch": 2391} {"train_loss": -6.406599998474121, "global_step": 100433, "epoch": 2391} {"train_loss": -6.3670148849487305, "global_step": 100434, "epoch": 2391} {"train_loss": -6.312929630279541, "global_step": 100435, "epoch": 2391} {"train_loss": -6.3197245597839355, "global_step": 100436, "epoch": 2391} {"train_loss": -6.258999347686768, "global_step": 100437, "epoch": 2391} {"train_loss": -6.387576580047607, "global_step": 100438, "epoch": 2391} {"train_loss": -6.350525856018066, "global_step": 100439, "epoch": 2391} {"train_loss": -6.324580192565918, "global_step": 100440, "epoch": 2391} {"train_loss": -6.367414474487305, "global_step": 100441, "epoch": 2391} {"train_loss": -6.323916435241699, "global_step": 100442, "epoch": 2391} {"train_loss": -6.263583183288574, "global_step": 100443, "epoch": 2391} {"train_loss": -6.459171295166016, "global_step": 100444, "epoch": 2391} {"train_loss": -6.352788925170898, "global_step": 100445, "epoch": 2391} {"train_loss": -6.4553937911987305, "global_step": 100446, "epoch": 2391} {"train_loss": -6.380619525909424, "global_step": 100447, "epoch": 2391} {"train_loss": -6.310054779052734, "global_step": 100448, "epoch": 2391} {"train_loss": -6.38018798828125, "global_step": 100449, "epoch": 2391} {"train_loss": -6.282837867736816, "global_step": 100450, "epoch": 2391} {"train_loss": -6.378540992736816, "global_step": 100451, "epoch": 2391} {"train_loss": -6.2704386711120605, "global_step": 100452, "epoch": 2391} {"train_loss": -6.421429634094238, "global_step": 100453, "epoch": 2391} {"train_loss": -6.312655448913574, "global_step": 100454, "epoch": 2391} {"train_loss": -6.301580429077148, "global_step": 100455, "epoch": 2391} {"train_loss": -6.37494421005249, "global_step": 100456, "epoch": 2391} {"train_loss": -6.249670028686523, "global_step": 100457, "epoch": 2391} {"train_loss": -6.316690921783447, "global_step": 100458, "epoch": 2391} {"train_loss": -6.367728233337402, "global_step": 100459, "epoch": 2391} {"train_loss": -6.295210838317871, "global_step": 100460, "epoch": 2391} {"train_loss": -6.284823894500732, "global_step": 100461, "epoch": 2391} {"train_loss": -6.3030853271484375, "global_step": 100462, "epoch": 2391} {"train_loss": -6.358560562133789, "global_step": 100463, "epoch": 2391, "val_loss": 76166.46875} {"train_loss": -6.330162048339844, "global_step": 100464, "epoch": 2392} {"train_loss": -6.333613395690918, "global_step": 100465, "epoch": 2392} {"train_loss": -6.218003749847412, "global_step": 100466, "epoch": 2392} {"train_loss": -6.360646724700928, "global_step": 100467, "epoch": 2392} {"train_loss": -6.400533676147461, "global_step": 100468, "epoch": 2392} {"train_loss": -6.3524065017700195, "global_step": 100469, "epoch": 2392} {"train_loss": -6.369539260864258, "global_step": 100470, "epoch": 2392} {"train_loss": -6.3017120361328125, "global_step": 100471, "epoch": 2392} {"train_loss": -6.291141986846924, "global_step": 100472, "epoch": 2392} {"train_loss": -6.257248878479004, "global_step": 100473, "epoch": 2392} {"train_loss": -6.386085510253906, "global_step": 100474, "epoch": 2392} {"train_loss": -6.309506416320801, "global_step": 100475, "epoch": 2392} {"train_loss": -6.438458442687988, "global_step": 100476, "epoch": 2392} {"train_loss": -6.3377885818481445, "global_step": 100477, "epoch": 2392} {"train_loss": -6.269636631011963, "global_step": 100478, "epoch": 2392} {"train_loss": -6.383299350738525, "global_step": 100479, "epoch": 2392} {"train_loss": -6.273983955383301, "global_step": 100480, "epoch": 2392} {"train_loss": -6.331686496734619, "global_step": 100481, "epoch": 2392} {"train_loss": -6.26890754699707, "global_step": 100482, "epoch": 2392} {"train_loss": -6.3233184814453125, "global_step": 100483, "epoch": 2392} {"train_loss": -6.318846702575684, "global_step": 100484, "epoch": 2392} {"train_loss": -6.334557056427002, "global_step": 100485, "epoch": 2392} {"train_loss": -6.28934383392334, "global_step": 100486, "epoch": 2392} {"train_loss": -6.414231300354004, "global_step": 100487, "epoch": 2392} {"train_loss": -6.358608245849609, "global_step": 100488, "epoch": 2392} {"train_loss": -6.464068412780762, "global_step": 100489, "epoch": 2392} {"train_loss": -6.340137958526611, "global_step": 100490, "epoch": 2392} {"train_loss": -6.400179862976074, "global_step": 100491, "epoch": 2392} {"train_loss": -6.428831100463867, "global_step": 100492, "epoch": 2392} {"train_loss": -6.33642578125, "global_step": 100493, "epoch": 2392} {"train_loss": -6.37693452835083, "global_step": 100494, "epoch": 2392} {"train_loss": -6.322362899780273, "global_step": 100495, "epoch": 2392} {"train_loss": -6.378208160400391, "global_step": 100496, "epoch": 2392} {"train_loss": -6.416454792022705, "global_step": 100497, "epoch": 2392} {"train_loss": -6.374195098876953, "global_step": 100498, "epoch": 2392} {"train_loss": -6.461657524108887, "global_step": 100499, "epoch": 2392} {"train_loss": -6.259317398071289, "global_step": 100500, "epoch": 2392} {"train_loss": -6.299404621124268, "global_step": 100501, "epoch": 2392} {"train_loss": -6.336421489715576, "global_step": 100502, "epoch": 2392} {"train_loss": -6.315341949462891, "global_step": 100503, "epoch": 2392} {"train_loss": -6.261018753051758, "global_step": 100504, "epoch": 2392} {"train_loss": -6.337996255783808, "global_step": 100505, "epoch": 2392, "val_loss": 76471.640625} {"train_loss": -6.314705848693848, "global_step": 100506, "epoch": 2393} {"train_loss": -6.178072929382324, "global_step": 100507, "epoch": 2393} {"train_loss": -6.4663190841674805, "global_step": 100508, "epoch": 2393} {"train_loss": -6.2960920333862305, "global_step": 100509, "epoch": 2393} {"train_loss": -6.341517448425293, "global_step": 100510, "epoch": 2393} {"train_loss": -6.3253655433654785, "global_step": 100511, "epoch": 2393} {"train_loss": -6.245511531829834, "global_step": 100512, "epoch": 2393} {"train_loss": -6.43680477142334, "global_step": 100513, "epoch": 2393} {"train_loss": -6.320127964019775, "global_step": 100514, "epoch": 2393} {"train_loss": -6.38448429107666, "global_step": 100515, "epoch": 2393} {"train_loss": -6.352631092071533, "global_step": 100516, "epoch": 2393} {"train_loss": -6.292387008666992, "global_step": 100517, "epoch": 2393} {"train_loss": -6.510660171508789, "global_step": 100518, "epoch": 2393} {"train_loss": -6.295759201049805, "global_step": 100519, "epoch": 2393} {"train_loss": -6.310669898986816, "global_step": 100520, "epoch": 2393} {"train_loss": -6.309810638427734, "global_step": 100521, "epoch": 2393} {"train_loss": -6.3858842849731445, "global_step": 100522, "epoch": 2393} {"train_loss": -6.353392601013184, "global_step": 100523, "epoch": 2393} {"train_loss": -6.383317947387695, "global_step": 100524, "epoch": 2393} {"train_loss": -6.215776443481445, "global_step": 100525, "epoch": 2393} {"train_loss": -6.4350152015686035, "global_step": 100526, "epoch": 2393} {"train_loss": -6.351409912109375, "global_step": 100527, "epoch": 2393} {"train_loss": -6.430142402648926, "global_step": 100528, "epoch": 2393} {"train_loss": -6.276956558227539, "global_step": 100529, "epoch": 2393} {"train_loss": -6.40130615234375, "global_step": 100530, "epoch": 2393} {"train_loss": -6.381556034088135, "global_step": 100531, "epoch": 2393} {"train_loss": -6.30916690826416, "global_step": 100532, "epoch": 2393} {"train_loss": -6.394430160522461, "global_step": 100533, "epoch": 2393} {"train_loss": -6.423458576202393, "global_step": 100534, "epoch": 2393} {"train_loss": -6.289318561553955, "global_step": 100535, "epoch": 2393} {"train_loss": -6.356130599975586, "global_step": 100536, "epoch": 2393} {"train_loss": -6.319108009338379, "global_step": 100537, "epoch": 2393} {"train_loss": -6.457090377807617, "global_step": 100538, "epoch": 2393} {"train_loss": -6.431121826171875, "global_step": 100539, "epoch": 2393} {"train_loss": -6.318866729736328, "global_step": 100540, "epoch": 2393} {"train_loss": -6.408749103546143, "global_step": 100541, "epoch": 2393} {"train_loss": -6.36252498626709, "global_step": 100542, "epoch": 2393} {"train_loss": -6.393899917602539, "global_step": 100543, "epoch": 2393} {"train_loss": -6.370772361755371, "global_step": 100544, "epoch": 2393} {"train_loss": -6.383020401000977, "global_step": 100545, "epoch": 2393} {"train_loss": -6.518621921539307, "global_step": 100546, "epoch": 2393} {"train_loss": -6.359707083020892, "global_step": 100547, "epoch": 2393, "val_loss": 75718.375} {"train_loss": -6.343014717102051, "global_step": 100548, "epoch": 2394} {"train_loss": -6.445829391479492, "global_step": 100549, "epoch": 2394} {"train_loss": -6.357430934906006, "global_step": 100550, "epoch": 2394} {"train_loss": -6.3309102058410645, "global_step": 100551, "epoch": 2394} {"train_loss": -6.29707145690918, "global_step": 100552, "epoch": 2394} {"train_loss": -6.395441055297852, "global_step": 100553, "epoch": 2394} {"train_loss": -6.265989303588867, "global_step": 100554, "epoch": 2394} {"train_loss": -6.354781150817871, "global_step": 100555, "epoch": 2394} {"train_loss": -6.366305828094482, "global_step": 100556, "epoch": 2394} {"train_loss": -6.430030345916748, "global_step": 100557, "epoch": 2394} {"train_loss": -6.396044731140137, "global_step": 100558, "epoch": 2394} {"train_loss": -6.468797206878662, "global_step": 100559, "epoch": 2394} {"train_loss": -6.409760475158691, "global_step": 100560, "epoch": 2394} {"train_loss": -6.313703536987305, "global_step": 100561, "epoch": 2394} {"train_loss": -6.368332386016846, "global_step": 100562, "epoch": 2394} {"train_loss": -6.267375469207764, "global_step": 100563, "epoch": 2394} {"train_loss": -6.383142948150635, "global_step": 100564, "epoch": 2394} {"train_loss": -6.3459153175354, "global_step": 100565, "epoch": 2394} {"train_loss": -6.311432838439941, "global_step": 100566, "epoch": 2394} {"train_loss": -6.327246189117432, "global_step": 100567, "epoch": 2394} {"train_loss": -6.386114120483398, "global_step": 100568, "epoch": 2394} {"train_loss": -6.3013081550598145, "global_step": 100569, "epoch": 2394} {"train_loss": -6.387042045593262, "global_step": 100570, "epoch": 2394} {"train_loss": -6.303284645080566, "global_step": 100571, "epoch": 2394} {"train_loss": -6.257378101348877, "global_step": 100572, "epoch": 2394} {"train_loss": -6.266629219055176, "global_step": 100573, "epoch": 2394} {"train_loss": -6.309380531311035, "global_step": 100574, "epoch": 2394} {"train_loss": -6.295373439788818, "global_step": 100575, "epoch": 2394} {"train_loss": -6.331399917602539, "global_step": 100576, "epoch": 2394} {"train_loss": -6.217596054077148, "global_step": 100577, "epoch": 2394} {"train_loss": -6.287775039672852, "global_step": 100578, "epoch": 2394} {"train_loss": -6.379643440246582, "global_step": 100579, "epoch": 2394} {"train_loss": -6.329031944274902, "global_step": 100580, "epoch": 2394} {"train_loss": -6.441729545593262, "global_step": 100581, "epoch": 2394} {"train_loss": -6.328670501708984, "global_step": 100582, "epoch": 2394} {"train_loss": -6.33577823638916, "global_step": 100583, "epoch": 2394} {"train_loss": -6.3198699951171875, "global_step": 100584, "epoch": 2394} {"train_loss": -6.34758186340332, "global_step": 100585, "epoch": 2394} {"train_loss": -6.344488143920898, "global_step": 100586, "epoch": 2394} {"train_loss": -6.285485744476318, "global_step": 100587, "epoch": 2394} {"train_loss": -6.402063369750977, "global_step": 100588, "epoch": 2394} {"train_loss": -6.344232865742275, "global_step": 100589, "epoch": 2394, "val_loss": 75785.125} {"train_loss": -6.444915771484375, "global_step": 100590, "epoch": 2395} {"train_loss": -6.485203742980957, "global_step": 100591, "epoch": 2395} {"train_loss": -6.2889790534973145, "global_step": 100592, "epoch": 2395} {"train_loss": -6.3881120681762695, "global_step": 100593, "epoch": 2395} {"train_loss": -6.443737030029297, "global_step": 100594, "epoch": 2395} {"train_loss": -6.3566389083862305, "global_step": 100595, "epoch": 2395} {"train_loss": -6.277417182922363, "global_step": 100596, "epoch": 2395} {"train_loss": -6.432309150695801, "global_step": 100597, "epoch": 2395} {"train_loss": -6.351863384246826, "global_step": 100598, "epoch": 2395} {"train_loss": -6.331151962280273, "global_step": 100599, "epoch": 2395} {"train_loss": -6.359975814819336, "global_step": 100600, "epoch": 2395} {"train_loss": -6.361715316772461, "global_step": 100601, "epoch": 2395} {"train_loss": -6.467339515686035, "global_step": 100602, "epoch": 2395} {"train_loss": -6.49497127532959, "global_step": 100603, "epoch": 2395} {"train_loss": -6.532504081726074, "global_step": 100604, "epoch": 2395} {"train_loss": -6.366656303405762, "global_step": 100605, "epoch": 2395} {"train_loss": -6.445584297180176, "global_step": 100606, "epoch": 2395} {"train_loss": -6.386922836303711, "global_step": 100607, "epoch": 2395} {"train_loss": -6.318870544433594, "global_step": 100608, "epoch": 2395} {"train_loss": -6.416698932647705, "global_step": 100609, "epoch": 2395} {"train_loss": -6.348456859588623, "global_step": 100610, "epoch": 2395} {"train_loss": -6.279601097106934, "global_step": 100611, "epoch": 2395} {"train_loss": -6.369759559631348, "global_step": 100612, "epoch": 2395} {"train_loss": -6.3942108154296875, "global_step": 100613, "epoch": 2395} {"train_loss": -6.374425411224365, "global_step": 100614, "epoch": 2395} {"train_loss": -6.334344387054443, "global_step": 100615, "epoch": 2395} {"train_loss": -6.457389831542969, "global_step": 100616, "epoch": 2395} {"train_loss": -6.39088249206543, "global_step": 100617, "epoch": 2395} {"train_loss": -6.451574325561523, "global_step": 100618, "epoch": 2395} {"train_loss": -6.5253753662109375, "global_step": 100619, "epoch": 2395} {"train_loss": -6.423736572265625, "global_step": 100620, "epoch": 2395} {"train_loss": -6.395210266113281, "global_step": 100621, "epoch": 2395} {"train_loss": -6.380544662475586, "global_step": 100622, "epoch": 2395} {"train_loss": -6.352252006530762, "global_step": 100623, "epoch": 2395} {"train_loss": -6.45198917388916, "global_step": 100624, "epoch": 2395} {"train_loss": -6.4008378982543945, "global_step": 100625, "epoch": 2395} {"train_loss": -6.4163899421691895, "global_step": 100626, "epoch": 2395} {"train_loss": -6.320306777954102, "global_step": 100627, "epoch": 2395} {"train_loss": -6.350930690765381, "global_step": 100628, "epoch": 2395} {"train_loss": -6.285480499267578, "global_step": 100629, "epoch": 2395} {"train_loss": -6.451681137084961, "global_step": 100630, "epoch": 2395} {"train_loss": -6.389831997099376, "global_step": 100631, "epoch": 2395, "val_loss": 75660.9140625} {"train_loss": -6.396119594573975, "global_step": 100632, "epoch": 2396} {"train_loss": -6.344571113586426, "global_step": 100633, "epoch": 2396} {"train_loss": -6.397085666656494, "global_step": 100634, "epoch": 2396} {"train_loss": -6.3969855308532715, "global_step": 100635, "epoch": 2396} {"train_loss": -6.300920486450195, "global_step": 100636, "epoch": 2396} {"train_loss": -6.44792366027832, "global_step": 100637, "epoch": 2396} {"train_loss": -6.527233600616455, "global_step": 100638, "epoch": 2396} {"train_loss": -6.338105201721191, "global_step": 100639, "epoch": 2396} {"train_loss": -6.407753944396973, "global_step": 100640, "epoch": 2396} {"train_loss": -6.40866756439209, "global_step": 100641, "epoch": 2396} {"train_loss": -6.478670120239258, "global_step": 100642, "epoch": 2396} {"train_loss": -6.392613410949707, "global_step": 100643, "epoch": 2396} {"train_loss": -6.379169464111328, "global_step": 100644, "epoch": 2396} {"train_loss": -6.2956156730651855, "global_step": 100645, "epoch": 2396} {"train_loss": -6.281835556030273, "global_step": 100646, "epoch": 2396} {"train_loss": -6.397150039672852, "global_step": 100647, "epoch": 2396} {"train_loss": -6.327040195465088, "global_step": 100648, "epoch": 2396} {"train_loss": -6.349147319793701, "global_step": 100649, "epoch": 2396} {"train_loss": -6.337076187133789, "global_step": 100650, "epoch": 2396} {"train_loss": -6.269060134887695, "global_step": 100651, "epoch": 2396} {"train_loss": -6.308419704437256, "global_step": 100652, "epoch": 2396} {"train_loss": -6.441745758056641, "global_step": 100653, "epoch": 2396} {"train_loss": -6.470112323760986, "global_step": 100654, "epoch": 2396} {"train_loss": -6.396900177001953, "global_step": 100655, "epoch": 2396} {"train_loss": -6.3342742919921875, "global_step": 100656, "epoch": 2396} {"train_loss": -6.407774448394775, "global_step": 100657, "epoch": 2396} {"train_loss": -6.338229656219482, "global_step": 100658, "epoch": 2396} {"train_loss": -6.3585686683654785, "global_step": 100659, "epoch": 2396} {"train_loss": -6.285867691040039, "global_step": 100660, "epoch": 2396} {"train_loss": -6.334040641784668, "global_step": 100661, "epoch": 2396} {"train_loss": -6.374780654907227, "global_step": 100662, "epoch": 2396} {"train_loss": -6.352104187011719, "global_step": 100663, "epoch": 2396} {"train_loss": -6.352662086486816, "global_step": 100664, "epoch": 2396} {"train_loss": -6.289032936096191, "global_step": 100665, "epoch": 2396} {"train_loss": -6.280409812927246, "global_step": 100666, "epoch": 2396} {"train_loss": -6.392509937286377, "global_step": 100667, "epoch": 2396} {"train_loss": -6.388663291931152, "global_step": 100668, "epoch": 2396} {"train_loss": -6.385529518127441, "global_step": 100669, "epoch": 2396} {"train_loss": -6.358000755310059, "global_step": 100670, "epoch": 2396} {"train_loss": -6.380847930908203, "global_step": 100671, "epoch": 2396} {"train_loss": -6.349422454833984, "global_step": 100672, "epoch": 2396} {"train_loss": -6.365588051932199, "global_step": 100673, "epoch": 2396, "val_loss": 75816.6171875} {"train_loss": -6.345251083374023, "global_step": 100674, "epoch": 2397} {"train_loss": -6.326767444610596, "global_step": 100675, "epoch": 2397} {"train_loss": -6.334318161010742, "global_step": 100676, "epoch": 2397} {"train_loss": -6.369592666625977, "global_step": 100677, "epoch": 2397} {"train_loss": -6.317068099975586, "global_step": 100678, "epoch": 2397} {"train_loss": -6.371453285217285, "global_step": 100679, "epoch": 2397} {"train_loss": -6.325048446655273, "global_step": 100680, "epoch": 2397} {"train_loss": -6.359956741333008, "global_step": 100681, "epoch": 2397} {"train_loss": -6.377472877502441, "global_step": 100682, "epoch": 2397} {"train_loss": -6.495382308959961, "global_step": 100683, "epoch": 2397} {"train_loss": -6.335303783416748, "global_step": 100684, "epoch": 2397} {"train_loss": -6.296630859375, "global_step": 100685, "epoch": 2397} {"train_loss": -6.303597927093506, "global_step": 100686, "epoch": 2397} {"train_loss": -6.3222808837890625, "global_step": 100687, "epoch": 2397} {"train_loss": -6.406877517700195, "global_step": 100688, "epoch": 2397} {"train_loss": -6.368146896362305, "global_step": 100689, "epoch": 2397} {"train_loss": -6.306943893432617, "global_step": 100690, "epoch": 2397} {"train_loss": -6.443041801452637, "global_step": 100691, "epoch": 2397} {"train_loss": -6.386745452880859, "global_step": 100692, "epoch": 2397} {"train_loss": -6.339103698730469, "global_step": 100693, "epoch": 2397} {"train_loss": -6.358720779418945, "global_step": 100694, "epoch": 2397} {"train_loss": -6.470495700836182, "global_step": 100695, "epoch": 2397} {"train_loss": -6.410764694213867, "global_step": 100696, "epoch": 2397} {"train_loss": -6.32509183883667, "global_step": 100697, "epoch": 2397} {"train_loss": -6.406676292419434, "global_step": 100698, "epoch": 2397} {"train_loss": -6.2985148429870605, "global_step": 100699, "epoch": 2397} {"train_loss": -6.371766567230225, "global_step": 100700, "epoch": 2397} {"train_loss": -6.323920249938965, "global_step": 100701, "epoch": 2397} {"train_loss": -6.396629810333252, "global_step": 100702, "epoch": 2397} {"train_loss": -6.40960693359375, "global_step": 100703, "epoch": 2397} {"train_loss": -6.446515083312988, "global_step": 100704, "epoch": 2397} {"train_loss": -6.325285911560059, "global_step": 100705, "epoch": 2397} {"train_loss": -6.349548816680908, "global_step": 100706, "epoch": 2397} {"train_loss": -6.4820356369018555, "global_step": 100707, "epoch": 2397} {"train_loss": -6.374198913574219, "global_step": 100708, "epoch": 2397} {"train_loss": -6.340793132781982, "global_step": 100709, "epoch": 2397} {"train_loss": -6.297755718231201, "global_step": 100710, "epoch": 2397} {"train_loss": -6.482448577880859, "global_step": 100711, "epoch": 2397} {"train_loss": -6.326117515563965, "global_step": 100712, "epoch": 2397} {"train_loss": -6.413627624511719, "global_step": 100713, "epoch": 2397} {"train_loss": -6.368163108825684, "global_step": 100714, "epoch": 2397} {"train_loss": -6.3675817875635055, "global_step": 100715, "epoch": 2397, "val_loss": 75709.953125} {"train_loss": -6.309008598327637, "global_step": 100716, "epoch": 2398} {"train_loss": -6.362547874450684, "global_step": 100717, "epoch": 2398} {"train_loss": -6.380860805511475, "global_step": 100718, "epoch": 2398} {"train_loss": -6.363159656524658, "global_step": 100719, "epoch": 2398} {"train_loss": -6.279738903045654, "global_step": 100720, "epoch": 2398} {"train_loss": -6.401573181152344, "global_step": 100721, "epoch": 2398} {"train_loss": -6.2982683181762695, "global_step": 100722, "epoch": 2398} {"train_loss": -6.44058895111084, "global_step": 100723, "epoch": 2398} {"train_loss": -6.321541786193848, "global_step": 100724, "epoch": 2398} {"train_loss": -6.405824661254883, "global_step": 100725, "epoch": 2398} {"train_loss": -6.442744731903076, "global_step": 100726, "epoch": 2398} {"train_loss": -6.4392805099487305, "global_step": 100727, "epoch": 2398} {"train_loss": -6.396498203277588, "global_step": 100728, "epoch": 2398} {"train_loss": -6.398512363433838, "global_step": 100729, "epoch": 2398} {"train_loss": -6.346613883972168, "global_step": 100730, "epoch": 2398} {"train_loss": -6.347644329071045, "global_step": 100731, "epoch": 2398} {"train_loss": -6.309946060180664, "global_step": 100732, "epoch": 2398} {"train_loss": -6.410122394561768, "global_step": 100733, "epoch": 2398} {"train_loss": -6.44120454788208, "global_step": 100734, "epoch": 2398} {"train_loss": -6.369559288024902, "global_step": 100735, "epoch": 2398} {"train_loss": -6.226047515869141, "global_step": 100736, "epoch": 2398} {"train_loss": -6.409910202026367, "global_step": 100737, "epoch": 2398} {"train_loss": -6.44966983795166, "global_step": 100738, "epoch": 2398} {"train_loss": -6.485919952392578, "global_step": 100739, "epoch": 2398} {"train_loss": -6.429222106933594, "global_step": 100740, "epoch": 2398} {"train_loss": -6.432621002197266, "global_step": 100741, "epoch": 2398} {"train_loss": -6.453348636627197, "global_step": 100742, "epoch": 2398} {"train_loss": -6.495570182800293, "global_step": 100743, "epoch": 2398} {"train_loss": -6.451154708862305, "global_step": 100744, "epoch": 2398} {"train_loss": -6.390732288360596, "global_step": 100745, "epoch": 2398} {"train_loss": -6.329123497009277, "global_step": 100746, "epoch": 2398} {"train_loss": -6.361042499542236, "global_step": 100747, "epoch": 2398} {"train_loss": -6.465418815612793, "global_step": 100748, "epoch": 2398} {"train_loss": -6.378663063049316, "global_step": 100749, "epoch": 2398} {"train_loss": -6.420562744140625, "global_step": 100750, "epoch": 2398} {"train_loss": -6.302141189575195, "global_step": 100751, "epoch": 2398} {"train_loss": -6.457093238830566, "global_step": 100752, "epoch": 2398} {"train_loss": -6.26701021194458, "global_step": 100753, "epoch": 2398} {"train_loss": -6.437385559082031, "global_step": 100754, "epoch": 2398} {"train_loss": -6.419284343719482, "global_step": 100755, "epoch": 2398} {"train_loss": -6.39516544342041, "global_step": 100756, "epoch": 2398} {"train_loss": -6.39081004687718, "global_step": 100757, "epoch": 2398, "val_loss": 76314.609375} {"train_loss": -6.253115653991699, "global_step": 100758, "epoch": 2399} {"train_loss": -6.392036437988281, "global_step": 100759, "epoch": 2399} {"train_loss": -6.31217098236084, "global_step": 100760, "epoch": 2399} {"train_loss": -6.352203845977783, "global_step": 100761, "epoch": 2399} {"train_loss": -6.405670166015625, "global_step": 100762, "epoch": 2399} {"train_loss": -6.418776988983154, "global_step": 100763, "epoch": 2399} {"train_loss": -6.411784648895264, "global_step": 100764, "epoch": 2399} {"train_loss": -6.396328926086426, "global_step": 100765, "epoch": 2399} {"train_loss": -6.274998664855957, "global_step": 100766, "epoch": 2399} {"train_loss": -6.285611152648926, "global_step": 100767, "epoch": 2399} {"train_loss": -6.341422080993652, "global_step": 100768, "epoch": 2399} {"train_loss": -6.412507057189941, "global_step": 100769, "epoch": 2399} {"train_loss": -6.472059726715088, "global_step": 100770, "epoch": 2399} {"train_loss": -6.384934902191162, "global_step": 100771, "epoch": 2399} {"train_loss": -6.38213586807251, "global_step": 100772, "epoch": 2399} {"train_loss": -6.410429954528809, "global_step": 100773, "epoch": 2399} {"train_loss": -6.429795265197754, "global_step": 100774, "epoch": 2399} {"train_loss": -6.302519798278809, "global_step": 100775, "epoch": 2399} {"train_loss": -6.430955410003662, "global_step": 100776, "epoch": 2399} {"train_loss": -6.444173812866211, "global_step": 100777, "epoch": 2399} {"train_loss": -6.372129917144775, "global_step": 100778, "epoch": 2399} {"train_loss": -6.453673362731934, "global_step": 100779, "epoch": 2399} {"train_loss": -6.485762596130371, "global_step": 100780, "epoch": 2399} {"train_loss": -6.449270725250244, "global_step": 100781, "epoch": 2399} {"train_loss": -6.338747501373291, "global_step": 100782, "epoch": 2399} {"train_loss": -6.389535903930664, "global_step": 100783, "epoch": 2399} {"train_loss": -6.5201096534729, "global_step": 100784, "epoch": 2399} {"train_loss": -6.4539923667907715, "global_step": 100785, "epoch": 2399} {"train_loss": -6.392709732055664, "global_step": 100786, "epoch": 2399} {"train_loss": -6.503788471221924, "global_step": 100787, "epoch": 2399} {"train_loss": -6.414899826049805, "global_step": 100788, "epoch": 2399} {"train_loss": -6.337156772613525, "global_step": 100789, "epoch": 2399} {"train_loss": -6.536177635192871, "global_step": 100790, "epoch": 2399} {"train_loss": -6.345076560974121, "global_step": 100791, "epoch": 2399} {"train_loss": -6.318875312805176, "global_step": 100792, "epoch": 2399} {"train_loss": -6.466175079345703, "global_step": 100793, "epoch": 2399} {"train_loss": -6.4723124504089355, "global_step": 100794, "epoch": 2399} {"train_loss": -6.389368534088135, "global_step": 100795, "epoch": 2399} {"train_loss": -6.384576797485352, "global_step": 100796, "epoch": 2399} {"train_loss": -6.371539115905762, "global_step": 100797, "epoch": 2399} {"train_loss": -6.387699127197266, "global_step": 100798, "epoch": 2399} {"train_loss": -6.396738676797776, "global_step": 100799, "epoch": 2399, "val_loss": 75995.40625} {"train_loss": -6.4411187171936035, "global_step": 100800, "epoch": 2400} {"train_loss": -6.3380842208862305, "global_step": 100801, "epoch": 2400} {"train_loss": -6.362251281738281, "global_step": 100802, "epoch": 2400} {"train_loss": -6.32948112487793, "global_step": 100803, "epoch": 2400} {"train_loss": -6.275177955627441, "global_step": 100804, "epoch": 2400} {"train_loss": -6.324712753295898, "global_step": 100805, "epoch": 2400} {"train_loss": -6.425376892089844, "global_step": 100806, "epoch": 2400} {"train_loss": -6.433673858642578, "global_step": 100807, "epoch": 2400} {"train_loss": -6.4408650398254395, "global_step": 100808, "epoch": 2400} {"train_loss": -6.260139465332031, "global_step": 100809, "epoch": 2400} {"train_loss": -6.4748759269714355, "global_step": 100810, "epoch": 2400} {"train_loss": -6.448972702026367, "global_step": 100811, "epoch": 2400} {"train_loss": -6.330467224121094, "global_step": 100812, "epoch": 2400} {"train_loss": -6.410107135772705, "global_step": 100813, "epoch": 2400} {"train_loss": -6.435214996337891, "global_step": 100814, "epoch": 2400} {"train_loss": -6.290653228759766, "global_step": 100815, "epoch": 2400} {"train_loss": -6.4351959228515625, "global_step": 100816, "epoch": 2400} {"train_loss": -6.437605857849121, "global_step": 100817, "epoch": 2400} {"train_loss": -6.403606414794922, "global_step": 100818, "epoch": 2400} {"train_loss": -6.182007312774658, "global_step": 100819, "epoch": 2400} {"train_loss": -6.259230613708496, "global_step": 100820, "epoch": 2400} {"train_loss": -6.445992946624756, "global_step": 100821, "epoch": 2400} {"train_loss": -6.288898468017578, "global_step": 100822, "epoch": 2400} {"train_loss": -6.274134635925293, "global_step": 100823, "epoch": 2400} {"train_loss": -6.259817600250244, "global_step": 100824, "epoch": 2400} {"train_loss": -6.336277961730957, "global_step": 100825, "epoch": 2400} {"train_loss": -6.358077049255371, "global_step": 100826, "epoch": 2400} {"train_loss": -6.213153839111328, "global_step": 100827, "epoch": 2400} {"train_loss": -6.401529312133789, "global_step": 100828, "epoch": 2400} {"train_loss": -6.224819660186768, "global_step": 100829, "epoch": 2400} {"train_loss": -6.296730995178223, "global_step": 100830, "epoch": 2400} {"train_loss": -6.342535018920898, "global_step": 100831, "epoch": 2400} {"train_loss": -6.122105598449707, "global_step": 100832, "epoch": 2400} {"train_loss": -6.279511451721191, "global_step": 100833, "epoch": 2400} {"train_loss": -6.214123249053955, "global_step": 100834, "epoch": 2400} {"train_loss": -6.315969467163086, "global_step": 100835, "epoch": 2400} {"train_loss": -6.375522136688232, "global_step": 100836, "epoch": 2400} {"train_loss": -6.3116865158081055, "global_step": 100837, "epoch": 2400} {"train_loss": -6.341195106506348, "global_step": 100838, "epoch": 2400} {"train_loss": -6.227818489074707, "global_step": 100839, "epoch": 2400} {"train_loss": -6.313464164733887, "global_step": 100840, "epoch": 2400} {"train_loss": -6.332882733572097, "global_step": 100841, "epoch": 2400, "train/sim_max_reward_0": 0.8567772146980321, "train/sim_max_reward_1": 0.9480096500499817, "train/sim_max_reward_2": 0.3508196792656024, "train/sim_max_reward_3": 0.1326273805930576, "train/sim_max_reward_4": 0.7867749179457992, "train/sim_max_reward_5": 0.667085023323501, "test/sim_max_reward_4500000": 0.7796426340054784, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.6356912511544358, "test/sim_max_reward_4500003": 0.9419777173725079, "test/sim_max_reward_4500004": 0.9694549705052773, "test/sim_max_reward_4500005": 0.8123521460765512, "test/sim_max_reward_4500006": 0.8281921207012847, "test/sim_max_reward_4500007": 0.9416369113801094, "test/sim_max_reward_4500008": 0.7904147901582423, "test/sim_max_reward_4500009": 0.05348984679222091, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.5561906000968223, "test/sim_max_reward_4500012": 0.8087135253061147, "test/sim_max_reward_4500013": 0.0137639185693848, "test/sim_max_reward_4500014": 0.9681680412394272, "test/sim_max_reward_4500015": 0.9138833369162308, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.022302272164844938, "test/sim_max_reward_4500018": 0.9472432963688011, "test/sim_max_reward_4500019": 0.9776926117213152, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.5724257833312809, "test/sim_max_reward_4500022": 0.8530554871962912, "test/sim_max_reward_4500023": 0.8786443269773222, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.5367087843990339, "test/sim_max_reward_4500026": 0.9566215931071905, "test/sim_max_reward_4500027": 0.9908760844943977, "test/sim_max_reward_4500028": 0.2003482548186933, "test/sim_max_reward_4500029": 0.06855365199492193, "test/sim_max_reward_4500030": 0.9336811089818787, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.8540411386814518, "test/sim_max_reward_4500034": 0.05147534633315734, "test/sim_max_reward_4500035": 0.8429586384399065, "test/sim_max_reward_4500036": 0.3803493124194906, "test/sim_max_reward_4500037": 0.8111165198515342, "test/sim_max_reward_4500038": 0.31900544659028973, "test/sim_max_reward_4500039": 0.9293992858719917, "test/sim_max_reward_4500040": 0.9687546715614436, "test/sim_max_reward_4500041": 0.8879021303767719, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.23517588317159593, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.3467979064911359, "test/sim_max_reward_4500046": 0.9338705644277114, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.8922679910398792, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.623682310979329, "test/mean_score": 0.5298266639761852, "val_loss": 75665.4375} {"train_loss": -6.34575080871582, "global_step": 100842, "epoch": 2401} {"train_loss": -6.35226583480835, "global_step": 100843, "epoch": 2401} {"train_loss": -6.427018165588379, "global_step": 100844, "epoch": 2401} {"train_loss": -6.35975456237793, "global_step": 100845, "epoch": 2401} {"train_loss": -6.378742218017578, "global_step": 100846, "epoch": 2401} {"train_loss": -6.432114601135254, "global_step": 100847, "epoch": 2401} {"train_loss": -6.584826469421387, "global_step": 100848, "epoch": 2401} {"train_loss": -6.385340690612793, "global_step": 100849, "epoch": 2401} {"train_loss": -6.288629531860352, "global_step": 100850, "epoch": 2401} {"train_loss": -6.395696640014648, "global_step": 100851, "epoch": 2401} {"train_loss": -6.355988502502441, "global_step": 100852, "epoch": 2401} {"train_loss": -6.432289123535156, "global_step": 100853, "epoch": 2401} {"train_loss": -6.433200359344482, "global_step": 100854, "epoch": 2401} {"train_loss": -6.324064254760742, "global_step": 100855, "epoch": 2401} {"train_loss": -6.3786821365356445, "global_step": 100856, "epoch": 2401} {"train_loss": -6.46084451675415, "global_step": 100857, "epoch": 2401} {"train_loss": -6.401352882385254, "global_step": 100858, "epoch": 2401} {"train_loss": -6.376652717590332, "global_step": 100859, "epoch": 2401} {"train_loss": -6.331348419189453, "global_step": 100860, "epoch": 2401} {"train_loss": -6.301315784454346, "global_step": 100861, "epoch": 2401} {"train_loss": -6.225089073181152, "global_step": 100862, "epoch": 2401} {"train_loss": -6.330724716186523, "global_step": 100863, "epoch": 2401} {"train_loss": -6.339457988739014, "global_step": 100864, "epoch": 2401} {"train_loss": -6.261211395263672, "global_step": 100865, "epoch": 2401} {"train_loss": -6.388002395629883, "global_step": 100866, "epoch": 2401} {"train_loss": -6.356725215911865, "global_step": 100867, "epoch": 2401} {"train_loss": -6.246983528137207, "global_step": 100868, "epoch": 2401} {"train_loss": -6.181975841522217, "global_step": 100869, "epoch": 2401} {"train_loss": -6.312465667724609, "global_step": 100870, "epoch": 2401} {"train_loss": -6.320890426635742, "global_step": 100871, "epoch": 2401} {"train_loss": -6.381282806396484, "global_step": 100872, "epoch": 2401} {"train_loss": -6.3735809326171875, "global_step": 100873, "epoch": 2401} {"train_loss": -6.407425880432129, "global_step": 100874, "epoch": 2401} {"train_loss": -6.284181594848633, "global_step": 100875, "epoch": 2401} {"train_loss": -6.2900543212890625, "global_step": 100876, "epoch": 2401} {"train_loss": -6.376206398010254, "global_step": 100877, "epoch": 2401} {"train_loss": -6.323383331298828, "global_step": 100878, "epoch": 2401} {"train_loss": -6.27780818939209, "global_step": 100879, "epoch": 2401} {"train_loss": -6.2028656005859375, "global_step": 100880, "epoch": 2401} {"train_loss": -6.396745681762695, "global_step": 100881, "epoch": 2401} {"train_loss": -6.402889251708984, "global_step": 100882, "epoch": 2401} {"train_loss": -6.351647422427223, "global_step": 100883, "epoch": 2401, "val_loss": 75622.078125} {"train_loss": -6.310375213623047, "global_step": 100884, "epoch": 2402} {"train_loss": -6.328211784362793, "global_step": 100885, "epoch": 2402} {"train_loss": -6.406999111175537, "global_step": 100886, "epoch": 2402} {"train_loss": -6.435420513153076, "global_step": 100887, "epoch": 2402} {"train_loss": -6.3161516189575195, "global_step": 100888, "epoch": 2402} {"train_loss": -6.458384990692139, "global_step": 100889, "epoch": 2402} {"train_loss": -6.309658050537109, "global_step": 100890, "epoch": 2402} {"train_loss": -6.28727912902832, "global_step": 100891, "epoch": 2402} {"train_loss": -6.428747177124023, "global_step": 100892, "epoch": 2402} {"train_loss": -6.288993835449219, "global_step": 100893, "epoch": 2402} {"train_loss": -6.304112434387207, "global_step": 100894, "epoch": 2402} {"train_loss": -6.395810127258301, "global_step": 100895, "epoch": 2402} {"train_loss": -6.263097763061523, "global_step": 100896, "epoch": 2402} {"train_loss": -6.364026069641113, "global_step": 100897, "epoch": 2402} {"train_loss": -6.192753791809082, "global_step": 100898, "epoch": 2402} {"train_loss": -6.218856334686279, "global_step": 100899, "epoch": 2402} {"train_loss": -6.385158061981201, "global_step": 100900, "epoch": 2402} {"train_loss": -6.254171371459961, "global_step": 100901, "epoch": 2402} {"train_loss": -6.201257705688477, "global_step": 100902, "epoch": 2402} {"train_loss": -6.357594013214111, "global_step": 100903, "epoch": 2402} {"train_loss": -6.291017532348633, "global_step": 100904, "epoch": 2402} {"train_loss": -6.31092643737793, "global_step": 100905, "epoch": 2402} {"train_loss": -6.378376483917236, "global_step": 100906, "epoch": 2402} {"train_loss": -6.377537727355957, "global_step": 100907, "epoch": 2402} {"train_loss": -6.234619140625, "global_step": 100908, "epoch": 2402} {"train_loss": -6.298081398010254, "global_step": 100909, "epoch": 2402} {"train_loss": -6.239973068237305, "global_step": 100910, "epoch": 2402} {"train_loss": -6.366366386413574, "global_step": 100911, "epoch": 2402} {"train_loss": -6.393138408660889, "global_step": 100912, "epoch": 2402} {"train_loss": -6.4050984382629395, "global_step": 100913, "epoch": 2402} {"train_loss": -6.332332611083984, "global_step": 100914, "epoch": 2402} {"train_loss": -6.458250045776367, "global_step": 100915, "epoch": 2402} {"train_loss": -6.365519046783447, "global_step": 100916, "epoch": 2402} {"train_loss": -6.3218770027160645, "global_step": 100917, "epoch": 2402} {"train_loss": -6.323691368103027, "global_step": 100918, "epoch": 2402} {"train_loss": -6.360993385314941, "global_step": 100919, "epoch": 2402} {"train_loss": -6.305844306945801, "global_step": 100920, "epoch": 2402} {"train_loss": -6.33311653137207, "global_step": 100921, "epoch": 2402} {"train_loss": -6.389830589294434, "global_step": 100922, "epoch": 2402} {"train_loss": -6.341399192810059, "global_step": 100923, "epoch": 2402} {"train_loss": -6.316882610321045, "global_step": 100924, "epoch": 2402} {"train_loss": -6.333749351047334, "global_step": 100925, "epoch": 2402, "val_loss": 75903.3515625} {"train_loss": -6.285828590393066, "global_step": 100926, "epoch": 2403} {"train_loss": -6.349639892578125, "global_step": 100927, "epoch": 2403} {"train_loss": -6.414846420288086, "global_step": 100928, "epoch": 2403} {"train_loss": -6.353756904602051, "global_step": 100929, "epoch": 2403} {"train_loss": -6.448101997375488, "global_step": 100930, "epoch": 2403} {"train_loss": -6.424333572387695, "global_step": 100931, "epoch": 2403} {"train_loss": -6.37150764465332, "global_step": 100932, "epoch": 2403} {"train_loss": -6.267620086669922, "global_step": 100933, "epoch": 2403} {"train_loss": -6.3508124351501465, "global_step": 100934, "epoch": 2403} {"train_loss": -6.375743389129639, "global_step": 100935, "epoch": 2403} {"train_loss": -6.363244533538818, "global_step": 100936, "epoch": 2403} {"train_loss": -6.3843889236450195, "global_step": 100937, "epoch": 2403} {"train_loss": -6.150245666503906, "global_step": 100938, "epoch": 2403} {"train_loss": -6.328083038330078, "global_step": 100939, "epoch": 2403} {"train_loss": -6.2029290199279785, "global_step": 100940, "epoch": 2403} {"train_loss": -6.252303123474121, "global_step": 100941, "epoch": 2403} {"train_loss": -6.196377277374268, "global_step": 100942, "epoch": 2403} {"train_loss": -6.26690673828125, "global_step": 100943, "epoch": 2403} {"train_loss": -6.348328590393066, "global_step": 100944, "epoch": 2403} {"train_loss": -6.2340569496154785, "global_step": 100945, "epoch": 2403} {"train_loss": -6.403022766113281, "global_step": 100946, "epoch": 2403} {"train_loss": -6.177100658416748, "global_step": 100947, "epoch": 2403} {"train_loss": -6.2905731201171875, "global_step": 100948, "epoch": 2403} {"train_loss": -6.261484146118164, "global_step": 100949, "epoch": 2403} {"train_loss": -6.278861999511719, "global_step": 100950, "epoch": 2403} {"train_loss": -6.301327705383301, "global_step": 100951, "epoch": 2403} {"train_loss": -6.161677360534668, "global_step": 100952, "epoch": 2403} {"train_loss": -6.377819061279297, "global_step": 100953, "epoch": 2403} {"train_loss": -6.47526741027832, "global_step": 100954, "epoch": 2403} {"train_loss": -6.323249816894531, "global_step": 100955, "epoch": 2403} {"train_loss": -6.29074239730835, "global_step": 100956, "epoch": 2403} {"train_loss": -6.445289611816406, "global_step": 100957, "epoch": 2403} {"train_loss": -6.326521396636963, "global_step": 100958, "epoch": 2403} {"train_loss": -6.336133003234863, "global_step": 100959, "epoch": 2403} {"train_loss": -6.377917289733887, "global_step": 100960, "epoch": 2403} {"train_loss": -6.319465637207031, "global_step": 100961, "epoch": 2403} {"train_loss": -6.345606803894043, "global_step": 100962, "epoch": 2403} {"train_loss": -6.2737250328063965, "global_step": 100963, "epoch": 2403} {"train_loss": -6.322595119476318, "global_step": 100964, "epoch": 2403} {"train_loss": -6.354656219482422, "global_step": 100965, "epoch": 2403} {"train_loss": -6.399779319763184, "global_step": 100966, "epoch": 2403} {"train_loss": -6.321171124776204, "global_step": 100967, "epoch": 2403, "val_loss": 75736.3984375} {"train_loss": -6.413646697998047, "global_step": 100968, "epoch": 2404} {"train_loss": -6.30471134185791, "global_step": 100969, "epoch": 2404} {"train_loss": -6.431488037109375, "global_step": 100970, "epoch": 2404} {"train_loss": -6.413263320922852, "global_step": 100971, "epoch": 2404} {"train_loss": -6.389451026916504, "global_step": 100972, "epoch": 2404} {"train_loss": -6.4413557052612305, "global_step": 100973, "epoch": 2404} {"train_loss": -6.290229797363281, "global_step": 100974, "epoch": 2404} {"train_loss": -6.385354042053223, "global_step": 100975, "epoch": 2404} {"train_loss": -6.376711368560791, "global_step": 100976, "epoch": 2404} {"train_loss": -6.289368629455566, "global_step": 100977, "epoch": 2404} {"train_loss": -6.395354270935059, "global_step": 100978, "epoch": 2404} {"train_loss": -6.333459854125977, "global_step": 100979, "epoch": 2404} {"train_loss": -6.485095977783203, "global_step": 100980, "epoch": 2404} {"train_loss": -6.356888294219971, "global_step": 100981, "epoch": 2404} {"train_loss": -6.429508209228516, "global_step": 100982, "epoch": 2404} {"train_loss": -6.345873832702637, "global_step": 100983, "epoch": 2404} {"train_loss": -6.394916534423828, "global_step": 100984, "epoch": 2404} {"train_loss": -6.394407272338867, "global_step": 100985, "epoch": 2404} {"train_loss": -6.413212776184082, "global_step": 100986, "epoch": 2404} {"train_loss": -6.3995585441589355, "global_step": 100987, "epoch": 2404} {"train_loss": -6.407846927642822, "global_step": 100988, "epoch": 2404} {"train_loss": -6.330766677856445, "global_step": 100989, "epoch": 2404} {"train_loss": -6.356271266937256, "global_step": 100990, "epoch": 2404} {"train_loss": -6.383852005004883, "global_step": 100991, "epoch": 2404} {"train_loss": -6.459232807159424, "global_step": 100992, "epoch": 2404} {"train_loss": -6.470132827758789, "global_step": 100993, "epoch": 2404} {"train_loss": -6.364160537719727, "global_step": 100994, "epoch": 2404} {"train_loss": -6.478145599365234, "global_step": 100995, "epoch": 2404} {"train_loss": -6.4806952476501465, "global_step": 100996, "epoch": 2404} {"train_loss": -6.602914810180664, "global_step": 100997, "epoch": 2404} {"train_loss": -6.387096405029297, "global_step": 100998, "epoch": 2404} {"train_loss": -6.376101493835449, "global_step": 100999, "epoch": 2404} {"train_loss": -6.348519325256348, "global_step": 101000, "epoch": 2404} {"train_loss": -6.339041233062744, "global_step": 101001, "epoch": 2404} {"train_loss": -6.460328102111816, "global_step": 101002, "epoch": 2404} {"train_loss": -6.313640594482422, "global_step": 101003, "epoch": 2404} {"train_loss": -6.33762264251709, "global_step": 101004, "epoch": 2404} {"train_loss": -6.410421371459961, "global_step": 101005, "epoch": 2404} {"train_loss": -6.297513961791992, "global_step": 101006, "epoch": 2404} {"train_loss": -6.254751205444336, "global_step": 101007, "epoch": 2404} {"train_loss": -6.316370010375977, "global_step": 101008, "epoch": 2404} {"train_loss": -6.384897197995867, "global_step": 101009, "epoch": 2404, "val_loss": 75779.8671875} {"train_loss": -6.292279243469238, "global_step": 101010, "epoch": 2405} {"train_loss": -6.189024925231934, "global_step": 101011, "epoch": 2405} {"train_loss": -6.3755083084106445, "global_step": 101012, "epoch": 2405} {"train_loss": -6.413837432861328, "global_step": 101013, "epoch": 2405} {"train_loss": -6.249278545379639, "global_step": 101014, "epoch": 2405} {"train_loss": -6.313652038574219, "global_step": 101015, "epoch": 2405} {"train_loss": -6.267858982086182, "global_step": 101016, "epoch": 2405} {"train_loss": -6.32761287689209, "global_step": 101017, "epoch": 2405} {"train_loss": -6.414453506469727, "global_step": 101018, "epoch": 2405} {"train_loss": -6.453338623046875, "global_step": 101019, "epoch": 2405} {"train_loss": -6.2899885177612305, "global_step": 101020, "epoch": 2405} {"train_loss": -6.497809410095215, "global_step": 101021, "epoch": 2405} {"train_loss": -6.347658157348633, "global_step": 101022, "epoch": 2405} {"train_loss": -6.40390157699585, "global_step": 101023, "epoch": 2405} {"train_loss": -6.429211616516113, "global_step": 101024, "epoch": 2405} {"train_loss": -6.3191399574279785, "global_step": 101025, "epoch": 2405} {"train_loss": -6.2747344970703125, "global_step": 101026, "epoch": 2405} {"train_loss": -6.385013580322266, "global_step": 101027, "epoch": 2405} {"train_loss": -6.308990955352783, "global_step": 101028, "epoch": 2405} {"train_loss": -6.348346710205078, "global_step": 101029, "epoch": 2405} {"train_loss": -6.345200538635254, "global_step": 101030, "epoch": 2405} {"train_loss": -6.324746131896973, "global_step": 101031, "epoch": 2405} {"train_loss": -6.382267951965332, "global_step": 101032, "epoch": 2405} {"train_loss": -6.331720352172852, "global_step": 101033, "epoch": 2405} {"train_loss": -6.303648948669434, "global_step": 101034, "epoch": 2405} {"train_loss": -6.448816299438477, "global_step": 101035, "epoch": 2405} {"train_loss": -6.332963466644287, "global_step": 101036, "epoch": 2405} {"train_loss": -6.306879997253418, "global_step": 101037, "epoch": 2405} {"train_loss": -6.403624057769775, "global_step": 101038, "epoch": 2405} {"train_loss": -6.3502092361450195, "global_step": 101039, "epoch": 2405} {"train_loss": -6.3830366134643555, "global_step": 101040, "epoch": 2405} {"train_loss": -6.247788906097412, "global_step": 101041, "epoch": 2405} {"train_loss": -6.288127899169922, "global_step": 101042, "epoch": 2405} {"train_loss": -6.461542129516602, "global_step": 101043, "epoch": 2405} {"train_loss": -6.434576988220215, "global_step": 101044, "epoch": 2405} {"train_loss": -6.303827285766602, "global_step": 101045, "epoch": 2405} {"train_loss": -6.392634391784668, "global_step": 101046, "epoch": 2405} {"train_loss": -6.38441801071167, "global_step": 101047, "epoch": 2405} {"train_loss": -6.457893371582031, "global_step": 101048, "epoch": 2405} {"train_loss": -6.357165336608887, "global_step": 101049, "epoch": 2405} {"train_loss": -6.406041145324707, "global_step": 101050, "epoch": 2405} {"train_loss": -6.354757467905681, "global_step": 101051, "epoch": 2405, "val_loss": 75711.265625} {"train_loss": -6.429422855377197, "global_step": 101052, "epoch": 2406} {"train_loss": -6.470891952514648, "global_step": 101053, "epoch": 2406} {"train_loss": -6.387920379638672, "global_step": 101054, "epoch": 2406} {"train_loss": -6.268131256103516, "global_step": 101055, "epoch": 2406} {"train_loss": -6.428842067718506, "global_step": 101056, "epoch": 2406} {"train_loss": -6.370096206665039, "global_step": 101057, "epoch": 2406} {"train_loss": -6.367926597595215, "global_step": 101058, "epoch": 2406} {"train_loss": -6.409475326538086, "global_step": 101059, "epoch": 2406} {"train_loss": -6.463066101074219, "global_step": 101060, "epoch": 2406} {"train_loss": -6.2997660636901855, "global_step": 101061, "epoch": 2406} {"train_loss": -6.384396553039551, "global_step": 101062, "epoch": 2406} {"train_loss": -6.409197807312012, "global_step": 101063, "epoch": 2406} {"train_loss": -6.334937572479248, "global_step": 101064, "epoch": 2406} {"train_loss": -6.3924360275268555, "global_step": 101065, "epoch": 2406} {"train_loss": -6.345608711242676, "global_step": 101066, "epoch": 2406} {"train_loss": -6.449683666229248, "global_step": 101067, "epoch": 2406} {"train_loss": -6.424446105957031, "global_step": 101068, "epoch": 2406} {"train_loss": -6.414333343505859, "global_step": 101069, "epoch": 2406} {"train_loss": -6.393495082855225, "global_step": 101070, "epoch": 2406} {"train_loss": -6.253399848937988, "global_step": 101071, "epoch": 2406} {"train_loss": -6.314269065856934, "global_step": 101072, "epoch": 2406} {"train_loss": -6.33444881439209, "global_step": 101073, "epoch": 2406} {"train_loss": -6.424158096313477, "global_step": 101074, "epoch": 2406} {"train_loss": -6.413470268249512, "global_step": 101075, "epoch": 2406} {"train_loss": -6.445216178894043, "global_step": 101076, "epoch": 2406} {"train_loss": -6.336543560028076, "global_step": 101077, "epoch": 2406} {"train_loss": -6.393039703369141, "global_step": 101078, "epoch": 2406} {"train_loss": -6.298186302185059, "global_step": 101079, "epoch": 2406} {"train_loss": -6.379279136657715, "global_step": 101080, "epoch": 2406} {"train_loss": -6.390482425689697, "global_step": 101081, "epoch": 2406} {"train_loss": -6.308966636657715, "global_step": 101082, "epoch": 2406} {"train_loss": -6.400969505310059, "global_step": 101083, "epoch": 2406} {"train_loss": -6.293374061584473, "global_step": 101084, "epoch": 2406} {"train_loss": -6.292044639587402, "global_step": 101085, "epoch": 2406} {"train_loss": -6.360716819763184, "global_step": 101086, "epoch": 2406} {"train_loss": -6.3822407722473145, "global_step": 101087, "epoch": 2406} {"train_loss": -6.3966827392578125, "global_step": 101088, "epoch": 2406} {"train_loss": -6.363550186157227, "global_step": 101089, "epoch": 2406} {"train_loss": -6.394625663757324, "global_step": 101090, "epoch": 2406} {"train_loss": -6.3949198722839355, "global_step": 101091, "epoch": 2406} {"train_loss": -6.3957319259643555, "global_step": 101092, "epoch": 2406} {"train_loss": -6.378130799248105, "global_step": 101093, "epoch": 2406, "val_loss": 75405.8203125} {"train_loss": -6.379706382751465, "global_step": 101094, "epoch": 2407} {"train_loss": -6.431222438812256, "global_step": 101095, "epoch": 2407} {"train_loss": -6.356329917907715, "global_step": 101096, "epoch": 2407} {"train_loss": -6.3756422996521, "global_step": 101097, "epoch": 2407} {"train_loss": -6.458718299865723, "global_step": 101098, "epoch": 2407} {"train_loss": -6.470691680908203, "global_step": 101099, "epoch": 2407} {"train_loss": -6.355223655700684, "global_step": 101100, "epoch": 2407} {"train_loss": -6.337762832641602, "global_step": 101101, "epoch": 2407} {"train_loss": -6.360472679138184, "global_step": 101102, "epoch": 2407} {"train_loss": -6.1989665031433105, "global_step": 101103, "epoch": 2407} {"train_loss": -6.357021331787109, "global_step": 101104, "epoch": 2407} {"train_loss": -6.281526565551758, "global_step": 101105, "epoch": 2407} {"train_loss": -6.309101104736328, "global_step": 101106, "epoch": 2407} {"train_loss": -6.36773157119751, "global_step": 101107, "epoch": 2407} {"train_loss": -6.389429092407227, "global_step": 101108, "epoch": 2407} {"train_loss": -6.4700422286987305, "global_step": 101109, "epoch": 2407} {"train_loss": -6.40760612487793, "global_step": 101110, "epoch": 2407} {"train_loss": -6.401554584503174, "global_step": 101111, "epoch": 2407} {"train_loss": -6.49626350402832, "global_step": 101112, "epoch": 2407} {"train_loss": -6.266570091247559, "global_step": 101113, "epoch": 2407} {"train_loss": -6.383880138397217, "global_step": 101114, "epoch": 2407} {"train_loss": -6.349778175354004, "global_step": 101115, "epoch": 2407} {"train_loss": -6.3570098876953125, "global_step": 101116, "epoch": 2407} {"train_loss": -6.363482475280762, "global_step": 101117, "epoch": 2407} {"train_loss": -6.519567012786865, "global_step": 101118, "epoch": 2407} {"train_loss": -6.376762866973877, "global_step": 101119, "epoch": 2407} {"train_loss": -6.446430683135986, "global_step": 101120, "epoch": 2407} {"train_loss": -6.465513229370117, "global_step": 101121, "epoch": 2407} {"train_loss": -6.346190452575684, "global_step": 101122, "epoch": 2407} {"train_loss": -6.48757266998291, "global_step": 101123, "epoch": 2407} {"train_loss": -6.408679962158203, "global_step": 101124, "epoch": 2407} {"train_loss": -6.3655290603637695, "global_step": 101125, "epoch": 2407} {"train_loss": -6.2916436195373535, "global_step": 101126, "epoch": 2407} {"train_loss": -6.407680511474609, "global_step": 101127, "epoch": 2407} {"train_loss": -6.403415203094482, "global_step": 101128, "epoch": 2407} {"train_loss": -6.275822639465332, "global_step": 101129, "epoch": 2407} {"train_loss": -6.255624294281006, "global_step": 101130, "epoch": 2407} {"train_loss": -6.419581413269043, "global_step": 101131, "epoch": 2407} {"train_loss": -6.353536128997803, "global_step": 101132, "epoch": 2407} {"train_loss": -6.342398643493652, "global_step": 101133, "epoch": 2407} {"train_loss": -6.513847351074219, "global_step": 101134, "epoch": 2407} {"train_loss": -6.378056855428786, "global_step": 101135, "epoch": 2407, "val_loss": 76308.1015625} {"train_loss": -6.395151138305664, "global_step": 101136, "epoch": 2408} {"train_loss": -6.44428014755249, "global_step": 101137, "epoch": 2408} {"train_loss": -6.349031448364258, "global_step": 101138, "epoch": 2408} {"train_loss": -6.365959167480469, "global_step": 101139, "epoch": 2408} {"train_loss": -6.341628074645996, "global_step": 101140, "epoch": 2408} {"train_loss": -6.434346675872803, "global_step": 101141, "epoch": 2408} {"train_loss": -6.543856620788574, "global_step": 101142, "epoch": 2408} {"train_loss": -6.278919219970703, "global_step": 101143, "epoch": 2408} {"train_loss": -6.423076152801514, "global_step": 101144, "epoch": 2408} {"train_loss": -6.309666633605957, "global_step": 101145, "epoch": 2408} {"train_loss": -6.371027946472168, "global_step": 101146, "epoch": 2408} {"train_loss": -6.564207077026367, "global_step": 101147, "epoch": 2408} {"train_loss": -6.363048553466797, "global_step": 101148, "epoch": 2408} {"train_loss": -6.187277793884277, "global_step": 101149, "epoch": 2408} {"train_loss": -6.279744625091553, "global_step": 101150, "epoch": 2408} {"train_loss": -6.398293495178223, "global_step": 101151, "epoch": 2408} {"train_loss": -6.359953880310059, "global_step": 101152, "epoch": 2408} {"train_loss": -6.404969215393066, "global_step": 101153, "epoch": 2408} {"train_loss": -6.319916248321533, "global_step": 101154, "epoch": 2408} {"train_loss": -6.291913032531738, "global_step": 101155, "epoch": 2408} {"train_loss": -6.386662483215332, "global_step": 101156, "epoch": 2408} {"train_loss": -6.384305953979492, "global_step": 101157, "epoch": 2408} {"train_loss": -6.443352699279785, "global_step": 101158, "epoch": 2408} {"train_loss": -6.475467681884766, "global_step": 101159, "epoch": 2408} {"train_loss": -6.412387847900391, "global_step": 101160, "epoch": 2408} {"train_loss": -6.254790306091309, "global_step": 101161, "epoch": 2408} {"train_loss": -6.444558143615723, "global_step": 101162, "epoch": 2408} {"train_loss": -6.315646648406982, "global_step": 101163, "epoch": 2408} {"train_loss": -6.335256576538086, "global_step": 101164, "epoch": 2408} {"train_loss": -6.3011393547058105, "global_step": 101165, "epoch": 2408} {"train_loss": -6.385385513305664, "global_step": 101166, "epoch": 2408} {"train_loss": -6.425717830657959, "global_step": 101167, "epoch": 2408} {"train_loss": -6.346406936645508, "global_step": 101168, "epoch": 2408} {"train_loss": -6.424939155578613, "global_step": 101169, "epoch": 2408} {"train_loss": -6.339046001434326, "global_step": 101170, "epoch": 2408} {"train_loss": -6.3851141929626465, "global_step": 101171, "epoch": 2408} {"train_loss": -6.314572334289551, "global_step": 101172, "epoch": 2408} {"train_loss": -6.342121124267578, "global_step": 101173, "epoch": 2408} {"train_loss": -6.4069623947143555, "global_step": 101174, "epoch": 2408} {"train_loss": -6.259484767913818, "global_step": 101175, "epoch": 2408} {"train_loss": -6.238293647766113, "global_step": 101176, "epoch": 2408} {"train_loss": -6.367801257542202, "global_step": 101177, "epoch": 2408, "val_loss": 75726.1875} {"train_loss": -6.272829532623291, "global_step": 101178, "epoch": 2409} {"train_loss": -6.327465057373047, "global_step": 101179, "epoch": 2409} {"train_loss": -6.431484699249268, "global_step": 101180, "epoch": 2409} {"train_loss": -6.137598037719727, "global_step": 101181, "epoch": 2409} {"train_loss": -6.333121299743652, "global_step": 101182, "epoch": 2409} {"train_loss": -6.158474922180176, "global_step": 101183, "epoch": 2409} {"train_loss": -6.255170822143555, "global_step": 101184, "epoch": 2409} {"train_loss": -6.3920512199401855, "global_step": 101185, "epoch": 2409} {"train_loss": -6.305007457733154, "global_step": 101186, "epoch": 2409} {"train_loss": -6.3263959884643555, "global_step": 101187, "epoch": 2409} {"train_loss": -6.347836494445801, "global_step": 101188, "epoch": 2409} {"train_loss": -6.271444320678711, "global_step": 101189, "epoch": 2409} {"train_loss": -6.309018611907959, "global_step": 101190, "epoch": 2409} {"train_loss": -6.27766227722168, "global_step": 101191, "epoch": 2409} {"train_loss": -6.341156005859375, "global_step": 101192, "epoch": 2409} {"train_loss": -6.362934112548828, "global_step": 101193, "epoch": 2409} {"train_loss": -6.296894073486328, "global_step": 101194, "epoch": 2409} {"train_loss": -6.27545166015625, "global_step": 101195, "epoch": 2409} {"train_loss": -6.424541473388672, "global_step": 101196, "epoch": 2409} {"train_loss": -6.5017547607421875, "global_step": 101197, "epoch": 2409} {"train_loss": -6.452785491943359, "global_step": 101198, "epoch": 2409} {"train_loss": -6.199066162109375, "global_step": 101199, "epoch": 2409} {"train_loss": -6.3315653800964355, "global_step": 101200, "epoch": 2409} {"train_loss": -6.368525505065918, "global_step": 101201, "epoch": 2409} {"train_loss": -6.307296276092529, "global_step": 101202, "epoch": 2409} {"train_loss": -6.218541622161865, "global_step": 101203, "epoch": 2409} {"train_loss": -6.425565242767334, "global_step": 101204, "epoch": 2409} {"train_loss": -6.2494096755981445, "global_step": 101205, "epoch": 2409} {"train_loss": -6.313007354736328, "global_step": 101206, "epoch": 2409} {"train_loss": -6.450479030609131, "global_step": 101207, "epoch": 2409} {"train_loss": -6.425086498260498, "global_step": 101208, "epoch": 2409} {"train_loss": -6.357005596160889, "global_step": 101209, "epoch": 2409} {"train_loss": -6.267167091369629, "global_step": 101210, "epoch": 2409} {"train_loss": -6.319137096405029, "global_step": 101211, "epoch": 2409} {"train_loss": -6.289114952087402, "global_step": 101212, "epoch": 2409} {"train_loss": -6.326624870300293, "global_step": 101213, "epoch": 2409} {"train_loss": -6.346897602081299, "global_step": 101214, "epoch": 2409} {"train_loss": -6.346715927124023, "global_step": 101215, "epoch": 2409} {"train_loss": -6.435675621032715, "global_step": 101216, "epoch": 2409} {"train_loss": -6.336582183837891, "global_step": 101217, "epoch": 2409} {"train_loss": -6.2985053062438965, "global_step": 101218, "epoch": 2409} {"train_loss": -6.327285709835234, "global_step": 101219, "epoch": 2409, "val_loss": 75982.421875} {"train_loss": -6.317354679107666, "global_step": 101220, "epoch": 2410} {"train_loss": -6.397909164428711, "global_step": 101221, "epoch": 2410} {"train_loss": -6.3967719078063965, "global_step": 101222, "epoch": 2410} {"train_loss": -6.438440799713135, "global_step": 101223, "epoch": 2410} {"train_loss": -6.442144393920898, "global_step": 101224, "epoch": 2410} {"train_loss": -6.311095714569092, "global_step": 101225, "epoch": 2410} {"train_loss": -6.448053359985352, "global_step": 101226, "epoch": 2410} {"train_loss": -6.415740966796875, "global_step": 101227, "epoch": 2410} {"train_loss": -6.442697525024414, "global_step": 101228, "epoch": 2410} {"train_loss": -6.342712879180908, "global_step": 101229, "epoch": 2410} {"train_loss": -6.458346366882324, "global_step": 101230, "epoch": 2410} {"train_loss": -6.3588032722473145, "global_step": 101231, "epoch": 2410} {"train_loss": -6.491130828857422, "global_step": 101232, "epoch": 2410} {"train_loss": -6.345579147338867, "global_step": 101233, "epoch": 2410} {"train_loss": -6.395077705383301, "global_step": 101234, "epoch": 2410} {"train_loss": -6.4272260665893555, "global_step": 101235, "epoch": 2410} {"train_loss": -6.425631523132324, "global_step": 101236, "epoch": 2410} {"train_loss": -6.384125232696533, "global_step": 101237, "epoch": 2410} {"train_loss": -6.389534950256348, "global_step": 101238, "epoch": 2410} {"train_loss": -6.353059768676758, "global_step": 101239, "epoch": 2410} {"train_loss": -6.367963790893555, "global_step": 101240, "epoch": 2410} {"train_loss": -6.4630818367004395, "global_step": 101241, "epoch": 2410} {"train_loss": -6.4540815353393555, "global_step": 101242, "epoch": 2410} {"train_loss": -6.317217826843262, "global_step": 101243, "epoch": 2410} {"train_loss": -6.320608615875244, "global_step": 101244, "epoch": 2410} {"train_loss": -6.378686904907227, "global_step": 101245, "epoch": 2410} {"train_loss": -6.3024749755859375, "global_step": 101246, "epoch": 2410} {"train_loss": -6.359762191772461, "global_step": 101247, "epoch": 2410} {"train_loss": -6.322628498077393, "global_step": 101248, "epoch": 2410} {"train_loss": -6.378887176513672, "global_step": 101249, "epoch": 2410} {"train_loss": -6.357827186584473, "global_step": 101250, "epoch": 2410} {"train_loss": -6.329173564910889, "global_step": 101251, "epoch": 2410} {"train_loss": -6.361939430236816, "global_step": 101252, "epoch": 2410} {"train_loss": -6.310482978820801, "global_step": 101253, "epoch": 2410} {"train_loss": -6.37225866317749, "global_step": 101254, "epoch": 2410} {"train_loss": -6.3998703956604, "global_step": 101255, "epoch": 2410} {"train_loss": -6.350573539733887, "global_step": 101256, "epoch": 2410} {"train_loss": -6.303258895874023, "global_step": 101257, "epoch": 2410} {"train_loss": -6.575604438781738, "global_step": 101258, "epoch": 2410} {"train_loss": -6.333589553833008, "global_step": 101259, "epoch": 2410} {"train_loss": -6.265661239624023, "global_step": 101260, "epoch": 2410} {"train_loss": -6.380046208699544, "global_step": 101261, "epoch": 2410, "val_loss": 75689.25} {"train_loss": -6.4640679359436035, "global_step": 101262, "epoch": 2411} {"train_loss": -6.394396781921387, "global_step": 101263, "epoch": 2411} {"train_loss": -6.454632759094238, "global_step": 101264, "epoch": 2411} {"train_loss": -6.324584007263184, "global_step": 101265, "epoch": 2411} {"train_loss": -6.417143821716309, "global_step": 101266, "epoch": 2411} {"train_loss": -6.411580562591553, "global_step": 101267, "epoch": 2411} {"train_loss": -6.181636333465576, "global_step": 101268, "epoch": 2411} {"train_loss": -6.318655014038086, "global_step": 101269, "epoch": 2411} {"train_loss": -6.193335056304932, "global_step": 101270, "epoch": 2411} {"train_loss": -6.423219680786133, "global_step": 101271, "epoch": 2411} {"train_loss": -6.308464050292969, "global_step": 101272, "epoch": 2411} {"train_loss": -6.3028974533081055, "global_step": 101273, "epoch": 2411} {"train_loss": -6.259949684143066, "global_step": 101274, "epoch": 2411} {"train_loss": -6.460513591766357, "global_step": 101275, "epoch": 2411} {"train_loss": -6.332123756408691, "global_step": 101276, "epoch": 2411} {"train_loss": -6.338541030883789, "global_step": 101277, "epoch": 2411} {"train_loss": -6.384736061096191, "global_step": 101278, "epoch": 2411} {"train_loss": -6.301362037658691, "global_step": 101279, "epoch": 2411} {"train_loss": -6.321261405944824, "global_step": 101280, "epoch": 2411} {"train_loss": -6.379809856414795, "global_step": 101281, "epoch": 2411} {"train_loss": -6.349233627319336, "global_step": 101282, "epoch": 2411} {"train_loss": -6.342169761657715, "global_step": 101283, "epoch": 2411} {"train_loss": -6.486084938049316, "global_step": 101284, "epoch": 2411} {"train_loss": -6.302522659301758, "global_step": 101285, "epoch": 2411} {"train_loss": -6.426292896270752, "global_step": 101286, "epoch": 2411} {"train_loss": -6.358082294464111, "global_step": 101287, "epoch": 2411} {"train_loss": -6.286017417907715, "global_step": 101288, "epoch": 2411} {"train_loss": -6.377297878265381, "global_step": 101289, "epoch": 2411} {"train_loss": -6.2748847007751465, "global_step": 101290, "epoch": 2411} {"train_loss": -6.451570510864258, "global_step": 101291, "epoch": 2411} {"train_loss": -6.364353656768799, "global_step": 101292, "epoch": 2411} {"train_loss": -6.455949783325195, "global_step": 101293, "epoch": 2411} {"train_loss": -6.3406805992126465, "global_step": 101294, "epoch": 2411} {"train_loss": -6.360740661621094, "global_step": 101295, "epoch": 2411} {"train_loss": -6.337464332580566, "global_step": 101296, "epoch": 2411} {"train_loss": -6.360166549682617, "global_step": 101297, "epoch": 2411} {"train_loss": -6.495765686035156, "global_step": 101298, "epoch": 2411} {"train_loss": -6.477946758270264, "global_step": 101299, "epoch": 2411} {"train_loss": -6.343257904052734, "global_step": 101300, "epoch": 2411} {"train_loss": -6.4383111000061035, "global_step": 101301, "epoch": 2411} {"train_loss": -6.47531795501709, "global_step": 101302, "epoch": 2411} {"train_loss": -6.367370196751186, "global_step": 101303, "epoch": 2411, "val_loss": 75362.8828125} {"train_loss": -6.298580169677734, "global_step": 101304, "epoch": 2412} {"train_loss": -6.380659103393555, "global_step": 101305, "epoch": 2412} {"train_loss": -6.345799446105957, "global_step": 101306, "epoch": 2412} {"train_loss": -6.39553165435791, "global_step": 101307, "epoch": 2412} {"train_loss": -6.363051414489746, "global_step": 101308, "epoch": 2412} {"train_loss": -6.382589340209961, "global_step": 101309, "epoch": 2412} {"train_loss": -6.280211448669434, "global_step": 101310, "epoch": 2412} {"train_loss": -6.265119552612305, "global_step": 101311, "epoch": 2412} {"train_loss": -6.223830699920654, "global_step": 101312, "epoch": 2412} {"train_loss": -6.307926177978516, "global_step": 101313, "epoch": 2412} {"train_loss": -6.372248649597168, "global_step": 101314, "epoch": 2412} {"train_loss": -6.277889251708984, "global_step": 101315, "epoch": 2412} {"train_loss": -6.330917835235596, "global_step": 101316, "epoch": 2412} {"train_loss": -6.304170608520508, "global_step": 101317, "epoch": 2412} {"train_loss": -6.245580673217773, "global_step": 101318, "epoch": 2412} {"train_loss": -6.227432727813721, "global_step": 101319, "epoch": 2412} {"train_loss": -6.390773773193359, "global_step": 101320, "epoch": 2412} {"train_loss": -6.3198652267456055, "global_step": 101321, "epoch": 2412} {"train_loss": -6.359274864196777, "global_step": 101322, "epoch": 2412} {"train_loss": -6.303677558898926, "global_step": 101323, "epoch": 2412} {"train_loss": -6.338459014892578, "global_step": 101324, "epoch": 2412} {"train_loss": -6.307730197906494, "global_step": 101325, "epoch": 2412} {"train_loss": -6.3651885986328125, "global_step": 101326, "epoch": 2412} {"train_loss": -6.372841835021973, "global_step": 101327, "epoch": 2412} {"train_loss": -6.361472129821777, "global_step": 101328, "epoch": 2412} {"train_loss": -6.439558982849121, "global_step": 101329, "epoch": 2412} {"train_loss": -6.37539005279541, "global_step": 101330, "epoch": 2412} {"train_loss": -6.396121025085449, "global_step": 101331, "epoch": 2412} {"train_loss": -6.35801887512207, "global_step": 101332, "epoch": 2412} {"train_loss": -6.3999834060668945, "global_step": 101333, "epoch": 2412} {"train_loss": -6.349484443664551, "global_step": 101334, "epoch": 2412} {"train_loss": -6.431797027587891, "global_step": 101335, "epoch": 2412} {"train_loss": -6.476367950439453, "global_step": 101336, "epoch": 2412} {"train_loss": -6.4094672203063965, "global_step": 101337, "epoch": 2412} {"train_loss": -6.591488838195801, "global_step": 101338, "epoch": 2412} {"train_loss": -6.270811080932617, "global_step": 101339, "epoch": 2412} {"train_loss": -6.364657402038574, "global_step": 101340, "epoch": 2412} {"train_loss": -6.403559684753418, "global_step": 101341, "epoch": 2412} {"train_loss": -6.379674434661865, "global_step": 101342, "epoch": 2412} {"train_loss": -6.424792289733887, "global_step": 101343, "epoch": 2412} {"train_loss": -6.518772602081299, "global_step": 101344, "epoch": 2412} {"train_loss": -6.358930201757522, "global_step": 101345, "epoch": 2412, "val_loss": 75785.125} {"train_loss": -6.425339698791504, "global_step": 101346, "epoch": 2413} {"train_loss": -6.404774188995361, "global_step": 101347, "epoch": 2413} {"train_loss": -6.431632995605469, "global_step": 101348, "epoch": 2413} {"train_loss": -6.388853549957275, "global_step": 101349, "epoch": 2413} {"train_loss": -6.473417282104492, "global_step": 101350, "epoch": 2413} {"train_loss": -6.3414201736450195, "global_step": 101351, "epoch": 2413} {"train_loss": -6.384843349456787, "global_step": 101352, "epoch": 2413} {"train_loss": -6.388775825500488, "global_step": 101353, "epoch": 2413} {"train_loss": -6.394218444824219, "global_step": 101354, "epoch": 2413} {"train_loss": -6.418173789978027, "global_step": 101355, "epoch": 2413} {"train_loss": -6.4205121994018555, "global_step": 101356, "epoch": 2413} {"train_loss": -6.508419036865234, "global_step": 101357, "epoch": 2413} {"train_loss": -6.386404991149902, "global_step": 101358, "epoch": 2413} {"train_loss": -6.3700714111328125, "global_step": 101359, "epoch": 2413} {"train_loss": -6.39132022857666, "global_step": 101360, "epoch": 2413} {"train_loss": -6.4609375, "global_step": 101361, "epoch": 2413} {"train_loss": -6.459900379180908, "global_step": 101362, "epoch": 2413} {"train_loss": -6.418570518493652, "global_step": 101363, "epoch": 2413} {"train_loss": -6.3975067138671875, "global_step": 101364, "epoch": 2413} {"train_loss": -6.2892913818359375, "global_step": 101365, "epoch": 2413} {"train_loss": -6.40710973739624, "global_step": 101366, "epoch": 2413} {"train_loss": -6.386196136474609, "global_step": 101367, "epoch": 2413} {"train_loss": -6.410739898681641, "global_step": 101368, "epoch": 2413} {"train_loss": -6.4948835372924805, "global_step": 101369, "epoch": 2413} {"train_loss": -6.369807720184326, "global_step": 101370, "epoch": 2413} {"train_loss": -6.398977756500244, "global_step": 101371, "epoch": 2413} {"train_loss": -6.360959053039551, "global_step": 101372, "epoch": 2413} {"train_loss": -6.330914497375488, "global_step": 101373, "epoch": 2413} {"train_loss": -6.435356140136719, "global_step": 101374, "epoch": 2413} {"train_loss": -6.300176620483398, "global_step": 101375, "epoch": 2413} {"train_loss": -6.197201251983643, "global_step": 101376, "epoch": 2413} {"train_loss": -6.320499420166016, "global_step": 101377, "epoch": 2413} {"train_loss": -6.433560848236084, "global_step": 101378, "epoch": 2413} {"train_loss": -6.310972213745117, "global_step": 101379, "epoch": 2413} {"train_loss": -6.3778076171875, "global_step": 101380, "epoch": 2413} {"train_loss": -6.345780849456787, "global_step": 101381, "epoch": 2413} {"train_loss": -6.320039749145508, "global_step": 101382, "epoch": 2413} {"train_loss": -6.274442195892334, "global_step": 101383, "epoch": 2413} {"train_loss": -6.207621097564697, "global_step": 101384, "epoch": 2413} {"train_loss": -6.266264915466309, "global_step": 101385, "epoch": 2413} {"train_loss": -6.259493827819824, "global_step": 101386, "epoch": 2413} {"train_loss": -6.37241622379848, "global_step": 101387, "epoch": 2413, "val_loss": 75872.0625} {"train_loss": -6.420558929443359, "global_step": 101388, "epoch": 2414} {"train_loss": -6.325967788696289, "global_step": 101389, "epoch": 2414} {"train_loss": -6.256618022918701, "global_step": 101390, "epoch": 2414} {"train_loss": -6.34658145904541, "global_step": 101391, "epoch": 2414} {"train_loss": -6.30606746673584, "global_step": 101392, "epoch": 2414} {"train_loss": -6.45279598236084, "global_step": 101393, "epoch": 2414} {"train_loss": -6.3098249435424805, "global_step": 101394, "epoch": 2414} {"train_loss": -6.4494829177856445, "global_step": 101395, "epoch": 2414} {"train_loss": -6.441112995147705, "global_step": 101396, "epoch": 2414} {"train_loss": -6.36907958984375, "global_step": 101397, "epoch": 2414} {"train_loss": -6.384130001068115, "global_step": 101398, "epoch": 2414} {"train_loss": -6.430363655090332, "global_step": 101399, "epoch": 2414} {"train_loss": -6.40746545791626, "global_step": 101400, "epoch": 2414} {"train_loss": -6.47203254699707, "global_step": 101401, "epoch": 2414} {"train_loss": -6.364383697509766, "global_step": 101402, "epoch": 2414} {"train_loss": -6.53110408782959, "global_step": 101403, "epoch": 2414} {"train_loss": -6.328057289123535, "global_step": 101404, "epoch": 2414} {"train_loss": -6.283885955810547, "global_step": 101405, "epoch": 2414} {"train_loss": -6.460099220275879, "global_step": 101406, "epoch": 2414} {"train_loss": -6.430396556854248, "global_step": 101407, "epoch": 2414} {"train_loss": -6.306092739105225, "global_step": 101408, "epoch": 2414} {"train_loss": -6.2952561378479, "global_step": 101409, "epoch": 2414} {"train_loss": -6.349048614501953, "global_step": 101410, "epoch": 2414} {"train_loss": -6.386158466339111, "global_step": 101411, "epoch": 2414} {"train_loss": -6.197934627532959, "global_step": 101412, "epoch": 2414} {"train_loss": -6.327966690063477, "global_step": 101413, "epoch": 2414} {"train_loss": -6.306082248687744, "global_step": 101414, "epoch": 2414} {"train_loss": -6.338718414306641, "global_step": 101415, "epoch": 2414} {"train_loss": -6.3504533767700195, "global_step": 101416, "epoch": 2414} {"train_loss": -6.307222843170166, "global_step": 101417, "epoch": 2414} {"train_loss": -6.305792808532715, "global_step": 101418, "epoch": 2414} {"train_loss": -6.306928634643555, "global_step": 101419, "epoch": 2414} {"train_loss": -6.262753486633301, "global_step": 101420, "epoch": 2414} {"train_loss": -6.251587390899658, "global_step": 101421, "epoch": 2414} {"train_loss": -6.310529708862305, "global_step": 101422, "epoch": 2414} {"train_loss": -6.416644096374512, "global_step": 101423, "epoch": 2414} {"train_loss": -6.408384799957275, "global_step": 101424, "epoch": 2414} {"train_loss": -6.3198652267456055, "global_step": 101425, "epoch": 2414} {"train_loss": -6.260770797729492, "global_step": 101426, "epoch": 2414} {"train_loss": -6.291658401489258, "global_step": 101427, "epoch": 2414} {"train_loss": -6.239721298217773, "global_step": 101428, "epoch": 2414} {"train_loss": -6.347830386388869, "global_step": 101429, "epoch": 2414, "val_loss": 76011.3203125} {"train_loss": -6.444730758666992, "global_step": 101430, "epoch": 2415} {"train_loss": -6.310233116149902, "global_step": 101431, "epoch": 2415} {"train_loss": -6.237098217010498, "global_step": 101432, "epoch": 2415} {"train_loss": -6.333850860595703, "global_step": 101433, "epoch": 2415} {"train_loss": -6.447238922119141, "global_step": 101434, "epoch": 2415} {"train_loss": -6.428499221801758, "global_step": 101435, "epoch": 2415} {"train_loss": -6.269134998321533, "global_step": 101436, "epoch": 2415} {"train_loss": -6.327227592468262, "global_step": 101437, "epoch": 2415} {"train_loss": -6.393593788146973, "global_step": 101438, "epoch": 2415} {"train_loss": -6.267917633056641, "global_step": 101439, "epoch": 2415} {"train_loss": -6.368251800537109, "global_step": 101440, "epoch": 2415} {"train_loss": -6.4265546798706055, "global_step": 101441, "epoch": 2415} {"train_loss": -6.426411151885986, "global_step": 101442, "epoch": 2415} {"train_loss": -6.310001373291016, "global_step": 101443, "epoch": 2415} {"train_loss": -6.351483345031738, "global_step": 101444, "epoch": 2415} {"train_loss": -6.332849979400635, "global_step": 101445, "epoch": 2415} {"train_loss": -6.248208522796631, "global_step": 101446, "epoch": 2415} {"train_loss": -6.450892448425293, "global_step": 101447, "epoch": 2415} {"train_loss": -6.376239776611328, "global_step": 101448, "epoch": 2415} {"train_loss": -6.318448543548584, "global_step": 101449, "epoch": 2415} {"train_loss": -6.363681316375732, "global_step": 101450, "epoch": 2415} {"train_loss": -6.388313293457031, "global_step": 101451, "epoch": 2415} {"train_loss": -6.466680526733398, "global_step": 101452, "epoch": 2415} {"train_loss": -6.372920036315918, "global_step": 101453, "epoch": 2415} {"train_loss": -6.185398101806641, "global_step": 101454, "epoch": 2415} {"train_loss": -6.329065799713135, "global_step": 101455, "epoch": 2415} {"train_loss": -6.271342754364014, "global_step": 101456, "epoch": 2415} {"train_loss": -6.291492462158203, "global_step": 101457, "epoch": 2415} {"train_loss": -6.285212516784668, "global_step": 101458, "epoch": 2415} {"train_loss": -6.428740978240967, "global_step": 101459, "epoch": 2415} {"train_loss": -6.253627777099609, "global_step": 101460, "epoch": 2415} {"train_loss": -6.379694938659668, "global_step": 101461, "epoch": 2415} {"train_loss": -6.325784683227539, "global_step": 101462, "epoch": 2415} {"train_loss": -6.3972930908203125, "global_step": 101463, "epoch": 2415} {"train_loss": -6.409346580505371, "global_step": 101464, "epoch": 2415} {"train_loss": -6.334394931793213, "global_step": 101465, "epoch": 2415} {"train_loss": -6.412956237792969, "global_step": 101466, "epoch": 2415} {"train_loss": -6.293100357055664, "global_step": 101467, "epoch": 2415} {"train_loss": -6.456940650939941, "global_step": 101468, "epoch": 2415} {"train_loss": -6.415578842163086, "global_step": 101469, "epoch": 2415} {"train_loss": -6.4167704582214355, "global_step": 101470, "epoch": 2415} {"train_loss": -6.353129489081247, "global_step": 101471, "epoch": 2415, "val_loss": 75852.453125} {"train_loss": -6.449745178222656, "global_step": 101472, "epoch": 2416} {"train_loss": -6.321346282958984, "global_step": 101473, "epoch": 2416} {"train_loss": -6.374912261962891, "global_step": 101474, "epoch": 2416} {"train_loss": -6.270089626312256, "global_step": 101475, "epoch": 2416} {"train_loss": -6.42181396484375, "global_step": 101476, "epoch": 2416} {"train_loss": -6.402826309204102, "global_step": 101477, "epoch": 2416} {"train_loss": -6.499555587768555, "global_step": 101478, "epoch": 2416} {"train_loss": -6.436612606048584, "global_step": 101479, "epoch": 2416} {"train_loss": -6.354991912841797, "global_step": 101480, "epoch": 2416} {"train_loss": -6.329476356506348, "global_step": 101481, "epoch": 2416} {"train_loss": -6.370353698730469, "global_step": 101482, "epoch": 2416} {"train_loss": -6.310171604156494, "global_step": 101483, "epoch": 2416} {"train_loss": -6.3452959060668945, "global_step": 101484, "epoch": 2416} {"train_loss": -6.35836124420166, "global_step": 101485, "epoch": 2416} {"train_loss": -6.4384918212890625, "global_step": 101486, "epoch": 2416} {"train_loss": -6.403027534484863, "global_step": 101487, "epoch": 2416} {"train_loss": -6.349066734313965, "global_step": 101488, "epoch": 2416} {"train_loss": -6.255489826202393, "global_step": 101489, "epoch": 2416} {"train_loss": -6.383365154266357, "global_step": 101490, "epoch": 2416} {"train_loss": -6.410516262054443, "global_step": 101491, "epoch": 2416} {"train_loss": -6.410528182983398, "global_step": 101492, "epoch": 2416} {"train_loss": -6.462395191192627, "global_step": 101493, "epoch": 2416} {"train_loss": -6.473748683929443, "global_step": 101494, "epoch": 2416} {"train_loss": -6.275443077087402, "global_step": 101495, "epoch": 2416} {"train_loss": -6.253981590270996, "global_step": 101496, "epoch": 2416} {"train_loss": -6.401528835296631, "global_step": 101497, "epoch": 2416} {"train_loss": -6.280058860778809, "global_step": 101498, "epoch": 2416} {"train_loss": -6.333008289337158, "global_step": 101499, "epoch": 2416} {"train_loss": -6.416477203369141, "global_step": 101500, "epoch": 2416} {"train_loss": -6.2924394607543945, "global_step": 101501, "epoch": 2416} {"train_loss": -6.349804878234863, "global_step": 101502, "epoch": 2416} {"train_loss": -6.3893280029296875, "global_step": 101503, "epoch": 2416} {"train_loss": -6.358246803283691, "global_step": 101504, "epoch": 2416} {"train_loss": -6.3680291175842285, "global_step": 101505, "epoch": 2416} {"train_loss": -6.288179397583008, "global_step": 101506, "epoch": 2416} {"train_loss": -6.3528666496276855, "global_step": 101507, "epoch": 2416} {"train_loss": -6.253965854644775, "global_step": 101508, "epoch": 2416} {"train_loss": -6.329174041748047, "global_step": 101509, "epoch": 2416} {"train_loss": -6.377613544464111, "global_step": 101510, "epoch": 2416} {"train_loss": -6.41721248626709, "global_step": 101511, "epoch": 2416} {"train_loss": -6.281123638153076, "global_step": 101512, "epoch": 2416} {"train_loss": -6.35907108443124, "global_step": 101513, "epoch": 2416, "val_loss": 75854.2421875} {"train_loss": -6.318737983703613, "global_step": 101514, "epoch": 2417} {"train_loss": -6.428197860717773, "global_step": 101515, "epoch": 2417} {"train_loss": -6.346541404724121, "global_step": 101516, "epoch": 2417} {"train_loss": -6.350258827209473, "global_step": 101517, "epoch": 2417} {"train_loss": -6.4344940185546875, "global_step": 101518, "epoch": 2417} {"train_loss": -6.421468257904053, "global_step": 101519, "epoch": 2417} {"train_loss": -6.308377742767334, "global_step": 101520, "epoch": 2417} {"train_loss": -6.366238594055176, "global_step": 101521, "epoch": 2417} {"train_loss": -6.373654365539551, "global_step": 101522, "epoch": 2417} {"train_loss": -6.372834205627441, "global_step": 101523, "epoch": 2417} {"train_loss": -6.431778430938721, "global_step": 101524, "epoch": 2417} {"train_loss": -6.419650077819824, "global_step": 101525, "epoch": 2417} {"train_loss": -6.357666015625, "global_step": 101526, "epoch": 2417} {"train_loss": -6.387489318847656, "global_step": 101527, "epoch": 2417} {"train_loss": -6.310848236083984, "global_step": 101528, "epoch": 2417} {"train_loss": -6.277364253997803, "global_step": 101529, "epoch": 2417} {"train_loss": -6.288259506225586, "global_step": 101530, "epoch": 2417} {"train_loss": -6.368831157684326, "global_step": 101531, "epoch": 2417} {"train_loss": -6.434675693511963, "global_step": 101532, "epoch": 2417} {"train_loss": -6.242040157318115, "global_step": 101533, "epoch": 2417} {"train_loss": -6.297092437744141, "global_step": 101534, "epoch": 2417} {"train_loss": -6.28384256362915, "global_step": 101535, "epoch": 2417} {"train_loss": -6.310308933258057, "global_step": 101536, "epoch": 2417} {"train_loss": -6.270968914031982, "global_step": 101537, "epoch": 2417} {"train_loss": -6.348747253417969, "global_step": 101538, "epoch": 2417} {"train_loss": -6.290379524230957, "global_step": 101539, "epoch": 2417} {"train_loss": -6.387357711791992, "global_step": 101540, "epoch": 2417} {"train_loss": -6.355101585388184, "global_step": 101541, "epoch": 2417} {"train_loss": -6.324589729309082, "global_step": 101542, "epoch": 2417} {"train_loss": -6.365710258483887, "global_step": 101543, "epoch": 2417} {"train_loss": -6.423746109008789, "global_step": 101544, "epoch": 2417} {"train_loss": -6.3903703689575195, "global_step": 101545, "epoch": 2417} {"train_loss": -6.393991470336914, "global_step": 101546, "epoch": 2417} {"train_loss": -6.360387802124023, "global_step": 101547, "epoch": 2417} {"train_loss": -6.407060623168945, "global_step": 101548, "epoch": 2417} {"train_loss": -6.487419605255127, "global_step": 101549, "epoch": 2417} {"train_loss": -6.399891376495361, "global_step": 101550, "epoch": 2417} {"train_loss": -6.394859790802002, "global_step": 101551, "epoch": 2417} {"train_loss": -6.550323963165283, "global_step": 101552, "epoch": 2417} {"train_loss": -6.423955917358398, "global_step": 101553, "epoch": 2417} {"train_loss": -6.347897529602051, "global_step": 101554, "epoch": 2417} {"train_loss": -6.36764171009972, "global_step": 101555, "epoch": 2417, "val_loss": 75700.015625} {"train_loss": -6.400513172149658, "global_step": 101556, "epoch": 2418} {"train_loss": -6.420918941497803, "global_step": 101557, "epoch": 2418} {"train_loss": -6.43613338470459, "global_step": 101558, "epoch": 2418} {"train_loss": -6.36798095703125, "global_step": 101559, "epoch": 2418} {"train_loss": -6.362062931060791, "global_step": 101560, "epoch": 2418} {"train_loss": -6.387552261352539, "global_step": 101561, "epoch": 2418} {"train_loss": -6.398458480834961, "global_step": 101562, "epoch": 2418} {"train_loss": -6.462315559387207, "global_step": 101563, "epoch": 2418} {"train_loss": -6.4474568367004395, "global_step": 101564, "epoch": 2418} {"train_loss": -6.287062644958496, "global_step": 101565, "epoch": 2418} {"train_loss": -6.354243278503418, "global_step": 101566, "epoch": 2418} {"train_loss": -6.325102806091309, "global_step": 101567, "epoch": 2418} {"train_loss": -6.255166053771973, "global_step": 101568, "epoch": 2418} {"train_loss": -6.445791721343994, "global_step": 101569, "epoch": 2418} {"train_loss": -6.180764675140381, "global_step": 101570, "epoch": 2418} {"train_loss": -6.309856414794922, "global_step": 101571, "epoch": 2418} {"train_loss": -6.517389297485352, "global_step": 101572, "epoch": 2418} {"train_loss": -6.329880714416504, "global_step": 101573, "epoch": 2418} {"train_loss": -6.3989763259887695, "global_step": 101574, "epoch": 2418} {"train_loss": -6.415316581726074, "global_step": 101575, "epoch": 2418} {"train_loss": -6.228244781494141, "global_step": 101576, "epoch": 2418} {"train_loss": -6.319762229919434, "global_step": 101577, "epoch": 2418} {"train_loss": -6.364909648895264, "global_step": 101578, "epoch": 2418} {"train_loss": -6.455366134643555, "global_step": 101579, "epoch": 2418} {"train_loss": -6.293182373046875, "global_step": 101580, "epoch": 2418} {"train_loss": -6.394728660583496, "global_step": 101581, "epoch": 2418} {"train_loss": -6.350324630737305, "global_step": 101582, "epoch": 2418} {"train_loss": -6.348598957061768, "global_step": 101583, "epoch": 2418} {"train_loss": -6.29563045501709, "global_step": 101584, "epoch": 2418} {"train_loss": -6.378565788269043, "global_step": 101585, "epoch": 2418} {"train_loss": -6.2684502601623535, "global_step": 101586, "epoch": 2418} {"train_loss": -6.3153076171875, "global_step": 101587, "epoch": 2418} {"train_loss": -6.3798346519470215, "global_step": 101588, "epoch": 2418} {"train_loss": -6.416611671447754, "global_step": 101589, "epoch": 2418} {"train_loss": -6.389902114868164, "global_step": 101590, "epoch": 2418} {"train_loss": -6.4199018478393555, "global_step": 101591, "epoch": 2418} {"train_loss": -6.422224044799805, "global_step": 101592, "epoch": 2418} {"train_loss": -6.307803630828857, "global_step": 101593, "epoch": 2418} {"train_loss": -6.417708396911621, "global_step": 101594, "epoch": 2418} {"train_loss": -6.349793910980225, "global_step": 101595, "epoch": 2418} {"train_loss": -6.336709022521973, "global_step": 101596, "epoch": 2418} {"train_loss": -6.364385638918195, "global_step": 101597, "epoch": 2418, "val_loss": 76115.3984375} {"train_loss": -6.446382522583008, "global_step": 101598, "epoch": 2419} {"train_loss": -6.3939208984375, "global_step": 101599, "epoch": 2419} {"train_loss": -6.40405797958374, "global_step": 101600, "epoch": 2419} {"train_loss": -6.487730979919434, "global_step": 101601, "epoch": 2419} {"train_loss": -6.468601226806641, "global_step": 101602, "epoch": 2419} {"train_loss": -6.447292804718018, "global_step": 101603, "epoch": 2419} {"train_loss": -6.344509124755859, "global_step": 101604, "epoch": 2419} {"train_loss": -6.309686660766602, "global_step": 101605, "epoch": 2419} {"train_loss": -6.435575485229492, "global_step": 101606, "epoch": 2419} {"train_loss": -6.401493072509766, "global_step": 101607, "epoch": 2419} {"train_loss": -6.414386749267578, "global_step": 101608, "epoch": 2419} {"train_loss": -6.250548839569092, "global_step": 101609, "epoch": 2419} {"train_loss": -6.379031658172607, "global_step": 101610, "epoch": 2419} {"train_loss": -6.522122383117676, "global_step": 101611, "epoch": 2419} {"train_loss": -6.4038496017456055, "global_step": 101612, "epoch": 2419} {"train_loss": -6.3789873123168945, "global_step": 101613, "epoch": 2419} {"train_loss": -6.413081169128418, "global_step": 101614, "epoch": 2419} {"train_loss": -6.300714015960693, "global_step": 101615, "epoch": 2419} {"train_loss": -6.404055595397949, "global_step": 101616, "epoch": 2419} {"train_loss": -6.441386699676514, "global_step": 101617, "epoch": 2419} {"train_loss": -6.358323574066162, "global_step": 101618, "epoch": 2419} {"train_loss": -6.450329303741455, "global_step": 101619, "epoch": 2419} {"train_loss": -6.368130683898926, "global_step": 101620, "epoch": 2419} {"train_loss": -6.301118850708008, "global_step": 101621, "epoch": 2419} {"train_loss": -6.475465774536133, "global_step": 101622, "epoch": 2419} {"train_loss": -6.264171600341797, "global_step": 101623, "epoch": 2419} {"train_loss": -6.343620300292969, "global_step": 101624, "epoch": 2419} {"train_loss": -6.341207027435303, "global_step": 101625, "epoch": 2419} {"train_loss": -6.182724475860596, "global_step": 101626, "epoch": 2419} {"train_loss": -6.278815746307373, "global_step": 101627, "epoch": 2419} {"train_loss": -6.324336051940918, "global_step": 101628, "epoch": 2419} {"train_loss": -6.130884170532227, "global_step": 101629, "epoch": 2419} {"train_loss": -6.334165573120117, "global_step": 101630, "epoch": 2419} {"train_loss": -6.339752197265625, "global_step": 101631, "epoch": 2419} {"train_loss": -6.197103977203369, "global_step": 101632, "epoch": 2419} {"train_loss": -6.288296222686768, "global_step": 101633, "epoch": 2419} {"train_loss": -6.2450175285339355, "global_step": 101634, "epoch": 2419} {"train_loss": -6.408986568450928, "global_step": 101635, "epoch": 2419} {"train_loss": -6.332985877990723, "global_step": 101636, "epoch": 2419} {"train_loss": -6.207163333892822, "global_step": 101637, "epoch": 2419} {"train_loss": -6.345446586608887, "global_step": 101638, "epoch": 2419} {"train_loss": -6.354493152527582, "global_step": 101639, "epoch": 2419, "val_loss": 76155.703125} {"train_loss": -6.237766265869141, "global_step": 101640, "epoch": 2420} {"train_loss": -6.347492218017578, "global_step": 101641, "epoch": 2420} {"train_loss": -6.2118024826049805, "global_step": 101642, "epoch": 2420} {"train_loss": -6.31880521774292, "global_step": 101643, "epoch": 2420} {"train_loss": -6.171273231506348, "global_step": 101644, "epoch": 2420} {"train_loss": -6.245517730712891, "global_step": 101645, "epoch": 2420} {"train_loss": -6.303556442260742, "global_step": 101646, "epoch": 2420} {"train_loss": -6.280555725097656, "global_step": 101647, "epoch": 2420} {"train_loss": -6.319964408874512, "global_step": 101648, "epoch": 2420} {"train_loss": -6.428869247436523, "global_step": 101649, "epoch": 2420} {"train_loss": -6.1458940505981445, "global_step": 101650, "epoch": 2420} {"train_loss": -6.387272834777832, "global_step": 101651, "epoch": 2420} {"train_loss": -6.288809299468994, "global_step": 101652, "epoch": 2420} {"train_loss": -6.311968803405762, "global_step": 101653, "epoch": 2420} {"train_loss": -6.354178428649902, "global_step": 101654, "epoch": 2420} {"train_loss": -6.286049842834473, "global_step": 101655, "epoch": 2420} {"train_loss": -6.234307289123535, "global_step": 101656, "epoch": 2420} {"train_loss": -6.212221145629883, "global_step": 101657, "epoch": 2420} {"train_loss": -6.315840244293213, "global_step": 101658, "epoch": 2420} {"train_loss": -6.318423271179199, "global_step": 101659, "epoch": 2420} {"train_loss": -6.315167427062988, "global_step": 101660, "epoch": 2420} {"train_loss": -6.403021812438965, "global_step": 101661, "epoch": 2420} {"train_loss": -6.3454742431640625, "global_step": 101662, "epoch": 2420} {"train_loss": -6.262353897094727, "global_step": 101663, "epoch": 2420} {"train_loss": -6.458317756652832, "global_step": 101664, "epoch": 2420} {"train_loss": -6.414361953735352, "global_step": 101665, "epoch": 2420} {"train_loss": -6.313688278198242, "global_step": 101666, "epoch": 2420} {"train_loss": -6.443662643432617, "global_step": 101667, "epoch": 2420} {"train_loss": -6.255521774291992, "global_step": 101668, "epoch": 2420} {"train_loss": -6.454358100891113, "global_step": 101669, "epoch": 2420} {"train_loss": -6.46903133392334, "global_step": 101670, "epoch": 2420} {"train_loss": -6.375168800354004, "global_step": 101671, "epoch": 2420} {"train_loss": -6.383988380432129, "global_step": 101672, "epoch": 2420} {"train_loss": -6.266752243041992, "global_step": 101673, "epoch": 2420} {"train_loss": -6.563591003417969, "global_step": 101674, "epoch": 2420} {"train_loss": -6.398260116577148, "global_step": 101675, "epoch": 2420} {"train_loss": -6.366847038269043, "global_step": 101676, "epoch": 2420} {"train_loss": -6.483226776123047, "global_step": 101677, "epoch": 2420} {"train_loss": -6.4576005935668945, "global_step": 101678, "epoch": 2420} {"train_loss": -6.385357856750488, "global_step": 101679, "epoch": 2420} {"train_loss": -6.596211910247803, "global_step": 101680, "epoch": 2420} {"train_loss": -6.346042247045608, "global_step": 101681, "epoch": 2420, "val_loss": 75973.53125} {"train_loss": -6.495776176452637, "global_step": 101682, "epoch": 2421} {"train_loss": -6.569969654083252, "global_step": 101683, "epoch": 2421} {"train_loss": -6.382807731628418, "global_step": 101684, "epoch": 2421} {"train_loss": -6.450645446777344, "global_step": 101685, "epoch": 2421} {"train_loss": -6.456592559814453, "global_step": 101686, "epoch": 2421} {"train_loss": -6.307823181152344, "global_step": 101687, "epoch": 2421} {"train_loss": -6.382303237915039, "global_step": 101688, "epoch": 2421} {"train_loss": -6.351378917694092, "global_step": 101689, "epoch": 2421} {"train_loss": -6.459195613861084, "global_step": 101690, "epoch": 2421} {"train_loss": -6.29591703414917, "global_step": 101691, "epoch": 2421} {"train_loss": -6.401278495788574, "global_step": 101692, "epoch": 2421} {"train_loss": -6.4467949867248535, "global_step": 101693, "epoch": 2421} {"train_loss": -6.469353199005127, "global_step": 101694, "epoch": 2421} {"train_loss": -6.2045488357543945, "global_step": 101695, "epoch": 2421} {"train_loss": -6.3472981452941895, "global_step": 101696, "epoch": 2421} {"train_loss": -6.326114177703857, "global_step": 101697, "epoch": 2421} {"train_loss": -6.380125045776367, "global_step": 101698, "epoch": 2421} {"train_loss": -6.4948883056640625, "global_step": 101699, "epoch": 2421} {"train_loss": -6.4518890380859375, "global_step": 101700, "epoch": 2421} {"train_loss": -6.380387306213379, "global_step": 101701, "epoch": 2421} {"train_loss": -6.401214599609375, "global_step": 101702, "epoch": 2421} {"train_loss": -6.29499626159668, "global_step": 101703, "epoch": 2421} {"train_loss": -6.440394401550293, "global_step": 101704, "epoch": 2421} {"train_loss": -6.2480244636535645, "global_step": 101705, "epoch": 2421} {"train_loss": -6.383979320526123, "global_step": 101706, "epoch": 2421} {"train_loss": -6.401869773864746, "global_step": 101707, "epoch": 2421} {"train_loss": -6.261101722717285, "global_step": 101708, "epoch": 2421} {"train_loss": -6.319058418273926, "global_step": 101709, "epoch": 2421} {"train_loss": -6.235326290130615, "global_step": 101710, "epoch": 2421} {"train_loss": -6.241443634033203, "global_step": 101711, "epoch": 2421} {"train_loss": -6.410523891448975, "global_step": 101712, "epoch": 2421} {"train_loss": -6.310770511627197, "global_step": 101713, "epoch": 2421} {"train_loss": -6.34010124206543, "global_step": 101714, "epoch": 2421} {"train_loss": -6.383904933929443, "global_step": 101715, "epoch": 2421} {"train_loss": -6.286764144897461, "global_step": 101716, "epoch": 2421} {"train_loss": -6.396618366241455, "global_step": 101717, "epoch": 2421} {"train_loss": -6.375401496887207, "global_step": 101718, "epoch": 2421} {"train_loss": -6.32590389251709, "global_step": 101719, "epoch": 2421} {"train_loss": -6.370608329772949, "global_step": 101720, "epoch": 2421} {"train_loss": -6.322254180908203, "global_step": 101721, "epoch": 2421} {"train_loss": -6.337824821472168, "global_step": 101722, "epoch": 2421} {"train_loss": -6.364838350386846, "global_step": 101723, "epoch": 2421, "val_loss": 75566.671875} {"train_loss": -6.373394012451172, "global_step": 101724, "epoch": 2422} {"train_loss": -6.336824417114258, "global_step": 101725, "epoch": 2422} {"train_loss": -6.330309867858887, "global_step": 101726, "epoch": 2422} {"train_loss": -6.416965007781982, "global_step": 101727, "epoch": 2422} {"train_loss": -6.231964111328125, "global_step": 101728, "epoch": 2422} {"train_loss": -6.356107711791992, "global_step": 101729, "epoch": 2422} {"train_loss": -6.332594871520996, "global_step": 101730, "epoch": 2422} {"train_loss": -6.212824821472168, "global_step": 101731, "epoch": 2422} {"train_loss": -6.304904460906982, "global_step": 101732, "epoch": 2422} {"train_loss": -6.236438751220703, "global_step": 101733, "epoch": 2422} {"train_loss": -6.316718578338623, "global_step": 101734, "epoch": 2422} {"train_loss": -6.388758659362793, "global_step": 101735, "epoch": 2422} {"train_loss": -6.444108009338379, "global_step": 101736, "epoch": 2422} {"train_loss": -6.400707244873047, "global_step": 101737, "epoch": 2422} {"train_loss": -6.3503923416137695, "global_step": 101738, "epoch": 2422} {"train_loss": -6.377193450927734, "global_step": 101739, "epoch": 2422} {"train_loss": -6.38192081451416, "global_step": 101740, "epoch": 2422} {"train_loss": -6.353982448577881, "global_step": 101741, "epoch": 2422} {"train_loss": -6.473860740661621, "global_step": 101742, "epoch": 2422} {"train_loss": -6.396939277648926, "global_step": 101743, "epoch": 2422} {"train_loss": -6.47523307800293, "global_step": 101744, "epoch": 2422} {"train_loss": -6.331007957458496, "global_step": 101745, "epoch": 2422} {"train_loss": -6.510760307312012, "global_step": 101746, "epoch": 2422} {"train_loss": -6.418424606323242, "global_step": 101747, "epoch": 2422} {"train_loss": -6.396247863769531, "global_step": 101748, "epoch": 2422} {"train_loss": -6.403592109680176, "global_step": 101749, "epoch": 2422} {"train_loss": -6.342123031616211, "global_step": 101750, "epoch": 2422} {"train_loss": -6.378751277923584, "global_step": 101751, "epoch": 2422} {"train_loss": -6.424893856048584, "global_step": 101752, "epoch": 2422} {"train_loss": -6.373987674713135, "global_step": 101753, "epoch": 2422} {"train_loss": -6.374643325805664, "global_step": 101754, "epoch": 2422} {"train_loss": -6.482213020324707, "global_step": 101755, "epoch": 2422} {"train_loss": -6.469735145568848, "global_step": 101756, "epoch": 2422} {"train_loss": -6.430344581604004, "global_step": 101757, "epoch": 2422} {"train_loss": -6.534073352813721, "global_step": 101758, "epoch": 2422} {"train_loss": -6.40463924407959, "global_step": 101759, "epoch": 2422} {"train_loss": -6.487518787384033, "global_step": 101760, "epoch": 2422} {"train_loss": -6.3185553550720215, "global_step": 101761, "epoch": 2422} {"train_loss": -6.424516677856445, "global_step": 101762, "epoch": 2422} {"train_loss": -6.378089904785156, "global_step": 101763, "epoch": 2422} {"train_loss": -6.473757266998291, "global_step": 101764, "epoch": 2422} {"train_loss": -6.388278529757545, "global_step": 101765, "epoch": 2422, "val_loss": 75969.546875} {"train_loss": -6.40390682220459, "global_step": 101766, "epoch": 2423} {"train_loss": -6.351996421813965, "global_step": 101767, "epoch": 2423} {"train_loss": -6.2957611083984375, "global_step": 101768, "epoch": 2423} {"train_loss": -6.413294792175293, "global_step": 101769, "epoch": 2423} {"train_loss": -6.387579917907715, "global_step": 101770, "epoch": 2423} {"train_loss": -6.404667854309082, "global_step": 101771, "epoch": 2423} {"train_loss": -6.39044713973999, "global_step": 101772, "epoch": 2423} {"train_loss": -6.333300590515137, "global_step": 101773, "epoch": 2423} {"train_loss": -6.3050217628479, "global_step": 101774, "epoch": 2423} {"train_loss": -6.289124488830566, "global_step": 101775, "epoch": 2423} {"train_loss": -6.3236236572265625, "global_step": 101776, "epoch": 2423} {"train_loss": -6.454724311828613, "global_step": 101777, "epoch": 2423} {"train_loss": -6.3011860847473145, "global_step": 101778, "epoch": 2423} {"train_loss": -6.325552940368652, "global_step": 101779, "epoch": 2423} {"train_loss": -6.302680969238281, "global_step": 101780, "epoch": 2423} {"train_loss": -6.375936508178711, "global_step": 101781, "epoch": 2423} {"train_loss": -6.291516304016113, "global_step": 101782, "epoch": 2423} {"train_loss": -6.319096565246582, "global_step": 101783, "epoch": 2423} {"train_loss": -6.32924747467041, "global_step": 101784, "epoch": 2423} {"train_loss": -6.18498420715332, "global_step": 101785, "epoch": 2423} {"train_loss": -6.321424961090088, "global_step": 101786, "epoch": 2423} {"train_loss": -6.115177631378174, "global_step": 101787, "epoch": 2423} {"train_loss": -6.3492512702941895, "global_step": 101788, "epoch": 2423} {"train_loss": -6.306767463684082, "global_step": 101789, "epoch": 2423} {"train_loss": -6.320734024047852, "global_step": 101790, "epoch": 2423} {"train_loss": -6.230662822723389, "global_step": 101791, "epoch": 2423} {"train_loss": -6.294917583465576, "global_step": 101792, "epoch": 2423} {"train_loss": -6.222070693969727, "global_step": 101793, "epoch": 2423} {"train_loss": -6.353872299194336, "global_step": 101794, "epoch": 2423} {"train_loss": -6.263037204742432, "global_step": 101795, "epoch": 2423} {"train_loss": -6.2517852783203125, "global_step": 101796, "epoch": 2423} {"train_loss": -6.359502792358398, "global_step": 101797, "epoch": 2423} {"train_loss": -6.380674362182617, "global_step": 101798, "epoch": 2423} {"train_loss": -6.363572120666504, "global_step": 101799, "epoch": 2423} {"train_loss": -6.396368980407715, "global_step": 101800, "epoch": 2423} {"train_loss": -6.4018235206604, "global_step": 101801, "epoch": 2423} {"train_loss": -6.3466620445251465, "global_step": 101802, "epoch": 2423} {"train_loss": -6.301693916320801, "global_step": 101803, "epoch": 2423} {"train_loss": -6.431985855102539, "global_step": 101804, "epoch": 2423} {"train_loss": -6.3357648849487305, "global_step": 101805, "epoch": 2423} {"train_loss": -6.26638126373291, "global_step": 101806, "epoch": 2423} {"train_loss": -6.324512629281907, "global_step": 101807, "epoch": 2423, "val_loss": 75821.4609375} {"train_loss": -6.384259223937988, "global_step": 101808, "epoch": 2424} {"train_loss": -6.403608322143555, "global_step": 101809, "epoch": 2424} {"train_loss": -6.4356794357299805, "global_step": 101810, "epoch": 2424} {"train_loss": -6.296813011169434, "global_step": 101811, "epoch": 2424} {"train_loss": -6.2765679359436035, "global_step": 101812, "epoch": 2424} {"train_loss": -6.300212383270264, "global_step": 101813, "epoch": 2424} {"train_loss": -6.36201286315918, "global_step": 101814, "epoch": 2424} {"train_loss": -6.302677154541016, "global_step": 101815, "epoch": 2424} {"train_loss": -6.281679630279541, "global_step": 101816, "epoch": 2424} {"train_loss": -6.417275428771973, "global_step": 101817, "epoch": 2424} {"train_loss": -6.315676689147949, "global_step": 101818, "epoch": 2424} {"train_loss": -6.3471832275390625, "global_step": 101819, "epoch": 2424} {"train_loss": -6.361551284790039, "global_step": 101820, "epoch": 2424} {"train_loss": -6.265284061431885, "global_step": 101821, "epoch": 2424} {"train_loss": -6.293866157531738, "global_step": 101822, "epoch": 2424} {"train_loss": -6.265575885772705, "global_step": 101823, "epoch": 2424} {"train_loss": -6.308863639831543, "global_step": 101824, "epoch": 2424} {"train_loss": -6.408771514892578, "global_step": 101825, "epoch": 2424} {"train_loss": -6.436016082763672, "global_step": 101826, "epoch": 2424} {"train_loss": -6.283392906188965, "global_step": 101827, "epoch": 2424} {"train_loss": -6.456509590148926, "global_step": 101828, "epoch": 2424} {"train_loss": -6.354847431182861, "global_step": 101829, "epoch": 2424} {"train_loss": -6.32090425491333, "global_step": 101830, "epoch": 2424} {"train_loss": -6.390074253082275, "global_step": 101831, "epoch": 2424} {"train_loss": -6.318154335021973, "global_step": 101832, "epoch": 2424} {"train_loss": -6.320088863372803, "global_step": 101833, "epoch": 2424} {"train_loss": -6.3563151359558105, "global_step": 101834, "epoch": 2424} {"train_loss": -6.333560466766357, "global_step": 101835, "epoch": 2424} {"train_loss": -6.36240816116333, "global_step": 101836, "epoch": 2424} {"train_loss": -6.452764511108398, "global_step": 101837, "epoch": 2424} {"train_loss": -6.401226043701172, "global_step": 101838, "epoch": 2424} {"train_loss": -6.368203163146973, "global_step": 101839, "epoch": 2424} {"train_loss": -6.300597190856934, "global_step": 101840, "epoch": 2424} {"train_loss": -6.284826278686523, "global_step": 101841, "epoch": 2424} {"train_loss": -6.236020565032959, "global_step": 101842, "epoch": 2424} {"train_loss": -6.347442626953125, "global_step": 101843, "epoch": 2424} {"train_loss": -6.3437628746032715, "global_step": 101844, "epoch": 2424} {"train_loss": -6.253114223480225, "global_step": 101845, "epoch": 2424} {"train_loss": -6.324420928955078, "global_step": 101846, "epoch": 2424} {"train_loss": -6.330416679382324, "global_step": 101847, "epoch": 2424} {"train_loss": -6.2509002685546875, "global_step": 101848, "epoch": 2424} {"train_loss": -6.33724087760562, "global_step": 101849, "epoch": 2424, "val_loss": 75699.078125} {"train_loss": -6.3873467445373535, "global_step": 101850, "epoch": 2425} {"train_loss": -6.296928405761719, "global_step": 101851, "epoch": 2425} {"train_loss": -6.409756660461426, "global_step": 101852, "epoch": 2425} {"train_loss": -6.314791679382324, "global_step": 101853, "epoch": 2425} {"train_loss": -6.322602272033691, "global_step": 101854, "epoch": 2425} {"train_loss": -6.426446914672852, "global_step": 101855, "epoch": 2425} {"train_loss": -6.475105285644531, "global_step": 101856, "epoch": 2425} {"train_loss": -6.273842811584473, "global_step": 101857, "epoch": 2425} {"train_loss": -6.380007743835449, "global_step": 101858, "epoch": 2425} {"train_loss": -6.412041664123535, "global_step": 101859, "epoch": 2425} {"train_loss": -6.308999061584473, "global_step": 101860, "epoch": 2425} {"train_loss": -6.506081581115723, "global_step": 101861, "epoch": 2425} {"train_loss": -6.413958549499512, "global_step": 101862, "epoch": 2425} {"train_loss": -6.363194942474365, "global_step": 101863, "epoch": 2425} {"train_loss": -6.376089096069336, "global_step": 101864, "epoch": 2425} {"train_loss": -6.302001953125, "global_step": 101865, "epoch": 2425} {"train_loss": -6.469959259033203, "global_step": 101866, "epoch": 2425} {"train_loss": -6.238574981689453, "global_step": 101867, "epoch": 2425} {"train_loss": -6.521177768707275, "global_step": 101868, "epoch": 2425} {"train_loss": -6.414072036743164, "global_step": 101869, "epoch": 2425} {"train_loss": -6.489102840423584, "global_step": 101870, "epoch": 2425} {"train_loss": -6.422759056091309, "global_step": 101871, "epoch": 2425} {"train_loss": -6.314681529998779, "global_step": 101872, "epoch": 2425} {"train_loss": -6.370825290679932, "global_step": 101873, "epoch": 2425} {"train_loss": -6.435669898986816, "global_step": 101874, "epoch": 2425} {"train_loss": -6.369541168212891, "global_step": 101875, "epoch": 2425} {"train_loss": -6.485617637634277, "global_step": 101876, "epoch": 2425} {"train_loss": -6.303839683532715, "global_step": 101877, "epoch": 2425} {"train_loss": -6.320374488830566, "global_step": 101878, "epoch": 2425} {"train_loss": -6.288827419281006, "global_step": 101879, "epoch": 2425} {"train_loss": -6.263914108276367, "global_step": 101880, "epoch": 2425} {"train_loss": -6.362303256988525, "global_step": 101881, "epoch": 2425} {"train_loss": -6.318256378173828, "global_step": 101882, "epoch": 2425} {"train_loss": -6.3918962478637695, "global_step": 101883, "epoch": 2425} {"train_loss": -6.459258079528809, "global_step": 101884, "epoch": 2425} {"train_loss": -6.436052322387695, "global_step": 101885, "epoch": 2425} {"train_loss": -6.343294143676758, "global_step": 101886, "epoch": 2425} {"train_loss": -6.435343265533447, "global_step": 101887, "epoch": 2425} {"train_loss": -6.365789413452148, "global_step": 101888, "epoch": 2425} {"train_loss": -6.307612895965576, "global_step": 101889, "epoch": 2425} {"train_loss": -6.33134126663208, "global_step": 101890, "epoch": 2425} {"train_loss": -6.375684306735084, "global_step": 101891, "epoch": 2425, "val_loss": 75928.828125} {"train_loss": -6.342628479003906, "global_step": 101892, "epoch": 2426} {"train_loss": -6.431402683258057, "global_step": 101893, "epoch": 2426} {"train_loss": -6.398481369018555, "global_step": 101894, "epoch": 2426} {"train_loss": -6.447458744049072, "global_step": 101895, "epoch": 2426} {"train_loss": -6.423257827758789, "global_step": 101896, "epoch": 2426} {"train_loss": -6.347867012023926, "global_step": 101897, "epoch": 2426} {"train_loss": -6.521999359130859, "global_step": 101898, "epoch": 2426} {"train_loss": -6.408915042877197, "global_step": 101899, "epoch": 2426} {"train_loss": -6.361072540283203, "global_step": 101900, "epoch": 2426} {"train_loss": -6.609767913818359, "global_step": 101901, "epoch": 2426} {"train_loss": -6.444059371948242, "global_step": 101902, "epoch": 2426} {"train_loss": -6.357261657714844, "global_step": 101903, "epoch": 2426} {"train_loss": -6.372366905212402, "global_step": 101904, "epoch": 2426} {"train_loss": -6.506095886230469, "global_step": 101905, "epoch": 2426} {"train_loss": -6.365386962890625, "global_step": 101906, "epoch": 2426} {"train_loss": -6.451882362365723, "global_step": 101907, "epoch": 2426} {"train_loss": -6.468191146850586, "global_step": 101908, "epoch": 2426} {"train_loss": -6.320228576660156, "global_step": 101909, "epoch": 2426} {"train_loss": -6.478514671325684, "global_step": 101910, "epoch": 2426} {"train_loss": -6.380819320678711, "global_step": 101911, "epoch": 2426} {"train_loss": -6.407535076141357, "global_step": 101912, "epoch": 2426} {"train_loss": -6.317404270172119, "global_step": 101913, "epoch": 2426} {"train_loss": -6.3477349281311035, "global_step": 101914, "epoch": 2426} {"train_loss": -6.428183555603027, "global_step": 101915, "epoch": 2426} {"train_loss": -6.370237827301025, "global_step": 101916, "epoch": 2426} {"train_loss": -6.364124298095703, "global_step": 101917, "epoch": 2426} {"train_loss": -6.409549713134766, "global_step": 101918, "epoch": 2426} {"train_loss": -6.342897891998291, "global_step": 101919, "epoch": 2426} {"train_loss": -6.45412540435791, "global_step": 101920, "epoch": 2426} {"train_loss": -6.271884441375732, "global_step": 101921, "epoch": 2426} {"train_loss": -6.327139854431152, "global_step": 101922, "epoch": 2426} {"train_loss": -6.368138790130615, "global_step": 101923, "epoch": 2426} {"train_loss": -6.400876998901367, "global_step": 101924, "epoch": 2426} {"train_loss": -6.462790489196777, "global_step": 101925, "epoch": 2426} {"train_loss": -6.430406093597412, "global_step": 101926, "epoch": 2426} {"train_loss": -6.34279727935791, "global_step": 101927, "epoch": 2426} {"train_loss": -6.472655296325684, "global_step": 101928, "epoch": 2426} {"train_loss": -6.469176292419434, "global_step": 101929, "epoch": 2426} {"train_loss": -6.40178108215332, "global_step": 101930, "epoch": 2426} {"train_loss": -6.3249640464782715, "global_step": 101931, "epoch": 2426} {"train_loss": -6.4899187088012695, "global_step": 101932, "epoch": 2426} {"train_loss": -6.4035589808509465, "global_step": 101933, "epoch": 2426, "val_loss": 75731.1640625} {"train_loss": -6.372733116149902, "global_step": 101934, "epoch": 2427} {"train_loss": -6.240598678588867, "global_step": 101935, "epoch": 2427} {"train_loss": -6.3593244552612305, "global_step": 101936, "epoch": 2427} {"train_loss": -6.401883125305176, "global_step": 101937, "epoch": 2427} {"train_loss": -6.3561787605285645, "global_step": 101938, "epoch": 2427} {"train_loss": -6.555670738220215, "global_step": 101939, "epoch": 2427} {"train_loss": -6.504066467285156, "global_step": 101940, "epoch": 2427} {"train_loss": -6.390774250030518, "global_step": 101941, "epoch": 2427} {"train_loss": -6.4438700675964355, "global_step": 101942, "epoch": 2427} {"train_loss": -6.423224925994873, "global_step": 101943, "epoch": 2427} {"train_loss": -6.335136890411377, "global_step": 101944, "epoch": 2427} {"train_loss": -6.426558494567871, "global_step": 101945, "epoch": 2427} {"train_loss": -6.300334453582764, "global_step": 101946, "epoch": 2427} {"train_loss": -6.370426177978516, "global_step": 101947, "epoch": 2427} {"train_loss": -6.402654647827148, "global_step": 101948, "epoch": 2427} {"train_loss": -6.4128522872924805, "global_step": 101949, "epoch": 2427} {"train_loss": -6.3435564041137695, "global_step": 101950, "epoch": 2427} {"train_loss": -6.362338066101074, "global_step": 101951, "epoch": 2427} {"train_loss": -6.335500717163086, "global_step": 101952, "epoch": 2427} {"train_loss": -6.315657615661621, "global_step": 101953, "epoch": 2427} {"train_loss": -6.25726842880249, "global_step": 101954, "epoch": 2427} {"train_loss": -6.342662334442139, "global_step": 101955, "epoch": 2427} {"train_loss": -6.392428398132324, "global_step": 101956, "epoch": 2427} {"train_loss": -6.404999732971191, "global_step": 101957, "epoch": 2427} {"train_loss": -6.39537239074707, "global_step": 101958, "epoch": 2427} {"train_loss": -6.450305938720703, "global_step": 101959, "epoch": 2427} {"train_loss": -6.33944845199585, "global_step": 101960, "epoch": 2427} {"train_loss": -6.294188499450684, "global_step": 101961, "epoch": 2427} {"train_loss": -6.459274768829346, "global_step": 101962, "epoch": 2427} {"train_loss": -6.440598964691162, "global_step": 101963, "epoch": 2427} {"train_loss": -6.456075668334961, "global_step": 101964, "epoch": 2427} {"train_loss": -6.3559699058532715, "global_step": 101965, "epoch": 2427} {"train_loss": -6.377311706542969, "global_step": 101966, "epoch": 2427} {"train_loss": -6.449613094329834, "global_step": 101967, "epoch": 2427} {"train_loss": -6.395320415496826, "global_step": 101968, "epoch": 2427} {"train_loss": -6.504783630371094, "global_step": 101969, "epoch": 2427} {"train_loss": -6.255009174346924, "global_step": 101970, "epoch": 2427} {"train_loss": -6.273033142089844, "global_step": 101971, "epoch": 2427} {"train_loss": -6.437394618988037, "global_step": 101972, "epoch": 2427} {"train_loss": -6.273667335510254, "global_step": 101973, "epoch": 2427} {"train_loss": -6.246829509735107, "global_step": 101974, "epoch": 2427} {"train_loss": -6.3785649708339145, "global_step": 101975, "epoch": 2427, "val_loss": 75895.46875} {"train_loss": -6.4616241455078125, "global_step": 101976, "epoch": 2428} {"train_loss": -6.43399715423584, "global_step": 101977, "epoch": 2428} {"train_loss": -6.378669738769531, "global_step": 101978, "epoch": 2428} {"train_loss": -6.377344131469727, "global_step": 101979, "epoch": 2428} {"train_loss": -6.393551349639893, "global_step": 101980, "epoch": 2428} {"train_loss": -6.313364505767822, "global_step": 101981, "epoch": 2428} {"train_loss": -6.173567295074463, "global_step": 101982, "epoch": 2428} {"train_loss": -6.274316787719727, "global_step": 101983, "epoch": 2428} {"train_loss": -6.342831611633301, "global_step": 101984, "epoch": 2428} {"train_loss": -6.31038761138916, "global_step": 101985, "epoch": 2428} {"train_loss": -6.445976257324219, "global_step": 101986, "epoch": 2428} {"train_loss": -6.344156265258789, "global_step": 101987, "epoch": 2428} {"train_loss": -6.366377830505371, "global_step": 101988, "epoch": 2428} {"train_loss": -6.605348587036133, "global_step": 101989, "epoch": 2428} {"train_loss": -6.412900447845459, "global_step": 101990, "epoch": 2428} {"train_loss": -6.302690505981445, "global_step": 101991, "epoch": 2428} {"train_loss": -6.416927337646484, "global_step": 101992, "epoch": 2428} {"train_loss": -6.3756818771362305, "global_step": 101993, "epoch": 2428} {"train_loss": -6.333415985107422, "global_step": 101994, "epoch": 2428} {"train_loss": -6.401247978210449, "global_step": 101995, "epoch": 2428} {"train_loss": -6.118520259857178, "global_step": 101996, "epoch": 2428} {"train_loss": -6.418718338012695, "global_step": 101997, "epoch": 2428} {"train_loss": -6.322802543640137, "global_step": 101998, "epoch": 2428} {"train_loss": -6.148509979248047, "global_step": 101999, "epoch": 2428} {"train_loss": -6.364819526672363, "global_step": 102000, "epoch": 2428} {"train_loss": -6.225604057312012, "global_step": 102001, "epoch": 2428} {"train_loss": -6.215163230895996, "global_step": 102002, "epoch": 2428} {"train_loss": -6.266627311706543, "global_step": 102003, "epoch": 2428} {"train_loss": -6.350069046020508, "global_step": 102004, "epoch": 2428} {"train_loss": -6.169931411743164, "global_step": 102005, "epoch": 2428} {"train_loss": -6.246748924255371, "global_step": 102006, "epoch": 2428} {"train_loss": -6.190959453582764, "global_step": 102007, "epoch": 2428} {"train_loss": -6.333425521850586, "global_step": 102008, "epoch": 2428} {"train_loss": -6.21939754486084, "global_step": 102009, "epoch": 2428} {"train_loss": -6.165199279785156, "global_step": 102010, "epoch": 2428} {"train_loss": -6.182701110839844, "global_step": 102011, "epoch": 2428} {"train_loss": -6.296323776245117, "global_step": 102012, "epoch": 2428} {"train_loss": -6.213444232940674, "global_step": 102013, "epoch": 2428} {"train_loss": -6.257413864135742, "global_step": 102014, "epoch": 2428} {"train_loss": -6.199456691741943, "global_step": 102015, "epoch": 2428} {"train_loss": -6.349849700927734, "global_step": 102016, "epoch": 2428} {"train_loss": -6.312646809078398, "global_step": 102017, "epoch": 2428, "val_loss": 76118.8515625} {"train_loss": -6.267807960510254, "global_step": 102018, "epoch": 2429} {"train_loss": -6.372814178466797, "global_step": 102019, "epoch": 2429} {"train_loss": -6.318159580230713, "global_step": 102020, "epoch": 2429} {"train_loss": -6.324999809265137, "global_step": 102021, "epoch": 2429} {"train_loss": -6.292483806610107, "global_step": 102022, "epoch": 2429} {"train_loss": -6.206266403198242, "global_step": 102023, "epoch": 2429} {"train_loss": -6.330862998962402, "global_step": 102024, "epoch": 2429} {"train_loss": -6.30849552154541, "global_step": 102025, "epoch": 2429} {"train_loss": -6.366035461425781, "global_step": 102026, "epoch": 2429} {"train_loss": -6.28018856048584, "global_step": 102027, "epoch": 2429} {"train_loss": -6.444768905639648, "global_step": 102028, "epoch": 2429} {"train_loss": -6.290113925933838, "global_step": 102029, "epoch": 2429} {"train_loss": -6.2653913497924805, "global_step": 102030, "epoch": 2429} {"train_loss": -6.2982282638549805, "global_step": 102031, "epoch": 2429} {"train_loss": -6.408154487609863, "global_step": 102032, "epoch": 2429} {"train_loss": -6.404167175292969, "global_step": 102033, "epoch": 2429} {"train_loss": -6.461615562438965, "global_step": 102034, "epoch": 2429} {"train_loss": -6.34559965133667, "global_step": 102035, "epoch": 2429} {"train_loss": -6.483739852905273, "global_step": 102036, "epoch": 2429} {"train_loss": -6.416556358337402, "global_step": 102037, "epoch": 2429} {"train_loss": -6.33894157409668, "global_step": 102038, "epoch": 2429} {"train_loss": -6.405835151672363, "global_step": 102039, "epoch": 2429} {"train_loss": -6.347214698791504, "global_step": 102040, "epoch": 2429} {"train_loss": -6.352766513824463, "global_step": 102041, "epoch": 2429} {"train_loss": -6.392104148864746, "global_step": 102042, "epoch": 2429} {"train_loss": -6.327930450439453, "global_step": 102043, "epoch": 2429} {"train_loss": -6.561437129974365, "global_step": 102044, "epoch": 2429} {"train_loss": -6.433373928070068, "global_step": 102045, "epoch": 2429} {"train_loss": -6.3454108238220215, "global_step": 102046, "epoch": 2429} {"train_loss": -6.3429460525512695, "global_step": 102047, "epoch": 2429} {"train_loss": -6.4386749267578125, "global_step": 102048, "epoch": 2429} {"train_loss": -6.486518859863281, "global_step": 102049, "epoch": 2429} {"train_loss": -6.332780361175537, "global_step": 102050, "epoch": 2429} {"train_loss": -6.522204399108887, "global_step": 102051, "epoch": 2429} {"train_loss": -6.3252854347229, "global_step": 102052, "epoch": 2429} {"train_loss": -6.331104278564453, "global_step": 102053, "epoch": 2429} {"train_loss": -6.418816566467285, "global_step": 102054, "epoch": 2429} {"train_loss": -6.281512260437012, "global_step": 102055, "epoch": 2429} {"train_loss": -6.309254169464111, "global_step": 102056, "epoch": 2429} {"train_loss": -6.407671928405762, "global_step": 102057, "epoch": 2429} {"train_loss": -6.394305229187012, "global_step": 102058, "epoch": 2429} {"train_loss": -6.367533456711542, "global_step": 102059, "epoch": 2429, "val_loss": 75724.625} {"train_loss": -6.491220474243164, "global_step": 102060, "epoch": 2430} {"train_loss": -6.442950248718262, "global_step": 102061, "epoch": 2430} {"train_loss": -6.393908977508545, "global_step": 102062, "epoch": 2430} {"train_loss": -6.493403434753418, "global_step": 102063, "epoch": 2430} {"train_loss": -6.3731889724731445, "global_step": 102064, "epoch": 2430} {"train_loss": -6.2814812660217285, "global_step": 102065, "epoch": 2430} {"train_loss": -6.44658088684082, "global_step": 102066, "epoch": 2430} {"train_loss": -6.487227916717529, "global_step": 102067, "epoch": 2430} {"train_loss": -6.228695869445801, "global_step": 102068, "epoch": 2430} {"train_loss": -6.380563259124756, "global_step": 102069, "epoch": 2430} {"train_loss": -6.3061842918396, "global_step": 102070, "epoch": 2430} {"train_loss": -6.426085472106934, "global_step": 102071, "epoch": 2430} {"train_loss": -6.369715690612793, "global_step": 102072, "epoch": 2430} {"train_loss": -6.422453880310059, "global_step": 102073, "epoch": 2430} {"train_loss": -6.373438835144043, "global_step": 102074, "epoch": 2430} {"train_loss": -6.484080791473389, "global_step": 102075, "epoch": 2430} {"train_loss": -6.4024457931518555, "global_step": 102076, "epoch": 2430} {"train_loss": -6.3744964599609375, "global_step": 102077, "epoch": 2430} {"train_loss": -6.395060062408447, "global_step": 102078, "epoch": 2430} {"train_loss": -6.346080780029297, "global_step": 102079, "epoch": 2430} {"train_loss": -6.255771636962891, "global_step": 102080, "epoch": 2430} {"train_loss": -6.350778579711914, "global_step": 102081, "epoch": 2430} {"train_loss": -6.493072032928467, "global_step": 102082, "epoch": 2430} {"train_loss": -6.3803911209106445, "global_step": 102083, "epoch": 2430} {"train_loss": -6.386322021484375, "global_step": 102084, "epoch": 2430} {"train_loss": -6.385382652282715, "global_step": 102085, "epoch": 2430} {"train_loss": -6.360263347625732, "global_step": 102086, "epoch": 2430} {"train_loss": -6.438736915588379, "global_step": 102087, "epoch": 2430} {"train_loss": -6.443988800048828, "global_step": 102088, "epoch": 2430} {"train_loss": -6.31252908706665, "global_step": 102089, "epoch": 2430} {"train_loss": -6.266687870025635, "global_step": 102090, "epoch": 2430} {"train_loss": -6.252110958099365, "global_step": 102091, "epoch": 2430} {"train_loss": -6.4739837646484375, "global_step": 102092, "epoch": 2430} {"train_loss": -6.289921283721924, "global_step": 102093, "epoch": 2430} {"train_loss": -6.4771728515625, "global_step": 102094, "epoch": 2430} {"train_loss": -6.475383758544922, "global_step": 102095, "epoch": 2430} {"train_loss": -6.449368476867676, "global_step": 102096, "epoch": 2430} {"train_loss": -6.408209800720215, "global_step": 102097, "epoch": 2430} {"train_loss": -6.335682392120361, "global_step": 102098, "epoch": 2430} {"train_loss": -6.425220966339111, "global_step": 102099, "epoch": 2430} {"train_loss": -6.359234809875488, "global_step": 102100, "epoch": 2430} {"train_loss": -6.388422284807477, "global_step": 102101, "epoch": 2430, "val_loss": 75877.171875} {"train_loss": -6.413356304168701, "global_step": 102102, "epoch": 2431} {"train_loss": -6.320464134216309, "global_step": 102103, "epoch": 2431} {"train_loss": -6.482407093048096, "global_step": 102104, "epoch": 2431} {"train_loss": -6.520491600036621, "global_step": 102105, "epoch": 2431} {"train_loss": -6.303231239318848, "global_step": 102106, "epoch": 2431} {"train_loss": -6.393611431121826, "global_step": 102107, "epoch": 2431} {"train_loss": -6.41400146484375, "global_step": 102108, "epoch": 2431} {"train_loss": -6.362188339233398, "global_step": 102109, "epoch": 2431} {"train_loss": -6.345239639282227, "global_step": 102110, "epoch": 2431} {"train_loss": -6.513604164123535, "global_step": 102111, "epoch": 2431} {"train_loss": -6.144462585449219, "global_step": 102112, "epoch": 2431} {"train_loss": -6.285900115966797, "global_step": 102113, "epoch": 2431} {"train_loss": -6.3827128410339355, "global_step": 102114, "epoch": 2431} {"train_loss": -6.290560245513916, "global_step": 102115, "epoch": 2431} {"train_loss": -6.394477844238281, "global_step": 102116, "epoch": 2431} {"train_loss": -6.349138259887695, "global_step": 102117, "epoch": 2431} {"train_loss": -6.2084221839904785, "global_step": 102118, "epoch": 2431} {"train_loss": -6.244235038757324, "global_step": 102119, "epoch": 2431} {"train_loss": -6.448145866394043, "global_step": 102120, "epoch": 2431} {"train_loss": -6.497516632080078, "global_step": 102121, "epoch": 2431} {"train_loss": -6.559506416320801, "global_step": 102122, "epoch": 2431} {"train_loss": -6.351309776306152, "global_step": 102123, "epoch": 2431} {"train_loss": -6.2386884689331055, "global_step": 102124, "epoch": 2431} {"train_loss": -6.386585712432861, "global_step": 102125, "epoch": 2431} {"train_loss": -6.378623962402344, "global_step": 102126, "epoch": 2431} {"train_loss": -6.41853141784668, "global_step": 102127, "epoch": 2431} {"train_loss": -6.472006797790527, "global_step": 102128, "epoch": 2431} {"train_loss": -6.289481163024902, "global_step": 102129, "epoch": 2431} {"train_loss": -6.1904616355896, "global_step": 102130, "epoch": 2431} {"train_loss": -6.36711311340332, "global_step": 102131, "epoch": 2431} {"train_loss": -6.242692470550537, "global_step": 102132, "epoch": 2431} {"train_loss": -6.272353172302246, "global_step": 102133, "epoch": 2431} {"train_loss": -6.486394882202148, "global_step": 102134, "epoch": 2431} {"train_loss": -6.430768013000488, "global_step": 102135, "epoch": 2431} {"train_loss": -6.360240936279297, "global_step": 102136, "epoch": 2431} {"train_loss": -6.479574680328369, "global_step": 102137, "epoch": 2431} {"train_loss": -6.464857578277588, "global_step": 102138, "epoch": 2431} {"train_loss": -6.28178596496582, "global_step": 102139, "epoch": 2431} {"train_loss": -6.38746452331543, "global_step": 102140, "epoch": 2431} {"train_loss": -6.305537700653076, "global_step": 102141, "epoch": 2431} {"train_loss": -6.459298610687256, "global_step": 102142, "epoch": 2431} {"train_loss": -6.367746455328805, "global_step": 102143, "epoch": 2431, "val_loss": 75974.6640625} {"train_loss": -6.385312080383301, "global_step": 102144, "epoch": 2432} {"train_loss": -6.318539619445801, "global_step": 102145, "epoch": 2432} {"train_loss": -6.341848373413086, "global_step": 102146, "epoch": 2432} {"train_loss": -6.314340114593506, "global_step": 102147, "epoch": 2432} {"train_loss": -6.362879753112793, "global_step": 102148, "epoch": 2432} {"train_loss": -6.377595901489258, "global_step": 102149, "epoch": 2432} {"train_loss": -6.378680229187012, "global_step": 102150, "epoch": 2432} {"train_loss": -6.356542587280273, "global_step": 102151, "epoch": 2432} {"train_loss": -6.413786888122559, "global_step": 102152, "epoch": 2432} {"train_loss": -6.422908782958984, "global_step": 102153, "epoch": 2432} {"train_loss": -6.359878063201904, "global_step": 102154, "epoch": 2432} {"train_loss": -6.36382532119751, "global_step": 102155, "epoch": 2432} {"train_loss": -6.353725433349609, "global_step": 102156, "epoch": 2432} {"train_loss": -6.325401306152344, "global_step": 102157, "epoch": 2432} {"train_loss": -6.387607097625732, "global_step": 102158, "epoch": 2432} {"train_loss": -6.368289947509766, "global_step": 102159, "epoch": 2432} {"train_loss": -6.451595306396484, "global_step": 102160, "epoch": 2432} {"train_loss": -6.344962120056152, "global_step": 102161, "epoch": 2432} {"train_loss": -6.43281364440918, "global_step": 102162, "epoch": 2432} {"train_loss": -6.367608070373535, "global_step": 102163, "epoch": 2432} {"train_loss": -6.2888994216918945, "global_step": 102164, "epoch": 2432} {"train_loss": -6.340395927429199, "global_step": 102165, "epoch": 2432} {"train_loss": -6.383275985717773, "global_step": 102166, "epoch": 2432} {"train_loss": -6.298786163330078, "global_step": 102167, "epoch": 2432} {"train_loss": -6.340639114379883, "global_step": 102168, "epoch": 2432} {"train_loss": -6.349979400634766, "global_step": 102169, "epoch": 2432} {"train_loss": -6.386787414550781, "global_step": 102170, "epoch": 2432} {"train_loss": -6.285804748535156, "global_step": 102171, "epoch": 2432} {"train_loss": -6.3620147705078125, "global_step": 102172, "epoch": 2432} {"train_loss": -6.287459373474121, "global_step": 102173, "epoch": 2432} {"train_loss": -6.2713775634765625, "global_step": 102174, "epoch": 2432} {"train_loss": -6.393296718597412, "global_step": 102175, "epoch": 2432} {"train_loss": -6.34420108795166, "global_step": 102176, "epoch": 2432} {"train_loss": -6.407595157623291, "global_step": 102177, "epoch": 2432} {"train_loss": -6.281998634338379, "global_step": 102178, "epoch": 2432} {"train_loss": -6.268404960632324, "global_step": 102179, "epoch": 2432} {"train_loss": -6.458922386169434, "global_step": 102180, "epoch": 2432} {"train_loss": -6.433236598968506, "global_step": 102181, "epoch": 2432} {"train_loss": -6.3691205978393555, "global_step": 102182, "epoch": 2432} {"train_loss": -6.399317741394043, "global_step": 102183, "epoch": 2432} {"train_loss": -6.3527398109436035, "global_step": 102184, "epoch": 2432} {"train_loss": -6.361239887419201, "global_step": 102185, "epoch": 2432, "val_loss": 76178.53125} {"train_loss": -6.456944465637207, "global_step": 102186, "epoch": 2433} {"train_loss": -6.473570823669434, "global_step": 102187, "epoch": 2433} {"train_loss": -6.434545516967773, "global_step": 102188, "epoch": 2433} {"train_loss": -6.375332832336426, "global_step": 102189, "epoch": 2433} {"train_loss": -6.4579057693481445, "global_step": 102190, "epoch": 2433} {"train_loss": -6.466604232788086, "global_step": 102191, "epoch": 2433} {"train_loss": -6.40891695022583, "global_step": 102192, "epoch": 2433} {"train_loss": -6.404961585998535, "global_step": 102193, "epoch": 2433} {"train_loss": -6.446211814880371, "global_step": 102194, "epoch": 2433} {"train_loss": -6.353892803192139, "global_step": 102195, "epoch": 2433} {"train_loss": -6.419075965881348, "global_step": 102196, "epoch": 2433} {"train_loss": -6.337818622589111, "global_step": 102197, "epoch": 2433} {"train_loss": -6.375579833984375, "global_step": 102198, "epoch": 2433} {"train_loss": -6.427739143371582, "global_step": 102199, "epoch": 2433} {"train_loss": -6.361784934997559, "global_step": 102200, "epoch": 2433} {"train_loss": -6.404177665710449, "global_step": 102201, "epoch": 2433} {"train_loss": -6.474896430969238, "global_step": 102202, "epoch": 2433} {"train_loss": -6.420382499694824, "global_step": 102203, "epoch": 2433} {"train_loss": -6.341318130493164, "global_step": 102204, "epoch": 2433} {"train_loss": -6.509466171264648, "global_step": 102205, "epoch": 2433} {"train_loss": -6.3503265380859375, "global_step": 102206, "epoch": 2433} {"train_loss": -6.136795997619629, "global_step": 102207, "epoch": 2433} {"train_loss": -6.333357810974121, "global_step": 102208, "epoch": 2433} {"train_loss": -6.246550559997559, "global_step": 102209, "epoch": 2433} {"train_loss": -6.367077827453613, "global_step": 102210, "epoch": 2433} {"train_loss": -6.41827392578125, "global_step": 102211, "epoch": 2433} {"train_loss": -6.325514793395996, "global_step": 102212, "epoch": 2433} {"train_loss": -6.424577713012695, "global_step": 102213, "epoch": 2433} {"train_loss": -6.2634382247924805, "global_step": 102214, "epoch": 2433} {"train_loss": -6.38238525390625, "global_step": 102215, "epoch": 2433} {"train_loss": -6.355904579162598, "global_step": 102216, "epoch": 2433} {"train_loss": -6.308128833770752, "global_step": 102217, "epoch": 2433} {"train_loss": -6.444189071655273, "global_step": 102218, "epoch": 2433} {"train_loss": -6.365762710571289, "global_step": 102219, "epoch": 2433} {"train_loss": -6.402602195739746, "global_step": 102220, "epoch": 2433} {"train_loss": -6.436074733734131, "global_step": 102221, "epoch": 2433} {"train_loss": -6.519068241119385, "global_step": 102222, "epoch": 2433} {"train_loss": -6.483917713165283, "global_step": 102223, "epoch": 2433} {"train_loss": -6.373924255371094, "global_step": 102224, "epoch": 2433} {"train_loss": -6.514827728271484, "global_step": 102225, "epoch": 2433} {"train_loss": -6.4270124435424805, "global_step": 102226, "epoch": 2433} {"train_loss": -6.393725304376511, "global_step": 102227, "epoch": 2433, "val_loss": 76084.40625} {"train_loss": -6.468297004699707, "global_step": 102228, "epoch": 2434} {"train_loss": -6.449243545532227, "global_step": 102229, "epoch": 2434} {"train_loss": -6.448076248168945, "global_step": 102230, "epoch": 2434} {"train_loss": -6.35214376449585, "global_step": 102231, "epoch": 2434} {"train_loss": -6.387429237365723, "global_step": 102232, "epoch": 2434} {"train_loss": -6.4175190925598145, "global_step": 102233, "epoch": 2434} {"train_loss": -6.434535503387451, "global_step": 102234, "epoch": 2434} {"train_loss": -6.4068989753723145, "global_step": 102235, "epoch": 2434} {"train_loss": -6.409371376037598, "global_step": 102236, "epoch": 2434} {"train_loss": -6.463497161865234, "global_step": 102237, "epoch": 2434} {"train_loss": -6.319431781768799, "global_step": 102238, "epoch": 2434} {"train_loss": -6.408722877502441, "global_step": 102239, "epoch": 2434} {"train_loss": -6.376936912536621, "global_step": 102240, "epoch": 2434} {"train_loss": -6.258540153503418, "global_step": 102241, "epoch": 2434} {"train_loss": -6.340010643005371, "global_step": 102242, "epoch": 2434} {"train_loss": -6.400455474853516, "global_step": 102243, "epoch": 2434} {"train_loss": -6.394399642944336, "global_step": 102244, "epoch": 2434} {"train_loss": -6.377553939819336, "global_step": 102245, "epoch": 2434} {"train_loss": -6.344243049621582, "global_step": 102246, "epoch": 2434} {"train_loss": -6.383549690246582, "global_step": 102247, "epoch": 2434} {"train_loss": -6.344303131103516, "global_step": 102248, "epoch": 2434} {"train_loss": -6.364830017089844, "global_step": 102249, "epoch": 2434} {"train_loss": -6.3866448402404785, "global_step": 102250, "epoch": 2434} {"train_loss": -6.452271461486816, "global_step": 102251, "epoch": 2434} {"train_loss": -6.356780052185059, "global_step": 102252, "epoch": 2434} {"train_loss": -6.468191146850586, "global_step": 102253, "epoch": 2434} {"train_loss": -6.348461627960205, "global_step": 102254, "epoch": 2434} {"train_loss": -6.428542137145996, "global_step": 102255, "epoch": 2434} {"train_loss": -6.393563747406006, "global_step": 102256, "epoch": 2434} {"train_loss": -6.500522613525391, "global_step": 102257, "epoch": 2434} {"train_loss": -6.387228965759277, "global_step": 102258, "epoch": 2434} {"train_loss": -6.369537830352783, "global_step": 102259, "epoch": 2434} {"train_loss": -6.5018310546875, "global_step": 102260, "epoch": 2434} {"train_loss": -6.459833145141602, "global_step": 102261, "epoch": 2434} {"train_loss": -6.58428955078125, "global_step": 102262, "epoch": 2434} {"train_loss": -6.411785125732422, "global_step": 102263, "epoch": 2434} {"train_loss": -6.451169013977051, "global_step": 102264, "epoch": 2434} {"train_loss": -6.406799793243408, "global_step": 102265, "epoch": 2434} {"train_loss": -6.393148422241211, "global_step": 102266, "epoch": 2434} {"train_loss": -6.300653457641602, "global_step": 102267, "epoch": 2434} {"train_loss": -6.365967750549316, "global_step": 102268, "epoch": 2434} {"train_loss": -6.402679295766921, "global_step": 102269, "epoch": 2434, "val_loss": 75975.578125} {"train_loss": -6.428251266479492, "global_step": 102270, "epoch": 2435} {"train_loss": -6.3998003005981445, "global_step": 102271, "epoch": 2435} {"train_loss": -6.4417266845703125, "global_step": 102272, "epoch": 2435} {"train_loss": -6.442357063293457, "global_step": 102273, "epoch": 2435} {"train_loss": -6.346196174621582, "global_step": 102274, "epoch": 2435} {"train_loss": -6.304625988006592, "global_step": 102275, "epoch": 2435} {"train_loss": -6.465195178985596, "global_step": 102276, "epoch": 2435} {"train_loss": -6.513087749481201, "global_step": 102277, "epoch": 2435} {"train_loss": -6.436640739440918, "global_step": 102278, "epoch": 2435} {"train_loss": -6.416338920593262, "global_step": 102279, "epoch": 2435} {"train_loss": -6.483705997467041, "global_step": 102280, "epoch": 2435} {"train_loss": -6.316366195678711, "global_step": 102281, "epoch": 2435} {"train_loss": -6.405604362487793, "global_step": 102282, "epoch": 2435} {"train_loss": -6.457812786102295, "global_step": 102283, "epoch": 2435} {"train_loss": -6.342461585998535, "global_step": 102284, "epoch": 2435} {"train_loss": -6.452964782714844, "global_step": 102285, "epoch": 2435} {"train_loss": -6.551119327545166, "global_step": 102286, "epoch": 2435} {"train_loss": -6.292792320251465, "global_step": 102287, "epoch": 2435} {"train_loss": -6.45888614654541, "global_step": 102288, "epoch": 2435} {"train_loss": -6.339295387268066, "global_step": 102289, "epoch": 2435} {"train_loss": -6.314281463623047, "global_step": 102290, "epoch": 2435} {"train_loss": -6.3117780685424805, "global_step": 102291, "epoch": 2435} {"train_loss": -6.479707717895508, "global_step": 102292, "epoch": 2435} {"train_loss": -6.358912467956543, "global_step": 102293, "epoch": 2435} {"train_loss": -6.4601945877075195, "global_step": 102294, "epoch": 2435} {"train_loss": -6.2794036865234375, "global_step": 102295, "epoch": 2435} {"train_loss": -6.281703472137451, "global_step": 102296, "epoch": 2435} {"train_loss": -6.388502597808838, "global_step": 102297, "epoch": 2435} {"train_loss": -6.222227096557617, "global_step": 102298, "epoch": 2435} {"train_loss": -6.388769626617432, "global_step": 102299, "epoch": 2435} {"train_loss": -6.3167219161987305, "global_step": 102300, "epoch": 2435} {"train_loss": -6.324372291564941, "global_step": 102301, "epoch": 2435} {"train_loss": -6.331729888916016, "global_step": 102302, "epoch": 2435} {"train_loss": -6.482585906982422, "global_step": 102303, "epoch": 2435} {"train_loss": -6.383761405944824, "global_step": 102304, "epoch": 2435} {"train_loss": -6.305898666381836, "global_step": 102305, "epoch": 2435} {"train_loss": -6.32102632522583, "global_step": 102306, "epoch": 2435} {"train_loss": -6.311845779418945, "global_step": 102307, "epoch": 2435} {"train_loss": -6.313995361328125, "global_step": 102308, "epoch": 2435} {"train_loss": -6.329242706298828, "global_step": 102309, "epoch": 2435} {"train_loss": -6.329850196838379, "global_step": 102310, "epoch": 2435} {"train_loss": -6.377396197546096, "global_step": 102311, "epoch": 2435, "val_loss": 76062.359375} {"train_loss": -6.326866626739502, "global_step": 102312, "epoch": 2436} {"train_loss": -6.318663597106934, "global_step": 102313, "epoch": 2436} {"train_loss": -6.34564208984375, "global_step": 102314, "epoch": 2436} {"train_loss": -6.296844482421875, "global_step": 102315, "epoch": 2436} {"train_loss": -6.315090179443359, "global_step": 102316, "epoch": 2436} {"train_loss": -6.2978620529174805, "global_step": 102317, "epoch": 2436} {"train_loss": -6.331551551818848, "global_step": 102318, "epoch": 2436} {"train_loss": -6.292421340942383, "global_step": 102319, "epoch": 2436} {"train_loss": -6.397384166717529, "global_step": 102320, "epoch": 2436} {"train_loss": -6.388307571411133, "global_step": 102321, "epoch": 2436} {"train_loss": -6.343735694885254, "global_step": 102322, "epoch": 2436} {"train_loss": -6.329868793487549, "global_step": 102323, "epoch": 2436} {"train_loss": -6.360709190368652, "global_step": 102324, "epoch": 2436} {"train_loss": -6.439938545227051, "global_step": 102325, "epoch": 2436} {"train_loss": -6.324505805969238, "global_step": 102326, "epoch": 2436} {"train_loss": -6.497363090515137, "global_step": 102327, "epoch": 2436} {"train_loss": -6.386906623840332, "global_step": 102328, "epoch": 2436} {"train_loss": -6.3432769775390625, "global_step": 102329, "epoch": 2436} {"train_loss": -6.399613380432129, "global_step": 102330, "epoch": 2436} {"train_loss": -6.320545196533203, "global_step": 102331, "epoch": 2436} {"train_loss": -6.370160102844238, "global_step": 102332, "epoch": 2436} {"train_loss": -6.332893371582031, "global_step": 102333, "epoch": 2436} {"train_loss": -6.4326491355896, "global_step": 102334, "epoch": 2436} {"train_loss": -6.421543121337891, "global_step": 102335, "epoch": 2436} {"train_loss": -6.390484809875488, "global_step": 102336, "epoch": 2436} {"train_loss": -6.451201915740967, "global_step": 102337, "epoch": 2436} {"train_loss": -6.402554512023926, "global_step": 102338, "epoch": 2436} {"train_loss": -6.4481892585754395, "global_step": 102339, "epoch": 2436} {"train_loss": -6.410632133483887, "global_step": 102340, "epoch": 2436} {"train_loss": -6.337263584136963, "global_step": 102341, "epoch": 2436} {"train_loss": -6.405916213989258, "global_step": 102342, "epoch": 2436} {"train_loss": -6.360628128051758, "global_step": 102343, "epoch": 2436} {"train_loss": -6.363826274871826, "global_step": 102344, "epoch": 2436} {"train_loss": -6.376290321350098, "global_step": 102345, "epoch": 2436} {"train_loss": -6.283976078033447, "global_step": 102346, "epoch": 2436} {"train_loss": -6.383339881896973, "global_step": 102347, "epoch": 2436} {"train_loss": -6.319725036621094, "global_step": 102348, "epoch": 2436} {"train_loss": -6.332819938659668, "global_step": 102349, "epoch": 2436} {"train_loss": -6.3313422203063965, "global_step": 102350, "epoch": 2436} {"train_loss": -6.309459686279297, "global_step": 102351, "epoch": 2436} {"train_loss": -6.347119331359863, "global_step": 102352, "epoch": 2436} {"train_loss": -6.363805566515241, "global_step": 102353, "epoch": 2436, "val_loss": 75890.2109375} {"train_loss": -6.317194938659668, "global_step": 102354, "epoch": 2437} {"train_loss": -6.416991710662842, "global_step": 102355, "epoch": 2437} {"train_loss": -6.46497106552124, "global_step": 102356, "epoch": 2437} {"train_loss": -6.400370121002197, "global_step": 102357, "epoch": 2437} {"train_loss": -6.405308246612549, "global_step": 102358, "epoch": 2437} {"train_loss": -6.455357551574707, "global_step": 102359, "epoch": 2437} {"train_loss": -6.455179691314697, "global_step": 102360, "epoch": 2437} {"train_loss": -6.435181617736816, "global_step": 102361, "epoch": 2437} {"train_loss": -6.334339141845703, "global_step": 102362, "epoch": 2437} {"train_loss": -6.495222568511963, "global_step": 102363, "epoch": 2437} {"train_loss": -6.356395721435547, "global_step": 102364, "epoch": 2437} {"train_loss": -6.246006488800049, "global_step": 102365, "epoch": 2437} {"train_loss": -6.465778827667236, "global_step": 102366, "epoch": 2437} {"train_loss": -6.354689598083496, "global_step": 102367, "epoch": 2437} {"train_loss": -6.436216354370117, "global_step": 102368, "epoch": 2437} {"train_loss": -6.240447044372559, "global_step": 102369, "epoch": 2437} {"train_loss": -6.304897785186768, "global_step": 102370, "epoch": 2437} {"train_loss": -6.338097095489502, "global_step": 102371, "epoch": 2437} {"train_loss": -6.36566162109375, "global_step": 102372, "epoch": 2437} {"train_loss": -6.4251604080200195, "global_step": 102373, "epoch": 2437} {"train_loss": -6.331020355224609, "global_step": 102374, "epoch": 2437} {"train_loss": -6.257328510284424, "global_step": 102375, "epoch": 2437} {"train_loss": -6.442683219909668, "global_step": 102376, "epoch": 2437} {"train_loss": -6.230032920837402, "global_step": 102377, "epoch": 2437} {"train_loss": -6.3909430503845215, "global_step": 102378, "epoch": 2437} {"train_loss": -6.335847854614258, "global_step": 102379, "epoch": 2437} {"train_loss": -6.260632514953613, "global_step": 102380, "epoch": 2437} {"train_loss": -6.279707431793213, "global_step": 102381, "epoch": 2437} {"train_loss": -6.123180866241455, "global_step": 102382, "epoch": 2437} {"train_loss": -6.409448623657227, "global_step": 102383, "epoch": 2437} {"train_loss": -6.303343772888184, "global_step": 102384, "epoch": 2437} {"train_loss": -6.151119232177734, "global_step": 102385, "epoch": 2437} {"train_loss": -6.348745822906494, "global_step": 102386, "epoch": 2437} {"train_loss": -6.280109882354736, "global_step": 102387, "epoch": 2437} {"train_loss": -6.3293914794921875, "global_step": 102388, "epoch": 2437} {"train_loss": -6.183723449707031, "global_step": 102389, "epoch": 2437} {"train_loss": -6.462189674377441, "global_step": 102390, "epoch": 2437} {"train_loss": -6.269460678100586, "global_step": 102391, "epoch": 2437} {"train_loss": -6.400297164916992, "global_step": 102392, "epoch": 2437} {"train_loss": -6.259652137756348, "global_step": 102393, "epoch": 2437} {"train_loss": -6.27117395401001, "global_step": 102394, "epoch": 2437} {"train_loss": -6.3420850322360085, "global_step": 102395, "epoch": 2437, "val_loss": 76122.0390625} {"train_loss": -6.3443450927734375, "global_step": 102396, "epoch": 2438} {"train_loss": -6.390944004058838, "global_step": 102397, "epoch": 2438} {"train_loss": -6.297089576721191, "global_step": 102398, "epoch": 2438} {"train_loss": -6.463986873626709, "global_step": 102399, "epoch": 2438} {"train_loss": -6.36904239654541, "global_step": 102400, "epoch": 2438} {"train_loss": -6.39527702331543, "global_step": 102401, "epoch": 2438} {"train_loss": -6.522498607635498, "global_step": 102402, "epoch": 2438} {"train_loss": -6.19215202331543, "global_step": 102403, "epoch": 2438} {"train_loss": -6.389697074890137, "global_step": 102404, "epoch": 2438} {"train_loss": -6.50514030456543, "global_step": 102405, "epoch": 2438} {"train_loss": -6.300407409667969, "global_step": 102406, "epoch": 2438} {"train_loss": -6.386052131652832, "global_step": 102407, "epoch": 2438} {"train_loss": -6.331782341003418, "global_step": 102408, "epoch": 2438} {"train_loss": -6.4498291015625, "global_step": 102409, "epoch": 2438} {"train_loss": -6.289353847503662, "global_step": 102410, "epoch": 2438} {"train_loss": -6.40617561340332, "global_step": 102411, "epoch": 2438} {"train_loss": -6.397191047668457, "global_step": 102412, "epoch": 2438} {"train_loss": -6.464599609375, "global_step": 102413, "epoch": 2438} {"train_loss": -6.393836975097656, "global_step": 102414, "epoch": 2438} {"train_loss": -6.332058906555176, "global_step": 102415, "epoch": 2438} {"train_loss": -6.25942325592041, "global_step": 102416, "epoch": 2438} {"train_loss": -6.361912727355957, "global_step": 102417, "epoch": 2438} {"train_loss": -6.283254146575928, "global_step": 102418, "epoch": 2438} {"train_loss": -6.271726608276367, "global_step": 102419, "epoch": 2438} {"train_loss": -6.396646976470947, "global_step": 102420, "epoch": 2438} {"train_loss": -6.322131156921387, "global_step": 102421, "epoch": 2438} {"train_loss": -6.435290336608887, "global_step": 102422, "epoch": 2438} {"train_loss": -6.197242736816406, "global_step": 102423, "epoch": 2438} {"train_loss": -6.391458988189697, "global_step": 102424, "epoch": 2438} {"train_loss": -6.546879768371582, "global_step": 102425, "epoch": 2438} {"train_loss": -6.4528279304504395, "global_step": 102426, "epoch": 2438} {"train_loss": -6.281564712524414, "global_step": 102427, "epoch": 2438} {"train_loss": -6.357494354248047, "global_step": 102428, "epoch": 2438} {"train_loss": -6.323999404907227, "global_step": 102429, "epoch": 2438} {"train_loss": -6.363905906677246, "global_step": 102430, "epoch": 2438} {"train_loss": -6.458047389984131, "global_step": 102431, "epoch": 2438} {"train_loss": -6.381171226501465, "global_step": 102432, "epoch": 2438} {"train_loss": -6.364436149597168, "global_step": 102433, "epoch": 2438} {"train_loss": -6.360684394836426, "global_step": 102434, "epoch": 2438} {"train_loss": -6.307188034057617, "global_step": 102435, "epoch": 2438} {"train_loss": -6.304864883422852, "global_step": 102436, "epoch": 2438} {"train_loss": -6.3686316921597435, "global_step": 102437, "epoch": 2438, "val_loss": 75955.2421875} {"train_loss": -6.371173858642578, "global_step": 102438, "epoch": 2439} {"train_loss": -6.369074821472168, "global_step": 102439, "epoch": 2439} {"train_loss": -6.430211067199707, "global_step": 102440, "epoch": 2439} {"train_loss": -6.372213363647461, "global_step": 102441, "epoch": 2439} {"train_loss": -6.453635215759277, "global_step": 102442, "epoch": 2439} {"train_loss": -6.234485626220703, "global_step": 102443, "epoch": 2439} {"train_loss": -6.413022041320801, "global_step": 102444, "epoch": 2439} {"train_loss": -6.334078788757324, "global_step": 102445, "epoch": 2439} {"train_loss": -6.399157524108887, "global_step": 102446, "epoch": 2439} {"train_loss": -6.327669143676758, "global_step": 102447, "epoch": 2439} {"train_loss": -6.365124225616455, "global_step": 102448, "epoch": 2439} {"train_loss": -6.5027031898498535, "global_step": 102449, "epoch": 2439} {"train_loss": -6.255126953125, "global_step": 102450, "epoch": 2439} {"train_loss": -6.2599897384643555, "global_step": 102451, "epoch": 2439} {"train_loss": -6.438687324523926, "global_step": 102452, "epoch": 2439} {"train_loss": -6.373518943786621, "global_step": 102453, "epoch": 2439} {"train_loss": -6.424831390380859, "global_step": 102454, "epoch": 2439} {"train_loss": -6.4483137130737305, "global_step": 102455, "epoch": 2439} {"train_loss": -6.394384384155273, "global_step": 102456, "epoch": 2439} {"train_loss": -6.4400634765625, "global_step": 102457, "epoch": 2439} {"train_loss": -6.347531795501709, "global_step": 102458, "epoch": 2439} {"train_loss": -6.406329154968262, "global_step": 102459, "epoch": 2439} {"train_loss": -6.435398101806641, "global_step": 102460, "epoch": 2439} {"train_loss": -6.459853172302246, "global_step": 102461, "epoch": 2439} {"train_loss": -6.469437122344971, "global_step": 102462, "epoch": 2439} {"train_loss": -6.358806610107422, "global_step": 102463, "epoch": 2439} {"train_loss": -6.417874336242676, "global_step": 102464, "epoch": 2439} {"train_loss": -6.4093403816223145, "global_step": 102465, "epoch": 2439} {"train_loss": -6.307672023773193, "global_step": 102466, "epoch": 2439} {"train_loss": -6.396739482879639, "global_step": 102467, "epoch": 2439} {"train_loss": -6.255288600921631, "global_step": 102468, "epoch": 2439} {"train_loss": -6.3469977378845215, "global_step": 102469, "epoch": 2439} {"train_loss": -6.431761741638184, "global_step": 102470, "epoch": 2439} {"train_loss": -6.290755748748779, "global_step": 102471, "epoch": 2439} {"train_loss": -6.340648174285889, "global_step": 102472, "epoch": 2439} {"train_loss": -6.2661309242248535, "global_step": 102473, "epoch": 2439} {"train_loss": -6.246432781219482, "global_step": 102474, "epoch": 2439} {"train_loss": -6.435924530029297, "global_step": 102475, "epoch": 2439} {"train_loss": -6.15593957901001, "global_step": 102476, "epoch": 2439} {"train_loss": -6.348176002502441, "global_step": 102477, "epoch": 2439} {"train_loss": -6.225569725036621, "global_step": 102478, "epoch": 2439} {"train_loss": -6.3620837188902355, "global_step": 102479, "epoch": 2439, "val_loss": 76097.5} {"train_loss": -6.41628360748291, "global_step": 102480, "epoch": 2440} {"train_loss": -6.241189956665039, "global_step": 102481, "epoch": 2440} {"train_loss": -6.289482116699219, "global_step": 102482, "epoch": 2440} {"train_loss": -6.262333869934082, "global_step": 102483, "epoch": 2440} {"train_loss": -6.325666427612305, "global_step": 102484, "epoch": 2440} {"train_loss": -6.191343784332275, "global_step": 102485, "epoch": 2440} {"train_loss": -6.343618869781494, "global_step": 102486, "epoch": 2440} {"train_loss": -6.309098243713379, "global_step": 102487, "epoch": 2440} {"train_loss": -6.460564613342285, "global_step": 102488, "epoch": 2440} {"train_loss": -6.267852783203125, "global_step": 102489, "epoch": 2440} {"train_loss": -6.376673221588135, "global_step": 102490, "epoch": 2440} {"train_loss": -6.247597694396973, "global_step": 102491, "epoch": 2440} {"train_loss": -6.401871681213379, "global_step": 102492, "epoch": 2440} {"train_loss": -6.323685646057129, "global_step": 102493, "epoch": 2440} {"train_loss": -6.365283012390137, "global_step": 102494, "epoch": 2440} {"train_loss": -6.320733547210693, "global_step": 102495, "epoch": 2440} {"train_loss": -6.3879241943359375, "global_step": 102496, "epoch": 2440} {"train_loss": -6.432879447937012, "global_step": 102497, "epoch": 2440} {"train_loss": -6.2713541984558105, "global_step": 102498, "epoch": 2440} {"train_loss": -6.360886573791504, "global_step": 102499, "epoch": 2440} {"train_loss": -6.386802673339844, "global_step": 102500, "epoch": 2440} {"train_loss": -6.407141208648682, "global_step": 102501, "epoch": 2440} {"train_loss": -6.3278326988220215, "global_step": 102502, "epoch": 2440} {"train_loss": -6.377749443054199, "global_step": 102503, "epoch": 2440} {"train_loss": -6.334120750427246, "global_step": 102504, "epoch": 2440} {"train_loss": -6.397700309753418, "global_step": 102505, "epoch": 2440} {"train_loss": -6.286388397216797, "global_step": 102506, "epoch": 2440} {"train_loss": -6.394628047943115, "global_step": 102507, "epoch": 2440} {"train_loss": -6.2179460525512695, "global_step": 102508, "epoch": 2440} {"train_loss": -6.361013412475586, "global_step": 102509, "epoch": 2440} {"train_loss": -6.461756706237793, "global_step": 102510, "epoch": 2440} {"train_loss": -6.4110212326049805, "global_step": 102511, "epoch": 2440} {"train_loss": -6.419575214385986, "global_step": 102512, "epoch": 2440} {"train_loss": -6.462333679199219, "global_step": 102513, "epoch": 2440} {"train_loss": -6.325899124145508, "global_step": 102514, "epoch": 2440} {"train_loss": -6.456101417541504, "global_step": 102515, "epoch": 2440} {"train_loss": -6.355371475219727, "global_step": 102516, "epoch": 2440} {"train_loss": -6.405550003051758, "global_step": 102517, "epoch": 2440} {"train_loss": -6.331754684448242, "global_step": 102518, "epoch": 2440} {"train_loss": -6.360601425170898, "global_step": 102519, "epoch": 2440} {"train_loss": -6.4893951416015625, "global_step": 102520, "epoch": 2440} {"train_loss": -6.3567058472406295, "global_step": 102521, "epoch": 2440, "val_loss": 76171.328125} {"train_loss": -6.4992451667785645, "global_step": 102522, "epoch": 2441} {"train_loss": -6.342954635620117, "global_step": 102523, "epoch": 2441} {"train_loss": -6.331414699554443, "global_step": 102524, "epoch": 2441} {"train_loss": -6.297706604003906, "global_step": 102525, "epoch": 2441} {"train_loss": -6.364809513092041, "global_step": 102526, "epoch": 2441} {"train_loss": -6.299589157104492, "global_step": 102527, "epoch": 2441} {"train_loss": -6.471771240234375, "global_step": 102528, "epoch": 2441} {"train_loss": -6.264707565307617, "global_step": 102529, "epoch": 2441} {"train_loss": -6.3566741943359375, "global_step": 102530, "epoch": 2441} {"train_loss": -6.429100036621094, "global_step": 102531, "epoch": 2441} {"train_loss": -6.360395431518555, "global_step": 102532, "epoch": 2441} {"train_loss": -6.412999629974365, "global_step": 102533, "epoch": 2441} {"train_loss": -6.369704246520996, "global_step": 102534, "epoch": 2441} {"train_loss": -6.435691833496094, "global_step": 102535, "epoch": 2441} {"train_loss": -6.490312576293945, "global_step": 102536, "epoch": 2441} {"train_loss": -6.322673797607422, "global_step": 102537, "epoch": 2441} {"train_loss": -6.5308380126953125, "global_step": 102538, "epoch": 2441} {"train_loss": -6.349016189575195, "global_step": 102539, "epoch": 2441} {"train_loss": -6.251319885253906, "global_step": 102540, "epoch": 2441} {"train_loss": -6.311275482177734, "global_step": 102541, "epoch": 2441} {"train_loss": -6.222671985626221, "global_step": 102542, "epoch": 2441} {"train_loss": -6.336637496948242, "global_step": 102543, "epoch": 2441} {"train_loss": -6.36952018737793, "global_step": 102544, "epoch": 2441} {"train_loss": -6.335850715637207, "global_step": 102545, "epoch": 2441} {"train_loss": -6.444478988647461, "global_step": 102546, "epoch": 2441} {"train_loss": -6.367069244384766, "global_step": 102547, "epoch": 2441} {"train_loss": -6.31001091003418, "global_step": 102548, "epoch": 2441} {"train_loss": -6.378055572509766, "global_step": 102549, "epoch": 2441} {"train_loss": -6.42292594909668, "global_step": 102550, "epoch": 2441} {"train_loss": -6.317535400390625, "global_step": 102551, "epoch": 2441} {"train_loss": -6.28726863861084, "global_step": 102552, "epoch": 2441} {"train_loss": -6.373212814331055, "global_step": 102553, "epoch": 2441} {"train_loss": -6.378810882568359, "global_step": 102554, "epoch": 2441} {"train_loss": -6.431605815887451, "global_step": 102555, "epoch": 2441} {"train_loss": -6.334664344787598, "global_step": 102556, "epoch": 2441} {"train_loss": -6.351363182067871, "global_step": 102557, "epoch": 2441} {"train_loss": -6.335610866546631, "global_step": 102558, "epoch": 2441} {"train_loss": -6.392110824584961, "global_step": 102559, "epoch": 2441} {"train_loss": -6.359960556030273, "global_step": 102560, "epoch": 2441} {"train_loss": -6.455113410949707, "global_step": 102561, "epoch": 2441} {"train_loss": -6.298519611358643, "global_step": 102562, "epoch": 2441} {"train_loss": -6.365151348568144, "global_step": 102563, "epoch": 2441, "val_loss": 75697.515625} {"train_loss": -6.435044288635254, "global_step": 102564, "epoch": 2442} {"train_loss": -6.538476943969727, "global_step": 102565, "epoch": 2442} {"train_loss": -6.368043899536133, "global_step": 102566, "epoch": 2442} {"train_loss": -6.442355632781982, "global_step": 102567, "epoch": 2442} {"train_loss": -6.416055679321289, "global_step": 102568, "epoch": 2442} {"train_loss": -6.382440567016602, "global_step": 102569, "epoch": 2442} {"train_loss": -6.459393501281738, "global_step": 102570, "epoch": 2442} {"train_loss": -6.451645374298096, "global_step": 102571, "epoch": 2442} {"train_loss": -6.460578441619873, "global_step": 102572, "epoch": 2442} {"train_loss": -6.450231075286865, "global_step": 102573, "epoch": 2442} {"train_loss": -6.440382480621338, "global_step": 102574, "epoch": 2442} {"train_loss": -6.438930511474609, "global_step": 102575, "epoch": 2442} {"train_loss": -6.376077651977539, "global_step": 102576, "epoch": 2442} {"train_loss": -6.419712066650391, "global_step": 102577, "epoch": 2442} {"train_loss": -6.336620330810547, "global_step": 102578, "epoch": 2442} {"train_loss": -6.339804649353027, "global_step": 102579, "epoch": 2442} {"train_loss": -6.4166107177734375, "global_step": 102580, "epoch": 2442} {"train_loss": -6.396535873413086, "global_step": 102581, "epoch": 2442} {"train_loss": -6.282346725463867, "global_step": 102582, "epoch": 2442} {"train_loss": -6.405634880065918, "global_step": 102583, "epoch": 2442} {"train_loss": -6.407529830932617, "global_step": 102584, "epoch": 2442} {"train_loss": -6.44078254699707, "global_step": 102585, "epoch": 2442} {"train_loss": -6.441971778869629, "global_step": 102586, "epoch": 2442} {"train_loss": -6.404623031616211, "global_step": 102587, "epoch": 2442} {"train_loss": -6.416590213775635, "global_step": 102588, "epoch": 2442} {"train_loss": -6.376490592956543, "global_step": 102589, "epoch": 2442} {"train_loss": -6.322756767272949, "global_step": 102590, "epoch": 2442} {"train_loss": -6.4647746086120605, "global_step": 102591, "epoch": 2442} {"train_loss": -6.362149238586426, "global_step": 102592, "epoch": 2442} {"train_loss": -6.387954235076904, "global_step": 102593, "epoch": 2442} {"train_loss": -6.300149440765381, "global_step": 102594, "epoch": 2442} {"train_loss": -6.386315822601318, "global_step": 102595, "epoch": 2442} {"train_loss": -6.425981044769287, "global_step": 102596, "epoch": 2442} {"train_loss": -6.352937698364258, "global_step": 102597, "epoch": 2442} {"train_loss": -6.577325820922852, "global_step": 102598, "epoch": 2442} {"train_loss": -6.431085586547852, "global_step": 102599, "epoch": 2442} {"train_loss": -6.338840484619141, "global_step": 102600, "epoch": 2442} {"train_loss": -6.409799575805664, "global_step": 102601, "epoch": 2442} {"train_loss": -6.39125394821167, "global_step": 102602, "epoch": 2442} {"train_loss": -6.261965274810791, "global_step": 102603, "epoch": 2442} {"train_loss": -6.240629196166992, "global_step": 102604, "epoch": 2442} {"train_loss": -6.398818947020031, "global_step": 102605, "epoch": 2442, "val_loss": 76070.90625} {"train_loss": -6.457363128662109, "global_step": 102606, "epoch": 2443} {"train_loss": -6.33602237701416, "global_step": 102607, "epoch": 2443} {"train_loss": -6.47190523147583, "global_step": 102608, "epoch": 2443} {"train_loss": -6.188502311706543, "global_step": 102609, "epoch": 2443} {"train_loss": -6.255976676940918, "global_step": 102610, "epoch": 2443} {"train_loss": -6.274341583251953, "global_step": 102611, "epoch": 2443} {"train_loss": -6.17954158782959, "global_step": 102612, "epoch": 2443} {"train_loss": -6.360019207000732, "global_step": 102613, "epoch": 2443} {"train_loss": -6.410711288452148, "global_step": 102614, "epoch": 2443} {"train_loss": -6.4195556640625, "global_step": 102615, "epoch": 2443} {"train_loss": -6.3223490715026855, "global_step": 102616, "epoch": 2443} {"train_loss": -6.333700180053711, "global_step": 102617, "epoch": 2443} {"train_loss": -6.362929344177246, "global_step": 102618, "epoch": 2443} {"train_loss": -6.538034915924072, "global_step": 102619, "epoch": 2443} {"train_loss": -6.450295448303223, "global_step": 102620, "epoch": 2443} {"train_loss": -6.297372817993164, "global_step": 102621, "epoch": 2443} {"train_loss": -6.423696994781494, "global_step": 102622, "epoch": 2443} {"train_loss": -6.398343086242676, "global_step": 102623, "epoch": 2443} {"train_loss": -6.408787727355957, "global_step": 102624, "epoch": 2443} {"train_loss": -6.380006790161133, "global_step": 102625, "epoch": 2443} {"train_loss": -6.334234237670898, "global_step": 102626, "epoch": 2443} {"train_loss": -6.433377265930176, "global_step": 102627, "epoch": 2443} {"train_loss": -6.342390537261963, "global_step": 102628, "epoch": 2443} {"train_loss": -6.339655876159668, "global_step": 102629, "epoch": 2443} {"train_loss": -6.350203514099121, "global_step": 102630, "epoch": 2443} {"train_loss": -6.385778903961182, "global_step": 102631, "epoch": 2443} {"train_loss": -6.35906982421875, "global_step": 102632, "epoch": 2443} {"train_loss": -6.2155256271362305, "global_step": 102633, "epoch": 2443} {"train_loss": -6.414362907409668, "global_step": 102634, "epoch": 2443} {"train_loss": -6.3593339920043945, "global_step": 102635, "epoch": 2443} {"train_loss": -6.3280744552612305, "global_step": 102636, "epoch": 2443} {"train_loss": -6.388471603393555, "global_step": 102637, "epoch": 2443} {"train_loss": -6.330796241760254, "global_step": 102638, "epoch": 2443} {"train_loss": -6.376911163330078, "global_step": 102639, "epoch": 2443} {"train_loss": -6.466941833496094, "global_step": 102640, "epoch": 2443} {"train_loss": -6.221341133117676, "global_step": 102641, "epoch": 2443} {"train_loss": -6.459639549255371, "global_step": 102642, "epoch": 2443} {"train_loss": -6.357707977294922, "global_step": 102643, "epoch": 2443} {"train_loss": -6.336819648742676, "global_step": 102644, "epoch": 2443} {"train_loss": -6.351318836212158, "global_step": 102645, "epoch": 2443} {"train_loss": -6.378952503204346, "global_step": 102646, "epoch": 2443} {"train_loss": -6.35954897744315, "global_step": 102647, "epoch": 2443, "val_loss": 76364.8515625} {"train_loss": -6.224026679992676, "global_step": 102648, "epoch": 2444} {"train_loss": -6.315582275390625, "global_step": 102649, "epoch": 2444} {"train_loss": -6.280656814575195, "global_step": 102650, "epoch": 2444} {"train_loss": -6.339206695556641, "global_step": 102651, "epoch": 2444} {"train_loss": -6.226749420166016, "global_step": 102652, "epoch": 2444} {"train_loss": -6.28053617477417, "global_step": 102653, "epoch": 2444} {"train_loss": -6.177798271179199, "global_step": 102654, "epoch": 2444} {"train_loss": -6.208932876586914, "global_step": 102655, "epoch": 2444} {"train_loss": -6.2826056480407715, "global_step": 102656, "epoch": 2444} {"train_loss": -6.153624534606934, "global_step": 102657, "epoch": 2444} {"train_loss": -6.28555965423584, "global_step": 102658, "epoch": 2444} {"train_loss": -6.2977776527404785, "global_step": 102659, "epoch": 2444} {"train_loss": -6.388460159301758, "global_step": 102660, "epoch": 2444} {"train_loss": -6.2866291999816895, "global_step": 102661, "epoch": 2444} {"train_loss": -6.269781589508057, "global_step": 102662, "epoch": 2444} {"train_loss": -6.231879711151123, "global_step": 102663, "epoch": 2444} {"train_loss": -6.2204132080078125, "global_step": 102664, "epoch": 2444} {"train_loss": -6.242375373840332, "global_step": 102665, "epoch": 2444} {"train_loss": -6.203822612762451, "global_step": 102666, "epoch": 2444} {"train_loss": -6.348725318908691, "global_step": 102667, "epoch": 2444} {"train_loss": -6.206465721130371, "global_step": 102668, "epoch": 2444} {"train_loss": -6.296303749084473, "global_step": 102669, "epoch": 2444} {"train_loss": -6.287193298339844, "global_step": 102670, "epoch": 2444} {"train_loss": -6.208287239074707, "global_step": 102671, "epoch": 2444} {"train_loss": -6.304095268249512, "global_step": 102672, "epoch": 2444} {"train_loss": -6.1459760665893555, "global_step": 102673, "epoch": 2444} {"train_loss": -6.294659614562988, "global_step": 102674, "epoch": 2444} {"train_loss": -6.252000331878662, "global_step": 102675, "epoch": 2444} {"train_loss": -6.304327011108398, "global_step": 102676, "epoch": 2444} {"train_loss": -6.262904167175293, "global_step": 102677, "epoch": 2444} {"train_loss": -6.354477882385254, "global_step": 102678, "epoch": 2444} {"train_loss": -6.296382904052734, "global_step": 102679, "epoch": 2444} {"train_loss": -6.252089500427246, "global_step": 102680, "epoch": 2444} {"train_loss": -6.269797325134277, "global_step": 102681, "epoch": 2444} {"train_loss": -6.223613739013672, "global_step": 102682, "epoch": 2444} {"train_loss": -6.247890949249268, "global_step": 102683, "epoch": 2444} {"train_loss": -6.337013244628906, "global_step": 102684, "epoch": 2444} {"train_loss": -6.277271270751953, "global_step": 102685, "epoch": 2444} {"train_loss": -6.3621826171875, "global_step": 102686, "epoch": 2444} {"train_loss": -6.242531776428223, "global_step": 102687, "epoch": 2444} {"train_loss": -6.3562211990356445, "global_step": 102688, "epoch": 2444} {"train_loss": -6.2718673206511, "global_step": 102689, "epoch": 2444, "val_loss": 76228.3203125} {"train_loss": -6.30239725112915, "global_step": 102690, "epoch": 2445} {"train_loss": -6.345146179199219, "global_step": 102691, "epoch": 2445} {"train_loss": -6.3470916748046875, "global_step": 102692, "epoch": 2445} {"train_loss": -6.40515661239624, "global_step": 102693, "epoch": 2445} {"train_loss": -6.365499019622803, "global_step": 102694, "epoch": 2445} {"train_loss": -6.334403038024902, "global_step": 102695, "epoch": 2445} {"train_loss": -6.467715263366699, "global_step": 102696, "epoch": 2445} {"train_loss": -6.395359039306641, "global_step": 102697, "epoch": 2445} {"train_loss": -6.33452033996582, "global_step": 102698, "epoch": 2445} {"train_loss": -6.455222129821777, "global_step": 102699, "epoch": 2445} {"train_loss": -6.290139198303223, "global_step": 102700, "epoch": 2445} {"train_loss": -6.376034259796143, "global_step": 102701, "epoch": 2445} {"train_loss": -6.365802764892578, "global_step": 102702, "epoch": 2445} {"train_loss": -6.331539154052734, "global_step": 102703, "epoch": 2445} {"train_loss": -6.34187650680542, "global_step": 102704, "epoch": 2445} {"train_loss": -6.467284202575684, "global_step": 102705, "epoch": 2445} {"train_loss": -6.427868843078613, "global_step": 102706, "epoch": 2445} {"train_loss": -6.465249538421631, "global_step": 102707, "epoch": 2445} {"train_loss": -6.33167839050293, "global_step": 102708, "epoch": 2445} {"train_loss": -6.472029685974121, "global_step": 102709, "epoch": 2445} {"train_loss": -6.359447479248047, "global_step": 102710, "epoch": 2445} {"train_loss": -6.308221817016602, "global_step": 102711, "epoch": 2445} {"train_loss": -6.457705497741699, "global_step": 102712, "epoch": 2445} {"train_loss": -6.401771068572998, "global_step": 102713, "epoch": 2445} {"train_loss": -6.363216400146484, "global_step": 102714, "epoch": 2445} {"train_loss": -6.430500030517578, "global_step": 102715, "epoch": 2445} {"train_loss": -6.339792251586914, "global_step": 102716, "epoch": 2445} {"train_loss": -6.435543537139893, "global_step": 102717, "epoch": 2445} {"train_loss": -6.435957431793213, "global_step": 102718, "epoch": 2445} {"train_loss": -6.36992883682251, "global_step": 102719, "epoch": 2445} {"train_loss": -6.4086456298828125, "global_step": 102720, "epoch": 2445} {"train_loss": -6.443428993225098, "global_step": 102721, "epoch": 2445} {"train_loss": -6.346569538116455, "global_step": 102722, "epoch": 2445} {"train_loss": -6.315385341644287, "global_step": 102723, "epoch": 2445} {"train_loss": -6.466664791107178, "global_step": 102724, "epoch": 2445} {"train_loss": -6.361363410949707, "global_step": 102725, "epoch": 2445} {"train_loss": -6.349243640899658, "global_step": 102726, "epoch": 2445} {"train_loss": -6.2772626876831055, "global_step": 102727, "epoch": 2445} {"train_loss": -6.363729476928711, "global_step": 102728, "epoch": 2445} {"train_loss": -6.244930744171143, "global_step": 102729, "epoch": 2445} {"train_loss": -6.432581901550293, "global_step": 102730, "epoch": 2445} {"train_loss": -6.381849198114304, "global_step": 102731, "epoch": 2445, "val_loss": 76420.9453125} {"train_loss": -6.393863677978516, "global_step": 102732, "epoch": 2446} {"train_loss": -6.365739822387695, "global_step": 102733, "epoch": 2446} {"train_loss": -6.276216983795166, "global_step": 102734, "epoch": 2446} {"train_loss": -6.367121696472168, "global_step": 102735, "epoch": 2446} {"train_loss": -6.418933391571045, "global_step": 102736, "epoch": 2446} {"train_loss": -6.371097564697266, "global_step": 102737, "epoch": 2446} {"train_loss": -6.310793876647949, "global_step": 102738, "epoch": 2446} {"train_loss": -6.331418991088867, "global_step": 102739, "epoch": 2446} {"train_loss": -6.531782150268555, "global_step": 102740, "epoch": 2446} {"train_loss": -6.515659332275391, "global_step": 102741, "epoch": 2446} {"train_loss": -6.376965045928955, "global_step": 102742, "epoch": 2446} {"train_loss": -6.400341033935547, "global_step": 102743, "epoch": 2446} {"train_loss": -6.382810592651367, "global_step": 102744, "epoch": 2446} {"train_loss": -6.393562316894531, "global_step": 102745, "epoch": 2446} {"train_loss": -6.29634952545166, "global_step": 102746, "epoch": 2446} {"train_loss": -6.40535306930542, "global_step": 102747, "epoch": 2446} {"train_loss": -6.5026960372924805, "global_step": 102748, "epoch": 2446} {"train_loss": -6.444023609161377, "global_step": 102749, "epoch": 2446} {"train_loss": -6.396552085876465, "global_step": 102750, "epoch": 2446} {"train_loss": -6.443641185760498, "global_step": 102751, "epoch": 2446} {"train_loss": -6.420429706573486, "global_step": 102752, "epoch": 2446} {"train_loss": -6.336349010467529, "global_step": 102753, "epoch": 2446} {"train_loss": -6.444884300231934, "global_step": 102754, "epoch": 2446} {"train_loss": -6.37465763092041, "global_step": 102755, "epoch": 2446} {"train_loss": -6.329336166381836, "global_step": 102756, "epoch": 2446} {"train_loss": -6.460252285003662, "global_step": 102757, "epoch": 2446} {"train_loss": -6.355838298797607, "global_step": 102758, "epoch": 2446} {"train_loss": -6.335855007171631, "global_step": 102759, "epoch": 2446} {"train_loss": -6.442963600158691, "global_step": 102760, "epoch": 2446} {"train_loss": -6.405083656311035, "global_step": 102761, "epoch": 2446} {"train_loss": -6.403158187866211, "global_step": 102762, "epoch": 2446} {"train_loss": -6.426601409912109, "global_step": 102763, "epoch": 2446} {"train_loss": -6.540926456451416, "global_step": 102764, "epoch": 2446} {"train_loss": -6.341303825378418, "global_step": 102765, "epoch": 2446} {"train_loss": -6.471380233764648, "global_step": 102766, "epoch": 2446} {"train_loss": -6.42588996887207, "global_step": 102767, "epoch": 2446} {"train_loss": -6.4493408203125, "global_step": 102768, "epoch": 2446} {"train_loss": -6.493740081787109, "global_step": 102769, "epoch": 2446} {"train_loss": -6.379749774932861, "global_step": 102770, "epoch": 2446} {"train_loss": -6.466925621032715, "global_step": 102771, "epoch": 2446} {"train_loss": -6.33549165725708, "global_step": 102772, "epoch": 2446} {"train_loss": -6.403609048752558, "global_step": 102773, "epoch": 2446, "val_loss": 75734.9921875} {"train_loss": -6.442943572998047, "global_step": 102774, "epoch": 2447} {"train_loss": -6.425382614135742, "global_step": 102775, "epoch": 2447} {"train_loss": -6.5754194259643555, "global_step": 102776, "epoch": 2447} {"train_loss": -6.363447189331055, "global_step": 102777, "epoch": 2447} {"train_loss": -6.414623260498047, "global_step": 102778, "epoch": 2447} {"train_loss": -6.413984775543213, "global_step": 102779, "epoch": 2447} {"train_loss": -6.450857639312744, "global_step": 102780, "epoch": 2447} {"train_loss": -6.4608049392700195, "global_step": 102781, "epoch": 2447} {"train_loss": -6.448415756225586, "global_step": 102782, "epoch": 2447} {"train_loss": -6.608157157897949, "global_step": 102783, "epoch": 2447} {"train_loss": -6.36662483215332, "global_step": 102784, "epoch": 2447} {"train_loss": -6.388895034790039, "global_step": 102785, "epoch": 2447} {"train_loss": -6.463037014007568, "global_step": 102786, "epoch": 2447} {"train_loss": -6.448082447052002, "global_step": 102787, "epoch": 2447} {"train_loss": -6.394603729248047, "global_step": 102788, "epoch": 2447} {"train_loss": -6.279594421386719, "global_step": 102789, "epoch": 2447} {"train_loss": -6.333802223205566, "global_step": 102790, "epoch": 2447} {"train_loss": -6.418146133422852, "global_step": 102791, "epoch": 2447} {"train_loss": -6.435651779174805, "global_step": 102792, "epoch": 2447} {"train_loss": -6.335965156555176, "global_step": 102793, "epoch": 2447} {"train_loss": -6.444333076477051, "global_step": 102794, "epoch": 2447} {"train_loss": -6.237703323364258, "global_step": 102795, "epoch": 2447} {"train_loss": -6.508774280548096, "global_step": 102796, "epoch": 2447} {"train_loss": -6.2782392501831055, "global_step": 102797, "epoch": 2447} {"train_loss": -6.270197868347168, "global_step": 102798, "epoch": 2447} {"train_loss": -6.279404640197754, "global_step": 102799, "epoch": 2447} {"train_loss": -6.269735336303711, "global_step": 102800, "epoch": 2447} {"train_loss": -6.420816898345947, "global_step": 102801, "epoch": 2447} {"train_loss": -6.271846771240234, "global_step": 102802, "epoch": 2447} {"train_loss": -6.401612758636475, "global_step": 102803, "epoch": 2447} {"train_loss": -6.318795204162598, "global_step": 102804, "epoch": 2447} {"train_loss": -6.313467025756836, "global_step": 102805, "epoch": 2447} {"train_loss": -6.382447242736816, "global_step": 102806, "epoch": 2447} {"train_loss": -6.348971843719482, "global_step": 102807, "epoch": 2447} {"train_loss": -6.4105987548828125, "global_step": 102808, "epoch": 2447} {"train_loss": -6.344644546508789, "global_step": 102809, "epoch": 2447} {"train_loss": -6.459420204162598, "global_step": 102810, "epoch": 2447} {"train_loss": -6.3555145263671875, "global_step": 102811, "epoch": 2447} {"train_loss": -6.439985275268555, "global_step": 102812, "epoch": 2447} {"train_loss": -6.3853654861450195, "global_step": 102813, "epoch": 2447} {"train_loss": -6.417051315307617, "global_step": 102814, "epoch": 2447} {"train_loss": -6.392840941747029, "global_step": 102815, "epoch": 2447, "val_loss": 75638.75} {"train_loss": -6.432751655578613, "global_step": 102816, "epoch": 2448} {"train_loss": -6.3967604637146, "global_step": 102817, "epoch": 2448} {"train_loss": -6.502837181091309, "global_step": 102818, "epoch": 2448} {"train_loss": -6.479686737060547, "global_step": 102819, "epoch": 2448} {"train_loss": -6.383373260498047, "global_step": 102820, "epoch": 2448} {"train_loss": -6.548160552978516, "global_step": 102821, "epoch": 2448} {"train_loss": -6.41189432144165, "global_step": 102822, "epoch": 2448} {"train_loss": -6.440312385559082, "global_step": 102823, "epoch": 2448} {"train_loss": -6.341054916381836, "global_step": 102824, "epoch": 2448} {"train_loss": -6.391299247741699, "global_step": 102825, "epoch": 2448} {"train_loss": -6.376473426818848, "global_step": 102826, "epoch": 2448} {"train_loss": -6.414041996002197, "global_step": 102827, "epoch": 2448} {"train_loss": -6.420183181762695, "global_step": 102828, "epoch": 2448} {"train_loss": -6.450290679931641, "global_step": 102829, "epoch": 2448} {"train_loss": -6.405303001403809, "global_step": 102830, "epoch": 2448} {"train_loss": -6.233062267303467, "global_step": 102831, "epoch": 2448} {"train_loss": -6.339352130889893, "global_step": 102832, "epoch": 2448} {"train_loss": -6.363275527954102, "global_step": 102833, "epoch": 2448} {"train_loss": -6.409538269042969, "global_step": 102834, "epoch": 2448} {"train_loss": -6.404440879821777, "global_step": 102835, "epoch": 2448} {"train_loss": -6.484307289123535, "global_step": 102836, "epoch": 2448} {"train_loss": -6.348400592803955, "global_step": 102837, "epoch": 2448} {"train_loss": -6.425075531005859, "global_step": 102838, "epoch": 2448} {"train_loss": -6.327509880065918, "global_step": 102839, "epoch": 2448} {"train_loss": -6.48680305480957, "global_step": 102840, "epoch": 2448} {"train_loss": -6.351081371307373, "global_step": 102841, "epoch": 2448} {"train_loss": -6.388017654418945, "global_step": 102842, "epoch": 2448} {"train_loss": -6.457889556884766, "global_step": 102843, "epoch": 2448} {"train_loss": -6.292754650115967, "global_step": 102844, "epoch": 2448} {"train_loss": -6.393808841705322, "global_step": 102845, "epoch": 2448} {"train_loss": -6.2015790939331055, "global_step": 102846, "epoch": 2448} {"train_loss": -6.255692958831787, "global_step": 102847, "epoch": 2448} {"train_loss": -6.341737747192383, "global_step": 102848, "epoch": 2448} {"train_loss": -6.328300952911377, "global_step": 102849, "epoch": 2448} {"train_loss": -6.406641006469727, "global_step": 102850, "epoch": 2448} {"train_loss": -6.3539838790893555, "global_step": 102851, "epoch": 2448} {"train_loss": -6.326775550842285, "global_step": 102852, "epoch": 2448} {"train_loss": -6.380859851837158, "global_step": 102853, "epoch": 2448} {"train_loss": -6.391168594360352, "global_step": 102854, "epoch": 2448} {"train_loss": -6.320860862731934, "global_step": 102855, "epoch": 2448} {"train_loss": -6.397213459014893, "global_step": 102856, "epoch": 2448} {"train_loss": -6.385865688323975, "global_step": 102857, "epoch": 2448, "val_loss": 76324.9375} {"train_loss": -6.242639541625977, "global_step": 102858, "epoch": 2449} {"train_loss": -6.309284687042236, "global_step": 102859, "epoch": 2449} {"train_loss": -6.370954513549805, "global_step": 102860, "epoch": 2449} {"train_loss": -6.307055950164795, "global_step": 102861, "epoch": 2449} {"train_loss": -6.402041435241699, "global_step": 102862, "epoch": 2449} {"train_loss": -6.366320610046387, "global_step": 102863, "epoch": 2449} {"train_loss": -6.291609764099121, "global_step": 102864, "epoch": 2449} {"train_loss": -6.3907470703125, "global_step": 102865, "epoch": 2449} {"train_loss": -6.453451156616211, "global_step": 102866, "epoch": 2449} {"train_loss": -6.40294885635376, "global_step": 102867, "epoch": 2449} {"train_loss": -6.387635231018066, "global_step": 102868, "epoch": 2449} {"train_loss": -6.468364238739014, "global_step": 102869, "epoch": 2449} {"train_loss": -6.361161231994629, "global_step": 102870, "epoch": 2449} {"train_loss": -6.4115190505981445, "global_step": 102871, "epoch": 2449} {"train_loss": -6.393362522125244, "global_step": 102872, "epoch": 2449} {"train_loss": -6.358377456665039, "global_step": 102873, "epoch": 2449} {"train_loss": -6.344642639160156, "global_step": 102874, "epoch": 2449} {"train_loss": -6.372160911560059, "global_step": 102875, "epoch": 2449} {"train_loss": -6.36517333984375, "global_step": 102876, "epoch": 2449} {"train_loss": -6.3775410652160645, "global_step": 102877, "epoch": 2449} {"train_loss": -6.342569828033447, "global_step": 102878, "epoch": 2449} {"train_loss": -6.429013252258301, "global_step": 102879, "epoch": 2449} {"train_loss": -6.449746608734131, "global_step": 102880, "epoch": 2449} {"train_loss": -6.390965461730957, "global_step": 102881, "epoch": 2449} {"train_loss": -6.404348373413086, "global_step": 102882, "epoch": 2449} {"train_loss": -6.371959209442139, "global_step": 102883, "epoch": 2449} {"train_loss": -6.496855735778809, "global_step": 102884, "epoch": 2449} {"train_loss": -6.38140869140625, "global_step": 102885, "epoch": 2449} {"train_loss": -6.43963098526001, "global_step": 102886, "epoch": 2449} {"train_loss": -6.50132942199707, "global_step": 102887, "epoch": 2449} {"train_loss": -6.2351884841918945, "global_step": 102888, "epoch": 2449} {"train_loss": -6.3218231201171875, "global_step": 102889, "epoch": 2449} {"train_loss": -6.373991966247559, "global_step": 102890, "epoch": 2449} {"train_loss": -6.325962066650391, "global_step": 102891, "epoch": 2449} {"train_loss": -6.414900302886963, "global_step": 102892, "epoch": 2449} {"train_loss": -6.392563819885254, "global_step": 102893, "epoch": 2449} {"train_loss": -6.335729598999023, "global_step": 102894, "epoch": 2449} {"train_loss": -6.425248622894287, "global_step": 102895, "epoch": 2449} {"train_loss": -6.235122203826904, "global_step": 102896, "epoch": 2449} {"train_loss": -6.246737957000732, "global_step": 102897, "epoch": 2449} {"train_loss": -6.456003189086914, "global_step": 102898, "epoch": 2449} {"train_loss": -6.375371002015614, "global_step": 102899, "epoch": 2449, "val_loss": 76320.8515625} {"train_loss": -6.3795928955078125, "global_step": 102900, "epoch": 2450} {"train_loss": -6.515697479248047, "global_step": 102901, "epoch": 2450} {"train_loss": -6.475765228271484, "global_step": 102902, "epoch": 2450} {"train_loss": -6.2220869064331055, "global_step": 102903, "epoch": 2450} {"train_loss": -6.43333625793457, "global_step": 102904, "epoch": 2450} {"train_loss": -6.347716331481934, "global_step": 102905, "epoch": 2450} {"train_loss": -6.233142375946045, "global_step": 102906, "epoch": 2450} {"train_loss": -6.361931800842285, "global_step": 102907, "epoch": 2450} {"train_loss": -6.367607116699219, "global_step": 102908, "epoch": 2450} {"train_loss": -6.423043251037598, "global_step": 102909, "epoch": 2450} {"train_loss": -6.413098335266113, "global_step": 102910, "epoch": 2450} {"train_loss": -6.304612636566162, "global_step": 102911, "epoch": 2450} {"train_loss": -6.433900356292725, "global_step": 102912, "epoch": 2450} {"train_loss": -6.308871269226074, "global_step": 102913, "epoch": 2450} {"train_loss": -6.394986152648926, "global_step": 102914, "epoch": 2450} {"train_loss": -6.530142784118652, "global_step": 102915, "epoch": 2450} {"train_loss": -6.204885482788086, "global_step": 102916, "epoch": 2450} {"train_loss": -6.380985260009766, "global_step": 102917, "epoch": 2450} {"train_loss": -6.376755714416504, "global_step": 102918, "epoch": 2450} {"train_loss": -6.427628040313721, "global_step": 102919, "epoch": 2450} {"train_loss": -6.5047197341918945, "global_step": 102920, "epoch": 2450} {"train_loss": -6.402518272399902, "global_step": 102921, "epoch": 2450} {"train_loss": -6.364959716796875, "global_step": 102922, "epoch": 2450} {"train_loss": -6.302522659301758, "global_step": 102923, "epoch": 2450} {"train_loss": -6.335806369781494, "global_step": 102924, "epoch": 2450} {"train_loss": -6.392571449279785, "global_step": 102925, "epoch": 2450} {"train_loss": -6.383390426635742, "global_step": 102926, "epoch": 2450} {"train_loss": -6.4304022789001465, "global_step": 102927, "epoch": 2450} {"train_loss": -6.405858516693115, "global_step": 102928, "epoch": 2450} {"train_loss": -6.570206165313721, "global_step": 102929, "epoch": 2450} {"train_loss": -6.384590148925781, "global_step": 102930, "epoch": 2450} {"train_loss": -6.325576305389404, "global_step": 102931, "epoch": 2450} {"train_loss": -6.508776664733887, "global_step": 102932, "epoch": 2450} {"train_loss": -6.4041748046875, "global_step": 102933, "epoch": 2450} {"train_loss": -6.542598724365234, "global_step": 102934, "epoch": 2450} {"train_loss": -6.284468650817871, "global_step": 102935, "epoch": 2450} {"train_loss": -6.366786003112793, "global_step": 102936, "epoch": 2450} {"train_loss": -6.389603614807129, "global_step": 102937, "epoch": 2450} {"train_loss": -6.246699810028076, "global_step": 102938, "epoch": 2450} {"train_loss": -6.489562511444092, "global_step": 102939, "epoch": 2450} {"train_loss": -6.351019859313965, "global_step": 102940, "epoch": 2450} {"train_loss": -6.38422950108846, "global_step": 102941, "epoch": 2450, "train/sim_max_reward_0": 0.9339046700938067, "train/sim_max_reward_1": 0.8942707520382813, "train/sim_max_reward_2": 0.378020611266747, "train/sim_max_reward_3": 0.15154013321557433, "train/sim_max_reward_4": 0.3231431035170701, "train/sim_max_reward_5": 0.7572080053784539, "test/sim_max_reward_4500000": 0.3448659737418841, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9414305978041264, "test/sim_max_reward_4500003": 0.9031472811716823, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 0.9600175498798286, "test/sim_max_reward_4500006": 0.9689137376820123, "test/sim_max_reward_4500007": 0.9062026005570127, "test/sim_max_reward_4500008": 0.1316585324615754, "test/sim_max_reward_4500009": 0.9408943410481503, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.1330447816774011, "test/sim_max_reward_4500012": 0.7469010398018479, "test/sim_max_reward_4500013": 0.0018604864137267215, "test/sim_max_reward_4500014": 0.47668294715481435, "test/sim_max_reward_4500015": 0.4336065122016362, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.018933853246905212, "test/sim_max_reward_4500018": 0.38546906324479896, "test/sim_max_reward_4500019": 0.7924890796027706, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.6705033831730034, "test/sim_max_reward_4500022": 0.9502762275761882, "test/sim_max_reward_4500023": 0.8949835258043704, "test/sim_max_reward_4500024": 1.0, "test/sim_max_reward_4500025": 0.6153364299584876, "test/sim_max_reward_4500026": 1.0, "test/sim_max_reward_4500027": 0.6339451488240846, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.10767760405711152, "test/sim_max_reward_4500030": 0.9751542749195132, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.08595337649686322, "test/sim_max_reward_4500034": 0.06198818821703353, "test/sim_max_reward_4500035": 0.6245704242069978, "test/sim_max_reward_4500036": 0.5588845505939315, "test/sim_max_reward_4500037": 0.8895710014671515, "test/sim_max_reward_4500038": 0.3001206039704396, "test/sim_max_reward_4500039": 0.9690386284420265, "test/sim_max_reward_4500040": 0.8877124921721171, "test/sim_max_reward_4500041": 0.312940091445153, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.835324561368892, "test/sim_max_reward_4500044": 0.4905508134145973, "test/sim_max_reward_4500045": 0.6411485989990571, "test/sim_max_reward_4500046": 0.20235798610306804, "test/sim_max_reward_4500047": 0.9856070103428446, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5730145459183222, "test/mean_score": 0.5210886811268522, "val_loss": 75953.515625} {"train_loss": -6.35090446472168, "global_step": 102942, "epoch": 2451} {"train_loss": -6.404085159301758, "global_step": 102943, "epoch": 2451} {"train_loss": -6.276850700378418, "global_step": 102944, "epoch": 2451} {"train_loss": -6.3312177658081055, "global_step": 102945, "epoch": 2451} {"train_loss": -6.387757301330566, "global_step": 102946, "epoch": 2451} {"train_loss": -6.351736068725586, "global_step": 102947, "epoch": 2451} {"train_loss": -6.359921455383301, "global_step": 102948, "epoch": 2451} {"train_loss": -6.396635055541992, "global_step": 102949, "epoch": 2451} {"train_loss": -6.363615989685059, "global_step": 102950, "epoch": 2451} {"train_loss": -6.422174453735352, "global_step": 102951, "epoch": 2451} {"train_loss": -6.310299873352051, "global_step": 102952, "epoch": 2451} {"train_loss": -6.341182708740234, "global_step": 102953, "epoch": 2451} {"train_loss": -6.315982818603516, "global_step": 102954, "epoch": 2451} {"train_loss": -6.361881256103516, "global_step": 102955, "epoch": 2451} {"train_loss": -6.343137741088867, "global_step": 102956, "epoch": 2451} {"train_loss": -6.361356258392334, "global_step": 102957, "epoch": 2451} {"train_loss": -6.485508918762207, "global_step": 102958, "epoch": 2451} {"train_loss": -6.440000534057617, "global_step": 102959, "epoch": 2451} {"train_loss": -6.388519287109375, "global_step": 102960, "epoch": 2451} {"train_loss": -6.458613395690918, "global_step": 102961, "epoch": 2451} {"train_loss": -6.366796970367432, "global_step": 102962, "epoch": 2451} {"train_loss": -6.424093723297119, "global_step": 102963, "epoch": 2451} {"train_loss": -6.470141410827637, "global_step": 102964, "epoch": 2451} {"train_loss": -6.312653541564941, "global_step": 102965, "epoch": 2451} {"train_loss": -6.413661003112793, "global_step": 102966, "epoch": 2451} {"train_loss": -6.372591972351074, "global_step": 102967, "epoch": 2451} {"train_loss": -6.39976692199707, "global_step": 102968, "epoch": 2451} {"train_loss": -6.367844104766846, "global_step": 102969, "epoch": 2451} {"train_loss": -6.364655494689941, "global_step": 102970, "epoch": 2451} {"train_loss": -6.448565483093262, "global_step": 102971, "epoch": 2451} {"train_loss": -6.338748931884766, "global_step": 102972, "epoch": 2451} {"train_loss": -6.3674750328063965, "global_step": 102973, "epoch": 2451} {"train_loss": -6.383523464202881, "global_step": 102974, "epoch": 2451} {"train_loss": -6.417203903198242, "global_step": 102975, "epoch": 2451} {"train_loss": -6.353548526763916, "global_step": 102976, "epoch": 2451} {"train_loss": -6.31063175201416, "global_step": 102977, "epoch": 2451} {"train_loss": -6.401683330535889, "global_step": 102978, "epoch": 2451} {"train_loss": -6.365856170654297, "global_step": 102979, "epoch": 2451} {"train_loss": -6.3741350173950195, "global_step": 102980, "epoch": 2451} {"train_loss": -6.353604316711426, "global_step": 102981, "epoch": 2451} {"train_loss": -6.488242149353027, "global_step": 102982, "epoch": 2451} {"train_loss": -6.379433007467361, "global_step": 102983, "epoch": 2451, "val_loss": 75999.5390625} {"train_loss": -6.478853702545166, "global_step": 102984, "epoch": 2452} {"train_loss": -6.445505142211914, "global_step": 102985, "epoch": 2452} {"train_loss": -6.433969974517822, "global_step": 102986, "epoch": 2452} {"train_loss": -6.383071422576904, "global_step": 102987, "epoch": 2452} {"train_loss": -6.376421928405762, "global_step": 102988, "epoch": 2452} {"train_loss": -6.45472526550293, "global_step": 102989, "epoch": 2452} {"train_loss": -6.359161376953125, "global_step": 102990, "epoch": 2452} {"train_loss": -6.374864101409912, "global_step": 102991, "epoch": 2452} {"train_loss": -6.441115856170654, "global_step": 102992, "epoch": 2452} {"train_loss": -6.464179039001465, "global_step": 102993, "epoch": 2452} {"train_loss": -6.375809669494629, "global_step": 102994, "epoch": 2452} {"train_loss": -6.4578142166137695, "global_step": 102995, "epoch": 2452} {"train_loss": -6.4152512550354, "global_step": 102996, "epoch": 2452} {"train_loss": -6.396131992340088, "global_step": 102997, "epoch": 2452} {"train_loss": -6.318368911743164, "global_step": 102998, "epoch": 2452} {"train_loss": -6.35660457611084, "global_step": 102999, "epoch": 2452} {"train_loss": -6.292378902435303, "global_step": 103000, "epoch": 2452} {"train_loss": -6.276070594787598, "global_step": 103001, "epoch": 2452} {"train_loss": -6.433915615081787, "global_step": 103002, "epoch": 2452} {"train_loss": -6.387084007263184, "global_step": 103003, "epoch": 2452} {"train_loss": -6.284314155578613, "global_step": 103004, "epoch": 2452} {"train_loss": -6.338266372680664, "global_step": 103005, "epoch": 2452} {"train_loss": -6.344914436340332, "global_step": 103006, "epoch": 2452} {"train_loss": -6.292147636413574, "global_step": 103007, "epoch": 2452} {"train_loss": -6.397680759429932, "global_step": 103008, "epoch": 2452} {"train_loss": -6.461540699005127, "global_step": 103009, "epoch": 2452} {"train_loss": -6.437751770019531, "global_step": 103010, "epoch": 2452} {"train_loss": -6.460365295410156, "global_step": 103011, "epoch": 2452} {"train_loss": -6.386467933654785, "global_step": 103012, "epoch": 2452} {"train_loss": -6.514980316162109, "global_step": 103013, "epoch": 2452} {"train_loss": -6.340850830078125, "global_step": 103014, "epoch": 2452} {"train_loss": -6.379131317138672, "global_step": 103015, "epoch": 2452} {"train_loss": -6.380557060241699, "global_step": 103016, "epoch": 2452} {"train_loss": -6.424497604370117, "global_step": 103017, "epoch": 2452} {"train_loss": -6.320364475250244, "global_step": 103018, "epoch": 2452} {"train_loss": -6.327020645141602, "global_step": 103019, "epoch": 2452} {"train_loss": -6.509930610656738, "global_step": 103020, "epoch": 2452} {"train_loss": -6.358384132385254, "global_step": 103021, "epoch": 2452} {"train_loss": -6.395454406738281, "global_step": 103022, "epoch": 2452} {"train_loss": -6.4871039390563965, "global_step": 103023, "epoch": 2452} {"train_loss": -6.321637153625488, "global_step": 103024, "epoch": 2452} {"train_loss": -6.393244845526559, "global_step": 103025, "epoch": 2452, "val_loss": 75876.421875} {"train_loss": -6.436877727508545, "global_step": 103026, "epoch": 2453} {"train_loss": -6.3700714111328125, "global_step": 103027, "epoch": 2453} {"train_loss": -6.401765823364258, "global_step": 103028, "epoch": 2453} {"train_loss": -6.439455032348633, "global_step": 103029, "epoch": 2453} {"train_loss": -6.2692084312438965, "global_step": 103030, "epoch": 2453} {"train_loss": -6.31178617477417, "global_step": 103031, "epoch": 2453} {"train_loss": -6.356051445007324, "global_step": 103032, "epoch": 2453} {"train_loss": -6.215458869934082, "global_step": 103033, "epoch": 2453} {"train_loss": -6.425074577331543, "global_step": 103034, "epoch": 2453} {"train_loss": -6.409104347229004, "global_step": 103035, "epoch": 2453} {"train_loss": -6.447344779968262, "global_step": 103036, "epoch": 2453} {"train_loss": -6.466593265533447, "global_step": 103037, "epoch": 2453} {"train_loss": -6.3573079109191895, "global_step": 103038, "epoch": 2453} {"train_loss": -6.406907081604004, "global_step": 103039, "epoch": 2453} {"train_loss": -6.369202613830566, "global_step": 103040, "epoch": 2453} {"train_loss": -6.392340660095215, "global_step": 103041, "epoch": 2453} {"train_loss": -6.497071266174316, "global_step": 103042, "epoch": 2453} {"train_loss": -6.448830604553223, "global_step": 103043, "epoch": 2453} {"train_loss": -6.344815254211426, "global_step": 103044, "epoch": 2453} {"train_loss": -6.330226898193359, "global_step": 103045, "epoch": 2453} {"train_loss": -6.419830322265625, "global_step": 103046, "epoch": 2453} {"train_loss": -6.207002639770508, "global_step": 103047, "epoch": 2453} {"train_loss": -6.3719072341918945, "global_step": 103048, "epoch": 2453} {"train_loss": -6.396267890930176, "global_step": 103049, "epoch": 2453} {"train_loss": -6.2930827140808105, "global_step": 103050, "epoch": 2453} {"train_loss": -6.340964317321777, "global_step": 103051, "epoch": 2453} {"train_loss": -6.43229866027832, "global_step": 103052, "epoch": 2453} {"train_loss": -6.430384635925293, "global_step": 103053, "epoch": 2453} {"train_loss": -6.281229019165039, "global_step": 103054, "epoch": 2453} {"train_loss": -6.289166450500488, "global_step": 103055, "epoch": 2453} {"train_loss": -6.329005241394043, "global_step": 103056, "epoch": 2453} {"train_loss": -6.345345973968506, "global_step": 103057, "epoch": 2453} {"train_loss": -6.374664783477783, "global_step": 103058, "epoch": 2453} {"train_loss": -6.461700439453125, "global_step": 103059, "epoch": 2453} {"train_loss": -6.438699245452881, "global_step": 103060, "epoch": 2453} {"train_loss": -6.34264612197876, "global_step": 103061, "epoch": 2453} {"train_loss": -6.295629501342773, "global_step": 103062, "epoch": 2453} {"train_loss": -6.423769950866699, "global_step": 103063, "epoch": 2453} {"train_loss": -6.468282222747803, "global_step": 103064, "epoch": 2453} {"train_loss": -6.270881652832031, "global_step": 103065, "epoch": 2453} {"train_loss": -6.4701032638549805, "global_step": 103066, "epoch": 2453} {"train_loss": -6.37528615906125, "global_step": 103067, "epoch": 2453, "val_loss": 75940.890625} {"train_loss": -6.420775413513184, "global_step": 103068, "epoch": 2454} {"train_loss": -6.556136131286621, "global_step": 103069, "epoch": 2454} {"train_loss": -6.402980804443359, "global_step": 103070, "epoch": 2454} {"train_loss": -6.460559368133545, "global_step": 103071, "epoch": 2454} {"train_loss": -6.421658515930176, "global_step": 103072, "epoch": 2454} {"train_loss": -6.4569292068481445, "global_step": 103073, "epoch": 2454} {"train_loss": -6.302611351013184, "global_step": 103074, "epoch": 2454} {"train_loss": -6.389937877655029, "global_step": 103075, "epoch": 2454} {"train_loss": -6.340902805328369, "global_step": 103076, "epoch": 2454} {"train_loss": -6.54344367980957, "global_step": 103077, "epoch": 2454} {"train_loss": -6.379112243652344, "global_step": 103078, "epoch": 2454} {"train_loss": -6.408155918121338, "global_step": 103079, "epoch": 2454} {"train_loss": -6.467328071594238, "global_step": 103080, "epoch": 2454} {"train_loss": -6.328839302062988, "global_step": 103081, "epoch": 2454} {"train_loss": -6.437518119812012, "global_step": 103082, "epoch": 2454} {"train_loss": -6.550685405731201, "global_step": 103083, "epoch": 2454} {"train_loss": -6.412420749664307, "global_step": 103084, "epoch": 2454} {"train_loss": -6.411028861999512, "global_step": 103085, "epoch": 2454} {"train_loss": -6.474260330200195, "global_step": 103086, "epoch": 2454} {"train_loss": -6.44478702545166, "global_step": 103087, "epoch": 2454} {"train_loss": -6.3163886070251465, "global_step": 103088, "epoch": 2454} {"train_loss": -6.44954776763916, "global_step": 103089, "epoch": 2454} {"train_loss": -6.433383941650391, "global_step": 103090, "epoch": 2454} {"train_loss": -6.414988994598389, "global_step": 103091, "epoch": 2454} {"train_loss": -6.450938701629639, "global_step": 103092, "epoch": 2454} {"train_loss": -6.295699596405029, "global_step": 103093, "epoch": 2454} {"train_loss": -6.355710983276367, "global_step": 103094, "epoch": 2454} {"train_loss": -6.4425048828125, "global_step": 103095, "epoch": 2454} {"train_loss": -6.444948196411133, "global_step": 103096, "epoch": 2454} {"train_loss": -6.350340843200684, "global_step": 103097, "epoch": 2454} {"train_loss": -6.281432151794434, "global_step": 103098, "epoch": 2454} {"train_loss": -6.383705139160156, "global_step": 103099, "epoch": 2454} {"train_loss": -6.410383224487305, "global_step": 103100, "epoch": 2454} {"train_loss": -6.4911041259765625, "global_step": 103101, "epoch": 2454} {"train_loss": -6.340482711791992, "global_step": 103102, "epoch": 2454} {"train_loss": -6.390206336975098, "global_step": 103103, "epoch": 2454} {"train_loss": -6.437681198120117, "global_step": 103104, "epoch": 2454} {"train_loss": -6.413049697875977, "global_step": 103105, "epoch": 2454} {"train_loss": -6.456579208374023, "global_step": 103106, "epoch": 2454} {"train_loss": -6.392731666564941, "global_step": 103107, "epoch": 2454} {"train_loss": -6.368908405303955, "global_step": 103108, "epoch": 2454} {"train_loss": -6.415282113211496, "global_step": 103109, "epoch": 2454, "val_loss": 75736.6875} {"train_loss": -6.600468635559082, "global_step": 103110, "epoch": 2455} {"train_loss": -6.425223350524902, "global_step": 103111, "epoch": 2455} {"train_loss": -6.421745300292969, "global_step": 103112, "epoch": 2455} {"train_loss": -6.362614154815674, "global_step": 103113, "epoch": 2455} {"train_loss": -6.437600612640381, "global_step": 103114, "epoch": 2455} {"train_loss": -6.430573463439941, "global_step": 103115, "epoch": 2455} {"train_loss": -6.232368469238281, "global_step": 103116, "epoch": 2455} {"train_loss": -6.42710018157959, "global_step": 103117, "epoch": 2455} {"train_loss": -6.46757173538208, "global_step": 103118, "epoch": 2455} {"train_loss": -6.376506805419922, "global_step": 103119, "epoch": 2455} {"train_loss": -6.491655349731445, "global_step": 103120, "epoch": 2455} {"train_loss": -6.466056823730469, "global_step": 103121, "epoch": 2455} {"train_loss": -6.402773857116699, "global_step": 103122, "epoch": 2455} {"train_loss": -6.451545715332031, "global_step": 103123, "epoch": 2455} {"train_loss": -6.368288040161133, "global_step": 103124, "epoch": 2455} {"train_loss": -6.462104320526123, "global_step": 103125, "epoch": 2455} {"train_loss": -6.338535308837891, "global_step": 103126, "epoch": 2455} {"train_loss": -6.440181732177734, "global_step": 103127, "epoch": 2455} {"train_loss": -6.456867218017578, "global_step": 103128, "epoch": 2455} {"train_loss": -6.415136337280273, "global_step": 103129, "epoch": 2455} {"train_loss": -6.414547443389893, "global_step": 103130, "epoch": 2455} {"train_loss": -6.469367027282715, "global_step": 103131, "epoch": 2455} {"train_loss": -6.344748497009277, "global_step": 103132, "epoch": 2455} {"train_loss": -6.37926721572876, "global_step": 103133, "epoch": 2455} {"train_loss": -6.519563674926758, "global_step": 103134, "epoch": 2455} {"train_loss": -6.481539726257324, "global_step": 103135, "epoch": 2455} {"train_loss": -6.293123245239258, "global_step": 103136, "epoch": 2455} {"train_loss": -6.39348840713501, "global_step": 103137, "epoch": 2455} {"train_loss": -6.280451774597168, "global_step": 103138, "epoch": 2455} {"train_loss": -6.359827041625977, "global_step": 103139, "epoch": 2455} {"train_loss": -6.307939052581787, "global_step": 103140, "epoch": 2455} {"train_loss": -6.428945541381836, "global_step": 103141, "epoch": 2455} {"train_loss": -6.26481819152832, "global_step": 103142, "epoch": 2455} {"train_loss": -6.381436824798584, "global_step": 103143, "epoch": 2455} {"train_loss": -6.404845714569092, "global_step": 103144, "epoch": 2455} {"train_loss": -6.455618858337402, "global_step": 103145, "epoch": 2455} {"train_loss": -6.39702033996582, "global_step": 103146, "epoch": 2455} {"train_loss": -6.45710563659668, "global_step": 103147, "epoch": 2455} {"train_loss": -6.352266311645508, "global_step": 103148, "epoch": 2455} {"train_loss": -6.178656578063965, "global_step": 103149, "epoch": 2455} {"train_loss": -6.334233283996582, "global_step": 103150, "epoch": 2455} {"train_loss": -6.39912021727789, "global_step": 103151, "epoch": 2455, "val_loss": 75941.9609375} {"train_loss": -6.501611709594727, "global_step": 103152, "epoch": 2456} {"train_loss": -6.486837387084961, "global_step": 103153, "epoch": 2456} {"train_loss": -6.4523515701293945, "global_step": 103154, "epoch": 2456} {"train_loss": -6.4843974113464355, "global_step": 103155, "epoch": 2456} {"train_loss": -6.352808952331543, "global_step": 103156, "epoch": 2456} {"train_loss": -6.373222827911377, "global_step": 103157, "epoch": 2456} {"train_loss": -6.295656204223633, "global_step": 103158, "epoch": 2456} {"train_loss": -6.461532115936279, "global_step": 103159, "epoch": 2456} {"train_loss": -6.362034320831299, "global_step": 103160, "epoch": 2456} {"train_loss": -6.351862907409668, "global_step": 103161, "epoch": 2456} {"train_loss": -6.447739601135254, "global_step": 103162, "epoch": 2456} {"train_loss": -6.387972354888916, "global_step": 103163, "epoch": 2456} {"train_loss": -6.3884124755859375, "global_step": 103164, "epoch": 2456} {"train_loss": -6.465975761413574, "global_step": 103165, "epoch": 2456} {"train_loss": -6.434324741363525, "global_step": 103166, "epoch": 2456} {"train_loss": -6.392426490783691, "global_step": 103167, "epoch": 2456} {"train_loss": -6.375356674194336, "global_step": 103168, "epoch": 2456} {"train_loss": -6.441660404205322, "global_step": 103169, "epoch": 2456} {"train_loss": -6.421160697937012, "global_step": 103170, "epoch": 2456} {"train_loss": -6.468482494354248, "global_step": 103171, "epoch": 2456} {"train_loss": -6.403897285461426, "global_step": 103172, "epoch": 2456} {"train_loss": -6.486014366149902, "global_step": 103173, "epoch": 2456} {"train_loss": -6.47349214553833, "global_step": 103174, "epoch": 2456} {"train_loss": -6.392930030822754, "global_step": 103175, "epoch": 2456} {"train_loss": -6.333822727203369, "global_step": 103176, "epoch": 2456} {"train_loss": -6.344586372375488, "global_step": 103177, "epoch": 2456} {"train_loss": -6.516024589538574, "global_step": 103178, "epoch": 2456} {"train_loss": -6.411590576171875, "global_step": 103179, "epoch": 2456} {"train_loss": -6.363188743591309, "global_step": 103180, "epoch": 2456} {"train_loss": -6.439236640930176, "global_step": 103181, "epoch": 2456} {"train_loss": -6.424350738525391, "global_step": 103182, "epoch": 2456} {"train_loss": -6.327944278717041, "global_step": 103183, "epoch": 2456} {"train_loss": -6.363162517547607, "global_step": 103184, "epoch": 2456} {"train_loss": -6.396219730377197, "global_step": 103185, "epoch": 2456} {"train_loss": -6.2781782150268555, "global_step": 103186, "epoch": 2456} {"train_loss": -6.5170745849609375, "global_step": 103187, "epoch": 2456} {"train_loss": -6.433649063110352, "global_step": 103188, "epoch": 2456} {"train_loss": -6.275378704071045, "global_step": 103189, "epoch": 2456} {"train_loss": -6.155177116394043, "global_step": 103190, "epoch": 2456} {"train_loss": -6.368715286254883, "global_step": 103191, "epoch": 2456} {"train_loss": -6.443905830383301, "global_step": 103192, "epoch": 2456} {"train_loss": -6.400261617842174, "global_step": 103193, "epoch": 2456, "val_loss": 75950.7890625} {"train_loss": -6.402499198913574, "global_step": 103194, "epoch": 2457} {"train_loss": -6.298007965087891, "global_step": 103195, "epoch": 2457} {"train_loss": -6.380911827087402, "global_step": 103196, "epoch": 2457} {"train_loss": -6.3931050300598145, "global_step": 103197, "epoch": 2457} {"train_loss": -6.401643753051758, "global_step": 103198, "epoch": 2457} {"train_loss": -6.241551399230957, "global_step": 103199, "epoch": 2457} {"train_loss": -6.332718849182129, "global_step": 103200, "epoch": 2457} {"train_loss": -6.33299446105957, "global_step": 103201, "epoch": 2457} {"train_loss": -6.374271392822266, "global_step": 103202, "epoch": 2457} {"train_loss": -6.415119647979736, "global_step": 103203, "epoch": 2457} {"train_loss": -6.279381275177002, "global_step": 103204, "epoch": 2457} {"train_loss": -6.351675033569336, "global_step": 103205, "epoch": 2457} {"train_loss": -6.289571762084961, "global_step": 103206, "epoch": 2457} {"train_loss": -6.417951583862305, "global_step": 103207, "epoch": 2457} {"train_loss": -6.418733596801758, "global_step": 103208, "epoch": 2457} {"train_loss": -6.330230236053467, "global_step": 103209, "epoch": 2457} {"train_loss": -6.361491680145264, "global_step": 103210, "epoch": 2457} {"train_loss": -6.313729286193848, "global_step": 103211, "epoch": 2457} {"train_loss": -6.34890604019165, "global_step": 103212, "epoch": 2457} {"train_loss": -6.369906425476074, "global_step": 103213, "epoch": 2457} {"train_loss": -6.346769332885742, "global_step": 103214, "epoch": 2457} {"train_loss": -6.322983741760254, "global_step": 103215, "epoch": 2457} {"train_loss": -6.391226768493652, "global_step": 103216, "epoch": 2457} {"train_loss": -6.4358720779418945, "global_step": 103217, "epoch": 2457} {"train_loss": -6.147104263305664, "global_step": 103218, "epoch": 2457} {"train_loss": -6.341472625732422, "global_step": 103219, "epoch": 2457} {"train_loss": -6.32915735244751, "global_step": 103220, "epoch": 2457} {"train_loss": -6.298033237457275, "global_step": 103221, "epoch": 2457} {"train_loss": -6.32454776763916, "global_step": 103222, "epoch": 2457} {"train_loss": -6.318706035614014, "global_step": 103223, "epoch": 2457} {"train_loss": -6.437477111816406, "global_step": 103224, "epoch": 2457} {"train_loss": -6.375908374786377, "global_step": 103225, "epoch": 2457} {"train_loss": -6.386223793029785, "global_step": 103226, "epoch": 2457} {"train_loss": -6.388703346252441, "global_step": 103227, "epoch": 2457} {"train_loss": -6.2905378341674805, "global_step": 103228, "epoch": 2457} {"train_loss": -6.363090991973877, "global_step": 103229, "epoch": 2457} {"train_loss": -6.391148567199707, "global_step": 103230, "epoch": 2457} {"train_loss": -6.429216384887695, "global_step": 103231, "epoch": 2457} {"train_loss": -6.347539901733398, "global_step": 103232, "epoch": 2457} {"train_loss": -6.318417549133301, "global_step": 103233, "epoch": 2457} {"train_loss": -6.303153038024902, "global_step": 103234, "epoch": 2457} {"train_loss": -6.349026611873081, "global_step": 103235, "epoch": 2457, "val_loss": 76131.5859375} {"train_loss": -6.306461334228516, "global_step": 103236, "epoch": 2458} {"train_loss": -6.297970771789551, "global_step": 103237, "epoch": 2458} {"train_loss": -6.267767906188965, "global_step": 103238, "epoch": 2458} {"train_loss": -6.326496124267578, "global_step": 103239, "epoch": 2458} {"train_loss": -6.322174549102783, "global_step": 103240, "epoch": 2458} {"train_loss": -6.361883640289307, "global_step": 103241, "epoch": 2458} {"train_loss": -6.368783473968506, "global_step": 103242, "epoch": 2458} {"train_loss": -6.393385887145996, "global_step": 103243, "epoch": 2458} {"train_loss": -6.379244804382324, "global_step": 103244, "epoch": 2458} {"train_loss": -6.363285541534424, "global_step": 103245, "epoch": 2458} {"train_loss": -6.4971723556518555, "global_step": 103246, "epoch": 2458} {"train_loss": -6.509848117828369, "global_step": 103247, "epoch": 2458} {"train_loss": -6.304424285888672, "global_step": 103248, "epoch": 2458} {"train_loss": -6.286605358123779, "global_step": 103249, "epoch": 2458} {"train_loss": -6.338680267333984, "global_step": 103250, "epoch": 2458} {"train_loss": -6.468566417694092, "global_step": 103251, "epoch": 2458} {"train_loss": -6.338843822479248, "global_step": 103252, "epoch": 2458} {"train_loss": -6.437690734863281, "global_step": 103253, "epoch": 2458} {"train_loss": -6.398839950561523, "global_step": 103254, "epoch": 2458} {"train_loss": -6.3100666999816895, "global_step": 103255, "epoch": 2458} {"train_loss": -6.344338893890381, "global_step": 103256, "epoch": 2458} {"train_loss": -6.413763046264648, "global_step": 103257, "epoch": 2458} {"train_loss": -6.367241382598877, "global_step": 103258, "epoch": 2458} {"train_loss": -6.382362365722656, "global_step": 103259, "epoch": 2458} {"train_loss": -6.34075927734375, "global_step": 103260, "epoch": 2458} {"train_loss": -6.406529426574707, "global_step": 103261, "epoch": 2458} {"train_loss": -6.380145072937012, "global_step": 103262, "epoch": 2458} {"train_loss": -6.283408164978027, "global_step": 103263, "epoch": 2458} {"train_loss": -6.499002456665039, "global_step": 103264, "epoch": 2458} {"train_loss": -6.445767402648926, "global_step": 103265, "epoch": 2458} {"train_loss": -6.4417266845703125, "global_step": 103266, "epoch": 2458} {"train_loss": -6.418893814086914, "global_step": 103267, "epoch": 2458} {"train_loss": -6.5065765380859375, "global_step": 103268, "epoch": 2458} {"train_loss": -6.36902379989624, "global_step": 103269, "epoch": 2458} {"train_loss": -6.3570356369018555, "global_step": 103270, "epoch": 2458} {"train_loss": -6.451214790344238, "global_step": 103271, "epoch": 2458} {"train_loss": -6.35821533203125, "global_step": 103272, "epoch": 2458} {"train_loss": -6.364608287811279, "global_step": 103273, "epoch": 2458} {"train_loss": -6.296017646789551, "global_step": 103274, "epoch": 2458} {"train_loss": -6.346865653991699, "global_step": 103275, "epoch": 2458} {"train_loss": -6.3516693115234375, "global_step": 103276, "epoch": 2458} {"train_loss": -6.375642958141508, "global_step": 103277, "epoch": 2458, "val_loss": 75902.2890625} {"train_loss": -6.467873573303223, "global_step": 103278, "epoch": 2459} {"train_loss": -6.345733165740967, "global_step": 103279, "epoch": 2459} {"train_loss": -6.352189540863037, "global_step": 103280, "epoch": 2459} {"train_loss": -6.42271614074707, "global_step": 103281, "epoch": 2459} {"train_loss": -6.264257907867432, "global_step": 103282, "epoch": 2459} {"train_loss": -6.339846134185791, "global_step": 103283, "epoch": 2459} {"train_loss": -6.373748779296875, "global_step": 103284, "epoch": 2459} {"train_loss": -6.438390731811523, "global_step": 103285, "epoch": 2459} {"train_loss": -6.403056621551514, "global_step": 103286, "epoch": 2459} {"train_loss": -6.447788715362549, "global_step": 103287, "epoch": 2459} {"train_loss": -6.426143646240234, "global_step": 103288, "epoch": 2459} {"train_loss": -6.473918914794922, "global_step": 103289, "epoch": 2459} {"train_loss": -6.2184600830078125, "global_step": 103290, "epoch": 2459} {"train_loss": -6.394144058227539, "global_step": 103291, "epoch": 2459} {"train_loss": -6.480331897735596, "global_step": 103292, "epoch": 2459} {"train_loss": -6.266956329345703, "global_step": 103293, "epoch": 2459} {"train_loss": -6.46491003036499, "global_step": 103294, "epoch": 2459} {"train_loss": -6.368749141693115, "global_step": 103295, "epoch": 2459} {"train_loss": -6.370669364929199, "global_step": 103296, "epoch": 2459} {"train_loss": -6.369024276733398, "global_step": 103297, "epoch": 2459} {"train_loss": -6.282485008239746, "global_step": 103298, "epoch": 2459} {"train_loss": -6.433091640472412, "global_step": 103299, "epoch": 2459} {"train_loss": -6.294480800628662, "global_step": 103300, "epoch": 2459} {"train_loss": -6.350985050201416, "global_step": 103301, "epoch": 2459} {"train_loss": -6.355932712554932, "global_step": 103302, "epoch": 2459} {"train_loss": -6.2829718589782715, "global_step": 103303, "epoch": 2459} {"train_loss": -6.3717851638793945, "global_step": 103304, "epoch": 2459} {"train_loss": -6.398634433746338, "global_step": 103305, "epoch": 2459} {"train_loss": -6.403408050537109, "global_step": 103306, "epoch": 2459} {"train_loss": -6.250345230102539, "global_step": 103307, "epoch": 2459} {"train_loss": -6.386889934539795, "global_step": 103308, "epoch": 2459} {"train_loss": -6.470790863037109, "global_step": 103309, "epoch": 2459} {"train_loss": -6.46619987487793, "global_step": 103310, "epoch": 2459} {"train_loss": -6.368584632873535, "global_step": 103311, "epoch": 2459} {"train_loss": -6.471485137939453, "global_step": 103312, "epoch": 2459} {"train_loss": -6.381262302398682, "global_step": 103313, "epoch": 2459} {"train_loss": -6.381199359893799, "global_step": 103314, "epoch": 2459} {"train_loss": -6.359630107879639, "global_step": 103315, "epoch": 2459} {"train_loss": -6.330196380615234, "global_step": 103316, "epoch": 2459} {"train_loss": -6.339730262756348, "global_step": 103317, "epoch": 2459} {"train_loss": -6.280580520629883, "global_step": 103318, "epoch": 2459} {"train_loss": -6.373207591828846, "global_step": 103319, "epoch": 2459, "val_loss": 76059.2578125} {"train_loss": -6.362280368804932, "global_step": 103320, "epoch": 2460} {"train_loss": -6.407589912414551, "global_step": 103321, "epoch": 2460} {"train_loss": -6.366072654724121, "global_step": 103322, "epoch": 2460} {"train_loss": -6.359357833862305, "global_step": 103323, "epoch": 2460} {"train_loss": -6.375594139099121, "global_step": 103324, "epoch": 2460} {"train_loss": -6.487112045288086, "global_step": 103325, "epoch": 2460} {"train_loss": -6.436499118804932, "global_step": 103326, "epoch": 2460} {"train_loss": -6.490237712860107, "global_step": 103327, "epoch": 2460} {"train_loss": -6.301816940307617, "global_step": 103328, "epoch": 2460} {"train_loss": -6.450146675109863, "global_step": 103329, "epoch": 2460} {"train_loss": -6.537101745605469, "global_step": 103330, "epoch": 2460} {"train_loss": -6.253170013427734, "global_step": 103331, "epoch": 2460} {"train_loss": -6.522686958312988, "global_step": 103332, "epoch": 2460} {"train_loss": -6.422013282775879, "global_step": 103333, "epoch": 2460} {"train_loss": -6.424004554748535, "global_step": 103334, "epoch": 2460} {"train_loss": -6.356333255767822, "global_step": 103335, "epoch": 2460} {"train_loss": -6.366933822631836, "global_step": 103336, "epoch": 2460} {"train_loss": -6.4503302574157715, "global_step": 103337, "epoch": 2460} {"train_loss": -6.339965343475342, "global_step": 103338, "epoch": 2460} {"train_loss": -6.346135139465332, "global_step": 103339, "epoch": 2460} {"train_loss": -6.390912055969238, "global_step": 103340, "epoch": 2460} {"train_loss": -6.376852035522461, "global_step": 103341, "epoch": 2460} {"train_loss": -6.372859954833984, "global_step": 103342, "epoch": 2460} {"train_loss": -6.285207748413086, "global_step": 103343, "epoch": 2460} {"train_loss": -6.330041885375977, "global_step": 103344, "epoch": 2460} {"train_loss": -6.405279159545898, "global_step": 103345, "epoch": 2460} {"train_loss": -6.378894805908203, "global_step": 103346, "epoch": 2460} {"train_loss": -6.321823596954346, "global_step": 103347, "epoch": 2460} {"train_loss": -6.331981658935547, "global_step": 103348, "epoch": 2460} {"train_loss": -6.517606735229492, "global_step": 103349, "epoch": 2460} {"train_loss": -6.3735504150390625, "global_step": 103350, "epoch": 2460} {"train_loss": -6.370593070983887, "global_step": 103351, "epoch": 2460} {"train_loss": -6.327736854553223, "global_step": 103352, "epoch": 2460} {"train_loss": -6.496562957763672, "global_step": 103353, "epoch": 2460} {"train_loss": -6.29514217376709, "global_step": 103354, "epoch": 2460} {"train_loss": -6.382815837860107, "global_step": 103355, "epoch": 2460} {"train_loss": -6.33111047744751, "global_step": 103356, "epoch": 2460} {"train_loss": -6.394742965698242, "global_step": 103357, "epoch": 2460} {"train_loss": -6.463449478149414, "global_step": 103358, "epoch": 2460} {"train_loss": -6.4169535636901855, "global_step": 103359, "epoch": 2460} {"train_loss": -6.450166702270508, "global_step": 103360, "epoch": 2460} {"train_loss": -6.392248323985508, "global_step": 103361, "epoch": 2460, "val_loss": 75847.0390625} {"train_loss": -6.331212520599365, "global_step": 103362, "epoch": 2461} {"train_loss": -6.56770133972168, "global_step": 103363, "epoch": 2461} {"train_loss": -6.455559730529785, "global_step": 103364, "epoch": 2461} {"train_loss": -6.3022565841674805, "global_step": 103365, "epoch": 2461} {"train_loss": -6.4412407875061035, "global_step": 103366, "epoch": 2461} {"train_loss": -6.43609094619751, "global_step": 103367, "epoch": 2461} {"train_loss": -6.377139568328857, "global_step": 103368, "epoch": 2461} {"train_loss": -6.413613319396973, "global_step": 103369, "epoch": 2461} {"train_loss": -6.4810590744018555, "global_step": 103370, "epoch": 2461} {"train_loss": -6.4654951095581055, "global_step": 103371, "epoch": 2461} {"train_loss": -6.387699127197266, "global_step": 103372, "epoch": 2461} {"train_loss": -6.323592185974121, "global_step": 103373, "epoch": 2461} {"train_loss": -6.347245693206787, "global_step": 103374, "epoch": 2461} {"train_loss": -6.339491844177246, "global_step": 103375, "epoch": 2461} {"train_loss": -6.295571327209473, "global_step": 103376, "epoch": 2461} {"train_loss": -6.341666221618652, "global_step": 103377, "epoch": 2461} {"train_loss": -6.374594688415527, "global_step": 103378, "epoch": 2461} {"train_loss": -6.292089462280273, "global_step": 103379, "epoch": 2461} {"train_loss": -6.347957134246826, "global_step": 103380, "epoch": 2461} {"train_loss": -6.3891496658325195, "global_step": 103381, "epoch": 2461} {"train_loss": -6.372331142425537, "global_step": 103382, "epoch": 2461} {"train_loss": -6.38962459564209, "global_step": 103383, "epoch": 2461} {"train_loss": -6.378692626953125, "global_step": 103384, "epoch": 2461} {"train_loss": -6.437952995300293, "global_step": 103385, "epoch": 2461} {"train_loss": -6.362575531005859, "global_step": 103386, "epoch": 2461} {"train_loss": -6.359469413757324, "global_step": 103387, "epoch": 2461} {"train_loss": -6.215892791748047, "global_step": 103388, "epoch": 2461} {"train_loss": -6.484903812408447, "global_step": 103389, "epoch": 2461} {"train_loss": -6.454130172729492, "global_step": 103390, "epoch": 2461} {"train_loss": -6.316256046295166, "global_step": 103391, "epoch": 2461} {"train_loss": -6.419028282165527, "global_step": 103392, "epoch": 2461} {"train_loss": -6.396732330322266, "global_step": 103393, "epoch": 2461} {"train_loss": -6.516907215118408, "global_step": 103394, "epoch": 2461} {"train_loss": -6.419830799102783, "global_step": 103395, "epoch": 2461} {"train_loss": -6.471869468688965, "global_step": 103396, "epoch": 2461} {"train_loss": -6.38979434967041, "global_step": 103397, "epoch": 2461} {"train_loss": -6.422863006591797, "global_step": 103398, "epoch": 2461} {"train_loss": -6.418822765350342, "global_step": 103399, "epoch": 2461} {"train_loss": -6.478054046630859, "global_step": 103400, "epoch": 2461} {"train_loss": -6.423708438873291, "global_step": 103401, "epoch": 2461} {"train_loss": -6.234636306762695, "global_step": 103402, "epoch": 2461} {"train_loss": -6.390354746863956, "global_step": 103403, "epoch": 2461, "val_loss": 76082.921875} {"train_loss": -6.281965732574463, "global_step": 103404, "epoch": 2462} {"train_loss": -6.415338516235352, "global_step": 103405, "epoch": 2462} {"train_loss": -6.253559589385986, "global_step": 103406, "epoch": 2462} {"train_loss": -6.2447919845581055, "global_step": 103407, "epoch": 2462} {"train_loss": -6.350395202636719, "global_step": 103408, "epoch": 2462} {"train_loss": -6.344470977783203, "global_step": 103409, "epoch": 2462} {"train_loss": -6.420734405517578, "global_step": 103410, "epoch": 2462} {"train_loss": -6.282047271728516, "global_step": 103411, "epoch": 2462} {"train_loss": -6.36020040512085, "global_step": 103412, "epoch": 2462} {"train_loss": -6.3769731521606445, "global_step": 103413, "epoch": 2462} {"train_loss": -6.389976501464844, "global_step": 103414, "epoch": 2462} {"train_loss": -6.444931507110596, "global_step": 103415, "epoch": 2462} {"train_loss": -6.362458229064941, "global_step": 103416, "epoch": 2462} {"train_loss": -6.4008941650390625, "global_step": 103417, "epoch": 2462} {"train_loss": -6.430152893066406, "global_step": 103418, "epoch": 2462} {"train_loss": -6.46673583984375, "global_step": 103419, "epoch": 2462} {"train_loss": -6.343076705932617, "global_step": 103420, "epoch": 2462} {"train_loss": -6.376480579376221, "global_step": 103421, "epoch": 2462} {"train_loss": -6.5353498458862305, "global_step": 103422, "epoch": 2462} {"train_loss": -6.492881774902344, "global_step": 103423, "epoch": 2462} {"train_loss": -6.385139465332031, "global_step": 103424, "epoch": 2462} {"train_loss": -6.492923736572266, "global_step": 103425, "epoch": 2462} {"train_loss": -6.376568794250488, "global_step": 103426, "epoch": 2462} {"train_loss": -6.174496650695801, "global_step": 103427, "epoch": 2462} {"train_loss": -6.379267692565918, "global_step": 103428, "epoch": 2462} {"train_loss": -6.397855758666992, "global_step": 103429, "epoch": 2462} {"train_loss": -6.412225723266602, "global_step": 103430, "epoch": 2462} {"train_loss": -6.409607410430908, "global_step": 103431, "epoch": 2462} {"train_loss": -6.459977149963379, "global_step": 103432, "epoch": 2462} {"train_loss": -6.412687301635742, "global_step": 103433, "epoch": 2462} {"train_loss": -6.373568534851074, "global_step": 103434, "epoch": 2462} {"train_loss": -6.4987592697143555, "global_step": 103435, "epoch": 2462} {"train_loss": -6.269318580627441, "global_step": 103436, "epoch": 2462} {"train_loss": -6.42184591293335, "global_step": 103437, "epoch": 2462} {"train_loss": -6.329421043395996, "global_step": 103438, "epoch": 2462} {"train_loss": -6.400402545928955, "global_step": 103439, "epoch": 2462} {"train_loss": -6.396642684936523, "global_step": 103440, "epoch": 2462} {"train_loss": -6.392128944396973, "global_step": 103441, "epoch": 2462} {"train_loss": -6.4454851150512695, "global_step": 103442, "epoch": 2462} {"train_loss": -6.394042491912842, "global_step": 103443, "epoch": 2462} {"train_loss": -6.437345504760742, "global_step": 103444, "epoch": 2462} {"train_loss": -6.386548541841053, "global_step": 103445, "epoch": 2462, "val_loss": 76046.890625} {"train_loss": -6.240057468414307, "global_step": 103446, "epoch": 2463} {"train_loss": -6.359196662902832, "global_step": 103447, "epoch": 2463} {"train_loss": -6.327297210693359, "global_step": 103448, "epoch": 2463} {"train_loss": -6.271393775939941, "global_step": 103449, "epoch": 2463} {"train_loss": -6.254072189331055, "global_step": 103450, "epoch": 2463} {"train_loss": -6.502202987670898, "global_step": 103451, "epoch": 2463} {"train_loss": -6.417850494384766, "global_step": 103452, "epoch": 2463} {"train_loss": -6.4399871826171875, "global_step": 103453, "epoch": 2463} {"train_loss": -6.449674606323242, "global_step": 103454, "epoch": 2463} {"train_loss": -6.296332836151123, "global_step": 103455, "epoch": 2463} {"train_loss": -6.494438171386719, "global_step": 103456, "epoch": 2463} {"train_loss": -6.363184452056885, "global_step": 103457, "epoch": 2463} {"train_loss": -6.505232334136963, "global_step": 103458, "epoch": 2463} {"train_loss": -6.313694000244141, "global_step": 103459, "epoch": 2463} {"train_loss": -6.466279983520508, "global_step": 103460, "epoch": 2463} {"train_loss": -6.229363441467285, "global_step": 103461, "epoch": 2463} {"train_loss": -6.3887553215026855, "global_step": 103462, "epoch": 2463} {"train_loss": -6.447918891906738, "global_step": 103463, "epoch": 2463} {"train_loss": -6.512889385223389, "global_step": 103464, "epoch": 2463} {"train_loss": -6.405194282531738, "global_step": 103465, "epoch": 2463} {"train_loss": -6.428221702575684, "global_step": 103466, "epoch": 2463} {"train_loss": -6.471767902374268, "global_step": 103467, "epoch": 2463} {"train_loss": -6.392009258270264, "global_step": 103468, "epoch": 2463} {"train_loss": -6.474606990814209, "global_step": 103469, "epoch": 2463} {"train_loss": -6.343393802642822, "global_step": 103470, "epoch": 2463} {"train_loss": -6.520381450653076, "global_step": 103471, "epoch": 2463} {"train_loss": -6.390887260437012, "global_step": 103472, "epoch": 2463} {"train_loss": -6.48071813583374, "global_step": 103473, "epoch": 2463} {"train_loss": -6.364606857299805, "global_step": 103474, "epoch": 2463} {"train_loss": -6.416789531707764, "global_step": 103475, "epoch": 2463} {"train_loss": -6.337445259094238, "global_step": 103476, "epoch": 2463} {"train_loss": -6.426882266998291, "global_step": 103477, "epoch": 2463} {"train_loss": -6.386582374572754, "global_step": 103478, "epoch": 2463} {"train_loss": -6.353391647338867, "global_step": 103479, "epoch": 2463} {"train_loss": -6.38137674331665, "global_step": 103480, "epoch": 2463} {"train_loss": -6.460926055908203, "global_step": 103481, "epoch": 2463} {"train_loss": -6.363002777099609, "global_step": 103482, "epoch": 2463} {"train_loss": -6.362064361572266, "global_step": 103483, "epoch": 2463} {"train_loss": -6.332744598388672, "global_step": 103484, "epoch": 2463} {"train_loss": -6.509902000427246, "global_step": 103485, "epoch": 2463} {"train_loss": -6.535672187805176, "global_step": 103486, "epoch": 2463} {"train_loss": -6.3992511204310825, "global_step": 103487, "epoch": 2463, "val_loss": 76240.9140625} {"train_loss": -6.398959636688232, "global_step": 103488, "epoch": 2464} {"train_loss": -6.454062461853027, "global_step": 103489, "epoch": 2464} {"train_loss": -6.358021259307861, "global_step": 103490, "epoch": 2464} {"train_loss": -6.421757698059082, "global_step": 103491, "epoch": 2464} {"train_loss": -6.319046497344971, "global_step": 103492, "epoch": 2464} {"train_loss": -6.417014122009277, "global_step": 103493, "epoch": 2464} {"train_loss": -6.34757137298584, "global_step": 103494, "epoch": 2464} {"train_loss": -6.396664619445801, "global_step": 103495, "epoch": 2464} {"train_loss": -6.462532043457031, "global_step": 103496, "epoch": 2464} {"train_loss": -6.2870330810546875, "global_step": 103497, "epoch": 2464} {"train_loss": -6.377534866333008, "global_step": 103498, "epoch": 2464} {"train_loss": -6.396853446960449, "global_step": 103499, "epoch": 2464} {"train_loss": -6.372323036193848, "global_step": 103500, "epoch": 2464} {"train_loss": -6.369172096252441, "global_step": 103501, "epoch": 2464} {"train_loss": -6.363452911376953, "global_step": 103502, "epoch": 2464} {"train_loss": -6.35073184967041, "global_step": 103503, "epoch": 2464} {"train_loss": -6.454462051391602, "global_step": 103504, "epoch": 2464} {"train_loss": -6.2615580558776855, "global_step": 103505, "epoch": 2464} {"train_loss": -6.3959760665893555, "global_step": 103506, "epoch": 2464} {"train_loss": -6.467728137969971, "global_step": 103507, "epoch": 2464} {"train_loss": -6.467040061950684, "global_step": 103508, "epoch": 2464} {"train_loss": -6.366170406341553, "global_step": 103509, "epoch": 2464} {"train_loss": -6.507248878479004, "global_step": 103510, "epoch": 2464} {"train_loss": -6.352601051330566, "global_step": 103511, "epoch": 2464} {"train_loss": -6.36464262008667, "global_step": 103512, "epoch": 2464} {"train_loss": -6.4111328125, "global_step": 103513, "epoch": 2464} {"train_loss": -6.380612373352051, "global_step": 103514, "epoch": 2464} {"train_loss": -6.42111873626709, "global_step": 103515, "epoch": 2464} {"train_loss": -6.463809013366699, "global_step": 103516, "epoch": 2464} {"train_loss": -6.412655830383301, "global_step": 103517, "epoch": 2464} {"train_loss": -6.281712532043457, "global_step": 103518, "epoch": 2464} {"train_loss": -6.340458869934082, "global_step": 103519, "epoch": 2464} {"train_loss": -6.316496849060059, "global_step": 103520, "epoch": 2464} {"train_loss": -6.446466445922852, "global_step": 103521, "epoch": 2464} {"train_loss": -6.331838607788086, "global_step": 103522, "epoch": 2464} {"train_loss": -6.3878960609436035, "global_step": 103523, "epoch": 2464} {"train_loss": -6.401152610778809, "global_step": 103524, "epoch": 2464} {"train_loss": -6.334292888641357, "global_step": 103525, "epoch": 2464} {"train_loss": -6.3649187088012695, "global_step": 103526, "epoch": 2464} {"train_loss": -6.405607223510742, "global_step": 103527, "epoch": 2464} {"train_loss": -6.462428092956543, "global_step": 103528, "epoch": 2464} {"train_loss": -6.388597136452084, "global_step": 103529, "epoch": 2464, "val_loss": 75744.171875} {"train_loss": -6.406403541564941, "global_step": 103530, "epoch": 2465} {"train_loss": -6.408413887023926, "global_step": 103531, "epoch": 2465} {"train_loss": -6.353342533111572, "global_step": 103532, "epoch": 2465} {"train_loss": -6.520956993103027, "global_step": 103533, "epoch": 2465} {"train_loss": -6.270286560058594, "global_step": 103534, "epoch": 2465} {"train_loss": -6.410003662109375, "global_step": 103535, "epoch": 2465} {"train_loss": -6.438072204589844, "global_step": 103536, "epoch": 2465} {"train_loss": -6.412960052490234, "global_step": 103537, "epoch": 2465} {"train_loss": -6.39825439453125, "global_step": 103538, "epoch": 2465} {"train_loss": -6.349265098571777, "global_step": 103539, "epoch": 2465} {"train_loss": -6.271629333496094, "global_step": 103540, "epoch": 2465} {"train_loss": -6.422093868255615, "global_step": 103541, "epoch": 2465} {"train_loss": -6.293918609619141, "global_step": 103542, "epoch": 2465} {"train_loss": -6.385976791381836, "global_step": 103543, "epoch": 2465} {"train_loss": -6.336189270019531, "global_step": 103544, "epoch": 2465} {"train_loss": -6.5195698738098145, "global_step": 103545, "epoch": 2465} {"train_loss": -6.358691215515137, "global_step": 103546, "epoch": 2465} {"train_loss": -6.329545974731445, "global_step": 103547, "epoch": 2465} {"train_loss": -6.435965538024902, "global_step": 103548, "epoch": 2465} {"train_loss": -6.456471920013428, "global_step": 103549, "epoch": 2465} {"train_loss": -6.315505027770996, "global_step": 103550, "epoch": 2465} {"train_loss": -6.293222427368164, "global_step": 103551, "epoch": 2465} {"train_loss": -6.437200546264648, "global_step": 103552, "epoch": 2465} {"train_loss": -6.456871032714844, "global_step": 103553, "epoch": 2465} {"train_loss": -6.338061332702637, "global_step": 103554, "epoch": 2465} {"train_loss": -6.480420112609863, "global_step": 103555, "epoch": 2465} {"train_loss": -6.378265380859375, "global_step": 103556, "epoch": 2465} {"train_loss": -6.383947849273682, "global_step": 103557, "epoch": 2465} {"train_loss": -6.512141227722168, "global_step": 103558, "epoch": 2465} {"train_loss": -6.1792778968811035, "global_step": 103559, "epoch": 2465} {"train_loss": -6.331902503967285, "global_step": 103560, "epoch": 2465} {"train_loss": -6.460443019866943, "global_step": 103561, "epoch": 2465} {"train_loss": -6.109950065612793, "global_step": 103562, "epoch": 2465} {"train_loss": -6.421243667602539, "global_step": 103563, "epoch": 2465} {"train_loss": -6.291857719421387, "global_step": 103564, "epoch": 2465} {"train_loss": -6.317288398742676, "global_step": 103565, "epoch": 2465} {"train_loss": -6.429676532745361, "global_step": 103566, "epoch": 2465} {"train_loss": -6.281900405883789, "global_step": 103567, "epoch": 2465} {"train_loss": -6.368134498596191, "global_step": 103568, "epoch": 2465} {"train_loss": -6.257683753967285, "global_step": 103569, "epoch": 2465} {"train_loss": -6.356009483337402, "global_step": 103570, "epoch": 2465} {"train_loss": -6.371428682690575, "global_step": 103571, "epoch": 2465, "val_loss": 75873.6328125} {"train_loss": -6.372625350952148, "global_step": 103572, "epoch": 2466} {"train_loss": -6.470865249633789, "global_step": 103573, "epoch": 2466} {"train_loss": -6.338082313537598, "global_step": 103574, "epoch": 2466} {"train_loss": -6.37164306640625, "global_step": 103575, "epoch": 2466} {"train_loss": -6.379909515380859, "global_step": 103576, "epoch": 2466} {"train_loss": -6.4925947189331055, "global_step": 103577, "epoch": 2466} {"train_loss": -6.413575172424316, "global_step": 103578, "epoch": 2466} {"train_loss": -6.263687610626221, "global_step": 103579, "epoch": 2466} {"train_loss": -6.357682704925537, "global_step": 103580, "epoch": 2466} {"train_loss": -6.440266132354736, "global_step": 103581, "epoch": 2466} {"train_loss": -6.400683879852295, "global_step": 103582, "epoch": 2466} {"train_loss": -6.376211166381836, "global_step": 103583, "epoch": 2466} {"train_loss": -6.556066989898682, "global_step": 103584, "epoch": 2466} {"train_loss": -6.40630578994751, "global_step": 103585, "epoch": 2466} {"train_loss": -6.371120452880859, "global_step": 103586, "epoch": 2466} {"train_loss": -6.399080276489258, "global_step": 103587, "epoch": 2466} {"train_loss": -6.473883628845215, "global_step": 103588, "epoch": 2466} {"train_loss": -6.476116180419922, "global_step": 103589, "epoch": 2466} {"train_loss": -6.526090621948242, "global_step": 103590, "epoch": 2466} {"train_loss": -6.444596767425537, "global_step": 103591, "epoch": 2466} {"train_loss": -6.323511600494385, "global_step": 103592, "epoch": 2466} {"train_loss": -6.450949668884277, "global_step": 103593, "epoch": 2466} {"train_loss": -6.363593578338623, "global_step": 103594, "epoch": 2466} {"train_loss": -6.347294807434082, "global_step": 103595, "epoch": 2466} {"train_loss": -6.404074192047119, "global_step": 103596, "epoch": 2466} {"train_loss": -6.268317222595215, "global_step": 103597, "epoch": 2466} {"train_loss": -6.353820323944092, "global_step": 103598, "epoch": 2466} {"train_loss": -6.404252052307129, "global_step": 103599, "epoch": 2466} {"train_loss": -6.45140266418457, "global_step": 103600, "epoch": 2466} {"train_loss": -6.534391403198242, "global_step": 103601, "epoch": 2466} {"train_loss": -6.385879993438721, "global_step": 103602, "epoch": 2466} {"train_loss": -6.385237693786621, "global_step": 103603, "epoch": 2466} {"train_loss": -6.410946846008301, "global_step": 103604, "epoch": 2466} {"train_loss": -6.373881816864014, "global_step": 103605, "epoch": 2466} {"train_loss": -6.39859676361084, "global_step": 103606, "epoch": 2466} {"train_loss": -6.41751766204834, "global_step": 103607, "epoch": 2466} {"train_loss": -6.569397926330566, "global_step": 103608, "epoch": 2466} {"train_loss": -6.5068511962890625, "global_step": 103609, "epoch": 2466} {"train_loss": -6.42746114730835, "global_step": 103610, "epoch": 2466} {"train_loss": -6.445852279663086, "global_step": 103611, "epoch": 2466} {"train_loss": -6.405599117279053, "global_step": 103612, "epoch": 2466} {"train_loss": -6.412211951755342, "global_step": 103613, "epoch": 2466, "val_loss": 75977.484375} {"train_loss": -6.4909820556640625, "global_step": 103614, "epoch": 2467} {"train_loss": -6.419933319091797, "global_step": 103615, "epoch": 2467} {"train_loss": -6.393754005432129, "global_step": 103616, "epoch": 2467} {"train_loss": -6.443744659423828, "global_step": 103617, "epoch": 2467} {"train_loss": -6.475670337677002, "global_step": 103618, "epoch": 2467} {"train_loss": -6.4359588623046875, "global_step": 103619, "epoch": 2467} {"train_loss": -6.444894790649414, "global_step": 103620, "epoch": 2467} {"train_loss": -6.460613250732422, "global_step": 103621, "epoch": 2467} {"train_loss": -6.337196350097656, "global_step": 103622, "epoch": 2467} {"train_loss": -6.393676280975342, "global_step": 103623, "epoch": 2467} {"train_loss": -6.481419563293457, "global_step": 103624, "epoch": 2467} {"train_loss": -6.311746120452881, "global_step": 103625, "epoch": 2467} {"train_loss": -6.460392951965332, "global_step": 103626, "epoch": 2467} {"train_loss": -6.375, "global_step": 103627, "epoch": 2467} {"train_loss": -6.419207572937012, "global_step": 103628, "epoch": 2467} {"train_loss": -6.4120683670043945, "global_step": 103629, "epoch": 2467} {"train_loss": -6.437450408935547, "global_step": 103630, "epoch": 2467} {"train_loss": -6.392786979675293, "global_step": 103631, "epoch": 2467} {"train_loss": -6.4550652503967285, "global_step": 103632, "epoch": 2467} {"train_loss": -6.389366626739502, "global_step": 103633, "epoch": 2467} {"train_loss": -6.365627288818359, "global_step": 103634, "epoch": 2467} {"train_loss": -6.384626388549805, "global_step": 103635, "epoch": 2467} {"train_loss": -6.332390785217285, "global_step": 103636, "epoch": 2467} {"train_loss": -6.587080001831055, "global_step": 103637, "epoch": 2467} {"train_loss": -6.455267906188965, "global_step": 103638, "epoch": 2467} {"train_loss": -6.464815139770508, "global_step": 103639, "epoch": 2467} {"train_loss": -6.4485626220703125, "global_step": 103640, "epoch": 2467} {"train_loss": -6.421548366546631, "global_step": 103641, "epoch": 2467} {"train_loss": -6.469635009765625, "global_step": 103642, "epoch": 2467} {"train_loss": -6.312946796417236, "global_step": 103643, "epoch": 2467} {"train_loss": -6.4817352294921875, "global_step": 103644, "epoch": 2467} {"train_loss": -6.438984394073486, "global_step": 103645, "epoch": 2467} {"train_loss": -6.509112358093262, "global_step": 103646, "epoch": 2467} {"train_loss": -6.367353439331055, "global_step": 103647, "epoch": 2467} {"train_loss": -6.332334518432617, "global_step": 103648, "epoch": 2467} {"train_loss": -6.3467116355896, "global_step": 103649, "epoch": 2467} {"train_loss": -6.419260025024414, "global_step": 103650, "epoch": 2467} {"train_loss": -6.3437652587890625, "global_step": 103651, "epoch": 2467} {"train_loss": -6.435156345367432, "global_step": 103652, "epoch": 2467} {"train_loss": -6.518847465515137, "global_step": 103653, "epoch": 2467} {"train_loss": -6.380303859710693, "global_step": 103654, "epoch": 2467} {"train_loss": -6.421113525118146, "global_step": 103655, "epoch": 2467, "val_loss": 76056.8359375} {"train_loss": -6.393441200256348, "global_step": 103656, "epoch": 2468} {"train_loss": -6.355554103851318, "global_step": 103657, "epoch": 2468} {"train_loss": -6.444771766662598, "global_step": 103658, "epoch": 2468} {"train_loss": -6.379260063171387, "global_step": 103659, "epoch": 2468} {"train_loss": -6.398930549621582, "global_step": 103660, "epoch": 2468} {"train_loss": -6.369956970214844, "global_step": 103661, "epoch": 2468} {"train_loss": -6.351418972015381, "global_step": 103662, "epoch": 2468} {"train_loss": -6.352566719055176, "global_step": 103663, "epoch": 2468} {"train_loss": -6.321715831756592, "global_step": 103664, "epoch": 2468} {"train_loss": -6.322699546813965, "global_step": 103665, "epoch": 2468} {"train_loss": -6.396492004394531, "global_step": 103666, "epoch": 2468} {"train_loss": -6.371265411376953, "global_step": 103667, "epoch": 2468} {"train_loss": -6.395044326782227, "global_step": 103668, "epoch": 2468} {"train_loss": -6.522459506988525, "global_step": 103669, "epoch": 2468} {"train_loss": -6.314154148101807, "global_step": 103670, "epoch": 2468} {"train_loss": -6.414400577545166, "global_step": 103671, "epoch": 2468} {"train_loss": -6.488136291503906, "global_step": 103672, "epoch": 2468} {"train_loss": -6.3963189125061035, "global_step": 103673, "epoch": 2468} {"train_loss": -6.452146053314209, "global_step": 103674, "epoch": 2468} {"train_loss": -6.442481517791748, "global_step": 103675, "epoch": 2468} {"train_loss": -6.346168041229248, "global_step": 103676, "epoch": 2468} {"train_loss": -6.391669273376465, "global_step": 103677, "epoch": 2468} {"train_loss": -6.33012580871582, "global_step": 103678, "epoch": 2468} {"train_loss": -6.369557857513428, "global_step": 103679, "epoch": 2468} {"train_loss": -6.361196517944336, "global_step": 103680, "epoch": 2468} {"train_loss": -6.433011054992676, "global_step": 103681, "epoch": 2468} {"train_loss": -6.35880184173584, "global_step": 103682, "epoch": 2468} {"train_loss": -6.435614585876465, "global_step": 103683, "epoch": 2468} {"train_loss": -6.382823467254639, "global_step": 103684, "epoch": 2468} {"train_loss": -6.310667514801025, "global_step": 103685, "epoch": 2468} {"train_loss": -6.425264835357666, "global_step": 103686, "epoch": 2468} {"train_loss": -6.358818054199219, "global_step": 103687, "epoch": 2468} {"train_loss": -6.336895942687988, "global_step": 103688, "epoch": 2468} {"train_loss": -6.4253129959106445, "global_step": 103689, "epoch": 2468} {"train_loss": -6.352104663848877, "global_step": 103690, "epoch": 2468} {"train_loss": -6.338571548461914, "global_step": 103691, "epoch": 2468} {"train_loss": -6.421082973480225, "global_step": 103692, "epoch": 2468} {"train_loss": -6.432105541229248, "global_step": 103693, "epoch": 2468} {"train_loss": -6.425863742828369, "global_step": 103694, "epoch": 2468} {"train_loss": -6.512135982513428, "global_step": 103695, "epoch": 2468} {"train_loss": -6.529780387878418, "global_step": 103696, "epoch": 2468} {"train_loss": -6.395883446648007, "global_step": 103697, "epoch": 2468, "val_loss": 75985.609375} {"train_loss": -6.378393650054932, "global_step": 103698, "epoch": 2469} {"train_loss": -6.386260032653809, "global_step": 103699, "epoch": 2469} {"train_loss": -6.449429512023926, "global_step": 103700, "epoch": 2469} {"train_loss": -6.444348335266113, "global_step": 103701, "epoch": 2469} {"train_loss": -6.469464302062988, "global_step": 103702, "epoch": 2469} {"train_loss": -6.349753379821777, "global_step": 103703, "epoch": 2469} {"train_loss": -6.521638870239258, "global_step": 103704, "epoch": 2469} {"train_loss": -6.35004997253418, "global_step": 103705, "epoch": 2469} {"train_loss": -6.487565040588379, "global_step": 103706, "epoch": 2469} {"train_loss": -6.477255821228027, "global_step": 103707, "epoch": 2469} {"train_loss": -6.430694103240967, "global_step": 103708, "epoch": 2469} {"train_loss": -6.447381496429443, "global_step": 103709, "epoch": 2469} {"train_loss": -6.40340518951416, "global_step": 103710, "epoch": 2469} {"train_loss": -6.430839538574219, "global_step": 103711, "epoch": 2469} {"train_loss": -6.50213623046875, "global_step": 103712, "epoch": 2469} {"train_loss": -6.496865749359131, "global_step": 103713, "epoch": 2469} {"train_loss": -6.455849647521973, "global_step": 103714, "epoch": 2469} {"train_loss": -6.371485710144043, "global_step": 103715, "epoch": 2469} {"train_loss": -6.403800010681152, "global_step": 103716, "epoch": 2469} {"train_loss": -6.515618324279785, "global_step": 103717, "epoch": 2469} {"train_loss": -6.480203628540039, "global_step": 103718, "epoch": 2469} {"train_loss": -6.3318562507629395, "global_step": 103719, "epoch": 2469} {"train_loss": -6.346151351928711, "global_step": 103720, "epoch": 2469} {"train_loss": -6.444015026092529, "global_step": 103721, "epoch": 2469} {"train_loss": -6.417293071746826, "global_step": 103722, "epoch": 2469} {"train_loss": -6.341085433959961, "global_step": 103723, "epoch": 2469} {"train_loss": -6.394503593444824, "global_step": 103724, "epoch": 2469} {"train_loss": -6.490917682647705, "global_step": 103725, "epoch": 2469} {"train_loss": -6.340729236602783, "global_step": 103726, "epoch": 2469} {"train_loss": -6.325006484985352, "global_step": 103727, "epoch": 2469} {"train_loss": -6.407870769500732, "global_step": 103728, "epoch": 2469} {"train_loss": -6.355538368225098, "global_step": 103729, "epoch": 2469} {"train_loss": -6.396252632141113, "global_step": 103730, "epoch": 2469} {"train_loss": -6.4599504470825195, "global_step": 103731, "epoch": 2469} {"train_loss": -6.455163955688477, "global_step": 103732, "epoch": 2469} {"train_loss": -6.384626388549805, "global_step": 103733, "epoch": 2469} {"train_loss": -6.250290393829346, "global_step": 103734, "epoch": 2469} {"train_loss": -6.348528861999512, "global_step": 103735, "epoch": 2469} {"train_loss": -6.365657806396484, "global_step": 103736, "epoch": 2469} {"train_loss": -6.345462322235107, "global_step": 103737, "epoch": 2469} {"train_loss": -6.393052101135254, "global_step": 103738, "epoch": 2469} {"train_loss": -6.40862919035412, "global_step": 103739, "epoch": 2469, "val_loss": 76081.46875} {"train_loss": -6.341602325439453, "global_step": 103740, "epoch": 2470} {"train_loss": -6.380205154418945, "global_step": 103741, "epoch": 2470} {"train_loss": -6.342540740966797, "global_step": 103742, "epoch": 2470} {"train_loss": -6.356677532196045, "global_step": 103743, "epoch": 2470} {"train_loss": -6.365894317626953, "global_step": 103744, "epoch": 2470} {"train_loss": -6.450255870819092, "global_step": 103745, "epoch": 2470} {"train_loss": -6.430047988891602, "global_step": 103746, "epoch": 2470} {"train_loss": -6.364781379699707, "global_step": 103747, "epoch": 2470} {"train_loss": -6.372133255004883, "global_step": 103748, "epoch": 2470} {"train_loss": -6.433778762817383, "global_step": 103749, "epoch": 2470} {"train_loss": -6.451374530792236, "global_step": 103750, "epoch": 2470} {"train_loss": -6.39666223526001, "global_step": 103751, "epoch": 2470} {"train_loss": -6.371556758880615, "global_step": 103752, "epoch": 2470} {"train_loss": -6.390874862670898, "global_step": 103753, "epoch": 2470} {"train_loss": -6.287675857543945, "global_step": 103754, "epoch": 2470} {"train_loss": -6.479896068572998, "global_step": 103755, "epoch": 2470} {"train_loss": -6.39506721496582, "global_step": 103756, "epoch": 2470} {"train_loss": -6.281486511230469, "global_step": 103757, "epoch": 2470} {"train_loss": -6.318303108215332, "global_step": 103758, "epoch": 2470} {"train_loss": -6.451244354248047, "global_step": 103759, "epoch": 2470} {"train_loss": -6.334427833557129, "global_step": 103760, "epoch": 2470} {"train_loss": -6.339113712310791, "global_step": 103761, "epoch": 2470} {"train_loss": -6.514975547790527, "global_step": 103762, "epoch": 2470} {"train_loss": -6.435019016265869, "global_step": 103763, "epoch": 2470} {"train_loss": -6.4155073165893555, "global_step": 103764, "epoch": 2470} {"train_loss": -6.426496505737305, "global_step": 103765, "epoch": 2470} {"train_loss": -6.378419876098633, "global_step": 103766, "epoch": 2470} {"train_loss": -6.375212669372559, "global_step": 103767, "epoch": 2470} {"train_loss": -6.343400955200195, "global_step": 103768, "epoch": 2470} {"train_loss": -6.334073543548584, "global_step": 103769, "epoch": 2470} {"train_loss": -6.3759074211120605, "global_step": 103770, "epoch": 2470} {"train_loss": -6.287908554077148, "global_step": 103771, "epoch": 2470} {"train_loss": -6.2814202308654785, "global_step": 103772, "epoch": 2470} {"train_loss": -6.4442973136901855, "global_step": 103773, "epoch": 2470} {"train_loss": -6.304858684539795, "global_step": 103774, "epoch": 2470} {"train_loss": -6.388678073883057, "global_step": 103775, "epoch": 2470} {"train_loss": -6.20667839050293, "global_step": 103776, "epoch": 2470} {"train_loss": -6.5475358963012695, "global_step": 103777, "epoch": 2470} {"train_loss": -6.389284133911133, "global_step": 103778, "epoch": 2470} {"train_loss": -6.398775577545166, "global_step": 103779, "epoch": 2470} {"train_loss": -6.380186080932617, "global_step": 103780, "epoch": 2470} {"train_loss": -6.381634825751895, "global_step": 103781, "epoch": 2470, "val_loss": 75970.484375} {"train_loss": -6.4495038986206055, "global_step": 103782, "epoch": 2471} {"train_loss": -6.236870765686035, "global_step": 103783, "epoch": 2471} {"train_loss": -6.284311294555664, "global_step": 103784, "epoch": 2471} {"train_loss": -6.438284873962402, "global_step": 103785, "epoch": 2471} {"train_loss": -6.344137191772461, "global_step": 103786, "epoch": 2471} {"train_loss": -6.346871376037598, "global_step": 103787, "epoch": 2471} {"train_loss": -6.441123008728027, "global_step": 103788, "epoch": 2471} {"train_loss": -6.385245323181152, "global_step": 103789, "epoch": 2471} {"train_loss": -6.3752336502075195, "global_step": 103790, "epoch": 2471} {"train_loss": -6.340207099914551, "global_step": 103791, "epoch": 2471} {"train_loss": -6.383013725280762, "global_step": 103792, "epoch": 2471} {"train_loss": -6.185366630554199, "global_step": 103793, "epoch": 2471} {"train_loss": -6.17616081237793, "global_step": 103794, "epoch": 2471} {"train_loss": -6.276827812194824, "global_step": 103795, "epoch": 2471} {"train_loss": -6.280674934387207, "global_step": 103796, "epoch": 2471} {"train_loss": -6.29771089553833, "global_step": 103797, "epoch": 2471} {"train_loss": -6.362081050872803, "global_step": 103798, "epoch": 2471} {"train_loss": -6.392451286315918, "global_step": 103799, "epoch": 2471} {"train_loss": -6.371004104614258, "global_step": 103800, "epoch": 2471} {"train_loss": -6.337569713592529, "global_step": 103801, "epoch": 2471} {"train_loss": -6.44872522354126, "global_step": 103802, "epoch": 2471} {"train_loss": -6.371441841125488, "global_step": 103803, "epoch": 2471} {"train_loss": -6.264698028564453, "global_step": 103804, "epoch": 2471} {"train_loss": -6.386970520019531, "global_step": 103805, "epoch": 2471} {"train_loss": -6.273703575134277, "global_step": 103806, "epoch": 2471} {"train_loss": -6.472990989685059, "global_step": 103807, "epoch": 2471} {"train_loss": -6.282892227172852, "global_step": 103808, "epoch": 2471} {"train_loss": -6.348020553588867, "global_step": 103809, "epoch": 2471} {"train_loss": -6.289501190185547, "global_step": 103810, "epoch": 2471} {"train_loss": -6.335925102233887, "global_step": 103811, "epoch": 2471} {"train_loss": -6.37435245513916, "global_step": 103812, "epoch": 2471} {"train_loss": -6.350585460662842, "global_step": 103813, "epoch": 2471} {"train_loss": -6.359539985656738, "global_step": 103814, "epoch": 2471} {"train_loss": -6.2978925704956055, "global_step": 103815, "epoch": 2471} {"train_loss": -6.438386917114258, "global_step": 103816, "epoch": 2471} {"train_loss": -6.329216957092285, "global_step": 103817, "epoch": 2471} {"train_loss": -6.405928611755371, "global_step": 103818, "epoch": 2471} {"train_loss": -6.360602378845215, "global_step": 103819, "epoch": 2471} {"train_loss": -6.259068965911865, "global_step": 103820, "epoch": 2471} {"train_loss": -6.288127899169922, "global_step": 103821, "epoch": 2471} {"train_loss": -6.3927998542785645, "global_step": 103822, "epoch": 2471} {"train_loss": -6.340317328770955, "global_step": 103823, "epoch": 2471, "val_loss": 75907.3515625} {"train_loss": -6.376448631286621, "global_step": 103824, "epoch": 2472} {"train_loss": -6.422247409820557, "global_step": 103825, "epoch": 2472} {"train_loss": -6.345905303955078, "global_step": 103826, "epoch": 2472} {"train_loss": -6.291234970092773, "global_step": 103827, "epoch": 2472} {"train_loss": -6.357713222503662, "global_step": 103828, "epoch": 2472} {"train_loss": -6.431954860687256, "global_step": 103829, "epoch": 2472} {"train_loss": -6.237969398498535, "global_step": 103830, "epoch": 2472} {"train_loss": -6.357499122619629, "global_step": 103831, "epoch": 2472} {"train_loss": -6.3634796142578125, "global_step": 103832, "epoch": 2472} {"train_loss": -6.315638065338135, "global_step": 103833, "epoch": 2472} {"train_loss": -6.348910808563232, "global_step": 103834, "epoch": 2472} {"train_loss": -6.432137489318848, "global_step": 103835, "epoch": 2472} {"train_loss": -6.303396701812744, "global_step": 103836, "epoch": 2472} {"train_loss": -6.310098171234131, "global_step": 103837, "epoch": 2472} {"train_loss": -6.442586898803711, "global_step": 103838, "epoch": 2472} {"train_loss": -6.36492919921875, "global_step": 103839, "epoch": 2472} {"train_loss": -6.372188568115234, "global_step": 103840, "epoch": 2472} {"train_loss": -6.424918174743652, "global_step": 103841, "epoch": 2472} {"train_loss": -6.335086822509766, "global_step": 103842, "epoch": 2472} {"train_loss": -6.324295997619629, "global_step": 103843, "epoch": 2472} {"train_loss": -6.483623027801514, "global_step": 103844, "epoch": 2472} {"train_loss": -6.366763114929199, "global_step": 103845, "epoch": 2472} {"train_loss": -6.491036415100098, "global_step": 103846, "epoch": 2472} {"train_loss": -6.319817066192627, "global_step": 103847, "epoch": 2472} {"train_loss": -6.3478851318359375, "global_step": 103848, "epoch": 2472} {"train_loss": -6.390506744384766, "global_step": 103849, "epoch": 2472} {"train_loss": -6.213454246520996, "global_step": 103850, "epoch": 2472} {"train_loss": -6.355423927307129, "global_step": 103851, "epoch": 2472} {"train_loss": -6.391146659851074, "global_step": 103852, "epoch": 2472} {"train_loss": -6.324824333190918, "global_step": 103853, "epoch": 2472} {"train_loss": -6.371274471282959, "global_step": 103854, "epoch": 2472} {"train_loss": -6.275486469268799, "global_step": 103855, "epoch": 2472} {"train_loss": -6.421719551086426, "global_step": 103856, "epoch": 2472} {"train_loss": -6.460206508636475, "global_step": 103857, "epoch": 2472} {"train_loss": -6.1740312576293945, "global_step": 103858, "epoch": 2472} {"train_loss": -6.354523658752441, "global_step": 103859, "epoch": 2472} {"train_loss": -6.407404899597168, "global_step": 103860, "epoch": 2472} {"train_loss": -6.28419828414917, "global_step": 103861, "epoch": 2472} {"train_loss": -6.516266822814941, "global_step": 103862, "epoch": 2472} {"train_loss": -6.338864326477051, "global_step": 103863, "epoch": 2472} {"train_loss": -6.40938663482666, "global_step": 103864, "epoch": 2472} {"train_loss": -6.359771876108079, "global_step": 103865, "epoch": 2472, "val_loss": 75605.2578125} {"train_loss": -6.399503707885742, "global_step": 103866, "epoch": 2473} {"train_loss": -6.475639343261719, "global_step": 103867, "epoch": 2473} {"train_loss": -6.389302730560303, "global_step": 103868, "epoch": 2473} {"train_loss": -6.4235029220581055, "global_step": 103869, "epoch": 2473} {"train_loss": -6.382481575012207, "global_step": 103870, "epoch": 2473} {"train_loss": -6.46202278137207, "global_step": 103871, "epoch": 2473} {"train_loss": -6.430537223815918, "global_step": 103872, "epoch": 2473} {"train_loss": -6.4690093994140625, "global_step": 103873, "epoch": 2473} {"train_loss": -6.376060485839844, "global_step": 103874, "epoch": 2473} {"train_loss": -6.354036331176758, "global_step": 103875, "epoch": 2473} {"train_loss": -6.3267974853515625, "global_step": 103876, "epoch": 2473} {"train_loss": -6.4483747482299805, "global_step": 103877, "epoch": 2473} {"train_loss": -6.435216426849365, "global_step": 103878, "epoch": 2473} {"train_loss": -6.494985580444336, "global_step": 103879, "epoch": 2473} {"train_loss": -6.381649971008301, "global_step": 103880, "epoch": 2473} {"train_loss": -6.530558109283447, "global_step": 103881, "epoch": 2473} {"train_loss": -6.434512615203857, "global_step": 103882, "epoch": 2473} {"train_loss": -6.424567699432373, "global_step": 103883, "epoch": 2473} {"train_loss": -6.400486946105957, "global_step": 103884, "epoch": 2473} {"train_loss": -6.430728912353516, "global_step": 103885, "epoch": 2473} {"train_loss": -6.490324020385742, "global_step": 103886, "epoch": 2473} {"train_loss": -6.377436637878418, "global_step": 103887, "epoch": 2473} {"train_loss": -6.408560752868652, "global_step": 103888, "epoch": 2473} {"train_loss": -6.449639320373535, "global_step": 103889, "epoch": 2473} {"train_loss": -6.380395889282227, "global_step": 103890, "epoch": 2473} {"train_loss": -6.495647430419922, "global_step": 103891, "epoch": 2473} {"train_loss": -6.324891090393066, "global_step": 103892, "epoch": 2473} {"train_loss": -6.5195817947387695, "global_step": 103893, "epoch": 2473} {"train_loss": -6.387072563171387, "global_step": 103894, "epoch": 2473} {"train_loss": -6.559165000915527, "global_step": 103895, "epoch": 2473} {"train_loss": -6.509159088134766, "global_step": 103896, "epoch": 2473} {"train_loss": -6.447850227355957, "global_step": 103897, "epoch": 2473} {"train_loss": -6.42572021484375, "global_step": 103898, "epoch": 2473} {"train_loss": -6.490778923034668, "global_step": 103899, "epoch": 2473} {"train_loss": -6.378908157348633, "global_step": 103900, "epoch": 2473} {"train_loss": -6.4163665771484375, "global_step": 103901, "epoch": 2473} {"train_loss": -6.356137275695801, "global_step": 103902, "epoch": 2473} {"train_loss": -6.319308280944824, "global_step": 103903, "epoch": 2473} {"train_loss": -6.330389976501465, "global_step": 103904, "epoch": 2473} {"train_loss": -6.453865051269531, "global_step": 103905, "epoch": 2473} {"train_loss": -6.377425193786621, "global_step": 103906, "epoch": 2473} {"train_loss": -6.4208306812104725, "global_step": 103907, "epoch": 2473, "val_loss": 76115.46875} {"train_loss": -6.4688029289245605, "global_step": 103908, "epoch": 2474} {"train_loss": -6.395542144775391, "global_step": 103909, "epoch": 2474} {"train_loss": -6.4565958976745605, "global_step": 103910, "epoch": 2474} {"train_loss": -6.416248798370361, "global_step": 103911, "epoch": 2474} {"train_loss": -6.378523349761963, "global_step": 103912, "epoch": 2474} {"train_loss": -6.379693031311035, "global_step": 103913, "epoch": 2474} {"train_loss": -6.431906700134277, "global_step": 103914, "epoch": 2474} {"train_loss": -6.428921699523926, "global_step": 103915, "epoch": 2474} {"train_loss": -6.4311676025390625, "global_step": 103916, "epoch": 2474} {"train_loss": -6.37787389755249, "global_step": 103917, "epoch": 2474} {"train_loss": -6.316786766052246, "global_step": 103918, "epoch": 2474} {"train_loss": -6.343805313110352, "global_step": 103919, "epoch": 2474} {"train_loss": -6.437661170959473, "global_step": 103920, "epoch": 2474} {"train_loss": -6.478518486022949, "global_step": 103921, "epoch": 2474} {"train_loss": -6.478709697723389, "global_step": 103922, "epoch": 2474} {"train_loss": -6.435018539428711, "global_step": 103923, "epoch": 2474} {"train_loss": -6.385101318359375, "global_step": 103924, "epoch": 2474} {"train_loss": -6.56304931640625, "global_step": 103925, "epoch": 2474} {"train_loss": -6.492974758148193, "global_step": 103926, "epoch": 2474} {"train_loss": -6.397076606750488, "global_step": 103927, "epoch": 2474} {"train_loss": -6.451594829559326, "global_step": 103928, "epoch": 2474} {"train_loss": -6.4000420570373535, "global_step": 103929, "epoch": 2474} {"train_loss": -6.399499893188477, "global_step": 103930, "epoch": 2474} {"train_loss": -6.503289222717285, "global_step": 103931, "epoch": 2474} {"train_loss": -6.468481540679932, "global_step": 103932, "epoch": 2474} {"train_loss": -6.320371627807617, "global_step": 103933, "epoch": 2474} {"train_loss": -6.386935234069824, "global_step": 103934, "epoch": 2474} {"train_loss": -6.451544761657715, "global_step": 103935, "epoch": 2474} {"train_loss": -6.379560470581055, "global_step": 103936, "epoch": 2474} {"train_loss": -6.466500282287598, "global_step": 103937, "epoch": 2474} {"train_loss": -6.416417121887207, "global_step": 103938, "epoch": 2474} {"train_loss": -6.220653057098389, "global_step": 103939, "epoch": 2474} {"train_loss": -6.345105171203613, "global_step": 103940, "epoch": 2474} {"train_loss": -6.447384834289551, "global_step": 103941, "epoch": 2474} {"train_loss": -6.45731782913208, "global_step": 103942, "epoch": 2474} {"train_loss": -6.455938339233398, "global_step": 103943, "epoch": 2474} {"train_loss": -6.258443832397461, "global_step": 103944, "epoch": 2474} {"train_loss": -6.468880653381348, "global_step": 103945, "epoch": 2474} {"train_loss": -6.488463401794434, "global_step": 103946, "epoch": 2474} {"train_loss": -6.370391845703125, "global_step": 103947, "epoch": 2474} {"train_loss": -6.266552925109863, "global_step": 103948, "epoch": 2474} {"train_loss": -6.413700614656721, "global_step": 103949, "epoch": 2474, "val_loss": 76097.9921875} {"train_loss": -6.378335475921631, "global_step": 103950, "epoch": 2475} {"train_loss": -6.307442665100098, "global_step": 103951, "epoch": 2475} {"train_loss": -6.416553497314453, "global_step": 103952, "epoch": 2475} {"train_loss": -6.366729736328125, "global_step": 103953, "epoch": 2475} {"train_loss": -6.408985137939453, "global_step": 103954, "epoch": 2475} {"train_loss": -6.374792575836182, "global_step": 103955, "epoch": 2475} {"train_loss": -6.454010009765625, "global_step": 103956, "epoch": 2475} {"train_loss": -6.495934009552002, "global_step": 103957, "epoch": 2475} {"train_loss": -6.396488189697266, "global_step": 103958, "epoch": 2475} {"train_loss": -6.3941802978515625, "global_step": 103959, "epoch": 2475} {"train_loss": -6.355974197387695, "global_step": 103960, "epoch": 2475} {"train_loss": -6.424862861633301, "global_step": 103961, "epoch": 2475} {"train_loss": -6.260779857635498, "global_step": 103962, "epoch": 2475} {"train_loss": -6.409884452819824, "global_step": 103963, "epoch": 2475} {"train_loss": -6.38554048538208, "global_step": 103964, "epoch": 2475} {"train_loss": -6.338747024536133, "global_step": 103965, "epoch": 2475} {"train_loss": -6.4416584968566895, "global_step": 103966, "epoch": 2475} {"train_loss": -6.358066558837891, "global_step": 103967, "epoch": 2475} {"train_loss": -6.415197372436523, "global_step": 103968, "epoch": 2475} {"train_loss": -6.353761196136475, "global_step": 103969, "epoch": 2475} {"train_loss": -6.299724578857422, "global_step": 103970, "epoch": 2475} {"train_loss": -6.319332122802734, "global_step": 103971, "epoch": 2475} {"train_loss": -6.366756439208984, "global_step": 103972, "epoch": 2475} {"train_loss": -6.368836402893066, "global_step": 103973, "epoch": 2475} {"train_loss": -6.302013397216797, "global_step": 103974, "epoch": 2475} {"train_loss": -6.345889568328857, "global_step": 103975, "epoch": 2475} {"train_loss": -6.439187526702881, "global_step": 103976, "epoch": 2475} {"train_loss": -6.30068826675415, "global_step": 103977, "epoch": 2475} {"train_loss": -6.435218334197998, "global_step": 103978, "epoch": 2475} {"train_loss": -6.440934181213379, "global_step": 103979, "epoch": 2475} {"train_loss": -6.395936965942383, "global_step": 103980, "epoch": 2475} {"train_loss": -6.397790431976318, "global_step": 103981, "epoch": 2475} {"train_loss": -6.366827964782715, "global_step": 103982, "epoch": 2475} {"train_loss": -6.303808212280273, "global_step": 103983, "epoch": 2475} {"train_loss": -6.3577375411987305, "global_step": 103984, "epoch": 2475} {"train_loss": -6.478841781616211, "global_step": 103985, "epoch": 2475} {"train_loss": -6.450740337371826, "global_step": 103986, "epoch": 2475} {"train_loss": -6.362462997436523, "global_step": 103987, "epoch": 2475} {"train_loss": -6.4510321617126465, "global_step": 103988, "epoch": 2475} {"train_loss": -6.195922374725342, "global_step": 103989, "epoch": 2475} {"train_loss": -6.219944000244141, "global_step": 103990, "epoch": 2475} {"train_loss": -6.3778613067808605, "global_step": 103991, "epoch": 2475, "val_loss": 75901.53125} {"train_loss": -6.464649200439453, "global_step": 103992, "epoch": 2476} {"train_loss": -6.391232490539551, "global_step": 103993, "epoch": 2476} {"train_loss": -6.443178176879883, "global_step": 103994, "epoch": 2476} {"train_loss": -6.397700786590576, "global_step": 103995, "epoch": 2476} {"train_loss": -6.276534080505371, "global_step": 103996, "epoch": 2476} {"train_loss": -6.452630996704102, "global_step": 103997, "epoch": 2476} {"train_loss": -6.476332664489746, "global_step": 103998, "epoch": 2476} {"train_loss": -6.459364891052246, "global_step": 103999, "epoch": 2476} {"train_loss": -6.488957405090332, "global_step": 104000, "epoch": 2476} {"train_loss": -6.39666748046875, "global_step": 104001, "epoch": 2476} {"train_loss": -6.404345989227295, "global_step": 104002, "epoch": 2476} {"train_loss": -6.449940204620361, "global_step": 104003, "epoch": 2476} {"train_loss": -6.449809551239014, "global_step": 104004, "epoch": 2476} {"train_loss": -6.550440788269043, "global_step": 104005, "epoch": 2476} {"train_loss": -6.312160015106201, "global_step": 104006, "epoch": 2476} {"train_loss": -6.461389541625977, "global_step": 104007, "epoch": 2476} {"train_loss": -6.432156562805176, "global_step": 104008, "epoch": 2476} {"train_loss": -6.4405083656311035, "global_step": 104009, "epoch": 2476} {"train_loss": -6.353209972381592, "global_step": 104010, "epoch": 2476} {"train_loss": -6.526235580444336, "global_step": 104011, "epoch": 2476} {"train_loss": -6.49433708190918, "global_step": 104012, "epoch": 2476} {"train_loss": -6.52415132522583, "global_step": 104013, "epoch": 2476} {"train_loss": -6.325465202331543, "global_step": 104014, "epoch": 2476} {"train_loss": -6.5176215171813965, "global_step": 104015, "epoch": 2476} {"train_loss": -6.4423112869262695, "global_step": 104016, "epoch": 2476} {"train_loss": -6.4111762046813965, "global_step": 104017, "epoch": 2476} {"train_loss": -6.353116989135742, "global_step": 104018, "epoch": 2476} {"train_loss": -6.429988861083984, "global_step": 104019, "epoch": 2476} {"train_loss": -6.352331161499023, "global_step": 104020, "epoch": 2476} {"train_loss": -6.381598949432373, "global_step": 104021, "epoch": 2476} {"train_loss": -6.362714767456055, "global_step": 104022, "epoch": 2476} {"train_loss": -6.392870903015137, "global_step": 104023, "epoch": 2476} {"train_loss": -6.567691802978516, "global_step": 104024, "epoch": 2476} {"train_loss": -6.332509517669678, "global_step": 104025, "epoch": 2476} {"train_loss": -6.303386211395264, "global_step": 104026, "epoch": 2476} {"train_loss": -6.407503128051758, "global_step": 104027, "epoch": 2476} {"train_loss": -6.203784942626953, "global_step": 104028, "epoch": 2476} {"train_loss": -6.256562232971191, "global_step": 104029, "epoch": 2476} {"train_loss": -6.40379524230957, "global_step": 104030, "epoch": 2476} {"train_loss": -6.187019348144531, "global_step": 104031, "epoch": 2476} {"train_loss": -6.29470682144165, "global_step": 104032, "epoch": 2476} {"train_loss": -6.401413906188238, "global_step": 104033, "epoch": 2476, "val_loss": 76155.5390625} {"train_loss": -6.389202117919922, "global_step": 104034, "epoch": 2477} {"train_loss": -6.350872039794922, "global_step": 104035, "epoch": 2477} {"train_loss": -6.325497627258301, "global_step": 104036, "epoch": 2477} {"train_loss": -6.29173469543457, "global_step": 104037, "epoch": 2477} {"train_loss": -6.270534515380859, "global_step": 104038, "epoch": 2477} {"train_loss": -6.451767921447754, "global_step": 104039, "epoch": 2477} {"train_loss": -6.173577308654785, "global_step": 104040, "epoch": 2477} {"train_loss": -6.236329078674316, "global_step": 104041, "epoch": 2477} {"train_loss": -6.335844993591309, "global_step": 104042, "epoch": 2477} {"train_loss": -6.274374961853027, "global_step": 104043, "epoch": 2477} {"train_loss": -6.316790580749512, "global_step": 104044, "epoch": 2477} {"train_loss": -6.360116481781006, "global_step": 104045, "epoch": 2477} {"train_loss": -6.373680591583252, "global_step": 104046, "epoch": 2477} {"train_loss": -6.3118438720703125, "global_step": 104047, "epoch": 2477} {"train_loss": -6.334626197814941, "global_step": 104048, "epoch": 2477} {"train_loss": -6.311814785003662, "global_step": 104049, "epoch": 2477} {"train_loss": -6.374255657196045, "global_step": 104050, "epoch": 2477} {"train_loss": -6.49777889251709, "global_step": 104051, "epoch": 2477} {"train_loss": -6.341551780700684, "global_step": 104052, "epoch": 2477} {"train_loss": -6.377846717834473, "global_step": 104053, "epoch": 2477} {"train_loss": -6.42536735534668, "global_step": 104054, "epoch": 2477} {"train_loss": -6.409848690032959, "global_step": 104055, "epoch": 2477} {"train_loss": -6.397954940795898, "global_step": 104056, "epoch": 2477} {"train_loss": -6.343846797943115, "global_step": 104057, "epoch": 2477} {"train_loss": -6.375723838806152, "global_step": 104058, "epoch": 2477} {"train_loss": -6.398244857788086, "global_step": 104059, "epoch": 2477} {"train_loss": -6.371992111206055, "global_step": 104060, "epoch": 2477} {"train_loss": -6.36531925201416, "global_step": 104061, "epoch": 2477} {"train_loss": -6.4051032066345215, "global_step": 104062, "epoch": 2477} {"train_loss": -6.334248065948486, "global_step": 104063, "epoch": 2477} {"train_loss": -6.187707901000977, "global_step": 104064, "epoch": 2477} {"train_loss": -6.281466960906982, "global_step": 104065, "epoch": 2477} {"train_loss": -6.545345306396484, "global_step": 104066, "epoch": 2477} {"train_loss": -6.354562759399414, "global_step": 104067, "epoch": 2477} {"train_loss": -6.325481414794922, "global_step": 104068, "epoch": 2477} {"train_loss": -6.397181510925293, "global_step": 104069, "epoch": 2477} {"train_loss": -6.457691192626953, "global_step": 104070, "epoch": 2477} {"train_loss": -6.290609359741211, "global_step": 104071, "epoch": 2477} {"train_loss": -6.529812812805176, "global_step": 104072, "epoch": 2477} {"train_loss": -6.306468486785889, "global_step": 104073, "epoch": 2477} {"train_loss": -6.447946548461914, "global_step": 104074, "epoch": 2477} {"train_loss": -6.359595105761573, "global_step": 104075, "epoch": 2477, "val_loss": 76135.3515625} {"train_loss": -6.472362518310547, "global_step": 104076, "epoch": 2478} {"train_loss": -6.42057991027832, "global_step": 104077, "epoch": 2478} {"train_loss": -6.420434951782227, "global_step": 104078, "epoch": 2478} {"train_loss": -6.409855842590332, "global_step": 104079, "epoch": 2478} {"train_loss": -6.510212421417236, "global_step": 104080, "epoch": 2478} {"train_loss": -6.362533092498779, "global_step": 104081, "epoch": 2478} {"train_loss": -6.4004058837890625, "global_step": 104082, "epoch": 2478} {"train_loss": -6.42372989654541, "global_step": 104083, "epoch": 2478} {"train_loss": -6.455504417419434, "global_step": 104084, "epoch": 2478} {"train_loss": -6.452084541320801, "global_step": 104085, "epoch": 2478} {"train_loss": -6.449533462524414, "global_step": 104086, "epoch": 2478} {"train_loss": -6.461836814880371, "global_step": 104087, "epoch": 2478} {"train_loss": -6.4068603515625, "global_step": 104088, "epoch": 2478} {"train_loss": -6.474111557006836, "global_step": 104089, "epoch": 2478} {"train_loss": -6.4243364334106445, "global_step": 104090, "epoch": 2478} {"train_loss": -6.45046329498291, "global_step": 104091, "epoch": 2478} {"train_loss": -6.470239162445068, "global_step": 104092, "epoch": 2478} {"train_loss": -6.364500522613525, "global_step": 104093, "epoch": 2478} {"train_loss": -6.443800926208496, "global_step": 104094, "epoch": 2478} {"train_loss": -6.442861080169678, "global_step": 104095, "epoch": 2478} {"train_loss": -6.283514976501465, "global_step": 104096, "epoch": 2478} {"train_loss": -6.433960914611816, "global_step": 104097, "epoch": 2478} {"train_loss": -6.35621452331543, "global_step": 104098, "epoch": 2478} {"train_loss": -6.428794860839844, "global_step": 104099, "epoch": 2478} {"train_loss": -6.391571521759033, "global_step": 104100, "epoch": 2478} {"train_loss": -6.526843547821045, "global_step": 104101, "epoch": 2478} {"train_loss": -6.437224388122559, "global_step": 104102, "epoch": 2478} {"train_loss": -6.308704853057861, "global_step": 104103, "epoch": 2478} {"train_loss": -6.312005043029785, "global_step": 104104, "epoch": 2478} {"train_loss": -6.318268299102783, "global_step": 104105, "epoch": 2478} {"train_loss": -6.223272323608398, "global_step": 104106, "epoch": 2478} {"train_loss": -6.446396827697754, "global_step": 104107, "epoch": 2478} {"train_loss": -6.473081588745117, "global_step": 104108, "epoch": 2478} {"train_loss": -6.254581928253174, "global_step": 104109, "epoch": 2478} {"train_loss": -6.49814510345459, "global_step": 104110, "epoch": 2478} {"train_loss": -6.440097332000732, "global_step": 104111, "epoch": 2478} {"train_loss": -6.386852741241455, "global_step": 104112, "epoch": 2478} {"train_loss": -6.365334510803223, "global_step": 104113, "epoch": 2478} {"train_loss": -6.518918991088867, "global_step": 104114, "epoch": 2478} {"train_loss": -6.299400329589844, "global_step": 104115, "epoch": 2478} {"train_loss": -6.268292427062988, "global_step": 104116, "epoch": 2478} {"train_loss": -6.408236537660871, "global_step": 104117, "epoch": 2478, "val_loss": 75875.984375} {"train_loss": -6.334428787231445, "global_step": 104118, "epoch": 2479} {"train_loss": -6.489529132843018, "global_step": 104119, "epoch": 2479} {"train_loss": -6.459975242614746, "global_step": 104120, "epoch": 2479} {"train_loss": -6.456412315368652, "global_step": 104121, "epoch": 2479} {"train_loss": -6.536652088165283, "global_step": 104122, "epoch": 2479} {"train_loss": -6.304502487182617, "global_step": 104123, "epoch": 2479} {"train_loss": -6.350709915161133, "global_step": 104124, "epoch": 2479} {"train_loss": -6.410599708557129, "global_step": 104125, "epoch": 2479} {"train_loss": -6.379941940307617, "global_step": 104126, "epoch": 2479} {"train_loss": -6.236011505126953, "global_step": 104127, "epoch": 2479} {"train_loss": -6.321175575256348, "global_step": 104128, "epoch": 2479} {"train_loss": -6.363519668579102, "global_step": 104129, "epoch": 2479} {"train_loss": -6.2031660079956055, "global_step": 104130, "epoch": 2479} {"train_loss": -6.412568092346191, "global_step": 104131, "epoch": 2479} {"train_loss": -6.328623294830322, "global_step": 104132, "epoch": 2479} {"train_loss": -6.4235005378723145, "global_step": 104133, "epoch": 2479} {"train_loss": -6.491768836975098, "global_step": 104134, "epoch": 2479} {"train_loss": -6.413327217102051, "global_step": 104135, "epoch": 2479} {"train_loss": -6.3413262367248535, "global_step": 104136, "epoch": 2479} {"train_loss": -6.397304534912109, "global_step": 104137, "epoch": 2479} {"train_loss": -6.32476806640625, "global_step": 104138, "epoch": 2479} {"train_loss": -6.344547748565674, "global_step": 104139, "epoch": 2479} {"train_loss": -6.262279510498047, "global_step": 104140, "epoch": 2479} {"train_loss": -6.346470832824707, "global_step": 104141, "epoch": 2479} {"train_loss": -6.4382781982421875, "global_step": 104142, "epoch": 2479} {"train_loss": -6.266282081604004, "global_step": 104143, "epoch": 2479} {"train_loss": -6.354047775268555, "global_step": 104144, "epoch": 2479} {"train_loss": -6.322782039642334, "global_step": 104145, "epoch": 2479} {"train_loss": -6.4004716873168945, "global_step": 104146, "epoch": 2479} {"train_loss": -6.509462356567383, "global_step": 104147, "epoch": 2479} {"train_loss": -6.27604866027832, "global_step": 104148, "epoch": 2479} {"train_loss": -6.352175712585449, "global_step": 104149, "epoch": 2479} {"train_loss": -6.395150184631348, "global_step": 104150, "epoch": 2479} {"train_loss": -6.397667407989502, "global_step": 104151, "epoch": 2479} {"train_loss": -6.345351219177246, "global_step": 104152, "epoch": 2479} {"train_loss": -6.441476345062256, "global_step": 104153, "epoch": 2479} {"train_loss": -6.264634132385254, "global_step": 104154, "epoch": 2479} {"train_loss": -6.415118217468262, "global_step": 104155, "epoch": 2479} {"train_loss": -6.388764381408691, "global_step": 104156, "epoch": 2479} {"train_loss": -6.450845241546631, "global_step": 104157, "epoch": 2479} {"train_loss": -6.315629482269287, "global_step": 104158, "epoch": 2479} {"train_loss": -6.373013553165254, "global_step": 104159, "epoch": 2479, "val_loss": 75845.09375} {"train_loss": -6.36521053314209, "global_step": 104160, "epoch": 2480} {"train_loss": -6.274483680725098, "global_step": 104161, "epoch": 2480} {"train_loss": -6.413471221923828, "global_step": 104162, "epoch": 2480} {"train_loss": -6.319655418395996, "global_step": 104163, "epoch": 2480} {"train_loss": -6.480381011962891, "global_step": 104164, "epoch": 2480} {"train_loss": -6.3936262130737305, "global_step": 104165, "epoch": 2480} {"train_loss": -6.457357406616211, "global_step": 104166, "epoch": 2480} {"train_loss": -6.235957145690918, "global_step": 104167, "epoch": 2480} {"train_loss": -6.352364540100098, "global_step": 104168, "epoch": 2480} {"train_loss": -6.542586326599121, "global_step": 104169, "epoch": 2480} {"train_loss": -6.259477615356445, "global_step": 104170, "epoch": 2480} {"train_loss": -6.323651313781738, "global_step": 104171, "epoch": 2480} {"train_loss": -6.38683557510376, "global_step": 104172, "epoch": 2480} {"train_loss": -6.427590847015381, "global_step": 104173, "epoch": 2480} {"train_loss": -6.480947971343994, "global_step": 104174, "epoch": 2480} {"train_loss": -6.298232078552246, "global_step": 104175, "epoch": 2480} {"train_loss": -6.490762710571289, "global_step": 104176, "epoch": 2480} {"train_loss": -6.377851486206055, "global_step": 104177, "epoch": 2480} {"train_loss": -6.372648239135742, "global_step": 104178, "epoch": 2480} {"train_loss": -6.598433494567871, "global_step": 104179, "epoch": 2480} {"train_loss": -6.313930988311768, "global_step": 104180, "epoch": 2480} {"train_loss": -6.345572471618652, "global_step": 104181, "epoch": 2480} {"train_loss": -6.5359368324279785, "global_step": 104182, "epoch": 2480} {"train_loss": -6.324068546295166, "global_step": 104183, "epoch": 2480} {"train_loss": -6.274142265319824, "global_step": 104184, "epoch": 2480} {"train_loss": -6.44212007522583, "global_step": 104185, "epoch": 2480} {"train_loss": -6.3766350746154785, "global_step": 104186, "epoch": 2480} {"train_loss": -6.409249305725098, "global_step": 104187, "epoch": 2480} {"train_loss": -6.380335807800293, "global_step": 104188, "epoch": 2480} {"train_loss": -6.450127124786377, "global_step": 104189, "epoch": 2480} {"train_loss": -6.426236629486084, "global_step": 104190, "epoch": 2480} {"train_loss": -6.5148749351501465, "global_step": 104191, "epoch": 2480} {"train_loss": -6.463350296020508, "global_step": 104192, "epoch": 2480} {"train_loss": -6.41682243347168, "global_step": 104193, "epoch": 2480} {"train_loss": -6.426443099975586, "global_step": 104194, "epoch": 2480} {"train_loss": -6.421548843383789, "global_step": 104195, "epoch": 2480} {"train_loss": -6.444730758666992, "global_step": 104196, "epoch": 2480} {"train_loss": -6.311016082763672, "global_step": 104197, "epoch": 2480} {"train_loss": -6.370301723480225, "global_step": 104198, "epoch": 2480} {"train_loss": -6.407706260681152, "global_step": 104199, "epoch": 2480} {"train_loss": -6.330688953399658, "global_step": 104200, "epoch": 2480} {"train_loss": -6.3969016415732245, "global_step": 104201, "epoch": 2480, "val_loss": 75903.2890625} {"train_loss": -6.393363952636719, "global_step": 104202, "epoch": 2481} {"train_loss": -6.249527931213379, "global_step": 104203, "epoch": 2481} {"train_loss": -6.354875087738037, "global_step": 104204, "epoch": 2481} {"train_loss": -6.377038955688477, "global_step": 104205, "epoch": 2481} {"train_loss": -6.413453578948975, "global_step": 104206, "epoch": 2481} {"train_loss": -6.311575889587402, "global_step": 104207, "epoch": 2481} {"train_loss": -6.529644012451172, "global_step": 104208, "epoch": 2481} {"train_loss": -6.5208821296691895, "global_step": 104209, "epoch": 2481} {"train_loss": -6.405636310577393, "global_step": 104210, "epoch": 2481} {"train_loss": -6.411563873291016, "global_step": 104211, "epoch": 2481} {"train_loss": -6.3760199546813965, "global_step": 104212, "epoch": 2481} {"train_loss": -6.203332901000977, "global_step": 104213, "epoch": 2481} {"train_loss": -6.44078254699707, "global_step": 104214, "epoch": 2481} {"train_loss": -6.388822078704834, "global_step": 104215, "epoch": 2481} {"train_loss": -6.2742204666137695, "global_step": 104216, "epoch": 2481} {"train_loss": -6.47722053527832, "global_step": 104217, "epoch": 2481} {"train_loss": -6.303549289703369, "global_step": 104218, "epoch": 2481} {"train_loss": -6.413714408874512, "global_step": 104219, "epoch": 2481} {"train_loss": -6.46811580657959, "global_step": 104220, "epoch": 2481} {"train_loss": -6.271660327911377, "global_step": 104221, "epoch": 2481} {"train_loss": -6.404729843139648, "global_step": 104222, "epoch": 2481} {"train_loss": -6.336297035217285, "global_step": 104223, "epoch": 2481} {"train_loss": -6.47779655456543, "global_step": 104224, "epoch": 2481} {"train_loss": -6.328037261962891, "global_step": 104225, "epoch": 2481} {"train_loss": -6.262975692749023, "global_step": 104226, "epoch": 2481} {"train_loss": -6.3850507736206055, "global_step": 104227, "epoch": 2481} {"train_loss": -6.331830978393555, "global_step": 104228, "epoch": 2481} {"train_loss": -6.4749555587768555, "global_step": 104229, "epoch": 2481} {"train_loss": -6.452011585235596, "global_step": 104230, "epoch": 2481} {"train_loss": -6.349145412445068, "global_step": 104231, "epoch": 2481} {"train_loss": -6.458169937133789, "global_step": 104232, "epoch": 2481} {"train_loss": -6.50528621673584, "global_step": 104233, "epoch": 2481} {"train_loss": -6.379091262817383, "global_step": 104234, "epoch": 2481} {"train_loss": -6.474929332733154, "global_step": 104235, "epoch": 2481} {"train_loss": -6.335424900054932, "global_step": 104236, "epoch": 2481} {"train_loss": -6.44672155380249, "global_step": 104237, "epoch": 2481} {"train_loss": -6.393722057342529, "global_step": 104238, "epoch": 2481} {"train_loss": -6.411368370056152, "global_step": 104239, "epoch": 2481} {"train_loss": -6.50008487701416, "global_step": 104240, "epoch": 2481} {"train_loss": -6.311041831970215, "global_step": 104241, "epoch": 2481} {"train_loss": -6.431118965148926, "global_step": 104242, "epoch": 2481} {"train_loss": -6.389614332289923, "global_step": 104243, "epoch": 2481, "val_loss": 75903.734375} {"train_loss": -6.427600860595703, "global_step": 104244, "epoch": 2482} {"train_loss": -6.507575035095215, "global_step": 104245, "epoch": 2482} {"train_loss": -6.427788257598877, "global_step": 104246, "epoch": 2482} {"train_loss": -6.432955741882324, "global_step": 104247, "epoch": 2482} {"train_loss": -6.438653469085693, "global_step": 104248, "epoch": 2482} {"train_loss": -6.364828586578369, "global_step": 104249, "epoch": 2482} {"train_loss": -6.2654829025268555, "global_step": 104250, "epoch": 2482} {"train_loss": -6.428729057312012, "global_step": 104251, "epoch": 2482} {"train_loss": -6.423734664916992, "global_step": 104252, "epoch": 2482} {"train_loss": -6.334755897521973, "global_step": 104253, "epoch": 2482} {"train_loss": -6.449599266052246, "global_step": 104254, "epoch": 2482} {"train_loss": -6.350040912628174, "global_step": 104255, "epoch": 2482} {"train_loss": -6.426048755645752, "global_step": 104256, "epoch": 2482} {"train_loss": -6.487591743469238, "global_step": 104257, "epoch": 2482} {"train_loss": -6.449124336242676, "global_step": 104258, "epoch": 2482} {"train_loss": -6.461360931396484, "global_step": 104259, "epoch": 2482} {"train_loss": -6.451085090637207, "global_step": 104260, "epoch": 2482} {"train_loss": -6.348562240600586, "global_step": 104261, "epoch": 2482} {"train_loss": -6.405463218688965, "global_step": 104262, "epoch": 2482} {"train_loss": -6.442034721374512, "global_step": 104263, "epoch": 2482} {"train_loss": -6.4642229080200195, "global_step": 104264, "epoch": 2482} {"train_loss": -6.444888114929199, "global_step": 104265, "epoch": 2482} {"train_loss": -6.411893844604492, "global_step": 104266, "epoch": 2482} {"train_loss": -6.345803260803223, "global_step": 104267, "epoch": 2482} {"train_loss": -6.467977523803711, "global_step": 104268, "epoch": 2482} {"train_loss": -6.465951919555664, "global_step": 104269, "epoch": 2482} {"train_loss": -6.456608295440674, "global_step": 104270, "epoch": 2482} {"train_loss": -6.320452690124512, "global_step": 104271, "epoch": 2482} {"train_loss": -6.375132083892822, "global_step": 104272, "epoch": 2482} {"train_loss": -6.4062700271606445, "global_step": 104273, "epoch": 2482} {"train_loss": -6.459701061248779, "global_step": 104274, "epoch": 2482} {"train_loss": -6.388704299926758, "global_step": 104275, "epoch": 2482} {"train_loss": -6.397221565246582, "global_step": 104276, "epoch": 2482} {"train_loss": -6.438580513000488, "global_step": 104277, "epoch": 2482} {"train_loss": -6.486172199249268, "global_step": 104278, "epoch": 2482} {"train_loss": -6.452984809875488, "global_step": 104279, "epoch": 2482} {"train_loss": -6.477643013000488, "global_step": 104280, "epoch": 2482} {"train_loss": -6.537475109100342, "global_step": 104281, "epoch": 2482} {"train_loss": -6.406350612640381, "global_step": 104282, "epoch": 2482} {"train_loss": -6.3032426834106445, "global_step": 104283, "epoch": 2482} {"train_loss": -6.395208835601807, "global_step": 104284, "epoch": 2482} {"train_loss": -6.41667492049081, "global_step": 104285, "epoch": 2482, "val_loss": 76429.9921875} {"train_loss": -6.271734714508057, "global_step": 104286, "epoch": 2483} {"train_loss": -6.442964553833008, "global_step": 104287, "epoch": 2483} {"train_loss": -6.324860572814941, "global_step": 104288, "epoch": 2483} {"train_loss": -6.366146564483643, "global_step": 104289, "epoch": 2483} {"train_loss": -6.361318588256836, "global_step": 104290, "epoch": 2483} {"train_loss": -6.362974166870117, "global_step": 104291, "epoch": 2483} {"train_loss": -6.299494743347168, "global_step": 104292, "epoch": 2483} {"train_loss": -6.261528968811035, "global_step": 104293, "epoch": 2483} {"train_loss": -6.340806007385254, "global_step": 104294, "epoch": 2483} {"train_loss": -6.231689929962158, "global_step": 104295, "epoch": 2483} {"train_loss": -6.197286605834961, "global_step": 104296, "epoch": 2483} {"train_loss": -6.219623565673828, "global_step": 104297, "epoch": 2483} {"train_loss": -6.260365009307861, "global_step": 104298, "epoch": 2483} {"train_loss": -6.235893249511719, "global_step": 104299, "epoch": 2483} {"train_loss": -6.38693904876709, "global_step": 104300, "epoch": 2483} {"train_loss": -6.226064682006836, "global_step": 104301, "epoch": 2483} {"train_loss": -6.355299949645996, "global_step": 104302, "epoch": 2483} {"train_loss": -6.298827171325684, "global_step": 104303, "epoch": 2483} {"train_loss": -6.372413158416748, "global_step": 104304, "epoch": 2483} {"train_loss": -6.365916728973389, "global_step": 104305, "epoch": 2483} {"train_loss": -6.384946823120117, "global_step": 104306, "epoch": 2483} {"train_loss": -6.289926528930664, "global_step": 104307, "epoch": 2483} {"train_loss": -6.279688835144043, "global_step": 104308, "epoch": 2483} {"train_loss": -6.277835845947266, "global_step": 104309, "epoch": 2483} {"train_loss": -6.308418273925781, "global_step": 104310, "epoch": 2483} {"train_loss": -6.306759834289551, "global_step": 104311, "epoch": 2483} {"train_loss": -6.342429161071777, "global_step": 104312, "epoch": 2483} {"train_loss": -6.2825446128845215, "global_step": 104313, "epoch": 2483} {"train_loss": -6.325966835021973, "global_step": 104314, "epoch": 2483} {"train_loss": -6.49608039855957, "global_step": 104315, "epoch": 2483} {"train_loss": -6.388589382171631, "global_step": 104316, "epoch": 2483} {"train_loss": -6.417731285095215, "global_step": 104317, "epoch": 2483} {"train_loss": -6.314109802246094, "global_step": 104318, "epoch": 2483} {"train_loss": -6.298252105712891, "global_step": 104319, "epoch": 2483} {"train_loss": -6.420948028564453, "global_step": 104320, "epoch": 2483} {"train_loss": -6.277749061584473, "global_step": 104321, "epoch": 2483} {"train_loss": -6.387795448303223, "global_step": 104322, "epoch": 2483} {"train_loss": -6.409677505493164, "global_step": 104323, "epoch": 2483} {"train_loss": -6.321083068847656, "global_step": 104324, "epoch": 2483} {"train_loss": -6.387090682983398, "global_step": 104325, "epoch": 2483} {"train_loss": -6.3712029457092285, "global_step": 104326, "epoch": 2483} {"train_loss": -6.330309935978481, "global_step": 104327, "epoch": 2483, "val_loss": 75994.296875} {"train_loss": -6.402197360992432, "global_step": 104328, "epoch": 2484} {"train_loss": -6.447333812713623, "global_step": 104329, "epoch": 2484} {"train_loss": -6.470952033996582, "global_step": 104330, "epoch": 2484} {"train_loss": -6.45063591003418, "global_step": 104331, "epoch": 2484} {"train_loss": -6.518059730529785, "global_step": 104332, "epoch": 2484} {"train_loss": -6.4740447998046875, "global_step": 104333, "epoch": 2484} {"train_loss": -6.417292594909668, "global_step": 104334, "epoch": 2484} {"train_loss": -6.410182952880859, "global_step": 104335, "epoch": 2484} {"train_loss": -6.328394889831543, "global_step": 104336, "epoch": 2484} {"train_loss": -6.389278888702393, "global_step": 104337, "epoch": 2484} {"train_loss": -6.287377834320068, "global_step": 104338, "epoch": 2484} {"train_loss": -6.533411502838135, "global_step": 104339, "epoch": 2484} {"train_loss": -6.4421539306640625, "global_step": 104340, "epoch": 2484} {"train_loss": -6.450690269470215, "global_step": 104341, "epoch": 2484} {"train_loss": -6.396439552307129, "global_step": 104342, "epoch": 2484} {"train_loss": -6.328039646148682, "global_step": 104343, "epoch": 2484} {"train_loss": -6.408239364624023, "global_step": 104344, "epoch": 2484} {"train_loss": -6.418780326843262, "global_step": 104345, "epoch": 2484} {"train_loss": -6.454927921295166, "global_step": 104346, "epoch": 2484} {"train_loss": -6.435032844543457, "global_step": 104347, "epoch": 2484} {"train_loss": -6.394596099853516, "global_step": 104348, "epoch": 2484} {"train_loss": -6.307163715362549, "global_step": 104349, "epoch": 2484} {"train_loss": -6.444870948791504, "global_step": 104350, "epoch": 2484} {"train_loss": -6.467059135437012, "global_step": 104351, "epoch": 2484} {"train_loss": -6.3776655197143555, "global_step": 104352, "epoch": 2484} {"train_loss": -6.492403984069824, "global_step": 104353, "epoch": 2484} {"train_loss": -6.421864032745361, "global_step": 104354, "epoch": 2484} {"train_loss": -6.345064163208008, "global_step": 104355, "epoch": 2484} {"train_loss": -6.363129138946533, "global_step": 104356, "epoch": 2484} {"train_loss": -6.455051898956299, "global_step": 104357, "epoch": 2484} {"train_loss": -6.398571014404297, "global_step": 104358, "epoch": 2484} {"train_loss": -6.498595237731934, "global_step": 104359, "epoch": 2484} {"train_loss": -6.294013977050781, "global_step": 104360, "epoch": 2484} {"train_loss": -6.412863731384277, "global_step": 104361, "epoch": 2484} {"train_loss": -6.409669876098633, "global_step": 104362, "epoch": 2484} {"train_loss": -6.421989440917969, "global_step": 104363, "epoch": 2484} {"train_loss": -6.362724304199219, "global_step": 104364, "epoch": 2484} {"train_loss": -6.394223690032959, "global_step": 104365, "epoch": 2484} {"train_loss": -6.498400688171387, "global_step": 104366, "epoch": 2484} {"train_loss": -6.413076400756836, "global_step": 104367, "epoch": 2484} {"train_loss": -6.47670841217041, "global_step": 104368, "epoch": 2484} {"train_loss": -6.415896642775762, "global_step": 104369, "epoch": 2484, "val_loss": 76162.203125} {"train_loss": -6.38811731338501, "global_step": 104370, "epoch": 2485} {"train_loss": -6.359785079956055, "global_step": 104371, "epoch": 2485} {"train_loss": -6.470552444458008, "global_step": 104372, "epoch": 2485} {"train_loss": -6.2905731201171875, "global_step": 104373, "epoch": 2485} {"train_loss": -6.477385997772217, "global_step": 104374, "epoch": 2485} {"train_loss": -6.459347724914551, "global_step": 104375, "epoch": 2485} {"train_loss": -6.425931930541992, "global_step": 104376, "epoch": 2485} {"train_loss": -6.381120681762695, "global_step": 104377, "epoch": 2485} {"train_loss": -6.347911834716797, "global_step": 104378, "epoch": 2485} {"train_loss": -6.438122272491455, "global_step": 104379, "epoch": 2485} {"train_loss": -6.437607288360596, "global_step": 104380, "epoch": 2485} {"train_loss": -6.3262763023376465, "global_step": 104381, "epoch": 2485} {"train_loss": -6.373936653137207, "global_step": 104382, "epoch": 2485} {"train_loss": -6.277771949768066, "global_step": 104383, "epoch": 2485} {"train_loss": -6.473613262176514, "global_step": 104384, "epoch": 2485} {"train_loss": -6.495102882385254, "global_step": 104385, "epoch": 2485} {"train_loss": -6.33176326751709, "global_step": 104386, "epoch": 2485} {"train_loss": -6.516305923461914, "global_step": 104387, "epoch": 2485} {"train_loss": -6.382598400115967, "global_step": 104388, "epoch": 2485} {"train_loss": -6.377649784088135, "global_step": 104389, "epoch": 2485} {"train_loss": -6.478348731994629, "global_step": 104390, "epoch": 2485} {"train_loss": -6.494688034057617, "global_step": 104391, "epoch": 2485} {"train_loss": -6.447853088378906, "global_step": 104392, "epoch": 2485} {"train_loss": -6.383642196655273, "global_step": 104393, "epoch": 2485} {"train_loss": -6.401507377624512, "global_step": 104394, "epoch": 2485} {"train_loss": -6.44336462020874, "global_step": 104395, "epoch": 2485} {"train_loss": -6.422093391418457, "global_step": 104396, "epoch": 2485} {"train_loss": -6.363826751708984, "global_step": 104397, "epoch": 2485} {"train_loss": -6.268514633178711, "global_step": 104398, "epoch": 2485} {"train_loss": -6.367954730987549, "global_step": 104399, "epoch": 2485} {"train_loss": -6.355877876281738, "global_step": 104400, "epoch": 2485} {"train_loss": -6.3145432472229, "global_step": 104401, "epoch": 2485} {"train_loss": -6.404857158660889, "global_step": 104402, "epoch": 2485} {"train_loss": -6.400421142578125, "global_step": 104403, "epoch": 2485} {"train_loss": -6.251804351806641, "global_step": 104404, "epoch": 2485} {"train_loss": -6.484401702880859, "global_step": 104405, "epoch": 2485} {"train_loss": -6.293914794921875, "global_step": 104406, "epoch": 2485} {"train_loss": -6.323582649230957, "global_step": 104407, "epoch": 2485} {"train_loss": -6.40837287902832, "global_step": 104408, "epoch": 2485} {"train_loss": -6.439083099365234, "global_step": 104409, "epoch": 2485} {"train_loss": -6.464831352233887, "global_step": 104410, "epoch": 2485} {"train_loss": -6.398050535292852, "global_step": 104411, "epoch": 2485, "val_loss": 75640.828125} {"train_loss": -6.368758201599121, "global_step": 104412, "epoch": 2486} {"train_loss": -6.336594104766846, "global_step": 104413, "epoch": 2486} {"train_loss": -6.463152885437012, "global_step": 104414, "epoch": 2486} {"train_loss": -6.241381645202637, "global_step": 104415, "epoch": 2486} {"train_loss": -6.357962608337402, "global_step": 104416, "epoch": 2486} {"train_loss": -6.4610185623168945, "global_step": 104417, "epoch": 2486} {"train_loss": -6.348752021789551, "global_step": 104418, "epoch": 2486} {"train_loss": -6.367603302001953, "global_step": 104419, "epoch": 2486} {"train_loss": -6.362565517425537, "global_step": 104420, "epoch": 2486} {"train_loss": -6.437495231628418, "global_step": 104421, "epoch": 2486} {"train_loss": -6.383858680725098, "global_step": 104422, "epoch": 2486} {"train_loss": -6.4377312660217285, "global_step": 104423, "epoch": 2486} {"train_loss": -6.477551460266113, "global_step": 104424, "epoch": 2486} {"train_loss": -6.416048049926758, "global_step": 104425, "epoch": 2486} {"train_loss": -6.540770530700684, "global_step": 104426, "epoch": 2486} {"train_loss": -6.341402053833008, "global_step": 104427, "epoch": 2486} {"train_loss": -6.272366523742676, "global_step": 104428, "epoch": 2486} {"train_loss": -6.400425910949707, "global_step": 104429, "epoch": 2486} {"train_loss": -6.405460357666016, "global_step": 104430, "epoch": 2486} {"train_loss": -6.3465800285339355, "global_step": 104431, "epoch": 2486} {"train_loss": -6.322772979736328, "global_step": 104432, "epoch": 2486} {"train_loss": -6.403058052062988, "global_step": 104433, "epoch": 2486} {"train_loss": -6.362370491027832, "global_step": 104434, "epoch": 2486} {"train_loss": -6.482203483581543, "global_step": 104435, "epoch": 2486} {"train_loss": -6.356698989868164, "global_step": 104436, "epoch": 2486} {"train_loss": -6.419255256652832, "global_step": 104437, "epoch": 2486} {"train_loss": -6.46340274810791, "global_step": 104438, "epoch": 2486} {"train_loss": -6.400824546813965, "global_step": 104439, "epoch": 2486} {"train_loss": -6.317913055419922, "global_step": 104440, "epoch": 2486} {"train_loss": -6.390761375427246, "global_step": 104441, "epoch": 2486} {"train_loss": -6.454054832458496, "global_step": 104442, "epoch": 2486} {"train_loss": -6.458236217498779, "global_step": 104443, "epoch": 2486} {"train_loss": -6.411877632141113, "global_step": 104444, "epoch": 2486} {"train_loss": -6.443427085876465, "global_step": 104445, "epoch": 2486} {"train_loss": -6.303256034851074, "global_step": 104446, "epoch": 2486} {"train_loss": -6.395308017730713, "global_step": 104447, "epoch": 2486} {"train_loss": -6.469336986541748, "global_step": 104448, "epoch": 2486} {"train_loss": -6.397477149963379, "global_step": 104449, "epoch": 2486} {"train_loss": -6.490846633911133, "global_step": 104450, "epoch": 2486} {"train_loss": -6.493453025817871, "global_step": 104451, "epoch": 2486} {"train_loss": -6.400839805603027, "global_step": 104452, "epoch": 2486} {"train_loss": -6.400385084606352, "global_step": 104453, "epoch": 2486, "val_loss": 75944.125} {"train_loss": -6.480656623840332, "global_step": 104454, "epoch": 2487} {"train_loss": -6.437483787536621, "global_step": 104455, "epoch": 2487} {"train_loss": -6.311162948608398, "global_step": 104456, "epoch": 2487} {"train_loss": -6.4022369384765625, "global_step": 104457, "epoch": 2487} {"train_loss": -6.508712291717529, "global_step": 104458, "epoch": 2487} {"train_loss": -6.4055376052856445, "global_step": 104459, "epoch": 2487} {"train_loss": -6.449317455291748, "global_step": 104460, "epoch": 2487} {"train_loss": -6.53908634185791, "global_step": 104461, "epoch": 2487} {"train_loss": -6.544987678527832, "global_step": 104462, "epoch": 2487} {"train_loss": -6.4019622802734375, "global_step": 104463, "epoch": 2487} {"train_loss": -6.430034160614014, "global_step": 104464, "epoch": 2487} {"train_loss": -6.506878852844238, "global_step": 104465, "epoch": 2487} {"train_loss": -6.388299942016602, "global_step": 104466, "epoch": 2487} {"train_loss": -6.411892890930176, "global_step": 104467, "epoch": 2487} {"train_loss": -6.611789703369141, "global_step": 104468, "epoch": 2487} {"train_loss": -6.37587833404541, "global_step": 104469, "epoch": 2487} {"train_loss": -6.463513374328613, "global_step": 104470, "epoch": 2487} {"train_loss": -6.415052890777588, "global_step": 104471, "epoch": 2487} {"train_loss": -6.453434944152832, "global_step": 104472, "epoch": 2487} {"train_loss": -6.414853096008301, "global_step": 104473, "epoch": 2487} {"train_loss": -6.561820983886719, "global_step": 104474, "epoch": 2487} {"train_loss": -6.392220497131348, "global_step": 104475, "epoch": 2487} {"train_loss": -6.338665962219238, "global_step": 104476, "epoch": 2487} {"train_loss": -6.354703903198242, "global_step": 104477, "epoch": 2487} {"train_loss": -6.375295639038086, "global_step": 104478, "epoch": 2487} {"train_loss": -6.355733871459961, "global_step": 104479, "epoch": 2487} {"train_loss": -6.310989856719971, "global_step": 104480, "epoch": 2487} {"train_loss": -6.476778030395508, "global_step": 104481, "epoch": 2487} {"train_loss": -6.233809471130371, "global_step": 104482, "epoch": 2487} {"train_loss": -6.288620471954346, "global_step": 104483, "epoch": 2487} {"train_loss": -6.303873062133789, "global_step": 104484, "epoch": 2487} {"train_loss": -6.342333793640137, "global_step": 104485, "epoch": 2487} {"train_loss": -6.364082336425781, "global_step": 104486, "epoch": 2487} {"train_loss": -6.468685150146484, "global_step": 104487, "epoch": 2487} {"train_loss": -6.33922004699707, "global_step": 104488, "epoch": 2487} {"train_loss": -6.419499397277832, "global_step": 104489, "epoch": 2487} {"train_loss": -6.321275234222412, "global_step": 104490, "epoch": 2487} {"train_loss": -6.365730285644531, "global_step": 104491, "epoch": 2487} {"train_loss": -6.461541175842285, "global_step": 104492, "epoch": 2487} {"train_loss": -6.288593292236328, "global_step": 104493, "epoch": 2487} {"train_loss": -6.34737491607666, "global_step": 104494, "epoch": 2487} {"train_loss": -6.406789018994286, "global_step": 104495, "epoch": 2487, "val_loss": 76389.3046875} {"train_loss": -6.356029987335205, "global_step": 104496, "epoch": 2488} {"train_loss": -6.402307033538818, "global_step": 104497, "epoch": 2488} {"train_loss": -6.332996845245361, "global_step": 104498, "epoch": 2488} {"train_loss": -6.436859130859375, "global_step": 104499, "epoch": 2488} {"train_loss": -6.373642921447754, "global_step": 104500, "epoch": 2488} {"train_loss": -6.218522548675537, "global_step": 104501, "epoch": 2488} {"train_loss": -6.397682189941406, "global_step": 104502, "epoch": 2488} {"train_loss": -6.336854934692383, "global_step": 104503, "epoch": 2488} {"train_loss": -6.391847610473633, "global_step": 104504, "epoch": 2488} {"train_loss": -6.410938262939453, "global_step": 104505, "epoch": 2488} {"train_loss": -6.350805282592773, "global_step": 104506, "epoch": 2488} {"train_loss": -6.450457572937012, "global_step": 104507, "epoch": 2488} {"train_loss": -6.292442321777344, "global_step": 104508, "epoch": 2488} {"train_loss": -6.35341215133667, "global_step": 104509, "epoch": 2488} {"train_loss": -6.346332550048828, "global_step": 104510, "epoch": 2488} {"train_loss": -6.329353332519531, "global_step": 104511, "epoch": 2488} {"train_loss": -6.331058979034424, "global_step": 104512, "epoch": 2488} {"train_loss": -6.3804931640625, "global_step": 104513, "epoch": 2488} {"train_loss": -6.306515693664551, "global_step": 104514, "epoch": 2488} {"train_loss": -6.377424240112305, "global_step": 104515, "epoch": 2488} {"train_loss": -6.352325439453125, "global_step": 104516, "epoch": 2488} {"train_loss": -6.395997047424316, "global_step": 104517, "epoch": 2488} {"train_loss": -6.43929386138916, "global_step": 104518, "epoch": 2488} {"train_loss": -6.308718681335449, "global_step": 104519, "epoch": 2488} {"train_loss": -6.3564453125, "global_step": 104520, "epoch": 2488} {"train_loss": -6.44167423248291, "global_step": 104521, "epoch": 2488} {"train_loss": -6.351729869842529, "global_step": 104522, "epoch": 2488} {"train_loss": -6.433028221130371, "global_step": 104523, "epoch": 2488} {"train_loss": -6.472938060760498, "global_step": 104524, "epoch": 2488} {"train_loss": -6.4624528884887695, "global_step": 104525, "epoch": 2488} {"train_loss": -6.361613750457764, "global_step": 104526, "epoch": 2488} {"train_loss": -6.476932525634766, "global_step": 104527, "epoch": 2488} {"train_loss": -6.417570114135742, "global_step": 104528, "epoch": 2488} {"train_loss": -6.477804183959961, "global_step": 104529, "epoch": 2488} {"train_loss": -6.335594654083252, "global_step": 104530, "epoch": 2488} {"train_loss": -6.400588035583496, "global_step": 104531, "epoch": 2488} {"train_loss": -6.407261848449707, "global_step": 104532, "epoch": 2488} {"train_loss": -6.46215295791626, "global_step": 104533, "epoch": 2488} {"train_loss": -6.430413246154785, "global_step": 104534, "epoch": 2488} {"train_loss": -6.419659614562988, "global_step": 104535, "epoch": 2488} {"train_loss": -6.3383941650390625, "global_step": 104536, "epoch": 2488} {"train_loss": -6.383346375964937, "global_step": 104537, "epoch": 2488, "val_loss": 75971.375} {"train_loss": -6.38139533996582, "global_step": 104538, "epoch": 2489} {"train_loss": -6.540663719177246, "global_step": 104539, "epoch": 2489} {"train_loss": -6.434142112731934, "global_step": 104540, "epoch": 2489} {"train_loss": -6.406091213226318, "global_step": 104541, "epoch": 2489} {"train_loss": -6.475309371948242, "global_step": 104542, "epoch": 2489} {"train_loss": -6.461816787719727, "global_step": 104543, "epoch": 2489} {"train_loss": -6.422379493713379, "global_step": 104544, "epoch": 2489} {"train_loss": -6.367286682128906, "global_step": 104545, "epoch": 2489} {"train_loss": -6.415709972381592, "global_step": 104546, "epoch": 2489} {"train_loss": -6.321184158325195, "global_step": 104547, "epoch": 2489} {"train_loss": -6.441367149353027, "global_step": 104548, "epoch": 2489} {"train_loss": -6.40097713470459, "global_step": 104549, "epoch": 2489} {"train_loss": -6.4463605880737305, "global_step": 104550, "epoch": 2489} {"train_loss": -6.367884635925293, "global_step": 104551, "epoch": 2489} {"train_loss": -6.532280445098877, "global_step": 104552, "epoch": 2489} {"train_loss": -6.47894287109375, "global_step": 104553, "epoch": 2489} {"train_loss": -6.35344123840332, "global_step": 104554, "epoch": 2489} {"train_loss": -6.296360015869141, "global_step": 104555, "epoch": 2489} {"train_loss": -6.429810523986816, "global_step": 104556, "epoch": 2489} {"train_loss": -6.407352447509766, "global_step": 104557, "epoch": 2489} {"train_loss": -6.500916004180908, "global_step": 104558, "epoch": 2489} {"train_loss": -6.463815689086914, "global_step": 104559, "epoch": 2489} {"train_loss": -6.330406188964844, "global_step": 104560, "epoch": 2489} {"train_loss": -6.471830368041992, "global_step": 104561, "epoch": 2489} {"train_loss": -6.431666851043701, "global_step": 104562, "epoch": 2489} {"train_loss": -6.354974269866943, "global_step": 104563, "epoch": 2489} {"train_loss": -6.500909805297852, "global_step": 104564, "epoch": 2489} {"train_loss": -6.444851398468018, "global_step": 104565, "epoch": 2489} {"train_loss": -6.490395545959473, "global_step": 104566, "epoch": 2489} {"train_loss": -6.463852882385254, "global_step": 104567, "epoch": 2489} {"train_loss": -6.29460334777832, "global_step": 104568, "epoch": 2489} {"train_loss": -6.521145343780518, "global_step": 104569, "epoch": 2489} {"train_loss": -6.404867649078369, "global_step": 104570, "epoch": 2489} {"train_loss": -6.335298538208008, "global_step": 104571, "epoch": 2489} {"train_loss": -6.284274578094482, "global_step": 104572, "epoch": 2489} {"train_loss": -6.535137176513672, "global_step": 104573, "epoch": 2489} {"train_loss": -6.425591945648193, "global_step": 104574, "epoch": 2489} {"train_loss": -6.473374843597412, "global_step": 104575, "epoch": 2489} {"train_loss": -6.440983772277832, "global_step": 104576, "epoch": 2489} {"train_loss": -6.443835258483887, "global_step": 104577, "epoch": 2489} {"train_loss": -6.4458723068237305, "global_step": 104578, "epoch": 2489} {"train_loss": -6.422906273887271, "global_step": 104579, "epoch": 2489, "val_loss": 76056.1484375} {"train_loss": -6.448686599731445, "global_step": 104580, "epoch": 2490} {"train_loss": -6.464272975921631, "global_step": 104581, "epoch": 2490} {"train_loss": -6.440173625946045, "global_step": 104582, "epoch": 2490} {"train_loss": -6.379077911376953, "global_step": 104583, "epoch": 2490} {"train_loss": -6.375645637512207, "global_step": 104584, "epoch": 2490} {"train_loss": -6.386504173278809, "global_step": 104585, "epoch": 2490} {"train_loss": -6.445931911468506, "global_step": 104586, "epoch": 2490} {"train_loss": -6.36867618560791, "global_step": 104587, "epoch": 2490} {"train_loss": -6.41358757019043, "global_step": 104588, "epoch": 2490} {"train_loss": -6.445494651794434, "global_step": 104589, "epoch": 2490} {"train_loss": -6.4359235763549805, "global_step": 104590, "epoch": 2490} {"train_loss": -6.410226345062256, "global_step": 104591, "epoch": 2490} {"train_loss": -6.412375450134277, "global_step": 104592, "epoch": 2490} {"train_loss": -6.23015022277832, "global_step": 104593, "epoch": 2490} {"train_loss": -6.334597587585449, "global_step": 104594, "epoch": 2490} {"train_loss": -6.340731620788574, "global_step": 104595, "epoch": 2490} {"train_loss": -6.366690635681152, "global_step": 104596, "epoch": 2490} {"train_loss": -6.358154296875, "global_step": 104597, "epoch": 2490} {"train_loss": -6.308011531829834, "global_step": 104598, "epoch": 2490} {"train_loss": -6.553526878356934, "global_step": 104599, "epoch": 2490} {"train_loss": -6.247323989868164, "global_step": 104600, "epoch": 2490} {"train_loss": -6.264114856719971, "global_step": 104601, "epoch": 2490} {"train_loss": -6.369436264038086, "global_step": 104602, "epoch": 2490} {"train_loss": -6.416049003601074, "global_step": 104603, "epoch": 2490} {"train_loss": -6.517519950866699, "global_step": 104604, "epoch": 2490} {"train_loss": -6.46688175201416, "global_step": 104605, "epoch": 2490} {"train_loss": -6.392772674560547, "global_step": 104606, "epoch": 2490} {"train_loss": -6.324239253997803, "global_step": 104607, "epoch": 2490} {"train_loss": -6.567531108856201, "global_step": 104608, "epoch": 2490} {"train_loss": -6.356529235839844, "global_step": 104609, "epoch": 2490} {"train_loss": -6.501371383666992, "global_step": 104610, "epoch": 2490} {"train_loss": -6.414548873901367, "global_step": 104611, "epoch": 2490} {"train_loss": -6.388445854187012, "global_step": 104612, "epoch": 2490} {"train_loss": -6.406244277954102, "global_step": 104613, "epoch": 2490} {"train_loss": -6.463352203369141, "global_step": 104614, "epoch": 2490} {"train_loss": -6.4823455810546875, "global_step": 104615, "epoch": 2490} {"train_loss": -6.440816879272461, "global_step": 104616, "epoch": 2490} {"train_loss": -6.427435874938965, "global_step": 104617, "epoch": 2490} {"train_loss": -6.432255744934082, "global_step": 104618, "epoch": 2490} {"train_loss": -6.4231438636779785, "global_step": 104619, "epoch": 2490} {"train_loss": -6.546237945556641, "global_step": 104620, "epoch": 2490} {"train_loss": -6.410300708952404, "global_step": 104621, "epoch": 2490, "val_loss": 75954.8984375} {"train_loss": -6.535755157470703, "global_step": 104622, "epoch": 2491} {"train_loss": -6.452354431152344, "global_step": 104623, "epoch": 2491} {"train_loss": -6.429385185241699, "global_step": 104624, "epoch": 2491} {"train_loss": -6.447742462158203, "global_step": 104625, "epoch": 2491} {"train_loss": -6.357766628265381, "global_step": 104626, "epoch": 2491} {"train_loss": -6.361509323120117, "global_step": 104627, "epoch": 2491} {"train_loss": -6.437833786010742, "global_step": 104628, "epoch": 2491} {"train_loss": -6.4788970947265625, "global_step": 104629, "epoch": 2491} {"train_loss": -6.331096649169922, "global_step": 104630, "epoch": 2491} {"train_loss": -6.412442207336426, "global_step": 104631, "epoch": 2491} {"train_loss": -6.372713088989258, "global_step": 104632, "epoch": 2491} {"train_loss": -6.459127902984619, "global_step": 104633, "epoch": 2491} {"train_loss": -6.469775199890137, "global_step": 104634, "epoch": 2491} {"train_loss": -6.337156295776367, "global_step": 104635, "epoch": 2491} {"train_loss": -6.407101154327393, "global_step": 104636, "epoch": 2491} {"train_loss": -6.232368469238281, "global_step": 104637, "epoch": 2491} {"train_loss": -6.24347448348999, "global_step": 104638, "epoch": 2491} {"train_loss": -6.322431564331055, "global_step": 104639, "epoch": 2491} {"train_loss": -6.452095985412598, "global_step": 104640, "epoch": 2491} {"train_loss": -6.359477996826172, "global_step": 104641, "epoch": 2491} {"train_loss": -6.468443870544434, "global_step": 104642, "epoch": 2491} {"train_loss": -6.349127769470215, "global_step": 104643, "epoch": 2491} {"train_loss": -6.328191757202148, "global_step": 104644, "epoch": 2491} {"train_loss": -6.292087078094482, "global_step": 104645, "epoch": 2491} {"train_loss": -6.302139759063721, "global_step": 104646, "epoch": 2491} {"train_loss": -6.318766117095947, "global_step": 104647, "epoch": 2491} {"train_loss": -6.404162406921387, "global_step": 104648, "epoch": 2491} {"train_loss": -6.340500354766846, "global_step": 104649, "epoch": 2491} {"train_loss": -6.361839294433594, "global_step": 104650, "epoch": 2491} {"train_loss": -6.517755508422852, "global_step": 104651, "epoch": 2491} {"train_loss": -6.410874366760254, "global_step": 104652, "epoch": 2491} {"train_loss": -6.572648525238037, "global_step": 104653, "epoch": 2491} {"train_loss": -6.374240875244141, "global_step": 104654, "epoch": 2491} {"train_loss": -6.303690433502197, "global_step": 104655, "epoch": 2491} {"train_loss": -6.400210380554199, "global_step": 104656, "epoch": 2491} {"train_loss": -6.437197208404541, "global_step": 104657, "epoch": 2491} {"train_loss": -6.463862419128418, "global_step": 104658, "epoch": 2491} {"train_loss": -6.272165298461914, "global_step": 104659, "epoch": 2491} {"train_loss": -6.357067108154297, "global_step": 104660, "epoch": 2491} {"train_loss": -6.334142684936523, "global_step": 104661, "epoch": 2491} {"train_loss": -6.269505977630615, "global_step": 104662, "epoch": 2491} {"train_loss": -6.38602994737171, "global_step": 104663, "epoch": 2491, "val_loss": 76569.1796875} {"train_loss": -6.331745624542236, "global_step": 104664, "epoch": 2492} {"train_loss": -6.380642414093018, "global_step": 104665, "epoch": 2492} {"train_loss": -6.379563808441162, "global_step": 104666, "epoch": 2492} {"train_loss": -6.348043441772461, "global_step": 104667, "epoch": 2492} {"train_loss": -6.355380058288574, "global_step": 104668, "epoch": 2492} {"train_loss": -6.479106903076172, "global_step": 104669, "epoch": 2492} {"train_loss": -6.297929763793945, "global_step": 104670, "epoch": 2492} {"train_loss": -6.348701477050781, "global_step": 104671, "epoch": 2492} {"train_loss": -6.261834144592285, "global_step": 104672, "epoch": 2492} {"train_loss": -6.567164897918701, "global_step": 104673, "epoch": 2492} {"train_loss": -6.364895820617676, "global_step": 104674, "epoch": 2492} {"train_loss": -6.354609966278076, "global_step": 104675, "epoch": 2492} {"train_loss": -6.3861188888549805, "global_step": 104676, "epoch": 2492} {"train_loss": -6.501029968261719, "global_step": 104677, "epoch": 2492} {"train_loss": -6.381161689758301, "global_step": 104678, "epoch": 2492} {"train_loss": -6.30493688583374, "global_step": 104679, "epoch": 2492} {"train_loss": -6.39952278137207, "global_step": 104680, "epoch": 2492} {"train_loss": -6.390040397644043, "global_step": 104681, "epoch": 2492} {"train_loss": -6.4636383056640625, "global_step": 104682, "epoch": 2492} {"train_loss": -6.536144256591797, "global_step": 104683, "epoch": 2492} {"train_loss": -6.487055778503418, "global_step": 104684, "epoch": 2492} {"train_loss": -6.425436019897461, "global_step": 104685, "epoch": 2492} {"train_loss": -6.4250993728637695, "global_step": 104686, "epoch": 2492} {"train_loss": -6.451486587524414, "global_step": 104687, "epoch": 2492} {"train_loss": -6.401473045349121, "global_step": 104688, "epoch": 2492} {"train_loss": -6.450035572052002, "global_step": 104689, "epoch": 2492} {"train_loss": -6.430598258972168, "global_step": 104690, "epoch": 2492} {"train_loss": -6.435152053833008, "global_step": 104691, "epoch": 2492} {"train_loss": -6.426177978515625, "global_step": 104692, "epoch": 2492} {"train_loss": -6.519371032714844, "global_step": 104693, "epoch": 2492} {"train_loss": -6.426063537597656, "global_step": 104694, "epoch": 2492} {"train_loss": -6.3748674392700195, "global_step": 104695, "epoch": 2492} {"train_loss": -6.413480758666992, "global_step": 104696, "epoch": 2492} {"train_loss": -6.423802852630615, "global_step": 104697, "epoch": 2492} {"train_loss": -6.34720516204834, "global_step": 104698, "epoch": 2492} {"train_loss": -6.35129451751709, "global_step": 104699, "epoch": 2492} {"train_loss": -6.4784979820251465, "global_step": 104700, "epoch": 2492} {"train_loss": -6.372793674468994, "global_step": 104701, "epoch": 2492} {"train_loss": -6.452210426330566, "global_step": 104702, "epoch": 2492} {"train_loss": -6.385097503662109, "global_step": 104703, "epoch": 2492} {"train_loss": -6.266192436218262, "global_step": 104704, "epoch": 2492} {"train_loss": -6.403061072031657, "global_step": 104705, "epoch": 2492, "val_loss": 76090.859375} {"train_loss": -6.533610820770264, "global_step": 104706, "epoch": 2493} {"train_loss": -6.441809177398682, "global_step": 104707, "epoch": 2493} {"train_loss": -6.457289695739746, "global_step": 104708, "epoch": 2493} {"train_loss": -6.378134250640869, "global_step": 104709, "epoch": 2493} {"train_loss": -6.506499767303467, "global_step": 104710, "epoch": 2493} {"train_loss": -6.346052169799805, "global_step": 104711, "epoch": 2493} {"train_loss": -6.411798477172852, "global_step": 104712, "epoch": 2493} {"train_loss": -6.424292087554932, "global_step": 104713, "epoch": 2493} {"train_loss": -6.3282012939453125, "global_step": 104714, "epoch": 2493} {"train_loss": -6.2991790771484375, "global_step": 104715, "epoch": 2493} {"train_loss": -6.382504463195801, "global_step": 104716, "epoch": 2493} {"train_loss": -6.506930351257324, "global_step": 104717, "epoch": 2493} {"train_loss": -6.47279167175293, "global_step": 104718, "epoch": 2493} {"train_loss": -6.498002529144287, "global_step": 104719, "epoch": 2493} {"train_loss": -6.435707092285156, "global_step": 104720, "epoch": 2493} {"train_loss": -6.321229934692383, "global_step": 104721, "epoch": 2493} {"train_loss": -6.440880298614502, "global_step": 104722, "epoch": 2493} {"train_loss": -6.274285793304443, "global_step": 104723, "epoch": 2493} {"train_loss": -6.331426620483398, "global_step": 104724, "epoch": 2493} {"train_loss": -6.400400638580322, "global_step": 104725, "epoch": 2493} {"train_loss": -6.414165019989014, "global_step": 104726, "epoch": 2493} {"train_loss": -6.317135810852051, "global_step": 104727, "epoch": 2493} {"train_loss": -6.440131664276123, "global_step": 104728, "epoch": 2493} {"train_loss": -6.49387264251709, "global_step": 104729, "epoch": 2493} {"train_loss": -6.447238922119141, "global_step": 104730, "epoch": 2493} {"train_loss": -6.433036804199219, "global_step": 104731, "epoch": 2493} {"train_loss": -6.510207176208496, "global_step": 104732, "epoch": 2493} {"train_loss": -6.563795566558838, "global_step": 104733, "epoch": 2493} {"train_loss": -6.312052249908447, "global_step": 104734, "epoch": 2493} {"train_loss": -6.507552623748779, "global_step": 104735, "epoch": 2493} {"train_loss": -6.437280178070068, "global_step": 104736, "epoch": 2493} {"train_loss": -6.493800163269043, "global_step": 104737, "epoch": 2493} {"train_loss": -6.3928985595703125, "global_step": 104738, "epoch": 2493} {"train_loss": -6.431143760681152, "global_step": 104739, "epoch": 2493} {"train_loss": -6.371870040893555, "global_step": 104740, "epoch": 2493} {"train_loss": -6.464725494384766, "global_step": 104741, "epoch": 2493} {"train_loss": -6.542159080505371, "global_step": 104742, "epoch": 2493} {"train_loss": -6.3453850746154785, "global_step": 104743, "epoch": 2493} {"train_loss": -6.302680015563965, "global_step": 104744, "epoch": 2493} {"train_loss": -6.474119186401367, "global_step": 104745, "epoch": 2493} {"train_loss": -6.471107482910156, "global_step": 104746, "epoch": 2493} {"train_loss": -6.420327027638753, "global_step": 104747, "epoch": 2493, "val_loss": 76071.28125} {"train_loss": -6.503893852233887, "global_step": 104748, "epoch": 2494} {"train_loss": -6.414224147796631, "global_step": 104749, "epoch": 2494} {"train_loss": -6.341087341308594, "global_step": 104750, "epoch": 2494} {"train_loss": -6.409455299377441, "global_step": 104751, "epoch": 2494} {"train_loss": -6.375692367553711, "global_step": 104752, "epoch": 2494} {"train_loss": -6.496724605560303, "global_step": 104753, "epoch": 2494} {"train_loss": -6.390055179595947, "global_step": 104754, "epoch": 2494} {"train_loss": -6.528646945953369, "global_step": 104755, "epoch": 2494} {"train_loss": -6.442800045013428, "global_step": 104756, "epoch": 2494} {"train_loss": -6.355489730834961, "global_step": 104757, "epoch": 2494} {"train_loss": -6.3764753341674805, "global_step": 104758, "epoch": 2494} {"train_loss": -6.330660343170166, "global_step": 104759, "epoch": 2494} {"train_loss": -6.327897071838379, "global_step": 104760, "epoch": 2494} {"train_loss": -6.388466835021973, "global_step": 104761, "epoch": 2494} {"train_loss": -6.42484712600708, "global_step": 104762, "epoch": 2494} {"train_loss": -6.318238258361816, "global_step": 104763, "epoch": 2494} {"train_loss": -6.386109352111816, "global_step": 104764, "epoch": 2494} {"train_loss": -6.386202812194824, "global_step": 104765, "epoch": 2494} {"train_loss": -6.27028226852417, "global_step": 104766, "epoch": 2494} {"train_loss": -6.279730796813965, "global_step": 104767, "epoch": 2494} {"train_loss": -6.298410415649414, "global_step": 104768, "epoch": 2494} {"train_loss": -6.254319667816162, "global_step": 104769, "epoch": 2494} {"train_loss": -6.320298671722412, "global_step": 104770, "epoch": 2494} {"train_loss": -6.311387062072754, "global_step": 104771, "epoch": 2494} {"train_loss": -6.2879157066345215, "global_step": 104772, "epoch": 2494} {"train_loss": -6.398908615112305, "global_step": 104773, "epoch": 2494} {"train_loss": -6.395771026611328, "global_step": 104774, "epoch": 2494} {"train_loss": -6.373404502868652, "global_step": 104775, "epoch": 2494} {"train_loss": -6.393671035766602, "global_step": 104776, "epoch": 2494} {"train_loss": -6.4153523445129395, "global_step": 104777, "epoch": 2494} {"train_loss": -6.35492467880249, "global_step": 104778, "epoch": 2494} {"train_loss": -6.326155662536621, "global_step": 104779, "epoch": 2494} {"train_loss": -6.486330986022949, "global_step": 104780, "epoch": 2494} {"train_loss": -6.305275917053223, "global_step": 104781, "epoch": 2494} {"train_loss": -6.3620195388793945, "global_step": 104782, "epoch": 2494} {"train_loss": -6.414780616760254, "global_step": 104783, "epoch": 2494} {"train_loss": -6.320797920227051, "global_step": 104784, "epoch": 2494} {"train_loss": -6.465600967407227, "global_step": 104785, "epoch": 2494} {"train_loss": -6.400409698486328, "global_step": 104786, "epoch": 2494} {"train_loss": -6.29960823059082, "global_step": 104787, "epoch": 2494} {"train_loss": -6.388095378875732, "global_step": 104788, "epoch": 2494} {"train_loss": -6.3736389705113, "global_step": 104789, "epoch": 2494, "val_loss": 76036.15625} {"train_loss": -6.327366828918457, "global_step": 104790, "epoch": 2495} {"train_loss": -6.439288139343262, "global_step": 104791, "epoch": 2495} {"train_loss": -6.393903732299805, "global_step": 104792, "epoch": 2495} {"train_loss": -6.3798065185546875, "global_step": 104793, "epoch": 2495} {"train_loss": -6.486098289489746, "global_step": 104794, "epoch": 2495} {"train_loss": -6.459735870361328, "global_step": 104795, "epoch": 2495} {"train_loss": -6.268538475036621, "global_step": 104796, "epoch": 2495} {"train_loss": -6.444390773773193, "global_step": 104797, "epoch": 2495} {"train_loss": -6.365259170532227, "global_step": 104798, "epoch": 2495} {"train_loss": -6.4702229499816895, "global_step": 104799, "epoch": 2495} {"train_loss": -6.3992204666137695, "global_step": 104800, "epoch": 2495} {"train_loss": -6.399029731750488, "global_step": 104801, "epoch": 2495} {"train_loss": -6.476151466369629, "global_step": 104802, "epoch": 2495} {"train_loss": -6.232326030731201, "global_step": 104803, "epoch": 2495} {"train_loss": -6.392876625061035, "global_step": 104804, "epoch": 2495} {"train_loss": -6.399312973022461, "global_step": 104805, "epoch": 2495} {"train_loss": -6.475069046020508, "global_step": 104806, "epoch": 2495} {"train_loss": -6.462738990783691, "global_step": 104807, "epoch": 2495} {"train_loss": -6.426987171173096, "global_step": 104808, "epoch": 2495} {"train_loss": -6.249778747558594, "global_step": 104809, "epoch": 2495} {"train_loss": -6.476406097412109, "global_step": 104810, "epoch": 2495} {"train_loss": -6.3999810218811035, "global_step": 104811, "epoch": 2495} {"train_loss": -6.399648189544678, "global_step": 104812, "epoch": 2495} {"train_loss": -6.378775119781494, "global_step": 104813, "epoch": 2495} {"train_loss": -6.445619583129883, "global_step": 104814, "epoch": 2495} {"train_loss": -6.436047554016113, "global_step": 104815, "epoch": 2495} {"train_loss": -6.566106796264648, "global_step": 104816, "epoch": 2495} {"train_loss": -6.3981828689575195, "global_step": 104817, "epoch": 2495} {"train_loss": -6.447893142700195, "global_step": 104818, "epoch": 2495} {"train_loss": -6.296809196472168, "global_step": 104819, "epoch": 2495} {"train_loss": -6.379599571228027, "global_step": 104820, "epoch": 2495} {"train_loss": -6.433614730834961, "global_step": 104821, "epoch": 2495} {"train_loss": -6.37173318862915, "global_step": 104822, "epoch": 2495} {"train_loss": -6.445385932922363, "global_step": 104823, "epoch": 2495} {"train_loss": -6.331931114196777, "global_step": 104824, "epoch": 2495} {"train_loss": -6.395556926727295, "global_step": 104825, "epoch": 2495} {"train_loss": -6.391167163848877, "global_step": 104826, "epoch": 2495} {"train_loss": -6.4176483154296875, "global_step": 104827, "epoch": 2495} {"train_loss": -6.483175277709961, "global_step": 104828, "epoch": 2495} {"train_loss": -6.314759254455566, "global_step": 104829, "epoch": 2495} {"train_loss": -6.435629367828369, "global_step": 104830, "epoch": 2495} {"train_loss": -6.405651523953392, "global_step": 104831, "epoch": 2495, "val_loss": 76284.921875} {"train_loss": -6.341861248016357, "global_step": 104832, "epoch": 2496} {"train_loss": -6.467541694641113, "global_step": 104833, "epoch": 2496} {"train_loss": -6.468997001647949, "global_step": 104834, "epoch": 2496} {"train_loss": -6.4212446212768555, "global_step": 104835, "epoch": 2496} {"train_loss": -6.380128860473633, "global_step": 104836, "epoch": 2496} {"train_loss": -6.567718982696533, "global_step": 104837, "epoch": 2496} {"train_loss": -6.4929046630859375, "global_step": 104838, "epoch": 2496} {"train_loss": -6.294755935668945, "global_step": 104839, "epoch": 2496} {"train_loss": -6.513625144958496, "global_step": 104840, "epoch": 2496} {"train_loss": -6.406290054321289, "global_step": 104841, "epoch": 2496} {"train_loss": -6.383550643920898, "global_step": 104842, "epoch": 2496} {"train_loss": -6.39323091506958, "global_step": 104843, "epoch": 2496} {"train_loss": -6.364217758178711, "global_step": 104844, "epoch": 2496} {"train_loss": -6.445433616638184, "global_step": 104845, "epoch": 2496} {"train_loss": -6.302683353424072, "global_step": 104846, "epoch": 2496} {"train_loss": -6.35877799987793, "global_step": 104847, "epoch": 2496} {"train_loss": -6.398733139038086, "global_step": 104848, "epoch": 2496} {"train_loss": -6.251404762268066, "global_step": 104849, "epoch": 2496} {"train_loss": -6.37208890914917, "global_step": 104850, "epoch": 2496} {"train_loss": -6.401412487030029, "global_step": 104851, "epoch": 2496} {"train_loss": -6.35904598236084, "global_step": 104852, "epoch": 2496} {"train_loss": -6.354352951049805, "global_step": 104853, "epoch": 2496} {"train_loss": -6.498676776885986, "global_step": 104854, "epoch": 2496} {"train_loss": -6.481907844543457, "global_step": 104855, "epoch": 2496} {"train_loss": -6.369154930114746, "global_step": 104856, "epoch": 2496} {"train_loss": -6.420153617858887, "global_step": 104857, "epoch": 2496} {"train_loss": -6.31519889831543, "global_step": 104858, "epoch": 2496} {"train_loss": -6.297478675842285, "global_step": 104859, "epoch": 2496} {"train_loss": -6.405427932739258, "global_step": 104860, "epoch": 2496} {"train_loss": -6.447216987609863, "global_step": 104861, "epoch": 2496} {"train_loss": -6.224900245666504, "global_step": 104862, "epoch": 2496} {"train_loss": -6.316384315490723, "global_step": 104863, "epoch": 2496} {"train_loss": -6.328855514526367, "global_step": 104864, "epoch": 2496} {"train_loss": -6.391269683837891, "global_step": 104865, "epoch": 2496} {"train_loss": -6.357539653778076, "global_step": 104866, "epoch": 2496} {"train_loss": -6.232325553894043, "global_step": 104867, "epoch": 2496} {"train_loss": -6.37122106552124, "global_step": 104868, "epoch": 2496} {"train_loss": -6.223790168762207, "global_step": 104869, "epoch": 2496} {"train_loss": -6.325544357299805, "global_step": 104870, "epoch": 2496} {"train_loss": -6.509127616882324, "global_step": 104871, "epoch": 2496} {"train_loss": -6.369366645812988, "global_step": 104872, "epoch": 2496} {"train_loss": -6.381468738828387, "global_step": 104873, "epoch": 2496, "val_loss": 75976.7421875} {"train_loss": -6.394296646118164, "global_step": 104874, "epoch": 2497} {"train_loss": -6.36644172668457, "global_step": 104875, "epoch": 2497} {"train_loss": -6.469015121459961, "global_step": 104876, "epoch": 2497} {"train_loss": -6.397031784057617, "global_step": 104877, "epoch": 2497} {"train_loss": -6.3688859939575195, "global_step": 104878, "epoch": 2497} {"train_loss": -6.308962821960449, "global_step": 104879, "epoch": 2497} {"train_loss": -6.485116958618164, "global_step": 104880, "epoch": 2497} {"train_loss": -6.403120040893555, "global_step": 104881, "epoch": 2497} {"train_loss": -6.466619491577148, "global_step": 104882, "epoch": 2497} {"train_loss": -6.384477138519287, "global_step": 104883, "epoch": 2497} {"train_loss": -6.455204963684082, "global_step": 104884, "epoch": 2497} {"train_loss": -6.462856292724609, "global_step": 104885, "epoch": 2497} {"train_loss": -6.422089576721191, "global_step": 104886, "epoch": 2497} {"train_loss": -6.36258602142334, "global_step": 104887, "epoch": 2497} {"train_loss": -6.392358303070068, "global_step": 104888, "epoch": 2497} {"train_loss": -6.327736854553223, "global_step": 104889, "epoch": 2497} {"train_loss": -6.41949462890625, "global_step": 104890, "epoch": 2497} {"train_loss": -6.340237140655518, "global_step": 104891, "epoch": 2497} {"train_loss": -6.287967681884766, "global_step": 104892, "epoch": 2497} {"train_loss": -6.4610371589660645, "global_step": 104893, "epoch": 2497} {"train_loss": -6.275434494018555, "global_step": 104894, "epoch": 2497} {"train_loss": -6.323728561401367, "global_step": 104895, "epoch": 2497} {"train_loss": -6.445442199707031, "global_step": 104896, "epoch": 2497} {"train_loss": -6.473254203796387, "global_step": 104897, "epoch": 2497} {"train_loss": -6.375063419342041, "global_step": 104898, "epoch": 2497} {"train_loss": -6.483068466186523, "global_step": 104899, "epoch": 2497} {"train_loss": -6.3149919509887695, "global_step": 104900, "epoch": 2497} {"train_loss": -6.482239723205566, "global_step": 104901, "epoch": 2497} {"train_loss": -6.47071647644043, "global_step": 104902, "epoch": 2497} {"train_loss": -6.45660924911499, "global_step": 104903, "epoch": 2497} {"train_loss": -6.478137969970703, "global_step": 104904, "epoch": 2497} {"train_loss": -6.467128753662109, "global_step": 104905, "epoch": 2497} {"train_loss": -6.3830485343933105, "global_step": 104906, "epoch": 2497} {"train_loss": -6.498010158538818, "global_step": 104907, "epoch": 2497} {"train_loss": -6.475388050079346, "global_step": 104908, "epoch": 2497} {"train_loss": -6.468793869018555, "global_step": 104909, "epoch": 2497} {"train_loss": -6.4389848709106445, "global_step": 104910, "epoch": 2497} {"train_loss": -6.378639221191406, "global_step": 104911, "epoch": 2497} {"train_loss": -6.341469764709473, "global_step": 104912, "epoch": 2497} {"train_loss": -6.462466716766357, "global_step": 104913, "epoch": 2497} {"train_loss": -6.308045387268066, "global_step": 104914, "epoch": 2497} {"train_loss": -6.408161038444156, "global_step": 104915, "epoch": 2497, "val_loss": 75786.3515625} {"train_loss": -6.473826885223389, "global_step": 104916, "epoch": 2498} {"train_loss": -6.435522079467773, "global_step": 104917, "epoch": 2498} {"train_loss": -6.334094047546387, "global_step": 104918, "epoch": 2498} {"train_loss": -6.413266181945801, "global_step": 104919, "epoch": 2498} {"train_loss": -6.395043849945068, "global_step": 104920, "epoch": 2498} {"train_loss": -6.421778202056885, "global_step": 104921, "epoch": 2498} {"train_loss": -6.440072059631348, "global_step": 104922, "epoch": 2498} {"train_loss": -6.3093767166137695, "global_step": 104923, "epoch": 2498} {"train_loss": -6.42792272567749, "global_step": 104924, "epoch": 2498} {"train_loss": -6.3197922706604, "global_step": 104925, "epoch": 2498} {"train_loss": -6.266704082489014, "global_step": 104926, "epoch": 2498} {"train_loss": -6.297416687011719, "global_step": 104927, "epoch": 2498} {"train_loss": -6.295218467712402, "global_step": 104928, "epoch": 2498} {"train_loss": -6.40703010559082, "global_step": 104929, "epoch": 2498} {"train_loss": -6.430417060852051, "global_step": 104930, "epoch": 2498} {"train_loss": -6.3133955001831055, "global_step": 104931, "epoch": 2498} {"train_loss": -6.4138898849487305, "global_step": 104932, "epoch": 2498} {"train_loss": -6.317873001098633, "global_step": 104933, "epoch": 2498} {"train_loss": -6.2736310958862305, "global_step": 104934, "epoch": 2498} {"train_loss": -6.330923080444336, "global_step": 104935, "epoch": 2498} {"train_loss": -6.29251766204834, "global_step": 104936, "epoch": 2498} {"train_loss": -6.33173942565918, "global_step": 104937, "epoch": 2498} {"train_loss": -6.435393333435059, "global_step": 104938, "epoch": 2498} {"train_loss": -6.210958480834961, "global_step": 104939, "epoch": 2498} {"train_loss": -6.4501953125, "global_step": 104940, "epoch": 2498} {"train_loss": -6.303531646728516, "global_step": 104941, "epoch": 2498} {"train_loss": -6.406618118286133, "global_step": 104942, "epoch": 2498} {"train_loss": -6.41082763671875, "global_step": 104943, "epoch": 2498} {"train_loss": -6.415410995483398, "global_step": 104944, "epoch": 2498} {"train_loss": -6.278571128845215, "global_step": 104945, "epoch": 2498} {"train_loss": -6.462172985076904, "global_step": 104946, "epoch": 2498} {"train_loss": -6.2194504737854, "global_step": 104947, "epoch": 2498} {"train_loss": -6.398099899291992, "global_step": 104948, "epoch": 2498} {"train_loss": -6.429380416870117, "global_step": 104949, "epoch": 2498} {"train_loss": -6.225484848022461, "global_step": 104950, "epoch": 2498} {"train_loss": -6.435548782348633, "global_step": 104951, "epoch": 2498} {"train_loss": -6.4195637702941895, "global_step": 104952, "epoch": 2498} {"train_loss": -6.353634834289551, "global_step": 104953, "epoch": 2498} {"train_loss": -6.502691268920898, "global_step": 104954, "epoch": 2498} {"train_loss": -6.262402057647705, "global_step": 104955, "epoch": 2498} {"train_loss": -6.367097854614258, "global_step": 104956, "epoch": 2498} {"train_loss": -6.3649727389926, "global_step": 104957, "epoch": 2498, "val_loss": 76170.1640625} {"train_loss": -6.277104377746582, "global_step": 104958, "epoch": 2499} {"train_loss": -6.454741477966309, "global_step": 104959, "epoch": 2499} {"train_loss": -6.341496467590332, "global_step": 104960, "epoch": 2499} {"train_loss": -6.4124321937561035, "global_step": 104961, "epoch": 2499} {"train_loss": -6.305230140686035, "global_step": 104962, "epoch": 2499} {"train_loss": -6.293432712554932, "global_step": 104963, "epoch": 2499} {"train_loss": -6.428293704986572, "global_step": 104964, "epoch": 2499} {"train_loss": -6.402022361755371, "global_step": 104965, "epoch": 2499} {"train_loss": -6.360705852508545, "global_step": 104966, "epoch": 2499} {"train_loss": -6.361411094665527, "global_step": 104967, "epoch": 2499} {"train_loss": -6.392210006713867, "global_step": 104968, "epoch": 2499} {"train_loss": -6.489406108856201, "global_step": 104969, "epoch": 2499} {"train_loss": -6.344719886779785, "global_step": 104970, "epoch": 2499} {"train_loss": -6.356136322021484, "global_step": 104971, "epoch": 2499} {"train_loss": -6.360384464263916, "global_step": 104972, "epoch": 2499} {"train_loss": -6.326362133026123, "global_step": 104973, "epoch": 2499} {"train_loss": -6.493129730224609, "global_step": 104974, "epoch": 2499} {"train_loss": -6.359123706817627, "global_step": 104975, "epoch": 2499} {"train_loss": -6.325568199157715, "global_step": 104976, "epoch": 2499} {"train_loss": -6.403909206390381, "global_step": 104977, "epoch": 2499} {"train_loss": -6.334871292114258, "global_step": 104978, "epoch": 2499} {"train_loss": -6.442077159881592, "global_step": 104979, "epoch": 2499} {"train_loss": -6.451263427734375, "global_step": 104980, "epoch": 2499} {"train_loss": -6.366232872009277, "global_step": 104981, "epoch": 2499} {"train_loss": -6.467769622802734, "global_step": 104982, "epoch": 2499} {"train_loss": -6.4646077156066895, "global_step": 104983, "epoch": 2499} {"train_loss": -6.33773136138916, "global_step": 104984, "epoch": 2499} {"train_loss": -6.4419708251953125, "global_step": 104985, "epoch": 2499} {"train_loss": -6.5451130867004395, "global_step": 104986, "epoch": 2499} {"train_loss": -6.322754859924316, "global_step": 104987, "epoch": 2499} {"train_loss": -6.364896774291992, "global_step": 104988, "epoch": 2499} {"train_loss": -6.417817115783691, "global_step": 104989, "epoch": 2499} {"train_loss": -6.3636956214904785, "global_step": 104990, "epoch": 2499} {"train_loss": -6.362030029296875, "global_step": 104991, "epoch": 2499} {"train_loss": -6.4373698234558105, "global_step": 104992, "epoch": 2499} {"train_loss": -6.438472747802734, "global_step": 104993, "epoch": 2499} {"train_loss": -6.3389153480529785, "global_step": 104994, "epoch": 2499} {"train_loss": -6.4791259765625, "global_step": 104995, "epoch": 2499} {"train_loss": -6.459423065185547, "global_step": 104996, "epoch": 2499} {"train_loss": -6.259922027587891, "global_step": 104997, "epoch": 2499} {"train_loss": -6.33546257019043, "global_step": 104998, "epoch": 2499} {"train_loss": -6.391289483933222, "global_step": 104999, "epoch": 2499, "val_loss": 76324.40625} {"train_loss": -6.367388725280762, "global_step": 105000, "epoch": 2500} {"train_loss": -6.382399559020996, "global_step": 105001, "epoch": 2500} {"train_loss": -6.394097328186035, "global_step": 105002, "epoch": 2500} {"train_loss": -6.348917007446289, "global_step": 105003, "epoch": 2500} {"train_loss": -6.475893974304199, "global_step": 105004, "epoch": 2500} {"train_loss": -6.4612202644348145, "global_step": 105005, "epoch": 2500} {"train_loss": -6.513775825500488, "global_step": 105006, "epoch": 2500} {"train_loss": -6.26997184753418, "global_step": 105007, "epoch": 2500} {"train_loss": -6.3679914474487305, "global_step": 105008, "epoch": 2500} {"train_loss": -6.4318060874938965, "global_step": 105009, "epoch": 2500} {"train_loss": -6.45389986038208, "global_step": 105010, "epoch": 2500} {"train_loss": -6.432377815246582, "global_step": 105011, "epoch": 2500} {"train_loss": -6.3996357917785645, "global_step": 105012, "epoch": 2500} {"train_loss": -6.4199395179748535, "global_step": 105013, "epoch": 2500} {"train_loss": -6.430098533630371, "global_step": 105014, "epoch": 2500} {"train_loss": -6.450436592102051, "global_step": 105015, "epoch": 2500} {"train_loss": -6.429174423217773, "global_step": 105016, "epoch": 2500} {"train_loss": -6.408588409423828, "global_step": 105017, "epoch": 2500} {"train_loss": -6.370744228363037, "global_step": 105018, "epoch": 2500} {"train_loss": -6.352956771850586, "global_step": 105019, "epoch": 2500} {"train_loss": -6.410334587097168, "global_step": 105020, "epoch": 2500} {"train_loss": -6.411205768585205, "global_step": 105021, "epoch": 2500} {"train_loss": -6.341273307800293, "global_step": 105022, "epoch": 2500} {"train_loss": -6.404829978942871, "global_step": 105023, "epoch": 2500} {"train_loss": -6.327879428863525, "global_step": 105024, "epoch": 2500} {"train_loss": -6.4644622802734375, "global_step": 105025, "epoch": 2500} {"train_loss": -6.550431251525879, "global_step": 105026, "epoch": 2500} {"train_loss": -6.514376640319824, "global_step": 105027, "epoch": 2500} {"train_loss": -6.481175422668457, "global_step": 105028, "epoch": 2500} {"train_loss": -6.4818925857543945, "global_step": 105029, "epoch": 2500} {"train_loss": -6.370038032531738, "global_step": 105030, "epoch": 2500} {"train_loss": -6.430375576019287, "global_step": 105031, "epoch": 2500} {"train_loss": -6.355042934417725, "global_step": 105032, "epoch": 2500} {"train_loss": -6.418400287628174, "global_step": 105033, "epoch": 2500} {"train_loss": -6.391841888427734, "global_step": 105034, "epoch": 2500} {"train_loss": -6.325068473815918, "global_step": 105035, "epoch": 2500} {"train_loss": -6.387714385986328, "global_step": 105036, "epoch": 2500} {"train_loss": -6.411222457885742, "global_step": 105037, "epoch": 2500} {"train_loss": -6.502538204193115, "global_step": 105038, "epoch": 2500} {"train_loss": -6.495847225189209, "global_step": 105039, "epoch": 2500} {"train_loss": -6.421441555023193, "global_step": 105040, "epoch": 2500} {"train_loss": -6.41615400995527, "global_step": 105041, "epoch": 2500, "train/sim_max_reward_0": 0.946596251216973, "train/sim_max_reward_1": 0.8726773148499946, "train/sim_max_reward_2": 0.3090607799254261, "train/sim_max_reward_3": 0.13358324326745524, "train/sim_max_reward_4": 0.9650405558271798, "train/sim_max_reward_5": 0.8475847874290279, "test/sim_max_reward_4500000": 0.7030286311860209, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9598748504489241, "test/sim_max_reward_4500003": 0.8223168073548054, "test/sim_max_reward_4500004": 0.10649316687811029, "test/sim_max_reward_4500005": 0.8594136899904662, "test/sim_max_reward_4500006": 0.9375118845624629, "test/sim_max_reward_4500007": 0.8685114090974833, "test/sim_max_reward_4500008": 0.3888400116343124, "test/sim_max_reward_4500009": 0.7454578850966708, "test/sim_max_reward_4500010": 0.09345236712757407, "test/sim_max_reward_4500011": 0.8324852515069459, "test/sim_max_reward_4500012": 0.07789307620190676, "test/sim_max_reward_4500013": 0.0055873849898909365, "test/sim_max_reward_4500014": 0.46620380970328273, "test/sim_max_reward_4500015": 0.8466771904898962, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.15366152755406026, "test/sim_max_reward_4500018": 0.34484051303017765, "test/sim_max_reward_4500019": 0.866885411744118, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.6748461263788932, "test/sim_max_reward_4500022": 0.8755235439435155, "test/sim_max_reward_4500023": 0.9690732096059721, "test/sim_max_reward_4500024": 0.8358441419373499, "test/sim_max_reward_4500025": 0.00012375628920345408, "test/sim_max_reward_4500026": 0.9793360606198603, "test/sim_max_reward_4500027": 0.7999048190506872, "test/sim_max_reward_4500028": 0.19582934075748631, "test/sim_max_reward_4500029": 0.07433892140500593, "test/sim_max_reward_4500030": 0.9377913862113508, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.817402007638843, "test/sim_max_reward_4500034": 0.8272782128047494, "test/sim_max_reward_4500035": 0.9611238596728631, "test/sim_max_reward_4500036": 0.3814676003214424, "test/sim_max_reward_4500037": 0.8601598063753735, "test/sim_max_reward_4500038": 0.2930334651680533, "test/sim_max_reward_4500039": 0.9061809021777466, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.003921138494725515, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.017162403150193153, "test/sim_max_reward_4500045": 0.4147688829340382, "test/sim_max_reward_4500046": 0.7437871884038147, "test/sim_max_reward_4500047": 0.8921877938036937, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6790904887526761, "test/mean_score": 0.512534254669296, "val_loss": 76015.9453125} {"train_loss": -6.414511203765869, "global_step": 105042, "epoch": 2501} {"train_loss": -6.48493766784668, "global_step": 105043, "epoch": 2501} {"train_loss": -6.555821418762207, "global_step": 105044, "epoch": 2501} {"train_loss": -6.447919845581055, "global_step": 105045, "epoch": 2501} {"train_loss": -6.389066696166992, "global_step": 105046, "epoch": 2501} {"train_loss": -6.444190979003906, "global_step": 105047, "epoch": 2501} {"train_loss": -6.390676498413086, "global_step": 105048, "epoch": 2501} {"train_loss": -6.48008918762207, "global_step": 105049, "epoch": 2501} {"train_loss": -6.432981967926025, "global_step": 105050, "epoch": 2501} {"train_loss": -6.473400115966797, "global_step": 105051, "epoch": 2501} {"train_loss": -6.401091575622559, "global_step": 105052, "epoch": 2501} {"train_loss": -6.360284805297852, "global_step": 105053, "epoch": 2501} {"train_loss": -6.486558437347412, "global_step": 105054, "epoch": 2501} {"train_loss": -6.425206184387207, "global_step": 105055, "epoch": 2501} {"train_loss": -6.422252655029297, "global_step": 105056, "epoch": 2501} {"train_loss": -6.452654838562012, "global_step": 105057, "epoch": 2501} {"train_loss": -6.340405464172363, "global_step": 105058, "epoch": 2501} {"train_loss": -6.494967460632324, "global_step": 105059, "epoch": 2501} {"train_loss": -6.448124885559082, "global_step": 105060, "epoch": 2501} {"train_loss": -6.497073173522949, "global_step": 105061, "epoch": 2501} {"train_loss": -6.419325351715088, "global_step": 105062, "epoch": 2501} {"train_loss": -6.4723005294799805, "global_step": 105063, "epoch": 2501} {"train_loss": -6.525442123413086, "global_step": 105064, "epoch": 2501} {"train_loss": -6.320248126983643, "global_step": 105065, "epoch": 2501} {"train_loss": -6.347867965698242, "global_step": 105066, "epoch": 2501} {"train_loss": -6.455941677093506, "global_step": 105067, "epoch": 2501} {"train_loss": -6.374173641204834, "global_step": 105068, "epoch": 2501} {"train_loss": -6.396329879760742, "global_step": 105069, "epoch": 2501} {"train_loss": -6.3676533699035645, "global_step": 105070, "epoch": 2501} {"train_loss": -6.413559436798096, "global_step": 105071, "epoch": 2501} {"train_loss": -6.231331825256348, "global_step": 105072, "epoch": 2501} {"train_loss": -6.413403511047363, "global_step": 105073, "epoch": 2501} {"train_loss": -6.5288567543029785, "global_step": 105074, "epoch": 2501} {"train_loss": -6.514620304107666, "global_step": 105075, "epoch": 2501} {"train_loss": -6.487374305725098, "global_step": 105076, "epoch": 2501} {"train_loss": -6.3680853843688965, "global_step": 105077, "epoch": 2501} {"train_loss": -6.482544898986816, "global_step": 105078, "epoch": 2501} {"train_loss": -6.434566974639893, "global_step": 105079, "epoch": 2501} {"train_loss": -6.404803276062012, "global_step": 105080, "epoch": 2501} {"train_loss": -6.541376113891602, "global_step": 105081, "epoch": 2501} {"train_loss": -6.421311378479004, "global_step": 105082, "epoch": 2501} {"train_loss": -6.429461638132731, "global_step": 105083, "epoch": 2501, "val_loss": 76101.90625} {"train_loss": -6.4610748291015625, "global_step": 105084, "epoch": 2502} {"train_loss": -6.369132041931152, "global_step": 105085, "epoch": 2502} {"train_loss": -6.501695156097412, "global_step": 105086, "epoch": 2502} {"train_loss": -6.332833290100098, "global_step": 105087, "epoch": 2502} {"train_loss": -6.489917755126953, "global_step": 105088, "epoch": 2502} {"train_loss": -6.439441680908203, "global_step": 105089, "epoch": 2502} {"train_loss": -6.447127819061279, "global_step": 105090, "epoch": 2502} {"train_loss": -6.520018100738525, "global_step": 105091, "epoch": 2502} {"train_loss": -6.427892684936523, "global_step": 105092, "epoch": 2502} {"train_loss": -6.412052154541016, "global_step": 105093, "epoch": 2502} {"train_loss": -6.461981773376465, "global_step": 105094, "epoch": 2502} {"train_loss": -6.309964179992676, "global_step": 105095, "epoch": 2502} {"train_loss": -6.46401309967041, "global_step": 105096, "epoch": 2502} {"train_loss": -6.336513042449951, "global_step": 105097, "epoch": 2502} {"train_loss": -6.5883989334106445, "global_step": 105098, "epoch": 2502} {"train_loss": -6.476694583892822, "global_step": 105099, "epoch": 2502} {"train_loss": -6.385785102844238, "global_step": 105100, "epoch": 2502} {"train_loss": -6.440053939819336, "global_step": 105101, "epoch": 2502} {"train_loss": -6.436471939086914, "global_step": 105102, "epoch": 2502} {"train_loss": -6.359897613525391, "global_step": 105103, "epoch": 2502} {"train_loss": -6.381295204162598, "global_step": 105104, "epoch": 2502} {"train_loss": -6.360602378845215, "global_step": 105105, "epoch": 2502} {"train_loss": -6.357968330383301, "global_step": 105106, "epoch": 2502} {"train_loss": -6.307631492614746, "global_step": 105107, "epoch": 2502} {"train_loss": -6.335308074951172, "global_step": 105108, "epoch": 2502} {"train_loss": -6.266357421875, "global_step": 105109, "epoch": 2502} {"train_loss": -6.255197048187256, "global_step": 105110, "epoch": 2502} {"train_loss": -6.321187496185303, "global_step": 105111, "epoch": 2502} {"train_loss": -6.318041801452637, "global_step": 105112, "epoch": 2502} {"train_loss": -6.283002853393555, "global_step": 105113, "epoch": 2502} {"train_loss": -6.400334358215332, "global_step": 105114, "epoch": 2502} {"train_loss": -6.353763580322266, "global_step": 105115, "epoch": 2502} {"train_loss": -6.409686088562012, "global_step": 105116, "epoch": 2502} {"train_loss": -6.400097846984863, "global_step": 105117, "epoch": 2502} {"train_loss": -6.3522748947143555, "global_step": 105118, "epoch": 2502} {"train_loss": -6.3424835205078125, "global_step": 105119, "epoch": 2502} {"train_loss": -6.319194316864014, "global_step": 105120, "epoch": 2502} {"train_loss": -6.357553958892822, "global_step": 105121, "epoch": 2502} {"train_loss": -6.394305229187012, "global_step": 105122, "epoch": 2502} {"train_loss": -6.2687273025512695, "global_step": 105123, "epoch": 2502} {"train_loss": -6.4302778244018555, "global_step": 105124, "epoch": 2502} {"train_loss": -6.384752875282651, "global_step": 105125, "epoch": 2502, "val_loss": 75943.859375} {"train_loss": -6.356154918670654, "global_step": 105126, "epoch": 2503} {"train_loss": -6.279463768005371, "global_step": 105127, "epoch": 2503} {"train_loss": -6.45632266998291, "global_step": 105128, "epoch": 2503} {"train_loss": -6.324631214141846, "global_step": 105129, "epoch": 2503} {"train_loss": -6.339688301086426, "global_step": 105130, "epoch": 2503} {"train_loss": -6.495657920837402, "global_step": 105131, "epoch": 2503} {"train_loss": -6.442152500152588, "global_step": 105132, "epoch": 2503} {"train_loss": -6.437839508056641, "global_step": 105133, "epoch": 2503} {"train_loss": -6.327216148376465, "global_step": 105134, "epoch": 2503} {"train_loss": -6.4601287841796875, "global_step": 105135, "epoch": 2503} {"train_loss": -6.299771785736084, "global_step": 105136, "epoch": 2503} {"train_loss": -6.3631591796875, "global_step": 105137, "epoch": 2503} {"train_loss": -6.549086570739746, "global_step": 105138, "epoch": 2503} {"train_loss": -6.347503662109375, "global_step": 105139, "epoch": 2503} {"train_loss": -6.454479217529297, "global_step": 105140, "epoch": 2503} {"train_loss": -6.395220756530762, "global_step": 105141, "epoch": 2503} {"train_loss": -6.431365013122559, "global_step": 105142, "epoch": 2503} {"train_loss": -6.473916053771973, "global_step": 105143, "epoch": 2503} {"train_loss": -6.445252418518066, "global_step": 105144, "epoch": 2503} {"train_loss": -6.561606407165527, "global_step": 105145, "epoch": 2503} {"train_loss": -6.326725006103516, "global_step": 105146, "epoch": 2503} {"train_loss": -6.245332717895508, "global_step": 105147, "epoch": 2503} {"train_loss": -6.2483086585998535, "global_step": 105148, "epoch": 2503} {"train_loss": -6.402224063873291, "global_step": 105149, "epoch": 2503} {"train_loss": -6.284091949462891, "global_step": 105150, "epoch": 2503} {"train_loss": -6.318541526794434, "global_step": 105151, "epoch": 2503} {"train_loss": -6.316683769226074, "global_step": 105152, "epoch": 2503} {"train_loss": -6.222079277038574, "global_step": 105153, "epoch": 2503} {"train_loss": -6.259324073791504, "global_step": 105154, "epoch": 2503} {"train_loss": -6.311875343322754, "global_step": 105155, "epoch": 2503} {"train_loss": -6.21956729888916, "global_step": 105156, "epoch": 2503} {"train_loss": -6.310938835144043, "global_step": 105157, "epoch": 2503} {"train_loss": -6.213225364685059, "global_step": 105158, "epoch": 2503} {"train_loss": -6.218367576599121, "global_step": 105159, "epoch": 2503} {"train_loss": -6.472894668579102, "global_step": 105160, "epoch": 2503} {"train_loss": -6.226282119750977, "global_step": 105161, "epoch": 2503} {"train_loss": -6.360151290893555, "global_step": 105162, "epoch": 2503} {"train_loss": -6.237040042877197, "global_step": 105163, "epoch": 2503} {"train_loss": -6.318490028381348, "global_step": 105164, "epoch": 2503} {"train_loss": -6.4048542976379395, "global_step": 105165, "epoch": 2503} {"train_loss": -6.442867755889893, "global_step": 105166, "epoch": 2503} {"train_loss": -6.358155897685459, "global_step": 105167, "epoch": 2503, "val_loss": 76431.2265625} {"train_loss": -6.322164535522461, "global_step": 105168, "epoch": 2504} {"train_loss": -6.402649879455566, "global_step": 105169, "epoch": 2504} {"train_loss": -6.271490097045898, "global_step": 105170, "epoch": 2504} {"train_loss": -6.48472785949707, "global_step": 105171, "epoch": 2504} {"train_loss": -6.414039134979248, "global_step": 105172, "epoch": 2504} {"train_loss": -6.340140342712402, "global_step": 105173, "epoch": 2504} {"train_loss": -6.379873275756836, "global_step": 105174, "epoch": 2504} {"train_loss": -6.394659042358398, "global_step": 105175, "epoch": 2504} {"train_loss": -6.318828582763672, "global_step": 105176, "epoch": 2504} {"train_loss": -6.475870609283447, "global_step": 105177, "epoch": 2504} {"train_loss": -6.3774213790893555, "global_step": 105178, "epoch": 2504} {"train_loss": -6.430699348449707, "global_step": 105179, "epoch": 2504} {"train_loss": -6.37332820892334, "global_step": 105180, "epoch": 2504} {"train_loss": -6.502838134765625, "global_step": 105181, "epoch": 2504} {"train_loss": -6.431150913238525, "global_step": 105182, "epoch": 2504} {"train_loss": -6.553375244140625, "global_step": 105183, "epoch": 2504} {"train_loss": -6.34112548828125, "global_step": 105184, "epoch": 2504} {"train_loss": -6.498133659362793, "global_step": 105185, "epoch": 2504} {"train_loss": -6.509311199188232, "global_step": 105186, "epoch": 2504} {"train_loss": -6.458239555358887, "global_step": 105187, "epoch": 2504} {"train_loss": -6.473941326141357, "global_step": 105188, "epoch": 2504} {"train_loss": -6.467510223388672, "global_step": 105189, "epoch": 2504} {"train_loss": -6.55507755279541, "global_step": 105190, "epoch": 2504} {"train_loss": -6.209980010986328, "global_step": 105191, "epoch": 2504} {"train_loss": -6.443922996520996, "global_step": 105192, "epoch": 2504} {"train_loss": -6.4343414306640625, "global_step": 105193, "epoch": 2504} {"train_loss": -6.483270645141602, "global_step": 105194, "epoch": 2504} {"train_loss": -6.347797870635986, "global_step": 105195, "epoch": 2504} {"train_loss": -6.285508155822754, "global_step": 105196, "epoch": 2504} {"train_loss": -6.502194881439209, "global_step": 105197, "epoch": 2504} {"train_loss": -6.262584686279297, "global_step": 105198, "epoch": 2504} {"train_loss": -6.32231330871582, "global_step": 105199, "epoch": 2504} {"train_loss": -6.413389682769775, "global_step": 105200, "epoch": 2504} {"train_loss": -6.419642925262451, "global_step": 105201, "epoch": 2504} {"train_loss": -6.218334197998047, "global_step": 105202, "epoch": 2504} {"train_loss": -6.461091995239258, "global_step": 105203, "epoch": 2504} {"train_loss": -6.323385238647461, "global_step": 105204, "epoch": 2504} {"train_loss": -6.247125625610352, "global_step": 105205, "epoch": 2504} {"train_loss": -6.399776458740234, "global_step": 105206, "epoch": 2504} {"train_loss": -6.251733779907227, "global_step": 105207, "epoch": 2504} {"train_loss": -6.356199741363525, "global_step": 105208, "epoch": 2504} {"train_loss": -6.393910124188378, "global_step": 105209, "epoch": 2504, "val_loss": 76135.9765625} {"train_loss": -6.3808913230896, "global_step": 105210, "epoch": 2505} {"train_loss": -6.299269199371338, "global_step": 105211, "epoch": 2505} {"train_loss": -6.335009574890137, "global_step": 105212, "epoch": 2505} {"train_loss": -6.260971546173096, "global_step": 105213, "epoch": 2505} {"train_loss": -6.247394561767578, "global_step": 105214, "epoch": 2505} {"train_loss": -6.330719947814941, "global_step": 105215, "epoch": 2505} {"train_loss": -6.291705131530762, "global_step": 105216, "epoch": 2505} {"train_loss": -6.296449661254883, "global_step": 105217, "epoch": 2505} {"train_loss": -6.254197120666504, "global_step": 105218, "epoch": 2505} {"train_loss": -6.303201198577881, "global_step": 105219, "epoch": 2505} {"train_loss": -6.328467845916748, "global_step": 105220, "epoch": 2505} {"train_loss": -6.287241458892822, "global_step": 105221, "epoch": 2505} {"train_loss": -6.445959091186523, "global_step": 105222, "epoch": 2505} {"train_loss": -6.429576873779297, "global_step": 105223, "epoch": 2505} {"train_loss": -6.368263244628906, "global_step": 105224, "epoch": 2505} {"train_loss": -6.337902069091797, "global_step": 105225, "epoch": 2505} {"train_loss": -6.41491174697876, "global_step": 105226, "epoch": 2505} {"train_loss": -6.507099151611328, "global_step": 105227, "epoch": 2505} {"train_loss": -6.346785545349121, "global_step": 105228, "epoch": 2505} {"train_loss": -6.310712814331055, "global_step": 105229, "epoch": 2505} {"train_loss": -6.352786064147949, "global_step": 105230, "epoch": 2505} {"train_loss": -6.4040422439575195, "global_step": 105231, "epoch": 2505} {"train_loss": -6.3120832443237305, "global_step": 105232, "epoch": 2505} {"train_loss": -6.442289352416992, "global_step": 105233, "epoch": 2505} {"train_loss": -6.40538215637207, "global_step": 105234, "epoch": 2505} {"train_loss": -6.378389358520508, "global_step": 105235, "epoch": 2505} {"train_loss": -6.380249977111816, "global_step": 105236, "epoch": 2505} {"train_loss": -6.458834648132324, "global_step": 105237, "epoch": 2505} {"train_loss": -6.403077602386475, "global_step": 105238, "epoch": 2505} {"train_loss": -6.363434791564941, "global_step": 105239, "epoch": 2505} {"train_loss": -6.373377799987793, "global_step": 105240, "epoch": 2505} {"train_loss": -6.415464401245117, "global_step": 105241, "epoch": 2505} {"train_loss": -6.390940189361572, "global_step": 105242, "epoch": 2505} {"train_loss": -6.427560806274414, "global_step": 105243, "epoch": 2505} {"train_loss": -6.448690414428711, "global_step": 105244, "epoch": 2505} {"train_loss": -6.420835494995117, "global_step": 105245, "epoch": 2505} {"train_loss": -6.306526184082031, "global_step": 105246, "epoch": 2505} {"train_loss": -6.551215171813965, "global_step": 105247, "epoch": 2505} {"train_loss": -6.328943252563477, "global_step": 105248, "epoch": 2505} {"train_loss": -6.442624568939209, "global_step": 105249, "epoch": 2505} {"train_loss": -6.454953193664551, "global_step": 105250, "epoch": 2505} {"train_loss": -6.370385408401489, "global_step": 105251, "epoch": 2505, "val_loss": 76058.671875} {"train_loss": -6.395138740539551, "global_step": 105252, "epoch": 2506} {"train_loss": -6.373427867889404, "global_step": 105253, "epoch": 2506} {"train_loss": -6.465944290161133, "global_step": 105254, "epoch": 2506} {"train_loss": -6.405481338500977, "global_step": 105255, "epoch": 2506} {"train_loss": -6.3783650398254395, "global_step": 105256, "epoch": 2506} {"train_loss": -6.37525749206543, "global_step": 105257, "epoch": 2506} {"train_loss": -6.49237060546875, "global_step": 105258, "epoch": 2506} {"train_loss": -6.343874931335449, "global_step": 105259, "epoch": 2506} {"train_loss": -6.404843330383301, "global_step": 105260, "epoch": 2506} {"train_loss": -6.359630584716797, "global_step": 105261, "epoch": 2506} {"train_loss": -6.277422904968262, "global_step": 105262, "epoch": 2506} {"train_loss": -6.378022193908691, "global_step": 105263, "epoch": 2506} {"train_loss": -6.348806381225586, "global_step": 105264, "epoch": 2506} {"train_loss": -6.50438117980957, "global_step": 105265, "epoch": 2506} {"train_loss": -6.351969242095947, "global_step": 105266, "epoch": 2506} {"train_loss": -6.420983791351318, "global_step": 105267, "epoch": 2506} {"train_loss": -6.435747146606445, "global_step": 105268, "epoch": 2506} {"train_loss": -6.374449253082275, "global_step": 105269, "epoch": 2506} {"train_loss": -6.413538932800293, "global_step": 105270, "epoch": 2506} {"train_loss": -6.397237777709961, "global_step": 105271, "epoch": 2506} {"train_loss": -6.450502872467041, "global_step": 105272, "epoch": 2506} {"train_loss": -6.463660717010498, "global_step": 105273, "epoch": 2506} {"train_loss": -6.363272666931152, "global_step": 105274, "epoch": 2506} {"train_loss": -6.476675033569336, "global_step": 105275, "epoch": 2506} {"train_loss": -6.320463180541992, "global_step": 105276, "epoch": 2506} {"train_loss": -6.507475852966309, "global_step": 105277, "epoch": 2506} {"train_loss": -6.430934906005859, "global_step": 105278, "epoch": 2506} {"train_loss": -6.503896236419678, "global_step": 105279, "epoch": 2506} {"train_loss": -6.564748764038086, "global_step": 105280, "epoch": 2506} {"train_loss": -6.453366279602051, "global_step": 105281, "epoch": 2506} {"train_loss": -6.465395927429199, "global_step": 105282, "epoch": 2506} {"train_loss": -6.461310863494873, "global_step": 105283, "epoch": 2506} {"train_loss": -6.455097198486328, "global_step": 105284, "epoch": 2506} {"train_loss": -6.5796308517456055, "global_step": 105285, "epoch": 2506} {"train_loss": -6.449737071990967, "global_step": 105286, "epoch": 2506} {"train_loss": -6.370012283325195, "global_step": 105287, "epoch": 2506} {"train_loss": -6.313628673553467, "global_step": 105288, "epoch": 2506} {"train_loss": -6.420188903808594, "global_step": 105289, "epoch": 2506} {"train_loss": -6.413162708282471, "global_step": 105290, "epoch": 2506} {"train_loss": -6.456494331359863, "global_step": 105291, "epoch": 2506} {"train_loss": -6.260435104370117, "global_step": 105292, "epoch": 2506} {"train_loss": -6.414173466818673, "global_step": 105293, "epoch": 2506, "val_loss": 75799.5078125} {"train_loss": -6.370136260986328, "global_step": 105294, "epoch": 2507} {"train_loss": -6.314525127410889, "global_step": 105295, "epoch": 2507} {"train_loss": -6.39326286315918, "global_step": 105296, "epoch": 2507} {"train_loss": -6.439108848571777, "global_step": 105297, "epoch": 2507} {"train_loss": -6.3258209228515625, "global_step": 105298, "epoch": 2507} {"train_loss": -6.452158451080322, "global_step": 105299, "epoch": 2507} {"train_loss": -6.300299644470215, "global_step": 105300, "epoch": 2507} {"train_loss": -6.4811248779296875, "global_step": 105301, "epoch": 2507} {"train_loss": -6.3618621826171875, "global_step": 105302, "epoch": 2507} {"train_loss": -6.355398654937744, "global_step": 105303, "epoch": 2507} {"train_loss": -6.350170135498047, "global_step": 105304, "epoch": 2507} {"train_loss": -6.400338172912598, "global_step": 105305, "epoch": 2507} {"train_loss": -6.322073936462402, "global_step": 105306, "epoch": 2507} {"train_loss": -6.397588729858398, "global_step": 105307, "epoch": 2507} {"train_loss": -6.295485496520996, "global_step": 105308, "epoch": 2507} {"train_loss": -6.193131446838379, "global_step": 105309, "epoch": 2507} {"train_loss": -6.350174427032471, "global_step": 105310, "epoch": 2507} {"train_loss": -6.358685493469238, "global_step": 105311, "epoch": 2507} {"train_loss": -6.2869873046875, "global_step": 105312, "epoch": 2507} {"train_loss": -6.2178192138671875, "global_step": 105313, "epoch": 2507} {"train_loss": -6.452536582946777, "global_step": 105314, "epoch": 2507} {"train_loss": -6.360202789306641, "global_step": 105315, "epoch": 2507} {"train_loss": -6.261014938354492, "global_step": 105316, "epoch": 2507} {"train_loss": -6.233057975769043, "global_step": 105317, "epoch": 2507} {"train_loss": -6.361430644989014, "global_step": 105318, "epoch": 2507} {"train_loss": -6.398438453674316, "global_step": 105319, "epoch": 2507} {"train_loss": -6.437774658203125, "global_step": 105320, "epoch": 2507} {"train_loss": -6.430820465087891, "global_step": 105321, "epoch": 2507} {"train_loss": -6.477389335632324, "global_step": 105322, "epoch": 2507} {"train_loss": -6.409769058227539, "global_step": 105323, "epoch": 2507} {"train_loss": -6.41231632232666, "global_step": 105324, "epoch": 2507} {"train_loss": -6.456982612609863, "global_step": 105325, "epoch": 2507} {"train_loss": -6.347474575042725, "global_step": 105326, "epoch": 2507} {"train_loss": -6.423757553100586, "global_step": 105327, "epoch": 2507} {"train_loss": -6.521960258483887, "global_step": 105328, "epoch": 2507} {"train_loss": -6.44881534576416, "global_step": 105329, "epoch": 2507} {"train_loss": -6.443328380584717, "global_step": 105330, "epoch": 2507} {"train_loss": -6.474422454833984, "global_step": 105331, "epoch": 2507} {"train_loss": -6.481472492218018, "global_step": 105332, "epoch": 2507} {"train_loss": -6.4573469161987305, "global_step": 105333, "epoch": 2507} {"train_loss": -6.59594202041626, "global_step": 105334, "epoch": 2507} {"train_loss": -6.38625305039542, "global_step": 105335, "epoch": 2507, "val_loss": 75967.1875} {"train_loss": -6.43453311920166, "global_step": 105336, "epoch": 2508} {"train_loss": -6.4474382400512695, "global_step": 105337, "epoch": 2508} {"train_loss": -6.478099822998047, "global_step": 105338, "epoch": 2508} {"train_loss": -6.372570037841797, "global_step": 105339, "epoch": 2508} {"train_loss": -6.4375481605529785, "global_step": 105340, "epoch": 2508} {"train_loss": -6.464566230773926, "global_step": 105341, "epoch": 2508} {"train_loss": -6.432743072509766, "global_step": 105342, "epoch": 2508} {"train_loss": -6.20756196975708, "global_step": 105343, "epoch": 2508} {"train_loss": -6.243983268737793, "global_step": 105344, "epoch": 2508} {"train_loss": -6.3363447189331055, "global_step": 105345, "epoch": 2508} {"train_loss": -6.355295658111572, "global_step": 105346, "epoch": 2508} {"train_loss": -6.276595592498779, "global_step": 105347, "epoch": 2508} {"train_loss": -6.437488079071045, "global_step": 105348, "epoch": 2508} {"train_loss": -6.312567710876465, "global_step": 105349, "epoch": 2508} {"train_loss": -6.353294849395752, "global_step": 105350, "epoch": 2508} {"train_loss": -6.385969161987305, "global_step": 105351, "epoch": 2508} {"train_loss": -6.411468982696533, "global_step": 105352, "epoch": 2508} {"train_loss": -6.381519317626953, "global_step": 105353, "epoch": 2508} {"train_loss": -6.457677364349365, "global_step": 105354, "epoch": 2508} {"train_loss": -6.411930561065674, "global_step": 105355, "epoch": 2508} {"train_loss": -6.3553667068481445, "global_step": 105356, "epoch": 2508} {"train_loss": -6.394598007202148, "global_step": 105357, "epoch": 2508} {"train_loss": -6.409124374389648, "global_step": 105358, "epoch": 2508} {"train_loss": -6.459261894226074, "global_step": 105359, "epoch": 2508} {"train_loss": -6.499992370605469, "global_step": 105360, "epoch": 2508} {"train_loss": -6.418972969055176, "global_step": 105361, "epoch": 2508} {"train_loss": -6.531630516052246, "global_step": 105362, "epoch": 2508} {"train_loss": -6.531984329223633, "global_step": 105363, "epoch": 2508} {"train_loss": -6.267147064208984, "global_step": 105364, "epoch": 2508} {"train_loss": -6.468378067016602, "global_step": 105365, "epoch": 2508} {"train_loss": -6.451813697814941, "global_step": 105366, "epoch": 2508} {"train_loss": -6.439350128173828, "global_step": 105367, "epoch": 2508} {"train_loss": -6.321094512939453, "global_step": 105368, "epoch": 2508} {"train_loss": -6.447434425354004, "global_step": 105369, "epoch": 2508} {"train_loss": -6.428531169891357, "global_step": 105370, "epoch": 2508} {"train_loss": -6.463593006134033, "global_step": 105371, "epoch": 2508} {"train_loss": -6.286680221557617, "global_step": 105372, "epoch": 2508} {"train_loss": -6.41070032119751, "global_step": 105373, "epoch": 2508} {"train_loss": -6.4111328125, "global_step": 105374, "epoch": 2508} {"train_loss": -6.558071136474609, "global_step": 105375, "epoch": 2508} {"train_loss": -6.35103702545166, "global_step": 105376, "epoch": 2508} {"train_loss": -6.403695458457584, "global_step": 105377, "epoch": 2508, "val_loss": 76141.25} {"train_loss": -6.403473854064941, "global_step": 105378, "epoch": 2509} {"train_loss": -6.394360542297363, "global_step": 105379, "epoch": 2509} {"train_loss": -6.464578628540039, "global_step": 105380, "epoch": 2509} {"train_loss": -6.3365254402160645, "global_step": 105381, "epoch": 2509} {"train_loss": -6.42603874206543, "global_step": 105382, "epoch": 2509} {"train_loss": -6.423102378845215, "global_step": 105383, "epoch": 2509} {"train_loss": -6.436555862426758, "global_step": 105384, "epoch": 2509} {"train_loss": -6.49338436126709, "global_step": 105385, "epoch": 2509} {"train_loss": -6.4280686378479, "global_step": 105386, "epoch": 2509} {"train_loss": -6.329809188842773, "global_step": 105387, "epoch": 2509} {"train_loss": -6.525498390197754, "global_step": 105388, "epoch": 2509} {"train_loss": -6.303566932678223, "global_step": 105389, "epoch": 2509} {"train_loss": -6.349392890930176, "global_step": 105390, "epoch": 2509} {"train_loss": -6.425505638122559, "global_step": 105391, "epoch": 2509} {"train_loss": -6.39936637878418, "global_step": 105392, "epoch": 2509} {"train_loss": -6.544883728027344, "global_step": 105393, "epoch": 2509} {"train_loss": -6.413389682769775, "global_step": 105394, "epoch": 2509} {"train_loss": -6.351450443267822, "global_step": 105395, "epoch": 2509} {"train_loss": -6.375582695007324, "global_step": 105396, "epoch": 2509} {"train_loss": -6.290866851806641, "global_step": 105397, "epoch": 2509} {"train_loss": -6.384607315063477, "global_step": 105398, "epoch": 2509} {"train_loss": -6.504981517791748, "global_step": 105399, "epoch": 2509} {"train_loss": -6.409049987792969, "global_step": 105400, "epoch": 2509} {"train_loss": -6.441018581390381, "global_step": 105401, "epoch": 2509} {"train_loss": -6.408219814300537, "global_step": 105402, "epoch": 2509} {"train_loss": -6.5137858390808105, "global_step": 105403, "epoch": 2509} {"train_loss": -6.4270524978637695, "global_step": 105404, "epoch": 2509} {"train_loss": -6.380795478820801, "global_step": 105405, "epoch": 2509} {"train_loss": -6.467024803161621, "global_step": 105406, "epoch": 2509} {"train_loss": -6.401612281799316, "global_step": 105407, "epoch": 2509} {"train_loss": -6.478849411010742, "global_step": 105408, "epoch": 2509} {"train_loss": -6.458588600158691, "global_step": 105409, "epoch": 2509} {"train_loss": -6.452659606933594, "global_step": 105410, "epoch": 2509} {"train_loss": -6.454705238342285, "global_step": 105411, "epoch": 2509} {"train_loss": -6.459728240966797, "global_step": 105412, "epoch": 2509} {"train_loss": -6.401367664337158, "global_step": 105413, "epoch": 2509} {"train_loss": -6.534708023071289, "global_step": 105414, "epoch": 2509} {"train_loss": -6.330763816833496, "global_step": 105415, "epoch": 2509} {"train_loss": -6.510690689086914, "global_step": 105416, "epoch": 2509} {"train_loss": -6.422332763671875, "global_step": 105417, "epoch": 2509} {"train_loss": -6.376762390136719, "global_step": 105418, "epoch": 2509} {"train_loss": -6.424015919367473, "global_step": 105419, "epoch": 2509, "val_loss": 76232.1640625} {"train_loss": -6.415661811828613, "global_step": 105420, "epoch": 2510} {"train_loss": -6.456382751464844, "global_step": 105421, "epoch": 2510} {"train_loss": -6.41889762878418, "global_step": 105422, "epoch": 2510} {"train_loss": -6.458218097686768, "global_step": 105423, "epoch": 2510} {"train_loss": -6.557486534118652, "global_step": 105424, "epoch": 2510} {"train_loss": -6.474054336547852, "global_step": 105425, "epoch": 2510} {"train_loss": -6.361832618713379, "global_step": 105426, "epoch": 2510} {"train_loss": -6.404019355773926, "global_step": 105427, "epoch": 2510} {"train_loss": -6.35546875, "global_step": 105428, "epoch": 2510} {"train_loss": -6.407696723937988, "global_step": 105429, "epoch": 2510} {"train_loss": -6.416932106018066, "global_step": 105430, "epoch": 2510} {"train_loss": -6.413107872009277, "global_step": 105431, "epoch": 2510} {"train_loss": -6.381734848022461, "global_step": 105432, "epoch": 2510} {"train_loss": -6.4002861976623535, "global_step": 105433, "epoch": 2510} {"train_loss": -6.28967809677124, "global_step": 105434, "epoch": 2510} {"train_loss": -6.587910175323486, "global_step": 105435, "epoch": 2510} {"train_loss": -6.296459674835205, "global_step": 105436, "epoch": 2510} {"train_loss": -6.360670566558838, "global_step": 105437, "epoch": 2510} {"train_loss": -6.398904800415039, "global_step": 105438, "epoch": 2510} {"train_loss": -6.422603607177734, "global_step": 105439, "epoch": 2510} {"train_loss": -6.496039390563965, "global_step": 105440, "epoch": 2510} {"train_loss": -6.432324409484863, "global_step": 105441, "epoch": 2510} {"train_loss": -6.569293022155762, "global_step": 105442, "epoch": 2510} {"train_loss": -6.346032619476318, "global_step": 105443, "epoch": 2510} {"train_loss": -6.377017021179199, "global_step": 105444, "epoch": 2510} {"train_loss": -6.441489219665527, "global_step": 105445, "epoch": 2510} {"train_loss": -6.417935848236084, "global_step": 105446, "epoch": 2510} {"train_loss": -6.385128021240234, "global_step": 105447, "epoch": 2510} {"train_loss": -6.389620304107666, "global_step": 105448, "epoch": 2510} {"train_loss": -6.270549774169922, "global_step": 105449, "epoch": 2510} {"train_loss": -6.4583210945129395, "global_step": 105450, "epoch": 2510} {"train_loss": -6.480517864227295, "global_step": 105451, "epoch": 2510} {"train_loss": -6.391288757324219, "global_step": 105452, "epoch": 2510} {"train_loss": -6.3911333084106445, "global_step": 105453, "epoch": 2510} {"train_loss": -6.422630786895752, "global_step": 105454, "epoch": 2510} {"train_loss": -6.343097686767578, "global_step": 105455, "epoch": 2510} {"train_loss": -6.411567211151123, "global_step": 105456, "epoch": 2510} {"train_loss": -6.4518585205078125, "global_step": 105457, "epoch": 2510} {"train_loss": -6.441553115844727, "global_step": 105458, "epoch": 2510} {"train_loss": -6.41062593460083, "global_step": 105459, "epoch": 2510} {"train_loss": -6.495623588562012, "global_step": 105460, "epoch": 2510} {"train_loss": -6.419181494485764, "global_step": 105461, "epoch": 2510, "val_loss": 76166.8046875} {"train_loss": -6.5432634353637695, "global_step": 105462, "epoch": 2511} {"train_loss": -6.5202789306640625, "global_step": 105463, "epoch": 2511} {"train_loss": -6.430027961730957, "global_step": 105464, "epoch": 2511} {"train_loss": -6.438017845153809, "global_step": 105465, "epoch": 2511} {"train_loss": -6.361846923828125, "global_step": 105466, "epoch": 2511} {"train_loss": -6.513185501098633, "global_step": 105467, "epoch": 2511} {"train_loss": -6.411843299865723, "global_step": 105468, "epoch": 2511} {"train_loss": -6.3477935791015625, "global_step": 105469, "epoch": 2511} {"train_loss": -6.419744491577148, "global_step": 105470, "epoch": 2511} {"train_loss": -6.365231513977051, "global_step": 105471, "epoch": 2511} {"train_loss": -6.506354331970215, "global_step": 105472, "epoch": 2511} {"train_loss": -6.291385173797607, "global_step": 105473, "epoch": 2511} {"train_loss": -6.363649368286133, "global_step": 105474, "epoch": 2511} {"train_loss": -6.352015495300293, "global_step": 105475, "epoch": 2511} {"train_loss": -6.262823104858398, "global_step": 105476, "epoch": 2511} {"train_loss": -6.536938667297363, "global_step": 105477, "epoch": 2511} {"train_loss": -6.322687149047852, "global_step": 105478, "epoch": 2511} {"train_loss": -6.320316314697266, "global_step": 105479, "epoch": 2511} {"train_loss": -6.4042205810546875, "global_step": 105480, "epoch": 2511} {"train_loss": -6.351675510406494, "global_step": 105481, "epoch": 2511} {"train_loss": -6.473851203918457, "global_step": 105482, "epoch": 2511} {"train_loss": -6.394952297210693, "global_step": 105483, "epoch": 2511} {"train_loss": -6.328223705291748, "global_step": 105484, "epoch": 2511} {"train_loss": -6.475688934326172, "global_step": 105485, "epoch": 2511} {"train_loss": -6.282407760620117, "global_step": 105486, "epoch": 2511} {"train_loss": -6.437913417816162, "global_step": 105487, "epoch": 2511} {"train_loss": -6.387361526489258, "global_step": 105488, "epoch": 2511} {"train_loss": -6.2858500480651855, "global_step": 105489, "epoch": 2511} {"train_loss": -6.253157615661621, "global_step": 105490, "epoch": 2511} {"train_loss": -6.451545715332031, "global_step": 105491, "epoch": 2511} {"train_loss": -6.328523635864258, "global_step": 105492, "epoch": 2511} {"train_loss": -6.36603307723999, "global_step": 105493, "epoch": 2511} {"train_loss": -6.4426164627075195, "global_step": 105494, "epoch": 2511} {"train_loss": -6.413880348205566, "global_step": 105495, "epoch": 2511} {"train_loss": -6.410490036010742, "global_step": 105496, "epoch": 2511} {"train_loss": -6.568532466888428, "global_step": 105497, "epoch": 2511} {"train_loss": -6.302722930908203, "global_step": 105498, "epoch": 2511} {"train_loss": -6.43189811706543, "global_step": 105499, "epoch": 2511} {"train_loss": -6.380285739898682, "global_step": 105500, "epoch": 2511} {"train_loss": -6.308289051055908, "global_step": 105501, "epoch": 2511} {"train_loss": -6.402995586395264, "global_step": 105502, "epoch": 2511} {"train_loss": -6.394463981900897, "global_step": 105503, "epoch": 2511, "val_loss": 76157.3359375} {"train_loss": -6.4120965003967285, "global_step": 105504, "epoch": 2512} {"train_loss": -6.380929470062256, "global_step": 105505, "epoch": 2512} {"train_loss": -6.473576545715332, "global_step": 105506, "epoch": 2512} {"train_loss": -6.363913059234619, "global_step": 105507, "epoch": 2512} {"train_loss": -6.3244242668151855, "global_step": 105508, "epoch": 2512} {"train_loss": -6.493148326873779, "global_step": 105509, "epoch": 2512} {"train_loss": -6.41560173034668, "global_step": 105510, "epoch": 2512} {"train_loss": -6.524313449859619, "global_step": 105511, "epoch": 2512} {"train_loss": -6.401511192321777, "global_step": 105512, "epoch": 2512} {"train_loss": -6.4484710693359375, "global_step": 105513, "epoch": 2512} {"train_loss": -6.3901567459106445, "global_step": 105514, "epoch": 2512} {"train_loss": -6.444613456726074, "global_step": 105515, "epoch": 2512} {"train_loss": -6.542851448059082, "global_step": 105516, "epoch": 2512} {"train_loss": -6.412698745727539, "global_step": 105517, "epoch": 2512} {"train_loss": -6.477007865905762, "global_step": 105518, "epoch": 2512} {"train_loss": -6.364510536193848, "global_step": 105519, "epoch": 2512} {"train_loss": -6.374053001403809, "global_step": 105520, "epoch": 2512} {"train_loss": -6.326127052307129, "global_step": 105521, "epoch": 2512} {"train_loss": -6.3699846267700195, "global_step": 105522, "epoch": 2512} {"train_loss": -6.4927520751953125, "global_step": 105523, "epoch": 2512} {"train_loss": -6.430315971374512, "global_step": 105524, "epoch": 2512} {"train_loss": -6.426203727722168, "global_step": 105525, "epoch": 2512} {"train_loss": -6.456055164337158, "global_step": 105526, "epoch": 2512} {"train_loss": -6.41860294342041, "global_step": 105527, "epoch": 2512} {"train_loss": -6.4276580810546875, "global_step": 105528, "epoch": 2512} {"train_loss": -6.478096961975098, "global_step": 105529, "epoch": 2512} {"train_loss": -6.364719390869141, "global_step": 105530, "epoch": 2512} {"train_loss": -6.380448341369629, "global_step": 105531, "epoch": 2512} {"train_loss": -6.394585609436035, "global_step": 105532, "epoch": 2512} {"train_loss": -6.380577087402344, "global_step": 105533, "epoch": 2512} {"train_loss": -6.403374195098877, "global_step": 105534, "epoch": 2512} {"train_loss": -6.356719017028809, "global_step": 105535, "epoch": 2512} {"train_loss": -6.525677680969238, "global_step": 105536, "epoch": 2512} {"train_loss": -6.49530029296875, "global_step": 105537, "epoch": 2512} {"train_loss": -6.250499248504639, "global_step": 105538, "epoch": 2512} {"train_loss": -6.3888702392578125, "global_step": 105539, "epoch": 2512} {"train_loss": -6.433599472045898, "global_step": 105540, "epoch": 2512} {"train_loss": -6.325318336486816, "global_step": 105541, "epoch": 2512} {"train_loss": -6.443634510040283, "global_step": 105542, "epoch": 2512} {"train_loss": -6.354177474975586, "global_step": 105543, "epoch": 2512} {"train_loss": -6.470425128936768, "global_step": 105544, "epoch": 2512} {"train_loss": -6.4140124434516546, "global_step": 105545, "epoch": 2512, "val_loss": 75953.671875} {"train_loss": -6.417696952819824, "global_step": 105546, "epoch": 2513} {"train_loss": -6.406195163726807, "global_step": 105547, "epoch": 2513} {"train_loss": -6.340256214141846, "global_step": 105548, "epoch": 2513} {"train_loss": -6.3881516456604, "global_step": 105549, "epoch": 2513} {"train_loss": -6.366130828857422, "global_step": 105550, "epoch": 2513} {"train_loss": -6.431492328643799, "global_step": 105551, "epoch": 2513} {"train_loss": -6.499832630157471, "global_step": 105552, "epoch": 2513} {"train_loss": -6.505720138549805, "global_step": 105553, "epoch": 2513} {"train_loss": -6.49556827545166, "global_step": 105554, "epoch": 2513} {"train_loss": -6.527910232543945, "global_step": 105555, "epoch": 2513} {"train_loss": -6.477765083312988, "global_step": 105556, "epoch": 2513} {"train_loss": -6.393523693084717, "global_step": 105557, "epoch": 2513} {"train_loss": -6.473498344421387, "global_step": 105558, "epoch": 2513} {"train_loss": -6.502886772155762, "global_step": 105559, "epoch": 2513} {"train_loss": -6.400164604187012, "global_step": 105560, "epoch": 2513} {"train_loss": -6.4701337814331055, "global_step": 105561, "epoch": 2513} {"train_loss": -6.4845967292785645, "global_step": 105562, "epoch": 2513} {"train_loss": -6.372278213500977, "global_step": 105563, "epoch": 2513} {"train_loss": -6.435307025909424, "global_step": 105564, "epoch": 2513} {"train_loss": -6.4106292724609375, "global_step": 105565, "epoch": 2513} {"train_loss": -6.421746730804443, "global_step": 105566, "epoch": 2513} {"train_loss": -6.419241905212402, "global_step": 105567, "epoch": 2513} {"train_loss": -6.310975074768066, "global_step": 105568, "epoch": 2513} {"train_loss": -6.5347442626953125, "global_step": 105569, "epoch": 2513} {"train_loss": -6.519197940826416, "global_step": 105570, "epoch": 2513} {"train_loss": -6.406469821929932, "global_step": 105571, "epoch": 2513} {"train_loss": -6.380178451538086, "global_step": 105572, "epoch": 2513} {"train_loss": -6.599005222320557, "global_step": 105573, "epoch": 2513} {"train_loss": -6.559096336364746, "global_step": 105574, "epoch": 2513} {"train_loss": -6.463250160217285, "global_step": 105575, "epoch": 2513} {"train_loss": -6.539177894592285, "global_step": 105576, "epoch": 2513} {"train_loss": -6.351479530334473, "global_step": 105577, "epoch": 2513} {"train_loss": -6.417783737182617, "global_step": 105578, "epoch": 2513} {"train_loss": -6.433053493499756, "global_step": 105579, "epoch": 2513} {"train_loss": -6.375626087188721, "global_step": 105580, "epoch": 2513} {"train_loss": -6.502042293548584, "global_step": 105581, "epoch": 2513} {"train_loss": -6.425677299499512, "global_step": 105582, "epoch": 2513} {"train_loss": -6.440404415130615, "global_step": 105583, "epoch": 2513} {"train_loss": -6.387383460998535, "global_step": 105584, "epoch": 2513} {"train_loss": -6.55097770690918, "global_step": 105585, "epoch": 2513} {"train_loss": -6.378840446472168, "global_step": 105586, "epoch": 2513} {"train_loss": -6.444562412443615, "global_step": 105587, "epoch": 2513, "val_loss": 75944.8359375} {"train_loss": -6.425644874572754, "global_step": 105588, "epoch": 2514} {"train_loss": -6.522818088531494, "global_step": 105589, "epoch": 2514} {"train_loss": -6.519778251647949, "global_step": 105590, "epoch": 2514} {"train_loss": -6.471473217010498, "global_step": 105591, "epoch": 2514} {"train_loss": -6.371967315673828, "global_step": 105592, "epoch": 2514} {"train_loss": -6.475276947021484, "global_step": 105593, "epoch": 2514} {"train_loss": -6.394980430603027, "global_step": 105594, "epoch": 2514} {"train_loss": -6.5778093338012695, "global_step": 105595, "epoch": 2514} {"train_loss": -6.414645195007324, "global_step": 105596, "epoch": 2514} {"train_loss": -6.4464287757873535, "global_step": 105597, "epoch": 2514} {"train_loss": -6.4084391593933105, "global_step": 105598, "epoch": 2514} {"train_loss": -6.5102763175964355, "global_step": 105599, "epoch": 2514} {"train_loss": -6.49729061126709, "global_step": 105600, "epoch": 2514} {"train_loss": -6.432966709136963, "global_step": 105601, "epoch": 2514} {"train_loss": -6.296446800231934, "global_step": 105602, "epoch": 2514} {"train_loss": -6.519099712371826, "global_step": 105603, "epoch": 2514} {"train_loss": -6.50927734375, "global_step": 105604, "epoch": 2514} {"train_loss": -6.403739929199219, "global_step": 105605, "epoch": 2514} {"train_loss": -6.42283821105957, "global_step": 105606, "epoch": 2514} {"train_loss": -6.385010719299316, "global_step": 105607, "epoch": 2514} {"train_loss": -6.458625793457031, "global_step": 105608, "epoch": 2514} {"train_loss": -6.49160623550415, "global_step": 105609, "epoch": 2514} {"train_loss": -6.441457748413086, "global_step": 105610, "epoch": 2514} {"train_loss": -6.541616916656494, "global_step": 105611, "epoch": 2514} {"train_loss": -6.4347028732299805, "global_step": 105612, "epoch": 2514} {"train_loss": -6.363114356994629, "global_step": 105613, "epoch": 2514} {"train_loss": -6.468632698059082, "global_step": 105614, "epoch": 2514} {"train_loss": -6.402050018310547, "global_step": 105615, "epoch": 2514} {"train_loss": -6.502168655395508, "global_step": 105616, "epoch": 2514} {"train_loss": -6.335935115814209, "global_step": 105617, "epoch": 2514} {"train_loss": -6.383257865905762, "global_step": 105618, "epoch": 2514} {"train_loss": -6.3368730545043945, "global_step": 105619, "epoch": 2514} {"train_loss": -6.402423858642578, "global_step": 105620, "epoch": 2514} {"train_loss": -6.358996391296387, "global_step": 105621, "epoch": 2514} {"train_loss": -6.469938278198242, "global_step": 105622, "epoch": 2514} {"train_loss": -6.352970123291016, "global_step": 105623, "epoch": 2514} {"train_loss": -6.419412612915039, "global_step": 105624, "epoch": 2514} {"train_loss": -6.475381851196289, "global_step": 105625, "epoch": 2514} {"train_loss": -6.334593772888184, "global_step": 105626, "epoch": 2514} {"train_loss": -6.429862022399902, "global_step": 105627, "epoch": 2514} {"train_loss": -6.466300964355469, "global_step": 105628, "epoch": 2514} {"train_loss": -6.434710014434088, "global_step": 105629, "epoch": 2514, "val_loss": 76038.2265625} {"train_loss": -6.455181121826172, "global_step": 105630, "epoch": 2515} {"train_loss": -6.444029808044434, "global_step": 105631, "epoch": 2515} {"train_loss": -6.550545692443848, "global_step": 105632, "epoch": 2515} {"train_loss": -6.387930393218994, "global_step": 105633, "epoch": 2515} {"train_loss": -6.43513298034668, "global_step": 105634, "epoch": 2515} {"train_loss": -6.5803985595703125, "global_step": 105635, "epoch": 2515} {"train_loss": -6.358518600463867, "global_step": 105636, "epoch": 2515} {"train_loss": -6.240379333496094, "global_step": 105637, "epoch": 2515} {"train_loss": -6.4266510009765625, "global_step": 105638, "epoch": 2515} {"train_loss": -6.264091491699219, "global_step": 105639, "epoch": 2515} {"train_loss": -6.390629768371582, "global_step": 105640, "epoch": 2515} {"train_loss": -6.49839448928833, "global_step": 105641, "epoch": 2515} {"train_loss": -6.377364158630371, "global_step": 105642, "epoch": 2515} {"train_loss": -6.344229221343994, "global_step": 105643, "epoch": 2515} {"train_loss": -6.350919723510742, "global_step": 105644, "epoch": 2515} {"train_loss": -6.515131950378418, "global_step": 105645, "epoch": 2515} {"train_loss": -6.484606742858887, "global_step": 105646, "epoch": 2515} {"train_loss": -6.386569499969482, "global_step": 105647, "epoch": 2515} {"train_loss": -6.400518417358398, "global_step": 105648, "epoch": 2515} {"train_loss": -6.524965286254883, "global_step": 105649, "epoch": 2515} {"train_loss": -6.501021385192871, "global_step": 105650, "epoch": 2515} {"train_loss": -6.461879730224609, "global_step": 105651, "epoch": 2515} {"train_loss": -6.461220741271973, "global_step": 105652, "epoch": 2515} {"train_loss": -6.48955774307251, "global_step": 105653, "epoch": 2515} {"train_loss": -6.513772487640381, "global_step": 105654, "epoch": 2515} {"train_loss": -6.319883346557617, "global_step": 105655, "epoch": 2515} {"train_loss": -6.438770771026611, "global_step": 105656, "epoch": 2515} {"train_loss": -6.474638938903809, "global_step": 105657, "epoch": 2515} {"train_loss": -6.485869407653809, "global_step": 105658, "epoch": 2515} {"train_loss": -6.400309085845947, "global_step": 105659, "epoch": 2515} {"train_loss": -6.370642185211182, "global_step": 105660, "epoch": 2515} {"train_loss": -6.454375267028809, "global_step": 105661, "epoch": 2515} {"train_loss": -6.493289947509766, "global_step": 105662, "epoch": 2515} {"train_loss": -6.463376045227051, "global_step": 105663, "epoch": 2515} {"train_loss": -6.479709148406982, "global_step": 105664, "epoch": 2515} {"train_loss": -6.378537654876709, "global_step": 105665, "epoch": 2515} {"train_loss": -6.524866104125977, "global_step": 105666, "epoch": 2515} {"train_loss": -6.336838722229004, "global_step": 105667, "epoch": 2515} {"train_loss": -6.400481700897217, "global_step": 105668, "epoch": 2515} {"train_loss": -6.485081195831299, "global_step": 105669, "epoch": 2515} {"train_loss": -6.380755424499512, "global_step": 105670, "epoch": 2515} {"train_loss": -6.4326922325860885, "global_step": 105671, "epoch": 2515, "val_loss": 76281.7421875} {"train_loss": -6.438920021057129, "global_step": 105672, "epoch": 2516} {"train_loss": -6.468907356262207, "global_step": 105673, "epoch": 2516} {"train_loss": -6.462611675262451, "global_step": 105674, "epoch": 2516} {"train_loss": -6.478232383728027, "global_step": 105675, "epoch": 2516} {"train_loss": -6.612128257751465, "global_step": 105676, "epoch": 2516} {"train_loss": -6.490157127380371, "global_step": 105677, "epoch": 2516} {"train_loss": -6.337451934814453, "global_step": 105678, "epoch": 2516} {"train_loss": -6.459624290466309, "global_step": 105679, "epoch": 2516} {"train_loss": -6.444787979125977, "global_step": 105680, "epoch": 2516} {"train_loss": -6.450425624847412, "global_step": 105681, "epoch": 2516} {"train_loss": -6.44378662109375, "global_step": 105682, "epoch": 2516} {"train_loss": -6.5752387046813965, "global_step": 105683, "epoch": 2516} {"train_loss": -6.496411323547363, "global_step": 105684, "epoch": 2516} {"train_loss": -6.451488018035889, "global_step": 105685, "epoch": 2516} {"train_loss": -6.4700398445129395, "global_step": 105686, "epoch": 2516} {"train_loss": -6.464733123779297, "global_step": 105687, "epoch": 2516} {"train_loss": -6.46178674697876, "global_step": 105688, "epoch": 2516} {"train_loss": -6.436363220214844, "global_step": 105689, "epoch": 2516} {"train_loss": -6.509228706359863, "global_step": 105690, "epoch": 2516} {"train_loss": -6.407534599304199, "global_step": 105691, "epoch": 2516} {"train_loss": -6.542666912078857, "global_step": 105692, "epoch": 2516} {"train_loss": -6.50479793548584, "global_step": 105693, "epoch": 2516} {"train_loss": -6.416121482849121, "global_step": 105694, "epoch": 2516} {"train_loss": -6.458829879760742, "global_step": 105695, "epoch": 2516} {"train_loss": -6.442748069763184, "global_step": 105696, "epoch": 2516} {"train_loss": -6.420269966125488, "global_step": 105697, "epoch": 2516} {"train_loss": -6.469690322875977, "global_step": 105698, "epoch": 2516} {"train_loss": -6.350585460662842, "global_step": 105699, "epoch": 2516} {"train_loss": -6.3386454582214355, "global_step": 105700, "epoch": 2516} {"train_loss": -6.504612922668457, "global_step": 105701, "epoch": 2516} {"train_loss": -6.449847221374512, "global_step": 105702, "epoch": 2516} {"train_loss": -6.438350677490234, "global_step": 105703, "epoch": 2516} {"train_loss": -6.586919784545898, "global_step": 105704, "epoch": 2516} {"train_loss": -6.310596942901611, "global_step": 105705, "epoch": 2516} {"train_loss": -6.40573787689209, "global_step": 105706, "epoch": 2516} {"train_loss": -6.409302711486816, "global_step": 105707, "epoch": 2516} {"train_loss": -6.381932735443115, "global_step": 105708, "epoch": 2516} {"train_loss": -6.518722057342529, "global_step": 105709, "epoch": 2516} {"train_loss": -6.325355529785156, "global_step": 105710, "epoch": 2516} {"train_loss": -6.35123348236084, "global_step": 105711, "epoch": 2516} {"train_loss": -6.320341110229492, "global_step": 105712, "epoch": 2516} {"train_loss": -6.445047628311884, "global_step": 105713, "epoch": 2516, "val_loss": 76310.9921875} {"train_loss": -6.58359432220459, "global_step": 105714, "epoch": 2517} {"train_loss": -6.361687660217285, "global_step": 105715, "epoch": 2517} {"train_loss": -6.36271333694458, "global_step": 105716, "epoch": 2517} {"train_loss": -6.378045082092285, "global_step": 105717, "epoch": 2517} {"train_loss": -6.371936798095703, "global_step": 105718, "epoch": 2517} {"train_loss": -6.465967655181885, "global_step": 105719, "epoch": 2517} {"train_loss": -6.481844902038574, "global_step": 105720, "epoch": 2517} {"train_loss": -6.413780212402344, "global_step": 105721, "epoch": 2517} {"train_loss": -6.549967288970947, "global_step": 105722, "epoch": 2517} {"train_loss": -6.534788131713867, "global_step": 105723, "epoch": 2517} {"train_loss": -6.392066478729248, "global_step": 105724, "epoch": 2517} {"train_loss": -6.572046756744385, "global_step": 105725, "epoch": 2517} {"train_loss": -6.430942535400391, "global_step": 105726, "epoch": 2517} {"train_loss": -6.460352897644043, "global_step": 105727, "epoch": 2517} {"train_loss": -6.447657585144043, "global_step": 105728, "epoch": 2517} {"train_loss": -6.420783042907715, "global_step": 105729, "epoch": 2517} {"train_loss": -6.435248374938965, "global_step": 105730, "epoch": 2517} {"train_loss": -6.407427787780762, "global_step": 105731, "epoch": 2517} {"train_loss": -6.3935441970825195, "global_step": 105732, "epoch": 2517} {"train_loss": -6.312529563903809, "global_step": 105733, "epoch": 2517} {"train_loss": -6.361793041229248, "global_step": 105734, "epoch": 2517} {"train_loss": -6.391127586364746, "global_step": 105735, "epoch": 2517} {"train_loss": -6.268437385559082, "global_step": 105736, "epoch": 2517} {"train_loss": -6.425868988037109, "global_step": 105737, "epoch": 2517} {"train_loss": -6.310723304748535, "global_step": 105738, "epoch": 2517} {"train_loss": -6.331274032592773, "global_step": 105739, "epoch": 2517} {"train_loss": -6.378249645233154, "global_step": 105740, "epoch": 2517} {"train_loss": -6.168240547180176, "global_step": 105741, "epoch": 2517} {"train_loss": -6.327213287353516, "global_step": 105742, "epoch": 2517} {"train_loss": -6.221038818359375, "global_step": 105743, "epoch": 2517} {"train_loss": -6.296599388122559, "global_step": 105744, "epoch": 2517} {"train_loss": -6.264147758483887, "global_step": 105745, "epoch": 2517} {"train_loss": -6.25712776184082, "global_step": 105746, "epoch": 2517} {"train_loss": -6.195821285247803, "global_step": 105747, "epoch": 2517} {"train_loss": -6.4179840087890625, "global_step": 105748, "epoch": 2517} {"train_loss": -6.240997314453125, "global_step": 105749, "epoch": 2517} {"train_loss": -6.267199516296387, "global_step": 105750, "epoch": 2517} {"train_loss": -6.32581090927124, "global_step": 105751, "epoch": 2517} {"train_loss": -6.284584999084473, "global_step": 105752, "epoch": 2517} {"train_loss": -6.381051063537598, "global_step": 105753, "epoch": 2517} {"train_loss": -6.4309539794921875, "global_step": 105754, "epoch": 2517} {"train_loss": -6.371170146124704, "global_step": 105755, "epoch": 2517, "val_loss": 75796.078125} {"train_loss": -6.372622013092041, "global_step": 105756, "epoch": 2518} {"train_loss": -6.187222480773926, "global_step": 105757, "epoch": 2518} {"train_loss": -6.189848899841309, "global_step": 105758, "epoch": 2518} {"train_loss": -6.443582057952881, "global_step": 105759, "epoch": 2518} {"train_loss": -6.345353603363037, "global_step": 105760, "epoch": 2518} {"train_loss": -6.330313205718994, "global_step": 105761, "epoch": 2518} {"train_loss": -6.2968831062316895, "global_step": 105762, "epoch": 2518} {"train_loss": -6.462830543518066, "global_step": 105763, "epoch": 2518} {"train_loss": -6.42347526550293, "global_step": 105764, "epoch": 2518} {"train_loss": -6.3436384201049805, "global_step": 105765, "epoch": 2518} {"train_loss": -6.404670715332031, "global_step": 105766, "epoch": 2518} {"train_loss": -6.369543075561523, "global_step": 105767, "epoch": 2518} {"train_loss": -6.273149490356445, "global_step": 105768, "epoch": 2518} {"train_loss": -6.5713911056518555, "global_step": 105769, "epoch": 2518} {"train_loss": -6.424219131469727, "global_step": 105770, "epoch": 2518} {"train_loss": -6.461627006530762, "global_step": 105771, "epoch": 2518} {"train_loss": -6.436368942260742, "global_step": 105772, "epoch": 2518} {"train_loss": -6.440193176269531, "global_step": 105773, "epoch": 2518} {"train_loss": -6.417794704437256, "global_step": 105774, "epoch": 2518} {"train_loss": -6.365887641906738, "global_step": 105775, "epoch": 2518} {"train_loss": -6.488511085510254, "global_step": 105776, "epoch": 2518} {"train_loss": -6.448751926422119, "global_step": 105777, "epoch": 2518} {"train_loss": -6.389457702636719, "global_step": 105778, "epoch": 2518} {"train_loss": -6.456287384033203, "global_step": 105779, "epoch": 2518} {"train_loss": -6.401543617248535, "global_step": 105780, "epoch": 2518} {"train_loss": -6.449418067932129, "global_step": 105781, "epoch": 2518} {"train_loss": -6.281463146209717, "global_step": 105782, "epoch": 2518} {"train_loss": -6.356982231140137, "global_step": 105783, "epoch": 2518} {"train_loss": -6.417715549468994, "global_step": 105784, "epoch": 2518} {"train_loss": -6.4449462890625, "global_step": 105785, "epoch": 2518} {"train_loss": -6.5369553565979, "global_step": 105786, "epoch": 2518} {"train_loss": -6.320801734924316, "global_step": 105787, "epoch": 2518} {"train_loss": -6.364209175109863, "global_step": 105788, "epoch": 2518} {"train_loss": -6.364588737487793, "global_step": 105789, "epoch": 2518} {"train_loss": -6.377401351928711, "global_step": 105790, "epoch": 2518} {"train_loss": -6.338803768157959, "global_step": 105791, "epoch": 2518} {"train_loss": -6.336726188659668, "global_step": 105792, "epoch": 2518} {"train_loss": -6.3557329177856445, "global_step": 105793, "epoch": 2518} {"train_loss": -6.525521755218506, "global_step": 105794, "epoch": 2518} {"train_loss": -6.533926963806152, "global_step": 105795, "epoch": 2518} {"train_loss": -6.334464073181152, "global_step": 105796, "epoch": 2518} {"train_loss": -6.391917398997715, "global_step": 105797, "epoch": 2518, "val_loss": 76263.4453125} {"train_loss": -6.386046409606934, "global_step": 105798, "epoch": 2519} {"train_loss": -6.49677848815918, "global_step": 105799, "epoch": 2519} {"train_loss": -6.445992946624756, "global_step": 105800, "epoch": 2519} {"train_loss": -6.450334072113037, "global_step": 105801, "epoch": 2519} {"train_loss": -6.497941970825195, "global_step": 105802, "epoch": 2519} {"train_loss": -6.404939651489258, "global_step": 105803, "epoch": 2519} {"train_loss": -6.450090408325195, "global_step": 105804, "epoch": 2519} {"train_loss": -6.483495235443115, "global_step": 105805, "epoch": 2519} {"train_loss": -6.370648384094238, "global_step": 105806, "epoch": 2519} {"train_loss": -6.436187744140625, "global_step": 105807, "epoch": 2519} {"train_loss": -6.341334342956543, "global_step": 105808, "epoch": 2519} {"train_loss": -6.460999488830566, "global_step": 105809, "epoch": 2519} {"train_loss": -6.342964172363281, "global_step": 105810, "epoch": 2519} {"train_loss": -6.270843505859375, "global_step": 105811, "epoch": 2519} {"train_loss": -6.567380905151367, "global_step": 105812, "epoch": 2519} {"train_loss": -6.362246513366699, "global_step": 105813, "epoch": 2519} {"train_loss": -6.3720598220825195, "global_step": 105814, "epoch": 2519} {"train_loss": -6.501404762268066, "global_step": 105815, "epoch": 2519} {"train_loss": -6.419124603271484, "global_step": 105816, "epoch": 2519} {"train_loss": -6.386908531188965, "global_step": 105817, "epoch": 2519} {"train_loss": -6.360355854034424, "global_step": 105818, "epoch": 2519} {"train_loss": -6.47208833694458, "global_step": 105819, "epoch": 2519} {"train_loss": -6.463543891906738, "global_step": 105820, "epoch": 2519} {"train_loss": -6.379827976226807, "global_step": 105821, "epoch": 2519} {"train_loss": -6.513551235198975, "global_step": 105822, "epoch": 2519} {"train_loss": -6.499682426452637, "global_step": 105823, "epoch": 2519} {"train_loss": -6.3678083419799805, "global_step": 105824, "epoch": 2519} {"train_loss": -6.344616413116455, "global_step": 105825, "epoch": 2519} {"train_loss": -6.4663872718811035, "global_step": 105826, "epoch": 2519} {"train_loss": -6.388118267059326, "global_step": 105827, "epoch": 2519} {"train_loss": -6.394133567810059, "global_step": 105828, "epoch": 2519} {"train_loss": -6.409093379974365, "global_step": 105829, "epoch": 2519} {"train_loss": -6.391519546508789, "global_step": 105830, "epoch": 2519} {"train_loss": -6.303654670715332, "global_step": 105831, "epoch": 2519} {"train_loss": -6.359400749206543, "global_step": 105832, "epoch": 2519} {"train_loss": -6.480284690856934, "global_step": 105833, "epoch": 2519} {"train_loss": -6.447020530700684, "global_step": 105834, "epoch": 2519} {"train_loss": -6.400737762451172, "global_step": 105835, "epoch": 2519} {"train_loss": -6.245793342590332, "global_step": 105836, "epoch": 2519} {"train_loss": -6.271119117736816, "global_step": 105837, "epoch": 2519} {"train_loss": -6.457301139831543, "global_step": 105838, "epoch": 2519} {"train_loss": -6.408614919299171, "global_step": 105839, "epoch": 2519, "val_loss": 76073.953125} {"train_loss": -6.487685203552246, "global_step": 105840, "epoch": 2520} {"train_loss": -6.336289882659912, "global_step": 105841, "epoch": 2520} {"train_loss": -6.382201194763184, "global_step": 105842, "epoch": 2520} {"train_loss": -6.371549606323242, "global_step": 105843, "epoch": 2520} {"train_loss": -6.512294769287109, "global_step": 105844, "epoch": 2520} {"train_loss": -6.454442501068115, "global_step": 105845, "epoch": 2520} {"train_loss": -6.3492960929870605, "global_step": 105846, "epoch": 2520} {"train_loss": -6.392679214477539, "global_step": 105847, "epoch": 2520} {"train_loss": -6.358124732971191, "global_step": 105848, "epoch": 2520} {"train_loss": -6.391513824462891, "global_step": 105849, "epoch": 2520} {"train_loss": -6.448321342468262, "global_step": 105850, "epoch": 2520} {"train_loss": -6.426621437072754, "global_step": 105851, "epoch": 2520} {"train_loss": -6.429362773895264, "global_step": 105852, "epoch": 2520} {"train_loss": -6.524659156799316, "global_step": 105853, "epoch": 2520} {"train_loss": -6.490447044372559, "global_step": 105854, "epoch": 2520} {"train_loss": -6.39906120300293, "global_step": 105855, "epoch": 2520} {"train_loss": -6.566125392913818, "global_step": 105856, "epoch": 2520} {"train_loss": -6.467037677764893, "global_step": 105857, "epoch": 2520} {"train_loss": -6.421180725097656, "global_step": 105858, "epoch": 2520} {"train_loss": -6.527440547943115, "global_step": 105859, "epoch": 2520} {"train_loss": -6.403975963592529, "global_step": 105860, "epoch": 2520} {"train_loss": -6.5308403968811035, "global_step": 105861, "epoch": 2520} {"train_loss": -6.528154373168945, "global_step": 105862, "epoch": 2520} {"train_loss": -6.483736038208008, "global_step": 105863, "epoch": 2520} {"train_loss": -6.40648889541626, "global_step": 105864, "epoch": 2520} {"train_loss": -6.460283279418945, "global_step": 105865, "epoch": 2520} {"train_loss": -6.440659523010254, "global_step": 105866, "epoch": 2520} {"train_loss": -6.539031982421875, "global_step": 105867, "epoch": 2520} {"train_loss": -6.509890556335449, "global_step": 105868, "epoch": 2520} {"train_loss": -6.499860763549805, "global_step": 105869, "epoch": 2520} {"train_loss": -6.329350471496582, "global_step": 105870, "epoch": 2520} {"train_loss": -6.515763759613037, "global_step": 105871, "epoch": 2520} {"train_loss": -6.450572967529297, "global_step": 105872, "epoch": 2520} {"train_loss": -6.408438205718994, "global_step": 105873, "epoch": 2520} {"train_loss": -6.4543609619140625, "global_step": 105874, "epoch": 2520} {"train_loss": -6.4645891189575195, "global_step": 105875, "epoch": 2520} {"train_loss": -6.513054847717285, "global_step": 105876, "epoch": 2520} {"train_loss": -6.422014236450195, "global_step": 105877, "epoch": 2520} {"train_loss": -6.319245338439941, "global_step": 105878, "epoch": 2520} {"train_loss": -6.4992475509643555, "global_step": 105879, "epoch": 2520} {"train_loss": -6.379989147186279, "global_step": 105880, "epoch": 2520} {"train_loss": -6.446251721609206, "global_step": 105881, "epoch": 2520, "val_loss": 76230.234375} {"train_loss": -6.528621673583984, "global_step": 105882, "epoch": 2521} {"train_loss": -6.435506820678711, "global_step": 105883, "epoch": 2521} {"train_loss": -6.3139543533325195, "global_step": 105884, "epoch": 2521} {"train_loss": -6.4065961837768555, "global_step": 105885, "epoch": 2521} {"train_loss": -6.443155288696289, "global_step": 105886, "epoch": 2521} {"train_loss": -6.513769626617432, "global_step": 105887, "epoch": 2521} {"train_loss": -6.498488903045654, "global_step": 105888, "epoch": 2521} {"train_loss": -6.472135543823242, "global_step": 105889, "epoch": 2521} {"train_loss": -6.476201057434082, "global_step": 105890, "epoch": 2521} {"train_loss": -6.432868003845215, "global_step": 105891, "epoch": 2521} {"train_loss": -6.456064224243164, "global_step": 105892, "epoch": 2521} {"train_loss": -6.538521766662598, "global_step": 105893, "epoch": 2521} {"train_loss": -6.469171524047852, "global_step": 105894, "epoch": 2521} {"train_loss": -6.4003705978393555, "global_step": 105895, "epoch": 2521} {"train_loss": -6.425182342529297, "global_step": 105896, "epoch": 2521} {"train_loss": -6.448493957519531, "global_step": 105897, "epoch": 2521} {"train_loss": -6.376145839691162, "global_step": 105898, "epoch": 2521} {"train_loss": -6.45422887802124, "global_step": 105899, "epoch": 2521} {"train_loss": -6.380072593688965, "global_step": 105900, "epoch": 2521} {"train_loss": -6.445694923400879, "global_step": 105901, "epoch": 2521} {"train_loss": -6.39936637878418, "global_step": 105902, "epoch": 2521} {"train_loss": -6.3663434982299805, "global_step": 105903, "epoch": 2521} {"train_loss": -6.449134826660156, "global_step": 105904, "epoch": 2521} {"train_loss": -6.415975570678711, "global_step": 105905, "epoch": 2521} {"train_loss": -6.380755424499512, "global_step": 105906, "epoch": 2521} {"train_loss": -6.479014873504639, "global_step": 105907, "epoch": 2521} {"train_loss": -6.427181720733643, "global_step": 105908, "epoch": 2521} {"train_loss": -6.298616409301758, "global_step": 105909, "epoch": 2521} {"train_loss": -6.419489860534668, "global_step": 105910, "epoch": 2521} {"train_loss": -6.204919338226318, "global_step": 105911, "epoch": 2521} {"train_loss": -6.392584800720215, "global_step": 105912, "epoch": 2521} {"train_loss": -6.317667007446289, "global_step": 105913, "epoch": 2521} {"train_loss": -6.297367095947266, "global_step": 105914, "epoch": 2521} {"train_loss": -6.241557598114014, "global_step": 105915, "epoch": 2521} {"train_loss": -6.430077075958252, "global_step": 105916, "epoch": 2521} {"train_loss": -6.306290626525879, "global_step": 105917, "epoch": 2521} {"train_loss": -6.484752655029297, "global_step": 105918, "epoch": 2521} {"train_loss": -6.275738716125488, "global_step": 105919, "epoch": 2521} {"train_loss": -6.38153076171875, "global_step": 105920, "epoch": 2521} {"train_loss": -6.364315986633301, "global_step": 105921, "epoch": 2521} {"train_loss": -6.370763778686523, "global_step": 105922, "epoch": 2521} {"train_loss": -6.4039365109943205, "global_step": 105923, "epoch": 2521, "val_loss": 75896.171875} {"train_loss": -6.6105241775512695, "global_step": 105924, "epoch": 2522} {"train_loss": -6.2785210609436035, "global_step": 105925, "epoch": 2522} {"train_loss": -6.402756690979004, "global_step": 105926, "epoch": 2522} {"train_loss": -6.446640968322754, "global_step": 105927, "epoch": 2522} {"train_loss": -6.3350725173950195, "global_step": 105928, "epoch": 2522} {"train_loss": -6.45169734954834, "global_step": 105929, "epoch": 2522} {"train_loss": -6.4585723876953125, "global_step": 105930, "epoch": 2522} {"train_loss": -6.388606071472168, "global_step": 105931, "epoch": 2522} {"train_loss": -6.390617847442627, "global_step": 105932, "epoch": 2522} {"train_loss": -6.4695844650268555, "global_step": 105933, "epoch": 2522} {"train_loss": -6.351222038269043, "global_step": 105934, "epoch": 2522} {"train_loss": -6.267180442810059, "global_step": 105935, "epoch": 2522} {"train_loss": -6.39870548248291, "global_step": 105936, "epoch": 2522} {"train_loss": -6.28602409362793, "global_step": 105937, "epoch": 2522} {"train_loss": -6.364528179168701, "global_step": 105938, "epoch": 2522} {"train_loss": -6.389216423034668, "global_step": 105939, "epoch": 2522} {"train_loss": -6.369868278503418, "global_step": 105940, "epoch": 2522} {"train_loss": -6.369861602783203, "global_step": 105941, "epoch": 2522} {"train_loss": -6.274119853973389, "global_step": 105942, "epoch": 2522} {"train_loss": -6.405009746551514, "global_step": 105943, "epoch": 2522} {"train_loss": -6.245600700378418, "global_step": 105944, "epoch": 2522} {"train_loss": -6.332620620727539, "global_step": 105945, "epoch": 2522} {"train_loss": -6.281550884246826, "global_step": 105946, "epoch": 2522} {"train_loss": -6.435507297515869, "global_step": 105947, "epoch": 2522} {"train_loss": -6.377267837524414, "global_step": 105948, "epoch": 2522} {"train_loss": -6.283970355987549, "global_step": 105949, "epoch": 2522} {"train_loss": -6.387664318084717, "global_step": 105950, "epoch": 2522} {"train_loss": -6.2852463722229, "global_step": 105951, "epoch": 2522} {"train_loss": -6.361089706420898, "global_step": 105952, "epoch": 2522} {"train_loss": -6.388014793395996, "global_step": 105953, "epoch": 2522} {"train_loss": -6.451725959777832, "global_step": 105954, "epoch": 2522} {"train_loss": -6.472713470458984, "global_step": 105955, "epoch": 2522} {"train_loss": -6.487119674682617, "global_step": 105956, "epoch": 2522} {"train_loss": -6.315788269042969, "global_step": 105957, "epoch": 2522} {"train_loss": -6.470274925231934, "global_step": 105958, "epoch": 2522} {"train_loss": -6.3866753578186035, "global_step": 105959, "epoch": 2522} {"train_loss": -6.407637596130371, "global_step": 105960, "epoch": 2522} {"train_loss": -6.348173141479492, "global_step": 105961, "epoch": 2522} {"train_loss": -6.4565935134887695, "global_step": 105962, "epoch": 2522} {"train_loss": -6.4857330322265625, "global_step": 105963, "epoch": 2522} {"train_loss": -6.406846046447754, "global_step": 105964, "epoch": 2522} {"train_loss": -6.38563997404916, "global_step": 105965, "epoch": 2522, "val_loss": 75972.2890625} {"train_loss": -6.494063854217529, "global_step": 105966, "epoch": 2523} {"train_loss": -6.409627914428711, "global_step": 105967, "epoch": 2523} {"train_loss": -6.382843494415283, "global_step": 105968, "epoch": 2523} {"train_loss": -6.408559799194336, "global_step": 105969, "epoch": 2523} {"train_loss": -6.4683942794799805, "global_step": 105970, "epoch": 2523} {"train_loss": -6.48975944519043, "global_step": 105971, "epoch": 2523} {"train_loss": -6.326503276824951, "global_step": 105972, "epoch": 2523} {"train_loss": -6.502504825592041, "global_step": 105973, "epoch": 2523} {"train_loss": -6.417299270629883, "global_step": 105974, "epoch": 2523} {"train_loss": -6.436596870422363, "global_step": 105975, "epoch": 2523} {"train_loss": -6.3688249588012695, "global_step": 105976, "epoch": 2523} {"train_loss": -6.475214004516602, "global_step": 105977, "epoch": 2523} {"train_loss": -6.420509338378906, "global_step": 105978, "epoch": 2523} {"train_loss": -6.374946594238281, "global_step": 105979, "epoch": 2523} {"train_loss": -6.526636123657227, "global_step": 105980, "epoch": 2523} {"train_loss": -6.3509931564331055, "global_step": 105981, "epoch": 2523} {"train_loss": -6.330429553985596, "global_step": 105982, "epoch": 2523} {"train_loss": -6.364452838897705, "global_step": 105983, "epoch": 2523} {"train_loss": -6.213420867919922, "global_step": 105984, "epoch": 2523} {"train_loss": -6.484626293182373, "global_step": 105985, "epoch": 2523} {"train_loss": -6.367722511291504, "global_step": 105986, "epoch": 2523} {"train_loss": -6.348763942718506, "global_step": 105987, "epoch": 2523} {"train_loss": -6.398249626159668, "global_step": 105988, "epoch": 2523} {"train_loss": -6.409359455108643, "global_step": 105989, "epoch": 2523} {"train_loss": -6.458260536193848, "global_step": 105990, "epoch": 2523} {"train_loss": -6.467733860015869, "global_step": 105991, "epoch": 2523} {"train_loss": -6.384127616882324, "global_step": 105992, "epoch": 2523} {"train_loss": -6.498362064361572, "global_step": 105993, "epoch": 2523} {"train_loss": -6.346787929534912, "global_step": 105994, "epoch": 2523} {"train_loss": -6.427430152893066, "global_step": 105995, "epoch": 2523} {"train_loss": -6.450172424316406, "global_step": 105996, "epoch": 2523} {"train_loss": -6.362579822540283, "global_step": 105997, "epoch": 2523} {"train_loss": -6.323439121246338, "global_step": 105998, "epoch": 2523} {"train_loss": -6.3978800773620605, "global_step": 105999, "epoch": 2523} {"train_loss": -6.571396827697754, "global_step": 106000, "epoch": 2523} {"train_loss": -6.443589210510254, "global_step": 106001, "epoch": 2523} {"train_loss": -6.448834419250488, "global_step": 106002, "epoch": 2523} {"train_loss": -6.483212471008301, "global_step": 106003, "epoch": 2523} {"train_loss": -6.381022930145264, "global_step": 106004, "epoch": 2523} {"train_loss": -6.340211868286133, "global_step": 106005, "epoch": 2523} {"train_loss": -6.553050994873047, "global_step": 106006, "epoch": 2523} {"train_loss": -6.418911525181362, "global_step": 106007, "epoch": 2523, "val_loss": 75997.515625} {"train_loss": -6.5122785568237305, "global_step": 106008, "epoch": 2524} {"train_loss": -6.535423278808594, "global_step": 106009, "epoch": 2524} {"train_loss": -6.429327487945557, "global_step": 106010, "epoch": 2524} {"train_loss": -6.5200395584106445, "global_step": 106011, "epoch": 2524} {"train_loss": -6.552328109741211, "global_step": 106012, "epoch": 2524} {"train_loss": -6.5573577880859375, "global_step": 106013, "epoch": 2524} {"train_loss": -6.482106685638428, "global_step": 106014, "epoch": 2524} {"train_loss": -6.526307582855225, "global_step": 106015, "epoch": 2524} {"train_loss": -6.392977714538574, "global_step": 106016, "epoch": 2524} {"train_loss": -6.399716377258301, "global_step": 106017, "epoch": 2524} {"train_loss": -6.473049163818359, "global_step": 106018, "epoch": 2524} {"train_loss": -6.437624931335449, "global_step": 106019, "epoch": 2524} {"train_loss": -6.562651634216309, "global_step": 106020, "epoch": 2524} {"train_loss": -6.485846519470215, "global_step": 106021, "epoch": 2524} {"train_loss": -6.4090423583984375, "global_step": 106022, "epoch": 2524} {"train_loss": -6.367498397827148, "global_step": 106023, "epoch": 2524} {"train_loss": -6.540736198425293, "global_step": 106024, "epoch": 2524} {"train_loss": -6.495128631591797, "global_step": 106025, "epoch": 2524} {"train_loss": -6.34395170211792, "global_step": 106026, "epoch": 2524} {"train_loss": -6.4243574142456055, "global_step": 106027, "epoch": 2524} {"train_loss": -6.443971157073975, "global_step": 106028, "epoch": 2524} {"train_loss": -6.569660186767578, "global_step": 106029, "epoch": 2524} {"train_loss": -6.34201717376709, "global_step": 106030, "epoch": 2524} {"train_loss": -6.470793724060059, "global_step": 106031, "epoch": 2524} {"train_loss": -6.317356109619141, "global_step": 106032, "epoch": 2524} {"train_loss": -6.432373523712158, "global_step": 106033, "epoch": 2524} {"train_loss": -6.470571517944336, "global_step": 106034, "epoch": 2524} {"train_loss": -6.338964462280273, "global_step": 106035, "epoch": 2524} {"train_loss": -6.381908893585205, "global_step": 106036, "epoch": 2524} {"train_loss": -6.304391384124756, "global_step": 106037, "epoch": 2524} {"train_loss": -6.363966941833496, "global_step": 106038, "epoch": 2524} {"train_loss": -6.393062591552734, "global_step": 106039, "epoch": 2524} {"train_loss": -6.410029411315918, "global_step": 106040, "epoch": 2524} {"train_loss": -6.177925109863281, "global_step": 106041, "epoch": 2524} {"train_loss": -6.388942241668701, "global_step": 106042, "epoch": 2524} {"train_loss": -6.417713642120361, "global_step": 106043, "epoch": 2524} {"train_loss": -6.336041450500488, "global_step": 106044, "epoch": 2524} {"train_loss": -6.285625457763672, "global_step": 106045, "epoch": 2524} {"train_loss": -6.403444766998291, "global_step": 106046, "epoch": 2524} {"train_loss": -6.368130207061768, "global_step": 106047, "epoch": 2524} {"train_loss": -6.214280128479004, "global_step": 106048, "epoch": 2524} {"train_loss": -6.4203794456663585, "global_step": 106049, "epoch": 2524, "val_loss": 76229.015625} {"train_loss": -6.341764450073242, "global_step": 106050, "epoch": 2525} {"train_loss": -6.321566581726074, "global_step": 106051, "epoch": 2525} {"train_loss": -6.3764729499816895, "global_step": 106052, "epoch": 2525} {"train_loss": -6.288549423217773, "global_step": 106053, "epoch": 2525} {"train_loss": -6.496424674987793, "global_step": 106054, "epoch": 2525} {"train_loss": -6.282227039337158, "global_step": 106055, "epoch": 2525} {"train_loss": -6.318291664123535, "global_step": 106056, "epoch": 2525} {"train_loss": -6.410312652587891, "global_step": 106057, "epoch": 2525} {"train_loss": -6.323050498962402, "global_step": 106058, "epoch": 2525} {"train_loss": -6.357003211975098, "global_step": 106059, "epoch": 2525} {"train_loss": -6.3575921058654785, "global_step": 106060, "epoch": 2525} {"train_loss": -6.265668869018555, "global_step": 106061, "epoch": 2525} {"train_loss": -6.361865043640137, "global_step": 106062, "epoch": 2525} {"train_loss": -6.387951850891113, "global_step": 106063, "epoch": 2525} {"train_loss": -6.321324348449707, "global_step": 106064, "epoch": 2525} {"train_loss": -6.250217437744141, "global_step": 106065, "epoch": 2525} {"train_loss": -6.473890781402588, "global_step": 106066, "epoch": 2525} {"train_loss": -6.417168617248535, "global_step": 106067, "epoch": 2525} {"train_loss": -6.425789833068848, "global_step": 106068, "epoch": 2525} {"train_loss": -6.636654376983643, "global_step": 106069, "epoch": 2525} {"train_loss": -6.4334917068481445, "global_step": 106070, "epoch": 2525} {"train_loss": -6.322896957397461, "global_step": 106071, "epoch": 2525} {"train_loss": -6.486323833465576, "global_step": 106072, "epoch": 2525} {"train_loss": -6.3416643142700195, "global_step": 106073, "epoch": 2525} {"train_loss": -6.485222816467285, "global_step": 106074, "epoch": 2525} {"train_loss": -6.441952705383301, "global_step": 106075, "epoch": 2525} {"train_loss": -6.433911323547363, "global_step": 106076, "epoch": 2525} {"train_loss": -6.308135032653809, "global_step": 106077, "epoch": 2525} {"train_loss": -6.319815635681152, "global_step": 106078, "epoch": 2525} {"train_loss": -6.412041187286377, "global_step": 106079, "epoch": 2525} {"train_loss": -6.398194789886475, "global_step": 106080, "epoch": 2525} {"train_loss": -6.468039512634277, "global_step": 106081, "epoch": 2525} {"train_loss": -6.327272415161133, "global_step": 106082, "epoch": 2525} {"train_loss": -6.313041687011719, "global_step": 106083, "epoch": 2525} {"train_loss": -6.486710548400879, "global_step": 106084, "epoch": 2525} {"train_loss": -6.444169521331787, "global_step": 106085, "epoch": 2525} {"train_loss": -6.494889259338379, "global_step": 106086, "epoch": 2525} {"train_loss": -6.363191604614258, "global_step": 106087, "epoch": 2525} {"train_loss": -6.341145038604736, "global_step": 106088, "epoch": 2525} {"train_loss": -6.438050746917725, "global_step": 106089, "epoch": 2525} {"train_loss": -6.391414642333984, "global_step": 106090, "epoch": 2525} {"train_loss": -6.390439158394223, "global_step": 106091, "epoch": 2525, "val_loss": 76101.890625} {"train_loss": -6.481316089630127, "global_step": 106092, "epoch": 2526} {"train_loss": -6.509402275085449, "global_step": 106093, "epoch": 2526} {"train_loss": -6.43846321105957, "global_step": 106094, "epoch": 2526} {"train_loss": -6.485735893249512, "global_step": 106095, "epoch": 2526} {"train_loss": -6.296947956085205, "global_step": 106096, "epoch": 2526} {"train_loss": -6.417577743530273, "global_step": 106097, "epoch": 2526} {"train_loss": -6.507824420928955, "global_step": 106098, "epoch": 2526} {"train_loss": -6.377155303955078, "global_step": 106099, "epoch": 2526} {"train_loss": -6.2902703285217285, "global_step": 106100, "epoch": 2526} {"train_loss": -6.363402366638184, "global_step": 106101, "epoch": 2526} {"train_loss": -6.347133636474609, "global_step": 106102, "epoch": 2526} {"train_loss": -6.502214431762695, "global_step": 106103, "epoch": 2526} {"train_loss": -6.17215633392334, "global_step": 106104, "epoch": 2526} {"train_loss": -6.330339431762695, "global_step": 106105, "epoch": 2526} {"train_loss": -6.276914596557617, "global_step": 106106, "epoch": 2526} {"train_loss": -6.349684238433838, "global_step": 106107, "epoch": 2526} {"train_loss": -6.365251064300537, "global_step": 106108, "epoch": 2526} {"train_loss": -6.37353515625, "global_step": 106109, "epoch": 2526} {"train_loss": -6.451307773590088, "global_step": 106110, "epoch": 2526} {"train_loss": -6.284658432006836, "global_step": 106111, "epoch": 2526} {"train_loss": -6.541350364685059, "global_step": 106112, "epoch": 2526} {"train_loss": -6.4331769943237305, "global_step": 106113, "epoch": 2526} {"train_loss": -6.405638694763184, "global_step": 106114, "epoch": 2526} {"train_loss": -6.403818130493164, "global_step": 106115, "epoch": 2526} {"train_loss": -6.347597122192383, "global_step": 106116, "epoch": 2526} {"train_loss": -6.3826117515563965, "global_step": 106117, "epoch": 2526} {"train_loss": -6.441224575042725, "global_step": 106118, "epoch": 2526} {"train_loss": -6.564043998718262, "global_step": 106119, "epoch": 2526} {"train_loss": -6.389360427856445, "global_step": 106120, "epoch": 2526} {"train_loss": -6.481672286987305, "global_step": 106121, "epoch": 2526} {"train_loss": -6.398110389709473, "global_step": 106122, "epoch": 2526} {"train_loss": -6.365847110748291, "global_step": 106123, "epoch": 2526} {"train_loss": -6.494672775268555, "global_step": 106124, "epoch": 2526} {"train_loss": -6.398152828216553, "global_step": 106125, "epoch": 2526} {"train_loss": -6.3562703132629395, "global_step": 106126, "epoch": 2526} {"train_loss": -6.461729049682617, "global_step": 106127, "epoch": 2526} {"train_loss": -6.401592254638672, "global_step": 106128, "epoch": 2526} {"train_loss": -6.444029808044434, "global_step": 106129, "epoch": 2526} {"train_loss": -6.443257808685303, "global_step": 106130, "epoch": 2526} {"train_loss": -6.491055965423584, "global_step": 106131, "epoch": 2526} {"train_loss": -6.380640983581543, "global_step": 106132, "epoch": 2526} {"train_loss": -6.406487147013347, "global_step": 106133, "epoch": 2526, "val_loss": 76185.6640625} {"train_loss": -6.486600875854492, "global_step": 106134, "epoch": 2527} {"train_loss": -6.493204593658447, "global_step": 106135, "epoch": 2527} {"train_loss": -6.475811958312988, "global_step": 106136, "epoch": 2527} {"train_loss": -6.38780403137207, "global_step": 106137, "epoch": 2527} {"train_loss": -6.479619979858398, "global_step": 106138, "epoch": 2527} {"train_loss": -6.487268447875977, "global_step": 106139, "epoch": 2527} {"train_loss": -6.4653801918029785, "global_step": 106140, "epoch": 2527} {"train_loss": -6.346642971038818, "global_step": 106141, "epoch": 2527} {"train_loss": -6.418962478637695, "global_step": 106142, "epoch": 2527} {"train_loss": -6.2845330238342285, "global_step": 106143, "epoch": 2527} {"train_loss": -6.3595380783081055, "global_step": 106144, "epoch": 2527} {"train_loss": -6.286262512207031, "global_step": 106145, "epoch": 2527} {"train_loss": -6.353768825531006, "global_step": 106146, "epoch": 2527} {"train_loss": -6.349817276000977, "global_step": 106147, "epoch": 2527} {"train_loss": -6.450576305389404, "global_step": 106148, "epoch": 2527} {"train_loss": -6.153412342071533, "global_step": 106149, "epoch": 2527} {"train_loss": -6.265329360961914, "global_step": 106150, "epoch": 2527} {"train_loss": -6.284607887268066, "global_step": 106151, "epoch": 2527} {"train_loss": -6.201657295227051, "global_step": 106152, "epoch": 2527} {"train_loss": -6.246561050415039, "global_step": 106153, "epoch": 2527} {"train_loss": -6.191866874694824, "global_step": 106154, "epoch": 2527} {"train_loss": -6.303177833557129, "global_step": 106155, "epoch": 2527} {"train_loss": -6.3268818855285645, "global_step": 106156, "epoch": 2527} {"train_loss": -6.371326446533203, "global_step": 106157, "epoch": 2527} {"train_loss": -6.311408519744873, "global_step": 106158, "epoch": 2527} {"train_loss": -6.389545440673828, "global_step": 106159, "epoch": 2527} {"train_loss": -6.357820987701416, "global_step": 106160, "epoch": 2527} {"train_loss": -6.3919172286987305, "global_step": 106161, "epoch": 2527} {"train_loss": -6.370784282684326, "global_step": 106162, "epoch": 2527} {"train_loss": -6.508831977844238, "global_step": 106163, "epoch": 2527} {"train_loss": -6.431550025939941, "global_step": 106164, "epoch": 2527} {"train_loss": -6.362580299377441, "global_step": 106165, "epoch": 2527} {"train_loss": -6.392861366271973, "global_step": 106166, "epoch": 2527} {"train_loss": -6.4111328125, "global_step": 106167, "epoch": 2527} {"train_loss": -6.443251609802246, "global_step": 106168, "epoch": 2527} {"train_loss": -6.4249267578125, "global_step": 106169, "epoch": 2527} {"train_loss": -6.380105018615723, "global_step": 106170, "epoch": 2527} {"train_loss": -6.466279983520508, "global_step": 106171, "epoch": 2527} {"train_loss": -6.411821365356445, "global_step": 106172, "epoch": 2527} {"train_loss": -6.565288543701172, "global_step": 106173, "epoch": 2527} {"train_loss": -6.358918190002441, "global_step": 106174, "epoch": 2527} {"train_loss": -6.37747293426877, "global_step": 106175, "epoch": 2527, "val_loss": 75922.625} {"train_loss": -6.522385597229004, "global_step": 106176, "epoch": 2528} {"train_loss": -6.474175930023193, "global_step": 106177, "epoch": 2528} {"train_loss": -6.421980857849121, "global_step": 106178, "epoch": 2528} {"train_loss": -6.432785987854004, "global_step": 106179, "epoch": 2528} {"train_loss": -6.457298278808594, "global_step": 106180, "epoch": 2528} {"train_loss": -6.484841823577881, "global_step": 106181, "epoch": 2528} {"train_loss": -6.368253707885742, "global_step": 106182, "epoch": 2528} {"train_loss": -6.459912300109863, "global_step": 106183, "epoch": 2528} {"train_loss": -6.348937511444092, "global_step": 106184, "epoch": 2528} {"train_loss": -6.364921569824219, "global_step": 106185, "epoch": 2528} {"train_loss": -6.438556671142578, "global_step": 106186, "epoch": 2528} {"train_loss": -6.363231182098389, "global_step": 106187, "epoch": 2528} {"train_loss": -6.421075344085693, "global_step": 106188, "epoch": 2528} {"train_loss": -6.501668453216553, "global_step": 106189, "epoch": 2528} {"train_loss": -6.446206092834473, "global_step": 106190, "epoch": 2528} {"train_loss": -6.463292121887207, "global_step": 106191, "epoch": 2528} {"train_loss": -6.424577236175537, "global_step": 106192, "epoch": 2528} {"train_loss": -6.428377628326416, "global_step": 106193, "epoch": 2528} {"train_loss": -6.502806663513184, "global_step": 106194, "epoch": 2528} {"train_loss": -6.499666213989258, "global_step": 106195, "epoch": 2528} {"train_loss": -6.391240119934082, "global_step": 106196, "epoch": 2528} {"train_loss": -6.475193023681641, "global_step": 106197, "epoch": 2528} {"train_loss": -6.4518961906433105, "global_step": 106198, "epoch": 2528} {"train_loss": -6.6128740310668945, "global_step": 106199, "epoch": 2528} {"train_loss": -6.287248611450195, "global_step": 106200, "epoch": 2528} {"train_loss": -6.358620643615723, "global_step": 106201, "epoch": 2528} {"train_loss": -6.32708740234375, "global_step": 106202, "epoch": 2528} {"train_loss": -6.390690326690674, "global_step": 106203, "epoch": 2528} {"train_loss": -6.298255920410156, "global_step": 106204, "epoch": 2528} {"train_loss": -6.362740516662598, "global_step": 106205, "epoch": 2528} {"train_loss": -6.258179664611816, "global_step": 106206, "epoch": 2528} {"train_loss": -6.394298553466797, "global_step": 106207, "epoch": 2528} {"train_loss": -6.472492218017578, "global_step": 106208, "epoch": 2528} {"train_loss": -6.341440200805664, "global_step": 106209, "epoch": 2528} {"train_loss": -6.223686218261719, "global_step": 106210, "epoch": 2528} {"train_loss": -6.3786091804504395, "global_step": 106211, "epoch": 2528} {"train_loss": -6.315375328063965, "global_step": 106212, "epoch": 2528} {"train_loss": -6.45363712310791, "global_step": 106213, "epoch": 2528} {"train_loss": -6.130851745605469, "global_step": 106214, "epoch": 2528} {"train_loss": -6.321323394775391, "global_step": 106215, "epoch": 2528} {"train_loss": -6.29366397857666, "global_step": 106216, "epoch": 2528} {"train_loss": -6.398366065252395, "global_step": 106217, "epoch": 2528, "val_loss": 76447.2421875} {"train_loss": -6.359657287597656, "global_step": 106218, "epoch": 2529} {"train_loss": -6.2954912185668945, "global_step": 106219, "epoch": 2529} {"train_loss": -6.308055400848389, "global_step": 106220, "epoch": 2529} {"train_loss": -6.368859767913818, "global_step": 106221, "epoch": 2529} {"train_loss": -6.394753456115723, "global_step": 106222, "epoch": 2529} {"train_loss": -6.385373115539551, "global_step": 106223, "epoch": 2529} {"train_loss": -6.3023176193237305, "global_step": 106224, "epoch": 2529} {"train_loss": -6.355947971343994, "global_step": 106225, "epoch": 2529} {"train_loss": -6.386857032775879, "global_step": 106226, "epoch": 2529} {"train_loss": -6.354300022125244, "global_step": 106227, "epoch": 2529} {"train_loss": -6.408076286315918, "global_step": 106228, "epoch": 2529} {"train_loss": -6.442829132080078, "global_step": 106229, "epoch": 2529} {"train_loss": -6.3193254470825195, "global_step": 106230, "epoch": 2529} {"train_loss": -6.233511447906494, "global_step": 106231, "epoch": 2529} {"train_loss": -6.410132884979248, "global_step": 106232, "epoch": 2529} {"train_loss": -6.440067291259766, "global_step": 106233, "epoch": 2529} {"train_loss": -6.4838972091674805, "global_step": 106234, "epoch": 2529} {"train_loss": -6.522323131561279, "global_step": 106235, "epoch": 2529} {"train_loss": -6.45884895324707, "global_step": 106236, "epoch": 2529} {"train_loss": -6.328333854675293, "global_step": 106237, "epoch": 2529} {"train_loss": -6.415985107421875, "global_step": 106238, "epoch": 2529} {"train_loss": -6.543932914733887, "global_step": 106239, "epoch": 2529} {"train_loss": -6.417891502380371, "global_step": 106240, "epoch": 2529} {"train_loss": -6.4841814041137695, "global_step": 106241, "epoch": 2529} {"train_loss": -6.395401954650879, "global_step": 106242, "epoch": 2529} {"train_loss": -6.487161636352539, "global_step": 106243, "epoch": 2529} {"train_loss": -6.368168830871582, "global_step": 106244, "epoch": 2529} {"train_loss": -6.3668742179870605, "global_step": 106245, "epoch": 2529} {"train_loss": -6.412965297698975, "global_step": 106246, "epoch": 2529} {"train_loss": -6.426936149597168, "global_step": 106247, "epoch": 2529} {"train_loss": -6.440203666687012, "global_step": 106248, "epoch": 2529} {"train_loss": -6.500409126281738, "global_step": 106249, "epoch": 2529} {"train_loss": -6.4801812171936035, "global_step": 106250, "epoch": 2529} {"train_loss": -6.362277507781982, "global_step": 106251, "epoch": 2529} {"train_loss": -6.352635383605957, "global_step": 106252, "epoch": 2529} {"train_loss": -6.356558799743652, "global_step": 106253, "epoch": 2529} {"train_loss": -6.38490629196167, "global_step": 106254, "epoch": 2529} {"train_loss": -6.44553279876709, "global_step": 106255, "epoch": 2529} {"train_loss": -6.349540710449219, "global_step": 106256, "epoch": 2529} {"train_loss": -6.479609489440918, "global_step": 106257, "epoch": 2529} {"train_loss": -6.531907081604004, "global_step": 106258, "epoch": 2529} {"train_loss": -6.403878189268566, "global_step": 106259, "epoch": 2529, "val_loss": 76211.2578125} {"train_loss": -6.407961845397949, "global_step": 106260, "epoch": 2530} {"train_loss": -6.382254600524902, "global_step": 106261, "epoch": 2530} {"train_loss": -6.36582088470459, "global_step": 106262, "epoch": 2530} {"train_loss": -6.350320339202881, "global_step": 106263, "epoch": 2530} {"train_loss": -6.424110412597656, "global_step": 106264, "epoch": 2530} {"train_loss": -6.413942337036133, "global_step": 106265, "epoch": 2530} {"train_loss": -6.424753189086914, "global_step": 106266, "epoch": 2530} {"train_loss": -6.402005195617676, "global_step": 106267, "epoch": 2530} {"train_loss": -6.43356466293335, "global_step": 106268, "epoch": 2530} {"train_loss": -6.503273963928223, "global_step": 106269, "epoch": 2530} {"train_loss": -6.458469390869141, "global_step": 106270, "epoch": 2530} {"train_loss": -6.480541706085205, "global_step": 106271, "epoch": 2530} {"train_loss": -6.254330635070801, "global_step": 106272, "epoch": 2530} {"train_loss": -6.446835041046143, "global_step": 106273, "epoch": 2530} {"train_loss": -6.367240905761719, "global_step": 106274, "epoch": 2530} {"train_loss": -6.442021369934082, "global_step": 106275, "epoch": 2530} {"train_loss": -6.539830684661865, "global_step": 106276, "epoch": 2530} {"train_loss": -6.511415004730225, "global_step": 106277, "epoch": 2530} {"train_loss": -6.415250778198242, "global_step": 106278, "epoch": 2530} {"train_loss": -6.388428688049316, "global_step": 106279, "epoch": 2530} {"train_loss": -6.338351249694824, "global_step": 106280, "epoch": 2530} {"train_loss": -6.491127967834473, "global_step": 106281, "epoch": 2530} {"train_loss": -6.494565963745117, "global_step": 106282, "epoch": 2530} {"train_loss": -6.425991058349609, "global_step": 106283, "epoch": 2530} {"train_loss": -6.488282203674316, "global_step": 106284, "epoch": 2530} {"train_loss": -6.445173263549805, "global_step": 106285, "epoch": 2530} {"train_loss": -6.342848777770996, "global_step": 106286, "epoch": 2530} {"train_loss": -6.496756553649902, "global_step": 106287, "epoch": 2530} {"train_loss": -6.474651336669922, "global_step": 106288, "epoch": 2530} {"train_loss": -6.444924354553223, "global_step": 106289, "epoch": 2530} {"train_loss": -6.416751384735107, "global_step": 106290, "epoch": 2530} {"train_loss": -6.454006195068359, "global_step": 106291, "epoch": 2530} {"train_loss": -6.381397724151611, "global_step": 106292, "epoch": 2530} {"train_loss": -6.386834621429443, "global_step": 106293, "epoch": 2530} {"train_loss": -6.34420919418335, "global_step": 106294, "epoch": 2530} {"train_loss": -6.341039657592773, "global_step": 106295, "epoch": 2530} {"train_loss": -6.346953392028809, "global_step": 106296, "epoch": 2530} {"train_loss": -6.337301254272461, "global_step": 106297, "epoch": 2530} {"train_loss": -6.412670135498047, "global_step": 106298, "epoch": 2530} {"train_loss": -6.526780128479004, "global_step": 106299, "epoch": 2530} {"train_loss": -6.4664459228515625, "global_step": 106300, "epoch": 2530} {"train_loss": -6.422695273444766, "global_step": 106301, "epoch": 2530, "val_loss": 75997.171875} {"train_loss": -6.450970649719238, "global_step": 106302, "epoch": 2531} {"train_loss": -6.521774768829346, "global_step": 106303, "epoch": 2531} {"train_loss": -6.465121269226074, "global_step": 106304, "epoch": 2531} {"train_loss": -6.58442497253418, "global_step": 106305, "epoch": 2531} {"train_loss": -6.595482349395752, "global_step": 106306, "epoch": 2531} {"train_loss": -6.492504596710205, "global_step": 106307, "epoch": 2531} {"train_loss": -6.473949432373047, "global_step": 106308, "epoch": 2531} {"train_loss": -6.360496997833252, "global_step": 106309, "epoch": 2531} {"train_loss": -6.474015235900879, "global_step": 106310, "epoch": 2531} {"train_loss": -6.386025428771973, "global_step": 106311, "epoch": 2531} {"train_loss": -6.453097343444824, "global_step": 106312, "epoch": 2531} {"train_loss": -6.437958717346191, "global_step": 106313, "epoch": 2531} {"train_loss": -6.367015361785889, "global_step": 106314, "epoch": 2531} {"train_loss": -6.359380722045898, "global_step": 106315, "epoch": 2531} {"train_loss": -6.332036972045898, "global_step": 106316, "epoch": 2531} {"train_loss": -6.337814807891846, "global_step": 106317, "epoch": 2531} {"train_loss": -6.379239082336426, "global_step": 106318, "epoch": 2531} {"train_loss": -6.405145645141602, "global_step": 106319, "epoch": 2531} {"train_loss": -6.371079444885254, "global_step": 106320, "epoch": 2531} {"train_loss": -6.471936225891113, "global_step": 106321, "epoch": 2531} {"train_loss": -6.2789201736450195, "global_step": 106322, "epoch": 2531} {"train_loss": -6.296813488006592, "global_step": 106323, "epoch": 2531} {"train_loss": -6.399205684661865, "global_step": 106324, "epoch": 2531} {"train_loss": -6.3016676902771, "global_step": 106325, "epoch": 2531} {"train_loss": -6.405804634094238, "global_step": 106326, "epoch": 2531} {"train_loss": -6.398788928985596, "global_step": 106327, "epoch": 2531} {"train_loss": -6.178308963775635, "global_step": 106328, "epoch": 2531} {"train_loss": -6.398991584777832, "global_step": 106329, "epoch": 2531} {"train_loss": -6.444252014160156, "global_step": 106330, "epoch": 2531} {"train_loss": -6.396068096160889, "global_step": 106331, "epoch": 2531} {"train_loss": -6.5060133934021, "global_step": 106332, "epoch": 2531} {"train_loss": -6.409341812133789, "global_step": 106333, "epoch": 2531} {"train_loss": -6.447873115539551, "global_step": 106334, "epoch": 2531} {"train_loss": -6.413869857788086, "global_step": 106335, "epoch": 2531} {"train_loss": -6.466437339782715, "global_step": 106336, "epoch": 2531} {"train_loss": -6.353300094604492, "global_step": 106337, "epoch": 2531} {"train_loss": -6.499013900756836, "global_step": 106338, "epoch": 2531} {"train_loss": -6.446867942810059, "global_step": 106339, "epoch": 2531} {"train_loss": -6.323969841003418, "global_step": 106340, "epoch": 2531} {"train_loss": -6.421884059906006, "global_step": 106341, "epoch": 2531} {"train_loss": -6.372778415679932, "global_step": 106342, "epoch": 2531} {"train_loss": -6.411208709081014, "global_step": 106343, "epoch": 2531, "val_loss": 75972.3515625} {"train_loss": -6.4644694328308105, "global_step": 106344, "epoch": 2532} {"train_loss": -6.4162163734436035, "global_step": 106345, "epoch": 2532} {"train_loss": -6.539157867431641, "global_step": 106346, "epoch": 2532} {"train_loss": -6.453555107116699, "global_step": 106347, "epoch": 2532} {"train_loss": -6.476061820983887, "global_step": 106348, "epoch": 2532} {"train_loss": -6.465165138244629, "global_step": 106349, "epoch": 2532} {"train_loss": -6.428143501281738, "global_step": 106350, "epoch": 2532} {"train_loss": -6.445728302001953, "global_step": 106351, "epoch": 2532} {"train_loss": -6.4149861335754395, "global_step": 106352, "epoch": 2532} {"train_loss": -6.521688938140869, "global_step": 106353, "epoch": 2532} {"train_loss": -6.479155540466309, "global_step": 106354, "epoch": 2532} {"train_loss": -6.421863555908203, "global_step": 106355, "epoch": 2532} {"train_loss": -6.36988639831543, "global_step": 106356, "epoch": 2532} {"train_loss": -6.47224760055542, "global_step": 106357, "epoch": 2532} {"train_loss": -6.4285407066345215, "global_step": 106358, "epoch": 2532} {"train_loss": -6.4155073165893555, "global_step": 106359, "epoch": 2532} {"train_loss": -6.538139820098877, "global_step": 106360, "epoch": 2532} {"train_loss": -6.490505218505859, "global_step": 106361, "epoch": 2532} {"train_loss": -6.528120040893555, "global_step": 106362, "epoch": 2532} {"train_loss": -6.383798599243164, "global_step": 106363, "epoch": 2532} {"train_loss": -6.367917537689209, "global_step": 106364, "epoch": 2532} {"train_loss": -6.377669334411621, "global_step": 106365, "epoch": 2532} {"train_loss": -6.326310634613037, "global_step": 106366, "epoch": 2532} {"train_loss": -6.436891555786133, "global_step": 106367, "epoch": 2532} {"train_loss": -6.44902229309082, "global_step": 106368, "epoch": 2532} {"train_loss": -6.389820098876953, "global_step": 106369, "epoch": 2532} {"train_loss": -6.393505573272705, "global_step": 106370, "epoch": 2532} {"train_loss": -6.503838539123535, "global_step": 106371, "epoch": 2532} {"train_loss": -6.332128524780273, "global_step": 106372, "epoch": 2532} {"train_loss": -6.31910514831543, "global_step": 106373, "epoch": 2532} {"train_loss": -6.375894546508789, "global_step": 106374, "epoch": 2532} {"train_loss": -6.336129188537598, "global_step": 106375, "epoch": 2532} {"train_loss": -6.409253120422363, "global_step": 106376, "epoch": 2532} {"train_loss": -6.458758354187012, "global_step": 106377, "epoch": 2532} {"train_loss": -6.379528999328613, "global_step": 106378, "epoch": 2532} {"train_loss": -6.453853130340576, "global_step": 106379, "epoch": 2532} {"train_loss": -6.400249004364014, "global_step": 106380, "epoch": 2532} {"train_loss": -6.398177623748779, "global_step": 106381, "epoch": 2532} {"train_loss": -6.4598283767700195, "global_step": 106382, "epoch": 2532} {"train_loss": -6.463770389556885, "global_step": 106383, "epoch": 2532} {"train_loss": -6.4575347900390625, "global_step": 106384, "epoch": 2532} {"train_loss": -6.430964640208653, "global_step": 106385, "epoch": 2532, "val_loss": 76193.9453125} {"train_loss": -6.377123832702637, "global_step": 106386, "epoch": 2533} {"train_loss": -6.398045539855957, "global_step": 106387, "epoch": 2533} {"train_loss": -6.442215442657471, "global_step": 106388, "epoch": 2533} {"train_loss": -6.409034729003906, "global_step": 106389, "epoch": 2533} {"train_loss": -6.287324905395508, "global_step": 106390, "epoch": 2533} {"train_loss": -6.4602203369140625, "global_step": 106391, "epoch": 2533} {"train_loss": -6.238162040710449, "global_step": 106392, "epoch": 2533} {"train_loss": -6.4342474937438965, "global_step": 106393, "epoch": 2533} {"train_loss": -6.2333221435546875, "global_step": 106394, "epoch": 2533} {"train_loss": -6.465296745300293, "global_step": 106395, "epoch": 2533} {"train_loss": -6.431524753570557, "global_step": 106396, "epoch": 2533} {"train_loss": -6.268146514892578, "global_step": 106397, "epoch": 2533} {"train_loss": -6.4104814529418945, "global_step": 106398, "epoch": 2533} {"train_loss": -6.430287837982178, "global_step": 106399, "epoch": 2533} {"train_loss": -6.339018821716309, "global_step": 106400, "epoch": 2533} {"train_loss": -6.438482284545898, "global_step": 106401, "epoch": 2533} {"train_loss": -6.464969158172607, "global_step": 106402, "epoch": 2533} {"train_loss": -6.49886417388916, "global_step": 106403, "epoch": 2533} {"train_loss": -6.425284385681152, "global_step": 106404, "epoch": 2533} {"train_loss": -6.408490180969238, "global_step": 106405, "epoch": 2533} {"train_loss": -6.357292652130127, "global_step": 106406, "epoch": 2533} {"train_loss": -6.412290573120117, "global_step": 106407, "epoch": 2533} {"train_loss": -6.436161518096924, "global_step": 106408, "epoch": 2533} {"train_loss": -6.519107818603516, "global_step": 106409, "epoch": 2533} {"train_loss": -6.429783344268799, "global_step": 106410, "epoch": 2533} {"train_loss": -6.501446723937988, "global_step": 106411, "epoch": 2533} {"train_loss": -6.481264114379883, "global_step": 106412, "epoch": 2533} {"train_loss": -6.534721374511719, "global_step": 106413, "epoch": 2533} {"train_loss": -6.509284973144531, "global_step": 106414, "epoch": 2533} {"train_loss": -6.366457939147949, "global_step": 106415, "epoch": 2533} {"train_loss": -6.363408088684082, "global_step": 106416, "epoch": 2533} {"train_loss": -6.490900039672852, "global_step": 106417, "epoch": 2533} {"train_loss": -6.486550331115723, "global_step": 106418, "epoch": 2533} {"train_loss": -6.4683074951171875, "global_step": 106419, "epoch": 2533} {"train_loss": -6.4402289390563965, "global_step": 106420, "epoch": 2533} {"train_loss": -6.464269161224365, "global_step": 106421, "epoch": 2533} {"train_loss": -6.409518241882324, "global_step": 106422, "epoch": 2533} {"train_loss": -6.486952781677246, "global_step": 106423, "epoch": 2533} {"train_loss": -6.460070610046387, "global_step": 106424, "epoch": 2533} {"train_loss": -6.4206013679504395, "global_step": 106425, "epoch": 2533} {"train_loss": -6.500160217285156, "global_step": 106426, "epoch": 2533} {"train_loss": -6.428284701846895, "global_step": 106427, "epoch": 2533, "val_loss": 76082.2109375} {"train_loss": -6.48444128036499, "global_step": 106428, "epoch": 2534} {"train_loss": -6.4622907638549805, "global_step": 106429, "epoch": 2534} {"train_loss": -6.469931602478027, "global_step": 106430, "epoch": 2534} {"train_loss": -6.426909446716309, "global_step": 106431, "epoch": 2534} {"train_loss": -6.3675031661987305, "global_step": 106432, "epoch": 2534} {"train_loss": -6.38240909576416, "global_step": 106433, "epoch": 2534} {"train_loss": -6.448636054992676, "global_step": 106434, "epoch": 2534} {"train_loss": -6.417896747589111, "global_step": 106435, "epoch": 2534} {"train_loss": -6.432299613952637, "global_step": 106436, "epoch": 2534} {"train_loss": -6.445962905883789, "global_step": 106437, "epoch": 2534} {"train_loss": -6.418175220489502, "global_step": 106438, "epoch": 2534} {"train_loss": -6.432162284851074, "global_step": 106439, "epoch": 2534} {"train_loss": -6.424575328826904, "global_step": 106440, "epoch": 2534} {"train_loss": -6.453664302825928, "global_step": 106441, "epoch": 2534} {"train_loss": -6.295600891113281, "global_step": 106442, "epoch": 2534} {"train_loss": -6.403763771057129, "global_step": 106443, "epoch": 2534} {"train_loss": -6.385822296142578, "global_step": 106444, "epoch": 2534} {"train_loss": -6.444199562072754, "global_step": 106445, "epoch": 2534} {"train_loss": -6.254382133483887, "global_step": 106446, "epoch": 2534} {"train_loss": -6.33062744140625, "global_step": 106447, "epoch": 2534} {"train_loss": -6.329084873199463, "global_step": 106448, "epoch": 2534} {"train_loss": -6.303633213043213, "global_step": 106449, "epoch": 2534} {"train_loss": -6.340639114379883, "global_step": 106450, "epoch": 2534} {"train_loss": -6.467815399169922, "global_step": 106451, "epoch": 2534} {"train_loss": -6.402024269104004, "global_step": 106452, "epoch": 2534} {"train_loss": -6.274878978729248, "global_step": 106453, "epoch": 2534} {"train_loss": -6.371866226196289, "global_step": 106454, "epoch": 2534} {"train_loss": -6.3164472579956055, "global_step": 106455, "epoch": 2534} {"train_loss": -6.239002227783203, "global_step": 106456, "epoch": 2534} {"train_loss": -6.348323822021484, "global_step": 106457, "epoch": 2534} {"train_loss": -6.2233734130859375, "global_step": 106458, "epoch": 2534} {"train_loss": -6.374664306640625, "global_step": 106459, "epoch": 2534} {"train_loss": -6.208785057067871, "global_step": 106460, "epoch": 2534} {"train_loss": -6.42487096786499, "global_step": 106461, "epoch": 2534} {"train_loss": -6.442198753356934, "global_step": 106462, "epoch": 2534} {"train_loss": -6.247958183288574, "global_step": 106463, "epoch": 2534} {"train_loss": -6.498035430908203, "global_step": 106464, "epoch": 2534} {"train_loss": -6.325193405151367, "global_step": 106465, "epoch": 2534} {"train_loss": -6.441822052001953, "global_step": 106466, "epoch": 2534} {"train_loss": -6.349849224090576, "global_step": 106467, "epoch": 2534} {"train_loss": -6.332559585571289, "global_step": 106468, "epoch": 2534} {"train_loss": -6.378655047643752, "global_step": 106469, "epoch": 2534, "val_loss": 76003.21875} {"train_loss": -6.4584856033325195, "global_step": 106470, "epoch": 2535} {"train_loss": -6.368369102478027, "global_step": 106471, "epoch": 2535} {"train_loss": -6.345417499542236, "global_step": 106472, "epoch": 2535} {"train_loss": -6.430116653442383, "global_step": 106473, "epoch": 2535} {"train_loss": -6.416990756988525, "global_step": 106474, "epoch": 2535} {"train_loss": -6.352603912353516, "global_step": 106475, "epoch": 2535} {"train_loss": -6.386833190917969, "global_step": 106476, "epoch": 2535} {"train_loss": -6.370965003967285, "global_step": 106477, "epoch": 2535} {"train_loss": -6.384396076202393, "global_step": 106478, "epoch": 2535} {"train_loss": -6.473761081695557, "global_step": 106479, "epoch": 2535} {"train_loss": -6.575770378112793, "global_step": 106480, "epoch": 2535} {"train_loss": -6.540748596191406, "global_step": 106481, "epoch": 2535} {"train_loss": -6.3661956787109375, "global_step": 106482, "epoch": 2535} {"train_loss": -6.442131519317627, "global_step": 106483, "epoch": 2535} {"train_loss": -6.383975982666016, "global_step": 106484, "epoch": 2535} {"train_loss": -6.578830718994141, "global_step": 106485, "epoch": 2535} {"train_loss": -6.456190586090088, "global_step": 106486, "epoch": 2535} {"train_loss": -6.425045967102051, "global_step": 106487, "epoch": 2535} {"train_loss": -6.463829040527344, "global_step": 106488, "epoch": 2535} {"train_loss": -6.480892181396484, "global_step": 106489, "epoch": 2535} {"train_loss": -6.475819110870361, "global_step": 106490, "epoch": 2535} {"train_loss": -6.352702617645264, "global_step": 106491, "epoch": 2535} {"train_loss": -6.314233779907227, "global_step": 106492, "epoch": 2535} {"train_loss": -6.532419204711914, "global_step": 106493, "epoch": 2535} {"train_loss": -6.4328837394714355, "global_step": 106494, "epoch": 2535} {"train_loss": -6.47499942779541, "global_step": 106495, "epoch": 2535} {"train_loss": -6.532897472381592, "global_step": 106496, "epoch": 2535} {"train_loss": -6.473228454589844, "global_step": 106497, "epoch": 2535} {"train_loss": -6.30726432800293, "global_step": 106498, "epoch": 2535} {"train_loss": -6.504745960235596, "global_step": 106499, "epoch": 2535} {"train_loss": -6.459010601043701, "global_step": 106500, "epoch": 2535} {"train_loss": -6.436337471008301, "global_step": 106501, "epoch": 2535} {"train_loss": -6.393810272216797, "global_step": 106502, "epoch": 2535} {"train_loss": -6.43818473815918, "global_step": 106503, "epoch": 2535} {"train_loss": -6.5847063064575195, "global_step": 106504, "epoch": 2535} {"train_loss": -6.384993076324463, "global_step": 106505, "epoch": 2535} {"train_loss": -6.396533966064453, "global_step": 106506, "epoch": 2535} {"train_loss": -6.524165630340576, "global_step": 106507, "epoch": 2535} {"train_loss": -6.361231327056885, "global_step": 106508, "epoch": 2535} {"train_loss": -6.338767051696777, "global_step": 106509, "epoch": 2535} {"train_loss": -6.419256210327148, "global_step": 106510, "epoch": 2535} {"train_loss": -6.434803996767316, "global_step": 106511, "epoch": 2535, "val_loss": 76067.28125} {"train_loss": -6.54209041595459, "global_step": 106512, "epoch": 2536} {"train_loss": -6.3992509841918945, "global_step": 106513, "epoch": 2536} {"train_loss": -6.419468402862549, "global_step": 106514, "epoch": 2536} {"train_loss": -6.432296276092529, "global_step": 106515, "epoch": 2536} {"train_loss": -6.495617866516113, "global_step": 106516, "epoch": 2536} {"train_loss": -6.373529434204102, "global_step": 106517, "epoch": 2536} {"train_loss": -6.48200798034668, "global_step": 106518, "epoch": 2536} {"train_loss": -6.259797096252441, "global_step": 106519, "epoch": 2536} {"train_loss": -6.574241638183594, "global_step": 106520, "epoch": 2536} {"train_loss": -6.50200891494751, "global_step": 106521, "epoch": 2536} {"train_loss": -6.459536552429199, "global_step": 106522, "epoch": 2536} {"train_loss": -6.39455509185791, "global_step": 106523, "epoch": 2536} {"train_loss": -6.4724016189575195, "global_step": 106524, "epoch": 2536} {"train_loss": -6.424527168273926, "global_step": 106525, "epoch": 2536} {"train_loss": -6.4393157958984375, "global_step": 106526, "epoch": 2536} {"train_loss": -6.508094787597656, "global_step": 106527, "epoch": 2536} {"train_loss": -6.434978485107422, "global_step": 106528, "epoch": 2536} {"train_loss": -6.445199966430664, "global_step": 106529, "epoch": 2536} {"train_loss": -6.532281875610352, "global_step": 106530, "epoch": 2536} {"train_loss": -6.394617080688477, "global_step": 106531, "epoch": 2536} {"train_loss": -6.390603542327881, "global_step": 106532, "epoch": 2536} {"train_loss": -6.436327934265137, "global_step": 106533, "epoch": 2536} {"train_loss": -6.480864524841309, "global_step": 106534, "epoch": 2536} {"train_loss": -6.478052616119385, "global_step": 106535, "epoch": 2536} {"train_loss": -6.44963264465332, "global_step": 106536, "epoch": 2536} {"train_loss": -6.437808036804199, "global_step": 106537, "epoch": 2536} {"train_loss": -6.5062103271484375, "global_step": 106538, "epoch": 2536} {"train_loss": -6.3995513916015625, "global_step": 106539, "epoch": 2536} {"train_loss": -6.387698650360107, "global_step": 106540, "epoch": 2536} {"train_loss": -6.375543594360352, "global_step": 106541, "epoch": 2536} {"train_loss": -6.521655082702637, "global_step": 106542, "epoch": 2536} {"train_loss": -6.38687801361084, "global_step": 106543, "epoch": 2536} {"train_loss": -6.4332275390625, "global_step": 106544, "epoch": 2536} {"train_loss": -6.508519649505615, "global_step": 106545, "epoch": 2536} {"train_loss": -6.378686904907227, "global_step": 106546, "epoch": 2536} {"train_loss": -6.400946617126465, "global_step": 106547, "epoch": 2536} {"train_loss": -6.438663959503174, "global_step": 106548, "epoch": 2536} {"train_loss": -6.425522327423096, "global_step": 106549, "epoch": 2536} {"train_loss": -6.429816246032715, "global_step": 106550, "epoch": 2536} {"train_loss": -6.3950395584106445, "global_step": 106551, "epoch": 2536} {"train_loss": -6.360029220581055, "global_step": 106552, "epoch": 2536} {"train_loss": -6.440033696946644, "global_step": 106553, "epoch": 2536, "val_loss": 75945.03125} {"train_loss": -6.289055824279785, "global_step": 106554, "epoch": 2537} {"train_loss": -6.290136814117432, "global_step": 106555, "epoch": 2537} {"train_loss": -6.406609535217285, "global_step": 106556, "epoch": 2537} {"train_loss": -6.402635097503662, "global_step": 106557, "epoch": 2537} {"train_loss": -6.428034782409668, "global_step": 106558, "epoch": 2537} {"train_loss": -6.285652160644531, "global_step": 106559, "epoch": 2537} {"train_loss": -6.354961395263672, "global_step": 106560, "epoch": 2537} {"train_loss": -6.35531759262085, "global_step": 106561, "epoch": 2537} {"train_loss": -6.253194808959961, "global_step": 106562, "epoch": 2537} {"train_loss": -6.48861026763916, "global_step": 106563, "epoch": 2537} {"train_loss": -6.306797504425049, "global_step": 106564, "epoch": 2537} {"train_loss": -6.420953273773193, "global_step": 106565, "epoch": 2537} {"train_loss": -6.381160736083984, "global_step": 106566, "epoch": 2537} {"train_loss": -6.529596328735352, "global_step": 106567, "epoch": 2537} {"train_loss": -6.370716094970703, "global_step": 106568, "epoch": 2537} {"train_loss": -6.348114490509033, "global_step": 106569, "epoch": 2537} {"train_loss": -6.57382869720459, "global_step": 106570, "epoch": 2537} {"train_loss": -6.295788764953613, "global_step": 106571, "epoch": 2537} {"train_loss": -6.3834428787231445, "global_step": 106572, "epoch": 2537} {"train_loss": -6.52803897857666, "global_step": 106573, "epoch": 2537} {"train_loss": -6.3780436515808105, "global_step": 106574, "epoch": 2537} {"train_loss": -6.490795135498047, "global_step": 106575, "epoch": 2537} {"train_loss": -6.399405479431152, "global_step": 106576, "epoch": 2537} {"train_loss": -6.477624893188477, "global_step": 106577, "epoch": 2537} {"train_loss": -6.438837051391602, "global_step": 106578, "epoch": 2537} {"train_loss": -6.487241268157959, "global_step": 106579, "epoch": 2537} {"train_loss": -6.412978172302246, "global_step": 106580, "epoch": 2537} {"train_loss": -6.4613800048828125, "global_step": 106581, "epoch": 2537} {"train_loss": -6.514037132263184, "global_step": 106582, "epoch": 2537} {"train_loss": -6.3976898193359375, "global_step": 106583, "epoch": 2537} {"train_loss": -6.366672515869141, "global_step": 106584, "epoch": 2537} {"train_loss": -6.508026123046875, "global_step": 106585, "epoch": 2537} {"train_loss": -6.3941731452941895, "global_step": 106586, "epoch": 2537} {"train_loss": -6.407955169677734, "global_step": 106587, "epoch": 2537} {"train_loss": -6.562283992767334, "global_step": 106588, "epoch": 2537} {"train_loss": -6.4746880531311035, "global_step": 106589, "epoch": 2537} {"train_loss": -6.3739776611328125, "global_step": 106590, "epoch": 2537} {"train_loss": -6.375101089477539, "global_step": 106591, "epoch": 2537} {"train_loss": -6.330706596374512, "global_step": 106592, "epoch": 2537} {"train_loss": -6.4627532958984375, "global_step": 106593, "epoch": 2537} {"train_loss": -6.3661956787109375, "global_step": 106594, "epoch": 2537} {"train_loss": -6.4056815306345625, "global_step": 106595, "epoch": 2537, "val_loss": 76275.359375} {"train_loss": -6.381083965301514, "global_step": 106596, "epoch": 2538} {"train_loss": -6.456116199493408, "global_step": 106597, "epoch": 2538} {"train_loss": -6.450641632080078, "global_step": 106598, "epoch": 2538} {"train_loss": -6.336972236633301, "global_step": 106599, "epoch": 2538} {"train_loss": -6.468865394592285, "global_step": 106600, "epoch": 2538} {"train_loss": -6.369229793548584, "global_step": 106601, "epoch": 2538} {"train_loss": -6.411343574523926, "global_step": 106602, "epoch": 2538} {"train_loss": -6.348021507263184, "global_step": 106603, "epoch": 2538} {"train_loss": -6.452458381652832, "global_step": 106604, "epoch": 2538} {"train_loss": -6.286053657531738, "global_step": 106605, "epoch": 2538} {"train_loss": -6.376693248748779, "global_step": 106606, "epoch": 2538} {"train_loss": -6.285932540893555, "global_step": 106607, "epoch": 2538} {"train_loss": -6.339109420776367, "global_step": 106608, "epoch": 2538} {"train_loss": -6.419144153594971, "global_step": 106609, "epoch": 2538} {"train_loss": -6.417073726654053, "global_step": 106610, "epoch": 2538} {"train_loss": -6.4069085121154785, "global_step": 106611, "epoch": 2538} {"train_loss": -6.325399398803711, "global_step": 106612, "epoch": 2538} {"train_loss": -6.383804798126221, "global_step": 106613, "epoch": 2538} {"train_loss": -6.337226867675781, "global_step": 106614, "epoch": 2538} {"train_loss": -6.341700553894043, "global_step": 106615, "epoch": 2538} {"train_loss": -6.401893615722656, "global_step": 106616, "epoch": 2538} {"train_loss": -6.240139961242676, "global_step": 106617, "epoch": 2538} {"train_loss": -6.383644104003906, "global_step": 106618, "epoch": 2538} {"train_loss": -6.243468284606934, "global_step": 106619, "epoch": 2538} {"train_loss": -6.286561489105225, "global_step": 106620, "epoch": 2538} {"train_loss": -6.303800582885742, "global_step": 106621, "epoch": 2538} {"train_loss": -6.466217041015625, "global_step": 106622, "epoch": 2538} {"train_loss": -6.433070182800293, "global_step": 106623, "epoch": 2538} {"train_loss": -6.464389324188232, "global_step": 106624, "epoch": 2538} {"train_loss": -6.256827354431152, "global_step": 106625, "epoch": 2538} {"train_loss": -6.440019607543945, "global_step": 106626, "epoch": 2538} {"train_loss": -6.481797218322754, "global_step": 106627, "epoch": 2538} {"train_loss": -6.460172653198242, "global_step": 106628, "epoch": 2538} {"train_loss": -6.429388523101807, "global_step": 106629, "epoch": 2538} {"train_loss": -6.431267261505127, "global_step": 106630, "epoch": 2538} {"train_loss": -6.3784499168396, "global_step": 106631, "epoch": 2538} {"train_loss": -6.393283843994141, "global_step": 106632, "epoch": 2538} {"train_loss": -6.440088272094727, "global_step": 106633, "epoch": 2538} {"train_loss": -6.550123691558838, "global_step": 106634, "epoch": 2538} {"train_loss": -6.386005401611328, "global_step": 106635, "epoch": 2538} {"train_loss": -6.532994270324707, "global_step": 106636, "epoch": 2538} {"train_loss": -6.390610081808908, "global_step": 106637, "epoch": 2538, "val_loss": 75952.78125} {"train_loss": -6.470722198486328, "global_step": 106638, "epoch": 2539} {"train_loss": -6.438187599182129, "global_step": 106639, "epoch": 2539} {"train_loss": -6.493446350097656, "global_step": 106640, "epoch": 2539} {"train_loss": -6.4304890632629395, "global_step": 106641, "epoch": 2539} {"train_loss": -6.380791187286377, "global_step": 106642, "epoch": 2539} {"train_loss": -6.426102161407471, "global_step": 106643, "epoch": 2539} {"train_loss": -6.4581522941589355, "global_step": 106644, "epoch": 2539} {"train_loss": -6.480666637420654, "global_step": 106645, "epoch": 2539} {"train_loss": -6.437643051147461, "global_step": 106646, "epoch": 2539} {"train_loss": -6.439024925231934, "global_step": 106647, "epoch": 2539} {"train_loss": -6.468200206756592, "global_step": 106648, "epoch": 2539} {"train_loss": -6.417148590087891, "global_step": 106649, "epoch": 2539} {"train_loss": -6.474225997924805, "global_step": 106650, "epoch": 2539} {"train_loss": -6.293953895568848, "global_step": 106651, "epoch": 2539} {"train_loss": -6.471572399139404, "global_step": 106652, "epoch": 2539} {"train_loss": -6.457496166229248, "global_step": 106653, "epoch": 2539} {"train_loss": -6.5077972412109375, "global_step": 106654, "epoch": 2539} {"train_loss": -6.3232221603393555, "global_step": 106655, "epoch": 2539} {"train_loss": -6.5585126876831055, "global_step": 106656, "epoch": 2539} {"train_loss": -6.408428192138672, "global_step": 106657, "epoch": 2539} {"train_loss": -6.309516906738281, "global_step": 106658, "epoch": 2539} {"train_loss": -6.424563884735107, "global_step": 106659, "epoch": 2539} {"train_loss": -6.4236931800842285, "global_step": 106660, "epoch": 2539} {"train_loss": -6.319899082183838, "global_step": 106661, "epoch": 2539} {"train_loss": -6.265377521514893, "global_step": 106662, "epoch": 2539} {"train_loss": -6.441866397857666, "global_step": 106663, "epoch": 2539} {"train_loss": -6.353525161743164, "global_step": 106664, "epoch": 2539} {"train_loss": -6.438921928405762, "global_step": 106665, "epoch": 2539} {"train_loss": -6.392779350280762, "global_step": 106666, "epoch": 2539} {"train_loss": -6.372501373291016, "global_step": 106667, "epoch": 2539} {"train_loss": -6.5173845291137695, "global_step": 106668, "epoch": 2539} {"train_loss": -6.416886329650879, "global_step": 106669, "epoch": 2539} {"train_loss": -6.342151641845703, "global_step": 106670, "epoch": 2539} {"train_loss": -6.463929176330566, "global_step": 106671, "epoch": 2539} {"train_loss": -6.3449530601501465, "global_step": 106672, "epoch": 2539} {"train_loss": -6.350253105163574, "global_step": 106673, "epoch": 2539} {"train_loss": -6.4590959548950195, "global_step": 106674, "epoch": 2539} {"train_loss": -6.471673011779785, "global_step": 106675, "epoch": 2539} {"train_loss": -6.517786026000977, "global_step": 106676, "epoch": 2539} {"train_loss": -6.348962783813477, "global_step": 106677, "epoch": 2539} {"train_loss": -6.374264240264893, "global_step": 106678, "epoch": 2539} {"train_loss": -6.420004208882649, "global_step": 106679, "epoch": 2539, "val_loss": 75999.203125} {"train_loss": -6.405326843261719, "global_step": 106680, "epoch": 2540} {"train_loss": -6.482180595397949, "global_step": 106681, "epoch": 2540} {"train_loss": -6.468194007873535, "global_step": 106682, "epoch": 2540} {"train_loss": -6.537822723388672, "global_step": 106683, "epoch": 2540} {"train_loss": -6.517822265625, "global_step": 106684, "epoch": 2540} {"train_loss": -6.465123653411865, "global_step": 106685, "epoch": 2540} {"train_loss": -6.514834880828857, "global_step": 106686, "epoch": 2540} {"train_loss": -6.446718215942383, "global_step": 106687, "epoch": 2540} {"train_loss": -6.403111457824707, "global_step": 106688, "epoch": 2540} {"train_loss": -6.3982744216918945, "global_step": 106689, "epoch": 2540} {"train_loss": -6.483099937438965, "global_step": 106690, "epoch": 2540} {"train_loss": -6.481370449066162, "global_step": 106691, "epoch": 2540} {"train_loss": -6.320375442504883, "global_step": 106692, "epoch": 2540} {"train_loss": -6.368709564208984, "global_step": 106693, "epoch": 2540} {"train_loss": -6.371901512145996, "global_step": 106694, "epoch": 2540} {"train_loss": -6.331634521484375, "global_step": 106695, "epoch": 2540} {"train_loss": -6.434020042419434, "global_step": 106696, "epoch": 2540} {"train_loss": -6.3010454177856445, "global_step": 106697, "epoch": 2540} {"train_loss": -6.388693332672119, "global_step": 106698, "epoch": 2540} {"train_loss": -6.442630767822266, "global_step": 106699, "epoch": 2540} {"train_loss": -6.313925743103027, "global_step": 106700, "epoch": 2540} {"train_loss": -6.347389221191406, "global_step": 106701, "epoch": 2540} {"train_loss": -6.310450077056885, "global_step": 106702, "epoch": 2540} {"train_loss": -6.240509986877441, "global_step": 106703, "epoch": 2540} {"train_loss": -6.432872772216797, "global_step": 106704, "epoch": 2540} {"train_loss": -6.5180253982543945, "global_step": 106705, "epoch": 2540} {"train_loss": -6.40296745300293, "global_step": 106706, "epoch": 2540} {"train_loss": -6.335247039794922, "global_step": 106707, "epoch": 2540} {"train_loss": -6.408291816711426, "global_step": 106708, "epoch": 2540} {"train_loss": -6.325586795806885, "global_step": 106709, "epoch": 2540} {"train_loss": -6.516239643096924, "global_step": 106710, "epoch": 2540} {"train_loss": -6.333066940307617, "global_step": 106711, "epoch": 2540} {"train_loss": -6.388822078704834, "global_step": 106712, "epoch": 2540} {"train_loss": -6.315800666809082, "global_step": 106713, "epoch": 2540} {"train_loss": -6.3963518142700195, "global_step": 106714, "epoch": 2540} {"train_loss": -6.515964508056641, "global_step": 106715, "epoch": 2540} {"train_loss": -6.428340435028076, "global_step": 106716, "epoch": 2540} {"train_loss": -6.320216178894043, "global_step": 106717, "epoch": 2540} {"train_loss": -6.444518089294434, "global_step": 106718, "epoch": 2540} {"train_loss": -6.438152313232422, "global_step": 106719, "epoch": 2540} {"train_loss": -6.307858467102051, "global_step": 106720, "epoch": 2540} {"train_loss": -6.4080469608306885, "global_step": 106721, "epoch": 2540, "val_loss": 75983.1875} {"train_loss": -6.459035873413086, "global_step": 106722, "epoch": 2541} {"train_loss": -6.466124534606934, "global_step": 106723, "epoch": 2541} {"train_loss": -6.314496994018555, "global_step": 106724, "epoch": 2541} {"train_loss": -6.3496294021606445, "global_step": 106725, "epoch": 2541} {"train_loss": -6.281545639038086, "global_step": 106726, "epoch": 2541} {"train_loss": -6.419943809509277, "global_step": 106727, "epoch": 2541} {"train_loss": -6.5288872718811035, "global_step": 106728, "epoch": 2541} {"train_loss": -6.4625091552734375, "global_step": 106729, "epoch": 2541} {"train_loss": -6.4675612449646, "global_step": 106730, "epoch": 2541} {"train_loss": -6.422163009643555, "global_step": 106731, "epoch": 2541} {"train_loss": -6.458978176116943, "global_step": 106732, "epoch": 2541} {"train_loss": -6.451155185699463, "global_step": 106733, "epoch": 2541} {"train_loss": -6.478423118591309, "global_step": 106734, "epoch": 2541} {"train_loss": -6.408836841583252, "global_step": 106735, "epoch": 2541} {"train_loss": -6.40878963470459, "global_step": 106736, "epoch": 2541} {"train_loss": -6.413128852844238, "global_step": 106737, "epoch": 2541} {"train_loss": -6.348440170288086, "global_step": 106738, "epoch": 2541} {"train_loss": -6.333710193634033, "global_step": 106739, "epoch": 2541} {"train_loss": -6.452132225036621, "global_step": 106740, "epoch": 2541} {"train_loss": -6.441648960113525, "global_step": 106741, "epoch": 2541} {"train_loss": -6.370600700378418, "global_step": 106742, "epoch": 2541} {"train_loss": -6.345879554748535, "global_step": 106743, "epoch": 2541} {"train_loss": -6.423983097076416, "global_step": 106744, "epoch": 2541} {"train_loss": -6.32380485534668, "global_step": 106745, "epoch": 2541} {"train_loss": -6.322383880615234, "global_step": 106746, "epoch": 2541} {"train_loss": -6.539633750915527, "global_step": 106747, "epoch": 2541} {"train_loss": -6.526993751525879, "global_step": 106748, "epoch": 2541} {"train_loss": -6.323882579803467, "global_step": 106749, "epoch": 2541} {"train_loss": -6.394303321838379, "global_step": 106750, "epoch": 2541} {"train_loss": -6.422839164733887, "global_step": 106751, "epoch": 2541} {"train_loss": -6.340328216552734, "global_step": 106752, "epoch": 2541} {"train_loss": -6.319655418395996, "global_step": 106753, "epoch": 2541} {"train_loss": -6.49828577041626, "global_step": 106754, "epoch": 2541} {"train_loss": -6.538827419281006, "global_step": 106755, "epoch": 2541} {"train_loss": -6.491878509521484, "global_step": 106756, "epoch": 2541} {"train_loss": -6.435903549194336, "global_step": 106757, "epoch": 2541} {"train_loss": -6.382277488708496, "global_step": 106758, "epoch": 2541} {"train_loss": -6.592559814453125, "global_step": 106759, "epoch": 2541} {"train_loss": -6.546114921569824, "global_step": 106760, "epoch": 2541} {"train_loss": -6.538614273071289, "global_step": 106761, "epoch": 2541} {"train_loss": -6.454054832458496, "global_step": 106762, "epoch": 2541} {"train_loss": -6.425212826047625, "global_step": 106763, "epoch": 2541, "val_loss": 76187.5546875} {"train_loss": -6.441884994506836, "global_step": 106764, "epoch": 2542} {"train_loss": -6.545845985412598, "global_step": 106765, "epoch": 2542} {"train_loss": -6.3771867752075195, "global_step": 106766, "epoch": 2542} {"train_loss": -6.519224166870117, "global_step": 106767, "epoch": 2542} {"train_loss": -6.465203285217285, "global_step": 106768, "epoch": 2542} {"train_loss": -6.3884172439575195, "global_step": 106769, "epoch": 2542} {"train_loss": -6.584759712219238, "global_step": 106770, "epoch": 2542} {"train_loss": -6.387734413146973, "global_step": 106771, "epoch": 2542} {"train_loss": -6.421262741088867, "global_step": 106772, "epoch": 2542} {"train_loss": -6.397019386291504, "global_step": 106773, "epoch": 2542} {"train_loss": -6.365739822387695, "global_step": 106774, "epoch": 2542} {"train_loss": -6.265318870544434, "global_step": 106775, "epoch": 2542} {"train_loss": -6.4483137130737305, "global_step": 106776, "epoch": 2542} {"train_loss": -6.557989120483398, "global_step": 106777, "epoch": 2542} {"train_loss": -6.293267726898193, "global_step": 106778, "epoch": 2542} {"train_loss": -6.470789909362793, "global_step": 106779, "epoch": 2542} {"train_loss": -6.4817328453063965, "global_step": 106780, "epoch": 2542} {"train_loss": -6.316217422485352, "global_step": 106781, "epoch": 2542} {"train_loss": -6.465580940246582, "global_step": 106782, "epoch": 2542} {"train_loss": -6.306312561035156, "global_step": 106783, "epoch": 2542} {"train_loss": -6.408174514770508, "global_step": 106784, "epoch": 2542} {"train_loss": -6.381497859954834, "global_step": 106785, "epoch": 2542} {"train_loss": -6.434454441070557, "global_step": 106786, "epoch": 2542} {"train_loss": -6.444815635681152, "global_step": 106787, "epoch": 2542} {"train_loss": -6.44621467590332, "global_step": 106788, "epoch": 2542} {"train_loss": -6.352776527404785, "global_step": 106789, "epoch": 2542} {"train_loss": -6.217893600463867, "global_step": 106790, "epoch": 2542} {"train_loss": -6.316860198974609, "global_step": 106791, "epoch": 2542} {"train_loss": -6.2576494216918945, "global_step": 106792, "epoch": 2542} {"train_loss": -6.245579719543457, "global_step": 106793, "epoch": 2542} {"train_loss": -6.254162788391113, "global_step": 106794, "epoch": 2542} {"train_loss": -6.460230827331543, "global_step": 106795, "epoch": 2542} {"train_loss": -6.284140586853027, "global_step": 106796, "epoch": 2542} {"train_loss": -6.262258529663086, "global_step": 106797, "epoch": 2542} {"train_loss": -6.369568824768066, "global_step": 106798, "epoch": 2542} {"train_loss": -6.416199684143066, "global_step": 106799, "epoch": 2542} {"train_loss": -6.386727333068848, "global_step": 106800, "epoch": 2542} {"train_loss": -6.374978065490723, "global_step": 106801, "epoch": 2542} {"train_loss": -6.406263828277588, "global_step": 106802, "epoch": 2542} {"train_loss": -6.408233165740967, "global_step": 106803, "epoch": 2542} {"train_loss": -6.414756774902344, "global_step": 106804, "epoch": 2542} {"train_loss": -6.390775612422398, "global_step": 106805, "epoch": 2542, "val_loss": 76446.375} {"train_loss": -6.45975399017334, "global_step": 106806, "epoch": 2543} {"train_loss": -6.362248420715332, "global_step": 106807, "epoch": 2543} {"train_loss": -6.405245780944824, "global_step": 106808, "epoch": 2543} {"train_loss": -6.470685005187988, "global_step": 106809, "epoch": 2543} {"train_loss": -6.472018241882324, "global_step": 106810, "epoch": 2543} {"train_loss": -6.344050884246826, "global_step": 106811, "epoch": 2543} {"train_loss": -6.53962516784668, "global_step": 106812, "epoch": 2543} {"train_loss": -6.528491020202637, "global_step": 106813, "epoch": 2543} {"train_loss": -6.313498020172119, "global_step": 106814, "epoch": 2543} {"train_loss": -6.419794082641602, "global_step": 106815, "epoch": 2543} {"train_loss": -6.365120887756348, "global_step": 106816, "epoch": 2543} {"train_loss": -6.354039192199707, "global_step": 106817, "epoch": 2543} {"train_loss": -6.565829277038574, "global_step": 106818, "epoch": 2543} {"train_loss": -6.309625148773193, "global_step": 106819, "epoch": 2543} {"train_loss": -6.4267449378967285, "global_step": 106820, "epoch": 2543} {"train_loss": -6.548796653747559, "global_step": 106821, "epoch": 2543} {"train_loss": -6.502834320068359, "global_step": 106822, "epoch": 2543} {"train_loss": -6.451035499572754, "global_step": 106823, "epoch": 2543} {"train_loss": -6.3965911865234375, "global_step": 106824, "epoch": 2543} {"train_loss": -6.553461074829102, "global_step": 106825, "epoch": 2543} {"train_loss": -6.338550567626953, "global_step": 106826, "epoch": 2543} {"train_loss": -6.477992057800293, "global_step": 106827, "epoch": 2543} {"train_loss": -6.511241912841797, "global_step": 106828, "epoch": 2543} {"train_loss": -6.513827800750732, "global_step": 106829, "epoch": 2543} {"train_loss": -6.396259307861328, "global_step": 106830, "epoch": 2543} {"train_loss": -6.410829544067383, "global_step": 106831, "epoch": 2543} {"train_loss": -6.388031005859375, "global_step": 106832, "epoch": 2543} {"train_loss": -6.509150505065918, "global_step": 106833, "epoch": 2543} {"train_loss": -6.421744346618652, "global_step": 106834, "epoch": 2543} {"train_loss": -6.332406997680664, "global_step": 106835, "epoch": 2543} {"train_loss": -6.418398857116699, "global_step": 106836, "epoch": 2543} {"train_loss": -6.331125259399414, "global_step": 106837, "epoch": 2543} {"train_loss": -6.341082572937012, "global_step": 106838, "epoch": 2543} {"train_loss": -6.50159215927124, "global_step": 106839, "epoch": 2543} {"train_loss": -6.217273712158203, "global_step": 106840, "epoch": 2543} {"train_loss": -6.370237827301025, "global_step": 106841, "epoch": 2543} {"train_loss": -6.461063385009766, "global_step": 106842, "epoch": 2543} {"train_loss": -6.250624656677246, "global_step": 106843, "epoch": 2543} {"train_loss": -6.322864532470703, "global_step": 106844, "epoch": 2543} {"train_loss": -6.393328666687012, "global_step": 106845, "epoch": 2543} {"train_loss": -6.239981651306152, "global_step": 106846, "epoch": 2543} {"train_loss": -6.412830829620361, "global_step": 106847, "epoch": 2543, "val_loss": 75738.828125} {"train_loss": -6.416762351989746, "global_step": 106848, "epoch": 2544} {"train_loss": -6.430757999420166, "global_step": 106849, "epoch": 2544} {"train_loss": -6.307260990142822, "global_step": 106850, "epoch": 2544} {"train_loss": -6.424204349517822, "global_step": 106851, "epoch": 2544} {"train_loss": -6.458144187927246, "global_step": 106852, "epoch": 2544} {"train_loss": -6.424530029296875, "global_step": 106853, "epoch": 2544} {"train_loss": -6.380321502685547, "global_step": 106854, "epoch": 2544} {"train_loss": -6.2308831214904785, "global_step": 106855, "epoch": 2544} {"train_loss": -6.361735820770264, "global_step": 106856, "epoch": 2544} {"train_loss": -6.41936731338501, "global_step": 106857, "epoch": 2544} {"train_loss": -6.286410331726074, "global_step": 106858, "epoch": 2544} {"train_loss": -6.406949520111084, "global_step": 106859, "epoch": 2544} {"train_loss": -6.406394004821777, "global_step": 106860, "epoch": 2544} {"train_loss": -6.2689619064331055, "global_step": 106861, "epoch": 2544} {"train_loss": -6.329660415649414, "global_step": 106862, "epoch": 2544} {"train_loss": -6.198539733886719, "global_step": 106863, "epoch": 2544} {"train_loss": -6.269272327423096, "global_step": 106864, "epoch": 2544} {"train_loss": -6.418583869934082, "global_step": 106865, "epoch": 2544} {"train_loss": -6.274684906005859, "global_step": 106866, "epoch": 2544} {"train_loss": -6.3662872314453125, "global_step": 106867, "epoch": 2544} {"train_loss": -6.257079124450684, "global_step": 106868, "epoch": 2544} {"train_loss": -6.354537487030029, "global_step": 106869, "epoch": 2544} {"train_loss": -6.339929580688477, "global_step": 106870, "epoch": 2544} {"train_loss": -6.320581912994385, "global_step": 106871, "epoch": 2544} {"train_loss": -6.4252777099609375, "global_step": 106872, "epoch": 2544} {"train_loss": -6.287847518920898, "global_step": 106873, "epoch": 2544} {"train_loss": -6.433986663818359, "global_step": 106874, "epoch": 2544} {"train_loss": -6.406089782714844, "global_step": 106875, "epoch": 2544} {"train_loss": -6.385201930999756, "global_step": 106876, "epoch": 2544} {"train_loss": -6.255588531494141, "global_step": 106877, "epoch": 2544} {"train_loss": -6.402799606323242, "global_step": 106878, "epoch": 2544} {"train_loss": -6.388271331787109, "global_step": 106879, "epoch": 2544} {"train_loss": -6.451128005981445, "global_step": 106880, "epoch": 2544} {"train_loss": -6.338742256164551, "global_step": 106881, "epoch": 2544} {"train_loss": -6.620436191558838, "global_step": 106882, "epoch": 2544} {"train_loss": -6.565173149108887, "global_step": 106883, "epoch": 2544} {"train_loss": -6.405680179595947, "global_step": 106884, "epoch": 2544} {"train_loss": -6.550419807434082, "global_step": 106885, "epoch": 2544} {"train_loss": -6.412954330444336, "global_step": 106886, "epoch": 2544} {"train_loss": -6.561769485473633, "global_step": 106887, "epoch": 2544} {"train_loss": -6.439932346343994, "global_step": 106888, "epoch": 2544} {"train_loss": -6.3845948832375665, "global_step": 106889, "epoch": 2544, "val_loss": 75964.8203125} {"train_loss": -6.467912197113037, "global_step": 106890, "epoch": 2545} {"train_loss": -6.384875774383545, "global_step": 106891, "epoch": 2545} {"train_loss": -6.445749282836914, "global_step": 106892, "epoch": 2545} {"train_loss": -6.410432815551758, "global_step": 106893, "epoch": 2545} {"train_loss": -6.4027204513549805, "global_step": 106894, "epoch": 2545} {"train_loss": -6.464111804962158, "global_step": 106895, "epoch": 2545} {"train_loss": -6.437551498413086, "global_step": 106896, "epoch": 2545} {"train_loss": -6.441877365112305, "global_step": 106897, "epoch": 2545} {"train_loss": -6.559516906738281, "global_step": 106898, "epoch": 2545} {"train_loss": -6.331245422363281, "global_step": 106899, "epoch": 2545} {"train_loss": -6.381803512573242, "global_step": 106900, "epoch": 2545} {"train_loss": -6.373593330383301, "global_step": 106901, "epoch": 2545} {"train_loss": -6.3535614013671875, "global_step": 106902, "epoch": 2545} {"train_loss": -6.4024128913879395, "global_step": 106903, "epoch": 2545} {"train_loss": -6.399059772491455, "global_step": 106904, "epoch": 2545} {"train_loss": -6.46258544921875, "global_step": 106905, "epoch": 2545} {"train_loss": -6.519989490509033, "global_step": 106906, "epoch": 2545} {"train_loss": -6.436278820037842, "global_step": 106907, "epoch": 2545} {"train_loss": -6.493301868438721, "global_step": 106908, "epoch": 2545} {"train_loss": -6.523765563964844, "global_step": 106909, "epoch": 2545} {"train_loss": -6.351907730102539, "global_step": 106910, "epoch": 2545} {"train_loss": -6.545056343078613, "global_step": 106911, "epoch": 2545} {"train_loss": -6.500296592712402, "global_step": 106912, "epoch": 2545} {"train_loss": -6.5381693840026855, "global_step": 106913, "epoch": 2545} {"train_loss": -6.350564956665039, "global_step": 106914, "epoch": 2545} {"train_loss": -6.3896331787109375, "global_step": 106915, "epoch": 2545} {"train_loss": -6.53035831451416, "global_step": 106916, "epoch": 2545} {"train_loss": -6.378966808319092, "global_step": 106917, "epoch": 2545} {"train_loss": -6.483003616333008, "global_step": 106918, "epoch": 2545} {"train_loss": -6.490931510925293, "global_step": 106919, "epoch": 2545} {"train_loss": -6.341597080230713, "global_step": 106920, "epoch": 2545} {"train_loss": -6.450468063354492, "global_step": 106921, "epoch": 2545} {"train_loss": -6.483673095703125, "global_step": 106922, "epoch": 2545} {"train_loss": -6.566547393798828, "global_step": 106923, "epoch": 2545} {"train_loss": -6.52327299118042, "global_step": 106924, "epoch": 2545} {"train_loss": -6.527970314025879, "global_step": 106925, "epoch": 2545} {"train_loss": -6.465180397033691, "global_step": 106926, "epoch": 2545} {"train_loss": -6.455654144287109, "global_step": 106927, "epoch": 2545} {"train_loss": -6.503626346588135, "global_step": 106928, "epoch": 2545} {"train_loss": -6.40123987197876, "global_step": 106929, "epoch": 2545} {"train_loss": -6.501814842224121, "global_step": 106930, "epoch": 2545} {"train_loss": -6.449955769947597, "global_step": 106931, "epoch": 2545, "val_loss": 76256.328125} {"train_loss": -6.550889015197754, "global_step": 106932, "epoch": 2546} {"train_loss": -6.374631881713867, "global_step": 106933, "epoch": 2546} {"train_loss": -6.381622314453125, "global_step": 106934, "epoch": 2546} {"train_loss": -6.497878551483154, "global_step": 106935, "epoch": 2546} {"train_loss": -6.4745192527771, "global_step": 106936, "epoch": 2546} {"train_loss": -6.485409259796143, "global_step": 106937, "epoch": 2546} {"train_loss": -6.395697593688965, "global_step": 106938, "epoch": 2546} {"train_loss": -6.446708679199219, "global_step": 106939, "epoch": 2546} {"train_loss": -6.491909980773926, "global_step": 106940, "epoch": 2546} {"train_loss": -6.327139854431152, "global_step": 106941, "epoch": 2546} {"train_loss": -6.476888656616211, "global_step": 106942, "epoch": 2546} {"train_loss": -6.5380682945251465, "global_step": 106943, "epoch": 2546} {"train_loss": -6.490828514099121, "global_step": 106944, "epoch": 2546} {"train_loss": -6.374184608459473, "global_step": 106945, "epoch": 2546} {"train_loss": -6.514299392700195, "global_step": 106946, "epoch": 2546} {"train_loss": -6.435368537902832, "global_step": 106947, "epoch": 2546} {"train_loss": -6.284663200378418, "global_step": 106948, "epoch": 2546} {"train_loss": -6.429081916809082, "global_step": 106949, "epoch": 2546} {"train_loss": -6.350406646728516, "global_step": 106950, "epoch": 2546} {"train_loss": -6.3271894454956055, "global_step": 106951, "epoch": 2546} {"train_loss": -6.494373798370361, "global_step": 106952, "epoch": 2546} {"train_loss": -6.449272155761719, "global_step": 106953, "epoch": 2546} {"train_loss": -6.392338275909424, "global_step": 106954, "epoch": 2546} {"train_loss": -6.360032558441162, "global_step": 106955, "epoch": 2546} {"train_loss": -6.403655052185059, "global_step": 106956, "epoch": 2546} {"train_loss": -6.3528313636779785, "global_step": 106957, "epoch": 2546} {"train_loss": -6.401341915130615, "global_step": 106958, "epoch": 2546} {"train_loss": -6.272557258605957, "global_step": 106959, "epoch": 2546} {"train_loss": -6.296772003173828, "global_step": 106960, "epoch": 2546} {"train_loss": -6.420120716094971, "global_step": 106961, "epoch": 2546} {"train_loss": -6.358511924743652, "global_step": 106962, "epoch": 2546} {"train_loss": -6.472762584686279, "global_step": 106963, "epoch": 2546} {"train_loss": -6.404325485229492, "global_step": 106964, "epoch": 2546} {"train_loss": -6.368530750274658, "global_step": 106965, "epoch": 2546} {"train_loss": -6.465539932250977, "global_step": 106966, "epoch": 2546} {"train_loss": -6.323434829711914, "global_step": 106967, "epoch": 2546} {"train_loss": -6.320889472961426, "global_step": 106968, "epoch": 2546} {"train_loss": -6.371813774108887, "global_step": 106969, "epoch": 2546} {"train_loss": -6.398760795593262, "global_step": 106970, "epoch": 2546} {"train_loss": -6.465564727783203, "global_step": 106971, "epoch": 2546} {"train_loss": -6.384659767150879, "global_step": 106972, "epoch": 2546} {"train_loss": -6.407288528624035, "global_step": 106973, "epoch": 2546, "val_loss": 76296.7734375} {"train_loss": -6.439698219299316, "global_step": 106974, "epoch": 2547} {"train_loss": -6.426531791687012, "global_step": 106975, "epoch": 2547} {"train_loss": -6.4225311279296875, "global_step": 106976, "epoch": 2547} {"train_loss": -6.541719913482666, "global_step": 106977, "epoch": 2547} {"train_loss": -6.44944953918457, "global_step": 106978, "epoch": 2547} {"train_loss": -6.503395080566406, "global_step": 106979, "epoch": 2547} {"train_loss": -6.344733238220215, "global_step": 106980, "epoch": 2547} {"train_loss": -6.333162307739258, "global_step": 106981, "epoch": 2547} {"train_loss": -6.456558704376221, "global_step": 106982, "epoch": 2547} {"train_loss": -6.390653610229492, "global_step": 106983, "epoch": 2547} {"train_loss": -6.2959136962890625, "global_step": 106984, "epoch": 2547} {"train_loss": -6.36937952041626, "global_step": 106985, "epoch": 2547} {"train_loss": -6.481008529663086, "global_step": 106986, "epoch": 2547} {"train_loss": -6.52702522277832, "global_step": 106987, "epoch": 2547} {"train_loss": -6.388241767883301, "global_step": 106988, "epoch": 2547} {"train_loss": -6.435878753662109, "global_step": 106989, "epoch": 2547} {"train_loss": -6.368916988372803, "global_step": 106990, "epoch": 2547} {"train_loss": -6.462267875671387, "global_step": 106991, "epoch": 2547} {"train_loss": -6.5049333572387695, "global_step": 106992, "epoch": 2547} {"train_loss": -6.348322868347168, "global_step": 106993, "epoch": 2547} {"train_loss": -6.464673042297363, "global_step": 106994, "epoch": 2547} {"train_loss": -6.420520305633545, "global_step": 106995, "epoch": 2547} {"train_loss": -6.398049354553223, "global_step": 106996, "epoch": 2547} {"train_loss": -6.542919158935547, "global_step": 106997, "epoch": 2547} {"train_loss": -6.499951362609863, "global_step": 106998, "epoch": 2547} {"train_loss": -6.43494987487793, "global_step": 106999, "epoch": 2547} {"train_loss": -6.579591274261475, "global_step": 107000, "epoch": 2547} {"train_loss": -6.381390571594238, "global_step": 107001, "epoch": 2547} {"train_loss": -6.470728397369385, "global_step": 107002, "epoch": 2547} {"train_loss": -6.560332775115967, "global_step": 107003, "epoch": 2547} {"train_loss": -6.383111476898193, "global_step": 107004, "epoch": 2547} {"train_loss": -6.384355545043945, "global_step": 107005, "epoch": 2547} {"train_loss": -6.381312847137451, "global_step": 107006, "epoch": 2547} {"train_loss": -6.419078826904297, "global_step": 107007, "epoch": 2547} {"train_loss": -6.651558876037598, "global_step": 107008, "epoch": 2547} {"train_loss": -6.3398919105529785, "global_step": 107009, "epoch": 2547} {"train_loss": -6.393774032592773, "global_step": 107010, "epoch": 2547} {"train_loss": -6.361518383026123, "global_step": 107011, "epoch": 2547} {"train_loss": -6.298495292663574, "global_step": 107012, "epoch": 2547} {"train_loss": -6.457460880279541, "global_step": 107013, "epoch": 2547} {"train_loss": -6.543112754821777, "global_step": 107014, "epoch": 2547} {"train_loss": -6.436802977607364, "global_step": 107015, "epoch": 2547, "val_loss": 76215.03125} {"train_loss": -6.479233741760254, "global_step": 107016, "epoch": 2548} {"train_loss": -6.434711456298828, "global_step": 107017, "epoch": 2548} {"train_loss": -6.554651260375977, "global_step": 107018, "epoch": 2548} {"train_loss": -6.4864888191223145, "global_step": 107019, "epoch": 2548} {"train_loss": -6.37713098526001, "global_step": 107020, "epoch": 2548} {"train_loss": -6.54715633392334, "global_step": 107021, "epoch": 2548} {"train_loss": -6.347448825836182, "global_step": 107022, "epoch": 2548} {"train_loss": -6.431846618652344, "global_step": 107023, "epoch": 2548} {"train_loss": -6.514393329620361, "global_step": 107024, "epoch": 2548} {"train_loss": -6.499312400817871, "global_step": 107025, "epoch": 2548} {"train_loss": -6.317990303039551, "global_step": 107026, "epoch": 2548} {"train_loss": -6.411381721496582, "global_step": 107027, "epoch": 2548} {"train_loss": -6.402041435241699, "global_step": 107028, "epoch": 2548} {"train_loss": -6.316020965576172, "global_step": 107029, "epoch": 2548} {"train_loss": -6.450570106506348, "global_step": 107030, "epoch": 2548} {"train_loss": -6.440942764282227, "global_step": 107031, "epoch": 2548} {"train_loss": -6.300262451171875, "global_step": 107032, "epoch": 2548} {"train_loss": -6.47981595993042, "global_step": 107033, "epoch": 2548} {"train_loss": -6.484443187713623, "global_step": 107034, "epoch": 2548} {"train_loss": -6.350675582885742, "global_step": 107035, "epoch": 2548} {"train_loss": -6.500002384185791, "global_step": 107036, "epoch": 2548} {"train_loss": -6.391366958618164, "global_step": 107037, "epoch": 2548} {"train_loss": -6.344391345977783, "global_step": 107038, "epoch": 2548} {"train_loss": -6.383738994598389, "global_step": 107039, "epoch": 2548} {"train_loss": -6.481361389160156, "global_step": 107040, "epoch": 2548} {"train_loss": -6.3746562004089355, "global_step": 107041, "epoch": 2548} {"train_loss": -6.445561408996582, "global_step": 107042, "epoch": 2548} {"train_loss": -6.412295341491699, "global_step": 107043, "epoch": 2548} {"train_loss": -6.373570919036865, "global_step": 107044, "epoch": 2548} {"train_loss": -6.54494047164917, "global_step": 107045, "epoch": 2548} {"train_loss": -6.49517822265625, "global_step": 107046, "epoch": 2548} {"train_loss": -6.443075180053711, "global_step": 107047, "epoch": 2548} {"train_loss": -6.377755165100098, "global_step": 107048, "epoch": 2548} {"train_loss": -6.527416229248047, "global_step": 107049, "epoch": 2548} {"train_loss": -6.317364692687988, "global_step": 107050, "epoch": 2548} {"train_loss": -6.420293807983398, "global_step": 107051, "epoch": 2548} {"train_loss": -6.308401107788086, "global_step": 107052, "epoch": 2548} {"train_loss": -6.3270978927612305, "global_step": 107053, "epoch": 2548} {"train_loss": -6.409853458404541, "global_step": 107054, "epoch": 2548} {"train_loss": -6.420757293701172, "global_step": 107055, "epoch": 2548} {"train_loss": -6.4181365966796875, "global_step": 107056, "epoch": 2548} {"train_loss": -6.423228059496198, "global_step": 107057, "epoch": 2548, "val_loss": 76009.5078125} {"train_loss": -6.320003032684326, "global_step": 107058, "epoch": 2549} {"train_loss": -6.334122657775879, "global_step": 107059, "epoch": 2549} {"train_loss": -6.453823566436768, "global_step": 107060, "epoch": 2549} {"train_loss": -6.398162841796875, "global_step": 107061, "epoch": 2549} {"train_loss": -6.436448097229004, "global_step": 107062, "epoch": 2549} {"train_loss": -6.455109596252441, "global_step": 107063, "epoch": 2549} {"train_loss": -6.469087600708008, "global_step": 107064, "epoch": 2549} {"train_loss": -6.500739097595215, "global_step": 107065, "epoch": 2549} {"train_loss": -6.42858362197876, "global_step": 107066, "epoch": 2549} {"train_loss": -6.383991718292236, "global_step": 107067, "epoch": 2549} {"train_loss": -6.479214191436768, "global_step": 107068, "epoch": 2549} {"train_loss": -6.308173179626465, "global_step": 107069, "epoch": 2549} {"train_loss": -6.468569755554199, "global_step": 107070, "epoch": 2549} {"train_loss": -6.445346832275391, "global_step": 107071, "epoch": 2549} {"train_loss": -6.439083576202393, "global_step": 107072, "epoch": 2549} {"train_loss": -6.525844573974609, "global_step": 107073, "epoch": 2549} {"train_loss": -6.391232490539551, "global_step": 107074, "epoch": 2549} {"train_loss": -6.440039157867432, "global_step": 107075, "epoch": 2549} {"train_loss": -6.435690879821777, "global_step": 107076, "epoch": 2549} {"train_loss": -6.421200752258301, "global_step": 107077, "epoch": 2549} {"train_loss": -6.425205230712891, "global_step": 107078, "epoch": 2549} {"train_loss": -6.434064865112305, "global_step": 107079, "epoch": 2549} {"train_loss": -6.441773891448975, "global_step": 107080, "epoch": 2549} {"train_loss": -6.448312282562256, "global_step": 107081, "epoch": 2549} {"train_loss": -6.538678169250488, "global_step": 107082, "epoch": 2549} {"train_loss": -6.476985931396484, "global_step": 107083, "epoch": 2549} {"train_loss": -6.496363639831543, "global_step": 107084, "epoch": 2549} {"train_loss": -6.514949321746826, "global_step": 107085, "epoch": 2549} {"train_loss": -6.4697160720825195, "global_step": 107086, "epoch": 2549} {"train_loss": -6.512341499328613, "global_step": 107087, "epoch": 2549} {"train_loss": -6.5592145919799805, "global_step": 107088, "epoch": 2549} {"train_loss": -6.368565559387207, "global_step": 107089, "epoch": 2549} {"train_loss": -6.465485095977783, "global_step": 107090, "epoch": 2549} {"train_loss": -6.583889007568359, "global_step": 107091, "epoch": 2549} {"train_loss": -6.485630989074707, "global_step": 107092, "epoch": 2549} {"train_loss": -6.460987091064453, "global_step": 107093, "epoch": 2549} {"train_loss": -6.480313777923584, "global_step": 107094, "epoch": 2549} {"train_loss": -6.544229030609131, "global_step": 107095, "epoch": 2549} {"train_loss": -6.454387664794922, "global_step": 107096, "epoch": 2549} {"train_loss": -6.4808783531188965, "global_step": 107097, "epoch": 2549} {"train_loss": -6.512203216552734, "global_step": 107098, "epoch": 2549} {"train_loss": -6.454812152045114, "global_step": 107099, "epoch": 2549, "val_loss": 76282.859375} {"train_loss": -6.3621110916137695, "global_step": 107100, "epoch": 2550} {"train_loss": -6.4332733154296875, "global_step": 107101, "epoch": 2550} {"train_loss": -6.423534870147705, "global_step": 107102, "epoch": 2550} {"train_loss": -6.512947082519531, "global_step": 107103, "epoch": 2550} {"train_loss": -6.456015586853027, "global_step": 107104, "epoch": 2550} {"train_loss": -6.623071670532227, "global_step": 107105, "epoch": 2550} {"train_loss": -6.486590385437012, "global_step": 107106, "epoch": 2550} {"train_loss": -6.554227352142334, "global_step": 107107, "epoch": 2550} {"train_loss": -6.414717674255371, "global_step": 107108, "epoch": 2550} {"train_loss": -6.496492862701416, "global_step": 107109, "epoch": 2550} {"train_loss": -6.303783416748047, "global_step": 107110, "epoch": 2550} {"train_loss": -6.469881057739258, "global_step": 107111, "epoch": 2550} {"train_loss": -6.495378494262695, "global_step": 107112, "epoch": 2550} {"train_loss": -6.567054748535156, "global_step": 107113, "epoch": 2550} {"train_loss": -6.543601036071777, "global_step": 107114, "epoch": 2550} {"train_loss": -6.421201705932617, "global_step": 107115, "epoch": 2550} {"train_loss": -6.469734191894531, "global_step": 107116, "epoch": 2550} {"train_loss": -6.514267921447754, "global_step": 107117, "epoch": 2550} {"train_loss": -6.514006614685059, "global_step": 107118, "epoch": 2550} {"train_loss": -6.3531904220581055, "global_step": 107119, "epoch": 2550} {"train_loss": -6.455948829650879, "global_step": 107120, "epoch": 2550} {"train_loss": -6.47871208190918, "global_step": 107121, "epoch": 2550} {"train_loss": -6.485958099365234, "global_step": 107122, "epoch": 2550} {"train_loss": -6.4314117431640625, "global_step": 107123, "epoch": 2550} {"train_loss": -6.534375190734863, "global_step": 107124, "epoch": 2550} {"train_loss": -6.41671895980835, "global_step": 107125, "epoch": 2550} {"train_loss": -6.385882377624512, "global_step": 107126, "epoch": 2550} {"train_loss": -6.4626359939575195, "global_step": 107127, "epoch": 2550} {"train_loss": -6.464993000030518, "global_step": 107128, "epoch": 2550} {"train_loss": -6.391862392425537, "global_step": 107129, "epoch": 2550} {"train_loss": -6.5119524002075195, "global_step": 107130, "epoch": 2550} {"train_loss": -6.534114837646484, "global_step": 107131, "epoch": 2550} {"train_loss": -6.41459846496582, "global_step": 107132, "epoch": 2550} {"train_loss": -6.333423614501953, "global_step": 107133, "epoch": 2550} {"train_loss": -6.522378921508789, "global_step": 107134, "epoch": 2550} {"train_loss": -6.411740779876709, "global_step": 107135, "epoch": 2550} {"train_loss": -6.557966232299805, "global_step": 107136, "epoch": 2550} {"train_loss": -6.617371082305908, "global_step": 107137, "epoch": 2550} {"train_loss": -6.554093360900879, "global_step": 107138, "epoch": 2550} {"train_loss": -6.516453742980957, "global_step": 107139, "epoch": 2550} {"train_loss": -6.522523880004883, "global_step": 107140, "epoch": 2550} {"train_loss": -6.4741752942403155, "global_step": 107141, "epoch": 2550, "train/sim_max_reward_0": 0.8531133689221058, "train/sim_max_reward_1": 0.2834936618587029, "train/sim_max_reward_2": 0.2848869725987437, "train/sim_max_reward_3": 0.12939574819435398, "train/sim_max_reward_4": 0.22682499876719503, "train/sim_max_reward_5": 0.5733989886074795, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 1.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.8853097779972907, "test/sim_max_reward_4500005": 0.8980912522812561, "test/sim_max_reward_4500006": 0.9640621221065498, "test/sim_max_reward_4500007": 0.8106143676536608, "test/sim_max_reward_4500008": 0.15192242888968743, "test/sim_max_reward_4500009": 0.05347360667134372, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9896702372233335, "test/sim_max_reward_4500012": 0.8901992242881138, "test/sim_max_reward_4500013": 0.005610442551070666, "test/sim_max_reward_4500014": 0.3761358297641472, "test/sim_max_reward_4500015": 0.9408897948730442, "test/sim_max_reward_4500016": 0.0165212930764902, "test/sim_max_reward_4500017": 0.18442087313121516, "test/sim_max_reward_4500018": 0.4757650860328575, "test/sim_max_reward_4500019": 0.8986825716683767, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.5462865304685645, "test/sim_max_reward_4500022": 0.9622729395372975, "test/sim_max_reward_4500023": 0.8198411186287793, "test/sim_max_reward_4500024": 0.8702605900943028, "test/sim_max_reward_4500025": 0.838318358289851, "test/sim_max_reward_4500026": 0.9324278977483127, "test/sim_max_reward_4500027": 0.9904131461091347, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.06443207156903105, "test/sim_max_reward_4500030": 0.9954517186886566, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.5021024955959924, "test/sim_max_reward_4500034": 0.061568495847541455, "test/sim_max_reward_4500035": 0.5417511607136873, "test/sim_max_reward_4500036": 0.38955898303691966, "test/sim_max_reward_4500037": 0.9203974151871448, "test/sim_max_reward_4500038": 0.7995162453530088, "test/sim_max_reward_4500039": 0.9295575614797813, "test/sim_max_reward_4500040": 0.8079673753077878, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.67070016462385, "test/sim_max_reward_4500043": 0.21596951651942256, "test/sim_max_reward_4500044": 0.03147254166743657, "test/sim_max_reward_4500045": 0.9259187557430625, "test/sim_max_reward_4500046": 0.8279057003979139, "test/sim_max_reward_4500047": 0.942010695298207, "test/sim_max_reward_4500048": 0.8662434936793739, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.39185228982476356, "test/mean_score": 0.6050168095765683, "val_loss": 76030.5078125} {"train_loss": -6.469738483428955, "global_step": 107142, "epoch": 2551} {"train_loss": -6.455209732055664, "global_step": 107143, "epoch": 2551} {"train_loss": -6.478558540344238, "global_step": 107144, "epoch": 2551} {"train_loss": -6.446372985839844, "global_step": 107145, "epoch": 2551} {"train_loss": -6.586006164550781, "global_step": 107146, "epoch": 2551} {"train_loss": -6.5329365730285645, "global_step": 107147, "epoch": 2551} {"train_loss": -6.468907356262207, "global_step": 107148, "epoch": 2551} {"train_loss": -6.5106611251831055, "global_step": 107149, "epoch": 2551} {"train_loss": -6.404183864593506, "global_step": 107150, "epoch": 2551} {"train_loss": -6.482845306396484, "global_step": 107151, "epoch": 2551} {"train_loss": -6.299938678741455, "global_step": 107152, "epoch": 2551} {"train_loss": -6.511955261230469, "global_step": 107153, "epoch": 2551} {"train_loss": -6.484886169433594, "global_step": 107154, "epoch": 2551} {"train_loss": -6.360048294067383, "global_step": 107155, "epoch": 2551} {"train_loss": -6.465054512023926, "global_step": 107156, "epoch": 2551} {"train_loss": -6.471367835998535, "global_step": 107157, "epoch": 2551} {"train_loss": -6.421343803405762, "global_step": 107158, "epoch": 2551} {"train_loss": -6.328129768371582, "global_step": 107159, "epoch": 2551} {"train_loss": -6.340582847595215, "global_step": 107160, "epoch": 2551} {"train_loss": -6.406985282897949, "global_step": 107161, "epoch": 2551} {"train_loss": -6.401186943054199, "global_step": 107162, "epoch": 2551} {"train_loss": -6.482029438018799, "global_step": 107163, "epoch": 2551} {"train_loss": -6.317517280578613, "global_step": 107164, "epoch": 2551} {"train_loss": -6.47877311706543, "global_step": 107165, "epoch": 2551} {"train_loss": -6.3847761154174805, "global_step": 107166, "epoch": 2551} {"train_loss": -6.473673343658447, "global_step": 107167, "epoch": 2551} {"train_loss": -6.400633335113525, "global_step": 107168, "epoch": 2551} {"train_loss": -6.543980598449707, "global_step": 107169, "epoch": 2551} {"train_loss": -6.570208549499512, "global_step": 107170, "epoch": 2551} {"train_loss": -6.363593578338623, "global_step": 107171, "epoch": 2551} {"train_loss": -6.40946102142334, "global_step": 107172, "epoch": 2551} {"train_loss": -6.459665298461914, "global_step": 107173, "epoch": 2551} {"train_loss": -6.492331504821777, "global_step": 107174, "epoch": 2551} {"train_loss": -6.391522407531738, "global_step": 107175, "epoch": 2551} {"train_loss": -6.374982833862305, "global_step": 107176, "epoch": 2551} {"train_loss": -6.419687271118164, "global_step": 107177, "epoch": 2551} {"train_loss": -6.436638832092285, "global_step": 107178, "epoch": 2551} {"train_loss": -6.47902774810791, "global_step": 107179, "epoch": 2551} {"train_loss": -6.517148494720459, "global_step": 107180, "epoch": 2551} {"train_loss": -6.563571929931641, "global_step": 107181, "epoch": 2551} {"train_loss": -6.479671001434326, "global_step": 107182, "epoch": 2551} {"train_loss": -6.450644424983433, "global_step": 107183, "epoch": 2551, "val_loss": 76198.1796875} {"train_loss": -6.472561359405518, "global_step": 107184, "epoch": 2552} {"train_loss": -6.4105401039123535, "global_step": 107185, "epoch": 2552} {"train_loss": -6.413087368011475, "global_step": 107186, "epoch": 2552} {"train_loss": -6.37890625, "global_step": 107187, "epoch": 2552} {"train_loss": -6.368396759033203, "global_step": 107188, "epoch": 2552} {"train_loss": -6.30497932434082, "global_step": 107189, "epoch": 2552} {"train_loss": -6.428948402404785, "global_step": 107190, "epoch": 2552} {"train_loss": -6.3833818435668945, "global_step": 107191, "epoch": 2552} {"train_loss": -6.4473700523376465, "global_step": 107192, "epoch": 2552} {"train_loss": -6.355834007263184, "global_step": 107193, "epoch": 2552} {"train_loss": -6.313485145568848, "global_step": 107194, "epoch": 2552} {"train_loss": -6.412693500518799, "global_step": 107195, "epoch": 2552} {"train_loss": -6.504116058349609, "global_step": 107196, "epoch": 2552} {"train_loss": -6.4716691970825195, "global_step": 107197, "epoch": 2552} {"train_loss": -6.475839614868164, "global_step": 107198, "epoch": 2552} {"train_loss": -6.415060997009277, "global_step": 107199, "epoch": 2552} {"train_loss": -6.510738372802734, "global_step": 107200, "epoch": 2552} {"train_loss": -6.462050437927246, "global_step": 107201, "epoch": 2552} {"train_loss": -6.453763008117676, "global_step": 107202, "epoch": 2552} {"train_loss": -6.34859561920166, "global_step": 107203, "epoch": 2552} {"train_loss": -6.466719627380371, "global_step": 107204, "epoch": 2552} {"train_loss": -6.332822799682617, "global_step": 107205, "epoch": 2552} {"train_loss": -6.467238426208496, "global_step": 107206, "epoch": 2552} {"train_loss": -6.474287033081055, "global_step": 107207, "epoch": 2552} {"train_loss": -6.403948783874512, "global_step": 107208, "epoch": 2552} {"train_loss": -6.511745452880859, "global_step": 107209, "epoch": 2552} {"train_loss": -6.4302825927734375, "global_step": 107210, "epoch": 2552} {"train_loss": -6.511974811553955, "global_step": 107211, "epoch": 2552} {"train_loss": -6.525961399078369, "global_step": 107212, "epoch": 2552} {"train_loss": -6.352421760559082, "global_step": 107213, "epoch": 2552} {"train_loss": -6.305009841918945, "global_step": 107214, "epoch": 2552} {"train_loss": -6.385838031768799, "global_step": 107215, "epoch": 2552} {"train_loss": -6.480881690979004, "global_step": 107216, "epoch": 2552} {"train_loss": -6.330350875854492, "global_step": 107217, "epoch": 2552} {"train_loss": -6.4441070556640625, "global_step": 107218, "epoch": 2552} {"train_loss": -6.392438888549805, "global_step": 107219, "epoch": 2552} {"train_loss": -6.2657928466796875, "global_step": 107220, "epoch": 2552} {"train_loss": -6.355502128601074, "global_step": 107221, "epoch": 2552} {"train_loss": -6.492217540740967, "global_step": 107222, "epoch": 2552} {"train_loss": -6.192154884338379, "global_step": 107223, "epoch": 2552} {"train_loss": -6.339345932006836, "global_step": 107224, "epoch": 2552} {"train_loss": -6.409414109729585, "global_step": 107225, "epoch": 2552, "val_loss": 76618.0703125} {"train_loss": -6.340231418609619, "global_step": 107226, "epoch": 2553} {"train_loss": -6.413945198059082, "global_step": 107227, "epoch": 2553} {"train_loss": -6.432992935180664, "global_step": 107228, "epoch": 2553} {"train_loss": -6.319003105163574, "global_step": 107229, "epoch": 2553} {"train_loss": -6.394649505615234, "global_step": 107230, "epoch": 2553} {"train_loss": -6.346923351287842, "global_step": 107231, "epoch": 2553} {"train_loss": -6.462367534637451, "global_step": 107232, "epoch": 2553} {"train_loss": -6.380438327789307, "global_step": 107233, "epoch": 2553} {"train_loss": -6.479798316955566, "global_step": 107234, "epoch": 2553} {"train_loss": -6.488346099853516, "global_step": 107235, "epoch": 2553} {"train_loss": -6.308202743530273, "global_step": 107236, "epoch": 2553} {"train_loss": -6.472319602966309, "global_step": 107237, "epoch": 2553} {"train_loss": -6.498730659484863, "global_step": 107238, "epoch": 2553} {"train_loss": -6.399311065673828, "global_step": 107239, "epoch": 2553} {"train_loss": -6.31920051574707, "global_step": 107240, "epoch": 2553} {"train_loss": -6.462270259857178, "global_step": 107241, "epoch": 2553} {"train_loss": -6.5463337898254395, "global_step": 107242, "epoch": 2553} {"train_loss": -6.582428455352783, "global_step": 107243, "epoch": 2553} {"train_loss": -6.544398307800293, "global_step": 107244, "epoch": 2553} {"train_loss": -6.571409225463867, "global_step": 107245, "epoch": 2553} {"train_loss": -6.4099955558776855, "global_step": 107246, "epoch": 2553} {"train_loss": -6.497910022735596, "global_step": 107247, "epoch": 2553} {"train_loss": -6.487175464630127, "global_step": 107248, "epoch": 2553} {"train_loss": -6.487041473388672, "global_step": 107249, "epoch": 2553} {"train_loss": -6.506404876708984, "global_step": 107250, "epoch": 2553} {"train_loss": -6.499762535095215, "global_step": 107251, "epoch": 2553} {"train_loss": -6.290060043334961, "global_step": 107252, "epoch": 2553} {"train_loss": -6.376477241516113, "global_step": 107253, "epoch": 2553} {"train_loss": -6.42331600189209, "global_step": 107254, "epoch": 2553} {"train_loss": -6.457162857055664, "global_step": 107255, "epoch": 2553} {"train_loss": -6.353110313415527, "global_step": 107256, "epoch": 2553} {"train_loss": -6.41276741027832, "global_step": 107257, "epoch": 2553} {"train_loss": -6.343185901641846, "global_step": 107258, "epoch": 2553} {"train_loss": -6.454373359680176, "global_step": 107259, "epoch": 2553} {"train_loss": -6.464412212371826, "global_step": 107260, "epoch": 2553} {"train_loss": -6.359433174133301, "global_step": 107261, "epoch": 2553} {"train_loss": -6.414700031280518, "global_step": 107262, "epoch": 2553} {"train_loss": -6.210894584655762, "global_step": 107263, "epoch": 2553} {"train_loss": -6.377447605133057, "global_step": 107264, "epoch": 2553} {"train_loss": -6.455310821533203, "global_step": 107265, "epoch": 2553} {"train_loss": -6.468479156494141, "global_step": 107266, "epoch": 2553} {"train_loss": -6.42728160676502, "global_step": 107267, "epoch": 2553, "val_loss": 76702.6953125} {"train_loss": -6.297494888305664, "global_step": 107268, "epoch": 2554} {"train_loss": -6.584572792053223, "global_step": 107269, "epoch": 2554} {"train_loss": -6.475663185119629, "global_step": 107270, "epoch": 2554} {"train_loss": -6.413357734680176, "global_step": 107271, "epoch": 2554} {"train_loss": -6.412667274475098, "global_step": 107272, "epoch": 2554} {"train_loss": -6.445770740509033, "global_step": 107273, "epoch": 2554} {"train_loss": -6.502997875213623, "global_step": 107274, "epoch": 2554} {"train_loss": -6.448637008666992, "global_step": 107275, "epoch": 2554} {"train_loss": -6.237994194030762, "global_step": 107276, "epoch": 2554} {"train_loss": -6.449201583862305, "global_step": 107277, "epoch": 2554} {"train_loss": -6.456320762634277, "global_step": 107278, "epoch": 2554} {"train_loss": -6.454049110412598, "global_step": 107279, "epoch": 2554} {"train_loss": -6.362635135650635, "global_step": 107280, "epoch": 2554} {"train_loss": -6.476288318634033, "global_step": 107281, "epoch": 2554} {"train_loss": -6.423351764678955, "global_step": 107282, "epoch": 2554} {"train_loss": -6.47757625579834, "global_step": 107283, "epoch": 2554} {"train_loss": -6.350587844848633, "global_step": 107284, "epoch": 2554} {"train_loss": -6.444551467895508, "global_step": 107285, "epoch": 2554} {"train_loss": -6.2695417404174805, "global_step": 107286, "epoch": 2554} {"train_loss": -6.383077621459961, "global_step": 107287, "epoch": 2554} {"train_loss": -6.269463539123535, "global_step": 107288, "epoch": 2554} {"train_loss": -6.5782084465026855, "global_step": 107289, "epoch": 2554} {"train_loss": -6.322542190551758, "global_step": 107290, "epoch": 2554} {"train_loss": -6.317582130432129, "global_step": 107291, "epoch": 2554} {"train_loss": -6.337817192077637, "global_step": 107292, "epoch": 2554} {"train_loss": -6.401074409484863, "global_step": 107293, "epoch": 2554} {"train_loss": -6.306347846984863, "global_step": 107294, "epoch": 2554} {"train_loss": -6.485339164733887, "global_step": 107295, "epoch": 2554} {"train_loss": -6.25721549987793, "global_step": 107296, "epoch": 2554} {"train_loss": -6.3353729248046875, "global_step": 107297, "epoch": 2554} {"train_loss": -6.505982398986816, "global_step": 107298, "epoch": 2554} {"train_loss": -6.159082412719727, "global_step": 107299, "epoch": 2554} {"train_loss": -6.332211494445801, "global_step": 107300, "epoch": 2554} {"train_loss": -6.169252395629883, "global_step": 107301, "epoch": 2554} {"train_loss": -6.367152214050293, "global_step": 107302, "epoch": 2554} {"train_loss": -6.228501796722412, "global_step": 107303, "epoch": 2554} {"train_loss": -6.246729850769043, "global_step": 107304, "epoch": 2554} {"train_loss": -6.495292663574219, "global_step": 107305, "epoch": 2554} {"train_loss": -6.318458557128906, "global_step": 107306, "epoch": 2554} {"train_loss": -6.409493446350098, "global_step": 107307, "epoch": 2554} {"train_loss": -6.341523170471191, "global_step": 107308, "epoch": 2554} {"train_loss": -6.381031978698004, "global_step": 107309, "epoch": 2554, "val_loss": 76138.3515625} {"train_loss": -6.448962211608887, "global_step": 107310, "epoch": 2555} {"train_loss": -6.476317882537842, "global_step": 107311, "epoch": 2555} {"train_loss": -6.393535137176514, "global_step": 107312, "epoch": 2555} {"train_loss": -6.465247631072998, "global_step": 107313, "epoch": 2555} {"train_loss": -6.465237617492676, "global_step": 107314, "epoch": 2555} {"train_loss": -6.4531354904174805, "global_step": 107315, "epoch": 2555} {"train_loss": -6.416064262390137, "global_step": 107316, "epoch": 2555} {"train_loss": -6.442294597625732, "global_step": 107317, "epoch": 2555} {"train_loss": -6.457242488861084, "global_step": 107318, "epoch": 2555} {"train_loss": -6.378713607788086, "global_step": 107319, "epoch": 2555} {"train_loss": -6.366824150085449, "global_step": 107320, "epoch": 2555} {"train_loss": -6.483914375305176, "global_step": 107321, "epoch": 2555} {"train_loss": -6.41542387008667, "global_step": 107322, "epoch": 2555} {"train_loss": -6.407656669616699, "global_step": 107323, "epoch": 2555} {"train_loss": -6.480287551879883, "global_step": 107324, "epoch": 2555} {"train_loss": -6.441822528839111, "global_step": 107325, "epoch": 2555} {"train_loss": -6.373170852661133, "global_step": 107326, "epoch": 2555} {"train_loss": -6.359760284423828, "global_step": 107327, "epoch": 2555} {"train_loss": -6.526450157165527, "global_step": 107328, "epoch": 2555} {"train_loss": -6.380894184112549, "global_step": 107329, "epoch": 2555} {"train_loss": -6.351382255554199, "global_step": 107330, "epoch": 2555} {"train_loss": -6.270432949066162, "global_step": 107331, "epoch": 2555} {"train_loss": -6.3425798416137695, "global_step": 107332, "epoch": 2555} {"train_loss": -6.365416049957275, "global_step": 107333, "epoch": 2555} {"train_loss": -6.332706451416016, "global_step": 107334, "epoch": 2555} {"train_loss": -6.430788040161133, "global_step": 107335, "epoch": 2555} {"train_loss": -6.277822494506836, "global_step": 107336, "epoch": 2555} {"train_loss": -6.382863998413086, "global_step": 107337, "epoch": 2555} {"train_loss": -6.345122814178467, "global_step": 107338, "epoch": 2555} {"train_loss": -6.267878532409668, "global_step": 107339, "epoch": 2555} {"train_loss": -6.298890590667725, "global_step": 107340, "epoch": 2555} {"train_loss": -6.400955677032471, "global_step": 107341, "epoch": 2555} {"train_loss": -6.324938774108887, "global_step": 107342, "epoch": 2555} {"train_loss": -6.401729106903076, "global_step": 107343, "epoch": 2555} {"train_loss": -6.404477596282959, "global_step": 107344, "epoch": 2555} {"train_loss": -6.414116859436035, "global_step": 107345, "epoch": 2555} {"train_loss": -6.504298210144043, "global_step": 107346, "epoch": 2555} {"train_loss": -6.37164306640625, "global_step": 107347, "epoch": 2555} {"train_loss": -6.502527236938477, "global_step": 107348, "epoch": 2555} {"train_loss": -6.412528991699219, "global_step": 107349, "epoch": 2555} {"train_loss": -6.443757057189941, "global_step": 107350, "epoch": 2555} {"train_loss": -6.4023616427466985, "global_step": 107351, "epoch": 2555, "val_loss": 76094.5546875} {"train_loss": -6.440949440002441, "global_step": 107352, "epoch": 2556} {"train_loss": -6.583608150482178, "global_step": 107353, "epoch": 2556} {"train_loss": -6.416292190551758, "global_step": 107354, "epoch": 2556} {"train_loss": -6.450453758239746, "global_step": 107355, "epoch": 2556} {"train_loss": -6.406625747680664, "global_step": 107356, "epoch": 2556} {"train_loss": -6.473520278930664, "global_step": 107357, "epoch": 2556} {"train_loss": -6.472161769866943, "global_step": 107358, "epoch": 2556} {"train_loss": -6.476456642150879, "global_step": 107359, "epoch": 2556} {"train_loss": -6.49598503112793, "global_step": 107360, "epoch": 2556} {"train_loss": -6.511581897735596, "global_step": 107361, "epoch": 2556} {"train_loss": -6.278826713562012, "global_step": 107362, "epoch": 2556} {"train_loss": -6.545037746429443, "global_step": 107363, "epoch": 2556} {"train_loss": -6.355806350708008, "global_step": 107364, "epoch": 2556} {"train_loss": -6.4456281661987305, "global_step": 107365, "epoch": 2556} {"train_loss": -6.4250288009643555, "global_step": 107366, "epoch": 2556} {"train_loss": -6.36807918548584, "global_step": 107367, "epoch": 2556} {"train_loss": -6.4932026863098145, "global_step": 107368, "epoch": 2556} {"train_loss": -6.519773960113525, "global_step": 107369, "epoch": 2556} {"train_loss": -6.528984069824219, "global_step": 107370, "epoch": 2556} {"train_loss": -6.504462242126465, "global_step": 107371, "epoch": 2556} {"train_loss": -6.403922080993652, "global_step": 107372, "epoch": 2556} {"train_loss": -6.54527473449707, "global_step": 107373, "epoch": 2556} {"train_loss": -6.495277404785156, "global_step": 107374, "epoch": 2556} {"train_loss": -6.402021884918213, "global_step": 107375, "epoch": 2556} {"train_loss": -6.384723663330078, "global_step": 107376, "epoch": 2556} {"train_loss": -6.377999305725098, "global_step": 107377, "epoch": 2556} {"train_loss": -6.34682559967041, "global_step": 107378, "epoch": 2556} {"train_loss": -6.295108795166016, "global_step": 107379, "epoch": 2556} {"train_loss": -6.52333402633667, "global_step": 107380, "epoch": 2556} {"train_loss": -6.485123157501221, "global_step": 107381, "epoch": 2556} {"train_loss": -6.386120319366455, "global_step": 107382, "epoch": 2556} {"train_loss": -6.5453081130981445, "global_step": 107383, "epoch": 2556} {"train_loss": -6.509438514709473, "global_step": 107384, "epoch": 2556} {"train_loss": -6.386807441711426, "global_step": 107385, "epoch": 2556} {"train_loss": -6.358207702636719, "global_step": 107386, "epoch": 2556} {"train_loss": -6.557226181030273, "global_step": 107387, "epoch": 2556} {"train_loss": -6.366960525512695, "global_step": 107388, "epoch": 2556} {"train_loss": -6.445919036865234, "global_step": 107389, "epoch": 2556} {"train_loss": -6.557572364807129, "global_step": 107390, "epoch": 2556} {"train_loss": -6.330421447753906, "global_step": 107391, "epoch": 2556} {"train_loss": -6.40559196472168, "global_step": 107392, "epoch": 2556} {"train_loss": -6.44743858064924, "global_step": 107393, "epoch": 2556, "val_loss": 76155.1875} {"train_loss": -6.53065299987793, "global_step": 107394, "epoch": 2557} {"train_loss": -6.499446868896484, "global_step": 107395, "epoch": 2557} {"train_loss": -6.394824028015137, "global_step": 107396, "epoch": 2557} {"train_loss": -6.4915008544921875, "global_step": 107397, "epoch": 2557} {"train_loss": -6.509537220001221, "global_step": 107398, "epoch": 2557} {"train_loss": -6.380210876464844, "global_step": 107399, "epoch": 2557} {"train_loss": -6.446403503417969, "global_step": 107400, "epoch": 2557} {"train_loss": -6.5258708000183105, "global_step": 107401, "epoch": 2557} {"train_loss": -6.523606300354004, "global_step": 107402, "epoch": 2557} {"train_loss": -6.490052223205566, "global_step": 107403, "epoch": 2557} {"train_loss": -6.460926055908203, "global_step": 107404, "epoch": 2557} {"train_loss": -6.540462493896484, "global_step": 107405, "epoch": 2557} {"train_loss": -6.47553825378418, "global_step": 107406, "epoch": 2557} {"train_loss": -6.515318870544434, "global_step": 107407, "epoch": 2557} {"train_loss": -6.3930816650390625, "global_step": 107408, "epoch": 2557} {"train_loss": -6.507706642150879, "global_step": 107409, "epoch": 2557} {"train_loss": -6.510336399078369, "global_step": 107410, "epoch": 2557} {"train_loss": -6.571555137634277, "global_step": 107411, "epoch": 2557} {"train_loss": -6.39310884475708, "global_step": 107412, "epoch": 2557} {"train_loss": -6.46469259262085, "global_step": 107413, "epoch": 2557} {"train_loss": -6.486138343811035, "global_step": 107414, "epoch": 2557} {"train_loss": -6.393806457519531, "global_step": 107415, "epoch": 2557} {"train_loss": -6.458083152770996, "global_step": 107416, "epoch": 2557} {"train_loss": -6.613923072814941, "global_step": 107417, "epoch": 2557} {"train_loss": -6.46720027923584, "global_step": 107418, "epoch": 2557} {"train_loss": -6.490133285522461, "global_step": 107419, "epoch": 2557} {"train_loss": -6.422543048858643, "global_step": 107420, "epoch": 2557} {"train_loss": -6.363636016845703, "global_step": 107421, "epoch": 2557} {"train_loss": -6.360415458679199, "global_step": 107422, "epoch": 2557} {"train_loss": -6.356947898864746, "global_step": 107423, "epoch": 2557} {"train_loss": -6.456219673156738, "global_step": 107424, "epoch": 2557} {"train_loss": -6.474560737609863, "global_step": 107425, "epoch": 2557} {"train_loss": -6.28311824798584, "global_step": 107426, "epoch": 2557} {"train_loss": -6.449357032775879, "global_step": 107427, "epoch": 2557} {"train_loss": -6.274989128112793, "global_step": 107428, "epoch": 2557} {"train_loss": -6.365190505981445, "global_step": 107429, "epoch": 2557} {"train_loss": -6.336119174957275, "global_step": 107430, "epoch": 2557} {"train_loss": -6.437191963195801, "global_step": 107431, "epoch": 2557} {"train_loss": -6.378439903259277, "global_step": 107432, "epoch": 2557} {"train_loss": -6.487331390380859, "global_step": 107433, "epoch": 2557} {"train_loss": -6.501776695251465, "global_step": 107434, "epoch": 2557} {"train_loss": -6.454069058100383, "global_step": 107435, "epoch": 2557, "val_loss": 76123.4453125} {"train_loss": -6.441084384918213, "global_step": 107436, "epoch": 2558} {"train_loss": -6.352925777435303, "global_step": 107437, "epoch": 2558} {"train_loss": -6.384735107421875, "global_step": 107438, "epoch": 2558} {"train_loss": -6.325546741485596, "global_step": 107439, "epoch": 2558} {"train_loss": -6.421044826507568, "global_step": 107440, "epoch": 2558} {"train_loss": -6.5028228759765625, "global_step": 107441, "epoch": 2558} {"train_loss": -6.455519676208496, "global_step": 107442, "epoch": 2558} {"train_loss": -6.514793395996094, "global_step": 107443, "epoch": 2558} {"train_loss": -6.4307708740234375, "global_step": 107444, "epoch": 2558} {"train_loss": -6.420441627502441, "global_step": 107445, "epoch": 2558} {"train_loss": -6.364925861358643, "global_step": 107446, "epoch": 2558} {"train_loss": -6.510032653808594, "global_step": 107447, "epoch": 2558} {"train_loss": -6.467339038848877, "global_step": 107448, "epoch": 2558} {"train_loss": -6.504383087158203, "global_step": 107449, "epoch": 2558} {"train_loss": -6.515791893005371, "global_step": 107450, "epoch": 2558} {"train_loss": -6.538609504699707, "global_step": 107451, "epoch": 2558} {"train_loss": -6.354165077209473, "global_step": 107452, "epoch": 2558} {"train_loss": -6.465166091918945, "global_step": 107453, "epoch": 2558} {"train_loss": -6.278379440307617, "global_step": 107454, "epoch": 2558} {"train_loss": -6.491970062255859, "global_step": 107455, "epoch": 2558} {"train_loss": -6.3311357498168945, "global_step": 107456, "epoch": 2558} {"train_loss": -6.397008895874023, "global_step": 107457, "epoch": 2558} {"train_loss": -6.566837787628174, "global_step": 107458, "epoch": 2558} {"train_loss": -6.436542510986328, "global_step": 107459, "epoch": 2558} {"train_loss": -6.380197525024414, "global_step": 107460, "epoch": 2558} {"train_loss": -6.386775493621826, "global_step": 107461, "epoch": 2558} {"train_loss": -6.397937774658203, "global_step": 107462, "epoch": 2558} {"train_loss": -6.472459316253662, "global_step": 107463, "epoch": 2558} {"train_loss": -6.426731109619141, "global_step": 107464, "epoch": 2558} {"train_loss": -6.349246025085449, "global_step": 107465, "epoch": 2558} {"train_loss": -6.32846736907959, "global_step": 107466, "epoch": 2558} {"train_loss": -6.35821008682251, "global_step": 107467, "epoch": 2558} {"train_loss": -6.397418975830078, "global_step": 107468, "epoch": 2558} {"train_loss": -6.356481075286865, "global_step": 107469, "epoch": 2558} {"train_loss": -6.250267028808594, "global_step": 107470, "epoch": 2558} {"train_loss": -6.451721668243408, "global_step": 107471, "epoch": 2558} {"train_loss": -6.316102027893066, "global_step": 107472, "epoch": 2558} {"train_loss": -6.401493549346924, "global_step": 107473, "epoch": 2558} {"train_loss": -6.29327392578125, "global_step": 107474, "epoch": 2558} {"train_loss": -6.425230979919434, "global_step": 107475, "epoch": 2558} {"train_loss": -6.4781365394592285, "global_step": 107476, "epoch": 2558} {"train_loss": -6.410947981334868, "global_step": 107477, "epoch": 2558, "val_loss": 75792.1015625} {"train_loss": -6.349883079528809, "global_step": 107478, "epoch": 2559} {"train_loss": -6.4205169677734375, "global_step": 107479, "epoch": 2559} {"train_loss": -6.456269264221191, "global_step": 107480, "epoch": 2559} {"train_loss": -6.427874565124512, "global_step": 107481, "epoch": 2559} {"train_loss": -6.428868293762207, "global_step": 107482, "epoch": 2559} {"train_loss": -6.459690093994141, "global_step": 107483, "epoch": 2559} {"train_loss": -6.463369846343994, "global_step": 107484, "epoch": 2559} {"train_loss": -6.422875881195068, "global_step": 107485, "epoch": 2559} {"train_loss": -6.5319976806640625, "global_step": 107486, "epoch": 2559} {"train_loss": -6.497926712036133, "global_step": 107487, "epoch": 2559} {"train_loss": -6.332056999206543, "global_step": 107488, "epoch": 2559} {"train_loss": -6.412082672119141, "global_step": 107489, "epoch": 2559} {"train_loss": -6.369294166564941, "global_step": 107490, "epoch": 2559} {"train_loss": -6.450264930725098, "global_step": 107491, "epoch": 2559} {"train_loss": -6.409120082855225, "global_step": 107492, "epoch": 2559} {"train_loss": -6.340364456176758, "global_step": 107493, "epoch": 2559} {"train_loss": -6.506381988525391, "global_step": 107494, "epoch": 2559} {"train_loss": -6.401958465576172, "global_step": 107495, "epoch": 2559} {"train_loss": -6.49896240234375, "global_step": 107496, "epoch": 2559} {"train_loss": -6.206533432006836, "global_step": 107497, "epoch": 2559} {"train_loss": -6.435235977172852, "global_step": 107498, "epoch": 2559} {"train_loss": -6.4990410804748535, "global_step": 107499, "epoch": 2559} {"train_loss": -6.433242321014404, "global_step": 107500, "epoch": 2559} {"train_loss": -6.342817306518555, "global_step": 107501, "epoch": 2559} {"train_loss": -6.438098907470703, "global_step": 107502, "epoch": 2559} {"train_loss": -6.430714130401611, "global_step": 107503, "epoch": 2559} {"train_loss": -6.359081745147705, "global_step": 107504, "epoch": 2559} {"train_loss": -6.416533470153809, "global_step": 107505, "epoch": 2559} {"train_loss": -6.402949333190918, "global_step": 107506, "epoch": 2559} {"train_loss": -6.400927543640137, "global_step": 107507, "epoch": 2559} {"train_loss": -6.393435955047607, "global_step": 107508, "epoch": 2559} {"train_loss": -6.548254013061523, "global_step": 107509, "epoch": 2559} {"train_loss": -6.496737003326416, "global_step": 107510, "epoch": 2559} {"train_loss": -6.313073635101318, "global_step": 107511, "epoch": 2559} {"train_loss": -6.4011549949646, "global_step": 107512, "epoch": 2559} {"train_loss": -6.420999050140381, "global_step": 107513, "epoch": 2559} {"train_loss": -6.431681156158447, "global_step": 107514, "epoch": 2559} {"train_loss": -6.451517105102539, "global_step": 107515, "epoch": 2559} {"train_loss": -6.358397483825684, "global_step": 107516, "epoch": 2559} {"train_loss": -6.346673965454102, "global_step": 107517, "epoch": 2559} {"train_loss": -6.362434387207031, "global_step": 107518, "epoch": 2559} {"train_loss": -6.414747204099383, "global_step": 107519, "epoch": 2559, "val_loss": 76387.8046875} {"train_loss": -6.355917453765869, "global_step": 107520, "epoch": 2560} {"train_loss": -6.3145222663879395, "global_step": 107521, "epoch": 2560} {"train_loss": -6.4201860427856445, "global_step": 107522, "epoch": 2560} {"train_loss": -6.403408050537109, "global_step": 107523, "epoch": 2560} {"train_loss": -6.472975730895996, "global_step": 107524, "epoch": 2560} {"train_loss": -6.369495391845703, "global_step": 107525, "epoch": 2560} {"train_loss": -6.417445182800293, "global_step": 107526, "epoch": 2560} {"train_loss": -6.490246772766113, "global_step": 107527, "epoch": 2560} {"train_loss": -6.370170593261719, "global_step": 107528, "epoch": 2560} {"train_loss": -6.468541145324707, "global_step": 107529, "epoch": 2560} {"train_loss": -6.265688896179199, "global_step": 107530, "epoch": 2560} {"train_loss": -6.463242530822754, "global_step": 107531, "epoch": 2560} {"train_loss": -6.440822601318359, "global_step": 107532, "epoch": 2560} {"train_loss": -6.482419490814209, "global_step": 107533, "epoch": 2560} {"train_loss": -6.394073486328125, "global_step": 107534, "epoch": 2560} {"train_loss": -6.464461326599121, "global_step": 107535, "epoch": 2560} {"train_loss": -6.463630676269531, "global_step": 107536, "epoch": 2560} {"train_loss": -6.48848819732666, "global_step": 107537, "epoch": 2560} {"train_loss": -6.384548664093018, "global_step": 107538, "epoch": 2560} {"train_loss": -6.352834701538086, "global_step": 107539, "epoch": 2560} {"train_loss": -6.493885040283203, "global_step": 107540, "epoch": 2560} {"train_loss": -6.332981109619141, "global_step": 107541, "epoch": 2560} {"train_loss": -6.411383152008057, "global_step": 107542, "epoch": 2560} {"train_loss": -6.490850925445557, "global_step": 107543, "epoch": 2560} {"train_loss": -6.542966842651367, "global_step": 107544, "epoch": 2560} {"train_loss": -6.403469562530518, "global_step": 107545, "epoch": 2560} {"train_loss": -6.4045915603637695, "global_step": 107546, "epoch": 2560} {"train_loss": -6.525494575500488, "global_step": 107547, "epoch": 2560} {"train_loss": -6.507093906402588, "global_step": 107548, "epoch": 2560} {"train_loss": -6.516275405883789, "global_step": 107549, "epoch": 2560} {"train_loss": -6.473534107208252, "global_step": 107550, "epoch": 2560} {"train_loss": -6.468992233276367, "global_step": 107551, "epoch": 2560} {"train_loss": -6.537548065185547, "global_step": 107552, "epoch": 2560} {"train_loss": -6.3213701248168945, "global_step": 107553, "epoch": 2560} {"train_loss": -6.4896240234375, "global_step": 107554, "epoch": 2560} {"train_loss": -6.3327836990356445, "global_step": 107555, "epoch": 2560} {"train_loss": -6.512454986572266, "global_step": 107556, "epoch": 2560} {"train_loss": -6.427485942840576, "global_step": 107557, "epoch": 2560} {"train_loss": -6.275880813598633, "global_step": 107558, "epoch": 2560} {"train_loss": -6.466768264770508, "global_step": 107559, "epoch": 2560} {"train_loss": -6.430915832519531, "global_step": 107560, "epoch": 2560} {"train_loss": -6.434315851756504, "global_step": 107561, "epoch": 2560, "val_loss": 76294.53125} {"train_loss": -6.386767387390137, "global_step": 107562, "epoch": 2561} {"train_loss": -6.462696075439453, "global_step": 107563, "epoch": 2561} {"train_loss": -6.487443923950195, "global_step": 107564, "epoch": 2561} {"train_loss": -6.488496780395508, "global_step": 107565, "epoch": 2561} {"train_loss": -6.507819175720215, "global_step": 107566, "epoch": 2561} {"train_loss": -6.56151008605957, "global_step": 107567, "epoch": 2561} {"train_loss": -6.5516462326049805, "global_step": 107568, "epoch": 2561} {"train_loss": -6.449925422668457, "global_step": 107569, "epoch": 2561} {"train_loss": -6.440312385559082, "global_step": 107570, "epoch": 2561} {"train_loss": -6.475736618041992, "global_step": 107571, "epoch": 2561} {"train_loss": -6.560872554779053, "global_step": 107572, "epoch": 2561} {"train_loss": -6.393156051635742, "global_step": 107573, "epoch": 2561} {"train_loss": -6.484011650085449, "global_step": 107574, "epoch": 2561} {"train_loss": -6.586359024047852, "global_step": 107575, "epoch": 2561} {"train_loss": -6.496500015258789, "global_step": 107576, "epoch": 2561} {"train_loss": -6.402632713317871, "global_step": 107577, "epoch": 2561} {"train_loss": -6.355750560760498, "global_step": 107578, "epoch": 2561} {"train_loss": -6.515429973602295, "global_step": 107579, "epoch": 2561} {"train_loss": -6.423696994781494, "global_step": 107580, "epoch": 2561} {"train_loss": -6.5023956298828125, "global_step": 107581, "epoch": 2561} {"train_loss": -6.415320873260498, "global_step": 107582, "epoch": 2561} {"train_loss": -6.4824066162109375, "global_step": 107583, "epoch": 2561} {"train_loss": -6.4673871994018555, "global_step": 107584, "epoch": 2561} {"train_loss": -6.455728054046631, "global_step": 107585, "epoch": 2561} {"train_loss": -6.355016231536865, "global_step": 107586, "epoch": 2561} {"train_loss": -6.423504829406738, "global_step": 107587, "epoch": 2561} {"train_loss": -6.332752227783203, "global_step": 107588, "epoch": 2561} {"train_loss": -6.299622535705566, "global_step": 107589, "epoch": 2561} {"train_loss": -6.089685916900635, "global_step": 107590, "epoch": 2561} {"train_loss": -6.482907772064209, "global_step": 107591, "epoch": 2561} {"train_loss": -6.022782325744629, "global_step": 107592, "epoch": 2561} {"train_loss": -6.3495073318481445, "global_step": 107593, "epoch": 2561} {"train_loss": -6.118377685546875, "global_step": 107594, "epoch": 2561} {"train_loss": -6.420325756072998, "global_step": 107595, "epoch": 2561} {"train_loss": -6.167946815490723, "global_step": 107596, "epoch": 2561} {"train_loss": -6.372654914855957, "global_step": 107597, "epoch": 2561} {"train_loss": -6.257171630859375, "global_step": 107598, "epoch": 2561} {"train_loss": -6.428165435791016, "global_step": 107599, "epoch": 2561} {"train_loss": -6.4158430099487305, "global_step": 107600, "epoch": 2561} {"train_loss": -6.461350440979004, "global_step": 107601, "epoch": 2561} {"train_loss": -6.313530445098877, "global_step": 107602, "epoch": 2561} {"train_loss": -6.406631628672282, "global_step": 107603, "epoch": 2561, "val_loss": 76375.4375} {"train_loss": -6.5102081298828125, "global_step": 107604, "epoch": 2562} {"train_loss": -6.462580680847168, "global_step": 107605, "epoch": 2562} {"train_loss": -6.3965864181518555, "global_step": 107606, "epoch": 2562} {"train_loss": -6.408115386962891, "global_step": 107607, "epoch": 2562} {"train_loss": -6.493459701538086, "global_step": 107608, "epoch": 2562} {"train_loss": -6.462031364440918, "global_step": 107609, "epoch": 2562} {"train_loss": -6.358234405517578, "global_step": 107610, "epoch": 2562} {"train_loss": -6.415231227874756, "global_step": 107611, "epoch": 2562} {"train_loss": -6.307521820068359, "global_step": 107612, "epoch": 2562} {"train_loss": -6.440277099609375, "global_step": 107613, "epoch": 2562} {"train_loss": -6.600236892700195, "global_step": 107614, "epoch": 2562} {"train_loss": -6.306461334228516, "global_step": 107615, "epoch": 2562} {"train_loss": -6.465051651000977, "global_step": 107616, "epoch": 2562} {"train_loss": -6.449672698974609, "global_step": 107617, "epoch": 2562} {"train_loss": -6.466753959655762, "global_step": 107618, "epoch": 2562} {"train_loss": -6.466681480407715, "global_step": 107619, "epoch": 2562} {"train_loss": -6.38744592666626, "global_step": 107620, "epoch": 2562} {"train_loss": -6.356174468994141, "global_step": 107621, "epoch": 2562} {"train_loss": -6.477450370788574, "global_step": 107622, "epoch": 2562} {"train_loss": -6.458734512329102, "global_step": 107623, "epoch": 2562} {"train_loss": -6.494902610778809, "global_step": 107624, "epoch": 2562} {"train_loss": -6.372428894042969, "global_step": 107625, "epoch": 2562} {"train_loss": -6.449639320373535, "global_step": 107626, "epoch": 2562} {"train_loss": -6.463581085205078, "global_step": 107627, "epoch": 2562} {"train_loss": -6.4384846687316895, "global_step": 107628, "epoch": 2562} {"train_loss": -6.462132453918457, "global_step": 107629, "epoch": 2562} {"train_loss": -6.39530611038208, "global_step": 107630, "epoch": 2562} {"train_loss": -6.544835090637207, "global_step": 107631, "epoch": 2562} {"train_loss": -6.5116987228393555, "global_step": 107632, "epoch": 2562} {"train_loss": -6.3935441970825195, "global_step": 107633, "epoch": 2562} {"train_loss": -6.553249359130859, "global_step": 107634, "epoch": 2562} {"train_loss": -6.412801742553711, "global_step": 107635, "epoch": 2562} {"train_loss": -6.3715105056762695, "global_step": 107636, "epoch": 2562} {"train_loss": -6.473941802978516, "global_step": 107637, "epoch": 2562} {"train_loss": -6.417089462280273, "global_step": 107638, "epoch": 2562} {"train_loss": -6.457963943481445, "global_step": 107639, "epoch": 2562} {"train_loss": -6.508198261260986, "global_step": 107640, "epoch": 2562} {"train_loss": -6.247629165649414, "global_step": 107641, "epoch": 2562} {"train_loss": -6.252260684967041, "global_step": 107642, "epoch": 2562} {"train_loss": -6.4421563148498535, "global_step": 107643, "epoch": 2562} {"train_loss": -6.3573760986328125, "global_step": 107644, "epoch": 2562} {"train_loss": -6.4305328641619, "global_step": 107645, "epoch": 2562, "val_loss": 76247.3984375} {"train_loss": -6.497218132019043, "global_step": 107646, "epoch": 2563} {"train_loss": -6.334847927093506, "global_step": 107647, "epoch": 2563} {"train_loss": -6.432042121887207, "global_step": 107648, "epoch": 2563} {"train_loss": -6.426634788513184, "global_step": 107649, "epoch": 2563} {"train_loss": -6.558017253875732, "global_step": 107650, "epoch": 2563} {"train_loss": -6.474250793457031, "global_step": 107651, "epoch": 2563} {"train_loss": -6.309320449829102, "global_step": 107652, "epoch": 2563} {"train_loss": -6.395846366882324, "global_step": 107653, "epoch": 2563} {"train_loss": -6.481559753417969, "global_step": 107654, "epoch": 2563} {"train_loss": -6.420589447021484, "global_step": 107655, "epoch": 2563} {"train_loss": -6.535686016082764, "global_step": 107656, "epoch": 2563} {"train_loss": -6.429192543029785, "global_step": 107657, "epoch": 2563} {"train_loss": -6.457668304443359, "global_step": 107658, "epoch": 2563} {"train_loss": -6.392869472503662, "global_step": 107659, "epoch": 2563} {"train_loss": -6.312038421630859, "global_step": 107660, "epoch": 2563} {"train_loss": -6.4621357917785645, "global_step": 107661, "epoch": 2563} {"train_loss": -6.412650108337402, "global_step": 107662, "epoch": 2563} {"train_loss": -6.546929359436035, "global_step": 107663, "epoch": 2563} {"train_loss": -6.396317005157471, "global_step": 107664, "epoch": 2563} {"train_loss": -6.431815147399902, "global_step": 107665, "epoch": 2563} {"train_loss": -6.441843509674072, "global_step": 107666, "epoch": 2563} {"train_loss": -6.501377582550049, "global_step": 107667, "epoch": 2563} {"train_loss": -6.552029609680176, "global_step": 107668, "epoch": 2563} {"train_loss": -6.479161262512207, "global_step": 107669, "epoch": 2563} {"train_loss": -6.533487319946289, "global_step": 107670, "epoch": 2563} {"train_loss": -6.36026668548584, "global_step": 107671, "epoch": 2563} {"train_loss": -6.490575790405273, "global_step": 107672, "epoch": 2563} {"train_loss": -6.447673797607422, "global_step": 107673, "epoch": 2563} {"train_loss": -6.492673873901367, "global_step": 107674, "epoch": 2563} {"train_loss": -6.4163031578063965, "global_step": 107675, "epoch": 2563} {"train_loss": -6.443864822387695, "global_step": 107676, "epoch": 2563} {"train_loss": -6.382679462432861, "global_step": 107677, "epoch": 2563} {"train_loss": -6.448498249053955, "global_step": 107678, "epoch": 2563} {"train_loss": -6.458642959594727, "global_step": 107679, "epoch": 2563} {"train_loss": -6.47514533996582, "global_step": 107680, "epoch": 2563} {"train_loss": -6.477228164672852, "global_step": 107681, "epoch": 2563} {"train_loss": -6.398831367492676, "global_step": 107682, "epoch": 2563} {"train_loss": -6.347469329833984, "global_step": 107683, "epoch": 2563} {"train_loss": -6.480527400970459, "global_step": 107684, "epoch": 2563} {"train_loss": -6.403165817260742, "global_step": 107685, "epoch": 2563} {"train_loss": -6.411464691162109, "global_step": 107686, "epoch": 2563} {"train_loss": -6.443098352068946, "global_step": 107687, "epoch": 2563, "val_loss": 76321.1328125} {"train_loss": -6.505672931671143, "global_step": 107688, "epoch": 2564} {"train_loss": -6.464533805847168, "global_step": 107689, "epoch": 2564} {"train_loss": -6.505124568939209, "global_step": 107690, "epoch": 2564} {"train_loss": -6.538551330566406, "global_step": 107691, "epoch": 2564} {"train_loss": -6.429117679595947, "global_step": 107692, "epoch": 2564} {"train_loss": -6.483304023742676, "global_step": 107693, "epoch": 2564} {"train_loss": -6.396636009216309, "global_step": 107694, "epoch": 2564} {"train_loss": -6.394594669342041, "global_step": 107695, "epoch": 2564} {"train_loss": -6.512749671936035, "global_step": 107696, "epoch": 2564} {"train_loss": -6.327458381652832, "global_step": 107697, "epoch": 2564} {"train_loss": -6.526171684265137, "global_step": 107698, "epoch": 2564} {"train_loss": -6.42974853515625, "global_step": 107699, "epoch": 2564} {"train_loss": -6.536195755004883, "global_step": 107700, "epoch": 2564} {"train_loss": -6.301926612854004, "global_step": 107701, "epoch": 2564} {"train_loss": -6.52562141418457, "global_step": 107702, "epoch": 2564} {"train_loss": -6.471689224243164, "global_step": 107703, "epoch": 2564} {"train_loss": -6.316864967346191, "global_step": 107704, "epoch": 2564} {"train_loss": -6.576372146606445, "global_step": 107705, "epoch": 2564} {"train_loss": -6.4509968757629395, "global_step": 107706, "epoch": 2564} {"train_loss": -6.351492881774902, "global_step": 107707, "epoch": 2564} {"train_loss": -6.555624485015869, "global_step": 107708, "epoch": 2564} {"train_loss": -6.398096084594727, "global_step": 107709, "epoch": 2564} {"train_loss": -6.344264030456543, "global_step": 107710, "epoch": 2564} {"train_loss": -6.473705291748047, "global_step": 107711, "epoch": 2564} {"train_loss": -6.423697471618652, "global_step": 107712, "epoch": 2564} {"train_loss": -6.411593437194824, "global_step": 107713, "epoch": 2564} {"train_loss": -6.319310665130615, "global_step": 107714, "epoch": 2564} {"train_loss": -6.264623641967773, "global_step": 107715, "epoch": 2564} {"train_loss": -6.36200475692749, "global_step": 107716, "epoch": 2564} {"train_loss": -6.407810688018799, "global_step": 107717, "epoch": 2564} {"train_loss": -6.336348533630371, "global_step": 107718, "epoch": 2564} {"train_loss": -6.338281631469727, "global_step": 107719, "epoch": 2564} {"train_loss": -6.3096466064453125, "global_step": 107720, "epoch": 2564} {"train_loss": -6.387673377990723, "global_step": 107721, "epoch": 2564} {"train_loss": -6.301795959472656, "global_step": 107722, "epoch": 2564} {"train_loss": -6.383854866027832, "global_step": 107723, "epoch": 2564} {"train_loss": -6.307903289794922, "global_step": 107724, "epoch": 2564} {"train_loss": -6.450131416320801, "global_step": 107725, "epoch": 2564} {"train_loss": -6.358305931091309, "global_step": 107726, "epoch": 2564} {"train_loss": -6.240743637084961, "global_step": 107727, "epoch": 2564} {"train_loss": -6.4620208740234375, "global_step": 107728, "epoch": 2564} {"train_loss": -6.411093235015869, "global_step": 107729, "epoch": 2564, "val_loss": 76131.6875} {"train_loss": -6.505744457244873, "global_step": 107730, "epoch": 2565} {"train_loss": -6.354797840118408, "global_step": 107731, "epoch": 2565} {"train_loss": -6.438624382019043, "global_step": 107732, "epoch": 2565} {"train_loss": -6.3217549324035645, "global_step": 107733, "epoch": 2565} {"train_loss": -6.420646667480469, "global_step": 107734, "epoch": 2565} {"train_loss": -6.43927001953125, "global_step": 107735, "epoch": 2565} {"train_loss": -6.414812088012695, "global_step": 107736, "epoch": 2565} {"train_loss": -6.423151016235352, "global_step": 107737, "epoch": 2565} {"train_loss": -6.410951614379883, "global_step": 107738, "epoch": 2565} {"train_loss": -6.493141174316406, "global_step": 107739, "epoch": 2565} {"train_loss": -6.348178863525391, "global_step": 107740, "epoch": 2565} {"train_loss": -6.313271522521973, "global_step": 107741, "epoch": 2565} {"train_loss": -6.516704559326172, "global_step": 107742, "epoch": 2565} {"train_loss": -6.428997039794922, "global_step": 107743, "epoch": 2565} {"train_loss": -6.323924541473389, "global_step": 107744, "epoch": 2565} {"train_loss": -6.4316558837890625, "global_step": 107745, "epoch": 2565} {"train_loss": -6.338163375854492, "global_step": 107746, "epoch": 2565} {"train_loss": -6.350057601928711, "global_step": 107747, "epoch": 2565} {"train_loss": -6.499973297119141, "global_step": 107748, "epoch": 2565} {"train_loss": -6.307324409484863, "global_step": 107749, "epoch": 2565} {"train_loss": -6.319292068481445, "global_step": 107750, "epoch": 2565} {"train_loss": -6.410976409912109, "global_step": 107751, "epoch": 2565} {"train_loss": -6.440186500549316, "global_step": 107752, "epoch": 2565} {"train_loss": -6.475961685180664, "global_step": 107753, "epoch": 2565} {"train_loss": -6.471177101135254, "global_step": 107754, "epoch": 2565} {"train_loss": -6.4004621505737305, "global_step": 107755, "epoch": 2565} {"train_loss": -6.511897563934326, "global_step": 107756, "epoch": 2565} {"train_loss": -6.371331214904785, "global_step": 107757, "epoch": 2565} {"train_loss": -6.426078796386719, "global_step": 107758, "epoch": 2565} {"train_loss": -6.382870674133301, "global_step": 107759, "epoch": 2565} {"train_loss": -6.453340530395508, "global_step": 107760, "epoch": 2565} {"train_loss": -6.507349014282227, "global_step": 107761, "epoch": 2565} {"train_loss": -6.545724868774414, "global_step": 107762, "epoch": 2565} {"train_loss": -6.329544544219971, "global_step": 107763, "epoch": 2565} {"train_loss": -6.530003070831299, "global_step": 107764, "epoch": 2565} {"train_loss": -6.44255256652832, "global_step": 107765, "epoch": 2565} {"train_loss": -6.484116554260254, "global_step": 107766, "epoch": 2565} {"train_loss": -6.426790237426758, "global_step": 107767, "epoch": 2565} {"train_loss": -6.485708236694336, "global_step": 107768, "epoch": 2565} {"train_loss": -6.521029472351074, "global_step": 107769, "epoch": 2565} {"train_loss": -6.50755500793457, "global_step": 107770, "epoch": 2565} {"train_loss": -6.428947664442516, "global_step": 107771, "epoch": 2565, "val_loss": 76080.7265625} {"train_loss": -6.555058479309082, "global_step": 107772, "epoch": 2566} {"train_loss": -6.505670070648193, "global_step": 107773, "epoch": 2566} {"train_loss": -6.471933364868164, "global_step": 107774, "epoch": 2566} {"train_loss": -6.499578475952148, "global_step": 107775, "epoch": 2566} {"train_loss": -6.558102607727051, "global_step": 107776, "epoch": 2566} {"train_loss": -6.475794792175293, "global_step": 107777, "epoch": 2566} {"train_loss": -6.460522651672363, "global_step": 107778, "epoch": 2566} {"train_loss": -6.588808536529541, "global_step": 107779, "epoch": 2566} {"train_loss": -6.549348831176758, "global_step": 107780, "epoch": 2566} {"train_loss": -6.365610599517822, "global_step": 107781, "epoch": 2566} {"train_loss": -6.455601692199707, "global_step": 107782, "epoch": 2566} {"train_loss": -6.526326656341553, "global_step": 107783, "epoch": 2566} {"train_loss": -6.459000587463379, "global_step": 107784, "epoch": 2566} {"train_loss": -6.501941680908203, "global_step": 107785, "epoch": 2566} {"train_loss": -6.499467372894287, "global_step": 107786, "epoch": 2566} {"train_loss": -6.516770362854004, "global_step": 107787, "epoch": 2566} {"train_loss": -6.558513641357422, "global_step": 107788, "epoch": 2566} {"train_loss": -6.449742317199707, "global_step": 107789, "epoch": 2566} {"train_loss": -6.420154571533203, "global_step": 107790, "epoch": 2566} {"train_loss": -6.450687408447266, "global_step": 107791, "epoch": 2566} {"train_loss": -6.554308891296387, "global_step": 107792, "epoch": 2566} {"train_loss": -6.403848171234131, "global_step": 107793, "epoch": 2566} {"train_loss": -6.426668167114258, "global_step": 107794, "epoch": 2566} {"train_loss": -6.468898773193359, "global_step": 107795, "epoch": 2566} {"train_loss": -6.4548139572143555, "global_step": 107796, "epoch": 2566} {"train_loss": -6.212885856628418, "global_step": 107797, "epoch": 2566} {"train_loss": -6.477729797363281, "global_step": 107798, "epoch": 2566} {"train_loss": -6.485996723175049, "global_step": 107799, "epoch": 2566} {"train_loss": -6.3870015144348145, "global_step": 107800, "epoch": 2566} {"train_loss": -6.351151466369629, "global_step": 107801, "epoch": 2566} {"train_loss": -6.373262405395508, "global_step": 107802, "epoch": 2566} {"train_loss": -6.373070240020752, "global_step": 107803, "epoch": 2566} {"train_loss": -6.4595489501953125, "global_step": 107804, "epoch": 2566} {"train_loss": -6.394033432006836, "global_step": 107805, "epoch": 2566} {"train_loss": -6.410325050354004, "global_step": 107806, "epoch": 2566} {"train_loss": -6.346695423126221, "global_step": 107807, "epoch": 2566} {"train_loss": -6.386989593505859, "global_step": 107808, "epoch": 2566} {"train_loss": -6.321355819702148, "global_step": 107809, "epoch": 2566} {"train_loss": -6.530229568481445, "global_step": 107810, "epoch": 2566} {"train_loss": -6.4777679443359375, "global_step": 107811, "epoch": 2566} {"train_loss": -6.504384994506836, "global_step": 107812, "epoch": 2566} {"train_loss": -6.454213539759318, "global_step": 107813, "epoch": 2566, "val_loss": 75961.828125} {"train_loss": -6.463199138641357, "global_step": 107814, "epoch": 2567} {"train_loss": -6.458673000335693, "global_step": 107815, "epoch": 2567} {"train_loss": -6.359587669372559, "global_step": 107816, "epoch": 2567} {"train_loss": -6.454151153564453, "global_step": 107817, "epoch": 2567} {"train_loss": -6.3423895835876465, "global_step": 107818, "epoch": 2567} {"train_loss": -6.445365905761719, "global_step": 107819, "epoch": 2567} {"train_loss": -6.413434028625488, "global_step": 107820, "epoch": 2567} {"train_loss": -6.408220291137695, "global_step": 107821, "epoch": 2567} {"train_loss": -6.430743217468262, "global_step": 107822, "epoch": 2567} {"train_loss": -6.411442756652832, "global_step": 107823, "epoch": 2567} {"train_loss": -6.303326606750488, "global_step": 107824, "epoch": 2567} {"train_loss": -6.449048042297363, "global_step": 107825, "epoch": 2567} {"train_loss": -6.4633917808532715, "global_step": 107826, "epoch": 2567} {"train_loss": -6.4102888107299805, "global_step": 107827, "epoch": 2567} {"train_loss": -6.428389549255371, "global_step": 107828, "epoch": 2567} {"train_loss": -6.439643383026123, "global_step": 107829, "epoch": 2567} {"train_loss": -6.389827728271484, "global_step": 107830, "epoch": 2567} {"train_loss": -6.515435218811035, "global_step": 107831, "epoch": 2567} {"train_loss": -6.363105297088623, "global_step": 107832, "epoch": 2567} {"train_loss": -6.481009483337402, "global_step": 107833, "epoch": 2567} {"train_loss": -6.43931770324707, "global_step": 107834, "epoch": 2567} {"train_loss": -6.309806823730469, "global_step": 107835, "epoch": 2567} {"train_loss": -6.318058490753174, "global_step": 107836, "epoch": 2567} {"train_loss": -6.402751445770264, "global_step": 107837, "epoch": 2567} {"train_loss": -6.241940021514893, "global_step": 107838, "epoch": 2567} {"train_loss": -6.36716365814209, "global_step": 107839, "epoch": 2567} {"train_loss": -6.331028461456299, "global_step": 107840, "epoch": 2567} {"train_loss": -6.387968063354492, "global_step": 107841, "epoch": 2567} {"train_loss": -6.342859268188477, "global_step": 107842, "epoch": 2567} {"train_loss": -6.572140693664551, "global_step": 107843, "epoch": 2567} {"train_loss": -6.446780204772949, "global_step": 107844, "epoch": 2567} {"train_loss": -6.388581275939941, "global_step": 107845, "epoch": 2567} {"train_loss": -6.47064208984375, "global_step": 107846, "epoch": 2567} {"train_loss": -6.466560363769531, "global_step": 107847, "epoch": 2567} {"train_loss": -6.361507415771484, "global_step": 107848, "epoch": 2567} {"train_loss": -6.438909530639648, "global_step": 107849, "epoch": 2567} {"train_loss": -6.360550880432129, "global_step": 107850, "epoch": 2567} {"train_loss": -6.579652309417725, "global_step": 107851, "epoch": 2567} {"train_loss": -6.397076606750488, "global_step": 107852, "epoch": 2567} {"train_loss": -6.420804977416992, "global_step": 107853, "epoch": 2567} {"train_loss": -6.474814414978027, "global_step": 107854, "epoch": 2567} {"train_loss": -6.418250197455997, "global_step": 107855, "epoch": 2567, "val_loss": 75856.96875} {"train_loss": -6.43488883972168, "global_step": 107856, "epoch": 2568} {"train_loss": -6.544790267944336, "global_step": 107857, "epoch": 2568} {"train_loss": -6.429405689239502, "global_step": 107858, "epoch": 2568} {"train_loss": -6.4124274253845215, "global_step": 107859, "epoch": 2568} {"train_loss": -6.408069610595703, "global_step": 107860, "epoch": 2568} {"train_loss": -6.45863151550293, "global_step": 107861, "epoch": 2568} {"train_loss": -6.508026599884033, "global_step": 107862, "epoch": 2568} {"train_loss": -6.463548183441162, "global_step": 107863, "epoch": 2568} {"train_loss": -6.5201239585876465, "global_step": 107864, "epoch": 2568} {"train_loss": -6.4169020652771, "global_step": 107865, "epoch": 2568} {"train_loss": -6.468963146209717, "global_step": 107866, "epoch": 2568} {"train_loss": -6.368542194366455, "global_step": 107867, "epoch": 2568} {"train_loss": -6.462434768676758, "global_step": 107868, "epoch": 2568} {"train_loss": -6.525397777557373, "global_step": 107869, "epoch": 2568} {"train_loss": -6.508325576782227, "global_step": 107870, "epoch": 2568} {"train_loss": -6.425373077392578, "global_step": 107871, "epoch": 2568} {"train_loss": -6.4886884689331055, "global_step": 107872, "epoch": 2568} {"train_loss": -6.317593574523926, "global_step": 107873, "epoch": 2568} {"train_loss": -6.3613433837890625, "global_step": 107874, "epoch": 2568} {"train_loss": -6.493448257446289, "global_step": 107875, "epoch": 2568} {"train_loss": -6.328974723815918, "global_step": 107876, "epoch": 2568} {"train_loss": -6.576101303100586, "global_step": 107877, "epoch": 2568} {"train_loss": -6.536637306213379, "global_step": 107878, "epoch": 2568} {"train_loss": -6.394286155700684, "global_step": 107879, "epoch": 2568} {"train_loss": -6.348114967346191, "global_step": 107880, "epoch": 2568} {"train_loss": -6.503771781921387, "global_step": 107881, "epoch": 2568} {"train_loss": -6.441804885864258, "global_step": 107882, "epoch": 2568} {"train_loss": -6.4395599365234375, "global_step": 107883, "epoch": 2568} {"train_loss": -6.403075218200684, "global_step": 107884, "epoch": 2568} {"train_loss": -6.499416828155518, "global_step": 107885, "epoch": 2568} {"train_loss": -6.410151958465576, "global_step": 107886, "epoch": 2568} {"train_loss": -6.443751811981201, "global_step": 107887, "epoch": 2568} {"train_loss": -6.485857009887695, "global_step": 107888, "epoch": 2568} {"train_loss": -6.49819278717041, "global_step": 107889, "epoch": 2568} {"train_loss": -6.4968671798706055, "global_step": 107890, "epoch": 2568} {"train_loss": -6.497437000274658, "global_step": 107891, "epoch": 2568} {"train_loss": -6.406625747680664, "global_step": 107892, "epoch": 2568} {"train_loss": -6.55842924118042, "global_step": 107893, "epoch": 2568} {"train_loss": -6.475912094116211, "global_step": 107894, "epoch": 2568} {"train_loss": -6.440130233764648, "global_step": 107895, "epoch": 2568} {"train_loss": -6.530787467956543, "global_step": 107896, "epoch": 2568} {"train_loss": -6.454872506005423, "global_step": 107897, "epoch": 2568, "val_loss": 76004.0703125} {"train_loss": -6.481147766113281, "global_step": 107898, "epoch": 2569} {"train_loss": -6.521376609802246, "global_step": 107899, "epoch": 2569} {"train_loss": -6.354129791259766, "global_step": 107900, "epoch": 2569} {"train_loss": -6.510128498077393, "global_step": 107901, "epoch": 2569} {"train_loss": -6.306763648986816, "global_step": 107902, "epoch": 2569} {"train_loss": -6.497913360595703, "global_step": 107903, "epoch": 2569} {"train_loss": -6.362171173095703, "global_step": 107904, "epoch": 2569} {"train_loss": -6.249028205871582, "global_step": 107905, "epoch": 2569} {"train_loss": -6.464184761047363, "global_step": 107906, "epoch": 2569} {"train_loss": -6.224215507507324, "global_step": 107907, "epoch": 2569} {"train_loss": -6.350050926208496, "global_step": 107908, "epoch": 2569} {"train_loss": -6.433995246887207, "global_step": 107909, "epoch": 2569} {"train_loss": -6.464885234832764, "global_step": 107910, "epoch": 2569} {"train_loss": -6.476251125335693, "global_step": 107911, "epoch": 2569} {"train_loss": -6.309237480163574, "global_step": 107912, "epoch": 2569} {"train_loss": -6.491546630859375, "global_step": 107913, "epoch": 2569} {"train_loss": -6.218980312347412, "global_step": 107914, "epoch": 2569} {"train_loss": -6.390235424041748, "global_step": 107915, "epoch": 2569} {"train_loss": -6.441560745239258, "global_step": 107916, "epoch": 2569} {"train_loss": -6.3011980056762695, "global_step": 107917, "epoch": 2569} {"train_loss": -6.370906352996826, "global_step": 107918, "epoch": 2569} {"train_loss": -6.344335079193115, "global_step": 107919, "epoch": 2569} {"train_loss": -6.381521224975586, "global_step": 107920, "epoch": 2569} {"train_loss": -6.379463195800781, "global_step": 107921, "epoch": 2569} {"train_loss": -6.2794904708862305, "global_step": 107922, "epoch": 2569} {"train_loss": -6.501106262207031, "global_step": 107923, "epoch": 2569} {"train_loss": -6.51029109954834, "global_step": 107924, "epoch": 2569} {"train_loss": -6.288376808166504, "global_step": 107925, "epoch": 2569} {"train_loss": -6.5101189613342285, "global_step": 107926, "epoch": 2569} {"train_loss": -6.401339054107666, "global_step": 107927, "epoch": 2569} {"train_loss": -6.372501373291016, "global_step": 107928, "epoch": 2569} {"train_loss": -6.269835948944092, "global_step": 107929, "epoch": 2569} {"train_loss": -6.421478271484375, "global_step": 107930, "epoch": 2569} {"train_loss": -6.386228561401367, "global_step": 107931, "epoch": 2569} {"train_loss": -6.529858589172363, "global_step": 107932, "epoch": 2569} {"train_loss": -6.381450653076172, "global_step": 107933, "epoch": 2569} {"train_loss": -6.403709888458252, "global_step": 107934, "epoch": 2569} {"train_loss": -6.444920063018799, "global_step": 107935, "epoch": 2569} {"train_loss": -6.4695892333984375, "global_step": 107936, "epoch": 2569} {"train_loss": -6.40322732925415, "global_step": 107937, "epoch": 2569} {"train_loss": -6.429093837738037, "global_step": 107938, "epoch": 2569} {"train_loss": -6.400641384578886, "global_step": 107939, "epoch": 2569, "val_loss": 76219.5546875} {"train_loss": -6.5128374099731445, "global_step": 107940, "epoch": 2570} {"train_loss": -6.4322829246521, "global_step": 107941, "epoch": 2570} {"train_loss": -6.577068328857422, "global_step": 107942, "epoch": 2570} {"train_loss": -6.534841060638428, "global_step": 107943, "epoch": 2570} {"train_loss": -6.4760613441467285, "global_step": 107944, "epoch": 2570} {"train_loss": -6.421661376953125, "global_step": 107945, "epoch": 2570} {"train_loss": -6.541233062744141, "global_step": 107946, "epoch": 2570} {"train_loss": -6.384845733642578, "global_step": 107947, "epoch": 2570} {"train_loss": -6.434103965759277, "global_step": 107948, "epoch": 2570} {"train_loss": -6.515082836151123, "global_step": 107949, "epoch": 2570} {"train_loss": -6.446769714355469, "global_step": 107950, "epoch": 2570} {"train_loss": -6.506125450134277, "global_step": 107951, "epoch": 2570} {"train_loss": -6.445194244384766, "global_step": 107952, "epoch": 2570} {"train_loss": -6.3488054275512695, "global_step": 107953, "epoch": 2570} {"train_loss": -6.375467300415039, "global_step": 107954, "epoch": 2570} {"train_loss": -6.467572212219238, "global_step": 107955, "epoch": 2570} {"train_loss": -6.518588066101074, "global_step": 107956, "epoch": 2570} {"train_loss": -6.533947467803955, "global_step": 107957, "epoch": 2570} {"train_loss": -6.417052745819092, "global_step": 107958, "epoch": 2570} {"train_loss": -6.447741508483887, "global_step": 107959, "epoch": 2570} {"train_loss": -6.501107692718506, "global_step": 107960, "epoch": 2570} {"train_loss": -6.41281270980835, "global_step": 107961, "epoch": 2570} {"train_loss": -6.506265640258789, "global_step": 107962, "epoch": 2570} {"train_loss": -6.365461826324463, "global_step": 107963, "epoch": 2570} {"train_loss": -6.444944381713867, "global_step": 107964, "epoch": 2570} {"train_loss": -6.5468668937683105, "global_step": 107965, "epoch": 2570} {"train_loss": -6.483776569366455, "global_step": 107966, "epoch": 2570} {"train_loss": -6.442923069000244, "global_step": 107967, "epoch": 2570} {"train_loss": -6.451227188110352, "global_step": 107968, "epoch": 2570} {"train_loss": -6.338981628417969, "global_step": 107969, "epoch": 2570} {"train_loss": -6.352644920349121, "global_step": 107970, "epoch": 2570} {"train_loss": -6.441916465759277, "global_step": 107971, "epoch": 2570} {"train_loss": -6.269850730895996, "global_step": 107972, "epoch": 2570} {"train_loss": -6.4470534324646, "global_step": 107973, "epoch": 2570} {"train_loss": -6.348146438598633, "global_step": 107974, "epoch": 2570} {"train_loss": -6.255503177642822, "global_step": 107975, "epoch": 2570} {"train_loss": -6.370046615600586, "global_step": 107976, "epoch": 2570} {"train_loss": -6.3406782150268555, "global_step": 107977, "epoch": 2570} {"train_loss": -6.328642845153809, "global_step": 107978, "epoch": 2570} {"train_loss": -6.376803398132324, "global_step": 107979, "epoch": 2570} {"train_loss": -6.293124675750732, "global_step": 107980, "epoch": 2570} {"train_loss": -6.4275874978020076, "global_step": 107981, "epoch": 2570, "val_loss": 76386.5625} {"train_loss": -6.388090133666992, "global_step": 107982, "epoch": 2571} {"train_loss": -6.429293632507324, "global_step": 107983, "epoch": 2571} {"train_loss": -6.431339740753174, "global_step": 107984, "epoch": 2571} {"train_loss": -6.411500930786133, "global_step": 107985, "epoch": 2571} {"train_loss": -6.377805233001709, "global_step": 107986, "epoch": 2571} {"train_loss": -6.401039123535156, "global_step": 107987, "epoch": 2571} {"train_loss": -6.384176731109619, "global_step": 107988, "epoch": 2571} {"train_loss": -6.330413341522217, "global_step": 107989, "epoch": 2571} {"train_loss": -6.451828956604004, "global_step": 107990, "epoch": 2571} {"train_loss": -6.465025424957275, "global_step": 107991, "epoch": 2571} {"train_loss": -6.410059928894043, "global_step": 107992, "epoch": 2571} {"train_loss": -6.4126362800598145, "global_step": 107993, "epoch": 2571} {"train_loss": -6.544188499450684, "global_step": 107994, "epoch": 2571} {"train_loss": -6.360779762268066, "global_step": 107995, "epoch": 2571} {"train_loss": -6.474206924438477, "global_step": 107996, "epoch": 2571} {"train_loss": -6.412596702575684, "global_step": 107997, "epoch": 2571} {"train_loss": -6.369627475738525, "global_step": 107998, "epoch": 2571} {"train_loss": -6.452628135681152, "global_step": 107999, "epoch": 2571} {"train_loss": -6.422158241271973, "global_step": 108000, "epoch": 2571} {"train_loss": -6.442681312561035, "global_step": 108001, "epoch": 2571} {"train_loss": -6.335546016693115, "global_step": 108002, "epoch": 2571} {"train_loss": -6.391939163208008, "global_step": 108003, "epoch": 2571} {"train_loss": -6.354465007781982, "global_step": 108004, "epoch": 2571} {"train_loss": -6.506309509277344, "global_step": 108005, "epoch": 2571} {"train_loss": -6.319554328918457, "global_step": 108006, "epoch": 2571} {"train_loss": -6.348352432250977, "global_step": 108007, "epoch": 2571} {"train_loss": -6.339285850524902, "global_step": 108008, "epoch": 2571} {"train_loss": -6.450677394866943, "global_step": 108009, "epoch": 2571} {"train_loss": -6.369565010070801, "global_step": 108010, "epoch": 2571} {"train_loss": -6.3194122314453125, "global_step": 108011, "epoch": 2571} {"train_loss": -6.396027565002441, "global_step": 108012, "epoch": 2571} {"train_loss": -6.368224143981934, "global_step": 108013, "epoch": 2571} {"train_loss": -6.463332653045654, "global_step": 108014, "epoch": 2571} {"train_loss": -6.425137519836426, "global_step": 108015, "epoch": 2571} {"train_loss": -6.305467128753662, "global_step": 108016, "epoch": 2571} {"train_loss": -6.475132942199707, "global_step": 108017, "epoch": 2571} {"train_loss": -6.335137367248535, "global_step": 108018, "epoch": 2571} {"train_loss": -6.497629165649414, "global_step": 108019, "epoch": 2571} {"train_loss": -6.361025810241699, "global_step": 108020, "epoch": 2571} {"train_loss": -6.554670333862305, "global_step": 108021, "epoch": 2571} {"train_loss": -6.473330497741699, "global_step": 108022, "epoch": 2571} {"train_loss": -6.409262407393682, "global_step": 108023, "epoch": 2571, "val_loss": 76031.125} {"train_loss": -6.375190734863281, "global_step": 108024, "epoch": 2572} {"train_loss": -6.578397750854492, "global_step": 108025, "epoch": 2572} {"train_loss": -6.4959635734558105, "global_step": 108026, "epoch": 2572} {"train_loss": -6.428509712219238, "global_step": 108027, "epoch": 2572} {"train_loss": -6.407588958740234, "global_step": 108028, "epoch": 2572} {"train_loss": -6.542087554931641, "global_step": 108029, "epoch": 2572} {"train_loss": -6.4677581787109375, "global_step": 108030, "epoch": 2572} {"train_loss": -6.4801435470581055, "global_step": 108031, "epoch": 2572} {"train_loss": -6.5340728759765625, "global_step": 108032, "epoch": 2572} {"train_loss": -6.407136917114258, "global_step": 108033, "epoch": 2572} {"train_loss": -6.44489860534668, "global_step": 108034, "epoch": 2572} {"train_loss": -6.373936653137207, "global_step": 108035, "epoch": 2572} {"train_loss": -6.408187389373779, "global_step": 108036, "epoch": 2572} {"train_loss": -6.452404975891113, "global_step": 108037, "epoch": 2572} {"train_loss": -6.468576431274414, "global_step": 108038, "epoch": 2572} {"train_loss": -6.39127254486084, "global_step": 108039, "epoch": 2572} {"train_loss": -6.4802327156066895, "global_step": 108040, "epoch": 2572} {"train_loss": -6.355471611022949, "global_step": 108041, "epoch": 2572} {"train_loss": -6.400732040405273, "global_step": 108042, "epoch": 2572} {"train_loss": -6.467044830322266, "global_step": 108043, "epoch": 2572} {"train_loss": -6.510644912719727, "global_step": 108044, "epoch": 2572} {"train_loss": -6.38476037979126, "global_step": 108045, "epoch": 2572} {"train_loss": -6.481832981109619, "global_step": 108046, "epoch": 2572} {"train_loss": -6.495230674743652, "global_step": 108047, "epoch": 2572} {"train_loss": -6.302568435668945, "global_step": 108048, "epoch": 2572} {"train_loss": -6.3496503829956055, "global_step": 108049, "epoch": 2572} {"train_loss": -6.320429801940918, "global_step": 108050, "epoch": 2572} {"train_loss": -6.323910713195801, "global_step": 108051, "epoch": 2572} {"train_loss": -6.5054612159729, "global_step": 108052, "epoch": 2572} {"train_loss": -6.3536152839660645, "global_step": 108053, "epoch": 2572} {"train_loss": -6.408269882202148, "global_step": 108054, "epoch": 2572} {"train_loss": -6.38482141494751, "global_step": 108055, "epoch": 2572} {"train_loss": -6.322129249572754, "global_step": 108056, "epoch": 2572} {"train_loss": -6.365651607513428, "global_step": 108057, "epoch": 2572} {"train_loss": -6.3925557136535645, "global_step": 108058, "epoch": 2572} {"train_loss": -6.416007041931152, "global_step": 108059, "epoch": 2572} {"train_loss": -6.462832450866699, "global_step": 108060, "epoch": 2572} {"train_loss": -6.436283588409424, "global_step": 108061, "epoch": 2572} {"train_loss": -6.3666181564331055, "global_step": 108062, "epoch": 2572} {"train_loss": -6.488306045532227, "global_step": 108063, "epoch": 2572} {"train_loss": -6.383913516998291, "global_step": 108064, "epoch": 2572} {"train_loss": -6.426245655332293, "global_step": 108065, "epoch": 2572, "val_loss": 76317.1875} {"train_loss": -6.419626235961914, "global_step": 108066, "epoch": 2573} {"train_loss": -6.3470611572265625, "global_step": 108067, "epoch": 2573} {"train_loss": -6.4438581466674805, "global_step": 108068, "epoch": 2573} {"train_loss": -6.323686122894287, "global_step": 108069, "epoch": 2573} {"train_loss": -6.398739337921143, "global_step": 108070, "epoch": 2573} {"train_loss": -6.4261603355407715, "global_step": 108071, "epoch": 2573} {"train_loss": -6.403426170349121, "global_step": 108072, "epoch": 2573} {"train_loss": -6.440152168273926, "global_step": 108073, "epoch": 2573} {"train_loss": -6.488643646240234, "global_step": 108074, "epoch": 2573} {"train_loss": -6.409008979797363, "global_step": 108075, "epoch": 2573} {"train_loss": -6.401900291442871, "global_step": 108076, "epoch": 2573} {"train_loss": -6.451171875, "global_step": 108077, "epoch": 2573} {"train_loss": -6.412426948547363, "global_step": 108078, "epoch": 2573} {"train_loss": -6.387529373168945, "global_step": 108079, "epoch": 2573} {"train_loss": -6.304013252258301, "global_step": 108080, "epoch": 2573} {"train_loss": -6.384690284729004, "global_step": 108081, "epoch": 2573} {"train_loss": -6.375720977783203, "global_step": 108082, "epoch": 2573} {"train_loss": -6.398597717285156, "global_step": 108083, "epoch": 2573} {"train_loss": -6.41756010055542, "global_step": 108084, "epoch": 2573} {"train_loss": -6.39898681640625, "global_step": 108085, "epoch": 2573} {"train_loss": -6.382657051086426, "global_step": 108086, "epoch": 2573} {"train_loss": -6.322903633117676, "global_step": 108087, "epoch": 2573} {"train_loss": -6.416462421417236, "global_step": 108088, "epoch": 2573} {"train_loss": -6.3338623046875, "global_step": 108089, "epoch": 2573} {"train_loss": -6.314852237701416, "global_step": 108090, "epoch": 2573} {"train_loss": -6.415531635284424, "global_step": 108091, "epoch": 2573} {"train_loss": -6.278220176696777, "global_step": 108092, "epoch": 2573} {"train_loss": -6.267823219299316, "global_step": 108093, "epoch": 2573} {"train_loss": -6.344639778137207, "global_step": 108094, "epoch": 2573} {"train_loss": -6.330129146575928, "global_step": 108095, "epoch": 2573} {"train_loss": -6.390277862548828, "global_step": 108096, "epoch": 2573} {"train_loss": -6.404758453369141, "global_step": 108097, "epoch": 2573} {"train_loss": -6.273806571960449, "global_step": 108098, "epoch": 2573} {"train_loss": -6.428260803222656, "global_step": 108099, "epoch": 2573} {"train_loss": -6.496129035949707, "global_step": 108100, "epoch": 2573} {"train_loss": -6.377349853515625, "global_step": 108101, "epoch": 2573} {"train_loss": -6.473538875579834, "global_step": 108102, "epoch": 2573} {"train_loss": -6.526203155517578, "global_step": 108103, "epoch": 2573} {"train_loss": -6.518731117248535, "global_step": 108104, "epoch": 2573} {"train_loss": -6.344581604003906, "global_step": 108105, "epoch": 2573} {"train_loss": -6.394166946411133, "global_step": 108106, "epoch": 2573} {"train_loss": -6.395494642711821, "global_step": 108107, "epoch": 2573, "val_loss": 76266.171875} {"train_loss": -6.48563814163208, "global_step": 108108, "epoch": 2574} {"train_loss": -6.404330730438232, "global_step": 108109, "epoch": 2574} {"train_loss": -6.46224308013916, "global_step": 108110, "epoch": 2574} {"train_loss": -6.481661796569824, "global_step": 108111, "epoch": 2574} {"train_loss": -6.53478479385376, "global_step": 108112, "epoch": 2574} {"train_loss": -6.266009330749512, "global_step": 108113, "epoch": 2574} {"train_loss": -6.474971771240234, "global_step": 108114, "epoch": 2574} {"train_loss": -6.452672958374023, "global_step": 108115, "epoch": 2574} {"train_loss": -6.361837863922119, "global_step": 108116, "epoch": 2574} {"train_loss": -6.360448360443115, "global_step": 108117, "epoch": 2574} {"train_loss": -6.452875137329102, "global_step": 108118, "epoch": 2574} {"train_loss": -6.4503984451293945, "global_step": 108119, "epoch": 2574} {"train_loss": -6.504113674163818, "global_step": 108120, "epoch": 2574} {"train_loss": -6.361811637878418, "global_step": 108121, "epoch": 2574} {"train_loss": -6.465518951416016, "global_step": 108122, "epoch": 2574} {"train_loss": -6.513782501220703, "global_step": 108123, "epoch": 2574} {"train_loss": -6.41099739074707, "global_step": 108124, "epoch": 2574} {"train_loss": -6.5131402015686035, "global_step": 108125, "epoch": 2574} {"train_loss": -6.4060258865356445, "global_step": 108126, "epoch": 2574} {"train_loss": -6.327585220336914, "global_step": 108127, "epoch": 2574} {"train_loss": -6.510401725769043, "global_step": 108128, "epoch": 2574} {"train_loss": -6.4945502281188965, "global_step": 108129, "epoch": 2574} {"train_loss": -6.428833961486816, "global_step": 108130, "epoch": 2574} {"train_loss": -6.575192451477051, "global_step": 108131, "epoch": 2574} {"train_loss": -6.319466590881348, "global_step": 108132, "epoch": 2574} {"train_loss": -6.4076714515686035, "global_step": 108133, "epoch": 2574} {"train_loss": -6.379524230957031, "global_step": 108134, "epoch": 2574} {"train_loss": -6.543780326843262, "global_step": 108135, "epoch": 2574} {"train_loss": -6.495309829711914, "global_step": 108136, "epoch": 2574} {"train_loss": -6.482446670532227, "global_step": 108137, "epoch": 2574} {"train_loss": -6.51325798034668, "global_step": 108138, "epoch": 2574} {"train_loss": -6.406988143920898, "global_step": 108139, "epoch": 2574} {"train_loss": -6.559813976287842, "global_step": 108140, "epoch": 2574} {"train_loss": -6.458187103271484, "global_step": 108141, "epoch": 2574} {"train_loss": -6.489687442779541, "global_step": 108142, "epoch": 2574} {"train_loss": -6.567178249359131, "global_step": 108143, "epoch": 2574} {"train_loss": -6.358870506286621, "global_step": 108144, "epoch": 2574} {"train_loss": -6.61384391784668, "global_step": 108145, "epoch": 2574} {"train_loss": -6.44781494140625, "global_step": 108146, "epoch": 2574} {"train_loss": -6.500485420227051, "global_step": 108147, "epoch": 2574} {"train_loss": -6.537647247314453, "global_step": 108148, "epoch": 2574} {"train_loss": -6.458685954411824, "global_step": 108149, "epoch": 2574, "val_loss": 76168.96875} {"train_loss": -6.427960395812988, "global_step": 108150, "epoch": 2575} {"train_loss": -6.512820243835449, "global_step": 108151, "epoch": 2575} {"train_loss": -6.450944900512695, "global_step": 108152, "epoch": 2575} {"train_loss": -6.447187423706055, "global_step": 108153, "epoch": 2575} {"train_loss": -6.595623970031738, "global_step": 108154, "epoch": 2575} {"train_loss": -6.505557537078857, "global_step": 108155, "epoch": 2575} {"train_loss": -6.440845966339111, "global_step": 108156, "epoch": 2575} {"train_loss": -6.420978546142578, "global_step": 108157, "epoch": 2575} {"train_loss": -6.4416022300720215, "global_step": 108158, "epoch": 2575} {"train_loss": -6.494465351104736, "global_step": 108159, "epoch": 2575} {"train_loss": -6.357912540435791, "global_step": 108160, "epoch": 2575} {"train_loss": -6.458566665649414, "global_step": 108161, "epoch": 2575} {"train_loss": -6.428866386413574, "global_step": 108162, "epoch": 2575} {"train_loss": -6.540637969970703, "global_step": 108163, "epoch": 2575} {"train_loss": -6.521634578704834, "global_step": 108164, "epoch": 2575} {"train_loss": -6.359051704406738, "global_step": 108165, "epoch": 2575} {"train_loss": -6.485206604003906, "global_step": 108166, "epoch": 2575} {"train_loss": -6.520508766174316, "global_step": 108167, "epoch": 2575} {"train_loss": -6.419672966003418, "global_step": 108168, "epoch": 2575} {"train_loss": -6.518996715545654, "global_step": 108169, "epoch": 2575} {"train_loss": -6.479692459106445, "global_step": 108170, "epoch": 2575} {"train_loss": -6.400655269622803, "global_step": 108171, "epoch": 2575} {"train_loss": -6.513707160949707, "global_step": 108172, "epoch": 2575} {"train_loss": -6.606141090393066, "global_step": 108173, "epoch": 2575} {"train_loss": -6.409941673278809, "global_step": 108174, "epoch": 2575} {"train_loss": -6.489042282104492, "global_step": 108175, "epoch": 2575} {"train_loss": -6.326811790466309, "global_step": 108176, "epoch": 2575} {"train_loss": -6.550914287567139, "global_step": 108177, "epoch": 2575} {"train_loss": -6.473651885986328, "global_step": 108178, "epoch": 2575} {"train_loss": -6.394140720367432, "global_step": 108179, "epoch": 2575} {"train_loss": -6.467995643615723, "global_step": 108180, "epoch": 2575} {"train_loss": -6.437029838562012, "global_step": 108181, "epoch": 2575} {"train_loss": -6.332061767578125, "global_step": 108182, "epoch": 2575} {"train_loss": -6.46717643737793, "global_step": 108183, "epoch": 2575} {"train_loss": -6.428479194641113, "global_step": 108184, "epoch": 2575} {"train_loss": -6.419713973999023, "global_step": 108185, "epoch": 2575} {"train_loss": -6.528162956237793, "global_step": 108186, "epoch": 2575} {"train_loss": -6.393132209777832, "global_step": 108187, "epoch": 2575} {"train_loss": -6.471179008483887, "global_step": 108188, "epoch": 2575} {"train_loss": -6.3726630210876465, "global_step": 108189, "epoch": 2575} {"train_loss": -6.291116237640381, "global_step": 108190, "epoch": 2575} {"train_loss": -6.454325868969872, "global_step": 108191, "epoch": 2575, "val_loss": 76436.0546875} {"train_loss": -6.443399429321289, "global_step": 108192, "epoch": 2576} {"train_loss": -6.4657135009765625, "global_step": 108193, "epoch": 2576} {"train_loss": -6.431687355041504, "global_step": 108194, "epoch": 2576} {"train_loss": -6.507869720458984, "global_step": 108195, "epoch": 2576} {"train_loss": -6.538686752319336, "global_step": 108196, "epoch": 2576} {"train_loss": -6.381999969482422, "global_step": 108197, "epoch": 2576} {"train_loss": -6.458968639373779, "global_step": 108198, "epoch": 2576} {"train_loss": -6.388986110687256, "global_step": 108199, "epoch": 2576} {"train_loss": -6.513613700866699, "global_step": 108200, "epoch": 2576} {"train_loss": -6.496240615844727, "global_step": 108201, "epoch": 2576} {"train_loss": -6.529611587524414, "global_step": 108202, "epoch": 2576} {"train_loss": -6.315278053283691, "global_step": 108203, "epoch": 2576} {"train_loss": -6.469818115234375, "global_step": 108204, "epoch": 2576} {"train_loss": -6.396678447723389, "global_step": 108205, "epoch": 2576} {"train_loss": -6.441305637359619, "global_step": 108206, "epoch": 2576} {"train_loss": -6.442326545715332, "global_step": 108207, "epoch": 2576} {"train_loss": -6.3308892250061035, "global_step": 108208, "epoch": 2576} {"train_loss": -6.387163162231445, "global_step": 108209, "epoch": 2576} {"train_loss": -6.555044174194336, "global_step": 108210, "epoch": 2576} {"train_loss": -6.294051170349121, "global_step": 108211, "epoch": 2576} {"train_loss": -6.343454360961914, "global_step": 108212, "epoch": 2576} {"train_loss": -6.305697917938232, "global_step": 108213, "epoch": 2576} {"train_loss": -6.351831436157227, "global_step": 108214, "epoch": 2576} {"train_loss": -6.532520771026611, "global_step": 108215, "epoch": 2576} {"train_loss": -6.508308410644531, "global_step": 108216, "epoch": 2576} {"train_loss": -6.453303337097168, "global_step": 108217, "epoch": 2576} {"train_loss": -6.503913879394531, "global_step": 108218, "epoch": 2576} {"train_loss": -6.339972496032715, "global_step": 108219, "epoch": 2576} {"train_loss": -6.433725357055664, "global_step": 108220, "epoch": 2576} {"train_loss": -6.49680233001709, "global_step": 108221, "epoch": 2576} {"train_loss": -6.5026140213012695, "global_step": 108222, "epoch": 2576} {"train_loss": -6.296841621398926, "global_step": 108223, "epoch": 2576} {"train_loss": -6.364962100982666, "global_step": 108224, "epoch": 2576} {"train_loss": -6.3751935958862305, "global_step": 108225, "epoch": 2576} {"train_loss": -6.347014427185059, "global_step": 108226, "epoch": 2576} {"train_loss": -6.479963302612305, "global_step": 108227, "epoch": 2576} {"train_loss": -6.317160606384277, "global_step": 108228, "epoch": 2576} {"train_loss": -6.325626373291016, "global_step": 108229, "epoch": 2576} {"train_loss": -6.499660491943359, "global_step": 108230, "epoch": 2576} {"train_loss": -6.423976898193359, "global_step": 108231, "epoch": 2576} {"train_loss": -6.401821136474609, "global_step": 108232, "epoch": 2576} {"train_loss": -6.424756197702317, "global_step": 108233, "epoch": 2576, "val_loss": 76047.5546875} {"train_loss": -6.502618789672852, "global_step": 108234, "epoch": 2577} {"train_loss": -6.421196937561035, "global_step": 108235, "epoch": 2577} {"train_loss": -6.420527458190918, "global_step": 108236, "epoch": 2577} {"train_loss": -6.471186637878418, "global_step": 108237, "epoch": 2577} {"train_loss": -6.589088439941406, "global_step": 108238, "epoch": 2577} {"train_loss": -6.346120834350586, "global_step": 108239, "epoch": 2577} {"train_loss": -6.542023658752441, "global_step": 108240, "epoch": 2577} {"train_loss": -6.393307685852051, "global_step": 108241, "epoch": 2577} {"train_loss": -6.387430667877197, "global_step": 108242, "epoch": 2577} {"train_loss": -6.3970255851745605, "global_step": 108243, "epoch": 2577} {"train_loss": -6.484983444213867, "global_step": 108244, "epoch": 2577} {"train_loss": -6.517997741699219, "global_step": 108245, "epoch": 2577} {"train_loss": -6.498151779174805, "global_step": 108246, "epoch": 2577} {"train_loss": -6.388675689697266, "global_step": 108247, "epoch": 2577} {"train_loss": -6.451421737670898, "global_step": 108248, "epoch": 2577} {"train_loss": -6.546541690826416, "global_step": 108249, "epoch": 2577} {"train_loss": -6.3474931716918945, "global_step": 108250, "epoch": 2577} {"train_loss": -6.422863006591797, "global_step": 108251, "epoch": 2577} {"train_loss": -6.467068672180176, "global_step": 108252, "epoch": 2577} {"train_loss": -6.517763614654541, "global_step": 108253, "epoch": 2577} {"train_loss": -6.498387336730957, "global_step": 108254, "epoch": 2577} {"train_loss": -6.269893646240234, "global_step": 108255, "epoch": 2577} {"train_loss": -6.489137649536133, "global_step": 108256, "epoch": 2577} {"train_loss": -6.449746131896973, "global_step": 108257, "epoch": 2577} {"train_loss": -6.3971266746521, "global_step": 108258, "epoch": 2577} {"train_loss": -6.512440204620361, "global_step": 108259, "epoch": 2577} {"train_loss": -6.489058494567871, "global_step": 108260, "epoch": 2577} {"train_loss": -6.430379867553711, "global_step": 108261, "epoch": 2577} {"train_loss": -6.322277069091797, "global_step": 108262, "epoch": 2577} {"train_loss": -6.435678482055664, "global_step": 108263, "epoch": 2577} {"train_loss": -6.454958438873291, "global_step": 108264, "epoch": 2577} {"train_loss": -6.591153144836426, "global_step": 108265, "epoch": 2577} {"train_loss": -6.583073616027832, "global_step": 108266, "epoch": 2577} {"train_loss": -6.480000972747803, "global_step": 108267, "epoch": 2577} {"train_loss": -6.395986557006836, "global_step": 108268, "epoch": 2577} {"train_loss": -6.5094709396362305, "global_step": 108269, "epoch": 2577} {"train_loss": -6.373692989349365, "global_step": 108270, "epoch": 2577} {"train_loss": -6.469259262084961, "global_step": 108271, "epoch": 2577} {"train_loss": -6.499015808105469, "global_step": 108272, "epoch": 2577} {"train_loss": -6.342016220092773, "global_step": 108273, "epoch": 2577} {"train_loss": -6.406464576721191, "global_step": 108274, "epoch": 2577} {"train_loss": -6.453412589572725, "global_step": 108275, "epoch": 2577, "val_loss": 76187.203125} {"train_loss": -6.522479057312012, "global_step": 108276, "epoch": 2578} {"train_loss": -6.514960289001465, "global_step": 108277, "epoch": 2578} {"train_loss": -6.467217445373535, "global_step": 108278, "epoch": 2578} {"train_loss": -6.355576515197754, "global_step": 108279, "epoch": 2578} {"train_loss": -6.479208946228027, "global_step": 108280, "epoch": 2578} {"train_loss": -6.430859565734863, "global_step": 108281, "epoch": 2578} {"train_loss": -6.3989973068237305, "global_step": 108282, "epoch": 2578} {"train_loss": -6.359460830688477, "global_step": 108283, "epoch": 2578} {"train_loss": -6.3584184646606445, "global_step": 108284, "epoch": 2578} {"train_loss": -6.447582244873047, "global_step": 108285, "epoch": 2578} {"train_loss": -6.2994160652160645, "global_step": 108286, "epoch": 2578} {"train_loss": -6.410433769226074, "global_step": 108287, "epoch": 2578} {"train_loss": -6.387577056884766, "global_step": 108288, "epoch": 2578} {"train_loss": -6.366865158081055, "global_step": 108289, "epoch": 2578} {"train_loss": -6.364980697631836, "global_step": 108290, "epoch": 2578} {"train_loss": -6.557236671447754, "global_step": 108291, "epoch": 2578} {"train_loss": -6.279833793640137, "global_step": 108292, "epoch": 2578} {"train_loss": -6.306057453155518, "global_step": 108293, "epoch": 2578} {"train_loss": -6.486403465270996, "global_step": 108294, "epoch": 2578} {"train_loss": -6.357587814331055, "global_step": 108295, "epoch": 2578} {"train_loss": -6.472442150115967, "global_step": 108296, "epoch": 2578} {"train_loss": -6.472644805908203, "global_step": 108297, "epoch": 2578} {"train_loss": -6.573400974273682, "global_step": 108298, "epoch": 2578} {"train_loss": -6.567499160766602, "global_step": 108299, "epoch": 2578} {"train_loss": -6.508748531341553, "global_step": 108300, "epoch": 2578} {"train_loss": -6.520301342010498, "global_step": 108301, "epoch": 2578} {"train_loss": -6.4965434074401855, "global_step": 108302, "epoch": 2578} {"train_loss": -6.388636589050293, "global_step": 108303, "epoch": 2578} {"train_loss": -6.382467269897461, "global_step": 108304, "epoch": 2578} {"train_loss": -6.506046295166016, "global_step": 108305, "epoch": 2578} {"train_loss": -6.46861457824707, "global_step": 108306, "epoch": 2578} {"train_loss": -6.483081340789795, "global_step": 108307, "epoch": 2578} {"train_loss": -6.486984729766846, "global_step": 108308, "epoch": 2578} {"train_loss": -6.5841498374938965, "global_step": 108309, "epoch": 2578} {"train_loss": -6.603825092315674, "global_step": 108310, "epoch": 2578} {"train_loss": -6.459313869476318, "global_step": 108311, "epoch": 2578} {"train_loss": -6.595107078552246, "global_step": 108312, "epoch": 2578} {"train_loss": -6.460195064544678, "global_step": 108313, "epoch": 2578} {"train_loss": -6.40960693359375, "global_step": 108314, "epoch": 2578} {"train_loss": -6.429422378540039, "global_step": 108315, "epoch": 2578} {"train_loss": -6.472620964050293, "global_step": 108316, "epoch": 2578} {"train_loss": -6.451803059805007, "global_step": 108317, "epoch": 2578, "val_loss": 76008.96875} {"train_loss": -6.521661281585693, "global_step": 108318, "epoch": 2579} {"train_loss": -6.427628040313721, "global_step": 108319, "epoch": 2579} {"train_loss": -6.386935234069824, "global_step": 108320, "epoch": 2579} {"train_loss": -6.483185291290283, "global_step": 108321, "epoch": 2579} {"train_loss": -6.465928077697754, "global_step": 108322, "epoch": 2579} {"train_loss": -6.509283065795898, "global_step": 108323, "epoch": 2579} {"train_loss": -6.512578010559082, "global_step": 108324, "epoch": 2579} {"train_loss": -6.400607109069824, "global_step": 108325, "epoch": 2579} {"train_loss": -6.422170639038086, "global_step": 108326, "epoch": 2579} {"train_loss": -6.3695478439331055, "global_step": 108327, "epoch": 2579} {"train_loss": -6.407540321350098, "global_step": 108328, "epoch": 2579} {"train_loss": -6.408063888549805, "global_step": 108329, "epoch": 2579} {"train_loss": -6.293079376220703, "global_step": 108330, "epoch": 2579} {"train_loss": -6.39874267578125, "global_step": 108331, "epoch": 2579} {"train_loss": -6.3824462890625, "global_step": 108332, "epoch": 2579} {"train_loss": -6.337359428405762, "global_step": 108333, "epoch": 2579} {"train_loss": -6.327744483947754, "global_step": 108334, "epoch": 2579} {"train_loss": -6.443367958068848, "global_step": 108335, "epoch": 2579} {"train_loss": -6.521435737609863, "global_step": 108336, "epoch": 2579} {"train_loss": -6.365816593170166, "global_step": 108337, "epoch": 2579} {"train_loss": -6.459158897399902, "global_step": 108338, "epoch": 2579} {"train_loss": -6.288055419921875, "global_step": 108339, "epoch": 2579} {"train_loss": -6.488357067108154, "global_step": 108340, "epoch": 2579} {"train_loss": -6.373445987701416, "global_step": 108341, "epoch": 2579} {"train_loss": -6.388406276702881, "global_step": 108342, "epoch": 2579} {"train_loss": -6.343385219573975, "global_step": 108343, "epoch": 2579} {"train_loss": -6.4826765060424805, "global_step": 108344, "epoch": 2579} {"train_loss": -6.368062973022461, "global_step": 108345, "epoch": 2579} {"train_loss": -6.421898365020752, "global_step": 108346, "epoch": 2579} {"train_loss": -6.41316032409668, "global_step": 108347, "epoch": 2579} {"train_loss": -6.467897891998291, "global_step": 108348, "epoch": 2579} {"train_loss": -6.361988067626953, "global_step": 108349, "epoch": 2579} {"train_loss": -6.345734119415283, "global_step": 108350, "epoch": 2579} {"train_loss": -6.375210762023926, "global_step": 108351, "epoch": 2579} {"train_loss": -6.459017753601074, "global_step": 108352, "epoch": 2579} {"train_loss": -6.386722087860107, "global_step": 108353, "epoch": 2579} {"train_loss": -6.428969860076904, "global_step": 108354, "epoch": 2579} {"train_loss": -6.518828392028809, "global_step": 108355, "epoch": 2579} {"train_loss": -6.40781831741333, "global_step": 108356, "epoch": 2579} {"train_loss": -6.320310592651367, "global_step": 108357, "epoch": 2579} {"train_loss": -6.376119613647461, "global_step": 108358, "epoch": 2579} {"train_loss": -6.410835118520827, "global_step": 108359, "epoch": 2579, "val_loss": 76306.4375} {"train_loss": -6.369556427001953, "global_step": 108360, "epoch": 2580} {"train_loss": -6.540420055389404, "global_step": 108361, "epoch": 2580} {"train_loss": -6.427525520324707, "global_step": 108362, "epoch": 2580} {"train_loss": -6.438120365142822, "global_step": 108363, "epoch": 2580} {"train_loss": -6.397594451904297, "global_step": 108364, "epoch": 2580} {"train_loss": -6.508947372436523, "global_step": 108365, "epoch": 2580} {"train_loss": -6.3834123611450195, "global_step": 108366, "epoch": 2580} {"train_loss": -6.415608882904053, "global_step": 108367, "epoch": 2580} {"train_loss": -6.43433141708374, "global_step": 108368, "epoch": 2580} {"train_loss": -6.461550712585449, "global_step": 108369, "epoch": 2580} {"train_loss": -6.517780303955078, "global_step": 108370, "epoch": 2580} {"train_loss": -6.4445037841796875, "global_step": 108371, "epoch": 2580} {"train_loss": -6.413737773895264, "global_step": 108372, "epoch": 2580} {"train_loss": -6.481602668762207, "global_step": 108373, "epoch": 2580} {"train_loss": -6.489693641662598, "global_step": 108374, "epoch": 2580} {"train_loss": -6.43076229095459, "global_step": 108375, "epoch": 2580} {"train_loss": -6.392472267150879, "global_step": 108376, "epoch": 2580} {"train_loss": -6.420191764831543, "global_step": 108377, "epoch": 2580} {"train_loss": -6.436602592468262, "global_step": 108378, "epoch": 2580} {"train_loss": -6.5260467529296875, "global_step": 108379, "epoch": 2580} {"train_loss": -6.408712863922119, "global_step": 108380, "epoch": 2580} {"train_loss": -6.517459869384766, "global_step": 108381, "epoch": 2580} {"train_loss": -6.359960079193115, "global_step": 108382, "epoch": 2580} {"train_loss": -6.5086774826049805, "global_step": 108383, "epoch": 2580} {"train_loss": -6.456976890563965, "global_step": 108384, "epoch": 2580} {"train_loss": -6.471936225891113, "global_step": 108385, "epoch": 2580} {"train_loss": -6.507633209228516, "global_step": 108386, "epoch": 2580} {"train_loss": -6.4918293952941895, "global_step": 108387, "epoch": 2580} {"train_loss": -6.454380035400391, "global_step": 108388, "epoch": 2580} {"train_loss": -6.40725040435791, "global_step": 108389, "epoch": 2580} {"train_loss": -6.471687316894531, "global_step": 108390, "epoch": 2580} {"train_loss": -6.490854263305664, "global_step": 108391, "epoch": 2580} {"train_loss": -6.332699775695801, "global_step": 108392, "epoch": 2580} {"train_loss": -6.270415306091309, "global_step": 108393, "epoch": 2580} {"train_loss": -6.420906066894531, "global_step": 108394, "epoch": 2580} {"train_loss": -6.298969268798828, "global_step": 108395, "epoch": 2580} {"train_loss": -6.338850975036621, "global_step": 108396, "epoch": 2580} {"train_loss": -6.326421737670898, "global_step": 108397, "epoch": 2580} {"train_loss": -6.358708381652832, "global_step": 108398, "epoch": 2580} {"train_loss": -6.417987823486328, "global_step": 108399, "epoch": 2580} {"train_loss": -6.261210918426514, "global_step": 108400, "epoch": 2580} {"train_loss": -6.424562715348744, "global_step": 108401, "epoch": 2580, "val_loss": 76902.5} {"train_loss": -6.280577659606934, "global_step": 108402, "epoch": 2581} {"train_loss": -6.3382415771484375, "global_step": 108403, "epoch": 2581} {"train_loss": -6.352579593658447, "global_step": 108404, "epoch": 2581} {"train_loss": -6.321221828460693, "global_step": 108405, "epoch": 2581} {"train_loss": -6.413583278656006, "global_step": 108406, "epoch": 2581} {"train_loss": -6.395468711853027, "global_step": 108407, "epoch": 2581} {"train_loss": -6.461940765380859, "global_step": 108408, "epoch": 2581} {"train_loss": -6.366903305053711, "global_step": 108409, "epoch": 2581} {"train_loss": -6.400551795959473, "global_step": 108410, "epoch": 2581} {"train_loss": -6.349006175994873, "global_step": 108411, "epoch": 2581} {"train_loss": -6.381831169128418, "global_step": 108412, "epoch": 2581} {"train_loss": -6.440915107727051, "global_step": 108413, "epoch": 2581} {"train_loss": -6.387345314025879, "global_step": 108414, "epoch": 2581} {"train_loss": -6.462224960327148, "global_step": 108415, "epoch": 2581} {"train_loss": -6.283293724060059, "global_step": 108416, "epoch": 2581} {"train_loss": -6.329857349395752, "global_step": 108417, "epoch": 2581} {"train_loss": -6.432279586791992, "global_step": 108418, "epoch": 2581} {"train_loss": -6.404018402099609, "global_step": 108419, "epoch": 2581} {"train_loss": -6.44489049911499, "global_step": 108420, "epoch": 2581} {"train_loss": -6.414441108703613, "global_step": 108421, "epoch": 2581} {"train_loss": -6.410518169403076, "global_step": 108422, "epoch": 2581} {"train_loss": -6.420806407928467, "global_step": 108423, "epoch": 2581} {"train_loss": -6.309172630310059, "global_step": 108424, "epoch": 2581} {"train_loss": -6.312772750854492, "global_step": 108425, "epoch": 2581} {"train_loss": -6.35248327255249, "global_step": 108426, "epoch": 2581} {"train_loss": -6.238038063049316, "global_step": 108427, "epoch": 2581} {"train_loss": -6.3767547607421875, "global_step": 108428, "epoch": 2581} {"train_loss": -6.468153953552246, "global_step": 108429, "epoch": 2581} {"train_loss": -6.380386829376221, "global_step": 108430, "epoch": 2581} {"train_loss": -6.43521785736084, "global_step": 108431, "epoch": 2581} {"train_loss": -6.506792068481445, "global_step": 108432, "epoch": 2581} {"train_loss": -6.433357238769531, "global_step": 108433, "epoch": 2581} {"train_loss": -6.444650650024414, "global_step": 108434, "epoch": 2581} {"train_loss": -6.386340618133545, "global_step": 108435, "epoch": 2581} {"train_loss": -6.5088887214660645, "global_step": 108436, "epoch": 2581} {"train_loss": -6.4964823722839355, "global_step": 108437, "epoch": 2581} {"train_loss": -6.367683410644531, "global_step": 108438, "epoch": 2581} {"train_loss": -6.445381164550781, "global_step": 108439, "epoch": 2581} {"train_loss": -6.532658100128174, "global_step": 108440, "epoch": 2581} {"train_loss": -6.415395736694336, "global_step": 108441, "epoch": 2581} {"train_loss": -6.433107376098633, "global_step": 108442, "epoch": 2581} {"train_loss": -6.402506033579509, "global_step": 108443, "epoch": 2581, "val_loss": 76332.9765625} {"train_loss": -6.5641326904296875, "global_step": 108444, "epoch": 2582} {"train_loss": -6.503166198730469, "global_step": 108445, "epoch": 2582} {"train_loss": -6.407541275024414, "global_step": 108446, "epoch": 2582} {"train_loss": -6.4557905197143555, "global_step": 108447, "epoch": 2582} {"train_loss": -6.625545501708984, "global_step": 108448, "epoch": 2582} {"train_loss": -6.399959564208984, "global_step": 108449, "epoch": 2582} {"train_loss": -6.543194770812988, "global_step": 108450, "epoch": 2582} {"train_loss": -6.354687690734863, "global_step": 108451, "epoch": 2582} {"train_loss": -6.499426364898682, "global_step": 108452, "epoch": 2582} {"train_loss": -6.351616382598877, "global_step": 108453, "epoch": 2582} {"train_loss": -6.5161237716674805, "global_step": 108454, "epoch": 2582} {"train_loss": -6.5485687255859375, "global_step": 108455, "epoch": 2582} {"train_loss": -6.415800094604492, "global_step": 108456, "epoch": 2582} {"train_loss": -6.543793678283691, "global_step": 108457, "epoch": 2582} {"train_loss": -6.5381269454956055, "global_step": 108458, "epoch": 2582} {"train_loss": -6.511495590209961, "global_step": 108459, "epoch": 2582} {"train_loss": -6.465004920959473, "global_step": 108460, "epoch": 2582} {"train_loss": -6.4488325119018555, "global_step": 108461, "epoch": 2582} {"train_loss": -6.388561248779297, "global_step": 108462, "epoch": 2582} {"train_loss": -6.451302528381348, "global_step": 108463, "epoch": 2582} {"train_loss": -6.484257698059082, "global_step": 108464, "epoch": 2582} {"train_loss": -6.489528656005859, "global_step": 108465, "epoch": 2582} {"train_loss": -6.459299087524414, "global_step": 108466, "epoch": 2582} {"train_loss": -6.477497100830078, "global_step": 108467, "epoch": 2582} {"train_loss": -6.469553470611572, "global_step": 108468, "epoch": 2582} {"train_loss": -6.406269073486328, "global_step": 108469, "epoch": 2582} {"train_loss": -6.550643444061279, "global_step": 108470, "epoch": 2582} {"train_loss": -6.482105731964111, "global_step": 108471, "epoch": 2582} {"train_loss": -6.378646373748779, "global_step": 108472, "epoch": 2582} {"train_loss": -6.439017295837402, "global_step": 108473, "epoch": 2582} {"train_loss": -6.527731895446777, "global_step": 108474, "epoch": 2582} {"train_loss": -6.4793620109558105, "global_step": 108475, "epoch": 2582} {"train_loss": -6.371450424194336, "global_step": 108476, "epoch": 2582} {"train_loss": -6.448783874511719, "global_step": 108477, "epoch": 2582} {"train_loss": -6.429666519165039, "global_step": 108478, "epoch": 2582} {"train_loss": -6.482999324798584, "global_step": 108479, "epoch": 2582} {"train_loss": -6.412474155426025, "global_step": 108480, "epoch": 2582} {"train_loss": -6.400540351867676, "global_step": 108481, "epoch": 2582} {"train_loss": -6.488378524780273, "global_step": 108482, "epoch": 2582} {"train_loss": -6.412463188171387, "global_step": 108483, "epoch": 2582} {"train_loss": -6.4039387702941895, "global_step": 108484, "epoch": 2582} {"train_loss": -6.463565440404983, "global_step": 108485, "epoch": 2582, "val_loss": 76063.5546875} {"train_loss": -6.528191566467285, "global_step": 108486, "epoch": 2583} {"train_loss": -6.398993492126465, "global_step": 108487, "epoch": 2583} {"train_loss": -6.330554008483887, "global_step": 108488, "epoch": 2583} {"train_loss": -6.48330020904541, "global_step": 108489, "epoch": 2583} {"train_loss": -6.36361837387085, "global_step": 108490, "epoch": 2583} {"train_loss": -6.390805244445801, "global_step": 108491, "epoch": 2583} {"train_loss": -6.449985504150391, "global_step": 108492, "epoch": 2583} {"train_loss": -6.450830459594727, "global_step": 108493, "epoch": 2583} {"train_loss": -6.445359230041504, "global_step": 108494, "epoch": 2583} {"train_loss": -6.404705047607422, "global_step": 108495, "epoch": 2583} {"train_loss": -6.400669097900391, "global_step": 108496, "epoch": 2583} {"train_loss": -6.351210117340088, "global_step": 108497, "epoch": 2583} {"train_loss": -6.373661994934082, "global_step": 108498, "epoch": 2583} {"train_loss": -6.5092010498046875, "global_step": 108499, "epoch": 2583} {"train_loss": -6.477191925048828, "global_step": 108500, "epoch": 2583} {"train_loss": -6.547822952270508, "global_step": 108501, "epoch": 2583} {"train_loss": -6.432583808898926, "global_step": 108502, "epoch": 2583} {"train_loss": -6.397067546844482, "global_step": 108503, "epoch": 2583} {"train_loss": -6.538334846496582, "global_step": 108504, "epoch": 2583} {"train_loss": -6.412321090698242, "global_step": 108505, "epoch": 2583} {"train_loss": -6.411815643310547, "global_step": 108506, "epoch": 2583} {"train_loss": -6.533385276794434, "global_step": 108507, "epoch": 2583} {"train_loss": -6.465989112854004, "global_step": 108508, "epoch": 2583} {"train_loss": -6.4876627922058105, "global_step": 108509, "epoch": 2583} {"train_loss": -6.32701301574707, "global_step": 108510, "epoch": 2583} {"train_loss": -6.462533950805664, "global_step": 108511, "epoch": 2583} {"train_loss": -6.484894275665283, "global_step": 108512, "epoch": 2583} {"train_loss": -6.483098983764648, "global_step": 108513, "epoch": 2583} {"train_loss": -6.581188201904297, "global_step": 108514, "epoch": 2583} {"train_loss": -6.430356979370117, "global_step": 108515, "epoch": 2583} {"train_loss": -6.458679676055908, "global_step": 108516, "epoch": 2583} {"train_loss": -6.518248558044434, "global_step": 108517, "epoch": 2583} {"train_loss": -6.480645179748535, "global_step": 108518, "epoch": 2583} {"train_loss": -6.433137893676758, "global_step": 108519, "epoch": 2583} {"train_loss": -6.570003509521484, "global_step": 108520, "epoch": 2583} {"train_loss": -6.524320125579834, "global_step": 108521, "epoch": 2583} {"train_loss": -6.471980094909668, "global_step": 108522, "epoch": 2583} {"train_loss": -6.413398265838623, "global_step": 108523, "epoch": 2583} {"train_loss": -6.364840507507324, "global_step": 108524, "epoch": 2583} {"train_loss": -6.416928291320801, "global_step": 108525, "epoch": 2583} {"train_loss": -6.583102226257324, "global_step": 108526, "epoch": 2583} {"train_loss": -6.453662384124029, "global_step": 108527, "epoch": 2583, "val_loss": 76051.7421875} {"train_loss": -6.460879325866699, "global_step": 108528, "epoch": 2584} {"train_loss": -6.5859479904174805, "global_step": 108529, "epoch": 2584} {"train_loss": -6.53309440612793, "global_step": 108530, "epoch": 2584} {"train_loss": -6.558376312255859, "global_step": 108531, "epoch": 2584} {"train_loss": -6.354561805725098, "global_step": 108532, "epoch": 2584} {"train_loss": -6.590113639831543, "global_step": 108533, "epoch": 2584} {"train_loss": -6.460943222045898, "global_step": 108534, "epoch": 2584} {"train_loss": -6.453108787536621, "global_step": 108535, "epoch": 2584} {"train_loss": -6.4679856300354, "global_step": 108536, "epoch": 2584} {"train_loss": -6.4854326248168945, "global_step": 108537, "epoch": 2584} {"train_loss": -6.396742820739746, "global_step": 108538, "epoch": 2584} {"train_loss": -6.4330267906188965, "global_step": 108539, "epoch": 2584} {"train_loss": -6.3750786781311035, "global_step": 108540, "epoch": 2584} {"train_loss": -6.410959243774414, "global_step": 108541, "epoch": 2584} {"train_loss": -6.411536693572998, "global_step": 108542, "epoch": 2584} {"train_loss": -6.447978973388672, "global_step": 108543, "epoch": 2584} {"train_loss": -6.4687819480896, "global_step": 108544, "epoch": 2584} {"train_loss": -6.4243364334106445, "global_step": 108545, "epoch": 2584} {"train_loss": -6.482638359069824, "global_step": 108546, "epoch": 2584} {"train_loss": -6.541112899780273, "global_step": 108547, "epoch": 2584} {"train_loss": -6.4830169677734375, "global_step": 108548, "epoch": 2584} {"train_loss": -6.3718581199646, "global_step": 108549, "epoch": 2584} {"train_loss": -6.51555061340332, "global_step": 108550, "epoch": 2584} {"train_loss": -6.49635124206543, "global_step": 108551, "epoch": 2584} {"train_loss": -6.430350303649902, "global_step": 108552, "epoch": 2584} {"train_loss": -6.568414211273193, "global_step": 108553, "epoch": 2584} {"train_loss": -6.491269111633301, "global_step": 108554, "epoch": 2584} {"train_loss": -6.403276443481445, "global_step": 108555, "epoch": 2584} {"train_loss": -6.563751220703125, "global_step": 108556, "epoch": 2584} {"train_loss": -6.389761447906494, "global_step": 108557, "epoch": 2584} {"train_loss": -6.544678688049316, "global_step": 108558, "epoch": 2584} {"train_loss": -6.503169059753418, "global_step": 108559, "epoch": 2584} {"train_loss": -6.359675407409668, "global_step": 108560, "epoch": 2584} {"train_loss": -6.444860458374023, "global_step": 108561, "epoch": 2584} {"train_loss": -6.349472999572754, "global_step": 108562, "epoch": 2584} {"train_loss": -6.476961135864258, "global_step": 108563, "epoch": 2584} {"train_loss": -6.589455604553223, "global_step": 108564, "epoch": 2584} {"train_loss": -6.409104347229004, "global_step": 108565, "epoch": 2584} {"train_loss": -6.458491325378418, "global_step": 108566, "epoch": 2584} {"train_loss": -6.503713607788086, "global_step": 108567, "epoch": 2584} {"train_loss": -6.462713241577148, "global_step": 108568, "epoch": 2584} {"train_loss": -6.466181698299589, "global_step": 108569, "epoch": 2584, "val_loss": 76145.3984375} {"train_loss": -6.398933410644531, "global_step": 108570, "epoch": 2585} {"train_loss": -6.335272789001465, "global_step": 108571, "epoch": 2585} {"train_loss": -6.460299491882324, "global_step": 108572, "epoch": 2585} {"train_loss": -6.485352039337158, "global_step": 108573, "epoch": 2585} {"train_loss": -6.418063163757324, "global_step": 108574, "epoch": 2585} {"train_loss": -6.464776992797852, "global_step": 108575, "epoch": 2585} {"train_loss": -6.461175918579102, "global_step": 108576, "epoch": 2585} {"train_loss": -6.320050239562988, "global_step": 108577, "epoch": 2585} {"train_loss": -6.411949157714844, "global_step": 108578, "epoch": 2585} {"train_loss": -6.325031280517578, "global_step": 108579, "epoch": 2585} {"train_loss": -6.409909248352051, "global_step": 108580, "epoch": 2585} {"train_loss": -6.540956974029541, "global_step": 108581, "epoch": 2585} {"train_loss": -6.442813396453857, "global_step": 108582, "epoch": 2585} {"train_loss": -6.31406307220459, "global_step": 108583, "epoch": 2585} {"train_loss": -6.354569435119629, "global_step": 108584, "epoch": 2585} {"train_loss": -6.397182941436768, "global_step": 108585, "epoch": 2585} {"train_loss": -6.319394588470459, "global_step": 108586, "epoch": 2585} {"train_loss": -6.358877182006836, "global_step": 108587, "epoch": 2585} {"train_loss": -6.471248626708984, "global_step": 108588, "epoch": 2585} {"train_loss": -6.314363479614258, "global_step": 108589, "epoch": 2585} {"train_loss": -6.399378776550293, "global_step": 108590, "epoch": 2585} {"train_loss": -6.313438892364502, "global_step": 108591, "epoch": 2585} {"train_loss": -6.459897041320801, "global_step": 108592, "epoch": 2585} {"train_loss": -6.3497538566589355, "global_step": 108593, "epoch": 2585} {"train_loss": -6.329085350036621, "global_step": 108594, "epoch": 2585} {"train_loss": -6.440303802490234, "global_step": 108595, "epoch": 2585} {"train_loss": -6.235802173614502, "global_step": 108596, "epoch": 2585} {"train_loss": -6.407981872558594, "global_step": 108597, "epoch": 2585} {"train_loss": -6.406244277954102, "global_step": 108598, "epoch": 2585} {"train_loss": -6.327815532684326, "global_step": 108599, "epoch": 2585} {"train_loss": -6.537960529327393, "global_step": 108600, "epoch": 2585} {"train_loss": -6.478041648864746, "global_step": 108601, "epoch": 2585} {"train_loss": -6.541563034057617, "global_step": 108602, "epoch": 2585} {"train_loss": -6.4328227043151855, "global_step": 108603, "epoch": 2585} {"train_loss": -6.462470531463623, "global_step": 108604, "epoch": 2585} {"train_loss": -6.436160087585449, "global_step": 108605, "epoch": 2585} {"train_loss": -6.391537189483643, "global_step": 108606, "epoch": 2585} {"train_loss": -6.534858703613281, "global_step": 108607, "epoch": 2585} {"train_loss": -6.361924171447754, "global_step": 108608, "epoch": 2585} {"train_loss": -6.428489685058594, "global_step": 108609, "epoch": 2585} {"train_loss": -6.52771520614624, "global_step": 108610, "epoch": 2585} {"train_loss": -6.412081071308681, "global_step": 108611, "epoch": 2585, "val_loss": 76286.609375} {"train_loss": -6.505138397216797, "global_step": 108612, "epoch": 2586} {"train_loss": -6.439493656158447, "global_step": 108613, "epoch": 2586} {"train_loss": -6.497810363769531, "global_step": 108614, "epoch": 2586} {"train_loss": -6.549443244934082, "global_step": 108615, "epoch": 2586} {"train_loss": -6.449402809143066, "global_step": 108616, "epoch": 2586} {"train_loss": -6.480988502502441, "global_step": 108617, "epoch": 2586} {"train_loss": -6.497460842132568, "global_step": 108618, "epoch": 2586} {"train_loss": -6.515749931335449, "global_step": 108619, "epoch": 2586} {"train_loss": -6.461392879486084, "global_step": 108620, "epoch": 2586} {"train_loss": -6.447498798370361, "global_step": 108621, "epoch": 2586} {"train_loss": -6.572076797485352, "global_step": 108622, "epoch": 2586} {"train_loss": -6.458320617675781, "global_step": 108623, "epoch": 2586} {"train_loss": -6.460028648376465, "global_step": 108624, "epoch": 2586} {"train_loss": -6.444069862365723, "global_step": 108625, "epoch": 2586} {"train_loss": -6.521201133728027, "global_step": 108626, "epoch": 2586} {"train_loss": -6.586844444274902, "global_step": 108627, "epoch": 2586} {"train_loss": -6.343530178070068, "global_step": 108628, "epoch": 2586} {"train_loss": -6.4973859786987305, "global_step": 108629, "epoch": 2586} {"train_loss": -6.592041969299316, "global_step": 108630, "epoch": 2586} {"train_loss": -6.419299125671387, "global_step": 108631, "epoch": 2586} {"train_loss": -6.526877403259277, "global_step": 108632, "epoch": 2586} {"train_loss": -6.4268975257873535, "global_step": 108633, "epoch": 2586} {"train_loss": -6.474486351013184, "global_step": 108634, "epoch": 2586} {"train_loss": -6.5237908363342285, "global_step": 108635, "epoch": 2586} {"train_loss": -6.408441543579102, "global_step": 108636, "epoch": 2586} {"train_loss": -6.498345375061035, "global_step": 108637, "epoch": 2586} {"train_loss": -6.468942642211914, "global_step": 108638, "epoch": 2586} {"train_loss": -6.512726783752441, "global_step": 108639, "epoch": 2586} {"train_loss": -6.541706085205078, "global_step": 108640, "epoch": 2586} {"train_loss": -6.507080078125, "global_step": 108641, "epoch": 2586} {"train_loss": -6.5051164627075195, "global_step": 108642, "epoch": 2586} {"train_loss": -6.4726738929748535, "global_step": 108643, "epoch": 2586} {"train_loss": -6.495882511138916, "global_step": 108644, "epoch": 2586} {"train_loss": -6.415356636047363, "global_step": 108645, "epoch": 2586} {"train_loss": -6.426812171936035, "global_step": 108646, "epoch": 2586} {"train_loss": -6.409518241882324, "global_step": 108647, "epoch": 2586} {"train_loss": -6.563266754150391, "global_step": 108648, "epoch": 2586} {"train_loss": -6.441901206970215, "global_step": 108649, "epoch": 2586} {"train_loss": -6.462686061859131, "global_step": 108650, "epoch": 2586} {"train_loss": -6.540578842163086, "global_step": 108651, "epoch": 2586} {"train_loss": -6.456700325012207, "global_step": 108652, "epoch": 2586} {"train_loss": -6.484000103814261, "global_step": 108653, "epoch": 2586, "val_loss": 76073.5} {"train_loss": -6.586009502410889, "global_step": 108654, "epoch": 2587} {"train_loss": -6.423699378967285, "global_step": 108655, "epoch": 2587} {"train_loss": -6.567773342132568, "global_step": 108656, "epoch": 2587} {"train_loss": -6.442310333251953, "global_step": 108657, "epoch": 2587} {"train_loss": -6.430864334106445, "global_step": 108658, "epoch": 2587} {"train_loss": -6.478420257568359, "global_step": 108659, "epoch": 2587} {"train_loss": -6.453794956207275, "global_step": 108660, "epoch": 2587} {"train_loss": -6.424408912658691, "global_step": 108661, "epoch": 2587} {"train_loss": -6.5374250411987305, "global_step": 108662, "epoch": 2587} {"train_loss": -6.411513805389404, "global_step": 108663, "epoch": 2587} {"train_loss": -6.43717098236084, "global_step": 108664, "epoch": 2587} {"train_loss": -6.383298397064209, "global_step": 108665, "epoch": 2587} {"train_loss": -6.479530334472656, "global_step": 108666, "epoch": 2587} {"train_loss": -6.502229690551758, "global_step": 108667, "epoch": 2587} {"train_loss": -6.421985626220703, "global_step": 108668, "epoch": 2587} {"train_loss": -6.505137920379639, "global_step": 108669, "epoch": 2587} {"train_loss": -6.522948741912842, "global_step": 108670, "epoch": 2587} {"train_loss": -6.362135887145996, "global_step": 108671, "epoch": 2587} {"train_loss": -6.455278396606445, "global_step": 108672, "epoch": 2587} {"train_loss": -6.510578155517578, "global_step": 108673, "epoch": 2587} {"train_loss": -6.365367889404297, "global_step": 108674, "epoch": 2587} {"train_loss": -6.392260551452637, "global_step": 108675, "epoch": 2587} {"train_loss": -6.538908958435059, "global_step": 108676, "epoch": 2587} {"train_loss": -6.394505500793457, "global_step": 108677, "epoch": 2587} {"train_loss": -6.477802276611328, "global_step": 108678, "epoch": 2587} {"train_loss": -6.511575698852539, "global_step": 108679, "epoch": 2587} {"train_loss": -6.540471076965332, "global_step": 108680, "epoch": 2587} {"train_loss": -6.4523539543151855, "global_step": 108681, "epoch": 2587} {"train_loss": -6.366513729095459, "global_step": 108682, "epoch": 2587} {"train_loss": -6.479798316955566, "global_step": 108683, "epoch": 2587} {"train_loss": -6.466045379638672, "global_step": 108684, "epoch": 2587} {"train_loss": -6.4482645988464355, "global_step": 108685, "epoch": 2587} {"train_loss": -6.381282329559326, "global_step": 108686, "epoch": 2587} {"train_loss": -6.396697044372559, "global_step": 108687, "epoch": 2587} {"train_loss": -6.572603225708008, "global_step": 108688, "epoch": 2587} {"train_loss": -6.450282096862793, "global_step": 108689, "epoch": 2587} {"train_loss": -6.422534465789795, "global_step": 108690, "epoch": 2587} {"train_loss": -6.527385711669922, "global_step": 108691, "epoch": 2587} {"train_loss": -6.385837554931641, "global_step": 108692, "epoch": 2587} {"train_loss": -6.416046142578125, "global_step": 108693, "epoch": 2587} {"train_loss": -6.442183017730713, "global_step": 108694, "epoch": 2587} {"train_loss": -6.458643016361055, "global_step": 108695, "epoch": 2587, "val_loss": 76166.1015625} {"train_loss": -6.412282943725586, "global_step": 108696, "epoch": 2588} {"train_loss": -6.396085739135742, "global_step": 108697, "epoch": 2588} {"train_loss": -6.480202674865723, "global_step": 108698, "epoch": 2588} {"train_loss": -6.462989807128906, "global_step": 108699, "epoch": 2588} {"train_loss": -6.370031356811523, "global_step": 108700, "epoch": 2588} {"train_loss": -6.454465866088867, "global_step": 108701, "epoch": 2588} {"train_loss": -6.400269508361816, "global_step": 108702, "epoch": 2588} {"train_loss": -6.4468793869018555, "global_step": 108703, "epoch": 2588} {"train_loss": -6.401503562927246, "global_step": 108704, "epoch": 2588} {"train_loss": -6.428027153015137, "global_step": 108705, "epoch": 2588} {"train_loss": -6.406344413757324, "global_step": 108706, "epoch": 2588} {"train_loss": -6.399548530578613, "global_step": 108707, "epoch": 2588} {"train_loss": -6.355809688568115, "global_step": 108708, "epoch": 2588} {"train_loss": -6.457091331481934, "global_step": 108709, "epoch": 2588} {"train_loss": -6.407204627990723, "global_step": 108710, "epoch": 2588} {"train_loss": -6.421265602111816, "global_step": 108711, "epoch": 2588} {"train_loss": -6.446323394775391, "global_step": 108712, "epoch": 2588} {"train_loss": -6.449960708618164, "global_step": 108713, "epoch": 2588} {"train_loss": -6.420165538787842, "global_step": 108714, "epoch": 2588} {"train_loss": -6.296964645385742, "global_step": 108715, "epoch": 2588} {"train_loss": -6.305716514587402, "global_step": 108716, "epoch": 2588} {"train_loss": -6.416567325592041, "global_step": 108717, "epoch": 2588} {"train_loss": -6.467301368713379, "global_step": 108718, "epoch": 2588} {"train_loss": -6.412639617919922, "global_step": 108719, "epoch": 2588} {"train_loss": -6.413744926452637, "global_step": 108720, "epoch": 2588} {"train_loss": -6.507441520690918, "global_step": 108721, "epoch": 2588} {"train_loss": -6.518057823181152, "global_step": 108722, "epoch": 2588} {"train_loss": -6.469803333282471, "global_step": 108723, "epoch": 2588} {"train_loss": -6.497814178466797, "global_step": 108724, "epoch": 2588} {"train_loss": -6.3591718673706055, "global_step": 108725, "epoch": 2588} {"train_loss": -6.484480857849121, "global_step": 108726, "epoch": 2588} {"train_loss": -6.335115432739258, "global_step": 108727, "epoch": 2588} {"train_loss": -6.446115493774414, "global_step": 108728, "epoch": 2588} {"train_loss": -6.311676025390625, "global_step": 108729, "epoch": 2588} {"train_loss": -6.3198089599609375, "global_step": 108730, "epoch": 2588} {"train_loss": -6.509552001953125, "global_step": 108731, "epoch": 2588} {"train_loss": -6.345178604125977, "global_step": 108732, "epoch": 2588} {"train_loss": -6.375086784362793, "global_step": 108733, "epoch": 2588} {"train_loss": -6.2979936599731445, "global_step": 108734, "epoch": 2588} {"train_loss": -6.449335098266602, "global_step": 108735, "epoch": 2588} {"train_loss": -6.285293102264404, "global_step": 108736, "epoch": 2588} {"train_loss": -6.409308501652309, "global_step": 108737, "epoch": 2588, "val_loss": 76315.1640625} {"train_loss": -6.35286808013916, "global_step": 108738, "epoch": 2589} {"train_loss": -6.250333786010742, "global_step": 108739, "epoch": 2589} {"train_loss": -6.397980690002441, "global_step": 108740, "epoch": 2589} {"train_loss": -6.264096260070801, "global_step": 108741, "epoch": 2589} {"train_loss": -6.4500651359558105, "global_step": 108742, "epoch": 2589} {"train_loss": -6.184405326843262, "global_step": 108743, "epoch": 2589} {"train_loss": -6.401182174682617, "global_step": 108744, "epoch": 2589} {"train_loss": -6.226795196533203, "global_step": 108745, "epoch": 2589} {"train_loss": -6.399471282958984, "global_step": 108746, "epoch": 2589} {"train_loss": -6.4717912673950195, "global_step": 108747, "epoch": 2589} {"train_loss": -6.44189977645874, "global_step": 108748, "epoch": 2589} {"train_loss": -6.415176868438721, "global_step": 108749, "epoch": 2589} {"train_loss": -6.386534690856934, "global_step": 108750, "epoch": 2589} {"train_loss": -6.358245372772217, "global_step": 108751, "epoch": 2589} {"train_loss": -6.419302940368652, "global_step": 108752, "epoch": 2589} {"train_loss": -6.3924150466918945, "global_step": 108753, "epoch": 2589} {"train_loss": -6.403347969055176, "global_step": 108754, "epoch": 2589} {"train_loss": -6.426840782165527, "global_step": 108755, "epoch": 2589} {"train_loss": -6.345883369445801, "global_step": 108756, "epoch": 2589} {"train_loss": -6.451032638549805, "global_step": 108757, "epoch": 2589} {"train_loss": -6.438432216644287, "global_step": 108758, "epoch": 2589} {"train_loss": -6.49682092666626, "global_step": 108759, "epoch": 2589} {"train_loss": -6.617283821105957, "global_step": 108760, "epoch": 2589} {"train_loss": -6.48844051361084, "global_step": 108761, "epoch": 2589} {"train_loss": -6.373331069946289, "global_step": 108762, "epoch": 2589} {"train_loss": -6.593246936798096, "global_step": 108763, "epoch": 2589} {"train_loss": -6.490381240844727, "global_step": 108764, "epoch": 2589} {"train_loss": -6.499857425689697, "global_step": 108765, "epoch": 2589} {"train_loss": -6.528796195983887, "global_step": 108766, "epoch": 2589} {"train_loss": -6.413315773010254, "global_step": 108767, "epoch": 2589} {"train_loss": -6.5034942626953125, "global_step": 108768, "epoch": 2589} {"train_loss": -6.557379722595215, "global_step": 108769, "epoch": 2589} {"train_loss": -6.5941057205200195, "global_step": 108770, "epoch": 2589} {"train_loss": -6.349020481109619, "global_step": 108771, "epoch": 2589} {"train_loss": -6.510392189025879, "global_step": 108772, "epoch": 2589} {"train_loss": -6.3514862060546875, "global_step": 108773, "epoch": 2589} {"train_loss": -6.318262100219727, "global_step": 108774, "epoch": 2589} {"train_loss": -6.3940229415893555, "global_step": 108775, "epoch": 2589} {"train_loss": -6.513771057128906, "global_step": 108776, "epoch": 2589} {"train_loss": -6.455602645874023, "global_step": 108777, "epoch": 2589} {"train_loss": -6.259446144104004, "global_step": 108778, "epoch": 2589} {"train_loss": -6.423844916479928, "global_step": 108779, "epoch": 2589, "val_loss": 76729.96875} {"train_loss": -6.383266448974609, "global_step": 108780, "epoch": 2590} {"train_loss": -6.479299545288086, "global_step": 108781, "epoch": 2590} {"train_loss": -6.401205062866211, "global_step": 108782, "epoch": 2590} {"train_loss": -6.401512145996094, "global_step": 108783, "epoch": 2590} {"train_loss": -6.474958419799805, "global_step": 108784, "epoch": 2590} {"train_loss": -6.3991851806640625, "global_step": 108785, "epoch": 2590} {"train_loss": -6.496775150299072, "global_step": 108786, "epoch": 2590} {"train_loss": -6.5180511474609375, "global_step": 108787, "epoch": 2590} {"train_loss": -6.456395149230957, "global_step": 108788, "epoch": 2590} {"train_loss": -6.44594669342041, "global_step": 108789, "epoch": 2590} {"train_loss": -6.361766338348389, "global_step": 108790, "epoch": 2590} {"train_loss": -6.497153282165527, "global_step": 108791, "epoch": 2590} {"train_loss": -6.478532791137695, "global_step": 108792, "epoch": 2590} {"train_loss": -6.394209384918213, "global_step": 108793, "epoch": 2590} {"train_loss": -6.472354412078857, "global_step": 108794, "epoch": 2590} {"train_loss": -6.526783466339111, "global_step": 108795, "epoch": 2590} {"train_loss": -6.508444786071777, "global_step": 108796, "epoch": 2590} {"train_loss": -6.423727035522461, "global_step": 108797, "epoch": 2590} {"train_loss": -6.484708309173584, "global_step": 108798, "epoch": 2590} {"train_loss": -6.503252029418945, "global_step": 108799, "epoch": 2590} {"train_loss": -6.343613624572754, "global_step": 108800, "epoch": 2590} {"train_loss": -6.454267501831055, "global_step": 108801, "epoch": 2590} {"train_loss": -6.521399021148682, "global_step": 108802, "epoch": 2590} {"train_loss": -6.480142593383789, "global_step": 108803, "epoch": 2590} {"train_loss": -6.4664506912231445, "global_step": 108804, "epoch": 2590} {"train_loss": -6.420550346374512, "global_step": 108805, "epoch": 2590} {"train_loss": -6.451563358306885, "global_step": 108806, "epoch": 2590} {"train_loss": -6.443580150604248, "global_step": 108807, "epoch": 2590} {"train_loss": -6.448240280151367, "global_step": 108808, "epoch": 2590} {"train_loss": -6.592476844787598, "global_step": 108809, "epoch": 2590} {"train_loss": -6.499570369720459, "global_step": 108810, "epoch": 2590} {"train_loss": -6.314093589782715, "global_step": 108811, "epoch": 2590} {"train_loss": -6.5268964767456055, "global_step": 108812, "epoch": 2590} {"train_loss": -6.407847881317139, "global_step": 108813, "epoch": 2590} {"train_loss": -6.406494140625, "global_step": 108814, "epoch": 2590} {"train_loss": -6.389619827270508, "global_step": 108815, "epoch": 2590} {"train_loss": -6.502812385559082, "global_step": 108816, "epoch": 2590} {"train_loss": -6.475986957550049, "global_step": 108817, "epoch": 2590} {"train_loss": -6.512628555297852, "global_step": 108818, "epoch": 2590} {"train_loss": -6.4192423820495605, "global_step": 108819, "epoch": 2590} {"train_loss": -6.4346923828125, "global_step": 108820, "epoch": 2590} {"train_loss": -6.4518612793513705, "global_step": 108821, "epoch": 2590, "val_loss": 76489.640625} {"train_loss": -6.39914608001709, "global_step": 108822, "epoch": 2591} {"train_loss": -6.42779541015625, "global_step": 108823, "epoch": 2591} {"train_loss": -6.41328239440918, "global_step": 108824, "epoch": 2591} {"train_loss": -6.382389068603516, "global_step": 108825, "epoch": 2591} {"train_loss": -6.420321464538574, "global_step": 108826, "epoch": 2591} {"train_loss": -6.451755046844482, "global_step": 108827, "epoch": 2591} {"train_loss": -6.435307502746582, "global_step": 108828, "epoch": 2591} {"train_loss": -6.517354965209961, "global_step": 108829, "epoch": 2591} {"train_loss": -6.42021369934082, "global_step": 108830, "epoch": 2591} {"train_loss": -6.451311111450195, "global_step": 108831, "epoch": 2591} {"train_loss": -6.375178337097168, "global_step": 108832, "epoch": 2591} {"train_loss": -6.406085014343262, "global_step": 108833, "epoch": 2591} {"train_loss": -6.564083099365234, "global_step": 108834, "epoch": 2591} {"train_loss": -6.493557453155518, "global_step": 108835, "epoch": 2591} {"train_loss": -6.400095462799072, "global_step": 108836, "epoch": 2591} {"train_loss": -6.428735256195068, "global_step": 108837, "epoch": 2591} {"train_loss": -6.509091854095459, "global_step": 108838, "epoch": 2591} {"train_loss": -6.4701995849609375, "global_step": 108839, "epoch": 2591} {"train_loss": -6.503627300262451, "global_step": 108840, "epoch": 2591} {"train_loss": -6.420676231384277, "global_step": 108841, "epoch": 2591} {"train_loss": -6.555747985839844, "global_step": 108842, "epoch": 2591} {"train_loss": -6.525665283203125, "global_step": 108843, "epoch": 2591} {"train_loss": -6.421145439147949, "global_step": 108844, "epoch": 2591} {"train_loss": -6.364689826965332, "global_step": 108845, "epoch": 2591} {"train_loss": -6.3791728019714355, "global_step": 108846, "epoch": 2591} {"train_loss": -6.511081695556641, "global_step": 108847, "epoch": 2591} {"train_loss": -6.40029764175415, "global_step": 108848, "epoch": 2591} {"train_loss": -6.294805526733398, "global_step": 108849, "epoch": 2591} {"train_loss": -6.416934013366699, "global_step": 108850, "epoch": 2591} {"train_loss": -6.456036567687988, "global_step": 108851, "epoch": 2591} {"train_loss": -6.516415596008301, "global_step": 108852, "epoch": 2591} {"train_loss": -6.387151718139648, "global_step": 108853, "epoch": 2591} {"train_loss": -6.364589214324951, "global_step": 108854, "epoch": 2591} {"train_loss": -6.3215227127075195, "global_step": 108855, "epoch": 2591} {"train_loss": -6.416520595550537, "global_step": 108856, "epoch": 2591} {"train_loss": -6.326105117797852, "global_step": 108857, "epoch": 2591} {"train_loss": -6.429708480834961, "global_step": 108858, "epoch": 2591} {"train_loss": -6.3847856521606445, "global_step": 108859, "epoch": 2591} {"train_loss": -6.454357147216797, "global_step": 108860, "epoch": 2591} {"train_loss": -6.458341598510742, "global_step": 108861, "epoch": 2591} {"train_loss": -6.442025661468506, "global_step": 108862, "epoch": 2591} {"train_loss": -6.432197559447515, "global_step": 108863, "epoch": 2591, "val_loss": 76224.375} {"train_loss": -6.533061981201172, "global_step": 108864, "epoch": 2592} {"train_loss": -6.504279613494873, "global_step": 108865, "epoch": 2592} {"train_loss": -6.52888298034668, "global_step": 108866, "epoch": 2592} {"train_loss": -6.390532970428467, "global_step": 108867, "epoch": 2592} {"train_loss": -6.458072185516357, "global_step": 108868, "epoch": 2592} {"train_loss": -6.46035623550415, "global_step": 108869, "epoch": 2592} {"train_loss": -6.503674030303955, "global_step": 108870, "epoch": 2592} {"train_loss": -6.561166763305664, "global_step": 108871, "epoch": 2592} {"train_loss": -6.5198750495910645, "global_step": 108872, "epoch": 2592} {"train_loss": -6.615663051605225, "global_step": 108873, "epoch": 2592} {"train_loss": -6.51659631729126, "global_step": 108874, "epoch": 2592} {"train_loss": -6.423340320587158, "global_step": 108875, "epoch": 2592} {"train_loss": -6.430735111236572, "global_step": 108876, "epoch": 2592} {"train_loss": -6.474442958831787, "global_step": 108877, "epoch": 2592} {"train_loss": -6.413784027099609, "global_step": 108878, "epoch": 2592} {"train_loss": -6.494146823883057, "global_step": 108879, "epoch": 2592} {"train_loss": -6.307280540466309, "global_step": 108880, "epoch": 2592} {"train_loss": -6.353243350982666, "global_step": 108881, "epoch": 2592} {"train_loss": -6.396248817443848, "global_step": 108882, "epoch": 2592} {"train_loss": -6.247737884521484, "global_step": 108883, "epoch": 2592} {"train_loss": -6.545827388763428, "global_step": 108884, "epoch": 2592} {"train_loss": -6.453714370727539, "global_step": 108885, "epoch": 2592} {"train_loss": -6.308449745178223, "global_step": 108886, "epoch": 2592} {"train_loss": -6.4339599609375, "global_step": 108887, "epoch": 2592} {"train_loss": -6.521777153015137, "global_step": 108888, "epoch": 2592} {"train_loss": -6.392507553100586, "global_step": 108889, "epoch": 2592} {"train_loss": -6.450296401977539, "global_step": 108890, "epoch": 2592} {"train_loss": -6.400091171264648, "global_step": 108891, "epoch": 2592} {"train_loss": -6.507994651794434, "global_step": 108892, "epoch": 2592} {"train_loss": -6.388832092285156, "global_step": 108893, "epoch": 2592} {"train_loss": -6.387810707092285, "global_step": 108894, "epoch": 2592} {"train_loss": -6.3996381759643555, "global_step": 108895, "epoch": 2592} {"train_loss": -6.336328506469727, "global_step": 108896, "epoch": 2592} {"train_loss": -6.393296241760254, "global_step": 108897, "epoch": 2592} {"train_loss": -6.319165229797363, "global_step": 108898, "epoch": 2592} {"train_loss": -6.496630668640137, "global_step": 108899, "epoch": 2592} {"train_loss": -6.384082794189453, "global_step": 108900, "epoch": 2592} {"train_loss": -6.372412204742432, "global_step": 108901, "epoch": 2592} {"train_loss": -6.492048263549805, "global_step": 108902, "epoch": 2592} {"train_loss": -6.510339260101318, "global_step": 108903, "epoch": 2592} {"train_loss": -6.458433628082275, "global_step": 108904, "epoch": 2592} {"train_loss": -6.440783205486479, "global_step": 108905, "epoch": 2592, "val_loss": 75975.1953125} {"train_loss": -6.411684989929199, "global_step": 108906, "epoch": 2593} {"train_loss": -6.428528308868408, "global_step": 108907, "epoch": 2593} {"train_loss": -6.393459320068359, "global_step": 108908, "epoch": 2593} {"train_loss": -6.389125823974609, "global_step": 108909, "epoch": 2593} {"train_loss": -6.3836445808410645, "global_step": 108910, "epoch": 2593} {"train_loss": -6.40605354309082, "global_step": 108911, "epoch": 2593} {"train_loss": -6.473238945007324, "global_step": 108912, "epoch": 2593} {"train_loss": -6.4469451904296875, "global_step": 108913, "epoch": 2593} {"train_loss": -6.5163164138793945, "global_step": 108914, "epoch": 2593} {"train_loss": -6.418411731719971, "global_step": 108915, "epoch": 2593} {"train_loss": -6.4748969078063965, "global_step": 108916, "epoch": 2593} {"train_loss": -6.410548686981201, "global_step": 108917, "epoch": 2593} {"train_loss": -6.530069351196289, "global_step": 108918, "epoch": 2593} {"train_loss": -6.433012962341309, "global_step": 108919, "epoch": 2593} {"train_loss": -6.463581562042236, "global_step": 108920, "epoch": 2593} {"train_loss": -6.420551300048828, "global_step": 108921, "epoch": 2593} {"train_loss": -6.511519432067871, "global_step": 108922, "epoch": 2593} {"train_loss": -6.39247989654541, "global_step": 108923, "epoch": 2593} {"train_loss": -6.357886791229248, "global_step": 108924, "epoch": 2593} {"train_loss": -6.474254608154297, "global_step": 108925, "epoch": 2593} {"train_loss": -6.525382041931152, "global_step": 108926, "epoch": 2593} {"train_loss": -6.427248954772949, "global_step": 108927, "epoch": 2593} {"train_loss": -6.460206985473633, "global_step": 108928, "epoch": 2593} {"train_loss": -6.40457010269165, "global_step": 108929, "epoch": 2593} {"train_loss": -6.414228916168213, "global_step": 108930, "epoch": 2593} {"train_loss": -6.519601821899414, "global_step": 108931, "epoch": 2593} {"train_loss": -6.502777099609375, "global_step": 108932, "epoch": 2593} {"train_loss": -6.434415817260742, "global_step": 108933, "epoch": 2593} {"train_loss": -6.601655960083008, "global_step": 108934, "epoch": 2593} {"train_loss": -6.548195838928223, "global_step": 108935, "epoch": 2593} {"train_loss": -6.477469444274902, "global_step": 108936, "epoch": 2593} {"train_loss": -6.561398506164551, "global_step": 108937, "epoch": 2593} {"train_loss": -6.685863971710205, "global_step": 108938, "epoch": 2593} {"train_loss": -6.44144868850708, "global_step": 108939, "epoch": 2593} {"train_loss": -6.416401386260986, "global_step": 108940, "epoch": 2593} {"train_loss": -6.462522506713867, "global_step": 108941, "epoch": 2593} {"train_loss": -6.392845153808594, "global_step": 108942, "epoch": 2593} {"train_loss": -6.441577434539795, "global_step": 108943, "epoch": 2593} {"train_loss": -6.428062438964844, "global_step": 108944, "epoch": 2593} {"train_loss": -6.472050666809082, "global_step": 108945, "epoch": 2593} {"train_loss": -6.480367183685303, "global_step": 108946, "epoch": 2593} {"train_loss": -6.457704544067383, "global_step": 108947, "epoch": 2593, "val_loss": 75880.828125} {"train_loss": -6.496013164520264, "global_step": 108948, "epoch": 2594} {"train_loss": -6.416433334350586, "global_step": 108949, "epoch": 2594} {"train_loss": -6.365521430969238, "global_step": 108950, "epoch": 2594} {"train_loss": -6.428353786468506, "global_step": 108951, "epoch": 2594} {"train_loss": -6.37885046005249, "global_step": 108952, "epoch": 2594} {"train_loss": -6.536498069763184, "global_step": 108953, "epoch": 2594} {"train_loss": -6.371098518371582, "global_step": 108954, "epoch": 2594} {"train_loss": -6.316492080688477, "global_step": 108955, "epoch": 2594} {"train_loss": -6.453059196472168, "global_step": 108956, "epoch": 2594} {"train_loss": -6.368305206298828, "global_step": 108957, "epoch": 2594} {"train_loss": -6.348860740661621, "global_step": 108958, "epoch": 2594} {"train_loss": -6.455224990844727, "global_step": 108959, "epoch": 2594} {"train_loss": -6.416539192199707, "global_step": 108960, "epoch": 2594} {"train_loss": -6.452415466308594, "global_step": 108961, "epoch": 2594} {"train_loss": -6.482348918914795, "global_step": 108962, "epoch": 2594} {"train_loss": -6.419503211975098, "global_step": 108963, "epoch": 2594} {"train_loss": -6.527592658996582, "global_step": 108964, "epoch": 2594} {"train_loss": -6.420117378234863, "global_step": 108965, "epoch": 2594} {"train_loss": -6.327417373657227, "global_step": 108966, "epoch": 2594} {"train_loss": -6.409302711486816, "global_step": 108967, "epoch": 2594} {"train_loss": -6.533987522125244, "global_step": 108968, "epoch": 2594} {"train_loss": -6.344696521759033, "global_step": 108969, "epoch": 2594} {"train_loss": -6.4305925369262695, "global_step": 108970, "epoch": 2594} {"train_loss": -6.388400077819824, "global_step": 108971, "epoch": 2594} {"train_loss": -6.426983833312988, "global_step": 108972, "epoch": 2594} {"train_loss": -6.377093315124512, "global_step": 108973, "epoch": 2594} {"train_loss": -6.4342780113220215, "global_step": 108974, "epoch": 2594} {"train_loss": -6.369338512420654, "global_step": 108975, "epoch": 2594} {"train_loss": -6.451026916503906, "global_step": 108976, "epoch": 2594} {"train_loss": -6.268144607543945, "global_step": 108977, "epoch": 2594} {"train_loss": -6.4631218910217285, "global_step": 108978, "epoch": 2594} {"train_loss": -6.404101848602295, "global_step": 108979, "epoch": 2594} {"train_loss": -6.449197769165039, "global_step": 108980, "epoch": 2594} {"train_loss": -6.43273401260376, "global_step": 108981, "epoch": 2594} {"train_loss": -6.246472358703613, "global_step": 108982, "epoch": 2594} {"train_loss": -6.336566925048828, "global_step": 108983, "epoch": 2594} {"train_loss": -6.4102373123168945, "global_step": 108984, "epoch": 2594} {"train_loss": -6.283235549926758, "global_step": 108985, "epoch": 2594} {"train_loss": -6.413791656494141, "global_step": 108986, "epoch": 2594} {"train_loss": -6.391785621643066, "global_step": 108987, "epoch": 2594} {"train_loss": -6.390139102935791, "global_step": 108988, "epoch": 2594} {"train_loss": -6.404222420283726, "global_step": 108989, "epoch": 2594, "val_loss": 76134.6875} {"train_loss": -6.455783843994141, "global_step": 108990, "epoch": 2595} {"train_loss": -6.412149429321289, "global_step": 108991, "epoch": 2595} {"train_loss": -6.307003498077393, "global_step": 108992, "epoch": 2595} {"train_loss": -6.521345138549805, "global_step": 108993, "epoch": 2595} {"train_loss": -6.415978908538818, "global_step": 108994, "epoch": 2595} {"train_loss": -6.45916748046875, "global_step": 108995, "epoch": 2595} {"train_loss": -6.396083831787109, "global_step": 108996, "epoch": 2595} {"train_loss": -6.545342922210693, "global_step": 108997, "epoch": 2595} {"train_loss": -6.509608745574951, "global_step": 108998, "epoch": 2595} {"train_loss": -6.491005897521973, "global_step": 108999, "epoch": 2595} {"train_loss": -6.265377044677734, "global_step": 109000, "epoch": 2595} {"train_loss": -6.526247501373291, "global_step": 109001, "epoch": 2595} {"train_loss": -6.428356647491455, "global_step": 109002, "epoch": 2595} {"train_loss": -6.435842514038086, "global_step": 109003, "epoch": 2595} {"train_loss": -6.350580215454102, "global_step": 109004, "epoch": 2595} {"train_loss": -6.464986801147461, "global_step": 109005, "epoch": 2595} {"train_loss": -6.415248870849609, "global_step": 109006, "epoch": 2595} {"train_loss": -6.270336151123047, "global_step": 109007, "epoch": 2595} {"train_loss": -6.4548540115356445, "global_step": 109008, "epoch": 2595} {"train_loss": -6.324031352996826, "global_step": 109009, "epoch": 2595} {"train_loss": -6.406352996826172, "global_step": 109010, "epoch": 2595} {"train_loss": -6.345879554748535, "global_step": 109011, "epoch": 2595} {"train_loss": -6.353755950927734, "global_step": 109012, "epoch": 2595} {"train_loss": -6.315975666046143, "global_step": 109013, "epoch": 2595} {"train_loss": -6.4367899894714355, "global_step": 109014, "epoch": 2595} {"train_loss": -6.381516456604004, "global_step": 109015, "epoch": 2595} {"train_loss": -6.434572219848633, "global_step": 109016, "epoch": 2595} {"train_loss": -6.412954330444336, "global_step": 109017, "epoch": 2595} {"train_loss": -6.472850799560547, "global_step": 109018, "epoch": 2595} {"train_loss": -6.4508585929870605, "global_step": 109019, "epoch": 2595} {"train_loss": -6.315420150756836, "global_step": 109020, "epoch": 2595} {"train_loss": -6.326068878173828, "global_step": 109021, "epoch": 2595} {"train_loss": -6.409520149230957, "global_step": 109022, "epoch": 2595} {"train_loss": -6.367969512939453, "global_step": 109023, "epoch": 2595} {"train_loss": -6.479351997375488, "global_step": 109024, "epoch": 2595} {"train_loss": -6.4098968505859375, "global_step": 109025, "epoch": 2595} {"train_loss": -6.337664604187012, "global_step": 109026, "epoch": 2595} {"train_loss": -6.3403143882751465, "global_step": 109027, "epoch": 2595} {"train_loss": -6.427546977996826, "global_step": 109028, "epoch": 2595} {"train_loss": -6.4009552001953125, "global_step": 109029, "epoch": 2595} {"train_loss": -6.407590866088867, "global_step": 109030, "epoch": 2595} {"train_loss": -6.408625580015636, "global_step": 109031, "epoch": 2595, "val_loss": 76592.3359375} {"train_loss": -6.3922929763793945, "global_step": 109032, "epoch": 2596} {"train_loss": -6.406089782714844, "global_step": 109033, "epoch": 2596} {"train_loss": -6.465970993041992, "global_step": 109034, "epoch": 2596} {"train_loss": -6.353976726531982, "global_step": 109035, "epoch": 2596} {"train_loss": -6.533784866333008, "global_step": 109036, "epoch": 2596} {"train_loss": -6.347562789916992, "global_step": 109037, "epoch": 2596} {"train_loss": -6.41660213470459, "global_step": 109038, "epoch": 2596} {"train_loss": -6.451635837554932, "global_step": 109039, "epoch": 2596} {"train_loss": -6.388225555419922, "global_step": 109040, "epoch": 2596} {"train_loss": -6.4773406982421875, "global_step": 109041, "epoch": 2596} {"train_loss": -6.480738639831543, "global_step": 109042, "epoch": 2596} {"train_loss": -6.386930465698242, "global_step": 109043, "epoch": 2596} {"train_loss": -6.479432106018066, "global_step": 109044, "epoch": 2596} {"train_loss": -6.424359321594238, "global_step": 109045, "epoch": 2596} {"train_loss": -6.461699485778809, "global_step": 109046, "epoch": 2596} {"train_loss": -6.38070011138916, "global_step": 109047, "epoch": 2596} {"train_loss": -6.340209484100342, "global_step": 109048, "epoch": 2596} {"train_loss": -6.463396072387695, "global_step": 109049, "epoch": 2596} {"train_loss": -6.388009548187256, "global_step": 109050, "epoch": 2596} {"train_loss": -6.4037628173828125, "global_step": 109051, "epoch": 2596} {"train_loss": -6.351363182067871, "global_step": 109052, "epoch": 2596} {"train_loss": -6.406522750854492, "global_step": 109053, "epoch": 2596} {"train_loss": -6.437326908111572, "global_step": 109054, "epoch": 2596} {"train_loss": -6.418404579162598, "global_step": 109055, "epoch": 2596} {"train_loss": -6.375129699707031, "global_step": 109056, "epoch": 2596} {"train_loss": -6.372654914855957, "global_step": 109057, "epoch": 2596} {"train_loss": -6.3865556716918945, "global_step": 109058, "epoch": 2596} {"train_loss": -6.365302085876465, "global_step": 109059, "epoch": 2596} {"train_loss": -6.490592956542969, "global_step": 109060, "epoch": 2596} {"train_loss": -6.310741424560547, "global_step": 109061, "epoch": 2596} {"train_loss": -6.487713813781738, "global_step": 109062, "epoch": 2596} {"train_loss": -6.338398456573486, "global_step": 109063, "epoch": 2596} {"train_loss": -6.446907043457031, "global_step": 109064, "epoch": 2596} {"train_loss": -6.497100830078125, "global_step": 109065, "epoch": 2596} {"train_loss": -6.426721572875977, "global_step": 109066, "epoch": 2596} {"train_loss": -6.542880058288574, "global_step": 109067, "epoch": 2596} {"train_loss": -6.468905448913574, "global_step": 109068, "epoch": 2596} {"train_loss": -6.563594818115234, "global_step": 109069, "epoch": 2596} {"train_loss": -6.419003963470459, "global_step": 109070, "epoch": 2596} {"train_loss": -6.457849502563477, "global_step": 109071, "epoch": 2596} {"train_loss": -6.373313903808594, "global_step": 109072, "epoch": 2596} {"train_loss": -6.423890068417504, "global_step": 109073, "epoch": 2596, "val_loss": 76468.8125} {"train_loss": -6.468536376953125, "global_step": 109074, "epoch": 2597} {"train_loss": -6.476279258728027, "global_step": 109075, "epoch": 2597} {"train_loss": -6.576535224914551, "global_step": 109076, "epoch": 2597} {"train_loss": -6.409618377685547, "global_step": 109077, "epoch": 2597} {"train_loss": -6.400850296020508, "global_step": 109078, "epoch": 2597} {"train_loss": -6.496804237365723, "global_step": 109079, "epoch": 2597} {"train_loss": -6.557722091674805, "global_step": 109080, "epoch": 2597} {"train_loss": -6.464812278747559, "global_step": 109081, "epoch": 2597} {"train_loss": -6.260031223297119, "global_step": 109082, "epoch": 2597} {"train_loss": -6.438941955566406, "global_step": 109083, "epoch": 2597} {"train_loss": -6.3776774406433105, "global_step": 109084, "epoch": 2597} {"train_loss": -6.465217590332031, "global_step": 109085, "epoch": 2597} {"train_loss": -6.414650917053223, "global_step": 109086, "epoch": 2597} {"train_loss": -6.365128517150879, "global_step": 109087, "epoch": 2597} {"train_loss": -6.477663040161133, "global_step": 109088, "epoch": 2597} {"train_loss": -6.553808212280273, "global_step": 109089, "epoch": 2597} {"train_loss": -6.434312343597412, "global_step": 109090, "epoch": 2597} {"train_loss": -6.518104553222656, "global_step": 109091, "epoch": 2597} {"train_loss": -6.490818023681641, "global_step": 109092, "epoch": 2597} {"train_loss": -6.432437419891357, "global_step": 109093, "epoch": 2597} {"train_loss": -6.503786563873291, "global_step": 109094, "epoch": 2597} {"train_loss": -6.243398666381836, "global_step": 109095, "epoch": 2597} {"train_loss": -6.511785507202148, "global_step": 109096, "epoch": 2597} {"train_loss": -6.370195388793945, "global_step": 109097, "epoch": 2597} {"train_loss": -6.425948143005371, "global_step": 109098, "epoch": 2597} {"train_loss": -6.461440086364746, "global_step": 109099, "epoch": 2597} {"train_loss": -6.485299587249756, "global_step": 109100, "epoch": 2597} {"train_loss": -6.53589391708374, "global_step": 109101, "epoch": 2597} {"train_loss": -6.390793323516846, "global_step": 109102, "epoch": 2597} {"train_loss": -6.580889701843262, "global_step": 109103, "epoch": 2597} {"train_loss": -6.46940803527832, "global_step": 109104, "epoch": 2597} {"train_loss": -6.533280372619629, "global_step": 109105, "epoch": 2597} {"train_loss": -6.463929653167725, "global_step": 109106, "epoch": 2597} {"train_loss": -6.517782211303711, "global_step": 109107, "epoch": 2597} {"train_loss": -6.422576904296875, "global_step": 109108, "epoch": 2597} {"train_loss": -6.451392650604248, "global_step": 109109, "epoch": 2597} {"train_loss": -6.5290679931640625, "global_step": 109110, "epoch": 2597} {"train_loss": -6.528493881225586, "global_step": 109111, "epoch": 2597} {"train_loss": -6.4287309646606445, "global_step": 109112, "epoch": 2597} {"train_loss": -6.311389923095703, "global_step": 109113, "epoch": 2597} {"train_loss": -6.486061096191406, "global_step": 109114, "epoch": 2597} {"train_loss": -6.455081655865624, "global_step": 109115, "epoch": 2597, "val_loss": 76419.46875} {"train_loss": -6.394275665283203, "global_step": 109116, "epoch": 2598} {"train_loss": -6.495687961578369, "global_step": 109117, "epoch": 2598} {"train_loss": -6.425938606262207, "global_step": 109118, "epoch": 2598} {"train_loss": -6.540946960449219, "global_step": 109119, "epoch": 2598} {"train_loss": -6.466628074645996, "global_step": 109120, "epoch": 2598} {"train_loss": -6.486303329467773, "global_step": 109121, "epoch": 2598} {"train_loss": -6.48963737487793, "global_step": 109122, "epoch": 2598} {"train_loss": -6.454606533050537, "global_step": 109123, "epoch": 2598} {"train_loss": -6.500912666320801, "global_step": 109124, "epoch": 2598} {"train_loss": -6.47211217880249, "global_step": 109125, "epoch": 2598} {"train_loss": -6.423529624938965, "global_step": 109126, "epoch": 2598} {"train_loss": -6.58597469329834, "global_step": 109127, "epoch": 2598} {"train_loss": -6.466754913330078, "global_step": 109128, "epoch": 2598} {"train_loss": -6.447074890136719, "global_step": 109129, "epoch": 2598} {"train_loss": -6.573854446411133, "global_step": 109130, "epoch": 2598} {"train_loss": -6.449010848999023, "global_step": 109131, "epoch": 2598} {"train_loss": -6.381429672241211, "global_step": 109132, "epoch": 2598} {"train_loss": -6.493800640106201, "global_step": 109133, "epoch": 2598} {"train_loss": -6.479108810424805, "global_step": 109134, "epoch": 2598} {"train_loss": -6.554291248321533, "global_step": 109135, "epoch": 2598} {"train_loss": -6.491977691650391, "global_step": 109136, "epoch": 2598} {"train_loss": -6.430246353149414, "global_step": 109137, "epoch": 2598} {"train_loss": -6.478524208068848, "global_step": 109138, "epoch": 2598} {"train_loss": -6.419755935668945, "global_step": 109139, "epoch": 2598} {"train_loss": -6.307650566101074, "global_step": 109140, "epoch": 2598} {"train_loss": -6.421635627746582, "global_step": 109141, "epoch": 2598} {"train_loss": -6.425408363342285, "global_step": 109142, "epoch": 2598} {"train_loss": -6.385343551635742, "global_step": 109143, "epoch": 2598} {"train_loss": -6.462674617767334, "global_step": 109144, "epoch": 2598} {"train_loss": -6.318819046020508, "global_step": 109145, "epoch": 2598} {"train_loss": -6.270693778991699, "global_step": 109146, "epoch": 2598} {"train_loss": -6.39998197555542, "global_step": 109147, "epoch": 2598} {"train_loss": -6.394163131713867, "global_step": 109148, "epoch": 2598} {"train_loss": -6.326904296875, "global_step": 109149, "epoch": 2598} {"train_loss": -6.370666027069092, "global_step": 109150, "epoch": 2598} {"train_loss": -6.268550395965576, "global_step": 109151, "epoch": 2598} {"train_loss": -6.353737831115723, "global_step": 109152, "epoch": 2598} {"train_loss": -6.370460033416748, "global_step": 109153, "epoch": 2598} {"train_loss": -6.485354900360107, "global_step": 109154, "epoch": 2598} {"train_loss": -6.4120965003967285, "global_step": 109155, "epoch": 2598} {"train_loss": -6.404513835906982, "global_step": 109156, "epoch": 2598} {"train_loss": -6.434012220019386, "global_step": 109157, "epoch": 2598, "val_loss": 75928.1015625} {"train_loss": -6.415541172027588, "global_step": 109158, "epoch": 2599} {"train_loss": -6.432195663452148, "global_step": 109159, "epoch": 2599} {"train_loss": -6.574756622314453, "global_step": 109160, "epoch": 2599} {"train_loss": -6.402108669281006, "global_step": 109161, "epoch": 2599} {"train_loss": -6.443857192993164, "global_step": 109162, "epoch": 2599} {"train_loss": -6.530665397644043, "global_step": 109163, "epoch": 2599} {"train_loss": -6.412775993347168, "global_step": 109164, "epoch": 2599} {"train_loss": -6.4585490226745605, "global_step": 109165, "epoch": 2599} {"train_loss": -6.407644271850586, "global_step": 109166, "epoch": 2599} {"train_loss": -6.448140621185303, "global_step": 109167, "epoch": 2599} {"train_loss": -6.476795196533203, "global_step": 109168, "epoch": 2599} {"train_loss": -6.417642593383789, "global_step": 109169, "epoch": 2599} {"train_loss": -6.444492340087891, "global_step": 109170, "epoch": 2599} {"train_loss": -6.536170959472656, "global_step": 109171, "epoch": 2599} {"train_loss": -6.315615653991699, "global_step": 109172, "epoch": 2599} {"train_loss": -6.3329315185546875, "global_step": 109173, "epoch": 2599} {"train_loss": -6.470599174499512, "global_step": 109174, "epoch": 2599} {"train_loss": -6.43534517288208, "global_step": 109175, "epoch": 2599} {"train_loss": -6.663077354431152, "global_step": 109176, "epoch": 2599} {"train_loss": -6.433396816253662, "global_step": 109177, "epoch": 2599} {"train_loss": -6.529420852661133, "global_step": 109178, "epoch": 2599} {"train_loss": -6.429025650024414, "global_step": 109179, "epoch": 2599} {"train_loss": -6.42852783203125, "global_step": 109180, "epoch": 2599} {"train_loss": -6.385029315948486, "global_step": 109181, "epoch": 2599} {"train_loss": -6.391414642333984, "global_step": 109182, "epoch": 2599} {"train_loss": -6.412139415740967, "global_step": 109183, "epoch": 2599} {"train_loss": -6.514181613922119, "global_step": 109184, "epoch": 2599} {"train_loss": -6.411854267120361, "global_step": 109185, "epoch": 2599} {"train_loss": -6.567250728607178, "global_step": 109186, "epoch": 2599} {"train_loss": -6.497877597808838, "global_step": 109187, "epoch": 2599} {"train_loss": -6.43483829498291, "global_step": 109188, "epoch": 2599} {"train_loss": -6.555262088775635, "global_step": 109189, "epoch": 2599} {"train_loss": -6.3784685134887695, "global_step": 109190, "epoch": 2599} {"train_loss": -6.443068027496338, "global_step": 109191, "epoch": 2599} {"train_loss": -6.445575714111328, "global_step": 109192, "epoch": 2599} {"train_loss": -6.390063285827637, "global_step": 109193, "epoch": 2599} {"train_loss": -6.448683738708496, "global_step": 109194, "epoch": 2599} {"train_loss": -6.5384840965271, "global_step": 109195, "epoch": 2599} {"train_loss": -6.479453086853027, "global_step": 109196, "epoch": 2599} {"train_loss": -6.51759147644043, "global_step": 109197, "epoch": 2599} {"train_loss": -6.538219928741455, "global_step": 109198, "epoch": 2599} {"train_loss": -6.455955232892718, "global_step": 109199, "epoch": 2599, "val_loss": 76159.7578125} {"train_loss": -6.5279693603515625, "global_step": 109200, "epoch": 2600} {"train_loss": -6.460004806518555, "global_step": 109201, "epoch": 2600} {"train_loss": -6.5395097732543945, "global_step": 109202, "epoch": 2600} {"train_loss": -6.445426940917969, "global_step": 109203, "epoch": 2600} {"train_loss": -6.393039226531982, "global_step": 109204, "epoch": 2600} {"train_loss": -6.421116828918457, "global_step": 109205, "epoch": 2600} {"train_loss": -6.436206817626953, "global_step": 109206, "epoch": 2600} {"train_loss": -6.4313836097717285, "global_step": 109207, "epoch": 2600} {"train_loss": -6.549714088439941, "global_step": 109208, "epoch": 2600} {"train_loss": -6.52078914642334, "global_step": 109209, "epoch": 2600} {"train_loss": -6.380218982696533, "global_step": 109210, "epoch": 2600} {"train_loss": -6.579937934875488, "global_step": 109211, "epoch": 2600} {"train_loss": -6.408729076385498, "global_step": 109212, "epoch": 2600} {"train_loss": -6.482173442840576, "global_step": 109213, "epoch": 2600} {"train_loss": -6.350838661193848, "global_step": 109214, "epoch": 2600} {"train_loss": -6.413463592529297, "global_step": 109215, "epoch": 2600} {"train_loss": -6.5198073387146, "global_step": 109216, "epoch": 2600} {"train_loss": -6.3946428298950195, "global_step": 109217, "epoch": 2600} {"train_loss": -6.4682793617248535, "global_step": 109218, "epoch": 2600} {"train_loss": -6.513696670532227, "global_step": 109219, "epoch": 2600} {"train_loss": -6.5269904136657715, "global_step": 109220, "epoch": 2600} {"train_loss": -6.49653959274292, "global_step": 109221, "epoch": 2600} {"train_loss": -6.560966491699219, "global_step": 109222, "epoch": 2600} {"train_loss": -6.491666793823242, "global_step": 109223, "epoch": 2600} {"train_loss": -6.348825931549072, "global_step": 109224, "epoch": 2600} {"train_loss": -6.473005294799805, "global_step": 109225, "epoch": 2600} {"train_loss": -6.386322975158691, "global_step": 109226, "epoch": 2600} {"train_loss": -6.248888969421387, "global_step": 109227, "epoch": 2600} {"train_loss": -6.502330780029297, "global_step": 109228, "epoch": 2600} {"train_loss": -6.458658218383789, "global_step": 109229, "epoch": 2600} {"train_loss": -6.429440498352051, "global_step": 109230, "epoch": 2600} {"train_loss": -6.383605480194092, "global_step": 109231, "epoch": 2600} {"train_loss": -6.461967468261719, "global_step": 109232, "epoch": 2600} {"train_loss": -6.495510101318359, "global_step": 109233, "epoch": 2600} {"train_loss": -6.329671859741211, "global_step": 109234, "epoch": 2600} {"train_loss": -6.418335914611816, "global_step": 109235, "epoch": 2600} {"train_loss": -6.327149868011475, "global_step": 109236, "epoch": 2600} {"train_loss": -6.444428443908691, "global_step": 109237, "epoch": 2600} {"train_loss": -6.462204933166504, "global_step": 109238, "epoch": 2600} {"train_loss": -6.439385414123535, "global_step": 109239, "epoch": 2600} {"train_loss": -6.426812171936035, "global_step": 109240, "epoch": 2600} {"train_loss": -6.449084032149542, "global_step": 109241, "epoch": 2600, "train/sim_max_reward_0": 0.8746294271440459, "train/sim_max_reward_1": 0.9030858846699332, "train/sim_max_reward_2": 0.444737982914116, "train/sim_max_reward_3": 0.13740947459733688, "train/sim_max_reward_4": 0.8974249487536372, "train/sim_max_reward_5": 0.9908811460249596, "test/sim_max_reward_4500000": 0.965267562172715, "test/sim_max_reward_4500001": 0.9489339170745, "test/sim_max_reward_4500002": 0.9155599745278116, "test/sim_max_reward_4500003": 0.9391177733159498, "test/sim_max_reward_4500004": 1.0, "test/sim_max_reward_4500005": 0.9582854010224603, "test/sim_max_reward_4500006": 0.9421163594240965, "test/sim_max_reward_4500007": 0.8536800012202886, "test/sim_max_reward_4500008": 0.25337162996860135, "test/sim_max_reward_4500009": 0.053459430171863886, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9450177288300209, "test/sim_max_reward_4500012": 0.9741757820594118, "test/sim_max_reward_4500013": 0.01424277595488135, "test/sim_max_reward_4500014": 0.9099534772618703, "test/sim_max_reward_4500015": 0.9703375476629731, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.1945851576627448, "test/sim_max_reward_4500018": 0.45809911909588436, "test/sim_max_reward_4500019": 0.8817365749820634, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9386648396668151, "test/sim_max_reward_4500022": 0.9731537945404408, "test/sim_max_reward_4500023": 0.9677657373005112, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9302228524878207, "test/sim_max_reward_4500026": 0.9249037076851307, "test/sim_max_reward_4500027": 0.8872908523843963, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.08009164159379285, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.910578712081344, "test/sim_max_reward_4500034": 0.6931042774379209, "test/sim_max_reward_4500035": 0.9582482806821515, "test/sim_max_reward_4500036": 0.9514196506230079, "test/sim_max_reward_4500037": 0.9346356947709723, "test/sim_max_reward_4500038": 0.8958323345413914, "test/sim_max_reward_4500039": 1.0, "test/sim_max_reward_4500040": 0.9985743642979232, "test/sim_max_reward_4500041": 0.41318337537160604, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.7543020373403139, "test/sim_max_reward_4500044": 0.15077329532886896, "test/sim_max_reward_4500045": 0.4027262577692619, "test/sim_max_reward_4500046": 0.8921704859350559, "test/sim_max_reward_4500047": 0.9574295580744493, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.7080281440173382, "test/mean_score": 0.6413536543884164, "val_loss": 76132.6484375} {"train_loss": -6.4329328536987305, "global_step": 109242, "epoch": 2601} {"train_loss": -6.51529598236084, "global_step": 109243, "epoch": 2601} {"train_loss": -6.533088684082031, "global_step": 109244, "epoch": 2601} {"train_loss": -6.490019798278809, "global_step": 109245, "epoch": 2601} {"train_loss": -6.537600517272949, "global_step": 109246, "epoch": 2601} {"train_loss": -6.403059005737305, "global_step": 109247, "epoch": 2601} {"train_loss": -6.506682395935059, "global_step": 109248, "epoch": 2601} {"train_loss": -6.607649326324463, "global_step": 109249, "epoch": 2601} {"train_loss": -6.391010284423828, "global_step": 109250, "epoch": 2601} {"train_loss": -6.530308723449707, "global_step": 109251, "epoch": 2601} {"train_loss": -6.574583053588867, "global_step": 109252, "epoch": 2601} {"train_loss": -6.375033378601074, "global_step": 109253, "epoch": 2601} {"train_loss": -6.444095134735107, "global_step": 109254, "epoch": 2601} {"train_loss": -6.541428565979004, "global_step": 109255, "epoch": 2601} {"train_loss": -6.49846076965332, "global_step": 109256, "epoch": 2601} {"train_loss": -6.528447151184082, "global_step": 109257, "epoch": 2601} {"train_loss": -6.472835540771484, "global_step": 109258, "epoch": 2601} {"train_loss": -6.458091735839844, "global_step": 109259, "epoch": 2601} {"train_loss": -6.425380706787109, "global_step": 109260, "epoch": 2601} {"train_loss": -6.552157878875732, "global_step": 109261, "epoch": 2601} {"train_loss": -6.454837799072266, "global_step": 109262, "epoch": 2601} {"train_loss": -6.39677619934082, "global_step": 109263, "epoch": 2601} {"train_loss": -6.625960350036621, "global_step": 109264, "epoch": 2601} {"train_loss": -6.52271842956543, "global_step": 109265, "epoch": 2601} {"train_loss": -6.489562034606934, "global_step": 109266, "epoch": 2601} {"train_loss": -6.447461128234863, "global_step": 109267, "epoch": 2601} {"train_loss": -6.548942565917969, "global_step": 109268, "epoch": 2601} {"train_loss": -6.422955513000488, "global_step": 109269, "epoch": 2601} {"train_loss": -6.4218363761901855, "global_step": 109270, "epoch": 2601} {"train_loss": -6.550584316253662, "global_step": 109271, "epoch": 2601} {"train_loss": -6.413937568664551, "global_step": 109272, "epoch": 2601} {"train_loss": -6.581954002380371, "global_step": 109273, "epoch": 2601} {"train_loss": -6.552337646484375, "global_step": 109274, "epoch": 2601} {"train_loss": -6.484015464782715, "global_step": 109275, "epoch": 2601} {"train_loss": -6.570943832397461, "global_step": 109276, "epoch": 2601} {"train_loss": -6.380597114562988, "global_step": 109277, "epoch": 2601} {"train_loss": -6.47821569442749, "global_step": 109278, "epoch": 2601} {"train_loss": -6.524625301361084, "global_step": 109279, "epoch": 2601} {"train_loss": -6.440067291259766, "global_step": 109280, "epoch": 2601} {"train_loss": -6.493483543395996, "global_step": 109281, "epoch": 2601} {"train_loss": -6.438360214233398, "global_step": 109282, "epoch": 2601} {"train_loss": -6.486531325748989, "global_step": 109283, "epoch": 2601, "val_loss": 76483.1640625} {"train_loss": -6.375796318054199, "global_step": 109284, "epoch": 2602} {"train_loss": -6.447026252746582, "global_step": 109285, "epoch": 2602} {"train_loss": -6.409470081329346, "global_step": 109286, "epoch": 2602} {"train_loss": -6.3543243408203125, "global_step": 109287, "epoch": 2602} {"train_loss": -6.479081630706787, "global_step": 109288, "epoch": 2602} {"train_loss": -6.518290042877197, "global_step": 109289, "epoch": 2602} {"train_loss": -6.429208755493164, "global_step": 109290, "epoch": 2602} {"train_loss": -6.477149963378906, "global_step": 109291, "epoch": 2602} {"train_loss": -6.391148090362549, "global_step": 109292, "epoch": 2602} {"train_loss": -6.3941650390625, "global_step": 109293, "epoch": 2602} {"train_loss": -6.474145889282227, "global_step": 109294, "epoch": 2602} {"train_loss": -6.392689228057861, "global_step": 109295, "epoch": 2602} {"train_loss": -6.467459678649902, "global_step": 109296, "epoch": 2602} {"train_loss": -6.494039058685303, "global_step": 109297, "epoch": 2602} {"train_loss": -6.4047627449035645, "global_step": 109298, "epoch": 2602} {"train_loss": -6.547863960266113, "global_step": 109299, "epoch": 2602} {"train_loss": -6.329071044921875, "global_step": 109300, "epoch": 2602} {"train_loss": -6.477597236633301, "global_step": 109301, "epoch": 2602} {"train_loss": -6.434945106506348, "global_step": 109302, "epoch": 2602} {"train_loss": -6.359992504119873, "global_step": 109303, "epoch": 2602} {"train_loss": -6.4574432373046875, "global_step": 109304, "epoch": 2602} {"train_loss": -6.4551100730896, "global_step": 109305, "epoch": 2602} {"train_loss": -6.543036460876465, "global_step": 109306, "epoch": 2602} {"train_loss": -6.509001731872559, "global_step": 109307, "epoch": 2602} {"train_loss": -6.633684158325195, "global_step": 109308, "epoch": 2602} {"train_loss": -6.3700666427612305, "global_step": 109309, "epoch": 2602} {"train_loss": -6.368740081787109, "global_step": 109310, "epoch": 2602} {"train_loss": -6.42827033996582, "global_step": 109311, "epoch": 2602} {"train_loss": -6.44807243347168, "global_step": 109312, "epoch": 2602} {"train_loss": -6.368485927581787, "global_step": 109313, "epoch": 2602} {"train_loss": -6.287943363189697, "global_step": 109314, "epoch": 2602} {"train_loss": -6.370718002319336, "global_step": 109315, "epoch": 2602} {"train_loss": -6.342532157897949, "global_step": 109316, "epoch": 2602} {"train_loss": -6.426817893981934, "global_step": 109317, "epoch": 2602} {"train_loss": -6.326411247253418, "global_step": 109318, "epoch": 2602} {"train_loss": -6.4020891189575195, "global_step": 109319, "epoch": 2602} {"train_loss": -6.403525352478027, "global_step": 109320, "epoch": 2602} {"train_loss": -6.497237205505371, "global_step": 109321, "epoch": 2602} {"train_loss": -6.344198226928711, "global_step": 109322, "epoch": 2602} {"train_loss": -6.490630626678467, "global_step": 109323, "epoch": 2602} {"train_loss": -6.372902870178223, "global_step": 109324, "epoch": 2602} {"train_loss": -6.428032682055519, "global_step": 109325, "epoch": 2602, "val_loss": 76195.2578125} {"train_loss": -6.404902458190918, "global_step": 109326, "epoch": 2603} {"train_loss": -6.532164573669434, "global_step": 109327, "epoch": 2603} {"train_loss": -6.445279121398926, "global_step": 109328, "epoch": 2603} {"train_loss": -6.44615364074707, "global_step": 109329, "epoch": 2603} {"train_loss": -6.360725402832031, "global_step": 109330, "epoch": 2603} {"train_loss": -6.40067195892334, "global_step": 109331, "epoch": 2603} {"train_loss": -6.524317741394043, "global_step": 109332, "epoch": 2603} {"train_loss": -6.441220283508301, "global_step": 109333, "epoch": 2603} {"train_loss": -6.457587242126465, "global_step": 109334, "epoch": 2603} {"train_loss": -6.444742202758789, "global_step": 109335, "epoch": 2603} {"train_loss": -6.47252082824707, "global_step": 109336, "epoch": 2603} {"train_loss": -6.428396701812744, "global_step": 109337, "epoch": 2603} {"train_loss": -6.4414238929748535, "global_step": 109338, "epoch": 2603} {"train_loss": -6.362095355987549, "global_step": 109339, "epoch": 2603} {"train_loss": -6.4929399490356445, "global_step": 109340, "epoch": 2603} {"train_loss": -6.479414463043213, "global_step": 109341, "epoch": 2603} {"train_loss": -6.496103286743164, "global_step": 109342, "epoch": 2603} {"train_loss": -6.428206443786621, "global_step": 109343, "epoch": 2603} {"train_loss": -6.410190105438232, "global_step": 109344, "epoch": 2603} {"train_loss": -6.428771018981934, "global_step": 109345, "epoch": 2603} {"train_loss": -6.530289649963379, "global_step": 109346, "epoch": 2603} {"train_loss": -6.322404861450195, "global_step": 109347, "epoch": 2603} {"train_loss": -6.551565170288086, "global_step": 109348, "epoch": 2603} {"train_loss": -6.474542617797852, "global_step": 109349, "epoch": 2603} {"train_loss": -6.405735969543457, "global_step": 109350, "epoch": 2603} {"train_loss": -6.507335662841797, "global_step": 109351, "epoch": 2603} {"train_loss": -6.4480299949646, "global_step": 109352, "epoch": 2603} {"train_loss": -6.485056400299072, "global_step": 109353, "epoch": 2603} {"train_loss": -6.448514938354492, "global_step": 109354, "epoch": 2603} {"train_loss": -6.52406644821167, "global_step": 109355, "epoch": 2603} {"train_loss": -6.579366683959961, "global_step": 109356, "epoch": 2603} {"train_loss": -6.513649940490723, "global_step": 109357, "epoch": 2603} {"train_loss": -6.464642524719238, "global_step": 109358, "epoch": 2603} {"train_loss": -6.544029235839844, "global_step": 109359, "epoch": 2603} {"train_loss": -6.612282752990723, "global_step": 109360, "epoch": 2603} {"train_loss": -6.458925247192383, "global_step": 109361, "epoch": 2603} {"train_loss": -6.5226287841796875, "global_step": 109362, "epoch": 2603} {"train_loss": -6.509109973907471, "global_step": 109363, "epoch": 2603} {"train_loss": -6.426253795623779, "global_step": 109364, "epoch": 2603} {"train_loss": -6.421857833862305, "global_step": 109365, "epoch": 2603} {"train_loss": -6.512648582458496, "global_step": 109366, "epoch": 2603} {"train_loss": -6.46792957896278, "global_step": 109367, "epoch": 2603, "val_loss": 76237.2734375} {"train_loss": -6.488000869750977, "global_step": 109368, "epoch": 2604} {"train_loss": -6.49981689453125, "global_step": 109369, "epoch": 2604} {"train_loss": -6.267226219177246, "global_step": 109370, "epoch": 2604} {"train_loss": -6.487720966339111, "global_step": 109371, "epoch": 2604} {"train_loss": -6.544678688049316, "global_step": 109372, "epoch": 2604} {"train_loss": -6.25374698638916, "global_step": 109373, "epoch": 2604} {"train_loss": -6.500879287719727, "global_step": 109374, "epoch": 2604} {"train_loss": -6.511444568634033, "global_step": 109375, "epoch": 2604} {"train_loss": -6.481453895568848, "global_step": 109376, "epoch": 2604} {"train_loss": -6.343698501586914, "global_step": 109377, "epoch": 2604} {"train_loss": -6.4837164878845215, "global_step": 109378, "epoch": 2604} {"train_loss": -6.338309288024902, "global_step": 109379, "epoch": 2604} {"train_loss": -6.523629665374756, "global_step": 109380, "epoch": 2604} {"train_loss": -6.319316864013672, "global_step": 109381, "epoch": 2604} {"train_loss": -6.312177658081055, "global_step": 109382, "epoch": 2604} {"train_loss": -6.478988170623779, "global_step": 109383, "epoch": 2604} {"train_loss": -6.442811489105225, "global_step": 109384, "epoch": 2604} {"train_loss": -6.412923812866211, "global_step": 109385, "epoch": 2604} {"train_loss": -6.4637346267700195, "global_step": 109386, "epoch": 2604} {"train_loss": -6.346126556396484, "global_step": 109387, "epoch": 2604} {"train_loss": -6.495187759399414, "global_step": 109388, "epoch": 2604} {"train_loss": -6.350805759429932, "global_step": 109389, "epoch": 2604} {"train_loss": -6.515598297119141, "global_step": 109390, "epoch": 2604} {"train_loss": -6.412075042724609, "global_step": 109391, "epoch": 2604} {"train_loss": -6.529151439666748, "global_step": 109392, "epoch": 2604} {"train_loss": -6.458288192749023, "global_step": 109393, "epoch": 2604} {"train_loss": -6.470682621002197, "global_step": 109394, "epoch": 2604} {"train_loss": -6.56794548034668, "global_step": 109395, "epoch": 2604} {"train_loss": -6.5062479972839355, "global_step": 109396, "epoch": 2604} {"train_loss": -6.39592170715332, "global_step": 109397, "epoch": 2604} {"train_loss": -6.454690933227539, "global_step": 109398, "epoch": 2604} {"train_loss": -6.457926273345947, "global_step": 109399, "epoch": 2604} {"train_loss": -6.512842178344727, "global_step": 109400, "epoch": 2604} {"train_loss": -6.298879623413086, "global_step": 109401, "epoch": 2604} {"train_loss": -6.473514556884766, "global_step": 109402, "epoch": 2604} {"train_loss": -6.4344401359558105, "global_step": 109403, "epoch": 2604} {"train_loss": -6.508807182312012, "global_step": 109404, "epoch": 2604} {"train_loss": -6.550385475158691, "global_step": 109405, "epoch": 2604} {"train_loss": -6.544750213623047, "global_step": 109406, "epoch": 2604} {"train_loss": -6.504972457885742, "global_step": 109407, "epoch": 2604} {"train_loss": -6.431098461151123, "global_step": 109408, "epoch": 2604} {"train_loss": -6.4492592470986505, "global_step": 109409, "epoch": 2604, "val_loss": 75990.9375} {"train_loss": -6.492467403411865, "global_step": 109410, "epoch": 2605} {"train_loss": -6.528933525085449, "global_step": 109411, "epoch": 2605} {"train_loss": -6.495552062988281, "global_step": 109412, "epoch": 2605} {"train_loss": -6.5849080085754395, "global_step": 109413, "epoch": 2605} {"train_loss": -6.405977249145508, "global_step": 109414, "epoch": 2605} {"train_loss": -6.484155178070068, "global_step": 109415, "epoch": 2605} {"train_loss": -6.4476470947265625, "global_step": 109416, "epoch": 2605} {"train_loss": -6.573266506195068, "global_step": 109417, "epoch": 2605} {"train_loss": -6.612321853637695, "global_step": 109418, "epoch": 2605} {"train_loss": -6.533336639404297, "global_step": 109419, "epoch": 2605} {"train_loss": -6.4630937576293945, "global_step": 109420, "epoch": 2605} {"train_loss": -6.4576215744018555, "global_step": 109421, "epoch": 2605} {"train_loss": -6.518060684204102, "global_step": 109422, "epoch": 2605} {"train_loss": -6.468178749084473, "global_step": 109423, "epoch": 2605} {"train_loss": -6.438316345214844, "global_step": 109424, "epoch": 2605} {"train_loss": -6.49147891998291, "global_step": 109425, "epoch": 2605} {"train_loss": -6.40080451965332, "global_step": 109426, "epoch": 2605} {"train_loss": -6.500064849853516, "global_step": 109427, "epoch": 2605} {"train_loss": -6.560503005981445, "global_step": 109428, "epoch": 2605} {"train_loss": -6.476510047912598, "global_step": 109429, "epoch": 2605} {"train_loss": -6.491236209869385, "global_step": 109430, "epoch": 2605} {"train_loss": -6.360195159912109, "global_step": 109431, "epoch": 2605} {"train_loss": -6.612644195556641, "global_step": 109432, "epoch": 2605} {"train_loss": -6.576302528381348, "global_step": 109433, "epoch": 2605} {"train_loss": -6.416698455810547, "global_step": 109434, "epoch": 2605} {"train_loss": -6.59300422668457, "global_step": 109435, "epoch": 2605} {"train_loss": -6.441277503967285, "global_step": 109436, "epoch": 2605} {"train_loss": -6.405632972717285, "global_step": 109437, "epoch": 2605} {"train_loss": -6.588896751403809, "global_step": 109438, "epoch": 2605} {"train_loss": -6.475369453430176, "global_step": 109439, "epoch": 2605} {"train_loss": -6.505204200744629, "global_step": 109440, "epoch": 2605} {"train_loss": -6.4160475730896, "global_step": 109441, "epoch": 2605} {"train_loss": -6.4792938232421875, "global_step": 109442, "epoch": 2605} {"train_loss": -6.444986820220947, "global_step": 109443, "epoch": 2605} {"train_loss": -6.570362091064453, "global_step": 109444, "epoch": 2605} {"train_loss": -6.5085978507995605, "global_step": 109445, "epoch": 2605} {"train_loss": -6.3880228996276855, "global_step": 109446, "epoch": 2605} {"train_loss": -6.477482318878174, "global_step": 109447, "epoch": 2605} {"train_loss": -6.485759735107422, "global_step": 109448, "epoch": 2605} {"train_loss": -6.4014763832092285, "global_step": 109449, "epoch": 2605} {"train_loss": -6.478437423706055, "global_step": 109450, "epoch": 2605} {"train_loss": -6.490512473242624, "global_step": 109451, "epoch": 2605, "val_loss": 76198.078125} {"train_loss": -6.522923946380615, "global_step": 109452, "epoch": 2606} {"train_loss": -6.520850658416748, "global_step": 109453, "epoch": 2606} {"train_loss": -6.499410629272461, "global_step": 109454, "epoch": 2606} {"train_loss": -6.527584552764893, "global_step": 109455, "epoch": 2606} {"train_loss": -6.487459182739258, "global_step": 109456, "epoch": 2606} {"train_loss": -6.518087387084961, "global_step": 109457, "epoch": 2606} {"train_loss": -6.522485256195068, "global_step": 109458, "epoch": 2606} {"train_loss": -6.468648910522461, "global_step": 109459, "epoch": 2606} {"train_loss": -6.5893659591674805, "global_step": 109460, "epoch": 2606} {"train_loss": -6.4571638107299805, "global_step": 109461, "epoch": 2606} {"train_loss": -6.495235443115234, "global_step": 109462, "epoch": 2606} {"train_loss": -6.488272190093994, "global_step": 109463, "epoch": 2606} {"train_loss": -6.512350082397461, "global_step": 109464, "epoch": 2606} {"train_loss": -6.585700988769531, "global_step": 109465, "epoch": 2606} {"train_loss": -6.39107608795166, "global_step": 109466, "epoch": 2606} {"train_loss": -6.473089218139648, "global_step": 109467, "epoch": 2606} {"train_loss": -6.501041412353516, "global_step": 109468, "epoch": 2606} {"train_loss": -6.52338981628418, "global_step": 109469, "epoch": 2606} {"train_loss": -6.333319187164307, "global_step": 109470, "epoch": 2606} {"train_loss": -6.454428672790527, "global_step": 109471, "epoch": 2606} {"train_loss": -6.412710189819336, "global_step": 109472, "epoch": 2606} {"train_loss": -6.438046932220459, "global_step": 109473, "epoch": 2606} {"train_loss": -6.332729339599609, "global_step": 109474, "epoch": 2606} {"train_loss": -6.362769603729248, "global_step": 109475, "epoch": 2606} {"train_loss": -6.404984474182129, "global_step": 109476, "epoch": 2606} {"train_loss": -6.382049083709717, "global_step": 109477, "epoch": 2606} {"train_loss": -6.407712936401367, "global_step": 109478, "epoch": 2606} {"train_loss": -6.394524097442627, "global_step": 109479, "epoch": 2606} {"train_loss": -6.393021583557129, "global_step": 109480, "epoch": 2606} {"train_loss": -6.309200286865234, "global_step": 109481, "epoch": 2606} {"train_loss": -6.385488510131836, "global_step": 109482, "epoch": 2606} {"train_loss": -6.468558311462402, "global_step": 109483, "epoch": 2606} {"train_loss": -6.4772138595581055, "global_step": 109484, "epoch": 2606} {"train_loss": -6.533944129943848, "global_step": 109485, "epoch": 2606} {"train_loss": -6.401634216308594, "global_step": 109486, "epoch": 2606} {"train_loss": -6.439519882202148, "global_step": 109487, "epoch": 2606} {"train_loss": -6.361316680908203, "global_step": 109488, "epoch": 2606} {"train_loss": -6.532748222351074, "global_step": 109489, "epoch": 2606} {"train_loss": -6.35715389251709, "global_step": 109490, "epoch": 2606} {"train_loss": -6.3603315353393555, "global_step": 109491, "epoch": 2606} {"train_loss": -6.4353461265563965, "global_step": 109492, "epoch": 2606} {"train_loss": -6.450283765792847, "global_step": 109493, "epoch": 2606, "val_loss": 76415.6953125} {"train_loss": -6.447943687438965, "global_step": 109494, "epoch": 2607} {"train_loss": -6.490457534790039, "global_step": 109495, "epoch": 2607} {"train_loss": -6.461548805236816, "global_step": 109496, "epoch": 2607} {"train_loss": -6.4959516525268555, "global_step": 109497, "epoch": 2607} {"train_loss": -6.412424087524414, "global_step": 109498, "epoch": 2607} {"train_loss": -6.475050926208496, "global_step": 109499, "epoch": 2607} {"train_loss": -6.45096492767334, "global_step": 109500, "epoch": 2607} {"train_loss": -6.4463348388671875, "global_step": 109501, "epoch": 2607} {"train_loss": -6.383378982543945, "global_step": 109502, "epoch": 2607} {"train_loss": -6.554819107055664, "global_step": 109503, "epoch": 2607} {"train_loss": -6.538165092468262, "global_step": 109504, "epoch": 2607} {"train_loss": -6.501353740692139, "global_step": 109505, "epoch": 2607} {"train_loss": -6.480607032775879, "global_step": 109506, "epoch": 2607} {"train_loss": -6.503561973571777, "global_step": 109507, "epoch": 2607} {"train_loss": -6.280220985412598, "global_step": 109508, "epoch": 2607} {"train_loss": -6.3883209228515625, "global_step": 109509, "epoch": 2607} {"train_loss": -6.456544876098633, "global_step": 109510, "epoch": 2607} {"train_loss": -6.41927433013916, "global_step": 109511, "epoch": 2607} {"train_loss": -6.4360551834106445, "global_step": 109512, "epoch": 2607} {"train_loss": -6.437963485717773, "global_step": 109513, "epoch": 2607} {"train_loss": -6.372780799865723, "global_step": 109514, "epoch": 2607} {"train_loss": -6.585179328918457, "global_step": 109515, "epoch": 2607} {"train_loss": -6.315614700317383, "global_step": 109516, "epoch": 2607} {"train_loss": -6.433077812194824, "global_step": 109517, "epoch": 2607} {"train_loss": -6.437534332275391, "global_step": 109518, "epoch": 2607} {"train_loss": -6.387423515319824, "global_step": 109519, "epoch": 2607} {"train_loss": -6.504892349243164, "global_step": 109520, "epoch": 2607} {"train_loss": -6.480111598968506, "global_step": 109521, "epoch": 2607} {"train_loss": -6.353278160095215, "global_step": 109522, "epoch": 2607} {"train_loss": -6.43265962600708, "global_step": 109523, "epoch": 2607} {"train_loss": -6.371074199676514, "global_step": 109524, "epoch": 2607} {"train_loss": -6.392970085144043, "global_step": 109525, "epoch": 2607} {"train_loss": -6.3225555419921875, "global_step": 109526, "epoch": 2607} {"train_loss": -6.452866554260254, "global_step": 109527, "epoch": 2607} {"train_loss": -6.370335578918457, "global_step": 109528, "epoch": 2607} {"train_loss": -6.293169021606445, "global_step": 109529, "epoch": 2607} {"train_loss": -6.385622024536133, "global_step": 109530, "epoch": 2607} {"train_loss": -6.232352256774902, "global_step": 109531, "epoch": 2607} {"train_loss": -6.266759872436523, "global_step": 109532, "epoch": 2607} {"train_loss": -6.453914165496826, "global_step": 109533, "epoch": 2607} {"train_loss": -6.320590496063232, "global_step": 109534, "epoch": 2607} {"train_loss": -6.4187780902499245, "global_step": 109535, "epoch": 2607, "val_loss": 75968.28125} {"train_loss": -6.357434272766113, "global_step": 109536, "epoch": 2608} {"train_loss": -6.334654808044434, "global_step": 109537, "epoch": 2608} {"train_loss": -6.314329624176025, "global_step": 109538, "epoch": 2608} {"train_loss": -6.5301833152771, "global_step": 109539, "epoch": 2608} {"train_loss": -6.286946773529053, "global_step": 109540, "epoch": 2608} {"train_loss": -6.4356842041015625, "global_step": 109541, "epoch": 2608} {"train_loss": -6.3028974533081055, "global_step": 109542, "epoch": 2608} {"train_loss": -6.467907905578613, "global_step": 109543, "epoch": 2608} {"train_loss": -6.361954212188721, "global_step": 109544, "epoch": 2608} {"train_loss": -6.418705940246582, "global_step": 109545, "epoch": 2608} {"train_loss": -6.560918807983398, "global_step": 109546, "epoch": 2608} {"train_loss": -6.476740837097168, "global_step": 109547, "epoch": 2608} {"train_loss": -6.566737174987793, "global_step": 109548, "epoch": 2608} {"train_loss": -6.417757511138916, "global_step": 109549, "epoch": 2608} {"train_loss": -6.576196670532227, "global_step": 109550, "epoch": 2608} {"train_loss": -6.463242053985596, "global_step": 109551, "epoch": 2608} {"train_loss": -6.518596649169922, "global_step": 109552, "epoch": 2608} {"train_loss": -6.508849143981934, "global_step": 109553, "epoch": 2608} {"train_loss": -6.353999137878418, "global_step": 109554, "epoch": 2608} {"train_loss": -6.42006778717041, "global_step": 109555, "epoch": 2608} {"train_loss": -6.383844375610352, "global_step": 109556, "epoch": 2608} {"train_loss": -6.485405921936035, "global_step": 109557, "epoch": 2608} {"train_loss": -6.516599655151367, "global_step": 109558, "epoch": 2608} {"train_loss": -6.504334449768066, "global_step": 109559, "epoch": 2608} {"train_loss": -6.320552825927734, "global_step": 109560, "epoch": 2608} {"train_loss": -6.485674858093262, "global_step": 109561, "epoch": 2608} {"train_loss": -6.448883056640625, "global_step": 109562, "epoch": 2608} {"train_loss": -6.4069013595581055, "global_step": 109563, "epoch": 2608} {"train_loss": -6.514959335327148, "global_step": 109564, "epoch": 2608} {"train_loss": -6.466590881347656, "global_step": 109565, "epoch": 2608} {"train_loss": -6.374386310577393, "global_step": 109566, "epoch": 2608} {"train_loss": -6.52656364440918, "global_step": 109567, "epoch": 2608} {"train_loss": -6.469919204711914, "global_step": 109568, "epoch": 2608} {"train_loss": -6.3028764724731445, "global_step": 109569, "epoch": 2608} {"train_loss": -6.42120361328125, "global_step": 109570, "epoch": 2608} {"train_loss": -6.328972816467285, "global_step": 109571, "epoch": 2608} {"train_loss": -6.372912406921387, "global_step": 109572, "epoch": 2608} {"train_loss": -6.402525901794434, "global_step": 109573, "epoch": 2608} {"train_loss": -6.393308639526367, "global_step": 109574, "epoch": 2608} {"train_loss": -6.471531391143799, "global_step": 109575, "epoch": 2608} {"train_loss": -6.460701942443848, "global_step": 109576, "epoch": 2608} {"train_loss": -6.435274010612851, "global_step": 109577, "epoch": 2608, "val_loss": 76653.6875} {"train_loss": -6.471128463745117, "global_step": 109578, "epoch": 2609} {"train_loss": -6.520150184631348, "global_step": 109579, "epoch": 2609} {"train_loss": -6.335561275482178, "global_step": 109580, "epoch": 2609} {"train_loss": -6.58639669418335, "global_step": 109581, "epoch": 2609} {"train_loss": -6.4770402908325195, "global_step": 109582, "epoch": 2609} {"train_loss": -6.443882942199707, "global_step": 109583, "epoch": 2609} {"train_loss": -6.526216983795166, "global_step": 109584, "epoch": 2609} {"train_loss": -6.4338154792785645, "global_step": 109585, "epoch": 2609} {"train_loss": -6.341732978820801, "global_step": 109586, "epoch": 2609} {"train_loss": -6.429534435272217, "global_step": 109587, "epoch": 2609} {"train_loss": -6.409928321838379, "global_step": 109588, "epoch": 2609} {"train_loss": -6.458468437194824, "global_step": 109589, "epoch": 2609} {"train_loss": -6.468789577484131, "global_step": 109590, "epoch": 2609} {"train_loss": -6.470486164093018, "global_step": 109591, "epoch": 2609} {"train_loss": -6.394458770751953, "global_step": 109592, "epoch": 2609} {"train_loss": -6.422328948974609, "global_step": 109593, "epoch": 2609} {"train_loss": -6.338332176208496, "global_step": 109594, "epoch": 2609} {"train_loss": -6.587906837463379, "global_step": 109595, "epoch": 2609} {"train_loss": -6.33084774017334, "global_step": 109596, "epoch": 2609} {"train_loss": -6.189706802368164, "global_step": 109597, "epoch": 2609} {"train_loss": -6.506947040557861, "global_step": 109598, "epoch": 2609} {"train_loss": -6.275843143463135, "global_step": 109599, "epoch": 2609} {"train_loss": -6.450145721435547, "global_step": 109600, "epoch": 2609} {"train_loss": -6.4481000900268555, "global_step": 109601, "epoch": 2609} {"train_loss": -6.379311561584473, "global_step": 109602, "epoch": 2609} {"train_loss": -6.374197959899902, "global_step": 109603, "epoch": 2609} {"train_loss": -6.314130783081055, "global_step": 109604, "epoch": 2609} {"train_loss": -6.480874061584473, "global_step": 109605, "epoch": 2609} {"train_loss": -6.495222091674805, "global_step": 109606, "epoch": 2609} {"train_loss": -6.394248008728027, "global_step": 109607, "epoch": 2609} {"train_loss": -6.495246410369873, "global_step": 109608, "epoch": 2609} {"train_loss": -6.404474258422852, "global_step": 109609, "epoch": 2609} {"train_loss": -6.347967624664307, "global_step": 109610, "epoch": 2609} {"train_loss": -6.500750541687012, "global_step": 109611, "epoch": 2609} {"train_loss": -6.450289726257324, "global_step": 109612, "epoch": 2609} {"train_loss": -6.481104850769043, "global_step": 109613, "epoch": 2609} {"train_loss": -6.427002906799316, "global_step": 109614, "epoch": 2609} {"train_loss": -6.423757553100586, "global_step": 109615, "epoch": 2609} {"train_loss": -6.497905731201172, "global_step": 109616, "epoch": 2609} {"train_loss": -6.476859092712402, "global_step": 109617, "epoch": 2609} {"train_loss": -6.34831428527832, "global_step": 109618, "epoch": 2609} {"train_loss": -6.427984192257836, "global_step": 109619, "epoch": 2609, "val_loss": 76276.8671875} {"train_loss": -6.398114204406738, "global_step": 109620, "epoch": 2610} {"train_loss": -6.4289751052856445, "global_step": 109621, "epoch": 2610} {"train_loss": -6.227124214172363, "global_step": 109622, "epoch": 2610} {"train_loss": -6.460544109344482, "global_step": 109623, "epoch": 2610} {"train_loss": -6.360917091369629, "global_step": 109624, "epoch": 2610} {"train_loss": -6.41948127746582, "global_step": 109625, "epoch": 2610} {"train_loss": -6.391775131225586, "global_step": 109626, "epoch": 2610} {"train_loss": -6.578738689422607, "global_step": 109627, "epoch": 2610} {"train_loss": -6.475697994232178, "global_step": 109628, "epoch": 2610} {"train_loss": -6.389750003814697, "global_step": 109629, "epoch": 2610} {"train_loss": -6.388935089111328, "global_step": 109630, "epoch": 2610} {"train_loss": -6.488070011138916, "global_step": 109631, "epoch": 2610} {"train_loss": -6.428933143615723, "global_step": 109632, "epoch": 2610} {"train_loss": -6.523212909698486, "global_step": 109633, "epoch": 2610} {"train_loss": -6.559269428253174, "global_step": 109634, "epoch": 2610} {"train_loss": -6.469880104064941, "global_step": 109635, "epoch": 2610} {"train_loss": -6.403369903564453, "global_step": 109636, "epoch": 2610} {"train_loss": -6.448755264282227, "global_step": 109637, "epoch": 2610} {"train_loss": -6.514130592346191, "global_step": 109638, "epoch": 2610} {"train_loss": -6.494146347045898, "global_step": 109639, "epoch": 2610} {"train_loss": -6.322572231292725, "global_step": 109640, "epoch": 2610} {"train_loss": -6.534086227416992, "global_step": 109641, "epoch": 2610} {"train_loss": -6.406533241271973, "global_step": 109642, "epoch": 2610} {"train_loss": -6.401767730712891, "global_step": 109643, "epoch": 2610} {"train_loss": -6.428696632385254, "global_step": 109644, "epoch": 2610} {"train_loss": -6.324893951416016, "global_step": 109645, "epoch": 2610} {"train_loss": -6.568163871765137, "global_step": 109646, "epoch": 2610} {"train_loss": -6.47102165222168, "global_step": 109647, "epoch": 2610} {"train_loss": -6.475925445556641, "global_step": 109648, "epoch": 2610} {"train_loss": -6.4714508056640625, "global_step": 109649, "epoch": 2610} {"train_loss": -6.420832633972168, "global_step": 109650, "epoch": 2610} {"train_loss": -6.53591775894165, "global_step": 109651, "epoch": 2610} {"train_loss": -6.278255462646484, "global_step": 109652, "epoch": 2610} {"train_loss": -6.512683391571045, "global_step": 109653, "epoch": 2610} {"train_loss": -6.353760719299316, "global_step": 109654, "epoch": 2610} {"train_loss": -6.501212120056152, "global_step": 109655, "epoch": 2610} {"train_loss": -6.393131256103516, "global_step": 109656, "epoch": 2610} {"train_loss": -6.370058059692383, "global_step": 109657, "epoch": 2610} {"train_loss": -6.449985504150391, "global_step": 109658, "epoch": 2610} {"train_loss": -6.289568901062012, "global_step": 109659, "epoch": 2610} {"train_loss": -6.553378105163574, "global_step": 109660, "epoch": 2610} {"train_loss": -6.43662166595459, "global_step": 109661, "epoch": 2610, "val_loss": 76321.890625} {"train_loss": -6.398717880249023, "global_step": 109662, "epoch": 2611} {"train_loss": -6.528980731964111, "global_step": 109663, "epoch": 2611} {"train_loss": -6.408500671386719, "global_step": 109664, "epoch": 2611} {"train_loss": -6.429579734802246, "global_step": 109665, "epoch": 2611} {"train_loss": -6.436313629150391, "global_step": 109666, "epoch": 2611} {"train_loss": -6.416385650634766, "global_step": 109667, "epoch": 2611} {"train_loss": -6.4180402755737305, "global_step": 109668, "epoch": 2611} {"train_loss": -6.562413215637207, "global_step": 109669, "epoch": 2611} {"train_loss": -6.357877731323242, "global_step": 109670, "epoch": 2611} {"train_loss": -6.3570427894592285, "global_step": 109671, "epoch": 2611} {"train_loss": -6.4086503982543945, "global_step": 109672, "epoch": 2611} {"train_loss": -6.449463844299316, "global_step": 109673, "epoch": 2611} {"train_loss": -6.47901725769043, "global_step": 109674, "epoch": 2611} {"train_loss": -6.415884017944336, "global_step": 109675, "epoch": 2611} {"train_loss": -6.406268119812012, "global_step": 109676, "epoch": 2611} {"train_loss": -6.453215599060059, "global_step": 109677, "epoch": 2611} {"train_loss": -6.587023735046387, "global_step": 109678, "epoch": 2611} {"train_loss": -6.430460453033447, "global_step": 109679, "epoch": 2611} {"train_loss": -6.2354207038879395, "global_step": 109680, "epoch": 2611} {"train_loss": -6.455554962158203, "global_step": 109681, "epoch": 2611} {"train_loss": -6.343569755554199, "global_step": 109682, "epoch": 2611} {"train_loss": -6.469990253448486, "global_step": 109683, "epoch": 2611} {"train_loss": -6.4979095458984375, "global_step": 109684, "epoch": 2611} {"train_loss": -6.306347846984863, "global_step": 109685, "epoch": 2611} {"train_loss": -6.378146171569824, "global_step": 109686, "epoch": 2611} {"train_loss": -6.306220054626465, "global_step": 109687, "epoch": 2611} {"train_loss": -6.385103702545166, "global_step": 109688, "epoch": 2611} {"train_loss": -6.440699577331543, "global_step": 109689, "epoch": 2611} {"train_loss": -6.384370803833008, "global_step": 109690, "epoch": 2611} {"train_loss": -6.459964752197266, "global_step": 109691, "epoch": 2611} {"train_loss": -6.380146026611328, "global_step": 109692, "epoch": 2611} {"train_loss": -6.565248012542725, "global_step": 109693, "epoch": 2611} {"train_loss": -6.379848480224609, "global_step": 109694, "epoch": 2611} {"train_loss": -6.4557294845581055, "global_step": 109695, "epoch": 2611} {"train_loss": -6.536210536956787, "global_step": 109696, "epoch": 2611} {"train_loss": -6.446714401245117, "global_step": 109697, "epoch": 2611} {"train_loss": -6.459604263305664, "global_step": 109698, "epoch": 2611} {"train_loss": -6.478554725646973, "global_step": 109699, "epoch": 2611} {"train_loss": -6.452415943145752, "global_step": 109700, "epoch": 2611} {"train_loss": -6.411520957946777, "global_step": 109701, "epoch": 2611} {"train_loss": -6.337706565856934, "global_step": 109702, "epoch": 2611} {"train_loss": -6.428909824008033, "global_step": 109703, "epoch": 2611, "val_loss": 76378.234375} {"train_loss": -6.471698760986328, "global_step": 109704, "epoch": 2612} {"train_loss": -6.44390869140625, "global_step": 109705, "epoch": 2612} {"train_loss": -6.50657844543457, "global_step": 109706, "epoch": 2612} {"train_loss": -6.477577209472656, "global_step": 109707, "epoch": 2612} {"train_loss": -6.36776065826416, "global_step": 109708, "epoch": 2612} {"train_loss": -6.487015724182129, "global_step": 109709, "epoch": 2612} {"train_loss": -6.3592729568481445, "global_step": 109710, "epoch": 2612} {"train_loss": -6.406534671783447, "global_step": 109711, "epoch": 2612} {"train_loss": -6.569955825805664, "global_step": 109712, "epoch": 2612} {"train_loss": -6.41373348236084, "global_step": 109713, "epoch": 2612} {"train_loss": -6.50846004486084, "global_step": 109714, "epoch": 2612} {"train_loss": -6.492335796356201, "global_step": 109715, "epoch": 2612} {"train_loss": -6.4969329833984375, "global_step": 109716, "epoch": 2612} {"train_loss": -6.441595077514648, "global_step": 109717, "epoch": 2612} {"train_loss": -6.551230430603027, "global_step": 109718, "epoch": 2612} {"train_loss": -6.459606647491455, "global_step": 109719, "epoch": 2612} {"train_loss": -6.527247428894043, "global_step": 109720, "epoch": 2612} {"train_loss": -6.473870277404785, "global_step": 109721, "epoch": 2612} {"train_loss": -6.457121849060059, "global_step": 109722, "epoch": 2612} {"train_loss": -6.391460418701172, "global_step": 109723, "epoch": 2612} {"train_loss": -6.330377578735352, "global_step": 109724, "epoch": 2612} {"train_loss": -6.488935947418213, "global_step": 109725, "epoch": 2612} {"train_loss": -6.471413612365723, "global_step": 109726, "epoch": 2612} {"train_loss": -6.381191253662109, "global_step": 109727, "epoch": 2612} {"train_loss": -6.427176475524902, "global_step": 109728, "epoch": 2612} {"train_loss": -6.456099510192871, "global_step": 109729, "epoch": 2612} {"train_loss": -6.494711875915527, "global_step": 109730, "epoch": 2612} {"train_loss": -6.4368696212768555, "global_step": 109731, "epoch": 2612} {"train_loss": -6.428831100463867, "global_step": 109732, "epoch": 2612} {"train_loss": -6.311484336853027, "global_step": 109733, "epoch": 2612} {"train_loss": -6.432744979858398, "global_step": 109734, "epoch": 2612} {"train_loss": -6.463491439819336, "global_step": 109735, "epoch": 2612} {"train_loss": -6.281383037567139, "global_step": 109736, "epoch": 2612} {"train_loss": -6.3745012283325195, "global_step": 109737, "epoch": 2612} {"train_loss": -6.39459753036499, "global_step": 109738, "epoch": 2612} {"train_loss": -6.317212104797363, "global_step": 109739, "epoch": 2612} {"train_loss": -6.320218086242676, "global_step": 109740, "epoch": 2612} {"train_loss": -6.398833274841309, "global_step": 109741, "epoch": 2612} {"train_loss": -6.533257484436035, "global_step": 109742, "epoch": 2612} {"train_loss": -6.3966851234436035, "global_step": 109743, "epoch": 2612} {"train_loss": -6.380825996398926, "global_step": 109744, "epoch": 2612} {"train_loss": -6.435212487266178, "global_step": 109745, "epoch": 2612, "val_loss": 76166.0390625} {"train_loss": -6.37584924697876, "global_step": 109746, "epoch": 2613} {"train_loss": -6.5242719650268555, "global_step": 109747, "epoch": 2613} {"train_loss": -6.402643203735352, "global_step": 109748, "epoch": 2613} {"train_loss": -6.291481971740723, "global_step": 109749, "epoch": 2613} {"train_loss": -6.445311546325684, "global_step": 109750, "epoch": 2613} {"train_loss": -6.4895219802856445, "global_step": 109751, "epoch": 2613} {"train_loss": -6.438032150268555, "global_step": 109752, "epoch": 2613} {"train_loss": -6.436736583709717, "global_step": 109753, "epoch": 2613} {"train_loss": -6.500877857208252, "global_step": 109754, "epoch": 2613} {"train_loss": -6.366930961608887, "global_step": 109755, "epoch": 2613} {"train_loss": -6.389028549194336, "global_step": 109756, "epoch": 2613} {"train_loss": -6.438481330871582, "global_step": 109757, "epoch": 2613} {"train_loss": -6.252493381500244, "global_step": 109758, "epoch": 2613} {"train_loss": -6.354191780090332, "global_step": 109759, "epoch": 2613} {"train_loss": -6.378947734832764, "global_step": 109760, "epoch": 2613} {"train_loss": -6.403653621673584, "global_step": 109761, "epoch": 2613} {"train_loss": -6.421525001525879, "global_step": 109762, "epoch": 2613} {"train_loss": -6.222297668457031, "global_step": 109763, "epoch": 2613} {"train_loss": -6.495731353759766, "global_step": 109764, "epoch": 2613} {"train_loss": -6.302472114562988, "global_step": 109765, "epoch": 2613} {"train_loss": -6.4554123878479, "global_step": 109766, "epoch": 2613} {"train_loss": -6.3634233474731445, "global_step": 109767, "epoch": 2613} {"train_loss": -6.4546427726745605, "global_step": 109768, "epoch": 2613} {"train_loss": -6.417337894439697, "global_step": 109769, "epoch": 2613} {"train_loss": -6.467817306518555, "global_step": 109770, "epoch": 2613} {"train_loss": -6.402440071105957, "global_step": 109771, "epoch": 2613} {"train_loss": -6.5509934425354, "global_step": 109772, "epoch": 2613} {"train_loss": -6.415950775146484, "global_step": 109773, "epoch": 2613} {"train_loss": -6.40894889831543, "global_step": 109774, "epoch": 2613} {"train_loss": -6.481016159057617, "global_step": 109775, "epoch": 2613} {"train_loss": -6.47929573059082, "global_step": 109776, "epoch": 2613} {"train_loss": -6.435218811035156, "global_step": 109777, "epoch": 2613} {"train_loss": -6.567448139190674, "global_step": 109778, "epoch": 2613} {"train_loss": -6.573665618896484, "global_step": 109779, "epoch": 2613} {"train_loss": -6.408817291259766, "global_step": 109780, "epoch": 2613} {"train_loss": -6.509178161621094, "global_step": 109781, "epoch": 2613} {"train_loss": -6.540249824523926, "global_step": 109782, "epoch": 2613} {"train_loss": -6.47897481918335, "global_step": 109783, "epoch": 2613} {"train_loss": -6.577164649963379, "global_step": 109784, "epoch": 2613} {"train_loss": -6.412191867828369, "global_step": 109785, "epoch": 2613} {"train_loss": -6.3414306640625, "global_step": 109786, "epoch": 2613} {"train_loss": -6.430713891983032, "global_step": 109787, "epoch": 2613, "val_loss": 76085.25} {"train_loss": -6.455450057983398, "global_step": 109788, "epoch": 2614} {"train_loss": -6.488654613494873, "global_step": 109789, "epoch": 2614} {"train_loss": -6.438292026519775, "global_step": 109790, "epoch": 2614} {"train_loss": -6.319231033325195, "global_step": 109791, "epoch": 2614} {"train_loss": -6.634918689727783, "global_step": 109792, "epoch": 2614} {"train_loss": -6.430245399475098, "global_step": 109793, "epoch": 2614} {"train_loss": -6.485621452331543, "global_step": 109794, "epoch": 2614} {"train_loss": -6.50566291809082, "global_step": 109795, "epoch": 2614} {"train_loss": -6.392002582550049, "global_step": 109796, "epoch": 2614} {"train_loss": -6.449821472167969, "global_step": 109797, "epoch": 2614} {"train_loss": -6.525885105133057, "global_step": 109798, "epoch": 2614} {"train_loss": -6.511877059936523, "global_step": 109799, "epoch": 2614} {"train_loss": -6.478562831878662, "global_step": 109800, "epoch": 2614} {"train_loss": -6.425192356109619, "global_step": 109801, "epoch": 2614} {"train_loss": -6.451211929321289, "global_step": 109802, "epoch": 2614} {"train_loss": -6.510608673095703, "global_step": 109803, "epoch": 2614} {"train_loss": -6.484445095062256, "global_step": 109804, "epoch": 2614} {"train_loss": -6.375227928161621, "global_step": 109805, "epoch": 2614} {"train_loss": -6.4858903884887695, "global_step": 109806, "epoch": 2614} {"train_loss": -6.401147365570068, "global_step": 109807, "epoch": 2614} {"train_loss": -6.4423112869262695, "global_step": 109808, "epoch": 2614} {"train_loss": -6.449506759643555, "global_step": 109809, "epoch": 2614} {"train_loss": -6.424340724945068, "global_step": 109810, "epoch": 2614} {"train_loss": -6.428491115570068, "global_step": 109811, "epoch": 2614} {"train_loss": -6.472992897033691, "global_step": 109812, "epoch": 2614} {"train_loss": -6.406807899475098, "global_step": 109813, "epoch": 2614} {"train_loss": -6.294149875640869, "global_step": 109814, "epoch": 2614} {"train_loss": -6.460907936096191, "global_step": 109815, "epoch": 2614} {"train_loss": -6.360509872436523, "global_step": 109816, "epoch": 2614} {"train_loss": -6.297518730163574, "global_step": 109817, "epoch": 2614} {"train_loss": -6.501396656036377, "global_step": 109818, "epoch": 2614} {"train_loss": -6.338081359863281, "global_step": 109819, "epoch": 2614} {"train_loss": -6.357219219207764, "global_step": 109820, "epoch": 2614} {"train_loss": -6.129323482513428, "global_step": 109821, "epoch": 2614} {"train_loss": -6.493034362792969, "global_step": 109822, "epoch": 2614} {"train_loss": -6.397525787353516, "global_step": 109823, "epoch": 2614} {"train_loss": -6.313321113586426, "global_step": 109824, "epoch": 2614} {"train_loss": -6.313783168792725, "global_step": 109825, "epoch": 2614} {"train_loss": -6.458673477172852, "global_step": 109826, "epoch": 2614} {"train_loss": -6.383965969085693, "global_step": 109827, "epoch": 2614} {"train_loss": -6.224664688110352, "global_step": 109828, "epoch": 2614} {"train_loss": -6.4178483826773505, "global_step": 109829, "epoch": 2614, "val_loss": 76454.0859375} {"train_loss": -6.375303268432617, "global_step": 109830, "epoch": 2615} {"train_loss": -6.39048433303833, "global_step": 109831, "epoch": 2615} {"train_loss": -6.394499778747559, "global_step": 109832, "epoch": 2615} {"train_loss": -6.479671478271484, "global_step": 109833, "epoch": 2615} {"train_loss": -6.312808513641357, "global_step": 109834, "epoch": 2615} {"train_loss": -6.371706962585449, "global_step": 109835, "epoch": 2615} {"train_loss": -6.380284309387207, "global_step": 109836, "epoch": 2615} {"train_loss": -6.524637699127197, "global_step": 109837, "epoch": 2615} {"train_loss": -6.494781494140625, "global_step": 109838, "epoch": 2615} {"train_loss": -6.43748664855957, "global_step": 109839, "epoch": 2615} {"train_loss": -6.434755325317383, "global_step": 109840, "epoch": 2615} {"train_loss": -6.5066938400268555, "global_step": 109841, "epoch": 2615} {"train_loss": -6.485136985778809, "global_step": 109842, "epoch": 2615} {"train_loss": -6.422702789306641, "global_step": 109843, "epoch": 2615} {"train_loss": -6.395481109619141, "global_step": 109844, "epoch": 2615} {"train_loss": -6.503597259521484, "global_step": 109845, "epoch": 2615} {"train_loss": -6.540269374847412, "global_step": 109846, "epoch": 2615} {"train_loss": -6.378150463104248, "global_step": 109847, "epoch": 2615} {"train_loss": -6.514222145080566, "global_step": 109848, "epoch": 2615} {"train_loss": -6.489046573638916, "global_step": 109849, "epoch": 2615} {"train_loss": -6.4152750968933105, "global_step": 109850, "epoch": 2615} {"train_loss": -6.487483501434326, "global_step": 109851, "epoch": 2615} {"train_loss": -6.481752872467041, "global_step": 109852, "epoch": 2615} {"train_loss": -6.421433448791504, "global_step": 109853, "epoch": 2615} {"train_loss": -6.445793151855469, "global_step": 109854, "epoch": 2615} {"train_loss": -6.566204071044922, "global_step": 109855, "epoch": 2615} {"train_loss": -6.478270053863525, "global_step": 109856, "epoch": 2615} {"train_loss": -6.587217807769775, "global_step": 109857, "epoch": 2615} {"train_loss": -6.438169479370117, "global_step": 109858, "epoch": 2615} {"train_loss": -6.438041687011719, "global_step": 109859, "epoch": 2615} {"train_loss": -6.348372459411621, "global_step": 109860, "epoch": 2615} {"train_loss": -6.4824113845825195, "global_step": 109861, "epoch": 2615} {"train_loss": -6.366361618041992, "global_step": 109862, "epoch": 2615} {"train_loss": -6.461205005645752, "global_step": 109863, "epoch": 2615} {"train_loss": -6.398793697357178, "global_step": 109864, "epoch": 2615} {"train_loss": -6.3280558586120605, "global_step": 109865, "epoch": 2615} {"train_loss": -6.366009712219238, "global_step": 109866, "epoch": 2615} {"train_loss": -6.450997829437256, "global_step": 109867, "epoch": 2615} {"train_loss": -6.545934677124023, "global_step": 109868, "epoch": 2615} {"train_loss": -6.553061008453369, "global_step": 109869, "epoch": 2615} {"train_loss": -6.371687889099121, "global_step": 109870, "epoch": 2615} {"train_loss": -6.447180293855213, "global_step": 109871, "epoch": 2615, "val_loss": 76081.234375} {"train_loss": -6.492926597595215, "global_step": 109872, "epoch": 2616} {"train_loss": -6.523333549499512, "global_step": 109873, "epoch": 2616} {"train_loss": -6.348450660705566, "global_step": 109874, "epoch": 2616} {"train_loss": -6.525761604309082, "global_step": 109875, "epoch": 2616} {"train_loss": -6.401906967163086, "global_step": 109876, "epoch": 2616} {"train_loss": -6.493926048278809, "global_step": 109877, "epoch": 2616} {"train_loss": -6.4579315185546875, "global_step": 109878, "epoch": 2616} {"train_loss": -6.4597978591918945, "global_step": 109879, "epoch": 2616} {"train_loss": -6.518620491027832, "global_step": 109880, "epoch": 2616} {"train_loss": -6.506695747375488, "global_step": 109881, "epoch": 2616} {"train_loss": -6.45605993270874, "global_step": 109882, "epoch": 2616} {"train_loss": -6.513254642486572, "global_step": 109883, "epoch": 2616} {"train_loss": -6.548459053039551, "global_step": 109884, "epoch": 2616} {"train_loss": -6.507230758666992, "global_step": 109885, "epoch": 2616} {"train_loss": -6.532341480255127, "global_step": 109886, "epoch": 2616} {"train_loss": -6.564424514770508, "global_step": 109887, "epoch": 2616} {"train_loss": -6.470236301422119, "global_step": 109888, "epoch": 2616} {"train_loss": -6.495655059814453, "global_step": 109889, "epoch": 2616} {"train_loss": -6.358415603637695, "global_step": 109890, "epoch": 2616} {"train_loss": -6.476535320281982, "global_step": 109891, "epoch": 2616} {"train_loss": -6.364862442016602, "global_step": 109892, "epoch": 2616} {"train_loss": -6.479589462280273, "global_step": 109893, "epoch": 2616} {"train_loss": -6.5080766677856445, "global_step": 109894, "epoch": 2616} {"train_loss": -6.449790954589844, "global_step": 109895, "epoch": 2616} {"train_loss": -6.496857166290283, "global_step": 109896, "epoch": 2616} {"train_loss": -6.5059709548950195, "global_step": 109897, "epoch": 2616} {"train_loss": -6.51538610458374, "global_step": 109898, "epoch": 2616} {"train_loss": -6.47158670425415, "global_step": 109899, "epoch": 2616} {"train_loss": -6.5633649826049805, "global_step": 109900, "epoch": 2616} {"train_loss": -6.48907470703125, "global_step": 109901, "epoch": 2616} {"train_loss": -6.545454978942871, "global_step": 109902, "epoch": 2616} {"train_loss": -6.352635860443115, "global_step": 109903, "epoch": 2616} {"train_loss": -6.498366355895996, "global_step": 109904, "epoch": 2616} {"train_loss": -6.553319931030273, "global_step": 109905, "epoch": 2616} {"train_loss": -6.497685432434082, "global_step": 109906, "epoch": 2616} {"train_loss": -6.53138542175293, "global_step": 109907, "epoch": 2616} {"train_loss": -6.477144241333008, "global_step": 109908, "epoch": 2616} {"train_loss": -6.470964431762695, "global_step": 109909, "epoch": 2616} {"train_loss": -6.435598373413086, "global_step": 109910, "epoch": 2616} {"train_loss": -6.380091667175293, "global_step": 109911, "epoch": 2616} {"train_loss": -6.447118759155273, "global_step": 109912, "epoch": 2616} {"train_loss": -6.481278578440349, "global_step": 109913, "epoch": 2616, "val_loss": 76230.734375} {"train_loss": -6.44367790222168, "global_step": 109914, "epoch": 2617} {"train_loss": -6.617345333099365, "global_step": 109915, "epoch": 2617} {"train_loss": -6.408012866973877, "global_step": 109916, "epoch": 2617} {"train_loss": -6.3949103355407715, "global_step": 109917, "epoch": 2617} {"train_loss": -6.352899074554443, "global_step": 109918, "epoch": 2617} {"train_loss": -6.361338138580322, "global_step": 109919, "epoch": 2617} {"train_loss": -6.478795528411865, "global_step": 109920, "epoch": 2617} {"train_loss": -6.518022060394287, "global_step": 109921, "epoch": 2617} {"train_loss": -6.410652160644531, "global_step": 109922, "epoch": 2617} {"train_loss": -6.424509048461914, "global_step": 109923, "epoch": 2617} {"train_loss": -6.463881015777588, "global_step": 109924, "epoch": 2617} {"train_loss": -6.501049041748047, "global_step": 109925, "epoch": 2617} {"train_loss": -6.459181785583496, "global_step": 109926, "epoch": 2617} {"train_loss": -6.445145606994629, "global_step": 109927, "epoch": 2617} {"train_loss": -6.428831100463867, "global_step": 109928, "epoch": 2617} {"train_loss": -6.444998741149902, "global_step": 109929, "epoch": 2617} {"train_loss": -6.502705097198486, "global_step": 109930, "epoch": 2617} {"train_loss": -6.473055839538574, "global_step": 109931, "epoch": 2617} {"train_loss": -6.562546730041504, "global_step": 109932, "epoch": 2617} {"train_loss": -6.421936988830566, "global_step": 109933, "epoch": 2617} {"train_loss": -6.494478225708008, "global_step": 109934, "epoch": 2617} {"train_loss": -6.436367034912109, "global_step": 109935, "epoch": 2617} {"train_loss": -6.438228130340576, "global_step": 109936, "epoch": 2617} {"train_loss": -6.5550031661987305, "global_step": 109937, "epoch": 2617} {"train_loss": -6.423061370849609, "global_step": 109938, "epoch": 2617} {"train_loss": -6.5867486000061035, "global_step": 109939, "epoch": 2617} {"train_loss": -6.517763137817383, "global_step": 109940, "epoch": 2617} {"train_loss": -6.430689811706543, "global_step": 109941, "epoch": 2617} {"train_loss": -6.435938358306885, "global_step": 109942, "epoch": 2617} {"train_loss": -6.548538684844971, "global_step": 109943, "epoch": 2617} {"train_loss": -6.650730609893799, "global_step": 109944, "epoch": 2617} {"train_loss": -6.551383018493652, "global_step": 109945, "epoch": 2617} {"train_loss": -6.482711315155029, "global_step": 109946, "epoch": 2617} {"train_loss": -6.415655136108398, "global_step": 109947, "epoch": 2617} {"train_loss": -6.46845817565918, "global_step": 109948, "epoch": 2617} {"train_loss": -6.338266849517822, "global_step": 109949, "epoch": 2617} {"train_loss": -6.566192626953125, "global_step": 109950, "epoch": 2617} {"train_loss": -6.638646125793457, "global_step": 109951, "epoch": 2617} {"train_loss": -6.504406929016113, "global_step": 109952, "epoch": 2617} {"train_loss": -6.428086757659912, "global_step": 109953, "epoch": 2617} {"train_loss": -6.421082496643066, "global_step": 109954, "epoch": 2617} {"train_loss": -6.473809889384678, "global_step": 109955, "epoch": 2617, "val_loss": 76343.9140625} {"train_loss": -6.447070598602295, "global_step": 109956, "epoch": 2618} {"train_loss": -6.483468055725098, "global_step": 109957, "epoch": 2618} {"train_loss": -6.531632900238037, "global_step": 109958, "epoch": 2618} {"train_loss": -6.487061977386475, "global_step": 109959, "epoch": 2618} {"train_loss": -6.391313552856445, "global_step": 109960, "epoch": 2618} {"train_loss": -6.349835395812988, "global_step": 109961, "epoch": 2618} {"train_loss": -6.382350921630859, "global_step": 109962, "epoch": 2618} {"train_loss": -6.540075778961182, "global_step": 109963, "epoch": 2618} {"train_loss": -6.337726593017578, "global_step": 109964, "epoch": 2618} {"train_loss": -6.478036880493164, "global_step": 109965, "epoch": 2618} {"train_loss": -6.392050743103027, "global_step": 109966, "epoch": 2618} {"train_loss": -6.496851444244385, "global_step": 109967, "epoch": 2618} {"train_loss": -6.374025344848633, "global_step": 109968, "epoch": 2618} {"train_loss": -6.584610939025879, "global_step": 109969, "epoch": 2618} {"train_loss": -6.378498077392578, "global_step": 109970, "epoch": 2618} {"train_loss": -6.364609718322754, "global_step": 109971, "epoch": 2618} {"train_loss": -6.38275146484375, "global_step": 109972, "epoch": 2618} {"train_loss": -6.313767910003662, "global_step": 109973, "epoch": 2618} {"train_loss": -6.452761650085449, "global_step": 109974, "epoch": 2618} {"train_loss": -6.4031219482421875, "global_step": 109975, "epoch": 2618} {"train_loss": -6.394321918487549, "global_step": 109976, "epoch": 2618} {"train_loss": -6.439379692077637, "global_step": 109977, "epoch": 2618} {"train_loss": -6.451921463012695, "global_step": 109978, "epoch": 2618} {"train_loss": -6.5161309242248535, "global_step": 109979, "epoch": 2618} {"train_loss": -6.361666679382324, "global_step": 109980, "epoch": 2618} {"train_loss": -6.539623737335205, "global_step": 109981, "epoch": 2618} {"train_loss": -6.405172348022461, "global_step": 109982, "epoch": 2618} {"train_loss": -6.457584381103516, "global_step": 109983, "epoch": 2618} {"train_loss": -6.485271453857422, "global_step": 109984, "epoch": 2618} {"train_loss": -6.537195205688477, "global_step": 109985, "epoch": 2618} {"train_loss": -6.499448299407959, "global_step": 109986, "epoch": 2618} {"train_loss": -6.408500671386719, "global_step": 109987, "epoch": 2618} {"train_loss": -6.44088077545166, "global_step": 109988, "epoch": 2618} {"train_loss": -6.572601795196533, "global_step": 109989, "epoch": 2618} {"train_loss": -6.535791397094727, "global_step": 109990, "epoch": 2618} {"train_loss": -6.388103485107422, "global_step": 109991, "epoch": 2618} {"train_loss": -6.5650529861450195, "global_step": 109992, "epoch": 2618} {"train_loss": -6.428997039794922, "global_step": 109993, "epoch": 2618} {"train_loss": -6.523779392242432, "global_step": 109994, "epoch": 2618} {"train_loss": -6.409899711608887, "global_step": 109995, "epoch": 2618} {"train_loss": -6.478099346160889, "global_step": 109996, "epoch": 2618} {"train_loss": -6.451379560288929, "global_step": 109997, "epoch": 2618, "val_loss": 76327.921875} {"train_loss": -6.5290846824646, "global_step": 109998, "epoch": 2619} {"train_loss": -6.464777946472168, "global_step": 109999, "epoch": 2619} {"train_loss": -6.449124336242676, "global_step": 110000, "epoch": 2619} {"train_loss": -6.497277736663818, "global_step": 110001, "epoch": 2619} {"train_loss": -6.41121768951416, "global_step": 110002, "epoch": 2619} {"train_loss": -6.535970687866211, "global_step": 110003, "epoch": 2619} {"train_loss": -6.451424598693848, "global_step": 110004, "epoch": 2619} {"train_loss": -6.5265583992004395, "global_step": 110005, "epoch": 2619} {"train_loss": -6.496933460235596, "global_step": 110006, "epoch": 2619} {"train_loss": -6.4192585945129395, "global_step": 110007, "epoch": 2619} {"train_loss": -6.56868839263916, "global_step": 110008, "epoch": 2619} {"train_loss": -6.493369102478027, "global_step": 110009, "epoch": 2619} {"train_loss": -6.546132564544678, "global_step": 110010, "epoch": 2619} {"train_loss": -6.358968734741211, "global_step": 110011, "epoch": 2619} {"train_loss": -6.493513107299805, "global_step": 110012, "epoch": 2619} {"train_loss": -6.617351055145264, "global_step": 110013, "epoch": 2619} {"train_loss": -6.580338954925537, "global_step": 110014, "epoch": 2619} {"train_loss": -6.446693420410156, "global_step": 110015, "epoch": 2619} {"train_loss": -6.506802082061768, "global_step": 110016, "epoch": 2619} {"train_loss": -6.489837646484375, "global_step": 110017, "epoch": 2619} {"train_loss": -6.4719414710998535, "global_step": 110018, "epoch": 2619} {"train_loss": -6.483006000518799, "global_step": 110019, "epoch": 2619} {"train_loss": -6.452903747558594, "global_step": 110020, "epoch": 2619} {"train_loss": -6.501140117645264, "global_step": 110021, "epoch": 2619} {"train_loss": -6.529676914215088, "global_step": 110022, "epoch": 2619} {"train_loss": -6.467132568359375, "global_step": 110023, "epoch": 2619} {"train_loss": -6.536987781524658, "global_step": 110024, "epoch": 2619} {"train_loss": -6.562686920166016, "global_step": 110025, "epoch": 2619} {"train_loss": -6.404727935791016, "global_step": 110026, "epoch": 2619} {"train_loss": -6.517162322998047, "global_step": 110027, "epoch": 2619} {"train_loss": -6.376603603363037, "global_step": 110028, "epoch": 2619} {"train_loss": -6.350248336791992, "global_step": 110029, "epoch": 2619} {"train_loss": -6.440386772155762, "global_step": 110030, "epoch": 2619} {"train_loss": -6.478328227996826, "global_step": 110031, "epoch": 2619} {"train_loss": -6.558483600616455, "global_step": 110032, "epoch": 2619} {"train_loss": -6.581389427185059, "global_step": 110033, "epoch": 2619} {"train_loss": -6.474516868591309, "global_step": 110034, "epoch": 2619} {"train_loss": -6.558048248291016, "global_step": 110035, "epoch": 2619} {"train_loss": -6.402499198913574, "global_step": 110036, "epoch": 2619} {"train_loss": -6.438320159912109, "global_step": 110037, "epoch": 2619} {"train_loss": -6.523301601409912, "global_step": 110038, "epoch": 2619} {"train_loss": -6.487279846554711, "global_step": 110039, "epoch": 2619, "val_loss": 76231.03125} {"train_loss": -6.5318756103515625, "global_step": 110040, "epoch": 2620} {"train_loss": -6.557790756225586, "global_step": 110041, "epoch": 2620} {"train_loss": -6.581583499908447, "global_step": 110042, "epoch": 2620} {"train_loss": -6.546935081481934, "global_step": 110043, "epoch": 2620} {"train_loss": -6.505062580108643, "global_step": 110044, "epoch": 2620} {"train_loss": -6.465877532958984, "global_step": 110045, "epoch": 2620} {"train_loss": -6.566527366638184, "global_step": 110046, "epoch": 2620} {"train_loss": -6.418069839477539, "global_step": 110047, "epoch": 2620} {"train_loss": -6.547236442565918, "global_step": 110048, "epoch": 2620} {"train_loss": -6.526492118835449, "global_step": 110049, "epoch": 2620} {"train_loss": -6.553110122680664, "global_step": 110050, "epoch": 2620} {"train_loss": -6.52289342880249, "global_step": 110051, "epoch": 2620} {"train_loss": -6.543267726898193, "global_step": 110052, "epoch": 2620} {"train_loss": -6.589548110961914, "global_step": 110053, "epoch": 2620} {"train_loss": -6.483278274536133, "global_step": 110054, "epoch": 2620} {"train_loss": -6.503118515014648, "global_step": 110055, "epoch": 2620} {"train_loss": -6.526318550109863, "global_step": 110056, "epoch": 2620} {"train_loss": -6.512180328369141, "global_step": 110057, "epoch": 2620} {"train_loss": -6.587552070617676, "global_step": 110058, "epoch": 2620} {"train_loss": -6.480436325073242, "global_step": 110059, "epoch": 2620} {"train_loss": -6.390040397644043, "global_step": 110060, "epoch": 2620} {"train_loss": -6.557538032531738, "global_step": 110061, "epoch": 2620} {"train_loss": -6.499379634857178, "global_step": 110062, "epoch": 2620} {"train_loss": -6.492946624755859, "global_step": 110063, "epoch": 2620} {"train_loss": -6.4036407470703125, "global_step": 110064, "epoch": 2620} {"train_loss": -6.562731742858887, "global_step": 110065, "epoch": 2620} {"train_loss": -6.3498945236206055, "global_step": 110066, "epoch": 2620} {"train_loss": -6.4347662925720215, "global_step": 110067, "epoch": 2620} {"train_loss": -6.445866584777832, "global_step": 110068, "epoch": 2620} {"train_loss": -6.328001976013184, "global_step": 110069, "epoch": 2620} {"train_loss": -6.579697132110596, "global_step": 110070, "epoch": 2620} {"train_loss": -6.501437187194824, "global_step": 110071, "epoch": 2620} {"train_loss": -6.4029107093811035, "global_step": 110072, "epoch": 2620} {"train_loss": -6.516398906707764, "global_step": 110073, "epoch": 2620} {"train_loss": -6.530576229095459, "global_step": 110074, "epoch": 2620} {"train_loss": -6.340706825256348, "global_step": 110075, "epoch": 2620} {"train_loss": -6.508046627044678, "global_step": 110076, "epoch": 2620} {"train_loss": -6.383541107177734, "global_step": 110077, "epoch": 2620} {"train_loss": -6.476750373840332, "global_step": 110078, "epoch": 2620} {"train_loss": -6.435476779937744, "global_step": 110079, "epoch": 2620} {"train_loss": -6.5084309577941895, "global_step": 110080, "epoch": 2620} {"train_loss": -6.494064149402437, "global_step": 110081, "epoch": 2620, "val_loss": 76244.6796875} {"train_loss": -6.427811622619629, "global_step": 110082, "epoch": 2621} {"train_loss": -6.494374752044678, "global_step": 110083, "epoch": 2621} {"train_loss": -6.360861778259277, "global_step": 110084, "epoch": 2621} {"train_loss": -6.494417190551758, "global_step": 110085, "epoch": 2621} {"train_loss": -6.478935241699219, "global_step": 110086, "epoch": 2621} {"train_loss": -6.475356578826904, "global_step": 110087, "epoch": 2621} {"train_loss": -6.491733074188232, "global_step": 110088, "epoch": 2621} {"train_loss": -6.503787040710449, "global_step": 110089, "epoch": 2621} {"train_loss": -6.378895282745361, "global_step": 110090, "epoch": 2621} {"train_loss": -6.498297691345215, "global_step": 110091, "epoch": 2621} {"train_loss": -6.4344706535339355, "global_step": 110092, "epoch": 2621} {"train_loss": -6.458894729614258, "global_step": 110093, "epoch": 2621} {"train_loss": -6.335307598114014, "global_step": 110094, "epoch": 2621} {"train_loss": -6.4586052894592285, "global_step": 110095, "epoch": 2621} {"train_loss": -6.407962799072266, "global_step": 110096, "epoch": 2621} {"train_loss": -6.328458786010742, "global_step": 110097, "epoch": 2621} {"train_loss": -6.468519687652588, "global_step": 110098, "epoch": 2621} {"train_loss": -6.390071868896484, "global_step": 110099, "epoch": 2621} {"train_loss": -6.414439678192139, "global_step": 110100, "epoch": 2621} {"train_loss": -6.394805908203125, "global_step": 110101, "epoch": 2621} {"train_loss": -6.362161636352539, "global_step": 110102, "epoch": 2621} {"train_loss": -6.315408706665039, "global_step": 110103, "epoch": 2621} {"train_loss": -6.479855537414551, "global_step": 110104, "epoch": 2621} {"train_loss": -6.4046831130981445, "global_step": 110105, "epoch": 2621} {"train_loss": -6.441074848175049, "global_step": 110106, "epoch": 2621} {"train_loss": -6.5422868728637695, "global_step": 110107, "epoch": 2621} {"train_loss": -6.467238903045654, "global_step": 110108, "epoch": 2621} {"train_loss": -6.430853843688965, "global_step": 110109, "epoch": 2621} {"train_loss": -6.443478107452393, "global_step": 110110, "epoch": 2621} {"train_loss": -6.3082194328308105, "global_step": 110111, "epoch": 2621} {"train_loss": -6.478538513183594, "global_step": 110112, "epoch": 2621} {"train_loss": -6.52823543548584, "global_step": 110113, "epoch": 2621} {"train_loss": -6.377031326293945, "global_step": 110114, "epoch": 2621} {"train_loss": -6.3674540519714355, "global_step": 110115, "epoch": 2621} {"train_loss": -6.390292167663574, "global_step": 110116, "epoch": 2621} {"train_loss": -6.4370832443237305, "global_step": 110117, "epoch": 2621} {"train_loss": -6.502840042114258, "global_step": 110118, "epoch": 2621} {"train_loss": -6.45158576965332, "global_step": 110119, "epoch": 2621} {"train_loss": -6.494036674499512, "global_step": 110120, "epoch": 2621} {"train_loss": -6.406322479248047, "global_step": 110121, "epoch": 2621} {"train_loss": -6.319450378417969, "global_step": 110122, "epoch": 2621} {"train_loss": -6.430905205862863, "global_step": 110123, "epoch": 2621, "val_loss": 76468.515625} {"train_loss": -6.3535051345825195, "global_step": 110124, "epoch": 2622} {"train_loss": -6.508474826812744, "global_step": 110125, "epoch": 2622} {"train_loss": -6.546130180358887, "global_step": 110126, "epoch": 2622} {"train_loss": -6.460152626037598, "global_step": 110127, "epoch": 2622} {"train_loss": -6.462922096252441, "global_step": 110128, "epoch": 2622} {"train_loss": -6.374072551727295, "global_step": 110129, "epoch": 2622} {"train_loss": -6.3264007568359375, "global_step": 110130, "epoch": 2622} {"train_loss": -6.4913530349731445, "global_step": 110131, "epoch": 2622} {"train_loss": -6.438565254211426, "global_step": 110132, "epoch": 2622} {"train_loss": -6.499654769897461, "global_step": 110133, "epoch": 2622} {"train_loss": -6.5681915283203125, "global_step": 110134, "epoch": 2622} {"train_loss": -6.498709201812744, "global_step": 110135, "epoch": 2622} {"train_loss": -6.540632247924805, "global_step": 110136, "epoch": 2622} {"train_loss": -6.641716480255127, "global_step": 110137, "epoch": 2622} {"train_loss": -6.4896559715271, "global_step": 110138, "epoch": 2622} {"train_loss": -6.507667541503906, "global_step": 110139, "epoch": 2622} {"train_loss": -6.401363372802734, "global_step": 110140, "epoch": 2622} {"train_loss": -6.540613174438477, "global_step": 110141, "epoch": 2622} {"train_loss": -6.4541425704956055, "global_step": 110142, "epoch": 2622} {"train_loss": -6.465424537658691, "global_step": 110143, "epoch": 2622} {"train_loss": -6.404480457305908, "global_step": 110144, "epoch": 2622} {"train_loss": -6.40893030166626, "global_step": 110145, "epoch": 2622} {"train_loss": -6.558250904083252, "global_step": 110146, "epoch": 2622} {"train_loss": -6.572538375854492, "global_step": 110147, "epoch": 2622} {"train_loss": -6.43895149230957, "global_step": 110148, "epoch": 2622} {"train_loss": -6.525843620300293, "global_step": 110149, "epoch": 2622} {"train_loss": -6.536161422729492, "global_step": 110150, "epoch": 2622} {"train_loss": -6.390962600708008, "global_step": 110151, "epoch": 2622} {"train_loss": -6.565168857574463, "global_step": 110152, "epoch": 2622} {"train_loss": -6.461122989654541, "global_step": 110153, "epoch": 2622} {"train_loss": -6.447047233581543, "global_step": 110154, "epoch": 2622} {"train_loss": -6.442872047424316, "global_step": 110155, "epoch": 2622} {"train_loss": -6.5709228515625, "global_step": 110156, "epoch": 2622} {"train_loss": -6.497165203094482, "global_step": 110157, "epoch": 2622} {"train_loss": -6.442102432250977, "global_step": 110158, "epoch": 2622} {"train_loss": -6.47467041015625, "global_step": 110159, "epoch": 2622} {"train_loss": -6.426974296569824, "global_step": 110160, "epoch": 2622} {"train_loss": -6.427059173583984, "global_step": 110161, "epoch": 2622} {"train_loss": -6.498629570007324, "global_step": 110162, "epoch": 2622} {"train_loss": -6.504955291748047, "global_step": 110163, "epoch": 2622} {"train_loss": -6.441379547119141, "global_step": 110164, "epoch": 2622} {"train_loss": -6.476260423660278, "global_step": 110165, "epoch": 2622, "val_loss": 76546.9921875} {"train_loss": -6.487858772277832, "global_step": 110166, "epoch": 2623} {"train_loss": -6.443514347076416, "global_step": 110167, "epoch": 2623} {"train_loss": -6.274937629699707, "global_step": 110168, "epoch": 2623} {"train_loss": -6.610527992248535, "global_step": 110169, "epoch": 2623} {"train_loss": -6.379637241363525, "global_step": 110170, "epoch": 2623} {"train_loss": -6.584839820861816, "global_step": 110171, "epoch": 2623} {"train_loss": -6.510343074798584, "global_step": 110172, "epoch": 2623} {"train_loss": -6.447072982788086, "global_step": 110173, "epoch": 2623} {"train_loss": -6.581753730773926, "global_step": 110174, "epoch": 2623} {"train_loss": -6.443699836730957, "global_step": 110175, "epoch": 2623} {"train_loss": -6.551725387573242, "global_step": 110176, "epoch": 2623} {"train_loss": -6.520617485046387, "global_step": 110177, "epoch": 2623} {"train_loss": -6.367846488952637, "global_step": 110178, "epoch": 2623} {"train_loss": -6.5291290283203125, "global_step": 110179, "epoch": 2623} {"train_loss": -6.4704084396362305, "global_step": 110180, "epoch": 2623} {"train_loss": -6.472343921661377, "global_step": 110181, "epoch": 2623} {"train_loss": -6.44011116027832, "global_step": 110182, "epoch": 2623} {"train_loss": -6.522401332855225, "global_step": 110183, "epoch": 2623} {"train_loss": -6.517879486083984, "global_step": 110184, "epoch": 2623} {"train_loss": -6.567785739898682, "global_step": 110185, "epoch": 2623} {"train_loss": -6.367718696594238, "global_step": 110186, "epoch": 2623} {"train_loss": -6.536655902862549, "global_step": 110187, "epoch": 2623} {"train_loss": -6.465227127075195, "global_step": 110188, "epoch": 2623} {"train_loss": -6.575514793395996, "global_step": 110189, "epoch": 2623} {"train_loss": -6.460245132446289, "global_step": 110190, "epoch": 2623} {"train_loss": -6.392271041870117, "global_step": 110191, "epoch": 2623} {"train_loss": -6.510112285614014, "global_step": 110192, "epoch": 2623} {"train_loss": -6.49110746383667, "global_step": 110193, "epoch": 2623} {"train_loss": -6.326031684875488, "global_step": 110194, "epoch": 2623} {"train_loss": -6.44694185256958, "global_step": 110195, "epoch": 2623} {"train_loss": -6.447494983673096, "global_step": 110196, "epoch": 2623} {"train_loss": -6.314594745635986, "global_step": 110197, "epoch": 2623} {"train_loss": -6.4543280601501465, "global_step": 110198, "epoch": 2623} {"train_loss": -6.42503547668457, "global_step": 110199, "epoch": 2623} {"train_loss": -6.314423561096191, "global_step": 110200, "epoch": 2623} {"train_loss": -6.595000267028809, "global_step": 110201, "epoch": 2623} {"train_loss": -6.399509906768799, "global_step": 110202, "epoch": 2623} {"train_loss": -6.413336753845215, "global_step": 110203, "epoch": 2623} {"train_loss": -6.418449878692627, "global_step": 110204, "epoch": 2623} {"train_loss": -6.524443626403809, "global_step": 110205, "epoch": 2623} {"train_loss": -6.504162788391113, "global_step": 110206, "epoch": 2623} {"train_loss": -6.4672658670516245, "global_step": 110207, "epoch": 2623, "val_loss": 76132.265625} {"train_loss": -6.389102935791016, "global_step": 110208, "epoch": 2624} {"train_loss": -6.472385406494141, "global_step": 110209, "epoch": 2624} {"train_loss": -6.446547985076904, "global_step": 110210, "epoch": 2624} {"train_loss": -6.4707183837890625, "global_step": 110211, "epoch": 2624} {"train_loss": -6.397069454193115, "global_step": 110212, "epoch": 2624} {"train_loss": -6.403623580932617, "global_step": 110213, "epoch": 2624} {"train_loss": -6.513166427612305, "global_step": 110214, "epoch": 2624} {"train_loss": -6.5774993896484375, "global_step": 110215, "epoch": 2624} {"train_loss": -6.4568586349487305, "global_step": 110216, "epoch": 2624} {"train_loss": -6.468779563903809, "global_step": 110217, "epoch": 2624} {"train_loss": -6.440075874328613, "global_step": 110218, "epoch": 2624} {"train_loss": -6.440755844116211, "global_step": 110219, "epoch": 2624} {"train_loss": -6.458370208740234, "global_step": 110220, "epoch": 2624} {"train_loss": -6.429922103881836, "global_step": 110221, "epoch": 2624} {"train_loss": -6.487375259399414, "global_step": 110222, "epoch": 2624} {"train_loss": -6.6165452003479, "global_step": 110223, "epoch": 2624} {"train_loss": -6.541216850280762, "global_step": 110224, "epoch": 2624} {"train_loss": -6.443854331970215, "global_step": 110225, "epoch": 2624} {"train_loss": -6.5257415771484375, "global_step": 110226, "epoch": 2624} {"train_loss": -6.36739444732666, "global_step": 110227, "epoch": 2624} {"train_loss": -6.547168254852295, "global_step": 110228, "epoch": 2624} {"train_loss": -6.365896224975586, "global_step": 110229, "epoch": 2624} {"train_loss": -6.396953582763672, "global_step": 110230, "epoch": 2624} {"train_loss": -6.357198238372803, "global_step": 110231, "epoch": 2624} {"train_loss": -6.240461349487305, "global_step": 110232, "epoch": 2624} {"train_loss": -6.437472343444824, "global_step": 110233, "epoch": 2624} {"train_loss": -6.302112579345703, "global_step": 110234, "epoch": 2624} {"train_loss": -6.246135711669922, "global_step": 110235, "epoch": 2624} {"train_loss": -6.330837726593018, "global_step": 110236, "epoch": 2624} {"train_loss": -6.288209915161133, "global_step": 110237, "epoch": 2624} {"train_loss": -6.4767560958862305, "global_step": 110238, "epoch": 2624} {"train_loss": -6.399941444396973, "global_step": 110239, "epoch": 2624} {"train_loss": -6.434903144836426, "global_step": 110240, "epoch": 2624} {"train_loss": -6.423007965087891, "global_step": 110241, "epoch": 2624} {"train_loss": -6.391979217529297, "global_step": 110242, "epoch": 2624} {"train_loss": -6.319396018981934, "global_step": 110243, "epoch": 2624} {"train_loss": -6.5394415855407715, "global_step": 110244, "epoch": 2624} {"train_loss": -6.458868980407715, "global_step": 110245, "epoch": 2624} {"train_loss": -6.392702579498291, "global_step": 110246, "epoch": 2624} {"train_loss": -6.530572891235352, "global_step": 110247, "epoch": 2624} {"train_loss": -6.345249176025391, "global_step": 110248, "epoch": 2624} {"train_loss": -6.4297479674929665, "global_step": 110249, "epoch": 2624, "val_loss": 76299.1796875} {"train_loss": -6.39597749710083, "global_step": 110250, "epoch": 2625} {"train_loss": -6.353610038757324, "global_step": 110251, "epoch": 2625} {"train_loss": -6.412607192993164, "global_step": 110252, "epoch": 2625} {"train_loss": -6.428564548492432, "global_step": 110253, "epoch": 2625} {"train_loss": -6.427370071411133, "global_step": 110254, "epoch": 2625} {"train_loss": -6.417564392089844, "global_step": 110255, "epoch": 2625} {"train_loss": -6.300511360168457, "global_step": 110256, "epoch": 2625} {"train_loss": -6.5036468505859375, "global_step": 110257, "epoch": 2625} {"train_loss": -6.320974349975586, "global_step": 110258, "epoch": 2625} {"train_loss": -6.521552562713623, "global_step": 110259, "epoch": 2625} {"train_loss": -6.468619346618652, "global_step": 110260, "epoch": 2625} {"train_loss": -6.332124710083008, "global_step": 110261, "epoch": 2625} {"train_loss": -6.513651371002197, "global_step": 110262, "epoch": 2625} {"train_loss": -6.358623504638672, "global_step": 110263, "epoch": 2625} {"train_loss": -6.4289445877075195, "global_step": 110264, "epoch": 2625} {"train_loss": -6.376838684082031, "global_step": 110265, "epoch": 2625} {"train_loss": -6.365739822387695, "global_step": 110266, "epoch": 2625} {"train_loss": -6.462505340576172, "global_step": 110267, "epoch": 2625} {"train_loss": -6.468757152557373, "global_step": 110268, "epoch": 2625} {"train_loss": -6.487987041473389, "global_step": 110269, "epoch": 2625} {"train_loss": -6.34765100479126, "global_step": 110270, "epoch": 2625} {"train_loss": -6.341585159301758, "global_step": 110271, "epoch": 2625} {"train_loss": -6.307726860046387, "global_step": 110272, "epoch": 2625} {"train_loss": -6.374852657318115, "global_step": 110273, "epoch": 2625} {"train_loss": -6.445549011230469, "global_step": 110274, "epoch": 2625} {"train_loss": -6.337100028991699, "global_step": 110275, "epoch": 2625} {"train_loss": -6.461390972137451, "global_step": 110276, "epoch": 2625} {"train_loss": -6.322864532470703, "global_step": 110277, "epoch": 2625} {"train_loss": -6.362319469451904, "global_step": 110278, "epoch": 2625} {"train_loss": -6.413267612457275, "global_step": 110279, "epoch": 2625} {"train_loss": -6.494873046875, "global_step": 110280, "epoch": 2625} {"train_loss": -6.3816680908203125, "global_step": 110281, "epoch": 2625} {"train_loss": -6.242107391357422, "global_step": 110282, "epoch": 2625} {"train_loss": -6.45968770980835, "global_step": 110283, "epoch": 2625} {"train_loss": -6.390180587768555, "global_step": 110284, "epoch": 2625} {"train_loss": -6.386510372161865, "global_step": 110285, "epoch": 2625} {"train_loss": -6.417575836181641, "global_step": 110286, "epoch": 2625} {"train_loss": -6.284526824951172, "global_step": 110287, "epoch": 2625} {"train_loss": -6.450753211975098, "global_step": 110288, "epoch": 2625} {"train_loss": -6.343609809875488, "global_step": 110289, "epoch": 2625} {"train_loss": -6.441298007965088, "global_step": 110290, "epoch": 2625} {"train_loss": -6.397601207097371, "global_step": 110291, "epoch": 2625, "val_loss": 76360.3125} {"train_loss": -6.499147415161133, "global_step": 110292, "epoch": 2626} {"train_loss": -6.327716827392578, "global_step": 110293, "epoch": 2626} {"train_loss": -6.5340423583984375, "global_step": 110294, "epoch": 2626} {"train_loss": -6.425287246704102, "global_step": 110295, "epoch": 2626} {"train_loss": -6.433269500732422, "global_step": 110296, "epoch": 2626} {"train_loss": -6.463290214538574, "global_step": 110297, "epoch": 2626} {"train_loss": -6.445113182067871, "global_step": 110298, "epoch": 2626} {"train_loss": -6.478933334350586, "global_step": 110299, "epoch": 2626} {"train_loss": -6.272100925445557, "global_step": 110300, "epoch": 2626} {"train_loss": -6.320857048034668, "global_step": 110301, "epoch": 2626} {"train_loss": -6.492986679077148, "global_step": 110302, "epoch": 2626} {"train_loss": -6.47850227355957, "global_step": 110303, "epoch": 2626} {"train_loss": -6.442914009094238, "global_step": 110304, "epoch": 2626} {"train_loss": -6.430877685546875, "global_step": 110305, "epoch": 2626} {"train_loss": -6.436134338378906, "global_step": 110306, "epoch": 2626} {"train_loss": -6.3547139167785645, "global_step": 110307, "epoch": 2626} {"train_loss": -6.380311489105225, "global_step": 110308, "epoch": 2626} {"train_loss": -6.350712776184082, "global_step": 110309, "epoch": 2626} {"train_loss": -6.413783073425293, "global_step": 110310, "epoch": 2626} {"train_loss": -6.5657219886779785, "global_step": 110311, "epoch": 2626} {"train_loss": -6.413227081298828, "global_step": 110312, "epoch": 2626} {"train_loss": -6.476595878601074, "global_step": 110313, "epoch": 2626} {"train_loss": -6.432714462280273, "global_step": 110314, "epoch": 2626} {"train_loss": -6.585661888122559, "global_step": 110315, "epoch": 2626} {"train_loss": -6.3942551612854, "global_step": 110316, "epoch": 2626} {"train_loss": -6.535304546356201, "global_step": 110317, "epoch": 2626} {"train_loss": -6.429277420043945, "global_step": 110318, "epoch": 2626} {"train_loss": -6.524627685546875, "global_step": 110319, "epoch": 2626} {"train_loss": -6.4810566902160645, "global_step": 110320, "epoch": 2626} {"train_loss": -6.516921043395996, "global_step": 110321, "epoch": 2626} {"train_loss": -6.593323707580566, "global_step": 110322, "epoch": 2626} {"train_loss": -6.513430595397949, "global_step": 110323, "epoch": 2626} {"train_loss": -6.5049543380737305, "global_step": 110324, "epoch": 2626} {"train_loss": -6.39495849609375, "global_step": 110325, "epoch": 2626} {"train_loss": -6.49687385559082, "global_step": 110326, "epoch": 2626} {"train_loss": -6.512696266174316, "global_step": 110327, "epoch": 2626} {"train_loss": -6.536027431488037, "global_step": 110328, "epoch": 2626} {"train_loss": -6.457627296447754, "global_step": 110329, "epoch": 2626} {"train_loss": -6.50887393951416, "global_step": 110330, "epoch": 2626} {"train_loss": -6.470996856689453, "global_step": 110331, "epoch": 2626} {"train_loss": -6.476261615753174, "global_step": 110332, "epoch": 2626} {"train_loss": -6.454905021758306, "global_step": 110333, "epoch": 2626, "val_loss": 76244.9921875} {"train_loss": -6.627292633056641, "global_step": 110334, "epoch": 2627} {"train_loss": -6.44913911819458, "global_step": 110335, "epoch": 2627} {"train_loss": -6.521311283111572, "global_step": 110336, "epoch": 2627} {"train_loss": -6.586480617523193, "global_step": 110337, "epoch": 2627} {"train_loss": -6.543817520141602, "global_step": 110338, "epoch": 2627} {"train_loss": -6.463543891906738, "global_step": 110339, "epoch": 2627} {"train_loss": -6.585827350616455, "global_step": 110340, "epoch": 2627} {"train_loss": -6.462472915649414, "global_step": 110341, "epoch": 2627} {"train_loss": -6.439513683319092, "global_step": 110342, "epoch": 2627} {"train_loss": -6.602018356323242, "global_step": 110343, "epoch": 2627} {"train_loss": -6.502089023590088, "global_step": 110344, "epoch": 2627} {"train_loss": -6.606906890869141, "global_step": 110345, "epoch": 2627} {"train_loss": -6.463290214538574, "global_step": 110346, "epoch": 2627} {"train_loss": -6.439772129058838, "global_step": 110347, "epoch": 2627} {"train_loss": -6.510988235473633, "global_step": 110348, "epoch": 2627} {"train_loss": -6.519752502441406, "global_step": 110349, "epoch": 2627} {"train_loss": -6.443356990814209, "global_step": 110350, "epoch": 2627} {"train_loss": -6.431496620178223, "global_step": 110351, "epoch": 2627} {"train_loss": -6.562303066253662, "global_step": 110352, "epoch": 2627} {"train_loss": -6.5225419998168945, "global_step": 110353, "epoch": 2627} {"train_loss": -6.490588665008545, "global_step": 110354, "epoch": 2627} {"train_loss": -6.495096683502197, "global_step": 110355, "epoch": 2627} {"train_loss": -6.421344757080078, "global_step": 110356, "epoch": 2627} {"train_loss": -6.585666179656982, "global_step": 110357, "epoch": 2627} {"train_loss": -6.514062881469727, "global_step": 110358, "epoch": 2627} {"train_loss": -6.357339859008789, "global_step": 110359, "epoch": 2627} {"train_loss": -6.4440484046936035, "global_step": 110360, "epoch": 2627} {"train_loss": -6.501727104187012, "global_step": 110361, "epoch": 2627} {"train_loss": -6.402365684509277, "global_step": 110362, "epoch": 2627} {"train_loss": -6.4712443351745605, "global_step": 110363, "epoch": 2627} {"train_loss": -6.31789493560791, "global_step": 110364, "epoch": 2627} {"train_loss": -6.481067657470703, "global_step": 110365, "epoch": 2627} {"train_loss": -6.454529762268066, "global_step": 110366, "epoch": 2627} {"train_loss": -6.3166422843933105, "global_step": 110367, "epoch": 2627} {"train_loss": -6.563790798187256, "global_step": 110368, "epoch": 2627} {"train_loss": -6.433008670806885, "global_step": 110369, "epoch": 2627} {"train_loss": -6.538607120513916, "global_step": 110370, "epoch": 2627} {"train_loss": -6.405016899108887, "global_step": 110371, "epoch": 2627} {"train_loss": -6.476135730743408, "global_step": 110372, "epoch": 2627} {"train_loss": -6.392446517944336, "global_step": 110373, "epoch": 2627} {"train_loss": -6.445462226867676, "global_step": 110374, "epoch": 2627} {"train_loss": -6.479987916492281, "global_step": 110375, "epoch": 2627, "val_loss": 76184.578125} {"train_loss": -6.3781938552856445, "global_step": 110376, "epoch": 2628} {"train_loss": -6.423214912414551, "global_step": 110377, "epoch": 2628} {"train_loss": -6.346677780151367, "global_step": 110378, "epoch": 2628} {"train_loss": -6.4472808837890625, "global_step": 110379, "epoch": 2628} {"train_loss": -6.43993616104126, "global_step": 110380, "epoch": 2628} {"train_loss": -6.401608467102051, "global_step": 110381, "epoch": 2628} {"train_loss": -6.446824073791504, "global_step": 110382, "epoch": 2628} {"train_loss": -6.420249938964844, "global_step": 110383, "epoch": 2628} {"train_loss": -6.397537708282471, "global_step": 110384, "epoch": 2628} {"train_loss": -6.494749546051025, "global_step": 110385, "epoch": 2628} {"train_loss": -6.323892593383789, "global_step": 110386, "epoch": 2628} {"train_loss": -6.438455581665039, "global_step": 110387, "epoch": 2628} {"train_loss": -6.439443588256836, "global_step": 110388, "epoch": 2628} {"train_loss": -6.495599746704102, "global_step": 110389, "epoch": 2628} {"train_loss": -6.467874526977539, "global_step": 110390, "epoch": 2628} {"train_loss": -6.4471564292907715, "global_step": 110391, "epoch": 2628} {"train_loss": -6.502098083496094, "global_step": 110392, "epoch": 2628} {"train_loss": -6.426383018493652, "global_step": 110393, "epoch": 2628} {"train_loss": -6.51295280456543, "global_step": 110394, "epoch": 2628} {"train_loss": -6.47184944152832, "global_step": 110395, "epoch": 2628} {"train_loss": -6.560981750488281, "global_step": 110396, "epoch": 2628} {"train_loss": -6.4762797355651855, "global_step": 110397, "epoch": 2628} {"train_loss": -6.492591381072998, "global_step": 110398, "epoch": 2628} {"train_loss": -6.444745063781738, "global_step": 110399, "epoch": 2628} {"train_loss": -6.427608966827393, "global_step": 110400, "epoch": 2628} {"train_loss": -6.451250076293945, "global_step": 110401, "epoch": 2628} {"train_loss": -6.4876580238342285, "global_step": 110402, "epoch": 2628} {"train_loss": -6.452465534210205, "global_step": 110403, "epoch": 2628} {"train_loss": -6.473541736602783, "global_step": 110404, "epoch": 2628} {"train_loss": -6.496560096740723, "global_step": 110405, "epoch": 2628} {"train_loss": -6.432511806488037, "global_step": 110406, "epoch": 2628} {"train_loss": -6.419431209564209, "global_step": 110407, "epoch": 2628} {"train_loss": -6.456419944763184, "global_step": 110408, "epoch": 2628} {"train_loss": -6.336665630340576, "global_step": 110409, "epoch": 2628} {"train_loss": -6.3727617263793945, "global_step": 110410, "epoch": 2628} {"train_loss": -6.443302154541016, "global_step": 110411, "epoch": 2628} {"train_loss": -6.5043792724609375, "global_step": 110412, "epoch": 2628} {"train_loss": -6.485273838043213, "global_step": 110413, "epoch": 2628} {"train_loss": -6.3414225578308105, "global_step": 110414, "epoch": 2628} {"train_loss": -6.337775707244873, "global_step": 110415, "epoch": 2628} {"train_loss": -6.394922256469727, "global_step": 110416, "epoch": 2628} {"train_loss": -6.435549100240071, "global_step": 110417, "epoch": 2628, "val_loss": 76154.3515625} {"train_loss": -6.456174373626709, "global_step": 110418, "epoch": 2629} {"train_loss": -6.498603820800781, "global_step": 110419, "epoch": 2629} {"train_loss": -6.444805145263672, "global_step": 110420, "epoch": 2629} {"train_loss": -6.221798419952393, "global_step": 110421, "epoch": 2629} {"train_loss": -6.431674957275391, "global_step": 110422, "epoch": 2629} {"train_loss": -6.3062968254089355, "global_step": 110423, "epoch": 2629} {"train_loss": -6.487035751342773, "global_step": 110424, "epoch": 2629} {"train_loss": -6.451087951660156, "global_step": 110425, "epoch": 2629} {"train_loss": -6.383496284484863, "global_step": 110426, "epoch": 2629} {"train_loss": -6.44770622253418, "global_step": 110427, "epoch": 2629} {"train_loss": -6.445221900939941, "global_step": 110428, "epoch": 2629} {"train_loss": -6.455848693847656, "global_step": 110429, "epoch": 2629} {"train_loss": -6.604147911071777, "global_step": 110430, "epoch": 2629} {"train_loss": -6.409302711486816, "global_step": 110431, "epoch": 2629} {"train_loss": -6.455763339996338, "global_step": 110432, "epoch": 2629} {"train_loss": -6.399591445922852, "global_step": 110433, "epoch": 2629} {"train_loss": -6.463021755218506, "global_step": 110434, "epoch": 2629} {"train_loss": -6.535292625427246, "global_step": 110435, "epoch": 2629} {"train_loss": -6.394444465637207, "global_step": 110436, "epoch": 2629} {"train_loss": -6.521755218505859, "global_step": 110437, "epoch": 2629} {"train_loss": -6.393283367156982, "global_step": 110438, "epoch": 2629} {"train_loss": -6.562847137451172, "global_step": 110439, "epoch": 2629} {"train_loss": -6.482582092285156, "global_step": 110440, "epoch": 2629} {"train_loss": -6.482400894165039, "global_step": 110441, "epoch": 2629} {"train_loss": -6.593629837036133, "global_step": 110442, "epoch": 2629} {"train_loss": -6.503423690795898, "global_step": 110443, "epoch": 2629} {"train_loss": -6.524852275848389, "global_step": 110444, "epoch": 2629} {"train_loss": -6.482316493988037, "global_step": 110445, "epoch": 2629} {"train_loss": -6.46622371673584, "global_step": 110446, "epoch": 2629} {"train_loss": -6.476223945617676, "global_step": 110447, "epoch": 2629} {"train_loss": -6.547499656677246, "global_step": 110448, "epoch": 2629} {"train_loss": -6.617639541625977, "global_step": 110449, "epoch": 2629} {"train_loss": -6.538025856018066, "global_step": 110450, "epoch": 2629} {"train_loss": -6.526610374450684, "global_step": 110451, "epoch": 2629} {"train_loss": -6.461939811706543, "global_step": 110452, "epoch": 2629} {"train_loss": -6.5083327293396, "global_step": 110453, "epoch": 2629} {"train_loss": -6.48411750793457, "global_step": 110454, "epoch": 2629} {"train_loss": -6.3660101890563965, "global_step": 110455, "epoch": 2629} {"train_loss": -6.490428447723389, "global_step": 110456, "epoch": 2629} {"train_loss": -6.409607887268066, "global_step": 110457, "epoch": 2629} {"train_loss": -6.339420318603516, "global_step": 110458, "epoch": 2629} {"train_loss": -6.462961923508417, "global_step": 110459, "epoch": 2629, "val_loss": 76508.0859375} {"train_loss": -6.4966206550598145, "global_step": 110460, "epoch": 2630} {"train_loss": -6.241568088531494, "global_step": 110461, "epoch": 2630} {"train_loss": -6.459979057312012, "global_step": 110462, "epoch": 2630} {"train_loss": -6.537964820861816, "global_step": 110463, "epoch": 2630} {"train_loss": -6.405879020690918, "global_step": 110464, "epoch": 2630} {"train_loss": -6.497363567352295, "global_step": 110465, "epoch": 2630} {"train_loss": -6.403982639312744, "global_step": 110466, "epoch": 2630} {"train_loss": -6.517468452453613, "global_step": 110467, "epoch": 2630} {"train_loss": -6.414154052734375, "global_step": 110468, "epoch": 2630} {"train_loss": -6.4566731452941895, "global_step": 110469, "epoch": 2630} {"train_loss": -6.472043991088867, "global_step": 110470, "epoch": 2630} {"train_loss": -6.48716926574707, "global_step": 110471, "epoch": 2630} {"train_loss": -6.419827938079834, "global_step": 110472, "epoch": 2630} {"train_loss": -6.3836469650268555, "global_step": 110473, "epoch": 2630} {"train_loss": -6.500864028930664, "global_step": 110474, "epoch": 2630} {"train_loss": -6.323225021362305, "global_step": 110475, "epoch": 2630} {"train_loss": -6.4488325119018555, "global_step": 110476, "epoch": 2630} {"train_loss": -6.560124397277832, "global_step": 110477, "epoch": 2630} {"train_loss": -6.419656753540039, "global_step": 110478, "epoch": 2630} {"train_loss": -6.4615478515625, "global_step": 110479, "epoch": 2630} {"train_loss": -6.414856910705566, "global_step": 110480, "epoch": 2630} {"train_loss": -6.343006610870361, "global_step": 110481, "epoch": 2630} {"train_loss": -6.489452838897705, "global_step": 110482, "epoch": 2630} {"train_loss": -6.293203353881836, "global_step": 110483, "epoch": 2630} {"train_loss": -6.351066589355469, "global_step": 110484, "epoch": 2630} {"train_loss": -6.487779140472412, "global_step": 110485, "epoch": 2630} {"train_loss": -6.484395980834961, "global_step": 110486, "epoch": 2630} {"train_loss": -6.403515815734863, "global_step": 110487, "epoch": 2630} {"train_loss": -6.386594772338867, "global_step": 110488, "epoch": 2630} {"train_loss": -6.414836883544922, "global_step": 110489, "epoch": 2630} {"train_loss": -6.392409801483154, "global_step": 110490, "epoch": 2630} {"train_loss": -6.434653282165527, "global_step": 110491, "epoch": 2630} {"train_loss": -6.470522880554199, "global_step": 110492, "epoch": 2630} {"train_loss": -6.474853515625, "global_step": 110493, "epoch": 2630} {"train_loss": -6.574438571929932, "global_step": 110494, "epoch": 2630} {"train_loss": -6.290333271026611, "global_step": 110495, "epoch": 2630} {"train_loss": -6.5049848556518555, "global_step": 110496, "epoch": 2630} {"train_loss": -6.470982551574707, "global_step": 110497, "epoch": 2630} {"train_loss": -6.290706634521484, "global_step": 110498, "epoch": 2630} {"train_loss": -6.5237226486206055, "global_step": 110499, "epoch": 2630} {"train_loss": -6.264913082122803, "global_step": 110500, "epoch": 2630} {"train_loss": -6.42990315528143, "global_step": 110501, "epoch": 2630, "val_loss": 76314.984375} {"train_loss": -6.3919477462768555, "global_step": 110502, "epoch": 2631} {"train_loss": -6.43731689453125, "global_step": 110503, "epoch": 2631} {"train_loss": -6.4929609298706055, "global_step": 110504, "epoch": 2631} {"train_loss": -6.438150405883789, "global_step": 110505, "epoch": 2631} {"train_loss": -6.45078706741333, "global_step": 110506, "epoch": 2631} {"train_loss": -6.429816246032715, "global_step": 110507, "epoch": 2631} {"train_loss": -6.5689167976379395, "global_step": 110508, "epoch": 2631} {"train_loss": -6.398755073547363, "global_step": 110509, "epoch": 2631} {"train_loss": -6.520541191101074, "global_step": 110510, "epoch": 2631} {"train_loss": -6.411296844482422, "global_step": 110511, "epoch": 2631} {"train_loss": -6.487570762634277, "global_step": 110512, "epoch": 2631} {"train_loss": -6.391528129577637, "global_step": 110513, "epoch": 2631} {"train_loss": -6.404015064239502, "global_step": 110514, "epoch": 2631} {"train_loss": -6.477534294128418, "global_step": 110515, "epoch": 2631} {"train_loss": -6.447655200958252, "global_step": 110516, "epoch": 2631} {"train_loss": -6.401671886444092, "global_step": 110517, "epoch": 2631} {"train_loss": -6.457401752471924, "global_step": 110518, "epoch": 2631} {"train_loss": -6.584444046020508, "global_step": 110519, "epoch": 2631} {"train_loss": -6.467578887939453, "global_step": 110520, "epoch": 2631} {"train_loss": -6.424843788146973, "global_step": 110521, "epoch": 2631} {"train_loss": -6.445439338684082, "global_step": 110522, "epoch": 2631} {"train_loss": -6.524972438812256, "global_step": 110523, "epoch": 2631} {"train_loss": -6.479609966278076, "global_step": 110524, "epoch": 2631} {"train_loss": -6.370658874511719, "global_step": 110525, "epoch": 2631} {"train_loss": -6.476362228393555, "global_step": 110526, "epoch": 2631} {"train_loss": -6.520561218261719, "global_step": 110527, "epoch": 2631} {"train_loss": -6.502050399780273, "global_step": 110528, "epoch": 2631} {"train_loss": -6.629192352294922, "global_step": 110529, "epoch": 2631} {"train_loss": -6.465178966522217, "global_step": 110530, "epoch": 2631} {"train_loss": -6.50861930847168, "global_step": 110531, "epoch": 2631} {"train_loss": -6.339707374572754, "global_step": 110532, "epoch": 2631} {"train_loss": -6.436380863189697, "global_step": 110533, "epoch": 2631} {"train_loss": -6.4283447265625, "global_step": 110534, "epoch": 2631} {"train_loss": -6.445629119873047, "global_step": 110535, "epoch": 2631} {"train_loss": -6.547083854675293, "global_step": 110536, "epoch": 2631} {"train_loss": -6.43314266204834, "global_step": 110537, "epoch": 2631} {"train_loss": -6.426793098449707, "global_step": 110538, "epoch": 2631} {"train_loss": -6.500727653503418, "global_step": 110539, "epoch": 2631} {"train_loss": -6.52202033996582, "global_step": 110540, "epoch": 2631} {"train_loss": -6.484580039978027, "global_step": 110541, "epoch": 2631} {"train_loss": -6.419099807739258, "global_step": 110542, "epoch": 2631} {"train_loss": -6.46289552961077, "global_step": 110543, "epoch": 2631, "val_loss": 76286.0625} {"train_loss": -6.424310207366943, "global_step": 110544, "epoch": 2632} {"train_loss": -6.533829689025879, "global_step": 110545, "epoch": 2632} {"train_loss": -6.560441970825195, "global_step": 110546, "epoch": 2632} {"train_loss": -6.466217994689941, "global_step": 110547, "epoch": 2632} {"train_loss": -6.470439434051514, "global_step": 110548, "epoch": 2632} {"train_loss": -6.510393142700195, "global_step": 110549, "epoch": 2632} {"train_loss": -6.499996185302734, "global_step": 110550, "epoch": 2632} {"train_loss": -6.434451103210449, "global_step": 110551, "epoch": 2632} {"train_loss": -6.494231224060059, "global_step": 110552, "epoch": 2632} {"train_loss": -6.5835418701171875, "global_step": 110553, "epoch": 2632} {"train_loss": -6.375734329223633, "global_step": 110554, "epoch": 2632} {"train_loss": -6.435358047485352, "global_step": 110555, "epoch": 2632} {"train_loss": -6.519700050354004, "global_step": 110556, "epoch": 2632} {"train_loss": -6.482911586761475, "global_step": 110557, "epoch": 2632} {"train_loss": -6.395644187927246, "global_step": 110558, "epoch": 2632} {"train_loss": -6.494811058044434, "global_step": 110559, "epoch": 2632} {"train_loss": -6.497206687927246, "global_step": 110560, "epoch": 2632} {"train_loss": -6.474615097045898, "global_step": 110561, "epoch": 2632} {"train_loss": -6.5071306228637695, "global_step": 110562, "epoch": 2632} {"train_loss": -6.380777835845947, "global_step": 110563, "epoch": 2632} {"train_loss": -6.4886884689331055, "global_step": 110564, "epoch": 2632} {"train_loss": -6.5893425941467285, "global_step": 110565, "epoch": 2632} {"train_loss": -6.547662734985352, "global_step": 110566, "epoch": 2632} {"train_loss": -6.46708869934082, "global_step": 110567, "epoch": 2632} {"train_loss": -6.534910202026367, "global_step": 110568, "epoch": 2632} {"train_loss": -6.41297721862793, "global_step": 110569, "epoch": 2632} {"train_loss": -6.646810054779053, "global_step": 110570, "epoch": 2632} {"train_loss": -6.608371734619141, "global_step": 110571, "epoch": 2632} {"train_loss": -6.332794189453125, "global_step": 110572, "epoch": 2632} {"train_loss": -6.364860534667969, "global_step": 110573, "epoch": 2632} {"train_loss": -6.40693473815918, "global_step": 110574, "epoch": 2632} {"train_loss": -6.548813343048096, "global_step": 110575, "epoch": 2632} {"train_loss": -6.394331932067871, "global_step": 110576, "epoch": 2632} {"train_loss": -6.386035919189453, "global_step": 110577, "epoch": 2632} {"train_loss": -6.569273471832275, "global_step": 110578, "epoch": 2632} {"train_loss": -6.370604991912842, "global_step": 110579, "epoch": 2632} {"train_loss": -6.375945091247559, "global_step": 110580, "epoch": 2632} {"train_loss": -6.482574939727783, "global_step": 110581, "epoch": 2632} {"train_loss": -6.488555908203125, "global_step": 110582, "epoch": 2632} {"train_loss": -6.500206470489502, "global_step": 110583, "epoch": 2632} {"train_loss": -6.452178001403809, "global_step": 110584, "epoch": 2632} {"train_loss": -6.471693243299212, "global_step": 110585, "epoch": 2632, "val_loss": 76379.484375} {"train_loss": -6.471733093261719, "global_step": 110586, "epoch": 2633} {"train_loss": -6.478368759155273, "global_step": 110587, "epoch": 2633} {"train_loss": -6.314528465270996, "global_step": 110588, "epoch": 2633} {"train_loss": -6.446186065673828, "global_step": 110589, "epoch": 2633} {"train_loss": -6.543643951416016, "global_step": 110590, "epoch": 2633} {"train_loss": -6.524530410766602, "global_step": 110591, "epoch": 2633} {"train_loss": -6.413277626037598, "global_step": 110592, "epoch": 2633} {"train_loss": -6.464892387390137, "global_step": 110593, "epoch": 2633} {"train_loss": -6.468601703643799, "global_step": 110594, "epoch": 2633} {"train_loss": -6.57840633392334, "global_step": 110595, "epoch": 2633} {"train_loss": -6.52406120300293, "global_step": 110596, "epoch": 2633} {"train_loss": -6.401371002197266, "global_step": 110597, "epoch": 2633} {"train_loss": -6.504009246826172, "global_step": 110598, "epoch": 2633} {"train_loss": -6.5148396492004395, "global_step": 110599, "epoch": 2633} {"train_loss": -6.5160722732543945, "global_step": 110600, "epoch": 2633} {"train_loss": -6.53373908996582, "global_step": 110601, "epoch": 2633} {"train_loss": -6.437384128570557, "global_step": 110602, "epoch": 2633} {"train_loss": -6.549699783325195, "global_step": 110603, "epoch": 2633} {"train_loss": -6.555596351623535, "global_step": 110604, "epoch": 2633} {"train_loss": -6.505579948425293, "global_step": 110605, "epoch": 2633} {"train_loss": -6.473097324371338, "global_step": 110606, "epoch": 2633} {"train_loss": -6.58070707321167, "global_step": 110607, "epoch": 2633} {"train_loss": -6.365888595581055, "global_step": 110608, "epoch": 2633} {"train_loss": -6.47968864440918, "global_step": 110609, "epoch": 2633} {"train_loss": -6.512322902679443, "global_step": 110610, "epoch": 2633} {"train_loss": -6.482951641082764, "global_step": 110611, "epoch": 2633} {"train_loss": -6.603196144104004, "global_step": 110612, "epoch": 2633} {"train_loss": -6.384930610656738, "global_step": 110613, "epoch": 2633} {"train_loss": -6.570016860961914, "global_step": 110614, "epoch": 2633} {"train_loss": -6.562242031097412, "global_step": 110615, "epoch": 2633} {"train_loss": -6.523548126220703, "global_step": 110616, "epoch": 2633} {"train_loss": -6.521060943603516, "global_step": 110617, "epoch": 2633} {"train_loss": -6.493520259857178, "global_step": 110618, "epoch": 2633} {"train_loss": -6.496808052062988, "global_step": 110619, "epoch": 2633} {"train_loss": -6.587116718292236, "global_step": 110620, "epoch": 2633} {"train_loss": -6.499765396118164, "global_step": 110621, "epoch": 2633} {"train_loss": -6.48888635635376, "global_step": 110622, "epoch": 2633} {"train_loss": -6.529473781585693, "global_step": 110623, "epoch": 2633} {"train_loss": -6.521094799041748, "global_step": 110624, "epoch": 2633} {"train_loss": -6.394230365753174, "global_step": 110625, "epoch": 2633} {"train_loss": -6.5943603515625, "global_step": 110626, "epoch": 2633} {"train_loss": -6.49837387175787, "global_step": 110627, "epoch": 2633, "val_loss": 76339.0703125} {"train_loss": -6.464388370513916, "global_step": 110628, "epoch": 2634} {"train_loss": -6.454215049743652, "global_step": 110629, "epoch": 2634} {"train_loss": -6.548994064331055, "global_step": 110630, "epoch": 2634} {"train_loss": -6.66464376449585, "global_step": 110631, "epoch": 2634} {"train_loss": -6.605772018432617, "global_step": 110632, "epoch": 2634} {"train_loss": -6.433483600616455, "global_step": 110633, "epoch": 2634} {"train_loss": -6.517694473266602, "global_step": 110634, "epoch": 2634} {"train_loss": -6.4847211837768555, "global_step": 110635, "epoch": 2634} {"train_loss": -6.43419075012207, "global_step": 110636, "epoch": 2634} {"train_loss": -6.479306221008301, "global_step": 110637, "epoch": 2634} {"train_loss": -6.507335662841797, "global_step": 110638, "epoch": 2634} {"train_loss": -6.390636444091797, "global_step": 110639, "epoch": 2634} {"train_loss": -6.530220031738281, "global_step": 110640, "epoch": 2634} {"train_loss": -6.523034572601318, "global_step": 110641, "epoch": 2634} {"train_loss": -6.507513046264648, "global_step": 110642, "epoch": 2634} {"train_loss": -6.477987289428711, "global_step": 110643, "epoch": 2634} {"train_loss": -6.48931884765625, "global_step": 110644, "epoch": 2634} {"train_loss": -6.519123077392578, "global_step": 110645, "epoch": 2634} {"train_loss": -6.51932954788208, "global_step": 110646, "epoch": 2634} {"train_loss": -6.511022090911865, "global_step": 110647, "epoch": 2634} {"train_loss": -6.436253070831299, "global_step": 110648, "epoch": 2634} {"train_loss": -6.42761754989624, "global_step": 110649, "epoch": 2634} {"train_loss": -6.47669792175293, "global_step": 110650, "epoch": 2634} {"train_loss": -6.522406578063965, "global_step": 110651, "epoch": 2634} {"train_loss": -6.461813449859619, "global_step": 110652, "epoch": 2634} {"train_loss": -6.546740531921387, "global_step": 110653, "epoch": 2634} {"train_loss": -6.425116539001465, "global_step": 110654, "epoch": 2634} {"train_loss": -6.351327419281006, "global_step": 110655, "epoch": 2634} {"train_loss": -6.4462995529174805, "global_step": 110656, "epoch": 2634} {"train_loss": -6.374255657196045, "global_step": 110657, "epoch": 2634} {"train_loss": -6.497230529785156, "global_step": 110658, "epoch": 2634} {"train_loss": -6.277400493621826, "global_step": 110659, "epoch": 2634} {"train_loss": -6.435686111450195, "global_step": 110660, "epoch": 2634} {"train_loss": -6.448967933654785, "global_step": 110661, "epoch": 2634} {"train_loss": -6.328243255615234, "global_step": 110662, "epoch": 2634} {"train_loss": -6.330942153930664, "global_step": 110663, "epoch": 2634} {"train_loss": -6.390806198120117, "global_step": 110664, "epoch": 2634} {"train_loss": -6.436094760894775, "global_step": 110665, "epoch": 2634} {"train_loss": -6.481288909912109, "global_step": 110666, "epoch": 2634} {"train_loss": -6.326416015625, "global_step": 110667, "epoch": 2634} {"train_loss": -6.380738258361816, "global_step": 110668, "epoch": 2634} {"train_loss": -6.462801365625291, "global_step": 110669, "epoch": 2634, "val_loss": 76479.59375} {"train_loss": -6.3696746826171875, "global_step": 110670, "epoch": 2635} {"train_loss": -6.550606727600098, "global_step": 110671, "epoch": 2635} {"train_loss": -6.278106689453125, "global_step": 110672, "epoch": 2635} {"train_loss": -6.358518600463867, "global_step": 110673, "epoch": 2635} {"train_loss": -6.48148775100708, "global_step": 110674, "epoch": 2635} {"train_loss": -6.502923011779785, "global_step": 110675, "epoch": 2635} {"train_loss": -6.473085880279541, "global_step": 110676, "epoch": 2635} {"train_loss": -6.474987983703613, "global_step": 110677, "epoch": 2635} {"train_loss": -6.3658318519592285, "global_step": 110678, "epoch": 2635} {"train_loss": -6.482110977172852, "global_step": 110679, "epoch": 2635} {"train_loss": -6.424870014190674, "global_step": 110680, "epoch": 2635} {"train_loss": -6.454726219177246, "global_step": 110681, "epoch": 2635} {"train_loss": -6.38258695602417, "global_step": 110682, "epoch": 2635} {"train_loss": -6.49535608291626, "global_step": 110683, "epoch": 2635} {"train_loss": -6.633663177490234, "global_step": 110684, "epoch": 2635} {"train_loss": -6.536492347717285, "global_step": 110685, "epoch": 2635} {"train_loss": -6.383920669555664, "global_step": 110686, "epoch": 2635} {"train_loss": -6.490412712097168, "global_step": 110687, "epoch": 2635} {"train_loss": -6.507221221923828, "global_step": 110688, "epoch": 2635} {"train_loss": -6.440286636352539, "global_step": 110689, "epoch": 2635} {"train_loss": -6.44404411315918, "global_step": 110690, "epoch": 2635} {"train_loss": -6.439175605773926, "global_step": 110691, "epoch": 2635} {"train_loss": -6.342693328857422, "global_step": 110692, "epoch": 2635} {"train_loss": -6.416731834411621, "global_step": 110693, "epoch": 2635} {"train_loss": -6.481043338775635, "global_step": 110694, "epoch": 2635} {"train_loss": -6.451184272766113, "global_step": 110695, "epoch": 2635} {"train_loss": -6.50412654876709, "global_step": 110696, "epoch": 2635} {"train_loss": -6.420209884643555, "global_step": 110697, "epoch": 2635} {"train_loss": -6.416832447052002, "global_step": 110698, "epoch": 2635} {"train_loss": -6.4876708984375, "global_step": 110699, "epoch": 2635} {"train_loss": -6.416489601135254, "global_step": 110700, "epoch": 2635} {"train_loss": -6.466082572937012, "global_step": 110701, "epoch": 2635} {"train_loss": -6.438680648803711, "global_step": 110702, "epoch": 2635} {"train_loss": -6.456916809082031, "global_step": 110703, "epoch": 2635} {"train_loss": -6.411405086517334, "global_step": 110704, "epoch": 2635} {"train_loss": -6.4322381019592285, "global_step": 110705, "epoch": 2635} {"train_loss": -6.429067134857178, "global_step": 110706, "epoch": 2635} {"train_loss": -6.414543628692627, "global_step": 110707, "epoch": 2635} {"train_loss": -6.4008331298828125, "global_step": 110708, "epoch": 2635} {"train_loss": -6.467796802520752, "global_step": 110709, "epoch": 2635} {"train_loss": -6.569115161895752, "global_step": 110710, "epoch": 2635} {"train_loss": -6.447162503287906, "global_step": 110711, "epoch": 2635, "val_loss": 76390.2265625} {"train_loss": -6.446079730987549, "global_step": 110712, "epoch": 2636} {"train_loss": -6.472336769104004, "global_step": 110713, "epoch": 2636} {"train_loss": -6.580693244934082, "global_step": 110714, "epoch": 2636} {"train_loss": -6.525282859802246, "global_step": 110715, "epoch": 2636} {"train_loss": -6.5012593269348145, "global_step": 110716, "epoch": 2636} {"train_loss": -6.467885971069336, "global_step": 110717, "epoch": 2636} {"train_loss": -6.52243709564209, "global_step": 110718, "epoch": 2636} {"train_loss": -6.518326759338379, "global_step": 110719, "epoch": 2636} {"train_loss": -6.486296653747559, "global_step": 110720, "epoch": 2636} {"train_loss": -6.4411725997924805, "global_step": 110721, "epoch": 2636} {"train_loss": -6.424257755279541, "global_step": 110722, "epoch": 2636} {"train_loss": -6.4949750900268555, "global_step": 110723, "epoch": 2636} {"train_loss": -6.537230491638184, "global_step": 110724, "epoch": 2636} {"train_loss": -6.404325485229492, "global_step": 110725, "epoch": 2636} {"train_loss": -6.55283260345459, "global_step": 110726, "epoch": 2636} {"train_loss": -6.489687919616699, "global_step": 110727, "epoch": 2636} {"train_loss": -6.509889125823975, "global_step": 110728, "epoch": 2636} {"train_loss": -6.5177717208862305, "global_step": 110729, "epoch": 2636} {"train_loss": -6.468502044677734, "global_step": 110730, "epoch": 2636} {"train_loss": -6.502181053161621, "global_step": 110731, "epoch": 2636} {"train_loss": -6.41766881942749, "global_step": 110732, "epoch": 2636} {"train_loss": -6.548365592956543, "global_step": 110733, "epoch": 2636} {"train_loss": -6.555365562438965, "global_step": 110734, "epoch": 2636} {"train_loss": -6.489987373352051, "global_step": 110735, "epoch": 2636} {"train_loss": -6.551778793334961, "global_step": 110736, "epoch": 2636} {"train_loss": -6.507314682006836, "global_step": 110737, "epoch": 2636} {"train_loss": -6.497855186462402, "global_step": 110738, "epoch": 2636} {"train_loss": -6.4802961349487305, "global_step": 110739, "epoch": 2636} {"train_loss": -6.572572708129883, "global_step": 110740, "epoch": 2636} {"train_loss": -6.537171840667725, "global_step": 110741, "epoch": 2636} {"train_loss": -6.391746997833252, "global_step": 110742, "epoch": 2636} {"train_loss": -6.591499328613281, "global_step": 110743, "epoch": 2636} {"train_loss": -6.457606315612793, "global_step": 110744, "epoch": 2636} {"train_loss": -6.542744159698486, "global_step": 110745, "epoch": 2636} {"train_loss": -6.496400833129883, "global_step": 110746, "epoch": 2636} {"train_loss": -6.293582439422607, "global_step": 110747, "epoch": 2636} {"train_loss": -6.350683212280273, "global_step": 110748, "epoch": 2636} {"train_loss": -6.516148567199707, "global_step": 110749, "epoch": 2636} {"train_loss": -6.537235260009766, "global_step": 110750, "epoch": 2636} {"train_loss": -6.4078369140625, "global_step": 110751, "epoch": 2636} {"train_loss": -6.48048734664917, "global_step": 110752, "epoch": 2636} {"train_loss": -6.487794421968006, "global_step": 110753, "epoch": 2636, "val_loss": 76333.7890625} {"train_loss": -6.376031875610352, "global_step": 110754, "epoch": 2637} {"train_loss": -6.512523651123047, "global_step": 110755, "epoch": 2637} {"train_loss": -6.387235641479492, "global_step": 110756, "epoch": 2637} {"train_loss": -6.414382457733154, "global_step": 110757, "epoch": 2637} {"train_loss": -6.428544044494629, "global_step": 110758, "epoch": 2637} {"train_loss": -6.432730674743652, "global_step": 110759, "epoch": 2637} {"train_loss": -6.502196311950684, "global_step": 110760, "epoch": 2637} {"train_loss": -6.455103874206543, "global_step": 110761, "epoch": 2637} {"train_loss": -6.4662299156188965, "global_step": 110762, "epoch": 2637} {"train_loss": -6.554561614990234, "global_step": 110763, "epoch": 2637} {"train_loss": -6.579641342163086, "global_step": 110764, "epoch": 2637} {"train_loss": -6.435951232910156, "global_step": 110765, "epoch": 2637} {"train_loss": -6.5377397537231445, "global_step": 110766, "epoch": 2637} {"train_loss": -6.547162055969238, "global_step": 110767, "epoch": 2637} {"train_loss": -6.540225982666016, "global_step": 110768, "epoch": 2637} {"train_loss": -6.477906227111816, "global_step": 110769, "epoch": 2637} {"train_loss": -6.4581451416015625, "global_step": 110770, "epoch": 2637} {"train_loss": -6.457929611206055, "global_step": 110771, "epoch": 2637} {"train_loss": -6.505152702331543, "global_step": 110772, "epoch": 2637} {"train_loss": -6.445486068725586, "global_step": 110773, "epoch": 2637} {"train_loss": -6.4610185623168945, "global_step": 110774, "epoch": 2637} {"train_loss": -6.570683479309082, "global_step": 110775, "epoch": 2637} {"train_loss": -6.4060869216918945, "global_step": 110776, "epoch": 2637} {"train_loss": -6.595766067504883, "global_step": 110777, "epoch": 2637} {"train_loss": -6.467304229736328, "global_step": 110778, "epoch": 2637} {"train_loss": -6.521132946014404, "global_step": 110779, "epoch": 2637} {"train_loss": -6.568238258361816, "global_step": 110780, "epoch": 2637} {"train_loss": -6.522554397583008, "global_step": 110781, "epoch": 2637} {"train_loss": -6.523057460784912, "global_step": 110782, "epoch": 2637} {"train_loss": -6.380975723266602, "global_step": 110783, "epoch": 2637} {"train_loss": -6.521354675292969, "global_step": 110784, "epoch": 2637} {"train_loss": -6.501826286315918, "global_step": 110785, "epoch": 2637} {"train_loss": -6.507087707519531, "global_step": 110786, "epoch": 2637} {"train_loss": -6.513731956481934, "global_step": 110787, "epoch": 2637} {"train_loss": -6.553014755249023, "global_step": 110788, "epoch": 2637} {"train_loss": -6.425071716308594, "global_step": 110789, "epoch": 2637} {"train_loss": -6.486917495727539, "global_step": 110790, "epoch": 2637} {"train_loss": -6.5978217124938965, "global_step": 110791, "epoch": 2637} {"train_loss": -6.4603118896484375, "global_step": 110792, "epoch": 2637} {"train_loss": -6.488041877746582, "global_step": 110793, "epoch": 2637} {"train_loss": -6.449832439422607, "global_step": 110794, "epoch": 2637} {"train_loss": -6.4891084262302945, "global_step": 110795, "epoch": 2637, "val_loss": 76311.3125} {"train_loss": -6.480349540710449, "global_step": 110796, "epoch": 2638} {"train_loss": -6.59701681137085, "global_step": 110797, "epoch": 2638} {"train_loss": -6.518433570861816, "global_step": 110798, "epoch": 2638} {"train_loss": -6.52690315246582, "global_step": 110799, "epoch": 2638} {"train_loss": -6.507288932800293, "global_step": 110800, "epoch": 2638} {"train_loss": -6.663296222686768, "global_step": 110801, "epoch": 2638} {"train_loss": -6.542745113372803, "global_step": 110802, "epoch": 2638} {"train_loss": -6.458104133605957, "global_step": 110803, "epoch": 2638} {"train_loss": -6.41616153717041, "global_step": 110804, "epoch": 2638} {"train_loss": -6.45809268951416, "global_step": 110805, "epoch": 2638} {"train_loss": -6.550288200378418, "global_step": 110806, "epoch": 2638} {"train_loss": -6.424287796020508, "global_step": 110807, "epoch": 2638} {"train_loss": -6.576727867126465, "global_step": 110808, "epoch": 2638} {"train_loss": -6.483269691467285, "global_step": 110809, "epoch": 2638} {"train_loss": -6.372482776641846, "global_step": 110810, "epoch": 2638} {"train_loss": -6.572410583496094, "global_step": 110811, "epoch": 2638} {"train_loss": -6.441658020019531, "global_step": 110812, "epoch": 2638} {"train_loss": -6.468792915344238, "global_step": 110813, "epoch": 2638} {"train_loss": -6.3993353843688965, "global_step": 110814, "epoch": 2638} {"train_loss": -6.398813247680664, "global_step": 110815, "epoch": 2638} {"train_loss": -6.430965423583984, "global_step": 110816, "epoch": 2638} {"train_loss": -6.475589752197266, "global_step": 110817, "epoch": 2638} {"train_loss": -6.350958824157715, "global_step": 110818, "epoch": 2638} {"train_loss": -6.429574966430664, "global_step": 110819, "epoch": 2638} {"train_loss": -6.513467788696289, "global_step": 110820, "epoch": 2638} {"train_loss": -6.422446250915527, "global_step": 110821, "epoch": 2638} {"train_loss": -6.502854824066162, "global_step": 110822, "epoch": 2638} {"train_loss": -6.467540740966797, "global_step": 110823, "epoch": 2638} {"train_loss": -6.495423316955566, "global_step": 110824, "epoch": 2638} {"train_loss": -6.433111667633057, "global_step": 110825, "epoch": 2638} {"train_loss": -6.552364826202393, "global_step": 110826, "epoch": 2638} {"train_loss": -6.568995475769043, "global_step": 110827, "epoch": 2638} {"train_loss": -6.555235862731934, "global_step": 110828, "epoch": 2638} {"train_loss": -6.524437427520752, "global_step": 110829, "epoch": 2638} {"train_loss": -6.420839309692383, "global_step": 110830, "epoch": 2638} {"train_loss": -6.437678813934326, "global_step": 110831, "epoch": 2638} {"train_loss": -6.485048294067383, "global_step": 110832, "epoch": 2638} {"train_loss": -6.386889457702637, "global_step": 110833, "epoch": 2638} {"train_loss": -6.574543476104736, "global_step": 110834, "epoch": 2638} {"train_loss": -6.507396697998047, "global_step": 110835, "epoch": 2638} {"train_loss": -6.548213958740234, "global_step": 110836, "epoch": 2638} {"train_loss": -6.486514159611294, "global_step": 110837, "epoch": 2638, "val_loss": 76254.671875} {"train_loss": -6.650904178619385, "global_step": 110838, "epoch": 2639} {"train_loss": -6.485134124755859, "global_step": 110839, "epoch": 2639} {"train_loss": -6.517327308654785, "global_step": 110840, "epoch": 2639} {"train_loss": -6.438385486602783, "global_step": 110841, "epoch": 2639} {"train_loss": -6.466187477111816, "global_step": 110842, "epoch": 2639} {"train_loss": -6.4697160720825195, "global_step": 110843, "epoch": 2639} {"train_loss": -6.526932239532471, "global_step": 110844, "epoch": 2639} {"train_loss": -6.512441158294678, "global_step": 110845, "epoch": 2639} {"train_loss": -6.507566452026367, "global_step": 110846, "epoch": 2639} {"train_loss": -6.385537624359131, "global_step": 110847, "epoch": 2639} {"train_loss": -6.573871612548828, "global_step": 110848, "epoch": 2639} {"train_loss": -6.52345085144043, "global_step": 110849, "epoch": 2639} {"train_loss": -6.4751434326171875, "global_step": 110850, "epoch": 2639} {"train_loss": -6.397663593292236, "global_step": 110851, "epoch": 2639} {"train_loss": -6.542208194732666, "global_step": 110852, "epoch": 2639} {"train_loss": -6.586489677429199, "global_step": 110853, "epoch": 2639} {"train_loss": -6.525727272033691, "global_step": 110854, "epoch": 2639} {"train_loss": -6.447849273681641, "global_step": 110855, "epoch": 2639} {"train_loss": -6.398314952850342, "global_step": 110856, "epoch": 2639} {"train_loss": -6.374345779418945, "global_step": 110857, "epoch": 2639} {"train_loss": -6.340749740600586, "global_step": 110858, "epoch": 2639} {"train_loss": -6.572237014770508, "global_step": 110859, "epoch": 2639} {"train_loss": -6.301971435546875, "global_step": 110860, "epoch": 2639} {"train_loss": -6.349123954772949, "global_step": 110861, "epoch": 2639} {"train_loss": -6.430829048156738, "global_step": 110862, "epoch": 2639} {"train_loss": -6.312904357910156, "global_step": 110863, "epoch": 2639} {"train_loss": -6.436810493469238, "global_step": 110864, "epoch": 2639} {"train_loss": -6.30029821395874, "global_step": 110865, "epoch": 2639} {"train_loss": -6.459939002990723, "global_step": 110866, "epoch": 2639} {"train_loss": -6.3965349197387695, "global_step": 110867, "epoch": 2639} {"train_loss": -6.336030960083008, "global_step": 110868, "epoch": 2639} {"train_loss": -6.443169116973877, "global_step": 110869, "epoch": 2639} {"train_loss": -6.3375725746154785, "global_step": 110870, "epoch": 2639} {"train_loss": -6.447269439697266, "global_step": 110871, "epoch": 2639} {"train_loss": -6.385544776916504, "global_step": 110872, "epoch": 2639} {"train_loss": -6.360835552215576, "global_step": 110873, "epoch": 2639} {"train_loss": -6.43380069732666, "global_step": 110874, "epoch": 2639} {"train_loss": -6.403853416442871, "global_step": 110875, "epoch": 2639} {"train_loss": -6.410013198852539, "global_step": 110876, "epoch": 2639} {"train_loss": -6.453579425811768, "global_step": 110877, "epoch": 2639} {"train_loss": -6.420787811279297, "global_step": 110878, "epoch": 2639} {"train_loss": -6.441677729288737, "global_step": 110879, "epoch": 2639, "val_loss": 76415.9453125} {"train_loss": -6.510338306427002, "global_step": 110880, "epoch": 2640} {"train_loss": -6.327926158905029, "global_step": 110881, "epoch": 2640} {"train_loss": -6.48885440826416, "global_step": 110882, "epoch": 2640} {"train_loss": -6.40605354309082, "global_step": 110883, "epoch": 2640} {"train_loss": -6.411983966827393, "global_step": 110884, "epoch": 2640} {"train_loss": -6.316341400146484, "global_step": 110885, "epoch": 2640} {"train_loss": -6.4937543869018555, "global_step": 110886, "epoch": 2640} {"train_loss": -6.424768447875977, "global_step": 110887, "epoch": 2640} {"train_loss": -6.428564548492432, "global_step": 110888, "epoch": 2640} {"train_loss": -6.451460838317871, "global_step": 110889, "epoch": 2640} {"train_loss": -6.405298233032227, "global_step": 110890, "epoch": 2640} {"train_loss": -6.518688201904297, "global_step": 110891, "epoch": 2640} {"train_loss": -6.385006427764893, "global_step": 110892, "epoch": 2640} {"train_loss": -6.340811252593994, "global_step": 110893, "epoch": 2640} {"train_loss": -6.399595737457275, "global_step": 110894, "epoch": 2640} {"train_loss": -6.464643478393555, "global_step": 110895, "epoch": 2640} {"train_loss": -6.381017208099365, "global_step": 110896, "epoch": 2640} {"train_loss": -6.379482269287109, "global_step": 110897, "epoch": 2640} {"train_loss": -6.47070837020874, "global_step": 110898, "epoch": 2640} {"train_loss": -6.479395866394043, "global_step": 110899, "epoch": 2640} {"train_loss": -6.4157257080078125, "global_step": 110900, "epoch": 2640} {"train_loss": -6.448060035705566, "global_step": 110901, "epoch": 2640} {"train_loss": -6.415444850921631, "global_step": 110902, "epoch": 2640} {"train_loss": -6.498161315917969, "global_step": 110903, "epoch": 2640} {"train_loss": -6.514973163604736, "global_step": 110904, "epoch": 2640} {"train_loss": -6.403870105743408, "global_step": 110905, "epoch": 2640} {"train_loss": -6.458393573760986, "global_step": 110906, "epoch": 2640} {"train_loss": -6.44110107421875, "global_step": 110907, "epoch": 2640} {"train_loss": -6.569369316101074, "global_step": 110908, "epoch": 2640} {"train_loss": -6.455846309661865, "global_step": 110909, "epoch": 2640} {"train_loss": -6.41373348236084, "global_step": 110910, "epoch": 2640} {"train_loss": -6.482805252075195, "global_step": 110911, "epoch": 2640} {"train_loss": -6.3825531005859375, "global_step": 110912, "epoch": 2640} {"train_loss": -6.453349590301514, "global_step": 110913, "epoch": 2640} {"train_loss": -6.58287239074707, "global_step": 110914, "epoch": 2640} {"train_loss": -6.451692581176758, "global_step": 110915, "epoch": 2640} {"train_loss": -6.39410400390625, "global_step": 110916, "epoch": 2640} {"train_loss": -6.445484161376953, "global_step": 110917, "epoch": 2640} {"train_loss": -6.643057346343994, "global_step": 110918, "epoch": 2640} {"train_loss": -6.470182418823242, "global_step": 110919, "epoch": 2640} {"train_loss": -6.553203582763672, "global_step": 110920, "epoch": 2640} {"train_loss": -6.448911031087239, "global_step": 110921, "epoch": 2640, "val_loss": 76021.0390625} {"train_loss": -6.476863861083984, "global_step": 110922, "epoch": 2641} {"train_loss": -6.622995376586914, "global_step": 110923, "epoch": 2641} {"train_loss": -6.439375877380371, "global_step": 110924, "epoch": 2641} {"train_loss": -6.374478340148926, "global_step": 110925, "epoch": 2641} {"train_loss": -6.457751274108887, "global_step": 110926, "epoch": 2641} {"train_loss": -6.56583833694458, "global_step": 110927, "epoch": 2641} {"train_loss": -6.390183448791504, "global_step": 110928, "epoch": 2641} {"train_loss": -6.473089694976807, "global_step": 110929, "epoch": 2641} {"train_loss": -6.5420732498168945, "global_step": 110930, "epoch": 2641} {"train_loss": -6.438155651092529, "global_step": 110931, "epoch": 2641} {"train_loss": -6.417806625366211, "global_step": 110932, "epoch": 2641} {"train_loss": -6.44049072265625, "global_step": 110933, "epoch": 2641} {"train_loss": -6.468732833862305, "global_step": 110934, "epoch": 2641} {"train_loss": -6.55504035949707, "global_step": 110935, "epoch": 2641} {"train_loss": -6.421899795532227, "global_step": 110936, "epoch": 2641} {"train_loss": -6.381619453430176, "global_step": 110937, "epoch": 2641} {"train_loss": -6.588350296020508, "global_step": 110938, "epoch": 2641} {"train_loss": -6.47384786605835, "global_step": 110939, "epoch": 2641} {"train_loss": -6.404080390930176, "global_step": 110940, "epoch": 2641} {"train_loss": -6.4264936447143555, "global_step": 110941, "epoch": 2641} {"train_loss": -6.460619926452637, "global_step": 110942, "epoch": 2641} {"train_loss": -6.518095016479492, "global_step": 110943, "epoch": 2641} {"train_loss": -6.370701789855957, "global_step": 110944, "epoch": 2641} {"train_loss": -6.529274940490723, "global_step": 110945, "epoch": 2641} {"train_loss": -6.616717338562012, "global_step": 110946, "epoch": 2641} {"train_loss": -6.466513156890869, "global_step": 110947, "epoch": 2641} {"train_loss": -6.469396591186523, "global_step": 110948, "epoch": 2641} {"train_loss": -6.583909034729004, "global_step": 110949, "epoch": 2641} {"train_loss": -6.380541801452637, "global_step": 110950, "epoch": 2641} {"train_loss": -6.457406997680664, "global_step": 110951, "epoch": 2641} {"train_loss": -6.495689392089844, "global_step": 110952, "epoch": 2641} {"train_loss": -6.455651760101318, "global_step": 110953, "epoch": 2641} {"train_loss": -6.4527106285095215, "global_step": 110954, "epoch": 2641} {"train_loss": -6.464505195617676, "global_step": 110955, "epoch": 2641} {"train_loss": -6.527740478515625, "global_step": 110956, "epoch": 2641} {"train_loss": -6.593045234680176, "global_step": 110957, "epoch": 2641} {"train_loss": -6.48075008392334, "global_step": 110958, "epoch": 2641} {"train_loss": -6.438379287719727, "global_step": 110959, "epoch": 2641} {"train_loss": -6.426640510559082, "global_step": 110960, "epoch": 2641} {"train_loss": -6.533397197723389, "global_step": 110961, "epoch": 2641} {"train_loss": -6.377568244934082, "global_step": 110962, "epoch": 2641} {"train_loss": -6.476636568705241, "global_step": 110963, "epoch": 2641, "val_loss": 76462.578125} {"train_loss": -6.553307056427002, "global_step": 110964, "epoch": 2642} {"train_loss": -6.433421611785889, "global_step": 110965, "epoch": 2642} {"train_loss": -6.541887283325195, "global_step": 110966, "epoch": 2642} {"train_loss": -6.548285484313965, "global_step": 110967, "epoch": 2642} {"train_loss": -6.456323146820068, "global_step": 110968, "epoch": 2642} {"train_loss": -6.480257987976074, "global_step": 110969, "epoch": 2642} {"train_loss": -6.500466346740723, "global_step": 110970, "epoch": 2642} {"train_loss": -6.419275283813477, "global_step": 110971, "epoch": 2642} {"train_loss": -6.543856620788574, "global_step": 110972, "epoch": 2642} {"train_loss": -6.508959770202637, "global_step": 110973, "epoch": 2642} {"train_loss": -6.517949104309082, "global_step": 110974, "epoch": 2642} {"train_loss": -6.395529270172119, "global_step": 110975, "epoch": 2642} {"train_loss": -6.469026565551758, "global_step": 110976, "epoch": 2642} {"train_loss": -6.44113826751709, "global_step": 110977, "epoch": 2642} {"train_loss": -6.525209426879883, "global_step": 110978, "epoch": 2642} {"train_loss": -6.501990795135498, "global_step": 110979, "epoch": 2642} {"train_loss": -6.726141929626465, "global_step": 110980, "epoch": 2642} {"train_loss": -6.587881565093994, "global_step": 110981, "epoch": 2642} {"train_loss": -6.424930572509766, "global_step": 110982, "epoch": 2642} {"train_loss": -6.52484655380249, "global_step": 110983, "epoch": 2642} {"train_loss": -6.5850510597229, "global_step": 110984, "epoch": 2642} {"train_loss": -6.559568405151367, "global_step": 110985, "epoch": 2642} {"train_loss": -6.577492713928223, "global_step": 110986, "epoch": 2642} {"train_loss": -6.53317403793335, "global_step": 110987, "epoch": 2642} {"train_loss": -6.523133754730225, "global_step": 110988, "epoch": 2642} {"train_loss": -6.439277648925781, "global_step": 110989, "epoch": 2642} {"train_loss": -6.482217788696289, "global_step": 110990, "epoch": 2642} {"train_loss": -6.439402103424072, "global_step": 110991, "epoch": 2642} {"train_loss": -6.330066680908203, "global_step": 110992, "epoch": 2642} {"train_loss": -6.354450702667236, "global_step": 110993, "epoch": 2642} {"train_loss": -6.423894882202148, "global_step": 110994, "epoch": 2642} {"train_loss": -6.372127532958984, "global_step": 110995, "epoch": 2642} {"train_loss": -6.456857204437256, "global_step": 110996, "epoch": 2642} {"train_loss": -6.561888694763184, "global_step": 110997, "epoch": 2642} {"train_loss": -6.467545032501221, "global_step": 110998, "epoch": 2642} {"train_loss": -6.499624252319336, "global_step": 110999, "epoch": 2642} {"train_loss": -6.545690059661865, "global_step": 111000, "epoch": 2642} {"train_loss": -6.303966045379639, "global_step": 111001, "epoch": 2642} {"train_loss": -6.449060440063477, "global_step": 111002, "epoch": 2642} {"train_loss": -6.46889591217041, "global_step": 111003, "epoch": 2642} {"train_loss": -6.390424728393555, "global_step": 111004, "epoch": 2642} {"train_loss": -6.483567737397694, "global_step": 111005, "epoch": 2642, "val_loss": 76773.234375} {"train_loss": -6.317670822143555, "global_step": 111006, "epoch": 2643} {"train_loss": -6.27949333190918, "global_step": 111007, "epoch": 2643} {"train_loss": -6.462051868438721, "global_step": 111008, "epoch": 2643} {"train_loss": -6.4156084060668945, "global_step": 111009, "epoch": 2643} {"train_loss": -6.387592315673828, "global_step": 111010, "epoch": 2643} {"train_loss": -6.4331464767456055, "global_step": 111011, "epoch": 2643} {"train_loss": -6.4896440505981445, "global_step": 111012, "epoch": 2643} {"train_loss": -6.344195365905762, "global_step": 111013, "epoch": 2643} {"train_loss": -6.459510803222656, "global_step": 111014, "epoch": 2643} {"train_loss": -6.542525768280029, "global_step": 111015, "epoch": 2643} {"train_loss": -6.433060169219971, "global_step": 111016, "epoch": 2643} {"train_loss": -6.457552909851074, "global_step": 111017, "epoch": 2643} {"train_loss": -6.429797649383545, "global_step": 111018, "epoch": 2643} {"train_loss": -6.571715354919434, "global_step": 111019, "epoch": 2643} {"train_loss": -6.5222978591918945, "global_step": 111020, "epoch": 2643} {"train_loss": -6.338203430175781, "global_step": 111021, "epoch": 2643} {"train_loss": -6.5153045654296875, "global_step": 111022, "epoch": 2643} {"train_loss": -6.463128089904785, "global_step": 111023, "epoch": 2643} {"train_loss": -6.521298885345459, "global_step": 111024, "epoch": 2643} {"train_loss": -6.469455718994141, "global_step": 111025, "epoch": 2643} {"train_loss": -6.440321922302246, "global_step": 111026, "epoch": 2643} {"train_loss": -6.46458101272583, "global_step": 111027, "epoch": 2643} {"train_loss": -6.585391044616699, "global_step": 111028, "epoch": 2643} {"train_loss": -6.5003743171691895, "global_step": 111029, "epoch": 2643} {"train_loss": -6.473076820373535, "global_step": 111030, "epoch": 2643} {"train_loss": -6.462946891784668, "global_step": 111031, "epoch": 2643} {"train_loss": -6.446165084838867, "global_step": 111032, "epoch": 2643} {"train_loss": -6.533956527709961, "global_step": 111033, "epoch": 2643} {"train_loss": -6.456138610839844, "global_step": 111034, "epoch": 2643} {"train_loss": -6.534887313842773, "global_step": 111035, "epoch": 2643} {"train_loss": -6.433101177215576, "global_step": 111036, "epoch": 2643} {"train_loss": -6.590008735656738, "global_step": 111037, "epoch": 2643} {"train_loss": -6.574211597442627, "global_step": 111038, "epoch": 2643} {"train_loss": -6.333045959472656, "global_step": 111039, "epoch": 2643} {"train_loss": -6.508050441741943, "global_step": 111040, "epoch": 2643} {"train_loss": -6.503373622894287, "global_step": 111041, "epoch": 2643} {"train_loss": -6.399127006530762, "global_step": 111042, "epoch": 2643} {"train_loss": -6.484455585479736, "global_step": 111043, "epoch": 2643} {"train_loss": -6.437359809875488, "global_step": 111044, "epoch": 2643} {"train_loss": -6.467931270599365, "global_step": 111045, "epoch": 2643} {"train_loss": -6.607640743255615, "global_step": 111046, "epoch": 2643} {"train_loss": -6.468239205224173, "global_step": 111047, "epoch": 2643, "val_loss": 76392.390625} {"train_loss": -6.451776027679443, "global_step": 111048, "epoch": 2644} {"train_loss": -6.4686713218688965, "global_step": 111049, "epoch": 2644} {"train_loss": -6.438403129577637, "global_step": 111050, "epoch": 2644} {"train_loss": -6.39559268951416, "global_step": 111051, "epoch": 2644} {"train_loss": -6.442317485809326, "global_step": 111052, "epoch": 2644} {"train_loss": -6.528931617736816, "global_step": 111053, "epoch": 2644} {"train_loss": -6.3491973876953125, "global_step": 111054, "epoch": 2644} {"train_loss": -6.425293922424316, "global_step": 111055, "epoch": 2644} {"train_loss": -6.428049087524414, "global_step": 111056, "epoch": 2644} {"train_loss": -6.452516555786133, "global_step": 111057, "epoch": 2644} {"train_loss": -6.593840599060059, "global_step": 111058, "epoch": 2644} {"train_loss": -6.449126243591309, "global_step": 111059, "epoch": 2644} {"train_loss": -6.539877891540527, "global_step": 111060, "epoch": 2644} {"train_loss": -6.479287624359131, "global_step": 111061, "epoch": 2644} {"train_loss": -6.567156791687012, "global_step": 111062, "epoch": 2644} {"train_loss": -6.581110000610352, "global_step": 111063, "epoch": 2644} {"train_loss": -6.461676597595215, "global_step": 111064, "epoch": 2644} {"train_loss": -6.625494003295898, "global_step": 111065, "epoch": 2644} {"train_loss": -6.507389068603516, "global_step": 111066, "epoch": 2644} {"train_loss": -6.449700832366943, "global_step": 111067, "epoch": 2644} {"train_loss": -6.57109260559082, "global_step": 111068, "epoch": 2644} {"train_loss": -6.5770978927612305, "global_step": 111069, "epoch": 2644} {"train_loss": -6.511818885803223, "global_step": 111070, "epoch": 2644} {"train_loss": -6.609867095947266, "global_step": 111071, "epoch": 2644} {"train_loss": -6.552256107330322, "global_step": 111072, "epoch": 2644} {"train_loss": -6.463871479034424, "global_step": 111073, "epoch": 2644} {"train_loss": -6.566115379333496, "global_step": 111074, "epoch": 2644} {"train_loss": -6.513242721557617, "global_step": 111075, "epoch": 2644} {"train_loss": -6.48313045501709, "global_step": 111076, "epoch": 2644} {"train_loss": -6.596259117126465, "global_step": 111077, "epoch": 2644} {"train_loss": -6.527528762817383, "global_step": 111078, "epoch": 2644} {"train_loss": -6.532499313354492, "global_step": 111079, "epoch": 2644} {"train_loss": -6.442852020263672, "global_step": 111080, "epoch": 2644} {"train_loss": -6.489659786224365, "global_step": 111081, "epoch": 2644} {"train_loss": -6.493165016174316, "global_step": 111082, "epoch": 2644} {"train_loss": -6.406271934509277, "global_step": 111083, "epoch": 2644} {"train_loss": -6.4618449211120605, "global_step": 111084, "epoch": 2644} {"train_loss": -6.502920150756836, "global_step": 111085, "epoch": 2644} {"train_loss": -6.55783224105835, "global_step": 111086, "epoch": 2644} {"train_loss": -6.561678409576416, "global_step": 111087, "epoch": 2644} {"train_loss": -6.465843677520752, "global_step": 111088, "epoch": 2644} {"train_loss": -6.5003150417691185, "global_step": 111089, "epoch": 2644, "val_loss": 76474.5390625} {"train_loss": -6.449337959289551, "global_step": 111090, "epoch": 2645} {"train_loss": -6.45121431350708, "global_step": 111091, "epoch": 2645} {"train_loss": -6.44520902633667, "global_step": 111092, "epoch": 2645} {"train_loss": -6.454592704772949, "global_step": 111093, "epoch": 2645} {"train_loss": -6.455288410186768, "global_step": 111094, "epoch": 2645} {"train_loss": -6.452692985534668, "global_step": 111095, "epoch": 2645} {"train_loss": -6.537494659423828, "global_step": 111096, "epoch": 2645} {"train_loss": -6.437344551086426, "global_step": 111097, "epoch": 2645} {"train_loss": -6.334654808044434, "global_step": 111098, "epoch": 2645} {"train_loss": -6.485409736633301, "global_step": 111099, "epoch": 2645} {"train_loss": -6.453136444091797, "global_step": 111100, "epoch": 2645} {"train_loss": -6.510885238647461, "global_step": 111101, "epoch": 2645} {"train_loss": -6.4109601974487305, "global_step": 111102, "epoch": 2645} {"train_loss": -6.382883071899414, "global_step": 111103, "epoch": 2645} {"train_loss": -6.561084747314453, "global_step": 111104, "epoch": 2645} {"train_loss": -6.5778093338012695, "global_step": 111105, "epoch": 2645} {"train_loss": -6.367914199829102, "global_step": 111106, "epoch": 2645} {"train_loss": -6.449155807495117, "global_step": 111107, "epoch": 2645} {"train_loss": -6.388899803161621, "global_step": 111108, "epoch": 2645} {"train_loss": -6.52325439453125, "global_step": 111109, "epoch": 2645} {"train_loss": -6.4193315505981445, "global_step": 111110, "epoch": 2645} {"train_loss": -6.421018600463867, "global_step": 111111, "epoch": 2645} {"train_loss": -6.647889137268066, "global_step": 111112, "epoch": 2645} {"train_loss": -6.43684720993042, "global_step": 111113, "epoch": 2645} {"train_loss": -6.423189163208008, "global_step": 111114, "epoch": 2645} {"train_loss": -6.431197166442871, "global_step": 111115, "epoch": 2645} {"train_loss": -6.46762752532959, "global_step": 111116, "epoch": 2645} {"train_loss": -6.408869743347168, "global_step": 111117, "epoch": 2645} {"train_loss": -6.259065628051758, "global_step": 111118, "epoch": 2645} {"train_loss": -6.47615385055542, "global_step": 111119, "epoch": 2645} {"train_loss": -6.415627956390381, "global_step": 111120, "epoch": 2645} {"train_loss": -6.348290920257568, "global_step": 111121, "epoch": 2645} {"train_loss": -6.385961532592773, "global_step": 111122, "epoch": 2645} {"train_loss": -6.442892074584961, "global_step": 111123, "epoch": 2645} {"train_loss": -6.511465072631836, "global_step": 111124, "epoch": 2645} {"train_loss": -6.408523082733154, "global_step": 111125, "epoch": 2645} {"train_loss": -6.573625564575195, "global_step": 111126, "epoch": 2645} {"train_loss": -6.423462867736816, "global_step": 111127, "epoch": 2645} {"train_loss": -6.503230094909668, "global_step": 111128, "epoch": 2645} {"train_loss": -6.431678771972656, "global_step": 111129, "epoch": 2645} {"train_loss": -6.455120086669922, "global_step": 111130, "epoch": 2645} {"train_loss": -6.44872800509135, "global_step": 111131, "epoch": 2645, "val_loss": 76415.59375} {"train_loss": -6.442907810211182, "global_step": 111132, "epoch": 2646} {"train_loss": -6.439302444458008, "global_step": 111133, "epoch": 2646} {"train_loss": -6.459954738616943, "global_step": 111134, "epoch": 2646} {"train_loss": -6.456331729888916, "global_step": 111135, "epoch": 2646} {"train_loss": -6.414737224578857, "global_step": 111136, "epoch": 2646} {"train_loss": -6.541937828063965, "global_step": 111137, "epoch": 2646} {"train_loss": -6.514625072479248, "global_step": 111138, "epoch": 2646} {"train_loss": -6.3935747146606445, "global_step": 111139, "epoch": 2646} {"train_loss": -6.4467668533325195, "global_step": 111140, "epoch": 2646} {"train_loss": -6.4252753257751465, "global_step": 111141, "epoch": 2646} {"train_loss": -6.406238555908203, "global_step": 111142, "epoch": 2646} {"train_loss": -6.3988847732543945, "global_step": 111143, "epoch": 2646} {"train_loss": -6.4607954025268555, "global_step": 111144, "epoch": 2646} {"train_loss": -6.45950984954834, "global_step": 111145, "epoch": 2646} {"train_loss": -6.374384880065918, "global_step": 111146, "epoch": 2646} {"train_loss": -6.403055191040039, "global_step": 111147, "epoch": 2646} {"train_loss": -6.5121941566467285, "global_step": 111148, "epoch": 2646} {"train_loss": -6.340080261230469, "global_step": 111149, "epoch": 2646} {"train_loss": -6.487879753112793, "global_step": 111150, "epoch": 2646} {"train_loss": -6.464766025543213, "global_step": 111151, "epoch": 2646} {"train_loss": -6.500899791717529, "global_step": 111152, "epoch": 2646} {"train_loss": -6.593958854675293, "global_step": 111153, "epoch": 2646} {"train_loss": -6.497218608856201, "global_step": 111154, "epoch": 2646} {"train_loss": -6.524529457092285, "global_step": 111155, "epoch": 2646} {"train_loss": -6.537136554718018, "global_step": 111156, "epoch": 2646} {"train_loss": -6.587156295776367, "global_step": 111157, "epoch": 2646} {"train_loss": -6.50783634185791, "global_step": 111158, "epoch": 2646} {"train_loss": -6.475993633270264, "global_step": 111159, "epoch": 2646} {"train_loss": -6.471047878265381, "global_step": 111160, "epoch": 2646} {"train_loss": -6.499439239501953, "global_step": 111161, "epoch": 2646} {"train_loss": -6.45526123046875, "global_step": 111162, "epoch": 2646} {"train_loss": -6.491097450256348, "global_step": 111163, "epoch": 2646} {"train_loss": -6.4434709548950195, "global_step": 111164, "epoch": 2646} {"train_loss": -6.472858905792236, "global_step": 111165, "epoch": 2646} {"train_loss": -6.465304374694824, "global_step": 111166, "epoch": 2646} {"train_loss": -6.55046272277832, "global_step": 111167, "epoch": 2646} {"train_loss": -6.389702796936035, "global_step": 111168, "epoch": 2646} {"train_loss": -6.565670013427734, "global_step": 111169, "epoch": 2646} {"train_loss": -6.454524993896484, "global_step": 111170, "epoch": 2646} {"train_loss": -6.511241436004639, "global_step": 111171, "epoch": 2646} {"train_loss": -6.390515327453613, "global_step": 111172, "epoch": 2646} {"train_loss": -6.4725209304264615, "global_step": 111173, "epoch": 2646, "val_loss": 76387.2265625} {"train_loss": -6.559732437133789, "global_step": 111174, "epoch": 2647} {"train_loss": -6.494711875915527, "global_step": 111175, "epoch": 2647} {"train_loss": -6.534635543823242, "global_step": 111176, "epoch": 2647} {"train_loss": -6.453732013702393, "global_step": 111177, "epoch": 2647} {"train_loss": -6.398743629455566, "global_step": 111178, "epoch": 2647} {"train_loss": -6.531350612640381, "global_step": 111179, "epoch": 2647} {"train_loss": -6.531231880187988, "global_step": 111180, "epoch": 2647} {"train_loss": -6.4470744132995605, "global_step": 111181, "epoch": 2647} {"train_loss": -6.488947868347168, "global_step": 111182, "epoch": 2647} {"train_loss": -6.525395393371582, "global_step": 111183, "epoch": 2647} {"train_loss": -6.497554302215576, "global_step": 111184, "epoch": 2647} {"train_loss": -6.344335079193115, "global_step": 111185, "epoch": 2647} {"train_loss": -6.603589057922363, "global_step": 111186, "epoch": 2647} {"train_loss": -6.3561859130859375, "global_step": 111187, "epoch": 2647} {"train_loss": -6.524166107177734, "global_step": 111188, "epoch": 2647} {"train_loss": -6.450380802154541, "global_step": 111189, "epoch": 2647} {"train_loss": -6.5317583084106445, "global_step": 111190, "epoch": 2647} {"train_loss": -6.520513534545898, "global_step": 111191, "epoch": 2647} {"train_loss": -6.381760597229004, "global_step": 111192, "epoch": 2647} {"train_loss": -6.470690727233887, "global_step": 111193, "epoch": 2647} {"train_loss": -6.5403361320495605, "global_step": 111194, "epoch": 2647} {"train_loss": -6.303863048553467, "global_step": 111195, "epoch": 2647} {"train_loss": -6.5165510177612305, "global_step": 111196, "epoch": 2647} {"train_loss": -6.547693729400635, "global_step": 111197, "epoch": 2647} {"train_loss": -6.428895473480225, "global_step": 111198, "epoch": 2647} {"train_loss": -6.545947551727295, "global_step": 111199, "epoch": 2647} {"train_loss": -6.353678226470947, "global_step": 111200, "epoch": 2647} {"train_loss": -6.399561882019043, "global_step": 111201, "epoch": 2647} {"train_loss": -6.418203353881836, "global_step": 111202, "epoch": 2647} {"train_loss": -6.51446533203125, "global_step": 111203, "epoch": 2647} {"train_loss": -6.465441703796387, "global_step": 111204, "epoch": 2647} {"train_loss": -6.412829399108887, "global_step": 111205, "epoch": 2647} {"train_loss": -6.5155110359191895, "global_step": 111206, "epoch": 2647} {"train_loss": -6.466427326202393, "global_step": 111207, "epoch": 2647} {"train_loss": -6.423572540283203, "global_step": 111208, "epoch": 2647} {"train_loss": -6.392910957336426, "global_step": 111209, "epoch": 2647} {"train_loss": -6.497875213623047, "global_step": 111210, "epoch": 2647} {"train_loss": -6.522479057312012, "global_step": 111211, "epoch": 2647} {"train_loss": -6.4102559089660645, "global_step": 111212, "epoch": 2647} {"train_loss": -6.449692726135254, "global_step": 111213, "epoch": 2647} {"train_loss": -6.423996925354004, "global_step": 111214, "epoch": 2647} {"train_loss": -6.46643530754816, "global_step": 111215, "epoch": 2647, "val_loss": 76742.609375} {"train_loss": -6.533132553100586, "global_step": 111216, "epoch": 2648} {"train_loss": -6.2964324951171875, "global_step": 111217, "epoch": 2648} {"train_loss": -6.4366912841796875, "global_step": 111218, "epoch": 2648} {"train_loss": -6.423555374145508, "global_step": 111219, "epoch": 2648} {"train_loss": -6.474520206451416, "global_step": 111220, "epoch": 2648} {"train_loss": -6.457651138305664, "global_step": 111221, "epoch": 2648} {"train_loss": -6.449331283569336, "global_step": 111222, "epoch": 2648} {"train_loss": -6.470738410949707, "global_step": 111223, "epoch": 2648} {"train_loss": -6.342719078063965, "global_step": 111224, "epoch": 2648} {"train_loss": -6.2941203117370605, "global_step": 111225, "epoch": 2648} {"train_loss": -6.51821231842041, "global_step": 111226, "epoch": 2648} {"train_loss": -6.433207035064697, "global_step": 111227, "epoch": 2648} {"train_loss": -6.501690864562988, "global_step": 111228, "epoch": 2648} {"train_loss": -6.395307540893555, "global_step": 111229, "epoch": 2648} {"train_loss": -6.422863006591797, "global_step": 111230, "epoch": 2648} {"train_loss": -6.370512962341309, "global_step": 111231, "epoch": 2648} {"train_loss": -6.485783576965332, "global_step": 111232, "epoch": 2648} {"train_loss": -6.471857070922852, "global_step": 111233, "epoch": 2648} {"train_loss": -6.435551643371582, "global_step": 111234, "epoch": 2648} {"train_loss": -6.580405235290527, "global_step": 111235, "epoch": 2648} {"train_loss": -6.480563163757324, "global_step": 111236, "epoch": 2648} {"train_loss": -6.399899482727051, "global_step": 111237, "epoch": 2648} {"train_loss": -6.356935977935791, "global_step": 111238, "epoch": 2648} {"train_loss": -6.533132553100586, "global_step": 111239, "epoch": 2648} {"train_loss": -6.300359725952148, "global_step": 111240, "epoch": 2648} {"train_loss": -6.526827812194824, "global_step": 111241, "epoch": 2648} {"train_loss": -6.528983116149902, "global_step": 111242, "epoch": 2648} {"train_loss": -6.435052394866943, "global_step": 111243, "epoch": 2648} {"train_loss": -6.568790435791016, "global_step": 111244, "epoch": 2648} {"train_loss": -6.49691915512085, "global_step": 111245, "epoch": 2648} {"train_loss": -6.518881797790527, "global_step": 111246, "epoch": 2648} {"train_loss": -6.473265171051025, "global_step": 111247, "epoch": 2648} {"train_loss": -6.521613597869873, "global_step": 111248, "epoch": 2648} {"train_loss": -6.464558124542236, "global_step": 111249, "epoch": 2648} {"train_loss": -6.424105644226074, "global_step": 111250, "epoch": 2648} {"train_loss": -6.495279312133789, "global_step": 111251, "epoch": 2648} {"train_loss": -6.583498954772949, "global_step": 111252, "epoch": 2648} {"train_loss": -6.444073677062988, "global_step": 111253, "epoch": 2648} {"train_loss": -6.5364990234375, "global_step": 111254, "epoch": 2648} {"train_loss": -6.476305961608887, "global_step": 111255, "epoch": 2648} {"train_loss": -6.412232398986816, "global_step": 111256, "epoch": 2648} {"train_loss": -6.456780093056815, "global_step": 111257, "epoch": 2648, "val_loss": 76410.2421875} {"train_loss": -6.366583347320557, "global_step": 111258, "epoch": 2649} {"train_loss": -6.354159832000732, "global_step": 111259, "epoch": 2649} {"train_loss": -6.357097625732422, "global_step": 111260, "epoch": 2649} {"train_loss": -6.421100616455078, "global_step": 111261, "epoch": 2649} {"train_loss": -6.292803764343262, "global_step": 111262, "epoch": 2649} {"train_loss": -6.420526504516602, "global_step": 111263, "epoch": 2649} {"train_loss": -6.448005199432373, "global_step": 111264, "epoch": 2649} {"train_loss": -6.428915977478027, "global_step": 111265, "epoch": 2649} {"train_loss": -6.462065696716309, "global_step": 111266, "epoch": 2649} {"train_loss": -6.47552490234375, "global_step": 111267, "epoch": 2649} {"train_loss": -6.444475173950195, "global_step": 111268, "epoch": 2649} {"train_loss": -6.4222235679626465, "global_step": 111269, "epoch": 2649} {"train_loss": -6.490091323852539, "global_step": 111270, "epoch": 2649} {"train_loss": -6.336575508117676, "global_step": 111271, "epoch": 2649} {"train_loss": -6.408194065093994, "global_step": 111272, "epoch": 2649} {"train_loss": -6.414345741271973, "global_step": 111273, "epoch": 2649} {"train_loss": -6.556048393249512, "global_step": 111274, "epoch": 2649} {"train_loss": -6.590272903442383, "global_step": 111275, "epoch": 2649} {"train_loss": -6.46813440322876, "global_step": 111276, "epoch": 2649} {"train_loss": -6.4931640625, "global_step": 111277, "epoch": 2649} {"train_loss": -6.464677810668945, "global_step": 111278, "epoch": 2649} {"train_loss": -6.581830978393555, "global_step": 111279, "epoch": 2649} {"train_loss": -6.410904884338379, "global_step": 111280, "epoch": 2649} {"train_loss": -6.4681854248046875, "global_step": 111281, "epoch": 2649} {"train_loss": -6.463154315948486, "global_step": 111282, "epoch": 2649} {"train_loss": -6.481348991394043, "global_step": 111283, "epoch": 2649} {"train_loss": -6.6066789627075195, "global_step": 111284, "epoch": 2649} {"train_loss": -6.456615447998047, "global_step": 111285, "epoch": 2649} {"train_loss": -6.393545150756836, "global_step": 111286, "epoch": 2649} {"train_loss": -6.568946838378906, "global_step": 111287, "epoch": 2649} {"train_loss": -6.60319709777832, "global_step": 111288, "epoch": 2649} {"train_loss": -6.566339015960693, "global_step": 111289, "epoch": 2649} {"train_loss": -6.604043483734131, "global_step": 111290, "epoch": 2649} {"train_loss": -6.499270915985107, "global_step": 111291, "epoch": 2649} {"train_loss": -6.511895179748535, "global_step": 111292, "epoch": 2649} {"train_loss": -6.551959037780762, "global_step": 111293, "epoch": 2649} {"train_loss": -6.523670196533203, "global_step": 111294, "epoch": 2649} {"train_loss": -6.485748291015625, "global_step": 111295, "epoch": 2649} {"train_loss": -6.482770919799805, "global_step": 111296, "epoch": 2649} {"train_loss": -6.398872375488281, "global_step": 111297, "epoch": 2649} {"train_loss": -6.501971244812012, "global_step": 111298, "epoch": 2649} {"train_loss": -6.468046154294695, "global_step": 111299, "epoch": 2649, "val_loss": 76116.9765625} {"train_loss": -6.463078498840332, "global_step": 111300, "epoch": 2650} {"train_loss": -6.450961112976074, "global_step": 111301, "epoch": 2650} {"train_loss": -6.278820991516113, "global_step": 111302, "epoch": 2650} {"train_loss": -6.45542049407959, "global_step": 111303, "epoch": 2650} {"train_loss": -6.453247547149658, "global_step": 111304, "epoch": 2650} {"train_loss": -6.459829330444336, "global_step": 111305, "epoch": 2650} {"train_loss": -6.405271530151367, "global_step": 111306, "epoch": 2650} {"train_loss": -6.319136619567871, "global_step": 111307, "epoch": 2650} {"train_loss": -6.466340065002441, "global_step": 111308, "epoch": 2650} {"train_loss": -6.525153160095215, "global_step": 111309, "epoch": 2650} {"train_loss": -6.491386890411377, "global_step": 111310, "epoch": 2650} {"train_loss": -6.4331512451171875, "global_step": 111311, "epoch": 2650} {"train_loss": -6.69083309173584, "global_step": 111312, "epoch": 2650} {"train_loss": -6.465872764587402, "global_step": 111313, "epoch": 2650} {"train_loss": -6.482665061950684, "global_step": 111314, "epoch": 2650} {"train_loss": -6.539658546447754, "global_step": 111315, "epoch": 2650} {"train_loss": -6.441499710083008, "global_step": 111316, "epoch": 2650} {"train_loss": -6.427989482879639, "global_step": 111317, "epoch": 2650} {"train_loss": -6.35798454284668, "global_step": 111318, "epoch": 2650} {"train_loss": -6.361701965332031, "global_step": 111319, "epoch": 2650} {"train_loss": -6.422563076019287, "global_step": 111320, "epoch": 2650} {"train_loss": -6.519144058227539, "global_step": 111321, "epoch": 2650} {"train_loss": -6.382993698120117, "global_step": 111322, "epoch": 2650} {"train_loss": -6.545604705810547, "global_step": 111323, "epoch": 2650} {"train_loss": -6.453725814819336, "global_step": 111324, "epoch": 2650} {"train_loss": -6.456348896026611, "global_step": 111325, "epoch": 2650} {"train_loss": -6.507617473602295, "global_step": 111326, "epoch": 2650} {"train_loss": -6.5179057121276855, "global_step": 111327, "epoch": 2650} {"train_loss": -6.534557819366455, "global_step": 111328, "epoch": 2650} {"train_loss": -6.508221626281738, "global_step": 111329, "epoch": 2650} {"train_loss": -6.520490646362305, "global_step": 111330, "epoch": 2650} {"train_loss": -6.36989688873291, "global_step": 111331, "epoch": 2650} {"train_loss": -6.477025032043457, "global_step": 111332, "epoch": 2650} {"train_loss": -6.5669846534729, "global_step": 111333, "epoch": 2650} {"train_loss": -6.508060932159424, "global_step": 111334, "epoch": 2650} {"train_loss": -6.439558029174805, "global_step": 111335, "epoch": 2650} {"train_loss": -6.382477760314941, "global_step": 111336, "epoch": 2650} {"train_loss": -6.458920001983643, "global_step": 111337, "epoch": 2650} {"train_loss": -6.408819198608398, "global_step": 111338, "epoch": 2650} {"train_loss": -6.375821113586426, "global_step": 111339, "epoch": 2650} {"train_loss": -6.363044738769531, "global_step": 111340, "epoch": 2650} {"train_loss": -6.454175177074614, "global_step": 111341, "epoch": 2650, "train/sim_max_reward_0": 0.4671978993309261, "train/sim_max_reward_1": 0.9356547963021344, "train/sim_max_reward_2": 0.28469514240552424, "train/sim_max_reward_3": 0.13504889447667012, "train/sim_max_reward_4": 0.2903490499479736, "train/sim_max_reward_5": 0.8002679635927648, "test/sim_max_reward_4500000": 0.35140576014209024, "test/sim_max_reward_4500001": 0.8568442790286573, "test/sim_max_reward_4500002": 0.885237914552244, "test/sim_max_reward_4500003": 0.9041126614135622, "test/sim_max_reward_4500004": 0.1473535099646544, "test/sim_max_reward_4500005": 0.786512244703192, "test/sim_max_reward_4500006": 0.9408275745909691, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.2211564085910393, "test/sim_max_reward_4500009": 0.8492051748185734, "test/sim_max_reward_4500010": 0.004695276857650199, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 0.9150212922122131, "test/sim_max_reward_4500013": 0.006358024023050708, "test/sim_max_reward_4500014": 0.3176132386681689, "test/sim_max_reward_4500015": 0.7289217141091116, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.1992538746976683, "test/sim_max_reward_4500018": 0.8904243601504026, "test/sim_max_reward_4500019": 0.844560929892389, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9005834309916184, "test/sim_max_reward_4500022": 0.9626603729661947, "test/sim_max_reward_4500023": 0.9424925673004243, "test/sim_max_reward_4500024": 0.8043789546758779, "test/sim_max_reward_4500025": 0.3680992973972221, "test/sim_max_reward_4500026": 0.9548324765303374, "test/sim_max_reward_4500027": 0.9942362025865451, "test/sim_max_reward_4500028": 0.19225342440106574, "test/sim_max_reward_4500029": 0.04641451627333949, "test/sim_max_reward_4500030": 0.9758362149493135, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.051158440365813435, "test/sim_max_reward_4500033": 0.3274993816197386, "test/sim_max_reward_4500034": 0.8124414335806902, "test/sim_max_reward_4500035": 0.7742745016681092, "test/sim_max_reward_4500036": 0.9641029290284292, "test/sim_max_reward_4500037": 0.7614170108486505, "test/sim_max_reward_4500038": 0.3170243635141771, "test/sim_max_reward_4500039": 0.9363974811877689, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.9951244990770995, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.9791982499073877, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.3944053474118457, "test/sim_max_reward_4500046": 0.9994465438551248, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9767208337833744, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.48553562434266545, "test/mean_score": 0.5864097303782092, "val_loss": 76715.4609375} {"train_loss": -6.292880058288574, "global_step": 111342, "epoch": 2651} {"train_loss": -6.272790908813477, "global_step": 111343, "epoch": 2651} {"train_loss": -6.394129276275635, "global_step": 111344, "epoch": 2651} {"train_loss": -6.4319963455200195, "global_step": 111345, "epoch": 2651} {"train_loss": -6.268812656402588, "global_step": 111346, "epoch": 2651} {"train_loss": -6.438065052032471, "global_step": 111347, "epoch": 2651} {"train_loss": -6.327827453613281, "global_step": 111348, "epoch": 2651} {"train_loss": -6.420695781707764, "global_step": 111349, "epoch": 2651} {"train_loss": -6.358558654785156, "global_step": 111350, "epoch": 2651} {"train_loss": -6.351292610168457, "global_step": 111351, "epoch": 2651} {"train_loss": -6.403958320617676, "global_step": 111352, "epoch": 2651} {"train_loss": -6.415384292602539, "global_step": 111353, "epoch": 2651} {"train_loss": -6.333335876464844, "global_step": 111354, "epoch": 2651} {"train_loss": -6.38318395614624, "global_step": 111355, "epoch": 2651} {"train_loss": -6.366054534912109, "global_step": 111356, "epoch": 2651} {"train_loss": -6.326570510864258, "global_step": 111357, "epoch": 2651} {"train_loss": -6.538903713226318, "global_step": 111358, "epoch": 2651} {"train_loss": -6.471235275268555, "global_step": 111359, "epoch": 2651} {"train_loss": -6.435997486114502, "global_step": 111360, "epoch": 2651} {"train_loss": -6.35884952545166, "global_step": 111361, "epoch": 2651} {"train_loss": -6.452112674713135, "global_step": 111362, "epoch": 2651} {"train_loss": -6.413362503051758, "global_step": 111363, "epoch": 2651} {"train_loss": -6.454367637634277, "global_step": 111364, "epoch": 2651} {"train_loss": -6.446833610534668, "global_step": 111365, "epoch": 2651} {"train_loss": -6.383204460144043, "global_step": 111366, "epoch": 2651} {"train_loss": -6.571958541870117, "global_step": 111367, "epoch": 2651} {"train_loss": -6.585151672363281, "global_step": 111368, "epoch": 2651} {"train_loss": -6.510437965393066, "global_step": 111369, "epoch": 2651} {"train_loss": -6.403173446655273, "global_step": 111370, "epoch": 2651} {"train_loss": -6.567105293273926, "global_step": 111371, "epoch": 2651} {"train_loss": -6.460631370544434, "global_step": 111372, "epoch": 2651} {"train_loss": -6.575328826904297, "global_step": 111373, "epoch": 2651} {"train_loss": -6.490487098693848, "global_step": 111374, "epoch": 2651} {"train_loss": -6.452237129211426, "global_step": 111375, "epoch": 2651} {"train_loss": -6.530694007873535, "global_step": 111376, "epoch": 2651} {"train_loss": -6.643328666687012, "global_step": 111377, "epoch": 2651} {"train_loss": -6.371575355529785, "global_step": 111378, "epoch": 2651} {"train_loss": -6.363430500030518, "global_step": 111379, "epoch": 2651} {"train_loss": -6.398797988891602, "global_step": 111380, "epoch": 2651} {"train_loss": -6.4150590896606445, "global_step": 111381, "epoch": 2651} {"train_loss": -6.478250980377197, "global_step": 111382, "epoch": 2651} {"train_loss": -6.424836749122257, "global_step": 111383, "epoch": 2651, "val_loss": 76425.15625} {"train_loss": -6.527766704559326, "global_step": 111384, "epoch": 2652} {"train_loss": -6.318975448608398, "global_step": 111385, "epoch": 2652} {"train_loss": -6.394557952880859, "global_step": 111386, "epoch": 2652} {"train_loss": -6.419859886169434, "global_step": 111387, "epoch": 2652} {"train_loss": -6.389443397521973, "global_step": 111388, "epoch": 2652} {"train_loss": -6.497375011444092, "global_step": 111389, "epoch": 2652} {"train_loss": -6.559207916259766, "global_step": 111390, "epoch": 2652} {"train_loss": -6.45136833190918, "global_step": 111391, "epoch": 2652} {"train_loss": -6.365236759185791, "global_step": 111392, "epoch": 2652} {"train_loss": -6.47265625, "global_step": 111393, "epoch": 2652} {"train_loss": -6.564391136169434, "global_step": 111394, "epoch": 2652} {"train_loss": -6.464310169219971, "global_step": 111395, "epoch": 2652} {"train_loss": -6.585023880004883, "global_step": 111396, "epoch": 2652} {"train_loss": -6.440230369567871, "global_step": 111397, "epoch": 2652} {"train_loss": -6.512483596801758, "global_step": 111398, "epoch": 2652} {"train_loss": -6.487866401672363, "global_step": 111399, "epoch": 2652} {"train_loss": -6.488237380981445, "global_step": 111400, "epoch": 2652} {"train_loss": -6.565070152282715, "global_step": 111401, "epoch": 2652} {"train_loss": -6.456995010375977, "global_step": 111402, "epoch": 2652} {"train_loss": -6.450465202331543, "global_step": 111403, "epoch": 2652} {"train_loss": -6.477565288543701, "global_step": 111404, "epoch": 2652} {"train_loss": -6.610502243041992, "global_step": 111405, "epoch": 2652} {"train_loss": -6.5850701332092285, "global_step": 111406, "epoch": 2652} {"train_loss": -6.537134170532227, "global_step": 111407, "epoch": 2652} {"train_loss": -6.465275764465332, "global_step": 111408, "epoch": 2652} {"train_loss": -6.4105224609375, "global_step": 111409, "epoch": 2652} {"train_loss": -6.395270824432373, "global_step": 111410, "epoch": 2652} {"train_loss": -6.404592037200928, "global_step": 111411, "epoch": 2652} {"train_loss": -6.347289085388184, "global_step": 111412, "epoch": 2652} {"train_loss": -6.667738914489746, "global_step": 111413, "epoch": 2652} {"train_loss": -6.42865514755249, "global_step": 111414, "epoch": 2652} {"train_loss": -6.338750839233398, "global_step": 111415, "epoch": 2652} {"train_loss": -6.546448707580566, "global_step": 111416, "epoch": 2652} {"train_loss": -6.367147445678711, "global_step": 111417, "epoch": 2652} {"train_loss": -6.511421203613281, "global_step": 111418, "epoch": 2652} {"train_loss": -6.467387676239014, "global_step": 111419, "epoch": 2652} {"train_loss": -6.4659881591796875, "global_step": 111420, "epoch": 2652} {"train_loss": -6.5166015625, "global_step": 111421, "epoch": 2652} {"train_loss": -6.606121063232422, "global_step": 111422, "epoch": 2652} {"train_loss": -6.336995601654053, "global_step": 111423, "epoch": 2652} {"train_loss": -6.364577770233154, "global_step": 111424, "epoch": 2652} {"train_loss": -6.471535239900861, "global_step": 111425, "epoch": 2652, "val_loss": 76414.171875} {"train_loss": -6.491336822509766, "global_step": 111426, "epoch": 2653} {"train_loss": -6.427506446838379, "global_step": 111427, "epoch": 2653} {"train_loss": -6.553112506866455, "global_step": 111428, "epoch": 2653} {"train_loss": -6.392547130584717, "global_step": 111429, "epoch": 2653} {"train_loss": -6.543422222137451, "global_step": 111430, "epoch": 2653} {"train_loss": -6.426865577697754, "global_step": 111431, "epoch": 2653} {"train_loss": -6.341887474060059, "global_step": 111432, "epoch": 2653} {"train_loss": -6.433866500854492, "global_step": 111433, "epoch": 2653} {"train_loss": -6.467737197875977, "global_step": 111434, "epoch": 2653} {"train_loss": -6.550436973571777, "global_step": 111435, "epoch": 2653} {"train_loss": -6.411229610443115, "global_step": 111436, "epoch": 2653} {"train_loss": -6.565738201141357, "global_step": 111437, "epoch": 2653} {"train_loss": -6.627753257751465, "global_step": 111438, "epoch": 2653} {"train_loss": -6.432384967803955, "global_step": 111439, "epoch": 2653} {"train_loss": -6.433496475219727, "global_step": 111440, "epoch": 2653} {"train_loss": -6.50709342956543, "global_step": 111441, "epoch": 2653} {"train_loss": -6.474752426147461, "global_step": 111442, "epoch": 2653} {"train_loss": -6.508936882019043, "global_step": 111443, "epoch": 2653} {"train_loss": -6.574044227600098, "global_step": 111444, "epoch": 2653} {"train_loss": -6.469597816467285, "global_step": 111445, "epoch": 2653} {"train_loss": -6.493338108062744, "global_step": 111446, "epoch": 2653} {"train_loss": -6.506612777709961, "global_step": 111447, "epoch": 2653} {"train_loss": -6.483543872833252, "global_step": 111448, "epoch": 2653} {"train_loss": -6.609708786010742, "global_step": 111449, "epoch": 2653} {"train_loss": -6.482668399810791, "global_step": 111450, "epoch": 2653} {"train_loss": -6.393073081970215, "global_step": 111451, "epoch": 2653} {"train_loss": -6.5401153564453125, "global_step": 111452, "epoch": 2653} {"train_loss": -6.404953956604004, "global_step": 111453, "epoch": 2653} {"train_loss": -6.487834453582764, "global_step": 111454, "epoch": 2653} {"train_loss": -6.563686370849609, "global_step": 111455, "epoch": 2653} {"train_loss": -6.403896331787109, "global_step": 111456, "epoch": 2653} {"train_loss": -6.582284927368164, "global_step": 111457, "epoch": 2653} {"train_loss": -6.461731910705566, "global_step": 111458, "epoch": 2653} {"train_loss": -6.557038307189941, "global_step": 111459, "epoch": 2653} {"train_loss": -6.630981922149658, "global_step": 111460, "epoch": 2653} {"train_loss": -6.427184104919434, "global_step": 111461, "epoch": 2653} {"train_loss": -6.535449028015137, "global_step": 111462, "epoch": 2653} {"train_loss": -6.438061714172363, "global_step": 111463, "epoch": 2653} {"train_loss": -6.503596305847168, "global_step": 111464, "epoch": 2653} {"train_loss": -6.404417037963867, "global_step": 111465, "epoch": 2653} {"train_loss": -6.486642360687256, "global_step": 111466, "epoch": 2653} {"train_loss": -6.487305118924096, "global_step": 111467, "epoch": 2653, "val_loss": 76106.7734375} {"train_loss": -6.504245758056641, "global_step": 111468, "epoch": 2654} {"train_loss": -6.524664878845215, "global_step": 111469, "epoch": 2654} {"train_loss": -6.52775764465332, "global_step": 111470, "epoch": 2654} {"train_loss": -6.38242244720459, "global_step": 111471, "epoch": 2654} {"train_loss": -6.435980319976807, "global_step": 111472, "epoch": 2654} {"train_loss": -6.464447021484375, "global_step": 111473, "epoch": 2654} {"train_loss": -6.524911403656006, "global_step": 111474, "epoch": 2654} {"train_loss": -6.374089241027832, "global_step": 111475, "epoch": 2654} {"train_loss": -6.361021995544434, "global_step": 111476, "epoch": 2654} {"train_loss": -6.318549156188965, "global_step": 111477, "epoch": 2654} {"train_loss": -6.377452373504639, "global_step": 111478, "epoch": 2654} {"train_loss": -6.374956130981445, "global_step": 111479, "epoch": 2654} {"train_loss": -6.457780838012695, "global_step": 111480, "epoch": 2654} {"train_loss": -6.348570823669434, "global_step": 111481, "epoch": 2654} {"train_loss": -6.433950901031494, "global_step": 111482, "epoch": 2654} {"train_loss": -6.503929615020752, "global_step": 111483, "epoch": 2654} {"train_loss": -6.432188987731934, "global_step": 111484, "epoch": 2654} {"train_loss": -6.400732040405273, "global_step": 111485, "epoch": 2654} {"train_loss": -6.447746753692627, "global_step": 111486, "epoch": 2654} {"train_loss": -6.597105026245117, "global_step": 111487, "epoch": 2654} {"train_loss": -6.46455192565918, "global_step": 111488, "epoch": 2654} {"train_loss": -6.551078796386719, "global_step": 111489, "epoch": 2654} {"train_loss": -6.497653007507324, "global_step": 111490, "epoch": 2654} {"train_loss": -6.5430755615234375, "global_step": 111491, "epoch": 2654} {"train_loss": -6.467235088348389, "global_step": 111492, "epoch": 2654} {"train_loss": -6.45503044128418, "global_step": 111493, "epoch": 2654} {"train_loss": -6.4658026695251465, "global_step": 111494, "epoch": 2654} {"train_loss": -6.355055809020996, "global_step": 111495, "epoch": 2654} {"train_loss": -6.609793663024902, "global_step": 111496, "epoch": 2654} {"train_loss": -6.4685492515563965, "global_step": 111497, "epoch": 2654} {"train_loss": -6.493047714233398, "global_step": 111498, "epoch": 2654} {"train_loss": -6.5614166259765625, "global_step": 111499, "epoch": 2654} {"train_loss": -6.507862091064453, "global_step": 111500, "epoch": 2654} {"train_loss": -6.374699592590332, "global_step": 111501, "epoch": 2654} {"train_loss": -6.552743434906006, "global_step": 111502, "epoch": 2654} {"train_loss": -6.384197235107422, "global_step": 111503, "epoch": 2654} {"train_loss": -6.511302947998047, "global_step": 111504, "epoch": 2654} {"train_loss": -6.438865661621094, "global_step": 111505, "epoch": 2654} {"train_loss": -6.551360607147217, "global_step": 111506, "epoch": 2654} {"train_loss": -6.353904724121094, "global_step": 111507, "epoch": 2654} {"train_loss": -6.430228233337402, "global_step": 111508, "epoch": 2654} {"train_loss": -6.457381373360043, "global_step": 111509, "epoch": 2654, "val_loss": 76294.4609375} {"train_loss": -6.566091537475586, "global_step": 111510, "epoch": 2655} {"train_loss": -6.4304046630859375, "global_step": 111511, "epoch": 2655} {"train_loss": -6.400992393493652, "global_step": 111512, "epoch": 2655} {"train_loss": -6.488700866699219, "global_step": 111513, "epoch": 2655} {"train_loss": -6.429984092712402, "global_step": 111514, "epoch": 2655} {"train_loss": -6.428764343261719, "global_step": 111515, "epoch": 2655} {"train_loss": -6.519730567932129, "global_step": 111516, "epoch": 2655} {"train_loss": -6.506102561950684, "global_step": 111517, "epoch": 2655} {"train_loss": -6.528445243835449, "global_step": 111518, "epoch": 2655} {"train_loss": -6.616606712341309, "global_step": 111519, "epoch": 2655} {"train_loss": -6.393156051635742, "global_step": 111520, "epoch": 2655} {"train_loss": -6.502050876617432, "global_step": 111521, "epoch": 2655} {"train_loss": -6.552443504333496, "global_step": 111522, "epoch": 2655} {"train_loss": -6.527153968811035, "global_step": 111523, "epoch": 2655} {"train_loss": -6.520705223083496, "global_step": 111524, "epoch": 2655} {"train_loss": -6.597234725952148, "global_step": 111525, "epoch": 2655} {"train_loss": -6.579587936401367, "global_step": 111526, "epoch": 2655} {"train_loss": -6.499190330505371, "global_step": 111527, "epoch": 2655} {"train_loss": -6.4958295822143555, "global_step": 111528, "epoch": 2655} {"train_loss": -6.558742523193359, "global_step": 111529, "epoch": 2655} {"train_loss": -6.383975982666016, "global_step": 111530, "epoch": 2655} {"train_loss": -6.33070182800293, "global_step": 111531, "epoch": 2655} {"train_loss": -6.61767578125, "global_step": 111532, "epoch": 2655} {"train_loss": -6.440938472747803, "global_step": 111533, "epoch": 2655} {"train_loss": -6.37273645401001, "global_step": 111534, "epoch": 2655} {"train_loss": -6.492400169372559, "global_step": 111535, "epoch": 2655} {"train_loss": -6.484521865844727, "global_step": 111536, "epoch": 2655} {"train_loss": -6.455223083496094, "global_step": 111537, "epoch": 2655} {"train_loss": -6.5279693603515625, "global_step": 111538, "epoch": 2655} {"train_loss": -6.499660015106201, "global_step": 111539, "epoch": 2655} {"train_loss": -6.506629943847656, "global_step": 111540, "epoch": 2655} {"train_loss": -6.359462261199951, "global_step": 111541, "epoch": 2655} {"train_loss": -6.390532970428467, "global_step": 111542, "epoch": 2655} {"train_loss": -6.515622138977051, "global_step": 111543, "epoch": 2655} {"train_loss": -6.429693698883057, "global_step": 111544, "epoch": 2655} {"train_loss": -6.596582889556885, "global_step": 111545, "epoch": 2655} {"train_loss": -6.393691062927246, "global_step": 111546, "epoch": 2655} {"train_loss": -6.389181613922119, "global_step": 111547, "epoch": 2655} {"train_loss": -6.353964805603027, "global_step": 111548, "epoch": 2655} {"train_loss": -6.488465309143066, "global_step": 111549, "epoch": 2655} {"train_loss": -6.431136131286621, "global_step": 111550, "epoch": 2655} {"train_loss": -6.476670390083676, "global_step": 111551, "epoch": 2655, "val_loss": 76192.9609375} {"train_loss": -6.5168046951293945, "global_step": 111552, "epoch": 2656} {"train_loss": -6.4815673828125, "global_step": 111553, "epoch": 2656} {"train_loss": -6.509369850158691, "global_step": 111554, "epoch": 2656} {"train_loss": -6.45300817489624, "global_step": 111555, "epoch": 2656} {"train_loss": -6.418574333190918, "global_step": 111556, "epoch": 2656} {"train_loss": -6.623678207397461, "global_step": 111557, "epoch": 2656} {"train_loss": -6.36890983581543, "global_step": 111558, "epoch": 2656} {"train_loss": -6.476592063903809, "global_step": 111559, "epoch": 2656} {"train_loss": -6.381117820739746, "global_step": 111560, "epoch": 2656} {"train_loss": -6.475392818450928, "global_step": 111561, "epoch": 2656} {"train_loss": -6.465912818908691, "global_step": 111562, "epoch": 2656} {"train_loss": -6.500643730163574, "global_step": 111563, "epoch": 2656} {"train_loss": -6.438249588012695, "global_step": 111564, "epoch": 2656} {"train_loss": -6.463693618774414, "global_step": 111565, "epoch": 2656} {"train_loss": -6.4037580490112305, "global_step": 111566, "epoch": 2656} {"train_loss": -6.523634910583496, "global_step": 111567, "epoch": 2656} {"train_loss": -6.520429611206055, "global_step": 111568, "epoch": 2656} {"train_loss": -6.3939900398254395, "global_step": 111569, "epoch": 2656} {"train_loss": -6.433675765991211, "global_step": 111570, "epoch": 2656} {"train_loss": -6.44380521774292, "global_step": 111571, "epoch": 2656} {"train_loss": -6.441875457763672, "global_step": 111572, "epoch": 2656} {"train_loss": -6.522152900695801, "global_step": 111573, "epoch": 2656} {"train_loss": -6.419519424438477, "global_step": 111574, "epoch": 2656} {"train_loss": -6.541961669921875, "global_step": 111575, "epoch": 2656} {"train_loss": -6.520925521850586, "global_step": 111576, "epoch": 2656} {"train_loss": -6.494661808013916, "global_step": 111577, "epoch": 2656} {"train_loss": -6.564538955688477, "global_step": 111578, "epoch": 2656} {"train_loss": -6.550371170043945, "global_step": 111579, "epoch": 2656} {"train_loss": -6.433905124664307, "global_step": 111580, "epoch": 2656} {"train_loss": -6.3890910148620605, "global_step": 111581, "epoch": 2656} {"train_loss": -6.48513650894165, "global_step": 111582, "epoch": 2656} {"train_loss": -6.518640518188477, "global_step": 111583, "epoch": 2656} {"train_loss": -6.398619174957275, "global_step": 111584, "epoch": 2656} {"train_loss": -6.496634483337402, "global_step": 111585, "epoch": 2656} {"train_loss": -6.471625328063965, "global_step": 111586, "epoch": 2656} {"train_loss": -6.425148963928223, "global_step": 111587, "epoch": 2656} {"train_loss": -6.492841720581055, "global_step": 111588, "epoch": 2656} {"train_loss": -6.507632732391357, "global_step": 111589, "epoch": 2656} {"train_loss": -6.409602642059326, "global_step": 111590, "epoch": 2656} {"train_loss": -6.415342330932617, "global_step": 111591, "epoch": 2656} {"train_loss": -6.38642692565918, "global_step": 111592, "epoch": 2656} {"train_loss": -6.468798626036871, "global_step": 111593, "epoch": 2656, "val_loss": 76760.6015625} {"train_loss": -6.457175254821777, "global_step": 111594, "epoch": 2657} {"train_loss": -6.484396934509277, "global_step": 111595, "epoch": 2657} {"train_loss": -6.5407633781433105, "global_step": 111596, "epoch": 2657} {"train_loss": -6.508269309997559, "global_step": 111597, "epoch": 2657} {"train_loss": -6.480307579040527, "global_step": 111598, "epoch": 2657} {"train_loss": -6.515369415283203, "global_step": 111599, "epoch": 2657} {"train_loss": -6.553096771240234, "global_step": 111600, "epoch": 2657} {"train_loss": -6.505177974700928, "global_step": 111601, "epoch": 2657} {"train_loss": -6.500388145446777, "global_step": 111602, "epoch": 2657} {"train_loss": -6.47947883605957, "global_step": 111603, "epoch": 2657} {"train_loss": -6.426982879638672, "global_step": 111604, "epoch": 2657} {"train_loss": -6.359871864318848, "global_step": 111605, "epoch": 2657} {"train_loss": -6.569518089294434, "global_step": 111606, "epoch": 2657} {"train_loss": -6.450591087341309, "global_step": 111607, "epoch": 2657} {"train_loss": -6.343199729919434, "global_step": 111608, "epoch": 2657} {"train_loss": -6.503532886505127, "global_step": 111609, "epoch": 2657} {"train_loss": -6.460272789001465, "global_step": 111610, "epoch": 2657} {"train_loss": -6.374214172363281, "global_step": 111611, "epoch": 2657} {"train_loss": -6.445285320281982, "global_step": 111612, "epoch": 2657} {"train_loss": -6.531975746154785, "global_step": 111613, "epoch": 2657} {"train_loss": -6.383050441741943, "global_step": 111614, "epoch": 2657} {"train_loss": -6.403132438659668, "global_step": 111615, "epoch": 2657} {"train_loss": -6.499063491821289, "global_step": 111616, "epoch": 2657} {"train_loss": -6.497615337371826, "global_step": 111617, "epoch": 2657} {"train_loss": -6.499302864074707, "global_step": 111618, "epoch": 2657} {"train_loss": -6.535646438598633, "global_step": 111619, "epoch": 2657} {"train_loss": -6.467899799346924, "global_step": 111620, "epoch": 2657} {"train_loss": -6.3442888259887695, "global_step": 111621, "epoch": 2657} {"train_loss": -6.442617416381836, "global_step": 111622, "epoch": 2657} {"train_loss": -6.485194206237793, "global_step": 111623, "epoch": 2657} {"train_loss": -6.472014427185059, "global_step": 111624, "epoch": 2657} {"train_loss": -6.43580961227417, "global_step": 111625, "epoch": 2657} {"train_loss": -6.4364423751831055, "global_step": 111626, "epoch": 2657} {"train_loss": -6.521183490753174, "global_step": 111627, "epoch": 2657} {"train_loss": -6.504448413848877, "global_step": 111628, "epoch": 2657} {"train_loss": -6.521414756774902, "global_step": 111629, "epoch": 2657} {"train_loss": -6.435567378997803, "global_step": 111630, "epoch": 2657} {"train_loss": -6.4665422439575195, "global_step": 111631, "epoch": 2657} {"train_loss": -6.476861476898193, "global_step": 111632, "epoch": 2657} {"train_loss": -6.589481353759766, "global_step": 111633, "epoch": 2657} {"train_loss": -6.519900321960449, "global_step": 111634, "epoch": 2657} {"train_loss": -6.476273706981114, "global_step": 111635, "epoch": 2657, "val_loss": 76169.1796875} {"train_loss": -6.493288516998291, "global_step": 111636, "epoch": 2658} {"train_loss": -6.509365558624268, "global_step": 111637, "epoch": 2658} {"train_loss": -6.4716997146606445, "global_step": 111638, "epoch": 2658} {"train_loss": -6.517078399658203, "global_step": 111639, "epoch": 2658} {"train_loss": -6.484394073486328, "global_step": 111640, "epoch": 2658} {"train_loss": -6.438145637512207, "global_step": 111641, "epoch": 2658} {"train_loss": -6.480058670043945, "global_step": 111642, "epoch": 2658} {"train_loss": -6.508762359619141, "global_step": 111643, "epoch": 2658} {"train_loss": -6.546232223510742, "global_step": 111644, "epoch": 2658} {"train_loss": -6.548247337341309, "global_step": 111645, "epoch": 2658} {"train_loss": -6.431222915649414, "global_step": 111646, "epoch": 2658} {"train_loss": -6.5817108154296875, "global_step": 111647, "epoch": 2658} {"train_loss": -6.57666540145874, "global_step": 111648, "epoch": 2658} {"train_loss": -6.544795513153076, "global_step": 111649, "epoch": 2658} {"train_loss": -6.513294696807861, "global_step": 111650, "epoch": 2658} {"train_loss": -6.416315078735352, "global_step": 111651, "epoch": 2658} {"train_loss": -6.388885498046875, "global_step": 111652, "epoch": 2658} {"train_loss": -6.478869438171387, "global_step": 111653, "epoch": 2658} {"train_loss": -6.354252815246582, "global_step": 111654, "epoch": 2658} {"train_loss": -6.372173309326172, "global_step": 111655, "epoch": 2658} {"train_loss": -6.356306076049805, "global_step": 111656, "epoch": 2658} {"train_loss": -6.337405681610107, "global_step": 111657, "epoch": 2658} {"train_loss": -6.269378662109375, "global_step": 111658, "epoch": 2658} {"train_loss": -6.340521335601807, "global_step": 111659, "epoch": 2658} {"train_loss": -6.3358378410339355, "global_step": 111660, "epoch": 2658} {"train_loss": -6.382081031799316, "global_step": 111661, "epoch": 2658} {"train_loss": -6.260271072387695, "global_step": 111662, "epoch": 2658} {"train_loss": -6.394355773925781, "global_step": 111663, "epoch": 2658} {"train_loss": -6.358480453491211, "global_step": 111664, "epoch": 2658} {"train_loss": -6.2812418937683105, "global_step": 111665, "epoch": 2658} {"train_loss": -6.32745885848999, "global_step": 111666, "epoch": 2658} {"train_loss": -6.353940963745117, "global_step": 111667, "epoch": 2658} {"train_loss": -6.215724468231201, "global_step": 111668, "epoch": 2658} {"train_loss": -6.381829261779785, "global_step": 111669, "epoch": 2658} {"train_loss": -6.360177516937256, "global_step": 111670, "epoch": 2658} {"train_loss": -6.469735145568848, "global_step": 111671, "epoch": 2658} {"train_loss": -6.3492431640625, "global_step": 111672, "epoch": 2658} {"train_loss": -6.464705944061279, "global_step": 111673, "epoch": 2658} {"train_loss": -6.375600814819336, "global_step": 111674, "epoch": 2658} {"train_loss": -6.411735534667969, "global_step": 111675, "epoch": 2658} {"train_loss": -6.440844535827637, "global_step": 111676, "epoch": 2658} {"train_loss": -6.4216811543419245, "global_step": 111677, "epoch": 2658, "val_loss": 76360.0390625} {"train_loss": -6.35494327545166, "global_step": 111678, "epoch": 2659} {"train_loss": -6.507944583892822, "global_step": 111679, "epoch": 2659} {"train_loss": -6.39716911315918, "global_step": 111680, "epoch": 2659} {"train_loss": -6.557370185852051, "global_step": 111681, "epoch": 2659} {"train_loss": -6.501880645751953, "global_step": 111682, "epoch": 2659} {"train_loss": -6.475683212280273, "global_step": 111683, "epoch": 2659} {"train_loss": -6.515620231628418, "global_step": 111684, "epoch": 2659} {"train_loss": -6.466625213623047, "global_step": 111685, "epoch": 2659} {"train_loss": -6.504131317138672, "global_step": 111686, "epoch": 2659} {"train_loss": -6.4698100090026855, "global_step": 111687, "epoch": 2659} {"train_loss": -6.572471618652344, "global_step": 111688, "epoch": 2659} {"train_loss": -6.589601516723633, "global_step": 111689, "epoch": 2659} {"train_loss": -6.521425247192383, "global_step": 111690, "epoch": 2659} {"train_loss": -6.52496337890625, "global_step": 111691, "epoch": 2659} {"train_loss": -6.427818298339844, "global_step": 111692, "epoch": 2659} {"train_loss": -6.545464038848877, "global_step": 111693, "epoch": 2659} {"train_loss": -6.54821252822876, "global_step": 111694, "epoch": 2659} {"train_loss": -6.462521553039551, "global_step": 111695, "epoch": 2659} {"train_loss": -6.632791996002197, "global_step": 111696, "epoch": 2659} {"train_loss": -6.527621269226074, "global_step": 111697, "epoch": 2659} {"train_loss": -6.430807113647461, "global_step": 111698, "epoch": 2659} {"train_loss": -6.430099964141846, "global_step": 111699, "epoch": 2659} {"train_loss": -6.376914024353027, "global_step": 111700, "epoch": 2659} {"train_loss": -6.537763595581055, "global_step": 111701, "epoch": 2659} {"train_loss": -6.491328239440918, "global_step": 111702, "epoch": 2659} {"train_loss": -6.451747417449951, "global_step": 111703, "epoch": 2659} {"train_loss": -6.498536109924316, "global_step": 111704, "epoch": 2659} {"train_loss": -6.556827545166016, "global_step": 111705, "epoch": 2659} {"train_loss": -6.448409080505371, "global_step": 111706, "epoch": 2659} {"train_loss": -6.491004467010498, "global_step": 111707, "epoch": 2659} {"train_loss": -6.432223320007324, "global_step": 111708, "epoch": 2659} {"train_loss": -6.422361373901367, "global_step": 111709, "epoch": 2659} {"train_loss": -6.41934871673584, "global_step": 111710, "epoch": 2659} {"train_loss": -6.403171062469482, "global_step": 111711, "epoch": 2659} {"train_loss": -6.506482124328613, "global_step": 111712, "epoch": 2659} {"train_loss": -6.4697265625, "global_step": 111713, "epoch": 2659} {"train_loss": -6.446392059326172, "global_step": 111714, "epoch": 2659} {"train_loss": -6.498281478881836, "global_step": 111715, "epoch": 2659} {"train_loss": -6.4219770431518555, "global_step": 111716, "epoch": 2659} {"train_loss": -6.555992126464844, "global_step": 111717, "epoch": 2659} {"train_loss": -6.382687568664551, "global_step": 111718, "epoch": 2659} {"train_loss": -6.480537301018124, "global_step": 111719, "epoch": 2659, "val_loss": 76080.0859375} {"train_loss": -6.488014221191406, "global_step": 111720, "epoch": 2660} {"train_loss": -6.462334632873535, "global_step": 111721, "epoch": 2660} {"train_loss": -6.418635368347168, "global_step": 111722, "epoch": 2660} {"train_loss": -6.367241382598877, "global_step": 111723, "epoch": 2660} {"train_loss": -6.492725372314453, "global_step": 111724, "epoch": 2660} {"train_loss": -6.402552127838135, "global_step": 111725, "epoch": 2660} {"train_loss": -6.432279109954834, "global_step": 111726, "epoch": 2660} {"train_loss": -6.368288040161133, "global_step": 111727, "epoch": 2660} {"train_loss": -6.491236686706543, "global_step": 111728, "epoch": 2660} {"train_loss": -6.494759559631348, "global_step": 111729, "epoch": 2660} {"train_loss": -6.479282379150391, "global_step": 111730, "epoch": 2660} {"train_loss": -6.483748435974121, "global_step": 111731, "epoch": 2660} {"train_loss": -6.428648471832275, "global_step": 111732, "epoch": 2660} {"train_loss": -6.464044570922852, "global_step": 111733, "epoch": 2660} {"train_loss": -6.457961559295654, "global_step": 111734, "epoch": 2660} {"train_loss": -6.547389984130859, "global_step": 111735, "epoch": 2660} {"train_loss": -6.449244499206543, "global_step": 111736, "epoch": 2660} {"train_loss": -6.517406463623047, "global_step": 111737, "epoch": 2660} {"train_loss": -6.478917121887207, "global_step": 111738, "epoch": 2660} {"train_loss": -6.4370036125183105, "global_step": 111739, "epoch": 2660} {"train_loss": -6.435042381286621, "global_step": 111740, "epoch": 2660} {"train_loss": -6.393138408660889, "global_step": 111741, "epoch": 2660} {"train_loss": -6.383967399597168, "global_step": 111742, "epoch": 2660} {"train_loss": -6.618518352508545, "global_step": 111743, "epoch": 2660} {"train_loss": -6.554199695587158, "global_step": 111744, "epoch": 2660} {"train_loss": -6.6103515625, "global_step": 111745, "epoch": 2660} {"train_loss": -6.360847473144531, "global_step": 111746, "epoch": 2660} {"train_loss": -6.41726541519165, "global_step": 111747, "epoch": 2660} {"train_loss": -6.294838905334473, "global_step": 111748, "epoch": 2660} {"train_loss": -6.490382194519043, "global_step": 111749, "epoch": 2660} {"train_loss": -6.3644819259643555, "global_step": 111750, "epoch": 2660} {"train_loss": -6.443921089172363, "global_step": 111751, "epoch": 2660} {"train_loss": -6.236781120300293, "global_step": 111752, "epoch": 2660} {"train_loss": -6.322619438171387, "global_step": 111753, "epoch": 2660} {"train_loss": -6.326998710632324, "global_step": 111754, "epoch": 2660} {"train_loss": -6.403608322143555, "global_step": 111755, "epoch": 2660} {"train_loss": -6.586287975311279, "global_step": 111756, "epoch": 2660} {"train_loss": -6.472618103027344, "global_step": 111757, "epoch": 2660} {"train_loss": -6.448582649230957, "global_step": 111758, "epoch": 2660} {"train_loss": -6.385112285614014, "global_step": 111759, "epoch": 2660} {"train_loss": -6.438839912414551, "global_step": 111760, "epoch": 2660} {"train_loss": -6.441657974606469, "global_step": 111761, "epoch": 2660, "val_loss": 76101.75} {"train_loss": -6.418424606323242, "global_step": 111762, "epoch": 2661} {"train_loss": -6.583553314208984, "global_step": 111763, "epoch": 2661} {"train_loss": -6.439328193664551, "global_step": 111764, "epoch": 2661} {"train_loss": -6.479888916015625, "global_step": 111765, "epoch": 2661} {"train_loss": -6.5270586013793945, "global_step": 111766, "epoch": 2661} {"train_loss": -6.533030033111572, "global_step": 111767, "epoch": 2661} {"train_loss": -6.5363450050354, "global_step": 111768, "epoch": 2661} {"train_loss": -6.506389617919922, "global_step": 111769, "epoch": 2661} {"train_loss": -6.5603179931640625, "global_step": 111770, "epoch": 2661} {"train_loss": -6.58148193359375, "global_step": 111771, "epoch": 2661} {"train_loss": -6.365326881408691, "global_step": 111772, "epoch": 2661} {"train_loss": -6.678174018859863, "global_step": 111773, "epoch": 2661} {"train_loss": -6.300252914428711, "global_step": 111774, "epoch": 2661} {"train_loss": -6.444527626037598, "global_step": 111775, "epoch": 2661} {"train_loss": -6.505187034606934, "global_step": 111776, "epoch": 2661} {"train_loss": -6.4085798263549805, "global_step": 111777, "epoch": 2661} {"train_loss": -6.465595722198486, "global_step": 111778, "epoch": 2661} {"train_loss": -6.580156326293945, "global_step": 111779, "epoch": 2661} {"train_loss": -6.500556945800781, "global_step": 111780, "epoch": 2661} {"train_loss": -6.453551292419434, "global_step": 111781, "epoch": 2661} {"train_loss": -6.317997455596924, "global_step": 111782, "epoch": 2661} {"train_loss": -6.530077934265137, "global_step": 111783, "epoch": 2661} {"train_loss": -6.471012592315674, "global_step": 111784, "epoch": 2661} {"train_loss": -6.467130661010742, "global_step": 111785, "epoch": 2661} {"train_loss": -6.499185562133789, "global_step": 111786, "epoch": 2661} {"train_loss": -6.508664131164551, "global_step": 111787, "epoch": 2661} {"train_loss": -6.542549133300781, "global_step": 111788, "epoch": 2661} {"train_loss": -6.455848217010498, "global_step": 111789, "epoch": 2661} {"train_loss": -6.529369354248047, "global_step": 111790, "epoch": 2661} {"train_loss": -6.44449520111084, "global_step": 111791, "epoch": 2661} {"train_loss": -6.500054836273193, "global_step": 111792, "epoch": 2661} {"train_loss": -6.486292362213135, "global_step": 111793, "epoch": 2661} {"train_loss": -6.362025260925293, "global_step": 111794, "epoch": 2661} {"train_loss": -6.483281135559082, "global_step": 111795, "epoch": 2661} {"train_loss": -6.431166172027588, "global_step": 111796, "epoch": 2661} {"train_loss": -6.494616985321045, "global_step": 111797, "epoch": 2661} {"train_loss": -6.522758483886719, "global_step": 111798, "epoch": 2661} {"train_loss": -6.3914289474487305, "global_step": 111799, "epoch": 2661} {"train_loss": -6.581696510314941, "global_step": 111800, "epoch": 2661} {"train_loss": -6.478341102600098, "global_step": 111801, "epoch": 2661} {"train_loss": -6.433192253112793, "global_step": 111802, "epoch": 2661} {"train_loss": -6.483026788348243, "global_step": 111803, "epoch": 2661, "val_loss": 76368.46875} {"train_loss": -6.51851749420166, "global_step": 111804, "epoch": 2662} {"train_loss": -6.620316028594971, "global_step": 111805, "epoch": 2662} {"train_loss": -6.633531093597412, "global_step": 111806, "epoch": 2662} {"train_loss": -6.582467555999756, "global_step": 111807, "epoch": 2662} {"train_loss": -6.502872943878174, "global_step": 111808, "epoch": 2662} {"train_loss": -6.5120086669921875, "global_step": 111809, "epoch": 2662} {"train_loss": -6.368467330932617, "global_step": 111810, "epoch": 2662} {"train_loss": -6.560946464538574, "global_step": 111811, "epoch": 2662} {"train_loss": -6.453178405761719, "global_step": 111812, "epoch": 2662} {"train_loss": -6.4947190284729, "global_step": 111813, "epoch": 2662} {"train_loss": -6.452212333679199, "global_step": 111814, "epoch": 2662} {"train_loss": -6.571708679199219, "global_step": 111815, "epoch": 2662} {"train_loss": -6.607085704803467, "global_step": 111816, "epoch": 2662} {"train_loss": -6.588555335998535, "global_step": 111817, "epoch": 2662} {"train_loss": -6.6045050621032715, "global_step": 111818, "epoch": 2662} {"train_loss": -6.585392951965332, "global_step": 111819, "epoch": 2662} {"train_loss": -6.519622802734375, "global_step": 111820, "epoch": 2662} {"train_loss": -6.601569652557373, "global_step": 111821, "epoch": 2662} {"train_loss": -6.489163398742676, "global_step": 111822, "epoch": 2662} {"train_loss": -6.53411865234375, "global_step": 111823, "epoch": 2662} {"train_loss": -6.528634071350098, "global_step": 111824, "epoch": 2662} {"train_loss": -6.442683696746826, "global_step": 111825, "epoch": 2662} {"train_loss": -6.421466827392578, "global_step": 111826, "epoch": 2662} {"train_loss": -6.437713623046875, "global_step": 111827, "epoch": 2662} {"train_loss": -6.437310218811035, "global_step": 111828, "epoch": 2662} {"train_loss": -6.575345039367676, "global_step": 111829, "epoch": 2662} {"train_loss": -6.4164910316467285, "global_step": 111830, "epoch": 2662} {"train_loss": -6.4975738525390625, "global_step": 111831, "epoch": 2662} {"train_loss": -6.65799617767334, "global_step": 111832, "epoch": 2662} {"train_loss": -6.4325456619262695, "global_step": 111833, "epoch": 2662} {"train_loss": -6.442802906036377, "global_step": 111834, "epoch": 2662} {"train_loss": -6.476064205169678, "global_step": 111835, "epoch": 2662} {"train_loss": -6.419167518615723, "global_step": 111836, "epoch": 2662} {"train_loss": -6.326877593994141, "global_step": 111837, "epoch": 2662} {"train_loss": -6.53130578994751, "global_step": 111838, "epoch": 2662} {"train_loss": -6.462073802947998, "global_step": 111839, "epoch": 2662} {"train_loss": -6.317655563354492, "global_step": 111840, "epoch": 2662} {"train_loss": -6.5289626121521, "global_step": 111841, "epoch": 2662} {"train_loss": -6.474626064300537, "global_step": 111842, "epoch": 2662} {"train_loss": -6.5228962898254395, "global_step": 111843, "epoch": 2662} {"train_loss": -6.5397233963012695, "global_step": 111844, "epoch": 2662} {"train_loss": -6.504977782567342, "global_step": 111845, "epoch": 2662, "val_loss": 76419.640625} {"train_loss": -6.486584186553955, "global_step": 111846, "epoch": 2663} {"train_loss": -6.414175033569336, "global_step": 111847, "epoch": 2663} {"train_loss": -6.503024101257324, "global_step": 111848, "epoch": 2663} {"train_loss": -6.537710189819336, "global_step": 111849, "epoch": 2663} {"train_loss": -6.439674377441406, "global_step": 111850, "epoch": 2663} {"train_loss": -6.461033344268799, "global_step": 111851, "epoch": 2663} {"train_loss": -6.5543599128723145, "global_step": 111852, "epoch": 2663} {"train_loss": -6.421147346496582, "global_step": 111853, "epoch": 2663} {"train_loss": -6.459143161773682, "global_step": 111854, "epoch": 2663} {"train_loss": -6.423338413238525, "global_step": 111855, "epoch": 2663} {"train_loss": -6.369142532348633, "global_step": 111856, "epoch": 2663} {"train_loss": -6.404903411865234, "global_step": 111857, "epoch": 2663} {"train_loss": -6.3539886474609375, "global_step": 111858, "epoch": 2663} {"train_loss": -6.341495513916016, "global_step": 111859, "epoch": 2663} {"train_loss": -6.35867166519165, "global_step": 111860, "epoch": 2663} {"train_loss": -6.427638053894043, "global_step": 111861, "epoch": 2663} {"train_loss": -6.32296085357666, "global_step": 111862, "epoch": 2663} {"train_loss": -6.513824462890625, "global_step": 111863, "epoch": 2663} {"train_loss": -6.393148899078369, "global_step": 111864, "epoch": 2663} {"train_loss": -6.35268497467041, "global_step": 111865, "epoch": 2663} {"train_loss": -6.461340427398682, "global_step": 111866, "epoch": 2663} {"train_loss": -6.487696647644043, "global_step": 111867, "epoch": 2663} {"train_loss": -6.5383148193359375, "global_step": 111868, "epoch": 2663} {"train_loss": -6.471614837646484, "global_step": 111869, "epoch": 2663} {"train_loss": -6.363149642944336, "global_step": 111870, "epoch": 2663} {"train_loss": -6.501720428466797, "global_step": 111871, "epoch": 2663} {"train_loss": -6.579768180847168, "global_step": 111872, "epoch": 2663} {"train_loss": -6.544968605041504, "global_step": 111873, "epoch": 2663} {"train_loss": -6.4244232177734375, "global_step": 111874, "epoch": 2663} {"train_loss": -6.4636030197143555, "global_step": 111875, "epoch": 2663} {"train_loss": -6.408543109893799, "global_step": 111876, "epoch": 2663} {"train_loss": -6.512106895446777, "global_step": 111877, "epoch": 2663} {"train_loss": -6.543354034423828, "global_step": 111878, "epoch": 2663} {"train_loss": -6.425350189208984, "global_step": 111879, "epoch": 2663} {"train_loss": -6.522187232971191, "global_step": 111880, "epoch": 2663} {"train_loss": -6.493194580078125, "global_step": 111881, "epoch": 2663} {"train_loss": -6.462751388549805, "global_step": 111882, "epoch": 2663} {"train_loss": -6.575864791870117, "global_step": 111883, "epoch": 2663} {"train_loss": -6.522025108337402, "global_step": 111884, "epoch": 2663} {"train_loss": -6.455151557922363, "global_step": 111885, "epoch": 2663} {"train_loss": -6.514820098876953, "global_step": 111886, "epoch": 2663} {"train_loss": -6.45947265625, "global_step": 111887, "epoch": 2663, "val_loss": 76477.6875} {"train_loss": -6.472531318664551, "global_step": 111888, "epoch": 2664} {"train_loss": -6.466747760772705, "global_step": 111889, "epoch": 2664} {"train_loss": -6.593929290771484, "global_step": 111890, "epoch": 2664} {"train_loss": -6.532407760620117, "global_step": 111891, "epoch": 2664} {"train_loss": -6.377725124359131, "global_step": 111892, "epoch": 2664} {"train_loss": -6.488388538360596, "global_step": 111893, "epoch": 2664} {"train_loss": -6.44696044921875, "global_step": 111894, "epoch": 2664} {"train_loss": -6.626309871673584, "global_step": 111895, "epoch": 2664} {"train_loss": -6.502509117126465, "global_step": 111896, "epoch": 2664} {"train_loss": -6.584936618804932, "global_step": 111897, "epoch": 2664} {"train_loss": -6.470726013183594, "global_step": 111898, "epoch": 2664} {"train_loss": -6.482316493988037, "global_step": 111899, "epoch": 2664} {"train_loss": -6.654444694519043, "global_step": 111900, "epoch": 2664} {"train_loss": -6.580933094024658, "global_step": 111901, "epoch": 2664} {"train_loss": -6.359959125518799, "global_step": 111902, "epoch": 2664} {"train_loss": -6.523010730743408, "global_step": 111903, "epoch": 2664} {"train_loss": -6.413228511810303, "global_step": 111904, "epoch": 2664} {"train_loss": -6.423043727874756, "global_step": 111905, "epoch": 2664} {"train_loss": -6.452927589416504, "global_step": 111906, "epoch": 2664} {"train_loss": -6.60738468170166, "global_step": 111907, "epoch": 2664} {"train_loss": -6.504471778869629, "global_step": 111908, "epoch": 2664} {"train_loss": -6.4175310134887695, "global_step": 111909, "epoch": 2664} {"train_loss": -6.44028377532959, "global_step": 111910, "epoch": 2664} {"train_loss": -6.476963043212891, "global_step": 111911, "epoch": 2664} {"train_loss": -6.454612731933594, "global_step": 111912, "epoch": 2664} {"train_loss": -6.453566551208496, "global_step": 111913, "epoch": 2664} {"train_loss": -6.45910120010376, "global_step": 111914, "epoch": 2664} {"train_loss": -6.433848857879639, "global_step": 111915, "epoch": 2664} {"train_loss": -6.4843244552612305, "global_step": 111916, "epoch": 2664} {"train_loss": -6.426382064819336, "global_step": 111917, "epoch": 2664} {"train_loss": -6.489800930023193, "global_step": 111918, "epoch": 2664} {"train_loss": -6.394251823425293, "global_step": 111919, "epoch": 2664} {"train_loss": -6.458202362060547, "global_step": 111920, "epoch": 2664} {"train_loss": -6.2534990310668945, "global_step": 111921, "epoch": 2664} {"train_loss": -6.4220991134643555, "global_step": 111922, "epoch": 2664} {"train_loss": -6.572329521179199, "global_step": 111923, "epoch": 2664} {"train_loss": -6.613007545471191, "global_step": 111924, "epoch": 2664} {"train_loss": -6.499579429626465, "global_step": 111925, "epoch": 2664} {"train_loss": -6.439919471740723, "global_step": 111926, "epoch": 2664} {"train_loss": -6.5276288986206055, "global_step": 111927, "epoch": 2664} {"train_loss": -6.550506591796875, "global_step": 111928, "epoch": 2664} {"train_loss": -6.483466670626686, "global_step": 111929, "epoch": 2664, "val_loss": 76392.71875} {"train_loss": -6.5077104568481445, "global_step": 111930, "epoch": 2665} {"train_loss": -6.480659008026123, "global_step": 111931, "epoch": 2665} {"train_loss": -6.5895233154296875, "global_step": 111932, "epoch": 2665} {"train_loss": -6.481869220733643, "global_step": 111933, "epoch": 2665} {"train_loss": -6.513654708862305, "global_step": 111934, "epoch": 2665} {"train_loss": -6.5044708251953125, "global_step": 111935, "epoch": 2665} {"train_loss": -6.502719402313232, "global_step": 111936, "epoch": 2665} {"train_loss": -6.544388771057129, "global_step": 111937, "epoch": 2665} {"train_loss": -6.4491424560546875, "global_step": 111938, "epoch": 2665} {"train_loss": -6.509415626525879, "global_step": 111939, "epoch": 2665} {"train_loss": -6.497547626495361, "global_step": 111940, "epoch": 2665} {"train_loss": -6.507114410400391, "global_step": 111941, "epoch": 2665} {"train_loss": -6.532751560211182, "global_step": 111942, "epoch": 2665} {"train_loss": -6.642029285430908, "global_step": 111943, "epoch": 2665} {"train_loss": -6.571114540100098, "global_step": 111944, "epoch": 2665} {"train_loss": -6.430580139160156, "global_step": 111945, "epoch": 2665} {"train_loss": -6.565869331359863, "global_step": 111946, "epoch": 2665} {"train_loss": -6.444421291351318, "global_step": 111947, "epoch": 2665} {"train_loss": -6.462180137634277, "global_step": 111948, "epoch": 2665} {"train_loss": -6.438536643981934, "global_step": 111949, "epoch": 2665} {"train_loss": -6.424767017364502, "global_step": 111950, "epoch": 2665} {"train_loss": -6.467144012451172, "global_step": 111951, "epoch": 2665} {"train_loss": -6.420353412628174, "global_step": 111952, "epoch": 2665} {"train_loss": -6.469791412353516, "global_step": 111953, "epoch": 2665} {"train_loss": -6.415186882019043, "global_step": 111954, "epoch": 2665} {"train_loss": -6.4337615966796875, "global_step": 111955, "epoch": 2665} {"train_loss": -6.505407810211182, "global_step": 111956, "epoch": 2665} {"train_loss": -6.516190528869629, "global_step": 111957, "epoch": 2665} {"train_loss": -6.4309563636779785, "global_step": 111958, "epoch": 2665} {"train_loss": -6.372776031494141, "global_step": 111959, "epoch": 2665} {"train_loss": -6.405348777770996, "global_step": 111960, "epoch": 2665} {"train_loss": -6.434835910797119, "global_step": 111961, "epoch": 2665} {"train_loss": -6.44547700881958, "global_step": 111962, "epoch": 2665} {"train_loss": -6.547605514526367, "global_step": 111963, "epoch": 2665} {"train_loss": -6.48403263092041, "global_step": 111964, "epoch": 2665} {"train_loss": -6.335607528686523, "global_step": 111965, "epoch": 2665} {"train_loss": -6.503708839416504, "global_step": 111966, "epoch": 2665} {"train_loss": -6.473273277282715, "global_step": 111967, "epoch": 2665} {"train_loss": -6.337371826171875, "global_step": 111968, "epoch": 2665} {"train_loss": -6.416980743408203, "global_step": 111969, "epoch": 2665} {"train_loss": -6.344593048095703, "global_step": 111970, "epoch": 2665} {"train_loss": -6.4731108120509555, "global_step": 111971, "epoch": 2665, "val_loss": 76563.15625} {"train_loss": -6.307862281799316, "global_step": 111972, "epoch": 2666} {"train_loss": -6.5736494064331055, "global_step": 111973, "epoch": 2666} {"train_loss": -6.589545249938965, "global_step": 111974, "epoch": 2666} {"train_loss": -6.457577705383301, "global_step": 111975, "epoch": 2666} {"train_loss": -6.600094795227051, "global_step": 111976, "epoch": 2666} {"train_loss": -6.465383529663086, "global_step": 111977, "epoch": 2666} {"train_loss": -6.521516799926758, "global_step": 111978, "epoch": 2666} {"train_loss": -6.596894264221191, "global_step": 111979, "epoch": 2666} {"train_loss": -6.529201984405518, "global_step": 111980, "epoch": 2666} {"train_loss": -6.448121547698975, "global_step": 111981, "epoch": 2666} {"train_loss": -6.507045745849609, "global_step": 111982, "epoch": 2666} {"train_loss": -6.5542473793029785, "global_step": 111983, "epoch": 2666} {"train_loss": -6.459506034851074, "global_step": 111984, "epoch": 2666} {"train_loss": -6.5149030685424805, "global_step": 111985, "epoch": 2666} {"train_loss": -6.5483293533325195, "global_step": 111986, "epoch": 2666} {"train_loss": -6.4281086921691895, "global_step": 111987, "epoch": 2666} {"train_loss": -6.503226280212402, "global_step": 111988, "epoch": 2666} {"train_loss": -6.551149368286133, "global_step": 111989, "epoch": 2666} {"train_loss": -6.461127758026123, "global_step": 111990, "epoch": 2666} {"train_loss": -6.60340690612793, "global_step": 111991, "epoch": 2666} {"train_loss": -6.602132797241211, "global_step": 111992, "epoch": 2666} {"train_loss": -6.517441749572754, "global_step": 111993, "epoch": 2666} {"train_loss": -6.446826934814453, "global_step": 111994, "epoch": 2666} {"train_loss": -6.63387393951416, "global_step": 111995, "epoch": 2666} {"train_loss": -6.393364906311035, "global_step": 111996, "epoch": 2666} {"train_loss": -6.539068222045898, "global_step": 111997, "epoch": 2666} {"train_loss": -6.583855628967285, "global_step": 111998, "epoch": 2666} {"train_loss": -6.462693691253662, "global_step": 111999, "epoch": 2666} {"train_loss": -6.48606014251709, "global_step": 112000, "epoch": 2666} {"train_loss": -6.60321044921875, "global_step": 112001, "epoch": 2666} {"train_loss": -6.5953474044799805, "global_step": 112002, "epoch": 2666} {"train_loss": -6.46763801574707, "global_step": 112003, "epoch": 2666} {"train_loss": -6.374245643615723, "global_step": 112004, "epoch": 2666} {"train_loss": -6.524682521820068, "global_step": 112005, "epoch": 2666} {"train_loss": -6.498023986816406, "global_step": 112006, "epoch": 2666} {"train_loss": -6.4960527420043945, "global_step": 112007, "epoch": 2666} {"train_loss": -6.511768341064453, "global_step": 112008, "epoch": 2666} {"train_loss": -6.413573265075684, "global_step": 112009, "epoch": 2666} {"train_loss": -6.537166595458984, "global_step": 112010, "epoch": 2666} {"train_loss": -6.376784324645996, "global_step": 112011, "epoch": 2666} {"train_loss": -6.432011127471924, "global_step": 112012, "epoch": 2666} {"train_loss": -6.505323659806025, "global_step": 112013, "epoch": 2666, "val_loss": 76301.65625} {"train_loss": -6.492277145385742, "global_step": 112014, "epoch": 2667} {"train_loss": -6.433876991271973, "global_step": 112015, "epoch": 2667} {"train_loss": -6.443441390991211, "global_step": 112016, "epoch": 2667} {"train_loss": -6.551408290863037, "global_step": 112017, "epoch": 2667} {"train_loss": -6.546115875244141, "global_step": 112018, "epoch": 2667} {"train_loss": -6.591836929321289, "global_step": 112019, "epoch": 2667} {"train_loss": -6.433547019958496, "global_step": 112020, "epoch": 2667} {"train_loss": -6.456343173980713, "global_step": 112021, "epoch": 2667} {"train_loss": -6.435376167297363, "global_step": 112022, "epoch": 2667} {"train_loss": -6.4556193351745605, "global_step": 112023, "epoch": 2667} {"train_loss": -6.378973960876465, "global_step": 112024, "epoch": 2667} {"train_loss": -6.52182149887085, "global_step": 112025, "epoch": 2667} {"train_loss": -6.17510986328125, "global_step": 112026, "epoch": 2667} {"train_loss": -6.5320587158203125, "global_step": 112027, "epoch": 2667} {"train_loss": -6.45155143737793, "global_step": 112028, "epoch": 2667} {"train_loss": -6.459323883056641, "global_step": 112029, "epoch": 2667} {"train_loss": -6.527273178100586, "global_step": 112030, "epoch": 2667} {"train_loss": -6.421477794647217, "global_step": 112031, "epoch": 2667} {"train_loss": -6.3878326416015625, "global_step": 112032, "epoch": 2667} {"train_loss": -6.557999134063721, "global_step": 112033, "epoch": 2667} {"train_loss": -6.286782264709473, "global_step": 112034, "epoch": 2667} {"train_loss": -6.438838958740234, "global_step": 112035, "epoch": 2667} {"train_loss": -6.343255996704102, "global_step": 112036, "epoch": 2667} {"train_loss": -6.4666056632995605, "global_step": 112037, "epoch": 2667} {"train_loss": -6.44843864440918, "global_step": 112038, "epoch": 2667} {"train_loss": -6.425478458404541, "global_step": 112039, "epoch": 2667} {"train_loss": -6.406598091125488, "global_step": 112040, "epoch": 2667} {"train_loss": -6.402507781982422, "global_step": 112041, "epoch": 2667} {"train_loss": -6.4654107093811035, "global_step": 112042, "epoch": 2667} {"train_loss": -6.350138187408447, "global_step": 112043, "epoch": 2667} {"train_loss": -6.4366559982299805, "global_step": 112044, "epoch": 2667} {"train_loss": -6.455780506134033, "global_step": 112045, "epoch": 2667} {"train_loss": -6.477027893066406, "global_step": 112046, "epoch": 2667} {"train_loss": -6.4517059326171875, "global_step": 112047, "epoch": 2667} {"train_loss": -6.477752685546875, "global_step": 112048, "epoch": 2667} {"train_loss": -6.344688415527344, "global_step": 112049, "epoch": 2667} {"train_loss": -6.576772689819336, "global_step": 112050, "epoch": 2667} {"train_loss": -6.478606224060059, "global_step": 112051, "epoch": 2667} {"train_loss": -6.382846832275391, "global_step": 112052, "epoch": 2667} {"train_loss": -6.527492523193359, "global_step": 112053, "epoch": 2667} {"train_loss": -6.529664993286133, "global_step": 112054, "epoch": 2667} {"train_loss": -6.449860402515957, "global_step": 112055, "epoch": 2667, "val_loss": 76129.1640625} {"train_loss": -6.5836334228515625, "global_step": 112056, "epoch": 2668} {"train_loss": -6.545162200927734, "global_step": 112057, "epoch": 2668} {"train_loss": -6.5000386238098145, "global_step": 112058, "epoch": 2668} {"train_loss": -6.549618721008301, "global_step": 112059, "epoch": 2668} {"train_loss": -6.429237365722656, "global_step": 112060, "epoch": 2668} {"train_loss": -6.456128120422363, "global_step": 112061, "epoch": 2668} {"train_loss": -6.471219062805176, "global_step": 112062, "epoch": 2668} {"train_loss": -6.496246814727783, "global_step": 112063, "epoch": 2668} {"train_loss": -6.561070919036865, "global_step": 112064, "epoch": 2668} {"train_loss": -6.522672653198242, "global_step": 112065, "epoch": 2668} {"train_loss": -6.5464582443237305, "global_step": 112066, "epoch": 2668} {"train_loss": -6.420148849487305, "global_step": 112067, "epoch": 2668} {"train_loss": -6.562386989593506, "global_step": 112068, "epoch": 2668} {"train_loss": -6.489725112915039, "global_step": 112069, "epoch": 2668} {"train_loss": -6.569296836853027, "global_step": 112070, "epoch": 2668} {"train_loss": -6.544487476348877, "global_step": 112071, "epoch": 2668} {"train_loss": -6.455214977264404, "global_step": 112072, "epoch": 2668} {"train_loss": -6.538508892059326, "global_step": 112073, "epoch": 2668} {"train_loss": -6.557710647583008, "global_step": 112074, "epoch": 2668} {"train_loss": -6.546274185180664, "global_step": 112075, "epoch": 2668} {"train_loss": -6.549322128295898, "global_step": 112076, "epoch": 2668} {"train_loss": -6.586989402770996, "global_step": 112077, "epoch": 2668} {"train_loss": -6.475961685180664, "global_step": 112078, "epoch": 2668} {"train_loss": -6.419573783874512, "global_step": 112079, "epoch": 2668} {"train_loss": -6.571272373199463, "global_step": 112080, "epoch": 2668} {"train_loss": -6.491417407989502, "global_step": 112081, "epoch": 2668} {"train_loss": -6.465215682983398, "global_step": 112082, "epoch": 2668} {"train_loss": -6.53461217880249, "global_step": 112083, "epoch": 2668} {"train_loss": -6.483916759490967, "global_step": 112084, "epoch": 2668} {"train_loss": -6.422059059143066, "global_step": 112085, "epoch": 2668} {"train_loss": -6.3600568771362305, "global_step": 112086, "epoch": 2668} {"train_loss": -6.477973937988281, "global_step": 112087, "epoch": 2668} {"train_loss": -6.493456840515137, "global_step": 112088, "epoch": 2668} {"train_loss": -6.433941841125488, "global_step": 112089, "epoch": 2668} {"train_loss": -6.499289512634277, "global_step": 112090, "epoch": 2668} {"train_loss": -6.466082572937012, "global_step": 112091, "epoch": 2668} {"train_loss": -6.496789932250977, "global_step": 112092, "epoch": 2668} {"train_loss": -6.517770290374756, "global_step": 112093, "epoch": 2668} {"train_loss": -6.468593120574951, "global_step": 112094, "epoch": 2668} {"train_loss": -6.34492301940918, "global_step": 112095, "epoch": 2668} {"train_loss": -6.511194229125977, "global_step": 112096, "epoch": 2668} {"train_loss": -6.497190486817133, "global_step": 112097, "epoch": 2668, "val_loss": 76268.1015625} {"train_loss": -6.651956558227539, "global_step": 112098, "epoch": 2669} {"train_loss": -6.480403423309326, "global_step": 112099, "epoch": 2669} {"train_loss": -6.486886978149414, "global_step": 112100, "epoch": 2669} {"train_loss": -6.555184364318848, "global_step": 112101, "epoch": 2669} {"train_loss": -6.456742286682129, "global_step": 112102, "epoch": 2669} {"train_loss": -6.643562316894531, "global_step": 112103, "epoch": 2669} {"train_loss": -6.480486869812012, "global_step": 112104, "epoch": 2669} {"train_loss": -6.535647392272949, "global_step": 112105, "epoch": 2669} {"train_loss": -6.561265468597412, "global_step": 112106, "epoch": 2669} {"train_loss": -6.530605792999268, "global_step": 112107, "epoch": 2669} {"train_loss": -6.514045715332031, "global_step": 112108, "epoch": 2669} {"train_loss": -6.404046058654785, "global_step": 112109, "epoch": 2669} {"train_loss": -6.695152282714844, "global_step": 112110, "epoch": 2669} {"train_loss": -6.541177272796631, "global_step": 112111, "epoch": 2669} {"train_loss": -6.522675514221191, "global_step": 112112, "epoch": 2669} {"train_loss": -6.493098735809326, "global_step": 112113, "epoch": 2669} {"train_loss": -6.555529594421387, "global_step": 112114, "epoch": 2669} {"train_loss": -6.4904069900512695, "global_step": 112115, "epoch": 2669} {"train_loss": -6.407381534576416, "global_step": 112116, "epoch": 2669} {"train_loss": -6.380419731140137, "global_step": 112117, "epoch": 2669} {"train_loss": -6.625862121582031, "global_step": 112118, "epoch": 2669} {"train_loss": -6.448596000671387, "global_step": 112119, "epoch": 2669} {"train_loss": -6.484921455383301, "global_step": 112120, "epoch": 2669} {"train_loss": -6.609020233154297, "global_step": 112121, "epoch": 2669} {"train_loss": -6.442482948303223, "global_step": 112122, "epoch": 2669} {"train_loss": -6.449823379516602, "global_step": 112123, "epoch": 2669} {"train_loss": -6.428478717803955, "global_step": 112124, "epoch": 2669} {"train_loss": -6.536248683929443, "global_step": 112125, "epoch": 2669} {"train_loss": -6.404719352722168, "global_step": 112126, "epoch": 2669} {"train_loss": -6.495461463928223, "global_step": 112127, "epoch": 2669} {"train_loss": -6.573368072509766, "global_step": 112128, "epoch": 2669} {"train_loss": -6.505744934082031, "global_step": 112129, "epoch": 2669} {"train_loss": -6.405086994171143, "global_step": 112130, "epoch": 2669} {"train_loss": -6.386035919189453, "global_step": 112131, "epoch": 2669} {"train_loss": -6.547642707824707, "global_step": 112132, "epoch": 2669} {"train_loss": -6.545283317565918, "global_step": 112133, "epoch": 2669} {"train_loss": -6.383157730102539, "global_step": 112134, "epoch": 2669} {"train_loss": -6.448184013366699, "global_step": 112135, "epoch": 2669} {"train_loss": -6.480459690093994, "global_step": 112136, "epoch": 2669} {"train_loss": -6.450530529022217, "global_step": 112137, "epoch": 2669} {"train_loss": -6.490656852722168, "global_step": 112138, "epoch": 2669} {"train_loss": -6.503890310014997, "global_step": 112139, "epoch": 2669, "val_loss": 76869.0} {"train_loss": -6.391395568847656, "global_step": 112140, "epoch": 2670} {"train_loss": -6.313070297241211, "global_step": 112141, "epoch": 2670} {"train_loss": -6.462710380554199, "global_step": 112142, "epoch": 2670} {"train_loss": -6.365643501281738, "global_step": 112143, "epoch": 2670} {"train_loss": -6.460336685180664, "global_step": 112144, "epoch": 2670} {"train_loss": -6.427958965301514, "global_step": 112145, "epoch": 2670} {"train_loss": -6.608431816101074, "global_step": 112146, "epoch": 2670} {"train_loss": -6.472663402557373, "global_step": 112147, "epoch": 2670} {"train_loss": -6.410647392272949, "global_step": 112148, "epoch": 2670} {"train_loss": -6.544487953186035, "global_step": 112149, "epoch": 2670} {"train_loss": -6.4000325202941895, "global_step": 112150, "epoch": 2670} {"train_loss": -6.495262145996094, "global_step": 112151, "epoch": 2670} {"train_loss": -6.4875993728637695, "global_step": 112152, "epoch": 2670} {"train_loss": -6.538555145263672, "global_step": 112153, "epoch": 2670} {"train_loss": -6.471262454986572, "global_step": 112154, "epoch": 2670} {"train_loss": -6.502749919891357, "global_step": 112155, "epoch": 2670} {"train_loss": -6.533136367797852, "global_step": 112156, "epoch": 2670} {"train_loss": -6.505603790283203, "global_step": 112157, "epoch": 2670} {"train_loss": -6.423334121704102, "global_step": 112158, "epoch": 2670} {"train_loss": -6.408607482910156, "global_step": 112159, "epoch": 2670} {"train_loss": -6.49555778503418, "global_step": 112160, "epoch": 2670} {"train_loss": -6.4719696044921875, "global_step": 112161, "epoch": 2670} {"train_loss": -6.422122955322266, "global_step": 112162, "epoch": 2670} {"train_loss": -6.476606369018555, "global_step": 112163, "epoch": 2670} {"train_loss": -6.524570465087891, "global_step": 112164, "epoch": 2670} {"train_loss": -6.461971759796143, "global_step": 112165, "epoch": 2670} {"train_loss": -6.430605888366699, "global_step": 112166, "epoch": 2670} {"train_loss": -6.533987998962402, "global_step": 112167, "epoch": 2670} {"train_loss": -6.454814434051514, "global_step": 112168, "epoch": 2670} {"train_loss": -6.473723888397217, "global_step": 112169, "epoch": 2670} {"train_loss": -6.649392127990723, "global_step": 112170, "epoch": 2670} {"train_loss": -6.512947082519531, "global_step": 112171, "epoch": 2670} {"train_loss": -6.444588661193848, "global_step": 112172, "epoch": 2670} {"train_loss": -6.540709495544434, "global_step": 112173, "epoch": 2670} {"train_loss": -6.402571678161621, "global_step": 112174, "epoch": 2670} {"train_loss": -6.41566801071167, "global_step": 112175, "epoch": 2670} {"train_loss": -6.413035869598389, "global_step": 112176, "epoch": 2670} {"train_loss": -6.537468433380127, "global_step": 112177, "epoch": 2670} {"train_loss": -6.599338531494141, "global_step": 112178, "epoch": 2670} {"train_loss": -6.550476551055908, "global_step": 112179, "epoch": 2670} {"train_loss": -6.363864421844482, "global_step": 112180, "epoch": 2670} {"train_loss": -6.473535174415225, "global_step": 112181, "epoch": 2670, "val_loss": 76810.671875} {"train_loss": -6.497982501983643, "global_step": 112182, "epoch": 2671} {"train_loss": -6.456843852996826, "global_step": 112183, "epoch": 2671} {"train_loss": -6.465705871582031, "global_step": 112184, "epoch": 2671} {"train_loss": -6.473727226257324, "global_step": 112185, "epoch": 2671} {"train_loss": -6.4117431640625, "global_step": 112186, "epoch": 2671} {"train_loss": -6.408810615539551, "global_step": 112187, "epoch": 2671} {"train_loss": -6.457211971282959, "global_step": 112188, "epoch": 2671} {"train_loss": -6.322082996368408, "global_step": 112189, "epoch": 2671} {"train_loss": -6.552117347717285, "global_step": 112190, "epoch": 2671} {"train_loss": -6.4180450439453125, "global_step": 112191, "epoch": 2671} {"train_loss": -6.481539726257324, "global_step": 112192, "epoch": 2671} {"train_loss": -6.3651227951049805, "global_step": 112193, "epoch": 2671} {"train_loss": -6.435855865478516, "global_step": 112194, "epoch": 2671} {"train_loss": -6.463657379150391, "global_step": 112195, "epoch": 2671} {"train_loss": -6.516841411590576, "global_step": 112196, "epoch": 2671} {"train_loss": -6.469498634338379, "global_step": 112197, "epoch": 2671} {"train_loss": -6.5707807540893555, "global_step": 112198, "epoch": 2671} {"train_loss": -6.570053577423096, "global_step": 112199, "epoch": 2671} {"train_loss": -6.5591912269592285, "global_step": 112200, "epoch": 2671} {"train_loss": -6.51607608795166, "global_step": 112201, "epoch": 2671} {"train_loss": -6.501336574554443, "global_step": 112202, "epoch": 2671} {"train_loss": -6.506304740905762, "global_step": 112203, "epoch": 2671} {"train_loss": -6.524221420288086, "global_step": 112204, "epoch": 2671} {"train_loss": -6.52793025970459, "global_step": 112205, "epoch": 2671} {"train_loss": -6.508804798126221, "global_step": 112206, "epoch": 2671} {"train_loss": -6.526620864868164, "global_step": 112207, "epoch": 2671} {"train_loss": -6.49029541015625, "global_step": 112208, "epoch": 2671} {"train_loss": -6.42242431640625, "global_step": 112209, "epoch": 2671} {"train_loss": -6.502366065979004, "global_step": 112210, "epoch": 2671} {"train_loss": -6.418424606323242, "global_step": 112211, "epoch": 2671} {"train_loss": -6.5055952072143555, "global_step": 112212, "epoch": 2671} {"train_loss": -6.466442584991455, "global_step": 112213, "epoch": 2671} {"train_loss": -6.468596458435059, "global_step": 112214, "epoch": 2671} {"train_loss": -6.328524589538574, "global_step": 112215, "epoch": 2671} {"train_loss": -6.496706962585449, "global_step": 112216, "epoch": 2671} {"train_loss": -6.421128273010254, "global_step": 112217, "epoch": 2671} {"train_loss": -6.543712615966797, "global_step": 112218, "epoch": 2671} {"train_loss": -6.5149407386779785, "global_step": 112219, "epoch": 2671} {"train_loss": -6.557459831237793, "global_step": 112220, "epoch": 2671} {"train_loss": -6.476250648498535, "global_step": 112221, "epoch": 2671} {"train_loss": -6.479077339172363, "global_step": 112222, "epoch": 2671} {"train_loss": -6.478662070773897, "global_step": 112223, "epoch": 2671, "val_loss": 76169.1171875} {"train_loss": -6.495939254760742, "global_step": 112224, "epoch": 2672} {"train_loss": -6.4863481521606445, "global_step": 112225, "epoch": 2672} {"train_loss": -6.387592315673828, "global_step": 112226, "epoch": 2672} {"train_loss": -6.536770820617676, "global_step": 112227, "epoch": 2672} {"train_loss": -6.493463516235352, "global_step": 112228, "epoch": 2672} {"train_loss": -6.468439102172852, "global_step": 112229, "epoch": 2672} {"train_loss": -6.456295967102051, "global_step": 112230, "epoch": 2672} {"train_loss": -6.520748138427734, "global_step": 112231, "epoch": 2672} {"train_loss": -6.550598621368408, "global_step": 112232, "epoch": 2672} {"train_loss": -6.437142848968506, "global_step": 112233, "epoch": 2672} {"train_loss": -6.457625865936279, "global_step": 112234, "epoch": 2672} {"train_loss": -6.431187629699707, "global_step": 112235, "epoch": 2672} {"train_loss": -6.495361804962158, "global_step": 112236, "epoch": 2672} {"train_loss": -6.486169815063477, "global_step": 112237, "epoch": 2672} {"train_loss": -6.435920715332031, "global_step": 112238, "epoch": 2672} {"train_loss": -6.467568397521973, "global_step": 112239, "epoch": 2672} {"train_loss": -6.4619903564453125, "global_step": 112240, "epoch": 2672} {"train_loss": -6.376055717468262, "global_step": 112241, "epoch": 2672} {"train_loss": -6.444817543029785, "global_step": 112242, "epoch": 2672} {"train_loss": -6.437966346740723, "global_step": 112243, "epoch": 2672} {"train_loss": -6.386935234069824, "global_step": 112244, "epoch": 2672} {"train_loss": -6.476961612701416, "global_step": 112245, "epoch": 2672} {"train_loss": -6.482576847076416, "global_step": 112246, "epoch": 2672} {"train_loss": -6.438155174255371, "global_step": 112247, "epoch": 2672} {"train_loss": -6.400612831115723, "global_step": 112248, "epoch": 2672} {"train_loss": -6.461380958557129, "global_step": 112249, "epoch": 2672} {"train_loss": -6.461494445800781, "global_step": 112250, "epoch": 2672} {"train_loss": -6.44048547744751, "global_step": 112251, "epoch": 2672} {"train_loss": -6.568272113800049, "global_step": 112252, "epoch": 2672} {"train_loss": -6.4153151512146, "global_step": 112253, "epoch": 2672} {"train_loss": -6.470579624176025, "global_step": 112254, "epoch": 2672} {"train_loss": -6.385122299194336, "global_step": 112255, "epoch": 2672} {"train_loss": -6.538395881652832, "global_step": 112256, "epoch": 2672} {"train_loss": -6.392871379852295, "global_step": 112257, "epoch": 2672} {"train_loss": -6.382238864898682, "global_step": 112258, "epoch": 2672} {"train_loss": -6.340540409088135, "global_step": 112259, "epoch": 2672} {"train_loss": -6.325321674346924, "global_step": 112260, "epoch": 2672} {"train_loss": -6.467963218688965, "global_step": 112261, "epoch": 2672} {"train_loss": -6.428421497344971, "global_step": 112262, "epoch": 2672} {"train_loss": -6.322269916534424, "global_step": 112263, "epoch": 2672} {"train_loss": -6.486027717590332, "global_step": 112264, "epoch": 2672} {"train_loss": -6.447551136925107, "global_step": 112265, "epoch": 2672, "val_loss": 76380.5546875} {"train_loss": -6.388470649719238, "global_step": 112266, "epoch": 2673} {"train_loss": -6.412628173828125, "global_step": 112267, "epoch": 2673} {"train_loss": -6.42172384262085, "global_step": 112268, "epoch": 2673} {"train_loss": -6.420289039611816, "global_step": 112269, "epoch": 2673} {"train_loss": -6.434422492980957, "global_step": 112270, "epoch": 2673} {"train_loss": -6.430154800415039, "global_step": 112271, "epoch": 2673} {"train_loss": -6.5322465896606445, "global_step": 112272, "epoch": 2673} {"train_loss": -6.446603775024414, "global_step": 112273, "epoch": 2673} {"train_loss": -6.447298049926758, "global_step": 112274, "epoch": 2673} {"train_loss": -6.483610153198242, "global_step": 112275, "epoch": 2673} {"train_loss": -6.358695983886719, "global_step": 112276, "epoch": 2673} {"train_loss": -6.434954643249512, "global_step": 112277, "epoch": 2673} {"train_loss": -6.478543758392334, "global_step": 112278, "epoch": 2673} {"train_loss": -6.430030345916748, "global_step": 112279, "epoch": 2673} {"train_loss": -6.479525089263916, "global_step": 112280, "epoch": 2673} {"train_loss": -6.413546562194824, "global_step": 112281, "epoch": 2673} {"train_loss": -6.455156326293945, "global_step": 112282, "epoch": 2673} {"train_loss": -6.501517295837402, "global_step": 112283, "epoch": 2673} {"train_loss": -6.420884132385254, "global_step": 112284, "epoch": 2673} {"train_loss": -6.5222883224487305, "global_step": 112285, "epoch": 2673} {"train_loss": -6.440765857696533, "global_step": 112286, "epoch": 2673} {"train_loss": -6.464141845703125, "global_step": 112287, "epoch": 2673} {"train_loss": -6.507926940917969, "global_step": 112288, "epoch": 2673} {"train_loss": -6.407824516296387, "global_step": 112289, "epoch": 2673} {"train_loss": -6.48445987701416, "global_step": 112290, "epoch": 2673} {"train_loss": -6.484821319580078, "global_step": 112291, "epoch": 2673} {"train_loss": -6.515212535858154, "global_step": 112292, "epoch": 2673} {"train_loss": -6.49220609664917, "global_step": 112293, "epoch": 2673} {"train_loss": -6.455206871032715, "global_step": 112294, "epoch": 2673} {"train_loss": -6.545007705688477, "global_step": 112295, "epoch": 2673} {"train_loss": -6.448094367980957, "global_step": 112296, "epoch": 2673} {"train_loss": -6.509817123413086, "global_step": 112297, "epoch": 2673} {"train_loss": -6.489040374755859, "global_step": 112298, "epoch": 2673} {"train_loss": -6.464641571044922, "global_step": 112299, "epoch": 2673} {"train_loss": -6.39571475982666, "global_step": 112300, "epoch": 2673} {"train_loss": -6.439940929412842, "global_step": 112301, "epoch": 2673} {"train_loss": -6.383944511413574, "global_step": 112302, "epoch": 2673} {"train_loss": -6.3911237716674805, "global_step": 112303, "epoch": 2673} {"train_loss": -6.356997013092041, "global_step": 112304, "epoch": 2673} {"train_loss": -6.662140846252441, "global_step": 112305, "epoch": 2673} {"train_loss": -6.545633316040039, "global_step": 112306, "epoch": 2673} {"train_loss": -6.459902150290353, "global_step": 112307, "epoch": 2673, "val_loss": 76378.6953125} {"train_loss": -6.662675857543945, "global_step": 112308, "epoch": 2674} {"train_loss": -6.437469482421875, "global_step": 112309, "epoch": 2674} {"train_loss": -6.624660968780518, "global_step": 112310, "epoch": 2674} {"train_loss": -6.497535705566406, "global_step": 112311, "epoch": 2674} {"train_loss": -6.507992267608643, "global_step": 112312, "epoch": 2674} {"train_loss": -6.600102424621582, "global_step": 112313, "epoch": 2674} {"train_loss": -6.534937858581543, "global_step": 112314, "epoch": 2674} {"train_loss": -6.574405670166016, "global_step": 112315, "epoch": 2674} {"train_loss": -6.514862537384033, "global_step": 112316, "epoch": 2674} {"train_loss": -6.459616661071777, "global_step": 112317, "epoch": 2674} {"train_loss": -6.5738396644592285, "global_step": 112318, "epoch": 2674} {"train_loss": -6.559446811676025, "global_step": 112319, "epoch": 2674} {"train_loss": -6.399106025695801, "global_step": 112320, "epoch": 2674} {"train_loss": -6.468812465667725, "global_step": 112321, "epoch": 2674} {"train_loss": -6.440295219421387, "global_step": 112322, "epoch": 2674} {"train_loss": -6.449502944946289, "global_step": 112323, "epoch": 2674} {"train_loss": -6.607205390930176, "global_step": 112324, "epoch": 2674} {"train_loss": -6.619576454162598, "global_step": 112325, "epoch": 2674} {"train_loss": -6.44795036315918, "global_step": 112326, "epoch": 2674} {"train_loss": -6.538738250732422, "global_step": 112327, "epoch": 2674} {"train_loss": -6.422369003295898, "global_step": 112328, "epoch": 2674} {"train_loss": -6.572278022766113, "global_step": 112329, "epoch": 2674} {"train_loss": -6.473001480102539, "global_step": 112330, "epoch": 2674} {"train_loss": -6.5661821365356445, "global_step": 112331, "epoch": 2674} {"train_loss": -6.620159149169922, "global_step": 112332, "epoch": 2674} {"train_loss": -6.6281046867370605, "global_step": 112333, "epoch": 2674} {"train_loss": -6.510412693023682, "global_step": 112334, "epoch": 2674} {"train_loss": -6.582421779632568, "global_step": 112335, "epoch": 2674} {"train_loss": -6.450055122375488, "global_step": 112336, "epoch": 2674} {"train_loss": -6.483417510986328, "global_step": 112337, "epoch": 2674} {"train_loss": -6.451206684112549, "global_step": 112338, "epoch": 2674} {"train_loss": -6.450807571411133, "global_step": 112339, "epoch": 2674} {"train_loss": -6.454719543457031, "global_step": 112340, "epoch": 2674} {"train_loss": -6.6262898445129395, "global_step": 112341, "epoch": 2674} {"train_loss": -6.370650291442871, "global_step": 112342, "epoch": 2674} {"train_loss": -6.54875373840332, "global_step": 112343, "epoch": 2674} {"train_loss": -6.4983625411987305, "global_step": 112344, "epoch": 2674} {"train_loss": -6.382826805114746, "global_step": 112345, "epoch": 2674} {"train_loss": -6.4778618812561035, "global_step": 112346, "epoch": 2674} {"train_loss": -6.358510971069336, "global_step": 112347, "epoch": 2674} {"train_loss": -6.48314094543457, "global_step": 112348, "epoch": 2674} {"train_loss": -6.509687264760335, "global_step": 112349, "epoch": 2674, "val_loss": 76445.625} {"train_loss": -6.486477375030518, "global_step": 112350, "epoch": 2675} {"train_loss": -6.508007526397705, "global_step": 112351, "epoch": 2675} {"train_loss": -6.5483174324035645, "global_step": 112352, "epoch": 2675} {"train_loss": -6.617565155029297, "global_step": 112353, "epoch": 2675} {"train_loss": -6.523331642150879, "global_step": 112354, "epoch": 2675} {"train_loss": -6.51941442489624, "global_step": 112355, "epoch": 2675} {"train_loss": -6.4720458984375, "global_step": 112356, "epoch": 2675} {"train_loss": -6.466658592224121, "global_step": 112357, "epoch": 2675} {"train_loss": -6.567336082458496, "global_step": 112358, "epoch": 2675} {"train_loss": -6.543489456176758, "global_step": 112359, "epoch": 2675} {"train_loss": -6.5125732421875, "global_step": 112360, "epoch": 2675} {"train_loss": -6.477723121643066, "global_step": 112361, "epoch": 2675} {"train_loss": -6.598609924316406, "global_step": 112362, "epoch": 2675} {"train_loss": -6.521244525909424, "global_step": 112363, "epoch": 2675} {"train_loss": -6.629192352294922, "global_step": 112364, "epoch": 2675} {"train_loss": -6.604186058044434, "global_step": 112365, "epoch": 2675} {"train_loss": -6.6078643798828125, "global_step": 112366, "epoch": 2675} {"train_loss": -6.471776962280273, "global_step": 112367, "epoch": 2675} {"train_loss": -6.3918538093566895, "global_step": 112368, "epoch": 2675} {"train_loss": -6.4286041259765625, "global_step": 112369, "epoch": 2675} {"train_loss": -6.41612434387207, "global_step": 112370, "epoch": 2675} {"train_loss": -6.554660797119141, "global_step": 112371, "epoch": 2675} {"train_loss": -6.5103960037231445, "global_step": 112372, "epoch": 2675} {"train_loss": -6.436720371246338, "global_step": 112373, "epoch": 2675} {"train_loss": -6.517078399658203, "global_step": 112374, "epoch": 2675} {"train_loss": -6.40521240234375, "global_step": 112375, "epoch": 2675} {"train_loss": -6.592886924743652, "global_step": 112376, "epoch": 2675} {"train_loss": -6.397393226623535, "global_step": 112377, "epoch": 2675} {"train_loss": -6.352190971374512, "global_step": 112378, "epoch": 2675} {"train_loss": -6.332721710205078, "global_step": 112379, "epoch": 2675} {"train_loss": -6.5797119140625, "global_step": 112380, "epoch": 2675} {"train_loss": -6.395941734313965, "global_step": 112381, "epoch": 2675} {"train_loss": -6.511505126953125, "global_step": 112382, "epoch": 2675} {"train_loss": -6.487944602966309, "global_step": 112383, "epoch": 2675} {"train_loss": -6.470912456512451, "global_step": 112384, "epoch": 2675} {"train_loss": -6.525700092315674, "global_step": 112385, "epoch": 2675} {"train_loss": -6.564459800720215, "global_step": 112386, "epoch": 2675} {"train_loss": -6.519870758056641, "global_step": 112387, "epoch": 2675} {"train_loss": -6.51090145111084, "global_step": 112388, "epoch": 2675} {"train_loss": -6.608288764953613, "global_step": 112389, "epoch": 2675} {"train_loss": -6.479775905609131, "global_step": 112390, "epoch": 2675} {"train_loss": -6.5070729823339555, "global_step": 112391, "epoch": 2675, "val_loss": 76363.515625} {"train_loss": -6.489570140838623, "global_step": 112392, "epoch": 2676} {"train_loss": -6.468514442443848, "global_step": 112393, "epoch": 2676} {"train_loss": -6.4226274490356445, "global_step": 112394, "epoch": 2676} {"train_loss": -6.511448383331299, "global_step": 112395, "epoch": 2676} {"train_loss": -6.457826614379883, "global_step": 112396, "epoch": 2676} {"train_loss": -6.5669965744018555, "global_step": 112397, "epoch": 2676} {"train_loss": -6.49940824508667, "global_step": 112398, "epoch": 2676} {"train_loss": -6.578575134277344, "global_step": 112399, "epoch": 2676} {"train_loss": -6.520373344421387, "global_step": 112400, "epoch": 2676} {"train_loss": -6.483206748962402, "global_step": 112401, "epoch": 2676} {"train_loss": -6.426381587982178, "global_step": 112402, "epoch": 2676} {"train_loss": -6.518205642700195, "global_step": 112403, "epoch": 2676} {"train_loss": -6.6337056159973145, "global_step": 112404, "epoch": 2676} {"train_loss": -6.585331916809082, "global_step": 112405, "epoch": 2676} {"train_loss": -6.475493907928467, "global_step": 112406, "epoch": 2676} {"train_loss": -6.361128330230713, "global_step": 112407, "epoch": 2676} {"train_loss": -6.4902873039245605, "global_step": 112408, "epoch": 2676} {"train_loss": -6.4328999519348145, "global_step": 112409, "epoch": 2676} {"train_loss": -6.540638446807861, "global_step": 112410, "epoch": 2676} {"train_loss": -6.4364423751831055, "global_step": 112411, "epoch": 2676} {"train_loss": -6.653916358947754, "global_step": 112412, "epoch": 2676} {"train_loss": -6.531059265136719, "global_step": 112413, "epoch": 2676} {"train_loss": -6.488994121551514, "global_step": 112414, "epoch": 2676} {"train_loss": -6.482563495635986, "global_step": 112415, "epoch": 2676} {"train_loss": -6.609617233276367, "global_step": 112416, "epoch": 2676} {"train_loss": -6.520665168762207, "global_step": 112417, "epoch": 2676} {"train_loss": -6.432055473327637, "global_step": 112418, "epoch": 2676} {"train_loss": -6.531639099121094, "global_step": 112419, "epoch": 2676} {"train_loss": -6.493340492248535, "global_step": 112420, "epoch": 2676} {"train_loss": -6.540042877197266, "global_step": 112421, "epoch": 2676} {"train_loss": -6.489253997802734, "global_step": 112422, "epoch": 2676} {"train_loss": -6.473766326904297, "global_step": 112423, "epoch": 2676} {"train_loss": -6.525610446929932, "global_step": 112424, "epoch": 2676} {"train_loss": -6.5357561111450195, "global_step": 112425, "epoch": 2676} {"train_loss": -6.576560974121094, "global_step": 112426, "epoch": 2676} {"train_loss": -6.485733509063721, "global_step": 112427, "epoch": 2676} {"train_loss": -6.529400825500488, "global_step": 112428, "epoch": 2676} {"train_loss": -6.4058380126953125, "global_step": 112429, "epoch": 2676} {"train_loss": -6.5022077560424805, "global_step": 112430, "epoch": 2676} {"train_loss": -6.3128862380981445, "global_step": 112431, "epoch": 2676} {"train_loss": -6.423286437988281, "global_step": 112432, "epoch": 2676} {"train_loss": -6.49586372148423, "global_step": 112433, "epoch": 2676, "val_loss": 76668.09375} {"train_loss": -6.4117326736450195, "global_step": 112434, "epoch": 2677} {"train_loss": -6.39929723739624, "global_step": 112435, "epoch": 2677} {"train_loss": -6.442383766174316, "global_step": 112436, "epoch": 2677} {"train_loss": -6.501176834106445, "global_step": 112437, "epoch": 2677} {"train_loss": -6.45953893661499, "global_step": 112438, "epoch": 2677} {"train_loss": -6.498069763183594, "global_step": 112439, "epoch": 2677} {"train_loss": -6.545654296875, "global_step": 112440, "epoch": 2677} {"train_loss": -6.569057941436768, "global_step": 112441, "epoch": 2677} {"train_loss": -6.515108108520508, "global_step": 112442, "epoch": 2677} {"train_loss": -6.592686653137207, "global_step": 112443, "epoch": 2677} {"train_loss": -6.490217208862305, "global_step": 112444, "epoch": 2677} {"train_loss": -6.66447639465332, "global_step": 112445, "epoch": 2677} {"train_loss": -6.470483779907227, "global_step": 112446, "epoch": 2677} {"train_loss": -6.568532466888428, "global_step": 112447, "epoch": 2677} {"train_loss": -6.475886344909668, "global_step": 112448, "epoch": 2677} {"train_loss": -6.440473556518555, "global_step": 112449, "epoch": 2677} {"train_loss": -6.424062728881836, "global_step": 112450, "epoch": 2677} {"train_loss": -6.38614559173584, "global_step": 112451, "epoch": 2677} {"train_loss": -6.529120922088623, "global_step": 112452, "epoch": 2677} {"train_loss": -6.395510196685791, "global_step": 112453, "epoch": 2677} {"train_loss": -6.417947769165039, "global_step": 112454, "epoch": 2677} {"train_loss": -6.522191047668457, "global_step": 112455, "epoch": 2677} {"train_loss": -6.509955406188965, "global_step": 112456, "epoch": 2677} {"train_loss": -6.577230453491211, "global_step": 112457, "epoch": 2677} {"train_loss": -6.489197254180908, "global_step": 112458, "epoch": 2677} {"train_loss": -6.369610786437988, "global_step": 112459, "epoch": 2677} {"train_loss": -6.4590559005737305, "global_step": 112460, "epoch": 2677} {"train_loss": -6.616684913635254, "global_step": 112461, "epoch": 2677} {"train_loss": -6.511127948760986, "global_step": 112462, "epoch": 2677} {"train_loss": -6.531861305236816, "global_step": 112463, "epoch": 2677} {"train_loss": -6.495044708251953, "global_step": 112464, "epoch": 2677} {"train_loss": -6.461513519287109, "global_step": 112465, "epoch": 2677} {"train_loss": -6.4313836097717285, "global_step": 112466, "epoch": 2677} {"train_loss": -6.423922538757324, "global_step": 112467, "epoch": 2677} {"train_loss": -6.518552780151367, "global_step": 112468, "epoch": 2677} {"train_loss": -6.249880313873291, "global_step": 112469, "epoch": 2677} {"train_loss": -6.408740997314453, "global_step": 112470, "epoch": 2677} {"train_loss": -6.386166572570801, "global_step": 112471, "epoch": 2677} {"train_loss": -6.4408345222473145, "global_step": 112472, "epoch": 2677} {"train_loss": -6.434532165527344, "global_step": 112473, "epoch": 2677} {"train_loss": -6.316473960876465, "global_step": 112474, "epoch": 2677} {"train_loss": -6.468446425029209, "global_step": 112475, "epoch": 2677, "val_loss": 76149.375} {"train_loss": -6.426864147186279, "global_step": 112476, "epoch": 2678} {"train_loss": -6.38515567779541, "global_step": 112477, "epoch": 2678} {"train_loss": -6.411215782165527, "global_step": 112478, "epoch": 2678} {"train_loss": -6.436013221740723, "global_step": 112479, "epoch": 2678} {"train_loss": -6.422226428985596, "global_step": 112480, "epoch": 2678} {"train_loss": -6.450509548187256, "global_step": 112481, "epoch": 2678} {"train_loss": -6.40769100189209, "global_step": 112482, "epoch": 2678} {"train_loss": -6.570589065551758, "global_step": 112483, "epoch": 2678} {"train_loss": -6.342043399810791, "global_step": 112484, "epoch": 2678} {"train_loss": -6.480759620666504, "global_step": 112485, "epoch": 2678} {"train_loss": -6.501047611236572, "global_step": 112486, "epoch": 2678} {"train_loss": -6.452836513519287, "global_step": 112487, "epoch": 2678} {"train_loss": -6.452877998352051, "global_step": 112488, "epoch": 2678} {"train_loss": -6.439870357513428, "global_step": 112489, "epoch": 2678} {"train_loss": -6.447253227233887, "global_step": 112490, "epoch": 2678} {"train_loss": -6.504495143890381, "global_step": 112491, "epoch": 2678} {"train_loss": -6.368990421295166, "global_step": 112492, "epoch": 2678} {"train_loss": -6.389979362487793, "global_step": 112493, "epoch": 2678} {"train_loss": -6.499402046203613, "global_step": 112494, "epoch": 2678} {"train_loss": -6.533547878265381, "global_step": 112495, "epoch": 2678} {"train_loss": -6.516648292541504, "global_step": 112496, "epoch": 2678} {"train_loss": -6.516566276550293, "global_step": 112497, "epoch": 2678} {"train_loss": -6.424746990203857, "global_step": 112498, "epoch": 2678} {"train_loss": -6.609426498413086, "global_step": 112499, "epoch": 2678} {"train_loss": -6.578563213348389, "global_step": 112500, "epoch": 2678} {"train_loss": -6.487713813781738, "global_step": 112501, "epoch": 2678} {"train_loss": -6.558337211608887, "global_step": 112502, "epoch": 2678} {"train_loss": -6.537975311279297, "global_step": 112503, "epoch": 2678} {"train_loss": -6.588684558868408, "global_step": 112504, "epoch": 2678} {"train_loss": -6.4921064376831055, "global_step": 112505, "epoch": 2678} {"train_loss": -6.5256547927856445, "global_step": 112506, "epoch": 2678} {"train_loss": -6.527091026306152, "global_step": 112507, "epoch": 2678} {"train_loss": -6.421041488647461, "global_step": 112508, "epoch": 2678} {"train_loss": -6.484724998474121, "global_step": 112509, "epoch": 2678} {"train_loss": -6.4732184410095215, "global_step": 112510, "epoch": 2678} {"train_loss": -6.495858192443848, "global_step": 112511, "epoch": 2678} {"train_loss": -6.59619665145874, "global_step": 112512, "epoch": 2678} {"train_loss": -6.384458541870117, "global_step": 112513, "epoch": 2678} {"train_loss": -6.571040630340576, "global_step": 112514, "epoch": 2678} {"train_loss": -6.568089962005615, "global_step": 112515, "epoch": 2678} {"train_loss": -6.547369003295898, "global_step": 112516, "epoch": 2678} {"train_loss": -6.484047094980876, "global_step": 112517, "epoch": 2678, "val_loss": 76430.2578125} {"train_loss": -6.4341959953308105, "global_step": 112518, "epoch": 2679} {"train_loss": -6.448485374450684, "global_step": 112519, "epoch": 2679} {"train_loss": -6.514564514160156, "global_step": 112520, "epoch": 2679} {"train_loss": -6.479258060455322, "global_step": 112521, "epoch": 2679} {"train_loss": -6.5144572257995605, "global_step": 112522, "epoch": 2679} {"train_loss": -6.50715446472168, "global_step": 112523, "epoch": 2679} {"train_loss": -6.412250995635986, "global_step": 112524, "epoch": 2679} {"train_loss": -6.557945251464844, "global_step": 112525, "epoch": 2679} {"train_loss": -6.493237495422363, "global_step": 112526, "epoch": 2679} {"train_loss": -6.305647850036621, "global_step": 112527, "epoch": 2679} {"train_loss": -6.48689079284668, "global_step": 112528, "epoch": 2679} {"train_loss": -6.414004325866699, "global_step": 112529, "epoch": 2679} {"train_loss": -6.470463275909424, "global_step": 112530, "epoch": 2679} {"train_loss": -6.521954536437988, "global_step": 112531, "epoch": 2679} {"train_loss": -6.358292102813721, "global_step": 112532, "epoch": 2679} {"train_loss": -6.405858516693115, "global_step": 112533, "epoch": 2679} {"train_loss": -6.4232378005981445, "global_step": 112534, "epoch": 2679} {"train_loss": -6.5104241371154785, "global_step": 112535, "epoch": 2679} {"train_loss": -6.430906772613525, "global_step": 112536, "epoch": 2679} {"train_loss": -6.303194999694824, "global_step": 112537, "epoch": 2679} {"train_loss": -6.410159111022949, "global_step": 112538, "epoch": 2679} {"train_loss": -6.389008045196533, "global_step": 112539, "epoch": 2679} {"train_loss": -6.418485641479492, "global_step": 112540, "epoch": 2679} {"train_loss": -6.332505226135254, "global_step": 112541, "epoch": 2679} {"train_loss": -6.391564846038818, "global_step": 112542, "epoch": 2679} {"train_loss": -6.455498218536377, "global_step": 112543, "epoch": 2679} {"train_loss": -6.472015857696533, "global_step": 112544, "epoch": 2679} {"train_loss": -6.346027374267578, "global_step": 112545, "epoch": 2679} {"train_loss": -6.363649368286133, "global_step": 112546, "epoch": 2679} {"train_loss": -6.541964530944824, "global_step": 112547, "epoch": 2679} {"train_loss": -6.434311866760254, "global_step": 112548, "epoch": 2679} {"train_loss": -6.593788146972656, "global_step": 112549, "epoch": 2679} {"train_loss": -6.36464262008667, "global_step": 112550, "epoch": 2679} {"train_loss": -6.403851509094238, "global_step": 112551, "epoch": 2679} {"train_loss": -6.411301612854004, "global_step": 112552, "epoch": 2679} {"train_loss": -6.517266273498535, "global_step": 112553, "epoch": 2679} {"train_loss": -6.368209362030029, "global_step": 112554, "epoch": 2679} {"train_loss": -6.411914825439453, "global_step": 112555, "epoch": 2679} {"train_loss": -6.326435565948486, "global_step": 112556, "epoch": 2679} {"train_loss": -6.359742641448975, "global_step": 112557, "epoch": 2679} {"train_loss": -6.501883506774902, "global_step": 112558, "epoch": 2679} {"train_loss": -6.435245638801938, "global_step": 112559, "epoch": 2679, "val_loss": 76645.5390625} {"train_loss": -6.441557884216309, "global_step": 112560, "epoch": 2680} {"train_loss": -6.510822772979736, "global_step": 112561, "epoch": 2680} {"train_loss": -6.495265483856201, "global_step": 112562, "epoch": 2680} {"train_loss": -6.455116271972656, "global_step": 112563, "epoch": 2680} {"train_loss": -6.497422218322754, "global_step": 112564, "epoch": 2680} {"train_loss": -6.4339447021484375, "global_step": 112565, "epoch": 2680} {"train_loss": -6.472746849060059, "global_step": 112566, "epoch": 2680} {"train_loss": -6.451399803161621, "global_step": 112567, "epoch": 2680} {"train_loss": -6.479298114776611, "global_step": 112568, "epoch": 2680} {"train_loss": -6.50742769241333, "global_step": 112569, "epoch": 2680} {"train_loss": -6.504039287567139, "global_step": 112570, "epoch": 2680} {"train_loss": -6.366037368774414, "global_step": 112571, "epoch": 2680} {"train_loss": -6.440918922424316, "global_step": 112572, "epoch": 2680} {"train_loss": -6.395620346069336, "global_step": 112573, "epoch": 2680} {"train_loss": -6.4638285636901855, "global_step": 112574, "epoch": 2680} {"train_loss": -6.415866851806641, "global_step": 112575, "epoch": 2680} {"train_loss": -6.375300407409668, "global_step": 112576, "epoch": 2680} {"train_loss": -6.485583305358887, "global_step": 112577, "epoch": 2680} {"train_loss": -6.472261428833008, "global_step": 112578, "epoch": 2680} {"train_loss": -6.482090473175049, "global_step": 112579, "epoch": 2680} {"train_loss": -6.515754699707031, "global_step": 112580, "epoch": 2680} {"train_loss": -6.472467422485352, "global_step": 112581, "epoch": 2680} {"train_loss": -6.369833469390869, "global_step": 112582, "epoch": 2680} {"train_loss": -6.542576789855957, "global_step": 112583, "epoch": 2680} {"train_loss": -6.418469429016113, "global_step": 112584, "epoch": 2680} {"train_loss": -6.637707233428955, "global_step": 112585, "epoch": 2680} {"train_loss": -6.521687984466553, "global_step": 112586, "epoch": 2680} {"train_loss": -6.423150062561035, "global_step": 112587, "epoch": 2680} {"train_loss": -6.501737117767334, "global_step": 112588, "epoch": 2680} {"train_loss": -6.364887237548828, "global_step": 112589, "epoch": 2680} {"train_loss": -6.378530502319336, "global_step": 112590, "epoch": 2680} {"train_loss": -6.425653457641602, "global_step": 112591, "epoch": 2680} {"train_loss": -6.565528392791748, "global_step": 112592, "epoch": 2680} {"train_loss": -6.413846492767334, "global_step": 112593, "epoch": 2680} {"train_loss": -6.55069637298584, "global_step": 112594, "epoch": 2680} {"train_loss": -6.55709171295166, "global_step": 112595, "epoch": 2680} {"train_loss": -6.47498893737793, "global_step": 112596, "epoch": 2680} {"train_loss": -6.481691360473633, "global_step": 112597, "epoch": 2680} {"train_loss": -6.506805896759033, "global_step": 112598, "epoch": 2680} {"train_loss": -6.548513889312744, "global_step": 112599, "epoch": 2680} {"train_loss": -6.546283721923828, "global_step": 112600, "epoch": 2680} {"train_loss": -6.473771515346709, "global_step": 112601, "epoch": 2680, "val_loss": 76504.8203125} {"train_loss": -6.481263160705566, "global_step": 112602, "epoch": 2681} {"train_loss": -6.351309776306152, "global_step": 112603, "epoch": 2681} {"train_loss": -6.4248809814453125, "global_step": 112604, "epoch": 2681} {"train_loss": -6.400210857391357, "global_step": 112605, "epoch": 2681} {"train_loss": -6.589583396911621, "global_step": 112606, "epoch": 2681} {"train_loss": -6.441931247711182, "global_step": 112607, "epoch": 2681} {"train_loss": -6.5090742111206055, "global_step": 112608, "epoch": 2681} {"train_loss": -6.421139240264893, "global_step": 112609, "epoch": 2681} {"train_loss": -6.428070545196533, "global_step": 112610, "epoch": 2681} {"train_loss": -6.457201957702637, "global_step": 112611, "epoch": 2681} {"train_loss": -6.5559892654418945, "global_step": 112612, "epoch": 2681} {"train_loss": -6.445590972900391, "global_step": 112613, "epoch": 2681} {"train_loss": -6.541495323181152, "global_step": 112614, "epoch": 2681} {"train_loss": -6.408659934997559, "global_step": 112615, "epoch": 2681} {"train_loss": -6.38341760635376, "global_step": 112616, "epoch": 2681} {"train_loss": -6.560982704162598, "global_step": 112617, "epoch": 2681} {"train_loss": -6.538491249084473, "global_step": 112618, "epoch": 2681} {"train_loss": -6.461883068084717, "global_step": 112619, "epoch": 2681} {"train_loss": -6.438465118408203, "global_step": 112620, "epoch": 2681} {"train_loss": -6.614031791687012, "global_step": 112621, "epoch": 2681} {"train_loss": -6.525141716003418, "global_step": 112622, "epoch": 2681} {"train_loss": -6.501816749572754, "global_step": 112623, "epoch": 2681} {"train_loss": -6.535774230957031, "global_step": 112624, "epoch": 2681} {"train_loss": -6.567636966705322, "global_step": 112625, "epoch": 2681} {"train_loss": -6.567008972167969, "global_step": 112626, "epoch": 2681} {"train_loss": -6.511081218719482, "global_step": 112627, "epoch": 2681} {"train_loss": -6.5547356605529785, "global_step": 112628, "epoch": 2681} {"train_loss": -6.468136787414551, "global_step": 112629, "epoch": 2681} {"train_loss": -6.489134311676025, "global_step": 112630, "epoch": 2681} {"train_loss": -6.551198482513428, "global_step": 112631, "epoch": 2681} {"train_loss": -6.489694595336914, "global_step": 112632, "epoch": 2681} {"train_loss": -6.368531703948975, "global_step": 112633, "epoch": 2681} {"train_loss": -6.54746150970459, "global_step": 112634, "epoch": 2681} {"train_loss": -6.494815826416016, "global_step": 112635, "epoch": 2681} {"train_loss": -6.509352207183838, "global_step": 112636, "epoch": 2681} {"train_loss": -6.467487335205078, "global_step": 112637, "epoch": 2681} {"train_loss": -6.520658016204834, "global_step": 112638, "epoch": 2681} {"train_loss": -6.5663743019104, "global_step": 112639, "epoch": 2681} {"train_loss": -6.5453200340271, "global_step": 112640, "epoch": 2681} {"train_loss": -6.486877918243408, "global_step": 112641, "epoch": 2681} {"train_loss": -6.565217018127441, "global_step": 112642, "epoch": 2681} {"train_loss": -6.493627025967553, "global_step": 112643, "epoch": 2681, "val_loss": 76317.53125} {"train_loss": -6.4562458992004395, "global_step": 112644, "epoch": 2682} {"train_loss": -6.599105358123779, "global_step": 112645, "epoch": 2682} {"train_loss": -6.469712257385254, "global_step": 112646, "epoch": 2682} {"train_loss": -6.436330795288086, "global_step": 112647, "epoch": 2682} {"train_loss": -6.472532749176025, "global_step": 112648, "epoch": 2682} {"train_loss": -6.457765579223633, "global_step": 112649, "epoch": 2682} {"train_loss": -6.453698635101318, "global_step": 112650, "epoch": 2682} {"train_loss": -6.463062286376953, "global_step": 112651, "epoch": 2682} {"train_loss": -6.42069149017334, "global_step": 112652, "epoch": 2682} {"train_loss": -6.471372604370117, "global_step": 112653, "epoch": 2682} {"train_loss": -6.470121383666992, "global_step": 112654, "epoch": 2682} {"train_loss": -6.545212745666504, "global_step": 112655, "epoch": 2682} {"train_loss": -6.396173477172852, "global_step": 112656, "epoch": 2682} {"train_loss": -6.523609161376953, "global_step": 112657, "epoch": 2682} {"train_loss": -6.4852800369262695, "global_step": 112658, "epoch": 2682} {"train_loss": -6.482033729553223, "global_step": 112659, "epoch": 2682} {"train_loss": -6.4862565994262695, "global_step": 112660, "epoch": 2682} {"train_loss": -6.535577774047852, "global_step": 112661, "epoch": 2682} {"train_loss": -6.508245944976807, "global_step": 112662, "epoch": 2682} {"train_loss": -6.514334678649902, "global_step": 112663, "epoch": 2682} {"train_loss": -6.461796283721924, "global_step": 112664, "epoch": 2682} {"train_loss": -6.554986953735352, "global_step": 112665, "epoch": 2682} {"train_loss": -6.55134391784668, "global_step": 112666, "epoch": 2682} {"train_loss": -6.481131553649902, "global_step": 112667, "epoch": 2682} {"train_loss": -6.46544075012207, "global_step": 112668, "epoch": 2682} {"train_loss": -6.482799530029297, "global_step": 112669, "epoch": 2682} {"train_loss": -6.484767913818359, "global_step": 112670, "epoch": 2682} {"train_loss": -6.494748115539551, "global_step": 112671, "epoch": 2682} {"train_loss": -6.507447242736816, "global_step": 112672, "epoch": 2682} {"train_loss": -6.488395690917969, "global_step": 112673, "epoch": 2682} {"train_loss": -6.46600341796875, "global_step": 112674, "epoch": 2682} {"train_loss": -6.46562385559082, "global_step": 112675, "epoch": 2682} {"train_loss": -6.54827880859375, "global_step": 112676, "epoch": 2682} {"train_loss": -6.572660446166992, "global_step": 112677, "epoch": 2682} {"train_loss": -6.5758137702941895, "global_step": 112678, "epoch": 2682} {"train_loss": -6.54183292388916, "global_step": 112679, "epoch": 2682} {"train_loss": -6.546537399291992, "global_step": 112680, "epoch": 2682} {"train_loss": -6.57440185546875, "global_step": 112681, "epoch": 2682} {"train_loss": -6.640373706817627, "global_step": 112682, "epoch": 2682} {"train_loss": -6.5703935623168945, "global_step": 112683, "epoch": 2682} {"train_loss": -6.607511520385742, "global_step": 112684, "epoch": 2682} {"train_loss": -6.506084476198469, "global_step": 112685, "epoch": 2682, "val_loss": 76614.859375} {"train_loss": -6.320878982543945, "global_step": 112686, "epoch": 2683} {"train_loss": -6.510112762451172, "global_step": 112687, "epoch": 2683} {"train_loss": -6.2730560302734375, "global_step": 112688, "epoch": 2683} {"train_loss": -6.3964104652404785, "global_step": 112689, "epoch": 2683} {"train_loss": -6.511111259460449, "global_step": 112690, "epoch": 2683} {"train_loss": -6.524460315704346, "global_step": 112691, "epoch": 2683} {"train_loss": -6.517314910888672, "global_step": 112692, "epoch": 2683} {"train_loss": -6.505669593811035, "global_step": 112693, "epoch": 2683} {"train_loss": -6.3678693771362305, "global_step": 112694, "epoch": 2683} {"train_loss": -6.5092315673828125, "global_step": 112695, "epoch": 2683} {"train_loss": -6.442024230957031, "global_step": 112696, "epoch": 2683} {"train_loss": -6.520139217376709, "global_step": 112697, "epoch": 2683} {"train_loss": -6.507359504699707, "global_step": 112698, "epoch": 2683} {"train_loss": -6.579181671142578, "global_step": 112699, "epoch": 2683} {"train_loss": -6.401525497436523, "global_step": 112700, "epoch": 2683} {"train_loss": -6.489986896514893, "global_step": 112701, "epoch": 2683} {"train_loss": -6.6493611335754395, "global_step": 112702, "epoch": 2683} {"train_loss": -6.569636344909668, "global_step": 112703, "epoch": 2683} {"train_loss": -6.529157638549805, "global_step": 112704, "epoch": 2683} {"train_loss": -6.550994396209717, "global_step": 112705, "epoch": 2683} {"train_loss": -6.4561991691589355, "global_step": 112706, "epoch": 2683} {"train_loss": -6.4938645362854, "global_step": 112707, "epoch": 2683} {"train_loss": -6.539493560791016, "global_step": 112708, "epoch": 2683} {"train_loss": -6.546259880065918, "global_step": 112709, "epoch": 2683} {"train_loss": -6.407484531402588, "global_step": 112710, "epoch": 2683} {"train_loss": -6.5499091148376465, "global_step": 112711, "epoch": 2683} {"train_loss": -6.56104850769043, "global_step": 112712, "epoch": 2683} {"train_loss": -6.433060646057129, "global_step": 112713, "epoch": 2683} {"train_loss": -6.594844341278076, "global_step": 112714, "epoch": 2683} {"train_loss": -6.520019054412842, "global_step": 112715, "epoch": 2683} {"train_loss": -6.593453407287598, "global_step": 112716, "epoch": 2683} {"train_loss": -6.541354179382324, "global_step": 112717, "epoch": 2683} {"train_loss": -6.392998695373535, "global_step": 112718, "epoch": 2683} {"train_loss": -6.515732288360596, "global_step": 112719, "epoch": 2683} {"train_loss": -6.471259117126465, "global_step": 112720, "epoch": 2683} {"train_loss": -6.491634368896484, "global_step": 112721, "epoch": 2683} {"train_loss": -6.459461212158203, "global_step": 112722, "epoch": 2683} {"train_loss": -6.498387336730957, "global_step": 112723, "epoch": 2683} {"train_loss": -6.560688495635986, "global_step": 112724, "epoch": 2683} {"train_loss": -6.501726150512695, "global_step": 112725, "epoch": 2683} {"train_loss": -6.636091232299805, "global_step": 112726, "epoch": 2683} {"train_loss": -6.494129566919236, "global_step": 112727, "epoch": 2683, "val_loss": 76457.1875} {"train_loss": -6.469819068908691, "global_step": 112728, "epoch": 2684} {"train_loss": -6.482709884643555, "global_step": 112729, "epoch": 2684} {"train_loss": -6.496028423309326, "global_step": 112730, "epoch": 2684} {"train_loss": -6.419527053833008, "global_step": 112731, "epoch": 2684} {"train_loss": -6.504080772399902, "global_step": 112732, "epoch": 2684} {"train_loss": -6.452397346496582, "global_step": 112733, "epoch": 2684} {"train_loss": -6.486501693725586, "global_step": 112734, "epoch": 2684} {"train_loss": -6.437267780303955, "global_step": 112735, "epoch": 2684} {"train_loss": -6.386894702911377, "global_step": 112736, "epoch": 2684} {"train_loss": -6.428159713745117, "global_step": 112737, "epoch": 2684} {"train_loss": -6.460371017456055, "global_step": 112738, "epoch": 2684} {"train_loss": -6.562341690063477, "global_step": 112739, "epoch": 2684} {"train_loss": -6.454835891723633, "global_step": 112740, "epoch": 2684} {"train_loss": -6.474178314208984, "global_step": 112741, "epoch": 2684} {"train_loss": -6.54680871963501, "global_step": 112742, "epoch": 2684} {"train_loss": -6.52358341217041, "global_step": 112743, "epoch": 2684} {"train_loss": -6.504681587219238, "global_step": 112744, "epoch": 2684} {"train_loss": -6.534353256225586, "global_step": 112745, "epoch": 2684} {"train_loss": -6.450223922729492, "global_step": 112746, "epoch": 2684} {"train_loss": -6.481052875518799, "global_step": 112747, "epoch": 2684} {"train_loss": -6.4856719970703125, "global_step": 112748, "epoch": 2684} {"train_loss": -6.555190086364746, "global_step": 112749, "epoch": 2684} {"train_loss": -6.546489238739014, "global_step": 112750, "epoch": 2684} {"train_loss": -6.452113628387451, "global_step": 112751, "epoch": 2684} {"train_loss": -6.4955153465271, "global_step": 112752, "epoch": 2684} {"train_loss": -6.480927467346191, "global_step": 112753, "epoch": 2684} {"train_loss": -6.349555015563965, "global_step": 112754, "epoch": 2684} {"train_loss": -6.567488670349121, "global_step": 112755, "epoch": 2684} {"train_loss": -6.5151777267456055, "global_step": 112756, "epoch": 2684} {"train_loss": -6.475400924682617, "global_step": 112757, "epoch": 2684} {"train_loss": -6.473257064819336, "global_step": 112758, "epoch": 2684} {"train_loss": -6.411081790924072, "global_step": 112759, "epoch": 2684} {"train_loss": -6.504242897033691, "global_step": 112760, "epoch": 2684} {"train_loss": -6.550833702087402, "global_step": 112761, "epoch": 2684} {"train_loss": -6.524141311645508, "global_step": 112762, "epoch": 2684} {"train_loss": -6.5167107582092285, "global_step": 112763, "epoch": 2684} {"train_loss": -6.597299575805664, "global_step": 112764, "epoch": 2684} {"train_loss": -6.360442161560059, "global_step": 112765, "epoch": 2684} {"train_loss": -6.490462303161621, "global_step": 112766, "epoch": 2684} {"train_loss": -6.455697059631348, "global_step": 112767, "epoch": 2684} {"train_loss": -6.402929306030273, "global_step": 112768, "epoch": 2684} {"train_loss": -6.482158002399263, "global_step": 112769, "epoch": 2684, "val_loss": 76680.9140625} {"train_loss": -6.395672798156738, "global_step": 112770, "epoch": 2685} {"train_loss": -6.5424652099609375, "global_step": 112771, "epoch": 2685} {"train_loss": -6.526320457458496, "global_step": 112772, "epoch": 2685} {"train_loss": -6.625020980834961, "global_step": 112773, "epoch": 2685} {"train_loss": -6.370736122131348, "global_step": 112774, "epoch": 2685} {"train_loss": -6.501367568969727, "global_step": 112775, "epoch": 2685} {"train_loss": -6.383270263671875, "global_step": 112776, "epoch": 2685} {"train_loss": -6.540124893188477, "global_step": 112777, "epoch": 2685} {"train_loss": -6.450583457946777, "global_step": 112778, "epoch": 2685} {"train_loss": -6.545853614807129, "global_step": 112779, "epoch": 2685} {"train_loss": -6.477415084838867, "global_step": 112780, "epoch": 2685} {"train_loss": -6.339903354644775, "global_step": 112781, "epoch": 2685} {"train_loss": -6.594533443450928, "global_step": 112782, "epoch": 2685} {"train_loss": -6.4369635581970215, "global_step": 112783, "epoch": 2685} {"train_loss": -6.472266674041748, "global_step": 112784, "epoch": 2685} {"train_loss": -6.398322105407715, "global_step": 112785, "epoch": 2685} {"train_loss": -6.392237663269043, "global_step": 112786, "epoch": 2685} {"train_loss": -6.416717529296875, "global_step": 112787, "epoch": 2685} {"train_loss": -6.5808796882629395, "global_step": 112788, "epoch": 2685} {"train_loss": -6.481033802032471, "global_step": 112789, "epoch": 2685} {"train_loss": -6.492500305175781, "global_step": 112790, "epoch": 2685} {"train_loss": -6.4321675300598145, "global_step": 112791, "epoch": 2685} {"train_loss": -6.572813510894775, "global_step": 112792, "epoch": 2685} {"train_loss": -6.397121429443359, "global_step": 112793, "epoch": 2685} {"train_loss": -6.508723258972168, "global_step": 112794, "epoch": 2685} {"train_loss": -6.416589260101318, "global_step": 112795, "epoch": 2685} {"train_loss": -6.535763263702393, "global_step": 112796, "epoch": 2685} {"train_loss": -6.428778171539307, "global_step": 112797, "epoch": 2685} {"train_loss": -6.524413108825684, "global_step": 112798, "epoch": 2685} {"train_loss": -6.515124320983887, "global_step": 112799, "epoch": 2685} {"train_loss": -6.572704315185547, "global_step": 112800, "epoch": 2685} {"train_loss": -6.365943908691406, "global_step": 112801, "epoch": 2685} {"train_loss": -6.497929573059082, "global_step": 112802, "epoch": 2685} {"train_loss": -6.360179901123047, "global_step": 112803, "epoch": 2685} {"train_loss": -6.3323774337768555, "global_step": 112804, "epoch": 2685} {"train_loss": -6.491741180419922, "global_step": 112805, "epoch": 2685} {"train_loss": -6.4596028327941895, "global_step": 112806, "epoch": 2685} {"train_loss": -6.453412055969238, "global_step": 112807, "epoch": 2685} {"train_loss": -6.429282188415527, "global_step": 112808, "epoch": 2685} {"train_loss": -6.488890171051025, "global_step": 112809, "epoch": 2685} {"train_loss": -6.408421993255615, "global_step": 112810, "epoch": 2685} {"train_loss": -6.466857263020107, "global_step": 112811, "epoch": 2685, "val_loss": 76582.4765625} {"train_loss": -6.539374828338623, "global_step": 112812, "epoch": 2686} {"train_loss": -6.417278289794922, "global_step": 112813, "epoch": 2686} {"train_loss": -6.435019493103027, "global_step": 112814, "epoch": 2686} {"train_loss": -6.566839218139648, "global_step": 112815, "epoch": 2686} {"train_loss": -6.497409820556641, "global_step": 112816, "epoch": 2686} {"train_loss": -6.535933971405029, "global_step": 112817, "epoch": 2686} {"train_loss": -6.486902236938477, "global_step": 112818, "epoch": 2686} {"train_loss": -6.387403964996338, "global_step": 112819, "epoch": 2686} {"train_loss": -6.454190731048584, "global_step": 112820, "epoch": 2686} {"train_loss": -6.401059627532959, "global_step": 112821, "epoch": 2686} {"train_loss": -6.485468864440918, "global_step": 112822, "epoch": 2686} {"train_loss": -6.584220886230469, "global_step": 112823, "epoch": 2686} {"train_loss": -6.537143707275391, "global_step": 112824, "epoch": 2686} {"train_loss": -6.461295127868652, "global_step": 112825, "epoch": 2686} {"train_loss": -6.432118892669678, "global_step": 112826, "epoch": 2686} {"train_loss": -6.598808288574219, "global_step": 112827, "epoch": 2686} {"train_loss": -6.369017601013184, "global_step": 112828, "epoch": 2686} {"train_loss": -6.5378522872924805, "global_step": 112829, "epoch": 2686} {"train_loss": -6.566110610961914, "global_step": 112830, "epoch": 2686} {"train_loss": -6.481438636779785, "global_step": 112831, "epoch": 2686} {"train_loss": -6.538206100463867, "global_step": 112832, "epoch": 2686} {"train_loss": -6.465237617492676, "global_step": 112833, "epoch": 2686} {"train_loss": -6.614986419677734, "global_step": 112834, "epoch": 2686} {"train_loss": -6.417030334472656, "global_step": 112835, "epoch": 2686} {"train_loss": -6.531577110290527, "global_step": 112836, "epoch": 2686} {"train_loss": -6.528509616851807, "global_step": 112837, "epoch": 2686} {"train_loss": -6.463927268981934, "global_step": 112838, "epoch": 2686} {"train_loss": -6.570157051086426, "global_step": 112839, "epoch": 2686} {"train_loss": -6.434383392333984, "global_step": 112840, "epoch": 2686} {"train_loss": -6.524324417114258, "global_step": 112841, "epoch": 2686} {"train_loss": -6.519639492034912, "global_step": 112842, "epoch": 2686} {"train_loss": -6.5150909423828125, "global_step": 112843, "epoch": 2686} {"train_loss": -6.468459606170654, "global_step": 112844, "epoch": 2686} {"train_loss": -6.536383152008057, "global_step": 112845, "epoch": 2686} {"train_loss": -6.575656890869141, "global_step": 112846, "epoch": 2686} {"train_loss": -6.579702377319336, "global_step": 112847, "epoch": 2686} {"train_loss": -6.445487022399902, "global_step": 112848, "epoch": 2686} {"train_loss": -6.386543273925781, "global_step": 112849, "epoch": 2686} {"train_loss": -6.443884372711182, "global_step": 112850, "epoch": 2686} {"train_loss": -6.589321613311768, "global_step": 112851, "epoch": 2686} {"train_loss": -6.466427803039551, "global_step": 112852, "epoch": 2686} {"train_loss": -6.497959284555344, "global_step": 112853, "epoch": 2686, "val_loss": 76442.0} {"train_loss": -6.6637163162231445, "global_step": 112854, "epoch": 2687} {"train_loss": -6.395598411560059, "global_step": 112855, "epoch": 2687} {"train_loss": -6.455645561218262, "global_step": 112856, "epoch": 2687} {"train_loss": -6.423557758331299, "global_step": 112857, "epoch": 2687} {"train_loss": -6.568362236022949, "global_step": 112858, "epoch": 2687} {"train_loss": -6.5228495597839355, "global_step": 112859, "epoch": 2687} {"train_loss": -6.542875289916992, "global_step": 112860, "epoch": 2687} {"train_loss": -6.631364822387695, "global_step": 112861, "epoch": 2687} {"train_loss": -6.604198932647705, "global_step": 112862, "epoch": 2687} {"train_loss": -6.436671733856201, "global_step": 112863, "epoch": 2687} {"train_loss": -6.508270740509033, "global_step": 112864, "epoch": 2687} {"train_loss": -6.483976364135742, "global_step": 112865, "epoch": 2687} {"train_loss": -6.537823677062988, "global_step": 112866, "epoch": 2687} {"train_loss": -6.490413665771484, "global_step": 112867, "epoch": 2687} {"train_loss": -6.487926006317139, "global_step": 112868, "epoch": 2687} {"train_loss": -6.502566337585449, "global_step": 112869, "epoch": 2687} {"train_loss": -6.510157585144043, "global_step": 112870, "epoch": 2687} {"train_loss": -6.436901569366455, "global_step": 112871, "epoch": 2687} {"train_loss": -6.510334014892578, "global_step": 112872, "epoch": 2687} {"train_loss": -6.380368709564209, "global_step": 112873, "epoch": 2687} {"train_loss": -6.505184650421143, "global_step": 112874, "epoch": 2687} {"train_loss": -6.3382697105407715, "global_step": 112875, "epoch": 2687} {"train_loss": -6.376354217529297, "global_step": 112876, "epoch": 2687} {"train_loss": -6.586463928222656, "global_step": 112877, "epoch": 2687} {"train_loss": -6.319076061248779, "global_step": 112878, "epoch": 2687} {"train_loss": -6.384547233581543, "global_step": 112879, "epoch": 2687} {"train_loss": -6.453187465667725, "global_step": 112880, "epoch": 2687} {"train_loss": -6.278223037719727, "global_step": 112881, "epoch": 2687} {"train_loss": -6.586925029754639, "global_step": 112882, "epoch": 2687} {"train_loss": -6.414054870605469, "global_step": 112883, "epoch": 2687} {"train_loss": -6.463342666625977, "global_step": 112884, "epoch": 2687} {"train_loss": -6.4951958656311035, "global_step": 112885, "epoch": 2687} {"train_loss": -6.377254962921143, "global_step": 112886, "epoch": 2687} {"train_loss": -6.4699788093566895, "global_step": 112887, "epoch": 2687} {"train_loss": -6.389824390411377, "global_step": 112888, "epoch": 2687} {"train_loss": -6.429096221923828, "global_step": 112889, "epoch": 2687} {"train_loss": -6.38510799407959, "global_step": 112890, "epoch": 2687} {"train_loss": -6.429428577423096, "global_step": 112891, "epoch": 2687} {"train_loss": -6.53337287902832, "global_step": 112892, "epoch": 2687} {"train_loss": -6.459959030151367, "global_step": 112893, "epoch": 2687} {"train_loss": -6.502743721008301, "global_step": 112894, "epoch": 2687} {"train_loss": -6.468923784437633, "global_step": 112895, "epoch": 2687, "val_loss": 76521.859375} {"train_loss": -6.466280937194824, "global_step": 112896, "epoch": 2688} {"train_loss": -6.519284248352051, "global_step": 112897, "epoch": 2688} {"train_loss": -6.372956275939941, "global_step": 112898, "epoch": 2688} {"train_loss": -6.5417304039001465, "global_step": 112899, "epoch": 2688} {"train_loss": -6.549632549285889, "global_step": 112900, "epoch": 2688} {"train_loss": -6.396103858947754, "global_step": 112901, "epoch": 2688} {"train_loss": -6.44616174697876, "global_step": 112902, "epoch": 2688} {"train_loss": -6.497033596038818, "global_step": 112903, "epoch": 2688} {"train_loss": -6.5957841873168945, "global_step": 112904, "epoch": 2688} {"train_loss": -6.466137409210205, "global_step": 112905, "epoch": 2688} {"train_loss": -6.490399360656738, "global_step": 112906, "epoch": 2688} {"train_loss": -6.554564476013184, "global_step": 112907, "epoch": 2688} {"train_loss": -6.467662811279297, "global_step": 112908, "epoch": 2688} {"train_loss": -6.620777606964111, "global_step": 112909, "epoch": 2688} {"train_loss": -6.5484466552734375, "global_step": 112910, "epoch": 2688} {"train_loss": -6.577176094055176, "global_step": 112911, "epoch": 2688} {"train_loss": -6.436221122741699, "global_step": 112912, "epoch": 2688} {"train_loss": -6.566078186035156, "global_step": 112913, "epoch": 2688} {"train_loss": -6.554610252380371, "global_step": 112914, "epoch": 2688} {"train_loss": -6.561215877532959, "global_step": 112915, "epoch": 2688} {"train_loss": -6.517604827880859, "global_step": 112916, "epoch": 2688} {"train_loss": -6.5049333572387695, "global_step": 112917, "epoch": 2688} {"train_loss": -6.524911880493164, "global_step": 112918, "epoch": 2688} {"train_loss": -6.5251593589782715, "global_step": 112919, "epoch": 2688} {"train_loss": -6.4629340171813965, "global_step": 112920, "epoch": 2688} {"train_loss": -6.445112228393555, "global_step": 112921, "epoch": 2688} {"train_loss": -6.521449089050293, "global_step": 112922, "epoch": 2688} {"train_loss": -6.39033317565918, "global_step": 112923, "epoch": 2688} {"train_loss": -6.540997505187988, "global_step": 112924, "epoch": 2688} {"train_loss": -6.593304634094238, "global_step": 112925, "epoch": 2688} {"train_loss": -6.445139408111572, "global_step": 112926, "epoch": 2688} {"train_loss": -6.488351345062256, "global_step": 112927, "epoch": 2688} {"train_loss": -6.553910255432129, "global_step": 112928, "epoch": 2688} {"train_loss": -6.417269706726074, "global_step": 112929, "epoch": 2688} {"train_loss": -6.410477638244629, "global_step": 112930, "epoch": 2688} {"train_loss": -6.604859352111816, "global_step": 112931, "epoch": 2688} {"train_loss": -6.442031383514404, "global_step": 112932, "epoch": 2688} {"train_loss": -6.44264030456543, "global_step": 112933, "epoch": 2688} {"train_loss": -6.500218391418457, "global_step": 112934, "epoch": 2688} {"train_loss": -6.449526786804199, "global_step": 112935, "epoch": 2688} {"train_loss": -6.64345121383667, "global_step": 112936, "epoch": 2688} {"train_loss": -6.502793822969709, "global_step": 112937, "epoch": 2688, "val_loss": 76440.1640625} {"train_loss": -6.446019172668457, "global_step": 112938, "epoch": 2689} {"train_loss": -6.451014995574951, "global_step": 112939, "epoch": 2689} {"train_loss": -6.470733165740967, "global_step": 112940, "epoch": 2689} {"train_loss": -6.606414794921875, "global_step": 112941, "epoch": 2689} {"train_loss": -6.326873779296875, "global_step": 112942, "epoch": 2689} {"train_loss": -6.514495372772217, "global_step": 112943, "epoch": 2689} {"train_loss": -6.43330192565918, "global_step": 112944, "epoch": 2689} {"train_loss": -6.5469970703125, "global_step": 112945, "epoch": 2689} {"train_loss": -6.641531944274902, "global_step": 112946, "epoch": 2689} {"train_loss": -6.491357803344727, "global_step": 112947, "epoch": 2689} {"train_loss": -6.4133172035217285, "global_step": 112948, "epoch": 2689} {"train_loss": -6.503351211547852, "global_step": 112949, "epoch": 2689} {"train_loss": -6.488096237182617, "global_step": 112950, "epoch": 2689} {"train_loss": -6.509194850921631, "global_step": 112951, "epoch": 2689} {"train_loss": -6.603129863739014, "global_step": 112952, "epoch": 2689} {"train_loss": -6.455777168273926, "global_step": 112953, "epoch": 2689} {"train_loss": -6.5163960456848145, "global_step": 112954, "epoch": 2689} {"train_loss": -6.438488483428955, "global_step": 112955, "epoch": 2689} {"train_loss": -6.456465721130371, "global_step": 112956, "epoch": 2689} {"train_loss": -6.518609046936035, "global_step": 112957, "epoch": 2689} {"train_loss": -6.381465911865234, "global_step": 112958, "epoch": 2689} {"train_loss": -6.404415130615234, "global_step": 112959, "epoch": 2689} {"train_loss": -6.350134372711182, "global_step": 112960, "epoch": 2689} {"train_loss": -6.349308013916016, "global_step": 112961, "epoch": 2689} {"train_loss": -6.354952812194824, "global_step": 112962, "epoch": 2689} {"train_loss": -6.401755332946777, "global_step": 112963, "epoch": 2689} {"train_loss": -6.331143379211426, "global_step": 112964, "epoch": 2689} {"train_loss": -6.278437614440918, "global_step": 112965, "epoch": 2689} {"train_loss": -6.3175554275512695, "global_step": 112966, "epoch": 2689} {"train_loss": -6.390234470367432, "global_step": 112967, "epoch": 2689} {"train_loss": -6.4494853019714355, "global_step": 112968, "epoch": 2689} {"train_loss": -6.415840148925781, "global_step": 112969, "epoch": 2689} {"train_loss": -6.31875467300415, "global_step": 112970, "epoch": 2689} {"train_loss": -6.4187445640563965, "global_step": 112971, "epoch": 2689} {"train_loss": -6.266712188720703, "global_step": 112972, "epoch": 2689} {"train_loss": -6.411584854125977, "global_step": 112973, "epoch": 2689} {"train_loss": -6.300271034240723, "global_step": 112974, "epoch": 2689} {"train_loss": -6.30832052230835, "global_step": 112975, "epoch": 2689} {"train_loss": -6.393113136291504, "global_step": 112976, "epoch": 2689} {"train_loss": -6.440058708190918, "global_step": 112977, "epoch": 2689} {"train_loss": -6.405422210693359, "global_step": 112978, "epoch": 2689} {"train_loss": -6.426170678365798, "global_step": 112979, "epoch": 2689, "val_loss": 76412.7109375} {"train_loss": -6.456605434417725, "global_step": 112980, "epoch": 2690} {"train_loss": -6.321230888366699, "global_step": 112981, "epoch": 2690} {"train_loss": -6.442625522613525, "global_step": 112982, "epoch": 2690} {"train_loss": -6.348178386688232, "global_step": 112983, "epoch": 2690} {"train_loss": -6.457425117492676, "global_step": 112984, "epoch": 2690} {"train_loss": -6.462009429931641, "global_step": 112985, "epoch": 2690} {"train_loss": -6.49418830871582, "global_step": 112986, "epoch": 2690} {"train_loss": -6.463434219360352, "global_step": 112987, "epoch": 2690} {"train_loss": -6.506601333618164, "global_step": 112988, "epoch": 2690} {"train_loss": -6.583004951477051, "global_step": 112989, "epoch": 2690} {"train_loss": -6.483500957489014, "global_step": 112990, "epoch": 2690} {"train_loss": -6.456024169921875, "global_step": 112991, "epoch": 2690} {"train_loss": -6.519484996795654, "global_step": 112992, "epoch": 2690} {"train_loss": -6.518930912017822, "global_step": 112993, "epoch": 2690} {"train_loss": -6.505258560180664, "global_step": 112994, "epoch": 2690} {"train_loss": -6.37789249420166, "global_step": 112995, "epoch": 2690} {"train_loss": -6.445805549621582, "global_step": 112996, "epoch": 2690} {"train_loss": -6.474513053894043, "global_step": 112997, "epoch": 2690} {"train_loss": -6.45114278793335, "global_step": 112998, "epoch": 2690} {"train_loss": -6.474905490875244, "global_step": 112999, "epoch": 2690} {"train_loss": -6.465339660644531, "global_step": 113000, "epoch": 2690} {"train_loss": -6.438092231750488, "global_step": 113001, "epoch": 2690} {"train_loss": -6.427426815032959, "global_step": 113002, "epoch": 2690} {"train_loss": -6.49997091293335, "global_step": 113003, "epoch": 2690} {"train_loss": -6.4139862060546875, "global_step": 113004, "epoch": 2690} {"train_loss": -6.463408946990967, "global_step": 113005, "epoch": 2690} {"train_loss": -6.260398864746094, "global_step": 113006, "epoch": 2690} {"train_loss": -6.392651081085205, "global_step": 113007, "epoch": 2690} {"train_loss": -6.426934242248535, "global_step": 113008, "epoch": 2690} {"train_loss": -6.285701751708984, "global_step": 113009, "epoch": 2690} {"train_loss": -6.4444403648376465, "global_step": 113010, "epoch": 2690} {"train_loss": -6.337345600128174, "global_step": 113011, "epoch": 2690} {"train_loss": -6.468389987945557, "global_step": 113012, "epoch": 2690} {"train_loss": -6.489180564880371, "global_step": 113013, "epoch": 2690} {"train_loss": -6.329163551330566, "global_step": 113014, "epoch": 2690} {"train_loss": -6.595064163208008, "global_step": 113015, "epoch": 2690} {"train_loss": -6.3582634925842285, "global_step": 113016, "epoch": 2690} {"train_loss": -6.462302207946777, "global_step": 113017, "epoch": 2690} {"train_loss": -6.359110355377197, "global_step": 113018, "epoch": 2690} {"train_loss": -6.515930652618408, "global_step": 113019, "epoch": 2690} {"train_loss": -6.455175399780273, "global_step": 113020, "epoch": 2690} {"train_loss": -6.440435795556931, "global_step": 113021, "epoch": 2690, "val_loss": 76537.296875} {"train_loss": -6.426821231842041, "global_step": 113022, "epoch": 2691} {"train_loss": -6.514926910400391, "global_step": 113023, "epoch": 2691} {"train_loss": -6.396903991699219, "global_step": 113024, "epoch": 2691} {"train_loss": -6.53148078918457, "global_step": 113025, "epoch": 2691} {"train_loss": -6.612994194030762, "global_step": 113026, "epoch": 2691} {"train_loss": -6.447728157043457, "global_step": 113027, "epoch": 2691} {"train_loss": -6.544975280761719, "global_step": 113028, "epoch": 2691} {"train_loss": -6.506949424743652, "global_step": 113029, "epoch": 2691} {"train_loss": -6.398802280426025, "global_step": 113030, "epoch": 2691} {"train_loss": -6.535494804382324, "global_step": 113031, "epoch": 2691} {"train_loss": -6.419308662414551, "global_step": 113032, "epoch": 2691} {"train_loss": -6.380805015563965, "global_step": 113033, "epoch": 2691} {"train_loss": -6.446527481079102, "global_step": 113034, "epoch": 2691} {"train_loss": -6.439267635345459, "global_step": 113035, "epoch": 2691} {"train_loss": -6.486223220825195, "global_step": 113036, "epoch": 2691} {"train_loss": -6.505496501922607, "global_step": 113037, "epoch": 2691} {"train_loss": -6.44183349609375, "global_step": 113038, "epoch": 2691} {"train_loss": -6.526093482971191, "global_step": 113039, "epoch": 2691} {"train_loss": -6.431308746337891, "global_step": 113040, "epoch": 2691} {"train_loss": -6.5628461837768555, "global_step": 113041, "epoch": 2691} {"train_loss": -6.461015224456787, "global_step": 113042, "epoch": 2691} {"train_loss": -6.475996017456055, "global_step": 113043, "epoch": 2691} {"train_loss": -6.470406532287598, "global_step": 113044, "epoch": 2691} {"train_loss": -6.629395961761475, "global_step": 113045, "epoch": 2691} {"train_loss": -6.500212669372559, "global_step": 113046, "epoch": 2691} {"train_loss": -6.469599723815918, "global_step": 113047, "epoch": 2691} {"train_loss": -6.549206256866455, "global_step": 113048, "epoch": 2691} {"train_loss": -6.525262355804443, "global_step": 113049, "epoch": 2691} {"train_loss": -6.573281764984131, "global_step": 113050, "epoch": 2691} {"train_loss": -6.471698760986328, "global_step": 113051, "epoch": 2691} {"train_loss": -6.524539947509766, "global_step": 113052, "epoch": 2691} {"train_loss": -6.567582130432129, "global_step": 113053, "epoch": 2691} {"train_loss": -6.528816223144531, "global_step": 113054, "epoch": 2691} {"train_loss": -6.495076656341553, "global_step": 113055, "epoch": 2691} {"train_loss": -6.436546325683594, "global_step": 113056, "epoch": 2691} {"train_loss": -6.574542045593262, "global_step": 113057, "epoch": 2691} {"train_loss": -6.576457977294922, "global_step": 113058, "epoch": 2691} {"train_loss": -6.47841739654541, "global_step": 113059, "epoch": 2691} {"train_loss": -6.485466957092285, "global_step": 113060, "epoch": 2691} {"train_loss": -6.472463130950928, "global_step": 113061, "epoch": 2691} {"train_loss": -6.450753211975098, "global_step": 113062, "epoch": 2691} {"train_loss": -6.496052730651129, "global_step": 113063, "epoch": 2691, "val_loss": 76414.9453125} {"train_loss": -6.50563907623291, "global_step": 113064, "epoch": 2692} {"train_loss": -6.495859146118164, "global_step": 113065, "epoch": 2692} {"train_loss": -6.60335636138916, "global_step": 113066, "epoch": 2692} {"train_loss": -6.662555694580078, "global_step": 113067, "epoch": 2692} {"train_loss": -6.398606300354004, "global_step": 113068, "epoch": 2692} {"train_loss": -6.519732475280762, "global_step": 113069, "epoch": 2692} {"train_loss": -6.544551849365234, "global_step": 113070, "epoch": 2692} {"train_loss": -6.514579772949219, "global_step": 113071, "epoch": 2692} {"train_loss": -6.484846115112305, "global_step": 113072, "epoch": 2692} {"train_loss": -6.415463447570801, "global_step": 113073, "epoch": 2692} {"train_loss": -6.492270469665527, "global_step": 113074, "epoch": 2692} {"train_loss": -6.483174800872803, "global_step": 113075, "epoch": 2692} {"train_loss": -6.418895721435547, "global_step": 113076, "epoch": 2692} {"train_loss": -6.478370666503906, "global_step": 113077, "epoch": 2692} {"train_loss": -6.463693141937256, "global_step": 113078, "epoch": 2692} {"train_loss": -6.46248722076416, "global_step": 113079, "epoch": 2692} {"train_loss": -6.630814552307129, "global_step": 113080, "epoch": 2692} {"train_loss": -6.441074371337891, "global_step": 113081, "epoch": 2692} {"train_loss": -6.523089408874512, "global_step": 113082, "epoch": 2692} {"train_loss": -6.5011796951293945, "global_step": 113083, "epoch": 2692} {"train_loss": -6.572425365447998, "global_step": 113084, "epoch": 2692} {"train_loss": -6.432001113891602, "global_step": 113085, "epoch": 2692} {"train_loss": -6.554159164428711, "global_step": 113086, "epoch": 2692} {"train_loss": -6.443948745727539, "global_step": 113087, "epoch": 2692} {"train_loss": -6.468628883361816, "global_step": 113088, "epoch": 2692} {"train_loss": -6.554771423339844, "global_step": 113089, "epoch": 2692} {"train_loss": -6.427303314208984, "global_step": 113090, "epoch": 2692} {"train_loss": -6.507647514343262, "global_step": 113091, "epoch": 2692} {"train_loss": -6.572618007659912, "global_step": 113092, "epoch": 2692} {"train_loss": -6.530256271362305, "global_step": 113093, "epoch": 2692} {"train_loss": -6.535475254058838, "global_step": 113094, "epoch": 2692} {"train_loss": -6.452089309692383, "global_step": 113095, "epoch": 2692} {"train_loss": -6.417896270751953, "global_step": 113096, "epoch": 2692} {"train_loss": -6.541616439819336, "global_step": 113097, "epoch": 2692} {"train_loss": -6.553459167480469, "global_step": 113098, "epoch": 2692} {"train_loss": -6.5778422355651855, "global_step": 113099, "epoch": 2692} {"train_loss": -6.592421531677246, "global_step": 113100, "epoch": 2692} {"train_loss": -6.580991268157959, "global_step": 113101, "epoch": 2692} {"train_loss": -6.4616498947143555, "global_step": 113102, "epoch": 2692} {"train_loss": -6.436924934387207, "global_step": 113103, "epoch": 2692} {"train_loss": -6.58616828918457, "global_step": 113104, "epoch": 2692} {"train_loss": -6.505120277404785, "global_step": 113105, "epoch": 2692, "val_loss": 76322.1953125} {"train_loss": -6.5429582595825195, "global_step": 113106, "epoch": 2693} {"train_loss": -6.51869010925293, "global_step": 113107, "epoch": 2693} {"train_loss": -6.442920684814453, "global_step": 113108, "epoch": 2693} {"train_loss": -6.510314464569092, "global_step": 113109, "epoch": 2693} {"train_loss": -6.435661792755127, "global_step": 113110, "epoch": 2693} {"train_loss": -6.482911586761475, "global_step": 113111, "epoch": 2693} {"train_loss": -6.437422752380371, "global_step": 113112, "epoch": 2693} {"train_loss": -6.517620086669922, "global_step": 113113, "epoch": 2693} {"train_loss": -6.5108642578125, "global_step": 113114, "epoch": 2693} {"train_loss": -6.4181413650512695, "global_step": 113115, "epoch": 2693} {"train_loss": -6.426633834838867, "global_step": 113116, "epoch": 2693} {"train_loss": -6.5057854652404785, "global_step": 113117, "epoch": 2693} {"train_loss": -6.480059623718262, "global_step": 113118, "epoch": 2693} {"train_loss": -6.415172576904297, "global_step": 113119, "epoch": 2693} {"train_loss": -6.3959808349609375, "global_step": 113120, "epoch": 2693} {"train_loss": -6.437714099884033, "global_step": 113121, "epoch": 2693} {"train_loss": -6.54157829284668, "global_step": 113122, "epoch": 2693} {"train_loss": -6.441026210784912, "global_step": 113123, "epoch": 2693} {"train_loss": -6.496910572052002, "global_step": 113124, "epoch": 2693} {"train_loss": -6.540160655975342, "global_step": 113125, "epoch": 2693} {"train_loss": -6.494733810424805, "global_step": 113126, "epoch": 2693} {"train_loss": -6.528688430786133, "global_step": 113127, "epoch": 2693} {"train_loss": -6.376624584197998, "global_step": 113128, "epoch": 2693} {"train_loss": -6.518075466156006, "global_step": 113129, "epoch": 2693} {"train_loss": -6.491850852966309, "global_step": 113130, "epoch": 2693} {"train_loss": -6.534185409545898, "global_step": 113131, "epoch": 2693} {"train_loss": -6.428210735321045, "global_step": 113132, "epoch": 2693} {"train_loss": -6.63134765625, "global_step": 113133, "epoch": 2693} {"train_loss": -6.561887741088867, "global_step": 113134, "epoch": 2693} {"train_loss": -6.407198905944824, "global_step": 113135, "epoch": 2693} {"train_loss": -6.579895973205566, "global_step": 113136, "epoch": 2693} {"train_loss": -6.523744583129883, "global_step": 113137, "epoch": 2693} {"train_loss": -6.6223297119140625, "global_step": 113138, "epoch": 2693} {"train_loss": -6.34657096862793, "global_step": 113139, "epoch": 2693} {"train_loss": -6.485662460327148, "global_step": 113140, "epoch": 2693} {"train_loss": -6.467799663543701, "global_step": 113141, "epoch": 2693} {"train_loss": -6.4143171310424805, "global_step": 113142, "epoch": 2693} {"train_loss": -6.462754249572754, "global_step": 113143, "epoch": 2693} {"train_loss": -6.381975173950195, "global_step": 113144, "epoch": 2693} {"train_loss": -6.550073623657227, "global_step": 113145, "epoch": 2693} {"train_loss": -6.477250099182129, "global_step": 113146, "epoch": 2693} {"train_loss": -6.480074700855074, "global_step": 113147, "epoch": 2693, "val_loss": 76730.9140625} {"train_loss": -6.575019836425781, "global_step": 113148, "epoch": 2694} {"train_loss": -6.491247177124023, "global_step": 113149, "epoch": 2694} {"train_loss": -6.47885799407959, "global_step": 113150, "epoch": 2694} {"train_loss": -6.518784046173096, "global_step": 113151, "epoch": 2694} {"train_loss": -6.299193382263184, "global_step": 113152, "epoch": 2694} {"train_loss": -6.541619777679443, "global_step": 113153, "epoch": 2694} {"train_loss": -6.505284309387207, "global_step": 113154, "epoch": 2694} {"train_loss": -6.478601455688477, "global_step": 113155, "epoch": 2694} {"train_loss": -6.530889511108398, "global_step": 113156, "epoch": 2694} {"train_loss": -6.440083026885986, "global_step": 113157, "epoch": 2694} {"train_loss": -6.480571746826172, "global_step": 113158, "epoch": 2694} {"train_loss": -6.423606872558594, "global_step": 113159, "epoch": 2694} {"train_loss": -6.510465621948242, "global_step": 113160, "epoch": 2694} {"train_loss": -6.4666643142700195, "global_step": 113161, "epoch": 2694} {"train_loss": -6.380487442016602, "global_step": 113162, "epoch": 2694} {"train_loss": -6.50045108795166, "global_step": 113163, "epoch": 2694} {"train_loss": -6.5010480880737305, "global_step": 113164, "epoch": 2694} {"train_loss": -6.447683334350586, "global_step": 113165, "epoch": 2694} {"train_loss": -6.49909782409668, "global_step": 113166, "epoch": 2694} {"train_loss": -6.450788497924805, "global_step": 113167, "epoch": 2694} {"train_loss": -6.422130107879639, "global_step": 113168, "epoch": 2694} {"train_loss": -6.501903533935547, "global_step": 113169, "epoch": 2694} {"train_loss": -6.510066032409668, "global_step": 113170, "epoch": 2694} {"train_loss": -6.576618671417236, "global_step": 113171, "epoch": 2694} {"train_loss": -6.361324787139893, "global_step": 113172, "epoch": 2694} {"train_loss": -6.446296691894531, "global_step": 113173, "epoch": 2694} {"train_loss": -6.500476360321045, "global_step": 113174, "epoch": 2694} {"train_loss": -6.494541168212891, "global_step": 113175, "epoch": 2694} {"train_loss": -6.342493057250977, "global_step": 113176, "epoch": 2694} {"train_loss": -6.60700798034668, "global_step": 113177, "epoch": 2694} {"train_loss": -6.504988670349121, "global_step": 113178, "epoch": 2694} {"train_loss": -6.533103942871094, "global_step": 113179, "epoch": 2694} {"train_loss": -6.526008605957031, "global_step": 113180, "epoch": 2694} {"train_loss": -6.476256370544434, "global_step": 113181, "epoch": 2694} {"train_loss": -6.516473770141602, "global_step": 113182, "epoch": 2694} {"train_loss": -6.542549133300781, "global_step": 113183, "epoch": 2694} {"train_loss": -6.473012447357178, "global_step": 113184, "epoch": 2694} {"train_loss": -6.526332855224609, "global_step": 113185, "epoch": 2694} {"train_loss": -6.406963348388672, "global_step": 113186, "epoch": 2694} {"train_loss": -6.540850639343262, "global_step": 113187, "epoch": 2694} {"train_loss": -6.411867141723633, "global_step": 113188, "epoch": 2694} {"train_loss": -6.478715294883365, "global_step": 113189, "epoch": 2694, "val_loss": 76368.3515625} {"train_loss": -6.509166717529297, "global_step": 113190, "epoch": 2695} {"train_loss": -6.502982139587402, "global_step": 113191, "epoch": 2695} {"train_loss": -6.444598197937012, "global_step": 113192, "epoch": 2695} {"train_loss": -6.450911521911621, "global_step": 113193, "epoch": 2695} {"train_loss": -6.374978542327881, "global_step": 113194, "epoch": 2695} {"train_loss": -6.498623371124268, "global_step": 113195, "epoch": 2695} {"train_loss": -6.4662766456604, "global_step": 113196, "epoch": 2695} {"train_loss": -6.486664772033691, "global_step": 113197, "epoch": 2695} {"train_loss": -6.428921699523926, "global_step": 113198, "epoch": 2695} {"train_loss": -6.595908164978027, "global_step": 113199, "epoch": 2695} {"train_loss": -6.60446834564209, "global_step": 113200, "epoch": 2695} {"train_loss": -6.562555313110352, "global_step": 113201, "epoch": 2695} {"train_loss": -6.470325946807861, "global_step": 113202, "epoch": 2695} {"train_loss": -6.512063026428223, "global_step": 113203, "epoch": 2695} {"train_loss": -6.428513526916504, "global_step": 113204, "epoch": 2695} {"train_loss": -6.539458274841309, "global_step": 113205, "epoch": 2695} {"train_loss": -6.495750427246094, "global_step": 113206, "epoch": 2695} {"train_loss": -6.443904876708984, "global_step": 113207, "epoch": 2695} {"train_loss": -6.490338325500488, "global_step": 113208, "epoch": 2695} {"train_loss": -6.497673511505127, "global_step": 113209, "epoch": 2695} {"train_loss": -6.480899810791016, "global_step": 113210, "epoch": 2695} {"train_loss": -6.45942497253418, "global_step": 113211, "epoch": 2695} {"train_loss": -6.513134002685547, "global_step": 113212, "epoch": 2695} {"train_loss": -6.44063663482666, "global_step": 113213, "epoch": 2695} {"train_loss": -6.507376670837402, "global_step": 113214, "epoch": 2695} {"train_loss": -6.523523807525635, "global_step": 113215, "epoch": 2695} {"train_loss": -6.49787712097168, "global_step": 113216, "epoch": 2695} {"train_loss": -6.506026744842529, "global_step": 113217, "epoch": 2695} {"train_loss": -6.424839019775391, "global_step": 113218, "epoch": 2695} {"train_loss": -6.499152183532715, "global_step": 113219, "epoch": 2695} {"train_loss": -6.481682777404785, "global_step": 113220, "epoch": 2695} {"train_loss": -6.406825065612793, "global_step": 113221, "epoch": 2695} {"train_loss": -6.619190692901611, "global_step": 113222, "epoch": 2695} {"train_loss": -6.501165866851807, "global_step": 113223, "epoch": 2695} {"train_loss": -6.416085243225098, "global_step": 113224, "epoch": 2695} {"train_loss": -6.452791213989258, "global_step": 113225, "epoch": 2695} {"train_loss": -6.4403977394104, "global_step": 113226, "epoch": 2695} {"train_loss": -6.49614953994751, "global_step": 113227, "epoch": 2695} {"train_loss": -6.486818313598633, "global_step": 113228, "epoch": 2695} {"train_loss": -6.560442924499512, "global_step": 113229, "epoch": 2695} {"train_loss": -6.482423305511475, "global_step": 113230, "epoch": 2695} {"train_loss": -6.489387421380906, "global_step": 113231, "epoch": 2695, "val_loss": 76705.328125} {"train_loss": -6.573435306549072, "global_step": 113232, "epoch": 2696} {"train_loss": -6.542738437652588, "global_step": 113233, "epoch": 2696} {"train_loss": -6.5641021728515625, "global_step": 113234, "epoch": 2696} {"train_loss": -6.381380081176758, "global_step": 113235, "epoch": 2696} {"train_loss": -6.592269420623779, "global_step": 113236, "epoch": 2696} {"train_loss": -6.523387908935547, "global_step": 113237, "epoch": 2696} {"train_loss": -6.569949150085449, "global_step": 113238, "epoch": 2696} {"train_loss": -6.428328037261963, "global_step": 113239, "epoch": 2696} {"train_loss": -6.463960647583008, "global_step": 113240, "epoch": 2696} {"train_loss": -6.5150628089904785, "global_step": 113241, "epoch": 2696} {"train_loss": -6.457402229309082, "global_step": 113242, "epoch": 2696} {"train_loss": -6.569339275360107, "global_step": 113243, "epoch": 2696} {"train_loss": -6.439090728759766, "global_step": 113244, "epoch": 2696} {"train_loss": -6.465383529663086, "global_step": 113245, "epoch": 2696} {"train_loss": -6.395382881164551, "global_step": 113246, "epoch": 2696} {"train_loss": -6.570951461791992, "global_step": 113247, "epoch": 2696} {"train_loss": -6.255745887756348, "global_step": 113248, "epoch": 2696} {"train_loss": -6.396731376647949, "global_step": 113249, "epoch": 2696} {"train_loss": -6.400627136230469, "global_step": 113250, "epoch": 2696} {"train_loss": -6.271355628967285, "global_step": 113251, "epoch": 2696} {"train_loss": -6.497685432434082, "global_step": 113252, "epoch": 2696} {"train_loss": -6.436341285705566, "global_step": 113253, "epoch": 2696} {"train_loss": -6.406485557556152, "global_step": 113254, "epoch": 2696} {"train_loss": -6.368247985839844, "global_step": 113255, "epoch": 2696} {"train_loss": -6.379606246948242, "global_step": 113256, "epoch": 2696} {"train_loss": -6.381365776062012, "global_step": 113257, "epoch": 2696} {"train_loss": -6.328033924102783, "global_step": 113258, "epoch": 2696} {"train_loss": -6.465314865112305, "global_step": 113259, "epoch": 2696} {"train_loss": -6.3986406326293945, "global_step": 113260, "epoch": 2696} {"train_loss": -6.4279279708862305, "global_step": 113261, "epoch": 2696} {"train_loss": -6.422740936279297, "global_step": 113262, "epoch": 2696} {"train_loss": -6.437309741973877, "global_step": 113263, "epoch": 2696} {"train_loss": -6.479520797729492, "global_step": 113264, "epoch": 2696} {"train_loss": -6.552637100219727, "global_step": 113265, "epoch": 2696} {"train_loss": -6.455976963043213, "global_step": 113266, "epoch": 2696} {"train_loss": -6.415783882141113, "global_step": 113267, "epoch": 2696} {"train_loss": -6.556389808654785, "global_step": 113268, "epoch": 2696} {"train_loss": -6.325348854064941, "global_step": 113269, "epoch": 2696} {"train_loss": -6.539433002471924, "global_step": 113270, "epoch": 2696} {"train_loss": -6.465718746185303, "global_step": 113271, "epoch": 2696} {"train_loss": -6.405188083648682, "global_step": 113272, "epoch": 2696} {"train_loss": -6.45045230502174, "global_step": 113273, "epoch": 2696, "val_loss": 76734.5390625} {"train_loss": -6.391680717468262, "global_step": 113274, "epoch": 2697} {"train_loss": -6.573683261871338, "global_step": 113275, "epoch": 2697} {"train_loss": -6.2528181076049805, "global_step": 113276, "epoch": 2697} {"train_loss": -6.581258773803711, "global_step": 113277, "epoch": 2697} {"train_loss": -6.396346092224121, "global_step": 113278, "epoch": 2697} {"train_loss": -6.359288215637207, "global_step": 113279, "epoch": 2697} {"train_loss": -6.515433311462402, "global_step": 113280, "epoch": 2697} {"train_loss": -6.293456077575684, "global_step": 113281, "epoch": 2697} {"train_loss": -6.241297245025635, "global_step": 113282, "epoch": 2697} {"train_loss": -6.417572975158691, "global_step": 113283, "epoch": 2697} {"train_loss": -6.321232795715332, "global_step": 113284, "epoch": 2697} {"train_loss": -6.43195915222168, "global_step": 113285, "epoch": 2697} {"train_loss": -6.2633957862854, "global_step": 113286, "epoch": 2697} {"train_loss": -6.509588241577148, "global_step": 113287, "epoch": 2697} {"train_loss": -6.223860740661621, "global_step": 113288, "epoch": 2697} {"train_loss": -6.512321949005127, "global_step": 113289, "epoch": 2697} {"train_loss": -6.31906270980835, "global_step": 113290, "epoch": 2697} {"train_loss": -6.423866271972656, "global_step": 113291, "epoch": 2697} {"train_loss": -6.279243469238281, "global_step": 113292, "epoch": 2697} {"train_loss": -6.463317394256592, "global_step": 113293, "epoch": 2697} {"train_loss": -6.306292533874512, "global_step": 113294, "epoch": 2697} {"train_loss": -6.383946418762207, "global_step": 113295, "epoch": 2697} {"train_loss": -6.33309268951416, "global_step": 113296, "epoch": 2697} {"train_loss": -6.415143966674805, "global_step": 113297, "epoch": 2697} {"train_loss": -6.572296619415283, "global_step": 113298, "epoch": 2697} {"train_loss": -6.381955146789551, "global_step": 113299, "epoch": 2697} {"train_loss": -6.384268760681152, "global_step": 113300, "epoch": 2697} {"train_loss": -6.398738384246826, "global_step": 113301, "epoch": 2697} {"train_loss": -6.390992164611816, "global_step": 113302, "epoch": 2697} {"train_loss": -6.395061016082764, "global_step": 113303, "epoch": 2697} {"train_loss": -6.481783866882324, "global_step": 113304, "epoch": 2697} {"train_loss": -6.405903339385986, "global_step": 113305, "epoch": 2697} {"train_loss": -6.575211524963379, "global_step": 113306, "epoch": 2697} {"train_loss": -6.510997772216797, "global_step": 113307, "epoch": 2697} {"train_loss": -6.461188316345215, "global_step": 113308, "epoch": 2697} {"train_loss": -6.497347831726074, "global_step": 113309, "epoch": 2697} {"train_loss": -6.515651702880859, "global_step": 113310, "epoch": 2697} {"train_loss": -6.461672782897949, "global_step": 113311, "epoch": 2697} {"train_loss": -6.5228271484375, "global_step": 113312, "epoch": 2697} {"train_loss": -6.549106597900391, "global_step": 113313, "epoch": 2697} {"train_loss": -6.357966899871826, "global_step": 113314, "epoch": 2697} {"train_loss": -6.419251884732928, "global_step": 113315, "epoch": 2697, "val_loss": 76253.203125} {"train_loss": -6.491476058959961, "global_step": 113316, "epoch": 2698} {"train_loss": -6.509555816650391, "global_step": 113317, "epoch": 2698} {"train_loss": -6.485130310058594, "global_step": 113318, "epoch": 2698} {"train_loss": -6.439828872680664, "global_step": 113319, "epoch": 2698} {"train_loss": -6.590794563293457, "global_step": 113320, "epoch": 2698} {"train_loss": -6.533808708190918, "global_step": 113321, "epoch": 2698} {"train_loss": -6.507774829864502, "global_step": 113322, "epoch": 2698} {"train_loss": -6.50373649597168, "global_step": 113323, "epoch": 2698} {"train_loss": -6.482077598571777, "global_step": 113324, "epoch": 2698} {"train_loss": -6.389856338500977, "global_step": 113325, "epoch": 2698} {"train_loss": -6.424822807312012, "global_step": 113326, "epoch": 2698} {"train_loss": -6.547821998596191, "global_step": 113327, "epoch": 2698} {"train_loss": -6.484164237976074, "global_step": 113328, "epoch": 2698} {"train_loss": -6.505955219268799, "global_step": 113329, "epoch": 2698} {"train_loss": -6.398361682891846, "global_step": 113330, "epoch": 2698} {"train_loss": -6.439830780029297, "global_step": 113331, "epoch": 2698} {"train_loss": -6.4279375076293945, "global_step": 113332, "epoch": 2698} {"train_loss": -6.487308025360107, "global_step": 113333, "epoch": 2698} {"train_loss": -6.492160797119141, "global_step": 113334, "epoch": 2698} {"train_loss": -6.509471416473389, "global_step": 113335, "epoch": 2698} {"train_loss": -6.5089826583862305, "global_step": 113336, "epoch": 2698} {"train_loss": -6.276765823364258, "global_step": 113337, "epoch": 2698} {"train_loss": -6.337482929229736, "global_step": 113338, "epoch": 2698} {"train_loss": -6.41013240814209, "global_step": 113339, "epoch": 2698} {"train_loss": -6.580974578857422, "global_step": 113340, "epoch": 2698} {"train_loss": -6.620522499084473, "global_step": 113341, "epoch": 2698} {"train_loss": -6.430373191833496, "global_step": 113342, "epoch": 2698} {"train_loss": -6.454394340515137, "global_step": 113343, "epoch": 2698} {"train_loss": -6.341318607330322, "global_step": 113344, "epoch": 2698} {"train_loss": -6.416964530944824, "global_step": 113345, "epoch": 2698} {"train_loss": -6.557012557983398, "global_step": 113346, "epoch": 2698} {"train_loss": -6.5421600341796875, "global_step": 113347, "epoch": 2698} {"train_loss": -6.483521461486816, "global_step": 113348, "epoch": 2698} {"train_loss": -6.514876842498779, "global_step": 113349, "epoch": 2698} {"train_loss": -6.4040913581848145, "global_step": 113350, "epoch": 2698} {"train_loss": -6.510732173919678, "global_step": 113351, "epoch": 2698} {"train_loss": -6.420679092407227, "global_step": 113352, "epoch": 2698} {"train_loss": -6.419623851776123, "global_step": 113353, "epoch": 2698} {"train_loss": -6.429477691650391, "global_step": 113354, "epoch": 2698} {"train_loss": -6.4127044677734375, "global_step": 113355, "epoch": 2698} {"train_loss": -6.449974060058594, "global_step": 113356, "epoch": 2698} {"train_loss": -6.467972414834159, "global_step": 113357, "epoch": 2698, "val_loss": 76184.5546875} {"train_loss": -6.611177444458008, "global_step": 113358, "epoch": 2699} {"train_loss": -6.39198637008667, "global_step": 113359, "epoch": 2699} {"train_loss": -6.604320526123047, "global_step": 113360, "epoch": 2699} {"train_loss": -6.562553405761719, "global_step": 113361, "epoch": 2699} {"train_loss": -6.457859516143799, "global_step": 113362, "epoch": 2699} {"train_loss": -6.390280723571777, "global_step": 113363, "epoch": 2699} {"train_loss": -6.526605606079102, "global_step": 113364, "epoch": 2699} {"train_loss": -6.417057037353516, "global_step": 113365, "epoch": 2699} {"train_loss": -6.402247428894043, "global_step": 113366, "epoch": 2699} {"train_loss": -6.5079731941223145, "global_step": 113367, "epoch": 2699} {"train_loss": -6.435168266296387, "global_step": 113368, "epoch": 2699} {"train_loss": -6.478569984436035, "global_step": 113369, "epoch": 2699} {"train_loss": -6.584004878997803, "global_step": 113370, "epoch": 2699} {"train_loss": -6.52625846862793, "global_step": 113371, "epoch": 2699} {"train_loss": -6.589703559875488, "global_step": 113372, "epoch": 2699} {"train_loss": -6.4791765213012695, "global_step": 113373, "epoch": 2699} {"train_loss": -6.475268363952637, "global_step": 113374, "epoch": 2699} {"train_loss": -6.476198196411133, "global_step": 113375, "epoch": 2699} {"train_loss": -6.40974235534668, "global_step": 113376, "epoch": 2699} {"train_loss": -6.494571685791016, "global_step": 113377, "epoch": 2699} {"train_loss": -6.383522033691406, "global_step": 113378, "epoch": 2699} {"train_loss": -6.562071800231934, "global_step": 113379, "epoch": 2699} {"train_loss": -6.410637855529785, "global_step": 113380, "epoch": 2699} {"train_loss": -6.514866352081299, "global_step": 113381, "epoch": 2699} {"train_loss": -6.436676979064941, "global_step": 113382, "epoch": 2699} {"train_loss": -6.4675493240356445, "global_step": 113383, "epoch": 2699} {"train_loss": -6.50951623916626, "global_step": 113384, "epoch": 2699} {"train_loss": -6.398787498474121, "global_step": 113385, "epoch": 2699} {"train_loss": -6.495064735412598, "global_step": 113386, "epoch": 2699} {"train_loss": -6.414464950561523, "global_step": 113387, "epoch": 2699} {"train_loss": -6.449832916259766, "global_step": 113388, "epoch": 2699} {"train_loss": -6.556515216827393, "global_step": 113389, "epoch": 2699} {"train_loss": -6.5071868896484375, "global_step": 113390, "epoch": 2699} {"train_loss": -6.602975845336914, "global_step": 113391, "epoch": 2699} {"train_loss": -6.504890441894531, "global_step": 113392, "epoch": 2699} {"train_loss": -6.596071243286133, "global_step": 113393, "epoch": 2699} {"train_loss": -6.556693077087402, "global_step": 113394, "epoch": 2699} {"train_loss": -6.49620246887207, "global_step": 113395, "epoch": 2699} {"train_loss": -6.42502498626709, "global_step": 113396, "epoch": 2699} {"train_loss": -6.446207046508789, "global_step": 113397, "epoch": 2699} {"train_loss": -6.495279312133789, "global_step": 113398, "epoch": 2699} {"train_loss": -6.49048722357977, "global_step": 113399, "epoch": 2699, "val_loss": 76406.8203125} {"train_loss": -6.481534004211426, "global_step": 113400, "epoch": 2700} {"train_loss": -6.4810028076171875, "global_step": 113401, "epoch": 2700} {"train_loss": -6.508999347686768, "global_step": 113402, "epoch": 2700} {"train_loss": -6.4542999267578125, "global_step": 113403, "epoch": 2700} {"train_loss": -6.550819396972656, "global_step": 113404, "epoch": 2700} {"train_loss": -6.564363479614258, "global_step": 113405, "epoch": 2700} {"train_loss": -6.504853248596191, "global_step": 113406, "epoch": 2700} {"train_loss": -6.56393575668335, "global_step": 113407, "epoch": 2700} {"train_loss": -6.584392547607422, "global_step": 113408, "epoch": 2700} {"train_loss": -6.6212263107299805, "global_step": 113409, "epoch": 2700} {"train_loss": -6.580142974853516, "global_step": 113410, "epoch": 2700} {"train_loss": -6.506498336791992, "global_step": 113411, "epoch": 2700} {"train_loss": -6.449117660522461, "global_step": 113412, "epoch": 2700} {"train_loss": -6.542148113250732, "global_step": 113413, "epoch": 2700} {"train_loss": -6.456114768981934, "global_step": 113414, "epoch": 2700} {"train_loss": -6.59323263168335, "global_step": 113415, "epoch": 2700} {"train_loss": -6.528109073638916, "global_step": 113416, "epoch": 2700} {"train_loss": -6.572081089019775, "global_step": 113417, "epoch": 2700} {"train_loss": -6.588092803955078, "global_step": 113418, "epoch": 2700} {"train_loss": -6.493338584899902, "global_step": 113419, "epoch": 2700} {"train_loss": -6.637111663818359, "global_step": 113420, "epoch": 2700} {"train_loss": -6.544466495513916, "global_step": 113421, "epoch": 2700} {"train_loss": -6.635093688964844, "global_step": 113422, "epoch": 2700} {"train_loss": -6.51845645904541, "global_step": 113423, "epoch": 2700} {"train_loss": -6.403867244720459, "global_step": 113424, "epoch": 2700} {"train_loss": -6.588310241699219, "global_step": 113425, "epoch": 2700} {"train_loss": -6.480983734130859, "global_step": 113426, "epoch": 2700} {"train_loss": -6.544322490692139, "global_step": 113427, "epoch": 2700} {"train_loss": -6.5321364402771, "global_step": 113428, "epoch": 2700} {"train_loss": -6.502907752990723, "global_step": 113429, "epoch": 2700} {"train_loss": -6.576986312866211, "global_step": 113430, "epoch": 2700} {"train_loss": -6.5272393226623535, "global_step": 113431, "epoch": 2700} {"train_loss": -6.570873737335205, "global_step": 113432, "epoch": 2700} {"train_loss": -6.531961441040039, "global_step": 113433, "epoch": 2700} {"train_loss": -6.5748491287231445, "global_step": 113434, "epoch": 2700} {"train_loss": -6.391419410705566, "global_step": 113435, "epoch": 2700} {"train_loss": -6.4268798828125, "global_step": 113436, "epoch": 2700} {"train_loss": -6.4670891761779785, "global_step": 113437, "epoch": 2700} {"train_loss": -6.501111030578613, "global_step": 113438, "epoch": 2700} {"train_loss": -6.6106462478637695, "global_step": 113439, "epoch": 2700} {"train_loss": -6.506963729858398, "global_step": 113440, "epoch": 2700} {"train_loss": -6.529546635491507, "global_step": 113441, "epoch": 2700, "train/sim_max_reward_0": 0.40898631567313076, "train/sim_max_reward_1": 0.920628656298571, "train/sim_max_reward_2": 0.36178355297653514, "train/sim_max_reward_3": 0.11420651036125681, "train/sim_max_reward_4": 0.3007633196363414, "train/sim_max_reward_5": 0.8522823307776798, "test/sim_max_reward_4500000": 0.7260102496812884, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9714847664934525, "test/sim_max_reward_4500003": 0.8357955777531267, "test/sim_max_reward_4500004": 0.13921345409371239, "test/sim_max_reward_4500005": 0.26767524957053995, "test/sim_max_reward_4500006": 0.9572207965283718, "test/sim_max_reward_4500007": 0.8875508981562961, "test/sim_max_reward_4500008": 0.20686287060930758, "test/sim_max_reward_4500009": 0.05350619099653216, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9284474766074524, "test/sim_max_reward_4500012": 0.9298797308815114, "test/sim_max_reward_4500013": 0.013416465297712187, "test/sim_max_reward_4500014": 0.44836051465398175, "test/sim_max_reward_4500015": 0.9104160943758508, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.06682964894568638, "test/sim_max_reward_4500018": 0.4206620464602372, "test/sim_max_reward_4500019": 0.39496762743265895, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.7281432953931749, "test/sim_max_reward_4500022": 0.950840511735787, "test/sim_max_reward_4500023": 0.9352550882784373, "test/sim_max_reward_4500024": 0.4611861148386608, "test/sim_max_reward_4500025": 0.9035117766568823, "test/sim_max_reward_4500026": 0.3876288500392829, "test/sim_max_reward_4500027": 0.9980989774980942, "test/sim_max_reward_4500028": 0.19749323326543444, "test/sim_max_reward_4500029": 0.1108905413260223, "test/sim_max_reward_4500030": 0.9527170661521364, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.22307992646313993, "test/sim_max_reward_4500034": 0.09647048468721944, "test/sim_max_reward_4500035": 0.933437082282406, "test/sim_max_reward_4500036": 0.4058530038430891, "test/sim_max_reward_4500037": 0.9491266749059701, "test/sim_max_reward_4500038": 0.31163718217122127, "test/sim_max_reward_4500039": 0.9909648535871037, "test/sim_max_reward_4500040": 0.9460793970690632, "test/sim_max_reward_4500041": 0.761279975505245, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.48449348793496017, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9772456208472221, "test/sim_max_reward_4500046": 0.7233365603487784, "test/sim_max_reward_4500047": 0.9772910866566876, "test/sim_max_reward_4500048": 0.9104929998247902, "test/sim_max_reward_4500049": 0.024719416909944433, "train/mean_score": 0.4931084476205858, "test/mean_score": 0.5112725303194243, "val_loss": 76739.1640625} {"train_loss": -6.529030799865723, "global_step": 113442, "epoch": 2701} {"train_loss": -6.585669040679932, "global_step": 113443, "epoch": 2701} {"train_loss": -6.384438514709473, "global_step": 113444, "epoch": 2701} {"train_loss": -6.49009895324707, "global_step": 113445, "epoch": 2701} {"train_loss": -6.456149101257324, "global_step": 113446, "epoch": 2701} {"train_loss": -6.539313316345215, "global_step": 113447, "epoch": 2701} {"train_loss": -6.468021392822266, "global_step": 113448, "epoch": 2701} {"train_loss": -6.510890007019043, "global_step": 113449, "epoch": 2701} {"train_loss": -6.6159491539001465, "global_step": 113450, "epoch": 2701} {"train_loss": -6.585301399230957, "global_step": 113451, "epoch": 2701} {"train_loss": -6.496286392211914, "global_step": 113452, "epoch": 2701} {"train_loss": -6.5226545333862305, "global_step": 113453, "epoch": 2701} {"train_loss": -6.501382827758789, "global_step": 113454, "epoch": 2701} {"train_loss": -6.590083122253418, "global_step": 113455, "epoch": 2701} {"train_loss": -6.536726951599121, "global_step": 113456, "epoch": 2701} {"train_loss": -6.465911865234375, "global_step": 113457, "epoch": 2701} {"train_loss": -6.500885486602783, "global_step": 113458, "epoch": 2701} {"train_loss": -6.5323638916015625, "global_step": 113459, "epoch": 2701} {"train_loss": -6.389472007751465, "global_step": 113460, "epoch": 2701} {"train_loss": -6.436578750610352, "global_step": 113461, "epoch": 2701} {"train_loss": -6.543450355529785, "global_step": 113462, "epoch": 2701} {"train_loss": -6.454688549041748, "global_step": 113463, "epoch": 2701} {"train_loss": -6.4743757247924805, "global_step": 113464, "epoch": 2701} {"train_loss": -6.599862098693848, "global_step": 113465, "epoch": 2701} {"train_loss": -6.431670188903809, "global_step": 113466, "epoch": 2701} {"train_loss": -6.353896617889404, "global_step": 113467, "epoch": 2701} {"train_loss": -6.382386684417725, "global_step": 113468, "epoch": 2701} {"train_loss": -6.383249282836914, "global_step": 113469, "epoch": 2701} {"train_loss": -6.673242568969727, "global_step": 113470, "epoch": 2701} {"train_loss": -6.3394975662231445, "global_step": 113471, "epoch": 2701} {"train_loss": -6.461691379547119, "global_step": 113472, "epoch": 2701} {"train_loss": -6.5252838134765625, "global_step": 113473, "epoch": 2701} {"train_loss": -6.385862350463867, "global_step": 113474, "epoch": 2701} {"train_loss": -6.46169376373291, "global_step": 113475, "epoch": 2701} {"train_loss": -6.472089767456055, "global_step": 113476, "epoch": 2701} {"train_loss": -6.540140628814697, "global_step": 113477, "epoch": 2701} {"train_loss": -6.468741416931152, "global_step": 113478, "epoch": 2701} {"train_loss": -6.596550941467285, "global_step": 113479, "epoch": 2701} {"train_loss": -6.597994804382324, "global_step": 113480, "epoch": 2701} {"train_loss": -6.530671119689941, "global_step": 113481, "epoch": 2701} {"train_loss": -6.431502342224121, "global_step": 113482, "epoch": 2701} {"train_loss": -6.4942774432046075, "global_step": 113483, "epoch": 2701, "val_loss": 76430.6328125} {"train_loss": -6.45778226852417, "global_step": 113484, "epoch": 2702} {"train_loss": -6.536836624145508, "global_step": 113485, "epoch": 2702} {"train_loss": -6.490719318389893, "global_step": 113486, "epoch": 2702} {"train_loss": -6.455339431762695, "global_step": 113487, "epoch": 2702} {"train_loss": -6.533236026763916, "global_step": 113488, "epoch": 2702} {"train_loss": -6.518043518066406, "global_step": 113489, "epoch": 2702} {"train_loss": -6.48008918762207, "global_step": 113490, "epoch": 2702} {"train_loss": -6.489239692687988, "global_step": 113491, "epoch": 2702} {"train_loss": -6.597129821777344, "global_step": 113492, "epoch": 2702} {"train_loss": -6.598217487335205, "global_step": 113493, "epoch": 2702} {"train_loss": -6.509614944458008, "global_step": 113494, "epoch": 2702} {"train_loss": -6.388756275177002, "global_step": 113495, "epoch": 2702} {"train_loss": -6.422022342681885, "global_step": 113496, "epoch": 2702} {"train_loss": -6.582329750061035, "global_step": 113497, "epoch": 2702} {"train_loss": -6.4591779708862305, "global_step": 113498, "epoch": 2702} {"train_loss": -6.54691743850708, "global_step": 113499, "epoch": 2702} {"train_loss": -6.502760887145996, "global_step": 113500, "epoch": 2702} {"train_loss": -6.581602096557617, "global_step": 113501, "epoch": 2702} {"train_loss": -6.570347785949707, "global_step": 113502, "epoch": 2702} {"train_loss": -6.426985263824463, "global_step": 113503, "epoch": 2702} {"train_loss": -6.516526222229004, "global_step": 113504, "epoch": 2702} {"train_loss": -6.469537258148193, "global_step": 113505, "epoch": 2702} {"train_loss": -6.496064186096191, "global_step": 113506, "epoch": 2702} {"train_loss": -6.471168518066406, "global_step": 113507, "epoch": 2702} {"train_loss": -6.612802028656006, "global_step": 113508, "epoch": 2702} {"train_loss": -6.442943572998047, "global_step": 113509, "epoch": 2702} {"train_loss": -6.439372539520264, "global_step": 113510, "epoch": 2702} {"train_loss": -6.463513374328613, "global_step": 113511, "epoch": 2702} {"train_loss": -6.517505645751953, "global_step": 113512, "epoch": 2702} {"train_loss": -6.545144081115723, "global_step": 113513, "epoch": 2702} {"train_loss": -6.542888164520264, "global_step": 113514, "epoch": 2702} {"train_loss": -6.570969104766846, "global_step": 113515, "epoch": 2702} {"train_loss": -6.572275161743164, "global_step": 113516, "epoch": 2702} {"train_loss": -6.5456132888793945, "global_step": 113517, "epoch": 2702} {"train_loss": -6.626739025115967, "global_step": 113518, "epoch": 2702} {"train_loss": -6.516371726989746, "global_step": 113519, "epoch": 2702} {"train_loss": -6.537928581237793, "global_step": 113520, "epoch": 2702} {"train_loss": -6.582245349884033, "global_step": 113521, "epoch": 2702} {"train_loss": -6.596981048583984, "global_step": 113522, "epoch": 2702} {"train_loss": -6.648930072784424, "global_step": 113523, "epoch": 2702} {"train_loss": -6.53389835357666, "global_step": 113524, "epoch": 2702} {"train_loss": -6.522204274222965, "global_step": 113525, "epoch": 2702, "val_loss": 76457.2421875} {"train_loss": -6.653825759887695, "global_step": 113526, "epoch": 2703} {"train_loss": -6.519833564758301, "global_step": 113527, "epoch": 2703} {"train_loss": -6.460930824279785, "global_step": 113528, "epoch": 2703} {"train_loss": -6.411952495574951, "global_step": 113529, "epoch": 2703} {"train_loss": -6.6046648025512695, "global_step": 113530, "epoch": 2703} {"train_loss": -6.455426216125488, "global_step": 113531, "epoch": 2703} {"train_loss": -6.580626010894775, "global_step": 113532, "epoch": 2703} {"train_loss": -6.550775051116943, "global_step": 113533, "epoch": 2703} {"train_loss": -6.570362567901611, "global_step": 113534, "epoch": 2703} {"train_loss": -6.455199718475342, "global_step": 113535, "epoch": 2703} {"train_loss": -6.357476234436035, "global_step": 113536, "epoch": 2703} {"train_loss": -6.509887218475342, "global_step": 113537, "epoch": 2703} {"train_loss": -6.536995887756348, "global_step": 113538, "epoch": 2703} {"train_loss": -6.507373809814453, "global_step": 113539, "epoch": 2703} {"train_loss": -6.598299980163574, "global_step": 113540, "epoch": 2703} {"train_loss": -6.599599361419678, "global_step": 113541, "epoch": 2703} {"train_loss": -6.489790439605713, "global_step": 113542, "epoch": 2703} {"train_loss": -6.589814186096191, "global_step": 113543, "epoch": 2703} {"train_loss": -6.4141387939453125, "global_step": 113544, "epoch": 2703} {"train_loss": -6.484417915344238, "global_step": 113545, "epoch": 2703} {"train_loss": -6.592750549316406, "global_step": 113546, "epoch": 2703} {"train_loss": -6.454716205596924, "global_step": 113547, "epoch": 2703} {"train_loss": -6.479630947113037, "global_step": 113548, "epoch": 2703} {"train_loss": -6.381466865539551, "global_step": 113549, "epoch": 2703} {"train_loss": -6.4756951332092285, "global_step": 113550, "epoch": 2703} {"train_loss": -6.320050239562988, "global_step": 113551, "epoch": 2703} {"train_loss": -6.397409915924072, "global_step": 113552, "epoch": 2703} {"train_loss": -6.407113075256348, "global_step": 113553, "epoch": 2703} {"train_loss": -6.441090106964111, "global_step": 113554, "epoch": 2703} {"train_loss": -6.623598575592041, "global_step": 113555, "epoch": 2703} {"train_loss": -6.487674713134766, "global_step": 113556, "epoch": 2703} {"train_loss": -6.417263984680176, "global_step": 113557, "epoch": 2703} {"train_loss": -6.401019096374512, "global_step": 113558, "epoch": 2703} {"train_loss": -6.508631706237793, "global_step": 113559, "epoch": 2703} {"train_loss": -6.508477687835693, "global_step": 113560, "epoch": 2703} {"train_loss": -6.538585186004639, "global_step": 113561, "epoch": 2703} {"train_loss": -6.465451240539551, "global_step": 113562, "epoch": 2703} {"train_loss": -6.509195327758789, "global_step": 113563, "epoch": 2703} {"train_loss": -6.467967987060547, "global_step": 113564, "epoch": 2703} {"train_loss": -6.437078475952148, "global_step": 113565, "epoch": 2703} {"train_loss": -6.53438138961792, "global_step": 113566, "epoch": 2703} {"train_loss": -6.493664979934692, "global_step": 113567, "epoch": 2703, "val_loss": 76636.9921875} {"train_loss": -6.435982704162598, "global_step": 113568, "epoch": 2704} {"train_loss": -6.48335075378418, "global_step": 113569, "epoch": 2704} {"train_loss": -6.58707332611084, "global_step": 113570, "epoch": 2704} {"train_loss": -6.399387359619141, "global_step": 113571, "epoch": 2704} {"train_loss": -6.478830337524414, "global_step": 113572, "epoch": 2704} {"train_loss": -6.433022499084473, "global_step": 113573, "epoch": 2704} {"train_loss": -6.304524898529053, "global_step": 113574, "epoch": 2704} {"train_loss": -6.518730640411377, "global_step": 113575, "epoch": 2704} {"train_loss": -6.6206183433532715, "global_step": 113576, "epoch": 2704} {"train_loss": -6.47274112701416, "global_step": 113577, "epoch": 2704} {"train_loss": -6.511053085327148, "global_step": 113578, "epoch": 2704} {"train_loss": -6.419748306274414, "global_step": 113579, "epoch": 2704} {"train_loss": -6.5482025146484375, "global_step": 113580, "epoch": 2704} {"train_loss": -6.644808292388916, "global_step": 113581, "epoch": 2704} {"train_loss": -6.552360534667969, "global_step": 113582, "epoch": 2704} {"train_loss": -6.552804470062256, "global_step": 113583, "epoch": 2704} {"train_loss": -6.574787139892578, "global_step": 113584, "epoch": 2704} {"train_loss": -6.5375847816467285, "global_step": 113585, "epoch": 2704} {"train_loss": -6.477228164672852, "global_step": 113586, "epoch": 2704} {"train_loss": -6.497979164123535, "global_step": 113587, "epoch": 2704} {"train_loss": -6.422857761383057, "global_step": 113588, "epoch": 2704} {"train_loss": -6.4754462242126465, "global_step": 113589, "epoch": 2704} {"train_loss": -6.448551177978516, "global_step": 113590, "epoch": 2704} {"train_loss": -6.51179313659668, "global_step": 113591, "epoch": 2704} {"train_loss": -6.523473262786865, "global_step": 113592, "epoch": 2704} {"train_loss": -6.498813629150391, "global_step": 113593, "epoch": 2704} {"train_loss": -6.460668563842773, "global_step": 113594, "epoch": 2704} {"train_loss": -6.479650497436523, "global_step": 113595, "epoch": 2704} {"train_loss": -6.483038902282715, "global_step": 113596, "epoch": 2704} {"train_loss": -6.4225006103515625, "global_step": 113597, "epoch": 2704} {"train_loss": -6.336886882781982, "global_step": 113598, "epoch": 2704} {"train_loss": -6.382399559020996, "global_step": 113599, "epoch": 2704} {"train_loss": -6.2337327003479, "global_step": 113600, "epoch": 2704} {"train_loss": -6.431925296783447, "global_step": 113601, "epoch": 2704} {"train_loss": -6.292620658874512, "global_step": 113602, "epoch": 2704} {"train_loss": -6.323456764221191, "global_step": 113603, "epoch": 2704} {"train_loss": -6.311245918273926, "global_step": 113604, "epoch": 2704} {"train_loss": -6.448831081390381, "global_step": 113605, "epoch": 2704} {"train_loss": -6.376558780670166, "global_step": 113606, "epoch": 2704} {"train_loss": -6.619055271148682, "global_step": 113607, "epoch": 2704} {"train_loss": -6.383771896362305, "global_step": 113608, "epoch": 2704} {"train_loss": -6.461002236320859, "global_step": 113609, "epoch": 2704, "val_loss": 76539.484375} {"train_loss": -6.475595474243164, "global_step": 113610, "epoch": 2705} {"train_loss": -6.380252838134766, "global_step": 113611, "epoch": 2705} {"train_loss": -6.551706314086914, "global_step": 113612, "epoch": 2705} {"train_loss": -6.498291492462158, "global_step": 113613, "epoch": 2705} {"train_loss": -6.493011474609375, "global_step": 113614, "epoch": 2705} {"train_loss": -6.520336151123047, "global_step": 113615, "epoch": 2705} {"train_loss": -6.499129772186279, "global_step": 113616, "epoch": 2705} {"train_loss": -6.524088382720947, "global_step": 113617, "epoch": 2705} {"train_loss": -6.3628339767456055, "global_step": 113618, "epoch": 2705} {"train_loss": -6.465254783630371, "global_step": 113619, "epoch": 2705} {"train_loss": -6.5064377784729, "global_step": 113620, "epoch": 2705} {"train_loss": -6.567919731140137, "global_step": 113621, "epoch": 2705} {"train_loss": -6.420639991760254, "global_step": 113622, "epoch": 2705} {"train_loss": -6.470445156097412, "global_step": 113623, "epoch": 2705} {"train_loss": -6.451811790466309, "global_step": 113624, "epoch": 2705} {"train_loss": -6.493495941162109, "global_step": 113625, "epoch": 2705} {"train_loss": -6.39078950881958, "global_step": 113626, "epoch": 2705} {"train_loss": -6.5359697341918945, "global_step": 113627, "epoch": 2705} {"train_loss": -6.465580463409424, "global_step": 113628, "epoch": 2705} {"train_loss": -6.4052228927612305, "global_step": 113629, "epoch": 2705} {"train_loss": -6.4416656494140625, "global_step": 113630, "epoch": 2705} {"train_loss": -6.315649032592773, "global_step": 113631, "epoch": 2705} {"train_loss": -6.501770496368408, "global_step": 113632, "epoch": 2705} {"train_loss": -6.3418803215026855, "global_step": 113633, "epoch": 2705} {"train_loss": -6.410329818725586, "global_step": 113634, "epoch": 2705} {"train_loss": -6.46607780456543, "global_step": 113635, "epoch": 2705} {"train_loss": -6.481929779052734, "global_step": 113636, "epoch": 2705} {"train_loss": -6.551687717437744, "global_step": 113637, "epoch": 2705} {"train_loss": -6.522874355316162, "global_step": 113638, "epoch": 2705} {"train_loss": -6.497104167938232, "global_step": 113639, "epoch": 2705} {"train_loss": -6.51534366607666, "global_step": 113640, "epoch": 2705} {"train_loss": -6.496592044830322, "global_step": 113641, "epoch": 2705} {"train_loss": -6.430322647094727, "global_step": 113642, "epoch": 2705} {"train_loss": -6.350874900817871, "global_step": 113643, "epoch": 2705} {"train_loss": -6.485968589782715, "global_step": 113644, "epoch": 2705} {"train_loss": -6.4819793701171875, "global_step": 113645, "epoch": 2705} {"train_loss": -6.513055801391602, "global_step": 113646, "epoch": 2705} {"train_loss": -6.536085605621338, "global_step": 113647, "epoch": 2705} {"train_loss": -6.45604133605957, "global_step": 113648, "epoch": 2705} {"train_loss": -6.462821006774902, "global_step": 113649, "epoch": 2705} {"train_loss": -6.541635036468506, "global_step": 113650, "epoch": 2705} {"train_loss": -6.471745979218256, "global_step": 113651, "epoch": 2705, "val_loss": 76404.859375} {"train_loss": -6.506601810455322, "global_step": 113652, "epoch": 2706} {"train_loss": -6.430538177490234, "global_step": 113653, "epoch": 2706} {"train_loss": -6.442121505737305, "global_step": 113654, "epoch": 2706} {"train_loss": -6.478324890136719, "global_step": 113655, "epoch": 2706} {"train_loss": -6.550756454467773, "global_step": 113656, "epoch": 2706} {"train_loss": -6.453945159912109, "global_step": 113657, "epoch": 2706} {"train_loss": -6.523022651672363, "global_step": 113658, "epoch": 2706} {"train_loss": -6.591902256011963, "global_step": 113659, "epoch": 2706} {"train_loss": -6.458132743835449, "global_step": 113660, "epoch": 2706} {"train_loss": -6.411759376525879, "global_step": 113661, "epoch": 2706} {"train_loss": -6.58137845993042, "global_step": 113662, "epoch": 2706} {"train_loss": -6.573631286621094, "global_step": 113663, "epoch": 2706} {"train_loss": -6.573677062988281, "global_step": 113664, "epoch": 2706} {"train_loss": -6.593618392944336, "global_step": 113665, "epoch": 2706} {"train_loss": -6.449472427368164, "global_step": 113666, "epoch": 2706} {"train_loss": -6.453990936279297, "global_step": 113667, "epoch": 2706} {"train_loss": -6.433905601501465, "global_step": 113668, "epoch": 2706} {"train_loss": -6.627627849578857, "global_step": 113669, "epoch": 2706} {"train_loss": -6.41874885559082, "global_step": 113670, "epoch": 2706} {"train_loss": -6.511547088623047, "global_step": 113671, "epoch": 2706} {"train_loss": -6.452450752258301, "global_step": 113672, "epoch": 2706} {"train_loss": -6.421839714050293, "global_step": 113673, "epoch": 2706} {"train_loss": -6.360102653503418, "global_step": 113674, "epoch": 2706} {"train_loss": -6.396422386169434, "global_step": 113675, "epoch": 2706} {"train_loss": -6.543790340423584, "global_step": 113676, "epoch": 2706} {"train_loss": -6.444864273071289, "global_step": 113677, "epoch": 2706} {"train_loss": -6.379037857055664, "global_step": 113678, "epoch": 2706} {"train_loss": -6.446272850036621, "global_step": 113679, "epoch": 2706} {"train_loss": -6.364394187927246, "global_step": 113680, "epoch": 2706} {"train_loss": -6.374758720397949, "global_step": 113681, "epoch": 2706} {"train_loss": -6.466602325439453, "global_step": 113682, "epoch": 2706} {"train_loss": -6.439697265625, "global_step": 113683, "epoch": 2706} {"train_loss": -6.481498718261719, "global_step": 113684, "epoch": 2706} {"train_loss": -6.4978413581848145, "global_step": 113685, "epoch": 2706} {"train_loss": -6.542445182800293, "global_step": 113686, "epoch": 2706} {"train_loss": -6.3814215660095215, "global_step": 113687, "epoch": 2706} {"train_loss": -6.458991050720215, "global_step": 113688, "epoch": 2706} {"train_loss": -6.357786655426025, "global_step": 113689, "epoch": 2706} {"train_loss": -6.449874401092529, "global_step": 113690, "epoch": 2706} {"train_loss": -6.498440742492676, "global_step": 113691, "epoch": 2706} {"train_loss": -6.321547031402588, "global_step": 113692, "epoch": 2706} {"train_loss": -6.46810279573713, "global_step": 113693, "epoch": 2706, "val_loss": 76928.65625} {"train_loss": -6.385695457458496, "global_step": 113694, "epoch": 2707} {"train_loss": -6.392494201660156, "global_step": 113695, "epoch": 2707} {"train_loss": -6.49088716506958, "global_step": 113696, "epoch": 2707} {"train_loss": -6.356624603271484, "global_step": 113697, "epoch": 2707} {"train_loss": -6.501045227050781, "global_step": 113698, "epoch": 2707} {"train_loss": -6.517856597900391, "global_step": 113699, "epoch": 2707} {"train_loss": -6.476827621459961, "global_step": 113700, "epoch": 2707} {"train_loss": -6.452258586883545, "global_step": 113701, "epoch": 2707} {"train_loss": -6.355983734130859, "global_step": 113702, "epoch": 2707} {"train_loss": -6.455658912658691, "global_step": 113703, "epoch": 2707} {"train_loss": -6.505857944488525, "global_step": 113704, "epoch": 2707} {"train_loss": -6.434381008148193, "global_step": 113705, "epoch": 2707} {"train_loss": -6.402789115905762, "global_step": 113706, "epoch": 2707} {"train_loss": -6.370110034942627, "global_step": 113707, "epoch": 2707} {"train_loss": -6.5321736335754395, "global_step": 113708, "epoch": 2707} {"train_loss": -6.364518165588379, "global_step": 113709, "epoch": 2707} {"train_loss": -6.455389499664307, "global_step": 113710, "epoch": 2707} {"train_loss": -6.416926383972168, "global_step": 113711, "epoch": 2707} {"train_loss": -6.43263053894043, "global_step": 113712, "epoch": 2707} {"train_loss": -6.335957050323486, "global_step": 113713, "epoch": 2707} {"train_loss": -6.476418495178223, "global_step": 113714, "epoch": 2707} {"train_loss": -6.522936820983887, "global_step": 113715, "epoch": 2707} {"train_loss": -6.407478332519531, "global_step": 113716, "epoch": 2707} {"train_loss": -6.5112762451171875, "global_step": 113717, "epoch": 2707} {"train_loss": -6.294627666473389, "global_step": 113718, "epoch": 2707} {"train_loss": -6.417089462280273, "global_step": 113719, "epoch": 2707} {"train_loss": -6.341192245483398, "global_step": 113720, "epoch": 2707} {"train_loss": -6.487219333648682, "global_step": 113721, "epoch": 2707} {"train_loss": -6.455854415893555, "global_step": 113722, "epoch": 2707} {"train_loss": -6.485251426696777, "global_step": 113723, "epoch": 2707} {"train_loss": -6.482810020446777, "global_step": 113724, "epoch": 2707} {"train_loss": -6.318720817565918, "global_step": 113725, "epoch": 2707} {"train_loss": -6.4680376052856445, "global_step": 113726, "epoch": 2707} {"train_loss": -6.392639636993408, "global_step": 113727, "epoch": 2707} {"train_loss": -6.545586585998535, "global_step": 113728, "epoch": 2707} {"train_loss": -6.356698989868164, "global_step": 113729, "epoch": 2707} {"train_loss": -6.545661449432373, "global_step": 113730, "epoch": 2707} {"train_loss": -6.342125415802002, "global_step": 113731, "epoch": 2707} {"train_loss": -6.449333190917969, "global_step": 113732, "epoch": 2707} {"train_loss": -6.414244174957275, "global_step": 113733, "epoch": 2707} {"train_loss": -6.485490798950195, "global_step": 113734, "epoch": 2707} {"train_loss": -6.435925347464425, "global_step": 113735, "epoch": 2707, "val_loss": 76365.953125} {"train_loss": -6.514639377593994, "global_step": 113736, "epoch": 2708} {"train_loss": -6.533808708190918, "global_step": 113737, "epoch": 2708} {"train_loss": -6.482166767120361, "global_step": 113738, "epoch": 2708} {"train_loss": -6.459928512573242, "global_step": 113739, "epoch": 2708} {"train_loss": -6.5748443603515625, "global_step": 113740, "epoch": 2708} {"train_loss": -6.488781929016113, "global_step": 113741, "epoch": 2708} {"train_loss": -6.396108627319336, "global_step": 113742, "epoch": 2708} {"train_loss": -6.463902473449707, "global_step": 113743, "epoch": 2708} {"train_loss": -6.53086519241333, "global_step": 113744, "epoch": 2708} {"train_loss": -6.410027980804443, "global_step": 113745, "epoch": 2708} {"train_loss": -6.4741058349609375, "global_step": 113746, "epoch": 2708} {"train_loss": -6.516750335693359, "global_step": 113747, "epoch": 2708} {"train_loss": -6.467230319976807, "global_step": 113748, "epoch": 2708} {"train_loss": -6.439145088195801, "global_step": 113749, "epoch": 2708} {"train_loss": -6.540571212768555, "global_step": 113750, "epoch": 2708} {"train_loss": -6.503673076629639, "global_step": 113751, "epoch": 2708} {"train_loss": -6.436433792114258, "global_step": 113752, "epoch": 2708} {"train_loss": -6.418299674987793, "global_step": 113753, "epoch": 2708} {"train_loss": -6.442791938781738, "global_step": 113754, "epoch": 2708} {"train_loss": -6.397516250610352, "global_step": 113755, "epoch": 2708} {"train_loss": -6.434113025665283, "global_step": 113756, "epoch": 2708} {"train_loss": -6.537887096405029, "global_step": 113757, "epoch": 2708} {"train_loss": -6.485713958740234, "global_step": 113758, "epoch": 2708} {"train_loss": -6.581161975860596, "global_step": 113759, "epoch": 2708} {"train_loss": -6.459176540374756, "global_step": 113760, "epoch": 2708} {"train_loss": -6.53032112121582, "global_step": 113761, "epoch": 2708} {"train_loss": -6.402334213256836, "global_step": 113762, "epoch": 2708} {"train_loss": -6.498140811920166, "global_step": 113763, "epoch": 2708} {"train_loss": -6.427104949951172, "global_step": 113764, "epoch": 2708} {"train_loss": -6.379301071166992, "global_step": 113765, "epoch": 2708} {"train_loss": -6.453776836395264, "global_step": 113766, "epoch": 2708} {"train_loss": -6.369711875915527, "global_step": 113767, "epoch": 2708} {"train_loss": -6.502148151397705, "global_step": 113768, "epoch": 2708} {"train_loss": -6.578363418579102, "global_step": 113769, "epoch": 2708} {"train_loss": -6.4758830070495605, "global_step": 113770, "epoch": 2708} {"train_loss": -6.501079082489014, "global_step": 113771, "epoch": 2708} {"train_loss": -6.604132652282715, "global_step": 113772, "epoch": 2708} {"train_loss": -6.552145004272461, "global_step": 113773, "epoch": 2708} {"train_loss": -6.516679286956787, "global_step": 113774, "epoch": 2708} {"train_loss": -6.6169891357421875, "global_step": 113775, "epoch": 2708} {"train_loss": -6.504438400268555, "global_step": 113776, "epoch": 2708} {"train_loss": -6.488915432067144, "global_step": 113777, "epoch": 2708, "val_loss": 76396.6875} {"train_loss": -6.471207141876221, "global_step": 113778, "epoch": 2709} {"train_loss": -6.535215377807617, "global_step": 113779, "epoch": 2709} {"train_loss": -6.528553009033203, "global_step": 113780, "epoch": 2709} {"train_loss": -6.494633197784424, "global_step": 113781, "epoch": 2709} {"train_loss": -6.570047855377197, "global_step": 113782, "epoch": 2709} {"train_loss": -6.504251956939697, "global_step": 113783, "epoch": 2709} {"train_loss": -6.657247543334961, "global_step": 113784, "epoch": 2709} {"train_loss": -6.463827133178711, "global_step": 113785, "epoch": 2709} {"train_loss": -6.470470428466797, "global_step": 113786, "epoch": 2709} {"train_loss": -6.527803421020508, "global_step": 113787, "epoch": 2709} {"train_loss": -6.551929473876953, "global_step": 113788, "epoch": 2709} {"train_loss": -6.458332061767578, "global_step": 113789, "epoch": 2709} {"train_loss": -6.5167741775512695, "global_step": 113790, "epoch": 2709} {"train_loss": -6.3881096839904785, "global_step": 113791, "epoch": 2709} {"train_loss": -6.425802230834961, "global_step": 113792, "epoch": 2709} {"train_loss": -6.478766918182373, "global_step": 113793, "epoch": 2709} {"train_loss": -6.491962432861328, "global_step": 113794, "epoch": 2709} {"train_loss": -6.539245128631592, "global_step": 113795, "epoch": 2709} {"train_loss": -6.61761474609375, "global_step": 113796, "epoch": 2709} {"train_loss": -6.582130432128906, "global_step": 113797, "epoch": 2709} {"train_loss": -6.520359039306641, "global_step": 113798, "epoch": 2709} {"train_loss": -6.505700588226318, "global_step": 113799, "epoch": 2709} {"train_loss": -6.594608306884766, "global_step": 113800, "epoch": 2709} {"train_loss": -6.464447975158691, "global_step": 113801, "epoch": 2709} {"train_loss": -6.661484241485596, "global_step": 113802, "epoch": 2709} {"train_loss": -6.5560302734375, "global_step": 113803, "epoch": 2709} {"train_loss": -6.434466361999512, "global_step": 113804, "epoch": 2709} {"train_loss": -6.565059661865234, "global_step": 113805, "epoch": 2709} {"train_loss": -6.441682815551758, "global_step": 113806, "epoch": 2709} {"train_loss": -6.468949794769287, "global_step": 113807, "epoch": 2709} {"train_loss": -6.581395149230957, "global_step": 113808, "epoch": 2709} {"train_loss": -6.4543657302856445, "global_step": 113809, "epoch": 2709} {"train_loss": -6.482246398925781, "global_step": 113810, "epoch": 2709} {"train_loss": -6.567206382751465, "global_step": 113811, "epoch": 2709} {"train_loss": -6.513884544372559, "global_step": 113812, "epoch": 2709} {"train_loss": -6.616765975952148, "global_step": 113813, "epoch": 2709} {"train_loss": -6.560297966003418, "global_step": 113814, "epoch": 2709} {"train_loss": -6.653097629547119, "global_step": 113815, "epoch": 2709} {"train_loss": -6.529348373413086, "global_step": 113816, "epoch": 2709} {"train_loss": -6.533133506774902, "global_step": 113817, "epoch": 2709} {"train_loss": -6.412908554077148, "global_step": 113818, "epoch": 2709} {"train_loss": -6.52236008644104, "global_step": 113819, "epoch": 2709, "val_loss": 76243.0546875} {"train_loss": -6.491864204406738, "global_step": 113820, "epoch": 2710} {"train_loss": -6.556634426116943, "global_step": 113821, "epoch": 2710} {"train_loss": -6.474292755126953, "global_step": 113822, "epoch": 2710} {"train_loss": -6.460466384887695, "global_step": 113823, "epoch": 2710} {"train_loss": -6.461115837097168, "global_step": 113824, "epoch": 2710} {"train_loss": -6.452472686767578, "global_step": 113825, "epoch": 2710} {"train_loss": -6.567840099334717, "global_step": 113826, "epoch": 2710} {"train_loss": -6.483543872833252, "global_step": 113827, "epoch": 2710} {"train_loss": -6.461434841156006, "global_step": 113828, "epoch": 2710} {"train_loss": -6.523914337158203, "global_step": 113829, "epoch": 2710} {"train_loss": -6.563620567321777, "global_step": 113830, "epoch": 2710} {"train_loss": -6.564452171325684, "global_step": 113831, "epoch": 2710} {"train_loss": -6.497348785400391, "global_step": 113832, "epoch": 2710} {"train_loss": -6.545237064361572, "global_step": 113833, "epoch": 2710} {"train_loss": -6.560213565826416, "global_step": 113834, "epoch": 2710} {"train_loss": -6.533275604248047, "global_step": 113835, "epoch": 2710} {"train_loss": -6.630539894104004, "global_step": 113836, "epoch": 2710} {"train_loss": -6.4234161376953125, "global_step": 113837, "epoch": 2710} {"train_loss": -6.5139617919921875, "global_step": 113838, "epoch": 2710} {"train_loss": -6.507976055145264, "global_step": 113839, "epoch": 2710} {"train_loss": -6.594821929931641, "global_step": 113840, "epoch": 2710} {"train_loss": -6.529536724090576, "global_step": 113841, "epoch": 2710} {"train_loss": -6.612931251525879, "global_step": 113842, "epoch": 2710} {"train_loss": -6.5111565589904785, "global_step": 113843, "epoch": 2710} {"train_loss": -6.482536315917969, "global_step": 113844, "epoch": 2710} {"train_loss": -6.6063666343688965, "global_step": 113845, "epoch": 2710} {"train_loss": -6.492622375488281, "global_step": 113846, "epoch": 2710} {"train_loss": -6.554148197174072, "global_step": 113847, "epoch": 2710} {"train_loss": -6.492489814758301, "global_step": 113848, "epoch": 2710} {"train_loss": -6.572412490844727, "global_step": 113849, "epoch": 2710} {"train_loss": -6.536783218383789, "global_step": 113850, "epoch": 2710} {"train_loss": -6.5705671310424805, "global_step": 113851, "epoch": 2710} {"train_loss": -6.461263656616211, "global_step": 113852, "epoch": 2710} {"train_loss": -6.475182056427002, "global_step": 113853, "epoch": 2710} {"train_loss": -6.496104717254639, "global_step": 113854, "epoch": 2710} {"train_loss": -6.5337371826171875, "global_step": 113855, "epoch": 2710} {"train_loss": -6.5233049392700195, "global_step": 113856, "epoch": 2710} {"train_loss": -6.590240478515625, "global_step": 113857, "epoch": 2710} {"train_loss": -6.489501953125, "global_step": 113858, "epoch": 2710} {"train_loss": -6.5962677001953125, "global_step": 113859, "epoch": 2710} {"train_loss": -6.455218315124512, "global_step": 113860, "epoch": 2710} {"train_loss": -6.520335072562808, "global_step": 113861, "epoch": 2710, "val_loss": 76501.34375} {"train_loss": -6.526284217834473, "global_step": 113862, "epoch": 2711} {"train_loss": -6.512604236602783, "global_step": 113863, "epoch": 2711} {"train_loss": -6.458101272583008, "global_step": 113864, "epoch": 2711} {"train_loss": -6.53286075592041, "global_step": 113865, "epoch": 2711} {"train_loss": -6.263844013214111, "global_step": 113866, "epoch": 2711} {"train_loss": -6.63014030456543, "global_step": 113867, "epoch": 2711} {"train_loss": -6.436058044433594, "global_step": 113868, "epoch": 2711} {"train_loss": -6.431384086608887, "global_step": 113869, "epoch": 2711} {"train_loss": -6.549718856811523, "global_step": 113870, "epoch": 2711} {"train_loss": -6.554159164428711, "global_step": 113871, "epoch": 2711} {"train_loss": -6.467879295349121, "global_step": 113872, "epoch": 2711} {"train_loss": -6.550009250640869, "global_step": 113873, "epoch": 2711} {"train_loss": -6.546647071838379, "global_step": 113874, "epoch": 2711} {"train_loss": -6.558067798614502, "global_step": 113875, "epoch": 2711} {"train_loss": -6.4654154777526855, "global_step": 113876, "epoch": 2711} {"train_loss": -6.447303771972656, "global_step": 113877, "epoch": 2711} {"train_loss": -6.5287346839904785, "global_step": 113878, "epoch": 2711} {"train_loss": -6.395792007446289, "global_step": 113879, "epoch": 2711} {"train_loss": -6.605879783630371, "global_step": 113880, "epoch": 2711} {"train_loss": -6.479397773742676, "global_step": 113881, "epoch": 2711} {"train_loss": -6.487152099609375, "global_step": 113882, "epoch": 2711} {"train_loss": -6.58037805557251, "global_step": 113883, "epoch": 2711} {"train_loss": -6.4545698165893555, "global_step": 113884, "epoch": 2711} {"train_loss": -6.534967422485352, "global_step": 113885, "epoch": 2711} {"train_loss": -6.4555158615112305, "global_step": 113886, "epoch": 2711} {"train_loss": -6.40717887878418, "global_step": 113887, "epoch": 2711} {"train_loss": -6.506270408630371, "global_step": 113888, "epoch": 2711} {"train_loss": -6.4887237548828125, "global_step": 113889, "epoch": 2711} {"train_loss": -6.606139659881592, "global_step": 113890, "epoch": 2711} {"train_loss": -6.6239776611328125, "global_step": 113891, "epoch": 2711} {"train_loss": -6.582080364227295, "global_step": 113892, "epoch": 2711} {"train_loss": -6.578540802001953, "global_step": 113893, "epoch": 2711} {"train_loss": -6.590121269226074, "global_step": 113894, "epoch": 2711} {"train_loss": -6.4526166915893555, "global_step": 113895, "epoch": 2711} {"train_loss": -6.6185994148254395, "global_step": 113896, "epoch": 2711} {"train_loss": -6.516755104064941, "global_step": 113897, "epoch": 2711} {"train_loss": -6.5041184425354, "global_step": 113898, "epoch": 2711} {"train_loss": -6.578561782836914, "global_step": 113899, "epoch": 2711} {"train_loss": -6.48940372467041, "global_step": 113900, "epoch": 2711} {"train_loss": -6.361398696899414, "global_step": 113901, "epoch": 2711} {"train_loss": -6.51697301864624, "global_step": 113902, "epoch": 2711} {"train_loss": -6.506441865648542, "global_step": 113903, "epoch": 2711, "val_loss": 76854.828125} {"train_loss": -6.4184889793396, "global_step": 113904, "epoch": 2712} {"train_loss": -6.5787458419799805, "global_step": 113905, "epoch": 2712} {"train_loss": -6.472987651824951, "global_step": 113906, "epoch": 2712} {"train_loss": -6.391661167144775, "global_step": 113907, "epoch": 2712} {"train_loss": -6.554385185241699, "global_step": 113908, "epoch": 2712} {"train_loss": -6.281350135803223, "global_step": 113909, "epoch": 2712} {"train_loss": -6.445937156677246, "global_step": 113910, "epoch": 2712} {"train_loss": -6.54957389831543, "global_step": 113911, "epoch": 2712} {"train_loss": -6.288683891296387, "global_step": 113912, "epoch": 2712} {"train_loss": -6.555578708648682, "global_step": 113913, "epoch": 2712} {"train_loss": -6.4146199226379395, "global_step": 113914, "epoch": 2712} {"train_loss": -6.377551555633545, "global_step": 113915, "epoch": 2712} {"train_loss": -6.394972801208496, "global_step": 113916, "epoch": 2712} {"train_loss": -6.48072624206543, "global_step": 113917, "epoch": 2712} {"train_loss": -6.414593696594238, "global_step": 113918, "epoch": 2712} {"train_loss": -6.508998870849609, "global_step": 113919, "epoch": 2712} {"train_loss": -6.474020004272461, "global_step": 113920, "epoch": 2712} {"train_loss": -6.488669395446777, "global_step": 113921, "epoch": 2712} {"train_loss": -6.553591251373291, "global_step": 113922, "epoch": 2712} {"train_loss": -6.387380599975586, "global_step": 113923, "epoch": 2712} {"train_loss": -6.500457286834717, "global_step": 113924, "epoch": 2712} {"train_loss": -6.517810821533203, "global_step": 113925, "epoch": 2712} {"train_loss": -6.5046844482421875, "global_step": 113926, "epoch": 2712} {"train_loss": -6.521242141723633, "global_step": 113927, "epoch": 2712} {"train_loss": -6.4612579345703125, "global_step": 113928, "epoch": 2712} {"train_loss": -6.5068888664245605, "global_step": 113929, "epoch": 2712} {"train_loss": -6.485466957092285, "global_step": 113930, "epoch": 2712} {"train_loss": -6.551210403442383, "global_step": 113931, "epoch": 2712} {"train_loss": -6.503398418426514, "global_step": 113932, "epoch": 2712} {"train_loss": -6.504066467285156, "global_step": 113933, "epoch": 2712} {"train_loss": -6.491076469421387, "global_step": 113934, "epoch": 2712} {"train_loss": -6.4194512367248535, "global_step": 113935, "epoch": 2712} {"train_loss": -6.574048042297363, "global_step": 113936, "epoch": 2712} {"train_loss": -6.4771528244018555, "global_step": 113937, "epoch": 2712} {"train_loss": -6.537055015563965, "global_step": 113938, "epoch": 2712} {"train_loss": -6.451377868652344, "global_step": 113939, "epoch": 2712} {"train_loss": -6.443550109863281, "global_step": 113940, "epoch": 2712} {"train_loss": -6.3523969650268555, "global_step": 113941, "epoch": 2712} {"train_loss": -6.358417987823486, "global_step": 113942, "epoch": 2712} {"train_loss": -6.483330726623535, "global_step": 113943, "epoch": 2712} {"train_loss": -6.454198837280273, "global_step": 113944, "epoch": 2712} {"train_loss": -6.468057666506086, "global_step": 113945, "epoch": 2712, "val_loss": 76501.1484375} {"train_loss": -6.57048225402832, "global_step": 113946, "epoch": 2713} {"train_loss": -6.530910491943359, "global_step": 113947, "epoch": 2713} {"train_loss": -6.47135066986084, "global_step": 113948, "epoch": 2713} {"train_loss": -6.499468803405762, "global_step": 113949, "epoch": 2713} {"train_loss": -6.464417457580566, "global_step": 113950, "epoch": 2713} {"train_loss": -6.447400093078613, "global_step": 113951, "epoch": 2713} {"train_loss": -6.491085052490234, "global_step": 113952, "epoch": 2713} {"train_loss": -6.416913986206055, "global_step": 113953, "epoch": 2713} {"train_loss": -6.448064804077148, "global_step": 113954, "epoch": 2713} {"train_loss": -6.4567551612854, "global_step": 113955, "epoch": 2713} {"train_loss": -6.57293701171875, "global_step": 113956, "epoch": 2713} {"train_loss": -6.488265037536621, "global_step": 113957, "epoch": 2713} {"train_loss": -6.414070129394531, "global_step": 113958, "epoch": 2713} {"train_loss": -6.451835632324219, "global_step": 113959, "epoch": 2713} {"train_loss": -6.56743049621582, "global_step": 113960, "epoch": 2713} {"train_loss": -6.450934410095215, "global_step": 113961, "epoch": 2713} {"train_loss": -6.550381660461426, "global_step": 113962, "epoch": 2713} {"train_loss": -6.495014667510986, "global_step": 113963, "epoch": 2713} {"train_loss": -6.374902725219727, "global_step": 113964, "epoch": 2713} {"train_loss": -6.516702175140381, "global_step": 113965, "epoch": 2713} {"train_loss": -6.607987403869629, "global_step": 113966, "epoch": 2713} {"train_loss": -6.585075855255127, "global_step": 113967, "epoch": 2713} {"train_loss": -6.523674011230469, "global_step": 113968, "epoch": 2713} {"train_loss": -6.562402248382568, "global_step": 113969, "epoch": 2713} {"train_loss": -6.536301612854004, "global_step": 113970, "epoch": 2713} {"train_loss": -6.423974514007568, "global_step": 113971, "epoch": 2713} {"train_loss": -6.447800159454346, "global_step": 113972, "epoch": 2713} {"train_loss": -6.542875289916992, "global_step": 113973, "epoch": 2713} {"train_loss": -6.488471984863281, "global_step": 113974, "epoch": 2713} {"train_loss": -6.59705924987793, "global_step": 113975, "epoch": 2713} {"train_loss": -6.498662948608398, "global_step": 113976, "epoch": 2713} {"train_loss": -6.562281131744385, "global_step": 113977, "epoch": 2713} {"train_loss": -6.498518943786621, "global_step": 113978, "epoch": 2713} {"train_loss": -6.591655731201172, "global_step": 113979, "epoch": 2713} {"train_loss": -6.625473976135254, "global_step": 113980, "epoch": 2713} {"train_loss": -6.48026180267334, "global_step": 113981, "epoch": 2713} {"train_loss": -6.485445976257324, "global_step": 113982, "epoch": 2713} {"train_loss": -6.358126640319824, "global_step": 113983, "epoch": 2713} {"train_loss": -6.377760410308838, "global_step": 113984, "epoch": 2713} {"train_loss": -6.470400810241699, "global_step": 113985, "epoch": 2713} {"train_loss": -6.466198921203613, "global_step": 113986, "epoch": 2713} {"train_loss": -6.495325020381382, "global_step": 113987, "epoch": 2713, "val_loss": 76466.421875} {"train_loss": -6.424445152282715, "global_step": 113988, "epoch": 2714} {"train_loss": -6.556856155395508, "global_step": 113989, "epoch": 2714} {"train_loss": -6.502002239227295, "global_step": 113990, "epoch": 2714} {"train_loss": -6.437920570373535, "global_step": 113991, "epoch": 2714} {"train_loss": -6.516950607299805, "global_step": 113992, "epoch": 2714} {"train_loss": -6.536362648010254, "global_step": 113993, "epoch": 2714} {"train_loss": -6.5975189208984375, "global_step": 113994, "epoch": 2714} {"train_loss": -6.405953407287598, "global_step": 113995, "epoch": 2714} {"train_loss": -6.450300216674805, "global_step": 113996, "epoch": 2714} {"train_loss": -6.503994941711426, "global_step": 113997, "epoch": 2714} {"train_loss": -6.407205104827881, "global_step": 113998, "epoch": 2714} {"train_loss": -6.5709333419799805, "global_step": 113999, "epoch": 2714} {"train_loss": -6.573826789855957, "global_step": 114000, "epoch": 2714} {"train_loss": -6.4475998878479, "global_step": 114001, "epoch": 2714} {"train_loss": -6.427563667297363, "global_step": 114002, "epoch": 2714} {"train_loss": -6.364798545837402, "global_step": 114003, "epoch": 2714} {"train_loss": -6.532785892486572, "global_step": 114004, "epoch": 2714} {"train_loss": -6.576794624328613, "global_step": 114005, "epoch": 2714} {"train_loss": -6.543112754821777, "global_step": 114006, "epoch": 2714} {"train_loss": -6.427404880523682, "global_step": 114007, "epoch": 2714} {"train_loss": -6.536509037017822, "global_step": 114008, "epoch": 2714} {"train_loss": -6.545384883880615, "global_step": 114009, "epoch": 2714} {"train_loss": -6.521714210510254, "global_step": 114010, "epoch": 2714} {"train_loss": -6.424466133117676, "global_step": 114011, "epoch": 2714} {"train_loss": -6.453484535217285, "global_step": 114012, "epoch": 2714} {"train_loss": -6.559296131134033, "global_step": 114013, "epoch": 2714} {"train_loss": -6.4546589851379395, "global_step": 114014, "epoch": 2714} {"train_loss": -6.454838752746582, "global_step": 114015, "epoch": 2714} {"train_loss": -6.322749137878418, "global_step": 114016, "epoch": 2714} {"train_loss": -6.455842971801758, "global_step": 114017, "epoch": 2714} {"train_loss": -6.639534950256348, "global_step": 114018, "epoch": 2714} {"train_loss": -6.613007545471191, "global_step": 114019, "epoch": 2714} {"train_loss": -6.438878059387207, "global_step": 114020, "epoch": 2714} {"train_loss": -6.542972564697266, "global_step": 114021, "epoch": 2714} {"train_loss": -6.432255268096924, "global_step": 114022, "epoch": 2714} {"train_loss": -6.276247024536133, "global_step": 114023, "epoch": 2714} {"train_loss": -6.595118522644043, "global_step": 114024, "epoch": 2714} {"train_loss": -6.460968971252441, "global_step": 114025, "epoch": 2714} {"train_loss": -6.457047462463379, "global_step": 114026, "epoch": 2714} {"train_loss": -6.479623317718506, "global_step": 114027, "epoch": 2714} {"train_loss": -6.5207672119140625, "global_step": 114028, "epoch": 2714} {"train_loss": -6.483534245263963, "global_step": 114029, "epoch": 2714, "val_loss": 76447.1015625} {"train_loss": -6.538161277770996, "global_step": 114030, "epoch": 2715} {"train_loss": -6.534908771514893, "global_step": 114031, "epoch": 2715} {"train_loss": -6.630003929138184, "global_step": 114032, "epoch": 2715} {"train_loss": -6.487014293670654, "global_step": 114033, "epoch": 2715} {"train_loss": -6.4937944412231445, "global_step": 114034, "epoch": 2715} {"train_loss": -6.51737642288208, "global_step": 114035, "epoch": 2715} {"train_loss": -6.498014450073242, "global_step": 114036, "epoch": 2715} {"train_loss": -6.535462379455566, "global_step": 114037, "epoch": 2715} {"train_loss": -6.494121551513672, "global_step": 114038, "epoch": 2715} {"train_loss": -6.427338123321533, "global_step": 114039, "epoch": 2715} {"train_loss": -6.466133117675781, "global_step": 114040, "epoch": 2715} {"train_loss": -6.432002067565918, "global_step": 114041, "epoch": 2715} {"train_loss": -6.497833728790283, "global_step": 114042, "epoch": 2715} {"train_loss": -6.54495096206665, "global_step": 114043, "epoch": 2715} {"train_loss": -6.3982834815979, "global_step": 114044, "epoch": 2715} {"train_loss": -6.463461875915527, "global_step": 114045, "epoch": 2715} {"train_loss": -6.370863914489746, "global_step": 114046, "epoch": 2715} {"train_loss": -6.481097221374512, "global_step": 114047, "epoch": 2715} {"train_loss": -6.394612789154053, "global_step": 114048, "epoch": 2715} {"train_loss": -6.621124744415283, "global_step": 114049, "epoch": 2715} {"train_loss": -6.556321620941162, "global_step": 114050, "epoch": 2715} {"train_loss": -6.4375715255737305, "global_step": 114051, "epoch": 2715} {"train_loss": -6.53105354309082, "global_step": 114052, "epoch": 2715} {"train_loss": -6.5360283851623535, "global_step": 114053, "epoch": 2715} {"train_loss": -6.46992301940918, "global_step": 114054, "epoch": 2715} {"train_loss": -6.490412712097168, "global_step": 114055, "epoch": 2715} {"train_loss": -6.609925270080566, "global_step": 114056, "epoch": 2715} {"train_loss": -6.5679931640625, "global_step": 114057, "epoch": 2715} {"train_loss": -6.539326190948486, "global_step": 114058, "epoch": 2715} {"train_loss": -6.489290714263916, "global_step": 114059, "epoch": 2715} {"train_loss": -6.502669334411621, "global_step": 114060, "epoch": 2715} {"train_loss": -6.564709186553955, "global_step": 114061, "epoch": 2715} {"train_loss": -6.530435562133789, "global_step": 114062, "epoch": 2715} {"train_loss": -6.583852767944336, "global_step": 114063, "epoch": 2715} {"train_loss": -6.498407363891602, "global_step": 114064, "epoch": 2715} {"train_loss": -6.39639949798584, "global_step": 114065, "epoch": 2715} {"train_loss": -6.56248140335083, "global_step": 114066, "epoch": 2715} {"train_loss": -6.603086948394775, "global_step": 114067, "epoch": 2715} {"train_loss": -6.4680280685424805, "global_step": 114068, "epoch": 2715} {"train_loss": -6.449146270751953, "global_step": 114069, "epoch": 2715} {"train_loss": -6.478584289550781, "global_step": 114070, "epoch": 2715} {"train_loss": -6.5047665777660555, "global_step": 114071, "epoch": 2715, "val_loss": 76455.7421875} {"train_loss": -6.650845527648926, "global_step": 114072, "epoch": 2716} {"train_loss": -6.503392219543457, "global_step": 114073, "epoch": 2716} {"train_loss": -6.519222259521484, "global_step": 114074, "epoch": 2716} {"train_loss": -6.632939338684082, "global_step": 114075, "epoch": 2716} {"train_loss": -6.557178497314453, "global_step": 114076, "epoch": 2716} {"train_loss": -6.413196086883545, "global_step": 114077, "epoch": 2716} {"train_loss": -6.4656782150268555, "global_step": 114078, "epoch": 2716} {"train_loss": -6.479744911193848, "global_step": 114079, "epoch": 2716} {"train_loss": -6.535200119018555, "global_step": 114080, "epoch": 2716} {"train_loss": -6.492690086364746, "global_step": 114081, "epoch": 2716} {"train_loss": -6.624913215637207, "global_step": 114082, "epoch": 2716} {"train_loss": -6.453255653381348, "global_step": 114083, "epoch": 2716} {"train_loss": -6.5771026611328125, "global_step": 114084, "epoch": 2716} {"train_loss": -6.540613174438477, "global_step": 114085, "epoch": 2716} {"train_loss": -6.517030715942383, "global_step": 114086, "epoch": 2716} {"train_loss": -6.534769058227539, "global_step": 114087, "epoch": 2716} {"train_loss": -6.604915618896484, "global_step": 114088, "epoch": 2716} {"train_loss": -6.435489654541016, "global_step": 114089, "epoch": 2716} {"train_loss": -6.568987846374512, "global_step": 114090, "epoch": 2716} {"train_loss": -6.53756046295166, "global_step": 114091, "epoch": 2716} {"train_loss": -6.422581672668457, "global_step": 114092, "epoch": 2716} {"train_loss": -6.466269493103027, "global_step": 114093, "epoch": 2716} {"train_loss": -6.47377872467041, "global_step": 114094, "epoch": 2716} {"train_loss": -6.535985946655273, "global_step": 114095, "epoch": 2716} {"train_loss": -6.441385269165039, "global_step": 114096, "epoch": 2716} {"train_loss": -6.510248184204102, "global_step": 114097, "epoch": 2716} {"train_loss": -6.588680267333984, "global_step": 114098, "epoch": 2716} {"train_loss": -6.511329650878906, "global_step": 114099, "epoch": 2716} {"train_loss": -6.424161911010742, "global_step": 114100, "epoch": 2716} {"train_loss": -6.567522048950195, "global_step": 114101, "epoch": 2716} {"train_loss": -6.537106990814209, "global_step": 114102, "epoch": 2716} {"train_loss": -6.568164825439453, "global_step": 114103, "epoch": 2716} {"train_loss": -6.603408336639404, "global_step": 114104, "epoch": 2716} {"train_loss": -6.588413715362549, "global_step": 114105, "epoch": 2716} {"train_loss": -6.565566539764404, "global_step": 114106, "epoch": 2716} {"train_loss": -6.484066963195801, "global_step": 114107, "epoch": 2716} {"train_loss": -6.581687927246094, "global_step": 114108, "epoch": 2716} {"train_loss": -6.601048469543457, "global_step": 114109, "epoch": 2716} {"train_loss": -6.549117088317871, "global_step": 114110, "epoch": 2716} {"train_loss": -6.485621452331543, "global_step": 114111, "epoch": 2716} {"train_loss": -6.413475036621094, "global_step": 114112, "epoch": 2716} {"train_loss": -6.5263986473991755, "global_step": 114113, "epoch": 2716, "val_loss": 76462.359375} {"train_loss": -6.439176559448242, "global_step": 114114, "epoch": 2717} {"train_loss": -6.460992813110352, "global_step": 114115, "epoch": 2717} {"train_loss": -6.479533672332764, "global_step": 114116, "epoch": 2717} {"train_loss": -6.54667329788208, "global_step": 114117, "epoch": 2717} {"train_loss": -6.49018669128418, "global_step": 114118, "epoch": 2717} {"train_loss": -6.547468185424805, "global_step": 114119, "epoch": 2717} {"train_loss": -6.538275718688965, "global_step": 114120, "epoch": 2717} {"train_loss": -6.441836357116699, "global_step": 114121, "epoch": 2717} {"train_loss": -6.481540679931641, "global_step": 114122, "epoch": 2717} {"train_loss": -6.548429489135742, "global_step": 114123, "epoch": 2717} {"train_loss": -6.5124688148498535, "global_step": 114124, "epoch": 2717} {"train_loss": -6.5104756355285645, "global_step": 114125, "epoch": 2717} {"train_loss": -6.618806838989258, "global_step": 114126, "epoch": 2717} {"train_loss": -6.419643402099609, "global_step": 114127, "epoch": 2717} {"train_loss": -6.522878646850586, "global_step": 114128, "epoch": 2717} {"train_loss": -6.528197288513184, "global_step": 114129, "epoch": 2717} {"train_loss": -6.573590278625488, "global_step": 114130, "epoch": 2717} {"train_loss": -6.42119026184082, "global_step": 114131, "epoch": 2717} {"train_loss": -6.6255292892456055, "global_step": 114132, "epoch": 2717} {"train_loss": -6.568941116333008, "global_step": 114133, "epoch": 2717} {"train_loss": -6.600470066070557, "global_step": 114134, "epoch": 2717} {"train_loss": -6.488251686096191, "global_step": 114135, "epoch": 2717} {"train_loss": -6.4514665603637695, "global_step": 114136, "epoch": 2717} {"train_loss": -6.525224685668945, "global_step": 114137, "epoch": 2717} {"train_loss": -6.578978538513184, "global_step": 114138, "epoch": 2717} {"train_loss": -6.4359612464904785, "global_step": 114139, "epoch": 2717} {"train_loss": -6.487712383270264, "global_step": 114140, "epoch": 2717} {"train_loss": -6.536995887756348, "global_step": 114141, "epoch": 2717} {"train_loss": -6.549822807312012, "global_step": 114142, "epoch": 2717} {"train_loss": -6.435904502868652, "global_step": 114143, "epoch": 2717} {"train_loss": -6.463744163513184, "global_step": 114144, "epoch": 2717} {"train_loss": -6.4160943031311035, "global_step": 114145, "epoch": 2717} {"train_loss": -6.463902950286865, "global_step": 114146, "epoch": 2717} {"train_loss": -6.492763519287109, "global_step": 114147, "epoch": 2717} {"train_loss": -6.487317085266113, "global_step": 114148, "epoch": 2717} {"train_loss": -6.492461681365967, "global_step": 114149, "epoch": 2717} {"train_loss": -6.464927673339844, "global_step": 114150, "epoch": 2717} {"train_loss": -6.450567245483398, "global_step": 114151, "epoch": 2717} {"train_loss": -6.411993980407715, "global_step": 114152, "epoch": 2717} {"train_loss": -6.450466632843018, "global_step": 114153, "epoch": 2717} {"train_loss": -6.582036972045898, "global_step": 114154, "epoch": 2717} {"train_loss": -6.499638954798381, "global_step": 114155, "epoch": 2717, "val_loss": 76589.0625} {"train_loss": -6.256905555725098, "global_step": 114156, "epoch": 2718} {"train_loss": -6.439535140991211, "global_step": 114157, "epoch": 2718} {"train_loss": -6.318353652954102, "global_step": 114158, "epoch": 2718} {"train_loss": -6.526551246643066, "global_step": 114159, "epoch": 2718} {"train_loss": -6.370917797088623, "global_step": 114160, "epoch": 2718} {"train_loss": -6.464646816253662, "global_step": 114161, "epoch": 2718} {"train_loss": -6.33106803894043, "global_step": 114162, "epoch": 2718} {"train_loss": -6.4852800369262695, "global_step": 114163, "epoch": 2718} {"train_loss": -6.461957931518555, "global_step": 114164, "epoch": 2718} {"train_loss": -6.496426105499268, "global_step": 114165, "epoch": 2718} {"train_loss": -6.3762617111206055, "global_step": 114166, "epoch": 2718} {"train_loss": -6.5260114669799805, "global_step": 114167, "epoch": 2718} {"train_loss": -6.4008469581604, "global_step": 114168, "epoch": 2718} {"train_loss": -6.356475830078125, "global_step": 114169, "epoch": 2718} {"train_loss": -6.4369797706604, "global_step": 114170, "epoch": 2718} {"train_loss": -6.4526472091674805, "global_step": 114171, "epoch": 2718} {"train_loss": -6.428147315979004, "global_step": 114172, "epoch": 2718} {"train_loss": -6.471130847930908, "global_step": 114173, "epoch": 2718} {"train_loss": -6.522272109985352, "global_step": 114174, "epoch": 2718} {"train_loss": -6.502682685852051, "global_step": 114175, "epoch": 2718} {"train_loss": -6.4389753341674805, "global_step": 114176, "epoch": 2718} {"train_loss": -6.4643144607543945, "global_step": 114177, "epoch": 2718} {"train_loss": -6.530799865722656, "global_step": 114178, "epoch": 2718} {"train_loss": -6.549861907958984, "global_step": 114179, "epoch": 2718} {"train_loss": -6.438206672668457, "global_step": 114180, "epoch": 2718} {"train_loss": -6.362095832824707, "global_step": 114181, "epoch": 2718} {"train_loss": -6.525638580322266, "global_step": 114182, "epoch": 2718} {"train_loss": -6.459641933441162, "global_step": 114183, "epoch": 2718} {"train_loss": -6.452167510986328, "global_step": 114184, "epoch": 2718} {"train_loss": -6.459551811218262, "global_step": 114185, "epoch": 2718} {"train_loss": -6.541728496551514, "global_step": 114186, "epoch": 2718} {"train_loss": -6.491277694702148, "global_step": 114187, "epoch": 2718} {"train_loss": -6.528500556945801, "global_step": 114188, "epoch": 2718} {"train_loss": -6.537110805511475, "global_step": 114189, "epoch": 2718} {"train_loss": -6.556406497955322, "global_step": 114190, "epoch": 2718} {"train_loss": -6.362274169921875, "global_step": 114191, "epoch": 2718} {"train_loss": -6.473126411437988, "global_step": 114192, "epoch": 2718} {"train_loss": -6.527354717254639, "global_step": 114193, "epoch": 2718} {"train_loss": -6.531711578369141, "global_step": 114194, "epoch": 2718} {"train_loss": -6.479193210601807, "global_step": 114195, "epoch": 2718} {"train_loss": -6.465187072753906, "global_step": 114196, "epoch": 2718} {"train_loss": -6.45753136135283, "global_step": 114197, "epoch": 2718, "val_loss": 76253.0546875} {"train_loss": -6.592940807342529, "global_step": 114198, "epoch": 2719} {"train_loss": -6.3826904296875, "global_step": 114199, "epoch": 2719} {"train_loss": -6.537278652191162, "global_step": 114200, "epoch": 2719} {"train_loss": -6.523818016052246, "global_step": 114201, "epoch": 2719} {"train_loss": -6.408387184143066, "global_step": 114202, "epoch": 2719} {"train_loss": -6.53022575378418, "global_step": 114203, "epoch": 2719} {"train_loss": -6.5478925704956055, "global_step": 114204, "epoch": 2719} {"train_loss": -6.546065330505371, "global_step": 114205, "epoch": 2719} {"train_loss": -6.478612899780273, "global_step": 114206, "epoch": 2719} {"train_loss": -6.341278553009033, "global_step": 114207, "epoch": 2719} {"train_loss": -6.491768836975098, "global_step": 114208, "epoch": 2719} {"train_loss": -6.521443843841553, "global_step": 114209, "epoch": 2719} {"train_loss": -6.405584812164307, "global_step": 114210, "epoch": 2719} {"train_loss": -6.484003067016602, "global_step": 114211, "epoch": 2719} {"train_loss": -6.524541854858398, "global_step": 114212, "epoch": 2719} {"train_loss": -6.518291473388672, "global_step": 114213, "epoch": 2719} {"train_loss": -6.505769729614258, "global_step": 114214, "epoch": 2719} {"train_loss": -6.640320301055908, "global_step": 114215, "epoch": 2719} {"train_loss": -6.5421624183654785, "global_step": 114216, "epoch": 2719} {"train_loss": -6.583860397338867, "global_step": 114217, "epoch": 2719} {"train_loss": -6.575842380523682, "global_step": 114218, "epoch": 2719} {"train_loss": -6.529584884643555, "global_step": 114219, "epoch": 2719} {"train_loss": -6.610688209533691, "global_step": 114220, "epoch": 2719} {"train_loss": -6.480159759521484, "global_step": 114221, "epoch": 2719} {"train_loss": -6.488882541656494, "global_step": 114222, "epoch": 2719} {"train_loss": -6.459597110748291, "global_step": 114223, "epoch": 2719} {"train_loss": -6.4588518142700195, "global_step": 114224, "epoch": 2719} {"train_loss": -6.596290588378906, "global_step": 114225, "epoch": 2719} {"train_loss": -6.613978385925293, "global_step": 114226, "epoch": 2719} {"train_loss": -6.573302268981934, "global_step": 114227, "epoch": 2719} {"train_loss": -6.372621536254883, "global_step": 114228, "epoch": 2719} {"train_loss": -6.46437931060791, "global_step": 114229, "epoch": 2719} {"train_loss": -6.44453763961792, "global_step": 114230, "epoch": 2719} {"train_loss": -6.482424259185791, "global_step": 114231, "epoch": 2719} {"train_loss": -6.542288780212402, "global_step": 114232, "epoch": 2719} {"train_loss": -6.4519877433776855, "global_step": 114233, "epoch": 2719} {"train_loss": -6.611863613128662, "global_step": 114234, "epoch": 2719} {"train_loss": -6.4620771408081055, "global_step": 114235, "epoch": 2719} {"train_loss": -6.480181694030762, "global_step": 114236, "epoch": 2719} {"train_loss": -6.497515678405762, "global_step": 114237, "epoch": 2719} {"train_loss": -6.5906853675842285, "global_step": 114238, "epoch": 2719} {"train_loss": -6.509108815874372, "global_step": 114239, "epoch": 2719, "val_loss": 76456.328125} {"train_loss": -6.577190399169922, "global_step": 114240, "epoch": 2720} {"train_loss": -6.4929914474487305, "global_step": 114241, "epoch": 2720} {"train_loss": -6.561456680297852, "global_step": 114242, "epoch": 2720} {"train_loss": -6.654529094696045, "global_step": 114243, "epoch": 2720} {"train_loss": -6.466805458068848, "global_step": 114244, "epoch": 2720} {"train_loss": -6.557586669921875, "global_step": 114245, "epoch": 2720} {"train_loss": -6.533841133117676, "global_step": 114246, "epoch": 2720} {"train_loss": -6.451859474182129, "global_step": 114247, "epoch": 2720} {"train_loss": -6.452129364013672, "global_step": 114248, "epoch": 2720} {"train_loss": -6.462470054626465, "global_step": 114249, "epoch": 2720} {"train_loss": -6.555980682373047, "global_step": 114250, "epoch": 2720} {"train_loss": -6.588049411773682, "global_step": 114251, "epoch": 2720} {"train_loss": -6.550678253173828, "global_step": 114252, "epoch": 2720} {"train_loss": -6.570628643035889, "global_step": 114253, "epoch": 2720} {"train_loss": -6.504177093505859, "global_step": 114254, "epoch": 2720} {"train_loss": -6.5386786460876465, "global_step": 114255, "epoch": 2720} {"train_loss": -6.551014423370361, "global_step": 114256, "epoch": 2720} {"train_loss": -6.539149761199951, "global_step": 114257, "epoch": 2720} {"train_loss": -6.544247627258301, "global_step": 114258, "epoch": 2720} {"train_loss": -6.44485330581665, "global_step": 114259, "epoch": 2720} {"train_loss": -6.566941261291504, "global_step": 114260, "epoch": 2720} {"train_loss": -6.421448707580566, "global_step": 114261, "epoch": 2720} {"train_loss": -6.5263776779174805, "global_step": 114262, "epoch": 2720} {"train_loss": -6.576809883117676, "global_step": 114263, "epoch": 2720} {"train_loss": -6.480529308319092, "global_step": 114264, "epoch": 2720} {"train_loss": -6.6601409912109375, "global_step": 114265, "epoch": 2720} {"train_loss": -6.535701751708984, "global_step": 114266, "epoch": 2720} {"train_loss": -6.524637222290039, "global_step": 114267, "epoch": 2720} {"train_loss": -6.576591491699219, "global_step": 114268, "epoch": 2720} {"train_loss": -6.585427284240723, "global_step": 114269, "epoch": 2720} {"train_loss": -6.584364414215088, "global_step": 114270, "epoch": 2720} {"train_loss": -6.592522621154785, "global_step": 114271, "epoch": 2720} {"train_loss": -6.518638610839844, "global_step": 114272, "epoch": 2720} {"train_loss": -6.603803634643555, "global_step": 114273, "epoch": 2720} {"train_loss": -6.457306861877441, "global_step": 114274, "epoch": 2720} {"train_loss": -6.474464416503906, "global_step": 114275, "epoch": 2720} {"train_loss": -6.5716094970703125, "global_step": 114276, "epoch": 2720} {"train_loss": -6.520477294921875, "global_step": 114277, "epoch": 2720} {"train_loss": -6.427724361419678, "global_step": 114278, "epoch": 2720} {"train_loss": -6.572229385375977, "global_step": 114279, "epoch": 2720} {"train_loss": -6.495253562927246, "global_step": 114280, "epoch": 2720} {"train_loss": -6.530832018171038, "global_step": 114281, "epoch": 2720, "val_loss": 76654.3125} {"train_loss": -6.477625846862793, "global_step": 114282, "epoch": 2721} {"train_loss": -6.485559940338135, "global_step": 114283, "epoch": 2721} {"train_loss": -6.5660223960876465, "global_step": 114284, "epoch": 2721} {"train_loss": -6.56260871887207, "global_step": 114285, "epoch": 2721} {"train_loss": -6.485051155090332, "global_step": 114286, "epoch": 2721} {"train_loss": -6.381702423095703, "global_step": 114287, "epoch": 2721} {"train_loss": -6.4039459228515625, "global_step": 114288, "epoch": 2721} {"train_loss": -6.406698703765869, "global_step": 114289, "epoch": 2721} {"train_loss": -6.514740467071533, "global_step": 114290, "epoch": 2721} {"train_loss": -6.532327175140381, "global_step": 114291, "epoch": 2721} {"train_loss": -6.470425605773926, "global_step": 114292, "epoch": 2721} {"train_loss": -6.497137069702148, "global_step": 114293, "epoch": 2721} {"train_loss": -6.422356605529785, "global_step": 114294, "epoch": 2721} {"train_loss": -6.462131500244141, "global_step": 114295, "epoch": 2721} {"train_loss": -6.480072975158691, "global_step": 114296, "epoch": 2721} {"train_loss": -6.530211448669434, "global_step": 114297, "epoch": 2721} {"train_loss": -6.406981468200684, "global_step": 114298, "epoch": 2721} {"train_loss": -6.455035209655762, "global_step": 114299, "epoch": 2721} {"train_loss": -6.5438551902771, "global_step": 114300, "epoch": 2721} {"train_loss": -6.369951248168945, "global_step": 114301, "epoch": 2721} {"train_loss": -6.4907732009887695, "global_step": 114302, "epoch": 2721} {"train_loss": -6.379755020141602, "global_step": 114303, "epoch": 2721} {"train_loss": -6.435861587524414, "global_step": 114304, "epoch": 2721} {"train_loss": -6.450351715087891, "global_step": 114305, "epoch": 2721} {"train_loss": -6.455191612243652, "global_step": 114306, "epoch": 2721} {"train_loss": -6.4461822509765625, "global_step": 114307, "epoch": 2721} {"train_loss": -6.4398698806762695, "global_step": 114308, "epoch": 2721} {"train_loss": -6.472177505493164, "global_step": 114309, "epoch": 2721} {"train_loss": -6.4511189460754395, "global_step": 114310, "epoch": 2721} {"train_loss": -6.440357208251953, "global_step": 114311, "epoch": 2721} {"train_loss": -6.45721435546875, "global_step": 114312, "epoch": 2721} {"train_loss": -6.485963821411133, "global_step": 114313, "epoch": 2721} {"train_loss": -6.6115007400512695, "global_step": 114314, "epoch": 2721} {"train_loss": -6.418100357055664, "global_step": 114315, "epoch": 2721} {"train_loss": -6.511340141296387, "global_step": 114316, "epoch": 2721} {"train_loss": -6.563549995422363, "global_step": 114317, "epoch": 2721} {"train_loss": -6.551972389221191, "global_step": 114318, "epoch": 2721} {"train_loss": -6.49592399597168, "global_step": 114319, "epoch": 2721} {"train_loss": -6.483574867248535, "global_step": 114320, "epoch": 2721} {"train_loss": -6.595686912536621, "global_step": 114321, "epoch": 2721} {"train_loss": -6.4386677742004395, "global_step": 114322, "epoch": 2721} {"train_loss": -6.477223805018833, "global_step": 114323, "epoch": 2721, "val_loss": 76659.9921875} {"train_loss": -6.45146369934082, "global_step": 114324, "epoch": 2722} {"train_loss": -6.538402557373047, "global_step": 114325, "epoch": 2722} {"train_loss": -6.4828901290893555, "global_step": 114326, "epoch": 2722} {"train_loss": -6.524957180023193, "global_step": 114327, "epoch": 2722} {"train_loss": -6.569414138793945, "global_step": 114328, "epoch": 2722} {"train_loss": -6.5528717041015625, "global_step": 114329, "epoch": 2722} {"train_loss": -6.690378189086914, "global_step": 114330, "epoch": 2722} {"train_loss": -6.4857964515686035, "global_step": 114331, "epoch": 2722} {"train_loss": -6.526371955871582, "global_step": 114332, "epoch": 2722} {"train_loss": -6.438061714172363, "global_step": 114333, "epoch": 2722} {"train_loss": -6.608682155609131, "global_step": 114334, "epoch": 2722} {"train_loss": -6.571811199188232, "global_step": 114335, "epoch": 2722} {"train_loss": -6.59415340423584, "global_step": 114336, "epoch": 2722} {"train_loss": -6.466987609863281, "global_step": 114337, "epoch": 2722} {"train_loss": -6.615826606750488, "global_step": 114338, "epoch": 2722} {"train_loss": -6.557478427886963, "global_step": 114339, "epoch": 2722} {"train_loss": -6.39906120300293, "global_step": 114340, "epoch": 2722} {"train_loss": -6.5544328689575195, "global_step": 114341, "epoch": 2722} {"train_loss": -6.476747989654541, "global_step": 114342, "epoch": 2722} {"train_loss": -6.639278888702393, "global_step": 114343, "epoch": 2722} {"train_loss": -6.554347991943359, "global_step": 114344, "epoch": 2722} {"train_loss": -6.495081901550293, "global_step": 114345, "epoch": 2722} {"train_loss": -6.520545959472656, "global_step": 114346, "epoch": 2722} {"train_loss": -6.649837493896484, "global_step": 114347, "epoch": 2722} {"train_loss": -6.508616924285889, "global_step": 114348, "epoch": 2722} {"train_loss": -6.486014366149902, "global_step": 114349, "epoch": 2722} {"train_loss": -6.5160369873046875, "global_step": 114350, "epoch": 2722} {"train_loss": -6.5774335861206055, "global_step": 114351, "epoch": 2722} {"train_loss": -6.545052528381348, "global_step": 114352, "epoch": 2722} {"train_loss": -6.562979698181152, "global_step": 114353, "epoch": 2722} {"train_loss": -6.510934829711914, "global_step": 114354, "epoch": 2722} {"train_loss": -6.539162635803223, "global_step": 114355, "epoch": 2722} {"train_loss": -6.492868423461914, "global_step": 114356, "epoch": 2722} {"train_loss": -6.414822578430176, "global_step": 114357, "epoch": 2722} {"train_loss": -6.499041557312012, "global_step": 114358, "epoch": 2722} {"train_loss": -6.428622245788574, "global_step": 114359, "epoch": 2722} {"train_loss": -6.528655052185059, "global_step": 114360, "epoch": 2722} {"train_loss": -6.604998588562012, "global_step": 114361, "epoch": 2722} {"train_loss": -6.486997604370117, "global_step": 114362, "epoch": 2722} {"train_loss": -6.658034801483154, "global_step": 114363, "epoch": 2722} {"train_loss": -6.508450508117676, "global_step": 114364, "epoch": 2722} {"train_loss": -6.53366292090643, "global_step": 114365, "epoch": 2722, "val_loss": 76796.546875} {"train_loss": -6.505115985870361, "global_step": 114366, "epoch": 2723} {"train_loss": -6.438540458679199, "global_step": 114367, "epoch": 2723} {"train_loss": -6.508603096008301, "global_step": 114368, "epoch": 2723} {"train_loss": -6.4908342361450195, "global_step": 114369, "epoch": 2723} {"train_loss": -6.632651329040527, "global_step": 114370, "epoch": 2723} {"train_loss": -6.5180768966674805, "global_step": 114371, "epoch": 2723} {"train_loss": -6.5462965965271, "global_step": 114372, "epoch": 2723} {"train_loss": -6.4519853591918945, "global_step": 114373, "epoch": 2723} {"train_loss": -6.4431657791137695, "global_step": 114374, "epoch": 2723} {"train_loss": -6.601787090301514, "global_step": 114375, "epoch": 2723} {"train_loss": -6.470396995544434, "global_step": 114376, "epoch": 2723} {"train_loss": -6.43062162399292, "global_step": 114377, "epoch": 2723} {"train_loss": -6.567927837371826, "global_step": 114378, "epoch": 2723} {"train_loss": -6.378354549407959, "global_step": 114379, "epoch": 2723} {"train_loss": -6.578287124633789, "global_step": 114380, "epoch": 2723} {"train_loss": -6.544852256774902, "global_step": 114381, "epoch": 2723} {"train_loss": -6.506254196166992, "global_step": 114382, "epoch": 2723} {"train_loss": -6.597085952758789, "global_step": 114383, "epoch": 2723} {"train_loss": -6.585322380065918, "global_step": 114384, "epoch": 2723} {"train_loss": -6.583207607269287, "global_step": 114385, "epoch": 2723} {"train_loss": -6.52579927444458, "global_step": 114386, "epoch": 2723} {"train_loss": -6.402426719665527, "global_step": 114387, "epoch": 2723} {"train_loss": -6.6140360832214355, "global_step": 114388, "epoch": 2723} {"train_loss": -6.47780179977417, "global_step": 114389, "epoch": 2723} {"train_loss": -6.575981616973877, "global_step": 114390, "epoch": 2723} {"train_loss": -6.636946678161621, "global_step": 114391, "epoch": 2723} {"train_loss": -6.536627292633057, "global_step": 114392, "epoch": 2723} {"train_loss": -6.419818878173828, "global_step": 114393, "epoch": 2723} {"train_loss": -6.525523662567139, "global_step": 114394, "epoch": 2723} {"train_loss": -6.51731014251709, "global_step": 114395, "epoch": 2723} {"train_loss": -6.557925224304199, "global_step": 114396, "epoch": 2723} {"train_loss": -6.600572109222412, "global_step": 114397, "epoch": 2723} {"train_loss": -6.495776653289795, "global_step": 114398, "epoch": 2723} {"train_loss": -6.423282623291016, "global_step": 114399, "epoch": 2723} {"train_loss": -6.497801303863525, "global_step": 114400, "epoch": 2723} {"train_loss": -6.524020195007324, "global_step": 114401, "epoch": 2723} {"train_loss": -6.4208173751831055, "global_step": 114402, "epoch": 2723} {"train_loss": -6.4636430740356445, "global_step": 114403, "epoch": 2723} {"train_loss": -6.6044721603393555, "global_step": 114404, "epoch": 2723} {"train_loss": -6.407132625579834, "global_step": 114405, "epoch": 2723} {"train_loss": -6.429533004760742, "global_step": 114406, "epoch": 2723} {"train_loss": -6.51363528342474, "global_step": 114407, "epoch": 2723, "val_loss": 76520.296875} {"train_loss": -6.48761510848999, "global_step": 114408, "epoch": 2724} {"train_loss": -6.542152404785156, "global_step": 114409, "epoch": 2724} {"train_loss": -6.490929126739502, "global_step": 114410, "epoch": 2724} {"train_loss": -6.624196529388428, "global_step": 114411, "epoch": 2724} {"train_loss": -6.378637313842773, "global_step": 114412, "epoch": 2724} {"train_loss": -6.507408618927002, "global_step": 114413, "epoch": 2724} {"train_loss": -6.500842571258545, "global_step": 114414, "epoch": 2724} {"train_loss": -6.440831184387207, "global_step": 114415, "epoch": 2724} {"train_loss": -6.568886756896973, "global_step": 114416, "epoch": 2724} {"train_loss": -6.549346923828125, "global_step": 114417, "epoch": 2724} {"train_loss": -6.427382469177246, "global_step": 114418, "epoch": 2724} {"train_loss": -6.543787002563477, "global_step": 114419, "epoch": 2724} {"train_loss": -6.503284931182861, "global_step": 114420, "epoch": 2724} {"train_loss": -6.463649749755859, "global_step": 114421, "epoch": 2724} {"train_loss": -6.45136022567749, "global_step": 114422, "epoch": 2724} {"train_loss": -6.533329010009766, "global_step": 114423, "epoch": 2724} {"train_loss": -6.388771057128906, "global_step": 114424, "epoch": 2724} {"train_loss": -6.416090488433838, "global_step": 114425, "epoch": 2724} {"train_loss": -6.593419551849365, "global_step": 114426, "epoch": 2724} {"train_loss": -6.387576103210449, "global_step": 114427, "epoch": 2724} {"train_loss": -6.571874141693115, "global_step": 114428, "epoch": 2724} {"train_loss": -6.530669212341309, "global_step": 114429, "epoch": 2724} {"train_loss": -6.51202392578125, "global_step": 114430, "epoch": 2724} {"train_loss": -6.628109931945801, "global_step": 114431, "epoch": 2724} {"train_loss": -6.51973819732666, "global_step": 114432, "epoch": 2724} {"train_loss": -6.409763336181641, "global_step": 114433, "epoch": 2724} {"train_loss": -6.486527442932129, "global_step": 114434, "epoch": 2724} {"train_loss": -6.540502548217773, "global_step": 114435, "epoch": 2724} {"train_loss": -6.5821003913879395, "global_step": 114436, "epoch": 2724} {"train_loss": -6.40315055847168, "global_step": 114437, "epoch": 2724} {"train_loss": -6.425384521484375, "global_step": 114438, "epoch": 2724} {"train_loss": -6.54182243347168, "global_step": 114439, "epoch": 2724} {"train_loss": -6.469999313354492, "global_step": 114440, "epoch": 2724} {"train_loss": -6.547417640686035, "global_step": 114441, "epoch": 2724} {"train_loss": -6.488966941833496, "global_step": 114442, "epoch": 2724} {"train_loss": -6.550356864929199, "global_step": 114443, "epoch": 2724} {"train_loss": -6.435544013977051, "global_step": 114444, "epoch": 2724} {"train_loss": -6.486217498779297, "global_step": 114445, "epoch": 2724} {"train_loss": -6.5304365158081055, "global_step": 114446, "epoch": 2724} {"train_loss": -6.520049095153809, "global_step": 114447, "epoch": 2724} {"train_loss": -6.645720958709717, "global_step": 114448, "epoch": 2724} {"train_loss": -6.501364957718622, "global_step": 114449, "epoch": 2724, "val_loss": 76671.7109375} {"train_loss": -6.5736236572265625, "global_step": 114450, "epoch": 2725} {"train_loss": -6.4733076095581055, "global_step": 114451, "epoch": 2725} {"train_loss": -6.535345077514648, "global_step": 114452, "epoch": 2725} {"train_loss": -6.497366905212402, "global_step": 114453, "epoch": 2725} {"train_loss": -6.475329399108887, "global_step": 114454, "epoch": 2725} {"train_loss": -6.560918807983398, "global_step": 114455, "epoch": 2725} {"train_loss": -6.523627281188965, "global_step": 114456, "epoch": 2725} {"train_loss": -6.366145133972168, "global_step": 114457, "epoch": 2725} {"train_loss": -6.584772109985352, "global_step": 114458, "epoch": 2725} {"train_loss": -6.502623558044434, "global_step": 114459, "epoch": 2725} {"train_loss": -6.441880702972412, "global_step": 114460, "epoch": 2725} {"train_loss": -6.600180625915527, "global_step": 114461, "epoch": 2725} {"train_loss": -6.593153953552246, "global_step": 114462, "epoch": 2725} {"train_loss": -6.499078750610352, "global_step": 114463, "epoch": 2725} {"train_loss": -6.476611137390137, "global_step": 114464, "epoch": 2725} {"train_loss": -6.513724327087402, "global_step": 114465, "epoch": 2725} {"train_loss": -6.3647027015686035, "global_step": 114466, "epoch": 2725} {"train_loss": -6.4819111824035645, "global_step": 114467, "epoch": 2725} {"train_loss": -6.410955905914307, "global_step": 114468, "epoch": 2725} {"train_loss": -6.493803977966309, "global_step": 114469, "epoch": 2725} {"train_loss": -6.412199974060059, "global_step": 114470, "epoch": 2725} {"train_loss": -6.355711936950684, "global_step": 114471, "epoch": 2725} {"train_loss": -6.632330894470215, "global_step": 114472, "epoch": 2725} {"train_loss": -6.428379058837891, "global_step": 114473, "epoch": 2725} {"train_loss": -6.496786594390869, "global_step": 114474, "epoch": 2725} {"train_loss": -6.518128395080566, "global_step": 114475, "epoch": 2725} {"train_loss": -6.406128883361816, "global_step": 114476, "epoch": 2725} {"train_loss": -6.4924235343933105, "global_step": 114477, "epoch": 2725} {"train_loss": -6.413339138031006, "global_step": 114478, "epoch": 2725} {"train_loss": -6.446674346923828, "global_step": 114479, "epoch": 2725} {"train_loss": -6.445679664611816, "global_step": 114480, "epoch": 2725} {"train_loss": -6.384260177612305, "global_step": 114481, "epoch": 2725} {"train_loss": -6.395584583282471, "global_step": 114482, "epoch": 2725} {"train_loss": -6.5116071701049805, "global_step": 114483, "epoch": 2725} {"train_loss": -6.526309490203857, "global_step": 114484, "epoch": 2725} {"train_loss": -6.418454170227051, "global_step": 114485, "epoch": 2725} {"train_loss": -6.439237594604492, "global_step": 114486, "epoch": 2725} {"train_loss": -6.486043930053711, "global_step": 114487, "epoch": 2725} {"train_loss": -6.485940456390381, "global_step": 114488, "epoch": 2725} {"train_loss": -6.482902526855469, "global_step": 114489, "epoch": 2725} {"train_loss": -6.501201152801514, "global_step": 114490, "epoch": 2725} {"train_loss": -6.480750560760498, "global_step": 114491, "epoch": 2725, "val_loss": 76483.9921875} {"train_loss": -6.638880252838135, "global_step": 114492, "epoch": 2726} {"train_loss": -6.619531631469727, "global_step": 114493, "epoch": 2726} {"train_loss": -6.664595603942871, "global_step": 114494, "epoch": 2726} {"train_loss": -6.629249095916748, "global_step": 114495, "epoch": 2726} {"train_loss": -6.48052453994751, "global_step": 114496, "epoch": 2726} {"train_loss": -6.668310165405273, "global_step": 114497, "epoch": 2726} {"train_loss": -6.480277061462402, "global_step": 114498, "epoch": 2726} {"train_loss": -6.566714286804199, "global_step": 114499, "epoch": 2726} {"train_loss": -6.726766109466553, "global_step": 114500, "epoch": 2726} {"train_loss": -6.4411211013793945, "global_step": 114501, "epoch": 2726} {"train_loss": -6.503209590911865, "global_step": 114502, "epoch": 2726} {"train_loss": -6.5465826988220215, "global_step": 114503, "epoch": 2726} {"train_loss": -6.569462299346924, "global_step": 114504, "epoch": 2726} {"train_loss": -6.500941276550293, "global_step": 114505, "epoch": 2726} {"train_loss": -6.578924655914307, "global_step": 114506, "epoch": 2726} {"train_loss": -6.540625095367432, "global_step": 114507, "epoch": 2726} {"train_loss": -6.4659037590026855, "global_step": 114508, "epoch": 2726} {"train_loss": -6.451898574829102, "global_step": 114509, "epoch": 2726} {"train_loss": -6.493136882781982, "global_step": 114510, "epoch": 2726} {"train_loss": -6.571480751037598, "global_step": 114511, "epoch": 2726} {"train_loss": -6.481973648071289, "global_step": 114512, "epoch": 2726} {"train_loss": -6.472203254699707, "global_step": 114513, "epoch": 2726} {"train_loss": -6.461263656616211, "global_step": 114514, "epoch": 2726} {"train_loss": -6.478546142578125, "global_step": 114515, "epoch": 2726} {"train_loss": -6.4443583488464355, "global_step": 114516, "epoch": 2726} {"train_loss": -6.42918586730957, "global_step": 114517, "epoch": 2726} {"train_loss": -6.624701023101807, "global_step": 114518, "epoch": 2726} {"train_loss": -6.4825897216796875, "global_step": 114519, "epoch": 2726} {"train_loss": -6.442566394805908, "global_step": 114520, "epoch": 2726} {"train_loss": -6.5042829513549805, "global_step": 114521, "epoch": 2726} {"train_loss": -6.463982582092285, "global_step": 114522, "epoch": 2726} {"train_loss": -6.319370269775391, "global_step": 114523, "epoch": 2726} {"train_loss": -6.455869674682617, "global_step": 114524, "epoch": 2726} {"train_loss": -6.456171989440918, "global_step": 114525, "epoch": 2726} {"train_loss": -6.3089494705200195, "global_step": 114526, "epoch": 2726} {"train_loss": -6.46155309677124, "global_step": 114527, "epoch": 2726} {"train_loss": -6.53053617477417, "global_step": 114528, "epoch": 2726} {"train_loss": -6.563912868499756, "global_step": 114529, "epoch": 2726} {"train_loss": -6.377416133880615, "global_step": 114530, "epoch": 2726} {"train_loss": -6.4181108474731445, "global_step": 114531, "epoch": 2726} {"train_loss": -6.464057922363281, "global_step": 114532, "epoch": 2726} {"train_loss": -6.507752770469303, "global_step": 114533, "epoch": 2726, "val_loss": 76412.3359375} {"train_loss": -6.533260822296143, "global_step": 114534, "epoch": 2727} {"train_loss": -6.650623798370361, "global_step": 114535, "epoch": 2727} {"train_loss": -6.531607627868652, "global_step": 114536, "epoch": 2727} {"train_loss": -6.500746250152588, "global_step": 114537, "epoch": 2727} {"train_loss": -6.483859062194824, "global_step": 114538, "epoch": 2727} {"train_loss": -6.534416675567627, "global_step": 114539, "epoch": 2727} {"train_loss": -6.574087142944336, "global_step": 114540, "epoch": 2727} {"train_loss": -6.567866802215576, "global_step": 114541, "epoch": 2727} {"train_loss": -6.4738006591796875, "global_step": 114542, "epoch": 2727} {"train_loss": -6.5206298828125, "global_step": 114543, "epoch": 2727} {"train_loss": -6.513288974761963, "global_step": 114544, "epoch": 2727} {"train_loss": -6.5393781661987305, "global_step": 114545, "epoch": 2727} {"train_loss": -6.586225986480713, "global_step": 114546, "epoch": 2727} {"train_loss": -6.502041816711426, "global_step": 114547, "epoch": 2727} {"train_loss": -6.527891635894775, "global_step": 114548, "epoch": 2727} {"train_loss": -6.5862226486206055, "global_step": 114549, "epoch": 2727} {"train_loss": -6.536118984222412, "global_step": 114550, "epoch": 2727} {"train_loss": -6.536256790161133, "global_step": 114551, "epoch": 2727} {"train_loss": -6.586255073547363, "global_step": 114552, "epoch": 2727} {"train_loss": -6.494195938110352, "global_step": 114553, "epoch": 2727} {"train_loss": -6.448604106903076, "global_step": 114554, "epoch": 2727} {"train_loss": -6.5100178718566895, "global_step": 114555, "epoch": 2727} {"train_loss": -6.57697868347168, "global_step": 114556, "epoch": 2727} {"train_loss": -6.404082298278809, "global_step": 114557, "epoch": 2727} {"train_loss": -6.487368583679199, "global_step": 114558, "epoch": 2727} {"train_loss": -6.3344268798828125, "global_step": 114559, "epoch": 2727} {"train_loss": -6.476713180541992, "global_step": 114560, "epoch": 2727} {"train_loss": -6.449596881866455, "global_step": 114561, "epoch": 2727} {"train_loss": -6.528302192687988, "global_step": 114562, "epoch": 2727} {"train_loss": -6.296189308166504, "global_step": 114563, "epoch": 2727} {"train_loss": -6.460784912109375, "global_step": 114564, "epoch": 2727} {"train_loss": -6.5314621925354, "global_step": 114565, "epoch": 2727} {"train_loss": -6.319921016693115, "global_step": 114566, "epoch": 2727} {"train_loss": -6.264852523803711, "global_step": 114567, "epoch": 2727} {"train_loss": -6.399231910705566, "global_step": 114568, "epoch": 2727} {"train_loss": -6.396317005157471, "global_step": 114569, "epoch": 2727} {"train_loss": -6.516889572143555, "global_step": 114570, "epoch": 2727} {"train_loss": -6.514086723327637, "global_step": 114571, "epoch": 2727} {"train_loss": -6.490764617919922, "global_step": 114572, "epoch": 2727} {"train_loss": -6.461721420288086, "global_step": 114573, "epoch": 2727} {"train_loss": -6.536128520965576, "global_step": 114574, "epoch": 2727} {"train_loss": -6.496987592606318, "global_step": 114575, "epoch": 2727, "val_loss": 76692.7109375} {"train_loss": -6.643845558166504, "global_step": 114576, "epoch": 2728} {"train_loss": -6.655862808227539, "global_step": 114577, "epoch": 2728} {"train_loss": -6.547562599182129, "global_step": 114578, "epoch": 2728} {"train_loss": -6.660736083984375, "global_step": 114579, "epoch": 2728} {"train_loss": -6.532094955444336, "global_step": 114580, "epoch": 2728} {"train_loss": -6.430054187774658, "global_step": 114581, "epoch": 2728} {"train_loss": -6.589828968048096, "global_step": 114582, "epoch": 2728} {"train_loss": -6.590728282928467, "global_step": 114583, "epoch": 2728} {"train_loss": -6.580473899841309, "global_step": 114584, "epoch": 2728} {"train_loss": -6.496912002563477, "global_step": 114585, "epoch": 2728} {"train_loss": -6.425948619842529, "global_step": 114586, "epoch": 2728} {"train_loss": -6.466851234436035, "global_step": 114587, "epoch": 2728} {"train_loss": -6.461757659912109, "global_step": 114588, "epoch": 2728} {"train_loss": -6.420170783996582, "global_step": 114589, "epoch": 2728} {"train_loss": -6.595890045166016, "global_step": 114590, "epoch": 2728} {"train_loss": -6.44123649597168, "global_step": 114591, "epoch": 2728} {"train_loss": -6.515050888061523, "global_step": 114592, "epoch": 2728} {"train_loss": -6.598228454589844, "global_step": 114593, "epoch": 2728} {"train_loss": -6.555974960327148, "global_step": 114594, "epoch": 2728} {"train_loss": -6.488923072814941, "global_step": 114595, "epoch": 2728} {"train_loss": -6.261528491973877, "global_step": 114596, "epoch": 2728} {"train_loss": -6.554378986358643, "global_step": 114597, "epoch": 2728} {"train_loss": -6.58233642578125, "global_step": 114598, "epoch": 2728} {"train_loss": -6.577989101409912, "global_step": 114599, "epoch": 2728} {"train_loss": -6.432080268859863, "global_step": 114600, "epoch": 2728} {"train_loss": -6.495458126068115, "global_step": 114601, "epoch": 2728} {"train_loss": -6.376322269439697, "global_step": 114602, "epoch": 2728} {"train_loss": -6.445389747619629, "global_step": 114603, "epoch": 2728} {"train_loss": -6.441593170166016, "global_step": 114604, "epoch": 2728} {"train_loss": -6.463098526000977, "global_step": 114605, "epoch": 2728} {"train_loss": -6.487131118774414, "global_step": 114606, "epoch": 2728} {"train_loss": -6.428860187530518, "global_step": 114607, "epoch": 2728} {"train_loss": -6.411228179931641, "global_step": 114608, "epoch": 2728} {"train_loss": -6.482907295227051, "global_step": 114609, "epoch": 2728} {"train_loss": -6.493772506713867, "global_step": 114610, "epoch": 2728} {"train_loss": -6.55021858215332, "global_step": 114611, "epoch": 2728} {"train_loss": -6.475897789001465, "global_step": 114612, "epoch": 2728} {"train_loss": -6.55499792098999, "global_step": 114613, "epoch": 2728} {"train_loss": -6.476654052734375, "global_step": 114614, "epoch": 2728} {"train_loss": -6.411273956298828, "global_step": 114615, "epoch": 2728} {"train_loss": -6.499654293060303, "global_step": 114616, "epoch": 2728} {"train_loss": -6.502161116827102, "global_step": 114617, "epoch": 2728, "val_loss": 76330.734375} {"train_loss": -6.5058369636535645, "global_step": 114618, "epoch": 2729} {"train_loss": -6.552924156188965, "global_step": 114619, "epoch": 2729} {"train_loss": -6.498741626739502, "global_step": 114620, "epoch": 2729} {"train_loss": -6.445204734802246, "global_step": 114621, "epoch": 2729} {"train_loss": -6.595061779022217, "global_step": 114622, "epoch": 2729} {"train_loss": -6.588151931762695, "global_step": 114623, "epoch": 2729} {"train_loss": -6.414673805236816, "global_step": 114624, "epoch": 2729} {"train_loss": -6.609775543212891, "global_step": 114625, "epoch": 2729} {"train_loss": -6.448603630065918, "global_step": 114626, "epoch": 2729} {"train_loss": -6.593713760375977, "global_step": 114627, "epoch": 2729} {"train_loss": -6.570093154907227, "global_step": 114628, "epoch": 2729} {"train_loss": -6.496116638183594, "global_step": 114629, "epoch": 2729} {"train_loss": -6.458990573883057, "global_step": 114630, "epoch": 2729} {"train_loss": -6.529427528381348, "global_step": 114631, "epoch": 2729} {"train_loss": -6.496341705322266, "global_step": 114632, "epoch": 2729} {"train_loss": -6.571691513061523, "global_step": 114633, "epoch": 2729} {"train_loss": -6.630903720855713, "global_step": 114634, "epoch": 2729} {"train_loss": -6.490209102630615, "global_step": 114635, "epoch": 2729} {"train_loss": -6.511867523193359, "global_step": 114636, "epoch": 2729} {"train_loss": -6.554983139038086, "global_step": 114637, "epoch": 2729} {"train_loss": -6.671870231628418, "global_step": 114638, "epoch": 2729} {"train_loss": -6.639371871948242, "global_step": 114639, "epoch": 2729} {"train_loss": -6.604336261749268, "global_step": 114640, "epoch": 2729} {"train_loss": -6.535898685455322, "global_step": 114641, "epoch": 2729} {"train_loss": -6.523545265197754, "global_step": 114642, "epoch": 2729} {"train_loss": -6.487420082092285, "global_step": 114643, "epoch": 2729} {"train_loss": -6.610593318939209, "global_step": 114644, "epoch": 2729} {"train_loss": -6.544071197509766, "global_step": 114645, "epoch": 2729} {"train_loss": -6.496055603027344, "global_step": 114646, "epoch": 2729} {"train_loss": -6.501233100891113, "global_step": 114647, "epoch": 2729} {"train_loss": -6.505745887756348, "global_step": 114648, "epoch": 2729} {"train_loss": -6.357724189758301, "global_step": 114649, "epoch": 2729} {"train_loss": -6.521726131439209, "global_step": 114650, "epoch": 2729} {"train_loss": -6.429125785827637, "global_step": 114651, "epoch": 2729} {"train_loss": -6.353618621826172, "global_step": 114652, "epoch": 2729} {"train_loss": -6.494824409484863, "global_step": 114653, "epoch": 2729} {"train_loss": -6.468761444091797, "global_step": 114654, "epoch": 2729} {"train_loss": -6.541521072387695, "global_step": 114655, "epoch": 2729} {"train_loss": -6.5202836990356445, "global_step": 114656, "epoch": 2729} {"train_loss": -6.567196369171143, "global_step": 114657, "epoch": 2729} {"train_loss": -6.467960357666016, "global_step": 114658, "epoch": 2729} {"train_loss": -6.521027451469784, "global_step": 114659, "epoch": 2729, "val_loss": 76585.734375} {"train_loss": -6.522273540496826, "global_step": 114660, "epoch": 2730} {"train_loss": -6.436924934387207, "global_step": 114661, "epoch": 2730} {"train_loss": -6.483520030975342, "global_step": 114662, "epoch": 2730} {"train_loss": -6.47202205657959, "global_step": 114663, "epoch": 2730} {"train_loss": -6.390307426452637, "global_step": 114664, "epoch": 2730} {"train_loss": -6.578081130981445, "global_step": 114665, "epoch": 2730} {"train_loss": -6.432919025421143, "global_step": 114666, "epoch": 2730} {"train_loss": -6.546148300170898, "global_step": 114667, "epoch": 2730} {"train_loss": -6.543794631958008, "global_step": 114668, "epoch": 2730} {"train_loss": -6.480652809143066, "global_step": 114669, "epoch": 2730} {"train_loss": -6.491676330566406, "global_step": 114670, "epoch": 2730} {"train_loss": -6.433053016662598, "global_step": 114671, "epoch": 2730} {"train_loss": -6.417681694030762, "global_step": 114672, "epoch": 2730} {"train_loss": -6.609577178955078, "global_step": 114673, "epoch": 2730} {"train_loss": -6.43056058883667, "global_step": 114674, "epoch": 2730} {"train_loss": -6.4442853927612305, "global_step": 114675, "epoch": 2730} {"train_loss": -6.252490043640137, "global_step": 114676, "epoch": 2730} {"train_loss": -6.421525955200195, "global_step": 114677, "epoch": 2730} {"train_loss": -6.380516052246094, "global_step": 114678, "epoch": 2730} {"train_loss": -6.499516487121582, "global_step": 114679, "epoch": 2730} {"train_loss": -6.402338981628418, "global_step": 114680, "epoch": 2730} {"train_loss": -6.426779747009277, "global_step": 114681, "epoch": 2730} {"train_loss": -6.491726875305176, "global_step": 114682, "epoch": 2730} {"train_loss": -6.331315994262695, "global_step": 114683, "epoch": 2730} {"train_loss": -6.576001167297363, "global_step": 114684, "epoch": 2730} {"train_loss": -6.4797773361206055, "global_step": 114685, "epoch": 2730} {"train_loss": -6.489955902099609, "global_step": 114686, "epoch": 2730} {"train_loss": -6.576899528503418, "global_step": 114687, "epoch": 2730} {"train_loss": -6.530739784240723, "global_step": 114688, "epoch": 2730} {"train_loss": -6.516756534576416, "global_step": 114689, "epoch": 2730} {"train_loss": -6.5339226722717285, "global_step": 114690, "epoch": 2730} {"train_loss": -6.527308464050293, "global_step": 114691, "epoch": 2730} {"train_loss": -6.544150352478027, "global_step": 114692, "epoch": 2730} {"train_loss": -6.573824405670166, "global_step": 114693, "epoch": 2730} {"train_loss": -6.502487659454346, "global_step": 114694, "epoch": 2730} {"train_loss": -6.467235565185547, "global_step": 114695, "epoch": 2730} {"train_loss": -6.390322685241699, "global_step": 114696, "epoch": 2730} {"train_loss": -6.561771392822266, "global_step": 114697, "epoch": 2730} {"train_loss": -6.494278907775879, "global_step": 114698, "epoch": 2730} {"train_loss": -6.491518974304199, "global_step": 114699, "epoch": 2730} {"train_loss": -6.576910018920898, "global_step": 114700, "epoch": 2730} {"train_loss": -6.483786582946777, "global_step": 114701, "epoch": 2730, "val_loss": 76381.3203125} {"train_loss": -6.436602592468262, "global_step": 114702, "epoch": 2731} {"train_loss": -6.537172317504883, "global_step": 114703, "epoch": 2731} {"train_loss": -6.524733543395996, "global_step": 114704, "epoch": 2731} {"train_loss": -6.583446025848389, "global_step": 114705, "epoch": 2731} {"train_loss": -6.429871559143066, "global_step": 114706, "epoch": 2731} {"train_loss": -6.46970272064209, "global_step": 114707, "epoch": 2731} {"train_loss": -6.4928154945373535, "global_step": 114708, "epoch": 2731} {"train_loss": -6.45068359375, "global_step": 114709, "epoch": 2731} {"train_loss": -6.540544509887695, "global_step": 114710, "epoch": 2731} {"train_loss": -6.567783355712891, "global_step": 114711, "epoch": 2731} {"train_loss": -6.457559585571289, "global_step": 114712, "epoch": 2731} {"train_loss": -6.531416893005371, "global_step": 114713, "epoch": 2731} {"train_loss": -6.61815071105957, "global_step": 114714, "epoch": 2731} {"train_loss": -6.542413234710693, "global_step": 114715, "epoch": 2731} {"train_loss": -6.584183692932129, "global_step": 114716, "epoch": 2731} {"train_loss": -6.4903883934021, "global_step": 114717, "epoch": 2731} {"train_loss": -6.522675514221191, "global_step": 114718, "epoch": 2731} {"train_loss": -6.535280227661133, "global_step": 114719, "epoch": 2731} {"train_loss": -6.370354652404785, "global_step": 114720, "epoch": 2731} {"train_loss": -6.567442893981934, "global_step": 114721, "epoch": 2731} {"train_loss": -6.5198163986206055, "global_step": 114722, "epoch": 2731} {"train_loss": -6.511906623840332, "global_step": 114723, "epoch": 2731} {"train_loss": -6.558114051818848, "global_step": 114724, "epoch": 2731} {"train_loss": -6.560803413391113, "global_step": 114725, "epoch": 2731} {"train_loss": -6.4108500480651855, "global_step": 114726, "epoch": 2731} {"train_loss": -6.430827617645264, "global_step": 114727, "epoch": 2731} {"train_loss": -6.4964423179626465, "global_step": 114728, "epoch": 2731} {"train_loss": -6.486791610717773, "global_step": 114729, "epoch": 2731} {"train_loss": -6.492084503173828, "global_step": 114730, "epoch": 2731} {"train_loss": -6.558080673217773, "global_step": 114731, "epoch": 2731} {"train_loss": -6.534414768218994, "global_step": 114732, "epoch": 2731} {"train_loss": -6.456382751464844, "global_step": 114733, "epoch": 2731} {"train_loss": -6.586791038513184, "global_step": 114734, "epoch": 2731} {"train_loss": -6.521706581115723, "global_step": 114735, "epoch": 2731} {"train_loss": -6.55241060256958, "global_step": 114736, "epoch": 2731} {"train_loss": -6.534140110015869, "global_step": 114737, "epoch": 2731} {"train_loss": -6.56501579284668, "global_step": 114738, "epoch": 2731} {"train_loss": -6.583913326263428, "global_step": 114739, "epoch": 2731} {"train_loss": -6.510964393615723, "global_step": 114740, "epoch": 2731} {"train_loss": -6.498490810394287, "global_step": 114741, "epoch": 2731} {"train_loss": -6.396523475646973, "global_step": 114742, "epoch": 2731} {"train_loss": -6.513991673787435, "global_step": 114743, "epoch": 2731, "val_loss": 76629.328125} {"train_loss": -6.629836082458496, "global_step": 114744, "epoch": 2732} {"train_loss": -6.615814685821533, "global_step": 114745, "epoch": 2732} {"train_loss": -6.502829551696777, "global_step": 114746, "epoch": 2732} {"train_loss": -6.666727066040039, "global_step": 114747, "epoch": 2732} {"train_loss": -6.456329345703125, "global_step": 114748, "epoch": 2732} {"train_loss": -6.616463661193848, "global_step": 114749, "epoch": 2732} {"train_loss": -6.444823265075684, "global_step": 114750, "epoch": 2732} {"train_loss": -6.565793991088867, "global_step": 114751, "epoch": 2732} {"train_loss": -6.622611999511719, "global_step": 114752, "epoch": 2732} {"train_loss": -6.3870344161987305, "global_step": 114753, "epoch": 2732} {"train_loss": -6.574204444885254, "global_step": 114754, "epoch": 2732} {"train_loss": -6.433992862701416, "global_step": 114755, "epoch": 2732} {"train_loss": -6.469089984893799, "global_step": 114756, "epoch": 2732} {"train_loss": -6.456072807312012, "global_step": 114757, "epoch": 2732} {"train_loss": -6.3456854820251465, "global_step": 114758, "epoch": 2732} {"train_loss": -6.502773284912109, "global_step": 114759, "epoch": 2732} {"train_loss": -6.535624027252197, "global_step": 114760, "epoch": 2732} {"train_loss": -6.530370235443115, "global_step": 114761, "epoch": 2732} {"train_loss": -6.499213218688965, "global_step": 114762, "epoch": 2732} {"train_loss": -6.558789253234863, "global_step": 114763, "epoch": 2732} {"train_loss": -6.461170196533203, "global_step": 114764, "epoch": 2732} {"train_loss": -6.572676658630371, "global_step": 114765, "epoch": 2732} {"train_loss": -6.4415283203125, "global_step": 114766, "epoch": 2732} {"train_loss": -6.500843048095703, "global_step": 114767, "epoch": 2732} {"train_loss": -6.601404666900635, "global_step": 114768, "epoch": 2732} {"train_loss": -6.432432174682617, "global_step": 114769, "epoch": 2732} {"train_loss": -6.355575084686279, "global_step": 114770, "epoch": 2732} {"train_loss": -6.5241875648498535, "global_step": 114771, "epoch": 2732} {"train_loss": -6.449254035949707, "global_step": 114772, "epoch": 2732} {"train_loss": -6.430143356323242, "global_step": 114773, "epoch": 2732} {"train_loss": -6.571162223815918, "global_step": 114774, "epoch": 2732} {"train_loss": -6.348654270172119, "global_step": 114775, "epoch": 2732} {"train_loss": -6.487516403198242, "global_step": 114776, "epoch": 2732} {"train_loss": -6.515475273132324, "global_step": 114777, "epoch": 2732} {"train_loss": -6.554283618927002, "global_step": 114778, "epoch": 2732} {"train_loss": -6.342424392700195, "global_step": 114779, "epoch": 2732} {"train_loss": -6.4575300216674805, "global_step": 114780, "epoch": 2732} {"train_loss": -6.587048530578613, "global_step": 114781, "epoch": 2732} {"train_loss": -6.609311580657959, "global_step": 114782, "epoch": 2732} {"train_loss": -6.464597225189209, "global_step": 114783, "epoch": 2732} {"train_loss": -6.417245864868164, "global_step": 114784, "epoch": 2732} {"train_loss": -6.50376093955267, "global_step": 114785, "epoch": 2732, "val_loss": 77008.546875} {"train_loss": -6.40675163269043, "global_step": 114786, "epoch": 2733} {"train_loss": -6.586367130279541, "global_step": 114787, "epoch": 2733} {"train_loss": -6.424752235412598, "global_step": 114788, "epoch": 2733} {"train_loss": -6.5311598777771, "global_step": 114789, "epoch": 2733} {"train_loss": -6.570374011993408, "global_step": 114790, "epoch": 2733} {"train_loss": -6.557097434997559, "global_step": 114791, "epoch": 2733} {"train_loss": -6.59022331237793, "global_step": 114792, "epoch": 2733} {"train_loss": -6.492470741271973, "global_step": 114793, "epoch": 2733} {"train_loss": -6.596220970153809, "global_step": 114794, "epoch": 2733} {"train_loss": -6.424813747406006, "global_step": 114795, "epoch": 2733} {"train_loss": -6.485894203186035, "global_step": 114796, "epoch": 2733} {"train_loss": -6.502605438232422, "global_step": 114797, "epoch": 2733} {"train_loss": -6.382525444030762, "global_step": 114798, "epoch": 2733} {"train_loss": -6.362122535705566, "global_step": 114799, "epoch": 2733} {"train_loss": -6.349820137023926, "global_step": 114800, "epoch": 2733} {"train_loss": -6.41770601272583, "global_step": 114801, "epoch": 2733} {"train_loss": -6.361978530883789, "global_step": 114802, "epoch": 2733} {"train_loss": -6.5255279541015625, "global_step": 114803, "epoch": 2733} {"train_loss": -6.531494140625, "global_step": 114804, "epoch": 2733} {"train_loss": -6.4600090980529785, "global_step": 114805, "epoch": 2733} {"train_loss": -6.411397933959961, "global_step": 114806, "epoch": 2733} {"train_loss": -6.425602912902832, "global_step": 114807, "epoch": 2733} {"train_loss": -6.419375896453857, "global_step": 114808, "epoch": 2733} {"train_loss": -6.5132317543029785, "global_step": 114809, "epoch": 2733} {"train_loss": -6.406863212585449, "global_step": 114810, "epoch": 2733} {"train_loss": -6.532295227050781, "global_step": 114811, "epoch": 2733} {"train_loss": -6.358114242553711, "global_step": 114812, "epoch": 2733} {"train_loss": -6.574432373046875, "global_step": 114813, "epoch": 2733} {"train_loss": -6.301147937774658, "global_step": 114814, "epoch": 2733} {"train_loss": -6.441835403442383, "global_step": 114815, "epoch": 2733} {"train_loss": -6.419490814208984, "global_step": 114816, "epoch": 2733} {"train_loss": -6.412147521972656, "global_step": 114817, "epoch": 2733} {"train_loss": -6.513626575469971, "global_step": 114818, "epoch": 2733} {"train_loss": -6.40744686126709, "global_step": 114819, "epoch": 2733} {"train_loss": -6.399186134338379, "global_step": 114820, "epoch": 2733} {"train_loss": -6.386329650878906, "global_step": 114821, "epoch": 2733} {"train_loss": -6.4110517501831055, "global_step": 114822, "epoch": 2733} {"train_loss": -6.443632125854492, "global_step": 114823, "epoch": 2733} {"train_loss": -6.45363712310791, "global_step": 114824, "epoch": 2733} {"train_loss": -6.397809028625488, "global_step": 114825, "epoch": 2733} {"train_loss": -6.6068267822265625, "global_step": 114826, "epoch": 2733} {"train_loss": -6.4577495484125045, "global_step": 114827, "epoch": 2733, "val_loss": 76543.0390625} {"train_loss": -6.466037750244141, "global_step": 114828, "epoch": 2734} {"train_loss": -6.436580657958984, "global_step": 114829, "epoch": 2734} {"train_loss": -6.438955307006836, "global_step": 114830, "epoch": 2734} {"train_loss": -6.461984634399414, "global_step": 114831, "epoch": 2734} {"train_loss": -6.599967956542969, "global_step": 114832, "epoch": 2734} {"train_loss": -6.600263595581055, "global_step": 114833, "epoch": 2734} {"train_loss": -6.538700103759766, "global_step": 114834, "epoch": 2734} {"train_loss": -6.614891052246094, "global_step": 114835, "epoch": 2734} {"train_loss": -6.449271202087402, "global_step": 114836, "epoch": 2734} {"train_loss": -6.600127220153809, "global_step": 114837, "epoch": 2734} {"train_loss": -6.590799331665039, "global_step": 114838, "epoch": 2734} {"train_loss": -6.451476097106934, "global_step": 114839, "epoch": 2734} {"train_loss": -6.506715774536133, "global_step": 114840, "epoch": 2734} {"train_loss": -6.5991387367248535, "global_step": 114841, "epoch": 2734} {"train_loss": -6.478594779968262, "global_step": 114842, "epoch": 2734} {"train_loss": -6.582733631134033, "global_step": 114843, "epoch": 2734} {"train_loss": -6.492983341217041, "global_step": 114844, "epoch": 2734} {"train_loss": -6.384466648101807, "global_step": 114845, "epoch": 2734} {"train_loss": -6.556641578674316, "global_step": 114846, "epoch": 2734} {"train_loss": -6.511422157287598, "global_step": 114847, "epoch": 2734} {"train_loss": -6.614792346954346, "global_step": 114848, "epoch": 2734} {"train_loss": -6.455158233642578, "global_step": 114849, "epoch": 2734} {"train_loss": -6.421494960784912, "global_step": 114850, "epoch": 2734} {"train_loss": -6.578281402587891, "global_step": 114851, "epoch": 2734} {"train_loss": -6.402762413024902, "global_step": 114852, "epoch": 2734} {"train_loss": -6.607706546783447, "global_step": 114853, "epoch": 2734} {"train_loss": -6.492507457733154, "global_step": 114854, "epoch": 2734} {"train_loss": -6.508206367492676, "global_step": 114855, "epoch": 2734} {"train_loss": -6.571835517883301, "global_step": 114856, "epoch": 2734} {"train_loss": -6.548918724060059, "global_step": 114857, "epoch": 2734} {"train_loss": -6.558347702026367, "global_step": 114858, "epoch": 2734} {"train_loss": -6.580126762390137, "global_step": 114859, "epoch": 2734} {"train_loss": -6.4322919845581055, "global_step": 114860, "epoch": 2734} {"train_loss": -6.496830463409424, "global_step": 114861, "epoch": 2734} {"train_loss": -6.486660003662109, "global_step": 114862, "epoch": 2734} {"train_loss": -6.394265651702881, "global_step": 114863, "epoch": 2734} {"train_loss": -6.495968818664551, "global_step": 114864, "epoch": 2734} {"train_loss": -6.595297813415527, "global_step": 114865, "epoch": 2734} {"train_loss": -6.450540065765381, "global_step": 114866, "epoch": 2734} {"train_loss": -6.484749794006348, "global_step": 114867, "epoch": 2734} {"train_loss": -6.467836380004883, "global_step": 114868, "epoch": 2734} {"train_loss": -6.511490390414283, "global_step": 114869, "epoch": 2734, "val_loss": 76470.015625} {"train_loss": -6.6386847496032715, "global_step": 114870, "epoch": 2735} {"train_loss": -6.568719863891602, "global_step": 114871, "epoch": 2735} {"train_loss": -6.52687931060791, "global_step": 114872, "epoch": 2735} {"train_loss": -6.470182418823242, "global_step": 114873, "epoch": 2735} {"train_loss": -6.3942131996154785, "global_step": 114874, "epoch": 2735} {"train_loss": -6.566102981567383, "global_step": 114875, "epoch": 2735} {"train_loss": -6.4752678871154785, "global_step": 114876, "epoch": 2735} {"train_loss": -6.4820637702941895, "global_step": 114877, "epoch": 2735} {"train_loss": -6.588526248931885, "global_step": 114878, "epoch": 2735} {"train_loss": -6.556331634521484, "global_step": 114879, "epoch": 2735} {"train_loss": -6.495843887329102, "global_step": 114880, "epoch": 2735} {"train_loss": -6.585264205932617, "global_step": 114881, "epoch": 2735} {"train_loss": -6.473106861114502, "global_step": 114882, "epoch": 2735} {"train_loss": -6.5388898849487305, "global_step": 114883, "epoch": 2735} {"train_loss": -6.468201637268066, "global_step": 114884, "epoch": 2735} {"train_loss": -6.500781059265137, "global_step": 114885, "epoch": 2735} {"train_loss": -6.343090057373047, "global_step": 114886, "epoch": 2735} {"train_loss": -6.467232704162598, "global_step": 114887, "epoch": 2735} {"train_loss": -6.493742942810059, "global_step": 114888, "epoch": 2735} {"train_loss": -6.537165641784668, "global_step": 114889, "epoch": 2735} {"train_loss": -6.525568008422852, "global_step": 114890, "epoch": 2735} {"train_loss": -6.5088887214660645, "global_step": 114891, "epoch": 2735} {"train_loss": -6.493112564086914, "global_step": 114892, "epoch": 2735} {"train_loss": -6.453729629516602, "global_step": 114893, "epoch": 2735} {"train_loss": -6.508882522583008, "global_step": 114894, "epoch": 2735} {"train_loss": -6.4381818771362305, "global_step": 114895, "epoch": 2735} {"train_loss": -6.570553779602051, "global_step": 114896, "epoch": 2735} {"train_loss": -6.400618553161621, "global_step": 114897, "epoch": 2735} {"train_loss": -6.536300182342529, "global_step": 114898, "epoch": 2735} {"train_loss": -6.44648551940918, "global_step": 114899, "epoch": 2735} {"train_loss": -6.631421089172363, "global_step": 114900, "epoch": 2735} {"train_loss": -6.576973915100098, "global_step": 114901, "epoch": 2735} {"train_loss": -6.456059455871582, "global_step": 114902, "epoch": 2735} {"train_loss": -6.54270601272583, "global_step": 114903, "epoch": 2735} {"train_loss": -6.496260166168213, "global_step": 114904, "epoch": 2735} {"train_loss": -6.493717193603516, "global_step": 114905, "epoch": 2735} {"train_loss": -6.4290008544921875, "global_step": 114906, "epoch": 2735} {"train_loss": -6.480091094970703, "global_step": 114907, "epoch": 2735} {"train_loss": -6.469578742980957, "global_step": 114908, "epoch": 2735} {"train_loss": -6.512445449829102, "global_step": 114909, "epoch": 2735} {"train_loss": -6.463990211486816, "global_step": 114910, "epoch": 2735} {"train_loss": -6.500940175283523, "global_step": 114911, "epoch": 2735, "val_loss": 76713.2578125} {"train_loss": -6.497259140014648, "global_step": 114912, "epoch": 2736} {"train_loss": -6.3359246253967285, "global_step": 114913, "epoch": 2736} {"train_loss": -6.4433746337890625, "global_step": 114914, "epoch": 2736} {"train_loss": -6.532383918762207, "global_step": 114915, "epoch": 2736} {"train_loss": -6.449844837188721, "global_step": 114916, "epoch": 2736} {"train_loss": -6.4077253341674805, "global_step": 114917, "epoch": 2736} {"train_loss": -6.425642967224121, "global_step": 114918, "epoch": 2736} {"train_loss": -6.439640522003174, "global_step": 114919, "epoch": 2736} {"train_loss": -6.587615489959717, "global_step": 114920, "epoch": 2736} {"train_loss": -6.547411918640137, "global_step": 114921, "epoch": 2736} {"train_loss": -6.319296836853027, "global_step": 114922, "epoch": 2736} {"train_loss": -6.5176239013671875, "global_step": 114923, "epoch": 2736} {"train_loss": -6.468235492706299, "global_step": 114924, "epoch": 2736} {"train_loss": -6.500523090362549, "global_step": 114925, "epoch": 2736} {"train_loss": -6.548853874206543, "global_step": 114926, "epoch": 2736} {"train_loss": -6.491555213928223, "global_step": 114927, "epoch": 2736} {"train_loss": -6.489080905914307, "global_step": 114928, "epoch": 2736} {"train_loss": -6.503800392150879, "global_step": 114929, "epoch": 2736} {"train_loss": -6.5066704750061035, "global_step": 114930, "epoch": 2736} {"train_loss": -6.522463798522949, "global_step": 114931, "epoch": 2736} {"train_loss": -6.400773525238037, "global_step": 114932, "epoch": 2736} {"train_loss": -6.591281890869141, "global_step": 114933, "epoch": 2736} {"train_loss": -6.585624694824219, "global_step": 114934, "epoch": 2736} {"train_loss": -6.5737457275390625, "global_step": 114935, "epoch": 2736} {"train_loss": -6.501014709472656, "global_step": 114936, "epoch": 2736} {"train_loss": -6.528468132019043, "global_step": 114937, "epoch": 2736} {"train_loss": -6.507846355438232, "global_step": 114938, "epoch": 2736} {"train_loss": -6.4882612228393555, "global_step": 114939, "epoch": 2736} {"train_loss": -6.5239338874816895, "global_step": 114940, "epoch": 2736} {"train_loss": -6.610684394836426, "global_step": 114941, "epoch": 2736} {"train_loss": -6.565441131591797, "global_step": 114942, "epoch": 2736} {"train_loss": -6.557276248931885, "global_step": 114943, "epoch": 2736} {"train_loss": -6.601336479187012, "global_step": 114944, "epoch": 2736} {"train_loss": -6.461065292358398, "global_step": 114945, "epoch": 2736} {"train_loss": -6.474067687988281, "global_step": 114946, "epoch": 2736} {"train_loss": -6.668221473693848, "global_step": 114947, "epoch": 2736} {"train_loss": -6.3900651931762695, "global_step": 114948, "epoch": 2736} {"train_loss": -6.581895351409912, "global_step": 114949, "epoch": 2736} {"train_loss": -6.530911445617676, "global_step": 114950, "epoch": 2736} {"train_loss": -6.576659202575684, "global_step": 114951, "epoch": 2736} {"train_loss": -6.602644920349121, "global_step": 114952, "epoch": 2736} {"train_loss": -6.50944455464681, "global_step": 114953, "epoch": 2736, "val_loss": 76312.28125} {"train_loss": -6.4947028160095215, "global_step": 114954, "epoch": 2737} {"train_loss": -6.587456703186035, "global_step": 114955, "epoch": 2737} {"train_loss": -6.544829368591309, "global_step": 114956, "epoch": 2737} {"train_loss": -6.600114345550537, "global_step": 114957, "epoch": 2737} {"train_loss": -6.550815582275391, "global_step": 114958, "epoch": 2737} {"train_loss": -6.582283973693848, "global_step": 114959, "epoch": 2737} {"train_loss": -6.449286937713623, "global_step": 114960, "epoch": 2737} {"train_loss": -6.52392578125, "global_step": 114961, "epoch": 2737} {"train_loss": -6.586372375488281, "global_step": 114962, "epoch": 2737} {"train_loss": -6.638673305511475, "global_step": 114963, "epoch": 2737} {"train_loss": -6.573914527893066, "global_step": 114964, "epoch": 2737} {"train_loss": -6.587724208831787, "global_step": 114965, "epoch": 2737} {"train_loss": -6.562480449676514, "global_step": 114966, "epoch": 2737} {"train_loss": -6.527247428894043, "global_step": 114967, "epoch": 2737} {"train_loss": -6.469919204711914, "global_step": 114968, "epoch": 2737} {"train_loss": -6.5573930740356445, "global_step": 114969, "epoch": 2737} {"train_loss": -6.49268913269043, "global_step": 114970, "epoch": 2737} {"train_loss": -6.650208473205566, "global_step": 114971, "epoch": 2737} {"train_loss": -6.456537246704102, "global_step": 114972, "epoch": 2737} {"train_loss": -6.54945707321167, "global_step": 114973, "epoch": 2737} {"train_loss": -6.539284706115723, "global_step": 114974, "epoch": 2737} {"train_loss": -6.559968948364258, "global_step": 114975, "epoch": 2737} {"train_loss": -6.508519172668457, "global_step": 114976, "epoch": 2737} {"train_loss": -6.555911064147949, "global_step": 114977, "epoch": 2737} {"train_loss": -6.567963600158691, "global_step": 114978, "epoch": 2737} {"train_loss": -6.511853218078613, "global_step": 114979, "epoch": 2737} {"train_loss": -6.557159423828125, "global_step": 114980, "epoch": 2737} {"train_loss": -6.54429817199707, "global_step": 114981, "epoch": 2737} {"train_loss": -6.440125465393066, "global_step": 114982, "epoch": 2737} {"train_loss": -6.464377403259277, "global_step": 114983, "epoch": 2737} {"train_loss": -6.577305316925049, "global_step": 114984, "epoch": 2737} {"train_loss": -6.484060287475586, "global_step": 114985, "epoch": 2737} {"train_loss": -6.5698933601379395, "global_step": 114986, "epoch": 2737} {"train_loss": -6.528371810913086, "global_step": 114987, "epoch": 2737} {"train_loss": -6.448145866394043, "global_step": 114988, "epoch": 2737} {"train_loss": -6.542236804962158, "global_step": 114989, "epoch": 2737} {"train_loss": -6.386519432067871, "global_step": 114990, "epoch": 2737} {"train_loss": -6.533375263214111, "global_step": 114991, "epoch": 2737} {"train_loss": -6.53839111328125, "global_step": 114992, "epoch": 2737} {"train_loss": -6.5679121017456055, "global_step": 114993, "epoch": 2737} {"train_loss": -6.604989051818848, "global_step": 114994, "epoch": 2737} {"train_loss": -6.53120798156375, "global_step": 114995, "epoch": 2737, "val_loss": 76509.859375} {"train_loss": -6.6802167892456055, "global_step": 114996, "epoch": 2738} {"train_loss": -6.43739128112793, "global_step": 114997, "epoch": 2738} {"train_loss": -6.500429630279541, "global_step": 114998, "epoch": 2738} {"train_loss": -6.587813377380371, "global_step": 114999, "epoch": 2738} {"train_loss": -6.397520065307617, "global_step": 115000, "epoch": 2738} {"train_loss": -6.429633140563965, "global_step": 115001, "epoch": 2738} {"train_loss": -6.382623195648193, "global_step": 115002, "epoch": 2738} {"train_loss": -6.55207633972168, "global_step": 115003, "epoch": 2738} {"train_loss": -6.431863307952881, "global_step": 115004, "epoch": 2738} {"train_loss": -6.512980937957764, "global_step": 115005, "epoch": 2738} {"train_loss": -6.318730354309082, "global_step": 115006, "epoch": 2738} {"train_loss": -6.468045234680176, "global_step": 115007, "epoch": 2738} {"train_loss": -6.400945663452148, "global_step": 115008, "epoch": 2738} {"train_loss": -6.417667388916016, "global_step": 115009, "epoch": 2738} {"train_loss": -6.412786960601807, "global_step": 115010, "epoch": 2738} {"train_loss": -6.466782569885254, "global_step": 115011, "epoch": 2738} {"train_loss": -6.5331926345825195, "global_step": 115012, "epoch": 2738} {"train_loss": -6.423437595367432, "global_step": 115013, "epoch": 2738} {"train_loss": -6.476219177246094, "global_step": 115014, "epoch": 2738} {"train_loss": -6.380529403686523, "global_step": 115015, "epoch": 2738} {"train_loss": -6.644977569580078, "global_step": 115016, "epoch": 2738} {"train_loss": -6.391293525695801, "global_step": 115017, "epoch": 2738} {"train_loss": -6.559211730957031, "global_step": 115018, "epoch": 2738} {"train_loss": -6.442050457000732, "global_step": 115019, "epoch": 2738} {"train_loss": -6.579867362976074, "global_step": 115020, "epoch": 2738} {"train_loss": -6.478676795959473, "global_step": 115021, "epoch": 2738} {"train_loss": -6.41727352142334, "global_step": 115022, "epoch": 2738} {"train_loss": -6.535900115966797, "global_step": 115023, "epoch": 2738} {"train_loss": -6.439301013946533, "global_step": 115024, "epoch": 2738} {"train_loss": -6.568003177642822, "global_step": 115025, "epoch": 2738} {"train_loss": -6.420732498168945, "global_step": 115026, "epoch": 2738} {"train_loss": -6.595065593719482, "global_step": 115027, "epoch": 2738} {"train_loss": -6.52207088470459, "global_step": 115028, "epoch": 2738} {"train_loss": -6.433140277862549, "global_step": 115029, "epoch": 2738} {"train_loss": -6.44116735458374, "global_step": 115030, "epoch": 2738} {"train_loss": -6.415578842163086, "global_step": 115031, "epoch": 2738} {"train_loss": -6.650137901306152, "global_step": 115032, "epoch": 2738} {"train_loss": -6.41489315032959, "global_step": 115033, "epoch": 2738} {"train_loss": -6.527031898498535, "global_step": 115034, "epoch": 2738} {"train_loss": -6.455770492553711, "global_step": 115035, "epoch": 2738} {"train_loss": -6.411737442016602, "global_step": 115036, "epoch": 2738} {"train_loss": -6.473668836411976, "global_step": 115037, "epoch": 2738, "val_loss": 77332.4921875} {"train_loss": -6.27751350402832, "global_step": 115038, "epoch": 2739} {"train_loss": -6.341279029846191, "global_step": 115039, "epoch": 2739} {"train_loss": -6.397602558135986, "global_step": 115040, "epoch": 2739} {"train_loss": -6.478453636169434, "global_step": 115041, "epoch": 2739} {"train_loss": -6.360150337219238, "global_step": 115042, "epoch": 2739} {"train_loss": -6.482792854309082, "global_step": 115043, "epoch": 2739} {"train_loss": -6.479727268218994, "global_step": 115044, "epoch": 2739} {"train_loss": -6.464791774749756, "global_step": 115045, "epoch": 2739} {"train_loss": -6.386468887329102, "global_step": 115046, "epoch": 2739} {"train_loss": -6.291025638580322, "global_step": 115047, "epoch": 2739} {"train_loss": -6.396834373474121, "global_step": 115048, "epoch": 2739} {"train_loss": -6.3624267578125, "global_step": 115049, "epoch": 2739} {"train_loss": -6.5743207931518555, "global_step": 115050, "epoch": 2739} {"train_loss": -6.408100605010986, "global_step": 115051, "epoch": 2739} {"train_loss": -6.477639198303223, "global_step": 115052, "epoch": 2739} {"train_loss": -6.4203596115112305, "global_step": 115053, "epoch": 2739} {"train_loss": -6.379166603088379, "global_step": 115054, "epoch": 2739} {"train_loss": -6.47182035446167, "global_step": 115055, "epoch": 2739} {"train_loss": -6.583672523498535, "global_step": 115056, "epoch": 2739} {"train_loss": -6.454647064208984, "global_step": 115057, "epoch": 2739} {"train_loss": -6.5912933349609375, "global_step": 115058, "epoch": 2739} {"train_loss": -6.475894927978516, "global_step": 115059, "epoch": 2739} {"train_loss": -6.511443614959717, "global_step": 115060, "epoch": 2739} {"train_loss": -6.565300464630127, "global_step": 115061, "epoch": 2739} {"train_loss": -6.525511741638184, "global_step": 115062, "epoch": 2739} {"train_loss": -6.468995094299316, "global_step": 115063, "epoch": 2739} {"train_loss": -6.446463584899902, "global_step": 115064, "epoch": 2739} {"train_loss": -6.562970161437988, "global_step": 115065, "epoch": 2739} {"train_loss": -6.590124130249023, "global_step": 115066, "epoch": 2739} {"train_loss": -6.57405948638916, "global_step": 115067, "epoch": 2739} {"train_loss": -6.668001174926758, "global_step": 115068, "epoch": 2739} {"train_loss": -6.567646026611328, "global_step": 115069, "epoch": 2739} {"train_loss": -6.56959342956543, "global_step": 115070, "epoch": 2739} {"train_loss": -6.482325553894043, "global_step": 115071, "epoch": 2739} {"train_loss": -6.584656715393066, "global_step": 115072, "epoch": 2739} {"train_loss": -6.596157073974609, "global_step": 115073, "epoch": 2739} {"train_loss": -6.481256484985352, "global_step": 115074, "epoch": 2739} {"train_loss": -6.602300643920898, "global_step": 115075, "epoch": 2739} {"train_loss": -6.4929327964782715, "global_step": 115076, "epoch": 2739} {"train_loss": -6.5788960456848145, "global_step": 115077, "epoch": 2739} {"train_loss": -6.50749397277832, "global_step": 115078, "epoch": 2739} {"train_loss": -6.48226371265593, "global_step": 115079, "epoch": 2739, "val_loss": 76477.234375} {"train_loss": -6.567154884338379, "global_step": 115080, "epoch": 2740} {"train_loss": -6.569197654724121, "global_step": 115081, "epoch": 2740} {"train_loss": -6.374859809875488, "global_step": 115082, "epoch": 2740} {"train_loss": -6.468686103820801, "global_step": 115083, "epoch": 2740} {"train_loss": -6.514286994934082, "global_step": 115084, "epoch": 2740} {"train_loss": -6.59113073348999, "global_step": 115085, "epoch": 2740} {"train_loss": -6.442683219909668, "global_step": 115086, "epoch": 2740} {"train_loss": -6.424282073974609, "global_step": 115087, "epoch": 2740} {"train_loss": -6.437028408050537, "global_step": 115088, "epoch": 2740} {"train_loss": -6.537852764129639, "global_step": 115089, "epoch": 2740} {"train_loss": -6.524416446685791, "global_step": 115090, "epoch": 2740} {"train_loss": -6.494117736816406, "global_step": 115091, "epoch": 2740} {"train_loss": -6.387754917144775, "global_step": 115092, "epoch": 2740} {"train_loss": -6.382510662078857, "global_step": 115093, "epoch": 2740} {"train_loss": -6.502962112426758, "global_step": 115094, "epoch": 2740} {"train_loss": -6.379691123962402, "global_step": 115095, "epoch": 2740} {"train_loss": -6.463596343994141, "global_step": 115096, "epoch": 2740} {"train_loss": -6.411592483520508, "global_step": 115097, "epoch": 2740} {"train_loss": -6.459134101867676, "global_step": 115098, "epoch": 2740} {"train_loss": -6.513586521148682, "global_step": 115099, "epoch": 2740} {"train_loss": -6.558816909790039, "global_step": 115100, "epoch": 2740} {"train_loss": -6.616748332977295, "global_step": 115101, "epoch": 2740} {"train_loss": -6.442465305328369, "global_step": 115102, "epoch": 2740} {"train_loss": -6.575105667114258, "global_step": 115103, "epoch": 2740} {"train_loss": -6.4322075843811035, "global_step": 115104, "epoch": 2740} {"train_loss": -6.50384521484375, "global_step": 115105, "epoch": 2740} {"train_loss": -6.57603120803833, "global_step": 115106, "epoch": 2740} {"train_loss": -6.508058547973633, "global_step": 115107, "epoch": 2740} {"train_loss": -6.477755546569824, "global_step": 115108, "epoch": 2740} {"train_loss": -6.567707061767578, "global_step": 115109, "epoch": 2740} {"train_loss": -6.59848690032959, "global_step": 115110, "epoch": 2740} {"train_loss": -6.670188903808594, "global_step": 115111, "epoch": 2740} {"train_loss": -6.458574295043945, "global_step": 115112, "epoch": 2740} {"train_loss": -6.496638774871826, "global_step": 115113, "epoch": 2740} {"train_loss": -6.523021697998047, "global_step": 115114, "epoch": 2740} {"train_loss": -6.392525672912598, "global_step": 115115, "epoch": 2740} {"train_loss": -6.586767196655273, "global_step": 115116, "epoch": 2740} {"train_loss": -6.513978958129883, "global_step": 115117, "epoch": 2740} {"train_loss": -6.436840057373047, "global_step": 115118, "epoch": 2740} {"train_loss": -6.577329635620117, "global_step": 115119, "epoch": 2740} {"train_loss": -6.558216094970703, "global_step": 115120, "epoch": 2740} {"train_loss": -6.501277378627232, "global_step": 115121, "epoch": 2740, "val_loss": 76640.734375} {"train_loss": -6.468074321746826, "global_step": 115122, "epoch": 2741} {"train_loss": -6.486849784851074, "global_step": 115123, "epoch": 2741} {"train_loss": -6.593184947967529, "global_step": 115124, "epoch": 2741} {"train_loss": -6.531798839569092, "global_step": 115125, "epoch": 2741} {"train_loss": -6.59279203414917, "global_step": 115126, "epoch": 2741} {"train_loss": -6.449045658111572, "global_step": 115127, "epoch": 2741} {"train_loss": -6.411511421203613, "global_step": 115128, "epoch": 2741} {"train_loss": -6.576070308685303, "global_step": 115129, "epoch": 2741} {"train_loss": -6.479165077209473, "global_step": 115130, "epoch": 2741} {"train_loss": -6.41996955871582, "global_step": 115131, "epoch": 2741} {"train_loss": -6.413694381713867, "global_step": 115132, "epoch": 2741} {"train_loss": -6.441086769104004, "global_step": 115133, "epoch": 2741} {"train_loss": -6.41562557220459, "global_step": 115134, "epoch": 2741} {"train_loss": -6.5425214767456055, "global_step": 115135, "epoch": 2741} {"train_loss": -6.417444705963135, "global_step": 115136, "epoch": 2741} {"train_loss": -6.513827323913574, "global_step": 115137, "epoch": 2741} {"train_loss": -6.425252914428711, "global_step": 115138, "epoch": 2741} {"train_loss": -6.466748237609863, "global_step": 115139, "epoch": 2741} {"train_loss": -6.555515289306641, "global_step": 115140, "epoch": 2741} {"train_loss": -6.374307632446289, "global_step": 115141, "epoch": 2741} {"train_loss": -6.507053375244141, "global_step": 115142, "epoch": 2741} {"train_loss": -6.571138858795166, "global_step": 115143, "epoch": 2741} {"train_loss": -6.272297382354736, "global_step": 115144, "epoch": 2741} {"train_loss": -6.537073135375977, "global_step": 115145, "epoch": 2741} {"train_loss": -6.215428829193115, "global_step": 115146, "epoch": 2741} {"train_loss": -6.488065242767334, "global_step": 115147, "epoch": 2741} {"train_loss": -6.418374061584473, "global_step": 115148, "epoch": 2741} {"train_loss": -6.354702949523926, "global_step": 115149, "epoch": 2741} {"train_loss": -6.429356575012207, "global_step": 115150, "epoch": 2741} {"train_loss": -6.522341728210449, "global_step": 115151, "epoch": 2741} {"train_loss": -6.455465316772461, "global_step": 115152, "epoch": 2741} {"train_loss": -6.511514663696289, "global_step": 115153, "epoch": 2741} {"train_loss": -6.4920854568481445, "global_step": 115154, "epoch": 2741} {"train_loss": -6.496111869812012, "global_step": 115155, "epoch": 2741} {"train_loss": -6.5806989669799805, "global_step": 115156, "epoch": 2741} {"train_loss": -6.425809860229492, "global_step": 115157, "epoch": 2741} {"train_loss": -6.527295112609863, "global_step": 115158, "epoch": 2741} {"train_loss": -6.527606964111328, "global_step": 115159, "epoch": 2741} {"train_loss": -6.546853065490723, "global_step": 115160, "epoch": 2741} {"train_loss": -6.527081489562988, "global_step": 115161, "epoch": 2741} {"train_loss": -6.496532440185547, "global_step": 115162, "epoch": 2741} {"train_loss": -6.47825889360337, "global_step": 115163, "epoch": 2741, "val_loss": 76575.3125} {"train_loss": -6.546481132507324, "global_step": 115164, "epoch": 2742} {"train_loss": -6.621272563934326, "global_step": 115165, "epoch": 2742} {"train_loss": -6.4399285316467285, "global_step": 115166, "epoch": 2742} {"train_loss": -6.590451240539551, "global_step": 115167, "epoch": 2742} {"train_loss": -6.626197814941406, "global_step": 115168, "epoch": 2742} {"train_loss": -6.481969833374023, "global_step": 115169, "epoch": 2742} {"train_loss": -6.565481185913086, "global_step": 115170, "epoch": 2742} {"train_loss": -6.6369733810424805, "global_step": 115171, "epoch": 2742} {"train_loss": -6.525047302246094, "global_step": 115172, "epoch": 2742} {"train_loss": -6.5502543449401855, "global_step": 115173, "epoch": 2742} {"train_loss": -6.516947269439697, "global_step": 115174, "epoch": 2742} {"train_loss": -6.580889701843262, "global_step": 115175, "epoch": 2742} {"train_loss": -6.6445770263671875, "global_step": 115176, "epoch": 2742} {"train_loss": -6.502674102783203, "global_step": 115177, "epoch": 2742} {"train_loss": -6.566652297973633, "global_step": 115178, "epoch": 2742} {"train_loss": -6.4986252784729, "global_step": 115179, "epoch": 2742} {"train_loss": -6.4242472648620605, "global_step": 115180, "epoch": 2742} {"train_loss": -6.5647759437561035, "global_step": 115181, "epoch": 2742} {"train_loss": -6.4417009353637695, "global_step": 115182, "epoch": 2742} {"train_loss": -6.471026420593262, "global_step": 115183, "epoch": 2742} {"train_loss": -6.362917900085449, "global_step": 115184, "epoch": 2742} {"train_loss": -6.368651390075684, "global_step": 115185, "epoch": 2742} {"train_loss": -6.394564151763916, "global_step": 115186, "epoch": 2742} {"train_loss": -6.445443153381348, "global_step": 115187, "epoch": 2742} {"train_loss": -6.348094463348389, "global_step": 115188, "epoch": 2742} {"train_loss": -6.449105262756348, "global_step": 115189, "epoch": 2742} {"train_loss": -6.444660663604736, "global_step": 115190, "epoch": 2742} {"train_loss": -6.53217887878418, "global_step": 115191, "epoch": 2742} {"train_loss": -6.430086612701416, "global_step": 115192, "epoch": 2742} {"train_loss": -6.477232933044434, "global_step": 115193, "epoch": 2742} {"train_loss": -6.535016059875488, "global_step": 115194, "epoch": 2742} {"train_loss": -6.471322536468506, "global_step": 115195, "epoch": 2742} {"train_loss": -6.483463764190674, "global_step": 115196, "epoch": 2742} {"train_loss": -6.483895301818848, "global_step": 115197, "epoch": 2742} {"train_loss": -6.530041694641113, "global_step": 115198, "epoch": 2742} {"train_loss": -6.466849327087402, "global_step": 115199, "epoch": 2742} {"train_loss": -6.597823143005371, "global_step": 115200, "epoch": 2742} {"train_loss": -6.563775062561035, "global_step": 115201, "epoch": 2742} {"train_loss": -6.5211052894592285, "global_step": 115202, "epoch": 2742} {"train_loss": -6.460714340209961, "global_step": 115203, "epoch": 2742} {"train_loss": -6.585661888122559, "global_step": 115204, "epoch": 2742} {"train_loss": -6.505272729056222, "global_step": 115205, "epoch": 2742, "val_loss": 76370.8125} {"train_loss": -6.584890365600586, "global_step": 115206, "epoch": 2743} {"train_loss": -6.598194599151611, "global_step": 115207, "epoch": 2743} {"train_loss": -6.55836296081543, "global_step": 115208, "epoch": 2743} {"train_loss": -6.538717269897461, "global_step": 115209, "epoch": 2743} {"train_loss": -6.637210845947266, "global_step": 115210, "epoch": 2743} {"train_loss": -6.5360426902771, "global_step": 115211, "epoch": 2743} {"train_loss": -6.513883590698242, "global_step": 115212, "epoch": 2743} {"train_loss": -6.601223945617676, "global_step": 115213, "epoch": 2743} {"train_loss": -6.499856948852539, "global_step": 115214, "epoch": 2743} {"train_loss": -6.535423278808594, "global_step": 115215, "epoch": 2743} {"train_loss": -6.513134956359863, "global_step": 115216, "epoch": 2743} {"train_loss": -6.471652984619141, "global_step": 115217, "epoch": 2743} {"train_loss": -6.377351760864258, "global_step": 115218, "epoch": 2743} {"train_loss": -6.515786647796631, "global_step": 115219, "epoch": 2743} {"train_loss": -6.511319160461426, "global_step": 115220, "epoch": 2743} {"train_loss": -6.5165863037109375, "global_step": 115221, "epoch": 2743} {"train_loss": -6.611871719360352, "global_step": 115222, "epoch": 2743} {"train_loss": -6.472308158874512, "global_step": 115223, "epoch": 2743} {"train_loss": -6.6383771896362305, "global_step": 115224, "epoch": 2743} {"train_loss": -6.581525802612305, "global_step": 115225, "epoch": 2743} {"train_loss": -6.543193340301514, "global_step": 115226, "epoch": 2743} {"train_loss": -6.525166034698486, "global_step": 115227, "epoch": 2743} {"train_loss": -6.557986736297607, "global_step": 115228, "epoch": 2743} {"train_loss": -6.464787483215332, "global_step": 115229, "epoch": 2743} {"train_loss": -6.554019927978516, "global_step": 115230, "epoch": 2743} {"train_loss": -6.460148811340332, "global_step": 115231, "epoch": 2743} {"train_loss": -6.578607559204102, "global_step": 115232, "epoch": 2743} {"train_loss": -6.386815071105957, "global_step": 115233, "epoch": 2743} {"train_loss": -6.510119438171387, "global_step": 115234, "epoch": 2743} {"train_loss": -6.5065202713012695, "global_step": 115235, "epoch": 2743} {"train_loss": -6.455181121826172, "global_step": 115236, "epoch": 2743} {"train_loss": -6.637312412261963, "global_step": 115237, "epoch": 2743} {"train_loss": -6.492868423461914, "global_step": 115238, "epoch": 2743} {"train_loss": -6.48854923248291, "global_step": 115239, "epoch": 2743} {"train_loss": -6.525927543640137, "global_step": 115240, "epoch": 2743} {"train_loss": -6.460071086883545, "global_step": 115241, "epoch": 2743} {"train_loss": -6.481171607971191, "global_step": 115242, "epoch": 2743} {"train_loss": -6.540766716003418, "global_step": 115243, "epoch": 2743} {"train_loss": -6.471243858337402, "global_step": 115244, "epoch": 2743} {"train_loss": -6.546899795532227, "global_step": 115245, "epoch": 2743} {"train_loss": -6.570689678192139, "global_step": 115246, "epoch": 2743} {"train_loss": -6.5254040105002264, "global_step": 115247, "epoch": 2743, "val_loss": 76413.7734375} {"train_loss": -6.400235652923584, "global_step": 115248, "epoch": 2744} {"train_loss": -6.508275985717773, "global_step": 115249, "epoch": 2744} {"train_loss": -6.5781636238098145, "global_step": 115250, "epoch": 2744} {"train_loss": -6.5243144035339355, "global_step": 115251, "epoch": 2744} {"train_loss": -6.681540012359619, "global_step": 115252, "epoch": 2744} {"train_loss": -6.594627380371094, "global_step": 115253, "epoch": 2744} {"train_loss": -6.46868896484375, "global_step": 115254, "epoch": 2744} {"train_loss": -6.524297714233398, "global_step": 115255, "epoch": 2744} {"train_loss": -6.632003307342529, "global_step": 115256, "epoch": 2744} {"train_loss": -6.567536354064941, "global_step": 115257, "epoch": 2744} {"train_loss": -6.5453290939331055, "global_step": 115258, "epoch": 2744} {"train_loss": -6.5254130363464355, "global_step": 115259, "epoch": 2744} {"train_loss": -6.59030818939209, "global_step": 115260, "epoch": 2744} {"train_loss": -6.446215629577637, "global_step": 115261, "epoch": 2744} {"train_loss": -6.56740140914917, "global_step": 115262, "epoch": 2744} {"train_loss": -6.565239906311035, "global_step": 115263, "epoch": 2744} {"train_loss": -6.512166976928711, "global_step": 115264, "epoch": 2744} {"train_loss": -6.502208709716797, "global_step": 115265, "epoch": 2744} {"train_loss": -6.542389392852783, "global_step": 115266, "epoch": 2744} {"train_loss": -6.630125045776367, "global_step": 115267, "epoch": 2744} {"train_loss": -6.514157295227051, "global_step": 115268, "epoch": 2744} {"train_loss": -6.592685699462891, "global_step": 115269, "epoch": 2744} {"train_loss": -6.60501766204834, "global_step": 115270, "epoch": 2744} {"train_loss": -6.530766487121582, "global_step": 115271, "epoch": 2744} {"train_loss": -6.502870559692383, "global_step": 115272, "epoch": 2744} {"train_loss": -6.652173042297363, "global_step": 115273, "epoch": 2744} {"train_loss": -6.516768455505371, "global_step": 115274, "epoch": 2744} {"train_loss": -6.52216911315918, "global_step": 115275, "epoch": 2744} {"train_loss": -6.521061420440674, "global_step": 115276, "epoch": 2744} {"train_loss": -6.51905632019043, "global_step": 115277, "epoch": 2744} {"train_loss": -6.4990363121032715, "global_step": 115278, "epoch": 2744} {"train_loss": -6.485462665557861, "global_step": 115279, "epoch": 2744} {"train_loss": -6.581930637359619, "global_step": 115280, "epoch": 2744} {"train_loss": -6.510011196136475, "global_step": 115281, "epoch": 2744} {"train_loss": -6.454360008239746, "global_step": 115282, "epoch": 2744} {"train_loss": -6.53155517578125, "global_step": 115283, "epoch": 2744} {"train_loss": -6.5665435791015625, "global_step": 115284, "epoch": 2744} {"train_loss": -6.459965705871582, "global_step": 115285, "epoch": 2744} {"train_loss": -6.523385047912598, "global_step": 115286, "epoch": 2744} {"train_loss": -6.485245704650879, "global_step": 115287, "epoch": 2744} {"train_loss": -6.555131912231445, "global_step": 115288, "epoch": 2744} {"train_loss": -6.5392675286247615, "global_step": 115289, "epoch": 2744, "val_loss": 76803.8515625} {"train_loss": -6.598589897155762, "global_step": 115290, "epoch": 2745} {"train_loss": -6.517879962921143, "global_step": 115291, "epoch": 2745} {"train_loss": -6.5880208015441895, "global_step": 115292, "epoch": 2745} {"train_loss": -6.433619499206543, "global_step": 115293, "epoch": 2745} {"train_loss": -6.405834197998047, "global_step": 115294, "epoch": 2745} {"train_loss": -6.524365425109863, "global_step": 115295, "epoch": 2745} {"train_loss": -6.532572269439697, "global_step": 115296, "epoch": 2745} {"train_loss": -6.551875114440918, "global_step": 115297, "epoch": 2745} {"train_loss": -6.554766654968262, "global_step": 115298, "epoch": 2745} {"train_loss": -6.454050540924072, "global_step": 115299, "epoch": 2745} {"train_loss": -6.556024074554443, "global_step": 115300, "epoch": 2745} {"train_loss": -6.629372596740723, "global_step": 115301, "epoch": 2745} {"train_loss": -6.564310550689697, "global_step": 115302, "epoch": 2745} {"train_loss": -6.493746757507324, "global_step": 115303, "epoch": 2745} {"train_loss": -6.592578411102295, "global_step": 115304, "epoch": 2745} {"train_loss": -6.561266899108887, "global_step": 115305, "epoch": 2745} {"train_loss": -6.571713447570801, "global_step": 115306, "epoch": 2745} {"train_loss": -6.5717549324035645, "global_step": 115307, "epoch": 2745} {"train_loss": -6.506233215332031, "global_step": 115308, "epoch": 2745} {"train_loss": -6.548861503601074, "global_step": 115309, "epoch": 2745} {"train_loss": -6.531001091003418, "global_step": 115310, "epoch": 2745} {"train_loss": -6.575477600097656, "global_step": 115311, "epoch": 2745} {"train_loss": -6.4747419357299805, "global_step": 115312, "epoch": 2745} {"train_loss": -6.528587341308594, "global_step": 115313, "epoch": 2745} {"train_loss": -6.520652770996094, "global_step": 115314, "epoch": 2745} {"train_loss": -6.56630802154541, "global_step": 115315, "epoch": 2745} {"train_loss": -6.498748779296875, "global_step": 115316, "epoch": 2745} {"train_loss": -6.534601211547852, "global_step": 115317, "epoch": 2745} {"train_loss": -6.584559440612793, "global_step": 115318, "epoch": 2745} {"train_loss": -6.431153297424316, "global_step": 115319, "epoch": 2745} {"train_loss": -6.5496931076049805, "global_step": 115320, "epoch": 2745} {"train_loss": -6.518705368041992, "global_step": 115321, "epoch": 2745} {"train_loss": -6.416490077972412, "global_step": 115322, "epoch": 2745} {"train_loss": -6.463927268981934, "global_step": 115323, "epoch": 2745} {"train_loss": -6.415366172790527, "global_step": 115324, "epoch": 2745} {"train_loss": -6.506519317626953, "global_step": 115325, "epoch": 2745} {"train_loss": -6.483794212341309, "global_step": 115326, "epoch": 2745} {"train_loss": -6.538315773010254, "global_step": 115327, "epoch": 2745} {"train_loss": -6.550772666931152, "global_step": 115328, "epoch": 2745} {"train_loss": -6.541906356811523, "global_step": 115329, "epoch": 2745} {"train_loss": -6.488062858581543, "global_step": 115330, "epoch": 2745} {"train_loss": -6.521922781353905, "global_step": 115331, "epoch": 2745, "val_loss": 76533.5625} {"train_loss": -6.489102363586426, "global_step": 115332, "epoch": 2746} {"train_loss": -6.578245162963867, "global_step": 115333, "epoch": 2746} {"train_loss": -6.49794864654541, "global_step": 115334, "epoch": 2746} {"train_loss": -6.551426887512207, "global_step": 115335, "epoch": 2746} {"train_loss": -6.411550521850586, "global_step": 115336, "epoch": 2746} {"train_loss": -6.454770088195801, "global_step": 115337, "epoch": 2746} {"train_loss": -6.560603141784668, "global_step": 115338, "epoch": 2746} {"train_loss": -6.645823001861572, "global_step": 115339, "epoch": 2746} {"train_loss": -6.583644390106201, "global_step": 115340, "epoch": 2746} {"train_loss": -6.513059616088867, "global_step": 115341, "epoch": 2746} {"train_loss": -6.553963661193848, "global_step": 115342, "epoch": 2746} {"train_loss": -6.584355354309082, "global_step": 115343, "epoch": 2746} {"train_loss": -6.509263038635254, "global_step": 115344, "epoch": 2746} {"train_loss": -6.639474868774414, "global_step": 115345, "epoch": 2746} {"train_loss": -6.533750534057617, "global_step": 115346, "epoch": 2746} {"train_loss": -6.460230827331543, "global_step": 115347, "epoch": 2746} {"train_loss": -6.429778099060059, "global_step": 115348, "epoch": 2746} {"train_loss": -6.544898986816406, "global_step": 115349, "epoch": 2746} {"train_loss": -6.540970325469971, "global_step": 115350, "epoch": 2746} {"train_loss": -6.497077941894531, "global_step": 115351, "epoch": 2746} {"train_loss": -6.6050944328308105, "global_step": 115352, "epoch": 2746} {"train_loss": -6.514909744262695, "global_step": 115353, "epoch": 2746} {"train_loss": -6.558446407318115, "global_step": 115354, "epoch": 2746} {"train_loss": -6.478726387023926, "global_step": 115355, "epoch": 2746} {"train_loss": -6.620448112487793, "global_step": 115356, "epoch": 2746} {"train_loss": -6.53068733215332, "global_step": 115357, "epoch": 2746} {"train_loss": -6.573369026184082, "global_step": 115358, "epoch": 2746} {"train_loss": -6.55381441116333, "global_step": 115359, "epoch": 2746} {"train_loss": -6.566163063049316, "global_step": 115360, "epoch": 2746} {"train_loss": -6.516934394836426, "global_step": 115361, "epoch": 2746} {"train_loss": -6.574758529663086, "global_step": 115362, "epoch": 2746} {"train_loss": -6.527713775634766, "global_step": 115363, "epoch": 2746} {"train_loss": -6.514791488647461, "global_step": 115364, "epoch": 2746} {"train_loss": -6.457205295562744, "global_step": 115365, "epoch": 2746} {"train_loss": -6.518812656402588, "global_step": 115366, "epoch": 2746} {"train_loss": -6.5404887199401855, "global_step": 115367, "epoch": 2746} {"train_loss": -6.54913330078125, "global_step": 115368, "epoch": 2746} {"train_loss": -6.521884441375732, "global_step": 115369, "epoch": 2746} {"train_loss": -6.42908239364624, "global_step": 115370, "epoch": 2746} {"train_loss": -6.459282875061035, "global_step": 115371, "epoch": 2746} {"train_loss": -6.61994743347168, "global_step": 115372, "epoch": 2746} {"train_loss": -6.529447214944022, "global_step": 115373, "epoch": 2746, "val_loss": 76936.46875} {"train_loss": -6.51592493057251, "global_step": 115374, "epoch": 2747} {"train_loss": -6.458707809448242, "global_step": 115375, "epoch": 2747} {"train_loss": -6.468445777893066, "global_step": 115376, "epoch": 2747} {"train_loss": -6.480237007141113, "global_step": 115377, "epoch": 2747} {"train_loss": -6.700400352478027, "global_step": 115378, "epoch": 2747} {"train_loss": -6.540194988250732, "global_step": 115379, "epoch": 2747} {"train_loss": -6.525450706481934, "global_step": 115380, "epoch": 2747} {"train_loss": -6.621277809143066, "global_step": 115381, "epoch": 2747} {"train_loss": -6.647068977355957, "global_step": 115382, "epoch": 2747} {"train_loss": -6.4643073081970215, "global_step": 115383, "epoch": 2747} {"train_loss": -6.495151042938232, "global_step": 115384, "epoch": 2747} {"train_loss": -6.532536506652832, "global_step": 115385, "epoch": 2747} {"train_loss": -6.492162704467773, "global_step": 115386, "epoch": 2747} {"train_loss": -6.491559028625488, "global_step": 115387, "epoch": 2747} {"train_loss": -6.501946449279785, "global_step": 115388, "epoch": 2747} {"train_loss": -6.575002193450928, "global_step": 115389, "epoch": 2747} {"train_loss": -6.508584976196289, "global_step": 115390, "epoch": 2747} {"train_loss": -6.551823616027832, "global_step": 115391, "epoch": 2747} {"train_loss": -6.605562686920166, "global_step": 115392, "epoch": 2747} {"train_loss": -6.608997344970703, "global_step": 115393, "epoch": 2747} {"train_loss": -6.4090447425842285, "global_step": 115394, "epoch": 2747} {"train_loss": -6.441217422485352, "global_step": 115395, "epoch": 2747} {"train_loss": -6.422577857971191, "global_step": 115396, "epoch": 2747} {"train_loss": -6.652162075042725, "global_step": 115397, "epoch": 2747} {"train_loss": -6.57127046585083, "global_step": 115398, "epoch": 2747} {"train_loss": -6.532628059387207, "global_step": 115399, "epoch": 2747} {"train_loss": -6.4581098556518555, "global_step": 115400, "epoch": 2747} {"train_loss": -6.381570339202881, "global_step": 115401, "epoch": 2747} {"train_loss": -6.584179878234863, "global_step": 115402, "epoch": 2747} {"train_loss": -6.517624855041504, "global_step": 115403, "epoch": 2747} {"train_loss": -6.532001495361328, "global_step": 115404, "epoch": 2747} {"train_loss": -6.555947780609131, "global_step": 115405, "epoch": 2747} {"train_loss": -6.489716053009033, "global_step": 115406, "epoch": 2747} {"train_loss": -6.644060134887695, "global_step": 115407, "epoch": 2747} {"train_loss": -6.341001987457275, "global_step": 115408, "epoch": 2747} {"train_loss": -6.449103355407715, "global_step": 115409, "epoch": 2747} {"train_loss": -6.454616546630859, "global_step": 115410, "epoch": 2747} {"train_loss": -6.45950984954834, "global_step": 115411, "epoch": 2747} {"train_loss": -6.450558662414551, "global_step": 115412, "epoch": 2747} {"train_loss": -6.376986980438232, "global_step": 115413, "epoch": 2747} {"train_loss": -6.573781490325928, "global_step": 115414, "epoch": 2747} {"train_loss": -6.512291158948626, "global_step": 115415, "epoch": 2747, "val_loss": 76905.234375} {"train_loss": -6.560000896453857, "global_step": 115416, "epoch": 2748} {"train_loss": -6.6356964111328125, "global_step": 115417, "epoch": 2748} {"train_loss": -6.493171215057373, "global_step": 115418, "epoch": 2748} {"train_loss": -6.519110679626465, "global_step": 115419, "epoch": 2748} {"train_loss": -6.45998477935791, "global_step": 115420, "epoch": 2748} {"train_loss": -6.514061450958252, "global_step": 115421, "epoch": 2748} {"train_loss": -6.558706283569336, "global_step": 115422, "epoch": 2748} {"train_loss": -6.493293762207031, "global_step": 115423, "epoch": 2748} {"train_loss": -6.623693943023682, "global_step": 115424, "epoch": 2748} {"train_loss": -6.496238708496094, "global_step": 115425, "epoch": 2748} {"train_loss": -6.4892072677612305, "global_step": 115426, "epoch": 2748} {"train_loss": -6.585236549377441, "global_step": 115427, "epoch": 2748} {"train_loss": -6.629652500152588, "global_step": 115428, "epoch": 2748} {"train_loss": -6.488072872161865, "global_step": 115429, "epoch": 2748} {"train_loss": -6.547589302062988, "global_step": 115430, "epoch": 2748} {"train_loss": -6.533524513244629, "global_step": 115431, "epoch": 2748} {"train_loss": -6.518016815185547, "global_step": 115432, "epoch": 2748} {"train_loss": -6.516948699951172, "global_step": 115433, "epoch": 2748} {"train_loss": -6.489640235900879, "global_step": 115434, "epoch": 2748} {"train_loss": -6.483267784118652, "global_step": 115435, "epoch": 2748} {"train_loss": -6.438587665557861, "global_step": 115436, "epoch": 2748} {"train_loss": -6.495627403259277, "global_step": 115437, "epoch": 2748} {"train_loss": -6.542365550994873, "global_step": 115438, "epoch": 2748} {"train_loss": -6.470770835876465, "global_step": 115439, "epoch": 2748} {"train_loss": -6.547397613525391, "global_step": 115440, "epoch": 2748} {"train_loss": -6.4343037605285645, "global_step": 115441, "epoch": 2748} {"train_loss": -6.579744338989258, "global_step": 115442, "epoch": 2748} {"train_loss": -6.488048553466797, "global_step": 115443, "epoch": 2748} {"train_loss": -6.480222702026367, "global_step": 115444, "epoch": 2748} {"train_loss": -6.511427879333496, "global_step": 115445, "epoch": 2748} {"train_loss": -6.516689777374268, "global_step": 115446, "epoch": 2748} {"train_loss": -6.5786638259887695, "global_step": 115447, "epoch": 2748} {"train_loss": -6.594773292541504, "global_step": 115448, "epoch": 2748} {"train_loss": -6.575789451599121, "global_step": 115449, "epoch": 2748} {"train_loss": -6.444890975952148, "global_step": 115450, "epoch": 2748} {"train_loss": -6.580230712890625, "global_step": 115451, "epoch": 2748} {"train_loss": -6.561801433563232, "global_step": 115452, "epoch": 2748} {"train_loss": -6.505436897277832, "global_step": 115453, "epoch": 2748} {"train_loss": -6.5198588371276855, "global_step": 115454, "epoch": 2748} {"train_loss": -6.426431655883789, "global_step": 115455, "epoch": 2748} {"train_loss": -6.490479469299316, "global_step": 115456, "epoch": 2748} {"train_loss": -6.52122213726952, "global_step": 115457, "epoch": 2748, "val_loss": 76946.859375} {"train_loss": -6.469017505645752, "global_step": 115458, "epoch": 2749} {"train_loss": -6.552917003631592, "global_step": 115459, "epoch": 2749} {"train_loss": -6.547188758850098, "global_step": 115460, "epoch": 2749} {"train_loss": -6.638454437255859, "global_step": 115461, "epoch": 2749} {"train_loss": -6.439616680145264, "global_step": 115462, "epoch": 2749} {"train_loss": -6.548230171203613, "global_step": 115463, "epoch": 2749} {"train_loss": -6.503052711486816, "global_step": 115464, "epoch": 2749} {"train_loss": -6.5615081787109375, "global_step": 115465, "epoch": 2749} {"train_loss": -6.498785018920898, "global_step": 115466, "epoch": 2749} {"train_loss": -6.533114910125732, "global_step": 115467, "epoch": 2749} {"train_loss": -6.662867546081543, "global_step": 115468, "epoch": 2749} {"train_loss": -6.711833953857422, "global_step": 115469, "epoch": 2749} {"train_loss": -6.482974052429199, "global_step": 115470, "epoch": 2749} {"train_loss": -6.542248725891113, "global_step": 115471, "epoch": 2749} {"train_loss": -6.474034309387207, "global_step": 115472, "epoch": 2749} {"train_loss": -6.6422929763793945, "global_step": 115473, "epoch": 2749} {"train_loss": -6.6112213134765625, "global_step": 115474, "epoch": 2749} {"train_loss": -6.5164031982421875, "global_step": 115475, "epoch": 2749} {"train_loss": -6.490505218505859, "global_step": 115476, "epoch": 2749} {"train_loss": -6.627943992614746, "global_step": 115477, "epoch": 2749} {"train_loss": -6.469900608062744, "global_step": 115478, "epoch": 2749} {"train_loss": -6.547727108001709, "global_step": 115479, "epoch": 2749} {"train_loss": -6.66675329208374, "global_step": 115480, "epoch": 2749} {"train_loss": -6.544456481933594, "global_step": 115481, "epoch": 2749} {"train_loss": -6.398724555969238, "global_step": 115482, "epoch": 2749} {"train_loss": -6.474409103393555, "global_step": 115483, "epoch": 2749} {"train_loss": -6.525229454040527, "global_step": 115484, "epoch": 2749} {"train_loss": -6.5565385818481445, "global_step": 115485, "epoch": 2749} {"train_loss": -6.575997352600098, "global_step": 115486, "epoch": 2749} {"train_loss": -6.40120267868042, "global_step": 115487, "epoch": 2749} {"train_loss": -6.6288909912109375, "global_step": 115488, "epoch": 2749} {"train_loss": -6.488881587982178, "global_step": 115489, "epoch": 2749} {"train_loss": -6.602535247802734, "global_step": 115490, "epoch": 2749} {"train_loss": -6.440601825714111, "global_step": 115491, "epoch": 2749} {"train_loss": -6.572474479675293, "global_step": 115492, "epoch": 2749} {"train_loss": -6.645552635192871, "global_step": 115493, "epoch": 2749} {"train_loss": -6.5328850746154785, "global_step": 115494, "epoch": 2749} {"train_loss": -6.559300422668457, "global_step": 115495, "epoch": 2749} {"train_loss": -6.480088710784912, "global_step": 115496, "epoch": 2749} {"train_loss": -6.559447288513184, "global_step": 115497, "epoch": 2749} {"train_loss": -6.514493465423584, "global_step": 115498, "epoch": 2749} {"train_loss": -6.542313904989333, "global_step": 115499, "epoch": 2749, "val_loss": 76706.8046875} {"train_loss": -6.469792366027832, "global_step": 115500, "epoch": 2750} {"train_loss": -6.511958122253418, "global_step": 115501, "epoch": 2750} {"train_loss": -6.381398677825928, "global_step": 115502, "epoch": 2750} {"train_loss": -6.3844828605651855, "global_step": 115503, "epoch": 2750} {"train_loss": -6.350281715393066, "global_step": 115504, "epoch": 2750} {"train_loss": -6.472914695739746, "global_step": 115505, "epoch": 2750} {"train_loss": -6.5401291847229, "global_step": 115506, "epoch": 2750} {"train_loss": -6.4366021156311035, "global_step": 115507, "epoch": 2750} {"train_loss": -6.391690731048584, "global_step": 115508, "epoch": 2750} {"train_loss": -6.292741775512695, "global_step": 115509, "epoch": 2750} {"train_loss": -6.381074905395508, "global_step": 115510, "epoch": 2750} {"train_loss": -6.466636657714844, "global_step": 115511, "epoch": 2750} {"train_loss": -6.4468183517456055, "global_step": 115512, "epoch": 2750} {"train_loss": -6.46176815032959, "global_step": 115513, "epoch": 2750} {"train_loss": -6.46138858795166, "global_step": 115514, "epoch": 2750} {"train_loss": -6.467109203338623, "global_step": 115515, "epoch": 2750} {"train_loss": -6.392137050628662, "global_step": 115516, "epoch": 2750} {"train_loss": -6.419975280761719, "global_step": 115517, "epoch": 2750} {"train_loss": -6.437961101531982, "global_step": 115518, "epoch": 2750} {"train_loss": -6.491109848022461, "global_step": 115519, "epoch": 2750} {"train_loss": -6.3352460861206055, "global_step": 115520, "epoch": 2750} {"train_loss": -6.457900047302246, "global_step": 115521, "epoch": 2750} {"train_loss": -6.5801472663879395, "global_step": 115522, "epoch": 2750} {"train_loss": -6.468255043029785, "global_step": 115523, "epoch": 2750} {"train_loss": -6.545289039611816, "global_step": 115524, "epoch": 2750} {"train_loss": -6.548317909240723, "global_step": 115525, "epoch": 2750} {"train_loss": -6.488381862640381, "global_step": 115526, "epoch": 2750} {"train_loss": -6.47995662689209, "global_step": 115527, "epoch": 2750} {"train_loss": -6.430703163146973, "global_step": 115528, "epoch": 2750} {"train_loss": -6.546958923339844, "global_step": 115529, "epoch": 2750} {"train_loss": -6.568563461303711, "global_step": 115530, "epoch": 2750} {"train_loss": -6.49969482421875, "global_step": 115531, "epoch": 2750} {"train_loss": -6.420187950134277, "global_step": 115532, "epoch": 2750} {"train_loss": -6.558916091918945, "global_step": 115533, "epoch": 2750} {"train_loss": -6.51441764831543, "global_step": 115534, "epoch": 2750} {"train_loss": -6.612619876861572, "global_step": 115535, "epoch": 2750} {"train_loss": -6.557265758514404, "global_step": 115536, "epoch": 2750} {"train_loss": -6.37853479385376, "global_step": 115537, "epoch": 2750} {"train_loss": -6.496264457702637, "global_step": 115538, "epoch": 2750} {"train_loss": -6.464648246765137, "global_step": 115539, "epoch": 2750} {"train_loss": -6.6267499923706055, "global_step": 115540, "epoch": 2750} {"train_loss": -6.468911012013753, "global_step": 115541, "epoch": 2750, "train/sim_max_reward_0": 0.8799448566206811, "train/sim_max_reward_1": 0.9977873686715114, "train/sim_max_reward_2": 0.4668485886634191, "train/sim_max_reward_3": 0.15658132484458037, "train/sim_max_reward_4": 0.884031414201232, "train/sim_max_reward_5": 0.9166120402563696, "test/sim_max_reward_4500000": 0.9758281222613707, "test/sim_max_reward_4500001": 0.8726826152838645, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9949499230929475, "test/sim_max_reward_4500004": 0.14728545309862762, "test/sim_max_reward_4500005": 0.2624639794887017, "test/sim_max_reward_4500006": 0.9949561441257609, "test/sim_max_reward_4500007": 0.9569688628912525, "test/sim_max_reward_4500008": 0.28060048238104335, "test/sim_max_reward_4500009": 0.9060466748691408, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.06928980009302493, "test/sim_max_reward_4500012": 0.14699929956885094, "test/sim_max_reward_4500013": 0.009860670342931342, "test/sim_max_reward_4500014": 0.24782329450110988, "test/sim_max_reward_4500015": 0.8947317836612357, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.04176248988002679, "test/sim_max_reward_4500018": 0.9187690872849609, "test/sim_max_reward_4500019": 0.39496762743265895, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8711964472387185, "test/sim_max_reward_4500022": 0.42258381959512703, "test/sim_max_reward_4500023": 0.986524645805288, "test/sim_max_reward_4500024": 0.9293661497676484, "test/sim_max_reward_4500025": 0.9287087526768351, "test/sim_max_reward_4500026": 0.7452463542950428, "test/sim_max_reward_4500027": 0.9073073705628594, "test/sim_max_reward_4500028": 0.19364901856337666, "test/sim_max_reward_4500029": 0.2570437797211783, "test/sim_max_reward_4500030": 0.9512080434582533, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9880480600574109, "test/sim_max_reward_4500034": 0.87240630034971, "test/sim_max_reward_4500035": 0.5643729071105152, "test/sim_max_reward_4500036": 0.9036156243475545, "test/sim_max_reward_4500037": 0.9882734567655953, "test/sim_max_reward_4500038": 0.9715490550168349, "test/sim_max_reward_4500039": 0.8173602477560498, "test/sim_max_reward_4500040": 0.9112175843324131, "test/sim_max_reward_4500041": 0.4263565772058924, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.3408671829292147, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9788806969061316, "test/sim_max_reward_4500046": 0.9070851482771173, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 0.9673202838616745, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.7169675988762988, "test/mean_score": 0.5806533422916157, "val_loss": 76563.8203125} {"train_loss": -6.5507354736328125, "global_step": 115542, "epoch": 2751} {"train_loss": -6.461398124694824, "global_step": 115543, "epoch": 2751} {"train_loss": -6.655169486999512, "global_step": 115544, "epoch": 2751} {"train_loss": -6.628379821777344, "global_step": 115545, "epoch": 2751} {"train_loss": -6.576966285705566, "global_step": 115546, "epoch": 2751} {"train_loss": -6.587309837341309, "global_step": 115547, "epoch": 2751} {"train_loss": -6.501038074493408, "global_step": 115548, "epoch": 2751} {"train_loss": -6.56256103515625, "global_step": 115549, "epoch": 2751} {"train_loss": -6.619952201843262, "global_step": 115550, "epoch": 2751} {"train_loss": -6.629441261291504, "global_step": 115551, "epoch": 2751} {"train_loss": -6.491838455200195, "global_step": 115552, "epoch": 2751} {"train_loss": -6.622767925262451, "global_step": 115553, "epoch": 2751} {"train_loss": -6.6150922775268555, "global_step": 115554, "epoch": 2751} {"train_loss": -6.505492687225342, "global_step": 115555, "epoch": 2751} {"train_loss": -6.574158668518066, "global_step": 115556, "epoch": 2751} {"train_loss": -6.5370025634765625, "global_step": 115557, "epoch": 2751} {"train_loss": -6.588944435119629, "global_step": 115558, "epoch": 2751} {"train_loss": -6.539461135864258, "global_step": 115559, "epoch": 2751} {"train_loss": -6.590935707092285, "global_step": 115560, "epoch": 2751} {"train_loss": -6.587567329406738, "global_step": 115561, "epoch": 2751} {"train_loss": -6.4848833084106445, "global_step": 115562, "epoch": 2751} {"train_loss": -6.631887435913086, "global_step": 115563, "epoch": 2751} {"train_loss": -6.589113235473633, "global_step": 115564, "epoch": 2751} {"train_loss": -6.417385101318359, "global_step": 115565, "epoch": 2751} {"train_loss": -6.477025985717773, "global_step": 115566, "epoch": 2751} {"train_loss": -6.454141139984131, "global_step": 115567, "epoch": 2751} {"train_loss": -6.428730487823486, "global_step": 115568, "epoch": 2751} {"train_loss": -6.587378978729248, "global_step": 115569, "epoch": 2751} {"train_loss": -6.384120464324951, "global_step": 115570, "epoch": 2751} {"train_loss": -6.3556976318359375, "global_step": 115571, "epoch": 2751} {"train_loss": -6.489529609680176, "global_step": 115572, "epoch": 2751} {"train_loss": -6.368024826049805, "global_step": 115573, "epoch": 2751} {"train_loss": -6.432692527770996, "global_step": 115574, "epoch": 2751} {"train_loss": -6.622637748718262, "global_step": 115575, "epoch": 2751} {"train_loss": -6.494931221008301, "global_step": 115576, "epoch": 2751} {"train_loss": -6.614843368530273, "global_step": 115577, "epoch": 2751} {"train_loss": -6.5506439208984375, "global_step": 115578, "epoch": 2751} {"train_loss": -6.489171504974365, "global_step": 115579, "epoch": 2751} {"train_loss": -6.502490997314453, "global_step": 115580, "epoch": 2751} {"train_loss": -6.425258159637451, "global_step": 115581, "epoch": 2751} {"train_loss": -6.465973377227783, "global_step": 115582, "epoch": 2751} {"train_loss": -6.527170010975429, "global_step": 115583, "epoch": 2751, "val_loss": 76553.0078125} {"train_loss": -6.5476579666137695, "global_step": 115584, "epoch": 2752} {"train_loss": -6.50467586517334, "global_step": 115585, "epoch": 2752} {"train_loss": -6.564688205718994, "global_step": 115586, "epoch": 2752} {"train_loss": -6.7306365966796875, "global_step": 115587, "epoch": 2752} {"train_loss": -6.578215599060059, "global_step": 115588, "epoch": 2752} {"train_loss": -6.502824783325195, "global_step": 115589, "epoch": 2752} {"train_loss": -6.5665483474731445, "global_step": 115590, "epoch": 2752} {"train_loss": -6.59804630279541, "global_step": 115591, "epoch": 2752} {"train_loss": -6.609952926635742, "global_step": 115592, "epoch": 2752} {"train_loss": -6.535224437713623, "global_step": 115593, "epoch": 2752} {"train_loss": -6.574643135070801, "global_step": 115594, "epoch": 2752} {"train_loss": -6.640629768371582, "global_step": 115595, "epoch": 2752} {"train_loss": -6.5011186599731445, "global_step": 115596, "epoch": 2752} {"train_loss": -6.558370590209961, "global_step": 115597, "epoch": 2752} {"train_loss": -6.591951847076416, "global_step": 115598, "epoch": 2752} {"train_loss": -6.505784034729004, "global_step": 115599, "epoch": 2752} {"train_loss": -6.644831657409668, "global_step": 115600, "epoch": 2752} {"train_loss": -6.377516746520996, "global_step": 115601, "epoch": 2752} {"train_loss": -6.420037269592285, "global_step": 115602, "epoch": 2752} {"train_loss": -6.552725791931152, "global_step": 115603, "epoch": 2752} {"train_loss": -6.2105183601379395, "global_step": 115604, "epoch": 2752} {"train_loss": -6.477364540100098, "global_step": 115605, "epoch": 2752} {"train_loss": -6.398612976074219, "global_step": 115606, "epoch": 2752} {"train_loss": -6.360716819763184, "global_step": 115607, "epoch": 2752} {"train_loss": -6.525426864624023, "global_step": 115608, "epoch": 2752} {"train_loss": -6.420633316040039, "global_step": 115609, "epoch": 2752} {"train_loss": -6.394931793212891, "global_step": 115610, "epoch": 2752} {"train_loss": -6.482123374938965, "global_step": 115611, "epoch": 2752} {"train_loss": -6.383347034454346, "global_step": 115612, "epoch": 2752} {"train_loss": -6.45565128326416, "global_step": 115613, "epoch": 2752} {"train_loss": -6.410579681396484, "global_step": 115614, "epoch": 2752} {"train_loss": -6.485700607299805, "global_step": 115615, "epoch": 2752} {"train_loss": -6.4198503494262695, "global_step": 115616, "epoch": 2752} {"train_loss": -6.440908908843994, "global_step": 115617, "epoch": 2752} {"train_loss": -6.3410139083862305, "global_step": 115618, "epoch": 2752} {"train_loss": -6.430598258972168, "global_step": 115619, "epoch": 2752} {"train_loss": -6.3718767166137695, "global_step": 115620, "epoch": 2752} {"train_loss": -6.4395751953125, "global_step": 115621, "epoch": 2752} {"train_loss": -6.4807305335998535, "global_step": 115622, "epoch": 2752} {"train_loss": -6.47874116897583, "global_step": 115623, "epoch": 2752} {"train_loss": -6.420619964599609, "global_step": 115624, "epoch": 2752} {"train_loss": -6.485924788883755, "global_step": 115625, "epoch": 2752, "val_loss": 76805.84375} {"train_loss": -6.470047950744629, "global_step": 115626, "epoch": 2753} {"train_loss": -6.487227439880371, "global_step": 115627, "epoch": 2753} {"train_loss": -6.419987678527832, "global_step": 115628, "epoch": 2753} {"train_loss": -6.475404262542725, "global_step": 115629, "epoch": 2753} {"train_loss": -6.483465194702148, "global_step": 115630, "epoch": 2753} {"train_loss": -6.485916614532471, "global_step": 115631, "epoch": 2753} {"train_loss": -6.404675483703613, "global_step": 115632, "epoch": 2753} {"train_loss": -6.457717418670654, "global_step": 115633, "epoch": 2753} {"train_loss": -6.412787437438965, "global_step": 115634, "epoch": 2753} {"train_loss": -6.415870666503906, "global_step": 115635, "epoch": 2753} {"train_loss": -6.363576412200928, "global_step": 115636, "epoch": 2753} {"train_loss": -6.546667098999023, "global_step": 115637, "epoch": 2753} {"train_loss": -6.357439041137695, "global_step": 115638, "epoch": 2753} {"train_loss": -6.481295585632324, "global_step": 115639, "epoch": 2753} {"train_loss": -6.51131534576416, "global_step": 115640, "epoch": 2753} {"train_loss": -6.337958335876465, "global_step": 115641, "epoch": 2753} {"train_loss": -6.56259298324585, "global_step": 115642, "epoch": 2753} {"train_loss": -6.472448825836182, "global_step": 115643, "epoch": 2753} {"train_loss": -6.48956823348999, "global_step": 115644, "epoch": 2753} {"train_loss": -6.5167236328125, "global_step": 115645, "epoch": 2753} {"train_loss": -6.454658508300781, "global_step": 115646, "epoch": 2753} {"train_loss": -6.5389790534973145, "global_step": 115647, "epoch": 2753} {"train_loss": -6.49949312210083, "global_step": 115648, "epoch": 2753} {"train_loss": -6.4387922286987305, "global_step": 115649, "epoch": 2753} {"train_loss": -6.3856987953186035, "global_step": 115650, "epoch": 2753} {"train_loss": -6.472431182861328, "global_step": 115651, "epoch": 2753} {"train_loss": -6.438553333282471, "global_step": 115652, "epoch": 2753} {"train_loss": -6.417113304138184, "global_step": 115653, "epoch": 2753} {"train_loss": -6.492164611816406, "global_step": 115654, "epoch": 2753} {"train_loss": -6.3997955322265625, "global_step": 115655, "epoch": 2753} {"train_loss": -6.410004138946533, "global_step": 115656, "epoch": 2753} {"train_loss": -6.557662010192871, "global_step": 115657, "epoch": 2753} {"train_loss": -6.5006914138793945, "global_step": 115658, "epoch": 2753} {"train_loss": -6.535917282104492, "global_step": 115659, "epoch": 2753} {"train_loss": -6.528280258178711, "global_step": 115660, "epoch": 2753} {"train_loss": -6.387139320373535, "global_step": 115661, "epoch": 2753} {"train_loss": -6.479381561279297, "global_step": 115662, "epoch": 2753} {"train_loss": -6.617894649505615, "global_step": 115663, "epoch": 2753} {"train_loss": -6.548707962036133, "global_step": 115664, "epoch": 2753} {"train_loss": -6.521903991699219, "global_step": 115665, "epoch": 2753} {"train_loss": -6.552870750427246, "global_step": 115666, "epoch": 2753} {"train_loss": -6.471449908756075, "global_step": 115667, "epoch": 2753, "val_loss": 76595.890625} {"train_loss": -6.47341251373291, "global_step": 115668, "epoch": 2754} {"train_loss": -6.479063987731934, "global_step": 115669, "epoch": 2754} {"train_loss": -6.550325393676758, "global_step": 115670, "epoch": 2754} {"train_loss": -6.436416149139404, "global_step": 115671, "epoch": 2754} {"train_loss": -6.557351112365723, "global_step": 115672, "epoch": 2754} {"train_loss": -6.503101348876953, "global_step": 115673, "epoch": 2754} {"train_loss": -6.440079212188721, "global_step": 115674, "epoch": 2754} {"train_loss": -6.556977272033691, "global_step": 115675, "epoch": 2754} {"train_loss": -6.374722480773926, "global_step": 115676, "epoch": 2754} {"train_loss": -6.413824558258057, "global_step": 115677, "epoch": 2754} {"train_loss": -6.528937816619873, "global_step": 115678, "epoch": 2754} {"train_loss": -6.493656158447266, "global_step": 115679, "epoch": 2754} {"train_loss": -6.489823341369629, "global_step": 115680, "epoch": 2754} {"train_loss": -6.507155418395996, "global_step": 115681, "epoch": 2754} {"train_loss": -6.496608734130859, "global_step": 115682, "epoch": 2754} {"train_loss": -6.427740097045898, "global_step": 115683, "epoch": 2754} {"train_loss": -6.542087554931641, "global_step": 115684, "epoch": 2754} {"train_loss": -6.467233657836914, "global_step": 115685, "epoch": 2754} {"train_loss": -6.573314666748047, "global_step": 115686, "epoch": 2754} {"train_loss": -6.427773952484131, "global_step": 115687, "epoch": 2754} {"train_loss": -6.501560211181641, "global_step": 115688, "epoch": 2754} {"train_loss": -6.4543352127075195, "global_step": 115689, "epoch": 2754} {"train_loss": -6.512268543243408, "global_step": 115690, "epoch": 2754} {"train_loss": -6.4737443923950195, "global_step": 115691, "epoch": 2754} {"train_loss": -6.44703483581543, "global_step": 115692, "epoch": 2754} {"train_loss": -6.456831932067871, "global_step": 115693, "epoch": 2754} {"train_loss": -6.523238658905029, "global_step": 115694, "epoch": 2754} {"train_loss": -6.550471305847168, "global_step": 115695, "epoch": 2754} {"train_loss": -6.500685691833496, "global_step": 115696, "epoch": 2754} {"train_loss": -6.6409711837768555, "global_step": 115697, "epoch": 2754} {"train_loss": -6.526907920837402, "global_step": 115698, "epoch": 2754} {"train_loss": -6.512933731079102, "global_step": 115699, "epoch": 2754} {"train_loss": -6.549422264099121, "global_step": 115700, "epoch": 2754} {"train_loss": -6.397546291351318, "global_step": 115701, "epoch": 2754} {"train_loss": -6.548532485961914, "global_step": 115702, "epoch": 2754} {"train_loss": -6.482852935791016, "global_step": 115703, "epoch": 2754} {"train_loss": -6.503641605377197, "global_step": 115704, "epoch": 2754} {"train_loss": -6.502177715301514, "global_step": 115705, "epoch": 2754} {"train_loss": -6.513490676879883, "global_step": 115706, "epoch": 2754} {"train_loss": -6.471472263336182, "global_step": 115707, "epoch": 2754} {"train_loss": -6.492239952087402, "global_step": 115708, "epoch": 2754} {"train_loss": -6.4957747005280995, "global_step": 115709, "epoch": 2754, "val_loss": 76682.8984375} {"train_loss": -6.503237247467041, "global_step": 115710, "epoch": 2755} {"train_loss": -6.4674296379089355, "global_step": 115711, "epoch": 2755} {"train_loss": -6.594820022583008, "global_step": 115712, "epoch": 2755} {"train_loss": -6.543270587921143, "global_step": 115713, "epoch": 2755} {"train_loss": -6.487936973571777, "global_step": 115714, "epoch": 2755} {"train_loss": -6.39992618560791, "global_step": 115715, "epoch": 2755} {"train_loss": -6.4374213218688965, "global_step": 115716, "epoch": 2755} {"train_loss": -6.488740921020508, "global_step": 115717, "epoch": 2755} {"train_loss": -6.368758201599121, "global_step": 115718, "epoch": 2755} {"train_loss": -6.48486852645874, "global_step": 115719, "epoch": 2755} {"train_loss": -6.484185218811035, "global_step": 115720, "epoch": 2755} {"train_loss": -6.40991735458374, "global_step": 115721, "epoch": 2755} {"train_loss": -6.542431831359863, "global_step": 115722, "epoch": 2755} {"train_loss": -6.4354448318481445, "global_step": 115723, "epoch": 2755} {"train_loss": -6.470809459686279, "global_step": 115724, "epoch": 2755} {"train_loss": -6.482508182525635, "global_step": 115725, "epoch": 2755} {"train_loss": -6.541663646697998, "global_step": 115726, "epoch": 2755} {"train_loss": -6.390159606933594, "global_step": 115727, "epoch": 2755} {"train_loss": -6.477323532104492, "global_step": 115728, "epoch": 2755} {"train_loss": -6.642600059509277, "global_step": 115729, "epoch": 2755} {"train_loss": -6.48199462890625, "global_step": 115730, "epoch": 2755} {"train_loss": -6.506470203399658, "global_step": 115731, "epoch": 2755} {"train_loss": -6.511272430419922, "global_step": 115732, "epoch": 2755} {"train_loss": -6.443910598754883, "global_step": 115733, "epoch": 2755} {"train_loss": -6.4995293617248535, "global_step": 115734, "epoch": 2755} {"train_loss": -6.493432998657227, "global_step": 115735, "epoch": 2755} {"train_loss": -6.484389305114746, "global_step": 115736, "epoch": 2755} {"train_loss": -6.627549171447754, "global_step": 115737, "epoch": 2755} {"train_loss": -6.56679630279541, "global_step": 115738, "epoch": 2755} {"train_loss": -6.460626602172852, "global_step": 115739, "epoch": 2755} {"train_loss": -6.485457420349121, "global_step": 115740, "epoch": 2755} {"train_loss": -6.492006301879883, "global_step": 115741, "epoch": 2755} {"train_loss": -6.544909954071045, "global_step": 115742, "epoch": 2755} {"train_loss": -6.420612335205078, "global_step": 115743, "epoch": 2755} {"train_loss": -6.587904453277588, "global_step": 115744, "epoch": 2755} {"train_loss": -6.542624473571777, "global_step": 115745, "epoch": 2755} {"train_loss": -6.43592643737793, "global_step": 115746, "epoch": 2755} {"train_loss": -6.5132670402526855, "global_step": 115747, "epoch": 2755} {"train_loss": -6.442059516906738, "global_step": 115748, "epoch": 2755} {"train_loss": -6.490879535675049, "global_step": 115749, "epoch": 2755} {"train_loss": -6.544229507446289, "global_step": 115750, "epoch": 2755} {"train_loss": -6.492414338248117, "global_step": 115751, "epoch": 2755, "val_loss": 76336.6484375} {"train_loss": -6.501201629638672, "global_step": 115752, "epoch": 2756} {"train_loss": -6.517209053039551, "global_step": 115753, "epoch": 2756} {"train_loss": -6.479747772216797, "global_step": 115754, "epoch": 2756} {"train_loss": -6.455131530761719, "global_step": 115755, "epoch": 2756} {"train_loss": -6.480609893798828, "global_step": 115756, "epoch": 2756} {"train_loss": -6.54358434677124, "global_step": 115757, "epoch": 2756} {"train_loss": -6.462643623352051, "global_step": 115758, "epoch": 2756} {"train_loss": -6.475521564483643, "global_step": 115759, "epoch": 2756} {"train_loss": -6.517980098724365, "global_step": 115760, "epoch": 2756} {"train_loss": -6.437730312347412, "global_step": 115761, "epoch": 2756} {"train_loss": -6.547645568847656, "global_step": 115762, "epoch": 2756} {"train_loss": -6.6297760009765625, "global_step": 115763, "epoch": 2756} {"train_loss": -6.417088031768799, "global_step": 115764, "epoch": 2756} {"train_loss": -6.418548107147217, "global_step": 115765, "epoch": 2756} {"train_loss": -6.558427810668945, "global_step": 115766, "epoch": 2756} {"train_loss": -6.524566650390625, "global_step": 115767, "epoch": 2756} {"train_loss": -6.418625831604004, "global_step": 115768, "epoch": 2756} {"train_loss": -6.345593452453613, "global_step": 115769, "epoch": 2756} {"train_loss": -6.58286190032959, "global_step": 115770, "epoch": 2756} {"train_loss": -6.538804054260254, "global_step": 115771, "epoch": 2756} {"train_loss": -6.476809501647949, "global_step": 115772, "epoch": 2756} {"train_loss": -6.481116771697998, "global_step": 115773, "epoch": 2756} {"train_loss": -6.540720462799072, "global_step": 115774, "epoch": 2756} {"train_loss": -6.418645858764648, "global_step": 115775, "epoch": 2756} {"train_loss": -6.537693500518799, "global_step": 115776, "epoch": 2756} {"train_loss": -6.497715473175049, "global_step": 115777, "epoch": 2756} {"train_loss": -6.447909355163574, "global_step": 115778, "epoch": 2756} {"train_loss": -6.57484245300293, "global_step": 115779, "epoch": 2756} {"train_loss": -6.51490592956543, "global_step": 115780, "epoch": 2756} {"train_loss": -6.502181053161621, "global_step": 115781, "epoch": 2756} {"train_loss": -6.513002395629883, "global_step": 115782, "epoch": 2756} {"train_loss": -6.564953327178955, "global_step": 115783, "epoch": 2756} {"train_loss": -6.545463562011719, "global_step": 115784, "epoch": 2756} {"train_loss": -6.601189613342285, "global_step": 115785, "epoch": 2756} {"train_loss": -6.598165035247803, "global_step": 115786, "epoch": 2756} {"train_loss": -6.537480354309082, "global_step": 115787, "epoch": 2756} {"train_loss": -6.678752899169922, "global_step": 115788, "epoch": 2756} {"train_loss": -6.449328422546387, "global_step": 115789, "epoch": 2756} {"train_loss": -6.3466315269470215, "global_step": 115790, "epoch": 2756} {"train_loss": -6.366208553314209, "global_step": 115791, "epoch": 2756} {"train_loss": -6.532585144042969, "global_step": 115792, "epoch": 2756} {"train_loss": -6.504337390263875, "global_step": 115793, "epoch": 2756, "val_loss": 76716.3359375} {"train_loss": -6.657232284545898, "global_step": 115794, "epoch": 2757} {"train_loss": -6.50675106048584, "global_step": 115795, "epoch": 2757} {"train_loss": -6.546234130859375, "global_step": 115796, "epoch": 2757} {"train_loss": -6.462270736694336, "global_step": 115797, "epoch": 2757} {"train_loss": -6.470848083496094, "global_step": 115798, "epoch": 2757} {"train_loss": -6.59281063079834, "global_step": 115799, "epoch": 2757} {"train_loss": -6.4671711921691895, "global_step": 115800, "epoch": 2757} {"train_loss": -6.613121509552002, "global_step": 115801, "epoch": 2757} {"train_loss": -6.389448642730713, "global_step": 115802, "epoch": 2757} {"train_loss": -6.465091228485107, "global_step": 115803, "epoch": 2757} {"train_loss": -6.436917781829834, "global_step": 115804, "epoch": 2757} {"train_loss": -6.480845928192139, "global_step": 115805, "epoch": 2757} {"train_loss": -6.550246238708496, "global_step": 115806, "epoch": 2757} {"train_loss": -6.5251030921936035, "global_step": 115807, "epoch": 2757} {"train_loss": -6.457840442657471, "global_step": 115808, "epoch": 2757} {"train_loss": -6.556239128112793, "global_step": 115809, "epoch": 2757} {"train_loss": -6.511740684509277, "global_step": 115810, "epoch": 2757} {"train_loss": -6.485550880432129, "global_step": 115811, "epoch": 2757} {"train_loss": -6.551263809204102, "global_step": 115812, "epoch": 2757} {"train_loss": -6.586640357971191, "global_step": 115813, "epoch": 2757} {"train_loss": -6.55660343170166, "global_step": 115814, "epoch": 2757} {"train_loss": -6.476896286010742, "global_step": 115815, "epoch": 2757} {"train_loss": -6.409197807312012, "global_step": 115816, "epoch": 2757} {"train_loss": -6.623788833618164, "global_step": 115817, "epoch": 2757} {"train_loss": -6.44136905670166, "global_step": 115818, "epoch": 2757} {"train_loss": -6.529763698577881, "global_step": 115819, "epoch": 2757} {"train_loss": -6.37105655670166, "global_step": 115820, "epoch": 2757} {"train_loss": -6.574106216430664, "global_step": 115821, "epoch": 2757} {"train_loss": -6.48829460144043, "global_step": 115822, "epoch": 2757} {"train_loss": -6.449782371520996, "global_step": 115823, "epoch": 2757} {"train_loss": -6.661759376525879, "global_step": 115824, "epoch": 2757} {"train_loss": -6.4926862716674805, "global_step": 115825, "epoch": 2757} {"train_loss": -6.519224166870117, "global_step": 115826, "epoch": 2757} {"train_loss": -6.497115135192871, "global_step": 115827, "epoch": 2757} {"train_loss": -6.519220352172852, "global_step": 115828, "epoch": 2757} {"train_loss": -6.539868354797363, "global_step": 115829, "epoch": 2757} {"train_loss": -6.471044063568115, "global_step": 115830, "epoch": 2757} {"train_loss": -6.304901599884033, "global_step": 115831, "epoch": 2757} {"train_loss": -6.423593521118164, "global_step": 115832, "epoch": 2757} {"train_loss": -6.496706962585449, "global_step": 115833, "epoch": 2757} {"train_loss": -6.5802412033081055, "global_step": 115834, "epoch": 2757} {"train_loss": -6.502371231714885, "global_step": 115835, "epoch": 2757, "val_loss": 76898.96875} {"train_loss": -6.616415023803711, "global_step": 115836, "epoch": 2758} {"train_loss": -6.378907680511475, "global_step": 115837, "epoch": 2758} {"train_loss": -6.430453777313232, "global_step": 115838, "epoch": 2758} {"train_loss": -6.419062614440918, "global_step": 115839, "epoch": 2758} {"train_loss": -6.487536907196045, "global_step": 115840, "epoch": 2758} {"train_loss": -6.445879936218262, "global_step": 115841, "epoch": 2758} {"train_loss": -6.392621040344238, "global_step": 115842, "epoch": 2758} {"train_loss": -6.58070707321167, "global_step": 115843, "epoch": 2758} {"train_loss": -6.566763877868652, "global_step": 115844, "epoch": 2758} {"train_loss": -6.502621650695801, "global_step": 115845, "epoch": 2758} {"train_loss": -6.421740531921387, "global_step": 115846, "epoch": 2758} {"train_loss": -6.486263275146484, "global_step": 115847, "epoch": 2758} {"train_loss": -6.530879974365234, "global_step": 115848, "epoch": 2758} {"train_loss": -6.541955947875977, "global_step": 115849, "epoch": 2758} {"train_loss": -6.528929233551025, "global_step": 115850, "epoch": 2758} {"train_loss": -6.484912872314453, "global_step": 115851, "epoch": 2758} {"train_loss": -6.510313987731934, "global_step": 115852, "epoch": 2758} {"train_loss": -6.500363826751709, "global_step": 115853, "epoch": 2758} {"train_loss": -6.575164794921875, "global_step": 115854, "epoch": 2758} {"train_loss": -6.52616024017334, "global_step": 115855, "epoch": 2758} {"train_loss": -6.4578857421875, "global_step": 115856, "epoch": 2758} {"train_loss": -6.735254287719727, "global_step": 115857, "epoch": 2758} {"train_loss": -6.457613468170166, "global_step": 115858, "epoch": 2758} {"train_loss": -6.495369911193848, "global_step": 115859, "epoch": 2758} {"train_loss": -6.575565338134766, "global_step": 115860, "epoch": 2758} {"train_loss": -6.472580909729004, "global_step": 115861, "epoch": 2758} {"train_loss": -6.53481388092041, "global_step": 115862, "epoch": 2758} {"train_loss": -6.563138008117676, "global_step": 115863, "epoch": 2758} {"train_loss": -6.510746002197266, "global_step": 115864, "epoch": 2758} {"train_loss": -6.480185031890869, "global_step": 115865, "epoch": 2758} {"train_loss": -6.493419647216797, "global_step": 115866, "epoch": 2758} {"train_loss": -6.537456512451172, "global_step": 115867, "epoch": 2758} {"train_loss": -6.6667375564575195, "global_step": 115868, "epoch": 2758} {"train_loss": -6.607760429382324, "global_step": 115869, "epoch": 2758} {"train_loss": -6.503106594085693, "global_step": 115870, "epoch": 2758} {"train_loss": -6.510236740112305, "global_step": 115871, "epoch": 2758} {"train_loss": -6.603011131286621, "global_step": 115872, "epoch": 2758} {"train_loss": -6.576302528381348, "global_step": 115873, "epoch": 2758} {"train_loss": -6.59661865234375, "global_step": 115874, "epoch": 2758} {"train_loss": -6.669795989990234, "global_step": 115875, "epoch": 2758} {"train_loss": -6.4566264152526855, "global_step": 115876, "epoch": 2758} {"train_loss": -6.525410890579224, "global_step": 115877, "epoch": 2758, "val_loss": 76384.375} {"train_loss": -6.58003568649292, "global_step": 115878, "epoch": 2759} {"train_loss": -6.519448280334473, "global_step": 115879, "epoch": 2759} {"train_loss": -6.482063293457031, "global_step": 115880, "epoch": 2759} {"train_loss": -6.625288486480713, "global_step": 115881, "epoch": 2759} {"train_loss": -6.629279136657715, "global_step": 115882, "epoch": 2759} {"train_loss": -6.397215843200684, "global_step": 115883, "epoch": 2759} {"train_loss": -6.544653415679932, "global_step": 115884, "epoch": 2759} {"train_loss": -6.6072492599487305, "global_step": 115885, "epoch": 2759} {"train_loss": -6.489980697631836, "global_step": 115886, "epoch": 2759} {"train_loss": -6.575655937194824, "global_step": 115887, "epoch": 2759} {"train_loss": -6.646374702453613, "global_step": 115888, "epoch": 2759} {"train_loss": -6.466469764709473, "global_step": 115889, "epoch": 2759} {"train_loss": -6.640758991241455, "global_step": 115890, "epoch": 2759} {"train_loss": -6.5635552406311035, "global_step": 115891, "epoch": 2759} {"train_loss": -6.518159866333008, "global_step": 115892, "epoch": 2759} {"train_loss": -6.5952348709106445, "global_step": 115893, "epoch": 2759} {"train_loss": -6.590112686157227, "global_step": 115894, "epoch": 2759} {"train_loss": -6.455798149108887, "global_step": 115895, "epoch": 2759} {"train_loss": -6.389135837554932, "global_step": 115896, "epoch": 2759} {"train_loss": -6.517182350158691, "global_step": 115897, "epoch": 2759} {"train_loss": -6.610511302947998, "global_step": 115898, "epoch": 2759} {"train_loss": -6.423977851867676, "global_step": 115899, "epoch": 2759} {"train_loss": -6.605974197387695, "global_step": 115900, "epoch": 2759} {"train_loss": -6.43759822845459, "global_step": 115901, "epoch": 2759} {"train_loss": -6.530267715454102, "global_step": 115902, "epoch": 2759} {"train_loss": -6.45796012878418, "global_step": 115903, "epoch": 2759} {"train_loss": -6.549962997436523, "global_step": 115904, "epoch": 2759} {"train_loss": -6.608725547790527, "global_step": 115905, "epoch": 2759} {"train_loss": -6.498041152954102, "global_step": 115906, "epoch": 2759} {"train_loss": -6.552913188934326, "global_step": 115907, "epoch": 2759} {"train_loss": -6.5243120193481445, "global_step": 115908, "epoch": 2759} {"train_loss": -6.537405967712402, "global_step": 115909, "epoch": 2759} {"train_loss": -6.614620208740234, "global_step": 115910, "epoch": 2759} {"train_loss": -6.542304992675781, "global_step": 115911, "epoch": 2759} {"train_loss": -6.608445167541504, "global_step": 115912, "epoch": 2759} {"train_loss": -6.509599685668945, "global_step": 115913, "epoch": 2759} {"train_loss": -6.456110954284668, "global_step": 115914, "epoch": 2759} {"train_loss": -6.662649154663086, "global_step": 115915, "epoch": 2759} {"train_loss": -6.4630327224731445, "global_step": 115916, "epoch": 2759} {"train_loss": -6.430365085601807, "global_step": 115917, "epoch": 2759} {"train_loss": -6.487603187561035, "global_step": 115918, "epoch": 2759} {"train_loss": -6.534223272686913, "global_step": 115919, "epoch": 2759, "val_loss": 76830.6015625} {"train_loss": -6.507470607757568, "global_step": 115920, "epoch": 2760} {"train_loss": -6.551958084106445, "global_step": 115921, "epoch": 2760} {"train_loss": -6.403836250305176, "global_step": 115922, "epoch": 2760} {"train_loss": -6.5835371017456055, "global_step": 115923, "epoch": 2760} {"train_loss": -6.399739742279053, "global_step": 115924, "epoch": 2760} {"train_loss": -6.580530166625977, "global_step": 115925, "epoch": 2760} {"train_loss": -6.584854602813721, "global_step": 115926, "epoch": 2760} {"train_loss": -6.479663848876953, "global_step": 115927, "epoch": 2760} {"train_loss": -6.544098854064941, "global_step": 115928, "epoch": 2760} {"train_loss": -6.531628131866455, "global_step": 115929, "epoch": 2760} {"train_loss": -6.580843925476074, "global_step": 115930, "epoch": 2760} {"train_loss": -6.507251739501953, "global_step": 115931, "epoch": 2760} {"train_loss": -6.569787979125977, "global_step": 115932, "epoch": 2760} {"train_loss": -6.615794658660889, "global_step": 115933, "epoch": 2760} {"train_loss": -6.547306060791016, "global_step": 115934, "epoch": 2760} {"train_loss": -6.612318992614746, "global_step": 115935, "epoch": 2760} {"train_loss": -6.656767845153809, "global_step": 115936, "epoch": 2760} {"train_loss": -6.606992721557617, "global_step": 115937, "epoch": 2760} {"train_loss": -6.626886367797852, "global_step": 115938, "epoch": 2760} {"train_loss": -6.512476921081543, "global_step": 115939, "epoch": 2760} {"train_loss": -6.572661399841309, "global_step": 115940, "epoch": 2760} {"train_loss": -6.608227729797363, "global_step": 115941, "epoch": 2760} {"train_loss": -6.614562034606934, "global_step": 115942, "epoch": 2760} {"train_loss": -6.538991928100586, "global_step": 115943, "epoch": 2760} {"train_loss": -6.611130714416504, "global_step": 115944, "epoch": 2760} {"train_loss": -6.516210556030273, "global_step": 115945, "epoch": 2760} {"train_loss": -6.614538192749023, "global_step": 115946, "epoch": 2760} {"train_loss": -6.590940952301025, "global_step": 115947, "epoch": 2760} {"train_loss": -6.64277458190918, "global_step": 115948, "epoch": 2760} {"train_loss": -6.627380847930908, "global_step": 115949, "epoch": 2760} {"train_loss": -6.699612617492676, "global_step": 115950, "epoch": 2760} {"train_loss": -6.635309219360352, "global_step": 115951, "epoch": 2760} {"train_loss": -6.5860185623168945, "global_step": 115952, "epoch": 2760} {"train_loss": -6.512446403503418, "global_step": 115953, "epoch": 2760} {"train_loss": -6.568005561828613, "global_step": 115954, "epoch": 2760} {"train_loss": -6.453017234802246, "global_step": 115955, "epoch": 2760} {"train_loss": -6.433414459228516, "global_step": 115956, "epoch": 2760} {"train_loss": -6.637484550476074, "global_step": 115957, "epoch": 2760} {"train_loss": -6.62106466293335, "global_step": 115958, "epoch": 2760} {"train_loss": -6.468914031982422, "global_step": 115959, "epoch": 2760} {"train_loss": -6.62969446182251, "global_step": 115960, "epoch": 2760} {"train_loss": -6.564389592125302, "global_step": 115961, "epoch": 2760, "val_loss": 76634.078125} {"train_loss": -6.623416423797607, "global_step": 115962, "epoch": 2761} {"train_loss": -6.511466026306152, "global_step": 115963, "epoch": 2761} {"train_loss": -6.5824737548828125, "global_step": 115964, "epoch": 2761} {"train_loss": -6.6484832763671875, "global_step": 115965, "epoch": 2761} {"train_loss": -6.585231781005859, "global_step": 115966, "epoch": 2761} {"train_loss": -6.5709967613220215, "global_step": 115967, "epoch": 2761} {"train_loss": -6.503241062164307, "global_step": 115968, "epoch": 2761} {"train_loss": -6.477727890014648, "global_step": 115969, "epoch": 2761} {"train_loss": -6.599644660949707, "global_step": 115970, "epoch": 2761} {"train_loss": -6.54241943359375, "global_step": 115971, "epoch": 2761} {"train_loss": -6.375117301940918, "global_step": 115972, "epoch": 2761} {"train_loss": -6.577746391296387, "global_step": 115973, "epoch": 2761} {"train_loss": -6.490817546844482, "global_step": 115974, "epoch": 2761} {"train_loss": -6.481797218322754, "global_step": 115975, "epoch": 2761} {"train_loss": -6.563071250915527, "global_step": 115976, "epoch": 2761} {"train_loss": -6.530699729919434, "global_step": 115977, "epoch": 2761} {"train_loss": -6.4812188148498535, "global_step": 115978, "epoch": 2761} {"train_loss": -6.556118488311768, "global_step": 115979, "epoch": 2761} {"train_loss": -6.439990997314453, "global_step": 115980, "epoch": 2761} {"train_loss": -6.534834861755371, "global_step": 115981, "epoch": 2761} {"train_loss": -6.467129230499268, "global_step": 115982, "epoch": 2761} {"train_loss": -6.468102931976318, "global_step": 115983, "epoch": 2761} {"train_loss": -6.568568229675293, "global_step": 115984, "epoch": 2761} {"train_loss": -6.560274600982666, "global_step": 115985, "epoch": 2761} {"train_loss": -6.471173286437988, "global_step": 115986, "epoch": 2761} {"train_loss": -6.475013732910156, "global_step": 115987, "epoch": 2761} {"train_loss": -6.4758195877075195, "global_step": 115988, "epoch": 2761} {"train_loss": -6.548399925231934, "global_step": 115989, "epoch": 2761} {"train_loss": -6.422874450683594, "global_step": 115990, "epoch": 2761} {"train_loss": -6.501194000244141, "global_step": 115991, "epoch": 2761} {"train_loss": -6.623100757598877, "global_step": 115992, "epoch": 2761} {"train_loss": -6.527068138122559, "global_step": 115993, "epoch": 2761} {"train_loss": -6.480639457702637, "global_step": 115994, "epoch": 2761} {"train_loss": -6.476380825042725, "global_step": 115995, "epoch": 2761} {"train_loss": -6.487465858459473, "global_step": 115996, "epoch": 2761} {"train_loss": -6.640735149383545, "global_step": 115997, "epoch": 2761} {"train_loss": -6.556538105010986, "global_step": 115998, "epoch": 2761} {"train_loss": -6.520573616027832, "global_step": 115999, "epoch": 2761} {"train_loss": -6.537586212158203, "global_step": 116000, "epoch": 2761} {"train_loss": -6.501371383666992, "global_step": 116001, "epoch": 2761} {"train_loss": -6.4791998863220215, "global_step": 116002, "epoch": 2761} {"train_loss": -6.521834089642479, "global_step": 116003, "epoch": 2761, "val_loss": 76728.859375} {"train_loss": -6.525337219238281, "global_step": 116004, "epoch": 2762} {"train_loss": -6.385181427001953, "global_step": 116005, "epoch": 2762} {"train_loss": -6.641435623168945, "global_step": 116006, "epoch": 2762} {"train_loss": -6.562264919281006, "global_step": 116007, "epoch": 2762} {"train_loss": -6.53143835067749, "global_step": 116008, "epoch": 2762} {"train_loss": -6.498600959777832, "global_step": 116009, "epoch": 2762} {"train_loss": -6.542027473449707, "global_step": 116010, "epoch": 2762} {"train_loss": -6.523055076599121, "global_step": 116011, "epoch": 2762} {"train_loss": -6.5422868728637695, "global_step": 116012, "epoch": 2762} {"train_loss": -6.681741237640381, "global_step": 116013, "epoch": 2762} {"train_loss": -6.3337812423706055, "global_step": 116014, "epoch": 2762} {"train_loss": -6.550602436065674, "global_step": 116015, "epoch": 2762} {"train_loss": -6.596277713775635, "global_step": 116016, "epoch": 2762} {"train_loss": -6.395932197570801, "global_step": 116017, "epoch": 2762} {"train_loss": -6.472049713134766, "global_step": 116018, "epoch": 2762} {"train_loss": -6.475472927093506, "global_step": 116019, "epoch": 2762} {"train_loss": -6.5588459968566895, "global_step": 116020, "epoch": 2762} {"train_loss": -6.492542743682861, "global_step": 116021, "epoch": 2762} {"train_loss": -6.551675796508789, "global_step": 116022, "epoch": 2762} {"train_loss": -6.534144401550293, "global_step": 116023, "epoch": 2762} {"train_loss": -6.488005638122559, "global_step": 116024, "epoch": 2762} {"train_loss": -6.616515159606934, "global_step": 116025, "epoch": 2762} {"train_loss": -6.559485912322998, "global_step": 116026, "epoch": 2762} {"train_loss": -6.637999057769775, "global_step": 116027, "epoch": 2762} {"train_loss": -6.509451866149902, "global_step": 116028, "epoch": 2762} {"train_loss": -6.432985782623291, "global_step": 116029, "epoch": 2762} {"train_loss": -6.437836170196533, "global_step": 116030, "epoch": 2762} {"train_loss": -6.589107990264893, "global_step": 116031, "epoch": 2762} {"train_loss": -6.545490264892578, "global_step": 116032, "epoch": 2762} {"train_loss": -6.392348289489746, "global_step": 116033, "epoch": 2762} {"train_loss": -6.439634323120117, "global_step": 116034, "epoch": 2762} {"train_loss": -6.495021343231201, "global_step": 116035, "epoch": 2762} {"train_loss": -6.55466365814209, "global_step": 116036, "epoch": 2762} {"train_loss": -6.5178961753845215, "global_step": 116037, "epoch": 2762} {"train_loss": -6.500971794128418, "global_step": 116038, "epoch": 2762} {"train_loss": -6.455826759338379, "global_step": 116039, "epoch": 2762} {"train_loss": -6.471277236938477, "global_step": 116040, "epoch": 2762} {"train_loss": -6.470239639282227, "global_step": 116041, "epoch": 2762} {"train_loss": -6.567734718322754, "global_step": 116042, "epoch": 2762} {"train_loss": -6.511908531188965, "global_step": 116043, "epoch": 2762} {"train_loss": -6.477762699127197, "global_step": 116044, "epoch": 2762} {"train_loss": -6.517055170876639, "global_step": 116045, "epoch": 2762, "val_loss": 76448.515625} {"train_loss": -6.556305885314941, "global_step": 116046, "epoch": 2763} {"train_loss": -6.438813209533691, "global_step": 116047, "epoch": 2763} {"train_loss": -6.5015411376953125, "global_step": 116048, "epoch": 2763} {"train_loss": -6.570218086242676, "global_step": 116049, "epoch": 2763} {"train_loss": -6.510410308837891, "global_step": 116050, "epoch": 2763} {"train_loss": -6.593479156494141, "global_step": 116051, "epoch": 2763} {"train_loss": -6.566220760345459, "global_step": 116052, "epoch": 2763} {"train_loss": -6.53306770324707, "global_step": 116053, "epoch": 2763} {"train_loss": -6.471017837524414, "global_step": 116054, "epoch": 2763} {"train_loss": -6.645324230194092, "global_step": 116055, "epoch": 2763} {"train_loss": -6.493125915527344, "global_step": 116056, "epoch": 2763} {"train_loss": -6.443418025970459, "global_step": 116057, "epoch": 2763} {"train_loss": -6.521273612976074, "global_step": 116058, "epoch": 2763} {"train_loss": -6.5915422439575195, "global_step": 116059, "epoch": 2763} {"train_loss": -6.509756565093994, "global_step": 116060, "epoch": 2763} {"train_loss": -6.502527713775635, "global_step": 116061, "epoch": 2763} {"train_loss": -6.477777481079102, "global_step": 116062, "epoch": 2763} {"train_loss": -6.480450630187988, "global_step": 116063, "epoch": 2763} {"train_loss": -6.453660488128662, "global_step": 116064, "epoch": 2763} {"train_loss": -6.5275068283081055, "global_step": 116065, "epoch": 2763} {"train_loss": -6.429224967956543, "global_step": 116066, "epoch": 2763} {"train_loss": -6.555935382843018, "global_step": 116067, "epoch": 2763} {"train_loss": -6.429876804351807, "global_step": 116068, "epoch": 2763} {"train_loss": -6.471852779388428, "global_step": 116069, "epoch": 2763} {"train_loss": -6.504138946533203, "global_step": 116070, "epoch": 2763} {"train_loss": -6.28610372543335, "global_step": 116071, "epoch": 2763} {"train_loss": -6.4262189865112305, "global_step": 116072, "epoch": 2763} {"train_loss": -6.495848655700684, "global_step": 116073, "epoch": 2763} {"train_loss": -6.3854169845581055, "global_step": 116074, "epoch": 2763} {"train_loss": -6.478939533233643, "global_step": 116075, "epoch": 2763} {"train_loss": -6.438483238220215, "global_step": 116076, "epoch": 2763} {"train_loss": -6.510922431945801, "global_step": 116077, "epoch": 2763} {"train_loss": -6.448219299316406, "global_step": 116078, "epoch": 2763} {"train_loss": -6.609652996063232, "global_step": 116079, "epoch": 2763} {"train_loss": -6.489078521728516, "global_step": 116080, "epoch": 2763} {"train_loss": -6.572210311889648, "global_step": 116081, "epoch": 2763} {"train_loss": -6.457566261291504, "global_step": 116082, "epoch": 2763} {"train_loss": -6.354682445526123, "global_step": 116083, "epoch": 2763} {"train_loss": -6.583942413330078, "global_step": 116084, "epoch": 2763} {"train_loss": -6.407746315002441, "global_step": 116085, "epoch": 2763} {"train_loss": -6.441497802734375, "global_step": 116086, "epoch": 2763} {"train_loss": -6.489998249780564, "global_step": 116087, "epoch": 2763, "val_loss": 76611.875} {"train_loss": -6.579257965087891, "global_step": 116088, "epoch": 2764} {"train_loss": -6.503983497619629, "global_step": 116089, "epoch": 2764} {"train_loss": -6.425143241882324, "global_step": 116090, "epoch": 2764} {"train_loss": -6.5848517417907715, "global_step": 116091, "epoch": 2764} {"train_loss": -6.6252336502075195, "global_step": 116092, "epoch": 2764} {"train_loss": -6.509776592254639, "global_step": 116093, "epoch": 2764} {"train_loss": -6.530984401702881, "global_step": 116094, "epoch": 2764} {"train_loss": -6.4982781410217285, "global_step": 116095, "epoch": 2764} {"train_loss": -6.672154426574707, "global_step": 116096, "epoch": 2764} {"train_loss": -6.5084614753723145, "global_step": 116097, "epoch": 2764} {"train_loss": -6.475125789642334, "global_step": 116098, "epoch": 2764} {"train_loss": -6.363783836364746, "global_step": 116099, "epoch": 2764} {"train_loss": -6.517436981201172, "global_step": 116100, "epoch": 2764} {"train_loss": -6.37119197845459, "global_step": 116101, "epoch": 2764} {"train_loss": -6.477581024169922, "global_step": 116102, "epoch": 2764} {"train_loss": -6.506293296813965, "global_step": 116103, "epoch": 2764} {"train_loss": -6.415213584899902, "global_step": 116104, "epoch": 2764} {"train_loss": -6.412581443786621, "global_step": 116105, "epoch": 2764} {"train_loss": -6.589648246765137, "global_step": 116106, "epoch": 2764} {"train_loss": -6.375701904296875, "global_step": 116107, "epoch": 2764} {"train_loss": -6.521737098693848, "global_step": 116108, "epoch": 2764} {"train_loss": -6.474911689758301, "global_step": 116109, "epoch": 2764} {"train_loss": -6.4792160987854, "global_step": 116110, "epoch": 2764} {"train_loss": -6.464487552642822, "global_step": 116111, "epoch": 2764} {"train_loss": -6.380917072296143, "global_step": 116112, "epoch": 2764} {"train_loss": -6.4810590744018555, "global_step": 116113, "epoch": 2764} {"train_loss": -6.427721977233887, "global_step": 116114, "epoch": 2764} {"train_loss": -6.4747772216796875, "global_step": 116115, "epoch": 2764} {"train_loss": -6.447340965270996, "global_step": 116116, "epoch": 2764} {"train_loss": -6.494309425354004, "global_step": 116117, "epoch": 2764} {"train_loss": -6.569496154785156, "global_step": 116118, "epoch": 2764} {"train_loss": -6.526394844055176, "global_step": 116119, "epoch": 2764} {"train_loss": -6.522088527679443, "global_step": 116120, "epoch": 2764} {"train_loss": -6.423418045043945, "global_step": 116121, "epoch": 2764} {"train_loss": -6.487524032592773, "global_step": 116122, "epoch": 2764} {"train_loss": -6.596135139465332, "global_step": 116123, "epoch": 2764} {"train_loss": -6.506141185760498, "global_step": 116124, "epoch": 2764} {"train_loss": -6.593392372131348, "global_step": 116125, "epoch": 2764} {"train_loss": -6.362178802490234, "global_step": 116126, "epoch": 2764} {"train_loss": -6.567185401916504, "global_step": 116127, "epoch": 2764} {"train_loss": -6.591876983642578, "global_step": 116128, "epoch": 2764} {"train_loss": -6.499525058837164, "global_step": 116129, "epoch": 2764, "val_loss": 76545.875} {"train_loss": -6.56314754486084, "global_step": 116130, "epoch": 2765} {"train_loss": -6.572693824768066, "global_step": 116131, "epoch": 2765} {"train_loss": -6.515773773193359, "global_step": 116132, "epoch": 2765} {"train_loss": -6.622567176818848, "global_step": 116133, "epoch": 2765} {"train_loss": -6.512744903564453, "global_step": 116134, "epoch": 2765} {"train_loss": -6.597229957580566, "global_step": 116135, "epoch": 2765} {"train_loss": -6.5259222984313965, "global_step": 116136, "epoch": 2765} {"train_loss": -6.470304489135742, "global_step": 116137, "epoch": 2765} {"train_loss": -6.553123474121094, "global_step": 116138, "epoch": 2765} {"train_loss": -6.605526924133301, "global_step": 116139, "epoch": 2765} {"train_loss": -6.482122421264648, "global_step": 116140, "epoch": 2765} {"train_loss": -6.471344470977783, "global_step": 116141, "epoch": 2765} {"train_loss": -6.545623302459717, "global_step": 116142, "epoch": 2765} {"train_loss": -6.549493789672852, "global_step": 116143, "epoch": 2765} {"train_loss": -6.490767478942871, "global_step": 116144, "epoch": 2765} {"train_loss": -6.551400184631348, "global_step": 116145, "epoch": 2765} {"train_loss": -6.570443630218506, "global_step": 116146, "epoch": 2765} {"train_loss": -6.4642839431762695, "global_step": 116147, "epoch": 2765} {"train_loss": -6.567866325378418, "global_step": 116148, "epoch": 2765} {"train_loss": -6.622332572937012, "global_step": 116149, "epoch": 2765} {"train_loss": -6.547969818115234, "global_step": 116150, "epoch": 2765} {"train_loss": -6.633397102355957, "global_step": 116151, "epoch": 2765} {"train_loss": -6.476949214935303, "global_step": 116152, "epoch": 2765} {"train_loss": -6.508307456970215, "global_step": 116153, "epoch": 2765} {"train_loss": -6.495305061340332, "global_step": 116154, "epoch": 2765} {"train_loss": -6.441399574279785, "global_step": 116155, "epoch": 2765} {"train_loss": -6.578187942504883, "global_step": 116156, "epoch": 2765} {"train_loss": -6.509539604187012, "global_step": 116157, "epoch": 2765} {"train_loss": -6.502405643463135, "global_step": 116158, "epoch": 2765} {"train_loss": -6.503138065338135, "global_step": 116159, "epoch": 2765} {"train_loss": -6.48228645324707, "global_step": 116160, "epoch": 2765} {"train_loss": -6.479968547821045, "global_step": 116161, "epoch": 2765} {"train_loss": -6.578986644744873, "global_step": 116162, "epoch": 2765} {"train_loss": -6.615659236907959, "global_step": 116163, "epoch": 2765} {"train_loss": -6.528017044067383, "global_step": 116164, "epoch": 2765} {"train_loss": -6.546891689300537, "global_step": 116165, "epoch": 2765} {"train_loss": -6.547914505004883, "global_step": 116166, "epoch": 2765} {"train_loss": -6.581928730010986, "global_step": 116167, "epoch": 2765} {"train_loss": -6.587395668029785, "global_step": 116168, "epoch": 2765} {"train_loss": -6.550253391265869, "global_step": 116169, "epoch": 2765} {"train_loss": -6.594995975494385, "global_step": 116170, "epoch": 2765} {"train_loss": -6.540171418871198, "global_step": 116171, "epoch": 2765, "val_loss": 76575.625} {"train_loss": -6.590256690979004, "global_step": 116172, "epoch": 2766} {"train_loss": -6.56428337097168, "global_step": 116173, "epoch": 2766} {"train_loss": -6.610683441162109, "global_step": 116174, "epoch": 2766} {"train_loss": -6.534404754638672, "global_step": 116175, "epoch": 2766} {"train_loss": -6.471729755401611, "global_step": 116176, "epoch": 2766} {"train_loss": -6.512423515319824, "global_step": 116177, "epoch": 2766} {"train_loss": -6.624100685119629, "global_step": 116178, "epoch": 2766} {"train_loss": -6.332855701446533, "global_step": 116179, "epoch": 2766} {"train_loss": -6.59929084777832, "global_step": 116180, "epoch": 2766} {"train_loss": -6.48603630065918, "global_step": 116181, "epoch": 2766} {"train_loss": -6.484927654266357, "global_step": 116182, "epoch": 2766} {"train_loss": -6.514865875244141, "global_step": 116183, "epoch": 2766} {"train_loss": -6.495417594909668, "global_step": 116184, "epoch": 2766} {"train_loss": -6.474071502685547, "global_step": 116185, "epoch": 2766} {"train_loss": -6.409562587738037, "global_step": 116186, "epoch": 2766} {"train_loss": -6.483640670776367, "global_step": 116187, "epoch": 2766} {"train_loss": -6.425683498382568, "global_step": 116188, "epoch": 2766} {"train_loss": -6.459744453430176, "global_step": 116189, "epoch": 2766} {"train_loss": -6.34665584564209, "global_step": 116190, "epoch": 2766} {"train_loss": -6.506031036376953, "global_step": 116191, "epoch": 2766} {"train_loss": -6.443791389465332, "global_step": 116192, "epoch": 2766} {"train_loss": -6.385538101196289, "global_step": 116193, "epoch": 2766} {"train_loss": -6.588319778442383, "global_step": 116194, "epoch": 2766} {"train_loss": -6.452296257019043, "global_step": 116195, "epoch": 2766} {"train_loss": -6.449801445007324, "global_step": 116196, "epoch": 2766} {"train_loss": -6.576091766357422, "global_step": 116197, "epoch": 2766} {"train_loss": -6.403628349304199, "global_step": 116198, "epoch": 2766} {"train_loss": -6.560738563537598, "global_step": 116199, "epoch": 2766} {"train_loss": -6.452361583709717, "global_step": 116200, "epoch": 2766} {"train_loss": -6.436481475830078, "global_step": 116201, "epoch": 2766} {"train_loss": -6.532106876373291, "global_step": 116202, "epoch": 2766} {"train_loss": -6.46533203125, "global_step": 116203, "epoch": 2766} {"train_loss": -6.426505088806152, "global_step": 116204, "epoch": 2766} {"train_loss": -6.361313819885254, "global_step": 116205, "epoch": 2766} {"train_loss": -6.592802047729492, "global_step": 116206, "epoch": 2766} {"train_loss": -6.419353485107422, "global_step": 116207, "epoch": 2766} {"train_loss": -6.567453384399414, "global_step": 116208, "epoch": 2766} {"train_loss": -6.527665138244629, "global_step": 116209, "epoch": 2766} {"train_loss": -6.552535057067871, "global_step": 116210, "epoch": 2766} {"train_loss": -6.606312274932861, "global_step": 116211, "epoch": 2766} {"train_loss": -6.456951141357422, "global_step": 116212, "epoch": 2766} {"train_loss": -6.492398477735973, "global_step": 116213, "epoch": 2766, "val_loss": 76599.5390625} {"train_loss": -6.536745071411133, "global_step": 116214, "epoch": 2767} {"train_loss": -6.527920722961426, "global_step": 116215, "epoch": 2767} {"train_loss": -6.699180603027344, "global_step": 116216, "epoch": 2767} {"train_loss": -6.654019832611084, "global_step": 116217, "epoch": 2767} {"train_loss": -6.584223747253418, "global_step": 116218, "epoch": 2767} {"train_loss": -6.608880996704102, "global_step": 116219, "epoch": 2767} {"train_loss": -6.590118408203125, "global_step": 116220, "epoch": 2767} {"train_loss": -6.579333305358887, "global_step": 116221, "epoch": 2767} {"train_loss": -6.655583381652832, "global_step": 116222, "epoch": 2767} {"train_loss": -6.54929256439209, "global_step": 116223, "epoch": 2767} {"train_loss": -6.606505393981934, "global_step": 116224, "epoch": 2767} {"train_loss": -6.565042495727539, "global_step": 116225, "epoch": 2767} {"train_loss": -6.543965816497803, "global_step": 116226, "epoch": 2767} {"train_loss": -6.463842391967773, "global_step": 116227, "epoch": 2767} {"train_loss": -6.561429023742676, "global_step": 116228, "epoch": 2767} {"train_loss": -6.583953857421875, "global_step": 116229, "epoch": 2767} {"train_loss": -6.536877155303955, "global_step": 116230, "epoch": 2767} {"train_loss": -6.556195259094238, "global_step": 116231, "epoch": 2767} {"train_loss": -6.500876426696777, "global_step": 116232, "epoch": 2767} {"train_loss": -6.485208034515381, "global_step": 116233, "epoch": 2767} {"train_loss": -6.506235122680664, "global_step": 116234, "epoch": 2767} {"train_loss": -6.537636756896973, "global_step": 116235, "epoch": 2767} {"train_loss": -6.452136516571045, "global_step": 116236, "epoch": 2767} {"train_loss": -6.496350288391113, "global_step": 116237, "epoch": 2767} {"train_loss": -6.439889907836914, "global_step": 116238, "epoch": 2767} {"train_loss": -6.448872089385986, "global_step": 116239, "epoch": 2767} {"train_loss": -6.576885223388672, "global_step": 116240, "epoch": 2767} {"train_loss": -6.422313690185547, "global_step": 116241, "epoch": 2767} {"train_loss": -6.518684387207031, "global_step": 116242, "epoch": 2767} {"train_loss": -6.72078800201416, "global_step": 116243, "epoch": 2767} {"train_loss": -6.533407211303711, "global_step": 116244, "epoch": 2767} {"train_loss": -6.541607856750488, "global_step": 116245, "epoch": 2767} {"train_loss": -6.589350700378418, "global_step": 116246, "epoch": 2767} {"train_loss": -6.5687665939331055, "global_step": 116247, "epoch": 2767} {"train_loss": -6.609385967254639, "global_step": 116248, "epoch": 2767} {"train_loss": -6.612891674041748, "global_step": 116249, "epoch": 2767} {"train_loss": -6.6016998291015625, "global_step": 116250, "epoch": 2767} {"train_loss": -6.462565898895264, "global_step": 116251, "epoch": 2767} {"train_loss": -6.542387962341309, "global_step": 116252, "epoch": 2767} {"train_loss": -6.593625545501709, "global_step": 116253, "epoch": 2767} {"train_loss": -6.587278366088867, "global_step": 116254, "epoch": 2767} {"train_loss": -6.555940253393991, "global_step": 116255, "epoch": 2767, "val_loss": 76403.515625} {"train_loss": -6.605608940124512, "global_step": 116256, "epoch": 2768} {"train_loss": -6.542083740234375, "global_step": 116257, "epoch": 2768} {"train_loss": -6.555444717407227, "global_step": 116258, "epoch": 2768} {"train_loss": -6.573198318481445, "global_step": 116259, "epoch": 2768} {"train_loss": -6.588201999664307, "global_step": 116260, "epoch": 2768} {"train_loss": -6.599316596984863, "global_step": 116261, "epoch": 2768} {"train_loss": -6.446660041809082, "global_step": 116262, "epoch": 2768} {"train_loss": -6.496813774108887, "global_step": 116263, "epoch": 2768} {"train_loss": -6.483029842376709, "global_step": 116264, "epoch": 2768} {"train_loss": -6.64288330078125, "global_step": 116265, "epoch": 2768} {"train_loss": -6.562322616577148, "global_step": 116266, "epoch": 2768} {"train_loss": -6.662200450897217, "global_step": 116267, "epoch": 2768} {"train_loss": -6.4814653396606445, "global_step": 116268, "epoch": 2768} {"train_loss": -6.520084381103516, "global_step": 116269, "epoch": 2768} {"train_loss": -6.509984016418457, "global_step": 116270, "epoch": 2768} {"train_loss": -6.534637451171875, "global_step": 116271, "epoch": 2768} {"train_loss": -6.487457752227783, "global_step": 116272, "epoch": 2768} {"train_loss": -6.594194412231445, "global_step": 116273, "epoch": 2768} {"train_loss": -6.655959606170654, "global_step": 116274, "epoch": 2768} {"train_loss": -6.614538192749023, "global_step": 116275, "epoch": 2768} {"train_loss": -6.52191162109375, "global_step": 116276, "epoch": 2768} {"train_loss": -6.479700088500977, "global_step": 116277, "epoch": 2768} {"train_loss": -6.432827949523926, "global_step": 116278, "epoch": 2768} {"train_loss": -6.576376438140869, "global_step": 116279, "epoch": 2768} {"train_loss": -6.637167930603027, "global_step": 116280, "epoch": 2768} {"train_loss": -6.505242824554443, "global_step": 116281, "epoch": 2768} {"train_loss": -6.444110870361328, "global_step": 116282, "epoch": 2768} {"train_loss": -6.667181015014648, "global_step": 116283, "epoch": 2768} {"train_loss": -6.598252773284912, "global_step": 116284, "epoch": 2768} {"train_loss": -6.488926887512207, "global_step": 116285, "epoch": 2768} {"train_loss": -6.547487258911133, "global_step": 116286, "epoch": 2768} {"train_loss": -6.480045318603516, "global_step": 116287, "epoch": 2768} {"train_loss": -6.651426315307617, "global_step": 116288, "epoch": 2768} {"train_loss": -6.399955749511719, "global_step": 116289, "epoch": 2768} {"train_loss": -6.424982070922852, "global_step": 116290, "epoch": 2768} {"train_loss": -6.6036577224731445, "global_step": 116291, "epoch": 2768} {"train_loss": -6.418741703033447, "global_step": 116292, "epoch": 2768} {"train_loss": -6.691555023193359, "global_step": 116293, "epoch": 2768} {"train_loss": -6.506041526794434, "global_step": 116294, "epoch": 2768} {"train_loss": -6.429893493652344, "global_step": 116295, "epoch": 2768} {"train_loss": -6.549236297607422, "global_step": 116296, "epoch": 2768} {"train_loss": -6.540317626226516, "global_step": 116297, "epoch": 2768, "val_loss": 76812.328125} {"train_loss": -6.423255920410156, "global_step": 116298, "epoch": 2769} {"train_loss": -6.5092926025390625, "global_step": 116299, "epoch": 2769} {"train_loss": -6.529933929443359, "global_step": 116300, "epoch": 2769} {"train_loss": -6.584606170654297, "global_step": 116301, "epoch": 2769} {"train_loss": -6.662693023681641, "global_step": 116302, "epoch": 2769} {"train_loss": -6.566934585571289, "global_step": 116303, "epoch": 2769} {"train_loss": -6.541025161743164, "global_step": 116304, "epoch": 2769} {"train_loss": -6.6033220291137695, "global_step": 116305, "epoch": 2769} {"train_loss": -6.562509059906006, "global_step": 116306, "epoch": 2769} {"train_loss": -6.524704456329346, "global_step": 116307, "epoch": 2769} {"train_loss": -6.502418041229248, "global_step": 116308, "epoch": 2769} {"train_loss": -6.659106254577637, "global_step": 116309, "epoch": 2769} {"train_loss": -6.561252593994141, "global_step": 116310, "epoch": 2769} {"train_loss": -6.572922229766846, "global_step": 116311, "epoch": 2769} {"train_loss": -6.460446834564209, "global_step": 116312, "epoch": 2769} {"train_loss": -6.600494384765625, "global_step": 116313, "epoch": 2769} {"train_loss": -6.654045104980469, "global_step": 116314, "epoch": 2769} {"train_loss": -6.508408546447754, "global_step": 116315, "epoch": 2769} {"train_loss": -6.515252113342285, "global_step": 116316, "epoch": 2769} {"train_loss": -6.450697898864746, "global_step": 116317, "epoch": 2769} {"train_loss": -6.625378608703613, "global_step": 116318, "epoch": 2769} {"train_loss": -6.544834613800049, "global_step": 116319, "epoch": 2769} {"train_loss": -6.493449687957764, "global_step": 116320, "epoch": 2769} {"train_loss": -6.4269585609436035, "global_step": 116321, "epoch": 2769} {"train_loss": -6.518589973449707, "global_step": 116322, "epoch": 2769} {"train_loss": -6.543414115905762, "global_step": 116323, "epoch": 2769} {"train_loss": -6.574508190155029, "global_step": 116324, "epoch": 2769} {"train_loss": -6.505837440490723, "global_step": 116325, "epoch": 2769} {"train_loss": -6.469990253448486, "global_step": 116326, "epoch": 2769} {"train_loss": -6.469950199127197, "global_step": 116327, "epoch": 2769} {"train_loss": -6.443795680999756, "global_step": 116328, "epoch": 2769} {"train_loss": -6.576192855834961, "global_step": 116329, "epoch": 2769} {"train_loss": -6.4739227294921875, "global_step": 116330, "epoch": 2769} {"train_loss": -6.544137001037598, "global_step": 116331, "epoch": 2769} {"train_loss": -6.474126815795898, "global_step": 116332, "epoch": 2769} {"train_loss": -6.624333381652832, "global_step": 116333, "epoch": 2769} {"train_loss": -6.465765953063965, "global_step": 116334, "epoch": 2769} {"train_loss": -6.477009296417236, "global_step": 116335, "epoch": 2769} {"train_loss": -6.422371864318848, "global_step": 116336, "epoch": 2769} {"train_loss": -6.525750160217285, "global_step": 116337, "epoch": 2769} {"train_loss": -6.5446977615356445, "global_step": 116338, "epoch": 2769} {"train_loss": -6.530188708078294, "global_step": 116339, "epoch": 2769, "val_loss": 76615.2421875} {"train_loss": -6.5191545486450195, "global_step": 116340, "epoch": 2770} {"train_loss": -6.515795707702637, "global_step": 116341, "epoch": 2770} {"train_loss": -6.522283554077148, "global_step": 116342, "epoch": 2770} {"train_loss": -6.431602954864502, "global_step": 116343, "epoch": 2770} {"train_loss": -6.575352191925049, "global_step": 116344, "epoch": 2770} {"train_loss": -6.617629051208496, "global_step": 116345, "epoch": 2770} {"train_loss": -6.476161956787109, "global_step": 116346, "epoch": 2770} {"train_loss": -6.448998928070068, "global_step": 116347, "epoch": 2770} {"train_loss": -6.3787946701049805, "global_step": 116348, "epoch": 2770} {"train_loss": -6.478887557983398, "global_step": 116349, "epoch": 2770} {"train_loss": -6.4557294845581055, "global_step": 116350, "epoch": 2770} {"train_loss": -6.4950761795043945, "global_step": 116351, "epoch": 2770} {"train_loss": -6.432949066162109, "global_step": 116352, "epoch": 2770} {"train_loss": -6.543922424316406, "global_step": 116353, "epoch": 2770} {"train_loss": -6.526113033294678, "global_step": 116354, "epoch": 2770} {"train_loss": -6.428420066833496, "global_step": 116355, "epoch": 2770} {"train_loss": -6.643076419830322, "global_step": 116356, "epoch": 2770} {"train_loss": -6.370070457458496, "global_step": 116357, "epoch": 2770} {"train_loss": -6.497392654418945, "global_step": 116358, "epoch": 2770} {"train_loss": -6.522765159606934, "global_step": 116359, "epoch": 2770} {"train_loss": -6.473012924194336, "global_step": 116360, "epoch": 2770} {"train_loss": -6.416075706481934, "global_step": 116361, "epoch": 2770} {"train_loss": -6.530055999755859, "global_step": 116362, "epoch": 2770} {"train_loss": -6.457884788513184, "global_step": 116363, "epoch": 2770} {"train_loss": -6.442051887512207, "global_step": 116364, "epoch": 2770} {"train_loss": -6.504116058349609, "global_step": 116365, "epoch": 2770} {"train_loss": -6.3376641273498535, "global_step": 116366, "epoch": 2770} {"train_loss": -6.532220840454102, "global_step": 116367, "epoch": 2770} {"train_loss": -6.353499412536621, "global_step": 116368, "epoch": 2770} {"train_loss": -6.357561111450195, "global_step": 116369, "epoch": 2770} {"train_loss": -6.510157585144043, "global_step": 116370, "epoch": 2770} {"train_loss": -6.371035575866699, "global_step": 116371, "epoch": 2770} {"train_loss": -6.402320861816406, "global_step": 116372, "epoch": 2770} {"train_loss": -6.483246803283691, "global_step": 116373, "epoch": 2770} {"train_loss": -6.517379283905029, "global_step": 116374, "epoch": 2770} {"train_loss": -6.417151927947998, "global_step": 116375, "epoch": 2770} {"train_loss": -6.435670375823975, "global_step": 116376, "epoch": 2770} {"train_loss": -6.557470321655273, "global_step": 116377, "epoch": 2770} {"train_loss": -6.464129447937012, "global_step": 116378, "epoch": 2770} {"train_loss": -6.605576992034912, "global_step": 116379, "epoch": 2770} {"train_loss": -6.514420509338379, "global_step": 116380, "epoch": 2770} {"train_loss": -6.477096625736782, "global_step": 116381, "epoch": 2770, "val_loss": 76676.15625} {"train_loss": -6.586405277252197, "global_step": 116382, "epoch": 2771} {"train_loss": -6.446793556213379, "global_step": 116383, "epoch": 2771} {"train_loss": -6.6197004318237305, "global_step": 116384, "epoch": 2771} {"train_loss": -6.484658241271973, "global_step": 116385, "epoch": 2771} {"train_loss": -6.512548923492432, "global_step": 116386, "epoch": 2771} {"train_loss": -6.543712139129639, "global_step": 116387, "epoch": 2771} {"train_loss": -6.53911828994751, "global_step": 116388, "epoch": 2771} {"train_loss": -6.543150901794434, "global_step": 116389, "epoch": 2771} {"train_loss": -6.566590785980225, "global_step": 116390, "epoch": 2771} {"train_loss": -6.5264458656311035, "global_step": 116391, "epoch": 2771} {"train_loss": -6.471120357513428, "global_step": 116392, "epoch": 2771} {"train_loss": -6.632563591003418, "global_step": 116393, "epoch": 2771} {"train_loss": -6.585022926330566, "global_step": 116394, "epoch": 2771} {"train_loss": -6.63267183303833, "global_step": 116395, "epoch": 2771} {"train_loss": -6.525033950805664, "global_step": 116396, "epoch": 2771} {"train_loss": -6.488916397094727, "global_step": 116397, "epoch": 2771} {"train_loss": -6.549805641174316, "global_step": 116398, "epoch": 2771} {"train_loss": -6.584263324737549, "global_step": 116399, "epoch": 2771} {"train_loss": -6.502640724182129, "global_step": 116400, "epoch": 2771} {"train_loss": -6.464475631713867, "global_step": 116401, "epoch": 2771} {"train_loss": -6.504725456237793, "global_step": 116402, "epoch": 2771} {"train_loss": -6.636736869812012, "global_step": 116403, "epoch": 2771} {"train_loss": -6.364701271057129, "global_step": 116404, "epoch": 2771} {"train_loss": -6.437229156494141, "global_step": 116405, "epoch": 2771} {"train_loss": -6.522243022918701, "global_step": 116406, "epoch": 2771} {"train_loss": -6.395096778869629, "global_step": 116407, "epoch": 2771} {"train_loss": -6.556201934814453, "global_step": 116408, "epoch": 2771} {"train_loss": -6.4275054931640625, "global_step": 116409, "epoch": 2771} {"train_loss": -6.446377277374268, "global_step": 116410, "epoch": 2771} {"train_loss": -6.600813865661621, "global_step": 116411, "epoch": 2771} {"train_loss": -6.514829158782959, "global_step": 116412, "epoch": 2771} {"train_loss": -6.501948356628418, "global_step": 116413, "epoch": 2771} {"train_loss": -6.452502250671387, "global_step": 116414, "epoch": 2771} {"train_loss": -6.512297630310059, "global_step": 116415, "epoch": 2771} {"train_loss": -6.47873592376709, "global_step": 116416, "epoch": 2771} {"train_loss": -6.389159202575684, "global_step": 116417, "epoch": 2771} {"train_loss": -6.468555450439453, "global_step": 116418, "epoch": 2771} {"train_loss": -6.425055503845215, "global_step": 116419, "epoch": 2771} {"train_loss": -6.525163650512695, "global_step": 116420, "epoch": 2771} {"train_loss": -6.375302314758301, "global_step": 116421, "epoch": 2771} {"train_loss": -6.521029472351074, "global_step": 116422, "epoch": 2771} {"train_loss": -6.506634893871489, "global_step": 116423, "epoch": 2771, "val_loss": 77116.390625} {"train_loss": -6.350048065185547, "global_step": 116424, "epoch": 2772} {"train_loss": -6.408426284790039, "global_step": 116425, "epoch": 2772} {"train_loss": -6.287685394287109, "global_step": 116426, "epoch": 2772} {"train_loss": -6.433119773864746, "global_step": 116427, "epoch": 2772} {"train_loss": -6.374479293823242, "global_step": 116428, "epoch": 2772} {"train_loss": -6.640715599060059, "global_step": 116429, "epoch": 2772} {"train_loss": -6.328631401062012, "global_step": 116430, "epoch": 2772} {"train_loss": -6.559276580810547, "global_step": 116431, "epoch": 2772} {"train_loss": -6.372201919555664, "global_step": 116432, "epoch": 2772} {"train_loss": -6.508669853210449, "global_step": 116433, "epoch": 2772} {"train_loss": -6.463564872741699, "global_step": 116434, "epoch": 2772} {"train_loss": -6.528565406799316, "global_step": 116435, "epoch": 2772} {"train_loss": -6.457553386688232, "global_step": 116436, "epoch": 2772} {"train_loss": -6.449550628662109, "global_step": 116437, "epoch": 2772} {"train_loss": -6.380130767822266, "global_step": 116438, "epoch": 2772} {"train_loss": -6.458526611328125, "global_step": 116439, "epoch": 2772} {"train_loss": -6.423081398010254, "global_step": 116440, "epoch": 2772} {"train_loss": -6.453442573547363, "global_step": 116441, "epoch": 2772} {"train_loss": -6.435600280761719, "global_step": 116442, "epoch": 2772} {"train_loss": -6.416645526885986, "global_step": 116443, "epoch": 2772} {"train_loss": -6.601508140563965, "global_step": 116444, "epoch": 2772} {"train_loss": -6.599488258361816, "global_step": 116445, "epoch": 2772} {"train_loss": -6.439918518066406, "global_step": 116446, "epoch": 2772} {"train_loss": -6.588133811950684, "global_step": 116447, "epoch": 2772} {"train_loss": -6.487512588500977, "global_step": 116448, "epoch": 2772} {"train_loss": -6.529763221740723, "global_step": 116449, "epoch": 2772} {"train_loss": -6.506342887878418, "global_step": 116450, "epoch": 2772} {"train_loss": -6.471529006958008, "global_step": 116451, "epoch": 2772} {"train_loss": -6.444311141967773, "global_step": 116452, "epoch": 2772} {"train_loss": -6.5392584800720215, "global_step": 116453, "epoch": 2772} {"train_loss": -6.517287254333496, "global_step": 116454, "epoch": 2772} {"train_loss": -6.460677146911621, "global_step": 116455, "epoch": 2772} {"train_loss": -6.600438594818115, "global_step": 116456, "epoch": 2772} {"train_loss": -6.595619201660156, "global_step": 116457, "epoch": 2772} {"train_loss": -6.499716758728027, "global_step": 116458, "epoch": 2772} {"train_loss": -6.6618242263793945, "global_step": 116459, "epoch": 2772} {"train_loss": -6.425276756286621, "global_step": 116460, "epoch": 2772} {"train_loss": -6.5980682373046875, "global_step": 116461, "epoch": 2772} {"train_loss": -6.548891067504883, "global_step": 116462, "epoch": 2772} {"train_loss": -6.497579574584961, "global_step": 116463, "epoch": 2772} {"train_loss": -6.555550575256348, "global_step": 116464, "epoch": 2772} {"train_loss": -6.484576111748105, "global_step": 116465, "epoch": 2772, "val_loss": 76731.5625} {"train_loss": -6.568060874938965, "global_step": 116466, "epoch": 2773} {"train_loss": -6.593369960784912, "global_step": 116467, "epoch": 2773} {"train_loss": -6.420320987701416, "global_step": 116468, "epoch": 2773} {"train_loss": -6.596874237060547, "global_step": 116469, "epoch": 2773} {"train_loss": -6.587724685668945, "global_step": 116470, "epoch": 2773} {"train_loss": -6.559170722961426, "global_step": 116471, "epoch": 2773} {"train_loss": -6.490640163421631, "global_step": 116472, "epoch": 2773} {"train_loss": -6.701279640197754, "global_step": 116473, "epoch": 2773} {"train_loss": -6.4987406730651855, "global_step": 116474, "epoch": 2773} {"train_loss": -6.4793829917907715, "global_step": 116475, "epoch": 2773} {"train_loss": -6.518729209899902, "global_step": 116476, "epoch": 2773} {"train_loss": -6.568464756011963, "global_step": 116477, "epoch": 2773} {"train_loss": -6.507411956787109, "global_step": 116478, "epoch": 2773} {"train_loss": -6.488739967346191, "global_step": 116479, "epoch": 2773} {"train_loss": -6.591264724731445, "global_step": 116480, "epoch": 2773} {"train_loss": -6.542450904846191, "global_step": 116481, "epoch": 2773} {"train_loss": -6.460788726806641, "global_step": 116482, "epoch": 2773} {"train_loss": -6.499497890472412, "global_step": 116483, "epoch": 2773} {"train_loss": -6.593961715698242, "global_step": 116484, "epoch": 2773} {"train_loss": -6.480481147766113, "global_step": 116485, "epoch": 2773} {"train_loss": -6.534383773803711, "global_step": 116486, "epoch": 2773} {"train_loss": -6.544839859008789, "global_step": 116487, "epoch": 2773} {"train_loss": -6.520012378692627, "global_step": 116488, "epoch": 2773} {"train_loss": -6.689087867736816, "global_step": 116489, "epoch": 2773} {"train_loss": -6.570944786071777, "global_step": 116490, "epoch": 2773} {"train_loss": -6.533452033996582, "global_step": 116491, "epoch": 2773} {"train_loss": -6.556596755981445, "global_step": 116492, "epoch": 2773} {"train_loss": -6.55573844909668, "global_step": 116493, "epoch": 2773} {"train_loss": -6.355348587036133, "global_step": 116494, "epoch": 2773} {"train_loss": -6.474032402038574, "global_step": 116495, "epoch": 2773} {"train_loss": -6.480376243591309, "global_step": 116496, "epoch": 2773} {"train_loss": -6.362210273742676, "global_step": 116497, "epoch": 2773} {"train_loss": -6.534984588623047, "global_step": 116498, "epoch": 2773} {"train_loss": -6.571029186248779, "global_step": 116499, "epoch": 2773} {"train_loss": -6.51412296295166, "global_step": 116500, "epoch": 2773} {"train_loss": -6.507987976074219, "global_step": 116501, "epoch": 2773} {"train_loss": -6.449090003967285, "global_step": 116502, "epoch": 2773} {"train_loss": -6.479442596435547, "global_step": 116503, "epoch": 2773} {"train_loss": -6.524382591247559, "global_step": 116504, "epoch": 2773} {"train_loss": -6.516396522521973, "global_step": 116505, "epoch": 2773} {"train_loss": -6.410690784454346, "global_step": 116506, "epoch": 2773} {"train_loss": -6.522318771907261, "global_step": 116507, "epoch": 2773, "val_loss": 76610.71875} {"train_loss": -6.603488922119141, "global_step": 116508, "epoch": 2774} {"train_loss": -6.571268081665039, "global_step": 116509, "epoch": 2774} {"train_loss": -6.448860168457031, "global_step": 116510, "epoch": 2774} {"train_loss": -6.585138320922852, "global_step": 116511, "epoch": 2774} {"train_loss": -6.561912536621094, "global_step": 116512, "epoch": 2774} {"train_loss": -6.537708759307861, "global_step": 116513, "epoch": 2774} {"train_loss": -6.453580856323242, "global_step": 116514, "epoch": 2774} {"train_loss": -6.546026229858398, "global_step": 116515, "epoch": 2774} {"train_loss": -6.500140190124512, "global_step": 116516, "epoch": 2774} {"train_loss": -6.49715518951416, "global_step": 116517, "epoch": 2774} {"train_loss": -6.4643754959106445, "global_step": 116518, "epoch": 2774} {"train_loss": -6.421401023864746, "global_step": 116519, "epoch": 2774} {"train_loss": -6.558627128601074, "global_step": 116520, "epoch": 2774} {"train_loss": -6.33974552154541, "global_step": 116521, "epoch": 2774} {"train_loss": -6.476405620574951, "global_step": 116522, "epoch": 2774} {"train_loss": -6.559515476226807, "global_step": 116523, "epoch": 2774} {"train_loss": -6.447624683380127, "global_step": 116524, "epoch": 2774} {"train_loss": -6.459840774536133, "global_step": 116525, "epoch": 2774} {"train_loss": -6.556179046630859, "global_step": 116526, "epoch": 2774} {"train_loss": -6.463511943817139, "global_step": 116527, "epoch": 2774} {"train_loss": -6.439355850219727, "global_step": 116528, "epoch": 2774} {"train_loss": -6.510493278503418, "global_step": 116529, "epoch": 2774} {"train_loss": -6.479170799255371, "global_step": 116530, "epoch": 2774} {"train_loss": -6.464122772216797, "global_step": 116531, "epoch": 2774} {"train_loss": -6.457451820373535, "global_step": 116532, "epoch": 2774} {"train_loss": -6.594788074493408, "global_step": 116533, "epoch": 2774} {"train_loss": -6.567030906677246, "global_step": 116534, "epoch": 2774} {"train_loss": -6.487325668334961, "global_step": 116535, "epoch": 2774} {"train_loss": -6.435469627380371, "global_step": 116536, "epoch": 2774} {"train_loss": -6.503700256347656, "global_step": 116537, "epoch": 2774} {"train_loss": -6.3911237716674805, "global_step": 116538, "epoch": 2774} {"train_loss": -6.522638320922852, "global_step": 116539, "epoch": 2774} {"train_loss": -6.5461106300354, "global_step": 116540, "epoch": 2774} {"train_loss": -6.495243549346924, "global_step": 116541, "epoch": 2774} {"train_loss": -6.527436256408691, "global_step": 116542, "epoch": 2774} {"train_loss": -6.536747932434082, "global_step": 116543, "epoch": 2774} {"train_loss": -6.585472106933594, "global_step": 116544, "epoch": 2774} {"train_loss": -6.469764709472656, "global_step": 116545, "epoch": 2774} {"train_loss": -6.509127140045166, "global_step": 116546, "epoch": 2774} {"train_loss": -6.665532112121582, "global_step": 116547, "epoch": 2774} {"train_loss": -6.500475883483887, "global_step": 116548, "epoch": 2774} {"train_loss": -6.505753312792097, "global_step": 116549, "epoch": 2774, "val_loss": 76765.6875} {"train_loss": -6.546009540557861, "global_step": 116550, "epoch": 2775} {"train_loss": -6.4929585456848145, "global_step": 116551, "epoch": 2775} {"train_loss": -6.57725191116333, "global_step": 116552, "epoch": 2775} {"train_loss": -6.500507831573486, "global_step": 116553, "epoch": 2775} {"train_loss": -6.440775394439697, "global_step": 116554, "epoch": 2775} {"train_loss": -6.50407600402832, "global_step": 116555, "epoch": 2775} {"train_loss": -6.552955627441406, "global_step": 116556, "epoch": 2775} {"train_loss": -6.500425338745117, "global_step": 116557, "epoch": 2775} {"train_loss": -6.597295761108398, "global_step": 116558, "epoch": 2775} {"train_loss": -6.509608268737793, "global_step": 116559, "epoch": 2775} {"train_loss": -6.60274600982666, "global_step": 116560, "epoch": 2775} {"train_loss": -6.46842098236084, "global_step": 116561, "epoch": 2775} {"train_loss": -6.421158313751221, "global_step": 116562, "epoch": 2775} {"train_loss": -6.5620222091674805, "global_step": 116563, "epoch": 2775} {"train_loss": -6.480302810668945, "global_step": 116564, "epoch": 2775} {"train_loss": -6.477275848388672, "global_step": 116565, "epoch": 2775} {"train_loss": -6.558634281158447, "global_step": 116566, "epoch": 2775} {"train_loss": -6.500662803649902, "global_step": 116567, "epoch": 2775} {"train_loss": -6.461417198181152, "global_step": 116568, "epoch": 2775} {"train_loss": -6.469396591186523, "global_step": 116569, "epoch": 2775} {"train_loss": -6.653602600097656, "global_step": 116570, "epoch": 2775} {"train_loss": -6.564817428588867, "global_step": 116571, "epoch": 2775} {"train_loss": -6.494935035705566, "global_step": 116572, "epoch": 2775} {"train_loss": -6.552581310272217, "global_step": 116573, "epoch": 2775} {"train_loss": -6.474773406982422, "global_step": 116574, "epoch": 2775} {"train_loss": -6.530701637268066, "global_step": 116575, "epoch": 2775} {"train_loss": -6.592796802520752, "global_step": 116576, "epoch": 2775} {"train_loss": -6.624539375305176, "global_step": 116577, "epoch": 2775} {"train_loss": -6.543468952178955, "global_step": 116578, "epoch": 2775} {"train_loss": -6.516607284545898, "global_step": 116579, "epoch": 2775} {"train_loss": -6.536112308502197, "global_step": 116580, "epoch": 2775} {"train_loss": -6.537592887878418, "global_step": 116581, "epoch": 2775} {"train_loss": -6.615438461303711, "global_step": 116582, "epoch": 2775} {"train_loss": -6.568811893463135, "global_step": 116583, "epoch": 2775} {"train_loss": -6.436645984649658, "global_step": 116584, "epoch": 2775} {"train_loss": -6.440090179443359, "global_step": 116585, "epoch": 2775} {"train_loss": -6.46283483505249, "global_step": 116586, "epoch": 2775} {"train_loss": -6.4785614013671875, "global_step": 116587, "epoch": 2775} {"train_loss": -6.514693737030029, "global_step": 116588, "epoch": 2775} {"train_loss": -6.403411865234375, "global_step": 116589, "epoch": 2775} {"train_loss": -6.522002220153809, "global_step": 116590, "epoch": 2775} {"train_loss": -6.515746616181874, "global_step": 116591, "epoch": 2775, "val_loss": 76802.109375} {"train_loss": -6.618223190307617, "global_step": 116592, "epoch": 2776} {"train_loss": -6.4770002365112305, "global_step": 116593, "epoch": 2776} {"train_loss": -6.441030025482178, "global_step": 116594, "epoch": 2776} {"train_loss": -6.467270851135254, "global_step": 116595, "epoch": 2776} {"train_loss": -6.589241981506348, "global_step": 116596, "epoch": 2776} {"train_loss": -6.526398658752441, "global_step": 116597, "epoch": 2776} {"train_loss": -6.582902908325195, "global_step": 116598, "epoch": 2776} {"train_loss": -6.547308921813965, "global_step": 116599, "epoch": 2776} {"train_loss": -6.462092399597168, "global_step": 116600, "epoch": 2776} {"train_loss": -6.563571929931641, "global_step": 116601, "epoch": 2776} {"train_loss": -6.6199727058410645, "global_step": 116602, "epoch": 2776} {"train_loss": -6.604536533355713, "global_step": 116603, "epoch": 2776} {"train_loss": -6.582453727722168, "global_step": 116604, "epoch": 2776} {"train_loss": -6.650763988494873, "global_step": 116605, "epoch": 2776} {"train_loss": -6.486964225769043, "global_step": 116606, "epoch": 2776} {"train_loss": -6.480483531951904, "global_step": 116607, "epoch": 2776} {"train_loss": -6.509895324707031, "global_step": 116608, "epoch": 2776} {"train_loss": -6.476576805114746, "global_step": 116609, "epoch": 2776} {"train_loss": -6.4061598777771, "global_step": 116610, "epoch": 2776} {"train_loss": -6.493350028991699, "global_step": 116611, "epoch": 2776} {"train_loss": -6.397530555725098, "global_step": 116612, "epoch": 2776} {"train_loss": -6.569846153259277, "global_step": 116613, "epoch": 2776} {"train_loss": -6.480247497558594, "global_step": 116614, "epoch": 2776} {"train_loss": -6.503196716308594, "global_step": 116615, "epoch": 2776} {"train_loss": -6.602650165557861, "global_step": 116616, "epoch": 2776} {"train_loss": -6.423303604125977, "global_step": 116617, "epoch": 2776} {"train_loss": -6.496856212615967, "global_step": 116618, "epoch": 2776} {"train_loss": -6.599545478820801, "global_step": 116619, "epoch": 2776} {"train_loss": -6.576690196990967, "global_step": 116620, "epoch": 2776} {"train_loss": -6.492091178894043, "global_step": 116621, "epoch": 2776} {"train_loss": -6.512655258178711, "global_step": 116622, "epoch": 2776} {"train_loss": -6.499499797821045, "global_step": 116623, "epoch": 2776} {"train_loss": -6.49975061416626, "global_step": 116624, "epoch": 2776} {"train_loss": -6.47744083404541, "global_step": 116625, "epoch": 2776} {"train_loss": -6.5192365646362305, "global_step": 116626, "epoch": 2776} {"train_loss": -6.591701507568359, "global_step": 116627, "epoch": 2776} {"train_loss": -6.528478622436523, "global_step": 116628, "epoch": 2776} {"train_loss": -6.609285354614258, "global_step": 116629, "epoch": 2776} {"train_loss": -6.552631855010986, "global_step": 116630, "epoch": 2776} {"train_loss": -6.440530776977539, "global_step": 116631, "epoch": 2776} {"train_loss": -6.508933067321777, "global_step": 116632, "epoch": 2776} {"train_loss": -6.520780710946946, "global_step": 116633, "epoch": 2776, "val_loss": 76482.828125} {"train_loss": -6.623610496520996, "global_step": 116634, "epoch": 2777} {"train_loss": -6.575075149536133, "global_step": 116635, "epoch": 2777} {"train_loss": -6.349221229553223, "global_step": 116636, "epoch": 2777} {"train_loss": -6.57120418548584, "global_step": 116637, "epoch": 2777} {"train_loss": -6.555375099182129, "global_step": 116638, "epoch": 2777} {"train_loss": -6.485235214233398, "global_step": 116639, "epoch": 2777} {"train_loss": -6.549506664276123, "global_step": 116640, "epoch": 2777} {"train_loss": -6.437361240386963, "global_step": 116641, "epoch": 2777} {"train_loss": -6.5007405281066895, "global_step": 116642, "epoch": 2777} {"train_loss": -6.577343940734863, "global_step": 116643, "epoch": 2777} {"train_loss": -6.5184221267700195, "global_step": 116644, "epoch": 2777} {"train_loss": -6.541181564331055, "global_step": 116645, "epoch": 2777} {"train_loss": -6.5297088623046875, "global_step": 116646, "epoch": 2777} {"train_loss": -6.479913234710693, "global_step": 116647, "epoch": 2777} {"train_loss": -6.446015357971191, "global_step": 116648, "epoch": 2777} {"train_loss": -6.664543628692627, "global_step": 116649, "epoch": 2777} {"train_loss": -6.676179885864258, "global_step": 116650, "epoch": 2777} {"train_loss": -6.636518478393555, "global_step": 116651, "epoch": 2777} {"train_loss": -6.533669471740723, "global_step": 116652, "epoch": 2777} {"train_loss": -6.589774131774902, "global_step": 116653, "epoch": 2777} {"train_loss": -6.527004241943359, "global_step": 116654, "epoch": 2777} {"train_loss": -6.540010929107666, "global_step": 116655, "epoch": 2777} {"train_loss": -6.595362663269043, "global_step": 116656, "epoch": 2777} {"train_loss": -6.5708417892456055, "global_step": 116657, "epoch": 2777} {"train_loss": -6.603498935699463, "global_step": 116658, "epoch": 2777} {"train_loss": -6.633322238922119, "global_step": 116659, "epoch": 2777} {"train_loss": -6.621285915374756, "global_step": 116660, "epoch": 2777} {"train_loss": -6.60441780090332, "global_step": 116661, "epoch": 2777} {"train_loss": -6.547622203826904, "global_step": 116662, "epoch": 2777} {"train_loss": -6.413175582885742, "global_step": 116663, "epoch": 2777} {"train_loss": -6.553144454956055, "global_step": 116664, "epoch": 2777} {"train_loss": -6.539834499359131, "global_step": 116665, "epoch": 2777} {"train_loss": -6.579231262207031, "global_step": 116666, "epoch": 2777} {"train_loss": -6.646999359130859, "global_step": 116667, "epoch": 2777} {"train_loss": -6.525629043579102, "global_step": 116668, "epoch": 2777} {"train_loss": -6.539952278137207, "global_step": 116669, "epoch": 2777} {"train_loss": -6.377496719360352, "global_step": 116670, "epoch": 2777} {"train_loss": -6.455539703369141, "global_step": 116671, "epoch": 2777} {"train_loss": -6.569303512573242, "global_step": 116672, "epoch": 2777} {"train_loss": -6.521520137786865, "global_step": 116673, "epoch": 2777} {"train_loss": -6.633671760559082, "global_step": 116674, "epoch": 2777} {"train_loss": -6.542222965331304, "global_step": 116675, "epoch": 2777, "val_loss": 76673.7734375} {"train_loss": -6.472102165222168, "global_step": 116676, "epoch": 2778} {"train_loss": -6.469069480895996, "global_step": 116677, "epoch": 2778} {"train_loss": -6.474937438964844, "global_step": 116678, "epoch": 2778} {"train_loss": -6.545515060424805, "global_step": 116679, "epoch": 2778} {"train_loss": -6.57727575302124, "global_step": 116680, "epoch": 2778} {"train_loss": -6.525015830993652, "global_step": 116681, "epoch": 2778} {"train_loss": -6.585467338562012, "global_step": 116682, "epoch": 2778} {"train_loss": -6.5072021484375, "global_step": 116683, "epoch": 2778} {"train_loss": -6.452400207519531, "global_step": 116684, "epoch": 2778} {"train_loss": -6.605743408203125, "global_step": 116685, "epoch": 2778} {"train_loss": -6.4533281326293945, "global_step": 116686, "epoch": 2778} {"train_loss": -6.569856643676758, "global_step": 116687, "epoch": 2778} {"train_loss": -6.593715667724609, "global_step": 116688, "epoch": 2778} {"train_loss": -6.562786102294922, "global_step": 116689, "epoch": 2778} {"train_loss": -6.5475311279296875, "global_step": 116690, "epoch": 2778} {"train_loss": -6.5379252433776855, "global_step": 116691, "epoch": 2778} {"train_loss": -6.539167404174805, "global_step": 116692, "epoch": 2778} {"train_loss": -6.564812183380127, "global_step": 116693, "epoch": 2778} {"train_loss": -6.549775123596191, "global_step": 116694, "epoch": 2778} {"train_loss": -6.574116230010986, "global_step": 116695, "epoch": 2778} {"train_loss": -6.4975080490112305, "global_step": 116696, "epoch": 2778} {"train_loss": -6.608882904052734, "global_step": 116697, "epoch": 2778} {"train_loss": -6.521546363830566, "global_step": 116698, "epoch": 2778} {"train_loss": -6.640476226806641, "global_step": 116699, "epoch": 2778} {"train_loss": -6.49156379699707, "global_step": 116700, "epoch": 2778} {"train_loss": -6.637409210205078, "global_step": 116701, "epoch": 2778} {"train_loss": -6.550172328948975, "global_step": 116702, "epoch": 2778} {"train_loss": -6.34574556350708, "global_step": 116703, "epoch": 2778} {"train_loss": -6.551618576049805, "global_step": 116704, "epoch": 2778} {"train_loss": -6.59886360168457, "global_step": 116705, "epoch": 2778} {"train_loss": -6.4780988693237305, "global_step": 116706, "epoch": 2778} {"train_loss": -6.538985252380371, "global_step": 116707, "epoch": 2778} {"train_loss": -6.440826416015625, "global_step": 116708, "epoch": 2778} {"train_loss": -6.545548439025879, "global_step": 116709, "epoch": 2778} {"train_loss": -6.698951721191406, "global_step": 116710, "epoch": 2778} {"train_loss": -6.510265350341797, "global_step": 116711, "epoch": 2778} {"train_loss": -6.545231342315674, "global_step": 116712, "epoch": 2778} {"train_loss": -6.551348686218262, "global_step": 116713, "epoch": 2778} {"train_loss": -6.4893798828125, "global_step": 116714, "epoch": 2778} {"train_loss": -6.385270595550537, "global_step": 116715, "epoch": 2778} {"train_loss": -6.484143257141113, "global_step": 116716, "epoch": 2778} {"train_loss": -6.530967689695812, "global_step": 116717, "epoch": 2778, "val_loss": 76612.4375} {"train_loss": -6.543280124664307, "global_step": 116718, "epoch": 2779} {"train_loss": -6.633339881896973, "global_step": 116719, "epoch": 2779} {"train_loss": -6.499129772186279, "global_step": 116720, "epoch": 2779} {"train_loss": -6.629216194152832, "global_step": 116721, "epoch": 2779} {"train_loss": -6.464902877807617, "global_step": 116722, "epoch": 2779} {"train_loss": -6.515582084655762, "global_step": 116723, "epoch": 2779} {"train_loss": -6.563405990600586, "global_step": 116724, "epoch": 2779} {"train_loss": -6.589573860168457, "global_step": 116725, "epoch": 2779} {"train_loss": -6.546807289123535, "global_step": 116726, "epoch": 2779} {"train_loss": -6.534596920013428, "global_step": 116727, "epoch": 2779} {"train_loss": -6.42490291595459, "global_step": 116728, "epoch": 2779} {"train_loss": -6.507833480834961, "global_step": 116729, "epoch": 2779} {"train_loss": -6.389132022857666, "global_step": 116730, "epoch": 2779} {"train_loss": -6.55584716796875, "global_step": 116731, "epoch": 2779} {"train_loss": -6.594015121459961, "global_step": 116732, "epoch": 2779} {"train_loss": -6.4750823974609375, "global_step": 116733, "epoch": 2779} {"train_loss": -6.495035648345947, "global_step": 116734, "epoch": 2779} {"train_loss": -6.548664569854736, "global_step": 116735, "epoch": 2779} {"train_loss": -6.457854270935059, "global_step": 116736, "epoch": 2779} {"train_loss": -6.617825508117676, "global_step": 116737, "epoch": 2779} {"train_loss": -6.44003963470459, "global_step": 116738, "epoch": 2779} {"train_loss": -6.482957363128662, "global_step": 116739, "epoch": 2779} {"train_loss": -6.492891311645508, "global_step": 116740, "epoch": 2779} {"train_loss": -6.548490524291992, "global_step": 116741, "epoch": 2779} {"train_loss": -6.623913764953613, "global_step": 116742, "epoch": 2779} {"train_loss": -6.577339172363281, "global_step": 116743, "epoch": 2779} {"train_loss": -6.533405303955078, "global_step": 116744, "epoch": 2779} {"train_loss": -6.4332685470581055, "global_step": 116745, "epoch": 2779} {"train_loss": -6.527141571044922, "global_step": 116746, "epoch": 2779} {"train_loss": -6.488727569580078, "global_step": 116747, "epoch": 2779} {"train_loss": -6.522970199584961, "global_step": 116748, "epoch": 2779} {"train_loss": -6.491789817810059, "global_step": 116749, "epoch": 2779} {"train_loss": -6.4954752922058105, "global_step": 116750, "epoch": 2779} {"train_loss": -6.530447006225586, "global_step": 116751, "epoch": 2779} {"train_loss": -6.523471355438232, "global_step": 116752, "epoch": 2779} {"train_loss": -6.522071838378906, "global_step": 116753, "epoch": 2779} {"train_loss": -6.5201826095581055, "global_step": 116754, "epoch": 2779} {"train_loss": -6.531989574432373, "global_step": 116755, "epoch": 2779} {"train_loss": -6.449768543243408, "global_step": 116756, "epoch": 2779} {"train_loss": -6.432123184204102, "global_step": 116757, "epoch": 2779} {"train_loss": -6.495841026306152, "global_step": 116758, "epoch": 2779} {"train_loss": -6.517251843497867, "global_step": 116759, "epoch": 2779, "val_loss": 76384.875} {"train_loss": -6.618739128112793, "global_step": 116760, "epoch": 2780} {"train_loss": -6.51259708404541, "global_step": 116761, "epoch": 2780} {"train_loss": -6.464071273803711, "global_step": 116762, "epoch": 2780} {"train_loss": -6.450726509094238, "global_step": 116763, "epoch": 2780} {"train_loss": -6.651949882507324, "global_step": 116764, "epoch": 2780} {"train_loss": -6.545967102050781, "global_step": 116765, "epoch": 2780} {"train_loss": -6.550766944885254, "global_step": 116766, "epoch": 2780} {"train_loss": -6.586613655090332, "global_step": 116767, "epoch": 2780} {"train_loss": -6.564675331115723, "global_step": 116768, "epoch": 2780} {"train_loss": -6.60468864440918, "global_step": 116769, "epoch": 2780} {"train_loss": -6.50717830657959, "global_step": 116770, "epoch": 2780} {"train_loss": -6.4527177810668945, "global_step": 116771, "epoch": 2780} {"train_loss": -6.539649963378906, "global_step": 116772, "epoch": 2780} {"train_loss": -6.540850639343262, "global_step": 116773, "epoch": 2780} {"train_loss": -6.6082916259765625, "global_step": 116774, "epoch": 2780} {"train_loss": -6.5238494873046875, "global_step": 116775, "epoch": 2780} {"train_loss": -6.5345611572265625, "global_step": 116776, "epoch": 2780} {"train_loss": -6.510727882385254, "global_step": 116777, "epoch": 2780} {"train_loss": -6.635139465332031, "global_step": 116778, "epoch": 2780} {"train_loss": -6.410820484161377, "global_step": 116779, "epoch": 2780} {"train_loss": -6.468669891357422, "global_step": 116780, "epoch": 2780} {"train_loss": -6.529645919799805, "global_step": 116781, "epoch": 2780} {"train_loss": -6.549995422363281, "global_step": 116782, "epoch": 2780} {"train_loss": -6.591704368591309, "global_step": 116783, "epoch": 2780} {"train_loss": -6.52680778503418, "global_step": 116784, "epoch": 2780} {"train_loss": -6.467611312866211, "global_step": 116785, "epoch": 2780} {"train_loss": -6.513801574707031, "global_step": 116786, "epoch": 2780} {"train_loss": -6.480534553527832, "global_step": 116787, "epoch": 2780} {"train_loss": -6.4738240242004395, "global_step": 116788, "epoch": 2780} {"train_loss": -6.607922554016113, "global_step": 116789, "epoch": 2780} {"train_loss": -6.486934661865234, "global_step": 116790, "epoch": 2780} {"train_loss": -6.623658180236816, "global_step": 116791, "epoch": 2780} {"train_loss": -6.516397476196289, "global_step": 116792, "epoch": 2780} {"train_loss": -6.582649230957031, "global_step": 116793, "epoch": 2780} {"train_loss": -6.692877292633057, "global_step": 116794, "epoch": 2780} {"train_loss": -6.520273208618164, "global_step": 116795, "epoch": 2780} {"train_loss": -6.581794738769531, "global_step": 116796, "epoch": 2780} {"train_loss": -6.519012451171875, "global_step": 116797, "epoch": 2780} {"train_loss": -6.5588884353637695, "global_step": 116798, "epoch": 2780} {"train_loss": -6.565582275390625, "global_step": 116799, "epoch": 2780} {"train_loss": -6.6108551025390625, "global_step": 116800, "epoch": 2780} {"train_loss": -6.542845714659918, "global_step": 116801, "epoch": 2780, "val_loss": 76536.859375} {"train_loss": -6.656916618347168, "global_step": 116802, "epoch": 2781} {"train_loss": -6.479515075683594, "global_step": 116803, "epoch": 2781} {"train_loss": -6.66379976272583, "global_step": 116804, "epoch": 2781} {"train_loss": -6.529049396514893, "global_step": 116805, "epoch": 2781} {"train_loss": -6.61792516708374, "global_step": 116806, "epoch": 2781} {"train_loss": -6.592885971069336, "global_step": 116807, "epoch": 2781} {"train_loss": -6.649489402770996, "global_step": 116808, "epoch": 2781} {"train_loss": -6.516625881195068, "global_step": 116809, "epoch": 2781} {"train_loss": -6.542160987854004, "global_step": 116810, "epoch": 2781} {"train_loss": -6.536344528198242, "global_step": 116811, "epoch": 2781} {"train_loss": -6.488577842712402, "global_step": 116812, "epoch": 2781} {"train_loss": -6.528884410858154, "global_step": 116813, "epoch": 2781} {"train_loss": -6.5031538009643555, "global_step": 116814, "epoch": 2781} {"train_loss": -6.5064215660095215, "global_step": 116815, "epoch": 2781} {"train_loss": -6.594727993011475, "global_step": 116816, "epoch": 2781} {"train_loss": -6.419310569763184, "global_step": 116817, "epoch": 2781} {"train_loss": -6.508101463317871, "global_step": 116818, "epoch": 2781} {"train_loss": -6.5873026847839355, "global_step": 116819, "epoch": 2781} {"train_loss": -6.525993347167969, "global_step": 116820, "epoch": 2781} {"train_loss": -6.507896423339844, "global_step": 116821, "epoch": 2781} {"train_loss": -6.458386421203613, "global_step": 116822, "epoch": 2781} {"train_loss": -6.513251304626465, "global_step": 116823, "epoch": 2781} {"train_loss": -6.5615034103393555, "global_step": 116824, "epoch": 2781} {"train_loss": -6.647679805755615, "global_step": 116825, "epoch": 2781} {"train_loss": -6.519039154052734, "global_step": 116826, "epoch": 2781} {"train_loss": -6.556356430053711, "global_step": 116827, "epoch": 2781} {"train_loss": -6.44207763671875, "global_step": 116828, "epoch": 2781} {"train_loss": -6.545866012573242, "global_step": 116829, "epoch": 2781} {"train_loss": -6.507964134216309, "global_step": 116830, "epoch": 2781} {"train_loss": -6.582651138305664, "global_step": 116831, "epoch": 2781} {"train_loss": -6.515578746795654, "global_step": 116832, "epoch": 2781} {"train_loss": -6.507559776306152, "global_step": 116833, "epoch": 2781} {"train_loss": -6.54384708404541, "global_step": 116834, "epoch": 2781} {"train_loss": -6.483503341674805, "global_step": 116835, "epoch": 2781} {"train_loss": -6.604843616485596, "global_step": 116836, "epoch": 2781} {"train_loss": -6.468901634216309, "global_step": 116837, "epoch": 2781} {"train_loss": -6.5692243576049805, "global_step": 116838, "epoch": 2781} {"train_loss": -6.534008026123047, "global_step": 116839, "epoch": 2781} {"train_loss": -6.397911071777344, "global_step": 116840, "epoch": 2781} {"train_loss": -6.4861741065979, "global_step": 116841, "epoch": 2781} {"train_loss": -6.4115705490112305, "global_step": 116842, "epoch": 2781} {"train_loss": -6.531195299965995, "global_step": 116843, "epoch": 2781, "val_loss": 76483.359375} {"train_loss": -6.534759521484375, "global_step": 116844, "epoch": 2782} {"train_loss": -6.540279388427734, "global_step": 116845, "epoch": 2782} {"train_loss": -6.5101094245910645, "global_step": 116846, "epoch": 2782} {"train_loss": -6.596263885498047, "global_step": 116847, "epoch": 2782} {"train_loss": -6.579108238220215, "global_step": 116848, "epoch": 2782} {"train_loss": -6.585142135620117, "global_step": 116849, "epoch": 2782} {"train_loss": -6.525155067443848, "global_step": 116850, "epoch": 2782} {"train_loss": -6.424080848693848, "global_step": 116851, "epoch": 2782} {"train_loss": -6.512503623962402, "global_step": 116852, "epoch": 2782} {"train_loss": -6.361390113830566, "global_step": 116853, "epoch": 2782} {"train_loss": -6.393937110900879, "global_step": 116854, "epoch": 2782} {"train_loss": -6.453999042510986, "global_step": 116855, "epoch": 2782} {"train_loss": -6.501278877258301, "global_step": 116856, "epoch": 2782} {"train_loss": -6.395444869995117, "global_step": 116857, "epoch": 2782} {"train_loss": -6.4381208419799805, "global_step": 116858, "epoch": 2782} {"train_loss": -6.429597854614258, "global_step": 116859, "epoch": 2782} {"train_loss": -6.482888221740723, "global_step": 116860, "epoch": 2782} {"train_loss": -6.626128196716309, "global_step": 116861, "epoch": 2782} {"train_loss": -6.514922142028809, "global_step": 116862, "epoch": 2782} {"train_loss": -6.524123191833496, "global_step": 116863, "epoch": 2782} {"train_loss": -6.360598564147949, "global_step": 116864, "epoch": 2782} {"train_loss": -6.464441776275635, "global_step": 116865, "epoch": 2782} {"train_loss": -6.408145904541016, "global_step": 116866, "epoch": 2782} {"train_loss": -6.556713581085205, "global_step": 116867, "epoch": 2782} {"train_loss": -6.538891315460205, "global_step": 116868, "epoch": 2782} {"train_loss": -6.492225170135498, "global_step": 116869, "epoch": 2782} {"train_loss": -6.671597480773926, "global_step": 116870, "epoch": 2782} {"train_loss": -6.440042495727539, "global_step": 116871, "epoch": 2782} {"train_loss": -6.473747730255127, "global_step": 116872, "epoch": 2782} {"train_loss": -6.581130027770996, "global_step": 116873, "epoch": 2782} {"train_loss": -6.541706562042236, "global_step": 116874, "epoch": 2782} {"train_loss": -6.56524133682251, "global_step": 116875, "epoch": 2782} {"train_loss": -6.495705604553223, "global_step": 116876, "epoch": 2782} {"train_loss": -6.484361171722412, "global_step": 116877, "epoch": 2782} {"train_loss": -6.496549606323242, "global_step": 116878, "epoch": 2782} {"train_loss": -6.5403523445129395, "global_step": 116879, "epoch": 2782} {"train_loss": -6.546879768371582, "global_step": 116880, "epoch": 2782} {"train_loss": -6.545853137969971, "global_step": 116881, "epoch": 2782} {"train_loss": -6.526461601257324, "global_step": 116882, "epoch": 2782} {"train_loss": -6.528746604919434, "global_step": 116883, "epoch": 2782} {"train_loss": -6.463684558868408, "global_step": 116884, "epoch": 2782} {"train_loss": -6.501135508219401, "global_step": 116885, "epoch": 2782, "val_loss": 76379.4140625} {"train_loss": -6.626288890838623, "global_step": 116886, "epoch": 2783} {"train_loss": -6.583949565887451, "global_step": 116887, "epoch": 2783} {"train_loss": -6.520993232727051, "global_step": 116888, "epoch": 2783} {"train_loss": -6.587450981140137, "global_step": 116889, "epoch": 2783} {"train_loss": -6.559136390686035, "global_step": 116890, "epoch": 2783} {"train_loss": -6.653736114501953, "global_step": 116891, "epoch": 2783} {"train_loss": -6.508840560913086, "global_step": 116892, "epoch": 2783} {"train_loss": -6.59604024887085, "global_step": 116893, "epoch": 2783} {"train_loss": -6.4361772537231445, "global_step": 116894, "epoch": 2783} {"train_loss": -6.558438301086426, "global_step": 116895, "epoch": 2783} {"train_loss": -6.529082775115967, "global_step": 116896, "epoch": 2783} {"train_loss": -6.528112411499023, "global_step": 116897, "epoch": 2783} {"train_loss": -6.530794143676758, "global_step": 116898, "epoch": 2783} {"train_loss": -6.627216339111328, "global_step": 116899, "epoch": 2783} {"train_loss": -6.499107360839844, "global_step": 116900, "epoch": 2783} {"train_loss": -6.482966423034668, "global_step": 116901, "epoch": 2783} {"train_loss": -6.593326091766357, "global_step": 116902, "epoch": 2783} {"train_loss": -6.483155250549316, "global_step": 116903, "epoch": 2783} {"train_loss": -6.465945243835449, "global_step": 116904, "epoch": 2783} {"train_loss": -6.628458499908447, "global_step": 116905, "epoch": 2783} {"train_loss": -6.463947296142578, "global_step": 116906, "epoch": 2783} {"train_loss": -6.546662330627441, "global_step": 116907, "epoch": 2783} {"train_loss": -6.598254203796387, "global_step": 116908, "epoch": 2783} {"train_loss": -6.582658290863037, "global_step": 116909, "epoch": 2783} {"train_loss": -6.527835845947266, "global_step": 116910, "epoch": 2783} {"train_loss": -6.546714782714844, "global_step": 116911, "epoch": 2783} {"train_loss": -6.5854949951171875, "global_step": 116912, "epoch": 2783} {"train_loss": -6.564282417297363, "global_step": 116913, "epoch": 2783} {"train_loss": -6.538789749145508, "global_step": 116914, "epoch": 2783} {"train_loss": -6.5103535652160645, "global_step": 116915, "epoch": 2783} {"train_loss": -6.630370140075684, "global_step": 116916, "epoch": 2783} {"train_loss": -6.516914367675781, "global_step": 116917, "epoch": 2783} {"train_loss": -6.511763095855713, "global_step": 116918, "epoch": 2783} {"train_loss": -6.501120567321777, "global_step": 116919, "epoch": 2783} {"train_loss": -6.644463539123535, "global_step": 116920, "epoch": 2783} {"train_loss": -6.552874565124512, "global_step": 116921, "epoch": 2783} {"train_loss": -6.555019378662109, "global_step": 116922, "epoch": 2783} {"train_loss": -6.5170674324035645, "global_step": 116923, "epoch": 2783} {"train_loss": -6.541199684143066, "global_step": 116924, "epoch": 2783} {"train_loss": -6.491116046905518, "global_step": 116925, "epoch": 2783} {"train_loss": -6.59245491027832, "global_step": 116926, "epoch": 2783} {"train_loss": -6.549037070501418, "global_step": 116927, "epoch": 2783, "val_loss": 76398.359375} {"train_loss": -6.545908451080322, "global_step": 116928, "epoch": 2784} {"train_loss": -6.586559772491455, "global_step": 116929, "epoch": 2784} {"train_loss": -6.540950775146484, "global_step": 116930, "epoch": 2784} {"train_loss": -6.630576133728027, "global_step": 116931, "epoch": 2784} {"train_loss": -6.602207183837891, "global_step": 116932, "epoch": 2784} {"train_loss": -6.617980480194092, "global_step": 116933, "epoch": 2784} {"train_loss": -6.5176801681518555, "global_step": 116934, "epoch": 2784} {"train_loss": -6.540481090545654, "global_step": 116935, "epoch": 2784} {"train_loss": -6.535281658172607, "global_step": 116936, "epoch": 2784} {"train_loss": -6.657416820526123, "global_step": 116937, "epoch": 2784} {"train_loss": -6.539159774780273, "global_step": 116938, "epoch": 2784} {"train_loss": -6.5964741706848145, "global_step": 116939, "epoch": 2784} {"train_loss": -6.4788360595703125, "global_step": 116940, "epoch": 2784} {"train_loss": -6.565869331359863, "global_step": 116941, "epoch": 2784} {"train_loss": -6.517187118530273, "global_step": 116942, "epoch": 2784} {"train_loss": -6.5355706214904785, "global_step": 116943, "epoch": 2784} {"train_loss": -6.5673112869262695, "global_step": 116944, "epoch": 2784} {"train_loss": -6.5247015953063965, "global_step": 116945, "epoch": 2784} {"train_loss": -6.532123565673828, "global_step": 116946, "epoch": 2784} {"train_loss": -6.3533430099487305, "global_step": 116947, "epoch": 2784} {"train_loss": -6.5304694175720215, "global_step": 116948, "epoch": 2784} {"train_loss": -6.417803764343262, "global_step": 116949, "epoch": 2784} {"train_loss": -6.588061332702637, "global_step": 116950, "epoch": 2784} {"train_loss": -6.58324670791626, "global_step": 116951, "epoch": 2784} {"train_loss": -6.521097660064697, "global_step": 116952, "epoch": 2784} {"train_loss": -6.533574104309082, "global_step": 116953, "epoch": 2784} {"train_loss": -6.587657928466797, "global_step": 116954, "epoch": 2784} {"train_loss": -6.461849212646484, "global_step": 116955, "epoch": 2784} {"train_loss": -6.675933361053467, "global_step": 116956, "epoch": 2784} {"train_loss": -6.559848785400391, "global_step": 116957, "epoch": 2784} {"train_loss": -6.635894298553467, "global_step": 116958, "epoch": 2784} {"train_loss": -6.548039436340332, "global_step": 116959, "epoch": 2784} {"train_loss": -6.639552116394043, "global_step": 116960, "epoch": 2784} {"train_loss": -6.621759414672852, "global_step": 116961, "epoch": 2784} {"train_loss": -6.537540912628174, "global_step": 116962, "epoch": 2784} {"train_loss": -6.6106109619140625, "global_step": 116963, "epoch": 2784} {"train_loss": -6.459885597229004, "global_step": 116964, "epoch": 2784} {"train_loss": -6.613762378692627, "global_step": 116965, "epoch": 2784} {"train_loss": -6.548519611358643, "global_step": 116966, "epoch": 2784} {"train_loss": -6.510977745056152, "global_step": 116967, "epoch": 2784} {"train_loss": -6.592803001403809, "global_step": 116968, "epoch": 2784} {"train_loss": -6.556389059339251, "global_step": 116969, "epoch": 2784, "val_loss": 76511.109375} {"train_loss": -6.639467716217041, "global_step": 116970, "epoch": 2785} {"train_loss": -6.697773456573486, "global_step": 116971, "epoch": 2785} {"train_loss": -6.5073089599609375, "global_step": 116972, "epoch": 2785} {"train_loss": -6.647900581359863, "global_step": 116973, "epoch": 2785} {"train_loss": -6.576510429382324, "global_step": 116974, "epoch": 2785} {"train_loss": -6.57771635055542, "global_step": 116975, "epoch": 2785} {"train_loss": -6.691153049468994, "global_step": 116976, "epoch": 2785} {"train_loss": -6.5017595291137695, "global_step": 116977, "epoch": 2785} {"train_loss": -6.472018241882324, "global_step": 116978, "epoch": 2785} {"train_loss": -6.599470138549805, "global_step": 116979, "epoch": 2785} {"train_loss": -6.614508628845215, "global_step": 116980, "epoch": 2785} {"train_loss": -6.455607891082764, "global_step": 116981, "epoch": 2785} {"train_loss": -6.502859115600586, "global_step": 116982, "epoch": 2785} {"train_loss": -6.527445316314697, "global_step": 116983, "epoch": 2785} {"train_loss": -6.523499488830566, "global_step": 116984, "epoch": 2785} {"train_loss": -6.50993013381958, "global_step": 116985, "epoch": 2785} {"train_loss": -6.323645114898682, "global_step": 116986, "epoch": 2785} {"train_loss": -6.459455966949463, "global_step": 116987, "epoch": 2785} {"train_loss": -6.513575553894043, "global_step": 116988, "epoch": 2785} {"train_loss": -6.367060661315918, "global_step": 116989, "epoch": 2785} {"train_loss": -6.526257038116455, "global_step": 116990, "epoch": 2785} {"train_loss": -6.5287981033325195, "global_step": 116991, "epoch": 2785} {"train_loss": -6.559682846069336, "global_step": 116992, "epoch": 2785} {"train_loss": -6.432775497436523, "global_step": 116993, "epoch": 2785} {"train_loss": -6.475706100463867, "global_step": 116994, "epoch": 2785} {"train_loss": -6.617223739624023, "global_step": 116995, "epoch": 2785} {"train_loss": -6.624574661254883, "global_step": 116996, "epoch": 2785} {"train_loss": -6.431633949279785, "global_step": 116997, "epoch": 2785} {"train_loss": -6.466719627380371, "global_step": 116998, "epoch": 2785} {"train_loss": -6.633303642272949, "global_step": 116999, "epoch": 2785} {"train_loss": -6.555042266845703, "global_step": 117000, "epoch": 2785} {"train_loss": -6.422966957092285, "global_step": 117001, "epoch": 2785} {"train_loss": -6.419170379638672, "global_step": 117002, "epoch": 2785} {"train_loss": -6.625357627868652, "global_step": 117003, "epoch": 2785} {"train_loss": -6.606618881225586, "global_step": 117004, "epoch": 2785} {"train_loss": -6.402576446533203, "global_step": 117005, "epoch": 2785} {"train_loss": -6.590392112731934, "global_step": 117006, "epoch": 2785} {"train_loss": -6.539877891540527, "global_step": 117007, "epoch": 2785} {"train_loss": -6.498398780822754, "global_step": 117008, "epoch": 2785} {"train_loss": -6.447680950164795, "global_step": 117009, "epoch": 2785} {"train_loss": -6.467414855957031, "global_step": 117010, "epoch": 2785} {"train_loss": -6.525901794433594, "global_step": 117011, "epoch": 2785, "val_loss": 76396.5078125} {"train_loss": -6.542092323303223, "global_step": 117012, "epoch": 2786} {"train_loss": -6.487031936645508, "global_step": 117013, "epoch": 2786} {"train_loss": -6.523228645324707, "global_step": 117014, "epoch": 2786} {"train_loss": -6.6048126220703125, "global_step": 117015, "epoch": 2786} {"train_loss": -6.471356391906738, "global_step": 117016, "epoch": 2786} {"train_loss": -6.397002220153809, "global_step": 117017, "epoch": 2786} {"train_loss": -6.493838787078857, "global_step": 117018, "epoch": 2786} {"train_loss": -6.397050857543945, "global_step": 117019, "epoch": 2786} {"train_loss": -6.649960517883301, "global_step": 117020, "epoch": 2786} {"train_loss": -6.528373718261719, "global_step": 117021, "epoch": 2786} {"train_loss": -6.568136215209961, "global_step": 117022, "epoch": 2786} {"train_loss": -6.506936550140381, "global_step": 117023, "epoch": 2786} {"train_loss": -6.634495735168457, "global_step": 117024, "epoch": 2786} {"train_loss": -6.50987434387207, "global_step": 117025, "epoch": 2786} {"train_loss": -6.495849609375, "global_step": 117026, "epoch": 2786} {"train_loss": -6.543685436248779, "global_step": 117027, "epoch": 2786} {"train_loss": -6.511727333068848, "global_step": 117028, "epoch": 2786} {"train_loss": -6.542008399963379, "global_step": 117029, "epoch": 2786} {"train_loss": -6.5675811767578125, "global_step": 117030, "epoch": 2786} {"train_loss": -6.582605361938477, "global_step": 117031, "epoch": 2786} {"train_loss": -6.455251216888428, "global_step": 117032, "epoch": 2786} {"train_loss": -6.5901103019714355, "global_step": 117033, "epoch": 2786} {"train_loss": -6.52598762512207, "global_step": 117034, "epoch": 2786} {"train_loss": -6.559821128845215, "global_step": 117035, "epoch": 2786} {"train_loss": -6.577971458435059, "global_step": 117036, "epoch": 2786} {"train_loss": -6.510598182678223, "global_step": 117037, "epoch": 2786} {"train_loss": -6.595887184143066, "global_step": 117038, "epoch": 2786} {"train_loss": -6.513211250305176, "global_step": 117039, "epoch": 2786} {"train_loss": -6.4483866691589355, "global_step": 117040, "epoch": 2786} {"train_loss": -6.549873352050781, "global_step": 117041, "epoch": 2786} {"train_loss": -6.558314323425293, "global_step": 117042, "epoch": 2786} {"train_loss": -6.426780700683594, "global_step": 117043, "epoch": 2786} {"train_loss": -6.532214164733887, "global_step": 117044, "epoch": 2786} {"train_loss": -6.402158260345459, "global_step": 117045, "epoch": 2786} {"train_loss": -6.597339630126953, "global_step": 117046, "epoch": 2786} {"train_loss": -6.4585041999816895, "global_step": 117047, "epoch": 2786} {"train_loss": -6.438837051391602, "global_step": 117048, "epoch": 2786} {"train_loss": -6.440345764160156, "global_step": 117049, "epoch": 2786} {"train_loss": -6.469119071960449, "global_step": 117050, "epoch": 2786} {"train_loss": -6.623265266418457, "global_step": 117051, "epoch": 2786} {"train_loss": -6.447312355041504, "global_step": 117052, "epoch": 2786} {"train_loss": -6.517386629467919, "global_step": 117053, "epoch": 2786, "val_loss": 76841.9921875} {"train_loss": -6.555487632751465, "global_step": 117054, "epoch": 2787} {"train_loss": -6.5958662033081055, "global_step": 117055, "epoch": 2787} {"train_loss": -6.434836387634277, "global_step": 117056, "epoch": 2787} {"train_loss": -6.480787754058838, "global_step": 117057, "epoch": 2787} {"train_loss": -6.481672286987305, "global_step": 117058, "epoch": 2787} {"train_loss": -6.535027503967285, "global_step": 117059, "epoch": 2787} {"train_loss": -6.506128311157227, "global_step": 117060, "epoch": 2787} {"train_loss": -6.527215957641602, "global_step": 117061, "epoch": 2787} {"train_loss": -6.478311061859131, "global_step": 117062, "epoch": 2787} {"train_loss": -6.535202980041504, "global_step": 117063, "epoch": 2787} {"train_loss": -6.511212348937988, "global_step": 117064, "epoch": 2787} {"train_loss": -6.530686855316162, "global_step": 117065, "epoch": 2787} {"train_loss": -6.5143280029296875, "global_step": 117066, "epoch": 2787} {"train_loss": -6.57708740234375, "global_step": 117067, "epoch": 2787} {"train_loss": -6.526152610778809, "global_step": 117068, "epoch": 2787} {"train_loss": -6.484072685241699, "global_step": 117069, "epoch": 2787} {"train_loss": -6.4281768798828125, "global_step": 117070, "epoch": 2787} {"train_loss": -6.579780578613281, "global_step": 117071, "epoch": 2787} {"train_loss": -6.496754169464111, "global_step": 117072, "epoch": 2787} {"train_loss": -6.615963935852051, "global_step": 117073, "epoch": 2787} {"train_loss": -6.48210334777832, "global_step": 117074, "epoch": 2787} {"train_loss": -6.480472564697266, "global_step": 117075, "epoch": 2787} {"train_loss": -6.472190856933594, "global_step": 117076, "epoch": 2787} {"train_loss": -6.4875617027282715, "global_step": 117077, "epoch": 2787} {"train_loss": -6.520359516143799, "global_step": 117078, "epoch": 2787} {"train_loss": -6.545912265777588, "global_step": 117079, "epoch": 2787} {"train_loss": -6.434787750244141, "global_step": 117080, "epoch": 2787} {"train_loss": -6.472808361053467, "global_step": 117081, "epoch": 2787} {"train_loss": -6.420050621032715, "global_step": 117082, "epoch": 2787} {"train_loss": -6.328817367553711, "global_step": 117083, "epoch": 2787} {"train_loss": -6.505400657653809, "global_step": 117084, "epoch": 2787} {"train_loss": -6.442071914672852, "global_step": 117085, "epoch": 2787} {"train_loss": -6.423250198364258, "global_step": 117086, "epoch": 2787} {"train_loss": -6.603241920471191, "global_step": 117087, "epoch": 2787} {"train_loss": -6.491882801055908, "global_step": 117088, "epoch": 2787} {"train_loss": -6.416000843048096, "global_step": 117089, "epoch": 2787} {"train_loss": -6.600933074951172, "global_step": 117090, "epoch": 2787} {"train_loss": -6.558931827545166, "global_step": 117091, "epoch": 2787} {"train_loss": -6.542111396789551, "global_step": 117092, "epoch": 2787} {"train_loss": -6.489126205444336, "global_step": 117093, "epoch": 2787} {"train_loss": -6.447394371032715, "global_step": 117094, "epoch": 2787} {"train_loss": -6.501834540140061, "global_step": 117095, "epoch": 2787, "val_loss": 76657.390625} {"train_loss": -6.648388862609863, "global_step": 117096, "epoch": 2788} {"train_loss": -6.475734710693359, "global_step": 117097, "epoch": 2788} {"train_loss": -6.541652202606201, "global_step": 117098, "epoch": 2788} {"train_loss": -6.49233865737915, "global_step": 117099, "epoch": 2788} {"train_loss": -6.49598503112793, "global_step": 117100, "epoch": 2788} {"train_loss": -6.522776126861572, "global_step": 117101, "epoch": 2788} {"train_loss": -6.6577606201171875, "global_step": 117102, "epoch": 2788} {"train_loss": -6.6291046142578125, "global_step": 117103, "epoch": 2788} {"train_loss": -6.563056468963623, "global_step": 117104, "epoch": 2788} {"train_loss": -6.46658992767334, "global_step": 117105, "epoch": 2788} {"train_loss": -6.555474758148193, "global_step": 117106, "epoch": 2788} {"train_loss": -6.454606533050537, "global_step": 117107, "epoch": 2788} {"train_loss": -6.680811882019043, "global_step": 117108, "epoch": 2788} {"train_loss": -6.557919502258301, "global_step": 117109, "epoch": 2788} {"train_loss": -6.572290420532227, "global_step": 117110, "epoch": 2788} {"train_loss": -6.603470325469971, "global_step": 117111, "epoch": 2788} {"train_loss": -6.57530403137207, "global_step": 117112, "epoch": 2788} {"train_loss": -6.546809196472168, "global_step": 117113, "epoch": 2788} {"train_loss": -6.619571685791016, "global_step": 117114, "epoch": 2788} {"train_loss": -6.639481544494629, "global_step": 117115, "epoch": 2788} {"train_loss": -6.52949857711792, "global_step": 117116, "epoch": 2788} {"train_loss": -6.615644454956055, "global_step": 117117, "epoch": 2788} {"train_loss": -6.636013984680176, "global_step": 117118, "epoch": 2788} {"train_loss": -6.572639465332031, "global_step": 117119, "epoch": 2788} {"train_loss": -6.644540309906006, "global_step": 117120, "epoch": 2788} {"train_loss": -6.622547626495361, "global_step": 117121, "epoch": 2788} {"train_loss": -6.567348480224609, "global_step": 117122, "epoch": 2788} {"train_loss": -6.528876304626465, "global_step": 117123, "epoch": 2788} {"train_loss": -6.5799946784973145, "global_step": 117124, "epoch": 2788} {"train_loss": -6.551031112670898, "global_step": 117125, "epoch": 2788} {"train_loss": -6.546723365783691, "global_step": 117126, "epoch": 2788} {"train_loss": -6.5999579429626465, "global_step": 117127, "epoch": 2788} {"train_loss": -6.521946907043457, "global_step": 117128, "epoch": 2788} {"train_loss": -6.559025764465332, "global_step": 117129, "epoch": 2788} {"train_loss": -6.609053611755371, "global_step": 117130, "epoch": 2788} {"train_loss": -6.5320234298706055, "global_step": 117131, "epoch": 2788} {"train_loss": -6.496514320373535, "global_step": 117132, "epoch": 2788} {"train_loss": -6.54957914352417, "global_step": 117133, "epoch": 2788} {"train_loss": -6.520822525024414, "global_step": 117134, "epoch": 2788} {"train_loss": -6.546807289123535, "global_step": 117135, "epoch": 2788} {"train_loss": -6.677073001861572, "global_step": 117136, "epoch": 2788} {"train_loss": -6.568293764477684, "global_step": 117137, "epoch": 2788, "val_loss": 76764.8125} {"train_loss": -6.570842742919922, "global_step": 117138, "epoch": 2789} {"train_loss": -6.519534111022949, "global_step": 117139, "epoch": 2789} {"train_loss": -6.540014743804932, "global_step": 117140, "epoch": 2789} {"train_loss": -6.503239631652832, "global_step": 117141, "epoch": 2789} {"train_loss": -6.513060569763184, "global_step": 117142, "epoch": 2789} {"train_loss": -6.623112678527832, "global_step": 117143, "epoch": 2789} {"train_loss": -6.581506729125977, "global_step": 117144, "epoch": 2789} {"train_loss": -6.549459457397461, "global_step": 117145, "epoch": 2789} {"train_loss": -6.5986762046813965, "global_step": 117146, "epoch": 2789} {"train_loss": -6.474767684936523, "global_step": 117147, "epoch": 2789} {"train_loss": -6.48555850982666, "global_step": 117148, "epoch": 2789} {"train_loss": -6.4666032791137695, "global_step": 117149, "epoch": 2789} {"train_loss": -6.482092380523682, "global_step": 117150, "epoch": 2789} {"train_loss": -6.568633556365967, "global_step": 117151, "epoch": 2789} {"train_loss": -6.58126163482666, "global_step": 117152, "epoch": 2789} {"train_loss": -6.5489912033081055, "global_step": 117153, "epoch": 2789} {"train_loss": -6.523365020751953, "global_step": 117154, "epoch": 2789} {"train_loss": -6.549898624420166, "global_step": 117155, "epoch": 2789} {"train_loss": -6.51984977722168, "global_step": 117156, "epoch": 2789} {"train_loss": -6.469717979431152, "global_step": 117157, "epoch": 2789} {"train_loss": -6.443758010864258, "global_step": 117158, "epoch": 2789} {"train_loss": -6.669436454772949, "global_step": 117159, "epoch": 2789} {"train_loss": -6.6586198806762695, "global_step": 117160, "epoch": 2789} {"train_loss": -6.617925643920898, "global_step": 117161, "epoch": 2789} {"train_loss": -6.605940818786621, "global_step": 117162, "epoch": 2789} {"train_loss": -6.441391944885254, "global_step": 117163, "epoch": 2789} {"train_loss": -6.521825790405273, "global_step": 117164, "epoch": 2789} {"train_loss": -6.580761909484863, "global_step": 117165, "epoch": 2789} {"train_loss": -6.520581245422363, "global_step": 117166, "epoch": 2789} {"train_loss": -6.543117523193359, "global_step": 117167, "epoch": 2789} {"train_loss": -6.577965259552002, "global_step": 117168, "epoch": 2789} {"train_loss": -6.63435697555542, "global_step": 117169, "epoch": 2789} {"train_loss": -6.51881217956543, "global_step": 117170, "epoch": 2789} {"train_loss": -6.550836563110352, "global_step": 117171, "epoch": 2789} {"train_loss": -6.613194942474365, "global_step": 117172, "epoch": 2789} {"train_loss": -6.473912239074707, "global_step": 117173, "epoch": 2789} {"train_loss": -6.633507251739502, "global_step": 117174, "epoch": 2789} {"train_loss": -6.439369201660156, "global_step": 117175, "epoch": 2789} {"train_loss": -6.632648944854736, "global_step": 117176, "epoch": 2789} {"train_loss": -6.667413234710693, "global_step": 117177, "epoch": 2789} {"train_loss": -6.5918192863464355, "global_step": 117178, "epoch": 2789} {"train_loss": -6.550016823269072, "global_step": 117179, "epoch": 2789, "val_loss": 76696.421875} {"train_loss": -6.4841108322143555, "global_step": 117180, "epoch": 2790} {"train_loss": -6.577897071838379, "global_step": 117181, "epoch": 2790} {"train_loss": -6.558306694030762, "global_step": 117182, "epoch": 2790} {"train_loss": -6.47035551071167, "global_step": 117183, "epoch": 2790} {"train_loss": -6.468499183654785, "global_step": 117184, "epoch": 2790} {"train_loss": -6.618542671203613, "global_step": 117185, "epoch": 2790} {"train_loss": -6.52536678314209, "global_step": 117186, "epoch": 2790} {"train_loss": -6.408461570739746, "global_step": 117187, "epoch": 2790} {"train_loss": -6.53124475479126, "global_step": 117188, "epoch": 2790} {"train_loss": -6.612277030944824, "global_step": 117189, "epoch": 2790} {"train_loss": -6.523948669433594, "global_step": 117190, "epoch": 2790} {"train_loss": -6.596439838409424, "global_step": 117191, "epoch": 2790} {"train_loss": -6.53043270111084, "global_step": 117192, "epoch": 2790} {"train_loss": -6.492273807525635, "global_step": 117193, "epoch": 2790} {"train_loss": -6.56557035446167, "global_step": 117194, "epoch": 2790} {"train_loss": -6.563659191131592, "global_step": 117195, "epoch": 2790} {"train_loss": -6.526201248168945, "global_step": 117196, "epoch": 2790} {"train_loss": -6.5535759925842285, "global_step": 117197, "epoch": 2790} {"train_loss": -6.397370338439941, "global_step": 117198, "epoch": 2790} {"train_loss": -6.51317024230957, "global_step": 117199, "epoch": 2790} {"train_loss": -6.503376007080078, "global_step": 117200, "epoch": 2790} {"train_loss": -6.5025224685668945, "global_step": 117201, "epoch": 2790} {"train_loss": -6.546816825866699, "global_step": 117202, "epoch": 2790} {"train_loss": -6.519230842590332, "global_step": 117203, "epoch": 2790} {"train_loss": -6.558357238769531, "global_step": 117204, "epoch": 2790} {"train_loss": -6.566627502441406, "global_step": 117205, "epoch": 2790} {"train_loss": -6.4704132080078125, "global_step": 117206, "epoch": 2790} {"train_loss": -6.493902206420898, "global_step": 117207, "epoch": 2790} {"train_loss": -6.517177104949951, "global_step": 117208, "epoch": 2790} {"train_loss": -6.636366844177246, "global_step": 117209, "epoch": 2790} {"train_loss": -6.60237979888916, "global_step": 117210, "epoch": 2790} {"train_loss": -6.632779121398926, "global_step": 117211, "epoch": 2790} {"train_loss": -6.520809173583984, "global_step": 117212, "epoch": 2790} {"train_loss": -6.555065155029297, "global_step": 117213, "epoch": 2790} {"train_loss": -6.538673400878906, "global_step": 117214, "epoch": 2790} {"train_loss": -6.620314121246338, "global_step": 117215, "epoch": 2790} {"train_loss": -6.552827835083008, "global_step": 117216, "epoch": 2790} {"train_loss": -6.638472080230713, "global_step": 117217, "epoch": 2790} {"train_loss": -6.554628372192383, "global_step": 117218, "epoch": 2790} {"train_loss": -6.583283424377441, "global_step": 117219, "epoch": 2790} {"train_loss": -6.486120223999023, "global_step": 117220, "epoch": 2790} {"train_loss": -6.5366745335715155, "global_step": 117221, "epoch": 2790, "val_loss": 76617.859375} {"train_loss": -6.6371564865112305, "global_step": 117222, "epoch": 2791} {"train_loss": -6.584693908691406, "global_step": 117223, "epoch": 2791} {"train_loss": -6.6172566413879395, "global_step": 117224, "epoch": 2791} {"train_loss": -6.608356475830078, "global_step": 117225, "epoch": 2791} {"train_loss": -6.643287658691406, "global_step": 117226, "epoch": 2791} {"train_loss": -6.637326240539551, "global_step": 117227, "epoch": 2791} {"train_loss": -6.452905654907227, "global_step": 117228, "epoch": 2791} {"train_loss": -6.623342990875244, "global_step": 117229, "epoch": 2791} {"train_loss": -6.589486122131348, "global_step": 117230, "epoch": 2791} {"train_loss": -6.558591365814209, "global_step": 117231, "epoch": 2791} {"train_loss": -6.507370948791504, "global_step": 117232, "epoch": 2791} {"train_loss": -6.586639404296875, "global_step": 117233, "epoch": 2791} {"train_loss": -6.64799690246582, "global_step": 117234, "epoch": 2791} {"train_loss": -6.57548189163208, "global_step": 117235, "epoch": 2791} {"train_loss": -6.619290828704834, "global_step": 117236, "epoch": 2791} {"train_loss": -6.56460428237915, "global_step": 117237, "epoch": 2791} {"train_loss": -6.536716938018799, "global_step": 117238, "epoch": 2791} {"train_loss": -6.488577365875244, "global_step": 117239, "epoch": 2791} {"train_loss": -6.540762424468994, "global_step": 117240, "epoch": 2791} {"train_loss": -6.603902816772461, "global_step": 117241, "epoch": 2791} {"train_loss": -6.519421100616455, "global_step": 117242, "epoch": 2791} {"train_loss": -6.657926082611084, "global_step": 117243, "epoch": 2791} {"train_loss": -6.474552154541016, "global_step": 117244, "epoch": 2791} {"train_loss": -6.510009765625, "global_step": 117245, "epoch": 2791} {"train_loss": -6.607013702392578, "global_step": 117246, "epoch": 2791} {"train_loss": -6.518155574798584, "global_step": 117247, "epoch": 2791} {"train_loss": -6.507167816162109, "global_step": 117248, "epoch": 2791} {"train_loss": -6.588865280151367, "global_step": 117249, "epoch": 2791} {"train_loss": -6.541192531585693, "global_step": 117250, "epoch": 2791} {"train_loss": -6.55904483795166, "global_step": 117251, "epoch": 2791} {"train_loss": -6.474025726318359, "global_step": 117252, "epoch": 2791} {"train_loss": -6.505446434020996, "global_step": 117253, "epoch": 2791} {"train_loss": -6.701119422912598, "global_step": 117254, "epoch": 2791} {"train_loss": -6.53443717956543, "global_step": 117255, "epoch": 2791} {"train_loss": -6.486517429351807, "global_step": 117256, "epoch": 2791} {"train_loss": -6.568561553955078, "global_step": 117257, "epoch": 2791} {"train_loss": -6.518263816833496, "global_step": 117258, "epoch": 2791} {"train_loss": -6.451245307922363, "global_step": 117259, "epoch": 2791} {"train_loss": -6.5768914222717285, "global_step": 117260, "epoch": 2791} {"train_loss": -6.42290735244751, "global_step": 117261, "epoch": 2791} {"train_loss": -6.632196426391602, "global_step": 117262, "epoch": 2791} {"train_loss": -6.556628828956967, "global_step": 117263, "epoch": 2791, "val_loss": 76890.1015625} {"train_loss": -6.581235408782959, "global_step": 117264, "epoch": 2792} {"train_loss": -6.429636478424072, "global_step": 117265, "epoch": 2792} {"train_loss": -6.558990001678467, "global_step": 117266, "epoch": 2792} {"train_loss": -6.439432621002197, "global_step": 117267, "epoch": 2792} {"train_loss": -6.57018518447876, "global_step": 117268, "epoch": 2792} {"train_loss": -6.477041244506836, "global_step": 117269, "epoch": 2792} {"train_loss": -6.512852668762207, "global_step": 117270, "epoch": 2792} {"train_loss": -6.481137275695801, "global_step": 117271, "epoch": 2792} {"train_loss": -6.62537956237793, "global_step": 117272, "epoch": 2792} {"train_loss": -6.618862152099609, "global_step": 117273, "epoch": 2792} {"train_loss": -6.490307807922363, "global_step": 117274, "epoch": 2792} {"train_loss": -6.6713104248046875, "global_step": 117275, "epoch": 2792} {"train_loss": -6.536120414733887, "global_step": 117276, "epoch": 2792} {"train_loss": -6.462713718414307, "global_step": 117277, "epoch": 2792} {"train_loss": -6.47342586517334, "global_step": 117278, "epoch": 2792} {"train_loss": -6.462818622589111, "global_step": 117279, "epoch": 2792} {"train_loss": -6.549118995666504, "global_step": 117280, "epoch": 2792} {"train_loss": -6.479875564575195, "global_step": 117281, "epoch": 2792} {"train_loss": -6.606978416442871, "global_step": 117282, "epoch": 2792} {"train_loss": -6.4670915603637695, "global_step": 117283, "epoch": 2792} {"train_loss": -6.382482051849365, "global_step": 117284, "epoch": 2792} {"train_loss": -6.469104766845703, "global_step": 117285, "epoch": 2792} {"train_loss": -6.44809627532959, "global_step": 117286, "epoch": 2792} {"train_loss": -6.569886684417725, "global_step": 117287, "epoch": 2792} {"train_loss": -6.582380294799805, "global_step": 117288, "epoch": 2792} {"train_loss": -6.533056735992432, "global_step": 117289, "epoch": 2792} {"train_loss": -6.628684043884277, "global_step": 117290, "epoch": 2792} {"train_loss": -6.4876203536987305, "global_step": 117291, "epoch": 2792} {"train_loss": -6.449998378753662, "global_step": 117292, "epoch": 2792} {"train_loss": -6.501978397369385, "global_step": 117293, "epoch": 2792} {"train_loss": -6.477824687957764, "global_step": 117294, "epoch": 2792} {"train_loss": -6.6102094650268555, "global_step": 117295, "epoch": 2792} {"train_loss": -6.426895618438721, "global_step": 117296, "epoch": 2792} {"train_loss": -6.504505157470703, "global_step": 117297, "epoch": 2792} {"train_loss": -6.485230445861816, "global_step": 117298, "epoch": 2792} {"train_loss": -6.527054786682129, "global_step": 117299, "epoch": 2792} {"train_loss": -6.3418474197387695, "global_step": 117300, "epoch": 2792} {"train_loss": -6.397061347961426, "global_step": 117301, "epoch": 2792} {"train_loss": -6.458230972290039, "global_step": 117302, "epoch": 2792} {"train_loss": -6.453507423400879, "global_step": 117303, "epoch": 2792} {"train_loss": -6.449782371520996, "global_step": 117304, "epoch": 2792} {"train_loss": -6.504592816034953, "global_step": 117305, "epoch": 2792, "val_loss": 76711.1171875} {"train_loss": -6.408812522888184, "global_step": 117306, "epoch": 2793} {"train_loss": -6.611737251281738, "global_step": 117307, "epoch": 2793} {"train_loss": -6.459079742431641, "global_step": 117308, "epoch": 2793} {"train_loss": -6.513513088226318, "global_step": 117309, "epoch": 2793} {"train_loss": -6.556971549987793, "global_step": 117310, "epoch": 2793} {"train_loss": -6.49831485748291, "global_step": 117311, "epoch": 2793} {"train_loss": -6.386970043182373, "global_step": 117312, "epoch": 2793} {"train_loss": -6.543865203857422, "global_step": 117313, "epoch": 2793} {"train_loss": -6.534996032714844, "global_step": 117314, "epoch": 2793} {"train_loss": -6.515241622924805, "global_step": 117315, "epoch": 2793} {"train_loss": -6.613183975219727, "global_step": 117316, "epoch": 2793} {"train_loss": -6.520606517791748, "global_step": 117317, "epoch": 2793} {"train_loss": -6.6005754470825195, "global_step": 117318, "epoch": 2793} {"train_loss": -6.47876501083374, "global_step": 117319, "epoch": 2793} {"train_loss": -6.555874824523926, "global_step": 117320, "epoch": 2793} {"train_loss": -6.500115394592285, "global_step": 117321, "epoch": 2793} {"train_loss": -6.440102577209473, "global_step": 117322, "epoch": 2793} {"train_loss": -6.443761825561523, "global_step": 117323, "epoch": 2793} {"train_loss": -6.282619476318359, "global_step": 117324, "epoch": 2793} {"train_loss": -6.350703716278076, "global_step": 117325, "epoch": 2793} {"train_loss": -6.564220905303955, "global_step": 117326, "epoch": 2793} {"train_loss": -6.429917335510254, "global_step": 117327, "epoch": 2793} {"train_loss": -6.532310485839844, "global_step": 117328, "epoch": 2793} {"train_loss": -6.337711334228516, "global_step": 117329, "epoch": 2793} {"train_loss": -6.432001113891602, "global_step": 117330, "epoch": 2793} {"train_loss": -6.535995960235596, "global_step": 117331, "epoch": 2793} {"train_loss": -6.529046058654785, "global_step": 117332, "epoch": 2793} {"train_loss": -6.491507053375244, "global_step": 117333, "epoch": 2793} {"train_loss": -6.472546100616455, "global_step": 117334, "epoch": 2793} {"train_loss": -6.499403953552246, "global_step": 117335, "epoch": 2793} {"train_loss": -6.52480411529541, "global_step": 117336, "epoch": 2793} {"train_loss": -6.571467399597168, "global_step": 117337, "epoch": 2793} {"train_loss": -6.600953578948975, "global_step": 117338, "epoch": 2793} {"train_loss": -6.5075554847717285, "global_step": 117339, "epoch": 2793} {"train_loss": -6.576700210571289, "global_step": 117340, "epoch": 2793} {"train_loss": -6.544512748718262, "global_step": 117341, "epoch": 2793} {"train_loss": -6.682788848876953, "global_step": 117342, "epoch": 2793} {"train_loss": -6.5316691398620605, "global_step": 117343, "epoch": 2793} {"train_loss": -6.410566329956055, "global_step": 117344, "epoch": 2793} {"train_loss": -6.471109390258789, "global_step": 117345, "epoch": 2793} {"train_loss": -6.491334438323975, "global_step": 117346, "epoch": 2793} {"train_loss": -6.501942169098627, "global_step": 117347, "epoch": 2793, "val_loss": 76646.8359375} {"train_loss": -6.574033737182617, "global_step": 117348, "epoch": 2794} {"train_loss": -6.464001655578613, "global_step": 117349, "epoch": 2794} {"train_loss": -6.424961090087891, "global_step": 117350, "epoch": 2794} {"train_loss": -6.481623649597168, "global_step": 117351, "epoch": 2794} {"train_loss": -6.39766788482666, "global_step": 117352, "epoch": 2794} {"train_loss": -6.625247478485107, "global_step": 117353, "epoch": 2794} {"train_loss": -6.385504722595215, "global_step": 117354, "epoch": 2794} {"train_loss": -6.477533340454102, "global_step": 117355, "epoch": 2794} {"train_loss": -6.502256393432617, "global_step": 117356, "epoch": 2794} {"train_loss": -6.398695945739746, "global_step": 117357, "epoch": 2794} {"train_loss": -6.4471435546875, "global_step": 117358, "epoch": 2794} {"train_loss": -6.504395484924316, "global_step": 117359, "epoch": 2794} {"train_loss": -6.449784278869629, "global_step": 117360, "epoch": 2794} {"train_loss": -6.615448951721191, "global_step": 117361, "epoch": 2794} {"train_loss": -6.5723161697387695, "global_step": 117362, "epoch": 2794} {"train_loss": -6.479042053222656, "global_step": 117363, "epoch": 2794} {"train_loss": -6.533627986907959, "global_step": 117364, "epoch": 2794} {"train_loss": -6.451044082641602, "global_step": 117365, "epoch": 2794} {"train_loss": -6.497830390930176, "global_step": 117366, "epoch": 2794} {"train_loss": -6.597789764404297, "global_step": 117367, "epoch": 2794} {"train_loss": -6.430528163909912, "global_step": 117368, "epoch": 2794} {"train_loss": -6.540363311767578, "global_step": 117369, "epoch": 2794} {"train_loss": -6.513124465942383, "global_step": 117370, "epoch": 2794} {"train_loss": -6.457839012145996, "global_step": 117371, "epoch": 2794} {"train_loss": -6.49733304977417, "global_step": 117372, "epoch": 2794} {"train_loss": -6.546115875244141, "global_step": 117373, "epoch": 2794} {"train_loss": -6.396839141845703, "global_step": 117374, "epoch": 2794} {"train_loss": -6.467107772827148, "global_step": 117375, "epoch": 2794} {"train_loss": -6.529766082763672, "global_step": 117376, "epoch": 2794} {"train_loss": -6.581254959106445, "global_step": 117377, "epoch": 2794} {"train_loss": -6.506569862365723, "global_step": 117378, "epoch": 2794} {"train_loss": -6.507761478424072, "global_step": 117379, "epoch": 2794} {"train_loss": -6.580471515655518, "global_step": 117380, "epoch": 2794} {"train_loss": -6.4857072830200195, "global_step": 117381, "epoch": 2794} {"train_loss": -6.512282371520996, "global_step": 117382, "epoch": 2794} {"train_loss": -6.5774993896484375, "global_step": 117383, "epoch": 2794} {"train_loss": -6.5592451095581055, "global_step": 117384, "epoch": 2794} {"train_loss": -6.53400182723999, "global_step": 117385, "epoch": 2794} {"train_loss": -6.615110397338867, "global_step": 117386, "epoch": 2794} {"train_loss": -6.5433149337768555, "global_step": 117387, "epoch": 2794} {"train_loss": -6.499270439147949, "global_step": 117388, "epoch": 2794} {"train_loss": -6.508007764816284, "global_step": 117389, "epoch": 2794, "val_loss": 76690.015625} {"train_loss": -6.514494895935059, "global_step": 117390, "epoch": 2795} {"train_loss": -6.681707859039307, "global_step": 117391, "epoch": 2795} {"train_loss": -6.621014595031738, "global_step": 117392, "epoch": 2795} {"train_loss": -6.672222137451172, "global_step": 117393, "epoch": 2795} {"train_loss": -6.537174224853516, "global_step": 117394, "epoch": 2795} {"train_loss": -6.572540760040283, "global_step": 117395, "epoch": 2795} {"train_loss": -6.683192253112793, "global_step": 117396, "epoch": 2795} {"train_loss": -6.506969928741455, "global_step": 117397, "epoch": 2795} {"train_loss": -6.6157917976379395, "global_step": 117398, "epoch": 2795} {"train_loss": -6.559814453125, "global_step": 117399, "epoch": 2795} {"train_loss": -6.556476593017578, "global_step": 117400, "epoch": 2795} {"train_loss": -6.606815814971924, "global_step": 117401, "epoch": 2795} {"train_loss": -6.585725784301758, "global_step": 117402, "epoch": 2795} {"train_loss": -6.643772602081299, "global_step": 117403, "epoch": 2795} {"train_loss": -6.624187469482422, "global_step": 117404, "epoch": 2795} {"train_loss": -6.4952826499938965, "global_step": 117405, "epoch": 2795} {"train_loss": -6.536751747131348, "global_step": 117406, "epoch": 2795} {"train_loss": -6.564286231994629, "global_step": 117407, "epoch": 2795} {"train_loss": -6.584773063659668, "global_step": 117408, "epoch": 2795} {"train_loss": -6.582657814025879, "global_step": 117409, "epoch": 2795} {"train_loss": -6.511055946350098, "global_step": 117410, "epoch": 2795} {"train_loss": -6.616121292114258, "global_step": 117411, "epoch": 2795} {"train_loss": -6.420629501342773, "global_step": 117412, "epoch": 2795} {"train_loss": -6.538715362548828, "global_step": 117413, "epoch": 2795} {"train_loss": -6.510004997253418, "global_step": 117414, "epoch": 2795} {"train_loss": -6.4929914474487305, "global_step": 117415, "epoch": 2795} {"train_loss": -6.497422218322754, "global_step": 117416, "epoch": 2795} {"train_loss": -6.318589687347412, "global_step": 117417, "epoch": 2795} {"train_loss": -6.601804256439209, "global_step": 117418, "epoch": 2795} {"train_loss": -6.493743896484375, "global_step": 117419, "epoch": 2795} {"train_loss": -6.224329948425293, "global_step": 117420, "epoch": 2795} {"train_loss": -6.604767322540283, "global_step": 117421, "epoch": 2795} {"train_loss": -6.4155378341674805, "global_step": 117422, "epoch": 2795} {"train_loss": -6.355643272399902, "global_step": 117423, "epoch": 2795} {"train_loss": -6.5065226554870605, "global_step": 117424, "epoch": 2795} {"train_loss": -6.4569172859191895, "global_step": 117425, "epoch": 2795} {"train_loss": -6.437274932861328, "global_step": 117426, "epoch": 2795} {"train_loss": -6.259852886199951, "global_step": 117427, "epoch": 2795} {"train_loss": -6.535033226013184, "global_step": 117428, "epoch": 2795} {"train_loss": -6.451238632202148, "global_step": 117429, "epoch": 2795} {"train_loss": -6.461913108825684, "global_step": 117430, "epoch": 2795} {"train_loss": -6.524346714928036, "global_step": 117431, "epoch": 2795, "val_loss": 76804.3984375} {"train_loss": -6.430973052978516, "global_step": 117432, "epoch": 2796} {"train_loss": -6.637104511260986, "global_step": 117433, "epoch": 2796} {"train_loss": -6.469927787780762, "global_step": 117434, "epoch": 2796} {"train_loss": -6.598311424255371, "global_step": 117435, "epoch": 2796} {"train_loss": -6.571957588195801, "global_step": 117436, "epoch": 2796} {"train_loss": -6.533180236816406, "global_step": 117437, "epoch": 2796} {"train_loss": -6.48923397064209, "global_step": 117438, "epoch": 2796} {"train_loss": -6.530278205871582, "global_step": 117439, "epoch": 2796} {"train_loss": -6.567014217376709, "global_step": 117440, "epoch": 2796} {"train_loss": -6.536342620849609, "global_step": 117441, "epoch": 2796} {"train_loss": -6.635753631591797, "global_step": 117442, "epoch": 2796} {"train_loss": -6.503574371337891, "global_step": 117443, "epoch": 2796} {"train_loss": -6.493013858795166, "global_step": 117444, "epoch": 2796} {"train_loss": -6.500090599060059, "global_step": 117445, "epoch": 2796} {"train_loss": -6.638125419616699, "global_step": 117446, "epoch": 2796} {"train_loss": -6.483633995056152, "global_step": 117447, "epoch": 2796} {"train_loss": -6.605875015258789, "global_step": 117448, "epoch": 2796} {"train_loss": -6.48404598236084, "global_step": 117449, "epoch": 2796} {"train_loss": -6.501924514770508, "global_step": 117450, "epoch": 2796} {"train_loss": -6.553865432739258, "global_step": 117451, "epoch": 2796} {"train_loss": -6.419759750366211, "global_step": 117452, "epoch": 2796} {"train_loss": -6.539510726928711, "global_step": 117453, "epoch": 2796} {"train_loss": -6.397993087768555, "global_step": 117454, "epoch": 2796} {"train_loss": -6.52955436706543, "global_step": 117455, "epoch": 2796} {"train_loss": -6.471830368041992, "global_step": 117456, "epoch": 2796} {"train_loss": -6.544929504394531, "global_step": 117457, "epoch": 2796} {"train_loss": -6.493271827697754, "global_step": 117458, "epoch": 2796} {"train_loss": -6.600049018859863, "global_step": 117459, "epoch": 2796} {"train_loss": -6.548760890960693, "global_step": 117460, "epoch": 2796} {"train_loss": -6.413498401641846, "global_step": 117461, "epoch": 2796} {"train_loss": -6.479310989379883, "global_step": 117462, "epoch": 2796} {"train_loss": -6.537846565246582, "global_step": 117463, "epoch": 2796} {"train_loss": -6.497506141662598, "global_step": 117464, "epoch": 2796} {"train_loss": -6.474827289581299, "global_step": 117465, "epoch": 2796} {"train_loss": -6.625934600830078, "global_step": 117466, "epoch": 2796} {"train_loss": -6.328855514526367, "global_step": 117467, "epoch": 2796} {"train_loss": -6.5591888427734375, "global_step": 117468, "epoch": 2796} {"train_loss": -6.475320339202881, "global_step": 117469, "epoch": 2796} {"train_loss": -6.419437408447266, "global_step": 117470, "epoch": 2796} {"train_loss": -6.479995250701904, "global_step": 117471, "epoch": 2796} {"train_loss": -6.546903610229492, "global_step": 117472, "epoch": 2796} {"train_loss": -6.517692134493873, "global_step": 117473, "epoch": 2796, "val_loss": 76608.375} {"train_loss": -6.527137279510498, "global_step": 117474, "epoch": 2797} {"train_loss": -6.544559478759766, "global_step": 117475, "epoch": 2797} {"train_loss": -6.5887627601623535, "global_step": 117476, "epoch": 2797} {"train_loss": -6.498507499694824, "global_step": 117477, "epoch": 2797} {"train_loss": -6.553459167480469, "global_step": 117478, "epoch": 2797} {"train_loss": -6.447061538696289, "global_step": 117479, "epoch": 2797} {"train_loss": -6.470308303833008, "global_step": 117480, "epoch": 2797} {"train_loss": -6.420149803161621, "global_step": 117481, "epoch": 2797} {"train_loss": -6.499727249145508, "global_step": 117482, "epoch": 2797} {"train_loss": -6.515205383300781, "global_step": 117483, "epoch": 2797} {"train_loss": -6.439505577087402, "global_step": 117484, "epoch": 2797} {"train_loss": -6.557468414306641, "global_step": 117485, "epoch": 2797} {"train_loss": -6.406904220581055, "global_step": 117486, "epoch": 2797} {"train_loss": -6.365548133850098, "global_step": 117487, "epoch": 2797} {"train_loss": -6.542201042175293, "global_step": 117488, "epoch": 2797} {"train_loss": -6.543883800506592, "global_step": 117489, "epoch": 2797} {"train_loss": -6.473789691925049, "global_step": 117490, "epoch": 2797} {"train_loss": -6.554715156555176, "global_step": 117491, "epoch": 2797} {"train_loss": -6.559938430786133, "global_step": 117492, "epoch": 2797} {"train_loss": -6.578664779663086, "global_step": 117493, "epoch": 2797} {"train_loss": -6.517269611358643, "global_step": 117494, "epoch": 2797} {"train_loss": -6.454918384552002, "global_step": 117495, "epoch": 2797} {"train_loss": -6.45460319519043, "global_step": 117496, "epoch": 2797} {"train_loss": -6.598301410675049, "global_step": 117497, "epoch": 2797} {"train_loss": -6.489998817443848, "global_step": 117498, "epoch": 2797} {"train_loss": -6.376094818115234, "global_step": 117499, "epoch": 2797} {"train_loss": -6.421429634094238, "global_step": 117500, "epoch": 2797} {"train_loss": -6.50327730178833, "global_step": 117501, "epoch": 2797} {"train_loss": -6.393697738647461, "global_step": 117502, "epoch": 2797} {"train_loss": -6.599273681640625, "global_step": 117503, "epoch": 2797} {"train_loss": -6.459924697875977, "global_step": 117504, "epoch": 2797} {"train_loss": -6.433544158935547, "global_step": 117505, "epoch": 2797} {"train_loss": -6.59908390045166, "global_step": 117506, "epoch": 2797} {"train_loss": -6.622992038726807, "global_step": 117507, "epoch": 2797} {"train_loss": -6.585129261016846, "global_step": 117508, "epoch": 2797} {"train_loss": -6.6010332107543945, "global_step": 117509, "epoch": 2797} {"train_loss": -6.480118751525879, "global_step": 117510, "epoch": 2797} {"train_loss": -6.543798446655273, "global_step": 117511, "epoch": 2797} {"train_loss": -6.458518981933594, "global_step": 117512, "epoch": 2797} {"train_loss": -6.529569149017334, "global_step": 117513, "epoch": 2797} {"train_loss": -6.579463005065918, "global_step": 117514, "epoch": 2797} {"train_loss": -6.50561151050386, "global_step": 117515, "epoch": 2797, "val_loss": 76797.8203125} {"train_loss": -6.5614094734191895, "global_step": 117516, "epoch": 2798} {"train_loss": -6.4691009521484375, "global_step": 117517, "epoch": 2798} {"train_loss": -6.414517402648926, "global_step": 117518, "epoch": 2798} {"train_loss": -6.437822341918945, "global_step": 117519, "epoch": 2798} {"train_loss": -6.518745422363281, "global_step": 117520, "epoch": 2798} {"train_loss": -6.4052276611328125, "global_step": 117521, "epoch": 2798} {"train_loss": -6.47904634475708, "global_step": 117522, "epoch": 2798} {"train_loss": -6.468990325927734, "global_step": 117523, "epoch": 2798} {"train_loss": -6.434797763824463, "global_step": 117524, "epoch": 2798} {"train_loss": -6.391524791717529, "global_step": 117525, "epoch": 2798} {"train_loss": -6.443404197692871, "global_step": 117526, "epoch": 2798} {"train_loss": -6.5381622314453125, "global_step": 117527, "epoch": 2798} {"train_loss": -6.505344390869141, "global_step": 117528, "epoch": 2798} {"train_loss": -6.360839366912842, "global_step": 117529, "epoch": 2798} {"train_loss": -6.550054550170898, "global_step": 117530, "epoch": 2798} {"train_loss": -6.408868312835693, "global_step": 117531, "epoch": 2798} {"train_loss": -6.42869758605957, "global_step": 117532, "epoch": 2798} {"train_loss": -6.471069812774658, "global_step": 117533, "epoch": 2798} {"train_loss": -6.347824573516846, "global_step": 117534, "epoch": 2798} {"train_loss": -6.425224781036377, "global_step": 117535, "epoch": 2798} {"train_loss": -6.387683868408203, "global_step": 117536, "epoch": 2798} {"train_loss": -6.4505720138549805, "global_step": 117537, "epoch": 2798} {"train_loss": -6.457754135131836, "global_step": 117538, "epoch": 2798} {"train_loss": -6.345773696899414, "global_step": 117539, "epoch": 2798} {"train_loss": -6.487508773803711, "global_step": 117540, "epoch": 2798} {"train_loss": -6.519557476043701, "global_step": 117541, "epoch": 2798} {"train_loss": -6.562490940093994, "global_step": 117542, "epoch": 2798} {"train_loss": -6.5294318199157715, "global_step": 117543, "epoch": 2798} {"train_loss": -6.491334915161133, "global_step": 117544, "epoch": 2798} {"train_loss": -6.667966842651367, "global_step": 117545, "epoch": 2798} {"train_loss": -6.486377716064453, "global_step": 117546, "epoch": 2798} {"train_loss": -6.645866394042969, "global_step": 117547, "epoch": 2798} {"train_loss": -6.566802501678467, "global_step": 117548, "epoch": 2798} {"train_loss": -6.50498628616333, "global_step": 117549, "epoch": 2798} {"train_loss": -6.485276699066162, "global_step": 117550, "epoch": 2798} {"train_loss": -6.573042869567871, "global_step": 117551, "epoch": 2798} {"train_loss": -6.4959564208984375, "global_step": 117552, "epoch": 2798} {"train_loss": -6.570566177368164, "global_step": 117553, "epoch": 2798} {"train_loss": -6.643948078155518, "global_step": 117554, "epoch": 2798} {"train_loss": -6.475556373596191, "global_step": 117555, "epoch": 2798} {"train_loss": -6.562780380249023, "global_step": 117556, "epoch": 2798} {"train_loss": -6.489281904129755, "global_step": 117557, "epoch": 2798, "val_loss": 76881.6015625} {"train_loss": -6.471334934234619, "global_step": 117558, "epoch": 2799} {"train_loss": -6.614100456237793, "global_step": 117559, "epoch": 2799} {"train_loss": -6.481592178344727, "global_step": 117560, "epoch": 2799} {"train_loss": -6.4762282371521, "global_step": 117561, "epoch": 2799} {"train_loss": -6.714567184448242, "global_step": 117562, "epoch": 2799} {"train_loss": -6.430047988891602, "global_step": 117563, "epoch": 2799} {"train_loss": -6.561397552490234, "global_step": 117564, "epoch": 2799} {"train_loss": -6.5666351318359375, "global_step": 117565, "epoch": 2799} {"train_loss": -6.563432693481445, "global_step": 117566, "epoch": 2799} {"train_loss": -6.532419204711914, "global_step": 117567, "epoch": 2799} {"train_loss": -6.609963417053223, "global_step": 117568, "epoch": 2799} {"train_loss": -6.551849365234375, "global_step": 117569, "epoch": 2799} {"train_loss": -6.574215888977051, "global_step": 117570, "epoch": 2799} {"train_loss": -6.536763668060303, "global_step": 117571, "epoch": 2799} {"train_loss": -6.627708435058594, "global_step": 117572, "epoch": 2799} {"train_loss": -6.665725231170654, "global_step": 117573, "epoch": 2799} {"train_loss": -6.678357124328613, "global_step": 117574, "epoch": 2799} {"train_loss": -6.601986885070801, "global_step": 117575, "epoch": 2799} {"train_loss": -6.4653778076171875, "global_step": 117576, "epoch": 2799} {"train_loss": -6.513757228851318, "global_step": 117577, "epoch": 2799} {"train_loss": -6.631913661956787, "global_step": 117578, "epoch": 2799} {"train_loss": -6.680728435516357, "global_step": 117579, "epoch": 2799} {"train_loss": -6.603511333465576, "global_step": 117580, "epoch": 2799} {"train_loss": -6.501706123352051, "global_step": 117581, "epoch": 2799} {"train_loss": -6.549684524536133, "global_step": 117582, "epoch": 2799} {"train_loss": -6.635615825653076, "global_step": 117583, "epoch": 2799} {"train_loss": -6.572554588317871, "global_step": 117584, "epoch": 2799} {"train_loss": -6.613654136657715, "global_step": 117585, "epoch": 2799} {"train_loss": -6.648162364959717, "global_step": 117586, "epoch": 2799} {"train_loss": -6.529790878295898, "global_step": 117587, "epoch": 2799} {"train_loss": -6.58917760848999, "global_step": 117588, "epoch": 2799} {"train_loss": -6.546902179718018, "global_step": 117589, "epoch": 2799} {"train_loss": -6.614350318908691, "global_step": 117590, "epoch": 2799} {"train_loss": -6.591507911682129, "global_step": 117591, "epoch": 2799} {"train_loss": -6.4632158279418945, "global_step": 117592, "epoch": 2799} {"train_loss": -6.629090309143066, "global_step": 117593, "epoch": 2799} {"train_loss": -6.612022399902344, "global_step": 117594, "epoch": 2799} {"train_loss": -6.4813456535339355, "global_step": 117595, "epoch": 2799} {"train_loss": -6.482251167297363, "global_step": 117596, "epoch": 2799} {"train_loss": -6.346050262451172, "global_step": 117597, "epoch": 2799} {"train_loss": -6.609999656677246, "global_step": 117598, "epoch": 2799} {"train_loss": -6.5609238261268255, "global_step": 117599, "epoch": 2799, "val_loss": 76590.0078125} {"train_loss": -6.386957168579102, "global_step": 117600, "epoch": 2800} {"train_loss": -6.620960235595703, "global_step": 117601, "epoch": 2800} {"train_loss": -6.369075775146484, "global_step": 117602, "epoch": 2800} {"train_loss": -6.486682891845703, "global_step": 117603, "epoch": 2800} {"train_loss": -6.239952087402344, "global_step": 117604, "epoch": 2800} {"train_loss": -6.371318340301514, "global_step": 117605, "epoch": 2800} {"train_loss": -6.476802349090576, "global_step": 117606, "epoch": 2800} {"train_loss": -6.409669876098633, "global_step": 117607, "epoch": 2800} {"train_loss": -6.483546257019043, "global_step": 117608, "epoch": 2800} {"train_loss": -6.350351810455322, "global_step": 117609, "epoch": 2800} {"train_loss": -6.5092644691467285, "global_step": 117610, "epoch": 2800} {"train_loss": -6.403446197509766, "global_step": 117611, "epoch": 2800} {"train_loss": -6.399170875549316, "global_step": 117612, "epoch": 2800} {"train_loss": -6.466684341430664, "global_step": 117613, "epoch": 2800} {"train_loss": -6.5419921875, "global_step": 117614, "epoch": 2800} {"train_loss": -6.521262168884277, "global_step": 117615, "epoch": 2800} {"train_loss": -6.5129714012146, "global_step": 117616, "epoch": 2800} {"train_loss": -6.481194496154785, "global_step": 117617, "epoch": 2800} {"train_loss": -6.565186977386475, "global_step": 117618, "epoch": 2800} {"train_loss": -6.636227130889893, "global_step": 117619, "epoch": 2800} {"train_loss": -6.512887001037598, "global_step": 117620, "epoch": 2800} {"train_loss": -6.529990196228027, "global_step": 117621, "epoch": 2800} {"train_loss": -6.620663642883301, "global_step": 117622, "epoch": 2800} {"train_loss": -6.55040168762207, "global_step": 117623, "epoch": 2800} {"train_loss": -6.567389488220215, "global_step": 117624, "epoch": 2800} {"train_loss": -6.464177131652832, "global_step": 117625, "epoch": 2800} {"train_loss": -6.575375556945801, "global_step": 117626, "epoch": 2800} {"train_loss": -6.515315532684326, "global_step": 117627, "epoch": 2800} {"train_loss": -6.644474983215332, "global_step": 117628, "epoch": 2800} {"train_loss": -6.662117004394531, "global_step": 117629, "epoch": 2800} {"train_loss": -6.553227424621582, "global_step": 117630, "epoch": 2800} {"train_loss": -6.494603157043457, "global_step": 117631, "epoch": 2800} {"train_loss": -6.510923385620117, "global_step": 117632, "epoch": 2800} {"train_loss": -6.532975196838379, "global_step": 117633, "epoch": 2800} {"train_loss": -6.576569557189941, "global_step": 117634, "epoch": 2800} {"train_loss": -6.464479446411133, "global_step": 117635, "epoch": 2800} {"train_loss": -6.575777053833008, "global_step": 117636, "epoch": 2800} {"train_loss": -6.503695964813232, "global_step": 117637, "epoch": 2800} {"train_loss": -6.475412368774414, "global_step": 117638, "epoch": 2800} {"train_loss": -6.5400543212890625, "global_step": 117639, "epoch": 2800} {"train_loss": -6.590307235717773, "global_step": 117640, "epoch": 2800} {"train_loss": -6.505162159601848, "global_step": 117641, "epoch": 2800, "train/sim_max_reward_0": 0.8742667172771135, "train/sim_max_reward_1": 0.3043786982042404, "train/sim_max_reward_2": 0.31062019649653, "train/sim_max_reward_3": 0.14902706462779025, "train/sim_max_reward_4": 0.9780783534289422, "train/sim_max_reward_5": 0.9174535650281443, "test/sim_max_reward_4500000": 0.8926244067813496, "test/sim_max_reward_4500001": 0.9210306883382378, "test/sim_max_reward_4500002": 0.9199822729218737, "test/sim_max_reward_4500003": 0.8631734092237197, "test/sim_max_reward_4500004": 0.7874159968306068, "test/sim_max_reward_4500005": 0.3086657540678562, "test/sim_max_reward_4500006": 0.933818898707249, "test/sim_max_reward_4500007": 0.8458180533775118, "test/sim_max_reward_4500008": 0.9193879304973457, "test/sim_max_reward_4500009": 0.05357141661865009, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.7538394777245059, "test/sim_max_reward_4500012": 0.6807926135618821, "test/sim_max_reward_4500013": 0.011918859014675294, "test/sim_max_reward_4500014": 0.376862388782688, "test/sim_max_reward_4500015": 0.9368482633741759, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.31577224452814723, "test/sim_max_reward_4500018": 0.5962490468144848, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.9251217252851133, "test/sim_max_reward_4500023": 0.924010287352701, "test/sim_max_reward_4500024": 0.8817721207106265, "test/sim_max_reward_4500025": 0.681130793539384, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.9934366951182826, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.07352277127105501, "test/sim_max_reward_4500030": 0.926427408151534, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.056404729321481994, "test/sim_max_reward_4500033": 0.9457503636643716, "test/sim_max_reward_4500034": 0.8606140645288385, "test/sim_max_reward_4500035": 0.6836890685148135, "test/sim_max_reward_4500036": 0.973198996490795, "test/sim_max_reward_4500037": 0.8561184752103699, "test/sim_max_reward_4500038": 0.32718561112403366, "test/sim_max_reward_4500039": 0.957097347747731, "test/sim_max_reward_4500040": 0.9984084711979119, "test/sim_max_reward_4500041": 0.9317007512905421, "test/sim_max_reward_4500042": 0.01690775946687206, "test/sim_max_reward_4500043": 0.1687342958780495, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.7944815865165412, "test/sim_max_reward_4500046": 0.8180720614298582, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.8692148712065116, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5889707658437935, "test/mean_score": 0.5801786648426746, "val_loss": 76862.484375} {"train_loss": -6.512542724609375, "global_step": 117642, "epoch": 2801} {"train_loss": -6.513601303100586, "global_step": 117643, "epoch": 2801} {"train_loss": -6.579588413238525, "global_step": 117644, "epoch": 2801} {"train_loss": -6.633493423461914, "global_step": 117645, "epoch": 2801} {"train_loss": -6.4839348793029785, "global_step": 117646, "epoch": 2801} {"train_loss": -6.3979949951171875, "global_step": 117647, "epoch": 2801} {"train_loss": -6.435425758361816, "global_step": 117648, "epoch": 2801} {"train_loss": -6.554286003112793, "global_step": 117649, "epoch": 2801} {"train_loss": -6.546863555908203, "global_step": 117650, "epoch": 2801} {"train_loss": -6.396625995635986, "global_step": 117651, "epoch": 2801} {"train_loss": -6.571846008300781, "global_step": 117652, "epoch": 2801} {"train_loss": -6.180688381195068, "global_step": 117653, "epoch": 2801} {"train_loss": -6.416073799133301, "global_step": 117654, "epoch": 2801} {"train_loss": -6.3518877029418945, "global_step": 117655, "epoch": 2801} {"train_loss": -6.388202667236328, "global_step": 117656, "epoch": 2801} {"train_loss": -6.364081382751465, "global_step": 117657, "epoch": 2801} {"train_loss": -6.311962604522705, "global_step": 117658, "epoch": 2801} {"train_loss": -6.257901191711426, "global_step": 117659, "epoch": 2801} {"train_loss": -6.419844627380371, "global_step": 117660, "epoch": 2801} {"train_loss": -6.363760948181152, "global_step": 117661, "epoch": 2801} {"train_loss": -6.384542465209961, "global_step": 117662, "epoch": 2801} {"train_loss": -6.378612995147705, "global_step": 117663, "epoch": 2801} {"train_loss": -6.412993431091309, "global_step": 117664, "epoch": 2801} {"train_loss": -6.51218843460083, "global_step": 117665, "epoch": 2801} {"train_loss": -6.393895149230957, "global_step": 117666, "epoch": 2801} {"train_loss": -6.378282070159912, "global_step": 117667, "epoch": 2801} {"train_loss": -6.438271522521973, "global_step": 117668, "epoch": 2801} {"train_loss": -6.534562110900879, "global_step": 117669, "epoch": 2801} {"train_loss": -6.473231792449951, "global_step": 117670, "epoch": 2801} {"train_loss": -6.42653751373291, "global_step": 117671, "epoch": 2801} {"train_loss": -6.591543197631836, "global_step": 117672, "epoch": 2801} {"train_loss": -6.467078685760498, "global_step": 117673, "epoch": 2801} {"train_loss": -6.540626525878906, "global_step": 117674, "epoch": 2801} {"train_loss": -6.6112470626831055, "global_step": 117675, "epoch": 2801} {"train_loss": -6.4812092781066895, "global_step": 117676, "epoch": 2801} {"train_loss": -6.6077775955200195, "global_step": 117677, "epoch": 2801} {"train_loss": -6.5229597091674805, "global_step": 117678, "epoch": 2801} {"train_loss": -6.486437797546387, "global_step": 117679, "epoch": 2801} {"train_loss": -6.535172462463379, "global_step": 117680, "epoch": 2801} {"train_loss": -6.644219398498535, "global_step": 117681, "epoch": 2801} {"train_loss": -6.637718200683594, "global_step": 117682, "epoch": 2801} {"train_loss": -6.468777951740083, "global_step": 117683, "epoch": 2801, "val_loss": 76877.7265625} {"train_loss": -6.527588844299316, "global_step": 117684, "epoch": 2802} {"train_loss": -6.63374137878418, "global_step": 117685, "epoch": 2802} {"train_loss": -6.535636901855469, "global_step": 117686, "epoch": 2802} {"train_loss": -6.530649185180664, "global_step": 117687, "epoch": 2802} {"train_loss": -6.525440692901611, "global_step": 117688, "epoch": 2802} {"train_loss": -6.492347240447998, "global_step": 117689, "epoch": 2802} {"train_loss": -6.588712215423584, "global_step": 117690, "epoch": 2802} {"train_loss": -6.607597351074219, "global_step": 117691, "epoch": 2802} {"train_loss": -6.558923721313477, "global_step": 117692, "epoch": 2802} {"train_loss": -6.581867694854736, "global_step": 117693, "epoch": 2802} {"train_loss": -6.562590599060059, "global_step": 117694, "epoch": 2802} {"train_loss": -6.491789817810059, "global_step": 117695, "epoch": 2802} {"train_loss": -6.539859771728516, "global_step": 117696, "epoch": 2802} {"train_loss": -6.521573066711426, "global_step": 117697, "epoch": 2802} {"train_loss": -6.462120056152344, "global_step": 117698, "epoch": 2802} {"train_loss": -6.5411224365234375, "global_step": 117699, "epoch": 2802} {"train_loss": -6.55195426940918, "global_step": 117700, "epoch": 2802} {"train_loss": -6.590198040008545, "global_step": 117701, "epoch": 2802} {"train_loss": -6.485255241394043, "global_step": 117702, "epoch": 2802} {"train_loss": -6.601387023925781, "global_step": 117703, "epoch": 2802} {"train_loss": -6.602147102355957, "global_step": 117704, "epoch": 2802} {"train_loss": -6.499927043914795, "global_step": 117705, "epoch": 2802} {"train_loss": -6.566843032836914, "global_step": 117706, "epoch": 2802} {"train_loss": -6.642762184143066, "global_step": 117707, "epoch": 2802} {"train_loss": -6.619635581970215, "global_step": 117708, "epoch": 2802} {"train_loss": -6.432676315307617, "global_step": 117709, "epoch": 2802} {"train_loss": -6.623294830322266, "global_step": 117710, "epoch": 2802} {"train_loss": -6.629184722900391, "global_step": 117711, "epoch": 2802} {"train_loss": -6.399528980255127, "global_step": 117712, "epoch": 2802} {"train_loss": -6.498242378234863, "global_step": 117713, "epoch": 2802} {"train_loss": -6.461711883544922, "global_step": 117714, "epoch": 2802} {"train_loss": -6.620414733886719, "global_step": 117715, "epoch": 2802} {"train_loss": -6.519482612609863, "global_step": 117716, "epoch": 2802} {"train_loss": -6.559480667114258, "global_step": 117717, "epoch": 2802} {"train_loss": -6.53713321685791, "global_step": 117718, "epoch": 2802} {"train_loss": -6.62417459487915, "global_step": 117719, "epoch": 2802} {"train_loss": -6.473224639892578, "global_step": 117720, "epoch": 2802} {"train_loss": -6.566684722900391, "global_step": 117721, "epoch": 2802} {"train_loss": -6.520721435546875, "global_step": 117722, "epoch": 2802} {"train_loss": -6.676765441894531, "global_step": 117723, "epoch": 2802} {"train_loss": -6.663562774658203, "global_step": 117724, "epoch": 2802} {"train_loss": -6.553240401404245, "global_step": 117725, "epoch": 2802, "val_loss": 76741.8046875} {"train_loss": -6.5318756103515625, "global_step": 117726, "epoch": 2803} {"train_loss": -6.474647521972656, "global_step": 117727, "epoch": 2803} {"train_loss": -6.572121620178223, "global_step": 117728, "epoch": 2803} {"train_loss": -6.5820512771606445, "global_step": 117729, "epoch": 2803} {"train_loss": -6.48685359954834, "global_step": 117730, "epoch": 2803} {"train_loss": -6.550923824310303, "global_step": 117731, "epoch": 2803} {"train_loss": -6.474627494812012, "global_step": 117732, "epoch": 2803} {"train_loss": -6.587535381317139, "global_step": 117733, "epoch": 2803} {"train_loss": -6.614213943481445, "global_step": 117734, "epoch": 2803} {"train_loss": -6.615728378295898, "global_step": 117735, "epoch": 2803} {"train_loss": -6.545770168304443, "global_step": 117736, "epoch": 2803} {"train_loss": -6.489056587219238, "global_step": 117737, "epoch": 2803} {"train_loss": -6.48767614364624, "global_step": 117738, "epoch": 2803} {"train_loss": -6.583950042724609, "global_step": 117739, "epoch": 2803} {"train_loss": -6.595729827880859, "global_step": 117740, "epoch": 2803} {"train_loss": -6.376465797424316, "global_step": 117741, "epoch": 2803} {"train_loss": -6.526042938232422, "global_step": 117742, "epoch": 2803} {"train_loss": -6.348737716674805, "global_step": 117743, "epoch": 2803} {"train_loss": -6.535635948181152, "global_step": 117744, "epoch": 2803} {"train_loss": -6.402709007263184, "global_step": 117745, "epoch": 2803} {"train_loss": -6.508390426635742, "global_step": 117746, "epoch": 2803} {"train_loss": -6.459596633911133, "global_step": 117747, "epoch": 2803} {"train_loss": -6.5075531005859375, "global_step": 117748, "epoch": 2803} {"train_loss": -6.617801666259766, "global_step": 117749, "epoch": 2803} {"train_loss": -6.599884033203125, "global_step": 117750, "epoch": 2803} {"train_loss": -6.560606002807617, "global_step": 117751, "epoch": 2803} {"train_loss": -6.518052101135254, "global_step": 117752, "epoch": 2803} {"train_loss": -6.469778537750244, "global_step": 117753, "epoch": 2803} {"train_loss": -6.566950798034668, "global_step": 117754, "epoch": 2803} {"train_loss": -6.432057857513428, "global_step": 117755, "epoch": 2803} {"train_loss": -6.493085861206055, "global_step": 117756, "epoch": 2803} {"train_loss": -6.396443843841553, "global_step": 117757, "epoch": 2803} {"train_loss": -6.556143283843994, "global_step": 117758, "epoch": 2803} {"train_loss": -6.470452308654785, "global_step": 117759, "epoch": 2803} {"train_loss": -6.577376365661621, "global_step": 117760, "epoch": 2803} {"train_loss": -6.4872918128967285, "global_step": 117761, "epoch": 2803} {"train_loss": -6.524564743041992, "global_step": 117762, "epoch": 2803} {"train_loss": -6.5614752769470215, "global_step": 117763, "epoch": 2803} {"train_loss": -6.527613639831543, "global_step": 117764, "epoch": 2803} {"train_loss": -6.482028961181641, "global_step": 117765, "epoch": 2803} {"train_loss": -6.713505744934082, "global_step": 117766, "epoch": 2803} {"train_loss": -6.522076379685175, "global_step": 117767, "epoch": 2803, "val_loss": 76725.765625} {"train_loss": -6.514248847961426, "global_step": 117768, "epoch": 2804} {"train_loss": -6.731504440307617, "global_step": 117769, "epoch": 2804} {"train_loss": -6.507933139801025, "global_step": 117770, "epoch": 2804} {"train_loss": -6.429114818572998, "global_step": 117771, "epoch": 2804} {"train_loss": -6.728310585021973, "global_step": 117772, "epoch": 2804} {"train_loss": -6.441986560821533, "global_step": 117773, "epoch": 2804} {"train_loss": -6.578453540802002, "global_step": 117774, "epoch": 2804} {"train_loss": -6.536036968231201, "global_step": 117775, "epoch": 2804} {"train_loss": -6.525491714477539, "global_step": 117776, "epoch": 2804} {"train_loss": -6.593502998352051, "global_step": 117777, "epoch": 2804} {"train_loss": -6.458414554595947, "global_step": 117778, "epoch": 2804} {"train_loss": -6.563481330871582, "global_step": 117779, "epoch": 2804} {"train_loss": -6.4992170333862305, "global_step": 117780, "epoch": 2804} {"train_loss": -6.609988212585449, "global_step": 117781, "epoch": 2804} {"train_loss": -6.625308036804199, "global_step": 117782, "epoch": 2804} {"train_loss": -6.5977325439453125, "global_step": 117783, "epoch": 2804} {"train_loss": -6.728087425231934, "global_step": 117784, "epoch": 2804} {"train_loss": -6.556546688079834, "global_step": 117785, "epoch": 2804} {"train_loss": -6.6030426025390625, "global_step": 117786, "epoch": 2804} {"train_loss": -6.643446922302246, "global_step": 117787, "epoch": 2804} {"train_loss": -6.670527458190918, "global_step": 117788, "epoch": 2804} {"train_loss": -6.676050186157227, "global_step": 117789, "epoch": 2804} {"train_loss": -6.600538730621338, "global_step": 117790, "epoch": 2804} {"train_loss": -6.537721633911133, "global_step": 117791, "epoch": 2804} {"train_loss": -6.413612365722656, "global_step": 117792, "epoch": 2804} {"train_loss": -6.657908916473389, "global_step": 117793, "epoch": 2804} {"train_loss": -6.489884853363037, "global_step": 117794, "epoch": 2804} {"train_loss": -6.539799690246582, "global_step": 117795, "epoch": 2804} {"train_loss": -6.5746331214904785, "global_step": 117796, "epoch": 2804} {"train_loss": -6.562066555023193, "global_step": 117797, "epoch": 2804} {"train_loss": -6.634659290313721, "global_step": 117798, "epoch": 2804} {"train_loss": -6.600973129272461, "global_step": 117799, "epoch": 2804} {"train_loss": -6.5608906745910645, "global_step": 117800, "epoch": 2804} {"train_loss": -6.5822248458862305, "global_step": 117801, "epoch": 2804} {"train_loss": -6.591567516326904, "global_step": 117802, "epoch": 2804} {"train_loss": -6.65914249420166, "global_step": 117803, "epoch": 2804} {"train_loss": -6.5195841789245605, "global_step": 117804, "epoch": 2804} {"train_loss": -6.515061378479004, "global_step": 117805, "epoch": 2804} {"train_loss": -6.561251163482666, "global_step": 117806, "epoch": 2804} {"train_loss": -6.610230445861816, "global_step": 117807, "epoch": 2804} {"train_loss": -6.469969749450684, "global_step": 117808, "epoch": 2804} {"train_loss": -6.573086704526629, "global_step": 117809, "epoch": 2804, "val_loss": 77003.4453125} {"train_loss": -6.6234283447265625, "global_step": 117810, "epoch": 2805} {"train_loss": -6.564253330230713, "global_step": 117811, "epoch": 2805} {"train_loss": -6.574622631072998, "global_step": 117812, "epoch": 2805} {"train_loss": -6.519499778747559, "global_step": 117813, "epoch": 2805} {"train_loss": -6.4872307777404785, "global_step": 117814, "epoch": 2805} {"train_loss": -6.385631561279297, "global_step": 117815, "epoch": 2805} {"train_loss": -6.450687885284424, "global_step": 117816, "epoch": 2805} {"train_loss": -6.51024866104126, "global_step": 117817, "epoch": 2805} {"train_loss": -6.440587520599365, "global_step": 117818, "epoch": 2805} {"train_loss": -6.4857683181762695, "global_step": 117819, "epoch": 2805} {"train_loss": -6.433078765869141, "global_step": 117820, "epoch": 2805} {"train_loss": -6.358058452606201, "global_step": 117821, "epoch": 2805} {"train_loss": -6.465069770812988, "global_step": 117822, "epoch": 2805} {"train_loss": -6.3438801765441895, "global_step": 117823, "epoch": 2805} {"train_loss": -6.465157985687256, "global_step": 117824, "epoch": 2805} {"train_loss": -6.4170966148376465, "global_step": 117825, "epoch": 2805} {"train_loss": -6.296422481536865, "global_step": 117826, "epoch": 2805} {"train_loss": -6.533462047576904, "global_step": 117827, "epoch": 2805} {"train_loss": -6.428807258605957, "global_step": 117828, "epoch": 2805} {"train_loss": -6.4543256759643555, "global_step": 117829, "epoch": 2805} {"train_loss": -6.4357194900512695, "global_step": 117830, "epoch": 2805} {"train_loss": -6.450645923614502, "global_step": 117831, "epoch": 2805} {"train_loss": -6.357105255126953, "global_step": 117832, "epoch": 2805} {"train_loss": -6.439329147338867, "global_step": 117833, "epoch": 2805} {"train_loss": -6.520633697509766, "global_step": 117834, "epoch": 2805} {"train_loss": -6.581022262573242, "global_step": 117835, "epoch": 2805} {"train_loss": -6.478989124298096, "global_step": 117836, "epoch": 2805} {"train_loss": -6.5960798263549805, "global_step": 117837, "epoch": 2805} {"train_loss": -6.495621204376221, "global_step": 117838, "epoch": 2805} {"train_loss": -6.386369705200195, "global_step": 117839, "epoch": 2805} {"train_loss": -6.519292831420898, "global_step": 117840, "epoch": 2805} {"train_loss": -6.565154075622559, "global_step": 117841, "epoch": 2805} {"train_loss": -6.593709945678711, "global_step": 117842, "epoch": 2805} {"train_loss": -6.513692855834961, "global_step": 117843, "epoch": 2805} {"train_loss": -6.507667541503906, "global_step": 117844, "epoch": 2805} {"train_loss": -6.650969505310059, "global_step": 117845, "epoch": 2805} {"train_loss": -6.551249027252197, "global_step": 117846, "epoch": 2805} {"train_loss": -6.568572998046875, "global_step": 117847, "epoch": 2805} {"train_loss": -6.530092239379883, "global_step": 117848, "epoch": 2805} {"train_loss": -6.474809646606445, "global_step": 117849, "epoch": 2805} {"train_loss": -6.623943328857422, "global_step": 117850, "epoch": 2805} {"train_loss": -6.493819021043324, "global_step": 117851, "epoch": 2805, "val_loss": 76771.53125} {"train_loss": -6.515154838562012, "global_step": 117852, "epoch": 2806} {"train_loss": -6.489039421081543, "global_step": 117853, "epoch": 2806} {"train_loss": -6.474935531616211, "global_step": 117854, "epoch": 2806} {"train_loss": -6.564020156860352, "global_step": 117855, "epoch": 2806} {"train_loss": -6.527401924133301, "global_step": 117856, "epoch": 2806} {"train_loss": -6.532662391662598, "global_step": 117857, "epoch": 2806} {"train_loss": -6.669099807739258, "global_step": 117858, "epoch": 2806} {"train_loss": -6.667542934417725, "global_step": 117859, "epoch": 2806} {"train_loss": -6.573489665985107, "global_step": 117860, "epoch": 2806} {"train_loss": -6.541804790496826, "global_step": 117861, "epoch": 2806} {"train_loss": -6.486983299255371, "global_step": 117862, "epoch": 2806} {"train_loss": -6.59798526763916, "global_step": 117863, "epoch": 2806} {"train_loss": -6.65866231918335, "global_step": 117864, "epoch": 2806} {"train_loss": -6.506706237792969, "global_step": 117865, "epoch": 2806} {"train_loss": -6.583146572113037, "global_step": 117866, "epoch": 2806} {"train_loss": -6.439908027648926, "global_step": 117867, "epoch": 2806} {"train_loss": -6.416694164276123, "global_step": 117868, "epoch": 2806} {"train_loss": -6.651185512542725, "global_step": 117869, "epoch": 2806} {"train_loss": -6.543041229248047, "global_step": 117870, "epoch": 2806} {"train_loss": -6.519060134887695, "global_step": 117871, "epoch": 2806} {"train_loss": -6.561531066894531, "global_step": 117872, "epoch": 2806} {"train_loss": -6.624740123748779, "global_step": 117873, "epoch": 2806} {"train_loss": -6.570662498474121, "global_step": 117874, "epoch": 2806} {"train_loss": -6.550726890563965, "global_step": 117875, "epoch": 2806} {"train_loss": -6.54283332824707, "global_step": 117876, "epoch": 2806} {"train_loss": -6.594318389892578, "global_step": 117877, "epoch": 2806} {"train_loss": -6.564416885375977, "global_step": 117878, "epoch": 2806} {"train_loss": -6.6739959716796875, "global_step": 117879, "epoch": 2806} {"train_loss": -6.713173866271973, "global_step": 117880, "epoch": 2806} {"train_loss": -6.627783298492432, "global_step": 117881, "epoch": 2806} {"train_loss": -6.628843784332275, "global_step": 117882, "epoch": 2806} {"train_loss": -6.66023063659668, "global_step": 117883, "epoch": 2806} {"train_loss": -6.529149532318115, "global_step": 117884, "epoch": 2806} {"train_loss": -6.479369163513184, "global_step": 117885, "epoch": 2806} {"train_loss": -6.704513072967529, "global_step": 117886, "epoch": 2806} {"train_loss": -6.687039375305176, "global_step": 117887, "epoch": 2806} {"train_loss": -6.4615583419799805, "global_step": 117888, "epoch": 2806} {"train_loss": -6.592425346374512, "global_step": 117889, "epoch": 2806} {"train_loss": -6.509159088134766, "global_step": 117890, "epoch": 2806} {"train_loss": -6.4919586181640625, "global_step": 117891, "epoch": 2806} {"train_loss": -6.574556827545166, "global_step": 117892, "epoch": 2806} {"train_loss": -6.56806130636306, "global_step": 117893, "epoch": 2806, "val_loss": 76335.6484375} {"train_loss": -6.668405055999756, "global_step": 117894, "epoch": 2807} {"train_loss": -6.614080429077148, "global_step": 117895, "epoch": 2807} {"train_loss": -6.668279647827148, "global_step": 117896, "epoch": 2807} {"train_loss": -6.632965087890625, "global_step": 117897, "epoch": 2807} {"train_loss": -6.633171081542969, "global_step": 117898, "epoch": 2807} {"train_loss": -6.661479473114014, "global_step": 117899, "epoch": 2807} {"train_loss": -6.531064033508301, "global_step": 117900, "epoch": 2807} {"train_loss": -6.603152751922607, "global_step": 117901, "epoch": 2807} {"train_loss": -6.53853178024292, "global_step": 117902, "epoch": 2807} {"train_loss": -6.6579742431640625, "global_step": 117903, "epoch": 2807} {"train_loss": -6.560990810394287, "global_step": 117904, "epoch": 2807} {"train_loss": -6.5958051681518555, "global_step": 117905, "epoch": 2807} {"train_loss": -6.490832328796387, "global_step": 117906, "epoch": 2807} {"train_loss": -6.5435709953308105, "global_step": 117907, "epoch": 2807} {"train_loss": -6.589698791503906, "global_step": 117908, "epoch": 2807} {"train_loss": -6.621349811553955, "global_step": 117909, "epoch": 2807} {"train_loss": -6.543920516967773, "global_step": 117910, "epoch": 2807} {"train_loss": -6.530722141265869, "global_step": 117911, "epoch": 2807} {"train_loss": -6.657867908477783, "global_step": 117912, "epoch": 2807} {"train_loss": -6.525134086608887, "global_step": 117913, "epoch": 2807} {"train_loss": -6.577198028564453, "global_step": 117914, "epoch": 2807} {"train_loss": -6.63425874710083, "global_step": 117915, "epoch": 2807} {"train_loss": -6.578516006469727, "global_step": 117916, "epoch": 2807} {"train_loss": -6.5743088722229, "global_step": 117917, "epoch": 2807} {"train_loss": -6.537631988525391, "global_step": 117918, "epoch": 2807} {"train_loss": -6.637553691864014, "global_step": 117919, "epoch": 2807} {"train_loss": -6.659477710723877, "global_step": 117920, "epoch": 2807} {"train_loss": -6.648898601531982, "global_step": 117921, "epoch": 2807} {"train_loss": -6.623529434204102, "global_step": 117922, "epoch": 2807} {"train_loss": -6.550521373748779, "global_step": 117923, "epoch": 2807} {"train_loss": -6.502495765686035, "global_step": 117924, "epoch": 2807} {"train_loss": -6.4364423751831055, "global_step": 117925, "epoch": 2807} {"train_loss": -6.5642313957214355, "global_step": 117926, "epoch": 2807} {"train_loss": -6.582754135131836, "global_step": 117927, "epoch": 2807} {"train_loss": -6.536389350891113, "global_step": 117928, "epoch": 2807} {"train_loss": -6.478086471557617, "global_step": 117929, "epoch": 2807} {"train_loss": -6.511577606201172, "global_step": 117930, "epoch": 2807} {"train_loss": -6.638222694396973, "global_step": 117931, "epoch": 2807} {"train_loss": -6.528560638427734, "global_step": 117932, "epoch": 2807} {"train_loss": -6.586264610290527, "global_step": 117933, "epoch": 2807} {"train_loss": -6.528590202331543, "global_step": 117934, "epoch": 2807} {"train_loss": -6.577840963999431, "global_step": 117935, "epoch": 2807, "val_loss": 76961.125} {"train_loss": -6.665562629699707, "global_step": 117936, "epoch": 2808} {"train_loss": -6.543610572814941, "global_step": 117937, "epoch": 2808} {"train_loss": -6.544939994812012, "global_step": 117938, "epoch": 2808} {"train_loss": -6.558854103088379, "global_step": 117939, "epoch": 2808} {"train_loss": -6.605299949645996, "global_step": 117940, "epoch": 2808} {"train_loss": -6.616761684417725, "global_step": 117941, "epoch": 2808} {"train_loss": -6.502701759338379, "global_step": 117942, "epoch": 2808} {"train_loss": -6.550282001495361, "global_step": 117943, "epoch": 2808} {"train_loss": -6.524186611175537, "global_step": 117944, "epoch": 2808} {"train_loss": -6.653722763061523, "global_step": 117945, "epoch": 2808} {"train_loss": -6.657844543457031, "global_step": 117946, "epoch": 2808} {"train_loss": -6.501703262329102, "global_step": 117947, "epoch": 2808} {"train_loss": -6.622920989990234, "global_step": 117948, "epoch": 2808} {"train_loss": -6.516420364379883, "global_step": 117949, "epoch": 2808} {"train_loss": -6.530600547790527, "global_step": 117950, "epoch": 2808} {"train_loss": -6.558659553527832, "global_step": 117951, "epoch": 2808} {"train_loss": -6.4986677169799805, "global_step": 117952, "epoch": 2808} {"train_loss": -6.525582313537598, "global_step": 117953, "epoch": 2808} {"train_loss": -6.612193584442139, "global_step": 117954, "epoch": 2808} {"train_loss": -6.665090560913086, "global_step": 117955, "epoch": 2808} {"train_loss": -6.6174702644348145, "global_step": 117956, "epoch": 2808} {"train_loss": -6.549261093139648, "global_step": 117957, "epoch": 2808} {"train_loss": -6.557052135467529, "global_step": 117958, "epoch": 2808} {"train_loss": -6.460296630859375, "global_step": 117959, "epoch": 2808} {"train_loss": -6.5550217628479, "global_step": 117960, "epoch": 2808} {"train_loss": -6.457364559173584, "global_step": 117961, "epoch": 2808} {"train_loss": -6.502641677856445, "global_step": 117962, "epoch": 2808} {"train_loss": -6.467254638671875, "global_step": 117963, "epoch": 2808} {"train_loss": -6.6477556228637695, "global_step": 117964, "epoch": 2808} {"train_loss": -6.460859298706055, "global_step": 117965, "epoch": 2808} {"train_loss": -6.547005653381348, "global_step": 117966, "epoch": 2808} {"train_loss": -6.544058799743652, "global_step": 117967, "epoch": 2808} {"train_loss": -6.521702766418457, "global_step": 117968, "epoch": 2808} {"train_loss": -6.524827003479004, "global_step": 117969, "epoch": 2808} {"train_loss": -6.307797431945801, "global_step": 117970, "epoch": 2808} {"train_loss": -6.408117771148682, "global_step": 117971, "epoch": 2808} {"train_loss": -6.590007781982422, "global_step": 117972, "epoch": 2808} {"train_loss": -6.526923179626465, "global_step": 117973, "epoch": 2808} {"train_loss": -6.477710723876953, "global_step": 117974, "epoch": 2808} {"train_loss": -6.420210838317871, "global_step": 117975, "epoch": 2808} {"train_loss": -6.619324207305908, "global_step": 117976, "epoch": 2808} {"train_loss": -6.543205953779674, "global_step": 117977, "epoch": 2808, "val_loss": 77046.375} {"train_loss": -6.538072109222412, "global_step": 117978, "epoch": 2809} {"train_loss": -6.572960376739502, "global_step": 117979, "epoch": 2809} {"train_loss": -6.516785144805908, "global_step": 117980, "epoch": 2809} {"train_loss": -6.593706130981445, "global_step": 117981, "epoch": 2809} {"train_loss": -6.52999210357666, "global_step": 117982, "epoch": 2809} {"train_loss": -6.621294021606445, "global_step": 117983, "epoch": 2809} {"train_loss": -6.476894378662109, "global_step": 117984, "epoch": 2809} {"train_loss": -6.546744346618652, "global_step": 117985, "epoch": 2809} {"train_loss": -6.619311332702637, "global_step": 117986, "epoch": 2809} {"train_loss": -6.422232151031494, "global_step": 117987, "epoch": 2809} {"train_loss": -6.541879177093506, "global_step": 117988, "epoch": 2809} {"train_loss": -6.495908737182617, "global_step": 117989, "epoch": 2809} {"train_loss": -6.456830024719238, "global_step": 117990, "epoch": 2809} {"train_loss": -6.520860195159912, "global_step": 117991, "epoch": 2809} {"train_loss": -6.486254692077637, "global_step": 117992, "epoch": 2809} {"train_loss": -6.540924072265625, "global_step": 117993, "epoch": 2809} {"train_loss": -6.606729030609131, "global_step": 117994, "epoch": 2809} {"train_loss": -6.6228790283203125, "global_step": 117995, "epoch": 2809} {"train_loss": -6.576779365539551, "global_step": 117996, "epoch": 2809} {"train_loss": -6.53062105178833, "global_step": 117997, "epoch": 2809} {"train_loss": -6.561497688293457, "global_step": 117998, "epoch": 2809} {"train_loss": -6.591938495635986, "global_step": 117999, "epoch": 2809} {"train_loss": -6.54946231842041, "global_step": 118000, "epoch": 2809} {"train_loss": -6.543607711791992, "global_step": 118001, "epoch": 2809} {"train_loss": -6.571523666381836, "global_step": 118002, "epoch": 2809} {"train_loss": -6.581280708312988, "global_step": 118003, "epoch": 2809} {"train_loss": -6.41747522354126, "global_step": 118004, "epoch": 2809} {"train_loss": -6.549381256103516, "global_step": 118005, "epoch": 2809} {"train_loss": -6.533088684082031, "global_step": 118006, "epoch": 2809} {"train_loss": -6.536320209503174, "global_step": 118007, "epoch": 2809} {"train_loss": -6.493983745574951, "global_step": 118008, "epoch": 2809} {"train_loss": -6.5134477615356445, "global_step": 118009, "epoch": 2809} {"train_loss": -6.490079879760742, "global_step": 118010, "epoch": 2809} {"train_loss": -6.4235076904296875, "global_step": 118011, "epoch": 2809} {"train_loss": -6.604772567749023, "global_step": 118012, "epoch": 2809} {"train_loss": -6.269815921783447, "global_step": 118013, "epoch": 2809} {"train_loss": -6.518056869506836, "global_step": 118014, "epoch": 2809} {"train_loss": -6.410045623779297, "global_step": 118015, "epoch": 2809} {"train_loss": -6.4718756675720215, "global_step": 118016, "epoch": 2809} {"train_loss": -6.515988349914551, "global_step": 118017, "epoch": 2809} {"train_loss": -6.41008186340332, "global_step": 118018, "epoch": 2809} {"train_loss": -6.520903280803135, "global_step": 118019, "epoch": 2809, "val_loss": 77389.4609375} {"train_loss": -6.264649868011475, "global_step": 118020, "epoch": 2810} {"train_loss": -6.534876346588135, "global_step": 118021, "epoch": 2810} {"train_loss": -6.388747215270996, "global_step": 118022, "epoch": 2810} {"train_loss": -6.523932456970215, "global_step": 118023, "epoch": 2810} {"train_loss": -6.500947952270508, "global_step": 118024, "epoch": 2810} {"train_loss": -6.425178527832031, "global_step": 118025, "epoch": 2810} {"train_loss": -6.552580833435059, "global_step": 118026, "epoch": 2810} {"train_loss": -6.383238792419434, "global_step": 118027, "epoch": 2810} {"train_loss": -6.590039253234863, "global_step": 118028, "epoch": 2810} {"train_loss": -6.431271553039551, "global_step": 118029, "epoch": 2810} {"train_loss": -6.556299209594727, "global_step": 118030, "epoch": 2810} {"train_loss": -6.674074649810791, "global_step": 118031, "epoch": 2810} {"train_loss": -6.539556503295898, "global_step": 118032, "epoch": 2810} {"train_loss": -6.569206714630127, "global_step": 118033, "epoch": 2810} {"train_loss": -6.540599822998047, "global_step": 118034, "epoch": 2810} {"train_loss": -6.531110763549805, "global_step": 118035, "epoch": 2810} {"train_loss": -6.564695358276367, "global_step": 118036, "epoch": 2810} {"train_loss": -6.528894424438477, "global_step": 118037, "epoch": 2810} {"train_loss": -6.613747596740723, "global_step": 118038, "epoch": 2810} {"train_loss": -6.542128562927246, "global_step": 118039, "epoch": 2810} {"train_loss": -6.701541423797607, "global_step": 118040, "epoch": 2810} {"train_loss": -6.593524932861328, "global_step": 118041, "epoch": 2810} {"train_loss": -6.535768508911133, "global_step": 118042, "epoch": 2810} {"train_loss": -6.5658392906188965, "global_step": 118043, "epoch": 2810} {"train_loss": -6.543910980224609, "global_step": 118044, "epoch": 2810} {"train_loss": -6.546332836151123, "global_step": 118045, "epoch": 2810} {"train_loss": -6.615838050842285, "global_step": 118046, "epoch": 2810} {"train_loss": -6.616779327392578, "global_step": 118047, "epoch": 2810} {"train_loss": -6.559334754943848, "global_step": 118048, "epoch": 2810} {"train_loss": -6.570793628692627, "global_step": 118049, "epoch": 2810} {"train_loss": -6.560074806213379, "global_step": 118050, "epoch": 2810} {"train_loss": -6.615715026855469, "global_step": 118051, "epoch": 2810} {"train_loss": -6.559260368347168, "global_step": 118052, "epoch": 2810} {"train_loss": -6.590609073638916, "global_step": 118053, "epoch": 2810} {"train_loss": -6.605706214904785, "global_step": 118054, "epoch": 2810} {"train_loss": -6.597538471221924, "global_step": 118055, "epoch": 2810} {"train_loss": -6.526289939880371, "global_step": 118056, "epoch": 2810} {"train_loss": -6.404663562774658, "global_step": 118057, "epoch": 2810} {"train_loss": -6.615283966064453, "global_step": 118058, "epoch": 2810} {"train_loss": -6.5661444664001465, "global_step": 118059, "epoch": 2810} {"train_loss": -6.627565383911133, "global_step": 118060, "epoch": 2810} {"train_loss": -6.545519669850667, "global_step": 118061, "epoch": 2810, "val_loss": 76798.6015625} {"train_loss": -6.514040946960449, "global_step": 118062, "epoch": 2811} {"train_loss": -6.5124969482421875, "global_step": 118063, "epoch": 2811} {"train_loss": -6.589486598968506, "global_step": 118064, "epoch": 2811} {"train_loss": -6.580002784729004, "global_step": 118065, "epoch": 2811} {"train_loss": -6.528647422790527, "global_step": 118066, "epoch": 2811} {"train_loss": -6.59761905670166, "global_step": 118067, "epoch": 2811} {"train_loss": -6.631691932678223, "global_step": 118068, "epoch": 2811} {"train_loss": -6.479074478149414, "global_step": 118069, "epoch": 2811} {"train_loss": -6.517531871795654, "global_step": 118070, "epoch": 2811} {"train_loss": -6.445786952972412, "global_step": 118071, "epoch": 2811} {"train_loss": -6.578126907348633, "global_step": 118072, "epoch": 2811} {"train_loss": -6.576244354248047, "global_step": 118073, "epoch": 2811} {"train_loss": -6.356484413146973, "global_step": 118074, "epoch": 2811} {"train_loss": -6.454831123352051, "global_step": 118075, "epoch": 2811} {"train_loss": -6.448525428771973, "global_step": 118076, "epoch": 2811} {"train_loss": -6.526285648345947, "global_step": 118077, "epoch": 2811} {"train_loss": -6.423939228057861, "global_step": 118078, "epoch": 2811} {"train_loss": -6.525475025177002, "global_step": 118079, "epoch": 2811} {"train_loss": -6.326362133026123, "global_step": 118080, "epoch": 2811} {"train_loss": -6.5982513427734375, "global_step": 118081, "epoch": 2811} {"train_loss": -6.488059997558594, "global_step": 118082, "epoch": 2811} {"train_loss": -6.351114273071289, "global_step": 118083, "epoch": 2811} {"train_loss": -6.481432914733887, "global_step": 118084, "epoch": 2811} {"train_loss": -6.433445453643799, "global_step": 118085, "epoch": 2811} {"train_loss": -6.5374250411987305, "global_step": 118086, "epoch": 2811} {"train_loss": -6.467207908630371, "global_step": 118087, "epoch": 2811} {"train_loss": -6.437734603881836, "global_step": 118088, "epoch": 2811} {"train_loss": -6.534765243530273, "global_step": 118089, "epoch": 2811} {"train_loss": -6.503843307495117, "global_step": 118090, "epoch": 2811} {"train_loss": -6.4995927810668945, "global_step": 118091, "epoch": 2811} {"train_loss": -6.527347087860107, "global_step": 118092, "epoch": 2811} {"train_loss": -6.625399589538574, "global_step": 118093, "epoch": 2811} {"train_loss": -6.4373860359191895, "global_step": 118094, "epoch": 2811} {"train_loss": -6.68115234375, "global_step": 118095, "epoch": 2811} {"train_loss": -6.539520263671875, "global_step": 118096, "epoch": 2811} {"train_loss": -6.575629711151123, "global_step": 118097, "epoch": 2811} {"train_loss": -6.5105881690979, "global_step": 118098, "epoch": 2811} {"train_loss": -6.572086811065674, "global_step": 118099, "epoch": 2811} {"train_loss": -6.532909870147705, "global_step": 118100, "epoch": 2811} {"train_loss": -6.613656997680664, "global_step": 118101, "epoch": 2811} {"train_loss": -6.668808937072754, "global_step": 118102, "epoch": 2811} {"train_loss": -6.518772499901908, "global_step": 118103, "epoch": 2811, "val_loss": 76844.859375} {"train_loss": -6.60092306137085, "global_step": 118104, "epoch": 2812} {"train_loss": -6.602057933807373, "global_step": 118105, "epoch": 2812} {"train_loss": -6.594219207763672, "global_step": 118106, "epoch": 2812} {"train_loss": -6.4618940353393555, "global_step": 118107, "epoch": 2812} {"train_loss": -6.6655473709106445, "global_step": 118108, "epoch": 2812} {"train_loss": -6.6073713302612305, "global_step": 118109, "epoch": 2812} {"train_loss": -6.504220485687256, "global_step": 118110, "epoch": 2812} {"train_loss": -6.616181373596191, "global_step": 118111, "epoch": 2812} {"train_loss": -6.484423637390137, "global_step": 118112, "epoch": 2812} {"train_loss": -6.542971611022949, "global_step": 118113, "epoch": 2812} {"train_loss": -6.575963020324707, "global_step": 118114, "epoch": 2812} {"train_loss": -6.455305099487305, "global_step": 118115, "epoch": 2812} {"train_loss": -6.509910583496094, "global_step": 118116, "epoch": 2812} {"train_loss": -6.4619011878967285, "global_step": 118117, "epoch": 2812} {"train_loss": -6.443985462188721, "global_step": 118118, "epoch": 2812} {"train_loss": -6.560605049133301, "global_step": 118119, "epoch": 2812} {"train_loss": -6.666640281677246, "global_step": 118120, "epoch": 2812} {"train_loss": -6.539732933044434, "global_step": 118121, "epoch": 2812} {"train_loss": -6.557459831237793, "global_step": 118122, "epoch": 2812} {"train_loss": -6.627101898193359, "global_step": 118123, "epoch": 2812} {"train_loss": -6.558994293212891, "global_step": 118124, "epoch": 2812} {"train_loss": -6.539036750793457, "global_step": 118125, "epoch": 2812} {"train_loss": -6.542251110076904, "global_step": 118126, "epoch": 2812} {"train_loss": -6.5084309577941895, "global_step": 118127, "epoch": 2812} {"train_loss": -6.627320289611816, "global_step": 118128, "epoch": 2812} {"train_loss": -6.507735252380371, "global_step": 118129, "epoch": 2812} {"train_loss": -6.499456882476807, "global_step": 118130, "epoch": 2812} {"train_loss": -6.645840644836426, "global_step": 118131, "epoch": 2812} {"train_loss": -6.592939376831055, "global_step": 118132, "epoch": 2812} {"train_loss": -6.502214431762695, "global_step": 118133, "epoch": 2812} {"train_loss": -6.6202616691589355, "global_step": 118134, "epoch": 2812} {"train_loss": -6.6830854415893555, "global_step": 118135, "epoch": 2812} {"train_loss": -6.598287582397461, "global_step": 118136, "epoch": 2812} {"train_loss": -6.639480113983154, "global_step": 118137, "epoch": 2812} {"train_loss": -6.654677391052246, "global_step": 118138, "epoch": 2812} {"train_loss": -6.6235809326171875, "global_step": 118139, "epoch": 2812} {"train_loss": -6.629478931427002, "global_step": 118140, "epoch": 2812} {"train_loss": -6.698702812194824, "global_step": 118141, "epoch": 2812} {"train_loss": -6.530053615570068, "global_step": 118142, "epoch": 2812} {"train_loss": -6.626660346984863, "global_step": 118143, "epoch": 2812} {"train_loss": -6.684207916259766, "global_step": 118144, "epoch": 2812} {"train_loss": -6.577982073738461, "global_step": 118145, "epoch": 2812, "val_loss": 76731.2421875} {"train_loss": -6.539641857147217, "global_step": 118146, "epoch": 2813} {"train_loss": -6.640615463256836, "global_step": 118147, "epoch": 2813} {"train_loss": -6.546200752258301, "global_step": 118148, "epoch": 2813} {"train_loss": -6.683270454406738, "global_step": 118149, "epoch": 2813} {"train_loss": -6.561927795410156, "global_step": 118150, "epoch": 2813} {"train_loss": -6.542226791381836, "global_step": 118151, "epoch": 2813} {"train_loss": -6.5877814292907715, "global_step": 118152, "epoch": 2813} {"train_loss": -6.534431457519531, "global_step": 118153, "epoch": 2813} {"train_loss": -6.576422691345215, "global_step": 118154, "epoch": 2813} {"train_loss": -6.5652384757995605, "global_step": 118155, "epoch": 2813} {"train_loss": -6.588131427764893, "global_step": 118156, "epoch": 2813} {"train_loss": -6.683208465576172, "global_step": 118157, "epoch": 2813} {"train_loss": -6.5944623947143555, "global_step": 118158, "epoch": 2813} {"train_loss": -6.519458770751953, "global_step": 118159, "epoch": 2813} {"train_loss": -6.638477325439453, "global_step": 118160, "epoch": 2813} {"train_loss": -6.534319877624512, "global_step": 118161, "epoch": 2813} {"train_loss": -6.646944999694824, "global_step": 118162, "epoch": 2813} {"train_loss": -6.729080677032471, "global_step": 118163, "epoch": 2813} {"train_loss": -6.58792781829834, "global_step": 118164, "epoch": 2813} {"train_loss": -6.547019004821777, "global_step": 118165, "epoch": 2813} {"train_loss": -6.508781909942627, "global_step": 118166, "epoch": 2813} {"train_loss": -6.518352508544922, "global_step": 118167, "epoch": 2813} {"train_loss": -6.565178394317627, "global_step": 118168, "epoch": 2813} {"train_loss": -6.597828388214111, "global_step": 118169, "epoch": 2813} {"train_loss": -6.516766548156738, "global_step": 118170, "epoch": 2813} {"train_loss": -6.5421576499938965, "global_step": 118171, "epoch": 2813} {"train_loss": -6.710132598876953, "global_step": 118172, "epoch": 2813} {"train_loss": -6.6401286125183105, "global_step": 118173, "epoch": 2813} {"train_loss": -6.662843704223633, "global_step": 118174, "epoch": 2813} {"train_loss": -6.516568660736084, "global_step": 118175, "epoch": 2813} {"train_loss": -6.627237319946289, "global_step": 118176, "epoch": 2813} {"train_loss": -6.580723762512207, "global_step": 118177, "epoch": 2813} {"train_loss": -6.633217811584473, "global_step": 118178, "epoch": 2813} {"train_loss": -6.656343460083008, "global_step": 118179, "epoch": 2813} {"train_loss": -6.696258544921875, "global_step": 118180, "epoch": 2813} {"train_loss": -6.683417320251465, "global_step": 118181, "epoch": 2813} {"train_loss": -6.594170093536377, "global_step": 118182, "epoch": 2813} {"train_loss": -6.567622184753418, "global_step": 118183, "epoch": 2813} {"train_loss": -6.611021041870117, "global_step": 118184, "epoch": 2813} {"train_loss": -6.669169902801514, "global_step": 118185, "epoch": 2813} {"train_loss": -6.657343864440918, "global_step": 118186, "epoch": 2813} {"train_loss": -6.5997907888321645, "global_step": 118187, "epoch": 2813, "val_loss": 76702.1640625} {"train_loss": -6.658727645874023, "global_step": 118188, "epoch": 2814} {"train_loss": -6.664488792419434, "global_step": 118189, "epoch": 2814} {"train_loss": -6.665947914123535, "global_step": 118190, "epoch": 2814} {"train_loss": -6.664968967437744, "global_step": 118191, "epoch": 2814} {"train_loss": -6.572110652923584, "global_step": 118192, "epoch": 2814} {"train_loss": -6.630457878112793, "global_step": 118193, "epoch": 2814} {"train_loss": -6.466609954833984, "global_step": 118194, "epoch": 2814} {"train_loss": -6.638279438018799, "global_step": 118195, "epoch": 2814} {"train_loss": -6.571178913116455, "global_step": 118196, "epoch": 2814} {"train_loss": -6.5427093505859375, "global_step": 118197, "epoch": 2814} {"train_loss": -6.5094757080078125, "global_step": 118198, "epoch": 2814} {"train_loss": -6.7035722732543945, "global_step": 118199, "epoch": 2814} {"train_loss": -6.528342247009277, "global_step": 118200, "epoch": 2814} {"train_loss": -6.498629570007324, "global_step": 118201, "epoch": 2814} {"train_loss": -6.505771636962891, "global_step": 118202, "epoch": 2814} {"train_loss": -6.682098865509033, "global_step": 118203, "epoch": 2814} {"train_loss": -6.579230308532715, "global_step": 118204, "epoch": 2814} {"train_loss": -6.565216064453125, "global_step": 118205, "epoch": 2814} {"train_loss": -6.6084489822387695, "global_step": 118206, "epoch": 2814} {"train_loss": -6.456010341644287, "global_step": 118207, "epoch": 2814} {"train_loss": -6.4548845291137695, "global_step": 118208, "epoch": 2814} {"train_loss": -6.436129570007324, "global_step": 118209, "epoch": 2814} {"train_loss": -6.522984504699707, "global_step": 118210, "epoch": 2814} {"train_loss": -6.575414657592773, "global_step": 118211, "epoch": 2814} {"train_loss": -6.317035675048828, "global_step": 118212, "epoch": 2814} {"train_loss": -6.664377212524414, "global_step": 118213, "epoch": 2814} {"train_loss": -6.378155708312988, "global_step": 118214, "epoch": 2814} {"train_loss": -6.391462326049805, "global_step": 118215, "epoch": 2814} {"train_loss": -6.447224140167236, "global_step": 118216, "epoch": 2814} {"train_loss": -6.58671760559082, "global_step": 118217, "epoch": 2814} {"train_loss": -6.31007194519043, "global_step": 118218, "epoch": 2814} {"train_loss": -6.453893661499023, "global_step": 118219, "epoch": 2814} {"train_loss": -6.512246131896973, "global_step": 118220, "epoch": 2814} {"train_loss": -6.556341171264648, "global_step": 118221, "epoch": 2814} {"train_loss": -6.465822219848633, "global_step": 118222, "epoch": 2814} {"train_loss": -6.492588996887207, "global_step": 118223, "epoch": 2814} {"train_loss": -6.380645751953125, "global_step": 118224, "epoch": 2814} {"train_loss": -6.4954833984375, "global_step": 118225, "epoch": 2814} {"train_loss": -6.530885696411133, "global_step": 118226, "epoch": 2814} {"train_loss": -6.562413215637207, "global_step": 118227, "epoch": 2814} {"train_loss": -6.584607124328613, "global_step": 118228, "epoch": 2814} {"train_loss": -6.528308130445934, "global_step": 118229, "epoch": 2814, "val_loss": 76664.921875} {"train_loss": -6.580388069152832, "global_step": 118230, "epoch": 2815} {"train_loss": -6.495965003967285, "global_step": 118231, "epoch": 2815} {"train_loss": -6.55084228515625, "global_step": 118232, "epoch": 2815} {"train_loss": -6.457952499389648, "global_step": 118233, "epoch": 2815} {"train_loss": -6.485608100891113, "global_step": 118234, "epoch": 2815} {"train_loss": -6.5622358322143555, "global_step": 118235, "epoch": 2815} {"train_loss": -6.610196113586426, "global_step": 118236, "epoch": 2815} {"train_loss": -6.5090765953063965, "global_step": 118237, "epoch": 2815} {"train_loss": -6.541079521179199, "global_step": 118238, "epoch": 2815} {"train_loss": -6.685810089111328, "global_step": 118239, "epoch": 2815} {"train_loss": -6.552481651306152, "global_step": 118240, "epoch": 2815} {"train_loss": -6.581841945648193, "global_step": 118241, "epoch": 2815} {"train_loss": -6.395776748657227, "global_step": 118242, "epoch": 2815} {"train_loss": -6.530737400054932, "global_step": 118243, "epoch": 2815} {"train_loss": -6.597910404205322, "global_step": 118244, "epoch": 2815} {"train_loss": -6.557175159454346, "global_step": 118245, "epoch": 2815} {"train_loss": -6.644834518432617, "global_step": 118246, "epoch": 2815} {"train_loss": -6.565680980682373, "global_step": 118247, "epoch": 2815} {"train_loss": -6.582776069641113, "global_step": 118248, "epoch": 2815} {"train_loss": -6.470057487487793, "global_step": 118249, "epoch": 2815} {"train_loss": -6.511772155761719, "global_step": 118250, "epoch": 2815} {"train_loss": -6.522176742553711, "global_step": 118251, "epoch": 2815} {"train_loss": -6.654085159301758, "global_step": 118252, "epoch": 2815} {"train_loss": -6.57058048248291, "global_step": 118253, "epoch": 2815} {"train_loss": -6.496757984161377, "global_step": 118254, "epoch": 2815} {"train_loss": -6.423763751983643, "global_step": 118255, "epoch": 2815} {"train_loss": -6.5453338623046875, "global_step": 118256, "epoch": 2815} {"train_loss": -6.556483268737793, "global_step": 118257, "epoch": 2815} {"train_loss": -6.48482608795166, "global_step": 118258, "epoch": 2815} {"train_loss": -6.57204532623291, "global_step": 118259, "epoch": 2815} {"train_loss": -6.424522876739502, "global_step": 118260, "epoch": 2815} {"train_loss": -6.682277679443359, "global_step": 118261, "epoch": 2815} {"train_loss": -6.5700812339782715, "global_step": 118262, "epoch": 2815} {"train_loss": -6.562718391418457, "global_step": 118263, "epoch": 2815} {"train_loss": -6.532808780670166, "global_step": 118264, "epoch": 2815} {"train_loss": -6.536962032318115, "global_step": 118265, "epoch": 2815} {"train_loss": -6.609302043914795, "global_step": 118266, "epoch": 2815} {"train_loss": -6.619163513183594, "global_step": 118267, "epoch": 2815} {"train_loss": -6.59675931930542, "global_step": 118268, "epoch": 2815} {"train_loss": -6.6047139167785645, "global_step": 118269, "epoch": 2815} {"train_loss": -6.6208696365356445, "global_step": 118270, "epoch": 2815} {"train_loss": -6.550699268068586, "global_step": 118271, "epoch": 2815, "val_loss": 76569.453125} {"train_loss": -6.642327308654785, "global_step": 118272, "epoch": 2816} {"train_loss": -6.646786212921143, "global_step": 118273, "epoch": 2816} {"train_loss": -6.502411842346191, "global_step": 118274, "epoch": 2816} {"train_loss": -6.58720588684082, "global_step": 118275, "epoch": 2816} {"train_loss": -6.587512969970703, "global_step": 118276, "epoch": 2816} {"train_loss": -6.520698547363281, "global_step": 118277, "epoch": 2816} {"train_loss": -6.411433219909668, "global_step": 118278, "epoch": 2816} {"train_loss": -6.5431084632873535, "global_step": 118279, "epoch": 2816} {"train_loss": -6.4138689041137695, "global_step": 118280, "epoch": 2816} {"train_loss": -6.542788505554199, "global_step": 118281, "epoch": 2816} {"train_loss": -6.399965286254883, "global_step": 118282, "epoch": 2816} {"train_loss": -6.598889350891113, "global_step": 118283, "epoch": 2816} {"train_loss": -6.452497482299805, "global_step": 118284, "epoch": 2816} {"train_loss": -6.428373336791992, "global_step": 118285, "epoch": 2816} {"train_loss": -6.604435920715332, "global_step": 118286, "epoch": 2816} {"train_loss": -6.530002593994141, "global_step": 118287, "epoch": 2816} {"train_loss": -6.564524173736572, "global_step": 118288, "epoch": 2816} {"train_loss": -6.517386436462402, "global_step": 118289, "epoch": 2816} {"train_loss": -6.501768112182617, "global_step": 118290, "epoch": 2816} {"train_loss": -6.415348529815674, "global_step": 118291, "epoch": 2816} {"train_loss": -6.484125137329102, "global_step": 118292, "epoch": 2816} {"train_loss": -6.598117351531982, "global_step": 118293, "epoch": 2816} {"train_loss": -6.445031642913818, "global_step": 118294, "epoch": 2816} {"train_loss": -6.35917329788208, "global_step": 118295, "epoch": 2816} {"train_loss": -6.441117286682129, "global_step": 118296, "epoch": 2816} {"train_loss": -6.409922122955322, "global_step": 118297, "epoch": 2816} {"train_loss": -6.450766086578369, "global_step": 118298, "epoch": 2816} {"train_loss": -6.51779842376709, "global_step": 118299, "epoch": 2816} {"train_loss": -6.302491664886475, "global_step": 118300, "epoch": 2816} {"train_loss": -6.582328796386719, "global_step": 118301, "epoch": 2816} {"train_loss": -6.516282081604004, "global_step": 118302, "epoch": 2816} {"train_loss": -6.515468597412109, "global_step": 118303, "epoch": 2816} {"train_loss": -6.644554138183594, "global_step": 118304, "epoch": 2816} {"train_loss": -6.505704879760742, "global_step": 118305, "epoch": 2816} {"train_loss": -6.557480335235596, "global_step": 118306, "epoch": 2816} {"train_loss": -6.51249885559082, "global_step": 118307, "epoch": 2816} {"train_loss": -6.490466117858887, "global_step": 118308, "epoch": 2816} {"train_loss": -6.509579658508301, "global_step": 118309, "epoch": 2816} {"train_loss": -6.441305160522461, "global_step": 118310, "epoch": 2816} {"train_loss": -6.567225456237793, "global_step": 118311, "epoch": 2816} {"train_loss": -6.581071853637695, "global_step": 118312, "epoch": 2816} {"train_loss": -6.508098170870826, "global_step": 118313, "epoch": 2816, "val_loss": 76768.328125} {"train_loss": -6.625109672546387, "global_step": 118314, "epoch": 2817} {"train_loss": -6.6622490882873535, "global_step": 118315, "epoch": 2817} {"train_loss": -6.509110450744629, "global_step": 118316, "epoch": 2817} {"train_loss": -6.604633331298828, "global_step": 118317, "epoch": 2817} {"train_loss": -6.6021881103515625, "global_step": 118318, "epoch": 2817} {"train_loss": -6.466955184936523, "global_step": 118319, "epoch": 2817} {"train_loss": -6.645402908325195, "global_step": 118320, "epoch": 2817} {"train_loss": -6.452204704284668, "global_step": 118321, "epoch": 2817} {"train_loss": -6.558995246887207, "global_step": 118322, "epoch": 2817} {"train_loss": -6.533442497253418, "global_step": 118323, "epoch": 2817} {"train_loss": -6.504083156585693, "global_step": 118324, "epoch": 2817} {"train_loss": -6.5744171142578125, "global_step": 118325, "epoch": 2817} {"train_loss": -6.4706573486328125, "global_step": 118326, "epoch": 2817} {"train_loss": -6.59930419921875, "global_step": 118327, "epoch": 2817} {"train_loss": -6.562459945678711, "global_step": 118328, "epoch": 2817} {"train_loss": -6.614760398864746, "global_step": 118329, "epoch": 2817} {"train_loss": -6.5714521408081055, "global_step": 118330, "epoch": 2817} {"train_loss": -6.645190238952637, "global_step": 118331, "epoch": 2817} {"train_loss": -6.655984878540039, "global_step": 118332, "epoch": 2817} {"train_loss": -6.516862869262695, "global_step": 118333, "epoch": 2817} {"train_loss": -6.587483882904053, "global_step": 118334, "epoch": 2817} {"train_loss": -6.475745677947998, "global_step": 118335, "epoch": 2817} {"train_loss": -6.4940996170043945, "global_step": 118336, "epoch": 2817} {"train_loss": -6.484689712524414, "global_step": 118337, "epoch": 2817} {"train_loss": -6.559640884399414, "global_step": 118338, "epoch": 2817} {"train_loss": -6.594047546386719, "global_step": 118339, "epoch": 2817} {"train_loss": -6.558403968811035, "global_step": 118340, "epoch": 2817} {"train_loss": -6.511366367340088, "global_step": 118341, "epoch": 2817} {"train_loss": -6.675766468048096, "global_step": 118342, "epoch": 2817} {"train_loss": -6.6666460037231445, "global_step": 118343, "epoch": 2817} {"train_loss": -6.513628005981445, "global_step": 118344, "epoch": 2817} {"train_loss": -6.519644260406494, "global_step": 118345, "epoch": 2817} {"train_loss": -6.662656784057617, "global_step": 118346, "epoch": 2817} {"train_loss": -6.430601596832275, "global_step": 118347, "epoch": 2817} {"train_loss": -6.526777267456055, "global_step": 118348, "epoch": 2817} {"train_loss": -6.555085182189941, "global_step": 118349, "epoch": 2817} {"train_loss": -6.555697441101074, "global_step": 118350, "epoch": 2817} {"train_loss": -6.386693954467773, "global_step": 118351, "epoch": 2817} {"train_loss": -6.637509822845459, "global_step": 118352, "epoch": 2817} {"train_loss": -6.517628192901611, "global_step": 118353, "epoch": 2817} {"train_loss": -6.567938804626465, "global_step": 118354, "epoch": 2817} {"train_loss": -6.559422788165865, "global_step": 118355, "epoch": 2817, "val_loss": 77146.0078125} {"train_loss": -6.416677474975586, "global_step": 118356, "epoch": 2818} {"train_loss": -6.518331527709961, "global_step": 118357, "epoch": 2818} {"train_loss": -6.529457092285156, "global_step": 118358, "epoch": 2818} {"train_loss": -6.529439926147461, "global_step": 118359, "epoch": 2818} {"train_loss": -6.5106706619262695, "global_step": 118360, "epoch": 2818} {"train_loss": -6.559715747833252, "global_step": 118361, "epoch": 2818} {"train_loss": -6.393842697143555, "global_step": 118362, "epoch": 2818} {"train_loss": -6.444840431213379, "global_step": 118363, "epoch": 2818} {"train_loss": -6.566019535064697, "global_step": 118364, "epoch": 2818} {"train_loss": -6.5654683113098145, "global_step": 118365, "epoch": 2818} {"train_loss": -6.488536834716797, "global_step": 118366, "epoch": 2818} {"train_loss": -6.478006839752197, "global_step": 118367, "epoch": 2818} {"train_loss": -6.545835971832275, "global_step": 118368, "epoch": 2818} {"train_loss": -6.58094596862793, "global_step": 118369, "epoch": 2818} {"train_loss": -6.537308216094971, "global_step": 118370, "epoch": 2818} {"train_loss": -6.605123043060303, "global_step": 118371, "epoch": 2818} {"train_loss": -6.380204200744629, "global_step": 118372, "epoch": 2818} {"train_loss": -6.661342144012451, "global_step": 118373, "epoch": 2818} {"train_loss": -6.634942054748535, "global_step": 118374, "epoch": 2818} {"train_loss": -6.403722763061523, "global_step": 118375, "epoch": 2818} {"train_loss": -6.4265289306640625, "global_step": 118376, "epoch": 2818} {"train_loss": -6.452193260192871, "global_step": 118377, "epoch": 2818} {"train_loss": -6.454521179199219, "global_step": 118378, "epoch": 2818} {"train_loss": -6.385278701782227, "global_step": 118379, "epoch": 2818} {"train_loss": -6.547234058380127, "global_step": 118380, "epoch": 2818} {"train_loss": -6.415657043457031, "global_step": 118381, "epoch": 2818} {"train_loss": -6.443013668060303, "global_step": 118382, "epoch": 2818} {"train_loss": -6.6232476234436035, "global_step": 118383, "epoch": 2818} {"train_loss": -6.452271461486816, "global_step": 118384, "epoch": 2818} {"train_loss": -6.529275894165039, "global_step": 118385, "epoch": 2818} {"train_loss": -6.4819512367248535, "global_step": 118386, "epoch": 2818} {"train_loss": -6.489649772644043, "global_step": 118387, "epoch": 2818} {"train_loss": -6.579583168029785, "global_step": 118388, "epoch": 2818} {"train_loss": -6.4817399978637695, "global_step": 118389, "epoch": 2818} {"train_loss": -6.517309188842773, "global_step": 118390, "epoch": 2818} {"train_loss": -6.427565574645996, "global_step": 118391, "epoch": 2818} {"train_loss": -6.661880016326904, "global_step": 118392, "epoch": 2818} {"train_loss": -6.456864356994629, "global_step": 118393, "epoch": 2818} {"train_loss": -6.486995220184326, "global_step": 118394, "epoch": 2818} {"train_loss": -6.548543453216553, "global_step": 118395, "epoch": 2818} {"train_loss": -6.602129936218262, "global_step": 118396, "epoch": 2818} {"train_loss": -6.5095962683359785, "global_step": 118397, "epoch": 2818, "val_loss": 76750.6875} {"train_loss": -6.495236396789551, "global_step": 118398, "epoch": 2819} {"train_loss": -6.56730842590332, "global_step": 118399, "epoch": 2819} {"train_loss": -6.5396504402160645, "global_step": 118400, "epoch": 2819} {"train_loss": -6.559506416320801, "global_step": 118401, "epoch": 2819} {"train_loss": -6.410489082336426, "global_step": 118402, "epoch": 2819} {"train_loss": -6.626410961151123, "global_step": 118403, "epoch": 2819} {"train_loss": -6.516364097595215, "global_step": 118404, "epoch": 2819} {"train_loss": -6.492829322814941, "global_step": 118405, "epoch": 2819} {"train_loss": -6.550568580627441, "global_step": 118406, "epoch": 2819} {"train_loss": -6.575315475463867, "global_step": 118407, "epoch": 2819} {"train_loss": -6.408196449279785, "global_step": 118408, "epoch": 2819} {"train_loss": -6.527592658996582, "global_step": 118409, "epoch": 2819} {"train_loss": -6.457655429840088, "global_step": 118410, "epoch": 2819} {"train_loss": -6.397273063659668, "global_step": 118411, "epoch": 2819} {"train_loss": -6.5921831130981445, "global_step": 118412, "epoch": 2819} {"train_loss": -6.662467956542969, "global_step": 118413, "epoch": 2819} {"train_loss": -6.533501625061035, "global_step": 118414, "epoch": 2819} {"train_loss": -6.623898506164551, "global_step": 118415, "epoch": 2819} {"train_loss": -6.562435150146484, "global_step": 118416, "epoch": 2819} {"train_loss": -6.633017539978027, "global_step": 118417, "epoch": 2819} {"train_loss": -6.489994049072266, "global_step": 118418, "epoch": 2819} {"train_loss": -6.438624382019043, "global_step": 118419, "epoch": 2819} {"train_loss": -6.575663089752197, "global_step": 118420, "epoch": 2819} {"train_loss": -6.423412799835205, "global_step": 118421, "epoch": 2819} {"train_loss": -6.605226516723633, "global_step": 118422, "epoch": 2819} {"train_loss": -6.52178430557251, "global_step": 118423, "epoch": 2819} {"train_loss": -6.529098033905029, "global_step": 118424, "epoch": 2819} {"train_loss": -6.664338111877441, "global_step": 118425, "epoch": 2819} {"train_loss": -6.529007434844971, "global_step": 118426, "epoch": 2819} {"train_loss": -6.572610855102539, "global_step": 118427, "epoch": 2819} {"train_loss": -6.670418739318848, "global_step": 118428, "epoch": 2819} {"train_loss": -6.579196453094482, "global_step": 118429, "epoch": 2819} {"train_loss": -6.597156524658203, "global_step": 118430, "epoch": 2819} {"train_loss": -6.529829025268555, "global_step": 118431, "epoch": 2819} {"train_loss": -6.531954765319824, "global_step": 118432, "epoch": 2819} {"train_loss": -6.469344615936279, "global_step": 118433, "epoch": 2819} {"train_loss": -6.595423698425293, "global_step": 118434, "epoch": 2819} {"train_loss": -6.661441802978516, "global_step": 118435, "epoch": 2819} {"train_loss": -6.566937446594238, "global_step": 118436, "epoch": 2819} {"train_loss": -6.465956687927246, "global_step": 118437, "epoch": 2819} {"train_loss": -6.546030044555664, "global_step": 118438, "epoch": 2819} {"train_loss": -6.539695387794858, "global_step": 118439, "epoch": 2819, "val_loss": 76765.6484375} {"train_loss": -6.499608039855957, "global_step": 118440, "epoch": 2820} {"train_loss": -6.521803855895996, "global_step": 118441, "epoch": 2820} {"train_loss": -6.401677131652832, "global_step": 118442, "epoch": 2820} {"train_loss": -6.467447757720947, "global_step": 118443, "epoch": 2820} {"train_loss": -6.4869890213012695, "global_step": 118444, "epoch": 2820} {"train_loss": -6.42465353012085, "global_step": 118445, "epoch": 2820} {"train_loss": -6.454110622406006, "global_step": 118446, "epoch": 2820} {"train_loss": -6.469099044799805, "global_step": 118447, "epoch": 2820} {"train_loss": -6.5404276847839355, "global_step": 118448, "epoch": 2820} {"train_loss": -6.458593368530273, "global_step": 118449, "epoch": 2820} {"train_loss": -6.506922245025635, "global_step": 118450, "epoch": 2820} {"train_loss": -6.525293827056885, "global_step": 118451, "epoch": 2820} {"train_loss": -6.54642391204834, "global_step": 118452, "epoch": 2820} {"train_loss": -6.502658843994141, "global_step": 118453, "epoch": 2820} {"train_loss": -6.607333660125732, "global_step": 118454, "epoch": 2820} {"train_loss": -6.516094207763672, "global_step": 118455, "epoch": 2820} {"train_loss": -6.645016193389893, "global_step": 118456, "epoch": 2820} {"train_loss": -6.594421863555908, "global_step": 118457, "epoch": 2820} {"train_loss": -6.5423431396484375, "global_step": 118458, "epoch": 2820} {"train_loss": -6.522888660430908, "global_step": 118459, "epoch": 2820} {"train_loss": -6.590695381164551, "global_step": 118460, "epoch": 2820} {"train_loss": -6.459930419921875, "global_step": 118461, "epoch": 2820} {"train_loss": -6.626694679260254, "global_step": 118462, "epoch": 2820} {"train_loss": -6.568948268890381, "global_step": 118463, "epoch": 2820} {"train_loss": -6.497626304626465, "global_step": 118464, "epoch": 2820} {"train_loss": -6.504863262176514, "global_step": 118465, "epoch": 2820} {"train_loss": -6.588235855102539, "global_step": 118466, "epoch": 2820} {"train_loss": -6.500718593597412, "global_step": 118467, "epoch": 2820} {"train_loss": -6.526558876037598, "global_step": 118468, "epoch": 2820} {"train_loss": -6.638584136962891, "global_step": 118469, "epoch": 2820} {"train_loss": -6.472113609313965, "global_step": 118470, "epoch": 2820} {"train_loss": -6.556501865386963, "global_step": 118471, "epoch": 2820} {"train_loss": -6.565346717834473, "global_step": 118472, "epoch": 2820} {"train_loss": -6.5782928466796875, "global_step": 118473, "epoch": 2820} {"train_loss": -6.570178985595703, "global_step": 118474, "epoch": 2820} {"train_loss": -6.539595127105713, "global_step": 118475, "epoch": 2820} {"train_loss": -6.4792890548706055, "global_step": 118476, "epoch": 2820} {"train_loss": -6.630056381225586, "global_step": 118477, "epoch": 2820} {"train_loss": -6.644202709197998, "global_step": 118478, "epoch": 2820} {"train_loss": -6.583762168884277, "global_step": 118479, "epoch": 2820} {"train_loss": -6.551316738128662, "global_step": 118480, "epoch": 2820} {"train_loss": -6.537204299654279, "global_step": 118481, "epoch": 2820, "val_loss": 76798.9453125} {"train_loss": -6.488471031188965, "global_step": 118482, "epoch": 2821} {"train_loss": -6.565152168273926, "global_step": 118483, "epoch": 2821} {"train_loss": -6.508851051330566, "global_step": 118484, "epoch": 2821} {"train_loss": -6.483534812927246, "global_step": 118485, "epoch": 2821} {"train_loss": -6.420377731323242, "global_step": 118486, "epoch": 2821} {"train_loss": -6.553942680358887, "global_step": 118487, "epoch": 2821} {"train_loss": -6.433480262756348, "global_step": 118488, "epoch": 2821} {"train_loss": -6.599517345428467, "global_step": 118489, "epoch": 2821} {"train_loss": -6.525753021240234, "global_step": 118490, "epoch": 2821} {"train_loss": -6.528226852416992, "global_step": 118491, "epoch": 2821} {"train_loss": -6.363650798797607, "global_step": 118492, "epoch": 2821} {"train_loss": -6.539694786071777, "global_step": 118493, "epoch": 2821} {"train_loss": -6.5170578956604, "global_step": 118494, "epoch": 2821} {"train_loss": -6.570206642150879, "global_step": 118495, "epoch": 2821} {"train_loss": -6.560627460479736, "global_step": 118496, "epoch": 2821} {"train_loss": -6.594909191131592, "global_step": 118497, "epoch": 2821} {"train_loss": -6.522769927978516, "global_step": 118498, "epoch": 2821} {"train_loss": -6.545234680175781, "global_step": 118499, "epoch": 2821} {"train_loss": -6.626595973968506, "global_step": 118500, "epoch": 2821} {"train_loss": -6.674938678741455, "global_step": 118501, "epoch": 2821} {"train_loss": -6.577839374542236, "global_step": 118502, "epoch": 2821} {"train_loss": -6.543458938598633, "global_step": 118503, "epoch": 2821} {"train_loss": -6.73577880859375, "global_step": 118504, "epoch": 2821} {"train_loss": -6.557004451751709, "global_step": 118505, "epoch": 2821} {"train_loss": -6.597460746765137, "global_step": 118506, "epoch": 2821} {"train_loss": -6.519196510314941, "global_step": 118507, "epoch": 2821} {"train_loss": -6.574571132659912, "global_step": 118508, "epoch": 2821} {"train_loss": -6.607388973236084, "global_step": 118509, "epoch": 2821} {"train_loss": -6.634771823883057, "global_step": 118510, "epoch": 2821} {"train_loss": -6.539355754852295, "global_step": 118511, "epoch": 2821} {"train_loss": -6.501172065734863, "global_step": 118512, "epoch": 2821} {"train_loss": -6.614352226257324, "global_step": 118513, "epoch": 2821} {"train_loss": -6.61959171295166, "global_step": 118514, "epoch": 2821} {"train_loss": -6.49958610534668, "global_step": 118515, "epoch": 2821} {"train_loss": -6.607432842254639, "global_step": 118516, "epoch": 2821} {"train_loss": -6.66637659072876, "global_step": 118517, "epoch": 2821} {"train_loss": -6.3582682609558105, "global_step": 118518, "epoch": 2821} {"train_loss": -6.500051498413086, "global_step": 118519, "epoch": 2821} {"train_loss": -6.483723163604736, "global_step": 118520, "epoch": 2821} {"train_loss": -6.663863658905029, "global_step": 118521, "epoch": 2821} {"train_loss": -6.522137641906738, "global_step": 118522, "epoch": 2821} {"train_loss": -6.54914124806722, "global_step": 118523, "epoch": 2821, "val_loss": 76921.1015625} {"train_loss": -6.414565086364746, "global_step": 118524, "epoch": 2822} {"train_loss": -6.535001277923584, "global_step": 118525, "epoch": 2822} {"train_loss": -6.360647678375244, "global_step": 118526, "epoch": 2822} {"train_loss": -6.558095932006836, "global_step": 118527, "epoch": 2822} {"train_loss": -6.548559188842773, "global_step": 118528, "epoch": 2822} {"train_loss": -6.473816871643066, "global_step": 118529, "epoch": 2822} {"train_loss": -6.483255863189697, "global_step": 118530, "epoch": 2822} {"train_loss": -6.458670616149902, "global_step": 118531, "epoch": 2822} {"train_loss": -6.518596649169922, "global_step": 118532, "epoch": 2822} {"train_loss": -6.462745666503906, "global_step": 118533, "epoch": 2822} {"train_loss": -6.595633029937744, "global_step": 118534, "epoch": 2822} {"train_loss": -6.420644760131836, "global_step": 118535, "epoch": 2822} {"train_loss": -6.518285274505615, "global_step": 118536, "epoch": 2822} {"train_loss": -6.472537040710449, "global_step": 118537, "epoch": 2822} {"train_loss": -6.521956920623779, "global_step": 118538, "epoch": 2822} {"train_loss": -6.604125022888184, "global_step": 118539, "epoch": 2822} {"train_loss": -6.509614944458008, "global_step": 118540, "epoch": 2822} {"train_loss": -6.462649345397949, "global_step": 118541, "epoch": 2822} {"train_loss": -6.573577880859375, "global_step": 118542, "epoch": 2822} {"train_loss": -6.5167741775512695, "global_step": 118543, "epoch": 2822} {"train_loss": -6.64023494720459, "global_step": 118544, "epoch": 2822} {"train_loss": -6.645238876342773, "global_step": 118545, "epoch": 2822} {"train_loss": -6.5703630447387695, "global_step": 118546, "epoch": 2822} {"train_loss": -6.596504211425781, "global_step": 118547, "epoch": 2822} {"train_loss": -6.607023239135742, "global_step": 118548, "epoch": 2822} {"train_loss": -6.644752502441406, "global_step": 118549, "epoch": 2822} {"train_loss": -6.562906742095947, "global_step": 118550, "epoch": 2822} {"train_loss": -6.655580520629883, "global_step": 118551, "epoch": 2822} {"train_loss": -6.634047985076904, "global_step": 118552, "epoch": 2822} {"train_loss": -6.495295524597168, "global_step": 118553, "epoch": 2822} {"train_loss": -6.498323440551758, "global_step": 118554, "epoch": 2822} {"train_loss": -6.594054222106934, "global_step": 118555, "epoch": 2822} {"train_loss": -6.3296799659729, "global_step": 118556, "epoch": 2822} {"train_loss": -6.430218696594238, "global_step": 118557, "epoch": 2822} {"train_loss": -6.610589027404785, "global_step": 118558, "epoch": 2822} {"train_loss": -6.48881721496582, "global_step": 118559, "epoch": 2822} {"train_loss": -6.500563144683838, "global_step": 118560, "epoch": 2822} {"train_loss": -6.532712459564209, "global_step": 118561, "epoch": 2822} {"train_loss": -6.513152122497559, "global_step": 118562, "epoch": 2822} {"train_loss": -6.560707092285156, "global_step": 118563, "epoch": 2822} {"train_loss": -6.515209197998047, "global_step": 118564, "epoch": 2822} {"train_loss": -6.527995189030965, "global_step": 118565, "epoch": 2822, "val_loss": 76605.03125} {"train_loss": -6.398319721221924, "global_step": 118566, "epoch": 2823} {"train_loss": -6.51426887512207, "global_step": 118567, "epoch": 2823} {"train_loss": -6.539037704467773, "global_step": 118568, "epoch": 2823} {"train_loss": -6.493136405944824, "global_step": 118569, "epoch": 2823} {"train_loss": -6.632168769836426, "global_step": 118570, "epoch": 2823} {"train_loss": -6.583269119262695, "global_step": 118571, "epoch": 2823} {"train_loss": -6.4709649085998535, "global_step": 118572, "epoch": 2823} {"train_loss": -6.536932945251465, "global_step": 118573, "epoch": 2823} {"train_loss": -6.498647689819336, "global_step": 118574, "epoch": 2823} {"train_loss": -6.523163318634033, "global_step": 118575, "epoch": 2823} {"train_loss": -6.577186107635498, "global_step": 118576, "epoch": 2823} {"train_loss": -6.601388931274414, "global_step": 118577, "epoch": 2823} {"train_loss": -6.673588752746582, "global_step": 118578, "epoch": 2823} {"train_loss": -6.456433296203613, "global_step": 118579, "epoch": 2823} {"train_loss": -6.498219966888428, "global_step": 118580, "epoch": 2823} {"train_loss": -6.5146074295043945, "global_step": 118581, "epoch": 2823} {"train_loss": -6.551088333129883, "global_step": 118582, "epoch": 2823} {"train_loss": -6.667407989501953, "global_step": 118583, "epoch": 2823} {"train_loss": -6.50397253036499, "global_step": 118584, "epoch": 2823} {"train_loss": -6.588832855224609, "global_step": 118585, "epoch": 2823} {"train_loss": -6.571229457855225, "global_step": 118586, "epoch": 2823} {"train_loss": -6.5956525802612305, "global_step": 118587, "epoch": 2823} {"train_loss": -6.514510154724121, "global_step": 118588, "epoch": 2823} {"train_loss": -6.598151206970215, "global_step": 118589, "epoch": 2823} {"train_loss": -6.5354323387146, "global_step": 118590, "epoch": 2823} {"train_loss": -6.494596481323242, "global_step": 118591, "epoch": 2823} {"train_loss": -6.555733680725098, "global_step": 118592, "epoch": 2823} {"train_loss": -6.626337051391602, "global_step": 118593, "epoch": 2823} {"train_loss": -6.568022727966309, "global_step": 118594, "epoch": 2823} {"train_loss": -6.5408124923706055, "global_step": 118595, "epoch": 2823} {"train_loss": -6.534561634063721, "global_step": 118596, "epoch": 2823} {"train_loss": -6.522981643676758, "global_step": 118597, "epoch": 2823} {"train_loss": -6.559896469116211, "global_step": 118598, "epoch": 2823} {"train_loss": -6.482702732086182, "global_step": 118599, "epoch": 2823} {"train_loss": -6.5101847648620605, "global_step": 118600, "epoch": 2823} {"train_loss": -6.591115951538086, "global_step": 118601, "epoch": 2823} {"train_loss": -6.536253452301025, "global_step": 118602, "epoch": 2823} {"train_loss": -6.49810791015625, "global_step": 118603, "epoch": 2823} {"train_loss": -6.620927810668945, "global_step": 118604, "epoch": 2823} {"train_loss": -6.6024980545043945, "global_step": 118605, "epoch": 2823} {"train_loss": -6.568444728851318, "global_step": 118606, "epoch": 2823} {"train_loss": -6.547854775474185, "global_step": 118607, "epoch": 2823, "val_loss": 76681.8046875} {"train_loss": -6.484722137451172, "global_step": 118608, "epoch": 2824} {"train_loss": -6.711480140686035, "global_step": 118609, "epoch": 2824} {"train_loss": -6.531593322753906, "global_step": 118610, "epoch": 2824} {"train_loss": -6.530673027038574, "global_step": 118611, "epoch": 2824} {"train_loss": -6.497427463531494, "global_step": 118612, "epoch": 2824} {"train_loss": -6.505311489105225, "global_step": 118613, "epoch": 2824} {"train_loss": -6.60402774810791, "global_step": 118614, "epoch": 2824} {"train_loss": -6.463261604309082, "global_step": 118615, "epoch": 2824} {"train_loss": -6.647459983825684, "global_step": 118616, "epoch": 2824} {"train_loss": -6.466702938079834, "global_step": 118617, "epoch": 2824} {"train_loss": -6.43519401550293, "global_step": 118618, "epoch": 2824} {"train_loss": -6.4399518966674805, "global_step": 118619, "epoch": 2824} {"train_loss": -6.3444342613220215, "global_step": 118620, "epoch": 2824} {"train_loss": -6.491318225860596, "global_step": 118621, "epoch": 2824} {"train_loss": -6.4083757400512695, "global_step": 118622, "epoch": 2824} {"train_loss": -6.541199684143066, "global_step": 118623, "epoch": 2824} {"train_loss": -6.568548679351807, "global_step": 118624, "epoch": 2824} {"train_loss": -6.562517166137695, "global_step": 118625, "epoch": 2824} {"train_loss": -6.566123962402344, "global_step": 118626, "epoch": 2824} {"train_loss": -6.4760613441467285, "global_step": 118627, "epoch": 2824} {"train_loss": -6.4779157638549805, "global_step": 118628, "epoch": 2824} {"train_loss": -6.5153021812438965, "global_step": 118629, "epoch": 2824} {"train_loss": -6.648304462432861, "global_step": 118630, "epoch": 2824} {"train_loss": -6.440718173980713, "global_step": 118631, "epoch": 2824} {"train_loss": -6.490257263183594, "global_step": 118632, "epoch": 2824} {"train_loss": -6.659277439117432, "global_step": 118633, "epoch": 2824} {"train_loss": -6.512643814086914, "global_step": 118634, "epoch": 2824} {"train_loss": -6.423132419586182, "global_step": 118635, "epoch": 2824} {"train_loss": -6.5937066078186035, "global_step": 118636, "epoch": 2824} {"train_loss": -6.611754417419434, "global_step": 118637, "epoch": 2824} {"train_loss": -6.524270057678223, "global_step": 118638, "epoch": 2824} {"train_loss": -6.456263542175293, "global_step": 118639, "epoch": 2824} {"train_loss": -6.582004547119141, "global_step": 118640, "epoch": 2824} {"train_loss": -6.472076892852783, "global_step": 118641, "epoch": 2824} {"train_loss": -6.568172454833984, "global_step": 118642, "epoch": 2824} {"train_loss": -6.568564414978027, "global_step": 118643, "epoch": 2824} {"train_loss": -6.572674751281738, "global_step": 118644, "epoch": 2824} {"train_loss": -6.516580581665039, "global_step": 118645, "epoch": 2824} {"train_loss": -6.604480266571045, "global_step": 118646, "epoch": 2824} {"train_loss": -6.724767684936523, "global_step": 118647, "epoch": 2824} {"train_loss": -6.574253559112549, "global_step": 118648, "epoch": 2824} {"train_loss": -6.5317135992504305, "global_step": 118649, "epoch": 2824, "val_loss": 76857.765625} {"train_loss": -6.598979949951172, "global_step": 118650, "epoch": 2825} {"train_loss": -6.5391950607299805, "global_step": 118651, "epoch": 2825} {"train_loss": -6.528866767883301, "global_step": 118652, "epoch": 2825} {"train_loss": -6.563725471496582, "global_step": 118653, "epoch": 2825} {"train_loss": -6.614441871643066, "global_step": 118654, "epoch": 2825} {"train_loss": -6.603930950164795, "global_step": 118655, "epoch": 2825} {"train_loss": -6.6297478675842285, "global_step": 118656, "epoch": 2825} {"train_loss": -6.478935718536377, "global_step": 118657, "epoch": 2825} {"train_loss": -6.542112827301025, "global_step": 118658, "epoch": 2825} {"train_loss": -6.550854682922363, "global_step": 118659, "epoch": 2825} {"train_loss": -6.56588888168335, "global_step": 118660, "epoch": 2825} {"train_loss": -6.528036117553711, "global_step": 118661, "epoch": 2825} {"train_loss": -6.570010185241699, "global_step": 118662, "epoch": 2825} {"train_loss": -6.664249420166016, "global_step": 118663, "epoch": 2825} {"train_loss": -6.498070240020752, "global_step": 118664, "epoch": 2825} {"train_loss": -6.665068626403809, "global_step": 118665, "epoch": 2825} {"train_loss": -6.559885025024414, "global_step": 118666, "epoch": 2825} {"train_loss": -6.499536991119385, "global_step": 118667, "epoch": 2825} {"train_loss": -6.575963497161865, "global_step": 118668, "epoch": 2825} {"train_loss": -6.467276573181152, "global_step": 118669, "epoch": 2825} {"train_loss": -6.545602798461914, "global_step": 118670, "epoch": 2825} {"train_loss": -6.554441928863525, "global_step": 118671, "epoch": 2825} {"train_loss": -6.426417350769043, "global_step": 118672, "epoch": 2825} {"train_loss": -6.448636531829834, "global_step": 118673, "epoch": 2825} {"train_loss": -6.538278579711914, "global_step": 118674, "epoch": 2825} {"train_loss": -6.517172813415527, "global_step": 118675, "epoch": 2825} {"train_loss": -6.471260070800781, "global_step": 118676, "epoch": 2825} {"train_loss": -6.462759971618652, "global_step": 118677, "epoch": 2825} {"train_loss": -6.514589309692383, "global_step": 118678, "epoch": 2825} {"train_loss": -6.5248799324035645, "global_step": 118679, "epoch": 2825} {"train_loss": -6.503529071807861, "global_step": 118680, "epoch": 2825} {"train_loss": -6.530577659606934, "global_step": 118681, "epoch": 2825} {"train_loss": -6.473228454589844, "global_step": 118682, "epoch": 2825} {"train_loss": -6.52998685836792, "global_step": 118683, "epoch": 2825} {"train_loss": -6.423186302185059, "global_step": 118684, "epoch": 2825} {"train_loss": -6.586498260498047, "global_step": 118685, "epoch": 2825} {"train_loss": -6.431535720825195, "global_step": 118686, "epoch": 2825} {"train_loss": -6.541999816894531, "global_step": 118687, "epoch": 2825} {"train_loss": -6.374969959259033, "global_step": 118688, "epoch": 2825} {"train_loss": -6.59809684753418, "global_step": 118689, "epoch": 2825} {"train_loss": -6.488663196563721, "global_step": 118690, "epoch": 2825} {"train_loss": -6.527501435506911, "global_step": 118691, "epoch": 2825, "val_loss": 76779.96875} {"train_loss": -6.520615100860596, "global_step": 118692, "epoch": 2826} {"train_loss": -6.566045761108398, "global_step": 118693, "epoch": 2826} {"train_loss": -6.603698253631592, "global_step": 118694, "epoch": 2826} {"train_loss": -6.556037902832031, "global_step": 118695, "epoch": 2826} {"train_loss": -6.491127967834473, "global_step": 118696, "epoch": 2826} {"train_loss": -6.590346336364746, "global_step": 118697, "epoch": 2826} {"train_loss": -6.497517108917236, "global_step": 118698, "epoch": 2826} {"train_loss": -6.635949611663818, "global_step": 118699, "epoch": 2826} {"train_loss": -6.534637451171875, "global_step": 118700, "epoch": 2826} {"train_loss": -6.539626598358154, "global_step": 118701, "epoch": 2826} {"train_loss": -6.546246528625488, "global_step": 118702, "epoch": 2826} {"train_loss": -6.554042816162109, "global_step": 118703, "epoch": 2826} {"train_loss": -6.616255760192871, "global_step": 118704, "epoch": 2826} {"train_loss": -6.582916259765625, "global_step": 118705, "epoch": 2826} {"train_loss": -6.444454193115234, "global_step": 118706, "epoch": 2826} {"train_loss": -6.64940071105957, "global_step": 118707, "epoch": 2826} {"train_loss": -6.527557849884033, "global_step": 118708, "epoch": 2826} {"train_loss": -6.530144691467285, "global_step": 118709, "epoch": 2826} {"train_loss": -6.652717590332031, "global_step": 118710, "epoch": 2826} {"train_loss": -6.636503219604492, "global_step": 118711, "epoch": 2826} {"train_loss": -6.604065418243408, "global_step": 118712, "epoch": 2826} {"train_loss": -6.604338645935059, "global_step": 118713, "epoch": 2826} {"train_loss": -6.717963695526123, "global_step": 118714, "epoch": 2826} {"train_loss": -6.621160507202148, "global_step": 118715, "epoch": 2826} {"train_loss": -6.572169303894043, "global_step": 118716, "epoch": 2826} {"train_loss": -6.6640472412109375, "global_step": 118717, "epoch": 2826} {"train_loss": -6.521869659423828, "global_step": 118718, "epoch": 2826} {"train_loss": -6.608964443206787, "global_step": 118719, "epoch": 2826} {"train_loss": -6.574970245361328, "global_step": 118720, "epoch": 2826} {"train_loss": -6.63316535949707, "global_step": 118721, "epoch": 2826} {"train_loss": -6.487924098968506, "global_step": 118722, "epoch": 2826} {"train_loss": -6.6507134437561035, "global_step": 118723, "epoch": 2826} {"train_loss": -6.538030624389648, "global_step": 118724, "epoch": 2826} {"train_loss": -6.6713762283325195, "global_step": 118725, "epoch": 2826} {"train_loss": -6.57445764541626, "global_step": 118726, "epoch": 2826} {"train_loss": -6.631202220916748, "global_step": 118727, "epoch": 2826} {"train_loss": -6.510394096374512, "global_step": 118728, "epoch": 2826} {"train_loss": -6.652334213256836, "global_step": 118729, "epoch": 2826} {"train_loss": -6.515028953552246, "global_step": 118730, "epoch": 2826} {"train_loss": -6.509228706359863, "global_step": 118731, "epoch": 2826} {"train_loss": -6.581228256225586, "global_step": 118732, "epoch": 2826} {"train_loss": -6.576901708330427, "global_step": 118733, "epoch": 2826, "val_loss": 76730.8359375} {"train_loss": -6.706393718719482, "global_step": 118734, "epoch": 2827} {"train_loss": -6.553006172180176, "global_step": 118735, "epoch": 2827} {"train_loss": -6.561373233795166, "global_step": 118736, "epoch": 2827} {"train_loss": -6.498645305633545, "global_step": 118737, "epoch": 2827} {"train_loss": -6.592658042907715, "global_step": 118738, "epoch": 2827} {"train_loss": -6.459730625152588, "global_step": 118739, "epoch": 2827} {"train_loss": -6.533290863037109, "global_step": 118740, "epoch": 2827} {"train_loss": -6.607553482055664, "global_step": 118741, "epoch": 2827} {"train_loss": -6.5631303787231445, "global_step": 118742, "epoch": 2827} {"train_loss": -6.477655410766602, "global_step": 118743, "epoch": 2827} {"train_loss": -6.607990264892578, "global_step": 118744, "epoch": 2827} {"train_loss": -6.602740287780762, "global_step": 118745, "epoch": 2827} {"train_loss": -6.6149725914001465, "global_step": 118746, "epoch": 2827} {"train_loss": -6.342077732086182, "global_step": 118747, "epoch": 2827} {"train_loss": -6.509294509887695, "global_step": 118748, "epoch": 2827} {"train_loss": -6.544191837310791, "global_step": 118749, "epoch": 2827} {"train_loss": -6.495022773742676, "global_step": 118750, "epoch": 2827} {"train_loss": -6.523758888244629, "global_step": 118751, "epoch": 2827} {"train_loss": -6.58487606048584, "global_step": 118752, "epoch": 2827} {"train_loss": -6.608624458312988, "global_step": 118753, "epoch": 2827} {"train_loss": -6.63419246673584, "global_step": 118754, "epoch": 2827} {"train_loss": -6.553690433502197, "global_step": 118755, "epoch": 2827} {"train_loss": -6.518280029296875, "global_step": 118756, "epoch": 2827} {"train_loss": -6.5643486976623535, "global_step": 118757, "epoch": 2827} {"train_loss": -6.614208221435547, "global_step": 118758, "epoch": 2827} {"train_loss": -6.467230319976807, "global_step": 118759, "epoch": 2827} {"train_loss": -6.492120265960693, "global_step": 118760, "epoch": 2827} {"train_loss": -6.435446262359619, "global_step": 118761, "epoch": 2827} {"train_loss": -6.587225437164307, "global_step": 118762, "epoch": 2827} {"train_loss": -6.5686211585998535, "global_step": 118763, "epoch": 2827} {"train_loss": -6.579336166381836, "global_step": 118764, "epoch": 2827} {"train_loss": -6.523894786834717, "global_step": 118765, "epoch": 2827} {"train_loss": -6.657412528991699, "global_step": 118766, "epoch": 2827} {"train_loss": -6.4933576583862305, "global_step": 118767, "epoch": 2827} {"train_loss": -6.521225929260254, "global_step": 118768, "epoch": 2827} {"train_loss": -6.725571632385254, "global_step": 118769, "epoch": 2827} {"train_loss": -6.50078821182251, "global_step": 118770, "epoch": 2827} {"train_loss": -6.613656997680664, "global_step": 118771, "epoch": 2827} {"train_loss": -6.549652099609375, "global_step": 118772, "epoch": 2827} {"train_loss": -6.467962265014648, "global_step": 118773, "epoch": 2827} {"train_loss": -6.61054801940918, "global_step": 118774, "epoch": 2827} {"train_loss": -6.555014928181966, "global_step": 118775, "epoch": 2827, "val_loss": 76627.5859375} {"train_loss": -6.539675235748291, "global_step": 118776, "epoch": 2828} {"train_loss": -6.646159648895264, "global_step": 118777, "epoch": 2828} {"train_loss": -6.539162635803223, "global_step": 118778, "epoch": 2828} {"train_loss": -6.507324695587158, "global_step": 118779, "epoch": 2828} {"train_loss": -6.5165181159973145, "global_step": 118780, "epoch": 2828} {"train_loss": -6.583926200866699, "global_step": 118781, "epoch": 2828} {"train_loss": -6.596685409545898, "global_step": 118782, "epoch": 2828} {"train_loss": -6.530526161193848, "global_step": 118783, "epoch": 2828} {"train_loss": -6.618363857269287, "global_step": 118784, "epoch": 2828} {"train_loss": -6.519298553466797, "global_step": 118785, "epoch": 2828} {"train_loss": -6.521467208862305, "global_step": 118786, "epoch": 2828} {"train_loss": -6.547978401184082, "global_step": 118787, "epoch": 2828} {"train_loss": -6.463459014892578, "global_step": 118788, "epoch": 2828} {"train_loss": -6.757329940795898, "global_step": 118789, "epoch": 2828} {"train_loss": -6.611103534698486, "global_step": 118790, "epoch": 2828} {"train_loss": -6.632659912109375, "global_step": 118791, "epoch": 2828} {"train_loss": -6.542819976806641, "global_step": 118792, "epoch": 2828} {"train_loss": -6.5525712966918945, "global_step": 118793, "epoch": 2828} {"train_loss": -6.608601093292236, "global_step": 118794, "epoch": 2828} {"train_loss": -6.556018352508545, "global_step": 118795, "epoch": 2828} {"train_loss": -6.566091537475586, "global_step": 118796, "epoch": 2828} {"train_loss": -6.595571517944336, "global_step": 118797, "epoch": 2828} {"train_loss": -6.566317558288574, "global_step": 118798, "epoch": 2828} {"train_loss": -6.422969818115234, "global_step": 118799, "epoch": 2828} {"train_loss": -6.543431282043457, "global_step": 118800, "epoch": 2828} {"train_loss": -6.560327529907227, "global_step": 118801, "epoch": 2828} {"train_loss": -6.64523983001709, "global_step": 118802, "epoch": 2828} {"train_loss": -6.5554022789001465, "global_step": 118803, "epoch": 2828} {"train_loss": -6.624490737915039, "global_step": 118804, "epoch": 2828} {"train_loss": -6.602437973022461, "global_step": 118805, "epoch": 2828} {"train_loss": -6.619102478027344, "global_step": 118806, "epoch": 2828} {"train_loss": -6.645021438598633, "global_step": 118807, "epoch": 2828} {"train_loss": -6.538052558898926, "global_step": 118808, "epoch": 2828} {"train_loss": -6.665681838989258, "global_step": 118809, "epoch": 2828} {"train_loss": -6.438623428344727, "global_step": 118810, "epoch": 2828} {"train_loss": -6.518494129180908, "global_step": 118811, "epoch": 2828} {"train_loss": -6.547411918640137, "global_step": 118812, "epoch": 2828} {"train_loss": -6.570400238037109, "global_step": 118813, "epoch": 2828} {"train_loss": -6.761809349060059, "global_step": 118814, "epoch": 2828} {"train_loss": -6.640345573425293, "global_step": 118815, "epoch": 2828} {"train_loss": -6.520087718963623, "global_step": 118816, "epoch": 2828} {"train_loss": -6.572723104840233, "global_step": 118817, "epoch": 2828, "val_loss": 76472.8515625} {"train_loss": -6.459835529327393, "global_step": 118818, "epoch": 2829} {"train_loss": -6.583146095275879, "global_step": 118819, "epoch": 2829} {"train_loss": -6.549430847167969, "global_step": 118820, "epoch": 2829} {"train_loss": -6.525696754455566, "global_step": 118821, "epoch": 2829} {"train_loss": -6.638086318969727, "global_step": 118822, "epoch": 2829} {"train_loss": -6.638006210327148, "global_step": 118823, "epoch": 2829} {"train_loss": -6.550172805786133, "global_step": 118824, "epoch": 2829} {"train_loss": -6.627165794372559, "global_step": 118825, "epoch": 2829} {"train_loss": -6.5883588790893555, "global_step": 118826, "epoch": 2829} {"train_loss": -6.600588798522949, "global_step": 118827, "epoch": 2829} {"train_loss": -6.598339080810547, "global_step": 118828, "epoch": 2829} {"train_loss": -6.569965839385986, "global_step": 118829, "epoch": 2829} {"train_loss": -6.640807151794434, "global_step": 118830, "epoch": 2829} {"train_loss": -6.550850868225098, "global_step": 118831, "epoch": 2829} {"train_loss": -6.675948143005371, "global_step": 118832, "epoch": 2829} {"train_loss": -6.703690528869629, "global_step": 118833, "epoch": 2829} {"train_loss": -6.5853376388549805, "global_step": 118834, "epoch": 2829} {"train_loss": -6.561938285827637, "global_step": 118835, "epoch": 2829} {"train_loss": -6.60737943649292, "global_step": 118836, "epoch": 2829} {"train_loss": -6.628878116607666, "global_step": 118837, "epoch": 2829} {"train_loss": -6.679603576660156, "global_step": 118838, "epoch": 2829} {"train_loss": -6.627881050109863, "global_step": 118839, "epoch": 2829} {"train_loss": -6.487790107727051, "global_step": 118840, "epoch": 2829} {"train_loss": -6.517941474914551, "global_step": 118841, "epoch": 2829} {"train_loss": -6.4356255531311035, "global_step": 118842, "epoch": 2829} {"train_loss": -6.487744331359863, "global_step": 118843, "epoch": 2829} {"train_loss": -6.564521789550781, "global_step": 118844, "epoch": 2829} {"train_loss": -6.5129594802856445, "global_step": 118845, "epoch": 2829} {"train_loss": -6.61949348449707, "global_step": 118846, "epoch": 2829} {"train_loss": -6.577888488769531, "global_step": 118847, "epoch": 2829} {"train_loss": -6.48539924621582, "global_step": 118848, "epoch": 2829} {"train_loss": -6.550691604614258, "global_step": 118849, "epoch": 2829} {"train_loss": -6.4892120361328125, "global_step": 118850, "epoch": 2829} {"train_loss": -6.587411403656006, "global_step": 118851, "epoch": 2829} {"train_loss": -6.589756965637207, "global_step": 118852, "epoch": 2829} {"train_loss": -6.538595199584961, "global_step": 118853, "epoch": 2829} {"train_loss": -6.634765625, "global_step": 118854, "epoch": 2829} {"train_loss": -6.504976272583008, "global_step": 118855, "epoch": 2829} {"train_loss": -6.39676570892334, "global_step": 118856, "epoch": 2829} {"train_loss": -6.626948356628418, "global_step": 118857, "epoch": 2829} {"train_loss": -6.562894821166992, "global_step": 118858, "epoch": 2829} {"train_loss": -6.567659559704008, "global_step": 118859, "epoch": 2829, "val_loss": 76941.484375} {"train_loss": -6.579401969909668, "global_step": 118860, "epoch": 2830} {"train_loss": -6.539748191833496, "global_step": 118861, "epoch": 2830} {"train_loss": -6.581419944763184, "global_step": 118862, "epoch": 2830} {"train_loss": -6.5495758056640625, "global_step": 118863, "epoch": 2830} {"train_loss": -6.60414457321167, "global_step": 118864, "epoch": 2830} {"train_loss": -6.48876953125, "global_step": 118865, "epoch": 2830} {"train_loss": -6.385168552398682, "global_step": 118866, "epoch": 2830} {"train_loss": -6.486256122589111, "global_step": 118867, "epoch": 2830} {"train_loss": -6.627791404724121, "global_step": 118868, "epoch": 2830} {"train_loss": -6.575234413146973, "global_step": 118869, "epoch": 2830} {"train_loss": -6.444153785705566, "global_step": 118870, "epoch": 2830} {"train_loss": -6.588914394378662, "global_step": 118871, "epoch": 2830} {"train_loss": -6.4698591232299805, "global_step": 118872, "epoch": 2830} {"train_loss": -6.57681941986084, "global_step": 118873, "epoch": 2830} {"train_loss": -6.475523948669434, "global_step": 118874, "epoch": 2830} {"train_loss": -6.596868991851807, "global_step": 118875, "epoch": 2830} {"train_loss": -6.627364158630371, "global_step": 118876, "epoch": 2830} {"train_loss": -6.441403388977051, "global_step": 118877, "epoch": 2830} {"train_loss": -6.58717679977417, "global_step": 118878, "epoch": 2830} {"train_loss": -6.48946475982666, "global_step": 118879, "epoch": 2830} {"train_loss": -6.497735500335693, "global_step": 118880, "epoch": 2830} {"train_loss": -6.567384719848633, "global_step": 118881, "epoch": 2830} {"train_loss": -6.523287296295166, "global_step": 118882, "epoch": 2830} {"train_loss": -6.55948543548584, "global_step": 118883, "epoch": 2830} {"train_loss": -6.584676742553711, "global_step": 118884, "epoch": 2830} {"train_loss": -6.571005821228027, "global_step": 118885, "epoch": 2830} {"train_loss": -6.544157981872559, "global_step": 118886, "epoch": 2830} {"train_loss": -6.523558139801025, "global_step": 118887, "epoch": 2830} {"train_loss": -6.506438732147217, "global_step": 118888, "epoch": 2830} {"train_loss": -6.507863998413086, "global_step": 118889, "epoch": 2830} {"train_loss": -6.574202060699463, "global_step": 118890, "epoch": 2830} {"train_loss": -6.559089660644531, "global_step": 118891, "epoch": 2830} {"train_loss": -6.441202640533447, "global_step": 118892, "epoch": 2830} {"train_loss": -6.523438930511475, "global_step": 118893, "epoch": 2830} {"train_loss": -6.555988311767578, "global_step": 118894, "epoch": 2830} {"train_loss": -6.518704414367676, "global_step": 118895, "epoch": 2830} {"train_loss": -6.522719383239746, "global_step": 118896, "epoch": 2830} {"train_loss": -6.503792762756348, "global_step": 118897, "epoch": 2830} {"train_loss": -6.500361919403076, "global_step": 118898, "epoch": 2830} {"train_loss": -6.529097557067871, "global_step": 118899, "epoch": 2830} {"train_loss": -6.545600891113281, "global_step": 118900, "epoch": 2830} {"train_loss": -6.532842284157162, "global_step": 118901, "epoch": 2830, "val_loss": 76739.1484375} {"train_loss": -6.51423454284668, "global_step": 118902, "epoch": 2831} {"train_loss": -6.664254665374756, "global_step": 118903, "epoch": 2831} {"train_loss": -6.618647575378418, "global_step": 118904, "epoch": 2831} {"train_loss": -6.569820404052734, "global_step": 118905, "epoch": 2831} {"train_loss": -6.515703201293945, "global_step": 118906, "epoch": 2831} {"train_loss": -6.655665397644043, "global_step": 118907, "epoch": 2831} {"train_loss": -6.526494026184082, "global_step": 118908, "epoch": 2831} {"train_loss": -6.632565498352051, "global_step": 118909, "epoch": 2831} {"train_loss": -6.546989917755127, "global_step": 118910, "epoch": 2831} {"train_loss": -6.48561954498291, "global_step": 118911, "epoch": 2831} {"train_loss": -6.591707706451416, "global_step": 118912, "epoch": 2831} {"train_loss": -6.56959867477417, "global_step": 118913, "epoch": 2831} {"train_loss": -6.423273086547852, "global_step": 118914, "epoch": 2831} {"train_loss": -6.520679950714111, "global_step": 118915, "epoch": 2831} {"train_loss": -6.506505966186523, "global_step": 118916, "epoch": 2831} {"train_loss": -6.449719429016113, "global_step": 118917, "epoch": 2831} {"train_loss": -6.412182807922363, "global_step": 118918, "epoch": 2831} {"train_loss": -6.687835693359375, "global_step": 118919, "epoch": 2831} {"train_loss": -6.524763107299805, "global_step": 118920, "epoch": 2831} {"train_loss": -6.581972122192383, "global_step": 118921, "epoch": 2831} {"train_loss": -6.424892425537109, "global_step": 118922, "epoch": 2831} {"train_loss": -6.454603672027588, "global_step": 118923, "epoch": 2831} {"train_loss": -6.476977348327637, "global_step": 118924, "epoch": 2831} {"train_loss": -6.400200843811035, "global_step": 118925, "epoch": 2831} {"train_loss": -6.599817752838135, "global_step": 118926, "epoch": 2831} {"train_loss": -6.37299919128418, "global_step": 118927, "epoch": 2831} {"train_loss": -6.55265998840332, "global_step": 118928, "epoch": 2831} {"train_loss": -6.649312973022461, "global_step": 118929, "epoch": 2831} {"train_loss": -6.62809944152832, "global_step": 118930, "epoch": 2831} {"train_loss": -6.5310587882995605, "global_step": 118931, "epoch": 2831} {"train_loss": -6.626396179199219, "global_step": 118932, "epoch": 2831} {"train_loss": -6.493002891540527, "global_step": 118933, "epoch": 2831} {"train_loss": -6.574262619018555, "global_step": 118934, "epoch": 2831} {"train_loss": -6.567404747009277, "global_step": 118935, "epoch": 2831} {"train_loss": -6.424935817718506, "global_step": 118936, "epoch": 2831} {"train_loss": -6.485002517700195, "global_step": 118937, "epoch": 2831} {"train_loss": -6.609211444854736, "global_step": 118938, "epoch": 2831} {"train_loss": -6.535430908203125, "global_step": 118939, "epoch": 2831} {"train_loss": -6.555657386779785, "global_step": 118940, "epoch": 2831} {"train_loss": -6.416487216949463, "global_step": 118941, "epoch": 2831} {"train_loss": -6.414907455444336, "global_step": 118942, "epoch": 2831} {"train_loss": -6.532882906141735, "global_step": 118943, "epoch": 2831, "val_loss": 77181.4296875} {"train_loss": -6.531363487243652, "global_step": 118944, "epoch": 2832} {"train_loss": -6.483269691467285, "global_step": 118945, "epoch": 2832} {"train_loss": -6.493823051452637, "global_step": 118946, "epoch": 2832} {"train_loss": -6.5776777267456055, "global_step": 118947, "epoch": 2832} {"train_loss": -6.531010627746582, "global_step": 118948, "epoch": 2832} {"train_loss": -6.487443923950195, "global_step": 118949, "epoch": 2832} {"train_loss": -6.529500484466553, "global_step": 118950, "epoch": 2832} {"train_loss": -6.490658283233643, "global_step": 118951, "epoch": 2832} {"train_loss": -6.463135242462158, "global_step": 118952, "epoch": 2832} {"train_loss": -6.594865322113037, "global_step": 118953, "epoch": 2832} {"train_loss": -6.620055675506592, "global_step": 118954, "epoch": 2832} {"train_loss": -6.685202598571777, "global_step": 118955, "epoch": 2832} {"train_loss": -6.608242988586426, "global_step": 118956, "epoch": 2832} {"train_loss": -6.659695148468018, "global_step": 118957, "epoch": 2832} {"train_loss": -6.5391435623168945, "global_step": 118958, "epoch": 2832} {"train_loss": -6.667352199554443, "global_step": 118959, "epoch": 2832} {"train_loss": -6.580606937408447, "global_step": 118960, "epoch": 2832} {"train_loss": -6.5855817794799805, "global_step": 118961, "epoch": 2832} {"train_loss": -6.628006935119629, "global_step": 118962, "epoch": 2832} {"train_loss": -6.526486396789551, "global_step": 118963, "epoch": 2832} {"train_loss": -6.65285587310791, "global_step": 118964, "epoch": 2832} {"train_loss": -6.677563190460205, "global_step": 118965, "epoch": 2832} {"train_loss": -6.649990081787109, "global_step": 118966, "epoch": 2832} {"train_loss": -6.581486701965332, "global_step": 118967, "epoch": 2832} {"train_loss": -6.488393783569336, "global_step": 118968, "epoch": 2832} {"train_loss": -6.627749443054199, "global_step": 118969, "epoch": 2832} {"train_loss": -6.637270450592041, "global_step": 118970, "epoch": 2832} {"train_loss": -6.531526565551758, "global_step": 118971, "epoch": 2832} {"train_loss": -6.477930545806885, "global_step": 118972, "epoch": 2832} {"train_loss": -6.523409843444824, "global_step": 118973, "epoch": 2832} {"train_loss": -6.480737686157227, "global_step": 118974, "epoch": 2832} {"train_loss": -6.612199783325195, "global_step": 118975, "epoch": 2832} {"train_loss": -6.7018022537231445, "global_step": 118976, "epoch": 2832} {"train_loss": -6.552403450012207, "global_step": 118977, "epoch": 2832} {"train_loss": -6.5603132247924805, "global_step": 118978, "epoch": 2832} {"train_loss": -6.549960613250732, "global_step": 118979, "epoch": 2832} {"train_loss": -6.521884918212891, "global_step": 118980, "epoch": 2832} {"train_loss": -6.534999847412109, "global_step": 118981, "epoch": 2832} {"train_loss": -6.54628849029541, "global_step": 118982, "epoch": 2832} {"train_loss": -6.419873237609863, "global_step": 118983, "epoch": 2832} {"train_loss": -6.611932754516602, "global_step": 118984, "epoch": 2832} {"train_loss": -6.564933243251982, "global_step": 118985, "epoch": 2832, "val_loss": 76917.3046875} {"train_loss": -6.513824462890625, "global_step": 118986, "epoch": 2833} {"train_loss": -6.4644317626953125, "global_step": 118987, "epoch": 2833} {"train_loss": -6.581348419189453, "global_step": 118988, "epoch": 2833} {"train_loss": -6.528685569763184, "global_step": 118989, "epoch": 2833} {"train_loss": -6.621335983276367, "global_step": 118990, "epoch": 2833} {"train_loss": -6.440757751464844, "global_step": 118991, "epoch": 2833} {"train_loss": -6.586958885192871, "global_step": 118992, "epoch": 2833} {"train_loss": -6.6108245849609375, "global_step": 118993, "epoch": 2833} {"train_loss": -6.532626628875732, "global_step": 118994, "epoch": 2833} {"train_loss": -6.653074264526367, "global_step": 118995, "epoch": 2833} {"train_loss": -6.570269584655762, "global_step": 118996, "epoch": 2833} {"train_loss": -6.626233100891113, "global_step": 118997, "epoch": 2833} {"train_loss": -6.4654083251953125, "global_step": 118998, "epoch": 2833} {"train_loss": -6.421163558959961, "global_step": 118999, "epoch": 2833} {"train_loss": -6.581645965576172, "global_step": 119000, "epoch": 2833} {"train_loss": -6.640556335449219, "global_step": 119001, "epoch": 2833} {"train_loss": -6.466590881347656, "global_step": 119002, "epoch": 2833} {"train_loss": -6.54719352722168, "global_step": 119003, "epoch": 2833} {"train_loss": -6.561968803405762, "global_step": 119004, "epoch": 2833} {"train_loss": -6.556051254272461, "global_step": 119005, "epoch": 2833} {"train_loss": -6.698651313781738, "global_step": 119006, "epoch": 2833} {"train_loss": -6.501137733459473, "global_step": 119007, "epoch": 2833} {"train_loss": -6.660224914550781, "global_step": 119008, "epoch": 2833} {"train_loss": -6.451254844665527, "global_step": 119009, "epoch": 2833} {"train_loss": -6.56315803527832, "global_step": 119010, "epoch": 2833} {"train_loss": -6.615184783935547, "global_step": 119011, "epoch": 2833} {"train_loss": -6.474299430847168, "global_step": 119012, "epoch": 2833} {"train_loss": -6.473730087280273, "global_step": 119013, "epoch": 2833} {"train_loss": -6.5461835861206055, "global_step": 119014, "epoch": 2833} {"train_loss": -6.555675506591797, "global_step": 119015, "epoch": 2833} {"train_loss": -6.557219505310059, "global_step": 119016, "epoch": 2833} {"train_loss": -6.459757328033447, "global_step": 119017, "epoch": 2833} {"train_loss": -6.522599220275879, "global_step": 119018, "epoch": 2833} {"train_loss": -6.53984260559082, "global_step": 119019, "epoch": 2833} {"train_loss": -6.538387775421143, "global_step": 119020, "epoch": 2833} {"train_loss": -6.558487892150879, "global_step": 119021, "epoch": 2833} {"train_loss": -6.674764633178711, "global_step": 119022, "epoch": 2833} {"train_loss": -6.535691738128662, "global_step": 119023, "epoch": 2833} {"train_loss": -6.550843238830566, "global_step": 119024, "epoch": 2833} {"train_loss": -6.616655349731445, "global_step": 119025, "epoch": 2833} {"train_loss": -6.557776927947998, "global_step": 119026, "epoch": 2833} {"train_loss": -6.553663140251523, "global_step": 119027, "epoch": 2833, "val_loss": 76971.3203125} {"train_loss": -6.6584577560424805, "global_step": 119028, "epoch": 2834} {"train_loss": -6.635973930358887, "global_step": 119029, "epoch": 2834} {"train_loss": -6.602516174316406, "global_step": 119030, "epoch": 2834} {"train_loss": -6.643340110778809, "global_step": 119031, "epoch": 2834} {"train_loss": -6.593194961547852, "global_step": 119032, "epoch": 2834} {"train_loss": -6.7218475341796875, "global_step": 119033, "epoch": 2834} {"train_loss": -6.527874946594238, "global_step": 119034, "epoch": 2834} {"train_loss": -6.6016154289245605, "global_step": 119035, "epoch": 2834} {"train_loss": -6.597126483917236, "global_step": 119036, "epoch": 2834} {"train_loss": -6.611227035522461, "global_step": 119037, "epoch": 2834} {"train_loss": -6.63761568069458, "global_step": 119038, "epoch": 2834} {"train_loss": -6.456165313720703, "global_step": 119039, "epoch": 2834} {"train_loss": -6.582480430603027, "global_step": 119040, "epoch": 2834} {"train_loss": -6.590305805206299, "global_step": 119041, "epoch": 2834} {"train_loss": -6.5202484130859375, "global_step": 119042, "epoch": 2834} {"train_loss": -6.576291561126709, "global_step": 119043, "epoch": 2834} {"train_loss": -6.581734657287598, "global_step": 119044, "epoch": 2834} {"train_loss": -6.437566757202148, "global_step": 119045, "epoch": 2834} {"train_loss": -6.544624328613281, "global_step": 119046, "epoch": 2834} {"train_loss": -6.543048858642578, "global_step": 119047, "epoch": 2834} {"train_loss": -6.551612377166748, "global_step": 119048, "epoch": 2834} {"train_loss": -6.465858459472656, "global_step": 119049, "epoch": 2834} {"train_loss": -6.543705463409424, "global_step": 119050, "epoch": 2834} {"train_loss": -6.660103797912598, "global_step": 119051, "epoch": 2834} {"train_loss": -6.56021785736084, "global_step": 119052, "epoch": 2834} {"train_loss": -6.587979316711426, "global_step": 119053, "epoch": 2834} {"train_loss": -6.511665344238281, "global_step": 119054, "epoch": 2834} {"train_loss": -6.468523025512695, "global_step": 119055, "epoch": 2834} {"train_loss": -6.494377136230469, "global_step": 119056, "epoch": 2834} {"train_loss": -6.659804344177246, "global_step": 119057, "epoch": 2834} {"train_loss": -6.477616310119629, "global_step": 119058, "epoch": 2834} {"train_loss": -6.512463569641113, "global_step": 119059, "epoch": 2834} {"train_loss": -6.495877265930176, "global_step": 119060, "epoch": 2834} {"train_loss": -6.479759216308594, "global_step": 119061, "epoch": 2834} {"train_loss": -6.506566047668457, "global_step": 119062, "epoch": 2834} {"train_loss": -6.5972442626953125, "global_step": 119063, "epoch": 2834} {"train_loss": -6.543635368347168, "global_step": 119064, "epoch": 2834} {"train_loss": -6.4235992431640625, "global_step": 119065, "epoch": 2834} {"train_loss": -6.459038734436035, "global_step": 119066, "epoch": 2834} {"train_loss": -6.5920491218566895, "global_step": 119067, "epoch": 2834} {"train_loss": -6.532196044921875, "global_step": 119068, "epoch": 2834} {"train_loss": -6.552872850781395, "global_step": 119069, "epoch": 2834, "val_loss": 76851.4609375} {"train_loss": -6.43488883972168, "global_step": 119070, "epoch": 2835} {"train_loss": -6.387899398803711, "global_step": 119071, "epoch": 2835} {"train_loss": -6.354045867919922, "global_step": 119072, "epoch": 2835} {"train_loss": -6.446519374847412, "global_step": 119073, "epoch": 2835} {"train_loss": -6.487136363983154, "global_step": 119074, "epoch": 2835} {"train_loss": -6.605963706970215, "global_step": 119075, "epoch": 2835} {"train_loss": -6.462647914886475, "global_step": 119076, "epoch": 2835} {"train_loss": -6.551465034484863, "global_step": 119077, "epoch": 2835} {"train_loss": -6.538897514343262, "global_step": 119078, "epoch": 2835} {"train_loss": -6.53081750869751, "global_step": 119079, "epoch": 2835} {"train_loss": -6.554775238037109, "global_step": 119080, "epoch": 2835} {"train_loss": -6.352817058563232, "global_step": 119081, "epoch": 2835} {"train_loss": -6.612041473388672, "global_step": 119082, "epoch": 2835} {"train_loss": -6.5585432052612305, "global_step": 119083, "epoch": 2835} {"train_loss": -6.478206157684326, "global_step": 119084, "epoch": 2835} {"train_loss": -6.67742395401001, "global_step": 119085, "epoch": 2835} {"train_loss": -6.532589435577393, "global_step": 119086, "epoch": 2835} {"train_loss": -6.54545783996582, "global_step": 119087, "epoch": 2835} {"train_loss": -6.5862627029418945, "global_step": 119088, "epoch": 2835} {"train_loss": -6.474946975708008, "global_step": 119089, "epoch": 2835} {"train_loss": -6.568855285644531, "global_step": 119090, "epoch": 2835} {"train_loss": -6.512058258056641, "global_step": 119091, "epoch": 2835} {"train_loss": -6.526684761047363, "global_step": 119092, "epoch": 2835} {"train_loss": -6.672726631164551, "global_step": 119093, "epoch": 2835} {"train_loss": -6.491813659667969, "global_step": 119094, "epoch": 2835} {"train_loss": -6.642549991607666, "global_step": 119095, "epoch": 2835} {"train_loss": -6.58985710144043, "global_step": 119096, "epoch": 2835} {"train_loss": -6.5655951499938965, "global_step": 119097, "epoch": 2835} {"train_loss": -6.6982269287109375, "global_step": 119098, "epoch": 2835} {"train_loss": -6.606998920440674, "global_step": 119099, "epoch": 2835} {"train_loss": -6.646657466888428, "global_step": 119100, "epoch": 2835} {"train_loss": -6.566680908203125, "global_step": 119101, "epoch": 2835} {"train_loss": -6.4681196212768555, "global_step": 119102, "epoch": 2835} {"train_loss": -6.640761375427246, "global_step": 119103, "epoch": 2835} {"train_loss": -6.6341142654418945, "global_step": 119104, "epoch": 2835} {"train_loss": -6.460630416870117, "global_step": 119105, "epoch": 2835} {"train_loss": -6.526346683502197, "global_step": 119106, "epoch": 2835} {"train_loss": -6.515113830566406, "global_step": 119107, "epoch": 2835} {"train_loss": -6.537487030029297, "global_step": 119108, "epoch": 2835} {"train_loss": -6.64555549621582, "global_step": 119109, "epoch": 2835} {"train_loss": -6.561757564544678, "global_step": 119110, "epoch": 2835} {"train_loss": -6.543694053377424, "global_step": 119111, "epoch": 2835, "val_loss": 76654.171875} {"train_loss": -6.652848243713379, "global_step": 119112, "epoch": 2836} {"train_loss": -6.455878257751465, "global_step": 119113, "epoch": 2836} {"train_loss": -6.496482849121094, "global_step": 119114, "epoch": 2836} {"train_loss": -6.57051420211792, "global_step": 119115, "epoch": 2836} {"train_loss": -6.459897518157959, "global_step": 119116, "epoch": 2836} {"train_loss": -6.598243713378906, "global_step": 119117, "epoch": 2836} {"train_loss": -6.706833839416504, "global_step": 119118, "epoch": 2836} {"train_loss": -6.608672142028809, "global_step": 119119, "epoch": 2836} {"train_loss": -6.629508018493652, "global_step": 119120, "epoch": 2836} {"train_loss": -6.696619033813477, "global_step": 119121, "epoch": 2836} {"train_loss": -6.589023590087891, "global_step": 119122, "epoch": 2836} {"train_loss": -6.6476030349731445, "global_step": 119123, "epoch": 2836} {"train_loss": -6.621827125549316, "global_step": 119124, "epoch": 2836} {"train_loss": -6.545482635498047, "global_step": 119125, "epoch": 2836} {"train_loss": -6.583165168762207, "global_step": 119126, "epoch": 2836} {"train_loss": -6.682604789733887, "global_step": 119127, "epoch": 2836} {"train_loss": -6.601151466369629, "global_step": 119128, "epoch": 2836} {"train_loss": -6.771864891052246, "global_step": 119129, "epoch": 2836} {"train_loss": -6.5378265380859375, "global_step": 119130, "epoch": 2836} {"train_loss": -6.746726036071777, "global_step": 119131, "epoch": 2836} {"train_loss": -6.63376522064209, "global_step": 119132, "epoch": 2836} {"train_loss": -6.53620719909668, "global_step": 119133, "epoch": 2836} {"train_loss": -6.534740447998047, "global_step": 119134, "epoch": 2836} {"train_loss": -6.593517303466797, "global_step": 119135, "epoch": 2836} {"train_loss": -6.75341796875, "global_step": 119136, "epoch": 2836} {"train_loss": -6.509109020233154, "global_step": 119137, "epoch": 2836} {"train_loss": -6.549683570861816, "global_step": 119138, "epoch": 2836} {"train_loss": -6.43480920791626, "global_step": 119139, "epoch": 2836} {"train_loss": -6.557635307312012, "global_step": 119140, "epoch": 2836} {"train_loss": -6.508396148681641, "global_step": 119141, "epoch": 2836} {"train_loss": -6.545855522155762, "global_step": 119142, "epoch": 2836} {"train_loss": -6.498818397521973, "global_step": 119143, "epoch": 2836} {"train_loss": -6.496472358703613, "global_step": 119144, "epoch": 2836} {"train_loss": -6.570595741271973, "global_step": 119145, "epoch": 2836} {"train_loss": -6.529377460479736, "global_step": 119146, "epoch": 2836} {"train_loss": -6.610227584838867, "global_step": 119147, "epoch": 2836} {"train_loss": -6.602545261383057, "global_step": 119148, "epoch": 2836} {"train_loss": -6.555065155029297, "global_step": 119149, "epoch": 2836} {"train_loss": -6.610605239868164, "global_step": 119150, "epoch": 2836} {"train_loss": -6.543604850769043, "global_step": 119151, "epoch": 2836} {"train_loss": -6.531712532043457, "global_step": 119152, "epoch": 2836} {"train_loss": -6.583471196038382, "global_step": 119153, "epoch": 2836, "val_loss": 76810.7421875} {"train_loss": -6.491745948791504, "global_step": 119154, "epoch": 2837} {"train_loss": -6.497567653656006, "global_step": 119155, "epoch": 2837} {"train_loss": -6.543398857116699, "global_step": 119156, "epoch": 2837} {"train_loss": -6.630128860473633, "global_step": 119157, "epoch": 2837} {"train_loss": -6.538795471191406, "global_step": 119158, "epoch": 2837} {"train_loss": -6.524888038635254, "global_step": 119159, "epoch": 2837} {"train_loss": -6.650297164916992, "global_step": 119160, "epoch": 2837} {"train_loss": -6.554974555969238, "global_step": 119161, "epoch": 2837} {"train_loss": -6.59074592590332, "global_step": 119162, "epoch": 2837} {"train_loss": -6.686593055725098, "global_step": 119163, "epoch": 2837} {"train_loss": -6.592627048492432, "global_step": 119164, "epoch": 2837} {"train_loss": -6.465560436248779, "global_step": 119165, "epoch": 2837} {"train_loss": -6.548835754394531, "global_step": 119166, "epoch": 2837} {"train_loss": -6.4735331535339355, "global_step": 119167, "epoch": 2837} {"train_loss": -6.564892768859863, "global_step": 119168, "epoch": 2837} {"train_loss": -6.631779670715332, "global_step": 119169, "epoch": 2837} {"train_loss": -6.463832855224609, "global_step": 119170, "epoch": 2837} {"train_loss": -6.489045143127441, "global_step": 119171, "epoch": 2837} {"train_loss": -6.631170272827148, "global_step": 119172, "epoch": 2837} {"train_loss": -6.5057148933410645, "global_step": 119173, "epoch": 2837} {"train_loss": -6.560794830322266, "global_step": 119174, "epoch": 2837} {"train_loss": -6.607966423034668, "global_step": 119175, "epoch": 2837} {"train_loss": -6.762333869934082, "global_step": 119176, "epoch": 2837} {"train_loss": -6.623184680938721, "global_step": 119177, "epoch": 2837} {"train_loss": -6.613417148590088, "global_step": 119178, "epoch": 2837} {"train_loss": -6.612597942352295, "global_step": 119179, "epoch": 2837} {"train_loss": -6.653162956237793, "global_step": 119180, "epoch": 2837} {"train_loss": -6.676943302154541, "global_step": 119181, "epoch": 2837} {"train_loss": -6.567181587219238, "global_step": 119182, "epoch": 2837} {"train_loss": -6.603999137878418, "global_step": 119183, "epoch": 2837} {"train_loss": -6.680552959442139, "global_step": 119184, "epoch": 2837} {"train_loss": -6.496171474456787, "global_step": 119185, "epoch": 2837} {"train_loss": -6.641017913818359, "global_step": 119186, "epoch": 2837} {"train_loss": -6.596233367919922, "global_step": 119187, "epoch": 2837} {"train_loss": -6.489065170288086, "global_step": 119188, "epoch": 2837} {"train_loss": -6.616390705108643, "global_step": 119189, "epoch": 2837} {"train_loss": -6.397500991821289, "global_step": 119190, "epoch": 2837} {"train_loss": -6.357460975646973, "global_step": 119191, "epoch": 2837} {"train_loss": -6.6433539390563965, "global_step": 119192, "epoch": 2837} {"train_loss": -6.400678634643555, "global_step": 119193, "epoch": 2837} {"train_loss": -6.447610855102539, "global_step": 119194, "epoch": 2837} {"train_loss": -6.563739787964594, "global_step": 119195, "epoch": 2837, "val_loss": 76886.046875} {"train_loss": -6.521675109863281, "global_step": 119196, "epoch": 2838} {"train_loss": -6.493496894836426, "global_step": 119197, "epoch": 2838} {"train_loss": -6.553267955780029, "global_step": 119198, "epoch": 2838} {"train_loss": -6.545882225036621, "global_step": 119199, "epoch": 2838} {"train_loss": -6.590970039367676, "global_step": 119200, "epoch": 2838} {"train_loss": -6.448752403259277, "global_step": 119201, "epoch": 2838} {"train_loss": -6.617358684539795, "global_step": 119202, "epoch": 2838} {"train_loss": -6.457742691040039, "global_step": 119203, "epoch": 2838} {"train_loss": -6.520847320556641, "global_step": 119204, "epoch": 2838} {"train_loss": -6.571010112762451, "global_step": 119205, "epoch": 2838} {"train_loss": -6.4541521072387695, "global_step": 119206, "epoch": 2838} {"train_loss": -6.433722019195557, "global_step": 119207, "epoch": 2838} {"train_loss": -6.654167175292969, "global_step": 119208, "epoch": 2838} {"train_loss": -6.549867630004883, "global_step": 119209, "epoch": 2838} {"train_loss": -6.3800482749938965, "global_step": 119210, "epoch": 2838} {"train_loss": -6.732361793518066, "global_step": 119211, "epoch": 2838} {"train_loss": -6.403264999389648, "global_step": 119212, "epoch": 2838} {"train_loss": -6.433666229248047, "global_step": 119213, "epoch": 2838} {"train_loss": -6.64223575592041, "global_step": 119214, "epoch": 2838} {"train_loss": -6.423630237579346, "global_step": 119215, "epoch": 2838} {"train_loss": -6.735573768615723, "global_step": 119216, "epoch": 2838} {"train_loss": -6.363610744476318, "global_step": 119217, "epoch": 2838} {"train_loss": -6.468084335327148, "global_step": 119218, "epoch": 2838} {"train_loss": -6.568357467651367, "global_step": 119219, "epoch": 2838} {"train_loss": -6.409572601318359, "global_step": 119220, "epoch": 2838} {"train_loss": -6.652016639709473, "global_step": 119221, "epoch": 2838} {"train_loss": -6.4607391357421875, "global_step": 119222, "epoch": 2838} {"train_loss": -6.4889960289001465, "global_step": 119223, "epoch": 2838} {"train_loss": -6.487381458282471, "global_step": 119224, "epoch": 2838} {"train_loss": -6.327862739562988, "global_step": 119225, "epoch": 2838} {"train_loss": -6.567471504211426, "global_step": 119226, "epoch": 2838} {"train_loss": -6.344443321228027, "global_step": 119227, "epoch": 2838} {"train_loss": -6.530141830444336, "global_step": 119228, "epoch": 2838} {"train_loss": -6.3806562423706055, "global_step": 119229, "epoch": 2838} {"train_loss": -6.462636947631836, "global_step": 119230, "epoch": 2838} {"train_loss": -6.52496862411499, "global_step": 119231, "epoch": 2838} {"train_loss": -6.3909807205200195, "global_step": 119232, "epoch": 2838} {"train_loss": -6.409721374511719, "global_step": 119233, "epoch": 2838} {"train_loss": -6.5033159255981445, "global_step": 119234, "epoch": 2838} {"train_loss": -6.544450283050537, "global_step": 119235, "epoch": 2838} {"train_loss": -6.414450645446777, "global_step": 119236, "epoch": 2838} {"train_loss": -6.500501871109009, "global_step": 119237, "epoch": 2838, "val_loss": 76578.0390625} {"train_loss": -6.444559097290039, "global_step": 119238, "epoch": 2839} {"train_loss": -6.572721004486084, "global_step": 119239, "epoch": 2839} {"train_loss": -6.4463114738464355, "global_step": 119240, "epoch": 2839} {"train_loss": -6.589962005615234, "global_step": 119241, "epoch": 2839} {"train_loss": -6.599343776702881, "global_step": 119242, "epoch": 2839} {"train_loss": -6.460208892822266, "global_step": 119243, "epoch": 2839} {"train_loss": -6.613207817077637, "global_step": 119244, "epoch": 2839} {"train_loss": -6.4444074630737305, "global_step": 119245, "epoch": 2839} {"train_loss": -6.490365028381348, "global_step": 119246, "epoch": 2839} {"train_loss": -6.469614505767822, "global_step": 119247, "epoch": 2839} {"train_loss": -6.596807956695557, "global_step": 119248, "epoch": 2839} {"train_loss": -6.486584663391113, "global_step": 119249, "epoch": 2839} {"train_loss": -6.542098045349121, "global_step": 119250, "epoch": 2839} {"train_loss": -6.450298309326172, "global_step": 119251, "epoch": 2839} {"train_loss": -6.617155075073242, "global_step": 119252, "epoch": 2839} {"train_loss": -6.529963493347168, "global_step": 119253, "epoch": 2839} {"train_loss": -6.489199161529541, "global_step": 119254, "epoch": 2839} {"train_loss": -6.628719329833984, "global_step": 119255, "epoch": 2839} {"train_loss": -6.545636177062988, "global_step": 119256, "epoch": 2839} {"train_loss": -6.527331352233887, "global_step": 119257, "epoch": 2839} {"train_loss": -6.509228706359863, "global_step": 119258, "epoch": 2839} {"train_loss": -6.403697490692139, "global_step": 119259, "epoch": 2839} {"train_loss": -6.543265342712402, "global_step": 119260, "epoch": 2839} {"train_loss": -6.489738941192627, "global_step": 119261, "epoch": 2839} {"train_loss": -6.446221351623535, "global_step": 119262, "epoch": 2839} {"train_loss": -6.4163408279418945, "global_step": 119263, "epoch": 2839} {"train_loss": -6.433197498321533, "global_step": 119264, "epoch": 2839} {"train_loss": -6.547534465789795, "global_step": 119265, "epoch": 2839} {"train_loss": -6.525989055633545, "global_step": 119266, "epoch": 2839} {"train_loss": -6.563210964202881, "global_step": 119267, "epoch": 2839} {"train_loss": -6.460726261138916, "global_step": 119268, "epoch": 2839} {"train_loss": -6.6199846267700195, "global_step": 119269, "epoch": 2839} {"train_loss": -6.467212677001953, "global_step": 119270, "epoch": 2839} {"train_loss": -6.604961395263672, "global_step": 119271, "epoch": 2839} {"train_loss": -6.582221031188965, "global_step": 119272, "epoch": 2839} {"train_loss": -6.471934795379639, "global_step": 119273, "epoch": 2839} {"train_loss": -6.619525909423828, "global_step": 119274, "epoch": 2839} {"train_loss": -6.442050933837891, "global_step": 119275, "epoch": 2839} {"train_loss": -6.462482452392578, "global_step": 119276, "epoch": 2839} {"train_loss": -6.483369827270508, "global_step": 119277, "epoch": 2839} {"train_loss": -6.499504089355469, "global_step": 119278, "epoch": 2839} {"train_loss": -6.514079184759231, "global_step": 119279, "epoch": 2839, "val_loss": 76865.3671875} {"train_loss": -6.435639381408691, "global_step": 119280, "epoch": 2840} {"train_loss": -6.619075775146484, "global_step": 119281, "epoch": 2840} {"train_loss": -6.707260608673096, "global_step": 119282, "epoch": 2840} {"train_loss": -6.627119541168213, "global_step": 119283, "epoch": 2840} {"train_loss": -6.555142402648926, "global_step": 119284, "epoch": 2840} {"train_loss": -6.626002311706543, "global_step": 119285, "epoch": 2840} {"train_loss": -6.475368499755859, "global_step": 119286, "epoch": 2840} {"train_loss": -6.562039375305176, "global_step": 119287, "epoch": 2840} {"train_loss": -6.59217643737793, "global_step": 119288, "epoch": 2840} {"train_loss": -6.5419392585754395, "global_step": 119289, "epoch": 2840} {"train_loss": -6.52284049987793, "global_step": 119290, "epoch": 2840} {"train_loss": -6.577193260192871, "global_step": 119291, "epoch": 2840} {"train_loss": -6.697601795196533, "global_step": 119292, "epoch": 2840} {"train_loss": -6.719053745269775, "global_step": 119293, "epoch": 2840} {"train_loss": -6.476258754730225, "global_step": 119294, "epoch": 2840} {"train_loss": -6.649827480316162, "global_step": 119295, "epoch": 2840} {"train_loss": -6.421389579772949, "global_step": 119296, "epoch": 2840} {"train_loss": -6.512777328491211, "global_step": 119297, "epoch": 2840} {"train_loss": -6.427803993225098, "global_step": 119298, "epoch": 2840} {"train_loss": -6.600430488586426, "global_step": 119299, "epoch": 2840} {"train_loss": -6.500227451324463, "global_step": 119300, "epoch": 2840} {"train_loss": -6.35903263092041, "global_step": 119301, "epoch": 2840} {"train_loss": -6.557307720184326, "global_step": 119302, "epoch": 2840} {"train_loss": -6.484035491943359, "global_step": 119303, "epoch": 2840} {"train_loss": -6.5118327140808105, "global_step": 119304, "epoch": 2840} {"train_loss": -6.62376070022583, "global_step": 119305, "epoch": 2840} {"train_loss": -6.467207908630371, "global_step": 119306, "epoch": 2840} {"train_loss": -6.369439125061035, "global_step": 119307, "epoch": 2840} {"train_loss": -6.654758453369141, "global_step": 119308, "epoch": 2840} {"train_loss": -6.466817378997803, "global_step": 119309, "epoch": 2840} {"train_loss": -6.512164115905762, "global_step": 119310, "epoch": 2840} {"train_loss": -6.412997245788574, "global_step": 119311, "epoch": 2840} {"train_loss": -6.4747772216796875, "global_step": 119312, "epoch": 2840} {"train_loss": -6.451606750488281, "global_step": 119313, "epoch": 2840} {"train_loss": -6.430932521820068, "global_step": 119314, "epoch": 2840} {"train_loss": -6.534284591674805, "global_step": 119315, "epoch": 2840} {"train_loss": -6.461097240447998, "global_step": 119316, "epoch": 2840} {"train_loss": -6.605929374694824, "global_step": 119317, "epoch": 2840} {"train_loss": -6.364047050476074, "global_step": 119318, "epoch": 2840} {"train_loss": -6.514991760253906, "global_step": 119319, "epoch": 2840} {"train_loss": -6.54530143737793, "global_step": 119320, "epoch": 2840} {"train_loss": -6.5287601834251765, "global_step": 119321, "epoch": 2840, "val_loss": 76791.859375} {"train_loss": -6.530289173126221, "global_step": 119322, "epoch": 2841} {"train_loss": -6.647552490234375, "global_step": 119323, "epoch": 2841} {"train_loss": -6.547904014587402, "global_step": 119324, "epoch": 2841} {"train_loss": -6.591716766357422, "global_step": 119325, "epoch": 2841} {"train_loss": -6.522240161895752, "global_step": 119326, "epoch": 2841} {"train_loss": -6.5311713218688965, "global_step": 119327, "epoch": 2841} {"train_loss": -6.657611846923828, "global_step": 119328, "epoch": 2841} {"train_loss": -6.6340789794921875, "global_step": 119329, "epoch": 2841} {"train_loss": -6.60111141204834, "global_step": 119330, "epoch": 2841} {"train_loss": -6.523139953613281, "global_step": 119331, "epoch": 2841} {"train_loss": -6.620090007781982, "global_step": 119332, "epoch": 2841} {"train_loss": -6.5692138671875, "global_step": 119333, "epoch": 2841} {"train_loss": -6.620087146759033, "global_step": 119334, "epoch": 2841} {"train_loss": -6.65023136138916, "global_step": 119335, "epoch": 2841} {"train_loss": -6.60443639755249, "global_step": 119336, "epoch": 2841} {"train_loss": -6.594890594482422, "global_step": 119337, "epoch": 2841} {"train_loss": -6.746320724487305, "global_step": 119338, "epoch": 2841} {"train_loss": -6.614572525024414, "global_step": 119339, "epoch": 2841} {"train_loss": -6.5653276443481445, "global_step": 119340, "epoch": 2841} {"train_loss": -6.738438606262207, "global_step": 119341, "epoch": 2841} {"train_loss": -6.583488464355469, "global_step": 119342, "epoch": 2841} {"train_loss": -6.4851226806640625, "global_step": 119343, "epoch": 2841} {"train_loss": -6.482645511627197, "global_step": 119344, "epoch": 2841} {"train_loss": -6.63907527923584, "global_step": 119345, "epoch": 2841} {"train_loss": -6.582141876220703, "global_step": 119346, "epoch": 2841} {"train_loss": -6.556883811950684, "global_step": 119347, "epoch": 2841} {"train_loss": -6.540090560913086, "global_step": 119348, "epoch": 2841} {"train_loss": -6.501781463623047, "global_step": 119349, "epoch": 2841} {"train_loss": -6.677417755126953, "global_step": 119350, "epoch": 2841} {"train_loss": -6.652093887329102, "global_step": 119351, "epoch": 2841} {"train_loss": -6.5509796142578125, "global_step": 119352, "epoch": 2841} {"train_loss": -6.540581703186035, "global_step": 119353, "epoch": 2841} {"train_loss": -6.6124491691589355, "global_step": 119354, "epoch": 2841} {"train_loss": -6.656163692474365, "global_step": 119355, "epoch": 2841} {"train_loss": -6.549922943115234, "global_step": 119356, "epoch": 2841} {"train_loss": -6.402133941650391, "global_step": 119357, "epoch": 2841} {"train_loss": -6.568868637084961, "global_step": 119358, "epoch": 2841} {"train_loss": -6.607347011566162, "global_step": 119359, "epoch": 2841} {"train_loss": -6.553421974182129, "global_step": 119360, "epoch": 2841} {"train_loss": -6.584519386291504, "global_step": 119361, "epoch": 2841} {"train_loss": -6.641284942626953, "global_step": 119362, "epoch": 2841} {"train_loss": -6.586124817530314, "global_step": 119363, "epoch": 2841, "val_loss": 77109.6875} {"train_loss": -6.531820297241211, "global_step": 119364, "epoch": 2842} {"train_loss": -6.549696445465088, "global_step": 119365, "epoch": 2842} {"train_loss": -6.633297443389893, "global_step": 119366, "epoch": 2842} {"train_loss": -6.619977951049805, "global_step": 119367, "epoch": 2842} {"train_loss": -6.545217037200928, "global_step": 119368, "epoch": 2842} {"train_loss": -6.531918525695801, "global_step": 119369, "epoch": 2842} {"train_loss": -6.656216621398926, "global_step": 119370, "epoch": 2842} {"train_loss": -6.705419540405273, "global_step": 119371, "epoch": 2842} {"train_loss": -6.6544718742370605, "global_step": 119372, "epoch": 2842} {"train_loss": -6.557851791381836, "global_step": 119373, "epoch": 2842} {"train_loss": -6.584646224975586, "global_step": 119374, "epoch": 2842} {"train_loss": -6.652141571044922, "global_step": 119375, "epoch": 2842} {"train_loss": -6.7042012214660645, "global_step": 119376, "epoch": 2842} {"train_loss": -6.5065436363220215, "global_step": 119377, "epoch": 2842} {"train_loss": -6.487185955047607, "global_step": 119378, "epoch": 2842} {"train_loss": -6.605095863342285, "global_step": 119379, "epoch": 2842} {"train_loss": -6.629716396331787, "global_step": 119380, "epoch": 2842} {"train_loss": -6.623330116271973, "global_step": 119381, "epoch": 2842} {"train_loss": -6.522887229919434, "global_step": 119382, "epoch": 2842} {"train_loss": -6.589621543884277, "global_step": 119383, "epoch": 2842} {"train_loss": -6.6009674072265625, "global_step": 119384, "epoch": 2842} {"train_loss": -6.688246726989746, "global_step": 119385, "epoch": 2842} {"train_loss": -6.555825233459473, "global_step": 119386, "epoch": 2842} {"train_loss": -6.702259540557861, "global_step": 119387, "epoch": 2842} {"train_loss": -6.554078102111816, "global_step": 119388, "epoch": 2842} {"train_loss": -6.618054389953613, "global_step": 119389, "epoch": 2842} {"train_loss": -6.572508335113525, "global_step": 119390, "epoch": 2842} {"train_loss": -6.6561384201049805, "global_step": 119391, "epoch": 2842} {"train_loss": -6.71071195602417, "global_step": 119392, "epoch": 2842} {"train_loss": -6.666780471801758, "global_step": 119393, "epoch": 2842} {"train_loss": -6.587749481201172, "global_step": 119394, "epoch": 2842} {"train_loss": -6.557706832885742, "global_step": 119395, "epoch": 2842} {"train_loss": -6.570261001586914, "global_step": 119396, "epoch": 2842} {"train_loss": -6.544736862182617, "global_step": 119397, "epoch": 2842} {"train_loss": -6.566481113433838, "global_step": 119398, "epoch": 2842} {"train_loss": -6.563436508178711, "global_step": 119399, "epoch": 2842} {"train_loss": -6.597457408905029, "global_step": 119400, "epoch": 2842} {"train_loss": -6.568323135375977, "global_step": 119401, "epoch": 2842} {"train_loss": -6.570703506469727, "global_step": 119402, "epoch": 2842} {"train_loss": -6.5968499183654785, "global_step": 119403, "epoch": 2842} {"train_loss": -6.610408782958984, "global_step": 119404, "epoch": 2842} {"train_loss": -6.595364922568912, "global_step": 119405, "epoch": 2842, "val_loss": 76962.234375} {"train_loss": -6.7156662940979, "global_step": 119406, "epoch": 2843} {"train_loss": -6.5695390701293945, "global_step": 119407, "epoch": 2843} {"train_loss": -6.619312286376953, "global_step": 119408, "epoch": 2843} {"train_loss": -6.576529026031494, "global_step": 119409, "epoch": 2843} {"train_loss": -6.616666793823242, "global_step": 119410, "epoch": 2843} {"train_loss": -6.589262962341309, "global_step": 119411, "epoch": 2843} {"train_loss": -6.672213554382324, "global_step": 119412, "epoch": 2843} {"train_loss": -6.556375980377197, "global_step": 119413, "epoch": 2843} {"train_loss": -6.549416542053223, "global_step": 119414, "epoch": 2843} {"train_loss": -6.486300468444824, "global_step": 119415, "epoch": 2843} {"train_loss": -6.640355110168457, "global_step": 119416, "epoch": 2843} {"train_loss": -6.583213806152344, "global_step": 119417, "epoch": 2843} {"train_loss": -6.58846378326416, "global_step": 119418, "epoch": 2843} {"train_loss": -6.594000816345215, "global_step": 119419, "epoch": 2843} {"train_loss": -6.557955265045166, "global_step": 119420, "epoch": 2843} {"train_loss": -6.5258049964904785, "global_step": 119421, "epoch": 2843} {"train_loss": -6.61447286605835, "global_step": 119422, "epoch": 2843} {"train_loss": -6.605863571166992, "global_step": 119423, "epoch": 2843} {"train_loss": -6.5094757080078125, "global_step": 119424, "epoch": 2843} {"train_loss": -6.6333417892456055, "global_step": 119425, "epoch": 2843} {"train_loss": -6.640721321105957, "global_step": 119426, "epoch": 2843} {"train_loss": -6.570484161376953, "global_step": 119427, "epoch": 2843} {"train_loss": -6.562032699584961, "global_step": 119428, "epoch": 2843} {"train_loss": -6.559035301208496, "global_step": 119429, "epoch": 2843} {"train_loss": -6.553830146789551, "global_step": 119430, "epoch": 2843} {"train_loss": -6.482917785644531, "global_step": 119431, "epoch": 2843} {"train_loss": -6.5672926902771, "global_step": 119432, "epoch": 2843} {"train_loss": -6.615262031555176, "global_step": 119433, "epoch": 2843} {"train_loss": -6.689684867858887, "global_step": 119434, "epoch": 2843} {"train_loss": -6.4713826179504395, "global_step": 119435, "epoch": 2843} {"train_loss": -6.524421215057373, "global_step": 119436, "epoch": 2843} {"train_loss": -6.50485372543335, "global_step": 119437, "epoch": 2843} {"train_loss": -6.523594856262207, "global_step": 119438, "epoch": 2843} {"train_loss": -6.6167168617248535, "global_step": 119439, "epoch": 2843} {"train_loss": -6.572574615478516, "global_step": 119440, "epoch": 2843} {"train_loss": -6.660140514373779, "global_step": 119441, "epoch": 2843} {"train_loss": -6.544013023376465, "global_step": 119442, "epoch": 2843} {"train_loss": -6.566556930541992, "global_step": 119443, "epoch": 2843} {"train_loss": -6.44321346282959, "global_step": 119444, "epoch": 2843} {"train_loss": -6.588523864746094, "global_step": 119445, "epoch": 2843} {"train_loss": -6.575589179992676, "global_step": 119446, "epoch": 2843} {"train_loss": -6.5756644407908125, "global_step": 119447, "epoch": 2843, "val_loss": 76720.6484375} {"train_loss": -6.3896074295043945, "global_step": 119448, "epoch": 2844} {"train_loss": -6.426968097686768, "global_step": 119449, "epoch": 2844} {"train_loss": -6.513988971710205, "global_step": 119450, "epoch": 2844} {"train_loss": -6.640439510345459, "global_step": 119451, "epoch": 2844} {"train_loss": -6.601500988006592, "global_step": 119452, "epoch": 2844} {"train_loss": -6.486673831939697, "global_step": 119453, "epoch": 2844} {"train_loss": -6.405566215515137, "global_step": 119454, "epoch": 2844} {"train_loss": -6.427258491516113, "global_step": 119455, "epoch": 2844} {"train_loss": -6.404386520385742, "global_step": 119456, "epoch": 2844} {"train_loss": -6.605947017669678, "global_step": 119457, "epoch": 2844} {"train_loss": -6.528722763061523, "global_step": 119458, "epoch": 2844} {"train_loss": -6.579676151275635, "global_step": 119459, "epoch": 2844} {"train_loss": -6.437727928161621, "global_step": 119460, "epoch": 2844} {"train_loss": -6.340360164642334, "global_step": 119461, "epoch": 2844} {"train_loss": -6.443674564361572, "global_step": 119462, "epoch": 2844} {"train_loss": -6.349875450134277, "global_step": 119463, "epoch": 2844} {"train_loss": -6.513287544250488, "global_step": 119464, "epoch": 2844} {"train_loss": -6.473923206329346, "global_step": 119465, "epoch": 2844} {"train_loss": -6.390201091766357, "global_step": 119466, "epoch": 2844} {"train_loss": -6.446013450622559, "global_step": 119467, "epoch": 2844} {"train_loss": -6.644582748413086, "global_step": 119468, "epoch": 2844} {"train_loss": -6.555568218231201, "global_step": 119469, "epoch": 2844} {"train_loss": -6.465516090393066, "global_step": 119470, "epoch": 2844} {"train_loss": -6.469655990600586, "global_step": 119471, "epoch": 2844} {"train_loss": -6.485255241394043, "global_step": 119472, "epoch": 2844} {"train_loss": -6.530524253845215, "global_step": 119473, "epoch": 2844} {"train_loss": -6.5197882652282715, "global_step": 119474, "epoch": 2844} {"train_loss": -6.641902446746826, "global_step": 119475, "epoch": 2844} {"train_loss": -6.476962089538574, "global_step": 119476, "epoch": 2844} {"train_loss": -6.636204719543457, "global_step": 119477, "epoch": 2844} {"train_loss": -6.527428150177002, "global_step": 119478, "epoch": 2844} {"train_loss": -6.479562282562256, "global_step": 119479, "epoch": 2844} {"train_loss": -6.520185470581055, "global_step": 119480, "epoch": 2844} {"train_loss": -6.450822830200195, "global_step": 119481, "epoch": 2844} {"train_loss": -6.6494927406311035, "global_step": 119482, "epoch": 2844} {"train_loss": -6.5207743644714355, "global_step": 119483, "epoch": 2844} {"train_loss": -6.466916084289551, "global_step": 119484, "epoch": 2844} {"train_loss": -6.473094940185547, "global_step": 119485, "epoch": 2844} {"train_loss": -6.480908393859863, "global_step": 119486, "epoch": 2844} {"train_loss": -6.542915344238281, "global_step": 119487, "epoch": 2844} {"train_loss": -6.674351692199707, "global_step": 119488, "epoch": 2844} {"train_loss": -6.502223605201358, "global_step": 119489, "epoch": 2844, "val_loss": 76654.140625} {"train_loss": -6.569460868835449, "global_step": 119490, "epoch": 2845} {"train_loss": -6.431107521057129, "global_step": 119491, "epoch": 2845} {"train_loss": -6.561405181884766, "global_step": 119492, "epoch": 2845} {"train_loss": -6.606688499450684, "global_step": 119493, "epoch": 2845} {"train_loss": -6.524491786956787, "global_step": 119494, "epoch": 2845} {"train_loss": -6.6541972160339355, "global_step": 119495, "epoch": 2845} {"train_loss": -6.600458145141602, "global_step": 119496, "epoch": 2845} {"train_loss": -6.570696830749512, "global_step": 119497, "epoch": 2845} {"train_loss": -6.590633869171143, "global_step": 119498, "epoch": 2845} {"train_loss": -6.564752578735352, "global_step": 119499, "epoch": 2845} {"train_loss": -6.487548828125, "global_step": 119500, "epoch": 2845} {"train_loss": -6.598785877227783, "global_step": 119501, "epoch": 2845} {"train_loss": -6.5231122970581055, "global_step": 119502, "epoch": 2845} {"train_loss": -6.550870895385742, "global_step": 119503, "epoch": 2845} {"train_loss": -6.538993835449219, "global_step": 119504, "epoch": 2845} {"train_loss": -6.583495140075684, "global_step": 119505, "epoch": 2845} {"train_loss": -6.583622932434082, "global_step": 119506, "epoch": 2845} {"train_loss": -6.57295036315918, "global_step": 119507, "epoch": 2845} {"train_loss": -6.481806755065918, "global_step": 119508, "epoch": 2845} {"train_loss": -6.560079097747803, "global_step": 119509, "epoch": 2845} {"train_loss": -6.649004936218262, "global_step": 119510, "epoch": 2845} {"train_loss": -6.4098124504089355, "global_step": 119511, "epoch": 2845} {"train_loss": -6.512503623962402, "global_step": 119512, "epoch": 2845} {"train_loss": -6.562380790710449, "global_step": 119513, "epoch": 2845} {"train_loss": -6.503161430358887, "global_step": 119514, "epoch": 2845} {"train_loss": -6.580033302307129, "global_step": 119515, "epoch": 2845} {"train_loss": -6.4040937423706055, "global_step": 119516, "epoch": 2845} {"train_loss": -6.63630485534668, "global_step": 119517, "epoch": 2845} {"train_loss": -6.488903045654297, "global_step": 119518, "epoch": 2845} {"train_loss": -6.516274929046631, "global_step": 119519, "epoch": 2845} {"train_loss": -6.551462173461914, "global_step": 119520, "epoch": 2845} {"train_loss": -6.581049919128418, "global_step": 119521, "epoch": 2845} {"train_loss": -6.510461807250977, "global_step": 119522, "epoch": 2845} {"train_loss": -6.504235744476318, "global_step": 119523, "epoch": 2845} {"train_loss": -6.565441131591797, "global_step": 119524, "epoch": 2845} {"train_loss": -6.478775978088379, "global_step": 119525, "epoch": 2845} {"train_loss": -6.546442985534668, "global_step": 119526, "epoch": 2845} {"train_loss": -6.581921100616455, "global_step": 119527, "epoch": 2845} {"train_loss": -6.555416107177734, "global_step": 119528, "epoch": 2845} {"train_loss": -6.561318397521973, "global_step": 119529, "epoch": 2845} {"train_loss": -6.683260917663574, "global_step": 119530, "epoch": 2845} {"train_loss": -6.55030023484003, "global_step": 119531, "epoch": 2845, "val_loss": 77087.015625} {"train_loss": -6.561332702636719, "global_step": 119532, "epoch": 2846} {"train_loss": -6.642221450805664, "global_step": 119533, "epoch": 2846} {"train_loss": -6.645931243896484, "global_step": 119534, "epoch": 2846} {"train_loss": -6.598435401916504, "global_step": 119535, "epoch": 2846} {"train_loss": -6.539477348327637, "global_step": 119536, "epoch": 2846} {"train_loss": -6.631292819976807, "global_step": 119537, "epoch": 2846} {"train_loss": -6.570693016052246, "global_step": 119538, "epoch": 2846} {"train_loss": -6.460690498352051, "global_step": 119539, "epoch": 2846} {"train_loss": -6.605903625488281, "global_step": 119540, "epoch": 2846} {"train_loss": -6.597456932067871, "global_step": 119541, "epoch": 2846} {"train_loss": -6.518503665924072, "global_step": 119542, "epoch": 2846} {"train_loss": -6.786149978637695, "global_step": 119543, "epoch": 2846} {"train_loss": -6.616459846496582, "global_step": 119544, "epoch": 2846} {"train_loss": -6.666738510131836, "global_step": 119545, "epoch": 2846} {"train_loss": -6.523358345031738, "global_step": 119546, "epoch": 2846} {"train_loss": -6.605956077575684, "global_step": 119547, "epoch": 2846} {"train_loss": -6.553244590759277, "global_step": 119548, "epoch": 2846} {"train_loss": -6.747005462646484, "global_step": 119549, "epoch": 2846} {"train_loss": -6.717751502990723, "global_step": 119550, "epoch": 2846} {"train_loss": -6.612504959106445, "global_step": 119551, "epoch": 2846} {"train_loss": -6.5819926261901855, "global_step": 119552, "epoch": 2846} {"train_loss": -6.568375587463379, "global_step": 119553, "epoch": 2846} {"train_loss": -6.667976379394531, "global_step": 119554, "epoch": 2846} {"train_loss": -6.566556930541992, "global_step": 119555, "epoch": 2846} {"train_loss": -6.653748989105225, "global_step": 119556, "epoch": 2846} {"train_loss": -6.47067928314209, "global_step": 119557, "epoch": 2846} {"train_loss": -6.5173444747924805, "global_step": 119558, "epoch": 2846} {"train_loss": -6.381540298461914, "global_step": 119559, "epoch": 2846} {"train_loss": -6.547675609588623, "global_step": 119560, "epoch": 2846} {"train_loss": -6.395606994628906, "global_step": 119561, "epoch": 2846} {"train_loss": -6.553813457489014, "global_step": 119562, "epoch": 2846} {"train_loss": -6.630003929138184, "global_step": 119563, "epoch": 2846} {"train_loss": -6.5337018966674805, "global_step": 119564, "epoch": 2846} {"train_loss": -6.4482574462890625, "global_step": 119565, "epoch": 2846} {"train_loss": -6.665970325469971, "global_step": 119566, "epoch": 2846} {"train_loss": -6.599431991577148, "global_step": 119567, "epoch": 2846} {"train_loss": -6.619085311889648, "global_step": 119568, "epoch": 2846} {"train_loss": -6.511429786682129, "global_step": 119569, "epoch": 2846} {"train_loss": -6.59914493560791, "global_step": 119570, "epoch": 2846} {"train_loss": -6.5501837730407715, "global_step": 119571, "epoch": 2846} {"train_loss": -6.533831596374512, "global_step": 119572, "epoch": 2846} {"train_loss": -6.581721158254714, "global_step": 119573, "epoch": 2846, "val_loss": 76900.0859375} {"train_loss": -6.512345314025879, "global_step": 119574, "epoch": 2847} {"train_loss": -6.526668548583984, "global_step": 119575, "epoch": 2847} {"train_loss": -6.607483863830566, "global_step": 119576, "epoch": 2847} {"train_loss": -6.580596923828125, "global_step": 119577, "epoch": 2847} {"train_loss": -6.499307632446289, "global_step": 119578, "epoch": 2847} {"train_loss": -6.622162342071533, "global_step": 119579, "epoch": 2847} {"train_loss": -6.656723976135254, "global_step": 119580, "epoch": 2847} {"train_loss": -6.665362358093262, "global_step": 119581, "epoch": 2847} {"train_loss": -6.672309875488281, "global_step": 119582, "epoch": 2847} {"train_loss": -6.664508819580078, "global_step": 119583, "epoch": 2847} {"train_loss": -6.5752458572387695, "global_step": 119584, "epoch": 2847} {"train_loss": -6.695711612701416, "global_step": 119585, "epoch": 2847} {"train_loss": -6.634405612945557, "global_step": 119586, "epoch": 2847} {"train_loss": -6.546391010284424, "global_step": 119587, "epoch": 2847} {"train_loss": -6.597188949584961, "global_step": 119588, "epoch": 2847} {"train_loss": -6.6429901123046875, "global_step": 119589, "epoch": 2847} {"train_loss": -6.59769344329834, "global_step": 119590, "epoch": 2847} {"train_loss": -6.579641342163086, "global_step": 119591, "epoch": 2847} {"train_loss": -6.5902910232543945, "global_step": 119592, "epoch": 2847} {"train_loss": -6.571632385253906, "global_step": 119593, "epoch": 2847} {"train_loss": -6.499666690826416, "global_step": 119594, "epoch": 2847} {"train_loss": -6.465986251831055, "global_step": 119595, "epoch": 2847} {"train_loss": -6.644284248352051, "global_step": 119596, "epoch": 2847} {"train_loss": -6.515565395355225, "global_step": 119597, "epoch": 2847} {"train_loss": -6.574651718139648, "global_step": 119598, "epoch": 2847} {"train_loss": -6.670774936676025, "global_step": 119599, "epoch": 2847} {"train_loss": -6.620591163635254, "global_step": 119600, "epoch": 2847} {"train_loss": -6.588212490081787, "global_step": 119601, "epoch": 2847} {"train_loss": -6.538309574127197, "global_step": 119602, "epoch": 2847} {"train_loss": -6.5813398361206055, "global_step": 119603, "epoch": 2847} {"train_loss": -6.4940900802612305, "global_step": 119604, "epoch": 2847} {"train_loss": -6.4843430519104, "global_step": 119605, "epoch": 2847} {"train_loss": -6.446259498596191, "global_step": 119606, "epoch": 2847} {"train_loss": -6.645322322845459, "global_step": 119607, "epoch": 2847} {"train_loss": -6.443387031555176, "global_step": 119608, "epoch": 2847} {"train_loss": -6.434216499328613, "global_step": 119609, "epoch": 2847} {"train_loss": -6.582512855529785, "global_step": 119610, "epoch": 2847} {"train_loss": -6.483482837677002, "global_step": 119611, "epoch": 2847} {"train_loss": -6.477402687072754, "global_step": 119612, "epoch": 2847} {"train_loss": -6.641757488250732, "global_step": 119613, "epoch": 2847} {"train_loss": -6.40795373916626, "global_step": 119614, "epoch": 2847} {"train_loss": -6.566359349659511, "global_step": 119615, "epoch": 2847, "val_loss": 76915.7578125} {"train_loss": -6.447943687438965, "global_step": 119616, "epoch": 2848} {"train_loss": -6.576409816741943, "global_step": 119617, "epoch": 2848} {"train_loss": -6.4905314445495605, "global_step": 119618, "epoch": 2848} {"train_loss": -6.578600883483887, "global_step": 119619, "epoch": 2848} {"train_loss": -6.584612846374512, "global_step": 119620, "epoch": 2848} {"train_loss": -6.499715805053711, "global_step": 119621, "epoch": 2848} {"train_loss": -6.531952381134033, "global_step": 119622, "epoch": 2848} {"train_loss": -6.575869083404541, "global_step": 119623, "epoch": 2848} {"train_loss": -6.678678512573242, "global_step": 119624, "epoch": 2848} {"train_loss": -6.568761825561523, "global_step": 119625, "epoch": 2848} {"train_loss": -6.608555793762207, "global_step": 119626, "epoch": 2848} {"train_loss": -6.576618194580078, "global_step": 119627, "epoch": 2848} {"train_loss": -6.5348920822143555, "global_step": 119628, "epoch": 2848} {"train_loss": -6.685116767883301, "global_step": 119629, "epoch": 2848} {"train_loss": -6.733733177185059, "global_step": 119630, "epoch": 2848} {"train_loss": -6.501654148101807, "global_step": 119631, "epoch": 2848} {"train_loss": -6.562258720397949, "global_step": 119632, "epoch": 2848} {"train_loss": -6.635859489440918, "global_step": 119633, "epoch": 2848} {"train_loss": -6.647843360900879, "global_step": 119634, "epoch": 2848} {"train_loss": -6.6107563972473145, "global_step": 119635, "epoch": 2848} {"train_loss": -6.627011299133301, "global_step": 119636, "epoch": 2848} {"train_loss": -6.5121750831604, "global_step": 119637, "epoch": 2848} {"train_loss": -6.628897190093994, "global_step": 119638, "epoch": 2848} {"train_loss": -6.640811443328857, "global_step": 119639, "epoch": 2848} {"train_loss": -6.537929534912109, "global_step": 119640, "epoch": 2848} {"train_loss": -6.440982341766357, "global_step": 119641, "epoch": 2848} {"train_loss": -6.615939617156982, "global_step": 119642, "epoch": 2848} {"train_loss": -6.700160026550293, "global_step": 119643, "epoch": 2848} {"train_loss": -6.546966552734375, "global_step": 119644, "epoch": 2848} {"train_loss": -6.606516361236572, "global_step": 119645, "epoch": 2848} {"train_loss": -6.5565409660339355, "global_step": 119646, "epoch": 2848} {"train_loss": -6.549432277679443, "global_step": 119647, "epoch": 2848} {"train_loss": -6.702044486999512, "global_step": 119648, "epoch": 2848} {"train_loss": -6.571212291717529, "global_step": 119649, "epoch": 2848} {"train_loss": -6.530259132385254, "global_step": 119650, "epoch": 2848} {"train_loss": -6.571977615356445, "global_step": 119651, "epoch": 2848} {"train_loss": -6.6338276863098145, "global_step": 119652, "epoch": 2848} {"train_loss": -6.519104957580566, "global_step": 119653, "epoch": 2848} {"train_loss": -6.454689979553223, "global_step": 119654, "epoch": 2848} {"train_loss": -6.673388957977295, "global_step": 119655, "epoch": 2848} {"train_loss": -6.493760108947754, "global_step": 119656, "epoch": 2848} {"train_loss": -6.581152847834995, "global_step": 119657, "epoch": 2848, "val_loss": 77269.375} {"train_loss": -6.562440395355225, "global_step": 119658, "epoch": 2849} {"train_loss": -6.458821773529053, "global_step": 119659, "epoch": 2849} {"train_loss": -6.488718509674072, "global_step": 119660, "epoch": 2849} {"train_loss": -6.527199745178223, "global_step": 119661, "epoch": 2849} {"train_loss": -6.5633039474487305, "global_step": 119662, "epoch": 2849} {"train_loss": -6.556673049926758, "global_step": 119663, "epoch": 2849} {"train_loss": -6.494499206542969, "global_step": 119664, "epoch": 2849} {"train_loss": -6.341184139251709, "global_step": 119665, "epoch": 2849} {"train_loss": -6.529271125793457, "global_step": 119666, "epoch": 2849} {"train_loss": -6.3859453201293945, "global_step": 119667, "epoch": 2849} {"train_loss": -6.577498435974121, "global_step": 119668, "epoch": 2849} {"train_loss": -6.391712188720703, "global_step": 119669, "epoch": 2849} {"train_loss": -6.497591018676758, "global_step": 119670, "epoch": 2849} {"train_loss": -6.4841461181640625, "global_step": 119671, "epoch": 2849} {"train_loss": -6.409244537353516, "global_step": 119672, "epoch": 2849} {"train_loss": -6.613156318664551, "global_step": 119673, "epoch": 2849} {"train_loss": -6.5410637855529785, "global_step": 119674, "epoch": 2849} {"train_loss": -6.461056709289551, "global_step": 119675, "epoch": 2849} {"train_loss": -6.514779567718506, "global_step": 119676, "epoch": 2849} {"train_loss": -6.493719100952148, "global_step": 119677, "epoch": 2849} {"train_loss": -6.526867389678955, "global_step": 119678, "epoch": 2849} {"train_loss": -6.629157066345215, "global_step": 119679, "epoch": 2849} {"train_loss": -6.527632713317871, "global_step": 119680, "epoch": 2849} {"train_loss": -6.564624786376953, "global_step": 119681, "epoch": 2849} {"train_loss": -6.52166748046875, "global_step": 119682, "epoch": 2849} {"train_loss": -6.548015117645264, "global_step": 119683, "epoch": 2849} {"train_loss": -6.518152236938477, "global_step": 119684, "epoch": 2849} {"train_loss": -6.538764476776123, "global_step": 119685, "epoch": 2849} {"train_loss": -6.486911773681641, "global_step": 119686, "epoch": 2849} {"train_loss": -6.476317405700684, "global_step": 119687, "epoch": 2849} {"train_loss": -6.611333847045898, "global_step": 119688, "epoch": 2849} {"train_loss": -6.562861919403076, "global_step": 119689, "epoch": 2849} {"train_loss": -6.457912445068359, "global_step": 119690, "epoch": 2849} {"train_loss": -6.3373918533325195, "global_step": 119691, "epoch": 2849} {"train_loss": -6.496068954467773, "global_step": 119692, "epoch": 2849} {"train_loss": -6.526854991912842, "global_step": 119693, "epoch": 2849} {"train_loss": -6.548511981964111, "global_step": 119694, "epoch": 2849} {"train_loss": -6.549757957458496, "global_step": 119695, "epoch": 2849} {"train_loss": -6.552926063537598, "global_step": 119696, "epoch": 2849} {"train_loss": -6.525322437286377, "global_step": 119697, "epoch": 2849} {"train_loss": -6.561558246612549, "global_step": 119698, "epoch": 2849} {"train_loss": -6.508160863603864, "global_step": 119699, "epoch": 2849, "val_loss": 76750.03125} {"train_loss": -6.615176200866699, "global_step": 119700, "epoch": 2850} {"train_loss": -6.538566589355469, "global_step": 119701, "epoch": 2850} {"train_loss": -6.548906326293945, "global_step": 119702, "epoch": 2850} {"train_loss": -6.4947662353515625, "global_step": 119703, "epoch": 2850} {"train_loss": -6.584049701690674, "global_step": 119704, "epoch": 2850} {"train_loss": -6.553343296051025, "global_step": 119705, "epoch": 2850} {"train_loss": -6.501581192016602, "global_step": 119706, "epoch": 2850} {"train_loss": -6.477148532867432, "global_step": 119707, "epoch": 2850} {"train_loss": -6.543310642242432, "global_step": 119708, "epoch": 2850} {"train_loss": -6.456218242645264, "global_step": 119709, "epoch": 2850} {"train_loss": -6.454588890075684, "global_step": 119710, "epoch": 2850} {"train_loss": -6.521854877471924, "global_step": 119711, "epoch": 2850} {"train_loss": -6.547299385070801, "global_step": 119712, "epoch": 2850} {"train_loss": -6.581298828125, "global_step": 119713, "epoch": 2850} {"train_loss": -6.544094562530518, "global_step": 119714, "epoch": 2850} {"train_loss": -6.414887428283691, "global_step": 119715, "epoch": 2850} {"train_loss": -6.470201015472412, "global_step": 119716, "epoch": 2850} {"train_loss": -6.5614213943481445, "global_step": 119717, "epoch": 2850} {"train_loss": -6.518499374389648, "global_step": 119718, "epoch": 2850} {"train_loss": -6.502989768981934, "global_step": 119719, "epoch": 2850} {"train_loss": -6.551607608795166, "global_step": 119720, "epoch": 2850} {"train_loss": -6.541229248046875, "global_step": 119721, "epoch": 2850} {"train_loss": -6.695004940032959, "global_step": 119722, "epoch": 2850} {"train_loss": -6.576879501342773, "global_step": 119723, "epoch": 2850} {"train_loss": -6.574591636657715, "global_step": 119724, "epoch": 2850} {"train_loss": -6.551541805267334, "global_step": 119725, "epoch": 2850} {"train_loss": -6.630664825439453, "global_step": 119726, "epoch": 2850} {"train_loss": -6.585722923278809, "global_step": 119727, "epoch": 2850} {"train_loss": -6.642065525054932, "global_step": 119728, "epoch": 2850} {"train_loss": -6.623002052307129, "global_step": 119729, "epoch": 2850} {"train_loss": -6.600040435791016, "global_step": 119730, "epoch": 2850} {"train_loss": -6.657623767852783, "global_step": 119731, "epoch": 2850} {"train_loss": -6.556980609893799, "global_step": 119732, "epoch": 2850} {"train_loss": -6.607744216918945, "global_step": 119733, "epoch": 2850} {"train_loss": -6.472158432006836, "global_step": 119734, "epoch": 2850} {"train_loss": -6.5692949295043945, "global_step": 119735, "epoch": 2850} {"train_loss": -6.528292655944824, "global_step": 119736, "epoch": 2850} {"train_loss": -6.401762962341309, "global_step": 119737, "epoch": 2850} {"train_loss": -6.608402252197266, "global_step": 119738, "epoch": 2850} {"train_loss": -6.602452754974365, "global_step": 119739, "epoch": 2850} {"train_loss": -6.483335018157959, "global_step": 119740, "epoch": 2850} {"train_loss": -6.549382425489879, "global_step": 119741, "epoch": 2850, "train/sim_max_reward_0": 0.3791427590358799, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.46193043382287235, "train/sim_max_reward_3": 0.007861271415094177, "train/sim_max_reward_4": 0.9567489036413077, "train/sim_max_reward_5": 0.5906649355778941, "test/sim_max_reward_4500000": 0.33509710564942863, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.96243726747198, "test/sim_max_reward_4500003": 0.8731644220737264, "test/sim_max_reward_4500004": 0.5550878959064183, "test/sim_max_reward_4500005": 0.16478255136293676, "test/sim_max_reward_4500006": 0.9898148193753058, "test/sim_max_reward_4500007": 0.7222969579535976, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.05355320423420974, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 0.4205055403625462, "test/sim_max_reward_4500013": 0.00968460666585962, "test/sim_max_reward_4500014": 0.3034785429464315, "test/sim_max_reward_4500015": 0.885880188516182, "test/sim_max_reward_4500016": 0.01698186275305695, "test/sim_max_reward_4500017": 0.05161613706556221, "test/sim_max_reward_4500018": 0.4460203415027629, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.6098932058097823, "test/sim_max_reward_4500022": 0.7931925084863749, "test/sim_max_reward_4500023": 0.506581963003588, "test/sim_max_reward_4500024": 0.9502755577548525, "test/sim_max_reward_4500025": 0.7875707620352063, "test/sim_max_reward_4500026": 0.5350325246458122, "test/sim_max_reward_4500027": 0.6939696907811946, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.0945797931279958, "test/sim_max_reward_4500030": 0.9746721230034461, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9308022400353205, "test/sim_max_reward_4500034": 0.9966691703430864, "test/sim_max_reward_4500035": 0.5527045492766688, "test/sim_max_reward_4500036": 0.3768003808168513, "test/sim_max_reward_4500037": 0.9260258171078111, "test/sim_max_reward_4500038": 0.32619670858376465, "test/sim_max_reward_4500039": 0.5633101783480077, "test/sim_max_reward_4500040": 0.9391229612690516, "test/sim_max_reward_4500041": 0.8803090391762558, "test/sim_max_reward_4500042": 0.9892066126196928, "test/sim_max_reward_4500043": 0.5107768674954964, "test/sim_max_reward_4500044": 6.961879146049806e-05, "test/sim_max_reward_4500045": 0.39190656557412246, "test/sim_max_reward_4500046": 0.9546410723772173, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 0.4699011108095781, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5660580505821747, "test/mean_score": 0.5039341338316043, "val_loss": 76782.671875} {"train_loss": -6.480040550231934, "global_step": 119742, "epoch": 2851} {"train_loss": -6.627387046813965, "global_step": 119743, "epoch": 2851} {"train_loss": -6.592433929443359, "global_step": 119744, "epoch": 2851} {"train_loss": -6.622939586639404, "global_step": 119745, "epoch": 2851} {"train_loss": -6.555427551269531, "global_step": 119746, "epoch": 2851} {"train_loss": -6.697402000427246, "global_step": 119747, "epoch": 2851} {"train_loss": -6.674846649169922, "global_step": 119748, "epoch": 2851} {"train_loss": -6.5112714767456055, "global_step": 119749, "epoch": 2851} {"train_loss": -6.615328788757324, "global_step": 119750, "epoch": 2851} {"train_loss": -6.5827765464782715, "global_step": 119751, "epoch": 2851} {"train_loss": -6.5776214599609375, "global_step": 119752, "epoch": 2851} {"train_loss": -6.701948165893555, "global_step": 119753, "epoch": 2851} {"train_loss": -6.48020076751709, "global_step": 119754, "epoch": 2851} {"train_loss": -6.587250709533691, "global_step": 119755, "epoch": 2851} {"train_loss": -6.391889572143555, "global_step": 119756, "epoch": 2851} {"train_loss": -6.589046001434326, "global_step": 119757, "epoch": 2851} {"train_loss": -6.579293727874756, "global_step": 119758, "epoch": 2851} {"train_loss": -6.422618865966797, "global_step": 119759, "epoch": 2851} {"train_loss": -6.520581245422363, "global_step": 119760, "epoch": 2851} {"train_loss": -6.498315811157227, "global_step": 119761, "epoch": 2851} {"train_loss": -6.648122787475586, "global_step": 119762, "epoch": 2851} {"train_loss": -6.4675397872924805, "global_step": 119763, "epoch": 2851} {"train_loss": -6.4675140380859375, "global_step": 119764, "epoch": 2851} {"train_loss": -6.596163272857666, "global_step": 119765, "epoch": 2851} {"train_loss": -6.527327537536621, "global_step": 119766, "epoch": 2851} {"train_loss": -6.584473609924316, "global_step": 119767, "epoch": 2851} {"train_loss": -6.493671894073486, "global_step": 119768, "epoch": 2851} {"train_loss": -6.4579057693481445, "global_step": 119769, "epoch": 2851} {"train_loss": -6.563765525817871, "global_step": 119770, "epoch": 2851} {"train_loss": -6.439010143280029, "global_step": 119771, "epoch": 2851} {"train_loss": -6.563591957092285, "global_step": 119772, "epoch": 2851} {"train_loss": -6.564349174499512, "global_step": 119773, "epoch": 2851} {"train_loss": -6.551224708557129, "global_step": 119774, "epoch": 2851} {"train_loss": -6.549230098724365, "global_step": 119775, "epoch": 2851} {"train_loss": -6.478316307067871, "global_step": 119776, "epoch": 2851} {"train_loss": -6.569456100463867, "global_step": 119777, "epoch": 2851} {"train_loss": -6.564155101776123, "global_step": 119778, "epoch": 2851} {"train_loss": -6.681778430938721, "global_step": 119779, "epoch": 2851} {"train_loss": -6.524906635284424, "global_step": 119780, "epoch": 2851} {"train_loss": -6.554030895233154, "global_step": 119781, "epoch": 2851} {"train_loss": -6.456124305725098, "global_step": 119782, "epoch": 2851} {"train_loss": -6.551108110518682, "global_step": 119783, "epoch": 2851, "val_loss": 76583.9140625} {"train_loss": -6.610403060913086, "global_step": 119784, "epoch": 2852} {"train_loss": -6.457651138305664, "global_step": 119785, "epoch": 2852} {"train_loss": -6.411897659301758, "global_step": 119786, "epoch": 2852} {"train_loss": -6.576523780822754, "global_step": 119787, "epoch": 2852} {"train_loss": -6.684908390045166, "global_step": 119788, "epoch": 2852} {"train_loss": -6.536438465118408, "global_step": 119789, "epoch": 2852} {"train_loss": -6.540674209594727, "global_step": 119790, "epoch": 2852} {"train_loss": -6.542565822601318, "global_step": 119791, "epoch": 2852} {"train_loss": -6.657890796661377, "global_step": 119792, "epoch": 2852} {"train_loss": -6.547796249389648, "global_step": 119793, "epoch": 2852} {"train_loss": -6.569531440734863, "global_step": 119794, "epoch": 2852} {"train_loss": -6.484306335449219, "global_step": 119795, "epoch": 2852} {"train_loss": -6.539742946624756, "global_step": 119796, "epoch": 2852} {"train_loss": -6.66218376159668, "global_step": 119797, "epoch": 2852} {"train_loss": -6.462095260620117, "global_step": 119798, "epoch": 2852} {"train_loss": -6.573208332061768, "global_step": 119799, "epoch": 2852} {"train_loss": -6.647441387176514, "global_step": 119800, "epoch": 2852} {"train_loss": -6.637136459350586, "global_step": 119801, "epoch": 2852} {"train_loss": -6.55950927734375, "global_step": 119802, "epoch": 2852} {"train_loss": -6.629363059997559, "global_step": 119803, "epoch": 2852} {"train_loss": -6.475438594818115, "global_step": 119804, "epoch": 2852} {"train_loss": -6.593725204467773, "global_step": 119805, "epoch": 2852} {"train_loss": -6.553531646728516, "global_step": 119806, "epoch": 2852} {"train_loss": -6.473868370056152, "global_step": 119807, "epoch": 2852} {"train_loss": -6.547421932220459, "global_step": 119808, "epoch": 2852} {"train_loss": -6.556430339813232, "global_step": 119809, "epoch": 2852} {"train_loss": -6.490626335144043, "global_step": 119810, "epoch": 2852} {"train_loss": -6.544197082519531, "global_step": 119811, "epoch": 2852} {"train_loss": -6.640224933624268, "global_step": 119812, "epoch": 2852} {"train_loss": -6.541315078735352, "global_step": 119813, "epoch": 2852} {"train_loss": -6.6068949699401855, "global_step": 119814, "epoch": 2852} {"train_loss": -6.573391914367676, "global_step": 119815, "epoch": 2852} {"train_loss": -6.404894828796387, "global_step": 119816, "epoch": 2852} {"train_loss": -6.579010009765625, "global_step": 119817, "epoch": 2852} {"train_loss": -6.585531711578369, "global_step": 119818, "epoch": 2852} {"train_loss": -6.57624626159668, "global_step": 119819, "epoch": 2852} {"train_loss": -6.59625244140625, "global_step": 119820, "epoch": 2852} {"train_loss": -6.625128746032715, "global_step": 119821, "epoch": 2852} {"train_loss": -6.537290096282959, "global_step": 119822, "epoch": 2852} {"train_loss": -6.502447605133057, "global_step": 119823, "epoch": 2852} {"train_loss": -6.644770622253418, "global_step": 119824, "epoch": 2852} {"train_loss": -6.558872631617954, "global_step": 119825, "epoch": 2852, "val_loss": 76824.6171875} {"train_loss": -6.49595308303833, "global_step": 119826, "epoch": 2853} {"train_loss": -6.610011100769043, "global_step": 119827, "epoch": 2853} {"train_loss": -6.433455944061279, "global_step": 119828, "epoch": 2853} {"train_loss": -6.539700031280518, "global_step": 119829, "epoch": 2853} {"train_loss": -6.506852149963379, "global_step": 119830, "epoch": 2853} {"train_loss": -6.53444766998291, "global_step": 119831, "epoch": 2853} {"train_loss": -6.550998687744141, "global_step": 119832, "epoch": 2853} {"train_loss": -6.6008195877075195, "global_step": 119833, "epoch": 2853} {"train_loss": -6.3818769454956055, "global_step": 119834, "epoch": 2853} {"train_loss": -6.496024131774902, "global_step": 119835, "epoch": 2853} {"train_loss": -6.500796318054199, "global_step": 119836, "epoch": 2853} {"train_loss": -6.512266159057617, "global_step": 119837, "epoch": 2853} {"train_loss": -6.593011856079102, "global_step": 119838, "epoch": 2853} {"train_loss": -6.384490966796875, "global_step": 119839, "epoch": 2853} {"train_loss": -6.63790225982666, "global_step": 119840, "epoch": 2853} {"train_loss": -6.536073684692383, "global_step": 119841, "epoch": 2853} {"train_loss": -6.454516410827637, "global_step": 119842, "epoch": 2853} {"train_loss": -6.50656795501709, "global_step": 119843, "epoch": 2853} {"train_loss": -6.472728252410889, "global_step": 119844, "epoch": 2853} {"train_loss": -6.473123550415039, "global_step": 119845, "epoch": 2853} {"train_loss": -6.567719459533691, "global_step": 119846, "epoch": 2853} {"train_loss": -6.408576965332031, "global_step": 119847, "epoch": 2853} {"train_loss": -6.515093803405762, "global_step": 119848, "epoch": 2853} {"train_loss": -6.571867942810059, "global_step": 119849, "epoch": 2853} {"train_loss": -6.437175750732422, "global_step": 119850, "epoch": 2853} {"train_loss": -6.595399379730225, "global_step": 119851, "epoch": 2853} {"train_loss": -6.587430953979492, "global_step": 119852, "epoch": 2853} {"train_loss": -6.543389797210693, "global_step": 119853, "epoch": 2853} {"train_loss": -6.555109024047852, "global_step": 119854, "epoch": 2853} {"train_loss": -6.505817890167236, "global_step": 119855, "epoch": 2853} {"train_loss": -6.4981184005737305, "global_step": 119856, "epoch": 2853} {"train_loss": -6.536955833435059, "global_step": 119857, "epoch": 2853} {"train_loss": -6.659176826477051, "global_step": 119858, "epoch": 2853} {"train_loss": -6.550115585327148, "global_step": 119859, "epoch": 2853} {"train_loss": -6.629698753356934, "global_step": 119860, "epoch": 2853} {"train_loss": -6.556196212768555, "global_step": 119861, "epoch": 2853} {"train_loss": -6.55966854095459, "global_step": 119862, "epoch": 2853} {"train_loss": -6.613826751708984, "global_step": 119863, "epoch": 2853} {"train_loss": -6.605892181396484, "global_step": 119864, "epoch": 2853} {"train_loss": -6.588645935058594, "global_step": 119865, "epoch": 2853} {"train_loss": -6.602309226989746, "global_step": 119866, "epoch": 2853} {"train_loss": -6.532452242715018, "global_step": 119867, "epoch": 2853, "val_loss": 76758.171875} {"train_loss": -6.659575462341309, "global_step": 119868, "epoch": 2854} {"train_loss": -6.5067644119262695, "global_step": 119869, "epoch": 2854} {"train_loss": -6.602356910705566, "global_step": 119870, "epoch": 2854} {"train_loss": -6.510149955749512, "global_step": 119871, "epoch": 2854} {"train_loss": -6.545173645019531, "global_step": 119872, "epoch": 2854} {"train_loss": -6.4862260818481445, "global_step": 119873, "epoch": 2854} {"train_loss": -6.433144569396973, "global_step": 119874, "epoch": 2854} {"train_loss": -6.591136932373047, "global_step": 119875, "epoch": 2854} {"train_loss": -6.334420204162598, "global_step": 119876, "epoch": 2854} {"train_loss": -6.485515117645264, "global_step": 119877, "epoch": 2854} {"train_loss": -6.650583744049072, "global_step": 119878, "epoch": 2854} {"train_loss": -6.551831245422363, "global_step": 119879, "epoch": 2854} {"train_loss": -6.5921406745910645, "global_step": 119880, "epoch": 2854} {"train_loss": -6.492779731750488, "global_step": 119881, "epoch": 2854} {"train_loss": -6.40240478515625, "global_step": 119882, "epoch": 2854} {"train_loss": -6.521490097045898, "global_step": 119883, "epoch": 2854} {"train_loss": -6.462767601013184, "global_step": 119884, "epoch": 2854} {"train_loss": -6.658619403839111, "global_step": 119885, "epoch": 2854} {"train_loss": -6.651362419128418, "global_step": 119886, "epoch": 2854} {"train_loss": -6.599323272705078, "global_step": 119887, "epoch": 2854} {"train_loss": -6.560989856719971, "global_step": 119888, "epoch": 2854} {"train_loss": -6.574648857116699, "global_step": 119889, "epoch": 2854} {"train_loss": -6.620558261871338, "global_step": 119890, "epoch": 2854} {"train_loss": -6.5860981941223145, "global_step": 119891, "epoch": 2854} {"train_loss": -6.669925212860107, "global_step": 119892, "epoch": 2854} {"train_loss": -6.618125915527344, "global_step": 119893, "epoch": 2854} {"train_loss": -6.592494010925293, "global_step": 119894, "epoch": 2854} {"train_loss": -6.549248218536377, "global_step": 119895, "epoch": 2854} {"train_loss": -6.608144760131836, "global_step": 119896, "epoch": 2854} {"train_loss": -6.509720802307129, "global_step": 119897, "epoch": 2854} {"train_loss": -6.577427387237549, "global_step": 119898, "epoch": 2854} {"train_loss": -6.539214134216309, "global_step": 119899, "epoch": 2854} {"train_loss": -6.531991958618164, "global_step": 119900, "epoch": 2854} {"train_loss": -6.636723518371582, "global_step": 119901, "epoch": 2854} {"train_loss": -6.663028240203857, "global_step": 119902, "epoch": 2854} {"train_loss": -6.683426856994629, "global_step": 119903, "epoch": 2854} {"train_loss": -6.609113693237305, "global_step": 119904, "epoch": 2854} {"train_loss": -6.650032043457031, "global_step": 119905, "epoch": 2854} {"train_loss": -6.6197919845581055, "global_step": 119906, "epoch": 2854} {"train_loss": -6.6560773849487305, "global_step": 119907, "epoch": 2854} {"train_loss": -6.602664947509766, "global_step": 119908, "epoch": 2854} {"train_loss": -6.57165173121861, "global_step": 119909, "epoch": 2854, "val_loss": 76803.8671875} {"train_loss": -6.589900970458984, "global_step": 119910, "epoch": 2855} {"train_loss": -6.722229957580566, "global_step": 119911, "epoch": 2855} {"train_loss": -6.720643043518066, "global_step": 119912, "epoch": 2855} {"train_loss": -6.526178359985352, "global_step": 119913, "epoch": 2855} {"train_loss": -6.631947994232178, "global_step": 119914, "epoch": 2855} {"train_loss": -6.613966941833496, "global_step": 119915, "epoch": 2855} {"train_loss": -6.637551307678223, "global_step": 119916, "epoch": 2855} {"train_loss": -6.531412124633789, "global_step": 119917, "epoch": 2855} {"train_loss": -6.579495906829834, "global_step": 119918, "epoch": 2855} {"train_loss": -6.488661766052246, "global_step": 119919, "epoch": 2855} {"train_loss": -6.657249450683594, "global_step": 119920, "epoch": 2855} {"train_loss": -6.567544937133789, "global_step": 119921, "epoch": 2855} {"train_loss": -6.576336860656738, "global_step": 119922, "epoch": 2855} {"train_loss": -6.569268703460693, "global_step": 119923, "epoch": 2855} {"train_loss": -6.611877918243408, "global_step": 119924, "epoch": 2855} {"train_loss": -6.63773250579834, "global_step": 119925, "epoch": 2855} {"train_loss": -6.6192216873168945, "global_step": 119926, "epoch": 2855} {"train_loss": -6.4574971199035645, "global_step": 119927, "epoch": 2855} {"train_loss": -6.509336471557617, "global_step": 119928, "epoch": 2855} {"train_loss": -6.578374862670898, "global_step": 119929, "epoch": 2855} {"train_loss": -6.592784404754639, "global_step": 119930, "epoch": 2855} {"train_loss": -6.560973644256592, "global_step": 119931, "epoch": 2855} {"train_loss": -6.548915386199951, "global_step": 119932, "epoch": 2855} {"train_loss": -6.636672496795654, "global_step": 119933, "epoch": 2855} {"train_loss": -6.527448654174805, "global_step": 119934, "epoch": 2855} {"train_loss": -6.639228820800781, "global_step": 119935, "epoch": 2855} {"train_loss": -6.565595626831055, "global_step": 119936, "epoch": 2855} {"train_loss": -6.589811325073242, "global_step": 119937, "epoch": 2855} {"train_loss": -6.476552963256836, "global_step": 119938, "epoch": 2855} {"train_loss": -6.493098258972168, "global_step": 119939, "epoch": 2855} {"train_loss": -6.570521354675293, "global_step": 119940, "epoch": 2855} {"train_loss": -6.596299171447754, "global_step": 119941, "epoch": 2855} {"train_loss": -6.529880046844482, "global_step": 119942, "epoch": 2855} {"train_loss": -6.476686954498291, "global_step": 119943, "epoch": 2855} {"train_loss": -6.655909538269043, "global_step": 119944, "epoch": 2855} {"train_loss": -6.578824043273926, "global_step": 119945, "epoch": 2855} {"train_loss": -6.466721057891846, "global_step": 119946, "epoch": 2855} {"train_loss": -6.578274726867676, "global_step": 119947, "epoch": 2855} {"train_loss": -6.560863494873047, "global_step": 119948, "epoch": 2855} {"train_loss": -6.664420127868652, "global_step": 119949, "epoch": 2855} {"train_loss": -6.695285797119141, "global_step": 119950, "epoch": 2855} {"train_loss": -6.580175831204369, "global_step": 119951, "epoch": 2855, "val_loss": 76675.4140625} {"train_loss": -6.534868240356445, "global_step": 119952, "epoch": 2856} {"train_loss": -6.641515254974365, "global_step": 119953, "epoch": 2856} {"train_loss": -6.55319881439209, "global_step": 119954, "epoch": 2856} {"train_loss": -6.478571891784668, "global_step": 119955, "epoch": 2856} {"train_loss": -6.540733814239502, "global_step": 119956, "epoch": 2856} {"train_loss": -6.550983428955078, "global_step": 119957, "epoch": 2856} {"train_loss": -6.5768537521362305, "global_step": 119958, "epoch": 2856} {"train_loss": -6.669123649597168, "global_step": 119959, "epoch": 2856} {"train_loss": -6.549150466918945, "global_step": 119960, "epoch": 2856} {"train_loss": -6.574160575866699, "global_step": 119961, "epoch": 2856} {"train_loss": -6.451643943786621, "global_step": 119962, "epoch": 2856} {"train_loss": -6.389078140258789, "global_step": 119963, "epoch": 2856} {"train_loss": -6.549965858459473, "global_step": 119964, "epoch": 2856} {"train_loss": -6.387979507446289, "global_step": 119965, "epoch": 2856} {"train_loss": -6.59653377532959, "global_step": 119966, "epoch": 2856} {"train_loss": -6.637041091918945, "global_step": 119967, "epoch": 2856} {"train_loss": -6.560357093811035, "global_step": 119968, "epoch": 2856} {"train_loss": -6.510380744934082, "global_step": 119969, "epoch": 2856} {"train_loss": -6.559667587280273, "global_step": 119970, "epoch": 2856} {"train_loss": -6.594846725463867, "global_step": 119971, "epoch": 2856} {"train_loss": -6.396872520446777, "global_step": 119972, "epoch": 2856} {"train_loss": -6.505013465881348, "global_step": 119973, "epoch": 2856} {"train_loss": -6.561388969421387, "global_step": 119974, "epoch": 2856} {"train_loss": -6.498682975769043, "global_step": 119975, "epoch": 2856} {"train_loss": -6.544855117797852, "global_step": 119976, "epoch": 2856} {"train_loss": -6.676000118255615, "global_step": 119977, "epoch": 2856} {"train_loss": -6.564756393432617, "global_step": 119978, "epoch": 2856} {"train_loss": -6.62393856048584, "global_step": 119979, "epoch": 2856} {"train_loss": -6.566617012023926, "global_step": 119980, "epoch": 2856} {"train_loss": -6.577707290649414, "global_step": 119981, "epoch": 2856} {"train_loss": -6.521061420440674, "global_step": 119982, "epoch": 2856} {"train_loss": -6.637672424316406, "global_step": 119983, "epoch": 2856} {"train_loss": -6.49359130859375, "global_step": 119984, "epoch": 2856} {"train_loss": -6.581030368804932, "global_step": 119985, "epoch": 2856} {"train_loss": -6.496491432189941, "global_step": 119986, "epoch": 2856} {"train_loss": -6.54473876953125, "global_step": 119987, "epoch": 2856} {"train_loss": -6.5030646324157715, "global_step": 119988, "epoch": 2856} {"train_loss": -6.534757614135742, "global_step": 119989, "epoch": 2856} {"train_loss": -6.490178108215332, "global_step": 119990, "epoch": 2856} {"train_loss": -6.613353252410889, "global_step": 119991, "epoch": 2856} {"train_loss": -6.563393592834473, "global_step": 119992, "epoch": 2856} {"train_loss": -6.5451523917061945, "global_step": 119993, "epoch": 2856, "val_loss": 76818.6640625} {"train_loss": -6.620078086853027, "global_step": 119994, "epoch": 2857} {"train_loss": -6.594206809997559, "global_step": 119995, "epoch": 2857} {"train_loss": -6.515839099884033, "global_step": 119996, "epoch": 2857} {"train_loss": -6.645368576049805, "global_step": 119997, "epoch": 2857} {"train_loss": -6.574347972869873, "global_step": 119998, "epoch": 2857} {"train_loss": -6.613720893859863, "global_step": 119999, "epoch": 2857} {"train_loss": -6.561600685119629, "global_step": 120000, "epoch": 2857} {"train_loss": -6.687371253967285, "global_step": 120001, "epoch": 2857} {"train_loss": -6.621441841125488, "global_step": 120002, "epoch": 2857} {"train_loss": -6.6202874183654785, "global_step": 120003, "epoch": 2857} {"train_loss": -6.672513961791992, "global_step": 120004, "epoch": 2857} {"train_loss": -6.6468186378479, "global_step": 120005, "epoch": 2857} {"train_loss": -6.610630035400391, "global_step": 120006, "epoch": 2857} {"train_loss": -6.598033428192139, "global_step": 120007, "epoch": 2857} {"train_loss": -6.625698089599609, "global_step": 120008, "epoch": 2857} {"train_loss": -6.469171524047852, "global_step": 120009, "epoch": 2857} {"train_loss": -6.571094989776611, "global_step": 120010, "epoch": 2857} {"train_loss": -6.628493309020996, "global_step": 120011, "epoch": 2857} {"train_loss": -6.619777202606201, "global_step": 120012, "epoch": 2857} {"train_loss": -6.5485639572143555, "global_step": 120013, "epoch": 2857} {"train_loss": -6.600466728210449, "global_step": 120014, "epoch": 2857} {"train_loss": -6.49685525894165, "global_step": 120015, "epoch": 2857} {"train_loss": -6.584076881408691, "global_step": 120016, "epoch": 2857} {"train_loss": -6.6969709396362305, "global_step": 120017, "epoch": 2857} {"train_loss": -6.540696144104004, "global_step": 120018, "epoch": 2857} {"train_loss": -6.418370246887207, "global_step": 120019, "epoch": 2857} {"train_loss": -6.381237030029297, "global_step": 120020, "epoch": 2857} {"train_loss": -6.6137261390686035, "global_step": 120021, "epoch": 2857} {"train_loss": -6.488604545593262, "global_step": 120022, "epoch": 2857} {"train_loss": -6.391083240509033, "global_step": 120023, "epoch": 2857} {"train_loss": -6.558847427368164, "global_step": 120024, "epoch": 2857} {"train_loss": -6.5076398849487305, "global_step": 120025, "epoch": 2857} {"train_loss": -6.511684894561768, "global_step": 120026, "epoch": 2857} {"train_loss": -6.545657157897949, "global_step": 120027, "epoch": 2857} {"train_loss": -6.365118980407715, "global_step": 120028, "epoch": 2857} {"train_loss": -6.5486836433410645, "global_step": 120029, "epoch": 2857} {"train_loss": -6.443102836608887, "global_step": 120030, "epoch": 2857} {"train_loss": -6.47815465927124, "global_step": 120031, "epoch": 2857} {"train_loss": -6.601437568664551, "global_step": 120032, "epoch": 2857} {"train_loss": -6.543153285980225, "global_step": 120033, "epoch": 2857} {"train_loss": -6.485882759094238, "global_step": 120034, "epoch": 2857} {"train_loss": -6.559485401426043, "global_step": 120035, "epoch": 2857, "val_loss": 76710.6171875} {"train_loss": -6.459904670715332, "global_step": 120036, "epoch": 2858} {"train_loss": -6.63666296005249, "global_step": 120037, "epoch": 2858} {"train_loss": -6.555695533752441, "global_step": 120038, "epoch": 2858} {"train_loss": -6.5039520263671875, "global_step": 120039, "epoch": 2858} {"train_loss": -6.556989669799805, "global_step": 120040, "epoch": 2858} {"train_loss": -6.477112293243408, "global_step": 120041, "epoch": 2858} {"train_loss": -6.607210636138916, "global_step": 120042, "epoch": 2858} {"train_loss": -6.598567485809326, "global_step": 120043, "epoch": 2858} {"train_loss": -6.573470115661621, "global_step": 120044, "epoch": 2858} {"train_loss": -6.6298089027404785, "global_step": 120045, "epoch": 2858} {"train_loss": -6.547827243804932, "global_step": 120046, "epoch": 2858} {"train_loss": -6.528341770172119, "global_step": 120047, "epoch": 2858} {"train_loss": -6.597525596618652, "global_step": 120048, "epoch": 2858} {"train_loss": -6.613062858581543, "global_step": 120049, "epoch": 2858} {"train_loss": -6.669416427612305, "global_step": 120050, "epoch": 2858} {"train_loss": -6.530571460723877, "global_step": 120051, "epoch": 2858} {"train_loss": -6.554019451141357, "global_step": 120052, "epoch": 2858} {"train_loss": -6.589717864990234, "global_step": 120053, "epoch": 2858} {"train_loss": -6.626276016235352, "global_step": 120054, "epoch": 2858} {"train_loss": -6.529921531677246, "global_step": 120055, "epoch": 2858} {"train_loss": -6.570013999938965, "global_step": 120056, "epoch": 2858} {"train_loss": -6.587347030639648, "global_step": 120057, "epoch": 2858} {"train_loss": -6.476822376251221, "global_step": 120058, "epoch": 2858} {"train_loss": -6.643176555633545, "global_step": 120059, "epoch": 2858} {"train_loss": -6.5812602043151855, "global_step": 120060, "epoch": 2858} {"train_loss": -6.574102878570557, "global_step": 120061, "epoch": 2858} {"train_loss": -6.615639686584473, "global_step": 120062, "epoch": 2858} {"train_loss": -6.572501182556152, "global_step": 120063, "epoch": 2858} {"train_loss": -6.548267841339111, "global_step": 120064, "epoch": 2858} {"train_loss": -6.617836952209473, "global_step": 120065, "epoch": 2858} {"train_loss": -6.617088317871094, "global_step": 120066, "epoch": 2858} {"train_loss": -6.617373466491699, "global_step": 120067, "epoch": 2858} {"train_loss": -6.583162784576416, "global_step": 120068, "epoch": 2858} {"train_loss": -6.5367045402526855, "global_step": 120069, "epoch": 2858} {"train_loss": -6.607522487640381, "global_step": 120070, "epoch": 2858} {"train_loss": -6.278033256530762, "global_step": 120071, "epoch": 2858} {"train_loss": -6.543097496032715, "global_step": 120072, "epoch": 2858} {"train_loss": -6.615605354309082, "global_step": 120073, "epoch": 2858} {"train_loss": -6.5313029289245605, "global_step": 120074, "epoch": 2858} {"train_loss": -6.534836769104004, "global_step": 120075, "epoch": 2858} {"train_loss": -6.514706611633301, "global_step": 120076, "epoch": 2858} {"train_loss": -6.5628597395760675, "global_step": 120077, "epoch": 2858, "val_loss": 77070.3359375} {"train_loss": -6.468314170837402, "global_step": 120078, "epoch": 2859} {"train_loss": -6.434062957763672, "global_step": 120079, "epoch": 2859} {"train_loss": -6.583897590637207, "global_step": 120080, "epoch": 2859} {"train_loss": -6.458130836486816, "global_step": 120081, "epoch": 2859} {"train_loss": -6.533580303192139, "global_step": 120082, "epoch": 2859} {"train_loss": -6.452922344207764, "global_step": 120083, "epoch": 2859} {"train_loss": -6.447844505310059, "global_step": 120084, "epoch": 2859} {"train_loss": -6.477931976318359, "global_step": 120085, "epoch": 2859} {"train_loss": -6.541721343994141, "global_step": 120086, "epoch": 2859} {"train_loss": -6.503114223480225, "global_step": 120087, "epoch": 2859} {"train_loss": -6.610293388366699, "global_step": 120088, "epoch": 2859} {"train_loss": -6.568699836730957, "global_step": 120089, "epoch": 2859} {"train_loss": -6.680388450622559, "global_step": 120090, "epoch": 2859} {"train_loss": -6.523175239562988, "global_step": 120091, "epoch": 2859} {"train_loss": -6.425631523132324, "global_step": 120092, "epoch": 2859} {"train_loss": -6.4975972175598145, "global_step": 120093, "epoch": 2859} {"train_loss": -6.523381233215332, "global_step": 120094, "epoch": 2859} {"train_loss": -6.559749603271484, "global_step": 120095, "epoch": 2859} {"train_loss": -6.508418083190918, "global_step": 120096, "epoch": 2859} {"train_loss": -6.550236701965332, "global_step": 120097, "epoch": 2859} {"train_loss": -6.632783889770508, "global_step": 120098, "epoch": 2859} {"train_loss": -6.546067714691162, "global_step": 120099, "epoch": 2859} {"train_loss": -6.584663391113281, "global_step": 120100, "epoch": 2859} {"train_loss": -6.608310699462891, "global_step": 120101, "epoch": 2859} {"train_loss": -6.446000099182129, "global_step": 120102, "epoch": 2859} {"train_loss": -6.600785732269287, "global_step": 120103, "epoch": 2859} {"train_loss": -6.657614707946777, "global_step": 120104, "epoch": 2859} {"train_loss": -6.540072441101074, "global_step": 120105, "epoch": 2859} {"train_loss": -6.497998237609863, "global_step": 120106, "epoch": 2859} {"train_loss": -6.626223564147949, "global_step": 120107, "epoch": 2859} {"train_loss": -6.789278030395508, "global_step": 120108, "epoch": 2859} {"train_loss": -6.598910331726074, "global_step": 120109, "epoch": 2859} {"train_loss": -6.631462097167969, "global_step": 120110, "epoch": 2859} {"train_loss": -6.56786584854126, "global_step": 120111, "epoch": 2859} {"train_loss": -6.655760765075684, "global_step": 120112, "epoch": 2859} {"train_loss": -6.619538307189941, "global_step": 120113, "epoch": 2859} {"train_loss": -6.576582908630371, "global_step": 120114, "epoch": 2859} {"train_loss": -6.468571186065674, "global_step": 120115, "epoch": 2859} {"train_loss": -6.681699752807617, "global_step": 120116, "epoch": 2859} {"train_loss": -6.639449119567871, "global_step": 120117, "epoch": 2859} {"train_loss": -6.6764678955078125, "global_step": 120118, "epoch": 2859} {"train_loss": -6.565463315872919, "global_step": 120119, "epoch": 2859, "val_loss": 77176.3125} {"train_loss": -6.582242965698242, "global_step": 120120, "epoch": 2860} {"train_loss": -6.596240043640137, "global_step": 120121, "epoch": 2860} {"train_loss": -6.677767753601074, "global_step": 120122, "epoch": 2860} {"train_loss": -6.5697855949401855, "global_step": 120123, "epoch": 2860} {"train_loss": -6.623943328857422, "global_step": 120124, "epoch": 2860} {"train_loss": -6.676288604736328, "global_step": 120125, "epoch": 2860} {"train_loss": -6.630274772644043, "global_step": 120126, "epoch": 2860} {"train_loss": -6.601364612579346, "global_step": 120127, "epoch": 2860} {"train_loss": -6.5389862060546875, "global_step": 120128, "epoch": 2860} {"train_loss": -6.626049041748047, "global_step": 120129, "epoch": 2860} {"train_loss": -6.547602653503418, "global_step": 120130, "epoch": 2860} {"train_loss": -6.640413761138916, "global_step": 120131, "epoch": 2860} {"train_loss": -6.543615341186523, "global_step": 120132, "epoch": 2860} {"train_loss": -6.604730606079102, "global_step": 120133, "epoch": 2860} {"train_loss": -6.536096096038818, "global_step": 120134, "epoch": 2860} {"train_loss": -6.474521160125732, "global_step": 120135, "epoch": 2860} {"train_loss": -6.617811679840088, "global_step": 120136, "epoch": 2860} {"train_loss": -6.499999523162842, "global_step": 120137, "epoch": 2860} {"train_loss": -6.650444030761719, "global_step": 120138, "epoch": 2860} {"train_loss": -6.556171894073486, "global_step": 120139, "epoch": 2860} {"train_loss": -6.60382080078125, "global_step": 120140, "epoch": 2860} {"train_loss": -6.597371578216553, "global_step": 120141, "epoch": 2860} {"train_loss": -6.586885452270508, "global_step": 120142, "epoch": 2860} {"train_loss": -6.601219177246094, "global_step": 120143, "epoch": 2860} {"train_loss": -6.710059642791748, "global_step": 120144, "epoch": 2860} {"train_loss": -6.589420318603516, "global_step": 120145, "epoch": 2860} {"train_loss": -6.60865592956543, "global_step": 120146, "epoch": 2860} {"train_loss": -6.540529251098633, "global_step": 120147, "epoch": 2860} {"train_loss": -6.576008319854736, "global_step": 120148, "epoch": 2860} {"train_loss": -6.486785888671875, "global_step": 120149, "epoch": 2860} {"train_loss": -6.537461280822754, "global_step": 120150, "epoch": 2860} {"train_loss": -6.713007926940918, "global_step": 120151, "epoch": 2860} {"train_loss": -6.529071807861328, "global_step": 120152, "epoch": 2860} {"train_loss": -6.465440273284912, "global_step": 120153, "epoch": 2860} {"train_loss": -6.685800552368164, "global_step": 120154, "epoch": 2860} {"train_loss": -6.510973930358887, "global_step": 120155, "epoch": 2860} {"train_loss": -6.599822044372559, "global_step": 120156, "epoch": 2860} {"train_loss": -6.605428695678711, "global_step": 120157, "epoch": 2860} {"train_loss": -6.655766487121582, "global_step": 120158, "epoch": 2860} {"train_loss": -6.588351249694824, "global_step": 120159, "epoch": 2860} {"train_loss": -6.713325500488281, "global_step": 120160, "epoch": 2860} {"train_loss": -6.594236112776256, "global_step": 120161, "epoch": 2860, "val_loss": 77303.765625} {"train_loss": -6.653077125549316, "global_step": 120162, "epoch": 2861} {"train_loss": -6.622209548950195, "global_step": 120163, "epoch": 2861} {"train_loss": -6.662981033325195, "global_step": 120164, "epoch": 2861} {"train_loss": -6.6931047439575195, "global_step": 120165, "epoch": 2861} {"train_loss": -6.694094657897949, "global_step": 120166, "epoch": 2861} {"train_loss": -6.681707859039307, "global_step": 120167, "epoch": 2861} {"train_loss": -6.541285514831543, "global_step": 120168, "epoch": 2861} {"train_loss": -6.498647212982178, "global_step": 120169, "epoch": 2861} {"train_loss": -6.606548309326172, "global_step": 120170, "epoch": 2861} {"train_loss": -6.585392951965332, "global_step": 120171, "epoch": 2861} {"train_loss": -6.523951530456543, "global_step": 120172, "epoch": 2861} {"train_loss": -6.607515335083008, "global_step": 120173, "epoch": 2861} {"train_loss": -6.618525505065918, "global_step": 120174, "epoch": 2861} {"train_loss": -6.518029689788818, "global_step": 120175, "epoch": 2861} {"train_loss": -6.6157002449035645, "global_step": 120176, "epoch": 2861} {"train_loss": -6.575321197509766, "global_step": 120177, "epoch": 2861} {"train_loss": -6.562843322753906, "global_step": 120178, "epoch": 2861} {"train_loss": -6.593726634979248, "global_step": 120179, "epoch": 2861} {"train_loss": -6.613746643066406, "global_step": 120180, "epoch": 2861} {"train_loss": -6.562631130218506, "global_step": 120181, "epoch": 2861} {"train_loss": -6.61251163482666, "global_step": 120182, "epoch": 2861} {"train_loss": -6.662717819213867, "global_step": 120183, "epoch": 2861} {"train_loss": -6.5477166175842285, "global_step": 120184, "epoch": 2861} {"train_loss": -6.635793685913086, "global_step": 120185, "epoch": 2861} {"train_loss": -6.665348052978516, "global_step": 120186, "epoch": 2861} {"train_loss": -6.65074348449707, "global_step": 120187, "epoch": 2861} {"train_loss": -6.592259407043457, "global_step": 120188, "epoch": 2861} {"train_loss": -6.566001892089844, "global_step": 120189, "epoch": 2861} {"train_loss": -6.679882049560547, "global_step": 120190, "epoch": 2861} {"train_loss": -6.453068733215332, "global_step": 120191, "epoch": 2861} {"train_loss": -6.6219377517700195, "global_step": 120192, "epoch": 2861} {"train_loss": -6.574097156524658, "global_step": 120193, "epoch": 2861} {"train_loss": -6.50698184967041, "global_step": 120194, "epoch": 2861} {"train_loss": -6.655951976776123, "global_step": 120195, "epoch": 2861} {"train_loss": -6.625231742858887, "global_step": 120196, "epoch": 2861} {"train_loss": -6.53729248046875, "global_step": 120197, "epoch": 2861} {"train_loss": -6.59987211227417, "global_step": 120198, "epoch": 2861} {"train_loss": -6.571897506713867, "global_step": 120199, "epoch": 2861} {"train_loss": -6.585396766662598, "global_step": 120200, "epoch": 2861} {"train_loss": -6.617602348327637, "global_step": 120201, "epoch": 2861} {"train_loss": -6.625012397766113, "global_step": 120202, "epoch": 2861} {"train_loss": -6.599572908310663, "global_step": 120203, "epoch": 2861, "val_loss": 76733.296875} {"train_loss": -6.6037068367004395, "global_step": 120204, "epoch": 2862} {"train_loss": -6.66334342956543, "global_step": 120205, "epoch": 2862} {"train_loss": -6.627436637878418, "global_step": 120206, "epoch": 2862} {"train_loss": -6.623956203460693, "global_step": 120207, "epoch": 2862} {"train_loss": -6.650081634521484, "global_step": 120208, "epoch": 2862} {"train_loss": -6.7137532234191895, "global_step": 120209, "epoch": 2862} {"train_loss": -6.6334333419799805, "global_step": 120210, "epoch": 2862} {"train_loss": -6.519087791442871, "global_step": 120211, "epoch": 2862} {"train_loss": -6.47489070892334, "global_step": 120212, "epoch": 2862} {"train_loss": -6.52927303314209, "global_step": 120213, "epoch": 2862} {"train_loss": -6.464206695556641, "global_step": 120214, "epoch": 2862} {"train_loss": -6.637969493865967, "global_step": 120215, "epoch": 2862} {"train_loss": -6.512015342712402, "global_step": 120216, "epoch": 2862} {"train_loss": -6.352893829345703, "global_step": 120217, "epoch": 2862} {"train_loss": -6.464439868927002, "global_step": 120218, "epoch": 2862} {"train_loss": -6.516807556152344, "global_step": 120219, "epoch": 2862} {"train_loss": -6.588768005371094, "global_step": 120220, "epoch": 2862} {"train_loss": -6.5424113273620605, "global_step": 120221, "epoch": 2862} {"train_loss": -6.490039825439453, "global_step": 120222, "epoch": 2862} {"train_loss": -6.511966228485107, "global_step": 120223, "epoch": 2862} {"train_loss": -6.6581597328186035, "global_step": 120224, "epoch": 2862} {"train_loss": -6.518304347991943, "global_step": 120225, "epoch": 2862} {"train_loss": -6.474668502807617, "global_step": 120226, "epoch": 2862} {"train_loss": -6.5722551345825195, "global_step": 120227, "epoch": 2862} {"train_loss": -6.547563552856445, "global_step": 120228, "epoch": 2862} {"train_loss": -6.56965446472168, "global_step": 120229, "epoch": 2862} {"train_loss": -6.54948616027832, "global_step": 120230, "epoch": 2862} {"train_loss": -6.459979057312012, "global_step": 120231, "epoch": 2862} {"train_loss": -6.659603118896484, "global_step": 120232, "epoch": 2862} {"train_loss": -6.55836296081543, "global_step": 120233, "epoch": 2862} {"train_loss": -6.353465557098389, "global_step": 120234, "epoch": 2862} {"train_loss": -6.540663719177246, "global_step": 120235, "epoch": 2862} {"train_loss": -6.550450801849365, "global_step": 120236, "epoch": 2862} {"train_loss": -6.565489768981934, "global_step": 120237, "epoch": 2862} {"train_loss": -6.458580017089844, "global_step": 120238, "epoch": 2862} {"train_loss": -6.609920501708984, "global_step": 120239, "epoch": 2862} {"train_loss": -6.62971830368042, "global_step": 120240, "epoch": 2862} {"train_loss": -6.599180221557617, "global_step": 120241, "epoch": 2862} {"train_loss": -6.601406097412109, "global_step": 120242, "epoch": 2862} {"train_loss": -6.463084697723389, "global_step": 120243, "epoch": 2862} {"train_loss": -6.547609329223633, "global_step": 120244, "epoch": 2862} {"train_loss": -6.552076089949835, "global_step": 120245, "epoch": 2862, "val_loss": 76884.796875} {"train_loss": -6.526259422302246, "global_step": 120246, "epoch": 2863} {"train_loss": -6.581116676330566, "global_step": 120247, "epoch": 2863} {"train_loss": -6.659188270568848, "global_step": 120248, "epoch": 2863} {"train_loss": -6.6038947105407715, "global_step": 120249, "epoch": 2863} {"train_loss": -6.587279319763184, "global_step": 120250, "epoch": 2863} {"train_loss": -6.438253402709961, "global_step": 120251, "epoch": 2863} {"train_loss": -6.539111614227295, "global_step": 120252, "epoch": 2863} {"train_loss": -6.52823543548584, "global_step": 120253, "epoch": 2863} {"train_loss": -6.541478157043457, "global_step": 120254, "epoch": 2863} {"train_loss": -6.626750946044922, "global_step": 120255, "epoch": 2863} {"train_loss": -6.615790367126465, "global_step": 120256, "epoch": 2863} {"train_loss": -6.592379570007324, "global_step": 120257, "epoch": 2863} {"train_loss": -6.583871841430664, "global_step": 120258, "epoch": 2863} {"train_loss": -6.585412979125977, "global_step": 120259, "epoch": 2863} {"train_loss": -6.693700313568115, "global_step": 120260, "epoch": 2863} {"train_loss": -6.677145481109619, "global_step": 120261, "epoch": 2863} {"train_loss": -6.653168201446533, "global_step": 120262, "epoch": 2863} {"train_loss": -6.645833492279053, "global_step": 120263, "epoch": 2863} {"train_loss": -6.515605449676514, "global_step": 120264, "epoch": 2863} {"train_loss": -6.38836669921875, "global_step": 120265, "epoch": 2863} {"train_loss": -6.584661483764648, "global_step": 120266, "epoch": 2863} {"train_loss": -6.43768310546875, "global_step": 120267, "epoch": 2863} {"train_loss": -6.580966472625732, "global_step": 120268, "epoch": 2863} {"train_loss": -6.512141227722168, "global_step": 120269, "epoch": 2863} {"train_loss": -6.469861030578613, "global_step": 120270, "epoch": 2863} {"train_loss": -6.436415672302246, "global_step": 120271, "epoch": 2863} {"train_loss": -6.524346351623535, "global_step": 120272, "epoch": 2863} {"train_loss": -6.433323860168457, "global_step": 120273, "epoch": 2863} {"train_loss": -6.541547775268555, "global_step": 120274, "epoch": 2863} {"train_loss": -6.486952781677246, "global_step": 120275, "epoch": 2863} {"train_loss": -6.545395851135254, "global_step": 120276, "epoch": 2863} {"train_loss": -6.6070451736450195, "global_step": 120277, "epoch": 2863} {"train_loss": -6.557103157043457, "global_step": 120278, "epoch": 2863} {"train_loss": -6.561407089233398, "global_step": 120279, "epoch": 2863} {"train_loss": -6.451571464538574, "global_step": 120280, "epoch": 2863} {"train_loss": -6.62662410736084, "global_step": 120281, "epoch": 2863} {"train_loss": -6.576964378356934, "global_step": 120282, "epoch": 2863} {"train_loss": -6.471968173980713, "global_step": 120283, "epoch": 2863} {"train_loss": -6.540969371795654, "global_step": 120284, "epoch": 2863} {"train_loss": -6.537600994110107, "global_step": 120285, "epoch": 2863} {"train_loss": -6.448367118835449, "global_step": 120286, "epoch": 2863} {"train_loss": -6.545465401240757, "global_step": 120287, "epoch": 2863, "val_loss": 76969.0703125} {"train_loss": -6.5409698486328125, "global_step": 120288, "epoch": 2864} {"train_loss": -6.584059715270996, "global_step": 120289, "epoch": 2864} {"train_loss": -6.6573920249938965, "global_step": 120290, "epoch": 2864} {"train_loss": -6.5273661613464355, "global_step": 120291, "epoch": 2864} {"train_loss": -6.491993427276611, "global_step": 120292, "epoch": 2864} {"train_loss": -6.51711368560791, "global_step": 120293, "epoch": 2864} {"train_loss": -6.553801536560059, "global_step": 120294, "epoch": 2864} {"train_loss": -6.624768257141113, "global_step": 120295, "epoch": 2864} {"train_loss": -6.654243469238281, "global_step": 120296, "epoch": 2864} {"train_loss": -6.5633931159973145, "global_step": 120297, "epoch": 2864} {"train_loss": -6.570785999298096, "global_step": 120298, "epoch": 2864} {"train_loss": -6.567941665649414, "global_step": 120299, "epoch": 2864} {"train_loss": -6.691394805908203, "global_step": 120300, "epoch": 2864} {"train_loss": -6.562273025512695, "global_step": 120301, "epoch": 2864} {"train_loss": -6.534768581390381, "global_step": 120302, "epoch": 2864} {"train_loss": -6.561005592346191, "global_step": 120303, "epoch": 2864} {"train_loss": -6.6154584884643555, "global_step": 120304, "epoch": 2864} {"train_loss": -6.462245941162109, "global_step": 120305, "epoch": 2864} {"train_loss": -6.578947067260742, "global_step": 120306, "epoch": 2864} {"train_loss": -6.49685001373291, "global_step": 120307, "epoch": 2864} {"train_loss": -6.582352161407471, "global_step": 120308, "epoch": 2864} {"train_loss": -6.535656929016113, "global_step": 120309, "epoch": 2864} {"train_loss": -6.45865535736084, "global_step": 120310, "epoch": 2864} {"train_loss": -6.536232948303223, "global_step": 120311, "epoch": 2864} {"train_loss": -6.5667924880981445, "global_step": 120312, "epoch": 2864} {"train_loss": -6.561220169067383, "global_step": 120313, "epoch": 2864} {"train_loss": -6.575155258178711, "global_step": 120314, "epoch": 2864} {"train_loss": -6.579623699188232, "global_step": 120315, "epoch": 2864} {"train_loss": -6.592509746551514, "global_step": 120316, "epoch": 2864} {"train_loss": -6.71533203125, "global_step": 120317, "epoch": 2864} {"train_loss": -6.644952774047852, "global_step": 120318, "epoch": 2864} {"train_loss": -6.53004264831543, "global_step": 120319, "epoch": 2864} {"train_loss": -6.543332099914551, "global_step": 120320, "epoch": 2864} {"train_loss": -6.511506080627441, "global_step": 120321, "epoch": 2864} {"train_loss": -6.527651786804199, "global_step": 120322, "epoch": 2864} {"train_loss": -6.518692970275879, "global_step": 120323, "epoch": 2864} {"train_loss": -6.492282867431641, "global_step": 120324, "epoch": 2864} {"train_loss": -6.538999557495117, "global_step": 120325, "epoch": 2864} {"train_loss": -6.627811431884766, "global_step": 120326, "epoch": 2864} {"train_loss": -6.553463935852051, "global_step": 120327, "epoch": 2864} {"train_loss": -6.457635879516602, "global_step": 120328, "epoch": 2864} {"train_loss": -6.562901303881691, "global_step": 120329, "epoch": 2864, "val_loss": 76847.015625} {"train_loss": -6.429702281951904, "global_step": 120330, "epoch": 2865} {"train_loss": -6.569219589233398, "global_step": 120331, "epoch": 2865} {"train_loss": -6.604535102844238, "global_step": 120332, "epoch": 2865} {"train_loss": -6.478340148925781, "global_step": 120333, "epoch": 2865} {"train_loss": -6.61688232421875, "global_step": 120334, "epoch": 2865} {"train_loss": -6.540338039398193, "global_step": 120335, "epoch": 2865} {"train_loss": -6.584813117980957, "global_step": 120336, "epoch": 2865} {"train_loss": -6.645565032958984, "global_step": 120337, "epoch": 2865} {"train_loss": -6.582418441772461, "global_step": 120338, "epoch": 2865} {"train_loss": -6.582427978515625, "global_step": 120339, "epoch": 2865} {"train_loss": -6.687438011169434, "global_step": 120340, "epoch": 2865} {"train_loss": -6.405425071716309, "global_step": 120341, "epoch": 2865} {"train_loss": -6.482926368713379, "global_step": 120342, "epoch": 2865} {"train_loss": -6.512596130371094, "global_step": 120343, "epoch": 2865} {"train_loss": -6.531093597412109, "global_step": 120344, "epoch": 2865} {"train_loss": -6.742773056030273, "global_step": 120345, "epoch": 2865} {"train_loss": -6.619446754455566, "global_step": 120346, "epoch": 2865} {"train_loss": -6.634391784667969, "global_step": 120347, "epoch": 2865} {"train_loss": -6.436019420623779, "global_step": 120348, "epoch": 2865} {"train_loss": -6.630070209503174, "global_step": 120349, "epoch": 2865} {"train_loss": -6.549330234527588, "global_step": 120350, "epoch": 2865} {"train_loss": -6.613104820251465, "global_step": 120351, "epoch": 2865} {"train_loss": -6.5785722732543945, "global_step": 120352, "epoch": 2865} {"train_loss": -6.486407279968262, "global_step": 120353, "epoch": 2865} {"train_loss": -6.587928771972656, "global_step": 120354, "epoch": 2865} {"train_loss": -6.499294281005859, "global_step": 120355, "epoch": 2865} {"train_loss": -6.521657943725586, "global_step": 120356, "epoch": 2865} {"train_loss": -6.496642112731934, "global_step": 120357, "epoch": 2865} {"train_loss": -6.599722862243652, "global_step": 120358, "epoch": 2865} {"train_loss": -6.518324375152588, "global_step": 120359, "epoch": 2865} {"train_loss": -6.586688041687012, "global_step": 120360, "epoch": 2865} {"train_loss": -6.536524295806885, "global_step": 120361, "epoch": 2865} {"train_loss": -6.5190277099609375, "global_step": 120362, "epoch": 2865} {"train_loss": -6.683070659637451, "global_step": 120363, "epoch": 2865} {"train_loss": -6.487112045288086, "global_step": 120364, "epoch": 2865} {"train_loss": -6.593696117401123, "global_step": 120365, "epoch": 2865} {"train_loss": -6.639881134033203, "global_step": 120366, "epoch": 2865} {"train_loss": -6.506276607513428, "global_step": 120367, "epoch": 2865} {"train_loss": -6.614595413208008, "global_step": 120368, "epoch": 2865} {"train_loss": -6.55692195892334, "global_step": 120369, "epoch": 2865} {"train_loss": -6.544206619262695, "global_step": 120370, "epoch": 2865} {"train_loss": -6.5653614316667825, "global_step": 120371, "epoch": 2865, "val_loss": 76765.5390625} {"train_loss": -6.633855819702148, "global_step": 120372, "epoch": 2866} {"train_loss": -6.643596172332764, "global_step": 120373, "epoch": 2866} {"train_loss": -6.538527965545654, "global_step": 120374, "epoch": 2866} {"train_loss": -6.647673606872559, "global_step": 120375, "epoch": 2866} {"train_loss": -6.73516845703125, "global_step": 120376, "epoch": 2866} {"train_loss": -6.695276737213135, "global_step": 120377, "epoch": 2866} {"train_loss": -6.587342262268066, "global_step": 120378, "epoch": 2866} {"train_loss": -6.614205360412598, "global_step": 120379, "epoch": 2866} {"train_loss": -6.688077926635742, "global_step": 120380, "epoch": 2866} {"train_loss": -6.662647724151611, "global_step": 120381, "epoch": 2866} {"train_loss": -6.590582847595215, "global_step": 120382, "epoch": 2866} {"train_loss": -6.497744083404541, "global_step": 120383, "epoch": 2866} {"train_loss": -6.655735969543457, "global_step": 120384, "epoch": 2866} {"train_loss": -6.548215866088867, "global_step": 120385, "epoch": 2866} {"train_loss": -6.549447536468506, "global_step": 120386, "epoch": 2866} {"train_loss": -6.594555854797363, "global_step": 120387, "epoch": 2866} {"train_loss": -6.634174823760986, "global_step": 120388, "epoch": 2866} {"train_loss": -6.646174430847168, "global_step": 120389, "epoch": 2866} {"train_loss": -6.637307167053223, "global_step": 120390, "epoch": 2866} {"train_loss": -6.547316551208496, "global_step": 120391, "epoch": 2866} {"train_loss": -6.58257532119751, "global_step": 120392, "epoch": 2866} {"train_loss": -6.535021781921387, "global_step": 120393, "epoch": 2866} {"train_loss": -6.550284385681152, "global_step": 120394, "epoch": 2866} {"train_loss": -6.577210426330566, "global_step": 120395, "epoch": 2866} {"train_loss": -6.596584320068359, "global_step": 120396, "epoch": 2866} {"train_loss": -6.628612518310547, "global_step": 120397, "epoch": 2866} {"train_loss": -6.748591423034668, "global_step": 120398, "epoch": 2866} {"train_loss": -6.6011457443237305, "global_step": 120399, "epoch": 2866} {"train_loss": -6.588468551635742, "global_step": 120400, "epoch": 2866} {"train_loss": -6.490056037902832, "global_step": 120401, "epoch": 2866} {"train_loss": -6.50368595123291, "global_step": 120402, "epoch": 2866} {"train_loss": -6.576891899108887, "global_step": 120403, "epoch": 2866} {"train_loss": -6.499602317810059, "global_step": 120404, "epoch": 2866} {"train_loss": -6.5293498039245605, "global_step": 120405, "epoch": 2866} {"train_loss": -6.531883716583252, "global_step": 120406, "epoch": 2866} {"train_loss": -6.642678737640381, "global_step": 120407, "epoch": 2866} {"train_loss": -6.5214433670043945, "global_step": 120408, "epoch": 2866} {"train_loss": -6.57866907119751, "global_step": 120409, "epoch": 2866} {"train_loss": -6.623218536376953, "global_step": 120410, "epoch": 2866} {"train_loss": -6.6067914962768555, "global_step": 120411, "epoch": 2866} {"train_loss": -6.699853897094727, "global_step": 120412, "epoch": 2866} {"train_loss": -6.598636547724406, "global_step": 120413, "epoch": 2866, "val_loss": 76922.1015625} {"train_loss": -6.6488142013549805, "global_step": 120414, "epoch": 2867} {"train_loss": -6.535121917724609, "global_step": 120415, "epoch": 2867} {"train_loss": -6.694447040557861, "global_step": 120416, "epoch": 2867} {"train_loss": -6.649659633636475, "global_step": 120417, "epoch": 2867} {"train_loss": -6.585112571716309, "global_step": 120418, "epoch": 2867} {"train_loss": -6.618143081665039, "global_step": 120419, "epoch": 2867} {"train_loss": -6.745638847351074, "global_step": 120420, "epoch": 2867} {"train_loss": -6.619234085083008, "global_step": 120421, "epoch": 2867} {"train_loss": -6.710725784301758, "global_step": 120422, "epoch": 2867} {"train_loss": -6.662803649902344, "global_step": 120423, "epoch": 2867} {"train_loss": -6.530993938446045, "global_step": 120424, "epoch": 2867} {"train_loss": -6.600957870483398, "global_step": 120425, "epoch": 2867} {"train_loss": -6.644006729125977, "global_step": 120426, "epoch": 2867} {"train_loss": -6.514395713806152, "global_step": 120427, "epoch": 2867} {"train_loss": -6.621713638305664, "global_step": 120428, "epoch": 2867} {"train_loss": -6.626913070678711, "global_step": 120429, "epoch": 2867} {"train_loss": -6.5204362869262695, "global_step": 120430, "epoch": 2867} {"train_loss": -6.643982887268066, "global_step": 120431, "epoch": 2867} {"train_loss": -6.475465774536133, "global_step": 120432, "epoch": 2867} {"train_loss": -6.543507099151611, "global_step": 120433, "epoch": 2867} {"train_loss": -6.669159889221191, "global_step": 120434, "epoch": 2867} {"train_loss": -6.568256378173828, "global_step": 120435, "epoch": 2867} {"train_loss": -6.575952053070068, "global_step": 120436, "epoch": 2867} {"train_loss": -6.587132930755615, "global_step": 120437, "epoch": 2867} {"train_loss": -6.49485969543457, "global_step": 120438, "epoch": 2867} {"train_loss": -6.635838985443115, "global_step": 120439, "epoch": 2867} {"train_loss": -6.4912567138671875, "global_step": 120440, "epoch": 2867} {"train_loss": -6.528639316558838, "global_step": 120441, "epoch": 2867} {"train_loss": -6.612368583679199, "global_step": 120442, "epoch": 2867} {"train_loss": -6.507955551147461, "global_step": 120443, "epoch": 2867} {"train_loss": -6.51312255859375, "global_step": 120444, "epoch": 2867} {"train_loss": -6.687949180603027, "global_step": 120445, "epoch": 2867} {"train_loss": -6.58530330657959, "global_step": 120446, "epoch": 2867} {"train_loss": -6.581345558166504, "global_step": 120447, "epoch": 2867} {"train_loss": -6.376341819763184, "global_step": 120448, "epoch": 2867} {"train_loss": -6.532937049865723, "global_step": 120449, "epoch": 2867} {"train_loss": -6.5180158615112305, "global_step": 120450, "epoch": 2867} {"train_loss": -6.62053108215332, "global_step": 120451, "epoch": 2867} {"train_loss": -6.680280685424805, "global_step": 120452, "epoch": 2867} {"train_loss": -6.540066242218018, "global_step": 120453, "epoch": 2867} {"train_loss": -6.502422332763672, "global_step": 120454, "epoch": 2867} {"train_loss": -6.584481477737427, "global_step": 120455, "epoch": 2867, "val_loss": 76769.5078125} {"train_loss": -6.605010032653809, "global_step": 120456, "epoch": 2868} {"train_loss": -6.703982353210449, "global_step": 120457, "epoch": 2868} {"train_loss": -6.660876750946045, "global_step": 120458, "epoch": 2868} {"train_loss": -6.634517669677734, "global_step": 120459, "epoch": 2868} {"train_loss": -6.541803359985352, "global_step": 120460, "epoch": 2868} {"train_loss": -6.539770126342773, "global_step": 120461, "epoch": 2868} {"train_loss": -6.675751686096191, "global_step": 120462, "epoch": 2868} {"train_loss": -6.594132423400879, "global_step": 120463, "epoch": 2868} {"train_loss": -6.629092693328857, "global_step": 120464, "epoch": 2868} {"train_loss": -6.524720668792725, "global_step": 120465, "epoch": 2868} {"train_loss": -6.678178310394287, "global_step": 120466, "epoch": 2868} {"train_loss": -6.622414588928223, "global_step": 120467, "epoch": 2868} {"train_loss": -6.594992637634277, "global_step": 120468, "epoch": 2868} {"train_loss": -6.483008861541748, "global_step": 120469, "epoch": 2868} {"train_loss": -6.673024654388428, "global_step": 120470, "epoch": 2868} {"train_loss": -6.520544528961182, "global_step": 120471, "epoch": 2868} {"train_loss": -6.530501842498779, "global_step": 120472, "epoch": 2868} {"train_loss": -6.5941290855407715, "global_step": 120473, "epoch": 2868} {"train_loss": -6.647075653076172, "global_step": 120474, "epoch": 2868} {"train_loss": -6.598998069763184, "global_step": 120475, "epoch": 2868} {"train_loss": -6.4714508056640625, "global_step": 120476, "epoch": 2868} {"train_loss": -6.547328948974609, "global_step": 120477, "epoch": 2868} {"train_loss": -6.441728591918945, "global_step": 120478, "epoch": 2868} {"train_loss": -6.43589448928833, "global_step": 120479, "epoch": 2868} {"train_loss": -6.389101505279541, "global_step": 120480, "epoch": 2868} {"train_loss": -6.583730220794678, "global_step": 120481, "epoch": 2868} {"train_loss": -6.430045127868652, "global_step": 120482, "epoch": 2868} {"train_loss": -6.551548004150391, "global_step": 120483, "epoch": 2868} {"train_loss": -6.5903778076171875, "global_step": 120484, "epoch": 2868} {"train_loss": -6.481447696685791, "global_step": 120485, "epoch": 2868} {"train_loss": -6.4924421310424805, "global_step": 120486, "epoch": 2868} {"train_loss": -6.579436302185059, "global_step": 120487, "epoch": 2868} {"train_loss": -6.516604423522949, "global_step": 120488, "epoch": 2868} {"train_loss": -6.569336891174316, "global_step": 120489, "epoch": 2868} {"train_loss": -6.574214935302734, "global_step": 120490, "epoch": 2868} {"train_loss": -6.635415077209473, "global_step": 120491, "epoch": 2868} {"train_loss": -6.536006927490234, "global_step": 120492, "epoch": 2868} {"train_loss": -6.491066932678223, "global_step": 120493, "epoch": 2868} {"train_loss": -6.46912956237793, "global_step": 120494, "epoch": 2868} {"train_loss": -6.587981224060059, "global_step": 120495, "epoch": 2868} {"train_loss": -6.59104061126709, "global_step": 120496, "epoch": 2868} {"train_loss": -6.5653035300118585, "global_step": 120497, "epoch": 2868, "val_loss": 77046.09375} {"train_loss": -6.53421688079834, "global_step": 120498, "epoch": 2869} {"train_loss": -6.517763137817383, "global_step": 120499, "epoch": 2869} {"train_loss": -6.568737030029297, "global_step": 120500, "epoch": 2869} {"train_loss": -6.602542877197266, "global_step": 120501, "epoch": 2869} {"train_loss": -6.5874552726745605, "global_step": 120502, "epoch": 2869} {"train_loss": -6.548303604125977, "global_step": 120503, "epoch": 2869} {"train_loss": -6.554960250854492, "global_step": 120504, "epoch": 2869} {"train_loss": -6.54278564453125, "global_step": 120505, "epoch": 2869} {"train_loss": -6.528802871704102, "global_step": 120506, "epoch": 2869} {"train_loss": -6.542220592498779, "global_step": 120507, "epoch": 2869} {"train_loss": -6.445160865783691, "global_step": 120508, "epoch": 2869} {"train_loss": -6.54856014251709, "global_step": 120509, "epoch": 2869} {"train_loss": -6.51789665222168, "global_step": 120510, "epoch": 2869} {"train_loss": -6.503037452697754, "global_step": 120511, "epoch": 2869} {"train_loss": -6.529358386993408, "global_step": 120512, "epoch": 2869} {"train_loss": -6.513304710388184, "global_step": 120513, "epoch": 2869} {"train_loss": -6.519035339355469, "global_step": 120514, "epoch": 2869} {"train_loss": -6.542047500610352, "global_step": 120515, "epoch": 2869} {"train_loss": -6.528241157531738, "global_step": 120516, "epoch": 2869} {"train_loss": -6.518862724304199, "global_step": 120517, "epoch": 2869} {"train_loss": -6.561842918395996, "global_step": 120518, "epoch": 2869} {"train_loss": -6.413748741149902, "global_step": 120519, "epoch": 2869} {"train_loss": -6.5915093421936035, "global_step": 120520, "epoch": 2869} {"train_loss": -6.643424034118652, "global_step": 120521, "epoch": 2869} {"train_loss": -6.578557968139648, "global_step": 120522, "epoch": 2869} {"train_loss": -6.607605457305908, "global_step": 120523, "epoch": 2869} {"train_loss": -6.529850006103516, "global_step": 120524, "epoch": 2869} {"train_loss": -6.484855651855469, "global_step": 120525, "epoch": 2869} {"train_loss": -6.581823348999023, "global_step": 120526, "epoch": 2869} {"train_loss": -6.567841529846191, "global_step": 120527, "epoch": 2869} {"train_loss": -6.587711811065674, "global_step": 120528, "epoch": 2869} {"train_loss": -6.460933685302734, "global_step": 120529, "epoch": 2869} {"train_loss": -6.532197952270508, "global_step": 120530, "epoch": 2869} {"train_loss": -6.625741004943848, "global_step": 120531, "epoch": 2869} {"train_loss": -6.611317157745361, "global_step": 120532, "epoch": 2869} {"train_loss": -6.443685531616211, "global_step": 120533, "epoch": 2869} {"train_loss": -6.46555757522583, "global_step": 120534, "epoch": 2869} {"train_loss": -6.691492080688477, "global_step": 120535, "epoch": 2869} {"train_loss": -6.515582084655762, "global_step": 120536, "epoch": 2869} {"train_loss": -6.497492790222168, "global_step": 120537, "epoch": 2869} {"train_loss": -6.572164535522461, "global_step": 120538, "epoch": 2869} {"train_loss": -6.542095717929659, "global_step": 120539, "epoch": 2869, "val_loss": 76838.2421875} {"train_loss": -6.537164688110352, "global_step": 120540, "epoch": 2870} {"train_loss": -6.457122325897217, "global_step": 120541, "epoch": 2870} {"train_loss": -6.519939422607422, "global_step": 120542, "epoch": 2870} {"train_loss": -6.535219669342041, "global_step": 120543, "epoch": 2870} {"train_loss": -6.5053558349609375, "global_step": 120544, "epoch": 2870} {"train_loss": -6.54468297958374, "global_step": 120545, "epoch": 2870} {"train_loss": -6.493890762329102, "global_step": 120546, "epoch": 2870} {"train_loss": -6.576598167419434, "global_step": 120547, "epoch": 2870} {"train_loss": -6.50600528717041, "global_step": 120548, "epoch": 2870} {"train_loss": -6.559562683105469, "global_step": 120549, "epoch": 2870} {"train_loss": -6.547256946563721, "global_step": 120550, "epoch": 2870} {"train_loss": -6.612447261810303, "global_step": 120551, "epoch": 2870} {"train_loss": -6.625446319580078, "global_step": 120552, "epoch": 2870} {"train_loss": -6.4796223640441895, "global_step": 120553, "epoch": 2870} {"train_loss": -6.5528883934021, "global_step": 120554, "epoch": 2870} {"train_loss": -6.523404598236084, "global_step": 120555, "epoch": 2870} {"train_loss": -6.521096229553223, "global_step": 120556, "epoch": 2870} {"train_loss": -6.543721675872803, "global_step": 120557, "epoch": 2870} {"train_loss": -6.618687152862549, "global_step": 120558, "epoch": 2870} {"train_loss": -6.518035411834717, "global_step": 120559, "epoch": 2870} {"train_loss": -6.5394768714904785, "global_step": 120560, "epoch": 2870} {"train_loss": -6.671771049499512, "global_step": 120561, "epoch": 2870} {"train_loss": -6.692979335784912, "global_step": 120562, "epoch": 2870} {"train_loss": -6.583155155181885, "global_step": 120563, "epoch": 2870} {"train_loss": -6.606101989746094, "global_step": 120564, "epoch": 2870} {"train_loss": -6.623213768005371, "global_step": 120565, "epoch": 2870} {"train_loss": -6.63861083984375, "global_step": 120566, "epoch": 2870} {"train_loss": -6.4879655838012695, "global_step": 120567, "epoch": 2870} {"train_loss": -6.622648239135742, "global_step": 120568, "epoch": 2870} {"train_loss": -6.590948104858398, "global_step": 120569, "epoch": 2870} {"train_loss": -6.694616317749023, "global_step": 120570, "epoch": 2870} {"train_loss": -6.611997604370117, "global_step": 120571, "epoch": 2870} {"train_loss": -6.57322359085083, "global_step": 120572, "epoch": 2870} {"train_loss": -6.641773700714111, "global_step": 120573, "epoch": 2870} {"train_loss": -6.592561721801758, "global_step": 120574, "epoch": 2870} {"train_loss": -6.694571495056152, "global_step": 120575, "epoch": 2870} {"train_loss": -6.663963794708252, "global_step": 120576, "epoch": 2870} {"train_loss": -6.64112663269043, "global_step": 120577, "epoch": 2870} {"train_loss": -6.534341335296631, "global_step": 120578, "epoch": 2870} {"train_loss": -6.618213653564453, "global_step": 120579, "epoch": 2870} {"train_loss": -6.558803558349609, "global_step": 120580, "epoch": 2870} {"train_loss": -6.579214890797933, "global_step": 120581, "epoch": 2870, "val_loss": 76964.625} {"train_loss": -6.620593547821045, "global_step": 120582, "epoch": 2871} {"train_loss": -6.548678398132324, "global_step": 120583, "epoch": 2871} {"train_loss": -6.601709365844727, "global_step": 120584, "epoch": 2871} {"train_loss": -6.658289909362793, "global_step": 120585, "epoch": 2871} {"train_loss": -6.649384498596191, "global_step": 120586, "epoch": 2871} {"train_loss": -6.6815667152404785, "global_step": 120587, "epoch": 2871} {"train_loss": -6.620522499084473, "global_step": 120588, "epoch": 2871} {"train_loss": -6.626271724700928, "global_step": 120589, "epoch": 2871} {"train_loss": -6.5476298332214355, "global_step": 120590, "epoch": 2871} {"train_loss": -6.603565216064453, "global_step": 120591, "epoch": 2871} {"train_loss": -6.621764183044434, "global_step": 120592, "epoch": 2871} {"train_loss": -6.514422416687012, "global_step": 120593, "epoch": 2871} {"train_loss": -6.695892333984375, "global_step": 120594, "epoch": 2871} {"train_loss": -6.466825485229492, "global_step": 120595, "epoch": 2871} {"train_loss": -6.495842933654785, "global_step": 120596, "epoch": 2871} {"train_loss": -6.680977821350098, "global_step": 120597, "epoch": 2871} {"train_loss": -6.429312705993652, "global_step": 120598, "epoch": 2871} {"train_loss": -6.512692928314209, "global_step": 120599, "epoch": 2871} {"train_loss": -6.553289413452148, "global_step": 120600, "epoch": 2871} {"train_loss": -6.6356072425842285, "global_step": 120601, "epoch": 2871} {"train_loss": -6.475960731506348, "global_step": 120602, "epoch": 2871} {"train_loss": -6.7140960693359375, "global_step": 120603, "epoch": 2871} {"train_loss": -6.547093868255615, "global_step": 120604, "epoch": 2871} {"train_loss": -6.559993743896484, "global_step": 120605, "epoch": 2871} {"train_loss": -6.502735614776611, "global_step": 120606, "epoch": 2871} {"train_loss": -6.512173652648926, "global_step": 120607, "epoch": 2871} {"train_loss": -6.566003799438477, "global_step": 120608, "epoch": 2871} {"train_loss": -6.624278545379639, "global_step": 120609, "epoch": 2871} {"train_loss": -6.457633972167969, "global_step": 120610, "epoch": 2871} {"train_loss": -6.490887641906738, "global_step": 120611, "epoch": 2871} {"train_loss": -6.5267415046691895, "global_step": 120612, "epoch": 2871} {"train_loss": -6.459188461303711, "global_step": 120613, "epoch": 2871} {"train_loss": -6.672608852386475, "global_step": 120614, "epoch": 2871} {"train_loss": -6.535449981689453, "global_step": 120615, "epoch": 2871} {"train_loss": -6.610906600952148, "global_step": 120616, "epoch": 2871} {"train_loss": -6.572922706604004, "global_step": 120617, "epoch": 2871} {"train_loss": -6.460721969604492, "global_step": 120618, "epoch": 2871} {"train_loss": -6.516451835632324, "global_step": 120619, "epoch": 2871} {"train_loss": -6.542441368103027, "global_step": 120620, "epoch": 2871} {"train_loss": -6.53646183013916, "global_step": 120621, "epoch": 2871} {"train_loss": -6.524245262145996, "global_step": 120622, "epoch": 2871} {"train_loss": -6.565605095454624, "global_step": 120623, "epoch": 2871, "val_loss": 76810.4453125} {"train_loss": -6.531771659851074, "global_step": 120624, "epoch": 2872} {"train_loss": -6.664149761199951, "global_step": 120625, "epoch": 2872} {"train_loss": -6.535207271575928, "global_step": 120626, "epoch": 2872} {"train_loss": -6.605003356933594, "global_step": 120627, "epoch": 2872} {"train_loss": -6.588268756866455, "global_step": 120628, "epoch": 2872} {"train_loss": -6.510908126831055, "global_step": 120629, "epoch": 2872} {"train_loss": -6.635622978210449, "global_step": 120630, "epoch": 2872} {"train_loss": -6.689165115356445, "global_step": 120631, "epoch": 2872} {"train_loss": -6.541046142578125, "global_step": 120632, "epoch": 2872} {"train_loss": -6.516555309295654, "global_step": 120633, "epoch": 2872} {"train_loss": -6.594031810760498, "global_step": 120634, "epoch": 2872} {"train_loss": -6.557102203369141, "global_step": 120635, "epoch": 2872} {"train_loss": -6.404952049255371, "global_step": 120636, "epoch": 2872} {"train_loss": -6.645711898803711, "global_step": 120637, "epoch": 2872} {"train_loss": -6.642412185668945, "global_step": 120638, "epoch": 2872} {"train_loss": -6.615438461303711, "global_step": 120639, "epoch": 2872} {"train_loss": -6.600286960601807, "global_step": 120640, "epoch": 2872} {"train_loss": -6.495911598205566, "global_step": 120641, "epoch": 2872} {"train_loss": -6.555949687957764, "global_step": 120642, "epoch": 2872} {"train_loss": -6.452018737792969, "global_step": 120643, "epoch": 2872} {"train_loss": -6.461310386657715, "global_step": 120644, "epoch": 2872} {"train_loss": -6.5570759773254395, "global_step": 120645, "epoch": 2872} {"train_loss": -6.553056716918945, "global_step": 120646, "epoch": 2872} {"train_loss": -6.494100570678711, "global_step": 120647, "epoch": 2872} {"train_loss": -6.68419075012207, "global_step": 120648, "epoch": 2872} {"train_loss": -6.495505332946777, "global_step": 120649, "epoch": 2872} {"train_loss": -6.563969135284424, "global_step": 120650, "epoch": 2872} {"train_loss": -6.514540672302246, "global_step": 120651, "epoch": 2872} {"train_loss": -6.469111442565918, "global_step": 120652, "epoch": 2872} {"train_loss": -6.506351470947266, "global_step": 120653, "epoch": 2872} {"train_loss": -6.5906171798706055, "global_step": 120654, "epoch": 2872} {"train_loss": -6.5666327476501465, "global_step": 120655, "epoch": 2872} {"train_loss": -6.5893049240112305, "global_step": 120656, "epoch": 2872} {"train_loss": -6.5888214111328125, "global_step": 120657, "epoch": 2872} {"train_loss": -6.5228376388549805, "global_step": 120658, "epoch": 2872} {"train_loss": -6.677369117736816, "global_step": 120659, "epoch": 2872} {"train_loss": -6.620913028717041, "global_step": 120660, "epoch": 2872} {"train_loss": -6.591909885406494, "global_step": 120661, "epoch": 2872} {"train_loss": -6.621760368347168, "global_step": 120662, "epoch": 2872} {"train_loss": -6.67609977722168, "global_step": 120663, "epoch": 2872} {"train_loss": -6.634562015533447, "global_step": 120664, "epoch": 2872} {"train_loss": -6.571854909261067, "global_step": 120665, "epoch": 2872, "val_loss": 76935.1640625} {"train_loss": -6.568618297576904, "global_step": 120666, "epoch": 2873} {"train_loss": -6.589557647705078, "global_step": 120667, "epoch": 2873} {"train_loss": -6.7471923828125, "global_step": 120668, "epoch": 2873} {"train_loss": -6.5038604736328125, "global_step": 120669, "epoch": 2873} {"train_loss": -6.603472709655762, "global_step": 120670, "epoch": 2873} {"train_loss": -6.7764692306518555, "global_step": 120671, "epoch": 2873} {"train_loss": -6.618905067443848, "global_step": 120672, "epoch": 2873} {"train_loss": -6.406728744506836, "global_step": 120673, "epoch": 2873} {"train_loss": -6.671102523803711, "global_step": 120674, "epoch": 2873} {"train_loss": -6.670901298522949, "global_step": 120675, "epoch": 2873} {"train_loss": -6.559741020202637, "global_step": 120676, "epoch": 2873} {"train_loss": -6.635256767272949, "global_step": 120677, "epoch": 2873} {"train_loss": -6.507002830505371, "global_step": 120678, "epoch": 2873} {"train_loss": -6.549369812011719, "global_step": 120679, "epoch": 2873} {"train_loss": -6.557811260223389, "global_step": 120680, "epoch": 2873} {"train_loss": -6.697958469390869, "global_step": 120681, "epoch": 2873} {"train_loss": -6.565598964691162, "global_step": 120682, "epoch": 2873} {"train_loss": -6.652567386627197, "global_step": 120683, "epoch": 2873} {"train_loss": -6.580425262451172, "global_step": 120684, "epoch": 2873} {"train_loss": -6.511688709259033, "global_step": 120685, "epoch": 2873} {"train_loss": -6.450797080993652, "global_step": 120686, "epoch": 2873} {"train_loss": -6.4577765464782715, "global_step": 120687, "epoch": 2873} {"train_loss": -6.441769599914551, "global_step": 120688, "epoch": 2873} {"train_loss": -6.622369289398193, "global_step": 120689, "epoch": 2873} {"train_loss": -6.436933994293213, "global_step": 120690, "epoch": 2873} {"train_loss": -6.4974365234375, "global_step": 120691, "epoch": 2873} {"train_loss": -6.375208377838135, "global_step": 120692, "epoch": 2873} {"train_loss": -6.520159721374512, "global_step": 120693, "epoch": 2873} {"train_loss": -6.434078693389893, "global_step": 120694, "epoch": 2873} {"train_loss": -6.48293399810791, "global_step": 120695, "epoch": 2873} {"train_loss": -6.515316009521484, "global_step": 120696, "epoch": 2873} {"train_loss": -6.5889573097229, "global_step": 120697, "epoch": 2873} {"train_loss": -6.466902256011963, "global_step": 120698, "epoch": 2873} {"train_loss": -6.430273056030273, "global_step": 120699, "epoch": 2873} {"train_loss": -6.494688034057617, "global_step": 120700, "epoch": 2873} {"train_loss": -6.565124988555908, "global_step": 120701, "epoch": 2873} {"train_loss": -6.500183582305908, "global_step": 120702, "epoch": 2873} {"train_loss": -6.43931770324707, "global_step": 120703, "epoch": 2873} {"train_loss": -6.540639877319336, "global_step": 120704, "epoch": 2873} {"train_loss": -6.392390251159668, "global_step": 120705, "epoch": 2873} {"train_loss": -6.555262088775635, "global_step": 120706, "epoch": 2873} {"train_loss": -6.537954829988026, "global_step": 120707, "epoch": 2873, "val_loss": 77193.390625} {"train_loss": -6.54313325881958, "global_step": 120708, "epoch": 2874} {"train_loss": -6.421975612640381, "global_step": 120709, "epoch": 2874} {"train_loss": -6.66046667098999, "global_step": 120710, "epoch": 2874} {"train_loss": -6.498306751251221, "global_step": 120711, "epoch": 2874} {"train_loss": -6.5777435302734375, "global_step": 120712, "epoch": 2874} {"train_loss": -6.50032901763916, "global_step": 120713, "epoch": 2874} {"train_loss": -6.578090667724609, "global_step": 120714, "epoch": 2874} {"train_loss": -6.615873336791992, "global_step": 120715, "epoch": 2874} {"train_loss": -6.602426528930664, "global_step": 120716, "epoch": 2874} {"train_loss": -6.5550031661987305, "global_step": 120717, "epoch": 2874} {"train_loss": -6.502562999725342, "global_step": 120718, "epoch": 2874} {"train_loss": -6.6226983070373535, "global_step": 120719, "epoch": 2874} {"train_loss": -6.532061576843262, "global_step": 120720, "epoch": 2874} {"train_loss": -6.594265937805176, "global_step": 120721, "epoch": 2874} {"train_loss": -6.556350231170654, "global_step": 120722, "epoch": 2874} {"train_loss": -6.469302177429199, "global_step": 120723, "epoch": 2874} {"train_loss": -6.476431369781494, "global_step": 120724, "epoch": 2874} {"train_loss": -6.730951309204102, "global_step": 120725, "epoch": 2874} {"train_loss": -6.476315975189209, "global_step": 120726, "epoch": 2874} {"train_loss": -6.581330299377441, "global_step": 120727, "epoch": 2874} {"train_loss": -6.598393440246582, "global_step": 120728, "epoch": 2874} {"train_loss": -6.52918815612793, "global_step": 120729, "epoch": 2874} {"train_loss": -6.601884841918945, "global_step": 120730, "epoch": 2874} {"train_loss": -6.467316150665283, "global_step": 120731, "epoch": 2874} {"train_loss": -6.537595748901367, "global_step": 120732, "epoch": 2874} {"train_loss": -6.605608940124512, "global_step": 120733, "epoch": 2874} {"train_loss": -6.490761756896973, "global_step": 120734, "epoch": 2874} {"train_loss": -6.630924224853516, "global_step": 120735, "epoch": 2874} {"train_loss": -6.45515251159668, "global_step": 120736, "epoch": 2874} {"train_loss": -6.452850341796875, "global_step": 120737, "epoch": 2874} {"train_loss": -6.4392008781433105, "global_step": 120738, "epoch": 2874} {"train_loss": -6.532132625579834, "global_step": 120739, "epoch": 2874} {"train_loss": -6.610990524291992, "global_step": 120740, "epoch": 2874} {"train_loss": -6.537585258483887, "global_step": 120741, "epoch": 2874} {"train_loss": -6.488206386566162, "global_step": 120742, "epoch": 2874} {"train_loss": -6.494697570800781, "global_step": 120743, "epoch": 2874} {"train_loss": -6.455170154571533, "global_step": 120744, "epoch": 2874} {"train_loss": -6.438774585723877, "global_step": 120745, "epoch": 2874} {"train_loss": -6.559276580810547, "global_step": 120746, "epoch": 2874} {"train_loss": -6.54770565032959, "global_step": 120747, "epoch": 2874} {"train_loss": -6.447907447814941, "global_step": 120748, "epoch": 2874} {"train_loss": -6.536480449494862, "global_step": 120749, "epoch": 2874, "val_loss": 76970.1640625} {"train_loss": -6.576168060302734, "global_step": 120750, "epoch": 2875} {"train_loss": -6.5955491065979, "global_step": 120751, "epoch": 2875} {"train_loss": -6.522688865661621, "global_step": 120752, "epoch": 2875} {"train_loss": -6.593874931335449, "global_step": 120753, "epoch": 2875} {"train_loss": -6.641635417938232, "global_step": 120754, "epoch": 2875} {"train_loss": -6.541721820831299, "global_step": 120755, "epoch": 2875} {"train_loss": -6.6477274894714355, "global_step": 120756, "epoch": 2875} {"train_loss": -6.604696273803711, "global_step": 120757, "epoch": 2875} {"train_loss": -6.571053504943848, "global_step": 120758, "epoch": 2875} {"train_loss": -6.649933338165283, "global_step": 120759, "epoch": 2875} {"train_loss": -6.561198711395264, "global_step": 120760, "epoch": 2875} {"train_loss": -6.611043453216553, "global_step": 120761, "epoch": 2875} {"train_loss": -6.637445449829102, "global_step": 120762, "epoch": 2875} {"train_loss": -6.616759300231934, "global_step": 120763, "epoch": 2875} {"train_loss": -6.655545711517334, "global_step": 120764, "epoch": 2875} {"train_loss": -6.597988128662109, "global_step": 120765, "epoch": 2875} {"train_loss": -6.564152717590332, "global_step": 120766, "epoch": 2875} {"train_loss": -6.609262943267822, "global_step": 120767, "epoch": 2875} {"train_loss": -6.534947395324707, "global_step": 120768, "epoch": 2875} {"train_loss": -6.598094940185547, "global_step": 120769, "epoch": 2875} {"train_loss": -6.617736339569092, "global_step": 120770, "epoch": 2875} {"train_loss": -6.53605318069458, "global_step": 120771, "epoch": 2875} {"train_loss": -6.599618434906006, "global_step": 120772, "epoch": 2875} {"train_loss": -6.560945510864258, "global_step": 120773, "epoch": 2875} {"train_loss": -6.657224655151367, "global_step": 120774, "epoch": 2875} {"train_loss": -6.651926040649414, "global_step": 120775, "epoch": 2875} {"train_loss": -6.610159397125244, "global_step": 120776, "epoch": 2875} {"train_loss": -6.594209671020508, "global_step": 120777, "epoch": 2875} {"train_loss": -6.618786811828613, "global_step": 120778, "epoch": 2875} {"train_loss": -6.524247169494629, "global_step": 120779, "epoch": 2875} {"train_loss": -6.5243353843688965, "global_step": 120780, "epoch": 2875} {"train_loss": -6.534049034118652, "global_step": 120781, "epoch": 2875} {"train_loss": -6.600937366485596, "global_step": 120782, "epoch": 2875} {"train_loss": -6.575572967529297, "global_step": 120783, "epoch": 2875} {"train_loss": -6.656457424163818, "global_step": 120784, "epoch": 2875} {"train_loss": -6.589215278625488, "global_step": 120785, "epoch": 2875} {"train_loss": -6.558005332946777, "global_step": 120786, "epoch": 2875} {"train_loss": -6.493846893310547, "global_step": 120787, "epoch": 2875} {"train_loss": -6.5650177001953125, "global_step": 120788, "epoch": 2875} {"train_loss": -6.491039276123047, "global_step": 120789, "epoch": 2875} {"train_loss": -6.518143653869629, "global_step": 120790, "epoch": 2875} {"train_loss": -6.583167552947998, "global_step": 120791, "epoch": 2875, "val_loss": 77100.2421875} {"train_loss": -6.603682518005371, "global_step": 120792, "epoch": 2876} {"train_loss": -6.541801929473877, "global_step": 120793, "epoch": 2876} {"train_loss": -6.654407978057861, "global_step": 120794, "epoch": 2876} {"train_loss": -6.5298075675964355, "global_step": 120795, "epoch": 2876} {"train_loss": -6.694563865661621, "global_step": 120796, "epoch": 2876} {"train_loss": -6.6377692222595215, "global_step": 120797, "epoch": 2876} {"train_loss": -6.62490177154541, "global_step": 120798, "epoch": 2876} {"train_loss": -6.6058173179626465, "global_step": 120799, "epoch": 2876} {"train_loss": -6.580583572387695, "global_step": 120800, "epoch": 2876} {"train_loss": -6.649736404418945, "global_step": 120801, "epoch": 2876} {"train_loss": -6.608146667480469, "global_step": 120802, "epoch": 2876} {"train_loss": -6.512187480926514, "global_step": 120803, "epoch": 2876} {"train_loss": -6.621373176574707, "global_step": 120804, "epoch": 2876} {"train_loss": -6.497163772583008, "global_step": 120805, "epoch": 2876} {"train_loss": -6.717479705810547, "global_step": 120806, "epoch": 2876} {"train_loss": -6.541460990905762, "global_step": 120807, "epoch": 2876} {"train_loss": -6.690336227416992, "global_step": 120808, "epoch": 2876} {"train_loss": -6.475829601287842, "global_step": 120809, "epoch": 2876} {"train_loss": -6.481367588043213, "global_step": 120810, "epoch": 2876} {"train_loss": -6.573854446411133, "global_step": 120811, "epoch": 2876} {"train_loss": -6.6549177169799805, "global_step": 120812, "epoch": 2876} {"train_loss": -6.585430145263672, "global_step": 120813, "epoch": 2876} {"train_loss": -6.7006096839904785, "global_step": 120814, "epoch": 2876} {"train_loss": -6.654173851013184, "global_step": 120815, "epoch": 2876} {"train_loss": -6.598136901855469, "global_step": 120816, "epoch": 2876} {"train_loss": -6.484683036804199, "global_step": 120817, "epoch": 2876} {"train_loss": -6.615368843078613, "global_step": 120818, "epoch": 2876} {"train_loss": -6.628333568572998, "global_step": 120819, "epoch": 2876} {"train_loss": -6.5318756103515625, "global_step": 120820, "epoch": 2876} {"train_loss": -6.387850761413574, "global_step": 120821, "epoch": 2876} {"train_loss": -6.617428779602051, "global_step": 120822, "epoch": 2876} {"train_loss": -6.4869914054870605, "global_step": 120823, "epoch": 2876} {"train_loss": -6.54294490814209, "global_step": 120824, "epoch": 2876} {"train_loss": -6.532523155212402, "global_step": 120825, "epoch": 2876} {"train_loss": -6.513721466064453, "global_step": 120826, "epoch": 2876} {"train_loss": -6.581879615783691, "global_step": 120827, "epoch": 2876} {"train_loss": -6.5352783203125, "global_step": 120828, "epoch": 2876} {"train_loss": -6.5102620124816895, "global_step": 120829, "epoch": 2876} {"train_loss": -6.5708770751953125, "global_step": 120830, "epoch": 2876} {"train_loss": -6.629482746124268, "global_step": 120831, "epoch": 2876} {"train_loss": -6.70451545715332, "global_step": 120832, "epoch": 2876} {"train_loss": -6.582218851361956, "global_step": 120833, "epoch": 2876, "val_loss": 77130.1640625} {"train_loss": -6.7449541091918945, "global_step": 120834, "epoch": 2877} {"train_loss": -6.594228744506836, "global_step": 120835, "epoch": 2877} {"train_loss": -6.62336540222168, "global_step": 120836, "epoch": 2877} {"train_loss": -6.642745018005371, "global_step": 120837, "epoch": 2877} {"train_loss": -6.484134674072266, "global_step": 120838, "epoch": 2877} {"train_loss": -6.501141548156738, "global_step": 120839, "epoch": 2877} {"train_loss": -6.541092872619629, "global_step": 120840, "epoch": 2877} {"train_loss": -6.3666672706604, "global_step": 120841, "epoch": 2877} {"train_loss": -6.501023292541504, "global_step": 120842, "epoch": 2877} {"train_loss": -6.46433162689209, "global_step": 120843, "epoch": 2877} {"train_loss": -6.494095325469971, "global_step": 120844, "epoch": 2877} {"train_loss": -6.546980857849121, "global_step": 120845, "epoch": 2877} {"train_loss": -6.451518535614014, "global_step": 120846, "epoch": 2877} {"train_loss": -6.506237030029297, "global_step": 120847, "epoch": 2877} {"train_loss": -6.654158115386963, "global_step": 120848, "epoch": 2877} {"train_loss": -6.588490009307861, "global_step": 120849, "epoch": 2877} {"train_loss": -6.6051788330078125, "global_step": 120850, "epoch": 2877} {"train_loss": -6.518926620483398, "global_step": 120851, "epoch": 2877} {"train_loss": -6.6518120765686035, "global_step": 120852, "epoch": 2877} {"train_loss": -6.6724138259887695, "global_step": 120853, "epoch": 2877} {"train_loss": -6.46882963180542, "global_step": 120854, "epoch": 2877} {"train_loss": -6.5303239822387695, "global_step": 120855, "epoch": 2877} {"train_loss": -6.489521026611328, "global_step": 120856, "epoch": 2877} {"train_loss": -6.644567489624023, "global_step": 120857, "epoch": 2877} {"train_loss": -6.473093032836914, "global_step": 120858, "epoch": 2877} {"train_loss": -6.605639457702637, "global_step": 120859, "epoch": 2877} {"train_loss": -6.595865726470947, "global_step": 120860, "epoch": 2877} {"train_loss": -6.449443817138672, "global_step": 120861, "epoch": 2877} {"train_loss": -6.440279006958008, "global_step": 120862, "epoch": 2877} {"train_loss": -6.53554630279541, "global_step": 120863, "epoch": 2877} {"train_loss": -6.455374717712402, "global_step": 120864, "epoch": 2877} {"train_loss": -6.376216888427734, "global_step": 120865, "epoch": 2877} {"train_loss": -6.497969627380371, "global_step": 120866, "epoch": 2877} {"train_loss": -6.331694602966309, "global_step": 120867, "epoch": 2877} {"train_loss": -6.583498954772949, "global_step": 120868, "epoch": 2877} {"train_loss": -6.60069465637207, "global_step": 120869, "epoch": 2877} {"train_loss": -6.478799343109131, "global_step": 120870, "epoch": 2877} {"train_loss": -6.523530960083008, "global_step": 120871, "epoch": 2877} {"train_loss": -6.410576820373535, "global_step": 120872, "epoch": 2877} {"train_loss": -6.66928768157959, "global_step": 120873, "epoch": 2877} {"train_loss": -6.578117847442627, "global_step": 120874, "epoch": 2877} {"train_loss": -6.533549831027076, "global_step": 120875, "epoch": 2877, "val_loss": 77054.7578125} {"train_loss": -6.608891487121582, "global_step": 120876, "epoch": 2878} {"train_loss": -6.575071334838867, "global_step": 120877, "epoch": 2878} {"train_loss": -6.545055389404297, "global_step": 120878, "epoch": 2878} {"train_loss": -6.5558671951293945, "global_step": 120879, "epoch": 2878} {"train_loss": -6.595000267028809, "global_step": 120880, "epoch": 2878} {"train_loss": -6.666264057159424, "global_step": 120881, "epoch": 2878} {"train_loss": -6.6641645431518555, "global_step": 120882, "epoch": 2878} {"train_loss": -6.528250694274902, "global_step": 120883, "epoch": 2878} {"train_loss": -6.457832336425781, "global_step": 120884, "epoch": 2878} {"train_loss": -6.506770133972168, "global_step": 120885, "epoch": 2878} {"train_loss": -6.546955108642578, "global_step": 120886, "epoch": 2878} {"train_loss": -6.620739936828613, "global_step": 120887, "epoch": 2878} {"train_loss": -6.402198791503906, "global_step": 120888, "epoch": 2878} {"train_loss": -6.574093341827393, "global_step": 120889, "epoch": 2878} {"train_loss": -6.633133888244629, "global_step": 120890, "epoch": 2878} {"train_loss": -6.333955764770508, "global_step": 120891, "epoch": 2878} {"train_loss": -6.563663005828857, "global_step": 120892, "epoch": 2878} {"train_loss": -6.657561779022217, "global_step": 120893, "epoch": 2878} {"train_loss": -6.482151031494141, "global_step": 120894, "epoch": 2878} {"train_loss": -6.480349540710449, "global_step": 120895, "epoch": 2878} {"train_loss": -6.589746952056885, "global_step": 120896, "epoch": 2878} {"train_loss": -6.6046881675720215, "global_step": 120897, "epoch": 2878} {"train_loss": -6.61478853225708, "global_step": 120898, "epoch": 2878} {"train_loss": -6.489161014556885, "global_step": 120899, "epoch": 2878} {"train_loss": -6.539504051208496, "global_step": 120900, "epoch": 2878} {"train_loss": -6.650620937347412, "global_step": 120901, "epoch": 2878} {"train_loss": -6.624950885772705, "global_step": 120902, "epoch": 2878} {"train_loss": -6.58387565612793, "global_step": 120903, "epoch": 2878} {"train_loss": -6.47730016708374, "global_step": 120904, "epoch": 2878} {"train_loss": -6.5517988204956055, "global_step": 120905, "epoch": 2878} {"train_loss": -6.5575714111328125, "global_step": 120906, "epoch": 2878} {"train_loss": -6.657421112060547, "global_step": 120907, "epoch": 2878} {"train_loss": -6.46381950378418, "global_step": 120908, "epoch": 2878} {"train_loss": -6.6515913009643555, "global_step": 120909, "epoch": 2878} {"train_loss": -6.519740104675293, "global_step": 120910, "epoch": 2878} {"train_loss": -6.4744415283203125, "global_step": 120911, "epoch": 2878} {"train_loss": -6.621274948120117, "global_step": 120912, "epoch": 2878} {"train_loss": -6.488134384155273, "global_step": 120913, "epoch": 2878} {"train_loss": -6.580092906951904, "global_step": 120914, "epoch": 2878} {"train_loss": -6.454960823059082, "global_step": 120915, "epoch": 2878} {"train_loss": -6.649569988250732, "global_step": 120916, "epoch": 2878} {"train_loss": -6.556539058685303, "global_step": 120917, "epoch": 2878, "val_loss": 76976.3984375} {"train_loss": -6.609267234802246, "global_step": 120918, "epoch": 2879} {"train_loss": -6.598628044128418, "global_step": 120919, "epoch": 2879} {"train_loss": -6.6425957679748535, "global_step": 120920, "epoch": 2879} {"train_loss": -6.6703691482543945, "global_step": 120921, "epoch": 2879} {"train_loss": -6.602228164672852, "global_step": 120922, "epoch": 2879} {"train_loss": -6.5961384773254395, "global_step": 120923, "epoch": 2879} {"train_loss": -6.559610366821289, "global_step": 120924, "epoch": 2879} {"train_loss": -6.652799606323242, "global_step": 120925, "epoch": 2879} {"train_loss": -6.582925796508789, "global_step": 120926, "epoch": 2879} {"train_loss": -6.625632286071777, "global_step": 120927, "epoch": 2879} {"train_loss": -6.593703269958496, "global_step": 120928, "epoch": 2879} {"train_loss": -6.701714038848877, "global_step": 120929, "epoch": 2879} {"train_loss": -6.688346862792969, "global_step": 120930, "epoch": 2879} {"train_loss": -6.640986442565918, "global_step": 120931, "epoch": 2879} {"train_loss": -6.711949348449707, "global_step": 120932, "epoch": 2879} {"train_loss": -6.4144368171691895, "global_step": 120933, "epoch": 2879} {"train_loss": -6.613179683685303, "global_step": 120934, "epoch": 2879} {"train_loss": -6.512283802032471, "global_step": 120935, "epoch": 2879} {"train_loss": -6.397861003875732, "global_step": 120936, "epoch": 2879} {"train_loss": -6.548828601837158, "global_step": 120937, "epoch": 2879} {"train_loss": -6.421140670776367, "global_step": 120938, "epoch": 2879} {"train_loss": -6.5478010177612305, "global_step": 120939, "epoch": 2879} {"train_loss": -6.567570686340332, "global_step": 120940, "epoch": 2879} {"train_loss": -6.432028293609619, "global_step": 120941, "epoch": 2879} {"train_loss": -6.517523765563965, "global_step": 120942, "epoch": 2879} {"train_loss": -6.439728736877441, "global_step": 120943, "epoch": 2879} {"train_loss": -6.452031135559082, "global_step": 120944, "epoch": 2879} {"train_loss": -6.627553462982178, "global_step": 120945, "epoch": 2879} {"train_loss": -6.337765216827393, "global_step": 120946, "epoch": 2879} {"train_loss": -6.533323287963867, "global_step": 120947, "epoch": 2879} {"train_loss": -6.385224342346191, "global_step": 120948, "epoch": 2879} {"train_loss": -6.509503364562988, "global_step": 120949, "epoch": 2879} {"train_loss": -6.302666664123535, "global_step": 120950, "epoch": 2879} {"train_loss": -6.473197937011719, "global_step": 120951, "epoch": 2879} {"train_loss": -6.344968795776367, "global_step": 120952, "epoch": 2879} {"train_loss": -6.4916300773620605, "global_step": 120953, "epoch": 2879} {"train_loss": -6.417736053466797, "global_step": 120954, "epoch": 2879} {"train_loss": -6.430201053619385, "global_step": 120955, "epoch": 2879} {"train_loss": -6.479151725769043, "global_step": 120956, "epoch": 2879} {"train_loss": -6.483237266540527, "global_step": 120957, "epoch": 2879} {"train_loss": -6.570336818695068, "global_step": 120958, "epoch": 2879} {"train_loss": -6.530099709828694, "global_step": 120959, "epoch": 2879, "val_loss": 77052.7578125} {"train_loss": -6.4859185218811035, "global_step": 120960, "epoch": 2880} {"train_loss": -6.511760711669922, "global_step": 120961, "epoch": 2880} {"train_loss": -6.572962284088135, "global_step": 120962, "epoch": 2880} {"train_loss": -6.508334159851074, "global_step": 120963, "epoch": 2880} {"train_loss": -6.568931579589844, "global_step": 120964, "epoch": 2880} {"train_loss": -6.5251240730285645, "global_step": 120965, "epoch": 2880} {"train_loss": -6.653159141540527, "global_step": 120966, "epoch": 2880} {"train_loss": -6.500069618225098, "global_step": 120967, "epoch": 2880} {"train_loss": -6.6099348068237305, "global_step": 120968, "epoch": 2880} {"train_loss": -6.629306316375732, "global_step": 120969, "epoch": 2880} {"train_loss": -6.561707496643066, "global_step": 120970, "epoch": 2880} {"train_loss": -6.594119071960449, "global_step": 120971, "epoch": 2880} {"train_loss": -6.618280410766602, "global_step": 120972, "epoch": 2880} {"train_loss": -6.606226921081543, "global_step": 120973, "epoch": 2880} {"train_loss": -6.492071628570557, "global_step": 120974, "epoch": 2880} {"train_loss": -6.537324905395508, "global_step": 120975, "epoch": 2880} {"train_loss": -6.589632987976074, "global_step": 120976, "epoch": 2880} {"train_loss": -6.5294342041015625, "global_step": 120977, "epoch": 2880} {"train_loss": -6.6627960205078125, "global_step": 120978, "epoch": 2880} {"train_loss": -6.617984294891357, "global_step": 120979, "epoch": 2880} {"train_loss": -6.675148010253906, "global_step": 120980, "epoch": 2880} {"train_loss": -6.531772613525391, "global_step": 120981, "epoch": 2880} {"train_loss": -6.517642498016357, "global_step": 120982, "epoch": 2880} {"train_loss": -6.675899505615234, "global_step": 120983, "epoch": 2880} {"train_loss": -6.577818870544434, "global_step": 120984, "epoch": 2880} {"train_loss": -6.564130783081055, "global_step": 120985, "epoch": 2880} {"train_loss": -6.482461452484131, "global_step": 120986, "epoch": 2880} {"train_loss": -6.589537620544434, "global_step": 120987, "epoch": 2880} {"train_loss": -6.465232849121094, "global_step": 120988, "epoch": 2880} {"train_loss": -6.580748558044434, "global_step": 120989, "epoch": 2880} {"train_loss": -6.644847869873047, "global_step": 120990, "epoch": 2880} {"train_loss": -6.668534278869629, "global_step": 120991, "epoch": 2880} {"train_loss": -6.621325492858887, "global_step": 120992, "epoch": 2880} {"train_loss": -6.491415023803711, "global_step": 120993, "epoch": 2880} {"train_loss": -6.595528602600098, "global_step": 120994, "epoch": 2880} {"train_loss": -6.62777042388916, "global_step": 120995, "epoch": 2880} {"train_loss": -6.520235061645508, "global_step": 120996, "epoch": 2880} {"train_loss": -6.620316505432129, "global_step": 120997, "epoch": 2880} {"train_loss": -6.696859359741211, "global_step": 120998, "epoch": 2880} {"train_loss": -6.687775135040283, "global_step": 120999, "epoch": 2880} {"train_loss": -6.537860870361328, "global_step": 121000, "epoch": 2880} {"train_loss": -6.581464960461571, "global_step": 121001, "epoch": 2880, "val_loss": 76827.90625} {"train_loss": -6.516599655151367, "global_step": 121002, "epoch": 2881} {"train_loss": -6.687440872192383, "global_step": 121003, "epoch": 2881} {"train_loss": -6.623354434967041, "global_step": 121004, "epoch": 2881} {"train_loss": -6.60675048828125, "global_step": 121005, "epoch": 2881} {"train_loss": -6.639851093292236, "global_step": 121006, "epoch": 2881} {"train_loss": -6.498337745666504, "global_step": 121007, "epoch": 2881} {"train_loss": -6.697004318237305, "global_step": 121008, "epoch": 2881} {"train_loss": -6.520106315612793, "global_step": 121009, "epoch": 2881} {"train_loss": -6.6883544921875, "global_step": 121010, "epoch": 2881} {"train_loss": -6.50111198425293, "global_step": 121011, "epoch": 2881} {"train_loss": -6.6868438720703125, "global_step": 121012, "epoch": 2881} {"train_loss": -6.529937744140625, "global_step": 121013, "epoch": 2881} {"train_loss": -6.652750015258789, "global_step": 121014, "epoch": 2881} {"train_loss": -6.575090408325195, "global_step": 121015, "epoch": 2881} {"train_loss": -6.595407962799072, "global_step": 121016, "epoch": 2881} {"train_loss": -6.491140365600586, "global_step": 121017, "epoch": 2881} {"train_loss": -6.691051006317139, "global_step": 121018, "epoch": 2881} {"train_loss": -6.548828601837158, "global_step": 121019, "epoch": 2881} {"train_loss": -6.66592264175415, "global_step": 121020, "epoch": 2881} {"train_loss": -6.512319564819336, "global_step": 121021, "epoch": 2881} {"train_loss": -6.655999660491943, "global_step": 121022, "epoch": 2881} {"train_loss": -6.555670738220215, "global_step": 121023, "epoch": 2881} {"train_loss": -6.623157501220703, "global_step": 121024, "epoch": 2881} {"train_loss": -6.578736305236816, "global_step": 121025, "epoch": 2881} {"train_loss": -6.604806900024414, "global_step": 121026, "epoch": 2881} {"train_loss": -6.4631853103637695, "global_step": 121027, "epoch": 2881} {"train_loss": -6.599893569946289, "global_step": 121028, "epoch": 2881} {"train_loss": -6.559903621673584, "global_step": 121029, "epoch": 2881} {"train_loss": -6.550330638885498, "global_step": 121030, "epoch": 2881} {"train_loss": -6.642041206359863, "global_step": 121031, "epoch": 2881} {"train_loss": -6.548948287963867, "global_step": 121032, "epoch": 2881} {"train_loss": -6.586667060852051, "global_step": 121033, "epoch": 2881} {"train_loss": -6.686272621154785, "global_step": 121034, "epoch": 2881} {"train_loss": -6.558141708374023, "global_step": 121035, "epoch": 2881} {"train_loss": -6.564014434814453, "global_step": 121036, "epoch": 2881} {"train_loss": -6.509433269500732, "global_step": 121037, "epoch": 2881} {"train_loss": -6.519932270050049, "global_step": 121038, "epoch": 2881} {"train_loss": -6.602850914001465, "global_step": 121039, "epoch": 2881} {"train_loss": -6.5449934005737305, "global_step": 121040, "epoch": 2881} {"train_loss": -6.586857795715332, "global_step": 121041, "epoch": 2881} {"train_loss": -6.546943664550781, "global_step": 121042, "epoch": 2881} {"train_loss": -6.584019252232143, "global_step": 121043, "epoch": 2881, "val_loss": 76943.9609375} {"train_loss": -6.561098575592041, "global_step": 121044, "epoch": 2882} {"train_loss": -6.660653591156006, "global_step": 121045, "epoch": 2882} {"train_loss": -6.570988655090332, "global_step": 121046, "epoch": 2882} {"train_loss": -6.532381057739258, "global_step": 121047, "epoch": 2882} {"train_loss": -6.557096004486084, "global_step": 121048, "epoch": 2882} {"train_loss": -6.562908172607422, "global_step": 121049, "epoch": 2882} {"train_loss": -6.466401100158691, "global_step": 121050, "epoch": 2882} {"train_loss": -6.614814281463623, "global_step": 121051, "epoch": 2882} {"train_loss": -6.514781951904297, "global_step": 121052, "epoch": 2882} {"train_loss": -6.638472557067871, "global_step": 121053, "epoch": 2882} {"train_loss": -6.567327499389648, "global_step": 121054, "epoch": 2882} {"train_loss": -6.532474040985107, "global_step": 121055, "epoch": 2882} {"train_loss": -6.625458240509033, "global_step": 121056, "epoch": 2882} {"train_loss": -6.65254020690918, "global_step": 121057, "epoch": 2882} {"train_loss": -6.601055145263672, "global_step": 121058, "epoch": 2882} {"train_loss": -6.524483680725098, "global_step": 121059, "epoch": 2882} {"train_loss": -6.656589984893799, "global_step": 121060, "epoch": 2882} {"train_loss": -6.68099308013916, "global_step": 121061, "epoch": 2882} {"train_loss": -6.54817008972168, "global_step": 121062, "epoch": 2882} {"train_loss": -6.513346195220947, "global_step": 121063, "epoch": 2882} {"train_loss": -6.516651153564453, "global_step": 121064, "epoch": 2882} {"train_loss": -6.509795188903809, "global_step": 121065, "epoch": 2882} {"train_loss": -6.692941665649414, "global_step": 121066, "epoch": 2882} {"train_loss": -6.582542896270752, "global_step": 121067, "epoch": 2882} {"train_loss": -6.552448749542236, "global_step": 121068, "epoch": 2882} {"train_loss": -6.493011474609375, "global_step": 121069, "epoch": 2882} {"train_loss": -6.627242565155029, "global_step": 121070, "epoch": 2882} {"train_loss": -6.458606243133545, "global_step": 121071, "epoch": 2882} {"train_loss": -6.458357810974121, "global_step": 121072, "epoch": 2882} {"train_loss": -6.514373779296875, "global_step": 121073, "epoch": 2882} {"train_loss": -6.611733436584473, "global_step": 121074, "epoch": 2882} {"train_loss": -6.583623886108398, "global_step": 121075, "epoch": 2882} {"train_loss": -6.481644630432129, "global_step": 121076, "epoch": 2882} {"train_loss": -6.547745704650879, "global_step": 121077, "epoch": 2882} {"train_loss": -6.619441986083984, "global_step": 121078, "epoch": 2882} {"train_loss": -6.545477867126465, "global_step": 121079, "epoch": 2882} {"train_loss": -6.552393913269043, "global_step": 121080, "epoch": 2882} {"train_loss": -6.6653289794921875, "global_step": 121081, "epoch": 2882} {"train_loss": -6.573312759399414, "global_step": 121082, "epoch": 2882} {"train_loss": -6.5242156982421875, "global_step": 121083, "epoch": 2882} {"train_loss": -6.450305938720703, "global_step": 121084, "epoch": 2882} {"train_loss": -6.565929776146298, "global_step": 121085, "epoch": 2882, "val_loss": 77075.7421875} {"train_loss": -6.702242851257324, "global_step": 121086, "epoch": 2883} {"train_loss": -6.58062219619751, "global_step": 121087, "epoch": 2883} {"train_loss": -6.599407196044922, "global_step": 121088, "epoch": 2883} {"train_loss": -6.699932098388672, "global_step": 121089, "epoch": 2883} {"train_loss": -6.5982818603515625, "global_step": 121090, "epoch": 2883} {"train_loss": -6.721432685852051, "global_step": 121091, "epoch": 2883} {"train_loss": -6.639118671417236, "global_step": 121092, "epoch": 2883} {"train_loss": -6.627378463745117, "global_step": 121093, "epoch": 2883} {"train_loss": -6.532024383544922, "global_step": 121094, "epoch": 2883} {"train_loss": -6.625485420227051, "global_step": 121095, "epoch": 2883} {"train_loss": -6.598576545715332, "global_step": 121096, "epoch": 2883} {"train_loss": -6.585862636566162, "global_step": 121097, "epoch": 2883} {"train_loss": -6.5812578201293945, "global_step": 121098, "epoch": 2883} {"train_loss": -6.662691116333008, "global_step": 121099, "epoch": 2883} {"train_loss": -6.6604461669921875, "global_step": 121100, "epoch": 2883} {"train_loss": -6.601426124572754, "global_step": 121101, "epoch": 2883} {"train_loss": -6.617306232452393, "global_step": 121102, "epoch": 2883} {"train_loss": -6.638767242431641, "global_step": 121103, "epoch": 2883} {"train_loss": -6.537837982177734, "global_step": 121104, "epoch": 2883} {"train_loss": -6.514706611633301, "global_step": 121105, "epoch": 2883} {"train_loss": -6.533492565155029, "global_step": 121106, "epoch": 2883} {"train_loss": -6.456347465515137, "global_step": 121107, "epoch": 2883} {"train_loss": -6.502366065979004, "global_step": 121108, "epoch": 2883} {"train_loss": -6.619786262512207, "global_step": 121109, "epoch": 2883} {"train_loss": -6.570875644683838, "global_step": 121110, "epoch": 2883} {"train_loss": -6.529488563537598, "global_step": 121111, "epoch": 2883} {"train_loss": -6.6444091796875, "global_step": 121112, "epoch": 2883} {"train_loss": -6.454995155334473, "global_step": 121113, "epoch": 2883} {"train_loss": -6.503046989440918, "global_step": 121114, "epoch": 2883} {"train_loss": -6.520552158355713, "global_step": 121115, "epoch": 2883} {"train_loss": -6.58458948135376, "global_step": 121116, "epoch": 2883} {"train_loss": -6.42635440826416, "global_step": 121117, "epoch": 2883} {"train_loss": -6.46529483795166, "global_step": 121118, "epoch": 2883} {"train_loss": -6.418304443359375, "global_step": 121119, "epoch": 2883} {"train_loss": -6.689966201782227, "global_step": 121120, "epoch": 2883} {"train_loss": -6.451014995574951, "global_step": 121121, "epoch": 2883} {"train_loss": -6.508916854858398, "global_step": 121122, "epoch": 2883} {"train_loss": -6.627411365509033, "global_step": 121123, "epoch": 2883} {"train_loss": -6.454245567321777, "global_step": 121124, "epoch": 2883} {"train_loss": -6.648309707641602, "global_step": 121125, "epoch": 2883} {"train_loss": -6.511806964874268, "global_step": 121126, "epoch": 2883} {"train_loss": -6.571838583265032, "global_step": 121127, "epoch": 2883, "val_loss": 76664.2109375} {"train_loss": -6.576276779174805, "global_step": 121128, "epoch": 2884} {"train_loss": -6.614280700683594, "global_step": 121129, "epoch": 2884} {"train_loss": -6.6673431396484375, "global_step": 121130, "epoch": 2884} {"train_loss": -6.561601638793945, "global_step": 121131, "epoch": 2884} {"train_loss": -6.597596168518066, "global_step": 121132, "epoch": 2884} {"train_loss": -6.449354648590088, "global_step": 121133, "epoch": 2884} {"train_loss": -6.510611534118652, "global_step": 121134, "epoch": 2884} {"train_loss": -6.576912879943848, "global_step": 121135, "epoch": 2884} {"train_loss": -6.494232177734375, "global_step": 121136, "epoch": 2884} {"train_loss": -6.598719596862793, "global_step": 121137, "epoch": 2884} {"train_loss": -6.610615253448486, "global_step": 121138, "epoch": 2884} {"train_loss": -6.597569465637207, "global_step": 121139, "epoch": 2884} {"train_loss": -6.4634809494018555, "global_step": 121140, "epoch": 2884} {"train_loss": -6.657182693481445, "global_step": 121141, "epoch": 2884} {"train_loss": -6.5713791847229, "global_step": 121142, "epoch": 2884} {"train_loss": -6.640456676483154, "global_step": 121143, "epoch": 2884} {"train_loss": -6.58735990524292, "global_step": 121144, "epoch": 2884} {"train_loss": -6.498400688171387, "global_step": 121145, "epoch": 2884} {"train_loss": -6.470591068267822, "global_step": 121146, "epoch": 2884} {"train_loss": -6.5511155128479, "global_step": 121147, "epoch": 2884} {"train_loss": -6.631170272827148, "global_step": 121148, "epoch": 2884} {"train_loss": -6.601842880249023, "global_step": 121149, "epoch": 2884} {"train_loss": -6.572720050811768, "global_step": 121150, "epoch": 2884} {"train_loss": -6.488553047180176, "global_step": 121151, "epoch": 2884} {"train_loss": -6.64517879486084, "global_step": 121152, "epoch": 2884} {"train_loss": -6.469701290130615, "global_step": 121153, "epoch": 2884} {"train_loss": -6.490966796875, "global_step": 121154, "epoch": 2884} {"train_loss": -6.6972761154174805, "global_step": 121155, "epoch": 2884} {"train_loss": -6.721856594085693, "global_step": 121156, "epoch": 2884} {"train_loss": -6.689853668212891, "global_step": 121157, "epoch": 2884} {"train_loss": -6.526608943939209, "global_step": 121158, "epoch": 2884} {"train_loss": -6.6747050285339355, "global_step": 121159, "epoch": 2884} {"train_loss": -6.636545658111572, "global_step": 121160, "epoch": 2884} {"train_loss": -6.461751937866211, "global_step": 121161, "epoch": 2884} {"train_loss": -6.622182369232178, "global_step": 121162, "epoch": 2884} {"train_loss": -6.570491790771484, "global_step": 121163, "epoch": 2884} {"train_loss": -6.506681442260742, "global_step": 121164, "epoch": 2884} {"train_loss": -6.602424621582031, "global_step": 121165, "epoch": 2884} {"train_loss": -6.496599197387695, "global_step": 121166, "epoch": 2884} {"train_loss": -6.722455978393555, "global_step": 121167, "epoch": 2884} {"train_loss": -6.543281078338623, "global_step": 121168, "epoch": 2884} {"train_loss": -6.574623562040783, "global_step": 121169, "epoch": 2884, "val_loss": 77012.359375} {"train_loss": -6.5806779861450195, "global_step": 121170, "epoch": 2885} {"train_loss": -6.638894081115723, "global_step": 121171, "epoch": 2885} {"train_loss": -6.572915077209473, "global_step": 121172, "epoch": 2885} {"train_loss": -6.650119781494141, "global_step": 121173, "epoch": 2885} {"train_loss": -6.675815582275391, "global_step": 121174, "epoch": 2885} {"train_loss": -6.504236698150635, "global_step": 121175, "epoch": 2885} {"train_loss": -6.511204719543457, "global_step": 121176, "epoch": 2885} {"train_loss": -6.629001617431641, "global_step": 121177, "epoch": 2885} {"train_loss": -6.479394435882568, "global_step": 121178, "epoch": 2885} {"train_loss": -6.418335914611816, "global_step": 121179, "epoch": 2885} {"train_loss": -6.598211288452148, "global_step": 121180, "epoch": 2885} {"train_loss": -6.559076309204102, "global_step": 121181, "epoch": 2885} {"train_loss": -6.407550811767578, "global_step": 121182, "epoch": 2885} {"train_loss": -6.571866512298584, "global_step": 121183, "epoch": 2885} {"train_loss": -6.426141738891602, "global_step": 121184, "epoch": 2885} {"train_loss": -6.4941816329956055, "global_step": 121185, "epoch": 2885} {"train_loss": -6.357841491699219, "global_step": 121186, "epoch": 2885} {"train_loss": -6.621348857879639, "global_step": 121187, "epoch": 2885} {"train_loss": -6.412572860717773, "global_step": 121188, "epoch": 2885} {"train_loss": -6.512885093688965, "global_step": 121189, "epoch": 2885} {"train_loss": -6.636340141296387, "global_step": 121190, "epoch": 2885} {"train_loss": -6.596169948577881, "global_step": 121191, "epoch": 2885} {"train_loss": -6.550050735473633, "global_step": 121192, "epoch": 2885} {"train_loss": -6.351743698120117, "global_step": 121193, "epoch": 2885} {"train_loss": -6.667876243591309, "global_step": 121194, "epoch": 2885} {"train_loss": -6.501892566680908, "global_step": 121195, "epoch": 2885} {"train_loss": -6.590758800506592, "global_step": 121196, "epoch": 2885} {"train_loss": -6.4589619636535645, "global_step": 121197, "epoch": 2885} {"train_loss": -6.489272594451904, "global_step": 121198, "epoch": 2885} {"train_loss": -6.531408309936523, "global_step": 121199, "epoch": 2885} {"train_loss": -6.4646148681640625, "global_step": 121200, "epoch": 2885} {"train_loss": -6.449926376342773, "global_step": 121201, "epoch": 2885} {"train_loss": -6.587850570678711, "global_step": 121202, "epoch": 2885} {"train_loss": -6.451177597045898, "global_step": 121203, "epoch": 2885} {"train_loss": -6.551548957824707, "global_step": 121204, "epoch": 2885} {"train_loss": -6.654843330383301, "global_step": 121205, "epoch": 2885} {"train_loss": -6.4737629890441895, "global_step": 121206, "epoch": 2885} {"train_loss": -6.535397529602051, "global_step": 121207, "epoch": 2885} {"train_loss": -6.632007598876953, "global_step": 121208, "epoch": 2885} {"train_loss": -6.614603042602539, "global_step": 121209, "epoch": 2885} {"train_loss": -6.623315334320068, "global_step": 121210, "epoch": 2885} {"train_loss": -6.537605035872686, "global_step": 121211, "epoch": 2885, "val_loss": 76985.859375} {"train_loss": -6.586743354797363, "global_step": 121212, "epoch": 2886} {"train_loss": -6.526196479797363, "global_step": 121213, "epoch": 2886} {"train_loss": -6.659885406494141, "global_step": 121214, "epoch": 2886} {"train_loss": -6.647605895996094, "global_step": 121215, "epoch": 2886} {"train_loss": -6.58663272857666, "global_step": 121216, "epoch": 2886} {"train_loss": -6.539763450622559, "global_step": 121217, "epoch": 2886} {"train_loss": -6.496370792388916, "global_step": 121218, "epoch": 2886} {"train_loss": -6.491549015045166, "global_step": 121219, "epoch": 2886} {"train_loss": -6.547407150268555, "global_step": 121220, "epoch": 2886} {"train_loss": -6.589182376861572, "global_step": 121221, "epoch": 2886} {"train_loss": -6.595712661743164, "global_step": 121222, "epoch": 2886} {"train_loss": -6.6375813484191895, "global_step": 121223, "epoch": 2886} {"train_loss": -6.498260021209717, "global_step": 121224, "epoch": 2886} {"train_loss": -6.497086524963379, "global_step": 121225, "epoch": 2886} {"train_loss": -6.522568225860596, "global_step": 121226, "epoch": 2886} {"train_loss": -6.5937089920043945, "global_step": 121227, "epoch": 2886} {"train_loss": -6.608917236328125, "global_step": 121228, "epoch": 2886} {"train_loss": -6.476452827453613, "global_step": 121229, "epoch": 2886} {"train_loss": -6.488134384155273, "global_step": 121230, "epoch": 2886} {"train_loss": -6.5489888191223145, "global_step": 121231, "epoch": 2886} {"train_loss": -6.612664222717285, "global_step": 121232, "epoch": 2886} {"train_loss": -6.524631023406982, "global_step": 121233, "epoch": 2886} {"train_loss": -6.551583766937256, "global_step": 121234, "epoch": 2886} {"train_loss": -6.596944808959961, "global_step": 121235, "epoch": 2886} {"train_loss": -6.59154748916626, "global_step": 121236, "epoch": 2886} {"train_loss": -6.604653358459473, "global_step": 121237, "epoch": 2886} {"train_loss": -6.6992106437683105, "global_step": 121238, "epoch": 2886} {"train_loss": -6.560670852661133, "global_step": 121239, "epoch": 2886} {"train_loss": -6.626689910888672, "global_step": 121240, "epoch": 2886} {"train_loss": -6.496513366699219, "global_step": 121241, "epoch": 2886} {"train_loss": -6.560891151428223, "global_step": 121242, "epoch": 2886} {"train_loss": -6.733469486236572, "global_step": 121243, "epoch": 2886} {"train_loss": -6.56035041809082, "global_step": 121244, "epoch": 2886} {"train_loss": -6.582326412200928, "global_step": 121245, "epoch": 2886} {"train_loss": -6.706204891204834, "global_step": 121246, "epoch": 2886} {"train_loss": -6.697826862335205, "global_step": 121247, "epoch": 2886} {"train_loss": -6.589427947998047, "global_step": 121248, "epoch": 2886} {"train_loss": -6.7015461921691895, "global_step": 121249, "epoch": 2886} {"train_loss": -6.645594120025635, "global_step": 121250, "epoch": 2886} {"train_loss": -6.566521167755127, "global_step": 121251, "epoch": 2886} {"train_loss": -6.452567100524902, "global_step": 121252, "epoch": 2886} {"train_loss": -6.580220483598255, "global_step": 121253, "epoch": 2886, "val_loss": 77218.09375} {"train_loss": -6.636390686035156, "global_step": 121254, "epoch": 2887} {"train_loss": -6.555857181549072, "global_step": 121255, "epoch": 2887} {"train_loss": -6.580507755279541, "global_step": 121256, "epoch": 2887} {"train_loss": -6.480704307556152, "global_step": 121257, "epoch": 2887} {"train_loss": -6.529864311218262, "global_step": 121258, "epoch": 2887} {"train_loss": -6.62053108215332, "global_step": 121259, "epoch": 2887} {"train_loss": -6.5308027267456055, "global_step": 121260, "epoch": 2887} {"train_loss": -6.366833209991455, "global_step": 121261, "epoch": 2887} {"train_loss": -6.584357261657715, "global_step": 121262, "epoch": 2887} {"train_loss": -6.534467697143555, "global_step": 121263, "epoch": 2887} {"train_loss": -6.626828670501709, "global_step": 121264, "epoch": 2887} {"train_loss": -6.6291913986206055, "global_step": 121265, "epoch": 2887} {"train_loss": -6.641529560089111, "global_step": 121266, "epoch": 2887} {"train_loss": -6.6181254386901855, "global_step": 121267, "epoch": 2887} {"train_loss": -6.643563270568848, "global_step": 121268, "epoch": 2887} {"train_loss": -6.524395942687988, "global_step": 121269, "epoch": 2887} {"train_loss": -6.495072364807129, "global_step": 121270, "epoch": 2887} {"train_loss": -6.538890838623047, "global_step": 121271, "epoch": 2887} {"train_loss": -6.622003555297852, "global_step": 121272, "epoch": 2887} {"train_loss": -6.546957969665527, "global_step": 121273, "epoch": 2887} {"train_loss": -6.548004150390625, "global_step": 121274, "epoch": 2887} {"train_loss": -6.581883430480957, "global_step": 121275, "epoch": 2887} {"train_loss": -6.527358055114746, "global_step": 121276, "epoch": 2887} {"train_loss": -6.520340919494629, "global_step": 121277, "epoch": 2887} {"train_loss": -6.586544990539551, "global_step": 121278, "epoch": 2887} {"train_loss": -6.570291996002197, "global_step": 121279, "epoch": 2887} {"train_loss": -6.501893520355225, "global_step": 121280, "epoch": 2887} {"train_loss": -6.584612846374512, "global_step": 121281, "epoch": 2887} {"train_loss": -6.5417633056640625, "global_step": 121282, "epoch": 2887} {"train_loss": -6.645317077636719, "global_step": 121283, "epoch": 2887} {"train_loss": -6.670314788818359, "global_step": 121284, "epoch": 2887} {"train_loss": -6.655219554901123, "global_step": 121285, "epoch": 2887} {"train_loss": -6.526361465454102, "global_step": 121286, "epoch": 2887} {"train_loss": -6.589587688446045, "global_step": 121287, "epoch": 2887} {"train_loss": -6.602190017700195, "global_step": 121288, "epoch": 2887} {"train_loss": -6.663622856140137, "global_step": 121289, "epoch": 2887} {"train_loss": -6.496265411376953, "global_step": 121290, "epoch": 2887} {"train_loss": -6.622077465057373, "global_step": 121291, "epoch": 2887} {"train_loss": -6.679800033569336, "global_step": 121292, "epoch": 2887} {"train_loss": -6.689098834991455, "global_step": 121293, "epoch": 2887} {"train_loss": -6.563388347625732, "global_step": 121294, "epoch": 2887} {"train_loss": -6.57814223425729, "global_step": 121295, "epoch": 2887, "val_loss": 76780.2421875} {"train_loss": -6.705188751220703, "global_step": 121296, "epoch": 2888} {"train_loss": -6.695796012878418, "global_step": 121297, "epoch": 2888} {"train_loss": -6.792093276977539, "global_step": 121298, "epoch": 2888} {"train_loss": -6.613620281219482, "global_step": 121299, "epoch": 2888} {"train_loss": -6.528685569763184, "global_step": 121300, "epoch": 2888} {"train_loss": -6.586919784545898, "global_step": 121301, "epoch": 2888} {"train_loss": -6.615962982177734, "global_step": 121302, "epoch": 2888} {"train_loss": -6.6773881912231445, "global_step": 121303, "epoch": 2888} {"train_loss": -6.580392360687256, "global_step": 121304, "epoch": 2888} {"train_loss": -6.694594383239746, "global_step": 121305, "epoch": 2888} {"train_loss": -6.539715766906738, "global_step": 121306, "epoch": 2888} {"train_loss": -6.614223480224609, "global_step": 121307, "epoch": 2888} {"train_loss": -6.60023832321167, "global_step": 121308, "epoch": 2888} {"train_loss": -6.5842132568359375, "global_step": 121309, "epoch": 2888} {"train_loss": -6.688515663146973, "global_step": 121310, "epoch": 2888} {"train_loss": -6.597991943359375, "global_step": 121311, "epoch": 2888} {"train_loss": -6.6336565017700195, "global_step": 121312, "epoch": 2888} {"train_loss": -6.7303290367126465, "global_step": 121313, "epoch": 2888} {"train_loss": -6.648591995239258, "global_step": 121314, "epoch": 2888} {"train_loss": -6.684109687805176, "global_step": 121315, "epoch": 2888} {"train_loss": -6.632312297821045, "global_step": 121316, "epoch": 2888} {"train_loss": -6.588555335998535, "global_step": 121317, "epoch": 2888} {"train_loss": -6.6668925285339355, "global_step": 121318, "epoch": 2888} {"train_loss": -6.67034387588501, "global_step": 121319, "epoch": 2888} {"train_loss": -6.641510486602783, "global_step": 121320, "epoch": 2888} {"train_loss": -6.672146797180176, "global_step": 121321, "epoch": 2888} {"train_loss": -6.679142951965332, "global_step": 121322, "epoch": 2888} {"train_loss": -6.550588130950928, "global_step": 121323, "epoch": 2888} {"train_loss": -6.5696916580200195, "global_step": 121324, "epoch": 2888} {"train_loss": -6.507948875427246, "global_step": 121325, "epoch": 2888} {"train_loss": -6.690374374389648, "global_step": 121326, "epoch": 2888} {"train_loss": -6.657895088195801, "global_step": 121327, "epoch": 2888} {"train_loss": -6.570818901062012, "global_step": 121328, "epoch": 2888} {"train_loss": -6.6031718254089355, "global_step": 121329, "epoch": 2888} {"train_loss": -6.5085601806640625, "global_step": 121330, "epoch": 2888} {"train_loss": -6.6031575202941895, "global_step": 121331, "epoch": 2888} {"train_loss": -6.470327377319336, "global_step": 121332, "epoch": 2888} {"train_loss": -6.538242816925049, "global_step": 121333, "epoch": 2888} {"train_loss": -6.526165962219238, "global_step": 121334, "epoch": 2888} {"train_loss": -6.543434143066406, "global_step": 121335, "epoch": 2888} {"train_loss": -6.480969429016113, "global_step": 121336, "epoch": 2888} {"train_loss": -6.61217094603039, "global_step": 121337, "epoch": 2888, "val_loss": 76584.890625} {"train_loss": -6.580637454986572, "global_step": 121338, "epoch": 2889} {"train_loss": -6.516695022583008, "global_step": 121339, "epoch": 2889} {"train_loss": -6.464779853820801, "global_step": 121340, "epoch": 2889} {"train_loss": -6.344468593597412, "global_step": 121341, "epoch": 2889} {"train_loss": -6.515215873718262, "global_step": 121342, "epoch": 2889} {"train_loss": -6.545504570007324, "global_step": 121343, "epoch": 2889} {"train_loss": -6.582252502441406, "global_step": 121344, "epoch": 2889} {"train_loss": -6.497560501098633, "global_step": 121345, "epoch": 2889} {"train_loss": -6.743197441101074, "global_step": 121346, "epoch": 2889} {"train_loss": -6.513812065124512, "global_step": 121347, "epoch": 2889} {"train_loss": -6.44511604309082, "global_step": 121348, "epoch": 2889} {"train_loss": -6.59556245803833, "global_step": 121349, "epoch": 2889} {"train_loss": -6.508501052856445, "global_step": 121350, "epoch": 2889} {"train_loss": -6.589491844177246, "global_step": 121351, "epoch": 2889} {"train_loss": -6.70663595199585, "global_step": 121352, "epoch": 2889} {"train_loss": -6.612737655639648, "global_step": 121353, "epoch": 2889} {"train_loss": -6.52171516418457, "global_step": 121354, "epoch": 2889} {"train_loss": -6.584198951721191, "global_step": 121355, "epoch": 2889} {"train_loss": -6.524036407470703, "global_step": 121356, "epoch": 2889} {"train_loss": -6.633370876312256, "global_step": 121357, "epoch": 2889} {"train_loss": -6.680978775024414, "global_step": 121358, "epoch": 2889} {"train_loss": -6.612302303314209, "global_step": 121359, "epoch": 2889} {"train_loss": -6.530209541320801, "global_step": 121360, "epoch": 2889} {"train_loss": -6.629573822021484, "global_step": 121361, "epoch": 2889} {"train_loss": -6.668992519378662, "global_step": 121362, "epoch": 2889} {"train_loss": -6.670019626617432, "global_step": 121363, "epoch": 2889} {"train_loss": -6.66422700881958, "global_step": 121364, "epoch": 2889} {"train_loss": -6.642699718475342, "global_step": 121365, "epoch": 2889} {"train_loss": -6.700845718383789, "global_step": 121366, "epoch": 2889} {"train_loss": -6.6595282554626465, "global_step": 121367, "epoch": 2889} {"train_loss": -6.522425651550293, "global_step": 121368, "epoch": 2889} {"train_loss": -6.539602756500244, "global_step": 121369, "epoch": 2889} {"train_loss": -6.468413829803467, "global_step": 121370, "epoch": 2889} {"train_loss": -6.618356704711914, "global_step": 121371, "epoch": 2889} {"train_loss": -6.639243125915527, "global_step": 121372, "epoch": 2889} {"train_loss": -6.544474124908447, "global_step": 121373, "epoch": 2889} {"train_loss": -6.618395805358887, "global_step": 121374, "epoch": 2889} {"train_loss": -6.701485633850098, "global_step": 121375, "epoch": 2889} {"train_loss": -6.503049850463867, "global_step": 121376, "epoch": 2889} {"train_loss": -6.568795204162598, "global_step": 121377, "epoch": 2889} {"train_loss": -6.547660827636719, "global_step": 121378, "epoch": 2889} {"train_loss": -6.575569323131016, "global_step": 121379, "epoch": 2889, "val_loss": 76843.0546875} {"train_loss": -6.635420799255371, "global_step": 121380, "epoch": 2890} {"train_loss": -6.444476127624512, "global_step": 121381, "epoch": 2890} {"train_loss": -6.509450912475586, "global_step": 121382, "epoch": 2890} {"train_loss": -6.626922607421875, "global_step": 121383, "epoch": 2890} {"train_loss": -6.41279411315918, "global_step": 121384, "epoch": 2890} {"train_loss": -6.691227912902832, "global_step": 121385, "epoch": 2890} {"train_loss": -6.500977516174316, "global_step": 121386, "epoch": 2890} {"train_loss": -6.676220417022705, "global_step": 121387, "epoch": 2890} {"train_loss": -6.542031764984131, "global_step": 121388, "epoch": 2890} {"train_loss": -6.524979591369629, "global_step": 121389, "epoch": 2890} {"train_loss": -6.569437026977539, "global_step": 121390, "epoch": 2890} {"train_loss": -6.464412212371826, "global_step": 121391, "epoch": 2890} {"train_loss": -6.624065399169922, "global_step": 121392, "epoch": 2890} {"train_loss": -6.559504508972168, "global_step": 121393, "epoch": 2890} {"train_loss": -6.5180559158325195, "global_step": 121394, "epoch": 2890} {"train_loss": -6.537962913513184, "global_step": 121395, "epoch": 2890} {"train_loss": -6.590376853942871, "global_step": 121396, "epoch": 2890} {"train_loss": -6.557587623596191, "global_step": 121397, "epoch": 2890} {"train_loss": -6.562254905700684, "global_step": 121398, "epoch": 2890} {"train_loss": -6.651083946228027, "global_step": 121399, "epoch": 2890} {"train_loss": -6.591581344604492, "global_step": 121400, "epoch": 2890} {"train_loss": -6.61248779296875, "global_step": 121401, "epoch": 2890} {"train_loss": -6.572261810302734, "global_step": 121402, "epoch": 2890} {"train_loss": -6.497922420501709, "global_step": 121403, "epoch": 2890} {"train_loss": -6.607116222381592, "global_step": 121404, "epoch": 2890} {"train_loss": -6.486696720123291, "global_step": 121405, "epoch": 2890} {"train_loss": -6.636116027832031, "global_step": 121406, "epoch": 2890} {"train_loss": -6.433349132537842, "global_step": 121407, "epoch": 2890} {"train_loss": -6.50937557220459, "global_step": 121408, "epoch": 2890} {"train_loss": -6.468388557434082, "global_step": 121409, "epoch": 2890} {"train_loss": -6.561196327209473, "global_step": 121410, "epoch": 2890} {"train_loss": -6.604854583740234, "global_step": 121411, "epoch": 2890} {"train_loss": -6.5293803215026855, "global_step": 121412, "epoch": 2890} {"train_loss": -6.493076324462891, "global_step": 121413, "epoch": 2890} {"train_loss": -6.520398139953613, "global_step": 121414, "epoch": 2890} {"train_loss": -6.553277492523193, "global_step": 121415, "epoch": 2890} {"train_loss": -6.575974464416504, "global_step": 121416, "epoch": 2890} {"train_loss": -6.463990688323975, "global_step": 121417, "epoch": 2890} {"train_loss": -6.4997148513793945, "global_step": 121418, "epoch": 2890} {"train_loss": -6.574896812438965, "global_step": 121419, "epoch": 2890} {"train_loss": -6.592520713806152, "global_step": 121420, "epoch": 2890} {"train_loss": -6.551636695861816, "global_step": 121421, "epoch": 2890, "val_loss": 77076.609375} {"train_loss": -6.485603332519531, "global_step": 121422, "epoch": 2891} {"train_loss": -6.483366966247559, "global_step": 121423, "epoch": 2891} {"train_loss": -6.657267093658447, "global_step": 121424, "epoch": 2891} {"train_loss": -6.455946922302246, "global_step": 121425, "epoch": 2891} {"train_loss": -6.615483283996582, "global_step": 121426, "epoch": 2891} {"train_loss": -6.584463119506836, "global_step": 121427, "epoch": 2891} {"train_loss": -6.613980293273926, "global_step": 121428, "epoch": 2891} {"train_loss": -6.5592145919799805, "global_step": 121429, "epoch": 2891} {"train_loss": -6.680451393127441, "global_step": 121430, "epoch": 2891} {"train_loss": -6.581639289855957, "global_step": 121431, "epoch": 2891} {"train_loss": -6.56770133972168, "global_step": 121432, "epoch": 2891} {"train_loss": -6.668087959289551, "global_step": 121433, "epoch": 2891} {"train_loss": -6.55492639541626, "global_step": 121434, "epoch": 2891} {"train_loss": -6.613192081451416, "global_step": 121435, "epoch": 2891} {"train_loss": -6.602795124053955, "global_step": 121436, "epoch": 2891} {"train_loss": -6.539858818054199, "global_step": 121437, "epoch": 2891} {"train_loss": -6.679553985595703, "global_step": 121438, "epoch": 2891} {"train_loss": -6.664718151092529, "global_step": 121439, "epoch": 2891} {"train_loss": -6.587525367736816, "global_step": 121440, "epoch": 2891} {"train_loss": -6.618880271911621, "global_step": 121441, "epoch": 2891} {"train_loss": -6.612715721130371, "global_step": 121442, "epoch": 2891} {"train_loss": -6.704110145568848, "global_step": 121443, "epoch": 2891} {"train_loss": -6.498732566833496, "global_step": 121444, "epoch": 2891} {"train_loss": -6.584328651428223, "global_step": 121445, "epoch": 2891} {"train_loss": -6.605665683746338, "global_step": 121446, "epoch": 2891} {"train_loss": -6.6988205909729, "global_step": 121447, "epoch": 2891} {"train_loss": -6.567730903625488, "global_step": 121448, "epoch": 2891} {"train_loss": -6.449724197387695, "global_step": 121449, "epoch": 2891} {"train_loss": -6.728555679321289, "global_step": 121450, "epoch": 2891} {"train_loss": -6.58233642578125, "global_step": 121451, "epoch": 2891} {"train_loss": -6.559654235839844, "global_step": 121452, "epoch": 2891} {"train_loss": -6.475664138793945, "global_step": 121453, "epoch": 2891} {"train_loss": -6.527464389801025, "global_step": 121454, "epoch": 2891} {"train_loss": -6.6238908767700195, "global_step": 121455, "epoch": 2891} {"train_loss": -6.647496223449707, "global_step": 121456, "epoch": 2891} {"train_loss": -6.615083694458008, "global_step": 121457, "epoch": 2891} {"train_loss": -6.611195087432861, "global_step": 121458, "epoch": 2891} {"train_loss": -6.686290740966797, "global_step": 121459, "epoch": 2891} {"train_loss": -6.628313064575195, "global_step": 121460, "epoch": 2891} {"train_loss": -6.737587928771973, "global_step": 121461, "epoch": 2891} {"train_loss": -6.5253801345825195, "global_step": 121462, "epoch": 2891} {"train_loss": -6.597946325937907, "global_step": 121463, "epoch": 2891, "val_loss": 76819.6640625} {"train_loss": -6.650193214416504, "global_step": 121464, "epoch": 2892} {"train_loss": -6.615213394165039, "global_step": 121465, "epoch": 2892} {"train_loss": -6.657625198364258, "global_step": 121466, "epoch": 2892} {"train_loss": -6.552105903625488, "global_step": 121467, "epoch": 2892} {"train_loss": -6.630269527435303, "global_step": 121468, "epoch": 2892} {"train_loss": -6.508514404296875, "global_step": 121469, "epoch": 2892} {"train_loss": -6.67154598236084, "global_step": 121470, "epoch": 2892} {"train_loss": -6.663393497467041, "global_step": 121471, "epoch": 2892} {"train_loss": -6.459930896759033, "global_step": 121472, "epoch": 2892} {"train_loss": -6.458864212036133, "global_step": 121473, "epoch": 2892} {"train_loss": -6.440654754638672, "global_step": 121474, "epoch": 2892} {"train_loss": -6.623305320739746, "global_step": 121475, "epoch": 2892} {"train_loss": -6.41689395904541, "global_step": 121476, "epoch": 2892} {"train_loss": -6.397640705108643, "global_step": 121477, "epoch": 2892} {"train_loss": -6.519911289215088, "global_step": 121478, "epoch": 2892} {"train_loss": -6.430465221405029, "global_step": 121479, "epoch": 2892} {"train_loss": -6.481860637664795, "global_step": 121480, "epoch": 2892} {"train_loss": -6.537747383117676, "global_step": 121481, "epoch": 2892} {"train_loss": -6.60080623626709, "global_step": 121482, "epoch": 2892} {"train_loss": -6.527882099151611, "global_step": 121483, "epoch": 2892} {"train_loss": -6.594059467315674, "global_step": 121484, "epoch": 2892} {"train_loss": -6.5847296714782715, "global_step": 121485, "epoch": 2892} {"train_loss": -6.503474712371826, "global_step": 121486, "epoch": 2892} {"train_loss": -6.601998805999756, "global_step": 121487, "epoch": 2892} {"train_loss": -6.621649742126465, "global_step": 121488, "epoch": 2892} {"train_loss": -6.574804306030273, "global_step": 121489, "epoch": 2892} {"train_loss": -6.49029541015625, "global_step": 121490, "epoch": 2892} {"train_loss": -6.560904502868652, "global_step": 121491, "epoch": 2892} {"train_loss": -6.596213340759277, "global_step": 121492, "epoch": 2892} {"train_loss": -6.6340179443359375, "global_step": 121493, "epoch": 2892} {"train_loss": -6.602465629577637, "global_step": 121494, "epoch": 2892} {"train_loss": -6.601273536682129, "global_step": 121495, "epoch": 2892} {"train_loss": -6.621885299682617, "global_step": 121496, "epoch": 2892} {"train_loss": -6.603126525878906, "global_step": 121497, "epoch": 2892} {"train_loss": -6.698906421661377, "global_step": 121498, "epoch": 2892} {"train_loss": -6.525145530700684, "global_step": 121499, "epoch": 2892} {"train_loss": -6.639817237854004, "global_step": 121500, "epoch": 2892} {"train_loss": -6.503701686859131, "global_step": 121501, "epoch": 2892} {"train_loss": -6.615748882293701, "global_step": 121502, "epoch": 2892} {"train_loss": -6.758966445922852, "global_step": 121503, "epoch": 2892} {"train_loss": -6.494451999664307, "global_step": 121504, "epoch": 2892} {"train_loss": -6.570602780296689, "global_step": 121505, "epoch": 2892, "val_loss": 76842.53125} {"train_loss": -6.678056716918945, "global_step": 121506, "epoch": 2893} {"train_loss": -6.653837203979492, "global_step": 121507, "epoch": 2893} {"train_loss": -6.631929397583008, "global_step": 121508, "epoch": 2893} {"train_loss": -6.631364822387695, "global_step": 121509, "epoch": 2893} {"train_loss": -6.524097442626953, "global_step": 121510, "epoch": 2893} {"train_loss": -6.5427775382995605, "global_step": 121511, "epoch": 2893} {"train_loss": -6.631217002868652, "global_step": 121512, "epoch": 2893} {"train_loss": -6.717287063598633, "global_step": 121513, "epoch": 2893} {"train_loss": -6.660364151000977, "global_step": 121514, "epoch": 2893} {"train_loss": -6.644125461578369, "global_step": 121515, "epoch": 2893} {"train_loss": -6.751008033752441, "global_step": 121516, "epoch": 2893} {"train_loss": -6.657989978790283, "global_step": 121517, "epoch": 2893} {"train_loss": -6.538060188293457, "global_step": 121518, "epoch": 2893} {"train_loss": -6.690447807312012, "global_step": 121519, "epoch": 2893} {"train_loss": -6.719738006591797, "global_step": 121520, "epoch": 2893} {"train_loss": -6.604920387268066, "global_step": 121521, "epoch": 2893} {"train_loss": -6.58683967590332, "global_step": 121522, "epoch": 2893} {"train_loss": -6.68316650390625, "global_step": 121523, "epoch": 2893} {"train_loss": -6.576383590698242, "global_step": 121524, "epoch": 2893} {"train_loss": -6.63054084777832, "global_step": 121525, "epoch": 2893} {"train_loss": -6.606288909912109, "global_step": 121526, "epoch": 2893} {"train_loss": -6.620608329772949, "global_step": 121527, "epoch": 2893} {"train_loss": -6.697517395019531, "global_step": 121528, "epoch": 2893} {"train_loss": -6.665657043457031, "global_step": 121529, "epoch": 2893} {"train_loss": -6.6220903396606445, "global_step": 121530, "epoch": 2893} {"train_loss": -6.576710224151611, "global_step": 121531, "epoch": 2893} {"train_loss": -6.63380241394043, "global_step": 121532, "epoch": 2893} {"train_loss": -6.619360446929932, "global_step": 121533, "epoch": 2893} {"train_loss": -6.630314826965332, "global_step": 121534, "epoch": 2893} {"train_loss": -6.596003532409668, "global_step": 121535, "epoch": 2893} {"train_loss": -6.527352809906006, "global_step": 121536, "epoch": 2893} {"train_loss": -6.609493255615234, "global_step": 121537, "epoch": 2893} {"train_loss": -6.691776275634766, "global_step": 121538, "epoch": 2893} {"train_loss": -6.539444446563721, "global_step": 121539, "epoch": 2893} {"train_loss": -6.516037940979004, "global_step": 121540, "epoch": 2893} {"train_loss": -6.576300621032715, "global_step": 121541, "epoch": 2893} {"train_loss": -6.607939720153809, "global_step": 121542, "epoch": 2893} {"train_loss": -6.543747901916504, "global_step": 121543, "epoch": 2893} {"train_loss": -6.554840564727783, "global_step": 121544, "epoch": 2893} {"train_loss": -6.533892631530762, "global_step": 121545, "epoch": 2893} {"train_loss": -6.632326602935791, "global_step": 121546, "epoch": 2893} {"train_loss": -6.6170654864538285, "global_step": 121547, "epoch": 2893, "val_loss": 76713.125} {"train_loss": -6.481756210327148, "global_step": 121548, "epoch": 2894} {"train_loss": -6.626093864440918, "global_step": 121549, "epoch": 2894} {"train_loss": -6.5439910888671875, "global_step": 121550, "epoch": 2894} {"train_loss": -6.558609962463379, "global_step": 121551, "epoch": 2894} {"train_loss": -6.65349817276001, "global_step": 121552, "epoch": 2894} {"train_loss": -6.620912551879883, "global_step": 121553, "epoch": 2894} {"train_loss": -6.594021797180176, "global_step": 121554, "epoch": 2894} {"train_loss": -6.584975242614746, "global_step": 121555, "epoch": 2894} {"train_loss": -6.5094523429870605, "global_step": 121556, "epoch": 2894} {"train_loss": -6.595625877380371, "global_step": 121557, "epoch": 2894} {"train_loss": -6.587001800537109, "global_step": 121558, "epoch": 2894} {"train_loss": -6.610752582550049, "global_step": 121559, "epoch": 2894} {"train_loss": -6.495421886444092, "global_step": 121560, "epoch": 2894} {"train_loss": -6.5892438888549805, "global_step": 121561, "epoch": 2894} {"train_loss": -6.694037437438965, "global_step": 121562, "epoch": 2894} {"train_loss": -6.675483703613281, "global_step": 121563, "epoch": 2894} {"train_loss": -6.590939998626709, "global_step": 121564, "epoch": 2894} {"train_loss": -6.347043991088867, "global_step": 121565, "epoch": 2894} {"train_loss": -6.541592597961426, "global_step": 121566, "epoch": 2894} {"train_loss": -6.57034969329834, "global_step": 121567, "epoch": 2894} {"train_loss": -6.540246963500977, "global_step": 121568, "epoch": 2894} {"train_loss": -6.60846471786499, "global_step": 121569, "epoch": 2894} {"train_loss": -6.564450263977051, "global_step": 121570, "epoch": 2894} {"train_loss": -6.618138313293457, "global_step": 121571, "epoch": 2894} {"train_loss": -6.530777454376221, "global_step": 121572, "epoch": 2894} {"train_loss": -6.566835880279541, "global_step": 121573, "epoch": 2894} {"train_loss": -6.608054161071777, "global_step": 121574, "epoch": 2894} {"train_loss": -6.594310760498047, "global_step": 121575, "epoch": 2894} {"train_loss": -6.5782012939453125, "global_step": 121576, "epoch": 2894} {"train_loss": -6.6581573486328125, "global_step": 121577, "epoch": 2894} {"train_loss": -6.567703723907471, "global_step": 121578, "epoch": 2894} {"train_loss": -6.484238624572754, "global_step": 121579, "epoch": 2894} {"train_loss": -6.50909948348999, "global_step": 121580, "epoch": 2894} {"train_loss": -6.649877071380615, "global_step": 121581, "epoch": 2894} {"train_loss": -6.66234016418457, "global_step": 121582, "epoch": 2894} {"train_loss": -6.557163238525391, "global_step": 121583, "epoch": 2894} {"train_loss": -6.460857391357422, "global_step": 121584, "epoch": 2894} {"train_loss": -6.57696008682251, "global_step": 121585, "epoch": 2894} {"train_loss": -6.633662223815918, "global_step": 121586, "epoch": 2894} {"train_loss": -6.62001895904541, "global_step": 121587, "epoch": 2894} {"train_loss": -6.560133934020996, "global_step": 121588, "epoch": 2894} {"train_loss": -6.574600560324533, "global_step": 121589, "epoch": 2894, "val_loss": 76864.1875} {"train_loss": -6.617974281311035, "global_step": 121590, "epoch": 2895} {"train_loss": -6.426970481872559, "global_step": 121591, "epoch": 2895} {"train_loss": -6.497776508331299, "global_step": 121592, "epoch": 2895} {"train_loss": -6.550829887390137, "global_step": 121593, "epoch": 2895} {"train_loss": -6.3862104415893555, "global_step": 121594, "epoch": 2895} {"train_loss": -6.551657199859619, "global_step": 121595, "epoch": 2895} {"train_loss": -6.565126419067383, "global_step": 121596, "epoch": 2895} {"train_loss": -6.586667060852051, "global_step": 121597, "epoch": 2895} {"train_loss": -6.692374229431152, "global_step": 121598, "epoch": 2895} {"train_loss": -6.490691184997559, "global_step": 121599, "epoch": 2895} {"train_loss": -6.465685844421387, "global_step": 121600, "epoch": 2895} {"train_loss": -6.568174362182617, "global_step": 121601, "epoch": 2895} {"train_loss": -6.61655330657959, "global_step": 121602, "epoch": 2895} {"train_loss": -6.590909957885742, "global_step": 121603, "epoch": 2895} {"train_loss": -6.61723518371582, "global_step": 121604, "epoch": 2895} {"train_loss": -6.585590362548828, "global_step": 121605, "epoch": 2895} {"train_loss": -6.5721282958984375, "global_step": 121606, "epoch": 2895} {"train_loss": -6.624520301818848, "global_step": 121607, "epoch": 2895} {"train_loss": -6.521124362945557, "global_step": 121608, "epoch": 2895} {"train_loss": -6.607872009277344, "global_step": 121609, "epoch": 2895} {"train_loss": -6.545936584472656, "global_step": 121610, "epoch": 2895} {"train_loss": -6.567527770996094, "global_step": 121611, "epoch": 2895} {"train_loss": -6.668422698974609, "global_step": 121612, "epoch": 2895} {"train_loss": -6.555769443511963, "global_step": 121613, "epoch": 2895} {"train_loss": -6.514317512512207, "global_step": 121614, "epoch": 2895} {"train_loss": -6.666370391845703, "global_step": 121615, "epoch": 2895} {"train_loss": -6.489059925079346, "global_step": 121616, "epoch": 2895} {"train_loss": -6.527169227600098, "global_step": 121617, "epoch": 2895} {"train_loss": -6.478001594543457, "global_step": 121618, "epoch": 2895} {"train_loss": -6.501129150390625, "global_step": 121619, "epoch": 2895} {"train_loss": -6.567286014556885, "global_step": 121620, "epoch": 2895} {"train_loss": -6.526589393615723, "global_step": 121621, "epoch": 2895} {"train_loss": -6.506758689880371, "global_step": 121622, "epoch": 2895} {"train_loss": -6.463027477264404, "global_step": 121623, "epoch": 2895} {"train_loss": -6.597688674926758, "global_step": 121624, "epoch": 2895} {"train_loss": -6.596578121185303, "global_step": 121625, "epoch": 2895} {"train_loss": -6.615729331970215, "global_step": 121626, "epoch": 2895} {"train_loss": -6.482149124145508, "global_step": 121627, "epoch": 2895} {"train_loss": -6.352827548980713, "global_step": 121628, "epoch": 2895} {"train_loss": -6.537693977355957, "global_step": 121629, "epoch": 2895} {"train_loss": -6.553133010864258, "global_step": 121630, "epoch": 2895} {"train_loss": -6.548580396743048, "global_step": 121631, "epoch": 2895, "val_loss": 76821.6015625} {"train_loss": -6.555019378662109, "global_step": 121632, "epoch": 2896} {"train_loss": -6.585874557495117, "global_step": 121633, "epoch": 2896} {"train_loss": -6.6317877769470215, "global_step": 121634, "epoch": 2896} {"train_loss": -6.565372467041016, "global_step": 121635, "epoch": 2896} {"train_loss": -6.479789733886719, "global_step": 121636, "epoch": 2896} {"train_loss": -6.567721843719482, "global_step": 121637, "epoch": 2896} {"train_loss": -6.5839524269104, "global_step": 121638, "epoch": 2896} {"train_loss": -6.393795013427734, "global_step": 121639, "epoch": 2896} {"train_loss": -6.497223854064941, "global_step": 121640, "epoch": 2896} {"train_loss": -6.5668768882751465, "global_step": 121641, "epoch": 2896} {"train_loss": -6.51188850402832, "global_step": 121642, "epoch": 2896} {"train_loss": -6.599213123321533, "global_step": 121643, "epoch": 2896} {"train_loss": -6.589043617248535, "global_step": 121644, "epoch": 2896} {"train_loss": -6.580960273742676, "global_step": 121645, "epoch": 2896} {"train_loss": -6.594308853149414, "global_step": 121646, "epoch": 2896} {"train_loss": -6.577075481414795, "global_step": 121647, "epoch": 2896} {"train_loss": -6.533814430236816, "global_step": 121648, "epoch": 2896} {"train_loss": -6.682116508483887, "global_step": 121649, "epoch": 2896} {"train_loss": -6.624550819396973, "global_step": 121650, "epoch": 2896} {"train_loss": -6.540132999420166, "global_step": 121651, "epoch": 2896} {"train_loss": -6.6442437171936035, "global_step": 121652, "epoch": 2896} {"train_loss": -6.732245922088623, "global_step": 121653, "epoch": 2896} {"train_loss": -6.619274139404297, "global_step": 121654, "epoch": 2896} {"train_loss": -6.60415506362915, "global_step": 121655, "epoch": 2896} {"train_loss": -6.636292457580566, "global_step": 121656, "epoch": 2896} {"train_loss": -6.493879318237305, "global_step": 121657, "epoch": 2896} {"train_loss": -6.622457504272461, "global_step": 121658, "epoch": 2896} {"train_loss": -6.62705135345459, "global_step": 121659, "epoch": 2896} {"train_loss": -6.638368129730225, "global_step": 121660, "epoch": 2896} {"train_loss": -6.654356956481934, "global_step": 121661, "epoch": 2896} {"train_loss": -6.543026924133301, "global_step": 121662, "epoch": 2896} {"train_loss": -6.6402788162231445, "global_step": 121663, "epoch": 2896} {"train_loss": -6.628982067108154, "global_step": 121664, "epoch": 2896} {"train_loss": -6.524409294128418, "global_step": 121665, "epoch": 2896} {"train_loss": -6.600290298461914, "global_step": 121666, "epoch": 2896} {"train_loss": -6.6739397048950195, "global_step": 121667, "epoch": 2896} {"train_loss": -6.684846878051758, "global_step": 121668, "epoch": 2896} {"train_loss": -6.625633239746094, "global_step": 121669, "epoch": 2896} {"train_loss": -6.625308036804199, "global_step": 121670, "epoch": 2896} {"train_loss": -6.606253623962402, "global_step": 121671, "epoch": 2896} {"train_loss": -6.668045997619629, "global_step": 121672, "epoch": 2896} {"train_loss": -6.594920215152559, "global_step": 121673, "epoch": 2896, "val_loss": 77219.5546875} {"train_loss": -6.65231990814209, "global_step": 121674, "epoch": 2897} {"train_loss": -6.620362281799316, "global_step": 121675, "epoch": 2897} {"train_loss": -6.690954685211182, "global_step": 121676, "epoch": 2897} {"train_loss": -6.570075988769531, "global_step": 121677, "epoch": 2897} {"train_loss": -6.5989508628845215, "global_step": 121678, "epoch": 2897} {"train_loss": -6.65073299407959, "global_step": 121679, "epoch": 2897} {"train_loss": -6.573212623596191, "global_step": 121680, "epoch": 2897} {"train_loss": -6.644255638122559, "global_step": 121681, "epoch": 2897} {"train_loss": -6.618016242980957, "global_step": 121682, "epoch": 2897} {"train_loss": -6.614936828613281, "global_step": 121683, "epoch": 2897} {"train_loss": -6.696503639221191, "global_step": 121684, "epoch": 2897} {"train_loss": -6.635286331176758, "global_step": 121685, "epoch": 2897} {"train_loss": -6.5866546630859375, "global_step": 121686, "epoch": 2897} {"train_loss": -6.619787216186523, "global_step": 121687, "epoch": 2897} {"train_loss": -6.620830059051514, "global_step": 121688, "epoch": 2897} {"train_loss": -6.560739994049072, "global_step": 121689, "epoch": 2897} {"train_loss": -6.513472080230713, "global_step": 121690, "epoch": 2897} {"train_loss": -6.648482322692871, "global_step": 121691, "epoch": 2897} {"train_loss": -6.555150032043457, "global_step": 121692, "epoch": 2897} {"train_loss": -6.528451919555664, "global_step": 121693, "epoch": 2897} {"train_loss": -6.551790237426758, "global_step": 121694, "epoch": 2897} {"train_loss": -6.649923324584961, "global_step": 121695, "epoch": 2897} {"train_loss": -6.652805328369141, "global_step": 121696, "epoch": 2897} {"train_loss": -6.477296829223633, "global_step": 121697, "epoch": 2897} {"train_loss": -6.577153205871582, "global_step": 121698, "epoch": 2897} {"train_loss": -6.580999374389648, "global_step": 121699, "epoch": 2897} {"train_loss": -6.671009063720703, "global_step": 121700, "epoch": 2897} {"train_loss": -6.680437088012695, "global_step": 121701, "epoch": 2897} {"train_loss": -6.583732604980469, "global_step": 121702, "epoch": 2897} {"train_loss": -6.606816291809082, "global_step": 121703, "epoch": 2897} {"train_loss": -6.684437274932861, "global_step": 121704, "epoch": 2897} {"train_loss": -6.722639083862305, "global_step": 121705, "epoch": 2897} {"train_loss": -6.674493789672852, "global_step": 121706, "epoch": 2897} {"train_loss": -6.637835502624512, "global_step": 121707, "epoch": 2897} {"train_loss": -6.664412498474121, "global_step": 121708, "epoch": 2897} {"train_loss": -6.744676113128662, "global_step": 121709, "epoch": 2897} {"train_loss": -6.568426132202148, "global_step": 121710, "epoch": 2897} {"train_loss": -6.648728847503662, "global_step": 121711, "epoch": 2897} {"train_loss": -6.581707954406738, "global_step": 121712, "epoch": 2897} {"train_loss": -6.684350490570068, "global_step": 121713, "epoch": 2897} {"train_loss": -6.592364311218262, "global_step": 121714, "epoch": 2897} {"train_loss": -6.6235412416004, "global_step": 121715, "epoch": 2897, "val_loss": 76850.6640625} {"train_loss": -6.50543737411499, "global_step": 121716, "epoch": 2898} {"train_loss": -6.6798095703125, "global_step": 121717, "epoch": 2898} {"train_loss": -6.63795804977417, "global_step": 121718, "epoch": 2898} {"train_loss": -6.600978851318359, "global_step": 121719, "epoch": 2898} {"train_loss": -6.65895938873291, "global_step": 121720, "epoch": 2898} {"train_loss": -6.564480781555176, "global_step": 121721, "epoch": 2898} {"train_loss": -6.511558532714844, "global_step": 121722, "epoch": 2898} {"train_loss": -6.565285682678223, "global_step": 121723, "epoch": 2898} {"train_loss": -6.496926784515381, "global_step": 121724, "epoch": 2898} {"train_loss": -6.487554550170898, "global_step": 121725, "epoch": 2898} {"train_loss": -6.726174831390381, "global_step": 121726, "epoch": 2898} {"train_loss": -6.496706962585449, "global_step": 121727, "epoch": 2898} {"train_loss": -6.57942008972168, "global_step": 121728, "epoch": 2898} {"train_loss": -6.544149875640869, "global_step": 121729, "epoch": 2898} {"train_loss": -6.598301410675049, "global_step": 121730, "epoch": 2898} {"train_loss": -6.513124465942383, "global_step": 121731, "epoch": 2898} {"train_loss": -6.565440654754639, "global_step": 121732, "epoch": 2898} {"train_loss": -6.573859214782715, "global_step": 121733, "epoch": 2898} {"train_loss": -6.557058811187744, "global_step": 121734, "epoch": 2898} {"train_loss": -6.593715667724609, "global_step": 121735, "epoch": 2898} {"train_loss": -6.623929977416992, "global_step": 121736, "epoch": 2898} {"train_loss": -6.668101787567139, "global_step": 121737, "epoch": 2898} {"train_loss": -6.609766006469727, "global_step": 121738, "epoch": 2898} {"train_loss": -6.551139831542969, "global_step": 121739, "epoch": 2898} {"train_loss": -6.734363555908203, "global_step": 121740, "epoch": 2898} {"train_loss": -6.634350776672363, "global_step": 121741, "epoch": 2898} {"train_loss": -6.568467140197754, "global_step": 121742, "epoch": 2898} {"train_loss": -6.7786359786987305, "global_step": 121743, "epoch": 2898} {"train_loss": -6.472103118896484, "global_step": 121744, "epoch": 2898} {"train_loss": -6.586656093597412, "global_step": 121745, "epoch": 2898} {"train_loss": -6.596200466156006, "global_step": 121746, "epoch": 2898} {"train_loss": -6.624669551849365, "global_step": 121747, "epoch": 2898} {"train_loss": -6.751103401184082, "global_step": 121748, "epoch": 2898} {"train_loss": -6.524660587310791, "global_step": 121749, "epoch": 2898} {"train_loss": -6.592641353607178, "global_step": 121750, "epoch": 2898} {"train_loss": -6.6621551513671875, "global_step": 121751, "epoch": 2898} {"train_loss": -6.658296585083008, "global_step": 121752, "epoch": 2898} {"train_loss": -6.606818199157715, "global_step": 121753, "epoch": 2898} {"train_loss": -6.606657981872559, "global_step": 121754, "epoch": 2898} {"train_loss": -6.556879997253418, "global_step": 121755, "epoch": 2898} {"train_loss": -6.719629287719727, "global_step": 121756, "epoch": 2898} {"train_loss": -6.598076933906192, "global_step": 121757, "epoch": 2898, "val_loss": 77282.2890625} {"train_loss": -6.508659362792969, "global_step": 121758, "epoch": 2899} {"train_loss": -6.576667785644531, "global_step": 121759, "epoch": 2899} {"train_loss": -6.633405685424805, "global_step": 121760, "epoch": 2899} {"train_loss": -6.585693836212158, "global_step": 121761, "epoch": 2899} {"train_loss": -6.486892223358154, "global_step": 121762, "epoch": 2899} {"train_loss": -6.58480167388916, "global_step": 121763, "epoch": 2899} {"train_loss": -6.614158630371094, "global_step": 121764, "epoch": 2899} {"train_loss": -6.661073684692383, "global_step": 121765, "epoch": 2899} {"train_loss": -6.607404708862305, "global_step": 121766, "epoch": 2899} {"train_loss": -6.576849460601807, "global_step": 121767, "epoch": 2899} {"train_loss": -6.553678512573242, "global_step": 121768, "epoch": 2899} {"train_loss": -6.594723701477051, "global_step": 121769, "epoch": 2899} {"train_loss": -6.591383934020996, "global_step": 121770, "epoch": 2899} {"train_loss": -6.619549751281738, "global_step": 121771, "epoch": 2899} {"train_loss": -6.59614372253418, "global_step": 121772, "epoch": 2899} {"train_loss": -6.6324896812438965, "global_step": 121773, "epoch": 2899} {"train_loss": -6.562872409820557, "global_step": 121774, "epoch": 2899} {"train_loss": -6.56658411026001, "global_step": 121775, "epoch": 2899} {"train_loss": -6.67501163482666, "global_step": 121776, "epoch": 2899} {"train_loss": -6.503049850463867, "global_step": 121777, "epoch": 2899} {"train_loss": -6.470186233520508, "global_step": 121778, "epoch": 2899} {"train_loss": -6.597848892211914, "global_step": 121779, "epoch": 2899} {"train_loss": -6.479167461395264, "global_step": 121780, "epoch": 2899} {"train_loss": -6.669259071350098, "global_step": 121781, "epoch": 2899} {"train_loss": -6.489653587341309, "global_step": 121782, "epoch": 2899} {"train_loss": -6.547818183898926, "global_step": 121783, "epoch": 2899} {"train_loss": -6.539751052856445, "global_step": 121784, "epoch": 2899} {"train_loss": -6.583298683166504, "global_step": 121785, "epoch": 2899} {"train_loss": -6.701827049255371, "global_step": 121786, "epoch": 2899} {"train_loss": -6.59099006652832, "global_step": 121787, "epoch": 2899} {"train_loss": -6.5450215339660645, "global_step": 121788, "epoch": 2899} {"train_loss": -6.699257850646973, "global_step": 121789, "epoch": 2899} {"train_loss": -6.6150312423706055, "global_step": 121790, "epoch": 2899} {"train_loss": -6.5476884841918945, "global_step": 121791, "epoch": 2899} {"train_loss": -6.646213531494141, "global_step": 121792, "epoch": 2899} {"train_loss": -6.711970329284668, "global_step": 121793, "epoch": 2899} {"train_loss": -6.496579170227051, "global_step": 121794, "epoch": 2899} {"train_loss": -6.455558776855469, "global_step": 121795, "epoch": 2899} {"train_loss": -6.590180397033691, "global_step": 121796, "epoch": 2899} {"train_loss": -6.631755828857422, "global_step": 121797, "epoch": 2899} {"train_loss": -6.646734714508057, "global_step": 121798, "epoch": 2899} {"train_loss": -6.588406358446393, "global_step": 121799, "epoch": 2899, "val_loss": 77118.03125} {"train_loss": -6.5911784172058105, "global_step": 121800, "epoch": 2900} {"train_loss": -6.6797380447387695, "global_step": 121801, "epoch": 2900} {"train_loss": -6.6015119552612305, "global_step": 121802, "epoch": 2900} {"train_loss": -6.606485843658447, "global_step": 121803, "epoch": 2900} {"train_loss": -6.529630184173584, "global_step": 121804, "epoch": 2900} {"train_loss": -6.686367511749268, "global_step": 121805, "epoch": 2900} {"train_loss": -6.559087753295898, "global_step": 121806, "epoch": 2900} {"train_loss": -6.659866809844971, "global_step": 121807, "epoch": 2900} {"train_loss": -6.603631019592285, "global_step": 121808, "epoch": 2900} {"train_loss": -6.572390556335449, "global_step": 121809, "epoch": 2900} {"train_loss": -6.616349220275879, "global_step": 121810, "epoch": 2900} {"train_loss": -6.592881202697754, "global_step": 121811, "epoch": 2900} {"train_loss": -6.552457809448242, "global_step": 121812, "epoch": 2900} {"train_loss": -6.532896041870117, "global_step": 121813, "epoch": 2900} {"train_loss": -6.609683036804199, "global_step": 121814, "epoch": 2900} {"train_loss": -6.707441806793213, "global_step": 121815, "epoch": 2900} {"train_loss": -6.683816432952881, "global_step": 121816, "epoch": 2900} {"train_loss": -6.739954948425293, "global_step": 121817, "epoch": 2900} {"train_loss": -6.611974716186523, "global_step": 121818, "epoch": 2900} {"train_loss": -6.567509651184082, "global_step": 121819, "epoch": 2900} {"train_loss": -6.536380767822266, "global_step": 121820, "epoch": 2900} {"train_loss": -6.553953170776367, "global_step": 121821, "epoch": 2900} {"train_loss": -6.635283470153809, "global_step": 121822, "epoch": 2900} {"train_loss": -6.584362030029297, "global_step": 121823, "epoch": 2900} {"train_loss": -6.624054431915283, "global_step": 121824, "epoch": 2900} {"train_loss": -6.639128684997559, "global_step": 121825, "epoch": 2900} {"train_loss": -6.67783260345459, "global_step": 121826, "epoch": 2900} {"train_loss": -6.496755123138428, "global_step": 121827, "epoch": 2900} {"train_loss": -6.700847148895264, "global_step": 121828, "epoch": 2900} {"train_loss": -6.607306480407715, "global_step": 121829, "epoch": 2900} {"train_loss": -6.5479326248168945, "global_step": 121830, "epoch": 2900} {"train_loss": -6.739690780639648, "global_step": 121831, "epoch": 2900} {"train_loss": -6.562078475952148, "global_step": 121832, "epoch": 2900} {"train_loss": -6.530255317687988, "global_step": 121833, "epoch": 2900} {"train_loss": -6.6339898109436035, "global_step": 121834, "epoch": 2900} {"train_loss": -6.616053581237793, "global_step": 121835, "epoch": 2900} {"train_loss": -6.680412292480469, "global_step": 121836, "epoch": 2900} {"train_loss": -6.604536533355713, "global_step": 121837, "epoch": 2900} {"train_loss": -6.699407577514648, "global_step": 121838, "epoch": 2900} {"train_loss": -6.605491638183594, "global_step": 121839, "epoch": 2900} {"train_loss": -6.650604248046875, "global_step": 121840, "epoch": 2900} {"train_loss": -6.6173787117004395, "global_step": 121841, "epoch": 2900, "train/sim_max_reward_0": 0.9045556200936472, "train/sim_max_reward_1": 0.9644702299579907, "train/sim_max_reward_2": 0.40067385820925355, "train/sim_max_reward_3": 0.1367354909920113, "train/sim_max_reward_4": 0.8496408409766067, "train/sim_max_reward_5": 0.8853050719743574, "test/sim_max_reward_4500000": 0.9147840271682682, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9791979907383656, "test/sim_max_reward_4500003": 0.8728381794063865, "test/sim_max_reward_4500004": 0.9417681972319828, "test/sim_max_reward_4500005": 0.1716238724420745, "test/sim_max_reward_4500006": 0.928930885362696, "test/sim_max_reward_4500007": 0.9315552260457125, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.053572547230495454, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9793471458037865, "test/sim_max_reward_4500012": 0.9707505252197535, "test/sim_max_reward_4500013": 0.00816349625309084, "test/sim_max_reward_4500014": 0.9382779708221272, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.11987043329813461, "test/sim_max_reward_4500018": 0.9994067237307697, "test/sim_max_reward_4500019": 0.43085345410389364, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.810592706463715, "test/sim_max_reward_4500022": 0.9424168756730473, "test/sim_max_reward_4500023": 0.6336664945270596, "test/sim_max_reward_4500024": 0.8569567045771377, "test/sim_max_reward_4500025": 0.9215271448857066, "test/sim_max_reward_4500026": 0.9669457923393235, "test/sim_max_reward_4500027": 0.9250542806518824, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.13863882941669559, "test/sim_max_reward_4500030": 0.9998565525605246, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04812004572588521, "test/sim_max_reward_4500033": 1.0, "test/sim_max_reward_4500034": 0.9237795504589342, "test/sim_max_reward_4500035": 0.6188521102884702, "test/sim_max_reward_4500036": 0.3887433492373123, "test/sim_max_reward_4500037": 0.8748682642831519, "test/sim_max_reward_4500038": 0.33131986003641534, "test/sim_max_reward_4500039": 0.0, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.8093215636437519, "test/sim_max_reward_4500042": 0.022834506779199147, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.16599808989467982, "test/sim_max_reward_4500046": 0.9491107931507257, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0633402670758769, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6902301853673111, "test/mean_score": 0.5172209144495676, "val_loss": 77080.453125} {"train_loss": -6.658449172973633, "global_step": 121842, "epoch": 2901} {"train_loss": -6.561847686767578, "global_step": 121843, "epoch": 2901} {"train_loss": -6.747361183166504, "global_step": 121844, "epoch": 2901} {"train_loss": -6.731695175170898, "global_step": 121845, "epoch": 2901} {"train_loss": -6.676974773406982, "global_step": 121846, "epoch": 2901} {"train_loss": -6.710940837860107, "global_step": 121847, "epoch": 2901} {"train_loss": -6.720829010009766, "global_step": 121848, "epoch": 2901} {"train_loss": -6.661870956420898, "global_step": 121849, "epoch": 2901} {"train_loss": -6.64013147354126, "global_step": 121850, "epoch": 2901} {"train_loss": -6.65598201751709, "global_step": 121851, "epoch": 2901} {"train_loss": -6.696351051330566, "global_step": 121852, "epoch": 2901} {"train_loss": -6.680814266204834, "global_step": 121853, "epoch": 2901} {"train_loss": -6.649669647216797, "global_step": 121854, "epoch": 2901} {"train_loss": -6.681325435638428, "global_step": 121855, "epoch": 2901} {"train_loss": -6.626643180847168, "global_step": 121856, "epoch": 2901} {"train_loss": -6.640392780303955, "global_step": 121857, "epoch": 2901} {"train_loss": -6.720516204833984, "global_step": 121858, "epoch": 2901} {"train_loss": -6.67407751083374, "global_step": 121859, "epoch": 2901} {"train_loss": -6.668445110321045, "global_step": 121860, "epoch": 2901} {"train_loss": -6.721431732177734, "global_step": 121861, "epoch": 2901} {"train_loss": -6.652133464813232, "global_step": 121862, "epoch": 2901} {"train_loss": -6.572274208068848, "global_step": 121863, "epoch": 2901} {"train_loss": -6.647111892700195, "global_step": 121864, "epoch": 2901} {"train_loss": -6.6506524085998535, "global_step": 121865, "epoch": 2901} {"train_loss": -6.588795185089111, "global_step": 121866, "epoch": 2901} {"train_loss": -6.724155426025391, "global_step": 121867, "epoch": 2901} {"train_loss": -6.474923133850098, "global_step": 121868, "epoch": 2901} {"train_loss": -6.6222944259643555, "global_step": 121869, "epoch": 2901} {"train_loss": -6.580118179321289, "global_step": 121870, "epoch": 2901} {"train_loss": -6.465949058532715, "global_step": 121871, "epoch": 2901} {"train_loss": -6.374120235443115, "global_step": 121872, "epoch": 2901} {"train_loss": -6.626127243041992, "global_step": 121873, "epoch": 2901} {"train_loss": -6.472460746765137, "global_step": 121874, "epoch": 2901} {"train_loss": -6.4134674072265625, "global_step": 121875, "epoch": 2901} {"train_loss": -6.530176162719727, "global_step": 121876, "epoch": 2901} {"train_loss": -6.427404403686523, "global_step": 121877, "epoch": 2901} {"train_loss": -6.571427822113037, "global_step": 121878, "epoch": 2901} {"train_loss": -6.549601078033447, "global_step": 121879, "epoch": 2901} {"train_loss": -6.4162468910217285, "global_step": 121880, "epoch": 2901} {"train_loss": -6.5249552726745605, "global_step": 121881, "epoch": 2901} {"train_loss": -6.430065631866455, "global_step": 121882, "epoch": 2901} {"train_loss": -6.6008420671735495, "global_step": 121883, "epoch": 2901, "val_loss": 77645.3125} {"train_loss": -6.41615104675293, "global_step": 121884, "epoch": 2902} {"train_loss": -6.528314113616943, "global_step": 121885, "epoch": 2902} {"train_loss": -6.4448652267456055, "global_step": 121886, "epoch": 2902} {"train_loss": -6.626175403594971, "global_step": 121887, "epoch": 2902} {"train_loss": -6.545820236206055, "global_step": 121888, "epoch": 2902} {"train_loss": -6.457804203033447, "global_step": 121889, "epoch": 2902} {"train_loss": -6.534879684448242, "global_step": 121890, "epoch": 2902} {"train_loss": -6.461715221405029, "global_step": 121891, "epoch": 2902} {"train_loss": -6.606017589569092, "global_step": 121892, "epoch": 2902} {"train_loss": -6.677217483520508, "global_step": 121893, "epoch": 2902} {"train_loss": -6.590545654296875, "global_step": 121894, "epoch": 2902} {"train_loss": -6.661389350891113, "global_step": 121895, "epoch": 2902} {"train_loss": -6.607300758361816, "global_step": 121896, "epoch": 2902} {"train_loss": -6.643125534057617, "global_step": 121897, "epoch": 2902} {"train_loss": -6.577667236328125, "global_step": 121898, "epoch": 2902} {"train_loss": -6.700060844421387, "global_step": 121899, "epoch": 2902} {"train_loss": -6.553773880004883, "global_step": 121900, "epoch": 2902} {"train_loss": -6.6684889793396, "global_step": 121901, "epoch": 2902} {"train_loss": -6.587841987609863, "global_step": 121902, "epoch": 2902} {"train_loss": -6.562633991241455, "global_step": 121903, "epoch": 2902} {"train_loss": -6.523581504821777, "global_step": 121904, "epoch": 2902} {"train_loss": -6.494946002960205, "global_step": 121905, "epoch": 2902} {"train_loss": -6.431210041046143, "global_step": 121906, "epoch": 2902} {"train_loss": -6.614738941192627, "global_step": 121907, "epoch": 2902} {"train_loss": -6.7512311935424805, "global_step": 121908, "epoch": 2902} {"train_loss": -6.661531925201416, "global_step": 121909, "epoch": 2902} {"train_loss": -6.593045234680176, "global_step": 121910, "epoch": 2902} {"train_loss": -6.634649276733398, "global_step": 121911, "epoch": 2902} {"train_loss": -6.577215194702148, "global_step": 121912, "epoch": 2902} {"train_loss": -6.562033176422119, "global_step": 121913, "epoch": 2902} {"train_loss": -6.721900939941406, "global_step": 121914, "epoch": 2902} {"train_loss": -6.695340156555176, "global_step": 121915, "epoch": 2902} {"train_loss": -6.6910624504089355, "global_step": 121916, "epoch": 2902} {"train_loss": -6.63242244720459, "global_step": 121917, "epoch": 2902} {"train_loss": -6.564180374145508, "global_step": 121918, "epoch": 2902} {"train_loss": -6.560349464416504, "global_step": 121919, "epoch": 2902} {"train_loss": -6.619612216949463, "global_step": 121920, "epoch": 2902} {"train_loss": -6.6533522605896, "global_step": 121921, "epoch": 2902} {"train_loss": -6.5661115646362305, "global_step": 121922, "epoch": 2902} {"train_loss": -6.489384651184082, "global_step": 121923, "epoch": 2902} {"train_loss": -6.526920795440674, "global_step": 121924, "epoch": 2902} {"train_loss": -6.585067896615891, "global_step": 121925, "epoch": 2902, "val_loss": 76873.828125} {"train_loss": -6.50902795791626, "global_step": 121926, "epoch": 2903} {"train_loss": -6.709906578063965, "global_step": 121927, "epoch": 2903} {"train_loss": -6.450014114379883, "global_step": 121928, "epoch": 2903} {"train_loss": -6.545985221862793, "global_step": 121929, "epoch": 2903} {"train_loss": -6.6236114501953125, "global_step": 121930, "epoch": 2903} {"train_loss": -6.505364894866943, "global_step": 121931, "epoch": 2903} {"train_loss": -6.460674285888672, "global_step": 121932, "epoch": 2903} {"train_loss": -6.599270343780518, "global_step": 121933, "epoch": 2903} {"train_loss": -6.573037147521973, "global_step": 121934, "epoch": 2903} {"train_loss": -6.458853721618652, "global_step": 121935, "epoch": 2903} {"train_loss": -6.5706281661987305, "global_step": 121936, "epoch": 2903} {"train_loss": -6.593950271606445, "global_step": 121937, "epoch": 2903} {"train_loss": -6.648434638977051, "global_step": 121938, "epoch": 2903} {"train_loss": -6.625333309173584, "global_step": 121939, "epoch": 2903} {"train_loss": -6.603318214416504, "global_step": 121940, "epoch": 2903} {"train_loss": -6.598736763000488, "global_step": 121941, "epoch": 2903} {"train_loss": -6.470330715179443, "global_step": 121942, "epoch": 2903} {"train_loss": -6.5423583984375, "global_step": 121943, "epoch": 2903} {"train_loss": -6.587846755981445, "global_step": 121944, "epoch": 2903} {"train_loss": -6.572908401489258, "global_step": 121945, "epoch": 2903} {"train_loss": -6.5341796875, "global_step": 121946, "epoch": 2903} {"train_loss": -6.609577655792236, "global_step": 121947, "epoch": 2903} {"train_loss": -6.485836505889893, "global_step": 121948, "epoch": 2903} {"train_loss": -6.555069446563721, "global_step": 121949, "epoch": 2903} {"train_loss": -6.526551246643066, "global_step": 121950, "epoch": 2903} {"train_loss": -6.549029350280762, "global_step": 121951, "epoch": 2903} {"train_loss": -6.55458402633667, "global_step": 121952, "epoch": 2903} {"train_loss": -6.523822784423828, "global_step": 121953, "epoch": 2903} {"train_loss": -6.577828407287598, "global_step": 121954, "epoch": 2903} {"train_loss": -6.657439708709717, "global_step": 121955, "epoch": 2903} {"train_loss": -6.5306220054626465, "global_step": 121956, "epoch": 2903} {"train_loss": -6.66964054107666, "global_step": 121957, "epoch": 2903} {"train_loss": -6.463700294494629, "global_step": 121958, "epoch": 2903} {"train_loss": -6.598523139953613, "global_step": 121959, "epoch": 2903} {"train_loss": -6.55265998840332, "global_step": 121960, "epoch": 2903} {"train_loss": -6.544362545013428, "global_step": 121961, "epoch": 2903} {"train_loss": -6.571961879730225, "global_step": 121962, "epoch": 2903} {"train_loss": -6.586819648742676, "global_step": 121963, "epoch": 2903} {"train_loss": -6.7547712326049805, "global_step": 121964, "epoch": 2903} {"train_loss": -6.580248832702637, "global_step": 121965, "epoch": 2903} {"train_loss": -6.663976192474365, "global_step": 121966, "epoch": 2903} {"train_loss": -6.572695130393619, "global_step": 121967, "epoch": 2903, "val_loss": 76983.2265625} {"train_loss": -6.6055498123168945, "global_step": 121968, "epoch": 2904} {"train_loss": -6.616737365722656, "global_step": 121969, "epoch": 2904} {"train_loss": -6.59740686416626, "global_step": 121970, "epoch": 2904} {"train_loss": -6.615206718444824, "global_step": 121971, "epoch": 2904} {"train_loss": -6.633845329284668, "global_step": 121972, "epoch": 2904} {"train_loss": -6.48520040512085, "global_step": 121973, "epoch": 2904} {"train_loss": -6.679009437561035, "global_step": 121974, "epoch": 2904} {"train_loss": -6.564413070678711, "global_step": 121975, "epoch": 2904} {"train_loss": -6.594468116760254, "global_step": 121976, "epoch": 2904} {"train_loss": -6.616560935974121, "global_step": 121977, "epoch": 2904} {"train_loss": -6.646191596984863, "global_step": 121978, "epoch": 2904} {"train_loss": -6.581276893615723, "global_step": 121979, "epoch": 2904} {"train_loss": -6.505988597869873, "global_step": 121980, "epoch": 2904} {"train_loss": -6.619808197021484, "global_step": 121981, "epoch": 2904} {"train_loss": -6.592240333557129, "global_step": 121982, "epoch": 2904} {"train_loss": -6.567795753479004, "global_step": 121983, "epoch": 2904} {"train_loss": -6.624638080596924, "global_step": 121984, "epoch": 2904} {"train_loss": -6.651432991027832, "global_step": 121985, "epoch": 2904} {"train_loss": -6.530355453491211, "global_step": 121986, "epoch": 2904} {"train_loss": -6.6502885818481445, "global_step": 121987, "epoch": 2904} {"train_loss": -6.528812408447266, "global_step": 121988, "epoch": 2904} {"train_loss": -6.664660453796387, "global_step": 121989, "epoch": 2904} {"train_loss": -6.541927814483643, "global_step": 121990, "epoch": 2904} {"train_loss": -6.540373802185059, "global_step": 121991, "epoch": 2904} {"train_loss": -6.655762195587158, "global_step": 121992, "epoch": 2904} {"train_loss": -6.441270351409912, "global_step": 121993, "epoch": 2904} {"train_loss": -6.59567928314209, "global_step": 121994, "epoch": 2904} {"train_loss": -6.688724517822266, "global_step": 121995, "epoch": 2904} {"train_loss": -6.4833269119262695, "global_step": 121996, "epoch": 2904} {"train_loss": -6.399855613708496, "global_step": 121997, "epoch": 2904} {"train_loss": -6.548907279968262, "global_step": 121998, "epoch": 2904} {"train_loss": -6.668986797332764, "global_step": 121999, "epoch": 2904} {"train_loss": -6.609225749969482, "global_step": 122000, "epoch": 2904} {"train_loss": -6.502869129180908, "global_step": 122001, "epoch": 2904} {"train_loss": -6.512042045593262, "global_step": 122002, "epoch": 2904} {"train_loss": -6.5374579429626465, "global_step": 122003, "epoch": 2904} {"train_loss": -6.5621256828308105, "global_step": 122004, "epoch": 2904} {"train_loss": -6.560336112976074, "global_step": 122005, "epoch": 2904} {"train_loss": -6.465359687805176, "global_step": 122006, "epoch": 2904} {"train_loss": -6.540987014770508, "global_step": 122007, "epoch": 2904} {"train_loss": -6.4910807609558105, "global_step": 122008, "epoch": 2904} {"train_loss": -6.573793592907133, "global_step": 122009, "epoch": 2904, "val_loss": 76892.21875} {"train_loss": -6.541223049163818, "global_step": 122010, "epoch": 2905} {"train_loss": -6.682183265686035, "global_step": 122011, "epoch": 2905} {"train_loss": -6.666489601135254, "global_step": 122012, "epoch": 2905} {"train_loss": -6.669144630432129, "global_step": 122013, "epoch": 2905} {"train_loss": -6.552165985107422, "global_step": 122014, "epoch": 2905} {"train_loss": -6.638057708740234, "global_step": 122015, "epoch": 2905} {"train_loss": -6.674120903015137, "global_step": 122016, "epoch": 2905} {"train_loss": -6.630197048187256, "global_step": 122017, "epoch": 2905} {"train_loss": -6.660839557647705, "global_step": 122018, "epoch": 2905} {"train_loss": -6.555591106414795, "global_step": 122019, "epoch": 2905} {"train_loss": -6.720794677734375, "global_step": 122020, "epoch": 2905} {"train_loss": -6.572035789489746, "global_step": 122021, "epoch": 2905} {"train_loss": -6.503961563110352, "global_step": 122022, "epoch": 2905} {"train_loss": -6.634018898010254, "global_step": 122023, "epoch": 2905} {"train_loss": -6.600865364074707, "global_step": 122024, "epoch": 2905} {"train_loss": -6.7896037101745605, "global_step": 122025, "epoch": 2905} {"train_loss": -6.653558254241943, "global_step": 122026, "epoch": 2905} {"train_loss": -6.658145904541016, "global_step": 122027, "epoch": 2905} {"train_loss": -6.543842315673828, "global_step": 122028, "epoch": 2905} {"train_loss": -6.648372650146484, "global_step": 122029, "epoch": 2905} {"train_loss": -6.655421257019043, "global_step": 122030, "epoch": 2905} {"train_loss": -6.510542869567871, "global_step": 122031, "epoch": 2905} {"train_loss": -6.496827125549316, "global_step": 122032, "epoch": 2905} {"train_loss": -6.556337356567383, "global_step": 122033, "epoch": 2905} {"train_loss": -6.595056533813477, "global_step": 122034, "epoch": 2905} {"train_loss": -6.567511558532715, "global_step": 122035, "epoch": 2905} {"train_loss": -6.663827896118164, "global_step": 122036, "epoch": 2905} {"train_loss": -6.623770713806152, "global_step": 122037, "epoch": 2905} {"train_loss": -6.668021202087402, "global_step": 122038, "epoch": 2905} {"train_loss": -6.498630523681641, "global_step": 122039, "epoch": 2905} {"train_loss": -6.626583099365234, "global_step": 122040, "epoch": 2905} {"train_loss": -6.645903587341309, "global_step": 122041, "epoch": 2905} {"train_loss": -6.708517074584961, "global_step": 122042, "epoch": 2905} {"train_loss": -6.4402360916137695, "global_step": 122043, "epoch": 2905} {"train_loss": -6.612154006958008, "global_step": 122044, "epoch": 2905} {"train_loss": -6.554738998413086, "global_step": 122045, "epoch": 2905} {"train_loss": -6.652612686157227, "global_step": 122046, "epoch": 2905} {"train_loss": -6.553740501403809, "global_step": 122047, "epoch": 2905} {"train_loss": -6.6336750984191895, "global_step": 122048, "epoch": 2905} {"train_loss": -6.482440948486328, "global_step": 122049, "epoch": 2905} {"train_loss": -6.5896100997924805, "global_step": 122050, "epoch": 2905} {"train_loss": -6.606811307725453, "global_step": 122051, "epoch": 2905, "val_loss": 77036.9453125} {"train_loss": -6.640842914581299, "global_step": 122052, "epoch": 2906} {"train_loss": -6.6805267333984375, "global_step": 122053, "epoch": 2906} {"train_loss": -6.60357141494751, "global_step": 122054, "epoch": 2906} {"train_loss": -6.510725498199463, "global_step": 122055, "epoch": 2906} {"train_loss": -6.59502649307251, "global_step": 122056, "epoch": 2906} {"train_loss": -6.595775127410889, "global_step": 122057, "epoch": 2906} {"train_loss": -6.482976913452148, "global_step": 122058, "epoch": 2906} {"train_loss": -6.703550815582275, "global_step": 122059, "epoch": 2906} {"train_loss": -6.60168981552124, "global_step": 122060, "epoch": 2906} {"train_loss": -6.484940528869629, "global_step": 122061, "epoch": 2906} {"train_loss": -6.580731391906738, "global_step": 122062, "epoch": 2906} {"train_loss": -6.451055526733398, "global_step": 122063, "epoch": 2906} {"train_loss": -6.534046173095703, "global_step": 122064, "epoch": 2906} {"train_loss": -6.548422336578369, "global_step": 122065, "epoch": 2906} {"train_loss": -6.509494781494141, "global_step": 122066, "epoch": 2906} {"train_loss": -6.622426986694336, "global_step": 122067, "epoch": 2906} {"train_loss": -6.478115558624268, "global_step": 122068, "epoch": 2906} {"train_loss": -6.620921611785889, "global_step": 122069, "epoch": 2906} {"train_loss": -6.597545623779297, "global_step": 122070, "epoch": 2906} {"train_loss": -6.644292831420898, "global_step": 122071, "epoch": 2906} {"train_loss": -6.525632858276367, "global_step": 122072, "epoch": 2906} {"train_loss": -6.446074962615967, "global_step": 122073, "epoch": 2906} {"train_loss": -6.619166374206543, "global_step": 122074, "epoch": 2906} {"train_loss": -6.535695552825928, "global_step": 122075, "epoch": 2906} {"train_loss": -6.49351692199707, "global_step": 122076, "epoch": 2906} {"train_loss": -6.506396770477295, "global_step": 122077, "epoch": 2906} {"train_loss": -6.561728477478027, "global_step": 122078, "epoch": 2906} {"train_loss": -6.528309345245361, "global_step": 122079, "epoch": 2906} {"train_loss": -6.525669097900391, "global_step": 122080, "epoch": 2906} {"train_loss": -6.614076137542725, "global_step": 122081, "epoch": 2906} {"train_loss": -6.562829971313477, "global_step": 122082, "epoch": 2906} {"train_loss": -6.500382900238037, "global_step": 122083, "epoch": 2906} {"train_loss": -6.615627765655518, "global_step": 122084, "epoch": 2906} {"train_loss": -6.462489128112793, "global_step": 122085, "epoch": 2906} {"train_loss": -6.5448150634765625, "global_step": 122086, "epoch": 2906} {"train_loss": -6.606472015380859, "global_step": 122087, "epoch": 2906} {"train_loss": -6.514477729797363, "global_step": 122088, "epoch": 2906} {"train_loss": -6.571235656738281, "global_step": 122089, "epoch": 2906} {"train_loss": -6.488439559936523, "global_step": 122090, "epoch": 2906} {"train_loss": -6.459497451782227, "global_step": 122091, "epoch": 2906} {"train_loss": -6.50705099105835, "global_step": 122092, "epoch": 2906} {"train_loss": -6.552198092142741, "global_step": 122093, "epoch": 2906, "val_loss": 77252.5859375} {"train_loss": -6.571347236633301, "global_step": 122094, "epoch": 2907} {"train_loss": -6.606781005859375, "global_step": 122095, "epoch": 2907} {"train_loss": -6.596192359924316, "global_step": 122096, "epoch": 2907} {"train_loss": -6.536857604980469, "global_step": 122097, "epoch": 2907} {"train_loss": -6.571053504943848, "global_step": 122098, "epoch": 2907} {"train_loss": -6.620141983032227, "global_step": 122099, "epoch": 2907} {"train_loss": -6.570211410522461, "global_step": 122100, "epoch": 2907} {"train_loss": -6.557469844818115, "global_step": 122101, "epoch": 2907} {"train_loss": -6.536462306976318, "global_step": 122102, "epoch": 2907} {"train_loss": -6.639886856079102, "global_step": 122103, "epoch": 2907} {"train_loss": -6.498967170715332, "global_step": 122104, "epoch": 2907} {"train_loss": -6.674870014190674, "global_step": 122105, "epoch": 2907} {"train_loss": -6.660295486450195, "global_step": 122106, "epoch": 2907} {"train_loss": -6.631002426147461, "global_step": 122107, "epoch": 2907} {"train_loss": -6.540523529052734, "global_step": 122108, "epoch": 2907} {"train_loss": -6.610342979431152, "global_step": 122109, "epoch": 2907} {"train_loss": -6.580170631408691, "global_step": 122110, "epoch": 2907} {"train_loss": -6.5972580909729, "global_step": 122111, "epoch": 2907} {"train_loss": -6.596376419067383, "global_step": 122112, "epoch": 2907} {"train_loss": -6.638826370239258, "global_step": 122113, "epoch": 2907} {"train_loss": -6.576974868774414, "global_step": 122114, "epoch": 2907} {"train_loss": -6.611657619476318, "global_step": 122115, "epoch": 2907} {"train_loss": -6.665124416351318, "global_step": 122116, "epoch": 2907} {"train_loss": -6.581726551055908, "global_step": 122117, "epoch": 2907} {"train_loss": -6.6376633644104, "global_step": 122118, "epoch": 2907} {"train_loss": -6.603271484375, "global_step": 122119, "epoch": 2907} {"train_loss": -6.532711029052734, "global_step": 122120, "epoch": 2907} {"train_loss": -6.570314884185791, "global_step": 122121, "epoch": 2907} {"train_loss": -6.675497055053711, "global_step": 122122, "epoch": 2907} {"train_loss": -6.553894996643066, "global_step": 122123, "epoch": 2907} {"train_loss": -6.591097354888916, "global_step": 122124, "epoch": 2907} {"train_loss": -6.742816925048828, "global_step": 122125, "epoch": 2907} {"train_loss": -6.615495681762695, "global_step": 122126, "epoch": 2907} {"train_loss": -6.689129829406738, "global_step": 122127, "epoch": 2907} {"train_loss": -6.822410583496094, "global_step": 122128, "epoch": 2907} {"train_loss": -6.630666255950928, "global_step": 122129, "epoch": 2907} {"train_loss": -6.5445966720581055, "global_step": 122130, "epoch": 2907} {"train_loss": -6.613869667053223, "global_step": 122131, "epoch": 2907} {"train_loss": -6.632755756378174, "global_step": 122132, "epoch": 2907} {"train_loss": -6.6647844314575195, "global_step": 122133, "epoch": 2907} {"train_loss": -6.5457868576049805, "global_step": 122134, "epoch": 2907} {"train_loss": -6.608193715413411, "global_step": 122135, "epoch": 2907, "val_loss": 76787.6328125} {"train_loss": -6.638069152832031, "global_step": 122136, "epoch": 2908} {"train_loss": -6.626762390136719, "global_step": 122137, "epoch": 2908} {"train_loss": -6.570006370544434, "global_step": 122138, "epoch": 2908} {"train_loss": -6.587220191955566, "global_step": 122139, "epoch": 2908} {"train_loss": -6.5824360847473145, "global_step": 122140, "epoch": 2908} {"train_loss": -6.7234416007995605, "global_step": 122141, "epoch": 2908} {"train_loss": -6.591394424438477, "global_step": 122142, "epoch": 2908} {"train_loss": -6.5979228019714355, "global_step": 122143, "epoch": 2908} {"train_loss": -6.64825439453125, "global_step": 122144, "epoch": 2908} {"train_loss": -6.685358047485352, "global_step": 122145, "epoch": 2908} {"train_loss": -6.53556489944458, "global_step": 122146, "epoch": 2908} {"train_loss": -6.64381217956543, "global_step": 122147, "epoch": 2908} {"train_loss": -6.586332321166992, "global_step": 122148, "epoch": 2908} {"train_loss": -6.671997547149658, "global_step": 122149, "epoch": 2908} {"train_loss": -6.572843551635742, "global_step": 122150, "epoch": 2908} {"train_loss": -6.6614580154418945, "global_step": 122151, "epoch": 2908} {"train_loss": -6.5831074714660645, "global_step": 122152, "epoch": 2908} {"train_loss": -6.596398830413818, "global_step": 122153, "epoch": 2908} {"train_loss": -6.733523845672607, "global_step": 122154, "epoch": 2908} {"train_loss": -6.425478458404541, "global_step": 122155, "epoch": 2908} {"train_loss": -6.525815010070801, "global_step": 122156, "epoch": 2908} {"train_loss": -6.5294013023376465, "global_step": 122157, "epoch": 2908} {"train_loss": -6.3922119140625, "global_step": 122158, "epoch": 2908} {"train_loss": -6.595767974853516, "global_step": 122159, "epoch": 2908} {"train_loss": -6.567776203155518, "global_step": 122160, "epoch": 2908} {"train_loss": -6.529427528381348, "global_step": 122161, "epoch": 2908} {"train_loss": -6.497775077819824, "global_step": 122162, "epoch": 2908} {"train_loss": -6.517380714416504, "global_step": 122163, "epoch": 2908} {"train_loss": -6.448822975158691, "global_step": 122164, "epoch": 2908} {"train_loss": -6.595061302185059, "global_step": 122165, "epoch": 2908} {"train_loss": -6.460748672485352, "global_step": 122166, "epoch": 2908} {"train_loss": -6.598970413208008, "global_step": 122167, "epoch": 2908} {"train_loss": -6.47896671295166, "global_step": 122168, "epoch": 2908} {"train_loss": -6.501878261566162, "global_step": 122169, "epoch": 2908} {"train_loss": -6.4723920822143555, "global_step": 122170, "epoch": 2908} {"train_loss": -6.5618486404418945, "global_step": 122171, "epoch": 2908} {"train_loss": -6.455655574798584, "global_step": 122172, "epoch": 2908} {"train_loss": -6.578305244445801, "global_step": 122173, "epoch": 2908} {"train_loss": -6.495659351348877, "global_step": 122174, "epoch": 2908} {"train_loss": -6.436122894287109, "global_step": 122175, "epoch": 2908} {"train_loss": -6.491498947143555, "global_step": 122176, "epoch": 2908} {"train_loss": -6.5602064700353715, "global_step": 122177, "epoch": 2908, "val_loss": 77222.9453125} {"train_loss": -6.587102890014648, "global_step": 122178, "epoch": 2909} {"train_loss": -6.552828788757324, "global_step": 122179, "epoch": 2909} {"train_loss": -6.507286071777344, "global_step": 122180, "epoch": 2909} {"train_loss": -6.539921760559082, "global_step": 122181, "epoch": 2909} {"train_loss": -6.583461761474609, "global_step": 122182, "epoch": 2909} {"train_loss": -6.476595401763916, "global_step": 122183, "epoch": 2909} {"train_loss": -6.562928199768066, "global_step": 122184, "epoch": 2909} {"train_loss": -6.529808044433594, "global_step": 122185, "epoch": 2909} {"train_loss": -6.52847957611084, "global_step": 122186, "epoch": 2909} {"train_loss": -6.570187568664551, "global_step": 122187, "epoch": 2909} {"train_loss": -6.555861473083496, "global_step": 122188, "epoch": 2909} {"train_loss": -6.576703071594238, "global_step": 122189, "epoch": 2909} {"train_loss": -6.488690376281738, "global_step": 122190, "epoch": 2909} {"train_loss": -6.674104690551758, "global_step": 122191, "epoch": 2909} {"train_loss": -6.593687057495117, "global_step": 122192, "epoch": 2909} {"train_loss": -6.642391204833984, "global_step": 122193, "epoch": 2909} {"train_loss": -6.567821979522705, "global_step": 122194, "epoch": 2909} {"train_loss": -6.499082088470459, "global_step": 122195, "epoch": 2909} {"train_loss": -6.5909504890441895, "global_step": 122196, "epoch": 2909} {"train_loss": -6.474127769470215, "global_step": 122197, "epoch": 2909} {"train_loss": -6.645407199859619, "global_step": 122198, "epoch": 2909} {"train_loss": -6.659875869750977, "global_step": 122199, "epoch": 2909} {"train_loss": -6.608406066894531, "global_step": 122200, "epoch": 2909} {"train_loss": -6.685349464416504, "global_step": 122201, "epoch": 2909} {"train_loss": -6.750522613525391, "global_step": 122202, "epoch": 2909} {"train_loss": -6.583767890930176, "global_step": 122203, "epoch": 2909} {"train_loss": -6.6296586990356445, "global_step": 122204, "epoch": 2909} {"train_loss": -6.656792163848877, "global_step": 122205, "epoch": 2909} {"train_loss": -6.712502956390381, "global_step": 122206, "epoch": 2909} {"train_loss": -6.5083537101745605, "global_step": 122207, "epoch": 2909} {"train_loss": -6.626936435699463, "global_step": 122208, "epoch": 2909} {"train_loss": -6.68937349319458, "global_step": 122209, "epoch": 2909} {"train_loss": -6.5985493659973145, "global_step": 122210, "epoch": 2909} {"train_loss": -6.631834983825684, "global_step": 122211, "epoch": 2909} {"train_loss": -6.480990409851074, "global_step": 122212, "epoch": 2909} {"train_loss": -6.53523588180542, "global_step": 122213, "epoch": 2909} {"train_loss": -6.486832141876221, "global_step": 122214, "epoch": 2909} {"train_loss": -6.5750322341918945, "global_step": 122215, "epoch": 2909} {"train_loss": -6.460690975189209, "global_step": 122216, "epoch": 2909} {"train_loss": -6.473124027252197, "global_step": 122217, "epoch": 2909} {"train_loss": -6.590989112854004, "global_step": 122218, "epoch": 2909} {"train_loss": -6.578067370823452, "global_step": 122219, "epoch": 2909, "val_loss": 77267.1875} {"train_loss": -6.637212753295898, "global_step": 122220, "epoch": 2910} {"train_loss": -6.568373680114746, "global_step": 122221, "epoch": 2910} {"train_loss": -6.625181198120117, "global_step": 122222, "epoch": 2910} {"train_loss": -6.5920562744140625, "global_step": 122223, "epoch": 2910} {"train_loss": -6.553382873535156, "global_step": 122224, "epoch": 2910} {"train_loss": -6.597532749176025, "global_step": 122225, "epoch": 2910} {"train_loss": -6.5858917236328125, "global_step": 122226, "epoch": 2910} {"train_loss": -6.625812530517578, "global_step": 122227, "epoch": 2910} {"train_loss": -6.6014580726623535, "global_step": 122228, "epoch": 2910} {"train_loss": -6.654285430908203, "global_step": 122229, "epoch": 2910} {"train_loss": -6.473849773406982, "global_step": 122230, "epoch": 2910} {"train_loss": -6.536218166351318, "global_step": 122231, "epoch": 2910} {"train_loss": -6.444783687591553, "global_step": 122232, "epoch": 2910} {"train_loss": -6.552712917327881, "global_step": 122233, "epoch": 2910} {"train_loss": -6.5827717781066895, "global_step": 122234, "epoch": 2910} {"train_loss": -6.600842475891113, "global_step": 122235, "epoch": 2910} {"train_loss": -6.637186050415039, "global_step": 122236, "epoch": 2910} {"train_loss": -6.421539306640625, "global_step": 122237, "epoch": 2910} {"train_loss": -6.545920372009277, "global_step": 122238, "epoch": 2910} {"train_loss": -6.6247878074646, "global_step": 122239, "epoch": 2910} {"train_loss": -6.570637226104736, "global_step": 122240, "epoch": 2910} {"train_loss": -6.534008026123047, "global_step": 122241, "epoch": 2910} {"train_loss": -6.510220050811768, "global_step": 122242, "epoch": 2910} {"train_loss": -6.535924911499023, "global_step": 122243, "epoch": 2910} {"train_loss": -6.565788269042969, "global_step": 122244, "epoch": 2910} {"train_loss": -6.516537666320801, "global_step": 122245, "epoch": 2910} {"train_loss": -6.3772478103637695, "global_step": 122246, "epoch": 2910} {"train_loss": -6.572497844696045, "global_step": 122247, "epoch": 2910} {"train_loss": -6.540800094604492, "global_step": 122248, "epoch": 2910} {"train_loss": -6.529536247253418, "global_step": 122249, "epoch": 2910} {"train_loss": -6.522027969360352, "global_step": 122250, "epoch": 2910} {"train_loss": -6.441433906555176, "global_step": 122251, "epoch": 2910} {"train_loss": -6.549130439758301, "global_step": 122252, "epoch": 2910} {"train_loss": -6.435215950012207, "global_step": 122253, "epoch": 2910} {"train_loss": -6.536134719848633, "global_step": 122254, "epoch": 2910} {"train_loss": -6.661447048187256, "global_step": 122255, "epoch": 2910} {"train_loss": -6.33005428314209, "global_step": 122256, "epoch": 2910} {"train_loss": -6.5768632888793945, "global_step": 122257, "epoch": 2910} {"train_loss": -6.4475603103637695, "global_step": 122258, "epoch": 2910} {"train_loss": -6.468954086303711, "global_step": 122259, "epoch": 2910} {"train_loss": -6.53650426864624, "global_step": 122260, "epoch": 2910} {"train_loss": -6.54066336722601, "global_step": 122261, "epoch": 2910, "val_loss": 76784.2109375} {"train_loss": -6.712043762207031, "global_step": 122262, "epoch": 2911} {"train_loss": -6.4557061195373535, "global_step": 122263, "epoch": 2911} {"train_loss": -6.472273826599121, "global_step": 122264, "epoch": 2911} {"train_loss": -6.507882118225098, "global_step": 122265, "epoch": 2911} {"train_loss": -6.55734920501709, "global_step": 122266, "epoch": 2911} {"train_loss": -6.590437889099121, "global_step": 122267, "epoch": 2911} {"train_loss": -6.4937005043029785, "global_step": 122268, "epoch": 2911} {"train_loss": -6.550848007202148, "global_step": 122269, "epoch": 2911} {"train_loss": -6.525997638702393, "global_step": 122270, "epoch": 2911} {"train_loss": -6.5418596267700195, "global_step": 122271, "epoch": 2911} {"train_loss": -6.585503101348877, "global_step": 122272, "epoch": 2911} {"train_loss": -6.475826263427734, "global_step": 122273, "epoch": 2911} {"train_loss": -6.586007595062256, "global_step": 122274, "epoch": 2911} {"train_loss": -6.4877238273620605, "global_step": 122275, "epoch": 2911} {"train_loss": -6.629085540771484, "global_step": 122276, "epoch": 2911} {"train_loss": -6.5333943367004395, "global_step": 122277, "epoch": 2911} {"train_loss": -6.634653091430664, "global_step": 122278, "epoch": 2911} {"train_loss": -6.672057151794434, "global_step": 122279, "epoch": 2911} {"train_loss": -6.558575630187988, "global_step": 122280, "epoch": 2911} {"train_loss": -6.606177806854248, "global_step": 122281, "epoch": 2911} {"train_loss": -6.59498405456543, "global_step": 122282, "epoch": 2911} {"train_loss": -6.596708297729492, "global_step": 122283, "epoch": 2911} {"train_loss": -6.644923210144043, "global_step": 122284, "epoch": 2911} {"train_loss": -6.543195724487305, "global_step": 122285, "epoch": 2911} {"train_loss": -6.5376505851745605, "global_step": 122286, "epoch": 2911} {"train_loss": -6.560640335083008, "global_step": 122287, "epoch": 2911} {"train_loss": -6.524713516235352, "global_step": 122288, "epoch": 2911} {"train_loss": -6.5197954177856445, "global_step": 122289, "epoch": 2911} {"train_loss": -6.585938453674316, "global_step": 122290, "epoch": 2911} {"train_loss": -6.5025739669799805, "global_step": 122291, "epoch": 2911} {"train_loss": -6.442230224609375, "global_step": 122292, "epoch": 2911} {"train_loss": -6.650603771209717, "global_step": 122293, "epoch": 2911} {"train_loss": -6.428565979003906, "global_step": 122294, "epoch": 2911} {"train_loss": -6.52827262878418, "global_step": 122295, "epoch": 2911} {"train_loss": -6.594039440155029, "global_step": 122296, "epoch": 2911} {"train_loss": -6.649164199829102, "global_step": 122297, "epoch": 2911} {"train_loss": -6.577948570251465, "global_step": 122298, "epoch": 2911} {"train_loss": -6.673133373260498, "global_step": 122299, "epoch": 2911} {"train_loss": -6.513729572296143, "global_step": 122300, "epoch": 2911} {"train_loss": -6.611249923706055, "global_step": 122301, "epoch": 2911} {"train_loss": -6.596695423126221, "global_step": 122302, "epoch": 2911} {"train_loss": -6.564813227880569, "global_step": 122303, "epoch": 2911, "val_loss": 76972.453125} {"train_loss": -6.592529296875, "global_step": 122304, "epoch": 2912} {"train_loss": -6.379842758178711, "global_step": 122305, "epoch": 2912} {"train_loss": -6.595577239990234, "global_step": 122306, "epoch": 2912} {"train_loss": -6.6419525146484375, "global_step": 122307, "epoch": 2912} {"train_loss": -6.52801513671875, "global_step": 122308, "epoch": 2912} {"train_loss": -6.517135143280029, "global_step": 122309, "epoch": 2912} {"train_loss": -6.505520820617676, "global_step": 122310, "epoch": 2912} {"train_loss": -6.5399885177612305, "global_step": 122311, "epoch": 2912} {"train_loss": -6.704805374145508, "global_step": 122312, "epoch": 2912} {"train_loss": -6.567038536071777, "global_step": 122313, "epoch": 2912} {"train_loss": -6.696850776672363, "global_step": 122314, "epoch": 2912} {"train_loss": -6.572226524353027, "global_step": 122315, "epoch": 2912} {"train_loss": -6.53572416305542, "global_step": 122316, "epoch": 2912} {"train_loss": -6.633658409118652, "global_step": 122317, "epoch": 2912} {"train_loss": -6.468321800231934, "global_step": 122318, "epoch": 2912} {"train_loss": -6.59647274017334, "global_step": 122319, "epoch": 2912} {"train_loss": -6.5709428787231445, "global_step": 122320, "epoch": 2912} {"train_loss": -6.642229080200195, "global_step": 122321, "epoch": 2912} {"train_loss": -6.510411262512207, "global_step": 122322, "epoch": 2912} {"train_loss": -6.48005485534668, "global_step": 122323, "epoch": 2912} {"train_loss": -6.606842041015625, "global_step": 122324, "epoch": 2912} {"train_loss": -6.591843605041504, "global_step": 122325, "epoch": 2912} {"train_loss": -6.521359443664551, "global_step": 122326, "epoch": 2912} {"train_loss": -6.474189281463623, "global_step": 122327, "epoch": 2912} {"train_loss": -6.6595001220703125, "global_step": 122328, "epoch": 2912} {"train_loss": -6.563777923583984, "global_step": 122329, "epoch": 2912} {"train_loss": -6.714845657348633, "global_step": 122330, "epoch": 2912} {"train_loss": -6.649559020996094, "global_step": 122331, "epoch": 2912} {"train_loss": -6.6635212898254395, "global_step": 122332, "epoch": 2912} {"train_loss": -6.654101371765137, "global_step": 122333, "epoch": 2912} {"train_loss": -6.613646984100342, "global_step": 122334, "epoch": 2912} {"train_loss": -6.654076099395752, "global_step": 122335, "epoch": 2912} {"train_loss": -6.6775126457214355, "global_step": 122336, "epoch": 2912} {"train_loss": -6.716188430786133, "global_step": 122337, "epoch": 2912} {"train_loss": -6.607691764831543, "global_step": 122338, "epoch": 2912} {"train_loss": -6.6006574630737305, "global_step": 122339, "epoch": 2912} {"train_loss": -6.651362419128418, "global_step": 122340, "epoch": 2912} {"train_loss": -6.597326278686523, "global_step": 122341, "epoch": 2912} {"train_loss": -6.606210708618164, "global_step": 122342, "epoch": 2912} {"train_loss": -6.603696346282959, "global_step": 122343, "epoch": 2912} {"train_loss": -6.582979679107666, "global_step": 122344, "epoch": 2912} {"train_loss": -6.592869667779832, "global_step": 122345, "epoch": 2912, "val_loss": 76804.9921875} {"train_loss": -6.634111404418945, "global_step": 122346, "epoch": 2913} {"train_loss": -6.663358688354492, "global_step": 122347, "epoch": 2913} {"train_loss": -6.730136871337891, "global_step": 122348, "epoch": 2913} {"train_loss": -6.766278266906738, "global_step": 122349, "epoch": 2913} {"train_loss": -6.585366249084473, "global_step": 122350, "epoch": 2913} {"train_loss": -6.663975715637207, "global_step": 122351, "epoch": 2913} {"train_loss": -6.584423065185547, "global_step": 122352, "epoch": 2913} {"train_loss": -6.55352783203125, "global_step": 122353, "epoch": 2913} {"train_loss": -6.579493522644043, "global_step": 122354, "epoch": 2913} {"train_loss": -6.70843505859375, "global_step": 122355, "epoch": 2913} {"train_loss": -6.695491313934326, "global_step": 122356, "epoch": 2913} {"train_loss": -6.6116437911987305, "global_step": 122357, "epoch": 2913} {"train_loss": -6.694954872131348, "global_step": 122358, "epoch": 2913} {"train_loss": -6.664559364318848, "global_step": 122359, "epoch": 2913} {"train_loss": -6.566046714782715, "global_step": 122360, "epoch": 2913} {"train_loss": -6.685420989990234, "global_step": 122361, "epoch": 2913} {"train_loss": -6.537651538848877, "global_step": 122362, "epoch": 2913} {"train_loss": -6.572159767150879, "global_step": 122363, "epoch": 2913} {"train_loss": -6.467550754547119, "global_step": 122364, "epoch": 2913} {"train_loss": -6.643733501434326, "global_step": 122365, "epoch": 2913} {"train_loss": -6.587222099304199, "global_step": 122366, "epoch": 2913} {"train_loss": -6.504729270935059, "global_step": 122367, "epoch": 2913} {"train_loss": -6.5776896476745605, "global_step": 122368, "epoch": 2913} {"train_loss": -6.461352348327637, "global_step": 122369, "epoch": 2913} {"train_loss": -6.3452558517456055, "global_step": 122370, "epoch": 2913} {"train_loss": -6.600405693054199, "global_step": 122371, "epoch": 2913} {"train_loss": -6.472995758056641, "global_step": 122372, "epoch": 2913} {"train_loss": -6.5017781257629395, "global_step": 122373, "epoch": 2913} {"train_loss": -6.552066802978516, "global_step": 122374, "epoch": 2913} {"train_loss": -6.485551357269287, "global_step": 122375, "epoch": 2913} {"train_loss": -6.4110565185546875, "global_step": 122376, "epoch": 2913} {"train_loss": -6.481959342956543, "global_step": 122377, "epoch": 2913} {"train_loss": -6.350893020629883, "global_step": 122378, "epoch": 2913} {"train_loss": -6.3463568687438965, "global_step": 122379, "epoch": 2913} {"train_loss": -6.532482147216797, "global_step": 122380, "epoch": 2913} {"train_loss": -6.331376552581787, "global_step": 122381, "epoch": 2913} {"train_loss": -6.433443069458008, "global_step": 122382, "epoch": 2913} {"train_loss": -6.44487190246582, "global_step": 122383, "epoch": 2913} {"train_loss": -6.393759727478027, "global_step": 122384, "epoch": 2913} {"train_loss": -6.572279453277588, "global_step": 122385, "epoch": 2913} {"train_loss": -6.501840114593506, "global_step": 122386, "epoch": 2913} {"train_loss": -6.548772868655977, "global_step": 122387, "epoch": 2913, "val_loss": 76982.0625} {"train_loss": -6.4651594161987305, "global_step": 122388, "epoch": 2914} {"train_loss": -6.490318298339844, "global_step": 122389, "epoch": 2914} {"train_loss": -6.626757621765137, "global_step": 122390, "epoch": 2914} {"train_loss": -6.386157035827637, "global_step": 122391, "epoch": 2914} {"train_loss": -6.467288494110107, "global_step": 122392, "epoch": 2914} {"train_loss": -6.626725196838379, "global_step": 122393, "epoch": 2914} {"train_loss": -6.590649604797363, "global_step": 122394, "epoch": 2914} {"train_loss": -6.590741157531738, "global_step": 122395, "epoch": 2914} {"train_loss": -6.610770225524902, "global_step": 122396, "epoch": 2914} {"train_loss": -6.5981292724609375, "global_step": 122397, "epoch": 2914} {"train_loss": -6.633938789367676, "global_step": 122398, "epoch": 2914} {"train_loss": -6.430185794830322, "global_step": 122399, "epoch": 2914} {"train_loss": -6.6463422775268555, "global_step": 122400, "epoch": 2914} {"train_loss": -6.519569396972656, "global_step": 122401, "epoch": 2914} {"train_loss": -6.4950761795043945, "global_step": 122402, "epoch": 2914} {"train_loss": -6.576622486114502, "global_step": 122403, "epoch": 2914} {"train_loss": -6.586857795715332, "global_step": 122404, "epoch": 2914} {"train_loss": -6.37797737121582, "global_step": 122405, "epoch": 2914} {"train_loss": -6.474852561950684, "global_step": 122406, "epoch": 2914} {"train_loss": -6.589989185333252, "global_step": 122407, "epoch": 2914} {"train_loss": -6.6189165115356445, "global_step": 122408, "epoch": 2914} {"train_loss": -6.56813907623291, "global_step": 122409, "epoch": 2914} {"train_loss": -6.585369110107422, "global_step": 122410, "epoch": 2914} {"train_loss": -6.589474201202393, "global_step": 122411, "epoch": 2914} {"train_loss": -6.516026496887207, "global_step": 122412, "epoch": 2914} {"train_loss": -6.461518287658691, "global_step": 122413, "epoch": 2914} {"train_loss": -6.572279453277588, "global_step": 122414, "epoch": 2914} {"train_loss": -6.483760356903076, "global_step": 122415, "epoch": 2914} {"train_loss": -6.721210479736328, "global_step": 122416, "epoch": 2914} {"train_loss": -6.421756744384766, "global_step": 122417, "epoch": 2914} {"train_loss": -6.478863716125488, "global_step": 122418, "epoch": 2914} {"train_loss": -6.555109024047852, "global_step": 122419, "epoch": 2914} {"train_loss": -6.501939296722412, "global_step": 122420, "epoch": 2914} {"train_loss": -6.607005596160889, "global_step": 122421, "epoch": 2914} {"train_loss": -6.555284023284912, "global_step": 122422, "epoch": 2914} {"train_loss": -6.584864616394043, "global_step": 122423, "epoch": 2914} {"train_loss": -6.647652626037598, "global_step": 122424, "epoch": 2914} {"train_loss": -6.646870136260986, "global_step": 122425, "epoch": 2914} {"train_loss": -6.678643703460693, "global_step": 122426, "epoch": 2914} {"train_loss": -6.5564446449279785, "global_step": 122427, "epoch": 2914} {"train_loss": -6.676974296569824, "global_step": 122428, "epoch": 2914} {"train_loss": -6.555971713293166, "global_step": 122429, "epoch": 2914, "val_loss": 76974.0078125} {"train_loss": -6.608335971832275, "global_step": 122430, "epoch": 2915} {"train_loss": -6.650548934936523, "global_step": 122431, "epoch": 2915} {"train_loss": -6.615512371063232, "global_step": 122432, "epoch": 2915} {"train_loss": -6.624964714050293, "global_step": 122433, "epoch": 2915} {"train_loss": -6.573208808898926, "global_step": 122434, "epoch": 2915} {"train_loss": -6.653444290161133, "global_step": 122435, "epoch": 2915} {"train_loss": -6.529031753540039, "global_step": 122436, "epoch": 2915} {"train_loss": -6.642744541168213, "global_step": 122437, "epoch": 2915} {"train_loss": -6.513358116149902, "global_step": 122438, "epoch": 2915} {"train_loss": -6.549522399902344, "global_step": 122439, "epoch": 2915} {"train_loss": -6.577340126037598, "global_step": 122440, "epoch": 2915} {"train_loss": -6.628270626068115, "global_step": 122441, "epoch": 2915} {"train_loss": -6.727245330810547, "global_step": 122442, "epoch": 2915} {"train_loss": -6.544467926025391, "global_step": 122443, "epoch": 2915} {"train_loss": -6.756861686706543, "global_step": 122444, "epoch": 2915} {"train_loss": -6.5590715408325195, "global_step": 122445, "epoch": 2915} {"train_loss": -6.661734104156494, "global_step": 122446, "epoch": 2915} {"train_loss": -6.609580039978027, "global_step": 122447, "epoch": 2915} {"train_loss": -6.5922112464904785, "global_step": 122448, "epoch": 2915} {"train_loss": -6.750181674957275, "global_step": 122449, "epoch": 2915} {"train_loss": -6.6217041015625, "global_step": 122450, "epoch": 2915} {"train_loss": -6.47055721282959, "global_step": 122451, "epoch": 2915} {"train_loss": -6.691175937652588, "global_step": 122452, "epoch": 2915} {"train_loss": -6.714182376861572, "global_step": 122453, "epoch": 2915} {"train_loss": -6.544524669647217, "global_step": 122454, "epoch": 2915} {"train_loss": -6.625915050506592, "global_step": 122455, "epoch": 2915} {"train_loss": -6.654563903808594, "global_step": 122456, "epoch": 2915} {"train_loss": -6.706606388092041, "global_step": 122457, "epoch": 2915} {"train_loss": -6.720149040222168, "global_step": 122458, "epoch": 2915} {"train_loss": -6.58162260055542, "global_step": 122459, "epoch": 2915} {"train_loss": -6.60918664932251, "global_step": 122460, "epoch": 2915} {"train_loss": -6.50560188293457, "global_step": 122461, "epoch": 2915} {"train_loss": -6.6426286697387695, "global_step": 122462, "epoch": 2915} {"train_loss": -6.527851104736328, "global_step": 122463, "epoch": 2915} {"train_loss": -6.678093910217285, "global_step": 122464, "epoch": 2915} {"train_loss": -6.577511787414551, "global_step": 122465, "epoch": 2915} {"train_loss": -6.653277397155762, "global_step": 122466, "epoch": 2915} {"train_loss": -6.517766952514648, "global_step": 122467, "epoch": 2915} {"train_loss": -6.510355472564697, "global_step": 122468, "epoch": 2915} {"train_loss": -6.557341575622559, "global_step": 122469, "epoch": 2915} {"train_loss": -6.635958671569824, "global_step": 122470, "epoch": 2915} {"train_loss": -6.612737905411493, "global_step": 122471, "epoch": 2915, "val_loss": 77022.3515625} {"train_loss": -6.6866679191589355, "global_step": 122472, "epoch": 2916} {"train_loss": -6.5075554847717285, "global_step": 122473, "epoch": 2916} {"train_loss": -6.538215637207031, "global_step": 122474, "epoch": 2916} {"train_loss": -6.61684513092041, "global_step": 122475, "epoch": 2916} {"train_loss": -6.611198425292969, "global_step": 122476, "epoch": 2916} {"train_loss": -6.467423439025879, "global_step": 122477, "epoch": 2916} {"train_loss": -6.7206830978393555, "global_step": 122478, "epoch": 2916} {"train_loss": -6.612514495849609, "global_step": 122479, "epoch": 2916} {"train_loss": -6.529139995574951, "global_step": 122480, "epoch": 2916} {"train_loss": -6.67875862121582, "global_step": 122481, "epoch": 2916} {"train_loss": -6.633728504180908, "global_step": 122482, "epoch": 2916} {"train_loss": -6.489541053771973, "global_step": 122483, "epoch": 2916} {"train_loss": -6.573869228363037, "global_step": 122484, "epoch": 2916} {"train_loss": -6.521693229675293, "global_step": 122485, "epoch": 2916} {"train_loss": -6.535462379455566, "global_step": 122486, "epoch": 2916} {"train_loss": -6.497214317321777, "global_step": 122487, "epoch": 2916} {"train_loss": -6.536746978759766, "global_step": 122488, "epoch": 2916} {"train_loss": -6.515955448150635, "global_step": 122489, "epoch": 2916} {"train_loss": -6.56118106842041, "global_step": 122490, "epoch": 2916} {"train_loss": -6.579390048980713, "global_step": 122491, "epoch": 2916} {"train_loss": -6.5679612159729, "global_step": 122492, "epoch": 2916} {"train_loss": -6.444991588592529, "global_step": 122493, "epoch": 2916} {"train_loss": -6.572805404663086, "global_step": 122494, "epoch": 2916} {"train_loss": -6.706624507904053, "global_step": 122495, "epoch": 2916} {"train_loss": -6.531723499298096, "global_step": 122496, "epoch": 2916} {"train_loss": -6.568524360656738, "global_step": 122497, "epoch": 2916} {"train_loss": -6.5136871337890625, "global_step": 122498, "epoch": 2916} {"train_loss": -6.645400047302246, "global_step": 122499, "epoch": 2916} {"train_loss": -6.658414840698242, "global_step": 122500, "epoch": 2916} {"train_loss": -6.576350212097168, "global_step": 122501, "epoch": 2916} {"train_loss": -6.580282688140869, "global_step": 122502, "epoch": 2916} {"train_loss": -6.464845180511475, "global_step": 122503, "epoch": 2916} {"train_loss": -6.604659080505371, "global_step": 122504, "epoch": 2916} {"train_loss": -6.585938453674316, "global_step": 122505, "epoch": 2916} {"train_loss": -6.683498382568359, "global_step": 122506, "epoch": 2916} {"train_loss": -6.651636123657227, "global_step": 122507, "epoch": 2916} {"train_loss": -6.687185764312744, "global_step": 122508, "epoch": 2916} {"train_loss": -6.639974594116211, "global_step": 122509, "epoch": 2916} {"train_loss": -6.669360160827637, "global_step": 122510, "epoch": 2916} {"train_loss": -6.673084259033203, "global_step": 122511, "epoch": 2916} {"train_loss": -6.6617937088012695, "global_step": 122512, "epoch": 2916} {"train_loss": -6.588114477339245, "global_step": 122513, "epoch": 2916, "val_loss": 76967.3125} {"train_loss": -6.61217737197876, "global_step": 122514, "epoch": 2917} {"train_loss": -6.7180633544921875, "global_step": 122515, "epoch": 2917} {"train_loss": -6.597795486450195, "global_step": 122516, "epoch": 2917} {"train_loss": -6.563004493713379, "global_step": 122517, "epoch": 2917} {"train_loss": -6.5410919189453125, "global_step": 122518, "epoch": 2917} {"train_loss": -6.604938983917236, "global_step": 122519, "epoch": 2917} {"train_loss": -6.576222896575928, "global_step": 122520, "epoch": 2917} {"train_loss": -6.551605224609375, "global_step": 122521, "epoch": 2917} {"train_loss": -6.5632853507995605, "global_step": 122522, "epoch": 2917} {"train_loss": -6.691671848297119, "global_step": 122523, "epoch": 2917} {"train_loss": -6.578263759613037, "global_step": 122524, "epoch": 2917} {"train_loss": -6.527939796447754, "global_step": 122525, "epoch": 2917} {"train_loss": -6.523313522338867, "global_step": 122526, "epoch": 2917} {"train_loss": -6.550260543823242, "global_step": 122527, "epoch": 2917} {"train_loss": -6.6489973068237305, "global_step": 122528, "epoch": 2917} {"train_loss": -6.448556900024414, "global_step": 122529, "epoch": 2917} {"train_loss": -6.577240943908691, "global_step": 122530, "epoch": 2917} {"train_loss": -6.445294380187988, "global_step": 122531, "epoch": 2917} {"train_loss": -6.544933795928955, "global_step": 122532, "epoch": 2917} {"train_loss": -6.551871299743652, "global_step": 122533, "epoch": 2917} {"train_loss": -6.5479912757873535, "global_step": 122534, "epoch": 2917} {"train_loss": -6.484580993652344, "global_step": 122535, "epoch": 2917} {"train_loss": -6.531756401062012, "global_step": 122536, "epoch": 2917} {"train_loss": -6.635447025299072, "global_step": 122537, "epoch": 2917} {"train_loss": -6.4909234046936035, "global_step": 122538, "epoch": 2917} {"train_loss": -6.530184268951416, "global_step": 122539, "epoch": 2917} {"train_loss": -6.4132232666015625, "global_step": 122540, "epoch": 2917} {"train_loss": -6.475311279296875, "global_step": 122541, "epoch": 2917} {"train_loss": -6.4627861976623535, "global_step": 122542, "epoch": 2917} {"train_loss": -6.430794715881348, "global_step": 122543, "epoch": 2917} {"train_loss": -6.544370174407959, "global_step": 122544, "epoch": 2917} {"train_loss": -6.4184370040893555, "global_step": 122545, "epoch": 2917} {"train_loss": -6.597105503082275, "global_step": 122546, "epoch": 2917} {"train_loss": -6.568453311920166, "global_step": 122547, "epoch": 2917} {"train_loss": -6.651613235473633, "global_step": 122548, "epoch": 2917} {"train_loss": -6.505011081695557, "global_step": 122549, "epoch": 2917} {"train_loss": -6.58786153793335, "global_step": 122550, "epoch": 2917} {"train_loss": -6.610842704772949, "global_step": 122551, "epoch": 2917} {"train_loss": -6.535310745239258, "global_step": 122552, "epoch": 2917} {"train_loss": -6.6045942306518555, "global_step": 122553, "epoch": 2917} {"train_loss": -6.499207973480225, "global_step": 122554, "epoch": 2917} {"train_loss": -6.549714871815273, "global_step": 122555, "epoch": 2917, "val_loss": 76907.3359375} {"train_loss": -6.683503150939941, "global_step": 122556, "epoch": 2918} {"train_loss": -6.595114231109619, "global_step": 122557, "epoch": 2918} {"train_loss": -6.508683204650879, "global_step": 122558, "epoch": 2918} {"train_loss": -6.5824174880981445, "global_step": 122559, "epoch": 2918} {"train_loss": -6.615701675415039, "global_step": 122560, "epoch": 2918} {"train_loss": -6.617566108703613, "global_step": 122561, "epoch": 2918} {"train_loss": -6.656341552734375, "global_step": 122562, "epoch": 2918} {"train_loss": -6.5494279861450195, "global_step": 122563, "epoch": 2918} {"train_loss": -6.684156894683838, "global_step": 122564, "epoch": 2918} {"train_loss": -6.496285915374756, "global_step": 122565, "epoch": 2918} {"train_loss": -6.602333068847656, "global_step": 122566, "epoch": 2918} {"train_loss": -6.608541965484619, "global_step": 122567, "epoch": 2918} {"train_loss": -6.60767936706543, "global_step": 122568, "epoch": 2918} {"train_loss": -6.706088066101074, "global_step": 122569, "epoch": 2918} {"train_loss": -6.621849060058594, "global_step": 122570, "epoch": 2918} {"train_loss": -6.546003818511963, "global_step": 122571, "epoch": 2918} {"train_loss": -6.5249738693237305, "global_step": 122572, "epoch": 2918} {"train_loss": -6.579909324645996, "global_step": 122573, "epoch": 2918} {"train_loss": -6.694189548492432, "global_step": 122574, "epoch": 2918} {"train_loss": -6.608592987060547, "global_step": 122575, "epoch": 2918} {"train_loss": -6.645413398742676, "global_step": 122576, "epoch": 2918} {"train_loss": -6.572425365447998, "global_step": 122577, "epoch": 2918} {"train_loss": -6.495511054992676, "global_step": 122578, "epoch": 2918} {"train_loss": -6.672799587249756, "global_step": 122579, "epoch": 2918} {"train_loss": -6.56108283996582, "global_step": 122580, "epoch": 2918} {"train_loss": -6.57613468170166, "global_step": 122581, "epoch": 2918} {"train_loss": -6.648348808288574, "global_step": 122582, "epoch": 2918} {"train_loss": -6.581914901733398, "global_step": 122583, "epoch": 2918} {"train_loss": -6.549626350402832, "global_step": 122584, "epoch": 2918} {"train_loss": -6.629138946533203, "global_step": 122585, "epoch": 2918} {"train_loss": -6.4903082847595215, "global_step": 122586, "epoch": 2918} {"train_loss": -6.505243301391602, "global_step": 122587, "epoch": 2918} {"train_loss": -6.553906440734863, "global_step": 122588, "epoch": 2918} {"train_loss": -6.592386245727539, "global_step": 122589, "epoch": 2918} {"train_loss": -6.712068557739258, "global_step": 122590, "epoch": 2918} {"train_loss": -6.523552417755127, "global_step": 122591, "epoch": 2918} {"train_loss": -6.609586715698242, "global_step": 122592, "epoch": 2918} {"train_loss": -6.606591701507568, "global_step": 122593, "epoch": 2918} {"train_loss": -6.444469451904297, "global_step": 122594, "epoch": 2918} {"train_loss": -6.65074348449707, "global_step": 122595, "epoch": 2918} {"train_loss": -6.374438285827637, "global_step": 122596, "epoch": 2918} {"train_loss": -6.5842774368467785, "global_step": 122597, "epoch": 2918, "val_loss": 76773.140625} {"train_loss": -6.515442848205566, "global_step": 122598, "epoch": 2919} {"train_loss": -6.537529945373535, "global_step": 122599, "epoch": 2919} {"train_loss": -6.451391696929932, "global_step": 122600, "epoch": 2919} {"train_loss": -6.519461631774902, "global_step": 122601, "epoch": 2919} {"train_loss": -6.561105728149414, "global_step": 122602, "epoch": 2919} {"train_loss": -6.515863418579102, "global_step": 122603, "epoch": 2919} {"train_loss": -6.570072650909424, "global_step": 122604, "epoch": 2919} {"train_loss": -6.635376453399658, "global_step": 122605, "epoch": 2919} {"train_loss": -6.492081165313721, "global_step": 122606, "epoch": 2919} {"train_loss": -6.517436981201172, "global_step": 122607, "epoch": 2919} {"train_loss": -6.591592311859131, "global_step": 122608, "epoch": 2919} {"train_loss": -6.515169143676758, "global_step": 122609, "epoch": 2919} {"train_loss": -6.609292984008789, "global_step": 122610, "epoch": 2919} {"train_loss": -6.500365734100342, "global_step": 122611, "epoch": 2919} {"train_loss": -6.489354610443115, "global_step": 122612, "epoch": 2919} {"train_loss": -6.5574750900268555, "global_step": 122613, "epoch": 2919} {"train_loss": -6.545722961425781, "global_step": 122614, "epoch": 2919} {"train_loss": -6.574593544006348, "global_step": 122615, "epoch": 2919} {"train_loss": -6.550259590148926, "global_step": 122616, "epoch": 2919} {"train_loss": -6.630722999572754, "global_step": 122617, "epoch": 2919} {"train_loss": -6.75963020324707, "global_step": 122618, "epoch": 2919} {"train_loss": -6.52995491027832, "global_step": 122619, "epoch": 2919} {"train_loss": -6.628143787384033, "global_step": 122620, "epoch": 2919} {"train_loss": -6.656989097595215, "global_step": 122621, "epoch": 2919} {"train_loss": -6.59616756439209, "global_step": 122622, "epoch": 2919} {"train_loss": -6.659857749938965, "global_step": 122623, "epoch": 2919} {"train_loss": -6.577700614929199, "global_step": 122624, "epoch": 2919} {"train_loss": -6.618868827819824, "global_step": 122625, "epoch": 2919} {"train_loss": -6.552491188049316, "global_step": 122626, "epoch": 2919} {"train_loss": -6.463822364807129, "global_step": 122627, "epoch": 2919} {"train_loss": -6.5446953773498535, "global_step": 122628, "epoch": 2919} {"train_loss": -6.666980743408203, "global_step": 122629, "epoch": 2919} {"train_loss": -6.571520805358887, "global_step": 122630, "epoch": 2919} {"train_loss": -6.485348701477051, "global_step": 122631, "epoch": 2919} {"train_loss": -6.552381992340088, "global_step": 122632, "epoch": 2919} {"train_loss": -6.547555923461914, "global_step": 122633, "epoch": 2919} {"train_loss": -6.557331085205078, "global_step": 122634, "epoch": 2919} {"train_loss": -6.51113224029541, "global_step": 122635, "epoch": 2919} {"train_loss": -6.564669132232666, "global_step": 122636, "epoch": 2919} {"train_loss": -6.598639488220215, "global_step": 122637, "epoch": 2919} {"train_loss": -6.6769304275512695, "global_step": 122638, "epoch": 2919} {"train_loss": -6.56580156371707, "global_step": 122639, "epoch": 2919, "val_loss": 76946.7734375} {"train_loss": -6.560678005218506, "global_step": 122640, "epoch": 2920} {"train_loss": -6.643338203430176, "global_step": 122641, "epoch": 2920} {"train_loss": -6.664059638977051, "global_step": 122642, "epoch": 2920} {"train_loss": -6.585952281951904, "global_step": 122643, "epoch": 2920} {"train_loss": -6.627447128295898, "global_step": 122644, "epoch": 2920} {"train_loss": -6.7113800048828125, "global_step": 122645, "epoch": 2920} {"train_loss": -6.793933391571045, "global_step": 122646, "epoch": 2920} {"train_loss": -6.725330829620361, "global_step": 122647, "epoch": 2920} {"train_loss": -6.637398719787598, "global_step": 122648, "epoch": 2920} {"train_loss": -6.595464706420898, "global_step": 122649, "epoch": 2920} {"train_loss": -6.6307244300842285, "global_step": 122650, "epoch": 2920} {"train_loss": -6.537668228149414, "global_step": 122651, "epoch": 2920} {"train_loss": -6.682854652404785, "global_step": 122652, "epoch": 2920} {"train_loss": -6.668277740478516, "global_step": 122653, "epoch": 2920} {"train_loss": -6.538919925689697, "global_step": 122654, "epoch": 2920} {"train_loss": -6.5486907958984375, "global_step": 122655, "epoch": 2920} {"train_loss": -6.601439476013184, "global_step": 122656, "epoch": 2920} {"train_loss": -6.674079895019531, "global_step": 122657, "epoch": 2920} {"train_loss": -6.62493896484375, "global_step": 122658, "epoch": 2920} {"train_loss": -6.624375343322754, "global_step": 122659, "epoch": 2920} {"train_loss": -6.549351692199707, "global_step": 122660, "epoch": 2920} {"train_loss": -6.640815734863281, "global_step": 122661, "epoch": 2920} {"train_loss": -6.595841407775879, "global_step": 122662, "epoch": 2920} {"train_loss": -6.544751167297363, "global_step": 122663, "epoch": 2920} {"train_loss": -6.566162109375, "global_step": 122664, "epoch": 2920} {"train_loss": -6.50083065032959, "global_step": 122665, "epoch": 2920} {"train_loss": -6.654117107391357, "global_step": 122666, "epoch": 2920} {"train_loss": -6.744624614715576, "global_step": 122667, "epoch": 2920} {"train_loss": -6.489961624145508, "global_step": 122668, "epoch": 2920} {"train_loss": -6.542483329772949, "global_step": 122669, "epoch": 2920} {"train_loss": -6.534644603729248, "global_step": 122670, "epoch": 2920} {"train_loss": -6.670650482177734, "global_step": 122671, "epoch": 2920} {"train_loss": -6.540273666381836, "global_step": 122672, "epoch": 2920} {"train_loss": -6.571568012237549, "global_step": 122673, "epoch": 2920} {"train_loss": -6.574640274047852, "global_step": 122674, "epoch": 2920} {"train_loss": -6.575860977172852, "global_step": 122675, "epoch": 2920} {"train_loss": -6.595196723937988, "global_step": 122676, "epoch": 2920} {"train_loss": -6.528662204742432, "global_step": 122677, "epoch": 2920} {"train_loss": -6.632473945617676, "global_step": 122678, "epoch": 2920} {"train_loss": -6.630648612976074, "global_step": 122679, "epoch": 2920} {"train_loss": -6.754800796508789, "global_step": 122680, "epoch": 2920} {"train_loss": -6.611314126423427, "global_step": 122681, "epoch": 2920, "val_loss": 76962.8671875} {"train_loss": -6.624926567077637, "global_step": 122682, "epoch": 2921} {"train_loss": -6.621827125549316, "global_step": 122683, "epoch": 2921} {"train_loss": -6.571857452392578, "global_step": 122684, "epoch": 2921} {"train_loss": -6.691291332244873, "global_step": 122685, "epoch": 2921} {"train_loss": -6.638533592224121, "global_step": 122686, "epoch": 2921} {"train_loss": -6.658809661865234, "global_step": 122687, "epoch": 2921} {"train_loss": -6.678602695465088, "global_step": 122688, "epoch": 2921} {"train_loss": -6.753944396972656, "global_step": 122689, "epoch": 2921} {"train_loss": -6.646310329437256, "global_step": 122690, "epoch": 2921} {"train_loss": -6.642350673675537, "global_step": 122691, "epoch": 2921} {"train_loss": -6.672276496887207, "global_step": 122692, "epoch": 2921} {"train_loss": -6.648475646972656, "global_step": 122693, "epoch": 2921} {"train_loss": -6.644448280334473, "global_step": 122694, "epoch": 2921} {"train_loss": -6.575850486755371, "global_step": 122695, "epoch": 2921} {"train_loss": -6.670247554779053, "global_step": 122696, "epoch": 2921} {"train_loss": -6.739229679107666, "global_step": 122697, "epoch": 2921} {"train_loss": -6.587510108947754, "global_step": 122698, "epoch": 2921} {"train_loss": -6.661890029907227, "global_step": 122699, "epoch": 2921} {"train_loss": -6.5651350021362305, "global_step": 122700, "epoch": 2921} {"train_loss": -6.684310436248779, "global_step": 122701, "epoch": 2921} {"train_loss": -6.586627960205078, "global_step": 122702, "epoch": 2921} {"train_loss": -6.561673164367676, "global_step": 122703, "epoch": 2921} {"train_loss": -6.677450656890869, "global_step": 122704, "epoch": 2921} {"train_loss": -6.7013397216796875, "global_step": 122705, "epoch": 2921} {"train_loss": -6.483370304107666, "global_step": 122706, "epoch": 2921} {"train_loss": -6.668755531311035, "global_step": 122707, "epoch": 2921} {"train_loss": -6.490751266479492, "global_step": 122708, "epoch": 2921} {"train_loss": -6.415051460266113, "global_step": 122709, "epoch": 2921} {"train_loss": -6.517559051513672, "global_step": 122710, "epoch": 2921} {"train_loss": -6.530185699462891, "global_step": 122711, "epoch": 2921} {"train_loss": -6.480714797973633, "global_step": 122712, "epoch": 2921} {"train_loss": -6.563041687011719, "global_step": 122713, "epoch": 2921} {"train_loss": -6.481020450592041, "global_step": 122714, "epoch": 2921} {"train_loss": -6.569864749908447, "global_step": 122715, "epoch": 2921} {"train_loss": -6.580173492431641, "global_step": 122716, "epoch": 2921} {"train_loss": -6.517685413360596, "global_step": 122717, "epoch": 2921} {"train_loss": -6.5639448165893555, "global_step": 122718, "epoch": 2921} {"train_loss": -6.594090461730957, "global_step": 122719, "epoch": 2921} {"train_loss": -6.5805745124816895, "global_step": 122720, "epoch": 2921} {"train_loss": -6.514669418334961, "global_step": 122721, "epoch": 2921} {"train_loss": -6.557393550872803, "global_step": 122722, "epoch": 2921} {"train_loss": -6.599851369857788, "global_step": 122723, "epoch": 2921, "val_loss": 77239.328125} {"train_loss": -6.647331714630127, "global_step": 122724, "epoch": 2922} {"train_loss": -6.562868595123291, "global_step": 122725, "epoch": 2922} {"train_loss": -6.56824254989624, "global_step": 122726, "epoch": 2922} {"train_loss": -6.589159965515137, "global_step": 122727, "epoch": 2922} {"train_loss": -6.635707378387451, "global_step": 122728, "epoch": 2922} {"train_loss": -6.671561241149902, "global_step": 122729, "epoch": 2922} {"train_loss": -6.719221115112305, "global_step": 122730, "epoch": 2922} {"train_loss": -6.608441352844238, "global_step": 122731, "epoch": 2922} {"train_loss": -6.550045967102051, "global_step": 122732, "epoch": 2922} {"train_loss": -6.615969657897949, "global_step": 122733, "epoch": 2922} {"train_loss": -6.605231285095215, "global_step": 122734, "epoch": 2922} {"train_loss": -6.636624336242676, "global_step": 122735, "epoch": 2922} {"train_loss": -6.602878570556641, "global_step": 122736, "epoch": 2922} {"train_loss": -6.5925703048706055, "global_step": 122737, "epoch": 2922} {"train_loss": -6.648898124694824, "global_step": 122738, "epoch": 2922} {"train_loss": -6.558788299560547, "global_step": 122739, "epoch": 2922} {"train_loss": -6.604930877685547, "global_step": 122740, "epoch": 2922} {"train_loss": -6.60536003112793, "global_step": 122741, "epoch": 2922} {"train_loss": -6.60947322845459, "global_step": 122742, "epoch": 2922} {"train_loss": -6.612116813659668, "global_step": 122743, "epoch": 2922} {"train_loss": -6.596922397613525, "global_step": 122744, "epoch": 2922} {"train_loss": -6.454843521118164, "global_step": 122745, "epoch": 2922} {"train_loss": -6.543689727783203, "global_step": 122746, "epoch": 2922} {"train_loss": -6.524130821228027, "global_step": 122747, "epoch": 2922} {"train_loss": -6.509011745452881, "global_step": 122748, "epoch": 2922} {"train_loss": -6.574122905731201, "global_step": 122749, "epoch": 2922} {"train_loss": -6.541570663452148, "global_step": 122750, "epoch": 2922} {"train_loss": -6.5557379722595215, "global_step": 122751, "epoch": 2922} {"train_loss": -6.611071586608887, "global_step": 122752, "epoch": 2922} {"train_loss": -6.548933029174805, "global_step": 122753, "epoch": 2922} {"train_loss": -6.538300514221191, "global_step": 122754, "epoch": 2922} {"train_loss": -6.587684631347656, "global_step": 122755, "epoch": 2922} {"train_loss": -6.461666107177734, "global_step": 122756, "epoch": 2922} {"train_loss": -6.580866813659668, "global_step": 122757, "epoch": 2922} {"train_loss": -6.379571914672852, "global_step": 122758, "epoch": 2922} {"train_loss": -6.508726119995117, "global_step": 122759, "epoch": 2922} {"train_loss": -6.639337062835693, "global_step": 122760, "epoch": 2922} {"train_loss": -6.489100456237793, "global_step": 122761, "epoch": 2922} {"train_loss": -6.534808158874512, "global_step": 122762, "epoch": 2922} {"train_loss": -6.526349067687988, "global_step": 122763, "epoch": 2922} {"train_loss": -6.611690521240234, "global_step": 122764, "epoch": 2922} {"train_loss": -6.5740403901963, "global_step": 122765, "epoch": 2922, "val_loss": 77215.1015625} {"train_loss": -6.538633346557617, "global_step": 122766, "epoch": 2923} {"train_loss": -6.609079360961914, "global_step": 122767, "epoch": 2923} {"train_loss": -6.589622497558594, "global_step": 122768, "epoch": 2923} {"train_loss": -6.539003372192383, "global_step": 122769, "epoch": 2923} {"train_loss": -6.660224914550781, "global_step": 122770, "epoch": 2923} {"train_loss": -6.58482551574707, "global_step": 122771, "epoch": 2923} {"train_loss": -6.5093302726745605, "global_step": 122772, "epoch": 2923} {"train_loss": -6.596626281738281, "global_step": 122773, "epoch": 2923} {"train_loss": -6.5662522315979, "global_step": 122774, "epoch": 2923} {"train_loss": -6.538825035095215, "global_step": 122775, "epoch": 2923} {"train_loss": -6.523288726806641, "global_step": 122776, "epoch": 2923} {"train_loss": -6.560528755187988, "global_step": 122777, "epoch": 2923} {"train_loss": -6.622137546539307, "global_step": 122778, "epoch": 2923} {"train_loss": -6.548530578613281, "global_step": 122779, "epoch": 2923} {"train_loss": -6.581206321716309, "global_step": 122780, "epoch": 2923} {"train_loss": -6.616161346435547, "global_step": 122781, "epoch": 2923} {"train_loss": -6.557979106903076, "global_step": 122782, "epoch": 2923} {"train_loss": -6.566856384277344, "global_step": 122783, "epoch": 2923} {"train_loss": -6.3525590896606445, "global_step": 122784, "epoch": 2923} {"train_loss": -6.649918556213379, "global_step": 122785, "epoch": 2923} {"train_loss": -6.4976630210876465, "global_step": 122786, "epoch": 2923} {"train_loss": -6.582945823669434, "global_step": 122787, "epoch": 2923} {"train_loss": -6.605262756347656, "global_step": 122788, "epoch": 2923} {"train_loss": -6.5413007736206055, "global_step": 122789, "epoch": 2923} {"train_loss": -6.540163993835449, "global_step": 122790, "epoch": 2923} {"train_loss": -6.626399040222168, "global_step": 122791, "epoch": 2923} {"train_loss": -6.503068923950195, "global_step": 122792, "epoch": 2923} {"train_loss": -6.632189750671387, "global_step": 122793, "epoch": 2923} {"train_loss": -6.593481063842773, "global_step": 122794, "epoch": 2923} {"train_loss": -6.482267379760742, "global_step": 122795, "epoch": 2923} {"train_loss": -6.478520393371582, "global_step": 122796, "epoch": 2923} {"train_loss": -6.511846542358398, "global_step": 122797, "epoch": 2923} {"train_loss": -6.485374450683594, "global_step": 122798, "epoch": 2923} {"train_loss": -6.6218414306640625, "global_step": 122799, "epoch": 2923} {"train_loss": -6.465607643127441, "global_step": 122800, "epoch": 2923} {"train_loss": -6.5991291999816895, "global_step": 122801, "epoch": 2923} {"train_loss": -6.596357345581055, "global_step": 122802, "epoch": 2923} {"train_loss": -6.499032020568848, "global_step": 122803, "epoch": 2923} {"train_loss": -6.465534210205078, "global_step": 122804, "epoch": 2923} {"train_loss": -6.564872741699219, "global_step": 122805, "epoch": 2923} {"train_loss": -6.515355110168457, "global_step": 122806, "epoch": 2923} {"train_loss": -6.5538077013833185, "global_step": 122807, "epoch": 2923, "val_loss": 77513.2890625} {"train_loss": -6.487193584442139, "global_step": 122808, "epoch": 2924} {"train_loss": -6.520885467529297, "global_step": 122809, "epoch": 2924} {"train_loss": -6.549108982086182, "global_step": 122810, "epoch": 2924} {"train_loss": -6.61408805847168, "global_step": 122811, "epoch": 2924} {"train_loss": -6.487507343292236, "global_step": 122812, "epoch": 2924} {"train_loss": -6.549751281738281, "global_step": 122813, "epoch": 2924} {"train_loss": -6.567607879638672, "global_step": 122814, "epoch": 2924} {"train_loss": -6.669818878173828, "global_step": 122815, "epoch": 2924} {"train_loss": -6.6086554527282715, "global_step": 122816, "epoch": 2924} {"train_loss": -6.56719970703125, "global_step": 122817, "epoch": 2924} {"train_loss": -6.589365005493164, "global_step": 122818, "epoch": 2924} {"train_loss": -6.583747863769531, "global_step": 122819, "epoch": 2924} {"train_loss": -6.634550094604492, "global_step": 122820, "epoch": 2924} {"train_loss": -6.580709457397461, "global_step": 122821, "epoch": 2924} {"train_loss": -6.4225358963012695, "global_step": 122822, "epoch": 2924} {"train_loss": -6.485661029815674, "global_step": 122823, "epoch": 2924} {"train_loss": -6.553771495819092, "global_step": 122824, "epoch": 2924} {"train_loss": -6.647172927856445, "global_step": 122825, "epoch": 2924} {"train_loss": -6.5668463706970215, "global_step": 122826, "epoch": 2924} {"train_loss": -6.576920032501221, "global_step": 122827, "epoch": 2924} {"train_loss": -6.475532054901123, "global_step": 122828, "epoch": 2924} {"train_loss": -6.640646934509277, "global_step": 122829, "epoch": 2924} {"train_loss": -6.592554569244385, "global_step": 122830, "epoch": 2924} {"train_loss": -6.604775428771973, "global_step": 122831, "epoch": 2924} {"train_loss": -6.583115100860596, "global_step": 122832, "epoch": 2924} {"train_loss": -6.591327667236328, "global_step": 122833, "epoch": 2924} {"train_loss": -6.654687881469727, "global_step": 122834, "epoch": 2924} {"train_loss": -6.700257778167725, "global_step": 122835, "epoch": 2924} {"train_loss": -6.524733066558838, "global_step": 122836, "epoch": 2924} {"train_loss": -6.59261417388916, "global_step": 122837, "epoch": 2924} {"train_loss": -6.677264213562012, "global_step": 122838, "epoch": 2924} {"train_loss": -6.668041229248047, "global_step": 122839, "epoch": 2924} {"train_loss": -6.54011344909668, "global_step": 122840, "epoch": 2924} {"train_loss": -6.611525535583496, "global_step": 122841, "epoch": 2924} {"train_loss": -6.617035865783691, "global_step": 122842, "epoch": 2924} {"train_loss": -6.545718193054199, "global_step": 122843, "epoch": 2924} {"train_loss": -6.579261779785156, "global_step": 122844, "epoch": 2924} {"train_loss": -6.610854625701904, "global_step": 122845, "epoch": 2924} {"train_loss": -6.545585632324219, "global_step": 122846, "epoch": 2924} {"train_loss": -6.642444610595703, "global_step": 122847, "epoch": 2924} {"train_loss": -6.634463310241699, "global_step": 122848, "epoch": 2924} {"train_loss": -6.5833091622307185, "global_step": 122849, "epoch": 2924, "val_loss": 77163.2734375} {"train_loss": -6.586667060852051, "global_step": 122850, "epoch": 2925} {"train_loss": -6.629469871520996, "global_step": 122851, "epoch": 2925} {"train_loss": -6.605976581573486, "global_step": 122852, "epoch": 2925} {"train_loss": -6.581789016723633, "global_step": 122853, "epoch": 2925} {"train_loss": -6.568815231323242, "global_step": 122854, "epoch": 2925} {"train_loss": -6.615720748901367, "global_step": 122855, "epoch": 2925} {"train_loss": -6.580650806427002, "global_step": 122856, "epoch": 2925} {"train_loss": -6.657044887542725, "global_step": 122857, "epoch": 2925} {"train_loss": -6.641223907470703, "global_step": 122858, "epoch": 2925} {"train_loss": -6.590919494628906, "global_step": 122859, "epoch": 2925} {"train_loss": -6.690140247344971, "global_step": 122860, "epoch": 2925} {"train_loss": -6.52010440826416, "global_step": 122861, "epoch": 2925} {"train_loss": -6.628330230712891, "global_step": 122862, "epoch": 2925} {"train_loss": -6.52854061126709, "global_step": 122863, "epoch": 2925} {"train_loss": -6.691442966461182, "global_step": 122864, "epoch": 2925} {"train_loss": -6.6435980796813965, "global_step": 122865, "epoch": 2925} {"train_loss": -6.5766496658325195, "global_step": 122866, "epoch": 2925} {"train_loss": -6.6385369300842285, "global_step": 122867, "epoch": 2925} {"train_loss": -6.520471572875977, "global_step": 122868, "epoch": 2925} {"train_loss": -6.537156105041504, "global_step": 122869, "epoch": 2925} {"train_loss": -6.560094833374023, "global_step": 122870, "epoch": 2925} {"train_loss": -6.605192184448242, "global_step": 122871, "epoch": 2925} {"train_loss": -6.382979869842529, "global_step": 122872, "epoch": 2925} {"train_loss": -6.4437432289123535, "global_step": 122873, "epoch": 2925} {"train_loss": -6.601933479309082, "global_step": 122874, "epoch": 2925} {"train_loss": -6.463507652282715, "global_step": 122875, "epoch": 2925} {"train_loss": -6.571375846862793, "global_step": 122876, "epoch": 2925} {"train_loss": -6.507989883422852, "global_step": 122877, "epoch": 2925} {"train_loss": -6.612231731414795, "global_step": 122878, "epoch": 2925} {"train_loss": -6.4352006912231445, "global_step": 122879, "epoch": 2925} {"train_loss": -6.565285682678223, "global_step": 122880, "epoch": 2925} {"train_loss": -6.574739933013916, "global_step": 122881, "epoch": 2925} {"train_loss": -6.653095245361328, "global_step": 122882, "epoch": 2925} {"train_loss": -6.575442790985107, "global_step": 122883, "epoch": 2925} {"train_loss": -6.472995758056641, "global_step": 122884, "epoch": 2925} {"train_loss": -6.512354850769043, "global_step": 122885, "epoch": 2925} {"train_loss": -6.520213603973389, "global_step": 122886, "epoch": 2925} {"train_loss": -6.6054368019104, "global_step": 122887, "epoch": 2925} {"train_loss": -6.511672019958496, "global_step": 122888, "epoch": 2925} {"train_loss": -6.652174949645996, "global_step": 122889, "epoch": 2925} {"train_loss": -6.595510005950928, "global_step": 122890, "epoch": 2925} {"train_loss": -6.570885510671706, "global_step": 122891, "epoch": 2925, "val_loss": 76843.921875} {"train_loss": -6.609092712402344, "global_step": 122892, "epoch": 2926} {"train_loss": -6.581396102905273, "global_step": 122893, "epoch": 2926} {"train_loss": -6.474032402038574, "global_step": 122894, "epoch": 2926} {"train_loss": -6.548955917358398, "global_step": 122895, "epoch": 2926} {"train_loss": -6.430206775665283, "global_step": 122896, "epoch": 2926} {"train_loss": -6.603193283081055, "global_step": 122897, "epoch": 2926} {"train_loss": -6.501617908477783, "global_step": 122898, "epoch": 2926} {"train_loss": -6.5857954025268555, "global_step": 122899, "epoch": 2926} {"train_loss": -6.519425392150879, "global_step": 122900, "epoch": 2926} {"train_loss": -6.618810653686523, "global_step": 122901, "epoch": 2926} {"train_loss": -6.625033378601074, "global_step": 122902, "epoch": 2926} {"train_loss": -6.540423393249512, "global_step": 122903, "epoch": 2926} {"train_loss": -6.6135663986206055, "global_step": 122904, "epoch": 2926} {"train_loss": -6.667745113372803, "global_step": 122905, "epoch": 2926} {"train_loss": -6.558569431304932, "global_step": 122906, "epoch": 2926} {"train_loss": -6.628186225891113, "global_step": 122907, "epoch": 2926} {"train_loss": -6.541119575500488, "global_step": 122908, "epoch": 2926} {"train_loss": -6.636528015136719, "global_step": 122909, "epoch": 2926} {"train_loss": -6.5321173667907715, "global_step": 122910, "epoch": 2926} {"train_loss": -6.57722282409668, "global_step": 122911, "epoch": 2926} {"train_loss": -6.569955348968506, "global_step": 122912, "epoch": 2926} {"train_loss": -6.521005630493164, "global_step": 122913, "epoch": 2926} {"train_loss": -6.601834297180176, "global_step": 122914, "epoch": 2926} {"train_loss": -6.692145347595215, "global_step": 122915, "epoch": 2926} {"train_loss": -6.509322166442871, "global_step": 122916, "epoch": 2926} {"train_loss": -6.623661994934082, "global_step": 122917, "epoch": 2926} {"train_loss": -6.4578399658203125, "global_step": 122918, "epoch": 2926} {"train_loss": -6.593329429626465, "global_step": 122919, "epoch": 2926} {"train_loss": -6.673122406005859, "global_step": 122920, "epoch": 2926} {"train_loss": -6.528745651245117, "global_step": 122921, "epoch": 2926} {"train_loss": -6.602093696594238, "global_step": 122922, "epoch": 2926} {"train_loss": -6.588761329650879, "global_step": 122923, "epoch": 2926} {"train_loss": -6.620757579803467, "global_step": 122924, "epoch": 2926} {"train_loss": -6.557476043701172, "global_step": 122925, "epoch": 2926} {"train_loss": -6.484233379364014, "global_step": 122926, "epoch": 2926} {"train_loss": -6.710817337036133, "global_step": 122927, "epoch": 2926} {"train_loss": -6.649402141571045, "global_step": 122928, "epoch": 2926} {"train_loss": -6.569822311401367, "global_step": 122929, "epoch": 2926} {"train_loss": -6.579127311706543, "global_step": 122930, "epoch": 2926} {"train_loss": -6.631505012512207, "global_step": 122931, "epoch": 2926} {"train_loss": -6.597567558288574, "global_step": 122932, "epoch": 2926} {"train_loss": -6.5809163593110585, "global_step": 122933, "epoch": 2926, "val_loss": 77067.296875} {"train_loss": -6.584650039672852, "global_step": 122934, "epoch": 2927} {"train_loss": -6.667817115783691, "global_step": 122935, "epoch": 2927} {"train_loss": -6.6063690185546875, "global_step": 122936, "epoch": 2927} {"train_loss": -6.671200275421143, "global_step": 122937, "epoch": 2927} {"train_loss": -6.683469772338867, "global_step": 122938, "epoch": 2927} {"train_loss": -6.604344844818115, "global_step": 122939, "epoch": 2927} {"train_loss": -6.559167385101318, "global_step": 122940, "epoch": 2927} {"train_loss": -6.494903564453125, "global_step": 122941, "epoch": 2927} {"train_loss": -6.764690399169922, "global_step": 122942, "epoch": 2927} {"train_loss": -6.605247497558594, "global_step": 122943, "epoch": 2927} {"train_loss": -6.647978782653809, "global_step": 122944, "epoch": 2927} {"train_loss": -6.602372169494629, "global_step": 122945, "epoch": 2927} {"train_loss": -6.618314743041992, "global_step": 122946, "epoch": 2927} {"train_loss": -6.658730983734131, "global_step": 122947, "epoch": 2927} {"train_loss": -6.612957000732422, "global_step": 122948, "epoch": 2927} {"train_loss": -6.726633071899414, "global_step": 122949, "epoch": 2927} {"train_loss": -6.562936782836914, "global_step": 122950, "epoch": 2927} {"train_loss": -6.4880781173706055, "global_step": 122951, "epoch": 2927} {"train_loss": -6.677921295166016, "global_step": 122952, "epoch": 2927} {"train_loss": -6.639416694641113, "global_step": 122953, "epoch": 2927} {"train_loss": -6.559943675994873, "global_step": 122954, "epoch": 2927} {"train_loss": -6.615570068359375, "global_step": 122955, "epoch": 2927} {"train_loss": -6.6693878173828125, "global_step": 122956, "epoch": 2927} {"train_loss": -6.557703018188477, "global_step": 122957, "epoch": 2927} {"train_loss": -6.462861061096191, "global_step": 122958, "epoch": 2927} {"train_loss": -6.658794403076172, "global_step": 122959, "epoch": 2927} {"train_loss": -6.688182353973389, "global_step": 122960, "epoch": 2927} {"train_loss": -6.568808555603027, "global_step": 122961, "epoch": 2927} {"train_loss": -6.636282444000244, "global_step": 122962, "epoch": 2927} {"train_loss": -6.669812202453613, "global_step": 122963, "epoch": 2927} {"train_loss": -6.559072494506836, "global_step": 122964, "epoch": 2927} {"train_loss": -6.621232032775879, "global_step": 122965, "epoch": 2927} {"train_loss": -6.681989669799805, "global_step": 122966, "epoch": 2927} {"train_loss": -6.520355224609375, "global_step": 122967, "epoch": 2927} {"train_loss": -6.597864627838135, "global_step": 122968, "epoch": 2927} {"train_loss": -6.649453163146973, "global_step": 122969, "epoch": 2927} {"train_loss": -6.727050304412842, "global_step": 122970, "epoch": 2927} {"train_loss": -6.578434467315674, "global_step": 122971, "epoch": 2927} {"train_loss": -6.565951824188232, "global_step": 122972, "epoch": 2927} {"train_loss": -6.617099761962891, "global_step": 122973, "epoch": 2927} {"train_loss": -6.595442771911621, "global_step": 122974, "epoch": 2927} {"train_loss": -6.617158356167021, "global_step": 122975, "epoch": 2927, "val_loss": 76939.1484375} {"train_loss": -6.598508358001709, "global_step": 122976, "epoch": 2928} {"train_loss": -6.6613311767578125, "global_step": 122977, "epoch": 2928} {"train_loss": -6.566440582275391, "global_step": 122978, "epoch": 2928} {"train_loss": -6.573348522186279, "global_step": 122979, "epoch": 2928} {"train_loss": -6.548192977905273, "global_step": 122980, "epoch": 2928} {"train_loss": -6.519550323486328, "global_step": 122981, "epoch": 2928} {"train_loss": -6.582273483276367, "global_step": 122982, "epoch": 2928} {"train_loss": -6.477214336395264, "global_step": 122983, "epoch": 2928} {"train_loss": -6.581680774688721, "global_step": 122984, "epoch": 2928} {"train_loss": -6.637928009033203, "global_step": 122985, "epoch": 2928} {"train_loss": -6.579668998718262, "global_step": 122986, "epoch": 2928} {"train_loss": -6.510407447814941, "global_step": 122987, "epoch": 2928} {"train_loss": -6.665622711181641, "global_step": 122988, "epoch": 2928} {"train_loss": -6.597953796386719, "global_step": 122989, "epoch": 2928} {"train_loss": -6.610347270965576, "global_step": 122990, "epoch": 2928} {"train_loss": -6.6234283447265625, "global_step": 122991, "epoch": 2928} {"train_loss": -6.643548011779785, "global_step": 122992, "epoch": 2928} {"train_loss": -6.660650730133057, "global_step": 122993, "epoch": 2928} {"train_loss": -6.654496192932129, "global_step": 122994, "epoch": 2928} {"train_loss": -6.62524938583374, "global_step": 122995, "epoch": 2928} {"train_loss": -6.608014106750488, "global_step": 122996, "epoch": 2928} {"train_loss": -6.560503959655762, "global_step": 122997, "epoch": 2928} {"train_loss": -6.599479675292969, "global_step": 122998, "epoch": 2928} {"train_loss": -6.752407073974609, "global_step": 122999, "epoch": 2928} {"train_loss": -6.610454082489014, "global_step": 123000, "epoch": 2928} {"train_loss": -6.74278450012207, "global_step": 123001, "epoch": 2928} {"train_loss": -6.711673736572266, "global_step": 123002, "epoch": 2928} {"train_loss": -6.620738506317139, "global_step": 123003, "epoch": 2928} {"train_loss": -6.706070423126221, "global_step": 123004, "epoch": 2928} {"train_loss": -6.638688087463379, "global_step": 123005, "epoch": 2928} {"train_loss": -6.690471649169922, "global_step": 123006, "epoch": 2928} {"train_loss": -6.71381139755249, "global_step": 123007, "epoch": 2928} {"train_loss": -6.68179988861084, "global_step": 123008, "epoch": 2928} {"train_loss": -6.6103997230529785, "global_step": 123009, "epoch": 2928} {"train_loss": -6.7143354415893555, "global_step": 123010, "epoch": 2928} {"train_loss": -6.6913347244262695, "global_step": 123011, "epoch": 2928} {"train_loss": -6.532811164855957, "global_step": 123012, "epoch": 2928} {"train_loss": -6.487099647521973, "global_step": 123013, "epoch": 2928} {"train_loss": -6.582961082458496, "global_step": 123014, "epoch": 2928} {"train_loss": -6.440877914428711, "global_step": 123015, "epoch": 2928} {"train_loss": -6.485386848449707, "global_step": 123016, "epoch": 2928} {"train_loss": -6.608282429831369, "global_step": 123017, "epoch": 2928, "val_loss": 77096.0} {"train_loss": -6.508882999420166, "global_step": 123018, "epoch": 2929} {"train_loss": -6.50909423828125, "global_step": 123019, "epoch": 2929} {"train_loss": -6.527676582336426, "global_step": 123020, "epoch": 2929} {"train_loss": -6.627168655395508, "global_step": 123021, "epoch": 2929} {"train_loss": -6.58853816986084, "global_step": 123022, "epoch": 2929} {"train_loss": -6.457633018493652, "global_step": 123023, "epoch": 2929} {"train_loss": -6.690128326416016, "global_step": 123024, "epoch": 2929} {"train_loss": -6.567203521728516, "global_step": 123025, "epoch": 2929} {"train_loss": -6.594603538513184, "global_step": 123026, "epoch": 2929} {"train_loss": -6.471502304077148, "global_step": 123027, "epoch": 2929} {"train_loss": -6.524635314941406, "global_step": 123028, "epoch": 2929} {"train_loss": -6.617981910705566, "global_step": 123029, "epoch": 2929} {"train_loss": -6.461287021636963, "global_step": 123030, "epoch": 2929} {"train_loss": -6.6458234786987305, "global_step": 123031, "epoch": 2929} {"train_loss": -6.754605770111084, "global_step": 123032, "epoch": 2929} {"train_loss": -6.689420700073242, "global_step": 123033, "epoch": 2929} {"train_loss": -6.638011932373047, "global_step": 123034, "epoch": 2929} {"train_loss": -6.532353401184082, "global_step": 123035, "epoch": 2929} {"train_loss": -6.4231767654418945, "global_step": 123036, "epoch": 2929} {"train_loss": -6.548932075500488, "global_step": 123037, "epoch": 2929} {"train_loss": -6.641565322875977, "global_step": 123038, "epoch": 2929} {"train_loss": -6.577035903930664, "global_step": 123039, "epoch": 2929} {"train_loss": -6.647420883178711, "global_step": 123040, "epoch": 2929} {"train_loss": -6.728259563446045, "global_step": 123041, "epoch": 2929} {"train_loss": -6.6727495193481445, "global_step": 123042, "epoch": 2929} {"train_loss": -6.497625350952148, "global_step": 123043, "epoch": 2929} {"train_loss": -6.633938789367676, "global_step": 123044, "epoch": 2929} {"train_loss": -6.74891996383667, "global_step": 123045, "epoch": 2929} {"train_loss": -6.569486618041992, "global_step": 123046, "epoch": 2929} {"train_loss": -6.798022270202637, "global_step": 123047, "epoch": 2929} {"train_loss": -6.605172634124756, "global_step": 123048, "epoch": 2929} {"train_loss": -6.57984733581543, "global_step": 123049, "epoch": 2929} {"train_loss": -6.613472938537598, "global_step": 123050, "epoch": 2929} {"train_loss": -6.625237464904785, "global_step": 123051, "epoch": 2929} {"train_loss": -6.64450216293335, "global_step": 123052, "epoch": 2929} {"train_loss": -6.597626686096191, "global_step": 123053, "epoch": 2929} {"train_loss": -6.637431621551514, "global_step": 123054, "epoch": 2929} {"train_loss": -6.583500385284424, "global_step": 123055, "epoch": 2929} {"train_loss": -6.6043806076049805, "global_step": 123056, "epoch": 2929} {"train_loss": -6.570796012878418, "global_step": 123057, "epoch": 2929} {"train_loss": -6.609087944030762, "global_step": 123058, "epoch": 2929} {"train_loss": -6.5977005163828535, "global_step": 123059, "epoch": 2929, "val_loss": 77204.3515625} {"train_loss": -6.608539581298828, "global_step": 123060, "epoch": 2930} {"train_loss": -6.586151123046875, "global_step": 123061, "epoch": 2930} {"train_loss": -6.601552486419678, "global_step": 123062, "epoch": 2930} {"train_loss": -6.670605182647705, "global_step": 123063, "epoch": 2930} {"train_loss": -6.654447555541992, "global_step": 123064, "epoch": 2930} {"train_loss": -6.579424858093262, "global_step": 123065, "epoch": 2930} {"train_loss": -6.547963619232178, "global_step": 123066, "epoch": 2930} {"train_loss": -6.578916549682617, "global_step": 123067, "epoch": 2930} {"train_loss": -6.499168395996094, "global_step": 123068, "epoch": 2930} {"train_loss": -6.577578067779541, "global_step": 123069, "epoch": 2930} {"train_loss": -6.572938919067383, "global_step": 123070, "epoch": 2930} {"train_loss": -6.68349552154541, "global_step": 123071, "epoch": 2930} {"train_loss": -6.591207981109619, "global_step": 123072, "epoch": 2930} {"train_loss": -6.515634059906006, "global_step": 123073, "epoch": 2930} {"train_loss": -6.63032865524292, "global_step": 123074, "epoch": 2930} {"train_loss": -6.630108833312988, "global_step": 123075, "epoch": 2930} {"train_loss": -6.540506362915039, "global_step": 123076, "epoch": 2930} {"train_loss": -6.584027290344238, "global_step": 123077, "epoch": 2930} {"train_loss": -6.64529275894165, "global_step": 123078, "epoch": 2930} {"train_loss": -6.704071521759033, "global_step": 123079, "epoch": 2930} {"train_loss": -6.583510398864746, "global_step": 123080, "epoch": 2930} {"train_loss": -6.697218418121338, "global_step": 123081, "epoch": 2930} {"train_loss": -6.714105129241943, "global_step": 123082, "epoch": 2930} {"train_loss": -6.498932361602783, "global_step": 123083, "epoch": 2930} {"train_loss": -6.687049865722656, "global_step": 123084, "epoch": 2930} {"train_loss": -6.539732933044434, "global_step": 123085, "epoch": 2930} {"train_loss": -6.609047889709473, "global_step": 123086, "epoch": 2930} {"train_loss": -6.696630477905273, "global_step": 123087, "epoch": 2930} {"train_loss": -6.548395156860352, "global_step": 123088, "epoch": 2930} {"train_loss": -6.635075569152832, "global_step": 123089, "epoch": 2930} {"train_loss": -6.646785736083984, "global_step": 123090, "epoch": 2930} {"train_loss": -6.533389091491699, "global_step": 123091, "epoch": 2930} {"train_loss": -6.693356513977051, "global_step": 123092, "epoch": 2930} {"train_loss": -6.620385646820068, "global_step": 123093, "epoch": 2930} {"train_loss": -6.662128448486328, "global_step": 123094, "epoch": 2930} {"train_loss": -6.52793025970459, "global_step": 123095, "epoch": 2930} {"train_loss": -6.611289978027344, "global_step": 123096, "epoch": 2930} {"train_loss": -6.609732151031494, "global_step": 123097, "epoch": 2930} {"train_loss": -6.665094375610352, "global_step": 123098, "epoch": 2930} {"train_loss": -6.6790852546691895, "global_step": 123099, "epoch": 2930} {"train_loss": -6.611517906188965, "global_step": 123100, "epoch": 2930} {"train_loss": -6.60960190636771, "global_step": 123101, "epoch": 2930, "val_loss": 77004.359375} {"train_loss": -6.700408935546875, "global_step": 123102, "epoch": 2931} {"train_loss": -6.689454078674316, "global_step": 123103, "epoch": 2931} {"train_loss": -6.51204776763916, "global_step": 123104, "epoch": 2931} {"train_loss": -6.67546272277832, "global_step": 123105, "epoch": 2931} {"train_loss": -6.6655402183532715, "global_step": 123106, "epoch": 2931} {"train_loss": -6.629128456115723, "global_step": 123107, "epoch": 2931} {"train_loss": -6.62960958480835, "global_step": 123108, "epoch": 2931} {"train_loss": -6.640536785125732, "global_step": 123109, "epoch": 2931} {"train_loss": -6.542689323425293, "global_step": 123110, "epoch": 2931} {"train_loss": -6.640684127807617, "global_step": 123111, "epoch": 2931} {"train_loss": -6.669692039489746, "global_step": 123112, "epoch": 2931} {"train_loss": -6.6320695877075195, "global_step": 123113, "epoch": 2931} {"train_loss": -6.745776176452637, "global_step": 123114, "epoch": 2931} {"train_loss": -6.632804870605469, "global_step": 123115, "epoch": 2931} {"train_loss": -6.571450233459473, "global_step": 123116, "epoch": 2931} {"train_loss": -6.589942932128906, "global_step": 123117, "epoch": 2931} {"train_loss": -6.608758926391602, "global_step": 123118, "epoch": 2931} {"train_loss": -6.518587589263916, "global_step": 123119, "epoch": 2931} {"train_loss": -6.6625261306762695, "global_step": 123120, "epoch": 2931} {"train_loss": -6.625924110412598, "global_step": 123121, "epoch": 2931} {"train_loss": -6.585602283477783, "global_step": 123122, "epoch": 2931} {"train_loss": -6.562502861022949, "global_step": 123123, "epoch": 2931} {"train_loss": -6.711699485778809, "global_step": 123124, "epoch": 2931} {"train_loss": -6.640150547027588, "global_step": 123125, "epoch": 2931} {"train_loss": -6.574512958526611, "global_step": 123126, "epoch": 2931} {"train_loss": -6.552780628204346, "global_step": 123127, "epoch": 2931} {"train_loss": -6.607359409332275, "global_step": 123128, "epoch": 2931} {"train_loss": -6.510414123535156, "global_step": 123129, "epoch": 2931} {"train_loss": -6.669872760772705, "global_step": 123130, "epoch": 2931} {"train_loss": -6.653230667114258, "global_step": 123131, "epoch": 2931} {"train_loss": -6.457996845245361, "global_step": 123132, "epoch": 2931} {"train_loss": -6.594673156738281, "global_step": 123133, "epoch": 2931} {"train_loss": -6.667267799377441, "global_step": 123134, "epoch": 2931} {"train_loss": -6.576721668243408, "global_step": 123135, "epoch": 2931} {"train_loss": -6.53322696685791, "global_step": 123136, "epoch": 2931} {"train_loss": -6.5200347900390625, "global_step": 123137, "epoch": 2931} {"train_loss": -6.578382968902588, "global_step": 123138, "epoch": 2931} {"train_loss": -6.508720874786377, "global_step": 123139, "epoch": 2931} {"train_loss": -6.629349708557129, "global_step": 123140, "epoch": 2931} {"train_loss": -6.582103252410889, "global_step": 123141, "epoch": 2931} {"train_loss": -6.645717620849609, "global_step": 123142, "epoch": 2931} {"train_loss": -6.609422592889695, "global_step": 123143, "epoch": 2931, "val_loss": 77215.1171875} {"train_loss": -6.495828628540039, "global_step": 123144, "epoch": 2932} {"train_loss": -6.538453102111816, "global_step": 123145, "epoch": 2932} {"train_loss": -6.572629451751709, "global_step": 123146, "epoch": 2932} {"train_loss": -6.619077682495117, "global_step": 123147, "epoch": 2932} {"train_loss": -6.602559566497803, "global_step": 123148, "epoch": 2932} {"train_loss": -6.7061614990234375, "global_step": 123149, "epoch": 2932} {"train_loss": -6.673999786376953, "global_step": 123150, "epoch": 2932} {"train_loss": -6.570139408111572, "global_step": 123151, "epoch": 2932} {"train_loss": -6.560839653015137, "global_step": 123152, "epoch": 2932} {"train_loss": -6.476695537567139, "global_step": 123153, "epoch": 2932} {"train_loss": -6.6051411628723145, "global_step": 123154, "epoch": 2932} {"train_loss": -6.498064041137695, "global_step": 123155, "epoch": 2932} {"train_loss": -6.617226600646973, "global_step": 123156, "epoch": 2932} {"train_loss": -6.62903356552124, "global_step": 123157, "epoch": 2932} {"train_loss": -6.553750038146973, "global_step": 123158, "epoch": 2932} {"train_loss": -6.5459513664245605, "global_step": 123159, "epoch": 2932} {"train_loss": -6.520267486572266, "global_step": 123160, "epoch": 2932} {"train_loss": -6.633027076721191, "global_step": 123161, "epoch": 2932} {"train_loss": -6.5504655838012695, "global_step": 123162, "epoch": 2932} {"train_loss": -6.649251937866211, "global_step": 123163, "epoch": 2932} {"train_loss": -6.578404903411865, "global_step": 123164, "epoch": 2932} {"train_loss": -6.479336738586426, "global_step": 123165, "epoch": 2932} {"train_loss": -6.63939094543457, "global_step": 123166, "epoch": 2932} {"train_loss": -6.366792678833008, "global_step": 123167, "epoch": 2932} {"train_loss": -6.5413665771484375, "global_step": 123168, "epoch": 2932} {"train_loss": -6.596624374389648, "global_step": 123169, "epoch": 2932} {"train_loss": -6.467907905578613, "global_step": 123170, "epoch": 2932} {"train_loss": -6.637129783630371, "global_step": 123171, "epoch": 2932} {"train_loss": -6.5795159339904785, "global_step": 123172, "epoch": 2932} {"train_loss": -6.540839195251465, "global_step": 123173, "epoch": 2932} {"train_loss": -6.443889141082764, "global_step": 123174, "epoch": 2932} {"train_loss": -6.601449012756348, "global_step": 123175, "epoch": 2932} {"train_loss": -6.569798469543457, "global_step": 123176, "epoch": 2932} {"train_loss": -6.518435478210449, "global_step": 123177, "epoch": 2932} {"train_loss": -6.481235980987549, "global_step": 123178, "epoch": 2932} {"train_loss": -6.55247163772583, "global_step": 123179, "epoch": 2932} {"train_loss": -6.675420761108398, "global_step": 123180, "epoch": 2932} {"train_loss": -6.602205276489258, "global_step": 123181, "epoch": 2932} {"train_loss": -6.633884429931641, "global_step": 123182, "epoch": 2932} {"train_loss": -6.598363876342773, "global_step": 123183, "epoch": 2932} {"train_loss": -6.481180191040039, "global_step": 123184, "epoch": 2932} {"train_loss": -6.568117198489961, "global_step": 123185, "epoch": 2932, "val_loss": 77275.109375} {"train_loss": -6.5527472496032715, "global_step": 123186, "epoch": 2933} {"train_loss": -6.650566577911377, "global_step": 123187, "epoch": 2933} {"train_loss": -6.570718765258789, "global_step": 123188, "epoch": 2933} {"train_loss": -6.4075727462768555, "global_step": 123189, "epoch": 2933} {"train_loss": -6.519150257110596, "global_step": 123190, "epoch": 2933} {"train_loss": -6.52175235748291, "global_step": 123191, "epoch": 2933} {"train_loss": -6.485462665557861, "global_step": 123192, "epoch": 2933} {"train_loss": -6.611431121826172, "global_step": 123193, "epoch": 2933} {"train_loss": -6.514174461364746, "global_step": 123194, "epoch": 2933} {"train_loss": -6.522085189819336, "global_step": 123195, "epoch": 2933} {"train_loss": -6.537278652191162, "global_step": 123196, "epoch": 2933} {"train_loss": -6.636987209320068, "global_step": 123197, "epoch": 2933} {"train_loss": -6.677070617675781, "global_step": 123198, "epoch": 2933} {"train_loss": -6.447826385498047, "global_step": 123199, "epoch": 2933} {"train_loss": -6.577183723449707, "global_step": 123200, "epoch": 2933} {"train_loss": -6.579748153686523, "global_step": 123201, "epoch": 2933} {"train_loss": -6.589289665222168, "global_step": 123202, "epoch": 2933} {"train_loss": -6.551645755767822, "global_step": 123203, "epoch": 2933} {"train_loss": -6.543649673461914, "global_step": 123204, "epoch": 2933} {"train_loss": -6.668689727783203, "global_step": 123205, "epoch": 2933} {"train_loss": -6.578396797180176, "global_step": 123206, "epoch": 2933} {"train_loss": -6.601426124572754, "global_step": 123207, "epoch": 2933} {"train_loss": -6.600310325622559, "global_step": 123208, "epoch": 2933} {"train_loss": -6.668127059936523, "global_step": 123209, "epoch": 2933} {"train_loss": -6.654096603393555, "global_step": 123210, "epoch": 2933} {"train_loss": -6.5242919921875, "global_step": 123211, "epoch": 2933} {"train_loss": -6.4663848876953125, "global_step": 123212, "epoch": 2933} {"train_loss": -6.6009111404418945, "global_step": 123213, "epoch": 2933} {"train_loss": -6.4622802734375, "global_step": 123214, "epoch": 2933} {"train_loss": -6.5675225257873535, "global_step": 123215, "epoch": 2933} {"train_loss": -6.6056060791015625, "global_step": 123216, "epoch": 2933} {"train_loss": -6.571599960327148, "global_step": 123217, "epoch": 2933} {"train_loss": -6.557132720947266, "global_step": 123218, "epoch": 2933} {"train_loss": -6.51194953918457, "global_step": 123219, "epoch": 2933} {"train_loss": -6.605218887329102, "global_step": 123220, "epoch": 2933} {"train_loss": -6.652142524719238, "global_step": 123221, "epoch": 2933} {"train_loss": -6.575459957122803, "global_step": 123222, "epoch": 2933} {"train_loss": -6.597271919250488, "global_step": 123223, "epoch": 2933} {"train_loss": -6.549384117126465, "global_step": 123224, "epoch": 2933} {"train_loss": -6.590227127075195, "global_step": 123225, "epoch": 2933} {"train_loss": -6.502303123474121, "global_step": 123226, "epoch": 2933} {"train_loss": -6.566469919113886, "global_step": 123227, "epoch": 2933, "val_loss": 77124.1640625} {"train_loss": -6.438084125518799, "global_step": 123228, "epoch": 2934} {"train_loss": -6.471077919006348, "global_step": 123229, "epoch": 2934} {"train_loss": -6.754936695098877, "global_step": 123230, "epoch": 2934} {"train_loss": -6.561581611633301, "global_step": 123231, "epoch": 2934} {"train_loss": -6.728544235229492, "global_step": 123232, "epoch": 2934} {"train_loss": -6.564939022064209, "global_step": 123233, "epoch": 2934} {"train_loss": -6.733325004577637, "global_step": 123234, "epoch": 2934} {"train_loss": -6.753054141998291, "global_step": 123235, "epoch": 2934} {"train_loss": -6.60205602645874, "global_step": 123236, "epoch": 2934} {"train_loss": -6.558352470397949, "global_step": 123237, "epoch": 2934} {"train_loss": -6.617963790893555, "global_step": 123238, "epoch": 2934} {"train_loss": -6.51762056350708, "global_step": 123239, "epoch": 2934} {"train_loss": -6.56030797958374, "global_step": 123240, "epoch": 2934} {"train_loss": -6.445590496063232, "global_step": 123241, "epoch": 2934} {"train_loss": -6.591991424560547, "global_step": 123242, "epoch": 2934} {"train_loss": -6.6258544921875, "global_step": 123243, "epoch": 2934} {"train_loss": -6.505046367645264, "global_step": 123244, "epoch": 2934} {"train_loss": -6.649452209472656, "global_step": 123245, "epoch": 2934} {"train_loss": -6.645064830780029, "global_step": 123246, "epoch": 2934} {"train_loss": -6.485872745513916, "global_step": 123247, "epoch": 2934} {"train_loss": -6.514153480529785, "global_step": 123248, "epoch": 2934} {"train_loss": -6.442981719970703, "global_step": 123249, "epoch": 2934} {"train_loss": -6.456542015075684, "global_step": 123250, "epoch": 2934} {"train_loss": -6.640587329864502, "global_step": 123251, "epoch": 2934} {"train_loss": -6.466307163238525, "global_step": 123252, "epoch": 2934} {"train_loss": -6.4641828536987305, "global_step": 123253, "epoch": 2934} {"train_loss": -6.505117893218994, "global_step": 123254, "epoch": 2934} {"train_loss": -6.3900370597839355, "global_step": 123255, "epoch": 2934} {"train_loss": -6.42538595199585, "global_step": 123256, "epoch": 2934} {"train_loss": -6.552175521850586, "global_step": 123257, "epoch": 2934} {"train_loss": -6.504015922546387, "global_step": 123258, "epoch": 2934} {"train_loss": -6.518606662750244, "global_step": 123259, "epoch": 2934} {"train_loss": -6.377509117126465, "global_step": 123260, "epoch": 2934} {"train_loss": -6.372647762298584, "global_step": 123261, "epoch": 2934} {"train_loss": -6.462366104125977, "global_step": 123262, "epoch": 2934} {"train_loss": -6.5529327392578125, "global_step": 123263, "epoch": 2934} {"train_loss": -6.5331573486328125, "global_step": 123264, "epoch": 2934} {"train_loss": -6.574366569519043, "global_step": 123265, "epoch": 2934} {"train_loss": -6.6171064376831055, "global_step": 123266, "epoch": 2934} {"train_loss": -6.519827842712402, "global_step": 123267, "epoch": 2934} {"train_loss": -6.502361297607422, "global_step": 123268, "epoch": 2934} {"train_loss": -6.544509478977749, "global_step": 123269, "epoch": 2934, "val_loss": 77248.3046875} {"train_loss": -6.610701084136963, "global_step": 123270, "epoch": 2935} {"train_loss": -6.536903381347656, "global_step": 123271, "epoch": 2935} {"train_loss": -6.591969966888428, "global_step": 123272, "epoch": 2935} {"train_loss": -6.562039375305176, "global_step": 123273, "epoch": 2935} {"train_loss": -6.566951751708984, "global_step": 123274, "epoch": 2935} {"train_loss": -6.529611110687256, "global_step": 123275, "epoch": 2935} {"train_loss": -6.452336311340332, "global_step": 123276, "epoch": 2935} {"train_loss": -6.593569755554199, "global_step": 123277, "epoch": 2935} {"train_loss": -6.634592533111572, "global_step": 123278, "epoch": 2935} {"train_loss": -6.643550872802734, "global_step": 123279, "epoch": 2935} {"train_loss": -6.592325687408447, "global_step": 123280, "epoch": 2935} {"train_loss": -6.543667793273926, "global_step": 123281, "epoch": 2935} {"train_loss": -6.651163101196289, "global_step": 123282, "epoch": 2935} {"train_loss": -6.487386703491211, "global_step": 123283, "epoch": 2935} {"train_loss": -6.6528730392456055, "global_step": 123284, "epoch": 2935} {"train_loss": -6.64891242980957, "global_step": 123285, "epoch": 2935} {"train_loss": -6.674302101135254, "global_step": 123286, "epoch": 2935} {"train_loss": -6.798700332641602, "global_step": 123287, "epoch": 2935} {"train_loss": -6.547940254211426, "global_step": 123288, "epoch": 2935} {"train_loss": -6.616603851318359, "global_step": 123289, "epoch": 2935} {"train_loss": -6.635989189147949, "global_step": 123290, "epoch": 2935} {"train_loss": -6.614019393920898, "global_step": 123291, "epoch": 2935} {"train_loss": -6.660438537597656, "global_step": 123292, "epoch": 2935} {"train_loss": -6.566262722015381, "global_step": 123293, "epoch": 2935} {"train_loss": -6.56281852722168, "global_step": 123294, "epoch": 2935} {"train_loss": -6.626675128936768, "global_step": 123295, "epoch": 2935} {"train_loss": -6.473241329193115, "global_step": 123296, "epoch": 2935} {"train_loss": -6.679659843444824, "global_step": 123297, "epoch": 2935} {"train_loss": -6.701413154602051, "global_step": 123298, "epoch": 2935} {"train_loss": -6.648326873779297, "global_step": 123299, "epoch": 2935} {"train_loss": -6.632665634155273, "global_step": 123300, "epoch": 2935} {"train_loss": -6.670810699462891, "global_step": 123301, "epoch": 2935} {"train_loss": -6.613011837005615, "global_step": 123302, "epoch": 2935} {"train_loss": -6.686933994293213, "global_step": 123303, "epoch": 2935} {"train_loss": -6.555330276489258, "global_step": 123304, "epoch": 2935} {"train_loss": -6.779913902282715, "global_step": 123305, "epoch": 2935} {"train_loss": -6.537213325500488, "global_step": 123306, "epoch": 2935} {"train_loss": -6.64066219329834, "global_step": 123307, "epoch": 2935} {"train_loss": -6.659337043762207, "global_step": 123308, "epoch": 2935} {"train_loss": -6.725507736206055, "global_step": 123309, "epoch": 2935} {"train_loss": -6.532233238220215, "global_step": 123310, "epoch": 2935} {"train_loss": -6.6143724123636884, "global_step": 123311, "epoch": 2935, "val_loss": 76962.8515625} {"train_loss": -6.601438045501709, "global_step": 123312, "epoch": 2936} {"train_loss": -6.581801414489746, "global_step": 123313, "epoch": 2936} {"train_loss": -6.616813659667969, "global_step": 123314, "epoch": 2936} {"train_loss": -6.737046241760254, "global_step": 123315, "epoch": 2936} {"train_loss": -6.666999340057373, "global_step": 123316, "epoch": 2936} {"train_loss": -6.588727951049805, "global_step": 123317, "epoch": 2936} {"train_loss": -6.666584014892578, "global_step": 123318, "epoch": 2936} {"train_loss": -6.788233280181885, "global_step": 123319, "epoch": 2936} {"train_loss": -6.603017807006836, "global_step": 123320, "epoch": 2936} {"train_loss": -6.526446342468262, "global_step": 123321, "epoch": 2936} {"train_loss": -6.64687442779541, "global_step": 123322, "epoch": 2936} {"train_loss": -6.56725549697876, "global_step": 123323, "epoch": 2936} {"train_loss": -6.7002410888671875, "global_step": 123324, "epoch": 2936} {"train_loss": -6.61462926864624, "global_step": 123325, "epoch": 2936} {"train_loss": -6.464183807373047, "global_step": 123326, "epoch": 2936} {"train_loss": -6.489011287689209, "global_step": 123327, "epoch": 2936} {"train_loss": -6.593915939331055, "global_step": 123328, "epoch": 2936} {"train_loss": -6.523157119750977, "global_step": 123329, "epoch": 2936} {"train_loss": -6.694360733032227, "global_step": 123330, "epoch": 2936} {"train_loss": -6.602662086486816, "global_step": 123331, "epoch": 2936} {"train_loss": -6.5066704750061035, "global_step": 123332, "epoch": 2936} {"train_loss": -6.57182502746582, "global_step": 123333, "epoch": 2936} {"train_loss": -6.556883811950684, "global_step": 123334, "epoch": 2936} {"train_loss": -6.4310407638549805, "global_step": 123335, "epoch": 2936} {"train_loss": -6.545634746551514, "global_step": 123336, "epoch": 2936} {"train_loss": -6.389008045196533, "global_step": 123337, "epoch": 2936} {"train_loss": -6.626072883605957, "global_step": 123338, "epoch": 2936} {"train_loss": -6.63706636428833, "global_step": 123339, "epoch": 2936} {"train_loss": -6.615326881408691, "global_step": 123340, "epoch": 2936} {"train_loss": -6.57383918762207, "global_step": 123341, "epoch": 2936} {"train_loss": -6.592945575714111, "global_step": 123342, "epoch": 2936} {"train_loss": -6.475064277648926, "global_step": 123343, "epoch": 2936} {"train_loss": -6.565661430358887, "global_step": 123344, "epoch": 2936} {"train_loss": -6.674311637878418, "global_step": 123345, "epoch": 2936} {"train_loss": -6.478710174560547, "global_step": 123346, "epoch": 2936} {"train_loss": -6.4867353439331055, "global_step": 123347, "epoch": 2936} {"train_loss": -6.680489540100098, "global_step": 123348, "epoch": 2936} {"train_loss": -6.538081645965576, "global_step": 123349, "epoch": 2936} {"train_loss": -6.571874141693115, "global_step": 123350, "epoch": 2936} {"train_loss": -6.49403190612793, "global_step": 123351, "epoch": 2936} {"train_loss": -6.550909996032715, "global_step": 123352, "epoch": 2936} {"train_loss": -6.5831971282050725, "global_step": 123353, "epoch": 2936, "val_loss": 77139.625} {"train_loss": -6.663643836975098, "global_step": 123354, "epoch": 2937} {"train_loss": -6.6261444091796875, "global_step": 123355, "epoch": 2937} {"train_loss": -6.547761917114258, "global_step": 123356, "epoch": 2937} {"train_loss": -6.516175270080566, "global_step": 123357, "epoch": 2937} {"train_loss": -6.465106964111328, "global_step": 123358, "epoch": 2937} {"train_loss": -6.547570705413818, "global_step": 123359, "epoch": 2937} {"train_loss": -6.6258111000061035, "global_step": 123360, "epoch": 2937} {"train_loss": -6.575136184692383, "global_step": 123361, "epoch": 2937} {"train_loss": -6.6804375648498535, "global_step": 123362, "epoch": 2937} {"train_loss": -6.529767990112305, "global_step": 123363, "epoch": 2937} {"train_loss": -6.604523658752441, "global_step": 123364, "epoch": 2937} {"train_loss": -6.696837425231934, "global_step": 123365, "epoch": 2937} {"train_loss": -6.487136363983154, "global_step": 123366, "epoch": 2937} {"train_loss": -6.620488166809082, "global_step": 123367, "epoch": 2937} {"train_loss": -6.732544422149658, "global_step": 123368, "epoch": 2937} {"train_loss": -6.7005205154418945, "global_step": 123369, "epoch": 2937} {"train_loss": -6.585509300231934, "global_step": 123370, "epoch": 2937} {"train_loss": -6.561110973358154, "global_step": 123371, "epoch": 2937} {"train_loss": -6.629537582397461, "global_step": 123372, "epoch": 2937} {"train_loss": -6.698127746582031, "global_step": 123373, "epoch": 2937} {"train_loss": -6.612368583679199, "global_step": 123374, "epoch": 2937} {"train_loss": -6.597582817077637, "global_step": 123375, "epoch": 2937} {"train_loss": -6.735255718231201, "global_step": 123376, "epoch": 2937} {"train_loss": -6.520064353942871, "global_step": 123377, "epoch": 2937} {"train_loss": -6.5235161781311035, "global_step": 123378, "epoch": 2937} {"train_loss": -6.5509538650512695, "global_step": 123379, "epoch": 2937} {"train_loss": -6.624449729919434, "global_step": 123380, "epoch": 2937} {"train_loss": -6.698563575744629, "global_step": 123381, "epoch": 2937} {"train_loss": -6.66337251663208, "global_step": 123382, "epoch": 2937} {"train_loss": -6.647094249725342, "global_step": 123383, "epoch": 2937} {"train_loss": -6.565446376800537, "global_step": 123384, "epoch": 2937} {"train_loss": -6.605539798736572, "global_step": 123385, "epoch": 2937} {"train_loss": -6.62161922454834, "global_step": 123386, "epoch": 2937} {"train_loss": -6.644930839538574, "global_step": 123387, "epoch": 2937} {"train_loss": -6.592616081237793, "global_step": 123388, "epoch": 2937} {"train_loss": -6.660584449768066, "global_step": 123389, "epoch": 2937} {"train_loss": -6.595849514007568, "global_step": 123390, "epoch": 2937} {"train_loss": -6.738916873931885, "global_step": 123391, "epoch": 2937} {"train_loss": -6.597421169281006, "global_step": 123392, "epoch": 2937} {"train_loss": -6.636001110076904, "global_step": 123393, "epoch": 2937} {"train_loss": -6.617828369140625, "global_step": 123394, "epoch": 2937} {"train_loss": -6.615429685229347, "global_step": 123395, "epoch": 2937, "val_loss": 76949.1484375} {"train_loss": -6.611921310424805, "global_step": 123396, "epoch": 2938} {"train_loss": -6.705937385559082, "global_step": 123397, "epoch": 2938} {"train_loss": -6.726309776306152, "global_step": 123398, "epoch": 2938} {"train_loss": -6.647823810577393, "global_step": 123399, "epoch": 2938} {"train_loss": -6.6366987228393555, "global_step": 123400, "epoch": 2938} {"train_loss": -6.693248748779297, "global_step": 123401, "epoch": 2938} {"train_loss": -6.6380109786987305, "global_step": 123402, "epoch": 2938} {"train_loss": -6.563888072967529, "global_step": 123403, "epoch": 2938} {"train_loss": -6.663908958435059, "global_step": 123404, "epoch": 2938} {"train_loss": -6.61573600769043, "global_step": 123405, "epoch": 2938} {"train_loss": -6.505715370178223, "global_step": 123406, "epoch": 2938} {"train_loss": -6.591648101806641, "global_step": 123407, "epoch": 2938} {"train_loss": -6.57785701751709, "global_step": 123408, "epoch": 2938} {"train_loss": -6.655385971069336, "global_step": 123409, "epoch": 2938} {"train_loss": -6.448461532592773, "global_step": 123410, "epoch": 2938} {"train_loss": -6.573876857757568, "global_step": 123411, "epoch": 2938} {"train_loss": -6.602476119995117, "global_step": 123412, "epoch": 2938} {"train_loss": -6.554516792297363, "global_step": 123413, "epoch": 2938} {"train_loss": -6.726617813110352, "global_step": 123414, "epoch": 2938} {"train_loss": -6.5254034996032715, "global_step": 123415, "epoch": 2938} {"train_loss": -6.609062194824219, "global_step": 123416, "epoch": 2938} {"train_loss": -6.700556755065918, "global_step": 123417, "epoch": 2938} {"train_loss": -6.719297885894775, "global_step": 123418, "epoch": 2938} {"train_loss": -6.552101135253906, "global_step": 123419, "epoch": 2938} {"train_loss": -6.628409385681152, "global_step": 123420, "epoch": 2938} {"train_loss": -6.712141990661621, "global_step": 123421, "epoch": 2938} {"train_loss": -6.608522891998291, "global_step": 123422, "epoch": 2938} {"train_loss": -6.713266372680664, "global_step": 123423, "epoch": 2938} {"train_loss": -6.636723041534424, "global_step": 123424, "epoch": 2938} {"train_loss": -6.526660919189453, "global_step": 123425, "epoch": 2938} {"train_loss": -6.693968296051025, "global_step": 123426, "epoch": 2938} {"train_loss": -6.461565017700195, "global_step": 123427, "epoch": 2938} {"train_loss": -6.545876502990723, "global_step": 123428, "epoch": 2938} {"train_loss": -6.591860771179199, "global_step": 123429, "epoch": 2938} {"train_loss": -6.65297794342041, "global_step": 123430, "epoch": 2938} {"train_loss": -6.629878997802734, "global_step": 123431, "epoch": 2938} {"train_loss": -6.756209373474121, "global_step": 123432, "epoch": 2938} {"train_loss": -6.619335174560547, "global_step": 123433, "epoch": 2938} {"train_loss": -6.713796615600586, "global_step": 123434, "epoch": 2938} {"train_loss": -6.563141822814941, "global_step": 123435, "epoch": 2938} {"train_loss": -6.547818183898926, "global_step": 123436, "epoch": 2938} {"train_loss": -6.619543132327852, "global_step": 123437, "epoch": 2938, "val_loss": 77224.484375} {"train_loss": -6.590911865234375, "global_step": 123438, "epoch": 2939} {"train_loss": -6.582911491394043, "global_step": 123439, "epoch": 2939} {"train_loss": -6.611371040344238, "global_step": 123440, "epoch": 2939} {"train_loss": -6.66389274597168, "global_step": 123441, "epoch": 2939} {"train_loss": -6.582150459289551, "global_step": 123442, "epoch": 2939} {"train_loss": -6.675987720489502, "global_step": 123443, "epoch": 2939} {"train_loss": -6.438743591308594, "global_step": 123444, "epoch": 2939} {"train_loss": -6.519012451171875, "global_step": 123445, "epoch": 2939} {"train_loss": -6.667810916900635, "global_step": 123446, "epoch": 2939} {"train_loss": -6.519603729248047, "global_step": 123447, "epoch": 2939} {"train_loss": -6.691799163818359, "global_step": 123448, "epoch": 2939} {"train_loss": -6.6347880363464355, "global_step": 123449, "epoch": 2939} {"train_loss": -6.544508934020996, "global_step": 123450, "epoch": 2939} {"train_loss": -6.460625171661377, "global_step": 123451, "epoch": 2939} {"train_loss": -6.669284343719482, "global_step": 123452, "epoch": 2939} {"train_loss": -6.5157904624938965, "global_step": 123453, "epoch": 2939} {"train_loss": -6.574934959411621, "global_step": 123454, "epoch": 2939} {"train_loss": -6.489013195037842, "global_step": 123455, "epoch": 2939} {"train_loss": -6.552308082580566, "global_step": 123456, "epoch": 2939} {"train_loss": -6.606276035308838, "global_step": 123457, "epoch": 2939} {"train_loss": -6.510674476623535, "global_step": 123458, "epoch": 2939} {"train_loss": -6.5999436378479, "global_step": 123459, "epoch": 2939} {"train_loss": -6.5220513343811035, "global_step": 123460, "epoch": 2939} {"train_loss": -6.401709079742432, "global_step": 123461, "epoch": 2939} {"train_loss": -6.430782318115234, "global_step": 123462, "epoch": 2939} {"train_loss": -6.525301933288574, "global_step": 123463, "epoch": 2939} {"train_loss": -6.5420026779174805, "global_step": 123464, "epoch": 2939} {"train_loss": -6.373823642730713, "global_step": 123465, "epoch": 2939} {"train_loss": -6.5263566970825195, "global_step": 123466, "epoch": 2939} {"train_loss": -6.4220733642578125, "global_step": 123467, "epoch": 2939} {"train_loss": -6.369448661804199, "global_step": 123468, "epoch": 2939} {"train_loss": -6.371249198913574, "global_step": 123469, "epoch": 2939} {"train_loss": -6.523630142211914, "global_step": 123470, "epoch": 2939} {"train_loss": -6.394002914428711, "global_step": 123471, "epoch": 2939} {"train_loss": -6.612759590148926, "global_step": 123472, "epoch": 2939} {"train_loss": -6.364663600921631, "global_step": 123473, "epoch": 2939} {"train_loss": -6.481174468994141, "global_step": 123474, "epoch": 2939} {"train_loss": -6.461122512817383, "global_step": 123475, "epoch": 2939} {"train_loss": -6.517179012298584, "global_step": 123476, "epoch": 2939} {"train_loss": -6.431097984313965, "global_step": 123477, "epoch": 2939} {"train_loss": -6.539671897888184, "global_step": 123478, "epoch": 2939} {"train_loss": -6.524813402266729, "global_step": 123479, "epoch": 2939, "val_loss": 77008.1328125} {"train_loss": -6.624659538269043, "global_step": 123480, "epoch": 2940} {"train_loss": -6.622419357299805, "global_step": 123481, "epoch": 2940} {"train_loss": -6.662966728210449, "global_step": 123482, "epoch": 2940} {"train_loss": -6.628668785095215, "global_step": 123483, "epoch": 2940} {"train_loss": -6.595756530761719, "global_step": 123484, "epoch": 2940} {"train_loss": -6.513643741607666, "global_step": 123485, "epoch": 2940} {"train_loss": -6.562469482421875, "global_step": 123486, "epoch": 2940} {"train_loss": -6.673135757446289, "global_step": 123487, "epoch": 2940} {"train_loss": -6.555505752563477, "global_step": 123488, "epoch": 2940} {"train_loss": -6.612044334411621, "global_step": 123489, "epoch": 2940} {"train_loss": -6.538873672485352, "global_step": 123490, "epoch": 2940} {"train_loss": -6.670401573181152, "global_step": 123491, "epoch": 2940} {"train_loss": -6.6117095947265625, "global_step": 123492, "epoch": 2940} {"train_loss": -6.572453022003174, "global_step": 123493, "epoch": 2940} {"train_loss": -6.462489604949951, "global_step": 123494, "epoch": 2940} {"train_loss": -6.574285984039307, "global_step": 123495, "epoch": 2940} {"train_loss": -6.5427422523498535, "global_step": 123496, "epoch": 2940} {"train_loss": -6.573345184326172, "global_step": 123497, "epoch": 2940} {"train_loss": -6.560855865478516, "global_step": 123498, "epoch": 2940} {"train_loss": -6.415661811828613, "global_step": 123499, "epoch": 2940} {"train_loss": -6.609777450561523, "global_step": 123500, "epoch": 2940} {"train_loss": -6.63584566116333, "global_step": 123501, "epoch": 2940} {"train_loss": -6.556167125701904, "global_step": 123502, "epoch": 2940} {"train_loss": -6.533384323120117, "global_step": 123503, "epoch": 2940} {"train_loss": -6.561305999755859, "global_step": 123504, "epoch": 2940} {"train_loss": -6.442479133605957, "global_step": 123505, "epoch": 2940} {"train_loss": -6.631589412689209, "global_step": 123506, "epoch": 2940} {"train_loss": -6.534787178039551, "global_step": 123507, "epoch": 2940} {"train_loss": -6.636619567871094, "global_step": 123508, "epoch": 2940} {"train_loss": -6.560415744781494, "global_step": 123509, "epoch": 2940} {"train_loss": -6.5560102462768555, "global_step": 123510, "epoch": 2940} {"train_loss": -6.628820419311523, "global_step": 123511, "epoch": 2940} {"train_loss": -6.563358783721924, "global_step": 123512, "epoch": 2940} {"train_loss": -6.59925651550293, "global_step": 123513, "epoch": 2940} {"train_loss": -6.513145446777344, "global_step": 123514, "epoch": 2940} {"train_loss": -6.650088310241699, "global_step": 123515, "epoch": 2940} {"train_loss": -6.5891523361206055, "global_step": 123516, "epoch": 2940} {"train_loss": -6.543356418609619, "global_step": 123517, "epoch": 2940} {"train_loss": -6.578091621398926, "global_step": 123518, "epoch": 2940} {"train_loss": -6.581748008728027, "global_step": 123519, "epoch": 2940} {"train_loss": -6.526164531707764, "global_step": 123520, "epoch": 2940} {"train_loss": -6.577194509052095, "global_step": 123521, "epoch": 2940, "val_loss": 77020.5859375} {"train_loss": -6.668854713439941, "global_step": 123522, "epoch": 2941} {"train_loss": -6.675212383270264, "global_step": 123523, "epoch": 2941} {"train_loss": -6.552369117736816, "global_step": 123524, "epoch": 2941} {"train_loss": -6.664362907409668, "global_step": 123525, "epoch": 2941} {"train_loss": -6.661806106567383, "global_step": 123526, "epoch": 2941} {"train_loss": -6.537035942077637, "global_step": 123527, "epoch": 2941} {"train_loss": -6.660788536071777, "global_step": 123528, "epoch": 2941} {"train_loss": -6.618310928344727, "global_step": 123529, "epoch": 2941} {"train_loss": -6.621580123901367, "global_step": 123530, "epoch": 2941} {"train_loss": -6.448337554931641, "global_step": 123531, "epoch": 2941} {"train_loss": -6.4767889976501465, "global_step": 123532, "epoch": 2941} {"train_loss": -6.722373008728027, "global_step": 123533, "epoch": 2941} {"train_loss": -6.424018383026123, "global_step": 123534, "epoch": 2941} {"train_loss": -6.49583625793457, "global_step": 123535, "epoch": 2941} {"train_loss": -6.663351535797119, "global_step": 123536, "epoch": 2941} {"train_loss": -6.517775058746338, "global_step": 123537, "epoch": 2941} {"train_loss": -6.504641532897949, "global_step": 123538, "epoch": 2941} {"train_loss": -6.402626037597656, "global_step": 123539, "epoch": 2941} {"train_loss": -6.46103572845459, "global_step": 123540, "epoch": 2941} {"train_loss": -6.368368148803711, "global_step": 123541, "epoch": 2941} {"train_loss": -6.644350051879883, "global_step": 123542, "epoch": 2941} {"train_loss": -6.420060634613037, "global_step": 123543, "epoch": 2941} {"train_loss": -6.568037509918213, "global_step": 123544, "epoch": 2941} {"train_loss": -6.338319778442383, "global_step": 123545, "epoch": 2941} {"train_loss": -6.506329536437988, "global_step": 123546, "epoch": 2941} {"train_loss": -6.513313293457031, "global_step": 123547, "epoch": 2941} {"train_loss": -6.485224723815918, "global_step": 123548, "epoch": 2941} {"train_loss": -6.435637474060059, "global_step": 123549, "epoch": 2941} {"train_loss": -6.484323501586914, "global_step": 123550, "epoch": 2941} {"train_loss": -6.483882427215576, "global_step": 123551, "epoch": 2941} {"train_loss": -6.475810527801514, "global_step": 123552, "epoch": 2941} {"train_loss": -6.549909591674805, "global_step": 123553, "epoch": 2941} {"train_loss": -6.584382057189941, "global_step": 123554, "epoch": 2941} {"train_loss": -6.438255310058594, "global_step": 123555, "epoch": 2941} {"train_loss": -6.5401930809021, "global_step": 123556, "epoch": 2941} {"train_loss": -6.630424499511719, "global_step": 123557, "epoch": 2941} {"train_loss": -6.597862243652344, "global_step": 123558, "epoch": 2941} {"train_loss": -6.618703842163086, "global_step": 123559, "epoch": 2941} {"train_loss": -6.516523361206055, "global_step": 123560, "epoch": 2941} {"train_loss": -6.563353061676025, "global_step": 123561, "epoch": 2941} {"train_loss": -6.549001693725586, "global_step": 123562, "epoch": 2941} {"train_loss": -6.540233736946469, "global_step": 123563, "epoch": 2941, "val_loss": 77082.9609375} {"train_loss": -6.649072647094727, "global_step": 123564, "epoch": 2942} {"train_loss": -6.5642313957214355, "global_step": 123565, "epoch": 2942} {"train_loss": -6.472527027130127, "global_step": 123566, "epoch": 2942} {"train_loss": -6.584300994873047, "global_step": 123567, "epoch": 2942} {"train_loss": -6.492094993591309, "global_step": 123568, "epoch": 2942} {"train_loss": -6.6801629066467285, "global_step": 123569, "epoch": 2942} {"train_loss": -6.597624778747559, "global_step": 123570, "epoch": 2942} {"train_loss": -6.529945373535156, "global_step": 123571, "epoch": 2942} {"train_loss": -6.670705795288086, "global_step": 123572, "epoch": 2942} {"train_loss": -6.548696041107178, "global_step": 123573, "epoch": 2942} {"train_loss": -6.576160430908203, "global_step": 123574, "epoch": 2942} {"train_loss": -6.554915428161621, "global_step": 123575, "epoch": 2942} {"train_loss": -6.558594226837158, "global_step": 123576, "epoch": 2942} {"train_loss": -6.593363285064697, "global_step": 123577, "epoch": 2942} {"train_loss": -6.501346588134766, "global_step": 123578, "epoch": 2942} {"train_loss": -6.64256477355957, "global_step": 123579, "epoch": 2942} {"train_loss": -6.529645919799805, "global_step": 123580, "epoch": 2942} {"train_loss": -6.531329154968262, "global_step": 123581, "epoch": 2942} {"train_loss": -6.531567573547363, "global_step": 123582, "epoch": 2942} {"train_loss": -6.608206748962402, "global_step": 123583, "epoch": 2942} {"train_loss": -6.63441276550293, "global_step": 123584, "epoch": 2942} {"train_loss": -6.689761638641357, "global_step": 123585, "epoch": 2942} {"train_loss": -6.526754379272461, "global_step": 123586, "epoch": 2942} {"train_loss": -6.647851467132568, "global_step": 123587, "epoch": 2942} {"train_loss": -6.59653902053833, "global_step": 123588, "epoch": 2942} {"train_loss": -6.568140029907227, "global_step": 123589, "epoch": 2942} {"train_loss": -6.715298652648926, "global_step": 123590, "epoch": 2942} {"train_loss": -6.460611820220947, "global_step": 123591, "epoch": 2942} {"train_loss": -6.636269569396973, "global_step": 123592, "epoch": 2942} {"train_loss": -6.510351657867432, "global_step": 123593, "epoch": 2942} {"train_loss": -6.6684041023254395, "global_step": 123594, "epoch": 2942} {"train_loss": -6.610402584075928, "global_step": 123595, "epoch": 2942} {"train_loss": -6.54379940032959, "global_step": 123596, "epoch": 2942} {"train_loss": -6.5837483406066895, "global_step": 123597, "epoch": 2942} {"train_loss": -6.716716289520264, "global_step": 123598, "epoch": 2942} {"train_loss": -6.543868064880371, "global_step": 123599, "epoch": 2942} {"train_loss": -6.5891828536987305, "global_step": 123600, "epoch": 2942} {"train_loss": -6.639229774475098, "global_step": 123601, "epoch": 2942} {"train_loss": -6.673648357391357, "global_step": 123602, "epoch": 2942} {"train_loss": -6.62033748626709, "global_step": 123603, "epoch": 2942} {"train_loss": -6.631988048553467, "global_step": 123604, "epoch": 2942} {"train_loss": -6.59215910094125, "global_step": 123605, "epoch": 2942, "val_loss": 76931.8046875} {"train_loss": -6.684536933898926, "global_step": 123606, "epoch": 2943} {"train_loss": -6.629859924316406, "global_step": 123607, "epoch": 2943} {"train_loss": -6.577212333679199, "global_step": 123608, "epoch": 2943} {"train_loss": -6.593635559082031, "global_step": 123609, "epoch": 2943} {"train_loss": -6.528680801391602, "global_step": 123610, "epoch": 2943} {"train_loss": -6.567339897155762, "global_step": 123611, "epoch": 2943} {"train_loss": -6.519953727722168, "global_step": 123612, "epoch": 2943} {"train_loss": -6.610409259796143, "global_step": 123613, "epoch": 2943} {"train_loss": -6.532790184020996, "global_step": 123614, "epoch": 2943} {"train_loss": -6.548738479614258, "global_step": 123615, "epoch": 2943} {"train_loss": -6.540865421295166, "global_step": 123616, "epoch": 2943} {"train_loss": -6.550295829772949, "global_step": 123617, "epoch": 2943} {"train_loss": -6.553081035614014, "global_step": 123618, "epoch": 2943} {"train_loss": -6.591133117675781, "global_step": 123619, "epoch": 2943} {"train_loss": -6.653779029846191, "global_step": 123620, "epoch": 2943} {"train_loss": -6.547285556793213, "global_step": 123621, "epoch": 2943} {"train_loss": -6.646755218505859, "global_step": 123622, "epoch": 2943} {"train_loss": -6.574810981750488, "global_step": 123623, "epoch": 2943} {"train_loss": -6.528997421264648, "global_step": 123624, "epoch": 2943} {"train_loss": -6.679248809814453, "global_step": 123625, "epoch": 2943} {"train_loss": -6.612193584442139, "global_step": 123626, "epoch": 2943} {"train_loss": -6.763550758361816, "global_step": 123627, "epoch": 2943} {"train_loss": -6.624488353729248, "global_step": 123628, "epoch": 2943} {"train_loss": -6.642094135284424, "global_step": 123629, "epoch": 2943} {"train_loss": -6.524484634399414, "global_step": 123630, "epoch": 2943} {"train_loss": -6.612015724182129, "global_step": 123631, "epoch": 2943} {"train_loss": -6.646340847015381, "global_step": 123632, "epoch": 2943} {"train_loss": -6.578451156616211, "global_step": 123633, "epoch": 2943} {"train_loss": -6.673139572143555, "global_step": 123634, "epoch": 2943} {"train_loss": -6.544588088989258, "global_step": 123635, "epoch": 2943} {"train_loss": -6.670992851257324, "global_step": 123636, "epoch": 2943} {"train_loss": -6.608365058898926, "global_step": 123637, "epoch": 2943} {"train_loss": -6.667632579803467, "global_step": 123638, "epoch": 2943} {"train_loss": -6.637409210205078, "global_step": 123639, "epoch": 2943} {"train_loss": -6.5588788986206055, "global_step": 123640, "epoch": 2943} {"train_loss": -6.55003023147583, "global_step": 123641, "epoch": 2943} {"train_loss": -6.708076477050781, "global_step": 123642, "epoch": 2943} {"train_loss": -6.597029209136963, "global_step": 123643, "epoch": 2943} {"train_loss": -6.524894714355469, "global_step": 123644, "epoch": 2943} {"train_loss": -6.642760276794434, "global_step": 123645, "epoch": 2943} {"train_loss": -6.676279544830322, "global_step": 123646, "epoch": 2943} {"train_loss": -6.602567843028477, "global_step": 123647, "epoch": 2943, "val_loss": 77105.2890625} {"train_loss": -6.6250200271606445, "global_step": 123648, "epoch": 2944} {"train_loss": -6.633340835571289, "global_step": 123649, "epoch": 2944} {"train_loss": -6.721757888793945, "global_step": 123650, "epoch": 2944} {"train_loss": -6.592121124267578, "global_step": 123651, "epoch": 2944} {"train_loss": -6.689265727996826, "global_step": 123652, "epoch": 2944} {"train_loss": -6.690882682800293, "global_step": 123653, "epoch": 2944} {"train_loss": -6.705852508544922, "global_step": 123654, "epoch": 2944} {"train_loss": -6.7024078369140625, "global_step": 123655, "epoch": 2944} {"train_loss": -6.761906623840332, "global_step": 123656, "epoch": 2944} {"train_loss": -6.632364273071289, "global_step": 123657, "epoch": 2944} {"train_loss": -6.640766143798828, "global_step": 123658, "epoch": 2944} {"train_loss": -6.7093915939331055, "global_step": 123659, "epoch": 2944} {"train_loss": -6.726855754852295, "global_step": 123660, "epoch": 2944} {"train_loss": -6.646079063415527, "global_step": 123661, "epoch": 2944} {"train_loss": -6.7094292640686035, "global_step": 123662, "epoch": 2944} {"train_loss": -6.551277160644531, "global_step": 123663, "epoch": 2944} {"train_loss": -6.681091785430908, "global_step": 123664, "epoch": 2944} {"train_loss": -6.614529132843018, "global_step": 123665, "epoch": 2944} {"train_loss": -6.571218490600586, "global_step": 123666, "epoch": 2944} {"train_loss": -6.675100326538086, "global_step": 123667, "epoch": 2944} {"train_loss": -6.651632308959961, "global_step": 123668, "epoch": 2944} {"train_loss": -6.686272621154785, "global_step": 123669, "epoch": 2944} {"train_loss": -6.495083808898926, "global_step": 123670, "epoch": 2944} {"train_loss": -6.605388641357422, "global_step": 123671, "epoch": 2944} {"train_loss": -6.5757341384887695, "global_step": 123672, "epoch": 2944} {"train_loss": -6.603724956512451, "global_step": 123673, "epoch": 2944} {"train_loss": -6.654604434967041, "global_step": 123674, "epoch": 2944} {"train_loss": -6.577908992767334, "global_step": 123675, "epoch": 2944} {"train_loss": -6.644669055938721, "global_step": 123676, "epoch": 2944} {"train_loss": -6.619419097900391, "global_step": 123677, "epoch": 2944} {"train_loss": -6.706784248352051, "global_step": 123678, "epoch": 2944} {"train_loss": -6.587323188781738, "global_step": 123679, "epoch": 2944} {"train_loss": -6.567162990570068, "global_step": 123680, "epoch": 2944} {"train_loss": -6.477097988128662, "global_step": 123681, "epoch": 2944} {"train_loss": -6.633943557739258, "global_step": 123682, "epoch": 2944} {"train_loss": -6.641088008880615, "global_step": 123683, "epoch": 2944} {"train_loss": -6.580099105834961, "global_step": 123684, "epoch": 2944} {"train_loss": -6.626899719238281, "global_step": 123685, "epoch": 2944} {"train_loss": -6.6135711669921875, "global_step": 123686, "epoch": 2944} {"train_loss": -6.617871284484863, "global_step": 123687, "epoch": 2944} {"train_loss": -6.571088790893555, "global_step": 123688, "epoch": 2944} {"train_loss": -6.634663082304455, "global_step": 123689, "epoch": 2944, "val_loss": 77185.640625} {"train_loss": -6.599499225616455, "global_step": 123690, "epoch": 2945} {"train_loss": -6.638326644897461, "global_step": 123691, "epoch": 2945} {"train_loss": -6.683811664581299, "global_step": 123692, "epoch": 2945} {"train_loss": -6.618875503540039, "global_step": 123693, "epoch": 2945} {"train_loss": -6.52424430847168, "global_step": 123694, "epoch": 2945} {"train_loss": -6.602657318115234, "global_step": 123695, "epoch": 2945} {"train_loss": -6.5895676612854, "global_step": 123696, "epoch": 2945} {"train_loss": -6.519534111022949, "global_step": 123697, "epoch": 2945} {"train_loss": -6.7438645362854, "global_step": 123698, "epoch": 2945} {"train_loss": -6.604629993438721, "global_step": 123699, "epoch": 2945} {"train_loss": -6.728054046630859, "global_step": 123700, "epoch": 2945} {"train_loss": -6.6522908210754395, "global_step": 123701, "epoch": 2945} {"train_loss": -6.570300102233887, "global_step": 123702, "epoch": 2945} {"train_loss": -6.564058303833008, "global_step": 123703, "epoch": 2945} {"train_loss": -6.634589672088623, "global_step": 123704, "epoch": 2945} {"train_loss": -6.709722518920898, "global_step": 123705, "epoch": 2945} {"train_loss": -6.5957536697387695, "global_step": 123706, "epoch": 2945} {"train_loss": -6.698470592498779, "global_step": 123707, "epoch": 2945} {"train_loss": -6.570972919464111, "global_step": 123708, "epoch": 2945} {"train_loss": -6.621028900146484, "global_step": 123709, "epoch": 2945} {"train_loss": -6.631490230560303, "global_step": 123710, "epoch": 2945} {"train_loss": -6.649826526641846, "global_step": 123711, "epoch": 2945} {"train_loss": -6.649013519287109, "global_step": 123712, "epoch": 2945} {"train_loss": -6.653074264526367, "global_step": 123713, "epoch": 2945} {"train_loss": -6.495818138122559, "global_step": 123714, "epoch": 2945} {"train_loss": -6.612736701965332, "global_step": 123715, "epoch": 2945} {"train_loss": -6.559865951538086, "global_step": 123716, "epoch": 2945} {"train_loss": -6.681240081787109, "global_step": 123717, "epoch": 2945} {"train_loss": -6.589791297912598, "global_step": 123718, "epoch": 2945} {"train_loss": -6.512884140014648, "global_step": 123719, "epoch": 2945} {"train_loss": -6.519306659698486, "global_step": 123720, "epoch": 2945} {"train_loss": -6.68496036529541, "global_step": 123721, "epoch": 2945} {"train_loss": -6.6624860763549805, "global_step": 123722, "epoch": 2945} {"train_loss": -6.481952667236328, "global_step": 123723, "epoch": 2945} {"train_loss": -6.575456619262695, "global_step": 123724, "epoch": 2945} {"train_loss": -6.645083427429199, "global_step": 123725, "epoch": 2945} {"train_loss": -6.560615539550781, "global_step": 123726, "epoch": 2945} {"train_loss": -6.495136260986328, "global_step": 123727, "epoch": 2945} {"train_loss": -6.59445858001709, "global_step": 123728, "epoch": 2945} {"train_loss": -6.697816848754883, "global_step": 123729, "epoch": 2945} {"train_loss": -6.638391494750977, "global_step": 123730, "epoch": 2945} {"train_loss": -6.612914766584124, "global_step": 123731, "epoch": 2945, "val_loss": 77193.6796875} {"train_loss": -6.52185583114624, "global_step": 123732, "epoch": 2946} {"train_loss": -6.726717948913574, "global_step": 123733, "epoch": 2946} {"train_loss": -6.5729827880859375, "global_step": 123734, "epoch": 2946} {"train_loss": -6.568881034851074, "global_step": 123735, "epoch": 2946} {"train_loss": -6.722932815551758, "global_step": 123736, "epoch": 2946} {"train_loss": -6.578197956085205, "global_step": 123737, "epoch": 2946} {"train_loss": -6.599774360656738, "global_step": 123738, "epoch": 2946} {"train_loss": -6.540799140930176, "global_step": 123739, "epoch": 2946} {"train_loss": -6.616543769836426, "global_step": 123740, "epoch": 2946} {"train_loss": -6.517826080322266, "global_step": 123741, "epoch": 2946} {"train_loss": -6.5288896560668945, "global_step": 123742, "epoch": 2946} {"train_loss": -6.543414115905762, "global_step": 123743, "epoch": 2946} {"train_loss": -6.450441360473633, "global_step": 123744, "epoch": 2946} {"train_loss": -6.631988525390625, "global_step": 123745, "epoch": 2946} {"train_loss": -6.372418403625488, "global_step": 123746, "epoch": 2946} {"train_loss": -6.525653839111328, "global_step": 123747, "epoch": 2946} {"train_loss": -6.413246154785156, "global_step": 123748, "epoch": 2946} {"train_loss": -6.492480754852295, "global_step": 123749, "epoch": 2946} {"train_loss": -6.600558280944824, "global_step": 123750, "epoch": 2946} {"train_loss": -6.5037150382995605, "global_step": 123751, "epoch": 2946} {"train_loss": -6.591086387634277, "global_step": 123752, "epoch": 2946} {"train_loss": -6.419716835021973, "global_step": 123753, "epoch": 2946} {"train_loss": -6.4628005027771, "global_step": 123754, "epoch": 2946} {"train_loss": -6.397247791290283, "global_step": 123755, "epoch": 2946} {"train_loss": -6.555452346801758, "global_step": 123756, "epoch": 2946} {"train_loss": -6.44992733001709, "global_step": 123757, "epoch": 2946} {"train_loss": -6.51876974105835, "global_step": 123758, "epoch": 2946} {"train_loss": -6.4688825607299805, "global_step": 123759, "epoch": 2946} {"train_loss": -6.609334945678711, "global_step": 123760, "epoch": 2946} {"train_loss": -6.5714111328125, "global_step": 123761, "epoch": 2946} {"train_loss": -6.588971138000488, "global_step": 123762, "epoch": 2946} {"train_loss": -6.559948444366455, "global_step": 123763, "epoch": 2946} {"train_loss": -6.485860824584961, "global_step": 123764, "epoch": 2946} {"train_loss": -6.565680503845215, "global_step": 123765, "epoch": 2946} {"train_loss": -6.518779754638672, "global_step": 123766, "epoch": 2946} {"train_loss": -6.519784927368164, "global_step": 123767, "epoch": 2946} {"train_loss": -6.437140464782715, "global_step": 123768, "epoch": 2946} {"train_loss": -6.605286598205566, "global_step": 123769, "epoch": 2946} {"train_loss": -6.50439977645874, "global_step": 123770, "epoch": 2946} {"train_loss": -6.601102828979492, "global_step": 123771, "epoch": 2946} {"train_loss": -6.72608757019043, "global_step": 123772, "epoch": 2946} {"train_loss": -6.543545825140817, "global_step": 123773, "epoch": 2946, "val_loss": 76977.6015625} {"train_loss": -6.7448015213012695, "global_step": 123774, "epoch": 2947} {"train_loss": -6.584879398345947, "global_step": 123775, "epoch": 2947} {"train_loss": -6.6903157234191895, "global_step": 123776, "epoch": 2947} {"train_loss": -6.5985589027404785, "global_step": 123777, "epoch": 2947} {"train_loss": -6.600451946258545, "global_step": 123778, "epoch": 2947} {"train_loss": -6.626570701599121, "global_step": 123779, "epoch": 2947} {"train_loss": -6.5901689529418945, "global_step": 123780, "epoch": 2947} {"train_loss": -6.718108177185059, "global_step": 123781, "epoch": 2947} {"train_loss": -6.575616359710693, "global_step": 123782, "epoch": 2947} {"train_loss": -6.721181392669678, "global_step": 123783, "epoch": 2947} {"train_loss": -6.6143598556518555, "global_step": 123784, "epoch": 2947} {"train_loss": -6.579822063446045, "global_step": 123785, "epoch": 2947} {"train_loss": -6.612481117248535, "global_step": 123786, "epoch": 2947} {"train_loss": -6.549710273742676, "global_step": 123787, "epoch": 2947} {"train_loss": -6.6837239265441895, "global_step": 123788, "epoch": 2947} {"train_loss": -6.631811618804932, "global_step": 123789, "epoch": 2947} {"train_loss": -6.54892110824585, "global_step": 123790, "epoch": 2947} {"train_loss": -6.684253692626953, "global_step": 123791, "epoch": 2947} {"train_loss": -6.656230449676514, "global_step": 123792, "epoch": 2947} {"train_loss": -6.628019332885742, "global_step": 123793, "epoch": 2947} {"train_loss": -6.697569847106934, "global_step": 123794, "epoch": 2947} {"train_loss": -6.774316787719727, "global_step": 123795, "epoch": 2947} {"train_loss": -6.577198028564453, "global_step": 123796, "epoch": 2947} {"train_loss": -6.58688497543335, "global_step": 123797, "epoch": 2947} {"train_loss": -6.588520050048828, "global_step": 123798, "epoch": 2947} {"train_loss": -6.476495742797852, "global_step": 123799, "epoch": 2947} {"train_loss": -6.504518508911133, "global_step": 123800, "epoch": 2947} {"train_loss": -6.559217929840088, "global_step": 123801, "epoch": 2947} {"train_loss": -6.479193687438965, "global_step": 123802, "epoch": 2947} {"train_loss": -6.553280830383301, "global_step": 123803, "epoch": 2947} {"train_loss": -6.368232250213623, "global_step": 123804, "epoch": 2947} {"train_loss": -6.416171550750732, "global_step": 123805, "epoch": 2947} {"train_loss": -6.633694171905518, "global_step": 123806, "epoch": 2947} {"train_loss": -6.4544219970703125, "global_step": 123807, "epoch": 2947} {"train_loss": -6.66069221496582, "global_step": 123808, "epoch": 2947} {"train_loss": -6.424924373626709, "global_step": 123809, "epoch": 2947} {"train_loss": -6.5713210105896, "global_step": 123810, "epoch": 2947} {"train_loss": -6.571330547332764, "global_step": 123811, "epoch": 2947} {"train_loss": -6.5479736328125, "global_step": 123812, "epoch": 2947} {"train_loss": -6.491868019104004, "global_step": 123813, "epoch": 2947} {"train_loss": -6.52057409286499, "global_step": 123814, "epoch": 2947} {"train_loss": -6.589577016376314, "global_step": 123815, "epoch": 2947, "val_loss": 77309.515625} {"train_loss": -6.530512809753418, "global_step": 123816, "epoch": 2948} {"train_loss": -6.637904167175293, "global_step": 123817, "epoch": 2948} {"train_loss": -6.512060165405273, "global_step": 123818, "epoch": 2948} {"train_loss": -6.650151252746582, "global_step": 123819, "epoch": 2948} {"train_loss": -6.593212127685547, "global_step": 123820, "epoch": 2948} {"train_loss": -6.624997138977051, "global_step": 123821, "epoch": 2948} {"train_loss": -6.653329849243164, "global_step": 123822, "epoch": 2948} {"train_loss": -6.546019077301025, "global_step": 123823, "epoch": 2948} {"train_loss": -6.535095691680908, "global_step": 123824, "epoch": 2948} {"train_loss": -6.610912799835205, "global_step": 123825, "epoch": 2948} {"train_loss": -6.575535297393799, "global_step": 123826, "epoch": 2948} {"train_loss": -6.573470115661621, "global_step": 123827, "epoch": 2948} {"train_loss": -6.62893533706665, "global_step": 123828, "epoch": 2948} {"train_loss": -6.624051570892334, "global_step": 123829, "epoch": 2948} {"train_loss": -6.48803186416626, "global_step": 123830, "epoch": 2948} {"train_loss": -6.61599063873291, "global_step": 123831, "epoch": 2948} {"train_loss": -6.627366065979004, "global_step": 123832, "epoch": 2948} {"train_loss": -6.4902143478393555, "global_step": 123833, "epoch": 2948} {"train_loss": -6.570887088775635, "global_step": 123834, "epoch": 2948} {"train_loss": -6.570340156555176, "global_step": 123835, "epoch": 2948} {"train_loss": -6.691812515258789, "global_step": 123836, "epoch": 2948} {"train_loss": -6.496733665466309, "global_step": 123837, "epoch": 2948} {"train_loss": -6.635320663452148, "global_step": 123838, "epoch": 2948} {"train_loss": -6.706431865692139, "global_step": 123839, "epoch": 2948} {"train_loss": -6.603392124176025, "global_step": 123840, "epoch": 2948} {"train_loss": -6.569069862365723, "global_step": 123841, "epoch": 2948} {"train_loss": -6.613334655761719, "global_step": 123842, "epoch": 2948} {"train_loss": -6.649053573608398, "global_step": 123843, "epoch": 2948} {"train_loss": -6.578449726104736, "global_step": 123844, "epoch": 2948} {"train_loss": -6.491203308105469, "global_step": 123845, "epoch": 2948} {"train_loss": -6.600958824157715, "global_step": 123846, "epoch": 2948} {"train_loss": -6.504546165466309, "global_step": 123847, "epoch": 2948} {"train_loss": -6.563108921051025, "global_step": 123848, "epoch": 2948} {"train_loss": -6.629692077636719, "global_step": 123849, "epoch": 2948} {"train_loss": -6.637569427490234, "global_step": 123850, "epoch": 2948} {"train_loss": -6.554985046386719, "global_step": 123851, "epoch": 2948} {"train_loss": -6.658946990966797, "global_step": 123852, "epoch": 2948} {"train_loss": -6.494515895843506, "global_step": 123853, "epoch": 2948} {"train_loss": -6.689908504486084, "global_step": 123854, "epoch": 2948} {"train_loss": -6.6036858558654785, "global_step": 123855, "epoch": 2948} {"train_loss": -6.660177230834961, "global_step": 123856, "epoch": 2948} {"train_loss": -6.593302772158668, "global_step": 123857, "epoch": 2948, "val_loss": 77071.2265625} {"train_loss": -6.593930244445801, "global_step": 123858, "epoch": 2949} {"train_loss": -6.57047700881958, "global_step": 123859, "epoch": 2949} {"train_loss": -6.69173526763916, "global_step": 123860, "epoch": 2949} {"train_loss": -6.54404354095459, "global_step": 123861, "epoch": 2949} {"train_loss": -6.713740348815918, "global_step": 123862, "epoch": 2949} {"train_loss": -6.645288944244385, "global_step": 123863, "epoch": 2949} {"train_loss": -6.496851444244385, "global_step": 123864, "epoch": 2949} {"train_loss": -6.574616432189941, "global_step": 123865, "epoch": 2949} {"train_loss": -6.517855644226074, "global_step": 123866, "epoch": 2949} {"train_loss": -6.68143367767334, "global_step": 123867, "epoch": 2949} {"train_loss": -6.5651535987854, "global_step": 123868, "epoch": 2949} {"train_loss": -6.584112167358398, "global_step": 123869, "epoch": 2949} {"train_loss": -6.735687255859375, "global_step": 123870, "epoch": 2949} {"train_loss": -6.633976936340332, "global_step": 123871, "epoch": 2949} {"train_loss": -6.532613754272461, "global_step": 123872, "epoch": 2949} {"train_loss": -6.635430335998535, "global_step": 123873, "epoch": 2949} {"train_loss": -6.632509231567383, "global_step": 123874, "epoch": 2949} {"train_loss": -6.703335762023926, "global_step": 123875, "epoch": 2949} {"train_loss": -6.686526298522949, "global_step": 123876, "epoch": 2949} {"train_loss": -6.475994110107422, "global_step": 123877, "epoch": 2949} {"train_loss": -6.71973991394043, "global_step": 123878, "epoch": 2949} {"train_loss": -6.659711837768555, "global_step": 123879, "epoch": 2949} {"train_loss": -6.6713080406188965, "global_step": 123880, "epoch": 2949} {"train_loss": -6.549432754516602, "global_step": 123881, "epoch": 2949} {"train_loss": -6.607739448547363, "global_step": 123882, "epoch": 2949} {"train_loss": -6.6764960289001465, "global_step": 123883, "epoch": 2949} {"train_loss": -6.6422624588012695, "global_step": 123884, "epoch": 2949} {"train_loss": -6.698235511779785, "global_step": 123885, "epoch": 2949} {"train_loss": -6.629209995269775, "global_step": 123886, "epoch": 2949} {"train_loss": -6.6616058349609375, "global_step": 123887, "epoch": 2949} {"train_loss": -6.610567092895508, "global_step": 123888, "epoch": 2949} {"train_loss": -6.595993995666504, "global_step": 123889, "epoch": 2949} {"train_loss": -6.614142417907715, "global_step": 123890, "epoch": 2949} {"train_loss": -6.617325782775879, "global_step": 123891, "epoch": 2949} {"train_loss": -6.602924823760986, "global_step": 123892, "epoch": 2949} {"train_loss": -6.5495524406433105, "global_step": 123893, "epoch": 2949} {"train_loss": -6.677335739135742, "global_step": 123894, "epoch": 2949} {"train_loss": -6.647839546203613, "global_step": 123895, "epoch": 2949} {"train_loss": -6.622030258178711, "global_step": 123896, "epoch": 2949} {"train_loss": -6.701015472412109, "global_step": 123897, "epoch": 2949} {"train_loss": -6.750520706176758, "global_step": 123898, "epoch": 2949} {"train_loss": -6.62874834878104, "global_step": 123899, "epoch": 2949, "val_loss": 77026.0078125} {"train_loss": -6.683349609375, "global_step": 123900, "epoch": 2950} {"train_loss": -6.470290660858154, "global_step": 123901, "epoch": 2950} {"train_loss": -6.493194103240967, "global_step": 123902, "epoch": 2950} {"train_loss": -6.5771894454956055, "global_step": 123903, "epoch": 2950} {"train_loss": -6.7270050048828125, "global_step": 123904, "epoch": 2950} {"train_loss": -6.621086120605469, "global_step": 123905, "epoch": 2950} {"train_loss": -6.4302263259887695, "global_step": 123906, "epoch": 2950} {"train_loss": -6.588840961456299, "global_step": 123907, "epoch": 2950} {"train_loss": -6.463996410369873, "global_step": 123908, "epoch": 2950} {"train_loss": -6.536760330200195, "global_step": 123909, "epoch": 2950} {"train_loss": -6.565893650054932, "global_step": 123910, "epoch": 2950} {"train_loss": -6.554812431335449, "global_step": 123911, "epoch": 2950} {"train_loss": -6.591556072235107, "global_step": 123912, "epoch": 2950} {"train_loss": -6.565255641937256, "global_step": 123913, "epoch": 2950} {"train_loss": -6.585369110107422, "global_step": 123914, "epoch": 2950} {"train_loss": -6.5340681076049805, "global_step": 123915, "epoch": 2950} {"train_loss": -6.688570976257324, "global_step": 123916, "epoch": 2950} {"train_loss": -6.5906476974487305, "global_step": 123917, "epoch": 2950} {"train_loss": -6.573613166809082, "global_step": 123918, "epoch": 2950} {"train_loss": -6.445351600646973, "global_step": 123919, "epoch": 2950} {"train_loss": -6.464935779571533, "global_step": 123920, "epoch": 2950} {"train_loss": -6.587737560272217, "global_step": 123921, "epoch": 2950} {"train_loss": -6.405076026916504, "global_step": 123922, "epoch": 2950} {"train_loss": -6.623072147369385, "global_step": 123923, "epoch": 2950} {"train_loss": -6.578981399536133, "global_step": 123924, "epoch": 2950} {"train_loss": -6.6247663497924805, "global_step": 123925, "epoch": 2950} {"train_loss": -6.5014753341674805, "global_step": 123926, "epoch": 2950} {"train_loss": -6.685807228088379, "global_step": 123927, "epoch": 2950} {"train_loss": -6.630346775054932, "global_step": 123928, "epoch": 2950} {"train_loss": -6.589864253997803, "global_step": 123929, "epoch": 2950} {"train_loss": -6.623444080352783, "global_step": 123930, "epoch": 2950} {"train_loss": -6.625674247741699, "global_step": 123931, "epoch": 2950} {"train_loss": -6.624551773071289, "global_step": 123932, "epoch": 2950} {"train_loss": -6.604079246520996, "global_step": 123933, "epoch": 2950} {"train_loss": -6.63870906829834, "global_step": 123934, "epoch": 2950} {"train_loss": -6.5976972579956055, "global_step": 123935, "epoch": 2950} {"train_loss": -6.543910980224609, "global_step": 123936, "epoch": 2950} {"train_loss": -6.729487419128418, "global_step": 123937, "epoch": 2950} {"train_loss": -6.590600490570068, "global_step": 123938, "epoch": 2950} {"train_loss": -6.734658241271973, "global_step": 123939, "epoch": 2950} {"train_loss": -6.731273651123047, "global_step": 123940, "epoch": 2950} {"train_loss": -6.584254650842576, "global_step": 123941, "epoch": 2950, "train/sim_max_reward_0": 0.7785560689894128, "train/sim_max_reward_1": 0.9167683664020123, "train/sim_max_reward_2": 0.43106360632545176, "train/sim_max_reward_3": 0.13948167549748303, "train/sim_max_reward_4": 0.8874673735291095, "train/sim_max_reward_5": 0.5721060043170969, "test/sim_max_reward_4500000": 0.9414124998986048, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9224227592164131, "test/sim_max_reward_4500003": 0.9479067452021797, "test/sim_max_reward_4500004": 0.16214874049472575, "test/sim_max_reward_4500005": 0.2799202342026372, "test/sim_max_reward_4500006": 0.9801757951736606, "test/sim_max_reward_4500007": 0.8906539980806747, "test/sim_max_reward_4500008": 0.29212063931613863, "test/sim_max_reward_4500009": 0.05356442499758577, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9555807820706836, "test/sim_max_reward_4500012": 0.9003756718872246, "test/sim_max_reward_4500013": 0.00543759360599768, "test/sim_max_reward_4500014": 0.9035128292496244, "test/sim_max_reward_4500015": 0.9885260724060266, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.03712903168658522, "test/sim_max_reward_4500018": 0.9611952643881978, "test/sim_max_reward_4500019": 0.6216376874830379, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.6849047516135064, "test/sim_max_reward_4500022": 0.6245329434464079, "test/sim_max_reward_4500023": 0.5640070447746127, "test/sim_max_reward_4500024": 0.8903172003470177, "test/sim_max_reward_4500025": 0.9751838066205598, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.9315979073102865, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.07480770121156614, "test/sim_max_reward_4500030": 0.9318898187524615, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.046550462860182946, "test/sim_max_reward_4500033": 0.29711038437422616, "test/sim_max_reward_4500034": 0.8800314340102129, "test/sim_max_reward_4500035": 0.6457844662353361, "test/sim_max_reward_4500036": 0.6634144347826514, "test/sim_max_reward_4500037": 0.9757567671191527, "test/sim_max_reward_4500038": 0.9870620875572453, "test/sim_max_reward_4500039": 0.8338537237200875, "test/sim_max_reward_4500040": 0.8753869612940615, "test/sim_max_reward_4500041": 0.37537891276015667, "test/sim_max_reward_4500042": 0.025262400811206114, "test/sim_max_reward_4500043": 0.30585424906750686, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.3903497283019801, "test/sim_max_reward_4500046": 0.18410965754353437, "test/sim_max_reward_4500047": 0.9948329358887052, "test/sim_max_reward_4500048": 0.9951537158083775, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6209071825100944, "test/mean_score": 0.5245003106304478, "val_loss": 77200.6796875} {"train_loss": -6.608226776123047, "global_step": 123942, "epoch": 2951} {"train_loss": -6.599414825439453, "global_step": 123943, "epoch": 2951} {"train_loss": -6.61846923828125, "global_step": 123944, "epoch": 2951} {"train_loss": -6.642552852630615, "global_step": 123945, "epoch": 2951} {"train_loss": -6.447965621948242, "global_step": 123946, "epoch": 2951} {"train_loss": -6.572443008422852, "global_step": 123947, "epoch": 2951} {"train_loss": -6.588260650634766, "global_step": 123948, "epoch": 2951} {"train_loss": -6.662008285522461, "global_step": 123949, "epoch": 2951} {"train_loss": -6.577414512634277, "global_step": 123950, "epoch": 2951} {"train_loss": -6.7456746101379395, "global_step": 123951, "epoch": 2951} {"train_loss": -6.675484657287598, "global_step": 123952, "epoch": 2951} {"train_loss": -6.607508659362793, "global_step": 123953, "epoch": 2951} {"train_loss": -6.680319309234619, "global_step": 123954, "epoch": 2951} {"train_loss": -6.64385986328125, "global_step": 123955, "epoch": 2951} {"train_loss": -6.630270957946777, "global_step": 123956, "epoch": 2951} {"train_loss": -6.5671706199646, "global_step": 123957, "epoch": 2951} {"train_loss": -6.611665725708008, "global_step": 123958, "epoch": 2951} {"train_loss": -6.611915588378906, "global_step": 123959, "epoch": 2951} {"train_loss": -6.486227989196777, "global_step": 123960, "epoch": 2951} {"train_loss": -6.644804000854492, "global_step": 123961, "epoch": 2951} {"train_loss": -6.699579238891602, "global_step": 123962, "epoch": 2951} {"train_loss": -6.652709484100342, "global_step": 123963, "epoch": 2951} {"train_loss": -6.708470344543457, "global_step": 123964, "epoch": 2951} {"train_loss": -6.699849605560303, "global_step": 123965, "epoch": 2951} {"train_loss": -6.731762886047363, "global_step": 123966, "epoch": 2951} {"train_loss": -6.603743553161621, "global_step": 123967, "epoch": 2951} {"train_loss": -6.724688529968262, "global_step": 123968, "epoch": 2951} {"train_loss": -6.6346049308776855, "global_step": 123969, "epoch": 2951} {"train_loss": -6.614431381225586, "global_step": 123970, "epoch": 2951} {"train_loss": -6.62075138092041, "global_step": 123971, "epoch": 2951} {"train_loss": -6.628699779510498, "global_step": 123972, "epoch": 2951} {"train_loss": -6.663003921508789, "global_step": 123973, "epoch": 2951} {"train_loss": -6.708331108093262, "global_step": 123974, "epoch": 2951} {"train_loss": -6.627997398376465, "global_step": 123975, "epoch": 2951} {"train_loss": -6.513728141784668, "global_step": 123976, "epoch": 2951} {"train_loss": -6.615917205810547, "global_step": 123977, "epoch": 2951} {"train_loss": -6.66692590713501, "global_step": 123978, "epoch": 2951} {"train_loss": -6.578322887420654, "global_step": 123979, "epoch": 2951} {"train_loss": -6.639011859893799, "global_step": 123980, "epoch": 2951} {"train_loss": -6.533712863922119, "global_step": 123981, "epoch": 2951} {"train_loss": -6.686357021331787, "global_step": 123982, "epoch": 2951} {"train_loss": -6.62663409823463, "global_step": 123983, "epoch": 2951, "val_loss": 76977.1484375} {"train_loss": -6.558343887329102, "global_step": 123984, "epoch": 2952} {"train_loss": -6.681936264038086, "global_step": 123985, "epoch": 2952} {"train_loss": -6.553955078125, "global_step": 123986, "epoch": 2952} {"train_loss": -6.566779136657715, "global_step": 123987, "epoch": 2952} {"train_loss": -6.591876029968262, "global_step": 123988, "epoch": 2952} {"train_loss": -6.49845027923584, "global_step": 123989, "epoch": 2952} {"train_loss": -6.592368125915527, "global_step": 123990, "epoch": 2952} {"train_loss": -6.57884407043457, "global_step": 123991, "epoch": 2952} {"train_loss": -6.4879255294799805, "global_step": 123992, "epoch": 2952} {"train_loss": -6.488626003265381, "global_step": 123993, "epoch": 2952} {"train_loss": -6.5413923263549805, "global_step": 123994, "epoch": 2952} {"train_loss": -6.5007710456848145, "global_step": 123995, "epoch": 2952} {"train_loss": -6.577251434326172, "global_step": 123996, "epoch": 2952} {"train_loss": -6.550540924072266, "global_step": 123997, "epoch": 2952} {"train_loss": -6.474673271179199, "global_step": 123998, "epoch": 2952} {"train_loss": -6.621244430541992, "global_step": 123999, "epoch": 2952} {"train_loss": -6.449434280395508, "global_step": 124000, "epoch": 2952} {"train_loss": -6.472611427307129, "global_step": 124001, "epoch": 2952} {"train_loss": -6.686456680297852, "global_step": 124002, "epoch": 2952} {"train_loss": -6.447951316833496, "global_step": 124003, "epoch": 2952} {"train_loss": -6.691875457763672, "global_step": 124004, "epoch": 2952} {"train_loss": -6.663823127746582, "global_step": 124005, "epoch": 2952} {"train_loss": -6.672821998596191, "global_step": 124006, "epoch": 2952} {"train_loss": -6.647990703582764, "global_step": 124007, "epoch": 2952} {"train_loss": -6.6063127517700195, "global_step": 124008, "epoch": 2952} {"train_loss": -6.611040115356445, "global_step": 124009, "epoch": 2952} {"train_loss": -6.5023040771484375, "global_step": 124010, "epoch": 2952} {"train_loss": -6.623456954956055, "global_step": 124011, "epoch": 2952} {"train_loss": -6.5655741691589355, "global_step": 124012, "epoch": 2952} {"train_loss": -6.554894924163818, "global_step": 124013, "epoch": 2952} {"train_loss": -6.528534889221191, "global_step": 124014, "epoch": 2952} {"train_loss": -6.508860111236572, "global_step": 124015, "epoch": 2952} {"train_loss": -6.623945236206055, "global_step": 124016, "epoch": 2952} {"train_loss": -6.599854469299316, "global_step": 124017, "epoch": 2952} {"train_loss": -6.573617935180664, "global_step": 124018, "epoch": 2952} {"train_loss": -6.575765132904053, "global_step": 124019, "epoch": 2952} {"train_loss": -6.639915466308594, "global_step": 124020, "epoch": 2952} {"train_loss": -6.587357521057129, "global_step": 124021, "epoch": 2952} {"train_loss": -6.594564437866211, "global_step": 124022, "epoch": 2952} {"train_loss": -6.617144584655762, "global_step": 124023, "epoch": 2952} {"train_loss": -6.550009727478027, "global_step": 124024, "epoch": 2952} {"train_loss": -6.571791989462716, "global_step": 124025, "epoch": 2952, "val_loss": 77164.0859375} {"train_loss": -6.47178840637207, "global_step": 124026, "epoch": 2953} {"train_loss": -6.533036231994629, "global_step": 124027, "epoch": 2953} {"train_loss": -6.576419830322266, "global_step": 124028, "epoch": 2953} {"train_loss": -6.571491241455078, "global_step": 124029, "epoch": 2953} {"train_loss": -6.563313961029053, "global_step": 124030, "epoch": 2953} {"train_loss": -6.635445594787598, "global_step": 124031, "epoch": 2953} {"train_loss": -6.550859451293945, "global_step": 124032, "epoch": 2953} {"train_loss": -6.558452606201172, "global_step": 124033, "epoch": 2953} {"train_loss": -6.536820411682129, "global_step": 124034, "epoch": 2953} {"train_loss": -6.459555625915527, "global_step": 124035, "epoch": 2953} {"train_loss": -6.489713668823242, "global_step": 124036, "epoch": 2953} {"train_loss": -6.582036972045898, "global_step": 124037, "epoch": 2953} {"train_loss": -6.495018005371094, "global_step": 124038, "epoch": 2953} {"train_loss": -6.633556365966797, "global_step": 124039, "epoch": 2953} {"train_loss": -6.663482189178467, "global_step": 124040, "epoch": 2953} {"train_loss": -6.610435485839844, "global_step": 124041, "epoch": 2953} {"train_loss": -6.551207065582275, "global_step": 124042, "epoch": 2953} {"train_loss": -6.635802268981934, "global_step": 124043, "epoch": 2953} {"train_loss": -6.700554847717285, "global_step": 124044, "epoch": 2953} {"train_loss": -6.498322486877441, "global_step": 124045, "epoch": 2953} {"train_loss": -6.567898750305176, "global_step": 124046, "epoch": 2953} {"train_loss": -6.582530975341797, "global_step": 124047, "epoch": 2953} {"train_loss": -6.608368873596191, "global_step": 124048, "epoch": 2953} {"train_loss": -6.644715785980225, "global_step": 124049, "epoch": 2953} {"train_loss": -6.627774238586426, "global_step": 124050, "epoch": 2953} {"train_loss": -6.552455902099609, "global_step": 124051, "epoch": 2953} {"train_loss": -6.502943515777588, "global_step": 124052, "epoch": 2953} {"train_loss": -6.622408390045166, "global_step": 124053, "epoch": 2953} {"train_loss": -6.529945373535156, "global_step": 124054, "epoch": 2953} {"train_loss": -6.640298843383789, "global_step": 124055, "epoch": 2953} {"train_loss": -6.513211250305176, "global_step": 124056, "epoch": 2953} {"train_loss": -6.516173839569092, "global_step": 124057, "epoch": 2953} {"train_loss": -6.579510688781738, "global_step": 124058, "epoch": 2953} {"train_loss": -6.54978084564209, "global_step": 124059, "epoch": 2953} {"train_loss": -6.5170416831970215, "global_step": 124060, "epoch": 2953} {"train_loss": -6.606461524963379, "global_step": 124061, "epoch": 2953} {"train_loss": -6.619997501373291, "global_step": 124062, "epoch": 2953} {"train_loss": -6.583009719848633, "global_step": 124063, "epoch": 2953} {"train_loss": -6.695540428161621, "global_step": 124064, "epoch": 2953} {"train_loss": -6.611247539520264, "global_step": 124065, "epoch": 2953} {"train_loss": -6.602650165557861, "global_step": 124066, "epoch": 2953} {"train_loss": -6.5752604348318915, "global_step": 124067, "epoch": 2953, "val_loss": 76955.8515625} {"train_loss": -6.5303449630737305, "global_step": 124068, "epoch": 2954} {"train_loss": -6.577750205993652, "global_step": 124069, "epoch": 2954} {"train_loss": -6.575206756591797, "global_step": 124070, "epoch": 2954} {"train_loss": -6.539814472198486, "global_step": 124071, "epoch": 2954} {"train_loss": -6.635171890258789, "global_step": 124072, "epoch": 2954} {"train_loss": -6.668212890625, "global_step": 124073, "epoch": 2954} {"train_loss": -6.654260158538818, "global_step": 124074, "epoch": 2954} {"train_loss": -6.583270072937012, "global_step": 124075, "epoch": 2954} {"train_loss": -6.68784236907959, "global_step": 124076, "epoch": 2954} {"train_loss": -6.605449199676514, "global_step": 124077, "epoch": 2954} {"train_loss": -6.546262264251709, "global_step": 124078, "epoch": 2954} {"train_loss": -6.590587615966797, "global_step": 124079, "epoch": 2954} {"train_loss": -6.565324783325195, "global_step": 124080, "epoch": 2954} {"train_loss": -6.653312683105469, "global_step": 124081, "epoch": 2954} {"train_loss": -6.608275413513184, "global_step": 124082, "epoch": 2954} {"train_loss": -6.598138332366943, "global_step": 124083, "epoch": 2954} {"train_loss": -6.742733955383301, "global_step": 124084, "epoch": 2954} {"train_loss": -6.519040107727051, "global_step": 124085, "epoch": 2954} {"train_loss": -6.5740275382995605, "global_step": 124086, "epoch": 2954} {"train_loss": -6.644360065460205, "global_step": 124087, "epoch": 2954} {"train_loss": -6.659860610961914, "global_step": 124088, "epoch": 2954} {"train_loss": -6.693253517150879, "global_step": 124089, "epoch": 2954} {"train_loss": -6.503737449645996, "global_step": 124090, "epoch": 2954} {"train_loss": -6.542928218841553, "global_step": 124091, "epoch": 2954} {"train_loss": -6.6338701248168945, "global_step": 124092, "epoch": 2954} {"train_loss": -6.576884746551514, "global_step": 124093, "epoch": 2954} {"train_loss": -6.641454696655273, "global_step": 124094, "epoch": 2954} {"train_loss": -6.60078763961792, "global_step": 124095, "epoch": 2954} {"train_loss": -6.586933135986328, "global_step": 124096, "epoch": 2954} {"train_loss": -6.512087821960449, "global_step": 124097, "epoch": 2954} {"train_loss": -6.513871192932129, "global_step": 124098, "epoch": 2954} {"train_loss": -6.639463424682617, "global_step": 124099, "epoch": 2954} {"train_loss": -6.656264305114746, "global_step": 124100, "epoch": 2954} {"train_loss": -6.485418796539307, "global_step": 124101, "epoch": 2954} {"train_loss": -6.511529922485352, "global_step": 124102, "epoch": 2954} {"train_loss": -6.656112194061279, "global_step": 124103, "epoch": 2954} {"train_loss": -6.642889022827148, "global_step": 124104, "epoch": 2954} {"train_loss": -6.621044158935547, "global_step": 124105, "epoch": 2954} {"train_loss": -6.528812885284424, "global_step": 124106, "epoch": 2954} {"train_loss": -6.605473041534424, "global_step": 124107, "epoch": 2954} {"train_loss": -6.603286266326904, "global_step": 124108, "epoch": 2954} {"train_loss": -6.598233359200614, "global_step": 124109, "epoch": 2954, "val_loss": 77068.9375} {"train_loss": -6.613158226013184, "global_step": 124110, "epoch": 2955} {"train_loss": -6.644182205200195, "global_step": 124111, "epoch": 2955} {"train_loss": -6.475744247436523, "global_step": 124112, "epoch": 2955} {"train_loss": -6.5521650314331055, "global_step": 124113, "epoch": 2955} {"train_loss": -6.562466621398926, "global_step": 124114, "epoch": 2955} {"train_loss": -6.6083292961120605, "global_step": 124115, "epoch": 2955} {"train_loss": -6.711247444152832, "global_step": 124116, "epoch": 2955} {"train_loss": -6.589588165283203, "global_step": 124117, "epoch": 2955} {"train_loss": -6.598758697509766, "global_step": 124118, "epoch": 2955} {"train_loss": -6.5746002197265625, "global_step": 124119, "epoch": 2955} {"train_loss": -6.6945953369140625, "global_step": 124120, "epoch": 2955} {"train_loss": -6.706364631652832, "global_step": 124121, "epoch": 2955} {"train_loss": -6.679991722106934, "global_step": 124122, "epoch": 2955} {"train_loss": -6.636731147766113, "global_step": 124123, "epoch": 2955} {"train_loss": -6.658638000488281, "global_step": 124124, "epoch": 2955} {"train_loss": -6.574972152709961, "global_step": 124125, "epoch": 2955} {"train_loss": -6.619175910949707, "global_step": 124126, "epoch": 2955} {"train_loss": -6.663984298706055, "global_step": 124127, "epoch": 2955} {"train_loss": -6.709653854370117, "global_step": 124128, "epoch": 2955} {"train_loss": -6.591794967651367, "global_step": 124129, "epoch": 2955} {"train_loss": -6.66534423828125, "global_step": 124130, "epoch": 2955} {"train_loss": -6.668826103210449, "global_step": 124131, "epoch": 2955} {"train_loss": -6.692016124725342, "global_step": 124132, "epoch": 2955} {"train_loss": -6.681367874145508, "global_step": 124133, "epoch": 2955} {"train_loss": -6.6731672286987305, "global_step": 124134, "epoch": 2955} {"train_loss": -6.593559265136719, "global_step": 124135, "epoch": 2955} {"train_loss": -6.7861504554748535, "global_step": 124136, "epoch": 2955} {"train_loss": -6.598048210144043, "global_step": 124137, "epoch": 2955} {"train_loss": -6.692291259765625, "global_step": 124138, "epoch": 2955} {"train_loss": -6.598570346832275, "global_step": 124139, "epoch": 2955} {"train_loss": -6.591843128204346, "global_step": 124140, "epoch": 2955} {"train_loss": -6.742391586303711, "global_step": 124141, "epoch": 2955} {"train_loss": -6.67326545715332, "global_step": 124142, "epoch": 2955} {"train_loss": -6.740574836730957, "global_step": 124143, "epoch": 2955} {"train_loss": -6.662324905395508, "global_step": 124144, "epoch": 2955} {"train_loss": -6.6510910987854, "global_step": 124145, "epoch": 2955} {"train_loss": -6.604212760925293, "global_step": 124146, "epoch": 2955} {"train_loss": -6.608329772949219, "global_step": 124147, "epoch": 2955} {"train_loss": -6.682985305786133, "global_step": 124148, "epoch": 2955} {"train_loss": -6.529340744018555, "global_step": 124149, "epoch": 2955} {"train_loss": -6.546184539794922, "global_step": 124150, "epoch": 2955} {"train_loss": -6.6380187556857155, "global_step": 124151, "epoch": 2955, "val_loss": 76996.96875} {"train_loss": -6.605167865753174, "global_step": 124152, "epoch": 2956} {"train_loss": -6.4928741455078125, "global_step": 124153, "epoch": 2956} {"train_loss": -6.519928932189941, "global_step": 124154, "epoch": 2956} {"train_loss": -6.623223304748535, "global_step": 124155, "epoch": 2956} {"train_loss": -6.7043280601501465, "global_step": 124156, "epoch": 2956} {"train_loss": -6.637170791625977, "global_step": 124157, "epoch": 2956} {"train_loss": -6.5333991050720215, "global_step": 124158, "epoch": 2956} {"train_loss": -6.631059646606445, "global_step": 124159, "epoch": 2956} {"train_loss": -6.6301422119140625, "global_step": 124160, "epoch": 2956} {"train_loss": -6.686028480529785, "global_step": 124161, "epoch": 2956} {"train_loss": -6.57331657409668, "global_step": 124162, "epoch": 2956} {"train_loss": -6.625136375427246, "global_step": 124163, "epoch": 2956} {"train_loss": -6.59486198425293, "global_step": 124164, "epoch": 2956} {"train_loss": -6.5365519523620605, "global_step": 124165, "epoch": 2956} {"train_loss": -6.60816764831543, "global_step": 124166, "epoch": 2956} {"train_loss": -6.720940113067627, "global_step": 124167, "epoch": 2956} {"train_loss": -6.612032890319824, "global_step": 124168, "epoch": 2956} {"train_loss": -6.664095401763916, "global_step": 124169, "epoch": 2956} {"train_loss": -6.610509872436523, "global_step": 124170, "epoch": 2956} {"train_loss": -6.686005592346191, "global_step": 124171, "epoch": 2956} {"train_loss": -6.633230209350586, "global_step": 124172, "epoch": 2956} {"train_loss": -6.599649906158447, "global_step": 124173, "epoch": 2956} {"train_loss": -6.699113368988037, "global_step": 124174, "epoch": 2956} {"train_loss": -6.693727016448975, "global_step": 124175, "epoch": 2956} {"train_loss": -6.690948486328125, "global_step": 124176, "epoch": 2956} {"train_loss": -6.6780290603637695, "global_step": 124177, "epoch": 2956} {"train_loss": -6.7024102210998535, "global_step": 124178, "epoch": 2956} {"train_loss": -6.619941711425781, "global_step": 124179, "epoch": 2956} {"train_loss": -6.609279632568359, "global_step": 124180, "epoch": 2956} {"train_loss": -6.599033355712891, "global_step": 124181, "epoch": 2956} {"train_loss": -6.632992744445801, "global_step": 124182, "epoch": 2956} {"train_loss": -6.594288349151611, "global_step": 124183, "epoch": 2956} {"train_loss": -6.73564338684082, "global_step": 124184, "epoch": 2956} {"train_loss": -6.5865044593811035, "global_step": 124185, "epoch": 2956} {"train_loss": -6.605988502502441, "global_step": 124186, "epoch": 2956} {"train_loss": -6.723959445953369, "global_step": 124187, "epoch": 2956} {"train_loss": -6.608607292175293, "global_step": 124188, "epoch": 2956} {"train_loss": -6.705259323120117, "global_step": 124189, "epoch": 2956} {"train_loss": -6.562257766723633, "global_step": 124190, "epoch": 2956} {"train_loss": -6.605301856994629, "global_step": 124191, "epoch": 2956} {"train_loss": -6.692694664001465, "global_step": 124192, "epoch": 2956} {"train_loss": -6.632653690519787, "global_step": 124193, "epoch": 2956, "val_loss": 77306.4375} {"train_loss": -6.691822528839111, "global_step": 124194, "epoch": 2957} {"train_loss": -6.676876068115234, "global_step": 124195, "epoch": 2957} {"train_loss": -6.652792930603027, "global_step": 124196, "epoch": 2957} {"train_loss": -6.715720176696777, "global_step": 124197, "epoch": 2957} {"train_loss": -6.643178939819336, "global_step": 124198, "epoch": 2957} {"train_loss": -6.682380199432373, "global_step": 124199, "epoch": 2957} {"train_loss": -6.623247146606445, "global_step": 124200, "epoch": 2957} {"train_loss": -6.483112335205078, "global_step": 124201, "epoch": 2957} {"train_loss": -6.632189750671387, "global_step": 124202, "epoch": 2957} {"train_loss": -6.607421398162842, "global_step": 124203, "epoch": 2957} {"train_loss": -6.655109405517578, "global_step": 124204, "epoch": 2957} {"train_loss": -6.6926469802856445, "global_step": 124205, "epoch": 2957} {"train_loss": -6.615246772766113, "global_step": 124206, "epoch": 2957} {"train_loss": -6.726696968078613, "global_step": 124207, "epoch": 2957} {"train_loss": -6.5273637771606445, "global_step": 124208, "epoch": 2957} {"train_loss": -6.6305365562438965, "global_step": 124209, "epoch": 2957} {"train_loss": -6.61855411529541, "global_step": 124210, "epoch": 2957} {"train_loss": -6.660811424255371, "global_step": 124211, "epoch": 2957} {"train_loss": -6.572058200836182, "global_step": 124212, "epoch": 2957} {"train_loss": -6.627055644989014, "global_step": 124213, "epoch": 2957} {"train_loss": -6.563137054443359, "global_step": 124214, "epoch": 2957} {"train_loss": -6.494053363800049, "global_step": 124215, "epoch": 2957} {"train_loss": -6.639430999755859, "global_step": 124216, "epoch": 2957} {"train_loss": -6.549997806549072, "global_step": 124217, "epoch": 2957} {"train_loss": -6.4705071449279785, "global_step": 124218, "epoch": 2957} {"train_loss": -6.585231304168701, "global_step": 124219, "epoch": 2957} {"train_loss": -6.437520980834961, "global_step": 124220, "epoch": 2957} {"train_loss": -6.503803730010986, "global_step": 124221, "epoch": 2957} {"train_loss": -6.484321117401123, "global_step": 124222, "epoch": 2957} {"train_loss": -6.444340705871582, "global_step": 124223, "epoch": 2957} {"train_loss": -6.600518226623535, "global_step": 124224, "epoch": 2957} {"train_loss": -6.472153186798096, "global_step": 124225, "epoch": 2957} {"train_loss": -6.592959403991699, "global_step": 124226, "epoch": 2957} {"train_loss": -6.50982141494751, "global_step": 124227, "epoch": 2957} {"train_loss": -6.542235374450684, "global_step": 124228, "epoch": 2957} {"train_loss": -6.4202880859375, "global_step": 124229, "epoch": 2957} {"train_loss": -6.377742290496826, "global_step": 124230, "epoch": 2957} {"train_loss": -6.511429309844971, "global_step": 124231, "epoch": 2957} {"train_loss": -6.428945541381836, "global_step": 124232, "epoch": 2957} {"train_loss": -6.52836799621582, "global_step": 124233, "epoch": 2957} {"train_loss": -6.565627574920654, "global_step": 124234, "epoch": 2957} {"train_loss": -6.571209260395595, "global_step": 124235, "epoch": 2957, "val_loss": 77197.28125} {"train_loss": -6.527110576629639, "global_step": 124236, "epoch": 2958} {"train_loss": -6.619755744934082, "global_step": 124237, "epoch": 2958} {"train_loss": -6.56851863861084, "global_step": 124238, "epoch": 2958} {"train_loss": -6.5271172523498535, "global_step": 124239, "epoch": 2958} {"train_loss": -6.660833358764648, "global_step": 124240, "epoch": 2958} {"train_loss": -6.578624725341797, "global_step": 124241, "epoch": 2958} {"train_loss": -6.555309295654297, "global_step": 124242, "epoch": 2958} {"train_loss": -6.573457717895508, "global_step": 124243, "epoch": 2958} {"train_loss": -6.529829978942871, "global_step": 124244, "epoch": 2958} {"train_loss": -6.588149070739746, "global_step": 124245, "epoch": 2958} {"train_loss": -6.617210865020752, "global_step": 124246, "epoch": 2958} {"train_loss": -6.5906267166137695, "global_step": 124247, "epoch": 2958} {"train_loss": -6.626378536224365, "global_step": 124248, "epoch": 2958} {"train_loss": -6.688869476318359, "global_step": 124249, "epoch": 2958} {"train_loss": -6.629679203033447, "global_step": 124250, "epoch": 2958} {"train_loss": -6.664166450500488, "global_step": 124251, "epoch": 2958} {"train_loss": -6.657057762145996, "global_step": 124252, "epoch": 2958} {"train_loss": -6.588540077209473, "global_step": 124253, "epoch": 2958} {"train_loss": -6.648452281951904, "global_step": 124254, "epoch": 2958} {"train_loss": -6.640970230102539, "global_step": 124255, "epoch": 2958} {"train_loss": -6.4979705810546875, "global_step": 124256, "epoch": 2958} {"train_loss": -6.854708194732666, "global_step": 124257, "epoch": 2958} {"train_loss": -6.652359485626221, "global_step": 124258, "epoch": 2958} {"train_loss": -6.436851978302002, "global_step": 124259, "epoch": 2958} {"train_loss": -6.564464569091797, "global_step": 124260, "epoch": 2958} {"train_loss": -6.5640692710876465, "global_step": 124261, "epoch": 2958} {"train_loss": -6.39581823348999, "global_step": 124262, "epoch": 2958} {"train_loss": -6.478348731994629, "global_step": 124263, "epoch": 2958} {"train_loss": -6.59456729888916, "global_step": 124264, "epoch": 2958} {"train_loss": -6.448392868041992, "global_step": 124265, "epoch": 2958} {"train_loss": -6.445260524749756, "global_step": 124266, "epoch": 2958} {"train_loss": -6.467155456542969, "global_step": 124267, "epoch": 2958} {"train_loss": -6.59109354019165, "global_step": 124268, "epoch": 2958} {"train_loss": -6.576869010925293, "global_step": 124269, "epoch": 2958} {"train_loss": -6.583250045776367, "global_step": 124270, "epoch": 2958} {"train_loss": -6.437437057495117, "global_step": 124271, "epoch": 2958} {"train_loss": -6.485072135925293, "global_step": 124272, "epoch": 2958} {"train_loss": -6.642374038696289, "global_step": 124273, "epoch": 2958} {"train_loss": -6.528012275695801, "global_step": 124274, "epoch": 2958} {"train_loss": -6.522950172424316, "global_step": 124275, "epoch": 2958} {"train_loss": -6.406534194946289, "global_step": 124276, "epoch": 2958} {"train_loss": -6.56506515684582, "global_step": 124277, "epoch": 2958, "val_loss": 77424.234375} {"train_loss": -6.547466278076172, "global_step": 124278, "epoch": 2959} {"train_loss": -6.574536323547363, "global_step": 124279, "epoch": 2959} {"train_loss": -6.606993198394775, "global_step": 124280, "epoch": 2959} {"train_loss": -6.589627265930176, "global_step": 124281, "epoch": 2959} {"train_loss": -6.633572101593018, "global_step": 124282, "epoch": 2959} {"train_loss": -6.488692283630371, "global_step": 124283, "epoch": 2959} {"train_loss": -6.612924575805664, "global_step": 124284, "epoch": 2959} {"train_loss": -6.519888877868652, "global_step": 124285, "epoch": 2959} {"train_loss": -6.636594295501709, "global_step": 124286, "epoch": 2959} {"train_loss": -6.516404151916504, "global_step": 124287, "epoch": 2959} {"train_loss": -6.657773017883301, "global_step": 124288, "epoch": 2959} {"train_loss": -6.6047821044921875, "global_step": 124289, "epoch": 2959} {"train_loss": -6.784302711486816, "global_step": 124290, "epoch": 2959} {"train_loss": -6.614893913269043, "global_step": 124291, "epoch": 2959} {"train_loss": -6.607980728149414, "global_step": 124292, "epoch": 2959} {"train_loss": -6.610804557800293, "global_step": 124293, "epoch": 2959} {"train_loss": -6.574312210083008, "global_step": 124294, "epoch": 2959} {"train_loss": -6.657087326049805, "global_step": 124295, "epoch": 2959} {"train_loss": -6.632280349731445, "global_step": 124296, "epoch": 2959} {"train_loss": -6.5360822677612305, "global_step": 124297, "epoch": 2959} {"train_loss": -6.7191619873046875, "global_step": 124298, "epoch": 2959} {"train_loss": -6.505245208740234, "global_step": 124299, "epoch": 2959} {"train_loss": -6.693724632263184, "global_step": 124300, "epoch": 2959} {"train_loss": -6.58120059967041, "global_step": 124301, "epoch": 2959} {"train_loss": -6.4788336753845215, "global_step": 124302, "epoch": 2959} {"train_loss": -6.507504463195801, "global_step": 124303, "epoch": 2959} {"train_loss": -6.63500452041626, "global_step": 124304, "epoch": 2959} {"train_loss": -6.569769382476807, "global_step": 124305, "epoch": 2959} {"train_loss": -6.498685836791992, "global_step": 124306, "epoch": 2959} {"train_loss": -6.574810028076172, "global_step": 124307, "epoch": 2959} {"train_loss": -6.596737861633301, "global_step": 124308, "epoch": 2959} {"train_loss": -6.5805253982543945, "global_step": 124309, "epoch": 2959} {"train_loss": -6.5636067390441895, "global_step": 124310, "epoch": 2959} {"train_loss": -6.571926593780518, "global_step": 124311, "epoch": 2959} {"train_loss": -6.569550514221191, "global_step": 124312, "epoch": 2959} {"train_loss": -6.556730270385742, "global_step": 124313, "epoch": 2959} {"train_loss": -6.560938358306885, "global_step": 124314, "epoch": 2959} {"train_loss": -6.663460731506348, "global_step": 124315, "epoch": 2959} {"train_loss": -6.671701431274414, "global_step": 124316, "epoch": 2959} {"train_loss": -6.498006820678711, "global_step": 124317, "epoch": 2959} {"train_loss": -6.68215799331665, "global_step": 124318, "epoch": 2959} {"train_loss": -6.595244487126668, "global_step": 124319, "epoch": 2959, "val_loss": 77300.1640625} {"train_loss": -6.554802894592285, "global_step": 124320, "epoch": 2960} {"train_loss": -6.57456111907959, "global_step": 124321, "epoch": 2960} {"train_loss": -6.434292793273926, "global_step": 124322, "epoch": 2960} {"train_loss": -6.652082920074463, "global_step": 124323, "epoch": 2960} {"train_loss": -6.499135494232178, "global_step": 124324, "epoch": 2960} {"train_loss": -6.457090377807617, "global_step": 124325, "epoch": 2960} {"train_loss": -6.524116516113281, "global_step": 124326, "epoch": 2960} {"train_loss": -6.531754493713379, "global_step": 124327, "epoch": 2960} {"train_loss": -6.577476501464844, "global_step": 124328, "epoch": 2960} {"train_loss": -6.592385292053223, "global_step": 124329, "epoch": 2960} {"train_loss": -6.485928535461426, "global_step": 124330, "epoch": 2960} {"train_loss": -6.59370231628418, "global_step": 124331, "epoch": 2960} {"train_loss": -6.699840068817139, "global_step": 124332, "epoch": 2960} {"train_loss": -6.528768539428711, "global_step": 124333, "epoch": 2960} {"train_loss": -6.588436126708984, "global_step": 124334, "epoch": 2960} {"train_loss": -6.6244964599609375, "global_step": 124335, "epoch": 2960} {"train_loss": -6.617349624633789, "global_step": 124336, "epoch": 2960} {"train_loss": -6.699028968811035, "global_step": 124337, "epoch": 2960} {"train_loss": -6.599616050720215, "global_step": 124338, "epoch": 2960} {"train_loss": -6.6452436447143555, "global_step": 124339, "epoch": 2960} {"train_loss": -6.688506126403809, "global_step": 124340, "epoch": 2960} {"train_loss": -6.671077728271484, "global_step": 124341, "epoch": 2960} {"train_loss": -6.596415042877197, "global_step": 124342, "epoch": 2960} {"train_loss": -6.595894813537598, "global_step": 124343, "epoch": 2960} {"train_loss": -6.6305460929870605, "global_step": 124344, "epoch": 2960} {"train_loss": -6.719627380371094, "global_step": 124345, "epoch": 2960} {"train_loss": -6.647305488586426, "global_step": 124346, "epoch": 2960} {"train_loss": -6.711036682128906, "global_step": 124347, "epoch": 2960} {"train_loss": -6.702712059020996, "global_step": 124348, "epoch": 2960} {"train_loss": -6.606905937194824, "global_step": 124349, "epoch": 2960} {"train_loss": -6.551969528198242, "global_step": 124350, "epoch": 2960} {"train_loss": -6.514072895050049, "global_step": 124351, "epoch": 2960} {"train_loss": -6.592363357543945, "global_step": 124352, "epoch": 2960} {"train_loss": -6.560849189758301, "global_step": 124353, "epoch": 2960} {"train_loss": -6.669541835784912, "global_step": 124354, "epoch": 2960} {"train_loss": -6.575897693634033, "global_step": 124355, "epoch": 2960} {"train_loss": -6.699215888977051, "global_step": 124356, "epoch": 2960} {"train_loss": -6.609498023986816, "global_step": 124357, "epoch": 2960} {"train_loss": -6.530359268188477, "global_step": 124358, "epoch": 2960} {"train_loss": -6.6391801834106445, "global_step": 124359, "epoch": 2960} {"train_loss": -6.552374839782715, "global_step": 124360, "epoch": 2960} {"train_loss": -6.599638904844012, "global_step": 124361, "epoch": 2960, "val_loss": 77454.1328125} {"train_loss": -6.538908958435059, "global_step": 124362, "epoch": 2961} {"train_loss": -6.686756134033203, "global_step": 124363, "epoch": 2961} {"train_loss": -6.477181911468506, "global_step": 124364, "epoch": 2961} {"train_loss": -6.556812286376953, "global_step": 124365, "epoch": 2961} {"train_loss": -6.622219085693359, "global_step": 124366, "epoch": 2961} {"train_loss": -6.485709190368652, "global_step": 124367, "epoch": 2961} {"train_loss": -6.605292320251465, "global_step": 124368, "epoch": 2961} {"train_loss": -6.633407115936279, "global_step": 124369, "epoch": 2961} {"train_loss": -6.633929252624512, "global_step": 124370, "epoch": 2961} {"train_loss": -6.6377458572387695, "global_step": 124371, "epoch": 2961} {"train_loss": -6.57327938079834, "global_step": 124372, "epoch": 2961} {"train_loss": -6.625369071960449, "global_step": 124373, "epoch": 2961} {"train_loss": -6.4747724533081055, "global_step": 124374, "epoch": 2961} {"train_loss": -6.597938537597656, "global_step": 124375, "epoch": 2961} {"train_loss": -6.472649097442627, "global_step": 124376, "epoch": 2961} {"train_loss": -6.595229148864746, "global_step": 124377, "epoch": 2961} {"train_loss": -6.560475826263428, "global_step": 124378, "epoch": 2961} {"train_loss": -6.608161926269531, "global_step": 124379, "epoch": 2961} {"train_loss": -6.569268226623535, "global_step": 124380, "epoch": 2961} {"train_loss": -6.505954742431641, "global_step": 124381, "epoch": 2961} {"train_loss": -6.614253044128418, "global_step": 124382, "epoch": 2961} {"train_loss": -6.590964317321777, "global_step": 124383, "epoch": 2961} {"train_loss": -6.618000507354736, "global_step": 124384, "epoch": 2961} {"train_loss": -6.624971389770508, "global_step": 124385, "epoch": 2961} {"train_loss": -6.67949104309082, "global_step": 124386, "epoch": 2961} {"train_loss": -6.709765434265137, "global_step": 124387, "epoch": 2961} {"train_loss": -6.607661247253418, "global_step": 124388, "epoch": 2961} {"train_loss": -6.554319858551025, "global_step": 124389, "epoch": 2961} {"train_loss": -6.604193687438965, "global_step": 124390, "epoch": 2961} {"train_loss": -6.599656105041504, "global_step": 124391, "epoch": 2961} {"train_loss": -6.58811616897583, "global_step": 124392, "epoch": 2961} {"train_loss": -6.623518943786621, "global_step": 124393, "epoch": 2961} {"train_loss": -6.661186218261719, "global_step": 124394, "epoch": 2961} {"train_loss": -6.719151973724365, "global_step": 124395, "epoch": 2961} {"train_loss": -6.572081565856934, "global_step": 124396, "epoch": 2961} {"train_loss": -6.602109909057617, "global_step": 124397, "epoch": 2961} {"train_loss": -6.592750549316406, "global_step": 124398, "epoch": 2961} {"train_loss": -6.700338840484619, "global_step": 124399, "epoch": 2961} {"train_loss": -6.516544342041016, "global_step": 124400, "epoch": 2961} {"train_loss": -6.69650936126709, "global_step": 124401, "epoch": 2961} {"train_loss": -6.71767520904541, "global_step": 124402, "epoch": 2961} {"train_loss": -6.603630951472691, "global_step": 124403, "epoch": 2961, "val_loss": 77199.6953125} {"train_loss": -6.5799760818481445, "global_step": 124404, "epoch": 2962} {"train_loss": -6.621809959411621, "global_step": 124405, "epoch": 2962} {"train_loss": -6.661318302154541, "global_step": 124406, "epoch": 2962} {"train_loss": -6.637452602386475, "global_step": 124407, "epoch": 2962} {"train_loss": -6.481715679168701, "global_step": 124408, "epoch": 2962} {"train_loss": -6.548213958740234, "global_step": 124409, "epoch": 2962} {"train_loss": -6.560578346252441, "global_step": 124410, "epoch": 2962} {"train_loss": -6.618778705596924, "global_step": 124411, "epoch": 2962} {"train_loss": -6.624417304992676, "global_step": 124412, "epoch": 2962} {"train_loss": -6.531771659851074, "global_step": 124413, "epoch": 2962} {"train_loss": -6.530031204223633, "global_step": 124414, "epoch": 2962} {"train_loss": -6.629362106323242, "global_step": 124415, "epoch": 2962} {"train_loss": -6.61470890045166, "global_step": 124416, "epoch": 2962} {"train_loss": -6.704207420349121, "global_step": 124417, "epoch": 2962} {"train_loss": -6.598784923553467, "global_step": 124418, "epoch": 2962} {"train_loss": -6.644815921783447, "global_step": 124419, "epoch": 2962} {"train_loss": -6.715346336364746, "global_step": 124420, "epoch": 2962} {"train_loss": -6.690454483032227, "global_step": 124421, "epoch": 2962} {"train_loss": -6.611900329589844, "global_step": 124422, "epoch": 2962} {"train_loss": -6.605363845825195, "global_step": 124423, "epoch": 2962} {"train_loss": -6.710628509521484, "global_step": 124424, "epoch": 2962} {"train_loss": -6.609535217285156, "global_step": 124425, "epoch": 2962} {"train_loss": -6.7117462158203125, "global_step": 124426, "epoch": 2962} {"train_loss": -6.774956703186035, "global_step": 124427, "epoch": 2962} {"train_loss": -6.581836700439453, "global_step": 124428, "epoch": 2962} {"train_loss": -6.5986528396606445, "global_step": 124429, "epoch": 2962} {"train_loss": -6.585421085357666, "global_step": 124430, "epoch": 2962} {"train_loss": -6.596881866455078, "global_step": 124431, "epoch": 2962} {"train_loss": -6.593725681304932, "global_step": 124432, "epoch": 2962} {"train_loss": -6.545744895935059, "global_step": 124433, "epoch": 2962} {"train_loss": -6.638045787811279, "global_step": 124434, "epoch": 2962} {"train_loss": -6.618557453155518, "global_step": 124435, "epoch": 2962} {"train_loss": -6.540380477905273, "global_step": 124436, "epoch": 2962} {"train_loss": -6.674720764160156, "global_step": 124437, "epoch": 2962} {"train_loss": -6.578944206237793, "global_step": 124438, "epoch": 2962} {"train_loss": -6.618653297424316, "global_step": 124439, "epoch": 2962} {"train_loss": -6.6161370277404785, "global_step": 124440, "epoch": 2962} {"train_loss": -6.67402458190918, "global_step": 124441, "epoch": 2962} {"train_loss": -6.645317554473877, "global_step": 124442, "epoch": 2962} {"train_loss": -6.639484405517578, "global_step": 124443, "epoch": 2962} {"train_loss": -6.572658538818359, "global_step": 124444, "epoch": 2962} {"train_loss": -6.622996727625529, "global_step": 124445, "epoch": 2962, "val_loss": 76973.2109375} {"train_loss": -6.514017105102539, "global_step": 124446, "epoch": 2963} {"train_loss": -6.619995594024658, "global_step": 124447, "epoch": 2963} {"train_loss": -6.583197593688965, "global_step": 124448, "epoch": 2963} {"train_loss": -6.662670135498047, "global_step": 124449, "epoch": 2963} {"train_loss": -6.5401458740234375, "global_step": 124450, "epoch": 2963} {"train_loss": -6.524576663970947, "global_step": 124451, "epoch": 2963} {"train_loss": -6.474494934082031, "global_step": 124452, "epoch": 2963} {"train_loss": -6.551485061645508, "global_step": 124453, "epoch": 2963} {"train_loss": -6.567854881286621, "global_step": 124454, "epoch": 2963} {"train_loss": -6.488857269287109, "global_step": 124455, "epoch": 2963} {"train_loss": -6.442700386047363, "global_step": 124456, "epoch": 2963} {"train_loss": -6.599617958068848, "global_step": 124457, "epoch": 2963} {"train_loss": -6.5830769538879395, "global_step": 124458, "epoch": 2963} {"train_loss": -6.741034507751465, "global_step": 124459, "epoch": 2963} {"train_loss": -6.668304920196533, "global_step": 124460, "epoch": 2963} {"train_loss": -6.633829593658447, "global_step": 124461, "epoch": 2963} {"train_loss": -6.663907051086426, "global_step": 124462, "epoch": 2963} {"train_loss": -6.660376071929932, "global_step": 124463, "epoch": 2963} {"train_loss": -6.542545318603516, "global_step": 124464, "epoch": 2963} {"train_loss": -6.68255090713501, "global_step": 124465, "epoch": 2963} {"train_loss": -6.698759078979492, "global_step": 124466, "epoch": 2963} {"train_loss": -6.717742919921875, "global_step": 124467, "epoch": 2963} {"train_loss": -6.660759449005127, "global_step": 124468, "epoch": 2963} {"train_loss": -6.71434211730957, "global_step": 124469, "epoch": 2963} {"train_loss": -6.68415641784668, "global_step": 124470, "epoch": 2963} {"train_loss": -6.566454887390137, "global_step": 124471, "epoch": 2963} {"train_loss": -6.719785690307617, "global_step": 124472, "epoch": 2963} {"train_loss": -6.705842018127441, "global_step": 124473, "epoch": 2963} {"train_loss": -6.70280647277832, "global_step": 124474, "epoch": 2963} {"train_loss": -6.669857025146484, "global_step": 124475, "epoch": 2963} {"train_loss": -6.552717685699463, "global_step": 124476, "epoch": 2963} {"train_loss": -6.598941802978516, "global_step": 124477, "epoch": 2963} {"train_loss": -6.604031085968018, "global_step": 124478, "epoch": 2963} {"train_loss": -6.548407077789307, "global_step": 124479, "epoch": 2963} {"train_loss": -6.717221736907959, "global_step": 124480, "epoch": 2963} {"train_loss": -6.593062400817871, "global_step": 124481, "epoch": 2963} {"train_loss": -6.605706691741943, "global_step": 124482, "epoch": 2963} {"train_loss": -6.614252090454102, "global_step": 124483, "epoch": 2963} {"train_loss": -6.698819637298584, "global_step": 124484, "epoch": 2963} {"train_loss": -6.725111961364746, "global_step": 124485, "epoch": 2963} {"train_loss": -6.489077568054199, "global_step": 124486, "epoch": 2963} {"train_loss": -6.619574138096401, "global_step": 124487, "epoch": 2963, "val_loss": 76949.0859375} {"train_loss": -6.640594482421875, "global_step": 124488, "epoch": 2964} {"train_loss": -6.588863372802734, "global_step": 124489, "epoch": 2964} {"train_loss": -6.644144058227539, "global_step": 124490, "epoch": 2964} {"train_loss": -6.663558483123779, "global_step": 124491, "epoch": 2964} {"train_loss": -6.515833854675293, "global_step": 124492, "epoch": 2964} {"train_loss": -6.568793773651123, "global_step": 124493, "epoch": 2964} {"train_loss": -6.564234733581543, "global_step": 124494, "epoch": 2964} {"train_loss": -6.639880180358887, "global_step": 124495, "epoch": 2964} {"train_loss": -6.578363418579102, "global_step": 124496, "epoch": 2964} {"train_loss": -6.490894317626953, "global_step": 124497, "epoch": 2964} {"train_loss": -6.6261749267578125, "global_step": 124498, "epoch": 2964} {"train_loss": -6.569539546966553, "global_step": 124499, "epoch": 2964} {"train_loss": -6.511235237121582, "global_step": 124500, "epoch": 2964} {"train_loss": -6.415477275848389, "global_step": 124501, "epoch": 2964} {"train_loss": -6.678081512451172, "global_step": 124502, "epoch": 2964} {"train_loss": -6.427133560180664, "global_step": 124503, "epoch": 2964} {"train_loss": -6.443063735961914, "global_step": 124504, "epoch": 2964} {"train_loss": -6.509602069854736, "global_step": 124505, "epoch": 2964} {"train_loss": -6.5050554275512695, "global_step": 124506, "epoch": 2964} {"train_loss": -6.579574108123779, "global_step": 124507, "epoch": 2964} {"train_loss": -6.531752586364746, "global_step": 124508, "epoch": 2964} {"train_loss": -6.670100688934326, "global_step": 124509, "epoch": 2964} {"train_loss": -6.6943254470825195, "global_step": 124510, "epoch": 2964} {"train_loss": -6.5454206466674805, "global_step": 124511, "epoch": 2964} {"train_loss": -6.557796955108643, "global_step": 124512, "epoch": 2964} {"train_loss": -6.663764953613281, "global_step": 124513, "epoch": 2964} {"train_loss": -6.690912246704102, "global_step": 124514, "epoch": 2964} {"train_loss": -6.612002372741699, "global_step": 124515, "epoch": 2964} {"train_loss": -6.601643085479736, "global_step": 124516, "epoch": 2964} {"train_loss": -6.627537250518799, "global_step": 124517, "epoch": 2964} {"train_loss": -6.75740909576416, "global_step": 124518, "epoch": 2964} {"train_loss": -6.591628551483154, "global_step": 124519, "epoch": 2964} {"train_loss": -6.619336128234863, "global_step": 124520, "epoch": 2964} {"train_loss": -6.623059272766113, "global_step": 124521, "epoch": 2964} {"train_loss": -6.680590629577637, "global_step": 124522, "epoch": 2964} {"train_loss": -6.636407852172852, "global_step": 124523, "epoch": 2964} {"train_loss": -6.630705833435059, "global_step": 124524, "epoch": 2964} {"train_loss": -6.558167457580566, "global_step": 124525, "epoch": 2964} {"train_loss": -6.678229331970215, "global_step": 124526, "epoch": 2964} {"train_loss": -6.491272926330566, "global_step": 124527, "epoch": 2964} {"train_loss": -6.590704441070557, "global_step": 124528, "epoch": 2964} {"train_loss": -6.58940559341794, "global_step": 124529, "epoch": 2964, "val_loss": 77263.140625} {"train_loss": -6.546501159667969, "global_step": 124530, "epoch": 2965} {"train_loss": -6.603385925292969, "global_step": 124531, "epoch": 2965} {"train_loss": -6.597568511962891, "global_step": 124532, "epoch": 2965} {"train_loss": -6.675698280334473, "global_step": 124533, "epoch": 2965} {"train_loss": -6.627857685089111, "global_step": 124534, "epoch": 2965} {"train_loss": -6.558533668518066, "global_step": 124535, "epoch": 2965} {"train_loss": -6.659728050231934, "global_step": 124536, "epoch": 2965} {"train_loss": -6.611964225769043, "global_step": 124537, "epoch": 2965} {"train_loss": -6.494417190551758, "global_step": 124538, "epoch": 2965} {"train_loss": -6.6083550453186035, "global_step": 124539, "epoch": 2965} {"train_loss": -6.677982330322266, "global_step": 124540, "epoch": 2965} {"train_loss": -6.445530891418457, "global_step": 124541, "epoch": 2965} {"train_loss": -6.651406764984131, "global_step": 124542, "epoch": 2965} {"train_loss": -6.44828987121582, "global_step": 124543, "epoch": 2965} {"train_loss": -6.5048675537109375, "global_step": 124544, "epoch": 2965} {"train_loss": -6.516919136047363, "global_step": 124545, "epoch": 2965} {"train_loss": -6.465137004852295, "global_step": 124546, "epoch": 2965} {"train_loss": -6.511273384094238, "global_step": 124547, "epoch": 2965} {"train_loss": -6.563363075256348, "global_step": 124548, "epoch": 2965} {"train_loss": -6.644933223724365, "global_step": 124549, "epoch": 2965} {"train_loss": -6.533137321472168, "global_step": 124550, "epoch": 2965} {"train_loss": -6.607017517089844, "global_step": 124551, "epoch": 2965} {"train_loss": -6.693033218383789, "global_step": 124552, "epoch": 2965} {"train_loss": -6.60864782333374, "global_step": 124553, "epoch": 2965} {"train_loss": -6.619078636169434, "global_step": 124554, "epoch": 2965} {"train_loss": -6.573631286621094, "global_step": 124555, "epoch": 2965} {"train_loss": -6.53604793548584, "global_step": 124556, "epoch": 2965} {"train_loss": -6.584654808044434, "global_step": 124557, "epoch": 2965} {"train_loss": -6.650482177734375, "global_step": 124558, "epoch": 2965} {"train_loss": -6.4660539627075195, "global_step": 124559, "epoch": 2965} {"train_loss": -6.596344947814941, "global_step": 124560, "epoch": 2965} {"train_loss": -6.683948040008545, "global_step": 124561, "epoch": 2965} {"train_loss": -6.620450973510742, "global_step": 124562, "epoch": 2965} {"train_loss": -6.575251579284668, "global_step": 124563, "epoch": 2965} {"train_loss": -6.47205924987793, "global_step": 124564, "epoch": 2965} {"train_loss": -6.632033824920654, "global_step": 124565, "epoch": 2965} {"train_loss": -6.621306419372559, "global_step": 124566, "epoch": 2965} {"train_loss": -6.538451671600342, "global_step": 124567, "epoch": 2965} {"train_loss": -6.554566860198975, "global_step": 124568, "epoch": 2965} {"train_loss": -6.47273063659668, "global_step": 124569, "epoch": 2965} {"train_loss": -6.598300933837891, "global_step": 124570, "epoch": 2965} {"train_loss": -6.578889108839489, "global_step": 124571, "epoch": 2965, "val_loss": 77057.609375} {"train_loss": -6.554488182067871, "global_step": 124572, "epoch": 2966} {"train_loss": -6.578902244567871, "global_step": 124573, "epoch": 2966} {"train_loss": -6.672243118286133, "global_step": 124574, "epoch": 2966} {"train_loss": -6.603442192077637, "global_step": 124575, "epoch": 2966} {"train_loss": -6.664756774902344, "global_step": 124576, "epoch": 2966} {"train_loss": -6.524040699005127, "global_step": 124577, "epoch": 2966} {"train_loss": -6.594928741455078, "global_step": 124578, "epoch": 2966} {"train_loss": -6.667056560516357, "global_step": 124579, "epoch": 2966} {"train_loss": -6.675137519836426, "global_step": 124580, "epoch": 2966} {"train_loss": -6.660727500915527, "global_step": 124581, "epoch": 2966} {"train_loss": -6.624868869781494, "global_step": 124582, "epoch": 2966} {"train_loss": -6.579168796539307, "global_step": 124583, "epoch": 2966} {"train_loss": -6.610587120056152, "global_step": 124584, "epoch": 2966} {"train_loss": -6.557504177093506, "global_step": 124585, "epoch": 2966} {"train_loss": -6.654818534851074, "global_step": 124586, "epoch": 2966} {"train_loss": -6.5469207763671875, "global_step": 124587, "epoch": 2966} {"train_loss": -6.539671421051025, "global_step": 124588, "epoch": 2966} {"train_loss": -6.738818645477295, "global_step": 124589, "epoch": 2966} {"train_loss": -6.583437442779541, "global_step": 124590, "epoch": 2966} {"train_loss": -6.498957633972168, "global_step": 124591, "epoch": 2966} {"train_loss": -6.4220685958862305, "global_step": 124592, "epoch": 2966} {"train_loss": -6.554714679718018, "global_step": 124593, "epoch": 2966} {"train_loss": -6.516331672668457, "global_step": 124594, "epoch": 2966} {"train_loss": -6.535849094390869, "global_step": 124595, "epoch": 2966} {"train_loss": -6.594841480255127, "global_step": 124596, "epoch": 2966} {"train_loss": -6.575832366943359, "global_step": 124597, "epoch": 2966} {"train_loss": -6.7201433181762695, "global_step": 124598, "epoch": 2966} {"train_loss": -6.575684547424316, "global_step": 124599, "epoch": 2966} {"train_loss": -6.692266464233398, "global_step": 124600, "epoch": 2966} {"train_loss": -6.623051643371582, "global_step": 124601, "epoch": 2966} {"train_loss": -6.483445167541504, "global_step": 124602, "epoch": 2966} {"train_loss": -6.45726203918457, "global_step": 124603, "epoch": 2966} {"train_loss": -6.585488319396973, "global_step": 124604, "epoch": 2966} {"train_loss": -6.601642608642578, "global_step": 124605, "epoch": 2966} {"train_loss": -6.692615509033203, "global_step": 124606, "epoch": 2966} {"train_loss": -6.652454853057861, "global_step": 124607, "epoch": 2966} {"train_loss": -6.70962381362915, "global_step": 124608, "epoch": 2966} {"train_loss": -6.614907264709473, "global_step": 124609, "epoch": 2966} {"train_loss": -6.640998840332031, "global_step": 124610, "epoch": 2966} {"train_loss": -6.55142879486084, "global_step": 124611, "epoch": 2966} {"train_loss": -6.68129825592041, "global_step": 124612, "epoch": 2966} {"train_loss": -6.602968738192604, "global_step": 124613, "epoch": 2966, "val_loss": 77200.1875} {"train_loss": -6.680814743041992, "global_step": 124614, "epoch": 2967} {"train_loss": -6.696032524108887, "global_step": 124615, "epoch": 2967} {"train_loss": -6.66236686706543, "global_step": 124616, "epoch": 2967} {"train_loss": -6.662870407104492, "global_step": 124617, "epoch": 2967} {"train_loss": -6.6073808670043945, "global_step": 124618, "epoch": 2967} {"train_loss": -6.721363544464111, "global_step": 124619, "epoch": 2967} {"train_loss": -6.574135780334473, "global_step": 124620, "epoch": 2967} {"train_loss": -6.481186389923096, "global_step": 124621, "epoch": 2967} {"train_loss": -6.63704252243042, "global_step": 124622, "epoch": 2967} {"train_loss": -6.587327003479004, "global_step": 124623, "epoch": 2967} {"train_loss": -6.694408416748047, "global_step": 124624, "epoch": 2967} {"train_loss": -6.678640365600586, "global_step": 124625, "epoch": 2967} {"train_loss": -6.60174036026001, "global_step": 124626, "epoch": 2967} {"train_loss": -6.602906227111816, "global_step": 124627, "epoch": 2967} {"train_loss": -6.654768466949463, "global_step": 124628, "epoch": 2967} {"train_loss": -6.707404136657715, "global_step": 124629, "epoch": 2967} {"train_loss": -6.604743957519531, "global_step": 124630, "epoch": 2967} {"train_loss": -6.506566047668457, "global_step": 124631, "epoch": 2967} {"train_loss": -6.573087215423584, "global_step": 124632, "epoch": 2967} {"train_loss": -6.632801532745361, "global_step": 124633, "epoch": 2967} {"train_loss": -6.714824676513672, "global_step": 124634, "epoch": 2967} {"train_loss": -6.6140971183776855, "global_step": 124635, "epoch": 2967} {"train_loss": -6.482545852661133, "global_step": 124636, "epoch": 2967} {"train_loss": -6.511722564697266, "global_step": 124637, "epoch": 2967} {"train_loss": -6.640835762023926, "global_step": 124638, "epoch": 2967} {"train_loss": -6.500421524047852, "global_step": 124639, "epoch": 2967} {"train_loss": -6.7196044921875, "global_step": 124640, "epoch": 2967} {"train_loss": -6.5859222412109375, "global_step": 124641, "epoch": 2967} {"train_loss": -6.624421119689941, "global_step": 124642, "epoch": 2967} {"train_loss": -6.728806495666504, "global_step": 124643, "epoch": 2967} {"train_loss": -6.6501665115356445, "global_step": 124644, "epoch": 2967} {"train_loss": -6.630886554718018, "global_step": 124645, "epoch": 2967} {"train_loss": -6.668512344360352, "global_step": 124646, "epoch": 2967} {"train_loss": -6.604791641235352, "global_step": 124647, "epoch": 2967} {"train_loss": -6.670345783233643, "global_step": 124648, "epoch": 2967} {"train_loss": -6.554352283477783, "global_step": 124649, "epoch": 2967} {"train_loss": -6.721902370452881, "global_step": 124650, "epoch": 2967} {"train_loss": -6.594274044036865, "global_step": 124651, "epoch": 2967} {"train_loss": -6.67417049407959, "global_step": 124652, "epoch": 2967} {"train_loss": -6.475004196166992, "global_step": 124653, "epoch": 2967} {"train_loss": -6.525298118591309, "global_step": 124654, "epoch": 2967} {"train_loss": -6.621308201835269, "global_step": 124655, "epoch": 2967, "val_loss": 77107.765625} {"train_loss": -6.483304023742676, "global_step": 124656, "epoch": 2968} {"train_loss": -6.5543012619018555, "global_step": 124657, "epoch": 2968} {"train_loss": -6.5893473625183105, "global_step": 124658, "epoch": 2968} {"train_loss": -6.574556827545166, "global_step": 124659, "epoch": 2968} {"train_loss": -6.535356044769287, "global_step": 124660, "epoch": 2968} {"train_loss": -6.6271772384643555, "global_step": 124661, "epoch": 2968} {"train_loss": -6.426833629608154, "global_step": 124662, "epoch": 2968} {"train_loss": -6.491170883178711, "global_step": 124663, "epoch": 2968} {"train_loss": -6.619747638702393, "global_step": 124664, "epoch": 2968} {"train_loss": -6.621216773986816, "global_step": 124665, "epoch": 2968} {"train_loss": -6.636868476867676, "global_step": 124666, "epoch": 2968} {"train_loss": -6.596792697906494, "global_step": 124667, "epoch": 2968} {"train_loss": -6.511440277099609, "global_step": 124668, "epoch": 2968} {"train_loss": -6.684299468994141, "global_step": 124669, "epoch": 2968} {"train_loss": -6.57563591003418, "global_step": 124670, "epoch": 2968} {"train_loss": -6.6369524002075195, "global_step": 124671, "epoch": 2968} {"train_loss": -6.582693099975586, "global_step": 124672, "epoch": 2968} {"train_loss": -6.543783187866211, "global_step": 124673, "epoch": 2968} {"train_loss": -6.668498516082764, "global_step": 124674, "epoch": 2968} {"train_loss": -6.516235828399658, "global_step": 124675, "epoch": 2968} {"train_loss": -6.457555770874023, "global_step": 124676, "epoch": 2968} {"train_loss": -6.6228179931640625, "global_step": 124677, "epoch": 2968} {"train_loss": -6.600336074829102, "global_step": 124678, "epoch": 2968} {"train_loss": -6.5673933029174805, "global_step": 124679, "epoch": 2968} {"train_loss": -6.617144584655762, "global_step": 124680, "epoch": 2968} {"train_loss": -6.3623552322387695, "global_step": 124681, "epoch": 2968} {"train_loss": -6.6802825927734375, "global_step": 124682, "epoch": 2968} {"train_loss": -6.557672023773193, "global_step": 124683, "epoch": 2968} {"train_loss": -6.59263801574707, "global_step": 124684, "epoch": 2968} {"train_loss": -6.61814022064209, "global_step": 124685, "epoch": 2968} {"train_loss": -6.531926155090332, "global_step": 124686, "epoch": 2968} {"train_loss": -6.57710599899292, "global_step": 124687, "epoch": 2968} {"train_loss": -6.4706854820251465, "global_step": 124688, "epoch": 2968} {"train_loss": -6.537537574768066, "global_step": 124689, "epoch": 2968} {"train_loss": -6.586007118225098, "global_step": 124690, "epoch": 2968} {"train_loss": -6.439980983734131, "global_step": 124691, "epoch": 2968} {"train_loss": -6.613058090209961, "global_step": 124692, "epoch": 2968} {"train_loss": -6.43405818939209, "global_step": 124693, "epoch": 2968} {"train_loss": -6.646466255187988, "global_step": 124694, "epoch": 2968} {"train_loss": -6.47126579284668, "global_step": 124695, "epoch": 2968} {"train_loss": -6.570280075073242, "global_step": 124696, "epoch": 2968} {"train_loss": -6.560968319574992, "global_step": 124697, "epoch": 2968, "val_loss": 77161.9375} {"train_loss": -6.526597499847412, "global_step": 124698, "epoch": 2969} {"train_loss": -6.617818832397461, "global_step": 124699, "epoch": 2969} {"train_loss": -6.534498691558838, "global_step": 124700, "epoch": 2969} {"train_loss": -6.474577903747559, "global_step": 124701, "epoch": 2969} {"train_loss": -6.501761436462402, "global_step": 124702, "epoch": 2969} {"train_loss": -6.5849199295043945, "global_step": 124703, "epoch": 2969} {"train_loss": -6.48360013961792, "global_step": 124704, "epoch": 2969} {"train_loss": -6.63687801361084, "global_step": 124705, "epoch": 2969} {"train_loss": -6.534728050231934, "global_step": 124706, "epoch": 2969} {"train_loss": -6.6722540855407715, "global_step": 124707, "epoch": 2969} {"train_loss": -6.543334007263184, "global_step": 124708, "epoch": 2969} {"train_loss": -6.6981096267700195, "global_step": 124709, "epoch": 2969} {"train_loss": -6.620545387268066, "global_step": 124710, "epoch": 2969} {"train_loss": -6.574697494506836, "global_step": 124711, "epoch": 2969} {"train_loss": -6.668425559997559, "global_step": 124712, "epoch": 2969} {"train_loss": -6.614081382751465, "global_step": 124713, "epoch": 2969} {"train_loss": -6.595534801483154, "global_step": 124714, "epoch": 2969} {"train_loss": -6.631247043609619, "global_step": 124715, "epoch": 2969} {"train_loss": -6.515101909637451, "global_step": 124716, "epoch": 2969} {"train_loss": -6.682153701782227, "global_step": 124717, "epoch": 2969} {"train_loss": -6.690283298492432, "global_step": 124718, "epoch": 2969} {"train_loss": -6.651832580566406, "global_step": 124719, "epoch": 2969} {"train_loss": -6.683220863342285, "global_step": 124720, "epoch": 2969} {"train_loss": -6.631705284118652, "global_step": 124721, "epoch": 2969} {"train_loss": -6.7056474685668945, "global_step": 124722, "epoch": 2969} {"train_loss": -6.697571277618408, "global_step": 124723, "epoch": 2969} {"train_loss": -6.641232013702393, "global_step": 124724, "epoch": 2969} {"train_loss": -6.581114768981934, "global_step": 124725, "epoch": 2969} {"train_loss": -6.664379119873047, "global_step": 124726, "epoch": 2969} {"train_loss": -6.520357131958008, "global_step": 124727, "epoch": 2969} {"train_loss": -6.57121467590332, "global_step": 124728, "epoch": 2969} {"train_loss": -6.703855991363525, "global_step": 124729, "epoch": 2969} {"train_loss": -6.6660637855529785, "global_step": 124730, "epoch": 2969} {"train_loss": -6.649177551269531, "global_step": 124731, "epoch": 2969} {"train_loss": -6.571812629699707, "global_step": 124732, "epoch": 2969} {"train_loss": -6.75434684753418, "global_step": 124733, "epoch": 2969} {"train_loss": -6.546156406402588, "global_step": 124734, "epoch": 2969} {"train_loss": -6.65573787689209, "global_step": 124735, "epoch": 2969} {"train_loss": -6.684122085571289, "global_step": 124736, "epoch": 2969} {"train_loss": -6.507891654968262, "global_step": 124737, "epoch": 2969} {"train_loss": -6.7400360107421875, "global_step": 124738, "epoch": 2969} {"train_loss": -6.614963599613735, "global_step": 124739, "epoch": 2969, "val_loss": 76936.3671875} {"train_loss": -6.620294094085693, "global_step": 124740, "epoch": 2970} {"train_loss": -6.68710994720459, "global_step": 124741, "epoch": 2970} {"train_loss": -6.6491193771362305, "global_step": 124742, "epoch": 2970} {"train_loss": -6.618927001953125, "global_step": 124743, "epoch": 2970} {"train_loss": -6.529306411743164, "global_step": 124744, "epoch": 2970} {"train_loss": -6.520603179931641, "global_step": 124745, "epoch": 2970} {"train_loss": -6.702709674835205, "global_step": 124746, "epoch": 2970} {"train_loss": -6.642815113067627, "global_step": 124747, "epoch": 2970} {"train_loss": -6.624703884124756, "global_step": 124748, "epoch": 2970} {"train_loss": -6.724185943603516, "global_step": 124749, "epoch": 2970} {"train_loss": -6.766953945159912, "global_step": 124750, "epoch": 2970} {"train_loss": -6.535304069519043, "global_step": 124751, "epoch": 2970} {"train_loss": -6.715305805206299, "global_step": 124752, "epoch": 2970} {"train_loss": -6.758051872253418, "global_step": 124753, "epoch": 2970} {"train_loss": -6.643038749694824, "global_step": 124754, "epoch": 2970} {"train_loss": -6.6879191398620605, "global_step": 124755, "epoch": 2970} {"train_loss": -6.592048168182373, "global_step": 124756, "epoch": 2970} {"train_loss": -6.669018745422363, "global_step": 124757, "epoch": 2970} {"train_loss": -6.752424716949463, "global_step": 124758, "epoch": 2970} {"train_loss": -6.6940131187438965, "global_step": 124759, "epoch": 2970} {"train_loss": -6.662179946899414, "global_step": 124760, "epoch": 2970} {"train_loss": -6.559457778930664, "global_step": 124761, "epoch": 2970} {"train_loss": -6.622488975524902, "global_step": 124762, "epoch": 2970} {"train_loss": -6.617618560791016, "global_step": 124763, "epoch": 2970} {"train_loss": -6.702289581298828, "global_step": 124764, "epoch": 2970} {"train_loss": -6.715380668640137, "global_step": 124765, "epoch": 2970} {"train_loss": -6.552554130554199, "global_step": 124766, "epoch": 2970} {"train_loss": -6.628627777099609, "global_step": 124767, "epoch": 2970} {"train_loss": -6.580782413482666, "global_step": 124768, "epoch": 2970} {"train_loss": -6.625927448272705, "global_step": 124769, "epoch": 2970} {"train_loss": -6.639545440673828, "global_step": 124770, "epoch": 2970} {"train_loss": -6.586301803588867, "global_step": 124771, "epoch": 2970} {"train_loss": -6.648369789123535, "global_step": 124772, "epoch": 2970} {"train_loss": -6.546181678771973, "global_step": 124773, "epoch": 2970} {"train_loss": -6.720076560974121, "global_step": 124774, "epoch": 2970} {"train_loss": -6.632364273071289, "global_step": 124775, "epoch": 2970} {"train_loss": -6.614871025085449, "global_step": 124776, "epoch": 2970} {"train_loss": -6.56772518157959, "global_step": 124777, "epoch": 2970} {"train_loss": -6.667510986328125, "global_step": 124778, "epoch": 2970} {"train_loss": -6.665656089782715, "global_step": 124779, "epoch": 2970} {"train_loss": -6.593869209289551, "global_step": 124780, "epoch": 2970} {"train_loss": -6.638608853022258, "global_step": 124781, "epoch": 2970, "val_loss": 77216.875} {"train_loss": -6.652233123779297, "global_step": 124782, "epoch": 2971} {"train_loss": -6.622968673706055, "global_step": 124783, "epoch": 2971} {"train_loss": -6.567021369934082, "global_step": 124784, "epoch": 2971} {"train_loss": -6.601980686187744, "global_step": 124785, "epoch": 2971} {"train_loss": -6.568944931030273, "global_step": 124786, "epoch": 2971} {"train_loss": -6.4694671630859375, "global_step": 124787, "epoch": 2971} {"train_loss": -6.561954498291016, "global_step": 124788, "epoch": 2971} {"train_loss": -6.583629608154297, "global_step": 124789, "epoch": 2971} {"train_loss": -6.6454596519470215, "global_step": 124790, "epoch": 2971} {"train_loss": -6.53880500793457, "global_step": 124791, "epoch": 2971} {"train_loss": -6.6469407081604, "global_step": 124792, "epoch": 2971} {"train_loss": -6.640326499938965, "global_step": 124793, "epoch": 2971} {"train_loss": -6.691048622131348, "global_step": 124794, "epoch": 2971} {"train_loss": -6.627435684204102, "global_step": 124795, "epoch": 2971} {"train_loss": -6.593513488769531, "global_step": 124796, "epoch": 2971} {"train_loss": -6.64571475982666, "global_step": 124797, "epoch": 2971} {"train_loss": -6.61461877822876, "global_step": 124798, "epoch": 2971} {"train_loss": -6.5687150955200195, "global_step": 124799, "epoch": 2971} {"train_loss": -6.6427764892578125, "global_step": 124800, "epoch": 2971} {"train_loss": -6.603794097900391, "global_step": 124801, "epoch": 2971} {"train_loss": -6.59410285949707, "global_step": 124802, "epoch": 2971} {"train_loss": -6.577112674713135, "global_step": 124803, "epoch": 2971} {"train_loss": -6.773502349853516, "global_step": 124804, "epoch": 2971} {"train_loss": -6.718211650848389, "global_step": 124805, "epoch": 2971} {"train_loss": -6.626712322235107, "global_step": 124806, "epoch": 2971} {"train_loss": -6.5578293800354, "global_step": 124807, "epoch": 2971} {"train_loss": -6.658769130706787, "global_step": 124808, "epoch": 2971} {"train_loss": -6.7004852294921875, "global_step": 124809, "epoch": 2971} {"train_loss": -6.723869323730469, "global_step": 124810, "epoch": 2971} {"train_loss": -6.668322563171387, "global_step": 124811, "epoch": 2971} {"train_loss": -6.624506950378418, "global_step": 124812, "epoch": 2971} {"train_loss": -6.620446681976318, "global_step": 124813, "epoch": 2971} {"train_loss": -6.574334621429443, "global_step": 124814, "epoch": 2971} {"train_loss": -6.726543426513672, "global_step": 124815, "epoch": 2971} {"train_loss": -6.645317077636719, "global_step": 124816, "epoch": 2971} {"train_loss": -6.691437721252441, "global_step": 124817, "epoch": 2971} {"train_loss": -6.461754322052002, "global_step": 124818, "epoch": 2971} {"train_loss": -6.54805850982666, "global_step": 124819, "epoch": 2971} {"train_loss": -6.515849590301514, "global_step": 124820, "epoch": 2971} {"train_loss": -6.571010589599609, "global_step": 124821, "epoch": 2971} {"train_loss": -6.697905540466309, "global_step": 124822, "epoch": 2971} {"train_loss": -6.62001541682652, "global_step": 124823, "epoch": 2971, "val_loss": 77276.421875} {"train_loss": -6.632970809936523, "global_step": 124824, "epoch": 2972} {"train_loss": -6.561971664428711, "global_step": 124825, "epoch": 2972} {"train_loss": -6.652178764343262, "global_step": 124826, "epoch": 2972} {"train_loss": -6.564202785491943, "global_step": 124827, "epoch": 2972} {"train_loss": -6.586625099182129, "global_step": 124828, "epoch": 2972} {"train_loss": -6.6794209480285645, "global_step": 124829, "epoch": 2972} {"train_loss": -6.669430732727051, "global_step": 124830, "epoch": 2972} {"train_loss": -6.6747589111328125, "global_step": 124831, "epoch": 2972} {"train_loss": -6.659968376159668, "global_step": 124832, "epoch": 2972} {"train_loss": -6.674684524536133, "global_step": 124833, "epoch": 2972} {"train_loss": -6.758586883544922, "global_step": 124834, "epoch": 2972} {"train_loss": -6.594470024108887, "global_step": 124835, "epoch": 2972} {"train_loss": -6.593541622161865, "global_step": 124836, "epoch": 2972} {"train_loss": -6.545501708984375, "global_step": 124837, "epoch": 2972} {"train_loss": -6.607928276062012, "global_step": 124838, "epoch": 2972} {"train_loss": -6.565263271331787, "global_step": 124839, "epoch": 2972} {"train_loss": -6.666769027709961, "global_step": 124840, "epoch": 2972} {"train_loss": -6.6147308349609375, "global_step": 124841, "epoch": 2972} {"train_loss": -6.565694808959961, "global_step": 124842, "epoch": 2972} {"train_loss": -6.561100006103516, "global_step": 124843, "epoch": 2972} {"train_loss": -6.603621006011963, "global_step": 124844, "epoch": 2972} {"train_loss": -6.576744079589844, "global_step": 124845, "epoch": 2972} {"train_loss": -6.706058502197266, "global_step": 124846, "epoch": 2972} {"train_loss": -6.657509803771973, "global_step": 124847, "epoch": 2972} {"train_loss": -6.6054487228393555, "global_step": 124848, "epoch": 2972} {"train_loss": -6.561816692352295, "global_step": 124849, "epoch": 2972} {"train_loss": -6.691851615905762, "global_step": 124850, "epoch": 2972} {"train_loss": -6.649285316467285, "global_step": 124851, "epoch": 2972} {"train_loss": -6.6640825271606445, "global_step": 124852, "epoch": 2972} {"train_loss": -6.554065227508545, "global_step": 124853, "epoch": 2972} {"train_loss": -6.637570381164551, "global_step": 124854, "epoch": 2972} {"train_loss": -6.667779922485352, "global_step": 124855, "epoch": 2972} {"train_loss": -6.736661911010742, "global_step": 124856, "epoch": 2972} {"train_loss": -6.695895671844482, "global_step": 124857, "epoch": 2972} {"train_loss": -6.663238048553467, "global_step": 124858, "epoch": 2972} {"train_loss": -6.474411964416504, "global_step": 124859, "epoch": 2972} {"train_loss": -6.718971252441406, "global_step": 124860, "epoch": 2972} {"train_loss": -6.683954238891602, "global_step": 124861, "epoch": 2972} {"train_loss": -6.411428451538086, "global_step": 124862, "epoch": 2972} {"train_loss": -6.4382500648498535, "global_step": 124863, "epoch": 2972} {"train_loss": -6.638284683227539, "global_step": 124864, "epoch": 2972} {"train_loss": -6.617852767308553, "global_step": 124865, "epoch": 2972, "val_loss": 77033.59375} {"train_loss": -6.629327774047852, "global_step": 124866, "epoch": 2973} {"train_loss": -6.526076316833496, "global_step": 124867, "epoch": 2973} {"train_loss": -6.69528341293335, "global_step": 124868, "epoch": 2973} {"train_loss": -6.668351173400879, "global_step": 124869, "epoch": 2973} {"train_loss": -6.664576530456543, "global_step": 124870, "epoch": 2973} {"train_loss": -6.529886245727539, "global_step": 124871, "epoch": 2973} {"train_loss": -6.595216274261475, "global_step": 124872, "epoch": 2973} {"train_loss": -6.5283966064453125, "global_step": 124873, "epoch": 2973} {"train_loss": -6.6176605224609375, "global_step": 124874, "epoch": 2973} {"train_loss": -6.548863887786865, "global_step": 124875, "epoch": 2973} {"train_loss": -6.638060569763184, "global_step": 124876, "epoch": 2973} {"train_loss": -6.552443504333496, "global_step": 124877, "epoch": 2973} {"train_loss": -6.688144683837891, "global_step": 124878, "epoch": 2973} {"train_loss": -6.607215881347656, "global_step": 124879, "epoch": 2973} {"train_loss": -6.629528999328613, "global_step": 124880, "epoch": 2973} {"train_loss": -6.63948917388916, "global_step": 124881, "epoch": 2973} {"train_loss": -6.60706901550293, "global_step": 124882, "epoch": 2973} {"train_loss": -6.555119037628174, "global_step": 124883, "epoch": 2973} {"train_loss": -6.668816089630127, "global_step": 124884, "epoch": 2973} {"train_loss": -6.614344596862793, "global_step": 124885, "epoch": 2973} {"train_loss": -6.5272932052612305, "global_step": 124886, "epoch": 2973} {"train_loss": -6.618922233581543, "global_step": 124887, "epoch": 2973} {"train_loss": -6.606152057647705, "global_step": 124888, "epoch": 2973} {"train_loss": -6.502999305725098, "global_step": 124889, "epoch": 2973} {"train_loss": -6.448290824890137, "global_step": 124890, "epoch": 2973} {"train_loss": -6.522023677825928, "global_step": 124891, "epoch": 2973} {"train_loss": -6.537149906158447, "global_step": 124892, "epoch": 2973} {"train_loss": -6.625271320343018, "global_step": 124893, "epoch": 2973} {"train_loss": -6.644383430480957, "global_step": 124894, "epoch": 2973} {"train_loss": -6.561456203460693, "global_step": 124895, "epoch": 2973} {"train_loss": -6.572605133056641, "global_step": 124896, "epoch": 2973} {"train_loss": -6.532558441162109, "global_step": 124897, "epoch": 2973} {"train_loss": -6.712292671203613, "global_step": 124898, "epoch": 2973} {"train_loss": -6.528232574462891, "global_step": 124899, "epoch": 2973} {"train_loss": -6.560821533203125, "global_step": 124900, "epoch": 2973} {"train_loss": -6.6360626220703125, "global_step": 124901, "epoch": 2973} {"train_loss": -6.607915878295898, "global_step": 124902, "epoch": 2973} {"train_loss": -6.638465881347656, "global_step": 124903, "epoch": 2973} {"train_loss": -6.538041114807129, "global_step": 124904, "epoch": 2973} {"train_loss": -6.650747299194336, "global_step": 124905, "epoch": 2973} {"train_loss": -6.647363662719727, "global_step": 124906, "epoch": 2973} {"train_loss": -6.595726819265456, "global_step": 124907, "epoch": 2973, "val_loss": 76995.625} {"train_loss": -6.68341064453125, "global_step": 124908, "epoch": 2974} {"train_loss": -6.73001766204834, "global_step": 124909, "epoch": 2974} {"train_loss": -6.636542797088623, "global_step": 124910, "epoch": 2974} {"train_loss": -6.692109107971191, "global_step": 124911, "epoch": 2974} {"train_loss": -6.692739486694336, "global_step": 124912, "epoch": 2974} {"train_loss": -6.538396835327148, "global_step": 124913, "epoch": 2974} {"train_loss": -6.6523051261901855, "global_step": 124914, "epoch": 2974} {"train_loss": -6.716673374176025, "global_step": 124915, "epoch": 2974} {"train_loss": -6.686985015869141, "global_step": 124916, "epoch": 2974} {"train_loss": -6.724167346954346, "global_step": 124917, "epoch": 2974} {"train_loss": -6.685323715209961, "global_step": 124918, "epoch": 2974} {"train_loss": -6.596419811248779, "global_step": 124919, "epoch": 2974} {"train_loss": -6.669469833374023, "global_step": 124920, "epoch": 2974} {"train_loss": -6.531606674194336, "global_step": 124921, "epoch": 2974} {"train_loss": -6.700160026550293, "global_step": 124922, "epoch": 2974} {"train_loss": -6.715728282928467, "global_step": 124923, "epoch": 2974} {"train_loss": -6.732255935668945, "global_step": 124924, "epoch": 2974} {"train_loss": -6.708029747009277, "global_step": 124925, "epoch": 2974} {"train_loss": -6.623960494995117, "global_step": 124926, "epoch": 2974} {"train_loss": -6.677383899688721, "global_step": 124927, "epoch": 2974} {"train_loss": -6.640214920043945, "global_step": 124928, "epoch": 2974} {"train_loss": -6.659838676452637, "global_step": 124929, "epoch": 2974} {"train_loss": -6.624076843261719, "global_step": 124930, "epoch": 2974} {"train_loss": -6.5226287841796875, "global_step": 124931, "epoch": 2974} {"train_loss": -6.6012067794799805, "global_step": 124932, "epoch": 2974} {"train_loss": -6.631496429443359, "global_step": 124933, "epoch": 2974} {"train_loss": -6.629739761352539, "global_step": 124934, "epoch": 2974} {"train_loss": -6.516671657562256, "global_step": 124935, "epoch": 2974} {"train_loss": -6.628323554992676, "global_step": 124936, "epoch": 2974} {"train_loss": -6.506588935852051, "global_step": 124937, "epoch": 2974} {"train_loss": -6.52412223815918, "global_step": 124938, "epoch": 2974} {"train_loss": -6.512939453125, "global_step": 124939, "epoch": 2974} {"train_loss": -6.486269950866699, "global_step": 124940, "epoch": 2974} {"train_loss": -6.660029411315918, "global_step": 124941, "epoch": 2974} {"train_loss": -6.502139568328857, "global_step": 124942, "epoch": 2974} {"train_loss": -6.483126640319824, "global_step": 124943, "epoch": 2974} {"train_loss": -6.58854341506958, "global_step": 124944, "epoch": 2974} {"train_loss": -6.3903279304504395, "global_step": 124945, "epoch": 2974} {"train_loss": -6.597714424133301, "global_step": 124946, "epoch": 2974} {"train_loss": -6.505784034729004, "global_step": 124947, "epoch": 2974} {"train_loss": -6.586098670959473, "global_step": 124948, "epoch": 2974} {"train_loss": -6.613205444245112, "global_step": 124949, "epoch": 2974, "val_loss": 77102.796875} {"train_loss": -6.559483528137207, "global_step": 124950, "epoch": 2975} {"train_loss": -6.602716445922852, "global_step": 124951, "epoch": 2975} {"train_loss": -6.605796813964844, "global_step": 124952, "epoch": 2975} {"train_loss": -6.603696346282959, "global_step": 124953, "epoch": 2975} {"train_loss": -6.5179643630981445, "global_step": 124954, "epoch": 2975} {"train_loss": -6.611242294311523, "global_step": 124955, "epoch": 2975} {"train_loss": -6.612524032592773, "global_step": 124956, "epoch": 2975} {"train_loss": -6.504383563995361, "global_step": 124957, "epoch": 2975} {"train_loss": -6.494120121002197, "global_step": 124958, "epoch": 2975} {"train_loss": -6.728470802307129, "global_step": 124959, "epoch": 2975} {"train_loss": -6.580264091491699, "global_step": 124960, "epoch": 2975} {"train_loss": -6.662250518798828, "global_step": 124961, "epoch": 2975} {"train_loss": -6.587802886962891, "global_step": 124962, "epoch": 2975} {"train_loss": -6.581080913543701, "global_step": 124963, "epoch": 2975} {"train_loss": -6.532742977142334, "global_step": 124964, "epoch": 2975} {"train_loss": -6.492055892944336, "global_step": 124965, "epoch": 2975} {"train_loss": -6.696741104125977, "global_step": 124966, "epoch": 2975} {"train_loss": -6.619679927825928, "global_step": 124967, "epoch": 2975} {"train_loss": -6.618992805480957, "global_step": 124968, "epoch": 2975} {"train_loss": -6.607593536376953, "global_step": 124969, "epoch": 2975} {"train_loss": -6.570034980773926, "global_step": 124970, "epoch": 2975} {"train_loss": -6.568973064422607, "global_step": 124971, "epoch": 2975} {"train_loss": -6.698484420776367, "global_step": 124972, "epoch": 2975} {"train_loss": -6.602529525756836, "global_step": 124973, "epoch": 2975} {"train_loss": -6.603850364685059, "global_step": 124974, "epoch": 2975} {"train_loss": -6.657841205596924, "global_step": 124975, "epoch": 2975} {"train_loss": -6.536273002624512, "global_step": 124976, "epoch": 2975} {"train_loss": -6.675136566162109, "global_step": 124977, "epoch": 2975} {"train_loss": -6.483614921569824, "global_step": 124978, "epoch": 2975} {"train_loss": -6.620689392089844, "global_step": 124979, "epoch": 2975} {"train_loss": -6.618068695068359, "global_step": 124980, "epoch": 2975} {"train_loss": -6.628874778747559, "global_step": 124981, "epoch": 2975} {"train_loss": -6.657367706298828, "global_step": 124982, "epoch": 2975} {"train_loss": -6.672477722167969, "global_step": 124983, "epoch": 2975} {"train_loss": -6.616113185882568, "global_step": 124984, "epoch": 2975} {"train_loss": -6.561129570007324, "global_step": 124985, "epoch": 2975} {"train_loss": -6.63823938369751, "global_step": 124986, "epoch": 2975} {"train_loss": -6.43297815322876, "global_step": 124987, "epoch": 2975} {"train_loss": -6.672618865966797, "global_step": 124988, "epoch": 2975} {"train_loss": -6.624566078186035, "global_step": 124989, "epoch": 2975} {"train_loss": -6.721350193023682, "global_step": 124990, "epoch": 2975} {"train_loss": -6.602321851821173, "global_step": 124991, "epoch": 2975, "val_loss": 77175.078125} {"train_loss": -6.642020225524902, "global_step": 124992, "epoch": 2976} {"train_loss": -6.669821739196777, "global_step": 124993, "epoch": 2976} {"train_loss": -6.617241859436035, "global_step": 124994, "epoch": 2976} {"train_loss": -6.639551162719727, "global_step": 124995, "epoch": 2976} {"train_loss": -6.694465637207031, "global_step": 124996, "epoch": 2976} {"train_loss": -6.674681663513184, "global_step": 124997, "epoch": 2976} {"train_loss": -6.722640037536621, "global_step": 124998, "epoch": 2976} {"train_loss": -6.672549247741699, "global_step": 124999, "epoch": 2976} {"train_loss": -6.685741424560547, "global_step": 125000, "epoch": 2976} {"train_loss": -6.576747417449951, "global_step": 125001, "epoch": 2976} {"train_loss": -6.6057024002075195, "global_step": 125002, "epoch": 2976} {"train_loss": -6.631167888641357, "global_step": 125003, "epoch": 2976} {"train_loss": -6.449273586273193, "global_step": 125004, "epoch": 2976} {"train_loss": -6.533138275146484, "global_step": 125005, "epoch": 2976} {"train_loss": -6.665688514709473, "global_step": 125006, "epoch": 2976} {"train_loss": -6.590479850769043, "global_step": 125007, "epoch": 2976} {"train_loss": -6.654903411865234, "global_step": 125008, "epoch": 2976} {"train_loss": -6.605973720550537, "global_step": 125009, "epoch": 2976} {"train_loss": -6.502625942230225, "global_step": 125010, "epoch": 2976} {"train_loss": -6.5782928466796875, "global_step": 125011, "epoch": 2976} {"train_loss": -6.582765579223633, "global_step": 125012, "epoch": 2976} {"train_loss": -6.587226390838623, "global_step": 125013, "epoch": 2976} {"train_loss": -6.700881004333496, "global_step": 125014, "epoch": 2976} {"train_loss": -6.551649570465088, "global_step": 125015, "epoch": 2976} {"train_loss": -6.552712440490723, "global_step": 125016, "epoch": 2976} {"train_loss": -6.517866134643555, "global_step": 125017, "epoch": 2976} {"train_loss": -6.523031711578369, "global_step": 125018, "epoch": 2976} {"train_loss": -6.561568260192871, "global_step": 125019, "epoch": 2976} {"train_loss": -6.497474670410156, "global_step": 125020, "epoch": 2976} {"train_loss": -6.659076690673828, "global_step": 125021, "epoch": 2976} {"train_loss": -6.522943019866943, "global_step": 125022, "epoch": 2976} {"train_loss": -6.5091118812561035, "global_step": 125023, "epoch": 2976} {"train_loss": -6.675220966339111, "global_step": 125024, "epoch": 2976} {"train_loss": -6.508940696716309, "global_step": 125025, "epoch": 2976} {"train_loss": -6.529613971710205, "global_step": 125026, "epoch": 2976} {"train_loss": -6.728369235992432, "global_step": 125027, "epoch": 2976} {"train_loss": -6.590986728668213, "global_step": 125028, "epoch": 2976} {"train_loss": -6.598880767822266, "global_step": 125029, "epoch": 2976} {"train_loss": -6.602389335632324, "global_step": 125030, "epoch": 2976} {"train_loss": -6.613016128540039, "global_step": 125031, "epoch": 2976} {"train_loss": -6.616911888122559, "global_step": 125032, "epoch": 2976} {"train_loss": -6.602402914138067, "global_step": 125033, "epoch": 2976, "val_loss": 77051.8125} {"train_loss": -6.623684406280518, "global_step": 125034, "epoch": 2977} {"train_loss": -6.679922103881836, "global_step": 125035, "epoch": 2977} {"train_loss": -6.682021141052246, "global_step": 125036, "epoch": 2977} {"train_loss": -6.582942485809326, "global_step": 125037, "epoch": 2977} {"train_loss": -6.724888801574707, "global_step": 125038, "epoch": 2977} {"train_loss": -6.567020416259766, "global_step": 125039, "epoch": 2977} {"train_loss": -6.607527732849121, "global_step": 125040, "epoch": 2977} {"train_loss": -6.595821857452393, "global_step": 125041, "epoch": 2977} {"train_loss": -6.582420349121094, "global_step": 125042, "epoch": 2977} {"train_loss": -6.578700542449951, "global_step": 125043, "epoch": 2977} {"train_loss": -6.590299129486084, "global_step": 125044, "epoch": 2977} {"train_loss": -6.540472984313965, "global_step": 125045, "epoch": 2977} {"train_loss": -6.522791862487793, "global_step": 125046, "epoch": 2977} {"train_loss": -6.542447566986084, "global_step": 125047, "epoch": 2977} {"train_loss": -6.651287078857422, "global_step": 125048, "epoch": 2977} {"train_loss": -6.5660905838012695, "global_step": 125049, "epoch": 2977} {"train_loss": -6.602898597717285, "global_step": 125050, "epoch": 2977} {"train_loss": -6.541166305541992, "global_step": 125051, "epoch": 2977} {"train_loss": -6.585307598114014, "global_step": 125052, "epoch": 2977} {"train_loss": -6.722369194030762, "global_step": 125053, "epoch": 2977} {"train_loss": -6.639323711395264, "global_step": 125054, "epoch": 2977} {"train_loss": -6.683539390563965, "global_step": 125055, "epoch": 2977} {"train_loss": -6.641421318054199, "global_step": 125056, "epoch": 2977} {"train_loss": -6.715921878814697, "global_step": 125057, "epoch": 2977} {"train_loss": -6.662156105041504, "global_step": 125058, "epoch": 2977} {"train_loss": -6.649304389953613, "global_step": 125059, "epoch": 2977} {"train_loss": -6.558177947998047, "global_step": 125060, "epoch": 2977} {"train_loss": -6.601339817047119, "global_step": 125061, "epoch": 2977} {"train_loss": -6.627987861633301, "global_step": 125062, "epoch": 2977} {"train_loss": -6.554043292999268, "global_step": 125063, "epoch": 2977} {"train_loss": -6.603366851806641, "global_step": 125064, "epoch": 2977} {"train_loss": -6.670698165893555, "global_step": 125065, "epoch": 2977} {"train_loss": -6.517390251159668, "global_step": 125066, "epoch": 2977} {"train_loss": -6.547269821166992, "global_step": 125067, "epoch": 2977} {"train_loss": -6.699084758758545, "global_step": 125068, "epoch": 2977} {"train_loss": -6.592695236206055, "global_step": 125069, "epoch": 2977} {"train_loss": -6.647065162658691, "global_step": 125070, "epoch": 2977} {"train_loss": -6.654678821563721, "global_step": 125071, "epoch": 2977} {"train_loss": -6.685312747955322, "global_step": 125072, "epoch": 2977} {"train_loss": -6.592597484588623, "global_step": 125073, "epoch": 2977} {"train_loss": -6.677128791809082, "global_step": 125074, "epoch": 2977} {"train_loss": -6.618674187433152, "global_step": 125075, "epoch": 2977, "val_loss": 77380.1484375} {"train_loss": -6.655417442321777, "global_step": 125076, "epoch": 2978} {"train_loss": -6.675877571105957, "global_step": 125077, "epoch": 2978} {"train_loss": -6.592525482177734, "global_step": 125078, "epoch": 2978} {"train_loss": -6.600929260253906, "global_step": 125079, "epoch": 2978} {"train_loss": -6.682433128356934, "global_step": 125080, "epoch": 2978} {"train_loss": -6.620350360870361, "global_step": 125081, "epoch": 2978} {"train_loss": -6.645652770996094, "global_step": 125082, "epoch": 2978} {"train_loss": -6.629965782165527, "global_step": 125083, "epoch": 2978} {"train_loss": -6.619760513305664, "global_step": 125084, "epoch": 2978} {"train_loss": -6.526425361633301, "global_step": 125085, "epoch": 2978} {"train_loss": -6.665329933166504, "global_step": 125086, "epoch": 2978} {"train_loss": -6.614080429077148, "global_step": 125087, "epoch": 2978} {"train_loss": -6.668099880218506, "global_step": 125088, "epoch": 2978} {"train_loss": -6.633973121643066, "global_step": 125089, "epoch": 2978} {"train_loss": -6.447290420532227, "global_step": 125090, "epoch": 2978} {"train_loss": -6.657105922698975, "global_step": 125091, "epoch": 2978} {"train_loss": -6.652710437774658, "global_step": 125092, "epoch": 2978} {"train_loss": -6.502197265625, "global_step": 125093, "epoch": 2978} {"train_loss": -6.5245466232299805, "global_step": 125094, "epoch": 2978} {"train_loss": -6.625329494476318, "global_step": 125095, "epoch": 2978} {"train_loss": -6.294244766235352, "global_step": 125096, "epoch": 2978} {"train_loss": -6.614429473876953, "global_step": 125097, "epoch": 2978} {"train_loss": -6.407904148101807, "global_step": 125098, "epoch": 2978} {"train_loss": -6.204716682434082, "global_step": 125099, "epoch": 2978} {"train_loss": -6.506027698516846, "global_step": 125100, "epoch": 2978} {"train_loss": -6.292448043823242, "global_step": 125101, "epoch": 2978} {"train_loss": -6.4161057472229, "global_step": 125102, "epoch": 2978} {"train_loss": -6.4011430740356445, "global_step": 125103, "epoch": 2978} {"train_loss": -6.491448402404785, "global_step": 125104, "epoch": 2978} {"train_loss": -6.353161811828613, "global_step": 125105, "epoch": 2978} {"train_loss": -6.5058770179748535, "global_step": 125106, "epoch": 2978} {"train_loss": -6.270464897155762, "global_step": 125107, "epoch": 2978} {"train_loss": -6.512287139892578, "global_step": 125108, "epoch": 2978} {"train_loss": -6.403693199157715, "global_step": 125109, "epoch": 2978} {"train_loss": -6.343742370605469, "global_step": 125110, "epoch": 2978} {"train_loss": -6.535077095031738, "global_step": 125111, "epoch": 2978} {"train_loss": -6.430176734924316, "global_step": 125112, "epoch": 2978} {"train_loss": -6.5176825523376465, "global_step": 125113, "epoch": 2978} {"train_loss": -6.537500858306885, "global_step": 125114, "epoch": 2978} {"train_loss": -6.4575324058532715, "global_step": 125115, "epoch": 2978} {"train_loss": -6.529458999633789, "global_step": 125116, "epoch": 2978} {"train_loss": -6.520083461488996, "global_step": 125117, "epoch": 2978, "val_loss": 77066.4375} {"train_loss": -6.524892807006836, "global_step": 125118, "epoch": 2979} {"train_loss": -6.522557258605957, "global_step": 125119, "epoch": 2979} {"train_loss": -6.608962059020996, "global_step": 125120, "epoch": 2979} {"train_loss": -6.527419090270996, "global_step": 125121, "epoch": 2979} {"train_loss": -6.564841270446777, "global_step": 125122, "epoch": 2979} {"train_loss": -6.670576095581055, "global_step": 125123, "epoch": 2979} {"train_loss": -6.664571762084961, "global_step": 125124, "epoch": 2979} {"train_loss": -6.648571491241455, "global_step": 125125, "epoch": 2979} {"train_loss": -6.64409065246582, "global_step": 125126, "epoch": 2979} {"train_loss": -6.644733428955078, "global_step": 125127, "epoch": 2979} {"train_loss": -6.646015167236328, "global_step": 125128, "epoch": 2979} {"train_loss": -6.665187835693359, "global_step": 125129, "epoch": 2979} {"train_loss": -6.62611722946167, "global_step": 125130, "epoch": 2979} {"train_loss": -6.733236312866211, "global_step": 125131, "epoch": 2979} {"train_loss": -6.509756088256836, "global_step": 125132, "epoch": 2979} {"train_loss": -6.608852863311768, "global_step": 125133, "epoch": 2979} {"train_loss": -6.637423515319824, "global_step": 125134, "epoch": 2979} {"train_loss": -6.540462493896484, "global_step": 125135, "epoch": 2979} {"train_loss": -6.6171674728393555, "global_step": 125136, "epoch": 2979} {"train_loss": -6.657400608062744, "global_step": 125137, "epoch": 2979} {"train_loss": -6.626579284667969, "global_step": 125138, "epoch": 2979} {"train_loss": -6.649999618530273, "global_step": 125139, "epoch": 2979} {"train_loss": -6.703327178955078, "global_step": 125140, "epoch": 2979} {"train_loss": -6.732325553894043, "global_step": 125141, "epoch": 2979} {"train_loss": -6.574182987213135, "global_step": 125142, "epoch": 2979} {"train_loss": -6.68087911605835, "global_step": 125143, "epoch": 2979} {"train_loss": -6.680165767669678, "global_step": 125144, "epoch": 2979} {"train_loss": -6.630849838256836, "global_step": 125145, "epoch": 2979} {"train_loss": -6.664554595947266, "global_step": 125146, "epoch": 2979} {"train_loss": -6.573966979980469, "global_step": 125147, "epoch": 2979} {"train_loss": -6.574530601501465, "global_step": 125148, "epoch": 2979} {"train_loss": -6.625176429748535, "global_step": 125149, "epoch": 2979} {"train_loss": -6.606295585632324, "global_step": 125150, "epoch": 2979} {"train_loss": -6.548303604125977, "global_step": 125151, "epoch": 2979} {"train_loss": -6.536208629608154, "global_step": 125152, "epoch": 2979} {"train_loss": -6.690731048583984, "global_step": 125153, "epoch": 2979} {"train_loss": -6.666477203369141, "global_step": 125154, "epoch": 2979} {"train_loss": -6.721135139465332, "global_step": 125155, "epoch": 2979} {"train_loss": -6.555149555206299, "global_step": 125156, "epoch": 2979} {"train_loss": -6.717338562011719, "global_step": 125157, "epoch": 2979} {"train_loss": -6.518492221832275, "global_step": 125158, "epoch": 2979} {"train_loss": -6.622039692742484, "global_step": 125159, "epoch": 2979, "val_loss": 77125.0} {"train_loss": -6.589455604553223, "global_step": 125160, "epoch": 2980} {"train_loss": -6.592927932739258, "global_step": 125161, "epoch": 2980} {"train_loss": -6.659876823425293, "global_step": 125162, "epoch": 2980} {"train_loss": -6.620497703552246, "global_step": 125163, "epoch": 2980} {"train_loss": -6.534916877746582, "global_step": 125164, "epoch": 2980} {"train_loss": -6.578351974487305, "global_step": 125165, "epoch": 2980} {"train_loss": -6.585445404052734, "global_step": 125166, "epoch": 2980} {"train_loss": -6.61391544342041, "global_step": 125167, "epoch": 2980} {"train_loss": -6.670605182647705, "global_step": 125168, "epoch": 2980} {"train_loss": -6.513846397399902, "global_step": 125169, "epoch": 2980} {"train_loss": -6.64174747467041, "global_step": 125170, "epoch": 2980} {"train_loss": -6.510991096496582, "global_step": 125171, "epoch": 2980} {"train_loss": -6.712237358093262, "global_step": 125172, "epoch": 2980} {"train_loss": -6.619077682495117, "global_step": 125173, "epoch": 2980} {"train_loss": -6.7096452713012695, "global_step": 125174, "epoch": 2980} {"train_loss": -6.6121954917907715, "global_step": 125175, "epoch": 2980} {"train_loss": -6.575277805328369, "global_step": 125176, "epoch": 2980} {"train_loss": -6.5479278564453125, "global_step": 125177, "epoch": 2980} {"train_loss": -6.612557888031006, "global_step": 125178, "epoch": 2980} {"train_loss": -6.6422529220581055, "global_step": 125179, "epoch": 2980} {"train_loss": -6.516529560089111, "global_step": 125180, "epoch": 2980} {"train_loss": -6.785898208618164, "global_step": 125181, "epoch": 2980} {"train_loss": -6.572690010070801, "global_step": 125182, "epoch": 2980} {"train_loss": -6.5570454597473145, "global_step": 125183, "epoch": 2980} {"train_loss": -6.506870269775391, "global_step": 125184, "epoch": 2980} {"train_loss": -6.633589267730713, "global_step": 125185, "epoch": 2980} {"train_loss": -6.6741485595703125, "global_step": 125186, "epoch": 2980} {"train_loss": -6.583600044250488, "global_step": 125187, "epoch": 2980} {"train_loss": -6.5314836502075195, "global_step": 125188, "epoch": 2980} {"train_loss": -6.593236923217773, "global_step": 125189, "epoch": 2980} {"train_loss": -6.507933616638184, "global_step": 125190, "epoch": 2980} {"train_loss": -6.669938087463379, "global_step": 125191, "epoch": 2980} {"train_loss": -6.354844570159912, "global_step": 125192, "epoch": 2980} {"train_loss": -6.488924026489258, "global_step": 125193, "epoch": 2980} {"train_loss": -6.432143688201904, "global_step": 125194, "epoch": 2980} {"train_loss": -6.4964919090271, "global_step": 125195, "epoch": 2980} {"train_loss": -6.590824127197266, "global_step": 125196, "epoch": 2980} {"train_loss": -6.522549629211426, "global_step": 125197, "epoch": 2980} {"train_loss": -6.610884666442871, "global_step": 125198, "epoch": 2980} {"train_loss": -6.543581008911133, "global_step": 125199, "epoch": 2980} {"train_loss": -6.562563896179199, "global_step": 125200, "epoch": 2980} {"train_loss": -6.579401617958432, "global_step": 125201, "epoch": 2980, "val_loss": 77109.2734375} {"train_loss": -6.633603096008301, "global_step": 125202, "epoch": 2981} {"train_loss": -6.467172622680664, "global_step": 125203, "epoch": 2981} {"train_loss": -6.693709850311279, "global_step": 125204, "epoch": 2981} {"train_loss": -6.622414588928223, "global_step": 125205, "epoch": 2981} {"train_loss": -6.514416694641113, "global_step": 125206, "epoch": 2981} {"train_loss": -6.4051513671875, "global_step": 125207, "epoch": 2981} {"train_loss": -6.543642044067383, "global_step": 125208, "epoch": 2981} {"train_loss": -6.654447078704834, "global_step": 125209, "epoch": 2981} {"train_loss": -6.664069175720215, "global_step": 125210, "epoch": 2981} {"train_loss": -6.706254005432129, "global_step": 125211, "epoch": 2981} {"train_loss": -6.480071067810059, "global_step": 125212, "epoch": 2981} {"train_loss": -6.638461112976074, "global_step": 125213, "epoch": 2981} {"train_loss": -6.542383670806885, "global_step": 125214, "epoch": 2981} {"train_loss": -6.566751003265381, "global_step": 125215, "epoch": 2981} {"train_loss": -6.5917205810546875, "global_step": 125216, "epoch": 2981} {"train_loss": -6.47613525390625, "global_step": 125217, "epoch": 2981} {"train_loss": -6.574751853942871, "global_step": 125218, "epoch": 2981} {"train_loss": -6.616416931152344, "global_step": 125219, "epoch": 2981} {"train_loss": -6.640472412109375, "global_step": 125220, "epoch": 2981} {"train_loss": -6.624332904815674, "global_step": 125221, "epoch": 2981} {"train_loss": -6.661681175231934, "global_step": 125222, "epoch": 2981} {"train_loss": -6.618506908416748, "global_step": 125223, "epoch": 2981} {"train_loss": -6.435839653015137, "global_step": 125224, "epoch": 2981} {"train_loss": -6.523312091827393, "global_step": 125225, "epoch": 2981} {"train_loss": -6.570259094238281, "global_step": 125226, "epoch": 2981} {"train_loss": -6.642153263092041, "global_step": 125227, "epoch": 2981} {"train_loss": -6.755553245544434, "global_step": 125228, "epoch": 2981} {"train_loss": -6.579411029815674, "global_step": 125229, "epoch": 2981} {"train_loss": -6.57985782623291, "global_step": 125230, "epoch": 2981} {"train_loss": -6.636045455932617, "global_step": 125231, "epoch": 2981} {"train_loss": -6.633205413818359, "global_step": 125232, "epoch": 2981} {"train_loss": -6.478766918182373, "global_step": 125233, "epoch": 2981} {"train_loss": -6.588229179382324, "global_step": 125234, "epoch": 2981} {"train_loss": -6.598820686340332, "global_step": 125235, "epoch": 2981} {"train_loss": -6.617399215698242, "global_step": 125236, "epoch": 2981} {"train_loss": -6.655954360961914, "global_step": 125237, "epoch": 2981} {"train_loss": -6.761295795440674, "global_step": 125238, "epoch": 2981} {"train_loss": -6.61099100112915, "global_step": 125239, "epoch": 2981} {"train_loss": -6.569221496582031, "global_step": 125240, "epoch": 2981} {"train_loss": -6.582197189331055, "global_step": 125241, "epoch": 2981} {"train_loss": -6.602049827575684, "global_step": 125242, "epoch": 2981} {"train_loss": -6.595786582855951, "global_step": 125243, "epoch": 2981, "val_loss": 77196.4140625} {"train_loss": -6.627826690673828, "global_step": 125244, "epoch": 2982} {"train_loss": -6.703393459320068, "global_step": 125245, "epoch": 2982} {"train_loss": -6.642858505249023, "global_step": 125246, "epoch": 2982} {"train_loss": -6.639164924621582, "global_step": 125247, "epoch": 2982} {"train_loss": -6.710163116455078, "global_step": 125248, "epoch": 2982} {"train_loss": -6.619784832000732, "global_step": 125249, "epoch": 2982} {"train_loss": -6.568155765533447, "global_step": 125250, "epoch": 2982} {"train_loss": -6.568757057189941, "global_step": 125251, "epoch": 2982} {"train_loss": -6.6250505447387695, "global_step": 125252, "epoch": 2982} {"train_loss": -6.535965442657471, "global_step": 125253, "epoch": 2982} {"train_loss": -6.617692947387695, "global_step": 125254, "epoch": 2982} {"train_loss": -6.61287260055542, "global_step": 125255, "epoch": 2982} {"train_loss": -6.581603050231934, "global_step": 125256, "epoch": 2982} {"train_loss": -6.714768409729004, "global_step": 125257, "epoch": 2982} {"train_loss": -6.6762590408325195, "global_step": 125258, "epoch": 2982} {"train_loss": -6.682882308959961, "global_step": 125259, "epoch": 2982} {"train_loss": -6.632894039154053, "global_step": 125260, "epoch": 2982} {"train_loss": -6.725912570953369, "global_step": 125261, "epoch": 2982} {"train_loss": -6.644684791564941, "global_step": 125262, "epoch": 2982} {"train_loss": -6.6522674560546875, "global_step": 125263, "epoch": 2982} {"train_loss": -6.691851615905762, "global_step": 125264, "epoch": 2982} {"train_loss": -6.599408149719238, "global_step": 125265, "epoch": 2982} {"train_loss": -6.530298233032227, "global_step": 125266, "epoch": 2982} {"train_loss": -6.784473896026611, "global_step": 125267, "epoch": 2982} {"train_loss": -6.62135648727417, "global_step": 125268, "epoch": 2982} {"train_loss": -6.64642333984375, "global_step": 125269, "epoch": 2982} {"train_loss": -6.656320095062256, "global_step": 125270, "epoch": 2982} {"train_loss": -6.7366437911987305, "global_step": 125271, "epoch": 2982} {"train_loss": -6.712874412536621, "global_step": 125272, "epoch": 2982} {"train_loss": -6.631165504455566, "global_step": 125273, "epoch": 2982} {"train_loss": -6.682901859283447, "global_step": 125274, "epoch": 2982} {"train_loss": -6.676586151123047, "global_step": 125275, "epoch": 2982} {"train_loss": -6.658840656280518, "global_step": 125276, "epoch": 2982} {"train_loss": -6.655918598175049, "global_step": 125277, "epoch": 2982} {"train_loss": -6.617615699768066, "global_step": 125278, "epoch": 2982} {"train_loss": -6.581674098968506, "global_step": 125279, "epoch": 2982} {"train_loss": -6.666944980621338, "global_step": 125280, "epoch": 2982} {"train_loss": -6.515885829925537, "global_step": 125281, "epoch": 2982} {"train_loss": -6.632292747497559, "global_step": 125282, "epoch": 2982} {"train_loss": -6.676867485046387, "global_step": 125283, "epoch": 2982} {"train_loss": -6.650601387023926, "global_step": 125284, "epoch": 2982} {"train_loss": -6.6419542744046165, "global_step": 125285, "epoch": 2982, "val_loss": 77133.0078125} {"train_loss": -6.626920700073242, "global_step": 125286, "epoch": 2983} {"train_loss": -6.479485034942627, "global_step": 125287, "epoch": 2983} {"train_loss": -6.627739429473877, "global_step": 125288, "epoch": 2983} {"train_loss": -6.631071090698242, "global_step": 125289, "epoch": 2983} {"train_loss": -6.609803676605225, "global_step": 125290, "epoch": 2983} {"train_loss": -6.638985633850098, "global_step": 125291, "epoch": 2983} {"train_loss": -6.602558135986328, "global_step": 125292, "epoch": 2983} {"train_loss": -6.588254451751709, "global_step": 125293, "epoch": 2983} {"train_loss": -6.660306930541992, "global_step": 125294, "epoch": 2983} {"train_loss": -6.732385635375977, "global_step": 125295, "epoch": 2983} {"train_loss": -6.732762336730957, "global_step": 125296, "epoch": 2983} {"train_loss": -6.6359076499938965, "global_step": 125297, "epoch": 2983} {"train_loss": -6.651638031005859, "global_step": 125298, "epoch": 2983} {"train_loss": -6.673803329467773, "global_step": 125299, "epoch": 2983} {"train_loss": -6.734703063964844, "global_step": 125300, "epoch": 2983} {"train_loss": -6.689277648925781, "global_step": 125301, "epoch": 2983} {"train_loss": -6.640624523162842, "global_step": 125302, "epoch": 2983} {"train_loss": -6.569133281707764, "global_step": 125303, "epoch": 2983} {"train_loss": -6.57731294631958, "global_step": 125304, "epoch": 2983} {"train_loss": -6.7510986328125, "global_step": 125305, "epoch": 2983} {"train_loss": -6.51479959487915, "global_step": 125306, "epoch": 2983} {"train_loss": -6.578617095947266, "global_step": 125307, "epoch": 2983} {"train_loss": -6.673147201538086, "global_step": 125308, "epoch": 2983} {"train_loss": -6.511534690856934, "global_step": 125309, "epoch": 2983} {"train_loss": -6.574826240539551, "global_step": 125310, "epoch": 2983} {"train_loss": -6.514915466308594, "global_step": 125311, "epoch": 2983} {"train_loss": -6.541266441345215, "global_step": 125312, "epoch": 2983} {"train_loss": -6.544846057891846, "global_step": 125313, "epoch": 2983} {"train_loss": -6.551203727722168, "global_step": 125314, "epoch": 2983} {"train_loss": -6.490439414978027, "global_step": 125315, "epoch": 2983} {"train_loss": -6.494615077972412, "global_step": 125316, "epoch": 2983} {"train_loss": -6.399654865264893, "global_step": 125317, "epoch": 2983} {"train_loss": -6.6003522872924805, "global_step": 125318, "epoch": 2983} {"train_loss": -6.462405681610107, "global_step": 125319, "epoch": 2983} {"train_loss": -6.575011730194092, "global_step": 125320, "epoch": 2983} {"train_loss": -6.487545490264893, "global_step": 125321, "epoch": 2983} {"train_loss": -6.595341682434082, "global_step": 125322, "epoch": 2983} {"train_loss": -6.487337112426758, "global_step": 125323, "epoch": 2983} {"train_loss": -6.551668167114258, "global_step": 125324, "epoch": 2983} {"train_loss": -6.458215713500977, "global_step": 125325, "epoch": 2983} {"train_loss": -6.468387126922607, "global_step": 125326, "epoch": 2983} {"train_loss": -6.5791072731926326, "global_step": 125327, "epoch": 2983, "val_loss": 77285.3828125} {"train_loss": -6.542532920837402, "global_step": 125328, "epoch": 2984} {"train_loss": -6.507826805114746, "global_step": 125329, "epoch": 2984} {"train_loss": -6.589560508728027, "global_step": 125330, "epoch": 2984} {"train_loss": -6.514275550842285, "global_step": 125331, "epoch": 2984} {"train_loss": -6.480810642242432, "global_step": 125332, "epoch": 2984} {"train_loss": -6.623082160949707, "global_step": 125333, "epoch": 2984} {"train_loss": -6.625446319580078, "global_step": 125334, "epoch": 2984} {"train_loss": -6.5637407302856445, "global_step": 125335, "epoch": 2984} {"train_loss": -6.532104015350342, "global_step": 125336, "epoch": 2984} {"train_loss": -6.664094924926758, "global_step": 125337, "epoch": 2984} {"train_loss": -6.518440246582031, "global_step": 125338, "epoch": 2984} {"train_loss": -6.589134216308594, "global_step": 125339, "epoch": 2984} {"train_loss": -6.593148231506348, "global_step": 125340, "epoch": 2984} {"train_loss": -6.551602363586426, "global_step": 125341, "epoch": 2984} {"train_loss": -6.629528999328613, "global_step": 125342, "epoch": 2984} {"train_loss": -6.606802940368652, "global_step": 125343, "epoch": 2984} {"train_loss": -6.518700122833252, "global_step": 125344, "epoch": 2984} {"train_loss": -6.637656211853027, "global_step": 125345, "epoch": 2984} {"train_loss": -6.593631744384766, "global_step": 125346, "epoch": 2984} {"train_loss": -6.545589923858643, "global_step": 125347, "epoch": 2984} {"train_loss": -6.645370006561279, "global_step": 125348, "epoch": 2984} {"train_loss": -6.686410903930664, "global_step": 125349, "epoch": 2984} {"train_loss": -6.611957550048828, "global_step": 125350, "epoch": 2984} {"train_loss": -6.509294509887695, "global_step": 125351, "epoch": 2984} {"train_loss": -6.713387966156006, "global_step": 125352, "epoch": 2984} {"train_loss": -6.679024696350098, "global_step": 125353, "epoch": 2984} {"train_loss": -6.604062080383301, "global_step": 125354, "epoch": 2984} {"train_loss": -6.613118648529053, "global_step": 125355, "epoch": 2984} {"train_loss": -6.666155815124512, "global_step": 125356, "epoch": 2984} {"train_loss": -6.654488563537598, "global_step": 125357, "epoch": 2984} {"train_loss": -6.59909200668335, "global_step": 125358, "epoch": 2984} {"train_loss": -6.691432952880859, "global_step": 125359, "epoch": 2984} {"train_loss": -6.6238932609558105, "global_step": 125360, "epoch": 2984} {"train_loss": -6.641335964202881, "global_step": 125361, "epoch": 2984} {"train_loss": -6.67030668258667, "global_step": 125362, "epoch": 2984} {"train_loss": -6.694120407104492, "global_step": 125363, "epoch": 2984} {"train_loss": -6.629246234893799, "global_step": 125364, "epoch": 2984} {"train_loss": -6.710349082946777, "global_step": 125365, "epoch": 2984} {"train_loss": -6.6466474533081055, "global_step": 125366, "epoch": 2984} {"train_loss": -6.68430233001709, "global_step": 125367, "epoch": 2984} {"train_loss": -6.597317218780518, "global_step": 125368, "epoch": 2984} {"train_loss": -6.61023473739624, "global_step": 125369, "epoch": 2984, "val_loss": 77139.2734375} {"train_loss": -6.658621788024902, "global_step": 125370, "epoch": 2985} {"train_loss": -6.719689846038818, "global_step": 125371, "epoch": 2985} {"train_loss": -6.694342136383057, "global_step": 125372, "epoch": 2985} {"train_loss": -6.513665676116943, "global_step": 125373, "epoch": 2985} {"train_loss": -6.604828834533691, "global_step": 125374, "epoch": 2985} {"train_loss": -6.577817916870117, "global_step": 125375, "epoch": 2985} {"train_loss": -6.633278846740723, "global_step": 125376, "epoch": 2985} {"train_loss": -6.6669921875, "global_step": 125377, "epoch": 2985} {"train_loss": -6.746559143066406, "global_step": 125378, "epoch": 2985} {"train_loss": -6.682216644287109, "global_step": 125379, "epoch": 2985} {"train_loss": -6.734389305114746, "global_step": 125380, "epoch": 2985} {"train_loss": -6.563142776489258, "global_step": 125381, "epoch": 2985} {"train_loss": -6.639308452606201, "global_step": 125382, "epoch": 2985} {"train_loss": -6.658750534057617, "global_step": 125383, "epoch": 2985} {"train_loss": -6.665813446044922, "global_step": 125384, "epoch": 2985} {"train_loss": -6.539546489715576, "global_step": 125385, "epoch": 2985} {"train_loss": -6.697490215301514, "global_step": 125386, "epoch": 2985} {"train_loss": -6.584323883056641, "global_step": 125387, "epoch": 2985} {"train_loss": -6.570879936218262, "global_step": 125388, "epoch": 2985} {"train_loss": -6.663061141967773, "global_step": 125389, "epoch": 2985} {"train_loss": -6.708235740661621, "global_step": 125390, "epoch": 2985} {"train_loss": -6.683905601501465, "global_step": 125391, "epoch": 2985} {"train_loss": -6.6403398513793945, "global_step": 125392, "epoch": 2985} {"train_loss": -6.6351423263549805, "global_step": 125393, "epoch": 2985} {"train_loss": -6.7427496910095215, "global_step": 125394, "epoch": 2985} {"train_loss": -6.584310054779053, "global_step": 125395, "epoch": 2985} {"train_loss": -6.705698013305664, "global_step": 125396, "epoch": 2985} {"train_loss": -6.570858001708984, "global_step": 125397, "epoch": 2985} {"train_loss": -6.641929626464844, "global_step": 125398, "epoch": 2985} {"train_loss": -6.679630279541016, "global_step": 125399, "epoch": 2985} {"train_loss": -6.65640115737915, "global_step": 125400, "epoch": 2985} {"train_loss": -6.695549011230469, "global_step": 125401, "epoch": 2985} {"train_loss": -6.559427738189697, "global_step": 125402, "epoch": 2985} {"train_loss": -6.6648101806640625, "global_step": 125403, "epoch": 2985} {"train_loss": -6.5489912033081055, "global_step": 125404, "epoch": 2985} {"train_loss": -6.678101539611816, "global_step": 125405, "epoch": 2985} {"train_loss": -6.662898063659668, "global_step": 125406, "epoch": 2985} {"train_loss": -6.5398101806640625, "global_step": 125407, "epoch": 2985} {"train_loss": -6.65935754776001, "global_step": 125408, "epoch": 2985} {"train_loss": -6.675442695617676, "global_step": 125409, "epoch": 2985} {"train_loss": -6.622832298278809, "global_step": 125410, "epoch": 2985} {"train_loss": -6.640002296084449, "global_step": 125411, "epoch": 2985, "val_loss": 76947.671875} {"train_loss": -6.679978370666504, "global_step": 125412, "epoch": 2986} {"train_loss": -6.592441082000732, "global_step": 125413, "epoch": 2986} {"train_loss": -6.658158779144287, "global_step": 125414, "epoch": 2986} {"train_loss": -6.6335344314575195, "global_step": 125415, "epoch": 2986} {"train_loss": -6.572453498840332, "global_step": 125416, "epoch": 2986} {"train_loss": -6.764378547668457, "global_step": 125417, "epoch": 2986} {"train_loss": -6.657207489013672, "global_step": 125418, "epoch": 2986} {"train_loss": -6.68257474899292, "global_step": 125419, "epoch": 2986} {"train_loss": -6.63721227645874, "global_step": 125420, "epoch": 2986} {"train_loss": -6.575691223144531, "global_step": 125421, "epoch": 2986} {"train_loss": -6.621010780334473, "global_step": 125422, "epoch": 2986} {"train_loss": -6.6681671142578125, "global_step": 125423, "epoch": 2986} {"train_loss": -6.535137176513672, "global_step": 125424, "epoch": 2986} {"train_loss": -6.685690879821777, "global_step": 125425, "epoch": 2986} {"train_loss": -6.706259727478027, "global_step": 125426, "epoch": 2986} {"train_loss": -6.610897064208984, "global_step": 125427, "epoch": 2986} {"train_loss": -6.669291019439697, "global_step": 125428, "epoch": 2986} {"train_loss": -6.607343673706055, "global_step": 125429, "epoch": 2986} {"train_loss": -6.696634292602539, "global_step": 125430, "epoch": 2986} {"train_loss": -6.683506011962891, "global_step": 125431, "epoch": 2986} {"train_loss": -6.698134899139404, "global_step": 125432, "epoch": 2986} {"train_loss": -6.563473224639893, "global_step": 125433, "epoch": 2986} {"train_loss": -6.579438209533691, "global_step": 125434, "epoch": 2986} {"train_loss": -6.680850982666016, "global_step": 125435, "epoch": 2986} {"train_loss": -6.683664798736572, "global_step": 125436, "epoch": 2986} {"train_loss": -6.681210517883301, "global_step": 125437, "epoch": 2986} {"train_loss": -6.64981746673584, "global_step": 125438, "epoch": 2986} {"train_loss": -6.5415120124816895, "global_step": 125439, "epoch": 2986} {"train_loss": -6.685068130493164, "global_step": 125440, "epoch": 2986} {"train_loss": -6.683040618896484, "global_step": 125441, "epoch": 2986} {"train_loss": -6.745933532714844, "global_step": 125442, "epoch": 2986} {"train_loss": -6.659873962402344, "global_step": 125443, "epoch": 2986} {"train_loss": -6.541494846343994, "global_step": 125444, "epoch": 2986} {"train_loss": -6.598245620727539, "global_step": 125445, "epoch": 2986} {"train_loss": -6.595164775848389, "global_step": 125446, "epoch": 2986} {"train_loss": -6.650877952575684, "global_step": 125447, "epoch": 2986} {"train_loss": -6.536696910858154, "global_step": 125448, "epoch": 2986} {"train_loss": -6.652878284454346, "global_step": 125449, "epoch": 2986} {"train_loss": -6.6791887283325195, "global_step": 125450, "epoch": 2986} {"train_loss": -6.643612384796143, "global_step": 125451, "epoch": 2986} {"train_loss": -6.732323169708252, "global_step": 125452, "epoch": 2986} {"train_loss": -6.645195188976469, "global_step": 125453, "epoch": 2986, "val_loss": 77213.6875} {"train_loss": -6.604691982269287, "global_step": 125454, "epoch": 2987} {"train_loss": -6.684310436248779, "global_step": 125455, "epoch": 2987} {"train_loss": -6.470348358154297, "global_step": 125456, "epoch": 2987} {"train_loss": -6.6695990562438965, "global_step": 125457, "epoch": 2987} {"train_loss": -6.633607864379883, "global_step": 125458, "epoch": 2987} {"train_loss": -6.690485000610352, "global_step": 125459, "epoch": 2987} {"train_loss": -6.670849800109863, "global_step": 125460, "epoch": 2987} {"train_loss": -6.794863700866699, "global_step": 125461, "epoch": 2987} {"train_loss": -6.740176677703857, "global_step": 125462, "epoch": 2987} {"train_loss": -6.550789833068848, "global_step": 125463, "epoch": 2987} {"train_loss": -6.589384078979492, "global_step": 125464, "epoch": 2987} {"train_loss": -6.599607467651367, "global_step": 125465, "epoch": 2987} {"train_loss": -6.681992530822754, "global_step": 125466, "epoch": 2987} {"train_loss": -6.577143669128418, "global_step": 125467, "epoch": 2987} {"train_loss": -6.593988418579102, "global_step": 125468, "epoch": 2987} {"train_loss": -6.6192097663879395, "global_step": 125469, "epoch": 2987} {"train_loss": -6.68526029586792, "global_step": 125470, "epoch": 2987} {"train_loss": -6.530834197998047, "global_step": 125471, "epoch": 2987} {"train_loss": -6.5340576171875, "global_step": 125472, "epoch": 2987} {"train_loss": -6.6636762619018555, "global_step": 125473, "epoch": 2987} {"train_loss": -6.697214603424072, "global_step": 125474, "epoch": 2987} {"train_loss": -6.5637431144714355, "global_step": 125475, "epoch": 2987} {"train_loss": -6.527240753173828, "global_step": 125476, "epoch": 2987} {"train_loss": -6.617433547973633, "global_step": 125477, "epoch": 2987} {"train_loss": -6.526002883911133, "global_step": 125478, "epoch": 2987} {"train_loss": -6.449236869812012, "global_step": 125479, "epoch": 2987} {"train_loss": -6.561626434326172, "global_step": 125480, "epoch": 2987} {"train_loss": -6.499213218688965, "global_step": 125481, "epoch": 2987} {"train_loss": -6.563699722290039, "global_step": 125482, "epoch": 2987} {"train_loss": -6.526611328125, "global_step": 125483, "epoch": 2987} {"train_loss": -6.514250755310059, "global_step": 125484, "epoch": 2987} {"train_loss": -6.59168815612793, "global_step": 125485, "epoch": 2987} {"train_loss": -6.425779342651367, "global_step": 125486, "epoch": 2987} {"train_loss": -6.540472984313965, "global_step": 125487, "epoch": 2987} {"train_loss": -6.522897720336914, "global_step": 125488, "epoch": 2987} {"train_loss": -6.694272994995117, "global_step": 125489, "epoch": 2987} {"train_loss": -6.677609443664551, "global_step": 125490, "epoch": 2987} {"train_loss": -6.598518371582031, "global_step": 125491, "epoch": 2987} {"train_loss": -6.551542282104492, "global_step": 125492, "epoch": 2987} {"train_loss": -6.591763019561768, "global_step": 125493, "epoch": 2987} {"train_loss": -6.707918167114258, "global_step": 125494, "epoch": 2987} {"train_loss": -6.599949791317894, "global_step": 125495, "epoch": 2987, "val_loss": 77360.640625} {"train_loss": -6.563531875610352, "global_step": 125496, "epoch": 2988} {"train_loss": -6.65999698638916, "global_step": 125497, "epoch": 2988} {"train_loss": -6.512366771697998, "global_step": 125498, "epoch": 2988} {"train_loss": -6.534241676330566, "global_step": 125499, "epoch": 2988} {"train_loss": -6.635188102722168, "global_step": 125500, "epoch": 2988} {"train_loss": -6.598215103149414, "global_step": 125501, "epoch": 2988} {"train_loss": -6.661569595336914, "global_step": 125502, "epoch": 2988} {"train_loss": -6.613314628601074, "global_step": 125503, "epoch": 2988} {"train_loss": -6.63533878326416, "global_step": 125504, "epoch": 2988} {"train_loss": -6.548852920532227, "global_step": 125505, "epoch": 2988} {"train_loss": -6.532858848571777, "global_step": 125506, "epoch": 2988} {"train_loss": -6.599606513977051, "global_step": 125507, "epoch": 2988} {"train_loss": -6.558952331542969, "global_step": 125508, "epoch": 2988} {"train_loss": -6.58474063873291, "global_step": 125509, "epoch": 2988} {"train_loss": -6.629266262054443, "global_step": 125510, "epoch": 2988} {"train_loss": -6.478569984436035, "global_step": 125511, "epoch": 2988} {"train_loss": -6.69162130355835, "global_step": 125512, "epoch": 2988} {"train_loss": -6.596218109130859, "global_step": 125513, "epoch": 2988} {"train_loss": -6.513718605041504, "global_step": 125514, "epoch": 2988} {"train_loss": -6.596931457519531, "global_step": 125515, "epoch": 2988} {"train_loss": -6.537867069244385, "global_step": 125516, "epoch": 2988} {"train_loss": -6.646995544433594, "global_step": 125517, "epoch": 2988} {"train_loss": -6.548139572143555, "global_step": 125518, "epoch": 2988} {"train_loss": -6.547155857086182, "global_step": 125519, "epoch": 2988} {"train_loss": -6.516635894775391, "global_step": 125520, "epoch": 2988} {"train_loss": -6.592698097229004, "global_step": 125521, "epoch": 2988} {"train_loss": -6.59221887588501, "global_step": 125522, "epoch": 2988} {"train_loss": -6.551139831542969, "global_step": 125523, "epoch": 2988} {"train_loss": -6.603030204772949, "global_step": 125524, "epoch": 2988} {"train_loss": -6.557934284210205, "global_step": 125525, "epoch": 2988} {"train_loss": -6.41070556640625, "global_step": 125526, "epoch": 2988} {"train_loss": -6.659942150115967, "global_step": 125527, "epoch": 2988} {"train_loss": -6.621153831481934, "global_step": 125528, "epoch": 2988} {"train_loss": -6.523063659667969, "global_step": 125529, "epoch": 2988} {"train_loss": -6.627400875091553, "global_step": 125530, "epoch": 2988} {"train_loss": -6.518453598022461, "global_step": 125531, "epoch": 2988} {"train_loss": -6.610675811767578, "global_step": 125532, "epoch": 2988} {"train_loss": -6.642387390136719, "global_step": 125533, "epoch": 2988} {"train_loss": -6.571746826171875, "global_step": 125534, "epoch": 2988} {"train_loss": -6.600951194763184, "global_step": 125535, "epoch": 2988} {"train_loss": -6.6019744873046875, "global_step": 125536, "epoch": 2988} {"train_loss": -6.579332873934791, "global_step": 125537, "epoch": 2988, "val_loss": 77208.65625} {"train_loss": -6.718679428100586, "global_step": 125538, "epoch": 2989} {"train_loss": -6.716283798217773, "global_step": 125539, "epoch": 2989} {"train_loss": -6.6871514320373535, "global_step": 125540, "epoch": 2989} {"train_loss": -6.519674301147461, "global_step": 125541, "epoch": 2989} {"train_loss": -6.624452590942383, "global_step": 125542, "epoch": 2989} {"train_loss": -6.566323757171631, "global_step": 125543, "epoch": 2989} {"train_loss": -6.692371845245361, "global_step": 125544, "epoch": 2989} {"train_loss": -6.68110466003418, "global_step": 125545, "epoch": 2989} {"train_loss": -6.718143939971924, "global_step": 125546, "epoch": 2989} {"train_loss": -6.652254104614258, "global_step": 125547, "epoch": 2989} {"train_loss": -6.565046310424805, "global_step": 125548, "epoch": 2989} {"train_loss": -6.677366256713867, "global_step": 125549, "epoch": 2989} {"train_loss": -6.6826324462890625, "global_step": 125550, "epoch": 2989} {"train_loss": -6.594267845153809, "global_step": 125551, "epoch": 2989} {"train_loss": -6.521712303161621, "global_step": 125552, "epoch": 2989} {"train_loss": -6.660863399505615, "global_step": 125553, "epoch": 2989} {"train_loss": -6.681978225708008, "global_step": 125554, "epoch": 2989} {"train_loss": -6.6454315185546875, "global_step": 125555, "epoch": 2989} {"train_loss": -6.6827850341796875, "global_step": 125556, "epoch": 2989} {"train_loss": -6.590662002563477, "global_step": 125557, "epoch": 2989} {"train_loss": -6.676853179931641, "global_step": 125558, "epoch": 2989} {"train_loss": -6.562931060791016, "global_step": 125559, "epoch": 2989} {"train_loss": -6.643643856048584, "global_step": 125560, "epoch": 2989} {"train_loss": -6.683200836181641, "global_step": 125561, "epoch": 2989} {"train_loss": -6.453569412231445, "global_step": 125562, "epoch": 2989} {"train_loss": -6.57565450668335, "global_step": 125563, "epoch": 2989} {"train_loss": -6.594760894775391, "global_step": 125564, "epoch": 2989} {"train_loss": -6.620510578155518, "global_step": 125565, "epoch": 2989} {"train_loss": -6.562612056732178, "global_step": 125566, "epoch": 2989} {"train_loss": -6.569910526275635, "global_step": 125567, "epoch": 2989} {"train_loss": -6.600266456604004, "global_step": 125568, "epoch": 2989} {"train_loss": -6.657581329345703, "global_step": 125569, "epoch": 2989} {"train_loss": -6.6404805183410645, "global_step": 125570, "epoch": 2989} {"train_loss": -6.570818901062012, "global_step": 125571, "epoch": 2989} {"train_loss": -6.621252536773682, "global_step": 125572, "epoch": 2989} {"train_loss": -6.733011245727539, "global_step": 125573, "epoch": 2989} {"train_loss": -6.6705522537231445, "global_step": 125574, "epoch": 2989} {"train_loss": -6.599099159240723, "global_step": 125575, "epoch": 2989} {"train_loss": -6.6257781982421875, "global_step": 125576, "epoch": 2989} {"train_loss": -6.66371488571167, "global_step": 125577, "epoch": 2989} {"train_loss": -6.655067443847656, "global_step": 125578, "epoch": 2989} {"train_loss": -6.6305432206108454, "global_step": 125579, "epoch": 2989, "val_loss": 77249.5390625} {"train_loss": -6.747030258178711, "global_step": 125580, "epoch": 2990} {"train_loss": -6.626899719238281, "global_step": 125581, "epoch": 2990} {"train_loss": -6.658312797546387, "global_step": 125582, "epoch": 2990} {"train_loss": -6.683724403381348, "global_step": 125583, "epoch": 2990} {"train_loss": -6.724437236785889, "global_step": 125584, "epoch": 2990} {"train_loss": -6.606165885925293, "global_step": 125585, "epoch": 2990} {"train_loss": -6.658633708953857, "global_step": 125586, "epoch": 2990} {"train_loss": -6.663904666900635, "global_step": 125587, "epoch": 2990} {"train_loss": -6.583456039428711, "global_step": 125588, "epoch": 2990} {"train_loss": -6.640830039978027, "global_step": 125589, "epoch": 2990} {"train_loss": -6.654348373413086, "global_step": 125590, "epoch": 2990} {"train_loss": -6.612353801727295, "global_step": 125591, "epoch": 2990} {"train_loss": -6.661349296569824, "global_step": 125592, "epoch": 2990} {"train_loss": -6.512150764465332, "global_step": 125593, "epoch": 2990} {"train_loss": -6.533182621002197, "global_step": 125594, "epoch": 2990} {"train_loss": -6.67464542388916, "global_step": 125595, "epoch": 2990} {"train_loss": -6.671538352966309, "global_step": 125596, "epoch": 2990} {"train_loss": -6.72737455368042, "global_step": 125597, "epoch": 2990} {"train_loss": -6.772190093994141, "global_step": 125598, "epoch": 2990} {"train_loss": -6.566831111907959, "global_step": 125599, "epoch": 2990} {"train_loss": -6.562591552734375, "global_step": 125600, "epoch": 2990} {"train_loss": -6.620449066162109, "global_step": 125601, "epoch": 2990} {"train_loss": -6.668710708618164, "global_step": 125602, "epoch": 2990} {"train_loss": -6.562014579772949, "global_step": 125603, "epoch": 2990} {"train_loss": -6.632221698760986, "global_step": 125604, "epoch": 2990} {"train_loss": -6.529903411865234, "global_step": 125605, "epoch": 2990} {"train_loss": -6.661210536956787, "global_step": 125606, "epoch": 2990} {"train_loss": -6.627026081085205, "global_step": 125607, "epoch": 2990} {"train_loss": -6.524003505706787, "global_step": 125608, "epoch": 2990} {"train_loss": -6.572092533111572, "global_step": 125609, "epoch": 2990} {"train_loss": -6.574493408203125, "global_step": 125610, "epoch": 2990} {"train_loss": -6.585030555725098, "global_step": 125611, "epoch": 2990} {"train_loss": -6.739050388336182, "global_step": 125612, "epoch": 2990} {"train_loss": -6.488883018493652, "global_step": 125613, "epoch": 2990} {"train_loss": -6.566841125488281, "global_step": 125614, "epoch": 2990} {"train_loss": -6.524872303009033, "global_step": 125615, "epoch": 2990} {"train_loss": -6.577498912811279, "global_step": 125616, "epoch": 2990} {"train_loss": -6.478639125823975, "global_step": 125617, "epoch": 2990} {"train_loss": -6.603724002838135, "global_step": 125618, "epoch": 2990} {"train_loss": -6.502527236938477, "global_step": 125619, "epoch": 2990} {"train_loss": -6.595756530761719, "global_step": 125620, "epoch": 2990} {"train_loss": -6.6128180708204, "global_step": 125621, "epoch": 2990, "val_loss": 77318.0078125} {"train_loss": -6.5277509689331055, "global_step": 125622, "epoch": 2991} {"train_loss": -6.545001983642578, "global_step": 125623, "epoch": 2991} {"train_loss": -6.462334632873535, "global_step": 125624, "epoch": 2991} {"train_loss": -6.524213790893555, "global_step": 125625, "epoch": 2991} {"train_loss": -6.392163276672363, "global_step": 125626, "epoch": 2991} {"train_loss": -6.596782684326172, "global_step": 125627, "epoch": 2991} {"train_loss": -6.484129905700684, "global_step": 125628, "epoch": 2991} {"train_loss": -6.452762603759766, "global_step": 125629, "epoch": 2991} {"train_loss": -6.4378743171691895, "global_step": 125630, "epoch": 2991} {"train_loss": -6.428739547729492, "global_step": 125631, "epoch": 2991} {"train_loss": -6.586432933807373, "global_step": 125632, "epoch": 2991} {"train_loss": -6.541464328765869, "global_step": 125633, "epoch": 2991} {"train_loss": -6.62331485748291, "global_step": 125634, "epoch": 2991} {"train_loss": -6.462774276733398, "global_step": 125635, "epoch": 2991} {"train_loss": -6.642962455749512, "global_step": 125636, "epoch": 2991} {"train_loss": -6.532378196716309, "global_step": 125637, "epoch": 2991} {"train_loss": -6.719788551330566, "global_step": 125638, "epoch": 2991} {"train_loss": -6.663203239440918, "global_step": 125639, "epoch": 2991} {"train_loss": -6.689418315887451, "global_step": 125640, "epoch": 2991} {"train_loss": -6.702449321746826, "global_step": 125641, "epoch": 2991} {"train_loss": -6.482914924621582, "global_step": 125642, "epoch": 2991} {"train_loss": -6.650261878967285, "global_step": 125643, "epoch": 2991} {"train_loss": -6.6298370361328125, "global_step": 125644, "epoch": 2991} {"train_loss": -6.573103904724121, "global_step": 125645, "epoch": 2991} {"train_loss": -6.666817665100098, "global_step": 125646, "epoch": 2991} {"train_loss": -6.701328277587891, "global_step": 125647, "epoch": 2991} {"train_loss": -6.727792739868164, "global_step": 125648, "epoch": 2991} {"train_loss": -6.638819694519043, "global_step": 125649, "epoch": 2991} {"train_loss": -6.615429878234863, "global_step": 125650, "epoch": 2991} {"train_loss": -6.718099594116211, "global_step": 125651, "epoch": 2991} {"train_loss": -6.61595344543457, "global_step": 125652, "epoch": 2991} {"train_loss": -6.602484703063965, "global_step": 125653, "epoch": 2991} {"train_loss": -6.6013946533203125, "global_step": 125654, "epoch": 2991} {"train_loss": -6.555310249328613, "global_step": 125655, "epoch": 2991} {"train_loss": -6.598238468170166, "global_step": 125656, "epoch": 2991} {"train_loss": -6.700987815856934, "global_step": 125657, "epoch": 2991} {"train_loss": -6.552116870880127, "global_step": 125658, "epoch": 2991} {"train_loss": -6.537902355194092, "global_step": 125659, "epoch": 2991} {"train_loss": -6.704077243804932, "global_step": 125660, "epoch": 2991} {"train_loss": -6.555318832397461, "global_step": 125661, "epoch": 2991} {"train_loss": -6.596236228942871, "global_step": 125662, "epoch": 2991} {"train_loss": -6.586325645446777, "global_step": 125663, "epoch": 2991, "val_loss": 77056.6015625} {"train_loss": -6.551573276519775, "global_step": 125664, "epoch": 2992} {"train_loss": -6.612865447998047, "global_step": 125665, "epoch": 2992} {"train_loss": -6.670466423034668, "global_step": 125666, "epoch": 2992} {"train_loss": -6.435611724853516, "global_step": 125667, "epoch": 2992} {"train_loss": -6.690999984741211, "global_step": 125668, "epoch": 2992} {"train_loss": -6.596693992614746, "global_step": 125669, "epoch": 2992} {"train_loss": -6.594278812408447, "global_step": 125670, "epoch": 2992} {"train_loss": -6.5692548751831055, "global_step": 125671, "epoch": 2992} {"train_loss": -6.48728084564209, "global_step": 125672, "epoch": 2992} {"train_loss": -6.690113544464111, "global_step": 125673, "epoch": 2992} {"train_loss": -6.516350746154785, "global_step": 125674, "epoch": 2992} {"train_loss": -6.603460788726807, "global_step": 125675, "epoch": 2992} {"train_loss": -6.734346389770508, "global_step": 125676, "epoch": 2992} {"train_loss": -6.635723114013672, "global_step": 125677, "epoch": 2992} {"train_loss": -6.688251972198486, "global_step": 125678, "epoch": 2992} {"train_loss": -6.642611503601074, "global_step": 125679, "epoch": 2992} {"train_loss": -6.592677116394043, "global_step": 125680, "epoch": 2992} {"train_loss": -6.593278884887695, "global_step": 125681, "epoch": 2992} {"train_loss": -6.630044937133789, "global_step": 125682, "epoch": 2992} {"train_loss": -6.540627956390381, "global_step": 125683, "epoch": 2992} {"train_loss": -6.585733413696289, "global_step": 125684, "epoch": 2992} {"train_loss": -6.5248541831970215, "global_step": 125685, "epoch": 2992} {"train_loss": -6.4772257804870605, "global_step": 125686, "epoch": 2992} {"train_loss": -6.578329086303711, "global_step": 125687, "epoch": 2992} {"train_loss": -6.5934906005859375, "global_step": 125688, "epoch": 2992} {"train_loss": -6.597746849060059, "global_step": 125689, "epoch": 2992} {"train_loss": -6.605738162994385, "global_step": 125690, "epoch": 2992} {"train_loss": -6.621294975280762, "global_step": 125691, "epoch": 2992} {"train_loss": -6.6069746017456055, "global_step": 125692, "epoch": 2992} {"train_loss": -6.5669403076171875, "global_step": 125693, "epoch": 2992} {"train_loss": -6.617424964904785, "global_step": 125694, "epoch": 2992} {"train_loss": -6.579890727996826, "global_step": 125695, "epoch": 2992} {"train_loss": -6.450034141540527, "global_step": 125696, "epoch": 2992} {"train_loss": -6.642914772033691, "global_step": 125697, "epoch": 2992} {"train_loss": -6.629737854003906, "global_step": 125698, "epoch": 2992} {"train_loss": -6.486893653869629, "global_step": 125699, "epoch": 2992} {"train_loss": -6.641870021820068, "global_step": 125700, "epoch": 2992} {"train_loss": -6.632737636566162, "global_step": 125701, "epoch": 2992} {"train_loss": -6.642626762390137, "global_step": 125702, "epoch": 2992} {"train_loss": -6.576719284057617, "global_step": 125703, "epoch": 2992} {"train_loss": -6.568655967712402, "global_step": 125704, "epoch": 2992} {"train_loss": -6.593702690941947, "global_step": 125705, "epoch": 2992, "val_loss": 77023.0546875} {"train_loss": -6.651930332183838, "global_step": 125706, "epoch": 2993} {"train_loss": -6.645273208618164, "global_step": 125707, "epoch": 2993} {"train_loss": -6.55733585357666, "global_step": 125708, "epoch": 2993} {"train_loss": -6.686039924621582, "global_step": 125709, "epoch": 2993} {"train_loss": -6.570394992828369, "global_step": 125710, "epoch": 2993} {"train_loss": -6.682417392730713, "global_step": 125711, "epoch": 2993} {"train_loss": -6.58217716217041, "global_step": 125712, "epoch": 2993} {"train_loss": -6.664858818054199, "global_step": 125713, "epoch": 2993} {"train_loss": -6.625245094299316, "global_step": 125714, "epoch": 2993} {"train_loss": -6.664255142211914, "global_step": 125715, "epoch": 2993} {"train_loss": -6.712636470794678, "global_step": 125716, "epoch": 2993} {"train_loss": -6.776669502258301, "global_step": 125717, "epoch": 2993} {"train_loss": -6.613104820251465, "global_step": 125718, "epoch": 2993} {"train_loss": -6.659938812255859, "global_step": 125719, "epoch": 2993} {"train_loss": -6.622079849243164, "global_step": 125720, "epoch": 2993} {"train_loss": -6.5233588218688965, "global_step": 125721, "epoch": 2993} {"train_loss": -6.64162540435791, "global_step": 125722, "epoch": 2993} {"train_loss": -6.538223743438721, "global_step": 125723, "epoch": 2993} {"train_loss": -6.610715866088867, "global_step": 125724, "epoch": 2993} {"train_loss": -6.607929706573486, "global_step": 125725, "epoch": 2993} {"train_loss": -6.578578472137451, "global_step": 125726, "epoch": 2993} {"train_loss": -6.638332843780518, "global_step": 125727, "epoch": 2993} {"train_loss": -6.669405937194824, "global_step": 125728, "epoch": 2993} {"train_loss": -6.544578552246094, "global_step": 125729, "epoch": 2993} {"train_loss": -6.612087726593018, "global_step": 125730, "epoch": 2993} {"train_loss": -6.566214561462402, "global_step": 125731, "epoch": 2993} {"train_loss": -6.562924385070801, "global_step": 125732, "epoch": 2993} {"train_loss": -6.6709513664245605, "global_step": 125733, "epoch": 2993} {"train_loss": -6.611536979675293, "global_step": 125734, "epoch": 2993} {"train_loss": -6.69144868850708, "global_step": 125735, "epoch": 2993} {"train_loss": -6.664691925048828, "global_step": 125736, "epoch": 2993} {"train_loss": -6.589303970336914, "global_step": 125737, "epoch": 2993} {"train_loss": -6.661836624145508, "global_step": 125738, "epoch": 2993} {"train_loss": -6.629390239715576, "global_step": 125739, "epoch": 2993} {"train_loss": -6.537504196166992, "global_step": 125740, "epoch": 2993} {"train_loss": -6.687607765197754, "global_step": 125741, "epoch": 2993} {"train_loss": -6.552371978759766, "global_step": 125742, "epoch": 2993} {"train_loss": -6.577337265014648, "global_step": 125743, "epoch": 2993} {"train_loss": -6.707271575927734, "global_step": 125744, "epoch": 2993} {"train_loss": -6.53600549697876, "global_step": 125745, "epoch": 2993} {"train_loss": -6.614640712738037, "global_step": 125746, "epoch": 2993} {"train_loss": -6.623516196296329, "global_step": 125747, "epoch": 2993, "val_loss": 77188.28125} {"train_loss": -6.50474739074707, "global_step": 125748, "epoch": 2994} {"train_loss": -6.659215927124023, "global_step": 125749, "epoch": 2994} {"train_loss": -6.534800052642822, "global_step": 125750, "epoch": 2994} {"train_loss": -6.586257457733154, "global_step": 125751, "epoch": 2994} {"train_loss": -6.719490051269531, "global_step": 125752, "epoch": 2994} {"train_loss": -6.559535980224609, "global_step": 125753, "epoch": 2994} {"train_loss": -6.713140964508057, "global_step": 125754, "epoch": 2994} {"train_loss": -6.53389835357666, "global_step": 125755, "epoch": 2994} {"train_loss": -6.645997524261475, "global_step": 125756, "epoch": 2994} {"train_loss": -6.646573066711426, "global_step": 125757, "epoch": 2994} {"train_loss": -6.524796485900879, "global_step": 125758, "epoch": 2994} {"train_loss": -6.6507110595703125, "global_step": 125759, "epoch": 2994} {"train_loss": -6.642091751098633, "global_step": 125760, "epoch": 2994} {"train_loss": -6.616507530212402, "global_step": 125761, "epoch": 2994} {"train_loss": -6.483218193054199, "global_step": 125762, "epoch": 2994} {"train_loss": -6.522883415222168, "global_step": 125763, "epoch": 2994} {"train_loss": -6.608443737030029, "global_step": 125764, "epoch": 2994} {"train_loss": -6.678947448730469, "global_step": 125765, "epoch": 2994} {"train_loss": -6.44802188873291, "global_step": 125766, "epoch": 2994} {"train_loss": -6.58814811706543, "global_step": 125767, "epoch": 2994} {"train_loss": -6.557892799377441, "global_step": 125768, "epoch": 2994} {"train_loss": -6.7114787101745605, "global_step": 125769, "epoch": 2994} {"train_loss": -6.622426509857178, "global_step": 125770, "epoch": 2994} {"train_loss": -6.639556884765625, "global_step": 125771, "epoch": 2994} {"train_loss": -6.699315071105957, "global_step": 125772, "epoch": 2994} {"train_loss": -6.6359453201293945, "global_step": 125773, "epoch": 2994} {"train_loss": -6.724544525146484, "global_step": 125774, "epoch": 2994} {"train_loss": -6.663270950317383, "global_step": 125775, "epoch": 2994} {"train_loss": -6.585142612457275, "global_step": 125776, "epoch": 2994} {"train_loss": -6.562828540802002, "global_step": 125777, "epoch": 2994} {"train_loss": -6.650700569152832, "global_step": 125778, "epoch": 2994} {"train_loss": -6.681632995605469, "global_step": 125779, "epoch": 2994} {"train_loss": -6.605085849761963, "global_step": 125780, "epoch": 2994} {"train_loss": -6.582437515258789, "global_step": 125781, "epoch": 2994} {"train_loss": -6.47422456741333, "global_step": 125782, "epoch": 2994} {"train_loss": -6.588754653930664, "global_step": 125783, "epoch": 2994} {"train_loss": -6.623629093170166, "global_step": 125784, "epoch": 2994} {"train_loss": -6.592026233673096, "global_step": 125785, "epoch": 2994} {"train_loss": -6.537300109863281, "global_step": 125786, "epoch": 2994} {"train_loss": -6.655553817749023, "global_step": 125787, "epoch": 2994} {"train_loss": -6.708539009094238, "global_step": 125788, "epoch": 2994} {"train_loss": -6.608204705374582, "global_step": 125789, "epoch": 2994, "val_loss": 77286.6953125} {"train_loss": -6.707503795623779, "global_step": 125790, "epoch": 2995} {"train_loss": -6.548705577850342, "global_step": 125791, "epoch": 2995} {"train_loss": -6.663780212402344, "global_step": 125792, "epoch": 2995} {"train_loss": -6.6776885986328125, "global_step": 125793, "epoch": 2995} {"train_loss": -6.535015106201172, "global_step": 125794, "epoch": 2995} {"train_loss": -6.603760719299316, "global_step": 125795, "epoch": 2995} {"train_loss": -6.576283931732178, "global_step": 125796, "epoch": 2995} {"train_loss": -6.539676666259766, "global_step": 125797, "epoch": 2995} {"train_loss": -6.6422224044799805, "global_step": 125798, "epoch": 2995} {"train_loss": -6.7030253410339355, "global_step": 125799, "epoch": 2995} {"train_loss": -6.628335952758789, "global_step": 125800, "epoch": 2995} {"train_loss": -6.471035003662109, "global_step": 125801, "epoch": 2995} {"train_loss": -6.513283729553223, "global_step": 125802, "epoch": 2995} {"train_loss": -6.459390640258789, "global_step": 125803, "epoch": 2995} {"train_loss": -6.598041534423828, "global_step": 125804, "epoch": 2995} {"train_loss": -6.478612899780273, "global_step": 125805, "epoch": 2995} {"train_loss": -6.552430152893066, "global_step": 125806, "epoch": 2995} {"train_loss": -6.628969192504883, "global_step": 125807, "epoch": 2995} {"train_loss": -6.365156173706055, "global_step": 125808, "epoch": 2995} {"train_loss": -6.686931133270264, "global_step": 125809, "epoch": 2995} {"train_loss": -6.5983381271362305, "global_step": 125810, "epoch": 2995} {"train_loss": -6.562987804412842, "global_step": 125811, "epoch": 2995} {"train_loss": -6.636911392211914, "global_step": 125812, "epoch": 2995} {"train_loss": -6.593657970428467, "global_step": 125813, "epoch": 2995} {"train_loss": -6.744647026062012, "global_step": 125814, "epoch": 2995} {"train_loss": -6.690725326538086, "global_step": 125815, "epoch": 2995} {"train_loss": -6.692600250244141, "global_step": 125816, "epoch": 2995} {"train_loss": -6.589404106140137, "global_step": 125817, "epoch": 2995} {"train_loss": -6.614420413970947, "global_step": 125818, "epoch": 2995} {"train_loss": -6.499466896057129, "global_step": 125819, "epoch": 2995} {"train_loss": -6.705791473388672, "global_step": 125820, "epoch": 2995} {"train_loss": -6.601263046264648, "global_step": 125821, "epoch": 2995} {"train_loss": -6.674129009246826, "global_step": 125822, "epoch": 2995} {"train_loss": -6.8548431396484375, "global_step": 125823, "epoch": 2995} {"train_loss": -6.557075023651123, "global_step": 125824, "epoch": 2995} {"train_loss": -6.64924955368042, "global_step": 125825, "epoch": 2995} {"train_loss": -6.7699151039123535, "global_step": 125826, "epoch": 2995} {"train_loss": -6.805902004241943, "global_step": 125827, "epoch": 2995} {"train_loss": -6.725068092346191, "global_step": 125828, "epoch": 2995} {"train_loss": -6.659688949584961, "global_step": 125829, "epoch": 2995} {"train_loss": -6.660947799682617, "global_step": 125830, "epoch": 2995} {"train_loss": -6.621240025474911, "global_step": 125831, "epoch": 2995, "val_loss": 77305.390625} {"train_loss": -6.730185508728027, "global_step": 125832, "epoch": 2996} {"train_loss": -6.701137542724609, "global_step": 125833, "epoch": 2996} {"train_loss": -6.6454925537109375, "global_step": 125834, "epoch": 2996} {"train_loss": -6.656717777252197, "global_step": 125835, "epoch": 2996} {"train_loss": -6.560635566711426, "global_step": 125836, "epoch": 2996} {"train_loss": -6.628183364868164, "global_step": 125837, "epoch": 2996} {"train_loss": -6.648536682128906, "global_step": 125838, "epoch": 2996} {"train_loss": -6.456423759460449, "global_step": 125839, "epoch": 2996} {"train_loss": -6.68710994720459, "global_step": 125840, "epoch": 2996} {"train_loss": -6.715878486633301, "global_step": 125841, "epoch": 2996} {"train_loss": -6.725020408630371, "global_step": 125842, "epoch": 2996} {"train_loss": -6.747900485992432, "global_step": 125843, "epoch": 2996} {"train_loss": -6.749019622802734, "global_step": 125844, "epoch": 2996} {"train_loss": -6.584615230560303, "global_step": 125845, "epoch": 2996} {"train_loss": -6.627716064453125, "global_step": 125846, "epoch": 2996} {"train_loss": -6.646897315979004, "global_step": 125847, "epoch": 2996} {"train_loss": -6.708961486816406, "global_step": 125848, "epoch": 2996} {"train_loss": -6.698549270629883, "global_step": 125849, "epoch": 2996} {"train_loss": -6.728384971618652, "global_step": 125850, "epoch": 2996} {"train_loss": -6.751543998718262, "global_step": 125851, "epoch": 2996} {"train_loss": -6.70157527923584, "global_step": 125852, "epoch": 2996} {"train_loss": -6.6065168380737305, "global_step": 125853, "epoch": 2996} {"train_loss": -6.627512454986572, "global_step": 125854, "epoch": 2996} {"train_loss": -6.699036121368408, "global_step": 125855, "epoch": 2996} {"train_loss": -6.666231155395508, "global_step": 125856, "epoch": 2996} {"train_loss": -6.693781852722168, "global_step": 125857, "epoch": 2996} {"train_loss": -6.689965724945068, "global_step": 125858, "epoch": 2996} {"train_loss": -6.636949062347412, "global_step": 125859, "epoch": 2996} {"train_loss": -6.595383644104004, "global_step": 125860, "epoch": 2996} {"train_loss": -6.739725112915039, "global_step": 125861, "epoch": 2996} {"train_loss": -6.5774149894714355, "global_step": 125862, "epoch": 2996} {"train_loss": -6.726656913757324, "global_step": 125863, "epoch": 2996} {"train_loss": -6.632794380187988, "global_step": 125864, "epoch": 2996} {"train_loss": -6.734246253967285, "global_step": 125865, "epoch": 2996} {"train_loss": -6.7830400466918945, "global_step": 125866, "epoch": 2996} {"train_loss": -6.7096662521362305, "global_step": 125867, "epoch": 2996} {"train_loss": -6.529770851135254, "global_step": 125868, "epoch": 2996} {"train_loss": -6.73219108581543, "global_step": 125869, "epoch": 2996} {"train_loss": -6.773043632507324, "global_step": 125870, "epoch": 2996} {"train_loss": -6.617396354675293, "global_step": 125871, "epoch": 2996} {"train_loss": -6.756500244140625, "global_step": 125872, "epoch": 2996} {"train_loss": -6.672130527950468, "global_step": 125873, "epoch": 2996, "val_loss": 77270.0078125} {"train_loss": -6.767321586608887, "global_step": 125874, "epoch": 2997} {"train_loss": -6.627072334289551, "global_step": 125875, "epoch": 2997} {"train_loss": -6.527142524719238, "global_step": 125876, "epoch": 2997} {"train_loss": -6.528220176696777, "global_step": 125877, "epoch": 2997} {"train_loss": -6.604669094085693, "global_step": 125878, "epoch": 2997} {"train_loss": -6.615386486053467, "global_step": 125879, "epoch": 2997} {"train_loss": -6.506053924560547, "global_step": 125880, "epoch": 2997} {"train_loss": -6.586971282958984, "global_step": 125881, "epoch": 2997} {"train_loss": -6.525892734527588, "global_step": 125882, "epoch": 2997} {"train_loss": -6.729898452758789, "global_step": 125883, "epoch": 2997} {"train_loss": -6.5764079093933105, "global_step": 125884, "epoch": 2997} {"train_loss": -6.681792259216309, "global_step": 125885, "epoch": 2997} {"train_loss": -6.60096549987793, "global_step": 125886, "epoch": 2997} {"train_loss": -6.575420379638672, "global_step": 125887, "epoch": 2997} {"train_loss": -6.602329254150391, "global_step": 125888, "epoch": 2997} {"train_loss": -6.531180381774902, "global_step": 125889, "epoch": 2997} {"train_loss": -6.650793552398682, "global_step": 125890, "epoch": 2997} {"train_loss": -6.708940505981445, "global_step": 125891, "epoch": 2997} {"train_loss": -6.608375549316406, "global_step": 125892, "epoch": 2997} {"train_loss": -6.650601387023926, "global_step": 125893, "epoch": 2997} {"train_loss": -6.5593061447143555, "global_step": 125894, "epoch": 2997} {"train_loss": -6.546383380889893, "global_step": 125895, "epoch": 2997} {"train_loss": -6.647066116333008, "global_step": 125896, "epoch": 2997} {"train_loss": -6.386013984680176, "global_step": 125897, "epoch": 2997} {"train_loss": -6.540950775146484, "global_step": 125898, "epoch": 2997} {"train_loss": -6.709826946258545, "global_step": 125899, "epoch": 2997} {"train_loss": -6.558863162994385, "global_step": 125900, "epoch": 2997} {"train_loss": -6.649586200714111, "global_step": 125901, "epoch": 2997} {"train_loss": -6.587254524230957, "global_step": 125902, "epoch": 2997} {"train_loss": -6.63646936416626, "global_step": 125903, "epoch": 2997} {"train_loss": -6.603312969207764, "global_step": 125904, "epoch": 2997} {"train_loss": -6.659885406494141, "global_step": 125905, "epoch": 2997} {"train_loss": -6.562491416931152, "global_step": 125906, "epoch": 2997} {"train_loss": -6.645468235015869, "global_step": 125907, "epoch": 2997} {"train_loss": -6.696080207824707, "global_step": 125908, "epoch": 2997} {"train_loss": -6.724267959594727, "global_step": 125909, "epoch": 2997} {"train_loss": -6.678006172180176, "global_step": 125910, "epoch": 2997} {"train_loss": -6.663654327392578, "global_step": 125911, "epoch": 2997} {"train_loss": -6.672325134277344, "global_step": 125912, "epoch": 2997} {"train_loss": -6.6447577476501465, "global_step": 125913, "epoch": 2997} {"train_loss": -6.6215620040893555, "global_step": 125914, "epoch": 2997} {"train_loss": -6.6171141011374335, "global_step": 125915, "epoch": 2997, "val_loss": 77241.7578125} {"train_loss": -6.566211700439453, "global_step": 125916, "epoch": 2998} {"train_loss": -6.647594451904297, "global_step": 125917, "epoch": 2998} {"train_loss": -6.630093574523926, "global_step": 125918, "epoch": 2998} {"train_loss": -6.590523719787598, "global_step": 125919, "epoch": 2998} {"train_loss": -6.6492695808410645, "global_step": 125920, "epoch": 2998} {"train_loss": -6.624564170837402, "global_step": 125921, "epoch": 2998} {"train_loss": -6.674294471740723, "global_step": 125922, "epoch": 2998} {"train_loss": -6.5909624099731445, "global_step": 125923, "epoch": 2998} {"train_loss": -6.64176607131958, "global_step": 125924, "epoch": 2998} {"train_loss": -6.646709442138672, "global_step": 125925, "epoch": 2998} {"train_loss": -6.6417622566223145, "global_step": 125926, "epoch": 2998} {"train_loss": -6.554971694946289, "global_step": 125927, "epoch": 2998} {"train_loss": -6.523446083068848, "global_step": 125928, "epoch": 2998} {"train_loss": -6.562172889709473, "global_step": 125929, "epoch": 2998} {"train_loss": -6.744203090667725, "global_step": 125930, "epoch": 2998} {"train_loss": -6.545166969299316, "global_step": 125931, "epoch": 2998} {"train_loss": -6.535688400268555, "global_step": 125932, "epoch": 2998} {"train_loss": -6.623241424560547, "global_step": 125933, "epoch": 2998} {"train_loss": -6.572198867797852, "global_step": 125934, "epoch": 2998} {"train_loss": -6.46228551864624, "global_step": 125935, "epoch": 2998} {"train_loss": -6.726085662841797, "global_step": 125936, "epoch": 2998} {"train_loss": -6.624535083770752, "global_step": 125937, "epoch": 2998} {"train_loss": -6.534744739532471, "global_step": 125938, "epoch": 2998} {"train_loss": -6.634984493255615, "global_step": 125939, "epoch": 2998} {"train_loss": -6.567201137542725, "global_step": 125940, "epoch": 2998} {"train_loss": -6.498595237731934, "global_step": 125941, "epoch": 2998} {"train_loss": -6.659150123596191, "global_step": 125942, "epoch": 2998} {"train_loss": -6.5367889404296875, "global_step": 125943, "epoch": 2998} {"train_loss": -6.64164924621582, "global_step": 125944, "epoch": 2998} {"train_loss": -6.620853424072266, "global_step": 125945, "epoch": 2998} {"train_loss": -6.628320693969727, "global_step": 125946, "epoch": 2998} {"train_loss": -6.784285545349121, "global_step": 125947, "epoch": 2998} {"train_loss": -6.553793907165527, "global_step": 125948, "epoch": 2998} {"train_loss": -6.772806167602539, "global_step": 125949, "epoch": 2998} {"train_loss": -6.597645282745361, "global_step": 125950, "epoch": 2998} {"train_loss": -6.49013090133667, "global_step": 125951, "epoch": 2998} {"train_loss": -6.539945125579834, "global_step": 125952, "epoch": 2998} {"train_loss": -6.524557113647461, "global_step": 125953, "epoch": 2998} {"train_loss": -6.612078666687012, "global_step": 125954, "epoch": 2998} {"train_loss": -6.526454925537109, "global_step": 125955, "epoch": 2998} {"train_loss": -6.646909713745117, "global_step": 125956, "epoch": 2998} {"train_loss": -6.602085238411313, "global_step": 125957, "epoch": 2998, "val_loss": 77285.6640625} {"train_loss": -6.5471601486206055, "global_step": 125958, "epoch": 2999} {"train_loss": -6.628348350524902, "global_step": 125959, "epoch": 2999} {"train_loss": -6.505597114562988, "global_step": 125960, "epoch": 2999} {"train_loss": -6.672203063964844, "global_step": 125961, "epoch": 2999} {"train_loss": -6.706560134887695, "global_step": 125962, "epoch": 2999} {"train_loss": -6.5724921226501465, "global_step": 125963, "epoch": 2999} {"train_loss": -6.649964332580566, "global_step": 125964, "epoch": 2999} {"train_loss": -6.59052848815918, "global_step": 125965, "epoch": 2999} {"train_loss": -6.669361114501953, "global_step": 125966, "epoch": 2999} {"train_loss": -6.646114349365234, "global_step": 125967, "epoch": 2999} {"train_loss": -6.596925735473633, "global_step": 125968, "epoch": 2999} {"train_loss": -6.653168678283691, "global_step": 125969, "epoch": 2999} {"train_loss": -6.652059555053711, "global_step": 125970, "epoch": 2999} {"train_loss": -6.495914459228516, "global_step": 125971, "epoch": 2999} {"train_loss": -6.6520915031433105, "global_step": 125972, "epoch": 2999} {"train_loss": -6.473387718200684, "global_step": 125973, "epoch": 2999} {"train_loss": -6.556392669677734, "global_step": 125974, "epoch": 2999} {"train_loss": -6.548765659332275, "global_step": 125975, "epoch": 2999} {"train_loss": -6.6155548095703125, "global_step": 125976, "epoch": 2999} {"train_loss": -6.563261032104492, "global_step": 125977, "epoch": 2999} {"train_loss": -6.5303215980529785, "global_step": 125978, "epoch": 2999} {"train_loss": -6.601612091064453, "global_step": 125979, "epoch": 2999} {"train_loss": -6.581508636474609, "global_step": 125980, "epoch": 2999} {"train_loss": -6.649537086486816, "global_step": 125981, "epoch": 2999} {"train_loss": -6.579538822174072, "global_step": 125982, "epoch": 2999} {"train_loss": -6.592123031616211, "global_step": 125983, "epoch": 2999} {"train_loss": -6.557697296142578, "global_step": 125984, "epoch": 2999} {"train_loss": -6.541621208190918, "global_step": 125985, "epoch": 2999} {"train_loss": -6.560092926025391, "global_step": 125986, "epoch": 2999} {"train_loss": -6.6053619384765625, "global_step": 125987, "epoch": 2999} {"train_loss": -6.694934368133545, "global_step": 125988, "epoch": 2999} {"train_loss": -6.743797779083252, "global_step": 125989, "epoch": 2999} {"train_loss": -6.639400482177734, "global_step": 125990, "epoch": 2999} {"train_loss": -6.597142219543457, "global_step": 125991, "epoch": 2999} {"train_loss": -6.605743408203125, "global_step": 125992, "epoch": 2999} {"train_loss": -6.6781768798828125, "global_step": 125993, "epoch": 2999} {"train_loss": -6.618036270141602, "global_step": 125994, "epoch": 2999} {"train_loss": -6.647975921630859, "global_step": 125995, "epoch": 2999} {"train_loss": -6.592903137207031, "global_step": 125996, "epoch": 2999} {"train_loss": -6.624120235443115, "global_step": 125997, "epoch": 2999} {"train_loss": -6.76762580871582, "global_step": 125998, "epoch": 2999} {"train_loss": -6.610895100094023, "global_step": 125999, "epoch": 2999, "val_loss": 77440.859375} {"train_loss": -6.663270950317383, "global_step": 126000, "epoch": 3000} {"train_loss": -6.702986717224121, "global_step": 126001, "epoch": 3000} {"train_loss": -6.709372043609619, "global_step": 126002, "epoch": 3000} {"train_loss": -6.696173667907715, "global_step": 126003, "epoch": 3000} {"train_loss": -6.652945518493652, "global_step": 126004, "epoch": 3000} {"train_loss": -6.660345554351807, "global_step": 126005, "epoch": 3000} {"train_loss": -6.648855209350586, "global_step": 126006, "epoch": 3000} {"train_loss": -6.695033073425293, "global_step": 126007, "epoch": 3000} {"train_loss": -6.659203052520752, "global_step": 126008, "epoch": 3000} {"train_loss": -6.6125664710998535, "global_step": 126009, "epoch": 3000} {"train_loss": -6.649853706359863, "global_step": 126010, "epoch": 3000} {"train_loss": -6.818682670593262, "global_step": 126011, "epoch": 3000} {"train_loss": -6.646949768066406, "global_step": 126012, "epoch": 3000} {"train_loss": -6.607446193695068, "global_step": 126013, "epoch": 3000} {"train_loss": -6.655096530914307, "global_step": 126014, "epoch": 3000} {"train_loss": -6.605586051940918, "global_step": 126015, "epoch": 3000} {"train_loss": -6.6437578201293945, "global_step": 126016, "epoch": 3000} {"train_loss": -6.681117534637451, "global_step": 126017, "epoch": 3000} {"train_loss": -6.57756233215332, "global_step": 126018, "epoch": 3000} {"train_loss": -6.6343255043029785, "global_step": 126019, "epoch": 3000} {"train_loss": -6.699726104736328, "global_step": 126020, "epoch": 3000} {"train_loss": -6.531904697418213, "global_step": 126021, "epoch": 3000} {"train_loss": -6.6468505859375, "global_step": 126022, "epoch": 3000} {"train_loss": -6.62041711807251, "global_step": 126023, "epoch": 3000} {"train_loss": -6.599155902862549, "global_step": 126024, "epoch": 3000} {"train_loss": -6.6423845291137695, "global_step": 126025, "epoch": 3000} {"train_loss": -6.540392875671387, "global_step": 126026, "epoch": 3000} {"train_loss": -6.608038902282715, "global_step": 126027, "epoch": 3000} {"train_loss": -6.59060001373291, "global_step": 126028, "epoch": 3000} {"train_loss": -6.497653961181641, "global_step": 126029, "epoch": 3000} {"train_loss": -6.552792549133301, "global_step": 126030, "epoch": 3000} {"train_loss": -6.631800651550293, "global_step": 126031, "epoch": 3000} {"train_loss": -6.551981449127197, "global_step": 126032, "epoch": 3000} {"train_loss": -6.582043647766113, "global_step": 126033, "epoch": 3000} {"train_loss": -6.581671714782715, "global_step": 126034, "epoch": 3000} {"train_loss": -6.607548713684082, "global_step": 126035, "epoch": 3000} {"train_loss": -6.599550247192383, "global_step": 126036, "epoch": 3000} {"train_loss": -6.550416946411133, "global_step": 126037, "epoch": 3000} {"train_loss": -6.589944839477539, "global_step": 126038, "epoch": 3000} {"train_loss": -6.498360633850098, "global_step": 126039, "epoch": 3000} {"train_loss": -6.6244001388549805, "global_step": 126040, "epoch": 3000} {"train_loss": -6.623398860295613, "global_step": 126041, "epoch": 3000, "train/sim_max_reward_0": 0.496176568163528, "train/sim_max_reward_1": 0.916881337004556, "train/sim_max_reward_2": 0.4127187092968854, "train/sim_max_reward_3": 0.1279174258497364, "train/sim_max_reward_4": 0.2976749933332356, "train/sim_max_reward_5": 0.895510876243244, "test/sim_max_reward_4500000": 0.9720467250788914, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9376456391904602, "test/sim_max_reward_4500003": 0.9888303670995544, "test/sim_max_reward_4500004": 0.958051544821004, "test/sim_max_reward_4500005": 0.2322977493146421, "test/sim_max_reward_4500006": 0.9246537779094006, "test/sim_max_reward_4500007": 0.8158262454774988, "test/sim_max_reward_4500008": 0.9173443026564565, "test/sim_max_reward_4500009": 0.05354587971003398, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.8646719662458242, "test/sim_max_reward_4500012": 0.958523691844671, "test/sim_max_reward_4500013": 0.0028663463537898335, "test/sim_max_reward_4500014": 0.23825588861499805, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.017306375375451728, "test/sim_max_reward_4500017": 0.14444157331049934, "test/sim_max_reward_4500018": 0.40191552454906965, "test/sim_max_reward_4500019": 0.9576035290561433, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9576321739778405, "test/sim_max_reward_4500022": 0.9737393439191099, "test/sim_max_reward_4500023": 0.5731436113295755, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8470952063295089, "test/sim_max_reward_4500026": 1.0, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.09022853333166685, "test/sim_max_reward_4500030": 0.9930366409121718, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.052828237426510376, "test/sim_max_reward_4500033": 0.9794551553762244, "test/sim_max_reward_4500034": 0.0504170720837514, "test/sim_max_reward_4500035": 0.5539698839221954, "test/sim_max_reward_4500036": 0.7894860960443006, "test/sim_max_reward_4500037": 1.0, "test/sim_max_reward_4500038": 0.9509318981975163, "test/sim_max_reward_4500039": 0.8717931613208793, "test/sim_max_reward_4500040": 0.997042305329284, "test/sim_max_reward_4500041": 0.9154198331330838, "test/sim_max_reward_4500042": 0.7652988475266772, "test/sim_max_reward_4500043": 0.2534200635738666, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9261586286616637, "test/sim_max_reward_4500046": 0.21745601496217065, "test/sim_max_reward_4500047": 0.9159994035899205, "test/sim_max_reward_4500048": 0.9745097884545219, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5244799849818642, "test/mean_score": 0.5849101226779517, "val_loss": 77218.859375} {"train_loss": -6.629909992218018, "global_step": 126042, "epoch": 3001} {"train_loss": -6.589996814727783, "global_step": 126043, "epoch": 3001} {"train_loss": -6.52972412109375, "global_step": 126044, "epoch": 3001} {"train_loss": -6.554369926452637, "global_step": 126045, "epoch": 3001} {"train_loss": -6.575787544250488, "global_step": 126046, "epoch": 3001} {"train_loss": -6.5900397300720215, "global_step": 126047, "epoch": 3001} {"train_loss": -6.656958103179932, "global_step": 126048, "epoch": 3001} {"train_loss": -6.616362571716309, "global_step": 126049, "epoch": 3001} {"train_loss": -6.653581142425537, "global_step": 126050, "epoch": 3001} {"train_loss": -6.768157005310059, "global_step": 126051, "epoch": 3001} {"train_loss": -6.7065534591674805, "global_step": 126052, "epoch": 3001} {"train_loss": -6.7414751052856445, "global_step": 126053, "epoch": 3001} {"train_loss": -6.52400016784668, "global_step": 126054, "epoch": 3001} {"train_loss": -6.6946611404418945, "global_step": 126055, "epoch": 3001} {"train_loss": -6.517094135284424, "global_step": 126056, "epoch": 3001} {"train_loss": -6.679688453674316, "global_step": 126057, "epoch": 3001} {"train_loss": -6.642401695251465, "global_step": 126058, "epoch": 3001} {"train_loss": -6.622852325439453, "global_step": 126059, "epoch": 3001} {"train_loss": -6.603187084197998, "global_step": 126060, "epoch": 3001} {"train_loss": -6.6856794357299805, "global_step": 126061, "epoch": 3001} {"train_loss": -6.475671768188477, "global_step": 126062, "epoch": 3001} {"train_loss": -6.653233528137207, "global_step": 126063, "epoch": 3001} {"train_loss": -6.658563137054443, "global_step": 126064, "epoch": 3001} {"train_loss": -6.552394866943359, "global_step": 126065, "epoch": 3001} {"train_loss": -6.561038494110107, "global_step": 126066, "epoch": 3001} {"train_loss": -6.678018569946289, "global_step": 126067, "epoch": 3001} {"train_loss": -6.665689468383789, "global_step": 126068, "epoch": 3001} {"train_loss": -6.530106067657471, "global_step": 126069, "epoch": 3001} {"train_loss": -6.651341915130615, "global_step": 126070, "epoch": 3001} {"train_loss": -6.644732475280762, "global_step": 126071, "epoch": 3001} {"train_loss": -6.573976993560791, "global_step": 126072, "epoch": 3001} {"train_loss": -6.598343849182129, "global_step": 126073, "epoch": 3001} {"train_loss": -6.641459941864014, "global_step": 126074, "epoch": 3001} {"train_loss": -6.761532306671143, "global_step": 126075, "epoch": 3001} {"train_loss": -6.570503234863281, "global_step": 126076, "epoch": 3001} {"train_loss": -6.6861114501953125, "global_step": 126077, "epoch": 3001} {"train_loss": -6.474488735198975, "global_step": 126078, "epoch": 3001} {"train_loss": -6.747007369995117, "global_step": 126079, "epoch": 3001} {"train_loss": -6.621232986450195, "global_step": 126080, "epoch": 3001} {"train_loss": -6.623381614685059, "global_step": 126081, "epoch": 3001} {"train_loss": -6.696045875549316, "global_step": 126082, "epoch": 3001} {"train_loss": -6.625214962732224, "global_step": 126083, "epoch": 3001, "val_loss": 77018.078125} {"train_loss": -6.59562349319458, "global_step": 126084, "epoch": 3002} {"train_loss": -6.666929244995117, "global_step": 126085, "epoch": 3002} {"train_loss": -6.634864807128906, "global_step": 126086, "epoch": 3002} {"train_loss": -6.67679500579834, "global_step": 126087, "epoch": 3002} {"train_loss": -6.605965614318848, "global_step": 126088, "epoch": 3002} {"train_loss": -6.612627983093262, "global_step": 126089, "epoch": 3002} {"train_loss": -6.692094802856445, "global_step": 126090, "epoch": 3002} {"train_loss": -6.5875725746154785, "global_step": 126091, "epoch": 3002} {"train_loss": -6.7223896980285645, "global_step": 126092, "epoch": 3002} {"train_loss": -6.692294597625732, "global_step": 126093, "epoch": 3002} {"train_loss": -6.670262336730957, "global_step": 126094, "epoch": 3002} {"train_loss": -6.561142444610596, "global_step": 126095, "epoch": 3002} {"train_loss": -6.63113260269165, "global_step": 126096, "epoch": 3002} {"train_loss": -6.671152591705322, "global_step": 126097, "epoch": 3002} {"train_loss": -6.528772830963135, "global_step": 126098, "epoch": 3002} {"train_loss": -6.670401573181152, "global_step": 126099, "epoch": 3002} {"train_loss": -6.66702938079834, "global_step": 126100, "epoch": 3002} {"train_loss": -6.685619354248047, "global_step": 126101, "epoch": 3002} {"train_loss": -6.648833274841309, "global_step": 126102, "epoch": 3002} {"train_loss": -6.606158256530762, "global_step": 126103, "epoch": 3002} {"train_loss": -6.622167587280273, "global_step": 126104, "epoch": 3002} {"train_loss": -6.67729377746582, "global_step": 126105, "epoch": 3002} {"train_loss": -6.5345306396484375, "global_step": 126106, "epoch": 3002} {"train_loss": -6.702472686767578, "global_step": 126107, "epoch": 3002} {"train_loss": -6.533209800720215, "global_step": 126108, "epoch": 3002} {"train_loss": -6.546632766723633, "global_step": 126109, "epoch": 3002} {"train_loss": -6.614419937133789, "global_step": 126110, "epoch": 3002} {"train_loss": -6.6011810302734375, "global_step": 126111, "epoch": 3002} {"train_loss": -6.607113361358643, "global_step": 126112, "epoch": 3002} {"train_loss": -6.574278831481934, "global_step": 126113, "epoch": 3002} {"train_loss": -6.586477279663086, "global_step": 126114, "epoch": 3002} {"train_loss": -6.575498580932617, "global_step": 126115, "epoch": 3002} {"train_loss": -6.619510173797607, "global_step": 126116, "epoch": 3002} {"train_loss": -6.644636631011963, "global_step": 126117, "epoch": 3002} {"train_loss": -6.562600135803223, "global_step": 126118, "epoch": 3002} {"train_loss": -6.589852809906006, "global_step": 126119, "epoch": 3002} {"train_loss": -6.554813385009766, "global_step": 126120, "epoch": 3002} {"train_loss": -6.638115406036377, "global_step": 126121, "epoch": 3002} {"train_loss": -6.55417013168335, "global_step": 126122, "epoch": 3002} {"train_loss": -6.5513153076171875, "global_step": 126123, "epoch": 3002} {"train_loss": -6.637395858764648, "global_step": 126124, "epoch": 3002} {"train_loss": -6.615656182879493, "global_step": 126125, "epoch": 3002, "val_loss": 77465.4921875} {"train_loss": -6.643918514251709, "global_step": 126126, "epoch": 3003} {"train_loss": -6.47502326965332, "global_step": 126127, "epoch": 3003} {"train_loss": -6.477644920349121, "global_step": 126128, "epoch": 3003} {"train_loss": -6.606906414031982, "global_step": 126129, "epoch": 3003} {"train_loss": -6.492387771606445, "global_step": 126130, "epoch": 3003} {"train_loss": -6.537519454956055, "global_step": 126131, "epoch": 3003} {"train_loss": -6.6488847732543945, "global_step": 126132, "epoch": 3003} {"train_loss": -6.548229217529297, "global_step": 126133, "epoch": 3003} {"train_loss": -6.58928918838501, "global_step": 126134, "epoch": 3003} {"train_loss": -6.530064105987549, "global_step": 126135, "epoch": 3003} {"train_loss": -6.456230163574219, "global_step": 126136, "epoch": 3003} {"train_loss": -6.527713298797607, "global_step": 126137, "epoch": 3003} {"train_loss": -6.56772518157959, "global_step": 126138, "epoch": 3003} {"train_loss": -6.540308475494385, "global_step": 126139, "epoch": 3003} {"train_loss": -6.518165111541748, "global_step": 126140, "epoch": 3003} {"train_loss": -6.645655632019043, "global_step": 126141, "epoch": 3003} {"train_loss": -6.560113430023193, "global_step": 126142, "epoch": 3003} {"train_loss": -6.558379173278809, "global_step": 126143, "epoch": 3003} {"train_loss": -6.499076843261719, "global_step": 126144, "epoch": 3003} {"train_loss": -6.629990577697754, "global_step": 126145, "epoch": 3003} {"train_loss": -6.633644104003906, "global_step": 126146, "epoch": 3003} {"train_loss": -6.718578338623047, "global_step": 126147, "epoch": 3003} {"train_loss": -6.660150527954102, "global_step": 126148, "epoch": 3003} {"train_loss": -6.631202697753906, "global_step": 126149, "epoch": 3003} {"train_loss": -6.636228561401367, "global_step": 126150, "epoch": 3003} {"train_loss": -6.6684041023254395, "global_step": 126151, "epoch": 3003} {"train_loss": -6.686090469360352, "global_step": 126152, "epoch": 3003} {"train_loss": -6.583661079406738, "global_step": 126153, "epoch": 3003} {"train_loss": -6.590917587280273, "global_step": 126154, "epoch": 3003} {"train_loss": -6.72258996963501, "global_step": 126155, "epoch": 3003} {"train_loss": -6.682500839233398, "global_step": 126156, "epoch": 3003} {"train_loss": -6.627582550048828, "global_step": 126157, "epoch": 3003} {"train_loss": -6.519320487976074, "global_step": 126158, "epoch": 3003} {"train_loss": -6.650386333465576, "global_step": 126159, "epoch": 3003} {"train_loss": -6.4794721603393555, "global_step": 126160, "epoch": 3003} {"train_loss": -6.703102111816406, "global_step": 126161, "epoch": 3003} {"train_loss": -6.64164924621582, "global_step": 126162, "epoch": 3003} {"train_loss": -6.5321807861328125, "global_step": 126163, "epoch": 3003} {"train_loss": -6.598295211791992, "global_step": 126164, "epoch": 3003} {"train_loss": -6.660243511199951, "global_step": 126165, "epoch": 3003} {"train_loss": -6.68657922744751, "global_step": 126166, "epoch": 3003} {"train_loss": -6.5923441251118975, "global_step": 126167, "epoch": 3003, "val_loss": 77278.5546875} {"train_loss": -6.644107818603516, "global_step": 126168, "epoch": 3004} {"train_loss": -6.5391950607299805, "global_step": 126169, "epoch": 3004} {"train_loss": -6.687823295593262, "global_step": 126170, "epoch": 3004} {"train_loss": -6.690326690673828, "global_step": 126171, "epoch": 3004} {"train_loss": -6.555913925170898, "global_step": 126172, "epoch": 3004} {"train_loss": -6.616600036621094, "global_step": 126173, "epoch": 3004} {"train_loss": -6.501543045043945, "global_step": 126174, "epoch": 3004} {"train_loss": -6.639018535614014, "global_step": 126175, "epoch": 3004} {"train_loss": -6.674166679382324, "global_step": 126176, "epoch": 3004} {"train_loss": -6.594593048095703, "global_step": 126177, "epoch": 3004} {"train_loss": -6.665406703948975, "global_step": 126178, "epoch": 3004} {"train_loss": -6.720457077026367, "global_step": 126179, "epoch": 3004} {"train_loss": -6.734865188598633, "global_step": 126180, "epoch": 3004} {"train_loss": -6.788399696350098, "global_step": 126181, "epoch": 3004} {"train_loss": -6.570143699645996, "global_step": 126182, "epoch": 3004} {"train_loss": -6.6847710609436035, "global_step": 126183, "epoch": 3004} {"train_loss": -6.684649467468262, "global_step": 126184, "epoch": 3004} {"train_loss": -6.696045398712158, "global_step": 126185, "epoch": 3004} {"train_loss": -6.770209312438965, "global_step": 126186, "epoch": 3004} {"train_loss": -6.592768669128418, "global_step": 126187, "epoch": 3004} {"train_loss": -6.671571731567383, "global_step": 126188, "epoch": 3004} {"train_loss": -6.723920822143555, "global_step": 126189, "epoch": 3004} {"train_loss": -6.664219856262207, "global_step": 126190, "epoch": 3004} {"train_loss": -6.693333625793457, "global_step": 126191, "epoch": 3004} {"train_loss": -6.566837787628174, "global_step": 126192, "epoch": 3004} {"train_loss": -6.5679755210876465, "global_step": 126193, "epoch": 3004} {"train_loss": -6.722761631011963, "global_step": 126194, "epoch": 3004} {"train_loss": -6.527565002441406, "global_step": 126195, "epoch": 3004} {"train_loss": -6.689013957977295, "global_step": 126196, "epoch": 3004} {"train_loss": -6.5876383781433105, "global_step": 126197, "epoch": 3004} {"train_loss": -6.68882942199707, "global_step": 126198, "epoch": 3004} {"train_loss": -6.641275882720947, "global_step": 126199, "epoch": 3004} {"train_loss": -6.591358184814453, "global_step": 126200, "epoch": 3004} {"train_loss": -6.665399551391602, "global_step": 126201, "epoch": 3004} {"train_loss": -6.665641784667969, "global_step": 126202, "epoch": 3004} {"train_loss": -6.665217876434326, "global_step": 126203, "epoch": 3004} {"train_loss": -6.592830181121826, "global_step": 126204, "epoch": 3004} {"train_loss": -6.622922420501709, "global_step": 126205, "epoch": 3004} {"train_loss": -6.686854362487793, "global_step": 126206, "epoch": 3004} {"train_loss": -6.665119171142578, "global_step": 126207, "epoch": 3004} {"train_loss": -6.677633762359619, "global_step": 126208, "epoch": 3004} {"train_loss": -6.647220077968779, "global_step": 126209, "epoch": 3004, "val_loss": 77042.2265625} {"train_loss": -6.644082069396973, "global_step": 126210, "epoch": 3005} {"train_loss": -6.6537909507751465, "global_step": 126211, "epoch": 3005} {"train_loss": -6.672278881072998, "global_step": 126212, "epoch": 3005} {"train_loss": -6.637555122375488, "global_step": 126213, "epoch": 3005} {"train_loss": -6.660387992858887, "global_step": 126214, "epoch": 3005} {"train_loss": -6.621062278747559, "global_step": 126215, "epoch": 3005} {"train_loss": -6.618190288543701, "global_step": 126216, "epoch": 3005} {"train_loss": -6.542179107666016, "global_step": 126217, "epoch": 3005} {"train_loss": -6.6262335777282715, "global_step": 126218, "epoch": 3005} {"train_loss": -6.580660820007324, "global_step": 126219, "epoch": 3005} {"train_loss": -6.649925231933594, "global_step": 126220, "epoch": 3005} {"train_loss": -6.6967573165893555, "global_step": 126221, "epoch": 3005} {"train_loss": -6.826796531677246, "global_step": 126222, "epoch": 3005} {"train_loss": -6.69776725769043, "global_step": 126223, "epoch": 3005} {"train_loss": -6.67195987701416, "global_step": 126224, "epoch": 3005} {"train_loss": -6.753098487854004, "global_step": 126225, "epoch": 3005} {"train_loss": -6.764993190765381, "global_step": 126226, "epoch": 3005} {"train_loss": -6.490017890930176, "global_step": 126227, "epoch": 3005} {"train_loss": -6.630063533782959, "global_step": 126228, "epoch": 3005} {"train_loss": -6.675267219543457, "global_step": 126229, "epoch": 3005} {"train_loss": -6.690387725830078, "global_step": 126230, "epoch": 3005} {"train_loss": -6.6990485191345215, "global_step": 126231, "epoch": 3005} {"train_loss": -6.716767311096191, "global_step": 126232, "epoch": 3005} {"train_loss": -6.626006126403809, "global_step": 126233, "epoch": 3005} {"train_loss": -6.662624359130859, "global_step": 126234, "epoch": 3005} {"train_loss": -6.5696563720703125, "global_step": 126235, "epoch": 3005} {"train_loss": -6.644482612609863, "global_step": 126236, "epoch": 3005} {"train_loss": -6.596430778503418, "global_step": 126237, "epoch": 3005} {"train_loss": -6.693900108337402, "global_step": 126238, "epoch": 3005} {"train_loss": -6.643545150756836, "global_step": 126239, "epoch": 3005} {"train_loss": -6.5570573806762695, "global_step": 126240, "epoch": 3005} {"train_loss": -6.631953239440918, "global_step": 126241, "epoch": 3005} {"train_loss": -6.579286098480225, "global_step": 126242, "epoch": 3005} {"train_loss": -6.608698844909668, "global_step": 126243, "epoch": 3005} {"train_loss": -6.56104850769043, "global_step": 126244, "epoch": 3005} {"train_loss": -6.585005760192871, "global_step": 126245, "epoch": 3005} {"train_loss": -6.5660295486450195, "global_step": 126246, "epoch": 3005} {"train_loss": -6.618985176086426, "global_step": 126247, "epoch": 3005} {"train_loss": -6.650501251220703, "global_step": 126248, "epoch": 3005} {"train_loss": -6.594904899597168, "global_step": 126249, "epoch": 3005} {"train_loss": -6.570509910583496, "global_step": 126250, "epoch": 3005} {"train_loss": -6.636496260052636, "global_step": 126251, "epoch": 3005, "val_loss": 77279.1875} {"train_loss": -6.721807956695557, "global_step": 126252, "epoch": 3006} {"train_loss": -6.543213367462158, "global_step": 126253, "epoch": 3006} {"train_loss": -6.632486343383789, "global_step": 126254, "epoch": 3006} {"train_loss": -6.572277069091797, "global_step": 126255, "epoch": 3006} {"train_loss": -6.702912330627441, "global_step": 126256, "epoch": 3006} {"train_loss": -6.625643730163574, "global_step": 126257, "epoch": 3006} {"train_loss": -6.689657211303711, "global_step": 126258, "epoch": 3006} {"train_loss": -6.68166971206665, "global_step": 126259, "epoch": 3006} {"train_loss": -6.785947799682617, "global_step": 126260, "epoch": 3006} {"train_loss": -6.612257957458496, "global_step": 126261, "epoch": 3006} {"train_loss": -6.739171504974365, "global_step": 126262, "epoch": 3006} {"train_loss": -6.650989532470703, "global_step": 126263, "epoch": 3006} {"train_loss": -6.682110786437988, "global_step": 126264, "epoch": 3006} {"train_loss": -6.711898326873779, "global_step": 126265, "epoch": 3006} {"train_loss": -6.675783157348633, "global_step": 126266, "epoch": 3006} {"train_loss": -6.673511505126953, "global_step": 126267, "epoch": 3006} {"train_loss": -6.673167705535889, "global_step": 126268, "epoch": 3006} {"train_loss": -6.506775856018066, "global_step": 126269, "epoch": 3006} {"train_loss": -6.706539630889893, "global_step": 126270, "epoch": 3006} {"train_loss": -6.582812309265137, "global_step": 126271, "epoch": 3006} {"train_loss": -6.636726379394531, "global_step": 126272, "epoch": 3006} {"train_loss": -6.632014274597168, "global_step": 126273, "epoch": 3006} {"train_loss": -6.794693470001221, "global_step": 126274, "epoch": 3006} {"train_loss": -6.615677833557129, "global_step": 126275, "epoch": 3006} {"train_loss": -6.738633155822754, "global_step": 126276, "epoch": 3006} {"train_loss": -6.63703727722168, "global_step": 126277, "epoch": 3006} {"train_loss": -6.8128743171691895, "global_step": 126278, "epoch": 3006} {"train_loss": -6.8394317626953125, "global_step": 126279, "epoch": 3006} {"train_loss": -6.664162635803223, "global_step": 126280, "epoch": 3006} {"train_loss": -6.706026077270508, "global_step": 126281, "epoch": 3006} {"train_loss": -6.577132225036621, "global_step": 126282, "epoch": 3006} {"train_loss": -6.628535270690918, "global_step": 126283, "epoch": 3006} {"train_loss": -6.68482780456543, "global_step": 126284, "epoch": 3006} {"train_loss": -6.721446990966797, "global_step": 126285, "epoch": 3006} {"train_loss": -6.638957977294922, "global_step": 126286, "epoch": 3006} {"train_loss": -6.589200973510742, "global_step": 126287, "epoch": 3006} {"train_loss": -6.747032165527344, "global_step": 126288, "epoch": 3006} {"train_loss": -6.669244766235352, "global_step": 126289, "epoch": 3006} {"train_loss": -6.687067985534668, "global_step": 126290, "epoch": 3006} {"train_loss": -6.764123439788818, "global_step": 126291, "epoch": 3006} {"train_loss": -6.652868270874023, "global_step": 126292, "epoch": 3006} {"train_loss": -6.675299213046119, "global_step": 126293, "epoch": 3006, "val_loss": 77277.7734375} {"train_loss": -6.628861427307129, "global_step": 126294, "epoch": 3007} {"train_loss": -6.645559310913086, "global_step": 126295, "epoch": 3007} {"train_loss": -6.579803943634033, "global_step": 126296, "epoch": 3007} {"train_loss": -6.614475727081299, "global_step": 126297, "epoch": 3007} {"train_loss": -6.597982406616211, "global_step": 126298, "epoch": 3007} {"train_loss": -6.6285481452941895, "global_step": 126299, "epoch": 3007} {"train_loss": -6.608377456665039, "global_step": 126300, "epoch": 3007} {"train_loss": -6.725114345550537, "global_step": 126301, "epoch": 3007} {"train_loss": -6.72804594039917, "global_step": 126302, "epoch": 3007} {"train_loss": -6.67415189743042, "global_step": 126303, "epoch": 3007} {"train_loss": -6.672713279724121, "global_step": 126304, "epoch": 3007} {"train_loss": -6.699827671051025, "global_step": 126305, "epoch": 3007} {"train_loss": -6.579746246337891, "global_step": 126306, "epoch": 3007} {"train_loss": -6.629116535186768, "global_step": 126307, "epoch": 3007} {"train_loss": -6.631202220916748, "global_step": 126308, "epoch": 3007} {"train_loss": -6.594985008239746, "global_step": 126309, "epoch": 3007} {"train_loss": -6.5919904708862305, "global_step": 126310, "epoch": 3007} {"train_loss": -6.750288963317871, "global_step": 126311, "epoch": 3007} {"train_loss": -6.624013423919678, "global_step": 126312, "epoch": 3007} {"train_loss": -6.641961097717285, "global_step": 126313, "epoch": 3007} {"train_loss": -6.737816333770752, "global_step": 126314, "epoch": 3007} {"train_loss": -6.458054065704346, "global_step": 126315, "epoch": 3007} {"train_loss": -6.533400058746338, "global_step": 126316, "epoch": 3007} {"train_loss": -6.747247695922852, "global_step": 126317, "epoch": 3007} {"train_loss": -6.554586410522461, "global_step": 126318, "epoch": 3007} {"train_loss": -6.727896690368652, "global_step": 126319, "epoch": 3007} {"train_loss": -6.593639373779297, "global_step": 126320, "epoch": 3007} {"train_loss": -6.595691680908203, "global_step": 126321, "epoch": 3007} {"train_loss": -6.54102897644043, "global_step": 126322, "epoch": 3007} {"train_loss": -6.615599155426025, "global_step": 126323, "epoch": 3007} {"train_loss": -6.642062664031982, "global_step": 126324, "epoch": 3007} {"train_loss": -6.604924201965332, "global_step": 126325, "epoch": 3007} {"train_loss": -6.6673784255981445, "global_step": 126326, "epoch": 3007} {"train_loss": -6.726608753204346, "global_step": 126327, "epoch": 3007} {"train_loss": -6.438131332397461, "global_step": 126328, "epoch": 3007} {"train_loss": -6.640995979309082, "global_step": 126329, "epoch": 3007} {"train_loss": -6.675454139709473, "global_step": 126330, "epoch": 3007} {"train_loss": -6.661554336547852, "global_step": 126331, "epoch": 3007} {"train_loss": -6.683002471923828, "global_step": 126332, "epoch": 3007} {"train_loss": -6.593326568603516, "global_step": 126333, "epoch": 3007} {"train_loss": -6.736347198486328, "global_step": 126334, "epoch": 3007} {"train_loss": -6.632481643131801, "global_step": 126335, "epoch": 3007, "val_loss": 77258.09375} {"train_loss": -6.631137847900391, "global_step": 126336, "epoch": 3008} {"train_loss": -6.6501851081848145, "global_step": 126337, "epoch": 3008} {"train_loss": -6.579985618591309, "global_step": 126338, "epoch": 3008} {"train_loss": -6.549543380737305, "global_step": 126339, "epoch": 3008} {"train_loss": -6.746720790863037, "global_step": 126340, "epoch": 3008} {"train_loss": -6.636020660400391, "global_step": 126341, "epoch": 3008} {"train_loss": -6.701667785644531, "global_step": 126342, "epoch": 3008} {"train_loss": -6.713032245635986, "global_step": 126343, "epoch": 3008} {"train_loss": -6.5528035163879395, "global_step": 126344, "epoch": 3008} {"train_loss": -6.7220258712768555, "global_step": 126345, "epoch": 3008} {"train_loss": -6.755268573760986, "global_step": 126346, "epoch": 3008} {"train_loss": -6.695061683654785, "global_step": 126347, "epoch": 3008} {"train_loss": -6.626436233520508, "global_step": 126348, "epoch": 3008} {"train_loss": -6.754764556884766, "global_step": 126349, "epoch": 3008} {"train_loss": -6.542671203613281, "global_step": 126350, "epoch": 3008} {"train_loss": -6.62681245803833, "global_step": 126351, "epoch": 3008} {"train_loss": -6.56154727935791, "global_step": 126352, "epoch": 3008} {"train_loss": -6.496358871459961, "global_step": 126353, "epoch": 3008} {"train_loss": -6.647618293762207, "global_step": 126354, "epoch": 3008} {"train_loss": -6.596657752990723, "global_step": 126355, "epoch": 3008} {"train_loss": -6.463067054748535, "global_step": 126356, "epoch": 3008} {"train_loss": -6.648708820343018, "global_step": 126357, "epoch": 3008} {"train_loss": -6.577134609222412, "global_step": 126358, "epoch": 3008} {"train_loss": -6.5075531005859375, "global_step": 126359, "epoch": 3008} {"train_loss": -6.698533535003662, "global_step": 126360, "epoch": 3008} {"train_loss": -6.474196434020996, "global_step": 126361, "epoch": 3008} {"train_loss": -6.665671348571777, "global_step": 126362, "epoch": 3008} {"train_loss": -6.568447113037109, "global_step": 126363, "epoch": 3008} {"train_loss": -6.662454605102539, "global_step": 126364, "epoch": 3008} {"train_loss": -6.554622173309326, "global_step": 126365, "epoch": 3008} {"train_loss": -6.595185279846191, "global_step": 126366, "epoch": 3008} {"train_loss": -6.715834617614746, "global_step": 126367, "epoch": 3008} {"train_loss": -6.53817081451416, "global_step": 126368, "epoch": 3008} {"train_loss": -6.570190906524658, "global_step": 126369, "epoch": 3008} {"train_loss": -6.503844261169434, "global_step": 126370, "epoch": 3008} {"train_loss": -6.622633934020996, "global_step": 126371, "epoch": 3008} {"train_loss": -6.6983256340026855, "global_step": 126372, "epoch": 3008} {"train_loss": -6.7191972732543945, "global_step": 126373, "epoch": 3008} {"train_loss": -6.666716575622559, "global_step": 126374, "epoch": 3008} {"train_loss": -6.647096633911133, "global_step": 126375, "epoch": 3008} {"train_loss": -6.612953186035156, "global_step": 126376, "epoch": 3008} {"train_loss": -6.620432808285668, "global_step": 126377, "epoch": 3008, "val_loss": 77310.671875} {"train_loss": -6.739157676696777, "global_step": 126378, "epoch": 3009} {"train_loss": -6.720575332641602, "global_step": 126379, "epoch": 3009} {"train_loss": -6.556329727172852, "global_step": 126380, "epoch": 3009} {"train_loss": -6.6006975173950195, "global_step": 126381, "epoch": 3009} {"train_loss": -6.722744941711426, "global_step": 126382, "epoch": 3009} {"train_loss": -6.535885334014893, "global_step": 126383, "epoch": 3009} {"train_loss": -6.57630729675293, "global_step": 126384, "epoch": 3009} {"train_loss": -6.657161712646484, "global_step": 126385, "epoch": 3009} {"train_loss": -6.599112510681152, "global_step": 126386, "epoch": 3009} {"train_loss": -6.709068298339844, "global_step": 126387, "epoch": 3009} {"train_loss": -6.618867874145508, "global_step": 126388, "epoch": 3009} {"train_loss": -6.707217216491699, "global_step": 126389, "epoch": 3009} {"train_loss": -6.614945411682129, "global_step": 126390, "epoch": 3009} {"train_loss": -6.532412528991699, "global_step": 126391, "epoch": 3009} {"train_loss": -6.72695255279541, "global_step": 126392, "epoch": 3009} {"train_loss": -6.581294536590576, "global_step": 126393, "epoch": 3009} {"train_loss": -6.704094886779785, "global_step": 126394, "epoch": 3009} {"train_loss": -6.593178749084473, "global_step": 126395, "epoch": 3009} {"train_loss": -6.624911308288574, "global_step": 126396, "epoch": 3009} {"train_loss": -6.653846263885498, "global_step": 126397, "epoch": 3009} {"train_loss": -6.506638526916504, "global_step": 126398, "epoch": 3009} {"train_loss": -6.56186056137085, "global_step": 126399, "epoch": 3009} {"train_loss": -6.556082725524902, "global_step": 126400, "epoch": 3009} {"train_loss": -6.58343505859375, "global_step": 126401, "epoch": 3009} {"train_loss": -6.565751075744629, "global_step": 126402, "epoch": 3009} {"train_loss": -6.447653770446777, "global_step": 126403, "epoch": 3009} {"train_loss": -6.693099021911621, "global_step": 126404, "epoch": 3009} {"train_loss": -6.563213348388672, "global_step": 126405, "epoch": 3009} {"train_loss": -6.594978332519531, "global_step": 126406, "epoch": 3009} {"train_loss": -6.595385551452637, "global_step": 126407, "epoch": 3009} {"train_loss": -6.691526889801025, "global_step": 126408, "epoch": 3009} {"train_loss": -6.564117431640625, "global_step": 126409, "epoch": 3009} {"train_loss": -6.563504219055176, "global_step": 126410, "epoch": 3009} {"train_loss": -6.629875183105469, "global_step": 126411, "epoch": 3009} {"train_loss": -6.492744445800781, "global_step": 126412, "epoch": 3009} {"train_loss": -6.576581954956055, "global_step": 126413, "epoch": 3009} {"train_loss": -6.685420513153076, "global_step": 126414, "epoch": 3009} {"train_loss": -6.594609260559082, "global_step": 126415, "epoch": 3009} {"train_loss": -6.645931243896484, "global_step": 126416, "epoch": 3009} {"train_loss": -6.614831447601318, "global_step": 126417, "epoch": 3009} {"train_loss": -6.598072528839111, "global_step": 126418, "epoch": 3009} {"train_loss": -6.612683477855864, "global_step": 126419, "epoch": 3009, "val_loss": 77144.125} {"train_loss": -6.569767951965332, "global_step": 126420, "epoch": 3010} {"train_loss": -6.589332103729248, "global_step": 126421, "epoch": 3010} {"train_loss": -6.521026134490967, "global_step": 126422, "epoch": 3010} {"train_loss": -6.565275192260742, "global_step": 126423, "epoch": 3010} {"train_loss": -6.592074871063232, "global_step": 126424, "epoch": 3010} {"train_loss": -6.608362674713135, "global_step": 126425, "epoch": 3010} {"train_loss": -6.618539810180664, "global_step": 126426, "epoch": 3010} {"train_loss": -6.697813034057617, "global_step": 126427, "epoch": 3010} {"train_loss": -6.539323806762695, "global_step": 126428, "epoch": 3010} {"train_loss": -6.6666717529296875, "global_step": 126429, "epoch": 3010} {"train_loss": -6.527881622314453, "global_step": 126430, "epoch": 3010} {"train_loss": -6.6488938331604, "global_step": 126431, "epoch": 3010} {"train_loss": -6.594335079193115, "global_step": 126432, "epoch": 3010} {"train_loss": -6.532629013061523, "global_step": 126433, "epoch": 3010} {"train_loss": -6.615544319152832, "global_step": 126434, "epoch": 3010} {"train_loss": -6.6102705001831055, "global_step": 126435, "epoch": 3010} {"train_loss": -6.464417457580566, "global_step": 126436, "epoch": 3010} {"train_loss": -6.719259262084961, "global_step": 126437, "epoch": 3010} {"train_loss": -6.676492214202881, "global_step": 126438, "epoch": 3010} {"train_loss": -6.545263290405273, "global_step": 126439, "epoch": 3010} {"train_loss": -6.586686611175537, "global_step": 126440, "epoch": 3010} {"train_loss": -6.641599655151367, "global_step": 126441, "epoch": 3010} {"train_loss": -6.576304912567139, "global_step": 126442, "epoch": 3010} {"train_loss": -6.543844699859619, "global_step": 126443, "epoch": 3010} {"train_loss": -6.581172943115234, "global_step": 126444, "epoch": 3010} {"train_loss": -6.523562431335449, "global_step": 126445, "epoch": 3010} {"train_loss": -6.662123680114746, "global_step": 126446, "epoch": 3010} {"train_loss": -6.5575456619262695, "global_step": 126447, "epoch": 3010} {"train_loss": -6.568986892700195, "global_step": 126448, "epoch": 3010} {"train_loss": -6.662721633911133, "global_step": 126449, "epoch": 3010} {"train_loss": -6.663087844848633, "global_step": 126450, "epoch": 3010} {"train_loss": -6.655139923095703, "global_step": 126451, "epoch": 3010} {"train_loss": -6.645275115966797, "global_step": 126452, "epoch": 3010} {"train_loss": -6.427901268005371, "global_step": 126453, "epoch": 3010} {"train_loss": -6.52845573425293, "global_step": 126454, "epoch": 3010} {"train_loss": -6.60610294342041, "global_step": 126455, "epoch": 3010} {"train_loss": -6.41913366317749, "global_step": 126456, "epoch": 3010} {"train_loss": -6.4424848556518555, "global_step": 126457, "epoch": 3010} {"train_loss": -6.462675094604492, "global_step": 126458, "epoch": 3010} {"train_loss": -6.5572638511657715, "global_step": 126459, "epoch": 3010} {"train_loss": -6.508514404296875, "global_step": 126460, "epoch": 3010} {"train_loss": -6.577476263046265, "global_step": 126461, "epoch": 3010, "val_loss": 77126.1875} {"train_loss": -6.576789855957031, "global_step": 126462, "epoch": 3011} {"train_loss": -6.497489929199219, "global_step": 126463, "epoch": 3011} {"train_loss": -6.456229209899902, "global_step": 126464, "epoch": 3011} {"train_loss": -6.535643577575684, "global_step": 126465, "epoch": 3011} {"train_loss": -6.5659499168396, "global_step": 126466, "epoch": 3011} {"train_loss": -6.567697525024414, "global_step": 126467, "epoch": 3011} {"train_loss": -6.621647834777832, "global_step": 126468, "epoch": 3011} {"train_loss": -6.575135231018066, "global_step": 126469, "epoch": 3011} {"train_loss": -6.580418586730957, "global_step": 126470, "epoch": 3011} {"train_loss": -6.592528820037842, "global_step": 126471, "epoch": 3011} {"train_loss": -6.5793962478637695, "global_step": 126472, "epoch": 3011} {"train_loss": -6.615327835083008, "global_step": 126473, "epoch": 3011} {"train_loss": -6.570509910583496, "global_step": 126474, "epoch": 3011} {"train_loss": -6.630942344665527, "global_step": 126475, "epoch": 3011} {"train_loss": -6.44103479385376, "global_step": 126476, "epoch": 3011} {"train_loss": -6.5586395263671875, "global_step": 126477, "epoch": 3011} {"train_loss": -6.732727527618408, "global_step": 126478, "epoch": 3011} {"train_loss": -6.660074710845947, "global_step": 126479, "epoch": 3011} {"train_loss": -6.59440803527832, "global_step": 126480, "epoch": 3011} {"train_loss": -6.652500629425049, "global_step": 126481, "epoch": 3011} {"train_loss": -6.784237861633301, "global_step": 126482, "epoch": 3011} {"train_loss": -6.698981761932373, "global_step": 126483, "epoch": 3011} {"train_loss": -6.620760917663574, "global_step": 126484, "epoch": 3011} {"train_loss": -6.708240985870361, "global_step": 126485, "epoch": 3011} {"train_loss": -6.718329429626465, "global_step": 126486, "epoch": 3011} {"train_loss": -6.604982376098633, "global_step": 126487, "epoch": 3011} {"train_loss": -6.714780330657959, "global_step": 126488, "epoch": 3011} {"train_loss": -6.6053876876831055, "global_step": 126489, "epoch": 3011} {"train_loss": -6.382923126220703, "global_step": 126490, "epoch": 3011} {"train_loss": -6.614691734313965, "global_step": 126491, "epoch": 3011} {"train_loss": -6.613581657409668, "global_step": 126492, "epoch": 3011} {"train_loss": -6.544013500213623, "global_step": 126493, "epoch": 3011} {"train_loss": -6.639247894287109, "global_step": 126494, "epoch": 3011} {"train_loss": -6.5905866622924805, "global_step": 126495, "epoch": 3011} {"train_loss": -6.637205123901367, "global_step": 126496, "epoch": 3011} {"train_loss": -6.5664472579956055, "global_step": 126497, "epoch": 3011} {"train_loss": -6.657168388366699, "global_step": 126498, "epoch": 3011} {"train_loss": -6.610726356506348, "global_step": 126499, "epoch": 3011} {"train_loss": -6.538328170776367, "global_step": 126500, "epoch": 3011} {"train_loss": -6.7287278175354, "global_step": 126501, "epoch": 3011} {"train_loss": -6.646205902099609, "global_step": 126502, "epoch": 3011} {"train_loss": -6.608185700007847, "global_step": 126503, "epoch": 3011, "val_loss": 77210.2734375} {"train_loss": -6.586545467376709, "global_step": 126504, "epoch": 3012} {"train_loss": -6.646831512451172, "global_step": 126505, "epoch": 3012} {"train_loss": -6.657477855682373, "global_step": 126506, "epoch": 3012} {"train_loss": -6.659706115722656, "global_step": 126507, "epoch": 3012} {"train_loss": -6.605563640594482, "global_step": 126508, "epoch": 3012} {"train_loss": -6.742210388183594, "global_step": 126509, "epoch": 3012} {"train_loss": -6.658247947692871, "global_step": 126510, "epoch": 3012} {"train_loss": -6.561988353729248, "global_step": 126511, "epoch": 3012} {"train_loss": -6.545587062835693, "global_step": 126512, "epoch": 3012} {"train_loss": -6.6939496994018555, "global_step": 126513, "epoch": 3012} {"train_loss": -6.654674530029297, "global_step": 126514, "epoch": 3012} {"train_loss": -6.651206970214844, "global_step": 126515, "epoch": 3012} {"train_loss": -6.657073974609375, "global_step": 126516, "epoch": 3012} {"train_loss": -6.744839191436768, "global_step": 126517, "epoch": 3012} {"train_loss": -6.5471110343933105, "global_step": 126518, "epoch": 3012} {"train_loss": -6.652305603027344, "global_step": 126519, "epoch": 3012} {"train_loss": -6.648497581481934, "global_step": 126520, "epoch": 3012} {"train_loss": -6.648211479187012, "global_step": 126521, "epoch": 3012} {"train_loss": -6.598564624786377, "global_step": 126522, "epoch": 3012} {"train_loss": -6.581835746765137, "global_step": 126523, "epoch": 3012} {"train_loss": -6.488766670227051, "global_step": 126524, "epoch": 3012} {"train_loss": -6.69754695892334, "global_step": 126525, "epoch": 3012} {"train_loss": -6.46541166305542, "global_step": 126526, "epoch": 3012} {"train_loss": -6.638116359710693, "global_step": 126527, "epoch": 3012} {"train_loss": -6.637930870056152, "global_step": 126528, "epoch": 3012} {"train_loss": -6.6215925216674805, "global_step": 126529, "epoch": 3012} {"train_loss": -6.481450080871582, "global_step": 126530, "epoch": 3012} {"train_loss": -6.632416725158691, "global_step": 126531, "epoch": 3012} {"train_loss": -6.6405792236328125, "global_step": 126532, "epoch": 3012} {"train_loss": -6.655790328979492, "global_step": 126533, "epoch": 3012} {"train_loss": -6.597114562988281, "global_step": 126534, "epoch": 3012} {"train_loss": -6.7376251220703125, "global_step": 126535, "epoch": 3012} {"train_loss": -6.630014896392822, "global_step": 126536, "epoch": 3012} {"train_loss": -6.58181095123291, "global_step": 126537, "epoch": 3012} {"train_loss": -6.702320098876953, "global_step": 126538, "epoch": 3012} {"train_loss": -6.736366271972656, "global_step": 126539, "epoch": 3012} {"train_loss": -6.718470096588135, "global_step": 126540, "epoch": 3012} {"train_loss": -6.556729316711426, "global_step": 126541, "epoch": 3012} {"train_loss": -6.712338447570801, "global_step": 126542, "epoch": 3012} {"train_loss": -6.6201677322387695, "global_step": 126543, "epoch": 3012} {"train_loss": -6.5594587326049805, "global_step": 126544, "epoch": 3012} {"train_loss": -6.633066892623901, "global_step": 126545, "epoch": 3012, "val_loss": 77285.609375} {"train_loss": -6.709890842437744, "global_step": 126546, "epoch": 3013} {"train_loss": -6.616765975952148, "global_step": 126547, "epoch": 3013} {"train_loss": -6.579520225524902, "global_step": 126548, "epoch": 3013} {"train_loss": -6.647027969360352, "global_step": 126549, "epoch": 3013} {"train_loss": -6.7426886558532715, "global_step": 126550, "epoch": 3013} {"train_loss": -6.652688026428223, "global_step": 126551, "epoch": 3013} {"train_loss": -6.548986911773682, "global_step": 126552, "epoch": 3013} {"train_loss": -6.597943305969238, "global_step": 126553, "epoch": 3013} {"train_loss": -6.689943313598633, "global_step": 126554, "epoch": 3013} {"train_loss": -6.599783420562744, "global_step": 126555, "epoch": 3013} {"train_loss": -6.598915100097656, "global_step": 126556, "epoch": 3013} {"train_loss": -6.651487350463867, "global_step": 126557, "epoch": 3013} {"train_loss": -6.581113815307617, "global_step": 126558, "epoch": 3013} {"train_loss": -6.691102027893066, "global_step": 126559, "epoch": 3013} {"train_loss": -6.582427024841309, "global_step": 126560, "epoch": 3013} {"train_loss": -6.553909778594971, "global_step": 126561, "epoch": 3013} {"train_loss": -6.692890644073486, "global_step": 126562, "epoch": 3013} {"train_loss": -6.593503475189209, "global_step": 126563, "epoch": 3013} {"train_loss": -6.74953556060791, "global_step": 126564, "epoch": 3013} {"train_loss": -6.588667869567871, "global_step": 126565, "epoch": 3013} {"train_loss": -6.511877059936523, "global_step": 126566, "epoch": 3013} {"train_loss": -6.690867900848389, "global_step": 126567, "epoch": 3013} {"train_loss": -6.552343368530273, "global_step": 126568, "epoch": 3013} {"train_loss": -6.703185081481934, "global_step": 126569, "epoch": 3013} {"train_loss": -6.644730091094971, "global_step": 126570, "epoch": 3013} {"train_loss": -6.485494613647461, "global_step": 126571, "epoch": 3013} {"train_loss": -6.562099456787109, "global_step": 126572, "epoch": 3013} {"train_loss": -6.738168716430664, "global_step": 126573, "epoch": 3013} {"train_loss": -6.6365647315979, "global_step": 126574, "epoch": 3013} {"train_loss": -6.6851301193237305, "global_step": 126575, "epoch": 3013} {"train_loss": -6.6761064529418945, "global_step": 126576, "epoch": 3013} {"train_loss": -6.661110877990723, "global_step": 126577, "epoch": 3013} {"train_loss": -6.728084564208984, "global_step": 126578, "epoch": 3013} {"train_loss": -6.6336517333984375, "global_step": 126579, "epoch": 3013} {"train_loss": -6.552365303039551, "global_step": 126580, "epoch": 3013} {"train_loss": -6.626971244812012, "global_step": 126581, "epoch": 3013} {"train_loss": -6.720763206481934, "global_step": 126582, "epoch": 3013} {"train_loss": -6.650434494018555, "global_step": 126583, "epoch": 3013} {"train_loss": -6.6195573806762695, "global_step": 126584, "epoch": 3013} {"train_loss": -6.731554985046387, "global_step": 126585, "epoch": 3013} {"train_loss": -6.6519951820373535, "global_step": 126586, "epoch": 3013} {"train_loss": -6.635943764731998, "global_step": 126587, "epoch": 3013, "val_loss": 77255.9921875} {"train_loss": -6.65191650390625, "global_step": 126588, "epoch": 3014} {"train_loss": -6.653895378112793, "global_step": 126589, "epoch": 3014} {"train_loss": -6.601083755493164, "global_step": 126590, "epoch": 3014} {"train_loss": -6.648831367492676, "global_step": 126591, "epoch": 3014} {"train_loss": -6.805444717407227, "global_step": 126592, "epoch": 3014} {"train_loss": -6.701643943786621, "global_step": 126593, "epoch": 3014} {"train_loss": -6.698680877685547, "global_step": 126594, "epoch": 3014} {"train_loss": -6.654577732086182, "global_step": 126595, "epoch": 3014} {"train_loss": -6.635229587554932, "global_step": 126596, "epoch": 3014} {"train_loss": -6.776472091674805, "global_step": 126597, "epoch": 3014} {"train_loss": -6.650918483734131, "global_step": 126598, "epoch": 3014} {"train_loss": -6.676824569702148, "global_step": 126599, "epoch": 3014} {"train_loss": -6.734835624694824, "global_step": 126600, "epoch": 3014} {"train_loss": -6.710650444030762, "global_step": 126601, "epoch": 3014} {"train_loss": -6.582071304321289, "global_step": 126602, "epoch": 3014} {"train_loss": -6.632906436920166, "global_step": 126603, "epoch": 3014} {"train_loss": -6.653412818908691, "global_step": 126604, "epoch": 3014} {"train_loss": -6.589649200439453, "global_step": 126605, "epoch": 3014} {"train_loss": -6.516843795776367, "global_step": 126606, "epoch": 3014} {"train_loss": -6.551370143890381, "global_step": 126607, "epoch": 3014} {"train_loss": -6.633974075317383, "global_step": 126608, "epoch": 3014} {"train_loss": -6.6865010261535645, "global_step": 126609, "epoch": 3014} {"train_loss": -6.74653434753418, "global_step": 126610, "epoch": 3014} {"train_loss": -6.621672630310059, "global_step": 126611, "epoch": 3014} {"train_loss": -6.5745744705200195, "global_step": 126612, "epoch": 3014} {"train_loss": -6.687568187713623, "global_step": 126613, "epoch": 3014} {"train_loss": -6.753330230712891, "global_step": 126614, "epoch": 3014} {"train_loss": -6.506292819976807, "global_step": 126615, "epoch": 3014} {"train_loss": -6.644930839538574, "global_step": 126616, "epoch": 3014} {"train_loss": -6.625635147094727, "global_step": 126617, "epoch": 3014} {"train_loss": -6.6710205078125, "global_step": 126618, "epoch": 3014} {"train_loss": -6.711180686950684, "global_step": 126619, "epoch": 3014} {"train_loss": -6.721132278442383, "global_step": 126620, "epoch": 3014} {"train_loss": -6.717026233673096, "global_step": 126621, "epoch": 3014} {"train_loss": -6.71246337890625, "global_step": 126622, "epoch": 3014} {"train_loss": -6.635750770568848, "global_step": 126623, "epoch": 3014} {"train_loss": -6.636483669281006, "global_step": 126624, "epoch": 3014} {"train_loss": -6.697975158691406, "global_step": 126625, "epoch": 3014} {"train_loss": -6.677394390106201, "global_step": 126626, "epoch": 3014} {"train_loss": -6.6777873039245605, "global_step": 126627, "epoch": 3014} {"train_loss": -6.703363418579102, "global_step": 126628, "epoch": 3014} {"train_loss": -6.658590169180007, "global_step": 126629, "epoch": 3014, "val_loss": 77426.9609375} {"train_loss": -6.635565757751465, "global_step": 126630, "epoch": 3015} {"train_loss": -6.671659469604492, "global_step": 126631, "epoch": 3015} {"train_loss": -6.620194435119629, "global_step": 126632, "epoch": 3015} {"train_loss": -6.65287446975708, "global_step": 126633, "epoch": 3015} {"train_loss": -6.647696495056152, "global_step": 126634, "epoch": 3015} {"train_loss": -6.659295558929443, "global_step": 126635, "epoch": 3015} {"train_loss": -6.580057144165039, "global_step": 126636, "epoch": 3015} {"train_loss": -6.769714832305908, "global_step": 126637, "epoch": 3015} {"train_loss": -6.581978797912598, "global_step": 126638, "epoch": 3015} {"train_loss": -6.593264102935791, "global_step": 126639, "epoch": 3015} {"train_loss": -6.688693046569824, "global_step": 126640, "epoch": 3015} {"train_loss": -6.622430324554443, "global_step": 126641, "epoch": 3015} {"train_loss": -6.662579536437988, "global_step": 126642, "epoch": 3015} {"train_loss": -6.689166069030762, "global_step": 126643, "epoch": 3015} {"train_loss": -6.621552467346191, "global_step": 126644, "epoch": 3015} {"train_loss": -6.631467819213867, "global_step": 126645, "epoch": 3015} {"train_loss": -6.506448268890381, "global_step": 126646, "epoch": 3015} {"train_loss": -6.563208103179932, "global_step": 126647, "epoch": 3015} {"train_loss": -6.810427665710449, "global_step": 126648, "epoch": 3015} {"train_loss": -6.549644470214844, "global_step": 126649, "epoch": 3015} {"train_loss": -6.571424961090088, "global_step": 126650, "epoch": 3015} {"train_loss": -6.614542007446289, "global_step": 126651, "epoch": 3015} {"train_loss": -6.603569984436035, "global_step": 126652, "epoch": 3015} {"train_loss": -6.660307884216309, "global_step": 126653, "epoch": 3015} {"train_loss": -6.6451921463012695, "global_step": 126654, "epoch": 3015} {"train_loss": -6.559995174407959, "global_step": 126655, "epoch": 3015} {"train_loss": -6.571084499359131, "global_step": 126656, "epoch": 3015} {"train_loss": -6.5577006340026855, "global_step": 126657, "epoch": 3015} {"train_loss": -6.590912818908691, "global_step": 126658, "epoch": 3015} {"train_loss": -6.6562418937683105, "global_step": 126659, "epoch": 3015} {"train_loss": -6.478553771972656, "global_step": 126660, "epoch": 3015} {"train_loss": -6.492036819458008, "global_step": 126661, "epoch": 3015} {"train_loss": -6.6345415115356445, "global_step": 126662, "epoch": 3015} {"train_loss": -6.519896507263184, "global_step": 126663, "epoch": 3015} {"train_loss": -6.533993721008301, "global_step": 126664, "epoch": 3015} {"train_loss": -6.652644157409668, "global_step": 126665, "epoch": 3015} {"train_loss": -6.589873313903809, "global_step": 126666, "epoch": 3015} {"train_loss": -6.516818046569824, "global_step": 126667, "epoch": 3015} {"train_loss": -6.606261730194092, "global_step": 126668, "epoch": 3015} {"train_loss": -6.604244232177734, "global_step": 126669, "epoch": 3015} {"train_loss": -6.61586856842041, "global_step": 126670, "epoch": 3015} {"train_loss": -6.609093382245018, "global_step": 126671, "epoch": 3015, "val_loss": 77202.125} {"train_loss": -6.639944076538086, "global_step": 126672, "epoch": 3016} {"train_loss": -6.604249000549316, "global_step": 126673, "epoch": 3016} {"train_loss": -6.545354843139648, "global_step": 126674, "epoch": 3016} {"train_loss": -6.6436076164245605, "global_step": 126675, "epoch": 3016} {"train_loss": -6.6416015625, "global_step": 126676, "epoch": 3016} {"train_loss": -6.610564708709717, "global_step": 126677, "epoch": 3016} {"train_loss": -6.683918476104736, "global_step": 126678, "epoch": 3016} {"train_loss": -6.465780258178711, "global_step": 126679, "epoch": 3016} {"train_loss": -6.414180755615234, "global_step": 126680, "epoch": 3016} {"train_loss": -6.631752014160156, "global_step": 126681, "epoch": 3016} {"train_loss": -6.501100540161133, "global_step": 126682, "epoch": 3016} {"train_loss": -6.532070636749268, "global_step": 126683, "epoch": 3016} {"train_loss": -6.655821800231934, "global_step": 126684, "epoch": 3016} {"train_loss": -6.500351428985596, "global_step": 126685, "epoch": 3016} {"train_loss": -6.574244499206543, "global_step": 126686, "epoch": 3016} {"train_loss": -6.729498386383057, "global_step": 126687, "epoch": 3016} {"train_loss": -6.635339260101318, "global_step": 126688, "epoch": 3016} {"train_loss": -6.566895961761475, "global_step": 126689, "epoch": 3016} {"train_loss": -6.637247085571289, "global_step": 126690, "epoch": 3016} {"train_loss": -6.643224716186523, "global_step": 126691, "epoch": 3016} {"train_loss": -6.622581481933594, "global_step": 126692, "epoch": 3016} {"train_loss": -6.666650295257568, "global_step": 126693, "epoch": 3016} {"train_loss": -6.639529228210449, "global_step": 126694, "epoch": 3016} {"train_loss": -6.725646018981934, "global_step": 126695, "epoch": 3016} {"train_loss": -6.6075592041015625, "global_step": 126696, "epoch": 3016} {"train_loss": -6.642148017883301, "global_step": 126697, "epoch": 3016} {"train_loss": -6.7985124588012695, "global_step": 126698, "epoch": 3016} {"train_loss": -6.5616044998168945, "global_step": 126699, "epoch": 3016} {"train_loss": -6.518576622009277, "global_step": 126700, "epoch": 3016} {"train_loss": -6.706188201904297, "global_step": 126701, "epoch": 3016} {"train_loss": -6.593841552734375, "global_step": 126702, "epoch": 3016} {"train_loss": -6.528806686401367, "global_step": 126703, "epoch": 3016} {"train_loss": -6.5634765625, "global_step": 126704, "epoch": 3016} {"train_loss": -6.661963939666748, "global_step": 126705, "epoch": 3016} {"train_loss": -6.621609687805176, "global_step": 126706, "epoch": 3016} {"train_loss": -6.638172149658203, "global_step": 126707, "epoch": 3016} {"train_loss": -6.595885276794434, "global_step": 126708, "epoch": 3016} {"train_loss": -6.745196342468262, "global_step": 126709, "epoch": 3016} {"train_loss": -6.569454193115234, "global_step": 126710, "epoch": 3016} {"train_loss": -6.5572686195373535, "global_step": 126711, "epoch": 3016} {"train_loss": -6.656027793884277, "global_step": 126712, "epoch": 3016} {"train_loss": -6.609401793706985, "global_step": 126713, "epoch": 3016, "val_loss": 77657.5625} {"train_loss": -6.636809349060059, "global_step": 126714, "epoch": 3017} {"train_loss": -6.6856770515441895, "global_step": 126715, "epoch": 3017} {"train_loss": -6.672342300415039, "global_step": 126716, "epoch": 3017} {"train_loss": -6.559108257293701, "global_step": 126717, "epoch": 3017} {"train_loss": -6.708988189697266, "global_step": 126718, "epoch": 3017} {"train_loss": -6.547788619995117, "global_step": 126719, "epoch": 3017} {"train_loss": -6.56461763381958, "global_step": 126720, "epoch": 3017} {"train_loss": -6.5893635749816895, "global_step": 126721, "epoch": 3017} {"train_loss": -6.575385093688965, "global_step": 126722, "epoch": 3017} {"train_loss": -6.533321857452393, "global_step": 126723, "epoch": 3017} {"train_loss": -6.63690185546875, "global_step": 126724, "epoch": 3017} {"train_loss": -6.5035858154296875, "global_step": 126725, "epoch": 3017} {"train_loss": -6.637770652770996, "global_step": 126726, "epoch": 3017} {"train_loss": -6.533805847167969, "global_step": 126727, "epoch": 3017} {"train_loss": -6.598164081573486, "global_step": 126728, "epoch": 3017} {"train_loss": -6.5898590087890625, "global_step": 126729, "epoch": 3017} {"train_loss": -6.328436851501465, "global_step": 126730, "epoch": 3017} {"train_loss": -6.608367919921875, "global_step": 126731, "epoch": 3017} {"train_loss": -6.480962753295898, "global_step": 126732, "epoch": 3017} {"train_loss": -6.523828506469727, "global_step": 126733, "epoch": 3017} {"train_loss": -6.5271711349487305, "global_step": 126734, "epoch": 3017} {"train_loss": -6.552704811096191, "global_step": 126735, "epoch": 3017} {"train_loss": -6.600898265838623, "global_step": 126736, "epoch": 3017} {"train_loss": -6.5001325607299805, "global_step": 126737, "epoch": 3017} {"train_loss": -6.661455154418945, "global_step": 126738, "epoch": 3017} {"train_loss": -6.5417304039001465, "global_step": 126739, "epoch": 3017} {"train_loss": -6.552253723144531, "global_step": 126740, "epoch": 3017} {"train_loss": -6.516119003295898, "global_step": 126741, "epoch": 3017} {"train_loss": -6.625312328338623, "global_step": 126742, "epoch": 3017} {"train_loss": -6.597704887390137, "global_step": 126743, "epoch": 3017} {"train_loss": -6.606359004974365, "global_step": 126744, "epoch": 3017} {"train_loss": -6.6205902099609375, "global_step": 126745, "epoch": 3017} {"train_loss": -6.534034252166748, "global_step": 126746, "epoch": 3017} {"train_loss": -6.661884307861328, "global_step": 126747, "epoch": 3017} {"train_loss": -6.6150712966918945, "global_step": 126748, "epoch": 3017} {"train_loss": -6.5620436668396, "global_step": 126749, "epoch": 3017} {"train_loss": -6.533980369567871, "global_step": 126750, "epoch": 3017} {"train_loss": -6.699838638305664, "global_step": 126751, "epoch": 3017} {"train_loss": -6.735527992248535, "global_step": 126752, "epoch": 3017} {"train_loss": -6.606866836547852, "global_step": 126753, "epoch": 3017} {"train_loss": -6.711958408355713, "global_step": 126754, "epoch": 3017} {"train_loss": -6.5904688494546075, "global_step": 126755, "epoch": 3017, "val_loss": 77471.28125} {"train_loss": -6.621306419372559, "global_step": 126756, "epoch": 3018} {"train_loss": -6.584291458129883, "global_step": 126757, "epoch": 3018} {"train_loss": -6.653966903686523, "global_step": 126758, "epoch": 3018} {"train_loss": -6.58779239654541, "global_step": 126759, "epoch": 3018} {"train_loss": -6.6295952796936035, "global_step": 126760, "epoch": 3018} {"train_loss": -6.434427261352539, "global_step": 126761, "epoch": 3018} {"train_loss": -6.5562591552734375, "global_step": 126762, "epoch": 3018} {"train_loss": -6.440768718719482, "global_step": 126763, "epoch": 3018} {"train_loss": -6.630124568939209, "global_step": 126764, "epoch": 3018} {"train_loss": -6.4929399490356445, "global_step": 126765, "epoch": 3018} {"train_loss": -6.597029685974121, "global_step": 126766, "epoch": 3018} {"train_loss": -6.649662494659424, "global_step": 126767, "epoch": 3018} {"train_loss": -6.507091522216797, "global_step": 126768, "epoch": 3018} {"train_loss": -6.598370552062988, "global_step": 126769, "epoch": 3018} {"train_loss": -6.5555548667907715, "global_step": 126770, "epoch": 3018} {"train_loss": -6.515987873077393, "global_step": 126771, "epoch": 3018} {"train_loss": -6.675334930419922, "global_step": 126772, "epoch": 3018} {"train_loss": -6.575430870056152, "global_step": 126773, "epoch": 3018} {"train_loss": -6.58205509185791, "global_step": 126774, "epoch": 3018} {"train_loss": -6.671629905700684, "global_step": 126775, "epoch": 3018} {"train_loss": -6.668914794921875, "global_step": 126776, "epoch": 3018} {"train_loss": -6.702491283416748, "global_step": 126777, "epoch": 3018} {"train_loss": -6.659751892089844, "global_step": 126778, "epoch": 3018} {"train_loss": -6.640957832336426, "global_step": 126779, "epoch": 3018} {"train_loss": -6.741853713989258, "global_step": 126780, "epoch": 3018} {"train_loss": -6.637036323547363, "global_step": 126781, "epoch": 3018} {"train_loss": -6.599359512329102, "global_step": 126782, "epoch": 3018} {"train_loss": -6.6196370124816895, "global_step": 126783, "epoch": 3018} {"train_loss": -6.633587837219238, "global_step": 126784, "epoch": 3018} {"train_loss": -6.584237098693848, "global_step": 126785, "epoch": 3018} {"train_loss": -6.643991947174072, "global_step": 126786, "epoch": 3018} {"train_loss": -6.638075828552246, "global_step": 126787, "epoch": 3018} {"train_loss": -6.641031265258789, "global_step": 126788, "epoch": 3018} {"train_loss": -6.599052906036377, "global_step": 126789, "epoch": 3018} {"train_loss": -6.625518321990967, "global_step": 126790, "epoch": 3018} {"train_loss": -6.70328426361084, "global_step": 126791, "epoch": 3018} {"train_loss": -6.536131858825684, "global_step": 126792, "epoch": 3018} {"train_loss": -6.603109359741211, "global_step": 126793, "epoch": 3018} {"train_loss": -6.579450607299805, "global_step": 126794, "epoch": 3018} {"train_loss": -6.635033130645752, "global_step": 126795, "epoch": 3018} {"train_loss": -6.734262466430664, "global_step": 126796, "epoch": 3018} {"train_loss": -6.612161363874163, "global_step": 126797, "epoch": 3018, "val_loss": 77243.59375} {"train_loss": -6.597695350646973, "global_step": 126798, "epoch": 3019} {"train_loss": -6.7040205001831055, "global_step": 126799, "epoch": 3019} {"train_loss": -6.617847442626953, "global_step": 126800, "epoch": 3019} {"train_loss": -6.6945414543151855, "global_step": 126801, "epoch": 3019} {"train_loss": -6.729445457458496, "global_step": 126802, "epoch": 3019} {"train_loss": -6.672807693481445, "global_step": 126803, "epoch": 3019} {"train_loss": -6.645742416381836, "global_step": 126804, "epoch": 3019} {"train_loss": -6.719555854797363, "global_step": 126805, "epoch": 3019} {"train_loss": -6.693599224090576, "global_step": 126806, "epoch": 3019} {"train_loss": -6.695512294769287, "global_step": 126807, "epoch": 3019} {"train_loss": -6.761120796203613, "global_step": 126808, "epoch": 3019} {"train_loss": -6.691629409790039, "global_step": 126809, "epoch": 3019} {"train_loss": -6.675160884857178, "global_step": 126810, "epoch": 3019} {"train_loss": -6.630431652069092, "global_step": 126811, "epoch": 3019} {"train_loss": -6.59464693069458, "global_step": 126812, "epoch": 3019} {"train_loss": -6.633767127990723, "global_step": 126813, "epoch": 3019} {"train_loss": -6.739794731140137, "global_step": 126814, "epoch": 3019} {"train_loss": -6.692313194274902, "global_step": 126815, "epoch": 3019} {"train_loss": -6.617973327636719, "global_step": 126816, "epoch": 3019} {"train_loss": -6.568325519561768, "global_step": 126817, "epoch": 3019} {"train_loss": -6.65976619720459, "global_step": 126818, "epoch": 3019} {"train_loss": -6.6835527420043945, "global_step": 126819, "epoch": 3019} {"train_loss": -6.613676071166992, "global_step": 126820, "epoch": 3019} {"train_loss": -6.645486831665039, "global_step": 126821, "epoch": 3019} {"train_loss": -6.646105766296387, "global_step": 126822, "epoch": 3019} {"train_loss": -6.591920852661133, "global_step": 126823, "epoch": 3019} {"train_loss": -6.681059837341309, "global_step": 126824, "epoch": 3019} {"train_loss": -6.611687660217285, "global_step": 126825, "epoch": 3019} {"train_loss": -6.715494155883789, "global_step": 126826, "epoch": 3019} {"train_loss": -6.6416425704956055, "global_step": 126827, "epoch": 3019} {"train_loss": -6.649014472961426, "global_step": 126828, "epoch": 3019} {"train_loss": -6.766036033630371, "global_step": 126829, "epoch": 3019} {"train_loss": -6.606224060058594, "global_step": 126830, "epoch": 3019} {"train_loss": -6.662793159484863, "global_step": 126831, "epoch": 3019} {"train_loss": -6.618567943572998, "global_step": 126832, "epoch": 3019} {"train_loss": -6.618253707885742, "global_step": 126833, "epoch": 3019} {"train_loss": -6.626009941101074, "global_step": 126834, "epoch": 3019} {"train_loss": -6.626856327056885, "global_step": 126835, "epoch": 3019} {"train_loss": -6.741546630859375, "global_step": 126836, "epoch": 3019} {"train_loss": -6.566853046417236, "global_step": 126837, "epoch": 3019} {"train_loss": -6.681913375854492, "global_step": 126838, "epoch": 3019} {"train_loss": -6.658808356239682, "global_step": 126839, "epoch": 3019, "val_loss": 77421.3046875} {"train_loss": -6.649474143981934, "global_step": 126840, "epoch": 3020} {"train_loss": -6.671086311340332, "global_step": 126841, "epoch": 3020} {"train_loss": -6.6718268394470215, "global_step": 126842, "epoch": 3020} {"train_loss": -6.4945292472839355, "global_step": 126843, "epoch": 3020} {"train_loss": -6.657881259918213, "global_step": 126844, "epoch": 3020} {"train_loss": -6.677173614501953, "global_step": 126845, "epoch": 3020} {"train_loss": -6.5878400802612305, "global_step": 126846, "epoch": 3020} {"train_loss": -6.57620906829834, "global_step": 126847, "epoch": 3020} {"train_loss": -6.76505184173584, "global_step": 126848, "epoch": 3020} {"train_loss": -6.565645217895508, "global_step": 126849, "epoch": 3020} {"train_loss": -6.763918399810791, "global_step": 126850, "epoch": 3020} {"train_loss": -6.748085021972656, "global_step": 126851, "epoch": 3020} {"train_loss": -6.643606185913086, "global_step": 126852, "epoch": 3020} {"train_loss": -6.593545436859131, "global_step": 126853, "epoch": 3020} {"train_loss": -6.701851844787598, "global_step": 126854, "epoch": 3020} {"train_loss": -6.626220703125, "global_step": 126855, "epoch": 3020} {"train_loss": -6.504748344421387, "global_step": 126856, "epoch": 3020} {"train_loss": -6.667986869812012, "global_step": 126857, "epoch": 3020} {"train_loss": -6.577183723449707, "global_step": 126858, "epoch": 3020} {"train_loss": -6.6088080406188965, "global_step": 126859, "epoch": 3020} {"train_loss": -6.627745628356934, "global_step": 126860, "epoch": 3020} {"train_loss": -6.61341667175293, "global_step": 126861, "epoch": 3020} {"train_loss": -6.752131462097168, "global_step": 126862, "epoch": 3020} {"train_loss": -6.647335052490234, "global_step": 126863, "epoch": 3020} {"train_loss": -6.625756740570068, "global_step": 126864, "epoch": 3020} {"train_loss": -6.5897746086120605, "global_step": 126865, "epoch": 3020} {"train_loss": -6.607325553894043, "global_step": 126866, "epoch": 3020} {"train_loss": -6.592019557952881, "global_step": 126867, "epoch": 3020} {"train_loss": -6.608208656311035, "global_step": 126868, "epoch": 3020} {"train_loss": -6.774551868438721, "global_step": 126869, "epoch": 3020} {"train_loss": -6.574915885925293, "global_step": 126870, "epoch": 3020} {"train_loss": -6.509496212005615, "global_step": 126871, "epoch": 3020} {"train_loss": -6.58686637878418, "global_step": 126872, "epoch": 3020} {"train_loss": -6.614007949829102, "global_step": 126873, "epoch": 3020} {"train_loss": -6.605774402618408, "global_step": 126874, "epoch": 3020} {"train_loss": -6.580626010894775, "global_step": 126875, "epoch": 3020} {"train_loss": -6.6918416023254395, "global_step": 126876, "epoch": 3020} {"train_loss": -6.615581512451172, "global_step": 126877, "epoch": 3020} {"train_loss": -6.640969276428223, "global_step": 126878, "epoch": 3020} {"train_loss": -6.549430847167969, "global_step": 126879, "epoch": 3020} {"train_loss": -6.667692184448242, "global_step": 126880, "epoch": 3020} {"train_loss": -6.628830614544096, "global_step": 126881, "epoch": 3020, "val_loss": 77473.8828125} {"train_loss": -6.586926460266113, "global_step": 126882, "epoch": 3021} {"train_loss": -6.59848165512085, "global_step": 126883, "epoch": 3021} {"train_loss": -6.6335768699646, "global_step": 126884, "epoch": 3021} {"train_loss": -6.67623233795166, "global_step": 126885, "epoch": 3021} {"train_loss": -6.6396002769470215, "global_step": 126886, "epoch": 3021} {"train_loss": -6.590755939483643, "global_step": 126887, "epoch": 3021} {"train_loss": -6.6760783195495605, "global_step": 126888, "epoch": 3021} {"train_loss": -6.684957504272461, "global_step": 126889, "epoch": 3021} {"train_loss": -6.669168472290039, "global_step": 126890, "epoch": 3021} {"train_loss": -6.543099403381348, "global_step": 126891, "epoch": 3021} {"train_loss": -6.6454901695251465, "global_step": 126892, "epoch": 3021} {"train_loss": -6.631753921508789, "global_step": 126893, "epoch": 3021} {"train_loss": -6.57127046585083, "global_step": 126894, "epoch": 3021} {"train_loss": -6.641478538513184, "global_step": 126895, "epoch": 3021} {"train_loss": -6.698729991912842, "global_step": 126896, "epoch": 3021} {"train_loss": -6.629079341888428, "global_step": 126897, "epoch": 3021} {"train_loss": -6.688096046447754, "global_step": 126898, "epoch": 3021} {"train_loss": -6.758949279785156, "global_step": 126899, "epoch": 3021} {"train_loss": -6.5624799728393555, "global_step": 126900, "epoch": 3021} {"train_loss": -6.694809913635254, "global_step": 126901, "epoch": 3021} {"train_loss": -6.6341423988342285, "global_step": 126902, "epoch": 3021} {"train_loss": -6.779747009277344, "global_step": 126903, "epoch": 3021} {"train_loss": -6.609474182128906, "global_step": 126904, "epoch": 3021} {"train_loss": -6.7669596672058105, "global_step": 126905, "epoch": 3021} {"train_loss": -6.627307891845703, "global_step": 126906, "epoch": 3021} {"train_loss": -6.693806171417236, "global_step": 126907, "epoch": 3021} {"train_loss": -6.620857238769531, "global_step": 126908, "epoch": 3021} {"train_loss": -6.6651530265808105, "global_step": 126909, "epoch": 3021} {"train_loss": -6.752757549285889, "global_step": 126910, "epoch": 3021} {"train_loss": -6.674664497375488, "global_step": 126911, "epoch": 3021} {"train_loss": -6.790854454040527, "global_step": 126912, "epoch": 3021} {"train_loss": -6.626520156860352, "global_step": 126913, "epoch": 3021} {"train_loss": -6.718135356903076, "global_step": 126914, "epoch": 3021} {"train_loss": -6.719544887542725, "global_step": 126915, "epoch": 3021} {"train_loss": -6.769400119781494, "global_step": 126916, "epoch": 3021} {"train_loss": -6.714324951171875, "global_step": 126917, "epoch": 3021} {"train_loss": -6.79404354095459, "global_step": 126918, "epoch": 3021} {"train_loss": -6.687932968139648, "global_step": 126919, "epoch": 3021} {"train_loss": -6.741514205932617, "global_step": 126920, "epoch": 3021} {"train_loss": -6.684535980224609, "global_step": 126921, "epoch": 3021} {"train_loss": -6.669585704803467, "global_step": 126922, "epoch": 3021} {"train_loss": -6.67309528305417, "global_step": 126923, "epoch": 3021, "val_loss": 77387.5625} {"train_loss": -6.7602410316467285, "global_step": 126924, "epoch": 3022} {"train_loss": -6.754384994506836, "global_step": 126925, "epoch": 3022} {"train_loss": -6.79538631439209, "global_step": 126926, "epoch": 3022} {"train_loss": -6.827190399169922, "global_step": 126927, "epoch": 3022} {"train_loss": -6.717990875244141, "global_step": 126928, "epoch": 3022} {"train_loss": -6.672619819641113, "global_step": 126929, "epoch": 3022} {"train_loss": -6.703578948974609, "global_step": 126930, "epoch": 3022} {"train_loss": -6.606675624847412, "global_step": 126931, "epoch": 3022} {"train_loss": -6.736687660217285, "global_step": 126932, "epoch": 3022} {"train_loss": -6.657425403594971, "global_step": 126933, "epoch": 3022} {"train_loss": -6.670243263244629, "global_step": 126934, "epoch": 3022} {"train_loss": -6.598484992980957, "global_step": 126935, "epoch": 3022} {"train_loss": -6.6614155769348145, "global_step": 126936, "epoch": 3022} {"train_loss": -6.63305139541626, "global_step": 126937, "epoch": 3022} {"train_loss": -6.786840438842773, "global_step": 126938, "epoch": 3022} {"train_loss": -6.725679397583008, "global_step": 126939, "epoch": 3022} {"train_loss": -6.6341705322265625, "global_step": 126940, "epoch": 3022} {"train_loss": -6.626708984375, "global_step": 126941, "epoch": 3022} {"train_loss": -6.616499423980713, "global_step": 126942, "epoch": 3022} {"train_loss": -6.652774810791016, "global_step": 126943, "epoch": 3022} {"train_loss": -6.576023101806641, "global_step": 126944, "epoch": 3022} {"train_loss": -6.671041488647461, "global_step": 126945, "epoch": 3022} {"train_loss": -6.5714921951293945, "global_step": 126946, "epoch": 3022} {"train_loss": -6.676085948944092, "global_step": 126947, "epoch": 3022} {"train_loss": -6.580998420715332, "global_step": 126948, "epoch": 3022} {"train_loss": -6.545804023742676, "global_step": 126949, "epoch": 3022} {"train_loss": -6.576390266418457, "global_step": 126950, "epoch": 3022} {"train_loss": -6.730961799621582, "global_step": 126951, "epoch": 3022} {"train_loss": -6.497919082641602, "global_step": 126952, "epoch": 3022} {"train_loss": -6.59787654876709, "global_step": 126953, "epoch": 3022} {"train_loss": -6.558163642883301, "global_step": 126954, "epoch": 3022} {"train_loss": -6.634398460388184, "global_step": 126955, "epoch": 3022} {"train_loss": -6.540490627288818, "global_step": 126956, "epoch": 3022} {"train_loss": -6.526615619659424, "global_step": 126957, "epoch": 3022} {"train_loss": -6.639040946960449, "global_step": 126958, "epoch": 3022} {"train_loss": -6.654894828796387, "global_step": 126959, "epoch": 3022} {"train_loss": -6.607455730438232, "global_step": 126960, "epoch": 3022} {"train_loss": -6.715482711791992, "global_step": 126961, "epoch": 3022} {"train_loss": -6.682003974914551, "global_step": 126962, "epoch": 3022} {"train_loss": -6.543959617614746, "global_step": 126963, "epoch": 3022} {"train_loss": -6.517273902893066, "global_step": 126964, "epoch": 3022} {"train_loss": -6.647050414766584, "global_step": 126965, "epoch": 3022, "val_loss": 77212.0234375} {"train_loss": -6.4506072998046875, "global_step": 126966, "epoch": 3023} {"train_loss": -6.615473747253418, "global_step": 126967, "epoch": 3023} {"train_loss": -6.533185958862305, "global_step": 126968, "epoch": 3023} {"train_loss": -6.680720329284668, "global_step": 126969, "epoch": 3023} {"train_loss": -6.718402862548828, "global_step": 126970, "epoch": 3023} {"train_loss": -6.651649475097656, "global_step": 126971, "epoch": 3023} {"train_loss": -6.5583882331848145, "global_step": 126972, "epoch": 3023} {"train_loss": -6.704925537109375, "global_step": 126973, "epoch": 3023} {"train_loss": -6.6565093994140625, "global_step": 126974, "epoch": 3023} {"train_loss": -6.534688949584961, "global_step": 126975, "epoch": 3023} {"train_loss": -6.587008953094482, "global_step": 126976, "epoch": 3023} {"train_loss": -6.517861843109131, "global_step": 126977, "epoch": 3023} {"train_loss": -6.620589733123779, "global_step": 126978, "epoch": 3023} {"train_loss": -6.6033711433410645, "global_step": 126979, "epoch": 3023} {"train_loss": -6.564939498901367, "global_step": 126980, "epoch": 3023} {"train_loss": -6.643150806427002, "global_step": 126981, "epoch": 3023} {"train_loss": -6.712564945220947, "global_step": 126982, "epoch": 3023} {"train_loss": -6.537103652954102, "global_step": 126983, "epoch": 3023} {"train_loss": -6.586567401885986, "global_step": 126984, "epoch": 3023} {"train_loss": -6.726013660430908, "global_step": 126985, "epoch": 3023} {"train_loss": -6.570862770080566, "global_step": 126986, "epoch": 3023} {"train_loss": -6.685716152191162, "global_step": 126987, "epoch": 3023} {"train_loss": -6.5405168533325195, "global_step": 126988, "epoch": 3023} {"train_loss": -6.615091323852539, "global_step": 126989, "epoch": 3023} {"train_loss": -6.5631890296936035, "global_step": 126990, "epoch": 3023} {"train_loss": -6.645077228546143, "global_step": 126991, "epoch": 3023} {"train_loss": -6.7258172035217285, "global_step": 126992, "epoch": 3023} {"train_loss": -6.6565375328063965, "global_step": 126993, "epoch": 3023} {"train_loss": -6.496546268463135, "global_step": 126994, "epoch": 3023} {"train_loss": -6.703190803527832, "global_step": 126995, "epoch": 3023} {"train_loss": -6.647942066192627, "global_step": 126996, "epoch": 3023} {"train_loss": -6.599020957946777, "global_step": 126997, "epoch": 3023} {"train_loss": -6.611624717712402, "global_step": 126998, "epoch": 3023} {"train_loss": -6.64341402053833, "global_step": 126999, "epoch": 3023} {"train_loss": -6.475762844085693, "global_step": 127000, "epoch": 3023} {"train_loss": -6.570446014404297, "global_step": 127001, "epoch": 3023} {"train_loss": -6.67249059677124, "global_step": 127002, "epoch": 3023} {"train_loss": -6.57289981842041, "global_step": 127003, "epoch": 3023} {"train_loss": -6.607738971710205, "global_step": 127004, "epoch": 3023} {"train_loss": -6.592446804046631, "global_step": 127005, "epoch": 3023} {"train_loss": -6.587213516235352, "global_step": 127006, "epoch": 3023} {"train_loss": -6.609067598978679, "global_step": 127007, "epoch": 3023, "val_loss": 77273.8125} {"train_loss": -6.670459747314453, "global_step": 127008, "epoch": 3024} {"train_loss": -6.599261283874512, "global_step": 127009, "epoch": 3024} {"train_loss": -6.4793171882629395, "global_step": 127010, "epoch": 3024} {"train_loss": -6.659641265869141, "global_step": 127011, "epoch": 3024} {"train_loss": -6.642714500427246, "global_step": 127012, "epoch": 3024} {"train_loss": -6.62905740737915, "global_step": 127013, "epoch": 3024} {"train_loss": -6.767214775085449, "global_step": 127014, "epoch": 3024} {"train_loss": -6.556026458740234, "global_step": 127015, "epoch": 3024} {"train_loss": -6.638391494750977, "global_step": 127016, "epoch": 3024} {"train_loss": -6.589216709136963, "global_step": 127017, "epoch": 3024} {"train_loss": -6.621140480041504, "global_step": 127018, "epoch": 3024} {"train_loss": -6.540312767028809, "global_step": 127019, "epoch": 3024} {"train_loss": -6.616450786590576, "global_step": 127020, "epoch": 3024} {"train_loss": -6.576900959014893, "global_step": 127021, "epoch": 3024} {"train_loss": -6.779060363769531, "global_step": 127022, "epoch": 3024} {"train_loss": -6.592945575714111, "global_step": 127023, "epoch": 3024} {"train_loss": -6.617633819580078, "global_step": 127024, "epoch": 3024} {"train_loss": -6.675061225891113, "global_step": 127025, "epoch": 3024} {"train_loss": -6.761786460876465, "global_step": 127026, "epoch": 3024} {"train_loss": -6.64805269241333, "global_step": 127027, "epoch": 3024} {"train_loss": -6.559566974639893, "global_step": 127028, "epoch": 3024} {"train_loss": -6.70588493347168, "global_step": 127029, "epoch": 3024} {"train_loss": -6.597063064575195, "global_step": 127030, "epoch": 3024} {"train_loss": -6.794899940490723, "global_step": 127031, "epoch": 3024} {"train_loss": -6.639540195465088, "global_step": 127032, "epoch": 3024} {"train_loss": -6.634812355041504, "global_step": 127033, "epoch": 3024} {"train_loss": -6.670210838317871, "global_step": 127034, "epoch": 3024} {"train_loss": -6.612648963928223, "global_step": 127035, "epoch": 3024} {"train_loss": -6.63890266418457, "global_step": 127036, "epoch": 3024} {"train_loss": -6.571897506713867, "global_step": 127037, "epoch": 3024} {"train_loss": -6.560558795928955, "global_step": 127038, "epoch": 3024} {"train_loss": -6.560606479644775, "global_step": 127039, "epoch": 3024} {"train_loss": -6.66894006729126, "global_step": 127040, "epoch": 3024} {"train_loss": -6.570038318634033, "global_step": 127041, "epoch": 3024} {"train_loss": -6.570921897888184, "global_step": 127042, "epoch": 3024} {"train_loss": -6.655890941619873, "global_step": 127043, "epoch": 3024} {"train_loss": -6.658172607421875, "global_step": 127044, "epoch": 3024} {"train_loss": -6.646850109100342, "global_step": 127045, "epoch": 3024} {"train_loss": -6.636325359344482, "global_step": 127046, "epoch": 3024} {"train_loss": -6.600489616394043, "global_step": 127047, "epoch": 3024} {"train_loss": -6.614493370056152, "global_step": 127048, "epoch": 3024} {"train_loss": -6.630521274748302, "global_step": 127049, "epoch": 3024, "val_loss": 77278.265625} {"train_loss": -6.672364234924316, "global_step": 127050, "epoch": 3025} {"train_loss": -6.54705810546875, "global_step": 127051, "epoch": 3025} {"train_loss": -6.631268501281738, "global_step": 127052, "epoch": 3025} {"train_loss": -6.712142467498779, "global_step": 127053, "epoch": 3025} {"train_loss": -6.5517168045043945, "global_step": 127054, "epoch": 3025} {"train_loss": -6.638498783111572, "global_step": 127055, "epoch": 3025} {"train_loss": -6.715497970581055, "global_step": 127056, "epoch": 3025} {"train_loss": -6.620940208435059, "global_step": 127057, "epoch": 3025} {"train_loss": -6.667489528656006, "global_step": 127058, "epoch": 3025} {"train_loss": -6.595148086547852, "global_step": 127059, "epoch": 3025} {"train_loss": -6.672858715057373, "global_step": 127060, "epoch": 3025} {"train_loss": -6.546906471252441, "global_step": 127061, "epoch": 3025} {"train_loss": -6.666701793670654, "global_step": 127062, "epoch": 3025} {"train_loss": -6.665719509124756, "global_step": 127063, "epoch": 3025} {"train_loss": -6.581114768981934, "global_step": 127064, "epoch": 3025} {"train_loss": -6.653316020965576, "global_step": 127065, "epoch": 3025} {"train_loss": -6.555515289306641, "global_step": 127066, "epoch": 3025} {"train_loss": -6.541764259338379, "global_step": 127067, "epoch": 3025} {"train_loss": -6.668755054473877, "global_step": 127068, "epoch": 3025} {"train_loss": -6.571907043457031, "global_step": 127069, "epoch": 3025} {"train_loss": -6.637378692626953, "global_step": 127070, "epoch": 3025} {"train_loss": -6.612732410430908, "global_step": 127071, "epoch": 3025} {"train_loss": -6.630340576171875, "global_step": 127072, "epoch": 3025} {"train_loss": -6.658463001251221, "global_step": 127073, "epoch": 3025} {"train_loss": -6.579660415649414, "global_step": 127074, "epoch": 3025} {"train_loss": -6.557040214538574, "global_step": 127075, "epoch": 3025} {"train_loss": -6.607463836669922, "global_step": 127076, "epoch": 3025} {"train_loss": -6.558273792266846, "global_step": 127077, "epoch": 3025} {"train_loss": -6.625473499298096, "global_step": 127078, "epoch": 3025} {"train_loss": -6.4930877685546875, "global_step": 127079, "epoch": 3025} {"train_loss": -6.626298904418945, "global_step": 127080, "epoch": 3025} {"train_loss": -6.695335388183594, "global_step": 127081, "epoch": 3025} {"train_loss": -6.5633625984191895, "global_step": 127082, "epoch": 3025} {"train_loss": -6.746024131774902, "global_step": 127083, "epoch": 3025} {"train_loss": -6.604345321655273, "global_step": 127084, "epoch": 3025} {"train_loss": -6.673328399658203, "global_step": 127085, "epoch": 3025} {"train_loss": -6.650921821594238, "global_step": 127086, "epoch": 3025} {"train_loss": -6.612722873687744, "global_step": 127087, "epoch": 3025} {"train_loss": -6.563974380493164, "global_step": 127088, "epoch": 3025} {"train_loss": -6.682657241821289, "global_step": 127089, "epoch": 3025} {"train_loss": -6.711149215698242, "global_step": 127090, "epoch": 3025} {"train_loss": -6.6245680423009965, "global_step": 127091, "epoch": 3025, "val_loss": 77506.7109375} {"train_loss": -6.609511375427246, "global_step": 127092, "epoch": 3026} {"train_loss": -6.738339424133301, "global_step": 127093, "epoch": 3026} {"train_loss": -6.669704914093018, "global_step": 127094, "epoch": 3026} {"train_loss": -6.661672592163086, "global_step": 127095, "epoch": 3026} {"train_loss": -6.531517028808594, "global_step": 127096, "epoch": 3026} {"train_loss": -6.6634674072265625, "global_step": 127097, "epoch": 3026} {"train_loss": -6.745828628540039, "global_step": 127098, "epoch": 3026} {"train_loss": -6.628057479858398, "global_step": 127099, "epoch": 3026} {"train_loss": -6.590360641479492, "global_step": 127100, "epoch": 3026} {"train_loss": -6.597475051879883, "global_step": 127101, "epoch": 3026} {"train_loss": -6.685182094573975, "global_step": 127102, "epoch": 3026} {"train_loss": -6.66569709777832, "global_step": 127103, "epoch": 3026} {"train_loss": -6.613397598266602, "global_step": 127104, "epoch": 3026} {"train_loss": -6.594035625457764, "global_step": 127105, "epoch": 3026} {"train_loss": -6.598050117492676, "global_step": 127106, "epoch": 3026} {"train_loss": -6.601235389709473, "global_step": 127107, "epoch": 3026} {"train_loss": -6.71021842956543, "global_step": 127108, "epoch": 3026} {"train_loss": -6.68905782699585, "global_step": 127109, "epoch": 3026} {"train_loss": -6.685415267944336, "global_step": 127110, "epoch": 3026} {"train_loss": -6.715360641479492, "global_step": 127111, "epoch": 3026} {"train_loss": -6.57037353515625, "global_step": 127112, "epoch": 3026} {"train_loss": -6.671005725860596, "global_step": 127113, "epoch": 3026} {"train_loss": -6.712517738342285, "global_step": 127114, "epoch": 3026} {"train_loss": -6.6385273933410645, "global_step": 127115, "epoch": 3026} {"train_loss": -6.592993259429932, "global_step": 127116, "epoch": 3026} {"train_loss": -6.753472328186035, "global_step": 127117, "epoch": 3026} {"train_loss": -6.342146396636963, "global_step": 127118, "epoch": 3026} {"train_loss": -6.548626899719238, "global_step": 127119, "epoch": 3026} {"train_loss": -6.548553466796875, "global_step": 127120, "epoch": 3026} {"train_loss": -6.536792278289795, "global_step": 127121, "epoch": 3026} {"train_loss": -6.615816116333008, "global_step": 127122, "epoch": 3026} {"train_loss": -6.598660469055176, "global_step": 127123, "epoch": 3026} {"train_loss": -6.526248455047607, "global_step": 127124, "epoch": 3026} {"train_loss": -6.584465980529785, "global_step": 127125, "epoch": 3026} {"train_loss": -6.534422397613525, "global_step": 127126, "epoch": 3026} {"train_loss": -6.627013683319092, "global_step": 127127, "epoch": 3026} {"train_loss": -6.479168891906738, "global_step": 127128, "epoch": 3026} {"train_loss": -6.492812633514404, "global_step": 127129, "epoch": 3026} {"train_loss": -6.5277509689331055, "global_step": 127130, "epoch": 3026} {"train_loss": -6.507678985595703, "global_step": 127131, "epoch": 3026} {"train_loss": -6.62819242477417, "global_step": 127132, "epoch": 3026} {"train_loss": -6.609119892120361, "global_step": 127133, "epoch": 3026, "val_loss": 77248.0078125} {"train_loss": -6.485937595367432, "global_step": 127134, "epoch": 3027} {"train_loss": -6.600234031677246, "global_step": 127135, "epoch": 3027} {"train_loss": -6.518345832824707, "global_step": 127136, "epoch": 3027} {"train_loss": -6.765148162841797, "global_step": 127137, "epoch": 3027} {"train_loss": -6.536125659942627, "global_step": 127138, "epoch": 3027} {"train_loss": -6.676470756530762, "global_step": 127139, "epoch": 3027} {"train_loss": -6.523504257202148, "global_step": 127140, "epoch": 3027} {"train_loss": -6.664524078369141, "global_step": 127141, "epoch": 3027} {"train_loss": -6.63459587097168, "global_step": 127142, "epoch": 3027} {"train_loss": -6.628899574279785, "global_step": 127143, "epoch": 3027} {"train_loss": -6.535993576049805, "global_step": 127144, "epoch": 3027} {"train_loss": -6.589139938354492, "global_step": 127145, "epoch": 3027} {"train_loss": -6.620137691497803, "global_step": 127146, "epoch": 3027} {"train_loss": -6.572937965393066, "global_step": 127147, "epoch": 3027} {"train_loss": -6.653783798217773, "global_step": 127148, "epoch": 3027} {"train_loss": -6.54378604888916, "global_step": 127149, "epoch": 3027} {"train_loss": -6.522024154663086, "global_step": 127150, "epoch": 3027} {"train_loss": -6.5970258712768555, "global_step": 127151, "epoch": 3027} {"train_loss": -6.518252849578857, "global_step": 127152, "epoch": 3027} {"train_loss": -6.590402603149414, "global_step": 127153, "epoch": 3027} {"train_loss": -6.512368202209473, "global_step": 127154, "epoch": 3027} {"train_loss": -6.6236982345581055, "global_step": 127155, "epoch": 3027} {"train_loss": -6.562656879425049, "global_step": 127156, "epoch": 3027} {"train_loss": -6.677959442138672, "global_step": 127157, "epoch": 3027} {"train_loss": -6.589210510253906, "global_step": 127158, "epoch": 3027} {"train_loss": -6.551783084869385, "global_step": 127159, "epoch": 3027} {"train_loss": -6.576778411865234, "global_step": 127160, "epoch": 3027} {"train_loss": -6.598893642425537, "global_step": 127161, "epoch": 3027} {"train_loss": -6.584903240203857, "global_step": 127162, "epoch": 3027} {"train_loss": -6.615012168884277, "global_step": 127163, "epoch": 3027} {"train_loss": -6.555939674377441, "global_step": 127164, "epoch": 3027} {"train_loss": -6.6761932373046875, "global_step": 127165, "epoch": 3027} {"train_loss": -6.638001441955566, "global_step": 127166, "epoch": 3027} {"train_loss": -6.613280773162842, "global_step": 127167, "epoch": 3027} {"train_loss": -6.6112165451049805, "global_step": 127168, "epoch": 3027} {"train_loss": -6.589459419250488, "global_step": 127169, "epoch": 3027} {"train_loss": -6.597813606262207, "global_step": 127170, "epoch": 3027} {"train_loss": -6.31357479095459, "global_step": 127171, "epoch": 3027} {"train_loss": -6.612183570861816, "global_step": 127172, "epoch": 3027} {"train_loss": -6.508893966674805, "global_step": 127173, "epoch": 3027} {"train_loss": -6.640880584716797, "global_step": 127174, "epoch": 3027} {"train_loss": -6.58646772021339, "global_step": 127175, "epoch": 3027, "val_loss": 77136.1640625} {"train_loss": -6.664235591888428, "global_step": 127176, "epoch": 3028} {"train_loss": -6.644541263580322, "global_step": 127177, "epoch": 3028} {"train_loss": -6.639972686767578, "global_step": 127178, "epoch": 3028} {"train_loss": -6.608432292938232, "global_step": 127179, "epoch": 3028} {"train_loss": -6.5304036140441895, "global_step": 127180, "epoch": 3028} {"train_loss": -6.70665168762207, "global_step": 127181, "epoch": 3028} {"train_loss": -6.699339389801025, "global_step": 127182, "epoch": 3028} {"train_loss": -6.719015598297119, "global_step": 127183, "epoch": 3028} {"train_loss": -6.6536359786987305, "global_step": 127184, "epoch": 3028} {"train_loss": -6.695666790008545, "global_step": 127185, "epoch": 3028} {"train_loss": -6.710604667663574, "global_step": 127186, "epoch": 3028} {"train_loss": -6.618558406829834, "global_step": 127187, "epoch": 3028} {"train_loss": -6.589111804962158, "global_step": 127188, "epoch": 3028} {"train_loss": -6.6827497482299805, "global_step": 127189, "epoch": 3028} {"train_loss": -6.700483322143555, "global_step": 127190, "epoch": 3028} {"train_loss": -6.691851615905762, "global_step": 127191, "epoch": 3028} {"train_loss": -6.689692974090576, "global_step": 127192, "epoch": 3028} {"train_loss": -6.642413139343262, "global_step": 127193, "epoch": 3028} {"train_loss": -6.591994285583496, "global_step": 127194, "epoch": 3028} {"train_loss": -6.675262451171875, "global_step": 127195, "epoch": 3028} {"train_loss": -6.630565643310547, "global_step": 127196, "epoch": 3028} {"train_loss": -6.580854415893555, "global_step": 127197, "epoch": 3028} {"train_loss": -6.772222995758057, "global_step": 127198, "epoch": 3028} {"train_loss": -6.622977256774902, "global_step": 127199, "epoch": 3028} {"train_loss": -6.659374237060547, "global_step": 127200, "epoch": 3028} {"train_loss": -6.6259589195251465, "global_step": 127201, "epoch": 3028} {"train_loss": -6.718382358551025, "global_step": 127202, "epoch": 3028} {"train_loss": -6.656825065612793, "global_step": 127203, "epoch": 3028} {"train_loss": -6.7415618896484375, "global_step": 127204, "epoch": 3028} {"train_loss": -6.732907772064209, "global_step": 127205, "epoch": 3028} {"train_loss": -6.665547847747803, "global_step": 127206, "epoch": 3028} {"train_loss": -6.675722122192383, "global_step": 127207, "epoch": 3028} {"train_loss": -6.669745445251465, "global_step": 127208, "epoch": 3028} {"train_loss": -6.725987434387207, "global_step": 127209, "epoch": 3028} {"train_loss": -6.747486591339111, "global_step": 127210, "epoch": 3028} {"train_loss": -6.7003984451293945, "global_step": 127211, "epoch": 3028} {"train_loss": -6.677038192749023, "global_step": 127212, "epoch": 3028} {"train_loss": -6.683416843414307, "global_step": 127213, "epoch": 3028} {"train_loss": -6.526040077209473, "global_step": 127214, "epoch": 3028} {"train_loss": -6.685972690582275, "global_step": 127215, "epoch": 3028} {"train_loss": -6.698986053466797, "global_step": 127216, "epoch": 3028} {"train_loss": -6.668320360637846, "global_step": 127217, "epoch": 3028, "val_loss": 77257.6328125} {"train_loss": -6.704583168029785, "global_step": 127218, "epoch": 3029} {"train_loss": -6.7375288009643555, "global_step": 127219, "epoch": 3029} {"train_loss": -6.764937400817871, "global_step": 127220, "epoch": 3029} {"train_loss": -6.767410755157471, "global_step": 127221, "epoch": 3029} {"train_loss": -6.7478179931640625, "global_step": 127222, "epoch": 3029} {"train_loss": -6.670029640197754, "global_step": 127223, "epoch": 3029} {"train_loss": -6.657718181610107, "global_step": 127224, "epoch": 3029} {"train_loss": -6.618011951446533, "global_step": 127225, "epoch": 3029} {"train_loss": -6.601519584655762, "global_step": 127226, "epoch": 3029} {"train_loss": -6.669250011444092, "global_step": 127227, "epoch": 3029} {"train_loss": -6.716801643371582, "global_step": 127228, "epoch": 3029} {"train_loss": -6.750834941864014, "global_step": 127229, "epoch": 3029} {"train_loss": -6.64377498626709, "global_step": 127230, "epoch": 3029} {"train_loss": -6.571872234344482, "global_step": 127231, "epoch": 3029} {"train_loss": -6.660027503967285, "global_step": 127232, "epoch": 3029} {"train_loss": -6.683965682983398, "global_step": 127233, "epoch": 3029} {"train_loss": -6.6873321533203125, "global_step": 127234, "epoch": 3029} {"train_loss": -6.637042045593262, "global_step": 127235, "epoch": 3029} {"train_loss": -6.578625679016113, "global_step": 127236, "epoch": 3029} {"train_loss": -6.643810749053955, "global_step": 127237, "epoch": 3029} {"train_loss": -6.705749034881592, "global_step": 127238, "epoch": 3029} {"train_loss": -6.5790534019470215, "global_step": 127239, "epoch": 3029} {"train_loss": -6.613578796386719, "global_step": 127240, "epoch": 3029} {"train_loss": -6.658247947692871, "global_step": 127241, "epoch": 3029} {"train_loss": -6.588370323181152, "global_step": 127242, "epoch": 3029} {"train_loss": -6.602787017822266, "global_step": 127243, "epoch": 3029} {"train_loss": -6.669458389282227, "global_step": 127244, "epoch": 3029} {"train_loss": -6.504151344299316, "global_step": 127245, "epoch": 3029} {"train_loss": -6.539820671081543, "global_step": 127246, "epoch": 3029} {"train_loss": -6.667264461517334, "global_step": 127247, "epoch": 3029} {"train_loss": -6.589320659637451, "global_step": 127248, "epoch": 3029} {"train_loss": -6.558529853820801, "global_step": 127249, "epoch": 3029} {"train_loss": -6.54722785949707, "global_step": 127250, "epoch": 3029} {"train_loss": -6.666489601135254, "global_step": 127251, "epoch": 3029} {"train_loss": -6.777490615844727, "global_step": 127252, "epoch": 3029} {"train_loss": -6.575756072998047, "global_step": 127253, "epoch": 3029} {"train_loss": -6.599435806274414, "global_step": 127254, "epoch": 3029} {"train_loss": -6.574804782867432, "global_step": 127255, "epoch": 3029} {"train_loss": -6.590239524841309, "global_step": 127256, "epoch": 3029} {"train_loss": -6.618868827819824, "global_step": 127257, "epoch": 3029} {"train_loss": -6.653167724609375, "global_step": 127258, "epoch": 3029} {"train_loss": -6.643373455320086, "global_step": 127259, "epoch": 3029, "val_loss": 77378.7578125} {"train_loss": -6.6673407554626465, "global_step": 127260, "epoch": 3030} {"train_loss": -6.6209893226623535, "global_step": 127261, "epoch": 3030} {"train_loss": -6.533081531524658, "global_step": 127262, "epoch": 3030} {"train_loss": -6.66636323928833, "global_step": 127263, "epoch": 3030} {"train_loss": -6.638130187988281, "global_step": 127264, "epoch": 3030} {"train_loss": -6.709628105163574, "global_step": 127265, "epoch": 3030} {"train_loss": -6.571653366088867, "global_step": 127266, "epoch": 3030} {"train_loss": -6.619650363922119, "global_step": 127267, "epoch": 3030} {"train_loss": -6.600881576538086, "global_step": 127268, "epoch": 3030} {"train_loss": -6.4848785400390625, "global_step": 127269, "epoch": 3030} {"train_loss": -6.457996368408203, "global_step": 127270, "epoch": 3030} {"train_loss": -6.6452460289001465, "global_step": 127271, "epoch": 3030} {"train_loss": -6.515933990478516, "global_step": 127272, "epoch": 3030} {"train_loss": -6.574468612670898, "global_step": 127273, "epoch": 3030} {"train_loss": -6.545527935028076, "global_step": 127274, "epoch": 3030} {"train_loss": -6.59147834777832, "global_step": 127275, "epoch": 3030} {"train_loss": -6.5569257736206055, "global_step": 127276, "epoch": 3030} {"train_loss": -6.6619873046875, "global_step": 127277, "epoch": 3030} {"train_loss": -6.73416805267334, "global_step": 127278, "epoch": 3030} {"train_loss": -6.6221394538879395, "global_step": 127279, "epoch": 3030} {"train_loss": -6.634050369262695, "global_step": 127280, "epoch": 3030} {"train_loss": -6.6565093994140625, "global_step": 127281, "epoch": 3030} {"train_loss": -6.574387073516846, "global_step": 127282, "epoch": 3030} {"train_loss": -6.664730072021484, "global_step": 127283, "epoch": 3030} {"train_loss": -6.6200666427612305, "global_step": 127284, "epoch": 3030} {"train_loss": -6.5966691970825195, "global_step": 127285, "epoch": 3030} {"train_loss": -6.664952278137207, "global_step": 127286, "epoch": 3030} {"train_loss": -6.554547309875488, "global_step": 127287, "epoch": 3030} {"train_loss": -6.684183597564697, "global_step": 127288, "epoch": 3030} {"train_loss": -6.69651985168457, "global_step": 127289, "epoch": 3030} {"train_loss": -6.511846542358398, "global_step": 127290, "epoch": 3030} {"train_loss": -6.627776145935059, "global_step": 127291, "epoch": 3030} {"train_loss": -6.535830497741699, "global_step": 127292, "epoch": 3030} {"train_loss": -6.673610687255859, "global_step": 127293, "epoch": 3030} {"train_loss": -6.602593421936035, "global_step": 127294, "epoch": 3030} {"train_loss": -6.637877941131592, "global_step": 127295, "epoch": 3030} {"train_loss": -6.509814262390137, "global_step": 127296, "epoch": 3030} {"train_loss": -6.6811065673828125, "global_step": 127297, "epoch": 3030} {"train_loss": -6.680514335632324, "global_step": 127298, "epoch": 3030} {"train_loss": -6.59822940826416, "global_step": 127299, "epoch": 3030} {"train_loss": -6.602341651916504, "global_step": 127300, "epoch": 3030} {"train_loss": -6.610572599229359, "global_step": 127301, "epoch": 3030, "val_loss": 77242.6953125} {"train_loss": -6.711268424987793, "global_step": 127302, "epoch": 3031} {"train_loss": -6.656817436218262, "global_step": 127303, "epoch": 3031} {"train_loss": -6.520454406738281, "global_step": 127304, "epoch": 3031} {"train_loss": -6.639009475708008, "global_step": 127305, "epoch": 3031} {"train_loss": -6.6644110679626465, "global_step": 127306, "epoch": 3031} {"train_loss": -6.639874458312988, "global_step": 127307, "epoch": 3031} {"train_loss": -6.64845609664917, "global_step": 127308, "epoch": 3031} {"train_loss": -6.6796979904174805, "global_step": 127309, "epoch": 3031} {"train_loss": -6.583772659301758, "global_step": 127310, "epoch": 3031} {"train_loss": -6.660767555236816, "global_step": 127311, "epoch": 3031} {"train_loss": -6.667983055114746, "global_step": 127312, "epoch": 3031} {"train_loss": -6.608609676361084, "global_step": 127313, "epoch": 3031} {"train_loss": -6.627707004547119, "global_step": 127314, "epoch": 3031} {"train_loss": -6.655621528625488, "global_step": 127315, "epoch": 3031} {"train_loss": -6.707944869995117, "global_step": 127316, "epoch": 3031} {"train_loss": -6.760753631591797, "global_step": 127317, "epoch": 3031} {"train_loss": -6.678933620452881, "global_step": 127318, "epoch": 3031} {"train_loss": -6.6493425369262695, "global_step": 127319, "epoch": 3031} {"train_loss": -6.679614543914795, "global_step": 127320, "epoch": 3031} {"train_loss": -6.630533218383789, "global_step": 127321, "epoch": 3031} {"train_loss": -6.7028913497924805, "global_step": 127322, "epoch": 3031} {"train_loss": -6.634745121002197, "global_step": 127323, "epoch": 3031} {"train_loss": -6.678216934204102, "global_step": 127324, "epoch": 3031} {"train_loss": -6.579311370849609, "global_step": 127325, "epoch": 3031} {"train_loss": -6.665033340454102, "global_step": 127326, "epoch": 3031} {"train_loss": -6.718160629272461, "global_step": 127327, "epoch": 3031} {"train_loss": -6.576227188110352, "global_step": 127328, "epoch": 3031} {"train_loss": -6.57214879989624, "global_step": 127329, "epoch": 3031} {"train_loss": -6.677740097045898, "global_step": 127330, "epoch": 3031} {"train_loss": -6.655009746551514, "global_step": 127331, "epoch": 3031} {"train_loss": -6.606740951538086, "global_step": 127332, "epoch": 3031} {"train_loss": -6.734943389892578, "global_step": 127333, "epoch": 3031} {"train_loss": -6.613521575927734, "global_step": 127334, "epoch": 3031} {"train_loss": -6.729808807373047, "global_step": 127335, "epoch": 3031} {"train_loss": -6.670583248138428, "global_step": 127336, "epoch": 3031} {"train_loss": -6.494668960571289, "global_step": 127337, "epoch": 3031} {"train_loss": -6.680928707122803, "global_step": 127338, "epoch": 3031} {"train_loss": -6.574049472808838, "global_step": 127339, "epoch": 3031} {"train_loss": -6.670298099517822, "global_step": 127340, "epoch": 3031} {"train_loss": -6.714751243591309, "global_step": 127341, "epoch": 3031} {"train_loss": -6.694316864013672, "global_step": 127342, "epoch": 3031} {"train_loss": -6.652798005512783, "global_step": 127343, "epoch": 3031, "val_loss": 77342.9453125} {"train_loss": -6.673852920532227, "global_step": 127344, "epoch": 3032} {"train_loss": -6.599897861480713, "global_step": 127345, "epoch": 3032} {"train_loss": -6.71665620803833, "global_step": 127346, "epoch": 3032} {"train_loss": -6.562366962432861, "global_step": 127347, "epoch": 3032} {"train_loss": -6.640044212341309, "global_step": 127348, "epoch": 3032} {"train_loss": -6.664362907409668, "global_step": 127349, "epoch": 3032} {"train_loss": -6.610467433929443, "global_step": 127350, "epoch": 3032} {"train_loss": -6.656850814819336, "global_step": 127351, "epoch": 3032} {"train_loss": -6.700428009033203, "global_step": 127352, "epoch": 3032} {"train_loss": -6.6593475341796875, "global_step": 127353, "epoch": 3032} {"train_loss": -6.686341285705566, "global_step": 127354, "epoch": 3032} {"train_loss": -6.732688903808594, "global_step": 127355, "epoch": 3032} {"train_loss": -6.722878456115723, "global_step": 127356, "epoch": 3032} {"train_loss": -6.696626663208008, "global_step": 127357, "epoch": 3032} {"train_loss": -6.624647617340088, "global_step": 127358, "epoch": 3032} {"train_loss": -6.827300071716309, "global_step": 127359, "epoch": 3032} {"train_loss": -6.659660816192627, "global_step": 127360, "epoch": 3032} {"train_loss": -6.658379077911377, "global_step": 127361, "epoch": 3032} {"train_loss": -6.70511531829834, "global_step": 127362, "epoch": 3032} {"train_loss": -6.69576358795166, "global_step": 127363, "epoch": 3032} {"train_loss": -6.6175055503845215, "global_step": 127364, "epoch": 3032} {"train_loss": -6.613803386688232, "global_step": 127365, "epoch": 3032} {"train_loss": -6.608100414276123, "global_step": 127366, "epoch": 3032} {"train_loss": -6.741336822509766, "global_step": 127367, "epoch": 3032} {"train_loss": -6.696073532104492, "global_step": 127368, "epoch": 3032} {"train_loss": -6.605731010437012, "global_step": 127369, "epoch": 3032} {"train_loss": -6.604561805725098, "global_step": 127370, "epoch": 3032} {"train_loss": -6.774909496307373, "global_step": 127371, "epoch": 3032} {"train_loss": -6.5909576416015625, "global_step": 127372, "epoch": 3032} {"train_loss": -6.647329330444336, "global_step": 127373, "epoch": 3032} {"train_loss": -6.662424087524414, "global_step": 127374, "epoch": 3032} {"train_loss": -6.724804878234863, "global_step": 127375, "epoch": 3032} {"train_loss": -6.6566925048828125, "global_step": 127376, "epoch": 3032} {"train_loss": -6.5971574783325195, "global_step": 127377, "epoch": 3032} {"train_loss": -6.691756248474121, "global_step": 127378, "epoch": 3032} {"train_loss": -6.573118686676025, "global_step": 127379, "epoch": 3032} {"train_loss": -6.598281383514404, "global_step": 127380, "epoch": 3032} {"train_loss": -6.521059989929199, "global_step": 127381, "epoch": 3032} {"train_loss": -6.761481285095215, "global_step": 127382, "epoch": 3032} {"train_loss": -6.718832492828369, "global_step": 127383, "epoch": 3032} {"train_loss": -6.596363544464111, "global_step": 127384, "epoch": 3032} {"train_loss": -6.658815327144804, "global_step": 127385, "epoch": 3032, "val_loss": 77365.7890625} {"train_loss": -6.755598068237305, "global_step": 127386, "epoch": 3033} {"train_loss": -6.702855110168457, "global_step": 127387, "epoch": 3033} {"train_loss": -6.665226936340332, "global_step": 127388, "epoch": 3033} {"train_loss": -6.610652923583984, "global_step": 127389, "epoch": 3033} {"train_loss": -6.553558349609375, "global_step": 127390, "epoch": 3033} {"train_loss": -6.629958152770996, "global_step": 127391, "epoch": 3033} {"train_loss": -6.676553726196289, "global_step": 127392, "epoch": 3033} {"train_loss": -6.727239608764648, "global_step": 127393, "epoch": 3033} {"train_loss": -6.520806312561035, "global_step": 127394, "epoch": 3033} {"train_loss": -6.6151814460754395, "global_step": 127395, "epoch": 3033} {"train_loss": -6.730371475219727, "global_step": 127396, "epoch": 3033} {"train_loss": -6.632876396179199, "global_step": 127397, "epoch": 3033} {"train_loss": -6.67467737197876, "global_step": 127398, "epoch": 3033} {"train_loss": -6.649746894836426, "global_step": 127399, "epoch": 3033} {"train_loss": -6.748128890991211, "global_step": 127400, "epoch": 3033} {"train_loss": -6.716236591339111, "global_step": 127401, "epoch": 3033} {"train_loss": -6.718048572540283, "global_step": 127402, "epoch": 3033} {"train_loss": -6.690533638000488, "global_step": 127403, "epoch": 3033} {"train_loss": -6.695010662078857, "global_step": 127404, "epoch": 3033} {"train_loss": -6.712410926818848, "global_step": 127405, "epoch": 3033} {"train_loss": -6.683594703674316, "global_step": 127406, "epoch": 3033} {"train_loss": -6.476916313171387, "global_step": 127407, "epoch": 3033} {"train_loss": -6.669354438781738, "global_step": 127408, "epoch": 3033} {"train_loss": -6.534050941467285, "global_step": 127409, "epoch": 3033} {"train_loss": -6.59036111831665, "global_step": 127410, "epoch": 3033} {"train_loss": -6.6921467781066895, "global_step": 127411, "epoch": 3033} {"train_loss": -6.5886125564575195, "global_step": 127412, "epoch": 3033} {"train_loss": -6.5398688316345215, "global_step": 127413, "epoch": 3033} {"train_loss": -6.553511142730713, "global_step": 127414, "epoch": 3033} {"train_loss": -6.638046741485596, "global_step": 127415, "epoch": 3033} {"train_loss": -6.664364814758301, "global_step": 127416, "epoch": 3033} {"train_loss": -6.543468952178955, "global_step": 127417, "epoch": 3033} {"train_loss": -6.648947238922119, "global_step": 127418, "epoch": 3033} {"train_loss": -6.627190113067627, "global_step": 127419, "epoch": 3033} {"train_loss": -6.728203773498535, "global_step": 127420, "epoch": 3033} {"train_loss": -6.5897369384765625, "global_step": 127421, "epoch": 3033} {"train_loss": -6.604216575622559, "global_step": 127422, "epoch": 3033} {"train_loss": -6.707341194152832, "global_step": 127423, "epoch": 3033} {"train_loss": -6.475006580352783, "global_step": 127424, "epoch": 3033} {"train_loss": -6.611104965209961, "global_step": 127425, "epoch": 3033} {"train_loss": -6.555023193359375, "global_step": 127426, "epoch": 3033} {"train_loss": -6.6364799454098655, "global_step": 127427, "epoch": 3033, "val_loss": 77459.3125} {"train_loss": -6.666426658630371, "global_step": 127428, "epoch": 3034} {"train_loss": -6.691296577453613, "global_step": 127429, "epoch": 3034} {"train_loss": -6.71026086807251, "global_step": 127430, "epoch": 3034} {"train_loss": -6.682684898376465, "global_step": 127431, "epoch": 3034} {"train_loss": -6.525191307067871, "global_step": 127432, "epoch": 3034} {"train_loss": -6.7135467529296875, "global_step": 127433, "epoch": 3034} {"train_loss": -6.563266277313232, "global_step": 127434, "epoch": 3034} {"train_loss": -6.64658260345459, "global_step": 127435, "epoch": 3034} {"train_loss": -6.677783489227295, "global_step": 127436, "epoch": 3034} {"train_loss": -6.657540321350098, "global_step": 127437, "epoch": 3034} {"train_loss": -6.567166328430176, "global_step": 127438, "epoch": 3034} {"train_loss": -6.57451057434082, "global_step": 127439, "epoch": 3034} {"train_loss": -6.627870559692383, "global_step": 127440, "epoch": 3034} {"train_loss": -6.683836936950684, "global_step": 127441, "epoch": 3034} {"train_loss": -6.676074504852295, "global_step": 127442, "epoch": 3034} {"train_loss": -6.66480016708374, "global_step": 127443, "epoch": 3034} {"train_loss": -6.480964660644531, "global_step": 127444, "epoch": 3034} {"train_loss": -6.630285739898682, "global_step": 127445, "epoch": 3034} {"train_loss": -6.598930358886719, "global_step": 127446, "epoch": 3034} {"train_loss": -6.566634178161621, "global_step": 127447, "epoch": 3034} {"train_loss": -6.697394371032715, "global_step": 127448, "epoch": 3034} {"train_loss": -6.637398719787598, "global_step": 127449, "epoch": 3034} {"train_loss": -6.617359161376953, "global_step": 127450, "epoch": 3034} {"train_loss": -6.585860252380371, "global_step": 127451, "epoch": 3034} {"train_loss": -6.631338596343994, "global_step": 127452, "epoch": 3034} {"train_loss": -6.656354904174805, "global_step": 127453, "epoch": 3034} {"train_loss": -6.561297416687012, "global_step": 127454, "epoch": 3034} {"train_loss": -6.562056064605713, "global_step": 127455, "epoch": 3034} {"train_loss": -6.557386875152588, "global_step": 127456, "epoch": 3034} {"train_loss": -6.613159656524658, "global_step": 127457, "epoch": 3034} {"train_loss": -6.541373252868652, "global_step": 127458, "epoch": 3034} {"train_loss": -6.681886672973633, "global_step": 127459, "epoch": 3034} {"train_loss": -6.6306257247924805, "global_step": 127460, "epoch": 3034} {"train_loss": -6.586729526519775, "global_step": 127461, "epoch": 3034} {"train_loss": -6.582640647888184, "global_step": 127462, "epoch": 3034} {"train_loss": -6.695744037628174, "global_step": 127463, "epoch": 3034} {"train_loss": -6.620855331420898, "global_step": 127464, "epoch": 3034} {"train_loss": -6.636239051818848, "global_step": 127465, "epoch": 3034} {"train_loss": -6.640028953552246, "global_step": 127466, "epoch": 3034} {"train_loss": -6.632293701171875, "global_step": 127467, "epoch": 3034} {"train_loss": -6.559514045715332, "global_step": 127468, "epoch": 3034} {"train_loss": -6.62323834782555, "global_step": 127469, "epoch": 3034, "val_loss": 77432.28125} {"train_loss": -6.687784194946289, "global_step": 127470, "epoch": 3035} {"train_loss": -6.603302001953125, "global_step": 127471, "epoch": 3035} {"train_loss": -6.6320905685424805, "global_step": 127472, "epoch": 3035} {"train_loss": -6.71775484085083, "global_step": 127473, "epoch": 3035} {"train_loss": -6.671787261962891, "global_step": 127474, "epoch": 3035} {"train_loss": -6.648082733154297, "global_step": 127475, "epoch": 3035} {"train_loss": -6.518999099731445, "global_step": 127476, "epoch": 3035} {"train_loss": -6.5608134269714355, "global_step": 127477, "epoch": 3035} {"train_loss": -6.629002571105957, "global_step": 127478, "epoch": 3035} {"train_loss": -6.644252777099609, "global_step": 127479, "epoch": 3035} {"train_loss": -6.674263000488281, "global_step": 127480, "epoch": 3035} {"train_loss": -6.67744255065918, "global_step": 127481, "epoch": 3035} {"train_loss": -6.669044494628906, "global_step": 127482, "epoch": 3035} {"train_loss": -6.6778154373168945, "global_step": 127483, "epoch": 3035} {"train_loss": -6.663219451904297, "global_step": 127484, "epoch": 3035} {"train_loss": -6.793023109436035, "global_step": 127485, "epoch": 3035} {"train_loss": -6.6344804763793945, "global_step": 127486, "epoch": 3035} {"train_loss": -6.6811933517456055, "global_step": 127487, "epoch": 3035} {"train_loss": -6.653651237487793, "global_step": 127488, "epoch": 3035} {"train_loss": -6.751217365264893, "global_step": 127489, "epoch": 3035} {"train_loss": -6.693805694580078, "global_step": 127490, "epoch": 3035} {"train_loss": -6.677955627441406, "global_step": 127491, "epoch": 3035} {"train_loss": -6.6804351806640625, "global_step": 127492, "epoch": 3035} {"train_loss": -6.633012771606445, "global_step": 127493, "epoch": 3035} {"train_loss": -6.595860481262207, "global_step": 127494, "epoch": 3035} {"train_loss": -6.659519195556641, "global_step": 127495, "epoch": 3035} {"train_loss": -6.652651309967041, "global_step": 127496, "epoch": 3035} {"train_loss": -6.702345371246338, "global_step": 127497, "epoch": 3035} {"train_loss": -6.687051773071289, "global_step": 127498, "epoch": 3035} {"train_loss": -6.604734420776367, "global_step": 127499, "epoch": 3035} {"train_loss": -6.552452087402344, "global_step": 127500, "epoch": 3035} {"train_loss": -6.630437850952148, "global_step": 127501, "epoch": 3035} {"train_loss": -6.70698881149292, "global_step": 127502, "epoch": 3035} {"train_loss": -6.613472938537598, "global_step": 127503, "epoch": 3035} {"train_loss": -6.4410176277160645, "global_step": 127504, "epoch": 3035} {"train_loss": -6.65427827835083, "global_step": 127505, "epoch": 3035} {"train_loss": -6.566335201263428, "global_step": 127506, "epoch": 3035} {"train_loss": -6.5306596755981445, "global_step": 127507, "epoch": 3035} {"train_loss": -6.546146392822266, "global_step": 127508, "epoch": 3035} {"train_loss": -6.6311492919921875, "global_step": 127509, "epoch": 3035} {"train_loss": -6.710818290710449, "global_step": 127510, "epoch": 3035} {"train_loss": -6.640022323245094, "global_step": 127511, "epoch": 3035, "val_loss": 77583.5234375} {"train_loss": -6.490077018737793, "global_step": 127512, "epoch": 3036} {"train_loss": -6.659337997436523, "global_step": 127513, "epoch": 3036} {"train_loss": -6.643035888671875, "global_step": 127514, "epoch": 3036} {"train_loss": -6.561594486236572, "global_step": 127515, "epoch": 3036} {"train_loss": -6.756314277648926, "global_step": 127516, "epoch": 3036} {"train_loss": -6.545555114746094, "global_step": 127517, "epoch": 3036} {"train_loss": -6.48443078994751, "global_step": 127518, "epoch": 3036} {"train_loss": -6.747589588165283, "global_step": 127519, "epoch": 3036} {"train_loss": -6.623898983001709, "global_step": 127520, "epoch": 3036} {"train_loss": -6.523906707763672, "global_step": 127521, "epoch": 3036} {"train_loss": -6.608652114868164, "global_step": 127522, "epoch": 3036} {"train_loss": -6.589241027832031, "global_step": 127523, "epoch": 3036} {"train_loss": -6.598401069641113, "global_step": 127524, "epoch": 3036} {"train_loss": -6.694220542907715, "global_step": 127525, "epoch": 3036} {"train_loss": -6.686182975769043, "global_step": 127526, "epoch": 3036} {"train_loss": -6.6122212409973145, "global_step": 127527, "epoch": 3036} {"train_loss": -6.589510917663574, "global_step": 127528, "epoch": 3036} {"train_loss": -6.583117485046387, "global_step": 127529, "epoch": 3036} {"train_loss": -6.581764221191406, "global_step": 127530, "epoch": 3036} {"train_loss": -6.584551811218262, "global_step": 127531, "epoch": 3036} {"train_loss": -6.73037052154541, "global_step": 127532, "epoch": 3036} {"train_loss": -6.693641662597656, "global_step": 127533, "epoch": 3036} {"train_loss": -6.644341468811035, "global_step": 127534, "epoch": 3036} {"train_loss": -6.667944431304932, "global_step": 127535, "epoch": 3036} {"train_loss": -6.643876075744629, "global_step": 127536, "epoch": 3036} {"train_loss": -6.665006637573242, "global_step": 127537, "epoch": 3036} {"train_loss": -6.75801944732666, "global_step": 127538, "epoch": 3036} {"train_loss": -6.643983364105225, "global_step": 127539, "epoch": 3036} {"train_loss": -6.68090295791626, "global_step": 127540, "epoch": 3036} {"train_loss": -6.706296920776367, "global_step": 127541, "epoch": 3036} {"train_loss": -6.596954345703125, "global_step": 127542, "epoch": 3036} {"train_loss": -6.694197177886963, "global_step": 127543, "epoch": 3036} {"train_loss": -6.676394462585449, "global_step": 127544, "epoch": 3036} {"train_loss": -6.584471702575684, "global_step": 127545, "epoch": 3036} {"train_loss": -6.588506698608398, "global_step": 127546, "epoch": 3036} {"train_loss": -6.643013954162598, "global_step": 127547, "epoch": 3036} {"train_loss": -6.682158470153809, "global_step": 127548, "epoch": 3036} {"train_loss": -6.732421875, "global_step": 127549, "epoch": 3036} {"train_loss": -6.56581974029541, "global_step": 127550, "epoch": 3036} {"train_loss": -6.661236763000488, "global_step": 127551, "epoch": 3036} {"train_loss": -6.7386274337768555, "global_step": 127552, "epoch": 3036} {"train_loss": -6.638754980904715, "global_step": 127553, "epoch": 3036, "val_loss": 77438.1640625} {"train_loss": -6.683869361877441, "global_step": 127554, "epoch": 3037} {"train_loss": -6.692318916320801, "global_step": 127555, "epoch": 3037} {"train_loss": -6.681276321411133, "global_step": 127556, "epoch": 3037} {"train_loss": -6.781835079193115, "global_step": 127557, "epoch": 3037} {"train_loss": -6.680120468139648, "global_step": 127558, "epoch": 3037} {"train_loss": -6.66579532623291, "global_step": 127559, "epoch": 3037} {"train_loss": -6.568152904510498, "global_step": 127560, "epoch": 3037} {"train_loss": -6.6337127685546875, "global_step": 127561, "epoch": 3037} {"train_loss": -6.775869846343994, "global_step": 127562, "epoch": 3037} {"train_loss": -6.616758823394775, "global_step": 127563, "epoch": 3037} {"train_loss": -6.572860240936279, "global_step": 127564, "epoch": 3037} {"train_loss": -6.5515522956848145, "global_step": 127565, "epoch": 3037} {"train_loss": -6.6519622802734375, "global_step": 127566, "epoch": 3037} {"train_loss": -6.4531636238098145, "global_step": 127567, "epoch": 3037} {"train_loss": -6.618481159210205, "global_step": 127568, "epoch": 3037} {"train_loss": -6.630704402923584, "global_step": 127569, "epoch": 3037} {"train_loss": -6.462592124938965, "global_step": 127570, "epoch": 3037} {"train_loss": -6.581245422363281, "global_step": 127571, "epoch": 3037} {"train_loss": -6.462207794189453, "global_step": 127572, "epoch": 3037} {"train_loss": -6.671032905578613, "global_step": 127573, "epoch": 3037} {"train_loss": -6.6488237380981445, "global_step": 127574, "epoch": 3037} {"train_loss": -6.698660850524902, "global_step": 127575, "epoch": 3037} {"train_loss": -6.592581272125244, "global_step": 127576, "epoch": 3037} {"train_loss": -6.659790515899658, "global_step": 127577, "epoch": 3037} {"train_loss": -6.737927436828613, "global_step": 127578, "epoch": 3037} {"train_loss": -6.722070693969727, "global_step": 127579, "epoch": 3037} {"train_loss": -6.652800559997559, "global_step": 127580, "epoch": 3037} {"train_loss": -6.5505523681640625, "global_step": 127581, "epoch": 3037} {"train_loss": -6.7607645988464355, "global_step": 127582, "epoch": 3037} {"train_loss": -6.5445356369018555, "global_step": 127583, "epoch": 3037} {"train_loss": -6.652121543884277, "global_step": 127584, "epoch": 3037} {"train_loss": -6.5942840576171875, "global_step": 127585, "epoch": 3037} {"train_loss": -6.632962226867676, "global_step": 127586, "epoch": 3037} {"train_loss": -6.717347145080566, "global_step": 127587, "epoch": 3037} {"train_loss": -6.644712448120117, "global_step": 127588, "epoch": 3037} {"train_loss": -6.590287685394287, "global_step": 127589, "epoch": 3037} {"train_loss": -6.718518257141113, "global_step": 127590, "epoch": 3037} {"train_loss": -6.624166011810303, "global_step": 127591, "epoch": 3037} {"train_loss": -6.638232707977295, "global_step": 127592, "epoch": 3037} {"train_loss": -6.594879150390625, "global_step": 127593, "epoch": 3037} {"train_loss": -6.665177822113037, "global_step": 127594, "epoch": 3037} {"train_loss": -6.637694483711606, "global_step": 127595, "epoch": 3037, "val_loss": 77648.8203125} {"train_loss": -6.707132816314697, "global_step": 127596, "epoch": 3038} {"train_loss": -6.605282783508301, "global_step": 127597, "epoch": 3038} {"train_loss": -6.5721845626831055, "global_step": 127598, "epoch": 3038} {"train_loss": -6.7050909996032715, "global_step": 127599, "epoch": 3038} {"train_loss": -6.734850883483887, "global_step": 127600, "epoch": 3038} {"train_loss": -6.692032814025879, "global_step": 127601, "epoch": 3038} {"train_loss": -6.7739057540893555, "global_step": 127602, "epoch": 3038} {"train_loss": -6.6709465980529785, "global_step": 127603, "epoch": 3038} {"train_loss": -6.571654319763184, "global_step": 127604, "epoch": 3038} {"train_loss": -6.671235084533691, "global_step": 127605, "epoch": 3038} {"train_loss": -6.536100387573242, "global_step": 127606, "epoch": 3038} {"train_loss": -6.6018571853637695, "global_step": 127607, "epoch": 3038} {"train_loss": -6.744606018066406, "global_step": 127608, "epoch": 3038} {"train_loss": -6.66580057144165, "global_step": 127609, "epoch": 3038} {"train_loss": -6.543259620666504, "global_step": 127610, "epoch": 3038} {"train_loss": -6.621857166290283, "global_step": 127611, "epoch": 3038} {"train_loss": -6.591835975646973, "global_step": 127612, "epoch": 3038} {"train_loss": -6.572871685028076, "global_step": 127613, "epoch": 3038} {"train_loss": -6.641637325286865, "global_step": 127614, "epoch": 3038} {"train_loss": -6.677066326141357, "global_step": 127615, "epoch": 3038} {"train_loss": -6.694861888885498, "global_step": 127616, "epoch": 3038} {"train_loss": -6.634415626525879, "global_step": 127617, "epoch": 3038} {"train_loss": -6.637028694152832, "global_step": 127618, "epoch": 3038} {"train_loss": -6.653693199157715, "global_step": 127619, "epoch": 3038} {"train_loss": -6.663533687591553, "global_step": 127620, "epoch": 3038} {"train_loss": -6.661111354827881, "global_step": 127621, "epoch": 3038} {"train_loss": -6.566332817077637, "global_step": 127622, "epoch": 3038} {"train_loss": -6.650904178619385, "global_step": 127623, "epoch": 3038} {"train_loss": -6.727800369262695, "global_step": 127624, "epoch": 3038} {"train_loss": -6.739529609680176, "global_step": 127625, "epoch": 3038} {"train_loss": -6.507094383239746, "global_step": 127626, "epoch": 3038} {"train_loss": -6.681901454925537, "global_step": 127627, "epoch": 3038} {"train_loss": -6.769447326660156, "global_step": 127628, "epoch": 3038} {"train_loss": -6.583353519439697, "global_step": 127629, "epoch": 3038} {"train_loss": -6.618438243865967, "global_step": 127630, "epoch": 3038} {"train_loss": -6.649270534515381, "global_step": 127631, "epoch": 3038} {"train_loss": -6.570581436157227, "global_step": 127632, "epoch": 3038} {"train_loss": -6.617800712585449, "global_step": 127633, "epoch": 3038} {"train_loss": -6.635044097900391, "global_step": 127634, "epoch": 3038} {"train_loss": -6.678432464599609, "global_step": 127635, "epoch": 3038} {"train_loss": -6.697168350219727, "global_step": 127636, "epoch": 3038} {"train_loss": -6.646218333925519, "global_step": 127637, "epoch": 3038, "val_loss": 77299.3671875} {"train_loss": -6.621254920959473, "global_step": 127638, "epoch": 3039} {"train_loss": -6.602952003479004, "global_step": 127639, "epoch": 3039} {"train_loss": -6.657753944396973, "global_step": 127640, "epoch": 3039} {"train_loss": -6.587928295135498, "global_step": 127641, "epoch": 3039} {"train_loss": -6.647860527038574, "global_step": 127642, "epoch": 3039} {"train_loss": -6.648910999298096, "global_step": 127643, "epoch": 3039} {"train_loss": -6.686195373535156, "global_step": 127644, "epoch": 3039} {"train_loss": -6.742419242858887, "global_step": 127645, "epoch": 3039} {"train_loss": -6.67855167388916, "global_step": 127646, "epoch": 3039} {"train_loss": -6.674345970153809, "global_step": 127647, "epoch": 3039} {"train_loss": -6.5535993576049805, "global_step": 127648, "epoch": 3039} {"train_loss": -6.66448974609375, "global_step": 127649, "epoch": 3039} {"train_loss": -6.656799793243408, "global_step": 127650, "epoch": 3039} {"train_loss": -6.610833644866943, "global_step": 127651, "epoch": 3039} {"train_loss": -6.467113494873047, "global_step": 127652, "epoch": 3039} {"train_loss": -6.625454902648926, "global_step": 127653, "epoch": 3039} {"train_loss": -6.539842128753662, "global_step": 127654, "epoch": 3039} {"train_loss": -6.663406848907471, "global_step": 127655, "epoch": 3039} {"train_loss": -6.7002716064453125, "global_step": 127656, "epoch": 3039} {"train_loss": -6.715182304382324, "global_step": 127657, "epoch": 3039} {"train_loss": -6.614485740661621, "global_step": 127658, "epoch": 3039} {"train_loss": -6.7571611404418945, "global_step": 127659, "epoch": 3039} {"train_loss": -6.700031280517578, "global_step": 127660, "epoch": 3039} {"train_loss": -6.70233154296875, "global_step": 127661, "epoch": 3039} {"train_loss": -6.790696620941162, "global_step": 127662, "epoch": 3039} {"train_loss": -6.665760040283203, "global_step": 127663, "epoch": 3039} {"train_loss": -6.71416711807251, "global_step": 127664, "epoch": 3039} {"train_loss": -6.626054286956787, "global_step": 127665, "epoch": 3039} {"train_loss": -6.425531387329102, "global_step": 127666, "epoch": 3039} {"train_loss": -6.6395039558410645, "global_step": 127667, "epoch": 3039} {"train_loss": -6.614833831787109, "global_step": 127668, "epoch": 3039} {"train_loss": -6.375759124755859, "global_step": 127669, "epoch": 3039} {"train_loss": -6.633853435516357, "global_step": 127670, "epoch": 3039} {"train_loss": -6.407441139221191, "global_step": 127671, "epoch": 3039} {"train_loss": -6.588690280914307, "global_step": 127672, "epoch": 3039} {"train_loss": -6.55057430267334, "global_step": 127673, "epoch": 3039} {"train_loss": -6.526654243469238, "global_step": 127674, "epoch": 3039} {"train_loss": -6.727673053741455, "global_step": 127675, "epoch": 3039} {"train_loss": -6.587109565734863, "global_step": 127676, "epoch": 3039} {"train_loss": -6.6272783279418945, "global_step": 127677, "epoch": 3039} {"train_loss": -6.537629127502441, "global_step": 127678, "epoch": 3039} {"train_loss": -6.621047962279547, "global_step": 127679, "epoch": 3039, "val_loss": 77492.921875} {"train_loss": -6.649294853210449, "global_step": 127680, "epoch": 3040} {"train_loss": -6.613565444946289, "global_step": 127681, "epoch": 3040} {"train_loss": -6.702491760253906, "global_step": 127682, "epoch": 3040} {"train_loss": -6.699235916137695, "global_step": 127683, "epoch": 3040} {"train_loss": -6.517067909240723, "global_step": 127684, "epoch": 3040} {"train_loss": -6.6400651931762695, "global_step": 127685, "epoch": 3040} {"train_loss": -6.637813568115234, "global_step": 127686, "epoch": 3040} {"train_loss": -6.657381057739258, "global_step": 127687, "epoch": 3040} {"train_loss": -6.53607177734375, "global_step": 127688, "epoch": 3040} {"train_loss": -6.6970930099487305, "global_step": 127689, "epoch": 3040} {"train_loss": -6.65004301071167, "global_step": 127690, "epoch": 3040} {"train_loss": -6.633152961730957, "global_step": 127691, "epoch": 3040} {"train_loss": -6.692500114440918, "global_step": 127692, "epoch": 3040} {"train_loss": -6.580118179321289, "global_step": 127693, "epoch": 3040} {"train_loss": -6.5768351554870605, "global_step": 127694, "epoch": 3040} {"train_loss": -6.562009811401367, "global_step": 127695, "epoch": 3040} {"train_loss": -6.612733840942383, "global_step": 127696, "epoch": 3040} {"train_loss": -6.685919284820557, "global_step": 127697, "epoch": 3040} {"train_loss": -6.629293918609619, "global_step": 127698, "epoch": 3040} {"train_loss": -6.59049129486084, "global_step": 127699, "epoch": 3040} {"train_loss": -6.620394706726074, "global_step": 127700, "epoch": 3040} {"train_loss": -6.643803596496582, "global_step": 127701, "epoch": 3040} {"train_loss": -6.62924861907959, "global_step": 127702, "epoch": 3040} {"train_loss": -6.600774765014648, "global_step": 127703, "epoch": 3040} {"train_loss": -6.543322563171387, "global_step": 127704, "epoch": 3040} {"train_loss": -6.592587471008301, "global_step": 127705, "epoch": 3040} {"train_loss": -6.6493964195251465, "global_step": 127706, "epoch": 3040} {"train_loss": -6.689117431640625, "global_step": 127707, "epoch": 3040} {"train_loss": -6.6778459548950195, "global_step": 127708, "epoch": 3040} {"train_loss": -6.662120819091797, "global_step": 127709, "epoch": 3040} {"train_loss": -6.5719709396362305, "global_step": 127710, "epoch": 3040} {"train_loss": -6.654059886932373, "global_step": 127711, "epoch": 3040} {"train_loss": -6.604081630706787, "global_step": 127712, "epoch": 3040} {"train_loss": -6.497128009796143, "global_step": 127713, "epoch": 3040} {"train_loss": -6.675677299499512, "global_step": 127714, "epoch": 3040} {"train_loss": -6.719058036804199, "global_step": 127715, "epoch": 3040} {"train_loss": -6.737296104431152, "global_step": 127716, "epoch": 3040} {"train_loss": -6.668924331665039, "global_step": 127717, "epoch": 3040} {"train_loss": -6.62158203125, "global_step": 127718, "epoch": 3040} {"train_loss": -6.65188455581665, "global_step": 127719, "epoch": 3040} {"train_loss": -6.543988227844238, "global_step": 127720, "epoch": 3040} {"train_loss": -6.63123033160255, "global_step": 127721, "epoch": 3040, "val_loss": 77205.890625} {"train_loss": -6.580187797546387, "global_step": 127722, "epoch": 3041} {"train_loss": -6.623202800750732, "global_step": 127723, "epoch": 3041} {"train_loss": -6.750240325927734, "global_step": 127724, "epoch": 3041} {"train_loss": -6.653707981109619, "global_step": 127725, "epoch": 3041} {"train_loss": -6.712532997131348, "global_step": 127726, "epoch": 3041} {"train_loss": -6.695443153381348, "global_step": 127727, "epoch": 3041} {"train_loss": -6.6363701820373535, "global_step": 127728, "epoch": 3041} {"train_loss": -6.647006034851074, "global_step": 127729, "epoch": 3041} {"train_loss": -6.611694812774658, "global_step": 127730, "epoch": 3041} {"train_loss": -6.524228096008301, "global_step": 127731, "epoch": 3041} {"train_loss": -6.582884788513184, "global_step": 127732, "epoch": 3041} {"train_loss": -6.591764450073242, "global_step": 127733, "epoch": 3041} {"train_loss": -6.6473283767700195, "global_step": 127734, "epoch": 3041} {"train_loss": -6.682506561279297, "global_step": 127735, "epoch": 3041} {"train_loss": -6.6597185134887695, "global_step": 127736, "epoch": 3041} {"train_loss": -6.682229042053223, "global_step": 127737, "epoch": 3041} {"train_loss": -6.7450408935546875, "global_step": 127738, "epoch": 3041} {"train_loss": -6.633126258850098, "global_step": 127739, "epoch": 3041} {"train_loss": -6.677267551422119, "global_step": 127740, "epoch": 3041} {"train_loss": -6.756516456604004, "global_step": 127741, "epoch": 3041} {"train_loss": -6.780745506286621, "global_step": 127742, "epoch": 3041} {"train_loss": -6.687744140625, "global_step": 127743, "epoch": 3041} {"train_loss": -6.684340476989746, "global_step": 127744, "epoch": 3041} {"train_loss": -6.645151138305664, "global_step": 127745, "epoch": 3041} {"train_loss": -6.7222580909729, "global_step": 127746, "epoch": 3041} {"train_loss": -6.558040618896484, "global_step": 127747, "epoch": 3041} {"train_loss": -6.71441125869751, "global_step": 127748, "epoch": 3041} {"train_loss": -6.68348503112793, "global_step": 127749, "epoch": 3041} {"train_loss": -6.704320907592773, "global_step": 127750, "epoch": 3041} {"train_loss": -6.611168384552002, "global_step": 127751, "epoch": 3041} {"train_loss": -6.6472320556640625, "global_step": 127752, "epoch": 3041} {"train_loss": -6.76702880859375, "global_step": 127753, "epoch": 3041} {"train_loss": -6.580257415771484, "global_step": 127754, "epoch": 3041} {"train_loss": -6.5860595703125, "global_step": 127755, "epoch": 3041} {"train_loss": -6.687811374664307, "global_step": 127756, "epoch": 3041} {"train_loss": -6.690369129180908, "global_step": 127757, "epoch": 3041} {"train_loss": -6.744060516357422, "global_step": 127758, "epoch": 3041} {"train_loss": -6.654023170471191, "global_step": 127759, "epoch": 3041} {"train_loss": -6.677321434020996, "global_step": 127760, "epoch": 3041} {"train_loss": -6.618645191192627, "global_step": 127761, "epoch": 3041} {"train_loss": -6.646302223205566, "global_step": 127762, "epoch": 3041} {"train_loss": -6.660940737951369, "global_step": 127763, "epoch": 3041, "val_loss": 77649.921875} {"train_loss": -6.611346244812012, "global_step": 127764, "epoch": 3042} {"train_loss": -6.626611709594727, "global_step": 127765, "epoch": 3042} {"train_loss": -6.624650001525879, "global_step": 127766, "epoch": 3042} {"train_loss": -6.525120735168457, "global_step": 127767, "epoch": 3042} {"train_loss": -6.716561317443848, "global_step": 127768, "epoch": 3042} {"train_loss": -6.640025615692139, "global_step": 127769, "epoch": 3042} {"train_loss": -6.490749835968018, "global_step": 127770, "epoch": 3042} {"train_loss": -6.678627014160156, "global_step": 127771, "epoch": 3042} {"train_loss": -6.652730941772461, "global_step": 127772, "epoch": 3042} {"train_loss": -6.435009002685547, "global_step": 127773, "epoch": 3042} {"train_loss": -6.569005012512207, "global_step": 127774, "epoch": 3042} {"train_loss": -6.634481906890869, "global_step": 127775, "epoch": 3042} {"train_loss": -6.5042853355407715, "global_step": 127776, "epoch": 3042} {"train_loss": -6.583239555358887, "global_step": 127777, "epoch": 3042} {"train_loss": -6.537973403930664, "global_step": 127778, "epoch": 3042} {"train_loss": -6.534393310546875, "global_step": 127779, "epoch": 3042} {"train_loss": -6.615740776062012, "global_step": 127780, "epoch": 3042} {"train_loss": -6.550410270690918, "global_step": 127781, "epoch": 3042} {"train_loss": -6.506556510925293, "global_step": 127782, "epoch": 3042} {"train_loss": -6.628237724304199, "global_step": 127783, "epoch": 3042} {"train_loss": -6.472240447998047, "global_step": 127784, "epoch": 3042} {"train_loss": -6.7305989265441895, "global_step": 127785, "epoch": 3042} {"train_loss": -6.471856594085693, "global_step": 127786, "epoch": 3042} {"train_loss": -6.657082557678223, "global_step": 127787, "epoch": 3042} {"train_loss": -6.4435882568359375, "global_step": 127788, "epoch": 3042} {"train_loss": -6.476825714111328, "global_step": 127789, "epoch": 3042} {"train_loss": -6.55088472366333, "global_step": 127790, "epoch": 3042} {"train_loss": -6.648927688598633, "global_step": 127791, "epoch": 3042} {"train_loss": -6.6398210525512695, "global_step": 127792, "epoch": 3042} {"train_loss": -6.528589248657227, "global_step": 127793, "epoch": 3042} {"train_loss": -6.572803020477295, "global_step": 127794, "epoch": 3042} {"train_loss": -6.6383819580078125, "global_step": 127795, "epoch": 3042} {"train_loss": -6.678889274597168, "global_step": 127796, "epoch": 3042} {"train_loss": -6.529972076416016, "global_step": 127797, "epoch": 3042} {"train_loss": -6.5522565841674805, "global_step": 127798, "epoch": 3042} {"train_loss": -6.772064208984375, "global_step": 127799, "epoch": 3042} {"train_loss": -6.629889488220215, "global_step": 127800, "epoch": 3042} {"train_loss": -6.639192581176758, "global_step": 127801, "epoch": 3042} {"train_loss": -6.670042991638184, "global_step": 127802, "epoch": 3042} {"train_loss": -6.680624961853027, "global_step": 127803, "epoch": 3042} {"train_loss": -6.6385393142700195, "global_step": 127804, "epoch": 3042} {"train_loss": -6.595500378381638, "global_step": 127805, "epoch": 3042, "val_loss": 77586.203125} {"train_loss": -6.684263706207275, "global_step": 127806, "epoch": 3043} {"train_loss": -6.63661003112793, "global_step": 127807, "epoch": 3043} {"train_loss": -6.604768753051758, "global_step": 127808, "epoch": 3043} {"train_loss": -6.641079902648926, "global_step": 127809, "epoch": 3043} {"train_loss": -6.6835222244262695, "global_step": 127810, "epoch": 3043} {"train_loss": -6.629193305969238, "global_step": 127811, "epoch": 3043} {"train_loss": -6.60486364364624, "global_step": 127812, "epoch": 3043} {"train_loss": -6.56314754486084, "global_step": 127813, "epoch": 3043} {"train_loss": -6.574200630187988, "global_step": 127814, "epoch": 3043} {"train_loss": -6.615118026733398, "global_step": 127815, "epoch": 3043} {"train_loss": -6.652886390686035, "global_step": 127816, "epoch": 3043} {"train_loss": -6.57996129989624, "global_step": 127817, "epoch": 3043} {"train_loss": -6.622753143310547, "global_step": 127818, "epoch": 3043} {"train_loss": -6.628278732299805, "global_step": 127819, "epoch": 3043} {"train_loss": -6.511356830596924, "global_step": 127820, "epoch": 3043} {"train_loss": -6.631999492645264, "global_step": 127821, "epoch": 3043} {"train_loss": -6.713682174682617, "global_step": 127822, "epoch": 3043} {"train_loss": -6.546206474304199, "global_step": 127823, "epoch": 3043} {"train_loss": -6.592738628387451, "global_step": 127824, "epoch": 3043} {"train_loss": -6.5648603439331055, "global_step": 127825, "epoch": 3043} {"train_loss": -6.6236982345581055, "global_step": 127826, "epoch": 3043} {"train_loss": -6.529594421386719, "global_step": 127827, "epoch": 3043} {"train_loss": -6.6337127685546875, "global_step": 127828, "epoch": 3043} {"train_loss": -6.609187126159668, "global_step": 127829, "epoch": 3043} {"train_loss": -6.613040924072266, "global_step": 127830, "epoch": 3043} {"train_loss": -6.599055290222168, "global_step": 127831, "epoch": 3043} {"train_loss": -6.58903694152832, "global_step": 127832, "epoch": 3043} {"train_loss": -6.6449480056762695, "global_step": 127833, "epoch": 3043} {"train_loss": -6.488152027130127, "global_step": 127834, "epoch": 3043} {"train_loss": -6.624302387237549, "global_step": 127835, "epoch": 3043} {"train_loss": -6.728152275085449, "global_step": 127836, "epoch": 3043} {"train_loss": -6.533510208129883, "global_step": 127837, "epoch": 3043} {"train_loss": -6.710014343261719, "global_step": 127838, "epoch": 3043} {"train_loss": -6.595404148101807, "global_step": 127839, "epoch": 3043} {"train_loss": -6.672028541564941, "global_step": 127840, "epoch": 3043} {"train_loss": -6.805506229400635, "global_step": 127841, "epoch": 3043} {"train_loss": -6.6863908767700195, "global_step": 127842, "epoch": 3043} {"train_loss": -6.704181671142578, "global_step": 127843, "epoch": 3043} {"train_loss": -6.817084789276123, "global_step": 127844, "epoch": 3043} {"train_loss": -6.666248798370361, "global_step": 127845, "epoch": 3043} {"train_loss": -6.71665096282959, "global_step": 127846, "epoch": 3043} {"train_loss": -6.6310593854813344, "global_step": 127847, "epoch": 3043, "val_loss": 77343.3046875} {"train_loss": -6.635354995727539, "global_step": 127848, "epoch": 3044} {"train_loss": -6.567853927612305, "global_step": 127849, "epoch": 3044} {"train_loss": -6.601914882659912, "global_step": 127850, "epoch": 3044} {"train_loss": -6.542179107666016, "global_step": 127851, "epoch": 3044} {"train_loss": -6.643486499786377, "global_step": 127852, "epoch": 3044} {"train_loss": -6.6274213790893555, "global_step": 127853, "epoch": 3044} {"train_loss": -6.578816890716553, "global_step": 127854, "epoch": 3044} {"train_loss": -6.672126770019531, "global_step": 127855, "epoch": 3044} {"train_loss": -6.615367889404297, "global_step": 127856, "epoch": 3044} {"train_loss": -6.5222015380859375, "global_step": 127857, "epoch": 3044} {"train_loss": -6.537388801574707, "global_step": 127858, "epoch": 3044} {"train_loss": -6.6239423751831055, "global_step": 127859, "epoch": 3044} {"train_loss": -6.597873687744141, "global_step": 127860, "epoch": 3044} {"train_loss": -6.687285423278809, "global_step": 127861, "epoch": 3044} {"train_loss": -6.569169998168945, "global_step": 127862, "epoch": 3044} {"train_loss": -6.733024597167969, "global_step": 127863, "epoch": 3044} {"train_loss": -6.556914806365967, "global_step": 127864, "epoch": 3044} {"train_loss": -6.653754234313965, "global_step": 127865, "epoch": 3044} {"train_loss": -6.624761581420898, "global_step": 127866, "epoch": 3044} {"train_loss": -6.62959098815918, "global_step": 127867, "epoch": 3044} {"train_loss": -6.723670959472656, "global_step": 127868, "epoch": 3044} {"train_loss": -6.602961540222168, "global_step": 127869, "epoch": 3044} {"train_loss": -6.723270893096924, "global_step": 127870, "epoch": 3044} {"train_loss": -6.532138824462891, "global_step": 127871, "epoch": 3044} {"train_loss": -6.64205265045166, "global_step": 127872, "epoch": 3044} {"train_loss": -6.626767635345459, "global_step": 127873, "epoch": 3044} {"train_loss": -6.575955390930176, "global_step": 127874, "epoch": 3044} {"train_loss": -6.6802520751953125, "global_step": 127875, "epoch": 3044} {"train_loss": -6.7177886962890625, "global_step": 127876, "epoch": 3044} {"train_loss": -6.637181758880615, "global_step": 127877, "epoch": 3044} {"train_loss": -6.724795341491699, "global_step": 127878, "epoch": 3044} {"train_loss": -6.79913330078125, "global_step": 127879, "epoch": 3044} {"train_loss": -6.804103374481201, "global_step": 127880, "epoch": 3044} {"train_loss": -6.630978584289551, "global_step": 127881, "epoch": 3044} {"train_loss": -6.749791622161865, "global_step": 127882, "epoch": 3044} {"train_loss": -6.633498191833496, "global_step": 127883, "epoch": 3044} {"train_loss": -6.664092540740967, "global_step": 127884, "epoch": 3044} {"train_loss": -6.744772911071777, "global_step": 127885, "epoch": 3044} {"train_loss": -6.701948165893555, "global_step": 127886, "epoch": 3044} {"train_loss": -6.660366058349609, "global_step": 127887, "epoch": 3044} {"train_loss": -6.693351745605469, "global_step": 127888, "epoch": 3044} {"train_loss": -6.645699739456177, "global_step": 127889, "epoch": 3044, "val_loss": 77292.328125} {"train_loss": -6.552288055419922, "global_step": 127890, "epoch": 3045} {"train_loss": -6.558627128601074, "global_step": 127891, "epoch": 3045} {"train_loss": -6.640947341918945, "global_step": 127892, "epoch": 3045} {"train_loss": -6.510799407958984, "global_step": 127893, "epoch": 3045} {"train_loss": -6.664106369018555, "global_step": 127894, "epoch": 3045} {"train_loss": -6.6985697746276855, "global_step": 127895, "epoch": 3045} {"train_loss": -6.637551784515381, "global_step": 127896, "epoch": 3045} {"train_loss": -6.550930976867676, "global_step": 127897, "epoch": 3045} {"train_loss": -6.609073638916016, "global_step": 127898, "epoch": 3045} {"train_loss": -6.549610614776611, "global_step": 127899, "epoch": 3045} {"train_loss": -6.521389484405518, "global_step": 127900, "epoch": 3045} {"train_loss": -6.710518836975098, "global_step": 127901, "epoch": 3045} {"train_loss": -6.554904460906982, "global_step": 127902, "epoch": 3045} {"train_loss": -6.670917510986328, "global_step": 127903, "epoch": 3045} {"train_loss": -6.577754020690918, "global_step": 127904, "epoch": 3045} {"train_loss": -6.6010918617248535, "global_step": 127905, "epoch": 3045} {"train_loss": -6.676382064819336, "global_step": 127906, "epoch": 3045} {"train_loss": -6.651245594024658, "global_step": 127907, "epoch": 3045} {"train_loss": -6.659262657165527, "global_step": 127908, "epoch": 3045} {"train_loss": -6.643769264221191, "global_step": 127909, "epoch": 3045} {"train_loss": -6.600083351135254, "global_step": 127910, "epoch": 3045} {"train_loss": -6.7051262855529785, "global_step": 127911, "epoch": 3045} {"train_loss": -6.7061920166015625, "global_step": 127912, "epoch": 3045} {"train_loss": -6.5730109214782715, "global_step": 127913, "epoch": 3045} {"train_loss": -6.620974540710449, "global_step": 127914, "epoch": 3045} {"train_loss": -6.716142177581787, "global_step": 127915, "epoch": 3045} {"train_loss": -6.68117094039917, "global_step": 127916, "epoch": 3045} {"train_loss": -6.6796088218688965, "global_step": 127917, "epoch": 3045} {"train_loss": -6.603758335113525, "global_step": 127918, "epoch": 3045} {"train_loss": -6.709069728851318, "global_step": 127919, "epoch": 3045} {"train_loss": -6.713553428649902, "global_step": 127920, "epoch": 3045} {"train_loss": -6.670745849609375, "global_step": 127921, "epoch": 3045} {"train_loss": -6.5397210121154785, "global_step": 127922, "epoch": 3045} {"train_loss": -6.505541801452637, "global_step": 127923, "epoch": 3045} {"train_loss": -6.7362961769104, "global_step": 127924, "epoch": 3045} {"train_loss": -6.579446792602539, "global_step": 127925, "epoch": 3045} {"train_loss": -6.526788711547852, "global_step": 127926, "epoch": 3045} {"train_loss": -6.562823295593262, "global_step": 127927, "epoch": 3045} {"train_loss": -6.534634590148926, "global_step": 127928, "epoch": 3045} {"train_loss": -6.487876892089844, "global_step": 127929, "epoch": 3045} {"train_loss": -6.60776424407959, "global_step": 127930, "epoch": 3045} {"train_loss": -6.614968129566738, "global_step": 127931, "epoch": 3045, "val_loss": 77687.9296875} {"train_loss": -6.628656387329102, "global_step": 127932, "epoch": 3046} {"train_loss": -6.4912872314453125, "global_step": 127933, "epoch": 3046} {"train_loss": -6.484687805175781, "global_step": 127934, "epoch": 3046} {"train_loss": -6.556978225708008, "global_step": 127935, "epoch": 3046} {"train_loss": -6.619376182556152, "global_step": 127936, "epoch": 3046} {"train_loss": -6.568689823150635, "global_step": 127937, "epoch": 3046} {"train_loss": -6.568903923034668, "global_step": 127938, "epoch": 3046} {"train_loss": -6.606315612792969, "global_step": 127939, "epoch": 3046} {"train_loss": -6.629595756530762, "global_step": 127940, "epoch": 3046} {"train_loss": -6.607122421264648, "global_step": 127941, "epoch": 3046} {"train_loss": -6.526149749755859, "global_step": 127942, "epoch": 3046} {"train_loss": -6.571479320526123, "global_step": 127943, "epoch": 3046} {"train_loss": -6.658895969390869, "global_step": 127944, "epoch": 3046} {"train_loss": -6.591689586639404, "global_step": 127945, "epoch": 3046} {"train_loss": -6.462020397186279, "global_step": 127946, "epoch": 3046} {"train_loss": -6.630499839782715, "global_step": 127947, "epoch": 3046} {"train_loss": -6.596405029296875, "global_step": 127948, "epoch": 3046} {"train_loss": -6.53189754486084, "global_step": 127949, "epoch": 3046} {"train_loss": -6.727725982666016, "global_step": 127950, "epoch": 3046} {"train_loss": -6.725736618041992, "global_step": 127951, "epoch": 3046} {"train_loss": -6.607146263122559, "global_step": 127952, "epoch": 3046} {"train_loss": -6.705448150634766, "global_step": 127953, "epoch": 3046} {"train_loss": -6.624694347381592, "global_step": 127954, "epoch": 3046} {"train_loss": -6.723825454711914, "global_step": 127955, "epoch": 3046} {"train_loss": -6.658125400543213, "global_step": 127956, "epoch": 3046} {"train_loss": -6.594508171081543, "global_step": 127957, "epoch": 3046} {"train_loss": -6.702538013458252, "global_step": 127958, "epoch": 3046} {"train_loss": -6.522017478942871, "global_step": 127959, "epoch": 3046} {"train_loss": -6.753243446350098, "global_step": 127960, "epoch": 3046} {"train_loss": -6.76332426071167, "global_step": 127961, "epoch": 3046} {"train_loss": -6.549680709838867, "global_step": 127962, "epoch": 3046} {"train_loss": -6.654138565063477, "global_step": 127963, "epoch": 3046} {"train_loss": -6.569796562194824, "global_step": 127964, "epoch": 3046} {"train_loss": -6.6586503982543945, "global_step": 127965, "epoch": 3046} {"train_loss": -6.620774745941162, "global_step": 127966, "epoch": 3046} {"train_loss": -6.586553573608398, "global_step": 127967, "epoch": 3046} {"train_loss": -6.569069862365723, "global_step": 127968, "epoch": 3046} {"train_loss": -6.60862398147583, "global_step": 127969, "epoch": 3046} {"train_loss": -6.56177282333374, "global_step": 127970, "epoch": 3046} {"train_loss": -6.720669269561768, "global_step": 127971, "epoch": 3046} {"train_loss": -6.672783851623535, "global_step": 127972, "epoch": 3046} {"train_loss": -6.616380941300165, "global_step": 127973, "epoch": 3046, "val_loss": 77401.0078125} {"train_loss": -6.753244400024414, "global_step": 127974, "epoch": 3047} {"train_loss": -6.691263198852539, "global_step": 127975, "epoch": 3047} {"train_loss": -6.609809875488281, "global_step": 127976, "epoch": 3047} {"train_loss": -6.770016670227051, "global_step": 127977, "epoch": 3047} {"train_loss": -6.697841167449951, "global_step": 127978, "epoch": 3047} {"train_loss": -6.595963478088379, "global_step": 127979, "epoch": 3047} {"train_loss": -6.721902847290039, "global_step": 127980, "epoch": 3047} {"train_loss": -6.569256782531738, "global_step": 127981, "epoch": 3047} {"train_loss": -6.681539535522461, "global_step": 127982, "epoch": 3047} {"train_loss": -6.710781097412109, "global_step": 127983, "epoch": 3047} {"train_loss": -6.494209289550781, "global_step": 127984, "epoch": 3047} {"train_loss": -6.757693290710449, "global_step": 127985, "epoch": 3047} {"train_loss": -6.515045166015625, "global_step": 127986, "epoch": 3047} {"train_loss": -6.6815080642700195, "global_step": 127987, "epoch": 3047} {"train_loss": -6.583672046661377, "global_step": 127988, "epoch": 3047} {"train_loss": -6.581904411315918, "global_step": 127989, "epoch": 3047} {"train_loss": -6.672920227050781, "global_step": 127990, "epoch": 3047} {"train_loss": -6.673720359802246, "global_step": 127991, "epoch": 3047} {"train_loss": -6.668821811676025, "global_step": 127992, "epoch": 3047} {"train_loss": -6.704385757446289, "global_step": 127993, "epoch": 3047} {"train_loss": -6.615384101867676, "global_step": 127994, "epoch": 3047} {"train_loss": -6.588525295257568, "global_step": 127995, "epoch": 3047} {"train_loss": -6.552068710327148, "global_step": 127996, "epoch": 3047} {"train_loss": -6.688612937927246, "global_step": 127997, "epoch": 3047} {"train_loss": -6.606980323791504, "global_step": 127998, "epoch": 3047} {"train_loss": -6.704751014709473, "global_step": 127999, "epoch": 3047} {"train_loss": -6.717339038848877, "global_step": 128000, "epoch": 3047} {"train_loss": -6.591498851776123, "global_step": 128001, "epoch": 3047} {"train_loss": -6.633648872375488, "global_step": 128002, "epoch": 3047} {"train_loss": -6.66749382019043, "global_step": 128003, "epoch": 3047} {"train_loss": -6.6448469161987305, "global_step": 128004, "epoch": 3047} {"train_loss": -6.7136125564575195, "global_step": 128005, "epoch": 3047} {"train_loss": -6.548307418823242, "global_step": 128006, "epoch": 3047} {"train_loss": -6.671241760253906, "global_step": 128007, "epoch": 3047} {"train_loss": -6.661996841430664, "global_step": 128008, "epoch": 3047} {"train_loss": -6.537905693054199, "global_step": 128009, "epoch": 3047} {"train_loss": -6.669285297393799, "global_step": 128010, "epoch": 3047} {"train_loss": -6.602983474731445, "global_step": 128011, "epoch": 3047} {"train_loss": -6.564580917358398, "global_step": 128012, "epoch": 3047} {"train_loss": -6.609622001647949, "global_step": 128013, "epoch": 3047} {"train_loss": -6.541614532470703, "global_step": 128014, "epoch": 3047} {"train_loss": -6.641112486521403, "global_step": 128015, "epoch": 3047, "val_loss": 77456.9765625} {"train_loss": -6.7434868812561035, "global_step": 128016, "epoch": 3048} {"train_loss": -6.586935043334961, "global_step": 128017, "epoch": 3048} {"train_loss": -6.508451461791992, "global_step": 128018, "epoch": 3048} {"train_loss": -6.53685188293457, "global_step": 128019, "epoch": 3048} {"train_loss": -6.606637477874756, "global_step": 128020, "epoch": 3048} {"train_loss": -6.689305305480957, "global_step": 128021, "epoch": 3048} {"train_loss": -6.576813697814941, "global_step": 128022, "epoch": 3048} {"train_loss": -6.581855297088623, "global_step": 128023, "epoch": 3048} {"train_loss": -6.583280563354492, "global_step": 128024, "epoch": 3048} {"train_loss": -6.560173034667969, "global_step": 128025, "epoch": 3048} {"train_loss": -6.614003658294678, "global_step": 128026, "epoch": 3048} {"train_loss": -6.607998847961426, "global_step": 128027, "epoch": 3048} {"train_loss": -6.552403450012207, "global_step": 128028, "epoch": 3048} {"train_loss": -6.503705024719238, "global_step": 128029, "epoch": 3048} {"train_loss": -6.448990345001221, "global_step": 128030, "epoch": 3048} {"train_loss": -6.531308174133301, "global_step": 128031, "epoch": 3048} {"train_loss": -6.4927978515625, "global_step": 128032, "epoch": 3048} {"train_loss": -6.615730285644531, "global_step": 128033, "epoch": 3048} {"train_loss": -6.624091148376465, "global_step": 128034, "epoch": 3048} {"train_loss": -6.64725399017334, "global_step": 128035, "epoch": 3048} {"train_loss": -6.610663890838623, "global_step": 128036, "epoch": 3048} {"train_loss": -6.558166027069092, "global_step": 128037, "epoch": 3048} {"train_loss": -6.605012893676758, "global_step": 128038, "epoch": 3048} {"train_loss": -6.657073497772217, "global_step": 128039, "epoch": 3048} {"train_loss": -6.64469051361084, "global_step": 128040, "epoch": 3048} {"train_loss": -6.568288803100586, "global_step": 128041, "epoch": 3048} {"train_loss": -6.601600646972656, "global_step": 128042, "epoch": 3048} {"train_loss": -6.573873519897461, "global_step": 128043, "epoch": 3048} {"train_loss": -6.474339962005615, "global_step": 128044, "epoch": 3048} {"train_loss": -6.629737377166748, "global_step": 128045, "epoch": 3048} {"train_loss": -6.517492294311523, "global_step": 128046, "epoch": 3048} {"train_loss": -6.660089492797852, "global_step": 128047, "epoch": 3048} {"train_loss": -6.508727073669434, "global_step": 128048, "epoch": 3048} {"train_loss": -6.635572910308838, "global_step": 128049, "epoch": 3048} {"train_loss": -6.560052871704102, "global_step": 128050, "epoch": 3048} {"train_loss": -6.522148609161377, "global_step": 128051, "epoch": 3048} {"train_loss": -6.699240684509277, "global_step": 128052, "epoch": 3048} {"train_loss": -6.730513572692871, "global_step": 128053, "epoch": 3048} {"train_loss": -6.61943244934082, "global_step": 128054, "epoch": 3048} {"train_loss": -6.614871978759766, "global_step": 128055, "epoch": 3048} {"train_loss": -6.684834003448486, "global_step": 128056, "epoch": 3048} {"train_loss": -6.591784829185123, "global_step": 128057, "epoch": 3048, "val_loss": 77178.0} {"train_loss": -6.660296440124512, "global_step": 128058, "epoch": 3049} {"train_loss": -6.717873573303223, "global_step": 128059, "epoch": 3049} {"train_loss": -6.656315803527832, "global_step": 128060, "epoch": 3049} {"train_loss": -6.740540504455566, "global_step": 128061, "epoch": 3049} {"train_loss": -6.582043647766113, "global_step": 128062, "epoch": 3049} {"train_loss": -6.521448135375977, "global_step": 128063, "epoch": 3049} {"train_loss": -6.5903825759887695, "global_step": 128064, "epoch": 3049} {"train_loss": -6.429614067077637, "global_step": 128065, "epoch": 3049} {"train_loss": -6.728447914123535, "global_step": 128066, "epoch": 3049} {"train_loss": -6.518562316894531, "global_step": 128067, "epoch": 3049} {"train_loss": -6.596352577209473, "global_step": 128068, "epoch": 3049} {"train_loss": -6.64246940612793, "global_step": 128069, "epoch": 3049} {"train_loss": -6.444228649139404, "global_step": 128070, "epoch": 3049} {"train_loss": -6.54792594909668, "global_step": 128071, "epoch": 3049} {"train_loss": -6.568183422088623, "global_step": 128072, "epoch": 3049} {"train_loss": -6.5880818367004395, "global_step": 128073, "epoch": 3049} {"train_loss": -6.554127216339111, "global_step": 128074, "epoch": 3049} {"train_loss": -6.654742240905762, "global_step": 128075, "epoch": 3049} {"train_loss": -6.562501907348633, "global_step": 128076, "epoch": 3049} {"train_loss": -6.578916072845459, "global_step": 128077, "epoch": 3049} {"train_loss": -6.697142601013184, "global_step": 128078, "epoch": 3049} {"train_loss": -6.555863857269287, "global_step": 128079, "epoch": 3049} {"train_loss": -6.738953590393066, "global_step": 128080, "epoch": 3049} {"train_loss": -6.708349227905273, "global_step": 128081, "epoch": 3049} {"train_loss": -6.620633602142334, "global_step": 128082, "epoch": 3049} {"train_loss": -6.67059326171875, "global_step": 128083, "epoch": 3049} {"train_loss": -6.639192581176758, "global_step": 128084, "epoch": 3049} {"train_loss": -6.632092475891113, "global_step": 128085, "epoch": 3049} {"train_loss": -6.646517276763916, "global_step": 128086, "epoch": 3049} {"train_loss": -6.609323978424072, "global_step": 128087, "epoch": 3049} {"train_loss": -6.725261688232422, "global_step": 128088, "epoch": 3049} {"train_loss": -6.621028900146484, "global_step": 128089, "epoch": 3049} {"train_loss": -6.628155708312988, "global_step": 128090, "epoch": 3049} {"train_loss": -6.639832019805908, "global_step": 128091, "epoch": 3049} {"train_loss": -6.749891757965088, "global_step": 128092, "epoch": 3049} {"train_loss": -6.5827741622924805, "global_step": 128093, "epoch": 3049} {"train_loss": -6.5377516746521, "global_step": 128094, "epoch": 3049} {"train_loss": -6.6486711502075195, "global_step": 128095, "epoch": 3049} {"train_loss": -6.668461799621582, "global_step": 128096, "epoch": 3049} {"train_loss": -6.691061973571777, "global_step": 128097, "epoch": 3049} {"train_loss": -6.534232139587402, "global_step": 128098, "epoch": 3049} {"train_loss": -6.620799041929699, "global_step": 128099, "epoch": 3049, "val_loss": 77192.7578125} {"train_loss": -6.7287678718566895, "global_step": 128100, "epoch": 3050} {"train_loss": -6.653332710266113, "global_step": 128101, "epoch": 3050} {"train_loss": -6.741850852966309, "global_step": 128102, "epoch": 3050} {"train_loss": -6.728574275970459, "global_step": 128103, "epoch": 3050} {"train_loss": -6.702816963195801, "global_step": 128104, "epoch": 3050} {"train_loss": -6.686580657958984, "global_step": 128105, "epoch": 3050} {"train_loss": -6.737240791320801, "global_step": 128106, "epoch": 3050} {"train_loss": -6.70732307434082, "global_step": 128107, "epoch": 3050} {"train_loss": -6.683565139770508, "global_step": 128108, "epoch": 3050} {"train_loss": -6.642820835113525, "global_step": 128109, "epoch": 3050} {"train_loss": -6.633735656738281, "global_step": 128110, "epoch": 3050} {"train_loss": -6.7131452560424805, "global_step": 128111, "epoch": 3050} {"train_loss": -6.504733085632324, "global_step": 128112, "epoch": 3050} {"train_loss": -6.662059307098389, "global_step": 128113, "epoch": 3050} {"train_loss": -6.645040035247803, "global_step": 128114, "epoch": 3050} {"train_loss": -6.669048309326172, "global_step": 128115, "epoch": 3050} {"train_loss": -6.604297637939453, "global_step": 128116, "epoch": 3050} {"train_loss": -6.622885704040527, "global_step": 128117, "epoch": 3050} {"train_loss": -6.614129066467285, "global_step": 128118, "epoch": 3050} {"train_loss": -6.553376197814941, "global_step": 128119, "epoch": 3050} {"train_loss": -6.638731002807617, "global_step": 128120, "epoch": 3050} {"train_loss": -6.733903408050537, "global_step": 128121, "epoch": 3050} {"train_loss": -6.748088836669922, "global_step": 128122, "epoch": 3050} {"train_loss": -6.723089218139648, "global_step": 128123, "epoch": 3050} {"train_loss": -6.697030067443848, "global_step": 128124, "epoch": 3050} {"train_loss": -6.672593116760254, "global_step": 128125, "epoch": 3050} {"train_loss": -6.70433235168457, "global_step": 128126, "epoch": 3050} {"train_loss": -6.5686445236206055, "global_step": 128127, "epoch": 3050} {"train_loss": -6.706015586853027, "global_step": 128128, "epoch": 3050} {"train_loss": -6.683801651000977, "global_step": 128129, "epoch": 3050} {"train_loss": -6.6557393074035645, "global_step": 128130, "epoch": 3050} {"train_loss": -6.583161354064941, "global_step": 128131, "epoch": 3050} {"train_loss": -6.662632465362549, "global_step": 128132, "epoch": 3050} {"train_loss": -6.6857523918151855, "global_step": 128133, "epoch": 3050} {"train_loss": -6.68026065826416, "global_step": 128134, "epoch": 3050} {"train_loss": -6.654677391052246, "global_step": 128135, "epoch": 3050} {"train_loss": -6.61923885345459, "global_step": 128136, "epoch": 3050} {"train_loss": -6.589038848876953, "global_step": 128137, "epoch": 3050} {"train_loss": -6.607271194458008, "global_step": 128138, "epoch": 3050} {"train_loss": -6.641713619232178, "global_step": 128139, "epoch": 3050} {"train_loss": -6.648571968078613, "global_step": 128140, "epoch": 3050} {"train_loss": -6.665845098949614, "global_step": 128141, "epoch": 3050, "train/sim_max_reward_0": 0.48951909318962034, "train/sim_max_reward_1": 0.8985062139607668, "train/sim_max_reward_2": 0.37253522331307354, "train/sim_max_reward_3": 0.13882610385043667, "train/sim_max_reward_4": 0.7009949967291941, "train/sim_max_reward_5": 0.5759883710156919, "test/sim_max_reward_4500000": 0.9411017196777336, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9761767730478451, "test/sim_max_reward_4500004": 0.13486016673428844, "test/sim_max_reward_4500005": 0.2690719014587173, "test/sim_max_reward_4500006": 0.8212717286056186, "test/sim_max_reward_4500007": 0.8613342252886868, "test/sim_max_reward_4500008": 0.13512737057054683, "test/sim_max_reward_4500009": 0.053492091307121924, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.7115930085701135, "test/sim_max_reward_4500012": 0.9234449857238718, "test/sim_max_reward_4500013": 0.0046485325226801036, "test/sim_max_reward_4500014": 0.904813209377808, "test/sim_max_reward_4500015": 0.9464839592355069, "test/sim_max_reward_4500016": 0.017549988542791953, "test/sim_max_reward_4500017": 0.05138703589116797, "test/sim_max_reward_4500018": 0.39281156159870545, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9919761185918853, "test/sim_max_reward_4500022": 0.9535470599221394, "test/sim_max_reward_4500023": 0.5302761052330162, "test/sim_max_reward_4500024": 0.9957831552528925, "test/sim_max_reward_4500025": 0.9755124547324541, "test/sim_max_reward_4500026": 0.9463296794692718, "test/sim_max_reward_4500027": 0.9580887182066556, "test/sim_max_reward_4500028": 0.22459791701977974, "test/sim_max_reward_4500029": 0.07840400050989992, "test/sim_max_reward_4500030": 0.9665916841834473, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9300743866699286, "test/sim_max_reward_4500034": 0.6796303389758173, "test/sim_max_reward_4500035": 0.5580135605370358, "test/sim_max_reward_4500036": 0.9841503473460453, "test/sim_max_reward_4500037": 0.8350663636262218, "test/sim_max_reward_4500038": 0.9251061012663859, "test/sim_max_reward_4500039": 0.9968878162850983, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.9714773233533217, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.42040975850502493, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9213459944333688, "test/sim_max_reward_4500046": 0.6796574936864621, "test/sim_max_reward_4500047": 0.9524446853992711, "test/sim_max_reward_4500048": 0.9279478888048007, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5293950003431305, "test/mean_score": 0.5802480795450866, "val_loss": 77234.75} {"train_loss": -6.583597183227539, "global_step": 128142, "epoch": 3051} {"train_loss": -6.8012847900390625, "global_step": 128143, "epoch": 3051} {"train_loss": -6.651569366455078, "global_step": 128144, "epoch": 3051} {"train_loss": -6.678778648376465, "global_step": 128145, "epoch": 3051} {"train_loss": -6.7550764083862305, "global_step": 128146, "epoch": 3051} {"train_loss": -6.713895320892334, "global_step": 128147, "epoch": 3051} {"train_loss": -6.717012405395508, "global_step": 128148, "epoch": 3051} {"train_loss": -6.650127410888672, "global_step": 128149, "epoch": 3051} {"train_loss": -6.631269454956055, "global_step": 128150, "epoch": 3051} {"train_loss": -6.689766883850098, "global_step": 128151, "epoch": 3051} {"train_loss": -6.701870441436768, "global_step": 128152, "epoch": 3051} {"train_loss": -6.738474369049072, "global_step": 128153, "epoch": 3051} {"train_loss": -6.606814384460449, "global_step": 128154, "epoch": 3051} {"train_loss": -6.616735458374023, "global_step": 128155, "epoch": 3051} {"train_loss": -6.698300361633301, "global_step": 128156, "epoch": 3051} {"train_loss": -6.615572929382324, "global_step": 128157, "epoch": 3051} {"train_loss": -6.690207004547119, "global_step": 128158, "epoch": 3051} {"train_loss": -6.653071403503418, "global_step": 128159, "epoch": 3051} {"train_loss": -6.619937419891357, "global_step": 128160, "epoch": 3051} {"train_loss": -6.666827201843262, "global_step": 128161, "epoch": 3051} {"train_loss": -6.6168437004089355, "global_step": 128162, "epoch": 3051} {"train_loss": -6.550645351409912, "global_step": 128163, "epoch": 3051} {"train_loss": -6.712337970733643, "global_step": 128164, "epoch": 3051} {"train_loss": -6.657254695892334, "global_step": 128165, "epoch": 3051} {"train_loss": -6.752925395965576, "global_step": 128166, "epoch": 3051} {"train_loss": -6.610283374786377, "global_step": 128167, "epoch": 3051} {"train_loss": -6.714971542358398, "global_step": 128168, "epoch": 3051} {"train_loss": -6.636693477630615, "global_step": 128169, "epoch": 3051} {"train_loss": -6.645410537719727, "global_step": 128170, "epoch": 3051} {"train_loss": -6.617421627044678, "global_step": 128171, "epoch": 3051} {"train_loss": -6.629456520080566, "global_step": 128172, "epoch": 3051} {"train_loss": -6.7658514976501465, "global_step": 128173, "epoch": 3051} {"train_loss": -6.5738091468811035, "global_step": 128174, "epoch": 3051} {"train_loss": -6.737631797790527, "global_step": 128175, "epoch": 3051} {"train_loss": -6.643376350402832, "global_step": 128176, "epoch": 3051} {"train_loss": -6.629457473754883, "global_step": 128177, "epoch": 3051} {"train_loss": -6.722274303436279, "global_step": 128178, "epoch": 3051} {"train_loss": -6.644107818603516, "global_step": 128179, "epoch": 3051} {"train_loss": -6.602789402008057, "global_step": 128180, "epoch": 3051} {"train_loss": -6.691646099090576, "global_step": 128181, "epoch": 3051} {"train_loss": -6.623614311218262, "global_step": 128182, "epoch": 3051} {"train_loss": -6.66584232875279, "global_step": 128183, "epoch": 3051, "val_loss": 77288.5546875} {"train_loss": -6.752544403076172, "global_step": 128184, "epoch": 3052} {"train_loss": -6.643608570098877, "global_step": 128185, "epoch": 3052} {"train_loss": -6.734703063964844, "global_step": 128186, "epoch": 3052} {"train_loss": -6.691812515258789, "global_step": 128187, "epoch": 3052} {"train_loss": -6.75395393371582, "global_step": 128188, "epoch": 3052} {"train_loss": -6.729551315307617, "global_step": 128189, "epoch": 3052} {"train_loss": -6.715824604034424, "global_step": 128190, "epoch": 3052} {"train_loss": -6.73725700378418, "global_step": 128191, "epoch": 3052} {"train_loss": -6.713065147399902, "global_step": 128192, "epoch": 3052} {"train_loss": -6.709756374359131, "global_step": 128193, "epoch": 3052} {"train_loss": -6.578859329223633, "global_step": 128194, "epoch": 3052} {"train_loss": -6.66984224319458, "global_step": 128195, "epoch": 3052} {"train_loss": -6.699348449707031, "global_step": 128196, "epoch": 3052} {"train_loss": -6.791201591491699, "global_step": 128197, "epoch": 3052} {"train_loss": -6.653266429901123, "global_step": 128198, "epoch": 3052} {"train_loss": -6.6176629066467285, "global_step": 128199, "epoch": 3052} {"train_loss": -6.658488750457764, "global_step": 128200, "epoch": 3052} {"train_loss": -6.716322898864746, "global_step": 128201, "epoch": 3052} {"train_loss": -6.686947822570801, "global_step": 128202, "epoch": 3052} {"train_loss": -6.675967693328857, "global_step": 128203, "epoch": 3052} {"train_loss": -6.659424781799316, "global_step": 128204, "epoch": 3052} {"train_loss": -6.525087356567383, "global_step": 128205, "epoch": 3052} {"train_loss": -6.615451812744141, "global_step": 128206, "epoch": 3052} {"train_loss": -6.763172149658203, "global_step": 128207, "epoch": 3052} {"train_loss": -6.474774360656738, "global_step": 128208, "epoch": 3052} {"train_loss": -6.44704532623291, "global_step": 128209, "epoch": 3052} {"train_loss": -6.577317237854004, "global_step": 128210, "epoch": 3052} {"train_loss": -6.529247283935547, "global_step": 128211, "epoch": 3052} {"train_loss": -6.569084644317627, "global_step": 128212, "epoch": 3052} {"train_loss": -6.740607261657715, "global_step": 128213, "epoch": 3052} {"train_loss": -6.538921356201172, "global_step": 128214, "epoch": 3052} {"train_loss": -6.703618049621582, "global_step": 128215, "epoch": 3052} {"train_loss": -6.578444957733154, "global_step": 128216, "epoch": 3052} {"train_loss": -6.684102535247803, "global_step": 128217, "epoch": 3052} {"train_loss": -6.637038707733154, "global_step": 128218, "epoch": 3052} {"train_loss": -6.599462032318115, "global_step": 128219, "epoch": 3052} {"train_loss": -6.637729167938232, "global_step": 128220, "epoch": 3052} {"train_loss": -6.712456226348877, "global_step": 128221, "epoch": 3052} {"train_loss": -6.55778694152832, "global_step": 128222, "epoch": 3052} {"train_loss": -6.4436540603637695, "global_step": 128223, "epoch": 3052} {"train_loss": -6.5777130126953125, "global_step": 128224, "epoch": 3052} {"train_loss": -6.6484864212217785, "global_step": 128225, "epoch": 3052, "val_loss": 77399.859375} {"train_loss": -6.735039710998535, "global_step": 128226, "epoch": 3053} {"train_loss": -6.648146152496338, "global_step": 128227, "epoch": 3053} {"train_loss": -6.713155746459961, "global_step": 128228, "epoch": 3053} {"train_loss": -6.778421878814697, "global_step": 128229, "epoch": 3053} {"train_loss": -6.6518330574035645, "global_step": 128230, "epoch": 3053} {"train_loss": -6.740085124969482, "global_step": 128231, "epoch": 3053} {"train_loss": -6.7775774002075195, "global_step": 128232, "epoch": 3053} {"train_loss": -6.64532470703125, "global_step": 128233, "epoch": 3053} {"train_loss": -6.692461967468262, "global_step": 128234, "epoch": 3053} {"train_loss": -6.655628204345703, "global_step": 128235, "epoch": 3053} {"train_loss": -6.627349376678467, "global_step": 128236, "epoch": 3053} {"train_loss": -6.582671642303467, "global_step": 128237, "epoch": 3053} {"train_loss": -6.641445636749268, "global_step": 128238, "epoch": 3053} {"train_loss": -6.6272382736206055, "global_step": 128239, "epoch": 3053} {"train_loss": -6.685912132263184, "global_step": 128240, "epoch": 3053} {"train_loss": -6.656706809997559, "global_step": 128241, "epoch": 3053} {"train_loss": -6.586529731750488, "global_step": 128242, "epoch": 3053} {"train_loss": -6.576338291168213, "global_step": 128243, "epoch": 3053} {"train_loss": -6.582545757293701, "global_step": 128244, "epoch": 3053} {"train_loss": -6.723845481872559, "global_step": 128245, "epoch": 3053} {"train_loss": -6.636565208435059, "global_step": 128246, "epoch": 3053} {"train_loss": -6.549759387969971, "global_step": 128247, "epoch": 3053} {"train_loss": -6.537592887878418, "global_step": 128248, "epoch": 3053} {"train_loss": -6.569393634796143, "global_step": 128249, "epoch": 3053} {"train_loss": -6.75772762298584, "global_step": 128250, "epoch": 3053} {"train_loss": -6.570162773132324, "global_step": 128251, "epoch": 3053} {"train_loss": -6.647188186645508, "global_step": 128252, "epoch": 3053} {"train_loss": -6.704649925231934, "global_step": 128253, "epoch": 3053} {"train_loss": -6.605116844177246, "global_step": 128254, "epoch": 3053} {"train_loss": -6.682526111602783, "global_step": 128255, "epoch": 3053} {"train_loss": -6.7271013259887695, "global_step": 128256, "epoch": 3053} {"train_loss": -6.731010437011719, "global_step": 128257, "epoch": 3053} {"train_loss": -6.5810346603393555, "global_step": 128258, "epoch": 3053} {"train_loss": -6.67457914352417, "global_step": 128259, "epoch": 3053} {"train_loss": -6.659082412719727, "global_step": 128260, "epoch": 3053} {"train_loss": -6.669288635253906, "global_step": 128261, "epoch": 3053} {"train_loss": -6.648333549499512, "global_step": 128262, "epoch": 3053} {"train_loss": -6.574154853820801, "global_step": 128263, "epoch": 3053} {"train_loss": -6.759859085083008, "global_step": 128264, "epoch": 3053} {"train_loss": -6.601167678833008, "global_step": 128265, "epoch": 3053} {"train_loss": -6.584970474243164, "global_step": 128266, "epoch": 3053} {"train_loss": -6.654702220644269, "global_step": 128267, "epoch": 3053, "val_loss": 77212.7578125} {"train_loss": -6.678616523742676, "global_step": 128268, "epoch": 3054} {"train_loss": -6.645364761352539, "global_step": 128269, "epoch": 3054} {"train_loss": -6.685302734375, "global_step": 128270, "epoch": 3054} {"train_loss": -6.729694843292236, "global_step": 128271, "epoch": 3054} {"train_loss": -6.553401947021484, "global_step": 128272, "epoch": 3054} {"train_loss": -6.768831253051758, "global_step": 128273, "epoch": 3054} {"train_loss": -6.640392303466797, "global_step": 128274, "epoch": 3054} {"train_loss": -6.610095024108887, "global_step": 128275, "epoch": 3054} {"train_loss": -6.660079002380371, "global_step": 128276, "epoch": 3054} {"train_loss": -6.5498552322387695, "global_step": 128277, "epoch": 3054} {"train_loss": -6.71994686126709, "global_step": 128278, "epoch": 3054} {"train_loss": -6.728658199310303, "global_step": 128279, "epoch": 3054} {"train_loss": -6.835054397583008, "global_step": 128280, "epoch": 3054} {"train_loss": -6.664745330810547, "global_step": 128281, "epoch": 3054} {"train_loss": -6.7998948097229, "global_step": 128282, "epoch": 3054} {"train_loss": -6.746259689331055, "global_step": 128283, "epoch": 3054} {"train_loss": -6.748605728149414, "global_step": 128284, "epoch": 3054} {"train_loss": -6.68988561630249, "global_step": 128285, "epoch": 3054} {"train_loss": -6.598106861114502, "global_step": 128286, "epoch": 3054} {"train_loss": -6.753551483154297, "global_step": 128287, "epoch": 3054} {"train_loss": -6.65331506729126, "global_step": 128288, "epoch": 3054} {"train_loss": -6.618435382843018, "global_step": 128289, "epoch": 3054} {"train_loss": -6.723211288452148, "global_step": 128290, "epoch": 3054} {"train_loss": -6.73336124420166, "global_step": 128291, "epoch": 3054} {"train_loss": -6.617389678955078, "global_step": 128292, "epoch": 3054} {"train_loss": -6.672747611999512, "global_step": 128293, "epoch": 3054} {"train_loss": -6.64676570892334, "global_step": 128294, "epoch": 3054} {"train_loss": -6.6740264892578125, "global_step": 128295, "epoch": 3054} {"train_loss": -6.570440292358398, "global_step": 128296, "epoch": 3054} {"train_loss": -6.662284851074219, "global_step": 128297, "epoch": 3054} {"train_loss": -6.73685359954834, "global_step": 128298, "epoch": 3054} {"train_loss": -6.636707305908203, "global_step": 128299, "epoch": 3054} {"train_loss": -6.686432838439941, "global_step": 128300, "epoch": 3054} {"train_loss": -6.63206672668457, "global_step": 128301, "epoch": 3054} {"train_loss": -6.78796911239624, "global_step": 128302, "epoch": 3054} {"train_loss": -6.7620062828063965, "global_step": 128303, "epoch": 3054} {"train_loss": -6.629824638366699, "global_step": 128304, "epoch": 3054} {"train_loss": -6.682539463043213, "global_step": 128305, "epoch": 3054} {"train_loss": -6.543932914733887, "global_step": 128306, "epoch": 3054} {"train_loss": -6.642498016357422, "global_step": 128307, "epoch": 3054} {"train_loss": -6.716042518615723, "global_step": 128308, "epoch": 3054} {"train_loss": -6.6802251906622026, "global_step": 128309, "epoch": 3054, "val_loss": 77366.265625} {"train_loss": -6.739026069641113, "global_step": 128310, "epoch": 3055} {"train_loss": -6.812824726104736, "global_step": 128311, "epoch": 3055} {"train_loss": -6.7728776931762695, "global_step": 128312, "epoch": 3055} {"train_loss": -6.609240531921387, "global_step": 128313, "epoch": 3055} {"train_loss": -6.706667900085449, "global_step": 128314, "epoch": 3055} {"train_loss": -6.757667541503906, "global_step": 128315, "epoch": 3055} {"train_loss": -6.739108562469482, "global_step": 128316, "epoch": 3055} {"train_loss": -6.744874000549316, "global_step": 128317, "epoch": 3055} {"train_loss": -6.663763999938965, "global_step": 128318, "epoch": 3055} {"train_loss": -6.829596519470215, "global_step": 128319, "epoch": 3055} {"train_loss": -6.645686626434326, "global_step": 128320, "epoch": 3055} {"train_loss": -6.787178039550781, "global_step": 128321, "epoch": 3055} {"train_loss": -6.685086250305176, "global_step": 128322, "epoch": 3055} {"train_loss": -6.654340744018555, "global_step": 128323, "epoch": 3055} {"train_loss": -6.743353843688965, "global_step": 128324, "epoch": 3055} {"train_loss": -6.533391952514648, "global_step": 128325, "epoch": 3055} {"train_loss": -6.655601978302002, "global_step": 128326, "epoch": 3055} {"train_loss": -6.640059471130371, "global_step": 128327, "epoch": 3055} {"train_loss": -6.567203521728516, "global_step": 128328, "epoch": 3055} {"train_loss": -6.55232572555542, "global_step": 128329, "epoch": 3055} {"train_loss": -6.709347724914551, "global_step": 128330, "epoch": 3055} {"train_loss": -6.578440189361572, "global_step": 128331, "epoch": 3055} {"train_loss": -6.547266483306885, "global_step": 128332, "epoch": 3055} {"train_loss": -6.60001277923584, "global_step": 128333, "epoch": 3055} {"train_loss": -6.555514335632324, "global_step": 128334, "epoch": 3055} {"train_loss": -6.6540656089782715, "global_step": 128335, "epoch": 3055} {"train_loss": -6.549560070037842, "global_step": 128336, "epoch": 3055} {"train_loss": -6.502914905548096, "global_step": 128337, "epoch": 3055} {"train_loss": -6.474987983703613, "global_step": 128338, "epoch": 3055} {"train_loss": -6.55803108215332, "global_step": 128339, "epoch": 3055} {"train_loss": -6.629075050354004, "global_step": 128340, "epoch": 3055} {"train_loss": -6.695680141448975, "global_step": 128341, "epoch": 3055} {"train_loss": -6.611783504486084, "global_step": 128342, "epoch": 3055} {"train_loss": -6.614341735839844, "global_step": 128343, "epoch": 3055} {"train_loss": -6.604377746582031, "global_step": 128344, "epoch": 3055} {"train_loss": -6.618592739105225, "global_step": 128345, "epoch": 3055} {"train_loss": -6.527820110321045, "global_step": 128346, "epoch": 3055} {"train_loss": -6.703252792358398, "global_step": 128347, "epoch": 3055} {"train_loss": -6.63106107711792, "global_step": 128348, "epoch": 3055} {"train_loss": -6.634449481964111, "global_step": 128349, "epoch": 3055} {"train_loss": -6.631021499633789, "global_step": 128350, "epoch": 3055} {"train_loss": -6.644847903932844, "global_step": 128351, "epoch": 3055, "val_loss": 77147.015625} {"train_loss": -6.703892707824707, "global_step": 128352, "epoch": 3056} {"train_loss": -6.748684406280518, "global_step": 128353, "epoch": 3056} {"train_loss": -6.560783386230469, "global_step": 128354, "epoch": 3056} {"train_loss": -6.6733551025390625, "global_step": 128355, "epoch": 3056} {"train_loss": -6.599201202392578, "global_step": 128356, "epoch": 3056} {"train_loss": -6.536013603210449, "global_step": 128357, "epoch": 3056} {"train_loss": -6.635994911193848, "global_step": 128358, "epoch": 3056} {"train_loss": -6.67009162902832, "global_step": 128359, "epoch": 3056} {"train_loss": -6.573618412017822, "global_step": 128360, "epoch": 3056} {"train_loss": -6.672237396240234, "global_step": 128361, "epoch": 3056} {"train_loss": -6.574925899505615, "global_step": 128362, "epoch": 3056} {"train_loss": -6.7561235427856445, "global_step": 128363, "epoch": 3056} {"train_loss": -6.592934608459473, "global_step": 128364, "epoch": 3056} {"train_loss": -6.561448097229004, "global_step": 128365, "epoch": 3056} {"train_loss": -6.725087642669678, "global_step": 128366, "epoch": 3056} {"train_loss": -6.634250640869141, "global_step": 128367, "epoch": 3056} {"train_loss": -6.6287841796875, "global_step": 128368, "epoch": 3056} {"train_loss": -6.636539936065674, "global_step": 128369, "epoch": 3056} {"train_loss": -6.691988468170166, "global_step": 128370, "epoch": 3056} {"train_loss": -6.5889692306518555, "global_step": 128371, "epoch": 3056} {"train_loss": -6.660501480102539, "global_step": 128372, "epoch": 3056} {"train_loss": -6.669659614562988, "global_step": 128373, "epoch": 3056} {"train_loss": -6.617378234863281, "global_step": 128374, "epoch": 3056} {"train_loss": -6.667230606079102, "global_step": 128375, "epoch": 3056} {"train_loss": -6.665823936462402, "global_step": 128376, "epoch": 3056} {"train_loss": -6.635992527008057, "global_step": 128377, "epoch": 3056} {"train_loss": -6.647226810455322, "global_step": 128378, "epoch": 3056} {"train_loss": -6.638476371765137, "global_step": 128379, "epoch": 3056} {"train_loss": -6.667354583740234, "global_step": 128380, "epoch": 3056} {"train_loss": -6.636571407318115, "global_step": 128381, "epoch": 3056} {"train_loss": -6.644192218780518, "global_step": 128382, "epoch": 3056} {"train_loss": -6.759518623352051, "global_step": 128383, "epoch": 3056} {"train_loss": -6.53963565826416, "global_step": 128384, "epoch": 3056} {"train_loss": -6.632665634155273, "global_step": 128385, "epoch": 3056} {"train_loss": -6.604104995727539, "global_step": 128386, "epoch": 3056} {"train_loss": -6.648024559020996, "global_step": 128387, "epoch": 3056} {"train_loss": -6.784949779510498, "global_step": 128388, "epoch": 3056} {"train_loss": -6.597093105316162, "global_step": 128389, "epoch": 3056} {"train_loss": -6.7113447189331055, "global_step": 128390, "epoch": 3056} {"train_loss": -6.719096660614014, "global_step": 128391, "epoch": 3056} {"train_loss": -6.740781784057617, "global_step": 128392, "epoch": 3056} {"train_loss": -6.650879905337379, "global_step": 128393, "epoch": 3056, "val_loss": 77442.3203125} {"train_loss": -6.61691951751709, "global_step": 128394, "epoch": 3057} {"train_loss": -6.6851301193237305, "global_step": 128395, "epoch": 3057} {"train_loss": -6.745174407958984, "global_step": 128396, "epoch": 3057} {"train_loss": -6.764152526855469, "global_step": 128397, "epoch": 3057} {"train_loss": -6.692248821258545, "global_step": 128398, "epoch": 3057} {"train_loss": -6.711263179779053, "global_step": 128399, "epoch": 3057} {"train_loss": -6.708529472351074, "global_step": 128400, "epoch": 3057} {"train_loss": -6.577617168426514, "global_step": 128401, "epoch": 3057} {"train_loss": -6.59783935546875, "global_step": 128402, "epoch": 3057} {"train_loss": -6.626430034637451, "global_step": 128403, "epoch": 3057} {"train_loss": -6.599952697753906, "global_step": 128404, "epoch": 3057} {"train_loss": -6.65272855758667, "global_step": 128405, "epoch": 3057} {"train_loss": -6.709526062011719, "global_step": 128406, "epoch": 3057} {"train_loss": -6.613943099975586, "global_step": 128407, "epoch": 3057} {"train_loss": -6.6702728271484375, "global_step": 128408, "epoch": 3057} {"train_loss": -6.607481002807617, "global_step": 128409, "epoch": 3057} {"train_loss": -6.8174848556518555, "global_step": 128410, "epoch": 3057} {"train_loss": -6.570671081542969, "global_step": 128411, "epoch": 3057} {"train_loss": -6.617005825042725, "global_step": 128412, "epoch": 3057} {"train_loss": -6.693775177001953, "global_step": 128413, "epoch": 3057} {"train_loss": -6.650965213775635, "global_step": 128414, "epoch": 3057} {"train_loss": -6.7747321128845215, "global_step": 128415, "epoch": 3057} {"train_loss": -6.5990986824035645, "global_step": 128416, "epoch": 3057} {"train_loss": -6.662172317504883, "global_step": 128417, "epoch": 3057} {"train_loss": -6.75162935256958, "global_step": 128418, "epoch": 3057} {"train_loss": -6.623366355895996, "global_step": 128419, "epoch": 3057} {"train_loss": -6.688877105712891, "global_step": 128420, "epoch": 3057} {"train_loss": -6.697455406188965, "global_step": 128421, "epoch": 3057} {"train_loss": -6.678102493286133, "global_step": 128422, "epoch": 3057} {"train_loss": -6.64420747756958, "global_step": 128423, "epoch": 3057} {"train_loss": -6.54435920715332, "global_step": 128424, "epoch": 3057} {"train_loss": -6.657299995422363, "global_step": 128425, "epoch": 3057} {"train_loss": -6.68143892288208, "global_step": 128426, "epoch": 3057} {"train_loss": -6.6633734703063965, "global_step": 128427, "epoch": 3057} {"train_loss": -6.674638748168945, "global_step": 128428, "epoch": 3057} {"train_loss": -6.643928050994873, "global_step": 128429, "epoch": 3057} {"train_loss": -6.633914470672607, "global_step": 128430, "epoch": 3057} {"train_loss": -6.7661452293396, "global_step": 128431, "epoch": 3057} {"train_loss": -6.636379241943359, "global_step": 128432, "epoch": 3057} {"train_loss": -6.7407097816467285, "global_step": 128433, "epoch": 3057} {"train_loss": -6.786949157714844, "global_step": 128434, "epoch": 3057} {"train_loss": -6.670608066377186, "global_step": 128435, "epoch": 3057, "val_loss": 77298.8046875} {"train_loss": -6.653850555419922, "global_step": 128436, "epoch": 3058} {"train_loss": -6.739853382110596, "global_step": 128437, "epoch": 3058} {"train_loss": -6.733920097351074, "global_step": 128438, "epoch": 3058} {"train_loss": -6.595475673675537, "global_step": 128439, "epoch": 3058} {"train_loss": -6.656733512878418, "global_step": 128440, "epoch": 3058} {"train_loss": -6.630176544189453, "global_step": 128441, "epoch": 3058} {"train_loss": -6.625324249267578, "global_step": 128442, "epoch": 3058} {"train_loss": -6.678210735321045, "global_step": 128443, "epoch": 3058} {"train_loss": -6.618164539337158, "global_step": 128444, "epoch": 3058} {"train_loss": -6.585326671600342, "global_step": 128445, "epoch": 3058} {"train_loss": -6.7526445388793945, "global_step": 128446, "epoch": 3058} {"train_loss": -6.607787132263184, "global_step": 128447, "epoch": 3058} {"train_loss": -6.683175563812256, "global_step": 128448, "epoch": 3058} {"train_loss": -6.703890800476074, "global_step": 128449, "epoch": 3058} {"train_loss": -6.697165489196777, "global_step": 128450, "epoch": 3058} {"train_loss": -6.702461242675781, "global_step": 128451, "epoch": 3058} {"train_loss": -6.608886241912842, "global_step": 128452, "epoch": 3058} {"train_loss": -6.689807415008545, "global_step": 128453, "epoch": 3058} {"train_loss": -6.748992919921875, "global_step": 128454, "epoch": 3058} {"train_loss": -6.62617301940918, "global_step": 128455, "epoch": 3058} {"train_loss": -6.615621566772461, "global_step": 128456, "epoch": 3058} {"train_loss": -6.759575843811035, "global_step": 128457, "epoch": 3058} {"train_loss": -6.66115665435791, "global_step": 128458, "epoch": 3058} {"train_loss": -6.662225723266602, "global_step": 128459, "epoch": 3058} {"train_loss": -6.49125862121582, "global_step": 128460, "epoch": 3058} {"train_loss": -6.5871477127075195, "global_step": 128461, "epoch": 3058} {"train_loss": -6.657683849334717, "global_step": 128462, "epoch": 3058} {"train_loss": -6.700076103210449, "global_step": 128463, "epoch": 3058} {"train_loss": -6.507856369018555, "global_step": 128464, "epoch": 3058} {"train_loss": -6.517343044281006, "global_step": 128465, "epoch": 3058} {"train_loss": -6.622845649719238, "global_step": 128466, "epoch": 3058} {"train_loss": -6.736241340637207, "global_step": 128467, "epoch": 3058} {"train_loss": -6.614226341247559, "global_step": 128468, "epoch": 3058} {"train_loss": -6.613965034484863, "global_step": 128469, "epoch": 3058} {"train_loss": -6.615735054016113, "global_step": 128470, "epoch": 3058} {"train_loss": -6.623368263244629, "global_step": 128471, "epoch": 3058} {"train_loss": -6.484996318817139, "global_step": 128472, "epoch": 3058} {"train_loss": -6.472668647766113, "global_step": 128473, "epoch": 3058} {"train_loss": -6.470403671264648, "global_step": 128474, "epoch": 3058} {"train_loss": -6.701902389526367, "global_step": 128475, "epoch": 3058} {"train_loss": -6.5843963623046875, "global_step": 128476, "epoch": 3058} {"train_loss": -6.633532478695824, "global_step": 128477, "epoch": 3058, "val_loss": 77342.9453125} {"train_loss": -6.631951808929443, "global_step": 128478, "epoch": 3059} {"train_loss": -6.614542007446289, "global_step": 128479, "epoch": 3059} {"train_loss": -6.559347152709961, "global_step": 128480, "epoch": 3059} {"train_loss": -6.582401275634766, "global_step": 128481, "epoch": 3059} {"train_loss": -6.638142108917236, "global_step": 128482, "epoch": 3059} {"train_loss": -6.725735664367676, "global_step": 128483, "epoch": 3059} {"train_loss": -6.5342583656311035, "global_step": 128484, "epoch": 3059} {"train_loss": -6.7016167640686035, "global_step": 128485, "epoch": 3059} {"train_loss": -6.7419843673706055, "global_step": 128486, "epoch": 3059} {"train_loss": -6.6264753341674805, "global_step": 128487, "epoch": 3059} {"train_loss": -6.65993595123291, "global_step": 128488, "epoch": 3059} {"train_loss": -6.675392150878906, "global_step": 128489, "epoch": 3059} {"train_loss": -6.629218101501465, "global_step": 128490, "epoch": 3059} {"train_loss": -6.672436714172363, "global_step": 128491, "epoch": 3059} {"train_loss": -6.685924530029297, "global_step": 128492, "epoch": 3059} {"train_loss": -6.664250373840332, "global_step": 128493, "epoch": 3059} {"train_loss": -6.540558815002441, "global_step": 128494, "epoch": 3059} {"train_loss": -6.690708637237549, "global_step": 128495, "epoch": 3059} {"train_loss": -6.570313453674316, "global_step": 128496, "epoch": 3059} {"train_loss": -6.7608795166015625, "global_step": 128497, "epoch": 3059} {"train_loss": -6.65496826171875, "global_step": 128498, "epoch": 3059} {"train_loss": -6.749359130859375, "global_step": 128499, "epoch": 3059} {"train_loss": -6.760313034057617, "global_step": 128500, "epoch": 3059} {"train_loss": -6.688266754150391, "global_step": 128501, "epoch": 3059} {"train_loss": -6.667607307434082, "global_step": 128502, "epoch": 3059} {"train_loss": -6.657600402832031, "global_step": 128503, "epoch": 3059} {"train_loss": -6.710363388061523, "global_step": 128504, "epoch": 3059} {"train_loss": -6.643983364105225, "global_step": 128505, "epoch": 3059} {"train_loss": -6.745924949645996, "global_step": 128506, "epoch": 3059} {"train_loss": -6.701930999755859, "global_step": 128507, "epoch": 3059} {"train_loss": -6.658316612243652, "global_step": 128508, "epoch": 3059} {"train_loss": -6.550125598907471, "global_step": 128509, "epoch": 3059} {"train_loss": -6.850316047668457, "global_step": 128510, "epoch": 3059} {"train_loss": -6.697755813598633, "global_step": 128511, "epoch": 3059} {"train_loss": -6.601099491119385, "global_step": 128512, "epoch": 3059} {"train_loss": -6.548819065093994, "global_step": 128513, "epoch": 3059} {"train_loss": -6.701625347137451, "global_step": 128514, "epoch": 3059} {"train_loss": -6.767923355102539, "global_step": 128515, "epoch": 3059} {"train_loss": -6.66082239151001, "global_step": 128516, "epoch": 3059} {"train_loss": -6.634980201721191, "global_step": 128517, "epoch": 3059} {"train_loss": -6.6097869873046875, "global_step": 128518, "epoch": 3059} {"train_loss": -6.663263593401227, "global_step": 128519, "epoch": 3059, "val_loss": 77600.4375} {"train_loss": -6.592923164367676, "global_step": 128520, "epoch": 3060} {"train_loss": -6.494274616241455, "global_step": 128521, "epoch": 3060} {"train_loss": -6.633768081665039, "global_step": 128522, "epoch": 3060} {"train_loss": -6.669341564178467, "global_step": 128523, "epoch": 3060} {"train_loss": -6.464157581329346, "global_step": 128524, "epoch": 3060} {"train_loss": -6.652041912078857, "global_step": 128525, "epoch": 3060} {"train_loss": -6.670086860656738, "global_step": 128526, "epoch": 3060} {"train_loss": -6.638737678527832, "global_step": 128527, "epoch": 3060} {"train_loss": -6.6583356857299805, "global_step": 128528, "epoch": 3060} {"train_loss": -6.589487075805664, "global_step": 128529, "epoch": 3060} {"train_loss": -6.582664489746094, "global_step": 128530, "epoch": 3060} {"train_loss": -6.674463272094727, "global_step": 128531, "epoch": 3060} {"train_loss": -6.539212226867676, "global_step": 128532, "epoch": 3060} {"train_loss": -6.753446102142334, "global_step": 128533, "epoch": 3060} {"train_loss": -6.457036018371582, "global_step": 128534, "epoch": 3060} {"train_loss": -6.527469635009766, "global_step": 128535, "epoch": 3060} {"train_loss": -6.560297966003418, "global_step": 128536, "epoch": 3060} {"train_loss": -6.521557807922363, "global_step": 128537, "epoch": 3060} {"train_loss": -6.523410797119141, "global_step": 128538, "epoch": 3060} {"train_loss": -6.455801963806152, "global_step": 128539, "epoch": 3060} {"train_loss": -6.538033485412598, "global_step": 128540, "epoch": 3060} {"train_loss": -6.407224178314209, "global_step": 128541, "epoch": 3060} {"train_loss": -6.684553146362305, "global_step": 128542, "epoch": 3060} {"train_loss": -6.443791389465332, "global_step": 128543, "epoch": 3060} {"train_loss": -6.577638626098633, "global_step": 128544, "epoch": 3060} {"train_loss": -6.369287490844727, "global_step": 128545, "epoch": 3060} {"train_loss": -6.541727066040039, "global_step": 128546, "epoch": 3060} {"train_loss": -6.455599784851074, "global_step": 128547, "epoch": 3060} {"train_loss": -6.571941375732422, "global_step": 128548, "epoch": 3060} {"train_loss": -6.43324089050293, "global_step": 128549, "epoch": 3060} {"train_loss": -6.512662410736084, "global_step": 128550, "epoch": 3060} {"train_loss": -6.472598075866699, "global_step": 128551, "epoch": 3060} {"train_loss": -6.645841598510742, "global_step": 128552, "epoch": 3060} {"train_loss": -6.485465049743652, "global_step": 128553, "epoch": 3060} {"train_loss": -6.4853835105896, "global_step": 128554, "epoch": 3060} {"train_loss": -6.570605278015137, "global_step": 128555, "epoch": 3060} {"train_loss": -6.619453430175781, "global_step": 128556, "epoch": 3060} {"train_loss": -6.44944953918457, "global_step": 128557, "epoch": 3060} {"train_loss": -6.5879316329956055, "global_step": 128558, "epoch": 3060} {"train_loss": -6.604859352111816, "global_step": 128559, "epoch": 3060} {"train_loss": -6.698290824890137, "global_step": 128560, "epoch": 3060} {"train_loss": -6.556886434555054, "global_step": 128561, "epoch": 3060, "val_loss": 77342.4140625} {"train_loss": -6.6052021980285645, "global_step": 128562, "epoch": 3061} {"train_loss": -6.671612739562988, "global_step": 128563, "epoch": 3061} {"train_loss": -6.716772079467773, "global_step": 128564, "epoch": 3061} {"train_loss": -6.644522666931152, "global_step": 128565, "epoch": 3061} {"train_loss": -6.5796003341674805, "global_step": 128566, "epoch": 3061} {"train_loss": -6.6323676109313965, "global_step": 128567, "epoch": 3061} {"train_loss": -6.60267448425293, "global_step": 128568, "epoch": 3061} {"train_loss": -6.6475677490234375, "global_step": 128569, "epoch": 3061} {"train_loss": -6.760478973388672, "global_step": 128570, "epoch": 3061} {"train_loss": -6.726581573486328, "global_step": 128571, "epoch": 3061} {"train_loss": -6.632205009460449, "global_step": 128572, "epoch": 3061} {"train_loss": -6.706595420837402, "global_step": 128573, "epoch": 3061} {"train_loss": -6.603645324707031, "global_step": 128574, "epoch": 3061} {"train_loss": -6.5693182945251465, "global_step": 128575, "epoch": 3061} {"train_loss": -6.672043800354004, "global_step": 128576, "epoch": 3061} {"train_loss": -6.6631011962890625, "global_step": 128577, "epoch": 3061} {"train_loss": -6.610872268676758, "global_step": 128578, "epoch": 3061} {"train_loss": -6.664734840393066, "global_step": 128579, "epoch": 3061} {"train_loss": -6.774096965789795, "global_step": 128580, "epoch": 3061} {"train_loss": -6.584805488586426, "global_step": 128581, "epoch": 3061} {"train_loss": -6.733258247375488, "global_step": 128582, "epoch": 3061} {"train_loss": -6.668848991394043, "global_step": 128583, "epoch": 3061} {"train_loss": -6.5829548835754395, "global_step": 128584, "epoch": 3061} {"train_loss": -6.740471839904785, "global_step": 128585, "epoch": 3061} {"train_loss": -6.6112060546875, "global_step": 128586, "epoch": 3061} {"train_loss": -6.759006500244141, "global_step": 128587, "epoch": 3061} {"train_loss": -6.721022605895996, "global_step": 128588, "epoch": 3061} {"train_loss": -6.672997951507568, "global_step": 128589, "epoch": 3061} {"train_loss": -6.672106742858887, "global_step": 128590, "epoch": 3061} {"train_loss": -6.657290458679199, "global_step": 128591, "epoch": 3061} {"train_loss": -6.714418411254883, "global_step": 128592, "epoch": 3061} {"train_loss": -6.587196350097656, "global_step": 128593, "epoch": 3061} {"train_loss": -6.595317840576172, "global_step": 128594, "epoch": 3061} {"train_loss": -6.675685882568359, "global_step": 128595, "epoch": 3061} {"train_loss": -6.612383842468262, "global_step": 128596, "epoch": 3061} {"train_loss": -6.6449995040893555, "global_step": 128597, "epoch": 3061} {"train_loss": -6.665172576904297, "global_step": 128598, "epoch": 3061} {"train_loss": -6.604562759399414, "global_step": 128599, "epoch": 3061} {"train_loss": -6.686718940734863, "global_step": 128600, "epoch": 3061} {"train_loss": -6.544886589050293, "global_step": 128601, "epoch": 3061} {"train_loss": -6.507331848144531, "global_step": 128602, "epoch": 3061} {"train_loss": -6.651506639662243, "global_step": 128603, "epoch": 3061, "val_loss": 77360.015625} {"train_loss": -6.514845848083496, "global_step": 128604, "epoch": 3062} {"train_loss": -6.532686710357666, "global_step": 128605, "epoch": 3062} {"train_loss": -6.585068225860596, "global_step": 128606, "epoch": 3062} {"train_loss": -6.569915771484375, "global_step": 128607, "epoch": 3062} {"train_loss": -6.617668151855469, "global_step": 128608, "epoch": 3062} {"train_loss": -6.5724029541015625, "global_step": 128609, "epoch": 3062} {"train_loss": -6.53081750869751, "global_step": 128610, "epoch": 3062} {"train_loss": -6.644779205322266, "global_step": 128611, "epoch": 3062} {"train_loss": -6.399731159210205, "global_step": 128612, "epoch": 3062} {"train_loss": -6.566457271575928, "global_step": 128613, "epoch": 3062} {"train_loss": -6.522453308105469, "global_step": 128614, "epoch": 3062} {"train_loss": -6.664041519165039, "global_step": 128615, "epoch": 3062} {"train_loss": -6.639850616455078, "global_step": 128616, "epoch": 3062} {"train_loss": -6.606934547424316, "global_step": 128617, "epoch": 3062} {"train_loss": -6.606651306152344, "global_step": 128618, "epoch": 3062} {"train_loss": -6.592167854309082, "global_step": 128619, "epoch": 3062} {"train_loss": -6.68414831161499, "global_step": 128620, "epoch": 3062} {"train_loss": -6.489531517028809, "global_step": 128621, "epoch": 3062} {"train_loss": -6.709438323974609, "global_step": 128622, "epoch": 3062} {"train_loss": -6.632033348083496, "global_step": 128623, "epoch": 3062} {"train_loss": -6.624095916748047, "global_step": 128624, "epoch": 3062} {"train_loss": -6.643903732299805, "global_step": 128625, "epoch": 3062} {"train_loss": -6.589480400085449, "global_step": 128626, "epoch": 3062} {"train_loss": -6.604494094848633, "global_step": 128627, "epoch": 3062} {"train_loss": -6.725048065185547, "global_step": 128628, "epoch": 3062} {"train_loss": -6.662915229797363, "global_step": 128629, "epoch": 3062} {"train_loss": -6.733297348022461, "global_step": 128630, "epoch": 3062} {"train_loss": -6.717779636383057, "global_step": 128631, "epoch": 3062} {"train_loss": -6.665986061096191, "global_step": 128632, "epoch": 3062} {"train_loss": -6.799920082092285, "global_step": 128633, "epoch": 3062} {"train_loss": -6.614762306213379, "global_step": 128634, "epoch": 3062} {"train_loss": -6.592158317565918, "global_step": 128635, "epoch": 3062} {"train_loss": -6.716385364532471, "global_step": 128636, "epoch": 3062} {"train_loss": -6.724072456359863, "global_step": 128637, "epoch": 3062} {"train_loss": -6.700360298156738, "global_step": 128638, "epoch": 3062} {"train_loss": -6.568868160247803, "global_step": 128639, "epoch": 3062} {"train_loss": -6.612534523010254, "global_step": 128640, "epoch": 3062} {"train_loss": -6.743671417236328, "global_step": 128641, "epoch": 3062} {"train_loss": -6.616781234741211, "global_step": 128642, "epoch": 3062} {"train_loss": -6.667320251464844, "global_step": 128643, "epoch": 3062} {"train_loss": -6.692775249481201, "global_step": 128644, "epoch": 3062} {"train_loss": -6.624520040693737, "global_step": 128645, "epoch": 3062, "val_loss": 77426.3984375} {"train_loss": -6.618247032165527, "global_step": 128646, "epoch": 3063} {"train_loss": -6.63945198059082, "global_step": 128647, "epoch": 3063} {"train_loss": -6.595883846282959, "global_step": 128648, "epoch": 3063} {"train_loss": -6.595754146575928, "global_step": 128649, "epoch": 3063} {"train_loss": -6.672623634338379, "global_step": 128650, "epoch": 3063} {"train_loss": -6.671412467956543, "global_step": 128651, "epoch": 3063} {"train_loss": -6.674797058105469, "global_step": 128652, "epoch": 3063} {"train_loss": -6.723778247833252, "global_step": 128653, "epoch": 3063} {"train_loss": -6.754611968994141, "global_step": 128654, "epoch": 3063} {"train_loss": -6.846911430358887, "global_step": 128655, "epoch": 3063} {"train_loss": -6.669351577758789, "global_step": 128656, "epoch": 3063} {"train_loss": -6.730186462402344, "global_step": 128657, "epoch": 3063} {"train_loss": -6.815120697021484, "global_step": 128658, "epoch": 3063} {"train_loss": -6.670868873596191, "global_step": 128659, "epoch": 3063} {"train_loss": -6.709772109985352, "global_step": 128660, "epoch": 3063} {"train_loss": -6.652640342712402, "global_step": 128661, "epoch": 3063} {"train_loss": -6.692371368408203, "global_step": 128662, "epoch": 3063} {"train_loss": -6.701190948486328, "global_step": 128663, "epoch": 3063} {"train_loss": -6.756505489349365, "global_step": 128664, "epoch": 3063} {"train_loss": -6.613330364227295, "global_step": 128665, "epoch": 3063} {"train_loss": -6.743193626403809, "global_step": 128666, "epoch": 3063} {"train_loss": -6.658457279205322, "global_step": 128667, "epoch": 3063} {"train_loss": -6.701578140258789, "global_step": 128668, "epoch": 3063} {"train_loss": -6.646844863891602, "global_step": 128669, "epoch": 3063} {"train_loss": -6.663989067077637, "global_step": 128670, "epoch": 3063} {"train_loss": -6.698299884796143, "global_step": 128671, "epoch": 3063} {"train_loss": -6.712848663330078, "global_step": 128672, "epoch": 3063} {"train_loss": -6.49810266494751, "global_step": 128673, "epoch": 3063} {"train_loss": -6.622264862060547, "global_step": 128674, "epoch": 3063} {"train_loss": -6.67177152633667, "global_step": 128675, "epoch": 3063} {"train_loss": -6.606828689575195, "global_step": 128676, "epoch": 3063} {"train_loss": -6.59505558013916, "global_step": 128677, "epoch": 3063} {"train_loss": -6.675351142883301, "global_step": 128678, "epoch": 3063} {"train_loss": -6.482630729675293, "global_step": 128679, "epoch": 3063} {"train_loss": -6.736372947692871, "global_step": 128680, "epoch": 3063} {"train_loss": -6.590550422668457, "global_step": 128681, "epoch": 3063} {"train_loss": -6.534584045410156, "global_step": 128682, "epoch": 3063} {"train_loss": -6.587497234344482, "global_step": 128683, "epoch": 3063} {"train_loss": -6.66603946685791, "global_step": 128684, "epoch": 3063} {"train_loss": -6.614255905151367, "global_step": 128685, "epoch": 3063} {"train_loss": -6.655928611755371, "global_step": 128686, "epoch": 3063} {"train_loss": -6.66296446891058, "global_step": 128687, "epoch": 3063, "val_loss": 77438.0078125} {"train_loss": -6.588067531585693, "global_step": 128688, "epoch": 3064} {"train_loss": -6.723389625549316, "global_step": 128689, "epoch": 3064} {"train_loss": -6.521219253540039, "global_step": 128690, "epoch": 3064} {"train_loss": -6.6894941329956055, "global_step": 128691, "epoch": 3064} {"train_loss": -6.553600311279297, "global_step": 128692, "epoch": 3064} {"train_loss": -6.76167106628418, "global_step": 128693, "epoch": 3064} {"train_loss": -6.591130256652832, "global_step": 128694, "epoch": 3064} {"train_loss": -6.703278064727783, "global_step": 128695, "epoch": 3064} {"train_loss": -6.6222734451293945, "global_step": 128696, "epoch": 3064} {"train_loss": -6.593545436859131, "global_step": 128697, "epoch": 3064} {"train_loss": -6.730574131011963, "global_step": 128698, "epoch": 3064} {"train_loss": -6.623605728149414, "global_step": 128699, "epoch": 3064} {"train_loss": -6.550926208496094, "global_step": 128700, "epoch": 3064} {"train_loss": -6.618687152862549, "global_step": 128701, "epoch": 3064} {"train_loss": -6.648079872131348, "global_step": 128702, "epoch": 3064} {"train_loss": -6.612417221069336, "global_step": 128703, "epoch": 3064} {"train_loss": -6.591480255126953, "global_step": 128704, "epoch": 3064} {"train_loss": -6.6461076736450195, "global_step": 128705, "epoch": 3064} {"train_loss": -6.569635391235352, "global_step": 128706, "epoch": 3064} {"train_loss": -6.462593078613281, "global_step": 128707, "epoch": 3064} {"train_loss": -6.674705505371094, "global_step": 128708, "epoch": 3064} {"train_loss": -6.596793174743652, "global_step": 128709, "epoch": 3064} {"train_loss": -6.694952964782715, "global_step": 128710, "epoch": 3064} {"train_loss": -6.630640983581543, "global_step": 128711, "epoch": 3064} {"train_loss": -6.6610212326049805, "global_step": 128712, "epoch": 3064} {"train_loss": -6.621623992919922, "global_step": 128713, "epoch": 3064} {"train_loss": -6.660008430480957, "global_step": 128714, "epoch": 3064} {"train_loss": -6.544841766357422, "global_step": 128715, "epoch": 3064} {"train_loss": -6.724435806274414, "global_step": 128716, "epoch": 3064} {"train_loss": -6.627886772155762, "global_step": 128717, "epoch": 3064} {"train_loss": -6.656283855438232, "global_step": 128718, "epoch": 3064} {"train_loss": -6.610981464385986, "global_step": 128719, "epoch": 3064} {"train_loss": -6.605941295623779, "global_step": 128720, "epoch": 3064} {"train_loss": -6.790602207183838, "global_step": 128721, "epoch": 3064} {"train_loss": -6.473091125488281, "global_step": 128722, "epoch": 3064} {"train_loss": -6.659593105316162, "global_step": 128723, "epoch": 3064} {"train_loss": -6.523922920227051, "global_step": 128724, "epoch": 3064} {"train_loss": -6.650912284851074, "global_step": 128725, "epoch": 3064} {"train_loss": -6.66749382019043, "global_step": 128726, "epoch": 3064} {"train_loss": -6.651280879974365, "global_step": 128727, "epoch": 3064} {"train_loss": -6.657863616943359, "global_step": 128728, "epoch": 3064} {"train_loss": -6.628267356327602, "global_step": 128729, "epoch": 3064, "val_loss": 77470.0703125} {"train_loss": -6.6147661209106445, "global_step": 128730, "epoch": 3065} {"train_loss": -6.757618427276611, "global_step": 128731, "epoch": 3065} {"train_loss": -6.698118686676025, "global_step": 128732, "epoch": 3065} {"train_loss": -6.752132415771484, "global_step": 128733, "epoch": 3065} {"train_loss": -6.754116058349609, "global_step": 128734, "epoch": 3065} {"train_loss": -6.562838554382324, "global_step": 128735, "epoch": 3065} {"train_loss": -6.649848937988281, "global_step": 128736, "epoch": 3065} {"train_loss": -6.682952880859375, "global_step": 128737, "epoch": 3065} {"train_loss": -6.69307804107666, "global_step": 128738, "epoch": 3065} {"train_loss": -6.639341354370117, "global_step": 128739, "epoch": 3065} {"train_loss": -6.714409828186035, "global_step": 128740, "epoch": 3065} {"train_loss": -6.564354419708252, "global_step": 128741, "epoch": 3065} {"train_loss": -6.572564125061035, "global_step": 128742, "epoch": 3065} {"train_loss": -6.479069232940674, "global_step": 128743, "epoch": 3065} {"train_loss": -6.543612480163574, "global_step": 128744, "epoch": 3065} {"train_loss": -6.717915058135986, "global_step": 128745, "epoch": 3065} {"train_loss": -6.581531524658203, "global_step": 128746, "epoch": 3065} {"train_loss": -6.722264766693115, "global_step": 128747, "epoch": 3065} {"train_loss": -6.57485294342041, "global_step": 128748, "epoch": 3065} {"train_loss": -6.546855926513672, "global_step": 128749, "epoch": 3065} {"train_loss": -6.579328536987305, "global_step": 128750, "epoch": 3065} {"train_loss": -6.5541863441467285, "global_step": 128751, "epoch": 3065} {"train_loss": -6.688967704772949, "global_step": 128752, "epoch": 3065} {"train_loss": -6.498220443725586, "global_step": 128753, "epoch": 3065} {"train_loss": -6.508584976196289, "global_step": 128754, "epoch": 3065} {"train_loss": -6.719557285308838, "global_step": 128755, "epoch": 3065} {"train_loss": -6.643320083618164, "global_step": 128756, "epoch": 3065} {"train_loss": -6.58709716796875, "global_step": 128757, "epoch": 3065} {"train_loss": -6.626825332641602, "global_step": 128758, "epoch": 3065} {"train_loss": -6.730864524841309, "global_step": 128759, "epoch": 3065} {"train_loss": -6.569422721862793, "global_step": 128760, "epoch": 3065} {"train_loss": -6.721067428588867, "global_step": 128761, "epoch": 3065} {"train_loss": -6.694441795349121, "global_step": 128762, "epoch": 3065} {"train_loss": -6.546303749084473, "global_step": 128763, "epoch": 3065} {"train_loss": -6.654122352600098, "global_step": 128764, "epoch": 3065} {"train_loss": -6.670877456665039, "global_step": 128765, "epoch": 3065} {"train_loss": -6.554483413696289, "global_step": 128766, "epoch": 3065} {"train_loss": -6.561760902404785, "global_step": 128767, "epoch": 3065} {"train_loss": -6.455177307128906, "global_step": 128768, "epoch": 3065} {"train_loss": -6.660508632659912, "global_step": 128769, "epoch": 3065} {"train_loss": -6.673894882202148, "global_step": 128770, "epoch": 3065} {"train_loss": -6.62443673043024, "global_step": 128771, "epoch": 3065, "val_loss": 77442.8984375} {"train_loss": -6.702596187591553, "global_step": 128772, "epoch": 3066} {"train_loss": -6.645028114318848, "global_step": 128773, "epoch": 3066} {"train_loss": -6.6305437088012695, "global_step": 128774, "epoch": 3066} {"train_loss": -6.744936943054199, "global_step": 128775, "epoch": 3066} {"train_loss": -6.576596736907959, "global_step": 128776, "epoch": 3066} {"train_loss": -6.653066158294678, "global_step": 128777, "epoch": 3066} {"train_loss": -6.47531795501709, "global_step": 128778, "epoch": 3066} {"train_loss": -6.691465377807617, "global_step": 128779, "epoch": 3066} {"train_loss": -6.592733383178711, "global_step": 128780, "epoch": 3066} {"train_loss": -6.5347394943237305, "global_step": 128781, "epoch": 3066} {"train_loss": -6.597752571105957, "global_step": 128782, "epoch": 3066} {"train_loss": -6.604794502258301, "global_step": 128783, "epoch": 3066} {"train_loss": -6.612776279449463, "global_step": 128784, "epoch": 3066} {"train_loss": -6.659243583679199, "global_step": 128785, "epoch": 3066} {"train_loss": -6.585939884185791, "global_step": 128786, "epoch": 3066} {"train_loss": -6.6765642166137695, "global_step": 128787, "epoch": 3066} {"train_loss": -6.62161922454834, "global_step": 128788, "epoch": 3066} {"train_loss": -6.674968719482422, "global_step": 128789, "epoch": 3066} {"train_loss": -6.631335258483887, "global_step": 128790, "epoch": 3066} {"train_loss": -6.54951286315918, "global_step": 128791, "epoch": 3066} {"train_loss": -6.513246059417725, "global_step": 128792, "epoch": 3066} {"train_loss": -6.595400810241699, "global_step": 128793, "epoch": 3066} {"train_loss": -6.735997200012207, "global_step": 128794, "epoch": 3066} {"train_loss": -6.661646842956543, "global_step": 128795, "epoch": 3066} {"train_loss": -6.7637619972229, "global_step": 128796, "epoch": 3066} {"train_loss": -6.640807151794434, "global_step": 128797, "epoch": 3066} {"train_loss": -6.589776039123535, "global_step": 128798, "epoch": 3066} {"train_loss": -6.744158744812012, "global_step": 128799, "epoch": 3066} {"train_loss": -6.64349365234375, "global_step": 128800, "epoch": 3066} {"train_loss": -6.63331413269043, "global_step": 128801, "epoch": 3066} {"train_loss": -6.607327938079834, "global_step": 128802, "epoch": 3066} {"train_loss": -6.697587013244629, "global_step": 128803, "epoch": 3066} {"train_loss": -6.608442306518555, "global_step": 128804, "epoch": 3066} {"train_loss": -6.626921653747559, "global_step": 128805, "epoch": 3066} {"train_loss": -6.715071678161621, "global_step": 128806, "epoch": 3066} {"train_loss": -6.761656761169434, "global_step": 128807, "epoch": 3066} {"train_loss": -6.583132743835449, "global_step": 128808, "epoch": 3066} {"train_loss": -6.775918483734131, "global_step": 128809, "epoch": 3066} {"train_loss": -6.737203598022461, "global_step": 128810, "epoch": 3066} {"train_loss": -6.627083778381348, "global_step": 128811, "epoch": 3066} {"train_loss": -6.651795387268066, "global_step": 128812, "epoch": 3066} {"train_loss": -6.644106751396542, "global_step": 128813, "epoch": 3066, "val_loss": 77294.8984375} {"train_loss": -6.683655738830566, "global_step": 128814, "epoch": 3067} {"train_loss": -6.628756999969482, "global_step": 128815, "epoch": 3067} {"train_loss": -6.78585147857666, "global_step": 128816, "epoch": 3067} {"train_loss": -6.71173095703125, "global_step": 128817, "epoch": 3067} {"train_loss": -6.789595603942871, "global_step": 128818, "epoch": 3067} {"train_loss": -6.669114112854004, "global_step": 128819, "epoch": 3067} {"train_loss": -6.7197723388671875, "global_step": 128820, "epoch": 3067} {"train_loss": -6.672957420349121, "global_step": 128821, "epoch": 3067} {"train_loss": -6.7166643142700195, "global_step": 128822, "epoch": 3067} {"train_loss": -6.718679428100586, "global_step": 128823, "epoch": 3067} {"train_loss": -6.759541988372803, "global_step": 128824, "epoch": 3067} {"train_loss": -6.634242534637451, "global_step": 128825, "epoch": 3067} {"train_loss": -6.6203789710998535, "global_step": 128826, "epoch": 3067} {"train_loss": -6.6555986404418945, "global_step": 128827, "epoch": 3067} {"train_loss": -6.718687057495117, "global_step": 128828, "epoch": 3067} {"train_loss": -6.666028022766113, "global_step": 128829, "epoch": 3067} {"train_loss": -6.614755630493164, "global_step": 128830, "epoch": 3067} {"train_loss": -6.76793098449707, "global_step": 128831, "epoch": 3067} {"train_loss": -6.622925281524658, "global_step": 128832, "epoch": 3067} {"train_loss": -6.6516523361206055, "global_step": 128833, "epoch": 3067} {"train_loss": -6.7490081787109375, "global_step": 128834, "epoch": 3067} {"train_loss": -6.800580024719238, "global_step": 128835, "epoch": 3067} {"train_loss": -6.811403274536133, "global_step": 128836, "epoch": 3067} {"train_loss": -6.706886291503906, "global_step": 128837, "epoch": 3067} {"train_loss": -6.657535552978516, "global_step": 128838, "epoch": 3067} {"train_loss": -6.77324104309082, "global_step": 128839, "epoch": 3067} {"train_loss": -6.680167198181152, "global_step": 128840, "epoch": 3067} {"train_loss": -6.677646160125732, "global_step": 128841, "epoch": 3067} {"train_loss": -6.7096147537231445, "global_step": 128842, "epoch": 3067} {"train_loss": -6.734139442443848, "global_step": 128843, "epoch": 3067} {"train_loss": -6.701992988586426, "global_step": 128844, "epoch": 3067} {"train_loss": -6.614563465118408, "global_step": 128845, "epoch": 3067} {"train_loss": -6.552781581878662, "global_step": 128846, "epoch": 3067} {"train_loss": -6.719927787780762, "global_step": 128847, "epoch": 3067} {"train_loss": -6.7615861892700195, "global_step": 128848, "epoch": 3067} {"train_loss": -6.55225944519043, "global_step": 128849, "epoch": 3067} {"train_loss": -6.53842306137085, "global_step": 128850, "epoch": 3067} {"train_loss": -6.679062366485596, "global_step": 128851, "epoch": 3067} {"train_loss": -6.544053077697754, "global_step": 128852, "epoch": 3067} {"train_loss": -6.7402753829956055, "global_step": 128853, "epoch": 3067} {"train_loss": -6.608112812042236, "global_step": 128854, "epoch": 3067} {"train_loss": -6.684913828259423, "global_step": 128855, "epoch": 3067, "val_loss": 77691.265625} {"train_loss": -6.615086555480957, "global_step": 128856, "epoch": 3068} {"train_loss": -6.81195068359375, "global_step": 128857, "epoch": 3068} {"train_loss": -6.747971534729004, "global_step": 128858, "epoch": 3068} {"train_loss": -6.672798156738281, "global_step": 128859, "epoch": 3068} {"train_loss": -6.612903118133545, "global_step": 128860, "epoch": 3068} {"train_loss": -6.559818267822266, "global_step": 128861, "epoch": 3068} {"train_loss": -6.688994884490967, "global_step": 128862, "epoch": 3068} {"train_loss": -6.740612030029297, "global_step": 128863, "epoch": 3068} {"train_loss": -6.627288818359375, "global_step": 128864, "epoch": 3068} {"train_loss": -6.653428554534912, "global_step": 128865, "epoch": 3068} {"train_loss": -6.570252418518066, "global_step": 128866, "epoch": 3068} {"train_loss": -6.648879051208496, "global_step": 128867, "epoch": 3068} {"train_loss": -6.683498382568359, "global_step": 128868, "epoch": 3068} {"train_loss": -6.4906005859375, "global_step": 128869, "epoch": 3068} {"train_loss": -6.457005500793457, "global_step": 128870, "epoch": 3068} {"train_loss": -6.530384063720703, "global_step": 128871, "epoch": 3068} {"train_loss": -6.59688663482666, "global_step": 128872, "epoch": 3068} {"train_loss": -6.605064392089844, "global_step": 128873, "epoch": 3068} {"train_loss": -6.565067768096924, "global_step": 128874, "epoch": 3068} {"train_loss": -6.585578441619873, "global_step": 128875, "epoch": 3068} {"train_loss": -6.449419975280762, "global_step": 128876, "epoch": 3068} {"train_loss": -6.699459552764893, "global_step": 128877, "epoch": 3068} {"train_loss": -6.636773586273193, "global_step": 128878, "epoch": 3068} {"train_loss": -6.539798259735107, "global_step": 128879, "epoch": 3068} {"train_loss": -6.489283561706543, "global_step": 128880, "epoch": 3068} {"train_loss": -6.483440399169922, "global_step": 128881, "epoch": 3068} {"train_loss": -6.390331268310547, "global_step": 128882, "epoch": 3068} {"train_loss": -6.646239280700684, "global_step": 128883, "epoch": 3068} {"train_loss": -6.454595565795898, "global_step": 128884, "epoch": 3068} {"train_loss": -6.640557765960693, "global_step": 128885, "epoch": 3068} {"train_loss": -6.620197296142578, "global_step": 128886, "epoch": 3068} {"train_loss": -6.490616798400879, "global_step": 128887, "epoch": 3068} {"train_loss": -6.668317794799805, "global_step": 128888, "epoch": 3068} {"train_loss": -6.589649200439453, "global_step": 128889, "epoch": 3068} {"train_loss": -6.530519008636475, "global_step": 128890, "epoch": 3068} {"train_loss": -6.61494255065918, "global_step": 128891, "epoch": 3068} {"train_loss": -6.613328456878662, "global_step": 128892, "epoch": 3068} {"train_loss": -6.722105503082275, "global_step": 128893, "epoch": 3068} {"train_loss": -6.619097709655762, "global_step": 128894, "epoch": 3068} {"train_loss": -6.613605499267578, "global_step": 128895, "epoch": 3068} {"train_loss": -6.604990005493164, "global_step": 128896, "epoch": 3068} {"train_loss": -6.599395468121483, "global_step": 128897, "epoch": 3068, "val_loss": 77519.4453125} {"train_loss": -6.60329532623291, "global_step": 128898, "epoch": 3069} {"train_loss": -6.613390922546387, "global_step": 128899, "epoch": 3069} {"train_loss": -6.644831657409668, "global_step": 128900, "epoch": 3069} {"train_loss": -6.681387901306152, "global_step": 128901, "epoch": 3069} {"train_loss": -6.55965518951416, "global_step": 128902, "epoch": 3069} {"train_loss": -6.582945823669434, "global_step": 128903, "epoch": 3069} {"train_loss": -6.623661041259766, "global_step": 128904, "epoch": 3069} {"train_loss": -6.502192497253418, "global_step": 128905, "epoch": 3069} {"train_loss": -6.580930233001709, "global_step": 128906, "epoch": 3069} {"train_loss": -6.692351341247559, "global_step": 128907, "epoch": 3069} {"train_loss": -6.730623722076416, "global_step": 128908, "epoch": 3069} {"train_loss": -6.662261962890625, "global_step": 128909, "epoch": 3069} {"train_loss": -6.631870269775391, "global_step": 128910, "epoch": 3069} {"train_loss": -6.5973100662231445, "global_step": 128911, "epoch": 3069} {"train_loss": -6.719522476196289, "global_step": 128912, "epoch": 3069} {"train_loss": -6.440008640289307, "global_step": 128913, "epoch": 3069} {"train_loss": -6.730362892150879, "global_step": 128914, "epoch": 3069} {"train_loss": -6.587508201599121, "global_step": 128915, "epoch": 3069} {"train_loss": -6.608997821807861, "global_step": 128916, "epoch": 3069} {"train_loss": -6.7164812088012695, "global_step": 128917, "epoch": 3069} {"train_loss": -6.512709617614746, "global_step": 128918, "epoch": 3069} {"train_loss": -6.672465801239014, "global_step": 128919, "epoch": 3069} {"train_loss": -6.6598591804504395, "global_step": 128920, "epoch": 3069} {"train_loss": -6.644653797149658, "global_step": 128921, "epoch": 3069} {"train_loss": -6.639556407928467, "global_step": 128922, "epoch": 3069} {"train_loss": -6.730166912078857, "global_step": 128923, "epoch": 3069} {"train_loss": -6.706611633300781, "global_step": 128924, "epoch": 3069} {"train_loss": -6.691675186157227, "global_step": 128925, "epoch": 3069} {"train_loss": -6.791653633117676, "global_step": 128926, "epoch": 3069} {"train_loss": -6.832985877990723, "global_step": 128927, "epoch": 3069} {"train_loss": -6.666245937347412, "global_step": 128928, "epoch": 3069} {"train_loss": -6.599201202392578, "global_step": 128929, "epoch": 3069} {"train_loss": -6.632409572601318, "global_step": 128930, "epoch": 3069} {"train_loss": -6.770758628845215, "global_step": 128931, "epoch": 3069} {"train_loss": -6.684922695159912, "global_step": 128932, "epoch": 3069} {"train_loss": -6.73161506652832, "global_step": 128933, "epoch": 3069} {"train_loss": -6.688869476318359, "global_step": 128934, "epoch": 3069} {"train_loss": -6.711379051208496, "global_step": 128935, "epoch": 3069} {"train_loss": -6.713953018188477, "global_step": 128936, "epoch": 3069} {"train_loss": -6.7894768714904785, "global_step": 128937, "epoch": 3069} {"train_loss": -6.508823394775391, "global_step": 128938, "epoch": 3069} {"train_loss": -6.65748685882205, "global_step": 128939, "epoch": 3069, "val_loss": 77289.0546875} {"train_loss": -6.739943027496338, "global_step": 128940, "epoch": 3070} {"train_loss": -6.732926368713379, "global_step": 128941, "epoch": 3070} {"train_loss": -6.690218448638916, "global_step": 128942, "epoch": 3070} {"train_loss": -6.620779991149902, "global_step": 128943, "epoch": 3070} {"train_loss": -6.6682586669921875, "global_step": 128944, "epoch": 3070} {"train_loss": -6.623502731323242, "global_step": 128945, "epoch": 3070} {"train_loss": -6.738199234008789, "global_step": 128946, "epoch": 3070} {"train_loss": -6.760312080383301, "global_step": 128947, "epoch": 3070} {"train_loss": -6.574167728424072, "global_step": 128948, "epoch": 3070} {"train_loss": -6.66012716293335, "global_step": 128949, "epoch": 3070} {"train_loss": -6.572150230407715, "global_step": 128950, "epoch": 3070} {"train_loss": -6.606993675231934, "global_step": 128951, "epoch": 3070} {"train_loss": -6.657186985015869, "global_step": 128952, "epoch": 3070} {"train_loss": -6.6579179763793945, "global_step": 128953, "epoch": 3070} {"train_loss": -6.607583999633789, "global_step": 128954, "epoch": 3070} {"train_loss": -6.788524627685547, "global_step": 128955, "epoch": 3070} {"train_loss": -6.584555625915527, "global_step": 128956, "epoch": 3070} {"train_loss": -6.665879249572754, "global_step": 128957, "epoch": 3070} {"train_loss": -6.668479919433594, "global_step": 128958, "epoch": 3070} {"train_loss": -6.677203178405762, "global_step": 128959, "epoch": 3070} {"train_loss": -6.601346969604492, "global_step": 128960, "epoch": 3070} {"train_loss": -6.687823295593262, "global_step": 128961, "epoch": 3070} {"train_loss": -6.558976173400879, "global_step": 128962, "epoch": 3070} {"train_loss": -6.656946182250977, "global_step": 128963, "epoch": 3070} {"train_loss": -6.684666156768799, "global_step": 128964, "epoch": 3070} {"train_loss": -6.652071952819824, "global_step": 128965, "epoch": 3070} {"train_loss": -6.68541145324707, "global_step": 128966, "epoch": 3070} {"train_loss": -6.620603561401367, "global_step": 128967, "epoch": 3070} {"train_loss": -6.648531913757324, "global_step": 128968, "epoch": 3070} {"train_loss": -6.643172264099121, "global_step": 128969, "epoch": 3070} {"train_loss": -6.721304416656494, "global_step": 128970, "epoch": 3070} {"train_loss": -6.6551008224487305, "global_step": 128971, "epoch": 3070} {"train_loss": -6.690034866333008, "global_step": 128972, "epoch": 3070} {"train_loss": -6.562777519226074, "global_step": 128973, "epoch": 3070} {"train_loss": -6.642898082733154, "global_step": 128974, "epoch": 3070} {"train_loss": -6.722952842712402, "global_step": 128975, "epoch": 3070} {"train_loss": -6.761765480041504, "global_step": 128976, "epoch": 3070} {"train_loss": -6.599676132202148, "global_step": 128977, "epoch": 3070} {"train_loss": -6.723113059997559, "global_step": 128978, "epoch": 3070} {"train_loss": -6.670071601867676, "global_step": 128979, "epoch": 3070} {"train_loss": -6.638980388641357, "global_step": 128980, "epoch": 3070} {"train_loss": -6.662918454124814, "global_step": 128981, "epoch": 3070, "val_loss": 77629.6953125} {"train_loss": -6.689198017120361, "global_step": 128982, "epoch": 3071} {"train_loss": -6.727739334106445, "global_step": 128983, "epoch": 3071} {"train_loss": -6.638391971588135, "global_step": 128984, "epoch": 3071} {"train_loss": -6.598676681518555, "global_step": 128985, "epoch": 3071} {"train_loss": -6.650606632232666, "global_step": 128986, "epoch": 3071} {"train_loss": -6.630133152008057, "global_step": 128987, "epoch": 3071} {"train_loss": -6.604782581329346, "global_step": 128988, "epoch": 3071} {"train_loss": -6.72366189956665, "global_step": 128989, "epoch": 3071} {"train_loss": -6.691659927368164, "global_step": 128990, "epoch": 3071} {"train_loss": -6.669516086578369, "global_step": 128991, "epoch": 3071} {"train_loss": -6.673428535461426, "global_step": 128992, "epoch": 3071} {"train_loss": -6.653352737426758, "global_step": 128993, "epoch": 3071} {"train_loss": -6.495582580566406, "global_step": 128994, "epoch": 3071} {"train_loss": -6.5608110427856445, "global_step": 128995, "epoch": 3071} {"train_loss": -6.6903300285339355, "global_step": 128996, "epoch": 3071} {"train_loss": -6.6587724685668945, "global_step": 128997, "epoch": 3071} {"train_loss": -6.440558433532715, "global_step": 128998, "epoch": 3071} {"train_loss": -6.5580596923828125, "global_step": 128999, "epoch": 3071} {"train_loss": -6.704441070556641, "global_step": 129000, "epoch": 3071} {"train_loss": -6.48044490814209, "global_step": 129001, "epoch": 3071} {"train_loss": -6.634428977966309, "global_step": 129002, "epoch": 3071} {"train_loss": -6.552539825439453, "global_step": 129003, "epoch": 3071} {"train_loss": -6.715064525604248, "global_step": 129004, "epoch": 3071} {"train_loss": -6.567270278930664, "global_step": 129005, "epoch": 3071} {"train_loss": -6.55158805847168, "global_step": 129006, "epoch": 3071} {"train_loss": -6.579081058502197, "global_step": 129007, "epoch": 3071} {"train_loss": -6.631542682647705, "global_step": 129008, "epoch": 3071} {"train_loss": -6.783882141113281, "global_step": 129009, "epoch": 3071} {"train_loss": -6.506237983703613, "global_step": 129010, "epoch": 3071} {"train_loss": -6.781504154205322, "global_step": 129011, "epoch": 3071} {"train_loss": -6.617767810821533, "global_step": 129012, "epoch": 3071} {"train_loss": -6.651465892791748, "global_step": 129013, "epoch": 3071} {"train_loss": -6.730509281158447, "global_step": 129014, "epoch": 3071} {"train_loss": -6.587573528289795, "global_step": 129015, "epoch": 3071} {"train_loss": -6.640183448791504, "global_step": 129016, "epoch": 3071} {"train_loss": -6.608480930328369, "global_step": 129017, "epoch": 3071} {"train_loss": -6.620837211608887, "global_step": 129018, "epoch": 3071} {"train_loss": -6.591507911682129, "global_step": 129019, "epoch": 3071} {"train_loss": -6.52978515625, "global_step": 129020, "epoch": 3071} {"train_loss": -6.6662068367004395, "global_step": 129021, "epoch": 3071} {"train_loss": -6.542730331420898, "global_step": 129022, "epoch": 3071} {"train_loss": -6.627068655831473, "global_step": 129023, "epoch": 3071, "val_loss": 77437.765625} {"train_loss": -6.726287841796875, "global_step": 129024, "epoch": 3072} {"train_loss": -6.652299880981445, "global_step": 129025, "epoch": 3072} {"train_loss": -6.706916809082031, "global_step": 129026, "epoch": 3072} {"train_loss": -6.585219383239746, "global_step": 129027, "epoch": 3072} {"train_loss": -6.66325569152832, "global_step": 129028, "epoch": 3072} {"train_loss": -6.706287384033203, "global_step": 129029, "epoch": 3072} {"train_loss": -6.661322593688965, "global_step": 129030, "epoch": 3072} {"train_loss": -6.6238861083984375, "global_step": 129031, "epoch": 3072} {"train_loss": -6.710735321044922, "global_step": 129032, "epoch": 3072} {"train_loss": -6.701871395111084, "global_step": 129033, "epoch": 3072} {"train_loss": -6.6856794357299805, "global_step": 129034, "epoch": 3072} {"train_loss": -6.562711715698242, "global_step": 129035, "epoch": 3072} {"train_loss": -6.775713920593262, "global_step": 129036, "epoch": 3072} {"train_loss": -6.626128673553467, "global_step": 129037, "epoch": 3072} {"train_loss": -6.664546012878418, "global_step": 129038, "epoch": 3072} {"train_loss": -6.6297831535339355, "global_step": 129039, "epoch": 3072} {"train_loss": -6.777308940887451, "global_step": 129040, "epoch": 3072} {"train_loss": -6.715522766113281, "global_step": 129041, "epoch": 3072} {"train_loss": -6.665496826171875, "global_step": 129042, "epoch": 3072} {"train_loss": -6.640275955200195, "global_step": 129043, "epoch": 3072} {"train_loss": -6.603084564208984, "global_step": 129044, "epoch": 3072} {"train_loss": -6.61074161529541, "global_step": 129045, "epoch": 3072} {"train_loss": -6.669439315795898, "global_step": 129046, "epoch": 3072} {"train_loss": -6.676276206970215, "global_step": 129047, "epoch": 3072} {"train_loss": -6.6477532386779785, "global_step": 129048, "epoch": 3072} {"train_loss": -6.713844299316406, "global_step": 129049, "epoch": 3072} {"train_loss": -6.818873405456543, "global_step": 129050, "epoch": 3072} {"train_loss": -6.805870056152344, "global_step": 129051, "epoch": 3072} {"train_loss": -6.625688552856445, "global_step": 129052, "epoch": 3072} {"train_loss": -6.62351655960083, "global_step": 129053, "epoch": 3072} {"train_loss": -6.68541145324707, "global_step": 129054, "epoch": 3072} {"train_loss": -6.623056411743164, "global_step": 129055, "epoch": 3072} {"train_loss": -6.606863975524902, "global_step": 129056, "epoch": 3072} {"train_loss": -6.702980995178223, "global_step": 129057, "epoch": 3072} {"train_loss": -6.607922554016113, "global_step": 129058, "epoch": 3072} {"train_loss": -6.68060302734375, "global_step": 129059, "epoch": 3072} {"train_loss": -6.771421432495117, "global_step": 129060, "epoch": 3072} {"train_loss": -6.71214485168457, "global_step": 129061, "epoch": 3072} {"train_loss": -6.672473907470703, "global_step": 129062, "epoch": 3072} {"train_loss": -6.5901899337768555, "global_step": 129063, "epoch": 3072} {"train_loss": -6.730499267578125, "global_step": 129064, "epoch": 3072} {"train_loss": -6.675612540472121, "global_step": 129065, "epoch": 3072, "val_loss": 77422.4609375} {"train_loss": -6.638125896453857, "global_step": 129066, "epoch": 3073} {"train_loss": -6.611382484436035, "global_step": 129067, "epoch": 3073} {"train_loss": -6.522216796875, "global_step": 129068, "epoch": 3073} {"train_loss": -6.571084976196289, "global_step": 129069, "epoch": 3073} {"train_loss": -6.6870245933532715, "global_step": 129070, "epoch": 3073} {"train_loss": -6.640958309173584, "global_step": 129071, "epoch": 3073} {"train_loss": -6.554595947265625, "global_step": 129072, "epoch": 3073} {"train_loss": -6.667938232421875, "global_step": 129073, "epoch": 3073} {"train_loss": -6.613630294799805, "global_step": 129074, "epoch": 3073} {"train_loss": -6.585396766662598, "global_step": 129075, "epoch": 3073} {"train_loss": -6.613621711730957, "global_step": 129076, "epoch": 3073} {"train_loss": -6.636782169342041, "global_step": 129077, "epoch": 3073} {"train_loss": -6.558359146118164, "global_step": 129078, "epoch": 3073} {"train_loss": -6.801575660705566, "global_step": 129079, "epoch": 3073} {"train_loss": -6.739445209503174, "global_step": 129080, "epoch": 3073} {"train_loss": -6.5979814529418945, "global_step": 129081, "epoch": 3073} {"train_loss": -6.62298583984375, "global_step": 129082, "epoch": 3073} {"train_loss": -6.727631092071533, "global_step": 129083, "epoch": 3073} {"train_loss": -6.637245178222656, "global_step": 129084, "epoch": 3073} {"train_loss": -6.601863861083984, "global_step": 129085, "epoch": 3073} {"train_loss": -6.573763847351074, "global_step": 129086, "epoch": 3073} {"train_loss": -6.710467338562012, "global_step": 129087, "epoch": 3073} {"train_loss": -6.7156171798706055, "global_step": 129088, "epoch": 3073} {"train_loss": -6.716874122619629, "global_step": 129089, "epoch": 3073} {"train_loss": -6.62412166595459, "global_step": 129090, "epoch": 3073} {"train_loss": -6.680367946624756, "global_step": 129091, "epoch": 3073} {"train_loss": -6.691013813018799, "global_step": 129092, "epoch": 3073} {"train_loss": -6.7491936683654785, "global_step": 129093, "epoch": 3073} {"train_loss": -6.7863264083862305, "global_step": 129094, "epoch": 3073} {"train_loss": -6.668858051300049, "global_step": 129095, "epoch": 3073} {"train_loss": -6.8599853515625, "global_step": 129096, "epoch": 3073} {"train_loss": -6.57717227935791, "global_step": 129097, "epoch": 3073} {"train_loss": -6.758481979370117, "global_step": 129098, "epoch": 3073} {"train_loss": -6.668263912200928, "global_step": 129099, "epoch": 3073} {"train_loss": -6.7830119132995605, "global_step": 129100, "epoch": 3073} {"train_loss": -6.7069091796875, "global_step": 129101, "epoch": 3073} {"train_loss": -6.689844131469727, "global_step": 129102, "epoch": 3073} {"train_loss": -6.66765832901001, "global_step": 129103, "epoch": 3073} {"train_loss": -6.87733793258667, "global_step": 129104, "epoch": 3073} {"train_loss": -6.725661754608154, "global_step": 129105, "epoch": 3073} {"train_loss": -6.756399631500244, "global_step": 129106, "epoch": 3073} {"train_loss": -6.67736123857044, "global_step": 129107, "epoch": 3073, "val_loss": 77238.28125} {"train_loss": -6.7910871505737305, "global_step": 129108, "epoch": 3074} {"train_loss": -6.74038553237915, "global_step": 129109, "epoch": 3074} {"train_loss": -6.750192642211914, "global_step": 129110, "epoch": 3074} {"train_loss": -6.812389850616455, "global_step": 129111, "epoch": 3074} {"train_loss": -6.74733829498291, "global_step": 129112, "epoch": 3074} {"train_loss": -6.696070671081543, "global_step": 129113, "epoch": 3074} {"train_loss": -6.69236421585083, "global_step": 129114, "epoch": 3074} {"train_loss": -6.603864669799805, "global_step": 129115, "epoch": 3074} {"train_loss": -6.727165222167969, "global_step": 129116, "epoch": 3074} {"train_loss": -6.629812240600586, "global_step": 129117, "epoch": 3074} {"train_loss": -6.726757526397705, "global_step": 129118, "epoch": 3074} {"train_loss": -6.676218032836914, "global_step": 129119, "epoch": 3074} {"train_loss": -6.684220790863037, "global_step": 129120, "epoch": 3074} {"train_loss": -6.716892242431641, "global_step": 129121, "epoch": 3074} {"train_loss": -6.693508625030518, "global_step": 129122, "epoch": 3074} {"train_loss": -6.689375400543213, "global_step": 129123, "epoch": 3074} {"train_loss": -6.384862899780273, "global_step": 129124, "epoch": 3074} {"train_loss": -6.51295804977417, "global_step": 129125, "epoch": 3074} {"train_loss": -6.698586940765381, "global_step": 129126, "epoch": 3074} {"train_loss": -6.568726539611816, "global_step": 129127, "epoch": 3074} {"train_loss": -6.552929878234863, "global_step": 129128, "epoch": 3074} {"train_loss": -6.535586833953857, "global_step": 129129, "epoch": 3074} {"train_loss": -6.64155912399292, "global_step": 129130, "epoch": 3074} {"train_loss": -6.6715006828308105, "global_step": 129131, "epoch": 3074} {"train_loss": -6.750679016113281, "global_step": 129132, "epoch": 3074} {"train_loss": -6.638105392456055, "global_step": 129133, "epoch": 3074} {"train_loss": -6.701354026794434, "global_step": 129134, "epoch": 3074} {"train_loss": -6.670385360717773, "global_step": 129135, "epoch": 3074} {"train_loss": -6.646162033081055, "global_step": 129136, "epoch": 3074} {"train_loss": -6.58230447769165, "global_step": 129137, "epoch": 3074} {"train_loss": -6.593621730804443, "global_step": 129138, "epoch": 3074} {"train_loss": -6.640285491943359, "global_step": 129139, "epoch": 3074} {"train_loss": -6.650348663330078, "global_step": 129140, "epoch": 3074} {"train_loss": -6.57693338394165, "global_step": 129141, "epoch": 3074} {"train_loss": -6.598392486572266, "global_step": 129142, "epoch": 3074} {"train_loss": -6.6688055992126465, "global_step": 129143, "epoch": 3074} {"train_loss": -6.6755194664001465, "global_step": 129144, "epoch": 3074} {"train_loss": -6.537219047546387, "global_step": 129145, "epoch": 3074} {"train_loss": -6.604887962341309, "global_step": 129146, "epoch": 3074} {"train_loss": -6.601513862609863, "global_step": 129147, "epoch": 3074} {"train_loss": -6.649403095245361, "global_step": 129148, "epoch": 3074} {"train_loss": -6.652566160474505, "global_step": 129149, "epoch": 3074, "val_loss": 77423.7421875} {"train_loss": -6.645998001098633, "global_step": 129150, "epoch": 3075} {"train_loss": -6.701642036437988, "global_step": 129151, "epoch": 3075} {"train_loss": -6.666760444641113, "global_step": 129152, "epoch": 3075} {"train_loss": -6.605774402618408, "global_step": 129153, "epoch": 3075} {"train_loss": -6.614004135131836, "global_step": 129154, "epoch": 3075} {"train_loss": -6.770684242248535, "global_step": 129155, "epoch": 3075} {"train_loss": -6.713605880737305, "global_step": 129156, "epoch": 3075} {"train_loss": -6.7079010009765625, "global_step": 129157, "epoch": 3075} {"train_loss": -6.765430450439453, "global_step": 129158, "epoch": 3075} {"train_loss": -6.715634346008301, "global_step": 129159, "epoch": 3075} {"train_loss": -6.7657976150512695, "global_step": 129160, "epoch": 3075} {"train_loss": -6.629166126251221, "global_step": 129161, "epoch": 3075} {"train_loss": -6.704689979553223, "global_step": 129162, "epoch": 3075} {"train_loss": -6.758992671966553, "global_step": 129163, "epoch": 3075} {"train_loss": -6.639146327972412, "global_step": 129164, "epoch": 3075} {"train_loss": -6.637877941131592, "global_step": 129165, "epoch": 3075} {"train_loss": -6.7328081130981445, "global_step": 129166, "epoch": 3075} {"train_loss": -6.619582176208496, "global_step": 129167, "epoch": 3075} {"train_loss": -6.773447513580322, "global_step": 129168, "epoch": 3075} {"train_loss": -6.618988037109375, "global_step": 129169, "epoch": 3075} {"train_loss": -6.772861957550049, "global_step": 129170, "epoch": 3075} {"train_loss": -6.661895751953125, "global_step": 129171, "epoch": 3075} {"train_loss": -6.7243194580078125, "global_step": 129172, "epoch": 3075} {"train_loss": -6.602193832397461, "global_step": 129173, "epoch": 3075} {"train_loss": -6.801486015319824, "global_step": 129174, "epoch": 3075} {"train_loss": -6.720297813415527, "global_step": 129175, "epoch": 3075} {"train_loss": -6.664170265197754, "global_step": 129176, "epoch": 3075} {"train_loss": -6.8005242347717285, "global_step": 129177, "epoch": 3075} {"train_loss": -6.633880615234375, "global_step": 129178, "epoch": 3075} {"train_loss": -6.634340286254883, "global_step": 129179, "epoch": 3075} {"train_loss": -6.699808597564697, "global_step": 129180, "epoch": 3075} {"train_loss": -6.772622108459473, "global_step": 129181, "epoch": 3075} {"train_loss": -6.530501365661621, "global_step": 129182, "epoch": 3075} {"train_loss": -6.7370781898498535, "global_step": 129183, "epoch": 3075} {"train_loss": -6.7457990646362305, "global_step": 129184, "epoch": 3075} {"train_loss": -6.740160942077637, "global_step": 129185, "epoch": 3075} {"train_loss": -6.603719711303711, "global_step": 129186, "epoch": 3075} {"train_loss": -6.69724178314209, "global_step": 129187, "epoch": 3075} {"train_loss": -6.5987653732299805, "global_step": 129188, "epoch": 3075} {"train_loss": -6.666024208068848, "global_step": 129189, "epoch": 3075} {"train_loss": -6.656833648681641, "global_step": 129190, "epoch": 3075} {"train_loss": -6.689123494284494, "global_step": 129191, "epoch": 3075, "val_loss": 77509.984375} {"train_loss": -6.7954511642456055, "global_step": 129192, "epoch": 3076} {"train_loss": -6.714440822601318, "global_step": 129193, "epoch": 3076} {"train_loss": -6.78892183303833, "global_step": 129194, "epoch": 3076} {"train_loss": -6.597830772399902, "global_step": 129195, "epoch": 3076} {"train_loss": -6.789003372192383, "global_step": 129196, "epoch": 3076} {"train_loss": -6.7487688064575195, "global_step": 129197, "epoch": 3076} {"train_loss": -6.628600120544434, "global_step": 129198, "epoch": 3076} {"train_loss": -6.634294033050537, "global_step": 129199, "epoch": 3076} {"train_loss": -6.714444160461426, "global_step": 129200, "epoch": 3076} {"train_loss": -6.61435604095459, "global_step": 129201, "epoch": 3076} {"train_loss": -6.584205627441406, "global_step": 129202, "epoch": 3076} {"train_loss": -6.6862592697143555, "global_step": 129203, "epoch": 3076} {"train_loss": -6.738982200622559, "global_step": 129204, "epoch": 3076} {"train_loss": -6.730685234069824, "global_step": 129205, "epoch": 3076} {"train_loss": -6.77756404876709, "global_step": 129206, "epoch": 3076} {"train_loss": -6.638399600982666, "global_step": 129207, "epoch": 3076} {"train_loss": -6.705636501312256, "global_step": 129208, "epoch": 3076} {"train_loss": -6.673212051391602, "global_step": 129209, "epoch": 3076} {"train_loss": -6.680478096008301, "global_step": 129210, "epoch": 3076} {"train_loss": -6.760030269622803, "global_step": 129211, "epoch": 3076} {"train_loss": -6.689209938049316, "global_step": 129212, "epoch": 3076} {"train_loss": -6.667899131774902, "global_step": 129213, "epoch": 3076} {"train_loss": -6.770033836364746, "global_step": 129214, "epoch": 3076} {"train_loss": -6.619868278503418, "global_step": 129215, "epoch": 3076} {"train_loss": -6.669219970703125, "global_step": 129216, "epoch": 3076} {"train_loss": -6.647227764129639, "global_step": 129217, "epoch": 3076} {"train_loss": -6.720023155212402, "global_step": 129218, "epoch": 3076} {"train_loss": -6.739768981933594, "global_step": 129219, "epoch": 3076} {"train_loss": -6.643677234649658, "global_step": 129220, "epoch": 3076} {"train_loss": -6.689945220947266, "global_step": 129221, "epoch": 3076} {"train_loss": -6.6062164306640625, "global_step": 129222, "epoch": 3076} {"train_loss": -6.620757579803467, "global_step": 129223, "epoch": 3076} {"train_loss": -6.49677848815918, "global_step": 129224, "epoch": 3076} {"train_loss": -6.693525791168213, "global_step": 129225, "epoch": 3076} {"train_loss": -6.565832614898682, "global_step": 129226, "epoch": 3076} {"train_loss": -6.570122718811035, "global_step": 129227, "epoch": 3076} {"train_loss": -6.725017547607422, "global_step": 129228, "epoch": 3076} {"train_loss": -6.590709209442139, "global_step": 129229, "epoch": 3076} {"train_loss": -6.561959266662598, "global_step": 129230, "epoch": 3076} {"train_loss": -6.68145751953125, "global_step": 129231, "epoch": 3076} {"train_loss": -6.6173577308654785, "global_step": 129232, "epoch": 3076} {"train_loss": -6.6717080388750345, "global_step": 129233, "epoch": 3076, "val_loss": 77568.03125} {"train_loss": -6.545718193054199, "global_step": 129234, "epoch": 3077} {"train_loss": -6.729482650756836, "global_step": 129235, "epoch": 3077} {"train_loss": -6.5931549072265625, "global_step": 129236, "epoch": 3077} {"train_loss": -6.706742286682129, "global_step": 129237, "epoch": 3077} {"train_loss": -6.553412437438965, "global_step": 129238, "epoch": 3077} {"train_loss": -6.613499641418457, "global_step": 129239, "epoch": 3077} {"train_loss": -6.555832862854004, "global_step": 129240, "epoch": 3077} {"train_loss": -6.5976338386535645, "global_step": 129241, "epoch": 3077} {"train_loss": -6.570857048034668, "global_step": 129242, "epoch": 3077} {"train_loss": -6.62680196762085, "global_step": 129243, "epoch": 3077} {"train_loss": -6.662154674530029, "global_step": 129244, "epoch": 3077} {"train_loss": -6.562257766723633, "global_step": 129245, "epoch": 3077} {"train_loss": -6.537365913391113, "global_step": 129246, "epoch": 3077} {"train_loss": -6.596938610076904, "global_step": 129247, "epoch": 3077} {"train_loss": -6.645757675170898, "global_step": 129248, "epoch": 3077} {"train_loss": -6.534660339355469, "global_step": 129249, "epoch": 3077} {"train_loss": -6.781275749206543, "global_step": 129250, "epoch": 3077} {"train_loss": -6.628185749053955, "global_step": 129251, "epoch": 3077} {"train_loss": -6.61132287979126, "global_step": 129252, "epoch": 3077} {"train_loss": -6.699844837188721, "global_step": 129253, "epoch": 3077} {"train_loss": -6.580122470855713, "global_step": 129254, "epoch": 3077} {"train_loss": -6.577945709228516, "global_step": 129255, "epoch": 3077} {"train_loss": -6.644315242767334, "global_step": 129256, "epoch": 3077} {"train_loss": -6.526757717132568, "global_step": 129257, "epoch": 3077} {"train_loss": -6.662250995635986, "global_step": 129258, "epoch": 3077} {"train_loss": -6.61706018447876, "global_step": 129259, "epoch": 3077} {"train_loss": -6.635061740875244, "global_step": 129260, "epoch": 3077} {"train_loss": -6.669943809509277, "global_step": 129261, "epoch": 3077} {"train_loss": -6.732115745544434, "global_step": 129262, "epoch": 3077} {"train_loss": -6.51521110534668, "global_step": 129263, "epoch": 3077} {"train_loss": -6.682088851928711, "global_step": 129264, "epoch": 3077} {"train_loss": -6.618679523468018, "global_step": 129265, "epoch": 3077} {"train_loss": -6.712166786193848, "global_step": 129266, "epoch": 3077} {"train_loss": -6.613628387451172, "global_step": 129267, "epoch": 3077} {"train_loss": -6.572633743286133, "global_step": 129268, "epoch": 3077} {"train_loss": -6.787578582763672, "global_step": 129269, "epoch": 3077} {"train_loss": -6.68816614151001, "global_step": 129270, "epoch": 3077} {"train_loss": -6.571353435516357, "global_step": 129271, "epoch": 3077} {"train_loss": -6.802085876464844, "global_step": 129272, "epoch": 3077} {"train_loss": -6.619609832763672, "global_step": 129273, "epoch": 3077} {"train_loss": -6.508598327636719, "global_step": 129274, "epoch": 3077} {"train_loss": -6.629148994173322, "global_step": 129275, "epoch": 3077, "val_loss": 77482.609375} {"train_loss": -6.764106273651123, "global_step": 129276, "epoch": 3078} {"train_loss": -6.783995628356934, "global_step": 129277, "epoch": 3078} {"train_loss": -6.6770501136779785, "global_step": 129278, "epoch": 3078} {"train_loss": -6.638156414031982, "global_step": 129279, "epoch": 3078} {"train_loss": -6.628534317016602, "global_step": 129280, "epoch": 3078} {"train_loss": -6.669754981994629, "global_step": 129281, "epoch": 3078} {"train_loss": -6.819128513336182, "global_step": 129282, "epoch": 3078} {"train_loss": -6.631412506103516, "global_step": 129283, "epoch": 3078} {"train_loss": -6.70341157913208, "global_step": 129284, "epoch": 3078} {"train_loss": -6.758329391479492, "global_step": 129285, "epoch": 3078} {"train_loss": -6.539390563964844, "global_step": 129286, "epoch": 3078} {"train_loss": -6.582650184631348, "global_step": 129287, "epoch": 3078} {"train_loss": -6.679468631744385, "global_step": 129288, "epoch": 3078} {"train_loss": -6.6478166580200195, "global_step": 129289, "epoch": 3078} {"train_loss": -6.635434627532959, "global_step": 129290, "epoch": 3078} {"train_loss": -6.633480072021484, "global_step": 129291, "epoch": 3078} {"train_loss": -6.563692092895508, "global_step": 129292, "epoch": 3078} {"train_loss": -6.572689056396484, "global_step": 129293, "epoch": 3078} {"train_loss": -6.5084381103515625, "global_step": 129294, "epoch": 3078} {"train_loss": -6.591957092285156, "global_step": 129295, "epoch": 3078} {"train_loss": -6.782127380371094, "global_step": 129296, "epoch": 3078} {"train_loss": -6.5429534912109375, "global_step": 129297, "epoch": 3078} {"train_loss": -6.618668079376221, "global_step": 129298, "epoch": 3078} {"train_loss": -6.566048622131348, "global_step": 129299, "epoch": 3078} {"train_loss": -6.637179851531982, "global_step": 129300, "epoch": 3078} {"train_loss": -6.631704330444336, "global_step": 129301, "epoch": 3078} {"train_loss": -6.5528950691223145, "global_step": 129302, "epoch": 3078} {"train_loss": -6.629047870635986, "global_step": 129303, "epoch": 3078} {"train_loss": -6.486189842224121, "global_step": 129304, "epoch": 3078} {"train_loss": -6.4498467445373535, "global_step": 129305, "epoch": 3078} {"train_loss": -6.584235191345215, "global_step": 129306, "epoch": 3078} {"train_loss": -6.566364288330078, "global_step": 129307, "epoch": 3078} {"train_loss": -6.692333698272705, "global_step": 129308, "epoch": 3078} {"train_loss": -6.55196475982666, "global_step": 129309, "epoch": 3078} {"train_loss": -6.586224555969238, "global_step": 129310, "epoch": 3078} {"train_loss": -6.567696571350098, "global_step": 129311, "epoch": 3078} {"train_loss": -6.655703544616699, "global_step": 129312, "epoch": 3078} {"train_loss": -6.604886531829834, "global_step": 129313, "epoch": 3078} {"train_loss": -6.520394325256348, "global_step": 129314, "epoch": 3078} {"train_loss": -6.7301926612854, "global_step": 129315, "epoch": 3078} {"train_loss": -6.6406474113464355, "global_step": 129316, "epoch": 3078} {"train_loss": -6.625096400578816, "global_step": 129317, "epoch": 3078, "val_loss": 77397.7890625} {"train_loss": -6.764448642730713, "global_step": 129318, "epoch": 3079} {"train_loss": -6.651948928833008, "global_step": 129319, "epoch": 3079} {"train_loss": -6.758370399475098, "global_step": 129320, "epoch": 3079} {"train_loss": -6.718145370483398, "global_step": 129321, "epoch": 3079} {"train_loss": -6.742132186889648, "global_step": 129322, "epoch": 3079} {"train_loss": -6.762455463409424, "global_step": 129323, "epoch": 3079} {"train_loss": -6.7487077713012695, "global_step": 129324, "epoch": 3079} {"train_loss": -6.640985488891602, "global_step": 129325, "epoch": 3079} {"train_loss": -6.7068281173706055, "global_step": 129326, "epoch": 3079} {"train_loss": -6.710996627807617, "global_step": 129327, "epoch": 3079} {"train_loss": -6.616661548614502, "global_step": 129328, "epoch": 3079} {"train_loss": -6.632295608520508, "global_step": 129329, "epoch": 3079} {"train_loss": -6.681987285614014, "global_step": 129330, "epoch": 3079} {"train_loss": -6.617203712463379, "global_step": 129331, "epoch": 3079} {"train_loss": -6.6839919090271, "global_step": 129332, "epoch": 3079} {"train_loss": -6.549063682556152, "global_step": 129333, "epoch": 3079} {"train_loss": -6.624876976013184, "global_step": 129334, "epoch": 3079} {"train_loss": -6.518930435180664, "global_step": 129335, "epoch": 3079} {"train_loss": -6.609742164611816, "global_step": 129336, "epoch": 3079} {"train_loss": -6.681307792663574, "global_step": 129337, "epoch": 3079} {"train_loss": -6.500423431396484, "global_step": 129338, "epoch": 3079} {"train_loss": -6.540645599365234, "global_step": 129339, "epoch": 3079} {"train_loss": -6.568734169006348, "global_step": 129340, "epoch": 3079} {"train_loss": -6.633123397827148, "global_step": 129341, "epoch": 3079} {"train_loss": -6.58463191986084, "global_step": 129342, "epoch": 3079} {"train_loss": -6.575470924377441, "global_step": 129343, "epoch": 3079} {"train_loss": -6.565829277038574, "global_step": 129344, "epoch": 3079} {"train_loss": -6.702765941619873, "global_step": 129345, "epoch": 3079} {"train_loss": -6.511767387390137, "global_step": 129346, "epoch": 3079} {"train_loss": -6.5450239181518555, "global_step": 129347, "epoch": 3079} {"train_loss": -6.4512152671813965, "global_step": 129348, "epoch": 3079} {"train_loss": -6.662492752075195, "global_step": 129349, "epoch": 3079} {"train_loss": -6.519887924194336, "global_step": 129350, "epoch": 3079} {"train_loss": -6.542829513549805, "global_step": 129351, "epoch": 3079} {"train_loss": -6.653524398803711, "global_step": 129352, "epoch": 3079} {"train_loss": -6.663577079772949, "global_step": 129353, "epoch": 3079} {"train_loss": -6.576861381530762, "global_step": 129354, "epoch": 3079} {"train_loss": -6.616639137268066, "global_step": 129355, "epoch": 3079} {"train_loss": -6.543004035949707, "global_step": 129356, "epoch": 3079} {"train_loss": -6.606011390686035, "global_step": 129357, "epoch": 3079} {"train_loss": -6.580358982086182, "global_step": 129358, "epoch": 3079} {"train_loss": -6.625351894469488, "global_step": 129359, "epoch": 3079, "val_loss": 77596.1640625} {"train_loss": -6.691211223602295, "global_step": 129360, "epoch": 3080} {"train_loss": -6.734742641448975, "global_step": 129361, "epoch": 3080} {"train_loss": -6.694982051849365, "global_step": 129362, "epoch": 3080} {"train_loss": -6.566245079040527, "global_step": 129363, "epoch": 3080} {"train_loss": -6.634819507598877, "global_step": 129364, "epoch": 3080} {"train_loss": -6.65628719329834, "global_step": 129365, "epoch": 3080} {"train_loss": -6.595906734466553, "global_step": 129366, "epoch": 3080} {"train_loss": -6.626058578491211, "global_step": 129367, "epoch": 3080} {"train_loss": -6.788617134094238, "global_step": 129368, "epoch": 3080} {"train_loss": -6.59489631652832, "global_step": 129369, "epoch": 3080} {"train_loss": -6.700231552124023, "global_step": 129370, "epoch": 3080} {"train_loss": -6.5885820388793945, "global_step": 129371, "epoch": 3080} {"train_loss": -6.661698341369629, "global_step": 129372, "epoch": 3080} {"train_loss": -6.623956203460693, "global_step": 129373, "epoch": 3080} {"train_loss": -6.628391265869141, "global_step": 129374, "epoch": 3080} {"train_loss": -6.699494361877441, "global_step": 129375, "epoch": 3080} {"train_loss": -6.5394134521484375, "global_step": 129376, "epoch": 3080} {"train_loss": -6.731483459472656, "global_step": 129377, "epoch": 3080} {"train_loss": -6.710749626159668, "global_step": 129378, "epoch": 3080} {"train_loss": -6.617762565612793, "global_step": 129379, "epoch": 3080} {"train_loss": -6.657136917114258, "global_step": 129380, "epoch": 3080} {"train_loss": -6.503612995147705, "global_step": 129381, "epoch": 3080} {"train_loss": -6.565089225769043, "global_step": 129382, "epoch": 3080} {"train_loss": -6.53609561920166, "global_step": 129383, "epoch": 3080} {"train_loss": -6.476873874664307, "global_step": 129384, "epoch": 3080} {"train_loss": -6.678069591522217, "global_step": 129385, "epoch": 3080} {"train_loss": -6.71872615814209, "global_step": 129386, "epoch": 3080} {"train_loss": -6.524171352386475, "global_step": 129387, "epoch": 3080} {"train_loss": -6.704952239990234, "global_step": 129388, "epoch": 3080} {"train_loss": -6.535874843597412, "global_step": 129389, "epoch": 3080} {"train_loss": -6.662334442138672, "global_step": 129390, "epoch": 3080} {"train_loss": -6.542852401733398, "global_step": 129391, "epoch": 3080} {"train_loss": -6.485012054443359, "global_step": 129392, "epoch": 3080} {"train_loss": -6.571414470672607, "global_step": 129393, "epoch": 3080} {"train_loss": -6.566144943237305, "global_step": 129394, "epoch": 3080} {"train_loss": -6.638453483581543, "global_step": 129395, "epoch": 3080} {"train_loss": -6.633957862854004, "global_step": 129396, "epoch": 3080} {"train_loss": -6.6369218826293945, "global_step": 129397, "epoch": 3080} {"train_loss": -6.729813098907471, "global_step": 129398, "epoch": 3080} {"train_loss": -6.678255558013916, "global_step": 129399, "epoch": 3080} {"train_loss": -6.674586772918701, "global_step": 129400, "epoch": 3080} {"train_loss": -6.628366651989165, "global_step": 129401, "epoch": 3080, "val_loss": 77571.6015625} {"train_loss": -6.6544647216796875, "global_step": 129402, "epoch": 3081} {"train_loss": -6.682570457458496, "global_step": 129403, "epoch": 3081} {"train_loss": -6.587017059326172, "global_step": 129404, "epoch": 3081} {"train_loss": -6.687008380889893, "global_step": 129405, "epoch": 3081} {"train_loss": -6.686713695526123, "global_step": 129406, "epoch": 3081} {"train_loss": -6.613881587982178, "global_step": 129407, "epoch": 3081} {"train_loss": -6.713513374328613, "global_step": 129408, "epoch": 3081} {"train_loss": -6.595327377319336, "global_step": 129409, "epoch": 3081} {"train_loss": -6.817788600921631, "global_step": 129410, "epoch": 3081} {"train_loss": -6.6212873458862305, "global_step": 129411, "epoch": 3081} {"train_loss": -6.70302677154541, "global_step": 129412, "epoch": 3081} {"train_loss": -6.682483673095703, "global_step": 129413, "epoch": 3081} {"train_loss": -6.47343635559082, "global_step": 129414, "epoch": 3081} {"train_loss": -6.546586990356445, "global_step": 129415, "epoch": 3081} {"train_loss": -6.573597431182861, "global_step": 129416, "epoch": 3081} {"train_loss": -6.6724958419799805, "global_step": 129417, "epoch": 3081} {"train_loss": -6.587279319763184, "global_step": 129418, "epoch": 3081} {"train_loss": -6.647392272949219, "global_step": 129419, "epoch": 3081} {"train_loss": -6.61275577545166, "global_step": 129420, "epoch": 3081} {"train_loss": -6.611645698547363, "global_step": 129421, "epoch": 3081} {"train_loss": -6.726335525512695, "global_step": 129422, "epoch": 3081} {"train_loss": -6.725510597229004, "global_step": 129423, "epoch": 3081} {"train_loss": -6.634000778198242, "global_step": 129424, "epoch": 3081} {"train_loss": -6.66012716293335, "global_step": 129425, "epoch": 3081} {"train_loss": -6.626904010772705, "global_step": 129426, "epoch": 3081} {"train_loss": -6.659101486206055, "global_step": 129427, "epoch": 3081} {"train_loss": -6.756861686706543, "global_step": 129428, "epoch": 3081} {"train_loss": -6.609680652618408, "global_step": 129429, "epoch": 3081} {"train_loss": -6.736571311950684, "global_step": 129430, "epoch": 3081} {"train_loss": -6.695418357849121, "global_step": 129431, "epoch": 3081} {"train_loss": -6.646145820617676, "global_step": 129432, "epoch": 3081} {"train_loss": -6.707437515258789, "global_step": 129433, "epoch": 3081} {"train_loss": -6.728786945343018, "global_step": 129434, "epoch": 3081} {"train_loss": -6.756630897521973, "global_step": 129435, "epoch": 3081} {"train_loss": -6.759930610656738, "global_step": 129436, "epoch": 3081} {"train_loss": -6.671741962432861, "global_step": 129437, "epoch": 3081} {"train_loss": -6.70144510269165, "global_step": 129438, "epoch": 3081} {"train_loss": -6.71407413482666, "global_step": 129439, "epoch": 3081} {"train_loss": -6.644867897033691, "global_step": 129440, "epoch": 3081} {"train_loss": -6.5981550216674805, "global_step": 129441, "epoch": 3081} {"train_loss": -6.636944770812988, "global_step": 129442, "epoch": 3081} {"train_loss": -6.664692844663348, "global_step": 129443, "epoch": 3081, "val_loss": 77497.8515625} {"train_loss": -6.7231645584106445, "global_step": 129444, "epoch": 3082} {"train_loss": -6.687025547027588, "global_step": 129445, "epoch": 3082} {"train_loss": -6.7760138511657715, "global_step": 129446, "epoch": 3082} {"train_loss": -6.76713752746582, "global_step": 129447, "epoch": 3082} {"train_loss": -6.7449846267700195, "global_step": 129448, "epoch": 3082} {"train_loss": -6.644248962402344, "global_step": 129449, "epoch": 3082} {"train_loss": -6.700182914733887, "global_step": 129450, "epoch": 3082} {"train_loss": -6.601268291473389, "global_step": 129451, "epoch": 3082} {"train_loss": -6.585611820220947, "global_step": 129452, "epoch": 3082} {"train_loss": -6.7714924812316895, "global_step": 129453, "epoch": 3082} {"train_loss": -6.606231212615967, "global_step": 129454, "epoch": 3082} {"train_loss": -6.678924083709717, "global_step": 129455, "epoch": 3082} {"train_loss": -6.662820339202881, "global_step": 129456, "epoch": 3082} {"train_loss": -6.593859672546387, "global_step": 129457, "epoch": 3082} {"train_loss": -6.714676856994629, "global_step": 129458, "epoch": 3082} {"train_loss": -6.720515251159668, "global_step": 129459, "epoch": 3082} {"train_loss": -6.640225887298584, "global_step": 129460, "epoch": 3082} {"train_loss": -6.774880409240723, "global_step": 129461, "epoch": 3082} {"train_loss": -6.633640766143799, "global_step": 129462, "epoch": 3082} {"train_loss": -6.681544303894043, "global_step": 129463, "epoch": 3082} {"train_loss": -6.642180919647217, "global_step": 129464, "epoch": 3082} {"train_loss": -6.7985687255859375, "global_step": 129465, "epoch": 3082} {"train_loss": -6.671043395996094, "global_step": 129466, "epoch": 3082} {"train_loss": -6.632828235626221, "global_step": 129467, "epoch": 3082} {"train_loss": -6.565432548522949, "global_step": 129468, "epoch": 3082} {"train_loss": -6.659548282623291, "global_step": 129469, "epoch": 3082} {"train_loss": -6.651158332824707, "global_step": 129470, "epoch": 3082} {"train_loss": -6.684004783630371, "global_step": 129471, "epoch": 3082} {"train_loss": -6.635854244232178, "global_step": 129472, "epoch": 3082} {"train_loss": -6.728694438934326, "global_step": 129473, "epoch": 3082} {"train_loss": -6.676601409912109, "global_step": 129474, "epoch": 3082} {"train_loss": -6.779315948486328, "global_step": 129475, "epoch": 3082} {"train_loss": -6.7729034423828125, "global_step": 129476, "epoch": 3082} {"train_loss": -6.733994483947754, "global_step": 129477, "epoch": 3082} {"train_loss": -6.752145290374756, "global_step": 129478, "epoch": 3082} {"train_loss": -6.772939205169678, "global_step": 129479, "epoch": 3082} {"train_loss": -6.802882194519043, "global_step": 129480, "epoch": 3082} {"train_loss": -6.768611431121826, "global_step": 129481, "epoch": 3082} {"train_loss": -6.675426959991455, "global_step": 129482, "epoch": 3082} {"train_loss": -6.6100263595581055, "global_step": 129483, "epoch": 3082} {"train_loss": -6.6136579513549805, "global_step": 129484, "epoch": 3082} {"train_loss": -6.689752510615757, "global_step": 129485, "epoch": 3082, "val_loss": 77312.71875} {"train_loss": -6.7046332359313965, "global_step": 129486, "epoch": 3083} {"train_loss": -6.738872528076172, "global_step": 129487, "epoch": 3083} {"train_loss": -6.69629430770874, "global_step": 129488, "epoch": 3083} {"train_loss": -6.597263336181641, "global_step": 129489, "epoch": 3083} {"train_loss": -6.707454681396484, "global_step": 129490, "epoch": 3083} {"train_loss": -6.688745975494385, "global_step": 129491, "epoch": 3083} {"train_loss": -6.582925796508789, "global_step": 129492, "epoch": 3083} {"train_loss": -6.60857629776001, "global_step": 129493, "epoch": 3083} {"train_loss": -6.715597629547119, "global_step": 129494, "epoch": 3083} {"train_loss": -6.599967002868652, "global_step": 129495, "epoch": 3083} {"train_loss": -6.576140403747559, "global_step": 129496, "epoch": 3083} {"train_loss": -6.5969953536987305, "global_step": 129497, "epoch": 3083} {"train_loss": -6.601789474487305, "global_step": 129498, "epoch": 3083} {"train_loss": -6.647214889526367, "global_step": 129499, "epoch": 3083} {"train_loss": -6.6600823402404785, "global_step": 129500, "epoch": 3083} {"train_loss": -6.591257572174072, "global_step": 129501, "epoch": 3083} {"train_loss": -6.686364650726318, "global_step": 129502, "epoch": 3083} {"train_loss": -6.6862077713012695, "global_step": 129503, "epoch": 3083} {"train_loss": -6.6501264572143555, "global_step": 129504, "epoch": 3083} {"train_loss": -6.7638373374938965, "global_step": 129505, "epoch": 3083} {"train_loss": -6.697859287261963, "global_step": 129506, "epoch": 3083} {"train_loss": -6.516845703125, "global_step": 129507, "epoch": 3083} {"train_loss": -6.591780662536621, "global_step": 129508, "epoch": 3083} {"train_loss": -6.670589923858643, "global_step": 129509, "epoch": 3083} {"train_loss": -6.720598220825195, "global_step": 129510, "epoch": 3083} {"train_loss": -6.686398506164551, "global_step": 129511, "epoch": 3083} {"train_loss": -6.662387847900391, "global_step": 129512, "epoch": 3083} {"train_loss": -6.630034446716309, "global_step": 129513, "epoch": 3083} {"train_loss": -6.545598983764648, "global_step": 129514, "epoch": 3083} {"train_loss": -6.671998023986816, "global_step": 129515, "epoch": 3083} {"train_loss": -6.653066635131836, "global_step": 129516, "epoch": 3083} {"train_loss": -6.471774101257324, "global_step": 129517, "epoch": 3083} {"train_loss": -6.727812767028809, "global_step": 129518, "epoch": 3083} {"train_loss": -6.652863502502441, "global_step": 129519, "epoch": 3083} {"train_loss": -6.7512288093566895, "global_step": 129520, "epoch": 3083} {"train_loss": -6.55429744720459, "global_step": 129521, "epoch": 3083} {"train_loss": -6.570181846618652, "global_step": 129522, "epoch": 3083} {"train_loss": -6.666755676269531, "global_step": 129523, "epoch": 3083} {"train_loss": -6.527470588684082, "global_step": 129524, "epoch": 3083} {"train_loss": -6.741664886474609, "global_step": 129525, "epoch": 3083} {"train_loss": -6.663946628570557, "global_step": 129526, "epoch": 3083} {"train_loss": -6.648038512184506, "global_step": 129527, "epoch": 3083, "val_loss": 77690.4140625} {"train_loss": -6.693810939788818, "global_step": 129528, "epoch": 3084} {"train_loss": -6.678216934204102, "global_step": 129529, "epoch": 3084} {"train_loss": -6.692919731140137, "global_step": 129530, "epoch": 3084} {"train_loss": -6.601766586303711, "global_step": 129531, "epoch": 3084} {"train_loss": -6.693482398986816, "global_step": 129532, "epoch": 3084} {"train_loss": -6.702089309692383, "global_step": 129533, "epoch": 3084} {"train_loss": -6.683682441711426, "global_step": 129534, "epoch": 3084} {"train_loss": -6.609796524047852, "global_step": 129535, "epoch": 3084} {"train_loss": -6.564074993133545, "global_step": 129536, "epoch": 3084} {"train_loss": -6.714842319488525, "global_step": 129537, "epoch": 3084} {"train_loss": -6.697417259216309, "global_step": 129538, "epoch": 3084} {"train_loss": -6.603376388549805, "global_step": 129539, "epoch": 3084} {"train_loss": -6.655645847320557, "global_step": 129540, "epoch": 3084} {"train_loss": -6.572128772735596, "global_step": 129541, "epoch": 3084} {"train_loss": -6.628383159637451, "global_step": 129542, "epoch": 3084} {"train_loss": -6.774333477020264, "global_step": 129543, "epoch": 3084} {"train_loss": -6.602836608886719, "global_step": 129544, "epoch": 3084} {"train_loss": -6.623051643371582, "global_step": 129545, "epoch": 3084} {"train_loss": -6.768741607666016, "global_step": 129546, "epoch": 3084} {"train_loss": -6.698264122009277, "global_step": 129547, "epoch": 3084} {"train_loss": -6.672000885009766, "global_step": 129548, "epoch": 3084} {"train_loss": -6.741827011108398, "global_step": 129549, "epoch": 3084} {"train_loss": -6.616114139556885, "global_step": 129550, "epoch": 3084} {"train_loss": -6.7640533447265625, "global_step": 129551, "epoch": 3084} {"train_loss": -6.671346664428711, "global_step": 129552, "epoch": 3084} {"train_loss": -6.718871116638184, "global_step": 129553, "epoch": 3084} {"train_loss": -6.750589370727539, "global_step": 129554, "epoch": 3084} {"train_loss": -6.72151517868042, "global_step": 129555, "epoch": 3084} {"train_loss": -6.543713569641113, "global_step": 129556, "epoch": 3084} {"train_loss": -6.654818534851074, "global_step": 129557, "epoch": 3084} {"train_loss": -6.779117107391357, "global_step": 129558, "epoch": 3084} {"train_loss": -6.721489906311035, "global_step": 129559, "epoch": 3084} {"train_loss": -6.574399948120117, "global_step": 129560, "epoch": 3084} {"train_loss": -6.76606559753418, "global_step": 129561, "epoch": 3084} {"train_loss": -6.6454949378967285, "global_step": 129562, "epoch": 3084} {"train_loss": -6.617082595825195, "global_step": 129563, "epoch": 3084} {"train_loss": -6.6231794357299805, "global_step": 129564, "epoch": 3084} {"train_loss": -6.65843391418457, "global_step": 129565, "epoch": 3084} {"train_loss": -6.704189300537109, "global_step": 129566, "epoch": 3084} {"train_loss": -6.695908069610596, "global_step": 129567, "epoch": 3084} {"train_loss": -6.656792163848877, "global_step": 129568, "epoch": 3084} {"train_loss": -6.670239017123268, "global_step": 129569, "epoch": 3084, "val_loss": 77347.0625} {"train_loss": -6.663538455963135, "global_step": 129570, "epoch": 3085} {"train_loss": -6.679220676422119, "global_step": 129571, "epoch": 3085} {"train_loss": -6.7230730056762695, "global_step": 129572, "epoch": 3085} {"train_loss": -6.6406121253967285, "global_step": 129573, "epoch": 3085} {"train_loss": -6.640652656555176, "global_step": 129574, "epoch": 3085} {"train_loss": -6.670629501342773, "global_step": 129575, "epoch": 3085} {"train_loss": -6.678354263305664, "global_step": 129576, "epoch": 3085} {"train_loss": -6.737473487854004, "global_step": 129577, "epoch": 3085} {"train_loss": -6.644881248474121, "global_step": 129578, "epoch": 3085} {"train_loss": -6.764710903167725, "global_step": 129579, "epoch": 3085} {"train_loss": -6.636545181274414, "global_step": 129580, "epoch": 3085} {"train_loss": -6.808788299560547, "global_step": 129581, "epoch": 3085} {"train_loss": -6.646510124206543, "global_step": 129582, "epoch": 3085} {"train_loss": -6.633313179016113, "global_step": 129583, "epoch": 3085} {"train_loss": -6.718392372131348, "global_step": 129584, "epoch": 3085} {"train_loss": -6.588160037994385, "global_step": 129585, "epoch": 3085} {"train_loss": -6.799999237060547, "global_step": 129586, "epoch": 3085} {"train_loss": -6.665369033813477, "global_step": 129587, "epoch": 3085} {"train_loss": -6.653420925140381, "global_step": 129588, "epoch": 3085} {"train_loss": -6.774823188781738, "global_step": 129589, "epoch": 3085} {"train_loss": -6.733887672424316, "global_step": 129590, "epoch": 3085} {"train_loss": -6.59208345413208, "global_step": 129591, "epoch": 3085} {"train_loss": -6.677763938903809, "global_step": 129592, "epoch": 3085} {"train_loss": -6.617110252380371, "global_step": 129593, "epoch": 3085} {"train_loss": -6.562705993652344, "global_step": 129594, "epoch": 3085} {"train_loss": -6.686933994293213, "global_step": 129595, "epoch": 3085} {"train_loss": -6.757102012634277, "global_step": 129596, "epoch": 3085} {"train_loss": -6.720207214355469, "global_step": 129597, "epoch": 3085} {"train_loss": -6.702419281005859, "global_step": 129598, "epoch": 3085} {"train_loss": -6.606204032897949, "global_step": 129599, "epoch": 3085} {"train_loss": -6.619068145751953, "global_step": 129600, "epoch": 3085} {"train_loss": -6.74744987487793, "global_step": 129601, "epoch": 3085} {"train_loss": -6.762457847595215, "global_step": 129602, "epoch": 3085} {"train_loss": -6.796957969665527, "global_step": 129603, "epoch": 3085} {"train_loss": -6.89058780670166, "global_step": 129604, "epoch": 3085} {"train_loss": -6.772796630859375, "global_step": 129605, "epoch": 3085} {"train_loss": -6.671941757202148, "global_step": 129606, "epoch": 3085} {"train_loss": -6.674009323120117, "global_step": 129607, "epoch": 3085} {"train_loss": -6.696625232696533, "global_step": 129608, "epoch": 3085} {"train_loss": -6.598105430603027, "global_step": 129609, "epoch": 3085} {"train_loss": -6.675122261047363, "global_step": 129610, "epoch": 3085} {"train_loss": -6.691581794193813, "global_step": 129611, "epoch": 3085, "val_loss": 77640.4296875} {"train_loss": -6.682982444763184, "global_step": 129612, "epoch": 3086} {"train_loss": -6.795686721801758, "global_step": 129613, "epoch": 3086} {"train_loss": -6.53597354888916, "global_step": 129614, "epoch": 3086} {"train_loss": -6.680410861968994, "global_step": 129615, "epoch": 3086} {"train_loss": -6.639471054077148, "global_step": 129616, "epoch": 3086} {"train_loss": -6.62256383895874, "global_step": 129617, "epoch": 3086} {"train_loss": -6.61557149887085, "global_step": 129618, "epoch": 3086} {"train_loss": -6.721915245056152, "global_step": 129619, "epoch": 3086} {"train_loss": -6.592843532562256, "global_step": 129620, "epoch": 3086} {"train_loss": -6.767227649688721, "global_step": 129621, "epoch": 3086} {"train_loss": -6.4663848876953125, "global_step": 129622, "epoch": 3086} {"train_loss": -6.580775260925293, "global_step": 129623, "epoch": 3086} {"train_loss": -6.687872886657715, "global_step": 129624, "epoch": 3086} {"train_loss": -6.701096534729004, "global_step": 129625, "epoch": 3086} {"train_loss": -6.648244857788086, "global_step": 129626, "epoch": 3086} {"train_loss": -6.526277542114258, "global_step": 129627, "epoch": 3086} {"train_loss": -6.667024612426758, "global_step": 129628, "epoch": 3086} {"train_loss": -6.717830657958984, "global_step": 129629, "epoch": 3086} {"train_loss": -6.620112419128418, "global_step": 129630, "epoch": 3086} {"train_loss": -6.596510410308838, "global_step": 129631, "epoch": 3086} {"train_loss": -6.681868553161621, "global_step": 129632, "epoch": 3086} {"train_loss": -6.6076765060424805, "global_step": 129633, "epoch": 3086} {"train_loss": -6.733298301696777, "global_step": 129634, "epoch": 3086} {"train_loss": -6.595424652099609, "global_step": 129635, "epoch": 3086} {"train_loss": -6.7804975509643555, "global_step": 129636, "epoch": 3086} {"train_loss": -6.630277633666992, "global_step": 129637, "epoch": 3086} {"train_loss": -6.572689056396484, "global_step": 129638, "epoch": 3086} {"train_loss": -6.747368335723877, "global_step": 129639, "epoch": 3086} {"train_loss": -6.603510856628418, "global_step": 129640, "epoch": 3086} {"train_loss": -6.5493645668029785, "global_step": 129641, "epoch": 3086} {"train_loss": -6.666211128234863, "global_step": 129642, "epoch": 3086} {"train_loss": -6.689663887023926, "global_step": 129643, "epoch": 3086} {"train_loss": -6.537187576293945, "global_step": 129644, "epoch": 3086} {"train_loss": -6.638115406036377, "global_step": 129645, "epoch": 3086} {"train_loss": -6.577638626098633, "global_step": 129646, "epoch": 3086} {"train_loss": -6.512356758117676, "global_step": 129647, "epoch": 3086} {"train_loss": -6.49631404876709, "global_step": 129648, "epoch": 3086} {"train_loss": -6.57832145690918, "global_step": 129649, "epoch": 3086} {"train_loss": -6.535709381103516, "global_step": 129650, "epoch": 3086} {"train_loss": -6.644896507263184, "global_step": 129651, "epoch": 3086} {"train_loss": -6.545293807983398, "global_step": 129652, "epoch": 3086} {"train_loss": -6.631119852974301, "global_step": 129653, "epoch": 3086, "val_loss": 77208.015625} {"train_loss": -6.643596649169922, "global_step": 129654, "epoch": 3087} {"train_loss": -6.564239501953125, "global_step": 129655, "epoch": 3087} {"train_loss": -6.757102966308594, "global_step": 129656, "epoch": 3087} {"train_loss": -6.7407612800598145, "global_step": 129657, "epoch": 3087} {"train_loss": -6.612649917602539, "global_step": 129658, "epoch": 3087} {"train_loss": -6.554389953613281, "global_step": 129659, "epoch": 3087} {"train_loss": -6.631735324859619, "global_step": 129660, "epoch": 3087} {"train_loss": -6.536282062530518, "global_step": 129661, "epoch": 3087} {"train_loss": -6.740401268005371, "global_step": 129662, "epoch": 3087} {"train_loss": -6.679478168487549, "global_step": 129663, "epoch": 3087} {"train_loss": -6.661955833435059, "global_step": 129664, "epoch": 3087} {"train_loss": -6.702002048492432, "global_step": 129665, "epoch": 3087} {"train_loss": -6.537153244018555, "global_step": 129666, "epoch": 3087} {"train_loss": -6.653825759887695, "global_step": 129667, "epoch": 3087} {"train_loss": -6.803903579711914, "global_step": 129668, "epoch": 3087} {"train_loss": -6.630685806274414, "global_step": 129669, "epoch": 3087} {"train_loss": -6.744579792022705, "global_step": 129670, "epoch": 3087} {"train_loss": -6.693742752075195, "global_step": 129671, "epoch": 3087} {"train_loss": -6.6522626876831055, "global_step": 129672, "epoch": 3087} {"train_loss": -6.614694595336914, "global_step": 129673, "epoch": 3087} {"train_loss": -6.673971652984619, "global_step": 129674, "epoch": 3087} {"train_loss": -6.604475021362305, "global_step": 129675, "epoch": 3087} {"train_loss": -6.627360820770264, "global_step": 129676, "epoch": 3087} {"train_loss": -6.701408386230469, "global_step": 129677, "epoch": 3087} {"train_loss": -6.650153160095215, "global_step": 129678, "epoch": 3087} {"train_loss": -6.674474716186523, "global_step": 129679, "epoch": 3087} {"train_loss": -6.551019668579102, "global_step": 129680, "epoch": 3087} {"train_loss": -6.571310520172119, "global_step": 129681, "epoch": 3087} {"train_loss": -6.651248931884766, "global_step": 129682, "epoch": 3087} {"train_loss": -6.745352268218994, "global_step": 129683, "epoch": 3087} {"train_loss": -6.67312479019165, "global_step": 129684, "epoch": 3087} {"train_loss": -6.618133544921875, "global_step": 129685, "epoch": 3087} {"train_loss": -6.674310684204102, "global_step": 129686, "epoch": 3087} {"train_loss": -6.668622016906738, "global_step": 129687, "epoch": 3087} {"train_loss": -6.700005531311035, "global_step": 129688, "epoch": 3087} {"train_loss": -6.759820938110352, "global_step": 129689, "epoch": 3087} {"train_loss": -6.733640670776367, "global_step": 129690, "epoch": 3087} {"train_loss": -6.593737602233887, "global_step": 129691, "epoch": 3087} {"train_loss": -6.553753852844238, "global_step": 129692, "epoch": 3087} {"train_loss": -6.51859712600708, "global_step": 129693, "epoch": 3087} {"train_loss": -6.6081695556640625, "global_step": 129694, "epoch": 3087} {"train_loss": -6.649662812550862, "global_step": 129695, "epoch": 3087, "val_loss": 77479.140625} {"train_loss": -6.547774314880371, "global_step": 129696, "epoch": 3088} {"train_loss": -6.627912998199463, "global_step": 129697, "epoch": 3088} {"train_loss": -6.729882717132568, "global_step": 129698, "epoch": 3088} {"train_loss": -6.645764350891113, "global_step": 129699, "epoch": 3088} {"train_loss": -6.628059387207031, "global_step": 129700, "epoch": 3088} {"train_loss": -6.66348934173584, "global_step": 129701, "epoch": 3088} {"train_loss": -6.605129718780518, "global_step": 129702, "epoch": 3088} {"train_loss": -6.7119245529174805, "global_step": 129703, "epoch": 3088} {"train_loss": -6.8108296394348145, "global_step": 129704, "epoch": 3088} {"train_loss": -6.6823577880859375, "global_step": 129705, "epoch": 3088} {"train_loss": -6.802083969116211, "global_step": 129706, "epoch": 3088} {"train_loss": -6.639446258544922, "global_step": 129707, "epoch": 3088} {"train_loss": -6.587841987609863, "global_step": 129708, "epoch": 3088} {"train_loss": -6.779851913452148, "global_step": 129709, "epoch": 3088} {"train_loss": -6.573905944824219, "global_step": 129710, "epoch": 3088} {"train_loss": -6.628240585327148, "global_step": 129711, "epoch": 3088} {"train_loss": -6.656901836395264, "global_step": 129712, "epoch": 3088} {"train_loss": -6.619265556335449, "global_step": 129713, "epoch": 3088} {"train_loss": -6.757955551147461, "global_step": 129714, "epoch": 3088} {"train_loss": -6.679472923278809, "global_step": 129715, "epoch": 3088} {"train_loss": -6.716376304626465, "global_step": 129716, "epoch": 3088} {"train_loss": -6.56438684463501, "global_step": 129717, "epoch": 3088} {"train_loss": -6.644657135009766, "global_step": 129718, "epoch": 3088} {"train_loss": -6.721410751342773, "global_step": 129719, "epoch": 3088} {"train_loss": -6.714808464050293, "global_step": 129720, "epoch": 3088} {"train_loss": -6.6656389236450195, "global_step": 129721, "epoch": 3088} {"train_loss": -6.825091361999512, "global_step": 129722, "epoch": 3088} {"train_loss": -6.73387336730957, "global_step": 129723, "epoch": 3088} {"train_loss": -6.770480632781982, "global_step": 129724, "epoch": 3088} {"train_loss": -6.5058979988098145, "global_step": 129725, "epoch": 3088} {"train_loss": -6.521747589111328, "global_step": 129726, "epoch": 3088} {"train_loss": -6.845942497253418, "global_step": 129727, "epoch": 3088} {"train_loss": -6.652354717254639, "global_step": 129728, "epoch": 3088} {"train_loss": -6.628164291381836, "global_step": 129729, "epoch": 3088} {"train_loss": -6.745362281799316, "global_step": 129730, "epoch": 3088} {"train_loss": -6.6084489822387695, "global_step": 129731, "epoch": 3088} {"train_loss": -6.698914051055908, "global_step": 129732, "epoch": 3088} {"train_loss": -6.714609622955322, "global_step": 129733, "epoch": 3088} {"train_loss": -6.782740592956543, "global_step": 129734, "epoch": 3088} {"train_loss": -6.610561847686768, "global_step": 129735, "epoch": 3088} {"train_loss": -6.647211074829102, "global_step": 129736, "epoch": 3088} {"train_loss": -6.677900541396368, "global_step": 129737, "epoch": 3088, "val_loss": 77295.8515625} {"train_loss": -6.793055534362793, "global_step": 129738, "epoch": 3089} {"train_loss": -6.7344441413879395, "global_step": 129739, "epoch": 3089} {"train_loss": -6.832638740539551, "global_step": 129740, "epoch": 3089} {"train_loss": -6.732363700866699, "global_step": 129741, "epoch": 3089} {"train_loss": -6.7894792556762695, "global_step": 129742, "epoch": 3089} {"train_loss": -6.786565780639648, "global_step": 129743, "epoch": 3089} {"train_loss": -6.6710615158081055, "global_step": 129744, "epoch": 3089} {"train_loss": -6.6246724128723145, "global_step": 129745, "epoch": 3089} {"train_loss": -6.567187309265137, "global_step": 129746, "epoch": 3089} {"train_loss": -6.825188636779785, "global_step": 129747, "epoch": 3089} {"train_loss": -6.757936477661133, "global_step": 129748, "epoch": 3089} {"train_loss": -6.709384918212891, "global_step": 129749, "epoch": 3089} {"train_loss": -6.6442155838012695, "global_step": 129750, "epoch": 3089} {"train_loss": -6.710012912750244, "global_step": 129751, "epoch": 3089} {"train_loss": -6.64085578918457, "global_step": 129752, "epoch": 3089} {"train_loss": -6.757372856140137, "global_step": 129753, "epoch": 3089} {"train_loss": -6.686209678649902, "global_step": 129754, "epoch": 3089} {"train_loss": -6.489362716674805, "global_step": 129755, "epoch": 3089} {"train_loss": -6.659024238586426, "global_step": 129756, "epoch": 3089} {"train_loss": -6.773722171783447, "global_step": 129757, "epoch": 3089} {"train_loss": -6.753455638885498, "global_step": 129758, "epoch": 3089} {"train_loss": -6.590311050415039, "global_step": 129759, "epoch": 3089} {"train_loss": -6.63612174987793, "global_step": 129760, "epoch": 3089} {"train_loss": -6.5924835205078125, "global_step": 129761, "epoch": 3089} {"train_loss": -6.674002170562744, "global_step": 129762, "epoch": 3089} {"train_loss": -6.619378089904785, "global_step": 129763, "epoch": 3089} {"train_loss": -6.674074172973633, "global_step": 129764, "epoch": 3089} {"train_loss": -6.694883346557617, "global_step": 129765, "epoch": 3089} {"train_loss": -6.627847671508789, "global_step": 129766, "epoch": 3089} {"train_loss": -6.668083190917969, "global_step": 129767, "epoch": 3089} {"train_loss": -6.621516704559326, "global_step": 129768, "epoch": 3089} {"train_loss": -6.608654975891113, "global_step": 129769, "epoch": 3089} {"train_loss": -6.496899127960205, "global_step": 129770, "epoch": 3089} {"train_loss": -6.642679691314697, "global_step": 129771, "epoch": 3089} {"train_loss": -6.7829437255859375, "global_step": 129772, "epoch": 3089} {"train_loss": -6.55318546295166, "global_step": 129773, "epoch": 3089} {"train_loss": -6.635777950286865, "global_step": 129774, "epoch": 3089} {"train_loss": -6.631712913513184, "global_step": 129775, "epoch": 3089} {"train_loss": -6.69410514831543, "global_step": 129776, "epoch": 3089} {"train_loss": -6.6446638107299805, "global_step": 129777, "epoch": 3089} {"train_loss": -6.630527019500732, "global_step": 129778, "epoch": 3089} {"train_loss": -6.671813419886997, "global_step": 129779, "epoch": 3089, "val_loss": 77437.9453125} {"train_loss": -6.750547409057617, "global_step": 129780, "epoch": 3090} {"train_loss": -6.707352638244629, "global_step": 129781, "epoch": 3090} {"train_loss": -6.536290645599365, "global_step": 129782, "epoch": 3090} {"train_loss": -6.699322700500488, "global_step": 129783, "epoch": 3090} {"train_loss": -6.686933994293213, "global_step": 129784, "epoch": 3090} {"train_loss": -6.651162624359131, "global_step": 129785, "epoch": 3090} {"train_loss": -6.733037948608398, "global_step": 129786, "epoch": 3090} {"train_loss": -6.694546699523926, "global_step": 129787, "epoch": 3090} {"train_loss": -6.668331146240234, "global_step": 129788, "epoch": 3090} {"train_loss": -6.708654403686523, "global_step": 129789, "epoch": 3090} {"train_loss": -6.689996242523193, "global_step": 129790, "epoch": 3090} {"train_loss": -6.7132568359375, "global_step": 129791, "epoch": 3090} {"train_loss": -6.7429609298706055, "global_step": 129792, "epoch": 3090} {"train_loss": -6.693549156188965, "global_step": 129793, "epoch": 3090} {"train_loss": -6.674860954284668, "global_step": 129794, "epoch": 3090} {"train_loss": -6.714635372161865, "global_step": 129795, "epoch": 3090} {"train_loss": -6.729504585266113, "global_step": 129796, "epoch": 3090} {"train_loss": -6.6921796798706055, "global_step": 129797, "epoch": 3090} {"train_loss": -6.605372428894043, "global_step": 129798, "epoch": 3090} {"train_loss": -6.801044464111328, "global_step": 129799, "epoch": 3090} {"train_loss": -6.738739967346191, "global_step": 129800, "epoch": 3090} {"train_loss": -6.76286506652832, "global_step": 129801, "epoch": 3090} {"train_loss": -6.624840259552002, "global_step": 129802, "epoch": 3090} {"train_loss": -6.597392559051514, "global_step": 129803, "epoch": 3090} {"train_loss": -6.722647666931152, "global_step": 129804, "epoch": 3090} {"train_loss": -6.644908428192139, "global_step": 129805, "epoch": 3090} {"train_loss": -6.619616985321045, "global_step": 129806, "epoch": 3090} {"train_loss": -6.689774990081787, "global_step": 129807, "epoch": 3090} {"train_loss": -6.67413330078125, "global_step": 129808, "epoch": 3090} {"train_loss": -6.689449310302734, "global_step": 129809, "epoch": 3090} {"train_loss": -6.672215938568115, "global_step": 129810, "epoch": 3090} {"train_loss": -6.593593597412109, "global_step": 129811, "epoch": 3090} {"train_loss": -6.659426689147949, "global_step": 129812, "epoch": 3090} {"train_loss": -6.417654037475586, "global_step": 129813, "epoch": 3090} {"train_loss": -6.411736488342285, "global_step": 129814, "epoch": 3090} {"train_loss": -6.722904205322266, "global_step": 129815, "epoch": 3090} {"train_loss": -6.48824405670166, "global_step": 129816, "epoch": 3090} {"train_loss": -6.457378387451172, "global_step": 129817, "epoch": 3090} {"train_loss": -6.548325061798096, "global_step": 129818, "epoch": 3090} {"train_loss": -6.642106533050537, "global_step": 129819, "epoch": 3090} {"train_loss": -6.532930850982666, "global_step": 129820, "epoch": 3090} {"train_loss": -6.648633411952427, "global_step": 129821, "epoch": 3090, "val_loss": 77318.0625} {"train_loss": -6.670932292938232, "global_step": 129822, "epoch": 3091} {"train_loss": -6.331727504730225, "global_step": 129823, "epoch": 3091} {"train_loss": -6.727902412414551, "global_step": 129824, "epoch": 3091} {"train_loss": -6.372088432312012, "global_step": 129825, "epoch": 3091} {"train_loss": -6.5572710037231445, "global_step": 129826, "epoch": 3091} {"train_loss": -6.604071617126465, "global_step": 129827, "epoch": 3091} {"train_loss": -6.411481857299805, "global_step": 129828, "epoch": 3091} {"train_loss": -6.566118240356445, "global_step": 129829, "epoch": 3091} {"train_loss": -6.606248378753662, "global_step": 129830, "epoch": 3091} {"train_loss": -6.595280647277832, "global_step": 129831, "epoch": 3091} {"train_loss": -6.549965858459473, "global_step": 129832, "epoch": 3091} {"train_loss": -6.4099955558776855, "global_step": 129833, "epoch": 3091} {"train_loss": -6.714605808258057, "global_step": 129834, "epoch": 3091} {"train_loss": -6.4844255447387695, "global_step": 129835, "epoch": 3091} {"train_loss": -6.5461320877075195, "global_step": 129836, "epoch": 3091} {"train_loss": -6.588085174560547, "global_step": 129837, "epoch": 3091} {"train_loss": -6.689583778381348, "global_step": 129838, "epoch": 3091} {"train_loss": -6.537444114685059, "global_step": 129839, "epoch": 3091} {"train_loss": -6.531520843505859, "global_step": 129840, "epoch": 3091} {"train_loss": -6.538434028625488, "global_step": 129841, "epoch": 3091} {"train_loss": -6.587986946105957, "global_step": 129842, "epoch": 3091} {"train_loss": -6.670269012451172, "global_step": 129843, "epoch": 3091} {"train_loss": -6.681399345397949, "global_step": 129844, "epoch": 3091} {"train_loss": -6.689990997314453, "global_step": 129845, "epoch": 3091} {"train_loss": -6.638277530670166, "global_step": 129846, "epoch": 3091} {"train_loss": -6.604877471923828, "global_step": 129847, "epoch": 3091} {"train_loss": -6.605528354644775, "global_step": 129848, "epoch": 3091} {"train_loss": -6.737986087799072, "global_step": 129849, "epoch": 3091} {"train_loss": -6.596804141998291, "global_step": 129850, "epoch": 3091} {"train_loss": -6.769961357116699, "global_step": 129851, "epoch": 3091} {"train_loss": -6.630238056182861, "global_step": 129852, "epoch": 3091} {"train_loss": -6.684564113616943, "global_step": 129853, "epoch": 3091} {"train_loss": -6.652336597442627, "global_step": 129854, "epoch": 3091} {"train_loss": -6.696195602416992, "global_step": 129855, "epoch": 3091} {"train_loss": -6.685208320617676, "global_step": 129856, "epoch": 3091} {"train_loss": -6.630422115325928, "global_step": 129857, "epoch": 3091} {"train_loss": -6.66254997253418, "global_step": 129858, "epoch": 3091} {"train_loss": -6.667421817779541, "global_step": 129859, "epoch": 3091} {"train_loss": -6.71867561340332, "global_step": 129860, "epoch": 3091} {"train_loss": -6.643030643463135, "global_step": 129861, "epoch": 3091} {"train_loss": -6.675666332244873, "global_step": 129862, "epoch": 3091} {"train_loss": -6.613274971644084, "global_step": 129863, "epoch": 3091, "val_loss": 77571.8984375} {"train_loss": -6.661766052246094, "global_step": 129864, "epoch": 3092} {"train_loss": -6.807958602905273, "global_step": 129865, "epoch": 3092} {"train_loss": -6.6773600578308105, "global_step": 129866, "epoch": 3092} {"train_loss": -6.780940532684326, "global_step": 129867, "epoch": 3092} {"train_loss": -6.6956095695495605, "global_step": 129868, "epoch": 3092} {"train_loss": -6.820762634277344, "global_step": 129869, "epoch": 3092} {"train_loss": -6.653461933135986, "global_step": 129870, "epoch": 3092} {"train_loss": -6.601900100708008, "global_step": 129871, "epoch": 3092} {"train_loss": -6.719548225402832, "global_step": 129872, "epoch": 3092} {"train_loss": -6.74807596206665, "global_step": 129873, "epoch": 3092} {"train_loss": -6.596996784210205, "global_step": 129874, "epoch": 3092} {"train_loss": -6.678804397583008, "global_step": 129875, "epoch": 3092} {"train_loss": -6.6381916999816895, "global_step": 129876, "epoch": 3092} {"train_loss": -6.674411773681641, "global_step": 129877, "epoch": 3092} {"train_loss": -6.689300060272217, "global_step": 129878, "epoch": 3092} {"train_loss": -6.66805362701416, "global_step": 129879, "epoch": 3092} {"train_loss": -6.8280205726623535, "global_step": 129880, "epoch": 3092} {"train_loss": -6.691319465637207, "global_step": 129881, "epoch": 3092} {"train_loss": -6.7031049728393555, "global_step": 129882, "epoch": 3092} {"train_loss": -6.580104827880859, "global_step": 129883, "epoch": 3092} {"train_loss": -6.658729553222656, "global_step": 129884, "epoch": 3092} {"train_loss": -6.666349411010742, "global_step": 129885, "epoch": 3092} {"train_loss": -6.558809280395508, "global_step": 129886, "epoch": 3092} {"train_loss": -6.6100311279296875, "global_step": 129887, "epoch": 3092} {"train_loss": -6.534684181213379, "global_step": 129888, "epoch": 3092} {"train_loss": -6.634213447570801, "global_step": 129889, "epoch": 3092} {"train_loss": -6.624754905700684, "global_step": 129890, "epoch": 3092} {"train_loss": -6.667849540710449, "global_step": 129891, "epoch": 3092} {"train_loss": -6.638568878173828, "global_step": 129892, "epoch": 3092} {"train_loss": -6.519784927368164, "global_step": 129893, "epoch": 3092} {"train_loss": -6.702722072601318, "global_step": 129894, "epoch": 3092} {"train_loss": -6.784865379333496, "global_step": 129895, "epoch": 3092} {"train_loss": -6.5582075119018555, "global_step": 129896, "epoch": 3092} {"train_loss": -6.620066165924072, "global_step": 129897, "epoch": 3092} {"train_loss": -6.591432571411133, "global_step": 129898, "epoch": 3092} {"train_loss": -6.787406921386719, "global_step": 129899, "epoch": 3092} {"train_loss": -6.638957500457764, "global_step": 129900, "epoch": 3092} {"train_loss": -6.563701629638672, "global_step": 129901, "epoch": 3092} {"train_loss": -6.523576736450195, "global_step": 129902, "epoch": 3092} {"train_loss": -6.695931911468506, "global_step": 129903, "epoch": 3092} {"train_loss": -6.499040126800537, "global_step": 129904, "epoch": 3092} {"train_loss": -6.6586983771551225, "global_step": 129905, "epoch": 3092, "val_loss": 77503.671875} {"train_loss": -6.65609884262085, "global_step": 129906, "epoch": 3093} {"train_loss": -6.787590026855469, "global_step": 129907, "epoch": 3093} {"train_loss": -6.641070365905762, "global_step": 129908, "epoch": 3093} {"train_loss": -6.814392566680908, "global_step": 129909, "epoch": 3093} {"train_loss": -6.6776442527771, "global_step": 129910, "epoch": 3093} {"train_loss": -6.717310905456543, "global_step": 129911, "epoch": 3093} {"train_loss": -6.70729923248291, "global_step": 129912, "epoch": 3093} {"train_loss": -6.611422538757324, "global_step": 129913, "epoch": 3093} {"train_loss": -6.705169677734375, "global_step": 129914, "epoch": 3093} {"train_loss": -6.63234806060791, "global_step": 129915, "epoch": 3093} {"train_loss": -6.646995544433594, "global_step": 129916, "epoch": 3093} {"train_loss": -6.743443489074707, "global_step": 129917, "epoch": 3093} {"train_loss": -6.615342140197754, "global_step": 129918, "epoch": 3093} {"train_loss": -6.701007843017578, "global_step": 129919, "epoch": 3093} {"train_loss": -6.630126953125, "global_step": 129920, "epoch": 3093} {"train_loss": -6.587471008300781, "global_step": 129921, "epoch": 3093} {"train_loss": -6.6827545166015625, "global_step": 129922, "epoch": 3093} {"train_loss": -6.675530433654785, "global_step": 129923, "epoch": 3093} {"train_loss": -6.567631721496582, "global_step": 129924, "epoch": 3093} {"train_loss": -6.707165718078613, "global_step": 129925, "epoch": 3093} {"train_loss": -6.721229553222656, "global_step": 129926, "epoch": 3093} {"train_loss": -6.487586975097656, "global_step": 129927, "epoch": 3093} {"train_loss": -6.665308475494385, "global_step": 129928, "epoch": 3093} {"train_loss": -6.589921474456787, "global_step": 129929, "epoch": 3093} {"train_loss": -6.658078193664551, "global_step": 129930, "epoch": 3093} {"train_loss": -6.716158866882324, "global_step": 129931, "epoch": 3093} {"train_loss": -6.487249851226807, "global_step": 129932, "epoch": 3093} {"train_loss": -6.732362747192383, "global_step": 129933, "epoch": 3093} {"train_loss": -6.560990333557129, "global_step": 129934, "epoch": 3093} {"train_loss": -6.578376770019531, "global_step": 129935, "epoch": 3093} {"train_loss": -6.6534929275512695, "global_step": 129936, "epoch": 3093} {"train_loss": -6.563664436340332, "global_step": 129937, "epoch": 3093} {"train_loss": -6.611769676208496, "global_step": 129938, "epoch": 3093} {"train_loss": -6.652918338775635, "global_step": 129939, "epoch": 3093} {"train_loss": -6.55662727355957, "global_step": 129940, "epoch": 3093} {"train_loss": -6.581256866455078, "global_step": 129941, "epoch": 3093} {"train_loss": -6.6404709815979, "global_step": 129942, "epoch": 3093} {"train_loss": -6.61279821395874, "global_step": 129943, "epoch": 3093} {"train_loss": -6.622966289520264, "global_step": 129944, "epoch": 3093} {"train_loss": -6.710378170013428, "global_step": 129945, "epoch": 3093} {"train_loss": -6.688329696655273, "global_step": 129946, "epoch": 3093} {"train_loss": -6.648611647742135, "global_step": 129947, "epoch": 3093, "val_loss": 77329.9921875} {"train_loss": -6.6427106857299805, "global_step": 129948, "epoch": 3094} {"train_loss": -6.648283004760742, "global_step": 129949, "epoch": 3094} {"train_loss": -6.8215179443359375, "global_step": 129950, "epoch": 3094} {"train_loss": -6.655875205993652, "global_step": 129951, "epoch": 3094} {"train_loss": -6.684978485107422, "global_step": 129952, "epoch": 3094} {"train_loss": -6.618753433227539, "global_step": 129953, "epoch": 3094} {"train_loss": -6.695320129394531, "global_step": 129954, "epoch": 3094} {"train_loss": -6.691871166229248, "global_step": 129955, "epoch": 3094} {"train_loss": -6.598170280456543, "global_step": 129956, "epoch": 3094} {"train_loss": -6.669380187988281, "global_step": 129957, "epoch": 3094} {"train_loss": -6.808049201965332, "global_step": 129958, "epoch": 3094} {"train_loss": -6.707805633544922, "global_step": 129959, "epoch": 3094} {"train_loss": -6.819923400878906, "global_step": 129960, "epoch": 3094} {"train_loss": -6.565968990325928, "global_step": 129961, "epoch": 3094} {"train_loss": -6.73318338394165, "global_step": 129962, "epoch": 3094} {"train_loss": -6.787295341491699, "global_step": 129963, "epoch": 3094} {"train_loss": -6.631385803222656, "global_step": 129964, "epoch": 3094} {"train_loss": -6.6562371253967285, "global_step": 129965, "epoch": 3094} {"train_loss": -6.705255031585693, "global_step": 129966, "epoch": 3094} {"train_loss": -6.766391754150391, "global_step": 129967, "epoch": 3094} {"train_loss": -6.629322528839111, "global_step": 129968, "epoch": 3094} {"train_loss": -6.609230041503906, "global_step": 129969, "epoch": 3094} {"train_loss": -6.571093559265137, "global_step": 129970, "epoch": 3094} {"train_loss": -6.67617130279541, "global_step": 129971, "epoch": 3094} {"train_loss": -6.698896884918213, "global_step": 129972, "epoch": 3094} {"train_loss": -6.59698486328125, "global_step": 129973, "epoch": 3094} {"train_loss": -6.660318851470947, "global_step": 129974, "epoch": 3094} {"train_loss": -6.641819477081299, "global_step": 129975, "epoch": 3094} {"train_loss": -6.625054836273193, "global_step": 129976, "epoch": 3094} {"train_loss": -6.637231349945068, "global_step": 129977, "epoch": 3094} {"train_loss": -6.617099761962891, "global_step": 129978, "epoch": 3094} {"train_loss": -6.7017011642456055, "global_step": 129979, "epoch": 3094} {"train_loss": -6.6714067459106445, "global_step": 129980, "epoch": 3094} {"train_loss": -6.648416519165039, "global_step": 129981, "epoch": 3094} {"train_loss": -6.685108184814453, "global_step": 129982, "epoch": 3094} {"train_loss": -6.803769111633301, "global_step": 129983, "epoch": 3094} {"train_loss": -6.719598293304443, "global_step": 129984, "epoch": 3094} {"train_loss": -6.707986354827881, "global_step": 129985, "epoch": 3094} {"train_loss": -6.660077095031738, "global_step": 129986, "epoch": 3094} {"train_loss": -6.738709926605225, "global_step": 129987, "epoch": 3094} {"train_loss": -6.682863235473633, "global_step": 129988, "epoch": 3094} {"train_loss": -6.678055218287876, "global_step": 129989, "epoch": 3094, "val_loss": 77353.625} {"train_loss": -6.679975986480713, "global_step": 129990, "epoch": 3095} {"train_loss": -6.668204307556152, "global_step": 129991, "epoch": 3095} {"train_loss": -6.690239906311035, "global_step": 129992, "epoch": 3095} {"train_loss": -6.710930824279785, "global_step": 129993, "epoch": 3095} {"train_loss": -6.656050205230713, "global_step": 129994, "epoch": 3095} {"train_loss": -6.530192852020264, "global_step": 129995, "epoch": 3095} {"train_loss": -6.62972354888916, "global_step": 129996, "epoch": 3095} {"train_loss": -6.701379776000977, "global_step": 129997, "epoch": 3095} {"train_loss": -6.468194007873535, "global_step": 129998, "epoch": 3095} {"train_loss": -6.63169002532959, "global_step": 129999, "epoch": 3095} {"train_loss": -6.585445404052734, "global_step": 130000, "epoch": 3095} {"train_loss": -6.808955192565918, "global_step": 130001, "epoch": 3095} {"train_loss": -6.759642124176025, "global_step": 130002, "epoch": 3095} {"train_loss": -6.660318851470947, "global_step": 130003, "epoch": 3095} {"train_loss": -6.742889404296875, "global_step": 130004, "epoch": 3095} {"train_loss": -6.788427352905273, "global_step": 130005, "epoch": 3095} {"train_loss": -6.731339454650879, "global_step": 130006, "epoch": 3095} {"train_loss": -6.7808685302734375, "global_step": 130007, "epoch": 3095} {"train_loss": -6.579530239105225, "global_step": 130008, "epoch": 3095} {"train_loss": -6.611577033996582, "global_step": 130009, "epoch": 3095} {"train_loss": -6.706760406494141, "global_step": 130010, "epoch": 3095} {"train_loss": -6.722558975219727, "global_step": 130011, "epoch": 3095} {"train_loss": -6.701372146606445, "global_step": 130012, "epoch": 3095} {"train_loss": -6.655107498168945, "global_step": 130013, "epoch": 3095} {"train_loss": -6.703134536743164, "global_step": 130014, "epoch": 3095} {"train_loss": -6.739166259765625, "global_step": 130015, "epoch": 3095} {"train_loss": -6.776228427886963, "global_step": 130016, "epoch": 3095} {"train_loss": -6.7361907958984375, "global_step": 130017, "epoch": 3095} {"train_loss": -6.788632869720459, "global_step": 130018, "epoch": 3095} {"train_loss": -6.750441551208496, "global_step": 130019, "epoch": 3095} {"train_loss": -6.6453633308410645, "global_step": 130020, "epoch": 3095} {"train_loss": -6.774759292602539, "global_step": 130021, "epoch": 3095} {"train_loss": -6.699143409729004, "global_step": 130022, "epoch": 3095} {"train_loss": -6.689691543579102, "global_step": 130023, "epoch": 3095} {"train_loss": -6.675549030303955, "global_step": 130024, "epoch": 3095} {"train_loss": -6.746275901794434, "global_step": 130025, "epoch": 3095} {"train_loss": -6.632167339324951, "global_step": 130026, "epoch": 3095} {"train_loss": -6.664393424987793, "global_step": 130027, "epoch": 3095} {"train_loss": -6.627281665802002, "global_step": 130028, "epoch": 3095} {"train_loss": -6.65509033203125, "global_step": 130029, "epoch": 3095} {"train_loss": -6.788314342498779, "global_step": 130030, "epoch": 3095} {"train_loss": -6.689919312795003, "global_step": 130031, "epoch": 3095, "val_loss": 77389.734375} {"train_loss": -6.579424858093262, "global_step": 130032, "epoch": 3096} {"train_loss": -6.793920516967773, "global_step": 130033, "epoch": 3096} {"train_loss": -6.655405521392822, "global_step": 130034, "epoch": 3096} {"train_loss": -6.703887939453125, "global_step": 130035, "epoch": 3096} {"train_loss": -6.748669147491455, "global_step": 130036, "epoch": 3096} {"train_loss": -6.487325191497803, "global_step": 130037, "epoch": 3096} {"train_loss": -6.667445182800293, "global_step": 130038, "epoch": 3096} {"train_loss": -6.628164291381836, "global_step": 130039, "epoch": 3096} {"train_loss": -6.531687259674072, "global_step": 130040, "epoch": 3096} {"train_loss": -6.719968318939209, "global_step": 130041, "epoch": 3096} {"train_loss": -6.404313087463379, "global_step": 130042, "epoch": 3096} {"train_loss": -6.5577473640441895, "global_step": 130043, "epoch": 3096} {"train_loss": -6.631941795349121, "global_step": 130044, "epoch": 3096} {"train_loss": -6.536806106567383, "global_step": 130045, "epoch": 3096} {"train_loss": -6.4548726081848145, "global_step": 130046, "epoch": 3096} {"train_loss": -6.689525604248047, "global_step": 130047, "epoch": 3096} {"train_loss": -6.666510581970215, "global_step": 130048, "epoch": 3096} {"train_loss": -6.587490081787109, "global_step": 130049, "epoch": 3096} {"train_loss": -6.730727195739746, "global_step": 130050, "epoch": 3096} {"train_loss": -6.559036731719971, "global_step": 130051, "epoch": 3096} {"train_loss": -6.571288585662842, "global_step": 130052, "epoch": 3096} {"train_loss": -6.519503593444824, "global_step": 130053, "epoch": 3096} {"train_loss": -6.560624122619629, "global_step": 130054, "epoch": 3096} {"train_loss": -6.517112731933594, "global_step": 130055, "epoch": 3096} {"train_loss": -6.671055793762207, "global_step": 130056, "epoch": 3096} {"train_loss": -6.637393474578857, "global_step": 130057, "epoch": 3096} {"train_loss": -6.642233848571777, "global_step": 130058, "epoch": 3096} {"train_loss": -6.684600830078125, "global_step": 130059, "epoch": 3096} {"train_loss": -6.664383888244629, "global_step": 130060, "epoch": 3096} {"train_loss": -6.722226142883301, "global_step": 130061, "epoch": 3096} {"train_loss": -6.709751129150391, "global_step": 130062, "epoch": 3096} {"train_loss": -6.6389546394348145, "global_step": 130063, "epoch": 3096} {"train_loss": -6.703821182250977, "global_step": 130064, "epoch": 3096} {"train_loss": -6.580144882202148, "global_step": 130065, "epoch": 3096} {"train_loss": -6.649892807006836, "global_step": 130066, "epoch": 3096} {"train_loss": -6.6035308837890625, "global_step": 130067, "epoch": 3096} {"train_loss": -6.622398376464844, "global_step": 130068, "epoch": 3096} {"train_loss": -6.7444047927856445, "global_step": 130069, "epoch": 3096} {"train_loss": -6.470939636230469, "global_step": 130070, "epoch": 3096} {"train_loss": -6.619291305541992, "global_step": 130071, "epoch": 3096} {"train_loss": -6.653670310974121, "global_step": 130072, "epoch": 3096} {"train_loss": -6.620587439764114, "global_step": 130073, "epoch": 3096, "val_loss": 77487.734375} {"train_loss": -6.749336242675781, "global_step": 130074, "epoch": 3097} {"train_loss": -6.555158615112305, "global_step": 130075, "epoch": 3097} {"train_loss": -6.636106491088867, "global_step": 130076, "epoch": 3097} {"train_loss": -6.591488838195801, "global_step": 130077, "epoch": 3097} {"train_loss": -6.610396385192871, "global_step": 130078, "epoch": 3097} {"train_loss": -6.587402820587158, "global_step": 130079, "epoch": 3097} {"train_loss": -6.554069519042969, "global_step": 130080, "epoch": 3097} {"train_loss": -6.543312072753906, "global_step": 130081, "epoch": 3097} {"train_loss": -6.588013648986816, "global_step": 130082, "epoch": 3097} {"train_loss": -6.63441276550293, "global_step": 130083, "epoch": 3097} {"train_loss": -6.565443992614746, "global_step": 130084, "epoch": 3097} {"train_loss": -6.737964153289795, "global_step": 130085, "epoch": 3097} {"train_loss": -6.531704902648926, "global_step": 130086, "epoch": 3097} {"train_loss": -6.574419021606445, "global_step": 130087, "epoch": 3097} {"train_loss": -6.665214538574219, "global_step": 130088, "epoch": 3097} {"train_loss": -6.580991744995117, "global_step": 130089, "epoch": 3097} {"train_loss": -6.611665725708008, "global_step": 130090, "epoch": 3097} {"train_loss": -6.719025611877441, "global_step": 130091, "epoch": 3097} {"train_loss": -6.760758399963379, "global_step": 130092, "epoch": 3097} {"train_loss": -6.668851375579834, "global_step": 130093, "epoch": 3097} {"train_loss": -6.600053787231445, "global_step": 130094, "epoch": 3097} {"train_loss": -6.693230628967285, "global_step": 130095, "epoch": 3097} {"train_loss": -6.633643627166748, "global_step": 130096, "epoch": 3097} {"train_loss": -6.64453649520874, "global_step": 130097, "epoch": 3097} {"train_loss": -6.670405387878418, "global_step": 130098, "epoch": 3097} {"train_loss": -6.692477703094482, "global_step": 130099, "epoch": 3097} {"train_loss": -6.755129337310791, "global_step": 130100, "epoch": 3097} {"train_loss": -6.643067359924316, "global_step": 130101, "epoch": 3097} {"train_loss": -6.653304100036621, "global_step": 130102, "epoch": 3097} {"train_loss": -6.66361141204834, "global_step": 130103, "epoch": 3097} {"train_loss": -6.608880996704102, "global_step": 130104, "epoch": 3097} {"train_loss": -6.647373199462891, "global_step": 130105, "epoch": 3097} {"train_loss": -6.597024440765381, "global_step": 130106, "epoch": 3097} {"train_loss": -6.801592826843262, "global_step": 130107, "epoch": 3097} {"train_loss": -6.71462345123291, "global_step": 130108, "epoch": 3097} {"train_loss": -6.704656600952148, "global_step": 130109, "epoch": 3097} {"train_loss": -6.707211971282959, "global_step": 130110, "epoch": 3097} {"train_loss": -6.751770973205566, "global_step": 130111, "epoch": 3097} {"train_loss": -6.632865905761719, "global_step": 130112, "epoch": 3097} {"train_loss": -6.618186950683594, "global_step": 130113, "epoch": 3097} {"train_loss": -6.55817985534668, "global_step": 130114, "epoch": 3097} {"train_loss": -6.646244968686785, "global_step": 130115, "epoch": 3097, "val_loss": 77363.390625} {"train_loss": -6.789679527282715, "global_step": 130116, "epoch": 3098} {"train_loss": -6.675246715545654, "global_step": 130117, "epoch": 3098} {"train_loss": -6.703137397766113, "global_step": 130118, "epoch": 3098} {"train_loss": -6.72263240814209, "global_step": 130119, "epoch": 3098} {"train_loss": -6.68162727355957, "global_step": 130120, "epoch": 3098} {"train_loss": -6.759390830993652, "global_step": 130121, "epoch": 3098} {"train_loss": -6.68075704574585, "global_step": 130122, "epoch": 3098} {"train_loss": -6.6509785652160645, "global_step": 130123, "epoch": 3098} {"train_loss": -6.756176948547363, "global_step": 130124, "epoch": 3098} {"train_loss": -6.6213059425354, "global_step": 130125, "epoch": 3098} {"train_loss": -6.650572299957275, "global_step": 130126, "epoch": 3098} {"train_loss": -6.685096740722656, "global_step": 130127, "epoch": 3098} {"train_loss": -6.681260585784912, "global_step": 130128, "epoch": 3098} {"train_loss": -6.693411350250244, "global_step": 130129, "epoch": 3098} {"train_loss": -6.75537109375, "global_step": 130130, "epoch": 3098} {"train_loss": -6.701725959777832, "global_step": 130131, "epoch": 3098} {"train_loss": -6.722317695617676, "global_step": 130132, "epoch": 3098} {"train_loss": -6.665877342224121, "global_step": 130133, "epoch": 3098} {"train_loss": -6.686409950256348, "global_step": 130134, "epoch": 3098} {"train_loss": -6.608916282653809, "global_step": 130135, "epoch": 3098} {"train_loss": -6.719156742095947, "global_step": 130136, "epoch": 3098} {"train_loss": -6.716997146606445, "global_step": 130137, "epoch": 3098} {"train_loss": -6.718820571899414, "global_step": 130138, "epoch": 3098} {"train_loss": -6.64938497543335, "global_step": 130139, "epoch": 3098} {"train_loss": -6.692188739776611, "global_step": 130140, "epoch": 3098} {"train_loss": -6.676694393157959, "global_step": 130141, "epoch": 3098} {"train_loss": -6.6893720626831055, "global_step": 130142, "epoch": 3098} {"train_loss": -6.810675621032715, "global_step": 130143, "epoch": 3098} {"train_loss": -6.645481586456299, "global_step": 130144, "epoch": 3098} {"train_loss": -6.4986982345581055, "global_step": 130145, "epoch": 3098} {"train_loss": -6.6892008781433105, "global_step": 130146, "epoch": 3098} {"train_loss": -6.661980152130127, "global_step": 130147, "epoch": 3098} {"train_loss": -6.692097187042236, "global_step": 130148, "epoch": 3098} {"train_loss": -6.760222911834717, "global_step": 130149, "epoch": 3098} {"train_loss": -6.604475498199463, "global_step": 130150, "epoch": 3098} {"train_loss": -6.602545261383057, "global_step": 130151, "epoch": 3098} {"train_loss": -6.719394683837891, "global_step": 130152, "epoch": 3098} {"train_loss": -6.696735382080078, "global_step": 130153, "epoch": 3098} {"train_loss": -6.537304878234863, "global_step": 130154, "epoch": 3098} {"train_loss": -6.699499130249023, "global_step": 130155, "epoch": 3098} {"train_loss": -6.7952961921691895, "global_step": 130156, "epoch": 3098} {"train_loss": -6.687714712960379, "global_step": 130157, "epoch": 3098, "val_loss": 77443.328125} {"train_loss": -6.680888652801514, "global_step": 130158, "epoch": 3099} {"train_loss": -6.666213035583496, "global_step": 130159, "epoch": 3099} {"train_loss": -6.73473596572876, "global_step": 130160, "epoch": 3099} {"train_loss": -6.767940521240234, "global_step": 130161, "epoch": 3099} {"train_loss": -6.651637077331543, "global_step": 130162, "epoch": 3099} {"train_loss": -6.674775123596191, "global_step": 130163, "epoch": 3099} {"train_loss": -6.637700080871582, "global_step": 130164, "epoch": 3099} {"train_loss": -6.784192085266113, "global_step": 130165, "epoch": 3099} {"train_loss": -6.6659836769104, "global_step": 130166, "epoch": 3099} {"train_loss": -6.646658897399902, "global_step": 130167, "epoch": 3099} {"train_loss": -6.732117176055908, "global_step": 130168, "epoch": 3099} {"train_loss": -6.636252403259277, "global_step": 130169, "epoch": 3099} {"train_loss": -6.735332489013672, "global_step": 130170, "epoch": 3099} {"train_loss": -6.711440086364746, "global_step": 130171, "epoch": 3099} {"train_loss": -6.599212646484375, "global_step": 130172, "epoch": 3099} {"train_loss": -6.5988945960998535, "global_step": 130173, "epoch": 3099} {"train_loss": -6.581998825073242, "global_step": 130174, "epoch": 3099} {"train_loss": -6.731337070465088, "global_step": 130175, "epoch": 3099} {"train_loss": -6.575474739074707, "global_step": 130176, "epoch": 3099} {"train_loss": -6.746518135070801, "global_step": 130177, "epoch": 3099} {"train_loss": -6.690406799316406, "global_step": 130178, "epoch": 3099} {"train_loss": -6.709132194519043, "global_step": 130179, "epoch": 3099} {"train_loss": -6.69564151763916, "global_step": 130180, "epoch": 3099} {"train_loss": -6.618436813354492, "global_step": 130181, "epoch": 3099} {"train_loss": -6.70994234085083, "global_step": 130182, "epoch": 3099} {"train_loss": -6.713979721069336, "global_step": 130183, "epoch": 3099} {"train_loss": -6.859403133392334, "global_step": 130184, "epoch": 3099} {"train_loss": -6.569216251373291, "global_step": 130185, "epoch": 3099} {"train_loss": -6.533863067626953, "global_step": 130186, "epoch": 3099} {"train_loss": -6.622776985168457, "global_step": 130187, "epoch": 3099} {"train_loss": -6.63407039642334, "global_step": 130188, "epoch": 3099} {"train_loss": -6.650607585906982, "global_step": 130189, "epoch": 3099} {"train_loss": -6.701719284057617, "global_step": 130190, "epoch": 3099} {"train_loss": -6.702705383300781, "global_step": 130191, "epoch": 3099} {"train_loss": -6.6553144454956055, "global_step": 130192, "epoch": 3099} {"train_loss": -6.607304573059082, "global_step": 130193, "epoch": 3099} {"train_loss": -6.726508140563965, "global_step": 130194, "epoch": 3099} {"train_loss": -6.788602352142334, "global_step": 130195, "epoch": 3099} {"train_loss": -6.64715576171875, "global_step": 130196, "epoch": 3099} {"train_loss": -6.554388523101807, "global_step": 130197, "epoch": 3099} {"train_loss": -6.602900505065918, "global_step": 130198, "epoch": 3099} {"train_loss": -6.66892731757391, "global_step": 130199, "epoch": 3099, "val_loss": 77401.015625} {"train_loss": -6.5898637771606445, "global_step": 130200, "epoch": 3100} {"train_loss": -6.565362930297852, "global_step": 130201, "epoch": 3100} {"train_loss": -6.669069290161133, "global_step": 130202, "epoch": 3100} {"train_loss": -6.628161430358887, "global_step": 130203, "epoch": 3100} {"train_loss": -6.585232257843018, "global_step": 130204, "epoch": 3100} {"train_loss": -6.729674816131592, "global_step": 130205, "epoch": 3100} {"train_loss": -6.615729808807373, "global_step": 130206, "epoch": 3100} {"train_loss": -6.715381622314453, "global_step": 130207, "epoch": 3100} {"train_loss": -6.5376973152160645, "global_step": 130208, "epoch": 3100} {"train_loss": -6.618318557739258, "global_step": 130209, "epoch": 3100} {"train_loss": -6.645498275756836, "global_step": 130210, "epoch": 3100} {"train_loss": -6.5415449142456055, "global_step": 130211, "epoch": 3100} {"train_loss": -6.616114616394043, "global_step": 130212, "epoch": 3100} {"train_loss": -6.729291915893555, "global_step": 130213, "epoch": 3100} {"train_loss": -6.634468078613281, "global_step": 130214, "epoch": 3100} {"train_loss": -6.5829315185546875, "global_step": 130215, "epoch": 3100} {"train_loss": -6.767496585845947, "global_step": 130216, "epoch": 3100} {"train_loss": -6.7351789474487305, "global_step": 130217, "epoch": 3100} {"train_loss": -6.723575115203857, "global_step": 130218, "epoch": 3100} {"train_loss": -6.633841514587402, "global_step": 130219, "epoch": 3100} {"train_loss": -6.6562347412109375, "global_step": 130220, "epoch": 3100} {"train_loss": -6.601653099060059, "global_step": 130221, "epoch": 3100} {"train_loss": -6.7619476318359375, "global_step": 130222, "epoch": 3100} {"train_loss": -6.621791362762451, "global_step": 130223, "epoch": 3100} {"train_loss": -6.704310417175293, "global_step": 130224, "epoch": 3100} {"train_loss": -6.689772605895996, "global_step": 130225, "epoch": 3100} {"train_loss": -6.754519939422607, "global_step": 130226, "epoch": 3100} {"train_loss": -6.818544387817383, "global_step": 130227, "epoch": 3100} {"train_loss": -6.691832542419434, "global_step": 130228, "epoch": 3100} {"train_loss": -6.707876205444336, "global_step": 130229, "epoch": 3100} {"train_loss": -6.708076477050781, "global_step": 130230, "epoch": 3100} {"train_loss": -6.560037612915039, "global_step": 130231, "epoch": 3100} {"train_loss": -6.6034088134765625, "global_step": 130232, "epoch": 3100} {"train_loss": -6.6206254959106445, "global_step": 130233, "epoch": 3100} {"train_loss": -6.565893173217773, "global_step": 130234, "epoch": 3100} {"train_loss": -6.658260345458984, "global_step": 130235, "epoch": 3100} {"train_loss": -6.595160484313965, "global_step": 130236, "epoch": 3100} {"train_loss": -6.5477142333984375, "global_step": 130237, "epoch": 3100} {"train_loss": -6.612123012542725, "global_step": 130238, "epoch": 3100} {"train_loss": -6.6309309005737305, "global_step": 130239, "epoch": 3100} {"train_loss": -6.599767684936523, "global_step": 130240, "epoch": 3100} {"train_loss": -6.650392123631069, "global_step": 130241, "epoch": 3100, "train/sim_max_reward_0": 0.903675690539967, "train/sim_max_reward_1": 0.8924197456151612, "train/sim_max_reward_2": 0.310624889024496, "train/sim_max_reward_3": 0.14040378226609238, "train/sim_max_reward_4": 0.6325626867088413, "train/sim_max_reward_5": 0.5649695275699593, "test/sim_max_reward_4500000": 0.9709131694338511, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9258176175725297, "test/sim_max_reward_4500003": 0.9628623453207228, "test/sim_max_reward_4500004": 0.7137545281118096, "test/sim_max_reward_4500005": 0.16500081773178316, "test/sim_max_reward_4500006": 0.9877671476546983, "test/sim_max_reward_4500007": 0.9561174685396737, "test/sim_max_reward_4500008": 0.0019540404951729753, "test/sim_max_reward_4500009": 0.9623696128767645, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9683333318458106, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.005195534549579351, "test/sim_max_reward_4500014": 0.6989425052907535, "test/sim_max_reward_4500015": 0.9871457942812284, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.09416652611335351, "test/sim_max_reward_4500018": 0.4653829708725019, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8497426644031619, "test/sim_max_reward_4500022": 0.9375999520385938, "test/sim_max_reward_4500023": 0.509683004142205, "test/sim_max_reward_4500024": 0.24236279564353727, "test/sim_max_reward_4500025": 0.7052321024384209, "test/sim_max_reward_4500026": 0.9608929762529069, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.1954431040599846, "test/sim_max_reward_4500029": 0.11090555603323585, "test/sim_max_reward_4500030": 0.8809389117502718, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05180389644362541, "test/sim_max_reward_4500033": 0.09803330160819743, "test/sim_max_reward_4500034": 0.9837796339991507, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 0.8174508061827287, "test/sim_max_reward_4500037": 0.46692124157915865, "test/sim_max_reward_4500038": 0.8441832932427232, "test/sim_max_reward_4500039": 0.9367165307104195, "test/sim_max_reward_4500040": 0.9489185763247525, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.39436864976208164, "test/sim_max_reward_4500043": 0.2572913021353705, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.950185975662016, "test/sim_max_reward_4500046": 0.9203563364598593, "test/sim_max_reward_4500047": 0.9312079825721131, "test/sim_max_reward_4500048": 0.9809800977452391, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5741093869540862, "test/mean_score": 0.5855134707177465, "val_loss": 77634.984375} {"train_loss": -6.5717034339904785, "global_step": 130242, "epoch": 3101} {"train_loss": -6.562196254730225, "global_step": 130243, "epoch": 3101} {"train_loss": -6.724637508392334, "global_step": 130244, "epoch": 3101} {"train_loss": -6.633885860443115, "global_step": 130245, "epoch": 3101} {"train_loss": -6.6108293533325195, "global_step": 130246, "epoch": 3101} {"train_loss": -6.6761369705200195, "global_step": 130247, "epoch": 3101} {"train_loss": -6.55084228515625, "global_step": 130248, "epoch": 3101} {"train_loss": -6.5598554611206055, "global_step": 130249, "epoch": 3101} {"train_loss": -6.67064094543457, "global_step": 130250, "epoch": 3101} {"train_loss": -6.46010160446167, "global_step": 130251, "epoch": 3101} {"train_loss": -6.581989288330078, "global_step": 130252, "epoch": 3101} {"train_loss": -6.584451675415039, "global_step": 130253, "epoch": 3101} {"train_loss": -6.5366716384887695, "global_step": 130254, "epoch": 3101} {"train_loss": -6.585842132568359, "global_step": 130255, "epoch": 3101} {"train_loss": -6.625261306762695, "global_step": 130256, "epoch": 3101} {"train_loss": -6.625862121582031, "global_step": 130257, "epoch": 3101} {"train_loss": -6.568868160247803, "global_step": 130258, "epoch": 3101} {"train_loss": -6.607745170593262, "global_step": 130259, "epoch": 3101} {"train_loss": -6.767917633056641, "global_step": 130260, "epoch": 3101} {"train_loss": -6.682770252227783, "global_step": 130261, "epoch": 3101} {"train_loss": -6.608877658843994, "global_step": 130262, "epoch": 3101} {"train_loss": -6.806324005126953, "global_step": 130263, "epoch": 3101} {"train_loss": -6.570704460144043, "global_step": 130264, "epoch": 3101} {"train_loss": -6.773769378662109, "global_step": 130265, "epoch": 3101} {"train_loss": -6.641829490661621, "global_step": 130266, "epoch": 3101} {"train_loss": -6.677859306335449, "global_step": 130267, "epoch": 3101} {"train_loss": -6.682994365692139, "global_step": 130268, "epoch": 3101} {"train_loss": -6.662919044494629, "global_step": 130269, "epoch": 3101} {"train_loss": -6.658341407775879, "global_step": 130270, "epoch": 3101} {"train_loss": -6.68803596496582, "global_step": 130271, "epoch": 3101} {"train_loss": -6.641467094421387, "global_step": 130272, "epoch": 3101} {"train_loss": -6.683300971984863, "global_step": 130273, "epoch": 3101} {"train_loss": -6.800424575805664, "global_step": 130274, "epoch": 3101} {"train_loss": -6.6951584815979, "global_step": 130275, "epoch": 3101} {"train_loss": -6.6542205810546875, "global_step": 130276, "epoch": 3101} {"train_loss": -6.633157253265381, "global_step": 130277, "epoch": 3101} {"train_loss": -6.800307750701904, "global_step": 130278, "epoch": 3101} {"train_loss": -6.689910888671875, "global_step": 130279, "epoch": 3101} {"train_loss": -6.653579235076904, "global_step": 130280, "epoch": 3101} {"train_loss": -6.620545387268066, "global_step": 130281, "epoch": 3101} {"train_loss": -6.7555437088012695, "global_step": 130282, "epoch": 3101} {"train_loss": -6.651320673170543, "global_step": 130283, "epoch": 3101, "val_loss": 77606.4140625} {"train_loss": -6.690337181091309, "global_step": 130284, "epoch": 3102} {"train_loss": -6.672551155090332, "global_step": 130285, "epoch": 3102} {"train_loss": -6.637660980224609, "global_step": 130286, "epoch": 3102} {"train_loss": -6.802204608917236, "global_step": 130287, "epoch": 3102} {"train_loss": -6.786433219909668, "global_step": 130288, "epoch": 3102} {"train_loss": -6.737008094787598, "global_step": 130289, "epoch": 3102} {"train_loss": -6.557942867279053, "global_step": 130290, "epoch": 3102} {"train_loss": -6.7234930992126465, "global_step": 130291, "epoch": 3102} {"train_loss": -6.775937080383301, "global_step": 130292, "epoch": 3102} {"train_loss": -6.765913009643555, "global_step": 130293, "epoch": 3102} {"train_loss": -6.7651472091674805, "global_step": 130294, "epoch": 3102} {"train_loss": -6.684572219848633, "global_step": 130295, "epoch": 3102} {"train_loss": -6.64759635925293, "global_step": 130296, "epoch": 3102} {"train_loss": -6.557593822479248, "global_step": 130297, "epoch": 3102} {"train_loss": -6.610036373138428, "global_step": 130298, "epoch": 3102} {"train_loss": -6.58244514465332, "global_step": 130299, "epoch": 3102} {"train_loss": -6.635373115539551, "global_step": 130300, "epoch": 3102} {"train_loss": -6.731019020080566, "global_step": 130301, "epoch": 3102} {"train_loss": -6.590128421783447, "global_step": 130302, "epoch": 3102} {"train_loss": -6.654078960418701, "global_step": 130303, "epoch": 3102} {"train_loss": -6.727042198181152, "global_step": 130304, "epoch": 3102} {"train_loss": -6.703556537628174, "global_step": 130305, "epoch": 3102} {"train_loss": -6.56096887588501, "global_step": 130306, "epoch": 3102} {"train_loss": -6.6840620040893555, "global_step": 130307, "epoch": 3102} {"train_loss": -6.62819766998291, "global_step": 130308, "epoch": 3102} {"train_loss": -6.721010208129883, "global_step": 130309, "epoch": 3102} {"train_loss": -6.759479522705078, "global_step": 130310, "epoch": 3102} {"train_loss": -6.687832832336426, "global_step": 130311, "epoch": 3102} {"train_loss": -6.579789638519287, "global_step": 130312, "epoch": 3102} {"train_loss": -6.758905410766602, "global_step": 130313, "epoch": 3102} {"train_loss": -6.67620325088501, "global_step": 130314, "epoch": 3102} {"train_loss": -6.721604824066162, "global_step": 130315, "epoch": 3102} {"train_loss": -6.68477725982666, "global_step": 130316, "epoch": 3102} {"train_loss": -6.714858055114746, "global_step": 130317, "epoch": 3102} {"train_loss": -6.693286418914795, "global_step": 130318, "epoch": 3102} {"train_loss": -6.700469017028809, "global_step": 130319, "epoch": 3102} {"train_loss": -6.688562393188477, "global_step": 130320, "epoch": 3102} {"train_loss": -6.712869644165039, "global_step": 130321, "epoch": 3102} {"train_loss": -6.600765228271484, "global_step": 130322, "epoch": 3102} {"train_loss": -6.7769880294799805, "global_step": 130323, "epoch": 3102} {"train_loss": -6.788285255432129, "global_step": 130324, "epoch": 3102} {"train_loss": -6.689063151677449, "global_step": 130325, "epoch": 3102, "val_loss": 77222.984375} {"train_loss": -6.726018905639648, "global_step": 130326, "epoch": 3103} {"train_loss": -6.7683563232421875, "global_step": 130327, "epoch": 3103} {"train_loss": -6.703522205352783, "global_step": 130328, "epoch": 3103} {"train_loss": -6.733675479888916, "global_step": 130329, "epoch": 3103} {"train_loss": -6.836861610412598, "global_step": 130330, "epoch": 3103} {"train_loss": -6.734428405761719, "global_step": 130331, "epoch": 3103} {"train_loss": -6.786087989807129, "global_step": 130332, "epoch": 3103} {"train_loss": -6.568035125732422, "global_step": 130333, "epoch": 3103} {"train_loss": -6.686433792114258, "global_step": 130334, "epoch": 3103} {"train_loss": -6.612740993499756, "global_step": 130335, "epoch": 3103} {"train_loss": -6.63870906829834, "global_step": 130336, "epoch": 3103} {"train_loss": -6.625716686248779, "global_step": 130337, "epoch": 3103} {"train_loss": -6.732349395751953, "global_step": 130338, "epoch": 3103} {"train_loss": -6.624433517456055, "global_step": 130339, "epoch": 3103} {"train_loss": -6.7474446296691895, "global_step": 130340, "epoch": 3103} {"train_loss": -6.762685298919678, "global_step": 130341, "epoch": 3103} {"train_loss": -6.706143856048584, "global_step": 130342, "epoch": 3103} {"train_loss": -6.555122375488281, "global_step": 130343, "epoch": 3103} {"train_loss": -6.719986438751221, "global_step": 130344, "epoch": 3103} {"train_loss": -6.694781303405762, "global_step": 130345, "epoch": 3103} {"train_loss": -6.6681294441223145, "global_step": 130346, "epoch": 3103} {"train_loss": -6.768925666809082, "global_step": 130347, "epoch": 3103} {"train_loss": -6.749971389770508, "global_step": 130348, "epoch": 3103} {"train_loss": -6.744334697723389, "global_step": 130349, "epoch": 3103} {"train_loss": -6.732428550720215, "global_step": 130350, "epoch": 3103} {"train_loss": -6.672979354858398, "global_step": 130351, "epoch": 3103} {"train_loss": -6.729249954223633, "global_step": 130352, "epoch": 3103} {"train_loss": -6.650395393371582, "global_step": 130353, "epoch": 3103} {"train_loss": -6.70676326751709, "global_step": 130354, "epoch": 3103} {"train_loss": -6.691388130187988, "global_step": 130355, "epoch": 3103} {"train_loss": -6.682518005371094, "global_step": 130356, "epoch": 3103} {"train_loss": -6.812932968139648, "global_step": 130357, "epoch": 3103} {"train_loss": -6.778048515319824, "global_step": 130358, "epoch": 3103} {"train_loss": -6.599498748779297, "global_step": 130359, "epoch": 3103} {"train_loss": -6.692930221557617, "global_step": 130360, "epoch": 3103} {"train_loss": -6.6952033042907715, "global_step": 130361, "epoch": 3103} {"train_loss": -6.720568656921387, "global_step": 130362, "epoch": 3103} {"train_loss": -6.729185104370117, "global_step": 130363, "epoch": 3103} {"train_loss": -6.599332809448242, "global_step": 130364, "epoch": 3103} {"train_loss": -6.707928657531738, "global_step": 130365, "epoch": 3103} {"train_loss": -6.718653678894043, "global_step": 130366, "epoch": 3103} {"train_loss": -6.699825706936064, "global_step": 130367, "epoch": 3103, "val_loss": 77126.1640625} {"train_loss": -6.765030860900879, "global_step": 130368, "epoch": 3104} {"train_loss": -6.630127429962158, "global_step": 130369, "epoch": 3104} {"train_loss": -6.583852767944336, "global_step": 130370, "epoch": 3104} {"train_loss": -6.612646102905273, "global_step": 130371, "epoch": 3104} {"train_loss": -6.61012601852417, "global_step": 130372, "epoch": 3104} {"train_loss": -6.70082950592041, "global_step": 130373, "epoch": 3104} {"train_loss": -6.688579559326172, "global_step": 130374, "epoch": 3104} {"train_loss": -6.701972007751465, "global_step": 130375, "epoch": 3104} {"train_loss": -6.546045303344727, "global_step": 130376, "epoch": 3104} {"train_loss": -6.64675235748291, "global_step": 130377, "epoch": 3104} {"train_loss": -6.645133018493652, "global_step": 130378, "epoch": 3104} {"train_loss": -6.6852545738220215, "global_step": 130379, "epoch": 3104} {"train_loss": -6.757408142089844, "global_step": 130380, "epoch": 3104} {"train_loss": -6.491418838500977, "global_step": 130381, "epoch": 3104} {"train_loss": -6.544054985046387, "global_step": 130382, "epoch": 3104} {"train_loss": -6.525732040405273, "global_step": 130383, "epoch": 3104} {"train_loss": -6.477174282073975, "global_step": 130384, "epoch": 3104} {"train_loss": -6.668526649475098, "global_step": 130385, "epoch": 3104} {"train_loss": -6.550920486450195, "global_step": 130386, "epoch": 3104} {"train_loss": -6.8409104347229, "global_step": 130387, "epoch": 3104} {"train_loss": -6.597988128662109, "global_step": 130388, "epoch": 3104} {"train_loss": -6.7688140869140625, "global_step": 130389, "epoch": 3104} {"train_loss": -6.4622111320495605, "global_step": 130390, "epoch": 3104} {"train_loss": -6.623889923095703, "global_step": 130391, "epoch": 3104} {"train_loss": -6.716376304626465, "global_step": 130392, "epoch": 3104} {"train_loss": -6.5313873291015625, "global_step": 130393, "epoch": 3104} {"train_loss": -6.634921073913574, "global_step": 130394, "epoch": 3104} {"train_loss": -6.591769218444824, "global_step": 130395, "epoch": 3104} {"train_loss": -6.628243446350098, "global_step": 130396, "epoch": 3104} {"train_loss": -6.689876079559326, "global_step": 130397, "epoch": 3104} {"train_loss": -6.634632587432861, "global_step": 130398, "epoch": 3104} {"train_loss": -6.692485809326172, "global_step": 130399, "epoch": 3104} {"train_loss": -6.606561660766602, "global_step": 130400, "epoch": 3104} {"train_loss": -6.6629204750061035, "global_step": 130401, "epoch": 3104} {"train_loss": -6.613890647888184, "global_step": 130402, "epoch": 3104} {"train_loss": -6.805392742156982, "global_step": 130403, "epoch": 3104} {"train_loss": -6.675895690917969, "global_step": 130404, "epoch": 3104} {"train_loss": -6.665814399719238, "global_step": 130405, "epoch": 3104} {"train_loss": -6.656585216522217, "global_step": 130406, "epoch": 3104} {"train_loss": -6.626595497131348, "global_step": 130407, "epoch": 3104} {"train_loss": -6.640674114227295, "global_step": 130408, "epoch": 3104} {"train_loss": -6.638680798666818, "global_step": 130409, "epoch": 3104, "val_loss": 77595.984375} {"train_loss": -6.644220352172852, "global_step": 130410, "epoch": 3105} {"train_loss": -6.753300666809082, "global_step": 130411, "epoch": 3105} {"train_loss": -6.642419815063477, "global_step": 130412, "epoch": 3105} {"train_loss": -6.553630828857422, "global_step": 130413, "epoch": 3105} {"train_loss": -6.595815658569336, "global_step": 130414, "epoch": 3105} {"train_loss": -6.645348072052002, "global_step": 130415, "epoch": 3105} {"train_loss": -6.70536994934082, "global_step": 130416, "epoch": 3105} {"train_loss": -6.636312007904053, "global_step": 130417, "epoch": 3105} {"train_loss": -6.715932846069336, "global_step": 130418, "epoch": 3105} {"train_loss": -6.6701555252075195, "global_step": 130419, "epoch": 3105} {"train_loss": -6.592435359954834, "global_step": 130420, "epoch": 3105} {"train_loss": -6.560161590576172, "global_step": 130421, "epoch": 3105} {"train_loss": -6.601188659667969, "global_step": 130422, "epoch": 3105} {"train_loss": -6.612797737121582, "global_step": 130423, "epoch": 3105} {"train_loss": -6.620236396789551, "global_step": 130424, "epoch": 3105} {"train_loss": -6.593785285949707, "global_step": 130425, "epoch": 3105} {"train_loss": -6.636894226074219, "global_step": 130426, "epoch": 3105} {"train_loss": -6.6207990646362305, "global_step": 130427, "epoch": 3105} {"train_loss": -6.591348171234131, "global_step": 130428, "epoch": 3105} {"train_loss": -6.693403720855713, "global_step": 130429, "epoch": 3105} {"train_loss": -6.682136058807373, "global_step": 130430, "epoch": 3105} {"train_loss": -6.6734137535095215, "global_step": 130431, "epoch": 3105} {"train_loss": -6.620016574859619, "global_step": 130432, "epoch": 3105} {"train_loss": -6.691159725189209, "global_step": 130433, "epoch": 3105} {"train_loss": -6.71623420715332, "global_step": 130434, "epoch": 3105} {"train_loss": -6.58750057220459, "global_step": 130435, "epoch": 3105} {"train_loss": -6.734671592712402, "global_step": 130436, "epoch": 3105} {"train_loss": -6.645459175109863, "global_step": 130437, "epoch": 3105} {"train_loss": -6.729978561401367, "global_step": 130438, "epoch": 3105} {"train_loss": -6.736761093139648, "global_step": 130439, "epoch": 3105} {"train_loss": -6.684688568115234, "global_step": 130440, "epoch": 3105} {"train_loss": -6.5839691162109375, "global_step": 130441, "epoch": 3105} {"train_loss": -6.594875335693359, "global_step": 130442, "epoch": 3105} {"train_loss": -6.545301914215088, "global_step": 130443, "epoch": 3105} {"train_loss": -6.617763519287109, "global_step": 130444, "epoch": 3105} {"train_loss": -6.78010368347168, "global_step": 130445, "epoch": 3105} {"train_loss": -6.4896626472473145, "global_step": 130446, "epoch": 3105} {"train_loss": -6.538738250732422, "global_step": 130447, "epoch": 3105} {"train_loss": -6.561369895935059, "global_step": 130448, "epoch": 3105} {"train_loss": -6.563948631286621, "global_step": 130449, "epoch": 3105} {"train_loss": -6.716213226318359, "global_step": 130450, "epoch": 3105} {"train_loss": -6.639740149180095, "global_step": 130451, "epoch": 3105, "val_loss": 77524.2265625} {"train_loss": -6.736111640930176, "global_step": 130452, "epoch": 3106} {"train_loss": -6.662411212921143, "global_step": 130453, "epoch": 3106} {"train_loss": -6.672324180603027, "global_step": 130454, "epoch": 3106} {"train_loss": -6.663966655731201, "global_step": 130455, "epoch": 3106} {"train_loss": -6.701082229614258, "global_step": 130456, "epoch": 3106} {"train_loss": -6.6059465408325195, "global_step": 130457, "epoch": 3106} {"train_loss": -6.565393447875977, "global_step": 130458, "epoch": 3106} {"train_loss": -6.574189186096191, "global_step": 130459, "epoch": 3106} {"train_loss": -6.743838310241699, "global_step": 130460, "epoch": 3106} {"train_loss": -6.588456153869629, "global_step": 130461, "epoch": 3106} {"train_loss": -6.704180717468262, "global_step": 130462, "epoch": 3106} {"train_loss": -6.673649787902832, "global_step": 130463, "epoch": 3106} {"train_loss": -6.6762895584106445, "global_step": 130464, "epoch": 3106} {"train_loss": -6.626393795013428, "global_step": 130465, "epoch": 3106} {"train_loss": -6.638067245483398, "global_step": 130466, "epoch": 3106} {"train_loss": -6.623424053192139, "global_step": 130467, "epoch": 3106} {"train_loss": -6.594883918762207, "global_step": 130468, "epoch": 3106} {"train_loss": -6.586061477661133, "global_step": 130469, "epoch": 3106} {"train_loss": -6.770281791687012, "global_step": 130470, "epoch": 3106} {"train_loss": -6.530955791473389, "global_step": 130471, "epoch": 3106} {"train_loss": -6.716094017028809, "global_step": 130472, "epoch": 3106} {"train_loss": -6.70237398147583, "global_step": 130473, "epoch": 3106} {"train_loss": -6.657026290893555, "global_step": 130474, "epoch": 3106} {"train_loss": -6.752091884613037, "global_step": 130475, "epoch": 3106} {"train_loss": -6.676921367645264, "global_step": 130476, "epoch": 3106} {"train_loss": -6.757883071899414, "global_step": 130477, "epoch": 3106} {"train_loss": -6.7677812576293945, "global_step": 130478, "epoch": 3106} {"train_loss": -6.710137367248535, "global_step": 130479, "epoch": 3106} {"train_loss": -6.729604721069336, "global_step": 130480, "epoch": 3106} {"train_loss": -6.741503715515137, "global_step": 130481, "epoch": 3106} {"train_loss": -6.7267889976501465, "global_step": 130482, "epoch": 3106} {"train_loss": -6.665632247924805, "global_step": 130483, "epoch": 3106} {"train_loss": -6.7247843742370605, "global_step": 130484, "epoch": 3106} {"train_loss": -6.691161155700684, "global_step": 130485, "epoch": 3106} {"train_loss": -6.685944557189941, "global_step": 130486, "epoch": 3106} {"train_loss": -6.717614650726318, "global_step": 130487, "epoch": 3106} {"train_loss": -6.728798866271973, "global_step": 130488, "epoch": 3106} {"train_loss": -6.623124599456787, "global_step": 130489, "epoch": 3106} {"train_loss": -6.594897270202637, "global_step": 130490, "epoch": 3106} {"train_loss": -6.737482070922852, "global_step": 130491, "epoch": 3106} {"train_loss": -6.652417182922363, "global_step": 130492, "epoch": 3106} {"train_loss": -6.67838986714681, "global_step": 130493, "epoch": 3106, "val_loss": 77617.359375} {"train_loss": -6.703545570373535, "global_step": 130494, "epoch": 3107} {"train_loss": -6.718237400054932, "global_step": 130495, "epoch": 3107} {"train_loss": -6.752854824066162, "global_step": 130496, "epoch": 3107} {"train_loss": -6.648371696472168, "global_step": 130497, "epoch": 3107} {"train_loss": -6.489099502563477, "global_step": 130498, "epoch": 3107} {"train_loss": -6.626232624053955, "global_step": 130499, "epoch": 3107} {"train_loss": -6.679631233215332, "global_step": 130500, "epoch": 3107} {"train_loss": -6.660191535949707, "global_step": 130501, "epoch": 3107} {"train_loss": -6.6209821701049805, "global_step": 130502, "epoch": 3107} {"train_loss": -6.70139217376709, "global_step": 130503, "epoch": 3107} {"train_loss": -6.733275890350342, "global_step": 130504, "epoch": 3107} {"train_loss": -6.737524032592773, "global_step": 130505, "epoch": 3107} {"train_loss": -6.689134120941162, "global_step": 130506, "epoch": 3107} {"train_loss": -6.596900939941406, "global_step": 130507, "epoch": 3107} {"train_loss": -6.812262535095215, "global_step": 130508, "epoch": 3107} {"train_loss": -6.673210144042969, "global_step": 130509, "epoch": 3107} {"train_loss": -6.715883731842041, "global_step": 130510, "epoch": 3107} {"train_loss": -6.740767478942871, "global_step": 130511, "epoch": 3107} {"train_loss": -6.716524124145508, "global_step": 130512, "epoch": 3107} {"train_loss": -6.777410507202148, "global_step": 130513, "epoch": 3107} {"train_loss": -6.699034690856934, "global_step": 130514, "epoch": 3107} {"train_loss": -6.777312278747559, "global_step": 130515, "epoch": 3107} {"train_loss": -6.45574426651001, "global_step": 130516, "epoch": 3107} {"train_loss": -6.604962348937988, "global_step": 130517, "epoch": 3107} {"train_loss": -6.5729875564575195, "global_step": 130518, "epoch": 3107} {"train_loss": -6.596636772155762, "global_step": 130519, "epoch": 3107} {"train_loss": -6.596575736999512, "global_step": 130520, "epoch": 3107} {"train_loss": -6.520296096801758, "global_step": 130521, "epoch": 3107} {"train_loss": -6.529015064239502, "global_step": 130522, "epoch": 3107} {"train_loss": -6.783803462982178, "global_step": 130523, "epoch": 3107} {"train_loss": -6.673989295959473, "global_step": 130524, "epoch": 3107} {"train_loss": -6.762199878692627, "global_step": 130525, "epoch": 3107} {"train_loss": -6.6601033210754395, "global_step": 130526, "epoch": 3107} {"train_loss": -6.652083873748779, "global_step": 130527, "epoch": 3107} {"train_loss": -6.736769676208496, "global_step": 130528, "epoch": 3107} {"train_loss": -6.659366607666016, "global_step": 130529, "epoch": 3107} {"train_loss": -6.688556671142578, "global_step": 130530, "epoch": 3107} {"train_loss": -6.758029937744141, "global_step": 130531, "epoch": 3107} {"train_loss": -6.750213623046875, "global_step": 130532, "epoch": 3107} {"train_loss": -6.657988548278809, "global_step": 130533, "epoch": 3107} {"train_loss": -6.698601722717285, "global_step": 130534, "epoch": 3107} {"train_loss": -6.674496276038034, "global_step": 130535, "epoch": 3107, "val_loss": 77385.765625} {"train_loss": -6.735946178436279, "global_step": 130536, "epoch": 3108} {"train_loss": -6.660046100616455, "global_step": 130537, "epoch": 3108} {"train_loss": -6.6147356033325195, "global_step": 130538, "epoch": 3108} {"train_loss": -6.712474822998047, "global_step": 130539, "epoch": 3108} {"train_loss": -6.6389546394348145, "global_step": 130540, "epoch": 3108} {"train_loss": -6.768856048583984, "global_step": 130541, "epoch": 3108} {"train_loss": -6.649663925170898, "global_step": 130542, "epoch": 3108} {"train_loss": -6.650042533874512, "global_step": 130543, "epoch": 3108} {"train_loss": -6.653538703918457, "global_step": 130544, "epoch": 3108} {"train_loss": -6.631228923797607, "global_step": 130545, "epoch": 3108} {"train_loss": -6.569151878356934, "global_step": 130546, "epoch": 3108} {"train_loss": -6.730370998382568, "global_step": 130547, "epoch": 3108} {"train_loss": -6.577437400817871, "global_step": 130548, "epoch": 3108} {"train_loss": -6.681948661804199, "global_step": 130549, "epoch": 3108} {"train_loss": -6.7037434577941895, "global_step": 130550, "epoch": 3108} {"train_loss": -6.740944862365723, "global_step": 130551, "epoch": 3108} {"train_loss": -6.73884916305542, "global_step": 130552, "epoch": 3108} {"train_loss": -6.693049430847168, "global_step": 130553, "epoch": 3108} {"train_loss": -6.724996566772461, "global_step": 130554, "epoch": 3108} {"train_loss": -6.679803848266602, "global_step": 130555, "epoch": 3108} {"train_loss": -6.66618537902832, "global_step": 130556, "epoch": 3108} {"train_loss": -6.781520843505859, "global_step": 130557, "epoch": 3108} {"train_loss": -6.8916544914245605, "global_step": 130558, "epoch": 3108} {"train_loss": -6.725313663482666, "global_step": 130559, "epoch": 3108} {"train_loss": -6.711050987243652, "global_step": 130560, "epoch": 3108} {"train_loss": -6.810029029846191, "global_step": 130561, "epoch": 3108} {"train_loss": -6.677371501922607, "global_step": 130562, "epoch": 3108} {"train_loss": -6.678204536437988, "global_step": 130563, "epoch": 3108} {"train_loss": -6.734723091125488, "global_step": 130564, "epoch": 3108} {"train_loss": -6.7478461265563965, "global_step": 130565, "epoch": 3108} {"train_loss": -6.677556037902832, "global_step": 130566, "epoch": 3108} {"train_loss": -6.829038143157959, "global_step": 130567, "epoch": 3108} {"train_loss": -6.847815036773682, "global_step": 130568, "epoch": 3108} {"train_loss": -6.685162544250488, "global_step": 130569, "epoch": 3108} {"train_loss": -6.7349348068237305, "global_step": 130570, "epoch": 3108} {"train_loss": -6.67841100692749, "global_step": 130571, "epoch": 3108} {"train_loss": -6.6876983642578125, "global_step": 130572, "epoch": 3108} {"train_loss": -6.73897647857666, "global_step": 130573, "epoch": 3108} {"train_loss": -6.633140563964844, "global_step": 130574, "epoch": 3108} {"train_loss": -6.66507625579834, "global_step": 130575, "epoch": 3108} {"train_loss": -6.701213836669922, "global_step": 130576, "epoch": 3108} {"train_loss": -6.702178591773624, "global_step": 130577, "epoch": 3108, "val_loss": 77163.21875} {"train_loss": -6.695507526397705, "global_step": 130578, "epoch": 3109} {"train_loss": -6.602356910705566, "global_step": 130579, "epoch": 3109} {"train_loss": -6.65366268157959, "global_step": 130580, "epoch": 3109} {"train_loss": -6.562056064605713, "global_step": 130581, "epoch": 3109} {"train_loss": -6.5760498046875, "global_step": 130582, "epoch": 3109} {"train_loss": -6.811745643615723, "global_step": 130583, "epoch": 3109} {"train_loss": -6.589258193969727, "global_step": 130584, "epoch": 3109} {"train_loss": -6.609864234924316, "global_step": 130585, "epoch": 3109} {"train_loss": -6.633385181427002, "global_step": 130586, "epoch": 3109} {"train_loss": -6.668320655822754, "global_step": 130587, "epoch": 3109} {"train_loss": -6.64223575592041, "global_step": 130588, "epoch": 3109} {"train_loss": -6.6183905601501465, "global_step": 130589, "epoch": 3109} {"train_loss": -6.586806297302246, "global_step": 130590, "epoch": 3109} {"train_loss": -6.625321388244629, "global_step": 130591, "epoch": 3109} {"train_loss": -6.5795087814331055, "global_step": 130592, "epoch": 3109} {"train_loss": -6.697705268859863, "global_step": 130593, "epoch": 3109} {"train_loss": -6.713142395019531, "global_step": 130594, "epoch": 3109} {"train_loss": -6.610654830932617, "global_step": 130595, "epoch": 3109} {"train_loss": -6.694829940795898, "global_step": 130596, "epoch": 3109} {"train_loss": -6.530574798583984, "global_step": 130597, "epoch": 3109} {"train_loss": -6.608476638793945, "global_step": 130598, "epoch": 3109} {"train_loss": -6.556787490844727, "global_step": 130599, "epoch": 3109} {"train_loss": -6.701937675476074, "global_step": 130600, "epoch": 3109} {"train_loss": -6.616324424743652, "global_step": 130601, "epoch": 3109} {"train_loss": -6.804227828979492, "global_step": 130602, "epoch": 3109} {"train_loss": -6.628649711608887, "global_step": 130603, "epoch": 3109} {"train_loss": -6.605067729949951, "global_step": 130604, "epoch": 3109} {"train_loss": -6.663541316986084, "global_step": 130605, "epoch": 3109} {"train_loss": -6.64901065826416, "global_step": 130606, "epoch": 3109} {"train_loss": -6.614629745483398, "global_step": 130607, "epoch": 3109} {"train_loss": -6.641207695007324, "global_step": 130608, "epoch": 3109} {"train_loss": -6.715813636779785, "global_step": 130609, "epoch": 3109} {"train_loss": -6.709473609924316, "global_step": 130610, "epoch": 3109} {"train_loss": -6.6273369789123535, "global_step": 130611, "epoch": 3109} {"train_loss": -6.5512375831604, "global_step": 130612, "epoch": 3109} {"train_loss": -6.592545509338379, "global_step": 130613, "epoch": 3109} {"train_loss": -6.671405792236328, "global_step": 130614, "epoch": 3109} {"train_loss": -6.731810569763184, "global_step": 130615, "epoch": 3109} {"train_loss": -6.724350452423096, "global_step": 130616, "epoch": 3109} {"train_loss": -6.560178279876709, "global_step": 130617, "epoch": 3109} {"train_loss": -6.576287269592285, "global_step": 130618, "epoch": 3109} {"train_loss": -6.640245744160244, "global_step": 130619, "epoch": 3109, "val_loss": 77415.359375} {"train_loss": -6.57602596282959, "global_step": 130620, "epoch": 3110} {"train_loss": -6.661938667297363, "global_step": 130621, "epoch": 3110} {"train_loss": -6.729671478271484, "global_step": 130622, "epoch": 3110} {"train_loss": -6.746959209442139, "global_step": 130623, "epoch": 3110} {"train_loss": -6.666776657104492, "global_step": 130624, "epoch": 3110} {"train_loss": -6.7640557289123535, "global_step": 130625, "epoch": 3110} {"train_loss": -6.636487007141113, "global_step": 130626, "epoch": 3110} {"train_loss": -6.721961975097656, "global_step": 130627, "epoch": 3110} {"train_loss": -6.628973960876465, "global_step": 130628, "epoch": 3110} {"train_loss": -6.681775093078613, "global_step": 130629, "epoch": 3110} {"train_loss": -6.735597133636475, "global_step": 130630, "epoch": 3110} {"train_loss": -6.70734977722168, "global_step": 130631, "epoch": 3110} {"train_loss": -6.547884464263916, "global_step": 130632, "epoch": 3110} {"train_loss": -6.806727409362793, "global_step": 130633, "epoch": 3110} {"train_loss": -6.623354434967041, "global_step": 130634, "epoch": 3110} {"train_loss": -6.6743669509887695, "global_step": 130635, "epoch": 3110} {"train_loss": -6.594311714172363, "global_step": 130636, "epoch": 3110} {"train_loss": -6.682133674621582, "global_step": 130637, "epoch": 3110} {"train_loss": -6.7943572998046875, "global_step": 130638, "epoch": 3110} {"train_loss": -6.698442459106445, "global_step": 130639, "epoch": 3110} {"train_loss": -6.738347053527832, "global_step": 130640, "epoch": 3110} {"train_loss": -6.720767498016357, "global_step": 130641, "epoch": 3110} {"train_loss": -6.689348220825195, "global_step": 130642, "epoch": 3110} {"train_loss": -6.801900863647461, "global_step": 130643, "epoch": 3110} {"train_loss": -6.687479019165039, "global_step": 130644, "epoch": 3110} {"train_loss": -6.7510271072387695, "global_step": 130645, "epoch": 3110} {"train_loss": -6.755298137664795, "global_step": 130646, "epoch": 3110} {"train_loss": -6.792448043823242, "global_step": 130647, "epoch": 3110} {"train_loss": -6.64983606338501, "global_step": 130648, "epoch": 3110} {"train_loss": -6.618913650512695, "global_step": 130649, "epoch": 3110} {"train_loss": -6.684273719787598, "global_step": 130650, "epoch": 3110} {"train_loss": -6.776122093200684, "global_step": 130651, "epoch": 3110} {"train_loss": -6.788618564605713, "global_step": 130652, "epoch": 3110} {"train_loss": -6.725582599639893, "global_step": 130653, "epoch": 3110} {"train_loss": -6.785930156707764, "global_step": 130654, "epoch": 3110} {"train_loss": -6.673821449279785, "global_step": 130655, "epoch": 3110} {"train_loss": -6.680242538452148, "global_step": 130656, "epoch": 3110} {"train_loss": -6.675786972045898, "global_step": 130657, "epoch": 3110} {"train_loss": -6.778646469116211, "global_step": 130658, "epoch": 3110} {"train_loss": -6.738048553466797, "global_step": 130659, "epoch": 3110} {"train_loss": -6.686206817626953, "global_step": 130660, "epoch": 3110} {"train_loss": -6.701917784554618, "global_step": 130661, "epoch": 3110, "val_loss": 77459.1953125} {"train_loss": -6.7931413650512695, "global_step": 130662, "epoch": 3111} {"train_loss": -6.811582565307617, "global_step": 130663, "epoch": 3111} {"train_loss": -6.7130937576293945, "global_step": 130664, "epoch": 3111} {"train_loss": -6.68009090423584, "global_step": 130665, "epoch": 3111} {"train_loss": -6.622616767883301, "global_step": 130666, "epoch": 3111} {"train_loss": -6.562701225280762, "global_step": 130667, "epoch": 3111} {"train_loss": -6.772775650024414, "global_step": 130668, "epoch": 3111} {"train_loss": -6.724661350250244, "global_step": 130669, "epoch": 3111} {"train_loss": -6.723838806152344, "global_step": 130670, "epoch": 3111} {"train_loss": -6.717973232269287, "global_step": 130671, "epoch": 3111} {"train_loss": -6.675145626068115, "global_step": 130672, "epoch": 3111} {"train_loss": -6.678452491760254, "global_step": 130673, "epoch": 3111} {"train_loss": -6.684999465942383, "global_step": 130674, "epoch": 3111} {"train_loss": -6.696155548095703, "global_step": 130675, "epoch": 3111} {"train_loss": -6.704339027404785, "global_step": 130676, "epoch": 3111} {"train_loss": -6.686454772949219, "global_step": 130677, "epoch": 3111} {"train_loss": -6.675149917602539, "global_step": 130678, "epoch": 3111} {"train_loss": -6.592396259307861, "global_step": 130679, "epoch": 3111} {"train_loss": -6.733855247497559, "global_step": 130680, "epoch": 3111} {"train_loss": -6.598394870758057, "global_step": 130681, "epoch": 3111} {"train_loss": -6.672214508056641, "global_step": 130682, "epoch": 3111} {"train_loss": -6.7044782638549805, "global_step": 130683, "epoch": 3111} {"train_loss": -6.684781551361084, "global_step": 130684, "epoch": 3111} {"train_loss": -6.747204780578613, "global_step": 130685, "epoch": 3111} {"train_loss": -6.624029159545898, "global_step": 130686, "epoch": 3111} {"train_loss": -6.723756790161133, "global_step": 130687, "epoch": 3111} {"train_loss": -6.729599952697754, "global_step": 130688, "epoch": 3111} {"train_loss": -6.680108547210693, "global_step": 130689, "epoch": 3111} {"train_loss": -6.685037612915039, "global_step": 130690, "epoch": 3111} {"train_loss": -6.746114730834961, "global_step": 130691, "epoch": 3111} {"train_loss": -6.836987495422363, "global_step": 130692, "epoch": 3111} {"train_loss": -6.7640790939331055, "global_step": 130693, "epoch": 3111} {"train_loss": -6.704287052154541, "global_step": 130694, "epoch": 3111} {"train_loss": -6.70707893371582, "global_step": 130695, "epoch": 3111} {"train_loss": -6.739757537841797, "global_step": 130696, "epoch": 3111} {"train_loss": -6.673924922943115, "global_step": 130697, "epoch": 3111} {"train_loss": -6.7523040771484375, "global_step": 130698, "epoch": 3111} {"train_loss": -6.805973052978516, "global_step": 130699, "epoch": 3111} {"train_loss": -6.67510986328125, "global_step": 130700, "epoch": 3111} {"train_loss": -6.699355125427246, "global_step": 130701, "epoch": 3111} {"train_loss": -6.730834484100342, "global_step": 130702, "epoch": 3111} {"train_loss": -6.704667068663097, "global_step": 130703, "epoch": 3111, "val_loss": 77673.7421875} {"train_loss": -6.723953723907471, "global_step": 130704, "epoch": 3112} {"train_loss": -6.626010894775391, "global_step": 130705, "epoch": 3112} {"train_loss": -6.551677703857422, "global_step": 130706, "epoch": 3112} {"train_loss": -6.620875358581543, "global_step": 130707, "epoch": 3112} {"train_loss": -6.699838161468506, "global_step": 130708, "epoch": 3112} {"train_loss": -6.667656421661377, "global_step": 130709, "epoch": 3112} {"train_loss": -6.690896987915039, "global_step": 130710, "epoch": 3112} {"train_loss": -6.592350006103516, "global_step": 130711, "epoch": 3112} {"train_loss": -6.810525894165039, "global_step": 130712, "epoch": 3112} {"train_loss": -6.690271377563477, "global_step": 130713, "epoch": 3112} {"train_loss": -6.826622009277344, "global_step": 130714, "epoch": 3112} {"train_loss": -6.698036193847656, "global_step": 130715, "epoch": 3112} {"train_loss": -6.739554405212402, "global_step": 130716, "epoch": 3112} {"train_loss": -6.684579849243164, "global_step": 130717, "epoch": 3112} {"train_loss": -6.615276336669922, "global_step": 130718, "epoch": 3112} {"train_loss": -6.683448314666748, "global_step": 130719, "epoch": 3112} {"train_loss": -6.612116813659668, "global_step": 130720, "epoch": 3112} {"train_loss": -6.597173690795898, "global_step": 130721, "epoch": 3112} {"train_loss": -6.6283721923828125, "global_step": 130722, "epoch": 3112} {"train_loss": -6.507385730743408, "global_step": 130723, "epoch": 3112} {"train_loss": -6.666059970855713, "global_step": 130724, "epoch": 3112} {"train_loss": -6.6409592628479, "global_step": 130725, "epoch": 3112} {"train_loss": -6.618355751037598, "global_step": 130726, "epoch": 3112} {"train_loss": -6.677388668060303, "global_step": 130727, "epoch": 3112} {"train_loss": -6.6566081047058105, "global_step": 130728, "epoch": 3112} {"train_loss": -6.607249736785889, "global_step": 130729, "epoch": 3112} {"train_loss": -6.573000907897949, "global_step": 130730, "epoch": 3112} {"train_loss": -6.723143577575684, "global_step": 130731, "epoch": 3112} {"train_loss": -6.674105644226074, "global_step": 130732, "epoch": 3112} {"train_loss": -6.708005428314209, "global_step": 130733, "epoch": 3112} {"train_loss": -6.649740219116211, "global_step": 130734, "epoch": 3112} {"train_loss": -6.701379776000977, "global_step": 130735, "epoch": 3112} {"train_loss": -6.6855340003967285, "global_step": 130736, "epoch": 3112} {"train_loss": -6.694547653198242, "global_step": 130737, "epoch": 3112} {"train_loss": -6.748068809509277, "global_step": 130738, "epoch": 3112} {"train_loss": -6.798771381378174, "global_step": 130739, "epoch": 3112} {"train_loss": -6.662846088409424, "global_step": 130740, "epoch": 3112} {"train_loss": -6.621640205383301, "global_step": 130741, "epoch": 3112} {"train_loss": -6.634731292724609, "global_step": 130742, "epoch": 3112} {"train_loss": -6.592537879943848, "global_step": 130743, "epoch": 3112} {"train_loss": -6.60942268371582, "global_step": 130744, "epoch": 3112} {"train_loss": -6.66410543805077, "global_step": 130745, "epoch": 3112, "val_loss": 77517.234375} {"train_loss": -6.691597938537598, "global_step": 130746, "epoch": 3113} {"train_loss": -6.610010623931885, "global_step": 130747, "epoch": 3113} {"train_loss": -6.673727512359619, "global_step": 130748, "epoch": 3113} {"train_loss": -6.6196160316467285, "global_step": 130749, "epoch": 3113} {"train_loss": -6.592633247375488, "global_step": 130750, "epoch": 3113} {"train_loss": -6.6260986328125, "global_step": 130751, "epoch": 3113} {"train_loss": -6.798244476318359, "global_step": 130752, "epoch": 3113} {"train_loss": -6.717230319976807, "global_step": 130753, "epoch": 3113} {"train_loss": -6.763162612915039, "global_step": 130754, "epoch": 3113} {"train_loss": -6.736241340637207, "global_step": 130755, "epoch": 3113} {"train_loss": -6.708324432373047, "global_step": 130756, "epoch": 3113} {"train_loss": -6.776535987854004, "global_step": 130757, "epoch": 3113} {"train_loss": -6.635631561279297, "global_step": 130758, "epoch": 3113} {"train_loss": -6.712543487548828, "global_step": 130759, "epoch": 3113} {"train_loss": -6.714969158172607, "global_step": 130760, "epoch": 3113} {"train_loss": -6.710984706878662, "global_step": 130761, "epoch": 3113} {"train_loss": -6.731393814086914, "global_step": 130762, "epoch": 3113} {"train_loss": -6.671001434326172, "global_step": 130763, "epoch": 3113} {"train_loss": -6.662111759185791, "global_step": 130764, "epoch": 3113} {"train_loss": -6.613680839538574, "global_step": 130765, "epoch": 3113} {"train_loss": -6.647315502166748, "global_step": 130766, "epoch": 3113} {"train_loss": -6.635516166687012, "global_step": 130767, "epoch": 3113} {"train_loss": -6.603863716125488, "global_step": 130768, "epoch": 3113} {"train_loss": -6.785198211669922, "global_step": 130769, "epoch": 3113} {"train_loss": -6.605074882507324, "global_step": 130770, "epoch": 3113} {"train_loss": -6.619235038757324, "global_step": 130771, "epoch": 3113} {"train_loss": -6.762905597686768, "global_step": 130772, "epoch": 3113} {"train_loss": -6.679076194763184, "global_step": 130773, "epoch": 3113} {"train_loss": -6.695287227630615, "global_step": 130774, "epoch": 3113} {"train_loss": -6.77949333190918, "global_step": 130775, "epoch": 3113} {"train_loss": -6.586308002471924, "global_step": 130776, "epoch": 3113} {"train_loss": -6.614742279052734, "global_step": 130777, "epoch": 3113} {"train_loss": -6.634746551513672, "global_step": 130778, "epoch": 3113} {"train_loss": -6.652963638305664, "global_step": 130779, "epoch": 3113} {"train_loss": -6.650003433227539, "global_step": 130780, "epoch": 3113} {"train_loss": -6.659521579742432, "global_step": 130781, "epoch": 3113} {"train_loss": -6.770133972167969, "global_step": 130782, "epoch": 3113} {"train_loss": -6.540509223937988, "global_step": 130783, "epoch": 3113} {"train_loss": -6.661792755126953, "global_step": 130784, "epoch": 3113} {"train_loss": -6.627557754516602, "global_step": 130785, "epoch": 3113} {"train_loss": -6.5796709060668945, "global_step": 130786, "epoch": 3113} {"train_loss": -6.668898695991153, "global_step": 130787, "epoch": 3113, "val_loss": 77267.4453125} {"train_loss": -6.7050580978393555, "global_step": 130788, "epoch": 3114} {"train_loss": -6.766305923461914, "global_step": 130789, "epoch": 3114} {"train_loss": -6.624942779541016, "global_step": 130790, "epoch": 3114} {"train_loss": -6.568864822387695, "global_step": 130791, "epoch": 3114} {"train_loss": -6.7544097900390625, "global_step": 130792, "epoch": 3114} {"train_loss": -6.679171085357666, "global_step": 130793, "epoch": 3114} {"train_loss": -6.6853485107421875, "global_step": 130794, "epoch": 3114} {"train_loss": -6.762577056884766, "global_step": 130795, "epoch": 3114} {"train_loss": -6.657444477081299, "global_step": 130796, "epoch": 3114} {"train_loss": -6.704164505004883, "global_step": 130797, "epoch": 3114} {"train_loss": -6.744329452514648, "global_step": 130798, "epoch": 3114} {"train_loss": -6.68400764465332, "global_step": 130799, "epoch": 3114} {"train_loss": -6.62802267074585, "global_step": 130800, "epoch": 3114} {"train_loss": -6.67911434173584, "global_step": 130801, "epoch": 3114} {"train_loss": -6.615799427032471, "global_step": 130802, "epoch": 3114} {"train_loss": -6.661089897155762, "global_step": 130803, "epoch": 3114} {"train_loss": -6.576421737670898, "global_step": 130804, "epoch": 3114} {"train_loss": -6.596170902252197, "global_step": 130805, "epoch": 3114} {"train_loss": -6.698678970336914, "global_step": 130806, "epoch": 3114} {"train_loss": -6.6731672286987305, "global_step": 130807, "epoch": 3114} {"train_loss": -6.685649871826172, "global_step": 130808, "epoch": 3114} {"train_loss": -6.674344062805176, "global_step": 130809, "epoch": 3114} {"train_loss": -6.670308589935303, "global_step": 130810, "epoch": 3114} {"train_loss": -6.578211784362793, "global_step": 130811, "epoch": 3114} {"train_loss": -6.62936544418335, "global_step": 130812, "epoch": 3114} {"train_loss": -6.638278961181641, "global_step": 130813, "epoch": 3114} {"train_loss": -6.691973686218262, "global_step": 130814, "epoch": 3114} {"train_loss": -6.526434898376465, "global_step": 130815, "epoch": 3114} {"train_loss": -6.5911054611206055, "global_step": 130816, "epoch": 3114} {"train_loss": -6.6600799560546875, "global_step": 130817, "epoch": 3114} {"train_loss": -6.568685531616211, "global_step": 130818, "epoch": 3114} {"train_loss": -6.552972793579102, "global_step": 130819, "epoch": 3114} {"train_loss": -6.665388107299805, "global_step": 130820, "epoch": 3114} {"train_loss": -6.583861351013184, "global_step": 130821, "epoch": 3114} {"train_loss": -6.721492767333984, "global_step": 130822, "epoch": 3114} {"train_loss": -6.635745048522949, "global_step": 130823, "epoch": 3114} {"train_loss": -6.6846513748168945, "global_step": 130824, "epoch": 3114} {"train_loss": -6.717494487762451, "global_step": 130825, "epoch": 3114} {"train_loss": -6.519646644592285, "global_step": 130826, "epoch": 3114} {"train_loss": -6.793391227722168, "global_step": 130827, "epoch": 3114} {"train_loss": -6.547286033630371, "global_step": 130828, "epoch": 3114} {"train_loss": -6.6502184981391546, "global_step": 130829, "epoch": 3114, "val_loss": 77348.4296875} {"train_loss": -6.5662078857421875, "global_step": 130830, "epoch": 3115} {"train_loss": -6.533714294433594, "global_step": 130831, "epoch": 3115} {"train_loss": -6.549740791320801, "global_step": 130832, "epoch": 3115} {"train_loss": -6.6477484703063965, "global_step": 130833, "epoch": 3115} {"train_loss": -6.612161636352539, "global_step": 130834, "epoch": 3115} {"train_loss": -6.5456862449646, "global_step": 130835, "epoch": 3115} {"train_loss": -6.721238136291504, "global_step": 130836, "epoch": 3115} {"train_loss": -6.564945220947266, "global_step": 130837, "epoch": 3115} {"train_loss": -6.742773056030273, "global_step": 130838, "epoch": 3115} {"train_loss": -6.541814804077148, "global_step": 130839, "epoch": 3115} {"train_loss": -6.749563694000244, "global_step": 130840, "epoch": 3115} {"train_loss": -6.636211395263672, "global_step": 130841, "epoch": 3115} {"train_loss": -6.677945137023926, "global_step": 130842, "epoch": 3115} {"train_loss": -6.618402481079102, "global_step": 130843, "epoch": 3115} {"train_loss": -6.631854057312012, "global_step": 130844, "epoch": 3115} {"train_loss": -6.539732933044434, "global_step": 130845, "epoch": 3115} {"train_loss": -6.6429362297058105, "global_step": 130846, "epoch": 3115} {"train_loss": -6.757574558258057, "global_step": 130847, "epoch": 3115} {"train_loss": -6.636289119720459, "global_step": 130848, "epoch": 3115} {"train_loss": -6.728200912475586, "global_step": 130849, "epoch": 3115} {"train_loss": -6.789710521697998, "global_step": 130850, "epoch": 3115} {"train_loss": -6.752103805541992, "global_step": 130851, "epoch": 3115} {"train_loss": -6.657538414001465, "global_step": 130852, "epoch": 3115} {"train_loss": -6.665139198303223, "global_step": 130853, "epoch": 3115} {"train_loss": -6.6790266036987305, "global_step": 130854, "epoch": 3115} {"train_loss": -6.736017227172852, "global_step": 130855, "epoch": 3115} {"train_loss": -6.719171524047852, "global_step": 130856, "epoch": 3115} {"train_loss": -6.613462448120117, "global_step": 130857, "epoch": 3115} {"train_loss": -6.757295608520508, "global_step": 130858, "epoch": 3115} {"train_loss": -6.712680816650391, "global_step": 130859, "epoch": 3115} {"train_loss": -6.606539726257324, "global_step": 130860, "epoch": 3115} {"train_loss": -6.709493637084961, "global_step": 130861, "epoch": 3115} {"train_loss": -6.673091888427734, "global_step": 130862, "epoch": 3115} {"train_loss": -6.60028076171875, "global_step": 130863, "epoch": 3115} {"train_loss": -6.67958402633667, "global_step": 130864, "epoch": 3115} {"train_loss": -6.518741607666016, "global_step": 130865, "epoch": 3115} {"train_loss": -6.716449737548828, "global_step": 130866, "epoch": 3115} {"train_loss": -6.604434013366699, "global_step": 130867, "epoch": 3115} {"train_loss": -6.666395664215088, "global_step": 130868, "epoch": 3115} {"train_loss": -6.683793067932129, "global_step": 130869, "epoch": 3115} {"train_loss": -6.637580871582031, "global_step": 130870, "epoch": 3115} {"train_loss": -6.65429475193932, "global_step": 130871, "epoch": 3115, "val_loss": 77437.46875} {"train_loss": -6.663732051849365, "global_step": 130872, "epoch": 3116} {"train_loss": -6.686191558837891, "global_step": 130873, "epoch": 3116} {"train_loss": -6.621563911437988, "global_step": 130874, "epoch": 3116} {"train_loss": -6.742291450500488, "global_step": 130875, "epoch": 3116} {"train_loss": -6.6578569412231445, "global_step": 130876, "epoch": 3116} {"train_loss": -6.609963893890381, "global_step": 130877, "epoch": 3116} {"train_loss": -6.591703414916992, "global_step": 130878, "epoch": 3116} {"train_loss": -6.752518653869629, "global_step": 130879, "epoch": 3116} {"train_loss": -6.664017200469971, "global_step": 130880, "epoch": 3116} {"train_loss": -6.881323337554932, "global_step": 130881, "epoch": 3116} {"train_loss": -6.731256484985352, "global_step": 130882, "epoch": 3116} {"train_loss": -6.7359209060668945, "global_step": 130883, "epoch": 3116} {"train_loss": -6.6440629959106445, "global_step": 130884, "epoch": 3116} {"train_loss": -6.6927690505981445, "global_step": 130885, "epoch": 3116} {"train_loss": -6.640443801879883, "global_step": 130886, "epoch": 3116} {"train_loss": -6.82868766784668, "global_step": 130887, "epoch": 3116} {"train_loss": -6.62822961807251, "global_step": 130888, "epoch": 3116} {"train_loss": -6.692450523376465, "global_step": 130889, "epoch": 3116} {"train_loss": -6.750554084777832, "global_step": 130890, "epoch": 3116} {"train_loss": -6.754208087921143, "global_step": 130891, "epoch": 3116} {"train_loss": -6.673741340637207, "global_step": 130892, "epoch": 3116} {"train_loss": -6.654971599578857, "global_step": 130893, "epoch": 3116} {"train_loss": -6.661823272705078, "global_step": 130894, "epoch": 3116} {"train_loss": -6.669135093688965, "global_step": 130895, "epoch": 3116} {"train_loss": -6.7513322830200195, "global_step": 130896, "epoch": 3116} {"train_loss": -6.55666446685791, "global_step": 130897, "epoch": 3116} {"train_loss": -6.677906036376953, "global_step": 130898, "epoch": 3116} {"train_loss": -6.808671951293945, "global_step": 130899, "epoch": 3116} {"train_loss": -6.679027557373047, "global_step": 130900, "epoch": 3116} {"train_loss": -6.62995719909668, "global_step": 130901, "epoch": 3116} {"train_loss": -6.660138130187988, "global_step": 130902, "epoch": 3116} {"train_loss": -6.5810980796813965, "global_step": 130903, "epoch": 3116} {"train_loss": -6.643531799316406, "global_step": 130904, "epoch": 3116} {"train_loss": -6.659446716308594, "global_step": 130905, "epoch": 3116} {"train_loss": -6.730984687805176, "global_step": 130906, "epoch": 3116} {"train_loss": -6.704697608947754, "global_step": 130907, "epoch": 3116} {"train_loss": -6.708451747894287, "global_step": 130908, "epoch": 3116} {"train_loss": -6.621379852294922, "global_step": 130909, "epoch": 3116} {"train_loss": -6.593899250030518, "global_step": 130910, "epoch": 3116} {"train_loss": -6.744583606719971, "global_step": 130911, "epoch": 3116} {"train_loss": -6.580129623413086, "global_step": 130912, "epoch": 3116} {"train_loss": -6.681196087882633, "global_step": 130913, "epoch": 3116, "val_loss": 77122.4765625} {"train_loss": -6.675580024719238, "global_step": 130914, "epoch": 3117} {"train_loss": -6.720837593078613, "global_step": 130915, "epoch": 3117} {"train_loss": -6.6779632568359375, "global_step": 130916, "epoch": 3117} {"train_loss": -6.647151947021484, "global_step": 130917, "epoch": 3117} {"train_loss": -6.651040077209473, "global_step": 130918, "epoch": 3117} {"train_loss": -6.69748067855835, "global_step": 130919, "epoch": 3117} {"train_loss": -6.695187568664551, "global_step": 130920, "epoch": 3117} {"train_loss": -6.796812057495117, "global_step": 130921, "epoch": 3117} {"train_loss": -6.603542327880859, "global_step": 130922, "epoch": 3117} {"train_loss": -6.6792988777160645, "global_step": 130923, "epoch": 3117} {"train_loss": -6.697702407836914, "global_step": 130924, "epoch": 3117} {"train_loss": -6.690371036529541, "global_step": 130925, "epoch": 3117} {"train_loss": -6.636410713195801, "global_step": 130926, "epoch": 3117} {"train_loss": -6.522151947021484, "global_step": 130927, "epoch": 3117} {"train_loss": -6.476469993591309, "global_step": 130928, "epoch": 3117} {"train_loss": -6.556056976318359, "global_step": 130929, "epoch": 3117} {"train_loss": -6.4992475509643555, "global_step": 130930, "epoch": 3117} {"train_loss": -6.588939666748047, "global_step": 130931, "epoch": 3117} {"train_loss": -6.676361560821533, "global_step": 130932, "epoch": 3117} {"train_loss": -6.6286187171936035, "global_step": 130933, "epoch": 3117} {"train_loss": -6.597205638885498, "global_step": 130934, "epoch": 3117} {"train_loss": -6.614454746246338, "global_step": 130935, "epoch": 3117} {"train_loss": -6.703880310058594, "global_step": 130936, "epoch": 3117} {"train_loss": -6.579326629638672, "global_step": 130937, "epoch": 3117} {"train_loss": -6.708084583282471, "global_step": 130938, "epoch": 3117} {"train_loss": -6.5704779624938965, "global_step": 130939, "epoch": 3117} {"train_loss": -6.731951713562012, "global_step": 130940, "epoch": 3117} {"train_loss": -6.558855056762695, "global_step": 130941, "epoch": 3117} {"train_loss": -6.61872673034668, "global_step": 130942, "epoch": 3117} {"train_loss": -6.651155948638916, "global_step": 130943, "epoch": 3117} {"train_loss": -6.609370708465576, "global_step": 130944, "epoch": 3117} {"train_loss": -6.608789443969727, "global_step": 130945, "epoch": 3117} {"train_loss": -6.604763984680176, "global_step": 130946, "epoch": 3117} {"train_loss": -6.553444862365723, "global_step": 130947, "epoch": 3117} {"train_loss": -6.658275604248047, "global_step": 130948, "epoch": 3117} {"train_loss": -6.612597942352295, "global_step": 130949, "epoch": 3117} {"train_loss": -6.68619441986084, "global_step": 130950, "epoch": 3117} {"train_loss": -6.704694747924805, "global_step": 130951, "epoch": 3117} {"train_loss": -6.6520490646362305, "global_step": 130952, "epoch": 3117} {"train_loss": -6.626293182373047, "global_step": 130953, "epoch": 3117} {"train_loss": -6.725093841552734, "global_step": 130954, "epoch": 3117} {"train_loss": -6.640134993053618, "global_step": 130955, "epoch": 3117, "val_loss": 77459.9609375} {"train_loss": -6.540914058685303, "global_step": 130956, "epoch": 3118} {"train_loss": -6.643636703491211, "global_step": 130957, "epoch": 3118} {"train_loss": -6.706045627593994, "global_step": 130958, "epoch": 3118} {"train_loss": -6.640351295471191, "global_step": 130959, "epoch": 3118} {"train_loss": -6.653059005737305, "global_step": 130960, "epoch": 3118} {"train_loss": -6.541301727294922, "global_step": 130961, "epoch": 3118} {"train_loss": -6.720392227172852, "global_step": 130962, "epoch": 3118} {"train_loss": -6.5608367919921875, "global_step": 130963, "epoch": 3118} {"train_loss": -6.581516265869141, "global_step": 130964, "epoch": 3118} {"train_loss": -6.684787750244141, "global_step": 130965, "epoch": 3118} {"train_loss": -6.652177810668945, "global_step": 130966, "epoch": 3118} {"train_loss": -6.640663146972656, "global_step": 130967, "epoch": 3118} {"train_loss": -6.607484817504883, "global_step": 130968, "epoch": 3118} {"train_loss": -6.614077091217041, "global_step": 130969, "epoch": 3118} {"train_loss": -6.821237564086914, "global_step": 130970, "epoch": 3118} {"train_loss": -6.625385761260986, "global_step": 130971, "epoch": 3118} {"train_loss": -6.594452857971191, "global_step": 130972, "epoch": 3118} {"train_loss": -6.507831573486328, "global_step": 130973, "epoch": 3118} {"train_loss": -6.583453178405762, "global_step": 130974, "epoch": 3118} {"train_loss": -6.5985918045043945, "global_step": 130975, "epoch": 3118} {"train_loss": -6.637417316436768, "global_step": 130976, "epoch": 3118} {"train_loss": -6.640658378601074, "global_step": 130977, "epoch": 3118} {"train_loss": -6.512392997741699, "global_step": 130978, "epoch": 3118} {"train_loss": -6.6680378913879395, "global_step": 130979, "epoch": 3118} {"train_loss": -6.536927223205566, "global_step": 130980, "epoch": 3118} {"train_loss": -6.638448238372803, "global_step": 130981, "epoch": 3118} {"train_loss": -6.593667030334473, "global_step": 130982, "epoch": 3118} {"train_loss": -6.502117156982422, "global_step": 130983, "epoch": 3118} {"train_loss": -6.707817077636719, "global_step": 130984, "epoch": 3118} {"train_loss": -6.664461135864258, "global_step": 130985, "epoch": 3118} {"train_loss": -6.59505558013916, "global_step": 130986, "epoch": 3118} {"train_loss": -6.529742240905762, "global_step": 130987, "epoch": 3118} {"train_loss": -6.648561477661133, "global_step": 130988, "epoch": 3118} {"train_loss": -6.660442352294922, "global_step": 130989, "epoch": 3118} {"train_loss": -6.6946821212768555, "global_step": 130990, "epoch": 3118} {"train_loss": -6.818270683288574, "global_step": 130991, "epoch": 3118} {"train_loss": -6.683940887451172, "global_step": 130992, "epoch": 3118} {"train_loss": -6.533646583557129, "global_step": 130993, "epoch": 3118} {"train_loss": -6.602556228637695, "global_step": 130994, "epoch": 3118} {"train_loss": -6.761025428771973, "global_step": 130995, "epoch": 3118} {"train_loss": -6.687768936157227, "global_step": 130996, "epoch": 3118} {"train_loss": -6.630339736030216, "global_step": 130997, "epoch": 3118, "val_loss": 77650.4140625} {"train_loss": -6.827661514282227, "global_step": 130998, "epoch": 3119} {"train_loss": -6.700564384460449, "global_step": 130999, "epoch": 3119} {"train_loss": -6.714517116546631, "global_step": 131000, "epoch": 3119} {"train_loss": -6.718386173248291, "global_step": 131001, "epoch": 3119} {"train_loss": -6.7927093505859375, "global_step": 131002, "epoch": 3119} {"train_loss": -6.6867780685424805, "global_step": 131003, "epoch": 3119} {"train_loss": -6.768437385559082, "global_step": 131004, "epoch": 3119} {"train_loss": -6.757528305053711, "global_step": 131005, "epoch": 3119} {"train_loss": -6.729581832885742, "global_step": 131006, "epoch": 3119} {"train_loss": -6.634961128234863, "global_step": 131007, "epoch": 3119} {"train_loss": -6.692867279052734, "global_step": 131008, "epoch": 3119} {"train_loss": -6.706993103027344, "global_step": 131009, "epoch": 3119} {"train_loss": -6.592756271362305, "global_step": 131010, "epoch": 3119} {"train_loss": -6.855623722076416, "global_step": 131011, "epoch": 3119} {"train_loss": -6.681423187255859, "global_step": 131012, "epoch": 3119} {"train_loss": -6.611120223999023, "global_step": 131013, "epoch": 3119} {"train_loss": -6.708038806915283, "global_step": 131014, "epoch": 3119} {"train_loss": -6.637936592102051, "global_step": 131015, "epoch": 3119} {"train_loss": -6.642735004425049, "global_step": 131016, "epoch": 3119} {"train_loss": -6.785677909851074, "global_step": 131017, "epoch": 3119} {"train_loss": -6.667712211608887, "global_step": 131018, "epoch": 3119} {"train_loss": -6.703826904296875, "global_step": 131019, "epoch": 3119} {"train_loss": -6.665491104125977, "global_step": 131020, "epoch": 3119} {"train_loss": -6.797900199890137, "global_step": 131021, "epoch": 3119} {"train_loss": -6.647670745849609, "global_step": 131022, "epoch": 3119} {"train_loss": -6.796430587768555, "global_step": 131023, "epoch": 3119} {"train_loss": -6.698021411895752, "global_step": 131024, "epoch": 3119} {"train_loss": -6.717524528503418, "global_step": 131025, "epoch": 3119} {"train_loss": -6.607704162597656, "global_step": 131026, "epoch": 3119} {"train_loss": -6.688923358917236, "global_step": 131027, "epoch": 3119} {"train_loss": -6.610211372375488, "global_step": 131028, "epoch": 3119} {"train_loss": -6.7509660720825195, "global_step": 131029, "epoch": 3119} {"train_loss": -6.585563659667969, "global_step": 131030, "epoch": 3119} {"train_loss": -6.665882110595703, "global_step": 131031, "epoch": 3119} {"train_loss": -6.702824115753174, "global_step": 131032, "epoch": 3119} {"train_loss": -6.64116096496582, "global_step": 131033, "epoch": 3119} {"train_loss": -6.6083598136901855, "global_step": 131034, "epoch": 3119} {"train_loss": -6.733985900878906, "global_step": 131035, "epoch": 3119} {"train_loss": -6.532896041870117, "global_step": 131036, "epoch": 3119} {"train_loss": -6.6050944328308105, "global_step": 131037, "epoch": 3119} {"train_loss": -6.659117221832275, "global_step": 131038, "epoch": 3119} {"train_loss": -6.689637059257144, "global_step": 131039, "epoch": 3119, "val_loss": 77530.2578125} {"train_loss": -6.599386215209961, "global_step": 131040, "epoch": 3120} {"train_loss": -6.749965667724609, "global_step": 131041, "epoch": 3120} {"train_loss": -6.747485160827637, "global_step": 131042, "epoch": 3120} {"train_loss": -6.748587608337402, "global_step": 131043, "epoch": 3120} {"train_loss": -6.664630889892578, "global_step": 131044, "epoch": 3120} {"train_loss": -6.669455051422119, "global_step": 131045, "epoch": 3120} {"train_loss": -6.738640785217285, "global_step": 131046, "epoch": 3120} {"train_loss": -6.588242530822754, "global_step": 131047, "epoch": 3120} {"train_loss": -6.752157211303711, "global_step": 131048, "epoch": 3120} {"train_loss": -6.796909332275391, "global_step": 131049, "epoch": 3120} {"train_loss": -6.8516364097595215, "global_step": 131050, "epoch": 3120} {"train_loss": -6.635837078094482, "global_step": 131051, "epoch": 3120} {"train_loss": -6.764500141143799, "global_step": 131052, "epoch": 3120} {"train_loss": -6.84116268157959, "global_step": 131053, "epoch": 3120} {"train_loss": -6.703239440917969, "global_step": 131054, "epoch": 3120} {"train_loss": -6.595025062561035, "global_step": 131055, "epoch": 3120} {"train_loss": -6.7094902992248535, "global_step": 131056, "epoch": 3120} {"train_loss": -6.485067367553711, "global_step": 131057, "epoch": 3120} {"train_loss": -6.618154525756836, "global_step": 131058, "epoch": 3120} {"train_loss": -6.630454063415527, "global_step": 131059, "epoch": 3120} {"train_loss": -6.593023300170898, "global_step": 131060, "epoch": 3120} {"train_loss": -6.736259460449219, "global_step": 131061, "epoch": 3120} {"train_loss": -6.4274163246154785, "global_step": 131062, "epoch": 3120} {"train_loss": -6.599450588226318, "global_step": 131063, "epoch": 3120} {"train_loss": -6.750502109527588, "global_step": 131064, "epoch": 3120} {"train_loss": -6.676906585693359, "global_step": 131065, "epoch": 3120} {"train_loss": -6.634253978729248, "global_step": 131066, "epoch": 3120} {"train_loss": -6.729016304016113, "global_step": 131067, "epoch": 3120} {"train_loss": -6.618369102478027, "global_step": 131068, "epoch": 3120} {"train_loss": -6.559792995452881, "global_step": 131069, "epoch": 3120} {"train_loss": -6.752072334289551, "global_step": 131070, "epoch": 3120} {"train_loss": -6.428122520446777, "global_step": 131071, "epoch": 3120} {"train_loss": -6.532912731170654, "global_step": 131072, "epoch": 3120} {"train_loss": -6.639749050140381, "global_step": 131073, "epoch": 3120} {"train_loss": -6.548227787017822, "global_step": 131074, "epoch": 3120} {"train_loss": -6.651111602783203, "global_step": 131075, "epoch": 3120} {"train_loss": -6.590866565704346, "global_step": 131076, "epoch": 3120} {"train_loss": -6.620174884796143, "global_step": 131077, "epoch": 3120} {"train_loss": -6.553318500518799, "global_step": 131078, "epoch": 3120} {"train_loss": -6.786162376403809, "global_step": 131079, "epoch": 3120} {"train_loss": -6.75611686706543, "global_step": 131080, "epoch": 3120} {"train_loss": -6.661139227095104, "global_step": 131081, "epoch": 3120, "val_loss": 77635.0390625} {"train_loss": -6.711576461791992, "global_step": 131082, "epoch": 3121} {"train_loss": -6.685715675354004, "global_step": 131083, "epoch": 3121} {"train_loss": -6.7332658767700195, "global_step": 131084, "epoch": 3121} {"train_loss": -6.732690334320068, "global_step": 131085, "epoch": 3121} {"train_loss": -6.6902337074279785, "global_step": 131086, "epoch": 3121} {"train_loss": -6.696418762207031, "global_step": 131087, "epoch": 3121} {"train_loss": -6.622743606567383, "global_step": 131088, "epoch": 3121} {"train_loss": -6.795290946960449, "global_step": 131089, "epoch": 3121} {"train_loss": -6.676780700683594, "global_step": 131090, "epoch": 3121} {"train_loss": -6.744997501373291, "global_step": 131091, "epoch": 3121} {"train_loss": -6.816899299621582, "global_step": 131092, "epoch": 3121} {"train_loss": -6.644872665405273, "global_step": 131093, "epoch": 3121} {"train_loss": -6.87043571472168, "global_step": 131094, "epoch": 3121} {"train_loss": -6.780699729919434, "global_step": 131095, "epoch": 3121} {"train_loss": -6.733547210693359, "global_step": 131096, "epoch": 3121} {"train_loss": -6.835474967956543, "global_step": 131097, "epoch": 3121} {"train_loss": -6.757864475250244, "global_step": 131098, "epoch": 3121} {"train_loss": -6.699286460876465, "global_step": 131099, "epoch": 3121} {"train_loss": -6.755249977111816, "global_step": 131100, "epoch": 3121} {"train_loss": -6.482449531555176, "global_step": 131101, "epoch": 3121} {"train_loss": -6.642592430114746, "global_step": 131102, "epoch": 3121} {"train_loss": -6.585538864135742, "global_step": 131103, "epoch": 3121} {"train_loss": -6.654253005981445, "global_step": 131104, "epoch": 3121} {"train_loss": -6.633393287658691, "global_step": 131105, "epoch": 3121} {"train_loss": -6.676469802856445, "global_step": 131106, "epoch": 3121} {"train_loss": -6.566659450531006, "global_step": 131107, "epoch": 3121} {"train_loss": -6.667594909667969, "global_step": 131108, "epoch": 3121} {"train_loss": -6.644414901733398, "global_step": 131109, "epoch": 3121} {"train_loss": -6.730791091918945, "global_step": 131110, "epoch": 3121} {"train_loss": -6.629327774047852, "global_step": 131111, "epoch": 3121} {"train_loss": -6.604342460632324, "global_step": 131112, "epoch": 3121} {"train_loss": -6.761031627655029, "global_step": 131113, "epoch": 3121} {"train_loss": -6.585209369659424, "global_step": 131114, "epoch": 3121} {"train_loss": -6.701879978179932, "global_step": 131115, "epoch": 3121} {"train_loss": -6.607863426208496, "global_step": 131116, "epoch": 3121} {"train_loss": -6.579868316650391, "global_step": 131117, "epoch": 3121} {"train_loss": -6.511240005493164, "global_step": 131118, "epoch": 3121} {"train_loss": -6.563297271728516, "global_step": 131119, "epoch": 3121} {"train_loss": -6.6858367919921875, "global_step": 131120, "epoch": 3121} {"train_loss": -6.654201984405518, "global_step": 131121, "epoch": 3121} {"train_loss": -6.629837989807129, "global_step": 131122, "epoch": 3121} {"train_loss": -6.67589012781779, "global_step": 131123, "epoch": 3121, "val_loss": 77584.7578125} {"train_loss": -6.812638282775879, "global_step": 131124, "epoch": 3122} {"train_loss": -6.554596900939941, "global_step": 131125, "epoch": 3122} {"train_loss": -6.738798141479492, "global_step": 131126, "epoch": 3122} {"train_loss": -6.773678302764893, "global_step": 131127, "epoch": 3122} {"train_loss": -6.718832015991211, "global_step": 131128, "epoch": 3122} {"train_loss": -6.714974403381348, "global_step": 131129, "epoch": 3122} {"train_loss": -6.735309600830078, "global_step": 131130, "epoch": 3122} {"train_loss": -6.667726039886475, "global_step": 131131, "epoch": 3122} {"train_loss": -6.6729230880737305, "global_step": 131132, "epoch": 3122} {"train_loss": -6.718678951263428, "global_step": 131133, "epoch": 3122} {"train_loss": -6.689147472381592, "global_step": 131134, "epoch": 3122} {"train_loss": -6.630992889404297, "global_step": 131135, "epoch": 3122} {"train_loss": -6.705724716186523, "global_step": 131136, "epoch": 3122} {"train_loss": -6.697040557861328, "global_step": 131137, "epoch": 3122} {"train_loss": -6.66904354095459, "global_step": 131138, "epoch": 3122} {"train_loss": -6.736464977264404, "global_step": 131139, "epoch": 3122} {"train_loss": -6.58122444152832, "global_step": 131140, "epoch": 3122} {"train_loss": -6.857365608215332, "global_step": 131141, "epoch": 3122} {"train_loss": -6.675480365753174, "global_step": 131142, "epoch": 3122} {"train_loss": -6.709676265716553, "global_step": 131143, "epoch": 3122} {"train_loss": -6.6356964111328125, "global_step": 131144, "epoch": 3122} {"train_loss": -6.7495574951171875, "global_step": 131145, "epoch": 3122} {"train_loss": -6.7214884757995605, "global_step": 131146, "epoch": 3122} {"train_loss": -6.674062728881836, "global_step": 131147, "epoch": 3122} {"train_loss": -6.7786407470703125, "global_step": 131148, "epoch": 3122} {"train_loss": -6.712723731994629, "global_step": 131149, "epoch": 3122} {"train_loss": -6.769977569580078, "global_step": 131150, "epoch": 3122} {"train_loss": -6.735041618347168, "global_step": 131151, "epoch": 3122} {"train_loss": -6.685576438903809, "global_step": 131152, "epoch": 3122} {"train_loss": -6.6913743019104, "global_step": 131153, "epoch": 3122} {"train_loss": -6.629139423370361, "global_step": 131154, "epoch": 3122} {"train_loss": -6.745627403259277, "global_step": 131155, "epoch": 3122} {"train_loss": -6.625026702880859, "global_step": 131156, "epoch": 3122} {"train_loss": -6.693535327911377, "global_step": 131157, "epoch": 3122} {"train_loss": -6.652954578399658, "global_step": 131158, "epoch": 3122} {"train_loss": -6.750921726226807, "global_step": 131159, "epoch": 3122} {"train_loss": -6.66722297668457, "global_step": 131160, "epoch": 3122} {"train_loss": -6.601891040802002, "global_step": 131161, "epoch": 3122} {"train_loss": -6.626079559326172, "global_step": 131162, "epoch": 3122} {"train_loss": -6.729589462280273, "global_step": 131163, "epoch": 3122} {"train_loss": -6.716313362121582, "global_step": 131164, "epoch": 3122} {"train_loss": -6.695457276843843, "global_step": 131165, "epoch": 3122, "val_loss": 77651.4765625} {"train_loss": -6.598005294799805, "global_step": 131166, "epoch": 3123} {"train_loss": -6.784449577331543, "global_step": 131167, "epoch": 3123} {"train_loss": -6.602263450622559, "global_step": 131168, "epoch": 3123} {"train_loss": -6.612906455993652, "global_step": 131169, "epoch": 3123} {"train_loss": -6.741303443908691, "global_step": 131170, "epoch": 3123} {"train_loss": -6.669012069702148, "global_step": 131171, "epoch": 3123} {"train_loss": -6.700993537902832, "global_step": 131172, "epoch": 3123} {"train_loss": -6.658730983734131, "global_step": 131173, "epoch": 3123} {"train_loss": -6.429330348968506, "global_step": 131174, "epoch": 3123} {"train_loss": -6.751803398132324, "global_step": 131175, "epoch": 3123} {"train_loss": -6.70263671875, "global_step": 131176, "epoch": 3123} {"train_loss": -6.621293067932129, "global_step": 131177, "epoch": 3123} {"train_loss": -6.626925468444824, "global_step": 131178, "epoch": 3123} {"train_loss": -6.685909271240234, "global_step": 131179, "epoch": 3123} {"train_loss": -6.678735256195068, "global_step": 131180, "epoch": 3123} {"train_loss": -6.757964134216309, "global_step": 131181, "epoch": 3123} {"train_loss": -6.563345909118652, "global_step": 131182, "epoch": 3123} {"train_loss": -6.911224365234375, "global_step": 131183, "epoch": 3123} {"train_loss": -6.744387626647949, "global_step": 131184, "epoch": 3123} {"train_loss": -6.633103370666504, "global_step": 131185, "epoch": 3123} {"train_loss": -6.8424177169799805, "global_step": 131186, "epoch": 3123} {"train_loss": -6.707808971405029, "global_step": 131187, "epoch": 3123} {"train_loss": -6.711310386657715, "global_step": 131188, "epoch": 3123} {"train_loss": -6.619931221008301, "global_step": 131189, "epoch": 3123} {"train_loss": -6.718588829040527, "global_step": 131190, "epoch": 3123} {"train_loss": -6.683403015136719, "global_step": 131191, "epoch": 3123} {"train_loss": -6.682065963745117, "global_step": 131192, "epoch": 3123} {"train_loss": -6.690659523010254, "global_step": 131193, "epoch": 3123} {"train_loss": -6.704904556274414, "global_step": 131194, "epoch": 3123} {"train_loss": -6.6150221824646, "global_step": 131195, "epoch": 3123} {"train_loss": -6.724600791931152, "global_step": 131196, "epoch": 3123} {"train_loss": -6.704580307006836, "global_step": 131197, "epoch": 3123} {"train_loss": -6.653469085693359, "global_step": 131198, "epoch": 3123} {"train_loss": -6.764215469360352, "global_step": 131199, "epoch": 3123} {"train_loss": -6.805995941162109, "global_step": 131200, "epoch": 3123} {"train_loss": -6.645366668701172, "global_step": 131201, "epoch": 3123} {"train_loss": -6.488920211791992, "global_step": 131202, "epoch": 3123} {"train_loss": -6.598850250244141, "global_step": 131203, "epoch": 3123} {"train_loss": -6.725170135498047, "global_step": 131204, "epoch": 3123} {"train_loss": -6.670514106750488, "global_step": 131205, "epoch": 3123} {"train_loss": -6.717100620269775, "global_step": 131206, "epoch": 3123} {"train_loss": -6.68151144754319, "global_step": 131207, "epoch": 3123, "val_loss": 77475.8125} {"train_loss": -6.738045692443848, "global_step": 131208, "epoch": 3124} {"train_loss": -6.752185821533203, "global_step": 131209, "epoch": 3124} {"train_loss": -6.782651424407959, "global_step": 131210, "epoch": 3124} {"train_loss": -6.60701847076416, "global_step": 131211, "epoch": 3124} {"train_loss": -6.701539039611816, "global_step": 131212, "epoch": 3124} {"train_loss": -6.630866050720215, "global_step": 131213, "epoch": 3124} {"train_loss": -6.618992805480957, "global_step": 131214, "epoch": 3124} {"train_loss": -6.6629557609558105, "global_step": 131215, "epoch": 3124} {"train_loss": -6.5819501876831055, "global_step": 131216, "epoch": 3124} {"train_loss": -6.472192287445068, "global_step": 131217, "epoch": 3124} {"train_loss": -6.641057968139648, "global_step": 131218, "epoch": 3124} {"train_loss": -6.627108573913574, "global_step": 131219, "epoch": 3124} {"train_loss": -6.594176292419434, "global_step": 131220, "epoch": 3124} {"train_loss": -6.695138931274414, "global_step": 131221, "epoch": 3124} {"train_loss": -6.526430130004883, "global_step": 131222, "epoch": 3124} {"train_loss": -6.661499977111816, "global_step": 131223, "epoch": 3124} {"train_loss": -6.76695442199707, "global_step": 131224, "epoch": 3124} {"train_loss": -6.690179824829102, "global_step": 131225, "epoch": 3124} {"train_loss": -6.607577323913574, "global_step": 131226, "epoch": 3124} {"train_loss": -6.648983955383301, "global_step": 131227, "epoch": 3124} {"train_loss": -6.635401725769043, "global_step": 131228, "epoch": 3124} {"train_loss": -6.61331844329834, "global_step": 131229, "epoch": 3124} {"train_loss": -6.616644859313965, "global_step": 131230, "epoch": 3124} {"train_loss": -6.627772808074951, "global_step": 131231, "epoch": 3124} {"train_loss": -6.714934349060059, "global_step": 131232, "epoch": 3124} {"train_loss": -6.623597145080566, "global_step": 131233, "epoch": 3124} {"train_loss": -6.610928058624268, "global_step": 131234, "epoch": 3124} {"train_loss": -6.752086162567139, "global_step": 131235, "epoch": 3124} {"train_loss": -6.631768226623535, "global_step": 131236, "epoch": 3124} {"train_loss": -6.611209392547607, "global_step": 131237, "epoch": 3124} {"train_loss": -6.691990375518799, "global_step": 131238, "epoch": 3124} {"train_loss": -6.638160228729248, "global_step": 131239, "epoch": 3124} {"train_loss": -6.615385055541992, "global_step": 131240, "epoch": 3124} {"train_loss": -6.613780975341797, "global_step": 131241, "epoch": 3124} {"train_loss": -6.606749534606934, "global_step": 131242, "epoch": 3124} {"train_loss": -6.614784240722656, "global_step": 131243, "epoch": 3124} {"train_loss": -6.709547996520996, "global_step": 131244, "epoch": 3124} {"train_loss": -6.541567802429199, "global_step": 131245, "epoch": 3124} {"train_loss": -6.580329418182373, "global_step": 131246, "epoch": 3124} {"train_loss": -6.6965742111206055, "global_step": 131247, "epoch": 3124} {"train_loss": -6.505921363830566, "global_step": 131248, "epoch": 3124} {"train_loss": -6.6428387732732865, "global_step": 131249, "epoch": 3124, "val_loss": 77653.421875} {"train_loss": -6.5574164390563965, "global_step": 131250, "epoch": 3125} {"train_loss": -6.600530624389648, "global_step": 131251, "epoch": 3125} {"train_loss": -6.640305995941162, "global_step": 131252, "epoch": 3125} {"train_loss": -6.405632019042969, "global_step": 131253, "epoch": 3125} {"train_loss": -6.659636497497559, "global_step": 131254, "epoch": 3125} {"train_loss": -6.641578674316406, "global_step": 131255, "epoch": 3125} {"train_loss": -6.696183204650879, "global_step": 131256, "epoch": 3125} {"train_loss": -6.572957992553711, "global_step": 131257, "epoch": 3125} {"train_loss": -6.6651458740234375, "global_step": 131258, "epoch": 3125} {"train_loss": -6.57490348815918, "global_step": 131259, "epoch": 3125} {"train_loss": -6.564356327056885, "global_step": 131260, "epoch": 3125} {"train_loss": -6.59422492980957, "global_step": 131261, "epoch": 3125} {"train_loss": -6.601207256317139, "global_step": 131262, "epoch": 3125} {"train_loss": -6.642864227294922, "global_step": 131263, "epoch": 3125} {"train_loss": -6.426413059234619, "global_step": 131264, "epoch": 3125} {"train_loss": -6.600863456726074, "global_step": 131265, "epoch": 3125} {"train_loss": -6.618191719055176, "global_step": 131266, "epoch": 3125} {"train_loss": -6.659878253936768, "global_step": 131267, "epoch": 3125} {"train_loss": -6.583456993103027, "global_step": 131268, "epoch": 3125} {"train_loss": -6.667911052703857, "global_step": 131269, "epoch": 3125} {"train_loss": -6.67806339263916, "global_step": 131270, "epoch": 3125} {"train_loss": -6.674006462097168, "global_step": 131271, "epoch": 3125} {"train_loss": -6.640646934509277, "global_step": 131272, "epoch": 3125} {"train_loss": -6.730940818786621, "global_step": 131273, "epoch": 3125} {"train_loss": -6.598325729370117, "global_step": 131274, "epoch": 3125} {"train_loss": -6.682429790496826, "global_step": 131275, "epoch": 3125} {"train_loss": -6.71976375579834, "global_step": 131276, "epoch": 3125} {"train_loss": -6.518580913543701, "global_step": 131277, "epoch": 3125} {"train_loss": -6.678813934326172, "global_step": 131278, "epoch": 3125} {"train_loss": -6.556537628173828, "global_step": 131279, "epoch": 3125} {"train_loss": -6.787586688995361, "global_step": 131280, "epoch": 3125} {"train_loss": -6.699332237243652, "global_step": 131281, "epoch": 3125} {"train_loss": -6.627439975738525, "global_step": 131282, "epoch": 3125} {"train_loss": -6.703189849853516, "global_step": 131283, "epoch": 3125} {"train_loss": -6.605772972106934, "global_step": 131284, "epoch": 3125} {"train_loss": -6.772285461425781, "global_step": 131285, "epoch": 3125} {"train_loss": -6.710784912109375, "global_step": 131286, "epoch": 3125} {"train_loss": -6.754915714263916, "global_step": 131287, "epoch": 3125} {"train_loss": -6.581357002258301, "global_step": 131288, "epoch": 3125} {"train_loss": -6.852562427520752, "global_step": 131289, "epoch": 3125} {"train_loss": -6.714369773864746, "global_step": 131290, "epoch": 3125} {"train_loss": -6.6420675459362215, "global_step": 131291, "epoch": 3125, "val_loss": 77428.75} {"train_loss": -6.671192169189453, "global_step": 131292, "epoch": 3126} {"train_loss": -6.8734893798828125, "global_step": 131293, "epoch": 3126} {"train_loss": -6.821698188781738, "global_step": 131294, "epoch": 3126} {"train_loss": -6.788763999938965, "global_step": 131295, "epoch": 3126} {"train_loss": -6.772087574005127, "global_step": 131296, "epoch": 3126} {"train_loss": -6.7130842208862305, "global_step": 131297, "epoch": 3126} {"train_loss": -6.732845306396484, "global_step": 131298, "epoch": 3126} {"train_loss": -6.669844150543213, "global_step": 131299, "epoch": 3126} {"train_loss": -6.731545448303223, "global_step": 131300, "epoch": 3126} {"train_loss": -6.72175407409668, "global_step": 131301, "epoch": 3126} {"train_loss": -6.766348838806152, "global_step": 131302, "epoch": 3126} {"train_loss": -6.742112636566162, "global_step": 131303, "epoch": 3126} {"train_loss": -6.729288578033447, "global_step": 131304, "epoch": 3126} {"train_loss": -6.775800704956055, "global_step": 131305, "epoch": 3126} {"train_loss": -6.711022853851318, "global_step": 131306, "epoch": 3126} {"train_loss": -6.807039260864258, "global_step": 131307, "epoch": 3126} {"train_loss": -6.645978927612305, "global_step": 131308, "epoch": 3126} {"train_loss": -6.696599960327148, "global_step": 131309, "epoch": 3126} {"train_loss": -6.699359893798828, "global_step": 131310, "epoch": 3126} {"train_loss": -6.596378326416016, "global_step": 131311, "epoch": 3126} {"train_loss": -6.688745975494385, "global_step": 131312, "epoch": 3126} {"train_loss": -6.623023986816406, "global_step": 131313, "epoch": 3126} {"train_loss": -6.648632049560547, "global_step": 131314, "epoch": 3126} {"train_loss": -6.679392337799072, "global_step": 131315, "epoch": 3126} {"train_loss": -6.780328750610352, "global_step": 131316, "epoch": 3126} {"train_loss": -6.69940185546875, "global_step": 131317, "epoch": 3126} {"train_loss": -6.696720123291016, "global_step": 131318, "epoch": 3126} {"train_loss": -6.755667209625244, "global_step": 131319, "epoch": 3126} {"train_loss": -6.668820381164551, "global_step": 131320, "epoch": 3126} {"train_loss": -6.612305164337158, "global_step": 131321, "epoch": 3126} {"train_loss": -6.749670505523682, "global_step": 131322, "epoch": 3126} {"train_loss": -6.6887969970703125, "global_step": 131323, "epoch": 3126} {"train_loss": -6.783880233764648, "global_step": 131324, "epoch": 3126} {"train_loss": -6.63690710067749, "global_step": 131325, "epoch": 3126} {"train_loss": -6.77004861831665, "global_step": 131326, "epoch": 3126} {"train_loss": -6.6949334144592285, "global_step": 131327, "epoch": 3126} {"train_loss": -6.741064548492432, "global_step": 131328, "epoch": 3126} {"train_loss": -6.669206619262695, "global_step": 131329, "epoch": 3126} {"train_loss": -6.708495140075684, "global_step": 131330, "epoch": 3126} {"train_loss": -6.6727495193481445, "global_step": 131331, "epoch": 3126} {"train_loss": -6.687003135681152, "global_step": 131332, "epoch": 3126} {"train_loss": -6.713276431674049, "global_step": 131333, "epoch": 3126, "val_loss": 77524.6953125} {"train_loss": -6.647792816162109, "global_step": 131334, "epoch": 3127} {"train_loss": -6.831471920013428, "global_step": 131335, "epoch": 3127} {"train_loss": -6.713195323944092, "global_step": 131336, "epoch": 3127} {"train_loss": -6.6810503005981445, "global_step": 131337, "epoch": 3127} {"train_loss": -6.739180564880371, "global_step": 131338, "epoch": 3127} {"train_loss": -6.632984161376953, "global_step": 131339, "epoch": 3127} {"train_loss": -6.746929168701172, "global_step": 131340, "epoch": 3127} {"train_loss": -6.6338582038879395, "global_step": 131341, "epoch": 3127} {"train_loss": -6.637005805969238, "global_step": 131342, "epoch": 3127} {"train_loss": -6.851743698120117, "global_step": 131343, "epoch": 3127} {"train_loss": -6.600399971008301, "global_step": 131344, "epoch": 3127} {"train_loss": -6.627016067504883, "global_step": 131345, "epoch": 3127} {"train_loss": -6.728174209594727, "global_step": 131346, "epoch": 3127} {"train_loss": -6.732853412628174, "global_step": 131347, "epoch": 3127} {"train_loss": -6.666978359222412, "global_step": 131348, "epoch": 3127} {"train_loss": -6.647854328155518, "global_step": 131349, "epoch": 3127} {"train_loss": -6.632116317749023, "global_step": 131350, "epoch": 3127} {"train_loss": -6.7585601806640625, "global_step": 131351, "epoch": 3127} {"train_loss": -6.65183162689209, "global_step": 131352, "epoch": 3127} {"train_loss": -6.6956586837768555, "global_step": 131353, "epoch": 3127} {"train_loss": -6.699843883514404, "global_step": 131354, "epoch": 3127} {"train_loss": -6.6332855224609375, "global_step": 131355, "epoch": 3127} {"train_loss": -6.647611141204834, "global_step": 131356, "epoch": 3127} {"train_loss": -6.67136287689209, "global_step": 131357, "epoch": 3127} {"train_loss": -6.7406816482543945, "global_step": 131358, "epoch": 3127} {"train_loss": -6.624677658081055, "global_step": 131359, "epoch": 3127} {"train_loss": -6.638448715209961, "global_step": 131360, "epoch": 3127} {"train_loss": -6.695149898529053, "global_step": 131361, "epoch": 3127} {"train_loss": -6.654175758361816, "global_step": 131362, "epoch": 3127} {"train_loss": -6.700910568237305, "global_step": 131363, "epoch": 3127} {"train_loss": -6.7255353927612305, "global_step": 131364, "epoch": 3127} {"train_loss": -6.661410331726074, "global_step": 131365, "epoch": 3127} {"train_loss": -6.611238479614258, "global_step": 131366, "epoch": 3127} {"train_loss": -6.660420894622803, "global_step": 131367, "epoch": 3127} {"train_loss": -6.604886054992676, "global_step": 131368, "epoch": 3127} {"train_loss": -6.6437788009643555, "global_step": 131369, "epoch": 3127} {"train_loss": -6.7363176345825195, "global_step": 131370, "epoch": 3127} {"train_loss": -6.596432209014893, "global_step": 131371, "epoch": 3127} {"train_loss": -6.728429317474365, "global_step": 131372, "epoch": 3127} {"train_loss": -6.602787971496582, "global_step": 131373, "epoch": 3127} {"train_loss": -6.693821430206299, "global_step": 131374, "epoch": 3127} {"train_loss": -6.678647870109195, "global_step": 131375, "epoch": 3127, "val_loss": 77483.5859375} {"train_loss": -6.613319396972656, "global_step": 131376, "epoch": 3128} {"train_loss": -6.658078193664551, "global_step": 131377, "epoch": 3128} {"train_loss": -6.607288360595703, "global_step": 131378, "epoch": 3128} {"train_loss": -6.708806037902832, "global_step": 131379, "epoch": 3128} {"train_loss": -6.713286876678467, "global_step": 131380, "epoch": 3128} {"train_loss": -6.56397008895874, "global_step": 131381, "epoch": 3128} {"train_loss": -6.66762638092041, "global_step": 131382, "epoch": 3128} {"train_loss": -6.69659948348999, "global_step": 131383, "epoch": 3128} {"train_loss": -6.707122802734375, "global_step": 131384, "epoch": 3128} {"train_loss": -6.658989906311035, "global_step": 131385, "epoch": 3128} {"train_loss": -6.603665351867676, "global_step": 131386, "epoch": 3128} {"train_loss": -6.622230529785156, "global_step": 131387, "epoch": 3128} {"train_loss": -6.6756720542907715, "global_step": 131388, "epoch": 3128} {"train_loss": -6.707120895385742, "global_step": 131389, "epoch": 3128} {"train_loss": -6.605752944946289, "global_step": 131390, "epoch": 3128} {"train_loss": -6.756877899169922, "global_step": 131391, "epoch": 3128} {"train_loss": -6.702532768249512, "global_step": 131392, "epoch": 3128} {"train_loss": -6.696800708770752, "global_step": 131393, "epoch": 3128} {"train_loss": -6.569406032562256, "global_step": 131394, "epoch": 3128} {"train_loss": -6.622546195983887, "global_step": 131395, "epoch": 3128} {"train_loss": -6.604848861694336, "global_step": 131396, "epoch": 3128} {"train_loss": -6.710361480712891, "global_step": 131397, "epoch": 3128} {"train_loss": -6.713644981384277, "global_step": 131398, "epoch": 3128} {"train_loss": -6.577535629272461, "global_step": 131399, "epoch": 3128} {"train_loss": -6.752793312072754, "global_step": 131400, "epoch": 3128} {"train_loss": -6.842121124267578, "global_step": 131401, "epoch": 3128} {"train_loss": -6.665896415710449, "global_step": 131402, "epoch": 3128} {"train_loss": -6.725442409515381, "global_step": 131403, "epoch": 3128} {"train_loss": -6.697727680206299, "global_step": 131404, "epoch": 3128} {"train_loss": -6.777776718139648, "global_step": 131405, "epoch": 3128} {"train_loss": -6.656185150146484, "global_step": 131406, "epoch": 3128} {"train_loss": -6.699043273925781, "global_step": 131407, "epoch": 3128} {"train_loss": -6.74465274810791, "global_step": 131408, "epoch": 3128} {"train_loss": -6.6637773513793945, "global_step": 131409, "epoch": 3128} {"train_loss": -6.785707473754883, "global_step": 131410, "epoch": 3128} {"train_loss": -6.680584907531738, "global_step": 131411, "epoch": 3128} {"train_loss": -6.640697479248047, "global_step": 131412, "epoch": 3128} {"train_loss": -6.6054792404174805, "global_step": 131413, "epoch": 3128} {"train_loss": -6.656094074249268, "global_step": 131414, "epoch": 3128} {"train_loss": -6.639939785003662, "global_step": 131415, "epoch": 3128} {"train_loss": -6.676790237426758, "global_step": 131416, "epoch": 3128} {"train_loss": -6.673027288346064, "global_step": 131417, "epoch": 3128, "val_loss": 77492.859375} {"train_loss": -6.665429592132568, "global_step": 131418, "epoch": 3129} {"train_loss": -6.797888278961182, "global_step": 131419, "epoch": 3129} {"train_loss": -6.765104293823242, "global_step": 131420, "epoch": 3129} {"train_loss": -6.630076885223389, "global_step": 131421, "epoch": 3129} {"train_loss": -6.647364616394043, "global_step": 131422, "epoch": 3129} {"train_loss": -6.680851936340332, "global_step": 131423, "epoch": 3129} {"train_loss": -6.636797904968262, "global_step": 131424, "epoch": 3129} {"train_loss": -6.696419715881348, "global_step": 131425, "epoch": 3129} {"train_loss": -6.7421135902404785, "global_step": 131426, "epoch": 3129} {"train_loss": -6.672551155090332, "global_step": 131427, "epoch": 3129} {"train_loss": -6.73309850692749, "global_step": 131428, "epoch": 3129} {"train_loss": -6.685503959655762, "global_step": 131429, "epoch": 3129} {"train_loss": -6.837860584259033, "global_step": 131430, "epoch": 3129} {"train_loss": -6.754047393798828, "global_step": 131431, "epoch": 3129} {"train_loss": -6.696030616760254, "global_step": 131432, "epoch": 3129} {"train_loss": -6.594236373901367, "global_step": 131433, "epoch": 3129} {"train_loss": -6.685291290283203, "global_step": 131434, "epoch": 3129} {"train_loss": -6.698460102081299, "global_step": 131435, "epoch": 3129} {"train_loss": -6.810835838317871, "global_step": 131436, "epoch": 3129} {"train_loss": -6.722912788391113, "global_step": 131437, "epoch": 3129} {"train_loss": -6.767529487609863, "global_step": 131438, "epoch": 3129} {"train_loss": -6.735063552856445, "global_step": 131439, "epoch": 3129} {"train_loss": -6.674715042114258, "global_step": 131440, "epoch": 3129} {"train_loss": -6.672839641571045, "global_step": 131441, "epoch": 3129} {"train_loss": -6.758562088012695, "global_step": 131442, "epoch": 3129} {"train_loss": -6.8412041664123535, "global_step": 131443, "epoch": 3129} {"train_loss": -6.601174354553223, "global_step": 131444, "epoch": 3129} {"train_loss": -6.724422454833984, "global_step": 131445, "epoch": 3129} {"train_loss": -6.717642784118652, "global_step": 131446, "epoch": 3129} {"train_loss": -6.570037841796875, "global_step": 131447, "epoch": 3129} {"train_loss": -6.76617431640625, "global_step": 131448, "epoch": 3129} {"train_loss": -6.677166938781738, "global_step": 131449, "epoch": 3129} {"train_loss": -6.701647758483887, "global_step": 131450, "epoch": 3129} {"train_loss": -6.783259391784668, "global_step": 131451, "epoch": 3129} {"train_loss": -6.748646259307861, "global_step": 131452, "epoch": 3129} {"train_loss": -6.661812782287598, "global_step": 131453, "epoch": 3129} {"train_loss": -6.6974005699157715, "global_step": 131454, "epoch": 3129} {"train_loss": -6.700980186462402, "global_step": 131455, "epoch": 3129} {"train_loss": -6.667922019958496, "global_step": 131456, "epoch": 3129} {"train_loss": -6.670989513397217, "global_step": 131457, "epoch": 3129} {"train_loss": -6.594779968261719, "global_step": 131458, "epoch": 3129} {"train_loss": -6.700403213500977, "global_step": 131459, "epoch": 3129, "val_loss": 77626.8046875} {"train_loss": -6.699366092681885, "global_step": 131460, "epoch": 3130} {"train_loss": -6.657533168792725, "global_step": 131461, "epoch": 3130} {"train_loss": -6.576491355895996, "global_step": 131462, "epoch": 3130} {"train_loss": -6.64780330657959, "global_step": 131463, "epoch": 3130} {"train_loss": -6.6492919921875, "global_step": 131464, "epoch": 3130} {"train_loss": -6.660786151885986, "global_step": 131465, "epoch": 3130} {"train_loss": -6.662893295288086, "global_step": 131466, "epoch": 3130} {"train_loss": -6.708985328674316, "global_step": 131467, "epoch": 3130} {"train_loss": -6.678201675415039, "global_step": 131468, "epoch": 3130} {"train_loss": -6.724879741668701, "global_step": 131469, "epoch": 3130} {"train_loss": -6.722847938537598, "global_step": 131470, "epoch": 3130} {"train_loss": -6.61276912689209, "global_step": 131471, "epoch": 3130} {"train_loss": -6.610002517700195, "global_step": 131472, "epoch": 3130} {"train_loss": -6.721964359283447, "global_step": 131473, "epoch": 3130} {"train_loss": -6.57492208480835, "global_step": 131474, "epoch": 3130} {"train_loss": -6.586144924163818, "global_step": 131475, "epoch": 3130} {"train_loss": -6.607640743255615, "global_step": 131476, "epoch": 3130} {"train_loss": -6.699081897735596, "global_step": 131477, "epoch": 3130} {"train_loss": -6.656071662902832, "global_step": 131478, "epoch": 3130} {"train_loss": -6.517705917358398, "global_step": 131479, "epoch": 3130} {"train_loss": -6.740712642669678, "global_step": 131480, "epoch": 3130} {"train_loss": -6.522806167602539, "global_step": 131481, "epoch": 3130} {"train_loss": -6.567821025848389, "global_step": 131482, "epoch": 3130} {"train_loss": -6.574986457824707, "global_step": 131483, "epoch": 3130} {"train_loss": -6.678055763244629, "global_step": 131484, "epoch": 3130} {"train_loss": -6.6678314208984375, "global_step": 131485, "epoch": 3130} {"train_loss": -6.705035209655762, "global_step": 131486, "epoch": 3130} {"train_loss": -6.648689270019531, "global_step": 131487, "epoch": 3130} {"train_loss": -6.752294063568115, "global_step": 131488, "epoch": 3130} {"train_loss": -6.713618278503418, "global_step": 131489, "epoch": 3130} {"train_loss": -6.659572124481201, "global_step": 131490, "epoch": 3130} {"train_loss": -6.714419364929199, "global_step": 131491, "epoch": 3130} {"train_loss": -6.670496463775635, "global_step": 131492, "epoch": 3130} {"train_loss": -6.661896228790283, "global_step": 131493, "epoch": 3130} {"train_loss": -6.706560134887695, "global_step": 131494, "epoch": 3130} {"train_loss": -6.619819641113281, "global_step": 131495, "epoch": 3130} {"train_loss": -6.653292655944824, "global_step": 131496, "epoch": 3130} {"train_loss": -6.763775825500488, "global_step": 131497, "epoch": 3130} {"train_loss": -6.781946182250977, "global_step": 131498, "epoch": 3130} {"train_loss": -6.8149871826171875, "global_step": 131499, "epoch": 3130} {"train_loss": -6.685391426086426, "global_step": 131500, "epoch": 3130} {"train_loss": -6.670100847880046, "global_step": 131501, "epoch": 3130, "val_loss": 77442.921875} {"train_loss": -6.731127738952637, "global_step": 131502, "epoch": 3131} {"train_loss": -6.708281517028809, "global_step": 131503, "epoch": 3131} {"train_loss": -6.715743541717529, "global_step": 131504, "epoch": 3131} {"train_loss": -6.637031555175781, "global_step": 131505, "epoch": 3131} {"train_loss": -6.618945121765137, "global_step": 131506, "epoch": 3131} {"train_loss": -6.639202117919922, "global_step": 131507, "epoch": 3131} {"train_loss": -6.796204566955566, "global_step": 131508, "epoch": 3131} {"train_loss": -6.699670314788818, "global_step": 131509, "epoch": 3131} {"train_loss": -6.6557512283325195, "global_step": 131510, "epoch": 3131} {"train_loss": -6.623039722442627, "global_step": 131511, "epoch": 3131} {"train_loss": -6.858521938323975, "global_step": 131512, "epoch": 3131} {"train_loss": -6.473193168640137, "global_step": 131513, "epoch": 3131} {"train_loss": -6.579380512237549, "global_step": 131514, "epoch": 3131} {"train_loss": -6.585598945617676, "global_step": 131515, "epoch": 3131} {"train_loss": -6.480233192443848, "global_step": 131516, "epoch": 3131} {"train_loss": -6.648931503295898, "global_step": 131517, "epoch": 3131} {"train_loss": -6.631697654724121, "global_step": 131518, "epoch": 3131} {"train_loss": -6.641714096069336, "global_step": 131519, "epoch": 3131} {"train_loss": -6.6686811447143555, "global_step": 131520, "epoch": 3131} {"train_loss": -6.533041477203369, "global_step": 131521, "epoch": 3131} {"train_loss": -6.723334789276123, "global_step": 131522, "epoch": 3131} {"train_loss": -6.572115421295166, "global_step": 131523, "epoch": 3131} {"train_loss": -6.4797844886779785, "global_step": 131524, "epoch": 3131} {"train_loss": -6.6610870361328125, "global_step": 131525, "epoch": 3131} {"train_loss": -6.639652252197266, "global_step": 131526, "epoch": 3131} {"train_loss": -6.586392879486084, "global_step": 131527, "epoch": 3131} {"train_loss": -6.599665641784668, "global_step": 131528, "epoch": 3131} {"train_loss": -6.612234115600586, "global_step": 131529, "epoch": 3131} {"train_loss": -6.723206520080566, "global_step": 131530, "epoch": 3131} {"train_loss": -6.6502838134765625, "global_step": 131531, "epoch": 3131} {"train_loss": -6.767143249511719, "global_step": 131532, "epoch": 3131} {"train_loss": -6.75115966796875, "global_step": 131533, "epoch": 3131} {"train_loss": -6.70158576965332, "global_step": 131534, "epoch": 3131} {"train_loss": -6.674129962921143, "global_step": 131535, "epoch": 3131} {"train_loss": -6.765976905822754, "global_step": 131536, "epoch": 3131} {"train_loss": -6.624886512756348, "global_step": 131537, "epoch": 3131} {"train_loss": -6.695708751678467, "global_step": 131538, "epoch": 3131} {"train_loss": -6.714284896850586, "global_step": 131539, "epoch": 3131} {"train_loss": -6.709749698638916, "global_step": 131540, "epoch": 3131} {"train_loss": -6.704057693481445, "global_step": 131541, "epoch": 3131} {"train_loss": -6.781115531921387, "global_step": 131542, "epoch": 3131} {"train_loss": -6.661568039939517, "global_step": 131543, "epoch": 3131, "val_loss": 77699.0} {"train_loss": -6.780270576477051, "global_step": 131544, "epoch": 3132} {"train_loss": -6.760299205780029, "global_step": 131545, "epoch": 3132} {"train_loss": -6.644322395324707, "global_step": 131546, "epoch": 3132} {"train_loss": -6.5806193351745605, "global_step": 131547, "epoch": 3132} {"train_loss": -6.73276424407959, "global_step": 131548, "epoch": 3132} {"train_loss": -6.549448013305664, "global_step": 131549, "epoch": 3132} {"train_loss": -6.672320365905762, "global_step": 131550, "epoch": 3132} {"train_loss": -6.728570938110352, "global_step": 131551, "epoch": 3132} {"train_loss": -6.74494743347168, "global_step": 131552, "epoch": 3132} {"train_loss": -6.678520679473877, "global_step": 131553, "epoch": 3132} {"train_loss": -6.739278793334961, "global_step": 131554, "epoch": 3132} {"train_loss": -6.618957996368408, "global_step": 131555, "epoch": 3132} {"train_loss": -6.626777648925781, "global_step": 131556, "epoch": 3132} {"train_loss": -6.725545883178711, "global_step": 131557, "epoch": 3132} {"train_loss": -6.685053825378418, "global_step": 131558, "epoch": 3132} {"train_loss": -6.60951042175293, "global_step": 131559, "epoch": 3132} {"train_loss": -6.63738489151001, "global_step": 131560, "epoch": 3132} {"train_loss": -6.65153694152832, "global_step": 131561, "epoch": 3132} {"train_loss": -6.775354385375977, "global_step": 131562, "epoch": 3132} {"train_loss": -6.689608573913574, "global_step": 131563, "epoch": 3132} {"train_loss": -6.668819427490234, "global_step": 131564, "epoch": 3132} {"train_loss": -6.713275909423828, "global_step": 131565, "epoch": 3132} {"train_loss": -6.703594207763672, "global_step": 131566, "epoch": 3132} {"train_loss": -6.757369518280029, "global_step": 131567, "epoch": 3132} {"train_loss": -6.683144569396973, "global_step": 131568, "epoch": 3132} {"train_loss": -6.6623921394348145, "global_step": 131569, "epoch": 3132} {"train_loss": -6.734475135803223, "global_step": 131570, "epoch": 3132} {"train_loss": -6.6833367347717285, "global_step": 131571, "epoch": 3132} {"train_loss": -6.679971694946289, "global_step": 131572, "epoch": 3132} {"train_loss": -6.727258682250977, "global_step": 131573, "epoch": 3132} {"train_loss": -6.663582801818848, "global_step": 131574, "epoch": 3132} {"train_loss": -6.6561455726623535, "global_step": 131575, "epoch": 3132} {"train_loss": -6.670867919921875, "global_step": 131576, "epoch": 3132} {"train_loss": -6.680078506469727, "global_step": 131577, "epoch": 3132} {"train_loss": -6.70928955078125, "global_step": 131578, "epoch": 3132} {"train_loss": -6.7667236328125, "global_step": 131579, "epoch": 3132} {"train_loss": -6.634180068969727, "global_step": 131580, "epoch": 3132} {"train_loss": -6.744239807128906, "global_step": 131581, "epoch": 3132} {"train_loss": -6.743271827697754, "global_step": 131582, "epoch": 3132} {"train_loss": -6.63698673248291, "global_step": 131583, "epoch": 3132} {"train_loss": -6.68034029006958, "global_step": 131584, "epoch": 3132} {"train_loss": -6.690999405724662, "global_step": 131585, "epoch": 3132, "val_loss": 77507.640625} {"train_loss": -6.695544242858887, "global_step": 131586, "epoch": 3133} {"train_loss": -6.772481918334961, "global_step": 131587, "epoch": 3133} {"train_loss": -6.810369491577148, "global_step": 131588, "epoch": 3133} {"train_loss": -6.688193321228027, "global_step": 131589, "epoch": 3133} {"train_loss": -6.757235527038574, "global_step": 131590, "epoch": 3133} {"train_loss": -6.712307929992676, "global_step": 131591, "epoch": 3133} {"train_loss": -6.701961040496826, "global_step": 131592, "epoch": 3133} {"train_loss": -6.673318386077881, "global_step": 131593, "epoch": 3133} {"train_loss": -6.756601810455322, "global_step": 131594, "epoch": 3133} {"train_loss": -6.651516914367676, "global_step": 131595, "epoch": 3133} {"train_loss": -6.727768898010254, "global_step": 131596, "epoch": 3133} {"train_loss": -6.737525463104248, "global_step": 131597, "epoch": 3133} {"train_loss": -6.633002758026123, "global_step": 131598, "epoch": 3133} {"train_loss": -6.6708598136901855, "global_step": 131599, "epoch": 3133} {"train_loss": -6.756091594696045, "global_step": 131600, "epoch": 3133} {"train_loss": -6.607680797576904, "global_step": 131601, "epoch": 3133} {"train_loss": -6.629962921142578, "global_step": 131602, "epoch": 3133} {"train_loss": -6.575579643249512, "global_step": 131603, "epoch": 3133} {"train_loss": -6.634088516235352, "global_step": 131604, "epoch": 3133} {"train_loss": -6.587814807891846, "global_step": 131605, "epoch": 3133} {"train_loss": -6.663967132568359, "global_step": 131606, "epoch": 3133} {"train_loss": -6.509406089782715, "global_step": 131607, "epoch": 3133} {"train_loss": -6.669716835021973, "global_step": 131608, "epoch": 3133} {"train_loss": -6.706507682800293, "global_step": 131609, "epoch": 3133} {"train_loss": -6.564517021179199, "global_step": 131610, "epoch": 3133} {"train_loss": -6.592273235321045, "global_step": 131611, "epoch": 3133} {"train_loss": -6.6354289054870605, "global_step": 131612, "epoch": 3133} {"train_loss": -6.601714134216309, "global_step": 131613, "epoch": 3133} {"train_loss": -6.734796524047852, "global_step": 131614, "epoch": 3133} {"train_loss": -6.628628730773926, "global_step": 131615, "epoch": 3133} {"train_loss": -6.65912389755249, "global_step": 131616, "epoch": 3133} {"train_loss": -6.665428638458252, "global_step": 131617, "epoch": 3133} {"train_loss": -6.713407039642334, "global_step": 131618, "epoch": 3133} {"train_loss": -6.648975372314453, "global_step": 131619, "epoch": 3133} {"train_loss": -6.590429306030273, "global_step": 131620, "epoch": 3133} {"train_loss": -6.6644697189331055, "global_step": 131621, "epoch": 3133} {"train_loss": -6.685204029083252, "global_step": 131622, "epoch": 3133} {"train_loss": -6.720818519592285, "global_step": 131623, "epoch": 3133} {"train_loss": -6.652063846588135, "global_step": 131624, "epoch": 3133} {"train_loss": -6.595987796783447, "global_step": 131625, "epoch": 3133} {"train_loss": -6.668231964111328, "global_step": 131626, "epoch": 3133} {"train_loss": -6.670333919071016, "global_step": 131627, "epoch": 3133, "val_loss": 77500.7109375} {"train_loss": -6.709549903869629, "global_step": 131628, "epoch": 3134} {"train_loss": -6.724664688110352, "global_step": 131629, "epoch": 3134} {"train_loss": -6.678645610809326, "global_step": 131630, "epoch": 3134} {"train_loss": -6.639677047729492, "global_step": 131631, "epoch": 3134} {"train_loss": -6.717232704162598, "global_step": 131632, "epoch": 3134} {"train_loss": -6.7556233406066895, "global_step": 131633, "epoch": 3134} {"train_loss": -6.651703834533691, "global_step": 131634, "epoch": 3134} {"train_loss": -6.705723762512207, "global_step": 131635, "epoch": 3134} {"train_loss": -6.689676761627197, "global_step": 131636, "epoch": 3134} {"train_loss": -6.749612808227539, "global_step": 131637, "epoch": 3134} {"train_loss": -6.658689022064209, "global_step": 131638, "epoch": 3134} {"train_loss": -6.59620475769043, "global_step": 131639, "epoch": 3134} {"train_loss": -6.545197010040283, "global_step": 131640, "epoch": 3134} {"train_loss": -6.754752159118652, "global_step": 131641, "epoch": 3134} {"train_loss": -6.5267415046691895, "global_step": 131642, "epoch": 3134} {"train_loss": -6.7116851806640625, "global_step": 131643, "epoch": 3134} {"train_loss": -6.6555914878845215, "global_step": 131644, "epoch": 3134} {"train_loss": -6.619982719421387, "global_step": 131645, "epoch": 3134} {"train_loss": -6.758542537689209, "global_step": 131646, "epoch": 3134} {"train_loss": -6.766360282897949, "global_step": 131647, "epoch": 3134} {"train_loss": -6.623863220214844, "global_step": 131648, "epoch": 3134} {"train_loss": -6.649409294128418, "global_step": 131649, "epoch": 3134} {"train_loss": -6.787008285522461, "global_step": 131650, "epoch": 3134} {"train_loss": -6.624481678009033, "global_step": 131651, "epoch": 3134} {"train_loss": -6.750185012817383, "global_step": 131652, "epoch": 3134} {"train_loss": -6.530605792999268, "global_step": 131653, "epoch": 3134} {"train_loss": -6.622499465942383, "global_step": 131654, "epoch": 3134} {"train_loss": -6.628132343292236, "global_step": 131655, "epoch": 3134} {"train_loss": -6.635064601898193, "global_step": 131656, "epoch": 3134} {"train_loss": -6.70197868347168, "global_step": 131657, "epoch": 3134} {"train_loss": -6.715163230895996, "global_step": 131658, "epoch": 3134} {"train_loss": -6.619863510131836, "global_step": 131659, "epoch": 3134} {"train_loss": -6.780055999755859, "global_step": 131660, "epoch": 3134} {"train_loss": -6.541796684265137, "global_step": 131661, "epoch": 3134} {"train_loss": -6.744449138641357, "global_step": 131662, "epoch": 3134} {"train_loss": -6.579881191253662, "global_step": 131663, "epoch": 3134} {"train_loss": -6.653855323791504, "global_step": 131664, "epoch": 3134} {"train_loss": -6.71452522277832, "global_step": 131665, "epoch": 3134} {"train_loss": -6.632814407348633, "global_step": 131666, "epoch": 3134} {"train_loss": -6.645910739898682, "global_step": 131667, "epoch": 3134} {"train_loss": -6.7117743492126465, "global_step": 131668, "epoch": 3134} {"train_loss": -6.672552562895275, "global_step": 131669, "epoch": 3134, "val_loss": 77403.984375} {"train_loss": -6.63884162902832, "global_step": 131670, "epoch": 3135} {"train_loss": -6.655401229858398, "global_step": 131671, "epoch": 3135} {"train_loss": -6.71717643737793, "global_step": 131672, "epoch": 3135} {"train_loss": -6.617831707000732, "global_step": 131673, "epoch": 3135} {"train_loss": -6.691407203674316, "global_step": 131674, "epoch": 3135} {"train_loss": -6.666564464569092, "global_step": 131675, "epoch": 3135} {"train_loss": -6.717597484588623, "global_step": 131676, "epoch": 3135} {"train_loss": -6.696826934814453, "global_step": 131677, "epoch": 3135} {"train_loss": -6.677013397216797, "global_step": 131678, "epoch": 3135} {"train_loss": -6.686631202697754, "global_step": 131679, "epoch": 3135} {"train_loss": -6.607622146606445, "global_step": 131680, "epoch": 3135} {"train_loss": -6.571040153503418, "global_step": 131681, "epoch": 3135} {"train_loss": -6.664333343505859, "global_step": 131682, "epoch": 3135} {"train_loss": -6.616457462310791, "global_step": 131683, "epoch": 3135} {"train_loss": -6.672407150268555, "global_step": 131684, "epoch": 3135} {"train_loss": -6.720516204833984, "global_step": 131685, "epoch": 3135} {"train_loss": -6.743465423583984, "global_step": 131686, "epoch": 3135} {"train_loss": -6.823690414428711, "global_step": 131687, "epoch": 3135} {"train_loss": -6.666922569274902, "global_step": 131688, "epoch": 3135} {"train_loss": -6.759445667266846, "global_step": 131689, "epoch": 3135} {"train_loss": -6.779457092285156, "global_step": 131690, "epoch": 3135} {"train_loss": -6.7495951652526855, "global_step": 131691, "epoch": 3135} {"train_loss": -6.589323997497559, "global_step": 131692, "epoch": 3135} {"train_loss": -6.616423606872559, "global_step": 131693, "epoch": 3135} {"train_loss": -6.588444709777832, "global_step": 131694, "epoch": 3135} {"train_loss": -6.712571620941162, "global_step": 131695, "epoch": 3135} {"train_loss": -6.714068412780762, "global_step": 131696, "epoch": 3135} {"train_loss": -6.622674942016602, "global_step": 131697, "epoch": 3135} {"train_loss": -6.7065019607543945, "global_step": 131698, "epoch": 3135} {"train_loss": -6.665187358856201, "global_step": 131699, "epoch": 3135} {"train_loss": -6.774914741516113, "global_step": 131700, "epoch": 3135} {"train_loss": -6.613317012786865, "global_step": 131701, "epoch": 3135} {"train_loss": -6.670427322387695, "global_step": 131702, "epoch": 3135} {"train_loss": -6.827151775360107, "global_step": 131703, "epoch": 3135} {"train_loss": -6.7245073318481445, "global_step": 131704, "epoch": 3135} {"train_loss": -6.704607009887695, "global_step": 131705, "epoch": 3135} {"train_loss": -6.644713401794434, "global_step": 131706, "epoch": 3135} {"train_loss": -6.587913990020752, "global_step": 131707, "epoch": 3135} {"train_loss": -6.764675140380859, "global_step": 131708, "epoch": 3135} {"train_loss": -6.715456962585449, "global_step": 131709, "epoch": 3135} {"train_loss": -6.65637731552124, "global_step": 131710, "epoch": 3135} {"train_loss": -6.682904618127005, "global_step": 131711, "epoch": 3135, "val_loss": 77766.921875} {"train_loss": -6.71168327331543, "global_step": 131712, "epoch": 3136} {"train_loss": -6.800940990447998, "global_step": 131713, "epoch": 3136} {"train_loss": -6.710478782653809, "global_step": 131714, "epoch": 3136} {"train_loss": -6.666101932525635, "global_step": 131715, "epoch": 3136} {"train_loss": -6.686435699462891, "global_step": 131716, "epoch": 3136} {"train_loss": -6.692970275878906, "global_step": 131717, "epoch": 3136} {"train_loss": -6.753856658935547, "global_step": 131718, "epoch": 3136} {"train_loss": -6.739336013793945, "global_step": 131719, "epoch": 3136} {"train_loss": -6.7422003746032715, "global_step": 131720, "epoch": 3136} {"train_loss": -6.740536689758301, "global_step": 131721, "epoch": 3136} {"train_loss": -6.764532089233398, "global_step": 131722, "epoch": 3136} {"train_loss": -6.719038009643555, "global_step": 131723, "epoch": 3136} {"train_loss": -6.738862037658691, "global_step": 131724, "epoch": 3136} {"train_loss": -6.743715763092041, "global_step": 131725, "epoch": 3136} {"train_loss": -6.737464904785156, "global_step": 131726, "epoch": 3136} {"train_loss": -6.608573913574219, "global_step": 131727, "epoch": 3136} {"train_loss": -6.753819942474365, "global_step": 131728, "epoch": 3136} {"train_loss": -6.751083850860596, "global_step": 131729, "epoch": 3136} {"train_loss": -6.675932884216309, "global_step": 131730, "epoch": 3136} {"train_loss": -6.656177520751953, "global_step": 131731, "epoch": 3136} {"train_loss": -6.672987937927246, "global_step": 131732, "epoch": 3136} {"train_loss": -6.656746864318848, "global_step": 131733, "epoch": 3136} {"train_loss": -6.674954414367676, "global_step": 131734, "epoch": 3136} {"train_loss": -6.676661014556885, "global_step": 131735, "epoch": 3136} {"train_loss": -6.635250568389893, "global_step": 131736, "epoch": 3136} {"train_loss": -6.709493637084961, "global_step": 131737, "epoch": 3136} {"train_loss": -6.658756256103516, "global_step": 131738, "epoch": 3136} {"train_loss": -6.649024963378906, "global_step": 131739, "epoch": 3136} {"train_loss": -6.608198165893555, "global_step": 131740, "epoch": 3136} {"train_loss": -6.628629684448242, "global_step": 131741, "epoch": 3136} {"train_loss": -6.541929721832275, "global_step": 131742, "epoch": 3136} {"train_loss": -6.664012908935547, "global_step": 131743, "epoch": 3136} {"train_loss": -6.6440253257751465, "global_step": 131744, "epoch": 3136} {"train_loss": -6.5847859382629395, "global_step": 131745, "epoch": 3136} {"train_loss": -6.647347927093506, "global_step": 131746, "epoch": 3136} {"train_loss": -6.577755928039551, "global_step": 131747, "epoch": 3136} {"train_loss": -6.710453987121582, "global_step": 131748, "epoch": 3136} {"train_loss": -6.623907089233398, "global_step": 131749, "epoch": 3136} {"train_loss": -6.6537981033325195, "global_step": 131750, "epoch": 3136} {"train_loss": -6.710457801818848, "global_step": 131751, "epoch": 3136} {"train_loss": -6.726378917694092, "global_step": 131752, "epoch": 3136} {"train_loss": -6.685034854071481, "global_step": 131753, "epoch": 3136, "val_loss": 77485.296875} {"train_loss": -6.697957992553711, "global_step": 131754, "epoch": 3137} {"train_loss": -6.776257514953613, "global_step": 131755, "epoch": 3137} {"train_loss": -6.7443528175354, "global_step": 131756, "epoch": 3137} {"train_loss": -6.716888427734375, "global_step": 131757, "epoch": 3137} {"train_loss": -6.8313798904418945, "global_step": 131758, "epoch": 3137} {"train_loss": -6.665126323699951, "global_step": 131759, "epoch": 3137} {"train_loss": -6.572757244110107, "global_step": 131760, "epoch": 3137} {"train_loss": -6.734896659851074, "global_step": 131761, "epoch": 3137} {"train_loss": -6.6259846687316895, "global_step": 131762, "epoch": 3137} {"train_loss": -6.665484428405762, "global_step": 131763, "epoch": 3137} {"train_loss": -6.765723705291748, "global_step": 131764, "epoch": 3137} {"train_loss": -6.487614631652832, "global_step": 131765, "epoch": 3137} {"train_loss": -6.694620132446289, "global_step": 131766, "epoch": 3137} {"train_loss": -6.7467875480651855, "global_step": 131767, "epoch": 3137} {"train_loss": -6.55363655090332, "global_step": 131768, "epoch": 3137} {"train_loss": -6.732237815856934, "global_step": 131769, "epoch": 3137} {"train_loss": -6.674832344055176, "global_step": 131770, "epoch": 3137} {"train_loss": -6.514662742614746, "global_step": 131771, "epoch": 3137} {"train_loss": -6.709591865539551, "global_step": 131772, "epoch": 3137} {"train_loss": -6.634463310241699, "global_step": 131773, "epoch": 3137} {"train_loss": -6.720354080200195, "global_step": 131774, "epoch": 3137} {"train_loss": -6.62441873550415, "global_step": 131775, "epoch": 3137} {"train_loss": -6.497849941253662, "global_step": 131776, "epoch": 3137} {"train_loss": -6.606996059417725, "global_step": 131777, "epoch": 3137} {"train_loss": -6.825547695159912, "global_step": 131778, "epoch": 3137} {"train_loss": -6.457233905792236, "global_step": 131779, "epoch": 3137} {"train_loss": -6.7083587646484375, "global_step": 131780, "epoch": 3137} {"train_loss": -6.688853740692139, "global_step": 131781, "epoch": 3137} {"train_loss": -6.530211448669434, "global_step": 131782, "epoch": 3137} {"train_loss": -6.638328552246094, "global_step": 131783, "epoch": 3137} {"train_loss": -6.668054580688477, "global_step": 131784, "epoch": 3137} {"train_loss": -6.694458961486816, "global_step": 131785, "epoch": 3137} {"train_loss": -6.594415664672852, "global_step": 131786, "epoch": 3137} {"train_loss": -6.641138553619385, "global_step": 131787, "epoch": 3137} {"train_loss": -6.584225177764893, "global_step": 131788, "epoch": 3137} {"train_loss": -6.628634452819824, "global_step": 131789, "epoch": 3137} {"train_loss": -6.763789176940918, "global_step": 131790, "epoch": 3137} {"train_loss": -6.542901992797852, "global_step": 131791, "epoch": 3137} {"train_loss": -6.675113677978516, "global_step": 131792, "epoch": 3137} {"train_loss": -6.568453788757324, "global_step": 131793, "epoch": 3137} {"train_loss": -6.7816338539123535, "global_step": 131794, "epoch": 3137} {"train_loss": -6.657753490266346, "global_step": 131795, "epoch": 3137, "val_loss": 77550.359375} {"train_loss": -6.571647644042969, "global_step": 131796, "epoch": 3138} {"train_loss": -6.561332702636719, "global_step": 131797, "epoch": 3138} {"train_loss": -6.717374801635742, "global_step": 131798, "epoch": 3138} {"train_loss": -6.661665916442871, "global_step": 131799, "epoch": 3138} {"train_loss": -6.666671276092529, "global_step": 131800, "epoch": 3138} {"train_loss": -6.6898088455200195, "global_step": 131801, "epoch": 3138} {"train_loss": -6.6281938552856445, "global_step": 131802, "epoch": 3138} {"train_loss": -6.61284065246582, "global_step": 131803, "epoch": 3138} {"train_loss": -6.837465286254883, "global_step": 131804, "epoch": 3138} {"train_loss": -6.815484046936035, "global_step": 131805, "epoch": 3138} {"train_loss": -6.7044291496276855, "global_step": 131806, "epoch": 3138} {"train_loss": -6.614326477050781, "global_step": 131807, "epoch": 3138} {"train_loss": -6.653979301452637, "global_step": 131808, "epoch": 3138} {"train_loss": -6.854387283325195, "global_step": 131809, "epoch": 3138} {"train_loss": -6.678361415863037, "global_step": 131810, "epoch": 3138} {"train_loss": -6.748189926147461, "global_step": 131811, "epoch": 3138} {"train_loss": -6.783572196960449, "global_step": 131812, "epoch": 3138} {"train_loss": -6.651752471923828, "global_step": 131813, "epoch": 3138} {"train_loss": -6.654780387878418, "global_step": 131814, "epoch": 3138} {"train_loss": -6.848374843597412, "global_step": 131815, "epoch": 3138} {"train_loss": -6.659651279449463, "global_step": 131816, "epoch": 3138} {"train_loss": -6.583175182342529, "global_step": 131817, "epoch": 3138} {"train_loss": -6.657510280609131, "global_step": 131818, "epoch": 3138} {"train_loss": -6.592801094055176, "global_step": 131819, "epoch": 3138} {"train_loss": -6.713770866394043, "global_step": 131820, "epoch": 3138} {"train_loss": -6.685655117034912, "global_step": 131821, "epoch": 3138} {"train_loss": -6.728557586669922, "global_step": 131822, "epoch": 3138} {"train_loss": -6.642045497894287, "global_step": 131823, "epoch": 3138} {"train_loss": -6.755382537841797, "global_step": 131824, "epoch": 3138} {"train_loss": -6.833322525024414, "global_step": 131825, "epoch": 3138} {"train_loss": -6.7480878829956055, "global_step": 131826, "epoch": 3138} {"train_loss": -6.648322105407715, "global_step": 131827, "epoch": 3138} {"train_loss": -6.642676830291748, "global_step": 131828, "epoch": 3138} {"train_loss": -6.693623065948486, "global_step": 131829, "epoch": 3138} {"train_loss": -6.624039649963379, "global_step": 131830, "epoch": 3138} {"train_loss": -6.761300086975098, "global_step": 131831, "epoch": 3138} {"train_loss": -6.690732955932617, "global_step": 131832, "epoch": 3138} {"train_loss": -6.656569480895996, "global_step": 131833, "epoch": 3138} {"train_loss": -6.662012100219727, "global_step": 131834, "epoch": 3138} {"train_loss": -6.617094993591309, "global_step": 131835, "epoch": 3138} {"train_loss": -6.745197296142578, "global_step": 131836, "epoch": 3138} {"train_loss": -6.68979161126273, "global_step": 131837, "epoch": 3138, "val_loss": 77620.0625} {"train_loss": -6.7071332931518555, "global_step": 131838, "epoch": 3139} {"train_loss": -6.663197994232178, "global_step": 131839, "epoch": 3139} {"train_loss": -6.666802406311035, "global_step": 131840, "epoch": 3139} {"train_loss": -6.631256103515625, "global_step": 131841, "epoch": 3139} {"train_loss": -6.7029805183410645, "global_step": 131842, "epoch": 3139} {"train_loss": -6.684497833251953, "global_step": 131843, "epoch": 3139} {"train_loss": -6.579483985900879, "global_step": 131844, "epoch": 3139} {"train_loss": -6.804386615753174, "global_step": 131845, "epoch": 3139} {"train_loss": -6.656997203826904, "global_step": 131846, "epoch": 3139} {"train_loss": -6.570341110229492, "global_step": 131847, "epoch": 3139} {"train_loss": -6.595827579498291, "global_step": 131848, "epoch": 3139} {"train_loss": -6.586673736572266, "global_step": 131849, "epoch": 3139} {"train_loss": -6.643179893493652, "global_step": 131850, "epoch": 3139} {"train_loss": -6.637368679046631, "global_step": 131851, "epoch": 3139} {"train_loss": -6.753452777862549, "global_step": 131852, "epoch": 3139} {"train_loss": -6.533867835998535, "global_step": 131853, "epoch": 3139} {"train_loss": -6.673340797424316, "global_step": 131854, "epoch": 3139} {"train_loss": -6.633561611175537, "global_step": 131855, "epoch": 3139} {"train_loss": -6.663904190063477, "global_step": 131856, "epoch": 3139} {"train_loss": -6.676631450653076, "global_step": 131857, "epoch": 3139} {"train_loss": -6.632946491241455, "global_step": 131858, "epoch": 3139} {"train_loss": -6.678300380706787, "global_step": 131859, "epoch": 3139} {"train_loss": -6.741397857666016, "global_step": 131860, "epoch": 3139} {"train_loss": -6.646608352661133, "global_step": 131861, "epoch": 3139} {"train_loss": -6.689641952514648, "global_step": 131862, "epoch": 3139} {"train_loss": -6.594738006591797, "global_step": 131863, "epoch": 3139} {"train_loss": -6.685417175292969, "global_step": 131864, "epoch": 3139} {"train_loss": -6.572432041168213, "global_step": 131865, "epoch": 3139} {"train_loss": -6.597041130065918, "global_step": 131866, "epoch": 3139} {"train_loss": -6.653367042541504, "global_step": 131867, "epoch": 3139} {"train_loss": -6.591730117797852, "global_step": 131868, "epoch": 3139} {"train_loss": -6.770691871643066, "global_step": 131869, "epoch": 3139} {"train_loss": -6.609694004058838, "global_step": 131870, "epoch": 3139} {"train_loss": -6.595685005187988, "global_step": 131871, "epoch": 3139} {"train_loss": -6.5112152099609375, "global_step": 131872, "epoch": 3139} {"train_loss": -6.570962905883789, "global_step": 131873, "epoch": 3139} {"train_loss": -6.571740627288818, "global_step": 131874, "epoch": 3139} {"train_loss": -6.542326927185059, "global_step": 131875, "epoch": 3139} {"train_loss": -6.61810302734375, "global_step": 131876, "epoch": 3139} {"train_loss": -6.679591655731201, "global_step": 131877, "epoch": 3139} {"train_loss": -6.50203275680542, "global_step": 131878, "epoch": 3139} {"train_loss": -6.639184531711397, "global_step": 131879, "epoch": 3139, "val_loss": 77438.21875} {"train_loss": -6.631758689880371, "global_step": 131880, "epoch": 3140} {"train_loss": -6.669744491577148, "global_step": 131881, "epoch": 3140} {"train_loss": -6.609291076660156, "global_step": 131882, "epoch": 3140} {"train_loss": -6.589703559875488, "global_step": 131883, "epoch": 3140} {"train_loss": -6.694392681121826, "global_step": 131884, "epoch": 3140} {"train_loss": -6.602073669433594, "global_step": 131885, "epoch": 3140} {"train_loss": -6.602424621582031, "global_step": 131886, "epoch": 3140} {"train_loss": -6.6154608726501465, "global_step": 131887, "epoch": 3140} {"train_loss": -6.731423377990723, "global_step": 131888, "epoch": 3140} {"train_loss": -6.555897235870361, "global_step": 131889, "epoch": 3140} {"train_loss": -6.669879913330078, "global_step": 131890, "epoch": 3140} {"train_loss": -6.605343818664551, "global_step": 131891, "epoch": 3140} {"train_loss": -6.6650471687316895, "global_step": 131892, "epoch": 3140} {"train_loss": -6.542998313903809, "global_step": 131893, "epoch": 3140} {"train_loss": -6.603165149688721, "global_step": 131894, "epoch": 3140} {"train_loss": -6.624684810638428, "global_step": 131895, "epoch": 3140} {"train_loss": -6.698948860168457, "global_step": 131896, "epoch": 3140} {"train_loss": -6.730379104614258, "global_step": 131897, "epoch": 3140} {"train_loss": -6.737209796905518, "global_step": 131898, "epoch": 3140} {"train_loss": -6.727759838104248, "global_step": 131899, "epoch": 3140} {"train_loss": -6.572732448577881, "global_step": 131900, "epoch": 3140} {"train_loss": -6.838478088378906, "global_step": 131901, "epoch": 3140} {"train_loss": -6.6320600509643555, "global_step": 131902, "epoch": 3140} {"train_loss": -6.716933727264404, "global_step": 131903, "epoch": 3140} {"train_loss": -6.675299644470215, "global_step": 131904, "epoch": 3140} {"train_loss": -6.67818546295166, "global_step": 131905, "epoch": 3140} {"train_loss": -6.631046295166016, "global_step": 131906, "epoch": 3140} {"train_loss": -6.756172180175781, "global_step": 131907, "epoch": 3140} {"train_loss": -6.721859931945801, "global_step": 131908, "epoch": 3140} {"train_loss": -6.6855974197387695, "global_step": 131909, "epoch": 3140} {"train_loss": -6.799689292907715, "global_step": 131910, "epoch": 3140} {"train_loss": -6.719966411590576, "global_step": 131911, "epoch": 3140} {"train_loss": -6.715742588043213, "global_step": 131912, "epoch": 3140} {"train_loss": -6.580545425415039, "global_step": 131913, "epoch": 3140} {"train_loss": -6.70961332321167, "global_step": 131914, "epoch": 3140} {"train_loss": -6.817791938781738, "global_step": 131915, "epoch": 3140} {"train_loss": -6.714071273803711, "global_step": 131916, "epoch": 3140} {"train_loss": -6.673074722290039, "global_step": 131917, "epoch": 3140} {"train_loss": -6.611083030700684, "global_step": 131918, "epoch": 3140} {"train_loss": -6.666101455688477, "global_step": 131919, "epoch": 3140} {"train_loss": -6.702174186706543, "global_step": 131920, "epoch": 3140} {"train_loss": -6.670343421754383, "global_step": 131921, "epoch": 3140, "val_loss": 77511.265625} {"train_loss": -6.779121398925781, "global_step": 131922, "epoch": 3141} {"train_loss": -6.649751663208008, "global_step": 131923, "epoch": 3141} {"train_loss": -6.67811918258667, "global_step": 131924, "epoch": 3141} {"train_loss": -6.802307605743408, "global_step": 131925, "epoch": 3141} {"train_loss": -6.602078437805176, "global_step": 131926, "epoch": 3141} {"train_loss": -6.734190464019775, "global_step": 131927, "epoch": 3141} {"train_loss": -6.699265480041504, "global_step": 131928, "epoch": 3141} {"train_loss": -6.656503677368164, "global_step": 131929, "epoch": 3141} {"train_loss": -6.732235431671143, "global_step": 131930, "epoch": 3141} {"train_loss": -6.742036819458008, "global_step": 131931, "epoch": 3141} {"train_loss": -6.622623443603516, "global_step": 131932, "epoch": 3141} {"train_loss": -6.729626655578613, "global_step": 131933, "epoch": 3141} {"train_loss": -6.716617107391357, "global_step": 131934, "epoch": 3141} {"train_loss": -6.721836090087891, "global_step": 131935, "epoch": 3141} {"train_loss": -6.769536018371582, "global_step": 131936, "epoch": 3141} {"train_loss": -6.722250938415527, "global_step": 131937, "epoch": 3141} {"train_loss": -6.719623565673828, "global_step": 131938, "epoch": 3141} {"train_loss": -6.778242588043213, "global_step": 131939, "epoch": 3141} {"train_loss": -6.713285446166992, "global_step": 131940, "epoch": 3141} {"train_loss": -6.773193359375, "global_step": 131941, "epoch": 3141} {"train_loss": -6.765902519226074, "global_step": 131942, "epoch": 3141} {"train_loss": -6.669005393981934, "global_step": 131943, "epoch": 3141} {"train_loss": -6.6793317794799805, "global_step": 131944, "epoch": 3141} {"train_loss": -6.6705546379089355, "global_step": 131945, "epoch": 3141} {"train_loss": -6.704471588134766, "global_step": 131946, "epoch": 3141} {"train_loss": -6.854292392730713, "global_step": 131947, "epoch": 3141} {"train_loss": -6.70286750793457, "global_step": 131948, "epoch": 3141} {"train_loss": -6.533249855041504, "global_step": 131949, "epoch": 3141} {"train_loss": -6.714239597320557, "global_step": 131950, "epoch": 3141} {"train_loss": -6.679415702819824, "global_step": 131951, "epoch": 3141} {"train_loss": -6.572844505310059, "global_step": 131952, "epoch": 3141} {"train_loss": -6.624661445617676, "global_step": 131953, "epoch": 3141} {"train_loss": -6.678852081298828, "global_step": 131954, "epoch": 3141} {"train_loss": -6.640599250793457, "global_step": 131955, "epoch": 3141} {"train_loss": -6.655061721801758, "global_step": 131956, "epoch": 3141} {"train_loss": -6.755094051361084, "global_step": 131957, "epoch": 3141} {"train_loss": -6.708473205566406, "global_step": 131958, "epoch": 3141} {"train_loss": -6.67703104019165, "global_step": 131959, "epoch": 3141} {"train_loss": -6.776653289794922, "global_step": 131960, "epoch": 3141} {"train_loss": -6.756148338317871, "global_step": 131961, "epoch": 3141} {"train_loss": -6.681419849395752, "global_step": 131962, "epoch": 3141} {"train_loss": -6.699145112718854, "global_step": 131963, "epoch": 3141, "val_loss": 77375.9609375} {"train_loss": -6.819304466247559, "global_step": 131964, "epoch": 3142} {"train_loss": -6.6722517013549805, "global_step": 131965, "epoch": 3142} {"train_loss": -6.6499857902526855, "global_step": 131966, "epoch": 3142} {"train_loss": -6.742392539978027, "global_step": 131967, "epoch": 3142} {"train_loss": -6.774139404296875, "global_step": 131968, "epoch": 3142} {"train_loss": -6.7307844161987305, "global_step": 131969, "epoch": 3142} {"train_loss": -6.701279640197754, "global_step": 131970, "epoch": 3142} {"train_loss": -6.720684051513672, "global_step": 131971, "epoch": 3142} {"train_loss": -6.662502765655518, "global_step": 131972, "epoch": 3142} {"train_loss": -6.638286113739014, "global_step": 131973, "epoch": 3142} {"train_loss": -6.706210136413574, "global_step": 131974, "epoch": 3142} {"train_loss": -6.6360883712768555, "global_step": 131975, "epoch": 3142} {"train_loss": -6.822567939758301, "global_step": 131976, "epoch": 3142} {"train_loss": -6.7239556312561035, "global_step": 131977, "epoch": 3142} {"train_loss": -6.628939151763916, "global_step": 131978, "epoch": 3142} {"train_loss": -6.770235538482666, "global_step": 131979, "epoch": 3142} {"train_loss": -6.63096809387207, "global_step": 131980, "epoch": 3142} {"train_loss": -6.713811874389648, "global_step": 131981, "epoch": 3142} {"train_loss": -6.629543781280518, "global_step": 131982, "epoch": 3142} {"train_loss": -6.673334121704102, "global_step": 131983, "epoch": 3142} {"train_loss": -6.663971900939941, "global_step": 131984, "epoch": 3142} {"train_loss": -6.749342441558838, "global_step": 131985, "epoch": 3142} {"train_loss": -6.699347496032715, "global_step": 131986, "epoch": 3142} {"train_loss": -6.600469589233398, "global_step": 131987, "epoch": 3142} {"train_loss": -6.514798164367676, "global_step": 131988, "epoch": 3142} {"train_loss": -6.631933212280273, "global_step": 131989, "epoch": 3142} {"train_loss": -6.624381065368652, "global_step": 131990, "epoch": 3142} {"train_loss": -6.688828468322754, "global_step": 131991, "epoch": 3142} {"train_loss": -6.577436923980713, "global_step": 131992, "epoch": 3142} {"train_loss": -6.6900811195373535, "global_step": 131993, "epoch": 3142} {"train_loss": -6.70723295211792, "global_step": 131994, "epoch": 3142} {"train_loss": -6.593873500823975, "global_step": 131995, "epoch": 3142} {"train_loss": -6.658689975738525, "global_step": 131996, "epoch": 3142} {"train_loss": -6.763307094573975, "global_step": 131997, "epoch": 3142} {"train_loss": -6.77897834777832, "global_step": 131998, "epoch": 3142} {"train_loss": -6.683551788330078, "global_step": 131999, "epoch": 3142} {"train_loss": -6.7149858474731445, "global_step": 132000, "epoch": 3142} {"train_loss": -6.770966529846191, "global_step": 132001, "epoch": 3142} {"train_loss": -6.6392011642456055, "global_step": 132002, "epoch": 3142} {"train_loss": -6.719287872314453, "global_step": 132003, "epoch": 3142} {"train_loss": -6.743830680847168, "global_step": 132004, "epoch": 3142} {"train_loss": -6.688822632744198, "global_step": 132005, "epoch": 3142, "val_loss": 77665.0390625} {"train_loss": -6.733123302459717, "global_step": 132006, "epoch": 3143} {"train_loss": -6.647225856781006, "global_step": 132007, "epoch": 3143} {"train_loss": -6.648697376251221, "global_step": 132008, "epoch": 3143} {"train_loss": -6.863315582275391, "global_step": 132009, "epoch": 3143} {"train_loss": -6.738968849182129, "global_step": 132010, "epoch": 3143} {"train_loss": -6.659085273742676, "global_step": 132011, "epoch": 3143} {"train_loss": -6.802602767944336, "global_step": 132012, "epoch": 3143} {"train_loss": -6.650368690490723, "global_step": 132013, "epoch": 3143} {"train_loss": -6.638401031494141, "global_step": 132014, "epoch": 3143} {"train_loss": -6.713966369628906, "global_step": 132015, "epoch": 3143} {"train_loss": -6.7209577560424805, "global_step": 132016, "epoch": 3143} {"train_loss": -6.769064903259277, "global_step": 132017, "epoch": 3143} {"train_loss": -6.611050605773926, "global_step": 132018, "epoch": 3143} {"train_loss": -6.812981605529785, "global_step": 132019, "epoch": 3143} {"train_loss": -6.74098539352417, "global_step": 132020, "epoch": 3143} {"train_loss": -6.770349502563477, "global_step": 132021, "epoch": 3143} {"train_loss": -6.739538192749023, "global_step": 132022, "epoch": 3143} {"train_loss": -6.779329299926758, "global_step": 132023, "epoch": 3143} {"train_loss": -6.706783294677734, "global_step": 132024, "epoch": 3143} {"train_loss": -6.565104961395264, "global_step": 132025, "epoch": 3143} {"train_loss": -6.70565128326416, "global_step": 132026, "epoch": 3143} {"train_loss": -6.689514636993408, "global_step": 132027, "epoch": 3143} {"train_loss": -6.805683135986328, "global_step": 132028, "epoch": 3143} {"train_loss": -6.69050407409668, "global_step": 132029, "epoch": 3143} {"train_loss": -6.728663444519043, "global_step": 132030, "epoch": 3143} {"train_loss": -6.744261264801025, "global_step": 132031, "epoch": 3143} {"train_loss": -6.74971342086792, "global_step": 132032, "epoch": 3143} {"train_loss": -6.745964050292969, "global_step": 132033, "epoch": 3143} {"train_loss": -6.780012130737305, "global_step": 132034, "epoch": 3143} {"train_loss": -6.732975006103516, "global_step": 132035, "epoch": 3143} {"train_loss": -6.738114356994629, "global_step": 132036, "epoch": 3143} {"train_loss": -6.642495632171631, "global_step": 132037, "epoch": 3143} {"train_loss": -6.690428733825684, "global_step": 132038, "epoch": 3143} {"train_loss": -6.70875358581543, "global_step": 132039, "epoch": 3143} {"train_loss": -6.623696327209473, "global_step": 132040, "epoch": 3143} {"train_loss": -6.751802921295166, "global_step": 132041, "epoch": 3143} {"train_loss": -6.693070411682129, "global_step": 132042, "epoch": 3143} {"train_loss": -6.680810928344727, "global_step": 132043, "epoch": 3143} {"train_loss": -6.755826473236084, "global_step": 132044, "epoch": 3143} {"train_loss": -6.590935230255127, "global_step": 132045, "epoch": 3143} {"train_loss": -6.696292877197266, "global_step": 132046, "epoch": 3143} {"train_loss": -6.710327046258109, "global_step": 132047, "epoch": 3143, "val_loss": 77743.0390625} {"train_loss": -6.7771897315979, "global_step": 132048, "epoch": 3144} {"train_loss": -6.629941940307617, "global_step": 132049, "epoch": 3144} {"train_loss": -6.760149002075195, "global_step": 132050, "epoch": 3144} {"train_loss": -6.710629463195801, "global_step": 132051, "epoch": 3144} {"train_loss": -6.7365875244140625, "global_step": 132052, "epoch": 3144} {"train_loss": -6.672181129455566, "global_step": 132053, "epoch": 3144} {"train_loss": -6.656464576721191, "global_step": 132054, "epoch": 3144} {"train_loss": -6.762485504150391, "global_step": 132055, "epoch": 3144} {"train_loss": -6.608356475830078, "global_step": 132056, "epoch": 3144} {"train_loss": -6.717428207397461, "global_step": 132057, "epoch": 3144} {"train_loss": -6.614425182342529, "global_step": 132058, "epoch": 3144} {"train_loss": -6.589008331298828, "global_step": 132059, "epoch": 3144} {"train_loss": -6.681408882141113, "global_step": 132060, "epoch": 3144} {"train_loss": -6.6997175216674805, "global_step": 132061, "epoch": 3144} {"train_loss": -6.596436500549316, "global_step": 132062, "epoch": 3144} {"train_loss": -6.76871395111084, "global_step": 132063, "epoch": 3144} {"train_loss": -6.670815467834473, "global_step": 132064, "epoch": 3144} {"train_loss": -6.640531063079834, "global_step": 132065, "epoch": 3144} {"train_loss": -6.607378005981445, "global_step": 132066, "epoch": 3144} {"train_loss": -6.68231201171875, "global_step": 132067, "epoch": 3144} {"train_loss": -6.7152276039123535, "global_step": 132068, "epoch": 3144} {"train_loss": -6.716824531555176, "global_step": 132069, "epoch": 3144} {"train_loss": -6.79827356338501, "global_step": 132070, "epoch": 3144} {"train_loss": -6.709738254547119, "global_step": 132071, "epoch": 3144} {"train_loss": -6.668530464172363, "global_step": 132072, "epoch": 3144} {"train_loss": -6.662600517272949, "global_step": 132073, "epoch": 3144} {"train_loss": -6.657507419586182, "global_step": 132074, "epoch": 3144} {"train_loss": -6.7090020179748535, "global_step": 132075, "epoch": 3144} {"train_loss": -6.6797990798950195, "global_step": 132076, "epoch": 3144} {"train_loss": -6.540833473205566, "global_step": 132077, "epoch": 3144} {"train_loss": -6.753105163574219, "global_step": 132078, "epoch": 3144} {"train_loss": -6.688331604003906, "global_step": 132079, "epoch": 3144} {"train_loss": -6.806035041809082, "global_step": 132080, "epoch": 3144} {"train_loss": -6.669229030609131, "global_step": 132081, "epoch": 3144} {"train_loss": -6.740542411804199, "global_step": 132082, "epoch": 3144} {"train_loss": -6.705443382263184, "global_step": 132083, "epoch": 3144} {"train_loss": -6.640446186065674, "global_step": 132084, "epoch": 3144} {"train_loss": -6.535921573638916, "global_step": 132085, "epoch": 3144} {"train_loss": -6.748047828674316, "global_step": 132086, "epoch": 3144} {"train_loss": -6.514759063720703, "global_step": 132087, "epoch": 3144} {"train_loss": -6.612105846405029, "global_step": 132088, "epoch": 3144} {"train_loss": -6.681327604112171, "global_step": 132089, "epoch": 3144, "val_loss": 77556.0390625} {"train_loss": -6.66736364364624, "global_step": 132090, "epoch": 3145} {"train_loss": -6.647461891174316, "global_step": 132091, "epoch": 3145} {"train_loss": -6.634880542755127, "global_step": 132092, "epoch": 3145} {"train_loss": -6.634932041168213, "global_step": 132093, "epoch": 3145} {"train_loss": -6.648560523986816, "global_step": 132094, "epoch": 3145} {"train_loss": -6.629806995391846, "global_step": 132095, "epoch": 3145} {"train_loss": -6.874114513397217, "global_step": 132096, "epoch": 3145} {"train_loss": -6.613002300262451, "global_step": 132097, "epoch": 3145} {"train_loss": -6.688634872436523, "global_step": 132098, "epoch": 3145} {"train_loss": -6.6965131759643555, "global_step": 132099, "epoch": 3145} {"train_loss": -6.708333969116211, "global_step": 132100, "epoch": 3145} {"train_loss": -6.77461051940918, "global_step": 132101, "epoch": 3145} {"train_loss": -6.8545331954956055, "global_step": 132102, "epoch": 3145} {"train_loss": -6.707493782043457, "global_step": 132103, "epoch": 3145} {"train_loss": -6.697504997253418, "global_step": 132104, "epoch": 3145} {"train_loss": -6.745903015136719, "global_step": 132105, "epoch": 3145} {"train_loss": -6.694342613220215, "global_step": 132106, "epoch": 3145} {"train_loss": -6.744569778442383, "global_step": 132107, "epoch": 3145} {"train_loss": -6.7210259437561035, "global_step": 132108, "epoch": 3145} {"train_loss": -6.66912841796875, "global_step": 132109, "epoch": 3145} {"train_loss": -6.781557083129883, "global_step": 132110, "epoch": 3145} {"train_loss": -6.793261528015137, "global_step": 132111, "epoch": 3145} {"train_loss": -6.754852294921875, "global_step": 132112, "epoch": 3145} {"train_loss": -6.653617858886719, "global_step": 132113, "epoch": 3145} {"train_loss": -6.778934478759766, "global_step": 132114, "epoch": 3145} {"train_loss": -6.669121742248535, "global_step": 132115, "epoch": 3145} {"train_loss": -6.687061309814453, "global_step": 132116, "epoch": 3145} {"train_loss": -6.778392791748047, "global_step": 132117, "epoch": 3145} {"train_loss": -6.667822360992432, "global_step": 132118, "epoch": 3145} {"train_loss": -6.646246910095215, "global_step": 132119, "epoch": 3145} {"train_loss": -6.561603546142578, "global_step": 132120, "epoch": 3145} {"train_loss": -6.7142534255981445, "global_step": 132121, "epoch": 3145} {"train_loss": -6.669939041137695, "global_step": 132122, "epoch": 3145} {"train_loss": -6.599301338195801, "global_step": 132123, "epoch": 3145} {"train_loss": -6.689189910888672, "global_step": 132124, "epoch": 3145} {"train_loss": -6.70797061920166, "global_step": 132125, "epoch": 3145} {"train_loss": -6.584985733032227, "global_step": 132126, "epoch": 3145} {"train_loss": -6.766918659210205, "global_step": 132127, "epoch": 3145} {"train_loss": -6.718152046203613, "global_step": 132128, "epoch": 3145} {"train_loss": -6.673341751098633, "global_step": 132129, "epoch": 3145} {"train_loss": -6.779510498046875, "global_step": 132130, "epoch": 3145} {"train_loss": -6.699534756796701, "global_step": 132131, "epoch": 3145, "val_loss": 77532.796875} {"train_loss": -6.697488784790039, "global_step": 132132, "epoch": 3146} {"train_loss": -6.7416157722473145, "global_step": 132133, "epoch": 3146} {"train_loss": -6.705308437347412, "global_step": 132134, "epoch": 3146} {"train_loss": -6.719466209411621, "global_step": 132135, "epoch": 3146} {"train_loss": -6.652392387390137, "global_step": 132136, "epoch": 3146} {"train_loss": -6.66424560546875, "global_step": 132137, "epoch": 3146} {"train_loss": -6.757923603057861, "global_step": 132138, "epoch": 3146} {"train_loss": -6.712495803833008, "global_step": 132139, "epoch": 3146} {"train_loss": -6.662164688110352, "global_step": 132140, "epoch": 3146} {"train_loss": -6.756609916687012, "global_step": 132141, "epoch": 3146} {"train_loss": -6.813302040100098, "global_step": 132142, "epoch": 3146} {"train_loss": -6.617679595947266, "global_step": 132143, "epoch": 3146} {"train_loss": -6.690221786499023, "global_step": 132144, "epoch": 3146} {"train_loss": -6.797866344451904, "global_step": 132145, "epoch": 3146} {"train_loss": -6.655194282531738, "global_step": 132146, "epoch": 3146} {"train_loss": -6.768708229064941, "global_step": 132147, "epoch": 3146} {"train_loss": -6.78231143951416, "global_step": 132148, "epoch": 3146} {"train_loss": -6.720669746398926, "global_step": 132149, "epoch": 3146} {"train_loss": -6.673043251037598, "global_step": 132150, "epoch": 3146} {"train_loss": -6.639821529388428, "global_step": 132151, "epoch": 3146} {"train_loss": -6.684632778167725, "global_step": 132152, "epoch": 3146} {"train_loss": -6.707871437072754, "global_step": 132153, "epoch": 3146} {"train_loss": -6.753013610839844, "global_step": 132154, "epoch": 3146} {"train_loss": -6.63805627822876, "global_step": 132155, "epoch": 3146} {"train_loss": -6.6858978271484375, "global_step": 132156, "epoch": 3146} {"train_loss": -6.684450626373291, "global_step": 132157, "epoch": 3146} {"train_loss": -6.570786476135254, "global_step": 132158, "epoch": 3146} {"train_loss": -6.507035255432129, "global_step": 132159, "epoch": 3146} {"train_loss": -6.567826747894287, "global_step": 132160, "epoch": 3146} {"train_loss": -6.658699035644531, "global_step": 132161, "epoch": 3146} {"train_loss": -6.655617713928223, "global_step": 132162, "epoch": 3146} {"train_loss": -6.525644302368164, "global_step": 132163, "epoch": 3146} {"train_loss": -6.6499176025390625, "global_step": 132164, "epoch": 3146} {"train_loss": -6.61778450012207, "global_step": 132165, "epoch": 3146} {"train_loss": -6.441679954528809, "global_step": 132166, "epoch": 3146} {"train_loss": -6.62924337387085, "global_step": 132167, "epoch": 3146} {"train_loss": -6.629903316497803, "global_step": 132168, "epoch": 3146} {"train_loss": -6.616007328033447, "global_step": 132169, "epoch": 3146} {"train_loss": -6.69378662109375, "global_step": 132170, "epoch": 3146} {"train_loss": -6.708542346954346, "global_step": 132171, "epoch": 3146} {"train_loss": -6.648624420166016, "global_step": 132172, "epoch": 3146} {"train_loss": -6.671521902084351, "global_step": 132173, "epoch": 3146, "val_loss": 77616.1953125} {"train_loss": -6.640871047973633, "global_step": 132174, "epoch": 3147} {"train_loss": -6.684430122375488, "global_step": 132175, "epoch": 3147} {"train_loss": -6.686878204345703, "global_step": 132176, "epoch": 3147} {"train_loss": -6.727403163909912, "global_step": 132177, "epoch": 3147} {"train_loss": -6.659095764160156, "global_step": 132178, "epoch": 3147} {"train_loss": -6.761697769165039, "global_step": 132179, "epoch": 3147} {"train_loss": -6.675671100616455, "global_step": 132180, "epoch": 3147} {"train_loss": -6.669299125671387, "global_step": 132181, "epoch": 3147} {"train_loss": -6.745421409606934, "global_step": 132182, "epoch": 3147} {"train_loss": -6.658411979675293, "global_step": 132183, "epoch": 3147} {"train_loss": -6.680253982543945, "global_step": 132184, "epoch": 3147} {"train_loss": -6.70114803314209, "global_step": 132185, "epoch": 3147} {"train_loss": -6.722311973571777, "global_step": 132186, "epoch": 3147} {"train_loss": -6.537479400634766, "global_step": 132187, "epoch": 3147} {"train_loss": -6.612737655639648, "global_step": 132188, "epoch": 3147} {"train_loss": -6.757987022399902, "global_step": 132189, "epoch": 3147} {"train_loss": -6.6957478523254395, "global_step": 132190, "epoch": 3147} {"train_loss": -6.773996829986572, "global_step": 132191, "epoch": 3147} {"train_loss": -6.633002758026123, "global_step": 132192, "epoch": 3147} {"train_loss": -6.732239723205566, "global_step": 132193, "epoch": 3147} {"train_loss": -6.690783977508545, "global_step": 132194, "epoch": 3147} {"train_loss": -6.552945137023926, "global_step": 132195, "epoch": 3147} {"train_loss": -6.680261611938477, "global_step": 132196, "epoch": 3147} {"train_loss": -6.615167617797852, "global_step": 132197, "epoch": 3147} {"train_loss": -6.612705707550049, "global_step": 132198, "epoch": 3147} {"train_loss": -6.580216407775879, "global_step": 132199, "epoch": 3147} {"train_loss": -6.696244716644287, "global_step": 132200, "epoch": 3147} {"train_loss": -6.591493129730225, "global_step": 132201, "epoch": 3147} {"train_loss": -6.743542194366455, "global_step": 132202, "epoch": 3147} {"train_loss": -6.694257736206055, "global_step": 132203, "epoch": 3147} {"train_loss": -6.694750785827637, "global_step": 132204, "epoch": 3147} {"train_loss": -6.611207962036133, "global_step": 132205, "epoch": 3147} {"train_loss": -6.6147918701171875, "global_step": 132206, "epoch": 3147} {"train_loss": -6.731457233428955, "global_step": 132207, "epoch": 3147} {"train_loss": -6.695098876953125, "global_step": 132208, "epoch": 3147} {"train_loss": -6.556887626647949, "global_step": 132209, "epoch": 3147} {"train_loss": -6.725564002990723, "global_step": 132210, "epoch": 3147} {"train_loss": -6.500734329223633, "global_step": 132211, "epoch": 3147} {"train_loss": -6.71024227142334, "global_step": 132212, "epoch": 3147} {"train_loss": -6.6143693923950195, "global_step": 132213, "epoch": 3147} {"train_loss": -6.7593913078308105, "global_step": 132214, "epoch": 3147} {"train_loss": -6.666574239730835, "global_step": 132215, "epoch": 3147, "val_loss": 78117.34375} {"train_loss": -6.5318603515625, "global_step": 132216, "epoch": 3148} {"train_loss": -6.677041053771973, "global_step": 132217, "epoch": 3148} {"train_loss": -6.636780738830566, "global_step": 132218, "epoch": 3148} {"train_loss": -6.6926727294921875, "global_step": 132219, "epoch": 3148} {"train_loss": -6.682028293609619, "global_step": 132220, "epoch": 3148} {"train_loss": -6.5952863693237305, "global_step": 132221, "epoch": 3148} {"train_loss": -6.648814678192139, "global_step": 132222, "epoch": 3148} {"train_loss": -6.687124252319336, "global_step": 132223, "epoch": 3148} {"train_loss": -6.717895030975342, "global_step": 132224, "epoch": 3148} {"train_loss": -6.730172157287598, "global_step": 132225, "epoch": 3148} {"train_loss": -6.734429359436035, "global_step": 132226, "epoch": 3148} {"train_loss": -6.823171615600586, "global_step": 132227, "epoch": 3148} {"train_loss": -6.725168704986572, "global_step": 132228, "epoch": 3148} {"train_loss": -6.686778545379639, "global_step": 132229, "epoch": 3148} {"train_loss": -6.826295852661133, "global_step": 132230, "epoch": 3148} {"train_loss": -6.725874423980713, "global_step": 132231, "epoch": 3148} {"train_loss": -6.701067924499512, "global_step": 132232, "epoch": 3148} {"train_loss": -6.694836616516113, "global_step": 132233, "epoch": 3148} {"train_loss": -6.7359418869018555, "global_step": 132234, "epoch": 3148} {"train_loss": -6.774536609649658, "global_step": 132235, "epoch": 3148} {"train_loss": -6.608612060546875, "global_step": 132236, "epoch": 3148} {"train_loss": -6.745142459869385, "global_step": 132237, "epoch": 3148} {"train_loss": -6.624249458312988, "global_step": 132238, "epoch": 3148} {"train_loss": -6.7325663566589355, "global_step": 132239, "epoch": 3148} {"train_loss": -6.711233139038086, "global_step": 132240, "epoch": 3148} {"train_loss": -6.669297218322754, "global_step": 132241, "epoch": 3148} {"train_loss": -6.658129692077637, "global_step": 132242, "epoch": 3148} {"train_loss": -6.722105979919434, "global_step": 132243, "epoch": 3148} {"train_loss": -6.561992645263672, "global_step": 132244, "epoch": 3148} {"train_loss": -6.705442905426025, "global_step": 132245, "epoch": 3148} {"train_loss": -6.7246904373168945, "global_step": 132246, "epoch": 3148} {"train_loss": -6.494846343994141, "global_step": 132247, "epoch": 3148} {"train_loss": -6.722264289855957, "global_step": 132248, "epoch": 3148} {"train_loss": -6.688166618347168, "global_step": 132249, "epoch": 3148} {"train_loss": -6.66336727142334, "global_step": 132250, "epoch": 3148} {"train_loss": -6.742280960083008, "global_step": 132251, "epoch": 3148} {"train_loss": -6.771608352661133, "global_step": 132252, "epoch": 3148} {"train_loss": -6.840145587921143, "global_step": 132253, "epoch": 3148} {"train_loss": -6.748518943786621, "global_step": 132254, "epoch": 3148} {"train_loss": -6.8103532791137695, "global_step": 132255, "epoch": 3148} {"train_loss": -6.7828779220581055, "global_step": 132256, "epoch": 3148} {"train_loss": -6.701301154636202, "global_step": 132257, "epoch": 3148, "val_loss": 77529.3671875} {"train_loss": -6.700734615325928, "global_step": 132258, "epoch": 3149} {"train_loss": -6.701026439666748, "global_step": 132259, "epoch": 3149} {"train_loss": -6.779345512390137, "global_step": 132260, "epoch": 3149} {"train_loss": -6.66142463684082, "global_step": 132261, "epoch": 3149} {"train_loss": -6.690390586853027, "global_step": 132262, "epoch": 3149} {"train_loss": -6.836931228637695, "global_step": 132263, "epoch": 3149} {"train_loss": -6.718193054199219, "global_step": 132264, "epoch": 3149} {"train_loss": -6.628543853759766, "global_step": 132265, "epoch": 3149} {"train_loss": -6.836582183837891, "global_step": 132266, "epoch": 3149} {"train_loss": -6.69631290435791, "global_step": 132267, "epoch": 3149} {"train_loss": -6.7571282386779785, "global_step": 132268, "epoch": 3149} {"train_loss": -6.723349571228027, "global_step": 132269, "epoch": 3149} {"train_loss": -6.764194488525391, "global_step": 132270, "epoch": 3149} {"train_loss": -6.721026420593262, "global_step": 132271, "epoch": 3149} {"train_loss": -6.660974025726318, "global_step": 132272, "epoch": 3149} {"train_loss": -6.658921241760254, "global_step": 132273, "epoch": 3149} {"train_loss": -6.667279243469238, "global_step": 132274, "epoch": 3149} {"train_loss": -6.738502025604248, "global_step": 132275, "epoch": 3149} {"train_loss": -6.693933486938477, "global_step": 132276, "epoch": 3149} {"train_loss": -6.692979335784912, "global_step": 132277, "epoch": 3149} {"train_loss": -6.713601112365723, "global_step": 132278, "epoch": 3149} {"train_loss": -6.7012176513671875, "global_step": 132279, "epoch": 3149} {"train_loss": -6.744706630706787, "global_step": 132280, "epoch": 3149} {"train_loss": -6.738735198974609, "global_step": 132281, "epoch": 3149} {"train_loss": -6.652709484100342, "global_step": 132282, "epoch": 3149} {"train_loss": -6.687747478485107, "global_step": 132283, "epoch": 3149} {"train_loss": -6.762972831726074, "global_step": 132284, "epoch": 3149} {"train_loss": -6.801975250244141, "global_step": 132285, "epoch": 3149} {"train_loss": -6.706398010253906, "global_step": 132286, "epoch": 3149} {"train_loss": -6.732931137084961, "global_step": 132287, "epoch": 3149} {"train_loss": -6.658225059509277, "global_step": 132288, "epoch": 3149} {"train_loss": -6.74713134765625, "global_step": 132289, "epoch": 3149} {"train_loss": -6.854427337646484, "global_step": 132290, "epoch": 3149} {"train_loss": -6.863579750061035, "global_step": 132291, "epoch": 3149} {"train_loss": -6.77432918548584, "global_step": 132292, "epoch": 3149} {"train_loss": -6.6965837478637695, "global_step": 132293, "epoch": 3149} {"train_loss": -6.733031749725342, "global_step": 132294, "epoch": 3149} {"train_loss": -6.639606475830078, "global_step": 132295, "epoch": 3149} {"train_loss": -6.664322853088379, "global_step": 132296, "epoch": 3149} {"train_loss": -6.895620346069336, "global_step": 132297, "epoch": 3149} {"train_loss": -6.67037296295166, "global_step": 132298, "epoch": 3149} {"train_loss": -6.7240803355262395, "global_step": 132299, "epoch": 3149, "val_loss": 77609.328125} {"train_loss": -6.727625370025635, "global_step": 132300, "epoch": 3150} {"train_loss": -6.616230010986328, "global_step": 132301, "epoch": 3150} {"train_loss": -6.821623802185059, "global_step": 132302, "epoch": 3150} {"train_loss": -6.7190961837768555, "global_step": 132303, "epoch": 3150} {"train_loss": -6.547496795654297, "global_step": 132304, "epoch": 3150} {"train_loss": -6.7950544357299805, "global_step": 132305, "epoch": 3150} {"train_loss": -6.764346122741699, "global_step": 132306, "epoch": 3150} {"train_loss": -6.767631530761719, "global_step": 132307, "epoch": 3150} {"train_loss": -6.579416751861572, "global_step": 132308, "epoch": 3150} {"train_loss": -6.698146343231201, "global_step": 132309, "epoch": 3150} {"train_loss": -6.632880210876465, "global_step": 132310, "epoch": 3150} {"train_loss": -6.623564720153809, "global_step": 132311, "epoch": 3150} {"train_loss": -6.692089080810547, "global_step": 132312, "epoch": 3150} {"train_loss": -6.77265739440918, "global_step": 132313, "epoch": 3150} {"train_loss": -6.600820064544678, "global_step": 132314, "epoch": 3150} {"train_loss": -6.637981414794922, "global_step": 132315, "epoch": 3150} {"train_loss": -6.690921783447266, "global_step": 132316, "epoch": 3150} {"train_loss": -6.713582992553711, "global_step": 132317, "epoch": 3150} {"train_loss": -6.583076477050781, "global_step": 132318, "epoch": 3150} {"train_loss": -6.725540637969971, "global_step": 132319, "epoch": 3150} {"train_loss": -6.625615119934082, "global_step": 132320, "epoch": 3150} {"train_loss": -6.763336181640625, "global_step": 132321, "epoch": 3150} {"train_loss": -6.704689979553223, "global_step": 132322, "epoch": 3150} {"train_loss": -6.544920921325684, "global_step": 132323, "epoch": 3150} {"train_loss": -6.668519973754883, "global_step": 132324, "epoch": 3150} {"train_loss": -6.652508735656738, "global_step": 132325, "epoch": 3150} {"train_loss": -6.68353796005249, "global_step": 132326, "epoch": 3150} {"train_loss": -6.524219989776611, "global_step": 132327, "epoch": 3150} {"train_loss": -6.7212114334106445, "global_step": 132328, "epoch": 3150} {"train_loss": -6.6507086753845215, "global_step": 132329, "epoch": 3150} {"train_loss": -6.727613925933838, "global_step": 132330, "epoch": 3150} {"train_loss": -6.69366455078125, "global_step": 132331, "epoch": 3150} {"train_loss": -6.67315149307251, "global_step": 132332, "epoch": 3150} {"train_loss": -6.622503280639648, "global_step": 132333, "epoch": 3150} {"train_loss": -6.735231399536133, "global_step": 132334, "epoch": 3150} {"train_loss": -6.683823585510254, "global_step": 132335, "epoch": 3150} {"train_loss": -6.738563060760498, "global_step": 132336, "epoch": 3150} {"train_loss": -6.699135780334473, "global_step": 132337, "epoch": 3150} {"train_loss": -6.740548133850098, "global_step": 132338, "epoch": 3150} {"train_loss": -6.715895652770996, "global_step": 132339, "epoch": 3150} {"train_loss": -6.686886310577393, "global_step": 132340, "epoch": 3150} {"train_loss": -6.683934211730957, "global_step": 132341, "epoch": 3150, "train/sim_max_reward_0": 0.4405711090456806, "train/sim_max_reward_1": 0.9273244015378487, "train/sim_max_reward_2": 0.3322889159291775, "train/sim_max_reward_3": 0.1490670198011448, "train/sim_max_reward_4": 0.48378851580426796, "train/sim_max_reward_5": 0.5516045044124825, "test/sim_max_reward_4500000": 0.909589321951339, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.872710159065422, "test/sim_max_reward_4500003": 0.9634934254817972, "test/sim_max_reward_4500004": 0.12271252978649656, "test/sim_max_reward_4500005": 0.25298889024697824, "test/sim_max_reward_4500006": 0.9607181519173087, "test/sim_max_reward_4500007": 0.7068075920655816, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.9143203874842473, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9671908251586424, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.01811945662068588, "test/sim_max_reward_4500014": 0.9331186039982577, "test/sim_max_reward_4500015": 0.4379120414676373, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.04029250086479049, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.39496762743265895, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.8191512824430031, "test/sim_max_reward_4500023": 0.9194628106623761, "test/sim_max_reward_4500024": 0.8906257017678941, "test/sim_max_reward_4500025": 0.6853440980778214, "test/sim_max_reward_4500026": 0.9837330937796208, "test/sim_max_reward_4500027": 0.9766079665441645, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.055668137068927474, "test/sim_max_reward_4500030": 0.9107545096275711, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05063847605487027, "test/sim_max_reward_4500033": 0.9124308762452774, "test/sim_max_reward_4500034": 0.8641735379878609, "test/sim_max_reward_4500035": 0.9364504734528627, "test/sim_max_reward_4500036": 0.39373429009160055, "test/sim_max_reward_4500037": 0.9668817529245984, "test/sim_max_reward_4500038": 0.3399822848946309, "test/sim_max_reward_4500039": 0.933190933937348, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.9490506205471666, "test/sim_max_reward_4500042": 0.03810604852951723, "test/sim_max_reward_4500043": 0.3419062903475574, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.8007764663121272, "test/sim_max_reward_4500046": 0.7494906222151186, "test/sim_max_reward_4500047": 0.9544799303043451, "test/sim_max_reward_4500048": 0.979645396961923, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.4807740777551004, "test/mean_score": 0.5835077676054274, "val_loss": 77823.7109375} {"train_loss": -6.569424629211426, "global_step": 132342, "epoch": 3151} {"train_loss": -6.72472620010376, "global_step": 132343, "epoch": 3151} {"train_loss": -6.649625778198242, "global_step": 132344, "epoch": 3151} {"train_loss": -6.714938163757324, "global_step": 132345, "epoch": 3151} {"train_loss": -6.718826770782471, "global_step": 132346, "epoch": 3151} {"train_loss": -6.777017116546631, "global_step": 132347, "epoch": 3151} {"train_loss": -6.592921257019043, "global_step": 132348, "epoch": 3151} {"train_loss": -6.747856616973877, "global_step": 132349, "epoch": 3151} {"train_loss": -6.798890113830566, "global_step": 132350, "epoch": 3151} {"train_loss": -6.603001117706299, "global_step": 132351, "epoch": 3151} {"train_loss": -6.786830902099609, "global_step": 132352, "epoch": 3151} {"train_loss": -6.801164627075195, "global_step": 132353, "epoch": 3151} {"train_loss": -6.637460708618164, "global_step": 132354, "epoch": 3151} {"train_loss": -6.581319808959961, "global_step": 132355, "epoch": 3151} {"train_loss": -6.689861297607422, "global_step": 132356, "epoch": 3151} {"train_loss": -6.714545249938965, "global_step": 132357, "epoch": 3151} {"train_loss": -6.686697006225586, "global_step": 132358, "epoch": 3151} {"train_loss": -6.805784225463867, "global_step": 132359, "epoch": 3151} {"train_loss": -6.834945201873779, "global_step": 132360, "epoch": 3151} {"train_loss": -6.703410625457764, "global_step": 132361, "epoch": 3151} {"train_loss": -6.805727958679199, "global_step": 132362, "epoch": 3151} {"train_loss": -6.81703519821167, "global_step": 132363, "epoch": 3151} {"train_loss": -6.656599998474121, "global_step": 132364, "epoch": 3151} {"train_loss": -6.6617889404296875, "global_step": 132365, "epoch": 3151} {"train_loss": -6.7607831954956055, "global_step": 132366, "epoch": 3151} {"train_loss": -6.5403852462768555, "global_step": 132367, "epoch": 3151} {"train_loss": -6.675664901733398, "global_step": 132368, "epoch": 3151} {"train_loss": -6.738000392913818, "global_step": 132369, "epoch": 3151} {"train_loss": -6.7869553565979, "global_step": 132370, "epoch": 3151} {"train_loss": -6.807967662811279, "global_step": 132371, "epoch": 3151} {"train_loss": -6.759215354919434, "global_step": 132372, "epoch": 3151} {"train_loss": -6.624387741088867, "global_step": 132373, "epoch": 3151} {"train_loss": -6.6851806640625, "global_step": 132374, "epoch": 3151} {"train_loss": -6.739418029785156, "global_step": 132375, "epoch": 3151} {"train_loss": -6.724806308746338, "global_step": 132376, "epoch": 3151} {"train_loss": -6.6336236000061035, "global_step": 132377, "epoch": 3151} {"train_loss": -6.556981086730957, "global_step": 132378, "epoch": 3151} {"train_loss": -6.607151985168457, "global_step": 132379, "epoch": 3151} {"train_loss": -6.610123634338379, "global_step": 132380, "epoch": 3151} {"train_loss": -6.53577184677124, "global_step": 132381, "epoch": 3151} {"train_loss": -6.7054548263549805, "global_step": 132382, "epoch": 3151} {"train_loss": -6.695306130817959, "global_step": 132383, "epoch": 3151, "val_loss": 77144.4453125} {"train_loss": -6.728764057159424, "global_step": 132384, "epoch": 3152} {"train_loss": -6.657649040222168, "global_step": 132385, "epoch": 3152} {"train_loss": -6.747846603393555, "global_step": 132386, "epoch": 3152} {"train_loss": -6.674371719360352, "global_step": 132387, "epoch": 3152} {"train_loss": -6.706473350524902, "global_step": 132388, "epoch": 3152} {"train_loss": -6.571353435516357, "global_step": 132389, "epoch": 3152} {"train_loss": -6.684491157531738, "global_step": 132390, "epoch": 3152} {"train_loss": -6.570416450500488, "global_step": 132391, "epoch": 3152} {"train_loss": -6.705859184265137, "global_step": 132392, "epoch": 3152} {"train_loss": -6.694725036621094, "global_step": 132393, "epoch": 3152} {"train_loss": -6.565998554229736, "global_step": 132394, "epoch": 3152} {"train_loss": -6.632900238037109, "global_step": 132395, "epoch": 3152} {"train_loss": -6.642446517944336, "global_step": 132396, "epoch": 3152} {"train_loss": -6.618870735168457, "global_step": 132397, "epoch": 3152} {"train_loss": -6.746973037719727, "global_step": 132398, "epoch": 3152} {"train_loss": -6.76580810546875, "global_step": 132399, "epoch": 3152} {"train_loss": -6.55784273147583, "global_step": 132400, "epoch": 3152} {"train_loss": -6.600327968597412, "global_step": 132401, "epoch": 3152} {"train_loss": -6.674951553344727, "global_step": 132402, "epoch": 3152} {"train_loss": -6.639626502990723, "global_step": 132403, "epoch": 3152} {"train_loss": -6.621960639953613, "global_step": 132404, "epoch": 3152} {"train_loss": -6.580505847930908, "global_step": 132405, "epoch": 3152} {"train_loss": -6.620373725891113, "global_step": 132406, "epoch": 3152} {"train_loss": -6.623376369476318, "global_step": 132407, "epoch": 3152} {"train_loss": -6.753235816955566, "global_step": 132408, "epoch": 3152} {"train_loss": -6.601511001586914, "global_step": 132409, "epoch": 3152} {"train_loss": -6.667832374572754, "global_step": 132410, "epoch": 3152} {"train_loss": -6.796329021453857, "global_step": 132411, "epoch": 3152} {"train_loss": -6.717845439910889, "global_step": 132412, "epoch": 3152} {"train_loss": -6.720099449157715, "global_step": 132413, "epoch": 3152} {"train_loss": -6.757378578186035, "global_step": 132414, "epoch": 3152} {"train_loss": -6.672695159912109, "global_step": 132415, "epoch": 3152} {"train_loss": -6.745560646057129, "global_step": 132416, "epoch": 3152} {"train_loss": -6.693119525909424, "global_step": 132417, "epoch": 3152} {"train_loss": -6.632420539855957, "global_step": 132418, "epoch": 3152} {"train_loss": -6.68977689743042, "global_step": 132419, "epoch": 3152} {"train_loss": -6.712378978729248, "global_step": 132420, "epoch": 3152} {"train_loss": -6.622562408447266, "global_step": 132421, "epoch": 3152} {"train_loss": -6.6534552574157715, "global_step": 132422, "epoch": 3152} {"train_loss": -6.680659294128418, "global_step": 132423, "epoch": 3152} {"train_loss": -6.57628870010376, "global_step": 132424, "epoch": 3152} {"train_loss": -6.6660289991469615, "global_step": 132425, "epoch": 3152, "val_loss": 77653.0390625} {"train_loss": -6.730785369873047, "global_step": 132426, "epoch": 3153} {"train_loss": -6.612098693847656, "global_step": 132427, "epoch": 3153} {"train_loss": -6.611572742462158, "global_step": 132428, "epoch": 3153} {"train_loss": -6.58137845993042, "global_step": 132429, "epoch": 3153} {"train_loss": -6.6793131828308105, "global_step": 132430, "epoch": 3153} {"train_loss": -6.63555908203125, "global_step": 132431, "epoch": 3153} {"train_loss": -6.686814785003662, "global_step": 132432, "epoch": 3153} {"train_loss": -6.702150344848633, "global_step": 132433, "epoch": 3153} {"train_loss": -6.608676910400391, "global_step": 132434, "epoch": 3153} {"train_loss": -6.732461452484131, "global_step": 132435, "epoch": 3153} {"train_loss": -6.77777624130249, "global_step": 132436, "epoch": 3153} {"train_loss": -6.69183349609375, "global_step": 132437, "epoch": 3153} {"train_loss": -6.737133026123047, "global_step": 132438, "epoch": 3153} {"train_loss": -6.596568584442139, "global_step": 132439, "epoch": 3153} {"train_loss": -6.688584327697754, "global_step": 132440, "epoch": 3153} {"train_loss": -6.730775833129883, "global_step": 132441, "epoch": 3153} {"train_loss": -6.618652820587158, "global_step": 132442, "epoch": 3153} {"train_loss": -6.649497985839844, "global_step": 132443, "epoch": 3153} {"train_loss": -6.670157432556152, "global_step": 132444, "epoch": 3153} {"train_loss": -6.711917877197266, "global_step": 132445, "epoch": 3153} {"train_loss": -6.679006576538086, "global_step": 132446, "epoch": 3153} {"train_loss": -6.68601131439209, "global_step": 132447, "epoch": 3153} {"train_loss": -6.769114017486572, "global_step": 132448, "epoch": 3153} {"train_loss": -6.629639625549316, "global_step": 132449, "epoch": 3153} {"train_loss": -6.702498912811279, "global_step": 132450, "epoch": 3153} {"train_loss": -6.7991743087768555, "global_step": 132451, "epoch": 3153} {"train_loss": -6.72512674331665, "global_step": 132452, "epoch": 3153} {"train_loss": -6.642851829528809, "global_step": 132453, "epoch": 3153} {"train_loss": -6.742371082305908, "global_step": 132454, "epoch": 3153} {"train_loss": -6.742767333984375, "global_step": 132455, "epoch": 3153} {"train_loss": -6.644802093505859, "global_step": 132456, "epoch": 3153} {"train_loss": -6.720890522003174, "global_step": 132457, "epoch": 3153} {"train_loss": -6.682085037231445, "global_step": 132458, "epoch": 3153} {"train_loss": -6.796935081481934, "global_step": 132459, "epoch": 3153} {"train_loss": -6.753273010253906, "global_step": 132460, "epoch": 3153} {"train_loss": -6.723103046417236, "global_step": 132461, "epoch": 3153} {"train_loss": -6.700019836425781, "global_step": 132462, "epoch": 3153} {"train_loss": -6.718680381774902, "global_step": 132463, "epoch": 3153} {"train_loss": -6.851683616638184, "global_step": 132464, "epoch": 3153} {"train_loss": -6.691058158874512, "global_step": 132465, "epoch": 3153} {"train_loss": -6.656412124633789, "global_step": 132466, "epoch": 3153} {"train_loss": -6.694551944732666, "global_step": 132467, "epoch": 3153, "val_loss": 77562.4765625} {"train_loss": -6.793223857879639, "global_step": 132468, "epoch": 3154} {"train_loss": -6.730106353759766, "global_step": 132469, "epoch": 3154} {"train_loss": -6.767099857330322, "global_step": 132470, "epoch": 3154} {"train_loss": -6.7641825675964355, "global_step": 132471, "epoch": 3154} {"train_loss": -6.76785945892334, "global_step": 132472, "epoch": 3154} {"train_loss": -6.612789630889893, "global_step": 132473, "epoch": 3154} {"train_loss": -6.716122627258301, "global_step": 132474, "epoch": 3154} {"train_loss": -6.799160480499268, "global_step": 132475, "epoch": 3154} {"train_loss": -6.770267486572266, "global_step": 132476, "epoch": 3154} {"train_loss": -6.705558776855469, "global_step": 132477, "epoch": 3154} {"train_loss": -6.754979610443115, "global_step": 132478, "epoch": 3154} {"train_loss": -6.732369899749756, "global_step": 132479, "epoch": 3154} {"train_loss": -6.821681499481201, "global_step": 132480, "epoch": 3154} {"train_loss": -6.720404148101807, "global_step": 132481, "epoch": 3154} {"train_loss": -6.628125190734863, "global_step": 132482, "epoch": 3154} {"train_loss": -6.850518226623535, "global_step": 132483, "epoch": 3154} {"train_loss": -6.782434940338135, "global_step": 132484, "epoch": 3154} {"train_loss": -6.695302486419678, "global_step": 132485, "epoch": 3154} {"train_loss": -6.770502090454102, "global_step": 132486, "epoch": 3154} {"train_loss": -6.756319522857666, "global_step": 132487, "epoch": 3154} {"train_loss": -6.626446723937988, "global_step": 132488, "epoch": 3154} {"train_loss": -6.73397159576416, "global_step": 132489, "epoch": 3154} {"train_loss": -6.7530035972595215, "global_step": 132490, "epoch": 3154} {"train_loss": -6.851410865783691, "global_step": 132491, "epoch": 3154} {"train_loss": -6.7730255126953125, "global_step": 132492, "epoch": 3154} {"train_loss": -6.692069053649902, "global_step": 132493, "epoch": 3154} {"train_loss": -6.690037250518799, "global_step": 132494, "epoch": 3154} {"train_loss": -6.859218597412109, "global_step": 132495, "epoch": 3154} {"train_loss": -6.758580207824707, "global_step": 132496, "epoch": 3154} {"train_loss": -6.7520880699157715, "global_step": 132497, "epoch": 3154} {"train_loss": -6.6444292068481445, "global_step": 132498, "epoch": 3154} {"train_loss": -6.830160140991211, "global_step": 132499, "epoch": 3154} {"train_loss": -6.611173629760742, "global_step": 132500, "epoch": 3154} {"train_loss": -6.760003089904785, "global_step": 132501, "epoch": 3154} {"train_loss": -6.716383934020996, "global_step": 132502, "epoch": 3154} {"train_loss": -6.680453300476074, "global_step": 132503, "epoch": 3154} {"train_loss": -6.798630714416504, "global_step": 132504, "epoch": 3154} {"train_loss": -6.722234725952148, "global_step": 132505, "epoch": 3154} {"train_loss": -6.633472919464111, "global_step": 132506, "epoch": 3154} {"train_loss": -6.7307281494140625, "global_step": 132507, "epoch": 3154} {"train_loss": -6.745553970336914, "global_step": 132508, "epoch": 3154} {"train_loss": -6.735304798398699, "global_step": 132509, "epoch": 3154, "val_loss": 77583.2578125} {"train_loss": -6.595621585845947, "global_step": 132510, "epoch": 3155} {"train_loss": -6.822728157043457, "global_step": 132511, "epoch": 3155} {"train_loss": -6.653875827789307, "global_step": 132512, "epoch": 3155} {"train_loss": -6.827042102813721, "global_step": 132513, "epoch": 3155} {"train_loss": -6.799176216125488, "global_step": 132514, "epoch": 3155} {"train_loss": -6.630965709686279, "global_step": 132515, "epoch": 3155} {"train_loss": -6.745547294616699, "global_step": 132516, "epoch": 3155} {"train_loss": -6.583044052124023, "global_step": 132517, "epoch": 3155} {"train_loss": -6.583138465881348, "global_step": 132518, "epoch": 3155} {"train_loss": -6.863611221313477, "global_step": 132519, "epoch": 3155} {"train_loss": -6.617212295532227, "global_step": 132520, "epoch": 3155} {"train_loss": -6.609419822692871, "global_step": 132521, "epoch": 3155} {"train_loss": -6.678253173828125, "global_step": 132522, "epoch": 3155} {"train_loss": -6.770013809204102, "global_step": 132523, "epoch": 3155} {"train_loss": -6.716734886169434, "global_step": 132524, "epoch": 3155} {"train_loss": -6.738025665283203, "global_step": 132525, "epoch": 3155} {"train_loss": -6.715821266174316, "global_step": 132526, "epoch": 3155} {"train_loss": -6.644619941711426, "global_step": 132527, "epoch": 3155} {"train_loss": -6.580345630645752, "global_step": 132528, "epoch": 3155} {"train_loss": -6.720442771911621, "global_step": 132529, "epoch": 3155} {"train_loss": -6.643348693847656, "global_step": 132530, "epoch": 3155} {"train_loss": -6.730662822723389, "global_step": 132531, "epoch": 3155} {"train_loss": -6.6964640617370605, "global_step": 132532, "epoch": 3155} {"train_loss": -6.5279693603515625, "global_step": 132533, "epoch": 3155} {"train_loss": -6.575495719909668, "global_step": 132534, "epoch": 3155} {"train_loss": -6.533795356750488, "global_step": 132535, "epoch": 3155} {"train_loss": -6.5962910652160645, "global_step": 132536, "epoch": 3155} {"train_loss": -6.596554279327393, "global_step": 132537, "epoch": 3155} {"train_loss": -6.673975467681885, "global_step": 132538, "epoch": 3155} {"train_loss": -6.6475982666015625, "global_step": 132539, "epoch": 3155} {"train_loss": -6.631772994995117, "global_step": 132540, "epoch": 3155} {"train_loss": -6.608896255493164, "global_step": 132541, "epoch": 3155} {"train_loss": -6.698627471923828, "global_step": 132542, "epoch": 3155} {"train_loss": -6.788567543029785, "global_step": 132543, "epoch": 3155} {"train_loss": -6.632841110229492, "global_step": 132544, "epoch": 3155} {"train_loss": -6.711095333099365, "global_step": 132545, "epoch": 3155} {"train_loss": -6.718406677246094, "global_step": 132546, "epoch": 3155} {"train_loss": -6.697507858276367, "global_step": 132547, "epoch": 3155} {"train_loss": -6.746647834777832, "global_step": 132548, "epoch": 3155} {"train_loss": -6.704495906829834, "global_step": 132549, "epoch": 3155} {"train_loss": -6.74754524230957, "global_step": 132550, "epoch": 3155} {"train_loss": -6.6780463854471845, "global_step": 132551, "epoch": 3155, "val_loss": 77552.1796875} {"train_loss": -6.712013244628906, "global_step": 132552, "epoch": 3156} {"train_loss": -6.690810203552246, "global_step": 132553, "epoch": 3156} {"train_loss": -6.587385654449463, "global_step": 132554, "epoch": 3156} {"train_loss": -6.729008674621582, "global_step": 132555, "epoch": 3156} {"train_loss": -6.739165306091309, "global_step": 132556, "epoch": 3156} {"train_loss": -6.697772979736328, "global_step": 132557, "epoch": 3156} {"train_loss": -6.750729084014893, "global_step": 132558, "epoch": 3156} {"train_loss": -6.719459533691406, "global_step": 132559, "epoch": 3156} {"train_loss": -6.7118730545043945, "global_step": 132560, "epoch": 3156} {"train_loss": -6.731441497802734, "global_step": 132561, "epoch": 3156} {"train_loss": -6.73670768737793, "global_step": 132562, "epoch": 3156} {"train_loss": -6.690461158752441, "global_step": 132563, "epoch": 3156} {"train_loss": -6.71970796585083, "global_step": 132564, "epoch": 3156} {"train_loss": -6.680957317352295, "global_step": 132565, "epoch": 3156} {"train_loss": -6.640421390533447, "global_step": 132566, "epoch": 3156} {"train_loss": -6.617004871368408, "global_step": 132567, "epoch": 3156} {"train_loss": -6.583622455596924, "global_step": 132568, "epoch": 3156} {"train_loss": -6.765952110290527, "global_step": 132569, "epoch": 3156} {"train_loss": -6.691308975219727, "global_step": 132570, "epoch": 3156} {"train_loss": -6.629090785980225, "global_step": 132571, "epoch": 3156} {"train_loss": -6.714179039001465, "global_step": 132572, "epoch": 3156} {"train_loss": -6.607125759124756, "global_step": 132573, "epoch": 3156} {"train_loss": -6.632135391235352, "global_step": 132574, "epoch": 3156} {"train_loss": -6.7719268798828125, "global_step": 132575, "epoch": 3156} {"train_loss": -6.6956868171691895, "global_step": 132576, "epoch": 3156} {"train_loss": -6.769000053405762, "global_step": 132577, "epoch": 3156} {"train_loss": -6.704488754272461, "global_step": 132578, "epoch": 3156} {"train_loss": -6.72016716003418, "global_step": 132579, "epoch": 3156} {"train_loss": -6.632607936859131, "global_step": 132580, "epoch": 3156} {"train_loss": -6.687655448913574, "global_step": 132581, "epoch": 3156} {"train_loss": -6.720325469970703, "global_step": 132582, "epoch": 3156} {"train_loss": -6.787388801574707, "global_step": 132583, "epoch": 3156} {"train_loss": -6.640409469604492, "global_step": 132584, "epoch": 3156} {"train_loss": -6.640414714813232, "global_step": 132585, "epoch": 3156} {"train_loss": -6.632905960083008, "global_step": 132586, "epoch": 3156} {"train_loss": -6.677458763122559, "global_step": 132587, "epoch": 3156} {"train_loss": -6.643832683563232, "global_step": 132588, "epoch": 3156} {"train_loss": -6.624887466430664, "global_step": 132589, "epoch": 3156} {"train_loss": -6.686161994934082, "global_step": 132590, "epoch": 3156} {"train_loss": -6.692900657653809, "global_step": 132591, "epoch": 3156} {"train_loss": -6.5585856437683105, "global_step": 132592, "epoch": 3156} {"train_loss": -6.681493736448742, "global_step": 132593, "epoch": 3156, "val_loss": 77604.2890625} {"train_loss": -6.614386081695557, "global_step": 132594, "epoch": 3157} {"train_loss": -6.613256454467773, "global_step": 132595, "epoch": 3157} {"train_loss": -6.712597846984863, "global_step": 132596, "epoch": 3157} {"train_loss": -6.782258987426758, "global_step": 132597, "epoch": 3157} {"train_loss": -6.5996503829956055, "global_step": 132598, "epoch": 3157} {"train_loss": -6.639806747436523, "global_step": 132599, "epoch": 3157} {"train_loss": -6.7238359451293945, "global_step": 132600, "epoch": 3157} {"train_loss": -6.702897071838379, "global_step": 132601, "epoch": 3157} {"train_loss": -6.717365264892578, "global_step": 132602, "epoch": 3157} {"train_loss": -6.725622177124023, "global_step": 132603, "epoch": 3157} {"train_loss": -6.709053993225098, "global_step": 132604, "epoch": 3157} {"train_loss": -6.637636661529541, "global_step": 132605, "epoch": 3157} {"train_loss": -6.631330490112305, "global_step": 132606, "epoch": 3157} {"train_loss": -6.747097015380859, "global_step": 132607, "epoch": 3157} {"train_loss": -6.689343452453613, "global_step": 132608, "epoch": 3157} {"train_loss": -6.654603958129883, "global_step": 132609, "epoch": 3157} {"train_loss": -6.573378562927246, "global_step": 132610, "epoch": 3157} {"train_loss": -6.665925979614258, "global_step": 132611, "epoch": 3157} {"train_loss": -6.642332077026367, "global_step": 132612, "epoch": 3157} {"train_loss": -6.829042434692383, "global_step": 132613, "epoch": 3157} {"train_loss": -6.651669502258301, "global_step": 132614, "epoch": 3157} {"train_loss": -6.703023910522461, "global_step": 132615, "epoch": 3157} {"train_loss": -6.605477809906006, "global_step": 132616, "epoch": 3157} {"train_loss": -6.651074409484863, "global_step": 132617, "epoch": 3157} {"train_loss": -6.553389549255371, "global_step": 132618, "epoch": 3157} {"train_loss": -6.648883819580078, "global_step": 132619, "epoch": 3157} {"train_loss": -6.782752990722656, "global_step": 132620, "epoch": 3157} {"train_loss": -6.625072479248047, "global_step": 132621, "epoch": 3157} {"train_loss": -6.725192070007324, "global_step": 132622, "epoch": 3157} {"train_loss": -6.778316497802734, "global_step": 132623, "epoch": 3157} {"train_loss": -6.695258617401123, "global_step": 132624, "epoch": 3157} {"train_loss": -6.794773578643799, "global_step": 132625, "epoch": 3157} {"train_loss": -6.712308883666992, "global_step": 132626, "epoch": 3157} {"train_loss": -6.853330612182617, "global_step": 132627, "epoch": 3157} {"train_loss": -6.774328708648682, "global_step": 132628, "epoch": 3157} {"train_loss": -6.70205020904541, "global_step": 132629, "epoch": 3157} {"train_loss": -6.675063610076904, "global_step": 132630, "epoch": 3157} {"train_loss": -6.796263217926025, "global_step": 132631, "epoch": 3157} {"train_loss": -6.697575092315674, "global_step": 132632, "epoch": 3157} {"train_loss": -6.7080817222595215, "global_step": 132633, "epoch": 3157} {"train_loss": -6.720237731933594, "global_step": 132634, "epoch": 3157} {"train_loss": -6.696147226151966, "global_step": 132635, "epoch": 3157, "val_loss": 77385.0625} {"train_loss": -6.776933670043945, "global_step": 132636, "epoch": 3158} {"train_loss": -6.756982326507568, "global_step": 132637, "epoch": 3158} {"train_loss": -6.6926422119140625, "global_step": 132638, "epoch": 3158} {"train_loss": -6.8223443031311035, "global_step": 132639, "epoch": 3158} {"train_loss": -6.710379600524902, "global_step": 132640, "epoch": 3158} {"train_loss": -6.758103370666504, "global_step": 132641, "epoch": 3158} {"train_loss": -6.670338153839111, "global_step": 132642, "epoch": 3158} {"train_loss": -6.67714262008667, "global_step": 132643, "epoch": 3158} {"train_loss": -6.735734939575195, "global_step": 132644, "epoch": 3158} {"train_loss": -6.560092926025391, "global_step": 132645, "epoch": 3158} {"train_loss": -6.6769514083862305, "global_step": 132646, "epoch": 3158} {"train_loss": -6.7871551513671875, "global_step": 132647, "epoch": 3158} {"train_loss": -6.641636848449707, "global_step": 132648, "epoch": 3158} {"train_loss": -6.707891464233398, "global_step": 132649, "epoch": 3158} {"train_loss": -6.7134809494018555, "global_step": 132650, "epoch": 3158} {"train_loss": -6.678071975708008, "global_step": 132651, "epoch": 3158} {"train_loss": -6.628998756408691, "global_step": 132652, "epoch": 3158} {"train_loss": -6.6940155029296875, "global_step": 132653, "epoch": 3158} {"train_loss": -6.743098735809326, "global_step": 132654, "epoch": 3158} {"train_loss": -6.653997421264648, "global_step": 132655, "epoch": 3158} {"train_loss": -6.751808166503906, "global_step": 132656, "epoch": 3158} {"train_loss": -6.59079647064209, "global_step": 132657, "epoch": 3158} {"train_loss": -6.581962585449219, "global_step": 132658, "epoch": 3158} {"train_loss": -6.722133636474609, "global_step": 132659, "epoch": 3158} {"train_loss": -6.641765594482422, "global_step": 132660, "epoch": 3158} {"train_loss": -6.76396369934082, "global_step": 132661, "epoch": 3158} {"train_loss": -6.5701704025268555, "global_step": 132662, "epoch": 3158} {"train_loss": -6.589276313781738, "global_step": 132663, "epoch": 3158} {"train_loss": -6.698412895202637, "global_step": 132664, "epoch": 3158} {"train_loss": -6.628400802612305, "global_step": 132665, "epoch": 3158} {"train_loss": -6.680032253265381, "global_step": 132666, "epoch": 3158} {"train_loss": -6.727842807769775, "global_step": 132667, "epoch": 3158} {"train_loss": -6.589695930480957, "global_step": 132668, "epoch": 3158} {"train_loss": -6.645435333251953, "global_step": 132669, "epoch": 3158} {"train_loss": -6.688329696655273, "global_step": 132670, "epoch": 3158} {"train_loss": -6.695855617523193, "global_step": 132671, "epoch": 3158} {"train_loss": -6.696743011474609, "global_step": 132672, "epoch": 3158} {"train_loss": -6.612940788269043, "global_step": 132673, "epoch": 3158} {"train_loss": -6.807750701904297, "global_step": 132674, "epoch": 3158} {"train_loss": -6.716890335083008, "global_step": 132675, "epoch": 3158} {"train_loss": -6.602456092834473, "global_step": 132676, "epoch": 3158} {"train_loss": -6.681950750805083, "global_step": 132677, "epoch": 3158, "val_loss": 77840.0859375} {"train_loss": -6.680886745452881, "global_step": 132678, "epoch": 3159} {"train_loss": -6.659700393676758, "global_step": 132679, "epoch": 3159} {"train_loss": -6.664388179779053, "global_step": 132680, "epoch": 3159} {"train_loss": -6.6811933517456055, "global_step": 132681, "epoch": 3159} {"train_loss": -6.670676231384277, "global_step": 132682, "epoch": 3159} {"train_loss": -6.772809982299805, "global_step": 132683, "epoch": 3159} {"train_loss": -6.647218704223633, "global_step": 132684, "epoch": 3159} {"train_loss": -6.766085624694824, "global_step": 132685, "epoch": 3159} {"train_loss": -6.688179016113281, "global_step": 132686, "epoch": 3159} {"train_loss": -6.683192253112793, "global_step": 132687, "epoch": 3159} {"train_loss": -6.655799865722656, "global_step": 132688, "epoch": 3159} {"train_loss": -6.671665668487549, "global_step": 132689, "epoch": 3159} {"train_loss": -6.747648239135742, "global_step": 132690, "epoch": 3159} {"train_loss": -6.687024116516113, "global_step": 132691, "epoch": 3159} {"train_loss": -6.753528594970703, "global_step": 132692, "epoch": 3159} {"train_loss": -6.672540664672852, "global_step": 132693, "epoch": 3159} {"train_loss": -6.7838335037231445, "global_step": 132694, "epoch": 3159} {"train_loss": -6.59581184387207, "global_step": 132695, "epoch": 3159} {"train_loss": -6.718907356262207, "global_step": 132696, "epoch": 3159} {"train_loss": -6.6090006828308105, "global_step": 132697, "epoch": 3159} {"train_loss": -6.733165740966797, "global_step": 132698, "epoch": 3159} {"train_loss": -6.812127113342285, "global_step": 132699, "epoch": 3159} {"train_loss": -6.618675231933594, "global_step": 132700, "epoch": 3159} {"train_loss": -6.691776275634766, "global_step": 132701, "epoch": 3159} {"train_loss": -6.665319919586182, "global_step": 132702, "epoch": 3159} {"train_loss": -6.659919261932373, "global_step": 132703, "epoch": 3159} {"train_loss": -6.749617576599121, "global_step": 132704, "epoch": 3159} {"train_loss": -6.6317853927612305, "global_step": 132705, "epoch": 3159} {"train_loss": -6.735156059265137, "global_step": 132706, "epoch": 3159} {"train_loss": -6.619030952453613, "global_step": 132707, "epoch": 3159} {"train_loss": -6.6358489990234375, "global_step": 132708, "epoch": 3159} {"train_loss": -6.7795820236206055, "global_step": 132709, "epoch": 3159} {"train_loss": -6.694756507873535, "global_step": 132710, "epoch": 3159} {"train_loss": -6.650494575500488, "global_step": 132711, "epoch": 3159} {"train_loss": -6.647017955780029, "global_step": 132712, "epoch": 3159} {"train_loss": -6.657184600830078, "global_step": 132713, "epoch": 3159} {"train_loss": -6.672638893127441, "global_step": 132714, "epoch": 3159} {"train_loss": -6.56894588470459, "global_step": 132715, "epoch": 3159} {"train_loss": -6.72504997253418, "global_step": 132716, "epoch": 3159} {"train_loss": -6.60758113861084, "global_step": 132717, "epoch": 3159} {"train_loss": -6.623579025268555, "global_step": 132718, "epoch": 3159} {"train_loss": -6.680620034535726, "global_step": 132719, "epoch": 3159, "val_loss": 77478.765625} {"train_loss": -6.628306865692139, "global_step": 132720, "epoch": 3160} {"train_loss": -6.728084564208984, "global_step": 132721, "epoch": 3160} {"train_loss": -6.671198844909668, "global_step": 132722, "epoch": 3160} {"train_loss": -6.670553207397461, "global_step": 132723, "epoch": 3160} {"train_loss": -6.6585164070129395, "global_step": 132724, "epoch": 3160} {"train_loss": -6.608297348022461, "global_step": 132725, "epoch": 3160} {"train_loss": -6.679826736450195, "global_step": 132726, "epoch": 3160} {"train_loss": -6.6902313232421875, "global_step": 132727, "epoch": 3160} {"train_loss": -6.536579132080078, "global_step": 132728, "epoch": 3160} {"train_loss": -6.717436790466309, "global_step": 132729, "epoch": 3160} {"train_loss": -6.679925918579102, "global_step": 132730, "epoch": 3160} {"train_loss": -6.510884761810303, "global_step": 132731, "epoch": 3160} {"train_loss": -6.663326263427734, "global_step": 132732, "epoch": 3160} {"train_loss": -6.584000587463379, "global_step": 132733, "epoch": 3160} {"train_loss": -6.654183387756348, "global_step": 132734, "epoch": 3160} {"train_loss": -6.633296966552734, "global_step": 132735, "epoch": 3160} {"train_loss": -6.605463981628418, "global_step": 132736, "epoch": 3160} {"train_loss": -6.795065879821777, "global_step": 132737, "epoch": 3160} {"train_loss": -6.653801918029785, "global_step": 132738, "epoch": 3160} {"train_loss": -6.672274112701416, "global_step": 132739, "epoch": 3160} {"train_loss": -6.614117622375488, "global_step": 132740, "epoch": 3160} {"train_loss": -6.515827655792236, "global_step": 132741, "epoch": 3160} {"train_loss": -6.681666374206543, "global_step": 132742, "epoch": 3160} {"train_loss": -6.746333599090576, "global_step": 132743, "epoch": 3160} {"train_loss": -6.721303939819336, "global_step": 132744, "epoch": 3160} {"train_loss": -6.655176162719727, "global_step": 132745, "epoch": 3160} {"train_loss": -6.7035980224609375, "global_step": 132746, "epoch": 3160} {"train_loss": -6.500575065612793, "global_step": 132747, "epoch": 3160} {"train_loss": -6.6929426193237305, "global_step": 132748, "epoch": 3160} {"train_loss": -6.6425275802612305, "global_step": 132749, "epoch": 3160} {"train_loss": -6.845388412475586, "global_step": 132750, "epoch": 3160} {"train_loss": -6.5693535804748535, "global_step": 132751, "epoch": 3160} {"train_loss": -6.701704978942871, "global_step": 132752, "epoch": 3160} {"train_loss": -6.677804470062256, "global_step": 132753, "epoch": 3160} {"train_loss": -6.788603782653809, "global_step": 132754, "epoch": 3160} {"train_loss": -6.712968826293945, "global_step": 132755, "epoch": 3160} {"train_loss": -6.791119575500488, "global_step": 132756, "epoch": 3160} {"train_loss": -6.651272773742676, "global_step": 132757, "epoch": 3160} {"train_loss": -6.687882900238037, "global_step": 132758, "epoch": 3160} {"train_loss": -6.670928955078125, "global_step": 132759, "epoch": 3160} {"train_loss": -6.60469913482666, "global_step": 132760, "epoch": 3160} {"train_loss": -6.664523874010358, "global_step": 132761, "epoch": 3160, "val_loss": 77685.21875} {"train_loss": -6.698211193084717, "global_step": 132762, "epoch": 3161} {"train_loss": -6.683093070983887, "global_step": 132763, "epoch": 3161} {"train_loss": -6.749011993408203, "global_step": 132764, "epoch": 3161} {"train_loss": -6.83292293548584, "global_step": 132765, "epoch": 3161} {"train_loss": -6.689955234527588, "global_step": 132766, "epoch": 3161} {"train_loss": -6.761638164520264, "global_step": 132767, "epoch": 3161} {"train_loss": -6.612165451049805, "global_step": 132768, "epoch": 3161} {"train_loss": -6.7645792961120605, "global_step": 132769, "epoch": 3161} {"train_loss": -6.632559776306152, "global_step": 132770, "epoch": 3161} {"train_loss": -6.717862129211426, "global_step": 132771, "epoch": 3161} {"train_loss": -6.638431072235107, "global_step": 132772, "epoch": 3161} {"train_loss": -6.866837501525879, "global_step": 132773, "epoch": 3161} {"train_loss": -6.750664710998535, "global_step": 132774, "epoch": 3161} {"train_loss": -6.845616817474365, "global_step": 132775, "epoch": 3161} {"train_loss": -6.69708776473999, "global_step": 132776, "epoch": 3161} {"train_loss": -6.668421268463135, "global_step": 132777, "epoch": 3161} {"train_loss": -6.8256025314331055, "global_step": 132778, "epoch": 3161} {"train_loss": -6.706287384033203, "global_step": 132779, "epoch": 3161} {"train_loss": -6.734474182128906, "global_step": 132780, "epoch": 3161} {"train_loss": -6.75870943069458, "global_step": 132781, "epoch": 3161} {"train_loss": -6.689522743225098, "global_step": 132782, "epoch": 3161} {"train_loss": -6.7278852462768555, "global_step": 132783, "epoch": 3161} {"train_loss": -6.690028190612793, "global_step": 132784, "epoch": 3161} {"train_loss": -6.712629795074463, "global_step": 132785, "epoch": 3161} {"train_loss": -6.796326637268066, "global_step": 132786, "epoch": 3161} {"train_loss": -6.643519401550293, "global_step": 132787, "epoch": 3161} {"train_loss": -6.729241371154785, "global_step": 132788, "epoch": 3161} {"train_loss": -6.521833419799805, "global_step": 132789, "epoch": 3161} {"train_loss": -6.73213529586792, "global_step": 132790, "epoch": 3161} {"train_loss": -6.672679901123047, "global_step": 132791, "epoch": 3161} {"train_loss": -6.7101874351501465, "global_step": 132792, "epoch": 3161} {"train_loss": -6.739045143127441, "global_step": 132793, "epoch": 3161} {"train_loss": -6.621303081512451, "global_step": 132794, "epoch": 3161} {"train_loss": -6.689178466796875, "global_step": 132795, "epoch": 3161} {"train_loss": -6.65277099609375, "global_step": 132796, "epoch": 3161} {"train_loss": -6.589746952056885, "global_step": 132797, "epoch": 3161} {"train_loss": -6.7979207038879395, "global_step": 132798, "epoch": 3161} {"train_loss": -6.677887916564941, "global_step": 132799, "epoch": 3161} {"train_loss": -6.71220588684082, "global_step": 132800, "epoch": 3161} {"train_loss": -6.624109268188477, "global_step": 132801, "epoch": 3161} {"train_loss": -6.599175453186035, "global_step": 132802, "epoch": 3161} {"train_loss": -6.706004506065732, "global_step": 132803, "epoch": 3161, "val_loss": 77962.1640625} {"train_loss": -6.642509937286377, "global_step": 132804, "epoch": 3162} {"train_loss": -6.783405303955078, "global_step": 132805, "epoch": 3162} {"train_loss": -6.646130561828613, "global_step": 132806, "epoch": 3162} {"train_loss": -6.583436012268066, "global_step": 132807, "epoch": 3162} {"train_loss": -6.772765159606934, "global_step": 132808, "epoch": 3162} {"train_loss": -6.729377746582031, "global_step": 132809, "epoch": 3162} {"train_loss": -6.757167816162109, "global_step": 132810, "epoch": 3162} {"train_loss": -6.766942977905273, "global_step": 132811, "epoch": 3162} {"train_loss": -6.5708465576171875, "global_step": 132812, "epoch": 3162} {"train_loss": -6.686054229736328, "global_step": 132813, "epoch": 3162} {"train_loss": -6.670859336853027, "global_step": 132814, "epoch": 3162} {"train_loss": -6.742866516113281, "global_step": 132815, "epoch": 3162} {"train_loss": -6.719108581542969, "global_step": 132816, "epoch": 3162} {"train_loss": -6.684475898742676, "global_step": 132817, "epoch": 3162} {"train_loss": -6.740352153778076, "global_step": 132818, "epoch": 3162} {"train_loss": -6.68953275680542, "global_step": 132819, "epoch": 3162} {"train_loss": -6.725830078125, "global_step": 132820, "epoch": 3162} {"train_loss": -6.726442337036133, "global_step": 132821, "epoch": 3162} {"train_loss": -6.681793212890625, "global_step": 132822, "epoch": 3162} {"train_loss": -6.682405471801758, "global_step": 132823, "epoch": 3162} {"train_loss": -6.702136993408203, "global_step": 132824, "epoch": 3162} {"train_loss": -6.7188801765441895, "global_step": 132825, "epoch": 3162} {"train_loss": -6.766230583190918, "global_step": 132826, "epoch": 3162} {"train_loss": -6.719263076782227, "global_step": 132827, "epoch": 3162} {"train_loss": -6.727578163146973, "global_step": 132828, "epoch": 3162} {"train_loss": -6.69959831237793, "global_step": 132829, "epoch": 3162} {"train_loss": -6.718883514404297, "global_step": 132830, "epoch": 3162} {"train_loss": -6.723727226257324, "global_step": 132831, "epoch": 3162} {"train_loss": -6.723154067993164, "global_step": 132832, "epoch": 3162} {"train_loss": -6.689813613891602, "global_step": 132833, "epoch": 3162} {"train_loss": -6.591178894042969, "global_step": 132834, "epoch": 3162} {"train_loss": -6.71192741394043, "global_step": 132835, "epoch": 3162} {"train_loss": -6.688956260681152, "global_step": 132836, "epoch": 3162} {"train_loss": -6.5687994956970215, "global_step": 132837, "epoch": 3162} {"train_loss": -6.728216171264648, "global_step": 132838, "epoch": 3162} {"train_loss": -6.659261226654053, "global_step": 132839, "epoch": 3162} {"train_loss": -6.5278754234313965, "global_step": 132840, "epoch": 3162} {"train_loss": -6.540827751159668, "global_step": 132841, "epoch": 3162} {"train_loss": -6.6263580322265625, "global_step": 132842, "epoch": 3162} {"train_loss": -6.602308750152588, "global_step": 132843, "epoch": 3162} {"train_loss": -6.694899559020996, "global_step": 132844, "epoch": 3162} {"train_loss": -6.681180193310692, "global_step": 132845, "epoch": 3162, "val_loss": 77673.5546875} {"train_loss": -6.64168643951416, "global_step": 132846, "epoch": 3163} {"train_loss": -6.502598285675049, "global_step": 132847, "epoch": 3163} {"train_loss": -6.649633884429932, "global_step": 132848, "epoch": 3163} {"train_loss": -6.659938335418701, "global_step": 132849, "epoch": 3163} {"train_loss": -6.713742256164551, "global_step": 132850, "epoch": 3163} {"train_loss": -6.695161819458008, "global_step": 132851, "epoch": 3163} {"train_loss": -6.62907075881958, "global_step": 132852, "epoch": 3163} {"train_loss": -6.830876350402832, "global_step": 132853, "epoch": 3163} {"train_loss": -6.486824035644531, "global_step": 132854, "epoch": 3163} {"train_loss": -6.665276050567627, "global_step": 132855, "epoch": 3163} {"train_loss": -6.692718029022217, "global_step": 132856, "epoch": 3163} {"train_loss": -6.667817115783691, "global_step": 132857, "epoch": 3163} {"train_loss": -6.714787483215332, "global_step": 132858, "epoch": 3163} {"train_loss": -6.650494575500488, "global_step": 132859, "epoch": 3163} {"train_loss": -6.661023139953613, "global_step": 132860, "epoch": 3163} {"train_loss": -6.805759429931641, "global_step": 132861, "epoch": 3163} {"train_loss": -6.579179763793945, "global_step": 132862, "epoch": 3163} {"train_loss": -6.811455726623535, "global_step": 132863, "epoch": 3163} {"train_loss": -6.6520256996154785, "global_step": 132864, "epoch": 3163} {"train_loss": -6.636615753173828, "global_step": 132865, "epoch": 3163} {"train_loss": -6.757549285888672, "global_step": 132866, "epoch": 3163} {"train_loss": -6.534690856933594, "global_step": 132867, "epoch": 3163} {"train_loss": -6.774139404296875, "global_step": 132868, "epoch": 3163} {"train_loss": -6.71333122253418, "global_step": 132869, "epoch": 3163} {"train_loss": -6.660308361053467, "global_step": 132870, "epoch": 3163} {"train_loss": -6.644685745239258, "global_step": 132871, "epoch": 3163} {"train_loss": -6.654067039489746, "global_step": 132872, "epoch": 3163} {"train_loss": -6.743650913238525, "global_step": 132873, "epoch": 3163} {"train_loss": -6.683541774749756, "global_step": 132874, "epoch": 3163} {"train_loss": -6.663261413574219, "global_step": 132875, "epoch": 3163} {"train_loss": -6.721616744995117, "global_step": 132876, "epoch": 3163} {"train_loss": -6.462436676025391, "global_step": 132877, "epoch": 3163} {"train_loss": -6.711495399475098, "global_step": 132878, "epoch": 3163} {"train_loss": -6.618036270141602, "global_step": 132879, "epoch": 3163} {"train_loss": -6.6557793617248535, "global_step": 132880, "epoch": 3163} {"train_loss": -6.788347244262695, "global_step": 132881, "epoch": 3163} {"train_loss": -6.805233001708984, "global_step": 132882, "epoch": 3163} {"train_loss": -6.717559814453125, "global_step": 132883, "epoch": 3163} {"train_loss": -6.646216869354248, "global_step": 132884, "epoch": 3163} {"train_loss": -6.858216285705566, "global_step": 132885, "epoch": 3163} {"train_loss": -6.6892266273498535, "global_step": 132886, "epoch": 3163} {"train_loss": -6.681661957786197, "global_step": 132887, "epoch": 3163, "val_loss": 77519.828125} {"train_loss": -6.707509994506836, "global_step": 132888, "epoch": 3164} {"train_loss": -6.787919044494629, "global_step": 132889, "epoch": 3164} {"train_loss": -6.774593353271484, "global_step": 132890, "epoch": 3164} {"train_loss": -6.726353168487549, "global_step": 132891, "epoch": 3164} {"train_loss": -6.706176280975342, "global_step": 132892, "epoch": 3164} {"train_loss": -6.760232925415039, "global_step": 132893, "epoch": 3164} {"train_loss": -6.7930707931518555, "global_step": 132894, "epoch": 3164} {"train_loss": -6.685750961303711, "global_step": 132895, "epoch": 3164} {"train_loss": -6.629377841949463, "global_step": 132896, "epoch": 3164} {"train_loss": -6.662469387054443, "global_step": 132897, "epoch": 3164} {"train_loss": -6.77166223526001, "global_step": 132898, "epoch": 3164} {"train_loss": -6.709250450134277, "global_step": 132899, "epoch": 3164} {"train_loss": -6.853304862976074, "global_step": 132900, "epoch": 3164} {"train_loss": -6.649026870727539, "global_step": 132901, "epoch": 3164} {"train_loss": -6.765512943267822, "global_step": 132902, "epoch": 3164} {"train_loss": -6.702187538146973, "global_step": 132903, "epoch": 3164} {"train_loss": -6.7256317138671875, "global_step": 132904, "epoch": 3164} {"train_loss": -6.8109965324401855, "global_step": 132905, "epoch": 3164} {"train_loss": -6.733433723449707, "global_step": 132906, "epoch": 3164} {"train_loss": -6.782402992248535, "global_step": 132907, "epoch": 3164} {"train_loss": -6.766791820526123, "global_step": 132908, "epoch": 3164} {"train_loss": -6.745347023010254, "global_step": 132909, "epoch": 3164} {"train_loss": -6.728613376617432, "global_step": 132910, "epoch": 3164} {"train_loss": -6.808619976043701, "global_step": 132911, "epoch": 3164} {"train_loss": -6.761536121368408, "global_step": 132912, "epoch": 3164} {"train_loss": -6.804839134216309, "global_step": 132913, "epoch": 3164} {"train_loss": -6.601840019226074, "global_step": 132914, "epoch": 3164} {"train_loss": -6.7017059326171875, "global_step": 132915, "epoch": 3164} {"train_loss": -6.559795379638672, "global_step": 132916, "epoch": 3164} {"train_loss": -6.640498161315918, "global_step": 132917, "epoch": 3164} {"train_loss": -6.5604166984558105, "global_step": 132918, "epoch": 3164} {"train_loss": -6.677211284637451, "global_step": 132919, "epoch": 3164} {"train_loss": -6.648774147033691, "global_step": 132920, "epoch": 3164} {"train_loss": -6.636509895324707, "global_step": 132921, "epoch": 3164} {"train_loss": -6.668173789978027, "global_step": 132922, "epoch": 3164} {"train_loss": -6.6197404861450195, "global_step": 132923, "epoch": 3164} {"train_loss": -6.621726036071777, "global_step": 132924, "epoch": 3164} {"train_loss": -6.6417999267578125, "global_step": 132925, "epoch": 3164} {"train_loss": -6.754035949707031, "global_step": 132926, "epoch": 3164} {"train_loss": -6.664181709289551, "global_step": 132927, "epoch": 3164} {"train_loss": -6.741356372833252, "global_step": 132928, "epoch": 3164} {"train_loss": -6.7092166514623734, "global_step": 132929, "epoch": 3164, "val_loss": 77561.7421875} {"train_loss": -6.707012176513672, "global_step": 132930, "epoch": 3165} {"train_loss": -6.762828826904297, "global_step": 132931, "epoch": 3165} {"train_loss": -6.646999835968018, "global_step": 132932, "epoch": 3165} {"train_loss": -6.692506790161133, "global_step": 132933, "epoch": 3165} {"train_loss": -6.63520622253418, "global_step": 132934, "epoch": 3165} {"train_loss": -6.612559795379639, "global_step": 132935, "epoch": 3165} {"train_loss": -6.821255207061768, "global_step": 132936, "epoch": 3165} {"train_loss": -6.712580680847168, "global_step": 132937, "epoch": 3165} {"train_loss": -6.771380424499512, "global_step": 132938, "epoch": 3165} {"train_loss": -6.807981491088867, "global_step": 132939, "epoch": 3165} {"train_loss": -6.7588911056518555, "global_step": 132940, "epoch": 3165} {"train_loss": -6.682809829711914, "global_step": 132941, "epoch": 3165} {"train_loss": -6.793739318847656, "global_step": 132942, "epoch": 3165} {"train_loss": -6.699249744415283, "global_step": 132943, "epoch": 3165} {"train_loss": -6.852814674377441, "global_step": 132944, "epoch": 3165} {"train_loss": -6.734781265258789, "global_step": 132945, "epoch": 3165} {"train_loss": -6.689538955688477, "global_step": 132946, "epoch": 3165} {"train_loss": -6.732473373413086, "global_step": 132947, "epoch": 3165} {"train_loss": -6.604349136352539, "global_step": 132948, "epoch": 3165} {"train_loss": -6.611462593078613, "global_step": 132949, "epoch": 3165} {"train_loss": -6.8134613037109375, "global_step": 132950, "epoch": 3165} {"train_loss": -6.690820217132568, "global_step": 132951, "epoch": 3165} {"train_loss": -6.716962814331055, "global_step": 132952, "epoch": 3165} {"train_loss": -6.550519943237305, "global_step": 132953, "epoch": 3165} {"train_loss": -6.70572566986084, "global_step": 132954, "epoch": 3165} {"train_loss": -6.664493560791016, "global_step": 132955, "epoch": 3165} {"train_loss": -6.605010032653809, "global_step": 132956, "epoch": 3165} {"train_loss": -6.713466644287109, "global_step": 132957, "epoch": 3165} {"train_loss": -6.701239585876465, "global_step": 132958, "epoch": 3165} {"train_loss": -6.5436811447143555, "global_step": 132959, "epoch": 3165} {"train_loss": -6.718472003936768, "global_step": 132960, "epoch": 3165} {"train_loss": -6.6333794593811035, "global_step": 132961, "epoch": 3165} {"train_loss": -6.686886787414551, "global_step": 132962, "epoch": 3165} {"train_loss": -6.541506767272949, "global_step": 132963, "epoch": 3165} {"train_loss": -6.708935737609863, "global_step": 132964, "epoch": 3165} {"train_loss": -6.466259479522705, "global_step": 132965, "epoch": 3165} {"train_loss": -6.796404838562012, "global_step": 132966, "epoch": 3165} {"train_loss": -6.6790313720703125, "global_step": 132967, "epoch": 3165} {"train_loss": -6.57304573059082, "global_step": 132968, "epoch": 3165} {"train_loss": -6.67097806930542, "global_step": 132969, "epoch": 3165} {"train_loss": -6.563761234283447, "global_step": 132970, "epoch": 3165} {"train_loss": -6.683590559732346, "global_step": 132971, "epoch": 3165, "val_loss": 77483.96875} {"train_loss": -6.6785125732421875, "global_step": 132972, "epoch": 3166} {"train_loss": -6.664499282836914, "global_step": 132973, "epoch": 3166} {"train_loss": -6.635848045349121, "global_step": 132974, "epoch": 3166} {"train_loss": -6.656239986419678, "global_step": 132975, "epoch": 3166} {"train_loss": -6.6991047859191895, "global_step": 132976, "epoch": 3166} {"train_loss": -6.675433158874512, "global_step": 132977, "epoch": 3166} {"train_loss": -6.8150224685668945, "global_step": 132978, "epoch": 3166} {"train_loss": -6.661567211151123, "global_step": 132979, "epoch": 3166} {"train_loss": -6.7689361572265625, "global_step": 132980, "epoch": 3166} {"train_loss": -6.678925514221191, "global_step": 132981, "epoch": 3166} {"train_loss": -6.537245273590088, "global_step": 132982, "epoch": 3166} {"train_loss": -6.695281028747559, "global_step": 132983, "epoch": 3166} {"train_loss": -6.7016119956970215, "global_step": 132984, "epoch": 3166} {"train_loss": -6.741341590881348, "global_step": 132985, "epoch": 3166} {"train_loss": -6.693916320800781, "global_step": 132986, "epoch": 3166} {"train_loss": -6.814720630645752, "global_step": 132987, "epoch": 3166} {"train_loss": -6.6329450607299805, "global_step": 132988, "epoch": 3166} {"train_loss": -6.691434860229492, "global_step": 132989, "epoch": 3166} {"train_loss": -6.582037448883057, "global_step": 132990, "epoch": 3166} {"train_loss": -6.682992935180664, "global_step": 132991, "epoch": 3166} {"train_loss": -6.8001298904418945, "global_step": 132992, "epoch": 3166} {"train_loss": -6.705945014953613, "global_step": 132993, "epoch": 3166} {"train_loss": -6.695914268493652, "global_step": 132994, "epoch": 3166} {"train_loss": -6.688703536987305, "global_step": 132995, "epoch": 3166} {"train_loss": -6.7300825119018555, "global_step": 132996, "epoch": 3166} {"train_loss": -6.826631546020508, "global_step": 132997, "epoch": 3166} {"train_loss": -6.743298053741455, "global_step": 132998, "epoch": 3166} {"train_loss": -6.582211494445801, "global_step": 132999, "epoch": 3166} {"train_loss": -6.760494232177734, "global_step": 133000, "epoch": 3166} {"train_loss": -6.5769195556640625, "global_step": 133001, "epoch": 3166} {"train_loss": -6.71539306640625, "global_step": 133002, "epoch": 3166} {"train_loss": -6.7166852951049805, "global_step": 133003, "epoch": 3166} {"train_loss": -6.760948181152344, "global_step": 133004, "epoch": 3166} {"train_loss": -6.707212448120117, "global_step": 133005, "epoch": 3166} {"train_loss": -6.622716903686523, "global_step": 133006, "epoch": 3166} {"train_loss": -6.67967414855957, "global_step": 133007, "epoch": 3166} {"train_loss": -6.684655666351318, "global_step": 133008, "epoch": 3166} {"train_loss": -6.707932949066162, "global_step": 133009, "epoch": 3166} {"train_loss": -6.796613693237305, "global_step": 133010, "epoch": 3166} {"train_loss": -6.768517971038818, "global_step": 133011, "epoch": 3166} {"train_loss": -6.730600357055664, "global_step": 133012, "epoch": 3166} {"train_loss": -6.702244474774315, "global_step": 133013, "epoch": 3166, "val_loss": 77392.625} {"train_loss": -6.783925533294678, "global_step": 133014, "epoch": 3167} {"train_loss": -6.699881553649902, "global_step": 133015, "epoch": 3167} {"train_loss": -6.880899429321289, "global_step": 133016, "epoch": 3167} {"train_loss": -6.811020851135254, "global_step": 133017, "epoch": 3167} {"train_loss": -6.695385932922363, "global_step": 133018, "epoch": 3167} {"train_loss": -6.797019958496094, "global_step": 133019, "epoch": 3167} {"train_loss": -6.861891269683838, "global_step": 133020, "epoch": 3167} {"train_loss": -6.821597099304199, "global_step": 133021, "epoch": 3167} {"train_loss": -6.714838027954102, "global_step": 133022, "epoch": 3167} {"train_loss": -6.659900188446045, "global_step": 133023, "epoch": 3167} {"train_loss": -6.813441276550293, "global_step": 133024, "epoch": 3167} {"train_loss": -6.731555461883545, "global_step": 133025, "epoch": 3167} {"train_loss": -6.7290520668029785, "global_step": 133026, "epoch": 3167} {"train_loss": -6.776610374450684, "global_step": 133027, "epoch": 3167} {"train_loss": -6.804703235626221, "global_step": 133028, "epoch": 3167} {"train_loss": -6.76424503326416, "global_step": 133029, "epoch": 3167} {"train_loss": -6.65899658203125, "global_step": 133030, "epoch": 3167} {"train_loss": -6.709425926208496, "global_step": 133031, "epoch": 3167} {"train_loss": -6.768922328948975, "global_step": 133032, "epoch": 3167} {"train_loss": -6.775646209716797, "global_step": 133033, "epoch": 3167} {"train_loss": -6.644784450531006, "global_step": 133034, "epoch": 3167} {"train_loss": -6.778717994689941, "global_step": 133035, "epoch": 3167} {"train_loss": -6.676510334014893, "global_step": 133036, "epoch": 3167} {"train_loss": -6.809368133544922, "global_step": 133037, "epoch": 3167} {"train_loss": -6.7136430740356445, "global_step": 133038, "epoch": 3167} {"train_loss": -6.821949005126953, "global_step": 133039, "epoch": 3167} {"train_loss": -6.825949668884277, "global_step": 133040, "epoch": 3167} {"train_loss": -6.798807144165039, "global_step": 133041, "epoch": 3167} {"train_loss": -6.756072998046875, "global_step": 133042, "epoch": 3167} {"train_loss": -6.738824844360352, "global_step": 133043, "epoch": 3167} {"train_loss": -6.651647090911865, "global_step": 133044, "epoch": 3167} {"train_loss": -6.901121139526367, "global_step": 133045, "epoch": 3167} {"train_loss": -6.785619735717773, "global_step": 133046, "epoch": 3167} {"train_loss": -6.689002990722656, "global_step": 133047, "epoch": 3167} {"train_loss": -6.797945022583008, "global_step": 133048, "epoch": 3167} {"train_loss": -6.728057861328125, "global_step": 133049, "epoch": 3167} {"train_loss": -6.833629608154297, "global_step": 133050, "epoch": 3167} {"train_loss": -6.722503662109375, "global_step": 133051, "epoch": 3167} {"train_loss": -6.523847579956055, "global_step": 133052, "epoch": 3167} {"train_loss": -6.592765808105469, "global_step": 133053, "epoch": 3167} {"train_loss": -6.6240129470825195, "global_step": 133054, "epoch": 3167} {"train_loss": -6.74615850902739, "global_step": 133055, "epoch": 3167, "val_loss": 77538.1875} {"train_loss": -6.814121246337891, "global_step": 133056, "epoch": 3168} {"train_loss": -6.704286575317383, "global_step": 133057, "epoch": 3168} {"train_loss": -6.819275856018066, "global_step": 133058, "epoch": 3168} {"train_loss": -6.694725036621094, "global_step": 133059, "epoch": 3168} {"train_loss": -6.696403503417969, "global_step": 133060, "epoch": 3168} {"train_loss": -6.7865891456604, "global_step": 133061, "epoch": 3168} {"train_loss": -6.678215026855469, "global_step": 133062, "epoch": 3168} {"train_loss": -6.699820518493652, "global_step": 133063, "epoch": 3168} {"train_loss": -6.753385066986084, "global_step": 133064, "epoch": 3168} {"train_loss": -6.828193664550781, "global_step": 133065, "epoch": 3168} {"train_loss": -6.635224342346191, "global_step": 133066, "epoch": 3168} {"train_loss": -6.740320205688477, "global_step": 133067, "epoch": 3168} {"train_loss": -6.543920040130615, "global_step": 133068, "epoch": 3168} {"train_loss": -6.739575386047363, "global_step": 133069, "epoch": 3168} {"train_loss": -6.5672149658203125, "global_step": 133070, "epoch": 3168} {"train_loss": -6.702972888946533, "global_step": 133071, "epoch": 3168} {"train_loss": -6.519889831542969, "global_step": 133072, "epoch": 3168} {"train_loss": -6.76113224029541, "global_step": 133073, "epoch": 3168} {"train_loss": -6.753127574920654, "global_step": 133074, "epoch": 3168} {"train_loss": -6.7517595291137695, "global_step": 133075, "epoch": 3168} {"train_loss": -6.551267623901367, "global_step": 133076, "epoch": 3168} {"train_loss": -6.707819938659668, "global_step": 133077, "epoch": 3168} {"train_loss": -6.666569709777832, "global_step": 133078, "epoch": 3168} {"train_loss": -6.614962100982666, "global_step": 133079, "epoch": 3168} {"train_loss": -6.75648307800293, "global_step": 133080, "epoch": 3168} {"train_loss": -6.692684173583984, "global_step": 133081, "epoch": 3168} {"train_loss": -6.694622993469238, "global_step": 133082, "epoch": 3168} {"train_loss": -6.625613689422607, "global_step": 133083, "epoch": 3168} {"train_loss": -6.638519287109375, "global_step": 133084, "epoch": 3168} {"train_loss": -6.702390193939209, "global_step": 133085, "epoch": 3168} {"train_loss": -6.575718402862549, "global_step": 133086, "epoch": 3168} {"train_loss": -6.656045913696289, "global_step": 133087, "epoch": 3168} {"train_loss": -6.741113662719727, "global_step": 133088, "epoch": 3168} {"train_loss": -6.786739826202393, "global_step": 133089, "epoch": 3168} {"train_loss": -6.704270362854004, "global_step": 133090, "epoch": 3168} {"train_loss": -6.614819526672363, "global_step": 133091, "epoch": 3168} {"train_loss": -6.641569137573242, "global_step": 133092, "epoch": 3168} {"train_loss": -6.739953994750977, "global_step": 133093, "epoch": 3168} {"train_loss": -6.58619499206543, "global_step": 133094, "epoch": 3168} {"train_loss": -6.803609848022461, "global_step": 133095, "epoch": 3168} {"train_loss": -6.81243896484375, "global_step": 133096, "epoch": 3168} {"train_loss": -6.694323494320824, "global_step": 133097, "epoch": 3168, "val_loss": 77760.3984375} {"train_loss": -6.698923587799072, "global_step": 133098, "epoch": 3169} {"train_loss": -6.682140350341797, "global_step": 133099, "epoch": 3169} {"train_loss": -6.643583297729492, "global_step": 133100, "epoch": 3169} {"train_loss": -6.724035739898682, "global_step": 133101, "epoch": 3169} {"train_loss": -6.710031032562256, "global_step": 133102, "epoch": 3169} {"train_loss": -6.445769786834717, "global_step": 133103, "epoch": 3169} {"train_loss": -6.822297096252441, "global_step": 133104, "epoch": 3169} {"train_loss": -6.582674026489258, "global_step": 133105, "epoch": 3169} {"train_loss": -6.575286865234375, "global_step": 133106, "epoch": 3169} {"train_loss": -6.635621070861816, "global_step": 133107, "epoch": 3169} {"train_loss": -6.705748558044434, "global_step": 133108, "epoch": 3169} {"train_loss": -6.744824409484863, "global_step": 133109, "epoch": 3169} {"train_loss": -6.641950607299805, "global_step": 133110, "epoch": 3169} {"train_loss": -6.596826553344727, "global_step": 133111, "epoch": 3169} {"train_loss": -6.6263651847839355, "global_step": 133112, "epoch": 3169} {"train_loss": -6.805727958679199, "global_step": 133113, "epoch": 3169} {"train_loss": -6.635498046875, "global_step": 133114, "epoch": 3169} {"train_loss": -6.6477251052856445, "global_step": 133115, "epoch": 3169} {"train_loss": -6.657027244567871, "global_step": 133116, "epoch": 3169} {"train_loss": -6.600796699523926, "global_step": 133117, "epoch": 3169} {"train_loss": -6.726836204528809, "global_step": 133118, "epoch": 3169} {"train_loss": -6.650086402893066, "global_step": 133119, "epoch": 3169} {"train_loss": -6.82072639465332, "global_step": 133120, "epoch": 3169} {"train_loss": -6.740255355834961, "global_step": 133121, "epoch": 3169} {"train_loss": -6.652798175811768, "global_step": 133122, "epoch": 3169} {"train_loss": -6.663532257080078, "global_step": 133123, "epoch": 3169} {"train_loss": -6.696091175079346, "global_step": 133124, "epoch": 3169} {"train_loss": -6.655885696411133, "global_step": 133125, "epoch": 3169} {"train_loss": -6.654518127441406, "global_step": 133126, "epoch": 3169} {"train_loss": -6.661118030548096, "global_step": 133127, "epoch": 3169} {"train_loss": -6.549350738525391, "global_step": 133128, "epoch": 3169} {"train_loss": -6.779940605163574, "global_step": 133129, "epoch": 3169} {"train_loss": -6.619078636169434, "global_step": 133130, "epoch": 3169} {"train_loss": -6.78787899017334, "global_step": 133131, "epoch": 3169} {"train_loss": -6.7482452392578125, "global_step": 133132, "epoch": 3169} {"train_loss": -6.710423946380615, "global_step": 133133, "epoch": 3169} {"train_loss": -6.8026838302612305, "global_step": 133134, "epoch": 3169} {"train_loss": -6.685667514801025, "global_step": 133135, "epoch": 3169} {"train_loss": -6.732210159301758, "global_step": 133136, "epoch": 3169} {"train_loss": -6.687135696411133, "global_step": 133137, "epoch": 3169} {"train_loss": -6.718071937561035, "global_step": 133138, "epoch": 3169} {"train_loss": -6.680972156070528, "global_step": 133139, "epoch": 3169, "val_loss": 77629.3125} {"train_loss": -6.79944372177124, "global_step": 133140, "epoch": 3170} {"train_loss": -6.604948997497559, "global_step": 133141, "epoch": 3170} {"train_loss": -6.701418876647949, "global_step": 133142, "epoch": 3170} {"train_loss": -6.7864789962768555, "global_step": 133143, "epoch": 3170} {"train_loss": -6.588125228881836, "global_step": 133144, "epoch": 3170} {"train_loss": -6.610896110534668, "global_step": 133145, "epoch": 3170} {"train_loss": -6.676408290863037, "global_step": 133146, "epoch": 3170} {"train_loss": -6.551108360290527, "global_step": 133147, "epoch": 3170} {"train_loss": -6.527331352233887, "global_step": 133148, "epoch": 3170} {"train_loss": -6.708624839782715, "global_step": 133149, "epoch": 3170} {"train_loss": -6.650186061859131, "global_step": 133150, "epoch": 3170} {"train_loss": -6.660585880279541, "global_step": 133151, "epoch": 3170} {"train_loss": -6.672164440155029, "global_step": 133152, "epoch": 3170} {"train_loss": -6.729081153869629, "global_step": 133153, "epoch": 3170} {"train_loss": -6.6139421463012695, "global_step": 133154, "epoch": 3170} {"train_loss": -6.702297210693359, "global_step": 133155, "epoch": 3170} {"train_loss": -6.640063285827637, "global_step": 133156, "epoch": 3170} {"train_loss": -6.759520530700684, "global_step": 133157, "epoch": 3170} {"train_loss": -6.730295658111572, "global_step": 133158, "epoch": 3170} {"train_loss": -6.7866315841674805, "global_step": 133159, "epoch": 3170} {"train_loss": -6.675297737121582, "global_step": 133160, "epoch": 3170} {"train_loss": -6.788206100463867, "global_step": 133161, "epoch": 3170} {"train_loss": -6.743391513824463, "global_step": 133162, "epoch": 3170} {"train_loss": -6.733091354370117, "global_step": 133163, "epoch": 3170} {"train_loss": -6.725311279296875, "global_step": 133164, "epoch": 3170} {"train_loss": -6.711408615112305, "global_step": 133165, "epoch": 3170} {"train_loss": -6.80839729309082, "global_step": 133166, "epoch": 3170} {"train_loss": -6.745304107666016, "global_step": 133167, "epoch": 3170} {"train_loss": -6.715559005737305, "global_step": 133168, "epoch": 3170} {"train_loss": -6.723750591278076, "global_step": 133169, "epoch": 3170} {"train_loss": -6.767098426818848, "global_step": 133170, "epoch": 3170} {"train_loss": -6.706143379211426, "global_step": 133171, "epoch": 3170} {"train_loss": -6.746642112731934, "global_step": 133172, "epoch": 3170} {"train_loss": -6.776003837585449, "global_step": 133173, "epoch": 3170} {"train_loss": -6.789252758026123, "global_step": 133174, "epoch": 3170} {"train_loss": -6.689948558807373, "global_step": 133175, "epoch": 3170} {"train_loss": -6.660639762878418, "global_step": 133176, "epoch": 3170} {"train_loss": -6.732228755950928, "global_step": 133177, "epoch": 3170} {"train_loss": -6.604082107543945, "global_step": 133178, "epoch": 3170} {"train_loss": -6.61820650100708, "global_step": 133179, "epoch": 3170} {"train_loss": -6.6719255447387695, "global_step": 133180, "epoch": 3170} {"train_loss": -6.696783792404902, "global_step": 133181, "epoch": 3170, "val_loss": 77869.859375} {"train_loss": -6.635068893432617, "global_step": 133182, "epoch": 3171} {"train_loss": -6.640685558319092, "global_step": 133183, "epoch": 3171} {"train_loss": -6.566247463226318, "global_step": 133184, "epoch": 3171} {"train_loss": -6.512748718261719, "global_step": 133185, "epoch": 3171} {"train_loss": -6.619945526123047, "global_step": 133186, "epoch": 3171} {"train_loss": -6.512941360473633, "global_step": 133187, "epoch": 3171} {"train_loss": -6.581011772155762, "global_step": 133188, "epoch": 3171} {"train_loss": -6.628904342651367, "global_step": 133189, "epoch": 3171} {"train_loss": -6.613607883453369, "global_step": 133190, "epoch": 3171} {"train_loss": -6.661781311035156, "global_step": 133191, "epoch": 3171} {"train_loss": -6.595786094665527, "global_step": 133192, "epoch": 3171} {"train_loss": -6.564175605773926, "global_step": 133193, "epoch": 3171} {"train_loss": -6.59143590927124, "global_step": 133194, "epoch": 3171} {"train_loss": -6.662285804748535, "global_step": 133195, "epoch": 3171} {"train_loss": -6.625944137573242, "global_step": 133196, "epoch": 3171} {"train_loss": -6.678397178649902, "global_step": 133197, "epoch": 3171} {"train_loss": -6.6144118309021, "global_step": 133198, "epoch": 3171} {"train_loss": -6.669543266296387, "global_step": 133199, "epoch": 3171} {"train_loss": -6.710888385772705, "global_step": 133200, "epoch": 3171} {"train_loss": -6.722430229187012, "global_step": 133201, "epoch": 3171} {"train_loss": -6.691558837890625, "global_step": 133202, "epoch": 3171} {"train_loss": -6.675630569458008, "global_step": 133203, "epoch": 3171} {"train_loss": -6.729216575622559, "global_step": 133204, "epoch": 3171} {"train_loss": -6.630949020385742, "global_step": 133205, "epoch": 3171} {"train_loss": -6.552358627319336, "global_step": 133206, "epoch": 3171} {"train_loss": -6.636238098144531, "global_step": 133207, "epoch": 3171} {"train_loss": -6.532148361206055, "global_step": 133208, "epoch": 3171} {"train_loss": -6.628990650177002, "global_step": 133209, "epoch": 3171} {"train_loss": -6.766267776489258, "global_step": 133210, "epoch": 3171} {"train_loss": -6.566435813903809, "global_step": 133211, "epoch": 3171} {"train_loss": -6.696127414703369, "global_step": 133212, "epoch": 3171} {"train_loss": -6.737098217010498, "global_step": 133213, "epoch": 3171} {"train_loss": -6.619709491729736, "global_step": 133214, "epoch": 3171} {"train_loss": -6.61440372467041, "global_step": 133215, "epoch": 3171} {"train_loss": -6.684304714202881, "global_step": 133216, "epoch": 3171} {"train_loss": -6.639009952545166, "global_step": 133217, "epoch": 3171} {"train_loss": -6.713594436645508, "global_step": 133218, "epoch": 3171} {"train_loss": -6.682663917541504, "global_step": 133219, "epoch": 3171} {"train_loss": -6.656158924102783, "global_step": 133220, "epoch": 3171} {"train_loss": -6.740480422973633, "global_step": 133221, "epoch": 3171} {"train_loss": -6.64893913269043, "global_step": 133222, "epoch": 3171} {"train_loss": -6.642818859645298, "global_step": 133223, "epoch": 3171, "val_loss": 77595.3203125} {"train_loss": -6.617484092712402, "global_step": 133224, "epoch": 3172} {"train_loss": -6.80277156829834, "global_step": 133225, "epoch": 3172} {"train_loss": -6.628879547119141, "global_step": 133226, "epoch": 3172} {"train_loss": -6.694860458374023, "global_step": 133227, "epoch": 3172} {"train_loss": -6.750370025634766, "global_step": 133228, "epoch": 3172} {"train_loss": -6.658388137817383, "global_step": 133229, "epoch": 3172} {"train_loss": -6.8178863525390625, "global_step": 133230, "epoch": 3172} {"train_loss": -6.715959548950195, "global_step": 133231, "epoch": 3172} {"train_loss": -6.692519664764404, "global_step": 133232, "epoch": 3172} {"train_loss": -6.667811393737793, "global_step": 133233, "epoch": 3172} {"train_loss": -6.762439727783203, "global_step": 133234, "epoch": 3172} {"train_loss": -6.879833221435547, "global_step": 133235, "epoch": 3172} {"train_loss": -6.789493560791016, "global_step": 133236, "epoch": 3172} {"train_loss": -6.644807815551758, "global_step": 133237, "epoch": 3172} {"train_loss": -6.717759132385254, "global_step": 133238, "epoch": 3172} {"train_loss": -6.733205795288086, "global_step": 133239, "epoch": 3172} {"train_loss": -6.588752746582031, "global_step": 133240, "epoch": 3172} {"train_loss": -6.6287736892700195, "global_step": 133241, "epoch": 3172} {"train_loss": -6.632684230804443, "global_step": 133242, "epoch": 3172} {"train_loss": -6.663234710693359, "global_step": 133243, "epoch": 3172} {"train_loss": -6.646844863891602, "global_step": 133244, "epoch": 3172} {"train_loss": -6.6363067626953125, "global_step": 133245, "epoch": 3172} {"train_loss": -6.752237319946289, "global_step": 133246, "epoch": 3172} {"train_loss": -6.645393371582031, "global_step": 133247, "epoch": 3172} {"train_loss": -6.664277076721191, "global_step": 133248, "epoch": 3172} {"train_loss": -6.628475189208984, "global_step": 133249, "epoch": 3172} {"train_loss": -6.66625452041626, "global_step": 133250, "epoch": 3172} {"train_loss": -6.755500316619873, "global_step": 133251, "epoch": 3172} {"train_loss": -6.697649955749512, "global_step": 133252, "epoch": 3172} {"train_loss": -6.4909772872924805, "global_step": 133253, "epoch": 3172} {"train_loss": -6.627756118774414, "global_step": 133254, "epoch": 3172} {"train_loss": -6.728338241577148, "global_step": 133255, "epoch": 3172} {"train_loss": -6.642308712005615, "global_step": 133256, "epoch": 3172} {"train_loss": -6.696300029754639, "global_step": 133257, "epoch": 3172} {"train_loss": -6.6680908203125, "global_step": 133258, "epoch": 3172} {"train_loss": -6.688775062561035, "global_step": 133259, "epoch": 3172} {"train_loss": -6.610127925872803, "global_step": 133260, "epoch": 3172} {"train_loss": -6.724644660949707, "global_step": 133261, "epoch": 3172} {"train_loss": -6.597522735595703, "global_step": 133262, "epoch": 3172} {"train_loss": -6.614258766174316, "global_step": 133263, "epoch": 3172} {"train_loss": -6.8197431564331055, "global_step": 133264, "epoch": 3172} {"train_loss": -6.686674401873634, "global_step": 133265, "epoch": 3172, "val_loss": 77746.921875} {"train_loss": -6.750511169433594, "global_step": 133266, "epoch": 3173} {"train_loss": -6.631783485412598, "global_step": 133267, "epoch": 3173} {"train_loss": -6.571087837219238, "global_step": 133268, "epoch": 3173} {"train_loss": -6.748909950256348, "global_step": 133269, "epoch": 3173} {"train_loss": -6.632918357849121, "global_step": 133270, "epoch": 3173} {"train_loss": -6.672524929046631, "global_step": 133271, "epoch": 3173} {"train_loss": -6.731983661651611, "global_step": 133272, "epoch": 3173} {"train_loss": -6.653860092163086, "global_step": 133273, "epoch": 3173} {"train_loss": -6.793850421905518, "global_step": 133274, "epoch": 3173} {"train_loss": -6.561312675476074, "global_step": 133275, "epoch": 3173} {"train_loss": -6.7584099769592285, "global_step": 133276, "epoch": 3173} {"train_loss": -6.693377494812012, "global_step": 133277, "epoch": 3173} {"train_loss": -6.757576942443848, "global_step": 133278, "epoch": 3173} {"train_loss": -6.689563751220703, "global_step": 133279, "epoch": 3173} {"train_loss": -6.637716293334961, "global_step": 133280, "epoch": 3173} {"train_loss": -6.66477632522583, "global_step": 133281, "epoch": 3173} {"train_loss": -6.628329753875732, "global_step": 133282, "epoch": 3173} {"train_loss": -6.719507217407227, "global_step": 133283, "epoch": 3173} {"train_loss": -6.582940578460693, "global_step": 133284, "epoch": 3173} {"train_loss": -6.716713905334473, "global_step": 133285, "epoch": 3173} {"train_loss": -6.6427812576293945, "global_step": 133286, "epoch": 3173} {"train_loss": -6.681102752685547, "global_step": 133287, "epoch": 3173} {"train_loss": -6.634449481964111, "global_step": 133288, "epoch": 3173} {"train_loss": -6.696159362792969, "global_step": 133289, "epoch": 3173} {"train_loss": -6.699334144592285, "global_step": 133290, "epoch": 3173} {"train_loss": -6.547030448913574, "global_step": 133291, "epoch": 3173} {"train_loss": -6.766491889953613, "global_step": 133292, "epoch": 3173} {"train_loss": -6.696462631225586, "global_step": 133293, "epoch": 3173} {"train_loss": -6.5717926025390625, "global_step": 133294, "epoch": 3173} {"train_loss": -6.751714706420898, "global_step": 133295, "epoch": 3173} {"train_loss": -6.637761116027832, "global_step": 133296, "epoch": 3173} {"train_loss": -6.615446090698242, "global_step": 133297, "epoch": 3173} {"train_loss": -6.647225856781006, "global_step": 133298, "epoch": 3173} {"train_loss": -6.636780738830566, "global_step": 133299, "epoch": 3173} {"train_loss": -6.771929740905762, "global_step": 133300, "epoch": 3173} {"train_loss": -6.8313069343566895, "global_step": 133301, "epoch": 3173} {"train_loss": -6.606265544891357, "global_step": 133302, "epoch": 3173} {"train_loss": -6.763646125793457, "global_step": 133303, "epoch": 3173} {"train_loss": -6.638507843017578, "global_step": 133304, "epoch": 3173} {"train_loss": -6.710851669311523, "global_step": 133305, "epoch": 3173} {"train_loss": -6.797476768493652, "global_step": 133306, "epoch": 3173} {"train_loss": -6.681983255204701, "global_step": 133307, "epoch": 3173, "val_loss": 77452.96875} {"train_loss": -6.717162609100342, "global_step": 133308, "epoch": 3174} {"train_loss": -6.665582656860352, "global_step": 133309, "epoch": 3174} {"train_loss": -6.723179817199707, "global_step": 133310, "epoch": 3174} {"train_loss": -6.600061416625977, "global_step": 133311, "epoch": 3174} {"train_loss": -6.568577289581299, "global_step": 133312, "epoch": 3174} {"train_loss": -6.685319423675537, "global_step": 133313, "epoch": 3174} {"train_loss": -6.4550700187683105, "global_step": 133314, "epoch": 3174} {"train_loss": -6.6536760330200195, "global_step": 133315, "epoch": 3174} {"train_loss": -6.537064552307129, "global_step": 133316, "epoch": 3174} {"train_loss": -6.674302101135254, "global_step": 133317, "epoch": 3174} {"train_loss": -6.600769996643066, "global_step": 133318, "epoch": 3174} {"train_loss": -6.614328384399414, "global_step": 133319, "epoch": 3174} {"train_loss": -6.707971572875977, "global_step": 133320, "epoch": 3174} {"train_loss": -6.516636371612549, "global_step": 133321, "epoch": 3174} {"train_loss": -6.718871116638184, "global_step": 133322, "epoch": 3174} {"train_loss": -6.554920196533203, "global_step": 133323, "epoch": 3174} {"train_loss": -6.743988513946533, "global_step": 133324, "epoch": 3174} {"train_loss": -6.594838619232178, "global_step": 133325, "epoch": 3174} {"train_loss": -6.716251373291016, "global_step": 133326, "epoch": 3174} {"train_loss": -6.706266403198242, "global_step": 133327, "epoch": 3174} {"train_loss": -6.666988849639893, "global_step": 133328, "epoch": 3174} {"train_loss": -6.712926864624023, "global_step": 133329, "epoch": 3174} {"train_loss": -6.727868556976318, "global_step": 133330, "epoch": 3174} {"train_loss": -6.647024154663086, "global_step": 133331, "epoch": 3174} {"train_loss": -6.725289821624756, "global_step": 133332, "epoch": 3174} {"train_loss": -6.696976661682129, "global_step": 133333, "epoch": 3174} {"train_loss": -6.6192827224731445, "global_step": 133334, "epoch": 3174} {"train_loss": -6.620915412902832, "global_step": 133335, "epoch": 3174} {"train_loss": -6.682731628417969, "global_step": 133336, "epoch": 3174} {"train_loss": -6.759670257568359, "global_step": 133337, "epoch": 3174} {"train_loss": -6.70655632019043, "global_step": 133338, "epoch": 3174} {"train_loss": -6.7256669998168945, "global_step": 133339, "epoch": 3174} {"train_loss": -6.661128520965576, "global_step": 133340, "epoch": 3174} {"train_loss": -6.595603942871094, "global_step": 133341, "epoch": 3174} {"train_loss": -6.560745716094971, "global_step": 133342, "epoch": 3174} {"train_loss": -6.635046005249023, "global_step": 133343, "epoch": 3174} {"train_loss": -6.703534126281738, "global_step": 133344, "epoch": 3174} {"train_loss": -6.748546600341797, "global_step": 133345, "epoch": 3174} {"train_loss": -6.668384552001953, "global_step": 133346, "epoch": 3174} {"train_loss": -6.709726810455322, "global_step": 133347, "epoch": 3174} {"train_loss": -6.744794845581055, "global_step": 133348, "epoch": 3174} {"train_loss": -6.660992270424252, "global_step": 133349, "epoch": 3174, "val_loss": 77681.1640625} {"train_loss": -6.711689472198486, "global_step": 133350, "epoch": 3175} {"train_loss": -6.803707599639893, "global_step": 133351, "epoch": 3175} {"train_loss": -6.681488990783691, "global_step": 133352, "epoch": 3175} {"train_loss": -6.672968864440918, "global_step": 133353, "epoch": 3175} {"train_loss": -6.71701717376709, "global_step": 133354, "epoch": 3175} {"train_loss": -6.722777366638184, "global_step": 133355, "epoch": 3175} {"train_loss": -6.752181529998779, "global_step": 133356, "epoch": 3175} {"train_loss": -6.659496307373047, "global_step": 133357, "epoch": 3175} {"train_loss": -6.717286109924316, "global_step": 133358, "epoch": 3175} {"train_loss": -6.72314453125, "global_step": 133359, "epoch": 3175} {"train_loss": -6.818015098571777, "global_step": 133360, "epoch": 3175} {"train_loss": -6.810900688171387, "global_step": 133361, "epoch": 3175} {"train_loss": -6.647512912750244, "global_step": 133362, "epoch": 3175} {"train_loss": -6.717860221862793, "global_step": 133363, "epoch": 3175} {"train_loss": -6.626956939697266, "global_step": 133364, "epoch": 3175} {"train_loss": -6.774752616882324, "global_step": 133365, "epoch": 3175} {"train_loss": -6.727442264556885, "global_step": 133366, "epoch": 3175} {"train_loss": -6.802753448486328, "global_step": 133367, "epoch": 3175} {"train_loss": -6.762835502624512, "global_step": 133368, "epoch": 3175} {"train_loss": -6.650486946105957, "global_step": 133369, "epoch": 3175} {"train_loss": -6.827568054199219, "global_step": 133370, "epoch": 3175} {"train_loss": -6.653864860534668, "global_step": 133371, "epoch": 3175} {"train_loss": -6.641178607940674, "global_step": 133372, "epoch": 3175} {"train_loss": -6.725800514221191, "global_step": 133373, "epoch": 3175} {"train_loss": -6.667566776275635, "global_step": 133374, "epoch": 3175} {"train_loss": -6.701077461242676, "global_step": 133375, "epoch": 3175} {"train_loss": -6.686236381530762, "global_step": 133376, "epoch": 3175} {"train_loss": -6.707012176513672, "global_step": 133377, "epoch": 3175} {"train_loss": -6.740765571594238, "global_step": 133378, "epoch": 3175} {"train_loss": -6.865787029266357, "global_step": 133379, "epoch": 3175} {"train_loss": -6.634061813354492, "global_step": 133380, "epoch": 3175} {"train_loss": -6.6264543533325195, "global_step": 133381, "epoch": 3175} {"train_loss": -6.62150764465332, "global_step": 133382, "epoch": 3175} {"train_loss": -6.6265363693237305, "global_step": 133383, "epoch": 3175} {"train_loss": -6.7581329345703125, "global_step": 133384, "epoch": 3175} {"train_loss": -6.685486316680908, "global_step": 133385, "epoch": 3175} {"train_loss": -6.616568088531494, "global_step": 133386, "epoch": 3175} {"train_loss": -6.717875957489014, "global_step": 133387, "epoch": 3175} {"train_loss": -6.647433280944824, "global_step": 133388, "epoch": 3175} {"train_loss": -6.730345726013184, "global_step": 133389, "epoch": 3175} {"train_loss": -6.695768356323242, "global_step": 133390, "epoch": 3175} {"train_loss": -6.707716033572242, "global_step": 133391, "epoch": 3175, "val_loss": 77744.7890625} {"train_loss": -6.7092742919921875, "global_step": 133392, "epoch": 3176} {"train_loss": -6.67063570022583, "global_step": 133393, "epoch": 3176} {"train_loss": -6.634880065917969, "global_step": 133394, "epoch": 3176} {"train_loss": -6.643407821655273, "global_step": 133395, "epoch": 3176} {"train_loss": -6.57073974609375, "global_step": 133396, "epoch": 3176} {"train_loss": -6.56096076965332, "global_step": 133397, "epoch": 3176} {"train_loss": -6.835425853729248, "global_step": 133398, "epoch": 3176} {"train_loss": -6.7287750244140625, "global_step": 133399, "epoch": 3176} {"train_loss": -6.702274322509766, "global_step": 133400, "epoch": 3176} {"train_loss": -6.599863052368164, "global_step": 133401, "epoch": 3176} {"train_loss": -6.731508255004883, "global_step": 133402, "epoch": 3176} {"train_loss": -6.661850929260254, "global_step": 133403, "epoch": 3176} {"train_loss": -6.531412124633789, "global_step": 133404, "epoch": 3176} {"train_loss": -6.649085521697998, "global_step": 133405, "epoch": 3176} {"train_loss": -6.587491989135742, "global_step": 133406, "epoch": 3176} {"train_loss": -6.755601406097412, "global_step": 133407, "epoch": 3176} {"train_loss": -6.551595687866211, "global_step": 133408, "epoch": 3176} {"train_loss": -6.617136001586914, "global_step": 133409, "epoch": 3176} {"train_loss": -6.651637077331543, "global_step": 133410, "epoch": 3176} {"train_loss": -6.602756500244141, "global_step": 133411, "epoch": 3176} {"train_loss": -6.674771308898926, "global_step": 133412, "epoch": 3176} {"train_loss": -6.6033220291137695, "global_step": 133413, "epoch": 3176} {"train_loss": -6.6511101722717285, "global_step": 133414, "epoch": 3176} {"train_loss": -6.684625148773193, "global_step": 133415, "epoch": 3176} {"train_loss": -6.720439910888672, "global_step": 133416, "epoch": 3176} {"train_loss": -6.6543731689453125, "global_step": 133417, "epoch": 3176} {"train_loss": -6.587464332580566, "global_step": 133418, "epoch": 3176} {"train_loss": -6.72702169418335, "global_step": 133419, "epoch": 3176} {"train_loss": -6.55753231048584, "global_step": 133420, "epoch": 3176} {"train_loss": -6.706954002380371, "global_step": 133421, "epoch": 3176} {"train_loss": -6.657476425170898, "global_step": 133422, "epoch": 3176} {"train_loss": -6.705676078796387, "global_step": 133423, "epoch": 3176} {"train_loss": -6.674690246582031, "global_step": 133424, "epoch": 3176} {"train_loss": -6.6767258644104, "global_step": 133425, "epoch": 3176} {"train_loss": -6.713891506195068, "global_step": 133426, "epoch": 3176} {"train_loss": -6.733837127685547, "global_step": 133427, "epoch": 3176} {"train_loss": -6.706157207489014, "global_step": 133428, "epoch": 3176} {"train_loss": -6.809491157531738, "global_step": 133429, "epoch": 3176} {"train_loss": -6.838396072387695, "global_step": 133430, "epoch": 3176} {"train_loss": -6.717785358428955, "global_step": 133431, "epoch": 3176} {"train_loss": -6.748941421508789, "global_step": 133432, "epoch": 3176} {"train_loss": -6.671467281523205, "global_step": 133433, "epoch": 3176, "val_loss": 77631.953125} {"train_loss": -6.731304168701172, "global_step": 133434, "epoch": 3177} {"train_loss": -6.770976543426514, "global_step": 133435, "epoch": 3177} {"train_loss": -6.758049011230469, "global_step": 133436, "epoch": 3177} {"train_loss": -6.803793907165527, "global_step": 133437, "epoch": 3177} {"train_loss": -6.768661022186279, "global_step": 133438, "epoch": 3177} {"train_loss": -6.727252006530762, "global_step": 133439, "epoch": 3177} {"train_loss": -6.675686359405518, "global_step": 133440, "epoch": 3177} {"train_loss": -6.637320518493652, "global_step": 133441, "epoch": 3177} {"train_loss": -6.7064208984375, "global_step": 133442, "epoch": 3177} {"train_loss": -6.770196437835693, "global_step": 133443, "epoch": 3177} {"train_loss": -6.653159141540527, "global_step": 133444, "epoch": 3177} {"train_loss": -6.786901473999023, "global_step": 133445, "epoch": 3177} {"train_loss": -6.8696746826171875, "global_step": 133446, "epoch": 3177} {"train_loss": -6.89133358001709, "global_step": 133447, "epoch": 3177} {"train_loss": -6.732784271240234, "global_step": 133448, "epoch": 3177} {"train_loss": -6.631089687347412, "global_step": 133449, "epoch": 3177} {"train_loss": -6.693985462188721, "global_step": 133450, "epoch": 3177} {"train_loss": -6.809364318847656, "global_step": 133451, "epoch": 3177} {"train_loss": -6.708959579467773, "global_step": 133452, "epoch": 3177} {"train_loss": -6.742000579833984, "global_step": 133453, "epoch": 3177} {"train_loss": -6.630733966827393, "global_step": 133454, "epoch": 3177} {"train_loss": -6.664166450500488, "global_step": 133455, "epoch": 3177} {"train_loss": -6.689280033111572, "global_step": 133456, "epoch": 3177} {"train_loss": -6.674159526824951, "global_step": 133457, "epoch": 3177} {"train_loss": -6.548005104064941, "global_step": 133458, "epoch": 3177} {"train_loss": -6.486868858337402, "global_step": 133459, "epoch": 3177} {"train_loss": -6.712492942810059, "global_step": 133460, "epoch": 3177} {"train_loss": -6.494955539703369, "global_step": 133461, "epoch": 3177} {"train_loss": -6.559060573577881, "global_step": 133462, "epoch": 3177} {"train_loss": -6.534415245056152, "global_step": 133463, "epoch": 3177} {"train_loss": -6.587896823883057, "global_step": 133464, "epoch": 3177} {"train_loss": -6.684553623199463, "global_step": 133465, "epoch": 3177} {"train_loss": -6.642205238342285, "global_step": 133466, "epoch": 3177} {"train_loss": -6.730348110198975, "global_step": 133467, "epoch": 3177} {"train_loss": -6.68131160736084, "global_step": 133468, "epoch": 3177} {"train_loss": -6.565356254577637, "global_step": 133469, "epoch": 3177} {"train_loss": -6.721640586853027, "global_step": 133470, "epoch": 3177} {"train_loss": -6.684023857116699, "global_step": 133471, "epoch": 3177} {"train_loss": -6.731459617614746, "global_step": 133472, "epoch": 3177} {"train_loss": -6.704479217529297, "global_step": 133473, "epoch": 3177} {"train_loss": -6.639493942260742, "global_step": 133474, "epoch": 3177} {"train_loss": -6.687532776877994, "global_step": 133475, "epoch": 3177, "val_loss": 77596.4453125} {"train_loss": -6.689868450164795, "global_step": 133476, "epoch": 3178} {"train_loss": -6.656642913818359, "global_step": 133477, "epoch": 3178} {"train_loss": -6.620657920837402, "global_step": 133478, "epoch": 3178} {"train_loss": -6.631997585296631, "global_step": 133479, "epoch": 3178} {"train_loss": -6.720987319946289, "global_step": 133480, "epoch": 3178} {"train_loss": -6.746233940124512, "global_step": 133481, "epoch": 3178} {"train_loss": -6.8609442710876465, "global_step": 133482, "epoch": 3178} {"train_loss": -6.736009120941162, "global_step": 133483, "epoch": 3178} {"train_loss": -6.711160659790039, "global_step": 133484, "epoch": 3178} {"train_loss": -6.674095153808594, "global_step": 133485, "epoch": 3178} {"train_loss": -6.698383331298828, "global_step": 133486, "epoch": 3178} {"train_loss": -6.714113712310791, "global_step": 133487, "epoch": 3178} {"train_loss": -6.696982383728027, "global_step": 133488, "epoch": 3178} {"train_loss": -6.79973840713501, "global_step": 133489, "epoch": 3178} {"train_loss": -6.761130332946777, "global_step": 133490, "epoch": 3178} {"train_loss": -6.736906051635742, "global_step": 133491, "epoch": 3178} {"train_loss": -6.786956787109375, "global_step": 133492, "epoch": 3178} {"train_loss": -6.714660167694092, "global_step": 133493, "epoch": 3178} {"train_loss": -6.769891738891602, "global_step": 133494, "epoch": 3178} {"train_loss": -6.701121807098389, "global_step": 133495, "epoch": 3178} {"train_loss": -6.719062328338623, "global_step": 133496, "epoch": 3178} {"train_loss": -6.581210136413574, "global_step": 133497, "epoch": 3178} {"train_loss": -6.589718818664551, "global_step": 133498, "epoch": 3178} {"train_loss": -6.536088466644287, "global_step": 133499, "epoch": 3178} {"train_loss": -6.450076103210449, "global_step": 133500, "epoch": 3178} {"train_loss": -6.697423458099365, "global_step": 133501, "epoch": 3178} {"train_loss": -6.513269901275635, "global_step": 133502, "epoch": 3178} {"train_loss": -6.747314453125, "global_step": 133503, "epoch": 3178} {"train_loss": -6.58945894241333, "global_step": 133504, "epoch": 3178} {"train_loss": -6.606203079223633, "global_step": 133505, "epoch": 3178} {"train_loss": -6.616772651672363, "global_step": 133506, "epoch": 3178} {"train_loss": -6.605432510375977, "global_step": 133507, "epoch": 3178} {"train_loss": -6.680153846740723, "global_step": 133508, "epoch": 3178} {"train_loss": -6.562838077545166, "global_step": 133509, "epoch": 3178} {"train_loss": -6.717145919799805, "global_step": 133510, "epoch": 3178} {"train_loss": -6.790205955505371, "global_step": 133511, "epoch": 3178} {"train_loss": -6.669333457946777, "global_step": 133512, "epoch": 3178} {"train_loss": -6.71021032333374, "global_step": 133513, "epoch": 3178} {"train_loss": -6.628878593444824, "global_step": 133514, "epoch": 3178} {"train_loss": -6.595775127410889, "global_step": 133515, "epoch": 3178} {"train_loss": -6.633925914764404, "global_step": 133516, "epoch": 3178} {"train_loss": -6.675503367469425, "global_step": 133517, "epoch": 3178, "val_loss": 77804.234375} {"train_loss": -6.710533142089844, "global_step": 133518, "epoch": 3179} {"train_loss": -6.677498817443848, "global_step": 133519, "epoch": 3179} {"train_loss": -6.66572904586792, "global_step": 133520, "epoch": 3179} {"train_loss": -6.611118793487549, "global_step": 133521, "epoch": 3179} {"train_loss": -6.641618251800537, "global_step": 133522, "epoch": 3179} {"train_loss": -6.841372489929199, "global_step": 133523, "epoch": 3179} {"train_loss": -6.779438018798828, "global_step": 133524, "epoch": 3179} {"train_loss": -6.7452239990234375, "global_step": 133525, "epoch": 3179} {"train_loss": -6.761965274810791, "global_step": 133526, "epoch": 3179} {"train_loss": -6.75876522064209, "global_step": 133527, "epoch": 3179} {"train_loss": -6.846323013305664, "global_step": 133528, "epoch": 3179} {"train_loss": -6.711370944976807, "global_step": 133529, "epoch": 3179} {"train_loss": -6.57843017578125, "global_step": 133530, "epoch": 3179} {"train_loss": -6.743992328643799, "global_step": 133531, "epoch": 3179} {"train_loss": -6.80214786529541, "global_step": 133532, "epoch": 3179} {"train_loss": -6.66721773147583, "global_step": 133533, "epoch": 3179} {"train_loss": -6.760867118835449, "global_step": 133534, "epoch": 3179} {"train_loss": -6.653801441192627, "global_step": 133535, "epoch": 3179} {"train_loss": -6.712048530578613, "global_step": 133536, "epoch": 3179} {"train_loss": -6.755712509155273, "global_step": 133537, "epoch": 3179} {"train_loss": -6.716891765594482, "global_step": 133538, "epoch": 3179} {"train_loss": -6.69434928894043, "global_step": 133539, "epoch": 3179} {"train_loss": -6.731706142425537, "global_step": 133540, "epoch": 3179} {"train_loss": -6.79957389831543, "global_step": 133541, "epoch": 3179} {"train_loss": -6.63372802734375, "global_step": 133542, "epoch": 3179} {"train_loss": -6.69248628616333, "global_step": 133543, "epoch": 3179} {"train_loss": -6.613739013671875, "global_step": 133544, "epoch": 3179} {"train_loss": -6.700547695159912, "global_step": 133545, "epoch": 3179} {"train_loss": -6.700101852416992, "global_step": 133546, "epoch": 3179} {"train_loss": -6.711944103240967, "global_step": 133547, "epoch": 3179} {"train_loss": -6.711527347564697, "global_step": 133548, "epoch": 3179} {"train_loss": -6.653165817260742, "global_step": 133549, "epoch": 3179} {"train_loss": -6.687560558319092, "global_step": 133550, "epoch": 3179} {"train_loss": -6.5577521324157715, "global_step": 133551, "epoch": 3179} {"train_loss": -6.675634384155273, "global_step": 133552, "epoch": 3179} {"train_loss": -6.815073490142822, "global_step": 133553, "epoch": 3179} {"train_loss": -6.620999336242676, "global_step": 133554, "epoch": 3179} {"train_loss": -6.66558313369751, "global_step": 133555, "epoch": 3179} {"train_loss": -6.786371231079102, "global_step": 133556, "epoch": 3179} {"train_loss": -6.654843330383301, "global_step": 133557, "epoch": 3179} {"train_loss": -6.730781078338623, "global_step": 133558, "epoch": 3179} {"train_loss": -6.70417747043428, "global_step": 133559, "epoch": 3179, "val_loss": 77863.2109375} {"train_loss": -6.634552955627441, "global_step": 133560, "epoch": 3180} {"train_loss": -6.810598373413086, "global_step": 133561, "epoch": 3180} {"train_loss": -6.812824726104736, "global_step": 133562, "epoch": 3180} {"train_loss": -6.716508388519287, "global_step": 133563, "epoch": 3180} {"train_loss": -6.738685607910156, "global_step": 133564, "epoch": 3180} {"train_loss": -6.740331172943115, "global_step": 133565, "epoch": 3180} {"train_loss": -6.677585601806641, "global_step": 133566, "epoch": 3180} {"train_loss": -6.894391059875488, "global_step": 133567, "epoch": 3180} {"train_loss": -6.842921257019043, "global_step": 133568, "epoch": 3180} {"train_loss": -6.713259696960449, "global_step": 133569, "epoch": 3180} {"train_loss": -6.721792221069336, "global_step": 133570, "epoch": 3180} {"train_loss": -6.802827835083008, "global_step": 133571, "epoch": 3180} {"train_loss": -6.718944549560547, "global_step": 133572, "epoch": 3180} {"train_loss": -6.684450626373291, "global_step": 133573, "epoch": 3180} {"train_loss": -6.7934064865112305, "global_step": 133574, "epoch": 3180} {"train_loss": -6.676111221313477, "global_step": 133575, "epoch": 3180} {"train_loss": -6.741610527038574, "global_step": 133576, "epoch": 3180} {"train_loss": -6.6909050941467285, "global_step": 133577, "epoch": 3180} {"train_loss": -6.712368965148926, "global_step": 133578, "epoch": 3180} {"train_loss": -6.573799133300781, "global_step": 133579, "epoch": 3180} {"train_loss": -6.733412742614746, "global_step": 133580, "epoch": 3180} {"train_loss": -6.61308479309082, "global_step": 133581, "epoch": 3180} {"train_loss": -6.656391620635986, "global_step": 133582, "epoch": 3180} {"train_loss": -6.821383953094482, "global_step": 133583, "epoch": 3180} {"train_loss": -6.754883289337158, "global_step": 133584, "epoch": 3180} {"train_loss": -6.793386459350586, "global_step": 133585, "epoch": 3180} {"train_loss": -6.710119247436523, "global_step": 133586, "epoch": 3180} {"train_loss": -6.735866546630859, "global_step": 133587, "epoch": 3180} {"train_loss": -6.83963680267334, "global_step": 133588, "epoch": 3180} {"train_loss": -6.646226406097412, "global_step": 133589, "epoch": 3180} {"train_loss": -6.62025785446167, "global_step": 133590, "epoch": 3180} {"train_loss": -6.62169075012207, "global_step": 133591, "epoch": 3180} {"train_loss": -6.749076843261719, "global_step": 133592, "epoch": 3180} {"train_loss": -6.830348968505859, "global_step": 133593, "epoch": 3180} {"train_loss": -6.659518241882324, "global_step": 133594, "epoch": 3180} {"train_loss": -6.708139419555664, "global_step": 133595, "epoch": 3180} {"train_loss": -6.857879638671875, "global_step": 133596, "epoch": 3180} {"train_loss": -6.725045204162598, "global_step": 133597, "epoch": 3180} {"train_loss": -6.630111217498779, "global_step": 133598, "epoch": 3180} {"train_loss": -6.7968339920043945, "global_step": 133599, "epoch": 3180} {"train_loss": -6.707290172576904, "global_step": 133600, "epoch": 3180} {"train_loss": -6.728607404799688, "global_step": 133601, "epoch": 3180, "val_loss": 77703.0625} {"train_loss": -6.819314002990723, "global_step": 133602, "epoch": 3181} {"train_loss": -6.795511722564697, "global_step": 133603, "epoch": 3181} {"train_loss": -6.768305778503418, "global_step": 133604, "epoch": 3181} {"train_loss": -6.75645637512207, "global_step": 133605, "epoch": 3181} {"train_loss": -6.736600399017334, "global_step": 133606, "epoch": 3181} {"train_loss": -6.7865753173828125, "global_step": 133607, "epoch": 3181} {"train_loss": -6.684521675109863, "global_step": 133608, "epoch": 3181} {"train_loss": -6.755385875701904, "global_step": 133609, "epoch": 3181} {"train_loss": -6.607134819030762, "global_step": 133610, "epoch": 3181} {"train_loss": -6.878249168395996, "global_step": 133611, "epoch": 3181} {"train_loss": -6.709804058074951, "global_step": 133612, "epoch": 3181} {"train_loss": -6.783847332000732, "global_step": 133613, "epoch": 3181} {"train_loss": -6.792035102844238, "global_step": 133614, "epoch": 3181} {"train_loss": -6.689396381378174, "global_step": 133615, "epoch": 3181} {"train_loss": -6.729696750640869, "global_step": 133616, "epoch": 3181} {"train_loss": -6.775035858154297, "global_step": 133617, "epoch": 3181} {"train_loss": -6.719381809234619, "global_step": 133618, "epoch": 3181} {"train_loss": -6.645112991333008, "global_step": 133619, "epoch": 3181} {"train_loss": -6.79103422164917, "global_step": 133620, "epoch": 3181} {"train_loss": -6.7306013107299805, "global_step": 133621, "epoch": 3181} {"train_loss": -6.6512556076049805, "global_step": 133622, "epoch": 3181} {"train_loss": -6.788891792297363, "global_step": 133623, "epoch": 3181} {"train_loss": -6.655577659606934, "global_step": 133624, "epoch": 3181} {"train_loss": -6.631711483001709, "global_step": 133625, "epoch": 3181} {"train_loss": -6.785061359405518, "global_step": 133626, "epoch": 3181} {"train_loss": -6.716726779937744, "global_step": 133627, "epoch": 3181} {"train_loss": -6.69556999206543, "global_step": 133628, "epoch": 3181} {"train_loss": -6.7931132316589355, "global_step": 133629, "epoch": 3181} {"train_loss": -6.631110191345215, "global_step": 133630, "epoch": 3181} {"train_loss": -6.7599334716796875, "global_step": 133631, "epoch": 3181} {"train_loss": -6.69278621673584, "global_step": 133632, "epoch": 3181} {"train_loss": -6.728092670440674, "global_step": 133633, "epoch": 3181} {"train_loss": -6.712245464324951, "global_step": 133634, "epoch": 3181} {"train_loss": -6.664901256561279, "global_step": 133635, "epoch": 3181} {"train_loss": -6.756669998168945, "global_step": 133636, "epoch": 3181} {"train_loss": -6.727750778198242, "global_step": 133637, "epoch": 3181} {"train_loss": -6.669795036315918, "global_step": 133638, "epoch": 3181} {"train_loss": -6.681067943572998, "global_step": 133639, "epoch": 3181} {"train_loss": -6.74257755279541, "global_step": 133640, "epoch": 3181} {"train_loss": -6.695556640625, "global_step": 133641, "epoch": 3181} {"train_loss": -6.628262519836426, "global_step": 133642, "epoch": 3181} {"train_loss": -6.728324061348324, "global_step": 133643, "epoch": 3181, "val_loss": 77620.3125} {"train_loss": -6.77963399887085, "global_step": 133644, "epoch": 3182} {"train_loss": -6.712576866149902, "global_step": 133645, "epoch": 3182} {"train_loss": -6.758406162261963, "global_step": 133646, "epoch": 3182} {"train_loss": -6.782960891723633, "global_step": 133647, "epoch": 3182} {"train_loss": -6.795839309692383, "global_step": 133648, "epoch": 3182} {"train_loss": -6.835857391357422, "global_step": 133649, "epoch": 3182} {"train_loss": -6.5722455978393555, "global_step": 133650, "epoch": 3182} {"train_loss": -6.642642498016357, "global_step": 133651, "epoch": 3182} {"train_loss": -6.67784309387207, "global_step": 133652, "epoch": 3182} {"train_loss": -6.6728105545043945, "global_step": 133653, "epoch": 3182} {"train_loss": -6.741331100463867, "global_step": 133654, "epoch": 3182} {"train_loss": -6.834437370300293, "global_step": 133655, "epoch": 3182} {"train_loss": -6.756061553955078, "global_step": 133656, "epoch": 3182} {"train_loss": -6.651782035827637, "global_step": 133657, "epoch": 3182} {"train_loss": -6.72498083114624, "global_step": 133658, "epoch": 3182} {"train_loss": -6.713813781738281, "global_step": 133659, "epoch": 3182} {"train_loss": -6.845581531524658, "global_step": 133660, "epoch": 3182} {"train_loss": -6.747997283935547, "global_step": 133661, "epoch": 3182} {"train_loss": -6.71498441696167, "global_step": 133662, "epoch": 3182} {"train_loss": -6.7490339279174805, "global_step": 133663, "epoch": 3182} {"train_loss": -6.797422409057617, "global_step": 133664, "epoch": 3182} {"train_loss": -6.742059230804443, "global_step": 133665, "epoch": 3182} {"train_loss": -6.812709808349609, "global_step": 133666, "epoch": 3182} {"train_loss": -6.626514911651611, "global_step": 133667, "epoch": 3182} {"train_loss": -6.706944942474365, "global_step": 133668, "epoch": 3182} {"train_loss": -6.745687484741211, "global_step": 133669, "epoch": 3182} {"train_loss": -6.781954288482666, "global_step": 133670, "epoch": 3182} {"train_loss": -6.5712890625, "global_step": 133671, "epoch": 3182} {"train_loss": -6.751412391662598, "global_step": 133672, "epoch": 3182} {"train_loss": -6.723341941833496, "global_step": 133673, "epoch": 3182} {"train_loss": -6.557801246643066, "global_step": 133674, "epoch": 3182} {"train_loss": -6.632244110107422, "global_step": 133675, "epoch": 3182} {"train_loss": -6.637317657470703, "global_step": 133676, "epoch": 3182} {"train_loss": -6.716064453125, "global_step": 133677, "epoch": 3182} {"train_loss": -6.592893600463867, "global_step": 133678, "epoch": 3182} {"train_loss": -6.657371997833252, "global_step": 133679, "epoch": 3182} {"train_loss": -6.665287971496582, "global_step": 133680, "epoch": 3182} {"train_loss": -6.710364818572998, "global_step": 133681, "epoch": 3182} {"train_loss": -6.75963020324707, "global_step": 133682, "epoch": 3182} {"train_loss": -6.734122276306152, "global_step": 133683, "epoch": 3182} {"train_loss": -6.695603370666504, "global_step": 133684, "epoch": 3182} {"train_loss": -6.712230023883638, "global_step": 133685, "epoch": 3182, "val_loss": 77894.328125} {"train_loss": -6.699313163757324, "global_step": 133686, "epoch": 3183} {"train_loss": -6.685637950897217, "global_step": 133687, "epoch": 3183} {"train_loss": -6.832890510559082, "global_step": 133688, "epoch": 3183} {"train_loss": -6.72867488861084, "global_step": 133689, "epoch": 3183} {"train_loss": -6.693264961242676, "global_step": 133690, "epoch": 3183} {"train_loss": -6.753208637237549, "global_step": 133691, "epoch": 3183} {"train_loss": -6.7137651443481445, "global_step": 133692, "epoch": 3183} {"train_loss": -6.660455703735352, "global_step": 133693, "epoch": 3183} {"train_loss": -6.709193706512451, "global_step": 133694, "epoch": 3183} {"train_loss": -6.703991889953613, "global_step": 133695, "epoch": 3183} {"train_loss": -6.692481994628906, "global_step": 133696, "epoch": 3183} {"train_loss": -6.7688188552856445, "global_step": 133697, "epoch": 3183} {"train_loss": -6.846926212310791, "global_step": 133698, "epoch": 3183} {"train_loss": -6.637258052825928, "global_step": 133699, "epoch": 3183} {"train_loss": -6.76638126373291, "global_step": 133700, "epoch": 3183} {"train_loss": -6.777050495147705, "global_step": 133701, "epoch": 3183} {"train_loss": -6.779782295227051, "global_step": 133702, "epoch": 3183} {"train_loss": -6.7371416091918945, "global_step": 133703, "epoch": 3183} {"train_loss": -6.796611785888672, "global_step": 133704, "epoch": 3183} {"train_loss": -6.711063385009766, "global_step": 133705, "epoch": 3183} {"train_loss": -6.648266792297363, "global_step": 133706, "epoch": 3183} {"train_loss": -6.706428527832031, "global_step": 133707, "epoch": 3183} {"train_loss": -6.750301361083984, "global_step": 133708, "epoch": 3183} {"train_loss": -6.667953968048096, "global_step": 133709, "epoch": 3183} {"train_loss": -6.690560340881348, "global_step": 133710, "epoch": 3183} {"train_loss": -6.651501178741455, "global_step": 133711, "epoch": 3183} {"train_loss": -6.743917465209961, "global_step": 133712, "epoch": 3183} {"train_loss": -6.680091381072998, "global_step": 133713, "epoch": 3183} {"train_loss": -6.781381130218506, "global_step": 133714, "epoch": 3183} {"train_loss": -6.63022518157959, "global_step": 133715, "epoch": 3183} {"train_loss": -6.56165075302124, "global_step": 133716, "epoch": 3183} {"train_loss": -6.6272125244140625, "global_step": 133717, "epoch": 3183} {"train_loss": -6.6645002365112305, "global_step": 133718, "epoch": 3183} {"train_loss": -6.619848251342773, "global_step": 133719, "epoch": 3183} {"train_loss": -6.64216947555542, "global_step": 133720, "epoch": 3183} {"train_loss": -6.585062026977539, "global_step": 133721, "epoch": 3183} {"train_loss": -6.646063804626465, "global_step": 133722, "epoch": 3183} {"train_loss": -6.695494651794434, "global_step": 133723, "epoch": 3183} {"train_loss": -6.570807456970215, "global_step": 133724, "epoch": 3183} {"train_loss": -6.758640766143799, "global_step": 133725, "epoch": 3183} {"train_loss": -6.748671054840088, "global_step": 133726, "epoch": 3183} {"train_loss": -6.701621884391422, "global_step": 133727, "epoch": 3183, "val_loss": 77510.875} {"train_loss": -6.669558048248291, "global_step": 133728, "epoch": 3184} {"train_loss": -6.786577224731445, "global_step": 133729, "epoch": 3184} {"train_loss": -6.6938066482543945, "global_step": 133730, "epoch": 3184} {"train_loss": -6.698449611663818, "global_step": 133731, "epoch": 3184} {"train_loss": -6.704794406890869, "global_step": 133732, "epoch": 3184} {"train_loss": -6.827953338623047, "global_step": 133733, "epoch": 3184} {"train_loss": -6.714022636413574, "global_step": 133734, "epoch": 3184} {"train_loss": -6.704890251159668, "global_step": 133735, "epoch": 3184} {"train_loss": -6.739342212677002, "global_step": 133736, "epoch": 3184} {"train_loss": -6.6688232421875, "global_step": 133737, "epoch": 3184} {"train_loss": -6.66105318069458, "global_step": 133738, "epoch": 3184} {"train_loss": -6.762242794036865, "global_step": 133739, "epoch": 3184} {"train_loss": -6.812346458435059, "global_step": 133740, "epoch": 3184} {"train_loss": -6.728266716003418, "global_step": 133741, "epoch": 3184} {"train_loss": -6.7625532150268555, "global_step": 133742, "epoch": 3184} {"train_loss": -6.667335033416748, "global_step": 133743, "epoch": 3184} {"train_loss": -6.720725059509277, "global_step": 133744, "epoch": 3184} {"train_loss": -6.727560520172119, "global_step": 133745, "epoch": 3184} {"train_loss": -6.614328384399414, "global_step": 133746, "epoch": 3184} {"train_loss": -6.640735149383545, "global_step": 133747, "epoch": 3184} {"train_loss": -6.6251020431518555, "global_step": 133748, "epoch": 3184} {"train_loss": -6.665955066680908, "global_step": 133749, "epoch": 3184} {"train_loss": -6.783511161804199, "global_step": 133750, "epoch": 3184} {"train_loss": -6.727029800415039, "global_step": 133751, "epoch": 3184} {"train_loss": -6.633765697479248, "global_step": 133752, "epoch": 3184} {"train_loss": -6.675053119659424, "global_step": 133753, "epoch": 3184} {"train_loss": -6.663614273071289, "global_step": 133754, "epoch": 3184} {"train_loss": -6.747386932373047, "global_step": 133755, "epoch": 3184} {"train_loss": -6.670127868652344, "global_step": 133756, "epoch": 3184} {"train_loss": -6.809884071350098, "global_step": 133757, "epoch": 3184} {"train_loss": -6.6848344802856445, "global_step": 133758, "epoch": 3184} {"train_loss": -6.679819583892822, "global_step": 133759, "epoch": 3184} {"train_loss": -6.758179664611816, "global_step": 133760, "epoch": 3184} {"train_loss": -6.688467979431152, "global_step": 133761, "epoch": 3184} {"train_loss": -6.653239727020264, "global_step": 133762, "epoch": 3184} {"train_loss": -6.773277282714844, "global_step": 133763, "epoch": 3184} {"train_loss": -6.868251800537109, "global_step": 133764, "epoch": 3184} {"train_loss": -6.676167964935303, "global_step": 133765, "epoch": 3184} {"train_loss": -6.657971382141113, "global_step": 133766, "epoch": 3184} {"train_loss": -6.7223920822143555, "global_step": 133767, "epoch": 3184} {"train_loss": -6.5339460372924805, "global_step": 133768, "epoch": 3184} {"train_loss": -6.706162339165097, "global_step": 133769, "epoch": 3184, "val_loss": 77416.0859375} {"train_loss": -6.734140396118164, "global_step": 133770, "epoch": 3185} {"train_loss": -6.720123291015625, "global_step": 133771, "epoch": 3185} {"train_loss": -6.643789291381836, "global_step": 133772, "epoch": 3185} {"train_loss": -6.658015251159668, "global_step": 133773, "epoch": 3185} {"train_loss": -6.7467570304870605, "global_step": 133774, "epoch": 3185} {"train_loss": -6.811777591705322, "global_step": 133775, "epoch": 3185} {"train_loss": -6.743570804595947, "global_step": 133776, "epoch": 3185} {"train_loss": -6.817061424255371, "global_step": 133777, "epoch": 3185} {"train_loss": -6.673676490783691, "global_step": 133778, "epoch": 3185} {"train_loss": -6.698916435241699, "global_step": 133779, "epoch": 3185} {"train_loss": -6.753833770751953, "global_step": 133780, "epoch": 3185} {"train_loss": -6.748566627502441, "global_step": 133781, "epoch": 3185} {"train_loss": -6.5913190841674805, "global_step": 133782, "epoch": 3185} {"train_loss": -6.706640243530273, "global_step": 133783, "epoch": 3185} {"train_loss": -6.70851469039917, "global_step": 133784, "epoch": 3185} {"train_loss": -6.772851943969727, "global_step": 133785, "epoch": 3185} {"train_loss": -6.76265811920166, "global_step": 133786, "epoch": 3185} {"train_loss": -6.632294654846191, "global_step": 133787, "epoch": 3185} {"train_loss": -6.712935447692871, "global_step": 133788, "epoch": 3185} {"train_loss": -6.738902568817139, "global_step": 133789, "epoch": 3185} {"train_loss": -6.751367568969727, "global_step": 133790, "epoch": 3185} {"train_loss": -6.68118953704834, "global_step": 133791, "epoch": 3185} {"train_loss": -6.908773422241211, "global_step": 133792, "epoch": 3185} {"train_loss": -6.581930637359619, "global_step": 133793, "epoch": 3185} {"train_loss": -6.683809280395508, "global_step": 133794, "epoch": 3185} {"train_loss": -6.776410102844238, "global_step": 133795, "epoch": 3185} {"train_loss": -6.64644193649292, "global_step": 133796, "epoch": 3185} {"train_loss": -6.744170188903809, "global_step": 133797, "epoch": 3185} {"train_loss": -6.685958385467529, "global_step": 133798, "epoch": 3185} {"train_loss": -6.791910171508789, "global_step": 133799, "epoch": 3185} {"train_loss": -6.656371593475342, "global_step": 133800, "epoch": 3185} {"train_loss": -6.6369428634643555, "global_step": 133801, "epoch": 3185} {"train_loss": -6.6010050773620605, "global_step": 133802, "epoch": 3185} {"train_loss": -6.735591411590576, "global_step": 133803, "epoch": 3185} {"train_loss": -6.62596321105957, "global_step": 133804, "epoch": 3185} {"train_loss": -6.789424896240234, "global_step": 133805, "epoch": 3185} {"train_loss": -6.780648231506348, "global_step": 133806, "epoch": 3185} {"train_loss": -6.725933074951172, "global_step": 133807, "epoch": 3185} {"train_loss": -6.766599178314209, "global_step": 133808, "epoch": 3185} {"train_loss": -6.77239990234375, "global_step": 133809, "epoch": 3185} {"train_loss": -6.64470100402832, "global_step": 133810, "epoch": 3185} {"train_loss": -6.716574850536528, "global_step": 133811, "epoch": 3185, "val_loss": 77253.0625} {"train_loss": -6.7431230545043945, "global_step": 133812, "epoch": 3186} {"train_loss": -6.762559413909912, "global_step": 133813, "epoch": 3186} {"train_loss": -6.79710578918457, "global_step": 133814, "epoch": 3186} {"train_loss": -6.8202128410339355, "global_step": 133815, "epoch": 3186} {"train_loss": -6.712911605834961, "global_step": 133816, "epoch": 3186} {"train_loss": -6.7169084548950195, "global_step": 133817, "epoch": 3186} {"train_loss": -6.729544162750244, "global_step": 133818, "epoch": 3186} {"train_loss": -6.749117374420166, "global_step": 133819, "epoch": 3186} {"train_loss": -6.734621047973633, "global_step": 133820, "epoch": 3186} {"train_loss": -6.730046272277832, "global_step": 133821, "epoch": 3186} {"train_loss": -6.635098457336426, "global_step": 133822, "epoch": 3186} {"train_loss": -6.577759742736816, "global_step": 133823, "epoch": 3186} {"train_loss": -6.596249580383301, "global_step": 133824, "epoch": 3186} {"train_loss": -6.59996223449707, "global_step": 133825, "epoch": 3186} {"train_loss": -6.468101978302002, "global_step": 133826, "epoch": 3186} {"train_loss": -6.577691555023193, "global_step": 133827, "epoch": 3186} {"train_loss": -6.677657127380371, "global_step": 133828, "epoch": 3186} {"train_loss": -6.502412796020508, "global_step": 133829, "epoch": 3186} {"train_loss": -6.538148403167725, "global_step": 133830, "epoch": 3186} {"train_loss": -6.545591354370117, "global_step": 133831, "epoch": 3186} {"train_loss": -6.618145942687988, "global_step": 133832, "epoch": 3186} {"train_loss": -6.594452857971191, "global_step": 133833, "epoch": 3186} {"train_loss": -6.641213417053223, "global_step": 133834, "epoch": 3186} {"train_loss": -6.479310512542725, "global_step": 133835, "epoch": 3186} {"train_loss": -6.646817207336426, "global_step": 133836, "epoch": 3186} {"train_loss": -6.5822248458862305, "global_step": 133837, "epoch": 3186} {"train_loss": -6.680475234985352, "global_step": 133838, "epoch": 3186} {"train_loss": -6.680497646331787, "global_step": 133839, "epoch": 3186} {"train_loss": -6.624337196350098, "global_step": 133840, "epoch": 3186} {"train_loss": -6.496827125549316, "global_step": 133841, "epoch": 3186} {"train_loss": -6.806135177612305, "global_step": 133842, "epoch": 3186} {"train_loss": -6.652489185333252, "global_step": 133843, "epoch": 3186} {"train_loss": -6.6812663078308105, "global_step": 133844, "epoch": 3186} {"train_loss": -6.600864410400391, "global_step": 133845, "epoch": 3186} {"train_loss": -6.67140007019043, "global_step": 133846, "epoch": 3186} {"train_loss": -6.745139122009277, "global_step": 133847, "epoch": 3186} {"train_loss": -6.526644706726074, "global_step": 133848, "epoch": 3186} {"train_loss": -6.728944778442383, "global_step": 133849, "epoch": 3186} {"train_loss": -6.585615158081055, "global_step": 133850, "epoch": 3186} {"train_loss": -6.773406505584717, "global_step": 133851, "epoch": 3186} {"train_loss": -6.756002426147461, "global_step": 133852, "epoch": 3186} {"train_loss": -6.6513253053029375, "global_step": 133853, "epoch": 3186, "val_loss": 77590.453125} {"train_loss": -6.726154327392578, "global_step": 133854, "epoch": 3187} {"train_loss": -6.621047019958496, "global_step": 133855, "epoch": 3187} {"train_loss": -6.619690895080566, "global_step": 133856, "epoch": 3187} {"train_loss": -6.652830600738525, "global_step": 133857, "epoch": 3187} {"train_loss": -6.6603474617004395, "global_step": 133858, "epoch": 3187} {"train_loss": -6.6723809242248535, "global_step": 133859, "epoch": 3187} {"train_loss": -6.55162239074707, "global_step": 133860, "epoch": 3187} {"train_loss": -6.626290798187256, "global_step": 133861, "epoch": 3187} {"train_loss": -6.698020935058594, "global_step": 133862, "epoch": 3187} {"train_loss": -6.566873550415039, "global_step": 133863, "epoch": 3187} {"train_loss": -6.638526439666748, "global_step": 133864, "epoch": 3187} {"train_loss": -6.654843330383301, "global_step": 133865, "epoch": 3187} {"train_loss": -6.567680358886719, "global_step": 133866, "epoch": 3187} {"train_loss": -6.6229047775268555, "global_step": 133867, "epoch": 3187} {"train_loss": -6.632678508758545, "global_step": 133868, "epoch": 3187} {"train_loss": -6.676868915557861, "global_step": 133869, "epoch": 3187} {"train_loss": -6.680387496948242, "global_step": 133870, "epoch": 3187} {"train_loss": -6.706435203552246, "global_step": 133871, "epoch": 3187} {"train_loss": -6.681229114532471, "global_step": 133872, "epoch": 3187} {"train_loss": -6.77854061126709, "global_step": 133873, "epoch": 3187} {"train_loss": -6.655832290649414, "global_step": 133874, "epoch": 3187} {"train_loss": -6.719641208648682, "global_step": 133875, "epoch": 3187} {"train_loss": -6.732969284057617, "global_step": 133876, "epoch": 3187} {"train_loss": -6.657641410827637, "global_step": 133877, "epoch": 3187} {"train_loss": -6.7129621505737305, "global_step": 133878, "epoch": 3187} {"train_loss": -6.6527204513549805, "global_step": 133879, "epoch": 3187} {"train_loss": -6.694330215454102, "global_step": 133880, "epoch": 3187} {"train_loss": -6.691005706787109, "global_step": 133881, "epoch": 3187} {"train_loss": -6.783291339874268, "global_step": 133882, "epoch": 3187} {"train_loss": -6.73642110824585, "global_step": 133883, "epoch": 3187} {"train_loss": -6.698540687561035, "global_step": 133884, "epoch": 3187} {"train_loss": -6.668801307678223, "global_step": 133885, "epoch": 3187} {"train_loss": -6.854924201965332, "global_step": 133886, "epoch": 3187} {"train_loss": -6.783517837524414, "global_step": 133887, "epoch": 3187} {"train_loss": -6.679805278778076, "global_step": 133888, "epoch": 3187} {"train_loss": -6.655789375305176, "global_step": 133889, "epoch": 3187} {"train_loss": -6.66412878036499, "global_step": 133890, "epoch": 3187} {"train_loss": -6.56483268737793, "global_step": 133891, "epoch": 3187} {"train_loss": -6.707364082336426, "global_step": 133892, "epoch": 3187} {"train_loss": -6.61104154586792, "global_step": 133893, "epoch": 3187} {"train_loss": -6.546430587768555, "global_step": 133894, "epoch": 3187} {"train_loss": -6.670484486080351, "global_step": 133895, "epoch": 3187, "val_loss": 77918.59375} {"train_loss": -6.617039680480957, "global_step": 133896, "epoch": 3188} {"train_loss": -6.640602111816406, "global_step": 133897, "epoch": 3188} {"train_loss": -6.705122947692871, "global_step": 133898, "epoch": 3188} {"train_loss": -6.730306625366211, "global_step": 133899, "epoch": 3188} {"train_loss": -6.725488185882568, "global_step": 133900, "epoch": 3188} {"train_loss": -6.7539381980896, "global_step": 133901, "epoch": 3188} {"train_loss": -6.668088912963867, "global_step": 133902, "epoch": 3188} {"train_loss": -6.624159812927246, "global_step": 133903, "epoch": 3188} {"train_loss": -6.718089580535889, "global_step": 133904, "epoch": 3188} {"train_loss": -6.627429485321045, "global_step": 133905, "epoch": 3188} {"train_loss": -6.7750020027160645, "global_step": 133906, "epoch": 3188} {"train_loss": -6.7459611892700195, "global_step": 133907, "epoch": 3188} {"train_loss": -6.69638729095459, "global_step": 133908, "epoch": 3188} {"train_loss": -6.66707706451416, "global_step": 133909, "epoch": 3188} {"train_loss": -6.732443809509277, "global_step": 133910, "epoch": 3188} {"train_loss": -6.7000837326049805, "global_step": 133911, "epoch": 3188} {"train_loss": -6.756628036499023, "global_step": 133912, "epoch": 3188} {"train_loss": -6.626190185546875, "global_step": 133913, "epoch": 3188} {"train_loss": -6.714998722076416, "global_step": 133914, "epoch": 3188} {"train_loss": -6.774189472198486, "global_step": 133915, "epoch": 3188} {"train_loss": -6.6740546226501465, "global_step": 133916, "epoch": 3188} {"train_loss": -6.711677074432373, "global_step": 133917, "epoch": 3188} {"train_loss": -6.619359970092773, "global_step": 133918, "epoch": 3188} {"train_loss": -6.695838928222656, "global_step": 133919, "epoch": 3188} {"train_loss": -6.694123268127441, "global_step": 133920, "epoch": 3188} {"train_loss": -6.723354339599609, "global_step": 133921, "epoch": 3188} {"train_loss": -6.6161603927612305, "global_step": 133922, "epoch": 3188} {"train_loss": -6.8260931968688965, "global_step": 133923, "epoch": 3188} {"train_loss": -6.6004743576049805, "global_step": 133924, "epoch": 3188} {"train_loss": -6.482831954956055, "global_step": 133925, "epoch": 3188} {"train_loss": -6.695863246917725, "global_step": 133926, "epoch": 3188} {"train_loss": -6.700761795043945, "global_step": 133927, "epoch": 3188} {"train_loss": -6.600250244140625, "global_step": 133928, "epoch": 3188} {"train_loss": -6.618147850036621, "global_step": 133929, "epoch": 3188} {"train_loss": -6.638556003570557, "global_step": 133930, "epoch": 3188} {"train_loss": -6.522952556610107, "global_step": 133931, "epoch": 3188} {"train_loss": -6.756660461425781, "global_step": 133932, "epoch": 3188} {"train_loss": -6.585390567779541, "global_step": 133933, "epoch": 3188} {"train_loss": -6.571347713470459, "global_step": 133934, "epoch": 3188} {"train_loss": -6.659488677978516, "global_step": 133935, "epoch": 3188} {"train_loss": -6.534966468811035, "global_step": 133936, "epoch": 3188} {"train_loss": -6.6703008243015836, "global_step": 133937, "epoch": 3188, "val_loss": 77672.40625} {"train_loss": -6.59406852722168, "global_step": 133938, "epoch": 3189} {"train_loss": -6.786815166473389, "global_step": 133939, "epoch": 3189} {"train_loss": -6.653161525726318, "global_step": 133940, "epoch": 3189} {"train_loss": -6.687305927276611, "global_step": 133941, "epoch": 3189} {"train_loss": -6.678974628448486, "global_step": 133942, "epoch": 3189} {"train_loss": -6.70524263381958, "global_step": 133943, "epoch": 3189} {"train_loss": -6.690532684326172, "global_step": 133944, "epoch": 3189} {"train_loss": -6.730742454528809, "global_step": 133945, "epoch": 3189} {"train_loss": -6.745932102203369, "global_step": 133946, "epoch": 3189} {"train_loss": -6.637169361114502, "global_step": 133947, "epoch": 3189} {"train_loss": -6.667206287384033, "global_step": 133948, "epoch": 3189} {"train_loss": -6.670805931091309, "global_step": 133949, "epoch": 3189} {"train_loss": -6.514758110046387, "global_step": 133950, "epoch": 3189} {"train_loss": -6.721432685852051, "global_step": 133951, "epoch": 3189} {"train_loss": -6.700760841369629, "global_step": 133952, "epoch": 3189} {"train_loss": -6.7443647384643555, "global_step": 133953, "epoch": 3189} {"train_loss": -6.647116184234619, "global_step": 133954, "epoch": 3189} {"train_loss": -6.637770652770996, "global_step": 133955, "epoch": 3189} {"train_loss": -6.687854766845703, "global_step": 133956, "epoch": 3189} {"train_loss": -6.614333152770996, "global_step": 133957, "epoch": 3189} {"train_loss": -6.667058944702148, "global_step": 133958, "epoch": 3189} {"train_loss": -6.706865310668945, "global_step": 133959, "epoch": 3189} {"train_loss": -6.800715923309326, "global_step": 133960, "epoch": 3189} {"train_loss": -6.574712753295898, "global_step": 133961, "epoch": 3189} {"train_loss": -6.714211463928223, "global_step": 133962, "epoch": 3189} {"train_loss": -6.658656120300293, "global_step": 133963, "epoch": 3189} {"train_loss": -6.813971519470215, "global_step": 133964, "epoch": 3189} {"train_loss": -6.8432745933532715, "global_step": 133965, "epoch": 3189} {"train_loss": -6.748331069946289, "global_step": 133966, "epoch": 3189} {"train_loss": -6.726458549499512, "global_step": 133967, "epoch": 3189} {"train_loss": -6.671519756317139, "global_step": 133968, "epoch": 3189} {"train_loss": -6.681903839111328, "global_step": 133969, "epoch": 3189} {"train_loss": -6.7867584228515625, "global_step": 133970, "epoch": 3189} {"train_loss": -6.789314270019531, "global_step": 133971, "epoch": 3189} {"train_loss": -6.927979469299316, "global_step": 133972, "epoch": 3189} {"train_loss": -6.817156791687012, "global_step": 133973, "epoch": 3189} {"train_loss": -6.7468976974487305, "global_step": 133974, "epoch": 3189} {"train_loss": -6.796028137207031, "global_step": 133975, "epoch": 3189} {"train_loss": -6.703690528869629, "global_step": 133976, "epoch": 3189} {"train_loss": -6.762801647186279, "global_step": 133977, "epoch": 3189} {"train_loss": -6.794841766357422, "global_step": 133978, "epoch": 3189} {"train_loss": -6.715852249236334, "global_step": 133979, "epoch": 3189, "val_loss": 77615.78125} {"train_loss": -6.725080490112305, "global_step": 133980, "epoch": 3190} {"train_loss": -6.715060234069824, "global_step": 133981, "epoch": 3190} {"train_loss": -6.717650413513184, "global_step": 133982, "epoch": 3190} {"train_loss": -6.669460773468018, "global_step": 133983, "epoch": 3190} {"train_loss": -6.719778060913086, "global_step": 133984, "epoch": 3190} {"train_loss": -6.714763641357422, "global_step": 133985, "epoch": 3190} {"train_loss": -6.75320291519165, "global_step": 133986, "epoch": 3190} {"train_loss": -6.60513973236084, "global_step": 133987, "epoch": 3190} {"train_loss": -6.600474834442139, "global_step": 133988, "epoch": 3190} {"train_loss": -6.807798385620117, "global_step": 133989, "epoch": 3190} {"train_loss": -6.65151834487915, "global_step": 133990, "epoch": 3190} {"train_loss": -6.582121849060059, "global_step": 133991, "epoch": 3190} {"train_loss": -6.668429374694824, "global_step": 133992, "epoch": 3190} {"train_loss": -6.564766883850098, "global_step": 133993, "epoch": 3190} {"train_loss": -6.664510726928711, "global_step": 133994, "epoch": 3190} {"train_loss": -6.504217147827148, "global_step": 133995, "epoch": 3190} {"train_loss": -6.610846996307373, "global_step": 133996, "epoch": 3190} {"train_loss": -6.629693984985352, "global_step": 133997, "epoch": 3190} {"train_loss": -6.386094093322754, "global_step": 133998, "epoch": 3190} {"train_loss": -6.520971298217773, "global_step": 133999, "epoch": 3190} {"train_loss": -6.590614318847656, "global_step": 134000, "epoch": 3190} {"train_loss": -6.564672470092773, "global_step": 134001, "epoch": 3190} {"train_loss": -6.4586873054504395, "global_step": 134002, "epoch": 3190} {"train_loss": -6.671581745147705, "global_step": 134003, "epoch": 3190} {"train_loss": -6.6031599044799805, "global_step": 134004, "epoch": 3190} {"train_loss": -6.496756553649902, "global_step": 134005, "epoch": 3190} {"train_loss": -6.6336469650268555, "global_step": 134006, "epoch": 3190} {"train_loss": -6.582849502563477, "global_step": 134007, "epoch": 3190} {"train_loss": -6.563511848449707, "global_step": 134008, "epoch": 3190} {"train_loss": -6.60762882232666, "global_step": 134009, "epoch": 3190} {"train_loss": -6.574260711669922, "global_step": 134010, "epoch": 3190} {"train_loss": -6.603959083557129, "global_step": 134011, "epoch": 3190} {"train_loss": -6.695742130279541, "global_step": 134012, "epoch": 3190} {"train_loss": -6.645290374755859, "global_step": 134013, "epoch": 3190} {"train_loss": -6.66871976852417, "global_step": 134014, "epoch": 3190} {"train_loss": -6.642121315002441, "global_step": 134015, "epoch": 3190} {"train_loss": -6.517871379852295, "global_step": 134016, "epoch": 3190} {"train_loss": -6.648797988891602, "global_step": 134017, "epoch": 3190} {"train_loss": -6.728083610534668, "global_step": 134018, "epoch": 3190} {"train_loss": -6.660800933837891, "global_step": 134019, "epoch": 3190} {"train_loss": -6.822120666503906, "global_step": 134020, "epoch": 3190} {"train_loss": -6.630536499477568, "global_step": 134021, "epoch": 3190, "val_loss": 77407.9453125} {"train_loss": -6.656612396240234, "global_step": 134022, "epoch": 3191} {"train_loss": -6.761806488037109, "global_step": 134023, "epoch": 3191} {"train_loss": -6.720142364501953, "global_step": 134024, "epoch": 3191} {"train_loss": -6.761905670166016, "global_step": 134025, "epoch": 3191} {"train_loss": -6.698234558105469, "global_step": 134026, "epoch": 3191} {"train_loss": -6.663911819458008, "global_step": 134027, "epoch": 3191} {"train_loss": -6.700075149536133, "global_step": 134028, "epoch": 3191} {"train_loss": -6.803323268890381, "global_step": 134029, "epoch": 3191} {"train_loss": -6.8240766525268555, "global_step": 134030, "epoch": 3191} {"train_loss": -6.772366523742676, "global_step": 134031, "epoch": 3191} {"train_loss": -6.745532035827637, "global_step": 134032, "epoch": 3191} {"train_loss": -6.671925067901611, "global_step": 134033, "epoch": 3191} {"train_loss": -6.67418098449707, "global_step": 134034, "epoch": 3191} {"train_loss": -6.68489933013916, "global_step": 134035, "epoch": 3191} {"train_loss": -6.653072357177734, "global_step": 134036, "epoch": 3191} {"train_loss": -6.81316614151001, "global_step": 134037, "epoch": 3191} {"train_loss": -6.754889488220215, "global_step": 134038, "epoch": 3191} {"train_loss": -6.672287464141846, "global_step": 134039, "epoch": 3191} {"train_loss": -6.753356456756592, "global_step": 134040, "epoch": 3191} {"train_loss": -6.662710666656494, "global_step": 134041, "epoch": 3191} {"train_loss": -6.6700825691223145, "global_step": 134042, "epoch": 3191} {"train_loss": -6.697120666503906, "global_step": 134043, "epoch": 3191} {"train_loss": -6.777432441711426, "global_step": 134044, "epoch": 3191} {"train_loss": -6.723846435546875, "global_step": 134045, "epoch": 3191} {"train_loss": -6.699673652648926, "global_step": 134046, "epoch": 3191} {"train_loss": -6.810787200927734, "global_step": 134047, "epoch": 3191} {"train_loss": -6.703892707824707, "global_step": 134048, "epoch": 3191} {"train_loss": -6.703561782836914, "global_step": 134049, "epoch": 3191} {"train_loss": -6.665454387664795, "global_step": 134050, "epoch": 3191} {"train_loss": -6.765848636627197, "global_step": 134051, "epoch": 3191} {"train_loss": -6.816036224365234, "global_step": 134052, "epoch": 3191} {"train_loss": -6.704911231994629, "global_step": 134053, "epoch": 3191} {"train_loss": -6.614691734313965, "global_step": 134054, "epoch": 3191} {"train_loss": -6.653194427490234, "global_step": 134055, "epoch": 3191} {"train_loss": -6.6378936767578125, "global_step": 134056, "epoch": 3191} {"train_loss": -6.628335952758789, "global_step": 134057, "epoch": 3191} {"train_loss": -6.6828765869140625, "global_step": 134058, "epoch": 3191} {"train_loss": -6.766115188598633, "global_step": 134059, "epoch": 3191} {"train_loss": -6.590512275695801, "global_step": 134060, "epoch": 3191} {"train_loss": -6.618587493896484, "global_step": 134061, "epoch": 3191} {"train_loss": -6.771701812744141, "global_step": 134062, "epoch": 3191} {"train_loss": -6.709531159628005, "global_step": 134063, "epoch": 3191, "val_loss": 77782.578125} {"train_loss": -6.685968399047852, "global_step": 134064, "epoch": 3192} {"train_loss": -6.810439109802246, "global_step": 134065, "epoch": 3192} {"train_loss": -6.6754584312438965, "global_step": 134066, "epoch": 3192} {"train_loss": -6.7324371337890625, "global_step": 134067, "epoch": 3192} {"train_loss": -6.615200996398926, "global_step": 134068, "epoch": 3192} {"train_loss": -6.782104015350342, "global_step": 134069, "epoch": 3192} {"train_loss": -6.572010040283203, "global_step": 134070, "epoch": 3192} {"train_loss": -6.585109710693359, "global_step": 134071, "epoch": 3192} {"train_loss": -6.512687683105469, "global_step": 134072, "epoch": 3192} {"train_loss": -6.532663345336914, "global_step": 134073, "epoch": 3192} {"train_loss": -6.671223163604736, "global_step": 134074, "epoch": 3192} {"train_loss": -6.652426719665527, "global_step": 134075, "epoch": 3192} {"train_loss": -6.6374664306640625, "global_step": 134076, "epoch": 3192} {"train_loss": -6.737484931945801, "global_step": 134077, "epoch": 3192} {"train_loss": -6.478091239929199, "global_step": 134078, "epoch": 3192} {"train_loss": -6.7717132568359375, "global_step": 134079, "epoch": 3192} {"train_loss": -6.549037933349609, "global_step": 134080, "epoch": 3192} {"train_loss": -6.735873222351074, "global_step": 134081, "epoch": 3192} {"train_loss": -6.697789192199707, "global_step": 134082, "epoch": 3192} {"train_loss": -6.735452651977539, "global_step": 134083, "epoch": 3192} {"train_loss": -6.7469258308410645, "global_step": 134084, "epoch": 3192} {"train_loss": -6.545336723327637, "global_step": 134085, "epoch": 3192} {"train_loss": -6.733664512634277, "global_step": 134086, "epoch": 3192} {"train_loss": -6.692196369171143, "global_step": 134087, "epoch": 3192} {"train_loss": -6.640020370483398, "global_step": 134088, "epoch": 3192} {"train_loss": -6.71811580657959, "global_step": 134089, "epoch": 3192} {"train_loss": -6.693695068359375, "global_step": 134090, "epoch": 3192} {"train_loss": -6.5674238204956055, "global_step": 134091, "epoch": 3192} {"train_loss": -6.698578834533691, "global_step": 134092, "epoch": 3192} {"train_loss": -6.5413641929626465, "global_step": 134093, "epoch": 3192} {"train_loss": -6.711702346801758, "global_step": 134094, "epoch": 3192} {"train_loss": -6.653298377990723, "global_step": 134095, "epoch": 3192} {"train_loss": -6.723340034484863, "global_step": 134096, "epoch": 3192} {"train_loss": -6.707302570343018, "global_step": 134097, "epoch": 3192} {"train_loss": -6.616318702697754, "global_step": 134098, "epoch": 3192} {"train_loss": -6.730228900909424, "global_step": 134099, "epoch": 3192} {"train_loss": -6.743191719055176, "global_step": 134100, "epoch": 3192} {"train_loss": -6.766729354858398, "global_step": 134101, "epoch": 3192} {"train_loss": -6.7368574142456055, "global_step": 134102, "epoch": 3192} {"train_loss": -6.641724586486816, "global_step": 134103, "epoch": 3192} {"train_loss": -6.6982574462890625, "global_step": 134104, "epoch": 3192} {"train_loss": -6.669485364641462, "global_step": 134105, "epoch": 3192, "val_loss": 77948.0} {"train_loss": -6.654061317443848, "global_step": 134106, "epoch": 3193} {"train_loss": -6.72341251373291, "global_step": 134107, "epoch": 3193} {"train_loss": -6.702613353729248, "global_step": 134108, "epoch": 3193} {"train_loss": -6.7112274169921875, "global_step": 134109, "epoch": 3193} {"train_loss": -6.729805946350098, "global_step": 134110, "epoch": 3193} {"train_loss": -6.735262870788574, "global_step": 134111, "epoch": 3193} {"train_loss": -6.648124694824219, "global_step": 134112, "epoch": 3193} {"train_loss": -6.803626537322998, "global_step": 134113, "epoch": 3193} {"train_loss": -6.761369705200195, "global_step": 134114, "epoch": 3193} {"train_loss": -6.8245649337768555, "global_step": 134115, "epoch": 3193} {"train_loss": -6.671883583068848, "global_step": 134116, "epoch": 3193} {"train_loss": -6.763286113739014, "global_step": 134117, "epoch": 3193} {"train_loss": -6.697701454162598, "global_step": 134118, "epoch": 3193} {"train_loss": -6.640552520751953, "global_step": 134119, "epoch": 3193} {"train_loss": -6.7930803298950195, "global_step": 134120, "epoch": 3193} {"train_loss": -6.645926475524902, "global_step": 134121, "epoch": 3193} {"train_loss": -6.743239402770996, "global_step": 134122, "epoch": 3193} {"train_loss": -6.681203842163086, "global_step": 134123, "epoch": 3193} {"train_loss": -6.712759017944336, "global_step": 134124, "epoch": 3193} {"train_loss": -6.714626789093018, "global_step": 134125, "epoch": 3193} {"train_loss": -6.576391696929932, "global_step": 134126, "epoch": 3193} {"train_loss": -6.751843452453613, "global_step": 134127, "epoch": 3193} {"train_loss": -6.829067230224609, "global_step": 134128, "epoch": 3193} {"train_loss": -6.785665988922119, "global_step": 134129, "epoch": 3193} {"train_loss": -6.701650142669678, "global_step": 134130, "epoch": 3193} {"train_loss": -6.7299041748046875, "global_step": 134131, "epoch": 3193} {"train_loss": -6.632428169250488, "global_step": 134132, "epoch": 3193} {"train_loss": -6.743142604827881, "global_step": 134133, "epoch": 3193} {"train_loss": -6.665782928466797, "global_step": 134134, "epoch": 3193} {"train_loss": -6.598470687866211, "global_step": 134135, "epoch": 3193} {"train_loss": -6.688910007476807, "global_step": 134136, "epoch": 3193} {"train_loss": -6.6749677658081055, "global_step": 134137, "epoch": 3193} {"train_loss": -6.6638288497924805, "global_step": 134138, "epoch": 3193} {"train_loss": -6.741180896759033, "global_step": 134139, "epoch": 3193} {"train_loss": -6.763927459716797, "global_step": 134140, "epoch": 3193} {"train_loss": -6.619820594787598, "global_step": 134141, "epoch": 3193} {"train_loss": -6.769712448120117, "global_step": 134142, "epoch": 3193} {"train_loss": -6.821121692657471, "global_step": 134143, "epoch": 3193} {"train_loss": -6.773552417755127, "global_step": 134144, "epoch": 3193} {"train_loss": -6.63215446472168, "global_step": 134145, "epoch": 3193} {"train_loss": -6.799063205718994, "global_step": 134146, "epoch": 3193} {"train_loss": -6.713214567729405, "global_step": 134147, "epoch": 3193, "val_loss": 77669.921875} {"train_loss": -6.725590705871582, "global_step": 134148, "epoch": 3194} {"train_loss": -6.782657623291016, "global_step": 134149, "epoch": 3194} {"train_loss": -6.792618751525879, "global_step": 134150, "epoch": 3194} {"train_loss": -6.632963180541992, "global_step": 134151, "epoch": 3194} {"train_loss": -6.646286964416504, "global_step": 134152, "epoch": 3194} {"train_loss": -6.819025039672852, "global_step": 134153, "epoch": 3194} {"train_loss": -6.677864074707031, "global_step": 134154, "epoch": 3194} {"train_loss": -6.7112579345703125, "global_step": 134155, "epoch": 3194} {"train_loss": -6.830619812011719, "global_step": 134156, "epoch": 3194} {"train_loss": -6.568147659301758, "global_step": 134157, "epoch": 3194} {"train_loss": -6.6052141189575195, "global_step": 134158, "epoch": 3194} {"train_loss": -6.680089473724365, "global_step": 134159, "epoch": 3194} {"train_loss": -6.658656120300293, "global_step": 134160, "epoch": 3194} {"train_loss": -6.722103595733643, "global_step": 134161, "epoch": 3194} {"train_loss": -6.692266464233398, "global_step": 134162, "epoch": 3194} {"train_loss": -6.647851467132568, "global_step": 134163, "epoch": 3194} {"train_loss": -6.699253082275391, "global_step": 134164, "epoch": 3194} {"train_loss": -6.790194034576416, "global_step": 134165, "epoch": 3194} {"train_loss": -6.722652435302734, "global_step": 134166, "epoch": 3194} {"train_loss": -6.561355113983154, "global_step": 134167, "epoch": 3194} {"train_loss": -6.76112174987793, "global_step": 134168, "epoch": 3194} {"train_loss": -6.784161567687988, "global_step": 134169, "epoch": 3194} {"train_loss": -6.814846515655518, "global_step": 134170, "epoch": 3194} {"train_loss": -6.754554748535156, "global_step": 134171, "epoch": 3194} {"train_loss": -6.825304985046387, "global_step": 134172, "epoch": 3194} {"train_loss": -6.687736988067627, "global_step": 134173, "epoch": 3194} {"train_loss": -6.58311653137207, "global_step": 134174, "epoch": 3194} {"train_loss": -6.753742694854736, "global_step": 134175, "epoch": 3194} {"train_loss": -6.704230308532715, "global_step": 134176, "epoch": 3194} {"train_loss": -6.86027193069458, "global_step": 134177, "epoch": 3194} {"train_loss": -6.633095741271973, "global_step": 134178, "epoch": 3194} {"train_loss": -6.772603511810303, "global_step": 134179, "epoch": 3194} {"train_loss": -6.732030391693115, "global_step": 134180, "epoch": 3194} {"train_loss": -6.701053142547607, "global_step": 134181, "epoch": 3194} {"train_loss": -6.689146995544434, "global_step": 134182, "epoch": 3194} {"train_loss": -6.745195388793945, "global_step": 134183, "epoch": 3194} {"train_loss": -6.610461711883545, "global_step": 134184, "epoch": 3194} {"train_loss": -6.757102966308594, "global_step": 134185, "epoch": 3194} {"train_loss": -6.624610424041748, "global_step": 134186, "epoch": 3194} {"train_loss": -6.815620422363281, "global_step": 134187, "epoch": 3194} {"train_loss": -6.693081855773926, "global_step": 134188, "epoch": 3194} {"train_loss": -6.714677844728742, "global_step": 134189, "epoch": 3194, "val_loss": 77651.0625} {"train_loss": -6.7088823318481445, "global_step": 134190, "epoch": 3195} {"train_loss": -6.741896152496338, "global_step": 134191, "epoch": 3195} {"train_loss": -6.699818134307861, "global_step": 134192, "epoch": 3195} {"train_loss": -6.756542205810547, "global_step": 134193, "epoch": 3195} {"train_loss": -6.832703113555908, "global_step": 134194, "epoch": 3195} {"train_loss": -6.767541885375977, "global_step": 134195, "epoch": 3195} {"train_loss": -6.666152000427246, "global_step": 134196, "epoch": 3195} {"train_loss": -6.725142955780029, "global_step": 134197, "epoch": 3195} {"train_loss": -6.6841583251953125, "global_step": 134198, "epoch": 3195} {"train_loss": -6.7527265548706055, "global_step": 134199, "epoch": 3195} {"train_loss": -6.767952919006348, "global_step": 134200, "epoch": 3195} {"train_loss": -6.598391532897949, "global_step": 134201, "epoch": 3195} {"train_loss": -6.739957332611084, "global_step": 134202, "epoch": 3195} {"train_loss": -6.752628803253174, "global_step": 134203, "epoch": 3195} {"train_loss": -6.782550811767578, "global_step": 134204, "epoch": 3195} {"train_loss": -6.868683815002441, "global_step": 134205, "epoch": 3195} {"train_loss": -6.781416893005371, "global_step": 134206, "epoch": 3195} {"train_loss": -6.713868141174316, "global_step": 134207, "epoch": 3195} {"train_loss": -6.6992411613464355, "global_step": 134208, "epoch": 3195} {"train_loss": -6.724966049194336, "global_step": 134209, "epoch": 3195} {"train_loss": -6.729073524475098, "global_step": 134210, "epoch": 3195} {"train_loss": -6.85208797454834, "global_step": 134211, "epoch": 3195} {"train_loss": -6.813239097595215, "global_step": 134212, "epoch": 3195} {"train_loss": -6.722041130065918, "global_step": 134213, "epoch": 3195} {"train_loss": -6.789557456970215, "global_step": 134214, "epoch": 3195} {"train_loss": -6.686784267425537, "global_step": 134215, "epoch": 3195} {"train_loss": -6.761542320251465, "global_step": 134216, "epoch": 3195} {"train_loss": -6.892820358276367, "global_step": 134217, "epoch": 3195} {"train_loss": -6.762131690979004, "global_step": 134218, "epoch": 3195} {"train_loss": -6.705068588256836, "global_step": 134219, "epoch": 3195} {"train_loss": -6.7107038497924805, "global_step": 134220, "epoch": 3195} {"train_loss": -6.808036804199219, "global_step": 134221, "epoch": 3195} {"train_loss": -6.666507720947266, "global_step": 134222, "epoch": 3195} {"train_loss": -6.8290629386901855, "global_step": 134223, "epoch": 3195} {"train_loss": -6.805343151092529, "global_step": 134224, "epoch": 3195} {"train_loss": -6.812588691711426, "global_step": 134225, "epoch": 3195} {"train_loss": -6.873788833618164, "global_step": 134226, "epoch": 3195} {"train_loss": -6.63735818862915, "global_step": 134227, "epoch": 3195} {"train_loss": -6.765950679779053, "global_step": 134228, "epoch": 3195} {"train_loss": -6.773180961608887, "global_step": 134229, "epoch": 3195} {"train_loss": -6.719521522521973, "global_step": 134230, "epoch": 3195} {"train_loss": -6.753280026572091, "global_step": 134231, "epoch": 3195, "val_loss": 77739.3515625} {"train_loss": -6.755017280578613, "global_step": 134232, "epoch": 3196} {"train_loss": -6.759845733642578, "global_step": 134233, "epoch": 3196} {"train_loss": -6.7018256187438965, "global_step": 134234, "epoch": 3196} {"train_loss": -6.678921699523926, "global_step": 134235, "epoch": 3196} {"train_loss": -6.802029609680176, "global_step": 134236, "epoch": 3196} {"train_loss": -6.681958198547363, "global_step": 134237, "epoch": 3196} {"train_loss": -6.752155303955078, "global_step": 134238, "epoch": 3196} {"train_loss": -6.759579658508301, "global_step": 134239, "epoch": 3196} {"train_loss": -6.729132652282715, "global_step": 134240, "epoch": 3196} {"train_loss": -6.837198257446289, "global_step": 134241, "epoch": 3196} {"train_loss": -6.805381774902344, "global_step": 134242, "epoch": 3196} {"train_loss": -6.749478340148926, "global_step": 134243, "epoch": 3196} {"train_loss": -6.783674240112305, "global_step": 134244, "epoch": 3196} {"train_loss": -6.747736930847168, "global_step": 134245, "epoch": 3196} {"train_loss": -6.810365200042725, "global_step": 134246, "epoch": 3196} {"train_loss": -6.803769111633301, "global_step": 134247, "epoch": 3196} {"train_loss": -6.673427581787109, "global_step": 134248, "epoch": 3196} {"train_loss": -6.693665504455566, "global_step": 134249, "epoch": 3196} {"train_loss": -6.552939414978027, "global_step": 134250, "epoch": 3196} {"train_loss": -6.7512125968933105, "global_step": 134251, "epoch": 3196} {"train_loss": -6.7988457679748535, "global_step": 134252, "epoch": 3196} {"train_loss": -6.813220977783203, "global_step": 134253, "epoch": 3196} {"train_loss": -6.771129608154297, "global_step": 134254, "epoch": 3196} {"train_loss": -6.735878944396973, "global_step": 134255, "epoch": 3196} {"train_loss": -6.758769512176514, "global_step": 134256, "epoch": 3196} {"train_loss": -6.62867546081543, "global_step": 134257, "epoch": 3196} {"train_loss": -6.573707580566406, "global_step": 134258, "epoch": 3196} {"train_loss": -6.730835914611816, "global_step": 134259, "epoch": 3196} {"train_loss": -6.691633224487305, "global_step": 134260, "epoch": 3196} {"train_loss": -6.564053058624268, "global_step": 134261, "epoch": 3196} {"train_loss": -6.5905303955078125, "global_step": 134262, "epoch": 3196} {"train_loss": -6.778683662414551, "global_step": 134263, "epoch": 3196} {"train_loss": -6.621684551239014, "global_step": 134264, "epoch": 3196} {"train_loss": -6.668812274932861, "global_step": 134265, "epoch": 3196} {"train_loss": -6.73119592666626, "global_step": 134266, "epoch": 3196} {"train_loss": -6.609699249267578, "global_step": 134267, "epoch": 3196} {"train_loss": -6.772618770599365, "global_step": 134268, "epoch": 3196} {"train_loss": -6.588811874389648, "global_step": 134269, "epoch": 3196} {"train_loss": -6.717449188232422, "global_step": 134270, "epoch": 3196} {"train_loss": -6.708488464355469, "global_step": 134271, "epoch": 3196} {"train_loss": -6.772927284240723, "global_step": 134272, "epoch": 3196} {"train_loss": -6.721818946656727, "global_step": 134273, "epoch": 3196, "val_loss": 77535.65625} {"train_loss": -6.625160217285156, "global_step": 134274, "epoch": 3197} {"train_loss": -6.582128524780273, "global_step": 134275, "epoch": 3197} {"train_loss": -6.693564414978027, "global_step": 134276, "epoch": 3197} {"train_loss": -6.582833766937256, "global_step": 134277, "epoch": 3197} {"train_loss": -6.805661201477051, "global_step": 134278, "epoch": 3197} {"train_loss": -6.796408653259277, "global_step": 134279, "epoch": 3197} {"train_loss": -6.771913528442383, "global_step": 134280, "epoch": 3197} {"train_loss": -6.614955902099609, "global_step": 134281, "epoch": 3197} {"train_loss": -6.833004951477051, "global_step": 134282, "epoch": 3197} {"train_loss": -6.705994606018066, "global_step": 134283, "epoch": 3197} {"train_loss": -6.716753959655762, "global_step": 134284, "epoch": 3197} {"train_loss": -6.734737873077393, "global_step": 134285, "epoch": 3197} {"train_loss": -6.731911659240723, "global_step": 134286, "epoch": 3197} {"train_loss": -6.766208648681641, "global_step": 134287, "epoch": 3197} {"train_loss": -6.727047920227051, "global_step": 134288, "epoch": 3197} {"train_loss": -6.721991539001465, "global_step": 134289, "epoch": 3197} {"train_loss": -6.571225166320801, "global_step": 134290, "epoch": 3197} {"train_loss": -6.6218414306640625, "global_step": 134291, "epoch": 3197} {"train_loss": -6.686421871185303, "global_step": 134292, "epoch": 3197} {"train_loss": -6.666121482849121, "global_step": 134293, "epoch": 3197} {"train_loss": -6.610904693603516, "global_step": 134294, "epoch": 3197} {"train_loss": -6.6747026443481445, "global_step": 134295, "epoch": 3197} {"train_loss": -6.773501396179199, "global_step": 134296, "epoch": 3197} {"train_loss": -6.612466812133789, "global_step": 134297, "epoch": 3197} {"train_loss": -6.714752674102783, "global_step": 134298, "epoch": 3197} {"train_loss": -6.631283760070801, "global_step": 134299, "epoch": 3197} {"train_loss": -6.764781951904297, "global_step": 134300, "epoch": 3197} {"train_loss": -6.632694244384766, "global_step": 134301, "epoch": 3197} {"train_loss": -6.697479248046875, "global_step": 134302, "epoch": 3197} {"train_loss": -6.718345642089844, "global_step": 134303, "epoch": 3197} {"train_loss": -6.75189208984375, "global_step": 134304, "epoch": 3197} {"train_loss": -6.613504409790039, "global_step": 134305, "epoch": 3197} {"train_loss": -6.6448469161987305, "global_step": 134306, "epoch": 3197} {"train_loss": -6.678025245666504, "global_step": 134307, "epoch": 3197} {"train_loss": -6.843138694763184, "global_step": 134308, "epoch": 3197} {"train_loss": -6.778108596801758, "global_step": 134309, "epoch": 3197} {"train_loss": -6.835268020629883, "global_step": 134310, "epoch": 3197} {"train_loss": -6.562229156494141, "global_step": 134311, "epoch": 3197} {"train_loss": -6.735487937927246, "global_step": 134312, "epoch": 3197} {"train_loss": -6.746908187866211, "global_step": 134313, "epoch": 3197} {"train_loss": -6.73141622543335, "global_step": 134314, "epoch": 3197} {"train_loss": -6.700682095118931, "global_step": 134315, "epoch": 3197, "val_loss": 77663.5234375} {"train_loss": -6.713931083679199, "global_step": 134316, "epoch": 3198} {"train_loss": -6.827727794647217, "global_step": 134317, "epoch": 3198} {"train_loss": -6.7905120849609375, "global_step": 134318, "epoch": 3198} {"train_loss": -6.716036319732666, "global_step": 134319, "epoch": 3198} {"train_loss": -6.793587684631348, "global_step": 134320, "epoch": 3198} {"train_loss": -6.836631774902344, "global_step": 134321, "epoch": 3198} {"train_loss": -6.763494491577148, "global_step": 134322, "epoch": 3198} {"train_loss": -6.686844348907471, "global_step": 134323, "epoch": 3198} {"train_loss": -6.686075687408447, "global_step": 134324, "epoch": 3198} {"train_loss": -6.772650718688965, "global_step": 134325, "epoch": 3198} {"train_loss": -6.762063980102539, "global_step": 134326, "epoch": 3198} {"train_loss": -6.700362205505371, "global_step": 134327, "epoch": 3198} {"train_loss": -6.761570453643799, "global_step": 134328, "epoch": 3198} {"train_loss": -6.6861443519592285, "global_step": 134329, "epoch": 3198} {"train_loss": -6.555915832519531, "global_step": 134330, "epoch": 3198} {"train_loss": -6.656744003295898, "global_step": 134331, "epoch": 3198} {"train_loss": -6.596715927124023, "global_step": 134332, "epoch": 3198} {"train_loss": -6.756139755249023, "global_step": 134333, "epoch": 3198} {"train_loss": -6.659017562866211, "global_step": 134334, "epoch": 3198} {"train_loss": -6.604523181915283, "global_step": 134335, "epoch": 3198} {"train_loss": -6.624653339385986, "global_step": 134336, "epoch": 3198} {"train_loss": -6.787610054016113, "global_step": 134337, "epoch": 3198} {"train_loss": -6.672152996063232, "global_step": 134338, "epoch": 3198} {"train_loss": -6.619442939758301, "global_step": 134339, "epoch": 3198} {"train_loss": -6.679783821105957, "global_step": 134340, "epoch": 3198} {"train_loss": -6.8054423332214355, "global_step": 134341, "epoch": 3198} {"train_loss": -6.569891929626465, "global_step": 134342, "epoch": 3198} {"train_loss": -6.698240756988525, "global_step": 134343, "epoch": 3198} {"train_loss": -6.478265762329102, "global_step": 134344, "epoch": 3198} {"train_loss": -6.718426704406738, "global_step": 134345, "epoch": 3198} {"train_loss": -6.719322204589844, "global_step": 134346, "epoch": 3198} {"train_loss": -6.750002861022949, "global_step": 134347, "epoch": 3198} {"train_loss": -6.64744234085083, "global_step": 134348, "epoch": 3198} {"train_loss": -6.706159591674805, "global_step": 134349, "epoch": 3198} {"train_loss": -6.665766716003418, "global_step": 134350, "epoch": 3198} {"train_loss": -6.591161727905273, "global_step": 134351, "epoch": 3198} {"train_loss": -6.717782020568848, "global_step": 134352, "epoch": 3198} {"train_loss": -6.642934322357178, "global_step": 134353, "epoch": 3198} {"train_loss": -6.713594436645508, "global_step": 134354, "epoch": 3198} {"train_loss": -6.68924617767334, "global_step": 134355, "epoch": 3198} {"train_loss": -6.68764591217041, "global_step": 134356, "epoch": 3198} {"train_loss": -6.696827547890799, "global_step": 134357, "epoch": 3198, "val_loss": 77886.28125} {"train_loss": -6.70747184753418, "global_step": 134358, "epoch": 3199} {"train_loss": -6.656951904296875, "global_step": 134359, "epoch": 3199} {"train_loss": -6.852122783660889, "global_step": 134360, "epoch": 3199} {"train_loss": -6.755667686462402, "global_step": 134361, "epoch": 3199} {"train_loss": -6.728399276733398, "global_step": 134362, "epoch": 3199} {"train_loss": -6.784732818603516, "global_step": 134363, "epoch": 3199} {"train_loss": -6.6862006187438965, "global_step": 134364, "epoch": 3199} {"train_loss": -6.8077921867370605, "global_step": 134365, "epoch": 3199} {"train_loss": -6.687200546264648, "global_step": 134366, "epoch": 3199} {"train_loss": -6.815633296966553, "global_step": 134367, "epoch": 3199} {"train_loss": -6.693980693817139, "global_step": 134368, "epoch": 3199} {"train_loss": -6.775367259979248, "global_step": 134369, "epoch": 3199} {"train_loss": -6.864293098449707, "global_step": 134370, "epoch": 3199} {"train_loss": -6.763718605041504, "global_step": 134371, "epoch": 3199} {"train_loss": -6.619390487670898, "global_step": 134372, "epoch": 3199} {"train_loss": -6.672510623931885, "global_step": 134373, "epoch": 3199} {"train_loss": -6.829606056213379, "global_step": 134374, "epoch": 3199} {"train_loss": -6.763917922973633, "global_step": 134375, "epoch": 3199} {"train_loss": -6.7379961013793945, "global_step": 134376, "epoch": 3199} {"train_loss": -6.7884321212768555, "global_step": 134377, "epoch": 3199} {"train_loss": -6.7025299072265625, "global_step": 134378, "epoch": 3199} {"train_loss": -6.717508316040039, "global_step": 134379, "epoch": 3199} {"train_loss": -6.718097686767578, "global_step": 134380, "epoch": 3199} {"train_loss": -6.734997749328613, "global_step": 134381, "epoch": 3199} {"train_loss": -6.798219203948975, "global_step": 134382, "epoch": 3199} {"train_loss": -6.811578750610352, "global_step": 134383, "epoch": 3199} {"train_loss": -6.702960014343262, "global_step": 134384, "epoch": 3199} {"train_loss": -6.832007884979248, "global_step": 134385, "epoch": 3199} {"train_loss": -6.768422603607178, "global_step": 134386, "epoch": 3199} {"train_loss": -6.756855010986328, "global_step": 134387, "epoch": 3199} {"train_loss": -6.763853073120117, "global_step": 134388, "epoch": 3199} {"train_loss": -6.818786144256592, "global_step": 134389, "epoch": 3199} {"train_loss": -6.808881759643555, "global_step": 134390, "epoch": 3199} {"train_loss": -6.647579669952393, "global_step": 134391, "epoch": 3199} {"train_loss": -6.694580078125, "global_step": 134392, "epoch": 3199} {"train_loss": -6.759743690490723, "global_step": 134393, "epoch": 3199} {"train_loss": -6.790532112121582, "global_step": 134394, "epoch": 3199} {"train_loss": -6.771359443664551, "global_step": 134395, "epoch": 3199} {"train_loss": -6.7490129470825195, "global_step": 134396, "epoch": 3199} {"train_loss": -6.817699432373047, "global_step": 134397, "epoch": 3199} {"train_loss": -6.769054889678955, "global_step": 134398, "epoch": 3199} {"train_loss": -6.755641630717686, "global_step": 134399, "epoch": 3199, "val_loss": 77528.21875} {"train_loss": -6.625791549682617, "global_step": 134400, "epoch": 3200} {"train_loss": -6.933760166168213, "global_step": 134401, "epoch": 3200} {"train_loss": -6.731289386749268, "global_step": 134402, "epoch": 3200} {"train_loss": -6.777414321899414, "global_step": 134403, "epoch": 3200} {"train_loss": -6.813243865966797, "global_step": 134404, "epoch": 3200} {"train_loss": -6.76804256439209, "global_step": 134405, "epoch": 3200} {"train_loss": -6.738394260406494, "global_step": 134406, "epoch": 3200} {"train_loss": -6.788693904876709, "global_step": 134407, "epoch": 3200} {"train_loss": -6.787790298461914, "global_step": 134408, "epoch": 3200} {"train_loss": -6.763393878936768, "global_step": 134409, "epoch": 3200} {"train_loss": -6.786928653717041, "global_step": 134410, "epoch": 3200} {"train_loss": -6.797754287719727, "global_step": 134411, "epoch": 3200} {"train_loss": -6.721078872680664, "global_step": 134412, "epoch": 3200} {"train_loss": -6.690202713012695, "global_step": 134413, "epoch": 3200} {"train_loss": -6.782886505126953, "global_step": 134414, "epoch": 3200} {"train_loss": -6.727825164794922, "global_step": 134415, "epoch": 3200} {"train_loss": -6.818889617919922, "global_step": 134416, "epoch": 3200} {"train_loss": -6.732980728149414, "global_step": 134417, "epoch": 3200} {"train_loss": -6.765772819519043, "global_step": 134418, "epoch": 3200} {"train_loss": -6.7544474601745605, "global_step": 134419, "epoch": 3200} {"train_loss": -6.721345901489258, "global_step": 134420, "epoch": 3200} {"train_loss": -6.733510494232178, "global_step": 134421, "epoch": 3200} {"train_loss": -6.7393107414245605, "global_step": 134422, "epoch": 3200} {"train_loss": -6.657068729400635, "global_step": 134423, "epoch": 3200} {"train_loss": -6.664822101593018, "global_step": 134424, "epoch": 3200} {"train_loss": -6.75946044921875, "global_step": 134425, "epoch": 3200} {"train_loss": -6.816411972045898, "global_step": 134426, "epoch": 3200} {"train_loss": -6.6556901931762695, "global_step": 134427, "epoch": 3200} {"train_loss": -6.711430072784424, "global_step": 134428, "epoch": 3200} {"train_loss": -6.644749641418457, "global_step": 134429, "epoch": 3200} {"train_loss": -6.678135871887207, "global_step": 134430, "epoch": 3200} {"train_loss": -6.761005878448486, "global_step": 134431, "epoch": 3200} {"train_loss": -6.66480827331543, "global_step": 134432, "epoch": 3200} {"train_loss": -6.79123592376709, "global_step": 134433, "epoch": 3200} {"train_loss": -6.774421691894531, "global_step": 134434, "epoch": 3200} {"train_loss": -6.722767353057861, "global_step": 134435, "epoch": 3200} {"train_loss": -6.645476818084717, "global_step": 134436, "epoch": 3200} {"train_loss": -6.773839473724365, "global_step": 134437, "epoch": 3200} {"train_loss": -6.680981636047363, "global_step": 134438, "epoch": 3200} {"train_loss": -6.803434371948242, "global_step": 134439, "epoch": 3200} {"train_loss": -6.742469787597656, "global_step": 134440, "epoch": 3200} {"train_loss": -6.742800440107073, "global_step": 134441, "epoch": 3200, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 0.8804711871277354, "train/sim_max_reward_2": 0.5612179280993479, "train/sim_max_reward_3": 0.1475741331102797, "train/sim_max_reward_4": 0.24899108653302982, "train/sim_max_reward_5": 0.8106525296908091, "test/sim_max_reward_4500000": 0.9342817345428517, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8302707864491303, "test/sim_max_reward_4500003": 0.9608280742867659, "test/sim_max_reward_4500004": 0.2455907317718481, "test/sim_max_reward_4500005": 0.9226058921593198, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.8517950101475393, "test/sim_max_reward_4500008": 0.8989542994278008, "test/sim_max_reward_4500009": 0.053479768125535045, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9916245209879283, "test/sim_max_reward_4500012": 0.8244734020965134, "test/sim_max_reward_4500013": 0.008414508586346427, "test/sim_max_reward_4500014": 0.8143070932569398, "test/sim_max_reward_4500015": 0.7941357163452415, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.13657137962032612, "test/sim_max_reward_4500018": 0.4158750106179756, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.770396143191396, "test/sim_max_reward_4500022": 0.9676663865607489, "test/sim_max_reward_4500023": 0.8883339922233668, "test/sim_max_reward_4500024": 0.9938656143546541, "test/sim_max_reward_4500025": 0.8901771672030094, "test/sim_max_reward_4500026": 1.0, "test/sim_max_reward_4500027": 0.9020605991035298, "test/sim_max_reward_4500028": 0.1887070561044036, "test/sim_max_reward_4500029": 0.08080518882733247, "test/sim_max_reward_4500030": 0.9146606141043612, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.05212487674350988, "test/sim_max_reward_4500033": 0.8405422546964746, "test/sim_max_reward_4500034": 0.9285418214441056, "test/sim_max_reward_4500035": 0.7774328900789882, "test/sim_max_reward_4500036": 1.0, "test/sim_max_reward_4500037": 0.5001849146839211, "test/sim_max_reward_4500038": 0.32640751749071506, "test/sim_max_reward_4500039": 0.8879275670017169, "test/sim_max_reward_4500040": 0.9010132407784194, "test/sim_max_reward_4500041": 0.988939819352462, "test/sim_max_reward_4500042": 0.31812228525736547, "test/sim_max_reward_4500043": 0.9689426637997283, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.8894737063410202, "test/sim_max_reward_4500046": 0.9365125604132408, "test/sim_max_reward_4500047": 0.9239446850026255, "test/sim_max_reward_4500048": 0.9693047806783182, "test/sim_max_reward_4500049": 0.029404662524464505, "train/mean_score": 0.6081511440935337, "test/mean_score": 0.6186242544375837, "val_loss": 77711.671875} {"train_loss": -6.7122931480407715, "global_step": 134442, "epoch": 3201} {"train_loss": -6.87653923034668, "global_step": 134443, "epoch": 3201} {"train_loss": -6.694151401519775, "global_step": 134444, "epoch": 3201} {"train_loss": -6.6342034339904785, "global_step": 134445, "epoch": 3201} {"train_loss": -6.827783584594727, "global_step": 134446, "epoch": 3201} {"train_loss": -6.694863319396973, "global_step": 134447, "epoch": 3201} {"train_loss": -6.675330638885498, "global_step": 134448, "epoch": 3201} {"train_loss": -6.713372230529785, "global_step": 134449, "epoch": 3201} {"train_loss": -6.56522798538208, "global_step": 134450, "epoch": 3201} {"train_loss": -6.637702465057373, "global_step": 134451, "epoch": 3201} {"train_loss": -6.654706001281738, "global_step": 134452, "epoch": 3201} {"train_loss": -6.701602458953857, "global_step": 134453, "epoch": 3201} {"train_loss": -6.691189765930176, "global_step": 134454, "epoch": 3201} {"train_loss": -6.801295280456543, "global_step": 134455, "epoch": 3201} {"train_loss": -6.633923053741455, "global_step": 134456, "epoch": 3201} {"train_loss": -6.671131134033203, "global_step": 134457, "epoch": 3201} {"train_loss": -6.743838310241699, "global_step": 134458, "epoch": 3201} {"train_loss": -6.695732116699219, "global_step": 134459, "epoch": 3201} {"train_loss": -6.6746745109558105, "global_step": 134460, "epoch": 3201} {"train_loss": -6.730654239654541, "global_step": 134461, "epoch": 3201} {"train_loss": -6.70203971862793, "global_step": 134462, "epoch": 3201} {"train_loss": -6.79511022567749, "global_step": 134463, "epoch": 3201} {"train_loss": -6.657566070556641, "global_step": 134464, "epoch": 3201} {"train_loss": -6.595120429992676, "global_step": 134465, "epoch": 3201} {"train_loss": -6.692071914672852, "global_step": 134466, "epoch": 3201} {"train_loss": -6.600342273712158, "global_step": 134467, "epoch": 3201} {"train_loss": -6.738638401031494, "global_step": 134468, "epoch": 3201} {"train_loss": -6.643606185913086, "global_step": 134469, "epoch": 3201} {"train_loss": -6.772333145141602, "global_step": 134470, "epoch": 3201} {"train_loss": -6.657688140869141, "global_step": 134471, "epoch": 3201} {"train_loss": -6.656153202056885, "global_step": 134472, "epoch": 3201} {"train_loss": -6.624400615692139, "global_step": 134473, "epoch": 3201} {"train_loss": -6.656538963317871, "global_step": 134474, "epoch": 3201} {"train_loss": -6.655857086181641, "global_step": 134475, "epoch": 3201} {"train_loss": -6.589930534362793, "global_step": 134476, "epoch": 3201} {"train_loss": -6.707135200500488, "global_step": 134477, "epoch": 3201} {"train_loss": -6.670113563537598, "global_step": 134478, "epoch": 3201} {"train_loss": -6.682847023010254, "global_step": 134479, "epoch": 3201} {"train_loss": -6.717403888702393, "global_step": 134480, "epoch": 3201} {"train_loss": -6.6510467529296875, "global_step": 134481, "epoch": 3201} {"train_loss": -6.675543785095215, "global_step": 134482, "epoch": 3201} {"train_loss": -6.686036019098191, "global_step": 134483, "epoch": 3201, "val_loss": 77559.1328125} {"train_loss": -6.7465996742248535, "global_step": 134484, "epoch": 3202} {"train_loss": -6.798362731933594, "global_step": 134485, "epoch": 3202} {"train_loss": -6.768166542053223, "global_step": 134486, "epoch": 3202} {"train_loss": -6.774720668792725, "global_step": 134487, "epoch": 3202} {"train_loss": -6.679718017578125, "global_step": 134488, "epoch": 3202} {"train_loss": -6.7753705978393555, "global_step": 134489, "epoch": 3202} {"train_loss": -6.685691833496094, "global_step": 134490, "epoch": 3202} {"train_loss": -6.74566125869751, "global_step": 134491, "epoch": 3202} {"train_loss": -6.763423442840576, "global_step": 134492, "epoch": 3202} {"train_loss": -6.761647701263428, "global_step": 134493, "epoch": 3202} {"train_loss": -6.818890571594238, "global_step": 134494, "epoch": 3202} {"train_loss": -6.7351837158203125, "global_step": 134495, "epoch": 3202} {"train_loss": -6.804133415222168, "global_step": 134496, "epoch": 3202} {"train_loss": -6.8003668785095215, "global_step": 134497, "epoch": 3202} {"train_loss": -6.73587703704834, "global_step": 134498, "epoch": 3202} {"train_loss": -6.649477005004883, "global_step": 134499, "epoch": 3202} {"train_loss": -6.638943672180176, "global_step": 134500, "epoch": 3202} {"train_loss": -6.7710700035095215, "global_step": 134501, "epoch": 3202} {"train_loss": -6.752350807189941, "global_step": 134502, "epoch": 3202} {"train_loss": -6.785556793212891, "global_step": 134503, "epoch": 3202} {"train_loss": -6.742205619812012, "global_step": 134504, "epoch": 3202} {"train_loss": -6.657395362854004, "global_step": 134505, "epoch": 3202} {"train_loss": -6.704256057739258, "global_step": 134506, "epoch": 3202} {"train_loss": -6.766477584838867, "global_step": 134507, "epoch": 3202} {"train_loss": -6.640059471130371, "global_step": 134508, "epoch": 3202} {"train_loss": -6.732694625854492, "global_step": 134509, "epoch": 3202} {"train_loss": -6.659391403198242, "global_step": 134510, "epoch": 3202} {"train_loss": -6.752814292907715, "global_step": 134511, "epoch": 3202} {"train_loss": -6.705899238586426, "global_step": 134512, "epoch": 3202} {"train_loss": -6.814589977264404, "global_step": 134513, "epoch": 3202} {"train_loss": -6.669655799865723, "global_step": 134514, "epoch": 3202} {"train_loss": -6.705272674560547, "global_step": 134515, "epoch": 3202} {"train_loss": -6.614066123962402, "global_step": 134516, "epoch": 3202} {"train_loss": -6.806534290313721, "global_step": 134517, "epoch": 3202} {"train_loss": -6.745038032531738, "global_step": 134518, "epoch": 3202} {"train_loss": -6.691040515899658, "global_step": 134519, "epoch": 3202} {"train_loss": -6.683149337768555, "global_step": 134520, "epoch": 3202} {"train_loss": -6.632467269897461, "global_step": 134521, "epoch": 3202} {"train_loss": -6.764156341552734, "global_step": 134522, "epoch": 3202} {"train_loss": -6.720366954803467, "global_step": 134523, "epoch": 3202} {"train_loss": -6.800234317779541, "global_step": 134524, "epoch": 3202} {"train_loss": -6.729417517071679, "global_step": 134525, "epoch": 3202, "val_loss": 77606.5234375} {"train_loss": -6.790630340576172, "global_step": 134526, "epoch": 3203} {"train_loss": -6.693146705627441, "global_step": 134527, "epoch": 3203} {"train_loss": -6.688976764678955, "global_step": 134528, "epoch": 3203} {"train_loss": -6.8036274909973145, "global_step": 134529, "epoch": 3203} {"train_loss": -6.59273624420166, "global_step": 134530, "epoch": 3203} {"train_loss": -6.7972002029418945, "global_step": 134531, "epoch": 3203} {"train_loss": -6.823179244995117, "global_step": 134532, "epoch": 3203} {"train_loss": -6.715987682342529, "global_step": 134533, "epoch": 3203} {"train_loss": -6.567172527313232, "global_step": 134534, "epoch": 3203} {"train_loss": -6.777195453643799, "global_step": 134535, "epoch": 3203} {"train_loss": -6.746607780456543, "global_step": 134536, "epoch": 3203} {"train_loss": -6.634247779846191, "global_step": 134537, "epoch": 3203} {"train_loss": -6.862870216369629, "global_step": 134538, "epoch": 3203} {"train_loss": -6.684120178222656, "global_step": 134539, "epoch": 3203} {"train_loss": -6.670947551727295, "global_step": 134540, "epoch": 3203} {"train_loss": -6.589037895202637, "global_step": 134541, "epoch": 3203} {"train_loss": -6.613827228546143, "global_step": 134542, "epoch": 3203} {"train_loss": -6.5184502601623535, "global_step": 134543, "epoch": 3203} {"train_loss": -6.651395320892334, "global_step": 134544, "epoch": 3203} {"train_loss": -6.554169654846191, "global_step": 134545, "epoch": 3203} {"train_loss": -6.682662010192871, "global_step": 134546, "epoch": 3203} {"train_loss": -6.518360137939453, "global_step": 134547, "epoch": 3203} {"train_loss": -6.741359233856201, "global_step": 134548, "epoch": 3203} {"train_loss": -6.554078102111816, "global_step": 134549, "epoch": 3203} {"train_loss": -6.594484806060791, "global_step": 134550, "epoch": 3203} {"train_loss": -6.479649543762207, "global_step": 134551, "epoch": 3203} {"train_loss": -6.494956016540527, "global_step": 134552, "epoch": 3203} {"train_loss": -6.605624198913574, "global_step": 134553, "epoch": 3203} {"train_loss": -6.680400371551514, "global_step": 134554, "epoch": 3203} {"train_loss": -6.58875846862793, "global_step": 134555, "epoch": 3203} {"train_loss": -6.603495121002197, "global_step": 134556, "epoch": 3203} {"train_loss": -6.586933135986328, "global_step": 134557, "epoch": 3203} {"train_loss": -6.646373748779297, "global_step": 134558, "epoch": 3203} {"train_loss": -6.645846366882324, "global_step": 134559, "epoch": 3203} {"train_loss": -6.723998069763184, "global_step": 134560, "epoch": 3203} {"train_loss": -6.73124361038208, "global_step": 134561, "epoch": 3203} {"train_loss": -6.680095672607422, "global_step": 134562, "epoch": 3203} {"train_loss": -6.76209831237793, "global_step": 134563, "epoch": 3203} {"train_loss": -6.7077531814575195, "global_step": 134564, "epoch": 3203} {"train_loss": -6.5981035232543945, "global_step": 134565, "epoch": 3203} {"train_loss": -6.715672492980957, "global_step": 134566, "epoch": 3203} {"train_loss": -6.66386510076977, "global_step": 134567, "epoch": 3203, "val_loss": 77903.3515625} {"train_loss": -6.724578380584717, "global_step": 134568, "epoch": 3204} {"train_loss": -6.714820861816406, "global_step": 134569, "epoch": 3204} {"train_loss": -6.794947147369385, "global_step": 134570, "epoch": 3204} {"train_loss": -6.653173923492432, "global_step": 134571, "epoch": 3204} {"train_loss": -6.568761825561523, "global_step": 134572, "epoch": 3204} {"train_loss": -6.709300994873047, "global_step": 134573, "epoch": 3204} {"train_loss": -6.786801815032959, "global_step": 134574, "epoch": 3204} {"train_loss": -6.646857261657715, "global_step": 134575, "epoch": 3204} {"train_loss": -6.747117519378662, "global_step": 134576, "epoch": 3204} {"train_loss": -6.582796096801758, "global_step": 134577, "epoch": 3204} {"train_loss": -6.656067848205566, "global_step": 134578, "epoch": 3204} {"train_loss": -6.654560089111328, "global_step": 134579, "epoch": 3204} {"train_loss": -6.715668678283691, "global_step": 134580, "epoch": 3204} {"train_loss": -6.6253814697265625, "global_step": 134581, "epoch": 3204} {"train_loss": -6.72922945022583, "global_step": 134582, "epoch": 3204} {"train_loss": -6.723102569580078, "global_step": 134583, "epoch": 3204} {"train_loss": -6.749528884887695, "global_step": 134584, "epoch": 3204} {"train_loss": -6.772538185119629, "global_step": 134585, "epoch": 3204} {"train_loss": -6.632373809814453, "global_step": 134586, "epoch": 3204} {"train_loss": -6.8375115394592285, "global_step": 134587, "epoch": 3204} {"train_loss": -6.8008551597595215, "global_step": 134588, "epoch": 3204} {"train_loss": -6.636894226074219, "global_step": 134589, "epoch": 3204} {"train_loss": -6.72911262512207, "global_step": 134590, "epoch": 3204} {"train_loss": -6.662604331970215, "global_step": 134591, "epoch": 3204} {"train_loss": -6.574692249298096, "global_step": 134592, "epoch": 3204} {"train_loss": -6.637355804443359, "global_step": 134593, "epoch": 3204} {"train_loss": -6.711577415466309, "global_step": 134594, "epoch": 3204} {"train_loss": -6.677321910858154, "global_step": 134595, "epoch": 3204} {"train_loss": -6.679746627807617, "global_step": 134596, "epoch": 3204} {"train_loss": -6.642595291137695, "global_step": 134597, "epoch": 3204} {"train_loss": -6.64838981628418, "global_step": 134598, "epoch": 3204} {"train_loss": -6.555616855621338, "global_step": 134599, "epoch": 3204} {"train_loss": -6.684676647186279, "global_step": 134600, "epoch": 3204} {"train_loss": -6.609821319580078, "global_step": 134601, "epoch": 3204} {"train_loss": -6.496800899505615, "global_step": 134602, "epoch": 3204} {"train_loss": -6.631781101226807, "global_step": 134603, "epoch": 3204} {"train_loss": -6.589864253997803, "global_step": 134604, "epoch": 3204} {"train_loss": -6.610348701477051, "global_step": 134605, "epoch": 3204} {"train_loss": -6.717462539672852, "global_step": 134606, "epoch": 3204} {"train_loss": -6.705026626586914, "global_step": 134607, "epoch": 3204} {"train_loss": -6.661830425262451, "global_step": 134608, "epoch": 3204} {"train_loss": -6.67590806597755, "global_step": 134609, "epoch": 3204, "val_loss": 77601.6875} {"train_loss": -6.622522830963135, "global_step": 134610, "epoch": 3205} {"train_loss": -6.608083724975586, "global_step": 134611, "epoch": 3205} {"train_loss": -6.595737934112549, "global_step": 134612, "epoch": 3205} {"train_loss": -6.643718719482422, "global_step": 134613, "epoch": 3205} {"train_loss": -6.739675045013428, "global_step": 134614, "epoch": 3205} {"train_loss": -6.7102251052856445, "global_step": 134615, "epoch": 3205} {"train_loss": -6.648430824279785, "global_step": 134616, "epoch": 3205} {"train_loss": -6.704336166381836, "global_step": 134617, "epoch": 3205} {"train_loss": -6.651240825653076, "global_step": 134618, "epoch": 3205} {"train_loss": -6.677231788635254, "global_step": 134619, "epoch": 3205} {"train_loss": -6.750242233276367, "global_step": 134620, "epoch": 3205} {"train_loss": -6.676766395568848, "global_step": 134621, "epoch": 3205} {"train_loss": -6.69560432434082, "global_step": 134622, "epoch": 3205} {"train_loss": -6.655811309814453, "global_step": 134623, "epoch": 3205} {"train_loss": -6.647539138793945, "global_step": 134624, "epoch": 3205} {"train_loss": -6.758357524871826, "global_step": 134625, "epoch": 3205} {"train_loss": -6.766622543334961, "global_step": 134626, "epoch": 3205} {"train_loss": -6.689988136291504, "global_step": 134627, "epoch": 3205} {"train_loss": -6.810034275054932, "global_step": 134628, "epoch": 3205} {"train_loss": -6.691431522369385, "global_step": 134629, "epoch": 3205} {"train_loss": -6.628307819366455, "global_step": 134630, "epoch": 3205} {"train_loss": -6.690907955169678, "global_step": 134631, "epoch": 3205} {"train_loss": -6.686408519744873, "global_step": 134632, "epoch": 3205} {"train_loss": -6.471942901611328, "global_step": 134633, "epoch": 3205} {"train_loss": -6.685815334320068, "global_step": 134634, "epoch": 3205} {"train_loss": -6.637118339538574, "global_step": 134635, "epoch": 3205} {"train_loss": -6.627170562744141, "global_step": 134636, "epoch": 3205} {"train_loss": -6.697858810424805, "global_step": 134637, "epoch": 3205} {"train_loss": -6.706547260284424, "global_step": 134638, "epoch": 3205} {"train_loss": -6.7426886558532715, "global_step": 134639, "epoch": 3205} {"train_loss": -6.662390232086182, "global_step": 134640, "epoch": 3205} {"train_loss": -6.679300308227539, "global_step": 134641, "epoch": 3205} {"train_loss": -6.640775680541992, "global_step": 134642, "epoch": 3205} {"train_loss": -6.693471908569336, "global_step": 134643, "epoch": 3205} {"train_loss": -6.626694679260254, "global_step": 134644, "epoch": 3205} {"train_loss": -6.553011894226074, "global_step": 134645, "epoch": 3205} {"train_loss": -6.624556541442871, "global_step": 134646, "epoch": 3205} {"train_loss": -6.633289813995361, "global_step": 134647, "epoch": 3205} {"train_loss": -6.549335479736328, "global_step": 134648, "epoch": 3205} {"train_loss": -6.675060272216797, "global_step": 134649, "epoch": 3205} {"train_loss": -6.709082126617432, "global_step": 134650, "epoch": 3205} {"train_loss": -6.667072432381766, "global_step": 134651, "epoch": 3205, "val_loss": 77833.328125} {"train_loss": -6.75632381439209, "global_step": 134652, "epoch": 3206} {"train_loss": -6.533909320831299, "global_step": 134653, "epoch": 3206} {"train_loss": -6.600221633911133, "global_step": 134654, "epoch": 3206} {"train_loss": -6.558816432952881, "global_step": 134655, "epoch": 3206} {"train_loss": -6.56646728515625, "global_step": 134656, "epoch": 3206} {"train_loss": -6.749778747558594, "global_step": 134657, "epoch": 3206} {"train_loss": -6.67540168762207, "global_step": 134658, "epoch": 3206} {"train_loss": -6.788207530975342, "global_step": 134659, "epoch": 3206} {"train_loss": -6.677634239196777, "global_step": 134660, "epoch": 3206} {"train_loss": -6.650827884674072, "global_step": 134661, "epoch": 3206} {"train_loss": -6.650463104248047, "global_step": 134662, "epoch": 3206} {"train_loss": -6.671170234680176, "global_step": 134663, "epoch": 3206} {"train_loss": -6.685817718505859, "global_step": 134664, "epoch": 3206} {"train_loss": -6.71503210067749, "global_step": 134665, "epoch": 3206} {"train_loss": -6.681600093841553, "global_step": 134666, "epoch": 3206} {"train_loss": -6.816212177276611, "global_step": 134667, "epoch": 3206} {"train_loss": -6.653972625732422, "global_step": 134668, "epoch": 3206} {"train_loss": -6.716290473937988, "global_step": 134669, "epoch": 3206} {"train_loss": -6.578027725219727, "global_step": 134670, "epoch": 3206} {"train_loss": -6.646900653839111, "global_step": 134671, "epoch": 3206} {"train_loss": -6.875853061676025, "global_step": 134672, "epoch": 3206} {"train_loss": -6.713013172149658, "global_step": 134673, "epoch": 3206} {"train_loss": -6.716915607452393, "global_step": 134674, "epoch": 3206} {"train_loss": -6.701805114746094, "global_step": 134675, "epoch": 3206} {"train_loss": -6.6344099044799805, "global_step": 134676, "epoch": 3206} {"train_loss": -6.717142105102539, "global_step": 134677, "epoch": 3206} {"train_loss": -6.583451271057129, "global_step": 134678, "epoch": 3206} {"train_loss": -6.677896022796631, "global_step": 134679, "epoch": 3206} {"train_loss": -6.68079137802124, "global_step": 134680, "epoch": 3206} {"train_loss": -6.535910606384277, "global_step": 134681, "epoch": 3206} {"train_loss": -6.748898983001709, "global_step": 134682, "epoch": 3206} {"train_loss": -6.699128150939941, "global_step": 134683, "epoch": 3206} {"train_loss": -6.688854694366455, "global_step": 134684, "epoch": 3206} {"train_loss": -6.65968132019043, "global_step": 134685, "epoch": 3206} {"train_loss": -6.716386795043945, "global_step": 134686, "epoch": 3206} {"train_loss": -6.639105796813965, "global_step": 134687, "epoch": 3206} {"train_loss": -6.706658840179443, "global_step": 134688, "epoch": 3206} {"train_loss": -6.7288360595703125, "global_step": 134689, "epoch": 3206} {"train_loss": -6.547969341278076, "global_step": 134690, "epoch": 3206} {"train_loss": -6.7429633140563965, "global_step": 134691, "epoch": 3206} {"train_loss": -6.6167311668396, "global_step": 134692, "epoch": 3206} {"train_loss": -6.677018494833083, "global_step": 134693, "epoch": 3206, "val_loss": 77863.03125} {"train_loss": -6.826349258422852, "global_step": 134694, "epoch": 3207} {"train_loss": -6.73478364944458, "global_step": 134695, "epoch": 3207} {"train_loss": -6.813331127166748, "global_step": 134696, "epoch": 3207} {"train_loss": -6.75296688079834, "global_step": 134697, "epoch": 3207} {"train_loss": -6.767905235290527, "global_step": 134698, "epoch": 3207} {"train_loss": -6.777510643005371, "global_step": 134699, "epoch": 3207} {"train_loss": -6.597509860992432, "global_step": 134700, "epoch": 3207} {"train_loss": -6.708134174346924, "global_step": 134701, "epoch": 3207} {"train_loss": -6.725410461425781, "global_step": 134702, "epoch": 3207} {"train_loss": -6.719947338104248, "global_step": 134703, "epoch": 3207} {"train_loss": -6.62950325012207, "global_step": 134704, "epoch": 3207} {"train_loss": -6.711263179779053, "global_step": 134705, "epoch": 3207} {"train_loss": -6.761752128601074, "global_step": 134706, "epoch": 3207} {"train_loss": -6.593968868255615, "global_step": 134707, "epoch": 3207} {"train_loss": -6.596900939941406, "global_step": 134708, "epoch": 3207} {"train_loss": -6.795559406280518, "global_step": 134709, "epoch": 3207} {"train_loss": -6.675156593322754, "global_step": 134710, "epoch": 3207} {"train_loss": -6.889585018157959, "global_step": 134711, "epoch": 3207} {"train_loss": -6.733010768890381, "global_step": 134712, "epoch": 3207} {"train_loss": -6.795262336730957, "global_step": 134713, "epoch": 3207} {"train_loss": -6.716862201690674, "global_step": 134714, "epoch": 3207} {"train_loss": -6.741550445556641, "global_step": 134715, "epoch": 3207} {"train_loss": -6.636703968048096, "global_step": 134716, "epoch": 3207} {"train_loss": -6.710613250732422, "global_step": 134717, "epoch": 3207} {"train_loss": -6.787112236022949, "global_step": 134718, "epoch": 3207} {"train_loss": -6.648983955383301, "global_step": 134719, "epoch": 3207} {"train_loss": -6.585100173950195, "global_step": 134720, "epoch": 3207} {"train_loss": -6.713469982147217, "global_step": 134721, "epoch": 3207} {"train_loss": -6.724975109100342, "global_step": 134722, "epoch": 3207} {"train_loss": -6.620495796203613, "global_step": 134723, "epoch": 3207} {"train_loss": -6.652366638183594, "global_step": 134724, "epoch": 3207} {"train_loss": -6.7523956298828125, "global_step": 134725, "epoch": 3207} {"train_loss": -6.684247970581055, "global_step": 134726, "epoch": 3207} {"train_loss": -6.782296180725098, "global_step": 134727, "epoch": 3207} {"train_loss": -6.760855674743652, "global_step": 134728, "epoch": 3207} {"train_loss": -6.735536098480225, "global_step": 134729, "epoch": 3207} {"train_loss": -6.667764663696289, "global_step": 134730, "epoch": 3207} {"train_loss": -6.674933433532715, "global_step": 134731, "epoch": 3207} {"train_loss": -6.832882881164551, "global_step": 134732, "epoch": 3207} {"train_loss": -6.737490653991699, "global_step": 134733, "epoch": 3207} {"train_loss": -6.649809837341309, "global_step": 134734, "epoch": 3207} {"train_loss": -6.7137538478488015, "global_step": 134735, "epoch": 3207, "val_loss": 77606.9921875} {"train_loss": -6.6493988037109375, "global_step": 134736, "epoch": 3208} {"train_loss": -6.7594146728515625, "global_step": 134737, "epoch": 3208} {"train_loss": -6.674400329589844, "global_step": 134738, "epoch": 3208} {"train_loss": -6.744090557098389, "global_step": 134739, "epoch": 3208} {"train_loss": -6.648962020874023, "global_step": 134740, "epoch": 3208} {"train_loss": -6.729824066162109, "global_step": 134741, "epoch": 3208} {"train_loss": -6.710598945617676, "global_step": 134742, "epoch": 3208} {"train_loss": -6.623658180236816, "global_step": 134743, "epoch": 3208} {"train_loss": -6.875146865844727, "global_step": 134744, "epoch": 3208} {"train_loss": -6.807844161987305, "global_step": 134745, "epoch": 3208} {"train_loss": -6.620148658752441, "global_step": 134746, "epoch": 3208} {"train_loss": -6.69639778137207, "global_step": 134747, "epoch": 3208} {"train_loss": -6.761553764343262, "global_step": 134748, "epoch": 3208} {"train_loss": -6.728943824768066, "global_step": 134749, "epoch": 3208} {"train_loss": -6.609677314758301, "global_step": 134750, "epoch": 3208} {"train_loss": -6.676555633544922, "global_step": 134751, "epoch": 3208} {"train_loss": -6.704093933105469, "global_step": 134752, "epoch": 3208} {"train_loss": -6.8139567375183105, "global_step": 134753, "epoch": 3208} {"train_loss": -6.7056427001953125, "global_step": 134754, "epoch": 3208} {"train_loss": -6.67808723449707, "global_step": 134755, "epoch": 3208} {"train_loss": -6.615581035614014, "global_step": 134756, "epoch": 3208} {"train_loss": -6.666274070739746, "global_step": 134757, "epoch": 3208} {"train_loss": -6.676088333129883, "global_step": 134758, "epoch": 3208} {"train_loss": -6.704341888427734, "global_step": 134759, "epoch": 3208} {"train_loss": -6.707454681396484, "global_step": 134760, "epoch": 3208} {"train_loss": -6.717365741729736, "global_step": 134761, "epoch": 3208} {"train_loss": -6.693267822265625, "global_step": 134762, "epoch": 3208} {"train_loss": -6.780222415924072, "global_step": 134763, "epoch": 3208} {"train_loss": -6.752958297729492, "global_step": 134764, "epoch": 3208} {"train_loss": -6.65150260925293, "global_step": 134765, "epoch": 3208} {"train_loss": -6.715039253234863, "global_step": 134766, "epoch": 3208} {"train_loss": -6.790994644165039, "global_step": 134767, "epoch": 3208} {"train_loss": -6.704189777374268, "global_step": 134768, "epoch": 3208} {"train_loss": -6.7917585372924805, "global_step": 134769, "epoch": 3208} {"train_loss": -6.749934673309326, "global_step": 134770, "epoch": 3208} {"train_loss": -6.757392883300781, "global_step": 134771, "epoch": 3208} {"train_loss": -6.617920398712158, "global_step": 134772, "epoch": 3208} {"train_loss": -6.598855972290039, "global_step": 134773, "epoch": 3208} {"train_loss": -6.769791603088379, "global_step": 134774, "epoch": 3208} {"train_loss": -6.696826934814453, "global_step": 134775, "epoch": 3208} {"train_loss": -6.8367156982421875, "global_step": 134776, "epoch": 3208} {"train_loss": -6.714344762620472, "global_step": 134777, "epoch": 3208, "val_loss": 77770.8359375} {"train_loss": -6.82971715927124, "global_step": 134778, "epoch": 3209} {"train_loss": -6.766119003295898, "global_step": 134779, "epoch": 3209} {"train_loss": -6.796778678894043, "global_step": 134780, "epoch": 3209} {"train_loss": -6.902836799621582, "global_step": 134781, "epoch": 3209} {"train_loss": -6.840493202209473, "global_step": 134782, "epoch": 3209} {"train_loss": -6.738187789916992, "global_step": 134783, "epoch": 3209} {"train_loss": -6.708750247955322, "global_step": 134784, "epoch": 3209} {"train_loss": -6.73902702331543, "global_step": 134785, "epoch": 3209} {"train_loss": -6.691015243530273, "global_step": 134786, "epoch": 3209} {"train_loss": -6.737856864929199, "global_step": 134787, "epoch": 3209} {"train_loss": -6.802859306335449, "global_step": 134788, "epoch": 3209} {"train_loss": -6.663000583648682, "global_step": 134789, "epoch": 3209} {"train_loss": -6.6947784423828125, "global_step": 134790, "epoch": 3209} {"train_loss": -6.744508266448975, "global_step": 134791, "epoch": 3209} {"train_loss": -6.778182506561279, "global_step": 134792, "epoch": 3209} {"train_loss": -6.737456321716309, "global_step": 134793, "epoch": 3209} {"train_loss": -6.7288007736206055, "global_step": 134794, "epoch": 3209} {"train_loss": -6.781266212463379, "global_step": 134795, "epoch": 3209} {"train_loss": -6.715677738189697, "global_step": 134796, "epoch": 3209} {"train_loss": -6.665175914764404, "global_step": 134797, "epoch": 3209} {"train_loss": -6.701055526733398, "global_step": 134798, "epoch": 3209} {"train_loss": -6.753613471984863, "global_step": 134799, "epoch": 3209} {"train_loss": -6.796436309814453, "global_step": 134800, "epoch": 3209} {"train_loss": -6.707269668579102, "global_step": 134801, "epoch": 3209} {"train_loss": -6.760337829589844, "global_step": 134802, "epoch": 3209} {"train_loss": -6.7895917892456055, "global_step": 134803, "epoch": 3209} {"train_loss": -6.7490763664245605, "global_step": 134804, "epoch": 3209} {"train_loss": -6.796685218811035, "global_step": 134805, "epoch": 3209} {"train_loss": -6.673040390014648, "global_step": 134806, "epoch": 3209} {"train_loss": -6.622213363647461, "global_step": 134807, "epoch": 3209} {"train_loss": -6.753650665283203, "global_step": 134808, "epoch": 3209} {"train_loss": -6.674678802490234, "global_step": 134809, "epoch": 3209} {"train_loss": -6.540933609008789, "global_step": 134810, "epoch": 3209} {"train_loss": -6.626645088195801, "global_step": 134811, "epoch": 3209} {"train_loss": -6.672273635864258, "global_step": 134812, "epoch": 3209} {"train_loss": -6.728752613067627, "global_step": 134813, "epoch": 3209} {"train_loss": -6.658126354217529, "global_step": 134814, "epoch": 3209} {"train_loss": -6.6881866455078125, "global_step": 134815, "epoch": 3209} {"train_loss": -6.7214508056640625, "global_step": 134816, "epoch": 3209} {"train_loss": -6.757413864135742, "global_step": 134817, "epoch": 3209} {"train_loss": -6.663235664367676, "global_step": 134818, "epoch": 3209} {"train_loss": -6.7290407703036355, "global_step": 134819, "epoch": 3209, "val_loss": 77842.171875} {"train_loss": -6.688868999481201, "global_step": 134820, "epoch": 3210} {"train_loss": -6.614312648773193, "global_step": 134821, "epoch": 3210} {"train_loss": -6.714090347290039, "global_step": 134822, "epoch": 3210} {"train_loss": -6.7666826248168945, "global_step": 134823, "epoch": 3210} {"train_loss": -6.675296783447266, "global_step": 134824, "epoch": 3210} {"train_loss": -6.717464447021484, "global_step": 134825, "epoch": 3210} {"train_loss": -6.6564717292785645, "global_step": 134826, "epoch": 3210} {"train_loss": -6.671533584594727, "global_step": 134827, "epoch": 3210} {"train_loss": -6.657543182373047, "global_step": 134828, "epoch": 3210} {"train_loss": -6.693905830383301, "global_step": 134829, "epoch": 3210} {"train_loss": -6.649036407470703, "global_step": 134830, "epoch": 3210} {"train_loss": -6.56172513961792, "global_step": 134831, "epoch": 3210} {"train_loss": -6.600027561187744, "global_step": 134832, "epoch": 3210} {"train_loss": -6.736040115356445, "global_step": 134833, "epoch": 3210} {"train_loss": -6.576382637023926, "global_step": 134834, "epoch": 3210} {"train_loss": -6.663149356842041, "global_step": 134835, "epoch": 3210} {"train_loss": -6.532827377319336, "global_step": 134836, "epoch": 3210} {"train_loss": -6.578116416931152, "global_step": 134837, "epoch": 3210} {"train_loss": -6.784650802612305, "global_step": 134838, "epoch": 3210} {"train_loss": -6.5906982421875, "global_step": 134839, "epoch": 3210} {"train_loss": -6.662817001342773, "global_step": 134840, "epoch": 3210} {"train_loss": -6.70281457901001, "global_step": 134841, "epoch": 3210} {"train_loss": -6.587031364440918, "global_step": 134842, "epoch": 3210} {"train_loss": -6.700776100158691, "global_step": 134843, "epoch": 3210} {"train_loss": -6.5216169357299805, "global_step": 134844, "epoch": 3210} {"train_loss": -6.610438823699951, "global_step": 134845, "epoch": 3210} {"train_loss": -6.512015342712402, "global_step": 134846, "epoch": 3210} {"train_loss": -6.831701755523682, "global_step": 134847, "epoch": 3210} {"train_loss": -6.374053955078125, "global_step": 134848, "epoch": 3210} {"train_loss": -6.605892181396484, "global_step": 134849, "epoch": 3210} {"train_loss": -6.495368957519531, "global_step": 134850, "epoch": 3210} {"train_loss": -6.598554611206055, "global_step": 134851, "epoch": 3210} {"train_loss": -6.704774856567383, "global_step": 134852, "epoch": 3210} {"train_loss": -6.591012954711914, "global_step": 134853, "epoch": 3210} {"train_loss": -6.711904048919678, "global_step": 134854, "epoch": 3210} {"train_loss": -6.58610725402832, "global_step": 134855, "epoch": 3210} {"train_loss": -6.548280715942383, "global_step": 134856, "epoch": 3210} {"train_loss": -6.5794782638549805, "global_step": 134857, "epoch": 3210} {"train_loss": -6.6487836837768555, "global_step": 134858, "epoch": 3210} {"train_loss": -6.628159523010254, "global_step": 134859, "epoch": 3210} {"train_loss": -6.695822715759277, "global_step": 134860, "epoch": 3210} {"train_loss": -6.633773962656657, "global_step": 134861, "epoch": 3210, "val_loss": 78017.078125} {"train_loss": -6.726850986480713, "global_step": 134862, "epoch": 3211} {"train_loss": -6.698020935058594, "global_step": 134863, "epoch": 3211} {"train_loss": -6.828454971313477, "global_step": 134864, "epoch": 3211} {"train_loss": -6.637499809265137, "global_step": 134865, "epoch": 3211} {"train_loss": -6.522995948791504, "global_step": 134866, "epoch": 3211} {"train_loss": -6.618323802947998, "global_step": 134867, "epoch": 3211} {"train_loss": -6.539062976837158, "global_step": 134868, "epoch": 3211} {"train_loss": -6.702713966369629, "global_step": 134869, "epoch": 3211} {"train_loss": -6.789544105529785, "global_step": 134870, "epoch": 3211} {"train_loss": -6.709214687347412, "global_step": 134871, "epoch": 3211} {"train_loss": -6.7552595138549805, "global_step": 134872, "epoch": 3211} {"train_loss": -6.586841583251953, "global_step": 134873, "epoch": 3211} {"train_loss": -6.713484287261963, "global_step": 134874, "epoch": 3211} {"train_loss": -6.704499244689941, "global_step": 134875, "epoch": 3211} {"train_loss": -6.7686896324157715, "global_step": 134876, "epoch": 3211} {"train_loss": -6.551774978637695, "global_step": 134877, "epoch": 3211} {"train_loss": -6.766648292541504, "global_step": 134878, "epoch": 3211} {"train_loss": -6.730164051055908, "global_step": 134879, "epoch": 3211} {"train_loss": -6.791838645935059, "global_step": 134880, "epoch": 3211} {"train_loss": -6.8324689865112305, "global_step": 134881, "epoch": 3211} {"train_loss": -6.605940818786621, "global_step": 134882, "epoch": 3211} {"train_loss": -6.718268394470215, "global_step": 134883, "epoch": 3211} {"train_loss": -6.641654014587402, "global_step": 134884, "epoch": 3211} {"train_loss": -6.823409080505371, "global_step": 134885, "epoch": 3211} {"train_loss": -6.781329154968262, "global_step": 134886, "epoch": 3211} {"train_loss": -6.745230674743652, "global_step": 134887, "epoch": 3211} {"train_loss": -6.798418998718262, "global_step": 134888, "epoch": 3211} {"train_loss": -6.700323104858398, "global_step": 134889, "epoch": 3211} {"train_loss": -6.645583152770996, "global_step": 134890, "epoch": 3211} {"train_loss": -6.674729824066162, "global_step": 134891, "epoch": 3211} {"train_loss": -6.596622467041016, "global_step": 134892, "epoch": 3211} {"train_loss": -6.691418647766113, "global_step": 134893, "epoch": 3211} {"train_loss": -6.679553508758545, "global_step": 134894, "epoch": 3211} {"train_loss": -6.710592746734619, "global_step": 134895, "epoch": 3211} {"train_loss": -6.757290840148926, "global_step": 134896, "epoch": 3211} {"train_loss": -6.813129425048828, "global_step": 134897, "epoch": 3211} {"train_loss": -6.773426055908203, "global_step": 134898, "epoch": 3211} {"train_loss": -6.773886680603027, "global_step": 134899, "epoch": 3211} {"train_loss": -6.6666951179504395, "global_step": 134900, "epoch": 3211} {"train_loss": -6.765093803405762, "global_step": 134901, "epoch": 3211} {"train_loss": -6.699349403381348, "global_step": 134902, "epoch": 3211} {"train_loss": -6.707586197626023, "global_step": 134903, "epoch": 3211, "val_loss": 78080.0859375} {"train_loss": -6.6445770263671875, "global_step": 134904, "epoch": 3212} {"train_loss": -6.7901411056518555, "global_step": 134905, "epoch": 3212} {"train_loss": -6.6768293380737305, "global_step": 134906, "epoch": 3212} {"train_loss": -6.787566184997559, "global_step": 134907, "epoch": 3212} {"train_loss": -6.586086273193359, "global_step": 134908, "epoch": 3212} {"train_loss": -6.6365556716918945, "global_step": 134909, "epoch": 3212} {"train_loss": -6.751075744628906, "global_step": 134910, "epoch": 3212} {"train_loss": -6.644640922546387, "global_step": 134911, "epoch": 3212} {"train_loss": -6.771484375, "global_step": 134912, "epoch": 3212} {"train_loss": -6.708288669586182, "global_step": 134913, "epoch": 3212} {"train_loss": -6.624866008758545, "global_step": 134914, "epoch": 3212} {"train_loss": -6.544000625610352, "global_step": 134915, "epoch": 3212} {"train_loss": -6.796457767486572, "global_step": 134916, "epoch": 3212} {"train_loss": -6.610437870025635, "global_step": 134917, "epoch": 3212} {"train_loss": -6.599390983581543, "global_step": 134918, "epoch": 3212} {"train_loss": -6.789096355438232, "global_step": 134919, "epoch": 3212} {"train_loss": -6.688277721405029, "global_step": 134920, "epoch": 3212} {"train_loss": -6.707941055297852, "global_step": 134921, "epoch": 3212} {"train_loss": -6.617349147796631, "global_step": 134922, "epoch": 3212} {"train_loss": -6.650263786315918, "global_step": 134923, "epoch": 3212} {"train_loss": -6.722565650939941, "global_step": 134924, "epoch": 3212} {"train_loss": -6.751922607421875, "global_step": 134925, "epoch": 3212} {"train_loss": -6.745014190673828, "global_step": 134926, "epoch": 3212} {"train_loss": -6.600823402404785, "global_step": 134927, "epoch": 3212} {"train_loss": -6.633380889892578, "global_step": 134928, "epoch": 3212} {"train_loss": -6.811469078063965, "global_step": 134929, "epoch": 3212} {"train_loss": -6.723167419433594, "global_step": 134930, "epoch": 3212} {"train_loss": -6.712061882019043, "global_step": 134931, "epoch": 3212} {"train_loss": -6.61647891998291, "global_step": 134932, "epoch": 3212} {"train_loss": -6.742209434509277, "global_step": 134933, "epoch": 3212} {"train_loss": -6.694746971130371, "global_step": 134934, "epoch": 3212} {"train_loss": -6.768784046173096, "global_step": 134935, "epoch": 3212} {"train_loss": -6.753586769104004, "global_step": 134936, "epoch": 3212} {"train_loss": -6.6606879234313965, "global_step": 134937, "epoch": 3212} {"train_loss": -6.7899065017700195, "global_step": 134938, "epoch": 3212} {"train_loss": -6.639954090118408, "global_step": 134939, "epoch": 3212} {"train_loss": -6.655648231506348, "global_step": 134940, "epoch": 3212} {"train_loss": -6.780580997467041, "global_step": 134941, "epoch": 3212} {"train_loss": -6.726070404052734, "global_step": 134942, "epoch": 3212} {"train_loss": -6.675917148590088, "global_step": 134943, "epoch": 3212} {"train_loss": -6.800331115722656, "global_step": 134944, "epoch": 3212} {"train_loss": -6.698415256681896, "global_step": 134945, "epoch": 3212, "val_loss": 77866.46875} {"train_loss": -6.759955883026123, "global_step": 134946, "epoch": 3213} {"train_loss": -6.701325416564941, "global_step": 134947, "epoch": 3213} {"train_loss": -6.811768531799316, "global_step": 134948, "epoch": 3213} {"train_loss": -6.607944488525391, "global_step": 134949, "epoch": 3213} {"train_loss": -6.767404556274414, "global_step": 134950, "epoch": 3213} {"train_loss": -6.837954521179199, "global_step": 134951, "epoch": 3213} {"train_loss": -6.672147274017334, "global_step": 134952, "epoch": 3213} {"train_loss": -6.8114752769470215, "global_step": 134953, "epoch": 3213} {"train_loss": -6.756255626678467, "global_step": 134954, "epoch": 3213} {"train_loss": -6.81917142868042, "global_step": 134955, "epoch": 3213} {"train_loss": -6.805635929107666, "global_step": 134956, "epoch": 3213} {"train_loss": -6.84454345703125, "global_step": 134957, "epoch": 3213} {"train_loss": -6.62923002243042, "global_step": 134958, "epoch": 3213} {"train_loss": -6.6375885009765625, "global_step": 134959, "epoch": 3213} {"train_loss": -6.749770164489746, "global_step": 134960, "epoch": 3213} {"train_loss": -6.596375465393066, "global_step": 134961, "epoch": 3213} {"train_loss": -6.878614902496338, "global_step": 134962, "epoch": 3213} {"train_loss": -6.789793014526367, "global_step": 134963, "epoch": 3213} {"train_loss": -6.629461288452148, "global_step": 134964, "epoch": 3213} {"train_loss": -6.758336544036865, "global_step": 134965, "epoch": 3213} {"train_loss": -6.688377380371094, "global_step": 134966, "epoch": 3213} {"train_loss": -6.832810401916504, "global_step": 134967, "epoch": 3213} {"train_loss": -6.685091018676758, "global_step": 134968, "epoch": 3213} {"train_loss": -6.691416263580322, "global_step": 134969, "epoch": 3213} {"train_loss": -6.7281599044799805, "global_step": 134970, "epoch": 3213} {"train_loss": -6.622946739196777, "global_step": 134971, "epoch": 3213} {"train_loss": -6.738059043884277, "global_step": 134972, "epoch": 3213} {"train_loss": -6.72080135345459, "global_step": 134973, "epoch": 3213} {"train_loss": -6.641226768493652, "global_step": 134974, "epoch": 3213} {"train_loss": -6.750542163848877, "global_step": 134975, "epoch": 3213} {"train_loss": -6.712821006774902, "global_step": 134976, "epoch": 3213} {"train_loss": -6.631277561187744, "global_step": 134977, "epoch": 3213} {"train_loss": -6.7621307373046875, "global_step": 134978, "epoch": 3213} {"train_loss": -6.64495849609375, "global_step": 134979, "epoch": 3213} {"train_loss": -6.781826972961426, "global_step": 134980, "epoch": 3213} {"train_loss": -6.685098648071289, "global_step": 134981, "epoch": 3213} {"train_loss": -6.712974548339844, "global_step": 134982, "epoch": 3213} {"train_loss": -6.642553806304932, "global_step": 134983, "epoch": 3213} {"train_loss": -6.692901611328125, "global_step": 134984, "epoch": 3213} {"train_loss": -6.675928115844727, "global_step": 134985, "epoch": 3213} {"train_loss": -6.528168678283691, "global_step": 134986, "epoch": 3213} {"train_loss": -6.715835662115188, "global_step": 134987, "epoch": 3213, "val_loss": 77899.609375} {"train_loss": -6.781599044799805, "global_step": 134988, "epoch": 3214} {"train_loss": -6.6686482429504395, "global_step": 134989, "epoch": 3214} {"train_loss": -6.647761821746826, "global_step": 134990, "epoch": 3214} {"train_loss": -6.724039077758789, "global_step": 134991, "epoch": 3214} {"train_loss": -6.753902912139893, "global_step": 134992, "epoch": 3214} {"train_loss": -6.753439903259277, "global_step": 134993, "epoch": 3214} {"train_loss": -6.628212928771973, "global_step": 134994, "epoch": 3214} {"train_loss": -6.680456161499023, "global_step": 134995, "epoch": 3214} {"train_loss": -6.8102617263793945, "global_step": 134996, "epoch": 3214} {"train_loss": -6.702755928039551, "global_step": 134997, "epoch": 3214} {"train_loss": -6.6345977783203125, "global_step": 134998, "epoch": 3214} {"train_loss": -6.671330451965332, "global_step": 134999, "epoch": 3214} {"train_loss": -6.582056522369385, "global_step": 135000, "epoch": 3214} {"train_loss": -6.778806686401367, "global_step": 135001, "epoch": 3214} {"train_loss": -6.714733600616455, "global_step": 135002, "epoch": 3214} {"train_loss": -6.589580535888672, "global_step": 135003, "epoch": 3214} {"train_loss": -6.715520858764648, "global_step": 135004, "epoch": 3214} {"train_loss": -6.516239643096924, "global_step": 135005, "epoch": 3214} {"train_loss": -6.609549522399902, "global_step": 135006, "epoch": 3214} {"train_loss": -6.693815231323242, "global_step": 135007, "epoch": 3214} {"train_loss": -6.794157981872559, "global_step": 135008, "epoch": 3214} {"train_loss": -6.7334136962890625, "global_step": 135009, "epoch": 3214} {"train_loss": -6.784448146820068, "global_step": 135010, "epoch": 3214} {"train_loss": -6.799388885498047, "global_step": 135011, "epoch": 3214} {"train_loss": -6.664758682250977, "global_step": 135012, "epoch": 3214} {"train_loss": -6.76233434677124, "global_step": 135013, "epoch": 3214} {"train_loss": -6.758795738220215, "global_step": 135014, "epoch": 3214} {"train_loss": -6.543766021728516, "global_step": 135015, "epoch": 3214} {"train_loss": -6.811767578125, "global_step": 135016, "epoch": 3214} {"train_loss": -6.691634654998779, "global_step": 135017, "epoch": 3214} {"train_loss": -6.735045433044434, "global_step": 135018, "epoch": 3214} {"train_loss": -6.691594123840332, "global_step": 135019, "epoch": 3214} {"train_loss": -6.694158554077148, "global_step": 135020, "epoch": 3214} {"train_loss": -6.66571569442749, "global_step": 135021, "epoch": 3214} {"train_loss": -6.681551933288574, "global_step": 135022, "epoch": 3214} {"train_loss": -6.780868053436279, "global_step": 135023, "epoch": 3214} {"train_loss": -6.747206687927246, "global_step": 135024, "epoch": 3214} {"train_loss": -6.677602767944336, "global_step": 135025, "epoch": 3214} {"train_loss": -6.723798751831055, "global_step": 135026, "epoch": 3214} {"train_loss": -6.772758483886719, "global_step": 135027, "epoch": 3214} {"train_loss": -6.775489330291748, "global_step": 135028, "epoch": 3214} {"train_loss": -6.709230559212821, "global_step": 135029, "epoch": 3214, "val_loss": 77631.7109375} {"train_loss": -6.864727973937988, "global_step": 135030, "epoch": 3215} {"train_loss": -6.7608771324157715, "global_step": 135031, "epoch": 3215} {"train_loss": -6.765317916870117, "global_step": 135032, "epoch": 3215} {"train_loss": -6.742740631103516, "global_step": 135033, "epoch": 3215} {"train_loss": -6.816131591796875, "global_step": 135034, "epoch": 3215} {"train_loss": -6.756939888000488, "global_step": 135035, "epoch": 3215} {"train_loss": -6.691995620727539, "global_step": 135036, "epoch": 3215} {"train_loss": -6.691006660461426, "global_step": 135037, "epoch": 3215} {"train_loss": -6.751128196716309, "global_step": 135038, "epoch": 3215} {"train_loss": -6.817378520965576, "global_step": 135039, "epoch": 3215} {"train_loss": -6.761466026306152, "global_step": 135040, "epoch": 3215} {"train_loss": -6.776012420654297, "global_step": 135041, "epoch": 3215} {"train_loss": -6.664338111877441, "global_step": 135042, "epoch": 3215} {"train_loss": -6.7106122970581055, "global_step": 135043, "epoch": 3215} {"train_loss": -6.536520957946777, "global_step": 135044, "epoch": 3215} {"train_loss": -6.773508071899414, "global_step": 135045, "epoch": 3215} {"train_loss": -6.615009784698486, "global_step": 135046, "epoch": 3215} {"train_loss": -6.748851776123047, "global_step": 135047, "epoch": 3215} {"train_loss": -6.841974258422852, "global_step": 135048, "epoch": 3215} {"train_loss": -6.7119855880737305, "global_step": 135049, "epoch": 3215} {"train_loss": -6.718399524688721, "global_step": 135050, "epoch": 3215} {"train_loss": -6.661563396453857, "global_step": 135051, "epoch": 3215} {"train_loss": -6.698004722595215, "global_step": 135052, "epoch": 3215} {"train_loss": -6.736781597137451, "global_step": 135053, "epoch": 3215} {"train_loss": -6.76655387878418, "global_step": 135054, "epoch": 3215} {"train_loss": -6.669553756713867, "global_step": 135055, "epoch": 3215} {"train_loss": -6.766321182250977, "global_step": 135056, "epoch": 3215} {"train_loss": -6.762678146362305, "global_step": 135057, "epoch": 3215} {"train_loss": -6.7465691566467285, "global_step": 135058, "epoch": 3215} {"train_loss": -6.668923377990723, "global_step": 135059, "epoch": 3215} {"train_loss": -6.7057719230651855, "global_step": 135060, "epoch": 3215} {"train_loss": -6.846808433532715, "global_step": 135061, "epoch": 3215} {"train_loss": -6.713376998901367, "global_step": 135062, "epoch": 3215} {"train_loss": -6.757533073425293, "global_step": 135063, "epoch": 3215} {"train_loss": -6.788908004760742, "global_step": 135064, "epoch": 3215} {"train_loss": -6.7388834953308105, "global_step": 135065, "epoch": 3215} {"train_loss": -6.796716690063477, "global_step": 135066, "epoch": 3215} {"train_loss": -6.7456865310668945, "global_step": 135067, "epoch": 3215} {"train_loss": -6.76499080657959, "global_step": 135068, "epoch": 3215} {"train_loss": -6.725800514221191, "global_step": 135069, "epoch": 3215} {"train_loss": -6.779715538024902, "global_step": 135070, "epoch": 3215} {"train_loss": -6.7361789998554045, "global_step": 135071, "epoch": 3215, "val_loss": 77824.734375} {"train_loss": -6.7787041664123535, "global_step": 135072, "epoch": 3216} {"train_loss": -6.7494916915893555, "global_step": 135073, "epoch": 3216} {"train_loss": -6.826900005340576, "global_step": 135074, "epoch": 3216} {"train_loss": -6.6694440841674805, "global_step": 135075, "epoch": 3216} {"train_loss": -6.710134506225586, "global_step": 135076, "epoch": 3216} {"train_loss": -6.939681053161621, "global_step": 135077, "epoch": 3216} {"train_loss": -6.816684246063232, "global_step": 135078, "epoch": 3216} {"train_loss": -6.76589298248291, "global_step": 135079, "epoch": 3216} {"train_loss": -6.768783092498779, "global_step": 135080, "epoch": 3216} {"train_loss": -6.670815467834473, "global_step": 135081, "epoch": 3216} {"train_loss": -6.667812347412109, "global_step": 135082, "epoch": 3216} {"train_loss": -6.741726875305176, "global_step": 135083, "epoch": 3216} {"train_loss": -6.758360862731934, "global_step": 135084, "epoch": 3216} {"train_loss": -6.740063667297363, "global_step": 135085, "epoch": 3216} {"train_loss": -6.661220550537109, "global_step": 135086, "epoch": 3216} {"train_loss": -6.6812920570373535, "global_step": 135087, "epoch": 3216} {"train_loss": -6.546971321105957, "global_step": 135088, "epoch": 3216} {"train_loss": -6.618124008178711, "global_step": 135089, "epoch": 3216} {"train_loss": -6.7445759773254395, "global_step": 135090, "epoch": 3216} {"train_loss": -6.718311309814453, "global_step": 135091, "epoch": 3216} {"train_loss": -6.723254680633545, "global_step": 135092, "epoch": 3216} {"train_loss": -6.713471412658691, "global_step": 135093, "epoch": 3216} {"train_loss": -6.778356552124023, "global_step": 135094, "epoch": 3216} {"train_loss": -6.756084442138672, "global_step": 135095, "epoch": 3216} {"train_loss": -6.848660469055176, "global_step": 135096, "epoch": 3216} {"train_loss": -6.8421430587768555, "global_step": 135097, "epoch": 3216} {"train_loss": -6.6168212890625, "global_step": 135098, "epoch": 3216} {"train_loss": -6.652071952819824, "global_step": 135099, "epoch": 3216} {"train_loss": -6.653444290161133, "global_step": 135100, "epoch": 3216} {"train_loss": -6.86574649810791, "global_step": 135101, "epoch": 3216} {"train_loss": -6.74875545501709, "global_step": 135102, "epoch": 3216} {"train_loss": -6.68682861328125, "global_step": 135103, "epoch": 3216} {"train_loss": -6.724254608154297, "global_step": 135104, "epoch": 3216} {"train_loss": -6.715917587280273, "global_step": 135105, "epoch": 3216} {"train_loss": -6.687942981719971, "global_step": 135106, "epoch": 3216} {"train_loss": -6.833129405975342, "global_step": 135107, "epoch": 3216} {"train_loss": -6.806652069091797, "global_step": 135108, "epoch": 3216} {"train_loss": -6.673892974853516, "global_step": 135109, "epoch": 3216} {"train_loss": -6.777178764343262, "global_step": 135110, "epoch": 3216} {"train_loss": -6.892978668212891, "global_step": 135111, "epoch": 3216} {"train_loss": -6.844996452331543, "global_step": 135112, "epoch": 3216} {"train_loss": -6.742350351242792, "global_step": 135113, "epoch": 3216, "val_loss": 77603.421875} {"train_loss": -6.790135383605957, "global_step": 135114, "epoch": 3217} {"train_loss": -6.809088230133057, "global_step": 135115, "epoch": 3217} {"train_loss": -6.76560115814209, "global_step": 135116, "epoch": 3217} {"train_loss": -6.783997535705566, "global_step": 135117, "epoch": 3217} {"train_loss": -6.874527931213379, "global_step": 135118, "epoch": 3217} {"train_loss": -6.762312889099121, "global_step": 135119, "epoch": 3217} {"train_loss": -6.797784805297852, "global_step": 135120, "epoch": 3217} {"train_loss": -6.843622207641602, "global_step": 135121, "epoch": 3217} {"train_loss": -6.804111480712891, "global_step": 135122, "epoch": 3217} {"train_loss": -6.760690689086914, "global_step": 135123, "epoch": 3217} {"train_loss": -6.726646423339844, "global_step": 135124, "epoch": 3217} {"train_loss": -6.847654342651367, "global_step": 135125, "epoch": 3217} {"train_loss": -6.711332321166992, "global_step": 135126, "epoch": 3217} {"train_loss": -6.83741569519043, "global_step": 135127, "epoch": 3217} {"train_loss": -6.742727279663086, "global_step": 135128, "epoch": 3217} {"train_loss": -6.678661346435547, "global_step": 135129, "epoch": 3217} {"train_loss": -6.6309309005737305, "global_step": 135130, "epoch": 3217} {"train_loss": -6.6979780197143555, "global_step": 135131, "epoch": 3217} {"train_loss": -6.640040874481201, "global_step": 135132, "epoch": 3217} {"train_loss": -6.621884346008301, "global_step": 135133, "epoch": 3217} {"train_loss": -6.668052673339844, "global_step": 135134, "epoch": 3217} {"train_loss": -6.700692653656006, "global_step": 135135, "epoch": 3217} {"train_loss": -6.676734924316406, "global_step": 135136, "epoch": 3217} {"train_loss": -6.660727024078369, "global_step": 135137, "epoch": 3217} {"train_loss": -6.830587863922119, "global_step": 135138, "epoch": 3217} {"train_loss": -6.674614906311035, "global_step": 135139, "epoch": 3217} {"train_loss": -6.663055419921875, "global_step": 135140, "epoch": 3217} {"train_loss": -6.741979598999023, "global_step": 135141, "epoch": 3217} {"train_loss": -6.733495712280273, "global_step": 135142, "epoch": 3217} {"train_loss": -6.670711517333984, "global_step": 135143, "epoch": 3217} {"train_loss": -6.684961795806885, "global_step": 135144, "epoch": 3217} {"train_loss": -6.668035507202148, "global_step": 135145, "epoch": 3217} {"train_loss": -6.726723670959473, "global_step": 135146, "epoch": 3217} {"train_loss": -6.730100631713867, "global_step": 135147, "epoch": 3217} {"train_loss": -6.601075172424316, "global_step": 135148, "epoch": 3217} {"train_loss": -6.714552879333496, "global_step": 135149, "epoch": 3217} {"train_loss": -6.701422691345215, "global_step": 135150, "epoch": 3217} {"train_loss": -6.69047737121582, "global_step": 135151, "epoch": 3217} {"train_loss": -6.6627092361450195, "global_step": 135152, "epoch": 3217} {"train_loss": -6.651709079742432, "global_step": 135153, "epoch": 3217} {"train_loss": -6.671232223510742, "global_step": 135154, "epoch": 3217} {"train_loss": -6.719912052154541, "global_step": 135155, "epoch": 3217, "val_loss": 77861.6484375} {"train_loss": -6.7128143310546875, "global_step": 135156, "epoch": 3218} {"train_loss": -6.582819938659668, "global_step": 135157, "epoch": 3218} {"train_loss": -6.568124294281006, "global_step": 135158, "epoch": 3218} {"train_loss": -6.814783096313477, "global_step": 135159, "epoch": 3218} {"train_loss": -6.682032585144043, "global_step": 135160, "epoch": 3218} {"train_loss": -6.63297176361084, "global_step": 135161, "epoch": 3218} {"train_loss": -6.836182594299316, "global_step": 135162, "epoch": 3218} {"train_loss": -6.659666538238525, "global_step": 135163, "epoch": 3218} {"train_loss": -6.486437797546387, "global_step": 135164, "epoch": 3218} {"train_loss": -6.573144912719727, "global_step": 135165, "epoch": 3218} {"train_loss": -6.595645904541016, "global_step": 135166, "epoch": 3218} {"train_loss": -6.6846232414245605, "global_step": 135167, "epoch": 3218} {"train_loss": -6.679660797119141, "global_step": 135168, "epoch": 3218} {"train_loss": -6.5737810134887695, "global_step": 135169, "epoch": 3218} {"train_loss": -6.735893249511719, "global_step": 135170, "epoch": 3218} {"train_loss": -6.661869525909424, "global_step": 135171, "epoch": 3218} {"train_loss": -6.667593479156494, "global_step": 135172, "epoch": 3218} {"train_loss": -6.633991718292236, "global_step": 135173, "epoch": 3218} {"train_loss": -6.6271467208862305, "global_step": 135174, "epoch": 3218} {"train_loss": -6.5108113288879395, "global_step": 135175, "epoch": 3218} {"train_loss": -6.595791339874268, "global_step": 135176, "epoch": 3218} {"train_loss": -6.707658290863037, "global_step": 135177, "epoch": 3218} {"train_loss": -6.553246021270752, "global_step": 135178, "epoch": 3218} {"train_loss": -6.6261067390441895, "global_step": 135179, "epoch": 3218} {"train_loss": -6.516932010650635, "global_step": 135180, "epoch": 3218} {"train_loss": -6.676937103271484, "global_step": 135181, "epoch": 3218} {"train_loss": -6.66185188293457, "global_step": 135182, "epoch": 3218} {"train_loss": -6.688641548156738, "global_step": 135183, "epoch": 3218} {"train_loss": -6.577735900878906, "global_step": 135184, "epoch": 3218} {"train_loss": -6.715734958648682, "global_step": 135185, "epoch": 3218} {"train_loss": -6.724530220031738, "global_step": 135186, "epoch": 3218} {"train_loss": -6.691447734832764, "global_step": 135187, "epoch": 3218} {"train_loss": -6.686470985412598, "global_step": 135188, "epoch": 3218} {"train_loss": -6.762479782104492, "global_step": 135189, "epoch": 3218} {"train_loss": -6.7914838790893555, "global_step": 135190, "epoch": 3218} {"train_loss": -6.704373836517334, "global_step": 135191, "epoch": 3218} {"train_loss": -6.647023677825928, "global_step": 135192, "epoch": 3218} {"train_loss": -6.60211181640625, "global_step": 135193, "epoch": 3218} {"train_loss": -6.677069664001465, "global_step": 135194, "epoch": 3218} {"train_loss": -6.721159934997559, "global_step": 135195, "epoch": 3218} {"train_loss": -6.73674201965332, "global_step": 135196, "epoch": 3218} {"train_loss": -6.659830206916446, "global_step": 135197, "epoch": 3218, "val_loss": 77593.2109375} {"train_loss": -6.786934852600098, "global_step": 135198, "epoch": 3219} {"train_loss": -6.802126884460449, "global_step": 135199, "epoch": 3219} {"train_loss": -6.72295618057251, "global_step": 135200, "epoch": 3219} {"train_loss": -6.754899024963379, "global_step": 135201, "epoch": 3219} {"train_loss": -6.776350021362305, "global_step": 135202, "epoch": 3219} {"train_loss": -6.741467475891113, "global_step": 135203, "epoch": 3219} {"train_loss": -6.767900466918945, "global_step": 135204, "epoch": 3219} {"train_loss": -6.640494346618652, "global_step": 135205, "epoch": 3219} {"train_loss": -6.787303924560547, "global_step": 135206, "epoch": 3219} {"train_loss": -6.786273956298828, "global_step": 135207, "epoch": 3219} {"train_loss": -6.829724311828613, "global_step": 135208, "epoch": 3219} {"train_loss": -6.7081146240234375, "global_step": 135209, "epoch": 3219} {"train_loss": -6.804427623748779, "global_step": 135210, "epoch": 3219} {"train_loss": -6.789722919464111, "global_step": 135211, "epoch": 3219} {"train_loss": -6.8832292556762695, "global_step": 135212, "epoch": 3219} {"train_loss": -6.753383636474609, "global_step": 135213, "epoch": 3219} {"train_loss": -6.772212028503418, "global_step": 135214, "epoch": 3219} {"train_loss": -6.684097766876221, "global_step": 135215, "epoch": 3219} {"train_loss": -6.683620929718018, "global_step": 135216, "epoch": 3219} {"train_loss": -6.756275177001953, "global_step": 135217, "epoch": 3219} {"train_loss": -6.551945209503174, "global_step": 135218, "epoch": 3219} {"train_loss": -6.7316203117370605, "global_step": 135219, "epoch": 3219} {"train_loss": -6.639407157897949, "global_step": 135220, "epoch": 3219} {"train_loss": -6.550330638885498, "global_step": 135221, "epoch": 3219} {"train_loss": -6.705435752868652, "global_step": 135222, "epoch": 3219} {"train_loss": -6.709139823913574, "global_step": 135223, "epoch": 3219} {"train_loss": -6.659785270690918, "global_step": 135224, "epoch": 3219} {"train_loss": -6.793025016784668, "global_step": 135225, "epoch": 3219} {"train_loss": -6.8156538009643555, "global_step": 135226, "epoch": 3219} {"train_loss": -6.801455497741699, "global_step": 135227, "epoch": 3219} {"train_loss": -6.7474565505981445, "global_step": 135228, "epoch": 3219} {"train_loss": -6.648652076721191, "global_step": 135229, "epoch": 3219} {"train_loss": -6.8392438888549805, "global_step": 135230, "epoch": 3219} {"train_loss": -6.747188568115234, "global_step": 135231, "epoch": 3219} {"train_loss": -6.699651718139648, "global_step": 135232, "epoch": 3219} {"train_loss": -6.753770351409912, "global_step": 135233, "epoch": 3219} {"train_loss": -6.703829288482666, "global_step": 135234, "epoch": 3219} {"train_loss": -6.82416296005249, "global_step": 135235, "epoch": 3219} {"train_loss": -6.6732025146484375, "global_step": 135236, "epoch": 3219} {"train_loss": -6.824247360229492, "global_step": 135237, "epoch": 3219} {"train_loss": -6.8476972579956055, "global_step": 135238, "epoch": 3219} {"train_loss": -6.742226112456549, "global_step": 135239, "epoch": 3219, "val_loss": 77882.9140625} {"train_loss": -6.748357772827148, "global_step": 135240, "epoch": 3220} {"train_loss": -6.75018310546875, "global_step": 135241, "epoch": 3220} {"train_loss": -6.815213680267334, "global_step": 135242, "epoch": 3220} {"train_loss": -6.850342273712158, "global_step": 135243, "epoch": 3220} {"train_loss": -6.770838737487793, "global_step": 135244, "epoch": 3220} {"train_loss": -6.665894508361816, "global_step": 135245, "epoch": 3220} {"train_loss": -6.63419246673584, "global_step": 135246, "epoch": 3220} {"train_loss": -6.656192302703857, "global_step": 135247, "epoch": 3220} {"train_loss": -6.7235493659973145, "global_step": 135248, "epoch": 3220} {"train_loss": -6.700322151184082, "global_step": 135249, "epoch": 3220} {"train_loss": -6.751217842102051, "global_step": 135250, "epoch": 3220} {"train_loss": -6.73985481262207, "global_step": 135251, "epoch": 3220} {"train_loss": -6.612780570983887, "global_step": 135252, "epoch": 3220} {"train_loss": -6.67075777053833, "global_step": 135253, "epoch": 3220} {"train_loss": -6.780391216278076, "global_step": 135254, "epoch": 3220} {"train_loss": -6.652266025543213, "global_step": 135255, "epoch": 3220} {"train_loss": -6.5830230712890625, "global_step": 135256, "epoch": 3220} {"train_loss": -6.780017375946045, "global_step": 135257, "epoch": 3220} {"train_loss": -6.689505577087402, "global_step": 135258, "epoch": 3220} {"train_loss": -6.783605575561523, "global_step": 135259, "epoch": 3220} {"train_loss": -6.69010066986084, "global_step": 135260, "epoch": 3220} {"train_loss": -6.597978115081787, "global_step": 135261, "epoch": 3220} {"train_loss": -6.611765384674072, "global_step": 135262, "epoch": 3220} {"train_loss": -6.809893608093262, "global_step": 135263, "epoch": 3220} {"train_loss": -6.843732833862305, "global_step": 135264, "epoch": 3220} {"train_loss": -6.714847564697266, "global_step": 135265, "epoch": 3220} {"train_loss": -6.690500259399414, "global_step": 135266, "epoch": 3220} {"train_loss": -6.7868242263793945, "global_step": 135267, "epoch": 3220} {"train_loss": -6.724571228027344, "global_step": 135268, "epoch": 3220} {"train_loss": -6.731501579284668, "global_step": 135269, "epoch": 3220} {"train_loss": -6.776006698608398, "global_step": 135270, "epoch": 3220} {"train_loss": -6.753880977630615, "global_step": 135271, "epoch": 3220} {"train_loss": -6.756484031677246, "global_step": 135272, "epoch": 3220} {"train_loss": -6.797827243804932, "global_step": 135273, "epoch": 3220} {"train_loss": -6.7663774490356445, "global_step": 135274, "epoch": 3220} {"train_loss": -6.684908390045166, "global_step": 135275, "epoch": 3220} {"train_loss": -6.7192583084106445, "global_step": 135276, "epoch": 3220} {"train_loss": -6.745378017425537, "global_step": 135277, "epoch": 3220} {"train_loss": -6.7514238357543945, "global_step": 135278, "epoch": 3220} {"train_loss": -6.704880714416504, "global_step": 135279, "epoch": 3220} {"train_loss": -6.745635032653809, "global_step": 135280, "epoch": 3220} {"train_loss": -6.727381501879011, "global_step": 135281, "epoch": 3220, "val_loss": 77921.171875} {"train_loss": -6.738414764404297, "global_step": 135282, "epoch": 3221} {"train_loss": -6.827216625213623, "global_step": 135283, "epoch": 3221} {"train_loss": -6.668614387512207, "global_step": 135284, "epoch": 3221} {"train_loss": -6.644264221191406, "global_step": 135285, "epoch": 3221} {"train_loss": -6.692303657531738, "global_step": 135286, "epoch": 3221} {"train_loss": -6.797661304473877, "global_step": 135287, "epoch": 3221} {"train_loss": -6.7653489112854, "global_step": 135288, "epoch": 3221} {"train_loss": -6.803134441375732, "global_step": 135289, "epoch": 3221} {"train_loss": -6.743039608001709, "global_step": 135290, "epoch": 3221} {"train_loss": -6.7305192947387695, "global_step": 135291, "epoch": 3221} {"train_loss": -6.771939277648926, "global_step": 135292, "epoch": 3221} {"train_loss": -6.780167579650879, "global_step": 135293, "epoch": 3221} {"train_loss": -6.823513984680176, "global_step": 135294, "epoch": 3221} {"train_loss": -6.738157272338867, "global_step": 135295, "epoch": 3221} {"train_loss": -6.766529560089111, "global_step": 135296, "epoch": 3221} {"train_loss": -6.800630569458008, "global_step": 135297, "epoch": 3221} {"train_loss": -6.752342224121094, "global_step": 135298, "epoch": 3221} {"train_loss": -6.699912071228027, "global_step": 135299, "epoch": 3221} {"train_loss": -6.6757731437683105, "global_step": 135300, "epoch": 3221} {"train_loss": -6.629815101623535, "global_step": 135301, "epoch": 3221} {"train_loss": -6.729811668395996, "global_step": 135302, "epoch": 3221} {"train_loss": -6.541637420654297, "global_step": 135303, "epoch": 3221} {"train_loss": -6.648877143859863, "global_step": 135304, "epoch": 3221} {"train_loss": -6.5989274978637695, "global_step": 135305, "epoch": 3221} {"train_loss": -6.618804931640625, "global_step": 135306, "epoch": 3221} {"train_loss": -6.7487945556640625, "global_step": 135307, "epoch": 3221} {"train_loss": -6.700106620788574, "global_step": 135308, "epoch": 3221} {"train_loss": -6.7728424072265625, "global_step": 135309, "epoch": 3221} {"train_loss": -6.657044410705566, "global_step": 135310, "epoch": 3221} {"train_loss": -6.723060607910156, "global_step": 135311, "epoch": 3221} {"train_loss": -6.581241607666016, "global_step": 135312, "epoch": 3221} {"train_loss": -6.612920761108398, "global_step": 135313, "epoch": 3221} {"train_loss": -6.746838092803955, "global_step": 135314, "epoch": 3221} {"train_loss": -6.793488502502441, "global_step": 135315, "epoch": 3221} {"train_loss": -6.767858505249023, "global_step": 135316, "epoch": 3221} {"train_loss": -6.651877403259277, "global_step": 135317, "epoch": 3221} {"train_loss": -6.71558952331543, "global_step": 135318, "epoch": 3221} {"train_loss": -6.590844631195068, "global_step": 135319, "epoch": 3221} {"train_loss": -6.689889430999756, "global_step": 135320, "epoch": 3221} {"train_loss": -6.738661289215088, "global_step": 135321, "epoch": 3221} {"train_loss": -6.631261825561523, "global_step": 135322, "epoch": 3221} {"train_loss": -6.710775398072743, "global_step": 135323, "epoch": 3221, "val_loss": 77902.0390625} {"train_loss": -6.779610633850098, "global_step": 135324, "epoch": 3222} {"train_loss": -6.740623474121094, "global_step": 135325, "epoch": 3222} {"train_loss": -6.79287576675415, "global_step": 135326, "epoch": 3222} {"train_loss": -6.744817733764648, "global_step": 135327, "epoch": 3222} {"train_loss": -6.829732418060303, "global_step": 135328, "epoch": 3222} {"train_loss": -6.747559070587158, "global_step": 135329, "epoch": 3222} {"train_loss": -6.673570156097412, "global_step": 135330, "epoch": 3222} {"train_loss": -6.71436882019043, "global_step": 135331, "epoch": 3222} {"train_loss": -6.662013530731201, "global_step": 135332, "epoch": 3222} {"train_loss": -6.896812915802002, "global_step": 135333, "epoch": 3222} {"train_loss": -6.643138885498047, "global_step": 135334, "epoch": 3222} {"train_loss": -6.675093650817871, "global_step": 135335, "epoch": 3222} {"train_loss": -6.780585289001465, "global_step": 135336, "epoch": 3222} {"train_loss": -6.545149326324463, "global_step": 135337, "epoch": 3222} {"train_loss": -6.760732650756836, "global_step": 135338, "epoch": 3222} {"train_loss": -6.596746921539307, "global_step": 135339, "epoch": 3222} {"train_loss": -6.601886749267578, "global_step": 135340, "epoch": 3222} {"train_loss": -6.634254455566406, "global_step": 135341, "epoch": 3222} {"train_loss": -6.665716171264648, "global_step": 135342, "epoch": 3222} {"train_loss": -6.598336219787598, "global_step": 135343, "epoch": 3222} {"train_loss": -6.687515735626221, "global_step": 135344, "epoch": 3222} {"train_loss": -6.614011287689209, "global_step": 135345, "epoch": 3222} {"train_loss": -6.723491191864014, "global_step": 135346, "epoch": 3222} {"train_loss": -6.70539665222168, "global_step": 135347, "epoch": 3222} {"train_loss": -6.6223955154418945, "global_step": 135348, "epoch": 3222} {"train_loss": -6.833595275878906, "global_step": 135349, "epoch": 3222} {"train_loss": -6.645986557006836, "global_step": 135350, "epoch": 3222} {"train_loss": -6.731103897094727, "global_step": 135351, "epoch": 3222} {"train_loss": -6.717947959899902, "global_step": 135352, "epoch": 3222} {"train_loss": -6.704606533050537, "global_step": 135353, "epoch": 3222} {"train_loss": -6.769465446472168, "global_step": 135354, "epoch": 3222} {"train_loss": -6.749248504638672, "global_step": 135355, "epoch": 3222} {"train_loss": -6.8109636306762695, "global_step": 135356, "epoch": 3222} {"train_loss": -6.7469096183776855, "global_step": 135357, "epoch": 3222} {"train_loss": -6.764156818389893, "global_step": 135358, "epoch": 3222} {"train_loss": -6.827712059020996, "global_step": 135359, "epoch": 3222} {"train_loss": -6.773453235626221, "global_step": 135360, "epoch": 3222} {"train_loss": -6.803993225097656, "global_step": 135361, "epoch": 3222} {"train_loss": -6.768159866333008, "global_step": 135362, "epoch": 3222} {"train_loss": -6.698267459869385, "global_step": 135363, "epoch": 3222} {"train_loss": -6.675305366516113, "global_step": 135364, "epoch": 3222} {"train_loss": -6.719105164210002, "global_step": 135365, "epoch": 3222, "val_loss": 77920.890625} {"train_loss": -6.759604454040527, "global_step": 135366, "epoch": 3223} {"train_loss": -6.696667671203613, "global_step": 135367, "epoch": 3223} {"train_loss": -6.664762020111084, "global_step": 135368, "epoch": 3223} {"train_loss": -6.668430805206299, "global_step": 135369, "epoch": 3223} {"train_loss": -6.688869476318359, "global_step": 135370, "epoch": 3223} {"train_loss": -6.7273030281066895, "global_step": 135371, "epoch": 3223} {"train_loss": -6.618615627288818, "global_step": 135372, "epoch": 3223} {"train_loss": -6.769671440124512, "global_step": 135373, "epoch": 3223} {"train_loss": -6.599093437194824, "global_step": 135374, "epoch": 3223} {"train_loss": -6.680136680603027, "global_step": 135375, "epoch": 3223} {"train_loss": -6.6864213943481445, "global_step": 135376, "epoch": 3223} {"train_loss": -6.616947174072266, "global_step": 135377, "epoch": 3223} {"train_loss": -6.732329845428467, "global_step": 135378, "epoch": 3223} {"train_loss": -6.603913307189941, "global_step": 135379, "epoch": 3223} {"train_loss": -6.648065567016602, "global_step": 135380, "epoch": 3223} {"train_loss": -6.72403621673584, "global_step": 135381, "epoch": 3223} {"train_loss": -6.64786958694458, "global_step": 135382, "epoch": 3223} {"train_loss": -6.759519577026367, "global_step": 135383, "epoch": 3223} {"train_loss": -6.571933746337891, "global_step": 135384, "epoch": 3223} {"train_loss": -6.726690292358398, "global_step": 135385, "epoch": 3223} {"train_loss": -6.651941776275635, "global_step": 135386, "epoch": 3223} {"train_loss": -6.730507850646973, "global_step": 135387, "epoch": 3223} {"train_loss": -6.706052780151367, "global_step": 135388, "epoch": 3223} {"train_loss": -6.612793922424316, "global_step": 135389, "epoch": 3223} {"train_loss": -6.6126532554626465, "global_step": 135390, "epoch": 3223} {"train_loss": -6.685737609863281, "global_step": 135391, "epoch": 3223} {"train_loss": -6.752143859863281, "global_step": 135392, "epoch": 3223} {"train_loss": -6.745988845825195, "global_step": 135393, "epoch": 3223} {"train_loss": -6.72591495513916, "global_step": 135394, "epoch": 3223} {"train_loss": -6.8618927001953125, "global_step": 135395, "epoch": 3223} {"train_loss": -6.6745429039001465, "global_step": 135396, "epoch": 3223} {"train_loss": -6.641092300415039, "global_step": 135397, "epoch": 3223} {"train_loss": -6.713247299194336, "global_step": 135398, "epoch": 3223} {"train_loss": -6.6959943771362305, "global_step": 135399, "epoch": 3223} {"train_loss": -6.727556228637695, "global_step": 135400, "epoch": 3223} {"train_loss": -6.725386142730713, "global_step": 135401, "epoch": 3223} {"train_loss": -6.773873805999756, "global_step": 135402, "epoch": 3223} {"train_loss": -6.800325393676758, "global_step": 135403, "epoch": 3223} {"train_loss": -6.764806747436523, "global_step": 135404, "epoch": 3223} {"train_loss": -6.856250286102295, "global_step": 135405, "epoch": 3223} {"train_loss": -6.68779182434082, "global_step": 135406, "epoch": 3223} {"train_loss": -6.702046235402425, "global_step": 135407, "epoch": 3223, "val_loss": 77819.71875} {"train_loss": -6.762105464935303, "global_step": 135408, "epoch": 3224} {"train_loss": -6.8059844970703125, "global_step": 135409, "epoch": 3224} {"train_loss": -6.873563766479492, "global_step": 135410, "epoch": 3224} {"train_loss": -6.717174530029297, "global_step": 135411, "epoch": 3224} {"train_loss": -6.728361129760742, "global_step": 135412, "epoch": 3224} {"train_loss": -6.701590538024902, "global_step": 135413, "epoch": 3224} {"train_loss": -6.734795570373535, "global_step": 135414, "epoch": 3224} {"train_loss": -6.720116138458252, "global_step": 135415, "epoch": 3224} {"train_loss": -6.7145795822143555, "global_step": 135416, "epoch": 3224} {"train_loss": -6.695289611816406, "global_step": 135417, "epoch": 3224} {"train_loss": -6.6400041580200195, "global_step": 135418, "epoch": 3224} {"train_loss": -6.8016462326049805, "global_step": 135419, "epoch": 3224} {"train_loss": -6.76407527923584, "global_step": 135420, "epoch": 3224} {"train_loss": -6.8343915939331055, "global_step": 135421, "epoch": 3224} {"train_loss": -6.725677490234375, "global_step": 135422, "epoch": 3224} {"train_loss": -6.727123737335205, "global_step": 135423, "epoch": 3224} {"train_loss": -6.7652435302734375, "global_step": 135424, "epoch": 3224} {"train_loss": -6.722776412963867, "global_step": 135425, "epoch": 3224} {"train_loss": -6.740024089813232, "global_step": 135426, "epoch": 3224} {"train_loss": -6.799463748931885, "global_step": 135427, "epoch": 3224} {"train_loss": -6.761476516723633, "global_step": 135428, "epoch": 3224} {"train_loss": -6.6399641036987305, "global_step": 135429, "epoch": 3224} {"train_loss": -6.802131175994873, "global_step": 135430, "epoch": 3224} {"train_loss": -6.830846309661865, "global_step": 135431, "epoch": 3224} {"train_loss": -6.751007080078125, "global_step": 135432, "epoch": 3224} {"train_loss": -6.657411575317383, "global_step": 135433, "epoch": 3224} {"train_loss": -6.744869232177734, "global_step": 135434, "epoch": 3224} {"train_loss": -6.66297721862793, "global_step": 135435, "epoch": 3224} {"train_loss": -6.854437351226807, "global_step": 135436, "epoch": 3224} {"train_loss": -6.719247817993164, "global_step": 135437, "epoch": 3224} {"train_loss": -6.74945068359375, "global_step": 135438, "epoch": 3224} {"train_loss": -6.83579683303833, "global_step": 135439, "epoch": 3224} {"train_loss": -6.715949058532715, "global_step": 135440, "epoch": 3224} {"train_loss": -6.779080867767334, "global_step": 135441, "epoch": 3224} {"train_loss": -6.7073845863342285, "global_step": 135442, "epoch": 3224} {"train_loss": -6.739444732666016, "global_step": 135443, "epoch": 3224} {"train_loss": -6.815743923187256, "global_step": 135444, "epoch": 3224} {"train_loss": -6.713167667388916, "global_step": 135445, "epoch": 3224} {"train_loss": -6.759095668792725, "global_step": 135446, "epoch": 3224} {"train_loss": -6.568641662597656, "global_step": 135447, "epoch": 3224} {"train_loss": -6.614894866943359, "global_step": 135448, "epoch": 3224} {"train_loss": -6.7400319916861395, "global_step": 135449, "epoch": 3224, "val_loss": 77800.515625} {"train_loss": -6.629899024963379, "global_step": 135450, "epoch": 3225} {"train_loss": -6.690275192260742, "global_step": 135451, "epoch": 3225} {"train_loss": -6.71958589553833, "global_step": 135452, "epoch": 3225} {"train_loss": -6.550294876098633, "global_step": 135453, "epoch": 3225} {"train_loss": -6.560505390167236, "global_step": 135454, "epoch": 3225} {"train_loss": -6.525237083435059, "global_step": 135455, "epoch": 3225} {"train_loss": -6.58270263671875, "global_step": 135456, "epoch": 3225} {"train_loss": -6.630053520202637, "global_step": 135457, "epoch": 3225} {"train_loss": -6.559377670288086, "global_step": 135458, "epoch": 3225} {"train_loss": -6.579554557800293, "global_step": 135459, "epoch": 3225} {"train_loss": -6.678834915161133, "global_step": 135460, "epoch": 3225} {"train_loss": -6.614530563354492, "global_step": 135461, "epoch": 3225} {"train_loss": -6.77358341217041, "global_step": 135462, "epoch": 3225} {"train_loss": -6.561211585998535, "global_step": 135463, "epoch": 3225} {"train_loss": -6.726254940032959, "global_step": 135464, "epoch": 3225} {"train_loss": -6.653441429138184, "global_step": 135465, "epoch": 3225} {"train_loss": -6.740582466125488, "global_step": 135466, "epoch": 3225} {"train_loss": -6.6861395835876465, "global_step": 135467, "epoch": 3225} {"train_loss": -6.71272087097168, "global_step": 135468, "epoch": 3225} {"train_loss": -6.681584358215332, "global_step": 135469, "epoch": 3225} {"train_loss": -6.751291751861572, "global_step": 135470, "epoch": 3225} {"train_loss": -6.7291035652160645, "global_step": 135471, "epoch": 3225} {"train_loss": -6.595057010650635, "global_step": 135472, "epoch": 3225} {"train_loss": -6.753548622131348, "global_step": 135473, "epoch": 3225} {"train_loss": -6.779247283935547, "global_step": 135474, "epoch": 3225} {"train_loss": -6.629394054412842, "global_step": 135475, "epoch": 3225} {"train_loss": -6.658450126647949, "global_step": 135476, "epoch": 3225} {"train_loss": -6.72629451751709, "global_step": 135477, "epoch": 3225} {"train_loss": -6.748687744140625, "global_step": 135478, "epoch": 3225} {"train_loss": -6.66163444519043, "global_step": 135479, "epoch": 3225} {"train_loss": -6.589973449707031, "global_step": 135480, "epoch": 3225} {"train_loss": -6.667237281799316, "global_step": 135481, "epoch": 3225} {"train_loss": -6.749488830566406, "global_step": 135482, "epoch": 3225} {"train_loss": -6.743716716766357, "global_step": 135483, "epoch": 3225} {"train_loss": -6.722590923309326, "global_step": 135484, "epoch": 3225} {"train_loss": -6.705261707305908, "global_step": 135485, "epoch": 3225} {"train_loss": -6.736602783203125, "global_step": 135486, "epoch": 3225} {"train_loss": -6.6556196212768555, "global_step": 135487, "epoch": 3225} {"train_loss": -6.658327579498291, "global_step": 135488, "epoch": 3225} {"train_loss": -6.704130172729492, "global_step": 135489, "epoch": 3225} {"train_loss": -6.632023811340332, "global_step": 135490, "epoch": 3225} {"train_loss": -6.6695162909371515, "global_step": 135491, "epoch": 3225, "val_loss": 78073.2734375} {"train_loss": -6.6492109298706055, "global_step": 135492, "epoch": 3226} {"train_loss": -6.638546943664551, "global_step": 135493, "epoch": 3226} {"train_loss": -6.557200908660889, "global_step": 135494, "epoch": 3226} {"train_loss": -6.505995750427246, "global_step": 135495, "epoch": 3226} {"train_loss": -6.678505897521973, "global_step": 135496, "epoch": 3226} {"train_loss": -6.719113349914551, "global_step": 135497, "epoch": 3226} {"train_loss": -6.581181049346924, "global_step": 135498, "epoch": 3226} {"train_loss": -6.670169830322266, "global_step": 135499, "epoch": 3226} {"train_loss": -6.714470863342285, "global_step": 135500, "epoch": 3226} {"train_loss": -6.604281902313232, "global_step": 135501, "epoch": 3226} {"train_loss": -6.758284091949463, "global_step": 135502, "epoch": 3226} {"train_loss": -6.633414268493652, "global_step": 135503, "epoch": 3226} {"train_loss": -6.614130973815918, "global_step": 135504, "epoch": 3226} {"train_loss": -6.830409049987793, "global_step": 135505, "epoch": 3226} {"train_loss": -6.646979331970215, "global_step": 135506, "epoch": 3226} {"train_loss": -6.6634063720703125, "global_step": 135507, "epoch": 3226} {"train_loss": -6.646031379699707, "global_step": 135508, "epoch": 3226} {"train_loss": -6.792207717895508, "global_step": 135509, "epoch": 3226} {"train_loss": -6.7916998863220215, "global_step": 135510, "epoch": 3226} {"train_loss": -6.7649407386779785, "global_step": 135511, "epoch": 3226} {"train_loss": -6.771786689758301, "global_step": 135512, "epoch": 3226} {"train_loss": -6.890819549560547, "global_step": 135513, "epoch": 3226} {"train_loss": -6.757133483886719, "global_step": 135514, "epoch": 3226} {"train_loss": -6.719789981842041, "global_step": 135515, "epoch": 3226} {"train_loss": -6.775816917419434, "global_step": 135516, "epoch": 3226} {"train_loss": -6.733693599700928, "global_step": 135517, "epoch": 3226} {"train_loss": -6.753948211669922, "global_step": 135518, "epoch": 3226} {"train_loss": -6.771169662475586, "global_step": 135519, "epoch": 3226} {"train_loss": -6.812355041503906, "global_step": 135520, "epoch": 3226} {"train_loss": -6.823653697967529, "global_step": 135521, "epoch": 3226} {"train_loss": -6.797614097595215, "global_step": 135522, "epoch": 3226} {"train_loss": -6.702759265899658, "global_step": 135523, "epoch": 3226} {"train_loss": -6.834621429443359, "global_step": 135524, "epoch": 3226} {"train_loss": -6.685343265533447, "global_step": 135525, "epoch": 3226} {"train_loss": -6.671098709106445, "global_step": 135526, "epoch": 3226} {"train_loss": -6.69003963470459, "global_step": 135527, "epoch": 3226} {"train_loss": -6.694389343261719, "global_step": 135528, "epoch": 3226} {"train_loss": -6.560103416442871, "global_step": 135529, "epoch": 3226} {"train_loss": -6.565406799316406, "global_step": 135530, "epoch": 3226} {"train_loss": -6.6207990646362305, "global_step": 135531, "epoch": 3226} {"train_loss": -6.5595574378967285, "global_step": 135532, "epoch": 3226} {"train_loss": -6.696002074650356, "global_step": 135533, "epoch": 3226, "val_loss": 77565.8515625} {"train_loss": -6.622189521789551, "global_step": 135534, "epoch": 3227} {"train_loss": -6.622910499572754, "global_step": 135535, "epoch": 3227} {"train_loss": -6.6346821784973145, "global_step": 135536, "epoch": 3227} {"train_loss": -6.752720832824707, "global_step": 135537, "epoch": 3227} {"train_loss": -6.573163986206055, "global_step": 135538, "epoch": 3227} {"train_loss": -6.74511194229126, "global_step": 135539, "epoch": 3227} {"train_loss": -6.757683753967285, "global_step": 135540, "epoch": 3227} {"train_loss": -6.697102069854736, "global_step": 135541, "epoch": 3227} {"train_loss": -6.698474407196045, "global_step": 135542, "epoch": 3227} {"train_loss": -6.794217109680176, "global_step": 135543, "epoch": 3227} {"train_loss": -6.653048038482666, "global_step": 135544, "epoch": 3227} {"train_loss": -6.613969802856445, "global_step": 135545, "epoch": 3227} {"train_loss": -6.761876106262207, "global_step": 135546, "epoch": 3227} {"train_loss": -6.656248092651367, "global_step": 135547, "epoch": 3227} {"train_loss": -6.753678321838379, "global_step": 135548, "epoch": 3227} {"train_loss": -6.680417060852051, "global_step": 135549, "epoch": 3227} {"train_loss": -6.759858131408691, "global_step": 135550, "epoch": 3227} {"train_loss": -6.616822242736816, "global_step": 135551, "epoch": 3227} {"train_loss": -6.603693008422852, "global_step": 135552, "epoch": 3227} {"train_loss": -6.698220252990723, "global_step": 135553, "epoch": 3227} {"train_loss": -6.574883937835693, "global_step": 135554, "epoch": 3227} {"train_loss": -6.7655863761901855, "global_step": 135555, "epoch": 3227} {"train_loss": -6.621669292449951, "global_step": 135556, "epoch": 3227} {"train_loss": -6.7090606689453125, "global_step": 135557, "epoch": 3227} {"train_loss": -6.6973795890808105, "global_step": 135558, "epoch": 3227} {"train_loss": -6.59780740737915, "global_step": 135559, "epoch": 3227} {"train_loss": -6.7435407638549805, "global_step": 135560, "epoch": 3227} {"train_loss": -6.756995677947998, "global_step": 135561, "epoch": 3227} {"train_loss": -6.605027198791504, "global_step": 135562, "epoch": 3227} {"train_loss": -6.684149265289307, "global_step": 135563, "epoch": 3227} {"train_loss": -6.623085975646973, "global_step": 135564, "epoch": 3227} {"train_loss": -6.747861862182617, "global_step": 135565, "epoch": 3227} {"train_loss": -6.757134914398193, "global_step": 135566, "epoch": 3227} {"train_loss": -6.720279693603516, "global_step": 135567, "epoch": 3227} {"train_loss": -6.747958183288574, "global_step": 135568, "epoch": 3227} {"train_loss": -6.713433265686035, "global_step": 135569, "epoch": 3227} {"train_loss": -6.776523590087891, "global_step": 135570, "epoch": 3227} {"train_loss": -6.795357704162598, "global_step": 135571, "epoch": 3227} {"train_loss": -6.699609756469727, "global_step": 135572, "epoch": 3227} {"train_loss": -6.693434715270996, "global_step": 135573, "epoch": 3227} {"train_loss": -6.71697998046875, "global_step": 135574, "epoch": 3227} {"train_loss": -6.693928934278942, "global_step": 135575, "epoch": 3227, "val_loss": 77783.6484375} {"train_loss": -6.823119163513184, "global_step": 135576, "epoch": 3228} {"train_loss": -6.841670989990234, "global_step": 135577, "epoch": 3228} {"train_loss": -6.7799177169799805, "global_step": 135578, "epoch": 3228} {"train_loss": -6.83585262298584, "global_step": 135579, "epoch": 3228} {"train_loss": -6.701911926269531, "global_step": 135580, "epoch": 3228} {"train_loss": -6.7725677490234375, "global_step": 135581, "epoch": 3228} {"train_loss": -6.713461399078369, "global_step": 135582, "epoch": 3228} {"train_loss": -6.839140892028809, "global_step": 135583, "epoch": 3228} {"train_loss": -6.821331977844238, "global_step": 135584, "epoch": 3228} {"train_loss": -6.67788028717041, "global_step": 135585, "epoch": 3228} {"train_loss": -6.686969757080078, "global_step": 135586, "epoch": 3228} {"train_loss": -6.769689083099365, "global_step": 135587, "epoch": 3228} {"train_loss": -6.706425666809082, "global_step": 135588, "epoch": 3228} {"train_loss": -6.805059909820557, "global_step": 135589, "epoch": 3228} {"train_loss": -6.630374908447266, "global_step": 135590, "epoch": 3228} {"train_loss": -6.468092918395996, "global_step": 135591, "epoch": 3228} {"train_loss": -6.5881452560424805, "global_step": 135592, "epoch": 3228} {"train_loss": -6.59940767288208, "global_step": 135593, "epoch": 3228} {"train_loss": -6.592449188232422, "global_step": 135594, "epoch": 3228} {"train_loss": -6.5989837646484375, "global_step": 135595, "epoch": 3228} {"train_loss": -6.517518043518066, "global_step": 135596, "epoch": 3228} {"train_loss": -6.643311500549316, "global_step": 135597, "epoch": 3228} {"train_loss": -6.564268112182617, "global_step": 135598, "epoch": 3228} {"train_loss": -6.569143295288086, "global_step": 135599, "epoch": 3228} {"train_loss": -6.657574653625488, "global_step": 135600, "epoch": 3228} {"train_loss": -6.627543926239014, "global_step": 135601, "epoch": 3228} {"train_loss": -6.566953659057617, "global_step": 135602, "epoch": 3228} {"train_loss": -6.613001823425293, "global_step": 135603, "epoch": 3228} {"train_loss": -6.660282135009766, "global_step": 135604, "epoch": 3228} {"train_loss": -6.579263687133789, "global_step": 135605, "epoch": 3228} {"train_loss": -6.572606086730957, "global_step": 135606, "epoch": 3228} {"train_loss": -6.677124977111816, "global_step": 135607, "epoch": 3228} {"train_loss": -6.547318458557129, "global_step": 135608, "epoch": 3228} {"train_loss": -6.73672342300415, "global_step": 135609, "epoch": 3228} {"train_loss": -6.616197109222412, "global_step": 135610, "epoch": 3228} {"train_loss": -6.646928787231445, "global_step": 135611, "epoch": 3228} {"train_loss": -6.656973838806152, "global_step": 135612, "epoch": 3228} {"train_loss": -6.686106204986572, "global_step": 135613, "epoch": 3228} {"train_loss": -6.53080940246582, "global_step": 135614, "epoch": 3228} {"train_loss": -6.6133198738098145, "global_step": 135615, "epoch": 3228} {"train_loss": -6.64605712890625, "global_step": 135616, "epoch": 3228} {"train_loss": -6.663087981087821, "global_step": 135617, "epoch": 3228, "val_loss": 77819.4609375} {"train_loss": -6.631927490234375, "global_step": 135618, "epoch": 3229} {"train_loss": -6.648508071899414, "global_step": 135619, "epoch": 3229} {"train_loss": -6.792382717132568, "global_step": 135620, "epoch": 3229} {"train_loss": -6.626307487487793, "global_step": 135621, "epoch": 3229} {"train_loss": -6.7858405113220215, "global_step": 135622, "epoch": 3229} {"train_loss": -6.852632522583008, "global_step": 135623, "epoch": 3229} {"train_loss": -6.757494926452637, "global_step": 135624, "epoch": 3229} {"train_loss": -6.747567176818848, "global_step": 135625, "epoch": 3229} {"train_loss": -6.758256435394287, "global_step": 135626, "epoch": 3229} {"train_loss": -6.697026252746582, "global_step": 135627, "epoch": 3229} {"train_loss": -6.709629058837891, "global_step": 135628, "epoch": 3229} {"train_loss": -6.660926818847656, "global_step": 135629, "epoch": 3229} {"train_loss": -6.708846092224121, "global_step": 135630, "epoch": 3229} {"train_loss": -6.739940166473389, "global_step": 135631, "epoch": 3229} {"train_loss": -6.732751369476318, "global_step": 135632, "epoch": 3229} {"train_loss": -6.707753658294678, "global_step": 135633, "epoch": 3229} {"train_loss": -6.89218807220459, "global_step": 135634, "epoch": 3229} {"train_loss": -6.786008358001709, "global_step": 135635, "epoch": 3229} {"train_loss": -6.691597938537598, "global_step": 135636, "epoch": 3229} {"train_loss": -6.645833492279053, "global_step": 135637, "epoch": 3229} {"train_loss": -6.753517150878906, "global_step": 135638, "epoch": 3229} {"train_loss": -6.833346366882324, "global_step": 135639, "epoch": 3229} {"train_loss": -6.584693908691406, "global_step": 135640, "epoch": 3229} {"train_loss": -6.717353820800781, "global_step": 135641, "epoch": 3229} {"train_loss": -6.788298606872559, "global_step": 135642, "epoch": 3229} {"train_loss": -6.537832260131836, "global_step": 135643, "epoch": 3229} {"train_loss": -6.822303771972656, "global_step": 135644, "epoch": 3229} {"train_loss": -6.816066265106201, "global_step": 135645, "epoch": 3229} {"train_loss": -6.694833278656006, "global_step": 135646, "epoch": 3229} {"train_loss": -6.839843273162842, "global_step": 135647, "epoch": 3229} {"train_loss": -6.802854537963867, "global_step": 135648, "epoch": 3229} {"train_loss": -6.711274147033691, "global_step": 135649, "epoch": 3229} {"train_loss": -6.799412250518799, "global_step": 135650, "epoch": 3229} {"train_loss": -6.771595478057861, "global_step": 135651, "epoch": 3229} {"train_loss": -6.701223373413086, "global_step": 135652, "epoch": 3229} {"train_loss": -6.725521564483643, "global_step": 135653, "epoch": 3229} {"train_loss": -6.737855911254883, "global_step": 135654, "epoch": 3229} {"train_loss": -6.824624061584473, "global_step": 135655, "epoch": 3229} {"train_loss": -6.660229682922363, "global_step": 135656, "epoch": 3229} {"train_loss": -6.7442779541015625, "global_step": 135657, "epoch": 3229} {"train_loss": -6.751335144042969, "global_step": 135658, "epoch": 3229} {"train_loss": -6.738178673244658, "global_step": 135659, "epoch": 3229, "val_loss": 77854.1640625} {"train_loss": -6.759853363037109, "global_step": 135660, "epoch": 3230} {"train_loss": -6.795092582702637, "global_step": 135661, "epoch": 3230} {"train_loss": -6.767763137817383, "global_step": 135662, "epoch": 3230} {"train_loss": -6.828742027282715, "global_step": 135663, "epoch": 3230} {"train_loss": -6.814269542694092, "global_step": 135664, "epoch": 3230} {"train_loss": -6.733382225036621, "global_step": 135665, "epoch": 3230} {"train_loss": -6.768465518951416, "global_step": 135666, "epoch": 3230} {"train_loss": -6.7699875831604, "global_step": 135667, "epoch": 3230} {"train_loss": -6.786764144897461, "global_step": 135668, "epoch": 3230} {"train_loss": -6.698129653930664, "global_step": 135669, "epoch": 3230} {"train_loss": -6.7996110916137695, "global_step": 135670, "epoch": 3230} {"train_loss": -6.848126411437988, "global_step": 135671, "epoch": 3230} {"train_loss": -6.772001266479492, "global_step": 135672, "epoch": 3230} {"train_loss": -6.762324333190918, "global_step": 135673, "epoch": 3230} {"train_loss": -6.784770965576172, "global_step": 135674, "epoch": 3230} {"train_loss": -6.746506214141846, "global_step": 135675, "epoch": 3230} {"train_loss": -6.68233585357666, "global_step": 135676, "epoch": 3230} {"train_loss": -6.742293834686279, "global_step": 135677, "epoch": 3230} {"train_loss": -6.807286262512207, "global_step": 135678, "epoch": 3230} {"train_loss": -6.773166656494141, "global_step": 135679, "epoch": 3230} {"train_loss": -6.8221025466918945, "global_step": 135680, "epoch": 3230} {"train_loss": -6.699413299560547, "global_step": 135681, "epoch": 3230} {"train_loss": -6.752401351928711, "global_step": 135682, "epoch": 3230} {"train_loss": -6.7925190925598145, "global_step": 135683, "epoch": 3230} {"train_loss": -6.826715469360352, "global_step": 135684, "epoch": 3230} {"train_loss": -6.836783409118652, "global_step": 135685, "epoch": 3230} {"train_loss": -6.70469856262207, "global_step": 135686, "epoch": 3230} {"train_loss": -6.7255730628967285, "global_step": 135687, "epoch": 3230} {"train_loss": -6.756173610687256, "global_step": 135688, "epoch": 3230} {"train_loss": -6.710555076599121, "global_step": 135689, "epoch": 3230} {"train_loss": -6.7466020584106445, "global_step": 135690, "epoch": 3230} {"train_loss": -6.806422233581543, "global_step": 135691, "epoch": 3230} {"train_loss": -6.672446250915527, "global_step": 135692, "epoch": 3230} {"train_loss": -6.5745954513549805, "global_step": 135693, "epoch": 3230} {"train_loss": -6.729901313781738, "global_step": 135694, "epoch": 3230} {"train_loss": -6.654390335083008, "global_step": 135695, "epoch": 3230} {"train_loss": -6.6857805252075195, "global_step": 135696, "epoch": 3230} {"train_loss": -6.5883684158325195, "global_step": 135697, "epoch": 3230} {"train_loss": -6.647836685180664, "global_step": 135698, "epoch": 3230} {"train_loss": -6.687878608703613, "global_step": 135699, "epoch": 3230} {"train_loss": -6.748490333557129, "global_step": 135700, "epoch": 3230} {"train_loss": -6.7461704186030795, "global_step": 135701, "epoch": 3230, "val_loss": 77712.7421875} {"train_loss": -6.820842266082764, "global_step": 135702, "epoch": 3231} {"train_loss": -6.740961074829102, "global_step": 135703, "epoch": 3231} {"train_loss": -6.727209091186523, "global_step": 135704, "epoch": 3231} {"train_loss": -6.725251197814941, "global_step": 135705, "epoch": 3231} {"train_loss": -6.771966934204102, "global_step": 135706, "epoch": 3231} {"train_loss": -6.756577491760254, "global_step": 135707, "epoch": 3231} {"train_loss": -6.851645469665527, "global_step": 135708, "epoch": 3231} {"train_loss": -6.719682216644287, "global_step": 135709, "epoch": 3231} {"train_loss": -6.641587257385254, "global_step": 135710, "epoch": 3231} {"train_loss": -6.850437164306641, "global_step": 135711, "epoch": 3231} {"train_loss": -6.754905700683594, "global_step": 135712, "epoch": 3231} {"train_loss": -6.645748138427734, "global_step": 135713, "epoch": 3231} {"train_loss": -6.687570095062256, "global_step": 135714, "epoch": 3231} {"train_loss": -6.718475818634033, "global_step": 135715, "epoch": 3231} {"train_loss": -6.846586227416992, "global_step": 135716, "epoch": 3231} {"train_loss": -6.777739524841309, "global_step": 135717, "epoch": 3231} {"train_loss": -6.773135662078857, "global_step": 135718, "epoch": 3231} {"train_loss": -6.847001075744629, "global_step": 135719, "epoch": 3231} {"train_loss": -6.845186233520508, "global_step": 135720, "epoch": 3231} {"train_loss": -6.751939296722412, "global_step": 135721, "epoch": 3231} {"train_loss": -6.837528705596924, "global_step": 135722, "epoch": 3231} {"train_loss": -6.726510524749756, "global_step": 135723, "epoch": 3231} {"train_loss": -6.702220916748047, "global_step": 135724, "epoch": 3231} {"train_loss": -6.696097373962402, "global_step": 135725, "epoch": 3231} {"train_loss": -6.837252616882324, "global_step": 135726, "epoch": 3231} {"train_loss": -6.793340682983398, "global_step": 135727, "epoch": 3231} {"train_loss": -6.817563056945801, "global_step": 135728, "epoch": 3231} {"train_loss": -6.7697367668151855, "global_step": 135729, "epoch": 3231} {"train_loss": -6.738656997680664, "global_step": 135730, "epoch": 3231} {"train_loss": -6.840973377227783, "global_step": 135731, "epoch": 3231} {"train_loss": -6.5643630027771, "global_step": 135732, "epoch": 3231} {"train_loss": -6.533864974975586, "global_step": 135733, "epoch": 3231} {"train_loss": -6.679683685302734, "global_step": 135734, "epoch": 3231} {"train_loss": -6.7117767333984375, "global_step": 135735, "epoch": 3231} {"train_loss": -6.8003692626953125, "global_step": 135736, "epoch": 3231} {"train_loss": -6.747976779937744, "global_step": 135737, "epoch": 3231} {"train_loss": -6.700543403625488, "global_step": 135738, "epoch": 3231} {"train_loss": -6.74883508682251, "global_step": 135739, "epoch": 3231} {"train_loss": -6.670286178588867, "global_step": 135740, "epoch": 3231} {"train_loss": -6.670661926269531, "global_step": 135741, "epoch": 3231} {"train_loss": -6.705008506774902, "global_step": 135742, "epoch": 3231} {"train_loss": -6.741827011108398, "global_step": 135743, "epoch": 3231, "val_loss": 77626.03125} {"train_loss": -6.414155960083008, "global_step": 135744, "epoch": 3232} {"train_loss": -6.640872955322266, "global_step": 135745, "epoch": 3232} {"train_loss": -6.501377105712891, "global_step": 135746, "epoch": 3232} {"train_loss": -6.649852752685547, "global_step": 135747, "epoch": 3232} {"train_loss": -6.41956090927124, "global_step": 135748, "epoch": 3232} {"train_loss": -6.680356979370117, "global_step": 135749, "epoch": 3232} {"train_loss": -6.349529266357422, "global_step": 135750, "epoch": 3232} {"train_loss": -6.548233985900879, "global_step": 135751, "epoch": 3232} {"train_loss": -6.5302629470825195, "global_step": 135752, "epoch": 3232} {"train_loss": -6.497402191162109, "global_step": 135753, "epoch": 3232} {"train_loss": -6.513858318328857, "global_step": 135754, "epoch": 3232} {"train_loss": -6.560219764709473, "global_step": 135755, "epoch": 3232} {"train_loss": -6.518881797790527, "global_step": 135756, "epoch": 3232} {"train_loss": -6.508266448974609, "global_step": 135757, "epoch": 3232} {"train_loss": -6.523880958557129, "global_step": 135758, "epoch": 3232} {"train_loss": -6.473897457122803, "global_step": 135759, "epoch": 3232} {"train_loss": -6.428747653961182, "global_step": 135760, "epoch": 3232} {"train_loss": -6.549201011657715, "global_step": 135761, "epoch": 3232} {"train_loss": -6.58367919921875, "global_step": 135762, "epoch": 3232} {"train_loss": -6.630222797393799, "global_step": 135763, "epoch": 3232} {"train_loss": -6.483440399169922, "global_step": 135764, "epoch": 3232} {"train_loss": -6.545270919799805, "global_step": 135765, "epoch": 3232} {"train_loss": -6.575467109680176, "global_step": 135766, "epoch": 3232} {"train_loss": -6.7188262939453125, "global_step": 135767, "epoch": 3232} {"train_loss": -6.6323137283325195, "global_step": 135768, "epoch": 3232} {"train_loss": -6.551503658294678, "global_step": 135769, "epoch": 3232} {"train_loss": -6.63275146484375, "global_step": 135770, "epoch": 3232} {"train_loss": -6.698764801025391, "global_step": 135771, "epoch": 3232} {"train_loss": -6.716832160949707, "global_step": 135772, "epoch": 3232} {"train_loss": -6.693853378295898, "global_step": 135773, "epoch": 3232} {"train_loss": -6.6612372398376465, "global_step": 135774, "epoch": 3232} {"train_loss": -6.750909805297852, "global_step": 135775, "epoch": 3232} {"train_loss": -6.7841796875, "global_step": 135776, "epoch": 3232} {"train_loss": -6.816006660461426, "global_step": 135777, "epoch": 3232} {"train_loss": -6.690353870391846, "global_step": 135778, "epoch": 3232} {"train_loss": -6.806281089782715, "global_step": 135779, "epoch": 3232} {"train_loss": -6.692255020141602, "global_step": 135780, "epoch": 3232} {"train_loss": -6.729800224304199, "global_step": 135781, "epoch": 3232} {"train_loss": -6.803627967834473, "global_step": 135782, "epoch": 3232} {"train_loss": -6.6719183921813965, "global_step": 135783, "epoch": 3232} {"train_loss": -6.783745288848877, "global_step": 135784, "epoch": 3232} {"train_loss": -6.609894638969784, "global_step": 135785, "epoch": 3232, "val_loss": 77971.0390625} {"train_loss": -6.741856575012207, "global_step": 135786, "epoch": 3233} {"train_loss": -6.820426940917969, "global_step": 135787, "epoch": 3233} {"train_loss": -6.653858184814453, "global_step": 135788, "epoch": 3233} {"train_loss": -6.736056327819824, "global_step": 135789, "epoch": 3233} {"train_loss": -6.7604241371154785, "global_step": 135790, "epoch": 3233} {"train_loss": -6.758485794067383, "global_step": 135791, "epoch": 3233} {"train_loss": -6.726107597351074, "global_step": 135792, "epoch": 3233} {"train_loss": -6.8629045486450195, "global_step": 135793, "epoch": 3233} {"train_loss": -6.753978252410889, "global_step": 135794, "epoch": 3233} {"train_loss": -6.667162895202637, "global_step": 135795, "epoch": 3233} {"train_loss": -6.824884414672852, "global_step": 135796, "epoch": 3233} {"train_loss": -6.7515130043029785, "global_step": 135797, "epoch": 3233} {"train_loss": -6.6244797706604, "global_step": 135798, "epoch": 3233} {"train_loss": -6.664594650268555, "global_step": 135799, "epoch": 3233} {"train_loss": -6.835447788238525, "global_step": 135800, "epoch": 3233} {"train_loss": -6.703059196472168, "global_step": 135801, "epoch": 3233} {"train_loss": -6.720270156860352, "global_step": 135802, "epoch": 3233} {"train_loss": -6.763645648956299, "global_step": 135803, "epoch": 3233} {"train_loss": -6.747156620025635, "global_step": 135804, "epoch": 3233} {"train_loss": -6.687422275543213, "global_step": 135805, "epoch": 3233} {"train_loss": -6.759737014770508, "global_step": 135806, "epoch": 3233} {"train_loss": -6.672369003295898, "global_step": 135807, "epoch": 3233} {"train_loss": -6.768799304962158, "global_step": 135808, "epoch": 3233} {"train_loss": -6.755552291870117, "global_step": 135809, "epoch": 3233} {"train_loss": -6.614201545715332, "global_step": 135810, "epoch": 3233} {"train_loss": -6.747647762298584, "global_step": 135811, "epoch": 3233} {"train_loss": -6.664461135864258, "global_step": 135812, "epoch": 3233} {"train_loss": -6.7509331703186035, "global_step": 135813, "epoch": 3233} {"train_loss": -6.754264831542969, "global_step": 135814, "epoch": 3233} {"train_loss": -6.642298698425293, "global_step": 135815, "epoch": 3233} {"train_loss": -6.648714542388916, "global_step": 135816, "epoch": 3233} {"train_loss": -6.598264694213867, "global_step": 135817, "epoch": 3233} {"train_loss": -6.7480926513671875, "global_step": 135818, "epoch": 3233} {"train_loss": -6.706369876861572, "global_step": 135819, "epoch": 3233} {"train_loss": -6.715631484985352, "global_step": 135820, "epoch": 3233} {"train_loss": -6.708591938018799, "global_step": 135821, "epoch": 3233} {"train_loss": -6.606966972351074, "global_step": 135822, "epoch": 3233} {"train_loss": -6.682791233062744, "global_step": 135823, "epoch": 3233} {"train_loss": -6.8074631690979, "global_step": 135824, "epoch": 3233} {"train_loss": -6.61691427230835, "global_step": 135825, "epoch": 3233} {"train_loss": -6.692384719848633, "global_step": 135826, "epoch": 3233} {"train_loss": -6.7191526889801025, "global_step": 135827, "epoch": 3233, "val_loss": 77871.1875} {"train_loss": -6.744050979614258, "global_step": 135828, "epoch": 3234} {"train_loss": -6.766057014465332, "global_step": 135829, "epoch": 3234} {"train_loss": -6.7264862060546875, "global_step": 135830, "epoch": 3234} {"train_loss": -6.857668399810791, "global_step": 135831, "epoch": 3234} {"train_loss": -6.687786102294922, "global_step": 135832, "epoch": 3234} {"train_loss": -6.85033655166626, "global_step": 135833, "epoch": 3234} {"train_loss": -6.752801418304443, "global_step": 135834, "epoch": 3234} {"train_loss": -6.629136562347412, "global_step": 135835, "epoch": 3234} {"train_loss": -6.8327741622924805, "global_step": 135836, "epoch": 3234} {"train_loss": -6.842082977294922, "global_step": 135837, "epoch": 3234} {"train_loss": -6.730990886688232, "global_step": 135838, "epoch": 3234} {"train_loss": -6.767664909362793, "global_step": 135839, "epoch": 3234} {"train_loss": -6.682173728942871, "global_step": 135840, "epoch": 3234} {"train_loss": -6.852985382080078, "global_step": 135841, "epoch": 3234} {"train_loss": -6.814242362976074, "global_step": 135842, "epoch": 3234} {"train_loss": -6.826259613037109, "global_step": 135843, "epoch": 3234} {"train_loss": -6.719395637512207, "global_step": 135844, "epoch": 3234} {"train_loss": -6.7317657470703125, "global_step": 135845, "epoch": 3234} {"train_loss": -6.852458953857422, "global_step": 135846, "epoch": 3234} {"train_loss": -6.738645553588867, "global_step": 135847, "epoch": 3234} {"train_loss": -6.814620018005371, "global_step": 135848, "epoch": 3234} {"train_loss": -6.706986904144287, "global_step": 135849, "epoch": 3234} {"train_loss": -6.740979194641113, "global_step": 135850, "epoch": 3234} {"train_loss": -6.750487804412842, "global_step": 135851, "epoch": 3234} {"train_loss": -6.691009044647217, "global_step": 135852, "epoch": 3234} {"train_loss": -6.621219635009766, "global_step": 135853, "epoch": 3234} {"train_loss": -6.794088363647461, "global_step": 135854, "epoch": 3234} {"train_loss": -6.654986381530762, "global_step": 135855, "epoch": 3234} {"train_loss": -6.67544412612915, "global_step": 135856, "epoch": 3234} {"train_loss": -6.78971004486084, "global_step": 135857, "epoch": 3234} {"train_loss": -6.651454925537109, "global_step": 135858, "epoch": 3234} {"train_loss": -6.6506853103637695, "global_step": 135859, "epoch": 3234} {"train_loss": -6.714381694793701, "global_step": 135860, "epoch": 3234} {"train_loss": -6.70523738861084, "global_step": 135861, "epoch": 3234} {"train_loss": -6.691495418548584, "global_step": 135862, "epoch": 3234} {"train_loss": -6.6412739753723145, "global_step": 135863, "epoch": 3234} {"train_loss": -6.693543910980225, "global_step": 135864, "epoch": 3234} {"train_loss": -6.564731597900391, "global_step": 135865, "epoch": 3234} {"train_loss": -6.623790740966797, "global_step": 135866, "epoch": 3234} {"train_loss": -6.758476734161377, "global_step": 135867, "epoch": 3234} {"train_loss": -6.539186954498291, "global_step": 135868, "epoch": 3234} {"train_loss": -6.727992977414813, "global_step": 135869, "epoch": 3234, "val_loss": 77902.890625} {"train_loss": -6.710105895996094, "global_step": 135870, "epoch": 3235} {"train_loss": -6.706399917602539, "global_step": 135871, "epoch": 3235} {"train_loss": -6.613826751708984, "global_step": 135872, "epoch": 3235} {"train_loss": -6.678161144256592, "global_step": 135873, "epoch": 3235} {"train_loss": -6.633508682250977, "global_step": 135874, "epoch": 3235} {"train_loss": -6.63001823425293, "global_step": 135875, "epoch": 3235} {"train_loss": -6.719286918640137, "global_step": 135876, "epoch": 3235} {"train_loss": -6.694894313812256, "global_step": 135877, "epoch": 3235} {"train_loss": -6.654854774475098, "global_step": 135878, "epoch": 3235} {"train_loss": -6.672921180725098, "global_step": 135879, "epoch": 3235} {"train_loss": -6.548384666442871, "global_step": 135880, "epoch": 3235} {"train_loss": -6.773439884185791, "global_step": 135881, "epoch": 3235} {"train_loss": -6.632818222045898, "global_step": 135882, "epoch": 3235} {"train_loss": -6.6114044189453125, "global_step": 135883, "epoch": 3235} {"train_loss": -6.6082916259765625, "global_step": 135884, "epoch": 3235} {"train_loss": -6.689833164215088, "global_step": 135885, "epoch": 3235} {"train_loss": -6.620023727416992, "global_step": 135886, "epoch": 3235} {"train_loss": -6.603102207183838, "global_step": 135887, "epoch": 3235} {"train_loss": -6.676177024841309, "global_step": 135888, "epoch": 3235} {"train_loss": -6.645562171936035, "global_step": 135889, "epoch": 3235} {"train_loss": -6.453059196472168, "global_step": 135890, "epoch": 3235} {"train_loss": -6.717121601104736, "global_step": 135891, "epoch": 3235} {"train_loss": -6.7160539627075195, "global_step": 135892, "epoch": 3235} {"train_loss": -6.526729106903076, "global_step": 135893, "epoch": 3235} {"train_loss": -6.7004241943359375, "global_step": 135894, "epoch": 3235} {"train_loss": -6.56884765625, "global_step": 135895, "epoch": 3235} {"train_loss": -6.6576948165893555, "global_step": 135896, "epoch": 3235} {"train_loss": -6.692587852478027, "global_step": 135897, "epoch": 3235} {"train_loss": -6.733433723449707, "global_step": 135898, "epoch": 3235} {"train_loss": -6.493948459625244, "global_step": 135899, "epoch": 3235} {"train_loss": -6.556662082672119, "global_step": 135900, "epoch": 3235} {"train_loss": -6.720174789428711, "global_step": 135901, "epoch": 3235} {"train_loss": -6.535012722015381, "global_step": 135902, "epoch": 3235} {"train_loss": -6.61679220199585, "global_step": 135903, "epoch": 3235} {"train_loss": -6.689950942993164, "global_step": 135904, "epoch": 3235} {"train_loss": -6.712386131286621, "global_step": 135905, "epoch": 3235} {"train_loss": -6.883825302124023, "global_step": 135906, "epoch": 3235} {"train_loss": -6.691805839538574, "global_step": 135907, "epoch": 3235} {"train_loss": -6.68992805480957, "global_step": 135908, "epoch": 3235} {"train_loss": -6.806121826171875, "global_step": 135909, "epoch": 3235} {"train_loss": -6.741465091705322, "global_step": 135910, "epoch": 3235} {"train_loss": -6.6603909106481645, "global_step": 135911, "epoch": 3235, "val_loss": 77689.609375} {"train_loss": -6.693172931671143, "global_step": 135912, "epoch": 3236} {"train_loss": -6.7912750244140625, "global_step": 135913, "epoch": 3236} {"train_loss": -6.679310321807861, "global_step": 135914, "epoch": 3236} {"train_loss": -6.655254364013672, "global_step": 135915, "epoch": 3236} {"train_loss": -6.7441534996032715, "global_step": 135916, "epoch": 3236} {"train_loss": -6.716924667358398, "global_step": 135917, "epoch": 3236} {"train_loss": -6.754887580871582, "global_step": 135918, "epoch": 3236} {"train_loss": -6.829165458679199, "global_step": 135919, "epoch": 3236} {"train_loss": -6.702006816864014, "global_step": 135920, "epoch": 3236} {"train_loss": -6.827760696411133, "global_step": 135921, "epoch": 3236} {"train_loss": -6.809967994689941, "global_step": 135922, "epoch": 3236} {"train_loss": -6.693387031555176, "global_step": 135923, "epoch": 3236} {"train_loss": -6.7910661697387695, "global_step": 135924, "epoch": 3236} {"train_loss": -6.884162902832031, "global_step": 135925, "epoch": 3236} {"train_loss": -6.724515438079834, "global_step": 135926, "epoch": 3236} {"train_loss": -6.784936904907227, "global_step": 135927, "epoch": 3236} {"train_loss": -6.72200345993042, "global_step": 135928, "epoch": 3236} {"train_loss": -6.761178493499756, "global_step": 135929, "epoch": 3236} {"train_loss": -6.809345722198486, "global_step": 135930, "epoch": 3236} {"train_loss": -6.88010311126709, "global_step": 135931, "epoch": 3236} {"train_loss": -6.747128963470459, "global_step": 135932, "epoch": 3236} {"train_loss": -6.791775703430176, "global_step": 135933, "epoch": 3236} {"train_loss": -6.684321880340576, "global_step": 135934, "epoch": 3236} {"train_loss": -6.673766136169434, "global_step": 135935, "epoch": 3236} {"train_loss": -6.758774757385254, "global_step": 135936, "epoch": 3236} {"train_loss": -6.758485794067383, "global_step": 135937, "epoch": 3236} {"train_loss": -6.697112083435059, "global_step": 135938, "epoch": 3236} {"train_loss": -6.783316135406494, "global_step": 135939, "epoch": 3236} {"train_loss": -6.756831169128418, "global_step": 135940, "epoch": 3236} {"train_loss": -6.766611099243164, "global_step": 135941, "epoch": 3236} {"train_loss": -6.710205078125, "global_step": 135942, "epoch": 3236} {"train_loss": -6.761130332946777, "global_step": 135943, "epoch": 3236} {"train_loss": -6.731994152069092, "global_step": 135944, "epoch": 3236} {"train_loss": -6.741763114929199, "global_step": 135945, "epoch": 3236} {"train_loss": -6.792384624481201, "global_step": 135946, "epoch": 3236} {"train_loss": -6.794615268707275, "global_step": 135947, "epoch": 3236} {"train_loss": -6.744835376739502, "global_step": 135948, "epoch": 3236} {"train_loss": -6.722604751586914, "global_step": 135949, "epoch": 3236} {"train_loss": -6.726665496826172, "global_step": 135950, "epoch": 3236} {"train_loss": -6.707634449005127, "global_step": 135951, "epoch": 3236} {"train_loss": -6.762551307678223, "global_step": 135952, "epoch": 3236} {"train_loss": -6.7538720199040005, "global_step": 135953, "epoch": 3236, "val_loss": 77860.6796875} {"train_loss": -6.735601902008057, "global_step": 135954, "epoch": 3237} {"train_loss": -6.576000213623047, "global_step": 135955, "epoch": 3237} {"train_loss": -6.7820892333984375, "global_step": 135956, "epoch": 3237} {"train_loss": -6.773746490478516, "global_step": 135957, "epoch": 3237} {"train_loss": -6.737325668334961, "global_step": 135958, "epoch": 3237} {"train_loss": -6.7655839920043945, "global_step": 135959, "epoch": 3237} {"train_loss": -6.661698341369629, "global_step": 135960, "epoch": 3237} {"train_loss": -6.7261457443237305, "global_step": 135961, "epoch": 3237} {"train_loss": -6.735372066497803, "global_step": 135962, "epoch": 3237} {"train_loss": -6.768557548522949, "global_step": 135963, "epoch": 3237} {"train_loss": -6.857851505279541, "global_step": 135964, "epoch": 3237} {"train_loss": -6.804007530212402, "global_step": 135965, "epoch": 3237} {"train_loss": -6.796631336212158, "global_step": 135966, "epoch": 3237} {"train_loss": -6.834658145904541, "global_step": 135967, "epoch": 3237} {"train_loss": -6.907164573669434, "global_step": 135968, "epoch": 3237} {"train_loss": -6.803497314453125, "global_step": 135969, "epoch": 3237} {"train_loss": -6.737148284912109, "global_step": 135970, "epoch": 3237} {"train_loss": -6.722997188568115, "global_step": 135971, "epoch": 3237} {"train_loss": -6.771670818328857, "global_step": 135972, "epoch": 3237} {"train_loss": -6.7940168380737305, "global_step": 135973, "epoch": 3237} {"train_loss": -6.674849510192871, "global_step": 135974, "epoch": 3237} {"train_loss": -6.764276504516602, "global_step": 135975, "epoch": 3237} {"train_loss": -6.755605220794678, "global_step": 135976, "epoch": 3237} {"train_loss": -6.777250289916992, "global_step": 135977, "epoch": 3237} {"train_loss": -6.644469261169434, "global_step": 135978, "epoch": 3237} {"train_loss": -6.684252738952637, "global_step": 135979, "epoch": 3237} {"train_loss": -6.736734390258789, "global_step": 135980, "epoch": 3237} {"train_loss": -6.7332763671875, "global_step": 135981, "epoch": 3237} {"train_loss": -6.7056884765625, "global_step": 135982, "epoch": 3237} {"train_loss": -6.767505168914795, "global_step": 135983, "epoch": 3237} {"train_loss": -6.851228713989258, "global_step": 135984, "epoch": 3237} {"train_loss": -6.730982780456543, "global_step": 135985, "epoch": 3237} {"train_loss": -6.752354621887207, "global_step": 135986, "epoch": 3237} {"train_loss": -6.79936408996582, "global_step": 135987, "epoch": 3237} {"train_loss": -6.728181838989258, "global_step": 135988, "epoch": 3237} {"train_loss": -6.799909591674805, "global_step": 135989, "epoch": 3237} {"train_loss": -6.775662422180176, "global_step": 135990, "epoch": 3237} {"train_loss": -6.772256851196289, "global_step": 135991, "epoch": 3237} {"train_loss": -6.715814113616943, "global_step": 135992, "epoch": 3237} {"train_loss": -6.823080062866211, "global_step": 135993, "epoch": 3237} {"train_loss": -6.717805862426758, "global_step": 135994, "epoch": 3237} {"train_loss": -6.756938582374936, "global_step": 135995, "epoch": 3237, "val_loss": 77981.015625} {"train_loss": -6.919039726257324, "global_step": 135996, "epoch": 3238} {"train_loss": -6.717413902282715, "global_step": 135997, "epoch": 3238} {"train_loss": -6.7611083984375, "global_step": 135998, "epoch": 3238} {"train_loss": -6.791646957397461, "global_step": 135999, "epoch": 3238} {"train_loss": -6.748661994934082, "global_step": 136000, "epoch": 3238} {"train_loss": -6.716025352478027, "global_step": 136001, "epoch": 3238} {"train_loss": -6.780728340148926, "global_step": 136002, "epoch": 3238} {"train_loss": -6.687260627746582, "global_step": 136003, "epoch": 3238} {"train_loss": -6.754068374633789, "global_step": 136004, "epoch": 3238} {"train_loss": -6.76143741607666, "global_step": 136005, "epoch": 3238} {"train_loss": -6.654779434204102, "global_step": 136006, "epoch": 3238} {"train_loss": -6.840297698974609, "global_step": 136007, "epoch": 3238} {"train_loss": -6.712987899780273, "global_step": 136008, "epoch": 3238} {"train_loss": -6.764962196350098, "global_step": 136009, "epoch": 3238} {"train_loss": -6.7176361083984375, "global_step": 136010, "epoch": 3238} {"train_loss": -6.820353031158447, "global_step": 136011, "epoch": 3238} {"train_loss": -6.716442108154297, "global_step": 136012, "epoch": 3238} {"train_loss": -6.765284061431885, "global_step": 136013, "epoch": 3238} {"train_loss": -6.661418914794922, "global_step": 136014, "epoch": 3238} {"train_loss": -6.8110246658325195, "global_step": 136015, "epoch": 3238} {"train_loss": -6.605085372924805, "global_step": 136016, "epoch": 3238} {"train_loss": -6.693566799163818, "global_step": 136017, "epoch": 3238} {"train_loss": -6.563156604766846, "global_step": 136018, "epoch": 3238} {"train_loss": -6.462455749511719, "global_step": 136019, "epoch": 3238} {"train_loss": -6.7738823890686035, "global_step": 136020, "epoch": 3238} {"train_loss": -6.621175765991211, "global_step": 136021, "epoch": 3238} {"train_loss": -6.507708549499512, "global_step": 136022, "epoch": 3238} {"train_loss": -6.751348495483398, "global_step": 136023, "epoch": 3238} {"train_loss": -6.660612106323242, "global_step": 136024, "epoch": 3238} {"train_loss": -6.575458526611328, "global_step": 136025, "epoch": 3238} {"train_loss": -6.6506547927856445, "global_step": 136026, "epoch": 3238} {"train_loss": -6.5500288009643555, "global_step": 136027, "epoch": 3238} {"train_loss": -6.759208679199219, "global_step": 136028, "epoch": 3238} {"train_loss": -6.667891502380371, "global_step": 136029, "epoch": 3238} {"train_loss": -6.7377824783325195, "global_step": 136030, "epoch": 3238} {"train_loss": -6.677594184875488, "global_step": 136031, "epoch": 3238} {"train_loss": -6.665431499481201, "global_step": 136032, "epoch": 3238} {"train_loss": -6.642120361328125, "global_step": 136033, "epoch": 3238} {"train_loss": -6.681575775146484, "global_step": 136034, "epoch": 3238} {"train_loss": -6.764095306396484, "global_step": 136035, "epoch": 3238} {"train_loss": -6.542907238006592, "global_step": 136036, "epoch": 3238} {"train_loss": -6.6965590090978715, "global_step": 136037, "epoch": 3238, "val_loss": 77565.375} {"train_loss": -6.487018585205078, "global_step": 136038, "epoch": 3239} {"train_loss": -6.651008605957031, "global_step": 136039, "epoch": 3239} {"train_loss": -6.703513145446777, "global_step": 136040, "epoch": 3239} {"train_loss": -6.622681617736816, "global_step": 136041, "epoch": 3239} {"train_loss": -6.524410724639893, "global_step": 136042, "epoch": 3239} {"train_loss": -6.739739418029785, "global_step": 136043, "epoch": 3239} {"train_loss": -6.623099327087402, "global_step": 136044, "epoch": 3239} {"train_loss": -6.613494873046875, "global_step": 136045, "epoch": 3239} {"train_loss": -6.691063404083252, "global_step": 136046, "epoch": 3239} {"train_loss": -6.75209379196167, "global_step": 136047, "epoch": 3239} {"train_loss": -6.641510963439941, "global_step": 136048, "epoch": 3239} {"train_loss": -6.660782814025879, "global_step": 136049, "epoch": 3239} {"train_loss": -6.700409889221191, "global_step": 136050, "epoch": 3239} {"train_loss": -6.720361709594727, "global_step": 136051, "epoch": 3239} {"train_loss": -6.655917167663574, "global_step": 136052, "epoch": 3239} {"train_loss": -6.725729465484619, "global_step": 136053, "epoch": 3239} {"train_loss": -6.6178436279296875, "global_step": 136054, "epoch": 3239} {"train_loss": -6.642152786254883, "global_step": 136055, "epoch": 3239} {"train_loss": -6.759139060974121, "global_step": 136056, "epoch": 3239} {"train_loss": -6.720519065856934, "global_step": 136057, "epoch": 3239} {"train_loss": -6.7908430099487305, "global_step": 136058, "epoch": 3239} {"train_loss": -6.79112434387207, "global_step": 136059, "epoch": 3239} {"train_loss": -6.6656317710876465, "global_step": 136060, "epoch": 3239} {"train_loss": -6.83344030380249, "global_step": 136061, "epoch": 3239} {"train_loss": -6.813124656677246, "global_step": 136062, "epoch": 3239} {"train_loss": -6.690531253814697, "global_step": 136063, "epoch": 3239} {"train_loss": -6.765451431274414, "global_step": 136064, "epoch": 3239} {"train_loss": -6.764557838439941, "global_step": 136065, "epoch": 3239} {"train_loss": -6.791851997375488, "global_step": 136066, "epoch": 3239} {"train_loss": -6.680764198303223, "global_step": 136067, "epoch": 3239} {"train_loss": -6.670077323913574, "global_step": 136068, "epoch": 3239} {"train_loss": -6.761960983276367, "global_step": 136069, "epoch": 3239} {"train_loss": -6.807183742523193, "global_step": 136070, "epoch": 3239} {"train_loss": -6.757283687591553, "global_step": 136071, "epoch": 3239} {"train_loss": -6.7454729080200195, "global_step": 136072, "epoch": 3239} {"train_loss": -6.714240550994873, "global_step": 136073, "epoch": 3239} {"train_loss": -6.679296493530273, "global_step": 136074, "epoch": 3239} {"train_loss": -6.7032246589660645, "global_step": 136075, "epoch": 3239} {"train_loss": -6.727668762207031, "global_step": 136076, "epoch": 3239} {"train_loss": -6.747148513793945, "global_step": 136077, "epoch": 3239} {"train_loss": -6.748427391052246, "global_step": 136078, "epoch": 3239} {"train_loss": -6.706059228806269, "global_step": 136079, "epoch": 3239, "val_loss": 77710.2578125} {"train_loss": -6.667076587677002, "global_step": 136080, "epoch": 3240} {"train_loss": -6.770400524139404, "global_step": 136081, "epoch": 3240} {"train_loss": -6.5661725997924805, "global_step": 136082, "epoch": 3240} {"train_loss": -6.769704818725586, "global_step": 136083, "epoch": 3240} {"train_loss": -6.750699996948242, "global_step": 136084, "epoch": 3240} {"train_loss": -6.720965385437012, "global_step": 136085, "epoch": 3240} {"train_loss": -6.774008750915527, "global_step": 136086, "epoch": 3240} {"train_loss": -6.791776657104492, "global_step": 136087, "epoch": 3240} {"train_loss": -6.597194671630859, "global_step": 136088, "epoch": 3240} {"train_loss": -6.752049446105957, "global_step": 136089, "epoch": 3240} {"train_loss": -6.62299919128418, "global_step": 136090, "epoch": 3240} {"train_loss": -6.657463073730469, "global_step": 136091, "epoch": 3240} {"train_loss": -6.656522750854492, "global_step": 136092, "epoch": 3240} {"train_loss": -6.6615166664123535, "global_step": 136093, "epoch": 3240} {"train_loss": -6.624934196472168, "global_step": 136094, "epoch": 3240} {"train_loss": -6.769655704498291, "global_step": 136095, "epoch": 3240} {"train_loss": -6.667662620544434, "global_step": 136096, "epoch": 3240} {"train_loss": -6.6967620849609375, "global_step": 136097, "epoch": 3240} {"train_loss": -6.708987236022949, "global_step": 136098, "epoch": 3240} {"train_loss": -6.741024971008301, "global_step": 136099, "epoch": 3240} {"train_loss": -6.689632892608643, "global_step": 136100, "epoch": 3240} {"train_loss": -6.808099269866943, "global_step": 136101, "epoch": 3240} {"train_loss": -6.797893047332764, "global_step": 136102, "epoch": 3240} {"train_loss": -6.59456729888916, "global_step": 136103, "epoch": 3240} {"train_loss": -6.800090789794922, "global_step": 136104, "epoch": 3240} {"train_loss": -6.609630584716797, "global_step": 136105, "epoch": 3240} {"train_loss": -6.7864990234375, "global_step": 136106, "epoch": 3240} {"train_loss": -6.791927337646484, "global_step": 136107, "epoch": 3240} {"train_loss": -6.761453628540039, "global_step": 136108, "epoch": 3240} {"train_loss": -6.705832004547119, "global_step": 136109, "epoch": 3240} {"train_loss": -6.719834327697754, "global_step": 136110, "epoch": 3240} {"train_loss": -6.617145538330078, "global_step": 136111, "epoch": 3240} {"train_loss": -6.780834197998047, "global_step": 136112, "epoch": 3240} {"train_loss": -6.732450485229492, "global_step": 136113, "epoch": 3240} {"train_loss": -6.657278060913086, "global_step": 136114, "epoch": 3240} {"train_loss": -6.714787483215332, "global_step": 136115, "epoch": 3240} {"train_loss": -6.710073471069336, "global_step": 136116, "epoch": 3240} {"train_loss": -6.6969475746154785, "global_step": 136117, "epoch": 3240} {"train_loss": -6.750471591949463, "global_step": 136118, "epoch": 3240} {"train_loss": -6.617740631103516, "global_step": 136119, "epoch": 3240} {"train_loss": -6.751874923706055, "global_step": 136120, "epoch": 3240} {"train_loss": -6.7108475140162875, "global_step": 136121, "epoch": 3240, "val_loss": 77805.4453125} {"train_loss": -6.614484786987305, "global_step": 136122, "epoch": 3241} {"train_loss": -6.604604721069336, "global_step": 136123, "epoch": 3241} {"train_loss": -6.736001968383789, "global_step": 136124, "epoch": 3241} {"train_loss": -6.741118431091309, "global_step": 136125, "epoch": 3241} {"train_loss": -6.7045392990112305, "global_step": 136126, "epoch": 3241} {"train_loss": -6.732327938079834, "global_step": 136127, "epoch": 3241} {"train_loss": -6.649384021759033, "global_step": 136128, "epoch": 3241} {"train_loss": -6.788478851318359, "global_step": 136129, "epoch": 3241} {"train_loss": -6.741619110107422, "global_step": 136130, "epoch": 3241} {"train_loss": -6.634614944458008, "global_step": 136131, "epoch": 3241} {"train_loss": -6.831507682800293, "global_step": 136132, "epoch": 3241} {"train_loss": -6.7048749923706055, "global_step": 136133, "epoch": 3241} {"train_loss": -6.756159782409668, "global_step": 136134, "epoch": 3241} {"train_loss": -6.673081398010254, "global_step": 136135, "epoch": 3241} {"train_loss": -6.673257827758789, "global_step": 136136, "epoch": 3241} {"train_loss": -6.667034149169922, "global_step": 136137, "epoch": 3241} {"train_loss": -6.633861064910889, "global_step": 136138, "epoch": 3241} {"train_loss": -6.774570465087891, "global_step": 136139, "epoch": 3241} {"train_loss": -6.622920513153076, "global_step": 136140, "epoch": 3241} {"train_loss": -6.612425804138184, "global_step": 136141, "epoch": 3241} {"train_loss": -6.737081050872803, "global_step": 136142, "epoch": 3241} {"train_loss": -6.756624221801758, "global_step": 136143, "epoch": 3241} {"train_loss": -6.751377105712891, "global_step": 136144, "epoch": 3241} {"train_loss": -6.6512980461120605, "global_step": 136145, "epoch": 3241} {"train_loss": -6.747994422912598, "global_step": 136146, "epoch": 3241} {"train_loss": -6.856106758117676, "global_step": 136147, "epoch": 3241} {"train_loss": -6.700645923614502, "global_step": 136148, "epoch": 3241} {"train_loss": -6.693068504333496, "global_step": 136149, "epoch": 3241} {"train_loss": -6.661933422088623, "global_step": 136150, "epoch": 3241} {"train_loss": -6.6689348220825195, "global_step": 136151, "epoch": 3241} {"train_loss": -6.834362983703613, "global_step": 136152, "epoch": 3241} {"train_loss": -6.684974193572998, "global_step": 136153, "epoch": 3241} {"train_loss": -6.7547454833984375, "global_step": 136154, "epoch": 3241} {"train_loss": -6.690932273864746, "global_step": 136155, "epoch": 3241} {"train_loss": -6.741868019104004, "global_step": 136156, "epoch": 3241} {"train_loss": -6.782433032989502, "global_step": 136157, "epoch": 3241} {"train_loss": -6.577561855316162, "global_step": 136158, "epoch": 3241} {"train_loss": -6.588796615600586, "global_step": 136159, "epoch": 3241} {"train_loss": -6.724579811096191, "global_step": 136160, "epoch": 3241} {"train_loss": -6.79432487487793, "global_step": 136161, "epoch": 3241} {"train_loss": -6.7968902587890625, "global_step": 136162, "epoch": 3241} {"train_loss": -6.708116542725336, "global_step": 136163, "epoch": 3241, "val_loss": 77964.28125} {"train_loss": -6.5989789962768555, "global_step": 136164, "epoch": 3242} {"train_loss": -6.6520466804504395, "global_step": 136165, "epoch": 3242} {"train_loss": -6.818831443786621, "global_step": 136166, "epoch": 3242} {"train_loss": -6.658483505249023, "global_step": 136167, "epoch": 3242} {"train_loss": -6.7607927322387695, "global_step": 136168, "epoch": 3242} {"train_loss": -6.599575042724609, "global_step": 136169, "epoch": 3242} {"train_loss": -6.54852294921875, "global_step": 136170, "epoch": 3242} {"train_loss": -6.606575012207031, "global_step": 136171, "epoch": 3242} {"train_loss": -6.653634071350098, "global_step": 136172, "epoch": 3242} {"train_loss": -6.6167449951171875, "global_step": 136173, "epoch": 3242} {"train_loss": -6.711288928985596, "global_step": 136174, "epoch": 3242} {"train_loss": -6.574565887451172, "global_step": 136175, "epoch": 3242} {"train_loss": -6.758485794067383, "global_step": 136176, "epoch": 3242} {"train_loss": -6.869698524475098, "global_step": 136177, "epoch": 3242} {"train_loss": -6.75581693649292, "global_step": 136178, "epoch": 3242} {"train_loss": -6.842624664306641, "global_step": 136179, "epoch": 3242} {"train_loss": -6.777411937713623, "global_step": 136180, "epoch": 3242} {"train_loss": -6.847586631774902, "global_step": 136181, "epoch": 3242} {"train_loss": -6.671083927154541, "global_step": 136182, "epoch": 3242} {"train_loss": -6.6960248947143555, "global_step": 136183, "epoch": 3242} {"train_loss": -6.770232677459717, "global_step": 136184, "epoch": 3242} {"train_loss": -6.666651248931885, "global_step": 136185, "epoch": 3242} {"train_loss": -6.645938873291016, "global_step": 136186, "epoch": 3242} {"train_loss": -6.740711688995361, "global_step": 136187, "epoch": 3242} {"train_loss": -6.710841178894043, "global_step": 136188, "epoch": 3242} {"train_loss": -6.782373905181885, "global_step": 136189, "epoch": 3242} {"train_loss": -6.742365837097168, "global_step": 136190, "epoch": 3242} {"train_loss": -6.73035192489624, "global_step": 136191, "epoch": 3242} {"train_loss": -6.751699447631836, "global_step": 136192, "epoch": 3242} {"train_loss": -6.791722297668457, "global_step": 136193, "epoch": 3242} {"train_loss": -6.880076885223389, "global_step": 136194, "epoch": 3242} {"train_loss": -6.828497409820557, "global_step": 136195, "epoch": 3242} {"train_loss": -6.795274257659912, "global_step": 136196, "epoch": 3242} {"train_loss": -6.7233734130859375, "global_step": 136197, "epoch": 3242} {"train_loss": -6.776457786560059, "global_step": 136198, "epoch": 3242} {"train_loss": -6.735530853271484, "global_step": 136199, "epoch": 3242} {"train_loss": -6.7013750076293945, "global_step": 136200, "epoch": 3242} {"train_loss": -6.549288749694824, "global_step": 136201, "epoch": 3242} {"train_loss": -6.69679594039917, "global_step": 136202, "epoch": 3242} {"train_loss": -6.643211841583252, "global_step": 136203, "epoch": 3242} {"train_loss": -6.621663570404053, "global_step": 136204, "epoch": 3242} {"train_loss": -6.714160817010062, "global_step": 136205, "epoch": 3242, "val_loss": 77779.9765625} {"train_loss": -6.518811225891113, "global_step": 136206, "epoch": 3243} {"train_loss": -6.619616508483887, "global_step": 136207, "epoch": 3243} {"train_loss": -6.801538944244385, "global_step": 136208, "epoch": 3243} {"train_loss": -6.680436134338379, "global_step": 136209, "epoch": 3243} {"train_loss": -6.727518081665039, "global_step": 136210, "epoch": 3243} {"train_loss": -6.744653701782227, "global_step": 136211, "epoch": 3243} {"train_loss": -6.5837836265563965, "global_step": 136212, "epoch": 3243} {"train_loss": -6.5823187828063965, "global_step": 136213, "epoch": 3243} {"train_loss": -6.65769100189209, "global_step": 136214, "epoch": 3243} {"train_loss": -6.645538330078125, "global_step": 136215, "epoch": 3243} {"train_loss": -6.639171600341797, "global_step": 136216, "epoch": 3243} {"train_loss": -6.794412612915039, "global_step": 136217, "epoch": 3243} {"train_loss": -6.614443778991699, "global_step": 136218, "epoch": 3243} {"train_loss": -6.641237735748291, "global_step": 136219, "epoch": 3243} {"train_loss": -6.666874885559082, "global_step": 136220, "epoch": 3243} {"train_loss": -6.513965606689453, "global_step": 136221, "epoch": 3243} {"train_loss": -6.70328426361084, "global_step": 136222, "epoch": 3243} {"train_loss": -6.683791637420654, "global_step": 136223, "epoch": 3243} {"train_loss": -6.69393253326416, "global_step": 136224, "epoch": 3243} {"train_loss": -6.6241888999938965, "global_step": 136225, "epoch": 3243} {"train_loss": -6.832535266876221, "global_step": 136226, "epoch": 3243} {"train_loss": -6.585685729980469, "global_step": 136227, "epoch": 3243} {"train_loss": -6.766946315765381, "global_step": 136228, "epoch": 3243} {"train_loss": -6.738677024841309, "global_step": 136229, "epoch": 3243} {"train_loss": -6.705575942993164, "global_step": 136230, "epoch": 3243} {"train_loss": -6.807267189025879, "global_step": 136231, "epoch": 3243} {"train_loss": -6.686223030090332, "global_step": 136232, "epoch": 3243} {"train_loss": -6.613514423370361, "global_step": 136233, "epoch": 3243} {"train_loss": -6.704668998718262, "global_step": 136234, "epoch": 3243} {"train_loss": -6.771209239959717, "global_step": 136235, "epoch": 3243} {"train_loss": -6.735472679138184, "global_step": 136236, "epoch": 3243} {"train_loss": -6.730358123779297, "global_step": 136237, "epoch": 3243} {"train_loss": -6.807526588439941, "global_step": 136238, "epoch": 3243} {"train_loss": -6.654531955718994, "global_step": 136239, "epoch": 3243} {"train_loss": -6.704336166381836, "global_step": 136240, "epoch": 3243} {"train_loss": -6.605424880981445, "global_step": 136241, "epoch": 3243} {"train_loss": -6.7962846755981445, "global_step": 136242, "epoch": 3243} {"train_loss": -6.7266740798950195, "global_step": 136243, "epoch": 3243} {"train_loss": -6.6919755935668945, "global_step": 136244, "epoch": 3243} {"train_loss": -6.715310096740723, "global_step": 136245, "epoch": 3243} {"train_loss": -6.740614891052246, "global_step": 136246, "epoch": 3243} {"train_loss": -6.689148573648362, "global_step": 136247, "epoch": 3243, "val_loss": 78024.9140625} {"train_loss": -6.727842330932617, "global_step": 136248, "epoch": 3244} {"train_loss": -6.6842546463012695, "global_step": 136249, "epoch": 3244} {"train_loss": -6.795180320739746, "global_step": 136250, "epoch": 3244} {"train_loss": -6.751955032348633, "global_step": 136251, "epoch": 3244} {"train_loss": -6.722771167755127, "global_step": 136252, "epoch": 3244} {"train_loss": -6.708644390106201, "global_step": 136253, "epoch": 3244} {"train_loss": -6.599944591522217, "global_step": 136254, "epoch": 3244} {"train_loss": -6.642148494720459, "global_step": 136255, "epoch": 3244} {"train_loss": -6.716804027557373, "global_step": 136256, "epoch": 3244} {"train_loss": -6.701951026916504, "global_step": 136257, "epoch": 3244} {"train_loss": -6.6285505294799805, "global_step": 136258, "epoch": 3244} {"train_loss": -6.694051265716553, "global_step": 136259, "epoch": 3244} {"train_loss": -6.680519104003906, "global_step": 136260, "epoch": 3244} {"train_loss": -6.6242570877075195, "global_step": 136261, "epoch": 3244} {"train_loss": -6.76140022277832, "global_step": 136262, "epoch": 3244} {"train_loss": -6.655229091644287, "global_step": 136263, "epoch": 3244} {"train_loss": -6.749953269958496, "global_step": 136264, "epoch": 3244} {"train_loss": -6.689774513244629, "global_step": 136265, "epoch": 3244} {"train_loss": -6.672213554382324, "global_step": 136266, "epoch": 3244} {"train_loss": -6.635058403015137, "global_step": 136267, "epoch": 3244} {"train_loss": -6.65726375579834, "global_step": 136268, "epoch": 3244} {"train_loss": -6.848116874694824, "global_step": 136269, "epoch": 3244} {"train_loss": -6.653063774108887, "global_step": 136270, "epoch": 3244} {"train_loss": -6.7202911376953125, "global_step": 136271, "epoch": 3244} {"train_loss": -6.691999912261963, "global_step": 136272, "epoch": 3244} {"train_loss": -6.76560115814209, "global_step": 136273, "epoch": 3244} {"train_loss": -6.790555953979492, "global_step": 136274, "epoch": 3244} {"train_loss": -6.698055267333984, "global_step": 136275, "epoch": 3244} {"train_loss": -6.809679985046387, "global_step": 136276, "epoch": 3244} {"train_loss": -6.673793792724609, "global_step": 136277, "epoch": 3244} {"train_loss": -6.667311191558838, "global_step": 136278, "epoch": 3244} {"train_loss": -6.825693130493164, "global_step": 136279, "epoch": 3244} {"train_loss": -6.680977821350098, "global_step": 136280, "epoch": 3244} {"train_loss": -6.641353607177734, "global_step": 136281, "epoch": 3244} {"train_loss": -6.842131614685059, "global_step": 136282, "epoch": 3244} {"train_loss": -6.674517631530762, "global_step": 136283, "epoch": 3244} {"train_loss": -6.679355621337891, "global_step": 136284, "epoch": 3244} {"train_loss": -6.657939434051514, "global_step": 136285, "epoch": 3244} {"train_loss": -6.63778018951416, "global_step": 136286, "epoch": 3244} {"train_loss": -6.679165840148926, "global_step": 136287, "epoch": 3244} {"train_loss": -6.774941444396973, "global_step": 136288, "epoch": 3244} {"train_loss": -6.704238664536249, "global_step": 136289, "epoch": 3244, "val_loss": 77935.4609375} {"train_loss": -6.787786960601807, "global_step": 136290, "epoch": 3245} {"train_loss": -6.752684593200684, "global_step": 136291, "epoch": 3245} {"train_loss": -6.754217147827148, "global_step": 136292, "epoch": 3245} {"train_loss": -6.705679893493652, "global_step": 136293, "epoch": 3245} {"train_loss": -6.812819480895996, "global_step": 136294, "epoch": 3245} {"train_loss": -6.730573654174805, "global_step": 136295, "epoch": 3245} {"train_loss": -6.8287153244018555, "global_step": 136296, "epoch": 3245} {"train_loss": -6.7561445236206055, "global_step": 136297, "epoch": 3245} {"train_loss": -6.836555480957031, "global_step": 136298, "epoch": 3245} {"train_loss": -6.769444465637207, "global_step": 136299, "epoch": 3245} {"train_loss": -6.762547016143799, "global_step": 136300, "epoch": 3245} {"train_loss": -6.664653778076172, "global_step": 136301, "epoch": 3245} {"train_loss": -6.834773063659668, "global_step": 136302, "epoch": 3245} {"train_loss": -6.66343879699707, "global_step": 136303, "epoch": 3245} {"train_loss": -6.758980751037598, "global_step": 136304, "epoch": 3245} {"train_loss": -6.673409938812256, "global_step": 136305, "epoch": 3245} {"train_loss": -6.7821245193481445, "global_step": 136306, "epoch": 3245} {"train_loss": -6.592740058898926, "global_step": 136307, "epoch": 3245} {"train_loss": -6.7221879959106445, "global_step": 136308, "epoch": 3245} {"train_loss": -6.640633583068848, "global_step": 136309, "epoch": 3245} {"train_loss": -6.774668216705322, "global_step": 136310, "epoch": 3245} {"train_loss": -6.703465461730957, "global_step": 136311, "epoch": 3245} {"train_loss": -6.705130577087402, "global_step": 136312, "epoch": 3245} {"train_loss": -6.693573951721191, "global_step": 136313, "epoch": 3245} {"train_loss": -6.6631269454956055, "global_step": 136314, "epoch": 3245} {"train_loss": -6.590279579162598, "global_step": 136315, "epoch": 3245} {"train_loss": -6.697544097900391, "global_step": 136316, "epoch": 3245} {"train_loss": -6.66190242767334, "global_step": 136317, "epoch": 3245} {"train_loss": -6.724045753479004, "global_step": 136318, "epoch": 3245} {"train_loss": -6.826394081115723, "global_step": 136319, "epoch": 3245} {"train_loss": -6.71237850189209, "global_step": 136320, "epoch": 3245} {"train_loss": -6.655645370483398, "global_step": 136321, "epoch": 3245} {"train_loss": -6.6228132247924805, "global_step": 136322, "epoch": 3245} {"train_loss": -6.656924247741699, "global_step": 136323, "epoch": 3245} {"train_loss": -6.647229194641113, "global_step": 136324, "epoch": 3245} {"train_loss": -6.771732330322266, "global_step": 136325, "epoch": 3245} {"train_loss": -6.711657524108887, "global_step": 136326, "epoch": 3245} {"train_loss": -6.755077838897705, "global_step": 136327, "epoch": 3245} {"train_loss": -6.876018524169922, "global_step": 136328, "epoch": 3245} {"train_loss": -6.68408727645874, "global_step": 136329, "epoch": 3245} {"train_loss": -6.671316146850586, "global_step": 136330, "epoch": 3245} {"train_loss": -6.72216736702692, "global_step": 136331, "epoch": 3245, "val_loss": 77947.046875} {"train_loss": -6.791467666625977, "global_step": 136332, "epoch": 3246} {"train_loss": -6.69614315032959, "global_step": 136333, "epoch": 3246} {"train_loss": -6.688216209411621, "global_step": 136334, "epoch": 3246} {"train_loss": -6.746079444885254, "global_step": 136335, "epoch": 3246} {"train_loss": -6.793485641479492, "global_step": 136336, "epoch": 3246} {"train_loss": -6.858434677124023, "global_step": 136337, "epoch": 3246} {"train_loss": -6.8496880531311035, "global_step": 136338, "epoch": 3246} {"train_loss": -6.726907253265381, "global_step": 136339, "epoch": 3246} {"train_loss": -6.866199970245361, "global_step": 136340, "epoch": 3246} {"train_loss": -6.710324764251709, "global_step": 136341, "epoch": 3246} {"train_loss": -6.84251070022583, "global_step": 136342, "epoch": 3246} {"train_loss": -6.805947303771973, "global_step": 136343, "epoch": 3246} {"train_loss": -6.629480361938477, "global_step": 136344, "epoch": 3246} {"train_loss": -6.707464218139648, "global_step": 136345, "epoch": 3246} {"train_loss": -6.769216060638428, "global_step": 136346, "epoch": 3246} {"train_loss": -6.71544075012207, "global_step": 136347, "epoch": 3246} {"train_loss": -6.80952787399292, "global_step": 136348, "epoch": 3246} {"train_loss": -6.717226505279541, "global_step": 136349, "epoch": 3246} {"train_loss": -6.644011497497559, "global_step": 136350, "epoch": 3246} {"train_loss": -6.811284065246582, "global_step": 136351, "epoch": 3246} {"train_loss": -6.667238235473633, "global_step": 136352, "epoch": 3246} {"train_loss": -6.773778915405273, "global_step": 136353, "epoch": 3246} {"train_loss": -6.760645866394043, "global_step": 136354, "epoch": 3246} {"train_loss": -6.796778678894043, "global_step": 136355, "epoch": 3246} {"train_loss": -6.742344856262207, "global_step": 136356, "epoch": 3246} {"train_loss": -6.829276084899902, "global_step": 136357, "epoch": 3246} {"train_loss": -6.719067573547363, "global_step": 136358, "epoch": 3246} {"train_loss": -6.731949806213379, "global_step": 136359, "epoch": 3246} {"train_loss": -6.678994655609131, "global_step": 136360, "epoch": 3246} {"train_loss": -6.7784013748168945, "global_step": 136361, "epoch": 3246} {"train_loss": -6.724197864532471, "global_step": 136362, "epoch": 3246} {"train_loss": -6.675046443939209, "global_step": 136363, "epoch": 3246} {"train_loss": -6.73590087890625, "global_step": 136364, "epoch": 3246} {"train_loss": -6.6997599601745605, "global_step": 136365, "epoch": 3246} {"train_loss": -6.739688873291016, "global_step": 136366, "epoch": 3246} {"train_loss": -6.651064872741699, "global_step": 136367, "epoch": 3246} {"train_loss": -6.779120445251465, "global_step": 136368, "epoch": 3246} {"train_loss": -6.781076431274414, "global_step": 136369, "epoch": 3246} {"train_loss": -6.794182777404785, "global_step": 136370, "epoch": 3246} {"train_loss": -6.6017022132873535, "global_step": 136371, "epoch": 3246} {"train_loss": -6.710361480712891, "global_step": 136372, "epoch": 3246} {"train_loss": -6.745726233436947, "global_step": 136373, "epoch": 3246, "val_loss": 77943.1640625} {"train_loss": -6.705163955688477, "global_step": 136374, "epoch": 3247} {"train_loss": -6.7429633140563965, "global_step": 136375, "epoch": 3247} {"train_loss": -6.646857261657715, "global_step": 136376, "epoch": 3247} {"train_loss": -6.739701747894287, "global_step": 136377, "epoch": 3247} {"train_loss": -6.81431245803833, "global_step": 136378, "epoch": 3247} {"train_loss": -6.815345764160156, "global_step": 136379, "epoch": 3247} {"train_loss": -6.875263214111328, "global_step": 136380, "epoch": 3247} {"train_loss": -6.7954301834106445, "global_step": 136381, "epoch": 3247} {"train_loss": -6.665983200073242, "global_step": 136382, "epoch": 3247} {"train_loss": -6.794514179229736, "global_step": 136383, "epoch": 3247} {"train_loss": -6.653802394866943, "global_step": 136384, "epoch": 3247} {"train_loss": -6.762574195861816, "global_step": 136385, "epoch": 3247} {"train_loss": -6.835784435272217, "global_step": 136386, "epoch": 3247} {"train_loss": -6.763584136962891, "global_step": 136387, "epoch": 3247} {"train_loss": -6.68190860748291, "global_step": 136388, "epoch": 3247} {"train_loss": -6.772761344909668, "global_step": 136389, "epoch": 3247} {"train_loss": -6.709129333496094, "global_step": 136390, "epoch": 3247} {"train_loss": -6.688024997711182, "global_step": 136391, "epoch": 3247} {"train_loss": -6.796509742736816, "global_step": 136392, "epoch": 3247} {"train_loss": -6.77968692779541, "global_step": 136393, "epoch": 3247} {"train_loss": -6.677989482879639, "global_step": 136394, "epoch": 3247} {"train_loss": -6.841150283813477, "global_step": 136395, "epoch": 3247} {"train_loss": -6.696168422698975, "global_step": 136396, "epoch": 3247} {"train_loss": -6.715002059936523, "global_step": 136397, "epoch": 3247} {"train_loss": -6.644564628601074, "global_step": 136398, "epoch": 3247} {"train_loss": -6.696791648864746, "global_step": 136399, "epoch": 3247} {"train_loss": -6.718229293823242, "global_step": 136400, "epoch": 3247} {"train_loss": -6.768558502197266, "global_step": 136401, "epoch": 3247} {"train_loss": -6.669551849365234, "global_step": 136402, "epoch": 3247} {"train_loss": -6.742470741271973, "global_step": 136403, "epoch": 3247} {"train_loss": -6.741601943969727, "global_step": 136404, "epoch": 3247} {"train_loss": -6.805760860443115, "global_step": 136405, "epoch": 3247} {"train_loss": -6.787833213806152, "global_step": 136406, "epoch": 3247} {"train_loss": -6.820298671722412, "global_step": 136407, "epoch": 3247} {"train_loss": -6.662566184997559, "global_step": 136408, "epoch": 3247} {"train_loss": -6.638121128082275, "global_step": 136409, "epoch": 3247} {"train_loss": -6.842119216918945, "global_step": 136410, "epoch": 3247} {"train_loss": -6.635922908782959, "global_step": 136411, "epoch": 3247} {"train_loss": -6.82502555847168, "global_step": 136412, "epoch": 3247} {"train_loss": -6.643831253051758, "global_step": 136413, "epoch": 3247} {"train_loss": -6.705690383911133, "global_step": 136414, "epoch": 3247} {"train_loss": -6.7364900679815385, "global_step": 136415, "epoch": 3247, "val_loss": 78095.3359375} {"train_loss": -6.78674840927124, "global_step": 136416, "epoch": 3248} {"train_loss": -6.6518049240112305, "global_step": 136417, "epoch": 3248} {"train_loss": -6.833166599273682, "global_step": 136418, "epoch": 3248} {"train_loss": -6.753412246704102, "global_step": 136419, "epoch": 3248} {"train_loss": -6.7342329025268555, "global_step": 136420, "epoch": 3248} {"train_loss": -6.724872589111328, "global_step": 136421, "epoch": 3248} {"train_loss": -6.7895402908325195, "global_step": 136422, "epoch": 3248} {"train_loss": -6.717257022857666, "global_step": 136423, "epoch": 3248} {"train_loss": -6.806487560272217, "global_step": 136424, "epoch": 3248} {"train_loss": -6.791828632354736, "global_step": 136425, "epoch": 3248} {"train_loss": -6.748023986816406, "global_step": 136426, "epoch": 3248} {"train_loss": -6.759740829467773, "global_step": 136427, "epoch": 3248} {"train_loss": -6.789310455322266, "global_step": 136428, "epoch": 3248} {"train_loss": -6.754983425140381, "global_step": 136429, "epoch": 3248} {"train_loss": -6.775069236755371, "global_step": 136430, "epoch": 3248} {"train_loss": -6.6991167068481445, "global_step": 136431, "epoch": 3248} {"train_loss": -6.8323073387146, "global_step": 136432, "epoch": 3248} {"train_loss": -6.784842014312744, "global_step": 136433, "epoch": 3248} {"train_loss": -6.756908416748047, "global_step": 136434, "epoch": 3248} {"train_loss": -6.670717239379883, "global_step": 136435, "epoch": 3248} {"train_loss": -6.645471572875977, "global_step": 136436, "epoch": 3248} {"train_loss": -6.794165134429932, "global_step": 136437, "epoch": 3248} {"train_loss": -6.676779270172119, "global_step": 136438, "epoch": 3248} {"train_loss": -6.637214660644531, "global_step": 136439, "epoch": 3248} {"train_loss": -6.756840705871582, "global_step": 136440, "epoch": 3248} {"train_loss": -6.662819862365723, "global_step": 136441, "epoch": 3248} {"train_loss": -6.477704048156738, "global_step": 136442, "epoch": 3248} {"train_loss": -6.7354254722595215, "global_step": 136443, "epoch": 3248} {"train_loss": -6.728117942810059, "global_step": 136444, "epoch": 3248} {"train_loss": -6.639127731323242, "global_step": 136445, "epoch": 3248} {"train_loss": -6.671361923217773, "global_step": 136446, "epoch": 3248} {"train_loss": -6.589293956756592, "global_step": 136447, "epoch": 3248} {"train_loss": -6.630692958831787, "global_step": 136448, "epoch": 3248} {"train_loss": -6.5912065505981445, "global_step": 136449, "epoch": 3248} {"train_loss": -6.551603317260742, "global_step": 136450, "epoch": 3248} {"train_loss": -6.710277557373047, "global_step": 136451, "epoch": 3248} {"train_loss": -6.617856979370117, "global_step": 136452, "epoch": 3248} {"train_loss": -6.697226524353027, "global_step": 136453, "epoch": 3248} {"train_loss": -6.702723026275635, "global_step": 136454, "epoch": 3248} {"train_loss": -6.768935203552246, "global_step": 136455, "epoch": 3248} {"train_loss": -6.637428283691406, "global_step": 136456, "epoch": 3248} {"train_loss": -6.7104203133356, "global_step": 136457, "epoch": 3248, "val_loss": 77831.1484375} {"train_loss": -6.6034135818481445, "global_step": 136458, "epoch": 3249} {"train_loss": -6.708371162414551, "global_step": 136459, "epoch": 3249} {"train_loss": -6.652438163757324, "global_step": 136460, "epoch": 3249} {"train_loss": -6.638487815856934, "global_step": 136461, "epoch": 3249} {"train_loss": -6.586498260498047, "global_step": 136462, "epoch": 3249} {"train_loss": -6.750946044921875, "global_step": 136463, "epoch": 3249} {"train_loss": -6.642481803894043, "global_step": 136464, "epoch": 3249} {"train_loss": -6.572109222412109, "global_step": 136465, "epoch": 3249} {"train_loss": -6.562576770782471, "global_step": 136466, "epoch": 3249} {"train_loss": -6.685938835144043, "global_step": 136467, "epoch": 3249} {"train_loss": -6.594621181488037, "global_step": 136468, "epoch": 3249} {"train_loss": -6.755743026733398, "global_step": 136469, "epoch": 3249} {"train_loss": -6.720524787902832, "global_step": 136470, "epoch": 3249} {"train_loss": -6.6503119468688965, "global_step": 136471, "epoch": 3249} {"train_loss": -6.897294044494629, "global_step": 136472, "epoch": 3249} {"train_loss": -6.6229248046875, "global_step": 136473, "epoch": 3249} {"train_loss": -6.732682228088379, "global_step": 136474, "epoch": 3249} {"train_loss": -6.610616683959961, "global_step": 136475, "epoch": 3249} {"train_loss": -6.67406702041626, "global_step": 136476, "epoch": 3249} {"train_loss": -6.772350311279297, "global_step": 136477, "epoch": 3249} {"train_loss": -6.711511611938477, "global_step": 136478, "epoch": 3249} {"train_loss": -6.774774551391602, "global_step": 136479, "epoch": 3249} {"train_loss": -6.645538806915283, "global_step": 136480, "epoch": 3249} {"train_loss": -6.601156711578369, "global_step": 136481, "epoch": 3249} {"train_loss": -6.76055383682251, "global_step": 136482, "epoch": 3249} {"train_loss": -6.783533573150635, "global_step": 136483, "epoch": 3249} {"train_loss": -6.684395790100098, "global_step": 136484, "epoch": 3249} {"train_loss": -6.735658168792725, "global_step": 136485, "epoch": 3249} {"train_loss": -6.611973285675049, "global_step": 136486, "epoch": 3249} {"train_loss": -6.749143600463867, "global_step": 136487, "epoch": 3249} {"train_loss": -6.718596935272217, "global_step": 136488, "epoch": 3249} {"train_loss": -6.643301010131836, "global_step": 136489, "epoch": 3249} {"train_loss": -6.668768882751465, "global_step": 136490, "epoch": 3249} {"train_loss": -6.573397636413574, "global_step": 136491, "epoch": 3249} {"train_loss": -6.741927146911621, "global_step": 136492, "epoch": 3249} {"train_loss": -6.654711723327637, "global_step": 136493, "epoch": 3249} {"train_loss": -6.742832183837891, "global_step": 136494, "epoch": 3249} {"train_loss": -6.627979278564453, "global_step": 136495, "epoch": 3249} {"train_loss": -6.7005486488342285, "global_step": 136496, "epoch": 3249} {"train_loss": -6.6595563888549805, "global_step": 136497, "epoch": 3249} {"train_loss": -6.687190055847168, "global_step": 136498, "epoch": 3249} {"train_loss": -6.680844363712129, "global_step": 136499, "epoch": 3249, "val_loss": 77877.2109375} {"train_loss": -6.764753818511963, "global_step": 136500, "epoch": 3250} {"train_loss": -6.71377420425415, "global_step": 136501, "epoch": 3250} {"train_loss": -6.705896854400635, "global_step": 136502, "epoch": 3250} {"train_loss": -6.771211624145508, "global_step": 136503, "epoch": 3250} {"train_loss": -6.884115219116211, "global_step": 136504, "epoch": 3250} {"train_loss": -6.69703483581543, "global_step": 136505, "epoch": 3250} {"train_loss": -6.711566925048828, "global_step": 136506, "epoch": 3250} {"train_loss": -6.755940914154053, "global_step": 136507, "epoch": 3250} {"train_loss": -6.659398078918457, "global_step": 136508, "epoch": 3250} {"train_loss": -6.768336772918701, "global_step": 136509, "epoch": 3250} {"train_loss": -6.682585716247559, "global_step": 136510, "epoch": 3250} {"train_loss": -6.756130218505859, "global_step": 136511, "epoch": 3250} {"train_loss": -6.727870941162109, "global_step": 136512, "epoch": 3250} {"train_loss": -6.799460411071777, "global_step": 136513, "epoch": 3250} {"train_loss": -6.6715474128723145, "global_step": 136514, "epoch": 3250} {"train_loss": -6.650078773498535, "global_step": 136515, "epoch": 3250} {"train_loss": -6.714996337890625, "global_step": 136516, "epoch": 3250} {"train_loss": -6.774343490600586, "global_step": 136517, "epoch": 3250} {"train_loss": -6.727058410644531, "global_step": 136518, "epoch": 3250} {"train_loss": -6.7044854164123535, "global_step": 136519, "epoch": 3250} {"train_loss": -6.706865310668945, "global_step": 136520, "epoch": 3250} {"train_loss": -6.700216293334961, "global_step": 136521, "epoch": 3250} {"train_loss": -6.67707633972168, "global_step": 136522, "epoch": 3250} {"train_loss": -6.80372428894043, "global_step": 136523, "epoch": 3250} {"train_loss": -6.721164703369141, "global_step": 136524, "epoch": 3250} {"train_loss": -6.637548923492432, "global_step": 136525, "epoch": 3250} {"train_loss": -6.855843544006348, "global_step": 136526, "epoch": 3250} {"train_loss": -6.804191589355469, "global_step": 136527, "epoch": 3250} {"train_loss": -6.770206451416016, "global_step": 136528, "epoch": 3250} {"train_loss": -6.665772914886475, "global_step": 136529, "epoch": 3250} {"train_loss": -6.775263786315918, "global_step": 136530, "epoch": 3250} {"train_loss": -6.797382831573486, "global_step": 136531, "epoch": 3250} {"train_loss": -6.763808250427246, "global_step": 136532, "epoch": 3250} {"train_loss": -6.746124267578125, "global_step": 136533, "epoch": 3250} {"train_loss": -6.920352935791016, "global_step": 136534, "epoch": 3250} {"train_loss": -6.767270565032959, "global_step": 136535, "epoch": 3250} {"train_loss": -6.850796699523926, "global_step": 136536, "epoch": 3250} {"train_loss": -6.773852348327637, "global_step": 136537, "epoch": 3250} {"train_loss": -6.714278221130371, "global_step": 136538, "epoch": 3250} {"train_loss": -6.697609901428223, "global_step": 136539, "epoch": 3250} {"train_loss": -6.745908737182617, "global_step": 136540, "epoch": 3250} {"train_loss": -6.745243946711223, "global_step": 136541, "epoch": 3250, "train/sim_max_reward_0": 0.4011358218880728, "train/sim_max_reward_1": 0.8985312824088497, "train/sim_max_reward_2": 0.41494797002445394, "train/sim_max_reward_3": 0.13275448128485526, "train/sim_max_reward_4": 0.9208838237773627, "train/sim_max_reward_5": 0.5724785261152691, "test/sim_max_reward_4500000": 0.9078491752271025, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9858412971968576, "test/sim_max_reward_4500003": 0.1989040773371007, "test/sim_max_reward_4500004": 0.18582062688703263, "test/sim_max_reward_4500005": 0.17688711409318197, "test/sim_max_reward_4500006": 0.9832464813254059, "test/sim_max_reward_4500007": 0.919933876226768, "test/sim_max_reward_4500008": 0.9609605566408366, "test/sim_max_reward_4500009": 0.05347213665904676, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.997166602720924, "test/sim_max_reward_4500012": 0.8872327453615877, "test/sim_max_reward_4500013": 0.008527455640533104, "test/sim_max_reward_4500014": 0.8316469044095081, "test/sim_max_reward_4500015": 0.835786778088434, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.039551073372177045, "test/sim_max_reward_4500018": 0.9518013882575613, "test/sim_max_reward_4500019": 0.9756886773864265, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9308006480015665, "test/sim_max_reward_4500022": 0.7659368964562977, "test/sim_max_reward_4500023": 0.5277646789693283, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9150840471587443, "test/sim_max_reward_4500026": 0.6820723823055654, "test/sim_max_reward_4500027": 0.9667778849545835, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.04163460642148004, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04656241646823892, "test/sim_max_reward_4500033": 0.8254561213213276, "test/sim_max_reward_4500034": 0.9565920593518694, "test/sim_max_reward_4500035": 0.7605097844493912, "test/sim_max_reward_4500036": 0.4607129989612143, "test/sim_max_reward_4500037": 0.839467982122499, "test/sim_max_reward_4500038": 0.8967251164222921, "test/sim_max_reward_4500039": 0.7672424315250129, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.5582591503572336, "test/sim_max_reward_4500042": 0.04691175656443609, "test/sim_max_reward_4500043": 0.0, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9824887703939682, "test/sim_max_reward_4500046": 0.14365429947997868, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9524112861570235, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5567886509164772, "test/mean_score": 0.5239108710124776, "val_loss": 77812.828125} {"train_loss": -6.723865509033203, "global_step": 136542, "epoch": 3251} {"train_loss": -6.744551181793213, "global_step": 136543, "epoch": 3251} {"train_loss": -6.837377548217773, "global_step": 136544, "epoch": 3251} {"train_loss": -6.871303558349609, "global_step": 136545, "epoch": 3251} {"train_loss": -6.746528625488281, "global_step": 136546, "epoch": 3251} {"train_loss": -6.801783561706543, "global_step": 136547, "epoch": 3251} {"train_loss": -6.8434672355651855, "global_step": 136548, "epoch": 3251} {"train_loss": -6.845692157745361, "global_step": 136549, "epoch": 3251} {"train_loss": -6.776549339294434, "global_step": 136550, "epoch": 3251} {"train_loss": -6.764632701873779, "global_step": 136551, "epoch": 3251} {"train_loss": -6.74025821685791, "global_step": 136552, "epoch": 3251} {"train_loss": -6.88718843460083, "global_step": 136553, "epoch": 3251} {"train_loss": -6.666199684143066, "global_step": 136554, "epoch": 3251} {"train_loss": -6.768704891204834, "global_step": 136555, "epoch": 3251} {"train_loss": -6.645071506500244, "global_step": 136556, "epoch": 3251} {"train_loss": -6.819033145904541, "global_step": 136557, "epoch": 3251} {"train_loss": -6.781187534332275, "global_step": 136558, "epoch": 3251} {"train_loss": -6.840366363525391, "global_step": 136559, "epoch": 3251} {"train_loss": -6.7148261070251465, "global_step": 136560, "epoch": 3251} {"train_loss": -6.596433639526367, "global_step": 136561, "epoch": 3251} {"train_loss": -6.628498554229736, "global_step": 136562, "epoch": 3251} {"train_loss": -6.7567925453186035, "global_step": 136563, "epoch": 3251} {"train_loss": -6.6656036376953125, "global_step": 136564, "epoch": 3251} {"train_loss": -6.702648162841797, "global_step": 136565, "epoch": 3251} {"train_loss": -6.732840538024902, "global_step": 136566, "epoch": 3251} {"train_loss": -6.68540620803833, "global_step": 136567, "epoch": 3251} {"train_loss": -6.702613830566406, "global_step": 136568, "epoch": 3251} {"train_loss": -6.696789264678955, "global_step": 136569, "epoch": 3251} {"train_loss": -6.688807010650635, "global_step": 136570, "epoch": 3251} {"train_loss": -6.749457359313965, "global_step": 136571, "epoch": 3251} {"train_loss": -6.727373123168945, "global_step": 136572, "epoch": 3251} {"train_loss": -6.546812534332275, "global_step": 136573, "epoch": 3251} {"train_loss": -6.631494998931885, "global_step": 136574, "epoch": 3251} {"train_loss": -6.635035514831543, "global_step": 136575, "epoch": 3251} {"train_loss": -6.541367530822754, "global_step": 136576, "epoch": 3251} {"train_loss": -6.622729301452637, "global_step": 136577, "epoch": 3251} {"train_loss": -6.627356052398682, "global_step": 136578, "epoch": 3251} {"train_loss": -6.730818748474121, "global_step": 136579, "epoch": 3251} {"train_loss": -6.709591388702393, "global_step": 136580, "epoch": 3251} {"train_loss": -6.733975410461426, "global_step": 136581, "epoch": 3251} {"train_loss": -6.621617317199707, "global_step": 136582, "epoch": 3251} {"train_loss": -6.720112698418753, "global_step": 136583, "epoch": 3251, "val_loss": 77802.2890625} {"train_loss": -6.803228378295898, "global_step": 136584, "epoch": 3252} {"train_loss": -6.723232746124268, "global_step": 136585, "epoch": 3252} {"train_loss": -6.734964370727539, "global_step": 136586, "epoch": 3252} {"train_loss": -6.737870216369629, "global_step": 136587, "epoch": 3252} {"train_loss": -6.6442413330078125, "global_step": 136588, "epoch": 3252} {"train_loss": -6.740008354187012, "global_step": 136589, "epoch": 3252} {"train_loss": -6.782625675201416, "global_step": 136590, "epoch": 3252} {"train_loss": -6.8370795249938965, "global_step": 136591, "epoch": 3252} {"train_loss": -6.691039085388184, "global_step": 136592, "epoch": 3252} {"train_loss": -6.755107402801514, "global_step": 136593, "epoch": 3252} {"train_loss": -6.815494537353516, "global_step": 136594, "epoch": 3252} {"train_loss": -6.6867828369140625, "global_step": 136595, "epoch": 3252} {"train_loss": -6.721380233764648, "global_step": 136596, "epoch": 3252} {"train_loss": -6.835381507873535, "global_step": 136597, "epoch": 3252} {"train_loss": -6.769156455993652, "global_step": 136598, "epoch": 3252} {"train_loss": -6.757050514221191, "global_step": 136599, "epoch": 3252} {"train_loss": -6.702937126159668, "global_step": 136600, "epoch": 3252} {"train_loss": -6.780178546905518, "global_step": 136601, "epoch": 3252} {"train_loss": -6.712374687194824, "global_step": 136602, "epoch": 3252} {"train_loss": -6.7205328941345215, "global_step": 136603, "epoch": 3252} {"train_loss": -6.695977210998535, "global_step": 136604, "epoch": 3252} {"train_loss": -6.776547431945801, "global_step": 136605, "epoch": 3252} {"train_loss": -6.7068071365356445, "global_step": 136606, "epoch": 3252} {"train_loss": -6.66584587097168, "global_step": 136607, "epoch": 3252} {"train_loss": -6.7954583168029785, "global_step": 136608, "epoch": 3252} {"train_loss": -6.7431535720825195, "global_step": 136609, "epoch": 3252} {"train_loss": -6.674278259277344, "global_step": 136610, "epoch": 3252} {"train_loss": -6.717791557312012, "global_step": 136611, "epoch": 3252} {"train_loss": -6.772199630737305, "global_step": 136612, "epoch": 3252} {"train_loss": -6.801413536071777, "global_step": 136613, "epoch": 3252} {"train_loss": -6.678532600402832, "global_step": 136614, "epoch": 3252} {"train_loss": -6.673569679260254, "global_step": 136615, "epoch": 3252} {"train_loss": -6.747365951538086, "global_step": 136616, "epoch": 3252} {"train_loss": -6.600131034851074, "global_step": 136617, "epoch": 3252} {"train_loss": -6.747313499450684, "global_step": 136618, "epoch": 3252} {"train_loss": -6.784590721130371, "global_step": 136619, "epoch": 3252} {"train_loss": -6.688435077667236, "global_step": 136620, "epoch": 3252} {"train_loss": -6.764402866363525, "global_step": 136621, "epoch": 3252} {"train_loss": -6.6114397048950195, "global_step": 136622, "epoch": 3252} {"train_loss": -6.732567310333252, "global_step": 136623, "epoch": 3252} {"train_loss": -6.721192359924316, "global_step": 136624, "epoch": 3252} {"train_loss": -6.732041143235707, "global_step": 136625, "epoch": 3252, "val_loss": 77812.7109375} {"train_loss": -6.7180633544921875, "global_step": 136626, "epoch": 3253} {"train_loss": -6.7492852210998535, "global_step": 136627, "epoch": 3253} {"train_loss": -6.741190433502197, "global_step": 136628, "epoch": 3253} {"train_loss": -6.60203742980957, "global_step": 136629, "epoch": 3253} {"train_loss": -6.749401092529297, "global_step": 136630, "epoch": 3253} {"train_loss": -6.71771240234375, "global_step": 136631, "epoch": 3253} {"train_loss": -6.72188663482666, "global_step": 136632, "epoch": 3253} {"train_loss": -6.7719502449035645, "global_step": 136633, "epoch": 3253} {"train_loss": -6.727736949920654, "global_step": 136634, "epoch": 3253} {"train_loss": -6.737804412841797, "global_step": 136635, "epoch": 3253} {"train_loss": -6.800357818603516, "global_step": 136636, "epoch": 3253} {"train_loss": -6.686694145202637, "global_step": 136637, "epoch": 3253} {"train_loss": -6.748856067657471, "global_step": 136638, "epoch": 3253} {"train_loss": -6.7357177734375, "global_step": 136639, "epoch": 3253} {"train_loss": -6.71034574508667, "global_step": 136640, "epoch": 3253} {"train_loss": -6.625808238983154, "global_step": 136641, "epoch": 3253} {"train_loss": -6.584362030029297, "global_step": 136642, "epoch": 3253} {"train_loss": -6.695054054260254, "global_step": 136643, "epoch": 3253} {"train_loss": -6.661149024963379, "global_step": 136644, "epoch": 3253} {"train_loss": -6.533690452575684, "global_step": 136645, "epoch": 3253} {"train_loss": -6.6656646728515625, "global_step": 136646, "epoch": 3253} {"train_loss": -6.742945671081543, "global_step": 136647, "epoch": 3253} {"train_loss": -6.632604598999023, "global_step": 136648, "epoch": 3253} {"train_loss": -6.698182582855225, "global_step": 136649, "epoch": 3253} {"train_loss": -6.514310836791992, "global_step": 136650, "epoch": 3253} {"train_loss": -6.617406845092773, "global_step": 136651, "epoch": 3253} {"train_loss": -6.707001209259033, "global_step": 136652, "epoch": 3253} {"train_loss": -6.4959001541137695, "global_step": 136653, "epoch": 3253} {"train_loss": -6.674232482910156, "global_step": 136654, "epoch": 3253} {"train_loss": -6.70045280456543, "global_step": 136655, "epoch": 3253} {"train_loss": -6.692738056182861, "global_step": 136656, "epoch": 3253} {"train_loss": -6.7513933181762695, "global_step": 136657, "epoch": 3253} {"train_loss": -6.671835899353027, "global_step": 136658, "epoch": 3253} {"train_loss": -6.662186145782471, "global_step": 136659, "epoch": 3253} {"train_loss": -6.676058769226074, "global_step": 136660, "epoch": 3253} {"train_loss": -6.731856346130371, "global_step": 136661, "epoch": 3253} {"train_loss": -6.804556369781494, "global_step": 136662, "epoch": 3253} {"train_loss": -6.68113899230957, "global_step": 136663, "epoch": 3253} {"train_loss": -6.611371040344238, "global_step": 136664, "epoch": 3253} {"train_loss": -6.704644203186035, "global_step": 136665, "epoch": 3253} {"train_loss": -6.7601423263549805, "global_step": 136666, "epoch": 3253} {"train_loss": -6.689992268880208, "global_step": 136667, "epoch": 3253, "val_loss": 77809.171875} {"train_loss": -6.741809368133545, "global_step": 136668, "epoch": 3254} {"train_loss": -6.746822357177734, "global_step": 136669, "epoch": 3254} {"train_loss": -6.713558197021484, "global_step": 136670, "epoch": 3254} {"train_loss": -6.81465482711792, "global_step": 136671, "epoch": 3254} {"train_loss": -6.688262939453125, "global_step": 136672, "epoch": 3254} {"train_loss": -6.645824909210205, "global_step": 136673, "epoch": 3254} {"train_loss": -6.758342742919922, "global_step": 136674, "epoch": 3254} {"train_loss": -6.609399795532227, "global_step": 136675, "epoch": 3254} {"train_loss": -6.725767135620117, "global_step": 136676, "epoch": 3254} {"train_loss": -6.8918137550354, "global_step": 136677, "epoch": 3254} {"train_loss": -6.555044174194336, "global_step": 136678, "epoch": 3254} {"train_loss": -6.625109672546387, "global_step": 136679, "epoch": 3254} {"train_loss": -6.663704872131348, "global_step": 136680, "epoch": 3254} {"train_loss": -6.6983747482299805, "global_step": 136681, "epoch": 3254} {"train_loss": -6.7450714111328125, "global_step": 136682, "epoch": 3254} {"train_loss": -6.7910308837890625, "global_step": 136683, "epoch": 3254} {"train_loss": -6.698110103607178, "global_step": 136684, "epoch": 3254} {"train_loss": -6.727705001831055, "global_step": 136685, "epoch": 3254} {"train_loss": -6.757742881774902, "global_step": 136686, "epoch": 3254} {"train_loss": -6.631074905395508, "global_step": 136687, "epoch": 3254} {"train_loss": -6.759955883026123, "global_step": 136688, "epoch": 3254} {"train_loss": -6.763540267944336, "global_step": 136689, "epoch": 3254} {"train_loss": -6.807077407836914, "global_step": 136690, "epoch": 3254} {"train_loss": -6.877895832061768, "global_step": 136691, "epoch": 3254} {"train_loss": -6.76578426361084, "global_step": 136692, "epoch": 3254} {"train_loss": -6.827112197875977, "global_step": 136693, "epoch": 3254} {"train_loss": -6.738184452056885, "global_step": 136694, "epoch": 3254} {"train_loss": -6.768851280212402, "global_step": 136695, "epoch": 3254} {"train_loss": -6.676251411437988, "global_step": 136696, "epoch": 3254} {"train_loss": -6.833536624908447, "global_step": 136697, "epoch": 3254} {"train_loss": -6.7397966384887695, "global_step": 136698, "epoch": 3254} {"train_loss": -6.726742744445801, "global_step": 136699, "epoch": 3254} {"train_loss": -6.753952980041504, "global_step": 136700, "epoch": 3254} {"train_loss": -6.702335357666016, "global_step": 136701, "epoch": 3254} {"train_loss": -6.799882888793945, "global_step": 136702, "epoch": 3254} {"train_loss": -6.7998762130737305, "global_step": 136703, "epoch": 3254} {"train_loss": -6.7409348487854, "global_step": 136704, "epoch": 3254} {"train_loss": -6.772465705871582, "global_step": 136705, "epoch": 3254} {"train_loss": -6.819342613220215, "global_step": 136706, "epoch": 3254} {"train_loss": -6.812626838684082, "global_step": 136707, "epoch": 3254} {"train_loss": -6.654380798339844, "global_step": 136708, "epoch": 3254} {"train_loss": -6.741674741109212, "global_step": 136709, "epoch": 3254, "val_loss": 78089.328125} {"train_loss": -6.74732780456543, "global_step": 136710, "epoch": 3255} {"train_loss": -6.720873832702637, "global_step": 136711, "epoch": 3255} {"train_loss": -6.73250675201416, "global_step": 136712, "epoch": 3255} {"train_loss": -6.723269462585449, "global_step": 136713, "epoch": 3255} {"train_loss": -6.790019989013672, "global_step": 136714, "epoch": 3255} {"train_loss": -6.755792617797852, "global_step": 136715, "epoch": 3255} {"train_loss": -6.7461957931518555, "global_step": 136716, "epoch": 3255} {"train_loss": -6.760230541229248, "global_step": 136717, "epoch": 3255} {"train_loss": -6.781082630157471, "global_step": 136718, "epoch": 3255} {"train_loss": -6.734196186065674, "global_step": 136719, "epoch": 3255} {"train_loss": -6.775232315063477, "global_step": 136720, "epoch": 3255} {"train_loss": -6.681102752685547, "global_step": 136721, "epoch": 3255} {"train_loss": -6.881100654602051, "global_step": 136722, "epoch": 3255} {"train_loss": -6.7824320793151855, "global_step": 136723, "epoch": 3255} {"train_loss": -6.852410316467285, "global_step": 136724, "epoch": 3255} {"train_loss": -6.750458717346191, "global_step": 136725, "epoch": 3255} {"train_loss": -6.8291425704956055, "global_step": 136726, "epoch": 3255} {"train_loss": -6.823540210723877, "global_step": 136727, "epoch": 3255} {"train_loss": -6.7471771240234375, "global_step": 136728, "epoch": 3255} {"train_loss": -6.723293781280518, "global_step": 136729, "epoch": 3255} {"train_loss": -6.75483512878418, "global_step": 136730, "epoch": 3255} {"train_loss": -6.7921342849731445, "global_step": 136731, "epoch": 3255} {"train_loss": -6.760424613952637, "global_step": 136732, "epoch": 3255} {"train_loss": -6.775536060333252, "global_step": 136733, "epoch": 3255} {"train_loss": -6.796408653259277, "global_step": 136734, "epoch": 3255} {"train_loss": -6.712928771972656, "global_step": 136735, "epoch": 3255} {"train_loss": -6.628495693206787, "global_step": 136736, "epoch": 3255} {"train_loss": -6.679328918457031, "global_step": 136737, "epoch": 3255} {"train_loss": -6.676091194152832, "global_step": 136738, "epoch": 3255} {"train_loss": -6.736793041229248, "global_step": 136739, "epoch": 3255} {"train_loss": -6.616877555847168, "global_step": 136740, "epoch": 3255} {"train_loss": -6.674463748931885, "global_step": 136741, "epoch": 3255} {"train_loss": -6.683588027954102, "global_step": 136742, "epoch": 3255} {"train_loss": -6.759891986846924, "global_step": 136743, "epoch": 3255} {"train_loss": -6.655135154724121, "global_step": 136744, "epoch": 3255} {"train_loss": -6.81764554977417, "global_step": 136745, "epoch": 3255} {"train_loss": -6.645998001098633, "global_step": 136746, "epoch": 3255} {"train_loss": -6.736489295959473, "global_step": 136747, "epoch": 3255} {"train_loss": -6.7437052726745605, "global_step": 136748, "epoch": 3255} {"train_loss": -6.748374938964844, "global_step": 136749, "epoch": 3255} {"train_loss": -6.716220855712891, "global_step": 136750, "epoch": 3255} {"train_loss": -6.742411647524152, "global_step": 136751, "epoch": 3255, "val_loss": 77912.8359375} {"train_loss": -6.612729072570801, "global_step": 136752, "epoch": 3256} {"train_loss": -6.747074604034424, "global_step": 136753, "epoch": 3256} {"train_loss": -6.789379596710205, "global_step": 136754, "epoch": 3256} {"train_loss": -6.762555122375488, "global_step": 136755, "epoch": 3256} {"train_loss": -6.663799285888672, "global_step": 136756, "epoch": 3256} {"train_loss": -6.6860246658325195, "global_step": 136757, "epoch": 3256} {"train_loss": -6.644960403442383, "global_step": 136758, "epoch": 3256} {"train_loss": -6.683053016662598, "global_step": 136759, "epoch": 3256} {"train_loss": -6.729742050170898, "global_step": 136760, "epoch": 3256} {"train_loss": -6.646047592163086, "global_step": 136761, "epoch": 3256} {"train_loss": -6.876068115234375, "global_step": 136762, "epoch": 3256} {"train_loss": -6.6772990226745605, "global_step": 136763, "epoch": 3256} {"train_loss": -6.684477806091309, "global_step": 136764, "epoch": 3256} {"train_loss": -6.739194869995117, "global_step": 136765, "epoch": 3256} {"train_loss": -6.558938026428223, "global_step": 136766, "epoch": 3256} {"train_loss": -6.666591644287109, "global_step": 136767, "epoch": 3256} {"train_loss": -6.678897857666016, "global_step": 136768, "epoch": 3256} {"train_loss": -6.585573196411133, "global_step": 136769, "epoch": 3256} {"train_loss": -6.712069988250732, "global_step": 136770, "epoch": 3256} {"train_loss": -6.609764099121094, "global_step": 136771, "epoch": 3256} {"train_loss": -6.730776309967041, "global_step": 136772, "epoch": 3256} {"train_loss": -6.708532333374023, "global_step": 136773, "epoch": 3256} {"train_loss": -6.636959075927734, "global_step": 136774, "epoch": 3256} {"train_loss": -6.677576541900635, "global_step": 136775, "epoch": 3256} {"train_loss": -6.592052936553955, "global_step": 136776, "epoch": 3256} {"train_loss": -6.712124347686768, "global_step": 136777, "epoch": 3256} {"train_loss": -6.625450134277344, "global_step": 136778, "epoch": 3256} {"train_loss": -6.788064956665039, "global_step": 136779, "epoch": 3256} {"train_loss": -6.7685160636901855, "global_step": 136780, "epoch": 3256} {"train_loss": -6.713357448577881, "global_step": 136781, "epoch": 3256} {"train_loss": -6.7474236488342285, "global_step": 136782, "epoch": 3256} {"train_loss": -6.709536552429199, "global_step": 136783, "epoch": 3256} {"train_loss": -6.682305812835693, "global_step": 136784, "epoch": 3256} {"train_loss": -6.633023262023926, "global_step": 136785, "epoch": 3256} {"train_loss": -6.708248138427734, "global_step": 136786, "epoch": 3256} {"train_loss": -6.757653713226318, "global_step": 136787, "epoch": 3256} {"train_loss": -6.8652753829956055, "global_step": 136788, "epoch": 3256} {"train_loss": -6.740234375, "global_step": 136789, "epoch": 3256} {"train_loss": -6.8021440505981445, "global_step": 136790, "epoch": 3256} {"train_loss": -6.711864471435547, "global_step": 136791, "epoch": 3256} {"train_loss": -6.648337364196777, "global_step": 136792, "epoch": 3256} {"train_loss": -6.699055841990879, "global_step": 136793, "epoch": 3256, "val_loss": 77860.921875} {"train_loss": -6.687170505523682, "global_step": 136794, "epoch": 3257} {"train_loss": -6.834253787994385, "global_step": 136795, "epoch": 3257} {"train_loss": -6.768189430236816, "global_step": 136796, "epoch": 3257} {"train_loss": -6.664241313934326, "global_step": 136797, "epoch": 3257} {"train_loss": -6.767441749572754, "global_step": 136798, "epoch": 3257} {"train_loss": -6.787911415100098, "global_step": 136799, "epoch": 3257} {"train_loss": -6.649567604064941, "global_step": 136800, "epoch": 3257} {"train_loss": -6.73942756652832, "global_step": 136801, "epoch": 3257} {"train_loss": -6.805112838745117, "global_step": 136802, "epoch": 3257} {"train_loss": -6.667588233947754, "global_step": 136803, "epoch": 3257} {"train_loss": -6.646561145782471, "global_step": 136804, "epoch": 3257} {"train_loss": -6.59328556060791, "global_step": 136805, "epoch": 3257} {"train_loss": -6.77418327331543, "global_step": 136806, "epoch": 3257} {"train_loss": -6.634517192840576, "global_step": 136807, "epoch": 3257} {"train_loss": -6.5901408195495605, "global_step": 136808, "epoch": 3257} {"train_loss": -6.819415092468262, "global_step": 136809, "epoch": 3257} {"train_loss": -6.594104290008545, "global_step": 136810, "epoch": 3257} {"train_loss": -6.703864097595215, "global_step": 136811, "epoch": 3257} {"train_loss": -6.771258354187012, "global_step": 136812, "epoch": 3257} {"train_loss": -6.636951923370361, "global_step": 136813, "epoch": 3257} {"train_loss": -6.6103997230529785, "global_step": 136814, "epoch": 3257} {"train_loss": -6.704357624053955, "global_step": 136815, "epoch": 3257} {"train_loss": -6.744078159332275, "global_step": 136816, "epoch": 3257} {"train_loss": -6.781709671020508, "global_step": 136817, "epoch": 3257} {"train_loss": -6.7583160400390625, "global_step": 136818, "epoch": 3257} {"train_loss": -6.827732086181641, "global_step": 136819, "epoch": 3257} {"train_loss": -6.742653846740723, "global_step": 136820, "epoch": 3257} {"train_loss": -6.69307804107666, "global_step": 136821, "epoch": 3257} {"train_loss": -6.609196662902832, "global_step": 136822, "epoch": 3257} {"train_loss": -6.823065757751465, "global_step": 136823, "epoch": 3257} {"train_loss": -6.691110134124756, "global_step": 136824, "epoch": 3257} {"train_loss": -6.818573951721191, "global_step": 136825, "epoch": 3257} {"train_loss": -6.766019344329834, "global_step": 136826, "epoch": 3257} {"train_loss": -6.822164535522461, "global_step": 136827, "epoch": 3257} {"train_loss": -6.699484825134277, "global_step": 136828, "epoch": 3257} {"train_loss": -6.770749092102051, "global_step": 136829, "epoch": 3257} {"train_loss": -6.751157760620117, "global_step": 136830, "epoch": 3257} {"train_loss": -6.877274990081787, "global_step": 136831, "epoch": 3257} {"train_loss": -6.834566116333008, "global_step": 136832, "epoch": 3257} {"train_loss": -6.768883228302002, "global_step": 136833, "epoch": 3257} {"train_loss": -6.758754253387451, "global_step": 136834, "epoch": 3257} {"train_loss": -6.73213479632423, "global_step": 136835, "epoch": 3257, "val_loss": 77753.875} {"train_loss": -6.755623817443848, "global_step": 136836, "epoch": 3258} {"train_loss": -6.868963241577148, "global_step": 136837, "epoch": 3258} {"train_loss": -6.77011775970459, "global_step": 136838, "epoch": 3258} {"train_loss": -6.858856678009033, "global_step": 136839, "epoch": 3258} {"train_loss": -6.712069511413574, "global_step": 136840, "epoch": 3258} {"train_loss": -6.819511413574219, "global_step": 136841, "epoch": 3258} {"train_loss": -6.737996578216553, "global_step": 136842, "epoch": 3258} {"train_loss": -6.8308210372924805, "global_step": 136843, "epoch": 3258} {"train_loss": -6.78658390045166, "global_step": 136844, "epoch": 3258} {"train_loss": -6.7250776290893555, "global_step": 136845, "epoch": 3258} {"train_loss": -6.800841331481934, "global_step": 136846, "epoch": 3258} {"train_loss": -6.7540812492370605, "global_step": 136847, "epoch": 3258} {"train_loss": -6.782987594604492, "global_step": 136848, "epoch": 3258} {"train_loss": -6.858617782592773, "global_step": 136849, "epoch": 3258} {"train_loss": -6.693264484405518, "global_step": 136850, "epoch": 3258} {"train_loss": -6.6676836013793945, "global_step": 136851, "epoch": 3258} {"train_loss": -6.767998218536377, "global_step": 136852, "epoch": 3258} {"train_loss": -6.703530311584473, "global_step": 136853, "epoch": 3258} {"train_loss": -6.781108856201172, "global_step": 136854, "epoch": 3258} {"train_loss": -6.749133586883545, "global_step": 136855, "epoch": 3258} {"train_loss": -6.755130767822266, "global_step": 136856, "epoch": 3258} {"train_loss": -6.710013389587402, "global_step": 136857, "epoch": 3258} {"train_loss": -6.761923789978027, "global_step": 136858, "epoch": 3258} {"train_loss": -6.714687347412109, "global_step": 136859, "epoch": 3258} {"train_loss": -6.706063270568848, "global_step": 136860, "epoch": 3258} {"train_loss": -6.705499649047852, "global_step": 136861, "epoch": 3258} {"train_loss": -6.785604476928711, "global_step": 136862, "epoch": 3258} {"train_loss": -6.712523460388184, "global_step": 136863, "epoch": 3258} {"train_loss": -6.685921669006348, "global_step": 136864, "epoch": 3258} {"train_loss": -6.739049434661865, "global_step": 136865, "epoch": 3258} {"train_loss": -6.753993511199951, "global_step": 136866, "epoch": 3258} {"train_loss": -6.642187595367432, "global_step": 136867, "epoch": 3258} {"train_loss": -6.721283912658691, "global_step": 136868, "epoch": 3258} {"train_loss": -6.736982345581055, "global_step": 136869, "epoch": 3258} {"train_loss": -6.639433860778809, "global_step": 136870, "epoch": 3258} {"train_loss": -6.63851261138916, "global_step": 136871, "epoch": 3258} {"train_loss": -6.734074592590332, "global_step": 136872, "epoch": 3258} {"train_loss": -6.599522590637207, "global_step": 136873, "epoch": 3258} {"train_loss": -6.741900444030762, "global_step": 136874, "epoch": 3258} {"train_loss": -6.625311851501465, "global_step": 136875, "epoch": 3258} {"train_loss": -6.647837162017822, "global_step": 136876, "epoch": 3258} {"train_loss": -6.735544874554589, "global_step": 136877, "epoch": 3258, "val_loss": 78035.7734375} {"train_loss": -6.7154316902160645, "global_step": 136878, "epoch": 3259} {"train_loss": -6.748697757720947, "global_step": 136879, "epoch": 3259} {"train_loss": -6.646823406219482, "global_step": 136880, "epoch": 3259} {"train_loss": -6.655158996582031, "global_step": 136881, "epoch": 3259} {"train_loss": -6.5670318603515625, "global_step": 136882, "epoch": 3259} {"train_loss": -6.728343963623047, "global_step": 136883, "epoch": 3259} {"train_loss": -6.648506164550781, "global_step": 136884, "epoch": 3259} {"train_loss": -6.569620132446289, "global_step": 136885, "epoch": 3259} {"train_loss": -6.602948188781738, "global_step": 136886, "epoch": 3259} {"train_loss": -6.736456394195557, "global_step": 136887, "epoch": 3259} {"train_loss": -6.640999794006348, "global_step": 136888, "epoch": 3259} {"train_loss": -6.697628974914551, "global_step": 136889, "epoch": 3259} {"train_loss": -6.7180986404418945, "global_step": 136890, "epoch": 3259} {"train_loss": -6.669705390930176, "global_step": 136891, "epoch": 3259} {"train_loss": -6.610548973083496, "global_step": 136892, "epoch": 3259} {"train_loss": -6.689201831817627, "global_step": 136893, "epoch": 3259} {"train_loss": -6.748567581176758, "global_step": 136894, "epoch": 3259} {"train_loss": -6.697129249572754, "global_step": 136895, "epoch": 3259} {"train_loss": -6.752127647399902, "global_step": 136896, "epoch": 3259} {"train_loss": -6.783289432525635, "global_step": 136897, "epoch": 3259} {"train_loss": -6.796294212341309, "global_step": 136898, "epoch": 3259} {"train_loss": -6.829984188079834, "global_step": 136899, "epoch": 3259} {"train_loss": -6.788998603820801, "global_step": 136900, "epoch": 3259} {"train_loss": -6.715423107147217, "global_step": 136901, "epoch": 3259} {"train_loss": -6.716864585876465, "global_step": 136902, "epoch": 3259} {"train_loss": -6.669214248657227, "global_step": 136903, "epoch": 3259} {"train_loss": -6.763897895812988, "global_step": 136904, "epoch": 3259} {"train_loss": -6.737090110778809, "global_step": 136905, "epoch": 3259} {"train_loss": -6.746790885925293, "global_step": 136906, "epoch": 3259} {"train_loss": -6.787741184234619, "global_step": 136907, "epoch": 3259} {"train_loss": -6.719144344329834, "global_step": 136908, "epoch": 3259} {"train_loss": -6.753121376037598, "global_step": 136909, "epoch": 3259} {"train_loss": -6.7148518562316895, "global_step": 136910, "epoch": 3259} {"train_loss": -6.734017372131348, "global_step": 136911, "epoch": 3259} {"train_loss": -6.823254108428955, "global_step": 136912, "epoch": 3259} {"train_loss": -6.709064483642578, "global_step": 136913, "epoch": 3259} {"train_loss": -6.7029008865356445, "global_step": 136914, "epoch": 3259} {"train_loss": -6.699418544769287, "global_step": 136915, "epoch": 3259} {"train_loss": -6.784743309020996, "global_step": 136916, "epoch": 3259} {"train_loss": -6.712477684020996, "global_step": 136917, "epoch": 3259} {"train_loss": -6.750511169433594, "global_step": 136918, "epoch": 3259} {"train_loss": -6.714798643475487, "global_step": 136919, "epoch": 3259, "val_loss": 77743.1328125} {"train_loss": -6.791614532470703, "global_step": 136920, "epoch": 3260} {"train_loss": -6.67764949798584, "global_step": 136921, "epoch": 3260} {"train_loss": -6.813390254974365, "global_step": 136922, "epoch": 3260} {"train_loss": -6.725249290466309, "global_step": 136923, "epoch": 3260} {"train_loss": -6.643075466156006, "global_step": 136924, "epoch": 3260} {"train_loss": -6.834124565124512, "global_step": 136925, "epoch": 3260} {"train_loss": -6.735584259033203, "global_step": 136926, "epoch": 3260} {"train_loss": -6.786231994628906, "global_step": 136927, "epoch": 3260} {"train_loss": -6.701230049133301, "global_step": 136928, "epoch": 3260} {"train_loss": -6.766453742980957, "global_step": 136929, "epoch": 3260} {"train_loss": -6.7520341873168945, "global_step": 136930, "epoch": 3260} {"train_loss": -6.821813106536865, "global_step": 136931, "epoch": 3260} {"train_loss": -6.711980819702148, "global_step": 136932, "epoch": 3260} {"train_loss": -6.849236965179443, "global_step": 136933, "epoch": 3260} {"train_loss": -6.776386737823486, "global_step": 136934, "epoch": 3260} {"train_loss": -6.664295196533203, "global_step": 136935, "epoch": 3260} {"train_loss": -6.7187418937683105, "global_step": 136936, "epoch": 3260} {"train_loss": -6.840147495269775, "global_step": 136937, "epoch": 3260} {"train_loss": -6.797506809234619, "global_step": 136938, "epoch": 3260} {"train_loss": -6.789500713348389, "global_step": 136939, "epoch": 3260} {"train_loss": -6.800737380981445, "global_step": 136940, "epoch": 3260} {"train_loss": -6.797514915466309, "global_step": 136941, "epoch": 3260} {"train_loss": -6.669190406799316, "global_step": 136942, "epoch": 3260} {"train_loss": -6.777348518371582, "global_step": 136943, "epoch": 3260} {"train_loss": -6.824703216552734, "global_step": 136944, "epoch": 3260} {"train_loss": -6.731884956359863, "global_step": 136945, "epoch": 3260} {"train_loss": -6.706658363342285, "global_step": 136946, "epoch": 3260} {"train_loss": -6.699183464050293, "global_step": 136947, "epoch": 3260} {"train_loss": -6.74969482421875, "global_step": 136948, "epoch": 3260} {"train_loss": -6.729451656341553, "global_step": 136949, "epoch": 3260} {"train_loss": -6.6869893074035645, "global_step": 136950, "epoch": 3260} {"train_loss": -6.797831058502197, "global_step": 136951, "epoch": 3260} {"train_loss": -6.711888313293457, "global_step": 136952, "epoch": 3260} {"train_loss": -6.740537166595459, "global_step": 136953, "epoch": 3260} {"train_loss": -6.76259708404541, "global_step": 136954, "epoch": 3260} {"train_loss": -6.680421829223633, "global_step": 136955, "epoch": 3260} {"train_loss": -6.873676300048828, "global_step": 136956, "epoch": 3260} {"train_loss": -6.845091819763184, "global_step": 136957, "epoch": 3260} {"train_loss": -6.772831439971924, "global_step": 136958, "epoch": 3260} {"train_loss": -6.799519062042236, "global_step": 136959, "epoch": 3260} {"train_loss": -6.856882095336914, "global_step": 136960, "epoch": 3260} {"train_loss": -6.762110437665667, "global_step": 136961, "epoch": 3260, "val_loss": 77811.2890625} {"train_loss": -6.842066764831543, "global_step": 136962, "epoch": 3261} {"train_loss": -6.74775505065918, "global_step": 136963, "epoch": 3261} {"train_loss": -6.716150283813477, "global_step": 136964, "epoch": 3261} {"train_loss": -6.7856645584106445, "global_step": 136965, "epoch": 3261} {"train_loss": -6.7596635818481445, "global_step": 136966, "epoch": 3261} {"train_loss": -6.825592041015625, "global_step": 136967, "epoch": 3261} {"train_loss": -6.790175437927246, "global_step": 136968, "epoch": 3261} {"train_loss": -6.79644775390625, "global_step": 136969, "epoch": 3261} {"train_loss": -6.740199089050293, "global_step": 136970, "epoch": 3261} {"train_loss": -6.760919570922852, "global_step": 136971, "epoch": 3261} {"train_loss": -6.749705791473389, "global_step": 136972, "epoch": 3261} {"train_loss": -6.821131706237793, "global_step": 136973, "epoch": 3261} {"train_loss": -6.795933723449707, "global_step": 136974, "epoch": 3261} {"train_loss": -6.563076496124268, "global_step": 136975, "epoch": 3261} {"train_loss": -6.542204856872559, "global_step": 136976, "epoch": 3261} {"train_loss": -6.620288848876953, "global_step": 136977, "epoch": 3261} {"train_loss": -6.5181965827941895, "global_step": 136978, "epoch": 3261} {"train_loss": -6.431621551513672, "global_step": 136979, "epoch": 3261} {"train_loss": -6.65599250793457, "global_step": 136980, "epoch": 3261} {"train_loss": -6.57720947265625, "global_step": 136981, "epoch": 3261} {"train_loss": -6.637065410614014, "global_step": 136982, "epoch": 3261} {"train_loss": -6.607499122619629, "global_step": 136983, "epoch": 3261} {"train_loss": -6.5721435546875, "global_step": 136984, "epoch": 3261} {"train_loss": -6.656982421875, "global_step": 136985, "epoch": 3261} {"train_loss": -6.676588535308838, "global_step": 136986, "epoch": 3261} {"train_loss": -6.671107769012451, "global_step": 136987, "epoch": 3261} {"train_loss": -6.707610607147217, "global_step": 136988, "epoch": 3261} {"train_loss": -6.553251266479492, "global_step": 136989, "epoch": 3261} {"train_loss": -6.668033599853516, "global_step": 136990, "epoch": 3261} {"train_loss": -6.464687347412109, "global_step": 136991, "epoch": 3261} {"train_loss": -6.519593238830566, "global_step": 136992, "epoch": 3261} {"train_loss": -6.614384651184082, "global_step": 136993, "epoch": 3261} {"train_loss": -6.751459121704102, "global_step": 136994, "epoch": 3261} {"train_loss": -6.531335830688477, "global_step": 136995, "epoch": 3261} {"train_loss": -6.752554416656494, "global_step": 136996, "epoch": 3261} {"train_loss": -6.596672058105469, "global_step": 136997, "epoch": 3261} {"train_loss": -6.564911842346191, "global_step": 136998, "epoch": 3261} {"train_loss": -6.618966102600098, "global_step": 136999, "epoch": 3261} {"train_loss": -6.683987140655518, "global_step": 137000, "epoch": 3261} {"train_loss": -6.601123809814453, "global_step": 137001, "epoch": 3261} {"train_loss": -6.6565704345703125, "global_step": 137002, "epoch": 3261} {"train_loss": -6.661033357892718, "global_step": 137003, "epoch": 3261, "val_loss": 77952.03125} {"train_loss": -6.698422431945801, "global_step": 137004, "epoch": 3262} {"train_loss": -6.76102352142334, "global_step": 137005, "epoch": 3262} {"train_loss": -6.627598285675049, "global_step": 137006, "epoch": 3262} {"train_loss": -6.677878379821777, "global_step": 137007, "epoch": 3262} {"train_loss": -6.686586380004883, "global_step": 137008, "epoch": 3262} {"train_loss": -6.714877128601074, "global_step": 137009, "epoch": 3262} {"train_loss": -6.6746745109558105, "global_step": 137010, "epoch": 3262} {"train_loss": -6.722575664520264, "global_step": 137011, "epoch": 3262} {"train_loss": -6.705458641052246, "global_step": 137012, "epoch": 3262} {"train_loss": -6.5934929847717285, "global_step": 137013, "epoch": 3262} {"train_loss": -6.796565532684326, "global_step": 137014, "epoch": 3262} {"train_loss": -6.757726192474365, "global_step": 137015, "epoch": 3262} {"train_loss": -6.760702610015869, "global_step": 137016, "epoch": 3262} {"train_loss": -6.820859909057617, "global_step": 137017, "epoch": 3262} {"train_loss": -6.723816871643066, "global_step": 137018, "epoch": 3262} {"train_loss": -6.833187103271484, "global_step": 137019, "epoch": 3262} {"train_loss": -6.670629501342773, "global_step": 137020, "epoch": 3262} {"train_loss": -6.741625785827637, "global_step": 137021, "epoch": 3262} {"train_loss": -6.736223220825195, "global_step": 137022, "epoch": 3262} {"train_loss": -6.686959266662598, "global_step": 137023, "epoch": 3262} {"train_loss": -6.741322040557861, "global_step": 137024, "epoch": 3262} {"train_loss": -6.748749732971191, "global_step": 137025, "epoch": 3262} {"train_loss": -6.572875022888184, "global_step": 137026, "epoch": 3262} {"train_loss": -6.759731292724609, "global_step": 137027, "epoch": 3262} {"train_loss": -6.77011775970459, "global_step": 137028, "epoch": 3262} {"train_loss": -6.6351118087768555, "global_step": 137029, "epoch": 3262} {"train_loss": -6.693373680114746, "global_step": 137030, "epoch": 3262} {"train_loss": -6.706821441650391, "global_step": 137031, "epoch": 3262} {"train_loss": -6.676855087280273, "global_step": 137032, "epoch": 3262} {"train_loss": -6.6238884925842285, "global_step": 137033, "epoch": 3262} {"train_loss": -6.7701520919799805, "global_step": 137034, "epoch": 3262} {"train_loss": -6.642446994781494, "global_step": 137035, "epoch": 3262} {"train_loss": -6.751330375671387, "global_step": 137036, "epoch": 3262} {"train_loss": -6.842184543609619, "global_step": 137037, "epoch": 3262} {"train_loss": -6.5279951095581055, "global_step": 137038, "epoch": 3262} {"train_loss": -6.722006320953369, "global_step": 137039, "epoch": 3262} {"train_loss": -6.73178243637085, "global_step": 137040, "epoch": 3262} {"train_loss": -6.684237957000732, "global_step": 137041, "epoch": 3262} {"train_loss": -6.681410789489746, "global_step": 137042, "epoch": 3262} {"train_loss": -6.787734031677246, "global_step": 137043, "epoch": 3262} {"train_loss": -6.825197696685791, "global_step": 137044, "epoch": 3262} {"train_loss": -6.714822610219319, "global_step": 137045, "epoch": 3262, "val_loss": 77896.484375} {"train_loss": -6.8677897453308105, "global_step": 137046, "epoch": 3263} {"train_loss": -6.662497520446777, "global_step": 137047, "epoch": 3263} {"train_loss": -6.879992485046387, "global_step": 137048, "epoch": 3263} {"train_loss": -6.780976295471191, "global_step": 137049, "epoch": 3263} {"train_loss": -6.79947566986084, "global_step": 137050, "epoch": 3263} {"train_loss": -6.626879692077637, "global_step": 137051, "epoch": 3263} {"train_loss": -6.787344932556152, "global_step": 137052, "epoch": 3263} {"train_loss": -6.723113059997559, "global_step": 137053, "epoch": 3263} {"train_loss": -6.693955421447754, "global_step": 137054, "epoch": 3263} {"train_loss": -6.610263347625732, "global_step": 137055, "epoch": 3263} {"train_loss": -6.682608604431152, "global_step": 137056, "epoch": 3263} {"train_loss": -6.650561809539795, "global_step": 137057, "epoch": 3263} {"train_loss": -6.645739555358887, "global_step": 137058, "epoch": 3263} {"train_loss": -6.781244277954102, "global_step": 137059, "epoch": 3263} {"train_loss": -6.6378302574157715, "global_step": 137060, "epoch": 3263} {"train_loss": -6.658963203430176, "global_step": 137061, "epoch": 3263} {"train_loss": -6.791187286376953, "global_step": 137062, "epoch": 3263} {"train_loss": -6.595104217529297, "global_step": 137063, "epoch": 3263} {"train_loss": -6.589933395385742, "global_step": 137064, "epoch": 3263} {"train_loss": -6.770997047424316, "global_step": 137065, "epoch": 3263} {"train_loss": -6.686749458312988, "global_step": 137066, "epoch": 3263} {"train_loss": -6.755014896392822, "global_step": 137067, "epoch": 3263} {"train_loss": -6.707582473754883, "global_step": 137068, "epoch": 3263} {"train_loss": -6.775879859924316, "global_step": 137069, "epoch": 3263} {"train_loss": -6.590751647949219, "global_step": 137070, "epoch": 3263} {"train_loss": -6.688956260681152, "global_step": 137071, "epoch": 3263} {"train_loss": -6.695098876953125, "global_step": 137072, "epoch": 3263} {"train_loss": -6.753237724304199, "global_step": 137073, "epoch": 3263} {"train_loss": -6.678638935089111, "global_step": 137074, "epoch": 3263} {"train_loss": -6.7124433517456055, "global_step": 137075, "epoch": 3263} {"train_loss": -6.678776741027832, "global_step": 137076, "epoch": 3263} {"train_loss": -6.701286792755127, "global_step": 137077, "epoch": 3263} {"train_loss": -6.654280662536621, "global_step": 137078, "epoch": 3263} {"train_loss": -6.684073448181152, "global_step": 137079, "epoch": 3263} {"train_loss": -6.6186442375183105, "global_step": 137080, "epoch": 3263} {"train_loss": -6.674630165100098, "global_step": 137081, "epoch": 3263} {"train_loss": -6.827065467834473, "global_step": 137082, "epoch": 3263} {"train_loss": -6.625901222229004, "global_step": 137083, "epoch": 3263} {"train_loss": -6.735756874084473, "global_step": 137084, "epoch": 3263} {"train_loss": -6.778079032897949, "global_step": 137085, "epoch": 3263} {"train_loss": -6.612346649169922, "global_step": 137086, "epoch": 3263} {"train_loss": -6.70567512512207, "global_step": 137087, "epoch": 3263, "val_loss": 77889.609375} {"train_loss": -6.745878219604492, "global_step": 137088, "epoch": 3264} {"train_loss": -6.602791786193848, "global_step": 137089, "epoch": 3264} {"train_loss": -6.69281005859375, "global_step": 137090, "epoch": 3264} {"train_loss": -6.657156944274902, "global_step": 137091, "epoch": 3264} {"train_loss": -6.692071914672852, "global_step": 137092, "epoch": 3264} {"train_loss": -6.7541069984436035, "global_step": 137093, "epoch": 3264} {"train_loss": -6.732636451721191, "global_step": 137094, "epoch": 3264} {"train_loss": -6.75676155090332, "global_step": 137095, "epoch": 3264} {"train_loss": -6.7668137550354, "global_step": 137096, "epoch": 3264} {"train_loss": -6.6745734214782715, "global_step": 137097, "epoch": 3264} {"train_loss": -6.721811294555664, "global_step": 137098, "epoch": 3264} {"train_loss": -6.830622673034668, "global_step": 137099, "epoch": 3264} {"train_loss": -6.684152603149414, "global_step": 137100, "epoch": 3264} {"train_loss": -6.813223838806152, "global_step": 137101, "epoch": 3264} {"train_loss": -6.873311996459961, "global_step": 137102, "epoch": 3264} {"train_loss": -6.6987690925598145, "global_step": 137103, "epoch": 3264} {"train_loss": -6.802974700927734, "global_step": 137104, "epoch": 3264} {"train_loss": -6.720193862915039, "global_step": 137105, "epoch": 3264} {"train_loss": -6.785068511962891, "global_step": 137106, "epoch": 3264} {"train_loss": -6.799074649810791, "global_step": 137107, "epoch": 3264} {"train_loss": -6.7776641845703125, "global_step": 137108, "epoch": 3264} {"train_loss": -6.929543972015381, "global_step": 137109, "epoch": 3264} {"train_loss": -6.784468650817871, "global_step": 137110, "epoch": 3264} {"train_loss": -6.713023662567139, "global_step": 137111, "epoch": 3264} {"train_loss": -6.866080284118652, "global_step": 137112, "epoch": 3264} {"train_loss": -6.788358688354492, "global_step": 137113, "epoch": 3264} {"train_loss": -6.739015579223633, "global_step": 137114, "epoch": 3264} {"train_loss": -6.794576644897461, "global_step": 137115, "epoch": 3264} {"train_loss": -6.608333110809326, "global_step": 137116, "epoch": 3264} {"train_loss": -6.7281270027160645, "global_step": 137117, "epoch": 3264} {"train_loss": -6.783908843994141, "global_step": 137118, "epoch": 3264} {"train_loss": -6.770755290985107, "global_step": 137119, "epoch": 3264} {"train_loss": -6.768326759338379, "global_step": 137120, "epoch": 3264} {"train_loss": -6.756674766540527, "global_step": 137121, "epoch": 3264} {"train_loss": -6.715837478637695, "global_step": 137122, "epoch": 3264} {"train_loss": -6.7594709396362305, "global_step": 137123, "epoch": 3264} {"train_loss": -6.799304008483887, "global_step": 137124, "epoch": 3264} {"train_loss": -6.763432025909424, "global_step": 137125, "epoch": 3264} {"train_loss": -6.75026798248291, "global_step": 137126, "epoch": 3264} {"train_loss": -6.684593677520752, "global_step": 137127, "epoch": 3264} {"train_loss": -6.682497024536133, "global_step": 137128, "epoch": 3264} {"train_loss": -6.749533517020089, "global_step": 137129, "epoch": 3264, "val_loss": 77727.4453125} {"train_loss": -6.879364967346191, "global_step": 137130, "epoch": 3265} {"train_loss": -6.760284900665283, "global_step": 137131, "epoch": 3265} {"train_loss": -6.756308555603027, "global_step": 137132, "epoch": 3265} {"train_loss": -6.815092086791992, "global_step": 137133, "epoch": 3265} {"train_loss": -6.8101348876953125, "global_step": 137134, "epoch": 3265} {"train_loss": -6.804129123687744, "global_step": 137135, "epoch": 3265} {"train_loss": -6.7379913330078125, "global_step": 137136, "epoch": 3265} {"train_loss": -6.659156799316406, "global_step": 137137, "epoch": 3265} {"train_loss": -6.77230978012085, "global_step": 137138, "epoch": 3265} {"train_loss": -6.835366249084473, "global_step": 137139, "epoch": 3265} {"train_loss": -6.744613170623779, "global_step": 137140, "epoch": 3265} {"train_loss": -6.596035003662109, "global_step": 137141, "epoch": 3265} {"train_loss": -6.736185550689697, "global_step": 137142, "epoch": 3265} {"train_loss": -6.695411682128906, "global_step": 137143, "epoch": 3265} {"train_loss": -6.635411739349365, "global_step": 137144, "epoch": 3265} {"train_loss": -6.785447597503662, "global_step": 137145, "epoch": 3265} {"train_loss": -6.618141174316406, "global_step": 137146, "epoch": 3265} {"train_loss": -6.651411533355713, "global_step": 137147, "epoch": 3265} {"train_loss": -6.587963581085205, "global_step": 137148, "epoch": 3265} {"train_loss": -6.633623123168945, "global_step": 137149, "epoch": 3265} {"train_loss": -6.689410209655762, "global_step": 137150, "epoch": 3265} {"train_loss": -6.68930721282959, "global_step": 137151, "epoch": 3265} {"train_loss": -6.8220930099487305, "global_step": 137152, "epoch": 3265} {"train_loss": -6.683375835418701, "global_step": 137153, "epoch": 3265} {"train_loss": -6.687694549560547, "global_step": 137154, "epoch": 3265} {"train_loss": -6.709864139556885, "global_step": 137155, "epoch": 3265} {"train_loss": -6.630492210388184, "global_step": 137156, "epoch": 3265} {"train_loss": -6.632508277893066, "global_step": 137157, "epoch": 3265} {"train_loss": -6.712913990020752, "global_step": 137158, "epoch": 3265} {"train_loss": -6.777439594268799, "global_step": 137159, "epoch": 3265} {"train_loss": -6.627264976501465, "global_step": 137160, "epoch": 3265} {"train_loss": -6.7627763748168945, "global_step": 137161, "epoch": 3265} {"train_loss": -6.719624996185303, "global_step": 137162, "epoch": 3265} {"train_loss": -6.733067035675049, "global_step": 137163, "epoch": 3265} {"train_loss": -6.753620147705078, "global_step": 137164, "epoch": 3265} {"train_loss": -6.748537063598633, "global_step": 137165, "epoch": 3265} {"train_loss": -6.7669477462768555, "global_step": 137166, "epoch": 3265} {"train_loss": -6.861563205718994, "global_step": 137167, "epoch": 3265} {"train_loss": -6.648408889770508, "global_step": 137168, "epoch": 3265} {"train_loss": -6.697903633117676, "global_step": 137169, "epoch": 3265} {"train_loss": -6.664760589599609, "global_step": 137170, "epoch": 3265} {"train_loss": -6.71974641936166, "global_step": 137171, "epoch": 3265, "val_loss": 77897.125} {"train_loss": -6.712621688842773, "global_step": 137172, "epoch": 3266} {"train_loss": -6.722872734069824, "global_step": 137173, "epoch": 3266} {"train_loss": -6.630393028259277, "global_step": 137174, "epoch": 3266} {"train_loss": -6.673731327056885, "global_step": 137175, "epoch": 3266} {"train_loss": -6.6758246421813965, "global_step": 137176, "epoch": 3266} {"train_loss": -6.735757827758789, "global_step": 137177, "epoch": 3266} {"train_loss": -6.7899250984191895, "global_step": 137178, "epoch": 3266} {"train_loss": -6.753780841827393, "global_step": 137179, "epoch": 3266} {"train_loss": -6.828482627868652, "global_step": 137180, "epoch": 3266} {"train_loss": -6.875572681427002, "global_step": 137181, "epoch": 3266} {"train_loss": -6.712880611419678, "global_step": 137182, "epoch": 3266} {"train_loss": -6.764869689941406, "global_step": 137183, "epoch": 3266} {"train_loss": -6.804263114929199, "global_step": 137184, "epoch": 3266} {"train_loss": -6.674271583557129, "global_step": 137185, "epoch": 3266} {"train_loss": -6.696255683898926, "global_step": 137186, "epoch": 3266} {"train_loss": -6.8114824295043945, "global_step": 137187, "epoch": 3266} {"train_loss": -6.810256004333496, "global_step": 137188, "epoch": 3266} {"train_loss": -6.698752403259277, "global_step": 137189, "epoch": 3266} {"train_loss": -6.78434419631958, "global_step": 137190, "epoch": 3266} {"train_loss": -6.721467018127441, "global_step": 137191, "epoch": 3266} {"train_loss": -6.755119323730469, "global_step": 137192, "epoch": 3266} {"train_loss": -6.696681976318359, "global_step": 137193, "epoch": 3266} {"train_loss": -6.757101535797119, "global_step": 137194, "epoch": 3266} {"train_loss": -6.770562171936035, "global_step": 137195, "epoch": 3266} {"train_loss": -6.734277248382568, "global_step": 137196, "epoch": 3266} {"train_loss": -6.667984485626221, "global_step": 137197, "epoch": 3266} {"train_loss": -6.746613502502441, "global_step": 137198, "epoch": 3266} {"train_loss": -6.631299018859863, "global_step": 137199, "epoch": 3266} {"train_loss": -6.6617937088012695, "global_step": 137200, "epoch": 3266} {"train_loss": -6.586259841918945, "global_step": 137201, "epoch": 3266} {"train_loss": -6.704326629638672, "global_step": 137202, "epoch": 3266} {"train_loss": -6.573677062988281, "global_step": 137203, "epoch": 3266} {"train_loss": -6.626568794250488, "global_step": 137204, "epoch": 3266} {"train_loss": -6.619230270385742, "global_step": 137205, "epoch": 3266} {"train_loss": -6.5051140785217285, "global_step": 137206, "epoch": 3266} {"train_loss": -6.650189399719238, "global_step": 137207, "epoch": 3266} {"train_loss": -6.6989593505859375, "global_step": 137208, "epoch": 3266} {"train_loss": -6.644927978515625, "global_step": 137209, "epoch": 3266} {"train_loss": -6.712587356567383, "global_step": 137210, "epoch": 3266} {"train_loss": -6.563888072967529, "global_step": 137211, "epoch": 3266} {"train_loss": -6.562006950378418, "global_step": 137212, "epoch": 3266} {"train_loss": -6.699494395937238, "global_step": 137213, "epoch": 3266, "val_loss": 77710.546875} {"train_loss": -6.63859224319458, "global_step": 137214, "epoch": 3267} {"train_loss": -6.609451770782471, "global_step": 137215, "epoch": 3267} {"train_loss": -6.630014896392822, "global_step": 137216, "epoch": 3267} {"train_loss": -6.699244022369385, "global_step": 137217, "epoch": 3267} {"train_loss": -6.5260467529296875, "global_step": 137218, "epoch": 3267} {"train_loss": -6.731646537780762, "global_step": 137219, "epoch": 3267} {"train_loss": -6.691272735595703, "global_step": 137220, "epoch": 3267} {"train_loss": -6.7208147048950195, "global_step": 137221, "epoch": 3267} {"train_loss": -6.6943254470825195, "global_step": 137222, "epoch": 3267} {"train_loss": -6.723825454711914, "global_step": 137223, "epoch": 3267} {"train_loss": -6.698979377746582, "global_step": 137224, "epoch": 3267} {"train_loss": -6.756968975067139, "global_step": 137225, "epoch": 3267} {"train_loss": -6.689380645751953, "global_step": 137226, "epoch": 3267} {"train_loss": -6.6971845626831055, "global_step": 137227, "epoch": 3267} {"train_loss": -6.809884071350098, "global_step": 137228, "epoch": 3267} {"train_loss": -6.795910835266113, "global_step": 137229, "epoch": 3267} {"train_loss": -6.774401664733887, "global_step": 137230, "epoch": 3267} {"train_loss": -6.743706703186035, "global_step": 137231, "epoch": 3267} {"train_loss": -6.7702460289001465, "global_step": 137232, "epoch": 3267} {"train_loss": -6.803994178771973, "global_step": 137233, "epoch": 3267} {"train_loss": -6.744902610778809, "global_step": 137234, "epoch": 3267} {"train_loss": -6.696284294128418, "global_step": 137235, "epoch": 3267} {"train_loss": -6.814105987548828, "global_step": 137236, "epoch": 3267} {"train_loss": -6.7332305908203125, "global_step": 137237, "epoch": 3267} {"train_loss": -6.809820175170898, "global_step": 137238, "epoch": 3267} {"train_loss": -6.724052429199219, "global_step": 137239, "epoch": 3267} {"train_loss": -6.692892074584961, "global_step": 137240, "epoch": 3267} {"train_loss": -6.66965913772583, "global_step": 137241, "epoch": 3267} {"train_loss": -6.582707405090332, "global_step": 137242, "epoch": 3267} {"train_loss": -6.71907901763916, "global_step": 137243, "epoch": 3267} {"train_loss": -6.7425150871276855, "global_step": 137244, "epoch": 3267} {"train_loss": -6.756347179412842, "global_step": 137245, "epoch": 3267} {"train_loss": -6.699672698974609, "global_step": 137246, "epoch": 3267} {"train_loss": -6.689087390899658, "global_step": 137247, "epoch": 3267} {"train_loss": -6.754858493804932, "global_step": 137248, "epoch": 3267} {"train_loss": -6.756870269775391, "global_step": 137249, "epoch": 3267} {"train_loss": -6.788748264312744, "global_step": 137250, "epoch": 3267} {"train_loss": -6.72224760055542, "global_step": 137251, "epoch": 3267} {"train_loss": -6.688106060028076, "global_step": 137252, "epoch": 3267} {"train_loss": -6.839628219604492, "global_step": 137253, "epoch": 3267} {"train_loss": -6.6838836669921875, "global_step": 137254, "epoch": 3267} {"train_loss": -6.716252156666347, "global_step": 137255, "epoch": 3267, "val_loss": 77783.3203125} {"train_loss": -6.857007026672363, "global_step": 137256, "epoch": 3268} {"train_loss": -6.744503974914551, "global_step": 137257, "epoch": 3268} {"train_loss": -6.8527374267578125, "global_step": 137258, "epoch": 3268} {"train_loss": -6.736865043640137, "global_step": 137259, "epoch": 3268} {"train_loss": -6.810047149658203, "global_step": 137260, "epoch": 3268} {"train_loss": -6.692134857177734, "global_step": 137261, "epoch": 3268} {"train_loss": -6.645251274108887, "global_step": 137262, "epoch": 3268} {"train_loss": -6.738428115844727, "global_step": 137263, "epoch": 3268} {"train_loss": -6.695618629455566, "global_step": 137264, "epoch": 3268} {"train_loss": -6.697079658508301, "global_step": 137265, "epoch": 3268} {"train_loss": -6.687498092651367, "global_step": 137266, "epoch": 3268} {"train_loss": -6.7088541984558105, "global_step": 137267, "epoch": 3268} {"train_loss": -6.644584655761719, "global_step": 137268, "epoch": 3268} {"train_loss": -6.587305068969727, "global_step": 137269, "epoch": 3268} {"train_loss": -6.625176906585693, "global_step": 137270, "epoch": 3268} {"train_loss": -6.714487075805664, "global_step": 137271, "epoch": 3268} {"train_loss": -6.729606628417969, "global_step": 137272, "epoch": 3268} {"train_loss": -6.727738380432129, "global_step": 137273, "epoch": 3268} {"train_loss": -6.7356743812561035, "global_step": 137274, "epoch": 3268} {"train_loss": -6.63817024230957, "global_step": 137275, "epoch": 3268} {"train_loss": -6.633424758911133, "global_step": 137276, "epoch": 3268} {"train_loss": -6.753644943237305, "global_step": 137277, "epoch": 3268} {"train_loss": -6.634819030761719, "global_step": 137278, "epoch": 3268} {"train_loss": -6.657171249389648, "global_step": 137279, "epoch": 3268} {"train_loss": -6.789358139038086, "global_step": 137280, "epoch": 3268} {"train_loss": -6.702780723571777, "global_step": 137281, "epoch": 3268} {"train_loss": -6.6603803634643555, "global_step": 137282, "epoch": 3268} {"train_loss": -6.609163761138916, "global_step": 137283, "epoch": 3268} {"train_loss": -6.682458877563477, "global_step": 137284, "epoch": 3268} {"train_loss": -6.7377166748046875, "global_step": 137285, "epoch": 3268} {"train_loss": -6.8209638595581055, "global_step": 137286, "epoch": 3268} {"train_loss": -6.726395606994629, "global_step": 137287, "epoch": 3268} {"train_loss": -6.728610515594482, "global_step": 137288, "epoch": 3268} {"train_loss": -6.74066162109375, "global_step": 137289, "epoch": 3268} {"train_loss": -6.776260852813721, "global_step": 137290, "epoch": 3268} {"train_loss": -6.832670211791992, "global_step": 137291, "epoch": 3268} {"train_loss": -6.848498821258545, "global_step": 137292, "epoch": 3268} {"train_loss": -6.637594223022461, "global_step": 137293, "epoch": 3268} {"train_loss": -6.6791157722473145, "global_step": 137294, "epoch": 3268} {"train_loss": -6.764579772949219, "global_step": 137295, "epoch": 3268} {"train_loss": -6.733789443969727, "global_step": 137296, "epoch": 3268} {"train_loss": -6.71943770136152, "global_step": 137297, "epoch": 3268, "val_loss": 78013.421875} {"train_loss": -6.5721025466918945, "global_step": 137298, "epoch": 3269} {"train_loss": -6.781445503234863, "global_step": 137299, "epoch": 3269} {"train_loss": -6.757849216461182, "global_step": 137300, "epoch": 3269} {"train_loss": -6.587952613830566, "global_step": 137301, "epoch": 3269} {"train_loss": -6.8298444747924805, "global_step": 137302, "epoch": 3269} {"train_loss": -6.646803855895996, "global_step": 137303, "epoch": 3269} {"train_loss": -6.769105911254883, "global_step": 137304, "epoch": 3269} {"train_loss": -6.681093215942383, "global_step": 137305, "epoch": 3269} {"train_loss": -6.754956245422363, "global_step": 137306, "epoch": 3269} {"train_loss": -6.656220436096191, "global_step": 137307, "epoch": 3269} {"train_loss": -6.611018180847168, "global_step": 137308, "epoch": 3269} {"train_loss": -6.764935493469238, "global_step": 137309, "epoch": 3269} {"train_loss": -6.668497085571289, "global_step": 137310, "epoch": 3269} {"train_loss": -6.5943498611450195, "global_step": 137311, "epoch": 3269} {"train_loss": -6.665163516998291, "global_step": 137312, "epoch": 3269} {"train_loss": -6.703807830810547, "global_step": 137313, "epoch": 3269} {"train_loss": -6.5344390869140625, "global_step": 137314, "epoch": 3269} {"train_loss": -6.646631240844727, "global_step": 137315, "epoch": 3269} {"train_loss": -6.655562400817871, "global_step": 137316, "epoch": 3269} {"train_loss": -6.642978668212891, "global_step": 137317, "epoch": 3269} {"train_loss": -6.812278747558594, "global_step": 137318, "epoch": 3269} {"train_loss": -6.5773420333862305, "global_step": 137319, "epoch": 3269} {"train_loss": -6.644509315490723, "global_step": 137320, "epoch": 3269} {"train_loss": -6.715856075286865, "global_step": 137321, "epoch": 3269} {"train_loss": -6.587332725524902, "global_step": 137322, "epoch": 3269} {"train_loss": -6.679933547973633, "global_step": 137323, "epoch": 3269} {"train_loss": -6.407674789428711, "global_step": 137324, "epoch": 3269} {"train_loss": -6.769218444824219, "global_step": 137325, "epoch": 3269} {"train_loss": -6.72989559173584, "global_step": 137326, "epoch": 3269} {"train_loss": -6.557592391967773, "global_step": 137327, "epoch": 3269} {"train_loss": -6.698934555053711, "global_step": 137328, "epoch": 3269} {"train_loss": -6.6263203620910645, "global_step": 137329, "epoch": 3269} {"train_loss": -6.709346294403076, "global_step": 137330, "epoch": 3269} {"train_loss": -6.552753448486328, "global_step": 137331, "epoch": 3269} {"train_loss": -6.70913553237915, "global_step": 137332, "epoch": 3269} {"train_loss": -6.6847991943359375, "global_step": 137333, "epoch": 3269} {"train_loss": -6.763948440551758, "global_step": 137334, "epoch": 3269} {"train_loss": -6.558758735656738, "global_step": 137335, "epoch": 3269} {"train_loss": -6.684239387512207, "global_step": 137336, "epoch": 3269} {"train_loss": -6.601253509521484, "global_step": 137337, "epoch": 3269} {"train_loss": -6.6505279541015625, "global_step": 137338, "epoch": 3269} {"train_loss": -6.6630787054697675, "global_step": 137339, "epoch": 3269, "val_loss": 77779.953125} {"train_loss": -6.701545715332031, "global_step": 137340, "epoch": 3270} {"train_loss": -6.752839088439941, "global_step": 137341, "epoch": 3270} {"train_loss": -6.822697162628174, "global_step": 137342, "epoch": 3270} {"train_loss": -6.647463798522949, "global_step": 137343, "epoch": 3270} {"train_loss": -6.702963352203369, "global_step": 137344, "epoch": 3270} {"train_loss": -6.590658187866211, "global_step": 137345, "epoch": 3270} {"train_loss": -6.706165790557861, "global_step": 137346, "epoch": 3270} {"train_loss": -6.713869094848633, "global_step": 137347, "epoch": 3270} {"train_loss": -6.647364616394043, "global_step": 137348, "epoch": 3270} {"train_loss": -6.686244010925293, "global_step": 137349, "epoch": 3270} {"train_loss": -6.677372932434082, "global_step": 137350, "epoch": 3270} {"train_loss": -6.762631416320801, "global_step": 137351, "epoch": 3270} {"train_loss": -6.593977928161621, "global_step": 137352, "epoch": 3270} {"train_loss": -6.622563362121582, "global_step": 137353, "epoch": 3270} {"train_loss": -6.690008163452148, "global_step": 137354, "epoch": 3270} {"train_loss": -6.7174224853515625, "global_step": 137355, "epoch": 3270} {"train_loss": -6.825499057769775, "global_step": 137356, "epoch": 3270} {"train_loss": -6.694340705871582, "global_step": 137357, "epoch": 3270} {"train_loss": -6.530749320983887, "global_step": 137358, "epoch": 3270} {"train_loss": -6.803343772888184, "global_step": 137359, "epoch": 3270} {"train_loss": -6.690967559814453, "global_step": 137360, "epoch": 3270} {"train_loss": -6.752094268798828, "global_step": 137361, "epoch": 3270} {"train_loss": -6.699060440063477, "global_step": 137362, "epoch": 3270} {"train_loss": -6.67006778717041, "global_step": 137363, "epoch": 3270} {"train_loss": -6.732328414916992, "global_step": 137364, "epoch": 3270} {"train_loss": -6.762054443359375, "global_step": 137365, "epoch": 3270} {"train_loss": -6.6928863525390625, "global_step": 137366, "epoch": 3270} {"train_loss": -6.807497024536133, "global_step": 137367, "epoch": 3270} {"train_loss": -6.799222469329834, "global_step": 137368, "epoch": 3270} {"train_loss": -6.831661224365234, "global_step": 137369, "epoch": 3270} {"train_loss": -6.687819480895996, "global_step": 137370, "epoch": 3270} {"train_loss": -6.776815414428711, "global_step": 137371, "epoch": 3270} {"train_loss": -6.764423370361328, "global_step": 137372, "epoch": 3270} {"train_loss": -6.5654826164245605, "global_step": 137373, "epoch": 3270} {"train_loss": -6.758829116821289, "global_step": 137374, "epoch": 3270} {"train_loss": -6.755187034606934, "global_step": 137375, "epoch": 3270} {"train_loss": -6.690921306610107, "global_step": 137376, "epoch": 3270} {"train_loss": -6.813709259033203, "global_step": 137377, "epoch": 3270} {"train_loss": -6.765619277954102, "global_step": 137378, "epoch": 3270} {"train_loss": -6.65690279006958, "global_step": 137379, "epoch": 3270} {"train_loss": -6.716397762298584, "global_step": 137380, "epoch": 3270} {"train_loss": -6.717053367978051, "global_step": 137381, "epoch": 3270, "val_loss": 78172.21875} {"train_loss": -6.693454742431641, "global_step": 137382, "epoch": 3271} {"train_loss": -6.7808332443237305, "global_step": 137383, "epoch": 3271} {"train_loss": -6.715769290924072, "global_step": 137384, "epoch": 3271} {"train_loss": -6.789345741271973, "global_step": 137385, "epoch": 3271} {"train_loss": -6.836238861083984, "global_step": 137386, "epoch": 3271} {"train_loss": -6.699836730957031, "global_step": 137387, "epoch": 3271} {"train_loss": -6.775660514831543, "global_step": 137388, "epoch": 3271} {"train_loss": -6.743990898132324, "global_step": 137389, "epoch": 3271} {"train_loss": -6.677761554718018, "global_step": 137390, "epoch": 3271} {"train_loss": -6.805532455444336, "global_step": 137391, "epoch": 3271} {"train_loss": -6.652572154998779, "global_step": 137392, "epoch": 3271} {"train_loss": -6.649496078491211, "global_step": 137393, "epoch": 3271} {"train_loss": -6.7213029861450195, "global_step": 137394, "epoch": 3271} {"train_loss": -6.544098854064941, "global_step": 137395, "epoch": 3271} {"train_loss": -6.805913925170898, "global_step": 137396, "epoch": 3271} {"train_loss": -6.545932769775391, "global_step": 137397, "epoch": 3271} {"train_loss": -6.74942684173584, "global_step": 137398, "epoch": 3271} {"train_loss": -6.462284564971924, "global_step": 137399, "epoch": 3271} {"train_loss": -6.801959037780762, "global_step": 137400, "epoch": 3271} {"train_loss": -6.62610387802124, "global_step": 137401, "epoch": 3271} {"train_loss": -6.682858467102051, "global_step": 137402, "epoch": 3271} {"train_loss": -6.761780738830566, "global_step": 137403, "epoch": 3271} {"train_loss": -6.633163928985596, "global_step": 137404, "epoch": 3271} {"train_loss": -6.729206085205078, "global_step": 137405, "epoch": 3271} {"train_loss": -6.687996864318848, "global_step": 137406, "epoch": 3271} {"train_loss": -6.723614692687988, "global_step": 137407, "epoch": 3271} {"train_loss": -6.68523645401001, "global_step": 137408, "epoch": 3271} {"train_loss": -6.721649646759033, "global_step": 137409, "epoch": 3271} {"train_loss": -6.79744815826416, "global_step": 137410, "epoch": 3271} {"train_loss": -6.7388763427734375, "global_step": 137411, "epoch": 3271} {"train_loss": -6.79928731918335, "global_step": 137412, "epoch": 3271} {"train_loss": -6.685751914978027, "global_step": 137413, "epoch": 3271} {"train_loss": -6.775330543518066, "global_step": 137414, "epoch": 3271} {"train_loss": -6.711860656738281, "global_step": 137415, "epoch": 3271} {"train_loss": -6.7842936515808105, "global_step": 137416, "epoch": 3271} {"train_loss": -6.834685325622559, "global_step": 137417, "epoch": 3271} {"train_loss": -6.753335952758789, "global_step": 137418, "epoch": 3271} {"train_loss": -6.798196315765381, "global_step": 137419, "epoch": 3271} {"train_loss": -6.672024250030518, "global_step": 137420, "epoch": 3271} {"train_loss": -6.693029403686523, "global_step": 137421, "epoch": 3271} {"train_loss": -6.668294906616211, "global_step": 137422, "epoch": 3271} {"train_loss": -6.717440139679682, "global_step": 137423, "epoch": 3271, "val_loss": 77830.890625} {"train_loss": -6.679863452911377, "global_step": 137424, "epoch": 3272} {"train_loss": -6.829082489013672, "global_step": 137425, "epoch": 3272} {"train_loss": -6.733564376831055, "global_step": 137426, "epoch": 3272} {"train_loss": -6.8511786460876465, "global_step": 137427, "epoch": 3272} {"train_loss": -6.67877197265625, "global_step": 137428, "epoch": 3272} {"train_loss": -6.732878684997559, "global_step": 137429, "epoch": 3272} {"train_loss": -6.904384136199951, "global_step": 137430, "epoch": 3272} {"train_loss": -6.768651485443115, "global_step": 137431, "epoch": 3272} {"train_loss": -6.761175632476807, "global_step": 137432, "epoch": 3272} {"train_loss": -6.877120018005371, "global_step": 137433, "epoch": 3272} {"train_loss": -6.757072448730469, "global_step": 137434, "epoch": 3272} {"train_loss": -6.686286926269531, "global_step": 137435, "epoch": 3272} {"train_loss": -6.660505294799805, "global_step": 137436, "epoch": 3272} {"train_loss": -6.725457191467285, "global_step": 137437, "epoch": 3272} {"train_loss": -6.640443801879883, "global_step": 137438, "epoch": 3272} {"train_loss": -6.828341484069824, "global_step": 137439, "epoch": 3272} {"train_loss": -6.6513566970825195, "global_step": 137440, "epoch": 3272} {"train_loss": -6.6198201179504395, "global_step": 137441, "epoch": 3272} {"train_loss": -6.774709701538086, "global_step": 137442, "epoch": 3272} {"train_loss": -6.632880210876465, "global_step": 137443, "epoch": 3272} {"train_loss": -6.637480735778809, "global_step": 137444, "epoch": 3272} {"train_loss": -6.658252716064453, "global_step": 137445, "epoch": 3272} {"train_loss": -6.689789295196533, "global_step": 137446, "epoch": 3272} {"train_loss": -6.645779609680176, "global_step": 137447, "epoch": 3272} {"train_loss": -6.663522243499756, "global_step": 137448, "epoch": 3272} {"train_loss": -6.644937515258789, "global_step": 137449, "epoch": 3272} {"train_loss": -6.735307693481445, "global_step": 137450, "epoch": 3272} {"train_loss": -6.594025611877441, "global_step": 137451, "epoch": 3272} {"train_loss": -6.620500564575195, "global_step": 137452, "epoch": 3272} {"train_loss": -6.588626384735107, "global_step": 137453, "epoch": 3272} {"train_loss": -6.551642894744873, "global_step": 137454, "epoch": 3272} {"train_loss": -6.687020301818848, "global_step": 137455, "epoch": 3272} {"train_loss": -6.64835262298584, "global_step": 137456, "epoch": 3272} {"train_loss": -6.687191963195801, "global_step": 137457, "epoch": 3272} {"train_loss": -6.616211414337158, "global_step": 137458, "epoch": 3272} {"train_loss": -6.702352523803711, "global_step": 137459, "epoch": 3272} {"train_loss": -6.675073623657227, "global_step": 137460, "epoch": 3272} {"train_loss": -6.698402404785156, "global_step": 137461, "epoch": 3272} {"train_loss": -6.738196849822998, "global_step": 137462, "epoch": 3272} {"train_loss": -6.69085693359375, "global_step": 137463, "epoch": 3272} {"train_loss": -6.6959757804870605, "global_step": 137464, "epoch": 3272} {"train_loss": -6.700204633531117, "global_step": 137465, "epoch": 3272, "val_loss": 78059.40625} {"train_loss": -6.685349464416504, "global_step": 137466, "epoch": 3273} {"train_loss": -6.782713890075684, "global_step": 137467, "epoch": 3273} {"train_loss": -6.614160537719727, "global_step": 137468, "epoch": 3273} {"train_loss": -6.589053153991699, "global_step": 137469, "epoch": 3273} {"train_loss": -6.715375900268555, "global_step": 137470, "epoch": 3273} {"train_loss": -6.686525344848633, "global_step": 137471, "epoch": 3273} {"train_loss": -6.754430294036865, "global_step": 137472, "epoch": 3273} {"train_loss": -6.695438861846924, "global_step": 137473, "epoch": 3273} {"train_loss": -6.701565742492676, "global_step": 137474, "epoch": 3273} {"train_loss": -6.722373008728027, "global_step": 137475, "epoch": 3273} {"train_loss": -6.849991798400879, "global_step": 137476, "epoch": 3273} {"train_loss": -6.696361541748047, "global_step": 137477, "epoch": 3273} {"train_loss": -6.803613662719727, "global_step": 137478, "epoch": 3273} {"train_loss": -6.6445631980896, "global_step": 137479, "epoch": 3273} {"train_loss": -6.722799301147461, "global_step": 137480, "epoch": 3273} {"train_loss": -6.749654769897461, "global_step": 137481, "epoch": 3273} {"train_loss": -6.764193534851074, "global_step": 137482, "epoch": 3273} {"train_loss": -6.735596656799316, "global_step": 137483, "epoch": 3273} {"train_loss": -6.712845802307129, "global_step": 137484, "epoch": 3273} {"train_loss": -6.629616737365723, "global_step": 137485, "epoch": 3273} {"train_loss": -6.79521369934082, "global_step": 137486, "epoch": 3273} {"train_loss": -6.673051834106445, "global_step": 137487, "epoch": 3273} {"train_loss": -6.668763637542725, "global_step": 137488, "epoch": 3273} {"train_loss": -6.733921051025391, "global_step": 137489, "epoch": 3273} {"train_loss": -6.703932762145996, "global_step": 137490, "epoch": 3273} {"train_loss": -6.793671607971191, "global_step": 137491, "epoch": 3273} {"train_loss": -6.742671012878418, "global_step": 137492, "epoch": 3273} {"train_loss": -6.699338912963867, "global_step": 137493, "epoch": 3273} {"train_loss": -6.651839256286621, "global_step": 137494, "epoch": 3273} {"train_loss": -6.755658149719238, "global_step": 137495, "epoch": 3273} {"train_loss": -6.7584381103515625, "global_step": 137496, "epoch": 3273} {"train_loss": -6.79161262512207, "global_step": 137497, "epoch": 3273} {"train_loss": -6.789478778839111, "global_step": 137498, "epoch": 3273} {"train_loss": -6.809469223022461, "global_step": 137499, "epoch": 3273} {"train_loss": -6.838352680206299, "global_step": 137500, "epoch": 3273} {"train_loss": -6.7215399742126465, "global_step": 137501, "epoch": 3273} {"train_loss": -6.710280418395996, "global_step": 137502, "epoch": 3273} {"train_loss": -6.813713550567627, "global_step": 137503, "epoch": 3273} {"train_loss": -6.620149612426758, "global_step": 137504, "epoch": 3273} {"train_loss": -6.649713039398193, "global_step": 137505, "epoch": 3273} {"train_loss": -6.771286964416504, "global_step": 137506, "epoch": 3273} {"train_loss": -6.727162940161569, "global_step": 137507, "epoch": 3273, "val_loss": 77816.1484375} {"train_loss": -6.601921081542969, "global_step": 137508, "epoch": 3274} {"train_loss": -6.656191825866699, "global_step": 137509, "epoch": 3274} {"train_loss": -6.670343399047852, "global_step": 137510, "epoch": 3274} {"train_loss": -6.780699729919434, "global_step": 137511, "epoch": 3274} {"train_loss": -6.726646423339844, "global_step": 137512, "epoch": 3274} {"train_loss": -6.808035850524902, "global_step": 137513, "epoch": 3274} {"train_loss": -6.675826072692871, "global_step": 137514, "epoch": 3274} {"train_loss": -6.610593795776367, "global_step": 137515, "epoch": 3274} {"train_loss": -6.7197489738464355, "global_step": 137516, "epoch": 3274} {"train_loss": -6.706128120422363, "global_step": 137517, "epoch": 3274} {"train_loss": -6.7269816398620605, "global_step": 137518, "epoch": 3274} {"train_loss": -6.652748107910156, "global_step": 137519, "epoch": 3274} {"train_loss": -6.666371822357178, "global_step": 137520, "epoch": 3274} {"train_loss": -6.74904727935791, "global_step": 137521, "epoch": 3274} {"train_loss": -6.684903621673584, "global_step": 137522, "epoch": 3274} {"train_loss": -6.7192840576171875, "global_step": 137523, "epoch": 3274} {"train_loss": -6.856750965118408, "global_step": 137524, "epoch": 3274} {"train_loss": -6.826210021972656, "global_step": 137525, "epoch": 3274} {"train_loss": -6.843027114868164, "global_step": 137526, "epoch": 3274} {"train_loss": -6.751286506652832, "global_step": 137527, "epoch": 3274} {"train_loss": -6.792515277862549, "global_step": 137528, "epoch": 3274} {"train_loss": -6.83126163482666, "global_step": 137529, "epoch": 3274} {"train_loss": -6.763125419616699, "global_step": 137530, "epoch": 3274} {"train_loss": -6.77315616607666, "global_step": 137531, "epoch": 3274} {"train_loss": -6.8953046798706055, "global_step": 137532, "epoch": 3274} {"train_loss": -6.789919376373291, "global_step": 137533, "epoch": 3274} {"train_loss": -6.679104804992676, "global_step": 137534, "epoch": 3274} {"train_loss": -6.817517280578613, "global_step": 137535, "epoch": 3274} {"train_loss": -6.618949890136719, "global_step": 137536, "epoch": 3274} {"train_loss": -6.740815162658691, "global_step": 137537, "epoch": 3274} {"train_loss": -6.687507152557373, "global_step": 137538, "epoch": 3274} {"train_loss": -6.702857971191406, "global_step": 137539, "epoch": 3274} {"train_loss": -6.709865570068359, "global_step": 137540, "epoch": 3274} {"train_loss": -6.859363555908203, "global_step": 137541, "epoch": 3274} {"train_loss": -6.611024856567383, "global_step": 137542, "epoch": 3274} {"train_loss": -6.741483688354492, "global_step": 137543, "epoch": 3274} {"train_loss": -6.733753204345703, "global_step": 137544, "epoch": 3274} {"train_loss": -6.764369964599609, "global_step": 137545, "epoch": 3274} {"train_loss": -6.770613193511963, "global_step": 137546, "epoch": 3274} {"train_loss": -6.746402740478516, "global_step": 137547, "epoch": 3274} {"train_loss": -6.671045303344727, "global_step": 137548, "epoch": 3274} {"train_loss": -6.736152898697626, "global_step": 137549, "epoch": 3274, "val_loss": 77710.8359375} {"train_loss": -6.752547740936279, "global_step": 137550, "epoch": 3275} {"train_loss": -6.804688453674316, "global_step": 137551, "epoch": 3275} {"train_loss": -6.766624450683594, "global_step": 137552, "epoch": 3275} {"train_loss": -6.806397438049316, "global_step": 137553, "epoch": 3275} {"train_loss": -6.8086442947387695, "global_step": 137554, "epoch": 3275} {"train_loss": -6.735199928283691, "global_step": 137555, "epoch": 3275} {"train_loss": -6.777005672454834, "global_step": 137556, "epoch": 3275} {"train_loss": -6.65831995010376, "global_step": 137557, "epoch": 3275} {"train_loss": -6.768481731414795, "global_step": 137558, "epoch": 3275} {"train_loss": -6.868154525756836, "global_step": 137559, "epoch": 3275} {"train_loss": -6.714103698730469, "global_step": 137560, "epoch": 3275} {"train_loss": -6.743827819824219, "global_step": 137561, "epoch": 3275} {"train_loss": -6.751106262207031, "global_step": 137562, "epoch": 3275} {"train_loss": -6.730326175689697, "global_step": 137563, "epoch": 3275} {"train_loss": -6.761951446533203, "global_step": 137564, "epoch": 3275} {"train_loss": -6.780172824859619, "global_step": 137565, "epoch": 3275} {"train_loss": -6.796318054199219, "global_step": 137566, "epoch": 3275} {"train_loss": -6.8256635665893555, "global_step": 137567, "epoch": 3275} {"train_loss": -6.824154376983643, "global_step": 137568, "epoch": 3275} {"train_loss": -6.659616470336914, "global_step": 137569, "epoch": 3275} {"train_loss": -6.835692405700684, "global_step": 137570, "epoch": 3275} {"train_loss": -6.752661228179932, "global_step": 137571, "epoch": 3275} {"train_loss": -6.721168518066406, "global_step": 137572, "epoch": 3275} {"train_loss": -6.8415846824646, "global_step": 137573, "epoch": 3275} {"train_loss": -6.7305803298950195, "global_step": 137574, "epoch": 3275} {"train_loss": -6.698966979980469, "global_step": 137575, "epoch": 3275} {"train_loss": -6.807266712188721, "global_step": 137576, "epoch": 3275} {"train_loss": -6.552211284637451, "global_step": 137577, "epoch": 3275} {"train_loss": -6.715277671813965, "global_step": 137578, "epoch": 3275} {"train_loss": -6.71219539642334, "global_step": 137579, "epoch": 3275} {"train_loss": -6.649598598480225, "global_step": 137580, "epoch": 3275} {"train_loss": -6.7055983543396, "global_step": 137581, "epoch": 3275} {"train_loss": -6.661101818084717, "global_step": 137582, "epoch": 3275} {"train_loss": -6.661802291870117, "global_step": 137583, "epoch": 3275} {"train_loss": -6.675707817077637, "global_step": 137584, "epoch": 3275} {"train_loss": -6.614126205444336, "global_step": 137585, "epoch": 3275} {"train_loss": -6.64443302154541, "global_step": 137586, "epoch": 3275} {"train_loss": -6.7694807052612305, "global_step": 137587, "epoch": 3275} {"train_loss": -6.59852933883667, "global_step": 137588, "epoch": 3275} {"train_loss": -6.723996162414551, "global_step": 137589, "epoch": 3275} {"train_loss": -6.738865852355957, "global_step": 137590, "epoch": 3275} {"train_loss": -6.733638888313656, "global_step": 137591, "epoch": 3275, "val_loss": 77737.7734375} {"train_loss": -6.7615156173706055, "global_step": 137592, "epoch": 3276} {"train_loss": -6.614934921264648, "global_step": 137593, "epoch": 3276} {"train_loss": -6.731414318084717, "global_step": 137594, "epoch": 3276} {"train_loss": -6.715024948120117, "global_step": 137595, "epoch": 3276} {"train_loss": -6.756356239318848, "global_step": 137596, "epoch": 3276} {"train_loss": -6.768517971038818, "global_step": 137597, "epoch": 3276} {"train_loss": -6.73512077331543, "global_step": 137598, "epoch": 3276} {"train_loss": -6.753605365753174, "global_step": 137599, "epoch": 3276} {"train_loss": -6.752595901489258, "global_step": 137600, "epoch": 3276} {"train_loss": -6.717704772949219, "global_step": 137601, "epoch": 3276} {"train_loss": -6.665645599365234, "global_step": 137602, "epoch": 3276} {"train_loss": -6.732494354248047, "global_step": 137603, "epoch": 3276} {"train_loss": -6.677499771118164, "global_step": 137604, "epoch": 3276} {"train_loss": -6.706798076629639, "global_step": 137605, "epoch": 3276} {"train_loss": -6.748872756958008, "global_step": 137606, "epoch": 3276} {"train_loss": -6.812078475952148, "global_step": 137607, "epoch": 3276} {"train_loss": -6.778935432434082, "global_step": 137608, "epoch": 3276} {"train_loss": -6.884681224822998, "global_step": 137609, "epoch": 3276} {"train_loss": -6.68206262588501, "global_step": 137610, "epoch": 3276} {"train_loss": -6.7576775550842285, "global_step": 137611, "epoch": 3276} {"train_loss": -6.754727363586426, "global_step": 137612, "epoch": 3276} {"train_loss": -6.754843711853027, "global_step": 137613, "epoch": 3276} {"train_loss": -6.7726640701293945, "global_step": 137614, "epoch": 3276} {"train_loss": -6.87375545501709, "global_step": 137615, "epoch": 3276} {"train_loss": -6.598724365234375, "global_step": 137616, "epoch": 3276} {"train_loss": -6.669096946716309, "global_step": 137617, "epoch": 3276} {"train_loss": -6.787547588348389, "global_step": 137618, "epoch": 3276} {"train_loss": -6.7325005531311035, "global_step": 137619, "epoch": 3276} {"train_loss": -6.787264823913574, "global_step": 137620, "epoch": 3276} {"train_loss": -6.7850494384765625, "global_step": 137621, "epoch": 3276} {"train_loss": -6.832920074462891, "global_step": 137622, "epoch": 3276} {"train_loss": -6.740693092346191, "global_step": 137623, "epoch": 3276} {"train_loss": -6.710838317871094, "global_step": 137624, "epoch": 3276} {"train_loss": -6.679436206817627, "global_step": 137625, "epoch": 3276} {"train_loss": -6.848337650299072, "global_step": 137626, "epoch": 3276} {"train_loss": -6.756440162658691, "global_step": 137627, "epoch": 3276} {"train_loss": -6.729284286499023, "global_step": 137628, "epoch": 3276} {"train_loss": -6.696081638336182, "global_step": 137629, "epoch": 3276} {"train_loss": -6.753586769104004, "global_step": 137630, "epoch": 3276} {"train_loss": -6.626989364624023, "global_step": 137631, "epoch": 3276} {"train_loss": -6.646392822265625, "global_step": 137632, "epoch": 3276} {"train_loss": -6.7394103095645, "global_step": 137633, "epoch": 3276, "val_loss": 78091.46875} {"train_loss": -6.698143482208252, "global_step": 137634, "epoch": 3277} {"train_loss": -6.726600170135498, "global_step": 137635, "epoch": 3277} {"train_loss": -6.729372978210449, "global_step": 137636, "epoch": 3277} {"train_loss": -6.765453338623047, "global_step": 137637, "epoch": 3277} {"train_loss": -6.721650123596191, "global_step": 137638, "epoch": 3277} {"train_loss": -6.705615997314453, "global_step": 137639, "epoch": 3277} {"train_loss": -6.788154602050781, "global_step": 137640, "epoch": 3277} {"train_loss": -6.696745872497559, "global_step": 137641, "epoch": 3277} {"train_loss": -6.581757068634033, "global_step": 137642, "epoch": 3277} {"train_loss": -6.813291549682617, "global_step": 137643, "epoch": 3277} {"train_loss": -6.67036247253418, "global_step": 137644, "epoch": 3277} {"train_loss": -6.733251094818115, "global_step": 137645, "epoch": 3277} {"train_loss": -6.627723693847656, "global_step": 137646, "epoch": 3277} {"train_loss": -6.611996650695801, "global_step": 137647, "epoch": 3277} {"train_loss": -6.856147766113281, "global_step": 137648, "epoch": 3277} {"train_loss": -6.575154781341553, "global_step": 137649, "epoch": 3277} {"train_loss": -6.742405891418457, "global_step": 137650, "epoch": 3277} {"train_loss": -6.713403701782227, "global_step": 137651, "epoch": 3277} {"train_loss": -6.702827453613281, "global_step": 137652, "epoch": 3277} {"train_loss": -6.612538814544678, "global_step": 137653, "epoch": 3277} {"train_loss": -6.578756332397461, "global_step": 137654, "epoch": 3277} {"train_loss": -6.747539520263672, "global_step": 137655, "epoch": 3277} {"train_loss": -6.5932440757751465, "global_step": 137656, "epoch": 3277} {"train_loss": -6.674621105194092, "global_step": 137657, "epoch": 3277} {"train_loss": -6.359596252441406, "global_step": 137658, "epoch": 3277} {"train_loss": -6.527754783630371, "global_step": 137659, "epoch": 3277} {"train_loss": -6.568110942840576, "global_step": 137660, "epoch": 3277} {"train_loss": -6.650362968444824, "global_step": 137661, "epoch": 3277} {"train_loss": -6.704965591430664, "global_step": 137662, "epoch": 3277} {"train_loss": -6.7884063720703125, "global_step": 137663, "epoch": 3277} {"train_loss": -6.635547637939453, "global_step": 137664, "epoch": 3277} {"train_loss": -6.712475776672363, "global_step": 137665, "epoch": 3277} {"train_loss": -6.764001846313477, "global_step": 137666, "epoch": 3277} {"train_loss": -6.76685905456543, "global_step": 137667, "epoch": 3277} {"train_loss": -6.706943511962891, "global_step": 137668, "epoch": 3277} {"train_loss": -6.600828647613525, "global_step": 137669, "epoch": 3277} {"train_loss": -6.788383483886719, "global_step": 137670, "epoch": 3277} {"train_loss": -6.7411789894104, "global_step": 137671, "epoch": 3277} {"train_loss": -6.844703197479248, "global_step": 137672, "epoch": 3277} {"train_loss": -6.6937456130981445, "global_step": 137673, "epoch": 3277} {"train_loss": -6.748715400695801, "global_step": 137674, "epoch": 3277} {"train_loss": -6.693543797447568, "global_step": 137675, "epoch": 3277, "val_loss": 78000.609375} {"train_loss": -6.766049385070801, "global_step": 137676, "epoch": 3278} {"train_loss": -6.808206558227539, "global_step": 137677, "epoch": 3278} {"train_loss": -6.715952396392822, "global_step": 137678, "epoch": 3278} {"train_loss": -6.7821550369262695, "global_step": 137679, "epoch": 3278} {"train_loss": -6.8505024909973145, "global_step": 137680, "epoch": 3278} {"train_loss": -6.748435974121094, "global_step": 137681, "epoch": 3278} {"train_loss": -6.839352607727051, "global_step": 137682, "epoch": 3278} {"train_loss": -6.840061187744141, "global_step": 137683, "epoch": 3278} {"train_loss": -6.8641357421875, "global_step": 137684, "epoch": 3278} {"train_loss": -6.801936149597168, "global_step": 137685, "epoch": 3278} {"train_loss": -6.765002250671387, "global_step": 137686, "epoch": 3278} {"train_loss": -6.742700099945068, "global_step": 137687, "epoch": 3278} {"train_loss": -6.802187919616699, "global_step": 137688, "epoch": 3278} {"train_loss": -6.8352789878845215, "global_step": 137689, "epoch": 3278} {"train_loss": -6.823879241943359, "global_step": 137690, "epoch": 3278} {"train_loss": -6.713508605957031, "global_step": 137691, "epoch": 3278} {"train_loss": -6.885756015777588, "global_step": 137692, "epoch": 3278} {"train_loss": -6.858173370361328, "global_step": 137693, "epoch": 3278} {"train_loss": -6.850500106811523, "global_step": 137694, "epoch": 3278} {"train_loss": -6.639226913452148, "global_step": 137695, "epoch": 3278} {"train_loss": -6.695868492126465, "global_step": 137696, "epoch": 3278} {"train_loss": -6.763298511505127, "global_step": 137697, "epoch": 3278} {"train_loss": -6.7921061515808105, "global_step": 137698, "epoch": 3278} {"train_loss": -6.751406669616699, "global_step": 137699, "epoch": 3278} {"train_loss": -6.681899547576904, "global_step": 137700, "epoch": 3278} {"train_loss": -6.810207366943359, "global_step": 137701, "epoch": 3278} {"train_loss": -6.726581573486328, "global_step": 137702, "epoch": 3278} {"train_loss": -6.6887993812561035, "global_step": 137703, "epoch": 3278} {"train_loss": -6.737844944000244, "global_step": 137704, "epoch": 3278} {"train_loss": -6.763822078704834, "global_step": 137705, "epoch": 3278} {"train_loss": -6.773064136505127, "global_step": 137706, "epoch": 3278} {"train_loss": -6.805336952209473, "global_step": 137707, "epoch": 3278} {"train_loss": -6.806331157684326, "global_step": 137708, "epoch": 3278} {"train_loss": -6.750880241394043, "global_step": 137709, "epoch": 3278} {"train_loss": -6.719475269317627, "global_step": 137710, "epoch": 3278} {"train_loss": -6.686356544494629, "global_step": 137711, "epoch": 3278} {"train_loss": -6.6938676834106445, "global_step": 137712, "epoch": 3278} {"train_loss": -6.8331804275512695, "global_step": 137713, "epoch": 3278} {"train_loss": -6.793825149536133, "global_step": 137714, "epoch": 3278} {"train_loss": -6.784400463104248, "global_step": 137715, "epoch": 3278} {"train_loss": -6.78114128112793, "global_step": 137716, "epoch": 3278} {"train_loss": -6.773684706006732, "global_step": 137717, "epoch": 3278, "val_loss": 78094.46875} {"train_loss": -6.8192243576049805, "global_step": 137718, "epoch": 3279} {"train_loss": -6.734097957611084, "global_step": 137719, "epoch": 3279} {"train_loss": -6.815824508666992, "global_step": 137720, "epoch": 3279} {"train_loss": -6.662698745727539, "global_step": 137721, "epoch": 3279} {"train_loss": -6.6805500984191895, "global_step": 137722, "epoch": 3279} {"train_loss": -6.716985702514648, "global_step": 137723, "epoch": 3279} {"train_loss": -6.564613342285156, "global_step": 137724, "epoch": 3279} {"train_loss": -6.710375785827637, "global_step": 137725, "epoch": 3279} {"train_loss": -6.751678943634033, "global_step": 137726, "epoch": 3279} {"train_loss": -6.599801063537598, "global_step": 137727, "epoch": 3279} {"train_loss": -6.759275436401367, "global_step": 137728, "epoch": 3279} {"train_loss": -6.740233421325684, "global_step": 137729, "epoch": 3279} {"train_loss": -6.706090927124023, "global_step": 137730, "epoch": 3279} {"train_loss": -6.721675872802734, "global_step": 137731, "epoch": 3279} {"train_loss": -6.695629119873047, "global_step": 137732, "epoch": 3279} {"train_loss": -6.676525115966797, "global_step": 137733, "epoch": 3279} {"train_loss": -6.6350579261779785, "global_step": 137734, "epoch": 3279} {"train_loss": -6.757430076599121, "global_step": 137735, "epoch": 3279} {"train_loss": -6.770804405212402, "global_step": 137736, "epoch": 3279} {"train_loss": -6.76546049118042, "global_step": 137737, "epoch": 3279} {"train_loss": -6.8280134201049805, "global_step": 137738, "epoch": 3279} {"train_loss": -6.626890182495117, "global_step": 137739, "epoch": 3279} {"train_loss": -6.841175079345703, "global_step": 137740, "epoch": 3279} {"train_loss": -6.794794082641602, "global_step": 137741, "epoch": 3279} {"train_loss": -6.734287261962891, "global_step": 137742, "epoch": 3279} {"train_loss": -6.772619247436523, "global_step": 137743, "epoch": 3279} {"train_loss": -6.887956142425537, "global_step": 137744, "epoch": 3279} {"train_loss": -6.717492580413818, "global_step": 137745, "epoch": 3279} {"train_loss": -6.771488189697266, "global_step": 137746, "epoch": 3279} {"train_loss": -6.725994110107422, "global_step": 137747, "epoch": 3279} {"train_loss": -6.713823318481445, "global_step": 137748, "epoch": 3279} {"train_loss": -6.624410152435303, "global_step": 137749, "epoch": 3279} {"train_loss": -6.786990642547607, "global_step": 137750, "epoch": 3279} {"train_loss": -6.81374454498291, "global_step": 137751, "epoch": 3279} {"train_loss": -6.8018693923950195, "global_step": 137752, "epoch": 3279} {"train_loss": -6.810337066650391, "global_step": 137753, "epoch": 3279} {"train_loss": -6.877148151397705, "global_step": 137754, "epoch": 3279} {"train_loss": -6.868217468261719, "global_step": 137755, "epoch": 3279} {"train_loss": -6.719691276550293, "global_step": 137756, "epoch": 3279} {"train_loss": -6.798764228820801, "global_step": 137757, "epoch": 3279} {"train_loss": -6.8134026527404785, "global_step": 137758, "epoch": 3279} {"train_loss": -6.747727371397472, "global_step": 137759, "epoch": 3279, "val_loss": 77944.1640625} {"train_loss": -6.8351850509643555, "global_step": 137760, "epoch": 3280} {"train_loss": -6.7281951904296875, "global_step": 137761, "epoch": 3280} {"train_loss": -6.83297061920166, "global_step": 137762, "epoch": 3280} {"train_loss": -6.799802303314209, "global_step": 137763, "epoch": 3280} {"train_loss": -6.6550798416137695, "global_step": 137764, "epoch": 3280} {"train_loss": -6.671579837799072, "global_step": 137765, "epoch": 3280} {"train_loss": -6.909285545349121, "global_step": 137766, "epoch": 3280} {"train_loss": -6.786093711853027, "global_step": 137767, "epoch": 3280} {"train_loss": -6.7330827713012695, "global_step": 137768, "epoch": 3280} {"train_loss": -6.666277885437012, "global_step": 137769, "epoch": 3280} {"train_loss": -6.832132816314697, "global_step": 137770, "epoch": 3280} {"train_loss": -6.693340301513672, "global_step": 137771, "epoch": 3280} {"train_loss": -6.779975414276123, "global_step": 137772, "epoch": 3280} {"train_loss": -6.756349563598633, "global_step": 137773, "epoch": 3280} {"train_loss": -6.791658401489258, "global_step": 137774, "epoch": 3280} {"train_loss": -6.7144598960876465, "global_step": 137775, "epoch": 3280} {"train_loss": -6.827163219451904, "global_step": 137776, "epoch": 3280} {"train_loss": -6.631657600402832, "global_step": 137777, "epoch": 3280} {"train_loss": -6.652800559997559, "global_step": 137778, "epoch": 3280} {"train_loss": -6.785554885864258, "global_step": 137779, "epoch": 3280} {"train_loss": -6.792998313903809, "global_step": 137780, "epoch": 3280} {"train_loss": -6.544008255004883, "global_step": 137781, "epoch": 3280} {"train_loss": -6.727903842926025, "global_step": 137782, "epoch": 3280} {"train_loss": -6.714520454406738, "global_step": 137783, "epoch": 3280} {"train_loss": -6.627033233642578, "global_step": 137784, "epoch": 3280} {"train_loss": -6.613797187805176, "global_step": 137785, "epoch": 3280} {"train_loss": -6.639149188995361, "global_step": 137786, "epoch": 3280} {"train_loss": -6.72132682800293, "global_step": 137787, "epoch": 3280} {"train_loss": -6.54106330871582, "global_step": 137788, "epoch": 3280} {"train_loss": -6.679418563842773, "global_step": 137789, "epoch": 3280} {"train_loss": -6.533638000488281, "global_step": 137790, "epoch": 3280} {"train_loss": -6.708304405212402, "global_step": 137791, "epoch": 3280} {"train_loss": -6.657922267913818, "global_step": 137792, "epoch": 3280} {"train_loss": -6.610852241516113, "global_step": 137793, "epoch": 3280} {"train_loss": -6.560075759887695, "global_step": 137794, "epoch": 3280} {"train_loss": -6.683065891265869, "global_step": 137795, "epoch": 3280} {"train_loss": -6.684994220733643, "global_step": 137796, "epoch": 3280} {"train_loss": -6.704338073730469, "global_step": 137797, "epoch": 3280} {"train_loss": -6.723863124847412, "global_step": 137798, "epoch": 3280} {"train_loss": -6.592751502990723, "global_step": 137799, "epoch": 3280} {"train_loss": -6.756326675415039, "global_step": 137800, "epoch": 3280} {"train_loss": -6.709514220555623, "global_step": 137801, "epoch": 3280, "val_loss": 77907.1171875} {"train_loss": -6.688858985900879, "global_step": 137802, "epoch": 3281} {"train_loss": -6.803061485290527, "global_step": 137803, "epoch": 3281} {"train_loss": -6.703956604003906, "global_step": 137804, "epoch": 3281} {"train_loss": -6.830662727355957, "global_step": 137805, "epoch": 3281} {"train_loss": -6.847933769226074, "global_step": 137806, "epoch": 3281} {"train_loss": -6.883941650390625, "global_step": 137807, "epoch": 3281} {"train_loss": -6.761185646057129, "global_step": 137808, "epoch": 3281} {"train_loss": -6.7901201248168945, "global_step": 137809, "epoch": 3281} {"train_loss": -6.783432483673096, "global_step": 137810, "epoch": 3281} {"train_loss": -6.804388046264648, "global_step": 137811, "epoch": 3281} {"train_loss": -6.764415264129639, "global_step": 137812, "epoch": 3281} {"train_loss": -6.883498191833496, "global_step": 137813, "epoch": 3281} {"train_loss": -6.852090835571289, "global_step": 137814, "epoch": 3281} {"train_loss": -6.719637870788574, "global_step": 137815, "epoch": 3281} {"train_loss": -6.744729042053223, "global_step": 137816, "epoch": 3281} {"train_loss": -6.725702285766602, "global_step": 137817, "epoch": 3281} {"train_loss": -6.836925983428955, "global_step": 137818, "epoch": 3281} {"train_loss": -6.701803207397461, "global_step": 137819, "epoch": 3281} {"train_loss": -6.808450698852539, "global_step": 137820, "epoch": 3281} {"train_loss": -6.6423773765563965, "global_step": 137821, "epoch": 3281} {"train_loss": -6.730859756469727, "global_step": 137822, "epoch": 3281} {"train_loss": -6.840688228607178, "global_step": 137823, "epoch": 3281} {"train_loss": -6.80501651763916, "global_step": 137824, "epoch": 3281} {"train_loss": -6.892582893371582, "global_step": 137825, "epoch": 3281} {"train_loss": -6.800796985626221, "global_step": 137826, "epoch": 3281} {"train_loss": -6.758389472961426, "global_step": 137827, "epoch": 3281} {"train_loss": -6.83131217956543, "global_step": 137828, "epoch": 3281} {"train_loss": -6.716079235076904, "global_step": 137829, "epoch": 3281} {"train_loss": -6.718465805053711, "global_step": 137830, "epoch": 3281} {"train_loss": -6.862757682800293, "global_step": 137831, "epoch": 3281} {"train_loss": -6.813927173614502, "global_step": 137832, "epoch": 3281} {"train_loss": -6.852257251739502, "global_step": 137833, "epoch": 3281} {"train_loss": -6.832841873168945, "global_step": 137834, "epoch": 3281} {"train_loss": -6.803860664367676, "global_step": 137835, "epoch": 3281} {"train_loss": -6.624508857727051, "global_step": 137836, "epoch": 3281} {"train_loss": -6.73636531829834, "global_step": 137837, "epoch": 3281} {"train_loss": -6.864429950714111, "global_step": 137838, "epoch": 3281} {"train_loss": -6.664684772491455, "global_step": 137839, "epoch": 3281} {"train_loss": -6.688567161560059, "global_step": 137840, "epoch": 3281} {"train_loss": -6.832792282104492, "global_step": 137841, "epoch": 3281} {"train_loss": -6.770662784576416, "global_step": 137842, "epoch": 3281} {"train_loss": -6.782422383626302, "global_step": 137843, "epoch": 3281, "val_loss": 77850.46875} {"train_loss": -6.80949068069458, "global_step": 137844, "epoch": 3282} {"train_loss": -6.701485633850098, "global_step": 137845, "epoch": 3282} {"train_loss": -6.828875541687012, "global_step": 137846, "epoch": 3282} {"train_loss": -6.746840953826904, "global_step": 137847, "epoch": 3282} {"train_loss": -6.919271469116211, "global_step": 137848, "epoch": 3282} {"train_loss": -6.820879936218262, "global_step": 137849, "epoch": 3282} {"train_loss": -6.8183698654174805, "global_step": 137850, "epoch": 3282} {"train_loss": -6.784807205200195, "global_step": 137851, "epoch": 3282} {"train_loss": -6.8704514503479, "global_step": 137852, "epoch": 3282} {"train_loss": -6.903939247131348, "global_step": 137853, "epoch": 3282} {"train_loss": -6.800849914550781, "global_step": 137854, "epoch": 3282} {"train_loss": -6.865251064300537, "global_step": 137855, "epoch": 3282} {"train_loss": -6.8678412437438965, "global_step": 137856, "epoch": 3282} {"train_loss": -6.846831798553467, "global_step": 137857, "epoch": 3282} {"train_loss": -6.800136566162109, "global_step": 137858, "epoch": 3282} {"train_loss": -6.697169780731201, "global_step": 137859, "epoch": 3282} {"train_loss": -6.840065002441406, "global_step": 137860, "epoch": 3282} {"train_loss": -6.855626106262207, "global_step": 137861, "epoch": 3282} {"train_loss": -6.887140274047852, "global_step": 137862, "epoch": 3282} {"train_loss": -6.710537910461426, "global_step": 137863, "epoch": 3282} {"train_loss": -6.801329612731934, "global_step": 137864, "epoch": 3282} {"train_loss": -6.735286712646484, "global_step": 137865, "epoch": 3282} {"train_loss": -6.868456840515137, "global_step": 137866, "epoch": 3282} {"train_loss": -6.8090667724609375, "global_step": 137867, "epoch": 3282} {"train_loss": -6.775683403015137, "global_step": 137868, "epoch": 3282} {"train_loss": -6.675624847412109, "global_step": 137869, "epoch": 3282} {"train_loss": -6.537606716156006, "global_step": 137870, "epoch": 3282} {"train_loss": -6.895589828491211, "global_step": 137871, "epoch": 3282} {"train_loss": -6.693323135375977, "global_step": 137872, "epoch": 3282} {"train_loss": -6.807248115539551, "global_step": 137873, "epoch": 3282} {"train_loss": -6.78668212890625, "global_step": 137874, "epoch": 3282} {"train_loss": -6.632174491882324, "global_step": 137875, "epoch": 3282} {"train_loss": -6.7679924964904785, "global_step": 137876, "epoch": 3282} {"train_loss": -6.70037841796875, "global_step": 137877, "epoch": 3282} {"train_loss": -6.656469345092773, "global_step": 137878, "epoch": 3282} {"train_loss": -6.7457404136657715, "global_step": 137879, "epoch": 3282} {"train_loss": -6.703113079071045, "global_step": 137880, "epoch": 3282} {"train_loss": -6.7582197189331055, "global_step": 137881, "epoch": 3282} {"train_loss": -6.714992046356201, "global_step": 137882, "epoch": 3282} {"train_loss": -6.7328572273254395, "global_step": 137883, "epoch": 3282} {"train_loss": -6.697563171386719, "global_step": 137884, "epoch": 3282} {"train_loss": -6.772519100280035, "global_step": 137885, "epoch": 3282, "val_loss": 77776.953125} {"train_loss": -6.721810340881348, "global_step": 137886, "epoch": 3283} {"train_loss": -6.610247611999512, "global_step": 137887, "epoch": 3283} {"train_loss": -6.8072309494018555, "global_step": 137888, "epoch": 3283} {"train_loss": -6.782979488372803, "global_step": 137889, "epoch": 3283} {"train_loss": -6.728515625, "global_step": 137890, "epoch": 3283} {"train_loss": -6.749651908874512, "global_step": 137891, "epoch": 3283} {"train_loss": -6.760003089904785, "global_step": 137892, "epoch": 3283} {"train_loss": -6.7030134201049805, "global_step": 137893, "epoch": 3283} {"train_loss": -6.743695259094238, "global_step": 137894, "epoch": 3283} {"train_loss": -6.636155128479004, "global_step": 137895, "epoch": 3283} {"train_loss": -6.682289123535156, "global_step": 137896, "epoch": 3283} {"train_loss": -6.835082054138184, "global_step": 137897, "epoch": 3283} {"train_loss": -6.693129062652588, "global_step": 137898, "epoch": 3283} {"train_loss": -6.771801948547363, "global_step": 137899, "epoch": 3283} {"train_loss": -6.702315330505371, "global_step": 137900, "epoch": 3283} {"train_loss": -6.804967403411865, "global_step": 137901, "epoch": 3283} {"train_loss": -6.7627458572387695, "global_step": 137902, "epoch": 3283} {"train_loss": -6.6586503982543945, "global_step": 137903, "epoch": 3283} {"train_loss": -6.858137130737305, "global_step": 137904, "epoch": 3283} {"train_loss": -6.793188095092773, "global_step": 137905, "epoch": 3283} {"train_loss": -6.626426696777344, "global_step": 137906, "epoch": 3283} {"train_loss": -6.721222877502441, "global_step": 137907, "epoch": 3283} {"train_loss": -6.700742721557617, "global_step": 137908, "epoch": 3283} {"train_loss": -6.715465068817139, "global_step": 137909, "epoch": 3283} {"train_loss": -6.775507926940918, "global_step": 137910, "epoch": 3283} {"train_loss": -6.779762268066406, "global_step": 137911, "epoch": 3283} {"train_loss": -6.8094587326049805, "global_step": 137912, "epoch": 3283} {"train_loss": -6.781558513641357, "global_step": 137913, "epoch": 3283} {"train_loss": -6.671928405761719, "global_step": 137914, "epoch": 3283} {"train_loss": -6.738859176635742, "global_step": 137915, "epoch": 3283} {"train_loss": -6.815882682800293, "global_step": 137916, "epoch": 3283} {"train_loss": -6.802499294281006, "global_step": 137917, "epoch": 3283} {"train_loss": -6.8398284912109375, "global_step": 137918, "epoch": 3283} {"train_loss": -6.811673164367676, "global_step": 137919, "epoch": 3283} {"train_loss": -6.776139736175537, "global_step": 137920, "epoch": 3283} {"train_loss": -6.80495548248291, "global_step": 137921, "epoch": 3283} {"train_loss": -6.798842906951904, "global_step": 137922, "epoch": 3283} {"train_loss": -6.862961769104004, "global_step": 137923, "epoch": 3283} {"train_loss": -6.724494934082031, "global_step": 137924, "epoch": 3283} {"train_loss": -6.745667934417725, "global_step": 137925, "epoch": 3283} {"train_loss": -6.763556957244873, "global_step": 137926, "epoch": 3283} {"train_loss": -6.753532579966953, "global_step": 137927, "epoch": 3283, "val_loss": 77747.09375} {"train_loss": -6.713551044464111, "global_step": 137928, "epoch": 3284} {"train_loss": -6.814421653747559, "global_step": 137929, "epoch": 3284} {"train_loss": -6.843593597412109, "global_step": 137930, "epoch": 3284} {"train_loss": -6.728597164154053, "global_step": 137931, "epoch": 3284} {"train_loss": -6.798464775085449, "global_step": 137932, "epoch": 3284} {"train_loss": -6.81153678894043, "global_step": 137933, "epoch": 3284} {"train_loss": -6.650745868682861, "global_step": 137934, "epoch": 3284} {"train_loss": -6.74234676361084, "global_step": 137935, "epoch": 3284} {"train_loss": -6.777596473693848, "global_step": 137936, "epoch": 3284} {"train_loss": -6.804171085357666, "global_step": 137937, "epoch": 3284} {"train_loss": -6.549548149108887, "global_step": 137938, "epoch": 3284} {"train_loss": -6.732489109039307, "global_step": 137939, "epoch": 3284} {"train_loss": -6.747830390930176, "global_step": 137940, "epoch": 3284} {"train_loss": -6.715660572052002, "global_step": 137941, "epoch": 3284} {"train_loss": -6.664308547973633, "global_step": 137942, "epoch": 3284} {"train_loss": -6.6895270347595215, "global_step": 137943, "epoch": 3284} {"train_loss": -6.7575860023498535, "global_step": 137944, "epoch": 3284} {"train_loss": -6.839817523956299, "global_step": 137945, "epoch": 3284} {"train_loss": -6.6274309158325195, "global_step": 137946, "epoch": 3284} {"train_loss": -6.73105525970459, "global_step": 137947, "epoch": 3284} {"train_loss": -6.759577751159668, "global_step": 137948, "epoch": 3284} {"train_loss": -6.736081123352051, "global_step": 137949, "epoch": 3284} {"train_loss": -6.753887176513672, "global_step": 137950, "epoch": 3284} {"train_loss": -6.6886467933654785, "global_step": 137951, "epoch": 3284} {"train_loss": -6.665415287017822, "global_step": 137952, "epoch": 3284} {"train_loss": -6.663074016571045, "global_step": 137953, "epoch": 3284} {"train_loss": -6.709662914276123, "global_step": 137954, "epoch": 3284} {"train_loss": -6.714146614074707, "global_step": 137955, "epoch": 3284} {"train_loss": -6.761347770690918, "global_step": 137956, "epoch": 3284} {"train_loss": -6.751153945922852, "global_step": 137957, "epoch": 3284} {"train_loss": -6.7172980308532715, "global_step": 137958, "epoch": 3284} {"train_loss": -6.745278358459473, "global_step": 137959, "epoch": 3284} {"train_loss": -6.798705101013184, "global_step": 137960, "epoch": 3284} {"train_loss": -6.763654708862305, "global_step": 137961, "epoch": 3284} {"train_loss": -6.8204498291015625, "global_step": 137962, "epoch": 3284} {"train_loss": -6.723003387451172, "global_step": 137963, "epoch": 3284} {"train_loss": -6.775974273681641, "global_step": 137964, "epoch": 3284} {"train_loss": -6.777235507965088, "global_step": 137965, "epoch": 3284} {"train_loss": -6.834526062011719, "global_step": 137966, "epoch": 3284} {"train_loss": -6.760596752166748, "global_step": 137967, "epoch": 3284} {"train_loss": -6.887936592102051, "global_step": 137968, "epoch": 3284} {"train_loss": -6.745475065140497, "global_step": 137969, "epoch": 3284, "val_loss": 78086.171875} {"train_loss": -6.829517364501953, "global_step": 137970, "epoch": 3285} {"train_loss": -6.741600036621094, "global_step": 137971, "epoch": 3285} {"train_loss": -6.741913795471191, "global_step": 137972, "epoch": 3285} {"train_loss": -6.760251045227051, "global_step": 137973, "epoch": 3285} {"train_loss": -6.827899932861328, "global_step": 137974, "epoch": 3285} {"train_loss": -6.859025001525879, "global_step": 137975, "epoch": 3285} {"train_loss": -6.751797199249268, "global_step": 137976, "epoch": 3285} {"train_loss": -6.742120742797852, "global_step": 137977, "epoch": 3285} {"train_loss": -6.784763336181641, "global_step": 137978, "epoch": 3285} {"train_loss": -6.923498153686523, "global_step": 137979, "epoch": 3285} {"train_loss": -6.701268196105957, "global_step": 137980, "epoch": 3285} {"train_loss": -6.705874919891357, "global_step": 137981, "epoch": 3285} {"train_loss": -6.741883754730225, "global_step": 137982, "epoch": 3285} {"train_loss": -6.778219223022461, "global_step": 137983, "epoch": 3285} {"train_loss": -6.609935760498047, "global_step": 137984, "epoch": 3285} {"train_loss": -6.696105480194092, "global_step": 137985, "epoch": 3285} {"train_loss": -6.603439807891846, "global_step": 137986, "epoch": 3285} {"train_loss": -6.620363712310791, "global_step": 137987, "epoch": 3285} {"train_loss": -6.6257500648498535, "global_step": 137988, "epoch": 3285} {"train_loss": -6.629940986633301, "global_step": 137989, "epoch": 3285} {"train_loss": -6.73345947265625, "global_step": 137990, "epoch": 3285} {"train_loss": -6.645114421844482, "global_step": 137991, "epoch": 3285} {"train_loss": -6.609865665435791, "global_step": 137992, "epoch": 3285} {"train_loss": -6.677977561950684, "global_step": 137993, "epoch": 3285} {"train_loss": -6.668460845947266, "global_step": 137994, "epoch": 3285} {"train_loss": -6.825943946838379, "global_step": 137995, "epoch": 3285} {"train_loss": -6.796169757843018, "global_step": 137996, "epoch": 3285} {"train_loss": -6.789482116699219, "global_step": 137997, "epoch": 3285} {"train_loss": -6.84158992767334, "global_step": 137998, "epoch": 3285} {"train_loss": -6.653077125549316, "global_step": 137999, "epoch": 3285} {"train_loss": -6.7377705574035645, "global_step": 138000, "epoch": 3285} {"train_loss": -6.835264205932617, "global_step": 138001, "epoch": 3285} {"train_loss": -6.820629119873047, "global_step": 138002, "epoch": 3285} {"train_loss": -6.756093502044678, "global_step": 138003, "epoch": 3285} {"train_loss": -6.809401512145996, "global_step": 138004, "epoch": 3285} {"train_loss": -6.70646858215332, "global_step": 138005, "epoch": 3285} {"train_loss": -6.780833721160889, "global_step": 138006, "epoch": 3285} {"train_loss": -6.758062362670898, "global_step": 138007, "epoch": 3285} {"train_loss": -6.65199613571167, "global_step": 138008, "epoch": 3285} {"train_loss": -6.803319931030273, "global_step": 138009, "epoch": 3285} {"train_loss": -6.782788276672363, "global_step": 138010, "epoch": 3285} {"train_loss": -6.740325723375593, "global_step": 138011, "epoch": 3285, "val_loss": 78048.7109375} {"train_loss": -6.654501438140869, "global_step": 138012, "epoch": 3286} {"train_loss": -6.678095817565918, "global_step": 138013, "epoch": 3286} {"train_loss": -6.601689338684082, "global_step": 138014, "epoch": 3286} {"train_loss": -6.7195539474487305, "global_step": 138015, "epoch": 3286} {"train_loss": -6.670496940612793, "global_step": 138016, "epoch": 3286} {"train_loss": -6.711032390594482, "global_step": 138017, "epoch": 3286} {"train_loss": -6.70960807800293, "global_step": 138018, "epoch": 3286} {"train_loss": -6.7374725341796875, "global_step": 138019, "epoch": 3286} {"train_loss": -6.769321441650391, "global_step": 138020, "epoch": 3286} {"train_loss": -6.825212478637695, "global_step": 138021, "epoch": 3286} {"train_loss": -6.882813930511475, "global_step": 138022, "epoch": 3286} {"train_loss": -6.611120700836182, "global_step": 138023, "epoch": 3286} {"train_loss": -6.899511337280273, "global_step": 138024, "epoch": 3286} {"train_loss": -6.590898036956787, "global_step": 138025, "epoch": 3286} {"train_loss": -6.545215606689453, "global_step": 138026, "epoch": 3286} {"train_loss": -6.738473415374756, "global_step": 138027, "epoch": 3286} {"train_loss": -6.685534477233887, "global_step": 138028, "epoch": 3286} {"train_loss": -6.786357879638672, "global_step": 138029, "epoch": 3286} {"train_loss": -6.736175537109375, "global_step": 138030, "epoch": 3286} {"train_loss": -6.748611927032471, "global_step": 138031, "epoch": 3286} {"train_loss": -6.740629196166992, "global_step": 138032, "epoch": 3286} {"train_loss": -6.5763421058654785, "global_step": 138033, "epoch": 3286} {"train_loss": -6.767292022705078, "global_step": 138034, "epoch": 3286} {"train_loss": -6.771913528442383, "global_step": 138035, "epoch": 3286} {"train_loss": -6.705930709838867, "global_step": 138036, "epoch": 3286} {"train_loss": -6.790752410888672, "global_step": 138037, "epoch": 3286} {"train_loss": -6.721859931945801, "global_step": 138038, "epoch": 3286} {"train_loss": -6.785616874694824, "global_step": 138039, "epoch": 3286} {"train_loss": -6.927242279052734, "global_step": 138040, "epoch": 3286} {"train_loss": -6.929698944091797, "global_step": 138041, "epoch": 3286} {"train_loss": -6.793153762817383, "global_step": 138042, "epoch": 3286} {"train_loss": -6.7944722175598145, "global_step": 138043, "epoch": 3286} {"train_loss": -6.813154220581055, "global_step": 138044, "epoch": 3286} {"train_loss": -6.8139848709106445, "global_step": 138045, "epoch": 3286} {"train_loss": -6.794913291931152, "global_step": 138046, "epoch": 3286} {"train_loss": -6.811474800109863, "global_step": 138047, "epoch": 3286} {"train_loss": -6.67967414855957, "global_step": 138048, "epoch": 3286} {"train_loss": -6.813304901123047, "global_step": 138049, "epoch": 3286} {"train_loss": -6.8582611083984375, "global_step": 138050, "epoch": 3286} {"train_loss": -6.748032093048096, "global_step": 138051, "epoch": 3286} {"train_loss": -6.82363224029541, "global_step": 138052, "epoch": 3286} {"train_loss": -6.753268684659686, "global_step": 138053, "epoch": 3286, "val_loss": 77912.2890625} {"train_loss": -6.794739723205566, "global_step": 138054, "epoch": 3287} {"train_loss": -6.605834007263184, "global_step": 138055, "epoch": 3287} {"train_loss": -6.787210464477539, "global_step": 138056, "epoch": 3287} {"train_loss": -6.77229118347168, "global_step": 138057, "epoch": 3287} {"train_loss": -6.835710525512695, "global_step": 138058, "epoch": 3287} {"train_loss": -6.912745952606201, "global_step": 138059, "epoch": 3287} {"train_loss": -6.629096031188965, "global_step": 138060, "epoch": 3287} {"train_loss": -6.770465850830078, "global_step": 138061, "epoch": 3287} {"train_loss": -6.766386985778809, "global_step": 138062, "epoch": 3287} {"train_loss": -6.598352432250977, "global_step": 138063, "epoch": 3287} {"train_loss": -6.760029315948486, "global_step": 138064, "epoch": 3287} {"train_loss": -6.636260986328125, "global_step": 138065, "epoch": 3287} {"train_loss": -6.774068832397461, "global_step": 138066, "epoch": 3287} {"train_loss": -6.801048278808594, "global_step": 138067, "epoch": 3287} {"train_loss": -6.757803916931152, "global_step": 138068, "epoch": 3287} {"train_loss": -6.75601863861084, "global_step": 138069, "epoch": 3287} {"train_loss": -6.870886325836182, "global_step": 138070, "epoch": 3287} {"train_loss": -6.788250923156738, "global_step": 138071, "epoch": 3287} {"train_loss": -6.637725830078125, "global_step": 138072, "epoch": 3287} {"train_loss": -6.696407318115234, "global_step": 138073, "epoch": 3287} {"train_loss": -6.789941787719727, "global_step": 138074, "epoch": 3287} {"train_loss": -6.712676525115967, "global_step": 138075, "epoch": 3287} {"train_loss": -6.80169153213501, "global_step": 138076, "epoch": 3287} {"train_loss": -6.810454368591309, "global_step": 138077, "epoch": 3287} {"train_loss": -6.763931751251221, "global_step": 138078, "epoch": 3287} {"train_loss": -6.7132158279418945, "global_step": 138079, "epoch": 3287} {"train_loss": -6.720658302307129, "global_step": 138080, "epoch": 3287} {"train_loss": -6.75324010848999, "global_step": 138081, "epoch": 3287} {"train_loss": -6.811725616455078, "global_step": 138082, "epoch": 3287} {"train_loss": -6.664877891540527, "global_step": 138083, "epoch": 3287} {"train_loss": -6.791382789611816, "global_step": 138084, "epoch": 3287} {"train_loss": -6.874330520629883, "global_step": 138085, "epoch": 3287} {"train_loss": -6.734419345855713, "global_step": 138086, "epoch": 3287} {"train_loss": -6.699453353881836, "global_step": 138087, "epoch": 3287} {"train_loss": -6.750730514526367, "global_step": 138088, "epoch": 3287} {"train_loss": -6.711644172668457, "global_step": 138089, "epoch": 3287} {"train_loss": -6.7229814529418945, "global_step": 138090, "epoch": 3287} {"train_loss": -6.803475379943848, "global_step": 138091, "epoch": 3287} {"train_loss": -6.692411422729492, "global_step": 138092, "epoch": 3287} {"train_loss": -6.711544036865234, "global_step": 138093, "epoch": 3287} {"train_loss": -6.833901882171631, "global_step": 138094, "epoch": 3287} {"train_loss": -6.752170108613514, "global_step": 138095, "epoch": 3287, "val_loss": 78040.0546875} {"train_loss": -6.828062057495117, "global_step": 138096, "epoch": 3288} {"train_loss": -6.655684471130371, "global_step": 138097, "epoch": 3288} {"train_loss": -6.84556770324707, "global_step": 138098, "epoch": 3288} {"train_loss": -6.8546857833862305, "global_step": 138099, "epoch": 3288} {"train_loss": -6.692175388336182, "global_step": 138100, "epoch": 3288} {"train_loss": -6.782179832458496, "global_step": 138101, "epoch": 3288} {"train_loss": -6.7567362785339355, "global_step": 138102, "epoch": 3288} {"train_loss": -6.777230262756348, "global_step": 138103, "epoch": 3288} {"train_loss": -6.759579181671143, "global_step": 138104, "epoch": 3288} {"train_loss": -6.669548511505127, "global_step": 138105, "epoch": 3288} {"train_loss": -6.720029830932617, "global_step": 138106, "epoch": 3288} {"train_loss": -6.617617607116699, "global_step": 138107, "epoch": 3288} {"train_loss": -6.665795803070068, "global_step": 138108, "epoch": 3288} {"train_loss": -6.770698070526123, "global_step": 138109, "epoch": 3288} {"train_loss": -6.767642021179199, "global_step": 138110, "epoch": 3288} {"train_loss": -6.661883354187012, "global_step": 138111, "epoch": 3288} {"train_loss": -6.768974304199219, "global_step": 138112, "epoch": 3288} {"train_loss": -6.700103759765625, "global_step": 138113, "epoch": 3288} {"train_loss": -6.6657633781433105, "global_step": 138114, "epoch": 3288} {"train_loss": -6.584360122680664, "global_step": 138115, "epoch": 3288} {"train_loss": -6.749696731567383, "global_step": 138116, "epoch": 3288} {"train_loss": -6.794476509094238, "global_step": 138117, "epoch": 3288} {"train_loss": -6.72514533996582, "global_step": 138118, "epoch": 3288} {"train_loss": -6.8308186531066895, "global_step": 138119, "epoch": 3288} {"train_loss": -6.785253524780273, "global_step": 138120, "epoch": 3288} {"train_loss": -6.810036659240723, "global_step": 138121, "epoch": 3288} {"train_loss": -6.794634819030762, "global_step": 138122, "epoch": 3288} {"train_loss": -6.711950302124023, "global_step": 138123, "epoch": 3288} {"train_loss": -6.691200256347656, "global_step": 138124, "epoch": 3288} {"train_loss": -6.817850112915039, "global_step": 138125, "epoch": 3288} {"train_loss": -6.792017459869385, "global_step": 138126, "epoch": 3288} {"train_loss": -6.775363445281982, "global_step": 138127, "epoch": 3288} {"train_loss": -6.759505271911621, "global_step": 138128, "epoch": 3288} {"train_loss": -6.8040266036987305, "global_step": 138129, "epoch": 3288} {"train_loss": -6.656052112579346, "global_step": 138130, "epoch": 3288} {"train_loss": -6.81417179107666, "global_step": 138131, "epoch": 3288} {"train_loss": -6.804632663726807, "global_step": 138132, "epoch": 3288} {"train_loss": -6.718574523925781, "global_step": 138133, "epoch": 3288} {"train_loss": -6.695135116577148, "global_step": 138134, "epoch": 3288} {"train_loss": -6.755871772766113, "global_step": 138135, "epoch": 3288} {"train_loss": -6.738852500915527, "global_step": 138136, "epoch": 3288} {"train_loss": -6.743053424926031, "global_step": 138137, "epoch": 3288, "val_loss": 78090.4453125} {"train_loss": -6.746881484985352, "global_step": 138138, "epoch": 3289} {"train_loss": -6.677708148956299, "global_step": 138139, "epoch": 3289} {"train_loss": -6.752536296844482, "global_step": 138140, "epoch": 3289} {"train_loss": -6.682657241821289, "global_step": 138141, "epoch": 3289} {"train_loss": -6.784406661987305, "global_step": 138142, "epoch": 3289} {"train_loss": -6.816379547119141, "global_step": 138143, "epoch": 3289} {"train_loss": -6.873495101928711, "global_step": 138144, "epoch": 3289} {"train_loss": -6.681430816650391, "global_step": 138145, "epoch": 3289} {"train_loss": -6.647698402404785, "global_step": 138146, "epoch": 3289} {"train_loss": -6.724124431610107, "global_step": 138147, "epoch": 3289} {"train_loss": -6.887232780456543, "global_step": 138148, "epoch": 3289} {"train_loss": -6.73917818069458, "global_step": 138149, "epoch": 3289} {"train_loss": -6.736333847045898, "global_step": 138150, "epoch": 3289} {"train_loss": -6.755608558654785, "global_step": 138151, "epoch": 3289} {"train_loss": -6.784670829772949, "global_step": 138152, "epoch": 3289} {"train_loss": -6.813871383666992, "global_step": 138153, "epoch": 3289} {"train_loss": -6.808816909790039, "global_step": 138154, "epoch": 3289} {"train_loss": -6.715346813201904, "global_step": 138155, "epoch": 3289} {"train_loss": -6.776941299438477, "global_step": 138156, "epoch": 3289} {"train_loss": -6.7865471839904785, "global_step": 138157, "epoch": 3289} {"train_loss": -6.679872512817383, "global_step": 138158, "epoch": 3289} {"train_loss": -6.807066440582275, "global_step": 138159, "epoch": 3289} {"train_loss": -6.833892822265625, "global_step": 138160, "epoch": 3289} {"train_loss": -6.75258731842041, "global_step": 138161, "epoch": 3289} {"train_loss": -6.691883563995361, "global_step": 138162, "epoch": 3289} {"train_loss": -6.68167781829834, "global_step": 138163, "epoch": 3289} {"train_loss": -6.723138809204102, "global_step": 138164, "epoch": 3289} {"train_loss": -6.708148002624512, "global_step": 138165, "epoch": 3289} {"train_loss": -6.744752883911133, "global_step": 138166, "epoch": 3289} {"train_loss": -6.8016791343688965, "global_step": 138167, "epoch": 3289} {"train_loss": -6.804662227630615, "global_step": 138168, "epoch": 3289} {"train_loss": -6.763220310211182, "global_step": 138169, "epoch": 3289} {"train_loss": -6.76229190826416, "global_step": 138170, "epoch": 3289} {"train_loss": -6.720036506652832, "global_step": 138171, "epoch": 3289} {"train_loss": -6.701345443725586, "global_step": 138172, "epoch": 3289} {"train_loss": -6.690438270568848, "global_step": 138173, "epoch": 3289} {"train_loss": -6.646254539489746, "global_step": 138174, "epoch": 3289} {"train_loss": -6.630835056304932, "global_step": 138175, "epoch": 3289} {"train_loss": -6.7245283126831055, "global_step": 138176, "epoch": 3289} {"train_loss": -6.808295726776123, "global_step": 138177, "epoch": 3289} {"train_loss": -6.669081687927246, "global_step": 138178, "epoch": 3289} {"train_loss": -6.746601002556937, "global_step": 138179, "epoch": 3289, "val_loss": 77741.96875} {"train_loss": -6.754088401794434, "global_step": 138180, "epoch": 3290} {"train_loss": -6.770359039306641, "global_step": 138181, "epoch": 3290} {"train_loss": -6.685344696044922, "global_step": 138182, "epoch": 3290} {"train_loss": -6.770925521850586, "global_step": 138183, "epoch": 3290} {"train_loss": -6.763324737548828, "global_step": 138184, "epoch": 3290} {"train_loss": -6.720623016357422, "global_step": 138185, "epoch": 3290} {"train_loss": -6.779772758483887, "global_step": 138186, "epoch": 3290} {"train_loss": -6.718915939331055, "global_step": 138187, "epoch": 3290} {"train_loss": -6.821375370025635, "global_step": 138188, "epoch": 3290} {"train_loss": -6.8240485191345215, "global_step": 138189, "epoch": 3290} {"train_loss": -6.850825309753418, "global_step": 138190, "epoch": 3290} {"train_loss": -6.769082069396973, "global_step": 138191, "epoch": 3290} {"train_loss": -6.692174434661865, "global_step": 138192, "epoch": 3290} {"train_loss": -6.712601661682129, "global_step": 138193, "epoch": 3290} {"train_loss": -6.664330005645752, "global_step": 138194, "epoch": 3290} {"train_loss": -6.734891414642334, "global_step": 138195, "epoch": 3290} {"train_loss": -6.770197868347168, "global_step": 138196, "epoch": 3290} {"train_loss": -6.744917869567871, "global_step": 138197, "epoch": 3290} {"train_loss": -6.689268589019775, "global_step": 138198, "epoch": 3290} {"train_loss": -6.894447326660156, "global_step": 138199, "epoch": 3290} {"train_loss": -6.802416801452637, "global_step": 138200, "epoch": 3290} {"train_loss": -6.7633256912231445, "global_step": 138201, "epoch": 3290} {"train_loss": -6.704920768737793, "global_step": 138202, "epoch": 3290} {"train_loss": -6.841152191162109, "global_step": 138203, "epoch": 3290} {"train_loss": -6.758249282836914, "global_step": 138204, "epoch": 3290} {"train_loss": -6.689213752746582, "global_step": 138205, "epoch": 3290} {"train_loss": -6.731468200683594, "global_step": 138206, "epoch": 3290} {"train_loss": -6.740693092346191, "global_step": 138207, "epoch": 3290} {"train_loss": -6.658662796020508, "global_step": 138208, "epoch": 3290} {"train_loss": -6.755352020263672, "global_step": 138209, "epoch": 3290} {"train_loss": -6.651810169219971, "global_step": 138210, "epoch": 3290} {"train_loss": -6.6861371994018555, "global_step": 138211, "epoch": 3290} {"train_loss": -6.7963361740112305, "global_step": 138212, "epoch": 3290} {"train_loss": -6.717471599578857, "global_step": 138213, "epoch": 3290} {"train_loss": -6.8012847900390625, "global_step": 138214, "epoch": 3290} {"train_loss": -6.5680694580078125, "global_step": 138215, "epoch": 3290} {"train_loss": -6.684558391571045, "global_step": 138216, "epoch": 3290} {"train_loss": -6.777402400970459, "global_step": 138217, "epoch": 3290} {"train_loss": -6.654815673828125, "global_step": 138218, "epoch": 3290} {"train_loss": -6.806126594543457, "global_step": 138219, "epoch": 3290} {"train_loss": -6.764583587646484, "global_step": 138220, "epoch": 3290} {"train_loss": -6.741102161861601, "global_step": 138221, "epoch": 3290, "val_loss": 77967.6328125} {"train_loss": -6.782426357269287, "global_step": 138222, "epoch": 3291} {"train_loss": -6.629183292388916, "global_step": 138223, "epoch": 3291} {"train_loss": -6.747321128845215, "global_step": 138224, "epoch": 3291} {"train_loss": -6.651551246643066, "global_step": 138225, "epoch": 3291} {"train_loss": -6.578155040740967, "global_step": 138226, "epoch": 3291} {"train_loss": -6.857261657714844, "global_step": 138227, "epoch": 3291} {"train_loss": -6.7410454750061035, "global_step": 138228, "epoch": 3291} {"train_loss": -6.723567962646484, "global_step": 138229, "epoch": 3291} {"train_loss": -6.673123359680176, "global_step": 138230, "epoch": 3291} {"train_loss": -6.702887535095215, "global_step": 138231, "epoch": 3291} {"train_loss": -6.709572792053223, "global_step": 138232, "epoch": 3291} {"train_loss": -6.751039981842041, "global_step": 138233, "epoch": 3291} {"train_loss": -6.648530006408691, "global_step": 138234, "epoch": 3291} {"train_loss": -6.798839092254639, "global_step": 138235, "epoch": 3291} {"train_loss": -6.910769462585449, "global_step": 138236, "epoch": 3291} {"train_loss": -6.817210674285889, "global_step": 138237, "epoch": 3291} {"train_loss": -6.7571306228637695, "global_step": 138238, "epoch": 3291} {"train_loss": -6.690436363220215, "global_step": 138239, "epoch": 3291} {"train_loss": -6.646265506744385, "global_step": 138240, "epoch": 3291} {"train_loss": -6.686349868774414, "global_step": 138241, "epoch": 3291} {"train_loss": -6.707540512084961, "global_step": 138242, "epoch": 3291} {"train_loss": -6.71937894821167, "global_step": 138243, "epoch": 3291} {"train_loss": -6.700638771057129, "global_step": 138244, "epoch": 3291} {"train_loss": -6.700711250305176, "global_step": 138245, "epoch": 3291} {"train_loss": -6.73037052154541, "global_step": 138246, "epoch": 3291} {"train_loss": -6.827795028686523, "global_step": 138247, "epoch": 3291} {"train_loss": -6.745693206787109, "global_step": 138248, "epoch": 3291} {"train_loss": -6.812617301940918, "global_step": 138249, "epoch": 3291} {"train_loss": -6.695548057556152, "global_step": 138250, "epoch": 3291} {"train_loss": -6.65114688873291, "global_step": 138251, "epoch": 3291} {"train_loss": -6.8132476806640625, "global_step": 138252, "epoch": 3291} {"train_loss": -6.659144401550293, "global_step": 138253, "epoch": 3291} {"train_loss": -6.815729141235352, "global_step": 138254, "epoch": 3291} {"train_loss": -6.7442545890808105, "global_step": 138255, "epoch": 3291} {"train_loss": -6.756240367889404, "global_step": 138256, "epoch": 3291} {"train_loss": -6.756341934204102, "global_step": 138257, "epoch": 3291} {"train_loss": -6.751186847686768, "global_step": 138258, "epoch": 3291} {"train_loss": -6.668208599090576, "global_step": 138259, "epoch": 3291} {"train_loss": -6.651656150817871, "global_step": 138260, "epoch": 3291} {"train_loss": -6.737734317779541, "global_step": 138261, "epoch": 3291} {"train_loss": -6.733490943908691, "global_step": 138262, "epoch": 3291} {"train_loss": -6.728552704765683, "global_step": 138263, "epoch": 3291, "val_loss": 78033.015625} {"train_loss": -6.804116249084473, "global_step": 138264, "epoch": 3292} {"train_loss": -6.78572940826416, "global_step": 138265, "epoch": 3292} {"train_loss": -6.820431232452393, "global_step": 138266, "epoch": 3292} {"train_loss": -6.696778774261475, "global_step": 138267, "epoch": 3292} {"train_loss": -6.767451763153076, "global_step": 138268, "epoch": 3292} {"train_loss": -6.774474620819092, "global_step": 138269, "epoch": 3292} {"train_loss": -6.903983116149902, "global_step": 138270, "epoch": 3292} {"train_loss": -6.867408752441406, "global_step": 138271, "epoch": 3292} {"train_loss": -6.764986038208008, "global_step": 138272, "epoch": 3292} {"train_loss": -6.819720268249512, "global_step": 138273, "epoch": 3292} {"train_loss": -6.738801002502441, "global_step": 138274, "epoch": 3292} {"train_loss": -6.748918056488037, "global_step": 138275, "epoch": 3292} {"train_loss": -6.8321614265441895, "global_step": 138276, "epoch": 3292} {"train_loss": -6.7519941329956055, "global_step": 138277, "epoch": 3292} {"train_loss": -6.766041278839111, "global_step": 138278, "epoch": 3292} {"train_loss": -6.71307897567749, "global_step": 138279, "epoch": 3292} {"train_loss": -6.7581987380981445, "global_step": 138280, "epoch": 3292} {"train_loss": -6.70816707611084, "global_step": 138281, "epoch": 3292} {"train_loss": -6.729753494262695, "global_step": 138282, "epoch": 3292} {"train_loss": -6.646457672119141, "global_step": 138283, "epoch": 3292} {"train_loss": -6.742898941040039, "global_step": 138284, "epoch": 3292} {"train_loss": -6.769425868988037, "global_step": 138285, "epoch": 3292} {"train_loss": -6.767343044281006, "global_step": 138286, "epoch": 3292} {"train_loss": -6.855870723724365, "global_step": 138287, "epoch": 3292} {"train_loss": -6.721930503845215, "global_step": 138288, "epoch": 3292} {"train_loss": -6.676362037658691, "global_step": 138289, "epoch": 3292} {"train_loss": -6.7518310546875, "global_step": 138290, "epoch": 3292} {"train_loss": -6.687145233154297, "global_step": 138291, "epoch": 3292} {"train_loss": -6.676239967346191, "global_step": 138292, "epoch": 3292} {"train_loss": -6.801725387573242, "global_step": 138293, "epoch": 3292} {"train_loss": -6.816280364990234, "global_step": 138294, "epoch": 3292} {"train_loss": -6.650730609893799, "global_step": 138295, "epoch": 3292} {"train_loss": -6.745735168457031, "global_step": 138296, "epoch": 3292} {"train_loss": -6.733898162841797, "global_step": 138297, "epoch": 3292} {"train_loss": -6.697404861450195, "global_step": 138298, "epoch": 3292} {"train_loss": -6.778631210327148, "global_step": 138299, "epoch": 3292} {"train_loss": -6.861861228942871, "global_step": 138300, "epoch": 3292} {"train_loss": -6.832592010498047, "global_step": 138301, "epoch": 3292} {"train_loss": -6.73813533782959, "global_step": 138302, "epoch": 3292} {"train_loss": -6.708646774291992, "global_step": 138303, "epoch": 3292} {"train_loss": -6.672386169433594, "global_step": 138304, "epoch": 3292} {"train_loss": -6.759019431613741, "global_step": 138305, "epoch": 3292, "val_loss": 77932.8828125} {"train_loss": -6.70878791809082, "global_step": 138306, "epoch": 3293} {"train_loss": -6.669287204742432, "global_step": 138307, "epoch": 3293} {"train_loss": -6.835566997528076, "global_step": 138308, "epoch": 3293} {"train_loss": -6.710192680358887, "global_step": 138309, "epoch": 3293} {"train_loss": -6.594324111938477, "global_step": 138310, "epoch": 3293} {"train_loss": -6.771731376647949, "global_step": 138311, "epoch": 3293} {"train_loss": -6.792529106140137, "global_step": 138312, "epoch": 3293} {"train_loss": -6.732531547546387, "global_step": 138313, "epoch": 3293} {"train_loss": -6.7622880935668945, "global_step": 138314, "epoch": 3293} {"train_loss": -6.716039180755615, "global_step": 138315, "epoch": 3293} {"train_loss": -6.705615043640137, "global_step": 138316, "epoch": 3293} {"train_loss": -6.810925483703613, "global_step": 138317, "epoch": 3293} {"train_loss": -6.788417339324951, "global_step": 138318, "epoch": 3293} {"train_loss": -6.794665336608887, "global_step": 138319, "epoch": 3293} {"train_loss": -6.6524763107299805, "global_step": 138320, "epoch": 3293} {"train_loss": -6.7223992347717285, "global_step": 138321, "epoch": 3293} {"train_loss": -6.659791946411133, "global_step": 138322, "epoch": 3293} {"train_loss": -6.713675022125244, "global_step": 138323, "epoch": 3293} {"train_loss": -6.693009376525879, "global_step": 138324, "epoch": 3293} {"train_loss": -6.647705078125, "global_step": 138325, "epoch": 3293} {"train_loss": -6.611537933349609, "global_step": 138326, "epoch": 3293} {"train_loss": -6.820243835449219, "global_step": 138327, "epoch": 3293} {"train_loss": -6.782083511352539, "global_step": 138328, "epoch": 3293} {"train_loss": -6.779280662536621, "global_step": 138329, "epoch": 3293} {"train_loss": -6.686413764953613, "global_step": 138330, "epoch": 3293} {"train_loss": -6.80776834487915, "global_step": 138331, "epoch": 3293} {"train_loss": -6.6963911056518555, "global_step": 138332, "epoch": 3293} {"train_loss": -6.691800117492676, "global_step": 138333, "epoch": 3293} {"train_loss": -6.717806816101074, "global_step": 138334, "epoch": 3293} {"train_loss": -6.76588249206543, "global_step": 138335, "epoch": 3293} {"train_loss": -6.628120422363281, "global_step": 138336, "epoch": 3293} {"train_loss": -6.663724422454834, "global_step": 138337, "epoch": 3293} {"train_loss": -6.727653503417969, "global_step": 138338, "epoch": 3293} {"train_loss": -6.765730381011963, "global_step": 138339, "epoch": 3293} {"train_loss": -6.802178382873535, "global_step": 138340, "epoch": 3293} {"train_loss": -6.727659225463867, "global_step": 138341, "epoch": 3293} {"train_loss": -6.692328453063965, "global_step": 138342, "epoch": 3293} {"train_loss": -6.715090274810791, "global_step": 138343, "epoch": 3293} {"train_loss": -6.919029235839844, "global_step": 138344, "epoch": 3293} {"train_loss": -6.740436553955078, "global_step": 138345, "epoch": 3293} {"train_loss": -6.642764091491699, "global_step": 138346, "epoch": 3293} {"train_loss": -6.728986478987194, "global_step": 138347, "epoch": 3293, "val_loss": 78143.515625} {"train_loss": -6.711216926574707, "global_step": 138348, "epoch": 3294} {"train_loss": -6.714659690856934, "global_step": 138349, "epoch": 3294} {"train_loss": -6.674262046813965, "global_step": 138350, "epoch": 3294} {"train_loss": -6.664105415344238, "global_step": 138351, "epoch": 3294} {"train_loss": -6.702732086181641, "global_step": 138352, "epoch": 3294} {"train_loss": -6.716418266296387, "global_step": 138353, "epoch": 3294} {"train_loss": -6.757019996643066, "global_step": 138354, "epoch": 3294} {"train_loss": -6.647855281829834, "global_step": 138355, "epoch": 3294} {"train_loss": -6.797546863555908, "global_step": 138356, "epoch": 3294} {"train_loss": -6.8201165199279785, "global_step": 138357, "epoch": 3294} {"train_loss": -6.628653526306152, "global_step": 138358, "epoch": 3294} {"train_loss": -6.663199424743652, "global_step": 138359, "epoch": 3294} {"train_loss": -6.699838638305664, "global_step": 138360, "epoch": 3294} {"train_loss": -6.502753257751465, "global_step": 138361, "epoch": 3294} {"train_loss": -6.619923114776611, "global_step": 138362, "epoch": 3294} {"train_loss": -6.704166412353516, "global_step": 138363, "epoch": 3294} {"train_loss": -6.565279006958008, "global_step": 138364, "epoch": 3294} {"train_loss": -6.827647686004639, "global_step": 138365, "epoch": 3294} {"train_loss": -6.62276554107666, "global_step": 138366, "epoch": 3294} {"train_loss": -6.699617385864258, "global_step": 138367, "epoch": 3294} {"train_loss": -6.677131652832031, "global_step": 138368, "epoch": 3294} {"train_loss": -6.694913864135742, "global_step": 138369, "epoch": 3294} {"train_loss": -6.635453224182129, "global_step": 138370, "epoch": 3294} {"train_loss": -6.675649166107178, "global_step": 138371, "epoch": 3294} {"train_loss": -6.757688522338867, "global_step": 138372, "epoch": 3294} {"train_loss": -6.682271957397461, "global_step": 138373, "epoch": 3294} {"train_loss": -6.780280113220215, "global_step": 138374, "epoch": 3294} {"train_loss": -6.702709197998047, "global_step": 138375, "epoch": 3294} {"train_loss": -6.729331016540527, "global_step": 138376, "epoch": 3294} {"train_loss": -6.7088751792907715, "global_step": 138377, "epoch": 3294} {"train_loss": -6.655468940734863, "global_step": 138378, "epoch": 3294} {"train_loss": -6.743356704711914, "global_step": 138379, "epoch": 3294} {"train_loss": -6.690117835998535, "global_step": 138380, "epoch": 3294} {"train_loss": -6.770824432373047, "global_step": 138381, "epoch": 3294} {"train_loss": -6.7014665603637695, "global_step": 138382, "epoch": 3294} {"train_loss": -6.774386405944824, "global_step": 138383, "epoch": 3294} {"train_loss": -6.657252311706543, "global_step": 138384, "epoch": 3294} {"train_loss": -6.761553764343262, "global_step": 138385, "epoch": 3294} {"train_loss": -6.758751392364502, "global_step": 138386, "epoch": 3294} {"train_loss": -6.742872714996338, "global_step": 138387, "epoch": 3294} {"train_loss": -6.646219253540039, "global_step": 138388, "epoch": 3294} {"train_loss": -6.702726852326166, "global_step": 138389, "epoch": 3294, "val_loss": 78012.0625} {"train_loss": -6.742609977722168, "global_step": 138390, "epoch": 3295} {"train_loss": -6.765366554260254, "global_step": 138391, "epoch": 3295} {"train_loss": -6.8541154861450195, "global_step": 138392, "epoch": 3295} {"train_loss": -6.78870153427124, "global_step": 138393, "epoch": 3295} {"train_loss": -6.773665428161621, "global_step": 138394, "epoch": 3295} {"train_loss": -6.798661708831787, "global_step": 138395, "epoch": 3295} {"train_loss": -6.6864471435546875, "global_step": 138396, "epoch": 3295} {"train_loss": -6.65210485458374, "global_step": 138397, "epoch": 3295} {"train_loss": -6.785248756408691, "global_step": 138398, "epoch": 3295} {"train_loss": -6.900021553039551, "global_step": 138399, "epoch": 3295} {"train_loss": -6.679086208343506, "global_step": 138400, "epoch": 3295} {"train_loss": -6.766302108764648, "global_step": 138401, "epoch": 3295} {"train_loss": -6.774936676025391, "global_step": 138402, "epoch": 3295} {"train_loss": -6.841177940368652, "global_step": 138403, "epoch": 3295} {"train_loss": -6.736983299255371, "global_step": 138404, "epoch": 3295} {"train_loss": -6.529237270355225, "global_step": 138405, "epoch": 3295} {"train_loss": -6.829291343688965, "global_step": 138406, "epoch": 3295} {"train_loss": -6.817854881286621, "global_step": 138407, "epoch": 3295} {"train_loss": -6.768101692199707, "global_step": 138408, "epoch": 3295} {"train_loss": -6.8310465812683105, "global_step": 138409, "epoch": 3295} {"train_loss": -6.91233491897583, "global_step": 138410, "epoch": 3295} {"train_loss": -6.866165637969971, "global_step": 138411, "epoch": 3295} {"train_loss": -6.759344577789307, "global_step": 138412, "epoch": 3295} {"train_loss": -6.6310601234436035, "global_step": 138413, "epoch": 3295} {"train_loss": -6.661096572875977, "global_step": 138414, "epoch": 3295} {"train_loss": -6.608105659484863, "global_step": 138415, "epoch": 3295} {"train_loss": -6.661615371704102, "global_step": 138416, "epoch": 3295} {"train_loss": -6.646949768066406, "global_step": 138417, "epoch": 3295} {"train_loss": -6.784348964691162, "global_step": 138418, "epoch": 3295} {"train_loss": -6.726027011871338, "global_step": 138419, "epoch": 3295} {"train_loss": -6.633822441101074, "global_step": 138420, "epoch": 3295} {"train_loss": -6.815891265869141, "global_step": 138421, "epoch": 3295} {"train_loss": -6.805633544921875, "global_step": 138422, "epoch": 3295} {"train_loss": -6.65318489074707, "global_step": 138423, "epoch": 3295} {"train_loss": -6.715007305145264, "global_step": 138424, "epoch": 3295} {"train_loss": -6.709776878356934, "global_step": 138425, "epoch": 3295} {"train_loss": -6.678555488586426, "global_step": 138426, "epoch": 3295} {"train_loss": -6.62031364440918, "global_step": 138427, "epoch": 3295} {"train_loss": -6.6818366050720215, "global_step": 138428, "epoch": 3295} {"train_loss": -6.755466938018799, "global_step": 138429, "epoch": 3295} {"train_loss": -6.766368865966797, "global_step": 138430, "epoch": 3295} {"train_loss": -6.739864224479312, "global_step": 138431, "epoch": 3295, "val_loss": 78303.671875} {"train_loss": -6.742959022521973, "global_step": 138432, "epoch": 3296} {"train_loss": -6.831286907196045, "global_step": 138433, "epoch": 3296} {"train_loss": -6.511665344238281, "global_step": 138434, "epoch": 3296} {"train_loss": -6.720837593078613, "global_step": 138435, "epoch": 3296} {"train_loss": -6.842288017272949, "global_step": 138436, "epoch": 3296} {"train_loss": -6.710073471069336, "global_step": 138437, "epoch": 3296} {"train_loss": -6.815284729003906, "global_step": 138438, "epoch": 3296} {"train_loss": -6.780429840087891, "global_step": 138439, "epoch": 3296} {"train_loss": -6.657443046569824, "global_step": 138440, "epoch": 3296} {"train_loss": -6.783525466918945, "global_step": 138441, "epoch": 3296} {"train_loss": -6.958019256591797, "global_step": 138442, "epoch": 3296} {"train_loss": -6.751214981079102, "global_step": 138443, "epoch": 3296} {"train_loss": -6.681699275970459, "global_step": 138444, "epoch": 3296} {"train_loss": -6.727355003356934, "global_step": 138445, "epoch": 3296} {"train_loss": -6.682038307189941, "global_step": 138446, "epoch": 3296} {"train_loss": -6.846070289611816, "global_step": 138447, "epoch": 3296} {"train_loss": -6.898616313934326, "global_step": 138448, "epoch": 3296} {"train_loss": -6.851596832275391, "global_step": 138449, "epoch": 3296} {"train_loss": -6.817225933074951, "global_step": 138450, "epoch": 3296} {"train_loss": -6.853611946105957, "global_step": 138451, "epoch": 3296} {"train_loss": -6.78473424911499, "global_step": 138452, "epoch": 3296} {"train_loss": -6.628857135772705, "global_step": 138453, "epoch": 3296} {"train_loss": -6.838316440582275, "global_step": 138454, "epoch": 3296} {"train_loss": -6.758139133453369, "global_step": 138455, "epoch": 3296} {"train_loss": -6.733933448791504, "global_step": 138456, "epoch": 3296} {"train_loss": -6.757503509521484, "global_step": 138457, "epoch": 3296} {"train_loss": -6.769043922424316, "global_step": 138458, "epoch": 3296} {"train_loss": -6.667438507080078, "global_step": 138459, "epoch": 3296} {"train_loss": -6.732247352600098, "global_step": 138460, "epoch": 3296} {"train_loss": -6.68794059753418, "global_step": 138461, "epoch": 3296} {"train_loss": -6.693314552307129, "global_step": 138462, "epoch": 3296} {"train_loss": -6.9082746505737305, "global_step": 138463, "epoch": 3296} {"train_loss": -6.717700004577637, "global_step": 138464, "epoch": 3296} {"train_loss": -6.7704057693481445, "global_step": 138465, "epoch": 3296} {"train_loss": -6.759200572967529, "global_step": 138466, "epoch": 3296} {"train_loss": -6.673172473907471, "global_step": 138467, "epoch": 3296} {"train_loss": -6.70141077041626, "global_step": 138468, "epoch": 3296} {"train_loss": -6.599985122680664, "global_step": 138469, "epoch": 3296} {"train_loss": -6.738491058349609, "global_step": 138470, "epoch": 3296} {"train_loss": -6.659497261047363, "global_step": 138471, "epoch": 3296} {"train_loss": -6.78997802734375, "global_step": 138472, "epoch": 3296} {"train_loss": -6.750578744070871, "global_step": 138473, "epoch": 3296, "val_loss": 78262.7734375} {"train_loss": -6.700345039367676, "global_step": 138474, "epoch": 3297} {"train_loss": -6.846101760864258, "global_step": 138475, "epoch": 3297} {"train_loss": -6.79811954498291, "global_step": 138476, "epoch": 3297} {"train_loss": -6.67757511138916, "global_step": 138477, "epoch": 3297} {"train_loss": -6.690026760101318, "global_step": 138478, "epoch": 3297} {"train_loss": -6.729206085205078, "global_step": 138479, "epoch": 3297} {"train_loss": -6.814126014709473, "global_step": 138480, "epoch": 3297} {"train_loss": -6.853706359863281, "global_step": 138481, "epoch": 3297} {"train_loss": -6.629519939422607, "global_step": 138482, "epoch": 3297} {"train_loss": -6.696811676025391, "global_step": 138483, "epoch": 3297} {"train_loss": -6.6840739250183105, "global_step": 138484, "epoch": 3297} {"train_loss": -6.5829010009765625, "global_step": 138485, "epoch": 3297} {"train_loss": -6.748836994171143, "global_step": 138486, "epoch": 3297} {"train_loss": -6.582571983337402, "global_step": 138487, "epoch": 3297} {"train_loss": -6.656996726989746, "global_step": 138488, "epoch": 3297} {"train_loss": -6.625913619995117, "global_step": 138489, "epoch": 3297} {"train_loss": -6.550971984863281, "global_step": 138490, "epoch": 3297} {"train_loss": -6.612067222595215, "global_step": 138491, "epoch": 3297} {"train_loss": -6.574962615966797, "global_step": 138492, "epoch": 3297} {"train_loss": -6.712137222290039, "global_step": 138493, "epoch": 3297} {"train_loss": -6.560085773468018, "global_step": 138494, "epoch": 3297} {"train_loss": -6.8154096603393555, "global_step": 138495, "epoch": 3297} {"train_loss": -6.767804145812988, "global_step": 138496, "epoch": 3297} {"train_loss": -6.7743144035339355, "global_step": 138497, "epoch": 3297} {"train_loss": -6.68134880065918, "global_step": 138498, "epoch": 3297} {"train_loss": -6.694910049438477, "global_step": 138499, "epoch": 3297} {"train_loss": -6.667872428894043, "global_step": 138500, "epoch": 3297} {"train_loss": -6.718941688537598, "global_step": 138501, "epoch": 3297} {"train_loss": -6.678681373596191, "global_step": 138502, "epoch": 3297} {"train_loss": -6.805665969848633, "global_step": 138503, "epoch": 3297} {"train_loss": -6.770959854125977, "global_step": 138504, "epoch": 3297} {"train_loss": -6.680456161499023, "global_step": 138505, "epoch": 3297} {"train_loss": -6.702080726623535, "global_step": 138506, "epoch": 3297} {"train_loss": -6.690821647644043, "global_step": 138507, "epoch": 3297} {"train_loss": -6.5835957527160645, "global_step": 138508, "epoch": 3297} {"train_loss": -6.778433799743652, "global_step": 138509, "epoch": 3297} {"train_loss": -6.740099906921387, "global_step": 138510, "epoch": 3297} {"train_loss": -6.846280097961426, "global_step": 138511, "epoch": 3297} {"train_loss": -6.759310722351074, "global_step": 138512, "epoch": 3297} {"train_loss": -6.708742618560791, "global_step": 138513, "epoch": 3297} {"train_loss": -6.710577487945557, "global_step": 138514, "epoch": 3297} {"train_loss": -6.706882578986032, "global_step": 138515, "epoch": 3297, "val_loss": 77850.1640625} {"train_loss": -6.747000694274902, "global_step": 138516, "epoch": 3298} {"train_loss": -6.629452705383301, "global_step": 138517, "epoch": 3298} {"train_loss": -6.754228115081787, "global_step": 138518, "epoch": 3298} {"train_loss": -6.769481182098389, "global_step": 138519, "epoch": 3298} {"train_loss": -6.712324619293213, "global_step": 138520, "epoch": 3298} {"train_loss": -6.896183490753174, "global_step": 138521, "epoch": 3298} {"train_loss": -6.717661380767822, "global_step": 138522, "epoch": 3298} {"train_loss": -6.750035762786865, "global_step": 138523, "epoch": 3298} {"train_loss": -6.753452301025391, "global_step": 138524, "epoch": 3298} {"train_loss": -6.649316310882568, "global_step": 138525, "epoch": 3298} {"train_loss": -6.693991661071777, "global_step": 138526, "epoch": 3298} {"train_loss": -6.73322868347168, "global_step": 138527, "epoch": 3298} {"train_loss": -6.648068428039551, "global_step": 138528, "epoch": 3298} {"train_loss": -6.6530327796936035, "global_step": 138529, "epoch": 3298} {"train_loss": -6.795721530914307, "global_step": 138530, "epoch": 3298} {"train_loss": -6.799330234527588, "global_step": 138531, "epoch": 3298} {"train_loss": -6.812078475952148, "global_step": 138532, "epoch": 3298} {"train_loss": -6.764898300170898, "global_step": 138533, "epoch": 3298} {"train_loss": -6.882590293884277, "global_step": 138534, "epoch": 3298} {"train_loss": -6.762885093688965, "global_step": 138535, "epoch": 3298} {"train_loss": -6.767138481140137, "global_step": 138536, "epoch": 3298} {"train_loss": -6.835212707519531, "global_step": 138537, "epoch": 3298} {"train_loss": -6.739862442016602, "global_step": 138538, "epoch": 3298} {"train_loss": -6.882219314575195, "global_step": 138539, "epoch": 3298} {"train_loss": -6.749438285827637, "global_step": 138540, "epoch": 3298} {"train_loss": -6.630167007446289, "global_step": 138541, "epoch": 3298} {"train_loss": -6.757387161254883, "global_step": 138542, "epoch": 3298} {"train_loss": -6.726469993591309, "global_step": 138543, "epoch": 3298} {"train_loss": -6.833033561706543, "global_step": 138544, "epoch": 3298} {"train_loss": -6.71507453918457, "global_step": 138545, "epoch": 3298} {"train_loss": -6.901500225067139, "global_step": 138546, "epoch": 3298} {"train_loss": -6.677478790283203, "global_step": 138547, "epoch": 3298} {"train_loss": -6.531203269958496, "global_step": 138548, "epoch": 3298} {"train_loss": -6.690184593200684, "global_step": 138549, "epoch": 3298} {"train_loss": -6.688051223754883, "global_step": 138550, "epoch": 3298} {"train_loss": -6.750380039215088, "global_step": 138551, "epoch": 3298} {"train_loss": -6.730473041534424, "global_step": 138552, "epoch": 3298} {"train_loss": -6.7500834465026855, "global_step": 138553, "epoch": 3298} {"train_loss": -6.619831085205078, "global_step": 138554, "epoch": 3298} {"train_loss": -6.78403377532959, "global_step": 138555, "epoch": 3298} {"train_loss": -6.745061874389648, "global_step": 138556, "epoch": 3298} {"train_loss": -6.741149539039249, "global_step": 138557, "epoch": 3298, "val_loss": 77964.2578125} {"train_loss": -6.6517558097839355, "global_step": 138558, "epoch": 3299} {"train_loss": -6.645145416259766, "global_step": 138559, "epoch": 3299} {"train_loss": -6.790643215179443, "global_step": 138560, "epoch": 3299} {"train_loss": -6.774382591247559, "global_step": 138561, "epoch": 3299} {"train_loss": -6.7980780601501465, "global_step": 138562, "epoch": 3299} {"train_loss": -6.697360038757324, "global_step": 138563, "epoch": 3299} {"train_loss": -6.616887092590332, "global_step": 138564, "epoch": 3299} {"train_loss": -6.7538580894470215, "global_step": 138565, "epoch": 3299} {"train_loss": -6.806334495544434, "global_step": 138566, "epoch": 3299} {"train_loss": -6.836242198944092, "global_step": 138567, "epoch": 3299} {"train_loss": -6.693399429321289, "global_step": 138568, "epoch": 3299} {"train_loss": -6.750019073486328, "global_step": 138569, "epoch": 3299} {"train_loss": -6.7122907638549805, "global_step": 138570, "epoch": 3299} {"train_loss": -6.686089515686035, "global_step": 138571, "epoch": 3299} {"train_loss": -6.769396781921387, "global_step": 138572, "epoch": 3299} {"train_loss": -6.7803053855896, "global_step": 138573, "epoch": 3299} {"train_loss": -6.686101913452148, "global_step": 138574, "epoch": 3299} {"train_loss": -6.790694236755371, "global_step": 138575, "epoch": 3299} {"train_loss": -6.610435962677002, "global_step": 138576, "epoch": 3299} {"train_loss": -6.766299247741699, "global_step": 138577, "epoch": 3299} {"train_loss": -6.801427841186523, "global_step": 138578, "epoch": 3299} {"train_loss": -6.756196975708008, "global_step": 138579, "epoch": 3299} {"train_loss": -6.893056392669678, "global_step": 138580, "epoch": 3299} {"train_loss": -6.803849220275879, "global_step": 138581, "epoch": 3299} {"train_loss": -6.712421417236328, "global_step": 138582, "epoch": 3299} {"train_loss": -6.84535026550293, "global_step": 138583, "epoch": 3299} {"train_loss": -6.698479175567627, "global_step": 138584, "epoch": 3299} {"train_loss": -6.85120964050293, "global_step": 138585, "epoch": 3299} {"train_loss": -6.742081642150879, "global_step": 138586, "epoch": 3299} {"train_loss": -6.77094841003418, "global_step": 138587, "epoch": 3299} {"train_loss": -6.823731899261475, "global_step": 138588, "epoch": 3299} {"train_loss": -6.790914535522461, "global_step": 138589, "epoch": 3299} {"train_loss": -6.763704299926758, "global_step": 138590, "epoch": 3299} {"train_loss": -6.808845520019531, "global_step": 138591, "epoch": 3299} {"train_loss": -6.679618835449219, "global_step": 138592, "epoch": 3299} {"train_loss": -6.807685375213623, "global_step": 138593, "epoch": 3299} {"train_loss": -6.813460350036621, "global_step": 138594, "epoch": 3299} {"train_loss": -6.752251625061035, "global_step": 138595, "epoch": 3299} {"train_loss": -6.744695663452148, "global_step": 138596, "epoch": 3299} {"train_loss": -6.772706031799316, "global_step": 138597, "epoch": 3299} {"train_loss": -6.799360752105713, "global_step": 138598, "epoch": 3299} {"train_loss": -6.757421550296602, "global_step": 138599, "epoch": 3299, "val_loss": 77956.6484375} {"train_loss": -6.740955829620361, "global_step": 138600, "epoch": 3300} {"train_loss": -6.725451946258545, "global_step": 138601, "epoch": 3300} {"train_loss": -6.752915382385254, "global_step": 138602, "epoch": 3300} {"train_loss": -6.773006916046143, "global_step": 138603, "epoch": 3300} {"train_loss": -6.798377990722656, "global_step": 138604, "epoch": 3300} {"train_loss": -6.750892162322998, "global_step": 138605, "epoch": 3300} {"train_loss": -6.713846206665039, "global_step": 138606, "epoch": 3300} {"train_loss": -6.7744598388671875, "global_step": 138607, "epoch": 3300} {"train_loss": -6.779779434204102, "global_step": 138608, "epoch": 3300} {"train_loss": -6.799108505249023, "global_step": 138609, "epoch": 3300} {"train_loss": -6.658052921295166, "global_step": 138610, "epoch": 3300} {"train_loss": -6.668251991271973, "global_step": 138611, "epoch": 3300} {"train_loss": -6.8434062004089355, "global_step": 138612, "epoch": 3300} {"train_loss": -6.781296730041504, "global_step": 138613, "epoch": 3300} {"train_loss": -6.708443641662598, "global_step": 138614, "epoch": 3300} {"train_loss": -6.863261699676514, "global_step": 138615, "epoch": 3300} {"train_loss": -6.735654354095459, "global_step": 138616, "epoch": 3300} {"train_loss": -6.781251430511475, "global_step": 138617, "epoch": 3300} {"train_loss": -6.853968143463135, "global_step": 138618, "epoch": 3300} {"train_loss": -6.863044738769531, "global_step": 138619, "epoch": 3300} {"train_loss": -6.758893013000488, "global_step": 138620, "epoch": 3300} {"train_loss": -6.70515251159668, "global_step": 138621, "epoch": 3300} {"train_loss": -6.767346382141113, "global_step": 138622, "epoch": 3300} {"train_loss": -6.7677693367004395, "global_step": 138623, "epoch": 3300} {"train_loss": -6.677209854125977, "global_step": 138624, "epoch": 3300} {"train_loss": -6.667435169219971, "global_step": 138625, "epoch": 3300} {"train_loss": -6.606401443481445, "global_step": 138626, "epoch": 3300} {"train_loss": -6.669985771179199, "global_step": 138627, "epoch": 3300} {"train_loss": -6.714207649230957, "global_step": 138628, "epoch": 3300} {"train_loss": -6.759260177612305, "global_step": 138629, "epoch": 3300} {"train_loss": -6.581638336181641, "global_step": 138630, "epoch": 3300} {"train_loss": -6.7725749015808105, "global_step": 138631, "epoch": 3300} {"train_loss": -6.6687445640563965, "global_step": 138632, "epoch": 3300} {"train_loss": -6.691425323486328, "global_step": 138633, "epoch": 3300} {"train_loss": -6.746802806854248, "global_step": 138634, "epoch": 3300} {"train_loss": -6.606761932373047, "global_step": 138635, "epoch": 3300} {"train_loss": -6.69404935836792, "global_step": 138636, "epoch": 3300} {"train_loss": -6.7791595458984375, "global_step": 138637, "epoch": 3300} {"train_loss": -6.776299953460693, "global_step": 138638, "epoch": 3300} {"train_loss": -6.6465864181518555, "global_step": 138639, "epoch": 3300} {"train_loss": -6.612636566162109, "global_step": 138640, "epoch": 3300} {"train_loss": -6.731872047696795, "global_step": 138641, "epoch": 3300, "train/sim_max_reward_0": 0.4036004581667562, "train/sim_max_reward_1": 0.9568114691260414, "train/sim_max_reward_2": 0.4096465576717757, "train/sim_max_reward_3": 0.15051660801280875, "train/sim_max_reward_4": 0.9061121099276064, "train/sim_max_reward_5": 0.8023803234611017, "test/sim_max_reward_4500000": 0.4289546767054707, "test/sim_max_reward_4500001": 0.8563554068324578, "test/sim_max_reward_4500002": 0.9624068605412246, "test/sim_max_reward_4500003": 0.9203144555509425, "test/sim_max_reward_4500004": 0.16251301971935872, "test/sim_max_reward_4500005": 0.19640968435617584, "test/sim_max_reward_4500006": 0.952365067460506, "test/sim_max_reward_4500007": 0.8748057742944565, "test/sim_max_reward_4500008": 0.9433679129239156, "test/sim_max_reward_4500009": 0.053585315275686045, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9482842571969495, "test/sim_max_reward_4500012": 0.8685028055659657, "test/sim_max_reward_4500013": 0.8100829690597323, "test/sim_max_reward_4500014": 0.46066218090129996, "test/sim_max_reward_4500015": 0.8732529649104716, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.134353576385003, "test/sim_max_reward_4500018": 0.4305171882841655, "test/sim_max_reward_4500019": 0.8483254192816119, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.554478905913255, "test/sim_max_reward_4500022": 0.889495778290337, "test/sim_max_reward_4500023": 0.7546451395014195, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8664543787644894, "test/sim_max_reward_4500026": 0.9011946785460399, "test/sim_max_reward_4500027": 0.6116510892165378, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.11848355955140893, "test/sim_max_reward_4500030": 0.9590176680991711, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9519519854765378, "test/sim_max_reward_4500034": 0.8699704343358408, "test/sim_max_reward_4500035": 0.9250687700244207, "test/sim_max_reward_4500036": 0.4609306589955257, "test/sim_max_reward_4500037": 0.4827543840480155, "test/sim_max_reward_4500038": 0.9095265728391541, "test/sim_max_reward_4500039": 0.992890548764269, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.911994099953924, "test/sim_max_reward_4500042": 0.6401481702177174, "test/sim_max_reward_4500043": 0.8384940532206799, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9065743023615985, "test/sim_max_reward_4500046": 0.8983620083574279, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9244916958040896, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6048445877276817, "test/mean_score": 0.5873661834925352, "val_loss": 77805.8203125} {"train_loss": -6.536891937255859, "global_step": 138642, "epoch": 3301} {"train_loss": -6.612312316894531, "global_step": 138643, "epoch": 3301} {"train_loss": -6.426189422607422, "global_step": 138644, "epoch": 3301} {"train_loss": -6.620862007141113, "global_step": 138645, "epoch": 3301} {"train_loss": -6.536316871643066, "global_step": 138646, "epoch": 3301} {"train_loss": -6.591254234313965, "global_step": 138647, "epoch": 3301} {"train_loss": -6.484973907470703, "global_step": 138648, "epoch": 3301} {"train_loss": -6.656378746032715, "global_step": 138649, "epoch": 3301} {"train_loss": -6.625139236450195, "global_step": 138650, "epoch": 3301} {"train_loss": -6.602303981781006, "global_step": 138651, "epoch": 3301} {"train_loss": -6.717981815338135, "global_step": 138652, "epoch": 3301} {"train_loss": -6.648013114929199, "global_step": 138653, "epoch": 3301} {"train_loss": -6.617806911468506, "global_step": 138654, "epoch": 3301} {"train_loss": -6.690123558044434, "global_step": 138655, "epoch": 3301} {"train_loss": -6.669669151306152, "global_step": 138656, "epoch": 3301} {"train_loss": -6.688902854919434, "global_step": 138657, "epoch": 3301} {"train_loss": -6.747791290283203, "global_step": 138658, "epoch": 3301} {"train_loss": -6.719820976257324, "global_step": 138659, "epoch": 3301} {"train_loss": -6.645071506500244, "global_step": 138660, "epoch": 3301} {"train_loss": -6.6546735763549805, "global_step": 138661, "epoch": 3301} {"train_loss": -6.687684059143066, "global_step": 138662, "epoch": 3301} {"train_loss": -6.751494884490967, "global_step": 138663, "epoch": 3301} {"train_loss": -6.631519794464111, "global_step": 138664, "epoch": 3301} {"train_loss": -6.64096736907959, "global_step": 138665, "epoch": 3301} {"train_loss": -6.7436723709106445, "global_step": 138666, "epoch": 3301} {"train_loss": -6.776019096374512, "global_step": 138667, "epoch": 3301} {"train_loss": -6.762226104736328, "global_step": 138668, "epoch": 3301} {"train_loss": -6.723628997802734, "global_step": 138669, "epoch": 3301} {"train_loss": -6.785211563110352, "global_step": 138670, "epoch": 3301} {"train_loss": -6.868873119354248, "global_step": 138671, "epoch": 3301} {"train_loss": -6.891483306884766, "global_step": 138672, "epoch": 3301} {"train_loss": -6.9316840171813965, "global_step": 138673, "epoch": 3301} {"train_loss": -6.693178176879883, "global_step": 138674, "epoch": 3301} {"train_loss": -6.815284252166748, "global_step": 138675, "epoch": 3301} {"train_loss": -6.841994285583496, "global_step": 138676, "epoch": 3301} {"train_loss": -6.745166778564453, "global_step": 138677, "epoch": 3301} {"train_loss": -6.825599670410156, "global_step": 138678, "epoch": 3301} {"train_loss": -6.909321308135986, "global_step": 138679, "epoch": 3301} {"train_loss": -6.807414531707764, "global_step": 138680, "epoch": 3301} {"train_loss": -6.8858323097229, "global_step": 138681, "epoch": 3301} {"train_loss": -6.71975040435791, "global_step": 138682, "epoch": 3301} {"train_loss": -6.708431573141189, "global_step": 138683, "epoch": 3301, "val_loss": 78036.90625} {"train_loss": -6.877159118652344, "global_step": 138684, "epoch": 3302} {"train_loss": -6.792163848876953, "global_step": 138685, "epoch": 3302} {"train_loss": -6.767971038818359, "global_step": 138686, "epoch": 3302} {"train_loss": -6.7609100341796875, "global_step": 138687, "epoch": 3302} {"train_loss": -6.694248199462891, "global_step": 138688, "epoch": 3302} {"train_loss": -6.715807914733887, "global_step": 138689, "epoch": 3302} {"train_loss": -6.774044513702393, "global_step": 138690, "epoch": 3302} {"train_loss": -6.809368133544922, "global_step": 138691, "epoch": 3302} {"train_loss": -6.784734725952148, "global_step": 138692, "epoch": 3302} {"train_loss": -6.938149452209473, "global_step": 138693, "epoch": 3302} {"train_loss": -6.747012615203857, "global_step": 138694, "epoch": 3302} {"train_loss": -6.805088520050049, "global_step": 138695, "epoch": 3302} {"train_loss": -6.744777679443359, "global_step": 138696, "epoch": 3302} {"train_loss": -6.718746185302734, "global_step": 138697, "epoch": 3302} {"train_loss": -6.8226518630981445, "global_step": 138698, "epoch": 3302} {"train_loss": -6.7546586990356445, "global_step": 138699, "epoch": 3302} {"train_loss": -6.682769775390625, "global_step": 138700, "epoch": 3302} {"train_loss": -6.670778751373291, "global_step": 138701, "epoch": 3302} {"train_loss": -6.67441987991333, "global_step": 138702, "epoch": 3302} {"train_loss": -6.871703147888184, "global_step": 138703, "epoch": 3302} {"train_loss": -6.764654159545898, "global_step": 138704, "epoch": 3302} {"train_loss": -6.728826522827148, "global_step": 138705, "epoch": 3302} {"train_loss": -6.754358291625977, "global_step": 138706, "epoch": 3302} {"train_loss": -6.828306674957275, "global_step": 138707, "epoch": 3302} {"train_loss": -6.6804046630859375, "global_step": 138708, "epoch": 3302} {"train_loss": -6.729981422424316, "global_step": 138709, "epoch": 3302} {"train_loss": -6.816238880157471, "global_step": 138710, "epoch": 3302} {"train_loss": -6.703909873962402, "global_step": 138711, "epoch": 3302} {"train_loss": -6.772067546844482, "global_step": 138712, "epoch": 3302} {"train_loss": -6.7795090675354, "global_step": 138713, "epoch": 3302} {"train_loss": -6.672792434692383, "global_step": 138714, "epoch": 3302} {"train_loss": -6.807565212249756, "global_step": 138715, "epoch": 3302} {"train_loss": -6.802942276000977, "global_step": 138716, "epoch": 3302} {"train_loss": -6.723148345947266, "global_step": 138717, "epoch": 3302} {"train_loss": -6.6686201095581055, "global_step": 138718, "epoch": 3302} {"train_loss": -6.803615093231201, "global_step": 138719, "epoch": 3302} {"train_loss": -6.756702899932861, "global_step": 138720, "epoch": 3302} {"train_loss": -6.742327690124512, "global_step": 138721, "epoch": 3302} {"train_loss": -6.61696720123291, "global_step": 138722, "epoch": 3302} {"train_loss": -6.778099060058594, "global_step": 138723, "epoch": 3302} {"train_loss": -6.663719177246094, "global_step": 138724, "epoch": 3302} {"train_loss": -6.75697880699521, "global_step": 138725, "epoch": 3302, "val_loss": 78086.6796875} {"train_loss": -6.686854839324951, "global_step": 138726, "epoch": 3303} {"train_loss": -6.772369384765625, "global_step": 138727, "epoch": 3303} {"train_loss": -6.844069957733154, "global_step": 138728, "epoch": 3303} {"train_loss": -6.703309059143066, "global_step": 138729, "epoch": 3303} {"train_loss": -6.681700706481934, "global_step": 138730, "epoch": 3303} {"train_loss": -6.79126501083374, "global_step": 138731, "epoch": 3303} {"train_loss": -6.703187465667725, "global_step": 138732, "epoch": 3303} {"train_loss": -6.871034622192383, "global_step": 138733, "epoch": 3303} {"train_loss": -6.818306922912598, "global_step": 138734, "epoch": 3303} {"train_loss": -6.772001266479492, "global_step": 138735, "epoch": 3303} {"train_loss": -6.909158229827881, "global_step": 138736, "epoch": 3303} {"train_loss": -6.7891459465026855, "global_step": 138737, "epoch": 3303} {"train_loss": -6.8309783935546875, "global_step": 138738, "epoch": 3303} {"train_loss": -6.762831687927246, "global_step": 138739, "epoch": 3303} {"train_loss": -6.719353675842285, "global_step": 138740, "epoch": 3303} {"train_loss": -6.732393264770508, "global_step": 138741, "epoch": 3303} {"train_loss": -6.693183422088623, "global_step": 138742, "epoch": 3303} {"train_loss": -6.762296199798584, "global_step": 138743, "epoch": 3303} {"train_loss": -6.678400039672852, "global_step": 138744, "epoch": 3303} {"train_loss": -6.837433815002441, "global_step": 138745, "epoch": 3303} {"train_loss": -6.7768120765686035, "global_step": 138746, "epoch": 3303} {"train_loss": -6.803548336029053, "global_step": 138747, "epoch": 3303} {"train_loss": -6.628238677978516, "global_step": 138748, "epoch": 3303} {"train_loss": -6.748517036437988, "global_step": 138749, "epoch": 3303} {"train_loss": -6.657296180725098, "global_step": 138750, "epoch": 3303} {"train_loss": -6.800544261932373, "global_step": 138751, "epoch": 3303} {"train_loss": -6.806544303894043, "global_step": 138752, "epoch": 3303} {"train_loss": -6.722353935241699, "global_step": 138753, "epoch": 3303} {"train_loss": -6.66590690612793, "global_step": 138754, "epoch": 3303} {"train_loss": -6.771811008453369, "global_step": 138755, "epoch": 3303} {"train_loss": -6.702933311462402, "global_step": 138756, "epoch": 3303} {"train_loss": -6.835141658782959, "global_step": 138757, "epoch": 3303} {"train_loss": -6.848696708679199, "global_step": 138758, "epoch": 3303} {"train_loss": -6.7916741371154785, "global_step": 138759, "epoch": 3303} {"train_loss": -6.892879486083984, "global_step": 138760, "epoch": 3303} {"train_loss": -6.783762454986572, "global_step": 138761, "epoch": 3303} {"train_loss": -6.724994659423828, "global_step": 138762, "epoch": 3303} {"train_loss": -6.76415491104126, "global_step": 138763, "epoch": 3303} {"train_loss": -6.705631256103516, "global_step": 138764, "epoch": 3303} {"train_loss": -6.801980018615723, "global_step": 138765, "epoch": 3303} {"train_loss": -6.710872650146484, "global_step": 138766, "epoch": 3303} {"train_loss": -6.761740116845994, "global_step": 138767, "epoch": 3303, "val_loss": 77890.46875} {"train_loss": -6.777776718139648, "global_step": 138768, "epoch": 3304} {"train_loss": -6.652244567871094, "global_step": 138769, "epoch": 3304} {"train_loss": -6.789751052856445, "global_step": 138770, "epoch": 3304} {"train_loss": -6.801314353942871, "global_step": 138771, "epoch": 3304} {"train_loss": -6.680935382843018, "global_step": 138772, "epoch": 3304} {"train_loss": -6.758644104003906, "global_step": 138773, "epoch": 3304} {"train_loss": -6.78546142578125, "global_step": 138774, "epoch": 3304} {"train_loss": -6.749274730682373, "global_step": 138775, "epoch": 3304} {"train_loss": -6.720740795135498, "global_step": 138776, "epoch": 3304} {"train_loss": -6.710265159606934, "global_step": 138777, "epoch": 3304} {"train_loss": -6.8129987716674805, "global_step": 138778, "epoch": 3304} {"train_loss": -6.731780052185059, "global_step": 138779, "epoch": 3304} {"train_loss": -6.801845073699951, "global_step": 138780, "epoch": 3304} {"train_loss": -6.709316253662109, "global_step": 138781, "epoch": 3304} {"train_loss": -6.773540496826172, "global_step": 138782, "epoch": 3304} {"train_loss": -6.784302711486816, "global_step": 138783, "epoch": 3304} {"train_loss": -6.713461875915527, "global_step": 138784, "epoch": 3304} {"train_loss": -6.730841636657715, "global_step": 138785, "epoch": 3304} {"train_loss": -6.716061592102051, "global_step": 138786, "epoch": 3304} {"train_loss": -6.850627899169922, "global_step": 138787, "epoch": 3304} {"train_loss": -6.826326847076416, "global_step": 138788, "epoch": 3304} {"train_loss": -6.6888227462768555, "global_step": 138789, "epoch": 3304} {"train_loss": -6.665887832641602, "global_step": 138790, "epoch": 3304} {"train_loss": -6.689583778381348, "global_step": 138791, "epoch": 3304} {"train_loss": -6.709726333618164, "global_step": 138792, "epoch": 3304} {"train_loss": -6.605531692504883, "global_step": 138793, "epoch": 3304} {"train_loss": -6.824285507202148, "global_step": 138794, "epoch": 3304} {"train_loss": -6.903261661529541, "global_step": 138795, "epoch": 3304} {"train_loss": -6.748475074768066, "global_step": 138796, "epoch": 3304} {"train_loss": -6.787362098693848, "global_step": 138797, "epoch": 3304} {"train_loss": -6.67230224609375, "global_step": 138798, "epoch": 3304} {"train_loss": -6.705838680267334, "global_step": 138799, "epoch": 3304} {"train_loss": -6.875832557678223, "global_step": 138800, "epoch": 3304} {"train_loss": -6.728178024291992, "global_step": 138801, "epoch": 3304} {"train_loss": -6.733851909637451, "global_step": 138802, "epoch": 3304} {"train_loss": -6.797901630401611, "global_step": 138803, "epoch": 3304} {"train_loss": -6.7267913818359375, "global_step": 138804, "epoch": 3304} {"train_loss": -6.7598876953125, "global_step": 138805, "epoch": 3304} {"train_loss": -6.687908172607422, "global_step": 138806, "epoch": 3304} {"train_loss": -6.749942302703857, "global_step": 138807, "epoch": 3304} {"train_loss": -6.736205577850342, "global_step": 138808, "epoch": 3304} {"train_loss": -6.748297963823591, "global_step": 138809, "epoch": 3304, "val_loss": 77889.9375} {"train_loss": -6.7463884353637695, "global_step": 138810, "epoch": 3305} {"train_loss": -6.618760108947754, "global_step": 138811, "epoch": 3305} {"train_loss": -6.720853805541992, "global_step": 138812, "epoch": 3305} {"train_loss": -6.710484504699707, "global_step": 138813, "epoch": 3305} {"train_loss": -6.675343990325928, "global_step": 138814, "epoch": 3305} {"train_loss": -6.760475158691406, "global_step": 138815, "epoch": 3305} {"train_loss": -6.841986656188965, "global_step": 138816, "epoch": 3305} {"train_loss": -6.737120151519775, "global_step": 138817, "epoch": 3305} {"train_loss": -6.817263126373291, "global_step": 138818, "epoch": 3305} {"train_loss": -6.77548360824585, "global_step": 138819, "epoch": 3305} {"train_loss": -6.776018142700195, "global_step": 138820, "epoch": 3305} {"train_loss": -6.804566383361816, "global_step": 138821, "epoch": 3305} {"train_loss": -6.832375526428223, "global_step": 138822, "epoch": 3305} {"train_loss": -6.785793304443359, "global_step": 138823, "epoch": 3305} {"train_loss": -6.687933921813965, "global_step": 138824, "epoch": 3305} {"train_loss": -6.682730674743652, "global_step": 138825, "epoch": 3305} {"train_loss": -6.887136936187744, "global_step": 138826, "epoch": 3305} {"train_loss": -6.755276203155518, "global_step": 138827, "epoch": 3305} {"train_loss": -6.786642551422119, "global_step": 138828, "epoch": 3305} {"train_loss": -6.73832368850708, "global_step": 138829, "epoch": 3305} {"train_loss": -6.743265628814697, "global_step": 138830, "epoch": 3305} {"train_loss": -6.807025909423828, "global_step": 138831, "epoch": 3305} {"train_loss": -6.803247928619385, "global_step": 138832, "epoch": 3305} {"train_loss": -6.75655460357666, "global_step": 138833, "epoch": 3305} {"train_loss": -6.740269660949707, "global_step": 138834, "epoch": 3305} {"train_loss": -6.833768844604492, "global_step": 138835, "epoch": 3305} {"train_loss": -6.827659606933594, "global_step": 138836, "epoch": 3305} {"train_loss": -6.739363670349121, "global_step": 138837, "epoch": 3305} {"train_loss": -6.83655309677124, "global_step": 138838, "epoch": 3305} {"train_loss": -6.759239196777344, "global_step": 138839, "epoch": 3305} {"train_loss": -6.774813652038574, "global_step": 138840, "epoch": 3305} {"train_loss": -6.848618030548096, "global_step": 138841, "epoch": 3305} {"train_loss": -6.7764081954956055, "global_step": 138842, "epoch": 3305} {"train_loss": -6.791351318359375, "global_step": 138843, "epoch": 3305} {"train_loss": -6.7734246253967285, "global_step": 138844, "epoch": 3305} {"train_loss": -6.823988437652588, "global_step": 138845, "epoch": 3305} {"train_loss": -6.774641036987305, "global_step": 138846, "epoch": 3305} {"train_loss": -6.731632232666016, "global_step": 138847, "epoch": 3305} {"train_loss": -6.753133773803711, "global_step": 138848, "epoch": 3305} {"train_loss": -6.866279602050781, "global_step": 138849, "epoch": 3305} {"train_loss": -6.69924783706665, "global_step": 138850, "epoch": 3305} {"train_loss": -6.768968411854336, "global_step": 138851, "epoch": 3305, "val_loss": 77918.8046875} {"train_loss": -6.892119884490967, "global_step": 138852, "epoch": 3306} {"train_loss": -6.738063812255859, "global_step": 138853, "epoch": 3306} {"train_loss": -6.831880569458008, "global_step": 138854, "epoch": 3306} {"train_loss": -6.82972526550293, "global_step": 138855, "epoch": 3306} {"train_loss": -6.843238830566406, "global_step": 138856, "epoch": 3306} {"train_loss": -6.652707099914551, "global_step": 138857, "epoch": 3306} {"train_loss": -6.839792251586914, "global_step": 138858, "epoch": 3306} {"train_loss": -6.7406134605407715, "global_step": 138859, "epoch": 3306} {"train_loss": -6.83359432220459, "global_step": 138860, "epoch": 3306} {"train_loss": -6.763583183288574, "global_step": 138861, "epoch": 3306} {"train_loss": -6.822922706604004, "global_step": 138862, "epoch": 3306} {"train_loss": -6.858487129211426, "global_step": 138863, "epoch": 3306} {"train_loss": -6.814682483673096, "global_step": 138864, "epoch": 3306} {"train_loss": -6.7262420654296875, "global_step": 138865, "epoch": 3306} {"train_loss": -6.752204895019531, "global_step": 138866, "epoch": 3306} {"train_loss": -6.790343284606934, "global_step": 138867, "epoch": 3306} {"train_loss": -6.800848960876465, "global_step": 138868, "epoch": 3306} {"train_loss": -6.9082770347595215, "global_step": 138869, "epoch": 3306} {"train_loss": -6.755222320556641, "global_step": 138870, "epoch": 3306} {"train_loss": -6.747506141662598, "global_step": 138871, "epoch": 3306} {"train_loss": -6.836684703826904, "global_step": 138872, "epoch": 3306} {"train_loss": -6.773571968078613, "global_step": 138873, "epoch": 3306} {"train_loss": -6.756800651550293, "global_step": 138874, "epoch": 3306} {"train_loss": -6.811191558837891, "global_step": 138875, "epoch": 3306} {"train_loss": -6.8254170417785645, "global_step": 138876, "epoch": 3306} {"train_loss": -6.624086380004883, "global_step": 138877, "epoch": 3306} {"train_loss": -6.771075248718262, "global_step": 138878, "epoch": 3306} {"train_loss": -6.941340446472168, "global_step": 138879, "epoch": 3306} {"train_loss": -6.779465675354004, "global_step": 138880, "epoch": 3306} {"train_loss": -6.783045768737793, "global_step": 138881, "epoch": 3306} {"train_loss": -7.010140419006348, "global_step": 138882, "epoch": 3306} {"train_loss": -6.854061126708984, "global_step": 138883, "epoch": 3306} {"train_loss": -6.886099338531494, "global_step": 138884, "epoch": 3306} {"train_loss": -6.845975399017334, "global_step": 138885, "epoch": 3306} {"train_loss": -6.880270957946777, "global_step": 138886, "epoch": 3306} {"train_loss": -6.829483985900879, "global_step": 138887, "epoch": 3306} {"train_loss": -6.727268218994141, "global_step": 138888, "epoch": 3306} {"train_loss": -6.802407264709473, "global_step": 138889, "epoch": 3306} {"train_loss": -6.697831153869629, "global_step": 138890, "epoch": 3306} {"train_loss": -6.6192545890808105, "global_step": 138891, "epoch": 3306} {"train_loss": -6.75152587890625, "global_step": 138892, "epoch": 3306} {"train_loss": -6.797239496594384, "global_step": 138893, "epoch": 3306, "val_loss": 78129.671875} {"train_loss": -6.944120407104492, "global_step": 138894, "epoch": 3307} {"train_loss": -6.748002529144287, "global_step": 138895, "epoch": 3307} {"train_loss": -6.842569828033447, "global_step": 138896, "epoch": 3307} {"train_loss": -6.730690002441406, "global_step": 138897, "epoch": 3307} {"train_loss": -6.757570743560791, "global_step": 138898, "epoch": 3307} {"train_loss": -6.817360877990723, "global_step": 138899, "epoch": 3307} {"train_loss": -6.6715006828308105, "global_step": 138900, "epoch": 3307} {"train_loss": -6.744563102722168, "global_step": 138901, "epoch": 3307} {"train_loss": -6.657083988189697, "global_step": 138902, "epoch": 3307} {"train_loss": -6.652868270874023, "global_step": 138903, "epoch": 3307} {"train_loss": -6.733608245849609, "global_step": 138904, "epoch": 3307} {"train_loss": -6.713149070739746, "global_step": 138905, "epoch": 3307} {"train_loss": -6.800173759460449, "global_step": 138906, "epoch": 3307} {"train_loss": -6.7244391441345215, "global_step": 138907, "epoch": 3307} {"train_loss": -6.730475902557373, "global_step": 138908, "epoch": 3307} {"train_loss": -6.706052303314209, "global_step": 138909, "epoch": 3307} {"train_loss": -6.734100341796875, "global_step": 138910, "epoch": 3307} {"train_loss": -6.729011058807373, "global_step": 138911, "epoch": 3307} {"train_loss": -6.631691932678223, "global_step": 138912, "epoch": 3307} {"train_loss": -6.741612434387207, "global_step": 138913, "epoch": 3307} {"train_loss": -6.729797840118408, "global_step": 138914, "epoch": 3307} {"train_loss": -6.662786960601807, "global_step": 138915, "epoch": 3307} {"train_loss": -6.649802207946777, "global_step": 138916, "epoch": 3307} {"train_loss": -6.832858562469482, "global_step": 138917, "epoch": 3307} {"train_loss": -6.61478328704834, "global_step": 138918, "epoch": 3307} {"train_loss": -6.668291091918945, "global_step": 138919, "epoch": 3307} {"train_loss": -6.725140571594238, "global_step": 138920, "epoch": 3307} {"train_loss": -6.636725425720215, "global_step": 138921, "epoch": 3307} {"train_loss": -6.731445789337158, "global_step": 138922, "epoch": 3307} {"train_loss": -6.633450508117676, "global_step": 138923, "epoch": 3307} {"train_loss": -6.69484806060791, "global_step": 138924, "epoch": 3307} {"train_loss": -6.630885601043701, "global_step": 138925, "epoch": 3307} {"train_loss": -6.767482757568359, "global_step": 138926, "epoch": 3307} {"train_loss": -6.623836994171143, "global_step": 138927, "epoch": 3307} {"train_loss": -6.7372355461120605, "global_step": 138928, "epoch": 3307} {"train_loss": -6.8636474609375, "global_step": 138929, "epoch": 3307} {"train_loss": -6.633272171020508, "global_step": 138930, "epoch": 3307} {"train_loss": -6.698225021362305, "global_step": 138931, "epoch": 3307} {"train_loss": -6.626616477966309, "global_step": 138932, "epoch": 3307} {"train_loss": -6.7383623123168945, "global_step": 138933, "epoch": 3307} {"train_loss": -6.715454578399658, "global_step": 138934, "epoch": 3307} {"train_loss": -6.715566930316744, "global_step": 138935, "epoch": 3307, "val_loss": 77789.96875} {"train_loss": -6.736622333526611, "global_step": 138936, "epoch": 3308} {"train_loss": -6.8156023025512695, "global_step": 138937, "epoch": 3308} {"train_loss": -6.767791748046875, "global_step": 138938, "epoch": 3308} {"train_loss": -6.595754623413086, "global_step": 138939, "epoch": 3308} {"train_loss": -6.598458766937256, "global_step": 138940, "epoch": 3308} {"train_loss": -6.80665397644043, "global_step": 138941, "epoch": 3308} {"train_loss": -6.613321304321289, "global_step": 138942, "epoch": 3308} {"train_loss": -6.857308387756348, "global_step": 138943, "epoch": 3308} {"train_loss": -6.668294906616211, "global_step": 138944, "epoch": 3308} {"train_loss": -6.722318172454834, "global_step": 138945, "epoch": 3308} {"train_loss": -6.825884819030762, "global_step": 138946, "epoch": 3308} {"train_loss": -6.7420549392700195, "global_step": 138947, "epoch": 3308} {"train_loss": -6.691648006439209, "global_step": 138948, "epoch": 3308} {"train_loss": -6.761951446533203, "global_step": 138949, "epoch": 3308} {"train_loss": -6.809743881225586, "global_step": 138950, "epoch": 3308} {"train_loss": -6.646409511566162, "global_step": 138951, "epoch": 3308} {"train_loss": -6.76886510848999, "global_step": 138952, "epoch": 3308} {"train_loss": -6.886077880859375, "global_step": 138953, "epoch": 3308} {"train_loss": -6.673048496246338, "global_step": 138954, "epoch": 3308} {"train_loss": -6.839422225952148, "global_step": 138955, "epoch": 3308} {"train_loss": -6.841152191162109, "global_step": 138956, "epoch": 3308} {"train_loss": -6.786141872406006, "global_step": 138957, "epoch": 3308} {"train_loss": -6.743010997772217, "global_step": 138958, "epoch": 3308} {"train_loss": -6.656796455383301, "global_step": 138959, "epoch": 3308} {"train_loss": -6.758029460906982, "global_step": 138960, "epoch": 3308} {"train_loss": -6.751978874206543, "global_step": 138961, "epoch": 3308} {"train_loss": -6.846249580383301, "global_step": 138962, "epoch": 3308} {"train_loss": -6.75888729095459, "global_step": 138963, "epoch": 3308} {"train_loss": -6.8036699295043945, "global_step": 138964, "epoch": 3308} {"train_loss": -6.730598449707031, "global_step": 138965, "epoch": 3308} {"train_loss": -6.92046594619751, "global_step": 138966, "epoch": 3308} {"train_loss": -6.746068954467773, "global_step": 138967, "epoch": 3308} {"train_loss": -6.709578990936279, "global_step": 138968, "epoch": 3308} {"train_loss": -6.838151931762695, "global_step": 138969, "epoch": 3308} {"train_loss": -6.760833740234375, "global_step": 138970, "epoch": 3308} {"train_loss": -6.75444221496582, "global_step": 138971, "epoch": 3308} {"train_loss": -6.855480670928955, "global_step": 138972, "epoch": 3308} {"train_loss": -6.800498962402344, "global_step": 138973, "epoch": 3308} {"train_loss": -6.857240200042725, "global_step": 138974, "epoch": 3308} {"train_loss": -6.854363441467285, "global_step": 138975, "epoch": 3308} {"train_loss": -6.771248817443848, "global_step": 138976, "epoch": 3308} {"train_loss": -6.76828560375032, "global_step": 138977, "epoch": 3308, "val_loss": 77934.984375} {"train_loss": -6.937446117401123, "global_step": 138978, "epoch": 3309} {"train_loss": -6.907312393188477, "global_step": 138979, "epoch": 3309} {"train_loss": -6.839216232299805, "global_step": 138980, "epoch": 3309} {"train_loss": -6.846452713012695, "global_step": 138981, "epoch": 3309} {"train_loss": -6.796947002410889, "global_step": 138982, "epoch": 3309} {"train_loss": -6.741302967071533, "global_step": 138983, "epoch": 3309} {"train_loss": -6.7340850830078125, "global_step": 138984, "epoch": 3309} {"train_loss": -6.821356773376465, "global_step": 138985, "epoch": 3309} {"train_loss": -6.741980075836182, "global_step": 138986, "epoch": 3309} {"train_loss": -6.7748517990112305, "global_step": 138987, "epoch": 3309} {"train_loss": -6.780744552612305, "global_step": 138988, "epoch": 3309} {"train_loss": -6.784067630767822, "global_step": 138989, "epoch": 3309} {"train_loss": -6.684818267822266, "global_step": 138990, "epoch": 3309} {"train_loss": -6.5756402015686035, "global_step": 138991, "epoch": 3309} {"train_loss": -6.633111000061035, "global_step": 138992, "epoch": 3309} {"train_loss": -6.75485897064209, "global_step": 138993, "epoch": 3309} {"train_loss": -6.67706298828125, "global_step": 138994, "epoch": 3309} {"train_loss": -6.646126747131348, "global_step": 138995, "epoch": 3309} {"train_loss": -6.748498439788818, "global_step": 138996, "epoch": 3309} {"train_loss": -6.644632339477539, "global_step": 138997, "epoch": 3309} {"train_loss": -6.809083938598633, "global_step": 138998, "epoch": 3309} {"train_loss": -6.745055198669434, "global_step": 138999, "epoch": 3309} {"train_loss": -6.674065589904785, "global_step": 139000, "epoch": 3309} {"train_loss": -6.723751068115234, "global_step": 139001, "epoch": 3309} {"train_loss": -6.88210916519165, "global_step": 139002, "epoch": 3309} {"train_loss": -6.696382999420166, "global_step": 139003, "epoch": 3309} {"train_loss": -6.768701076507568, "global_step": 139004, "epoch": 3309} {"train_loss": -6.761099338531494, "global_step": 139005, "epoch": 3309} {"train_loss": -6.691428184509277, "global_step": 139006, "epoch": 3309} {"train_loss": -6.801620960235596, "global_step": 139007, "epoch": 3309} {"train_loss": -6.81126594543457, "global_step": 139008, "epoch": 3309} {"train_loss": -6.846658706665039, "global_step": 139009, "epoch": 3309} {"train_loss": -6.746251106262207, "global_step": 139010, "epoch": 3309} {"train_loss": -6.77341365814209, "global_step": 139011, "epoch": 3309} {"train_loss": -6.906159400939941, "global_step": 139012, "epoch": 3309} {"train_loss": -6.656286716461182, "global_step": 139013, "epoch": 3309} {"train_loss": -6.806078910827637, "global_step": 139014, "epoch": 3309} {"train_loss": -6.7507476806640625, "global_step": 139015, "epoch": 3309} {"train_loss": -6.810514450073242, "global_step": 139016, "epoch": 3309} {"train_loss": -6.775196075439453, "global_step": 139017, "epoch": 3309} {"train_loss": -6.774490833282471, "global_step": 139018, "epoch": 3309} {"train_loss": -6.763244220188686, "global_step": 139019, "epoch": 3309, "val_loss": 77932.203125} {"train_loss": -6.790731906890869, "global_step": 139020, "epoch": 3310} {"train_loss": -6.880522727966309, "global_step": 139021, "epoch": 3310} {"train_loss": -6.76008415222168, "global_step": 139022, "epoch": 3310} {"train_loss": -6.809576034545898, "global_step": 139023, "epoch": 3310} {"train_loss": -6.765066623687744, "global_step": 139024, "epoch": 3310} {"train_loss": -6.819165229797363, "global_step": 139025, "epoch": 3310} {"train_loss": -6.784214973449707, "global_step": 139026, "epoch": 3310} {"train_loss": -6.776634216308594, "global_step": 139027, "epoch": 3310} {"train_loss": -6.754025936126709, "global_step": 139028, "epoch": 3310} {"train_loss": -6.808860778808594, "global_step": 139029, "epoch": 3310} {"train_loss": -6.809643745422363, "global_step": 139030, "epoch": 3310} {"train_loss": -6.878725051879883, "global_step": 139031, "epoch": 3310} {"train_loss": -6.820891380310059, "global_step": 139032, "epoch": 3310} {"train_loss": -6.783167839050293, "global_step": 139033, "epoch": 3310} {"train_loss": -6.837767601013184, "global_step": 139034, "epoch": 3310} {"train_loss": -6.821920394897461, "global_step": 139035, "epoch": 3310} {"train_loss": -6.832043170928955, "global_step": 139036, "epoch": 3310} {"train_loss": -6.775022029876709, "global_step": 139037, "epoch": 3310} {"train_loss": -6.775773048400879, "global_step": 139038, "epoch": 3310} {"train_loss": -6.881248950958252, "global_step": 139039, "epoch": 3310} {"train_loss": -6.7810564041137695, "global_step": 139040, "epoch": 3310} {"train_loss": -6.769035816192627, "global_step": 139041, "epoch": 3310} {"train_loss": -6.757296562194824, "global_step": 139042, "epoch": 3310} {"train_loss": -6.75199031829834, "global_step": 139043, "epoch": 3310} {"train_loss": -6.8444366455078125, "global_step": 139044, "epoch": 3310} {"train_loss": -6.814280033111572, "global_step": 139045, "epoch": 3310} {"train_loss": -6.782320022583008, "global_step": 139046, "epoch": 3310} {"train_loss": -6.916886329650879, "global_step": 139047, "epoch": 3310} {"train_loss": -6.586660385131836, "global_step": 139048, "epoch": 3310} {"train_loss": -6.681765556335449, "global_step": 139049, "epoch": 3310} {"train_loss": -6.664399147033691, "global_step": 139050, "epoch": 3310} {"train_loss": -6.390491485595703, "global_step": 139051, "epoch": 3310} {"train_loss": -6.651082515716553, "global_step": 139052, "epoch": 3310} {"train_loss": -6.635769844055176, "global_step": 139053, "epoch": 3310} {"train_loss": -6.630724906921387, "global_step": 139054, "epoch": 3310} {"train_loss": -6.785552978515625, "global_step": 139055, "epoch": 3310} {"train_loss": -6.614927291870117, "global_step": 139056, "epoch": 3310} {"train_loss": -6.6581807136535645, "global_step": 139057, "epoch": 3310} {"train_loss": -6.725135803222656, "global_step": 139058, "epoch": 3310} {"train_loss": -6.516454219818115, "global_step": 139059, "epoch": 3310} {"train_loss": -6.599759578704834, "global_step": 139060, "epoch": 3310} {"train_loss": -6.743279354912894, "global_step": 139061, "epoch": 3310, "val_loss": 78032.84375} {"train_loss": -6.706789016723633, "global_step": 139062, "epoch": 3311} {"train_loss": -6.542184829711914, "global_step": 139063, "epoch": 3311} {"train_loss": -6.512514114379883, "global_step": 139064, "epoch": 3311} {"train_loss": -6.72299861907959, "global_step": 139065, "epoch": 3311} {"train_loss": -6.624510765075684, "global_step": 139066, "epoch": 3311} {"train_loss": -6.5324554443359375, "global_step": 139067, "epoch": 3311} {"train_loss": -6.543564796447754, "global_step": 139068, "epoch": 3311} {"train_loss": -6.659709930419922, "global_step": 139069, "epoch": 3311} {"train_loss": -6.586570739746094, "global_step": 139070, "epoch": 3311} {"train_loss": -6.560314178466797, "global_step": 139071, "epoch": 3311} {"train_loss": -6.719989776611328, "global_step": 139072, "epoch": 3311} {"train_loss": -6.6917195320129395, "global_step": 139073, "epoch": 3311} {"train_loss": -6.567132949829102, "global_step": 139074, "epoch": 3311} {"train_loss": -6.473690032958984, "global_step": 139075, "epoch": 3311} {"train_loss": -6.684576511383057, "global_step": 139076, "epoch": 3311} {"train_loss": -6.647866249084473, "global_step": 139077, "epoch": 3311} {"train_loss": -6.761990070343018, "global_step": 139078, "epoch": 3311} {"train_loss": -6.632119178771973, "global_step": 139079, "epoch": 3311} {"train_loss": -6.682995319366455, "global_step": 139080, "epoch": 3311} {"train_loss": -6.714729309082031, "global_step": 139081, "epoch": 3311} {"train_loss": -6.606716156005859, "global_step": 139082, "epoch": 3311} {"train_loss": -6.744704723358154, "global_step": 139083, "epoch": 3311} {"train_loss": -6.5728759765625, "global_step": 139084, "epoch": 3311} {"train_loss": -6.654689311981201, "global_step": 139085, "epoch": 3311} {"train_loss": -6.637005805969238, "global_step": 139086, "epoch": 3311} {"train_loss": -6.668102264404297, "global_step": 139087, "epoch": 3311} {"train_loss": -6.608092308044434, "global_step": 139088, "epoch": 3311} {"train_loss": -6.648216724395752, "global_step": 139089, "epoch": 3311} {"train_loss": -6.758452892303467, "global_step": 139090, "epoch": 3311} {"train_loss": -6.663734436035156, "global_step": 139091, "epoch": 3311} {"train_loss": -6.676314353942871, "global_step": 139092, "epoch": 3311} {"train_loss": -6.7837677001953125, "global_step": 139093, "epoch": 3311} {"train_loss": -6.741145133972168, "global_step": 139094, "epoch": 3311} {"train_loss": -6.786166191101074, "global_step": 139095, "epoch": 3311} {"train_loss": -6.680808067321777, "global_step": 139096, "epoch": 3311} {"train_loss": -6.853128433227539, "global_step": 139097, "epoch": 3311} {"train_loss": -6.698139190673828, "global_step": 139098, "epoch": 3311} {"train_loss": -6.701456069946289, "global_step": 139099, "epoch": 3311} {"train_loss": -6.743836402893066, "global_step": 139100, "epoch": 3311} {"train_loss": -6.737188816070557, "global_step": 139101, "epoch": 3311} {"train_loss": -6.707283020019531, "global_step": 139102, "epoch": 3311} {"train_loss": -6.665197678974697, "global_step": 139103, "epoch": 3311, "val_loss": 77938.234375} {"train_loss": -6.780704498291016, "global_step": 139104, "epoch": 3312} {"train_loss": -6.720156192779541, "global_step": 139105, "epoch": 3312} {"train_loss": -6.693029403686523, "global_step": 139106, "epoch": 3312} {"train_loss": -6.75039529800415, "global_step": 139107, "epoch": 3312} {"train_loss": -6.838608741760254, "global_step": 139108, "epoch": 3312} {"train_loss": -6.834529399871826, "global_step": 139109, "epoch": 3312} {"train_loss": -6.6631011962890625, "global_step": 139110, "epoch": 3312} {"train_loss": -6.79979133605957, "global_step": 139111, "epoch": 3312} {"train_loss": -6.832700729370117, "global_step": 139112, "epoch": 3312} {"train_loss": -6.6626458168029785, "global_step": 139113, "epoch": 3312} {"train_loss": -6.8072190284729, "global_step": 139114, "epoch": 3312} {"train_loss": -6.812481880187988, "global_step": 139115, "epoch": 3312} {"train_loss": -6.811922073364258, "global_step": 139116, "epoch": 3312} {"train_loss": -6.658703804016113, "global_step": 139117, "epoch": 3312} {"train_loss": -6.772701740264893, "global_step": 139118, "epoch": 3312} {"train_loss": -6.730240345001221, "global_step": 139119, "epoch": 3312} {"train_loss": -6.808086395263672, "global_step": 139120, "epoch": 3312} {"train_loss": -6.785801887512207, "global_step": 139121, "epoch": 3312} {"train_loss": -6.801945686340332, "global_step": 139122, "epoch": 3312} {"train_loss": -6.806804656982422, "global_step": 139123, "epoch": 3312} {"train_loss": -6.758640289306641, "global_step": 139124, "epoch": 3312} {"train_loss": -6.634718894958496, "global_step": 139125, "epoch": 3312} {"train_loss": -6.76871395111084, "global_step": 139126, "epoch": 3312} {"train_loss": -6.607692718505859, "global_step": 139127, "epoch": 3312} {"train_loss": -6.678806304931641, "global_step": 139128, "epoch": 3312} {"train_loss": -6.669549942016602, "global_step": 139129, "epoch": 3312} {"train_loss": -6.635850429534912, "global_step": 139130, "epoch": 3312} {"train_loss": -6.634969234466553, "global_step": 139131, "epoch": 3312} {"train_loss": -6.772519111633301, "global_step": 139132, "epoch": 3312} {"train_loss": -6.680466651916504, "global_step": 139133, "epoch": 3312} {"train_loss": -6.608818054199219, "global_step": 139134, "epoch": 3312} {"train_loss": -6.676115989685059, "global_step": 139135, "epoch": 3312} {"train_loss": -6.716817855834961, "global_step": 139136, "epoch": 3312} {"train_loss": -6.752470970153809, "global_step": 139137, "epoch": 3312} {"train_loss": -6.703593730926514, "global_step": 139138, "epoch": 3312} {"train_loss": -6.569530487060547, "global_step": 139139, "epoch": 3312} {"train_loss": -6.829130172729492, "global_step": 139140, "epoch": 3312} {"train_loss": -6.581993103027344, "global_step": 139141, "epoch": 3312} {"train_loss": -6.694413185119629, "global_step": 139142, "epoch": 3312} {"train_loss": -6.545487880706787, "global_step": 139143, "epoch": 3312} {"train_loss": -6.641509056091309, "global_step": 139144, "epoch": 3312} {"train_loss": -6.72079923039391, "global_step": 139145, "epoch": 3312, "val_loss": 78216.265625} {"train_loss": -6.624390602111816, "global_step": 139146, "epoch": 3313} {"train_loss": -6.689042091369629, "global_step": 139147, "epoch": 3313} {"train_loss": -6.677402496337891, "global_step": 139148, "epoch": 3313} {"train_loss": -6.727475643157959, "global_step": 139149, "epoch": 3313} {"train_loss": -6.701811790466309, "global_step": 139150, "epoch": 3313} {"train_loss": -6.73341178894043, "global_step": 139151, "epoch": 3313} {"train_loss": -6.577829360961914, "global_step": 139152, "epoch": 3313} {"train_loss": -6.825141906738281, "global_step": 139153, "epoch": 3313} {"train_loss": -6.693709373474121, "global_step": 139154, "epoch": 3313} {"train_loss": -6.725134372711182, "global_step": 139155, "epoch": 3313} {"train_loss": -6.620640277862549, "global_step": 139156, "epoch": 3313} {"train_loss": -6.737526893615723, "global_step": 139157, "epoch": 3313} {"train_loss": -6.722037315368652, "global_step": 139158, "epoch": 3313} {"train_loss": -6.699987888336182, "global_step": 139159, "epoch": 3313} {"train_loss": -6.703951358795166, "global_step": 139160, "epoch": 3313} {"train_loss": -6.690982818603516, "global_step": 139161, "epoch": 3313} {"train_loss": -6.851462364196777, "global_step": 139162, "epoch": 3313} {"train_loss": -6.804134845733643, "global_step": 139163, "epoch": 3313} {"train_loss": -6.80424690246582, "global_step": 139164, "epoch": 3313} {"train_loss": -6.816760063171387, "global_step": 139165, "epoch": 3313} {"train_loss": -6.728529930114746, "global_step": 139166, "epoch": 3313} {"train_loss": -6.851563930511475, "global_step": 139167, "epoch": 3313} {"train_loss": -6.795252799987793, "global_step": 139168, "epoch": 3313} {"train_loss": -6.669395446777344, "global_step": 139169, "epoch": 3313} {"train_loss": -6.833211421966553, "global_step": 139170, "epoch": 3313} {"train_loss": -6.6901397705078125, "global_step": 139171, "epoch": 3313} {"train_loss": -6.800178527832031, "global_step": 139172, "epoch": 3313} {"train_loss": -6.77419376373291, "global_step": 139173, "epoch": 3313} {"train_loss": -6.841656684875488, "global_step": 139174, "epoch": 3313} {"train_loss": -6.7132697105407715, "global_step": 139175, "epoch": 3313} {"train_loss": -6.656460762023926, "global_step": 139176, "epoch": 3313} {"train_loss": -6.773432731628418, "global_step": 139177, "epoch": 3313} {"train_loss": -6.665342807769775, "global_step": 139178, "epoch": 3313} {"train_loss": -6.656511306762695, "global_step": 139179, "epoch": 3313} {"train_loss": -6.765913009643555, "global_step": 139180, "epoch": 3313} {"train_loss": -6.7165679931640625, "global_step": 139181, "epoch": 3313} {"train_loss": -6.841999530792236, "global_step": 139182, "epoch": 3313} {"train_loss": -6.808966636657715, "global_step": 139183, "epoch": 3313} {"train_loss": -6.646903038024902, "global_step": 139184, "epoch": 3313} {"train_loss": -6.752718925476074, "global_step": 139185, "epoch": 3313} {"train_loss": -6.858180999755859, "global_step": 139186, "epoch": 3313} {"train_loss": -6.737256186349051, "global_step": 139187, "epoch": 3313, "val_loss": 77837.5078125} {"train_loss": -6.770672798156738, "global_step": 139188, "epoch": 3314} {"train_loss": -6.740220069885254, "global_step": 139189, "epoch": 3314} {"train_loss": -6.888286113739014, "global_step": 139190, "epoch": 3314} {"train_loss": -6.791212558746338, "global_step": 139191, "epoch": 3314} {"train_loss": -6.835251808166504, "global_step": 139192, "epoch": 3314} {"train_loss": -6.701499938964844, "global_step": 139193, "epoch": 3314} {"train_loss": -6.896843910217285, "global_step": 139194, "epoch": 3314} {"train_loss": -6.837819576263428, "global_step": 139195, "epoch": 3314} {"train_loss": -6.799675464630127, "global_step": 139196, "epoch": 3314} {"train_loss": -6.925688743591309, "global_step": 139197, "epoch": 3314} {"train_loss": -6.76782751083374, "global_step": 139198, "epoch": 3314} {"train_loss": -6.695940971374512, "global_step": 139199, "epoch": 3314} {"train_loss": -6.918200492858887, "global_step": 139200, "epoch": 3314} {"train_loss": -6.829063415527344, "global_step": 139201, "epoch": 3314} {"train_loss": -6.864257335662842, "global_step": 139202, "epoch": 3314} {"train_loss": -6.861681938171387, "global_step": 139203, "epoch": 3314} {"train_loss": -6.785271167755127, "global_step": 139204, "epoch": 3314} {"train_loss": -6.827216625213623, "global_step": 139205, "epoch": 3314} {"train_loss": -6.8121232986450195, "global_step": 139206, "epoch": 3314} {"train_loss": -6.877962589263916, "global_step": 139207, "epoch": 3314} {"train_loss": -6.892368316650391, "global_step": 139208, "epoch": 3314} {"train_loss": -6.876076698303223, "global_step": 139209, "epoch": 3314} {"train_loss": -6.778335094451904, "global_step": 139210, "epoch": 3314} {"train_loss": -6.8153300285339355, "global_step": 139211, "epoch": 3314} {"train_loss": -6.590778350830078, "global_step": 139212, "epoch": 3314} {"train_loss": -6.787205696105957, "global_step": 139213, "epoch": 3314} {"train_loss": -6.741928577423096, "global_step": 139214, "epoch": 3314} {"train_loss": -6.657589435577393, "global_step": 139215, "epoch": 3314} {"train_loss": -6.688448905944824, "global_step": 139216, "epoch": 3314} {"train_loss": -6.646397590637207, "global_step": 139217, "epoch": 3314} {"train_loss": -6.655375003814697, "global_step": 139218, "epoch": 3314} {"train_loss": -6.710847854614258, "global_step": 139219, "epoch": 3314} {"train_loss": -6.595418930053711, "global_step": 139220, "epoch": 3314} {"train_loss": -6.60241174697876, "global_step": 139221, "epoch": 3314} {"train_loss": -6.731841087341309, "global_step": 139222, "epoch": 3314} {"train_loss": -6.639482498168945, "global_step": 139223, "epoch": 3314} {"train_loss": -6.757953643798828, "global_step": 139224, "epoch": 3314} {"train_loss": -6.543935775756836, "global_step": 139225, "epoch": 3314} {"train_loss": -6.752501010894775, "global_step": 139226, "epoch": 3314} {"train_loss": -6.652671813964844, "global_step": 139227, "epoch": 3314} {"train_loss": -6.593393325805664, "global_step": 139228, "epoch": 3314} {"train_loss": -6.756718374433971, "global_step": 139229, "epoch": 3314, "val_loss": 77811.7421875} {"train_loss": -6.689723014831543, "global_step": 139230, "epoch": 3315} {"train_loss": -6.68894100189209, "global_step": 139231, "epoch": 3315} {"train_loss": -6.58913516998291, "global_step": 139232, "epoch": 3315} {"train_loss": -6.608676910400391, "global_step": 139233, "epoch": 3315} {"train_loss": -6.680184841156006, "global_step": 139234, "epoch": 3315} {"train_loss": -6.725098609924316, "global_step": 139235, "epoch": 3315} {"train_loss": -6.605259895324707, "global_step": 139236, "epoch": 3315} {"train_loss": -6.644536018371582, "global_step": 139237, "epoch": 3315} {"train_loss": -6.648695945739746, "global_step": 139238, "epoch": 3315} {"train_loss": -6.679640769958496, "global_step": 139239, "epoch": 3315} {"train_loss": -6.80271577835083, "global_step": 139240, "epoch": 3315} {"train_loss": -6.634879112243652, "global_step": 139241, "epoch": 3315} {"train_loss": -6.694161415100098, "global_step": 139242, "epoch": 3315} {"train_loss": -6.730864524841309, "global_step": 139243, "epoch": 3315} {"train_loss": -6.662830352783203, "global_step": 139244, "epoch": 3315} {"train_loss": -6.836044788360596, "global_step": 139245, "epoch": 3315} {"train_loss": -6.7231221199035645, "global_step": 139246, "epoch": 3315} {"train_loss": -6.749417304992676, "global_step": 139247, "epoch": 3315} {"train_loss": -6.709171772003174, "global_step": 139248, "epoch": 3315} {"train_loss": -6.730431079864502, "global_step": 139249, "epoch": 3315} {"train_loss": -6.607723236083984, "global_step": 139250, "epoch": 3315} {"train_loss": -6.729935169219971, "global_step": 139251, "epoch": 3315} {"train_loss": -6.590695381164551, "global_step": 139252, "epoch": 3315} {"train_loss": -6.637648582458496, "global_step": 139253, "epoch": 3315} {"train_loss": -6.695379734039307, "global_step": 139254, "epoch": 3315} {"train_loss": -6.801467418670654, "global_step": 139255, "epoch": 3315} {"train_loss": -6.645298004150391, "global_step": 139256, "epoch": 3315} {"train_loss": -6.720308303833008, "global_step": 139257, "epoch": 3315} {"train_loss": -6.700891971588135, "global_step": 139258, "epoch": 3315} {"train_loss": -6.690035343170166, "global_step": 139259, "epoch": 3315} {"train_loss": -6.737961769104004, "global_step": 139260, "epoch": 3315} {"train_loss": -6.766173362731934, "global_step": 139261, "epoch": 3315} {"train_loss": -6.838858604431152, "global_step": 139262, "epoch": 3315} {"train_loss": -6.722568511962891, "global_step": 139263, "epoch": 3315} {"train_loss": -6.682035446166992, "global_step": 139264, "epoch": 3315} {"train_loss": -6.716280937194824, "global_step": 139265, "epoch": 3315} {"train_loss": -6.772820472717285, "global_step": 139266, "epoch": 3315} {"train_loss": -6.775540351867676, "global_step": 139267, "epoch": 3315} {"train_loss": -6.851398468017578, "global_step": 139268, "epoch": 3315} {"train_loss": -6.802183151245117, "global_step": 139269, "epoch": 3315} {"train_loss": -6.7869062423706055, "global_step": 139270, "epoch": 3315} {"train_loss": -6.70972922870091, "global_step": 139271, "epoch": 3315, "val_loss": 78110.734375} {"train_loss": -6.6884002685546875, "global_step": 139272, "epoch": 3316} {"train_loss": -6.636209011077881, "global_step": 139273, "epoch": 3316} {"train_loss": -6.775750160217285, "global_step": 139274, "epoch": 3316} {"train_loss": -6.774816513061523, "global_step": 139275, "epoch": 3316} {"train_loss": -6.755253791809082, "global_step": 139276, "epoch": 3316} {"train_loss": -6.8391547203063965, "global_step": 139277, "epoch": 3316} {"train_loss": -6.643612861633301, "global_step": 139278, "epoch": 3316} {"train_loss": -6.760758399963379, "global_step": 139279, "epoch": 3316} {"train_loss": -6.772422790527344, "global_step": 139280, "epoch": 3316} {"train_loss": -6.884305953979492, "global_step": 139281, "epoch": 3316} {"train_loss": -6.857301712036133, "global_step": 139282, "epoch": 3316} {"train_loss": -6.89381742477417, "global_step": 139283, "epoch": 3316} {"train_loss": -6.900647163391113, "global_step": 139284, "epoch": 3316} {"train_loss": -6.844396114349365, "global_step": 139285, "epoch": 3316} {"train_loss": -6.829072952270508, "global_step": 139286, "epoch": 3316} {"train_loss": -6.824725151062012, "global_step": 139287, "epoch": 3316} {"train_loss": -6.918702602386475, "global_step": 139288, "epoch": 3316} {"train_loss": -6.767452239990234, "global_step": 139289, "epoch": 3316} {"train_loss": -6.846713066101074, "global_step": 139290, "epoch": 3316} {"train_loss": -6.773597240447998, "global_step": 139291, "epoch": 3316} {"train_loss": -6.816469192504883, "global_step": 139292, "epoch": 3316} {"train_loss": -6.79451847076416, "global_step": 139293, "epoch": 3316} {"train_loss": -6.85948371887207, "global_step": 139294, "epoch": 3316} {"train_loss": -6.936374187469482, "global_step": 139295, "epoch": 3316} {"train_loss": -6.84572172164917, "global_step": 139296, "epoch": 3316} {"train_loss": -6.880615234375, "global_step": 139297, "epoch": 3316} {"train_loss": -6.752167224884033, "global_step": 139298, "epoch": 3316} {"train_loss": -6.780709743499756, "global_step": 139299, "epoch": 3316} {"train_loss": -6.83197546005249, "global_step": 139300, "epoch": 3316} {"train_loss": -6.680365562438965, "global_step": 139301, "epoch": 3316} {"train_loss": -6.777715682983398, "global_step": 139302, "epoch": 3316} {"train_loss": -6.777194976806641, "global_step": 139303, "epoch": 3316} {"train_loss": -6.714856147766113, "global_step": 139304, "epoch": 3316} {"train_loss": -6.653894424438477, "global_step": 139305, "epoch": 3316} {"train_loss": -6.751437187194824, "global_step": 139306, "epoch": 3316} {"train_loss": -6.590686798095703, "global_step": 139307, "epoch": 3316} {"train_loss": -6.610373497009277, "global_step": 139308, "epoch": 3316} {"train_loss": -6.637659072875977, "global_step": 139309, "epoch": 3316} {"train_loss": -6.664333820343018, "global_step": 139310, "epoch": 3316} {"train_loss": -6.792601585388184, "global_step": 139311, "epoch": 3316} {"train_loss": -6.690643787384033, "global_step": 139312, "epoch": 3316} {"train_loss": -6.775051877612159, "global_step": 139313, "epoch": 3316, "val_loss": 78289.2578125} {"train_loss": -6.768894195556641, "global_step": 139314, "epoch": 3317} {"train_loss": -6.672817230224609, "global_step": 139315, "epoch": 3317} {"train_loss": -6.681425094604492, "global_step": 139316, "epoch": 3317} {"train_loss": -6.732503890991211, "global_step": 139317, "epoch": 3317} {"train_loss": -6.600645065307617, "global_step": 139318, "epoch": 3317} {"train_loss": -6.722532272338867, "global_step": 139319, "epoch": 3317} {"train_loss": -6.747125625610352, "global_step": 139320, "epoch": 3317} {"train_loss": -6.566431045532227, "global_step": 139321, "epoch": 3317} {"train_loss": -6.746516227722168, "global_step": 139322, "epoch": 3317} {"train_loss": -6.650299072265625, "global_step": 139323, "epoch": 3317} {"train_loss": -6.675166130065918, "global_step": 139324, "epoch": 3317} {"train_loss": -6.653833389282227, "global_step": 139325, "epoch": 3317} {"train_loss": -6.8459553718566895, "global_step": 139326, "epoch": 3317} {"train_loss": -6.670726776123047, "global_step": 139327, "epoch": 3317} {"train_loss": -6.708829402923584, "global_step": 139328, "epoch": 3317} {"train_loss": -6.6489105224609375, "global_step": 139329, "epoch": 3317} {"train_loss": -6.659574508666992, "global_step": 139330, "epoch": 3317} {"train_loss": -6.605413436889648, "global_step": 139331, "epoch": 3317} {"train_loss": -6.654305458068848, "global_step": 139332, "epoch": 3317} {"train_loss": -6.5937724113464355, "global_step": 139333, "epoch": 3317} {"train_loss": -6.603370666503906, "global_step": 139334, "epoch": 3317} {"train_loss": -6.717089653015137, "global_step": 139335, "epoch": 3317} {"train_loss": -6.565105438232422, "global_step": 139336, "epoch": 3317} {"train_loss": -6.7606401443481445, "global_step": 139337, "epoch": 3317} {"train_loss": -6.807429313659668, "global_step": 139338, "epoch": 3317} {"train_loss": -6.663172245025635, "global_step": 139339, "epoch": 3317} {"train_loss": -6.706101417541504, "global_step": 139340, "epoch": 3317} {"train_loss": -6.657336235046387, "global_step": 139341, "epoch": 3317} {"train_loss": -6.739105701446533, "global_step": 139342, "epoch": 3317} {"train_loss": -6.6884965896606445, "global_step": 139343, "epoch": 3317} {"train_loss": -6.797293186187744, "global_step": 139344, "epoch": 3317} {"train_loss": -6.6968278884887695, "global_step": 139345, "epoch": 3317} {"train_loss": -6.774358749389648, "global_step": 139346, "epoch": 3317} {"train_loss": -6.791736125946045, "global_step": 139347, "epoch": 3317} {"train_loss": -6.792265892028809, "global_step": 139348, "epoch": 3317} {"train_loss": -6.738986968994141, "global_step": 139349, "epoch": 3317} {"train_loss": -6.706454277038574, "global_step": 139350, "epoch": 3317} {"train_loss": -6.696972370147705, "global_step": 139351, "epoch": 3317} {"train_loss": -6.821410179138184, "global_step": 139352, "epoch": 3317} {"train_loss": -6.741156578063965, "global_step": 139353, "epoch": 3317} {"train_loss": -6.743535041809082, "global_step": 139354, "epoch": 3317} {"train_loss": -6.7059063003176735, "global_step": 139355, "epoch": 3317, "val_loss": 78180.6640625} {"train_loss": -6.738749980926514, "global_step": 139356, "epoch": 3318} {"train_loss": -6.885761260986328, "global_step": 139357, "epoch": 3318} {"train_loss": -6.754262447357178, "global_step": 139358, "epoch": 3318} {"train_loss": -6.730812072753906, "global_step": 139359, "epoch": 3318} {"train_loss": -6.897548675537109, "global_step": 139360, "epoch": 3318} {"train_loss": -6.861192226409912, "global_step": 139361, "epoch": 3318} {"train_loss": -6.682159423828125, "global_step": 139362, "epoch": 3318} {"train_loss": -6.842113018035889, "global_step": 139363, "epoch": 3318} {"train_loss": -6.845770835876465, "global_step": 139364, "epoch": 3318} {"train_loss": -6.855094909667969, "global_step": 139365, "epoch": 3318} {"train_loss": -6.714461803436279, "global_step": 139366, "epoch": 3318} {"train_loss": -6.8296709060668945, "global_step": 139367, "epoch": 3318} {"train_loss": -6.778865814208984, "global_step": 139368, "epoch": 3318} {"train_loss": -6.7217206954956055, "global_step": 139369, "epoch": 3318} {"train_loss": -6.655104160308838, "global_step": 139370, "epoch": 3318} {"train_loss": -6.817055702209473, "global_step": 139371, "epoch": 3318} {"train_loss": -6.693248748779297, "global_step": 139372, "epoch": 3318} {"train_loss": -6.685250759124756, "global_step": 139373, "epoch": 3318} {"train_loss": -6.854832649230957, "global_step": 139374, "epoch": 3318} {"train_loss": -6.692348480224609, "global_step": 139375, "epoch": 3318} {"train_loss": -6.770230293273926, "global_step": 139376, "epoch": 3318} {"train_loss": -6.6233720779418945, "global_step": 139377, "epoch": 3318} {"train_loss": -6.712562084197998, "global_step": 139378, "epoch": 3318} {"train_loss": -6.741587162017822, "global_step": 139379, "epoch": 3318} {"train_loss": -6.703794956207275, "global_step": 139380, "epoch": 3318} {"train_loss": -6.76863956451416, "global_step": 139381, "epoch": 3318} {"train_loss": -6.642343521118164, "global_step": 139382, "epoch": 3318} {"train_loss": -6.764364242553711, "global_step": 139383, "epoch": 3318} {"train_loss": -6.627697944641113, "global_step": 139384, "epoch": 3318} {"train_loss": -6.7499566078186035, "global_step": 139385, "epoch": 3318} {"train_loss": -6.7810516357421875, "global_step": 139386, "epoch": 3318} {"train_loss": -6.791133403778076, "global_step": 139387, "epoch": 3318} {"train_loss": -6.884824752807617, "global_step": 139388, "epoch": 3318} {"train_loss": -6.7674407958984375, "global_step": 139389, "epoch": 3318} {"train_loss": -6.650895118713379, "global_step": 139390, "epoch": 3318} {"train_loss": -6.83543062210083, "global_step": 139391, "epoch": 3318} {"train_loss": -6.599475383758545, "global_step": 139392, "epoch": 3318} {"train_loss": -6.688991546630859, "global_step": 139393, "epoch": 3318} {"train_loss": -6.781569957733154, "global_step": 139394, "epoch": 3318} {"train_loss": -6.68146276473999, "global_step": 139395, "epoch": 3318} {"train_loss": -6.6799468994140625, "global_step": 139396, "epoch": 3318} {"train_loss": -6.748781102044242, "global_step": 139397, "epoch": 3318, "val_loss": 78025.9765625} {"train_loss": -6.809426784515381, "global_step": 139398, "epoch": 3319} {"train_loss": -6.678749084472656, "global_step": 139399, "epoch": 3319} {"train_loss": -6.72872257232666, "global_step": 139400, "epoch": 3319} {"train_loss": -6.673875331878662, "global_step": 139401, "epoch": 3319} {"train_loss": -6.774286270141602, "global_step": 139402, "epoch": 3319} {"train_loss": -6.809919357299805, "global_step": 139403, "epoch": 3319} {"train_loss": -6.798978805541992, "global_step": 139404, "epoch": 3319} {"train_loss": -6.809378623962402, "global_step": 139405, "epoch": 3319} {"train_loss": -6.798874855041504, "global_step": 139406, "epoch": 3319} {"train_loss": -6.7045698165893555, "global_step": 139407, "epoch": 3319} {"train_loss": -6.796658992767334, "global_step": 139408, "epoch": 3319} {"train_loss": -6.912468910217285, "global_step": 139409, "epoch": 3319} {"train_loss": -6.8618388175964355, "global_step": 139410, "epoch": 3319} {"train_loss": -6.825560092926025, "global_step": 139411, "epoch": 3319} {"train_loss": -6.655980110168457, "global_step": 139412, "epoch": 3319} {"train_loss": -6.647838592529297, "global_step": 139413, "epoch": 3319} {"train_loss": -6.816871643066406, "global_step": 139414, "epoch": 3319} {"train_loss": -6.759400367736816, "global_step": 139415, "epoch": 3319} {"train_loss": -6.618247032165527, "global_step": 139416, "epoch": 3319} {"train_loss": -6.7940802574157715, "global_step": 139417, "epoch": 3319} {"train_loss": -6.728039741516113, "global_step": 139418, "epoch": 3319} {"train_loss": -6.689448356628418, "global_step": 139419, "epoch": 3319} {"train_loss": -6.640472412109375, "global_step": 139420, "epoch": 3319} {"train_loss": -6.7193756103515625, "global_step": 139421, "epoch": 3319} {"train_loss": -6.736039638519287, "global_step": 139422, "epoch": 3319} {"train_loss": -6.693552017211914, "global_step": 139423, "epoch": 3319} {"train_loss": -6.741353988647461, "global_step": 139424, "epoch": 3319} {"train_loss": -6.665797233581543, "global_step": 139425, "epoch": 3319} {"train_loss": -6.839043617248535, "global_step": 139426, "epoch": 3319} {"train_loss": -6.729301452636719, "global_step": 139427, "epoch": 3319} {"train_loss": -6.798347473144531, "global_step": 139428, "epoch": 3319} {"train_loss": -6.769497871398926, "global_step": 139429, "epoch": 3319} {"train_loss": -6.809591770172119, "global_step": 139430, "epoch": 3319} {"train_loss": -6.8389177322387695, "global_step": 139431, "epoch": 3319} {"train_loss": -6.8191447257995605, "global_step": 139432, "epoch": 3319} {"train_loss": -6.668157577514648, "global_step": 139433, "epoch": 3319} {"train_loss": -6.857969760894775, "global_step": 139434, "epoch": 3319} {"train_loss": -6.822019100189209, "global_step": 139435, "epoch": 3319} {"train_loss": -6.812918663024902, "global_step": 139436, "epoch": 3319} {"train_loss": -6.850502014160156, "global_step": 139437, "epoch": 3319} {"train_loss": -6.722540855407715, "global_step": 139438, "epoch": 3319} {"train_loss": -6.7605274858928865, "global_step": 139439, "epoch": 3319, "val_loss": 78204.703125} {"train_loss": -6.798467636108398, "global_step": 139440, "epoch": 3320} {"train_loss": -6.817488193511963, "global_step": 139441, "epoch": 3320} {"train_loss": -6.803879737854004, "global_step": 139442, "epoch": 3320} {"train_loss": -6.8824005126953125, "global_step": 139443, "epoch": 3320} {"train_loss": -6.8224005699157715, "global_step": 139444, "epoch": 3320} {"train_loss": -6.736232757568359, "global_step": 139445, "epoch": 3320} {"train_loss": -6.804725646972656, "global_step": 139446, "epoch": 3320} {"train_loss": -6.808508396148682, "global_step": 139447, "epoch": 3320} {"train_loss": -6.889277458190918, "global_step": 139448, "epoch": 3320} {"train_loss": -6.832226276397705, "global_step": 139449, "epoch": 3320} {"train_loss": -6.730236530303955, "global_step": 139450, "epoch": 3320} {"train_loss": -6.7881622314453125, "global_step": 139451, "epoch": 3320} {"train_loss": -6.798849105834961, "global_step": 139452, "epoch": 3320} {"train_loss": -6.7530059814453125, "global_step": 139453, "epoch": 3320} {"train_loss": -6.822731018066406, "global_step": 139454, "epoch": 3320} {"train_loss": -6.8216753005981445, "global_step": 139455, "epoch": 3320} {"train_loss": -6.74381160736084, "global_step": 139456, "epoch": 3320} {"train_loss": -6.7883405685424805, "global_step": 139457, "epoch": 3320} {"train_loss": -6.815011978149414, "global_step": 139458, "epoch": 3320} {"train_loss": -6.702997207641602, "global_step": 139459, "epoch": 3320} {"train_loss": -6.788044452667236, "global_step": 139460, "epoch": 3320} {"train_loss": -6.768449783325195, "global_step": 139461, "epoch": 3320} {"train_loss": -6.85910177230835, "global_step": 139462, "epoch": 3320} {"train_loss": -6.801063537597656, "global_step": 139463, "epoch": 3320} {"train_loss": -6.783881187438965, "global_step": 139464, "epoch": 3320} {"train_loss": -6.8190412521362305, "global_step": 139465, "epoch": 3320} {"train_loss": -6.7025861740112305, "global_step": 139466, "epoch": 3320} {"train_loss": -6.866210460662842, "global_step": 139467, "epoch": 3320} {"train_loss": -6.808436393737793, "global_step": 139468, "epoch": 3320} {"train_loss": -6.834412097930908, "global_step": 139469, "epoch": 3320} {"train_loss": -6.683913230895996, "global_step": 139470, "epoch": 3320} {"train_loss": -6.90630578994751, "global_step": 139471, "epoch": 3320} {"train_loss": -6.751116752624512, "global_step": 139472, "epoch": 3320} {"train_loss": -6.845821380615234, "global_step": 139473, "epoch": 3320} {"train_loss": -6.947919845581055, "global_step": 139474, "epoch": 3320} {"train_loss": -6.774930953979492, "global_step": 139475, "epoch": 3320} {"train_loss": -6.741796493530273, "global_step": 139476, "epoch": 3320} {"train_loss": -6.945395469665527, "global_step": 139477, "epoch": 3320} {"train_loss": -6.841371536254883, "global_step": 139478, "epoch": 3320} {"train_loss": -6.782679557800293, "global_step": 139479, "epoch": 3320} {"train_loss": -6.771657943725586, "global_step": 139480, "epoch": 3320} {"train_loss": -6.804098640169416, "global_step": 139481, "epoch": 3320, "val_loss": 78143.8125} {"train_loss": -6.882530212402344, "global_step": 139482, "epoch": 3321} {"train_loss": -6.682701110839844, "global_step": 139483, "epoch": 3321} {"train_loss": -6.653647422790527, "global_step": 139484, "epoch": 3321} {"train_loss": -6.779798984527588, "global_step": 139485, "epoch": 3321} {"train_loss": -6.758777141571045, "global_step": 139486, "epoch": 3321} {"train_loss": -6.502206325531006, "global_step": 139487, "epoch": 3321} {"train_loss": -6.820825099945068, "global_step": 139488, "epoch": 3321} {"train_loss": -6.768154144287109, "global_step": 139489, "epoch": 3321} {"train_loss": -6.673913955688477, "global_step": 139490, "epoch": 3321} {"train_loss": -6.733267784118652, "global_step": 139491, "epoch": 3321} {"train_loss": -6.783316135406494, "global_step": 139492, "epoch": 3321} {"train_loss": -6.91004753112793, "global_step": 139493, "epoch": 3321} {"train_loss": -6.787980079650879, "global_step": 139494, "epoch": 3321} {"train_loss": -6.6383161544799805, "global_step": 139495, "epoch": 3321} {"train_loss": -6.737494945526123, "global_step": 139496, "epoch": 3321} {"train_loss": -6.577858924865723, "global_step": 139497, "epoch": 3321} {"train_loss": -6.743335723876953, "global_step": 139498, "epoch": 3321} {"train_loss": -6.739514350891113, "global_step": 139499, "epoch": 3321} {"train_loss": -6.766725063323975, "global_step": 139500, "epoch": 3321} {"train_loss": -6.777157783508301, "global_step": 139501, "epoch": 3321} {"train_loss": -6.609214782714844, "global_step": 139502, "epoch": 3321} {"train_loss": -6.686609268188477, "global_step": 139503, "epoch": 3321} {"train_loss": -6.621131420135498, "global_step": 139504, "epoch": 3321} {"train_loss": -6.7814555168151855, "global_step": 139505, "epoch": 3321} {"train_loss": -6.8715691566467285, "global_step": 139506, "epoch": 3321} {"train_loss": -6.7488555908203125, "global_step": 139507, "epoch": 3321} {"train_loss": -6.718851566314697, "global_step": 139508, "epoch": 3321} {"train_loss": -6.726169586181641, "global_step": 139509, "epoch": 3321} {"train_loss": -6.730926513671875, "global_step": 139510, "epoch": 3321} {"train_loss": -6.781423568725586, "global_step": 139511, "epoch": 3321} {"train_loss": -6.883772373199463, "global_step": 139512, "epoch": 3321} {"train_loss": -6.64138126373291, "global_step": 139513, "epoch": 3321} {"train_loss": -6.684579849243164, "global_step": 139514, "epoch": 3321} {"train_loss": -6.672457695007324, "global_step": 139515, "epoch": 3321} {"train_loss": -6.707561016082764, "global_step": 139516, "epoch": 3321} {"train_loss": -6.516671180725098, "global_step": 139517, "epoch": 3321} {"train_loss": -6.72441291809082, "global_step": 139518, "epoch": 3321} {"train_loss": -6.814577102661133, "global_step": 139519, "epoch": 3321} {"train_loss": -6.601404190063477, "global_step": 139520, "epoch": 3321} {"train_loss": -6.7077460289001465, "global_step": 139521, "epoch": 3321} {"train_loss": -6.690684795379639, "global_step": 139522, "epoch": 3321} {"train_loss": -6.719845487957909, "global_step": 139523, "epoch": 3321, "val_loss": 77862.28125} {"train_loss": -6.7972259521484375, "global_step": 139524, "epoch": 3322} {"train_loss": -6.670840263366699, "global_step": 139525, "epoch": 3322} {"train_loss": -6.720808506011963, "global_step": 139526, "epoch": 3322} {"train_loss": -6.685586452484131, "global_step": 139527, "epoch": 3322} {"train_loss": -6.725124359130859, "global_step": 139528, "epoch": 3322} {"train_loss": -6.7512526512146, "global_step": 139529, "epoch": 3322} {"train_loss": -6.77312707901001, "global_step": 139530, "epoch": 3322} {"train_loss": -6.634458541870117, "global_step": 139531, "epoch": 3322} {"train_loss": -6.750527381896973, "global_step": 139532, "epoch": 3322} {"train_loss": -6.840794563293457, "global_step": 139533, "epoch": 3322} {"train_loss": -6.758704662322998, "global_step": 139534, "epoch": 3322} {"train_loss": -6.776369094848633, "global_step": 139535, "epoch": 3322} {"train_loss": -6.741393089294434, "global_step": 139536, "epoch": 3322} {"train_loss": -6.747066020965576, "global_step": 139537, "epoch": 3322} {"train_loss": -6.806396484375, "global_step": 139538, "epoch": 3322} {"train_loss": -6.724619388580322, "global_step": 139539, "epoch": 3322} {"train_loss": -6.734523296356201, "global_step": 139540, "epoch": 3322} {"train_loss": -6.773763656616211, "global_step": 139541, "epoch": 3322} {"train_loss": -6.54685115814209, "global_step": 139542, "epoch": 3322} {"train_loss": -6.62916898727417, "global_step": 139543, "epoch": 3322} {"train_loss": -6.616359233856201, "global_step": 139544, "epoch": 3322} {"train_loss": -6.625701904296875, "global_step": 139545, "epoch": 3322} {"train_loss": -6.597045421600342, "global_step": 139546, "epoch": 3322} {"train_loss": -6.702230453491211, "global_step": 139547, "epoch": 3322} {"train_loss": -6.731393814086914, "global_step": 139548, "epoch": 3322} {"train_loss": -6.67651891708374, "global_step": 139549, "epoch": 3322} {"train_loss": -6.79184103012085, "global_step": 139550, "epoch": 3322} {"train_loss": -6.666379928588867, "global_step": 139551, "epoch": 3322} {"train_loss": -6.786904811859131, "global_step": 139552, "epoch": 3322} {"train_loss": -6.758453369140625, "global_step": 139553, "epoch": 3322} {"train_loss": -6.581191062927246, "global_step": 139554, "epoch": 3322} {"train_loss": -6.750393390655518, "global_step": 139555, "epoch": 3322} {"train_loss": -6.728669166564941, "global_step": 139556, "epoch": 3322} {"train_loss": -6.766849994659424, "global_step": 139557, "epoch": 3322} {"train_loss": -6.64318323135376, "global_step": 139558, "epoch": 3322} {"train_loss": -6.755542278289795, "global_step": 139559, "epoch": 3322} {"train_loss": -6.7066192626953125, "global_step": 139560, "epoch": 3322} {"train_loss": -6.699872016906738, "global_step": 139561, "epoch": 3322} {"train_loss": -6.690492630004883, "global_step": 139562, "epoch": 3322} {"train_loss": -6.683201313018799, "global_step": 139563, "epoch": 3322} {"train_loss": -6.650267124176025, "global_step": 139564, "epoch": 3322} {"train_loss": -6.713228259767805, "global_step": 139565, "epoch": 3322, "val_loss": 77808.1484375} {"train_loss": -6.786228179931641, "global_step": 139566, "epoch": 3323} {"train_loss": -6.597020149230957, "global_step": 139567, "epoch": 3323} {"train_loss": -6.773759841918945, "global_step": 139568, "epoch": 3323} {"train_loss": -6.767200469970703, "global_step": 139569, "epoch": 3323} {"train_loss": -6.694188117980957, "global_step": 139570, "epoch": 3323} {"train_loss": -6.802836894989014, "global_step": 139571, "epoch": 3323} {"train_loss": -6.849254608154297, "global_step": 139572, "epoch": 3323} {"train_loss": -6.850507736206055, "global_step": 139573, "epoch": 3323} {"train_loss": -6.82028341293335, "global_step": 139574, "epoch": 3323} {"train_loss": -6.731624603271484, "global_step": 139575, "epoch": 3323} {"train_loss": -6.651853561401367, "global_step": 139576, "epoch": 3323} {"train_loss": -6.775506973266602, "global_step": 139577, "epoch": 3323} {"train_loss": -6.818685531616211, "global_step": 139578, "epoch": 3323} {"train_loss": -6.815999507904053, "global_step": 139579, "epoch": 3323} {"train_loss": -6.772255897521973, "global_step": 139580, "epoch": 3323} {"train_loss": -6.805459976196289, "global_step": 139581, "epoch": 3323} {"train_loss": -6.7899556159973145, "global_step": 139582, "epoch": 3323} {"train_loss": -6.72843074798584, "global_step": 139583, "epoch": 3323} {"train_loss": -6.808052062988281, "global_step": 139584, "epoch": 3323} {"train_loss": -6.75502347946167, "global_step": 139585, "epoch": 3323} {"train_loss": -6.821518898010254, "global_step": 139586, "epoch": 3323} {"train_loss": -6.796360969543457, "global_step": 139587, "epoch": 3323} {"train_loss": -6.851624488830566, "global_step": 139588, "epoch": 3323} {"train_loss": -6.834081649780273, "global_step": 139589, "epoch": 3323} {"train_loss": -6.818329811096191, "global_step": 139590, "epoch": 3323} {"train_loss": -6.708332061767578, "global_step": 139591, "epoch": 3323} {"train_loss": -6.88084077835083, "global_step": 139592, "epoch": 3323} {"train_loss": -6.702748775482178, "global_step": 139593, "epoch": 3323} {"train_loss": -6.797624588012695, "global_step": 139594, "epoch": 3323} {"train_loss": -6.8059492111206055, "global_step": 139595, "epoch": 3323} {"train_loss": -6.628772735595703, "global_step": 139596, "epoch": 3323} {"train_loss": -6.709720611572266, "global_step": 139597, "epoch": 3323} {"train_loss": -6.836917877197266, "global_step": 139598, "epoch": 3323} {"train_loss": -6.600907802581787, "global_step": 139599, "epoch": 3323} {"train_loss": -6.751703262329102, "global_step": 139600, "epoch": 3323} {"train_loss": -6.800483703613281, "global_step": 139601, "epoch": 3323} {"train_loss": -6.774064540863037, "global_step": 139602, "epoch": 3323} {"train_loss": -6.835468769073486, "global_step": 139603, "epoch": 3323} {"train_loss": -6.786261558532715, "global_step": 139604, "epoch": 3323} {"train_loss": -6.770103454589844, "global_step": 139605, "epoch": 3323} {"train_loss": -6.802083969116211, "global_step": 139606, "epoch": 3323} {"train_loss": -6.772720484506516, "global_step": 139607, "epoch": 3323, "val_loss": 78144.4921875} {"train_loss": -6.800014019012451, "global_step": 139608, "epoch": 3324} {"train_loss": -6.8447585105896, "global_step": 139609, "epoch": 3324} {"train_loss": -6.797915458679199, "global_step": 139610, "epoch": 3324} {"train_loss": -6.96389102935791, "global_step": 139611, "epoch": 3324} {"train_loss": -6.750888824462891, "global_step": 139612, "epoch": 3324} {"train_loss": -6.731695175170898, "global_step": 139613, "epoch": 3324} {"train_loss": -6.627579212188721, "global_step": 139614, "epoch": 3324} {"train_loss": -6.752744197845459, "global_step": 139615, "epoch": 3324} {"train_loss": -6.736692905426025, "global_step": 139616, "epoch": 3324} {"train_loss": -6.719033241271973, "global_step": 139617, "epoch": 3324} {"train_loss": -6.792003154754639, "global_step": 139618, "epoch": 3324} {"train_loss": -6.758861541748047, "global_step": 139619, "epoch": 3324} {"train_loss": -6.8438825607299805, "global_step": 139620, "epoch": 3324} {"train_loss": -6.728308200836182, "global_step": 139621, "epoch": 3324} {"train_loss": -6.674485683441162, "global_step": 139622, "epoch": 3324} {"train_loss": -6.827304840087891, "global_step": 139623, "epoch": 3324} {"train_loss": -6.670949935913086, "global_step": 139624, "epoch": 3324} {"train_loss": -6.735773086547852, "global_step": 139625, "epoch": 3324} {"train_loss": -6.756159782409668, "global_step": 139626, "epoch": 3324} {"train_loss": -6.763669967651367, "global_step": 139627, "epoch": 3324} {"train_loss": -6.72093391418457, "global_step": 139628, "epoch": 3324} {"train_loss": -6.854349136352539, "global_step": 139629, "epoch": 3324} {"train_loss": -6.8089165687561035, "global_step": 139630, "epoch": 3324} {"train_loss": -6.714032173156738, "global_step": 139631, "epoch": 3324} {"train_loss": -6.656339645385742, "global_step": 139632, "epoch": 3324} {"train_loss": -6.732417106628418, "global_step": 139633, "epoch": 3324} {"train_loss": -6.70671272277832, "global_step": 139634, "epoch": 3324} {"train_loss": -6.684910297393799, "global_step": 139635, "epoch": 3324} {"train_loss": -6.767621040344238, "global_step": 139636, "epoch": 3324} {"train_loss": -6.7035722732543945, "global_step": 139637, "epoch": 3324} {"train_loss": -6.885405540466309, "global_step": 139638, "epoch": 3324} {"train_loss": -6.788144111633301, "global_step": 139639, "epoch": 3324} {"train_loss": -6.845651626586914, "global_step": 139640, "epoch": 3324} {"train_loss": -6.8883185386657715, "global_step": 139641, "epoch": 3324} {"train_loss": -6.890671730041504, "global_step": 139642, "epoch": 3324} {"train_loss": -6.738541603088379, "global_step": 139643, "epoch": 3324} {"train_loss": -6.770113945007324, "global_step": 139644, "epoch": 3324} {"train_loss": -6.731985092163086, "global_step": 139645, "epoch": 3324} {"train_loss": -6.878034591674805, "global_step": 139646, "epoch": 3324} {"train_loss": -6.691495895385742, "global_step": 139647, "epoch": 3324} {"train_loss": -6.883657455444336, "global_step": 139648, "epoch": 3324} {"train_loss": -6.771597884950184, "global_step": 139649, "epoch": 3324, "val_loss": 78027.109375} {"train_loss": -6.9259138107299805, "global_step": 139650, "epoch": 3325} {"train_loss": -6.958962440490723, "global_step": 139651, "epoch": 3325} {"train_loss": -6.819073677062988, "global_step": 139652, "epoch": 3325} {"train_loss": -6.657893180847168, "global_step": 139653, "epoch": 3325} {"train_loss": -6.741021156311035, "global_step": 139654, "epoch": 3325} {"train_loss": -6.873695373535156, "global_step": 139655, "epoch": 3325} {"train_loss": -6.758155822753906, "global_step": 139656, "epoch": 3325} {"train_loss": -6.784478664398193, "global_step": 139657, "epoch": 3325} {"train_loss": -6.627823829650879, "global_step": 139658, "epoch": 3325} {"train_loss": -6.892812252044678, "global_step": 139659, "epoch": 3325} {"train_loss": -6.769600868225098, "global_step": 139660, "epoch": 3325} {"train_loss": -6.664111137390137, "global_step": 139661, "epoch": 3325} {"train_loss": -6.797898769378662, "global_step": 139662, "epoch": 3325} {"train_loss": -6.800253391265869, "global_step": 139663, "epoch": 3325} {"train_loss": -6.75651216506958, "global_step": 139664, "epoch": 3325} {"train_loss": -6.760570049285889, "global_step": 139665, "epoch": 3325} {"train_loss": -6.734460830688477, "global_step": 139666, "epoch": 3325} {"train_loss": -6.776442050933838, "global_step": 139667, "epoch": 3325} {"train_loss": -6.802742004394531, "global_step": 139668, "epoch": 3325} {"train_loss": -6.717121124267578, "global_step": 139669, "epoch": 3325} {"train_loss": -6.7257537841796875, "global_step": 139670, "epoch": 3325} {"train_loss": -6.747565269470215, "global_step": 139671, "epoch": 3325} {"train_loss": -6.653640270233154, "global_step": 139672, "epoch": 3325} {"train_loss": -6.668759346008301, "global_step": 139673, "epoch": 3325} {"train_loss": -6.659609794616699, "global_step": 139674, "epoch": 3325} {"train_loss": -6.797571659088135, "global_step": 139675, "epoch": 3325} {"train_loss": -6.674213886260986, "global_step": 139676, "epoch": 3325} {"train_loss": -6.619641304016113, "global_step": 139677, "epoch": 3325} {"train_loss": -6.6868367195129395, "global_step": 139678, "epoch": 3325} {"train_loss": -6.748628616333008, "global_step": 139679, "epoch": 3325} {"train_loss": -6.741212368011475, "global_step": 139680, "epoch": 3325} {"train_loss": -6.799871444702148, "global_step": 139681, "epoch": 3325} {"train_loss": -6.771097183227539, "global_step": 139682, "epoch": 3325} {"train_loss": -6.801955223083496, "global_step": 139683, "epoch": 3325} {"train_loss": -6.808898448944092, "global_step": 139684, "epoch": 3325} {"train_loss": -6.787130355834961, "global_step": 139685, "epoch": 3325} {"train_loss": -6.7315778732299805, "global_step": 139686, "epoch": 3325} {"train_loss": -6.81058406829834, "global_step": 139687, "epoch": 3325} {"train_loss": -6.754538536071777, "global_step": 139688, "epoch": 3325} {"train_loss": -6.764383316040039, "global_step": 139689, "epoch": 3325} {"train_loss": -6.811283588409424, "global_step": 139690, "epoch": 3325} {"train_loss": -6.761854875655401, "global_step": 139691, "epoch": 3325, "val_loss": 78127.4921875} {"train_loss": -6.781539440155029, "global_step": 139692, "epoch": 3326} {"train_loss": -6.807097434997559, "global_step": 139693, "epoch": 3326} {"train_loss": -6.77225399017334, "global_step": 139694, "epoch": 3326} {"train_loss": -6.765680313110352, "global_step": 139695, "epoch": 3326} {"train_loss": -6.81707763671875, "global_step": 139696, "epoch": 3326} {"train_loss": -6.827566146850586, "global_step": 139697, "epoch": 3326} {"train_loss": -6.697073936462402, "global_step": 139698, "epoch": 3326} {"train_loss": -6.824410915374756, "global_step": 139699, "epoch": 3326} {"train_loss": -6.7029008865356445, "global_step": 139700, "epoch": 3326} {"train_loss": -6.880899906158447, "global_step": 139701, "epoch": 3326} {"train_loss": -6.911654472351074, "global_step": 139702, "epoch": 3326} {"train_loss": -6.744279861450195, "global_step": 139703, "epoch": 3326} {"train_loss": -6.789545059204102, "global_step": 139704, "epoch": 3326} {"train_loss": -6.807000160217285, "global_step": 139705, "epoch": 3326} {"train_loss": -6.811750411987305, "global_step": 139706, "epoch": 3326} {"train_loss": -6.736077308654785, "global_step": 139707, "epoch": 3326} {"train_loss": -6.758562088012695, "global_step": 139708, "epoch": 3326} {"train_loss": -6.729530334472656, "global_step": 139709, "epoch": 3326} {"train_loss": -6.823849678039551, "global_step": 139710, "epoch": 3326} {"train_loss": -6.689304828643799, "global_step": 139711, "epoch": 3326} {"train_loss": -6.687461853027344, "global_step": 139712, "epoch": 3326} {"train_loss": -6.767277240753174, "global_step": 139713, "epoch": 3326} {"train_loss": -6.707008361816406, "global_step": 139714, "epoch": 3326} {"train_loss": -6.754427909851074, "global_step": 139715, "epoch": 3326} {"train_loss": -6.855454921722412, "global_step": 139716, "epoch": 3326} {"train_loss": -6.7817912101745605, "global_step": 139717, "epoch": 3326} {"train_loss": -6.781988143920898, "global_step": 139718, "epoch": 3326} {"train_loss": -6.689218997955322, "global_step": 139719, "epoch": 3326} {"train_loss": -6.714279651641846, "global_step": 139720, "epoch": 3326} {"train_loss": -6.704963684082031, "global_step": 139721, "epoch": 3326} {"train_loss": -6.617522239685059, "global_step": 139722, "epoch": 3326} {"train_loss": -6.647624492645264, "global_step": 139723, "epoch": 3326} {"train_loss": -6.707400321960449, "global_step": 139724, "epoch": 3326} {"train_loss": -6.70566463470459, "global_step": 139725, "epoch": 3326} {"train_loss": -6.530323028564453, "global_step": 139726, "epoch": 3326} {"train_loss": -6.733644008636475, "global_step": 139727, "epoch": 3326} {"train_loss": -6.681849479675293, "global_step": 139728, "epoch": 3326} {"train_loss": -6.6792755126953125, "global_step": 139729, "epoch": 3326} {"train_loss": -6.752486228942871, "global_step": 139730, "epoch": 3326} {"train_loss": -6.585064888000488, "global_step": 139731, "epoch": 3326} {"train_loss": -6.708704471588135, "global_step": 139732, "epoch": 3326} {"train_loss": -6.739815553029378, "global_step": 139733, "epoch": 3326, "val_loss": 78327.875} {"train_loss": -6.619718551635742, "global_step": 139734, "epoch": 3327} {"train_loss": -6.642061233520508, "global_step": 139735, "epoch": 3327} {"train_loss": -6.693950653076172, "global_step": 139736, "epoch": 3327} {"train_loss": -6.523215293884277, "global_step": 139737, "epoch": 3327} {"train_loss": -6.666757106781006, "global_step": 139738, "epoch": 3327} {"train_loss": -6.673430442810059, "global_step": 139739, "epoch": 3327} {"train_loss": -6.527856826782227, "global_step": 139740, "epoch": 3327} {"train_loss": -6.656496047973633, "global_step": 139741, "epoch": 3327} {"train_loss": -6.707569599151611, "global_step": 139742, "epoch": 3327} {"train_loss": -6.635592460632324, "global_step": 139743, "epoch": 3327} {"train_loss": -6.627618312835693, "global_step": 139744, "epoch": 3327} {"train_loss": -6.785649299621582, "global_step": 139745, "epoch": 3327} {"train_loss": -6.702935218811035, "global_step": 139746, "epoch": 3327} {"train_loss": -6.616623401641846, "global_step": 139747, "epoch": 3327} {"train_loss": -6.756802558898926, "global_step": 139748, "epoch": 3327} {"train_loss": -6.722180366516113, "global_step": 139749, "epoch": 3327} {"train_loss": -6.670768737792969, "global_step": 139750, "epoch": 3327} {"train_loss": -6.735569477081299, "global_step": 139751, "epoch": 3327} {"train_loss": -6.652173042297363, "global_step": 139752, "epoch": 3327} {"train_loss": -6.762202739715576, "global_step": 139753, "epoch": 3327} {"train_loss": -6.7377777099609375, "global_step": 139754, "epoch": 3327} {"train_loss": -6.646875381469727, "global_step": 139755, "epoch": 3327} {"train_loss": -6.774436950683594, "global_step": 139756, "epoch": 3327} {"train_loss": -6.72270393371582, "global_step": 139757, "epoch": 3327} {"train_loss": -6.610416412353516, "global_step": 139758, "epoch": 3327} {"train_loss": -6.637308597564697, "global_step": 139759, "epoch": 3327} {"train_loss": -6.6866960525512695, "global_step": 139760, "epoch": 3327} {"train_loss": -6.748289585113525, "global_step": 139761, "epoch": 3327} {"train_loss": -6.690623760223389, "global_step": 139762, "epoch": 3327} {"train_loss": -6.68821382522583, "global_step": 139763, "epoch": 3327} {"train_loss": -6.742008686065674, "global_step": 139764, "epoch": 3327} {"train_loss": -6.7922468185424805, "global_step": 139765, "epoch": 3327} {"train_loss": -6.573336601257324, "global_step": 139766, "epoch": 3327} {"train_loss": -6.663888931274414, "global_step": 139767, "epoch": 3327} {"train_loss": -6.688780784606934, "global_step": 139768, "epoch": 3327} {"train_loss": -6.737400054931641, "global_step": 139769, "epoch": 3327} {"train_loss": -6.654494762420654, "global_step": 139770, "epoch": 3327} {"train_loss": -6.723087310791016, "global_step": 139771, "epoch": 3327} {"train_loss": -6.6744279861450195, "global_step": 139772, "epoch": 3327} {"train_loss": -6.739442348480225, "global_step": 139773, "epoch": 3327} {"train_loss": -6.7433271408081055, "global_step": 139774, "epoch": 3327} {"train_loss": -6.68629899479094, "global_step": 139775, "epoch": 3327, "val_loss": 77989.2109375} {"train_loss": -6.841331481933594, "global_step": 139776, "epoch": 3328} {"train_loss": -6.6729278564453125, "global_step": 139777, "epoch": 3328} {"train_loss": -6.679543495178223, "global_step": 139778, "epoch": 3328} {"train_loss": -6.7832746505737305, "global_step": 139779, "epoch": 3328} {"train_loss": -6.865015983581543, "global_step": 139780, "epoch": 3328} {"train_loss": -6.800403594970703, "global_step": 139781, "epoch": 3328} {"train_loss": -6.725978374481201, "global_step": 139782, "epoch": 3328} {"train_loss": -6.845094203948975, "global_step": 139783, "epoch": 3328} {"train_loss": -6.731149196624756, "global_step": 139784, "epoch": 3328} {"train_loss": -6.787187576293945, "global_step": 139785, "epoch": 3328} {"train_loss": -6.781530380249023, "global_step": 139786, "epoch": 3328} {"train_loss": -6.784036636352539, "global_step": 139787, "epoch": 3328} {"train_loss": -6.877861976623535, "global_step": 139788, "epoch": 3328} {"train_loss": -6.704867362976074, "global_step": 139789, "epoch": 3328} {"train_loss": -6.728146553039551, "global_step": 139790, "epoch": 3328} {"train_loss": -6.9003496170043945, "global_step": 139791, "epoch": 3328} {"train_loss": -6.744753837585449, "global_step": 139792, "epoch": 3328} {"train_loss": -6.821199893951416, "global_step": 139793, "epoch": 3328} {"train_loss": -6.883167266845703, "global_step": 139794, "epoch": 3328} {"train_loss": -6.8028244972229, "global_step": 139795, "epoch": 3328} {"train_loss": -6.781034469604492, "global_step": 139796, "epoch": 3328} {"train_loss": -6.791589736938477, "global_step": 139797, "epoch": 3328} {"train_loss": -6.742095470428467, "global_step": 139798, "epoch": 3328} {"train_loss": -6.888031005859375, "global_step": 139799, "epoch": 3328} {"train_loss": -6.65110445022583, "global_step": 139800, "epoch": 3328} {"train_loss": -6.797122955322266, "global_step": 139801, "epoch": 3328} {"train_loss": -6.866741180419922, "global_step": 139802, "epoch": 3328} {"train_loss": -6.729770660400391, "global_step": 139803, "epoch": 3328} {"train_loss": -6.718840599060059, "global_step": 139804, "epoch": 3328} {"train_loss": -6.705259799957275, "global_step": 139805, "epoch": 3328} {"train_loss": -6.710464954376221, "global_step": 139806, "epoch": 3328} {"train_loss": -6.725769996643066, "global_step": 139807, "epoch": 3328} {"train_loss": -6.673809051513672, "global_step": 139808, "epoch": 3328} {"train_loss": -6.744958877563477, "global_step": 139809, "epoch": 3328} {"train_loss": -6.729825019836426, "global_step": 139810, "epoch": 3328} {"train_loss": -6.714505195617676, "global_step": 139811, "epoch": 3328} {"train_loss": -6.903992652893066, "global_step": 139812, "epoch": 3328} {"train_loss": -6.764389991760254, "global_step": 139813, "epoch": 3328} {"train_loss": -6.74483585357666, "global_step": 139814, "epoch": 3328} {"train_loss": -6.764317989349365, "global_step": 139815, "epoch": 3328} {"train_loss": -6.769015312194824, "global_step": 139816, "epoch": 3328} {"train_loss": -6.7739694232032415, "global_step": 139817, "epoch": 3328, "val_loss": 77865.125} {"train_loss": -6.794269561767578, "global_step": 139818, "epoch": 3329} {"train_loss": -6.793017864227295, "global_step": 139819, "epoch": 3329} {"train_loss": -6.768049240112305, "global_step": 139820, "epoch": 3329} {"train_loss": -6.840525150299072, "global_step": 139821, "epoch": 3329} {"train_loss": -6.694717884063721, "global_step": 139822, "epoch": 3329} {"train_loss": -6.786770820617676, "global_step": 139823, "epoch": 3329} {"train_loss": -6.890295028686523, "global_step": 139824, "epoch": 3329} {"train_loss": -6.867259502410889, "global_step": 139825, "epoch": 3329} {"train_loss": -6.862520217895508, "global_step": 139826, "epoch": 3329} {"train_loss": -6.839014053344727, "global_step": 139827, "epoch": 3329} {"train_loss": -6.744621753692627, "global_step": 139828, "epoch": 3329} {"train_loss": -6.820128440856934, "global_step": 139829, "epoch": 3329} {"train_loss": -6.912407875061035, "global_step": 139830, "epoch": 3329} {"train_loss": -6.837026596069336, "global_step": 139831, "epoch": 3329} {"train_loss": -6.783242702484131, "global_step": 139832, "epoch": 3329} {"train_loss": -6.817348003387451, "global_step": 139833, "epoch": 3329} {"train_loss": -6.746127128601074, "global_step": 139834, "epoch": 3329} {"train_loss": -6.84071159362793, "global_step": 139835, "epoch": 3329} {"train_loss": -6.805868148803711, "global_step": 139836, "epoch": 3329} {"train_loss": -6.797750473022461, "global_step": 139837, "epoch": 3329} {"train_loss": -6.788043975830078, "global_step": 139838, "epoch": 3329} {"train_loss": -6.787324905395508, "global_step": 139839, "epoch": 3329} {"train_loss": -6.866591453552246, "global_step": 139840, "epoch": 3329} {"train_loss": -6.88964319229126, "global_step": 139841, "epoch": 3329} {"train_loss": -6.909610748291016, "global_step": 139842, "epoch": 3329} {"train_loss": -6.861496925354004, "global_step": 139843, "epoch": 3329} {"train_loss": -6.910586357116699, "global_step": 139844, "epoch": 3329} {"train_loss": -6.834929466247559, "global_step": 139845, "epoch": 3329} {"train_loss": -6.769085884094238, "global_step": 139846, "epoch": 3329} {"train_loss": -6.623010635375977, "global_step": 139847, "epoch": 3329} {"train_loss": -6.7553629875183105, "global_step": 139848, "epoch": 3329} {"train_loss": -6.8449602127075195, "global_step": 139849, "epoch": 3329} {"train_loss": -6.830422401428223, "global_step": 139850, "epoch": 3329} {"train_loss": -6.870759963989258, "global_step": 139851, "epoch": 3329} {"train_loss": -6.731082916259766, "global_step": 139852, "epoch": 3329} {"train_loss": -6.83775520324707, "global_step": 139853, "epoch": 3329} {"train_loss": -6.81452751159668, "global_step": 139854, "epoch": 3329} {"train_loss": -6.791616916656494, "global_step": 139855, "epoch": 3329} {"train_loss": -6.742547035217285, "global_step": 139856, "epoch": 3329} {"train_loss": -6.735947608947754, "global_step": 139857, "epoch": 3329} {"train_loss": -6.763847351074219, "global_step": 139858, "epoch": 3329} {"train_loss": -6.808784984406971, "global_step": 139859, "epoch": 3329, "val_loss": 77985.5390625} {"train_loss": -6.75445032119751, "global_step": 139860, "epoch": 3330} {"train_loss": -6.816493511199951, "global_step": 139861, "epoch": 3330} {"train_loss": -6.669851303100586, "global_step": 139862, "epoch": 3330} {"train_loss": -6.820291519165039, "global_step": 139863, "epoch": 3330} {"train_loss": -6.800850868225098, "global_step": 139864, "epoch": 3330} {"train_loss": -6.832200050354004, "global_step": 139865, "epoch": 3330} {"train_loss": -6.7542009353637695, "global_step": 139866, "epoch": 3330} {"train_loss": -6.948003768920898, "global_step": 139867, "epoch": 3330} {"train_loss": -6.700168609619141, "global_step": 139868, "epoch": 3330} {"train_loss": -6.731067657470703, "global_step": 139869, "epoch": 3330} {"train_loss": -6.872403144836426, "global_step": 139870, "epoch": 3330} {"train_loss": -6.766666889190674, "global_step": 139871, "epoch": 3330} {"train_loss": -6.7109375, "global_step": 139872, "epoch": 3330} {"train_loss": -6.715081691741943, "global_step": 139873, "epoch": 3330} {"train_loss": -6.80900239944458, "global_step": 139874, "epoch": 3330} {"train_loss": -6.79685115814209, "global_step": 139875, "epoch": 3330} {"train_loss": -6.8140549659729, "global_step": 139876, "epoch": 3330} {"train_loss": -6.828814506530762, "global_step": 139877, "epoch": 3330} {"train_loss": -6.714911460876465, "global_step": 139878, "epoch": 3330} {"train_loss": -6.698892593383789, "global_step": 139879, "epoch": 3330} {"train_loss": -6.852320671081543, "global_step": 139880, "epoch": 3330} {"train_loss": -6.771225929260254, "global_step": 139881, "epoch": 3330} {"train_loss": -6.842408180236816, "global_step": 139882, "epoch": 3330} {"train_loss": -6.902085304260254, "global_step": 139883, "epoch": 3330} {"train_loss": -6.790460109710693, "global_step": 139884, "epoch": 3330} {"train_loss": -6.822718620300293, "global_step": 139885, "epoch": 3330} {"train_loss": -6.769300937652588, "global_step": 139886, "epoch": 3330} {"train_loss": -6.802964210510254, "global_step": 139887, "epoch": 3330} {"train_loss": -6.841863632202148, "global_step": 139888, "epoch": 3330} {"train_loss": -6.760411262512207, "global_step": 139889, "epoch": 3330} {"train_loss": -6.813087463378906, "global_step": 139890, "epoch": 3330} {"train_loss": -6.807311058044434, "global_step": 139891, "epoch": 3330} {"train_loss": -6.7805891036987305, "global_step": 139892, "epoch": 3330} {"train_loss": -6.868309497833252, "global_step": 139893, "epoch": 3330} {"train_loss": -6.73680305480957, "global_step": 139894, "epoch": 3330} {"train_loss": -6.69258975982666, "global_step": 139895, "epoch": 3330} {"train_loss": -6.634115695953369, "global_step": 139896, "epoch": 3330} {"train_loss": -6.666298866271973, "global_step": 139897, "epoch": 3330} {"train_loss": -6.758984565734863, "global_step": 139898, "epoch": 3330} {"train_loss": -6.687753677368164, "global_step": 139899, "epoch": 3330} {"train_loss": -6.734286308288574, "global_step": 139900, "epoch": 3330} {"train_loss": -6.7788703101021905, "global_step": 139901, "epoch": 3330, "val_loss": 78332.734375} {"train_loss": -6.656321048736572, "global_step": 139902, "epoch": 3331} {"train_loss": -6.781942367553711, "global_step": 139903, "epoch": 3331} {"train_loss": -6.816821098327637, "global_step": 139904, "epoch": 3331} {"train_loss": -6.741623878479004, "global_step": 139905, "epoch": 3331} {"train_loss": -6.732388019561768, "global_step": 139906, "epoch": 3331} {"train_loss": -6.792250633239746, "global_step": 139907, "epoch": 3331} {"train_loss": -6.745706558227539, "global_step": 139908, "epoch": 3331} {"train_loss": -6.777066230773926, "global_step": 139909, "epoch": 3331} {"train_loss": -6.8812408447265625, "global_step": 139910, "epoch": 3331} {"train_loss": -6.716588020324707, "global_step": 139911, "epoch": 3331} {"train_loss": -6.668478965759277, "global_step": 139912, "epoch": 3331} {"train_loss": -6.710227012634277, "global_step": 139913, "epoch": 3331} {"train_loss": -6.636244773864746, "global_step": 139914, "epoch": 3331} {"train_loss": -6.757800102233887, "global_step": 139915, "epoch": 3331} {"train_loss": -6.7687458992004395, "global_step": 139916, "epoch": 3331} {"train_loss": -6.767049789428711, "global_step": 139917, "epoch": 3331} {"train_loss": -6.678866386413574, "global_step": 139918, "epoch": 3331} {"train_loss": -6.6693830490112305, "global_step": 139919, "epoch": 3331} {"train_loss": -6.765017986297607, "global_step": 139920, "epoch": 3331} {"train_loss": -6.72412109375, "global_step": 139921, "epoch": 3331} {"train_loss": -6.7663068771362305, "global_step": 139922, "epoch": 3331} {"train_loss": -6.753749847412109, "global_step": 139923, "epoch": 3331} {"train_loss": -6.7426438331604, "global_step": 139924, "epoch": 3331} {"train_loss": -6.706418037414551, "global_step": 139925, "epoch": 3331} {"train_loss": -6.664478778839111, "global_step": 139926, "epoch": 3331} {"train_loss": -6.814011573791504, "global_step": 139927, "epoch": 3331} {"train_loss": -6.476618766784668, "global_step": 139928, "epoch": 3331} {"train_loss": -6.758883953094482, "global_step": 139929, "epoch": 3331} {"train_loss": -6.569481372833252, "global_step": 139930, "epoch": 3331} {"train_loss": -6.561321258544922, "global_step": 139931, "epoch": 3331} {"train_loss": -6.634562015533447, "global_step": 139932, "epoch": 3331} {"train_loss": -6.567164421081543, "global_step": 139933, "epoch": 3331} {"train_loss": -6.762855052947998, "global_step": 139934, "epoch": 3331} {"train_loss": -6.588615417480469, "global_step": 139935, "epoch": 3331} {"train_loss": -6.596189975738525, "global_step": 139936, "epoch": 3331} {"train_loss": -6.616885185241699, "global_step": 139937, "epoch": 3331} {"train_loss": -6.609715461730957, "global_step": 139938, "epoch": 3331} {"train_loss": -6.496261119842529, "global_step": 139939, "epoch": 3331} {"train_loss": -6.708889007568359, "global_step": 139940, "epoch": 3331} {"train_loss": -6.625572681427002, "global_step": 139941, "epoch": 3331} {"train_loss": -6.631766319274902, "global_step": 139942, "epoch": 3331} {"train_loss": -6.69657133874439, "global_step": 139943, "epoch": 3331, "val_loss": 78298.328125} {"train_loss": -6.7829084396362305, "global_step": 139944, "epoch": 3332} {"train_loss": -6.668735027313232, "global_step": 139945, "epoch": 3332} {"train_loss": -6.744654178619385, "global_step": 139946, "epoch": 3332} {"train_loss": -6.785891532897949, "global_step": 139947, "epoch": 3332} {"train_loss": -6.653409481048584, "global_step": 139948, "epoch": 3332} {"train_loss": -6.861971378326416, "global_step": 139949, "epoch": 3332} {"train_loss": -6.718901634216309, "global_step": 139950, "epoch": 3332} {"train_loss": -6.777695655822754, "global_step": 139951, "epoch": 3332} {"train_loss": -6.765634536743164, "global_step": 139952, "epoch": 3332} {"train_loss": -6.688235282897949, "global_step": 139953, "epoch": 3332} {"train_loss": -6.79302978515625, "global_step": 139954, "epoch": 3332} {"train_loss": -6.813778877258301, "global_step": 139955, "epoch": 3332} {"train_loss": -6.793953895568848, "global_step": 139956, "epoch": 3332} {"train_loss": -6.736773490905762, "global_step": 139957, "epoch": 3332} {"train_loss": -6.869401931762695, "global_step": 139958, "epoch": 3332} {"train_loss": -6.734216213226318, "global_step": 139959, "epoch": 3332} {"train_loss": -6.8993096351623535, "global_step": 139960, "epoch": 3332} {"train_loss": -6.817104339599609, "global_step": 139961, "epoch": 3332} {"train_loss": -6.800076484680176, "global_step": 139962, "epoch": 3332} {"train_loss": -6.79716682434082, "global_step": 139963, "epoch": 3332} {"train_loss": -6.864965438842773, "global_step": 139964, "epoch": 3332} {"train_loss": -6.763823509216309, "global_step": 139965, "epoch": 3332} {"train_loss": -6.859940052032471, "global_step": 139966, "epoch": 3332} {"train_loss": -6.864500045776367, "global_step": 139967, "epoch": 3332} {"train_loss": -6.829712867736816, "global_step": 139968, "epoch": 3332} {"train_loss": -6.688143730163574, "global_step": 139969, "epoch": 3332} {"train_loss": -6.851632118225098, "global_step": 139970, "epoch": 3332} {"train_loss": -6.75456428527832, "global_step": 139971, "epoch": 3332} {"train_loss": -6.854310035705566, "global_step": 139972, "epoch": 3332} {"train_loss": -6.785588264465332, "global_step": 139973, "epoch": 3332} {"train_loss": -6.724155902862549, "global_step": 139974, "epoch": 3332} {"train_loss": -6.729672431945801, "global_step": 139975, "epoch": 3332} {"train_loss": -6.86721658706665, "global_step": 139976, "epoch": 3332} {"train_loss": -6.730815887451172, "global_step": 139977, "epoch": 3332} {"train_loss": -6.723234176635742, "global_step": 139978, "epoch": 3332} {"train_loss": -6.785618305206299, "global_step": 139979, "epoch": 3332} {"train_loss": -6.864783763885498, "global_step": 139980, "epoch": 3332} {"train_loss": -6.695631980895996, "global_step": 139981, "epoch": 3332} {"train_loss": -6.757425308227539, "global_step": 139982, "epoch": 3332} {"train_loss": -6.826152324676514, "global_step": 139983, "epoch": 3332} {"train_loss": -6.617640495300293, "global_step": 139984, "epoch": 3332} {"train_loss": -6.779146114985148, "global_step": 139985, "epoch": 3332, "val_loss": 78002.078125} {"train_loss": -6.815770626068115, "global_step": 139986, "epoch": 3333} {"train_loss": -6.662031173706055, "global_step": 139987, "epoch": 3333} {"train_loss": -6.716977596282959, "global_step": 139988, "epoch": 3333} {"train_loss": -6.834266662597656, "global_step": 139989, "epoch": 3333} {"train_loss": -6.645265579223633, "global_step": 139990, "epoch": 3333} {"train_loss": -6.823562145233154, "global_step": 139991, "epoch": 3333} {"train_loss": -6.739087104797363, "global_step": 139992, "epoch": 3333} {"train_loss": -6.746118545532227, "global_step": 139993, "epoch": 3333} {"train_loss": -6.886675834655762, "global_step": 139994, "epoch": 3333} {"train_loss": -6.770488262176514, "global_step": 139995, "epoch": 3333} {"train_loss": -6.666592597961426, "global_step": 139996, "epoch": 3333} {"train_loss": -6.805956840515137, "global_step": 139997, "epoch": 3333} {"train_loss": -6.74088191986084, "global_step": 139998, "epoch": 3333} {"train_loss": -6.810699462890625, "global_step": 139999, "epoch": 3333} {"train_loss": -6.846600532531738, "global_step": 140000, "epoch": 3333} {"train_loss": -6.549999713897705, "global_step": 140001, "epoch": 3333} {"train_loss": -6.745267868041992, "global_step": 140002, "epoch": 3333} {"train_loss": -6.839261054992676, "global_step": 140003, "epoch": 3333} {"train_loss": -6.669510841369629, "global_step": 140004, "epoch": 3333} {"train_loss": -6.888392448425293, "global_step": 140005, "epoch": 3333} {"train_loss": -6.642063140869141, "global_step": 140006, "epoch": 3333} {"train_loss": -6.684263229370117, "global_step": 140007, "epoch": 3333} {"train_loss": -6.807705402374268, "global_step": 140008, "epoch": 3333} {"train_loss": -6.639528751373291, "global_step": 140009, "epoch": 3333} {"train_loss": -6.792749404907227, "global_step": 140010, "epoch": 3333} {"train_loss": -6.721638202667236, "global_step": 140011, "epoch": 3333} {"train_loss": -6.727214813232422, "global_step": 140012, "epoch": 3333} {"train_loss": -6.867302894592285, "global_step": 140013, "epoch": 3333} {"train_loss": -6.7010626792907715, "global_step": 140014, "epoch": 3333} {"train_loss": -6.8604936599731445, "global_step": 140015, "epoch": 3333} {"train_loss": -6.789555549621582, "global_step": 140016, "epoch": 3333} {"train_loss": -6.591855049133301, "global_step": 140017, "epoch": 3333} {"train_loss": -6.760315895080566, "global_step": 140018, "epoch": 3333} {"train_loss": -6.843748092651367, "global_step": 140019, "epoch": 3333} {"train_loss": -6.711447715759277, "global_step": 140020, "epoch": 3333} {"train_loss": -6.804187297821045, "global_step": 140021, "epoch": 3333} {"train_loss": -6.711702346801758, "global_step": 140022, "epoch": 3333} {"train_loss": -6.787445068359375, "global_step": 140023, "epoch": 3333} {"train_loss": -6.8545708656311035, "global_step": 140024, "epoch": 3333} {"train_loss": -6.694231986999512, "global_step": 140025, "epoch": 3333} {"train_loss": -6.673674583435059, "global_step": 140026, "epoch": 3333} {"train_loss": -6.755068529219854, "global_step": 140027, "epoch": 3333, "val_loss": 78130.0546875} {"train_loss": -6.698534965515137, "global_step": 140028, "epoch": 3334} {"train_loss": -6.7424116134643555, "global_step": 140029, "epoch": 3334} {"train_loss": -6.744950771331787, "global_step": 140030, "epoch": 3334} {"train_loss": -6.685082912445068, "global_step": 140031, "epoch": 3334} {"train_loss": -6.822161674499512, "global_step": 140032, "epoch": 3334} {"train_loss": -6.808131217956543, "global_step": 140033, "epoch": 3334} {"train_loss": -6.733416557312012, "global_step": 140034, "epoch": 3334} {"train_loss": -6.761961936950684, "global_step": 140035, "epoch": 3334} {"train_loss": -6.859981060028076, "global_step": 140036, "epoch": 3334} {"train_loss": -6.799623012542725, "global_step": 140037, "epoch": 3334} {"train_loss": -6.710388660430908, "global_step": 140038, "epoch": 3334} {"train_loss": -6.867047309875488, "global_step": 140039, "epoch": 3334} {"train_loss": -6.80673885345459, "global_step": 140040, "epoch": 3334} {"train_loss": -6.745851516723633, "global_step": 140041, "epoch": 3334} {"train_loss": -6.797511100769043, "global_step": 140042, "epoch": 3334} {"train_loss": -6.803222179412842, "global_step": 140043, "epoch": 3334} {"train_loss": -6.769251346588135, "global_step": 140044, "epoch": 3334} {"train_loss": -6.836667537689209, "global_step": 140045, "epoch": 3334} {"train_loss": -6.777584552764893, "global_step": 140046, "epoch": 3334} {"train_loss": -6.917933940887451, "global_step": 140047, "epoch": 3334} {"train_loss": -6.740731239318848, "global_step": 140048, "epoch": 3334} {"train_loss": -6.798147201538086, "global_step": 140049, "epoch": 3334} {"train_loss": -6.7681708335876465, "global_step": 140050, "epoch": 3334} {"train_loss": -6.759222984313965, "global_step": 140051, "epoch": 3334} {"train_loss": -6.756452560424805, "global_step": 140052, "epoch": 3334} {"train_loss": -6.918848037719727, "global_step": 140053, "epoch": 3334} {"train_loss": -6.875749588012695, "global_step": 140054, "epoch": 3334} {"train_loss": -6.74992561340332, "global_step": 140055, "epoch": 3334} {"train_loss": -6.773016929626465, "global_step": 140056, "epoch": 3334} {"train_loss": -6.805397033691406, "global_step": 140057, "epoch": 3334} {"train_loss": -6.784716606140137, "global_step": 140058, "epoch": 3334} {"train_loss": -6.809788703918457, "global_step": 140059, "epoch": 3334} {"train_loss": -6.809079647064209, "global_step": 140060, "epoch": 3334} {"train_loss": -6.721344947814941, "global_step": 140061, "epoch": 3334} {"train_loss": -6.796457290649414, "global_step": 140062, "epoch": 3334} {"train_loss": -6.630024433135986, "global_step": 140063, "epoch": 3334} {"train_loss": -6.735256671905518, "global_step": 140064, "epoch": 3334} {"train_loss": -6.744610786437988, "global_step": 140065, "epoch": 3334} {"train_loss": -6.873144149780273, "global_step": 140066, "epoch": 3334} {"train_loss": -6.702692031860352, "global_step": 140067, "epoch": 3334} {"train_loss": -6.918601036071777, "global_step": 140068, "epoch": 3334} {"train_loss": -6.784089871815273, "global_step": 140069, "epoch": 3334, "val_loss": 78099.0546875} {"train_loss": -6.772247314453125, "global_step": 140070, "epoch": 3335} {"train_loss": -6.885348320007324, "global_step": 140071, "epoch": 3335} {"train_loss": -6.819666385650635, "global_step": 140072, "epoch": 3335} {"train_loss": -6.799502849578857, "global_step": 140073, "epoch": 3335} {"train_loss": -6.7968926429748535, "global_step": 140074, "epoch": 3335} {"train_loss": -6.748571395874023, "global_step": 140075, "epoch": 3335} {"train_loss": -6.7326507568359375, "global_step": 140076, "epoch": 3335} {"train_loss": -6.738795757293701, "global_step": 140077, "epoch": 3335} {"train_loss": -6.793198108673096, "global_step": 140078, "epoch": 3335} {"train_loss": -6.835417747497559, "global_step": 140079, "epoch": 3335} {"train_loss": -6.801084995269775, "global_step": 140080, "epoch": 3335} {"train_loss": -6.730177879333496, "global_step": 140081, "epoch": 3335} {"train_loss": -6.757364273071289, "global_step": 140082, "epoch": 3335} {"train_loss": -6.699098110198975, "global_step": 140083, "epoch": 3335} {"train_loss": -6.696227550506592, "global_step": 140084, "epoch": 3335} {"train_loss": -6.74709415435791, "global_step": 140085, "epoch": 3335} {"train_loss": -6.8098859786987305, "global_step": 140086, "epoch": 3335} {"train_loss": -6.551305770874023, "global_step": 140087, "epoch": 3335} {"train_loss": -6.674313545227051, "global_step": 140088, "epoch": 3335} {"train_loss": -6.689702987670898, "global_step": 140089, "epoch": 3335} {"train_loss": -6.628722190856934, "global_step": 140090, "epoch": 3335} {"train_loss": -6.854022026062012, "global_step": 140091, "epoch": 3335} {"train_loss": -6.82228946685791, "global_step": 140092, "epoch": 3335} {"train_loss": -6.850990295410156, "global_step": 140093, "epoch": 3335} {"train_loss": -6.682406902313232, "global_step": 140094, "epoch": 3335} {"train_loss": -6.686014652252197, "global_step": 140095, "epoch": 3335} {"train_loss": -6.697881698608398, "global_step": 140096, "epoch": 3335} {"train_loss": -6.672308444976807, "global_step": 140097, "epoch": 3335} {"train_loss": -6.850817680358887, "global_step": 140098, "epoch": 3335} {"train_loss": -6.803628921508789, "global_step": 140099, "epoch": 3335} {"train_loss": -6.739499092102051, "global_step": 140100, "epoch": 3335} {"train_loss": -6.749522686004639, "global_step": 140101, "epoch": 3335} {"train_loss": -6.749373435974121, "global_step": 140102, "epoch": 3335} {"train_loss": -6.729495048522949, "global_step": 140103, "epoch": 3335} {"train_loss": -6.834197044372559, "global_step": 140104, "epoch": 3335} {"train_loss": -6.73573637008667, "global_step": 140105, "epoch": 3335} {"train_loss": -6.852621078491211, "global_step": 140106, "epoch": 3335} {"train_loss": -6.772618770599365, "global_step": 140107, "epoch": 3335} {"train_loss": -6.8002166748046875, "global_step": 140108, "epoch": 3335} {"train_loss": -6.945608139038086, "global_step": 140109, "epoch": 3335} {"train_loss": -6.689976215362549, "global_step": 140110, "epoch": 3335} {"train_loss": -6.762122404007685, "global_step": 140111, "epoch": 3335, "val_loss": 78038.59375} {"train_loss": -6.705387115478516, "global_step": 140112, "epoch": 3336} {"train_loss": -6.847339630126953, "global_step": 140113, "epoch": 3336} {"train_loss": -6.815774917602539, "global_step": 140114, "epoch": 3336} {"train_loss": -6.9110565185546875, "global_step": 140115, "epoch": 3336} {"train_loss": -6.798242092132568, "global_step": 140116, "epoch": 3336} {"train_loss": -6.872941017150879, "global_step": 140117, "epoch": 3336} {"train_loss": -6.818966865539551, "global_step": 140118, "epoch": 3336} {"train_loss": -6.769634246826172, "global_step": 140119, "epoch": 3336} {"train_loss": -6.713843822479248, "global_step": 140120, "epoch": 3336} {"train_loss": -6.792448997497559, "global_step": 140121, "epoch": 3336} {"train_loss": -6.742495536804199, "global_step": 140122, "epoch": 3336} {"train_loss": -6.731775283813477, "global_step": 140123, "epoch": 3336} {"train_loss": -6.863995552062988, "global_step": 140124, "epoch": 3336} {"train_loss": -6.706995010375977, "global_step": 140125, "epoch": 3336} {"train_loss": -6.700274467468262, "global_step": 140126, "epoch": 3336} {"train_loss": -6.775606155395508, "global_step": 140127, "epoch": 3336} {"train_loss": -6.7669219970703125, "global_step": 140128, "epoch": 3336} {"train_loss": -6.7372727394104, "global_step": 140129, "epoch": 3336} {"train_loss": -6.815764427185059, "global_step": 140130, "epoch": 3336} {"train_loss": -6.772322654724121, "global_step": 140131, "epoch": 3336} {"train_loss": -6.814384460449219, "global_step": 140132, "epoch": 3336} {"train_loss": -6.738768100738525, "global_step": 140133, "epoch": 3336} {"train_loss": -6.697597503662109, "global_step": 140134, "epoch": 3336} {"train_loss": -6.717237949371338, "global_step": 140135, "epoch": 3336} {"train_loss": -6.776126384735107, "global_step": 140136, "epoch": 3336} {"train_loss": -6.686613082885742, "global_step": 140137, "epoch": 3336} {"train_loss": -6.730541706085205, "global_step": 140138, "epoch": 3336} {"train_loss": -6.70778226852417, "global_step": 140139, "epoch": 3336} {"train_loss": -6.619987487792969, "global_step": 140140, "epoch": 3336} {"train_loss": -6.705238342285156, "global_step": 140141, "epoch": 3336} {"train_loss": -6.720776557922363, "global_step": 140142, "epoch": 3336} {"train_loss": -6.683443069458008, "global_step": 140143, "epoch": 3336} {"train_loss": -6.657201766967773, "global_step": 140144, "epoch": 3336} {"train_loss": -6.849423408508301, "global_step": 140145, "epoch": 3336} {"train_loss": -6.715628147125244, "global_step": 140146, "epoch": 3336} {"train_loss": -6.827572822570801, "global_step": 140147, "epoch": 3336} {"train_loss": -6.797435283660889, "global_step": 140148, "epoch": 3336} {"train_loss": -6.700339317321777, "global_step": 140149, "epoch": 3336} {"train_loss": -6.822110652923584, "global_step": 140150, "epoch": 3336} {"train_loss": -6.669477462768555, "global_step": 140151, "epoch": 3336} {"train_loss": -6.697911262512207, "global_step": 140152, "epoch": 3336} {"train_loss": -6.756906884057181, "global_step": 140153, "epoch": 3336, "val_loss": 78443.8984375} {"train_loss": -6.758786201477051, "global_step": 140154, "epoch": 3337} {"train_loss": -6.742980003356934, "global_step": 140155, "epoch": 3337} {"train_loss": -6.703217506408691, "global_step": 140156, "epoch": 3337} {"train_loss": -6.635586738586426, "global_step": 140157, "epoch": 3337} {"train_loss": -6.77553129196167, "global_step": 140158, "epoch": 3337} {"train_loss": -6.762722015380859, "global_step": 140159, "epoch": 3337} {"train_loss": -6.806168556213379, "global_step": 140160, "epoch": 3337} {"train_loss": -6.696495056152344, "global_step": 140161, "epoch": 3337} {"train_loss": -6.776330471038818, "global_step": 140162, "epoch": 3337} {"train_loss": -6.745233535766602, "global_step": 140163, "epoch": 3337} {"train_loss": -6.7172040939331055, "global_step": 140164, "epoch": 3337} {"train_loss": -6.738665580749512, "global_step": 140165, "epoch": 3337} {"train_loss": -6.829254627227783, "global_step": 140166, "epoch": 3337} {"train_loss": -6.796494960784912, "global_step": 140167, "epoch": 3337} {"train_loss": -6.608429908752441, "global_step": 140168, "epoch": 3337} {"train_loss": -6.60803747177124, "global_step": 140169, "epoch": 3337} {"train_loss": -6.677353858947754, "global_step": 140170, "epoch": 3337} {"train_loss": -6.685234069824219, "global_step": 140171, "epoch": 3337} {"train_loss": -6.72517204284668, "global_step": 140172, "epoch": 3337} {"train_loss": -6.716830253601074, "global_step": 140173, "epoch": 3337} {"train_loss": -6.771702766418457, "global_step": 140174, "epoch": 3337} {"train_loss": -6.658351898193359, "global_step": 140175, "epoch": 3337} {"train_loss": -6.755183696746826, "global_step": 140176, "epoch": 3337} {"train_loss": -6.720782279968262, "global_step": 140177, "epoch": 3337} {"train_loss": -6.769509792327881, "global_step": 140178, "epoch": 3337} {"train_loss": -6.7808098793029785, "global_step": 140179, "epoch": 3337} {"train_loss": -6.820809364318848, "global_step": 140180, "epoch": 3337} {"train_loss": -6.799012184143066, "global_step": 140181, "epoch": 3337} {"train_loss": -6.804688453674316, "global_step": 140182, "epoch": 3337} {"train_loss": -6.774913787841797, "global_step": 140183, "epoch": 3337} {"train_loss": -6.748072147369385, "global_step": 140184, "epoch": 3337} {"train_loss": -6.8167033195495605, "global_step": 140185, "epoch": 3337} {"train_loss": -6.849602699279785, "global_step": 140186, "epoch": 3337} {"train_loss": -6.793011665344238, "global_step": 140187, "epoch": 3337} {"train_loss": -6.717560768127441, "global_step": 140188, "epoch": 3337} {"train_loss": -6.794790267944336, "global_step": 140189, "epoch": 3337} {"train_loss": -6.70596981048584, "global_step": 140190, "epoch": 3337} {"train_loss": -6.774048805236816, "global_step": 140191, "epoch": 3337} {"train_loss": -6.921950340270996, "global_step": 140192, "epoch": 3337} {"train_loss": -6.654873847961426, "global_step": 140193, "epoch": 3337} {"train_loss": -6.845650672912598, "global_step": 140194, "epoch": 3337} {"train_loss": -6.750109808785575, "global_step": 140195, "epoch": 3337, "val_loss": 78053.53125} {"train_loss": -6.78767204284668, "global_step": 140196, "epoch": 3338} {"train_loss": -6.908611297607422, "global_step": 140197, "epoch": 3338} {"train_loss": -6.85142707824707, "global_step": 140198, "epoch": 3338} {"train_loss": -6.826376914978027, "global_step": 140199, "epoch": 3338} {"train_loss": -6.838742256164551, "global_step": 140200, "epoch": 3338} {"train_loss": -6.929900169372559, "global_step": 140201, "epoch": 3338} {"train_loss": -6.912677764892578, "global_step": 140202, "epoch": 3338} {"train_loss": -6.7555694580078125, "global_step": 140203, "epoch": 3338} {"train_loss": -6.864107131958008, "global_step": 140204, "epoch": 3338} {"train_loss": -6.662841796875, "global_step": 140205, "epoch": 3338} {"train_loss": -6.835225582122803, "global_step": 140206, "epoch": 3338} {"train_loss": -6.769930839538574, "global_step": 140207, "epoch": 3338} {"train_loss": -6.7364654541015625, "global_step": 140208, "epoch": 3338} {"train_loss": -6.907079696655273, "global_step": 140209, "epoch": 3338} {"train_loss": -6.691240310668945, "global_step": 140210, "epoch": 3338} {"train_loss": -6.819492816925049, "global_step": 140211, "epoch": 3338} {"train_loss": -6.661280632019043, "global_step": 140212, "epoch": 3338} {"train_loss": -6.869706153869629, "global_step": 140213, "epoch": 3338} {"train_loss": -6.707934379577637, "global_step": 140214, "epoch": 3338} {"train_loss": -6.724384307861328, "global_step": 140215, "epoch": 3338} {"train_loss": -6.907247543334961, "global_step": 140216, "epoch": 3338} {"train_loss": -6.820486068725586, "global_step": 140217, "epoch": 3338} {"train_loss": -6.83778190612793, "global_step": 140218, "epoch": 3338} {"train_loss": -6.792870998382568, "global_step": 140219, "epoch": 3338} {"train_loss": -6.682046890258789, "global_step": 140220, "epoch": 3338} {"train_loss": -6.709460258483887, "global_step": 140221, "epoch": 3338} {"train_loss": -6.690756797790527, "global_step": 140222, "epoch": 3338} {"train_loss": -6.596312046051025, "global_step": 140223, "epoch": 3338} {"train_loss": -6.802596092224121, "global_step": 140224, "epoch": 3338} {"train_loss": -6.6982221603393555, "global_step": 140225, "epoch": 3338} {"train_loss": -6.723457336425781, "global_step": 140226, "epoch": 3338} {"train_loss": -6.723927974700928, "global_step": 140227, "epoch": 3338} {"train_loss": -6.7192487716674805, "global_step": 140228, "epoch": 3338} {"train_loss": -6.732236862182617, "global_step": 140229, "epoch": 3338} {"train_loss": -6.790895462036133, "global_step": 140230, "epoch": 3338} {"train_loss": -6.695187568664551, "global_step": 140231, "epoch": 3338} {"train_loss": -6.639383316040039, "global_step": 140232, "epoch": 3338} {"train_loss": -6.871617317199707, "global_step": 140233, "epoch": 3338} {"train_loss": -6.842350006103516, "global_step": 140234, "epoch": 3338} {"train_loss": -6.81852912902832, "global_step": 140235, "epoch": 3338} {"train_loss": -6.827747344970703, "global_step": 140236, "epoch": 3338} {"train_loss": -6.780756030763898, "global_step": 140237, "epoch": 3338, "val_loss": 78244.4921875} {"train_loss": -6.893158912658691, "global_step": 140238, "epoch": 3339} {"train_loss": -6.832340240478516, "global_step": 140239, "epoch": 3339} {"train_loss": -6.6894941329956055, "global_step": 140240, "epoch": 3339} {"train_loss": -6.844563961029053, "global_step": 140241, "epoch": 3339} {"train_loss": -6.702472686767578, "global_step": 140242, "epoch": 3339} {"train_loss": -6.778855323791504, "global_step": 140243, "epoch": 3339} {"train_loss": -6.706404685974121, "global_step": 140244, "epoch": 3339} {"train_loss": -6.82209587097168, "global_step": 140245, "epoch": 3339} {"train_loss": -6.747640609741211, "global_step": 140246, "epoch": 3339} {"train_loss": -6.739617824554443, "global_step": 140247, "epoch": 3339} {"train_loss": -6.825197219848633, "global_step": 140248, "epoch": 3339} {"train_loss": -6.778104782104492, "global_step": 140249, "epoch": 3339} {"train_loss": -6.743987083435059, "global_step": 140250, "epoch": 3339} {"train_loss": -6.787078857421875, "global_step": 140251, "epoch": 3339} {"train_loss": -6.955216407775879, "global_step": 140252, "epoch": 3339} {"train_loss": -6.7541961669921875, "global_step": 140253, "epoch": 3339} {"train_loss": -6.7821455001831055, "global_step": 140254, "epoch": 3339} {"train_loss": -6.827587127685547, "global_step": 140255, "epoch": 3339} {"train_loss": -6.818195819854736, "global_step": 140256, "epoch": 3339} {"train_loss": -6.77138614654541, "global_step": 140257, "epoch": 3339} {"train_loss": -6.78018045425415, "global_step": 140258, "epoch": 3339} {"train_loss": -6.911704063415527, "global_step": 140259, "epoch": 3339} {"train_loss": -6.87027645111084, "global_step": 140260, "epoch": 3339} {"train_loss": -6.894650459289551, "global_step": 140261, "epoch": 3339} {"train_loss": -6.8318681716918945, "global_step": 140262, "epoch": 3339} {"train_loss": -6.768593788146973, "global_step": 140263, "epoch": 3339} {"train_loss": -6.711085796356201, "global_step": 140264, "epoch": 3339} {"train_loss": -6.777746200561523, "global_step": 140265, "epoch": 3339} {"train_loss": -6.766615390777588, "global_step": 140266, "epoch": 3339} {"train_loss": -6.693525314331055, "global_step": 140267, "epoch": 3339} {"train_loss": -6.826753616333008, "global_step": 140268, "epoch": 3339} {"train_loss": -6.816985130310059, "global_step": 140269, "epoch": 3339} {"train_loss": -6.7584991455078125, "global_step": 140270, "epoch": 3339} {"train_loss": -6.847142219543457, "global_step": 140271, "epoch": 3339} {"train_loss": -6.761979103088379, "global_step": 140272, "epoch": 3339} {"train_loss": -6.761554718017578, "global_step": 140273, "epoch": 3339} {"train_loss": -6.783137798309326, "global_step": 140274, "epoch": 3339} {"train_loss": -6.676480293273926, "global_step": 140275, "epoch": 3339} {"train_loss": -6.855498313903809, "global_step": 140276, "epoch": 3339} {"train_loss": -6.897093296051025, "global_step": 140277, "epoch": 3339} {"train_loss": -6.745828628540039, "global_step": 140278, "epoch": 3339} {"train_loss": -6.7920630886441185, "global_step": 140279, "epoch": 3339, "val_loss": 78224.359375} {"train_loss": -6.710824012756348, "global_step": 140280, "epoch": 3340} {"train_loss": -6.802619934082031, "global_step": 140281, "epoch": 3340} {"train_loss": -6.815499305725098, "global_step": 140282, "epoch": 3340} {"train_loss": -6.777198791503906, "global_step": 140283, "epoch": 3340} {"train_loss": -6.669511795043945, "global_step": 140284, "epoch": 3340} {"train_loss": -6.698925018310547, "global_step": 140285, "epoch": 3340} {"train_loss": -6.801365852355957, "global_step": 140286, "epoch": 3340} {"train_loss": -6.691483497619629, "global_step": 140287, "epoch": 3340} {"train_loss": -6.731223106384277, "global_step": 140288, "epoch": 3340} {"train_loss": -6.829754829406738, "global_step": 140289, "epoch": 3340} {"train_loss": -6.713451385498047, "global_step": 140290, "epoch": 3340} {"train_loss": -6.7605180740356445, "global_step": 140291, "epoch": 3340} {"train_loss": -6.712393283843994, "global_step": 140292, "epoch": 3340} {"train_loss": -6.710068702697754, "global_step": 140293, "epoch": 3340} {"train_loss": -6.744550704956055, "global_step": 140294, "epoch": 3340} {"train_loss": -6.774019241333008, "global_step": 140295, "epoch": 3340} {"train_loss": -6.689192771911621, "global_step": 140296, "epoch": 3340} {"train_loss": -6.764316558837891, "global_step": 140297, "epoch": 3340} {"train_loss": -6.732797622680664, "global_step": 140298, "epoch": 3340} {"train_loss": -6.614805221557617, "global_step": 140299, "epoch": 3340} {"train_loss": -6.723796367645264, "global_step": 140300, "epoch": 3340} {"train_loss": -6.838999271392822, "global_step": 140301, "epoch": 3340} {"train_loss": -6.701990127563477, "global_step": 140302, "epoch": 3340} {"train_loss": -6.687705993652344, "global_step": 140303, "epoch": 3340} {"train_loss": -6.744119167327881, "global_step": 140304, "epoch": 3340} {"train_loss": -6.60853910446167, "global_step": 140305, "epoch": 3340} {"train_loss": -6.6987457275390625, "global_step": 140306, "epoch": 3340} {"train_loss": -6.753454208374023, "global_step": 140307, "epoch": 3340} {"train_loss": -6.707852363586426, "global_step": 140308, "epoch": 3340} {"train_loss": -6.635756015777588, "global_step": 140309, "epoch": 3340} {"train_loss": -6.758166790008545, "global_step": 140310, "epoch": 3340} {"train_loss": -6.6105804443359375, "global_step": 140311, "epoch": 3340} {"train_loss": -6.746250152587891, "global_step": 140312, "epoch": 3340} {"train_loss": -6.736062049865723, "global_step": 140313, "epoch": 3340} {"train_loss": -6.544829845428467, "global_step": 140314, "epoch": 3340} {"train_loss": -6.817004203796387, "global_step": 140315, "epoch": 3340} {"train_loss": -6.6571455001831055, "global_step": 140316, "epoch": 3340} {"train_loss": -6.771176815032959, "global_step": 140317, "epoch": 3340} {"train_loss": -6.657507419586182, "global_step": 140318, "epoch": 3340} {"train_loss": -6.623068809509277, "global_step": 140319, "epoch": 3340} {"train_loss": -6.790443420410156, "global_step": 140320, "epoch": 3340} {"train_loss": -6.7170253821781705, "global_step": 140321, "epoch": 3340, "val_loss": 78362.3515625} {"train_loss": -6.575093746185303, "global_step": 140322, "epoch": 3341} {"train_loss": -6.73443603515625, "global_step": 140323, "epoch": 3341} {"train_loss": -6.567553520202637, "global_step": 140324, "epoch": 3341} {"train_loss": -6.856596946716309, "global_step": 140325, "epoch": 3341} {"train_loss": -6.604097366333008, "global_step": 140326, "epoch": 3341} {"train_loss": -6.6852827072143555, "global_step": 140327, "epoch": 3341} {"train_loss": -6.761514663696289, "global_step": 140328, "epoch": 3341} {"train_loss": -6.590288162231445, "global_step": 140329, "epoch": 3341} {"train_loss": -6.775713920593262, "global_step": 140330, "epoch": 3341} {"train_loss": -6.666385650634766, "global_step": 140331, "epoch": 3341} {"train_loss": -6.738082408905029, "global_step": 140332, "epoch": 3341} {"train_loss": -6.851543426513672, "global_step": 140333, "epoch": 3341} {"train_loss": -6.741107940673828, "global_step": 140334, "epoch": 3341} {"train_loss": -6.665954113006592, "global_step": 140335, "epoch": 3341} {"train_loss": -6.672229290008545, "global_step": 140336, "epoch": 3341} {"train_loss": -6.6984758377075195, "global_step": 140337, "epoch": 3341} {"train_loss": -6.765675067901611, "global_step": 140338, "epoch": 3341} {"train_loss": -6.80436897277832, "global_step": 140339, "epoch": 3341} {"train_loss": -6.8024749755859375, "global_step": 140340, "epoch": 3341} {"train_loss": -6.8452606201171875, "global_step": 140341, "epoch": 3341} {"train_loss": -6.8768720626831055, "global_step": 140342, "epoch": 3341} {"train_loss": -6.795653820037842, "global_step": 140343, "epoch": 3341} {"train_loss": -6.931246280670166, "global_step": 140344, "epoch": 3341} {"train_loss": -6.835013389587402, "global_step": 140345, "epoch": 3341} {"train_loss": -6.745629787445068, "global_step": 140346, "epoch": 3341} {"train_loss": -6.866393089294434, "global_step": 140347, "epoch": 3341} {"train_loss": -6.7440290451049805, "global_step": 140348, "epoch": 3341} {"train_loss": -6.788763046264648, "global_step": 140349, "epoch": 3341} {"train_loss": -6.894965171813965, "global_step": 140350, "epoch": 3341} {"train_loss": -6.800283432006836, "global_step": 140351, "epoch": 3341} {"train_loss": -6.639659881591797, "global_step": 140352, "epoch": 3341} {"train_loss": -6.836852073669434, "global_step": 140353, "epoch": 3341} {"train_loss": -6.598576545715332, "global_step": 140354, "epoch": 3341} {"train_loss": -6.695140838623047, "global_step": 140355, "epoch": 3341} {"train_loss": -6.638665676116943, "global_step": 140356, "epoch": 3341} {"train_loss": -6.735710620880127, "global_step": 140357, "epoch": 3341} {"train_loss": -6.7497639656066895, "global_step": 140358, "epoch": 3341} {"train_loss": -6.791709899902344, "global_step": 140359, "epoch": 3341} {"train_loss": -6.7097578048706055, "global_step": 140360, "epoch": 3341} {"train_loss": -6.6193132400512695, "global_step": 140361, "epoch": 3341} {"train_loss": -6.792049407958984, "global_step": 140362, "epoch": 3341} {"train_loss": -6.746677001317342, "global_step": 140363, "epoch": 3341, "val_loss": 78221.1171875} {"train_loss": -6.902480125427246, "global_step": 140364, "epoch": 3342} {"train_loss": -6.935995101928711, "global_step": 140365, "epoch": 3342} {"train_loss": -6.807748794555664, "global_step": 140366, "epoch": 3342} {"train_loss": -6.806142807006836, "global_step": 140367, "epoch": 3342} {"train_loss": -6.853854179382324, "global_step": 140368, "epoch": 3342} {"train_loss": -6.873028755187988, "global_step": 140369, "epoch": 3342} {"train_loss": -6.808956623077393, "global_step": 140370, "epoch": 3342} {"train_loss": -6.80881404876709, "global_step": 140371, "epoch": 3342} {"train_loss": -6.894111156463623, "global_step": 140372, "epoch": 3342} {"train_loss": -6.871935844421387, "global_step": 140373, "epoch": 3342} {"train_loss": -6.806438446044922, "global_step": 140374, "epoch": 3342} {"train_loss": -6.787917137145996, "global_step": 140375, "epoch": 3342} {"train_loss": -6.899083137512207, "global_step": 140376, "epoch": 3342} {"train_loss": -6.732287883758545, "global_step": 140377, "epoch": 3342} {"train_loss": -6.833053112030029, "global_step": 140378, "epoch": 3342} {"train_loss": -6.844493865966797, "global_step": 140379, "epoch": 3342} {"train_loss": -6.70222806930542, "global_step": 140380, "epoch": 3342} {"train_loss": -6.795442581176758, "global_step": 140381, "epoch": 3342} {"train_loss": -6.771257400512695, "global_step": 140382, "epoch": 3342} {"train_loss": -6.711793899536133, "global_step": 140383, "epoch": 3342} {"train_loss": -6.705758094787598, "global_step": 140384, "epoch": 3342} {"train_loss": -6.66416597366333, "global_step": 140385, "epoch": 3342} {"train_loss": -6.498795986175537, "global_step": 140386, "epoch": 3342} {"train_loss": -6.744681358337402, "global_step": 140387, "epoch": 3342} {"train_loss": -6.702406883239746, "global_step": 140388, "epoch": 3342} {"train_loss": -6.648586273193359, "global_step": 140389, "epoch": 3342} {"train_loss": -6.676182746887207, "global_step": 140390, "epoch": 3342} {"train_loss": -6.77733039855957, "global_step": 140391, "epoch": 3342} {"train_loss": -6.61682653427124, "global_step": 140392, "epoch": 3342} {"train_loss": -6.8056840896606445, "global_step": 140393, "epoch": 3342} {"train_loss": -6.795087814331055, "global_step": 140394, "epoch": 3342} {"train_loss": -6.65174674987793, "global_step": 140395, "epoch": 3342} {"train_loss": -6.84279727935791, "global_step": 140396, "epoch": 3342} {"train_loss": -6.7949724197387695, "global_step": 140397, "epoch": 3342} {"train_loss": -6.658880233764648, "global_step": 140398, "epoch": 3342} {"train_loss": -6.664711952209473, "global_step": 140399, "epoch": 3342} {"train_loss": -6.676837921142578, "global_step": 140400, "epoch": 3342} {"train_loss": -6.657207012176514, "global_step": 140401, "epoch": 3342} {"train_loss": -6.826530456542969, "global_step": 140402, "epoch": 3342} {"train_loss": -6.700206756591797, "global_step": 140403, "epoch": 3342} {"train_loss": -6.736794948577881, "global_step": 140404, "epoch": 3342} {"train_loss": -6.761771122614543, "global_step": 140405, "epoch": 3342, "val_loss": 78292.359375} {"train_loss": -6.6155595779418945, "global_step": 140406, "epoch": 3343} {"train_loss": -6.789887428283691, "global_step": 140407, "epoch": 3343} {"train_loss": -6.798689842224121, "global_step": 140408, "epoch": 3343} {"train_loss": -6.875460624694824, "global_step": 140409, "epoch": 3343} {"train_loss": -6.826298713684082, "global_step": 140410, "epoch": 3343} {"train_loss": -6.7989091873168945, "global_step": 140411, "epoch": 3343} {"train_loss": -6.783062934875488, "global_step": 140412, "epoch": 3343} {"train_loss": -6.775514602661133, "global_step": 140413, "epoch": 3343} {"train_loss": -6.851142883300781, "global_step": 140414, "epoch": 3343} {"train_loss": -6.804955005645752, "global_step": 140415, "epoch": 3343} {"train_loss": -6.768817901611328, "global_step": 140416, "epoch": 3343} {"train_loss": -6.642330646514893, "global_step": 140417, "epoch": 3343} {"train_loss": -6.747715950012207, "global_step": 140418, "epoch": 3343} {"train_loss": -6.836811065673828, "global_step": 140419, "epoch": 3343} {"train_loss": -6.7431135177612305, "global_step": 140420, "epoch": 3343} {"train_loss": -6.741698265075684, "global_step": 140421, "epoch": 3343} {"train_loss": -6.80802059173584, "global_step": 140422, "epoch": 3343} {"train_loss": -6.716408729553223, "global_step": 140423, "epoch": 3343} {"train_loss": -6.756713390350342, "global_step": 140424, "epoch": 3343} {"train_loss": -6.761991500854492, "global_step": 140425, "epoch": 3343} {"train_loss": -6.50444221496582, "global_step": 140426, "epoch": 3343} {"train_loss": -6.8999247550964355, "global_step": 140427, "epoch": 3343} {"train_loss": -6.6668853759765625, "global_step": 140428, "epoch": 3343} {"train_loss": -6.724277496337891, "global_step": 140429, "epoch": 3343} {"train_loss": -6.712708473205566, "global_step": 140430, "epoch": 3343} {"train_loss": -6.598898410797119, "global_step": 140431, "epoch": 3343} {"train_loss": -6.732004165649414, "global_step": 140432, "epoch": 3343} {"train_loss": -6.674863815307617, "global_step": 140433, "epoch": 3343} {"train_loss": -6.766839504241943, "global_step": 140434, "epoch": 3343} {"train_loss": -6.641768932342529, "global_step": 140435, "epoch": 3343} {"train_loss": -6.785867691040039, "global_step": 140436, "epoch": 3343} {"train_loss": -6.779977798461914, "global_step": 140437, "epoch": 3343} {"train_loss": -6.632542133331299, "global_step": 140438, "epoch": 3343} {"train_loss": -6.743285179138184, "global_step": 140439, "epoch": 3343} {"train_loss": -6.686237335205078, "global_step": 140440, "epoch": 3343} {"train_loss": -6.837925910949707, "global_step": 140441, "epoch": 3343} {"train_loss": -6.528311252593994, "global_step": 140442, "epoch": 3343} {"train_loss": -6.726192474365234, "global_step": 140443, "epoch": 3343} {"train_loss": -6.694777011871338, "global_step": 140444, "epoch": 3343} {"train_loss": -6.664597988128662, "global_step": 140445, "epoch": 3343} {"train_loss": -6.6646318435668945, "global_step": 140446, "epoch": 3343} {"train_loss": -6.732999551863897, "global_step": 140447, "epoch": 3343, "val_loss": 78487.015625} {"train_loss": -6.732860088348389, "global_step": 140448, "epoch": 3344} {"train_loss": -6.563930511474609, "global_step": 140449, "epoch": 3344} {"train_loss": -6.715871810913086, "global_step": 140450, "epoch": 3344} {"train_loss": -6.706973075866699, "global_step": 140451, "epoch": 3344} {"train_loss": -6.762057781219482, "global_step": 140452, "epoch": 3344} {"train_loss": -6.600936412811279, "global_step": 140453, "epoch": 3344} {"train_loss": -6.774525165557861, "global_step": 140454, "epoch": 3344} {"train_loss": -6.754485130310059, "global_step": 140455, "epoch": 3344} {"train_loss": -6.6967668533325195, "global_step": 140456, "epoch": 3344} {"train_loss": -6.664742469787598, "global_step": 140457, "epoch": 3344} {"train_loss": -6.855097770690918, "global_step": 140458, "epoch": 3344} {"train_loss": -6.820468902587891, "global_step": 140459, "epoch": 3344} {"train_loss": -6.6788811683654785, "global_step": 140460, "epoch": 3344} {"train_loss": -6.776819229125977, "global_step": 140461, "epoch": 3344} {"train_loss": -6.733821392059326, "global_step": 140462, "epoch": 3344} {"train_loss": -6.67901611328125, "global_step": 140463, "epoch": 3344} {"train_loss": -6.74513578414917, "global_step": 140464, "epoch": 3344} {"train_loss": -6.72007417678833, "global_step": 140465, "epoch": 3344} {"train_loss": -6.837051868438721, "global_step": 140466, "epoch": 3344} {"train_loss": -6.867038726806641, "global_step": 140467, "epoch": 3344} {"train_loss": -6.818670272827148, "global_step": 140468, "epoch": 3344} {"train_loss": -6.710673809051514, "global_step": 140469, "epoch": 3344} {"train_loss": -6.829154968261719, "global_step": 140470, "epoch": 3344} {"train_loss": -6.8014116287231445, "global_step": 140471, "epoch": 3344} {"train_loss": -6.6845903396606445, "global_step": 140472, "epoch": 3344} {"train_loss": -6.922875881195068, "global_step": 140473, "epoch": 3344} {"train_loss": -6.787482261657715, "global_step": 140474, "epoch": 3344} {"train_loss": -6.708003997802734, "global_step": 140475, "epoch": 3344} {"train_loss": -6.799323081970215, "global_step": 140476, "epoch": 3344} {"train_loss": -6.871590614318848, "global_step": 140477, "epoch": 3344} {"train_loss": -6.754037857055664, "global_step": 140478, "epoch": 3344} {"train_loss": -6.796296119689941, "global_step": 140479, "epoch": 3344} {"train_loss": -6.834259510040283, "global_step": 140480, "epoch": 3344} {"train_loss": -6.722482681274414, "global_step": 140481, "epoch": 3344} {"train_loss": -6.8884077072143555, "global_step": 140482, "epoch": 3344} {"train_loss": -6.7257080078125, "global_step": 140483, "epoch": 3344} {"train_loss": -6.816473007202148, "global_step": 140484, "epoch": 3344} {"train_loss": -6.867856502532959, "global_step": 140485, "epoch": 3344} {"train_loss": -6.911436080932617, "global_step": 140486, "epoch": 3344} {"train_loss": -6.796477794647217, "global_step": 140487, "epoch": 3344} {"train_loss": -6.868050575256348, "global_step": 140488, "epoch": 3344} {"train_loss": -6.773108925138201, "global_step": 140489, "epoch": 3344, "val_loss": 78092.6484375} {"train_loss": -6.837718963623047, "global_step": 140490, "epoch": 3345} {"train_loss": -6.737834930419922, "global_step": 140491, "epoch": 3345} {"train_loss": -6.818645000457764, "global_step": 140492, "epoch": 3345} {"train_loss": -6.808543682098389, "global_step": 140493, "epoch": 3345} {"train_loss": -6.762775421142578, "global_step": 140494, "epoch": 3345} {"train_loss": -6.696746349334717, "global_step": 140495, "epoch": 3345} {"train_loss": -6.923103332519531, "global_step": 140496, "epoch": 3345} {"train_loss": -6.896822452545166, "global_step": 140497, "epoch": 3345} {"train_loss": -6.883737087249756, "global_step": 140498, "epoch": 3345} {"train_loss": -6.8877973556518555, "global_step": 140499, "epoch": 3345} {"train_loss": -6.680742263793945, "global_step": 140500, "epoch": 3345} {"train_loss": -6.7325310707092285, "global_step": 140501, "epoch": 3345} {"train_loss": -6.864987373352051, "global_step": 140502, "epoch": 3345} {"train_loss": -6.809426307678223, "global_step": 140503, "epoch": 3345} {"train_loss": -6.91175651550293, "global_step": 140504, "epoch": 3345} {"train_loss": -6.812129020690918, "global_step": 140505, "epoch": 3345} {"train_loss": -6.795792579650879, "global_step": 140506, "epoch": 3345} {"train_loss": -6.680283546447754, "global_step": 140507, "epoch": 3345} {"train_loss": -6.750294208526611, "global_step": 140508, "epoch": 3345} {"train_loss": -6.7250494956970215, "global_step": 140509, "epoch": 3345} {"train_loss": -6.751219749450684, "global_step": 140510, "epoch": 3345} {"train_loss": -6.7853899002075195, "global_step": 140511, "epoch": 3345} {"train_loss": -6.674196243286133, "global_step": 140512, "epoch": 3345} {"train_loss": -6.7238311767578125, "global_step": 140513, "epoch": 3345} {"train_loss": -6.73902702331543, "global_step": 140514, "epoch": 3345} {"train_loss": -6.770096778869629, "global_step": 140515, "epoch": 3345} {"train_loss": -6.727051734924316, "global_step": 140516, "epoch": 3345} {"train_loss": -6.806332111358643, "global_step": 140517, "epoch": 3345} {"train_loss": -6.754513740539551, "global_step": 140518, "epoch": 3345} {"train_loss": -6.850184917449951, "global_step": 140519, "epoch": 3345} {"train_loss": -6.793527603149414, "global_step": 140520, "epoch": 3345} {"train_loss": -6.910930633544922, "global_step": 140521, "epoch": 3345} {"train_loss": -6.766329765319824, "global_step": 140522, "epoch": 3345} {"train_loss": -6.802976131439209, "global_step": 140523, "epoch": 3345} {"train_loss": -6.725264549255371, "global_step": 140524, "epoch": 3345} {"train_loss": -6.757848262786865, "global_step": 140525, "epoch": 3345} {"train_loss": -6.669224262237549, "global_step": 140526, "epoch": 3345} {"train_loss": -6.749057292938232, "global_step": 140527, "epoch": 3345} {"train_loss": -6.655970573425293, "global_step": 140528, "epoch": 3345} {"train_loss": -6.530524253845215, "global_step": 140529, "epoch": 3345} {"train_loss": -6.7219390869140625, "global_step": 140530, "epoch": 3345} {"train_loss": -6.768935544150216, "global_step": 140531, "epoch": 3345, "val_loss": 78136.46875} {"train_loss": -6.766880512237549, "global_step": 140532, "epoch": 3346} {"train_loss": -6.642906188964844, "global_step": 140533, "epoch": 3346} {"train_loss": -6.66463041305542, "global_step": 140534, "epoch": 3346} {"train_loss": -6.7849555015563965, "global_step": 140535, "epoch": 3346} {"train_loss": -6.603432655334473, "global_step": 140536, "epoch": 3346} {"train_loss": -6.6683125495910645, "global_step": 140537, "epoch": 3346} {"train_loss": -6.55400276184082, "global_step": 140538, "epoch": 3346} {"train_loss": -6.7016921043396, "global_step": 140539, "epoch": 3346} {"train_loss": -6.81784725189209, "global_step": 140540, "epoch": 3346} {"train_loss": -6.736372947692871, "global_step": 140541, "epoch": 3346} {"train_loss": -6.833884239196777, "global_step": 140542, "epoch": 3346} {"train_loss": -6.726240158081055, "global_step": 140543, "epoch": 3346} {"train_loss": -6.77388858795166, "global_step": 140544, "epoch": 3346} {"train_loss": -6.685007095336914, "global_step": 140545, "epoch": 3346} {"train_loss": -6.728897571563721, "global_step": 140546, "epoch": 3346} {"train_loss": -6.7754597663879395, "global_step": 140547, "epoch": 3346} {"train_loss": -6.675107955932617, "global_step": 140548, "epoch": 3346} {"train_loss": -6.79000186920166, "global_step": 140549, "epoch": 3346} {"train_loss": -6.643209457397461, "global_step": 140550, "epoch": 3346} {"train_loss": -6.712105751037598, "global_step": 140551, "epoch": 3346} {"train_loss": -6.719071388244629, "global_step": 140552, "epoch": 3346} {"train_loss": -6.813963890075684, "global_step": 140553, "epoch": 3346} {"train_loss": -6.669438362121582, "global_step": 140554, "epoch": 3346} {"train_loss": -6.9198784828186035, "global_step": 140555, "epoch": 3346} {"train_loss": -6.832373142242432, "global_step": 140556, "epoch": 3346} {"train_loss": -6.719237327575684, "global_step": 140557, "epoch": 3346} {"train_loss": -6.800130844116211, "global_step": 140558, "epoch": 3346} {"train_loss": -6.678558826446533, "global_step": 140559, "epoch": 3346} {"train_loss": -6.728583335876465, "global_step": 140560, "epoch": 3346} {"train_loss": -6.75646448135376, "global_step": 140561, "epoch": 3346} {"train_loss": -6.683366775512695, "global_step": 140562, "epoch": 3346} {"train_loss": -6.663578033447266, "global_step": 140563, "epoch": 3346} {"train_loss": -6.660078048706055, "global_step": 140564, "epoch": 3346} {"train_loss": -6.568129539489746, "global_step": 140565, "epoch": 3346} {"train_loss": -6.772580146789551, "global_step": 140566, "epoch": 3346} {"train_loss": -6.754903793334961, "global_step": 140567, "epoch": 3346} {"train_loss": -6.627098083496094, "global_step": 140568, "epoch": 3346} {"train_loss": -6.8613715171813965, "global_step": 140569, "epoch": 3346} {"train_loss": -6.512724876403809, "global_step": 140570, "epoch": 3346} {"train_loss": -6.8402557373046875, "global_step": 140571, "epoch": 3346} {"train_loss": -6.741887092590332, "global_step": 140572, "epoch": 3346} {"train_loss": -6.720066536040533, "global_step": 140573, "epoch": 3346, "val_loss": 78345.1171875} {"train_loss": -6.823216438293457, "global_step": 140574, "epoch": 3347} {"train_loss": -6.73483419418335, "global_step": 140575, "epoch": 3347} {"train_loss": -6.710150718688965, "global_step": 140576, "epoch": 3347} {"train_loss": -6.6718339920043945, "global_step": 140577, "epoch": 3347} {"train_loss": -6.656511306762695, "global_step": 140578, "epoch": 3347} {"train_loss": -6.818727493286133, "global_step": 140579, "epoch": 3347} {"train_loss": -6.780187606811523, "global_step": 140580, "epoch": 3347} {"train_loss": -6.7997307777404785, "global_step": 140581, "epoch": 3347} {"train_loss": -6.609632968902588, "global_step": 140582, "epoch": 3347} {"train_loss": -6.80086088180542, "global_step": 140583, "epoch": 3347} {"train_loss": -6.821990489959717, "global_step": 140584, "epoch": 3347} {"train_loss": -6.746549606323242, "global_step": 140585, "epoch": 3347} {"train_loss": -6.764693737030029, "global_step": 140586, "epoch": 3347} {"train_loss": -6.77574348449707, "global_step": 140587, "epoch": 3347} {"train_loss": -6.810263633728027, "global_step": 140588, "epoch": 3347} {"train_loss": -6.791809558868408, "global_step": 140589, "epoch": 3347} {"train_loss": -6.749698638916016, "global_step": 140590, "epoch": 3347} {"train_loss": -6.724770545959473, "global_step": 140591, "epoch": 3347} {"train_loss": -6.7554521560668945, "global_step": 140592, "epoch": 3347} {"train_loss": -6.864717483520508, "global_step": 140593, "epoch": 3347} {"train_loss": -6.7718400955200195, "global_step": 140594, "epoch": 3347} {"train_loss": -6.798650741577148, "global_step": 140595, "epoch": 3347} {"train_loss": -6.779331207275391, "global_step": 140596, "epoch": 3347} {"train_loss": -6.731695175170898, "global_step": 140597, "epoch": 3347} {"train_loss": -6.773910999298096, "global_step": 140598, "epoch": 3347} {"train_loss": -6.731776237487793, "global_step": 140599, "epoch": 3347} {"train_loss": -6.967360496520996, "global_step": 140600, "epoch": 3347} {"train_loss": -6.7730255126953125, "global_step": 140601, "epoch": 3347} {"train_loss": -6.807708740234375, "global_step": 140602, "epoch": 3347} {"train_loss": -6.758167266845703, "global_step": 140603, "epoch": 3347} {"train_loss": -6.809557914733887, "global_step": 140604, "epoch": 3347} {"train_loss": -6.850112438201904, "global_step": 140605, "epoch": 3347} {"train_loss": -6.905383110046387, "global_step": 140606, "epoch": 3347} {"train_loss": -6.7935075759887695, "global_step": 140607, "epoch": 3347} {"train_loss": -6.844054698944092, "global_step": 140608, "epoch": 3347} {"train_loss": -6.814800262451172, "global_step": 140609, "epoch": 3347} {"train_loss": -6.744919776916504, "global_step": 140610, "epoch": 3347} {"train_loss": -6.819209098815918, "global_step": 140611, "epoch": 3347} {"train_loss": -6.882225513458252, "global_step": 140612, "epoch": 3347} {"train_loss": -6.720788955688477, "global_step": 140613, "epoch": 3347} {"train_loss": -6.777632236480713, "global_step": 140614, "epoch": 3347} {"train_loss": -6.7846848737625844, "global_step": 140615, "epoch": 3347, "val_loss": 78211.6484375} {"train_loss": -6.896040916442871, "global_step": 140616, "epoch": 3348} {"train_loss": -6.7885284423828125, "global_step": 140617, "epoch": 3348} {"train_loss": -6.782608985900879, "global_step": 140618, "epoch": 3348} {"train_loss": -6.786090850830078, "global_step": 140619, "epoch": 3348} {"train_loss": -6.862828254699707, "global_step": 140620, "epoch": 3348} {"train_loss": -6.915173530578613, "global_step": 140621, "epoch": 3348} {"train_loss": -6.870578289031982, "global_step": 140622, "epoch": 3348} {"train_loss": -6.768745422363281, "global_step": 140623, "epoch": 3348} {"train_loss": -6.748104095458984, "global_step": 140624, "epoch": 3348} {"train_loss": -6.807182312011719, "global_step": 140625, "epoch": 3348} {"train_loss": -6.842557430267334, "global_step": 140626, "epoch": 3348} {"train_loss": -6.759267807006836, "global_step": 140627, "epoch": 3348} {"train_loss": -6.692002296447754, "global_step": 140628, "epoch": 3348} {"train_loss": -6.708889961242676, "global_step": 140629, "epoch": 3348} {"train_loss": -6.852342128753662, "global_step": 140630, "epoch": 3348} {"train_loss": -6.663071632385254, "global_step": 140631, "epoch": 3348} {"train_loss": -6.680115699768066, "global_step": 140632, "epoch": 3348} {"train_loss": -6.745102882385254, "global_step": 140633, "epoch": 3348} {"train_loss": -6.776602268218994, "global_step": 140634, "epoch": 3348} {"train_loss": -6.721723556518555, "global_step": 140635, "epoch": 3348} {"train_loss": -6.841860771179199, "global_step": 140636, "epoch": 3348} {"train_loss": -6.644604682922363, "global_step": 140637, "epoch": 3348} {"train_loss": -6.790719985961914, "global_step": 140638, "epoch": 3348} {"train_loss": -6.799888610839844, "global_step": 140639, "epoch": 3348} {"train_loss": -6.721153259277344, "global_step": 140640, "epoch": 3348} {"train_loss": -6.789438247680664, "global_step": 140641, "epoch": 3348} {"train_loss": -6.770308494567871, "global_step": 140642, "epoch": 3348} {"train_loss": -6.773982048034668, "global_step": 140643, "epoch": 3348} {"train_loss": -6.747116565704346, "global_step": 140644, "epoch": 3348} {"train_loss": -6.6455793380737305, "global_step": 140645, "epoch": 3348} {"train_loss": -6.844587326049805, "global_step": 140646, "epoch": 3348} {"train_loss": -6.732174873352051, "global_step": 140647, "epoch": 3348} {"train_loss": -6.804662227630615, "global_step": 140648, "epoch": 3348} {"train_loss": -6.7399420738220215, "global_step": 140649, "epoch": 3348} {"train_loss": -6.729118347167969, "global_step": 140650, "epoch": 3348} {"train_loss": -6.81827449798584, "global_step": 140651, "epoch": 3348} {"train_loss": -6.723655700683594, "global_step": 140652, "epoch": 3348} {"train_loss": -6.663572311401367, "global_step": 140653, "epoch": 3348} {"train_loss": -6.794066429138184, "global_step": 140654, "epoch": 3348} {"train_loss": -6.901494026184082, "global_step": 140655, "epoch": 3348} {"train_loss": -6.850127220153809, "global_step": 140656, "epoch": 3348} {"train_loss": -6.775407371066866, "global_step": 140657, "epoch": 3348, "val_loss": 78064.6875} {"train_loss": -6.83393669128418, "global_step": 140658, "epoch": 3349} {"train_loss": -6.866159915924072, "global_step": 140659, "epoch": 3349} {"train_loss": -6.738263130187988, "global_step": 140660, "epoch": 3349} {"train_loss": -6.891779899597168, "global_step": 140661, "epoch": 3349} {"train_loss": -6.726950645446777, "global_step": 140662, "epoch": 3349} {"train_loss": -6.778926849365234, "global_step": 140663, "epoch": 3349} {"train_loss": -6.787894248962402, "global_step": 140664, "epoch": 3349} {"train_loss": -6.905800819396973, "global_step": 140665, "epoch": 3349} {"train_loss": -6.706833362579346, "global_step": 140666, "epoch": 3349} {"train_loss": -6.793348789215088, "global_step": 140667, "epoch": 3349} {"train_loss": -6.775940895080566, "global_step": 140668, "epoch": 3349} {"train_loss": -6.770842552185059, "global_step": 140669, "epoch": 3349} {"train_loss": -6.863244533538818, "global_step": 140670, "epoch": 3349} {"train_loss": -6.723141670227051, "global_step": 140671, "epoch": 3349} {"train_loss": -6.7605509757995605, "global_step": 140672, "epoch": 3349} {"train_loss": -6.818141937255859, "global_step": 140673, "epoch": 3349} {"train_loss": -6.827520370483398, "global_step": 140674, "epoch": 3349} {"train_loss": -6.763467788696289, "global_step": 140675, "epoch": 3349} {"train_loss": -6.855537414550781, "global_step": 140676, "epoch": 3349} {"train_loss": -6.76959228515625, "global_step": 140677, "epoch": 3349} {"train_loss": -6.8135600090026855, "global_step": 140678, "epoch": 3349} {"train_loss": -6.854434013366699, "global_step": 140679, "epoch": 3349} {"train_loss": -6.794894218444824, "global_step": 140680, "epoch": 3349} {"train_loss": -6.753404140472412, "global_step": 140681, "epoch": 3349} {"train_loss": -6.670588493347168, "global_step": 140682, "epoch": 3349} {"train_loss": -6.7908854484558105, "global_step": 140683, "epoch": 3349} {"train_loss": -6.738354682922363, "global_step": 140684, "epoch": 3349} {"train_loss": -6.701083660125732, "global_step": 140685, "epoch": 3349} {"train_loss": -6.769853591918945, "global_step": 140686, "epoch": 3349} {"train_loss": -6.8325395584106445, "global_step": 140687, "epoch": 3349} {"train_loss": -6.647861480712891, "global_step": 140688, "epoch": 3349} {"train_loss": -6.775132179260254, "global_step": 140689, "epoch": 3349} {"train_loss": -6.725472927093506, "global_step": 140690, "epoch": 3349} {"train_loss": -6.776829719543457, "global_step": 140691, "epoch": 3349} {"train_loss": -6.764167785644531, "global_step": 140692, "epoch": 3349} {"train_loss": -6.693558216094971, "global_step": 140693, "epoch": 3349} {"train_loss": -6.684004306793213, "global_step": 140694, "epoch": 3349} {"train_loss": -6.7620849609375, "global_step": 140695, "epoch": 3349} {"train_loss": -6.620068550109863, "global_step": 140696, "epoch": 3349} {"train_loss": -6.776039123535156, "global_step": 140697, "epoch": 3349} {"train_loss": -6.7552971839904785, "global_step": 140698, "epoch": 3349} {"train_loss": -6.771483818689982, "global_step": 140699, "epoch": 3349, "val_loss": 78141.7890625} {"train_loss": -6.937555313110352, "global_step": 140700, "epoch": 3350} {"train_loss": -6.706500053405762, "global_step": 140701, "epoch": 3350} {"train_loss": -6.702364921569824, "global_step": 140702, "epoch": 3350} {"train_loss": -6.663158416748047, "global_step": 140703, "epoch": 3350} {"train_loss": -6.681691646575928, "global_step": 140704, "epoch": 3350} {"train_loss": -6.691189765930176, "global_step": 140705, "epoch": 3350} {"train_loss": -6.613471508026123, "global_step": 140706, "epoch": 3350} {"train_loss": -6.567950248718262, "global_step": 140707, "epoch": 3350} {"train_loss": -6.787746429443359, "global_step": 140708, "epoch": 3350} {"train_loss": -6.70049524307251, "global_step": 140709, "epoch": 3350} {"train_loss": -6.787974834442139, "global_step": 140710, "epoch": 3350} {"train_loss": -6.705021858215332, "global_step": 140711, "epoch": 3350} {"train_loss": -6.700199127197266, "global_step": 140712, "epoch": 3350} {"train_loss": -6.7411346435546875, "global_step": 140713, "epoch": 3350} {"train_loss": -6.730526447296143, "global_step": 140714, "epoch": 3350} {"train_loss": -6.751889705657959, "global_step": 140715, "epoch": 3350} {"train_loss": -6.750571250915527, "global_step": 140716, "epoch": 3350} {"train_loss": -6.781347274780273, "global_step": 140717, "epoch": 3350} {"train_loss": -6.810923099517822, "global_step": 140718, "epoch": 3350} {"train_loss": -6.69193696975708, "global_step": 140719, "epoch": 3350} {"train_loss": -6.763903617858887, "global_step": 140720, "epoch": 3350} {"train_loss": -6.781201362609863, "global_step": 140721, "epoch": 3350} {"train_loss": -6.86784553527832, "global_step": 140722, "epoch": 3350} {"train_loss": -6.771821022033691, "global_step": 140723, "epoch": 3350} {"train_loss": -6.708499431610107, "global_step": 140724, "epoch": 3350} {"train_loss": -6.782980918884277, "global_step": 140725, "epoch": 3350} {"train_loss": -6.844572067260742, "global_step": 140726, "epoch": 3350} {"train_loss": -6.785066604614258, "global_step": 140727, "epoch": 3350} {"train_loss": -6.845534324645996, "global_step": 140728, "epoch": 3350} {"train_loss": -6.753111839294434, "global_step": 140729, "epoch": 3350} {"train_loss": -6.834710121154785, "global_step": 140730, "epoch": 3350} {"train_loss": -6.72917366027832, "global_step": 140731, "epoch": 3350} {"train_loss": -6.7668561935424805, "global_step": 140732, "epoch": 3350} {"train_loss": -6.682041645050049, "global_step": 140733, "epoch": 3350} {"train_loss": -6.749393939971924, "global_step": 140734, "epoch": 3350} {"train_loss": -6.7905497550964355, "global_step": 140735, "epoch": 3350} {"train_loss": -6.728322505950928, "global_step": 140736, "epoch": 3350} {"train_loss": -6.619690895080566, "global_step": 140737, "epoch": 3350} {"train_loss": -6.73663330078125, "global_step": 140738, "epoch": 3350} {"train_loss": -6.715665817260742, "global_step": 140739, "epoch": 3350} {"train_loss": -6.794556617736816, "global_step": 140740, "epoch": 3350} {"train_loss": -6.745847520374117, "global_step": 140741, "epoch": 3350, "train/sim_max_reward_0": 0.979268642966024, "train/sim_max_reward_1": 0.9189955356866386, "train/sim_max_reward_2": 0.48209791235326205, "train/sim_max_reward_3": 0.1398271320043724, "train/sim_max_reward_4": 0.455373774685323, "train/sim_max_reward_5": 0.5798204392839919, "test/sim_max_reward_4500000": 0.9200529224042804, "test/sim_max_reward_4500001": 0.9475415240730499, "test/sim_max_reward_4500002": 0.9158763046572482, "test/sim_max_reward_4500003": 0.9561117987300861, "test/sim_max_reward_4500004": 0.14811348176091244, "test/sim_max_reward_4500005": 0.4091401986825263, "test/sim_max_reward_4500006": 0.9292015673019552, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.8764012226256473, "test/sim_max_reward_4500009": 0.05352865159482127, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9920078895549417, "test/sim_max_reward_4500012": 0.9946382573956826, "test/sim_max_reward_4500013": 0.0020087518360477753, "test/sim_max_reward_4500014": 0.3826917125095503, "test/sim_max_reward_4500015": 0.9124583930072588, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.17588443013062, "test/sim_max_reward_4500018": 0.4226182933911735, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.45807314532069465, "test/sim_max_reward_4500022": 0.9494887455603399, "test/sim_max_reward_4500023": 0.9201931006231416, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.6800083886391732, "test/sim_max_reward_4500026": 0.8847000621186537, "test/sim_max_reward_4500027": 0.9606405923409366, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.13060110357851387, "test/sim_max_reward_4500030": 0.8819727847954414, "test/sim_max_reward_4500031": 0.3915636665326893, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.23141728338571813, "test/sim_max_reward_4500034": 0.8799340686159419, "test/sim_max_reward_4500035": 0.6557578987709756, "test/sim_max_reward_4500036": 0.9788131936184299, "test/sim_max_reward_4500037": 0.8623090944747223, "test/sim_max_reward_4500038": 0.3155143871791256, "test/sim_max_reward_4500039": 0.9019591217734348, "test/sim_max_reward_4500040": 0.940080386960197, "test/sim_max_reward_4500041": 0.7305990454819871, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.25480739262707636, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.3954526739269966, "test/sim_max_reward_4500046": 0.20193610541546148, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 0.9827074061352896, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5925639061632686, "test/mean_score": 0.558029516092605, "val_loss": 78074.4921875} {"train_loss": -6.659881591796875, "global_step": 140742, "epoch": 3351} {"train_loss": -6.633062362670898, "global_step": 140743, "epoch": 3351} {"train_loss": -6.770406246185303, "global_step": 140744, "epoch": 3351} {"train_loss": -6.518986701965332, "global_step": 140745, "epoch": 3351} {"train_loss": -6.88558292388916, "global_step": 140746, "epoch": 3351} {"train_loss": -6.656789302825928, "global_step": 140747, "epoch": 3351} {"train_loss": -6.599416732788086, "global_step": 140748, "epoch": 3351} {"train_loss": -6.590146064758301, "global_step": 140749, "epoch": 3351} {"train_loss": -6.568948745727539, "global_step": 140750, "epoch": 3351} {"train_loss": -6.724865436553955, "global_step": 140751, "epoch": 3351} {"train_loss": -6.5365095138549805, "global_step": 140752, "epoch": 3351} {"train_loss": -6.71026611328125, "global_step": 140753, "epoch": 3351} {"train_loss": -6.57148551940918, "global_step": 140754, "epoch": 3351} {"train_loss": -6.613454818725586, "global_step": 140755, "epoch": 3351} {"train_loss": -6.621679306030273, "global_step": 140756, "epoch": 3351} {"train_loss": -6.619765281677246, "global_step": 140757, "epoch": 3351} {"train_loss": -6.7177324295043945, "global_step": 140758, "epoch": 3351} {"train_loss": -6.599096298217773, "global_step": 140759, "epoch": 3351} {"train_loss": -6.732776165008545, "global_step": 140760, "epoch": 3351} {"train_loss": -6.615824222564697, "global_step": 140761, "epoch": 3351} {"train_loss": -6.677947521209717, "global_step": 140762, "epoch": 3351} {"train_loss": -6.590152740478516, "global_step": 140763, "epoch": 3351} {"train_loss": -6.548429012298584, "global_step": 140764, "epoch": 3351} {"train_loss": -6.760930061340332, "global_step": 140765, "epoch": 3351} {"train_loss": -6.685311317443848, "global_step": 140766, "epoch": 3351} {"train_loss": -6.744121551513672, "global_step": 140767, "epoch": 3351} {"train_loss": -6.675127029418945, "global_step": 140768, "epoch": 3351} {"train_loss": -6.76479434967041, "global_step": 140769, "epoch": 3351} {"train_loss": -6.584471225738525, "global_step": 140770, "epoch": 3351} {"train_loss": -6.639510154724121, "global_step": 140771, "epoch": 3351} {"train_loss": -6.740976333618164, "global_step": 140772, "epoch": 3351} {"train_loss": -6.663943290710449, "global_step": 140773, "epoch": 3351} {"train_loss": -6.7674665451049805, "global_step": 140774, "epoch": 3351} {"train_loss": -6.783204078674316, "global_step": 140775, "epoch": 3351} {"train_loss": -6.828902244567871, "global_step": 140776, "epoch": 3351} {"train_loss": -6.732518196105957, "global_step": 140777, "epoch": 3351} {"train_loss": -6.816338539123535, "global_step": 140778, "epoch": 3351} {"train_loss": -6.764047622680664, "global_step": 140779, "epoch": 3351} {"train_loss": -6.700081825256348, "global_step": 140780, "epoch": 3351} {"train_loss": -6.825945854187012, "global_step": 140781, "epoch": 3351} {"train_loss": -6.5667924880981445, "global_step": 140782, "epoch": 3351} {"train_loss": -6.679764917918614, "global_step": 140783, "epoch": 3351, "val_loss": 77972.0625} {"train_loss": -6.7847514152526855, "global_step": 140784, "epoch": 3352} {"train_loss": -6.739452362060547, "global_step": 140785, "epoch": 3352} {"train_loss": -6.796808242797852, "global_step": 140786, "epoch": 3352} {"train_loss": -6.666815280914307, "global_step": 140787, "epoch": 3352} {"train_loss": -6.746387004852295, "global_step": 140788, "epoch": 3352} {"train_loss": -6.7584028244018555, "global_step": 140789, "epoch": 3352} {"train_loss": -6.620643138885498, "global_step": 140790, "epoch": 3352} {"train_loss": -6.674200534820557, "global_step": 140791, "epoch": 3352} {"train_loss": -6.7596845626831055, "global_step": 140792, "epoch": 3352} {"train_loss": -6.781325817108154, "global_step": 140793, "epoch": 3352} {"train_loss": -6.8440046310424805, "global_step": 140794, "epoch": 3352} {"train_loss": -6.749493598937988, "global_step": 140795, "epoch": 3352} {"train_loss": -6.809082984924316, "global_step": 140796, "epoch": 3352} {"train_loss": -6.807092666625977, "global_step": 140797, "epoch": 3352} {"train_loss": -6.805130481719971, "global_step": 140798, "epoch": 3352} {"train_loss": -6.70430326461792, "global_step": 140799, "epoch": 3352} {"train_loss": -6.83074951171875, "global_step": 140800, "epoch": 3352} {"train_loss": -6.814220428466797, "global_step": 140801, "epoch": 3352} {"train_loss": -6.806552886962891, "global_step": 140802, "epoch": 3352} {"train_loss": -6.872175216674805, "global_step": 140803, "epoch": 3352} {"train_loss": -6.716988563537598, "global_step": 140804, "epoch": 3352} {"train_loss": -6.820502281188965, "global_step": 140805, "epoch": 3352} {"train_loss": -6.8318328857421875, "global_step": 140806, "epoch": 3352} {"train_loss": -6.716069221496582, "global_step": 140807, "epoch": 3352} {"train_loss": -6.8165998458862305, "global_step": 140808, "epoch": 3352} {"train_loss": -6.865185260772705, "global_step": 140809, "epoch": 3352} {"train_loss": -6.852176666259766, "global_step": 140810, "epoch": 3352} {"train_loss": -6.837204933166504, "global_step": 140811, "epoch": 3352} {"train_loss": -6.82358980178833, "global_step": 140812, "epoch": 3352} {"train_loss": -6.791717529296875, "global_step": 140813, "epoch": 3352} {"train_loss": -6.950685501098633, "global_step": 140814, "epoch": 3352} {"train_loss": -6.8547892570495605, "global_step": 140815, "epoch": 3352} {"train_loss": -6.806098461151123, "global_step": 140816, "epoch": 3352} {"train_loss": -6.859014511108398, "global_step": 140817, "epoch": 3352} {"train_loss": -6.845186710357666, "global_step": 140818, "epoch": 3352} {"train_loss": -6.77735710144043, "global_step": 140819, "epoch": 3352} {"train_loss": -6.731867790222168, "global_step": 140820, "epoch": 3352} {"train_loss": -6.660738945007324, "global_step": 140821, "epoch": 3352} {"train_loss": -6.7116498947143555, "global_step": 140822, "epoch": 3352} {"train_loss": -6.840290069580078, "global_step": 140823, "epoch": 3352} {"train_loss": -6.748217582702637, "global_step": 140824, "epoch": 3352} {"train_loss": -6.787420954023089, "global_step": 140825, "epoch": 3352, "val_loss": 78324.5546875} {"train_loss": -6.707939624786377, "global_step": 140826, "epoch": 3353} {"train_loss": -6.550128936767578, "global_step": 140827, "epoch": 3353} {"train_loss": -6.841990947723389, "global_step": 140828, "epoch": 3353} {"train_loss": -6.716865539550781, "global_step": 140829, "epoch": 3353} {"train_loss": -6.718199729919434, "global_step": 140830, "epoch": 3353} {"train_loss": -6.866971969604492, "global_step": 140831, "epoch": 3353} {"train_loss": -6.675040245056152, "global_step": 140832, "epoch": 3353} {"train_loss": -6.733083724975586, "global_step": 140833, "epoch": 3353} {"train_loss": -6.768655300140381, "global_step": 140834, "epoch": 3353} {"train_loss": -6.726099967956543, "global_step": 140835, "epoch": 3353} {"train_loss": -6.823875427246094, "global_step": 140836, "epoch": 3353} {"train_loss": -6.768481731414795, "global_step": 140837, "epoch": 3353} {"train_loss": -6.725586891174316, "global_step": 140838, "epoch": 3353} {"train_loss": -6.791788101196289, "global_step": 140839, "epoch": 3353} {"train_loss": -6.739658355712891, "global_step": 140840, "epoch": 3353} {"train_loss": -6.705234527587891, "global_step": 140841, "epoch": 3353} {"train_loss": -6.849442481994629, "global_step": 140842, "epoch": 3353} {"train_loss": -6.6876654624938965, "global_step": 140843, "epoch": 3353} {"train_loss": -6.693929672241211, "global_step": 140844, "epoch": 3353} {"train_loss": -6.741150856018066, "global_step": 140845, "epoch": 3353} {"train_loss": -6.602278709411621, "global_step": 140846, "epoch": 3353} {"train_loss": -6.766007423400879, "global_step": 140847, "epoch": 3353} {"train_loss": -6.739461421966553, "global_step": 140848, "epoch": 3353} {"train_loss": -6.768263816833496, "global_step": 140849, "epoch": 3353} {"train_loss": -6.733551979064941, "global_step": 140850, "epoch": 3353} {"train_loss": -6.635453224182129, "global_step": 140851, "epoch": 3353} {"train_loss": -6.748757362365723, "global_step": 140852, "epoch": 3353} {"train_loss": -6.681268692016602, "global_step": 140853, "epoch": 3353} {"train_loss": -6.718510150909424, "global_step": 140854, "epoch": 3353} {"train_loss": -6.709738254547119, "global_step": 140855, "epoch": 3353} {"train_loss": -6.743008136749268, "global_step": 140856, "epoch": 3353} {"train_loss": -6.645559787750244, "global_step": 140857, "epoch": 3353} {"train_loss": -6.63845157623291, "global_step": 140858, "epoch": 3353} {"train_loss": -6.785025119781494, "global_step": 140859, "epoch": 3353} {"train_loss": -6.8591766357421875, "global_step": 140860, "epoch": 3353} {"train_loss": -6.773754596710205, "global_step": 140861, "epoch": 3353} {"train_loss": -6.871316909790039, "global_step": 140862, "epoch": 3353} {"train_loss": -6.966940402984619, "global_step": 140863, "epoch": 3353} {"train_loss": -6.641445636749268, "global_step": 140864, "epoch": 3353} {"train_loss": -6.78143310546875, "global_step": 140865, "epoch": 3353} {"train_loss": -6.769956588745117, "global_step": 140866, "epoch": 3353} {"train_loss": -6.740666275932675, "global_step": 140867, "epoch": 3353, "val_loss": 77863.5234375} {"train_loss": -6.784111976623535, "global_step": 140868, "epoch": 3354} {"train_loss": -6.763671398162842, "global_step": 140869, "epoch": 3354} {"train_loss": -6.727199554443359, "global_step": 140870, "epoch": 3354} {"train_loss": -6.750327110290527, "global_step": 140871, "epoch": 3354} {"train_loss": -6.714476585388184, "global_step": 140872, "epoch": 3354} {"train_loss": -6.815291881561279, "global_step": 140873, "epoch": 3354} {"train_loss": -6.870396614074707, "global_step": 140874, "epoch": 3354} {"train_loss": -6.656050205230713, "global_step": 140875, "epoch": 3354} {"train_loss": -6.797215461730957, "global_step": 140876, "epoch": 3354} {"train_loss": -6.794992446899414, "global_step": 140877, "epoch": 3354} {"train_loss": -6.818498611450195, "global_step": 140878, "epoch": 3354} {"train_loss": -6.7823686599731445, "global_step": 140879, "epoch": 3354} {"train_loss": -6.8966875076293945, "global_step": 140880, "epoch": 3354} {"train_loss": -6.861561298370361, "global_step": 140881, "epoch": 3354} {"train_loss": -6.8339056968688965, "global_step": 140882, "epoch": 3354} {"train_loss": -6.792564392089844, "global_step": 140883, "epoch": 3354} {"train_loss": -6.784478187561035, "global_step": 140884, "epoch": 3354} {"train_loss": -6.870304107666016, "global_step": 140885, "epoch": 3354} {"train_loss": -6.8374738693237305, "global_step": 140886, "epoch": 3354} {"train_loss": -6.892396450042725, "global_step": 140887, "epoch": 3354} {"train_loss": -6.829081058502197, "global_step": 140888, "epoch": 3354} {"train_loss": -6.833755016326904, "global_step": 140889, "epoch": 3354} {"train_loss": -6.778258323669434, "global_step": 140890, "epoch": 3354} {"train_loss": -6.88665771484375, "global_step": 140891, "epoch": 3354} {"train_loss": -6.906562805175781, "global_step": 140892, "epoch": 3354} {"train_loss": -6.849099159240723, "global_step": 140893, "epoch": 3354} {"train_loss": -6.7035675048828125, "global_step": 140894, "epoch": 3354} {"train_loss": -6.8488593101501465, "global_step": 140895, "epoch": 3354} {"train_loss": -6.853600978851318, "global_step": 140896, "epoch": 3354} {"train_loss": -6.875058174133301, "global_step": 140897, "epoch": 3354} {"train_loss": -6.935964584350586, "global_step": 140898, "epoch": 3354} {"train_loss": -6.85476541519165, "global_step": 140899, "epoch": 3354} {"train_loss": -6.812597751617432, "global_step": 140900, "epoch": 3354} {"train_loss": -6.867616653442383, "global_step": 140901, "epoch": 3354} {"train_loss": -6.777781963348389, "global_step": 140902, "epoch": 3354} {"train_loss": -6.824220180511475, "global_step": 140903, "epoch": 3354} {"train_loss": -6.790584564208984, "global_step": 140904, "epoch": 3354} {"train_loss": -6.73676872253418, "global_step": 140905, "epoch": 3354} {"train_loss": -6.776854038238525, "global_step": 140906, "epoch": 3354} {"train_loss": -6.7575788497924805, "global_step": 140907, "epoch": 3354} {"train_loss": -6.80609130859375, "global_step": 140908, "epoch": 3354} {"train_loss": -6.812004078002203, "global_step": 140909, "epoch": 3354, "val_loss": 78310.9609375} {"train_loss": -6.716799736022949, "global_step": 140910, "epoch": 3355} {"train_loss": -6.854722499847412, "global_step": 140911, "epoch": 3355} {"train_loss": -6.628396987915039, "global_step": 140912, "epoch": 3355} {"train_loss": -6.761331558227539, "global_step": 140913, "epoch": 3355} {"train_loss": -6.798244476318359, "global_step": 140914, "epoch": 3355} {"train_loss": -6.742093086242676, "global_step": 140915, "epoch": 3355} {"train_loss": -6.812823295593262, "global_step": 140916, "epoch": 3355} {"train_loss": -6.922781467437744, "global_step": 140917, "epoch": 3355} {"train_loss": -6.785521507263184, "global_step": 140918, "epoch": 3355} {"train_loss": -6.758307456970215, "global_step": 140919, "epoch": 3355} {"train_loss": -6.93204927444458, "global_step": 140920, "epoch": 3355} {"train_loss": -6.905434608459473, "global_step": 140921, "epoch": 3355} {"train_loss": -6.907679557800293, "global_step": 140922, "epoch": 3355} {"train_loss": -6.8303022384643555, "global_step": 140923, "epoch": 3355} {"train_loss": -6.8476033210754395, "global_step": 140924, "epoch": 3355} {"train_loss": -6.823790073394775, "global_step": 140925, "epoch": 3355} {"train_loss": -6.8400187492370605, "global_step": 140926, "epoch": 3355} {"train_loss": -6.689899444580078, "global_step": 140927, "epoch": 3355} {"train_loss": -6.819799423217773, "global_step": 140928, "epoch": 3355} {"train_loss": -6.707681179046631, "global_step": 140929, "epoch": 3355} {"train_loss": -6.876351356506348, "global_step": 140930, "epoch": 3355} {"train_loss": -6.934460163116455, "global_step": 140931, "epoch": 3355} {"train_loss": -6.827874660491943, "global_step": 140932, "epoch": 3355} {"train_loss": -6.79680061340332, "global_step": 140933, "epoch": 3355} {"train_loss": -6.773764610290527, "global_step": 140934, "epoch": 3355} {"train_loss": -6.779706001281738, "global_step": 140935, "epoch": 3355} {"train_loss": -6.784868240356445, "global_step": 140936, "epoch": 3355} {"train_loss": -6.645952224731445, "global_step": 140937, "epoch": 3355} {"train_loss": -6.803023338317871, "global_step": 140938, "epoch": 3355} {"train_loss": -6.856335639953613, "global_step": 140939, "epoch": 3355} {"train_loss": -6.77655029296875, "global_step": 140940, "epoch": 3355} {"train_loss": -6.755362510681152, "global_step": 140941, "epoch": 3355} {"train_loss": -6.757692337036133, "global_step": 140942, "epoch": 3355} {"train_loss": -6.732176780700684, "global_step": 140943, "epoch": 3355} {"train_loss": -6.7943620681762695, "global_step": 140944, "epoch": 3355} {"train_loss": -6.8033037185668945, "global_step": 140945, "epoch": 3355} {"train_loss": -6.825103759765625, "global_step": 140946, "epoch": 3355} {"train_loss": -6.711771011352539, "global_step": 140947, "epoch": 3355} {"train_loss": -6.683504581451416, "global_step": 140948, "epoch": 3355} {"train_loss": -6.833845138549805, "global_step": 140949, "epoch": 3355} {"train_loss": -6.77678108215332, "global_step": 140950, "epoch": 3355} {"train_loss": -6.795019694737026, "global_step": 140951, "epoch": 3355, "val_loss": 78329.0078125} {"train_loss": -6.779696464538574, "global_step": 140952, "epoch": 3356} {"train_loss": -6.745372772216797, "global_step": 140953, "epoch": 3356} {"train_loss": -6.810763835906982, "global_step": 140954, "epoch": 3356} {"train_loss": -6.726413249969482, "global_step": 140955, "epoch": 3356} {"train_loss": -6.761483192443848, "global_step": 140956, "epoch": 3356} {"train_loss": -6.800821304321289, "global_step": 140957, "epoch": 3356} {"train_loss": -6.69807243347168, "global_step": 140958, "epoch": 3356} {"train_loss": -6.756742477416992, "global_step": 140959, "epoch": 3356} {"train_loss": -6.781259059906006, "global_step": 140960, "epoch": 3356} {"train_loss": -6.818630218505859, "global_step": 140961, "epoch": 3356} {"train_loss": -6.802278518676758, "global_step": 140962, "epoch": 3356} {"train_loss": -6.814244270324707, "global_step": 140963, "epoch": 3356} {"train_loss": -6.766382217407227, "global_step": 140964, "epoch": 3356} {"train_loss": -6.708794593811035, "global_step": 140965, "epoch": 3356} {"train_loss": -6.827548980712891, "global_step": 140966, "epoch": 3356} {"train_loss": -6.726519584655762, "global_step": 140967, "epoch": 3356} {"train_loss": -6.731054306030273, "global_step": 140968, "epoch": 3356} {"train_loss": -6.779545783996582, "global_step": 140969, "epoch": 3356} {"train_loss": -6.699213981628418, "global_step": 140970, "epoch": 3356} {"train_loss": -6.802005767822266, "global_step": 140971, "epoch": 3356} {"train_loss": -6.784196853637695, "global_step": 140972, "epoch": 3356} {"train_loss": -6.72726583480835, "global_step": 140973, "epoch": 3356} {"train_loss": -6.781402587890625, "global_step": 140974, "epoch": 3356} {"train_loss": -6.773522853851318, "global_step": 140975, "epoch": 3356} {"train_loss": -6.827483654022217, "global_step": 140976, "epoch": 3356} {"train_loss": -6.8085713386535645, "global_step": 140977, "epoch": 3356} {"train_loss": -6.793375492095947, "global_step": 140978, "epoch": 3356} {"train_loss": -6.836835861206055, "global_step": 140979, "epoch": 3356} {"train_loss": -6.7479634284973145, "global_step": 140980, "epoch": 3356} {"train_loss": -6.855780124664307, "global_step": 140981, "epoch": 3356} {"train_loss": -6.750211715698242, "global_step": 140982, "epoch": 3356} {"train_loss": -6.830503463745117, "global_step": 140983, "epoch": 3356} {"train_loss": -6.853794097900391, "global_step": 140984, "epoch": 3356} {"train_loss": -6.866942405700684, "global_step": 140985, "epoch": 3356} {"train_loss": -6.782327175140381, "global_step": 140986, "epoch": 3356} {"train_loss": -6.6985931396484375, "global_step": 140987, "epoch": 3356} {"train_loss": -6.765837669372559, "global_step": 140988, "epoch": 3356} {"train_loss": -6.618973731994629, "global_step": 140989, "epoch": 3356} {"train_loss": -6.797041893005371, "global_step": 140990, "epoch": 3356} {"train_loss": -6.888724327087402, "global_step": 140991, "epoch": 3356} {"train_loss": -6.69384765625, "global_step": 140992, "epoch": 3356} {"train_loss": -6.7766913913545155, "global_step": 140993, "epoch": 3356, "val_loss": 78256.5390625} {"train_loss": -6.703696250915527, "global_step": 140994, "epoch": 3357} {"train_loss": -6.849271774291992, "global_step": 140995, "epoch": 3357} {"train_loss": -6.655815124511719, "global_step": 140996, "epoch": 3357} {"train_loss": -6.755706787109375, "global_step": 140997, "epoch": 3357} {"train_loss": -6.801533222198486, "global_step": 140998, "epoch": 3357} {"train_loss": -6.553416728973389, "global_step": 140999, "epoch": 3357} {"train_loss": -6.825218200683594, "global_step": 141000, "epoch": 3357} {"train_loss": -6.778495788574219, "global_step": 141001, "epoch": 3357} {"train_loss": -6.706935882568359, "global_step": 141002, "epoch": 3357} {"train_loss": -6.721981048583984, "global_step": 141003, "epoch": 3357} {"train_loss": -6.781513690948486, "global_step": 141004, "epoch": 3357} {"train_loss": -6.845800399780273, "global_step": 141005, "epoch": 3357} {"train_loss": -6.818778991699219, "global_step": 141006, "epoch": 3357} {"train_loss": -6.814733982086182, "global_step": 141007, "epoch": 3357} {"train_loss": -6.720119953155518, "global_step": 141008, "epoch": 3357} {"train_loss": -6.715757369995117, "global_step": 141009, "epoch": 3357} {"train_loss": -6.76882266998291, "global_step": 141010, "epoch": 3357} {"train_loss": -6.674359321594238, "global_step": 141011, "epoch": 3357} {"train_loss": -6.732748031616211, "global_step": 141012, "epoch": 3357} {"train_loss": -6.738190650939941, "global_step": 141013, "epoch": 3357} {"train_loss": -6.843913555145264, "global_step": 141014, "epoch": 3357} {"train_loss": -6.862113952636719, "global_step": 141015, "epoch": 3357} {"train_loss": -6.7123565673828125, "global_step": 141016, "epoch": 3357} {"train_loss": -6.706403732299805, "global_step": 141017, "epoch": 3357} {"train_loss": -6.712325096130371, "global_step": 141018, "epoch": 3357} {"train_loss": -6.695815563201904, "global_step": 141019, "epoch": 3357} {"train_loss": -6.739528179168701, "global_step": 141020, "epoch": 3357} {"train_loss": -6.8436126708984375, "global_step": 141021, "epoch": 3357} {"train_loss": -6.760974884033203, "global_step": 141022, "epoch": 3357} {"train_loss": -6.752277851104736, "global_step": 141023, "epoch": 3357} {"train_loss": -6.717335224151611, "global_step": 141024, "epoch": 3357} {"train_loss": -6.678524971008301, "global_step": 141025, "epoch": 3357} {"train_loss": -6.694591522216797, "global_step": 141026, "epoch": 3357} {"train_loss": -6.837294101715088, "global_step": 141027, "epoch": 3357} {"train_loss": -6.847031593322754, "global_step": 141028, "epoch": 3357} {"train_loss": -6.695932388305664, "global_step": 141029, "epoch": 3357} {"train_loss": -6.758405685424805, "global_step": 141030, "epoch": 3357} {"train_loss": -6.84099006652832, "global_step": 141031, "epoch": 3357} {"train_loss": -6.702813148498535, "global_step": 141032, "epoch": 3357} {"train_loss": -6.82020378112793, "global_step": 141033, "epoch": 3357} {"train_loss": -6.683219909667969, "global_step": 141034, "epoch": 3357} {"train_loss": -6.751533962431408, "global_step": 141035, "epoch": 3357, "val_loss": 78278.8203125} {"train_loss": -6.755856513977051, "global_step": 141036, "epoch": 3358} {"train_loss": -6.692781448364258, "global_step": 141037, "epoch": 3358} {"train_loss": -6.5707550048828125, "global_step": 141038, "epoch": 3358} {"train_loss": -6.890807151794434, "global_step": 141039, "epoch": 3358} {"train_loss": -6.775869846343994, "global_step": 141040, "epoch": 3358} {"train_loss": -6.729829788208008, "global_step": 141041, "epoch": 3358} {"train_loss": -6.758319854736328, "global_step": 141042, "epoch": 3358} {"train_loss": -6.797700881958008, "global_step": 141043, "epoch": 3358} {"train_loss": -6.738637447357178, "global_step": 141044, "epoch": 3358} {"train_loss": -6.6941022872924805, "global_step": 141045, "epoch": 3358} {"train_loss": -6.630031108856201, "global_step": 141046, "epoch": 3358} {"train_loss": -6.794279098510742, "global_step": 141047, "epoch": 3358} {"train_loss": -6.917429447174072, "global_step": 141048, "epoch": 3358} {"train_loss": -6.720051288604736, "global_step": 141049, "epoch": 3358} {"train_loss": -6.638998985290527, "global_step": 141050, "epoch": 3358} {"train_loss": -6.629753112792969, "global_step": 141051, "epoch": 3358} {"train_loss": -6.805828094482422, "global_step": 141052, "epoch": 3358} {"train_loss": -6.68971061706543, "global_step": 141053, "epoch": 3358} {"train_loss": -6.689065933227539, "global_step": 141054, "epoch": 3358} {"train_loss": -6.6761322021484375, "global_step": 141055, "epoch": 3358} {"train_loss": -6.794706344604492, "global_step": 141056, "epoch": 3358} {"train_loss": -6.708502769470215, "global_step": 141057, "epoch": 3358} {"train_loss": -6.724339962005615, "global_step": 141058, "epoch": 3358} {"train_loss": -6.8297929763793945, "global_step": 141059, "epoch": 3358} {"train_loss": -6.8016557693481445, "global_step": 141060, "epoch": 3358} {"train_loss": -6.735811710357666, "global_step": 141061, "epoch": 3358} {"train_loss": -6.814242839813232, "global_step": 141062, "epoch": 3358} {"train_loss": -6.834159851074219, "global_step": 141063, "epoch": 3358} {"train_loss": -6.811196327209473, "global_step": 141064, "epoch": 3358} {"train_loss": -6.827073097229004, "global_step": 141065, "epoch": 3358} {"train_loss": -6.7075042724609375, "global_step": 141066, "epoch": 3358} {"train_loss": -6.805823802947998, "global_step": 141067, "epoch": 3358} {"train_loss": -6.79205322265625, "global_step": 141068, "epoch": 3358} {"train_loss": -6.849093437194824, "global_step": 141069, "epoch": 3358} {"train_loss": -6.83223819732666, "global_step": 141070, "epoch": 3358} {"train_loss": -6.891053676605225, "global_step": 141071, "epoch": 3358} {"train_loss": -6.73681116104126, "global_step": 141072, "epoch": 3358} {"train_loss": -6.7612714767456055, "global_step": 141073, "epoch": 3358} {"train_loss": -6.793769836425781, "global_step": 141074, "epoch": 3358} {"train_loss": -6.837923049926758, "global_step": 141075, "epoch": 3358} {"train_loss": -6.817877769470215, "global_step": 141076, "epoch": 3358} {"train_loss": -6.763865561712356, "global_step": 141077, "epoch": 3358, "val_loss": 77969.390625} {"train_loss": -6.83827018737793, "global_step": 141078, "epoch": 3359} {"train_loss": -6.922077178955078, "global_step": 141079, "epoch": 3359} {"train_loss": -6.710799217224121, "global_step": 141080, "epoch": 3359} {"train_loss": -6.825613021850586, "global_step": 141081, "epoch": 3359} {"train_loss": -6.789039611816406, "global_step": 141082, "epoch": 3359} {"train_loss": -6.804015159606934, "global_step": 141083, "epoch": 3359} {"train_loss": -6.762174129486084, "global_step": 141084, "epoch": 3359} {"train_loss": -6.781487464904785, "global_step": 141085, "epoch": 3359} {"train_loss": -6.792149543762207, "global_step": 141086, "epoch": 3359} {"train_loss": -6.751462459564209, "global_step": 141087, "epoch": 3359} {"train_loss": -6.7902021408081055, "global_step": 141088, "epoch": 3359} {"train_loss": -6.77017068862915, "global_step": 141089, "epoch": 3359} {"train_loss": -6.782256126403809, "global_step": 141090, "epoch": 3359} {"train_loss": -6.8391265869140625, "global_step": 141091, "epoch": 3359} {"train_loss": -6.781970977783203, "global_step": 141092, "epoch": 3359} {"train_loss": -6.8404412269592285, "global_step": 141093, "epoch": 3359} {"train_loss": -6.718592166900635, "global_step": 141094, "epoch": 3359} {"train_loss": -6.836836814880371, "global_step": 141095, "epoch": 3359} {"train_loss": -6.750458717346191, "global_step": 141096, "epoch": 3359} {"train_loss": -6.819762706756592, "global_step": 141097, "epoch": 3359} {"train_loss": -6.837983131408691, "global_step": 141098, "epoch": 3359} {"train_loss": -6.8277130126953125, "global_step": 141099, "epoch": 3359} {"train_loss": -6.709977626800537, "global_step": 141100, "epoch": 3359} {"train_loss": -6.831107139587402, "global_step": 141101, "epoch": 3359} {"train_loss": -6.799308776855469, "global_step": 141102, "epoch": 3359} {"train_loss": -6.865163326263428, "global_step": 141103, "epoch": 3359} {"train_loss": -6.836932182312012, "global_step": 141104, "epoch": 3359} {"train_loss": -6.781885623931885, "global_step": 141105, "epoch": 3359} {"train_loss": -6.812417030334473, "global_step": 141106, "epoch": 3359} {"train_loss": -6.87729024887085, "global_step": 141107, "epoch": 3359} {"train_loss": -6.817721366882324, "global_step": 141108, "epoch": 3359} {"train_loss": -6.876104354858398, "global_step": 141109, "epoch": 3359} {"train_loss": -6.929750442504883, "global_step": 141110, "epoch": 3359} {"train_loss": -6.734267711639404, "global_step": 141111, "epoch": 3359} {"train_loss": -6.824204444885254, "global_step": 141112, "epoch": 3359} {"train_loss": -6.791578769683838, "global_step": 141113, "epoch": 3359} {"train_loss": -6.69795036315918, "global_step": 141114, "epoch": 3359} {"train_loss": -6.818814754486084, "global_step": 141115, "epoch": 3359} {"train_loss": -6.796368598937988, "global_step": 141116, "epoch": 3359} {"train_loss": -6.686359882354736, "global_step": 141117, "epoch": 3359} {"train_loss": -6.6438398361206055, "global_step": 141118, "epoch": 3359} {"train_loss": -6.796647900626773, "global_step": 141119, "epoch": 3359, "val_loss": 78369.875} {"train_loss": -6.738898277282715, "global_step": 141120, "epoch": 3360} {"train_loss": -6.498858451843262, "global_step": 141121, "epoch": 3360} {"train_loss": -6.564934730529785, "global_step": 141122, "epoch": 3360} {"train_loss": -6.701737880706787, "global_step": 141123, "epoch": 3360} {"train_loss": -6.510664939880371, "global_step": 141124, "epoch": 3360} {"train_loss": -6.640779495239258, "global_step": 141125, "epoch": 3360} {"train_loss": -6.7769575119018555, "global_step": 141126, "epoch": 3360} {"train_loss": -6.64689826965332, "global_step": 141127, "epoch": 3360} {"train_loss": -6.758505821228027, "global_step": 141128, "epoch": 3360} {"train_loss": -6.715605735778809, "global_step": 141129, "epoch": 3360} {"train_loss": -6.6780500411987305, "global_step": 141130, "epoch": 3360} {"train_loss": -6.7723612785339355, "global_step": 141131, "epoch": 3360} {"train_loss": -6.773791790008545, "global_step": 141132, "epoch": 3360} {"train_loss": -6.639269828796387, "global_step": 141133, "epoch": 3360} {"train_loss": -6.733282089233398, "global_step": 141134, "epoch": 3360} {"train_loss": -6.688333034515381, "global_step": 141135, "epoch": 3360} {"train_loss": -6.738663673400879, "global_step": 141136, "epoch": 3360} {"train_loss": -6.802567481994629, "global_step": 141137, "epoch": 3360} {"train_loss": -6.696981430053711, "global_step": 141138, "epoch": 3360} {"train_loss": -6.712804794311523, "global_step": 141139, "epoch": 3360} {"train_loss": -6.752578258514404, "global_step": 141140, "epoch": 3360} {"train_loss": -6.767845630645752, "global_step": 141141, "epoch": 3360} {"train_loss": -6.647051811218262, "global_step": 141142, "epoch": 3360} {"train_loss": -6.871755599975586, "global_step": 141143, "epoch": 3360} {"train_loss": -6.696583271026611, "global_step": 141144, "epoch": 3360} {"train_loss": -6.794991493225098, "global_step": 141145, "epoch": 3360} {"train_loss": -6.7303056716918945, "global_step": 141146, "epoch": 3360} {"train_loss": -6.661068439483643, "global_step": 141147, "epoch": 3360} {"train_loss": -6.736964702606201, "global_step": 141148, "epoch": 3360} {"train_loss": -6.833952903747559, "global_step": 141149, "epoch": 3360} {"train_loss": -6.778653621673584, "global_step": 141150, "epoch": 3360} {"train_loss": -6.749619483947754, "global_step": 141151, "epoch": 3360} {"train_loss": -6.72910737991333, "global_step": 141152, "epoch": 3360} {"train_loss": -6.724740505218506, "global_step": 141153, "epoch": 3360} {"train_loss": -6.667333126068115, "global_step": 141154, "epoch": 3360} {"train_loss": -6.785205364227295, "global_step": 141155, "epoch": 3360} {"train_loss": -6.690357208251953, "global_step": 141156, "epoch": 3360} {"train_loss": -6.760767936706543, "global_step": 141157, "epoch": 3360} {"train_loss": -6.686659336090088, "global_step": 141158, "epoch": 3360} {"train_loss": -6.699066638946533, "global_step": 141159, "epoch": 3360} {"train_loss": -6.662452697753906, "global_step": 141160, "epoch": 3360} {"train_loss": -6.712153514226277, "global_step": 141161, "epoch": 3360, "val_loss": 78111.8359375} {"train_loss": -6.685967445373535, "global_step": 141162, "epoch": 3361} {"train_loss": -6.755825996398926, "global_step": 141163, "epoch": 3361} {"train_loss": -6.895792484283447, "global_step": 141164, "epoch": 3361} {"train_loss": -6.698474884033203, "global_step": 141165, "epoch": 3361} {"train_loss": -6.710357189178467, "global_step": 141166, "epoch": 3361} {"train_loss": -6.730921745300293, "global_step": 141167, "epoch": 3361} {"train_loss": -6.785279273986816, "global_step": 141168, "epoch": 3361} {"train_loss": -6.835094928741455, "global_step": 141169, "epoch": 3361} {"train_loss": -6.797815322875977, "global_step": 141170, "epoch": 3361} {"train_loss": -6.706708908081055, "global_step": 141171, "epoch": 3361} {"train_loss": -6.735710620880127, "global_step": 141172, "epoch": 3361} {"train_loss": -6.736615180969238, "global_step": 141173, "epoch": 3361} {"train_loss": -6.782565116882324, "global_step": 141174, "epoch": 3361} {"train_loss": -6.722639083862305, "global_step": 141175, "epoch": 3361} {"train_loss": -6.7554097175598145, "global_step": 141176, "epoch": 3361} {"train_loss": -6.714831352233887, "global_step": 141177, "epoch": 3361} {"train_loss": -6.748061656951904, "global_step": 141178, "epoch": 3361} {"train_loss": -6.73124885559082, "global_step": 141179, "epoch": 3361} {"train_loss": -6.601699352264404, "global_step": 141180, "epoch": 3361} {"train_loss": -6.727419853210449, "global_step": 141181, "epoch": 3361} {"train_loss": -6.7063117027282715, "global_step": 141182, "epoch": 3361} {"train_loss": -6.766044616699219, "global_step": 141183, "epoch": 3361} {"train_loss": -6.570984363555908, "global_step": 141184, "epoch": 3361} {"train_loss": -6.771263122558594, "global_step": 141185, "epoch": 3361} {"train_loss": -6.7544989585876465, "global_step": 141186, "epoch": 3361} {"train_loss": -6.768181324005127, "global_step": 141187, "epoch": 3361} {"train_loss": -6.858673095703125, "global_step": 141188, "epoch": 3361} {"train_loss": -6.816214561462402, "global_step": 141189, "epoch": 3361} {"train_loss": -6.7623982429504395, "global_step": 141190, "epoch": 3361} {"train_loss": -6.853009223937988, "global_step": 141191, "epoch": 3361} {"train_loss": -6.849926948547363, "global_step": 141192, "epoch": 3361} {"train_loss": -6.678500652313232, "global_step": 141193, "epoch": 3361} {"train_loss": -6.825457572937012, "global_step": 141194, "epoch": 3361} {"train_loss": -6.809720993041992, "global_step": 141195, "epoch": 3361} {"train_loss": -6.889472007751465, "global_step": 141196, "epoch": 3361} {"train_loss": -6.77169132232666, "global_step": 141197, "epoch": 3361} {"train_loss": -6.833697319030762, "global_step": 141198, "epoch": 3361} {"train_loss": -6.7359700202941895, "global_step": 141199, "epoch": 3361} {"train_loss": -6.8227996826171875, "global_step": 141200, "epoch": 3361} {"train_loss": -6.780733585357666, "global_step": 141201, "epoch": 3361} {"train_loss": -6.782042026519775, "global_step": 141202, "epoch": 3361} {"train_loss": -6.762206327347529, "global_step": 141203, "epoch": 3361, "val_loss": 78276.484375} {"train_loss": -6.675676345825195, "global_step": 141204, "epoch": 3362} {"train_loss": -6.781645774841309, "global_step": 141205, "epoch": 3362} {"train_loss": -6.7520294189453125, "global_step": 141206, "epoch": 3362} {"train_loss": -6.751031875610352, "global_step": 141207, "epoch": 3362} {"train_loss": -6.7221784591674805, "global_step": 141208, "epoch": 3362} {"train_loss": -6.767364025115967, "global_step": 141209, "epoch": 3362} {"train_loss": -6.688996315002441, "global_step": 141210, "epoch": 3362} {"train_loss": -6.542925834655762, "global_step": 141211, "epoch": 3362} {"train_loss": -6.850050449371338, "global_step": 141212, "epoch": 3362} {"train_loss": -6.766164779663086, "global_step": 141213, "epoch": 3362} {"train_loss": -6.628813743591309, "global_step": 141214, "epoch": 3362} {"train_loss": -6.709839820861816, "global_step": 141215, "epoch": 3362} {"train_loss": -6.750473976135254, "global_step": 141216, "epoch": 3362} {"train_loss": -6.736023902893066, "global_step": 141217, "epoch": 3362} {"train_loss": -6.7264251708984375, "global_step": 141218, "epoch": 3362} {"train_loss": -6.7735724449157715, "global_step": 141219, "epoch": 3362} {"train_loss": -6.846268177032471, "global_step": 141220, "epoch": 3362} {"train_loss": -6.761513710021973, "global_step": 141221, "epoch": 3362} {"train_loss": -6.913841247558594, "global_step": 141222, "epoch": 3362} {"train_loss": -6.643233299255371, "global_step": 141223, "epoch": 3362} {"train_loss": -6.776101112365723, "global_step": 141224, "epoch": 3362} {"train_loss": -6.910813331604004, "global_step": 141225, "epoch": 3362} {"train_loss": -6.711275100708008, "global_step": 141226, "epoch": 3362} {"train_loss": -6.77149772644043, "global_step": 141227, "epoch": 3362} {"train_loss": -6.750208377838135, "global_step": 141228, "epoch": 3362} {"train_loss": -6.782627105712891, "global_step": 141229, "epoch": 3362} {"train_loss": -6.847662925720215, "global_step": 141230, "epoch": 3362} {"train_loss": -6.8366851806640625, "global_step": 141231, "epoch": 3362} {"train_loss": -6.6949052810668945, "global_step": 141232, "epoch": 3362} {"train_loss": -6.717617988586426, "global_step": 141233, "epoch": 3362} {"train_loss": -6.760041236877441, "global_step": 141234, "epoch": 3362} {"train_loss": -6.750093460083008, "global_step": 141235, "epoch": 3362} {"train_loss": -6.864961624145508, "global_step": 141236, "epoch": 3362} {"train_loss": -6.757022857666016, "global_step": 141237, "epoch": 3362} {"train_loss": -6.802309036254883, "global_step": 141238, "epoch": 3362} {"train_loss": -6.82900333404541, "global_step": 141239, "epoch": 3362} {"train_loss": -6.868602752685547, "global_step": 141240, "epoch": 3362} {"train_loss": -6.835497856140137, "global_step": 141241, "epoch": 3362} {"train_loss": -6.727211952209473, "global_step": 141242, "epoch": 3362} {"train_loss": -6.672320365905762, "global_step": 141243, "epoch": 3362} {"train_loss": -6.745156288146973, "global_step": 141244, "epoch": 3362} {"train_loss": -6.760602792104085, "global_step": 141245, "epoch": 3362, "val_loss": 78018.3359375} {"train_loss": -6.762064456939697, "global_step": 141246, "epoch": 3363} {"train_loss": -6.798405647277832, "global_step": 141247, "epoch": 3363} {"train_loss": -6.833301544189453, "global_step": 141248, "epoch": 3363} {"train_loss": -6.752994537353516, "global_step": 141249, "epoch": 3363} {"train_loss": -6.751274108886719, "global_step": 141250, "epoch": 3363} {"train_loss": -6.760650634765625, "global_step": 141251, "epoch": 3363} {"train_loss": -6.677813529968262, "global_step": 141252, "epoch": 3363} {"train_loss": -6.849562644958496, "global_step": 141253, "epoch": 3363} {"train_loss": -6.653764724731445, "global_step": 141254, "epoch": 3363} {"train_loss": -6.78553581237793, "global_step": 141255, "epoch": 3363} {"train_loss": -6.718637466430664, "global_step": 141256, "epoch": 3363} {"train_loss": -6.852131366729736, "global_step": 141257, "epoch": 3363} {"train_loss": -6.799437522888184, "global_step": 141258, "epoch": 3363} {"train_loss": -6.73679256439209, "global_step": 141259, "epoch": 3363} {"train_loss": -6.818642616271973, "global_step": 141260, "epoch": 3363} {"train_loss": -6.8681721687316895, "global_step": 141261, "epoch": 3363} {"train_loss": -6.775112152099609, "global_step": 141262, "epoch": 3363} {"train_loss": -6.788442134857178, "global_step": 141263, "epoch": 3363} {"train_loss": -6.748394012451172, "global_step": 141264, "epoch": 3363} {"train_loss": -6.798203468322754, "global_step": 141265, "epoch": 3363} {"train_loss": -6.752231597900391, "global_step": 141266, "epoch": 3363} {"train_loss": -6.824222564697266, "global_step": 141267, "epoch": 3363} {"train_loss": -6.7423529624938965, "global_step": 141268, "epoch": 3363} {"train_loss": -6.736171722412109, "global_step": 141269, "epoch": 3363} {"train_loss": -6.8017120361328125, "global_step": 141270, "epoch": 3363} {"train_loss": -6.779653549194336, "global_step": 141271, "epoch": 3363} {"train_loss": -6.803132057189941, "global_step": 141272, "epoch": 3363} {"train_loss": -6.778228759765625, "global_step": 141273, "epoch": 3363} {"train_loss": -6.780832290649414, "global_step": 141274, "epoch": 3363} {"train_loss": -6.78885555267334, "global_step": 141275, "epoch": 3363} {"train_loss": -6.860655784606934, "global_step": 141276, "epoch": 3363} {"train_loss": -6.8779191970825195, "global_step": 141277, "epoch": 3363} {"train_loss": -6.893916130065918, "global_step": 141278, "epoch": 3363} {"train_loss": -6.807794570922852, "global_step": 141279, "epoch": 3363} {"train_loss": -6.779350280761719, "global_step": 141280, "epoch": 3363} {"train_loss": -6.836725234985352, "global_step": 141281, "epoch": 3363} {"train_loss": -6.717990875244141, "global_step": 141282, "epoch": 3363} {"train_loss": -6.769588947296143, "global_step": 141283, "epoch": 3363} {"train_loss": -6.808490753173828, "global_step": 141284, "epoch": 3363} {"train_loss": -6.939290523529053, "global_step": 141285, "epoch": 3363} {"train_loss": -6.81385612487793, "global_step": 141286, "epoch": 3363} {"train_loss": -6.7914688019525435, "global_step": 141287, "epoch": 3363, "val_loss": 77974.953125} {"train_loss": -6.850669860839844, "global_step": 141288, "epoch": 3364} {"train_loss": -6.804730415344238, "global_step": 141289, "epoch": 3364} {"train_loss": -6.842581748962402, "global_step": 141290, "epoch": 3364} {"train_loss": -6.8550004959106445, "global_step": 141291, "epoch": 3364} {"train_loss": -6.816034317016602, "global_step": 141292, "epoch": 3364} {"train_loss": -6.779402732849121, "global_step": 141293, "epoch": 3364} {"train_loss": -6.805342197418213, "global_step": 141294, "epoch": 3364} {"train_loss": -6.770256996154785, "global_step": 141295, "epoch": 3364} {"train_loss": -6.834980010986328, "global_step": 141296, "epoch": 3364} {"train_loss": -6.831993103027344, "global_step": 141297, "epoch": 3364} {"train_loss": -6.608183860778809, "global_step": 141298, "epoch": 3364} {"train_loss": -6.7304368019104, "global_step": 141299, "epoch": 3364} {"train_loss": -6.861112594604492, "global_step": 141300, "epoch": 3364} {"train_loss": -6.635046005249023, "global_step": 141301, "epoch": 3364} {"train_loss": -6.731049537658691, "global_step": 141302, "epoch": 3364} {"train_loss": -6.839733123779297, "global_step": 141303, "epoch": 3364} {"train_loss": -6.7581787109375, "global_step": 141304, "epoch": 3364} {"train_loss": -6.752249240875244, "global_step": 141305, "epoch": 3364} {"train_loss": -6.8036651611328125, "global_step": 141306, "epoch": 3364} {"train_loss": -6.785161972045898, "global_step": 141307, "epoch": 3364} {"train_loss": -6.862178802490234, "global_step": 141308, "epoch": 3364} {"train_loss": -6.75289249420166, "global_step": 141309, "epoch": 3364} {"train_loss": -6.730690956115723, "global_step": 141310, "epoch": 3364} {"train_loss": -6.82511043548584, "global_step": 141311, "epoch": 3364} {"train_loss": -6.61510705947876, "global_step": 141312, "epoch": 3364} {"train_loss": -6.723982334136963, "global_step": 141313, "epoch": 3364} {"train_loss": -6.673003673553467, "global_step": 141314, "epoch": 3364} {"train_loss": -6.681502342224121, "global_step": 141315, "epoch": 3364} {"train_loss": -6.685123443603516, "global_step": 141316, "epoch": 3364} {"train_loss": -6.739770889282227, "global_step": 141317, "epoch": 3364} {"train_loss": -6.755772590637207, "global_step": 141318, "epoch": 3364} {"train_loss": -6.768956184387207, "global_step": 141319, "epoch": 3364} {"train_loss": -6.822714328765869, "global_step": 141320, "epoch": 3364} {"train_loss": -6.750544548034668, "global_step": 141321, "epoch": 3364} {"train_loss": -6.751014709472656, "global_step": 141322, "epoch": 3364} {"train_loss": -6.690863609313965, "global_step": 141323, "epoch": 3364} {"train_loss": -6.645052909851074, "global_step": 141324, "epoch": 3364} {"train_loss": -6.811469078063965, "global_step": 141325, "epoch": 3364} {"train_loss": -6.731997489929199, "global_step": 141326, "epoch": 3364} {"train_loss": -6.771596908569336, "global_step": 141327, "epoch": 3364} {"train_loss": -6.700290203094482, "global_step": 141328, "epoch": 3364} {"train_loss": -6.7589179788316995, "global_step": 141329, "epoch": 3364, "val_loss": 78082.0859375} {"train_loss": -6.727191925048828, "global_step": 141330, "epoch": 3365} {"train_loss": -6.765632629394531, "global_step": 141331, "epoch": 3365} {"train_loss": -6.719102382659912, "global_step": 141332, "epoch": 3365} {"train_loss": -6.74096155166626, "global_step": 141333, "epoch": 3365} {"train_loss": -6.753429412841797, "global_step": 141334, "epoch": 3365} {"train_loss": -6.767097473144531, "global_step": 141335, "epoch": 3365} {"train_loss": -6.775585651397705, "global_step": 141336, "epoch": 3365} {"train_loss": -6.727155685424805, "global_step": 141337, "epoch": 3365} {"train_loss": -6.63632869720459, "global_step": 141338, "epoch": 3365} {"train_loss": -6.699981689453125, "global_step": 141339, "epoch": 3365} {"train_loss": -6.645289897918701, "global_step": 141340, "epoch": 3365} {"train_loss": -6.82213020324707, "global_step": 141341, "epoch": 3365} {"train_loss": -6.593238830566406, "global_step": 141342, "epoch": 3365} {"train_loss": -6.806606769561768, "global_step": 141343, "epoch": 3365} {"train_loss": -6.791181564331055, "global_step": 141344, "epoch": 3365} {"train_loss": -6.8253021240234375, "global_step": 141345, "epoch": 3365} {"train_loss": -6.673329830169678, "global_step": 141346, "epoch": 3365} {"train_loss": -6.673948287963867, "global_step": 141347, "epoch": 3365} {"train_loss": -6.722764015197754, "global_step": 141348, "epoch": 3365} {"train_loss": -6.6636223793029785, "global_step": 141349, "epoch": 3365} {"train_loss": -6.6427412033081055, "global_step": 141350, "epoch": 3365} {"train_loss": -6.783555507659912, "global_step": 141351, "epoch": 3365} {"train_loss": -6.6890740394592285, "global_step": 141352, "epoch": 3365} {"train_loss": -6.7716965675354, "global_step": 141353, "epoch": 3365} {"train_loss": -6.745100498199463, "global_step": 141354, "epoch": 3365} {"train_loss": -6.738894939422607, "global_step": 141355, "epoch": 3365} {"train_loss": -6.714325904846191, "global_step": 141356, "epoch": 3365} {"train_loss": -6.800952911376953, "global_step": 141357, "epoch": 3365} {"train_loss": -6.70295524597168, "global_step": 141358, "epoch": 3365} {"train_loss": -6.727076530456543, "global_step": 141359, "epoch": 3365} {"train_loss": -6.729425430297852, "global_step": 141360, "epoch": 3365} {"train_loss": -6.727666854858398, "global_step": 141361, "epoch": 3365} {"train_loss": -6.734497547149658, "global_step": 141362, "epoch": 3365} {"train_loss": -6.82991886138916, "global_step": 141363, "epoch": 3365} {"train_loss": -6.767854690551758, "global_step": 141364, "epoch": 3365} {"train_loss": -6.713404178619385, "global_step": 141365, "epoch": 3365} {"train_loss": -6.795231819152832, "global_step": 141366, "epoch": 3365} {"train_loss": -6.801586151123047, "global_step": 141367, "epoch": 3365} {"train_loss": -6.738180160522461, "global_step": 141368, "epoch": 3365} {"train_loss": -6.799327850341797, "global_step": 141369, "epoch": 3365} {"train_loss": -6.691252708435059, "global_step": 141370, "epoch": 3365} {"train_loss": -6.737156266257877, "global_step": 141371, "epoch": 3365, "val_loss": 78135.9140625} {"train_loss": -6.8558220863342285, "global_step": 141372, "epoch": 3366} {"train_loss": -6.756268501281738, "global_step": 141373, "epoch": 3366} {"train_loss": -6.864084243774414, "global_step": 141374, "epoch": 3366} {"train_loss": -6.860644340515137, "global_step": 141375, "epoch": 3366} {"train_loss": -6.952113151550293, "global_step": 141376, "epoch": 3366} {"train_loss": -6.825985908508301, "global_step": 141377, "epoch": 3366} {"train_loss": -6.705775737762451, "global_step": 141378, "epoch": 3366} {"train_loss": -6.906900405883789, "global_step": 141379, "epoch": 3366} {"train_loss": -6.816657066345215, "global_step": 141380, "epoch": 3366} {"train_loss": -6.811718463897705, "global_step": 141381, "epoch": 3366} {"train_loss": -6.728657245635986, "global_step": 141382, "epoch": 3366} {"train_loss": -6.876731872558594, "global_step": 141383, "epoch": 3366} {"train_loss": -6.7921648025512695, "global_step": 141384, "epoch": 3366} {"train_loss": -6.775413513183594, "global_step": 141385, "epoch": 3366} {"train_loss": -6.754674434661865, "global_step": 141386, "epoch": 3366} {"train_loss": -6.823483943939209, "global_step": 141387, "epoch": 3366} {"train_loss": -6.694299697875977, "global_step": 141388, "epoch": 3366} {"train_loss": -6.896038055419922, "global_step": 141389, "epoch": 3366} {"train_loss": -6.759990692138672, "global_step": 141390, "epoch": 3366} {"train_loss": -6.844815254211426, "global_step": 141391, "epoch": 3366} {"train_loss": -6.740963935852051, "global_step": 141392, "epoch": 3366} {"train_loss": -6.8315935134887695, "global_step": 141393, "epoch": 3366} {"train_loss": -6.85689640045166, "global_step": 141394, "epoch": 3366} {"train_loss": -6.830463409423828, "global_step": 141395, "epoch": 3366} {"train_loss": -6.832714080810547, "global_step": 141396, "epoch": 3366} {"train_loss": -6.803732395172119, "global_step": 141397, "epoch": 3366} {"train_loss": -6.8213396072387695, "global_step": 141398, "epoch": 3366} {"train_loss": -6.862384796142578, "global_step": 141399, "epoch": 3366} {"train_loss": -6.850337028503418, "global_step": 141400, "epoch": 3366} {"train_loss": -6.81142520904541, "global_step": 141401, "epoch": 3366} {"train_loss": -6.790472984313965, "global_step": 141402, "epoch": 3366} {"train_loss": -6.839531898498535, "global_step": 141403, "epoch": 3366} {"train_loss": -6.765155792236328, "global_step": 141404, "epoch": 3366} {"train_loss": -6.796563148498535, "global_step": 141405, "epoch": 3366} {"train_loss": -6.908746242523193, "global_step": 141406, "epoch": 3366} {"train_loss": -6.769765853881836, "global_step": 141407, "epoch": 3366} {"train_loss": -6.771567344665527, "global_step": 141408, "epoch": 3366} {"train_loss": -6.871454238891602, "global_step": 141409, "epoch": 3366} {"train_loss": -6.7127580642700195, "global_step": 141410, "epoch": 3366} {"train_loss": -6.831175804138184, "global_step": 141411, "epoch": 3366} {"train_loss": -6.801088809967041, "global_step": 141412, "epoch": 3366} {"train_loss": -6.813009636742728, "global_step": 141413, "epoch": 3366, "val_loss": 78266.9921875} {"train_loss": -6.825991153717041, "global_step": 141414, "epoch": 3367} {"train_loss": -6.785810470581055, "global_step": 141415, "epoch": 3367} {"train_loss": -6.720886707305908, "global_step": 141416, "epoch": 3367} {"train_loss": -6.81019401550293, "global_step": 141417, "epoch": 3367} {"train_loss": -6.663967132568359, "global_step": 141418, "epoch": 3367} {"train_loss": -6.6296892166137695, "global_step": 141419, "epoch": 3367} {"train_loss": -6.825932502746582, "global_step": 141420, "epoch": 3367} {"train_loss": -6.844696998596191, "global_step": 141421, "epoch": 3367} {"train_loss": -6.819185733795166, "global_step": 141422, "epoch": 3367} {"train_loss": -6.779463291168213, "global_step": 141423, "epoch": 3367} {"train_loss": -6.742197036743164, "global_step": 141424, "epoch": 3367} {"train_loss": -6.793959617614746, "global_step": 141425, "epoch": 3367} {"train_loss": -6.825133800506592, "global_step": 141426, "epoch": 3367} {"train_loss": -6.828258514404297, "global_step": 141427, "epoch": 3367} {"train_loss": -6.818727493286133, "global_step": 141428, "epoch": 3367} {"train_loss": -6.8051981925964355, "global_step": 141429, "epoch": 3367} {"train_loss": -6.820648193359375, "global_step": 141430, "epoch": 3367} {"train_loss": -6.814882278442383, "global_step": 141431, "epoch": 3367} {"train_loss": -6.734227180480957, "global_step": 141432, "epoch": 3367} {"train_loss": -6.7745747566223145, "global_step": 141433, "epoch": 3367} {"train_loss": -6.863631725311279, "global_step": 141434, "epoch": 3367} {"train_loss": -6.830174922943115, "global_step": 141435, "epoch": 3367} {"train_loss": -6.826629638671875, "global_step": 141436, "epoch": 3367} {"train_loss": -6.748559474945068, "global_step": 141437, "epoch": 3367} {"train_loss": -6.799412727355957, "global_step": 141438, "epoch": 3367} {"train_loss": -6.679075717926025, "global_step": 141439, "epoch": 3367} {"train_loss": -6.7799577713012695, "global_step": 141440, "epoch": 3367} {"train_loss": -6.6472601890563965, "global_step": 141441, "epoch": 3367} {"train_loss": -6.7392377853393555, "global_step": 141442, "epoch": 3367} {"train_loss": -6.832618713378906, "global_step": 141443, "epoch": 3367} {"train_loss": -6.724890232086182, "global_step": 141444, "epoch": 3367} {"train_loss": -6.750263214111328, "global_step": 141445, "epoch": 3367} {"train_loss": -6.762701988220215, "global_step": 141446, "epoch": 3367} {"train_loss": -6.741445541381836, "global_step": 141447, "epoch": 3367} {"train_loss": -6.849430561065674, "global_step": 141448, "epoch": 3367} {"train_loss": -6.742663383483887, "global_step": 141449, "epoch": 3367} {"train_loss": -6.815696716308594, "global_step": 141450, "epoch": 3367} {"train_loss": -6.783217430114746, "global_step": 141451, "epoch": 3367} {"train_loss": -6.734310626983643, "global_step": 141452, "epoch": 3367} {"train_loss": -6.685647010803223, "global_step": 141453, "epoch": 3367} {"train_loss": -6.695152759552002, "global_step": 141454, "epoch": 3367} {"train_loss": -6.772640932173956, "global_step": 141455, "epoch": 3367, "val_loss": 78108.265625} {"train_loss": -6.703585624694824, "global_step": 141456, "epoch": 3368} {"train_loss": -6.808018684387207, "global_step": 141457, "epoch": 3368} {"train_loss": -6.842709064483643, "global_step": 141458, "epoch": 3368} {"train_loss": -6.74100399017334, "global_step": 141459, "epoch": 3368} {"train_loss": -6.681398391723633, "global_step": 141460, "epoch": 3368} {"train_loss": -6.656787872314453, "global_step": 141461, "epoch": 3368} {"train_loss": -6.789310455322266, "global_step": 141462, "epoch": 3368} {"train_loss": -6.782167911529541, "global_step": 141463, "epoch": 3368} {"train_loss": -6.870410919189453, "global_step": 141464, "epoch": 3368} {"train_loss": -6.8192548751831055, "global_step": 141465, "epoch": 3368} {"train_loss": -6.83467960357666, "global_step": 141466, "epoch": 3368} {"train_loss": -6.829275608062744, "global_step": 141467, "epoch": 3368} {"train_loss": -6.835733413696289, "global_step": 141468, "epoch": 3368} {"train_loss": -6.831713676452637, "global_step": 141469, "epoch": 3368} {"train_loss": -6.810048580169678, "global_step": 141470, "epoch": 3368} {"train_loss": -6.7289533615112305, "global_step": 141471, "epoch": 3368} {"train_loss": -6.790864944458008, "global_step": 141472, "epoch": 3368} {"train_loss": -6.774715423583984, "global_step": 141473, "epoch": 3368} {"train_loss": -6.805395126342773, "global_step": 141474, "epoch": 3368} {"train_loss": -6.753104209899902, "global_step": 141475, "epoch": 3368} {"train_loss": -6.8666462898254395, "global_step": 141476, "epoch": 3368} {"train_loss": -6.717320442199707, "global_step": 141477, "epoch": 3368} {"train_loss": -6.844501972198486, "global_step": 141478, "epoch": 3368} {"train_loss": -6.746301174163818, "global_step": 141479, "epoch": 3368} {"train_loss": -6.85530424118042, "global_step": 141480, "epoch": 3368} {"train_loss": -6.816768169403076, "global_step": 141481, "epoch": 3368} {"train_loss": -6.890606880187988, "global_step": 141482, "epoch": 3368} {"train_loss": -6.7877912521362305, "global_step": 141483, "epoch": 3368} {"train_loss": -6.779232978820801, "global_step": 141484, "epoch": 3368} {"train_loss": -6.82659387588501, "global_step": 141485, "epoch": 3368} {"train_loss": -6.860080718994141, "global_step": 141486, "epoch": 3368} {"train_loss": -6.719892501831055, "global_step": 141487, "epoch": 3368} {"train_loss": -6.764608383178711, "global_step": 141488, "epoch": 3368} {"train_loss": -6.8250579833984375, "global_step": 141489, "epoch": 3368} {"train_loss": -6.876544952392578, "global_step": 141490, "epoch": 3368} {"train_loss": -6.948989391326904, "global_step": 141491, "epoch": 3368} {"train_loss": -6.670553207397461, "global_step": 141492, "epoch": 3368} {"train_loss": -6.684866428375244, "global_step": 141493, "epoch": 3368} {"train_loss": -6.797192096710205, "global_step": 141494, "epoch": 3368} {"train_loss": -6.7024359703063965, "global_step": 141495, "epoch": 3368} {"train_loss": -6.8230390548706055, "global_step": 141496, "epoch": 3368} {"train_loss": -6.791935580117362, "global_step": 141497, "epoch": 3368, "val_loss": 78220.1953125} {"train_loss": -6.777552604675293, "global_step": 141498, "epoch": 3369} {"train_loss": -6.861333847045898, "global_step": 141499, "epoch": 3369} {"train_loss": -6.85507345199585, "global_step": 141500, "epoch": 3369} {"train_loss": -6.774711608886719, "global_step": 141501, "epoch": 3369} {"train_loss": -6.917348861694336, "global_step": 141502, "epoch": 3369} {"train_loss": -6.821447372436523, "global_step": 141503, "epoch": 3369} {"train_loss": -6.834258079528809, "global_step": 141504, "epoch": 3369} {"train_loss": -6.896409034729004, "global_step": 141505, "epoch": 3369} {"train_loss": -6.713878631591797, "global_step": 141506, "epoch": 3369} {"train_loss": -6.824864387512207, "global_step": 141507, "epoch": 3369} {"train_loss": -6.892536640167236, "global_step": 141508, "epoch": 3369} {"train_loss": -6.850257873535156, "global_step": 141509, "epoch": 3369} {"train_loss": -6.793180465698242, "global_step": 141510, "epoch": 3369} {"train_loss": -6.824926376342773, "global_step": 141511, "epoch": 3369} {"train_loss": -6.750931739807129, "global_step": 141512, "epoch": 3369} {"train_loss": -6.814455509185791, "global_step": 141513, "epoch": 3369} {"train_loss": -6.777105808258057, "global_step": 141514, "epoch": 3369} {"train_loss": -6.778747081756592, "global_step": 141515, "epoch": 3369} {"train_loss": -6.8212151527404785, "global_step": 141516, "epoch": 3369} {"train_loss": -6.840938091278076, "global_step": 141517, "epoch": 3369} {"train_loss": -6.860692024230957, "global_step": 141518, "epoch": 3369} {"train_loss": -6.8599443435668945, "global_step": 141519, "epoch": 3369} {"train_loss": -6.834840774536133, "global_step": 141520, "epoch": 3369} {"train_loss": -6.856838703155518, "global_step": 141521, "epoch": 3369} {"train_loss": -6.805485725402832, "global_step": 141522, "epoch": 3369} {"train_loss": -6.607328414916992, "global_step": 141523, "epoch": 3369} {"train_loss": -6.713307857513428, "global_step": 141524, "epoch": 3369} {"train_loss": -6.9468584060668945, "global_step": 141525, "epoch": 3369} {"train_loss": -6.794942855834961, "global_step": 141526, "epoch": 3369} {"train_loss": -6.794911861419678, "global_step": 141527, "epoch": 3369} {"train_loss": -6.846799373626709, "global_step": 141528, "epoch": 3369} {"train_loss": -6.724001884460449, "global_step": 141529, "epoch": 3369} {"train_loss": -6.899549961090088, "global_step": 141530, "epoch": 3369} {"train_loss": -6.740092754364014, "global_step": 141531, "epoch": 3369} {"train_loss": -6.821887016296387, "global_step": 141532, "epoch": 3369} {"train_loss": -6.824209690093994, "global_step": 141533, "epoch": 3369} {"train_loss": -6.855795383453369, "global_step": 141534, "epoch": 3369} {"train_loss": -6.956966400146484, "global_step": 141535, "epoch": 3369} {"train_loss": -6.798868179321289, "global_step": 141536, "epoch": 3369} {"train_loss": -6.785484790802002, "global_step": 141537, "epoch": 3369} {"train_loss": -6.797572135925293, "global_step": 141538, "epoch": 3369} {"train_loss": -6.818410067331223, "global_step": 141539, "epoch": 3369, "val_loss": 78141.8046875} {"train_loss": -6.787998199462891, "global_step": 141540, "epoch": 3370} {"train_loss": -6.917487144470215, "global_step": 141541, "epoch": 3370} {"train_loss": -6.854339599609375, "global_step": 141542, "epoch": 3370} {"train_loss": -6.8170552253723145, "global_step": 141543, "epoch": 3370} {"train_loss": -6.811008453369141, "global_step": 141544, "epoch": 3370} {"train_loss": -6.768163681030273, "global_step": 141545, "epoch": 3370} {"train_loss": -6.802329063415527, "global_step": 141546, "epoch": 3370} {"train_loss": -6.833286285400391, "global_step": 141547, "epoch": 3370} {"train_loss": -6.7686381340026855, "global_step": 141548, "epoch": 3370} {"train_loss": -6.958141326904297, "global_step": 141549, "epoch": 3370} {"train_loss": -6.923686981201172, "global_step": 141550, "epoch": 3370} {"train_loss": -6.885073661804199, "global_step": 141551, "epoch": 3370} {"train_loss": -6.9167799949646, "global_step": 141552, "epoch": 3370} {"train_loss": -6.88869047164917, "global_step": 141553, "epoch": 3370} {"train_loss": -6.917520523071289, "global_step": 141554, "epoch": 3370} {"train_loss": -6.939631462097168, "global_step": 141555, "epoch": 3370} {"train_loss": -6.827298641204834, "global_step": 141556, "epoch": 3370} {"train_loss": -6.767058372497559, "global_step": 141557, "epoch": 3370} {"train_loss": -6.841123580932617, "global_step": 141558, "epoch": 3370} {"train_loss": -6.740288734436035, "global_step": 141559, "epoch": 3370} {"train_loss": -6.73185920715332, "global_step": 141560, "epoch": 3370} {"train_loss": -6.938450813293457, "global_step": 141561, "epoch": 3370} {"train_loss": -6.8433942794799805, "global_step": 141562, "epoch": 3370} {"train_loss": -6.663932800292969, "global_step": 141563, "epoch": 3370} {"train_loss": -6.731851577758789, "global_step": 141564, "epoch": 3370} {"train_loss": -6.835200786590576, "global_step": 141565, "epoch": 3370} {"train_loss": -6.821221351623535, "global_step": 141566, "epoch": 3370} {"train_loss": -6.637251853942871, "global_step": 141567, "epoch": 3370} {"train_loss": -6.833375453948975, "global_step": 141568, "epoch": 3370} {"train_loss": -6.763511657714844, "global_step": 141569, "epoch": 3370} {"train_loss": -6.724428176879883, "global_step": 141570, "epoch": 3370} {"train_loss": -6.811273574829102, "global_step": 141571, "epoch": 3370} {"train_loss": -6.845302581787109, "global_step": 141572, "epoch": 3370} {"train_loss": -6.8160858154296875, "global_step": 141573, "epoch": 3370} {"train_loss": -6.825677394866943, "global_step": 141574, "epoch": 3370} {"train_loss": -6.786402225494385, "global_step": 141575, "epoch": 3370} {"train_loss": -6.812358856201172, "global_step": 141576, "epoch": 3370} {"train_loss": -6.643154621124268, "global_step": 141577, "epoch": 3370} {"train_loss": -6.859018325805664, "global_step": 141578, "epoch": 3370} {"train_loss": -6.80205774307251, "global_step": 141579, "epoch": 3370} {"train_loss": -6.739489555358887, "global_step": 141580, "epoch": 3370} {"train_loss": -6.814979223977952, "global_step": 141581, "epoch": 3370, "val_loss": 78535.671875} {"train_loss": -6.782617568969727, "global_step": 141582, "epoch": 3371} {"train_loss": -6.803770065307617, "global_step": 141583, "epoch": 3371} {"train_loss": -6.88239049911499, "global_step": 141584, "epoch": 3371} {"train_loss": -6.713920593261719, "global_step": 141585, "epoch": 3371} {"train_loss": -6.907837390899658, "global_step": 141586, "epoch": 3371} {"train_loss": -6.804666519165039, "global_step": 141587, "epoch": 3371} {"train_loss": -6.745708465576172, "global_step": 141588, "epoch": 3371} {"train_loss": -6.84166145324707, "global_step": 141589, "epoch": 3371} {"train_loss": -6.763006210327148, "global_step": 141590, "epoch": 3371} {"train_loss": -6.956793785095215, "global_step": 141591, "epoch": 3371} {"train_loss": -6.890902996063232, "global_step": 141592, "epoch": 3371} {"train_loss": -6.7839860916137695, "global_step": 141593, "epoch": 3371} {"train_loss": -6.870910167694092, "global_step": 141594, "epoch": 3371} {"train_loss": -6.920899868011475, "global_step": 141595, "epoch": 3371} {"train_loss": -6.774533271789551, "global_step": 141596, "epoch": 3371} {"train_loss": -6.797140121459961, "global_step": 141597, "epoch": 3371} {"train_loss": -6.861279010772705, "global_step": 141598, "epoch": 3371} {"train_loss": -6.648679733276367, "global_step": 141599, "epoch": 3371} {"train_loss": -6.83805513381958, "global_step": 141600, "epoch": 3371} {"train_loss": -6.811590671539307, "global_step": 141601, "epoch": 3371} {"train_loss": -6.813962936401367, "global_step": 141602, "epoch": 3371} {"train_loss": -6.806727409362793, "global_step": 141603, "epoch": 3371} {"train_loss": -6.815413475036621, "global_step": 141604, "epoch": 3371} {"train_loss": -6.817239284515381, "global_step": 141605, "epoch": 3371} {"train_loss": -6.713216304779053, "global_step": 141606, "epoch": 3371} {"train_loss": -6.779412746429443, "global_step": 141607, "epoch": 3371} {"train_loss": -6.787420272827148, "global_step": 141608, "epoch": 3371} {"train_loss": -6.897285461425781, "global_step": 141609, "epoch": 3371} {"train_loss": -6.883058547973633, "global_step": 141610, "epoch": 3371} {"train_loss": -6.821972846984863, "global_step": 141611, "epoch": 3371} {"train_loss": -6.68729305267334, "global_step": 141612, "epoch": 3371} {"train_loss": -6.675631523132324, "global_step": 141613, "epoch": 3371} {"train_loss": -6.53559684753418, "global_step": 141614, "epoch": 3371} {"train_loss": -6.764348030090332, "global_step": 141615, "epoch": 3371} {"train_loss": -6.706772327423096, "global_step": 141616, "epoch": 3371} {"train_loss": -6.790543556213379, "global_step": 141617, "epoch": 3371} {"train_loss": -6.661647796630859, "global_step": 141618, "epoch": 3371} {"train_loss": -6.697955131530762, "global_step": 141619, "epoch": 3371} {"train_loss": -6.684365272521973, "global_step": 141620, "epoch": 3371} {"train_loss": -6.641420364379883, "global_step": 141621, "epoch": 3371} {"train_loss": -6.7598981857299805, "global_step": 141622, "epoch": 3371} {"train_loss": -6.780866940816243, "global_step": 141623, "epoch": 3371, "val_loss": 78044.2265625} {"train_loss": -6.727967262268066, "global_step": 141624, "epoch": 3372} {"train_loss": -6.718019008636475, "global_step": 141625, "epoch": 3372} {"train_loss": -6.683956146240234, "global_step": 141626, "epoch": 3372} {"train_loss": -6.8621954917907715, "global_step": 141627, "epoch": 3372} {"train_loss": -6.658412933349609, "global_step": 141628, "epoch": 3372} {"train_loss": -6.85048246383667, "global_step": 141629, "epoch": 3372} {"train_loss": -6.711655139923096, "global_step": 141630, "epoch": 3372} {"train_loss": -6.6709885597229, "global_step": 141631, "epoch": 3372} {"train_loss": -6.737354278564453, "global_step": 141632, "epoch": 3372} {"train_loss": -6.816530227661133, "global_step": 141633, "epoch": 3372} {"train_loss": -6.711933135986328, "global_step": 141634, "epoch": 3372} {"train_loss": -6.658355236053467, "global_step": 141635, "epoch": 3372} {"train_loss": -6.742147922515869, "global_step": 141636, "epoch": 3372} {"train_loss": -6.852455139160156, "global_step": 141637, "epoch": 3372} {"train_loss": -6.776854038238525, "global_step": 141638, "epoch": 3372} {"train_loss": -6.859316349029541, "global_step": 141639, "epoch": 3372} {"train_loss": -6.713830947875977, "global_step": 141640, "epoch": 3372} {"train_loss": -6.708345890045166, "global_step": 141641, "epoch": 3372} {"train_loss": -6.717110633850098, "global_step": 141642, "epoch": 3372} {"train_loss": -6.782010555267334, "global_step": 141643, "epoch": 3372} {"train_loss": -6.832118988037109, "global_step": 141644, "epoch": 3372} {"train_loss": -6.733780384063721, "global_step": 141645, "epoch": 3372} {"train_loss": -6.736518859863281, "global_step": 141646, "epoch": 3372} {"train_loss": -6.836899757385254, "global_step": 141647, "epoch": 3372} {"train_loss": -6.761455535888672, "global_step": 141648, "epoch": 3372} {"train_loss": -6.750089645385742, "global_step": 141649, "epoch": 3372} {"train_loss": -6.752281188964844, "global_step": 141650, "epoch": 3372} {"train_loss": -6.731639862060547, "global_step": 141651, "epoch": 3372} {"train_loss": -6.870891571044922, "global_step": 141652, "epoch": 3372} {"train_loss": -6.798810005187988, "global_step": 141653, "epoch": 3372} {"train_loss": -6.783090591430664, "global_step": 141654, "epoch": 3372} {"train_loss": -6.870928764343262, "global_step": 141655, "epoch": 3372} {"train_loss": -6.8597798347473145, "global_step": 141656, "epoch": 3372} {"train_loss": -6.773002624511719, "global_step": 141657, "epoch": 3372} {"train_loss": -6.822659969329834, "global_step": 141658, "epoch": 3372} {"train_loss": -6.768345832824707, "global_step": 141659, "epoch": 3372} {"train_loss": -6.893894195556641, "global_step": 141660, "epoch": 3372} {"train_loss": -6.84874963760376, "global_step": 141661, "epoch": 3372} {"train_loss": -6.784646034240723, "global_step": 141662, "epoch": 3372} {"train_loss": -6.625664710998535, "global_step": 141663, "epoch": 3372} {"train_loss": -6.8830485343933105, "global_step": 141664, "epoch": 3372} {"train_loss": -6.771974824723744, "global_step": 141665, "epoch": 3372, "val_loss": 78415.6171875} {"train_loss": -6.751166343688965, "global_step": 141666, "epoch": 3373} {"train_loss": -6.810818672180176, "global_step": 141667, "epoch": 3373} {"train_loss": -6.874575614929199, "global_step": 141668, "epoch": 3373} {"train_loss": -6.8185529708862305, "global_step": 141669, "epoch": 3373} {"train_loss": -6.692685127258301, "global_step": 141670, "epoch": 3373} {"train_loss": -6.7754974365234375, "global_step": 141671, "epoch": 3373} {"train_loss": -6.788933753967285, "global_step": 141672, "epoch": 3373} {"train_loss": -6.88730525970459, "global_step": 141673, "epoch": 3373} {"train_loss": -6.744494915008545, "global_step": 141674, "epoch": 3373} {"train_loss": -6.796795845031738, "global_step": 141675, "epoch": 3373} {"train_loss": -6.703734874725342, "global_step": 141676, "epoch": 3373} {"train_loss": -6.768163681030273, "global_step": 141677, "epoch": 3373} {"train_loss": -6.791576385498047, "global_step": 141678, "epoch": 3373} {"train_loss": -6.817423343658447, "global_step": 141679, "epoch": 3373} {"train_loss": -6.890742778778076, "global_step": 141680, "epoch": 3373} {"train_loss": -6.744672775268555, "global_step": 141681, "epoch": 3373} {"train_loss": -6.6928863525390625, "global_step": 141682, "epoch": 3373} {"train_loss": -6.756061553955078, "global_step": 141683, "epoch": 3373} {"train_loss": -6.78634786605835, "global_step": 141684, "epoch": 3373} {"train_loss": -6.633912086486816, "global_step": 141685, "epoch": 3373} {"train_loss": -6.6896209716796875, "global_step": 141686, "epoch": 3373} {"train_loss": -6.683317184448242, "global_step": 141687, "epoch": 3373} {"train_loss": -6.817570209503174, "global_step": 141688, "epoch": 3373} {"train_loss": -6.752631187438965, "global_step": 141689, "epoch": 3373} {"train_loss": -6.7159810066223145, "global_step": 141690, "epoch": 3373} {"train_loss": -6.815245628356934, "global_step": 141691, "epoch": 3373} {"train_loss": -6.759124279022217, "global_step": 141692, "epoch": 3373} {"train_loss": -6.848714828491211, "global_step": 141693, "epoch": 3373} {"train_loss": -6.854362487792969, "global_step": 141694, "epoch": 3373} {"train_loss": -6.764290809631348, "global_step": 141695, "epoch": 3373} {"train_loss": -6.893823623657227, "global_step": 141696, "epoch": 3373} {"train_loss": -6.703437328338623, "global_step": 141697, "epoch": 3373} {"train_loss": -6.713641166687012, "global_step": 141698, "epoch": 3373} {"train_loss": -6.769837856292725, "global_step": 141699, "epoch": 3373} {"train_loss": -6.83480167388916, "global_step": 141700, "epoch": 3373} {"train_loss": -6.726565361022949, "global_step": 141701, "epoch": 3373} {"train_loss": -6.712555408477783, "global_step": 141702, "epoch": 3373} {"train_loss": -6.8216400146484375, "global_step": 141703, "epoch": 3373} {"train_loss": -6.762976169586182, "global_step": 141704, "epoch": 3373} {"train_loss": -6.704803943634033, "global_step": 141705, "epoch": 3373} {"train_loss": -6.795731544494629, "global_step": 141706, "epoch": 3373} {"train_loss": -6.773301079159691, "global_step": 141707, "epoch": 3373, "val_loss": 78401.0} {"train_loss": -6.772157669067383, "global_step": 141708, "epoch": 3374} {"train_loss": -6.891768455505371, "global_step": 141709, "epoch": 3374} {"train_loss": -6.730218410491943, "global_step": 141710, "epoch": 3374} {"train_loss": -6.733177185058594, "global_step": 141711, "epoch": 3374} {"train_loss": -6.778697967529297, "global_step": 141712, "epoch": 3374} {"train_loss": -6.806466102600098, "global_step": 141713, "epoch": 3374} {"train_loss": -6.862776756286621, "global_step": 141714, "epoch": 3374} {"train_loss": -6.7514848709106445, "global_step": 141715, "epoch": 3374} {"train_loss": -6.829293251037598, "global_step": 141716, "epoch": 3374} {"train_loss": -6.7190704345703125, "global_step": 141717, "epoch": 3374} {"train_loss": -6.751446723937988, "global_step": 141718, "epoch": 3374} {"train_loss": -6.85753059387207, "global_step": 141719, "epoch": 3374} {"train_loss": -6.8207879066467285, "global_step": 141720, "epoch": 3374} {"train_loss": -6.728244781494141, "global_step": 141721, "epoch": 3374} {"train_loss": -6.84632682800293, "global_step": 141722, "epoch": 3374} {"train_loss": -6.777101993560791, "global_step": 141723, "epoch": 3374} {"train_loss": -6.693955421447754, "global_step": 141724, "epoch": 3374} {"train_loss": -6.823992729187012, "global_step": 141725, "epoch": 3374} {"train_loss": -6.788349151611328, "global_step": 141726, "epoch": 3374} {"train_loss": -6.627397060394287, "global_step": 141727, "epoch": 3374} {"train_loss": -6.751737117767334, "global_step": 141728, "epoch": 3374} {"train_loss": -6.874181747436523, "global_step": 141729, "epoch": 3374} {"train_loss": -6.713763236999512, "global_step": 141730, "epoch": 3374} {"train_loss": -6.725428581237793, "global_step": 141731, "epoch": 3374} {"train_loss": -6.78691291809082, "global_step": 141732, "epoch": 3374} {"train_loss": -6.663511276245117, "global_step": 141733, "epoch": 3374} {"train_loss": -6.825613021850586, "global_step": 141734, "epoch": 3374} {"train_loss": -6.929449558258057, "global_step": 141735, "epoch": 3374} {"train_loss": -6.847762107849121, "global_step": 141736, "epoch": 3374} {"train_loss": -6.78702449798584, "global_step": 141737, "epoch": 3374} {"train_loss": -6.791740894317627, "global_step": 141738, "epoch": 3374} {"train_loss": -6.80368709564209, "global_step": 141739, "epoch": 3374} {"train_loss": -6.725871562957764, "global_step": 141740, "epoch": 3374} {"train_loss": -6.756160259246826, "global_step": 141741, "epoch": 3374} {"train_loss": -6.709738731384277, "global_step": 141742, "epoch": 3374} {"train_loss": -6.823498249053955, "global_step": 141743, "epoch": 3374} {"train_loss": -6.619295120239258, "global_step": 141744, "epoch": 3374} {"train_loss": -6.680981159210205, "global_step": 141745, "epoch": 3374} {"train_loss": -6.819477558135986, "global_step": 141746, "epoch": 3374} {"train_loss": -6.691330909729004, "global_step": 141747, "epoch": 3374} {"train_loss": -6.629612445831299, "global_step": 141748, "epoch": 3374} {"train_loss": -6.768988597960699, "global_step": 141749, "epoch": 3374, "val_loss": 78685.609375} {"train_loss": -6.614537239074707, "global_step": 141750, "epoch": 3375} {"train_loss": -6.8058013916015625, "global_step": 141751, "epoch": 3375} {"train_loss": -6.58063268661499, "global_step": 141752, "epoch": 3375} {"train_loss": -6.664754867553711, "global_step": 141753, "epoch": 3375} {"train_loss": -6.781523704528809, "global_step": 141754, "epoch": 3375} {"train_loss": -6.567864418029785, "global_step": 141755, "epoch": 3375} {"train_loss": -6.8202128410339355, "global_step": 141756, "epoch": 3375} {"train_loss": -6.743074417114258, "global_step": 141757, "epoch": 3375} {"train_loss": -6.72987174987793, "global_step": 141758, "epoch": 3375} {"train_loss": -6.7696709632873535, "global_step": 141759, "epoch": 3375} {"train_loss": -6.6915283203125, "global_step": 141760, "epoch": 3375} {"train_loss": -6.7281107902526855, "global_step": 141761, "epoch": 3375} {"train_loss": -6.711505889892578, "global_step": 141762, "epoch": 3375} {"train_loss": -6.820250511169434, "global_step": 141763, "epoch": 3375} {"train_loss": -6.596284866333008, "global_step": 141764, "epoch": 3375} {"train_loss": -6.6756439208984375, "global_step": 141765, "epoch": 3375} {"train_loss": -6.737918853759766, "global_step": 141766, "epoch": 3375} {"train_loss": -6.725217819213867, "global_step": 141767, "epoch": 3375} {"train_loss": -6.741185665130615, "global_step": 141768, "epoch": 3375} {"train_loss": -6.789632320404053, "global_step": 141769, "epoch": 3375} {"train_loss": -6.726197242736816, "global_step": 141770, "epoch": 3375} {"train_loss": -6.79423713684082, "global_step": 141771, "epoch": 3375} {"train_loss": -6.686224937438965, "global_step": 141772, "epoch": 3375} {"train_loss": -6.725255966186523, "global_step": 141773, "epoch": 3375} {"train_loss": -6.755743503570557, "global_step": 141774, "epoch": 3375} {"train_loss": -6.809342384338379, "global_step": 141775, "epoch": 3375} {"train_loss": -6.706084728240967, "global_step": 141776, "epoch": 3375} {"train_loss": -6.827797889709473, "global_step": 141777, "epoch": 3375} {"train_loss": -6.598034858703613, "global_step": 141778, "epoch": 3375} {"train_loss": -6.810596466064453, "global_step": 141779, "epoch": 3375} {"train_loss": -6.800882339477539, "global_step": 141780, "epoch": 3375} {"train_loss": -6.704390525817871, "global_step": 141781, "epoch": 3375} {"train_loss": -6.760666847229004, "global_step": 141782, "epoch": 3375} {"train_loss": -6.651154518127441, "global_step": 141783, "epoch": 3375} {"train_loss": -6.724367618560791, "global_step": 141784, "epoch": 3375} {"train_loss": -6.795584678649902, "global_step": 141785, "epoch": 3375} {"train_loss": -6.856280326843262, "global_step": 141786, "epoch": 3375} {"train_loss": -6.803832054138184, "global_step": 141787, "epoch": 3375} {"train_loss": -6.672661781311035, "global_step": 141788, "epoch": 3375} {"train_loss": -6.80441427230835, "global_step": 141789, "epoch": 3375} {"train_loss": -6.836788177490234, "global_step": 141790, "epoch": 3375} {"train_loss": -6.735517604010446, "global_step": 141791, "epoch": 3375, "val_loss": 78080.96875} {"train_loss": -6.77393102645874, "global_step": 141792, "epoch": 3376} {"train_loss": -6.7842535972595215, "global_step": 141793, "epoch": 3376} {"train_loss": -6.69791316986084, "global_step": 141794, "epoch": 3376} {"train_loss": -6.890329360961914, "global_step": 141795, "epoch": 3376} {"train_loss": -6.7814459800720215, "global_step": 141796, "epoch": 3376} {"train_loss": -6.775066375732422, "global_step": 141797, "epoch": 3376} {"train_loss": -6.658957481384277, "global_step": 141798, "epoch": 3376} {"train_loss": -6.74007511138916, "global_step": 141799, "epoch": 3376} {"train_loss": -6.812033653259277, "global_step": 141800, "epoch": 3376} {"train_loss": -6.837099552154541, "global_step": 141801, "epoch": 3376} {"train_loss": -6.652832984924316, "global_step": 141802, "epoch": 3376} {"train_loss": -6.757577419281006, "global_step": 141803, "epoch": 3376} {"train_loss": -6.814058780670166, "global_step": 141804, "epoch": 3376} {"train_loss": -6.760943412780762, "global_step": 141805, "epoch": 3376} {"train_loss": -6.729961395263672, "global_step": 141806, "epoch": 3376} {"train_loss": -6.700498580932617, "global_step": 141807, "epoch": 3376} {"train_loss": -6.746735095977783, "global_step": 141808, "epoch": 3376} {"train_loss": -6.767668724060059, "global_step": 141809, "epoch": 3376} {"train_loss": -6.822326183319092, "global_step": 141810, "epoch": 3376} {"train_loss": -6.754777908325195, "global_step": 141811, "epoch": 3376} {"train_loss": -6.798508644104004, "global_step": 141812, "epoch": 3376} {"train_loss": -6.759852886199951, "global_step": 141813, "epoch": 3376} {"train_loss": -6.682024002075195, "global_step": 141814, "epoch": 3376} {"train_loss": -6.830999374389648, "global_step": 141815, "epoch": 3376} {"train_loss": -6.764508247375488, "global_step": 141816, "epoch": 3376} {"train_loss": -6.82955265045166, "global_step": 141817, "epoch": 3376} {"train_loss": -6.821300983428955, "global_step": 141818, "epoch": 3376} {"train_loss": -6.766941070556641, "global_step": 141819, "epoch": 3376} {"train_loss": -6.774002552032471, "global_step": 141820, "epoch": 3376} {"train_loss": -6.7855305671691895, "global_step": 141821, "epoch": 3376} {"train_loss": -6.825692176818848, "global_step": 141822, "epoch": 3376} {"train_loss": -6.837982177734375, "global_step": 141823, "epoch": 3376} {"train_loss": -6.796180725097656, "global_step": 141824, "epoch": 3376} {"train_loss": -6.834991931915283, "global_step": 141825, "epoch": 3376} {"train_loss": -6.891822338104248, "global_step": 141826, "epoch": 3376} {"train_loss": -6.813292503356934, "global_step": 141827, "epoch": 3376} {"train_loss": -6.866244316101074, "global_step": 141828, "epoch": 3376} {"train_loss": -6.724740982055664, "global_step": 141829, "epoch": 3376} {"train_loss": -6.899580955505371, "global_step": 141830, "epoch": 3376} {"train_loss": -6.78721809387207, "global_step": 141831, "epoch": 3376} {"train_loss": -6.762561798095703, "global_step": 141832, "epoch": 3376} {"train_loss": -6.785809187662034, "global_step": 141833, "epoch": 3376, "val_loss": 78112.578125} {"train_loss": -6.863563060760498, "global_step": 141834, "epoch": 3377} {"train_loss": -6.837360858917236, "global_step": 141835, "epoch": 3377} {"train_loss": -6.735143661499023, "global_step": 141836, "epoch": 3377} {"train_loss": -6.824578285217285, "global_step": 141837, "epoch": 3377} {"train_loss": -6.865762233734131, "global_step": 141838, "epoch": 3377} {"train_loss": -6.8544158935546875, "global_step": 141839, "epoch": 3377} {"train_loss": -6.827964782714844, "global_step": 141840, "epoch": 3377} {"train_loss": -6.7906012535095215, "global_step": 141841, "epoch": 3377} {"train_loss": -6.780622482299805, "global_step": 141842, "epoch": 3377} {"train_loss": -6.730843544006348, "global_step": 141843, "epoch": 3377} {"train_loss": -6.799947738647461, "global_step": 141844, "epoch": 3377} {"train_loss": -6.741274356842041, "global_step": 141845, "epoch": 3377} {"train_loss": -6.62022590637207, "global_step": 141846, "epoch": 3377} {"train_loss": -6.684482097625732, "global_step": 141847, "epoch": 3377} {"train_loss": -6.500316619873047, "global_step": 141848, "epoch": 3377} {"train_loss": -6.786937713623047, "global_step": 141849, "epoch": 3377} {"train_loss": -6.619153022766113, "global_step": 141850, "epoch": 3377} {"train_loss": -6.676239967346191, "global_step": 141851, "epoch": 3377} {"train_loss": -6.688178062438965, "global_step": 141852, "epoch": 3377} {"train_loss": -6.552707672119141, "global_step": 141853, "epoch": 3377} {"train_loss": -6.751989364624023, "global_step": 141854, "epoch": 3377} {"train_loss": -6.734842777252197, "global_step": 141855, "epoch": 3377} {"train_loss": -6.732804298400879, "global_step": 141856, "epoch": 3377} {"train_loss": -6.785886764526367, "global_step": 141857, "epoch": 3377} {"train_loss": -6.6125078201293945, "global_step": 141858, "epoch": 3377} {"train_loss": -6.697010517120361, "global_step": 141859, "epoch": 3377} {"train_loss": -6.8049116134643555, "global_step": 141860, "epoch": 3377} {"train_loss": -6.770866394042969, "global_step": 141861, "epoch": 3377} {"train_loss": -6.758880615234375, "global_step": 141862, "epoch": 3377} {"train_loss": -6.602133274078369, "global_step": 141863, "epoch": 3377} {"train_loss": -6.6568450927734375, "global_step": 141864, "epoch": 3377} {"train_loss": -6.740433692932129, "global_step": 141865, "epoch": 3377} {"train_loss": -6.606595039367676, "global_step": 141866, "epoch": 3377} {"train_loss": -6.681524276733398, "global_step": 141867, "epoch": 3377} {"train_loss": -6.795505523681641, "global_step": 141868, "epoch": 3377} {"train_loss": -6.803247451782227, "global_step": 141869, "epoch": 3377} {"train_loss": -6.831618309020996, "global_step": 141870, "epoch": 3377} {"train_loss": -6.655834197998047, "global_step": 141871, "epoch": 3377} {"train_loss": -6.8492560386657715, "global_step": 141872, "epoch": 3377} {"train_loss": -6.891718864440918, "global_step": 141873, "epoch": 3377} {"train_loss": -6.702437400817871, "global_step": 141874, "epoch": 3377} {"train_loss": -6.74096357254755, "global_step": 141875, "epoch": 3377, "val_loss": 78297.734375} {"train_loss": -6.82112979888916, "global_step": 141876, "epoch": 3378} {"train_loss": -6.826128005981445, "global_step": 141877, "epoch": 3378} {"train_loss": -6.861629009246826, "global_step": 141878, "epoch": 3378} {"train_loss": -6.792361736297607, "global_step": 141879, "epoch": 3378} {"train_loss": -6.873869895935059, "global_step": 141880, "epoch": 3378} {"train_loss": -6.819486141204834, "global_step": 141881, "epoch": 3378} {"train_loss": -6.75701904296875, "global_step": 141882, "epoch": 3378} {"train_loss": -6.727158546447754, "global_step": 141883, "epoch": 3378} {"train_loss": -6.9459381103515625, "global_step": 141884, "epoch": 3378} {"train_loss": -6.781589508056641, "global_step": 141885, "epoch": 3378} {"train_loss": -6.791686534881592, "global_step": 141886, "epoch": 3378} {"train_loss": -6.773435592651367, "global_step": 141887, "epoch": 3378} {"train_loss": -6.894689559936523, "global_step": 141888, "epoch": 3378} {"train_loss": -6.863101959228516, "global_step": 141889, "epoch": 3378} {"train_loss": -6.872870445251465, "global_step": 141890, "epoch": 3378} {"train_loss": -6.7832746505737305, "global_step": 141891, "epoch": 3378} {"train_loss": -6.860363960266113, "global_step": 141892, "epoch": 3378} {"train_loss": -6.792116641998291, "global_step": 141893, "epoch": 3378} {"train_loss": -6.724916458129883, "global_step": 141894, "epoch": 3378} {"train_loss": -6.7572832107543945, "global_step": 141895, "epoch": 3378} {"train_loss": -6.74976110458374, "global_step": 141896, "epoch": 3378} {"train_loss": -6.826169013977051, "global_step": 141897, "epoch": 3378} {"train_loss": -6.795065402984619, "global_step": 141898, "epoch": 3378} {"train_loss": -6.7492241859436035, "global_step": 141899, "epoch": 3378} {"train_loss": -6.76350212097168, "global_step": 141900, "epoch": 3378} {"train_loss": -6.700908184051514, "global_step": 141901, "epoch": 3378} {"train_loss": -6.656246185302734, "global_step": 141902, "epoch": 3378} {"train_loss": -6.766284942626953, "global_step": 141903, "epoch": 3378} {"train_loss": -6.715767860412598, "global_step": 141904, "epoch": 3378} {"train_loss": -6.859286308288574, "global_step": 141905, "epoch": 3378} {"train_loss": -6.630749702453613, "global_step": 141906, "epoch": 3378} {"train_loss": -6.680438041687012, "global_step": 141907, "epoch": 3378} {"train_loss": -6.589468002319336, "global_step": 141908, "epoch": 3378} {"train_loss": -6.840719699859619, "global_step": 141909, "epoch": 3378} {"train_loss": -6.746437072753906, "global_step": 141910, "epoch": 3378} {"train_loss": -6.667820453643799, "global_step": 141911, "epoch": 3378} {"train_loss": -6.795449256896973, "global_step": 141912, "epoch": 3378} {"train_loss": -6.773869514465332, "global_step": 141913, "epoch": 3378} {"train_loss": -6.653264045715332, "global_step": 141914, "epoch": 3378} {"train_loss": -6.71514892578125, "global_step": 141915, "epoch": 3378} {"train_loss": -6.730401515960693, "global_step": 141916, "epoch": 3378} {"train_loss": -6.7745309103102915, "global_step": 141917, "epoch": 3378, "val_loss": 78257.5546875} {"train_loss": -6.803508758544922, "global_step": 141918, "epoch": 3379} {"train_loss": -6.884032249450684, "global_step": 141919, "epoch": 3379} {"train_loss": -6.75791597366333, "global_step": 141920, "epoch": 3379} {"train_loss": -6.788578987121582, "global_step": 141921, "epoch": 3379} {"train_loss": -6.70582389831543, "global_step": 141922, "epoch": 3379} {"train_loss": -6.709469795227051, "global_step": 141923, "epoch": 3379} {"train_loss": -6.784059047698975, "global_step": 141924, "epoch": 3379} {"train_loss": -6.70986270904541, "global_step": 141925, "epoch": 3379} {"train_loss": -6.77990198135376, "global_step": 141926, "epoch": 3379} {"train_loss": -6.7262701988220215, "global_step": 141927, "epoch": 3379} {"train_loss": -6.763684272766113, "global_step": 141928, "epoch": 3379} {"train_loss": -6.824368476867676, "global_step": 141929, "epoch": 3379} {"train_loss": -6.744617462158203, "global_step": 141930, "epoch": 3379} {"train_loss": -6.728968620300293, "global_step": 141931, "epoch": 3379} {"train_loss": -6.810757637023926, "global_step": 141932, "epoch": 3379} {"train_loss": -6.815097332000732, "global_step": 141933, "epoch": 3379} {"train_loss": -6.672760009765625, "global_step": 141934, "epoch": 3379} {"train_loss": -6.7696533203125, "global_step": 141935, "epoch": 3379} {"train_loss": -6.8163533210754395, "global_step": 141936, "epoch": 3379} {"train_loss": -6.748561382293701, "global_step": 141937, "epoch": 3379} {"train_loss": -6.774762153625488, "global_step": 141938, "epoch": 3379} {"train_loss": -6.802736282348633, "global_step": 141939, "epoch": 3379} {"train_loss": -6.711511611938477, "global_step": 141940, "epoch": 3379} {"train_loss": -6.753185272216797, "global_step": 141941, "epoch": 3379} {"train_loss": -6.5570068359375, "global_step": 141942, "epoch": 3379} {"train_loss": -6.716710090637207, "global_step": 141943, "epoch": 3379} {"train_loss": -6.752959251403809, "global_step": 141944, "epoch": 3379} {"train_loss": -6.691403865814209, "global_step": 141945, "epoch": 3379} {"train_loss": -6.8308868408203125, "global_step": 141946, "epoch": 3379} {"train_loss": -6.6275482177734375, "global_step": 141947, "epoch": 3379} {"train_loss": -6.8121337890625, "global_step": 141948, "epoch": 3379} {"train_loss": -6.794751167297363, "global_step": 141949, "epoch": 3379} {"train_loss": -6.7181010246276855, "global_step": 141950, "epoch": 3379} {"train_loss": -6.59709358215332, "global_step": 141951, "epoch": 3379} {"train_loss": -6.672891616821289, "global_step": 141952, "epoch": 3379} {"train_loss": -6.705764293670654, "global_step": 141953, "epoch": 3379} {"train_loss": -6.784825325012207, "global_step": 141954, "epoch": 3379} {"train_loss": -6.650864601135254, "global_step": 141955, "epoch": 3379} {"train_loss": -6.7768402099609375, "global_step": 141956, "epoch": 3379} {"train_loss": -6.760002136230469, "global_step": 141957, "epoch": 3379} {"train_loss": -6.754599571228027, "global_step": 141958, "epoch": 3379} {"train_loss": -6.745105277924311, "global_step": 141959, "epoch": 3379, "val_loss": 78422.7109375} {"train_loss": -6.823791027069092, "global_step": 141960, "epoch": 3380} {"train_loss": -6.75075626373291, "global_step": 141961, "epoch": 3380} {"train_loss": -6.730940818786621, "global_step": 141962, "epoch": 3380} {"train_loss": -6.8139142990112305, "global_step": 141963, "epoch": 3380} {"train_loss": -6.646614074707031, "global_step": 141964, "epoch": 3380} {"train_loss": -6.709685802459717, "global_step": 141965, "epoch": 3380} {"train_loss": -6.7802324295043945, "global_step": 141966, "epoch": 3380} {"train_loss": -6.670013427734375, "global_step": 141967, "epoch": 3380} {"train_loss": -6.679732322692871, "global_step": 141968, "epoch": 3380} {"train_loss": -6.779062271118164, "global_step": 141969, "epoch": 3380} {"train_loss": -6.577836990356445, "global_step": 141970, "epoch": 3380} {"train_loss": -6.784812927246094, "global_step": 141971, "epoch": 3380} {"train_loss": -6.785346031188965, "global_step": 141972, "epoch": 3380} {"train_loss": -6.784790992736816, "global_step": 141973, "epoch": 3380} {"train_loss": -6.70013427734375, "global_step": 141974, "epoch": 3380} {"train_loss": -6.741313934326172, "global_step": 141975, "epoch": 3380} {"train_loss": -6.774165153503418, "global_step": 141976, "epoch": 3380} {"train_loss": -6.712701797485352, "global_step": 141977, "epoch": 3380} {"train_loss": -6.863500118255615, "global_step": 141978, "epoch": 3380} {"train_loss": -6.840846061706543, "global_step": 141979, "epoch": 3380} {"train_loss": -6.835168838500977, "global_step": 141980, "epoch": 3380} {"train_loss": -6.82591438293457, "global_step": 141981, "epoch": 3380} {"train_loss": -6.77100944519043, "global_step": 141982, "epoch": 3380} {"train_loss": -6.804165363311768, "global_step": 141983, "epoch": 3380} {"train_loss": -6.824954032897949, "global_step": 141984, "epoch": 3380} {"train_loss": -6.844519138336182, "global_step": 141985, "epoch": 3380} {"train_loss": -6.770816802978516, "global_step": 141986, "epoch": 3380} {"train_loss": -6.786399841308594, "global_step": 141987, "epoch": 3380} {"train_loss": -6.83900260925293, "global_step": 141988, "epoch": 3380} {"train_loss": -6.846245765686035, "global_step": 141989, "epoch": 3380} {"train_loss": -6.797608852386475, "global_step": 141990, "epoch": 3380} {"train_loss": -6.838483810424805, "global_step": 141991, "epoch": 3380} {"train_loss": -6.841718673706055, "global_step": 141992, "epoch": 3380} {"train_loss": -6.764853477478027, "global_step": 141993, "epoch": 3380} {"train_loss": -6.8114776611328125, "global_step": 141994, "epoch": 3380} {"train_loss": -6.734803199768066, "global_step": 141995, "epoch": 3380} {"train_loss": -6.8231964111328125, "global_step": 141996, "epoch": 3380} {"train_loss": -6.64488410949707, "global_step": 141997, "epoch": 3380} {"train_loss": -6.68701696395874, "global_step": 141998, "epoch": 3380} {"train_loss": -6.688970565795898, "global_step": 141999, "epoch": 3380} {"train_loss": -6.729308605194092, "global_step": 142000, "epoch": 3380} {"train_loss": -6.76739223798116, "global_step": 142001, "epoch": 3380, "val_loss": 78365.9609375} {"train_loss": -6.671967506408691, "global_step": 142002, "epoch": 3381} {"train_loss": -6.763155937194824, "global_step": 142003, "epoch": 3381} {"train_loss": -6.809041500091553, "global_step": 142004, "epoch": 3381} {"train_loss": -6.769865989685059, "global_step": 142005, "epoch": 3381} {"train_loss": -6.813309669494629, "global_step": 142006, "epoch": 3381} {"train_loss": -6.790587902069092, "global_step": 142007, "epoch": 3381} {"train_loss": -6.778262138366699, "global_step": 142008, "epoch": 3381} {"train_loss": -6.7902750968933105, "global_step": 142009, "epoch": 3381} {"train_loss": -6.821768760681152, "global_step": 142010, "epoch": 3381} {"train_loss": -6.8353400230407715, "global_step": 142011, "epoch": 3381} {"train_loss": -6.806726455688477, "global_step": 142012, "epoch": 3381} {"train_loss": -6.837400436401367, "global_step": 142013, "epoch": 3381} {"train_loss": -6.844009876251221, "global_step": 142014, "epoch": 3381} {"train_loss": -6.646005630493164, "global_step": 142015, "epoch": 3381} {"train_loss": -6.803429126739502, "global_step": 142016, "epoch": 3381} {"train_loss": -6.8639092445373535, "global_step": 142017, "epoch": 3381} {"train_loss": -6.771091461181641, "global_step": 142018, "epoch": 3381} {"train_loss": -6.663417816162109, "global_step": 142019, "epoch": 3381} {"train_loss": -6.817313194274902, "global_step": 142020, "epoch": 3381} {"train_loss": -6.6572675704956055, "global_step": 142021, "epoch": 3381} {"train_loss": -6.760043144226074, "global_step": 142022, "epoch": 3381} {"train_loss": -6.751967430114746, "global_step": 142023, "epoch": 3381} {"train_loss": -6.727218151092529, "global_step": 142024, "epoch": 3381} {"train_loss": -6.70650053024292, "global_step": 142025, "epoch": 3381} {"train_loss": -6.765565872192383, "global_step": 142026, "epoch": 3381} {"train_loss": -6.757997512817383, "global_step": 142027, "epoch": 3381} {"train_loss": -6.798555850982666, "global_step": 142028, "epoch": 3381} {"train_loss": -6.758869171142578, "global_step": 142029, "epoch": 3381} {"train_loss": -6.728710651397705, "global_step": 142030, "epoch": 3381} {"train_loss": -6.700433731079102, "global_step": 142031, "epoch": 3381} {"train_loss": -6.921126365661621, "global_step": 142032, "epoch": 3381} {"train_loss": -6.632501125335693, "global_step": 142033, "epoch": 3381} {"train_loss": -6.6990838050842285, "global_step": 142034, "epoch": 3381} {"train_loss": -6.814061641693115, "global_step": 142035, "epoch": 3381} {"train_loss": -6.81519889831543, "global_step": 142036, "epoch": 3381} {"train_loss": -6.732068061828613, "global_step": 142037, "epoch": 3381} {"train_loss": -6.795495986938477, "global_step": 142038, "epoch": 3381} {"train_loss": -6.764244079589844, "global_step": 142039, "epoch": 3381} {"train_loss": -6.708432674407959, "global_step": 142040, "epoch": 3381} {"train_loss": -6.908227443695068, "global_step": 142041, "epoch": 3381} {"train_loss": -6.625783920288086, "global_step": 142042, "epoch": 3381} {"train_loss": -6.769751526060558, "global_step": 142043, "epoch": 3381, "val_loss": 78242.0625} {"train_loss": -6.739178657531738, "global_step": 142044, "epoch": 3382} {"train_loss": -6.797614574432373, "global_step": 142045, "epoch": 3382} {"train_loss": -6.887330055236816, "global_step": 142046, "epoch": 3382} {"train_loss": -6.7761077880859375, "global_step": 142047, "epoch": 3382} {"train_loss": -6.836493968963623, "global_step": 142048, "epoch": 3382} {"train_loss": -6.872913837432861, "global_step": 142049, "epoch": 3382} {"train_loss": -6.764391899108887, "global_step": 142050, "epoch": 3382} {"train_loss": -6.792692184448242, "global_step": 142051, "epoch": 3382} {"train_loss": -6.702823638916016, "global_step": 142052, "epoch": 3382} {"train_loss": -6.867186546325684, "global_step": 142053, "epoch": 3382} {"train_loss": -6.760281085968018, "global_step": 142054, "epoch": 3382} {"train_loss": -6.854905128479004, "global_step": 142055, "epoch": 3382} {"train_loss": -6.758914470672607, "global_step": 142056, "epoch": 3382} {"train_loss": -6.820937156677246, "global_step": 142057, "epoch": 3382} {"train_loss": -6.877219200134277, "global_step": 142058, "epoch": 3382} {"train_loss": -6.8003716468811035, "global_step": 142059, "epoch": 3382} {"train_loss": -6.739566802978516, "global_step": 142060, "epoch": 3382} {"train_loss": -6.748472690582275, "global_step": 142061, "epoch": 3382} {"train_loss": -6.678374290466309, "global_step": 142062, "epoch": 3382} {"train_loss": -6.81205940246582, "global_step": 142063, "epoch": 3382} {"train_loss": -6.755064010620117, "global_step": 142064, "epoch": 3382} {"train_loss": -6.796964645385742, "global_step": 142065, "epoch": 3382} {"train_loss": -6.826601982116699, "global_step": 142066, "epoch": 3382} {"train_loss": -6.784287452697754, "global_step": 142067, "epoch": 3382} {"train_loss": -6.626321315765381, "global_step": 142068, "epoch": 3382} {"train_loss": -6.723241806030273, "global_step": 142069, "epoch": 3382} {"train_loss": -6.77049446105957, "global_step": 142070, "epoch": 3382} {"train_loss": -6.7249321937561035, "global_step": 142071, "epoch": 3382} {"train_loss": -6.778172492980957, "global_step": 142072, "epoch": 3382} {"train_loss": -6.554538726806641, "global_step": 142073, "epoch": 3382} {"train_loss": -6.666028022766113, "global_step": 142074, "epoch": 3382} {"train_loss": -6.831735610961914, "global_step": 142075, "epoch": 3382} {"train_loss": -6.478514671325684, "global_step": 142076, "epoch": 3382} {"train_loss": -6.752230644226074, "global_step": 142077, "epoch": 3382} {"train_loss": -6.6993513107299805, "global_step": 142078, "epoch": 3382} {"train_loss": -6.708902359008789, "global_step": 142079, "epoch": 3382} {"train_loss": -6.712640285491943, "global_step": 142080, "epoch": 3382} {"train_loss": -6.597927093505859, "global_step": 142081, "epoch": 3382} {"train_loss": -6.702192306518555, "global_step": 142082, "epoch": 3382} {"train_loss": -6.656978607177734, "global_step": 142083, "epoch": 3382} {"train_loss": -6.713991165161133, "global_step": 142084, "epoch": 3382} {"train_loss": -6.749131032398769, "global_step": 142085, "epoch": 3382, "val_loss": 78192.265625} {"train_loss": -6.7351579666137695, "global_step": 142086, "epoch": 3383} {"train_loss": -6.729903221130371, "global_step": 142087, "epoch": 3383} {"train_loss": -6.79913854598999, "global_step": 142088, "epoch": 3383} {"train_loss": -6.79911994934082, "global_step": 142089, "epoch": 3383} {"train_loss": -6.825838088989258, "global_step": 142090, "epoch": 3383} {"train_loss": -6.833652496337891, "global_step": 142091, "epoch": 3383} {"train_loss": -6.805833339691162, "global_step": 142092, "epoch": 3383} {"train_loss": -6.835981845855713, "global_step": 142093, "epoch": 3383} {"train_loss": -6.858148097991943, "global_step": 142094, "epoch": 3383} {"train_loss": -6.755325794219971, "global_step": 142095, "epoch": 3383} {"train_loss": -6.766222953796387, "global_step": 142096, "epoch": 3383} {"train_loss": -6.750094413757324, "global_step": 142097, "epoch": 3383} {"train_loss": -6.8415679931640625, "global_step": 142098, "epoch": 3383} {"train_loss": -6.703108787536621, "global_step": 142099, "epoch": 3383} {"train_loss": -6.70426082611084, "global_step": 142100, "epoch": 3383} {"train_loss": -6.725531578063965, "global_step": 142101, "epoch": 3383} {"train_loss": -6.774469375610352, "global_step": 142102, "epoch": 3383} {"train_loss": -6.741148471832275, "global_step": 142103, "epoch": 3383} {"train_loss": -6.772953033447266, "global_step": 142104, "epoch": 3383} {"train_loss": -6.825098037719727, "global_step": 142105, "epoch": 3383} {"train_loss": -6.821773529052734, "global_step": 142106, "epoch": 3383} {"train_loss": -6.852123737335205, "global_step": 142107, "epoch": 3383} {"train_loss": -6.8592119216918945, "global_step": 142108, "epoch": 3383} {"train_loss": -6.8335185050964355, "global_step": 142109, "epoch": 3383} {"train_loss": -6.869455337524414, "global_step": 142110, "epoch": 3383} {"train_loss": -6.941262722015381, "global_step": 142111, "epoch": 3383} {"train_loss": -6.808563232421875, "global_step": 142112, "epoch": 3383} {"train_loss": -6.901663780212402, "global_step": 142113, "epoch": 3383} {"train_loss": -6.866903305053711, "global_step": 142114, "epoch": 3383} {"train_loss": -6.839734077453613, "global_step": 142115, "epoch": 3383} {"train_loss": -6.820709228515625, "global_step": 142116, "epoch": 3383} {"train_loss": -6.90411901473999, "global_step": 142117, "epoch": 3383} {"train_loss": -6.763662338256836, "global_step": 142118, "epoch": 3383} {"train_loss": -6.880415439605713, "global_step": 142119, "epoch": 3383} {"train_loss": -6.900335311889648, "global_step": 142120, "epoch": 3383} {"train_loss": -6.773187160491943, "global_step": 142121, "epoch": 3383} {"train_loss": -6.640225410461426, "global_step": 142122, "epoch": 3383} {"train_loss": -6.762519359588623, "global_step": 142123, "epoch": 3383} {"train_loss": -6.695844650268555, "global_step": 142124, "epoch": 3383} {"train_loss": -6.576552391052246, "global_step": 142125, "epoch": 3383} {"train_loss": -6.719545841217041, "global_step": 142126, "epoch": 3383} {"train_loss": -6.791383232389178, "global_step": 142127, "epoch": 3383, "val_loss": 78424.78125} {"train_loss": -6.657998085021973, "global_step": 142128, "epoch": 3384} {"train_loss": -6.796584129333496, "global_step": 142129, "epoch": 3384} {"train_loss": -6.703890800476074, "global_step": 142130, "epoch": 3384} {"train_loss": -6.859372138977051, "global_step": 142131, "epoch": 3384} {"train_loss": -6.6551513671875, "global_step": 142132, "epoch": 3384} {"train_loss": -6.686309814453125, "global_step": 142133, "epoch": 3384} {"train_loss": -6.691381454467773, "global_step": 142134, "epoch": 3384} {"train_loss": -6.760796546936035, "global_step": 142135, "epoch": 3384} {"train_loss": -6.828408718109131, "global_step": 142136, "epoch": 3384} {"train_loss": -6.690178394317627, "global_step": 142137, "epoch": 3384} {"train_loss": -6.736332893371582, "global_step": 142138, "epoch": 3384} {"train_loss": -6.802825450897217, "global_step": 142139, "epoch": 3384} {"train_loss": -6.781381607055664, "global_step": 142140, "epoch": 3384} {"train_loss": -6.8354668617248535, "global_step": 142141, "epoch": 3384} {"train_loss": -6.828324317932129, "global_step": 142142, "epoch": 3384} {"train_loss": -6.74305534362793, "global_step": 142143, "epoch": 3384} {"train_loss": -6.884135723114014, "global_step": 142144, "epoch": 3384} {"train_loss": -6.811828136444092, "global_step": 142145, "epoch": 3384} {"train_loss": -6.862717628479004, "global_step": 142146, "epoch": 3384} {"train_loss": -6.795428276062012, "global_step": 142147, "epoch": 3384} {"train_loss": -6.747537136077881, "global_step": 142148, "epoch": 3384} {"train_loss": -6.874814987182617, "global_step": 142149, "epoch": 3384} {"train_loss": -6.795034885406494, "global_step": 142150, "epoch": 3384} {"train_loss": -6.7986040115356445, "global_step": 142151, "epoch": 3384} {"train_loss": -6.81668758392334, "global_step": 142152, "epoch": 3384} {"train_loss": -6.774752616882324, "global_step": 142153, "epoch": 3384} {"train_loss": -6.840041160583496, "global_step": 142154, "epoch": 3384} {"train_loss": -6.737349987030029, "global_step": 142155, "epoch": 3384} {"train_loss": -6.77928352355957, "global_step": 142156, "epoch": 3384} {"train_loss": -6.62033224105835, "global_step": 142157, "epoch": 3384} {"train_loss": -6.806617259979248, "global_step": 142158, "epoch": 3384} {"train_loss": -6.7750749588012695, "global_step": 142159, "epoch": 3384} {"train_loss": -6.789364814758301, "global_step": 142160, "epoch": 3384} {"train_loss": -6.727688312530518, "global_step": 142161, "epoch": 3384} {"train_loss": -6.820873260498047, "global_step": 142162, "epoch": 3384} {"train_loss": -6.680781364440918, "global_step": 142163, "epoch": 3384} {"train_loss": -6.755638122558594, "global_step": 142164, "epoch": 3384} {"train_loss": -6.663302421569824, "global_step": 142165, "epoch": 3384} {"train_loss": -6.783473014831543, "global_step": 142166, "epoch": 3384} {"train_loss": -6.766023635864258, "global_step": 142167, "epoch": 3384} {"train_loss": -6.7295145988464355, "global_step": 142168, "epoch": 3384} {"train_loss": -6.768604585102627, "global_step": 142169, "epoch": 3384, "val_loss": 78443.5} {"train_loss": -6.862034797668457, "global_step": 142170, "epoch": 3385} {"train_loss": -6.854124069213867, "global_step": 142171, "epoch": 3385} {"train_loss": -6.7946062088012695, "global_step": 142172, "epoch": 3385} {"train_loss": -6.845480442047119, "global_step": 142173, "epoch": 3385} {"train_loss": -6.873305320739746, "global_step": 142174, "epoch": 3385} {"train_loss": -6.845826148986816, "global_step": 142175, "epoch": 3385} {"train_loss": -6.707881927490234, "global_step": 142176, "epoch": 3385} {"train_loss": -6.886475563049316, "global_step": 142177, "epoch": 3385} {"train_loss": -6.830235481262207, "global_step": 142178, "epoch": 3385} {"train_loss": -6.6781744956970215, "global_step": 142179, "epoch": 3385} {"train_loss": -6.8179168701171875, "global_step": 142180, "epoch": 3385} {"train_loss": -6.740167140960693, "global_step": 142181, "epoch": 3385} {"train_loss": -6.910104274749756, "global_step": 142182, "epoch": 3385} {"train_loss": -6.750805377960205, "global_step": 142183, "epoch": 3385} {"train_loss": -6.609786033630371, "global_step": 142184, "epoch": 3385} {"train_loss": -6.876814365386963, "global_step": 142185, "epoch": 3385} {"train_loss": -6.567234039306641, "global_step": 142186, "epoch": 3385} {"train_loss": -6.610840320587158, "global_step": 142187, "epoch": 3385} {"train_loss": -6.761181354522705, "global_step": 142188, "epoch": 3385} {"train_loss": -6.603481292724609, "global_step": 142189, "epoch": 3385} {"train_loss": -6.756523132324219, "global_step": 142190, "epoch": 3385} {"train_loss": -6.716357231140137, "global_step": 142191, "epoch": 3385} {"train_loss": -6.681406497955322, "global_step": 142192, "epoch": 3385} {"train_loss": -6.708741188049316, "global_step": 142193, "epoch": 3385} {"train_loss": -6.800589561462402, "global_step": 142194, "epoch": 3385} {"train_loss": -6.779050827026367, "global_step": 142195, "epoch": 3385} {"train_loss": -6.664179801940918, "global_step": 142196, "epoch": 3385} {"train_loss": -6.826671600341797, "global_step": 142197, "epoch": 3385} {"train_loss": -6.8790130615234375, "global_step": 142198, "epoch": 3385} {"train_loss": -6.622335910797119, "global_step": 142199, "epoch": 3385} {"train_loss": -6.712851524353027, "global_step": 142200, "epoch": 3385} {"train_loss": -6.632869720458984, "global_step": 142201, "epoch": 3385} {"train_loss": -6.823929309844971, "global_step": 142202, "epoch": 3385} {"train_loss": -6.534137725830078, "global_step": 142203, "epoch": 3385} {"train_loss": -6.688701152801514, "global_step": 142204, "epoch": 3385} {"train_loss": -6.694853782653809, "global_step": 142205, "epoch": 3385} {"train_loss": -6.742768287658691, "global_step": 142206, "epoch": 3385} {"train_loss": -6.840373992919922, "global_step": 142207, "epoch": 3385} {"train_loss": -6.656527996063232, "global_step": 142208, "epoch": 3385} {"train_loss": -6.726163864135742, "global_step": 142209, "epoch": 3385} {"train_loss": -6.787391662597656, "global_step": 142210, "epoch": 3385} {"train_loss": -6.750336090723674, "global_step": 142211, "epoch": 3385, "val_loss": 78078.5078125} {"train_loss": -6.885153293609619, "global_step": 142212, "epoch": 3386} {"train_loss": -6.751264572143555, "global_step": 142213, "epoch": 3386} {"train_loss": -6.915402412414551, "global_step": 142214, "epoch": 3386} {"train_loss": -6.750787734985352, "global_step": 142215, "epoch": 3386} {"train_loss": -6.868502616882324, "global_step": 142216, "epoch": 3386} {"train_loss": -6.733795642852783, "global_step": 142217, "epoch": 3386} {"train_loss": -6.736883163452148, "global_step": 142218, "epoch": 3386} {"train_loss": -6.870250701904297, "global_step": 142219, "epoch": 3386} {"train_loss": -6.793728351593018, "global_step": 142220, "epoch": 3386} {"train_loss": -6.8167266845703125, "global_step": 142221, "epoch": 3386} {"train_loss": -6.712663173675537, "global_step": 142222, "epoch": 3386} {"train_loss": -6.7565155029296875, "global_step": 142223, "epoch": 3386} {"train_loss": -6.855433464050293, "global_step": 142224, "epoch": 3386} {"train_loss": -6.704448699951172, "global_step": 142225, "epoch": 3386} {"train_loss": -6.665097713470459, "global_step": 142226, "epoch": 3386} {"train_loss": -6.829833984375, "global_step": 142227, "epoch": 3386} {"train_loss": -6.696413516998291, "global_step": 142228, "epoch": 3386} {"train_loss": -6.755383491516113, "global_step": 142229, "epoch": 3386} {"train_loss": -6.630450248718262, "global_step": 142230, "epoch": 3386} {"train_loss": -6.819643020629883, "global_step": 142231, "epoch": 3386} {"train_loss": -6.791484832763672, "global_step": 142232, "epoch": 3386} {"train_loss": -6.638333797454834, "global_step": 142233, "epoch": 3386} {"train_loss": -6.733706474304199, "global_step": 142234, "epoch": 3386} {"train_loss": -6.700030326843262, "global_step": 142235, "epoch": 3386} {"train_loss": -6.736151218414307, "global_step": 142236, "epoch": 3386} {"train_loss": -6.656198501586914, "global_step": 142237, "epoch": 3386} {"train_loss": -6.7231597900390625, "global_step": 142238, "epoch": 3386} {"train_loss": -6.6123504638671875, "global_step": 142239, "epoch": 3386} {"train_loss": -6.6924028396606445, "global_step": 142240, "epoch": 3386} {"train_loss": -6.66310977935791, "global_step": 142241, "epoch": 3386} {"train_loss": -6.62547492980957, "global_step": 142242, "epoch": 3386} {"train_loss": -6.839785099029541, "global_step": 142243, "epoch": 3386} {"train_loss": -6.771609306335449, "global_step": 142244, "epoch": 3386} {"train_loss": -6.655470848083496, "global_step": 142245, "epoch": 3386} {"train_loss": -6.735973358154297, "global_step": 142246, "epoch": 3386} {"train_loss": -6.749508857727051, "global_step": 142247, "epoch": 3386} {"train_loss": -6.825520992279053, "global_step": 142248, "epoch": 3386} {"train_loss": -6.782047271728516, "global_step": 142249, "epoch": 3386} {"train_loss": -6.799614906311035, "global_step": 142250, "epoch": 3386} {"train_loss": -6.815169334411621, "global_step": 142251, "epoch": 3386} {"train_loss": -6.7234907150268555, "global_step": 142252, "epoch": 3386} {"train_loss": -6.7552902812049505, "global_step": 142253, "epoch": 3386, "val_loss": 77998.5546875} {"train_loss": -6.936476230621338, "global_step": 142254, "epoch": 3387} {"train_loss": -6.82373046875, "global_step": 142255, "epoch": 3387} {"train_loss": -6.784554958343506, "global_step": 142256, "epoch": 3387} {"train_loss": -6.8688459396362305, "global_step": 142257, "epoch": 3387} {"train_loss": -6.822757720947266, "global_step": 142258, "epoch": 3387} {"train_loss": -6.930177688598633, "global_step": 142259, "epoch": 3387} {"train_loss": -6.896873950958252, "global_step": 142260, "epoch": 3387} {"train_loss": -6.913993835449219, "global_step": 142261, "epoch": 3387} {"train_loss": -6.78767204284668, "global_step": 142262, "epoch": 3387} {"train_loss": -6.662052631378174, "global_step": 142263, "epoch": 3387} {"train_loss": -6.936311721801758, "global_step": 142264, "epoch": 3387} {"train_loss": -6.774121284484863, "global_step": 142265, "epoch": 3387} {"train_loss": -6.855316638946533, "global_step": 142266, "epoch": 3387} {"train_loss": -6.855841636657715, "global_step": 142267, "epoch": 3387} {"train_loss": -6.859318256378174, "global_step": 142268, "epoch": 3387} {"train_loss": -6.870110511779785, "global_step": 142269, "epoch": 3387} {"train_loss": -6.8801984786987305, "global_step": 142270, "epoch": 3387} {"train_loss": -6.883871078491211, "global_step": 142271, "epoch": 3387} {"train_loss": -6.850582122802734, "global_step": 142272, "epoch": 3387} {"train_loss": -6.804633140563965, "global_step": 142273, "epoch": 3387} {"train_loss": -6.919189453125, "global_step": 142274, "epoch": 3387} {"train_loss": -6.845011234283447, "global_step": 142275, "epoch": 3387} {"train_loss": -6.755998611450195, "global_step": 142276, "epoch": 3387} {"train_loss": -6.718679428100586, "global_step": 142277, "epoch": 3387} {"train_loss": -6.83903694152832, "global_step": 142278, "epoch": 3387} {"train_loss": -6.768854141235352, "global_step": 142279, "epoch": 3387} {"train_loss": -6.891746997833252, "global_step": 142280, "epoch": 3387} {"train_loss": -6.882477760314941, "global_step": 142281, "epoch": 3387} {"train_loss": -6.800807952880859, "global_step": 142282, "epoch": 3387} {"train_loss": -6.771542549133301, "global_step": 142283, "epoch": 3387} {"train_loss": -6.801136016845703, "global_step": 142284, "epoch": 3387} {"train_loss": -6.718000888824463, "global_step": 142285, "epoch": 3387} {"train_loss": -6.834585189819336, "global_step": 142286, "epoch": 3387} {"train_loss": -6.681560039520264, "global_step": 142287, "epoch": 3387} {"train_loss": -6.729935646057129, "global_step": 142288, "epoch": 3387} {"train_loss": -6.689511299133301, "global_step": 142289, "epoch": 3387} {"train_loss": -6.684769630432129, "global_step": 142290, "epoch": 3387} {"train_loss": -6.826432228088379, "global_step": 142291, "epoch": 3387} {"train_loss": -6.667644023895264, "global_step": 142292, "epoch": 3387} {"train_loss": -6.794478416442871, "global_step": 142293, "epoch": 3387} {"train_loss": -6.6826581954956055, "global_step": 142294, "epoch": 3387} {"train_loss": -6.808106025060018, "global_step": 142295, "epoch": 3387, "val_loss": 78153.3515625} {"train_loss": -6.613742828369141, "global_step": 142296, "epoch": 3388} {"train_loss": -6.710284233093262, "global_step": 142297, "epoch": 3388} {"train_loss": -6.793651103973389, "global_step": 142298, "epoch": 3388} {"train_loss": -6.699319839477539, "global_step": 142299, "epoch": 3388} {"train_loss": -6.750573635101318, "global_step": 142300, "epoch": 3388} {"train_loss": -6.704171180725098, "global_step": 142301, "epoch": 3388} {"train_loss": -6.786052703857422, "global_step": 142302, "epoch": 3388} {"train_loss": -6.6652727127075195, "global_step": 142303, "epoch": 3388} {"train_loss": -6.666468620300293, "global_step": 142304, "epoch": 3388} {"train_loss": -6.707242012023926, "global_step": 142305, "epoch": 3388} {"train_loss": -6.845067977905273, "global_step": 142306, "epoch": 3388} {"train_loss": -6.636638641357422, "global_step": 142307, "epoch": 3388} {"train_loss": -6.908295631408691, "global_step": 142308, "epoch": 3388} {"train_loss": -6.761046886444092, "global_step": 142309, "epoch": 3388} {"train_loss": -6.651544570922852, "global_step": 142310, "epoch": 3388} {"train_loss": -6.827532768249512, "global_step": 142311, "epoch": 3388} {"train_loss": -6.590690612792969, "global_step": 142312, "epoch": 3388} {"train_loss": -6.739166259765625, "global_step": 142313, "epoch": 3388} {"train_loss": -6.658246994018555, "global_step": 142314, "epoch": 3388} {"train_loss": -6.632085800170898, "global_step": 142315, "epoch": 3388} {"train_loss": -6.82249116897583, "global_step": 142316, "epoch": 3388} {"train_loss": -6.7033796310424805, "global_step": 142317, "epoch": 3388} {"train_loss": -6.740540504455566, "global_step": 142318, "epoch": 3388} {"train_loss": -6.829118251800537, "global_step": 142319, "epoch": 3388} {"train_loss": -6.729963302612305, "global_step": 142320, "epoch": 3388} {"train_loss": -6.788603782653809, "global_step": 142321, "epoch": 3388} {"train_loss": -6.707730770111084, "global_step": 142322, "epoch": 3388} {"train_loss": -6.855701923370361, "global_step": 142323, "epoch": 3388} {"train_loss": -6.801230430603027, "global_step": 142324, "epoch": 3388} {"train_loss": -6.805359840393066, "global_step": 142325, "epoch": 3388} {"train_loss": -6.749965190887451, "global_step": 142326, "epoch": 3388} {"train_loss": -6.7637763023376465, "global_step": 142327, "epoch": 3388} {"train_loss": -6.804883003234863, "global_step": 142328, "epoch": 3388} {"train_loss": -6.687699317932129, "global_step": 142329, "epoch": 3388} {"train_loss": -6.808378219604492, "global_step": 142330, "epoch": 3388} {"train_loss": -6.879270076751709, "global_step": 142331, "epoch": 3388} {"train_loss": -6.7054443359375, "global_step": 142332, "epoch": 3388} {"train_loss": -6.8173441886901855, "global_step": 142333, "epoch": 3388} {"train_loss": -6.836387634277344, "global_step": 142334, "epoch": 3388} {"train_loss": -6.693285942077637, "global_step": 142335, "epoch": 3388} {"train_loss": -6.759378910064697, "global_step": 142336, "epoch": 3388} {"train_loss": -6.745847781499227, "global_step": 142337, "epoch": 3388, "val_loss": 78313.328125} {"train_loss": -6.732917785644531, "global_step": 142338, "epoch": 3389} {"train_loss": -6.710843563079834, "global_step": 142339, "epoch": 3389} {"train_loss": -6.856935024261475, "global_step": 142340, "epoch": 3389} {"train_loss": -6.788588047027588, "global_step": 142341, "epoch": 3389} {"train_loss": -6.856473445892334, "global_step": 142342, "epoch": 3389} {"train_loss": -6.744057655334473, "global_step": 142343, "epoch": 3389} {"train_loss": -6.823754787445068, "global_step": 142344, "epoch": 3389} {"train_loss": -6.803118705749512, "global_step": 142345, "epoch": 3389} {"train_loss": -6.841931343078613, "global_step": 142346, "epoch": 3389} {"train_loss": -6.73127555847168, "global_step": 142347, "epoch": 3389} {"train_loss": -6.745852470397949, "global_step": 142348, "epoch": 3389} {"train_loss": -6.811966896057129, "global_step": 142349, "epoch": 3389} {"train_loss": -6.839273929595947, "global_step": 142350, "epoch": 3389} {"train_loss": -6.839857578277588, "global_step": 142351, "epoch": 3389} {"train_loss": -6.818658351898193, "global_step": 142352, "epoch": 3389} {"train_loss": -6.7990617752075195, "global_step": 142353, "epoch": 3389} {"train_loss": -6.8363165855407715, "global_step": 142354, "epoch": 3389} {"train_loss": -6.770647048950195, "global_step": 142355, "epoch": 3389} {"train_loss": -6.864252090454102, "global_step": 142356, "epoch": 3389} {"train_loss": -6.772914886474609, "global_step": 142357, "epoch": 3389} {"train_loss": -6.752461910247803, "global_step": 142358, "epoch": 3389} {"train_loss": -6.84401798248291, "global_step": 142359, "epoch": 3389} {"train_loss": -6.904603958129883, "global_step": 142360, "epoch": 3389} {"train_loss": -6.720229148864746, "global_step": 142361, "epoch": 3389} {"train_loss": -6.781381607055664, "global_step": 142362, "epoch": 3389} {"train_loss": -6.808733940124512, "global_step": 142363, "epoch": 3389} {"train_loss": -6.851130485534668, "global_step": 142364, "epoch": 3389} {"train_loss": -6.888821125030518, "global_step": 142365, "epoch": 3389} {"train_loss": -6.656656742095947, "global_step": 142366, "epoch": 3389} {"train_loss": -6.87551212310791, "global_step": 142367, "epoch": 3389} {"train_loss": -6.828316688537598, "global_step": 142368, "epoch": 3389} {"train_loss": -6.7819414138793945, "global_step": 142369, "epoch": 3389} {"train_loss": -6.719125747680664, "global_step": 142370, "epoch": 3389} {"train_loss": -6.736526966094971, "global_step": 142371, "epoch": 3389} {"train_loss": -6.572977066040039, "global_step": 142372, "epoch": 3389} {"train_loss": -6.9062113761901855, "global_step": 142373, "epoch": 3389} {"train_loss": -6.742819309234619, "global_step": 142374, "epoch": 3389} {"train_loss": -6.716773986816406, "global_step": 142375, "epoch": 3389} {"train_loss": -6.873918056488037, "global_step": 142376, "epoch": 3389} {"train_loss": -6.681640625, "global_step": 142377, "epoch": 3389} {"train_loss": -6.596482276916504, "global_step": 142378, "epoch": 3389} {"train_loss": -6.788300661813645, "global_step": 142379, "epoch": 3389, "val_loss": 78358.515625} {"train_loss": -6.720682621002197, "global_step": 142380, "epoch": 3390} {"train_loss": -6.776050567626953, "global_step": 142381, "epoch": 3390} {"train_loss": -6.816617965698242, "global_step": 142382, "epoch": 3390} {"train_loss": -6.9062933921813965, "global_step": 142383, "epoch": 3390} {"train_loss": -6.71578311920166, "global_step": 142384, "epoch": 3390} {"train_loss": -6.790191650390625, "global_step": 142385, "epoch": 3390} {"train_loss": -6.746580600738525, "global_step": 142386, "epoch": 3390} {"train_loss": -6.740313529968262, "global_step": 142387, "epoch": 3390} {"train_loss": -6.668393611907959, "global_step": 142388, "epoch": 3390} {"train_loss": -6.753561973571777, "global_step": 142389, "epoch": 3390} {"train_loss": -6.746835708618164, "global_step": 142390, "epoch": 3390} {"train_loss": -6.732454299926758, "global_step": 142391, "epoch": 3390} {"train_loss": -6.757057189941406, "global_step": 142392, "epoch": 3390} {"train_loss": -6.809112548828125, "global_step": 142393, "epoch": 3390} {"train_loss": -6.78331184387207, "global_step": 142394, "epoch": 3390} {"train_loss": -6.722145080566406, "global_step": 142395, "epoch": 3390} {"train_loss": -6.809957504272461, "global_step": 142396, "epoch": 3390} {"train_loss": -6.7973313331604, "global_step": 142397, "epoch": 3390} {"train_loss": -6.7654266357421875, "global_step": 142398, "epoch": 3390} {"train_loss": -6.770768165588379, "global_step": 142399, "epoch": 3390} {"train_loss": -6.6467976570129395, "global_step": 142400, "epoch": 3390} {"train_loss": -6.8287739753723145, "global_step": 142401, "epoch": 3390} {"train_loss": -6.7040815353393555, "global_step": 142402, "epoch": 3390} {"train_loss": -6.7274322509765625, "global_step": 142403, "epoch": 3390} {"train_loss": -6.8197126388549805, "global_step": 142404, "epoch": 3390} {"train_loss": -6.717927932739258, "global_step": 142405, "epoch": 3390} {"train_loss": -6.725222587585449, "global_step": 142406, "epoch": 3390} {"train_loss": -6.802391529083252, "global_step": 142407, "epoch": 3390} {"train_loss": -6.669781684875488, "global_step": 142408, "epoch": 3390} {"train_loss": -6.763674736022949, "global_step": 142409, "epoch": 3390} {"train_loss": -6.741687774658203, "global_step": 142410, "epoch": 3390} {"train_loss": -6.6781325340271, "global_step": 142411, "epoch": 3390} {"train_loss": -6.79390811920166, "global_step": 142412, "epoch": 3390} {"train_loss": -6.756500720977783, "global_step": 142413, "epoch": 3390} {"train_loss": -6.8186492919921875, "global_step": 142414, "epoch": 3390} {"train_loss": -6.689491271972656, "global_step": 142415, "epoch": 3390} {"train_loss": -6.82807731628418, "global_step": 142416, "epoch": 3390} {"train_loss": -6.818809509277344, "global_step": 142417, "epoch": 3390} {"train_loss": -6.732546806335449, "global_step": 142418, "epoch": 3390} {"train_loss": -6.678727149963379, "global_step": 142419, "epoch": 3390} {"train_loss": -6.7673139572143555, "global_step": 142420, "epoch": 3390} {"train_loss": -6.757609787441435, "global_step": 142421, "epoch": 3390, "val_loss": 78086.4296875} {"train_loss": -6.869722366333008, "global_step": 142422, "epoch": 3391} {"train_loss": -6.9068121910095215, "global_step": 142423, "epoch": 3391} {"train_loss": -6.700857162475586, "global_step": 142424, "epoch": 3391} {"train_loss": -6.8496222496032715, "global_step": 142425, "epoch": 3391} {"train_loss": -6.777520179748535, "global_step": 142426, "epoch": 3391} {"train_loss": -6.749971389770508, "global_step": 142427, "epoch": 3391} {"train_loss": -6.816997051239014, "global_step": 142428, "epoch": 3391} {"train_loss": -6.740633010864258, "global_step": 142429, "epoch": 3391} {"train_loss": -6.791980266571045, "global_step": 142430, "epoch": 3391} {"train_loss": -6.775531768798828, "global_step": 142431, "epoch": 3391} {"train_loss": -6.7534565925598145, "global_step": 142432, "epoch": 3391} {"train_loss": -6.775511741638184, "global_step": 142433, "epoch": 3391} {"train_loss": -6.713100910186768, "global_step": 142434, "epoch": 3391} {"train_loss": -6.829766273498535, "global_step": 142435, "epoch": 3391} {"train_loss": -6.672029495239258, "global_step": 142436, "epoch": 3391} {"train_loss": -6.872045516967773, "global_step": 142437, "epoch": 3391} {"train_loss": -6.771132469177246, "global_step": 142438, "epoch": 3391} {"train_loss": -6.845089435577393, "global_step": 142439, "epoch": 3391} {"train_loss": -6.762852668762207, "global_step": 142440, "epoch": 3391} {"train_loss": -6.747604846954346, "global_step": 142441, "epoch": 3391} {"train_loss": -6.7669854164123535, "global_step": 142442, "epoch": 3391} {"train_loss": -6.826437950134277, "global_step": 142443, "epoch": 3391} {"train_loss": -6.958096027374268, "global_step": 142444, "epoch": 3391} {"train_loss": -6.7376604080200195, "global_step": 142445, "epoch": 3391} {"train_loss": -6.726820468902588, "global_step": 142446, "epoch": 3391} {"train_loss": -6.793326377868652, "global_step": 142447, "epoch": 3391} {"train_loss": -6.7150068283081055, "global_step": 142448, "epoch": 3391} {"train_loss": -6.78692626953125, "global_step": 142449, "epoch": 3391} {"train_loss": -6.835282325744629, "global_step": 142450, "epoch": 3391} {"train_loss": -6.867295265197754, "global_step": 142451, "epoch": 3391} {"train_loss": -6.904990196228027, "global_step": 142452, "epoch": 3391} {"train_loss": -6.785312175750732, "global_step": 142453, "epoch": 3391} {"train_loss": -6.791237831115723, "global_step": 142454, "epoch": 3391} {"train_loss": -6.841977596282959, "global_step": 142455, "epoch": 3391} {"train_loss": -6.830530643463135, "global_step": 142456, "epoch": 3391} {"train_loss": -6.8083295822143555, "global_step": 142457, "epoch": 3391} {"train_loss": -6.727741241455078, "global_step": 142458, "epoch": 3391} {"train_loss": -6.784806251525879, "global_step": 142459, "epoch": 3391} {"train_loss": -6.722596168518066, "global_step": 142460, "epoch": 3391} {"train_loss": -6.79998254776001, "global_step": 142461, "epoch": 3391} {"train_loss": -6.7970709800720215, "global_step": 142462, "epoch": 3391} {"train_loss": -6.7929018679119295, "global_step": 142463, "epoch": 3391, "val_loss": 78659.6484375} {"train_loss": -6.832267761230469, "global_step": 142464, "epoch": 3392} {"train_loss": -6.760704040527344, "global_step": 142465, "epoch": 3392} {"train_loss": -6.688508033752441, "global_step": 142466, "epoch": 3392} {"train_loss": -6.922978401184082, "global_step": 142467, "epoch": 3392} {"train_loss": -6.809436798095703, "global_step": 142468, "epoch": 3392} {"train_loss": -6.780282020568848, "global_step": 142469, "epoch": 3392} {"train_loss": -6.902891159057617, "global_step": 142470, "epoch": 3392} {"train_loss": -6.811361312866211, "global_step": 142471, "epoch": 3392} {"train_loss": -6.852607727050781, "global_step": 142472, "epoch": 3392} {"train_loss": -6.984118461608887, "global_step": 142473, "epoch": 3392} {"train_loss": -6.840048789978027, "global_step": 142474, "epoch": 3392} {"train_loss": -6.7728495597839355, "global_step": 142475, "epoch": 3392} {"train_loss": -6.765334129333496, "global_step": 142476, "epoch": 3392} {"train_loss": -6.864502906799316, "global_step": 142477, "epoch": 3392} {"train_loss": -6.786133766174316, "global_step": 142478, "epoch": 3392} {"train_loss": -6.716081619262695, "global_step": 142479, "epoch": 3392} {"train_loss": -6.834819793701172, "global_step": 142480, "epoch": 3392} {"train_loss": -6.6898088455200195, "global_step": 142481, "epoch": 3392} {"train_loss": -6.808899879455566, "global_step": 142482, "epoch": 3392} {"train_loss": -6.89959716796875, "global_step": 142483, "epoch": 3392} {"train_loss": -6.894598960876465, "global_step": 142484, "epoch": 3392} {"train_loss": -6.910987854003906, "global_step": 142485, "epoch": 3392} {"train_loss": -6.7828369140625, "global_step": 142486, "epoch": 3392} {"train_loss": -6.730587005615234, "global_step": 142487, "epoch": 3392} {"train_loss": -6.88047456741333, "global_step": 142488, "epoch": 3392} {"train_loss": -6.647904396057129, "global_step": 142489, "epoch": 3392} {"train_loss": -6.692523002624512, "global_step": 142490, "epoch": 3392} {"train_loss": -6.899827480316162, "global_step": 142491, "epoch": 3392} {"train_loss": -6.831643104553223, "global_step": 142492, "epoch": 3392} {"train_loss": -6.91319465637207, "global_step": 142493, "epoch": 3392} {"train_loss": -6.852051734924316, "global_step": 142494, "epoch": 3392} {"train_loss": -6.740524768829346, "global_step": 142495, "epoch": 3392} {"train_loss": -6.810962677001953, "global_step": 142496, "epoch": 3392} {"train_loss": -6.740135669708252, "global_step": 142497, "epoch": 3392} {"train_loss": -6.71150541305542, "global_step": 142498, "epoch": 3392} {"train_loss": -6.883230209350586, "global_step": 142499, "epoch": 3392} {"train_loss": -6.734962463378906, "global_step": 142500, "epoch": 3392} {"train_loss": -6.936997413635254, "global_step": 142501, "epoch": 3392} {"train_loss": -6.845427513122559, "global_step": 142502, "epoch": 3392} {"train_loss": -6.834193229675293, "global_step": 142503, "epoch": 3392} {"train_loss": -6.725291728973389, "global_step": 142504, "epoch": 3392} {"train_loss": -6.814380509512765, "global_step": 142505, "epoch": 3392, "val_loss": 77917.7578125} {"train_loss": -6.819471836090088, "global_step": 142506, "epoch": 3393} {"train_loss": -6.883824348449707, "global_step": 142507, "epoch": 3393} {"train_loss": -6.845943450927734, "global_step": 142508, "epoch": 3393} {"train_loss": -6.796486854553223, "global_step": 142509, "epoch": 3393} {"train_loss": -6.9187798500061035, "global_step": 142510, "epoch": 3393} {"train_loss": -6.747293472290039, "global_step": 142511, "epoch": 3393} {"train_loss": -6.877364158630371, "global_step": 142512, "epoch": 3393} {"train_loss": -6.930297374725342, "global_step": 142513, "epoch": 3393} {"train_loss": -6.845142364501953, "global_step": 142514, "epoch": 3393} {"train_loss": -6.832033634185791, "global_step": 142515, "epoch": 3393} {"train_loss": -6.74459171295166, "global_step": 142516, "epoch": 3393} {"train_loss": -6.863102912902832, "global_step": 142517, "epoch": 3393} {"train_loss": -6.73990535736084, "global_step": 142518, "epoch": 3393} {"train_loss": -6.67934513092041, "global_step": 142519, "epoch": 3393} {"train_loss": -6.700206756591797, "global_step": 142520, "epoch": 3393} {"train_loss": -6.671148777008057, "global_step": 142521, "epoch": 3393} {"train_loss": -6.55068826675415, "global_step": 142522, "epoch": 3393} {"train_loss": -6.591879844665527, "global_step": 142523, "epoch": 3393} {"train_loss": -6.719423294067383, "global_step": 142524, "epoch": 3393} {"train_loss": -6.705300331115723, "global_step": 142525, "epoch": 3393} {"train_loss": -6.85081672668457, "global_step": 142526, "epoch": 3393} {"train_loss": -6.5450968742370605, "global_step": 142527, "epoch": 3393} {"train_loss": -6.860968112945557, "global_step": 142528, "epoch": 3393} {"train_loss": -6.5764360427856445, "global_step": 142529, "epoch": 3393} {"train_loss": -6.7962470054626465, "global_step": 142530, "epoch": 3393} {"train_loss": -6.718898773193359, "global_step": 142531, "epoch": 3393} {"train_loss": -6.677563667297363, "global_step": 142532, "epoch": 3393} {"train_loss": -6.6056928634643555, "global_step": 142533, "epoch": 3393} {"train_loss": -6.591375350952148, "global_step": 142534, "epoch": 3393} {"train_loss": -6.663036346435547, "global_step": 142535, "epoch": 3393} {"train_loss": -6.732501983642578, "global_step": 142536, "epoch": 3393} {"train_loss": -6.539231777191162, "global_step": 142537, "epoch": 3393} {"train_loss": -6.630525588989258, "global_step": 142538, "epoch": 3393} {"train_loss": -6.62020206451416, "global_step": 142539, "epoch": 3393} {"train_loss": -6.767468452453613, "global_step": 142540, "epoch": 3393} {"train_loss": -6.651905059814453, "global_step": 142541, "epoch": 3393} {"train_loss": -6.750857353210449, "global_step": 142542, "epoch": 3393} {"train_loss": -6.705967426300049, "global_step": 142543, "epoch": 3393} {"train_loss": -6.6797380447387695, "global_step": 142544, "epoch": 3393} {"train_loss": -6.726041316986084, "global_step": 142545, "epoch": 3393} {"train_loss": -6.688296318054199, "global_step": 142546, "epoch": 3393} {"train_loss": -6.726792823700678, "global_step": 142547, "epoch": 3393, "val_loss": 78247.7109375} {"train_loss": -6.697044849395752, "global_step": 142548, "epoch": 3394} {"train_loss": -6.852642059326172, "global_step": 142549, "epoch": 3394} {"train_loss": -6.661555290222168, "global_step": 142550, "epoch": 3394} {"train_loss": -6.815971374511719, "global_step": 142551, "epoch": 3394} {"train_loss": -6.743640422821045, "global_step": 142552, "epoch": 3394} {"train_loss": -6.746959209442139, "global_step": 142553, "epoch": 3394} {"train_loss": -6.721428871154785, "global_step": 142554, "epoch": 3394} {"train_loss": -6.834092617034912, "global_step": 142555, "epoch": 3394} {"train_loss": -6.774370193481445, "global_step": 142556, "epoch": 3394} {"train_loss": -6.715522766113281, "global_step": 142557, "epoch": 3394} {"train_loss": -6.928153038024902, "global_step": 142558, "epoch": 3394} {"train_loss": -6.785373210906982, "global_step": 142559, "epoch": 3394} {"train_loss": -6.83250617980957, "global_step": 142560, "epoch": 3394} {"train_loss": -6.804247856140137, "global_step": 142561, "epoch": 3394} {"train_loss": -6.7527875900268555, "global_step": 142562, "epoch": 3394} {"train_loss": -6.793951034545898, "global_step": 142563, "epoch": 3394} {"train_loss": -6.7148332595825195, "global_step": 142564, "epoch": 3394} {"train_loss": -6.814100742340088, "global_step": 142565, "epoch": 3394} {"train_loss": -6.882930278778076, "global_step": 142566, "epoch": 3394} {"train_loss": -6.8776044845581055, "global_step": 142567, "epoch": 3394} {"train_loss": -6.867214202880859, "global_step": 142568, "epoch": 3394} {"train_loss": -6.807704925537109, "global_step": 142569, "epoch": 3394} {"train_loss": -6.781323432922363, "global_step": 142570, "epoch": 3394} {"train_loss": -6.7686333656311035, "global_step": 142571, "epoch": 3394} {"train_loss": -6.741708755493164, "global_step": 142572, "epoch": 3394} {"train_loss": -6.803118705749512, "global_step": 142573, "epoch": 3394} {"train_loss": -6.958787441253662, "global_step": 142574, "epoch": 3394} {"train_loss": -6.751317024230957, "global_step": 142575, "epoch": 3394} {"train_loss": -6.821895122528076, "global_step": 142576, "epoch": 3394} {"train_loss": -6.9278059005737305, "global_step": 142577, "epoch": 3394} {"train_loss": -6.775944709777832, "global_step": 142578, "epoch": 3394} {"train_loss": -6.815774917602539, "global_step": 142579, "epoch": 3394} {"train_loss": -6.842565536499023, "global_step": 142580, "epoch": 3394} {"train_loss": -6.846549034118652, "global_step": 142581, "epoch": 3394} {"train_loss": -6.7023725509643555, "global_step": 142582, "epoch": 3394} {"train_loss": -6.7126851081848145, "global_step": 142583, "epoch": 3394} {"train_loss": -6.669606685638428, "global_step": 142584, "epoch": 3394} {"train_loss": -6.917502403259277, "global_step": 142585, "epoch": 3394} {"train_loss": -6.654529571533203, "global_step": 142586, "epoch": 3394} {"train_loss": -6.799261093139648, "global_step": 142587, "epoch": 3394} {"train_loss": -6.829503059387207, "global_step": 142588, "epoch": 3394} {"train_loss": -6.792016438075474, "global_step": 142589, "epoch": 3394, "val_loss": 78278.0859375} {"train_loss": -6.860887050628662, "global_step": 142590, "epoch": 3395} {"train_loss": -6.830141067504883, "global_step": 142591, "epoch": 3395} {"train_loss": -6.702310085296631, "global_step": 142592, "epoch": 3395} {"train_loss": -6.814555644989014, "global_step": 142593, "epoch": 3395} {"train_loss": -6.651398181915283, "global_step": 142594, "epoch": 3395} {"train_loss": -6.687655448913574, "global_step": 142595, "epoch": 3395} {"train_loss": -6.704951286315918, "global_step": 142596, "epoch": 3395} {"train_loss": -6.844415664672852, "global_step": 142597, "epoch": 3395} {"train_loss": -6.734156131744385, "global_step": 142598, "epoch": 3395} {"train_loss": -6.728992462158203, "global_step": 142599, "epoch": 3395} {"train_loss": -6.783690452575684, "global_step": 142600, "epoch": 3395} {"train_loss": -6.846003532409668, "global_step": 142601, "epoch": 3395} {"train_loss": -6.721144199371338, "global_step": 142602, "epoch": 3395} {"train_loss": -6.785615921020508, "global_step": 142603, "epoch": 3395} {"train_loss": -6.755239486694336, "global_step": 142604, "epoch": 3395} {"train_loss": -6.85774040222168, "global_step": 142605, "epoch": 3395} {"train_loss": -6.826920509338379, "global_step": 142606, "epoch": 3395} {"train_loss": -6.832582473754883, "global_step": 142607, "epoch": 3395} {"train_loss": -6.73272705078125, "global_step": 142608, "epoch": 3395} {"train_loss": -6.776640892028809, "global_step": 142609, "epoch": 3395} {"train_loss": -6.9308762550354, "global_step": 142610, "epoch": 3395} {"train_loss": -6.821619987487793, "global_step": 142611, "epoch": 3395} {"train_loss": -6.715789794921875, "global_step": 142612, "epoch": 3395} {"train_loss": -6.792099952697754, "global_step": 142613, "epoch": 3395} {"train_loss": -6.899051189422607, "global_step": 142614, "epoch": 3395} {"train_loss": -6.765841484069824, "global_step": 142615, "epoch": 3395} {"train_loss": -6.700815200805664, "global_step": 142616, "epoch": 3395} {"train_loss": -6.736279010772705, "global_step": 142617, "epoch": 3395} {"train_loss": -6.76922607421875, "global_step": 142618, "epoch": 3395} {"train_loss": -6.923849582672119, "global_step": 142619, "epoch": 3395} {"train_loss": -6.775114059448242, "global_step": 142620, "epoch": 3395} {"train_loss": -6.757241249084473, "global_step": 142621, "epoch": 3395} {"train_loss": -6.845559120178223, "global_step": 142622, "epoch": 3395} {"train_loss": -6.793820381164551, "global_step": 142623, "epoch": 3395} {"train_loss": -6.778963088989258, "global_step": 142624, "epoch": 3395} {"train_loss": -6.7716498374938965, "global_step": 142625, "epoch": 3395} {"train_loss": -6.737105846405029, "global_step": 142626, "epoch": 3395} {"train_loss": -6.794948577880859, "global_step": 142627, "epoch": 3395} {"train_loss": -6.823645114898682, "global_step": 142628, "epoch": 3395} {"train_loss": -6.851953983306885, "global_step": 142629, "epoch": 3395} {"train_loss": -6.735574722290039, "global_step": 142630, "epoch": 3395} {"train_loss": -6.787326222374325, "global_step": 142631, "epoch": 3395, "val_loss": 78230.4609375} {"train_loss": -6.801426410675049, "global_step": 142632, "epoch": 3396} {"train_loss": -6.8399128913879395, "global_step": 142633, "epoch": 3396} {"train_loss": -6.897601127624512, "global_step": 142634, "epoch": 3396} {"train_loss": -6.649153709411621, "global_step": 142635, "epoch": 3396} {"train_loss": -6.785603046417236, "global_step": 142636, "epoch": 3396} {"train_loss": -6.709066390991211, "global_step": 142637, "epoch": 3396} {"train_loss": -6.840137004852295, "global_step": 142638, "epoch": 3396} {"train_loss": -6.818266868591309, "global_step": 142639, "epoch": 3396} {"train_loss": -6.890496253967285, "global_step": 142640, "epoch": 3396} {"train_loss": -6.740635395050049, "global_step": 142641, "epoch": 3396} {"train_loss": -6.709568500518799, "global_step": 142642, "epoch": 3396} {"train_loss": -6.823347091674805, "global_step": 142643, "epoch": 3396} {"train_loss": -6.809988975524902, "global_step": 142644, "epoch": 3396} {"train_loss": -6.648220062255859, "global_step": 142645, "epoch": 3396} {"train_loss": -6.759958267211914, "global_step": 142646, "epoch": 3396} {"train_loss": -6.696502685546875, "global_step": 142647, "epoch": 3396} {"train_loss": -6.848778247833252, "global_step": 142648, "epoch": 3396} {"train_loss": -6.884623050689697, "global_step": 142649, "epoch": 3396} {"train_loss": -6.790823459625244, "global_step": 142650, "epoch": 3396} {"train_loss": -6.939093589782715, "global_step": 142651, "epoch": 3396} {"train_loss": -6.745469093322754, "global_step": 142652, "epoch": 3396} {"train_loss": -6.778773307800293, "global_step": 142653, "epoch": 3396} {"train_loss": -6.778631687164307, "global_step": 142654, "epoch": 3396} {"train_loss": -6.699202060699463, "global_step": 142655, "epoch": 3396} {"train_loss": -6.891780853271484, "global_step": 142656, "epoch": 3396} {"train_loss": -6.819859027862549, "global_step": 142657, "epoch": 3396} {"train_loss": -6.808455467224121, "global_step": 142658, "epoch": 3396} {"train_loss": -6.75473165512085, "global_step": 142659, "epoch": 3396} {"train_loss": -6.844598293304443, "global_step": 142660, "epoch": 3396} {"train_loss": -6.855019569396973, "global_step": 142661, "epoch": 3396} {"train_loss": -6.767816543579102, "global_step": 142662, "epoch": 3396} {"train_loss": -6.773543357849121, "global_step": 142663, "epoch": 3396} {"train_loss": -6.742870807647705, "global_step": 142664, "epoch": 3396} {"train_loss": -6.755044937133789, "global_step": 142665, "epoch": 3396} {"train_loss": -6.78777551651001, "global_step": 142666, "epoch": 3396} {"train_loss": -6.6746649742126465, "global_step": 142667, "epoch": 3396} {"train_loss": -6.815289497375488, "global_step": 142668, "epoch": 3396} {"train_loss": -6.956421375274658, "global_step": 142669, "epoch": 3396} {"train_loss": -6.803740501403809, "global_step": 142670, "epoch": 3396} {"train_loss": -6.879239082336426, "global_step": 142671, "epoch": 3396} {"train_loss": -6.843896865844727, "global_step": 142672, "epoch": 3396} {"train_loss": -6.795718817483811, "global_step": 142673, "epoch": 3396, "val_loss": 78340.515625} {"train_loss": -6.815637588500977, "global_step": 142674, "epoch": 3397} {"train_loss": -6.78656005859375, "global_step": 142675, "epoch": 3397} {"train_loss": -6.935985565185547, "global_step": 142676, "epoch": 3397} {"train_loss": -6.772171974182129, "global_step": 142677, "epoch": 3397} {"train_loss": -6.822775840759277, "global_step": 142678, "epoch": 3397} {"train_loss": -6.852283477783203, "global_step": 142679, "epoch": 3397} {"train_loss": -6.776543617248535, "global_step": 142680, "epoch": 3397} {"train_loss": -6.860272407531738, "global_step": 142681, "epoch": 3397} {"train_loss": -6.848641872406006, "global_step": 142682, "epoch": 3397} {"train_loss": -6.7274489402771, "global_step": 142683, "epoch": 3397} {"train_loss": -6.80446195602417, "global_step": 142684, "epoch": 3397} {"train_loss": -6.808602333068848, "global_step": 142685, "epoch": 3397} {"train_loss": -6.785791397094727, "global_step": 142686, "epoch": 3397} {"train_loss": -6.759469985961914, "global_step": 142687, "epoch": 3397} {"train_loss": -6.765633583068848, "global_step": 142688, "epoch": 3397} {"train_loss": -6.800412654876709, "global_step": 142689, "epoch": 3397} {"train_loss": -6.883631706237793, "global_step": 142690, "epoch": 3397} {"train_loss": -6.704512596130371, "global_step": 142691, "epoch": 3397} {"train_loss": -6.719306945800781, "global_step": 142692, "epoch": 3397} {"train_loss": -6.748553276062012, "global_step": 142693, "epoch": 3397} {"train_loss": -6.79865837097168, "global_step": 142694, "epoch": 3397} {"train_loss": -6.774941921234131, "global_step": 142695, "epoch": 3397} {"train_loss": -6.767000198364258, "global_step": 142696, "epoch": 3397} {"train_loss": -6.799830436706543, "global_step": 142697, "epoch": 3397} {"train_loss": -6.726775169372559, "global_step": 142698, "epoch": 3397} {"train_loss": -6.627334117889404, "global_step": 142699, "epoch": 3397} {"train_loss": -6.856927871704102, "global_step": 142700, "epoch": 3397} {"train_loss": -6.62642240524292, "global_step": 142701, "epoch": 3397} {"train_loss": -6.680756568908691, "global_step": 142702, "epoch": 3397} {"train_loss": -6.752780437469482, "global_step": 142703, "epoch": 3397} {"train_loss": -6.6962080001831055, "global_step": 142704, "epoch": 3397} {"train_loss": -6.667201042175293, "global_step": 142705, "epoch": 3397} {"train_loss": -6.784865379333496, "global_step": 142706, "epoch": 3397} {"train_loss": -6.728631496429443, "global_step": 142707, "epoch": 3397} {"train_loss": -6.7328572273254395, "global_step": 142708, "epoch": 3397} {"train_loss": -6.701169490814209, "global_step": 142709, "epoch": 3397} {"train_loss": -6.709273338317871, "global_step": 142710, "epoch": 3397} {"train_loss": -6.848186492919922, "global_step": 142711, "epoch": 3397} {"train_loss": -6.734821796417236, "global_step": 142712, "epoch": 3397} {"train_loss": -6.739479064941406, "global_step": 142713, "epoch": 3397} {"train_loss": -6.764088153839111, "global_step": 142714, "epoch": 3397} {"train_loss": -6.77106507619222, "global_step": 142715, "epoch": 3397, "val_loss": 78407.765625} {"train_loss": -6.815769195556641, "global_step": 142716, "epoch": 3398} {"train_loss": -6.871719837188721, "global_step": 142717, "epoch": 3398} {"train_loss": -6.844941139221191, "global_step": 142718, "epoch": 3398} {"train_loss": -6.768282890319824, "global_step": 142719, "epoch": 3398} {"train_loss": -6.941725730895996, "global_step": 142720, "epoch": 3398} {"train_loss": -6.806550025939941, "global_step": 142721, "epoch": 3398} {"train_loss": -6.737163543701172, "global_step": 142722, "epoch": 3398} {"train_loss": -6.981589317321777, "global_step": 142723, "epoch": 3398} {"train_loss": -6.937431335449219, "global_step": 142724, "epoch": 3398} {"train_loss": -6.707705020904541, "global_step": 142725, "epoch": 3398} {"train_loss": -6.7225542068481445, "global_step": 142726, "epoch": 3398} {"train_loss": -6.8404951095581055, "global_step": 142727, "epoch": 3398} {"train_loss": -6.942336082458496, "global_step": 142728, "epoch": 3398} {"train_loss": -6.807070255279541, "global_step": 142729, "epoch": 3398} {"train_loss": -6.917426109313965, "global_step": 142730, "epoch": 3398} {"train_loss": -6.880749225616455, "global_step": 142731, "epoch": 3398} {"train_loss": -6.786626815795898, "global_step": 142732, "epoch": 3398} {"train_loss": -6.869080066680908, "global_step": 142733, "epoch": 3398} {"train_loss": -6.87779426574707, "global_step": 142734, "epoch": 3398} {"train_loss": -6.811909198760986, "global_step": 142735, "epoch": 3398} {"train_loss": -6.789812088012695, "global_step": 142736, "epoch": 3398} {"train_loss": -6.873993873596191, "global_step": 142737, "epoch": 3398} {"train_loss": -6.776899337768555, "global_step": 142738, "epoch": 3398} {"train_loss": -6.862527847290039, "global_step": 142739, "epoch": 3398} {"train_loss": -6.719170570373535, "global_step": 142740, "epoch": 3398} {"train_loss": -6.722399711608887, "global_step": 142741, "epoch": 3398} {"train_loss": -6.6509199142456055, "global_step": 142742, "epoch": 3398} {"train_loss": -6.78933048248291, "global_step": 142743, "epoch": 3398} {"train_loss": -6.593611717224121, "global_step": 142744, "epoch": 3398} {"train_loss": -6.677496910095215, "global_step": 142745, "epoch": 3398} {"train_loss": -6.804269790649414, "global_step": 142746, "epoch": 3398} {"train_loss": -6.585165977478027, "global_step": 142747, "epoch": 3398} {"train_loss": -6.647794246673584, "global_step": 142748, "epoch": 3398} {"train_loss": -6.794471740722656, "global_step": 142749, "epoch": 3398} {"train_loss": -6.608386993408203, "global_step": 142750, "epoch": 3398} {"train_loss": -6.787871360778809, "global_step": 142751, "epoch": 3398} {"train_loss": -6.542656898498535, "global_step": 142752, "epoch": 3398} {"train_loss": -6.613929271697998, "global_step": 142753, "epoch": 3398} {"train_loss": -6.731668472290039, "global_step": 142754, "epoch": 3398} {"train_loss": -6.637341499328613, "global_step": 142755, "epoch": 3398} {"train_loss": -6.783245086669922, "global_step": 142756, "epoch": 3398} {"train_loss": -6.772315229688372, "global_step": 142757, "epoch": 3398, "val_loss": 78225.28125} {"train_loss": -6.808424949645996, "global_step": 142758, "epoch": 3399} {"train_loss": -6.686544418334961, "global_step": 142759, "epoch": 3399} {"train_loss": -6.690186977386475, "global_step": 142760, "epoch": 3399} {"train_loss": -6.824924468994141, "global_step": 142761, "epoch": 3399} {"train_loss": -6.726663112640381, "global_step": 142762, "epoch": 3399} {"train_loss": -6.777255535125732, "global_step": 142763, "epoch": 3399} {"train_loss": -6.718939304351807, "global_step": 142764, "epoch": 3399} {"train_loss": -6.802626609802246, "global_step": 142765, "epoch": 3399} {"train_loss": -6.9225263595581055, "global_step": 142766, "epoch": 3399} {"train_loss": -6.812589645385742, "global_step": 142767, "epoch": 3399} {"train_loss": -6.724740505218506, "global_step": 142768, "epoch": 3399} {"train_loss": -6.887462615966797, "global_step": 142769, "epoch": 3399} {"train_loss": -6.922879695892334, "global_step": 142770, "epoch": 3399} {"train_loss": -6.7789788246154785, "global_step": 142771, "epoch": 3399} {"train_loss": -6.802285194396973, "global_step": 142772, "epoch": 3399} {"train_loss": -6.7751359939575195, "global_step": 142773, "epoch": 3399} {"train_loss": -6.781519412994385, "global_step": 142774, "epoch": 3399} {"train_loss": -6.800863265991211, "global_step": 142775, "epoch": 3399} {"train_loss": -6.808897972106934, "global_step": 142776, "epoch": 3399} {"train_loss": -6.880219459533691, "global_step": 142777, "epoch": 3399} {"train_loss": -6.83098030090332, "global_step": 142778, "epoch": 3399} {"train_loss": -6.829421043395996, "global_step": 142779, "epoch": 3399} {"train_loss": -6.816779136657715, "global_step": 142780, "epoch": 3399} {"train_loss": -6.7112579345703125, "global_step": 142781, "epoch": 3399} {"train_loss": -6.766670227050781, "global_step": 142782, "epoch": 3399} {"train_loss": -6.896178245544434, "global_step": 142783, "epoch": 3399} {"train_loss": -6.82896614074707, "global_step": 142784, "epoch": 3399} {"train_loss": -6.758513927459717, "global_step": 142785, "epoch": 3399} {"train_loss": -6.769765853881836, "global_step": 142786, "epoch": 3399} {"train_loss": -6.832278251647949, "global_step": 142787, "epoch": 3399} {"train_loss": -6.839471817016602, "global_step": 142788, "epoch": 3399} {"train_loss": -6.802584648132324, "global_step": 142789, "epoch": 3399} {"train_loss": -6.86962366104126, "global_step": 142790, "epoch": 3399} {"train_loss": -6.921673774719238, "global_step": 142791, "epoch": 3399} {"train_loss": -6.8021039962768555, "global_step": 142792, "epoch": 3399} {"train_loss": -6.741264820098877, "global_step": 142793, "epoch": 3399} {"train_loss": -6.588924884796143, "global_step": 142794, "epoch": 3399} {"train_loss": -6.68431282043457, "global_step": 142795, "epoch": 3399} {"train_loss": -6.799623489379883, "global_step": 142796, "epoch": 3399} {"train_loss": -6.793150424957275, "global_step": 142797, "epoch": 3399} {"train_loss": -6.913661003112793, "global_step": 142798, "epoch": 3399} {"train_loss": -6.799572762988863, "global_step": 142799, "epoch": 3399, "val_loss": 78386.234375} {"train_loss": -6.742422103881836, "global_step": 142800, "epoch": 3400} {"train_loss": -6.781366348266602, "global_step": 142801, "epoch": 3400} {"train_loss": -6.6163649559021, "global_step": 142802, "epoch": 3400} {"train_loss": -6.759124279022217, "global_step": 142803, "epoch": 3400} {"train_loss": -6.900483131408691, "global_step": 142804, "epoch": 3400} {"train_loss": -6.7186126708984375, "global_step": 142805, "epoch": 3400} {"train_loss": -6.773623466491699, "global_step": 142806, "epoch": 3400} {"train_loss": -6.781907081604004, "global_step": 142807, "epoch": 3400} {"train_loss": -6.647242546081543, "global_step": 142808, "epoch": 3400} {"train_loss": -6.722525596618652, "global_step": 142809, "epoch": 3400} {"train_loss": -6.737658500671387, "global_step": 142810, "epoch": 3400} {"train_loss": -6.640406608581543, "global_step": 142811, "epoch": 3400} {"train_loss": -6.745645523071289, "global_step": 142812, "epoch": 3400} {"train_loss": -6.785764694213867, "global_step": 142813, "epoch": 3400} {"train_loss": -6.790584564208984, "global_step": 142814, "epoch": 3400} {"train_loss": -6.781519889831543, "global_step": 142815, "epoch": 3400} {"train_loss": -6.7014970779418945, "global_step": 142816, "epoch": 3400} {"train_loss": -6.65572452545166, "global_step": 142817, "epoch": 3400} {"train_loss": -6.781374931335449, "global_step": 142818, "epoch": 3400} {"train_loss": -6.825094699859619, "global_step": 142819, "epoch": 3400} {"train_loss": -6.8457183837890625, "global_step": 142820, "epoch": 3400} {"train_loss": -6.706079483032227, "global_step": 142821, "epoch": 3400} {"train_loss": -6.851263046264648, "global_step": 142822, "epoch": 3400} {"train_loss": -6.84055233001709, "global_step": 142823, "epoch": 3400} {"train_loss": -6.899997711181641, "global_step": 142824, "epoch": 3400} {"train_loss": -6.794454574584961, "global_step": 142825, "epoch": 3400} {"train_loss": -6.894845962524414, "global_step": 142826, "epoch": 3400} {"train_loss": -6.749670028686523, "global_step": 142827, "epoch": 3400} {"train_loss": -6.777486801147461, "global_step": 142828, "epoch": 3400} {"train_loss": -6.908374786376953, "global_step": 142829, "epoch": 3400} {"train_loss": -6.819993019104004, "global_step": 142830, "epoch": 3400} {"train_loss": -6.770588397979736, "global_step": 142831, "epoch": 3400} {"train_loss": -6.827890396118164, "global_step": 142832, "epoch": 3400} {"train_loss": -6.910012245178223, "global_step": 142833, "epoch": 3400} {"train_loss": -6.9427900314331055, "global_step": 142834, "epoch": 3400} {"train_loss": -6.84698486328125, "global_step": 142835, "epoch": 3400} {"train_loss": -6.833558082580566, "global_step": 142836, "epoch": 3400} {"train_loss": -6.887866497039795, "global_step": 142837, "epoch": 3400} {"train_loss": -6.726592540740967, "global_step": 142838, "epoch": 3400} {"train_loss": -6.776059627532959, "global_step": 142839, "epoch": 3400} {"train_loss": -6.584766864776611, "global_step": 142840, "epoch": 3400} {"train_loss": -6.782273065476191, "global_step": 142841, "epoch": 3400, "train/sim_max_reward_0": 0.8787755173520515, "train/sim_max_reward_1": 0.9249159960098217, "train/sim_max_reward_2": 0.42964985577907316, "train/sim_max_reward_3": 0.14955672622733462, "train/sim_max_reward_4": 0.5679968579586736, "train/sim_max_reward_5": 0.5699000131403772, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9165571090812739, "test/sim_max_reward_4500003": 0.8458145616406791, "test/sim_max_reward_4500004": 0.9661644518949005, "test/sim_max_reward_4500005": 0.17787084688838206, "test/sim_max_reward_4500006": 0.9586340057421888, "test/sim_max_reward_4500007": 0.7349930916970974, "test/sim_max_reward_4500008": 0.9524779893592851, "test/sim_max_reward_4500009": 0.05349882088801387, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9385656107277304, "test/sim_max_reward_4500012": 0.8729770247813988, "test/sim_max_reward_4500013": 0.0031813553188643254, "test/sim_max_reward_4500014": 0.8685435437608572, "test/sim_max_reward_4500015": 0.9995527020588276, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.040604757988687956, "test/sim_max_reward_4500018": 0.43568662759026855, "test/sim_max_reward_4500019": 0.9518339412586257, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 1.0, "test/sim_max_reward_4500023": 0.6119037195406875, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9084495369569034, "test/sim_max_reward_4500026": 0.8648240109948708, "test/sim_max_reward_4500027": 0.8885774887915384, "test/sim_max_reward_4500028": 0.19581326582344327, "test/sim_max_reward_4500029": 0.05890790935991761, "test/sim_max_reward_4500030": 0.7391483244131304, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.022490944833504358, "test/sim_max_reward_4500034": 0.6952471115885627, "test/sim_max_reward_4500035": 0.8487357717128954, "test/sim_max_reward_4500036": 0.6585165504261926, "test/sim_max_reward_4500037": 0.5915655016454217, "test/sim_max_reward_4500038": 0.31865062505226655, "test/sim_max_reward_4500039": 0.9031651893736993, "test/sim_max_reward_4500040": 0.980488204245411, "test/sim_max_reward_4500041": 0.8838254853243321, "test/sim_max_reward_4500042": 0.011468281611380474, "test/sim_max_reward_4500043": 0.9762675682450327, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.39684293303288354, "test/sim_max_reward_4500046": 0.18738728053389497, "test/sim_max_reward_4500047": 0.9420854181298092, "test/sim_max_reward_4500048": 0.9736578697862974, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5867991610778888, "test/mean_score": 0.54922937459644, "val_loss": 78185.03125} {"train_loss": -6.87186861038208, "global_step": 142842, "epoch": 3401} {"train_loss": -6.692807197570801, "global_step": 142843, "epoch": 3401} {"train_loss": -6.889755725860596, "global_step": 142844, "epoch": 3401} {"train_loss": -6.705193996429443, "global_step": 142845, "epoch": 3401} {"train_loss": -6.604833602905273, "global_step": 142846, "epoch": 3401} {"train_loss": -6.624069690704346, "global_step": 142847, "epoch": 3401} {"train_loss": -6.749181747436523, "global_step": 142848, "epoch": 3401} {"train_loss": -6.868253231048584, "global_step": 142849, "epoch": 3401} {"train_loss": -6.695592880249023, "global_step": 142850, "epoch": 3401} {"train_loss": -6.708218574523926, "global_step": 142851, "epoch": 3401} {"train_loss": -6.80352783203125, "global_step": 142852, "epoch": 3401} {"train_loss": -6.86860990524292, "global_step": 142853, "epoch": 3401} {"train_loss": -6.892848014831543, "global_step": 142854, "epoch": 3401} {"train_loss": -6.69658899307251, "global_step": 142855, "epoch": 3401} {"train_loss": -6.8564934730529785, "global_step": 142856, "epoch": 3401} {"train_loss": -6.882472038269043, "global_step": 142857, "epoch": 3401} {"train_loss": -6.865775108337402, "global_step": 142858, "epoch": 3401} {"train_loss": -6.85304069519043, "global_step": 142859, "epoch": 3401} {"train_loss": -6.795807838439941, "global_step": 142860, "epoch": 3401} {"train_loss": -6.769426345825195, "global_step": 142861, "epoch": 3401} {"train_loss": -6.922850131988525, "global_step": 142862, "epoch": 3401} {"train_loss": -6.7489752769470215, "global_step": 142863, "epoch": 3401} {"train_loss": -6.764629364013672, "global_step": 142864, "epoch": 3401} {"train_loss": -6.9127092361450195, "global_step": 142865, "epoch": 3401} {"train_loss": -6.887696743011475, "global_step": 142866, "epoch": 3401} {"train_loss": -6.874220371246338, "global_step": 142867, "epoch": 3401} {"train_loss": -6.807735443115234, "global_step": 142868, "epoch": 3401} {"train_loss": -6.928057670593262, "global_step": 142869, "epoch": 3401} {"train_loss": -6.788181304931641, "global_step": 142870, "epoch": 3401} {"train_loss": -6.862314224243164, "global_step": 142871, "epoch": 3401} {"train_loss": -6.9028730392456055, "global_step": 142872, "epoch": 3401} {"train_loss": -6.79695987701416, "global_step": 142873, "epoch": 3401} {"train_loss": -6.963224411010742, "global_step": 142874, "epoch": 3401} {"train_loss": -6.777510166168213, "global_step": 142875, "epoch": 3401} {"train_loss": -6.708208084106445, "global_step": 142876, "epoch": 3401} {"train_loss": -6.7881340980529785, "global_step": 142877, "epoch": 3401} {"train_loss": -6.867177963256836, "global_step": 142878, "epoch": 3401} {"train_loss": -6.792229652404785, "global_step": 142879, "epoch": 3401} {"train_loss": -6.8717756271362305, "global_step": 142880, "epoch": 3401} {"train_loss": -6.900143623352051, "global_step": 142881, "epoch": 3401} {"train_loss": -6.685130596160889, "global_step": 142882, "epoch": 3401} {"train_loss": -6.8091087227775935, "global_step": 142883, "epoch": 3401, "val_loss": 78150.875} {"train_loss": -6.840826034545898, "global_step": 142884, "epoch": 3402} {"train_loss": -6.739592552185059, "global_step": 142885, "epoch": 3402} {"train_loss": -6.843296051025391, "global_step": 142886, "epoch": 3402} {"train_loss": -6.906599998474121, "global_step": 142887, "epoch": 3402} {"train_loss": -6.886845111846924, "global_step": 142888, "epoch": 3402} {"train_loss": -6.8180832862854, "global_step": 142889, "epoch": 3402} {"train_loss": -6.895168304443359, "global_step": 142890, "epoch": 3402} {"train_loss": -6.867478370666504, "global_step": 142891, "epoch": 3402} {"train_loss": -6.779212951660156, "global_step": 142892, "epoch": 3402} {"train_loss": -6.863285541534424, "global_step": 142893, "epoch": 3402} {"train_loss": -6.962161064147949, "global_step": 142894, "epoch": 3402} {"train_loss": -6.814117431640625, "global_step": 142895, "epoch": 3402} {"train_loss": -6.86915922164917, "global_step": 142896, "epoch": 3402} {"train_loss": -6.719184875488281, "global_step": 142897, "epoch": 3402} {"train_loss": -6.766556739807129, "global_step": 142898, "epoch": 3402} {"train_loss": -6.869299411773682, "global_step": 142899, "epoch": 3402} {"train_loss": -6.724008083343506, "global_step": 142900, "epoch": 3402} {"train_loss": -6.802443504333496, "global_step": 142901, "epoch": 3402} {"train_loss": -6.937075138092041, "global_step": 142902, "epoch": 3402} {"train_loss": -6.716573238372803, "global_step": 142903, "epoch": 3402} {"train_loss": -6.824824333190918, "global_step": 142904, "epoch": 3402} {"train_loss": -6.704286575317383, "global_step": 142905, "epoch": 3402} {"train_loss": -6.782251358032227, "global_step": 142906, "epoch": 3402} {"train_loss": -6.674790859222412, "global_step": 142907, "epoch": 3402} {"train_loss": -6.7588067054748535, "global_step": 142908, "epoch": 3402} {"train_loss": -6.7522664070129395, "global_step": 142909, "epoch": 3402} {"train_loss": -6.735936641693115, "global_step": 142910, "epoch": 3402} {"train_loss": -6.735601902008057, "global_step": 142911, "epoch": 3402} {"train_loss": -6.748345375061035, "global_step": 142912, "epoch": 3402} {"train_loss": -6.756305694580078, "global_step": 142913, "epoch": 3402} {"train_loss": -6.633993148803711, "global_step": 142914, "epoch": 3402} {"train_loss": -6.792349338531494, "global_step": 142915, "epoch": 3402} {"train_loss": -6.6017985343933105, "global_step": 142916, "epoch": 3402} {"train_loss": -6.711287498474121, "global_step": 142917, "epoch": 3402} {"train_loss": -6.722451210021973, "global_step": 142918, "epoch": 3402} {"train_loss": -6.682154178619385, "global_step": 142919, "epoch": 3402} {"train_loss": -6.713226318359375, "global_step": 142920, "epoch": 3402} {"train_loss": -6.6372833251953125, "global_step": 142921, "epoch": 3402} {"train_loss": -6.717956066131592, "global_step": 142922, "epoch": 3402} {"train_loss": -6.6824846267700195, "global_step": 142923, "epoch": 3402} {"train_loss": -6.853845119476318, "global_step": 142924, "epoch": 3402} {"train_loss": -6.775937557220459, "global_step": 142925, "epoch": 3402, "val_loss": 78295.109375} {"train_loss": -6.690101146697998, "global_step": 142926, "epoch": 3403} {"train_loss": -6.86557674407959, "global_step": 142927, "epoch": 3403} {"train_loss": -6.696364402770996, "global_step": 142928, "epoch": 3403} {"train_loss": -6.834352016448975, "global_step": 142929, "epoch": 3403} {"train_loss": -6.739291191101074, "global_step": 142930, "epoch": 3403} {"train_loss": -6.723354816436768, "global_step": 142931, "epoch": 3403} {"train_loss": -6.868404388427734, "global_step": 142932, "epoch": 3403} {"train_loss": -6.818819046020508, "global_step": 142933, "epoch": 3403} {"train_loss": -6.718954086303711, "global_step": 142934, "epoch": 3403} {"train_loss": -6.797495365142822, "global_step": 142935, "epoch": 3403} {"train_loss": -6.735481262207031, "global_step": 142936, "epoch": 3403} {"train_loss": -6.749379634857178, "global_step": 142937, "epoch": 3403} {"train_loss": -6.594616889953613, "global_step": 142938, "epoch": 3403} {"train_loss": -6.776099681854248, "global_step": 142939, "epoch": 3403} {"train_loss": -6.760770320892334, "global_step": 142940, "epoch": 3403} {"train_loss": -6.764545440673828, "global_step": 142941, "epoch": 3403} {"train_loss": -6.689878463745117, "global_step": 142942, "epoch": 3403} {"train_loss": -6.732733249664307, "global_step": 142943, "epoch": 3403} {"train_loss": -6.74470329284668, "global_step": 142944, "epoch": 3403} {"train_loss": -6.694087028503418, "global_step": 142945, "epoch": 3403} {"train_loss": -6.691150665283203, "global_step": 142946, "epoch": 3403} {"train_loss": -6.720950126647949, "global_step": 142947, "epoch": 3403} {"train_loss": -6.7354021072387695, "global_step": 142948, "epoch": 3403} {"train_loss": -6.826624870300293, "global_step": 142949, "epoch": 3403} {"train_loss": -6.740683555603027, "global_step": 142950, "epoch": 3403} {"train_loss": -6.868877410888672, "global_step": 142951, "epoch": 3403} {"train_loss": -6.829536437988281, "global_step": 142952, "epoch": 3403} {"train_loss": -6.643531799316406, "global_step": 142953, "epoch": 3403} {"train_loss": -6.82285213470459, "global_step": 142954, "epoch": 3403} {"train_loss": -6.749424934387207, "global_step": 142955, "epoch": 3403} {"train_loss": -6.842118740081787, "global_step": 142956, "epoch": 3403} {"train_loss": -6.856335639953613, "global_step": 142957, "epoch": 3403} {"train_loss": -6.749788284301758, "global_step": 142958, "epoch": 3403} {"train_loss": -6.800710678100586, "global_step": 142959, "epoch": 3403} {"train_loss": -6.888790130615234, "global_step": 142960, "epoch": 3403} {"train_loss": -6.805522441864014, "global_step": 142961, "epoch": 3403} {"train_loss": -6.751222610473633, "global_step": 142962, "epoch": 3403} {"train_loss": -6.881806373596191, "global_step": 142963, "epoch": 3403} {"train_loss": -6.855923175811768, "global_step": 142964, "epoch": 3403} {"train_loss": -6.9033308029174805, "global_step": 142965, "epoch": 3403} {"train_loss": -6.948802471160889, "global_step": 142966, "epoch": 3403} {"train_loss": -6.7774423985254195, "global_step": 142967, "epoch": 3403, "val_loss": 78575.3359375} {"train_loss": -6.804365158081055, "global_step": 142968, "epoch": 3404} {"train_loss": -6.821883201599121, "global_step": 142969, "epoch": 3404} {"train_loss": -6.838092803955078, "global_step": 142970, "epoch": 3404} {"train_loss": -6.7430901527404785, "global_step": 142971, "epoch": 3404} {"train_loss": -6.773525714874268, "global_step": 142972, "epoch": 3404} {"train_loss": -6.699162006378174, "global_step": 142973, "epoch": 3404} {"train_loss": -6.833641052246094, "global_step": 142974, "epoch": 3404} {"train_loss": -6.702352523803711, "global_step": 142975, "epoch": 3404} {"train_loss": -6.636046886444092, "global_step": 142976, "epoch": 3404} {"train_loss": -6.814737796783447, "global_step": 142977, "epoch": 3404} {"train_loss": -6.517250061035156, "global_step": 142978, "epoch": 3404} {"train_loss": -6.86515998840332, "global_step": 142979, "epoch": 3404} {"train_loss": -6.643832683563232, "global_step": 142980, "epoch": 3404} {"train_loss": -6.663387298583984, "global_step": 142981, "epoch": 3404} {"train_loss": -6.717989444732666, "global_step": 142982, "epoch": 3404} {"train_loss": -6.7724432945251465, "global_step": 142983, "epoch": 3404} {"train_loss": -6.821859836578369, "global_step": 142984, "epoch": 3404} {"train_loss": -6.732454299926758, "global_step": 142985, "epoch": 3404} {"train_loss": -6.716107368469238, "global_step": 142986, "epoch": 3404} {"train_loss": -6.7360944747924805, "global_step": 142987, "epoch": 3404} {"train_loss": -6.798311233520508, "global_step": 142988, "epoch": 3404} {"train_loss": -6.7144575119018555, "global_step": 142989, "epoch": 3404} {"train_loss": -6.8602375984191895, "global_step": 142990, "epoch": 3404} {"train_loss": -6.849177837371826, "global_step": 142991, "epoch": 3404} {"train_loss": -6.740054130554199, "global_step": 142992, "epoch": 3404} {"train_loss": -6.94316291809082, "global_step": 142993, "epoch": 3404} {"train_loss": -6.772642135620117, "global_step": 142994, "epoch": 3404} {"train_loss": -6.836347579956055, "global_step": 142995, "epoch": 3404} {"train_loss": -6.901769161224365, "global_step": 142996, "epoch": 3404} {"train_loss": -6.79058837890625, "global_step": 142997, "epoch": 3404} {"train_loss": -6.791266918182373, "global_step": 142998, "epoch": 3404} {"train_loss": -6.862031936645508, "global_step": 142999, "epoch": 3404} {"train_loss": -6.836456298828125, "global_step": 143000, "epoch": 3404} {"train_loss": -6.75910758972168, "global_step": 143001, "epoch": 3404} {"train_loss": -6.821063995361328, "global_step": 143002, "epoch": 3404} {"train_loss": -6.81772518157959, "global_step": 143003, "epoch": 3404} {"train_loss": -6.842398643493652, "global_step": 143004, "epoch": 3404} {"train_loss": -6.766750812530518, "global_step": 143005, "epoch": 3404} {"train_loss": -6.726658344268799, "global_step": 143006, "epoch": 3404} {"train_loss": -6.680027008056641, "global_step": 143007, "epoch": 3404} {"train_loss": -6.590888023376465, "global_step": 143008, "epoch": 3404} {"train_loss": -6.767510175704956, "global_step": 143009, "epoch": 3404, "val_loss": 78461.375} {"train_loss": -6.834831237792969, "global_step": 143010, "epoch": 3405} {"train_loss": -6.69387149810791, "global_step": 143011, "epoch": 3405} {"train_loss": -6.702245712280273, "global_step": 143012, "epoch": 3405} {"train_loss": -6.593926429748535, "global_step": 143013, "epoch": 3405} {"train_loss": -6.737610816955566, "global_step": 143014, "epoch": 3405} {"train_loss": -6.576326370239258, "global_step": 143015, "epoch": 3405} {"train_loss": -6.628739356994629, "global_step": 143016, "epoch": 3405} {"train_loss": -6.817719459533691, "global_step": 143017, "epoch": 3405} {"train_loss": -6.644131183624268, "global_step": 143018, "epoch": 3405} {"train_loss": -6.779089450836182, "global_step": 143019, "epoch": 3405} {"train_loss": -6.650317192077637, "global_step": 143020, "epoch": 3405} {"train_loss": -6.608478546142578, "global_step": 143021, "epoch": 3405} {"train_loss": -6.714053153991699, "global_step": 143022, "epoch": 3405} {"train_loss": -6.79832649230957, "global_step": 143023, "epoch": 3405} {"train_loss": -6.499587059020996, "global_step": 143024, "epoch": 3405} {"train_loss": -6.847525596618652, "global_step": 143025, "epoch": 3405} {"train_loss": -6.705967426300049, "global_step": 143026, "epoch": 3405} {"train_loss": -6.755383491516113, "global_step": 143027, "epoch": 3405} {"train_loss": -6.833419322967529, "global_step": 143028, "epoch": 3405} {"train_loss": -6.88383150100708, "global_step": 143029, "epoch": 3405} {"train_loss": -6.751793384552002, "global_step": 143030, "epoch": 3405} {"train_loss": -6.91337776184082, "global_step": 143031, "epoch": 3405} {"train_loss": -6.685892105102539, "global_step": 143032, "epoch": 3405} {"train_loss": -6.820043563842773, "global_step": 143033, "epoch": 3405} {"train_loss": -6.746685028076172, "global_step": 143034, "epoch": 3405} {"train_loss": -6.840193271636963, "global_step": 143035, "epoch": 3405} {"train_loss": -6.826204776763916, "global_step": 143036, "epoch": 3405} {"train_loss": -6.719017028808594, "global_step": 143037, "epoch": 3405} {"train_loss": -6.755182266235352, "global_step": 143038, "epoch": 3405} {"train_loss": -6.702495098114014, "global_step": 143039, "epoch": 3405} {"train_loss": -6.889069557189941, "global_step": 143040, "epoch": 3405} {"train_loss": -6.824646472930908, "global_step": 143041, "epoch": 3405} {"train_loss": -6.7681803703308105, "global_step": 143042, "epoch": 3405} {"train_loss": -6.8933563232421875, "global_step": 143043, "epoch": 3405} {"train_loss": -6.875429153442383, "global_step": 143044, "epoch": 3405} {"train_loss": -6.86969518661499, "global_step": 143045, "epoch": 3405} {"train_loss": -6.816751003265381, "global_step": 143046, "epoch": 3405} {"train_loss": -6.755365371704102, "global_step": 143047, "epoch": 3405} {"train_loss": -6.785580635070801, "global_step": 143048, "epoch": 3405} {"train_loss": -6.767805099487305, "global_step": 143049, "epoch": 3405} {"train_loss": -6.724523067474365, "global_step": 143050, "epoch": 3405} {"train_loss": -6.7600321769714355, "global_step": 143051, "epoch": 3405, "val_loss": 78102.6015625} {"train_loss": -6.8135576248168945, "global_step": 143052, "epoch": 3406} {"train_loss": -6.772366523742676, "global_step": 143053, "epoch": 3406} {"train_loss": -6.846453666687012, "global_step": 143054, "epoch": 3406} {"train_loss": -6.798315525054932, "global_step": 143055, "epoch": 3406} {"train_loss": -6.8416666984558105, "global_step": 143056, "epoch": 3406} {"train_loss": -6.819801330566406, "global_step": 143057, "epoch": 3406} {"train_loss": -6.928930759429932, "global_step": 143058, "epoch": 3406} {"train_loss": -6.863997459411621, "global_step": 143059, "epoch": 3406} {"train_loss": -6.899730205535889, "global_step": 143060, "epoch": 3406} {"train_loss": -6.743505954742432, "global_step": 143061, "epoch": 3406} {"train_loss": -6.973705291748047, "global_step": 143062, "epoch": 3406} {"train_loss": -6.7653398513793945, "global_step": 143063, "epoch": 3406} {"train_loss": -6.810702323913574, "global_step": 143064, "epoch": 3406} {"train_loss": -6.8910813331604, "global_step": 143065, "epoch": 3406} {"train_loss": -6.8349480628967285, "global_step": 143066, "epoch": 3406} {"train_loss": -6.883704662322998, "global_step": 143067, "epoch": 3406} {"train_loss": -6.81392765045166, "global_step": 143068, "epoch": 3406} {"train_loss": -6.881747245788574, "global_step": 143069, "epoch": 3406} {"train_loss": -6.923089981079102, "global_step": 143070, "epoch": 3406} {"train_loss": -6.852024078369141, "global_step": 143071, "epoch": 3406} {"train_loss": -6.859339714050293, "global_step": 143072, "epoch": 3406} {"train_loss": -6.760546684265137, "global_step": 143073, "epoch": 3406} {"train_loss": -6.899502754211426, "global_step": 143074, "epoch": 3406} {"train_loss": -6.837376594543457, "global_step": 143075, "epoch": 3406} {"train_loss": -6.727421760559082, "global_step": 143076, "epoch": 3406} {"train_loss": -6.827740669250488, "global_step": 143077, "epoch": 3406} {"train_loss": -6.862940311431885, "global_step": 143078, "epoch": 3406} {"train_loss": -6.681845188140869, "global_step": 143079, "epoch": 3406} {"train_loss": -6.828758239746094, "global_step": 143080, "epoch": 3406} {"train_loss": -6.807130813598633, "global_step": 143081, "epoch": 3406} {"train_loss": -6.766791820526123, "global_step": 143082, "epoch": 3406} {"train_loss": -6.825268745422363, "global_step": 143083, "epoch": 3406} {"train_loss": -6.856540679931641, "global_step": 143084, "epoch": 3406} {"train_loss": -6.783015251159668, "global_step": 143085, "epoch": 3406} {"train_loss": -6.840612888336182, "global_step": 143086, "epoch": 3406} {"train_loss": -6.949197769165039, "global_step": 143087, "epoch": 3406} {"train_loss": -6.796273231506348, "global_step": 143088, "epoch": 3406} {"train_loss": -6.768829345703125, "global_step": 143089, "epoch": 3406} {"train_loss": -6.832700729370117, "global_step": 143090, "epoch": 3406} {"train_loss": -6.890810012817383, "global_step": 143091, "epoch": 3406} {"train_loss": -6.884193420410156, "global_step": 143092, "epoch": 3406} {"train_loss": -6.835977611087618, "global_step": 143093, "epoch": 3406, "val_loss": 78235.359375} {"train_loss": -6.594292640686035, "global_step": 143094, "epoch": 3407} {"train_loss": -6.687331199645996, "global_step": 143095, "epoch": 3407} {"train_loss": -6.941470146179199, "global_step": 143096, "epoch": 3407} {"train_loss": -6.673423767089844, "global_step": 143097, "epoch": 3407} {"train_loss": -6.8705339431762695, "global_step": 143098, "epoch": 3407} {"train_loss": -6.777083396911621, "global_step": 143099, "epoch": 3407} {"train_loss": -6.943811893463135, "global_step": 143100, "epoch": 3407} {"train_loss": -6.761277198791504, "global_step": 143101, "epoch": 3407} {"train_loss": -6.789880752563477, "global_step": 143102, "epoch": 3407} {"train_loss": -6.833642482757568, "global_step": 143103, "epoch": 3407} {"train_loss": -6.702571868896484, "global_step": 143104, "epoch": 3407} {"train_loss": -6.8269195556640625, "global_step": 143105, "epoch": 3407} {"train_loss": -6.767168045043945, "global_step": 143106, "epoch": 3407} {"train_loss": -6.845841407775879, "global_step": 143107, "epoch": 3407} {"train_loss": -6.83226203918457, "global_step": 143108, "epoch": 3407} {"train_loss": -6.84562873840332, "global_step": 143109, "epoch": 3407} {"train_loss": -6.830480575561523, "global_step": 143110, "epoch": 3407} {"train_loss": -6.794287204742432, "global_step": 143111, "epoch": 3407} {"train_loss": -6.839905261993408, "global_step": 143112, "epoch": 3407} {"train_loss": -6.8764495849609375, "global_step": 143113, "epoch": 3407} {"train_loss": -6.860101222991943, "global_step": 143114, "epoch": 3407} {"train_loss": -6.827539920806885, "global_step": 143115, "epoch": 3407} {"train_loss": -6.787796497344971, "global_step": 143116, "epoch": 3407} {"train_loss": -6.912149429321289, "global_step": 143117, "epoch": 3407} {"train_loss": -6.912470817565918, "global_step": 143118, "epoch": 3407} {"train_loss": -6.7853193283081055, "global_step": 143119, "epoch": 3407} {"train_loss": -6.824613094329834, "global_step": 143120, "epoch": 3407} {"train_loss": -6.880364894866943, "global_step": 143121, "epoch": 3407} {"train_loss": -6.870038986206055, "global_step": 143122, "epoch": 3407} {"train_loss": -6.8617048263549805, "global_step": 143123, "epoch": 3407} {"train_loss": -6.854368209838867, "global_step": 143124, "epoch": 3407} {"train_loss": -6.760555744171143, "global_step": 143125, "epoch": 3407} {"train_loss": -6.843229293823242, "global_step": 143126, "epoch": 3407} {"train_loss": -6.827754974365234, "global_step": 143127, "epoch": 3407} {"train_loss": -6.718015670776367, "global_step": 143128, "epoch": 3407} {"train_loss": -6.926348686218262, "global_step": 143129, "epoch": 3407} {"train_loss": -6.773805618286133, "global_step": 143130, "epoch": 3407} {"train_loss": -6.814019203186035, "global_step": 143131, "epoch": 3407} {"train_loss": -6.797959804534912, "global_step": 143132, "epoch": 3407} {"train_loss": -6.83699893951416, "global_step": 143133, "epoch": 3407} {"train_loss": -6.892139911651611, "global_step": 143134, "epoch": 3407} {"train_loss": -6.8163504259926935, "global_step": 143135, "epoch": 3407, "val_loss": 78239.9296875} {"train_loss": -6.851665496826172, "global_step": 143136, "epoch": 3408} {"train_loss": -6.7623186111450195, "global_step": 143137, "epoch": 3408} {"train_loss": -6.739998817443848, "global_step": 143138, "epoch": 3408} {"train_loss": -6.850887298583984, "global_step": 143139, "epoch": 3408} {"train_loss": -6.770751953125, "global_step": 143140, "epoch": 3408} {"train_loss": -6.702836036682129, "global_step": 143141, "epoch": 3408} {"train_loss": -6.880309104919434, "global_step": 143142, "epoch": 3408} {"train_loss": -6.837302207946777, "global_step": 143143, "epoch": 3408} {"train_loss": -6.785712242126465, "global_step": 143144, "epoch": 3408} {"train_loss": -6.6346964836120605, "global_step": 143145, "epoch": 3408} {"train_loss": -6.683277606964111, "global_step": 143146, "epoch": 3408} {"train_loss": -6.835201263427734, "global_step": 143147, "epoch": 3408} {"train_loss": -6.762113571166992, "global_step": 143148, "epoch": 3408} {"train_loss": -6.8814167976379395, "global_step": 143149, "epoch": 3408} {"train_loss": -6.7623796463012695, "global_step": 143150, "epoch": 3408} {"train_loss": -6.923452854156494, "global_step": 143151, "epoch": 3408} {"train_loss": -6.786105155944824, "global_step": 143152, "epoch": 3408} {"train_loss": -6.7766618728637695, "global_step": 143153, "epoch": 3408} {"train_loss": -6.783941268920898, "global_step": 143154, "epoch": 3408} {"train_loss": -6.750991344451904, "global_step": 143155, "epoch": 3408} {"train_loss": -6.738680839538574, "global_step": 143156, "epoch": 3408} {"train_loss": -6.784825325012207, "global_step": 143157, "epoch": 3408} {"train_loss": -6.863024711608887, "global_step": 143158, "epoch": 3408} {"train_loss": -6.702780723571777, "global_step": 143159, "epoch": 3408} {"train_loss": -6.76689338684082, "global_step": 143160, "epoch": 3408} {"train_loss": -6.862190246582031, "global_step": 143161, "epoch": 3408} {"train_loss": -6.701699256896973, "global_step": 143162, "epoch": 3408} {"train_loss": -6.704602241516113, "global_step": 143163, "epoch": 3408} {"train_loss": -6.756694316864014, "global_step": 143164, "epoch": 3408} {"train_loss": -6.83112096786499, "global_step": 143165, "epoch": 3408} {"train_loss": -6.741481781005859, "global_step": 143166, "epoch": 3408} {"train_loss": -6.864619255065918, "global_step": 143167, "epoch": 3408} {"train_loss": -6.939364433288574, "global_step": 143168, "epoch": 3408} {"train_loss": -6.811260223388672, "global_step": 143169, "epoch": 3408} {"train_loss": -6.834980010986328, "global_step": 143170, "epoch": 3408} {"train_loss": -6.7783894538879395, "global_step": 143171, "epoch": 3408} {"train_loss": -6.846351623535156, "global_step": 143172, "epoch": 3408} {"train_loss": -6.718738555908203, "global_step": 143173, "epoch": 3408} {"train_loss": -6.86638069152832, "global_step": 143174, "epoch": 3408} {"train_loss": -6.823948383331299, "global_step": 143175, "epoch": 3408} {"train_loss": -6.8328070640563965, "global_step": 143176, "epoch": 3408} {"train_loss": -6.793947628566197, "global_step": 143177, "epoch": 3408, "val_loss": 78390.8984375} {"train_loss": -6.746222019195557, "global_step": 143178, "epoch": 3409} {"train_loss": -6.778202056884766, "global_step": 143179, "epoch": 3409} {"train_loss": -6.825852870941162, "global_step": 143180, "epoch": 3409} {"train_loss": -6.869900703430176, "global_step": 143181, "epoch": 3409} {"train_loss": -6.772235870361328, "global_step": 143182, "epoch": 3409} {"train_loss": -6.943276405334473, "global_step": 143183, "epoch": 3409} {"train_loss": -6.8103556632995605, "global_step": 143184, "epoch": 3409} {"train_loss": -6.864372253417969, "global_step": 143185, "epoch": 3409} {"train_loss": -6.801340103149414, "global_step": 143186, "epoch": 3409} {"train_loss": -6.833174705505371, "global_step": 143187, "epoch": 3409} {"train_loss": -6.812421798706055, "global_step": 143188, "epoch": 3409} {"train_loss": -6.848684310913086, "global_step": 143189, "epoch": 3409} {"train_loss": -6.82056999206543, "global_step": 143190, "epoch": 3409} {"train_loss": -6.730197906494141, "global_step": 143191, "epoch": 3409} {"train_loss": -6.730309963226318, "global_step": 143192, "epoch": 3409} {"train_loss": -6.895934104919434, "global_step": 143193, "epoch": 3409} {"train_loss": -6.7008514404296875, "global_step": 143194, "epoch": 3409} {"train_loss": -6.770284652709961, "global_step": 143195, "epoch": 3409} {"train_loss": -6.746059417724609, "global_step": 143196, "epoch": 3409} {"train_loss": -6.712094306945801, "global_step": 143197, "epoch": 3409} {"train_loss": -6.756166458129883, "global_step": 143198, "epoch": 3409} {"train_loss": -6.849841117858887, "global_step": 143199, "epoch": 3409} {"train_loss": -6.729488372802734, "global_step": 143200, "epoch": 3409} {"train_loss": -6.722777843475342, "global_step": 143201, "epoch": 3409} {"train_loss": -6.641225814819336, "global_step": 143202, "epoch": 3409} {"train_loss": -6.642300605773926, "global_step": 143203, "epoch": 3409} {"train_loss": -6.625601291656494, "global_step": 143204, "epoch": 3409} {"train_loss": -6.735300064086914, "global_step": 143205, "epoch": 3409} {"train_loss": -6.704237461090088, "global_step": 143206, "epoch": 3409} {"train_loss": -6.894076824188232, "global_step": 143207, "epoch": 3409} {"train_loss": -6.610036849975586, "global_step": 143208, "epoch": 3409} {"train_loss": -6.767192363739014, "global_step": 143209, "epoch": 3409} {"train_loss": -6.715000152587891, "global_step": 143210, "epoch": 3409} {"train_loss": -6.619675159454346, "global_step": 143211, "epoch": 3409} {"train_loss": -6.658881187438965, "global_step": 143212, "epoch": 3409} {"train_loss": -6.747392654418945, "global_step": 143213, "epoch": 3409} {"train_loss": -6.808501720428467, "global_step": 143214, "epoch": 3409} {"train_loss": -6.659589767456055, "global_step": 143215, "epoch": 3409} {"train_loss": -6.757512092590332, "global_step": 143216, "epoch": 3409} {"train_loss": -6.582582950592041, "global_step": 143217, "epoch": 3409} {"train_loss": -6.697883605957031, "global_step": 143218, "epoch": 3409} {"train_loss": -6.754517646062942, "global_step": 143219, "epoch": 3409, "val_loss": 78519.2578125} {"train_loss": -6.750662803649902, "global_step": 143220, "epoch": 3410} {"train_loss": -6.727219581604004, "global_step": 143221, "epoch": 3410} {"train_loss": -6.77085018157959, "global_step": 143222, "epoch": 3410} {"train_loss": -6.898095607757568, "global_step": 143223, "epoch": 3410} {"train_loss": -6.704642295837402, "global_step": 143224, "epoch": 3410} {"train_loss": -6.779791355133057, "global_step": 143225, "epoch": 3410} {"train_loss": -6.744787216186523, "global_step": 143226, "epoch": 3410} {"train_loss": -6.692873477935791, "global_step": 143227, "epoch": 3410} {"train_loss": -6.89117431640625, "global_step": 143228, "epoch": 3410} {"train_loss": -6.649129867553711, "global_step": 143229, "epoch": 3410} {"train_loss": -6.869311332702637, "global_step": 143230, "epoch": 3410} {"train_loss": -6.722886562347412, "global_step": 143231, "epoch": 3410} {"train_loss": -6.654352188110352, "global_step": 143232, "epoch": 3410} {"train_loss": -6.800528049468994, "global_step": 143233, "epoch": 3410} {"train_loss": -6.709883213043213, "global_step": 143234, "epoch": 3410} {"train_loss": -6.681401252746582, "global_step": 143235, "epoch": 3410} {"train_loss": -6.82069206237793, "global_step": 143236, "epoch": 3410} {"train_loss": -6.822671890258789, "global_step": 143237, "epoch": 3410} {"train_loss": -6.776017665863037, "global_step": 143238, "epoch": 3410} {"train_loss": -6.682271480560303, "global_step": 143239, "epoch": 3410} {"train_loss": -6.831330299377441, "global_step": 143240, "epoch": 3410} {"train_loss": -6.744861602783203, "global_step": 143241, "epoch": 3410} {"train_loss": -6.53270149230957, "global_step": 143242, "epoch": 3410} {"train_loss": -6.836668968200684, "global_step": 143243, "epoch": 3410} {"train_loss": -6.719754695892334, "global_step": 143244, "epoch": 3410} {"train_loss": -6.539572715759277, "global_step": 143245, "epoch": 3410} {"train_loss": -6.703985214233398, "global_step": 143246, "epoch": 3410} {"train_loss": -6.694193363189697, "global_step": 143247, "epoch": 3410} {"train_loss": -6.67989444732666, "global_step": 143248, "epoch": 3410} {"train_loss": -6.737146377563477, "global_step": 143249, "epoch": 3410} {"train_loss": -6.562198638916016, "global_step": 143250, "epoch": 3410} {"train_loss": -6.7258148193359375, "global_step": 143251, "epoch": 3410} {"train_loss": -6.743302822113037, "global_step": 143252, "epoch": 3410} {"train_loss": -6.768723011016846, "global_step": 143253, "epoch": 3410} {"train_loss": -6.80354118347168, "global_step": 143254, "epoch": 3410} {"train_loss": -6.759242534637451, "global_step": 143255, "epoch": 3410} {"train_loss": -6.8448333740234375, "global_step": 143256, "epoch": 3410} {"train_loss": -6.876218795776367, "global_step": 143257, "epoch": 3410} {"train_loss": -6.811251640319824, "global_step": 143258, "epoch": 3410} {"train_loss": -6.798579216003418, "global_step": 143259, "epoch": 3410} {"train_loss": -6.748638153076172, "global_step": 143260, "epoch": 3410} {"train_loss": -6.748437552225022, "global_step": 143261, "epoch": 3410, "val_loss": 78197.2734375} {"train_loss": -6.845559120178223, "global_step": 143262, "epoch": 3411} {"train_loss": -6.656173229217529, "global_step": 143263, "epoch": 3411} {"train_loss": -6.8352766036987305, "global_step": 143264, "epoch": 3411} {"train_loss": -6.722925186157227, "global_step": 143265, "epoch": 3411} {"train_loss": -6.806639671325684, "global_step": 143266, "epoch": 3411} {"train_loss": -6.8646721839904785, "global_step": 143267, "epoch": 3411} {"train_loss": -6.724116325378418, "global_step": 143268, "epoch": 3411} {"train_loss": -6.924454689025879, "global_step": 143269, "epoch": 3411} {"train_loss": -6.822575569152832, "global_step": 143270, "epoch": 3411} {"train_loss": -6.7580180168151855, "global_step": 143271, "epoch": 3411} {"train_loss": -6.712138652801514, "global_step": 143272, "epoch": 3411} {"train_loss": -6.843633651733398, "global_step": 143273, "epoch": 3411} {"train_loss": -6.75337028503418, "global_step": 143274, "epoch": 3411} {"train_loss": -6.746246814727783, "global_step": 143275, "epoch": 3411} {"train_loss": -6.86785888671875, "global_step": 143276, "epoch": 3411} {"train_loss": -6.774731636047363, "global_step": 143277, "epoch": 3411} {"train_loss": -6.658287525177002, "global_step": 143278, "epoch": 3411} {"train_loss": -6.76541805267334, "global_step": 143279, "epoch": 3411} {"train_loss": -6.860992431640625, "global_step": 143280, "epoch": 3411} {"train_loss": -6.745016574859619, "global_step": 143281, "epoch": 3411} {"train_loss": -6.838501453399658, "global_step": 143282, "epoch": 3411} {"train_loss": -6.840213298797607, "global_step": 143283, "epoch": 3411} {"train_loss": -6.777244567871094, "global_step": 143284, "epoch": 3411} {"train_loss": -6.791729927062988, "global_step": 143285, "epoch": 3411} {"train_loss": -6.736117362976074, "global_step": 143286, "epoch": 3411} {"train_loss": -6.805120468139648, "global_step": 143287, "epoch": 3411} {"train_loss": -6.9567646980285645, "global_step": 143288, "epoch": 3411} {"train_loss": -6.689985275268555, "global_step": 143289, "epoch": 3411} {"train_loss": -6.870241165161133, "global_step": 143290, "epoch": 3411} {"train_loss": -6.851030349731445, "global_step": 143291, "epoch": 3411} {"train_loss": -6.804853439331055, "global_step": 143292, "epoch": 3411} {"train_loss": -6.738410949707031, "global_step": 143293, "epoch": 3411} {"train_loss": -6.770694732666016, "global_step": 143294, "epoch": 3411} {"train_loss": -6.7839155197143555, "global_step": 143295, "epoch": 3411} {"train_loss": -6.823144912719727, "global_step": 143296, "epoch": 3411} {"train_loss": -6.856754779815674, "global_step": 143297, "epoch": 3411} {"train_loss": -6.735193252563477, "global_step": 143298, "epoch": 3411} {"train_loss": -6.725491523742676, "global_step": 143299, "epoch": 3411} {"train_loss": -6.674056053161621, "global_step": 143300, "epoch": 3411} {"train_loss": -6.65696382522583, "global_step": 143301, "epoch": 3411} {"train_loss": -6.6421661376953125, "global_step": 143302, "epoch": 3411} {"train_loss": -6.7826454639434814, "global_step": 143303, "epoch": 3411, "val_loss": 78261.0859375} {"train_loss": -6.681803226470947, "global_step": 143304, "epoch": 3412} {"train_loss": -6.850463390350342, "global_step": 143305, "epoch": 3412} {"train_loss": -6.682454586029053, "global_step": 143306, "epoch": 3412} {"train_loss": -6.698690414428711, "global_step": 143307, "epoch": 3412} {"train_loss": -6.704690456390381, "global_step": 143308, "epoch": 3412} {"train_loss": -6.6500935554504395, "global_step": 143309, "epoch": 3412} {"train_loss": -6.851055145263672, "global_step": 143310, "epoch": 3412} {"train_loss": -6.676449775695801, "global_step": 143311, "epoch": 3412} {"train_loss": -6.747251033782959, "global_step": 143312, "epoch": 3412} {"train_loss": -6.670574188232422, "global_step": 143313, "epoch": 3412} {"train_loss": -6.808282375335693, "global_step": 143314, "epoch": 3412} {"train_loss": -6.737048625946045, "global_step": 143315, "epoch": 3412} {"train_loss": -6.800398826599121, "global_step": 143316, "epoch": 3412} {"train_loss": -6.876418113708496, "global_step": 143317, "epoch": 3412} {"train_loss": -6.739272117614746, "global_step": 143318, "epoch": 3412} {"train_loss": -6.831600189208984, "global_step": 143319, "epoch": 3412} {"train_loss": -6.857126712799072, "global_step": 143320, "epoch": 3412} {"train_loss": -6.7382636070251465, "global_step": 143321, "epoch": 3412} {"train_loss": -6.9093217849731445, "global_step": 143322, "epoch": 3412} {"train_loss": -6.731639862060547, "global_step": 143323, "epoch": 3412} {"train_loss": -6.757349491119385, "global_step": 143324, "epoch": 3412} {"train_loss": -6.761264801025391, "global_step": 143325, "epoch": 3412} {"train_loss": -6.853787422180176, "global_step": 143326, "epoch": 3412} {"train_loss": -6.80818510055542, "global_step": 143327, "epoch": 3412} {"train_loss": -6.857563018798828, "global_step": 143328, "epoch": 3412} {"train_loss": -6.848682403564453, "global_step": 143329, "epoch": 3412} {"train_loss": -6.790234088897705, "global_step": 143330, "epoch": 3412} {"train_loss": -6.897507667541504, "global_step": 143331, "epoch": 3412} {"train_loss": -6.749969482421875, "global_step": 143332, "epoch": 3412} {"train_loss": -6.847917556762695, "global_step": 143333, "epoch": 3412} {"train_loss": -6.842404365539551, "global_step": 143334, "epoch": 3412} {"train_loss": -6.751962184906006, "global_step": 143335, "epoch": 3412} {"train_loss": -6.830602645874023, "global_step": 143336, "epoch": 3412} {"train_loss": -6.821998596191406, "global_step": 143337, "epoch": 3412} {"train_loss": -6.8133463859558105, "global_step": 143338, "epoch": 3412} {"train_loss": -6.815354347229004, "global_step": 143339, "epoch": 3412} {"train_loss": -6.782376766204834, "global_step": 143340, "epoch": 3412} {"train_loss": -6.742035388946533, "global_step": 143341, "epoch": 3412} {"train_loss": -6.67512321472168, "global_step": 143342, "epoch": 3412} {"train_loss": -6.856596946716309, "global_step": 143343, "epoch": 3412} {"train_loss": -6.806124687194824, "global_step": 143344, "epoch": 3412} {"train_loss": -6.782242059707642, "global_step": 143345, "epoch": 3412, "val_loss": 78076.3984375} {"train_loss": -6.836309909820557, "global_step": 143346, "epoch": 3413} {"train_loss": -6.704239845275879, "global_step": 143347, "epoch": 3413} {"train_loss": -6.736577033996582, "global_step": 143348, "epoch": 3413} {"train_loss": -6.73109245300293, "global_step": 143349, "epoch": 3413} {"train_loss": -6.806697368621826, "global_step": 143350, "epoch": 3413} {"train_loss": -6.632349967956543, "global_step": 143351, "epoch": 3413} {"train_loss": -6.903268814086914, "global_step": 143352, "epoch": 3413} {"train_loss": -6.564179420471191, "global_step": 143353, "epoch": 3413} {"train_loss": -6.734427452087402, "global_step": 143354, "epoch": 3413} {"train_loss": -6.795901298522949, "global_step": 143355, "epoch": 3413} {"train_loss": -6.724261283874512, "global_step": 143356, "epoch": 3413} {"train_loss": -6.843094348907471, "global_step": 143357, "epoch": 3413} {"train_loss": -6.7294464111328125, "global_step": 143358, "epoch": 3413} {"train_loss": -6.69230842590332, "global_step": 143359, "epoch": 3413} {"train_loss": -6.8013458251953125, "global_step": 143360, "epoch": 3413} {"train_loss": -6.737321853637695, "global_step": 143361, "epoch": 3413} {"train_loss": -6.80556583404541, "global_step": 143362, "epoch": 3413} {"train_loss": -6.886082172393799, "global_step": 143363, "epoch": 3413} {"train_loss": -6.827045440673828, "global_step": 143364, "epoch": 3413} {"train_loss": -6.814304351806641, "global_step": 143365, "epoch": 3413} {"train_loss": -6.839057922363281, "global_step": 143366, "epoch": 3413} {"train_loss": -6.741274356842041, "global_step": 143367, "epoch": 3413} {"train_loss": -6.8728485107421875, "global_step": 143368, "epoch": 3413} {"train_loss": -6.8160200119018555, "global_step": 143369, "epoch": 3413} {"train_loss": -6.852115154266357, "global_step": 143370, "epoch": 3413} {"train_loss": -6.852017402648926, "global_step": 143371, "epoch": 3413} {"train_loss": -6.788332462310791, "global_step": 143372, "epoch": 3413} {"train_loss": -6.736143112182617, "global_step": 143373, "epoch": 3413} {"train_loss": -6.62496280670166, "global_step": 143374, "epoch": 3413} {"train_loss": -6.541086196899414, "global_step": 143375, "epoch": 3413} {"train_loss": -6.9427032470703125, "global_step": 143376, "epoch": 3413} {"train_loss": -6.733282566070557, "global_step": 143377, "epoch": 3413} {"train_loss": -6.720952033996582, "global_step": 143378, "epoch": 3413} {"train_loss": -6.8150129318237305, "global_step": 143379, "epoch": 3413} {"train_loss": -6.778936386108398, "global_step": 143380, "epoch": 3413} {"train_loss": -6.782217025756836, "global_step": 143381, "epoch": 3413} {"train_loss": -6.714178085327148, "global_step": 143382, "epoch": 3413} {"train_loss": -6.859180927276611, "global_step": 143383, "epoch": 3413} {"train_loss": -6.873821258544922, "global_step": 143384, "epoch": 3413} {"train_loss": -6.5868611335754395, "global_step": 143385, "epoch": 3413} {"train_loss": -6.807085037231445, "global_step": 143386, "epoch": 3413} {"train_loss": -6.7702598458244685, "global_step": 143387, "epoch": 3413, "val_loss": 78134.7578125} {"train_loss": -6.813830852508545, "global_step": 143388, "epoch": 3414} {"train_loss": -6.752837657928467, "global_step": 143389, "epoch": 3414} {"train_loss": -6.864118576049805, "global_step": 143390, "epoch": 3414} {"train_loss": -6.939243316650391, "global_step": 143391, "epoch": 3414} {"train_loss": -6.7641425132751465, "global_step": 143392, "epoch": 3414} {"train_loss": -6.864838123321533, "global_step": 143393, "epoch": 3414} {"train_loss": -6.864233016967773, "global_step": 143394, "epoch": 3414} {"train_loss": -6.908878326416016, "global_step": 143395, "epoch": 3414} {"train_loss": -6.793354034423828, "global_step": 143396, "epoch": 3414} {"train_loss": -6.846368312835693, "global_step": 143397, "epoch": 3414} {"train_loss": -6.807246685028076, "global_step": 143398, "epoch": 3414} {"train_loss": -6.878052711486816, "global_step": 143399, "epoch": 3414} {"train_loss": -6.842619895935059, "global_step": 143400, "epoch": 3414} {"train_loss": -6.846638202667236, "global_step": 143401, "epoch": 3414} {"train_loss": -6.738547325134277, "global_step": 143402, "epoch": 3414} {"train_loss": -6.968859672546387, "global_step": 143403, "epoch": 3414} {"train_loss": -6.82690954208374, "global_step": 143404, "epoch": 3414} {"train_loss": -6.872668266296387, "global_step": 143405, "epoch": 3414} {"train_loss": -6.812497138977051, "global_step": 143406, "epoch": 3414} {"train_loss": -6.884031295776367, "global_step": 143407, "epoch": 3414} {"train_loss": -6.802475929260254, "global_step": 143408, "epoch": 3414} {"train_loss": -6.762955665588379, "global_step": 143409, "epoch": 3414} {"train_loss": -6.806353569030762, "global_step": 143410, "epoch": 3414} {"train_loss": -6.6266608238220215, "global_step": 143411, "epoch": 3414} {"train_loss": -6.7823896408081055, "global_step": 143412, "epoch": 3414} {"train_loss": -6.871533393859863, "global_step": 143413, "epoch": 3414} {"train_loss": -6.815624237060547, "global_step": 143414, "epoch": 3414} {"train_loss": -6.793375015258789, "global_step": 143415, "epoch": 3414} {"train_loss": -6.761107921600342, "global_step": 143416, "epoch": 3414} {"train_loss": -6.753069877624512, "global_step": 143417, "epoch": 3414} {"train_loss": -6.741574287414551, "global_step": 143418, "epoch": 3414} {"train_loss": -6.801910877227783, "global_step": 143419, "epoch": 3414} {"train_loss": -6.674566268920898, "global_step": 143420, "epoch": 3414} {"train_loss": -6.809506893157959, "global_step": 143421, "epoch": 3414} {"train_loss": -6.700550079345703, "global_step": 143422, "epoch": 3414} {"train_loss": -6.681829452514648, "global_step": 143423, "epoch": 3414} {"train_loss": -6.74790096282959, "global_step": 143424, "epoch": 3414} {"train_loss": -6.733280181884766, "global_step": 143425, "epoch": 3414} {"train_loss": -6.848978042602539, "global_step": 143426, "epoch": 3414} {"train_loss": -6.7834954261779785, "global_step": 143427, "epoch": 3414} {"train_loss": -6.761299133300781, "global_step": 143428, "epoch": 3414} {"train_loss": -6.8023135889144175, "global_step": 143429, "epoch": 3414, "val_loss": 78626.71875} {"train_loss": -6.569519996643066, "global_step": 143430, "epoch": 3415} {"train_loss": -6.723083019256592, "global_step": 143431, "epoch": 3415} {"train_loss": -6.6738786697387695, "global_step": 143432, "epoch": 3415} {"train_loss": -6.603859901428223, "global_step": 143433, "epoch": 3415} {"train_loss": -6.857312202453613, "global_step": 143434, "epoch": 3415} {"train_loss": -6.641119956970215, "global_step": 143435, "epoch": 3415} {"train_loss": -6.801331520080566, "global_step": 143436, "epoch": 3415} {"train_loss": -6.709268093109131, "global_step": 143437, "epoch": 3415} {"train_loss": -6.647114276885986, "global_step": 143438, "epoch": 3415} {"train_loss": -6.730776786804199, "global_step": 143439, "epoch": 3415} {"train_loss": -6.749597549438477, "global_step": 143440, "epoch": 3415} {"train_loss": -6.704518795013428, "global_step": 143441, "epoch": 3415} {"train_loss": -6.758281707763672, "global_step": 143442, "epoch": 3415} {"train_loss": -6.660308837890625, "global_step": 143443, "epoch": 3415} {"train_loss": -6.719599723815918, "global_step": 143444, "epoch": 3415} {"train_loss": -6.8172149658203125, "global_step": 143445, "epoch": 3415} {"train_loss": -6.808102607727051, "global_step": 143446, "epoch": 3415} {"train_loss": -6.8307881355285645, "global_step": 143447, "epoch": 3415} {"train_loss": -6.729273796081543, "global_step": 143448, "epoch": 3415} {"train_loss": -6.7830424308776855, "global_step": 143449, "epoch": 3415} {"train_loss": -6.697155952453613, "global_step": 143450, "epoch": 3415} {"train_loss": -6.876676559448242, "global_step": 143451, "epoch": 3415} {"train_loss": -6.732686519622803, "global_step": 143452, "epoch": 3415} {"train_loss": -6.826205253601074, "global_step": 143453, "epoch": 3415} {"train_loss": -6.853585720062256, "global_step": 143454, "epoch": 3415} {"train_loss": -6.738894462585449, "global_step": 143455, "epoch": 3415} {"train_loss": -6.780101776123047, "global_step": 143456, "epoch": 3415} {"train_loss": -6.792752265930176, "global_step": 143457, "epoch": 3415} {"train_loss": -6.753806114196777, "global_step": 143458, "epoch": 3415} {"train_loss": -6.731748580932617, "global_step": 143459, "epoch": 3415} {"train_loss": -6.8756585121154785, "global_step": 143460, "epoch": 3415} {"train_loss": -6.810359477996826, "global_step": 143461, "epoch": 3415} {"train_loss": -6.847776412963867, "global_step": 143462, "epoch": 3415} {"train_loss": -6.8955888748168945, "global_step": 143463, "epoch": 3415} {"train_loss": -6.7276153564453125, "global_step": 143464, "epoch": 3415} {"train_loss": -6.796271800994873, "global_step": 143465, "epoch": 3415} {"train_loss": -6.83918571472168, "global_step": 143466, "epoch": 3415} {"train_loss": -6.802295207977295, "global_step": 143467, "epoch": 3415} {"train_loss": -6.821493148803711, "global_step": 143468, "epoch": 3415} {"train_loss": -6.753542900085449, "global_step": 143469, "epoch": 3415} {"train_loss": -6.83070182800293, "global_step": 143470, "epoch": 3415} {"train_loss": -6.765369653701782, "global_step": 143471, "epoch": 3415, "val_loss": 78178.8203125} {"train_loss": -6.789085865020752, "global_step": 143472, "epoch": 3416} {"train_loss": -6.859343528747559, "global_step": 143473, "epoch": 3416} {"train_loss": -6.85092830657959, "global_step": 143474, "epoch": 3416} {"train_loss": -6.805310249328613, "global_step": 143475, "epoch": 3416} {"train_loss": -6.714174270629883, "global_step": 143476, "epoch": 3416} {"train_loss": -6.694828033447266, "global_step": 143477, "epoch": 3416} {"train_loss": -6.839055061340332, "global_step": 143478, "epoch": 3416} {"train_loss": -6.845925331115723, "global_step": 143479, "epoch": 3416} {"train_loss": -6.804533958435059, "global_step": 143480, "epoch": 3416} {"train_loss": -6.9109649658203125, "global_step": 143481, "epoch": 3416} {"train_loss": -6.717846870422363, "global_step": 143482, "epoch": 3416} {"train_loss": -6.746218204498291, "global_step": 143483, "epoch": 3416} {"train_loss": -6.862495422363281, "global_step": 143484, "epoch": 3416} {"train_loss": -6.843585014343262, "global_step": 143485, "epoch": 3416} {"train_loss": -6.719328880310059, "global_step": 143486, "epoch": 3416} {"train_loss": -6.754265785217285, "global_step": 143487, "epoch": 3416} {"train_loss": -6.844106674194336, "global_step": 143488, "epoch": 3416} {"train_loss": -6.868475437164307, "global_step": 143489, "epoch": 3416} {"train_loss": -6.82173490524292, "global_step": 143490, "epoch": 3416} {"train_loss": -6.8273115158081055, "global_step": 143491, "epoch": 3416} {"train_loss": -6.809594631195068, "global_step": 143492, "epoch": 3416} {"train_loss": -6.797124862670898, "global_step": 143493, "epoch": 3416} {"train_loss": -6.826412200927734, "global_step": 143494, "epoch": 3416} {"train_loss": -6.768759727478027, "global_step": 143495, "epoch": 3416} {"train_loss": -6.692868709564209, "global_step": 143496, "epoch": 3416} {"train_loss": -6.788442611694336, "global_step": 143497, "epoch": 3416} {"train_loss": -6.685115337371826, "global_step": 143498, "epoch": 3416} {"train_loss": -6.665848731994629, "global_step": 143499, "epoch": 3416} {"train_loss": -6.947072982788086, "global_step": 143500, "epoch": 3416} {"train_loss": -6.678680896759033, "global_step": 143501, "epoch": 3416} {"train_loss": -6.745388984680176, "global_step": 143502, "epoch": 3416} {"train_loss": -6.684976577758789, "global_step": 143503, "epoch": 3416} {"train_loss": -6.701956272125244, "global_step": 143504, "epoch": 3416} {"train_loss": -6.660140037536621, "global_step": 143505, "epoch": 3416} {"train_loss": -6.7934699058532715, "global_step": 143506, "epoch": 3416} {"train_loss": -6.854546070098877, "global_step": 143507, "epoch": 3416} {"train_loss": -6.688474655151367, "global_step": 143508, "epoch": 3416} {"train_loss": -6.651476860046387, "global_step": 143509, "epoch": 3416} {"train_loss": -6.638645172119141, "global_step": 143510, "epoch": 3416} {"train_loss": -6.645375728607178, "global_step": 143511, "epoch": 3416} {"train_loss": -6.739014625549316, "global_step": 143512, "epoch": 3416} {"train_loss": -6.769072305588495, "global_step": 143513, "epoch": 3416, "val_loss": 78326.0625} {"train_loss": -6.832512855529785, "global_step": 143514, "epoch": 3417} {"train_loss": -6.609075546264648, "global_step": 143515, "epoch": 3417} {"train_loss": -6.850290298461914, "global_step": 143516, "epoch": 3417} {"train_loss": -6.715427398681641, "global_step": 143517, "epoch": 3417} {"train_loss": -6.805170059204102, "global_step": 143518, "epoch": 3417} {"train_loss": -6.647073745727539, "global_step": 143519, "epoch": 3417} {"train_loss": -6.601471900939941, "global_step": 143520, "epoch": 3417} {"train_loss": -6.8508405685424805, "global_step": 143521, "epoch": 3417} {"train_loss": -6.680935859680176, "global_step": 143522, "epoch": 3417} {"train_loss": -6.847680568695068, "global_step": 143523, "epoch": 3417} {"train_loss": -6.586992263793945, "global_step": 143524, "epoch": 3417} {"train_loss": -6.822029113769531, "global_step": 143525, "epoch": 3417} {"train_loss": -6.683664321899414, "global_step": 143526, "epoch": 3417} {"train_loss": -6.883822441101074, "global_step": 143527, "epoch": 3417} {"train_loss": -6.737860202789307, "global_step": 143528, "epoch": 3417} {"train_loss": -6.804656982421875, "global_step": 143529, "epoch": 3417} {"train_loss": -6.750918388366699, "global_step": 143530, "epoch": 3417} {"train_loss": -6.804051399230957, "global_step": 143531, "epoch": 3417} {"train_loss": -6.749593734741211, "global_step": 143532, "epoch": 3417} {"train_loss": -6.726268768310547, "global_step": 143533, "epoch": 3417} {"train_loss": -6.701655864715576, "global_step": 143534, "epoch": 3417} {"train_loss": -6.700838088989258, "global_step": 143535, "epoch": 3417} {"train_loss": -6.73745059967041, "global_step": 143536, "epoch": 3417} {"train_loss": -6.9056501388549805, "global_step": 143537, "epoch": 3417} {"train_loss": -6.796231746673584, "global_step": 143538, "epoch": 3417} {"train_loss": -6.765417098999023, "global_step": 143539, "epoch": 3417} {"train_loss": -6.788486003875732, "global_step": 143540, "epoch": 3417} {"train_loss": -6.70767879486084, "global_step": 143541, "epoch": 3417} {"train_loss": -6.811211109161377, "global_step": 143542, "epoch": 3417} {"train_loss": -6.791402816772461, "global_step": 143543, "epoch": 3417} {"train_loss": -6.8479695320129395, "global_step": 143544, "epoch": 3417} {"train_loss": -6.872780799865723, "global_step": 143545, "epoch": 3417} {"train_loss": -6.836945533752441, "global_step": 143546, "epoch": 3417} {"train_loss": -6.7762956619262695, "global_step": 143547, "epoch": 3417} {"train_loss": -6.815085411071777, "global_step": 143548, "epoch": 3417} {"train_loss": -6.707916736602783, "global_step": 143549, "epoch": 3417} {"train_loss": -6.829439163208008, "global_step": 143550, "epoch": 3417} {"train_loss": -6.74118185043335, "global_step": 143551, "epoch": 3417} {"train_loss": -6.863157749176025, "global_step": 143552, "epoch": 3417} {"train_loss": -6.760473251342773, "global_step": 143553, "epoch": 3417} {"train_loss": -6.940803050994873, "global_step": 143554, "epoch": 3417} {"train_loss": -6.771918353580293, "global_step": 143555, "epoch": 3417, "val_loss": 78437.59375} {"train_loss": -6.850769519805908, "global_step": 143556, "epoch": 3418} {"train_loss": -6.724822044372559, "global_step": 143557, "epoch": 3418} {"train_loss": -6.825301170349121, "global_step": 143558, "epoch": 3418} {"train_loss": -6.829456329345703, "global_step": 143559, "epoch": 3418} {"train_loss": -6.880856037139893, "global_step": 143560, "epoch": 3418} {"train_loss": -6.720447540283203, "global_step": 143561, "epoch": 3418} {"train_loss": -6.917908668518066, "global_step": 143562, "epoch": 3418} {"train_loss": -6.689064979553223, "global_step": 143563, "epoch": 3418} {"train_loss": -6.795282363891602, "global_step": 143564, "epoch": 3418} {"train_loss": -6.894507884979248, "global_step": 143565, "epoch": 3418} {"train_loss": -6.623243808746338, "global_step": 143566, "epoch": 3418} {"train_loss": -6.879541397094727, "global_step": 143567, "epoch": 3418} {"train_loss": -6.873222351074219, "global_step": 143568, "epoch": 3418} {"train_loss": -6.8423051834106445, "global_step": 143569, "epoch": 3418} {"train_loss": -6.834403991699219, "global_step": 143570, "epoch": 3418} {"train_loss": -6.7584075927734375, "global_step": 143571, "epoch": 3418} {"train_loss": -6.812053680419922, "global_step": 143572, "epoch": 3418} {"train_loss": -6.908741474151611, "global_step": 143573, "epoch": 3418} {"train_loss": -6.737273216247559, "global_step": 143574, "epoch": 3418} {"train_loss": -6.847545623779297, "global_step": 143575, "epoch": 3418} {"train_loss": -6.884726047515869, "global_step": 143576, "epoch": 3418} {"train_loss": -6.836757659912109, "global_step": 143577, "epoch": 3418} {"train_loss": -6.892018795013428, "global_step": 143578, "epoch": 3418} {"train_loss": -6.663611888885498, "global_step": 143579, "epoch": 3418} {"train_loss": -6.757913589477539, "global_step": 143580, "epoch": 3418} {"train_loss": -6.855423450469971, "global_step": 143581, "epoch": 3418} {"train_loss": -6.798393249511719, "global_step": 143582, "epoch": 3418} {"train_loss": -6.794284820556641, "global_step": 143583, "epoch": 3418} {"train_loss": -6.641183376312256, "global_step": 143584, "epoch": 3418} {"train_loss": -6.76009464263916, "global_step": 143585, "epoch": 3418} {"train_loss": -6.765083312988281, "global_step": 143586, "epoch": 3418} {"train_loss": -6.780572414398193, "global_step": 143587, "epoch": 3418} {"train_loss": -6.82998514175415, "global_step": 143588, "epoch": 3418} {"train_loss": -6.9072465896606445, "global_step": 143589, "epoch": 3418} {"train_loss": -6.8689680099487305, "global_step": 143590, "epoch": 3418} {"train_loss": -6.774237632751465, "global_step": 143591, "epoch": 3418} {"train_loss": -6.737987518310547, "global_step": 143592, "epoch": 3418} {"train_loss": -6.710707187652588, "global_step": 143593, "epoch": 3418} {"train_loss": -6.835402488708496, "global_step": 143594, "epoch": 3418} {"train_loss": -6.821473121643066, "global_step": 143595, "epoch": 3418} {"train_loss": -6.865819931030273, "global_step": 143596, "epoch": 3418} {"train_loss": -6.806008565993536, "global_step": 143597, "epoch": 3418, "val_loss": 78155.96875} {"train_loss": -6.81010627746582, "global_step": 143598, "epoch": 3419} {"train_loss": -6.801295757293701, "global_step": 143599, "epoch": 3419} {"train_loss": -6.795938491821289, "global_step": 143600, "epoch": 3419} {"train_loss": -6.8577880859375, "global_step": 143601, "epoch": 3419} {"train_loss": -6.8065690994262695, "global_step": 143602, "epoch": 3419} {"train_loss": -6.676380157470703, "global_step": 143603, "epoch": 3419} {"train_loss": -6.841273307800293, "global_step": 143604, "epoch": 3419} {"train_loss": -6.738452911376953, "global_step": 143605, "epoch": 3419} {"train_loss": -6.745319366455078, "global_step": 143606, "epoch": 3419} {"train_loss": -6.892923831939697, "global_step": 143607, "epoch": 3419} {"train_loss": -6.770834922790527, "global_step": 143608, "epoch": 3419} {"train_loss": -6.607853412628174, "global_step": 143609, "epoch": 3419} {"train_loss": -6.81336784362793, "global_step": 143610, "epoch": 3419} {"train_loss": -6.662909507751465, "global_step": 143611, "epoch": 3419} {"train_loss": -6.724902153015137, "global_step": 143612, "epoch": 3419} {"train_loss": -6.865713119506836, "global_step": 143613, "epoch": 3419} {"train_loss": -6.771244049072266, "global_step": 143614, "epoch": 3419} {"train_loss": -6.693437099456787, "global_step": 143615, "epoch": 3419} {"train_loss": -6.778851509094238, "global_step": 143616, "epoch": 3419} {"train_loss": -6.5273966789245605, "global_step": 143617, "epoch": 3419} {"train_loss": -6.776312351226807, "global_step": 143618, "epoch": 3419} {"train_loss": -6.711080074310303, "global_step": 143619, "epoch": 3419} {"train_loss": -6.687007427215576, "global_step": 143620, "epoch": 3419} {"train_loss": -6.67756462097168, "global_step": 143621, "epoch": 3419} {"train_loss": -6.49245548248291, "global_step": 143622, "epoch": 3419} {"train_loss": -6.623478412628174, "global_step": 143623, "epoch": 3419} {"train_loss": -6.6012773513793945, "global_step": 143624, "epoch": 3419} {"train_loss": -6.825705528259277, "global_step": 143625, "epoch": 3419} {"train_loss": -6.627164363861084, "global_step": 143626, "epoch": 3419} {"train_loss": -6.691695213317871, "global_step": 143627, "epoch": 3419} {"train_loss": -6.7331695556640625, "global_step": 143628, "epoch": 3419} {"train_loss": -6.748124122619629, "global_step": 143629, "epoch": 3419} {"train_loss": -6.712743759155273, "global_step": 143630, "epoch": 3419} {"train_loss": -6.654070854187012, "global_step": 143631, "epoch": 3419} {"train_loss": -6.7256035804748535, "global_step": 143632, "epoch": 3419} {"train_loss": -6.763380527496338, "global_step": 143633, "epoch": 3419} {"train_loss": -6.762481212615967, "global_step": 143634, "epoch": 3419} {"train_loss": -6.7403669357299805, "global_step": 143635, "epoch": 3419} {"train_loss": -6.842227935791016, "global_step": 143636, "epoch": 3419} {"train_loss": -6.820740699768066, "global_step": 143637, "epoch": 3419} {"train_loss": -6.673843860626221, "global_step": 143638, "epoch": 3419} {"train_loss": -6.736222460156395, "global_step": 143639, "epoch": 3419, "val_loss": 78572.265625} {"train_loss": -6.788071632385254, "global_step": 143640, "epoch": 3420} {"train_loss": -6.792057991027832, "global_step": 143641, "epoch": 3420} {"train_loss": -6.864218711853027, "global_step": 143642, "epoch": 3420} {"train_loss": -6.778918266296387, "global_step": 143643, "epoch": 3420} {"train_loss": -6.902957439422607, "global_step": 143644, "epoch": 3420} {"train_loss": -6.82125186920166, "global_step": 143645, "epoch": 3420} {"train_loss": -6.934864044189453, "global_step": 143646, "epoch": 3420} {"train_loss": -6.808847427368164, "global_step": 143647, "epoch": 3420} {"train_loss": -6.798830032348633, "global_step": 143648, "epoch": 3420} {"train_loss": -6.8548970222473145, "global_step": 143649, "epoch": 3420} {"train_loss": -6.843860626220703, "global_step": 143650, "epoch": 3420} {"train_loss": -6.977136611938477, "global_step": 143651, "epoch": 3420} {"train_loss": -6.726777076721191, "global_step": 143652, "epoch": 3420} {"train_loss": -6.762173652648926, "global_step": 143653, "epoch": 3420} {"train_loss": -6.780163764953613, "global_step": 143654, "epoch": 3420} {"train_loss": -6.758872032165527, "global_step": 143655, "epoch": 3420} {"train_loss": -6.836765766143799, "global_step": 143656, "epoch": 3420} {"train_loss": -6.630630016326904, "global_step": 143657, "epoch": 3420} {"train_loss": -6.881231307983398, "global_step": 143658, "epoch": 3420} {"train_loss": -6.74351692199707, "global_step": 143659, "epoch": 3420} {"train_loss": -6.7031660079956055, "global_step": 143660, "epoch": 3420} {"train_loss": -6.775990009307861, "global_step": 143661, "epoch": 3420} {"train_loss": -6.633086204528809, "global_step": 143662, "epoch": 3420} {"train_loss": -6.768516540527344, "global_step": 143663, "epoch": 3420} {"train_loss": -6.651068210601807, "global_step": 143664, "epoch": 3420} {"train_loss": -6.738160133361816, "global_step": 143665, "epoch": 3420} {"train_loss": -6.747312545776367, "global_step": 143666, "epoch": 3420} {"train_loss": -6.584580421447754, "global_step": 143667, "epoch": 3420} {"train_loss": -6.703878402709961, "global_step": 143668, "epoch": 3420} {"train_loss": -6.682950973510742, "global_step": 143669, "epoch": 3420} {"train_loss": -6.73796272277832, "global_step": 143670, "epoch": 3420} {"train_loss": -6.6558074951171875, "global_step": 143671, "epoch": 3420} {"train_loss": -6.697398662567139, "global_step": 143672, "epoch": 3420} {"train_loss": -6.682671546936035, "global_step": 143673, "epoch": 3420} {"train_loss": -6.692174911499023, "global_step": 143674, "epoch": 3420} {"train_loss": -6.75343132019043, "global_step": 143675, "epoch": 3420} {"train_loss": -6.704010009765625, "global_step": 143676, "epoch": 3420} {"train_loss": -6.700723171234131, "global_step": 143677, "epoch": 3420} {"train_loss": -6.763518810272217, "global_step": 143678, "epoch": 3420} {"train_loss": -6.794181823730469, "global_step": 143679, "epoch": 3420} {"train_loss": -6.793465614318848, "global_step": 143680, "epoch": 3420} {"train_loss": -6.764079241525559, "global_step": 143681, "epoch": 3420, "val_loss": 78339.1953125} {"train_loss": -6.764922142028809, "global_step": 143682, "epoch": 3421} {"train_loss": -6.784736633300781, "global_step": 143683, "epoch": 3421} {"train_loss": -6.794370174407959, "global_step": 143684, "epoch": 3421} {"train_loss": -6.887652397155762, "global_step": 143685, "epoch": 3421} {"train_loss": -6.90641450881958, "global_step": 143686, "epoch": 3421} {"train_loss": -6.817658424377441, "global_step": 143687, "epoch": 3421} {"train_loss": -6.829115390777588, "global_step": 143688, "epoch": 3421} {"train_loss": -6.8157057762146, "global_step": 143689, "epoch": 3421} {"train_loss": -6.8329010009765625, "global_step": 143690, "epoch": 3421} {"train_loss": -6.775599002838135, "global_step": 143691, "epoch": 3421} {"train_loss": -6.8837056159973145, "global_step": 143692, "epoch": 3421} {"train_loss": -6.925257205963135, "global_step": 143693, "epoch": 3421} {"train_loss": -6.709561347961426, "global_step": 143694, "epoch": 3421} {"train_loss": -6.954917907714844, "global_step": 143695, "epoch": 3421} {"train_loss": -6.735968112945557, "global_step": 143696, "epoch": 3421} {"train_loss": -6.792660236358643, "global_step": 143697, "epoch": 3421} {"train_loss": -6.8806047439575195, "global_step": 143698, "epoch": 3421} {"train_loss": -6.766141891479492, "global_step": 143699, "epoch": 3421} {"train_loss": -6.869487285614014, "global_step": 143700, "epoch": 3421} {"train_loss": -6.851709365844727, "global_step": 143701, "epoch": 3421} {"train_loss": -6.969717502593994, "global_step": 143702, "epoch": 3421} {"train_loss": -6.89466667175293, "global_step": 143703, "epoch": 3421} {"train_loss": -6.785940170288086, "global_step": 143704, "epoch": 3421} {"train_loss": -6.829508304595947, "global_step": 143705, "epoch": 3421} {"train_loss": -6.782495498657227, "global_step": 143706, "epoch": 3421} {"train_loss": -6.957028388977051, "global_step": 143707, "epoch": 3421} {"train_loss": -6.936629772186279, "global_step": 143708, "epoch": 3421} {"train_loss": -6.837861061096191, "global_step": 143709, "epoch": 3421} {"train_loss": -6.743078231811523, "global_step": 143710, "epoch": 3421} {"train_loss": -6.926272392272949, "global_step": 143711, "epoch": 3421} {"train_loss": -6.870477676391602, "global_step": 143712, "epoch": 3421} {"train_loss": -6.81538724899292, "global_step": 143713, "epoch": 3421} {"train_loss": -6.9217143058776855, "global_step": 143714, "epoch": 3421} {"train_loss": -6.848371505737305, "global_step": 143715, "epoch": 3421} {"train_loss": -6.880069732666016, "global_step": 143716, "epoch": 3421} {"train_loss": -6.861241340637207, "global_step": 143717, "epoch": 3421} {"train_loss": -6.87360954284668, "global_step": 143718, "epoch": 3421} {"train_loss": -6.833063125610352, "global_step": 143719, "epoch": 3421} {"train_loss": -6.8907670974731445, "global_step": 143720, "epoch": 3421} {"train_loss": -6.828274726867676, "global_step": 143721, "epoch": 3421} {"train_loss": -6.871455192565918, "global_step": 143722, "epoch": 3421} {"train_loss": -6.848316238040016, "global_step": 143723, "epoch": 3421, "val_loss": 78496.0078125} {"train_loss": -6.766147136688232, "global_step": 143724, "epoch": 3422} {"train_loss": -6.740257263183594, "global_step": 143725, "epoch": 3422} {"train_loss": -6.660305976867676, "global_step": 143726, "epoch": 3422} {"train_loss": -6.8229780197143555, "global_step": 143727, "epoch": 3422} {"train_loss": -6.798293590545654, "global_step": 143728, "epoch": 3422} {"train_loss": -6.829164028167725, "global_step": 143729, "epoch": 3422} {"train_loss": -6.886007785797119, "global_step": 143730, "epoch": 3422} {"train_loss": -6.8430891036987305, "global_step": 143731, "epoch": 3422} {"train_loss": -6.915144920349121, "global_step": 143732, "epoch": 3422} {"train_loss": -6.837545871734619, "global_step": 143733, "epoch": 3422} {"train_loss": -6.851223468780518, "global_step": 143734, "epoch": 3422} {"train_loss": -6.890633583068848, "global_step": 143735, "epoch": 3422} {"train_loss": -6.883116722106934, "global_step": 143736, "epoch": 3422} {"train_loss": -6.850264549255371, "global_step": 143737, "epoch": 3422} {"train_loss": -6.838929176330566, "global_step": 143738, "epoch": 3422} {"train_loss": -6.837520122528076, "global_step": 143739, "epoch": 3422} {"train_loss": -6.752319812774658, "global_step": 143740, "epoch": 3422} {"train_loss": -6.819787979125977, "global_step": 143741, "epoch": 3422} {"train_loss": -6.857007026672363, "global_step": 143742, "epoch": 3422} {"train_loss": -6.892958641052246, "global_step": 143743, "epoch": 3422} {"train_loss": -6.7763166427612305, "global_step": 143744, "epoch": 3422} {"train_loss": -6.850360870361328, "global_step": 143745, "epoch": 3422} {"train_loss": -6.884295463562012, "global_step": 143746, "epoch": 3422} {"train_loss": -6.886820316314697, "global_step": 143747, "epoch": 3422} {"train_loss": -6.691869735717773, "global_step": 143748, "epoch": 3422} {"train_loss": -6.675110816955566, "global_step": 143749, "epoch": 3422} {"train_loss": -6.766471862792969, "global_step": 143750, "epoch": 3422} {"train_loss": -6.841798782348633, "global_step": 143751, "epoch": 3422} {"train_loss": -6.664282321929932, "global_step": 143752, "epoch": 3422} {"train_loss": -6.822968482971191, "global_step": 143753, "epoch": 3422} {"train_loss": -6.757435321807861, "global_step": 143754, "epoch": 3422} {"train_loss": -6.713815689086914, "global_step": 143755, "epoch": 3422} {"train_loss": -6.834062576293945, "global_step": 143756, "epoch": 3422} {"train_loss": -6.842662811279297, "global_step": 143757, "epoch": 3422} {"train_loss": -6.802102088928223, "global_step": 143758, "epoch": 3422} {"train_loss": -6.753829479217529, "global_step": 143759, "epoch": 3422} {"train_loss": -6.727813720703125, "global_step": 143760, "epoch": 3422} {"train_loss": -6.9062581062316895, "global_step": 143761, "epoch": 3422} {"train_loss": -6.7820024490356445, "global_step": 143762, "epoch": 3422} {"train_loss": -6.8192901611328125, "global_step": 143763, "epoch": 3422} {"train_loss": -6.764281272888184, "global_step": 143764, "epoch": 3422} {"train_loss": -6.808753706160045, "global_step": 143765, "epoch": 3422, "val_loss": 78362.984375} {"train_loss": -6.859811782836914, "global_step": 143766, "epoch": 3423} {"train_loss": -6.804287910461426, "global_step": 143767, "epoch": 3423} {"train_loss": -6.765902519226074, "global_step": 143768, "epoch": 3423} {"train_loss": -6.882838249206543, "global_step": 143769, "epoch": 3423} {"train_loss": -6.885237693786621, "global_step": 143770, "epoch": 3423} {"train_loss": -6.798279762268066, "global_step": 143771, "epoch": 3423} {"train_loss": -6.859706401824951, "global_step": 143772, "epoch": 3423} {"train_loss": -6.77501106262207, "global_step": 143773, "epoch": 3423} {"train_loss": -6.785484790802002, "global_step": 143774, "epoch": 3423} {"train_loss": -6.867165565490723, "global_step": 143775, "epoch": 3423} {"train_loss": -6.696994781494141, "global_step": 143776, "epoch": 3423} {"train_loss": -6.789670944213867, "global_step": 143777, "epoch": 3423} {"train_loss": -6.770040512084961, "global_step": 143778, "epoch": 3423} {"train_loss": -6.795324802398682, "global_step": 143779, "epoch": 3423} {"train_loss": -6.663546562194824, "global_step": 143780, "epoch": 3423} {"train_loss": -6.8671674728393555, "global_step": 143781, "epoch": 3423} {"train_loss": -6.771305084228516, "global_step": 143782, "epoch": 3423} {"train_loss": -6.7262420654296875, "global_step": 143783, "epoch": 3423} {"train_loss": -6.82417106628418, "global_step": 143784, "epoch": 3423} {"train_loss": -6.795926570892334, "global_step": 143785, "epoch": 3423} {"train_loss": -6.726749420166016, "global_step": 143786, "epoch": 3423} {"train_loss": -6.843057155609131, "global_step": 143787, "epoch": 3423} {"train_loss": -6.866330146789551, "global_step": 143788, "epoch": 3423} {"train_loss": -6.749902725219727, "global_step": 143789, "epoch": 3423} {"train_loss": -6.862722873687744, "global_step": 143790, "epoch": 3423} {"train_loss": -6.973670959472656, "global_step": 143791, "epoch": 3423} {"train_loss": -6.806809425354004, "global_step": 143792, "epoch": 3423} {"train_loss": -6.864772319793701, "global_step": 143793, "epoch": 3423} {"train_loss": -6.856462478637695, "global_step": 143794, "epoch": 3423} {"train_loss": -6.8688554763793945, "global_step": 143795, "epoch": 3423} {"train_loss": -6.84237813949585, "global_step": 143796, "epoch": 3423} {"train_loss": -6.806929588317871, "global_step": 143797, "epoch": 3423} {"train_loss": -6.869268417358398, "global_step": 143798, "epoch": 3423} {"train_loss": -6.794002532958984, "global_step": 143799, "epoch": 3423} {"train_loss": -6.755291938781738, "global_step": 143800, "epoch": 3423} {"train_loss": -6.847909927368164, "global_step": 143801, "epoch": 3423} {"train_loss": -6.82765007019043, "global_step": 143802, "epoch": 3423} {"train_loss": -6.915705680847168, "global_step": 143803, "epoch": 3423} {"train_loss": -6.820919036865234, "global_step": 143804, "epoch": 3423} {"train_loss": -6.790428161621094, "global_step": 143805, "epoch": 3423} {"train_loss": -6.81027889251709, "global_step": 143806, "epoch": 3423} {"train_loss": -6.812277544112432, "global_step": 143807, "epoch": 3423, "val_loss": 78192.8515625} {"train_loss": -6.836336135864258, "global_step": 143808, "epoch": 3424} {"train_loss": -6.820735454559326, "global_step": 143809, "epoch": 3424} {"train_loss": -6.612673759460449, "global_step": 143810, "epoch": 3424} {"train_loss": -6.750927925109863, "global_step": 143811, "epoch": 3424} {"train_loss": -6.850883483886719, "global_step": 143812, "epoch": 3424} {"train_loss": -6.809730052947998, "global_step": 143813, "epoch": 3424} {"train_loss": -6.752350807189941, "global_step": 143814, "epoch": 3424} {"train_loss": -6.7699079513549805, "global_step": 143815, "epoch": 3424} {"train_loss": -6.7737531661987305, "global_step": 143816, "epoch": 3424} {"train_loss": -6.7019853591918945, "global_step": 143817, "epoch": 3424} {"train_loss": -6.610567569732666, "global_step": 143818, "epoch": 3424} {"train_loss": -6.884391784667969, "global_step": 143819, "epoch": 3424} {"train_loss": -6.817385673522949, "global_step": 143820, "epoch": 3424} {"train_loss": -6.822995185852051, "global_step": 143821, "epoch": 3424} {"train_loss": -6.876201629638672, "global_step": 143822, "epoch": 3424} {"train_loss": -6.920638084411621, "global_step": 143823, "epoch": 3424} {"train_loss": -6.648153305053711, "global_step": 143824, "epoch": 3424} {"train_loss": -6.792464733123779, "global_step": 143825, "epoch": 3424} {"train_loss": -6.833981990814209, "global_step": 143826, "epoch": 3424} {"train_loss": -6.823281288146973, "global_step": 143827, "epoch": 3424} {"train_loss": -6.802473068237305, "global_step": 143828, "epoch": 3424} {"train_loss": -6.7689924240112305, "global_step": 143829, "epoch": 3424} {"train_loss": -6.785165786743164, "global_step": 143830, "epoch": 3424} {"train_loss": -6.826828479766846, "global_step": 143831, "epoch": 3424} {"train_loss": -6.76148796081543, "global_step": 143832, "epoch": 3424} {"train_loss": -6.924286842346191, "global_step": 143833, "epoch": 3424} {"train_loss": -6.8384833335876465, "global_step": 143834, "epoch": 3424} {"train_loss": -6.793566703796387, "global_step": 143835, "epoch": 3424} {"train_loss": -6.632051467895508, "global_step": 143836, "epoch": 3424} {"train_loss": -6.797743797302246, "global_step": 143837, "epoch": 3424} {"train_loss": -6.693858623504639, "global_step": 143838, "epoch": 3424} {"train_loss": -6.6209588050842285, "global_step": 143839, "epoch": 3424} {"train_loss": -6.696969032287598, "global_step": 143840, "epoch": 3424} {"train_loss": -6.769203186035156, "global_step": 143841, "epoch": 3424} {"train_loss": -6.718668460845947, "global_step": 143842, "epoch": 3424} {"train_loss": -6.662138938903809, "global_step": 143843, "epoch": 3424} {"train_loss": -6.750409126281738, "global_step": 143844, "epoch": 3424} {"train_loss": -6.647275924682617, "global_step": 143845, "epoch": 3424} {"train_loss": -6.662718296051025, "global_step": 143846, "epoch": 3424} {"train_loss": -6.695289611816406, "global_step": 143847, "epoch": 3424} {"train_loss": -6.86021614074707, "global_step": 143848, "epoch": 3424} {"train_loss": -6.765344983055478, "global_step": 143849, "epoch": 3424, "val_loss": 78048.5390625} {"train_loss": -6.718571186065674, "global_step": 143850, "epoch": 3425} {"train_loss": -6.669301986694336, "global_step": 143851, "epoch": 3425} {"train_loss": -6.899824619293213, "global_step": 143852, "epoch": 3425} {"train_loss": -6.739995956420898, "global_step": 143853, "epoch": 3425} {"train_loss": -6.7603960037231445, "global_step": 143854, "epoch": 3425} {"train_loss": -6.797733306884766, "global_step": 143855, "epoch": 3425} {"train_loss": -6.760197639465332, "global_step": 143856, "epoch": 3425} {"train_loss": -6.967280864715576, "global_step": 143857, "epoch": 3425} {"train_loss": -6.883585453033447, "global_step": 143858, "epoch": 3425} {"train_loss": -6.837462425231934, "global_step": 143859, "epoch": 3425} {"train_loss": -6.918802261352539, "global_step": 143860, "epoch": 3425} {"train_loss": -6.867825984954834, "global_step": 143861, "epoch": 3425} {"train_loss": -6.9143524169921875, "global_step": 143862, "epoch": 3425} {"train_loss": -6.843043327331543, "global_step": 143863, "epoch": 3425} {"train_loss": -6.844536781311035, "global_step": 143864, "epoch": 3425} {"train_loss": -6.87228536605835, "global_step": 143865, "epoch": 3425} {"train_loss": -6.922022342681885, "global_step": 143866, "epoch": 3425} {"train_loss": -6.786730766296387, "global_step": 143867, "epoch": 3425} {"train_loss": -6.796960353851318, "global_step": 143868, "epoch": 3425} {"train_loss": -6.813340663909912, "global_step": 143869, "epoch": 3425} {"train_loss": -6.876287460327148, "global_step": 143870, "epoch": 3425} {"train_loss": -6.8024492263793945, "global_step": 143871, "epoch": 3425} {"train_loss": -6.885271072387695, "global_step": 143872, "epoch": 3425} {"train_loss": -6.739707946777344, "global_step": 143873, "epoch": 3425} {"train_loss": -6.849736213684082, "global_step": 143874, "epoch": 3425} {"train_loss": -6.781864166259766, "global_step": 143875, "epoch": 3425} {"train_loss": -6.877901077270508, "global_step": 143876, "epoch": 3425} {"train_loss": -6.890687465667725, "global_step": 143877, "epoch": 3425} {"train_loss": -6.852569580078125, "global_step": 143878, "epoch": 3425} {"train_loss": -6.778469085693359, "global_step": 143879, "epoch": 3425} {"train_loss": -6.709927558898926, "global_step": 143880, "epoch": 3425} {"train_loss": -6.794950485229492, "global_step": 143881, "epoch": 3425} {"train_loss": -6.857758045196533, "global_step": 143882, "epoch": 3425} {"train_loss": -6.651117324829102, "global_step": 143883, "epoch": 3425} {"train_loss": -6.858332633972168, "global_step": 143884, "epoch": 3425} {"train_loss": -6.704714775085449, "global_step": 143885, "epoch": 3425} {"train_loss": -6.848317623138428, "global_step": 143886, "epoch": 3425} {"train_loss": -6.803271293640137, "global_step": 143887, "epoch": 3425} {"train_loss": -6.672243118286133, "global_step": 143888, "epoch": 3425} {"train_loss": -6.79481315612793, "global_step": 143889, "epoch": 3425} {"train_loss": -6.705390453338623, "global_step": 143890, "epoch": 3425} {"train_loss": -6.811984981809344, "global_step": 143891, "epoch": 3425, "val_loss": 78384.2421875} {"train_loss": -6.753081321716309, "global_step": 143892, "epoch": 3426} {"train_loss": -6.664022922515869, "global_step": 143893, "epoch": 3426} {"train_loss": -6.825888633728027, "global_step": 143894, "epoch": 3426} {"train_loss": -6.540938377380371, "global_step": 143895, "epoch": 3426} {"train_loss": -6.702962875366211, "global_step": 143896, "epoch": 3426} {"train_loss": -6.670375347137451, "global_step": 143897, "epoch": 3426} {"train_loss": -6.641407489776611, "global_step": 143898, "epoch": 3426} {"train_loss": -6.799493789672852, "global_step": 143899, "epoch": 3426} {"train_loss": -6.7591352462768555, "global_step": 143900, "epoch": 3426} {"train_loss": -6.752899169921875, "global_step": 143901, "epoch": 3426} {"train_loss": -6.769908905029297, "global_step": 143902, "epoch": 3426} {"train_loss": -6.77559757232666, "global_step": 143903, "epoch": 3426} {"train_loss": -6.797159194946289, "global_step": 143904, "epoch": 3426} {"train_loss": -6.791948318481445, "global_step": 143905, "epoch": 3426} {"train_loss": -6.842182159423828, "global_step": 143906, "epoch": 3426} {"train_loss": -6.789395332336426, "global_step": 143907, "epoch": 3426} {"train_loss": -6.761649131774902, "global_step": 143908, "epoch": 3426} {"train_loss": -6.828075408935547, "global_step": 143909, "epoch": 3426} {"train_loss": -6.725619316101074, "global_step": 143910, "epoch": 3426} {"train_loss": -6.867682933807373, "global_step": 143911, "epoch": 3426} {"train_loss": -6.8746442794799805, "global_step": 143912, "epoch": 3426} {"train_loss": -6.842833518981934, "global_step": 143913, "epoch": 3426} {"train_loss": -6.787092685699463, "global_step": 143914, "epoch": 3426} {"train_loss": -6.785833835601807, "global_step": 143915, "epoch": 3426} {"train_loss": -6.772078514099121, "global_step": 143916, "epoch": 3426} {"train_loss": -6.9700493812561035, "global_step": 143917, "epoch": 3426} {"train_loss": -6.767014503479004, "global_step": 143918, "epoch": 3426} {"train_loss": -6.8535308837890625, "global_step": 143919, "epoch": 3426} {"train_loss": -6.793215751647949, "global_step": 143920, "epoch": 3426} {"train_loss": -6.870769023895264, "global_step": 143921, "epoch": 3426} {"train_loss": -6.716742992401123, "global_step": 143922, "epoch": 3426} {"train_loss": -6.8614020347595215, "global_step": 143923, "epoch": 3426} {"train_loss": -6.716507911682129, "global_step": 143924, "epoch": 3426} {"train_loss": -6.7823028564453125, "global_step": 143925, "epoch": 3426} {"train_loss": -6.866693496704102, "global_step": 143926, "epoch": 3426} {"train_loss": -6.867210388183594, "global_step": 143927, "epoch": 3426} {"train_loss": -6.918662071228027, "global_step": 143928, "epoch": 3426} {"train_loss": -6.932455062866211, "global_step": 143929, "epoch": 3426} {"train_loss": -6.782038688659668, "global_step": 143930, "epoch": 3426} {"train_loss": -6.714277744293213, "global_step": 143931, "epoch": 3426} {"train_loss": -6.892984390258789, "global_step": 143932, "epoch": 3426} {"train_loss": -6.791229690824236, "global_step": 143933, "epoch": 3426, "val_loss": 78173.2734375} {"train_loss": -6.8769989013671875, "global_step": 143934, "epoch": 3427} {"train_loss": -6.7696332931518555, "global_step": 143935, "epoch": 3427} {"train_loss": -6.855782508850098, "global_step": 143936, "epoch": 3427} {"train_loss": -6.9069414138793945, "global_step": 143937, "epoch": 3427} {"train_loss": -6.841499328613281, "global_step": 143938, "epoch": 3427} {"train_loss": -6.721433639526367, "global_step": 143939, "epoch": 3427} {"train_loss": -6.812455654144287, "global_step": 143940, "epoch": 3427} {"train_loss": -6.772029876708984, "global_step": 143941, "epoch": 3427} {"train_loss": -6.623656749725342, "global_step": 143942, "epoch": 3427} {"train_loss": -6.784239768981934, "global_step": 143943, "epoch": 3427} {"train_loss": -6.714284896850586, "global_step": 143944, "epoch": 3427} {"train_loss": -6.6588544845581055, "global_step": 143945, "epoch": 3427} {"train_loss": -6.952814102172852, "global_step": 143946, "epoch": 3427} {"train_loss": -6.832614898681641, "global_step": 143947, "epoch": 3427} {"train_loss": -6.866539001464844, "global_step": 143948, "epoch": 3427} {"train_loss": -6.8960371017456055, "global_step": 143949, "epoch": 3427} {"train_loss": -6.737157821655273, "global_step": 143950, "epoch": 3427} {"train_loss": -6.7644548416137695, "global_step": 143951, "epoch": 3427} {"train_loss": -6.839276313781738, "global_step": 143952, "epoch": 3427} {"train_loss": -6.723705291748047, "global_step": 143953, "epoch": 3427} {"train_loss": -6.845005035400391, "global_step": 143954, "epoch": 3427} {"train_loss": -6.779421806335449, "global_step": 143955, "epoch": 3427} {"train_loss": -6.925163269042969, "global_step": 143956, "epoch": 3427} {"train_loss": -6.916624069213867, "global_step": 143957, "epoch": 3427} {"train_loss": -6.694455623626709, "global_step": 143958, "epoch": 3427} {"train_loss": -6.856696128845215, "global_step": 143959, "epoch": 3427} {"train_loss": -6.668720245361328, "global_step": 143960, "epoch": 3427} {"train_loss": -6.94492769241333, "global_step": 143961, "epoch": 3427} {"train_loss": -6.853588104248047, "global_step": 143962, "epoch": 3427} {"train_loss": -6.764301300048828, "global_step": 143963, "epoch": 3427} {"train_loss": -6.78513765335083, "global_step": 143964, "epoch": 3427} {"train_loss": -6.729851722717285, "global_step": 143965, "epoch": 3427} {"train_loss": -6.861397743225098, "global_step": 143966, "epoch": 3427} {"train_loss": -6.854493618011475, "global_step": 143967, "epoch": 3427} {"train_loss": -6.752547264099121, "global_step": 143968, "epoch": 3427} {"train_loss": -6.851990699768066, "global_step": 143969, "epoch": 3427} {"train_loss": -6.841484069824219, "global_step": 143970, "epoch": 3427} {"train_loss": -6.738929748535156, "global_step": 143971, "epoch": 3427} {"train_loss": -6.776010513305664, "global_step": 143972, "epoch": 3427} {"train_loss": -6.758608341217041, "global_step": 143973, "epoch": 3427} {"train_loss": -6.708676815032959, "global_step": 143974, "epoch": 3427} {"train_loss": -6.803375959396362, "global_step": 143975, "epoch": 3427, "val_loss": 78308.0546875} {"train_loss": -6.864482402801514, "global_step": 143976, "epoch": 3428} {"train_loss": -6.853803634643555, "global_step": 143977, "epoch": 3428} {"train_loss": -6.806879997253418, "global_step": 143978, "epoch": 3428} {"train_loss": -6.864882469177246, "global_step": 143979, "epoch": 3428} {"train_loss": -6.859297752380371, "global_step": 143980, "epoch": 3428} {"train_loss": -6.829933166503906, "global_step": 143981, "epoch": 3428} {"train_loss": -6.9348883628845215, "global_step": 143982, "epoch": 3428} {"train_loss": -6.8690290451049805, "global_step": 143983, "epoch": 3428} {"train_loss": -6.830320358276367, "global_step": 143984, "epoch": 3428} {"train_loss": -6.764693260192871, "global_step": 143985, "epoch": 3428} {"train_loss": -6.7765793800354, "global_step": 143986, "epoch": 3428} {"train_loss": -6.880237579345703, "global_step": 143987, "epoch": 3428} {"train_loss": -6.915529251098633, "global_step": 143988, "epoch": 3428} {"train_loss": -6.886368274688721, "global_step": 143989, "epoch": 3428} {"train_loss": -6.778106689453125, "global_step": 143990, "epoch": 3428} {"train_loss": -6.703039169311523, "global_step": 143991, "epoch": 3428} {"train_loss": -6.76878547668457, "global_step": 143992, "epoch": 3428} {"train_loss": -6.705476760864258, "global_step": 143993, "epoch": 3428} {"train_loss": -6.730539321899414, "global_step": 143994, "epoch": 3428} {"train_loss": -6.661018371582031, "global_step": 143995, "epoch": 3428} {"train_loss": -6.757892608642578, "global_step": 143996, "epoch": 3428} {"train_loss": -6.753085136413574, "global_step": 143997, "epoch": 3428} {"train_loss": -6.694569110870361, "global_step": 143998, "epoch": 3428} {"train_loss": -6.871395587921143, "global_step": 143999, "epoch": 3428} {"train_loss": -6.817911148071289, "global_step": 144000, "epoch": 3428} {"train_loss": -6.909519672393799, "global_step": 144001, "epoch": 3428} {"train_loss": -6.817066192626953, "global_step": 144002, "epoch": 3428} {"train_loss": -6.836530685424805, "global_step": 144003, "epoch": 3428} {"train_loss": -6.774353981018066, "global_step": 144004, "epoch": 3428} {"train_loss": -6.70997428894043, "global_step": 144005, "epoch": 3428} {"train_loss": -6.838855743408203, "global_step": 144006, "epoch": 3428} {"train_loss": -6.824051856994629, "global_step": 144007, "epoch": 3428} {"train_loss": -6.8355607986450195, "global_step": 144008, "epoch": 3428} {"train_loss": -6.796632766723633, "global_step": 144009, "epoch": 3428} {"train_loss": -6.9045820236206055, "global_step": 144010, "epoch": 3428} {"train_loss": -6.8213911056518555, "global_step": 144011, "epoch": 3428} {"train_loss": -6.891181945800781, "global_step": 144012, "epoch": 3428} {"train_loss": -6.748194694519043, "global_step": 144013, "epoch": 3428} {"train_loss": -6.759853363037109, "global_step": 144014, "epoch": 3428} {"train_loss": -6.889097213745117, "global_step": 144015, "epoch": 3428} {"train_loss": -6.671555519104004, "global_step": 144016, "epoch": 3428} {"train_loss": -6.808732884270804, "global_step": 144017, "epoch": 3428, "val_loss": 78204.984375} {"train_loss": -6.884205341339111, "global_step": 144018, "epoch": 3429} {"train_loss": -6.847143173217773, "global_step": 144019, "epoch": 3429} {"train_loss": -6.83241605758667, "global_step": 144020, "epoch": 3429} {"train_loss": -6.793249130249023, "global_step": 144021, "epoch": 3429} {"train_loss": -6.820066452026367, "global_step": 144022, "epoch": 3429} {"train_loss": -6.767590522766113, "global_step": 144023, "epoch": 3429} {"train_loss": -6.82832670211792, "global_step": 144024, "epoch": 3429} {"train_loss": -6.796916961669922, "global_step": 144025, "epoch": 3429} {"train_loss": -6.770000457763672, "global_step": 144026, "epoch": 3429} {"train_loss": -6.767385482788086, "global_step": 144027, "epoch": 3429} {"train_loss": -6.754500389099121, "global_step": 144028, "epoch": 3429} {"train_loss": -6.965065956115723, "global_step": 144029, "epoch": 3429} {"train_loss": -6.869318008422852, "global_step": 144030, "epoch": 3429} {"train_loss": -6.959792137145996, "global_step": 144031, "epoch": 3429} {"train_loss": -6.810493469238281, "global_step": 144032, "epoch": 3429} {"train_loss": -6.7637481689453125, "global_step": 144033, "epoch": 3429} {"train_loss": -6.737525939941406, "global_step": 144034, "epoch": 3429} {"train_loss": -6.822075843811035, "global_step": 144035, "epoch": 3429} {"train_loss": -6.835666179656982, "global_step": 144036, "epoch": 3429} {"train_loss": -6.8898773193359375, "global_step": 144037, "epoch": 3429} {"train_loss": -6.878619194030762, "global_step": 144038, "epoch": 3429} {"train_loss": -6.842360496520996, "global_step": 144039, "epoch": 3429} {"train_loss": -6.751224517822266, "global_step": 144040, "epoch": 3429} {"train_loss": -6.791897773742676, "global_step": 144041, "epoch": 3429} {"train_loss": -6.680388450622559, "global_step": 144042, "epoch": 3429} {"train_loss": -6.940277099609375, "global_step": 144043, "epoch": 3429} {"train_loss": -6.776010036468506, "global_step": 144044, "epoch": 3429} {"train_loss": -6.786363124847412, "global_step": 144045, "epoch": 3429} {"train_loss": -6.714990139007568, "global_step": 144046, "epoch": 3429} {"train_loss": -6.756609916687012, "global_step": 144047, "epoch": 3429} {"train_loss": -6.771847248077393, "global_step": 144048, "epoch": 3429} {"train_loss": -6.741792678833008, "global_step": 144049, "epoch": 3429} {"train_loss": -6.843169212341309, "global_step": 144050, "epoch": 3429} {"train_loss": -6.770000457763672, "global_step": 144051, "epoch": 3429} {"train_loss": -6.679813861846924, "global_step": 144052, "epoch": 3429} {"train_loss": -6.759077072143555, "global_step": 144053, "epoch": 3429} {"train_loss": -6.800412178039551, "global_step": 144054, "epoch": 3429} {"train_loss": -6.725066184997559, "global_step": 144055, "epoch": 3429} {"train_loss": -6.7357988357543945, "global_step": 144056, "epoch": 3429} {"train_loss": -6.8313517570495605, "global_step": 144057, "epoch": 3429} {"train_loss": -6.682312965393066, "global_step": 144058, "epoch": 3429} {"train_loss": -6.797939187004452, "global_step": 144059, "epoch": 3429, "val_loss": 78527.921875} {"train_loss": -6.762243270874023, "global_step": 144060, "epoch": 3430} {"train_loss": -6.776102066040039, "global_step": 144061, "epoch": 3430} {"train_loss": -6.854203224182129, "global_step": 144062, "epoch": 3430} {"train_loss": -6.716054916381836, "global_step": 144063, "epoch": 3430} {"train_loss": -6.638513088226318, "global_step": 144064, "epoch": 3430} {"train_loss": -6.70085334777832, "global_step": 144065, "epoch": 3430} {"train_loss": -6.433287620544434, "global_step": 144066, "epoch": 3430} {"train_loss": -6.698392868041992, "global_step": 144067, "epoch": 3430} {"train_loss": -6.591119766235352, "global_step": 144068, "epoch": 3430} {"train_loss": -6.620589733123779, "global_step": 144069, "epoch": 3430} {"train_loss": -6.571087837219238, "global_step": 144070, "epoch": 3430} {"train_loss": -6.668983459472656, "global_step": 144071, "epoch": 3430} {"train_loss": -6.627964973449707, "global_step": 144072, "epoch": 3430} {"train_loss": -6.674967288970947, "global_step": 144073, "epoch": 3430} {"train_loss": -6.661114692687988, "global_step": 144074, "epoch": 3430} {"train_loss": -6.707590103149414, "global_step": 144075, "epoch": 3430} {"train_loss": -6.637446403503418, "global_step": 144076, "epoch": 3430} {"train_loss": -6.657318115234375, "global_step": 144077, "epoch": 3430} {"train_loss": -6.6977009773254395, "global_step": 144078, "epoch": 3430} {"train_loss": -6.497699737548828, "global_step": 144079, "epoch": 3430} {"train_loss": -6.782138824462891, "global_step": 144080, "epoch": 3430} {"train_loss": -6.624469757080078, "global_step": 144081, "epoch": 3430} {"train_loss": -6.701086521148682, "global_step": 144082, "epoch": 3430} {"train_loss": -6.65128231048584, "global_step": 144083, "epoch": 3430} {"train_loss": -6.734597206115723, "global_step": 144084, "epoch": 3430} {"train_loss": -6.733128070831299, "global_step": 144085, "epoch": 3430} {"train_loss": -6.779045104980469, "global_step": 144086, "epoch": 3430} {"train_loss": -6.7328596115112305, "global_step": 144087, "epoch": 3430} {"train_loss": -6.819691181182861, "global_step": 144088, "epoch": 3430} {"train_loss": -6.8439483642578125, "global_step": 144089, "epoch": 3430} {"train_loss": -6.788344383239746, "global_step": 144090, "epoch": 3430} {"train_loss": -6.819432258605957, "global_step": 144091, "epoch": 3430} {"train_loss": -6.731590747833252, "global_step": 144092, "epoch": 3430} {"train_loss": -6.753403186798096, "global_step": 144093, "epoch": 3430} {"train_loss": -6.823009490966797, "global_step": 144094, "epoch": 3430} {"train_loss": -6.8480634689331055, "global_step": 144095, "epoch": 3430} {"train_loss": -6.773702621459961, "global_step": 144096, "epoch": 3430} {"train_loss": -6.869917869567871, "global_step": 144097, "epoch": 3430} {"train_loss": -6.878567695617676, "global_step": 144098, "epoch": 3430} {"train_loss": -6.789213180541992, "global_step": 144099, "epoch": 3430} {"train_loss": -6.802873134613037, "global_step": 144100, "epoch": 3430} {"train_loss": -6.722149122328985, "global_step": 144101, "epoch": 3430, "val_loss": 78325.5390625} {"train_loss": -6.8125410079956055, "global_step": 144102, "epoch": 3431} {"train_loss": -6.976282119750977, "global_step": 144103, "epoch": 3431} {"train_loss": -6.886310577392578, "global_step": 144104, "epoch": 3431} {"train_loss": -6.8021240234375, "global_step": 144105, "epoch": 3431} {"train_loss": -6.804994583129883, "global_step": 144106, "epoch": 3431} {"train_loss": -6.80714750289917, "global_step": 144107, "epoch": 3431} {"train_loss": -6.869460105895996, "global_step": 144108, "epoch": 3431} {"train_loss": -6.799165725708008, "global_step": 144109, "epoch": 3431} {"train_loss": -6.988797187805176, "global_step": 144110, "epoch": 3431} {"train_loss": -6.884774684906006, "global_step": 144111, "epoch": 3431} {"train_loss": -6.778127670288086, "global_step": 144112, "epoch": 3431} {"train_loss": -6.845221042633057, "global_step": 144113, "epoch": 3431} {"train_loss": -6.860556602478027, "global_step": 144114, "epoch": 3431} {"train_loss": -6.882112503051758, "global_step": 144115, "epoch": 3431} {"train_loss": -6.650593280792236, "global_step": 144116, "epoch": 3431} {"train_loss": -6.763172149658203, "global_step": 144117, "epoch": 3431} {"train_loss": -6.8870849609375, "global_step": 144118, "epoch": 3431} {"train_loss": -6.791042327880859, "global_step": 144119, "epoch": 3431} {"train_loss": -6.7502336502075195, "global_step": 144120, "epoch": 3431} {"train_loss": -6.777037620544434, "global_step": 144121, "epoch": 3431} {"train_loss": -6.7549662590026855, "global_step": 144122, "epoch": 3431} {"train_loss": -6.793526649475098, "global_step": 144123, "epoch": 3431} {"train_loss": -6.746524810791016, "global_step": 144124, "epoch": 3431} {"train_loss": -6.781912326812744, "global_step": 144125, "epoch": 3431} {"train_loss": -6.851761341094971, "global_step": 144126, "epoch": 3431} {"train_loss": -6.71807861328125, "global_step": 144127, "epoch": 3431} {"train_loss": -6.73658561706543, "global_step": 144128, "epoch": 3431} {"train_loss": -6.729610443115234, "global_step": 144129, "epoch": 3431} {"train_loss": -6.788076877593994, "global_step": 144130, "epoch": 3431} {"train_loss": -6.815237998962402, "global_step": 144131, "epoch": 3431} {"train_loss": -6.688365936279297, "global_step": 144132, "epoch": 3431} {"train_loss": -6.82420539855957, "global_step": 144133, "epoch": 3431} {"train_loss": -6.915987968444824, "global_step": 144134, "epoch": 3431} {"train_loss": -7.0090837478637695, "global_step": 144135, "epoch": 3431} {"train_loss": -6.835121154785156, "global_step": 144136, "epoch": 3431} {"train_loss": -6.811404228210449, "global_step": 144137, "epoch": 3431} {"train_loss": -6.780596733093262, "global_step": 144138, "epoch": 3431} {"train_loss": -6.835613250732422, "global_step": 144139, "epoch": 3431} {"train_loss": -6.789344787597656, "global_step": 144140, "epoch": 3431} {"train_loss": -6.885082244873047, "global_step": 144141, "epoch": 3431} {"train_loss": -6.740726470947266, "global_step": 144142, "epoch": 3431} {"train_loss": -6.817677565983364, "global_step": 144143, "epoch": 3431, "val_loss": 78278.421875} {"train_loss": -6.965526580810547, "global_step": 144144, "epoch": 3432} {"train_loss": -6.881428241729736, "global_step": 144145, "epoch": 3432} {"train_loss": -6.846538543701172, "global_step": 144146, "epoch": 3432} {"train_loss": -6.941132068634033, "global_step": 144147, "epoch": 3432} {"train_loss": -6.908252716064453, "global_step": 144148, "epoch": 3432} {"train_loss": -6.87838077545166, "global_step": 144149, "epoch": 3432} {"train_loss": -6.8621931076049805, "global_step": 144150, "epoch": 3432} {"train_loss": -6.7472381591796875, "global_step": 144151, "epoch": 3432} {"train_loss": -6.839310646057129, "global_step": 144152, "epoch": 3432} {"train_loss": -6.8868303298950195, "global_step": 144153, "epoch": 3432} {"train_loss": -6.84041690826416, "global_step": 144154, "epoch": 3432} {"train_loss": -6.6270856857299805, "global_step": 144155, "epoch": 3432} {"train_loss": -6.830630302429199, "global_step": 144156, "epoch": 3432} {"train_loss": -6.722811222076416, "global_step": 144157, "epoch": 3432} {"train_loss": -6.693565368652344, "global_step": 144158, "epoch": 3432} {"train_loss": -6.891095161437988, "global_step": 144159, "epoch": 3432} {"train_loss": -6.7710041999816895, "global_step": 144160, "epoch": 3432} {"train_loss": -6.797170639038086, "global_step": 144161, "epoch": 3432} {"train_loss": -6.893919467926025, "global_step": 144162, "epoch": 3432} {"train_loss": -6.796767711639404, "global_step": 144163, "epoch": 3432} {"train_loss": -6.830483436584473, "global_step": 144164, "epoch": 3432} {"train_loss": -6.718008995056152, "global_step": 144165, "epoch": 3432} {"train_loss": -6.744744300842285, "global_step": 144166, "epoch": 3432} {"train_loss": -6.824985504150391, "global_step": 144167, "epoch": 3432} {"train_loss": -6.753208637237549, "global_step": 144168, "epoch": 3432} {"train_loss": -6.880216121673584, "global_step": 144169, "epoch": 3432} {"train_loss": -6.884100914001465, "global_step": 144170, "epoch": 3432} {"train_loss": -6.814548492431641, "global_step": 144171, "epoch": 3432} {"train_loss": -6.851469993591309, "global_step": 144172, "epoch": 3432} {"train_loss": -6.687738418579102, "global_step": 144173, "epoch": 3432} {"train_loss": -6.902785301208496, "global_step": 144174, "epoch": 3432} {"train_loss": -6.888427734375, "global_step": 144175, "epoch": 3432} {"train_loss": -6.6982526779174805, "global_step": 144176, "epoch": 3432} {"train_loss": -6.718902587890625, "global_step": 144177, "epoch": 3432} {"train_loss": -6.8663105964660645, "global_step": 144178, "epoch": 3432} {"train_loss": -6.755492687225342, "global_step": 144179, "epoch": 3432} {"train_loss": -6.821876525878906, "global_step": 144180, "epoch": 3432} {"train_loss": -6.873159885406494, "global_step": 144181, "epoch": 3432} {"train_loss": -6.817717552185059, "global_step": 144182, "epoch": 3432} {"train_loss": -6.938346862792969, "global_step": 144183, "epoch": 3432} {"train_loss": -6.814594745635986, "global_step": 144184, "epoch": 3432} {"train_loss": -6.820001136688959, "global_step": 144185, "epoch": 3432, "val_loss": 78425.5} {"train_loss": -6.846851348876953, "global_step": 144186, "epoch": 3433} {"train_loss": -6.850904941558838, "global_step": 144187, "epoch": 3433} {"train_loss": -6.800704002380371, "global_step": 144188, "epoch": 3433} {"train_loss": -6.891903877258301, "global_step": 144189, "epoch": 3433} {"train_loss": -6.80545711517334, "global_step": 144190, "epoch": 3433} {"train_loss": -6.72581672668457, "global_step": 144191, "epoch": 3433} {"train_loss": -6.860987663269043, "global_step": 144192, "epoch": 3433} {"train_loss": -6.838282108306885, "global_step": 144193, "epoch": 3433} {"train_loss": -6.887540817260742, "global_step": 144194, "epoch": 3433} {"train_loss": -6.834507942199707, "global_step": 144195, "epoch": 3433} {"train_loss": -6.8034257888793945, "global_step": 144196, "epoch": 3433} {"train_loss": -6.728267669677734, "global_step": 144197, "epoch": 3433} {"train_loss": -6.779422283172607, "global_step": 144198, "epoch": 3433} {"train_loss": -6.865313529968262, "global_step": 144199, "epoch": 3433} {"train_loss": -6.740118026733398, "global_step": 144200, "epoch": 3433} {"train_loss": -6.703916072845459, "global_step": 144201, "epoch": 3433} {"train_loss": -6.772819995880127, "global_step": 144202, "epoch": 3433} {"train_loss": -6.712363243103027, "global_step": 144203, "epoch": 3433} {"train_loss": -6.86978816986084, "global_step": 144204, "epoch": 3433} {"train_loss": -6.761792182922363, "global_step": 144205, "epoch": 3433} {"train_loss": -6.790055274963379, "global_step": 144206, "epoch": 3433} {"train_loss": -6.82814359664917, "global_step": 144207, "epoch": 3433} {"train_loss": -6.870973587036133, "global_step": 144208, "epoch": 3433} {"train_loss": -6.722372055053711, "global_step": 144209, "epoch": 3433} {"train_loss": -6.79204797744751, "global_step": 144210, "epoch": 3433} {"train_loss": -6.8596673011779785, "global_step": 144211, "epoch": 3433} {"train_loss": -6.782590866088867, "global_step": 144212, "epoch": 3433} {"train_loss": -6.784153461456299, "global_step": 144213, "epoch": 3433} {"train_loss": -6.7889275550842285, "global_step": 144214, "epoch": 3433} {"train_loss": -6.845919609069824, "global_step": 144215, "epoch": 3433} {"train_loss": -6.748029708862305, "global_step": 144216, "epoch": 3433} {"train_loss": -6.900395393371582, "global_step": 144217, "epoch": 3433} {"train_loss": -6.707343578338623, "global_step": 144218, "epoch": 3433} {"train_loss": -6.722417831420898, "global_step": 144219, "epoch": 3433} {"train_loss": -6.791432857513428, "global_step": 144220, "epoch": 3433} {"train_loss": -6.792186737060547, "global_step": 144221, "epoch": 3433} {"train_loss": -6.762200355529785, "global_step": 144222, "epoch": 3433} {"train_loss": -6.688454627990723, "global_step": 144223, "epoch": 3433} {"train_loss": -6.768406391143799, "global_step": 144224, "epoch": 3433} {"train_loss": -6.849537372589111, "global_step": 144225, "epoch": 3433} {"train_loss": -6.713144302368164, "global_step": 144226, "epoch": 3433} {"train_loss": -6.795169932501657, "global_step": 144227, "epoch": 3433, "val_loss": 78516.46875} {"train_loss": -6.759540557861328, "global_step": 144228, "epoch": 3434} {"train_loss": -6.739758491516113, "global_step": 144229, "epoch": 3434} {"train_loss": -6.895328998565674, "global_step": 144230, "epoch": 3434} {"train_loss": -6.9437761306762695, "global_step": 144231, "epoch": 3434} {"train_loss": -6.846798419952393, "global_step": 144232, "epoch": 3434} {"train_loss": -6.6880412101745605, "global_step": 144233, "epoch": 3434} {"train_loss": -6.897637844085693, "global_step": 144234, "epoch": 3434} {"train_loss": -6.94612455368042, "global_step": 144235, "epoch": 3434} {"train_loss": -6.970381736755371, "global_step": 144236, "epoch": 3434} {"train_loss": -6.849762916564941, "global_step": 144237, "epoch": 3434} {"train_loss": -6.878780364990234, "global_step": 144238, "epoch": 3434} {"train_loss": -6.882369041442871, "global_step": 144239, "epoch": 3434} {"train_loss": -6.84898567199707, "global_step": 144240, "epoch": 3434} {"train_loss": -6.778785228729248, "global_step": 144241, "epoch": 3434} {"train_loss": -6.858188629150391, "global_step": 144242, "epoch": 3434} {"train_loss": -6.884871959686279, "global_step": 144243, "epoch": 3434} {"train_loss": -6.7559990882873535, "global_step": 144244, "epoch": 3434} {"train_loss": -6.823184967041016, "global_step": 144245, "epoch": 3434} {"train_loss": -6.825262069702148, "global_step": 144246, "epoch": 3434} {"train_loss": -6.757347583770752, "global_step": 144247, "epoch": 3434} {"train_loss": -6.769100189208984, "global_step": 144248, "epoch": 3434} {"train_loss": -6.897792816162109, "global_step": 144249, "epoch": 3434} {"train_loss": -6.8878583908081055, "global_step": 144250, "epoch": 3434} {"train_loss": -6.809330940246582, "global_step": 144251, "epoch": 3434} {"train_loss": -6.830360412597656, "global_step": 144252, "epoch": 3434} {"train_loss": -6.931890487670898, "global_step": 144253, "epoch": 3434} {"train_loss": -6.851792812347412, "global_step": 144254, "epoch": 3434} {"train_loss": -6.8148345947265625, "global_step": 144255, "epoch": 3434} {"train_loss": -6.787840366363525, "global_step": 144256, "epoch": 3434} {"train_loss": -6.829402923583984, "global_step": 144257, "epoch": 3434} {"train_loss": -6.840322971343994, "global_step": 144258, "epoch": 3434} {"train_loss": -6.85490608215332, "global_step": 144259, "epoch": 3434} {"train_loss": -6.86013126373291, "global_step": 144260, "epoch": 3434} {"train_loss": -6.881019592285156, "global_step": 144261, "epoch": 3434} {"train_loss": -6.903063774108887, "global_step": 144262, "epoch": 3434} {"train_loss": -6.882384300231934, "global_step": 144263, "epoch": 3434} {"train_loss": -6.720223426818848, "global_step": 144264, "epoch": 3434} {"train_loss": -6.963907241821289, "global_step": 144265, "epoch": 3434} {"train_loss": -6.711419105529785, "global_step": 144266, "epoch": 3434} {"train_loss": -6.739049911499023, "global_step": 144267, "epoch": 3434} {"train_loss": -6.906515121459961, "global_step": 144268, "epoch": 3434} {"train_loss": -6.841743219466436, "global_step": 144269, "epoch": 3434, "val_loss": 78298.3828125} {"train_loss": -6.865539073944092, "global_step": 144270, "epoch": 3435} {"train_loss": -6.814340591430664, "global_step": 144271, "epoch": 3435} {"train_loss": -6.781782150268555, "global_step": 144272, "epoch": 3435} {"train_loss": -6.851090908050537, "global_step": 144273, "epoch": 3435} {"train_loss": -6.971529483795166, "global_step": 144274, "epoch": 3435} {"train_loss": -6.852693557739258, "global_step": 144275, "epoch": 3435} {"train_loss": -6.815896987915039, "global_step": 144276, "epoch": 3435} {"train_loss": -6.731917381286621, "global_step": 144277, "epoch": 3435} {"train_loss": -6.782826900482178, "global_step": 144278, "epoch": 3435} {"train_loss": -6.761590480804443, "global_step": 144279, "epoch": 3435} {"train_loss": -6.841657638549805, "global_step": 144280, "epoch": 3435} {"train_loss": -6.816218376159668, "global_step": 144281, "epoch": 3435} {"train_loss": -6.835956573486328, "global_step": 144282, "epoch": 3435} {"train_loss": -6.721199989318848, "global_step": 144283, "epoch": 3435} {"train_loss": -6.813019275665283, "global_step": 144284, "epoch": 3435} {"train_loss": -6.814325332641602, "global_step": 144285, "epoch": 3435} {"train_loss": -6.578921318054199, "global_step": 144286, "epoch": 3435} {"train_loss": -6.921975135803223, "global_step": 144287, "epoch": 3435} {"train_loss": -6.947782516479492, "global_step": 144288, "epoch": 3435} {"train_loss": -6.879117965698242, "global_step": 144289, "epoch": 3435} {"train_loss": -6.769463539123535, "global_step": 144290, "epoch": 3435} {"train_loss": -6.749851226806641, "global_step": 144291, "epoch": 3435} {"train_loss": -6.791539669036865, "global_step": 144292, "epoch": 3435} {"train_loss": -6.779850006103516, "global_step": 144293, "epoch": 3435} {"train_loss": -6.715064525604248, "global_step": 144294, "epoch": 3435} {"train_loss": -6.745198726654053, "global_step": 144295, "epoch": 3435} {"train_loss": -6.733406066894531, "global_step": 144296, "epoch": 3435} {"train_loss": -6.681468486785889, "global_step": 144297, "epoch": 3435} {"train_loss": -6.780466556549072, "global_step": 144298, "epoch": 3435} {"train_loss": -6.760357856750488, "global_step": 144299, "epoch": 3435} {"train_loss": -6.724947452545166, "global_step": 144300, "epoch": 3435} {"train_loss": -6.75700569152832, "global_step": 144301, "epoch": 3435} {"train_loss": -6.704173564910889, "global_step": 144302, "epoch": 3435} {"train_loss": -6.716195106506348, "global_step": 144303, "epoch": 3435} {"train_loss": -6.832671642303467, "global_step": 144304, "epoch": 3435} {"train_loss": -6.814927101135254, "global_step": 144305, "epoch": 3435} {"train_loss": -6.8471455574035645, "global_step": 144306, "epoch": 3435} {"train_loss": -6.797567367553711, "global_step": 144307, "epoch": 3435} {"train_loss": -6.8534650802612305, "global_step": 144308, "epoch": 3435} {"train_loss": -6.769565105438232, "global_step": 144309, "epoch": 3435} {"train_loss": -6.79853630065918, "global_step": 144310, "epoch": 3435} {"train_loss": -6.792723065330868, "global_step": 144311, "epoch": 3435, "val_loss": 78445.65625} {"train_loss": -6.771126747131348, "global_step": 144312, "epoch": 3436} {"train_loss": -6.720597267150879, "global_step": 144313, "epoch": 3436} {"train_loss": -6.820026397705078, "global_step": 144314, "epoch": 3436} {"train_loss": -6.736565589904785, "global_step": 144315, "epoch": 3436} {"train_loss": -6.78706169128418, "global_step": 144316, "epoch": 3436} {"train_loss": -6.879190444946289, "global_step": 144317, "epoch": 3436} {"train_loss": -6.74794864654541, "global_step": 144318, "epoch": 3436} {"train_loss": -6.828334808349609, "global_step": 144319, "epoch": 3436} {"train_loss": -6.775428295135498, "global_step": 144320, "epoch": 3436} {"train_loss": -6.818473815917969, "global_step": 144321, "epoch": 3436} {"train_loss": -6.842371463775635, "global_step": 144322, "epoch": 3436} {"train_loss": -6.849615573883057, "global_step": 144323, "epoch": 3436} {"train_loss": -6.788103103637695, "global_step": 144324, "epoch": 3436} {"train_loss": -6.939544200897217, "global_step": 144325, "epoch": 3436} {"train_loss": -6.851489543914795, "global_step": 144326, "epoch": 3436} {"train_loss": -6.911403179168701, "global_step": 144327, "epoch": 3436} {"train_loss": -6.779560089111328, "global_step": 144328, "epoch": 3436} {"train_loss": -6.851089000701904, "global_step": 144329, "epoch": 3436} {"train_loss": -6.787755012512207, "global_step": 144330, "epoch": 3436} {"train_loss": -6.876850128173828, "global_step": 144331, "epoch": 3436} {"train_loss": -6.796497344970703, "global_step": 144332, "epoch": 3436} {"train_loss": -6.816897392272949, "global_step": 144333, "epoch": 3436} {"train_loss": -6.785799026489258, "global_step": 144334, "epoch": 3436} {"train_loss": -6.828723907470703, "global_step": 144335, "epoch": 3436} {"train_loss": -6.816693305969238, "global_step": 144336, "epoch": 3436} {"train_loss": -6.838120937347412, "global_step": 144337, "epoch": 3436} {"train_loss": -6.810524940490723, "global_step": 144338, "epoch": 3436} {"train_loss": -6.752224445343018, "global_step": 144339, "epoch": 3436} {"train_loss": -6.844768524169922, "global_step": 144340, "epoch": 3436} {"train_loss": -6.774907112121582, "global_step": 144341, "epoch": 3436} {"train_loss": -6.749361515045166, "global_step": 144342, "epoch": 3436} {"train_loss": -6.794975280761719, "global_step": 144343, "epoch": 3436} {"train_loss": -6.868427276611328, "global_step": 144344, "epoch": 3436} {"train_loss": -6.766456604003906, "global_step": 144345, "epoch": 3436} {"train_loss": -6.768982887268066, "global_step": 144346, "epoch": 3436} {"train_loss": -6.82745361328125, "global_step": 144347, "epoch": 3436} {"train_loss": -6.77401876449585, "global_step": 144348, "epoch": 3436} {"train_loss": -6.806358337402344, "global_step": 144349, "epoch": 3436} {"train_loss": -6.782288074493408, "global_step": 144350, "epoch": 3436} {"train_loss": -6.686468124389648, "global_step": 144351, "epoch": 3436} {"train_loss": -6.830475807189941, "global_step": 144352, "epoch": 3436} {"train_loss": -6.806600831803822, "global_step": 144353, "epoch": 3436, "val_loss": 78459.265625} {"train_loss": -6.800727844238281, "global_step": 144354, "epoch": 3437} {"train_loss": -6.776412010192871, "global_step": 144355, "epoch": 3437} {"train_loss": -6.942314147949219, "global_step": 144356, "epoch": 3437} {"train_loss": -6.850664138793945, "global_step": 144357, "epoch": 3437} {"train_loss": -6.69032096862793, "global_step": 144358, "epoch": 3437} {"train_loss": -6.645449161529541, "global_step": 144359, "epoch": 3437} {"train_loss": -6.774294853210449, "global_step": 144360, "epoch": 3437} {"train_loss": -6.9108147621154785, "global_step": 144361, "epoch": 3437} {"train_loss": -6.689454078674316, "global_step": 144362, "epoch": 3437} {"train_loss": -6.855774402618408, "global_step": 144363, "epoch": 3437} {"train_loss": -6.8203535079956055, "global_step": 144364, "epoch": 3437} {"train_loss": -6.7758989334106445, "global_step": 144365, "epoch": 3437} {"train_loss": -6.880751609802246, "global_step": 144366, "epoch": 3437} {"train_loss": -6.800582408905029, "global_step": 144367, "epoch": 3437} {"train_loss": -6.795596122741699, "global_step": 144368, "epoch": 3437} {"train_loss": -6.763860702514648, "global_step": 144369, "epoch": 3437} {"train_loss": -6.9000091552734375, "global_step": 144370, "epoch": 3437} {"train_loss": -6.814335823059082, "global_step": 144371, "epoch": 3437} {"train_loss": -6.754254341125488, "global_step": 144372, "epoch": 3437} {"train_loss": -6.891352653503418, "global_step": 144373, "epoch": 3437} {"train_loss": -6.96547794342041, "global_step": 144374, "epoch": 3437} {"train_loss": -6.887612819671631, "global_step": 144375, "epoch": 3437} {"train_loss": -6.943118095397949, "global_step": 144376, "epoch": 3437} {"train_loss": -6.768190383911133, "global_step": 144377, "epoch": 3437} {"train_loss": -6.768293380737305, "global_step": 144378, "epoch": 3437} {"train_loss": -6.849203586578369, "global_step": 144379, "epoch": 3437} {"train_loss": -6.847697734832764, "global_step": 144380, "epoch": 3437} {"train_loss": -6.795635223388672, "global_step": 144381, "epoch": 3437} {"train_loss": -6.814844131469727, "global_step": 144382, "epoch": 3437} {"train_loss": -6.9170050621032715, "global_step": 144383, "epoch": 3437} {"train_loss": -6.83579158782959, "global_step": 144384, "epoch": 3437} {"train_loss": -6.862357139587402, "global_step": 144385, "epoch": 3437} {"train_loss": -6.806416988372803, "global_step": 144386, "epoch": 3437} {"train_loss": -6.7820725440979, "global_step": 144387, "epoch": 3437} {"train_loss": -6.852926254272461, "global_step": 144388, "epoch": 3437} {"train_loss": -6.9237565994262695, "global_step": 144389, "epoch": 3437} {"train_loss": -6.91710090637207, "global_step": 144390, "epoch": 3437} {"train_loss": -6.830150127410889, "global_step": 144391, "epoch": 3437} {"train_loss": -6.810533046722412, "global_step": 144392, "epoch": 3437} {"train_loss": -6.822369575500488, "global_step": 144393, "epoch": 3437} {"train_loss": -6.755607604980469, "global_step": 144394, "epoch": 3437} {"train_loss": -6.824465604055495, "global_step": 144395, "epoch": 3437, "val_loss": 78232.359375} {"train_loss": -6.840242385864258, "global_step": 144396, "epoch": 3438} {"train_loss": -6.8121337890625, "global_step": 144397, "epoch": 3438} {"train_loss": -6.711781978607178, "global_step": 144398, "epoch": 3438} {"train_loss": -6.889285087585449, "global_step": 144399, "epoch": 3438} {"train_loss": -6.881665229797363, "global_step": 144400, "epoch": 3438} {"train_loss": -6.766040802001953, "global_step": 144401, "epoch": 3438} {"train_loss": -6.865339756011963, "global_step": 144402, "epoch": 3438} {"train_loss": -6.667180061340332, "global_step": 144403, "epoch": 3438} {"train_loss": -6.790470123291016, "global_step": 144404, "epoch": 3438} {"train_loss": -6.858600616455078, "global_step": 144405, "epoch": 3438} {"train_loss": -6.643008232116699, "global_step": 144406, "epoch": 3438} {"train_loss": -6.761981010437012, "global_step": 144407, "epoch": 3438} {"train_loss": -6.8042497634887695, "global_step": 144408, "epoch": 3438} {"train_loss": -6.831420421600342, "global_step": 144409, "epoch": 3438} {"train_loss": -6.802934169769287, "global_step": 144410, "epoch": 3438} {"train_loss": -6.683127403259277, "global_step": 144411, "epoch": 3438} {"train_loss": -6.727542400360107, "global_step": 144412, "epoch": 3438} {"train_loss": -6.935084342956543, "global_step": 144413, "epoch": 3438} {"train_loss": -6.738523006439209, "global_step": 144414, "epoch": 3438} {"train_loss": -6.8814239501953125, "global_step": 144415, "epoch": 3438} {"train_loss": -6.715417861938477, "global_step": 144416, "epoch": 3438} {"train_loss": -6.85390567779541, "global_step": 144417, "epoch": 3438} {"train_loss": -6.864108562469482, "global_step": 144418, "epoch": 3438} {"train_loss": -6.799878120422363, "global_step": 144419, "epoch": 3438} {"train_loss": -6.8458404541015625, "global_step": 144420, "epoch": 3438} {"train_loss": -6.718575477600098, "global_step": 144421, "epoch": 3438} {"train_loss": -6.697007179260254, "global_step": 144422, "epoch": 3438} {"train_loss": -6.888639450073242, "global_step": 144423, "epoch": 3438} {"train_loss": -6.703334808349609, "global_step": 144424, "epoch": 3438} {"train_loss": -6.728389263153076, "global_step": 144425, "epoch": 3438} {"train_loss": -6.605228424072266, "global_step": 144426, "epoch": 3438} {"train_loss": -6.712265968322754, "global_step": 144427, "epoch": 3438} {"train_loss": -6.74299430847168, "global_step": 144428, "epoch": 3438} {"train_loss": -6.672362327575684, "global_step": 144429, "epoch": 3438} {"train_loss": -6.81303071975708, "global_step": 144430, "epoch": 3438} {"train_loss": -6.767927169799805, "global_step": 144431, "epoch": 3438} {"train_loss": -6.772412300109863, "global_step": 144432, "epoch": 3438} {"train_loss": -6.6916351318359375, "global_step": 144433, "epoch": 3438} {"train_loss": -6.737919807434082, "global_step": 144434, "epoch": 3438} {"train_loss": -6.835997104644775, "global_step": 144435, "epoch": 3438} {"train_loss": -6.7078399658203125, "global_step": 144436, "epoch": 3438} {"train_loss": -6.7726723693666, "global_step": 144437, "epoch": 3438, "val_loss": 78226.375} {"train_loss": -6.875504016876221, "global_step": 144438, "epoch": 3439} {"train_loss": -6.691656112670898, "global_step": 144439, "epoch": 3439} {"train_loss": -6.854766845703125, "global_step": 144440, "epoch": 3439} {"train_loss": -6.832256317138672, "global_step": 144441, "epoch": 3439} {"train_loss": -6.7995147705078125, "global_step": 144442, "epoch": 3439} {"train_loss": -6.8413405418396, "global_step": 144443, "epoch": 3439} {"train_loss": -6.790167808532715, "global_step": 144444, "epoch": 3439} {"train_loss": -6.812007904052734, "global_step": 144445, "epoch": 3439} {"train_loss": -6.681882858276367, "global_step": 144446, "epoch": 3439} {"train_loss": -6.754695892333984, "global_step": 144447, "epoch": 3439} {"train_loss": -6.685735702514648, "global_step": 144448, "epoch": 3439} {"train_loss": -6.842668533325195, "global_step": 144449, "epoch": 3439} {"train_loss": -6.691068649291992, "global_step": 144450, "epoch": 3439} {"train_loss": -6.915098190307617, "global_step": 144451, "epoch": 3439} {"train_loss": -6.801241397857666, "global_step": 144452, "epoch": 3439} {"train_loss": -6.880495071411133, "global_step": 144453, "epoch": 3439} {"train_loss": -6.904115676879883, "global_step": 144454, "epoch": 3439} {"train_loss": -6.842362403869629, "global_step": 144455, "epoch": 3439} {"train_loss": -6.842689514160156, "global_step": 144456, "epoch": 3439} {"train_loss": -6.844829559326172, "global_step": 144457, "epoch": 3439} {"train_loss": -6.744326591491699, "global_step": 144458, "epoch": 3439} {"train_loss": -6.83507776260376, "global_step": 144459, "epoch": 3439} {"train_loss": -6.808825492858887, "global_step": 144460, "epoch": 3439} {"train_loss": -6.6259918212890625, "global_step": 144461, "epoch": 3439} {"train_loss": -6.780523300170898, "global_step": 144462, "epoch": 3439} {"train_loss": -6.702159881591797, "global_step": 144463, "epoch": 3439} {"train_loss": -6.752221584320068, "global_step": 144464, "epoch": 3439} {"train_loss": -6.759738445281982, "global_step": 144465, "epoch": 3439} {"train_loss": -6.725370407104492, "global_step": 144466, "epoch": 3439} {"train_loss": -6.635770797729492, "global_step": 144467, "epoch": 3439} {"train_loss": -6.924324989318848, "global_step": 144468, "epoch": 3439} {"train_loss": -6.709244251251221, "global_step": 144469, "epoch": 3439} {"train_loss": -6.869943141937256, "global_step": 144470, "epoch": 3439} {"train_loss": -6.7966413497924805, "global_step": 144471, "epoch": 3439} {"train_loss": -6.800721168518066, "global_step": 144472, "epoch": 3439} {"train_loss": -6.683300971984863, "global_step": 144473, "epoch": 3439} {"train_loss": -6.758073806762695, "global_step": 144474, "epoch": 3439} {"train_loss": -6.850323677062988, "global_step": 144475, "epoch": 3439} {"train_loss": -6.630645275115967, "global_step": 144476, "epoch": 3439} {"train_loss": -6.694123268127441, "global_step": 144477, "epoch": 3439} {"train_loss": -6.794338703155518, "global_step": 144478, "epoch": 3439} {"train_loss": -6.780610016414097, "global_step": 144479, "epoch": 3439, "val_loss": 78364.9765625} {"train_loss": -6.807529449462891, "global_step": 144480, "epoch": 3440} {"train_loss": -6.815793991088867, "global_step": 144481, "epoch": 3440} {"train_loss": -6.7532958984375, "global_step": 144482, "epoch": 3440} {"train_loss": -6.805784225463867, "global_step": 144483, "epoch": 3440} {"train_loss": -6.817352294921875, "global_step": 144484, "epoch": 3440} {"train_loss": -6.817046165466309, "global_step": 144485, "epoch": 3440} {"train_loss": -6.770360469818115, "global_step": 144486, "epoch": 3440} {"train_loss": -6.812292098999023, "global_step": 144487, "epoch": 3440} {"train_loss": -6.9348673820495605, "global_step": 144488, "epoch": 3440} {"train_loss": -6.878852844238281, "global_step": 144489, "epoch": 3440} {"train_loss": -6.807860374450684, "global_step": 144490, "epoch": 3440} {"train_loss": -6.80845832824707, "global_step": 144491, "epoch": 3440} {"train_loss": -6.839640140533447, "global_step": 144492, "epoch": 3440} {"train_loss": -6.818920612335205, "global_step": 144493, "epoch": 3440} {"train_loss": -6.834793567657471, "global_step": 144494, "epoch": 3440} {"train_loss": -6.877066612243652, "global_step": 144495, "epoch": 3440} {"train_loss": -6.860963821411133, "global_step": 144496, "epoch": 3440} {"train_loss": -6.899364471435547, "global_step": 144497, "epoch": 3440} {"train_loss": -6.836479187011719, "global_step": 144498, "epoch": 3440} {"train_loss": -6.820540428161621, "global_step": 144499, "epoch": 3440} {"train_loss": -6.902552127838135, "global_step": 144500, "epoch": 3440} {"train_loss": -6.901254653930664, "global_step": 144501, "epoch": 3440} {"train_loss": -6.8345232009887695, "global_step": 144502, "epoch": 3440} {"train_loss": -6.82397985458374, "global_step": 144503, "epoch": 3440} {"train_loss": -6.823551177978516, "global_step": 144504, "epoch": 3440} {"train_loss": -6.7861175537109375, "global_step": 144505, "epoch": 3440} {"train_loss": -6.8246541023254395, "global_step": 144506, "epoch": 3440} {"train_loss": -6.844651222229004, "global_step": 144507, "epoch": 3440} {"train_loss": -6.900343894958496, "global_step": 144508, "epoch": 3440} {"train_loss": -6.816073417663574, "global_step": 144509, "epoch": 3440} {"train_loss": -6.792845726013184, "global_step": 144510, "epoch": 3440} {"train_loss": -6.839794158935547, "global_step": 144511, "epoch": 3440} {"train_loss": -6.770871162414551, "global_step": 144512, "epoch": 3440} {"train_loss": -6.837508201599121, "global_step": 144513, "epoch": 3440} {"train_loss": -6.850330829620361, "global_step": 144514, "epoch": 3440} {"train_loss": -6.779637336730957, "global_step": 144515, "epoch": 3440} {"train_loss": -6.8672075271606445, "global_step": 144516, "epoch": 3440} {"train_loss": -6.791262626647949, "global_step": 144517, "epoch": 3440} {"train_loss": -6.865566253662109, "global_step": 144518, "epoch": 3440} {"train_loss": -6.890540599822998, "global_step": 144519, "epoch": 3440} {"train_loss": -6.777853965759277, "global_step": 144520, "epoch": 3440} {"train_loss": -6.834749721345448, "global_step": 144521, "epoch": 3440, "val_loss": 78307.453125} {"train_loss": -6.8976030349731445, "global_step": 144522, "epoch": 3441} {"train_loss": -6.90751838684082, "global_step": 144523, "epoch": 3441} {"train_loss": -6.8952956199646, "global_step": 144524, "epoch": 3441} {"train_loss": -6.888428211212158, "global_step": 144525, "epoch": 3441} {"train_loss": -6.902843952178955, "global_step": 144526, "epoch": 3441} {"train_loss": -6.958822250366211, "global_step": 144527, "epoch": 3441} {"train_loss": -6.9564361572265625, "global_step": 144528, "epoch": 3441} {"train_loss": -6.852919578552246, "global_step": 144529, "epoch": 3441} {"train_loss": -6.8665852546691895, "global_step": 144530, "epoch": 3441} {"train_loss": -6.849642276763916, "global_step": 144531, "epoch": 3441} {"train_loss": -6.84318733215332, "global_step": 144532, "epoch": 3441} {"train_loss": -6.7942304611206055, "global_step": 144533, "epoch": 3441} {"train_loss": -6.73172664642334, "global_step": 144534, "epoch": 3441} {"train_loss": -6.904685974121094, "global_step": 144535, "epoch": 3441} {"train_loss": -6.89895486831665, "global_step": 144536, "epoch": 3441} {"train_loss": -6.833463191986084, "global_step": 144537, "epoch": 3441} {"train_loss": -6.858386039733887, "global_step": 144538, "epoch": 3441} {"train_loss": -6.838000297546387, "global_step": 144539, "epoch": 3441} {"train_loss": -6.926080226898193, "global_step": 144540, "epoch": 3441} {"train_loss": -6.79757022857666, "global_step": 144541, "epoch": 3441} {"train_loss": -6.7926106452941895, "global_step": 144542, "epoch": 3441} {"train_loss": -6.829845905303955, "global_step": 144543, "epoch": 3441} {"train_loss": -6.83137321472168, "global_step": 144544, "epoch": 3441} {"train_loss": -6.946197509765625, "global_step": 144545, "epoch": 3441} {"train_loss": -6.793035984039307, "global_step": 144546, "epoch": 3441} {"train_loss": -6.784558296203613, "global_step": 144547, "epoch": 3441} {"train_loss": -6.827392578125, "global_step": 144548, "epoch": 3441} {"train_loss": -6.824312210083008, "global_step": 144549, "epoch": 3441} {"train_loss": -6.645024299621582, "global_step": 144550, "epoch": 3441} {"train_loss": -6.742228031158447, "global_step": 144551, "epoch": 3441} {"train_loss": -6.914655685424805, "global_step": 144552, "epoch": 3441} {"train_loss": -6.786333084106445, "global_step": 144553, "epoch": 3441} {"train_loss": -6.738507270812988, "global_step": 144554, "epoch": 3441} {"train_loss": -6.79295539855957, "global_step": 144555, "epoch": 3441} {"train_loss": -6.8026556968688965, "global_step": 144556, "epoch": 3441} {"train_loss": -6.711006164550781, "global_step": 144557, "epoch": 3441} {"train_loss": -6.884866237640381, "global_step": 144558, "epoch": 3441} {"train_loss": -6.910590171813965, "global_step": 144559, "epoch": 3441} {"train_loss": -6.865134239196777, "global_step": 144560, "epoch": 3441} {"train_loss": -6.748772621154785, "global_step": 144561, "epoch": 3441} {"train_loss": -6.887269973754883, "global_step": 144562, "epoch": 3441} {"train_loss": -6.838739554087321, "global_step": 144563, "epoch": 3441, "val_loss": 78525.390625} {"train_loss": -6.920641899108887, "global_step": 144564, "epoch": 3442} {"train_loss": -6.832798004150391, "global_step": 144565, "epoch": 3442} {"train_loss": -6.876835823059082, "global_step": 144566, "epoch": 3442} {"train_loss": -6.8940653800964355, "global_step": 144567, "epoch": 3442} {"train_loss": -6.855042457580566, "global_step": 144568, "epoch": 3442} {"train_loss": -6.768815040588379, "global_step": 144569, "epoch": 3442} {"train_loss": -6.824110507965088, "global_step": 144570, "epoch": 3442} {"train_loss": -6.845672607421875, "global_step": 144571, "epoch": 3442} {"train_loss": -6.79859733581543, "global_step": 144572, "epoch": 3442} {"train_loss": -6.928653240203857, "global_step": 144573, "epoch": 3442} {"train_loss": -6.874789237976074, "global_step": 144574, "epoch": 3442} {"train_loss": -6.801589012145996, "global_step": 144575, "epoch": 3442} {"train_loss": -6.895738124847412, "global_step": 144576, "epoch": 3442} {"train_loss": -6.748080253601074, "global_step": 144577, "epoch": 3442} {"train_loss": -6.7547383308410645, "global_step": 144578, "epoch": 3442} {"train_loss": -6.852343559265137, "global_step": 144579, "epoch": 3442} {"train_loss": -6.844073295593262, "global_step": 144580, "epoch": 3442} {"train_loss": -6.83059024810791, "global_step": 144581, "epoch": 3442} {"train_loss": -6.805663108825684, "global_step": 144582, "epoch": 3442} {"train_loss": -6.749448299407959, "global_step": 144583, "epoch": 3442} {"train_loss": -6.8268513679504395, "global_step": 144584, "epoch": 3442} {"train_loss": -6.867257118225098, "global_step": 144585, "epoch": 3442} {"train_loss": -6.734780311584473, "global_step": 144586, "epoch": 3442} {"train_loss": -6.771418571472168, "global_step": 144587, "epoch": 3442} {"train_loss": -6.6843061447143555, "global_step": 144588, "epoch": 3442} {"train_loss": -6.631709098815918, "global_step": 144589, "epoch": 3442} {"train_loss": -6.808527946472168, "global_step": 144590, "epoch": 3442} {"train_loss": -6.898610591888428, "global_step": 144591, "epoch": 3442} {"train_loss": -6.813274383544922, "global_step": 144592, "epoch": 3442} {"train_loss": -6.780790328979492, "global_step": 144593, "epoch": 3442} {"train_loss": -6.859711647033691, "global_step": 144594, "epoch": 3442} {"train_loss": -6.788848876953125, "global_step": 144595, "epoch": 3442} {"train_loss": -6.854133605957031, "global_step": 144596, "epoch": 3442} {"train_loss": -6.782471656799316, "global_step": 144597, "epoch": 3442} {"train_loss": -6.802285194396973, "global_step": 144598, "epoch": 3442} {"train_loss": -6.757717132568359, "global_step": 144599, "epoch": 3442} {"train_loss": -6.891750812530518, "global_step": 144600, "epoch": 3442} {"train_loss": -6.910189628601074, "global_step": 144601, "epoch": 3442} {"train_loss": -6.824893951416016, "global_step": 144602, "epoch": 3442} {"train_loss": -6.906731605529785, "global_step": 144603, "epoch": 3442} {"train_loss": -6.798624515533447, "global_step": 144604, "epoch": 3442} {"train_loss": -6.820964926765079, "global_step": 144605, "epoch": 3442, "val_loss": 78555.828125} {"train_loss": -6.8313140869140625, "global_step": 144606, "epoch": 3443} {"train_loss": -6.858279705047607, "global_step": 144607, "epoch": 3443} {"train_loss": -6.754278659820557, "global_step": 144608, "epoch": 3443} {"train_loss": -6.910544395446777, "global_step": 144609, "epoch": 3443} {"train_loss": -6.791306495666504, "global_step": 144610, "epoch": 3443} {"train_loss": -6.948577880859375, "global_step": 144611, "epoch": 3443} {"train_loss": -6.826845169067383, "global_step": 144612, "epoch": 3443} {"train_loss": -6.850275993347168, "global_step": 144613, "epoch": 3443} {"train_loss": -6.9489898681640625, "global_step": 144614, "epoch": 3443} {"train_loss": -6.8286638259887695, "global_step": 144615, "epoch": 3443} {"train_loss": -6.85257625579834, "global_step": 144616, "epoch": 3443} {"train_loss": -6.811192512512207, "global_step": 144617, "epoch": 3443} {"train_loss": -6.752985954284668, "global_step": 144618, "epoch": 3443} {"train_loss": -6.809932708740234, "global_step": 144619, "epoch": 3443} {"train_loss": -6.6768388748168945, "global_step": 144620, "epoch": 3443} {"train_loss": -6.687078952789307, "global_step": 144621, "epoch": 3443} {"train_loss": -6.788999557495117, "global_step": 144622, "epoch": 3443} {"train_loss": -6.779624938964844, "global_step": 144623, "epoch": 3443} {"train_loss": -6.828523635864258, "global_step": 144624, "epoch": 3443} {"train_loss": -6.919558048248291, "global_step": 144625, "epoch": 3443} {"train_loss": -6.732898712158203, "global_step": 144626, "epoch": 3443} {"train_loss": -6.860257148742676, "global_step": 144627, "epoch": 3443} {"train_loss": -6.81947135925293, "global_step": 144628, "epoch": 3443} {"train_loss": -6.964618682861328, "global_step": 144629, "epoch": 3443} {"train_loss": -6.91500186920166, "global_step": 144630, "epoch": 3443} {"train_loss": -6.832789421081543, "global_step": 144631, "epoch": 3443} {"train_loss": -6.756039619445801, "global_step": 144632, "epoch": 3443} {"train_loss": -6.770705699920654, "global_step": 144633, "epoch": 3443} {"train_loss": -6.916179656982422, "global_step": 144634, "epoch": 3443} {"train_loss": -6.797271251678467, "global_step": 144635, "epoch": 3443} {"train_loss": -6.9045844078063965, "global_step": 144636, "epoch": 3443} {"train_loss": -6.76837682723999, "global_step": 144637, "epoch": 3443} {"train_loss": -6.849916458129883, "global_step": 144638, "epoch": 3443} {"train_loss": -6.790208339691162, "global_step": 144639, "epoch": 3443} {"train_loss": -6.860164642333984, "global_step": 144640, "epoch": 3443} {"train_loss": -6.8391804695129395, "global_step": 144641, "epoch": 3443} {"train_loss": -6.844292640686035, "global_step": 144642, "epoch": 3443} {"train_loss": -6.924545764923096, "global_step": 144643, "epoch": 3443} {"train_loss": -6.78409481048584, "global_step": 144644, "epoch": 3443} {"train_loss": -6.775343418121338, "global_step": 144645, "epoch": 3443} {"train_loss": -6.8756103515625, "global_step": 144646, "epoch": 3443} {"train_loss": -6.831521477018084, "global_step": 144647, "epoch": 3443, "val_loss": 78535.140625} {"train_loss": -6.801405906677246, "global_step": 144648, "epoch": 3444} {"train_loss": -6.9705586433410645, "global_step": 144649, "epoch": 3444} {"train_loss": -6.8540425300598145, "global_step": 144650, "epoch": 3444} {"train_loss": -6.838313102722168, "global_step": 144651, "epoch": 3444} {"train_loss": -6.89822244644165, "global_step": 144652, "epoch": 3444} {"train_loss": -6.855846405029297, "global_step": 144653, "epoch": 3444} {"train_loss": -6.847905158996582, "global_step": 144654, "epoch": 3444} {"train_loss": -6.873080730438232, "global_step": 144655, "epoch": 3444} {"train_loss": -6.812325477600098, "global_step": 144656, "epoch": 3444} {"train_loss": -6.775607109069824, "global_step": 144657, "epoch": 3444} {"train_loss": -6.826259136199951, "global_step": 144658, "epoch": 3444} {"train_loss": -6.8325653076171875, "global_step": 144659, "epoch": 3444} {"train_loss": -6.90544319152832, "global_step": 144660, "epoch": 3444} {"train_loss": -6.792359352111816, "global_step": 144661, "epoch": 3444} {"train_loss": -6.807736873626709, "global_step": 144662, "epoch": 3444} {"train_loss": -6.842695713043213, "global_step": 144663, "epoch": 3444} {"train_loss": -6.854381084442139, "global_step": 144664, "epoch": 3444} {"train_loss": -6.845739364624023, "global_step": 144665, "epoch": 3444} {"train_loss": -6.906421661376953, "global_step": 144666, "epoch": 3444} {"train_loss": -6.94349479675293, "global_step": 144667, "epoch": 3444} {"train_loss": -6.759371280670166, "global_step": 144668, "epoch": 3444} {"train_loss": -6.818122863769531, "global_step": 144669, "epoch": 3444} {"train_loss": -6.737645626068115, "global_step": 144670, "epoch": 3444} {"train_loss": -6.646364212036133, "global_step": 144671, "epoch": 3444} {"train_loss": -6.791386604309082, "global_step": 144672, "epoch": 3444} {"train_loss": -6.743081092834473, "global_step": 144673, "epoch": 3444} {"train_loss": -6.78075647354126, "global_step": 144674, "epoch": 3444} {"train_loss": -6.685969352722168, "global_step": 144675, "epoch": 3444} {"train_loss": -6.7434563636779785, "global_step": 144676, "epoch": 3444} {"train_loss": -6.869699954986572, "global_step": 144677, "epoch": 3444} {"train_loss": -6.845317363739014, "global_step": 144678, "epoch": 3444} {"train_loss": -6.699461936950684, "global_step": 144679, "epoch": 3444} {"train_loss": -6.837447166442871, "global_step": 144680, "epoch": 3444} {"train_loss": -6.8602399826049805, "global_step": 144681, "epoch": 3444} {"train_loss": -6.717038154602051, "global_step": 144682, "epoch": 3444} {"train_loss": -6.855391502380371, "global_step": 144683, "epoch": 3444} {"train_loss": -6.579148292541504, "global_step": 144684, "epoch": 3444} {"train_loss": -6.792453765869141, "global_step": 144685, "epoch": 3444} {"train_loss": -6.801525592803955, "global_step": 144686, "epoch": 3444} {"train_loss": -6.727376937866211, "global_step": 144687, "epoch": 3444} {"train_loss": -6.898346424102783, "global_step": 144688, "epoch": 3444} {"train_loss": -6.810177814392817, "global_step": 144689, "epoch": 3444, "val_loss": 78837.6875} {"train_loss": -6.7331953048706055, "global_step": 144690, "epoch": 3445} {"train_loss": -6.743413925170898, "global_step": 144691, "epoch": 3445} {"train_loss": -6.819784164428711, "global_step": 144692, "epoch": 3445} {"train_loss": -6.684592247009277, "global_step": 144693, "epoch": 3445} {"train_loss": -6.736625671386719, "global_step": 144694, "epoch": 3445} {"train_loss": -6.781224250793457, "global_step": 144695, "epoch": 3445} {"train_loss": -6.712269306182861, "global_step": 144696, "epoch": 3445} {"train_loss": -6.717368125915527, "global_step": 144697, "epoch": 3445} {"train_loss": -6.790246486663818, "global_step": 144698, "epoch": 3445} {"train_loss": -6.760547161102295, "global_step": 144699, "epoch": 3445} {"train_loss": -6.872138977050781, "global_step": 144700, "epoch": 3445} {"train_loss": -6.73355770111084, "global_step": 144701, "epoch": 3445} {"train_loss": -6.687686443328857, "global_step": 144702, "epoch": 3445} {"train_loss": -6.901384353637695, "global_step": 144703, "epoch": 3445} {"train_loss": -6.803010940551758, "global_step": 144704, "epoch": 3445} {"train_loss": -6.638751029968262, "global_step": 144705, "epoch": 3445} {"train_loss": -6.748353004455566, "global_step": 144706, "epoch": 3445} {"train_loss": -6.9116950035095215, "global_step": 144707, "epoch": 3445} {"train_loss": -6.807314872741699, "global_step": 144708, "epoch": 3445} {"train_loss": -6.897915840148926, "global_step": 144709, "epoch": 3445} {"train_loss": -6.859623908996582, "global_step": 144710, "epoch": 3445} {"train_loss": -6.865461349487305, "global_step": 144711, "epoch": 3445} {"train_loss": -6.891528129577637, "global_step": 144712, "epoch": 3445} {"train_loss": -6.866264343261719, "global_step": 144713, "epoch": 3445} {"train_loss": -6.920090675354004, "global_step": 144714, "epoch": 3445} {"train_loss": -6.752190589904785, "global_step": 144715, "epoch": 3445} {"train_loss": -6.779275894165039, "global_step": 144716, "epoch": 3445} {"train_loss": -6.74077033996582, "global_step": 144717, "epoch": 3445} {"train_loss": -6.714729309082031, "global_step": 144718, "epoch": 3445} {"train_loss": -6.703183174133301, "global_step": 144719, "epoch": 3445} {"train_loss": -6.859861850738525, "global_step": 144720, "epoch": 3445} {"train_loss": -6.720243453979492, "global_step": 144721, "epoch": 3445} {"train_loss": -6.791721820831299, "global_step": 144722, "epoch": 3445} {"train_loss": -6.853374481201172, "global_step": 144723, "epoch": 3445} {"train_loss": -6.759387016296387, "global_step": 144724, "epoch": 3445} {"train_loss": -6.836484909057617, "global_step": 144725, "epoch": 3445} {"train_loss": -6.750176906585693, "global_step": 144726, "epoch": 3445} {"train_loss": -6.7849602699279785, "global_step": 144727, "epoch": 3445} {"train_loss": -6.81782341003418, "global_step": 144728, "epoch": 3445} {"train_loss": -6.703145980834961, "global_step": 144729, "epoch": 3445} {"train_loss": -6.7491607666015625, "global_step": 144730, "epoch": 3445} {"train_loss": -6.785938864662533, "global_step": 144731, "epoch": 3445, "val_loss": 78329.65625} {"train_loss": -6.806769371032715, "global_step": 144732, "epoch": 3446} {"train_loss": -6.81096076965332, "global_step": 144733, "epoch": 3446} {"train_loss": -6.789222717285156, "global_step": 144734, "epoch": 3446} {"train_loss": -6.811502456665039, "global_step": 144735, "epoch": 3446} {"train_loss": -6.815521240234375, "global_step": 144736, "epoch": 3446} {"train_loss": -6.890973091125488, "global_step": 144737, "epoch": 3446} {"train_loss": -6.780930042266846, "global_step": 144738, "epoch": 3446} {"train_loss": -6.849257469177246, "global_step": 144739, "epoch": 3446} {"train_loss": -6.908447742462158, "global_step": 144740, "epoch": 3446} {"train_loss": -6.84318208694458, "global_step": 144741, "epoch": 3446} {"train_loss": -6.798202991485596, "global_step": 144742, "epoch": 3446} {"train_loss": -6.768991470336914, "global_step": 144743, "epoch": 3446} {"train_loss": -6.854257106781006, "global_step": 144744, "epoch": 3446} {"train_loss": -6.9208574295043945, "global_step": 144745, "epoch": 3446} {"train_loss": -6.845297813415527, "global_step": 144746, "epoch": 3446} {"train_loss": -6.794766902923584, "global_step": 144747, "epoch": 3446} {"train_loss": -6.919545650482178, "global_step": 144748, "epoch": 3446} {"train_loss": -6.774855613708496, "global_step": 144749, "epoch": 3446} {"train_loss": -6.813600063323975, "global_step": 144750, "epoch": 3446} {"train_loss": -6.750087738037109, "global_step": 144751, "epoch": 3446} {"train_loss": -6.862694263458252, "global_step": 144752, "epoch": 3446} {"train_loss": -6.75251579284668, "global_step": 144753, "epoch": 3446} {"train_loss": -6.905240058898926, "global_step": 144754, "epoch": 3446} {"train_loss": -6.8955769538879395, "global_step": 144755, "epoch": 3446} {"train_loss": -6.782209873199463, "global_step": 144756, "epoch": 3446} {"train_loss": -6.839566230773926, "global_step": 144757, "epoch": 3446} {"train_loss": -6.774425506591797, "global_step": 144758, "epoch": 3446} {"train_loss": -6.808147430419922, "global_step": 144759, "epoch": 3446} {"train_loss": -6.914716720581055, "global_step": 144760, "epoch": 3446} {"train_loss": -6.876755714416504, "global_step": 144761, "epoch": 3446} {"train_loss": -6.683076858520508, "global_step": 144762, "epoch": 3446} {"train_loss": -6.824667930603027, "global_step": 144763, "epoch": 3446} {"train_loss": -6.856904983520508, "global_step": 144764, "epoch": 3446} {"train_loss": -6.767375469207764, "global_step": 144765, "epoch": 3446} {"train_loss": -6.781526565551758, "global_step": 144766, "epoch": 3446} {"train_loss": -6.733304977416992, "global_step": 144767, "epoch": 3446} {"train_loss": -6.776943206787109, "global_step": 144768, "epoch": 3446} {"train_loss": -6.7610673904418945, "global_step": 144769, "epoch": 3446} {"train_loss": -6.75834846496582, "global_step": 144770, "epoch": 3446} {"train_loss": -6.785771369934082, "global_step": 144771, "epoch": 3446} {"train_loss": -6.733578205108643, "global_step": 144772, "epoch": 3446} {"train_loss": -6.814144055048625, "global_step": 144773, "epoch": 3446, "val_loss": 78540.0625} {"train_loss": -6.7790422439575195, "global_step": 144774, "epoch": 3447} {"train_loss": -6.793684959411621, "global_step": 144775, "epoch": 3447} {"train_loss": -6.75985050201416, "global_step": 144776, "epoch": 3447} {"train_loss": -6.79852819442749, "global_step": 144777, "epoch": 3447} {"train_loss": -6.939394950866699, "global_step": 144778, "epoch": 3447} {"train_loss": -6.82814884185791, "global_step": 144779, "epoch": 3447} {"train_loss": -6.835727691650391, "global_step": 144780, "epoch": 3447} {"train_loss": -6.707518577575684, "global_step": 144781, "epoch": 3447} {"train_loss": -6.908342361450195, "global_step": 144782, "epoch": 3447} {"train_loss": -6.793093681335449, "global_step": 144783, "epoch": 3447} {"train_loss": -6.815428733825684, "global_step": 144784, "epoch": 3447} {"train_loss": -6.871197700500488, "global_step": 144785, "epoch": 3447} {"train_loss": -6.791473865509033, "global_step": 144786, "epoch": 3447} {"train_loss": -6.786365509033203, "global_step": 144787, "epoch": 3447} {"train_loss": -6.776318550109863, "global_step": 144788, "epoch": 3447} {"train_loss": -6.841861248016357, "global_step": 144789, "epoch": 3447} {"train_loss": -6.947134017944336, "global_step": 144790, "epoch": 3447} {"train_loss": -6.853980541229248, "global_step": 144791, "epoch": 3447} {"train_loss": -6.913512706756592, "global_step": 144792, "epoch": 3447} {"train_loss": -6.951814651489258, "global_step": 144793, "epoch": 3447} {"train_loss": -6.857515335083008, "global_step": 144794, "epoch": 3447} {"train_loss": -6.872717380523682, "global_step": 144795, "epoch": 3447} {"train_loss": -6.762843608856201, "global_step": 144796, "epoch": 3447} {"train_loss": -6.738447189331055, "global_step": 144797, "epoch": 3447} {"train_loss": -6.771869659423828, "global_step": 144798, "epoch": 3447} {"train_loss": -6.809506893157959, "global_step": 144799, "epoch": 3447} {"train_loss": -6.791623592376709, "global_step": 144800, "epoch": 3447} {"train_loss": -6.841918468475342, "global_step": 144801, "epoch": 3447} {"train_loss": -6.890685081481934, "global_step": 144802, "epoch": 3447} {"train_loss": -6.786421775817871, "global_step": 144803, "epoch": 3447} {"train_loss": -6.874612808227539, "global_step": 144804, "epoch": 3447} {"train_loss": -6.772562026977539, "global_step": 144805, "epoch": 3447} {"train_loss": -6.861088275909424, "global_step": 144806, "epoch": 3447} {"train_loss": -6.839453220367432, "global_step": 144807, "epoch": 3447} {"train_loss": -6.797503471374512, "global_step": 144808, "epoch": 3447} {"train_loss": -6.751653671264648, "global_step": 144809, "epoch": 3447} {"train_loss": -6.776450157165527, "global_step": 144810, "epoch": 3447} {"train_loss": -6.658246040344238, "global_step": 144811, "epoch": 3447} {"train_loss": -6.854706287384033, "global_step": 144812, "epoch": 3447} {"train_loss": -6.803402900695801, "global_step": 144813, "epoch": 3447} {"train_loss": -6.7835798263549805, "global_step": 144814, "epoch": 3447} {"train_loss": -6.8176862966446645, "global_step": 144815, "epoch": 3447, "val_loss": 78297.609375} {"train_loss": -6.868691444396973, "global_step": 144816, "epoch": 3448} {"train_loss": -6.794844627380371, "global_step": 144817, "epoch": 3448} {"train_loss": -6.709212779998779, "global_step": 144818, "epoch": 3448} {"train_loss": -6.8304548263549805, "global_step": 144819, "epoch": 3448} {"train_loss": -6.81862735748291, "global_step": 144820, "epoch": 3448} {"train_loss": -6.873442649841309, "global_step": 144821, "epoch": 3448} {"train_loss": -6.7465009689331055, "global_step": 144822, "epoch": 3448} {"train_loss": -6.781510353088379, "global_step": 144823, "epoch": 3448} {"train_loss": -6.807121276855469, "global_step": 144824, "epoch": 3448} {"train_loss": -6.789436340332031, "global_step": 144825, "epoch": 3448} {"train_loss": -6.732828140258789, "global_step": 144826, "epoch": 3448} {"train_loss": -6.963663578033447, "global_step": 144827, "epoch": 3448} {"train_loss": -6.817968368530273, "global_step": 144828, "epoch": 3448} {"train_loss": -6.72541618347168, "global_step": 144829, "epoch": 3448} {"train_loss": -6.787876129150391, "global_step": 144830, "epoch": 3448} {"train_loss": -6.7831315994262695, "global_step": 144831, "epoch": 3448} {"train_loss": -6.850680351257324, "global_step": 144832, "epoch": 3448} {"train_loss": -6.8621392250061035, "global_step": 144833, "epoch": 3448} {"train_loss": -6.838775634765625, "global_step": 144834, "epoch": 3448} {"train_loss": -6.66215705871582, "global_step": 144835, "epoch": 3448} {"train_loss": -6.8796067237854, "global_step": 144836, "epoch": 3448} {"train_loss": -6.863941669464111, "global_step": 144837, "epoch": 3448} {"train_loss": -6.7581024169921875, "global_step": 144838, "epoch": 3448} {"train_loss": -6.844396591186523, "global_step": 144839, "epoch": 3448} {"train_loss": -6.871922492980957, "global_step": 144840, "epoch": 3448} {"train_loss": -6.834489822387695, "global_step": 144841, "epoch": 3448} {"train_loss": -6.798433303833008, "global_step": 144842, "epoch": 3448} {"train_loss": -6.893336296081543, "global_step": 144843, "epoch": 3448} {"train_loss": -6.886188507080078, "global_step": 144844, "epoch": 3448} {"train_loss": -6.919356822967529, "global_step": 144845, "epoch": 3448} {"train_loss": -6.817234039306641, "global_step": 144846, "epoch": 3448} {"train_loss": -6.781301975250244, "global_step": 144847, "epoch": 3448} {"train_loss": -6.858281135559082, "global_step": 144848, "epoch": 3448} {"train_loss": -6.815356254577637, "global_step": 144849, "epoch": 3448} {"train_loss": -6.848437309265137, "global_step": 144850, "epoch": 3448} {"train_loss": -6.865861415863037, "global_step": 144851, "epoch": 3448} {"train_loss": -6.937544822692871, "global_step": 144852, "epoch": 3448} {"train_loss": -6.89459753036499, "global_step": 144853, "epoch": 3448} {"train_loss": -6.787227630615234, "global_step": 144854, "epoch": 3448} {"train_loss": -6.757227897644043, "global_step": 144855, "epoch": 3448} {"train_loss": -6.877447128295898, "global_step": 144856, "epoch": 3448} {"train_loss": -6.821838242667062, "global_step": 144857, "epoch": 3448, "val_loss": 78595.0859375} {"train_loss": -6.833399772644043, "global_step": 144858, "epoch": 3449} {"train_loss": -6.8975067138671875, "global_step": 144859, "epoch": 3449} {"train_loss": -6.763532638549805, "global_step": 144860, "epoch": 3449} {"train_loss": -6.91939640045166, "global_step": 144861, "epoch": 3449} {"train_loss": -6.77092170715332, "global_step": 144862, "epoch": 3449} {"train_loss": -6.910276889801025, "global_step": 144863, "epoch": 3449} {"train_loss": -6.728794574737549, "global_step": 144864, "epoch": 3449} {"train_loss": -6.791184902191162, "global_step": 144865, "epoch": 3449} {"train_loss": -6.757280349731445, "global_step": 144866, "epoch": 3449} {"train_loss": -6.819692134857178, "global_step": 144867, "epoch": 3449} {"train_loss": -6.772561073303223, "global_step": 144868, "epoch": 3449} {"train_loss": -6.891654968261719, "global_step": 144869, "epoch": 3449} {"train_loss": -6.85007905960083, "global_step": 144870, "epoch": 3449} {"train_loss": -6.800571441650391, "global_step": 144871, "epoch": 3449} {"train_loss": -6.856184959411621, "global_step": 144872, "epoch": 3449} {"train_loss": -6.796018600463867, "global_step": 144873, "epoch": 3449} {"train_loss": -6.814668655395508, "global_step": 144874, "epoch": 3449} {"train_loss": -6.81026554107666, "global_step": 144875, "epoch": 3449} {"train_loss": -6.804671287536621, "global_step": 144876, "epoch": 3449} {"train_loss": -6.701432228088379, "global_step": 144877, "epoch": 3449} {"train_loss": -6.820254802703857, "global_step": 144878, "epoch": 3449} {"train_loss": -6.732946395874023, "global_step": 144879, "epoch": 3449} {"train_loss": -6.692580223083496, "global_step": 144880, "epoch": 3449} {"train_loss": -6.645717620849609, "global_step": 144881, "epoch": 3449} {"train_loss": -6.8052873611450195, "global_step": 144882, "epoch": 3449} {"train_loss": -6.838313102722168, "global_step": 144883, "epoch": 3449} {"train_loss": -6.867837905883789, "global_step": 144884, "epoch": 3449} {"train_loss": -6.699166297912598, "global_step": 144885, "epoch": 3449} {"train_loss": -6.865815162658691, "global_step": 144886, "epoch": 3449} {"train_loss": -6.7717485427856445, "global_step": 144887, "epoch": 3449} {"train_loss": -6.8094563484191895, "global_step": 144888, "epoch": 3449} {"train_loss": -6.802408695220947, "global_step": 144889, "epoch": 3449} {"train_loss": -6.773200035095215, "global_step": 144890, "epoch": 3449} {"train_loss": -6.923795700073242, "global_step": 144891, "epoch": 3449} {"train_loss": -6.856448173522949, "global_step": 144892, "epoch": 3449} {"train_loss": -6.888647079467773, "global_step": 144893, "epoch": 3449} {"train_loss": -7.012660980224609, "global_step": 144894, "epoch": 3449} {"train_loss": -6.761123180389404, "global_step": 144895, "epoch": 3449} {"train_loss": -6.82589054107666, "global_step": 144896, "epoch": 3449} {"train_loss": -6.789438724517822, "global_step": 144897, "epoch": 3449} {"train_loss": -6.798325061798096, "global_step": 144898, "epoch": 3449} {"train_loss": -6.81411135764349, "global_step": 144899, "epoch": 3449, "val_loss": 78340.9609375} {"train_loss": -6.924118518829346, "global_step": 144900, "epoch": 3450} {"train_loss": -6.741268157958984, "global_step": 144901, "epoch": 3450} {"train_loss": -6.668572425842285, "global_step": 144902, "epoch": 3450} {"train_loss": -6.8095574378967285, "global_step": 144903, "epoch": 3450} {"train_loss": -6.844666481018066, "global_step": 144904, "epoch": 3450} {"train_loss": -6.704977989196777, "global_step": 144905, "epoch": 3450} {"train_loss": -6.7844743728637695, "global_step": 144906, "epoch": 3450} {"train_loss": -6.772066116333008, "global_step": 144907, "epoch": 3450} {"train_loss": -6.659405708312988, "global_step": 144908, "epoch": 3450} {"train_loss": -6.745217323303223, "global_step": 144909, "epoch": 3450} {"train_loss": -6.753746032714844, "global_step": 144910, "epoch": 3450} {"train_loss": -6.555332183837891, "global_step": 144911, "epoch": 3450} {"train_loss": -6.877413749694824, "global_step": 144912, "epoch": 3450} {"train_loss": -6.708661079406738, "global_step": 144913, "epoch": 3450} {"train_loss": -6.873065948486328, "global_step": 144914, "epoch": 3450} {"train_loss": -6.976147651672363, "global_step": 144915, "epoch": 3450} {"train_loss": -6.627703666687012, "global_step": 144916, "epoch": 3450} {"train_loss": -6.7450666427612305, "global_step": 144917, "epoch": 3450} {"train_loss": -6.79231071472168, "global_step": 144918, "epoch": 3450} {"train_loss": -6.801619529724121, "global_step": 144919, "epoch": 3450} {"train_loss": -6.781111717224121, "global_step": 144920, "epoch": 3450} {"train_loss": -6.742892265319824, "global_step": 144921, "epoch": 3450} {"train_loss": -6.7997026443481445, "global_step": 144922, "epoch": 3450} {"train_loss": -6.8557820320129395, "global_step": 144923, "epoch": 3450} {"train_loss": -6.6527485847473145, "global_step": 144924, "epoch": 3450} {"train_loss": -6.575173377990723, "global_step": 144925, "epoch": 3450} {"train_loss": -6.696898460388184, "global_step": 144926, "epoch": 3450} {"train_loss": -6.758131504058838, "global_step": 144927, "epoch": 3450} {"train_loss": -6.630980491638184, "global_step": 144928, "epoch": 3450} {"train_loss": -6.788384437561035, "global_step": 144929, "epoch": 3450} {"train_loss": -6.69624137878418, "global_step": 144930, "epoch": 3450} {"train_loss": -6.7206807136535645, "global_step": 144931, "epoch": 3450} {"train_loss": -6.842233180999756, "global_step": 144932, "epoch": 3450} {"train_loss": -6.773347854614258, "global_step": 144933, "epoch": 3450} {"train_loss": -6.758383750915527, "global_step": 144934, "epoch": 3450} {"train_loss": -6.832468032836914, "global_step": 144935, "epoch": 3450} {"train_loss": -6.780186653137207, "global_step": 144936, "epoch": 3450} {"train_loss": -6.853973388671875, "global_step": 144937, "epoch": 3450} {"train_loss": -6.834702491760254, "global_step": 144938, "epoch": 3450} {"train_loss": -6.682187557220459, "global_step": 144939, "epoch": 3450} {"train_loss": -6.810192108154297, "global_step": 144940, "epoch": 3450} {"train_loss": -6.7602156684512185, "global_step": 144941, "epoch": 3450, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.8965380317488869, "train/sim_max_reward_2": 0.45383378545387376, "train/sim_max_reward_3": 0.13721363816874038, "train/sim_max_reward_4": 0.8651235959277043, "train/sim_max_reward_5": 0.8382655695958976, "test/sim_max_reward_4500000": 0.8616413764853311, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.7578887137147536, "test/sim_max_reward_4500003": 0.7809719145947236, "test/sim_max_reward_4500004": 0.23342191743326238, "test/sim_max_reward_4500005": 0.2831198463859101, "test/sim_max_reward_4500006": 0.972431576808049, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.08078581171344833, "test/sim_max_reward_4500009": 0.05352859588002659, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9890461446255117, "test/sim_max_reward_4500012": 0.9002030116493, "test/sim_max_reward_4500013": 0.003300843805836914, "test/sim_max_reward_4500014": 0.3803356908198748, "test/sim_max_reward_4500015": 0.8984578983958413, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.19858084428673803, "test/sim_max_reward_4500018": 0.9725842812451807, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9612405634940507, "test/sim_max_reward_4500022": 0.9650838280176611, "test/sim_max_reward_4500023": 0.5822893801298646, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9554936440511959, "test/sim_max_reward_4500026": 0.9595421976183856, "test/sim_max_reward_4500027": 0.9116509910504943, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.07853609857753395, "test/sim_max_reward_4500030": 0.9743726155827455, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.01446172420974913, "test/sim_max_reward_4500034": 0.9935005842824897, "test/sim_max_reward_4500035": 0.7360508933687004, "test/sim_max_reward_4500036": 0.46888635803278167, "test/sim_max_reward_4500037": 0.9910567686956343, "test/sim_max_reward_4500038": 0.9660280729509734, "test/sim_max_reward_4500039": 0.0, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.9391617607328103, "test/sim_max_reward_4500042": 0.0319524501494338, "test/sim_max_reward_4500043": 0.19616232289987565, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.821715688859444, "test/sim_max_reward_4500046": 0.2195593852190503, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 0.9826691272655659, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5635453529168591, "test/mean_score": 0.5157070261512878, "val_loss": 78675.9765625} {"train_loss": -6.861359596252441, "global_step": 144942, "epoch": 3451} {"train_loss": -6.6889872550964355, "global_step": 144943, "epoch": 3451} {"train_loss": -6.8513288497924805, "global_step": 144944, "epoch": 3451} {"train_loss": -6.906308174133301, "global_step": 144945, "epoch": 3451} {"train_loss": -6.721583366394043, "global_step": 144946, "epoch": 3451} {"train_loss": -6.763376712799072, "global_step": 144947, "epoch": 3451} {"train_loss": -6.772955894470215, "global_step": 144948, "epoch": 3451} {"train_loss": -6.870363712310791, "global_step": 144949, "epoch": 3451} {"train_loss": -6.7698588371276855, "global_step": 144950, "epoch": 3451} {"train_loss": -6.688650131225586, "global_step": 144951, "epoch": 3451} {"train_loss": -6.816926956176758, "global_step": 144952, "epoch": 3451} {"train_loss": -6.848552227020264, "global_step": 144953, "epoch": 3451} {"train_loss": -6.755825519561768, "global_step": 144954, "epoch": 3451} {"train_loss": -6.936966896057129, "global_step": 144955, "epoch": 3451} {"train_loss": -6.8315839767456055, "global_step": 144956, "epoch": 3451} {"train_loss": -6.901275634765625, "global_step": 144957, "epoch": 3451} {"train_loss": -6.8822021484375, "global_step": 144958, "epoch": 3451} {"train_loss": -6.826918601989746, "global_step": 144959, "epoch": 3451} {"train_loss": -6.845522403717041, "global_step": 144960, "epoch": 3451} {"train_loss": -6.719651222229004, "global_step": 144961, "epoch": 3451} {"train_loss": -6.863630294799805, "global_step": 144962, "epoch": 3451} {"train_loss": -6.8044281005859375, "global_step": 144963, "epoch": 3451} {"train_loss": -6.7516374588012695, "global_step": 144964, "epoch": 3451} {"train_loss": -6.765429973602295, "global_step": 144965, "epoch": 3451} {"train_loss": -6.821136951446533, "global_step": 144966, "epoch": 3451} {"train_loss": -6.87135124206543, "global_step": 144967, "epoch": 3451} {"train_loss": -6.8011474609375, "global_step": 144968, "epoch": 3451} {"train_loss": -6.606739044189453, "global_step": 144969, "epoch": 3451} {"train_loss": -6.786874294281006, "global_step": 144970, "epoch": 3451} {"train_loss": -6.765288829803467, "global_step": 144971, "epoch": 3451} {"train_loss": -6.642512321472168, "global_step": 144972, "epoch": 3451} {"train_loss": -6.70569372177124, "global_step": 144973, "epoch": 3451} {"train_loss": -6.777941703796387, "global_step": 144974, "epoch": 3451} {"train_loss": -6.578622817993164, "global_step": 144975, "epoch": 3451} {"train_loss": -6.771482467651367, "global_step": 144976, "epoch": 3451} {"train_loss": -6.729153633117676, "global_step": 144977, "epoch": 3451} {"train_loss": -6.631230354309082, "global_step": 144978, "epoch": 3451} {"train_loss": -6.82491397857666, "global_step": 144979, "epoch": 3451} {"train_loss": -6.645161151885986, "global_step": 144980, "epoch": 3451} {"train_loss": -6.6970062255859375, "global_step": 144981, "epoch": 3451} {"train_loss": -6.753750801086426, "global_step": 144982, "epoch": 3451} {"train_loss": -6.7748911153702505, "global_step": 144983, "epoch": 3451, "val_loss": 78384.40625} {"train_loss": -6.813594818115234, "global_step": 144984, "epoch": 3452} {"train_loss": -6.775750160217285, "global_step": 144985, "epoch": 3452} {"train_loss": -6.742759704589844, "global_step": 144986, "epoch": 3452} {"train_loss": -6.693288803100586, "global_step": 144987, "epoch": 3452} {"train_loss": -6.877103328704834, "global_step": 144988, "epoch": 3452} {"train_loss": -6.70721435546875, "global_step": 144989, "epoch": 3452} {"train_loss": -6.846464157104492, "global_step": 144990, "epoch": 3452} {"train_loss": -6.808298110961914, "global_step": 144991, "epoch": 3452} {"train_loss": -6.770144462585449, "global_step": 144992, "epoch": 3452} {"train_loss": -6.799943923950195, "global_step": 144993, "epoch": 3452} {"train_loss": -6.766493797302246, "global_step": 144994, "epoch": 3452} {"train_loss": -6.768708229064941, "global_step": 144995, "epoch": 3452} {"train_loss": -6.72905158996582, "global_step": 144996, "epoch": 3452} {"train_loss": -6.636859893798828, "global_step": 144997, "epoch": 3452} {"train_loss": -6.703988075256348, "global_step": 144998, "epoch": 3452} {"train_loss": -6.985069751739502, "global_step": 144999, "epoch": 3452} {"train_loss": -6.761993408203125, "global_step": 145000, "epoch": 3452} {"train_loss": -6.804849624633789, "global_step": 145001, "epoch": 3452} {"train_loss": -6.774442672729492, "global_step": 145002, "epoch": 3452} {"train_loss": -6.891809463500977, "global_step": 145003, "epoch": 3452} {"train_loss": -6.7691650390625, "global_step": 145004, "epoch": 3452} {"train_loss": -6.923227310180664, "global_step": 145005, "epoch": 3452} {"train_loss": -6.9178900718688965, "global_step": 145006, "epoch": 3452} {"train_loss": -6.902549743652344, "global_step": 145007, "epoch": 3452} {"train_loss": -6.9006781578063965, "global_step": 145008, "epoch": 3452} {"train_loss": -6.88831901550293, "global_step": 145009, "epoch": 3452} {"train_loss": -6.871635437011719, "global_step": 145010, "epoch": 3452} {"train_loss": -6.926640033721924, "global_step": 145011, "epoch": 3452} {"train_loss": -6.874138832092285, "global_step": 145012, "epoch": 3452} {"train_loss": -6.892055034637451, "global_step": 145013, "epoch": 3452} {"train_loss": -6.77366828918457, "global_step": 145014, "epoch": 3452} {"train_loss": -6.836204528808594, "global_step": 145015, "epoch": 3452} {"train_loss": -6.850704193115234, "global_step": 145016, "epoch": 3452} {"train_loss": -6.897144317626953, "global_step": 145017, "epoch": 3452} {"train_loss": -6.7837419509887695, "global_step": 145018, "epoch": 3452} {"train_loss": -6.85447883605957, "global_step": 145019, "epoch": 3452} {"train_loss": -6.748070240020752, "global_step": 145020, "epoch": 3452} {"train_loss": -6.838253498077393, "global_step": 145021, "epoch": 3452} {"train_loss": -6.878496170043945, "global_step": 145022, "epoch": 3452} {"train_loss": -6.819404125213623, "global_step": 145023, "epoch": 3452} {"train_loss": -6.725527286529541, "global_step": 145024, "epoch": 3452} {"train_loss": -6.8194545450664705, "global_step": 145025, "epoch": 3452, "val_loss": 78276.5390625} {"train_loss": -6.807356357574463, "global_step": 145026, "epoch": 3453} {"train_loss": -7.03000545501709, "global_step": 145027, "epoch": 3453} {"train_loss": -6.783716201782227, "global_step": 145028, "epoch": 3453} {"train_loss": -6.80936336517334, "global_step": 145029, "epoch": 3453} {"train_loss": -6.738608360290527, "global_step": 145030, "epoch": 3453} {"train_loss": -6.81410026550293, "global_step": 145031, "epoch": 3453} {"train_loss": -6.811139106750488, "global_step": 145032, "epoch": 3453} {"train_loss": -6.859715461730957, "global_step": 145033, "epoch": 3453} {"train_loss": -6.804934978485107, "global_step": 145034, "epoch": 3453} {"train_loss": -6.9653120040893555, "global_step": 145035, "epoch": 3453} {"train_loss": -6.747862339019775, "global_step": 145036, "epoch": 3453} {"train_loss": -6.812984466552734, "global_step": 145037, "epoch": 3453} {"train_loss": -6.874368667602539, "global_step": 145038, "epoch": 3453} {"train_loss": -6.777309417724609, "global_step": 145039, "epoch": 3453} {"train_loss": -6.936410903930664, "global_step": 145040, "epoch": 3453} {"train_loss": -6.852329254150391, "global_step": 145041, "epoch": 3453} {"train_loss": -6.935290813446045, "global_step": 145042, "epoch": 3453} {"train_loss": -6.81807279586792, "global_step": 145043, "epoch": 3453} {"train_loss": -6.825072288513184, "global_step": 145044, "epoch": 3453} {"train_loss": -6.983355522155762, "global_step": 145045, "epoch": 3453} {"train_loss": -6.739816665649414, "global_step": 145046, "epoch": 3453} {"train_loss": -6.7710394859313965, "global_step": 145047, "epoch": 3453} {"train_loss": -6.918844223022461, "global_step": 145048, "epoch": 3453} {"train_loss": -6.944499969482422, "global_step": 145049, "epoch": 3453} {"train_loss": -6.795998573303223, "global_step": 145050, "epoch": 3453} {"train_loss": -6.907842636108398, "global_step": 145051, "epoch": 3453} {"train_loss": -6.849968910217285, "global_step": 145052, "epoch": 3453} {"train_loss": -6.851279258728027, "global_step": 145053, "epoch": 3453} {"train_loss": -6.793232440948486, "global_step": 145054, "epoch": 3453} {"train_loss": -6.81236457824707, "global_step": 145055, "epoch": 3453} {"train_loss": -6.9010725021362305, "global_step": 145056, "epoch": 3453} {"train_loss": -6.749398231506348, "global_step": 145057, "epoch": 3453} {"train_loss": -6.764928817749023, "global_step": 145058, "epoch": 3453} {"train_loss": -6.790592193603516, "global_step": 145059, "epoch": 3453} {"train_loss": -6.601970195770264, "global_step": 145060, "epoch": 3453} {"train_loss": -6.523192882537842, "global_step": 145061, "epoch": 3453} {"train_loss": -6.714140892028809, "global_step": 145062, "epoch": 3453} {"train_loss": -6.530526161193848, "global_step": 145063, "epoch": 3453} {"train_loss": -6.62758731842041, "global_step": 145064, "epoch": 3453} {"train_loss": -6.680879592895508, "global_step": 145065, "epoch": 3453} {"train_loss": -6.575212478637695, "global_step": 145066, "epoch": 3453} {"train_loss": -6.797468367077055, "global_step": 145067, "epoch": 3453, "val_loss": 79154.03125} {"train_loss": -6.460101127624512, "global_step": 145068, "epoch": 3454} {"train_loss": -6.618926048278809, "global_step": 145069, "epoch": 3454} {"train_loss": -6.4719133377075195, "global_step": 145070, "epoch": 3454} {"train_loss": -6.673219680786133, "global_step": 145071, "epoch": 3454} {"train_loss": -6.533561706542969, "global_step": 145072, "epoch": 3454} {"train_loss": -6.70435905456543, "global_step": 145073, "epoch": 3454} {"train_loss": -6.570969581604004, "global_step": 145074, "epoch": 3454} {"train_loss": -6.69413948059082, "global_step": 145075, "epoch": 3454} {"train_loss": -6.5669355392456055, "global_step": 145076, "epoch": 3454} {"train_loss": -6.630753040313721, "global_step": 145077, "epoch": 3454} {"train_loss": -6.651683807373047, "global_step": 145078, "epoch": 3454} {"train_loss": -6.537714004516602, "global_step": 145079, "epoch": 3454} {"train_loss": -6.600992202758789, "global_step": 145080, "epoch": 3454} {"train_loss": -6.546985626220703, "global_step": 145081, "epoch": 3454} {"train_loss": -6.689211845397949, "global_step": 145082, "epoch": 3454} {"train_loss": -6.523210525512695, "global_step": 145083, "epoch": 3454} {"train_loss": -6.676872253417969, "global_step": 145084, "epoch": 3454} {"train_loss": -6.6425957679748535, "global_step": 145085, "epoch": 3454} {"train_loss": -6.654544830322266, "global_step": 145086, "epoch": 3454} {"train_loss": -6.734675407409668, "global_step": 145087, "epoch": 3454} {"train_loss": -6.551093578338623, "global_step": 145088, "epoch": 3454} {"train_loss": -6.621518135070801, "global_step": 145089, "epoch": 3454} {"train_loss": -6.741522789001465, "global_step": 145090, "epoch": 3454} {"train_loss": -6.725834369659424, "global_step": 145091, "epoch": 3454} {"train_loss": -6.653347492218018, "global_step": 145092, "epoch": 3454} {"train_loss": -6.731542110443115, "global_step": 145093, "epoch": 3454} {"train_loss": -6.756158351898193, "global_step": 145094, "epoch": 3454} {"train_loss": -6.81348991394043, "global_step": 145095, "epoch": 3454} {"train_loss": -6.8150787353515625, "global_step": 145096, "epoch": 3454} {"train_loss": -6.773346424102783, "global_step": 145097, "epoch": 3454} {"train_loss": -6.8127899169921875, "global_step": 145098, "epoch": 3454} {"train_loss": -6.80380916595459, "global_step": 145099, "epoch": 3454} {"train_loss": -6.927642822265625, "global_step": 145100, "epoch": 3454} {"train_loss": -6.76445198059082, "global_step": 145101, "epoch": 3454} {"train_loss": -6.763658046722412, "global_step": 145102, "epoch": 3454} {"train_loss": -6.704980850219727, "global_step": 145103, "epoch": 3454} {"train_loss": -6.766942501068115, "global_step": 145104, "epoch": 3454} {"train_loss": -6.941652774810791, "global_step": 145105, "epoch": 3454} {"train_loss": -6.805424690246582, "global_step": 145106, "epoch": 3454} {"train_loss": -6.675868988037109, "global_step": 145107, "epoch": 3454} {"train_loss": -6.848541259765625, "global_step": 145108, "epoch": 3454} {"train_loss": -6.691571814673288, "global_step": 145109, "epoch": 3454, "val_loss": 78466.09375} {"train_loss": -6.879081726074219, "global_step": 145110, "epoch": 3455} {"train_loss": -6.703289985656738, "global_step": 145111, "epoch": 3455} {"train_loss": -6.813338279724121, "global_step": 145112, "epoch": 3455} {"train_loss": -6.769599914550781, "global_step": 145113, "epoch": 3455} {"train_loss": -6.707151889801025, "global_step": 145114, "epoch": 3455} {"train_loss": -6.858343124389648, "global_step": 145115, "epoch": 3455} {"train_loss": -6.721117973327637, "global_step": 145116, "epoch": 3455} {"train_loss": -6.810876846313477, "global_step": 145117, "epoch": 3455} {"train_loss": -6.858772277832031, "global_step": 145118, "epoch": 3455} {"train_loss": -6.890773773193359, "global_step": 145119, "epoch": 3455} {"train_loss": -6.843164920806885, "global_step": 145120, "epoch": 3455} {"train_loss": -6.693848609924316, "global_step": 145121, "epoch": 3455} {"train_loss": -6.719862937927246, "global_step": 145122, "epoch": 3455} {"train_loss": -6.800929546356201, "global_step": 145123, "epoch": 3455} {"train_loss": -6.817981719970703, "global_step": 145124, "epoch": 3455} {"train_loss": -6.760321617126465, "global_step": 145125, "epoch": 3455} {"train_loss": -6.7068681716918945, "global_step": 145126, "epoch": 3455} {"train_loss": -6.863251686096191, "global_step": 145127, "epoch": 3455} {"train_loss": -6.676515102386475, "global_step": 145128, "epoch": 3455} {"train_loss": -6.872390270233154, "global_step": 145129, "epoch": 3455} {"train_loss": -6.769875526428223, "global_step": 145130, "epoch": 3455} {"train_loss": -6.728964328765869, "global_step": 145131, "epoch": 3455} {"train_loss": -6.643877983093262, "global_step": 145132, "epoch": 3455} {"train_loss": -6.688671112060547, "global_step": 145133, "epoch": 3455} {"train_loss": -6.683587074279785, "global_step": 145134, "epoch": 3455} {"train_loss": -6.65977668762207, "global_step": 145135, "epoch": 3455} {"train_loss": -6.841116428375244, "global_step": 145136, "epoch": 3455} {"train_loss": -6.653475761413574, "global_step": 145137, "epoch": 3455} {"train_loss": -6.741333484649658, "global_step": 145138, "epoch": 3455} {"train_loss": -6.707291126251221, "global_step": 145139, "epoch": 3455} {"train_loss": -6.808505058288574, "global_step": 145140, "epoch": 3455} {"train_loss": -6.846673011779785, "global_step": 145141, "epoch": 3455} {"train_loss": -6.814425945281982, "global_step": 145142, "epoch": 3455} {"train_loss": -6.801530838012695, "global_step": 145143, "epoch": 3455} {"train_loss": -6.739243507385254, "global_step": 145144, "epoch": 3455} {"train_loss": -6.760200500488281, "global_step": 145145, "epoch": 3455} {"train_loss": -6.818697452545166, "global_step": 145146, "epoch": 3455} {"train_loss": -6.728543281555176, "global_step": 145147, "epoch": 3455} {"train_loss": -6.848971366882324, "global_step": 145148, "epoch": 3455} {"train_loss": -6.806331157684326, "global_step": 145149, "epoch": 3455} {"train_loss": -6.684928894042969, "global_step": 145150, "epoch": 3455} {"train_loss": -6.768539723895845, "global_step": 145151, "epoch": 3455, "val_loss": 78524.375} {"train_loss": -6.823910713195801, "global_step": 145152, "epoch": 3456} {"train_loss": -6.760903358459473, "global_step": 145153, "epoch": 3456} {"train_loss": -6.820691108703613, "global_step": 145154, "epoch": 3456} {"train_loss": -6.6538310050964355, "global_step": 145155, "epoch": 3456} {"train_loss": -6.758896827697754, "global_step": 145156, "epoch": 3456} {"train_loss": -6.780848503112793, "global_step": 145157, "epoch": 3456} {"train_loss": -6.676951885223389, "global_step": 145158, "epoch": 3456} {"train_loss": -6.801936149597168, "global_step": 145159, "epoch": 3456} {"train_loss": -6.847348213195801, "global_step": 145160, "epoch": 3456} {"train_loss": -6.763124465942383, "global_step": 145161, "epoch": 3456} {"train_loss": -6.744393348693848, "global_step": 145162, "epoch": 3456} {"train_loss": -6.843073844909668, "global_step": 145163, "epoch": 3456} {"train_loss": -6.802051067352295, "global_step": 145164, "epoch": 3456} {"train_loss": -6.815929889678955, "global_step": 145165, "epoch": 3456} {"train_loss": -6.905834197998047, "global_step": 145166, "epoch": 3456} {"train_loss": -6.858339786529541, "global_step": 145167, "epoch": 3456} {"train_loss": -6.814255714416504, "global_step": 145168, "epoch": 3456} {"train_loss": -6.775087356567383, "global_step": 145169, "epoch": 3456} {"train_loss": -6.790778160095215, "global_step": 145170, "epoch": 3456} {"train_loss": -6.821042060852051, "global_step": 145171, "epoch": 3456} {"train_loss": -6.822161674499512, "global_step": 145172, "epoch": 3456} {"train_loss": -6.877859592437744, "global_step": 145173, "epoch": 3456} {"train_loss": -6.822846412658691, "global_step": 145174, "epoch": 3456} {"train_loss": -6.731941223144531, "global_step": 145175, "epoch": 3456} {"train_loss": -6.886789798736572, "global_step": 145176, "epoch": 3456} {"train_loss": -6.810868263244629, "global_step": 145177, "epoch": 3456} {"train_loss": -6.79534912109375, "global_step": 145178, "epoch": 3456} {"train_loss": -6.998692989349365, "global_step": 145179, "epoch": 3456} {"train_loss": -6.733219146728516, "global_step": 145180, "epoch": 3456} {"train_loss": -6.790363788604736, "global_step": 145181, "epoch": 3456} {"train_loss": -6.716826438903809, "global_step": 145182, "epoch": 3456} {"train_loss": -6.824562072753906, "global_step": 145183, "epoch": 3456} {"train_loss": -6.868226051330566, "global_step": 145184, "epoch": 3456} {"train_loss": -6.711265563964844, "global_step": 145185, "epoch": 3456} {"train_loss": -6.7523932456970215, "global_step": 145186, "epoch": 3456} {"train_loss": -6.822474956512451, "global_step": 145187, "epoch": 3456} {"train_loss": -6.689400672912598, "global_step": 145188, "epoch": 3456} {"train_loss": -6.676337242126465, "global_step": 145189, "epoch": 3456} {"train_loss": -6.893415451049805, "global_step": 145190, "epoch": 3456} {"train_loss": -6.794030666351318, "global_step": 145191, "epoch": 3456} {"train_loss": -6.804014205932617, "global_step": 145192, "epoch": 3456} {"train_loss": -6.79517776625497, "global_step": 145193, "epoch": 3456, "val_loss": 78405.953125} {"train_loss": -6.74937629699707, "global_step": 145194, "epoch": 3457} {"train_loss": -6.7849907875061035, "global_step": 145195, "epoch": 3457} {"train_loss": -6.816620826721191, "global_step": 145196, "epoch": 3457} {"train_loss": -6.84965705871582, "global_step": 145197, "epoch": 3457} {"train_loss": -6.845276832580566, "global_step": 145198, "epoch": 3457} {"train_loss": -6.77597713470459, "global_step": 145199, "epoch": 3457} {"train_loss": -6.783686637878418, "global_step": 145200, "epoch": 3457} {"train_loss": -6.7843194007873535, "global_step": 145201, "epoch": 3457} {"train_loss": -6.864589691162109, "global_step": 145202, "epoch": 3457} {"train_loss": -6.876497268676758, "global_step": 145203, "epoch": 3457} {"train_loss": -6.803931713104248, "global_step": 145204, "epoch": 3457} {"train_loss": -6.884636878967285, "global_step": 145205, "epoch": 3457} {"train_loss": -6.759487152099609, "global_step": 145206, "epoch": 3457} {"train_loss": -6.822871208190918, "global_step": 145207, "epoch": 3457} {"train_loss": -6.859374523162842, "global_step": 145208, "epoch": 3457} {"train_loss": -6.8864946365356445, "global_step": 145209, "epoch": 3457} {"train_loss": -6.846583366394043, "global_step": 145210, "epoch": 3457} {"train_loss": -6.954373836517334, "global_step": 145211, "epoch": 3457} {"train_loss": -6.754036903381348, "global_step": 145212, "epoch": 3457} {"train_loss": -6.77863883972168, "global_step": 145213, "epoch": 3457} {"train_loss": -6.85813570022583, "global_step": 145214, "epoch": 3457} {"train_loss": -6.810334205627441, "global_step": 145215, "epoch": 3457} {"train_loss": -6.802210807800293, "global_step": 145216, "epoch": 3457} {"train_loss": -6.798664093017578, "global_step": 145217, "epoch": 3457} {"train_loss": -6.8262481689453125, "global_step": 145218, "epoch": 3457} {"train_loss": -6.823795318603516, "global_step": 145219, "epoch": 3457} {"train_loss": -6.887636184692383, "global_step": 145220, "epoch": 3457} {"train_loss": -6.949106693267822, "global_step": 145221, "epoch": 3457} {"train_loss": -6.8886847496032715, "global_step": 145222, "epoch": 3457} {"train_loss": -6.887752532958984, "global_step": 145223, "epoch": 3457} {"train_loss": -6.7957329750061035, "global_step": 145224, "epoch": 3457} {"train_loss": -6.925455570220947, "global_step": 145225, "epoch": 3457} {"train_loss": -6.811387062072754, "global_step": 145226, "epoch": 3457} {"train_loss": -6.874960899353027, "global_step": 145227, "epoch": 3457} {"train_loss": -6.758284568786621, "global_step": 145228, "epoch": 3457} {"train_loss": -6.883119583129883, "global_step": 145229, "epoch": 3457} {"train_loss": -6.916919231414795, "global_step": 145230, "epoch": 3457} {"train_loss": -6.919547080993652, "global_step": 145231, "epoch": 3457} {"train_loss": -6.758838653564453, "global_step": 145232, "epoch": 3457} {"train_loss": -6.889968395233154, "global_step": 145233, "epoch": 3457} {"train_loss": -6.95956563949585, "global_step": 145234, "epoch": 3457} {"train_loss": -6.842078401928856, "global_step": 145235, "epoch": 3457, "val_loss": 78333.1484375} {"train_loss": -6.814774513244629, "global_step": 145236, "epoch": 3458} {"train_loss": -6.960663318634033, "global_step": 145237, "epoch": 3458} {"train_loss": -6.936132431030273, "global_step": 145238, "epoch": 3458} {"train_loss": -6.89106559753418, "global_step": 145239, "epoch": 3458} {"train_loss": -6.907268047332764, "global_step": 145240, "epoch": 3458} {"train_loss": -6.892470836639404, "global_step": 145241, "epoch": 3458} {"train_loss": -6.8181047439575195, "global_step": 145242, "epoch": 3458} {"train_loss": -6.74207067489624, "global_step": 145243, "epoch": 3458} {"train_loss": -6.87946891784668, "global_step": 145244, "epoch": 3458} {"train_loss": -6.863587379455566, "global_step": 145245, "epoch": 3458} {"train_loss": -6.85517692565918, "global_step": 145246, "epoch": 3458} {"train_loss": -6.838960647583008, "global_step": 145247, "epoch": 3458} {"train_loss": -6.804102897644043, "global_step": 145248, "epoch": 3458} {"train_loss": -6.944101333618164, "global_step": 145249, "epoch": 3458} {"train_loss": -6.931686878204346, "global_step": 145250, "epoch": 3458} {"train_loss": -6.885247230529785, "global_step": 145251, "epoch": 3458} {"train_loss": -6.92791748046875, "global_step": 145252, "epoch": 3458} {"train_loss": -6.798468589782715, "global_step": 145253, "epoch": 3458} {"train_loss": -6.788832664489746, "global_step": 145254, "epoch": 3458} {"train_loss": -6.838591575622559, "global_step": 145255, "epoch": 3458} {"train_loss": -6.840864181518555, "global_step": 145256, "epoch": 3458} {"train_loss": -6.981433868408203, "global_step": 145257, "epoch": 3458} {"train_loss": -6.861886024475098, "global_step": 145258, "epoch": 3458} {"train_loss": -6.755691051483154, "global_step": 145259, "epoch": 3458} {"train_loss": -6.901334762573242, "global_step": 145260, "epoch": 3458} {"train_loss": -6.9695210456848145, "global_step": 145261, "epoch": 3458} {"train_loss": -6.877956390380859, "global_step": 145262, "epoch": 3458} {"train_loss": -6.866128921508789, "global_step": 145263, "epoch": 3458} {"train_loss": -6.818114280700684, "global_step": 145264, "epoch": 3458} {"train_loss": -6.891350746154785, "global_step": 145265, "epoch": 3458} {"train_loss": -6.866186141967773, "global_step": 145266, "epoch": 3458} {"train_loss": -6.782900333404541, "global_step": 145267, "epoch": 3458} {"train_loss": -6.877590656280518, "global_step": 145268, "epoch": 3458} {"train_loss": -6.827919960021973, "global_step": 145269, "epoch": 3458} {"train_loss": -6.876971244812012, "global_step": 145270, "epoch": 3458} {"train_loss": -6.788234710693359, "global_step": 145271, "epoch": 3458} {"train_loss": -6.743196487426758, "global_step": 145272, "epoch": 3458} {"train_loss": -6.874118804931641, "global_step": 145273, "epoch": 3458} {"train_loss": -6.723886489868164, "global_step": 145274, "epoch": 3458} {"train_loss": -6.667059421539307, "global_step": 145275, "epoch": 3458} {"train_loss": -6.788801193237305, "global_step": 145276, "epoch": 3458} {"train_loss": -6.847143093744914, "global_step": 145277, "epoch": 3458, "val_loss": 78148.1796875} {"train_loss": -6.709227561950684, "global_step": 145278, "epoch": 3459} {"train_loss": -6.846982955932617, "global_step": 145279, "epoch": 3459} {"train_loss": -6.879371643066406, "global_step": 145280, "epoch": 3459} {"train_loss": -6.6981916427612305, "global_step": 145281, "epoch": 3459} {"train_loss": -6.734275817871094, "global_step": 145282, "epoch": 3459} {"train_loss": -6.866781711578369, "global_step": 145283, "epoch": 3459} {"train_loss": -6.897539138793945, "global_step": 145284, "epoch": 3459} {"train_loss": -6.665867805480957, "global_step": 145285, "epoch": 3459} {"train_loss": -6.7791428565979, "global_step": 145286, "epoch": 3459} {"train_loss": -6.679664611816406, "global_step": 145287, "epoch": 3459} {"train_loss": -6.886080265045166, "global_step": 145288, "epoch": 3459} {"train_loss": -6.766054153442383, "global_step": 145289, "epoch": 3459} {"train_loss": -6.860358238220215, "global_step": 145290, "epoch": 3459} {"train_loss": -6.781915664672852, "global_step": 145291, "epoch": 3459} {"train_loss": -6.795882701873779, "global_step": 145292, "epoch": 3459} {"train_loss": -6.728694915771484, "global_step": 145293, "epoch": 3459} {"train_loss": -6.716549873352051, "global_step": 145294, "epoch": 3459} {"train_loss": -6.860651016235352, "global_step": 145295, "epoch": 3459} {"train_loss": -6.720972061157227, "global_step": 145296, "epoch": 3459} {"train_loss": -6.85427188873291, "global_step": 145297, "epoch": 3459} {"train_loss": -6.702167510986328, "global_step": 145298, "epoch": 3459} {"train_loss": -6.817440986633301, "global_step": 145299, "epoch": 3459} {"train_loss": -6.8140716552734375, "global_step": 145300, "epoch": 3459} {"train_loss": -6.823761463165283, "global_step": 145301, "epoch": 3459} {"train_loss": -6.798060417175293, "global_step": 145302, "epoch": 3459} {"train_loss": -6.842690944671631, "global_step": 145303, "epoch": 3459} {"train_loss": -6.672759532928467, "global_step": 145304, "epoch": 3459} {"train_loss": -6.9044904708862305, "global_step": 145305, "epoch": 3459} {"train_loss": -6.850528717041016, "global_step": 145306, "epoch": 3459} {"train_loss": -6.719826698303223, "global_step": 145307, "epoch": 3459} {"train_loss": -6.899085521697998, "global_step": 145308, "epoch": 3459} {"train_loss": -6.680060863494873, "global_step": 145309, "epoch": 3459} {"train_loss": -6.846653938293457, "global_step": 145310, "epoch": 3459} {"train_loss": -6.835903644561768, "global_step": 145311, "epoch": 3459} {"train_loss": -6.856391906738281, "global_step": 145312, "epoch": 3459} {"train_loss": -6.819141864776611, "global_step": 145313, "epoch": 3459} {"train_loss": -6.8347578048706055, "global_step": 145314, "epoch": 3459} {"train_loss": -6.814388275146484, "global_step": 145315, "epoch": 3459} {"train_loss": -6.650857925415039, "global_step": 145316, "epoch": 3459} {"train_loss": -6.791404724121094, "global_step": 145317, "epoch": 3459} {"train_loss": -6.858342170715332, "global_step": 145318, "epoch": 3459} {"train_loss": -6.79546806925819, "global_step": 145319, "epoch": 3459, "val_loss": 78376.765625} {"train_loss": -6.75501823425293, "global_step": 145320, "epoch": 3460} {"train_loss": -6.833817481994629, "global_step": 145321, "epoch": 3460} {"train_loss": -6.582697868347168, "global_step": 145322, "epoch": 3460} {"train_loss": -6.928886413574219, "global_step": 145323, "epoch": 3460} {"train_loss": -6.771273612976074, "global_step": 145324, "epoch": 3460} {"train_loss": -6.782947063446045, "global_step": 145325, "epoch": 3460} {"train_loss": -6.834351539611816, "global_step": 145326, "epoch": 3460} {"train_loss": -6.792180061340332, "global_step": 145327, "epoch": 3460} {"train_loss": -6.916689872741699, "global_step": 145328, "epoch": 3460} {"train_loss": -6.874107360839844, "global_step": 145329, "epoch": 3460} {"train_loss": -6.708558082580566, "global_step": 145330, "epoch": 3460} {"train_loss": -6.882369041442871, "global_step": 145331, "epoch": 3460} {"train_loss": -6.878066062927246, "global_step": 145332, "epoch": 3460} {"train_loss": -6.754500865936279, "global_step": 145333, "epoch": 3460} {"train_loss": -6.910723686218262, "global_step": 145334, "epoch": 3460} {"train_loss": -6.834070682525635, "global_step": 145335, "epoch": 3460} {"train_loss": -6.692272663116455, "global_step": 145336, "epoch": 3460} {"train_loss": -6.663355827331543, "global_step": 145337, "epoch": 3460} {"train_loss": -6.85702657699585, "global_step": 145338, "epoch": 3460} {"train_loss": -6.638431072235107, "global_step": 145339, "epoch": 3460} {"train_loss": -6.662814140319824, "global_step": 145340, "epoch": 3460} {"train_loss": -6.847784042358398, "global_step": 145341, "epoch": 3460} {"train_loss": -6.952889442443848, "global_step": 145342, "epoch": 3460} {"train_loss": -6.703629493713379, "global_step": 145343, "epoch": 3460} {"train_loss": -6.687144756317139, "global_step": 145344, "epoch": 3460} {"train_loss": -6.660969257354736, "global_step": 145345, "epoch": 3460} {"train_loss": -6.8000993728637695, "global_step": 145346, "epoch": 3460} {"train_loss": -6.698486328125, "global_step": 145347, "epoch": 3460} {"train_loss": -6.7138261795043945, "global_step": 145348, "epoch": 3460} {"train_loss": -6.729689598083496, "global_step": 145349, "epoch": 3460} {"train_loss": -6.520601272583008, "global_step": 145350, "epoch": 3460} {"train_loss": -6.728926658630371, "global_step": 145351, "epoch": 3460} {"train_loss": -6.64388370513916, "global_step": 145352, "epoch": 3460} {"train_loss": -6.762418746948242, "global_step": 145353, "epoch": 3460} {"train_loss": -6.654908180236816, "global_step": 145354, "epoch": 3460} {"train_loss": -6.732056617736816, "global_step": 145355, "epoch": 3460} {"train_loss": -6.751565933227539, "global_step": 145356, "epoch": 3460} {"train_loss": -6.6738457679748535, "global_step": 145357, "epoch": 3460} {"train_loss": -6.688590049743652, "global_step": 145358, "epoch": 3460} {"train_loss": -6.720754623413086, "global_step": 145359, "epoch": 3460} {"train_loss": -6.799968719482422, "global_step": 145360, "epoch": 3460} {"train_loss": -6.757583220799764, "global_step": 145361, "epoch": 3460, "val_loss": 78206.0859375} {"train_loss": -6.88458776473999, "global_step": 145362, "epoch": 3461} {"train_loss": -6.839487552642822, "global_step": 145363, "epoch": 3461} {"train_loss": -6.778452396392822, "global_step": 145364, "epoch": 3461} {"train_loss": -6.786848068237305, "global_step": 145365, "epoch": 3461} {"train_loss": -6.795354843139648, "global_step": 145366, "epoch": 3461} {"train_loss": -6.831607818603516, "global_step": 145367, "epoch": 3461} {"train_loss": -6.794195652008057, "global_step": 145368, "epoch": 3461} {"train_loss": -6.861576557159424, "global_step": 145369, "epoch": 3461} {"train_loss": -6.7970428466796875, "global_step": 145370, "epoch": 3461} {"train_loss": -6.934331893920898, "global_step": 145371, "epoch": 3461} {"train_loss": -6.772509574890137, "global_step": 145372, "epoch": 3461} {"train_loss": -6.864840030670166, "global_step": 145373, "epoch": 3461} {"train_loss": -6.6016387939453125, "global_step": 145374, "epoch": 3461} {"train_loss": -6.675662994384766, "global_step": 145375, "epoch": 3461} {"train_loss": -6.726062774658203, "global_step": 145376, "epoch": 3461} {"train_loss": -6.761636734008789, "global_step": 145377, "epoch": 3461} {"train_loss": -6.587204456329346, "global_step": 145378, "epoch": 3461} {"train_loss": -6.773927688598633, "global_step": 145379, "epoch": 3461} {"train_loss": -6.605236530303955, "global_step": 145380, "epoch": 3461} {"train_loss": -6.836355686187744, "global_step": 145381, "epoch": 3461} {"train_loss": -6.769793510437012, "global_step": 145382, "epoch": 3461} {"train_loss": -6.677431583404541, "global_step": 145383, "epoch": 3461} {"train_loss": -6.834256172180176, "global_step": 145384, "epoch": 3461} {"train_loss": -6.568297863006592, "global_step": 145385, "epoch": 3461} {"train_loss": -6.7663493156433105, "global_step": 145386, "epoch": 3461} {"train_loss": -6.755289554595947, "global_step": 145387, "epoch": 3461} {"train_loss": -6.7021942138671875, "global_step": 145388, "epoch": 3461} {"train_loss": -6.804699897766113, "global_step": 145389, "epoch": 3461} {"train_loss": -6.687021255493164, "global_step": 145390, "epoch": 3461} {"train_loss": -6.781713485717773, "global_step": 145391, "epoch": 3461} {"train_loss": -6.90200662612915, "global_step": 145392, "epoch": 3461} {"train_loss": -6.720194339752197, "global_step": 145393, "epoch": 3461} {"train_loss": -6.729395866394043, "global_step": 145394, "epoch": 3461} {"train_loss": -6.8941168785095215, "global_step": 145395, "epoch": 3461} {"train_loss": -6.8175764083862305, "global_step": 145396, "epoch": 3461} {"train_loss": -6.787412166595459, "global_step": 145397, "epoch": 3461} {"train_loss": -6.8539228439331055, "global_step": 145398, "epoch": 3461} {"train_loss": -6.872583389282227, "global_step": 145399, "epoch": 3461} {"train_loss": -6.793964385986328, "global_step": 145400, "epoch": 3461} {"train_loss": -6.855398654937744, "global_step": 145401, "epoch": 3461} {"train_loss": -6.815473556518555, "global_step": 145402, "epoch": 3461} {"train_loss": -6.781276271456764, "global_step": 145403, "epoch": 3461, "val_loss": 78300.2578125} {"train_loss": -6.958335876464844, "global_step": 145404, "epoch": 3462} {"train_loss": -6.8634514808654785, "global_step": 145405, "epoch": 3462} {"train_loss": -6.817865371704102, "global_step": 145406, "epoch": 3462} {"train_loss": -6.935576438903809, "global_step": 145407, "epoch": 3462} {"train_loss": -6.890038013458252, "global_step": 145408, "epoch": 3462} {"train_loss": -6.959380149841309, "global_step": 145409, "epoch": 3462} {"train_loss": -6.892549514770508, "global_step": 145410, "epoch": 3462} {"train_loss": -6.956353664398193, "global_step": 145411, "epoch": 3462} {"train_loss": -6.919190406799316, "global_step": 145412, "epoch": 3462} {"train_loss": -6.8154191970825195, "global_step": 145413, "epoch": 3462} {"train_loss": -6.883020401000977, "global_step": 145414, "epoch": 3462} {"train_loss": -6.9025139808654785, "global_step": 145415, "epoch": 3462} {"train_loss": -6.862029075622559, "global_step": 145416, "epoch": 3462} {"train_loss": -6.76691198348999, "global_step": 145417, "epoch": 3462} {"train_loss": -6.904356956481934, "global_step": 145418, "epoch": 3462} {"train_loss": -6.872555255889893, "global_step": 145419, "epoch": 3462} {"train_loss": -6.8936944007873535, "global_step": 145420, "epoch": 3462} {"train_loss": -6.9644975662231445, "global_step": 145421, "epoch": 3462} {"train_loss": -6.818719863891602, "global_step": 145422, "epoch": 3462} {"train_loss": -6.872425079345703, "global_step": 145423, "epoch": 3462} {"train_loss": -6.812627792358398, "global_step": 145424, "epoch": 3462} {"train_loss": -6.879423141479492, "global_step": 145425, "epoch": 3462} {"train_loss": -6.852497100830078, "global_step": 145426, "epoch": 3462} {"train_loss": -6.764217853546143, "global_step": 145427, "epoch": 3462} {"train_loss": -6.88243293762207, "global_step": 145428, "epoch": 3462} {"train_loss": -6.874352931976318, "global_step": 145429, "epoch": 3462} {"train_loss": -6.995645046234131, "global_step": 145430, "epoch": 3462} {"train_loss": -6.829244613647461, "global_step": 145431, "epoch": 3462} {"train_loss": -6.8305864334106445, "global_step": 145432, "epoch": 3462} {"train_loss": -6.881834030151367, "global_step": 145433, "epoch": 3462} {"train_loss": -6.931377410888672, "global_step": 145434, "epoch": 3462} {"train_loss": -6.861464500427246, "global_step": 145435, "epoch": 3462} {"train_loss": -6.788402557373047, "global_step": 145436, "epoch": 3462} {"train_loss": -6.890185356140137, "global_step": 145437, "epoch": 3462} {"train_loss": -6.759029865264893, "global_step": 145438, "epoch": 3462} {"train_loss": -6.906432151794434, "global_step": 145439, "epoch": 3462} {"train_loss": -6.846540451049805, "global_step": 145440, "epoch": 3462} {"train_loss": -6.83245849609375, "global_step": 145441, "epoch": 3462} {"train_loss": -6.880428791046143, "global_step": 145442, "epoch": 3462} {"train_loss": -6.794954299926758, "global_step": 145443, "epoch": 3462} {"train_loss": -6.8914995193481445, "global_step": 145444, "epoch": 3462} {"train_loss": -6.870823371978033, "global_step": 145445, "epoch": 3462, "val_loss": 78463.8515625} {"train_loss": -6.927834510803223, "global_step": 145446, "epoch": 3463} {"train_loss": -6.9349212646484375, "global_step": 145447, "epoch": 3463} {"train_loss": -6.818103790283203, "global_step": 145448, "epoch": 3463} {"train_loss": -6.870634078979492, "global_step": 145449, "epoch": 3463} {"train_loss": -6.882468223571777, "global_step": 145450, "epoch": 3463} {"train_loss": -6.881928443908691, "global_step": 145451, "epoch": 3463} {"train_loss": -6.854789733886719, "global_step": 145452, "epoch": 3463} {"train_loss": -6.866387367248535, "global_step": 145453, "epoch": 3463} {"train_loss": -6.845613479614258, "global_step": 145454, "epoch": 3463} {"train_loss": -6.793544769287109, "global_step": 145455, "epoch": 3463} {"train_loss": -6.936800479888916, "global_step": 145456, "epoch": 3463} {"train_loss": -6.90014123916626, "global_step": 145457, "epoch": 3463} {"train_loss": -6.766326904296875, "global_step": 145458, "epoch": 3463} {"train_loss": -6.817262649536133, "global_step": 145459, "epoch": 3463} {"train_loss": -6.981088638305664, "global_step": 145460, "epoch": 3463} {"train_loss": -6.823850154876709, "global_step": 145461, "epoch": 3463} {"train_loss": -6.666100978851318, "global_step": 145462, "epoch": 3463} {"train_loss": -6.700623989105225, "global_step": 145463, "epoch": 3463} {"train_loss": -6.727682113647461, "global_step": 145464, "epoch": 3463} {"train_loss": -6.692543029785156, "global_step": 145465, "epoch": 3463} {"train_loss": -6.686511039733887, "global_step": 145466, "epoch": 3463} {"train_loss": -6.778364658355713, "global_step": 145467, "epoch": 3463} {"train_loss": -6.749032020568848, "global_step": 145468, "epoch": 3463} {"train_loss": -6.7073822021484375, "global_step": 145469, "epoch": 3463} {"train_loss": -6.803098201751709, "global_step": 145470, "epoch": 3463} {"train_loss": -6.726407051086426, "global_step": 145471, "epoch": 3463} {"train_loss": -6.8086161613464355, "global_step": 145472, "epoch": 3463} {"train_loss": -6.802545547485352, "global_step": 145473, "epoch": 3463} {"train_loss": -6.81761360168457, "global_step": 145474, "epoch": 3463} {"train_loss": -6.810302734375, "global_step": 145475, "epoch": 3463} {"train_loss": -6.836080551147461, "global_step": 145476, "epoch": 3463} {"train_loss": -6.763522148132324, "global_step": 145477, "epoch": 3463} {"train_loss": -6.911596775054932, "global_step": 145478, "epoch": 3463} {"train_loss": -6.716757297515869, "global_step": 145479, "epoch": 3463} {"train_loss": -6.845231056213379, "global_step": 145480, "epoch": 3463} {"train_loss": -6.813905715942383, "global_step": 145481, "epoch": 3463} {"train_loss": -6.780821800231934, "global_step": 145482, "epoch": 3463} {"train_loss": -6.759737491607666, "global_step": 145483, "epoch": 3463} {"train_loss": -6.9213175773620605, "global_step": 145484, "epoch": 3463} {"train_loss": -6.761761665344238, "global_step": 145485, "epoch": 3463} {"train_loss": -6.858485221862793, "global_step": 145486, "epoch": 3463} {"train_loss": -6.812781560988653, "global_step": 145487, "epoch": 3463, "val_loss": 78531.6875} {"train_loss": -6.781848907470703, "global_step": 145488, "epoch": 3464} {"train_loss": -6.877285003662109, "global_step": 145489, "epoch": 3464} {"train_loss": -6.733425617218018, "global_step": 145490, "epoch": 3464} {"train_loss": -6.796054363250732, "global_step": 145491, "epoch": 3464} {"train_loss": -6.863947868347168, "global_step": 145492, "epoch": 3464} {"train_loss": -6.8677873611450195, "global_step": 145493, "epoch": 3464} {"train_loss": -6.797788619995117, "global_step": 145494, "epoch": 3464} {"train_loss": -6.865070343017578, "global_step": 145495, "epoch": 3464} {"train_loss": -6.958895683288574, "global_step": 145496, "epoch": 3464} {"train_loss": -6.907968521118164, "global_step": 145497, "epoch": 3464} {"train_loss": -6.857877254486084, "global_step": 145498, "epoch": 3464} {"train_loss": -6.9300103187561035, "global_step": 145499, "epoch": 3464} {"train_loss": -6.878446102142334, "global_step": 145500, "epoch": 3464} {"train_loss": -6.732724189758301, "global_step": 145501, "epoch": 3464} {"train_loss": -6.814030170440674, "global_step": 145502, "epoch": 3464} {"train_loss": -6.877032279968262, "global_step": 145503, "epoch": 3464} {"train_loss": -6.871796607971191, "global_step": 145504, "epoch": 3464} {"train_loss": -6.815273761749268, "global_step": 145505, "epoch": 3464} {"train_loss": -6.756443977355957, "global_step": 145506, "epoch": 3464} {"train_loss": -6.830646991729736, "global_step": 145507, "epoch": 3464} {"train_loss": -6.771127223968506, "global_step": 145508, "epoch": 3464} {"train_loss": -6.885117530822754, "global_step": 145509, "epoch": 3464} {"train_loss": -6.853763580322266, "global_step": 145510, "epoch": 3464} {"train_loss": -6.787315368652344, "global_step": 145511, "epoch": 3464} {"train_loss": -6.923052787780762, "global_step": 145512, "epoch": 3464} {"train_loss": -6.8364434242248535, "global_step": 145513, "epoch": 3464} {"train_loss": -6.746772766113281, "global_step": 145514, "epoch": 3464} {"train_loss": -6.837615966796875, "global_step": 145515, "epoch": 3464} {"train_loss": -6.776028156280518, "global_step": 145516, "epoch": 3464} {"train_loss": -6.760559558868408, "global_step": 145517, "epoch": 3464} {"train_loss": -6.830873489379883, "global_step": 145518, "epoch": 3464} {"train_loss": -6.805850028991699, "global_step": 145519, "epoch": 3464} {"train_loss": -6.633388042449951, "global_step": 145520, "epoch": 3464} {"train_loss": -6.741572380065918, "global_step": 145521, "epoch": 3464} {"train_loss": -6.817832946777344, "global_step": 145522, "epoch": 3464} {"train_loss": -6.809817790985107, "global_step": 145523, "epoch": 3464} {"train_loss": -6.666342735290527, "global_step": 145524, "epoch": 3464} {"train_loss": -6.806384563446045, "global_step": 145525, "epoch": 3464} {"train_loss": -6.769968509674072, "global_step": 145526, "epoch": 3464} {"train_loss": -6.759966850280762, "global_step": 145527, "epoch": 3464} {"train_loss": -6.801567077636719, "global_step": 145528, "epoch": 3464} {"train_loss": -6.81663627851577, "global_step": 145529, "epoch": 3464, "val_loss": 78355.921875} {"train_loss": -6.893565654754639, "global_step": 145530, "epoch": 3465} {"train_loss": -6.691427230834961, "global_step": 145531, "epoch": 3465} {"train_loss": -6.727569580078125, "global_step": 145532, "epoch": 3465} {"train_loss": -6.859287261962891, "global_step": 145533, "epoch": 3465} {"train_loss": -6.855018615722656, "global_step": 145534, "epoch": 3465} {"train_loss": -6.8817830085754395, "global_step": 145535, "epoch": 3465} {"train_loss": -6.77655553817749, "global_step": 145536, "epoch": 3465} {"train_loss": -6.881168365478516, "global_step": 145537, "epoch": 3465} {"train_loss": -6.8086090087890625, "global_step": 145538, "epoch": 3465} {"train_loss": -6.848893165588379, "global_step": 145539, "epoch": 3465} {"train_loss": -6.824443340301514, "global_step": 145540, "epoch": 3465} {"train_loss": -6.946650505065918, "global_step": 145541, "epoch": 3465} {"train_loss": -6.807446479797363, "global_step": 145542, "epoch": 3465} {"train_loss": -6.710918426513672, "global_step": 145543, "epoch": 3465} {"train_loss": -6.939421653747559, "global_step": 145544, "epoch": 3465} {"train_loss": -6.764399528503418, "global_step": 145545, "epoch": 3465} {"train_loss": -6.697688102722168, "global_step": 145546, "epoch": 3465} {"train_loss": -6.754055976867676, "global_step": 145547, "epoch": 3465} {"train_loss": -6.69855260848999, "global_step": 145548, "epoch": 3465} {"train_loss": -6.634692192077637, "global_step": 145549, "epoch": 3465} {"train_loss": -6.712116241455078, "global_step": 145550, "epoch": 3465} {"train_loss": -6.73609733581543, "global_step": 145551, "epoch": 3465} {"train_loss": -6.634360313415527, "global_step": 145552, "epoch": 3465} {"train_loss": -6.780755519866943, "global_step": 145553, "epoch": 3465} {"train_loss": -6.681612968444824, "global_step": 145554, "epoch": 3465} {"train_loss": -6.6161394119262695, "global_step": 145555, "epoch": 3465} {"train_loss": -6.618267059326172, "global_step": 145556, "epoch": 3465} {"train_loss": -6.721771240234375, "global_step": 145557, "epoch": 3465} {"train_loss": -6.587128162384033, "global_step": 145558, "epoch": 3465} {"train_loss": -6.837706565856934, "global_step": 145559, "epoch": 3465} {"train_loss": -6.650536060333252, "global_step": 145560, "epoch": 3465} {"train_loss": -6.638676166534424, "global_step": 145561, "epoch": 3465} {"train_loss": -6.657557487487793, "global_step": 145562, "epoch": 3465} {"train_loss": -6.774019241333008, "global_step": 145563, "epoch": 3465} {"train_loss": -6.728794097900391, "global_step": 145564, "epoch": 3465} {"train_loss": -6.758130073547363, "global_step": 145565, "epoch": 3465} {"train_loss": -6.691512107849121, "global_step": 145566, "epoch": 3465} {"train_loss": -6.691198825836182, "global_step": 145567, "epoch": 3465} {"train_loss": -6.732708930969238, "global_step": 145568, "epoch": 3465} {"train_loss": -6.784843444824219, "global_step": 145569, "epoch": 3465} {"train_loss": -6.714969158172607, "global_step": 145570, "epoch": 3465} {"train_loss": -6.753838357471285, "global_step": 145571, "epoch": 3465, "val_loss": 78729.3125} {"train_loss": -6.718423366546631, "global_step": 145572, "epoch": 3466} {"train_loss": -6.753776550292969, "global_step": 145573, "epoch": 3466} {"train_loss": -6.85047721862793, "global_step": 145574, "epoch": 3466} {"train_loss": -6.741024971008301, "global_step": 145575, "epoch": 3466} {"train_loss": -6.799830913543701, "global_step": 145576, "epoch": 3466} {"train_loss": -6.77104377746582, "global_step": 145577, "epoch": 3466} {"train_loss": -6.835972785949707, "global_step": 145578, "epoch": 3466} {"train_loss": -6.8103508949279785, "global_step": 145579, "epoch": 3466} {"train_loss": -6.792403221130371, "global_step": 145580, "epoch": 3466} {"train_loss": -6.797706604003906, "global_step": 145581, "epoch": 3466} {"train_loss": -6.864078521728516, "global_step": 145582, "epoch": 3466} {"train_loss": -6.924491882324219, "global_step": 145583, "epoch": 3466} {"train_loss": -6.817986488342285, "global_step": 145584, "epoch": 3466} {"train_loss": -6.886204242706299, "global_step": 145585, "epoch": 3466} {"train_loss": -6.784363746643066, "global_step": 145586, "epoch": 3466} {"train_loss": -6.844061851501465, "global_step": 145587, "epoch": 3466} {"train_loss": -6.959595680236816, "global_step": 145588, "epoch": 3466} {"train_loss": -6.8916473388671875, "global_step": 145589, "epoch": 3466} {"train_loss": -6.792088508605957, "global_step": 145590, "epoch": 3466} {"train_loss": -6.832796096801758, "global_step": 145591, "epoch": 3466} {"train_loss": -6.869073867797852, "global_step": 145592, "epoch": 3466} {"train_loss": -6.8784589767456055, "global_step": 145593, "epoch": 3466} {"train_loss": -6.832831382751465, "global_step": 145594, "epoch": 3466} {"train_loss": -6.9049906730651855, "global_step": 145595, "epoch": 3466} {"train_loss": -6.78574800491333, "global_step": 145596, "epoch": 3466} {"train_loss": -6.72373104095459, "global_step": 145597, "epoch": 3466} {"train_loss": -6.889114856719971, "global_step": 145598, "epoch": 3466} {"train_loss": -6.878713607788086, "global_step": 145599, "epoch": 3466} {"train_loss": -6.850484371185303, "global_step": 145600, "epoch": 3466} {"train_loss": -6.975407600402832, "global_step": 145601, "epoch": 3466} {"train_loss": -6.877683162689209, "global_step": 145602, "epoch": 3466} {"train_loss": -6.855380058288574, "global_step": 145603, "epoch": 3466} {"train_loss": -6.822099685668945, "global_step": 145604, "epoch": 3466} {"train_loss": -6.963572978973389, "global_step": 145605, "epoch": 3466} {"train_loss": -6.919849395751953, "global_step": 145606, "epoch": 3466} {"train_loss": -6.859374523162842, "global_step": 145607, "epoch": 3466} {"train_loss": -6.834292411804199, "global_step": 145608, "epoch": 3466} {"train_loss": -6.942104339599609, "global_step": 145609, "epoch": 3466} {"train_loss": -6.778563022613525, "global_step": 145610, "epoch": 3466} {"train_loss": -6.807309627532959, "global_step": 145611, "epoch": 3466} {"train_loss": -6.858376502990723, "global_step": 145612, "epoch": 3466} {"train_loss": -6.845205681664603, "global_step": 145613, "epoch": 3466, "val_loss": 78334.03125} {"train_loss": -6.895691394805908, "global_step": 145614, "epoch": 3467} {"train_loss": -6.820739269256592, "global_step": 145615, "epoch": 3467} {"train_loss": -6.779526710510254, "global_step": 145616, "epoch": 3467} {"train_loss": -6.916547775268555, "global_step": 145617, "epoch": 3467} {"train_loss": -6.898059844970703, "global_step": 145618, "epoch": 3467} {"train_loss": -6.831233024597168, "global_step": 145619, "epoch": 3467} {"train_loss": -6.882661819458008, "global_step": 145620, "epoch": 3467} {"train_loss": -6.705750942230225, "global_step": 145621, "epoch": 3467} {"train_loss": -6.752040863037109, "global_step": 145622, "epoch": 3467} {"train_loss": -6.949052810668945, "global_step": 145623, "epoch": 3467} {"train_loss": -6.786468982696533, "global_step": 145624, "epoch": 3467} {"train_loss": -6.8114776611328125, "global_step": 145625, "epoch": 3467} {"train_loss": -6.877767562866211, "global_step": 145626, "epoch": 3467} {"train_loss": -6.852334499359131, "global_step": 145627, "epoch": 3467} {"train_loss": -6.8555145263671875, "global_step": 145628, "epoch": 3467} {"train_loss": -6.814603805541992, "global_step": 145629, "epoch": 3467} {"train_loss": -6.911553382873535, "global_step": 145630, "epoch": 3467} {"train_loss": -6.925728797912598, "global_step": 145631, "epoch": 3467} {"train_loss": -6.788590908050537, "global_step": 145632, "epoch": 3467} {"train_loss": -6.800065517425537, "global_step": 145633, "epoch": 3467} {"train_loss": -6.804747581481934, "global_step": 145634, "epoch": 3467} {"train_loss": -6.983531951904297, "global_step": 145635, "epoch": 3467} {"train_loss": -6.826317310333252, "global_step": 145636, "epoch": 3467} {"train_loss": -6.883443832397461, "global_step": 145637, "epoch": 3467} {"train_loss": -6.90513801574707, "global_step": 145638, "epoch": 3467} {"train_loss": -6.868349075317383, "global_step": 145639, "epoch": 3467} {"train_loss": -6.783874034881592, "global_step": 145640, "epoch": 3467} {"train_loss": -6.802567958831787, "global_step": 145641, "epoch": 3467} {"train_loss": -6.932450294494629, "global_step": 145642, "epoch": 3467} {"train_loss": -6.992188453674316, "global_step": 145643, "epoch": 3467} {"train_loss": -6.8623809814453125, "global_step": 145644, "epoch": 3467} {"train_loss": -6.830148696899414, "global_step": 145645, "epoch": 3467} {"train_loss": -6.988173007965088, "global_step": 145646, "epoch": 3467} {"train_loss": -6.8212175369262695, "global_step": 145647, "epoch": 3467} {"train_loss": -6.7771525382995605, "global_step": 145648, "epoch": 3467} {"train_loss": -6.908429145812988, "global_step": 145649, "epoch": 3467} {"train_loss": -6.853087425231934, "global_step": 145650, "epoch": 3467} {"train_loss": -6.867547988891602, "global_step": 145651, "epoch": 3467} {"train_loss": -6.689701557159424, "global_step": 145652, "epoch": 3467} {"train_loss": -6.827157974243164, "global_step": 145653, "epoch": 3467} {"train_loss": -6.907664775848389, "global_step": 145654, "epoch": 3467} {"train_loss": -6.851916483470371, "global_step": 145655, "epoch": 3467, "val_loss": 78319.9609375} {"train_loss": -6.805077075958252, "global_step": 145656, "epoch": 3468} {"train_loss": -6.899176597595215, "global_step": 145657, "epoch": 3468} {"train_loss": -6.844725131988525, "global_step": 145658, "epoch": 3468} {"train_loss": -6.821465969085693, "global_step": 145659, "epoch": 3468} {"train_loss": -6.878291130065918, "global_step": 145660, "epoch": 3468} {"train_loss": -6.771817207336426, "global_step": 145661, "epoch": 3468} {"train_loss": -6.814846515655518, "global_step": 145662, "epoch": 3468} {"train_loss": -6.805196762084961, "global_step": 145663, "epoch": 3468} {"train_loss": -6.867659568786621, "global_step": 145664, "epoch": 3468} {"train_loss": -6.97407341003418, "global_step": 145665, "epoch": 3468} {"train_loss": -6.884119987487793, "global_step": 145666, "epoch": 3468} {"train_loss": -6.905455589294434, "global_step": 145667, "epoch": 3468} {"train_loss": -6.94162654876709, "global_step": 145668, "epoch": 3468} {"train_loss": -6.865084648132324, "global_step": 145669, "epoch": 3468} {"train_loss": -6.845357894897461, "global_step": 145670, "epoch": 3468} {"train_loss": -6.901480197906494, "global_step": 145671, "epoch": 3468} {"train_loss": -6.929285049438477, "global_step": 145672, "epoch": 3468} {"train_loss": -6.803849220275879, "global_step": 145673, "epoch": 3468} {"train_loss": -6.8651018142700195, "global_step": 145674, "epoch": 3468} {"train_loss": -6.967571258544922, "global_step": 145675, "epoch": 3468} {"train_loss": -6.870169639587402, "global_step": 145676, "epoch": 3468} {"train_loss": -6.893116474151611, "global_step": 145677, "epoch": 3468} {"train_loss": -6.922079086303711, "global_step": 145678, "epoch": 3468} {"train_loss": -6.810625076293945, "global_step": 145679, "epoch": 3468} {"train_loss": -6.972110271453857, "global_step": 145680, "epoch": 3468} {"train_loss": -6.9016828536987305, "global_step": 145681, "epoch": 3468} {"train_loss": -6.777201175689697, "global_step": 145682, "epoch": 3468} {"train_loss": -6.732643127441406, "global_step": 145683, "epoch": 3468} {"train_loss": -6.85125732421875, "global_step": 145684, "epoch": 3468} {"train_loss": -6.859356880187988, "global_step": 145685, "epoch": 3468} {"train_loss": -6.862067222595215, "global_step": 145686, "epoch": 3468} {"train_loss": -6.91909122467041, "global_step": 145687, "epoch": 3468} {"train_loss": -6.854188919067383, "global_step": 145688, "epoch": 3468} {"train_loss": -6.994756698608398, "global_step": 145689, "epoch": 3468} {"train_loss": -6.867465972900391, "global_step": 145690, "epoch": 3468} {"train_loss": -6.869319915771484, "global_step": 145691, "epoch": 3468} {"train_loss": -6.845367431640625, "global_step": 145692, "epoch": 3468} {"train_loss": -6.9093780517578125, "global_step": 145693, "epoch": 3468} {"train_loss": -6.953244686126709, "global_step": 145694, "epoch": 3468} {"train_loss": -6.873407363891602, "global_step": 145695, "epoch": 3468} {"train_loss": -6.911583423614502, "global_step": 145696, "epoch": 3468} {"train_loss": -6.876465513592675, "global_step": 145697, "epoch": 3468, "val_loss": 78368.7734375} {"train_loss": -6.862396240234375, "global_step": 145698, "epoch": 3469} {"train_loss": -6.832401752471924, "global_step": 145699, "epoch": 3469} {"train_loss": -6.846344947814941, "global_step": 145700, "epoch": 3469} {"train_loss": -6.76400899887085, "global_step": 145701, "epoch": 3469} {"train_loss": -6.941923141479492, "global_step": 145702, "epoch": 3469} {"train_loss": -6.880918502807617, "global_step": 145703, "epoch": 3469} {"train_loss": -6.7639055252075195, "global_step": 145704, "epoch": 3469} {"train_loss": -6.758840560913086, "global_step": 145705, "epoch": 3469} {"train_loss": -6.882453918457031, "global_step": 145706, "epoch": 3469} {"train_loss": -6.879958629608154, "global_step": 145707, "epoch": 3469} {"train_loss": -6.713503837585449, "global_step": 145708, "epoch": 3469} {"train_loss": -6.676064491271973, "global_step": 145709, "epoch": 3469} {"train_loss": -6.880515098571777, "global_step": 145710, "epoch": 3469} {"train_loss": -6.828691482543945, "global_step": 145711, "epoch": 3469} {"train_loss": -6.708951950073242, "global_step": 145712, "epoch": 3469} {"train_loss": -6.835941314697266, "global_step": 145713, "epoch": 3469} {"train_loss": -6.798819541931152, "global_step": 145714, "epoch": 3469} {"train_loss": -6.698803901672363, "global_step": 145715, "epoch": 3469} {"train_loss": -6.829176902770996, "global_step": 145716, "epoch": 3469} {"train_loss": -6.671467304229736, "global_step": 145717, "epoch": 3469} {"train_loss": -6.785146713256836, "global_step": 145718, "epoch": 3469} {"train_loss": -6.61137580871582, "global_step": 145719, "epoch": 3469} {"train_loss": -6.837757110595703, "global_step": 145720, "epoch": 3469} {"train_loss": -6.761358261108398, "global_step": 145721, "epoch": 3469} {"train_loss": -6.747148513793945, "global_step": 145722, "epoch": 3469} {"train_loss": -6.841840744018555, "global_step": 145723, "epoch": 3469} {"train_loss": -6.689581871032715, "global_step": 145724, "epoch": 3469} {"train_loss": -6.764982223510742, "global_step": 145725, "epoch": 3469} {"train_loss": -6.829379081726074, "global_step": 145726, "epoch": 3469} {"train_loss": -6.738637924194336, "global_step": 145727, "epoch": 3469} {"train_loss": -6.788620948791504, "global_step": 145728, "epoch": 3469} {"train_loss": -6.8098297119140625, "global_step": 145729, "epoch": 3469} {"train_loss": -6.724932670593262, "global_step": 145730, "epoch": 3469} {"train_loss": -6.776766300201416, "global_step": 145731, "epoch": 3469} {"train_loss": -6.815017223358154, "global_step": 145732, "epoch": 3469} {"train_loss": -6.7888712882995605, "global_step": 145733, "epoch": 3469} {"train_loss": -6.814604759216309, "global_step": 145734, "epoch": 3469} {"train_loss": -6.890603542327881, "global_step": 145735, "epoch": 3469} {"train_loss": -6.919111251831055, "global_step": 145736, "epoch": 3469} {"train_loss": -6.87141752243042, "global_step": 145737, "epoch": 3469} {"train_loss": -6.920975208282471, "global_step": 145738, "epoch": 3469} {"train_loss": -6.799527531578427, "global_step": 145739, "epoch": 3469, "val_loss": 78244.609375} {"train_loss": -6.74210262298584, "global_step": 145740, "epoch": 3470} {"train_loss": -6.920346260070801, "global_step": 145741, "epoch": 3470} {"train_loss": -6.76234245300293, "global_step": 145742, "epoch": 3470} {"train_loss": -6.7795586585998535, "global_step": 145743, "epoch": 3470} {"train_loss": -6.886440277099609, "global_step": 145744, "epoch": 3470} {"train_loss": -6.6993303298950195, "global_step": 145745, "epoch": 3470} {"train_loss": -6.866243362426758, "global_step": 145746, "epoch": 3470} {"train_loss": -6.764034271240234, "global_step": 145747, "epoch": 3470} {"train_loss": -6.693054676055908, "global_step": 145748, "epoch": 3470} {"train_loss": -6.911434173583984, "global_step": 145749, "epoch": 3470} {"train_loss": -6.821147918701172, "global_step": 145750, "epoch": 3470} {"train_loss": -6.696564674377441, "global_step": 145751, "epoch": 3470} {"train_loss": -6.899878025054932, "global_step": 145752, "epoch": 3470} {"train_loss": -6.8149094581604, "global_step": 145753, "epoch": 3470} {"train_loss": -6.685972213745117, "global_step": 145754, "epoch": 3470} {"train_loss": -6.9381866455078125, "global_step": 145755, "epoch": 3470} {"train_loss": -6.763630390167236, "global_step": 145756, "epoch": 3470} {"train_loss": -6.817330360412598, "global_step": 145757, "epoch": 3470} {"train_loss": -6.837523937225342, "global_step": 145758, "epoch": 3470} {"train_loss": -6.708606719970703, "global_step": 145759, "epoch": 3470} {"train_loss": -6.835634708404541, "global_step": 145760, "epoch": 3470} {"train_loss": -6.65058708190918, "global_step": 145761, "epoch": 3470} {"train_loss": -6.819931983947754, "global_step": 145762, "epoch": 3470} {"train_loss": -6.687229156494141, "global_step": 145763, "epoch": 3470} {"train_loss": -6.704005241394043, "global_step": 145764, "epoch": 3470} {"train_loss": -6.838399410247803, "global_step": 145765, "epoch": 3470} {"train_loss": -6.69660758972168, "global_step": 145766, "epoch": 3470} {"train_loss": -6.7081780433654785, "global_step": 145767, "epoch": 3470} {"train_loss": -6.575565814971924, "global_step": 145768, "epoch": 3470} {"train_loss": -6.809496879577637, "global_step": 145769, "epoch": 3470} {"train_loss": -6.643679618835449, "global_step": 145770, "epoch": 3470} {"train_loss": -6.751652717590332, "global_step": 145771, "epoch": 3470} {"train_loss": -6.80321741104126, "global_step": 145772, "epoch": 3470} {"train_loss": -6.845234394073486, "global_step": 145773, "epoch": 3470} {"train_loss": -6.716000080108643, "global_step": 145774, "epoch": 3470} {"train_loss": -6.6654205322265625, "global_step": 145775, "epoch": 3470} {"train_loss": -6.75996732711792, "global_step": 145776, "epoch": 3470} {"train_loss": -6.694351673126221, "global_step": 145777, "epoch": 3470} {"train_loss": -6.663163185119629, "global_step": 145778, "epoch": 3470} {"train_loss": -6.643448352813721, "global_step": 145779, "epoch": 3470} {"train_loss": -6.760894775390625, "global_step": 145780, "epoch": 3470} {"train_loss": -6.765427646182832, "global_step": 145781, "epoch": 3470, "val_loss": 78499.828125} {"train_loss": -6.7558088302612305, "global_step": 145782, "epoch": 3471} {"train_loss": -6.834208965301514, "global_step": 145783, "epoch": 3471} {"train_loss": -6.77783727645874, "global_step": 145784, "epoch": 3471} {"train_loss": -6.736238956451416, "global_step": 145785, "epoch": 3471} {"train_loss": -6.824819564819336, "global_step": 145786, "epoch": 3471} {"train_loss": -6.808135032653809, "global_step": 145787, "epoch": 3471} {"train_loss": -6.80025577545166, "global_step": 145788, "epoch": 3471} {"train_loss": -6.726099014282227, "global_step": 145789, "epoch": 3471} {"train_loss": -6.74953556060791, "global_step": 145790, "epoch": 3471} {"train_loss": -6.745987415313721, "global_step": 145791, "epoch": 3471} {"train_loss": -6.886236190795898, "global_step": 145792, "epoch": 3471} {"train_loss": -6.816595077514648, "global_step": 145793, "epoch": 3471} {"train_loss": -6.804346084594727, "global_step": 145794, "epoch": 3471} {"train_loss": -6.781792640686035, "global_step": 145795, "epoch": 3471} {"train_loss": -6.826511383056641, "global_step": 145796, "epoch": 3471} {"train_loss": -6.886629104614258, "global_step": 145797, "epoch": 3471} {"train_loss": -6.833723068237305, "global_step": 145798, "epoch": 3471} {"train_loss": -6.803048610687256, "global_step": 145799, "epoch": 3471} {"train_loss": -6.947323799133301, "global_step": 145800, "epoch": 3471} {"train_loss": -6.832919597625732, "global_step": 145801, "epoch": 3471} {"train_loss": -6.841213703155518, "global_step": 145802, "epoch": 3471} {"train_loss": -6.876922130584717, "global_step": 145803, "epoch": 3471} {"train_loss": -6.84805154800415, "global_step": 145804, "epoch": 3471} {"train_loss": -6.792795658111572, "global_step": 145805, "epoch": 3471} {"train_loss": -6.9862823486328125, "global_step": 145806, "epoch": 3471} {"train_loss": -6.922915458679199, "global_step": 145807, "epoch": 3471} {"train_loss": -6.813033103942871, "global_step": 145808, "epoch": 3471} {"train_loss": -6.849867343902588, "global_step": 145809, "epoch": 3471} {"train_loss": -6.9304375648498535, "global_step": 145810, "epoch": 3471} {"train_loss": -6.871580600738525, "global_step": 145811, "epoch": 3471} {"train_loss": -6.841569900512695, "global_step": 145812, "epoch": 3471} {"train_loss": -6.89363956451416, "global_step": 145813, "epoch": 3471} {"train_loss": -6.754080772399902, "global_step": 145814, "epoch": 3471} {"train_loss": -6.801617622375488, "global_step": 145815, "epoch": 3471} {"train_loss": -6.836386680603027, "global_step": 145816, "epoch": 3471} {"train_loss": -6.718054294586182, "global_step": 145817, "epoch": 3471} {"train_loss": -6.801097869873047, "global_step": 145818, "epoch": 3471} {"train_loss": -6.628614902496338, "global_step": 145819, "epoch": 3471} {"train_loss": -6.823265552520752, "global_step": 145820, "epoch": 3471} {"train_loss": -6.864527702331543, "global_step": 145821, "epoch": 3471} {"train_loss": -6.792413711547852, "global_step": 145822, "epoch": 3471} {"train_loss": -6.822318849109468, "global_step": 145823, "epoch": 3471, "val_loss": 78549.5390625} {"train_loss": -6.742982864379883, "global_step": 145824, "epoch": 3472} {"train_loss": -6.8900041580200195, "global_step": 145825, "epoch": 3472} {"train_loss": -6.603670597076416, "global_step": 145826, "epoch": 3472} {"train_loss": -6.772615432739258, "global_step": 145827, "epoch": 3472} {"train_loss": -6.64738655090332, "global_step": 145828, "epoch": 3472} {"train_loss": -6.7648234367370605, "global_step": 145829, "epoch": 3472} {"train_loss": -6.728559494018555, "global_step": 145830, "epoch": 3472} {"train_loss": -6.783890724182129, "global_step": 145831, "epoch": 3472} {"train_loss": -6.849742889404297, "global_step": 145832, "epoch": 3472} {"train_loss": -6.721366882324219, "global_step": 145833, "epoch": 3472} {"train_loss": -6.722434043884277, "global_step": 145834, "epoch": 3472} {"train_loss": -6.850006103515625, "global_step": 145835, "epoch": 3472} {"train_loss": -6.7378129959106445, "global_step": 145836, "epoch": 3472} {"train_loss": -6.805473804473877, "global_step": 145837, "epoch": 3472} {"train_loss": -6.855839252471924, "global_step": 145838, "epoch": 3472} {"train_loss": -6.893130302429199, "global_step": 145839, "epoch": 3472} {"train_loss": -6.849398612976074, "global_step": 145840, "epoch": 3472} {"train_loss": -6.850714683532715, "global_step": 145841, "epoch": 3472} {"train_loss": -6.819998741149902, "global_step": 145842, "epoch": 3472} {"train_loss": -6.8995184898376465, "global_step": 145843, "epoch": 3472} {"train_loss": -6.883450508117676, "global_step": 145844, "epoch": 3472} {"train_loss": -6.9060564041137695, "global_step": 145845, "epoch": 3472} {"train_loss": -6.896060466766357, "global_step": 145846, "epoch": 3472} {"train_loss": -6.825276851654053, "global_step": 145847, "epoch": 3472} {"train_loss": -6.889824867248535, "global_step": 145848, "epoch": 3472} {"train_loss": -6.924823760986328, "global_step": 145849, "epoch": 3472} {"train_loss": -6.824534893035889, "global_step": 145850, "epoch": 3472} {"train_loss": -6.869962692260742, "global_step": 145851, "epoch": 3472} {"train_loss": -6.817774772644043, "global_step": 145852, "epoch": 3472} {"train_loss": -6.825240135192871, "global_step": 145853, "epoch": 3472} {"train_loss": -6.679513931274414, "global_step": 145854, "epoch": 3472} {"train_loss": -6.804621696472168, "global_step": 145855, "epoch": 3472} {"train_loss": -6.859889984130859, "global_step": 145856, "epoch": 3472} {"train_loss": -6.73914909362793, "global_step": 145857, "epoch": 3472} {"train_loss": -6.87675666809082, "global_step": 145858, "epoch": 3472} {"train_loss": -6.708736419677734, "global_step": 145859, "epoch": 3472} {"train_loss": -6.813296318054199, "global_step": 145860, "epoch": 3472} {"train_loss": -6.89431095123291, "global_step": 145861, "epoch": 3472} {"train_loss": -6.843303680419922, "global_step": 145862, "epoch": 3472} {"train_loss": -6.82896614074707, "global_step": 145863, "epoch": 3472} {"train_loss": -6.716361999511719, "global_step": 145864, "epoch": 3472} {"train_loss": -6.810163407098679, "global_step": 145865, "epoch": 3472, "val_loss": 78608.6484375} {"train_loss": -6.930773735046387, "global_step": 145866, "epoch": 3473} {"train_loss": -6.751104831695557, "global_step": 145867, "epoch": 3473} {"train_loss": -6.870105743408203, "global_step": 145868, "epoch": 3473} {"train_loss": -6.714987754821777, "global_step": 145869, "epoch": 3473} {"train_loss": -6.913477420806885, "global_step": 145870, "epoch": 3473} {"train_loss": -6.7944817543029785, "global_step": 145871, "epoch": 3473} {"train_loss": -6.800200939178467, "global_step": 145872, "epoch": 3473} {"train_loss": -6.8851213455200195, "global_step": 145873, "epoch": 3473} {"train_loss": -6.769535541534424, "global_step": 145874, "epoch": 3473} {"train_loss": -6.868600368499756, "global_step": 145875, "epoch": 3473} {"train_loss": -6.740461349487305, "global_step": 145876, "epoch": 3473} {"train_loss": -6.714272975921631, "global_step": 145877, "epoch": 3473} {"train_loss": -6.927243232727051, "global_step": 145878, "epoch": 3473} {"train_loss": -6.828864097595215, "global_step": 145879, "epoch": 3473} {"train_loss": -6.821866035461426, "global_step": 145880, "epoch": 3473} {"train_loss": -6.767134666442871, "global_step": 145881, "epoch": 3473} {"train_loss": -6.740408897399902, "global_step": 145882, "epoch": 3473} {"train_loss": -6.917885780334473, "global_step": 145883, "epoch": 3473} {"train_loss": -6.8064985275268555, "global_step": 145884, "epoch": 3473} {"train_loss": -6.8115925788879395, "global_step": 145885, "epoch": 3473} {"train_loss": -6.921570777893066, "global_step": 145886, "epoch": 3473} {"train_loss": -6.8207831382751465, "global_step": 145887, "epoch": 3473} {"train_loss": -6.744559288024902, "global_step": 145888, "epoch": 3473} {"train_loss": -6.946955680847168, "global_step": 145889, "epoch": 3473} {"train_loss": -6.881471633911133, "global_step": 145890, "epoch": 3473} {"train_loss": -6.90659236907959, "global_step": 145891, "epoch": 3473} {"train_loss": -6.815856456756592, "global_step": 145892, "epoch": 3473} {"train_loss": -6.681950569152832, "global_step": 145893, "epoch": 3473} {"train_loss": -6.844938278198242, "global_step": 145894, "epoch": 3473} {"train_loss": -6.7819390296936035, "global_step": 145895, "epoch": 3473} {"train_loss": -6.852540016174316, "global_step": 145896, "epoch": 3473} {"train_loss": -6.926255226135254, "global_step": 145897, "epoch": 3473} {"train_loss": -6.854736328125, "global_step": 145898, "epoch": 3473} {"train_loss": -6.708993434906006, "global_step": 145899, "epoch": 3473} {"train_loss": -6.760836601257324, "global_step": 145900, "epoch": 3473} {"train_loss": -6.663693428039551, "global_step": 145901, "epoch": 3473} {"train_loss": -6.80775260925293, "global_step": 145902, "epoch": 3473} {"train_loss": -6.892039775848389, "global_step": 145903, "epoch": 3473} {"train_loss": -6.664271354675293, "global_step": 145904, "epoch": 3473} {"train_loss": -6.746611595153809, "global_step": 145905, "epoch": 3473} {"train_loss": -6.675615310668945, "global_step": 145906, "epoch": 3473} {"train_loss": -6.808895769573393, "global_step": 145907, "epoch": 3473, "val_loss": 78618.7578125} {"train_loss": -6.826297760009766, "global_step": 145908, "epoch": 3474} {"train_loss": -6.733537673950195, "global_step": 145909, "epoch": 3474} {"train_loss": -6.905236721038818, "global_step": 145910, "epoch": 3474} {"train_loss": -6.706392765045166, "global_step": 145911, "epoch": 3474} {"train_loss": -6.836379528045654, "global_step": 145912, "epoch": 3474} {"train_loss": -6.7270660400390625, "global_step": 145913, "epoch": 3474} {"train_loss": -6.806134223937988, "global_step": 145914, "epoch": 3474} {"train_loss": -6.860678195953369, "global_step": 145915, "epoch": 3474} {"train_loss": -6.898316860198975, "global_step": 145916, "epoch": 3474} {"train_loss": -6.780786991119385, "global_step": 145917, "epoch": 3474} {"train_loss": -6.8683319091796875, "global_step": 145918, "epoch": 3474} {"train_loss": -6.826535701751709, "global_step": 145919, "epoch": 3474} {"train_loss": -6.85398006439209, "global_step": 145920, "epoch": 3474} {"train_loss": -6.8346781730651855, "global_step": 145921, "epoch": 3474} {"train_loss": -6.860544204711914, "global_step": 145922, "epoch": 3474} {"train_loss": -6.818304061889648, "global_step": 145923, "epoch": 3474} {"train_loss": -6.776955604553223, "global_step": 145924, "epoch": 3474} {"train_loss": -6.93165397644043, "global_step": 145925, "epoch": 3474} {"train_loss": -6.952749252319336, "global_step": 145926, "epoch": 3474} {"train_loss": -6.7738847732543945, "global_step": 145927, "epoch": 3474} {"train_loss": -6.880318641662598, "global_step": 145928, "epoch": 3474} {"train_loss": -6.779218673706055, "global_step": 145929, "epoch": 3474} {"train_loss": -6.757657527923584, "global_step": 145930, "epoch": 3474} {"train_loss": -6.859323024749756, "global_step": 145931, "epoch": 3474} {"train_loss": -6.996993064880371, "global_step": 145932, "epoch": 3474} {"train_loss": -6.686166763305664, "global_step": 145933, "epoch": 3474} {"train_loss": -6.7946457862854, "global_step": 145934, "epoch": 3474} {"train_loss": -6.644254684448242, "global_step": 145935, "epoch": 3474} {"train_loss": -6.744088172912598, "global_step": 145936, "epoch": 3474} {"train_loss": -6.941768646240234, "global_step": 145937, "epoch": 3474} {"train_loss": -6.730217933654785, "global_step": 145938, "epoch": 3474} {"train_loss": -6.802858829498291, "global_step": 145939, "epoch": 3474} {"train_loss": -6.846463203430176, "global_step": 145940, "epoch": 3474} {"train_loss": -6.803647994995117, "global_step": 145941, "epoch": 3474} {"train_loss": -6.787315368652344, "global_step": 145942, "epoch": 3474} {"train_loss": -6.832026481628418, "global_step": 145943, "epoch": 3474} {"train_loss": -6.80450439453125, "global_step": 145944, "epoch": 3474} {"train_loss": -6.821880340576172, "global_step": 145945, "epoch": 3474} {"train_loss": -6.780426979064941, "global_step": 145946, "epoch": 3474} {"train_loss": -6.864381790161133, "global_step": 145947, "epoch": 3474} {"train_loss": -6.860776424407959, "global_step": 145948, "epoch": 3474} {"train_loss": -6.821845043273199, "global_step": 145949, "epoch": 3474, "val_loss": 78323.890625} {"train_loss": -6.796651840209961, "global_step": 145950, "epoch": 3475} {"train_loss": -6.856720924377441, "global_step": 145951, "epoch": 3475} {"train_loss": -6.859506607055664, "global_step": 145952, "epoch": 3475} {"train_loss": -6.810013771057129, "global_step": 145953, "epoch": 3475} {"train_loss": -6.841236114501953, "global_step": 145954, "epoch": 3475} {"train_loss": -6.871999740600586, "global_step": 145955, "epoch": 3475} {"train_loss": -6.878283500671387, "global_step": 145956, "epoch": 3475} {"train_loss": -6.856889247894287, "global_step": 145957, "epoch": 3475} {"train_loss": -6.824180603027344, "global_step": 145958, "epoch": 3475} {"train_loss": -6.880227088928223, "global_step": 145959, "epoch": 3475} {"train_loss": -6.638950347900391, "global_step": 145960, "epoch": 3475} {"train_loss": -6.7447099685668945, "global_step": 145961, "epoch": 3475} {"train_loss": -6.815120697021484, "global_step": 145962, "epoch": 3475} {"train_loss": -6.81804084777832, "global_step": 145963, "epoch": 3475} {"train_loss": -6.907946586608887, "global_step": 145964, "epoch": 3475} {"train_loss": -6.804378509521484, "global_step": 145965, "epoch": 3475} {"train_loss": -6.743762969970703, "global_step": 145966, "epoch": 3475} {"train_loss": -6.824261665344238, "global_step": 145967, "epoch": 3475} {"train_loss": -6.800177574157715, "global_step": 145968, "epoch": 3475} {"train_loss": -6.766921043395996, "global_step": 145969, "epoch": 3475} {"train_loss": -6.951282978057861, "global_step": 145970, "epoch": 3475} {"train_loss": -6.854531288146973, "global_step": 145971, "epoch": 3475} {"train_loss": -6.843467712402344, "global_step": 145972, "epoch": 3475} {"train_loss": -6.754097938537598, "global_step": 145973, "epoch": 3475} {"train_loss": -6.950716018676758, "global_step": 145974, "epoch": 3475} {"train_loss": -6.8473005294799805, "global_step": 145975, "epoch": 3475} {"train_loss": -6.7803754806518555, "global_step": 145976, "epoch": 3475} {"train_loss": -6.8389434814453125, "global_step": 145977, "epoch": 3475} {"train_loss": -6.952996253967285, "global_step": 145978, "epoch": 3475} {"train_loss": -6.826579570770264, "global_step": 145979, "epoch": 3475} {"train_loss": -6.845094680786133, "global_step": 145980, "epoch": 3475} {"train_loss": -6.799178123474121, "global_step": 145981, "epoch": 3475} {"train_loss": -6.776352882385254, "global_step": 145982, "epoch": 3475} {"train_loss": -6.921795845031738, "global_step": 145983, "epoch": 3475} {"train_loss": -6.890620708465576, "global_step": 145984, "epoch": 3475} {"train_loss": -6.746230125427246, "global_step": 145985, "epoch": 3475} {"train_loss": -6.736950397491455, "global_step": 145986, "epoch": 3475} {"train_loss": -6.777331352233887, "global_step": 145987, "epoch": 3475} {"train_loss": -6.672318935394287, "global_step": 145988, "epoch": 3475} {"train_loss": -6.641069412231445, "global_step": 145989, "epoch": 3475} {"train_loss": -6.855906009674072, "global_step": 145990, "epoch": 3475} {"train_loss": -6.815815698532831, "global_step": 145991, "epoch": 3475, "val_loss": 78451.0390625} {"train_loss": -6.637200355529785, "global_step": 145992, "epoch": 3476} {"train_loss": -6.787853240966797, "global_step": 145993, "epoch": 3476} {"train_loss": -6.604461669921875, "global_step": 145994, "epoch": 3476} {"train_loss": -6.809438228607178, "global_step": 145995, "epoch": 3476} {"train_loss": -6.6197357177734375, "global_step": 145996, "epoch": 3476} {"train_loss": -6.687740325927734, "global_step": 145997, "epoch": 3476} {"train_loss": -6.733466148376465, "global_step": 145998, "epoch": 3476} {"train_loss": -6.762036323547363, "global_step": 145999, "epoch": 3476} {"train_loss": -6.691188335418701, "global_step": 146000, "epoch": 3476} {"train_loss": -6.655099868774414, "global_step": 146001, "epoch": 3476} {"train_loss": -6.762056350708008, "global_step": 146002, "epoch": 3476} {"train_loss": -6.718459129333496, "global_step": 146003, "epoch": 3476} {"train_loss": -6.894688606262207, "global_step": 146004, "epoch": 3476} {"train_loss": -6.7724609375, "global_step": 146005, "epoch": 3476} {"train_loss": -6.72138786315918, "global_step": 146006, "epoch": 3476} {"train_loss": -6.727458953857422, "global_step": 146007, "epoch": 3476} {"train_loss": -6.869653701782227, "global_step": 146008, "epoch": 3476} {"train_loss": -6.820700645446777, "global_step": 146009, "epoch": 3476} {"train_loss": -6.7139129638671875, "global_step": 146010, "epoch": 3476} {"train_loss": -6.776294708251953, "global_step": 146011, "epoch": 3476} {"train_loss": -6.881067276000977, "global_step": 146012, "epoch": 3476} {"train_loss": -6.8146772384643555, "global_step": 146013, "epoch": 3476} {"train_loss": -6.903749465942383, "global_step": 146014, "epoch": 3476} {"train_loss": -6.846056938171387, "global_step": 146015, "epoch": 3476} {"train_loss": -6.822742938995361, "global_step": 146016, "epoch": 3476} {"train_loss": -6.829132080078125, "global_step": 146017, "epoch": 3476} {"train_loss": -6.873976707458496, "global_step": 146018, "epoch": 3476} {"train_loss": -6.772231101989746, "global_step": 146019, "epoch": 3476} {"train_loss": -6.8564324378967285, "global_step": 146020, "epoch": 3476} {"train_loss": -6.950749397277832, "global_step": 146021, "epoch": 3476} {"train_loss": -6.858668804168701, "global_step": 146022, "epoch": 3476} {"train_loss": -6.843052864074707, "global_step": 146023, "epoch": 3476} {"train_loss": -6.860294342041016, "global_step": 146024, "epoch": 3476} {"train_loss": -6.859574317932129, "global_step": 146025, "epoch": 3476} {"train_loss": -6.850290298461914, "global_step": 146026, "epoch": 3476} {"train_loss": -6.9235687255859375, "global_step": 146027, "epoch": 3476} {"train_loss": -6.874444961547852, "global_step": 146028, "epoch": 3476} {"train_loss": -6.980503082275391, "global_step": 146029, "epoch": 3476} {"train_loss": -6.868392467498779, "global_step": 146030, "epoch": 3476} {"train_loss": -6.789422035217285, "global_step": 146031, "epoch": 3476} {"train_loss": -6.896084308624268, "global_step": 146032, "epoch": 3476} {"train_loss": -6.806803862253825, "global_step": 146033, "epoch": 3476, "val_loss": 78433.2578125} {"train_loss": -6.828401565551758, "global_step": 146034, "epoch": 3477} {"train_loss": -6.884146213531494, "global_step": 146035, "epoch": 3477} {"train_loss": -6.907253265380859, "global_step": 146036, "epoch": 3477} {"train_loss": -6.861845016479492, "global_step": 146037, "epoch": 3477} {"train_loss": -6.770913124084473, "global_step": 146038, "epoch": 3477} {"train_loss": -6.9299774169921875, "global_step": 146039, "epoch": 3477} {"train_loss": -6.86903715133667, "global_step": 146040, "epoch": 3477} {"train_loss": -6.8360595703125, "global_step": 146041, "epoch": 3477} {"train_loss": -6.791153907775879, "global_step": 146042, "epoch": 3477} {"train_loss": -6.90965461730957, "global_step": 146043, "epoch": 3477} {"train_loss": -6.7129058837890625, "global_step": 146044, "epoch": 3477} {"train_loss": -6.801368236541748, "global_step": 146045, "epoch": 3477} {"train_loss": -6.814480781555176, "global_step": 146046, "epoch": 3477} {"train_loss": -6.724826335906982, "global_step": 146047, "epoch": 3477} {"train_loss": -6.680735111236572, "global_step": 146048, "epoch": 3477} {"train_loss": -6.916298866271973, "global_step": 146049, "epoch": 3477} {"train_loss": -6.768954277038574, "global_step": 146050, "epoch": 3477} {"train_loss": -6.744039058685303, "global_step": 146051, "epoch": 3477} {"train_loss": -6.76073694229126, "global_step": 146052, "epoch": 3477} {"train_loss": -6.751093864440918, "global_step": 146053, "epoch": 3477} {"train_loss": -6.743344306945801, "global_step": 146054, "epoch": 3477} {"train_loss": -6.727480888366699, "global_step": 146055, "epoch": 3477} {"train_loss": -6.664848804473877, "global_step": 146056, "epoch": 3477} {"train_loss": -6.895116806030273, "global_step": 146057, "epoch": 3477} {"train_loss": -6.681944370269775, "global_step": 146058, "epoch": 3477} {"train_loss": -6.799707412719727, "global_step": 146059, "epoch": 3477} {"train_loss": -6.833211898803711, "global_step": 146060, "epoch": 3477} {"train_loss": -6.749302864074707, "global_step": 146061, "epoch": 3477} {"train_loss": -6.779623985290527, "global_step": 146062, "epoch": 3477} {"train_loss": -6.856240272521973, "global_step": 146063, "epoch": 3477} {"train_loss": -6.806995868682861, "global_step": 146064, "epoch": 3477} {"train_loss": -6.882541656494141, "global_step": 146065, "epoch": 3477} {"train_loss": -6.870349884033203, "global_step": 146066, "epoch": 3477} {"train_loss": -6.917065620422363, "global_step": 146067, "epoch": 3477} {"train_loss": -6.919013023376465, "global_step": 146068, "epoch": 3477} {"train_loss": -6.7822771072387695, "global_step": 146069, "epoch": 3477} {"train_loss": -6.816938877105713, "global_step": 146070, "epoch": 3477} {"train_loss": -6.83206844329834, "global_step": 146071, "epoch": 3477} {"train_loss": -6.856581687927246, "global_step": 146072, "epoch": 3477} {"train_loss": -6.848109245300293, "global_step": 146073, "epoch": 3477} {"train_loss": -6.7612624168396, "global_step": 146074, "epoch": 3477} {"train_loss": -6.810649860472906, "global_step": 146075, "epoch": 3477, "val_loss": 78496.5078125} {"train_loss": -6.943158149719238, "global_step": 146076, "epoch": 3478} {"train_loss": -6.839815139770508, "global_step": 146077, "epoch": 3478} {"train_loss": -6.823436260223389, "global_step": 146078, "epoch": 3478} {"train_loss": -6.775113105773926, "global_step": 146079, "epoch": 3478} {"train_loss": -6.818785667419434, "global_step": 146080, "epoch": 3478} {"train_loss": -6.821989059448242, "global_step": 146081, "epoch": 3478} {"train_loss": -6.946002960205078, "global_step": 146082, "epoch": 3478} {"train_loss": -6.829206943511963, "global_step": 146083, "epoch": 3478} {"train_loss": -6.837394714355469, "global_step": 146084, "epoch": 3478} {"train_loss": -6.7862548828125, "global_step": 146085, "epoch": 3478} {"train_loss": -6.79217529296875, "global_step": 146086, "epoch": 3478} {"train_loss": -6.756019115447998, "global_step": 146087, "epoch": 3478} {"train_loss": -6.873224258422852, "global_step": 146088, "epoch": 3478} {"train_loss": -6.8190412521362305, "global_step": 146089, "epoch": 3478} {"train_loss": -6.728178024291992, "global_step": 146090, "epoch": 3478} {"train_loss": -6.926758766174316, "global_step": 146091, "epoch": 3478} {"train_loss": -6.747983932495117, "global_step": 146092, "epoch": 3478} {"train_loss": -6.793118953704834, "global_step": 146093, "epoch": 3478} {"train_loss": -6.788082122802734, "global_step": 146094, "epoch": 3478} {"train_loss": -6.792717456817627, "global_step": 146095, "epoch": 3478} {"train_loss": -6.819062232971191, "global_step": 146096, "epoch": 3478} {"train_loss": -6.782961845397949, "global_step": 146097, "epoch": 3478} {"train_loss": -6.7717695236206055, "global_step": 146098, "epoch": 3478} {"train_loss": -6.811101913452148, "global_step": 146099, "epoch": 3478} {"train_loss": -6.854712009429932, "global_step": 146100, "epoch": 3478} {"train_loss": -6.846430778503418, "global_step": 146101, "epoch": 3478} {"train_loss": -6.680214881896973, "global_step": 146102, "epoch": 3478} {"train_loss": -6.84805965423584, "global_step": 146103, "epoch": 3478} {"train_loss": -6.776878356933594, "global_step": 146104, "epoch": 3478} {"train_loss": -6.825497627258301, "global_step": 146105, "epoch": 3478} {"train_loss": -6.7618408203125, "global_step": 146106, "epoch": 3478} {"train_loss": -6.819793224334717, "global_step": 146107, "epoch": 3478} {"train_loss": -6.881645202636719, "global_step": 146108, "epoch": 3478} {"train_loss": -6.785819053649902, "global_step": 146109, "epoch": 3478} {"train_loss": -6.762735366821289, "global_step": 146110, "epoch": 3478} {"train_loss": -6.859636306762695, "global_step": 146111, "epoch": 3478} {"train_loss": -6.810086250305176, "global_step": 146112, "epoch": 3478} {"train_loss": -6.869380474090576, "global_step": 146113, "epoch": 3478} {"train_loss": -6.8472394943237305, "global_step": 146114, "epoch": 3478} {"train_loss": -6.896786689758301, "global_step": 146115, "epoch": 3478} {"train_loss": -6.691094875335693, "global_step": 146116, "epoch": 3478} {"train_loss": -6.816864660808018, "global_step": 146117, "epoch": 3478, "val_loss": 78272.1875} {"train_loss": -6.843608856201172, "global_step": 146118, "epoch": 3479} {"train_loss": -6.765372276306152, "global_step": 146119, "epoch": 3479} {"train_loss": -6.852376937866211, "global_step": 146120, "epoch": 3479} {"train_loss": -6.857166290283203, "global_step": 146121, "epoch": 3479} {"train_loss": -6.808865547180176, "global_step": 146122, "epoch": 3479} {"train_loss": -6.829190731048584, "global_step": 146123, "epoch": 3479} {"train_loss": -6.799257278442383, "global_step": 146124, "epoch": 3479} {"train_loss": -6.96195125579834, "global_step": 146125, "epoch": 3479} {"train_loss": -6.768272399902344, "global_step": 146126, "epoch": 3479} {"train_loss": -6.868993282318115, "global_step": 146127, "epoch": 3479} {"train_loss": -6.883242607116699, "global_step": 146128, "epoch": 3479} {"train_loss": -6.777541637420654, "global_step": 146129, "epoch": 3479} {"train_loss": -6.822232246398926, "global_step": 146130, "epoch": 3479} {"train_loss": -6.687621116638184, "global_step": 146131, "epoch": 3479} {"train_loss": -6.873071670532227, "global_step": 146132, "epoch": 3479} {"train_loss": -6.9162797927856445, "global_step": 146133, "epoch": 3479} {"train_loss": -6.840524196624756, "global_step": 146134, "epoch": 3479} {"train_loss": -6.86686897277832, "global_step": 146135, "epoch": 3479} {"train_loss": -6.754986763000488, "global_step": 146136, "epoch": 3479} {"train_loss": -6.710668087005615, "global_step": 146137, "epoch": 3479} {"train_loss": -6.835087776184082, "global_step": 146138, "epoch": 3479} {"train_loss": -6.776931285858154, "global_step": 146139, "epoch": 3479} {"train_loss": -6.7698774337768555, "global_step": 146140, "epoch": 3479} {"train_loss": -6.781118392944336, "global_step": 146141, "epoch": 3479} {"train_loss": -6.658441066741943, "global_step": 146142, "epoch": 3479} {"train_loss": -6.759638786315918, "global_step": 146143, "epoch": 3479} {"train_loss": -6.8298139572143555, "global_step": 146144, "epoch": 3479} {"train_loss": -6.776984691619873, "global_step": 146145, "epoch": 3479} {"train_loss": -6.703370094299316, "global_step": 146146, "epoch": 3479} {"train_loss": -6.559624671936035, "global_step": 146147, "epoch": 3479} {"train_loss": -6.85575008392334, "global_step": 146148, "epoch": 3479} {"train_loss": -6.651185989379883, "global_step": 146149, "epoch": 3479} {"train_loss": -6.7537760734558105, "global_step": 146150, "epoch": 3479} {"train_loss": -6.706127166748047, "global_step": 146151, "epoch": 3479} {"train_loss": -6.809637069702148, "global_step": 146152, "epoch": 3479} {"train_loss": -6.7574615478515625, "global_step": 146153, "epoch": 3479} {"train_loss": -6.770603179931641, "global_step": 146154, "epoch": 3479} {"train_loss": -6.793980598449707, "global_step": 146155, "epoch": 3479} {"train_loss": -6.717877388000488, "global_step": 146156, "epoch": 3479} {"train_loss": -6.78007173538208, "global_step": 146157, "epoch": 3479} {"train_loss": -6.773712635040283, "global_step": 146158, "epoch": 3479} {"train_loss": -6.792034864425659, "global_step": 146159, "epoch": 3479, "val_loss": 78590.8203125} {"train_loss": -6.8110151290893555, "global_step": 146160, "epoch": 3480} {"train_loss": -6.865367889404297, "global_step": 146161, "epoch": 3480} {"train_loss": -6.843501567840576, "global_step": 146162, "epoch": 3480} {"train_loss": -6.899086952209473, "global_step": 146163, "epoch": 3480} {"train_loss": -6.852363586425781, "global_step": 146164, "epoch": 3480} {"train_loss": -6.878862380981445, "global_step": 146165, "epoch": 3480} {"train_loss": -6.771302700042725, "global_step": 146166, "epoch": 3480} {"train_loss": -6.753034591674805, "global_step": 146167, "epoch": 3480} {"train_loss": -6.715219497680664, "global_step": 146168, "epoch": 3480} {"train_loss": -6.717480659484863, "global_step": 146169, "epoch": 3480} {"train_loss": -6.838168144226074, "global_step": 146170, "epoch": 3480} {"train_loss": -6.6972975730896, "global_step": 146171, "epoch": 3480} {"train_loss": -6.84255313873291, "global_step": 146172, "epoch": 3480} {"train_loss": -6.688238143920898, "global_step": 146173, "epoch": 3480} {"train_loss": -6.736457824707031, "global_step": 146174, "epoch": 3480} {"train_loss": -6.760191917419434, "global_step": 146175, "epoch": 3480} {"train_loss": -6.650875091552734, "global_step": 146176, "epoch": 3480} {"train_loss": -6.832164287567139, "global_step": 146177, "epoch": 3480} {"train_loss": -6.741703033447266, "global_step": 146178, "epoch": 3480} {"train_loss": -6.756711959838867, "global_step": 146179, "epoch": 3480} {"train_loss": -6.811101913452148, "global_step": 146180, "epoch": 3480} {"train_loss": -6.729793071746826, "global_step": 146181, "epoch": 3480} {"train_loss": -6.616042613983154, "global_step": 146182, "epoch": 3480} {"train_loss": -6.836443901062012, "global_step": 146183, "epoch": 3480} {"train_loss": -6.689699172973633, "global_step": 146184, "epoch": 3480} {"train_loss": -6.8644866943359375, "global_step": 146185, "epoch": 3480} {"train_loss": -6.875205039978027, "global_step": 146186, "epoch": 3480} {"train_loss": -6.852972030639648, "global_step": 146187, "epoch": 3480} {"train_loss": -6.860253810882568, "global_step": 146188, "epoch": 3480} {"train_loss": -6.823760509490967, "global_step": 146189, "epoch": 3480} {"train_loss": -6.861452579498291, "global_step": 146190, "epoch": 3480} {"train_loss": -6.911964416503906, "global_step": 146191, "epoch": 3480} {"train_loss": -6.865527629852295, "global_step": 146192, "epoch": 3480} {"train_loss": -6.829864501953125, "global_step": 146193, "epoch": 3480} {"train_loss": -6.900712966918945, "global_step": 146194, "epoch": 3480} {"train_loss": -6.853480815887451, "global_step": 146195, "epoch": 3480} {"train_loss": -6.87041711807251, "global_step": 146196, "epoch": 3480} {"train_loss": -6.80863094329834, "global_step": 146197, "epoch": 3480} {"train_loss": -6.605171203613281, "global_step": 146198, "epoch": 3480} {"train_loss": -6.859700679779053, "global_step": 146199, "epoch": 3480} {"train_loss": -6.884930610656738, "global_step": 146200, "epoch": 3480} {"train_loss": -6.8029511996677945, "global_step": 146201, "epoch": 3480, "val_loss": 78424.0546875} {"train_loss": -6.841281414031982, "global_step": 146202, "epoch": 3481} {"train_loss": -6.920458793640137, "global_step": 146203, "epoch": 3481} {"train_loss": -6.793733596801758, "global_step": 146204, "epoch": 3481} {"train_loss": -6.962153434753418, "global_step": 146205, "epoch": 3481} {"train_loss": -6.789284706115723, "global_step": 146206, "epoch": 3481} {"train_loss": -6.806690216064453, "global_step": 146207, "epoch": 3481} {"train_loss": -6.85546875, "global_step": 146208, "epoch": 3481} {"train_loss": -6.9345598220825195, "global_step": 146209, "epoch": 3481} {"train_loss": -6.896937370300293, "global_step": 146210, "epoch": 3481} {"train_loss": -6.80385684967041, "global_step": 146211, "epoch": 3481} {"train_loss": -6.751646995544434, "global_step": 146212, "epoch": 3481} {"train_loss": -6.719122409820557, "global_step": 146213, "epoch": 3481} {"train_loss": -6.913903713226318, "global_step": 146214, "epoch": 3481} {"train_loss": -6.865549564361572, "global_step": 146215, "epoch": 3481} {"train_loss": -6.757190704345703, "global_step": 146216, "epoch": 3481} {"train_loss": -6.870644569396973, "global_step": 146217, "epoch": 3481} {"train_loss": -6.908346176147461, "global_step": 146218, "epoch": 3481} {"train_loss": -6.8291916847229, "global_step": 146219, "epoch": 3481} {"train_loss": -6.7755327224731445, "global_step": 146220, "epoch": 3481} {"train_loss": -6.7936248779296875, "global_step": 146221, "epoch": 3481} {"train_loss": -6.777403354644775, "global_step": 146222, "epoch": 3481} {"train_loss": -6.806313514709473, "global_step": 146223, "epoch": 3481} {"train_loss": -6.9076642990112305, "global_step": 146224, "epoch": 3481} {"train_loss": -6.862667083740234, "global_step": 146225, "epoch": 3481} {"train_loss": -6.9481072425842285, "global_step": 146226, "epoch": 3481} {"train_loss": -6.9545416831970215, "global_step": 146227, "epoch": 3481} {"train_loss": -6.878137111663818, "global_step": 146228, "epoch": 3481} {"train_loss": -6.83388614654541, "global_step": 146229, "epoch": 3481} {"train_loss": -6.913095474243164, "global_step": 146230, "epoch": 3481} {"train_loss": -6.779794216156006, "global_step": 146231, "epoch": 3481} {"train_loss": -7.001869201660156, "global_step": 146232, "epoch": 3481} {"train_loss": -6.911417007446289, "global_step": 146233, "epoch": 3481} {"train_loss": -6.828222274780273, "global_step": 146234, "epoch": 3481} {"train_loss": -6.984905242919922, "global_step": 146235, "epoch": 3481} {"train_loss": -6.849665641784668, "global_step": 146236, "epoch": 3481} {"train_loss": -6.9564313888549805, "global_step": 146237, "epoch": 3481} {"train_loss": -6.941890716552734, "global_step": 146238, "epoch": 3481} {"train_loss": -6.884100914001465, "global_step": 146239, "epoch": 3481} {"train_loss": -6.882822036743164, "global_step": 146240, "epoch": 3481} {"train_loss": -6.840332508087158, "global_step": 146241, "epoch": 3481} {"train_loss": -6.978661060333252, "global_step": 146242, "epoch": 3481} {"train_loss": -6.86650596346174, "global_step": 146243, "epoch": 3481, "val_loss": 78472.7265625} {"train_loss": -6.763768196105957, "global_step": 146244, "epoch": 3482} {"train_loss": -6.9909772872924805, "global_step": 146245, "epoch": 3482} {"train_loss": -6.926505088806152, "global_step": 146246, "epoch": 3482} {"train_loss": -6.824645519256592, "global_step": 146247, "epoch": 3482} {"train_loss": -6.860797882080078, "global_step": 146248, "epoch": 3482} {"train_loss": -6.783109188079834, "global_step": 146249, "epoch": 3482} {"train_loss": -6.798050403594971, "global_step": 146250, "epoch": 3482} {"train_loss": -6.9469099044799805, "global_step": 146251, "epoch": 3482} {"train_loss": -6.787353992462158, "global_step": 146252, "epoch": 3482} {"train_loss": -6.8376007080078125, "global_step": 146253, "epoch": 3482} {"train_loss": -6.905673503875732, "global_step": 146254, "epoch": 3482} {"train_loss": -6.8120927810668945, "global_step": 146255, "epoch": 3482} {"train_loss": -6.846166610717773, "global_step": 146256, "epoch": 3482} {"train_loss": -6.816603660583496, "global_step": 146257, "epoch": 3482} {"train_loss": -6.766913414001465, "global_step": 146258, "epoch": 3482} {"train_loss": -6.773670196533203, "global_step": 146259, "epoch": 3482} {"train_loss": -6.832769393920898, "global_step": 146260, "epoch": 3482} {"train_loss": -6.922294616699219, "global_step": 146261, "epoch": 3482} {"train_loss": -6.846290588378906, "global_step": 146262, "epoch": 3482} {"train_loss": -6.851873397827148, "global_step": 146263, "epoch": 3482} {"train_loss": -6.708738327026367, "global_step": 146264, "epoch": 3482} {"train_loss": -6.773738384246826, "global_step": 146265, "epoch": 3482} {"train_loss": -6.816381454467773, "global_step": 146266, "epoch": 3482} {"train_loss": -6.732988357543945, "global_step": 146267, "epoch": 3482} {"train_loss": -6.730348110198975, "global_step": 146268, "epoch": 3482} {"train_loss": -6.781618118286133, "global_step": 146269, "epoch": 3482} {"train_loss": -6.829546928405762, "global_step": 146270, "epoch": 3482} {"train_loss": -6.79000997543335, "global_step": 146271, "epoch": 3482} {"train_loss": -6.836981773376465, "global_step": 146272, "epoch": 3482} {"train_loss": -6.904638290405273, "global_step": 146273, "epoch": 3482} {"train_loss": -6.7670183181762695, "global_step": 146274, "epoch": 3482} {"train_loss": -6.795212745666504, "global_step": 146275, "epoch": 3482} {"train_loss": -6.898062705993652, "global_step": 146276, "epoch": 3482} {"train_loss": -6.843195915222168, "global_step": 146277, "epoch": 3482} {"train_loss": -6.805490016937256, "global_step": 146278, "epoch": 3482} {"train_loss": -6.763889312744141, "global_step": 146279, "epoch": 3482} {"train_loss": -6.903064250946045, "global_step": 146280, "epoch": 3482} {"train_loss": -6.867212295532227, "global_step": 146281, "epoch": 3482} {"train_loss": -6.8279337882995605, "global_step": 146282, "epoch": 3482} {"train_loss": -6.814252853393555, "global_step": 146283, "epoch": 3482} {"train_loss": -6.852162837982178, "global_step": 146284, "epoch": 3482} {"train_loss": -6.829317615145729, "global_step": 146285, "epoch": 3482, "val_loss": 78516.5625} {"train_loss": -6.851526260375977, "global_step": 146286, "epoch": 3483} {"train_loss": -6.838807106018066, "global_step": 146287, "epoch": 3483} {"train_loss": -6.73574686050415, "global_step": 146288, "epoch": 3483} {"train_loss": -6.909167766571045, "global_step": 146289, "epoch": 3483} {"train_loss": -6.914731502532959, "global_step": 146290, "epoch": 3483} {"train_loss": -6.744289398193359, "global_step": 146291, "epoch": 3483} {"train_loss": -6.817211151123047, "global_step": 146292, "epoch": 3483} {"train_loss": -6.795446872711182, "global_step": 146293, "epoch": 3483} {"train_loss": -6.81643009185791, "global_step": 146294, "epoch": 3483} {"train_loss": -6.837549209594727, "global_step": 146295, "epoch": 3483} {"train_loss": -6.861692905426025, "global_step": 146296, "epoch": 3483} {"train_loss": -6.73151969909668, "global_step": 146297, "epoch": 3483} {"train_loss": -6.774709701538086, "global_step": 146298, "epoch": 3483} {"train_loss": -6.773836612701416, "global_step": 146299, "epoch": 3483} {"train_loss": -6.85065221786499, "global_step": 146300, "epoch": 3483} {"train_loss": -6.828124523162842, "global_step": 146301, "epoch": 3483} {"train_loss": -6.726370811462402, "global_step": 146302, "epoch": 3483} {"train_loss": -6.735850811004639, "global_step": 146303, "epoch": 3483} {"train_loss": -6.796717643737793, "global_step": 146304, "epoch": 3483} {"train_loss": -6.7954912185668945, "global_step": 146305, "epoch": 3483} {"train_loss": -6.789011478424072, "global_step": 146306, "epoch": 3483} {"train_loss": -6.825047969818115, "global_step": 146307, "epoch": 3483} {"train_loss": -6.740818023681641, "global_step": 146308, "epoch": 3483} {"train_loss": -6.886824607849121, "global_step": 146309, "epoch": 3483} {"train_loss": -6.81494140625, "global_step": 146310, "epoch": 3483} {"train_loss": -6.697359085083008, "global_step": 146311, "epoch": 3483} {"train_loss": -6.8216753005981445, "global_step": 146312, "epoch": 3483} {"train_loss": -6.738883972167969, "global_step": 146313, "epoch": 3483} {"train_loss": -6.787891864776611, "global_step": 146314, "epoch": 3483} {"train_loss": -6.785557746887207, "global_step": 146315, "epoch": 3483} {"train_loss": -6.7991743087768555, "global_step": 146316, "epoch": 3483} {"train_loss": -6.79310417175293, "global_step": 146317, "epoch": 3483} {"train_loss": -6.8057475090026855, "global_step": 146318, "epoch": 3483} {"train_loss": -6.782840728759766, "global_step": 146319, "epoch": 3483} {"train_loss": -6.765155792236328, "global_step": 146320, "epoch": 3483} {"train_loss": -6.7721147537231445, "global_step": 146321, "epoch": 3483} {"train_loss": -6.799570083618164, "global_step": 146322, "epoch": 3483} {"train_loss": -6.754200458526611, "global_step": 146323, "epoch": 3483} {"train_loss": -6.956890106201172, "global_step": 146324, "epoch": 3483} {"train_loss": -6.801344871520996, "global_step": 146325, "epoch": 3483} {"train_loss": -6.808930397033691, "global_step": 146326, "epoch": 3483} {"train_loss": -6.801223891122, "global_step": 146327, "epoch": 3483, "val_loss": 78579.3125} {"train_loss": -6.772467613220215, "global_step": 146328, "epoch": 3484} {"train_loss": -6.952366828918457, "global_step": 146329, "epoch": 3484} {"train_loss": -6.8754472732543945, "global_step": 146330, "epoch": 3484} {"train_loss": -6.900671005249023, "global_step": 146331, "epoch": 3484} {"train_loss": -6.860939979553223, "global_step": 146332, "epoch": 3484} {"train_loss": -6.855650901794434, "global_step": 146333, "epoch": 3484} {"train_loss": -6.900744438171387, "global_step": 146334, "epoch": 3484} {"train_loss": -6.88935661315918, "global_step": 146335, "epoch": 3484} {"train_loss": -6.928540229797363, "global_step": 146336, "epoch": 3484} {"train_loss": -6.822304725646973, "global_step": 146337, "epoch": 3484} {"train_loss": -6.943362236022949, "global_step": 146338, "epoch": 3484} {"train_loss": -6.868403911590576, "global_step": 146339, "epoch": 3484} {"train_loss": -6.808722496032715, "global_step": 146340, "epoch": 3484} {"train_loss": -6.8594489097595215, "global_step": 146341, "epoch": 3484} {"train_loss": -6.894118309020996, "global_step": 146342, "epoch": 3484} {"train_loss": -6.887293338775635, "global_step": 146343, "epoch": 3484} {"train_loss": -6.816035747528076, "global_step": 146344, "epoch": 3484} {"train_loss": -6.925657272338867, "global_step": 146345, "epoch": 3484} {"train_loss": -6.815494060516357, "global_step": 146346, "epoch": 3484} {"train_loss": -6.902773380279541, "global_step": 146347, "epoch": 3484} {"train_loss": -6.891502380371094, "global_step": 146348, "epoch": 3484} {"train_loss": -6.836790084838867, "global_step": 146349, "epoch": 3484} {"train_loss": -6.8762922286987305, "global_step": 146350, "epoch": 3484} {"train_loss": -6.897056579589844, "global_step": 146351, "epoch": 3484} {"train_loss": -6.85579776763916, "global_step": 146352, "epoch": 3484} {"train_loss": -6.8433709144592285, "global_step": 146353, "epoch": 3484} {"train_loss": -6.901095867156982, "global_step": 146354, "epoch": 3484} {"train_loss": -6.877873420715332, "global_step": 146355, "epoch": 3484} {"train_loss": -6.821778297424316, "global_step": 146356, "epoch": 3484} {"train_loss": -6.910693645477295, "global_step": 146357, "epoch": 3484} {"train_loss": -6.7813496589660645, "global_step": 146358, "epoch": 3484} {"train_loss": -6.865423202514648, "global_step": 146359, "epoch": 3484} {"train_loss": -6.844736576080322, "global_step": 146360, "epoch": 3484} {"train_loss": -6.942363739013672, "global_step": 146361, "epoch": 3484} {"train_loss": -6.928896427154541, "global_step": 146362, "epoch": 3484} {"train_loss": -6.8963518142700195, "global_step": 146363, "epoch": 3484} {"train_loss": -6.721258163452148, "global_step": 146364, "epoch": 3484} {"train_loss": -6.823813438415527, "global_step": 146365, "epoch": 3484} {"train_loss": -6.850407123565674, "global_step": 146366, "epoch": 3484} {"train_loss": -6.801288604736328, "global_step": 146367, "epoch": 3484} {"train_loss": -6.934969902038574, "global_step": 146368, "epoch": 3484} {"train_loss": -6.866299231847127, "global_step": 146369, "epoch": 3484, "val_loss": 78572.40625} {"train_loss": -6.810378074645996, "global_step": 146370, "epoch": 3485} {"train_loss": -6.767917156219482, "global_step": 146371, "epoch": 3485} {"train_loss": -6.820089817047119, "global_step": 146372, "epoch": 3485} {"train_loss": -6.788010597229004, "global_step": 146373, "epoch": 3485} {"train_loss": -6.918521881103516, "global_step": 146374, "epoch": 3485} {"train_loss": -6.692704200744629, "global_step": 146375, "epoch": 3485} {"train_loss": -6.8342695236206055, "global_step": 146376, "epoch": 3485} {"train_loss": -6.901725769042969, "global_step": 146377, "epoch": 3485} {"train_loss": -6.730854034423828, "global_step": 146378, "epoch": 3485} {"train_loss": -6.835813522338867, "global_step": 146379, "epoch": 3485} {"train_loss": -6.886241912841797, "global_step": 146380, "epoch": 3485} {"train_loss": -6.810058116912842, "global_step": 146381, "epoch": 3485} {"train_loss": -6.90729284286499, "global_step": 146382, "epoch": 3485} {"train_loss": -6.774911403656006, "global_step": 146383, "epoch": 3485} {"train_loss": -6.771518230438232, "global_step": 146384, "epoch": 3485} {"train_loss": -6.948793411254883, "global_step": 146385, "epoch": 3485} {"train_loss": -6.855971336364746, "global_step": 146386, "epoch": 3485} {"train_loss": -6.863944053649902, "global_step": 146387, "epoch": 3485} {"train_loss": -6.771608352661133, "global_step": 146388, "epoch": 3485} {"train_loss": -6.677058219909668, "global_step": 146389, "epoch": 3485} {"train_loss": -6.8240647315979, "global_step": 146390, "epoch": 3485} {"train_loss": -6.760517120361328, "global_step": 146391, "epoch": 3485} {"train_loss": -6.765024185180664, "global_step": 146392, "epoch": 3485} {"train_loss": -6.821941375732422, "global_step": 146393, "epoch": 3485} {"train_loss": -6.779812812805176, "global_step": 146394, "epoch": 3485} {"train_loss": -6.850700855255127, "global_step": 146395, "epoch": 3485} {"train_loss": -6.870578765869141, "global_step": 146396, "epoch": 3485} {"train_loss": -6.718298435211182, "global_step": 146397, "epoch": 3485} {"train_loss": -6.767712593078613, "global_step": 146398, "epoch": 3485} {"train_loss": -6.691850662231445, "global_step": 146399, "epoch": 3485} {"train_loss": -6.870988368988037, "global_step": 146400, "epoch": 3485} {"train_loss": -6.74605655670166, "global_step": 146401, "epoch": 3485} {"train_loss": -6.774128437042236, "global_step": 146402, "epoch": 3485} {"train_loss": -6.803431034088135, "global_step": 146403, "epoch": 3485} {"train_loss": -6.754500389099121, "global_step": 146404, "epoch": 3485} {"train_loss": -6.829774856567383, "global_step": 146405, "epoch": 3485} {"train_loss": -6.76345157623291, "global_step": 146406, "epoch": 3485} {"train_loss": -6.746760845184326, "global_step": 146407, "epoch": 3485} {"train_loss": -6.767496585845947, "global_step": 146408, "epoch": 3485} {"train_loss": -6.7344841957092285, "global_step": 146409, "epoch": 3485} {"train_loss": -6.801906585693359, "global_step": 146410, "epoch": 3485} {"train_loss": -6.800901072365897, "global_step": 146411, "epoch": 3485, "val_loss": 78512.046875} {"train_loss": -6.809947967529297, "global_step": 146412, "epoch": 3486} {"train_loss": -6.892254829406738, "global_step": 146413, "epoch": 3486} {"train_loss": -6.856005668640137, "global_step": 146414, "epoch": 3486} {"train_loss": -6.896154403686523, "global_step": 146415, "epoch": 3486} {"train_loss": -6.903074264526367, "global_step": 146416, "epoch": 3486} {"train_loss": -6.836647033691406, "global_step": 146417, "epoch": 3486} {"train_loss": -6.836977481842041, "global_step": 146418, "epoch": 3486} {"train_loss": -6.82855224609375, "global_step": 146419, "epoch": 3486} {"train_loss": -6.908285140991211, "global_step": 146420, "epoch": 3486} {"train_loss": -6.761727333068848, "global_step": 146421, "epoch": 3486} {"train_loss": -6.812799453735352, "global_step": 146422, "epoch": 3486} {"train_loss": -6.790677070617676, "global_step": 146423, "epoch": 3486} {"train_loss": -6.598049163818359, "global_step": 146424, "epoch": 3486} {"train_loss": -6.720643997192383, "global_step": 146425, "epoch": 3486} {"train_loss": -6.721034049987793, "global_step": 146426, "epoch": 3486} {"train_loss": -6.750741958618164, "global_step": 146427, "epoch": 3486} {"train_loss": -6.881558418273926, "global_step": 146428, "epoch": 3486} {"train_loss": -6.868244171142578, "global_step": 146429, "epoch": 3486} {"train_loss": -6.928729057312012, "global_step": 146430, "epoch": 3486} {"train_loss": -6.947914123535156, "global_step": 146431, "epoch": 3486} {"train_loss": -6.793296813964844, "global_step": 146432, "epoch": 3486} {"train_loss": -6.848206043243408, "global_step": 146433, "epoch": 3486} {"train_loss": -6.838983535766602, "global_step": 146434, "epoch": 3486} {"train_loss": -6.757791996002197, "global_step": 146435, "epoch": 3486} {"train_loss": -6.825535774230957, "global_step": 146436, "epoch": 3486} {"train_loss": -6.837120056152344, "global_step": 146437, "epoch": 3486} {"train_loss": -6.7932634353637695, "global_step": 146438, "epoch": 3486} {"train_loss": -6.767829895019531, "global_step": 146439, "epoch": 3486} {"train_loss": -6.750943183898926, "global_step": 146440, "epoch": 3486} {"train_loss": -6.7642502784729, "global_step": 146441, "epoch": 3486} {"train_loss": -6.801811218261719, "global_step": 146442, "epoch": 3486} {"train_loss": -6.837767601013184, "global_step": 146443, "epoch": 3486} {"train_loss": -6.853676795959473, "global_step": 146444, "epoch": 3486} {"train_loss": -6.838178634643555, "global_step": 146445, "epoch": 3486} {"train_loss": -6.8873443603515625, "global_step": 146446, "epoch": 3486} {"train_loss": -6.852476119995117, "global_step": 146447, "epoch": 3486} {"train_loss": -6.945220947265625, "global_step": 146448, "epoch": 3486} {"train_loss": -6.649661064147949, "global_step": 146449, "epoch": 3486} {"train_loss": -6.752631187438965, "global_step": 146450, "epoch": 3486} {"train_loss": -6.7557373046875, "global_step": 146451, "epoch": 3486} {"train_loss": -6.641175270080566, "global_step": 146452, "epoch": 3486} {"train_loss": -6.81354942775908, "global_step": 146453, "epoch": 3486, "val_loss": 78386.9453125} {"train_loss": -6.962097644805908, "global_step": 146454, "epoch": 3487} {"train_loss": -6.817493438720703, "global_step": 146455, "epoch": 3487} {"train_loss": -7.017803192138672, "global_step": 146456, "epoch": 3487} {"train_loss": -6.820914268493652, "global_step": 146457, "epoch": 3487} {"train_loss": -6.788968086242676, "global_step": 146458, "epoch": 3487} {"train_loss": -6.887737274169922, "global_step": 146459, "epoch": 3487} {"train_loss": -6.874428749084473, "global_step": 146460, "epoch": 3487} {"train_loss": -6.822607040405273, "global_step": 146461, "epoch": 3487} {"train_loss": -6.952521324157715, "global_step": 146462, "epoch": 3487} {"train_loss": -6.951080322265625, "global_step": 146463, "epoch": 3487} {"train_loss": -6.8226518630981445, "global_step": 146464, "epoch": 3487} {"train_loss": -6.790379047393799, "global_step": 146465, "epoch": 3487} {"train_loss": -6.858097076416016, "global_step": 146466, "epoch": 3487} {"train_loss": -6.914646148681641, "global_step": 146467, "epoch": 3487} {"train_loss": -6.836258888244629, "global_step": 146468, "epoch": 3487} {"train_loss": -6.926547050476074, "global_step": 146469, "epoch": 3487} {"train_loss": -6.885698318481445, "global_step": 146470, "epoch": 3487} {"train_loss": -6.72413444519043, "global_step": 146471, "epoch": 3487} {"train_loss": -6.793302536010742, "global_step": 146472, "epoch": 3487} {"train_loss": -6.879366874694824, "global_step": 146473, "epoch": 3487} {"train_loss": -6.907356262207031, "global_step": 146474, "epoch": 3487} {"train_loss": -6.934332847595215, "global_step": 146475, "epoch": 3487} {"train_loss": -6.890948295593262, "global_step": 146476, "epoch": 3487} {"train_loss": -6.738928318023682, "global_step": 146477, "epoch": 3487} {"train_loss": -6.7853617668151855, "global_step": 146478, "epoch": 3487} {"train_loss": -6.6412153244018555, "global_step": 146479, "epoch": 3487} {"train_loss": -6.8513336181640625, "global_step": 146480, "epoch": 3487} {"train_loss": -6.700993061065674, "global_step": 146481, "epoch": 3487} {"train_loss": -6.708500862121582, "global_step": 146482, "epoch": 3487} {"train_loss": -6.753081321716309, "global_step": 146483, "epoch": 3487} {"train_loss": -6.828386306762695, "global_step": 146484, "epoch": 3487} {"train_loss": -6.713943958282471, "global_step": 146485, "epoch": 3487} {"train_loss": -6.871507167816162, "global_step": 146486, "epoch": 3487} {"train_loss": -6.681095600128174, "global_step": 146487, "epoch": 3487} {"train_loss": -6.729532241821289, "global_step": 146488, "epoch": 3487} {"train_loss": -6.838659763336182, "global_step": 146489, "epoch": 3487} {"train_loss": -6.783082962036133, "global_step": 146490, "epoch": 3487} {"train_loss": -6.772487640380859, "global_step": 146491, "epoch": 3487} {"train_loss": -6.6925859451293945, "global_step": 146492, "epoch": 3487} {"train_loss": -6.764948844909668, "global_step": 146493, "epoch": 3487} {"train_loss": -6.831137180328369, "global_step": 146494, "epoch": 3487} {"train_loss": -6.820838258379982, "global_step": 146495, "epoch": 3487, "val_loss": 78589.0625} {"train_loss": -6.774723052978516, "global_step": 146496, "epoch": 3488} {"train_loss": -6.8952436447143555, "global_step": 146497, "epoch": 3488} {"train_loss": -6.758666038513184, "global_step": 146498, "epoch": 3488} {"train_loss": -6.70287561416626, "global_step": 146499, "epoch": 3488} {"train_loss": -6.812524795532227, "global_step": 146500, "epoch": 3488} {"train_loss": -6.762453556060791, "global_step": 146501, "epoch": 3488} {"train_loss": -6.647116184234619, "global_step": 146502, "epoch": 3488} {"train_loss": -6.60629940032959, "global_step": 146503, "epoch": 3488} {"train_loss": -6.7734456062316895, "global_step": 146504, "epoch": 3488} {"train_loss": -6.63796329498291, "global_step": 146505, "epoch": 3488} {"train_loss": -6.7893524169921875, "global_step": 146506, "epoch": 3488} {"train_loss": -6.681198596954346, "global_step": 146507, "epoch": 3488} {"train_loss": -6.71534538269043, "global_step": 146508, "epoch": 3488} {"train_loss": -6.732778072357178, "global_step": 146509, "epoch": 3488} {"train_loss": -6.778280258178711, "global_step": 146510, "epoch": 3488} {"train_loss": -6.7580180168151855, "global_step": 146511, "epoch": 3488} {"train_loss": -6.743035793304443, "global_step": 146512, "epoch": 3488} {"train_loss": -6.774852275848389, "global_step": 146513, "epoch": 3488} {"train_loss": -6.8037214279174805, "global_step": 146514, "epoch": 3488} {"train_loss": -6.7794575691223145, "global_step": 146515, "epoch": 3488} {"train_loss": -6.807207107543945, "global_step": 146516, "epoch": 3488} {"train_loss": -6.737636566162109, "global_step": 146517, "epoch": 3488} {"train_loss": -6.924281597137451, "global_step": 146518, "epoch": 3488} {"train_loss": -6.782415390014648, "global_step": 146519, "epoch": 3488} {"train_loss": -6.718889236450195, "global_step": 146520, "epoch": 3488} {"train_loss": -6.839150428771973, "global_step": 146521, "epoch": 3488} {"train_loss": -6.808202266693115, "global_step": 146522, "epoch": 3488} {"train_loss": -6.657965660095215, "global_step": 146523, "epoch": 3488} {"train_loss": -6.647843360900879, "global_step": 146524, "epoch": 3488} {"train_loss": -6.861377716064453, "global_step": 146525, "epoch": 3488} {"train_loss": -6.760437488555908, "global_step": 146526, "epoch": 3488} {"train_loss": -6.878838539123535, "global_step": 146527, "epoch": 3488} {"train_loss": -6.77708625793457, "global_step": 146528, "epoch": 3488} {"train_loss": -6.730791091918945, "global_step": 146529, "epoch": 3488} {"train_loss": -6.73538875579834, "global_step": 146530, "epoch": 3488} {"train_loss": -6.894306659698486, "global_step": 146531, "epoch": 3488} {"train_loss": -6.902491569519043, "global_step": 146532, "epoch": 3488} {"train_loss": -6.790657997131348, "global_step": 146533, "epoch": 3488} {"train_loss": -6.764247894287109, "global_step": 146534, "epoch": 3488} {"train_loss": -6.793959617614746, "global_step": 146535, "epoch": 3488} {"train_loss": -6.804337501525879, "global_step": 146536, "epoch": 3488} {"train_loss": -6.771966673078991, "global_step": 146537, "epoch": 3488, "val_loss": 78406.578125} {"train_loss": -6.778961181640625, "global_step": 146538, "epoch": 3489} {"train_loss": -6.862649917602539, "global_step": 146539, "epoch": 3489} {"train_loss": -6.796189785003662, "global_step": 146540, "epoch": 3489} {"train_loss": -6.804816246032715, "global_step": 146541, "epoch": 3489} {"train_loss": -6.822786331176758, "global_step": 146542, "epoch": 3489} {"train_loss": -6.727778911590576, "global_step": 146543, "epoch": 3489} {"train_loss": -6.816821575164795, "global_step": 146544, "epoch": 3489} {"train_loss": -6.767994403839111, "global_step": 146545, "epoch": 3489} {"train_loss": -6.658658027648926, "global_step": 146546, "epoch": 3489} {"train_loss": -6.864621162414551, "global_step": 146547, "epoch": 3489} {"train_loss": -6.80190372467041, "global_step": 146548, "epoch": 3489} {"train_loss": -6.906601428985596, "global_step": 146549, "epoch": 3489} {"train_loss": -6.755293846130371, "global_step": 146550, "epoch": 3489} {"train_loss": -6.829804420471191, "global_step": 146551, "epoch": 3489} {"train_loss": -6.796463966369629, "global_step": 146552, "epoch": 3489} {"train_loss": -6.747157096862793, "global_step": 146553, "epoch": 3489} {"train_loss": -6.862462997436523, "global_step": 146554, "epoch": 3489} {"train_loss": -6.880672454833984, "global_step": 146555, "epoch": 3489} {"train_loss": -6.821789264678955, "global_step": 146556, "epoch": 3489} {"train_loss": -6.903625965118408, "global_step": 146557, "epoch": 3489} {"train_loss": -6.777544975280762, "global_step": 146558, "epoch": 3489} {"train_loss": -6.759141445159912, "global_step": 146559, "epoch": 3489} {"train_loss": -6.733663558959961, "global_step": 146560, "epoch": 3489} {"train_loss": -6.906952381134033, "global_step": 146561, "epoch": 3489} {"train_loss": -6.809064865112305, "global_step": 146562, "epoch": 3489} {"train_loss": -6.825222969055176, "global_step": 146563, "epoch": 3489} {"train_loss": -6.865987300872803, "global_step": 146564, "epoch": 3489} {"train_loss": -6.7644124031066895, "global_step": 146565, "epoch": 3489} {"train_loss": -6.699580192565918, "global_step": 146566, "epoch": 3489} {"train_loss": -6.731475830078125, "global_step": 146567, "epoch": 3489} {"train_loss": -6.84082555770874, "global_step": 146568, "epoch": 3489} {"train_loss": -6.845576286315918, "global_step": 146569, "epoch": 3489} {"train_loss": -6.822938442230225, "global_step": 146570, "epoch": 3489} {"train_loss": -6.874030113220215, "global_step": 146571, "epoch": 3489} {"train_loss": -6.778502941131592, "global_step": 146572, "epoch": 3489} {"train_loss": -6.849995136260986, "global_step": 146573, "epoch": 3489} {"train_loss": -6.676264762878418, "global_step": 146574, "epoch": 3489} {"train_loss": -6.820186614990234, "global_step": 146575, "epoch": 3489} {"train_loss": -6.735607147216797, "global_step": 146576, "epoch": 3489} {"train_loss": -6.519960403442383, "global_step": 146577, "epoch": 3489} {"train_loss": -6.739185333251953, "global_step": 146578, "epoch": 3489} {"train_loss": -6.794303723743984, "global_step": 146579, "epoch": 3489, "val_loss": 78323.15625} {"train_loss": -6.795064926147461, "global_step": 146580, "epoch": 3490} {"train_loss": -6.774919509887695, "global_step": 146581, "epoch": 3490} {"train_loss": -6.788031578063965, "global_step": 146582, "epoch": 3490} {"train_loss": -6.810262680053711, "global_step": 146583, "epoch": 3490} {"train_loss": -6.768536567687988, "global_step": 146584, "epoch": 3490} {"train_loss": -6.865772724151611, "global_step": 146585, "epoch": 3490} {"train_loss": -6.753351211547852, "global_step": 146586, "epoch": 3490} {"train_loss": -6.8262739181518555, "global_step": 146587, "epoch": 3490} {"train_loss": -6.868991851806641, "global_step": 146588, "epoch": 3490} {"train_loss": -6.88679313659668, "global_step": 146589, "epoch": 3490} {"train_loss": -6.800833225250244, "global_step": 146590, "epoch": 3490} {"train_loss": -6.769978046417236, "global_step": 146591, "epoch": 3490} {"train_loss": -6.711861610412598, "global_step": 146592, "epoch": 3490} {"train_loss": -6.8404412269592285, "global_step": 146593, "epoch": 3490} {"train_loss": -6.932795524597168, "global_step": 146594, "epoch": 3490} {"train_loss": -6.7543416023254395, "global_step": 146595, "epoch": 3490} {"train_loss": -6.796894550323486, "global_step": 146596, "epoch": 3490} {"train_loss": -6.62961483001709, "global_step": 146597, "epoch": 3490} {"train_loss": -6.788143157958984, "global_step": 146598, "epoch": 3490} {"train_loss": -6.7795939445495605, "global_step": 146599, "epoch": 3490} {"train_loss": -6.609041690826416, "global_step": 146600, "epoch": 3490} {"train_loss": -6.831933498382568, "global_step": 146601, "epoch": 3490} {"train_loss": -6.70109748840332, "global_step": 146602, "epoch": 3490} {"train_loss": -6.769923210144043, "global_step": 146603, "epoch": 3490} {"train_loss": -6.757998943328857, "global_step": 146604, "epoch": 3490} {"train_loss": -6.606080055236816, "global_step": 146605, "epoch": 3490} {"train_loss": -6.871901035308838, "global_step": 146606, "epoch": 3490} {"train_loss": -6.847013473510742, "global_step": 146607, "epoch": 3490} {"train_loss": -6.755929470062256, "global_step": 146608, "epoch": 3490} {"train_loss": -6.767750263214111, "global_step": 146609, "epoch": 3490} {"train_loss": -6.730690956115723, "global_step": 146610, "epoch": 3490} {"train_loss": -6.853613376617432, "global_step": 146611, "epoch": 3490} {"train_loss": -6.8312177658081055, "global_step": 146612, "epoch": 3490} {"train_loss": -6.900860786437988, "global_step": 146613, "epoch": 3490} {"train_loss": -6.8864006996154785, "global_step": 146614, "epoch": 3490} {"train_loss": -6.805048942565918, "global_step": 146615, "epoch": 3490} {"train_loss": -6.876948356628418, "global_step": 146616, "epoch": 3490} {"train_loss": -6.844135761260986, "global_step": 146617, "epoch": 3490} {"train_loss": -6.687073230743408, "global_step": 146618, "epoch": 3490} {"train_loss": -6.798804759979248, "global_step": 146619, "epoch": 3490} {"train_loss": -6.810888290405273, "global_step": 146620, "epoch": 3490} {"train_loss": -6.7909127076466875, "global_step": 146621, "epoch": 3490, "val_loss": 78549.9921875} {"train_loss": -6.824737548828125, "global_step": 146622, "epoch": 3491} {"train_loss": -6.777076721191406, "global_step": 146623, "epoch": 3491} {"train_loss": -6.820767402648926, "global_step": 146624, "epoch": 3491} {"train_loss": -6.774049758911133, "global_step": 146625, "epoch": 3491} {"train_loss": -6.842451572418213, "global_step": 146626, "epoch": 3491} {"train_loss": -6.908749103546143, "global_step": 146627, "epoch": 3491} {"train_loss": -6.8565168380737305, "global_step": 146628, "epoch": 3491} {"train_loss": -6.8931050300598145, "global_step": 146629, "epoch": 3491} {"train_loss": -6.767311096191406, "global_step": 146630, "epoch": 3491} {"train_loss": -6.763125419616699, "global_step": 146631, "epoch": 3491} {"train_loss": -6.692783832550049, "global_step": 146632, "epoch": 3491} {"train_loss": -6.849123477935791, "global_step": 146633, "epoch": 3491} {"train_loss": -6.813747406005859, "global_step": 146634, "epoch": 3491} {"train_loss": -6.870469570159912, "global_step": 146635, "epoch": 3491} {"train_loss": -6.796421527862549, "global_step": 146636, "epoch": 3491} {"train_loss": -6.853251934051514, "global_step": 146637, "epoch": 3491} {"train_loss": -6.798315048217773, "global_step": 146638, "epoch": 3491} {"train_loss": -6.906238079071045, "global_step": 146639, "epoch": 3491} {"train_loss": -6.933403968811035, "global_step": 146640, "epoch": 3491} {"train_loss": -6.833059310913086, "global_step": 146641, "epoch": 3491} {"train_loss": -6.726347923278809, "global_step": 146642, "epoch": 3491} {"train_loss": -6.785479545593262, "global_step": 146643, "epoch": 3491} {"train_loss": -6.7738542556762695, "global_step": 146644, "epoch": 3491} {"train_loss": -6.750254154205322, "global_step": 146645, "epoch": 3491} {"train_loss": -6.891962051391602, "global_step": 146646, "epoch": 3491} {"train_loss": -6.741722583770752, "global_step": 146647, "epoch": 3491} {"train_loss": -6.8413848876953125, "global_step": 146648, "epoch": 3491} {"train_loss": -6.734490394592285, "global_step": 146649, "epoch": 3491} {"train_loss": -6.752706050872803, "global_step": 146650, "epoch": 3491} {"train_loss": -6.820807456970215, "global_step": 146651, "epoch": 3491} {"train_loss": -6.744475364685059, "global_step": 146652, "epoch": 3491} {"train_loss": -6.895678520202637, "global_step": 146653, "epoch": 3491} {"train_loss": -6.915037155151367, "global_step": 146654, "epoch": 3491} {"train_loss": -6.931174278259277, "global_step": 146655, "epoch": 3491} {"train_loss": -6.838662147521973, "global_step": 146656, "epoch": 3491} {"train_loss": -7.0093278884887695, "global_step": 146657, "epoch": 3491} {"train_loss": -6.810259819030762, "global_step": 146658, "epoch": 3491} {"train_loss": -6.822786331176758, "global_step": 146659, "epoch": 3491} {"train_loss": -6.9702653884887695, "global_step": 146660, "epoch": 3491} {"train_loss": -6.8617706298828125, "global_step": 146661, "epoch": 3491} {"train_loss": -6.815515518188477, "global_step": 146662, "epoch": 3491} {"train_loss": -6.827636639277141, "global_step": 146663, "epoch": 3491, "val_loss": 78591.5078125} {"train_loss": -6.6124396324157715, "global_step": 146664, "epoch": 3492} {"train_loss": -6.827642917633057, "global_step": 146665, "epoch": 3492} {"train_loss": -6.819239139556885, "global_step": 146666, "epoch": 3492} {"train_loss": -6.834473133087158, "global_step": 146667, "epoch": 3492} {"train_loss": -6.867627143859863, "global_step": 146668, "epoch": 3492} {"train_loss": -6.802271366119385, "global_step": 146669, "epoch": 3492} {"train_loss": -6.793022155761719, "global_step": 146670, "epoch": 3492} {"train_loss": -6.74992561340332, "global_step": 146671, "epoch": 3492} {"train_loss": -6.8431901931762695, "global_step": 146672, "epoch": 3492} {"train_loss": -6.881933212280273, "global_step": 146673, "epoch": 3492} {"train_loss": -6.858426570892334, "global_step": 146674, "epoch": 3492} {"train_loss": -6.8789262771606445, "global_step": 146675, "epoch": 3492} {"train_loss": -6.819470405578613, "global_step": 146676, "epoch": 3492} {"train_loss": -6.740022659301758, "global_step": 146677, "epoch": 3492} {"train_loss": -6.857982158660889, "global_step": 146678, "epoch": 3492} {"train_loss": -6.821961402893066, "global_step": 146679, "epoch": 3492} {"train_loss": -6.879395484924316, "global_step": 146680, "epoch": 3492} {"train_loss": -6.789966583251953, "global_step": 146681, "epoch": 3492} {"train_loss": -6.869502067565918, "global_step": 146682, "epoch": 3492} {"train_loss": -6.881711959838867, "global_step": 146683, "epoch": 3492} {"train_loss": -6.823055267333984, "global_step": 146684, "epoch": 3492} {"train_loss": -6.798819541931152, "global_step": 146685, "epoch": 3492} {"train_loss": -6.693418502807617, "global_step": 146686, "epoch": 3492} {"train_loss": -6.862351894378662, "global_step": 146687, "epoch": 3492} {"train_loss": -6.799374580383301, "global_step": 146688, "epoch": 3492} {"train_loss": -6.921356201171875, "global_step": 146689, "epoch": 3492} {"train_loss": -6.735796928405762, "global_step": 146690, "epoch": 3492} {"train_loss": -6.8528900146484375, "global_step": 146691, "epoch": 3492} {"train_loss": -6.736473083496094, "global_step": 146692, "epoch": 3492} {"train_loss": -6.804316520690918, "global_step": 146693, "epoch": 3492} {"train_loss": -6.965262413024902, "global_step": 146694, "epoch": 3492} {"train_loss": -6.773950576782227, "global_step": 146695, "epoch": 3492} {"train_loss": -6.8970136642456055, "global_step": 146696, "epoch": 3492} {"train_loss": -6.885878086090088, "global_step": 146697, "epoch": 3492} {"train_loss": -6.8111467361450195, "global_step": 146698, "epoch": 3492} {"train_loss": -6.94590950012207, "global_step": 146699, "epoch": 3492} {"train_loss": -6.995321273803711, "global_step": 146700, "epoch": 3492} {"train_loss": -6.8964524269104, "global_step": 146701, "epoch": 3492} {"train_loss": -6.813597679138184, "global_step": 146702, "epoch": 3492} {"train_loss": -6.917325019836426, "global_step": 146703, "epoch": 3492} {"train_loss": -6.779910087585449, "global_step": 146704, "epoch": 3492} {"train_loss": -6.835792972928002, "global_step": 146705, "epoch": 3492, "val_loss": 78575.4765625} {"train_loss": -6.762938022613525, "global_step": 146706, "epoch": 3493} {"train_loss": -6.634432792663574, "global_step": 146707, "epoch": 3493} {"train_loss": -6.67055606842041, "global_step": 146708, "epoch": 3493} {"train_loss": -6.825898170471191, "global_step": 146709, "epoch": 3493} {"train_loss": -6.628983497619629, "global_step": 146710, "epoch": 3493} {"train_loss": -6.729372978210449, "global_step": 146711, "epoch": 3493} {"train_loss": -6.611516952514648, "global_step": 146712, "epoch": 3493} {"train_loss": -6.782668590545654, "global_step": 146713, "epoch": 3493} {"train_loss": -6.731183052062988, "global_step": 146714, "epoch": 3493} {"train_loss": -6.901584625244141, "global_step": 146715, "epoch": 3493} {"train_loss": -6.8304443359375, "global_step": 146716, "epoch": 3493} {"train_loss": -6.832876205444336, "global_step": 146717, "epoch": 3493} {"train_loss": -6.897995471954346, "global_step": 146718, "epoch": 3493} {"train_loss": -6.795285224914551, "global_step": 146719, "epoch": 3493} {"train_loss": -6.925372123718262, "global_step": 146720, "epoch": 3493} {"train_loss": -6.802397727966309, "global_step": 146721, "epoch": 3493} {"train_loss": -6.892247200012207, "global_step": 146722, "epoch": 3493} {"train_loss": -6.769602298736572, "global_step": 146723, "epoch": 3493} {"train_loss": -6.843010425567627, "global_step": 146724, "epoch": 3493} {"train_loss": -6.804305076599121, "global_step": 146725, "epoch": 3493} {"train_loss": -6.888419151306152, "global_step": 146726, "epoch": 3493} {"train_loss": -6.803027629852295, "global_step": 146727, "epoch": 3493} {"train_loss": -6.780780792236328, "global_step": 146728, "epoch": 3493} {"train_loss": -6.934879779815674, "global_step": 146729, "epoch": 3493} {"train_loss": -6.825023651123047, "global_step": 146730, "epoch": 3493} {"train_loss": -6.9105987548828125, "global_step": 146731, "epoch": 3493} {"train_loss": -6.928632736206055, "global_step": 146732, "epoch": 3493} {"train_loss": -6.7831268310546875, "global_step": 146733, "epoch": 3493} {"train_loss": -6.8476409912109375, "global_step": 146734, "epoch": 3493} {"train_loss": -6.847158432006836, "global_step": 146735, "epoch": 3493} {"train_loss": -6.8767290115356445, "global_step": 146736, "epoch": 3493} {"train_loss": -6.88475227355957, "global_step": 146737, "epoch": 3493} {"train_loss": -6.76784086227417, "global_step": 146738, "epoch": 3493} {"train_loss": -7.05774450302124, "global_step": 146739, "epoch": 3493} {"train_loss": -6.807131767272949, "global_step": 146740, "epoch": 3493} {"train_loss": -6.765514373779297, "global_step": 146741, "epoch": 3493} {"train_loss": -6.80539083480835, "global_step": 146742, "epoch": 3493} {"train_loss": -6.8240156173706055, "global_step": 146743, "epoch": 3493} {"train_loss": -6.888120651245117, "global_step": 146744, "epoch": 3493} {"train_loss": -6.689223289489746, "global_step": 146745, "epoch": 3493} {"train_loss": -6.698081970214844, "global_step": 146746, "epoch": 3493} {"train_loss": -6.808414561407907, "global_step": 146747, "epoch": 3493, "val_loss": 78748.953125} {"train_loss": -6.595397472381592, "global_step": 146748, "epoch": 3494} {"train_loss": -6.811347007751465, "global_step": 146749, "epoch": 3494} {"train_loss": -6.669373512268066, "global_step": 146750, "epoch": 3494} {"train_loss": -6.894099235534668, "global_step": 146751, "epoch": 3494} {"train_loss": -6.6525774002075195, "global_step": 146752, "epoch": 3494} {"train_loss": -6.827588081359863, "global_step": 146753, "epoch": 3494} {"train_loss": -6.683662414550781, "global_step": 146754, "epoch": 3494} {"train_loss": -6.701735019683838, "global_step": 146755, "epoch": 3494} {"train_loss": -6.6876959800720215, "global_step": 146756, "epoch": 3494} {"train_loss": -6.665509223937988, "global_step": 146757, "epoch": 3494} {"train_loss": -6.784282207489014, "global_step": 146758, "epoch": 3494} {"train_loss": -6.805169105529785, "global_step": 146759, "epoch": 3494} {"train_loss": -6.755579948425293, "global_step": 146760, "epoch": 3494} {"train_loss": -6.720837593078613, "global_step": 146761, "epoch": 3494} {"train_loss": -6.88400411605835, "global_step": 146762, "epoch": 3494} {"train_loss": -6.863295555114746, "global_step": 146763, "epoch": 3494} {"train_loss": -6.796459197998047, "global_step": 146764, "epoch": 3494} {"train_loss": -6.815861225128174, "global_step": 146765, "epoch": 3494} {"train_loss": -6.865762710571289, "global_step": 146766, "epoch": 3494} {"train_loss": -6.865442752838135, "global_step": 146767, "epoch": 3494} {"train_loss": -6.895659446716309, "global_step": 146768, "epoch": 3494} {"train_loss": -6.780725002288818, "global_step": 146769, "epoch": 3494} {"train_loss": -6.873068809509277, "global_step": 146770, "epoch": 3494} {"train_loss": -6.992949485778809, "global_step": 146771, "epoch": 3494} {"train_loss": -6.724550247192383, "global_step": 146772, "epoch": 3494} {"train_loss": -6.85943078994751, "global_step": 146773, "epoch": 3494} {"train_loss": -6.816587448120117, "global_step": 146774, "epoch": 3494} {"train_loss": -6.762063980102539, "global_step": 146775, "epoch": 3494} {"train_loss": -6.844274520874023, "global_step": 146776, "epoch": 3494} {"train_loss": -6.597786903381348, "global_step": 146777, "epoch": 3494} {"train_loss": -6.775232315063477, "global_step": 146778, "epoch": 3494} {"train_loss": -6.8339409828186035, "global_step": 146779, "epoch": 3494} {"train_loss": -6.795505046844482, "global_step": 146780, "epoch": 3494} {"train_loss": -6.747096061706543, "global_step": 146781, "epoch": 3494} {"train_loss": -6.848797798156738, "global_step": 146782, "epoch": 3494} {"train_loss": -6.838767051696777, "global_step": 146783, "epoch": 3494} {"train_loss": -6.899158477783203, "global_step": 146784, "epoch": 3494} {"train_loss": -6.818411827087402, "global_step": 146785, "epoch": 3494} {"train_loss": -6.973557949066162, "global_step": 146786, "epoch": 3494} {"train_loss": -6.890969276428223, "global_step": 146787, "epoch": 3494} {"train_loss": -6.916151523590088, "global_step": 146788, "epoch": 3494} {"train_loss": -6.801485368183681, "global_step": 146789, "epoch": 3494, "val_loss": 78422.4140625} {"train_loss": -6.826623916625977, "global_step": 146790, "epoch": 3495} {"train_loss": -6.771183967590332, "global_step": 146791, "epoch": 3495} {"train_loss": -6.936060905456543, "global_step": 146792, "epoch": 3495} {"train_loss": -6.870030879974365, "global_step": 146793, "epoch": 3495} {"train_loss": -6.8987627029418945, "global_step": 146794, "epoch": 3495} {"train_loss": -6.923524856567383, "global_step": 146795, "epoch": 3495} {"train_loss": -6.918731689453125, "global_step": 146796, "epoch": 3495} {"train_loss": -6.8881731033325195, "global_step": 146797, "epoch": 3495} {"train_loss": -6.876228332519531, "global_step": 146798, "epoch": 3495} {"train_loss": -6.89304780960083, "global_step": 146799, "epoch": 3495} {"train_loss": -6.9062676429748535, "global_step": 146800, "epoch": 3495} {"train_loss": -6.8984270095825195, "global_step": 146801, "epoch": 3495} {"train_loss": -6.830148696899414, "global_step": 146802, "epoch": 3495} {"train_loss": -6.836573600769043, "global_step": 146803, "epoch": 3495} {"train_loss": -6.962352752685547, "global_step": 146804, "epoch": 3495} {"train_loss": -6.900394439697266, "global_step": 146805, "epoch": 3495} {"train_loss": -6.875449180603027, "global_step": 146806, "epoch": 3495} {"train_loss": -6.8766632080078125, "global_step": 146807, "epoch": 3495} {"train_loss": -6.91087532043457, "global_step": 146808, "epoch": 3495} {"train_loss": -6.935012340545654, "global_step": 146809, "epoch": 3495} {"train_loss": -6.870379447937012, "global_step": 146810, "epoch": 3495} {"train_loss": -6.887877941131592, "global_step": 146811, "epoch": 3495} {"train_loss": -6.838334083557129, "global_step": 146812, "epoch": 3495} {"train_loss": -6.891351699829102, "global_step": 146813, "epoch": 3495} {"train_loss": -7.004908561706543, "global_step": 146814, "epoch": 3495} {"train_loss": -6.868915557861328, "global_step": 146815, "epoch": 3495} {"train_loss": -6.792380332946777, "global_step": 146816, "epoch": 3495} {"train_loss": -6.839799404144287, "global_step": 146817, "epoch": 3495} {"train_loss": -6.8359575271606445, "global_step": 146818, "epoch": 3495} {"train_loss": -6.926490306854248, "global_step": 146819, "epoch": 3495} {"train_loss": -6.906513690948486, "global_step": 146820, "epoch": 3495} {"train_loss": -6.8459367752075195, "global_step": 146821, "epoch": 3495} {"train_loss": -6.930473327636719, "global_step": 146822, "epoch": 3495} {"train_loss": -6.835848331451416, "global_step": 146823, "epoch": 3495} {"train_loss": -6.925166130065918, "global_step": 146824, "epoch": 3495} {"train_loss": -6.858766555786133, "global_step": 146825, "epoch": 3495} {"train_loss": -6.890682697296143, "global_step": 146826, "epoch": 3495} {"train_loss": -6.7663679122924805, "global_step": 146827, "epoch": 3495} {"train_loss": -6.8896074295043945, "global_step": 146828, "epoch": 3495} {"train_loss": -6.865462303161621, "global_step": 146829, "epoch": 3495} {"train_loss": -6.960362911224365, "global_step": 146830, "epoch": 3495} {"train_loss": -6.879205669675555, "global_step": 146831, "epoch": 3495, "val_loss": 78574.375} {"train_loss": -6.861005783081055, "global_step": 146832, "epoch": 3496} {"train_loss": -6.884324073791504, "global_step": 146833, "epoch": 3496} {"train_loss": -6.75221586227417, "global_step": 146834, "epoch": 3496} {"train_loss": -6.818707466125488, "global_step": 146835, "epoch": 3496} {"train_loss": -6.79185676574707, "global_step": 146836, "epoch": 3496} {"train_loss": -6.916223049163818, "global_step": 146837, "epoch": 3496} {"train_loss": -6.753973007202148, "global_step": 146838, "epoch": 3496} {"train_loss": -6.9754462242126465, "global_step": 146839, "epoch": 3496} {"train_loss": -6.692244052886963, "global_step": 146840, "epoch": 3496} {"train_loss": -6.870340824127197, "global_step": 146841, "epoch": 3496} {"train_loss": -6.8043365478515625, "global_step": 146842, "epoch": 3496} {"train_loss": -6.826727390289307, "global_step": 146843, "epoch": 3496} {"train_loss": -6.821337699890137, "global_step": 146844, "epoch": 3496} {"train_loss": -6.864985466003418, "global_step": 146845, "epoch": 3496} {"train_loss": -6.826987266540527, "global_step": 146846, "epoch": 3496} {"train_loss": -6.883698463439941, "global_step": 146847, "epoch": 3496} {"train_loss": -6.812298774719238, "global_step": 146848, "epoch": 3496} {"train_loss": -6.776836395263672, "global_step": 146849, "epoch": 3496} {"train_loss": -6.836175441741943, "global_step": 146850, "epoch": 3496} {"train_loss": -6.740236759185791, "global_step": 146851, "epoch": 3496} {"train_loss": -6.770510673522949, "global_step": 146852, "epoch": 3496} {"train_loss": -6.782362937927246, "global_step": 146853, "epoch": 3496} {"train_loss": -6.87360954284668, "global_step": 146854, "epoch": 3496} {"train_loss": -6.875887393951416, "global_step": 146855, "epoch": 3496} {"train_loss": -6.888507843017578, "global_step": 146856, "epoch": 3496} {"train_loss": -6.814851760864258, "global_step": 146857, "epoch": 3496} {"train_loss": -6.8638386726379395, "global_step": 146858, "epoch": 3496} {"train_loss": -6.7347941398620605, "global_step": 146859, "epoch": 3496} {"train_loss": -6.784304618835449, "global_step": 146860, "epoch": 3496} {"train_loss": -6.831817150115967, "global_step": 146861, "epoch": 3496} {"train_loss": -6.873509883880615, "global_step": 146862, "epoch": 3496} {"train_loss": -6.924561500549316, "global_step": 146863, "epoch": 3496} {"train_loss": -6.859283447265625, "global_step": 146864, "epoch": 3496} {"train_loss": -6.76972770690918, "global_step": 146865, "epoch": 3496} {"train_loss": -6.8885579109191895, "global_step": 146866, "epoch": 3496} {"train_loss": -6.8072099685668945, "global_step": 146867, "epoch": 3496} {"train_loss": -6.764214038848877, "global_step": 146868, "epoch": 3496} {"train_loss": -6.8484625816345215, "global_step": 146869, "epoch": 3496} {"train_loss": -6.782256126403809, "global_step": 146870, "epoch": 3496} {"train_loss": -6.792117118835449, "global_step": 146871, "epoch": 3496} {"train_loss": -6.716650009155273, "global_step": 146872, "epoch": 3496} {"train_loss": -6.8238131772904165, "global_step": 146873, "epoch": 3496, "val_loss": 78408.3671875} {"train_loss": -6.822184085845947, "global_step": 146874, "epoch": 3497} {"train_loss": -6.794179916381836, "global_step": 146875, "epoch": 3497} {"train_loss": -6.771009922027588, "global_step": 146876, "epoch": 3497} {"train_loss": -6.8717145919799805, "global_step": 146877, "epoch": 3497} {"train_loss": -6.835063934326172, "global_step": 146878, "epoch": 3497} {"train_loss": -6.877654075622559, "global_step": 146879, "epoch": 3497} {"train_loss": -6.779054641723633, "global_step": 146880, "epoch": 3497} {"train_loss": -6.729998588562012, "global_step": 146881, "epoch": 3497} {"train_loss": -6.880455017089844, "global_step": 146882, "epoch": 3497} {"train_loss": -6.772524833679199, "global_step": 146883, "epoch": 3497} {"train_loss": -6.819461822509766, "global_step": 146884, "epoch": 3497} {"train_loss": -6.804028511047363, "global_step": 146885, "epoch": 3497} {"train_loss": -6.825369834899902, "global_step": 146886, "epoch": 3497} {"train_loss": -6.874154090881348, "global_step": 146887, "epoch": 3497} {"train_loss": -6.765716552734375, "global_step": 146888, "epoch": 3497} {"train_loss": -6.812247276306152, "global_step": 146889, "epoch": 3497} {"train_loss": -6.67667293548584, "global_step": 146890, "epoch": 3497} {"train_loss": -6.679156303405762, "global_step": 146891, "epoch": 3497} {"train_loss": -6.86148738861084, "global_step": 146892, "epoch": 3497} {"train_loss": -6.595787048339844, "global_step": 146893, "epoch": 3497} {"train_loss": -6.793713569641113, "global_step": 146894, "epoch": 3497} {"train_loss": -6.726963043212891, "global_step": 146895, "epoch": 3497} {"train_loss": -6.667102813720703, "global_step": 146896, "epoch": 3497} {"train_loss": -6.673087120056152, "global_step": 146897, "epoch": 3497} {"train_loss": -6.504139423370361, "global_step": 146898, "epoch": 3497} {"train_loss": -6.718700408935547, "global_step": 146899, "epoch": 3497} {"train_loss": -6.536789417266846, "global_step": 146900, "epoch": 3497} {"train_loss": -6.7832465171813965, "global_step": 146901, "epoch": 3497} {"train_loss": -6.696285247802734, "global_step": 146902, "epoch": 3497} {"train_loss": -6.783333778381348, "global_step": 146903, "epoch": 3497} {"train_loss": -6.694265365600586, "global_step": 146904, "epoch": 3497} {"train_loss": -6.685412883758545, "global_step": 146905, "epoch": 3497} {"train_loss": -6.788793087005615, "global_step": 146906, "epoch": 3497} {"train_loss": -6.795489311218262, "global_step": 146907, "epoch": 3497} {"train_loss": -6.7352800369262695, "global_step": 146908, "epoch": 3497} {"train_loss": -6.727123737335205, "global_step": 146909, "epoch": 3497} {"train_loss": -6.753182411193848, "global_step": 146910, "epoch": 3497} {"train_loss": -6.792226314544678, "global_step": 146911, "epoch": 3497} {"train_loss": -6.7573747634887695, "global_step": 146912, "epoch": 3497} {"train_loss": -6.747912406921387, "global_step": 146913, "epoch": 3497} {"train_loss": -6.8010358810424805, "global_step": 146914, "epoch": 3497} {"train_loss": -6.757087741579328, "global_step": 146915, "epoch": 3497, "val_loss": 78657.984375} {"train_loss": -6.87180233001709, "global_step": 146916, "epoch": 3498} {"train_loss": -6.817892074584961, "global_step": 146917, "epoch": 3498} {"train_loss": -6.860910415649414, "global_step": 146918, "epoch": 3498} {"train_loss": -6.859030246734619, "global_step": 146919, "epoch": 3498} {"train_loss": -6.809504508972168, "global_step": 146920, "epoch": 3498} {"train_loss": -6.884182929992676, "global_step": 146921, "epoch": 3498} {"train_loss": -6.934566974639893, "global_step": 146922, "epoch": 3498} {"train_loss": -6.797637939453125, "global_step": 146923, "epoch": 3498} {"train_loss": -6.916031837463379, "global_step": 146924, "epoch": 3498} {"train_loss": -6.90377140045166, "global_step": 146925, "epoch": 3498} {"train_loss": -6.929030418395996, "global_step": 146926, "epoch": 3498} {"train_loss": -6.790098190307617, "global_step": 146927, "epoch": 3498} {"train_loss": -6.867977142333984, "global_step": 146928, "epoch": 3498} {"train_loss": -6.7748494148254395, "global_step": 146929, "epoch": 3498} {"train_loss": -6.790717601776123, "global_step": 146930, "epoch": 3498} {"train_loss": -6.821724891662598, "global_step": 146931, "epoch": 3498} {"train_loss": -6.869352340698242, "global_step": 146932, "epoch": 3498} {"train_loss": -6.8847761154174805, "global_step": 146933, "epoch": 3498} {"train_loss": -6.914742946624756, "global_step": 146934, "epoch": 3498} {"train_loss": -6.878157138824463, "global_step": 146935, "epoch": 3498} {"train_loss": -6.8795013427734375, "global_step": 146936, "epoch": 3498} {"train_loss": -6.848575592041016, "global_step": 146937, "epoch": 3498} {"train_loss": -6.929274559020996, "global_step": 146938, "epoch": 3498} {"train_loss": -6.823631286621094, "global_step": 146939, "epoch": 3498} {"train_loss": -6.747330665588379, "global_step": 146940, "epoch": 3498} {"train_loss": -6.870326042175293, "global_step": 146941, "epoch": 3498} {"train_loss": -6.798700332641602, "global_step": 146942, "epoch": 3498} {"train_loss": -6.830522060394287, "global_step": 146943, "epoch": 3498} {"train_loss": -6.881581783294678, "global_step": 146944, "epoch": 3498} {"train_loss": -6.805080413818359, "global_step": 146945, "epoch": 3498} {"train_loss": -6.891757965087891, "global_step": 146946, "epoch": 3498} {"train_loss": -6.927289962768555, "global_step": 146947, "epoch": 3498} {"train_loss": -6.875894546508789, "global_step": 146948, "epoch": 3498} {"train_loss": -6.929050445556641, "global_step": 146949, "epoch": 3498} {"train_loss": -6.812411308288574, "global_step": 146950, "epoch": 3498} {"train_loss": -6.901181221008301, "global_step": 146951, "epoch": 3498} {"train_loss": -6.796252250671387, "global_step": 146952, "epoch": 3498} {"train_loss": -6.869063377380371, "global_step": 146953, "epoch": 3498} {"train_loss": -6.914071083068848, "global_step": 146954, "epoch": 3498} {"train_loss": -6.834524154663086, "global_step": 146955, "epoch": 3498} {"train_loss": -6.871321678161621, "global_step": 146956, "epoch": 3498} {"train_loss": -6.860635337375459, "global_step": 146957, "epoch": 3498, "val_loss": 78583.21875} {"train_loss": -6.899469375610352, "global_step": 146958, "epoch": 3499} {"train_loss": -6.835209369659424, "global_step": 146959, "epoch": 3499} {"train_loss": -6.882290363311768, "global_step": 146960, "epoch": 3499} {"train_loss": -6.964695453643799, "global_step": 146961, "epoch": 3499} {"train_loss": -6.779808044433594, "global_step": 146962, "epoch": 3499} {"train_loss": -6.890235900878906, "global_step": 146963, "epoch": 3499} {"train_loss": -6.776703834533691, "global_step": 146964, "epoch": 3499} {"train_loss": -6.909890174865723, "global_step": 146965, "epoch": 3499} {"train_loss": -6.986851215362549, "global_step": 146966, "epoch": 3499} {"train_loss": -6.7482452392578125, "global_step": 146967, "epoch": 3499} {"train_loss": -6.928196430206299, "global_step": 146968, "epoch": 3499} {"train_loss": -6.837353229522705, "global_step": 146969, "epoch": 3499} {"train_loss": -6.747661113739014, "global_step": 146970, "epoch": 3499} {"train_loss": -6.798064708709717, "global_step": 146971, "epoch": 3499} {"train_loss": -6.955102443695068, "global_step": 146972, "epoch": 3499} {"train_loss": -6.857268333435059, "global_step": 146973, "epoch": 3499} {"train_loss": -6.949904918670654, "global_step": 146974, "epoch": 3499} {"train_loss": -6.814946174621582, "global_step": 146975, "epoch": 3499} {"train_loss": -6.797637939453125, "global_step": 146976, "epoch": 3499} {"train_loss": -6.9858903884887695, "global_step": 146977, "epoch": 3499} {"train_loss": -6.823647975921631, "global_step": 146978, "epoch": 3499} {"train_loss": -6.663653373718262, "global_step": 146979, "epoch": 3499} {"train_loss": -6.868056297302246, "global_step": 146980, "epoch": 3499} {"train_loss": -6.758632659912109, "global_step": 146981, "epoch": 3499} {"train_loss": -6.703675746917725, "global_step": 146982, "epoch": 3499} {"train_loss": -6.85459041595459, "global_step": 146983, "epoch": 3499} {"train_loss": -6.847182273864746, "global_step": 146984, "epoch": 3499} {"train_loss": -6.8250627517700195, "global_step": 146985, "epoch": 3499} {"train_loss": -6.952219486236572, "global_step": 146986, "epoch": 3499} {"train_loss": -6.882529258728027, "global_step": 146987, "epoch": 3499} {"train_loss": -6.853525161743164, "global_step": 146988, "epoch": 3499} {"train_loss": -6.9217529296875, "global_step": 146989, "epoch": 3499} {"train_loss": -6.819329738616943, "global_step": 146990, "epoch": 3499} {"train_loss": -6.894525527954102, "global_step": 146991, "epoch": 3499} {"train_loss": -6.8652849197387695, "global_step": 146992, "epoch": 3499} {"train_loss": -6.844892501831055, "global_step": 146993, "epoch": 3499} {"train_loss": -6.857563018798828, "global_step": 146994, "epoch": 3499} {"train_loss": -6.748067855834961, "global_step": 146995, "epoch": 3499} {"train_loss": -6.830106735229492, "global_step": 146996, "epoch": 3499} {"train_loss": -6.8581085205078125, "global_step": 146997, "epoch": 3499} {"train_loss": -6.7063751220703125, "global_step": 146998, "epoch": 3499} {"train_loss": -6.84604100953965, "global_step": 146999, "epoch": 3499, "val_loss": 78681.5625} {"train_loss": -6.736367702484131, "global_step": 147000, "epoch": 3500} {"train_loss": -6.8004961013793945, "global_step": 147001, "epoch": 3500} {"train_loss": -6.810906410217285, "global_step": 147002, "epoch": 3500} {"train_loss": -6.810740947723389, "global_step": 147003, "epoch": 3500} {"train_loss": -6.870142936706543, "global_step": 147004, "epoch": 3500} {"train_loss": -6.805548191070557, "global_step": 147005, "epoch": 3500} {"train_loss": -6.853023529052734, "global_step": 147006, "epoch": 3500} {"train_loss": -6.856810569763184, "global_step": 147007, "epoch": 3500} {"train_loss": -6.764803886413574, "global_step": 147008, "epoch": 3500} {"train_loss": -6.894935131072998, "global_step": 147009, "epoch": 3500} {"train_loss": -6.896230697631836, "global_step": 147010, "epoch": 3500} {"train_loss": -6.766481399536133, "global_step": 147011, "epoch": 3500} {"train_loss": -6.864140510559082, "global_step": 147012, "epoch": 3500} {"train_loss": -6.697235107421875, "global_step": 147013, "epoch": 3500} {"train_loss": -6.7728657722473145, "global_step": 147014, "epoch": 3500} {"train_loss": -6.827180862426758, "global_step": 147015, "epoch": 3500} {"train_loss": -6.791031837463379, "global_step": 147016, "epoch": 3500} {"train_loss": -6.731539249420166, "global_step": 147017, "epoch": 3500} {"train_loss": -6.691072940826416, "global_step": 147018, "epoch": 3500} {"train_loss": -6.617805480957031, "global_step": 147019, "epoch": 3500} {"train_loss": -6.852877616882324, "global_step": 147020, "epoch": 3500} {"train_loss": -6.624545097351074, "global_step": 147021, "epoch": 3500} {"train_loss": -6.743186950683594, "global_step": 147022, "epoch": 3500} {"train_loss": -6.744786262512207, "global_step": 147023, "epoch": 3500} {"train_loss": -6.628479957580566, "global_step": 147024, "epoch": 3500} {"train_loss": -6.719839096069336, "global_step": 147025, "epoch": 3500} {"train_loss": -6.427773952484131, "global_step": 147026, "epoch": 3500} {"train_loss": -6.775629043579102, "global_step": 147027, "epoch": 3500} {"train_loss": -6.59602689743042, "global_step": 147028, "epoch": 3500} {"train_loss": -6.863950729370117, "global_step": 147029, "epoch": 3500} {"train_loss": -6.682342529296875, "global_step": 147030, "epoch": 3500} {"train_loss": -6.694173336029053, "global_step": 147031, "epoch": 3500} {"train_loss": -6.823611259460449, "global_step": 147032, "epoch": 3500} {"train_loss": -6.651912689208984, "global_step": 147033, "epoch": 3500} {"train_loss": -6.781023025512695, "global_step": 147034, "epoch": 3500} {"train_loss": -6.801727294921875, "global_step": 147035, "epoch": 3500} {"train_loss": -6.651646614074707, "global_step": 147036, "epoch": 3500} {"train_loss": -6.722794532775879, "global_step": 147037, "epoch": 3500} {"train_loss": -6.785459518432617, "global_step": 147038, "epoch": 3500} {"train_loss": -6.757706642150879, "global_step": 147039, "epoch": 3500} {"train_loss": -6.781749725341797, "global_step": 147040, "epoch": 3500} {"train_loss": -6.7537213280087425, "global_step": 147041, "epoch": 3500, "train/sim_max_reward_0": 0.8599554082903468, "train/sim_max_reward_1": 0.4296068322673853, "train/sim_max_reward_2": 0.4201341991980087, "train/sim_max_reward_3": 0.13504581027293233, "train/sim_max_reward_4": 0.8658920960758193, "train/sim_max_reward_5": 0.5727933470607128, "test/sim_max_reward_4500000": 0.9935002370739884, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.8686310536860021, "test/sim_max_reward_4500003": 0.9654576845302371, "test/sim_max_reward_4500004": 0.19748780615349087, "test/sim_max_reward_4500005": 0.9742922203282782, "test/sim_max_reward_4500006": 0.9625000850164835, "test/sim_max_reward_4500007": 0.9414224524512379, "test/sim_max_reward_4500008": 0.383502339912813, "test/sim_max_reward_4500009": 0.05341076557445537, "test/sim_max_reward_4500010": 0.18016122307054247, "test/sim_max_reward_4500011": 0.9449222282037972, "test/sim_max_reward_4500012": 0.8505707897661491, "test/sim_max_reward_4500013": 0.004296764231990662, "test/sim_max_reward_4500014": 0.9228934854903873, "test/sim_max_reward_4500015": 0.9272027469393694, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.14747810416924345, "test/sim_max_reward_4500018": 0.4434312077081415, "test/sim_max_reward_4500019": 0.9711525439351886, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9163462108079964, "test/sim_max_reward_4500022": 0.9214866425987476, "test/sim_max_reward_4500023": 0.5346361306332756, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.6928295826988047, "test/sim_max_reward_4500026": 0.9643127687072379, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.1015363458943072, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0495590467788576, "test/sim_max_reward_4500033": 0.08287518269813765, "test/sim_max_reward_4500034": 0.8742686062117132, "test/sim_max_reward_4500035": 0.673649864126455, "test/sim_max_reward_4500036": 0.9299373229287157, "test/sim_max_reward_4500037": 0.9989221555670219, "test/sim_max_reward_4500038": 0.30516662526674904, "test/sim_max_reward_4500039": 0.9781491861456764, "test/sim_max_reward_4500040": 0.8392336814889199, "test/sim_max_reward_4500041": 0.9911066835267183, "test/sim_max_reward_4500042": 0.915856154798235, "test/sim_max_reward_4500043": 1.0, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9407997940298308, "test/sim_max_reward_4500046": 0.21722482651803587, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5472379488608675, "test/mean_score": 0.5977674363123716, "val_loss": 78479.7890625} {"train_loss": -6.8012895584106445, "global_step": 147042, "epoch": 3501} {"train_loss": -6.778723239898682, "global_step": 147043, "epoch": 3501} {"train_loss": -6.776421070098877, "global_step": 147044, "epoch": 3501} {"train_loss": -6.782158851623535, "global_step": 147045, "epoch": 3501} {"train_loss": -6.77985954284668, "global_step": 147046, "epoch": 3501} {"train_loss": -6.796358108520508, "global_step": 147047, "epoch": 3501} {"train_loss": -6.883088111877441, "global_step": 147048, "epoch": 3501} {"train_loss": -6.77092170715332, "global_step": 147049, "epoch": 3501} {"train_loss": -6.8231587409973145, "global_step": 147050, "epoch": 3501} {"train_loss": -6.871273040771484, "global_step": 147051, "epoch": 3501} {"train_loss": -6.888804912567139, "global_step": 147052, "epoch": 3501} {"train_loss": -6.819962501525879, "global_step": 147053, "epoch": 3501} {"train_loss": -6.805354118347168, "global_step": 147054, "epoch": 3501} {"train_loss": -6.810479164123535, "global_step": 147055, "epoch": 3501} {"train_loss": -6.810532569885254, "global_step": 147056, "epoch": 3501} {"train_loss": -6.97705602645874, "global_step": 147057, "epoch": 3501} {"train_loss": -6.854086875915527, "global_step": 147058, "epoch": 3501} {"train_loss": -6.798828125, "global_step": 147059, "epoch": 3501} {"train_loss": -6.699448585510254, "global_step": 147060, "epoch": 3501} {"train_loss": -6.910984992980957, "global_step": 147061, "epoch": 3501} {"train_loss": -6.79730224609375, "global_step": 147062, "epoch": 3501} {"train_loss": -6.89491081237793, "global_step": 147063, "epoch": 3501} {"train_loss": -6.86454439163208, "global_step": 147064, "epoch": 3501} {"train_loss": -6.830506324768066, "global_step": 147065, "epoch": 3501} {"train_loss": -6.957156658172607, "global_step": 147066, "epoch": 3501} {"train_loss": -6.837648868560791, "global_step": 147067, "epoch": 3501} {"train_loss": -6.693703651428223, "global_step": 147068, "epoch": 3501} {"train_loss": -6.719669818878174, "global_step": 147069, "epoch": 3501} {"train_loss": -6.779231548309326, "global_step": 147070, "epoch": 3501} {"train_loss": -6.773335933685303, "global_step": 147071, "epoch": 3501} {"train_loss": -6.657998085021973, "global_step": 147072, "epoch": 3501} {"train_loss": -6.847123146057129, "global_step": 147073, "epoch": 3501} {"train_loss": -6.704348564147949, "global_step": 147074, "epoch": 3501} {"train_loss": -6.736084938049316, "global_step": 147075, "epoch": 3501} {"train_loss": -6.793828010559082, "global_step": 147076, "epoch": 3501} {"train_loss": -6.82680606842041, "global_step": 147077, "epoch": 3501} {"train_loss": -6.801451683044434, "global_step": 147078, "epoch": 3501} {"train_loss": -6.903241157531738, "global_step": 147079, "epoch": 3501} {"train_loss": -6.929518699645996, "global_step": 147080, "epoch": 3501} {"train_loss": -6.914183616638184, "global_step": 147081, "epoch": 3501} {"train_loss": -6.812442302703857, "global_step": 147082, "epoch": 3501} {"train_loss": -6.819789523170108, "global_step": 147083, "epoch": 3501, "val_loss": 78478.1015625} {"train_loss": -6.945798873901367, "global_step": 147084, "epoch": 3502} {"train_loss": -6.892516136169434, "global_step": 147085, "epoch": 3502} {"train_loss": -6.888530254364014, "global_step": 147086, "epoch": 3502} {"train_loss": -6.809256553649902, "global_step": 147087, "epoch": 3502} {"train_loss": -6.841309547424316, "global_step": 147088, "epoch": 3502} {"train_loss": -6.805316925048828, "global_step": 147089, "epoch": 3502} {"train_loss": -6.730747222900391, "global_step": 147090, "epoch": 3502} {"train_loss": -6.844244480133057, "global_step": 147091, "epoch": 3502} {"train_loss": -6.816065788269043, "global_step": 147092, "epoch": 3502} {"train_loss": -6.829329013824463, "global_step": 147093, "epoch": 3502} {"train_loss": -6.784153461456299, "global_step": 147094, "epoch": 3502} {"train_loss": -6.8827667236328125, "global_step": 147095, "epoch": 3502} {"train_loss": -6.826443672180176, "global_step": 147096, "epoch": 3502} {"train_loss": -6.897148609161377, "global_step": 147097, "epoch": 3502} {"train_loss": -6.8951334953308105, "global_step": 147098, "epoch": 3502} {"train_loss": -6.804110527038574, "global_step": 147099, "epoch": 3502} {"train_loss": -6.907294750213623, "global_step": 147100, "epoch": 3502} {"train_loss": -6.773411750793457, "global_step": 147101, "epoch": 3502} {"train_loss": -6.894819259643555, "global_step": 147102, "epoch": 3502} {"train_loss": -6.853724956512451, "global_step": 147103, "epoch": 3502} {"train_loss": -6.783513069152832, "global_step": 147104, "epoch": 3502} {"train_loss": -6.7336344718933105, "global_step": 147105, "epoch": 3502} {"train_loss": -6.91397762298584, "global_step": 147106, "epoch": 3502} {"train_loss": -6.871343612670898, "global_step": 147107, "epoch": 3502} {"train_loss": -6.822842597961426, "global_step": 147108, "epoch": 3502} {"train_loss": -6.810873031616211, "global_step": 147109, "epoch": 3502} {"train_loss": -6.80198335647583, "global_step": 147110, "epoch": 3502} {"train_loss": -6.872561454772949, "global_step": 147111, "epoch": 3502} {"train_loss": -6.752429008483887, "global_step": 147112, "epoch": 3502} {"train_loss": -6.899646759033203, "global_step": 147113, "epoch": 3502} {"train_loss": -6.974713325500488, "global_step": 147114, "epoch": 3502} {"train_loss": -6.812959671020508, "global_step": 147115, "epoch": 3502} {"train_loss": -6.878907680511475, "global_step": 147116, "epoch": 3502} {"train_loss": -6.904227256774902, "global_step": 147117, "epoch": 3502} {"train_loss": -6.838989734649658, "global_step": 147118, "epoch": 3502} {"train_loss": -6.936370849609375, "global_step": 147119, "epoch": 3502} {"train_loss": -6.834277153015137, "global_step": 147120, "epoch": 3502} {"train_loss": -6.942481517791748, "global_step": 147121, "epoch": 3502} {"train_loss": -6.813901901245117, "global_step": 147122, "epoch": 3502} {"train_loss": -6.838623046875, "global_step": 147123, "epoch": 3502} {"train_loss": -6.8564453125, "global_step": 147124, "epoch": 3502} {"train_loss": -6.848951453254337, "global_step": 147125, "epoch": 3502, "val_loss": 78497.484375} {"train_loss": -6.8400678634643555, "global_step": 147126, "epoch": 3503} {"train_loss": -7.012392044067383, "global_step": 147127, "epoch": 3503} {"train_loss": -6.928412437438965, "global_step": 147128, "epoch": 3503} {"train_loss": -6.7026495933532715, "global_step": 147129, "epoch": 3503} {"train_loss": -6.75568962097168, "global_step": 147130, "epoch": 3503} {"train_loss": -6.762009620666504, "global_step": 147131, "epoch": 3503} {"train_loss": -6.848887920379639, "global_step": 147132, "epoch": 3503} {"train_loss": -6.584339141845703, "global_step": 147133, "epoch": 3503} {"train_loss": -6.801396369934082, "global_step": 147134, "epoch": 3503} {"train_loss": -6.779514789581299, "global_step": 147135, "epoch": 3503} {"train_loss": -6.758175849914551, "global_step": 147136, "epoch": 3503} {"train_loss": -6.788814067840576, "global_step": 147137, "epoch": 3503} {"train_loss": -6.648977279663086, "global_step": 147138, "epoch": 3503} {"train_loss": -6.903841972351074, "global_step": 147139, "epoch": 3503} {"train_loss": -6.755280494689941, "global_step": 147140, "epoch": 3503} {"train_loss": -6.6543869972229, "global_step": 147141, "epoch": 3503} {"train_loss": -6.777371406555176, "global_step": 147142, "epoch": 3503} {"train_loss": -6.793169021606445, "global_step": 147143, "epoch": 3503} {"train_loss": -6.755985260009766, "global_step": 147144, "epoch": 3503} {"train_loss": -6.821106910705566, "global_step": 147145, "epoch": 3503} {"train_loss": -6.82463264465332, "global_step": 147146, "epoch": 3503} {"train_loss": -6.7519073486328125, "global_step": 147147, "epoch": 3503} {"train_loss": -6.924244403839111, "global_step": 147148, "epoch": 3503} {"train_loss": -6.808475494384766, "global_step": 147149, "epoch": 3503} {"train_loss": -6.86259651184082, "global_step": 147150, "epoch": 3503} {"train_loss": -6.842394828796387, "global_step": 147151, "epoch": 3503} {"train_loss": -6.890749931335449, "global_step": 147152, "epoch": 3503} {"train_loss": -6.926483631134033, "global_step": 147153, "epoch": 3503} {"train_loss": -6.843158721923828, "global_step": 147154, "epoch": 3503} {"train_loss": -6.853906154632568, "global_step": 147155, "epoch": 3503} {"train_loss": -6.913113594055176, "global_step": 147156, "epoch": 3503} {"train_loss": -6.862648010253906, "global_step": 147157, "epoch": 3503} {"train_loss": -6.900815010070801, "global_step": 147158, "epoch": 3503} {"train_loss": -6.915804862976074, "global_step": 147159, "epoch": 3503} {"train_loss": -6.822187900543213, "global_step": 147160, "epoch": 3503} {"train_loss": -6.828605651855469, "global_step": 147161, "epoch": 3503} {"train_loss": -6.848170757293701, "global_step": 147162, "epoch": 3503} {"train_loss": -6.910005569458008, "global_step": 147163, "epoch": 3503} {"train_loss": -6.910801887512207, "global_step": 147164, "epoch": 3503} {"train_loss": -6.891568660736084, "global_step": 147165, "epoch": 3503} {"train_loss": -6.862870216369629, "global_step": 147166, "epoch": 3503} {"train_loss": -6.827621187482562, "global_step": 147167, "epoch": 3503, "val_loss": 78342.1484375} {"train_loss": -6.792641639709473, "global_step": 147168, "epoch": 3504} {"train_loss": -6.87919807434082, "global_step": 147169, "epoch": 3504} {"train_loss": -7.011214256286621, "global_step": 147170, "epoch": 3504} {"train_loss": -6.904157638549805, "global_step": 147171, "epoch": 3504} {"train_loss": -6.93919563293457, "global_step": 147172, "epoch": 3504} {"train_loss": -6.792374610900879, "global_step": 147173, "epoch": 3504} {"train_loss": -6.8685150146484375, "global_step": 147174, "epoch": 3504} {"train_loss": -6.8470458984375, "global_step": 147175, "epoch": 3504} {"train_loss": -6.712785243988037, "global_step": 147176, "epoch": 3504} {"train_loss": -6.818611145019531, "global_step": 147177, "epoch": 3504} {"train_loss": -6.8384599685668945, "global_step": 147178, "epoch": 3504} {"train_loss": -6.781351089477539, "global_step": 147179, "epoch": 3504} {"train_loss": -6.794866561889648, "global_step": 147180, "epoch": 3504} {"train_loss": -6.848056793212891, "global_step": 147181, "epoch": 3504} {"train_loss": -6.876121520996094, "global_step": 147182, "epoch": 3504} {"train_loss": -6.539059162139893, "global_step": 147183, "epoch": 3504} {"train_loss": -6.66779899597168, "global_step": 147184, "epoch": 3504} {"train_loss": -6.612934112548828, "global_step": 147185, "epoch": 3504} {"train_loss": -6.589138507843018, "global_step": 147186, "epoch": 3504} {"train_loss": -6.762653350830078, "global_step": 147187, "epoch": 3504} {"train_loss": -6.577099800109863, "global_step": 147188, "epoch": 3504} {"train_loss": -6.686445236206055, "global_step": 147189, "epoch": 3504} {"train_loss": -6.650013446807861, "global_step": 147190, "epoch": 3504} {"train_loss": -6.7237749099731445, "global_step": 147191, "epoch": 3504} {"train_loss": -6.748287200927734, "global_step": 147192, "epoch": 3504} {"train_loss": -6.815003395080566, "global_step": 147193, "epoch": 3504} {"train_loss": -6.707147598266602, "global_step": 147194, "epoch": 3504} {"train_loss": -6.642727851867676, "global_step": 147195, "epoch": 3504} {"train_loss": -6.818686485290527, "global_step": 147196, "epoch": 3504} {"train_loss": -6.7095818519592285, "global_step": 147197, "epoch": 3504} {"train_loss": -6.8072028160095215, "global_step": 147198, "epoch": 3504} {"train_loss": -6.733298301696777, "global_step": 147199, "epoch": 3504} {"train_loss": -6.7151288986206055, "global_step": 147200, "epoch": 3504} {"train_loss": -6.8202619552612305, "global_step": 147201, "epoch": 3504} {"train_loss": -6.762221336364746, "global_step": 147202, "epoch": 3504} {"train_loss": -6.773933410644531, "global_step": 147203, "epoch": 3504} {"train_loss": -6.812351226806641, "global_step": 147204, "epoch": 3504} {"train_loss": -6.936659812927246, "global_step": 147205, "epoch": 3504} {"train_loss": -6.775783538818359, "global_step": 147206, "epoch": 3504} {"train_loss": -6.801657676696777, "global_step": 147207, "epoch": 3504} {"train_loss": -6.861940383911133, "global_step": 147208, "epoch": 3504} {"train_loss": -6.777552127838135, "global_step": 147209, "epoch": 3504, "val_loss": 78464.6015625} {"train_loss": -6.843357086181641, "global_step": 147210, "epoch": 3505} {"train_loss": -6.953783988952637, "global_step": 147211, "epoch": 3505} {"train_loss": -6.773652076721191, "global_step": 147212, "epoch": 3505} {"train_loss": -6.857354164123535, "global_step": 147213, "epoch": 3505} {"train_loss": -6.774425506591797, "global_step": 147214, "epoch": 3505} {"train_loss": -6.852459907531738, "global_step": 147215, "epoch": 3505} {"train_loss": -6.865867614746094, "global_step": 147216, "epoch": 3505} {"train_loss": -6.815249443054199, "global_step": 147217, "epoch": 3505} {"train_loss": -6.747164726257324, "global_step": 147218, "epoch": 3505} {"train_loss": -6.790914535522461, "global_step": 147219, "epoch": 3505} {"train_loss": -6.84865665435791, "global_step": 147220, "epoch": 3505} {"train_loss": -6.897798538208008, "global_step": 147221, "epoch": 3505} {"train_loss": -6.774830341339111, "global_step": 147222, "epoch": 3505} {"train_loss": -6.799687385559082, "global_step": 147223, "epoch": 3505} {"train_loss": -6.680905342102051, "global_step": 147224, "epoch": 3505} {"train_loss": -6.815952301025391, "global_step": 147225, "epoch": 3505} {"train_loss": -6.612937927246094, "global_step": 147226, "epoch": 3505} {"train_loss": -6.792482376098633, "global_step": 147227, "epoch": 3505} {"train_loss": -6.905815601348877, "global_step": 147228, "epoch": 3505} {"train_loss": -6.795055389404297, "global_step": 147229, "epoch": 3505} {"train_loss": -6.909972190856934, "global_step": 147230, "epoch": 3505} {"train_loss": -6.79885196685791, "global_step": 147231, "epoch": 3505} {"train_loss": -6.797396659851074, "global_step": 147232, "epoch": 3505} {"train_loss": -6.744011878967285, "global_step": 147233, "epoch": 3505} {"train_loss": -6.778124809265137, "global_step": 147234, "epoch": 3505} {"train_loss": -6.896128177642822, "global_step": 147235, "epoch": 3505} {"train_loss": -6.921184062957764, "global_step": 147236, "epoch": 3505} {"train_loss": -6.850937843322754, "global_step": 147237, "epoch": 3505} {"train_loss": -6.813250541687012, "global_step": 147238, "epoch": 3505} {"train_loss": -6.837102890014648, "global_step": 147239, "epoch": 3505} {"train_loss": -6.990600109100342, "global_step": 147240, "epoch": 3505} {"train_loss": -6.930269241333008, "global_step": 147241, "epoch": 3505} {"train_loss": -6.72896671295166, "global_step": 147242, "epoch": 3505} {"train_loss": -6.888463020324707, "global_step": 147243, "epoch": 3505} {"train_loss": -6.783794403076172, "global_step": 147244, "epoch": 3505} {"train_loss": -6.784533977508545, "global_step": 147245, "epoch": 3505} {"train_loss": -6.810385227203369, "global_step": 147246, "epoch": 3505} {"train_loss": -6.827912330627441, "global_step": 147247, "epoch": 3505} {"train_loss": -6.8527703285217285, "global_step": 147248, "epoch": 3505} {"train_loss": -6.899791717529297, "global_step": 147249, "epoch": 3505} {"train_loss": -6.790224552154541, "global_step": 147250, "epoch": 3505} {"train_loss": -6.825344891775222, "global_step": 147251, "epoch": 3505, "val_loss": 78520.109375} {"train_loss": -6.759437561035156, "global_step": 147252, "epoch": 3506} {"train_loss": -6.8344221115112305, "global_step": 147253, "epoch": 3506} {"train_loss": -6.8582763671875, "global_step": 147254, "epoch": 3506} {"train_loss": -6.824940204620361, "global_step": 147255, "epoch": 3506} {"train_loss": -6.748114585876465, "global_step": 147256, "epoch": 3506} {"train_loss": -6.6358795166015625, "global_step": 147257, "epoch": 3506} {"train_loss": -6.822251319885254, "global_step": 147258, "epoch": 3506} {"train_loss": -6.927290439605713, "global_step": 147259, "epoch": 3506} {"train_loss": -6.825952053070068, "global_step": 147260, "epoch": 3506} {"train_loss": -6.71349573135376, "global_step": 147261, "epoch": 3506} {"train_loss": -6.814038276672363, "global_step": 147262, "epoch": 3506} {"train_loss": -6.604480743408203, "global_step": 147263, "epoch": 3506} {"train_loss": -6.822970390319824, "global_step": 147264, "epoch": 3506} {"train_loss": -6.671333312988281, "global_step": 147265, "epoch": 3506} {"train_loss": -6.768597602844238, "global_step": 147266, "epoch": 3506} {"train_loss": -6.818121910095215, "global_step": 147267, "epoch": 3506} {"train_loss": -6.760283946990967, "global_step": 147268, "epoch": 3506} {"train_loss": -6.739984512329102, "global_step": 147269, "epoch": 3506} {"train_loss": -6.84910249710083, "global_step": 147270, "epoch": 3506} {"train_loss": -6.837021827697754, "global_step": 147271, "epoch": 3506} {"train_loss": -6.7487311363220215, "global_step": 147272, "epoch": 3506} {"train_loss": -6.857526779174805, "global_step": 147273, "epoch": 3506} {"train_loss": -6.756071090698242, "global_step": 147274, "epoch": 3506} {"train_loss": -6.6386308670043945, "global_step": 147275, "epoch": 3506} {"train_loss": -6.749030113220215, "global_step": 147276, "epoch": 3506} {"train_loss": -6.862759590148926, "global_step": 147277, "epoch": 3506} {"train_loss": -6.802254676818848, "global_step": 147278, "epoch": 3506} {"train_loss": -6.7566423416137695, "global_step": 147279, "epoch": 3506} {"train_loss": -6.804418563842773, "global_step": 147280, "epoch": 3506} {"train_loss": -6.685268402099609, "global_step": 147281, "epoch": 3506} {"train_loss": -6.799731254577637, "global_step": 147282, "epoch": 3506} {"train_loss": -6.758265495300293, "global_step": 147283, "epoch": 3506} {"train_loss": -6.891460418701172, "global_step": 147284, "epoch": 3506} {"train_loss": -6.734407424926758, "global_step": 147285, "epoch": 3506} {"train_loss": -6.822844505310059, "global_step": 147286, "epoch": 3506} {"train_loss": -6.703383445739746, "global_step": 147287, "epoch": 3506} {"train_loss": -6.707487106323242, "global_step": 147288, "epoch": 3506} {"train_loss": -6.772160530090332, "global_step": 147289, "epoch": 3506} {"train_loss": -6.795195579528809, "global_step": 147290, "epoch": 3506} {"train_loss": -6.9146928787231445, "global_step": 147291, "epoch": 3506} {"train_loss": -6.836270809173584, "global_step": 147292, "epoch": 3506} {"train_loss": -6.78197245370774, "global_step": 147293, "epoch": 3506, "val_loss": 78636.890625} {"train_loss": -6.7649383544921875, "global_step": 147294, "epoch": 3507} {"train_loss": -6.826979637145996, "global_step": 147295, "epoch": 3507} {"train_loss": -6.825730323791504, "global_step": 147296, "epoch": 3507} {"train_loss": -6.8910980224609375, "global_step": 147297, "epoch": 3507} {"train_loss": -6.878190517425537, "global_step": 147298, "epoch": 3507} {"train_loss": -6.867215156555176, "global_step": 147299, "epoch": 3507} {"train_loss": -6.878344535827637, "global_step": 147300, "epoch": 3507} {"train_loss": -6.836216926574707, "global_step": 147301, "epoch": 3507} {"train_loss": -6.925299644470215, "global_step": 147302, "epoch": 3507} {"train_loss": -6.867430210113525, "global_step": 147303, "epoch": 3507} {"train_loss": -6.895999431610107, "global_step": 147304, "epoch": 3507} {"train_loss": -6.895655632019043, "global_step": 147305, "epoch": 3507} {"train_loss": -6.90052604675293, "global_step": 147306, "epoch": 3507} {"train_loss": -6.949708461761475, "global_step": 147307, "epoch": 3507} {"train_loss": -6.862082481384277, "global_step": 147308, "epoch": 3507} {"train_loss": -6.904074668884277, "global_step": 147309, "epoch": 3507} {"train_loss": -6.918313026428223, "global_step": 147310, "epoch": 3507} {"train_loss": -6.8778228759765625, "global_step": 147311, "epoch": 3507} {"train_loss": -6.872422218322754, "global_step": 147312, "epoch": 3507} {"train_loss": -6.914811611175537, "global_step": 147313, "epoch": 3507} {"train_loss": -6.819415092468262, "global_step": 147314, "epoch": 3507} {"train_loss": -6.956406593322754, "global_step": 147315, "epoch": 3507} {"train_loss": -6.831799030303955, "global_step": 147316, "epoch": 3507} {"train_loss": -6.855214595794678, "global_step": 147317, "epoch": 3507} {"train_loss": -6.908077239990234, "global_step": 147318, "epoch": 3507} {"train_loss": -6.956881999969482, "global_step": 147319, "epoch": 3507} {"train_loss": -6.793900489807129, "global_step": 147320, "epoch": 3507} {"train_loss": -7.018592834472656, "global_step": 147321, "epoch": 3507} {"train_loss": -6.771394729614258, "global_step": 147322, "epoch": 3507} {"train_loss": -6.867230415344238, "global_step": 147323, "epoch": 3507} {"train_loss": -6.74919319152832, "global_step": 147324, "epoch": 3507} {"train_loss": -6.881032466888428, "global_step": 147325, "epoch": 3507} {"train_loss": -6.783383846282959, "global_step": 147326, "epoch": 3507} {"train_loss": -6.819850444793701, "global_step": 147327, "epoch": 3507} {"train_loss": -6.789032936096191, "global_step": 147328, "epoch": 3507} {"train_loss": -6.8318634033203125, "global_step": 147329, "epoch": 3507} {"train_loss": -6.8318328857421875, "global_step": 147330, "epoch": 3507} {"train_loss": -6.8071160316467285, "global_step": 147331, "epoch": 3507} {"train_loss": -6.768709659576416, "global_step": 147332, "epoch": 3507} {"train_loss": -6.883847236633301, "global_step": 147333, "epoch": 3507} {"train_loss": -6.896761417388916, "global_step": 147334, "epoch": 3507} {"train_loss": -6.86131967817034, "global_step": 147335, "epoch": 3507, "val_loss": 78467.875} {"train_loss": -6.893549919128418, "global_step": 147336, "epoch": 3508} {"train_loss": -6.814908027648926, "global_step": 147337, "epoch": 3508} {"train_loss": -7.005064010620117, "global_step": 147338, "epoch": 3508} {"train_loss": -6.844751358032227, "global_step": 147339, "epoch": 3508} {"train_loss": -6.840073585510254, "global_step": 147340, "epoch": 3508} {"train_loss": -6.758945465087891, "global_step": 147341, "epoch": 3508} {"train_loss": -6.860494136810303, "global_step": 147342, "epoch": 3508} {"train_loss": -6.857178211212158, "global_step": 147343, "epoch": 3508} {"train_loss": -6.925958633422852, "global_step": 147344, "epoch": 3508} {"train_loss": -6.882044315338135, "global_step": 147345, "epoch": 3508} {"train_loss": -6.991005897521973, "global_step": 147346, "epoch": 3508} {"train_loss": -6.92988395690918, "global_step": 147347, "epoch": 3508} {"train_loss": -6.88655948638916, "global_step": 147348, "epoch": 3508} {"train_loss": -6.9584503173828125, "global_step": 147349, "epoch": 3508} {"train_loss": -6.942587852478027, "global_step": 147350, "epoch": 3508} {"train_loss": -6.864407539367676, "global_step": 147351, "epoch": 3508} {"train_loss": -6.636641979217529, "global_step": 147352, "epoch": 3508} {"train_loss": -6.81479549407959, "global_step": 147353, "epoch": 3508} {"train_loss": -6.926627159118652, "global_step": 147354, "epoch": 3508} {"train_loss": -6.6707844734191895, "global_step": 147355, "epoch": 3508} {"train_loss": -6.77542781829834, "global_step": 147356, "epoch": 3508} {"train_loss": -6.896177291870117, "global_step": 147357, "epoch": 3508} {"train_loss": -6.600477695465088, "global_step": 147358, "epoch": 3508} {"train_loss": -6.875308036804199, "global_step": 147359, "epoch": 3508} {"train_loss": -6.654000282287598, "global_step": 147360, "epoch": 3508} {"train_loss": -6.800792217254639, "global_step": 147361, "epoch": 3508} {"train_loss": -6.754782676696777, "global_step": 147362, "epoch": 3508} {"train_loss": -6.829317092895508, "global_step": 147363, "epoch": 3508} {"train_loss": -6.809817790985107, "global_step": 147364, "epoch": 3508} {"train_loss": -6.661871910095215, "global_step": 147365, "epoch": 3508} {"train_loss": -6.844820022583008, "global_step": 147366, "epoch": 3508} {"train_loss": -6.663933753967285, "global_step": 147367, "epoch": 3508} {"train_loss": -6.835254669189453, "global_step": 147368, "epoch": 3508} {"train_loss": -6.700484275817871, "global_step": 147369, "epoch": 3508} {"train_loss": -6.838322162628174, "global_step": 147370, "epoch": 3508} {"train_loss": -6.723963737487793, "global_step": 147371, "epoch": 3508} {"train_loss": -6.805492401123047, "global_step": 147372, "epoch": 3508} {"train_loss": -6.675748825073242, "global_step": 147373, "epoch": 3508} {"train_loss": -6.777719974517822, "global_step": 147374, "epoch": 3508} {"train_loss": -6.751270294189453, "global_step": 147375, "epoch": 3508} {"train_loss": -6.79234504699707, "global_step": 147376, "epoch": 3508} {"train_loss": -6.812866755894253, "global_step": 147377, "epoch": 3508, "val_loss": 78756.5390625} {"train_loss": -6.716744422912598, "global_step": 147378, "epoch": 3509} {"train_loss": -6.82491397857666, "global_step": 147379, "epoch": 3509} {"train_loss": -6.734344482421875, "global_step": 147380, "epoch": 3509} {"train_loss": -6.736291885375977, "global_step": 147381, "epoch": 3509} {"train_loss": -6.983434200286865, "global_step": 147382, "epoch": 3509} {"train_loss": -6.876198768615723, "global_step": 147383, "epoch": 3509} {"train_loss": -6.899369716644287, "global_step": 147384, "epoch": 3509} {"train_loss": -6.667311191558838, "global_step": 147385, "epoch": 3509} {"train_loss": -6.899810791015625, "global_step": 147386, "epoch": 3509} {"train_loss": -6.784716606140137, "global_step": 147387, "epoch": 3509} {"train_loss": -6.969329833984375, "global_step": 147388, "epoch": 3509} {"train_loss": -6.860944747924805, "global_step": 147389, "epoch": 3509} {"train_loss": -6.8344621658325195, "global_step": 147390, "epoch": 3509} {"train_loss": -6.804347515106201, "global_step": 147391, "epoch": 3509} {"train_loss": -6.671835899353027, "global_step": 147392, "epoch": 3509} {"train_loss": -6.826581001281738, "global_step": 147393, "epoch": 3509} {"train_loss": -6.76899528503418, "global_step": 147394, "epoch": 3509} {"train_loss": -6.737273693084717, "global_step": 147395, "epoch": 3509} {"train_loss": -6.6689958572387695, "global_step": 147396, "epoch": 3509} {"train_loss": -6.850304126739502, "global_step": 147397, "epoch": 3509} {"train_loss": -6.833309650421143, "global_step": 147398, "epoch": 3509} {"train_loss": -6.656050205230713, "global_step": 147399, "epoch": 3509} {"train_loss": -6.821504592895508, "global_step": 147400, "epoch": 3509} {"train_loss": -6.597029209136963, "global_step": 147401, "epoch": 3509} {"train_loss": -6.796299934387207, "global_step": 147402, "epoch": 3509} {"train_loss": -6.804856300354004, "global_step": 147403, "epoch": 3509} {"train_loss": -6.655012130737305, "global_step": 147404, "epoch": 3509} {"train_loss": -6.809685707092285, "global_step": 147405, "epoch": 3509} {"train_loss": -6.846896171569824, "global_step": 147406, "epoch": 3509} {"train_loss": -6.663287162780762, "global_step": 147407, "epoch": 3509} {"train_loss": -6.773689270019531, "global_step": 147408, "epoch": 3509} {"train_loss": -6.684882640838623, "global_step": 147409, "epoch": 3509} {"train_loss": -6.794247150421143, "global_step": 147410, "epoch": 3509} {"train_loss": -6.710935592651367, "global_step": 147411, "epoch": 3509} {"train_loss": -6.786044120788574, "global_step": 147412, "epoch": 3509} {"train_loss": -6.8903961181640625, "global_step": 147413, "epoch": 3509} {"train_loss": -6.855580806732178, "global_step": 147414, "epoch": 3509} {"train_loss": -6.807323455810547, "global_step": 147415, "epoch": 3509} {"train_loss": -6.920108795166016, "global_step": 147416, "epoch": 3509} {"train_loss": -6.714799880981445, "global_step": 147417, "epoch": 3509} {"train_loss": -6.777500629425049, "global_step": 147418, "epoch": 3509} {"train_loss": -6.790443488529751, "global_step": 147419, "epoch": 3509, "val_loss": 78607.6171875} {"train_loss": -6.9162092208862305, "global_step": 147420, "epoch": 3510} {"train_loss": -6.860008716583252, "global_step": 147421, "epoch": 3510} {"train_loss": -6.8979692459106445, "global_step": 147422, "epoch": 3510} {"train_loss": -6.802209854125977, "global_step": 147423, "epoch": 3510} {"train_loss": -6.847393989562988, "global_step": 147424, "epoch": 3510} {"train_loss": -6.9263434410095215, "global_step": 147425, "epoch": 3510} {"train_loss": -6.815679550170898, "global_step": 147426, "epoch": 3510} {"train_loss": -6.881040573120117, "global_step": 147427, "epoch": 3510} {"train_loss": -6.822998046875, "global_step": 147428, "epoch": 3510} {"train_loss": -6.888547897338867, "global_step": 147429, "epoch": 3510} {"train_loss": -6.786989688873291, "global_step": 147430, "epoch": 3510} {"train_loss": -6.7827911376953125, "global_step": 147431, "epoch": 3510} {"train_loss": -6.965741157531738, "global_step": 147432, "epoch": 3510} {"train_loss": -6.76088809967041, "global_step": 147433, "epoch": 3510} {"train_loss": -6.722325801849365, "global_step": 147434, "epoch": 3510} {"train_loss": -6.7584123611450195, "global_step": 147435, "epoch": 3510} {"train_loss": -6.926772117614746, "global_step": 147436, "epoch": 3510} {"train_loss": -6.873035430908203, "global_step": 147437, "epoch": 3510} {"train_loss": -6.67880916595459, "global_step": 147438, "epoch": 3510} {"train_loss": -6.870115280151367, "global_step": 147439, "epoch": 3510} {"train_loss": -6.863564491271973, "global_step": 147440, "epoch": 3510} {"train_loss": -6.6891069412231445, "global_step": 147441, "epoch": 3510} {"train_loss": -6.869283199310303, "global_step": 147442, "epoch": 3510} {"train_loss": -6.804112434387207, "global_step": 147443, "epoch": 3510} {"train_loss": -6.77773380279541, "global_step": 147444, "epoch": 3510} {"train_loss": -6.870573043823242, "global_step": 147445, "epoch": 3510} {"train_loss": -6.870155334472656, "global_step": 147446, "epoch": 3510} {"train_loss": -6.763523101806641, "global_step": 147447, "epoch": 3510} {"train_loss": -6.808073997497559, "global_step": 147448, "epoch": 3510} {"train_loss": -6.846665382385254, "global_step": 147449, "epoch": 3510} {"train_loss": -6.793970108032227, "global_step": 147450, "epoch": 3510} {"train_loss": -6.797269821166992, "global_step": 147451, "epoch": 3510} {"train_loss": -6.921234607696533, "global_step": 147452, "epoch": 3510} {"train_loss": -6.907153129577637, "global_step": 147453, "epoch": 3510} {"train_loss": -6.865327835083008, "global_step": 147454, "epoch": 3510} {"train_loss": -6.764246940612793, "global_step": 147455, "epoch": 3510} {"train_loss": -6.852147102355957, "global_step": 147456, "epoch": 3510} {"train_loss": -6.808423042297363, "global_step": 147457, "epoch": 3510} {"train_loss": -6.756126403808594, "global_step": 147458, "epoch": 3510} {"train_loss": -6.810220241546631, "global_step": 147459, "epoch": 3510} {"train_loss": -6.655623435974121, "global_step": 147460, "epoch": 3510} {"train_loss": -6.826926049732027, "global_step": 147461, "epoch": 3510, "val_loss": 78605.1484375} {"train_loss": -6.816926956176758, "global_step": 147462, "epoch": 3511} {"train_loss": -6.802288055419922, "global_step": 147463, "epoch": 3511} {"train_loss": -6.745990753173828, "global_step": 147464, "epoch": 3511} {"train_loss": -6.904785633087158, "global_step": 147465, "epoch": 3511} {"train_loss": -6.7122297286987305, "global_step": 147466, "epoch": 3511} {"train_loss": -6.937327861785889, "global_step": 147467, "epoch": 3511} {"train_loss": -6.70742130279541, "global_step": 147468, "epoch": 3511} {"train_loss": -6.898109436035156, "global_step": 147469, "epoch": 3511} {"train_loss": -6.742101669311523, "global_step": 147470, "epoch": 3511} {"train_loss": -6.769412994384766, "global_step": 147471, "epoch": 3511} {"train_loss": -6.899580001831055, "global_step": 147472, "epoch": 3511} {"train_loss": -6.970836639404297, "global_step": 147473, "epoch": 3511} {"train_loss": -6.852158546447754, "global_step": 147474, "epoch": 3511} {"train_loss": -6.953096389770508, "global_step": 147475, "epoch": 3511} {"train_loss": -6.817134380340576, "global_step": 147476, "epoch": 3511} {"train_loss": -6.830283164978027, "global_step": 147477, "epoch": 3511} {"train_loss": -6.932844638824463, "global_step": 147478, "epoch": 3511} {"train_loss": -6.874947547912598, "global_step": 147479, "epoch": 3511} {"train_loss": -6.750985622406006, "global_step": 147480, "epoch": 3511} {"train_loss": -6.794980049133301, "global_step": 147481, "epoch": 3511} {"train_loss": -6.712653160095215, "global_step": 147482, "epoch": 3511} {"train_loss": -6.858735084533691, "global_step": 147483, "epoch": 3511} {"train_loss": -6.878692626953125, "global_step": 147484, "epoch": 3511} {"train_loss": -6.727233409881592, "global_step": 147485, "epoch": 3511} {"train_loss": -6.863469123840332, "global_step": 147486, "epoch": 3511} {"train_loss": -6.831510066986084, "global_step": 147487, "epoch": 3511} {"train_loss": -6.872614860534668, "global_step": 147488, "epoch": 3511} {"train_loss": -6.9396772384643555, "global_step": 147489, "epoch": 3511} {"train_loss": -6.79854679107666, "global_step": 147490, "epoch": 3511} {"train_loss": -6.889352798461914, "global_step": 147491, "epoch": 3511} {"train_loss": -6.868953704833984, "global_step": 147492, "epoch": 3511} {"train_loss": -6.811563491821289, "global_step": 147493, "epoch": 3511} {"train_loss": -6.782720565795898, "global_step": 147494, "epoch": 3511} {"train_loss": -6.756202697753906, "global_step": 147495, "epoch": 3511} {"train_loss": -6.888518333435059, "global_step": 147496, "epoch": 3511} {"train_loss": -6.7960662841796875, "global_step": 147497, "epoch": 3511} {"train_loss": -6.915281295776367, "global_step": 147498, "epoch": 3511} {"train_loss": -6.797122478485107, "global_step": 147499, "epoch": 3511} {"train_loss": -6.905935287475586, "global_step": 147500, "epoch": 3511} {"train_loss": -6.925518035888672, "global_step": 147501, "epoch": 3511} {"train_loss": -6.858498573303223, "global_step": 147502, "epoch": 3511} {"train_loss": -6.839197476704915, "global_step": 147503, "epoch": 3511, "val_loss": 78472.4375} {"train_loss": -6.820485591888428, "global_step": 147504, "epoch": 3512} {"train_loss": -6.996975421905518, "global_step": 147505, "epoch": 3512} {"train_loss": -6.775435447692871, "global_step": 147506, "epoch": 3512} {"train_loss": -6.9953999519348145, "global_step": 147507, "epoch": 3512} {"train_loss": -6.948761940002441, "global_step": 147508, "epoch": 3512} {"train_loss": -6.813241481781006, "global_step": 147509, "epoch": 3512} {"train_loss": -6.88024377822876, "global_step": 147510, "epoch": 3512} {"train_loss": -6.69521427154541, "global_step": 147511, "epoch": 3512} {"train_loss": -6.9134521484375, "global_step": 147512, "epoch": 3512} {"train_loss": -6.903325080871582, "global_step": 147513, "epoch": 3512} {"train_loss": -6.832569122314453, "global_step": 147514, "epoch": 3512} {"train_loss": -6.8638505935668945, "global_step": 147515, "epoch": 3512} {"train_loss": -6.871770858764648, "global_step": 147516, "epoch": 3512} {"train_loss": -6.816324234008789, "global_step": 147517, "epoch": 3512} {"train_loss": -6.891693115234375, "global_step": 147518, "epoch": 3512} {"train_loss": -6.793001651763916, "global_step": 147519, "epoch": 3512} {"train_loss": -6.739068984985352, "global_step": 147520, "epoch": 3512} {"train_loss": -6.977967262268066, "global_step": 147521, "epoch": 3512} {"train_loss": -6.924160480499268, "global_step": 147522, "epoch": 3512} {"train_loss": -6.865551948547363, "global_step": 147523, "epoch": 3512} {"train_loss": -6.961889743804932, "global_step": 147524, "epoch": 3512} {"train_loss": -6.83713436126709, "global_step": 147525, "epoch": 3512} {"train_loss": -6.849822998046875, "global_step": 147526, "epoch": 3512} {"train_loss": -6.809289932250977, "global_step": 147527, "epoch": 3512} {"train_loss": -6.765687465667725, "global_step": 147528, "epoch": 3512} {"train_loss": -6.779897689819336, "global_step": 147529, "epoch": 3512} {"train_loss": -6.781976699829102, "global_step": 147530, "epoch": 3512} {"train_loss": -6.76283073425293, "global_step": 147531, "epoch": 3512} {"train_loss": -6.874823570251465, "global_step": 147532, "epoch": 3512} {"train_loss": -6.897927284240723, "global_step": 147533, "epoch": 3512} {"train_loss": -6.7851948738098145, "global_step": 147534, "epoch": 3512} {"train_loss": -6.872572898864746, "global_step": 147535, "epoch": 3512} {"train_loss": -6.935311317443848, "global_step": 147536, "epoch": 3512} {"train_loss": -6.8256306648254395, "global_step": 147537, "epoch": 3512} {"train_loss": -6.8601837158203125, "global_step": 147538, "epoch": 3512} {"train_loss": -6.918862342834473, "global_step": 147539, "epoch": 3512} {"train_loss": -6.891806125640869, "global_step": 147540, "epoch": 3512} {"train_loss": -6.904400825500488, "global_step": 147541, "epoch": 3512} {"train_loss": -6.728544235229492, "global_step": 147542, "epoch": 3512} {"train_loss": -6.873476028442383, "global_step": 147543, "epoch": 3512} {"train_loss": -6.914641380310059, "global_step": 147544, "epoch": 3512} {"train_loss": -6.855996438435146, "global_step": 147545, "epoch": 3512, "val_loss": 78745.2890625} {"train_loss": -6.821887016296387, "global_step": 147546, "epoch": 3513} {"train_loss": -6.941831111907959, "global_step": 147547, "epoch": 3513} {"train_loss": -6.758559226989746, "global_step": 147548, "epoch": 3513} {"train_loss": -6.758881568908691, "global_step": 147549, "epoch": 3513} {"train_loss": -6.820405960083008, "global_step": 147550, "epoch": 3513} {"train_loss": -6.828066825866699, "global_step": 147551, "epoch": 3513} {"train_loss": -6.831271648406982, "global_step": 147552, "epoch": 3513} {"train_loss": -6.861987113952637, "global_step": 147553, "epoch": 3513} {"train_loss": -6.879446506500244, "global_step": 147554, "epoch": 3513} {"train_loss": -6.832106590270996, "global_step": 147555, "epoch": 3513} {"train_loss": -6.817984104156494, "global_step": 147556, "epoch": 3513} {"train_loss": -6.84467077255249, "global_step": 147557, "epoch": 3513} {"train_loss": -6.746395111083984, "global_step": 147558, "epoch": 3513} {"train_loss": -6.661116600036621, "global_step": 147559, "epoch": 3513} {"train_loss": -6.897455215454102, "global_step": 147560, "epoch": 3513} {"train_loss": -6.719234466552734, "global_step": 147561, "epoch": 3513} {"train_loss": -6.714035987854004, "global_step": 147562, "epoch": 3513} {"train_loss": -6.7441582679748535, "global_step": 147563, "epoch": 3513} {"train_loss": -6.675127029418945, "global_step": 147564, "epoch": 3513} {"train_loss": -6.807283401489258, "global_step": 147565, "epoch": 3513} {"train_loss": -6.728758811950684, "global_step": 147566, "epoch": 3513} {"train_loss": -6.806838512420654, "global_step": 147567, "epoch": 3513} {"train_loss": -6.65768575668335, "global_step": 147568, "epoch": 3513} {"train_loss": -6.864543914794922, "global_step": 147569, "epoch": 3513} {"train_loss": -6.716187953948975, "global_step": 147570, "epoch": 3513} {"train_loss": -6.825806617736816, "global_step": 147571, "epoch": 3513} {"train_loss": -6.8195085525512695, "global_step": 147572, "epoch": 3513} {"train_loss": -6.889372825622559, "global_step": 147573, "epoch": 3513} {"train_loss": -6.835493087768555, "global_step": 147574, "epoch": 3513} {"train_loss": -6.90106201171875, "global_step": 147575, "epoch": 3513} {"train_loss": -6.751023292541504, "global_step": 147576, "epoch": 3513} {"train_loss": -6.906398773193359, "global_step": 147577, "epoch": 3513} {"train_loss": -6.8254475593566895, "global_step": 147578, "epoch": 3513} {"train_loss": -6.693914413452148, "global_step": 147579, "epoch": 3513} {"train_loss": -6.932065010070801, "global_step": 147580, "epoch": 3513} {"train_loss": -6.761211395263672, "global_step": 147581, "epoch": 3513} {"train_loss": -6.806195259094238, "global_step": 147582, "epoch": 3513} {"train_loss": -6.7376532554626465, "global_step": 147583, "epoch": 3513} {"train_loss": -6.860004425048828, "global_step": 147584, "epoch": 3513} {"train_loss": -6.779629707336426, "global_step": 147585, "epoch": 3513} {"train_loss": -6.868524551391602, "global_step": 147586, "epoch": 3513} {"train_loss": -6.804486547197614, "global_step": 147587, "epoch": 3513, "val_loss": 78594.4921875} {"train_loss": -6.801260471343994, "global_step": 147588, "epoch": 3514} {"train_loss": -6.759984970092773, "global_step": 147589, "epoch": 3514} {"train_loss": -6.89735221862793, "global_step": 147590, "epoch": 3514} {"train_loss": -6.860986232757568, "global_step": 147591, "epoch": 3514} {"train_loss": -6.820634841918945, "global_step": 147592, "epoch": 3514} {"train_loss": -6.88895845413208, "global_step": 147593, "epoch": 3514} {"train_loss": -6.7924699783325195, "global_step": 147594, "epoch": 3514} {"train_loss": -6.961212158203125, "global_step": 147595, "epoch": 3514} {"train_loss": -6.857804298400879, "global_step": 147596, "epoch": 3514} {"train_loss": -6.9693403244018555, "global_step": 147597, "epoch": 3514} {"train_loss": -6.975505828857422, "global_step": 147598, "epoch": 3514} {"train_loss": -6.8364410400390625, "global_step": 147599, "epoch": 3514} {"train_loss": -6.772069931030273, "global_step": 147600, "epoch": 3514} {"train_loss": -6.953916549682617, "global_step": 147601, "epoch": 3514} {"train_loss": -6.753046989440918, "global_step": 147602, "epoch": 3514} {"train_loss": -6.7838897705078125, "global_step": 147603, "epoch": 3514} {"train_loss": -6.879025459289551, "global_step": 147604, "epoch": 3514} {"train_loss": -6.737349987030029, "global_step": 147605, "epoch": 3514} {"train_loss": -6.891879558563232, "global_step": 147606, "epoch": 3514} {"train_loss": -6.8381547927856445, "global_step": 147607, "epoch": 3514} {"train_loss": -6.771903038024902, "global_step": 147608, "epoch": 3514} {"train_loss": -6.900843620300293, "global_step": 147609, "epoch": 3514} {"train_loss": -6.905634880065918, "global_step": 147610, "epoch": 3514} {"train_loss": -6.809453964233398, "global_step": 147611, "epoch": 3514} {"train_loss": -6.956244468688965, "global_step": 147612, "epoch": 3514} {"train_loss": -6.73521614074707, "global_step": 147613, "epoch": 3514} {"train_loss": -6.824694633483887, "global_step": 147614, "epoch": 3514} {"train_loss": -6.912456035614014, "global_step": 147615, "epoch": 3514} {"train_loss": -6.822783470153809, "global_step": 147616, "epoch": 3514} {"train_loss": -6.771062850952148, "global_step": 147617, "epoch": 3514} {"train_loss": -6.870165824890137, "global_step": 147618, "epoch": 3514} {"train_loss": -6.845734119415283, "global_step": 147619, "epoch": 3514} {"train_loss": -6.866445541381836, "global_step": 147620, "epoch": 3514} {"train_loss": -6.8474225997924805, "global_step": 147621, "epoch": 3514} {"train_loss": -6.6852617263793945, "global_step": 147622, "epoch": 3514} {"train_loss": -6.78461217880249, "global_step": 147623, "epoch": 3514} {"train_loss": -6.8896870613098145, "global_step": 147624, "epoch": 3514} {"train_loss": -6.746086597442627, "global_step": 147625, "epoch": 3514} {"train_loss": -6.848482131958008, "global_step": 147626, "epoch": 3514} {"train_loss": -6.8421478271484375, "global_step": 147627, "epoch": 3514} {"train_loss": -6.835667610168457, "global_step": 147628, "epoch": 3514} {"train_loss": -6.840934571765718, "global_step": 147629, "epoch": 3514, "val_loss": 78610.0078125} {"train_loss": -6.770277500152588, "global_step": 147630, "epoch": 3515} {"train_loss": -6.726239204406738, "global_step": 147631, "epoch": 3515} {"train_loss": -6.909423828125, "global_step": 147632, "epoch": 3515} {"train_loss": -6.931087493896484, "global_step": 147633, "epoch": 3515} {"train_loss": -6.787450790405273, "global_step": 147634, "epoch": 3515} {"train_loss": -6.705838203430176, "global_step": 147635, "epoch": 3515} {"train_loss": -6.856694221496582, "global_step": 147636, "epoch": 3515} {"train_loss": -6.886968612670898, "global_step": 147637, "epoch": 3515} {"train_loss": -6.783698081970215, "global_step": 147638, "epoch": 3515} {"train_loss": -6.824867248535156, "global_step": 147639, "epoch": 3515} {"train_loss": -6.964175224304199, "global_step": 147640, "epoch": 3515} {"train_loss": -6.767542362213135, "global_step": 147641, "epoch": 3515} {"train_loss": -6.788552284240723, "global_step": 147642, "epoch": 3515} {"train_loss": -6.836612701416016, "global_step": 147643, "epoch": 3515} {"train_loss": -6.784514427185059, "global_step": 147644, "epoch": 3515} {"train_loss": -6.835141181945801, "global_step": 147645, "epoch": 3515} {"train_loss": -6.780344486236572, "global_step": 147646, "epoch": 3515} {"train_loss": -6.852245807647705, "global_step": 147647, "epoch": 3515} {"train_loss": -6.847647666931152, "global_step": 147648, "epoch": 3515} {"train_loss": -6.837474822998047, "global_step": 147649, "epoch": 3515} {"train_loss": -6.889060974121094, "global_step": 147650, "epoch": 3515} {"train_loss": -6.8758745193481445, "global_step": 147651, "epoch": 3515} {"train_loss": -6.632839679718018, "global_step": 147652, "epoch": 3515} {"train_loss": -6.843184471130371, "global_step": 147653, "epoch": 3515} {"train_loss": -6.7796711921691895, "global_step": 147654, "epoch": 3515} {"train_loss": -6.907635688781738, "global_step": 147655, "epoch": 3515} {"train_loss": -6.774306297302246, "global_step": 147656, "epoch": 3515} {"train_loss": -6.828818321228027, "global_step": 147657, "epoch": 3515} {"train_loss": -6.716564178466797, "global_step": 147658, "epoch": 3515} {"train_loss": -6.846700668334961, "global_step": 147659, "epoch": 3515} {"train_loss": -6.887011528015137, "global_step": 147660, "epoch": 3515} {"train_loss": -6.8674468994140625, "global_step": 147661, "epoch": 3515} {"train_loss": -6.87384033203125, "global_step": 147662, "epoch": 3515} {"train_loss": -6.661404609680176, "global_step": 147663, "epoch": 3515} {"train_loss": -6.796144485473633, "global_step": 147664, "epoch": 3515} {"train_loss": -6.941237449645996, "global_step": 147665, "epoch": 3515} {"train_loss": -6.84342622756958, "global_step": 147666, "epoch": 3515} {"train_loss": -6.720158100128174, "global_step": 147667, "epoch": 3515} {"train_loss": -6.836551666259766, "global_step": 147668, "epoch": 3515} {"train_loss": -6.780975341796875, "global_step": 147669, "epoch": 3515} {"train_loss": -6.897275924682617, "global_step": 147670, "epoch": 3515} {"train_loss": -6.8194674877893355, "global_step": 147671, "epoch": 3515, "val_loss": 78441.1796875} {"train_loss": -6.841575622558594, "global_step": 147672, "epoch": 3516} {"train_loss": -6.902799606323242, "global_step": 147673, "epoch": 3516} {"train_loss": -6.830288887023926, "global_step": 147674, "epoch": 3516} {"train_loss": -6.877242088317871, "global_step": 147675, "epoch": 3516} {"train_loss": -6.992127418518066, "global_step": 147676, "epoch": 3516} {"train_loss": -6.911118984222412, "global_step": 147677, "epoch": 3516} {"train_loss": -6.856566905975342, "global_step": 147678, "epoch": 3516} {"train_loss": -6.961665630340576, "global_step": 147679, "epoch": 3516} {"train_loss": -6.951175689697266, "global_step": 147680, "epoch": 3516} {"train_loss": -6.952791690826416, "global_step": 147681, "epoch": 3516} {"train_loss": -6.917362213134766, "global_step": 147682, "epoch": 3516} {"train_loss": -6.752967834472656, "global_step": 147683, "epoch": 3516} {"train_loss": -6.899353981018066, "global_step": 147684, "epoch": 3516} {"train_loss": -6.917931079864502, "global_step": 147685, "epoch": 3516} {"train_loss": -6.744940757751465, "global_step": 147686, "epoch": 3516} {"train_loss": -6.862816333770752, "global_step": 147687, "epoch": 3516} {"train_loss": -6.818452835083008, "global_step": 147688, "epoch": 3516} {"train_loss": -6.715767860412598, "global_step": 147689, "epoch": 3516} {"train_loss": -6.710545539855957, "global_step": 147690, "epoch": 3516} {"train_loss": -6.815485954284668, "global_step": 147691, "epoch": 3516} {"train_loss": -6.812778472900391, "global_step": 147692, "epoch": 3516} {"train_loss": -6.836159706115723, "global_step": 147693, "epoch": 3516} {"train_loss": -6.912533283233643, "global_step": 147694, "epoch": 3516} {"train_loss": -6.929431915283203, "global_step": 147695, "epoch": 3516} {"train_loss": -6.908306121826172, "global_step": 147696, "epoch": 3516} {"train_loss": -6.847519397735596, "global_step": 147697, "epoch": 3516} {"train_loss": -6.835799217224121, "global_step": 147698, "epoch": 3516} {"train_loss": -6.885453701019287, "global_step": 147699, "epoch": 3516} {"train_loss": -6.7628703117370605, "global_step": 147700, "epoch": 3516} {"train_loss": -6.799618721008301, "global_step": 147701, "epoch": 3516} {"train_loss": -6.8725738525390625, "global_step": 147702, "epoch": 3516} {"train_loss": -6.852022171020508, "global_step": 147703, "epoch": 3516} {"train_loss": -6.813128471374512, "global_step": 147704, "epoch": 3516} {"train_loss": -6.8350419998168945, "global_step": 147705, "epoch": 3516} {"train_loss": -6.769655227661133, "global_step": 147706, "epoch": 3516} {"train_loss": -6.693046569824219, "global_step": 147707, "epoch": 3516} {"train_loss": -6.91225528717041, "global_step": 147708, "epoch": 3516} {"train_loss": -6.838606834411621, "global_step": 147709, "epoch": 3516} {"train_loss": -6.846956253051758, "global_step": 147710, "epoch": 3516} {"train_loss": -6.753324508666992, "global_step": 147711, "epoch": 3516} {"train_loss": -6.831738471984863, "global_step": 147712, "epoch": 3516} {"train_loss": -6.8481667041778564, "global_step": 147713, "epoch": 3516, "val_loss": 78826.0703125} {"train_loss": -6.778144836425781, "global_step": 147714, "epoch": 3517} {"train_loss": -6.746982574462891, "global_step": 147715, "epoch": 3517} {"train_loss": -6.777664661407471, "global_step": 147716, "epoch": 3517} {"train_loss": -6.674409866333008, "global_step": 147717, "epoch": 3517} {"train_loss": -6.83444356918335, "global_step": 147718, "epoch": 3517} {"train_loss": -6.74423885345459, "global_step": 147719, "epoch": 3517} {"train_loss": -6.810171127319336, "global_step": 147720, "epoch": 3517} {"train_loss": -6.760678291320801, "global_step": 147721, "epoch": 3517} {"train_loss": -6.784753799438477, "global_step": 147722, "epoch": 3517} {"train_loss": -6.845269203186035, "global_step": 147723, "epoch": 3517} {"train_loss": -6.786190032958984, "global_step": 147724, "epoch": 3517} {"train_loss": -6.724664211273193, "global_step": 147725, "epoch": 3517} {"train_loss": -6.7091474533081055, "global_step": 147726, "epoch": 3517} {"train_loss": -6.713200569152832, "global_step": 147727, "epoch": 3517} {"train_loss": -6.970107078552246, "global_step": 147728, "epoch": 3517} {"train_loss": -6.735844135284424, "global_step": 147729, "epoch": 3517} {"train_loss": -6.803183555603027, "global_step": 147730, "epoch": 3517} {"train_loss": -6.796015739440918, "global_step": 147731, "epoch": 3517} {"train_loss": -6.634424209594727, "global_step": 147732, "epoch": 3517} {"train_loss": -6.805304527282715, "global_step": 147733, "epoch": 3517} {"train_loss": -6.771363735198975, "global_step": 147734, "epoch": 3517} {"train_loss": -6.822267532348633, "global_step": 147735, "epoch": 3517} {"train_loss": -6.856351852416992, "global_step": 147736, "epoch": 3517} {"train_loss": -6.851452350616455, "global_step": 147737, "epoch": 3517} {"train_loss": -6.711575508117676, "global_step": 147738, "epoch": 3517} {"train_loss": -6.894033908843994, "global_step": 147739, "epoch": 3517} {"train_loss": -6.788589000701904, "global_step": 147740, "epoch": 3517} {"train_loss": -6.823475360870361, "global_step": 147741, "epoch": 3517} {"train_loss": -6.865790843963623, "global_step": 147742, "epoch": 3517} {"train_loss": -6.801018714904785, "global_step": 147743, "epoch": 3517} {"train_loss": -6.881152153015137, "global_step": 147744, "epoch": 3517} {"train_loss": -6.77644157409668, "global_step": 147745, "epoch": 3517} {"train_loss": -6.853478908538818, "global_step": 147746, "epoch": 3517} {"train_loss": -6.869408130645752, "global_step": 147747, "epoch": 3517} {"train_loss": -6.891439437866211, "global_step": 147748, "epoch": 3517} {"train_loss": -6.928156852722168, "global_step": 147749, "epoch": 3517} {"train_loss": -6.779451847076416, "global_step": 147750, "epoch": 3517} {"train_loss": -6.7261528968811035, "global_step": 147751, "epoch": 3517} {"train_loss": -6.838650703430176, "global_step": 147752, "epoch": 3517} {"train_loss": -6.863297939300537, "global_step": 147753, "epoch": 3517} {"train_loss": -6.651712417602539, "global_step": 147754, "epoch": 3517} {"train_loss": -6.7997553916204545, "global_step": 147755, "epoch": 3517, "val_loss": 78267.8515625} {"train_loss": -6.771885395050049, "global_step": 147756, "epoch": 3518} {"train_loss": -6.72559118270874, "global_step": 147757, "epoch": 3518} {"train_loss": -6.82794713973999, "global_step": 147758, "epoch": 3518} {"train_loss": -6.691324710845947, "global_step": 147759, "epoch": 3518} {"train_loss": -6.907372951507568, "global_step": 147760, "epoch": 3518} {"train_loss": -6.7611260414123535, "global_step": 147761, "epoch": 3518} {"train_loss": -6.6511688232421875, "global_step": 147762, "epoch": 3518} {"train_loss": -6.645627021789551, "global_step": 147763, "epoch": 3518} {"train_loss": -6.55937385559082, "global_step": 147764, "epoch": 3518} {"train_loss": -6.9088873863220215, "global_step": 147765, "epoch": 3518} {"train_loss": -6.699533939361572, "global_step": 147766, "epoch": 3518} {"train_loss": -6.602560520172119, "global_step": 147767, "epoch": 3518} {"train_loss": -6.628661632537842, "global_step": 147768, "epoch": 3518} {"train_loss": -6.622377395629883, "global_step": 147769, "epoch": 3518} {"train_loss": -6.6564106941223145, "global_step": 147770, "epoch": 3518} {"train_loss": -6.837550163269043, "global_step": 147771, "epoch": 3518} {"train_loss": -6.7204179763793945, "global_step": 147772, "epoch": 3518} {"train_loss": -6.648777961730957, "global_step": 147773, "epoch": 3518} {"train_loss": -6.7509846687316895, "global_step": 147774, "epoch": 3518} {"train_loss": -6.688723564147949, "global_step": 147775, "epoch": 3518} {"train_loss": -6.610980987548828, "global_step": 147776, "epoch": 3518} {"train_loss": -6.661603927612305, "global_step": 147777, "epoch": 3518} {"train_loss": -6.729538917541504, "global_step": 147778, "epoch": 3518} {"train_loss": -6.682798862457275, "global_step": 147779, "epoch": 3518} {"train_loss": -6.73268461227417, "global_step": 147780, "epoch": 3518} {"train_loss": -6.727017402648926, "global_step": 147781, "epoch": 3518} {"train_loss": -6.78565788269043, "global_step": 147782, "epoch": 3518} {"train_loss": -6.7940449714660645, "global_step": 147783, "epoch": 3518} {"train_loss": -6.713550567626953, "global_step": 147784, "epoch": 3518} {"train_loss": -6.807639122009277, "global_step": 147785, "epoch": 3518} {"train_loss": -6.737497329711914, "global_step": 147786, "epoch": 3518} {"train_loss": -6.714509963989258, "global_step": 147787, "epoch": 3518} {"train_loss": -6.812245845794678, "global_step": 147788, "epoch": 3518} {"train_loss": -6.751948356628418, "global_step": 147789, "epoch": 3518} {"train_loss": -6.897485256195068, "global_step": 147790, "epoch": 3518} {"train_loss": -6.813694953918457, "global_step": 147791, "epoch": 3518} {"train_loss": -6.867772102355957, "global_step": 147792, "epoch": 3518} {"train_loss": -6.782486915588379, "global_step": 147793, "epoch": 3518} {"train_loss": -6.772832870483398, "global_step": 147794, "epoch": 3518} {"train_loss": -6.957636833190918, "global_step": 147795, "epoch": 3518} {"train_loss": -6.8201904296875, "global_step": 147796, "epoch": 3518} {"train_loss": -6.747922897338867, "global_step": 147797, "epoch": 3518, "val_loss": 78653.3359375} {"train_loss": -7.047740936279297, "global_step": 147798, "epoch": 3519} {"train_loss": -6.899712562561035, "global_step": 147799, "epoch": 3519} {"train_loss": -6.858121871948242, "global_step": 147800, "epoch": 3519} {"train_loss": -6.8106231689453125, "global_step": 147801, "epoch": 3519} {"train_loss": -6.85006856918335, "global_step": 147802, "epoch": 3519} {"train_loss": -6.927205562591553, "global_step": 147803, "epoch": 3519} {"train_loss": -6.8679399490356445, "global_step": 147804, "epoch": 3519} {"train_loss": -6.911011695861816, "global_step": 147805, "epoch": 3519} {"train_loss": -6.897748947143555, "global_step": 147806, "epoch": 3519} {"train_loss": -6.8367838859558105, "global_step": 147807, "epoch": 3519} {"train_loss": -6.904287338256836, "global_step": 147808, "epoch": 3519} {"train_loss": -6.761392593383789, "global_step": 147809, "epoch": 3519} {"train_loss": -6.884060859680176, "global_step": 147810, "epoch": 3519} {"train_loss": -6.900799751281738, "global_step": 147811, "epoch": 3519} {"train_loss": -6.832592964172363, "global_step": 147812, "epoch": 3519} {"train_loss": -6.840330123901367, "global_step": 147813, "epoch": 3519} {"train_loss": -6.853041648864746, "global_step": 147814, "epoch": 3519} {"train_loss": -6.876516342163086, "global_step": 147815, "epoch": 3519} {"train_loss": -6.794956207275391, "global_step": 147816, "epoch": 3519} {"train_loss": -6.829824447631836, "global_step": 147817, "epoch": 3519} {"train_loss": -6.940638542175293, "global_step": 147818, "epoch": 3519} {"train_loss": -6.930690765380859, "global_step": 147819, "epoch": 3519} {"train_loss": -6.876836776733398, "global_step": 147820, "epoch": 3519} {"train_loss": -6.873281955718994, "global_step": 147821, "epoch": 3519} {"train_loss": -6.904062747955322, "global_step": 147822, "epoch": 3519} {"train_loss": -6.9199323654174805, "global_step": 147823, "epoch": 3519} {"train_loss": -6.92160701751709, "global_step": 147824, "epoch": 3519} {"train_loss": -6.943747520446777, "global_step": 147825, "epoch": 3519} {"train_loss": -6.761496543884277, "global_step": 147826, "epoch": 3519} {"train_loss": -6.9783935546875, "global_step": 147827, "epoch": 3519} {"train_loss": -6.822242259979248, "global_step": 147828, "epoch": 3519} {"train_loss": -6.827698707580566, "global_step": 147829, "epoch": 3519} {"train_loss": -6.781771183013916, "global_step": 147830, "epoch": 3519} {"train_loss": -6.812921047210693, "global_step": 147831, "epoch": 3519} {"train_loss": -6.710187911987305, "global_step": 147832, "epoch": 3519} {"train_loss": -6.8227081298828125, "global_step": 147833, "epoch": 3519} {"train_loss": -6.881130695343018, "global_step": 147834, "epoch": 3519} {"train_loss": -6.867079734802246, "global_step": 147835, "epoch": 3519} {"train_loss": -6.897995948791504, "global_step": 147836, "epoch": 3519} {"train_loss": -6.812440872192383, "global_step": 147837, "epoch": 3519} {"train_loss": -6.832590579986572, "global_step": 147838, "epoch": 3519} {"train_loss": -6.865713357925415, "global_step": 147839, "epoch": 3519, "val_loss": 78947.109375} {"train_loss": -6.646949768066406, "global_step": 147840, "epoch": 3520} {"train_loss": -6.878701686859131, "global_step": 147841, "epoch": 3520} {"train_loss": -6.765153884887695, "global_step": 147842, "epoch": 3520} {"train_loss": -6.780283451080322, "global_step": 147843, "epoch": 3520} {"train_loss": -6.761029243469238, "global_step": 147844, "epoch": 3520} {"train_loss": -6.761175632476807, "global_step": 147845, "epoch": 3520} {"train_loss": -6.833944320678711, "global_step": 147846, "epoch": 3520} {"train_loss": -6.849818229675293, "global_step": 147847, "epoch": 3520} {"train_loss": -6.780073165893555, "global_step": 147848, "epoch": 3520} {"train_loss": -6.775050163269043, "global_step": 147849, "epoch": 3520} {"train_loss": -6.74053955078125, "global_step": 147850, "epoch": 3520} {"train_loss": -6.891881942749023, "global_step": 147851, "epoch": 3520} {"train_loss": -6.883852958679199, "global_step": 147852, "epoch": 3520} {"train_loss": -6.987332344055176, "global_step": 147853, "epoch": 3520} {"train_loss": -6.9448137283325195, "global_step": 147854, "epoch": 3520} {"train_loss": -6.9077372550964355, "global_step": 147855, "epoch": 3520} {"train_loss": -6.869209289550781, "global_step": 147856, "epoch": 3520} {"train_loss": -6.820292949676514, "global_step": 147857, "epoch": 3520} {"train_loss": -6.903134346008301, "global_step": 147858, "epoch": 3520} {"train_loss": -6.897912979125977, "global_step": 147859, "epoch": 3520} {"train_loss": -6.862528324127197, "global_step": 147860, "epoch": 3520} {"train_loss": -6.818866729736328, "global_step": 147861, "epoch": 3520} {"train_loss": -6.871634483337402, "global_step": 147862, "epoch": 3520} {"train_loss": -6.840429306030273, "global_step": 147863, "epoch": 3520} {"train_loss": -6.892197132110596, "global_step": 147864, "epoch": 3520} {"train_loss": -6.889804363250732, "global_step": 147865, "epoch": 3520} {"train_loss": -6.758195400238037, "global_step": 147866, "epoch": 3520} {"train_loss": -6.878701210021973, "global_step": 147867, "epoch": 3520} {"train_loss": -6.86381721496582, "global_step": 147868, "epoch": 3520} {"train_loss": -7.0031867027282715, "global_step": 147869, "epoch": 3520} {"train_loss": -6.968547344207764, "global_step": 147870, "epoch": 3520} {"train_loss": -6.987897872924805, "global_step": 147871, "epoch": 3520} {"train_loss": -6.809499740600586, "global_step": 147872, "epoch": 3520} {"train_loss": -6.878354072570801, "global_step": 147873, "epoch": 3520} {"train_loss": -6.852234363555908, "global_step": 147874, "epoch": 3520} {"train_loss": -6.815058708190918, "global_step": 147875, "epoch": 3520} {"train_loss": -6.836056232452393, "global_step": 147876, "epoch": 3520} {"train_loss": -6.921184539794922, "global_step": 147877, "epoch": 3520} {"train_loss": -6.900521278381348, "global_step": 147878, "epoch": 3520} {"train_loss": -6.910016059875488, "global_step": 147879, "epoch": 3520} {"train_loss": -6.853853702545166, "global_step": 147880, "epoch": 3520} {"train_loss": -6.854875189917428, "global_step": 147881, "epoch": 3520, "val_loss": 78386.875} {"train_loss": -6.848233699798584, "global_step": 147882, "epoch": 3521} {"train_loss": -6.972199440002441, "global_step": 147883, "epoch": 3521} {"train_loss": -6.824640274047852, "global_step": 147884, "epoch": 3521} {"train_loss": -6.936493873596191, "global_step": 147885, "epoch": 3521} {"train_loss": -6.8126397132873535, "global_step": 147886, "epoch": 3521} {"train_loss": -6.9332733154296875, "global_step": 147887, "epoch": 3521} {"train_loss": -6.831475734710693, "global_step": 147888, "epoch": 3521} {"train_loss": -6.9370880126953125, "global_step": 147889, "epoch": 3521} {"train_loss": -6.779729843139648, "global_step": 147890, "epoch": 3521} {"train_loss": -6.775980472564697, "global_step": 147891, "epoch": 3521} {"train_loss": -6.873722076416016, "global_step": 147892, "epoch": 3521} {"train_loss": -6.89211368560791, "global_step": 147893, "epoch": 3521} {"train_loss": -6.691241264343262, "global_step": 147894, "epoch": 3521} {"train_loss": -6.8447065353393555, "global_step": 147895, "epoch": 3521} {"train_loss": -6.869324684143066, "global_step": 147896, "epoch": 3521} {"train_loss": -6.766435623168945, "global_step": 147897, "epoch": 3521} {"train_loss": -6.875297546386719, "global_step": 147898, "epoch": 3521} {"train_loss": -6.862056732177734, "global_step": 147899, "epoch": 3521} {"train_loss": -6.870570659637451, "global_step": 147900, "epoch": 3521} {"train_loss": -6.706438064575195, "global_step": 147901, "epoch": 3521} {"train_loss": -6.773037433624268, "global_step": 147902, "epoch": 3521} {"train_loss": -6.9043474197387695, "global_step": 147903, "epoch": 3521} {"train_loss": -6.774015426635742, "global_step": 147904, "epoch": 3521} {"train_loss": -6.886941909790039, "global_step": 147905, "epoch": 3521} {"train_loss": -6.8275041580200195, "global_step": 147906, "epoch": 3521} {"train_loss": -6.843967437744141, "global_step": 147907, "epoch": 3521} {"train_loss": -6.726659774780273, "global_step": 147908, "epoch": 3521} {"train_loss": -6.890582084655762, "global_step": 147909, "epoch": 3521} {"train_loss": -6.77079439163208, "global_step": 147910, "epoch": 3521} {"train_loss": -6.815278053283691, "global_step": 147911, "epoch": 3521} {"train_loss": -6.807153224945068, "global_step": 147912, "epoch": 3521} {"train_loss": -6.765417098999023, "global_step": 147913, "epoch": 3521} {"train_loss": -6.824892997741699, "global_step": 147914, "epoch": 3521} {"train_loss": -6.79703426361084, "global_step": 147915, "epoch": 3521} {"train_loss": -6.7484588623046875, "global_step": 147916, "epoch": 3521} {"train_loss": -6.818641662597656, "global_step": 147917, "epoch": 3521} {"train_loss": -6.965227127075195, "global_step": 147918, "epoch": 3521} {"train_loss": -6.7115325927734375, "global_step": 147919, "epoch": 3521} {"train_loss": -6.788647174835205, "global_step": 147920, "epoch": 3521} {"train_loss": -6.8772501945495605, "global_step": 147921, "epoch": 3521} {"train_loss": -6.779048442840576, "global_step": 147922, "epoch": 3521} {"train_loss": -6.8306448346092585, "global_step": 147923, "epoch": 3521, "val_loss": 78648.640625} {"train_loss": -6.827348232269287, "global_step": 147924, "epoch": 3522} {"train_loss": -6.79249382019043, "global_step": 147925, "epoch": 3522} {"train_loss": -6.72454833984375, "global_step": 147926, "epoch": 3522} {"train_loss": -6.8434247970581055, "global_step": 147927, "epoch": 3522} {"train_loss": -6.905318260192871, "global_step": 147928, "epoch": 3522} {"train_loss": -6.774596691131592, "global_step": 147929, "epoch": 3522} {"train_loss": -6.721435546875, "global_step": 147930, "epoch": 3522} {"train_loss": -6.8066205978393555, "global_step": 147931, "epoch": 3522} {"train_loss": -6.6919660568237305, "global_step": 147932, "epoch": 3522} {"train_loss": -6.8000335693359375, "global_step": 147933, "epoch": 3522} {"train_loss": -6.844019889831543, "global_step": 147934, "epoch": 3522} {"train_loss": -6.871455192565918, "global_step": 147935, "epoch": 3522} {"train_loss": -6.787114143371582, "global_step": 147936, "epoch": 3522} {"train_loss": -6.7452216148376465, "global_step": 147937, "epoch": 3522} {"train_loss": -6.7773308753967285, "global_step": 147938, "epoch": 3522} {"train_loss": -6.890448093414307, "global_step": 147939, "epoch": 3522} {"train_loss": -6.864020347595215, "global_step": 147940, "epoch": 3522} {"train_loss": -6.842601776123047, "global_step": 147941, "epoch": 3522} {"train_loss": -6.880962371826172, "global_step": 147942, "epoch": 3522} {"train_loss": -6.857904434204102, "global_step": 147943, "epoch": 3522} {"train_loss": -6.856310844421387, "global_step": 147944, "epoch": 3522} {"train_loss": -6.78771448135376, "global_step": 147945, "epoch": 3522} {"train_loss": -6.77768087387085, "global_step": 147946, "epoch": 3522} {"train_loss": -6.878832817077637, "global_step": 147947, "epoch": 3522} {"train_loss": -6.942330360412598, "global_step": 147948, "epoch": 3522} {"train_loss": -6.76149845123291, "global_step": 147949, "epoch": 3522} {"train_loss": -6.758941650390625, "global_step": 147950, "epoch": 3522} {"train_loss": -6.74191951751709, "global_step": 147951, "epoch": 3522} {"train_loss": -6.826343536376953, "global_step": 147952, "epoch": 3522} {"train_loss": -6.852853775024414, "global_step": 147953, "epoch": 3522} {"train_loss": -6.785292148590088, "global_step": 147954, "epoch": 3522} {"train_loss": -6.894659519195557, "global_step": 147955, "epoch": 3522} {"train_loss": -6.754779815673828, "global_step": 147956, "epoch": 3522} {"train_loss": -6.840439796447754, "global_step": 147957, "epoch": 3522} {"train_loss": -6.986110210418701, "global_step": 147958, "epoch": 3522} {"train_loss": -6.799853801727295, "global_step": 147959, "epoch": 3522} {"train_loss": -6.891279220581055, "global_step": 147960, "epoch": 3522} {"train_loss": -6.764321804046631, "global_step": 147961, "epoch": 3522} {"train_loss": -6.71572208404541, "global_step": 147962, "epoch": 3522} {"train_loss": -6.892732620239258, "global_step": 147963, "epoch": 3522} {"train_loss": -6.756621837615967, "global_step": 147964, "epoch": 3522} {"train_loss": -6.8198314394269675, "global_step": 147965, "epoch": 3522, "val_loss": 78739.625} {"train_loss": -6.865257263183594, "global_step": 147966, "epoch": 3523} {"train_loss": -6.591765880584717, "global_step": 147967, "epoch": 3523} {"train_loss": -6.787834167480469, "global_step": 147968, "epoch": 3523} {"train_loss": -6.758031368255615, "global_step": 147969, "epoch": 3523} {"train_loss": -6.888469696044922, "global_step": 147970, "epoch": 3523} {"train_loss": -6.773555278778076, "global_step": 147971, "epoch": 3523} {"train_loss": -6.8552751541137695, "global_step": 147972, "epoch": 3523} {"train_loss": -6.788454055786133, "global_step": 147973, "epoch": 3523} {"train_loss": -6.694181442260742, "global_step": 147974, "epoch": 3523} {"train_loss": -6.855218410491943, "global_step": 147975, "epoch": 3523} {"train_loss": -6.953683376312256, "global_step": 147976, "epoch": 3523} {"train_loss": -6.8560285568237305, "global_step": 147977, "epoch": 3523} {"train_loss": -6.946012496948242, "global_step": 147978, "epoch": 3523} {"train_loss": -6.871360778808594, "global_step": 147979, "epoch": 3523} {"train_loss": -6.980483531951904, "global_step": 147980, "epoch": 3523} {"train_loss": -6.851452827453613, "global_step": 147981, "epoch": 3523} {"train_loss": -7.013557434082031, "global_step": 147982, "epoch": 3523} {"train_loss": -6.95591926574707, "global_step": 147983, "epoch": 3523} {"train_loss": -6.8934006690979, "global_step": 147984, "epoch": 3523} {"train_loss": -6.894081115722656, "global_step": 147985, "epoch": 3523} {"train_loss": -6.841955184936523, "global_step": 147986, "epoch": 3523} {"train_loss": -6.902732849121094, "global_step": 147987, "epoch": 3523} {"train_loss": -6.939750671386719, "global_step": 147988, "epoch": 3523} {"train_loss": -6.849775314331055, "global_step": 147989, "epoch": 3523} {"train_loss": -6.810589790344238, "global_step": 147990, "epoch": 3523} {"train_loss": -6.909066200256348, "global_step": 147991, "epoch": 3523} {"train_loss": -6.675746440887451, "global_step": 147992, "epoch": 3523} {"train_loss": -6.814348220825195, "global_step": 147993, "epoch": 3523} {"train_loss": -6.891317844390869, "global_step": 147994, "epoch": 3523} {"train_loss": -6.891232490539551, "global_step": 147995, "epoch": 3523} {"train_loss": -6.88946533203125, "global_step": 147996, "epoch": 3523} {"train_loss": -6.767640113830566, "global_step": 147997, "epoch": 3523} {"train_loss": -6.854349136352539, "global_step": 147998, "epoch": 3523} {"train_loss": -6.859379768371582, "global_step": 147999, "epoch": 3523} {"train_loss": -6.801574230194092, "global_step": 148000, "epoch": 3523} {"train_loss": -6.8308234214782715, "global_step": 148001, "epoch": 3523} {"train_loss": -6.856075763702393, "global_step": 148002, "epoch": 3523} {"train_loss": -6.924394607543945, "global_step": 148003, "epoch": 3523} {"train_loss": -6.7549052238464355, "global_step": 148004, "epoch": 3523} {"train_loss": -6.941647529602051, "global_step": 148005, "epoch": 3523} {"train_loss": -6.804949760437012, "global_step": 148006, "epoch": 3523} {"train_loss": -6.849612849099295, "global_step": 148007, "epoch": 3523, "val_loss": 78538.5859375} {"train_loss": -6.859724044799805, "global_step": 148008, "epoch": 3524} {"train_loss": -6.867547988891602, "global_step": 148009, "epoch": 3524} {"train_loss": -6.90379524230957, "global_step": 148010, "epoch": 3524} {"train_loss": -6.81620454788208, "global_step": 148011, "epoch": 3524} {"train_loss": -6.722025394439697, "global_step": 148012, "epoch": 3524} {"train_loss": -6.88215446472168, "global_step": 148013, "epoch": 3524} {"train_loss": -6.798643112182617, "global_step": 148014, "epoch": 3524} {"train_loss": -6.95935583114624, "global_step": 148015, "epoch": 3524} {"train_loss": -6.811676025390625, "global_step": 148016, "epoch": 3524} {"train_loss": -6.824934959411621, "global_step": 148017, "epoch": 3524} {"train_loss": -6.864953994750977, "global_step": 148018, "epoch": 3524} {"train_loss": -6.6823930740356445, "global_step": 148019, "epoch": 3524} {"train_loss": -7.009478569030762, "global_step": 148020, "epoch": 3524} {"train_loss": -6.7716569900512695, "global_step": 148021, "epoch": 3524} {"train_loss": -6.723868370056152, "global_step": 148022, "epoch": 3524} {"train_loss": -6.901843070983887, "global_step": 148023, "epoch": 3524} {"train_loss": -6.752414703369141, "global_step": 148024, "epoch": 3524} {"train_loss": -6.9505462646484375, "global_step": 148025, "epoch": 3524} {"train_loss": -6.831756591796875, "global_step": 148026, "epoch": 3524} {"train_loss": -6.773739814758301, "global_step": 148027, "epoch": 3524} {"train_loss": -6.833104133605957, "global_step": 148028, "epoch": 3524} {"train_loss": -6.669247627258301, "global_step": 148029, "epoch": 3524} {"train_loss": -6.919746398925781, "global_step": 148030, "epoch": 3524} {"train_loss": -6.682500839233398, "global_step": 148031, "epoch": 3524} {"train_loss": -6.682377815246582, "global_step": 148032, "epoch": 3524} {"train_loss": -6.773873329162598, "global_step": 148033, "epoch": 3524} {"train_loss": -6.82650899887085, "global_step": 148034, "epoch": 3524} {"train_loss": -6.872631549835205, "global_step": 148035, "epoch": 3524} {"train_loss": -6.8827290534973145, "global_step": 148036, "epoch": 3524} {"train_loss": -6.731708526611328, "global_step": 148037, "epoch": 3524} {"train_loss": -6.893181800842285, "global_step": 148038, "epoch": 3524} {"train_loss": -6.765039443969727, "global_step": 148039, "epoch": 3524} {"train_loss": -6.779749870300293, "global_step": 148040, "epoch": 3524} {"train_loss": -6.853404521942139, "global_step": 148041, "epoch": 3524} {"train_loss": -6.797456741333008, "global_step": 148042, "epoch": 3524} {"train_loss": -6.81374454498291, "global_step": 148043, "epoch": 3524} {"train_loss": -6.811982154846191, "global_step": 148044, "epoch": 3524} {"train_loss": -6.7394938468933105, "global_step": 148045, "epoch": 3524} {"train_loss": -6.856642723083496, "global_step": 148046, "epoch": 3524} {"train_loss": -6.754944324493408, "global_step": 148047, "epoch": 3524} {"train_loss": -6.722723484039307, "global_step": 148048, "epoch": 3524} {"train_loss": -6.810056277683803, "global_step": 148049, "epoch": 3524, "val_loss": 78651.9765625} {"train_loss": -6.773937225341797, "global_step": 148050, "epoch": 3525} {"train_loss": -6.8258466720581055, "global_step": 148051, "epoch": 3525} {"train_loss": -6.735198020935059, "global_step": 148052, "epoch": 3525} {"train_loss": -6.7296142578125, "global_step": 148053, "epoch": 3525} {"train_loss": -6.841634750366211, "global_step": 148054, "epoch": 3525} {"train_loss": -6.795572280883789, "global_step": 148055, "epoch": 3525} {"train_loss": -6.5447587966918945, "global_step": 148056, "epoch": 3525} {"train_loss": -6.691916465759277, "global_step": 148057, "epoch": 3525} {"train_loss": -6.830234527587891, "global_step": 148058, "epoch": 3525} {"train_loss": -6.860230445861816, "global_step": 148059, "epoch": 3525} {"train_loss": -6.769915580749512, "global_step": 148060, "epoch": 3525} {"train_loss": -6.87762451171875, "global_step": 148061, "epoch": 3525} {"train_loss": -6.805955410003662, "global_step": 148062, "epoch": 3525} {"train_loss": -6.76131534576416, "global_step": 148063, "epoch": 3525} {"train_loss": -6.770194053649902, "global_step": 148064, "epoch": 3525} {"train_loss": -6.644829750061035, "global_step": 148065, "epoch": 3525} {"train_loss": -6.838350296020508, "global_step": 148066, "epoch": 3525} {"train_loss": -6.807177543640137, "global_step": 148067, "epoch": 3525} {"train_loss": -6.855059623718262, "global_step": 148068, "epoch": 3525} {"train_loss": -6.785804748535156, "global_step": 148069, "epoch": 3525} {"train_loss": -6.801894187927246, "global_step": 148070, "epoch": 3525} {"train_loss": -6.78076171875, "global_step": 148071, "epoch": 3525} {"train_loss": -6.730287551879883, "global_step": 148072, "epoch": 3525} {"train_loss": -6.812242031097412, "global_step": 148073, "epoch": 3525} {"train_loss": -6.695690631866455, "global_step": 148074, "epoch": 3525} {"train_loss": -6.844280242919922, "global_step": 148075, "epoch": 3525} {"train_loss": -6.783553123474121, "global_step": 148076, "epoch": 3525} {"train_loss": -6.747645378112793, "global_step": 148077, "epoch": 3525} {"train_loss": -6.788304805755615, "global_step": 148078, "epoch": 3525} {"train_loss": -6.735400199890137, "global_step": 148079, "epoch": 3525} {"train_loss": -6.8811798095703125, "global_step": 148080, "epoch": 3525} {"train_loss": -6.886105060577393, "global_step": 148081, "epoch": 3525} {"train_loss": -6.884323596954346, "global_step": 148082, "epoch": 3525} {"train_loss": -6.813096523284912, "global_step": 148083, "epoch": 3525} {"train_loss": -6.9005208015441895, "global_step": 148084, "epoch": 3525} {"train_loss": -6.764055252075195, "global_step": 148085, "epoch": 3525} {"train_loss": -6.925895690917969, "global_step": 148086, "epoch": 3525} {"train_loss": -6.787363052368164, "global_step": 148087, "epoch": 3525} {"train_loss": -6.8267822265625, "global_step": 148088, "epoch": 3525} {"train_loss": -6.835269927978516, "global_step": 148089, "epoch": 3525} {"train_loss": -6.946149826049805, "global_step": 148090, "epoch": 3525} {"train_loss": -6.798039561226254, "global_step": 148091, "epoch": 3525, "val_loss": 78438.4140625} {"train_loss": -6.897985935211182, "global_step": 148092, "epoch": 3526} {"train_loss": -6.926839351654053, "global_step": 148093, "epoch": 3526} {"train_loss": -6.759015083312988, "global_step": 148094, "epoch": 3526} {"train_loss": -6.92664909362793, "global_step": 148095, "epoch": 3526} {"train_loss": -6.855955123901367, "global_step": 148096, "epoch": 3526} {"train_loss": -6.8987579345703125, "global_step": 148097, "epoch": 3526} {"train_loss": -6.8550519943237305, "global_step": 148098, "epoch": 3526} {"train_loss": -6.908587455749512, "global_step": 148099, "epoch": 3526} {"train_loss": -6.874614715576172, "global_step": 148100, "epoch": 3526} {"train_loss": -6.930739402770996, "global_step": 148101, "epoch": 3526} {"train_loss": -6.887624740600586, "global_step": 148102, "epoch": 3526} {"train_loss": -6.771007537841797, "global_step": 148103, "epoch": 3526} {"train_loss": -6.9202985763549805, "global_step": 148104, "epoch": 3526} {"train_loss": -6.97985315322876, "global_step": 148105, "epoch": 3526} {"train_loss": -6.769622325897217, "global_step": 148106, "epoch": 3526} {"train_loss": -6.763433456420898, "global_step": 148107, "epoch": 3526} {"train_loss": -6.775446891784668, "global_step": 148108, "epoch": 3526} {"train_loss": -6.820130348205566, "global_step": 148109, "epoch": 3526} {"train_loss": -6.9186692237854, "global_step": 148110, "epoch": 3526} {"train_loss": -6.665026664733887, "global_step": 148111, "epoch": 3526} {"train_loss": -6.67609977722168, "global_step": 148112, "epoch": 3526} {"train_loss": -6.679640769958496, "global_step": 148113, "epoch": 3526} {"train_loss": -6.739621162414551, "global_step": 148114, "epoch": 3526} {"train_loss": -6.862454891204834, "global_step": 148115, "epoch": 3526} {"train_loss": -6.832788467407227, "global_step": 148116, "epoch": 3526} {"train_loss": -6.901322364807129, "global_step": 148117, "epoch": 3526} {"train_loss": -6.804836273193359, "global_step": 148118, "epoch": 3526} {"train_loss": -6.762378692626953, "global_step": 148119, "epoch": 3526} {"train_loss": -6.8125386238098145, "global_step": 148120, "epoch": 3526} {"train_loss": -6.780999660491943, "global_step": 148121, "epoch": 3526} {"train_loss": -6.884327411651611, "global_step": 148122, "epoch": 3526} {"train_loss": -6.815921783447266, "global_step": 148123, "epoch": 3526} {"train_loss": -6.726918697357178, "global_step": 148124, "epoch": 3526} {"train_loss": -6.751611232757568, "global_step": 148125, "epoch": 3526} {"train_loss": -6.958720684051514, "global_step": 148126, "epoch": 3526} {"train_loss": -6.946201801300049, "global_step": 148127, "epoch": 3526} {"train_loss": -6.9134063720703125, "global_step": 148128, "epoch": 3526} {"train_loss": -6.977009296417236, "global_step": 148129, "epoch": 3526} {"train_loss": -6.9237775802612305, "global_step": 148130, "epoch": 3526} {"train_loss": -6.8931803703308105, "global_step": 148131, "epoch": 3526} {"train_loss": -6.878443241119385, "global_step": 148132, "epoch": 3526} {"train_loss": -6.843885750997634, "global_step": 148133, "epoch": 3526, "val_loss": 78689.1953125} {"train_loss": -6.881568908691406, "global_step": 148134, "epoch": 3527} {"train_loss": -6.942145824432373, "global_step": 148135, "epoch": 3527} {"train_loss": -6.929049968719482, "global_step": 148136, "epoch": 3527} {"train_loss": -6.8804168701171875, "global_step": 148137, "epoch": 3527} {"train_loss": -6.988044261932373, "global_step": 148138, "epoch": 3527} {"train_loss": -6.932504177093506, "global_step": 148139, "epoch": 3527} {"train_loss": -6.914319038391113, "global_step": 148140, "epoch": 3527} {"train_loss": -6.925423622131348, "global_step": 148141, "epoch": 3527} {"train_loss": -6.827733039855957, "global_step": 148142, "epoch": 3527} {"train_loss": -6.756309509277344, "global_step": 148143, "epoch": 3527} {"train_loss": -6.839271545410156, "global_step": 148144, "epoch": 3527} {"train_loss": -6.831554412841797, "global_step": 148145, "epoch": 3527} {"train_loss": -6.682199478149414, "global_step": 148146, "epoch": 3527} {"train_loss": -6.600314617156982, "global_step": 148147, "epoch": 3527} {"train_loss": -6.874622344970703, "global_step": 148148, "epoch": 3527} {"train_loss": -6.856025695800781, "global_step": 148149, "epoch": 3527} {"train_loss": -6.811192512512207, "global_step": 148150, "epoch": 3527} {"train_loss": -6.6813859939575195, "global_step": 148151, "epoch": 3527} {"train_loss": -6.87708854675293, "global_step": 148152, "epoch": 3527} {"train_loss": -6.775712966918945, "global_step": 148153, "epoch": 3527} {"train_loss": -6.791853427886963, "global_step": 148154, "epoch": 3527} {"train_loss": -6.788510799407959, "global_step": 148155, "epoch": 3527} {"train_loss": -6.811064720153809, "global_step": 148156, "epoch": 3527} {"train_loss": -6.794942378997803, "global_step": 148157, "epoch": 3527} {"train_loss": -6.893868446350098, "global_step": 148158, "epoch": 3527} {"train_loss": -6.826831817626953, "global_step": 148159, "epoch": 3527} {"train_loss": -6.760645389556885, "global_step": 148160, "epoch": 3527} {"train_loss": -6.829000473022461, "global_step": 148161, "epoch": 3527} {"train_loss": -6.751945495605469, "global_step": 148162, "epoch": 3527} {"train_loss": -6.848354339599609, "global_step": 148163, "epoch": 3527} {"train_loss": -6.787094593048096, "global_step": 148164, "epoch": 3527} {"train_loss": -6.7401041984558105, "global_step": 148165, "epoch": 3527} {"train_loss": -6.855185508728027, "global_step": 148166, "epoch": 3527} {"train_loss": -6.736755847930908, "global_step": 148167, "epoch": 3527} {"train_loss": -6.888670921325684, "global_step": 148168, "epoch": 3527} {"train_loss": -6.7134294509887695, "global_step": 148169, "epoch": 3527} {"train_loss": -6.833114147186279, "global_step": 148170, "epoch": 3527} {"train_loss": -6.762355327606201, "global_step": 148171, "epoch": 3527} {"train_loss": -6.80611515045166, "global_step": 148172, "epoch": 3527} {"train_loss": -6.846620559692383, "global_step": 148173, "epoch": 3527} {"train_loss": -6.944159507751465, "global_step": 148174, "epoch": 3527} {"train_loss": -6.823078893479847, "global_step": 148175, "epoch": 3527, "val_loss": 78614.890625} {"train_loss": -6.928832054138184, "global_step": 148176, "epoch": 3528} {"train_loss": -6.900798797607422, "global_step": 148177, "epoch": 3528} {"train_loss": -6.823410987854004, "global_step": 148178, "epoch": 3528} {"train_loss": -6.93275260925293, "global_step": 148179, "epoch": 3528} {"train_loss": -6.785443305969238, "global_step": 148180, "epoch": 3528} {"train_loss": -6.823516368865967, "global_step": 148181, "epoch": 3528} {"train_loss": -6.856408596038818, "global_step": 148182, "epoch": 3528} {"train_loss": -6.904505729675293, "global_step": 148183, "epoch": 3528} {"train_loss": -6.807547092437744, "global_step": 148184, "epoch": 3528} {"train_loss": -6.804997444152832, "global_step": 148185, "epoch": 3528} {"train_loss": -6.83586311340332, "global_step": 148186, "epoch": 3528} {"train_loss": -6.907899379730225, "global_step": 148187, "epoch": 3528} {"train_loss": -6.727595329284668, "global_step": 148188, "epoch": 3528} {"train_loss": -6.9455156326293945, "global_step": 148189, "epoch": 3528} {"train_loss": -6.753896713256836, "global_step": 148190, "epoch": 3528} {"train_loss": -6.853668689727783, "global_step": 148191, "epoch": 3528} {"train_loss": -6.807428359985352, "global_step": 148192, "epoch": 3528} {"train_loss": -6.884997844696045, "global_step": 148193, "epoch": 3528} {"train_loss": -6.872508525848389, "global_step": 148194, "epoch": 3528} {"train_loss": -6.980069160461426, "global_step": 148195, "epoch": 3528} {"train_loss": -6.895804405212402, "global_step": 148196, "epoch": 3528} {"train_loss": -6.845307350158691, "global_step": 148197, "epoch": 3528} {"train_loss": -6.983943939208984, "global_step": 148198, "epoch": 3528} {"train_loss": -6.912362575531006, "global_step": 148199, "epoch": 3528} {"train_loss": -6.795499324798584, "global_step": 148200, "epoch": 3528} {"train_loss": -6.889610290527344, "global_step": 148201, "epoch": 3528} {"train_loss": -6.8563232421875, "global_step": 148202, "epoch": 3528} {"train_loss": -6.831859588623047, "global_step": 148203, "epoch": 3528} {"train_loss": -6.77207612991333, "global_step": 148204, "epoch": 3528} {"train_loss": -6.750353813171387, "global_step": 148205, "epoch": 3528} {"train_loss": -6.814302444458008, "global_step": 148206, "epoch": 3528} {"train_loss": -6.815059661865234, "global_step": 148207, "epoch": 3528} {"train_loss": -6.660564422607422, "global_step": 148208, "epoch": 3528} {"train_loss": -6.737429618835449, "global_step": 148209, "epoch": 3528} {"train_loss": -6.644829750061035, "global_step": 148210, "epoch": 3528} {"train_loss": -6.840213775634766, "global_step": 148211, "epoch": 3528} {"train_loss": -6.7138824462890625, "global_step": 148212, "epoch": 3528} {"train_loss": -6.689131736755371, "global_step": 148213, "epoch": 3528} {"train_loss": -6.850903034210205, "global_step": 148214, "epoch": 3528} {"train_loss": -6.67949104309082, "global_step": 148215, "epoch": 3528} {"train_loss": -6.749044895172119, "global_step": 148216, "epoch": 3528} {"train_loss": -6.824233407065982, "global_step": 148217, "epoch": 3528, "val_loss": 78499.46875} {"train_loss": -6.8178582191467285, "global_step": 148218, "epoch": 3529} {"train_loss": -6.737885475158691, "global_step": 148219, "epoch": 3529} {"train_loss": -6.767657279968262, "global_step": 148220, "epoch": 3529} {"train_loss": -6.760659217834473, "global_step": 148221, "epoch": 3529} {"train_loss": -6.7579755783081055, "global_step": 148222, "epoch": 3529} {"train_loss": -6.875597953796387, "global_step": 148223, "epoch": 3529} {"train_loss": -6.843632698059082, "global_step": 148224, "epoch": 3529} {"train_loss": -6.772760391235352, "global_step": 148225, "epoch": 3529} {"train_loss": -6.76791524887085, "global_step": 148226, "epoch": 3529} {"train_loss": -6.897942066192627, "global_step": 148227, "epoch": 3529} {"train_loss": -6.85865592956543, "global_step": 148228, "epoch": 3529} {"train_loss": -6.828514099121094, "global_step": 148229, "epoch": 3529} {"train_loss": -6.826861381530762, "global_step": 148230, "epoch": 3529} {"train_loss": -6.734167098999023, "global_step": 148231, "epoch": 3529} {"train_loss": -6.864188194274902, "global_step": 148232, "epoch": 3529} {"train_loss": -6.808429718017578, "global_step": 148233, "epoch": 3529} {"train_loss": -6.856210231781006, "global_step": 148234, "epoch": 3529} {"train_loss": -6.861685276031494, "global_step": 148235, "epoch": 3529} {"train_loss": -6.726737022399902, "global_step": 148236, "epoch": 3529} {"train_loss": -6.865212917327881, "global_step": 148237, "epoch": 3529} {"train_loss": -6.746837615966797, "global_step": 148238, "epoch": 3529} {"train_loss": -6.873157978057861, "global_step": 148239, "epoch": 3529} {"train_loss": -6.7837419509887695, "global_step": 148240, "epoch": 3529} {"train_loss": -6.83226203918457, "global_step": 148241, "epoch": 3529} {"train_loss": -6.815657615661621, "global_step": 148242, "epoch": 3529} {"train_loss": -6.9034223556518555, "global_step": 148243, "epoch": 3529} {"train_loss": -6.872596740722656, "global_step": 148244, "epoch": 3529} {"train_loss": -6.771053791046143, "global_step": 148245, "epoch": 3529} {"train_loss": -6.9621782302856445, "global_step": 148246, "epoch": 3529} {"train_loss": -6.81920051574707, "global_step": 148247, "epoch": 3529} {"train_loss": -6.809796333312988, "global_step": 148248, "epoch": 3529} {"train_loss": -6.889004707336426, "global_step": 148249, "epoch": 3529} {"train_loss": -6.873702049255371, "global_step": 148250, "epoch": 3529} {"train_loss": -6.915650844573975, "global_step": 148251, "epoch": 3529} {"train_loss": -6.838744640350342, "global_step": 148252, "epoch": 3529} {"train_loss": -6.900113105773926, "global_step": 148253, "epoch": 3529} {"train_loss": -6.8820648193359375, "global_step": 148254, "epoch": 3529} {"train_loss": -6.873020172119141, "global_step": 148255, "epoch": 3529} {"train_loss": -6.818210601806641, "global_step": 148256, "epoch": 3529} {"train_loss": -6.861161708831787, "global_step": 148257, "epoch": 3529} {"train_loss": -6.856385707855225, "global_step": 148258, "epoch": 3529} {"train_loss": -6.834219262713478, "global_step": 148259, "epoch": 3529, "val_loss": 78455.2734375} {"train_loss": -6.87113094329834, "global_step": 148260, "epoch": 3530} {"train_loss": -6.8094964027404785, "global_step": 148261, "epoch": 3530} {"train_loss": -6.802265644073486, "global_step": 148262, "epoch": 3530} {"train_loss": -6.807225227355957, "global_step": 148263, "epoch": 3530} {"train_loss": -6.803596496582031, "global_step": 148264, "epoch": 3530} {"train_loss": -6.943658828735352, "global_step": 148265, "epoch": 3530} {"train_loss": -6.889923572540283, "global_step": 148266, "epoch": 3530} {"train_loss": -6.9168701171875, "global_step": 148267, "epoch": 3530} {"train_loss": -6.860898971557617, "global_step": 148268, "epoch": 3530} {"train_loss": -6.737898826599121, "global_step": 148269, "epoch": 3530} {"train_loss": -6.94172477722168, "global_step": 148270, "epoch": 3530} {"train_loss": -6.864339828491211, "global_step": 148271, "epoch": 3530} {"train_loss": -6.8292951583862305, "global_step": 148272, "epoch": 3530} {"train_loss": -6.951286315917969, "global_step": 148273, "epoch": 3530} {"train_loss": -6.928864479064941, "global_step": 148274, "epoch": 3530} {"train_loss": -6.882436752319336, "global_step": 148275, "epoch": 3530} {"train_loss": -6.819677352905273, "global_step": 148276, "epoch": 3530} {"train_loss": -6.8129963874816895, "global_step": 148277, "epoch": 3530} {"train_loss": -6.9138898849487305, "global_step": 148278, "epoch": 3530} {"train_loss": -6.832581520080566, "global_step": 148279, "epoch": 3530} {"train_loss": -6.91359281539917, "global_step": 148280, "epoch": 3530} {"train_loss": -6.912176132202148, "global_step": 148281, "epoch": 3530} {"train_loss": -6.828159809112549, "global_step": 148282, "epoch": 3530} {"train_loss": -6.851654529571533, "global_step": 148283, "epoch": 3530} {"train_loss": -6.777100563049316, "global_step": 148284, "epoch": 3530} {"train_loss": -6.897439479827881, "global_step": 148285, "epoch": 3530} {"train_loss": -6.937443733215332, "global_step": 148286, "epoch": 3530} {"train_loss": -6.945340156555176, "global_step": 148287, "epoch": 3530} {"train_loss": -6.925201416015625, "global_step": 148288, "epoch": 3530} {"train_loss": -6.923586845397949, "global_step": 148289, "epoch": 3530} {"train_loss": -6.813658237457275, "global_step": 148290, "epoch": 3530} {"train_loss": -6.9037580490112305, "global_step": 148291, "epoch": 3530} {"train_loss": -6.927945613861084, "global_step": 148292, "epoch": 3530} {"train_loss": -6.976236820220947, "global_step": 148293, "epoch": 3530} {"train_loss": -6.875513076782227, "global_step": 148294, "epoch": 3530} {"train_loss": -6.960553169250488, "global_step": 148295, "epoch": 3530} {"train_loss": -6.835926055908203, "global_step": 148296, "epoch": 3530} {"train_loss": -6.840916633605957, "global_step": 148297, "epoch": 3530} {"train_loss": -6.960052967071533, "global_step": 148298, "epoch": 3530} {"train_loss": -6.986464023590088, "global_step": 148299, "epoch": 3530} {"train_loss": -6.940670013427734, "global_step": 148300, "epoch": 3530} {"train_loss": -6.8809105441683815, "global_step": 148301, "epoch": 3530, "val_loss": 78281.7109375} {"train_loss": -6.844128608703613, "global_step": 148302, "epoch": 3531} {"train_loss": -6.973825454711914, "global_step": 148303, "epoch": 3531} {"train_loss": -6.940328598022461, "global_step": 148304, "epoch": 3531} {"train_loss": -6.987407684326172, "global_step": 148305, "epoch": 3531} {"train_loss": -6.951777935028076, "global_step": 148306, "epoch": 3531} {"train_loss": -6.952533721923828, "global_step": 148307, "epoch": 3531} {"train_loss": -6.8986639976501465, "global_step": 148308, "epoch": 3531} {"train_loss": -7.04985237121582, "global_step": 148309, "epoch": 3531} {"train_loss": -6.958823204040527, "global_step": 148310, "epoch": 3531} {"train_loss": -6.966436386108398, "global_step": 148311, "epoch": 3531} {"train_loss": -6.939566612243652, "global_step": 148312, "epoch": 3531} {"train_loss": -6.907494068145752, "global_step": 148313, "epoch": 3531} {"train_loss": -6.791947841644287, "global_step": 148314, "epoch": 3531} {"train_loss": -6.904506683349609, "global_step": 148315, "epoch": 3531} {"train_loss": -6.7765913009643555, "global_step": 148316, "epoch": 3531} {"train_loss": -6.840571403503418, "global_step": 148317, "epoch": 3531} {"train_loss": -6.940225124359131, "global_step": 148318, "epoch": 3531} {"train_loss": -6.85526180267334, "global_step": 148319, "epoch": 3531} {"train_loss": -6.881801605224609, "global_step": 148320, "epoch": 3531} {"train_loss": -6.8961591720581055, "global_step": 148321, "epoch": 3531} {"train_loss": -6.726037979125977, "global_step": 148322, "epoch": 3531} {"train_loss": -6.870267868041992, "global_step": 148323, "epoch": 3531} {"train_loss": -6.6850690841674805, "global_step": 148324, "epoch": 3531} {"train_loss": -6.633110523223877, "global_step": 148325, "epoch": 3531} {"train_loss": -6.608073711395264, "global_step": 148326, "epoch": 3531} {"train_loss": -6.839914798736572, "global_step": 148327, "epoch": 3531} {"train_loss": -6.582200527191162, "global_step": 148328, "epoch": 3531} {"train_loss": -6.725469589233398, "global_step": 148329, "epoch": 3531} {"train_loss": -6.810546875, "global_step": 148330, "epoch": 3531} {"train_loss": -6.771468162536621, "global_step": 148331, "epoch": 3531} {"train_loss": -6.859974384307861, "global_step": 148332, "epoch": 3531} {"train_loss": -6.840974807739258, "global_step": 148333, "epoch": 3531} {"train_loss": -6.702378749847412, "global_step": 148334, "epoch": 3531} {"train_loss": -6.809588432312012, "global_step": 148335, "epoch": 3531} {"train_loss": -6.836790084838867, "global_step": 148336, "epoch": 3531} {"train_loss": -6.909088134765625, "global_step": 148337, "epoch": 3531} {"train_loss": -6.838620662689209, "global_step": 148338, "epoch": 3531} {"train_loss": -6.879122257232666, "global_step": 148339, "epoch": 3531} {"train_loss": -6.783066749572754, "global_step": 148340, "epoch": 3531} {"train_loss": -6.852675437927246, "global_step": 148341, "epoch": 3531} {"train_loss": -6.878091812133789, "global_step": 148342, "epoch": 3531} {"train_loss": -6.84538399605524, "global_step": 148343, "epoch": 3531, "val_loss": 78732.4140625} {"train_loss": -6.922658920288086, "global_step": 148344, "epoch": 3532} {"train_loss": -6.955954551696777, "global_step": 148345, "epoch": 3532} {"train_loss": -6.795257091522217, "global_step": 148346, "epoch": 3532} {"train_loss": -6.89335823059082, "global_step": 148347, "epoch": 3532} {"train_loss": -6.888190269470215, "global_step": 148348, "epoch": 3532} {"train_loss": -6.966375350952148, "global_step": 148349, "epoch": 3532} {"train_loss": -6.928234100341797, "global_step": 148350, "epoch": 3532} {"train_loss": -6.882038593292236, "global_step": 148351, "epoch": 3532} {"train_loss": -6.83851432800293, "global_step": 148352, "epoch": 3532} {"train_loss": -6.930830478668213, "global_step": 148353, "epoch": 3532} {"train_loss": -6.76259708404541, "global_step": 148354, "epoch": 3532} {"train_loss": -6.762721061706543, "global_step": 148355, "epoch": 3532} {"train_loss": -6.888764381408691, "global_step": 148356, "epoch": 3532} {"train_loss": -6.831634998321533, "global_step": 148357, "epoch": 3532} {"train_loss": -6.893768787384033, "global_step": 148358, "epoch": 3532} {"train_loss": -6.868022918701172, "global_step": 148359, "epoch": 3532} {"train_loss": -6.866582870483398, "global_step": 148360, "epoch": 3532} {"train_loss": -6.874459266662598, "global_step": 148361, "epoch": 3532} {"train_loss": -6.796863555908203, "global_step": 148362, "epoch": 3532} {"train_loss": -6.860472679138184, "global_step": 148363, "epoch": 3532} {"train_loss": -6.815443992614746, "global_step": 148364, "epoch": 3532} {"train_loss": -6.8417205810546875, "global_step": 148365, "epoch": 3532} {"train_loss": -6.651555061340332, "global_step": 148366, "epoch": 3532} {"train_loss": -6.791102886199951, "global_step": 148367, "epoch": 3532} {"train_loss": -6.843605041503906, "global_step": 148368, "epoch": 3532} {"train_loss": -6.862575531005859, "global_step": 148369, "epoch": 3532} {"train_loss": -6.866896629333496, "global_step": 148370, "epoch": 3532} {"train_loss": -6.846356391906738, "global_step": 148371, "epoch": 3532} {"train_loss": -6.753653526306152, "global_step": 148372, "epoch": 3532} {"train_loss": -6.894174098968506, "global_step": 148373, "epoch": 3532} {"train_loss": -6.859677314758301, "global_step": 148374, "epoch": 3532} {"train_loss": -6.735200881958008, "global_step": 148375, "epoch": 3532} {"train_loss": -6.848258972167969, "global_step": 148376, "epoch": 3532} {"train_loss": -6.724003791809082, "global_step": 148377, "epoch": 3532} {"train_loss": -6.832717418670654, "global_step": 148378, "epoch": 3532} {"train_loss": -6.747730255126953, "global_step": 148379, "epoch": 3532} {"train_loss": -6.625832557678223, "global_step": 148380, "epoch": 3532} {"train_loss": -6.802239418029785, "global_step": 148381, "epoch": 3532} {"train_loss": -6.8855485916137695, "global_step": 148382, "epoch": 3532} {"train_loss": -6.682343482971191, "global_step": 148383, "epoch": 3532} {"train_loss": -6.867486000061035, "global_step": 148384, "epoch": 3532} {"train_loss": -6.831367015838623, "global_step": 148385, "epoch": 3532, "val_loss": 78528.2890625} {"train_loss": -6.74219274520874, "global_step": 148386, "epoch": 3533} {"train_loss": -6.737459659576416, "global_step": 148387, "epoch": 3533} {"train_loss": -6.836183547973633, "global_step": 148388, "epoch": 3533} {"train_loss": -6.803292751312256, "global_step": 148389, "epoch": 3533} {"train_loss": -6.840883255004883, "global_step": 148390, "epoch": 3533} {"train_loss": -6.795925140380859, "global_step": 148391, "epoch": 3533} {"train_loss": -6.780694961547852, "global_step": 148392, "epoch": 3533} {"train_loss": -6.731478691101074, "global_step": 148393, "epoch": 3533} {"train_loss": -6.925743103027344, "global_step": 148394, "epoch": 3533} {"train_loss": -6.749475479125977, "global_step": 148395, "epoch": 3533} {"train_loss": -6.686971187591553, "global_step": 148396, "epoch": 3533} {"train_loss": -6.889095306396484, "global_step": 148397, "epoch": 3533} {"train_loss": -6.866782188415527, "global_step": 148398, "epoch": 3533} {"train_loss": -6.794015884399414, "global_step": 148399, "epoch": 3533} {"train_loss": -6.789381980895996, "global_step": 148400, "epoch": 3533} {"train_loss": -6.951879978179932, "global_step": 148401, "epoch": 3533} {"train_loss": -6.842164039611816, "global_step": 148402, "epoch": 3533} {"train_loss": -6.813812732696533, "global_step": 148403, "epoch": 3533} {"train_loss": -6.878509521484375, "global_step": 148404, "epoch": 3533} {"train_loss": -6.889167308807373, "global_step": 148405, "epoch": 3533} {"train_loss": -6.7935261726379395, "global_step": 148406, "epoch": 3533} {"train_loss": -6.894357204437256, "global_step": 148407, "epoch": 3533} {"train_loss": -6.972776889801025, "global_step": 148408, "epoch": 3533} {"train_loss": -6.972174167633057, "global_step": 148409, "epoch": 3533} {"train_loss": -6.952888488769531, "global_step": 148410, "epoch": 3533} {"train_loss": -6.872685432434082, "global_step": 148411, "epoch": 3533} {"train_loss": -6.932701110839844, "global_step": 148412, "epoch": 3533} {"train_loss": -6.7739338874816895, "global_step": 148413, "epoch": 3533} {"train_loss": -6.860088348388672, "global_step": 148414, "epoch": 3533} {"train_loss": -6.817188739776611, "global_step": 148415, "epoch": 3533} {"train_loss": -6.901426315307617, "global_step": 148416, "epoch": 3533} {"train_loss": -6.819023132324219, "global_step": 148417, "epoch": 3533} {"train_loss": -6.885922431945801, "global_step": 148418, "epoch": 3533} {"train_loss": -6.703197002410889, "global_step": 148419, "epoch": 3533} {"train_loss": -6.8088531494140625, "global_step": 148420, "epoch": 3533} {"train_loss": -6.859561920166016, "global_step": 148421, "epoch": 3533} {"train_loss": -6.889894485473633, "global_step": 148422, "epoch": 3533} {"train_loss": -6.7852373123168945, "global_step": 148423, "epoch": 3533} {"train_loss": -6.906928062438965, "global_step": 148424, "epoch": 3533} {"train_loss": -6.823967933654785, "global_step": 148425, "epoch": 3533} {"train_loss": -6.978476047515869, "global_step": 148426, "epoch": 3533} {"train_loss": -6.843699625560215, "global_step": 148427, "epoch": 3533, "val_loss": 78602.9609375} {"train_loss": -6.882391929626465, "global_step": 148428, "epoch": 3534} {"train_loss": -6.915534019470215, "global_step": 148429, "epoch": 3534} {"train_loss": -6.824586868286133, "global_step": 148430, "epoch": 3534} {"train_loss": -6.883663654327393, "global_step": 148431, "epoch": 3534} {"train_loss": -6.880918502807617, "global_step": 148432, "epoch": 3534} {"train_loss": -6.843528747558594, "global_step": 148433, "epoch": 3534} {"train_loss": -6.944253921508789, "global_step": 148434, "epoch": 3534} {"train_loss": -6.883688449859619, "global_step": 148435, "epoch": 3534} {"train_loss": -6.783320426940918, "global_step": 148436, "epoch": 3534} {"train_loss": -6.891107082366943, "global_step": 148437, "epoch": 3534} {"train_loss": -6.962352752685547, "global_step": 148438, "epoch": 3534} {"train_loss": -6.878470420837402, "global_step": 148439, "epoch": 3534} {"train_loss": -6.897045135498047, "global_step": 148440, "epoch": 3534} {"train_loss": -6.90510368347168, "global_step": 148441, "epoch": 3534} {"train_loss": -6.810004234313965, "global_step": 148442, "epoch": 3534} {"train_loss": -6.784405708312988, "global_step": 148443, "epoch": 3534} {"train_loss": -6.794601917266846, "global_step": 148444, "epoch": 3534} {"train_loss": -7.0106658935546875, "global_step": 148445, "epoch": 3534} {"train_loss": -6.84077262878418, "global_step": 148446, "epoch": 3534} {"train_loss": -6.941106796264648, "global_step": 148447, "epoch": 3534} {"train_loss": -6.905725955963135, "global_step": 148448, "epoch": 3534} {"train_loss": -6.90595817565918, "global_step": 148449, "epoch": 3534} {"train_loss": -6.815739631652832, "global_step": 148450, "epoch": 3534} {"train_loss": -6.7863945960998535, "global_step": 148451, "epoch": 3534} {"train_loss": -6.8748860359191895, "global_step": 148452, "epoch": 3534} {"train_loss": -6.727244853973389, "global_step": 148453, "epoch": 3534} {"train_loss": -6.8783979415893555, "global_step": 148454, "epoch": 3534} {"train_loss": -6.881547927856445, "global_step": 148455, "epoch": 3534} {"train_loss": -6.851874351501465, "global_step": 148456, "epoch": 3534} {"train_loss": -6.8771491050720215, "global_step": 148457, "epoch": 3534} {"train_loss": -6.887435436248779, "global_step": 148458, "epoch": 3534} {"train_loss": -6.735486030578613, "global_step": 148459, "epoch": 3534} {"train_loss": -6.797784805297852, "global_step": 148460, "epoch": 3534} {"train_loss": -6.803818702697754, "global_step": 148461, "epoch": 3534} {"train_loss": -6.904864311218262, "global_step": 148462, "epoch": 3534} {"train_loss": -6.791797161102295, "global_step": 148463, "epoch": 3534} {"train_loss": -6.923700332641602, "global_step": 148464, "epoch": 3534} {"train_loss": -6.782552719116211, "global_step": 148465, "epoch": 3534} {"train_loss": -6.854687213897705, "global_step": 148466, "epoch": 3534} {"train_loss": -6.828016757965088, "global_step": 148467, "epoch": 3534} {"train_loss": -6.881486892700195, "global_step": 148468, "epoch": 3534} {"train_loss": -6.859953187760853, "global_step": 148469, "epoch": 3534, "val_loss": 78727.8515625} {"train_loss": -6.9322733879089355, "global_step": 148470, "epoch": 3535} {"train_loss": -6.8654327392578125, "global_step": 148471, "epoch": 3535} {"train_loss": -6.756226539611816, "global_step": 148472, "epoch": 3535} {"train_loss": -6.892099380493164, "global_step": 148473, "epoch": 3535} {"train_loss": -6.72874641418457, "global_step": 148474, "epoch": 3535} {"train_loss": -6.914899826049805, "global_step": 148475, "epoch": 3535} {"train_loss": -6.9238996505737305, "global_step": 148476, "epoch": 3535} {"train_loss": -6.836586952209473, "global_step": 148477, "epoch": 3535} {"train_loss": -6.80465030670166, "global_step": 148478, "epoch": 3535} {"train_loss": -6.817534446716309, "global_step": 148479, "epoch": 3535} {"train_loss": -6.858291149139404, "global_step": 148480, "epoch": 3535} {"train_loss": -6.945040225982666, "global_step": 148481, "epoch": 3535} {"train_loss": -6.938357830047607, "global_step": 148482, "epoch": 3535} {"train_loss": -6.796670436859131, "global_step": 148483, "epoch": 3535} {"train_loss": -6.878314971923828, "global_step": 148484, "epoch": 3535} {"train_loss": -6.814777374267578, "global_step": 148485, "epoch": 3535} {"train_loss": -6.778268337249756, "global_step": 148486, "epoch": 3535} {"train_loss": -6.811161994934082, "global_step": 148487, "epoch": 3535} {"train_loss": -6.837247371673584, "global_step": 148488, "epoch": 3535} {"train_loss": -6.752349853515625, "global_step": 148489, "epoch": 3535} {"train_loss": -6.893002033233643, "global_step": 148490, "epoch": 3535} {"train_loss": -6.6387834548950195, "global_step": 148491, "epoch": 3535} {"train_loss": -6.896840572357178, "global_step": 148492, "epoch": 3535} {"train_loss": -6.788349151611328, "global_step": 148493, "epoch": 3535} {"train_loss": -6.736652374267578, "global_step": 148494, "epoch": 3535} {"train_loss": -6.7557830810546875, "global_step": 148495, "epoch": 3535} {"train_loss": -6.829568862915039, "global_step": 148496, "epoch": 3535} {"train_loss": -6.872949600219727, "global_step": 148497, "epoch": 3535} {"train_loss": -6.780416965484619, "global_step": 148498, "epoch": 3535} {"train_loss": -6.822245121002197, "global_step": 148499, "epoch": 3535} {"train_loss": -6.889476299285889, "global_step": 148500, "epoch": 3535} {"train_loss": -6.867714881896973, "global_step": 148501, "epoch": 3535} {"train_loss": -6.809403896331787, "global_step": 148502, "epoch": 3535} {"train_loss": -6.744407653808594, "global_step": 148503, "epoch": 3535} {"train_loss": -6.808880805969238, "global_step": 148504, "epoch": 3535} {"train_loss": -6.709474086761475, "global_step": 148505, "epoch": 3535} {"train_loss": -6.731383323669434, "global_step": 148506, "epoch": 3535} {"train_loss": -6.772634983062744, "global_step": 148507, "epoch": 3535} {"train_loss": -6.697678565979004, "global_step": 148508, "epoch": 3535} {"train_loss": -6.8836870193481445, "global_step": 148509, "epoch": 3535} {"train_loss": -6.5476579666137695, "global_step": 148510, "epoch": 3535} {"train_loss": -6.8158425490061445, "global_step": 148511, "epoch": 3535, "val_loss": 79068.953125} {"train_loss": -6.748199462890625, "global_step": 148512, "epoch": 3536} {"train_loss": -6.878835678100586, "global_step": 148513, "epoch": 3536} {"train_loss": -6.838939666748047, "global_step": 148514, "epoch": 3536} {"train_loss": -6.935555458068848, "global_step": 148515, "epoch": 3536} {"train_loss": -6.759873390197754, "global_step": 148516, "epoch": 3536} {"train_loss": -6.755060195922852, "global_step": 148517, "epoch": 3536} {"train_loss": -6.845375061035156, "global_step": 148518, "epoch": 3536} {"train_loss": -6.8755388259887695, "global_step": 148519, "epoch": 3536} {"train_loss": -6.871670246124268, "global_step": 148520, "epoch": 3536} {"train_loss": -6.885500907897949, "global_step": 148521, "epoch": 3536} {"train_loss": -6.863946914672852, "global_step": 148522, "epoch": 3536} {"train_loss": -6.823294639587402, "global_step": 148523, "epoch": 3536} {"train_loss": -6.833388328552246, "global_step": 148524, "epoch": 3536} {"train_loss": -6.862280368804932, "global_step": 148525, "epoch": 3536} {"train_loss": -6.832505226135254, "global_step": 148526, "epoch": 3536} {"train_loss": -6.856100082397461, "global_step": 148527, "epoch": 3536} {"train_loss": -6.890388488769531, "global_step": 148528, "epoch": 3536} {"train_loss": -6.875443935394287, "global_step": 148529, "epoch": 3536} {"train_loss": -6.926979064941406, "global_step": 148530, "epoch": 3536} {"train_loss": -6.846600532531738, "global_step": 148531, "epoch": 3536} {"train_loss": -6.89412784576416, "global_step": 148532, "epoch": 3536} {"train_loss": -6.815651893615723, "global_step": 148533, "epoch": 3536} {"train_loss": -6.882345199584961, "global_step": 148534, "epoch": 3536} {"train_loss": -6.809109687805176, "global_step": 148535, "epoch": 3536} {"train_loss": -6.839249134063721, "global_step": 148536, "epoch": 3536} {"train_loss": -6.914833068847656, "global_step": 148537, "epoch": 3536} {"train_loss": -6.8831071853637695, "global_step": 148538, "epoch": 3536} {"train_loss": -6.853823661804199, "global_step": 148539, "epoch": 3536} {"train_loss": -6.788094520568848, "global_step": 148540, "epoch": 3536} {"train_loss": -6.812809944152832, "global_step": 148541, "epoch": 3536} {"train_loss": -6.944411277770996, "global_step": 148542, "epoch": 3536} {"train_loss": -6.793532848358154, "global_step": 148543, "epoch": 3536} {"train_loss": -6.783646106719971, "global_step": 148544, "epoch": 3536} {"train_loss": -6.844595909118652, "global_step": 148545, "epoch": 3536} {"train_loss": -6.6673665046691895, "global_step": 148546, "epoch": 3536} {"train_loss": -6.794602870941162, "global_step": 148547, "epoch": 3536} {"train_loss": -6.890687942504883, "global_step": 148548, "epoch": 3536} {"train_loss": -6.729122638702393, "global_step": 148549, "epoch": 3536} {"train_loss": -6.780379295349121, "global_step": 148550, "epoch": 3536} {"train_loss": -6.805135726928711, "global_step": 148551, "epoch": 3536} {"train_loss": -6.791092395782471, "global_step": 148552, "epoch": 3536} {"train_loss": -6.8371608938489645, "global_step": 148553, "epoch": 3536, "val_loss": 78998.796875} {"train_loss": -6.796810150146484, "global_step": 148554, "epoch": 3537} {"train_loss": -6.736410140991211, "global_step": 148555, "epoch": 3537} {"train_loss": -6.679995536804199, "global_step": 148556, "epoch": 3537} {"train_loss": -6.7815093994140625, "global_step": 148557, "epoch": 3537} {"train_loss": -6.725484848022461, "global_step": 148558, "epoch": 3537} {"train_loss": -6.834894180297852, "global_step": 148559, "epoch": 3537} {"train_loss": -6.695889472961426, "global_step": 148560, "epoch": 3537} {"train_loss": -6.728619575500488, "global_step": 148561, "epoch": 3537} {"train_loss": -6.79043436050415, "global_step": 148562, "epoch": 3537} {"train_loss": -6.758818626403809, "global_step": 148563, "epoch": 3537} {"train_loss": -6.832735061645508, "global_step": 148564, "epoch": 3537} {"train_loss": -6.717284679412842, "global_step": 148565, "epoch": 3537} {"train_loss": -6.757658958435059, "global_step": 148566, "epoch": 3537} {"train_loss": -6.872788429260254, "global_step": 148567, "epoch": 3537} {"train_loss": -6.870233058929443, "global_step": 148568, "epoch": 3537} {"train_loss": -6.901121139526367, "global_step": 148569, "epoch": 3537} {"train_loss": -6.858423709869385, "global_step": 148570, "epoch": 3537} {"train_loss": -6.705438613891602, "global_step": 148571, "epoch": 3537} {"train_loss": -6.874990463256836, "global_step": 148572, "epoch": 3537} {"train_loss": -6.769133567810059, "global_step": 148573, "epoch": 3537} {"train_loss": -6.773722171783447, "global_step": 148574, "epoch": 3537} {"train_loss": -6.816996097564697, "global_step": 148575, "epoch": 3537} {"train_loss": -6.791053771972656, "global_step": 148576, "epoch": 3537} {"train_loss": -6.835447788238525, "global_step": 148577, "epoch": 3537} {"train_loss": -6.89731502532959, "global_step": 148578, "epoch": 3537} {"train_loss": -6.938982009887695, "global_step": 148579, "epoch": 3537} {"train_loss": -6.8391642570495605, "global_step": 148580, "epoch": 3537} {"train_loss": -6.843679904937744, "global_step": 148581, "epoch": 3537} {"train_loss": -6.829405784606934, "global_step": 148582, "epoch": 3537} {"train_loss": -6.867959022521973, "global_step": 148583, "epoch": 3537} {"train_loss": -6.838808059692383, "global_step": 148584, "epoch": 3537} {"train_loss": -6.866350173950195, "global_step": 148585, "epoch": 3537} {"train_loss": -6.762820243835449, "global_step": 148586, "epoch": 3537} {"train_loss": -6.752036094665527, "global_step": 148587, "epoch": 3537} {"train_loss": -6.882112979888916, "global_step": 148588, "epoch": 3537} {"train_loss": -6.794144630432129, "global_step": 148589, "epoch": 3537} {"train_loss": -6.895504474639893, "global_step": 148590, "epoch": 3537} {"train_loss": -6.819498062133789, "global_step": 148591, "epoch": 3537} {"train_loss": -6.729501724243164, "global_step": 148592, "epoch": 3537} {"train_loss": -6.837093353271484, "global_step": 148593, "epoch": 3537} {"train_loss": -6.758539199829102, "global_step": 148594, "epoch": 3537} {"train_loss": -6.807926995413644, "global_step": 148595, "epoch": 3537, "val_loss": 78628.3046875} {"train_loss": -6.778334140777588, "global_step": 148596, "epoch": 3538} {"train_loss": -6.8122053146362305, "global_step": 148597, "epoch": 3538} {"train_loss": -6.775632858276367, "global_step": 148598, "epoch": 3538} {"train_loss": -6.815478324890137, "global_step": 148599, "epoch": 3538} {"train_loss": -6.682035446166992, "global_step": 148600, "epoch": 3538} {"train_loss": -6.750081539154053, "global_step": 148601, "epoch": 3538} {"train_loss": -6.702923774719238, "global_step": 148602, "epoch": 3538} {"train_loss": -6.789115905761719, "global_step": 148603, "epoch": 3538} {"train_loss": -6.840609550476074, "global_step": 148604, "epoch": 3538} {"train_loss": -6.875290393829346, "global_step": 148605, "epoch": 3538} {"train_loss": -6.825009822845459, "global_step": 148606, "epoch": 3538} {"train_loss": -6.849077224731445, "global_step": 148607, "epoch": 3538} {"train_loss": -6.755136489868164, "global_step": 148608, "epoch": 3538} {"train_loss": -6.9158854484558105, "global_step": 148609, "epoch": 3538} {"train_loss": -6.787168502807617, "global_step": 148610, "epoch": 3538} {"train_loss": -6.830032825469971, "global_step": 148611, "epoch": 3538} {"train_loss": -6.783496379852295, "global_step": 148612, "epoch": 3538} {"train_loss": -6.810199737548828, "global_step": 148613, "epoch": 3538} {"train_loss": -6.98079776763916, "global_step": 148614, "epoch": 3538} {"train_loss": -6.926522254943848, "global_step": 148615, "epoch": 3538} {"train_loss": -6.875810623168945, "global_step": 148616, "epoch": 3538} {"train_loss": -6.83072566986084, "global_step": 148617, "epoch": 3538} {"train_loss": -6.840734481811523, "global_step": 148618, "epoch": 3538} {"train_loss": -6.895170211791992, "global_step": 148619, "epoch": 3538} {"train_loss": -6.888526916503906, "global_step": 148620, "epoch": 3538} {"train_loss": -6.779799461364746, "global_step": 148621, "epoch": 3538} {"train_loss": -6.836390495300293, "global_step": 148622, "epoch": 3538} {"train_loss": -6.881194114685059, "global_step": 148623, "epoch": 3538} {"train_loss": -6.926828861236572, "global_step": 148624, "epoch": 3538} {"train_loss": -6.95616340637207, "global_step": 148625, "epoch": 3538} {"train_loss": -6.888169288635254, "global_step": 148626, "epoch": 3538} {"train_loss": -6.882902145385742, "global_step": 148627, "epoch": 3538} {"train_loss": -6.917740345001221, "global_step": 148628, "epoch": 3538} {"train_loss": -6.867818355560303, "global_step": 148629, "epoch": 3538} {"train_loss": -7.026848793029785, "global_step": 148630, "epoch": 3538} {"train_loss": -6.893215179443359, "global_step": 148631, "epoch": 3538} {"train_loss": -6.860701560974121, "global_step": 148632, "epoch": 3538} {"train_loss": -6.719987869262695, "global_step": 148633, "epoch": 3538} {"train_loss": -6.747594833374023, "global_step": 148634, "epoch": 3538} {"train_loss": -7.001449108123779, "global_step": 148635, "epoch": 3538} {"train_loss": -6.8712029457092285, "global_step": 148636, "epoch": 3538} {"train_loss": -6.844684010460263, "global_step": 148637, "epoch": 3538, "val_loss": 78652.953125} {"train_loss": -6.925773620605469, "global_step": 148638, "epoch": 3539} {"train_loss": -6.711127281188965, "global_step": 148639, "epoch": 3539} {"train_loss": -6.864443302154541, "global_step": 148640, "epoch": 3539} {"train_loss": -6.754714012145996, "global_step": 148641, "epoch": 3539} {"train_loss": -6.690958023071289, "global_step": 148642, "epoch": 3539} {"train_loss": -6.836496353149414, "global_step": 148643, "epoch": 3539} {"train_loss": -6.656927585601807, "global_step": 148644, "epoch": 3539} {"train_loss": -6.689630508422852, "global_step": 148645, "epoch": 3539} {"train_loss": -6.834964752197266, "global_step": 148646, "epoch": 3539} {"train_loss": -6.789309501647949, "global_step": 148647, "epoch": 3539} {"train_loss": -6.7181901931762695, "global_step": 148648, "epoch": 3539} {"train_loss": -6.675205230712891, "global_step": 148649, "epoch": 3539} {"train_loss": -6.772390365600586, "global_step": 148650, "epoch": 3539} {"train_loss": -6.7234086990356445, "global_step": 148651, "epoch": 3539} {"train_loss": -6.758109092712402, "global_step": 148652, "epoch": 3539} {"train_loss": -6.736899375915527, "global_step": 148653, "epoch": 3539} {"train_loss": -6.820737838745117, "global_step": 148654, "epoch": 3539} {"train_loss": -6.770224571228027, "global_step": 148655, "epoch": 3539} {"train_loss": -6.887129783630371, "global_step": 148656, "epoch": 3539} {"train_loss": -6.728316307067871, "global_step": 148657, "epoch": 3539} {"train_loss": -6.7572174072265625, "global_step": 148658, "epoch": 3539} {"train_loss": -6.7156524658203125, "global_step": 148659, "epoch": 3539} {"train_loss": -6.7895097732543945, "global_step": 148660, "epoch": 3539} {"train_loss": -6.80996036529541, "global_step": 148661, "epoch": 3539} {"train_loss": -6.8095197677612305, "global_step": 148662, "epoch": 3539} {"train_loss": -6.839852809906006, "global_step": 148663, "epoch": 3539} {"train_loss": -6.878844261169434, "global_step": 148664, "epoch": 3539} {"train_loss": -6.871381759643555, "global_step": 148665, "epoch": 3539} {"train_loss": -6.950888156890869, "global_step": 148666, "epoch": 3539} {"train_loss": -6.842692852020264, "global_step": 148667, "epoch": 3539} {"train_loss": -6.895072937011719, "global_step": 148668, "epoch": 3539} {"train_loss": -6.856559753417969, "global_step": 148669, "epoch": 3539} {"train_loss": -6.970347881317139, "global_step": 148670, "epoch": 3539} {"train_loss": -6.8806610107421875, "global_step": 148671, "epoch": 3539} {"train_loss": -6.842257499694824, "global_step": 148672, "epoch": 3539} {"train_loss": -6.857998371124268, "global_step": 148673, "epoch": 3539} {"train_loss": -6.780251979827881, "global_step": 148674, "epoch": 3539} {"train_loss": -6.754425048828125, "global_step": 148675, "epoch": 3539} {"train_loss": -6.837588310241699, "global_step": 148676, "epoch": 3539} {"train_loss": -6.837376594543457, "global_step": 148677, "epoch": 3539} {"train_loss": -6.714508533477783, "global_step": 148678, "epoch": 3539} {"train_loss": -6.803252413159325, "global_step": 148679, "epoch": 3539, "val_loss": 78651.8515625} {"train_loss": -6.848480701446533, "global_step": 148680, "epoch": 3540} {"train_loss": -6.727977275848389, "global_step": 148681, "epoch": 3540} {"train_loss": -6.877322196960449, "global_step": 148682, "epoch": 3540} {"train_loss": -6.951892852783203, "global_step": 148683, "epoch": 3540} {"train_loss": -6.740520477294922, "global_step": 148684, "epoch": 3540} {"train_loss": -6.823290824890137, "global_step": 148685, "epoch": 3540} {"train_loss": -6.898747444152832, "global_step": 148686, "epoch": 3540} {"train_loss": -6.73946475982666, "global_step": 148687, "epoch": 3540} {"train_loss": -6.904676914215088, "global_step": 148688, "epoch": 3540} {"train_loss": -6.8786516189575195, "global_step": 148689, "epoch": 3540} {"train_loss": -6.715574264526367, "global_step": 148690, "epoch": 3540} {"train_loss": -6.811582565307617, "global_step": 148691, "epoch": 3540} {"train_loss": -6.907729148864746, "global_step": 148692, "epoch": 3540} {"train_loss": -6.804207801818848, "global_step": 148693, "epoch": 3540} {"train_loss": -6.827320098876953, "global_step": 148694, "epoch": 3540} {"train_loss": -6.819662094116211, "global_step": 148695, "epoch": 3540} {"train_loss": -6.719002723693848, "global_step": 148696, "epoch": 3540} {"train_loss": -6.814364433288574, "global_step": 148697, "epoch": 3540} {"train_loss": -6.788097381591797, "global_step": 148698, "epoch": 3540} {"train_loss": -6.826793670654297, "global_step": 148699, "epoch": 3540} {"train_loss": -6.870857238769531, "global_step": 148700, "epoch": 3540} {"train_loss": -6.8260040283203125, "global_step": 148701, "epoch": 3540} {"train_loss": -6.7763543128967285, "global_step": 148702, "epoch": 3540} {"train_loss": -6.8140034675598145, "global_step": 148703, "epoch": 3540} {"train_loss": -6.825340270996094, "global_step": 148704, "epoch": 3540} {"train_loss": -6.901494979858398, "global_step": 148705, "epoch": 3540} {"train_loss": -6.855565071105957, "global_step": 148706, "epoch": 3540} {"train_loss": -6.831526279449463, "global_step": 148707, "epoch": 3540} {"train_loss": -6.762820243835449, "global_step": 148708, "epoch": 3540} {"train_loss": -6.789865493774414, "global_step": 148709, "epoch": 3540} {"train_loss": -7.0342698097229, "global_step": 148710, "epoch": 3540} {"train_loss": -6.7972025871276855, "global_step": 148711, "epoch": 3540} {"train_loss": -7.043562889099121, "global_step": 148712, "epoch": 3540} {"train_loss": -6.925731658935547, "global_step": 148713, "epoch": 3540} {"train_loss": -6.883906364440918, "global_step": 148714, "epoch": 3540} {"train_loss": -6.874375343322754, "global_step": 148715, "epoch": 3540} {"train_loss": -6.914788246154785, "global_step": 148716, "epoch": 3540} {"train_loss": -6.809340476989746, "global_step": 148717, "epoch": 3540} {"train_loss": -7.0084228515625, "global_step": 148718, "epoch": 3540} {"train_loss": -7.034582138061523, "global_step": 148719, "epoch": 3540} {"train_loss": -6.943842887878418, "global_step": 148720, "epoch": 3540} {"train_loss": -6.855339027586437, "global_step": 148721, "epoch": 3540, "val_loss": 78586.2890625} {"train_loss": -6.8862457275390625, "global_step": 148722, "epoch": 3541} {"train_loss": -6.733055114746094, "global_step": 148723, "epoch": 3541} {"train_loss": -6.801947593688965, "global_step": 148724, "epoch": 3541} {"train_loss": -6.938704490661621, "global_step": 148725, "epoch": 3541} {"train_loss": -6.855510711669922, "global_step": 148726, "epoch": 3541} {"train_loss": -6.8172101974487305, "global_step": 148727, "epoch": 3541} {"train_loss": -6.92764949798584, "global_step": 148728, "epoch": 3541} {"train_loss": -6.829148292541504, "global_step": 148729, "epoch": 3541} {"train_loss": -6.80104398727417, "global_step": 148730, "epoch": 3541} {"train_loss": -6.919092655181885, "global_step": 148731, "epoch": 3541} {"train_loss": -6.879523277282715, "global_step": 148732, "epoch": 3541} {"train_loss": -6.852729320526123, "global_step": 148733, "epoch": 3541} {"train_loss": -6.806953430175781, "global_step": 148734, "epoch": 3541} {"train_loss": -6.838037490844727, "global_step": 148735, "epoch": 3541} {"train_loss": -6.979517936706543, "global_step": 148736, "epoch": 3541} {"train_loss": -6.881344795227051, "global_step": 148737, "epoch": 3541} {"train_loss": -6.865306854248047, "global_step": 148738, "epoch": 3541} {"train_loss": -6.858010292053223, "global_step": 148739, "epoch": 3541} {"train_loss": -6.879328727722168, "global_step": 148740, "epoch": 3541} {"train_loss": -6.8772358894348145, "global_step": 148741, "epoch": 3541} {"train_loss": -6.9027509689331055, "global_step": 148742, "epoch": 3541} {"train_loss": -6.875424385070801, "global_step": 148743, "epoch": 3541} {"train_loss": -6.846606254577637, "global_step": 148744, "epoch": 3541} {"train_loss": -6.928634166717529, "global_step": 148745, "epoch": 3541} {"train_loss": -6.678524494171143, "global_step": 148746, "epoch": 3541} {"train_loss": -6.5722503662109375, "global_step": 148747, "epoch": 3541} {"train_loss": -6.936803817749023, "global_step": 148748, "epoch": 3541} {"train_loss": -6.713141441345215, "global_step": 148749, "epoch": 3541} {"train_loss": -6.768893718719482, "global_step": 148750, "epoch": 3541} {"train_loss": -6.9027581214904785, "global_step": 148751, "epoch": 3541} {"train_loss": -6.680973529815674, "global_step": 148752, "epoch": 3541} {"train_loss": -6.838034629821777, "global_step": 148753, "epoch": 3541} {"train_loss": -6.845867156982422, "global_step": 148754, "epoch": 3541} {"train_loss": -6.759809494018555, "global_step": 148755, "epoch": 3541} {"train_loss": -6.984495162963867, "global_step": 148756, "epoch": 3541} {"train_loss": -6.849872589111328, "global_step": 148757, "epoch": 3541} {"train_loss": -6.817601203918457, "global_step": 148758, "epoch": 3541} {"train_loss": -6.8433709144592285, "global_step": 148759, "epoch": 3541} {"train_loss": -6.827157974243164, "global_step": 148760, "epoch": 3541} {"train_loss": -6.90256404876709, "global_step": 148761, "epoch": 3541} {"train_loss": -6.862224578857422, "global_step": 148762, "epoch": 3541} {"train_loss": -6.843147028060186, "global_step": 148763, "epoch": 3541, "val_loss": 78507.9140625} {"train_loss": -6.987260818481445, "global_step": 148764, "epoch": 3542} {"train_loss": -6.841897964477539, "global_step": 148765, "epoch": 3542} {"train_loss": -6.834430694580078, "global_step": 148766, "epoch": 3542} {"train_loss": -6.822770118713379, "global_step": 148767, "epoch": 3542} {"train_loss": -6.856400489807129, "global_step": 148768, "epoch": 3542} {"train_loss": -6.889377593994141, "global_step": 148769, "epoch": 3542} {"train_loss": -6.853116512298584, "global_step": 148770, "epoch": 3542} {"train_loss": -6.793957710266113, "global_step": 148771, "epoch": 3542} {"train_loss": -6.760608673095703, "global_step": 148772, "epoch": 3542} {"train_loss": -6.935198783874512, "global_step": 148773, "epoch": 3542} {"train_loss": -6.848658561706543, "global_step": 148774, "epoch": 3542} {"train_loss": -6.737004280090332, "global_step": 148775, "epoch": 3542} {"train_loss": -6.912021636962891, "global_step": 148776, "epoch": 3542} {"train_loss": -6.934771537780762, "global_step": 148777, "epoch": 3542} {"train_loss": -6.777897834777832, "global_step": 148778, "epoch": 3542} {"train_loss": -6.8595709800720215, "global_step": 148779, "epoch": 3542} {"train_loss": -6.8335957527160645, "global_step": 148780, "epoch": 3542} {"train_loss": -6.843351364135742, "global_step": 148781, "epoch": 3542} {"train_loss": -6.808476448059082, "global_step": 148782, "epoch": 3542} {"train_loss": -6.612724304199219, "global_step": 148783, "epoch": 3542} {"train_loss": -6.755403995513916, "global_step": 148784, "epoch": 3542} {"train_loss": -6.7598395347595215, "global_step": 148785, "epoch": 3542} {"train_loss": -6.761152267456055, "global_step": 148786, "epoch": 3542} {"train_loss": -6.817380905151367, "global_step": 148787, "epoch": 3542} {"train_loss": -6.764996528625488, "global_step": 148788, "epoch": 3542} {"train_loss": -6.915567874908447, "global_step": 148789, "epoch": 3542} {"train_loss": -6.782409191131592, "global_step": 148790, "epoch": 3542} {"train_loss": -6.829967498779297, "global_step": 148791, "epoch": 3542} {"train_loss": -6.792762756347656, "global_step": 148792, "epoch": 3542} {"train_loss": -6.9304399490356445, "global_step": 148793, "epoch": 3542} {"train_loss": -6.78981876373291, "global_step": 148794, "epoch": 3542} {"train_loss": -6.875235557556152, "global_step": 148795, "epoch": 3542} {"train_loss": -6.8785295486450195, "global_step": 148796, "epoch": 3542} {"train_loss": -6.8266425132751465, "global_step": 148797, "epoch": 3542} {"train_loss": -6.871275424957275, "global_step": 148798, "epoch": 3542} {"train_loss": -6.945492744445801, "global_step": 148799, "epoch": 3542} {"train_loss": -6.819949150085449, "global_step": 148800, "epoch": 3542} {"train_loss": -6.884942054748535, "global_step": 148801, "epoch": 3542} {"train_loss": -6.828351020812988, "global_step": 148802, "epoch": 3542} {"train_loss": -6.741177558898926, "global_step": 148803, "epoch": 3542} {"train_loss": -6.816122055053711, "global_step": 148804, "epoch": 3542} {"train_loss": -6.832453262238276, "global_step": 148805, "epoch": 3542, "val_loss": 78609.0390625} {"train_loss": -6.870880126953125, "global_step": 148806, "epoch": 3543} {"train_loss": -6.771361351013184, "global_step": 148807, "epoch": 3543} {"train_loss": -6.609738826751709, "global_step": 148808, "epoch": 3543} {"train_loss": -6.775385856628418, "global_step": 148809, "epoch": 3543} {"train_loss": -7.04931116104126, "global_step": 148810, "epoch": 3543} {"train_loss": -6.597855567932129, "global_step": 148811, "epoch": 3543} {"train_loss": -6.718033790588379, "global_step": 148812, "epoch": 3543} {"train_loss": -6.903565883636475, "global_step": 148813, "epoch": 3543} {"train_loss": -6.688972473144531, "global_step": 148814, "epoch": 3543} {"train_loss": -6.816947937011719, "global_step": 148815, "epoch": 3543} {"train_loss": -6.655213356018066, "global_step": 148816, "epoch": 3543} {"train_loss": -6.794354438781738, "global_step": 148817, "epoch": 3543} {"train_loss": -6.720456123352051, "global_step": 148818, "epoch": 3543} {"train_loss": -6.784638404846191, "global_step": 148819, "epoch": 3543} {"train_loss": -6.880168437957764, "global_step": 148820, "epoch": 3543} {"train_loss": -6.712642669677734, "global_step": 148821, "epoch": 3543} {"train_loss": -6.768672943115234, "global_step": 148822, "epoch": 3543} {"train_loss": -6.696706295013428, "global_step": 148823, "epoch": 3543} {"train_loss": -6.740746021270752, "global_step": 148824, "epoch": 3543} {"train_loss": -6.684144973754883, "global_step": 148825, "epoch": 3543} {"train_loss": -6.792870998382568, "global_step": 148826, "epoch": 3543} {"train_loss": -6.867955207824707, "global_step": 148827, "epoch": 3543} {"train_loss": -6.878678321838379, "global_step": 148828, "epoch": 3543} {"train_loss": -6.893527984619141, "global_step": 148829, "epoch": 3543} {"train_loss": -6.850534439086914, "global_step": 148830, "epoch": 3543} {"train_loss": -7.009184837341309, "global_step": 148831, "epoch": 3543} {"train_loss": -6.826909065246582, "global_step": 148832, "epoch": 3543} {"train_loss": -6.868032455444336, "global_step": 148833, "epoch": 3543} {"train_loss": -6.869019508361816, "global_step": 148834, "epoch": 3543} {"train_loss": -6.792666912078857, "global_step": 148835, "epoch": 3543} {"train_loss": -6.8575239181518555, "global_step": 148836, "epoch": 3543} {"train_loss": -6.735197067260742, "global_step": 148837, "epoch": 3543} {"train_loss": -6.797755241394043, "global_step": 148838, "epoch": 3543} {"train_loss": -6.829832077026367, "global_step": 148839, "epoch": 3543} {"train_loss": -6.8629469871521, "global_step": 148840, "epoch": 3543} {"train_loss": -6.871955871582031, "global_step": 148841, "epoch": 3543} {"train_loss": -6.873329162597656, "global_step": 148842, "epoch": 3543} {"train_loss": -6.893471717834473, "global_step": 148843, "epoch": 3543} {"train_loss": -6.860593795776367, "global_step": 148844, "epoch": 3543} {"train_loss": -6.854996681213379, "global_step": 148845, "epoch": 3543} {"train_loss": -6.844913482666016, "global_step": 148846, "epoch": 3543} {"train_loss": -6.8109288556235175, "global_step": 148847, "epoch": 3543, "val_loss": 78682.0390625} {"train_loss": -6.958559989929199, "global_step": 148848, "epoch": 3544} {"train_loss": -6.808429718017578, "global_step": 148849, "epoch": 3544} {"train_loss": -6.94458532333374, "global_step": 148850, "epoch": 3544} {"train_loss": -6.875599384307861, "global_step": 148851, "epoch": 3544} {"train_loss": -6.9113922119140625, "global_step": 148852, "epoch": 3544} {"train_loss": -6.859262466430664, "global_step": 148853, "epoch": 3544} {"train_loss": -6.831496238708496, "global_step": 148854, "epoch": 3544} {"train_loss": -6.85825252532959, "global_step": 148855, "epoch": 3544} {"train_loss": -6.836870193481445, "global_step": 148856, "epoch": 3544} {"train_loss": -6.938622951507568, "global_step": 148857, "epoch": 3544} {"train_loss": -6.851768970489502, "global_step": 148858, "epoch": 3544} {"train_loss": -6.8644256591796875, "global_step": 148859, "epoch": 3544} {"train_loss": -7.002871513366699, "global_step": 148860, "epoch": 3544} {"train_loss": -6.940001487731934, "global_step": 148861, "epoch": 3544} {"train_loss": -6.8842315673828125, "global_step": 148862, "epoch": 3544} {"train_loss": -6.875547409057617, "global_step": 148863, "epoch": 3544} {"train_loss": -6.9450364112854, "global_step": 148864, "epoch": 3544} {"train_loss": -6.90921688079834, "global_step": 148865, "epoch": 3544} {"train_loss": -6.956987380981445, "global_step": 148866, "epoch": 3544} {"train_loss": -6.990532875061035, "global_step": 148867, "epoch": 3544} {"train_loss": -6.796872138977051, "global_step": 148868, "epoch": 3544} {"train_loss": -6.956070899963379, "global_step": 148869, "epoch": 3544} {"train_loss": -6.90169620513916, "global_step": 148870, "epoch": 3544} {"train_loss": -6.723954677581787, "global_step": 148871, "epoch": 3544} {"train_loss": -6.875856876373291, "global_step": 148872, "epoch": 3544} {"train_loss": -6.872274398803711, "global_step": 148873, "epoch": 3544} {"train_loss": -6.818284034729004, "global_step": 148874, "epoch": 3544} {"train_loss": -6.906848907470703, "global_step": 148875, "epoch": 3544} {"train_loss": -6.868655204772949, "global_step": 148876, "epoch": 3544} {"train_loss": -6.977006912231445, "global_step": 148877, "epoch": 3544} {"train_loss": -6.84252405166626, "global_step": 148878, "epoch": 3544} {"train_loss": -6.881687641143799, "global_step": 148879, "epoch": 3544} {"train_loss": -6.861230373382568, "global_step": 148880, "epoch": 3544} {"train_loss": -6.897838592529297, "global_step": 148881, "epoch": 3544} {"train_loss": -6.790180206298828, "global_step": 148882, "epoch": 3544} {"train_loss": -6.904701232910156, "global_step": 148883, "epoch": 3544} {"train_loss": -7.0079851150512695, "global_step": 148884, "epoch": 3544} {"train_loss": -6.864392280578613, "global_step": 148885, "epoch": 3544} {"train_loss": -6.860891342163086, "global_step": 148886, "epoch": 3544} {"train_loss": -6.939988136291504, "global_step": 148887, "epoch": 3544} {"train_loss": -6.7685723304748535, "global_step": 148888, "epoch": 3544} {"train_loss": -6.8872880935668945, "global_step": 148889, "epoch": 3544, "val_loss": 78792.4609375} {"train_loss": -6.956911087036133, "global_step": 148890, "epoch": 3545} {"train_loss": -6.858603477478027, "global_step": 148891, "epoch": 3545} {"train_loss": -7.005780220031738, "global_step": 148892, "epoch": 3545} {"train_loss": -6.859487056732178, "global_step": 148893, "epoch": 3545} {"train_loss": -6.876684188842773, "global_step": 148894, "epoch": 3545} {"train_loss": -6.98331356048584, "global_step": 148895, "epoch": 3545} {"train_loss": -6.864812850952148, "global_step": 148896, "epoch": 3545} {"train_loss": -6.835968017578125, "global_step": 148897, "epoch": 3545} {"train_loss": -6.96425199508667, "global_step": 148898, "epoch": 3545} {"train_loss": -6.764572620391846, "global_step": 148899, "epoch": 3545} {"train_loss": -6.725020408630371, "global_step": 148900, "epoch": 3545} {"train_loss": -6.952365875244141, "global_step": 148901, "epoch": 3545} {"train_loss": -6.732346534729004, "global_step": 148902, "epoch": 3545} {"train_loss": -6.662192344665527, "global_step": 148903, "epoch": 3545} {"train_loss": -6.835589408874512, "global_step": 148904, "epoch": 3545} {"train_loss": -6.843138694763184, "global_step": 148905, "epoch": 3545} {"train_loss": -6.8712921142578125, "global_step": 148906, "epoch": 3545} {"train_loss": -6.871678829193115, "global_step": 148907, "epoch": 3545} {"train_loss": -6.698920249938965, "global_step": 148908, "epoch": 3545} {"train_loss": -6.839308261871338, "global_step": 148909, "epoch": 3545} {"train_loss": -6.794684410095215, "global_step": 148910, "epoch": 3545} {"train_loss": -6.765315055847168, "global_step": 148911, "epoch": 3545} {"train_loss": -6.854964256286621, "global_step": 148912, "epoch": 3545} {"train_loss": -6.6985273361206055, "global_step": 148913, "epoch": 3545} {"train_loss": -6.879966735839844, "global_step": 148914, "epoch": 3545} {"train_loss": -6.755192756652832, "global_step": 148915, "epoch": 3545} {"train_loss": -6.766826629638672, "global_step": 148916, "epoch": 3545} {"train_loss": -6.900338172912598, "global_step": 148917, "epoch": 3545} {"train_loss": -6.879071235656738, "global_step": 148918, "epoch": 3545} {"train_loss": -6.758457660675049, "global_step": 148919, "epoch": 3545} {"train_loss": -6.803235054016113, "global_step": 148920, "epoch": 3545} {"train_loss": -6.907877445220947, "global_step": 148921, "epoch": 3545} {"train_loss": -6.736113548278809, "global_step": 148922, "epoch": 3545} {"train_loss": -6.856213092803955, "global_step": 148923, "epoch": 3545} {"train_loss": -6.747933387756348, "global_step": 148924, "epoch": 3545} {"train_loss": -6.8782172203063965, "global_step": 148925, "epoch": 3545} {"train_loss": -6.859908580780029, "global_step": 148926, "epoch": 3545} {"train_loss": -6.786561012268066, "global_step": 148927, "epoch": 3545} {"train_loss": -6.828334331512451, "global_step": 148928, "epoch": 3545} {"train_loss": -6.7401885986328125, "global_step": 148929, "epoch": 3545} {"train_loss": -6.868239402770996, "global_step": 148930, "epoch": 3545} {"train_loss": -6.834338244937715, "global_step": 148931, "epoch": 3545, "val_loss": 78969.734375} {"train_loss": -6.837348937988281, "global_step": 148932, "epoch": 3546} {"train_loss": -6.873800277709961, "global_step": 148933, "epoch": 3546} {"train_loss": -6.801632881164551, "global_step": 148934, "epoch": 3546} {"train_loss": -6.750572681427002, "global_step": 148935, "epoch": 3546} {"train_loss": -6.8375420570373535, "global_step": 148936, "epoch": 3546} {"train_loss": -6.810608863830566, "global_step": 148937, "epoch": 3546} {"train_loss": -6.850135803222656, "global_step": 148938, "epoch": 3546} {"train_loss": -6.831362247467041, "global_step": 148939, "epoch": 3546} {"train_loss": -6.813896179199219, "global_step": 148940, "epoch": 3546} {"train_loss": -6.797739505767822, "global_step": 148941, "epoch": 3546} {"train_loss": -6.933650970458984, "global_step": 148942, "epoch": 3546} {"train_loss": -6.920514106750488, "global_step": 148943, "epoch": 3546} {"train_loss": -6.797393798828125, "global_step": 148944, "epoch": 3546} {"train_loss": -6.814377307891846, "global_step": 148945, "epoch": 3546} {"train_loss": -6.758134841918945, "global_step": 148946, "epoch": 3546} {"train_loss": -6.884310722351074, "global_step": 148947, "epoch": 3546} {"train_loss": -6.792299747467041, "global_step": 148948, "epoch": 3546} {"train_loss": -6.900457859039307, "global_step": 148949, "epoch": 3546} {"train_loss": -6.8024139404296875, "global_step": 148950, "epoch": 3546} {"train_loss": -6.983948707580566, "global_step": 148951, "epoch": 3546} {"train_loss": -6.975090026855469, "global_step": 148952, "epoch": 3546} {"train_loss": -6.98093318939209, "global_step": 148953, "epoch": 3546} {"train_loss": -6.94448709487915, "global_step": 148954, "epoch": 3546} {"train_loss": -6.972845077514648, "global_step": 148955, "epoch": 3546} {"train_loss": -6.832573890686035, "global_step": 148956, "epoch": 3546} {"train_loss": -6.914943695068359, "global_step": 148957, "epoch": 3546} {"train_loss": -6.929011344909668, "global_step": 148958, "epoch": 3546} {"train_loss": -6.890498161315918, "global_step": 148959, "epoch": 3546} {"train_loss": -6.872091293334961, "global_step": 148960, "epoch": 3546} {"train_loss": -6.971656799316406, "global_step": 148961, "epoch": 3546} {"train_loss": -6.890744686126709, "global_step": 148962, "epoch": 3546} {"train_loss": -6.882798671722412, "global_step": 148963, "epoch": 3546} {"train_loss": -6.825639724731445, "global_step": 148964, "epoch": 3546} {"train_loss": -6.994379043579102, "global_step": 148965, "epoch": 3546} {"train_loss": -7.017998695373535, "global_step": 148966, "epoch": 3546} {"train_loss": -6.984949111938477, "global_step": 148967, "epoch": 3546} {"train_loss": -6.903091907501221, "global_step": 148968, "epoch": 3546} {"train_loss": -6.763919830322266, "global_step": 148969, "epoch": 3546} {"train_loss": -6.898509502410889, "global_step": 148970, "epoch": 3546} {"train_loss": -6.91286563873291, "global_step": 148971, "epoch": 3546} {"train_loss": -6.836429119110107, "global_step": 148972, "epoch": 3546} {"train_loss": -6.880465235028948, "global_step": 148973, "epoch": 3546, "val_loss": 78909.875} {"train_loss": -6.905797004699707, "global_step": 148974, "epoch": 3547} {"train_loss": -6.779896259307861, "global_step": 148975, "epoch": 3547} {"train_loss": -6.897997856140137, "global_step": 148976, "epoch": 3547} {"train_loss": -6.952157497406006, "global_step": 148977, "epoch": 3547} {"train_loss": -6.802951335906982, "global_step": 148978, "epoch": 3547} {"train_loss": -6.987314701080322, "global_step": 148979, "epoch": 3547} {"train_loss": -6.925503730773926, "global_step": 148980, "epoch": 3547} {"train_loss": -6.880755424499512, "global_step": 148981, "epoch": 3547} {"train_loss": -6.890740394592285, "global_step": 148982, "epoch": 3547} {"train_loss": -6.777528285980225, "global_step": 148983, "epoch": 3547} {"train_loss": -6.861687183380127, "global_step": 148984, "epoch": 3547} {"train_loss": -6.920709609985352, "global_step": 148985, "epoch": 3547} {"train_loss": -6.89334774017334, "global_step": 148986, "epoch": 3547} {"train_loss": -6.88893985748291, "global_step": 148987, "epoch": 3547} {"train_loss": -6.949420928955078, "global_step": 148988, "epoch": 3547} {"train_loss": -6.863808631896973, "global_step": 148989, "epoch": 3547} {"train_loss": -6.748948097229004, "global_step": 148990, "epoch": 3547} {"train_loss": -6.924684524536133, "global_step": 148991, "epoch": 3547} {"train_loss": -6.856067657470703, "global_step": 148992, "epoch": 3547} {"train_loss": -6.8414812088012695, "global_step": 148993, "epoch": 3547} {"train_loss": -7.020895957946777, "global_step": 148994, "epoch": 3547} {"train_loss": -6.942342758178711, "global_step": 148995, "epoch": 3547} {"train_loss": -6.871402740478516, "global_step": 148996, "epoch": 3547} {"train_loss": -6.872495651245117, "global_step": 148997, "epoch": 3547} {"train_loss": -6.885859489440918, "global_step": 148998, "epoch": 3547} {"train_loss": -6.916098594665527, "global_step": 148999, "epoch": 3547} {"train_loss": -6.908107757568359, "global_step": 149000, "epoch": 3547} {"train_loss": -6.975894927978516, "global_step": 149001, "epoch": 3547} {"train_loss": -6.829310417175293, "global_step": 149002, "epoch": 3547} {"train_loss": -6.770455837249756, "global_step": 149003, "epoch": 3547} {"train_loss": -6.926637172698975, "global_step": 149004, "epoch": 3547} {"train_loss": -6.853900909423828, "global_step": 149005, "epoch": 3547} {"train_loss": -6.877240180969238, "global_step": 149006, "epoch": 3547} {"train_loss": -6.856481552124023, "global_step": 149007, "epoch": 3547} {"train_loss": -6.750882148742676, "global_step": 149008, "epoch": 3547} {"train_loss": -6.74163818359375, "global_step": 149009, "epoch": 3547} {"train_loss": -6.832131385803223, "global_step": 149010, "epoch": 3547} {"train_loss": -6.796645164489746, "global_step": 149011, "epoch": 3547} {"train_loss": -6.699467182159424, "global_step": 149012, "epoch": 3547} {"train_loss": -6.84995174407959, "global_step": 149013, "epoch": 3547} {"train_loss": -6.726330757141113, "global_step": 149014, "epoch": 3547} {"train_loss": -6.864674386524019, "global_step": 149015, "epoch": 3547, "val_loss": 78600.2109375} {"train_loss": -6.857795715332031, "global_step": 149016, "epoch": 3548} {"train_loss": -6.8567328453063965, "global_step": 149017, "epoch": 3548} {"train_loss": -6.771636009216309, "global_step": 149018, "epoch": 3548} {"train_loss": -6.866976737976074, "global_step": 149019, "epoch": 3548} {"train_loss": -6.765340805053711, "global_step": 149020, "epoch": 3548} {"train_loss": -6.742697238922119, "global_step": 149021, "epoch": 3548} {"train_loss": -6.8302412033081055, "global_step": 149022, "epoch": 3548} {"train_loss": -6.746230125427246, "global_step": 149023, "epoch": 3548} {"train_loss": -6.818857669830322, "global_step": 149024, "epoch": 3548} {"train_loss": -6.817365646362305, "global_step": 149025, "epoch": 3548} {"train_loss": -6.8022050857543945, "global_step": 149026, "epoch": 3548} {"train_loss": -6.6855974197387695, "global_step": 149027, "epoch": 3548} {"train_loss": -6.861651420593262, "global_step": 149028, "epoch": 3548} {"train_loss": -6.756047248840332, "global_step": 149029, "epoch": 3548} {"train_loss": -6.848154067993164, "global_step": 149030, "epoch": 3548} {"train_loss": -6.810552597045898, "global_step": 149031, "epoch": 3548} {"train_loss": -6.603833198547363, "global_step": 149032, "epoch": 3548} {"train_loss": -6.901951789855957, "global_step": 149033, "epoch": 3548} {"train_loss": -6.693821430206299, "global_step": 149034, "epoch": 3548} {"train_loss": -6.826987266540527, "global_step": 149035, "epoch": 3548} {"train_loss": -6.6886162757873535, "global_step": 149036, "epoch": 3548} {"train_loss": -6.9303131103515625, "global_step": 149037, "epoch": 3548} {"train_loss": -6.784151077270508, "global_step": 149038, "epoch": 3548} {"train_loss": -6.775327682495117, "global_step": 149039, "epoch": 3548} {"train_loss": -6.878408432006836, "global_step": 149040, "epoch": 3548} {"train_loss": -6.739732265472412, "global_step": 149041, "epoch": 3548} {"train_loss": -6.833436012268066, "global_step": 149042, "epoch": 3548} {"train_loss": -6.796529769897461, "global_step": 149043, "epoch": 3548} {"train_loss": -6.788617134094238, "global_step": 149044, "epoch": 3548} {"train_loss": -6.801689147949219, "global_step": 149045, "epoch": 3548} {"train_loss": -6.777915954589844, "global_step": 149046, "epoch": 3548} {"train_loss": -6.718888282775879, "global_step": 149047, "epoch": 3548} {"train_loss": -6.772058486938477, "global_step": 149048, "epoch": 3548} {"train_loss": -6.715421199798584, "global_step": 149049, "epoch": 3548} {"train_loss": -6.622720241546631, "global_step": 149050, "epoch": 3548} {"train_loss": -6.924555778503418, "global_step": 149051, "epoch": 3548} {"train_loss": -6.684243202209473, "global_step": 149052, "epoch": 3548} {"train_loss": -6.7768096923828125, "global_step": 149053, "epoch": 3548} {"train_loss": -6.8652801513671875, "global_step": 149054, "epoch": 3548} {"train_loss": -6.896204948425293, "global_step": 149055, "epoch": 3548} {"train_loss": -6.828858375549316, "global_step": 149056, "epoch": 3548} {"train_loss": -6.790315775644212, "global_step": 149057, "epoch": 3548, "val_loss": 78821.8984375} {"train_loss": -6.869295120239258, "global_step": 149058, "epoch": 3549} {"train_loss": -6.780193328857422, "global_step": 149059, "epoch": 3549} {"train_loss": -6.809181213378906, "global_step": 149060, "epoch": 3549} {"train_loss": -6.770376205444336, "global_step": 149061, "epoch": 3549} {"train_loss": -6.7777605056762695, "global_step": 149062, "epoch": 3549} {"train_loss": -6.832461357116699, "global_step": 149063, "epoch": 3549} {"train_loss": -6.84511137008667, "global_step": 149064, "epoch": 3549} {"train_loss": -6.828929424285889, "global_step": 149065, "epoch": 3549} {"train_loss": -6.706047534942627, "global_step": 149066, "epoch": 3549} {"train_loss": -6.867708206176758, "global_step": 149067, "epoch": 3549} {"train_loss": -6.879478931427002, "global_step": 149068, "epoch": 3549} {"train_loss": -6.828188896179199, "global_step": 149069, "epoch": 3549} {"train_loss": -6.861888408660889, "global_step": 149070, "epoch": 3549} {"train_loss": -6.938773155212402, "global_step": 149071, "epoch": 3549} {"train_loss": -6.866972923278809, "global_step": 149072, "epoch": 3549} {"train_loss": -6.865273475646973, "global_step": 149073, "epoch": 3549} {"train_loss": -6.712967872619629, "global_step": 149074, "epoch": 3549} {"train_loss": -6.837236404418945, "global_step": 149075, "epoch": 3549} {"train_loss": -6.83994722366333, "global_step": 149076, "epoch": 3549} {"train_loss": -6.843017578125, "global_step": 149077, "epoch": 3549} {"train_loss": -6.950340747833252, "global_step": 149078, "epoch": 3549} {"train_loss": -6.864918231964111, "global_step": 149079, "epoch": 3549} {"train_loss": -6.859688758850098, "global_step": 149080, "epoch": 3549} {"train_loss": -6.8347368240356445, "global_step": 149081, "epoch": 3549} {"train_loss": -6.883675575256348, "global_step": 149082, "epoch": 3549} {"train_loss": -6.845548152923584, "global_step": 149083, "epoch": 3549} {"train_loss": -6.839130401611328, "global_step": 149084, "epoch": 3549} {"train_loss": -6.901857376098633, "global_step": 149085, "epoch": 3549} {"train_loss": -6.8827691078186035, "global_step": 149086, "epoch": 3549} {"train_loss": -6.800273895263672, "global_step": 149087, "epoch": 3549} {"train_loss": -6.760045051574707, "global_step": 149088, "epoch": 3549} {"train_loss": -6.858802795410156, "global_step": 149089, "epoch": 3549} {"train_loss": -6.715129375457764, "global_step": 149090, "epoch": 3549} {"train_loss": -6.832736492156982, "global_step": 149091, "epoch": 3549} {"train_loss": -6.826970100402832, "global_step": 149092, "epoch": 3549} {"train_loss": -6.743518829345703, "global_step": 149093, "epoch": 3549} {"train_loss": -6.823939323425293, "global_step": 149094, "epoch": 3549} {"train_loss": -6.746334075927734, "global_step": 149095, "epoch": 3549} {"train_loss": -6.80640983581543, "global_step": 149096, "epoch": 3549} {"train_loss": -6.8397932052612305, "global_step": 149097, "epoch": 3549} {"train_loss": -6.818301677703857, "global_step": 149098, "epoch": 3549} {"train_loss": -6.828156743730817, "global_step": 149099, "epoch": 3549, "val_loss": 78729.375} {"train_loss": -6.867822647094727, "global_step": 149100, "epoch": 3550} {"train_loss": -6.786007404327393, "global_step": 149101, "epoch": 3550} {"train_loss": -6.9759721755981445, "global_step": 149102, "epoch": 3550} {"train_loss": -6.8545002937316895, "global_step": 149103, "epoch": 3550} {"train_loss": -6.938952445983887, "global_step": 149104, "epoch": 3550} {"train_loss": -6.75731086730957, "global_step": 149105, "epoch": 3550} {"train_loss": -6.870769500732422, "global_step": 149106, "epoch": 3550} {"train_loss": -6.892172336578369, "global_step": 149107, "epoch": 3550} {"train_loss": -6.909632205963135, "global_step": 149108, "epoch": 3550} {"train_loss": -6.976295471191406, "global_step": 149109, "epoch": 3550} {"train_loss": -6.936736583709717, "global_step": 149110, "epoch": 3550} {"train_loss": -6.934330940246582, "global_step": 149111, "epoch": 3550} {"train_loss": -6.959543228149414, "global_step": 149112, "epoch": 3550} {"train_loss": -6.8484086990356445, "global_step": 149113, "epoch": 3550} {"train_loss": -7.002318382263184, "global_step": 149114, "epoch": 3550} {"train_loss": -6.997365951538086, "global_step": 149115, "epoch": 3550} {"train_loss": -6.956382751464844, "global_step": 149116, "epoch": 3550} {"train_loss": -6.97678279876709, "global_step": 149117, "epoch": 3550} {"train_loss": -6.937475681304932, "global_step": 149118, "epoch": 3550} {"train_loss": -6.853494167327881, "global_step": 149119, "epoch": 3550} {"train_loss": -6.956360816955566, "global_step": 149120, "epoch": 3550} {"train_loss": -6.811325550079346, "global_step": 149121, "epoch": 3550} {"train_loss": -6.7423224449157715, "global_step": 149122, "epoch": 3550} {"train_loss": -6.711403846740723, "global_step": 149123, "epoch": 3550} {"train_loss": -6.940600395202637, "global_step": 149124, "epoch": 3550} {"train_loss": -6.785157680511475, "global_step": 149125, "epoch": 3550} {"train_loss": -6.911963939666748, "global_step": 149126, "epoch": 3550} {"train_loss": -6.926326751708984, "global_step": 149127, "epoch": 3550} {"train_loss": -6.834905624389648, "global_step": 149128, "epoch": 3550} {"train_loss": -6.6772966384887695, "global_step": 149129, "epoch": 3550} {"train_loss": -6.852619171142578, "global_step": 149130, "epoch": 3550} {"train_loss": -6.828779697418213, "global_step": 149131, "epoch": 3550} {"train_loss": -6.549687385559082, "global_step": 149132, "epoch": 3550} {"train_loss": -6.663503646850586, "global_step": 149133, "epoch": 3550} {"train_loss": -6.605696201324463, "global_step": 149134, "epoch": 3550} {"train_loss": -6.801461219787598, "global_step": 149135, "epoch": 3550} {"train_loss": -6.721533298492432, "global_step": 149136, "epoch": 3550} {"train_loss": -6.824619293212891, "global_step": 149137, "epoch": 3550} {"train_loss": -6.7731547355651855, "global_step": 149138, "epoch": 3550} {"train_loss": -6.700859069824219, "global_step": 149139, "epoch": 3550} {"train_loss": -6.864143371582031, "global_step": 149140, "epoch": 3550} {"train_loss": -6.844443082809448, "global_step": 149141, "epoch": 3550, "train/sim_max_reward_0": 0.39128708349040875, "train/sim_max_reward_1": 0.5588251495525944, "train/sim_max_reward_2": 0.3474520306575242, "train/sim_max_reward_3": 0.1382410920755088, "train/sim_max_reward_4": 0.9521006807495825, "train/sim_max_reward_5": 0.590787591946162, "test/sim_max_reward_4500000": 0.8534324490776865, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9160715503657475, "test/sim_max_reward_4500003": 0.9702461064499119, "test/sim_max_reward_4500004": 0.18394454412915578, "test/sim_max_reward_4500005": 0.6867660751882366, "test/sim_max_reward_4500006": 0.8605189615829831, "test/sim_max_reward_4500007": 0.9029680709228501, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.05345960344422962, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9028226560253361, "test/sim_max_reward_4500012": 0.8523876836430141, "test/sim_max_reward_4500013": 0.004534939298560809, "test/sim_max_reward_4500014": 0.4211656862167782, "test/sim_max_reward_4500015": 0.467972470218766, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.07761662694227217, "test/sim_max_reward_4500018": 0.971344202796169, "test/sim_max_reward_4500019": 0.39496762743265906, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.7743406178885535, "test/sim_max_reward_4500023": 0.9018825396579541, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.7976189890364181, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.9866133397003238, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.04864087033323357, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04885620390810934, "test/sim_max_reward_4500033": 0.15113649098778403, "test/sim_max_reward_4500034": 0.8752634682553868, "test/sim_max_reward_4500035": 0.8476526203499671, "test/sim_max_reward_4500036": 0.572709054198534, "test/sim_max_reward_4500037": 0.5627810584672277, "test/sim_max_reward_4500038": 0.3174482189564419, "test/sim_max_reward_4500039": 0.0, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.9752599686741626, "test/sim_max_reward_4500042": 0.7589946217407197, "test/sim_max_reward_4500043": 0.17619764904801263, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.5949857500249366, "test/sim_max_reward_4500046": 1.0, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.8836955361386598, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.4964489380786301, "test/mean_score": 0.4804491503410426, "val_loss": 78711.6796875} {"train_loss": -6.788060665130615, "global_step": 149142, "epoch": 3551} {"train_loss": -6.793497085571289, "global_step": 149143, "epoch": 3551} {"train_loss": -6.810657501220703, "global_step": 149144, "epoch": 3551} {"train_loss": -6.807533264160156, "global_step": 149145, "epoch": 3551} {"train_loss": -6.841678142547607, "global_step": 149146, "epoch": 3551} {"train_loss": -6.784836769104004, "global_step": 149147, "epoch": 3551} {"train_loss": -6.845156669616699, "global_step": 149148, "epoch": 3551} {"train_loss": -6.811931610107422, "global_step": 149149, "epoch": 3551} {"train_loss": -6.742035865783691, "global_step": 149150, "epoch": 3551} {"train_loss": -6.824012279510498, "global_step": 149151, "epoch": 3551} {"train_loss": -6.8295111656188965, "global_step": 149152, "epoch": 3551} {"train_loss": -6.559787273406982, "global_step": 149153, "epoch": 3551} {"train_loss": -6.838724136352539, "global_step": 149154, "epoch": 3551} {"train_loss": -6.716503620147705, "global_step": 149155, "epoch": 3551} {"train_loss": -6.762605667114258, "global_step": 149156, "epoch": 3551} {"train_loss": -6.846484184265137, "global_step": 149157, "epoch": 3551} {"train_loss": -6.738975524902344, "global_step": 149158, "epoch": 3551} {"train_loss": -6.809744834899902, "global_step": 149159, "epoch": 3551} {"train_loss": -6.856639862060547, "global_step": 149160, "epoch": 3551} {"train_loss": -6.804595947265625, "global_step": 149161, "epoch": 3551} {"train_loss": -6.7063751220703125, "global_step": 149162, "epoch": 3551} {"train_loss": -6.778776168823242, "global_step": 149163, "epoch": 3551} {"train_loss": -6.814953804016113, "global_step": 149164, "epoch": 3551} {"train_loss": -6.879711627960205, "global_step": 149165, "epoch": 3551} {"train_loss": -6.865508556365967, "global_step": 149166, "epoch": 3551} {"train_loss": -6.779463768005371, "global_step": 149167, "epoch": 3551} {"train_loss": -6.918490886688232, "global_step": 149168, "epoch": 3551} {"train_loss": -6.8587117195129395, "global_step": 149169, "epoch": 3551} {"train_loss": -6.897197723388672, "global_step": 149170, "epoch": 3551} {"train_loss": -6.908756732940674, "global_step": 149171, "epoch": 3551} {"train_loss": -6.936115264892578, "global_step": 149172, "epoch": 3551} {"train_loss": -6.897012233734131, "global_step": 149173, "epoch": 3551} {"train_loss": -6.8225250244140625, "global_step": 149174, "epoch": 3551} {"train_loss": -6.9530534744262695, "global_step": 149175, "epoch": 3551} {"train_loss": -6.827808380126953, "global_step": 149176, "epoch": 3551} {"train_loss": -6.722694396972656, "global_step": 149177, "epoch": 3551} {"train_loss": -6.8959503173828125, "global_step": 149178, "epoch": 3551} {"train_loss": -6.775146484375, "global_step": 149179, "epoch": 3551} {"train_loss": -6.847607612609863, "global_step": 149180, "epoch": 3551} {"train_loss": -6.894965171813965, "global_step": 149181, "epoch": 3551} {"train_loss": -6.903090953826904, "global_step": 149182, "epoch": 3551} {"train_loss": -6.82331911722819, "global_step": 149183, "epoch": 3551, "val_loss": 78784.3828125} {"train_loss": -6.938017845153809, "global_step": 149184, "epoch": 3552} {"train_loss": -6.972647666931152, "global_step": 149185, "epoch": 3552} {"train_loss": -6.93120002746582, "global_step": 149186, "epoch": 3552} {"train_loss": -6.948309898376465, "global_step": 149187, "epoch": 3552} {"train_loss": -6.9206438064575195, "global_step": 149188, "epoch": 3552} {"train_loss": -6.80573844909668, "global_step": 149189, "epoch": 3552} {"train_loss": -6.916512489318848, "global_step": 149190, "epoch": 3552} {"train_loss": -6.818734169006348, "global_step": 149191, "epoch": 3552} {"train_loss": -6.955901622772217, "global_step": 149192, "epoch": 3552} {"train_loss": -6.85594367980957, "global_step": 149193, "epoch": 3552} {"train_loss": -6.935924530029297, "global_step": 149194, "epoch": 3552} {"train_loss": -6.900803565979004, "global_step": 149195, "epoch": 3552} {"train_loss": -6.855847358703613, "global_step": 149196, "epoch": 3552} {"train_loss": -6.854371547698975, "global_step": 149197, "epoch": 3552} {"train_loss": -6.742504596710205, "global_step": 149198, "epoch": 3552} {"train_loss": -6.864249229431152, "global_step": 149199, "epoch": 3552} {"train_loss": -6.800083160400391, "global_step": 149200, "epoch": 3552} {"train_loss": -6.7254319190979, "global_step": 149201, "epoch": 3552} {"train_loss": -6.858713150024414, "global_step": 149202, "epoch": 3552} {"train_loss": -6.832131385803223, "global_step": 149203, "epoch": 3552} {"train_loss": -6.838472843170166, "global_step": 149204, "epoch": 3552} {"train_loss": -6.8836259841918945, "global_step": 149205, "epoch": 3552} {"train_loss": -6.803434371948242, "global_step": 149206, "epoch": 3552} {"train_loss": -6.918779373168945, "global_step": 149207, "epoch": 3552} {"train_loss": -6.874706268310547, "global_step": 149208, "epoch": 3552} {"train_loss": -6.874536037445068, "global_step": 149209, "epoch": 3552} {"train_loss": -6.909965515136719, "global_step": 149210, "epoch": 3552} {"train_loss": -6.799770832061768, "global_step": 149211, "epoch": 3552} {"train_loss": -6.779816150665283, "global_step": 149212, "epoch": 3552} {"train_loss": -6.860944747924805, "global_step": 149213, "epoch": 3552} {"train_loss": -6.931822776794434, "global_step": 149214, "epoch": 3552} {"train_loss": -6.894772052764893, "global_step": 149215, "epoch": 3552} {"train_loss": -6.8707804679870605, "global_step": 149216, "epoch": 3552} {"train_loss": -6.967728614807129, "global_step": 149217, "epoch": 3552} {"train_loss": -6.956575393676758, "global_step": 149218, "epoch": 3552} {"train_loss": -6.9383931159973145, "global_step": 149219, "epoch": 3552} {"train_loss": -6.826749801635742, "global_step": 149220, "epoch": 3552} {"train_loss": -6.817810535430908, "global_step": 149221, "epoch": 3552} {"train_loss": -6.80181884765625, "global_step": 149222, "epoch": 3552} {"train_loss": -6.8537774085998535, "global_step": 149223, "epoch": 3552} {"train_loss": -6.8736162185668945, "global_step": 149224, "epoch": 3552} {"train_loss": -6.87126628557841, "global_step": 149225, "epoch": 3552, "val_loss": 78619.03125} {"train_loss": -6.777359962463379, "global_step": 149226, "epoch": 3553} {"train_loss": -6.753658294677734, "global_step": 149227, "epoch": 3553} {"train_loss": -6.812647342681885, "global_step": 149228, "epoch": 3553} {"train_loss": -6.804762840270996, "global_step": 149229, "epoch": 3553} {"train_loss": -6.827615737915039, "global_step": 149230, "epoch": 3553} {"train_loss": -6.766238212585449, "global_step": 149231, "epoch": 3553} {"train_loss": -6.82283353805542, "global_step": 149232, "epoch": 3553} {"train_loss": -6.8427734375, "global_step": 149233, "epoch": 3553} {"train_loss": -6.929908752441406, "global_step": 149234, "epoch": 3553} {"train_loss": -6.845690727233887, "global_step": 149235, "epoch": 3553} {"train_loss": -6.9071455001831055, "global_step": 149236, "epoch": 3553} {"train_loss": -6.967532157897949, "global_step": 149237, "epoch": 3553} {"train_loss": -6.870511054992676, "global_step": 149238, "epoch": 3553} {"train_loss": -6.827492713928223, "global_step": 149239, "epoch": 3553} {"train_loss": -6.9097466468811035, "global_step": 149240, "epoch": 3553} {"train_loss": -6.81840181350708, "global_step": 149241, "epoch": 3553} {"train_loss": -7.036091327667236, "global_step": 149242, "epoch": 3553} {"train_loss": -6.98988676071167, "global_step": 149243, "epoch": 3553} {"train_loss": -6.802881240844727, "global_step": 149244, "epoch": 3553} {"train_loss": -6.819135665893555, "global_step": 149245, "epoch": 3553} {"train_loss": -6.996779441833496, "global_step": 149246, "epoch": 3553} {"train_loss": -6.887664794921875, "global_step": 149247, "epoch": 3553} {"train_loss": -6.860278129577637, "global_step": 149248, "epoch": 3553} {"train_loss": -6.823180198669434, "global_step": 149249, "epoch": 3553} {"train_loss": -6.739468574523926, "global_step": 149250, "epoch": 3553} {"train_loss": -6.714236259460449, "global_step": 149251, "epoch": 3553} {"train_loss": -6.867921829223633, "global_step": 149252, "epoch": 3553} {"train_loss": -6.770430564880371, "global_step": 149253, "epoch": 3553} {"train_loss": -6.673581123352051, "global_step": 149254, "epoch": 3553} {"train_loss": -6.811801910400391, "global_step": 149255, "epoch": 3553} {"train_loss": -6.807516098022461, "global_step": 149256, "epoch": 3553} {"train_loss": -6.823486328125, "global_step": 149257, "epoch": 3553} {"train_loss": -6.694364070892334, "global_step": 149258, "epoch": 3553} {"train_loss": -6.799133777618408, "global_step": 149259, "epoch": 3553} {"train_loss": -6.806761741638184, "global_step": 149260, "epoch": 3553} {"train_loss": -6.882172107696533, "global_step": 149261, "epoch": 3553} {"train_loss": -6.928075790405273, "global_step": 149262, "epoch": 3553} {"train_loss": -6.754854202270508, "global_step": 149263, "epoch": 3553} {"train_loss": -6.867993354797363, "global_step": 149264, "epoch": 3553} {"train_loss": -6.6899614334106445, "global_step": 149265, "epoch": 3553} {"train_loss": -6.835456371307373, "global_step": 149266, "epoch": 3553} {"train_loss": -6.835158620561872, "global_step": 149267, "epoch": 3553, "val_loss": 78997.3359375} {"train_loss": -6.817678451538086, "global_step": 149268, "epoch": 3554} {"train_loss": -6.9584856033325195, "global_step": 149269, "epoch": 3554} {"train_loss": -6.923989295959473, "global_step": 149270, "epoch": 3554} {"train_loss": -6.963928699493408, "global_step": 149271, "epoch": 3554} {"train_loss": -6.803956985473633, "global_step": 149272, "epoch": 3554} {"train_loss": -6.946453094482422, "global_step": 149273, "epoch": 3554} {"train_loss": -6.771244525909424, "global_step": 149274, "epoch": 3554} {"train_loss": -6.8999223709106445, "global_step": 149275, "epoch": 3554} {"train_loss": -6.92213773727417, "global_step": 149276, "epoch": 3554} {"train_loss": -6.914925575256348, "global_step": 149277, "epoch": 3554} {"train_loss": -6.900008201599121, "global_step": 149278, "epoch": 3554} {"train_loss": -6.825520992279053, "global_step": 149279, "epoch": 3554} {"train_loss": -6.943325519561768, "global_step": 149280, "epoch": 3554} {"train_loss": -6.961698532104492, "global_step": 149281, "epoch": 3554} {"train_loss": -6.756842613220215, "global_step": 149282, "epoch": 3554} {"train_loss": -6.811063766479492, "global_step": 149283, "epoch": 3554} {"train_loss": -6.8502631187438965, "global_step": 149284, "epoch": 3554} {"train_loss": -6.8115386962890625, "global_step": 149285, "epoch": 3554} {"train_loss": -6.841286659240723, "global_step": 149286, "epoch": 3554} {"train_loss": -6.9655656814575195, "global_step": 149287, "epoch": 3554} {"train_loss": -6.899529457092285, "global_step": 149288, "epoch": 3554} {"train_loss": -7.05055046081543, "global_step": 149289, "epoch": 3554} {"train_loss": -6.846584320068359, "global_step": 149290, "epoch": 3554} {"train_loss": -6.840787410736084, "global_step": 149291, "epoch": 3554} {"train_loss": -6.850222110748291, "global_step": 149292, "epoch": 3554} {"train_loss": -6.791029930114746, "global_step": 149293, "epoch": 3554} {"train_loss": -6.9092607498168945, "global_step": 149294, "epoch": 3554} {"train_loss": -6.862142562866211, "global_step": 149295, "epoch": 3554} {"train_loss": -6.89748477935791, "global_step": 149296, "epoch": 3554} {"train_loss": -6.822113513946533, "global_step": 149297, "epoch": 3554} {"train_loss": -6.814618110656738, "global_step": 149298, "epoch": 3554} {"train_loss": -6.83681583404541, "global_step": 149299, "epoch": 3554} {"train_loss": -6.949403762817383, "global_step": 149300, "epoch": 3554} {"train_loss": -6.829129219055176, "global_step": 149301, "epoch": 3554} {"train_loss": -6.948392868041992, "global_step": 149302, "epoch": 3554} {"train_loss": -6.925712585449219, "global_step": 149303, "epoch": 3554} {"train_loss": -6.769871711730957, "global_step": 149304, "epoch": 3554} {"train_loss": -6.915214538574219, "global_step": 149305, "epoch": 3554} {"train_loss": -6.951559543609619, "global_step": 149306, "epoch": 3554} {"train_loss": -6.849330425262451, "global_step": 149307, "epoch": 3554} {"train_loss": -6.959899425506592, "global_step": 149308, "epoch": 3554} {"train_loss": -6.88038284437997, "global_step": 149309, "epoch": 3554, "val_loss": 78644.0390625} {"train_loss": -6.897083759307861, "global_step": 149310, "epoch": 3555} {"train_loss": -6.887977123260498, "global_step": 149311, "epoch": 3555} {"train_loss": -6.819741249084473, "global_step": 149312, "epoch": 3555} {"train_loss": -6.937274932861328, "global_step": 149313, "epoch": 3555} {"train_loss": -6.856866836547852, "global_step": 149314, "epoch": 3555} {"train_loss": -6.867263317108154, "global_step": 149315, "epoch": 3555} {"train_loss": -6.804211139678955, "global_step": 149316, "epoch": 3555} {"train_loss": -6.8608598709106445, "global_step": 149317, "epoch": 3555} {"train_loss": -6.825103759765625, "global_step": 149318, "epoch": 3555} {"train_loss": -6.885019302368164, "global_step": 149319, "epoch": 3555} {"train_loss": -6.85630464553833, "global_step": 149320, "epoch": 3555} {"train_loss": -6.805181503295898, "global_step": 149321, "epoch": 3555} {"train_loss": -6.701136112213135, "global_step": 149322, "epoch": 3555} {"train_loss": -6.8330583572387695, "global_step": 149323, "epoch": 3555} {"train_loss": -6.8162994384765625, "global_step": 149324, "epoch": 3555} {"train_loss": -6.829350471496582, "global_step": 149325, "epoch": 3555} {"train_loss": -6.902048110961914, "global_step": 149326, "epoch": 3555} {"train_loss": -6.821842193603516, "global_step": 149327, "epoch": 3555} {"train_loss": -6.869450569152832, "global_step": 149328, "epoch": 3555} {"train_loss": -6.8165388107299805, "global_step": 149329, "epoch": 3555} {"train_loss": -6.899261474609375, "global_step": 149330, "epoch": 3555} {"train_loss": -6.787055015563965, "global_step": 149331, "epoch": 3555} {"train_loss": -6.743552207946777, "global_step": 149332, "epoch": 3555} {"train_loss": -6.94256067276001, "global_step": 149333, "epoch": 3555} {"train_loss": -6.599190711975098, "global_step": 149334, "epoch": 3555} {"train_loss": -6.767592430114746, "global_step": 149335, "epoch": 3555} {"train_loss": -6.581701278686523, "global_step": 149336, "epoch": 3555} {"train_loss": -6.838929653167725, "global_step": 149337, "epoch": 3555} {"train_loss": -6.741208553314209, "global_step": 149338, "epoch": 3555} {"train_loss": -6.611667156219482, "global_step": 149339, "epoch": 3555} {"train_loss": -6.783679008483887, "global_step": 149340, "epoch": 3555} {"train_loss": -6.653298854827881, "global_step": 149341, "epoch": 3555} {"train_loss": -6.86611795425415, "global_step": 149342, "epoch": 3555} {"train_loss": -6.783633232116699, "global_step": 149343, "epoch": 3555} {"train_loss": -6.770452499389648, "global_step": 149344, "epoch": 3555} {"train_loss": -6.71510648727417, "global_step": 149345, "epoch": 3555} {"train_loss": -6.875893592834473, "global_step": 149346, "epoch": 3555} {"train_loss": -6.822029113769531, "global_step": 149347, "epoch": 3555} {"train_loss": -6.753264427185059, "global_step": 149348, "epoch": 3555} {"train_loss": -6.7634782791137695, "global_step": 149349, "epoch": 3555} {"train_loss": -6.7710418701171875, "global_step": 149350, "epoch": 3555} {"train_loss": -6.804626010713124, "global_step": 149351, "epoch": 3555, "val_loss": 78663.75} {"train_loss": -6.90817403793335, "global_step": 149352, "epoch": 3556} {"train_loss": -6.851940155029297, "global_step": 149353, "epoch": 3556} {"train_loss": -6.928158760070801, "global_step": 149354, "epoch": 3556} {"train_loss": -6.883831977844238, "global_step": 149355, "epoch": 3556} {"train_loss": -6.833776473999023, "global_step": 149356, "epoch": 3556} {"train_loss": -6.750511169433594, "global_step": 149357, "epoch": 3556} {"train_loss": -6.912576675415039, "global_step": 149358, "epoch": 3556} {"train_loss": -6.8717241287231445, "global_step": 149359, "epoch": 3556} {"train_loss": -6.788145065307617, "global_step": 149360, "epoch": 3556} {"train_loss": -6.84592342376709, "global_step": 149361, "epoch": 3556} {"train_loss": -6.819859504699707, "global_step": 149362, "epoch": 3556} {"train_loss": -6.821853160858154, "global_step": 149363, "epoch": 3556} {"train_loss": -6.777309417724609, "global_step": 149364, "epoch": 3556} {"train_loss": -6.763216495513916, "global_step": 149365, "epoch": 3556} {"train_loss": -6.724386215209961, "global_step": 149366, "epoch": 3556} {"train_loss": -6.848188400268555, "global_step": 149367, "epoch": 3556} {"train_loss": -6.808468818664551, "global_step": 149368, "epoch": 3556} {"train_loss": -6.800376892089844, "global_step": 149369, "epoch": 3556} {"train_loss": -6.804228782653809, "global_step": 149370, "epoch": 3556} {"train_loss": -6.591310501098633, "global_step": 149371, "epoch": 3556} {"train_loss": -6.874587535858154, "global_step": 149372, "epoch": 3556} {"train_loss": -6.812479496002197, "global_step": 149373, "epoch": 3556} {"train_loss": -6.663311004638672, "global_step": 149374, "epoch": 3556} {"train_loss": -6.869421482086182, "global_step": 149375, "epoch": 3556} {"train_loss": -6.8475446701049805, "global_step": 149376, "epoch": 3556} {"train_loss": -6.876412868499756, "global_step": 149377, "epoch": 3556} {"train_loss": -6.748766899108887, "global_step": 149378, "epoch": 3556} {"train_loss": -6.58255672454834, "global_step": 149379, "epoch": 3556} {"train_loss": -6.801750183105469, "global_step": 149380, "epoch": 3556} {"train_loss": -6.952915668487549, "global_step": 149381, "epoch": 3556} {"train_loss": -6.867530345916748, "global_step": 149382, "epoch": 3556} {"train_loss": -6.886814117431641, "global_step": 149383, "epoch": 3556} {"train_loss": -6.767556190490723, "global_step": 149384, "epoch": 3556} {"train_loss": -6.878167152404785, "global_step": 149385, "epoch": 3556} {"train_loss": -6.884197235107422, "global_step": 149386, "epoch": 3556} {"train_loss": -6.848051071166992, "global_step": 149387, "epoch": 3556} {"train_loss": -6.930995941162109, "global_step": 149388, "epoch": 3556} {"train_loss": -6.7083892822265625, "global_step": 149389, "epoch": 3556} {"train_loss": -6.8975300788879395, "global_step": 149390, "epoch": 3556} {"train_loss": -6.839542388916016, "global_step": 149391, "epoch": 3556} {"train_loss": -6.849508285522461, "global_step": 149392, "epoch": 3556} {"train_loss": -6.823662780580067, "global_step": 149393, "epoch": 3556, "val_loss": 78710.765625} {"train_loss": -6.874914169311523, "global_step": 149394, "epoch": 3557} {"train_loss": -6.9904046058654785, "global_step": 149395, "epoch": 3557} {"train_loss": -6.795519828796387, "global_step": 149396, "epoch": 3557} {"train_loss": -6.928012371063232, "global_step": 149397, "epoch": 3557} {"train_loss": -6.794203758239746, "global_step": 149398, "epoch": 3557} {"train_loss": -6.904836654663086, "global_step": 149399, "epoch": 3557} {"train_loss": -6.795140266418457, "global_step": 149400, "epoch": 3557} {"train_loss": -6.809024333953857, "global_step": 149401, "epoch": 3557} {"train_loss": -6.852880001068115, "global_step": 149402, "epoch": 3557} {"train_loss": -6.714700698852539, "global_step": 149403, "epoch": 3557} {"train_loss": -6.8956298828125, "global_step": 149404, "epoch": 3557} {"train_loss": -6.910574436187744, "global_step": 149405, "epoch": 3557} {"train_loss": -6.770480155944824, "global_step": 149406, "epoch": 3557} {"train_loss": -6.6985578536987305, "global_step": 149407, "epoch": 3557} {"train_loss": -6.847038269042969, "global_step": 149408, "epoch": 3557} {"train_loss": -6.785646915435791, "global_step": 149409, "epoch": 3557} {"train_loss": -6.746338367462158, "global_step": 149410, "epoch": 3557} {"train_loss": -6.8063554763793945, "global_step": 149411, "epoch": 3557} {"train_loss": -6.830113410949707, "global_step": 149412, "epoch": 3557} {"train_loss": -6.672507286071777, "global_step": 149413, "epoch": 3557} {"train_loss": -6.865509986877441, "global_step": 149414, "epoch": 3557} {"train_loss": -6.86619758605957, "global_step": 149415, "epoch": 3557} {"train_loss": -6.86814546585083, "global_step": 149416, "epoch": 3557} {"train_loss": -6.860894680023193, "global_step": 149417, "epoch": 3557} {"train_loss": -6.74684476852417, "global_step": 149418, "epoch": 3557} {"train_loss": -6.800113677978516, "global_step": 149419, "epoch": 3557} {"train_loss": -6.837893486022949, "global_step": 149420, "epoch": 3557} {"train_loss": -6.81484317779541, "global_step": 149421, "epoch": 3557} {"train_loss": -6.816853046417236, "global_step": 149422, "epoch": 3557} {"train_loss": -6.732888698577881, "global_step": 149423, "epoch": 3557} {"train_loss": -6.550252914428711, "global_step": 149424, "epoch": 3557} {"train_loss": -6.580568790435791, "global_step": 149425, "epoch": 3557} {"train_loss": -6.775712490081787, "global_step": 149426, "epoch": 3557} {"train_loss": -6.645588397979736, "global_step": 149427, "epoch": 3557} {"train_loss": -6.707538604736328, "global_step": 149428, "epoch": 3557} {"train_loss": -6.66141939163208, "global_step": 149429, "epoch": 3557} {"train_loss": -6.791412353515625, "global_step": 149430, "epoch": 3557} {"train_loss": -6.816080093383789, "global_step": 149431, "epoch": 3557} {"train_loss": -6.684255123138428, "global_step": 149432, "epoch": 3557} {"train_loss": -6.723481178283691, "global_step": 149433, "epoch": 3557} {"train_loss": -6.746696949005127, "global_step": 149434, "epoch": 3557} {"train_loss": -6.786071345919654, "global_step": 149435, "epoch": 3557, "val_loss": 79194.1015625} {"train_loss": -6.739094257354736, "global_step": 149436, "epoch": 3558} {"train_loss": -6.782923698425293, "global_step": 149437, "epoch": 3558} {"train_loss": -6.809919357299805, "global_step": 149438, "epoch": 3558} {"train_loss": -6.8667707443237305, "global_step": 149439, "epoch": 3558} {"train_loss": -6.73834753036499, "global_step": 149440, "epoch": 3558} {"train_loss": -6.790650367736816, "global_step": 149441, "epoch": 3558} {"train_loss": -6.690150260925293, "global_step": 149442, "epoch": 3558} {"train_loss": -6.757224082946777, "global_step": 149443, "epoch": 3558} {"train_loss": -6.7083635330200195, "global_step": 149444, "epoch": 3558} {"train_loss": -6.904955863952637, "global_step": 149445, "epoch": 3558} {"train_loss": -6.62689208984375, "global_step": 149446, "epoch": 3558} {"train_loss": -6.666018009185791, "global_step": 149447, "epoch": 3558} {"train_loss": -6.822394371032715, "global_step": 149448, "epoch": 3558} {"train_loss": -6.720431327819824, "global_step": 149449, "epoch": 3558} {"train_loss": -6.749178886413574, "global_step": 149450, "epoch": 3558} {"train_loss": -6.812607288360596, "global_step": 149451, "epoch": 3558} {"train_loss": -6.931754112243652, "global_step": 149452, "epoch": 3558} {"train_loss": -6.786774158477783, "global_step": 149453, "epoch": 3558} {"train_loss": -6.885169982910156, "global_step": 149454, "epoch": 3558} {"train_loss": -6.948218822479248, "global_step": 149455, "epoch": 3558} {"train_loss": -6.9101057052612305, "global_step": 149456, "epoch": 3558} {"train_loss": -6.863038063049316, "global_step": 149457, "epoch": 3558} {"train_loss": -6.7795586585998535, "global_step": 149458, "epoch": 3558} {"train_loss": -6.830718994140625, "global_step": 149459, "epoch": 3558} {"train_loss": -6.747175693511963, "global_step": 149460, "epoch": 3558} {"train_loss": -6.973945617675781, "global_step": 149461, "epoch": 3558} {"train_loss": -6.900933265686035, "global_step": 149462, "epoch": 3558} {"train_loss": -6.799141883850098, "global_step": 149463, "epoch": 3558} {"train_loss": -6.882786273956299, "global_step": 149464, "epoch": 3558} {"train_loss": -6.828991889953613, "global_step": 149465, "epoch": 3558} {"train_loss": -6.773721218109131, "global_step": 149466, "epoch": 3558} {"train_loss": -6.841525077819824, "global_step": 149467, "epoch": 3558} {"train_loss": -6.86797571182251, "global_step": 149468, "epoch": 3558} {"train_loss": -6.982160568237305, "global_step": 149469, "epoch": 3558} {"train_loss": -6.930057525634766, "global_step": 149470, "epoch": 3558} {"train_loss": -6.892009735107422, "global_step": 149471, "epoch": 3558} {"train_loss": -7.004733085632324, "global_step": 149472, "epoch": 3558} {"train_loss": -6.837143898010254, "global_step": 149473, "epoch": 3558} {"train_loss": -6.841333389282227, "global_step": 149474, "epoch": 3558} {"train_loss": -6.748885154724121, "global_step": 149475, "epoch": 3558} {"train_loss": -6.862622261047363, "global_step": 149476, "epoch": 3558} {"train_loss": -6.827566850753057, "global_step": 149477, "epoch": 3558, "val_loss": 78526.3984375} {"train_loss": -6.892534255981445, "global_step": 149478, "epoch": 3559} {"train_loss": -6.947101593017578, "global_step": 149479, "epoch": 3559} {"train_loss": -6.938045501708984, "global_step": 149480, "epoch": 3559} {"train_loss": -6.953361988067627, "global_step": 149481, "epoch": 3559} {"train_loss": -6.869030952453613, "global_step": 149482, "epoch": 3559} {"train_loss": -7.050106048583984, "global_step": 149483, "epoch": 3559} {"train_loss": -6.958629608154297, "global_step": 149484, "epoch": 3559} {"train_loss": -6.794068336486816, "global_step": 149485, "epoch": 3559} {"train_loss": -6.852441787719727, "global_step": 149486, "epoch": 3559} {"train_loss": -6.950085163116455, "global_step": 149487, "epoch": 3559} {"train_loss": -6.918000221252441, "global_step": 149488, "epoch": 3559} {"train_loss": -6.8685150146484375, "global_step": 149489, "epoch": 3559} {"train_loss": -6.84475564956665, "global_step": 149490, "epoch": 3559} {"train_loss": -6.9183454513549805, "global_step": 149491, "epoch": 3559} {"train_loss": -6.951296806335449, "global_step": 149492, "epoch": 3559} {"train_loss": -6.949492454528809, "global_step": 149493, "epoch": 3559} {"train_loss": -6.8919148445129395, "global_step": 149494, "epoch": 3559} {"train_loss": -6.884757995605469, "global_step": 149495, "epoch": 3559} {"train_loss": -6.922022819519043, "global_step": 149496, "epoch": 3559} {"train_loss": -6.773994445800781, "global_step": 149497, "epoch": 3559} {"train_loss": -6.769012928009033, "global_step": 149498, "epoch": 3559} {"train_loss": -6.998189449310303, "global_step": 149499, "epoch": 3559} {"train_loss": -6.857728004455566, "global_step": 149500, "epoch": 3559} {"train_loss": -6.961150169372559, "global_step": 149501, "epoch": 3559} {"train_loss": -6.862392902374268, "global_step": 149502, "epoch": 3559} {"train_loss": -6.857473373413086, "global_step": 149503, "epoch": 3559} {"train_loss": -6.861898422241211, "global_step": 149504, "epoch": 3559} {"train_loss": -6.92764949798584, "global_step": 149505, "epoch": 3559} {"train_loss": -6.882105350494385, "global_step": 149506, "epoch": 3559} {"train_loss": -7.004111289978027, "global_step": 149507, "epoch": 3559} {"train_loss": -6.983678340911865, "global_step": 149508, "epoch": 3559} {"train_loss": -6.890939235687256, "global_step": 149509, "epoch": 3559} {"train_loss": -6.931839466094971, "global_step": 149510, "epoch": 3559} {"train_loss": -6.905733108520508, "global_step": 149511, "epoch": 3559} {"train_loss": -6.8900861740112305, "global_step": 149512, "epoch": 3559} {"train_loss": -6.978231430053711, "global_step": 149513, "epoch": 3559} {"train_loss": -6.8976030349731445, "global_step": 149514, "epoch": 3559} {"train_loss": -6.910879135131836, "global_step": 149515, "epoch": 3559} {"train_loss": -6.833479881286621, "global_step": 149516, "epoch": 3559} {"train_loss": -6.8723955154418945, "global_step": 149517, "epoch": 3559} {"train_loss": -6.911557197570801, "global_step": 149518, "epoch": 3559} {"train_loss": -6.905671392168317, "global_step": 149519, "epoch": 3559, "val_loss": 78581.78125} {"train_loss": -6.938995361328125, "global_step": 149520, "epoch": 3560} {"train_loss": -6.830585479736328, "global_step": 149521, "epoch": 3560} {"train_loss": -6.784722328186035, "global_step": 149522, "epoch": 3560} {"train_loss": -6.904194355010986, "global_step": 149523, "epoch": 3560} {"train_loss": -6.865955352783203, "global_step": 149524, "epoch": 3560} {"train_loss": -6.772671699523926, "global_step": 149525, "epoch": 3560} {"train_loss": -6.828854560852051, "global_step": 149526, "epoch": 3560} {"train_loss": -6.99782657623291, "global_step": 149527, "epoch": 3560} {"train_loss": -6.949526786804199, "global_step": 149528, "epoch": 3560} {"train_loss": -6.855802536010742, "global_step": 149529, "epoch": 3560} {"train_loss": -6.9266438484191895, "global_step": 149530, "epoch": 3560} {"train_loss": -6.750401973724365, "global_step": 149531, "epoch": 3560} {"train_loss": -6.902227401733398, "global_step": 149532, "epoch": 3560} {"train_loss": -6.7478413581848145, "global_step": 149533, "epoch": 3560} {"train_loss": -6.79636287689209, "global_step": 149534, "epoch": 3560} {"train_loss": -6.906164169311523, "global_step": 149535, "epoch": 3560} {"train_loss": -6.940027236938477, "global_step": 149536, "epoch": 3560} {"train_loss": -6.856473922729492, "global_step": 149537, "epoch": 3560} {"train_loss": -6.831729888916016, "global_step": 149538, "epoch": 3560} {"train_loss": -6.88926887512207, "global_step": 149539, "epoch": 3560} {"train_loss": -6.80845832824707, "global_step": 149540, "epoch": 3560} {"train_loss": -6.809699058532715, "global_step": 149541, "epoch": 3560} {"train_loss": -6.740109443664551, "global_step": 149542, "epoch": 3560} {"train_loss": -6.808468818664551, "global_step": 149543, "epoch": 3560} {"train_loss": -6.883674144744873, "global_step": 149544, "epoch": 3560} {"train_loss": -6.862961769104004, "global_step": 149545, "epoch": 3560} {"train_loss": -6.892831325531006, "global_step": 149546, "epoch": 3560} {"train_loss": -6.874516010284424, "global_step": 149547, "epoch": 3560} {"train_loss": -6.805159091949463, "global_step": 149548, "epoch": 3560} {"train_loss": -6.899521827697754, "global_step": 149549, "epoch": 3560} {"train_loss": -6.996672630310059, "global_step": 149550, "epoch": 3560} {"train_loss": -6.859561920166016, "global_step": 149551, "epoch": 3560} {"train_loss": -6.892679214477539, "global_step": 149552, "epoch": 3560} {"train_loss": -6.851445198059082, "global_step": 149553, "epoch": 3560} {"train_loss": -6.888623237609863, "global_step": 149554, "epoch": 3560} {"train_loss": -6.955747127532959, "global_step": 149555, "epoch": 3560} {"train_loss": -6.82153844833374, "global_step": 149556, "epoch": 3560} {"train_loss": -6.882380485534668, "global_step": 149557, "epoch": 3560} {"train_loss": -6.8231282234191895, "global_step": 149558, "epoch": 3560} {"train_loss": -6.835971832275391, "global_step": 149559, "epoch": 3560} {"train_loss": -6.907200813293457, "global_step": 149560, "epoch": 3560} {"train_loss": -6.862595444633847, "global_step": 149561, "epoch": 3560, "val_loss": 78815.4453125} {"train_loss": -6.885237693786621, "global_step": 149562, "epoch": 3561} {"train_loss": -6.707033157348633, "global_step": 149563, "epoch": 3561} {"train_loss": -6.728301525115967, "global_step": 149564, "epoch": 3561} {"train_loss": -6.697112083435059, "global_step": 149565, "epoch": 3561} {"train_loss": -6.965549468994141, "global_step": 149566, "epoch": 3561} {"train_loss": -6.9056806564331055, "global_step": 149567, "epoch": 3561} {"train_loss": -6.821785926818848, "global_step": 149568, "epoch": 3561} {"train_loss": -6.877285480499268, "global_step": 149569, "epoch": 3561} {"train_loss": -6.897157669067383, "global_step": 149570, "epoch": 3561} {"train_loss": -6.9448747634887695, "global_step": 149571, "epoch": 3561} {"train_loss": -6.860048770904541, "global_step": 149572, "epoch": 3561} {"train_loss": -6.886412143707275, "global_step": 149573, "epoch": 3561} {"train_loss": -6.908693790435791, "global_step": 149574, "epoch": 3561} {"train_loss": -6.794413089752197, "global_step": 149575, "epoch": 3561} {"train_loss": -6.870206832885742, "global_step": 149576, "epoch": 3561} {"train_loss": -6.869449615478516, "global_step": 149577, "epoch": 3561} {"train_loss": -6.790700912475586, "global_step": 149578, "epoch": 3561} {"train_loss": -6.828444004058838, "global_step": 149579, "epoch": 3561} {"train_loss": -6.877202987670898, "global_step": 149580, "epoch": 3561} {"train_loss": -6.704710483551025, "global_step": 149581, "epoch": 3561} {"train_loss": -6.781447410583496, "global_step": 149582, "epoch": 3561} {"train_loss": -6.8001604080200195, "global_step": 149583, "epoch": 3561} {"train_loss": -6.792590141296387, "global_step": 149584, "epoch": 3561} {"train_loss": -6.833802700042725, "global_step": 149585, "epoch": 3561} {"train_loss": -6.934129238128662, "global_step": 149586, "epoch": 3561} {"train_loss": -6.873591423034668, "global_step": 149587, "epoch": 3561} {"train_loss": -6.835358619689941, "global_step": 149588, "epoch": 3561} {"train_loss": -6.900805950164795, "global_step": 149589, "epoch": 3561} {"train_loss": -6.860871315002441, "global_step": 149590, "epoch": 3561} {"train_loss": -6.898172855377197, "global_step": 149591, "epoch": 3561} {"train_loss": -6.803425312042236, "global_step": 149592, "epoch": 3561} {"train_loss": -6.866453170776367, "global_step": 149593, "epoch": 3561} {"train_loss": -6.8540143966674805, "global_step": 149594, "epoch": 3561} {"train_loss": -6.786909103393555, "global_step": 149595, "epoch": 3561} {"train_loss": -6.831206321716309, "global_step": 149596, "epoch": 3561} {"train_loss": -6.777370452880859, "global_step": 149597, "epoch": 3561} {"train_loss": -6.79554557800293, "global_step": 149598, "epoch": 3561} {"train_loss": -6.752852439880371, "global_step": 149599, "epoch": 3561} {"train_loss": -6.8274641036987305, "global_step": 149600, "epoch": 3561} {"train_loss": -6.831331253051758, "global_step": 149601, "epoch": 3561} {"train_loss": -6.77971887588501, "global_step": 149602, "epoch": 3561} {"train_loss": -6.836183638799758, "global_step": 149603, "epoch": 3561, "val_loss": 78844.5} {"train_loss": -6.771908283233643, "global_step": 149604, "epoch": 3562} {"train_loss": -6.895284652709961, "global_step": 149605, "epoch": 3562} {"train_loss": -6.7916579246521, "global_step": 149606, "epoch": 3562} {"train_loss": -6.876748085021973, "global_step": 149607, "epoch": 3562} {"train_loss": -6.782917022705078, "global_step": 149608, "epoch": 3562} {"train_loss": -6.777094841003418, "global_step": 149609, "epoch": 3562} {"train_loss": -6.9034342765808105, "global_step": 149610, "epoch": 3562} {"train_loss": -6.790369510650635, "global_step": 149611, "epoch": 3562} {"train_loss": -6.759474754333496, "global_step": 149612, "epoch": 3562} {"train_loss": -7.027889251708984, "global_step": 149613, "epoch": 3562} {"train_loss": -6.879925727844238, "global_step": 149614, "epoch": 3562} {"train_loss": -6.9631547927856445, "global_step": 149615, "epoch": 3562} {"train_loss": -6.917036056518555, "global_step": 149616, "epoch": 3562} {"train_loss": -6.846161842346191, "global_step": 149617, "epoch": 3562} {"train_loss": -6.914617538452148, "global_step": 149618, "epoch": 3562} {"train_loss": -6.9522881507873535, "global_step": 149619, "epoch": 3562} {"train_loss": -6.960809230804443, "global_step": 149620, "epoch": 3562} {"train_loss": -6.868269443511963, "global_step": 149621, "epoch": 3562} {"train_loss": -6.925620079040527, "global_step": 149622, "epoch": 3562} {"train_loss": -6.853699684143066, "global_step": 149623, "epoch": 3562} {"train_loss": -6.967717170715332, "global_step": 149624, "epoch": 3562} {"train_loss": -6.917954921722412, "global_step": 149625, "epoch": 3562} {"train_loss": -6.831913948059082, "global_step": 149626, "epoch": 3562} {"train_loss": -6.890113353729248, "global_step": 149627, "epoch": 3562} {"train_loss": -6.840765953063965, "global_step": 149628, "epoch": 3562} {"train_loss": -6.9178056716918945, "global_step": 149629, "epoch": 3562} {"train_loss": -6.934821605682373, "global_step": 149630, "epoch": 3562} {"train_loss": -7.028947830200195, "global_step": 149631, "epoch": 3562} {"train_loss": -6.886196136474609, "global_step": 149632, "epoch": 3562} {"train_loss": -6.913431167602539, "global_step": 149633, "epoch": 3562} {"train_loss": -6.900235176086426, "global_step": 149634, "epoch": 3562} {"train_loss": -6.831475257873535, "global_step": 149635, "epoch": 3562} {"train_loss": -6.852468490600586, "global_step": 149636, "epoch": 3562} {"train_loss": -6.957326889038086, "global_step": 149637, "epoch": 3562} {"train_loss": -6.856121063232422, "global_step": 149638, "epoch": 3562} {"train_loss": -6.8579630851745605, "global_step": 149639, "epoch": 3562} {"train_loss": -6.829275131225586, "global_step": 149640, "epoch": 3562} {"train_loss": -6.938579559326172, "global_step": 149641, "epoch": 3562} {"train_loss": -6.951168060302734, "global_step": 149642, "epoch": 3562} {"train_loss": -6.78542423248291, "global_step": 149643, "epoch": 3562} {"train_loss": -6.843284606933594, "global_step": 149644, "epoch": 3562} {"train_loss": -6.884898980458577, "global_step": 149645, "epoch": 3562, "val_loss": 78695.4453125} {"train_loss": -6.98759651184082, "global_step": 149646, "epoch": 3563} {"train_loss": -6.912276744842529, "global_step": 149647, "epoch": 3563} {"train_loss": -6.885854244232178, "global_step": 149648, "epoch": 3563} {"train_loss": -6.99128532409668, "global_step": 149649, "epoch": 3563} {"train_loss": -6.922810077667236, "global_step": 149650, "epoch": 3563} {"train_loss": -6.879936218261719, "global_step": 149651, "epoch": 3563} {"train_loss": -6.894402503967285, "global_step": 149652, "epoch": 3563} {"train_loss": -6.7998366355896, "global_step": 149653, "epoch": 3563} {"train_loss": -6.856732368469238, "global_step": 149654, "epoch": 3563} {"train_loss": -6.898717403411865, "global_step": 149655, "epoch": 3563} {"train_loss": -6.831761360168457, "global_step": 149656, "epoch": 3563} {"train_loss": -6.894801139831543, "global_step": 149657, "epoch": 3563} {"train_loss": -6.893842697143555, "global_step": 149658, "epoch": 3563} {"train_loss": -6.94467306137085, "global_step": 149659, "epoch": 3563} {"train_loss": -6.857873916625977, "global_step": 149660, "epoch": 3563} {"train_loss": -6.82672119140625, "global_step": 149661, "epoch": 3563} {"train_loss": -6.850976467132568, "global_step": 149662, "epoch": 3563} {"train_loss": -6.8396315574646, "global_step": 149663, "epoch": 3563} {"train_loss": -6.714786052703857, "global_step": 149664, "epoch": 3563} {"train_loss": -6.742058277130127, "global_step": 149665, "epoch": 3563} {"train_loss": -6.842859745025635, "global_step": 149666, "epoch": 3563} {"train_loss": -6.720656394958496, "global_step": 149667, "epoch": 3563} {"train_loss": -6.806793212890625, "global_step": 149668, "epoch": 3563} {"train_loss": -6.854626178741455, "global_step": 149669, "epoch": 3563} {"train_loss": -6.802853584289551, "global_step": 149670, "epoch": 3563} {"train_loss": -6.8017425537109375, "global_step": 149671, "epoch": 3563} {"train_loss": -6.652811527252197, "global_step": 149672, "epoch": 3563} {"train_loss": -6.902031898498535, "global_step": 149673, "epoch": 3563} {"train_loss": -6.824065208435059, "global_step": 149674, "epoch": 3563} {"train_loss": -6.6898698806762695, "global_step": 149675, "epoch": 3563} {"train_loss": -6.85292911529541, "global_step": 149676, "epoch": 3563} {"train_loss": -6.730679035186768, "global_step": 149677, "epoch": 3563} {"train_loss": -6.836103439331055, "global_step": 149678, "epoch": 3563} {"train_loss": -6.881702423095703, "global_step": 149679, "epoch": 3563} {"train_loss": -6.841368675231934, "global_step": 149680, "epoch": 3563} {"train_loss": -6.912055015563965, "global_step": 149681, "epoch": 3563} {"train_loss": -6.752394676208496, "global_step": 149682, "epoch": 3563} {"train_loss": -6.8216657638549805, "global_step": 149683, "epoch": 3563} {"train_loss": -6.796877861022949, "global_step": 149684, "epoch": 3563} {"train_loss": -6.821957588195801, "global_step": 149685, "epoch": 3563} {"train_loss": -6.746874809265137, "global_step": 149686, "epoch": 3563} {"train_loss": -6.837774628684635, "global_step": 149687, "epoch": 3563, "val_loss": 78763.2421875} {"train_loss": -6.783762454986572, "global_step": 149688, "epoch": 3564} {"train_loss": -6.894567966461182, "global_step": 149689, "epoch": 3564} {"train_loss": -6.951155662536621, "global_step": 149690, "epoch": 3564} {"train_loss": -6.772902488708496, "global_step": 149691, "epoch": 3564} {"train_loss": -6.801225662231445, "global_step": 149692, "epoch": 3564} {"train_loss": -6.973893642425537, "global_step": 149693, "epoch": 3564} {"train_loss": -6.919075012207031, "global_step": 149694, "epoch": 3564} {"train_loss": -6.8195576667785645, "global_step": 149695, "epoch": 3564} {"train_loss": -6.857924938201904, "global_step": 149696, "epoch": 3564} {"train_loss": -6.818942546844482, "global_step": 149697, "epoch": 3564} {"train_loss": -6.854133605957031, "global_step": 149698, "epoch": 3564} {"train_loss": -6.835200309753418, "global_step": 149699, "epoch": 3564} {"train_loss": -6.8361005783081055, "global_step": 149700, "epoch": 3564} {"train_loss": -6.850776672363281, "global_step": 149701, "epoch": 3564} {"train_loss": -6.790452003479004, "global_step": 149702, "epoch": 3564} {"train_loss": -6.776708602905273, "global_step": 149703, "epoch": 3564} {"train_loss": -6.876376628875732, "global_step": 149704, "epoch": 3564} {"train_loss": -6.8237504959106445, "global_step": 149705, "epoch": 3564} {"train_loss": -6.816423416137695, "global_step": 149706, "epoch": 3564} {"train_loss": -6.860110282897949, "global_step": 149707, "epoch": 3564} {"train_loss": -6.838029384613037, "global_step": 149708, "epoch": 3564} {"train_loss": -6.643772125244141, "global_step": 149709, "epoch": 3564} {"train_loss": -6.886588096618652, "global_step": 149710, "epoch": 3564} {"train_loss": -6.678030967712402, "global_step": 149711, "epoch": 3564} {"train_loss": -6.58986759185791, "global_step": 149712, "epoch": 3564} {"train_loss": -6.822882652282715, "global_step": 149713, "epoch": 3564} {"train_loss": -6.743677616119385, "global_step": 149714, "epoch": 3564} {"train_loss": -6.790154933929443, "global_step": 149715, "epoch": 3564} {"train_loss": -6.905767440795898, "global_step": 149716, "epoch": 3564} {"train_loss": -6.671069145202637, "global_step": 149717, "epoch": 3564} {"train_loss": -6.848405361175537, "global_step": 149718, "epoch": 3564} {"train_loss": -6.688995838165283, "global_step": 149719, "epoch": 3564} {"train_loss": -6.88462495803833, "global_step": 149720, "epoch": 3564} {"train_loss": -6.809968948364258, "global_step": 149721, "epoch": 3564} {"train_loss": -6.847752571105957, "global_step": 149722, "epoch": 3564} {"train_loss": -6.85010290145874, "global_step": 149723, "epoch": 3564} {"train_loss": -6.881976127624512, "global_step": 149724, "epoch": 3564} {"train_loss": -6.729276657104492, "global_step": 149725, "epoch": 3564} {"train_loss": -6.859439849853516, "global_step": 149726, "epoch": 3564} {"train_loss": -6.814990997314453, "global_step": 149727, "epoch": 3564} {"train_loss": -6.730622291564941, "global_step": 149728, "epoch": 3564} {"train_loss": -6.8141936007000155, "global_step": 149729, "epoch": 3564, "val_loss": 78761.421875} {"train_loss": -6.915224075317383, "global_step": 149730, "epoch": 3565} {"train_loss": -6.799961090087891, "global_step": 149731, "epoch": 3565} {"train_loss": -6.886885643005371, "global_step": 149732, "epoch": 3565} {"train_loss": -6.740504264831543, "global_step": 149733, "epoch": 3565} {"train_loss": -6.847731590270996, "global_step": 149734, "epoch": 3565} {"train_loss": -6.812811851501465, "global_step": 149735, "epoch": 3565} {"train_loss": -6.738160133361816, "global_step": 149736, "epoch": 3565} {"train_loss": -6.771074295043945, "global_step": 149737, "epoch": 3565} {"train_loss": -6.746454238891602, "global_step": 149738, "epoch": 3565} {"train_loss": -6.914556503295898, "global_step": 149739, "epoch": 3565} {"train_loss": -6.949429512023926, "global_step": 149740, "epoch": 3565} {"train_loss": -6.851574897766113, "global_step": 149741, "epoch": 3565} {"train_loss": -6.732900619506836, "global_step": 149742, "epoch": 3565} {"train_loss": -6.836905002593994, "global_step": 149743, "epoch": 3565} {"train_loss": -6.911993980407715, "global_step": 149744, "epoch": 3565} {"train_loss": -6.824605941772461, "global_step": 149745, "epoch": 3565} {"train_loss": -6.9059247970581055, "global_step": 149746, "epoch": 3565} {"train_loss": -6.8253173828125, "global_step": 149747, "epoch": 3565} {"train_loss": -6.736889362335205, "global_step": 149748, "epoch": 3565} {"train_loss": -6.932842254638672, "global_step": 149749, "epoch": 3565} {"train_loss": -6.937440872192383, "global_step": 149750, "epoch": 3565} {"train_loss": -6.849499702453613, "global_step": 149751, "epoch": 3565} {"train_loss": -6.876114845275879, "global_step": 149752, "epoch": 3565} {"train_loss": -6.852884292602539, "global_step": 149753, "epoch": 3565} {"train_loss": -6.989258766174316, "global_step": 149754, "epoch": 3565} {"train_loss": -6.901942253112793, "global_step": 149755, "epoch": 3565} {"train_loss": -6.8783769607543945, "global_step": 149756, "epoch": 3565} {"train_loss": -6.763171195983887, "global_step": 149757, "epoch": 3565} {"train_loss": -6.819165229797363, "global_step": 149758, "epoch": 3565} {"train_loss": -6.9429612159729, "global_step": 149759, "epoch": 3565} {"train_loss": -6.858946800231934, "global_step": 149760, "epoch": 3565} {"train_loss": -6.90162467956543, "global_step": 149761, "epoch": 3565} {"train_loss": -6.929419040679932, "global_step": 149762, "epoch": 3565} {"train_loss": -6.8239850997924805, "global_step": 149763, "epoch": 3565} {"train_loss": -6.780282974243164, "global_step": 149764, "epoch": 3565} {"train_loss": -6.811099052429199, "global_step": 149765, "epoch": 3565} {"train_loss": -6.959547996520996, "global_step": 149766, "epoch": 3565} {"train_loss": -6.810055732727051, "global_step": 149767, "epoch": 3565} {"train_loss": -6.818336486816406, "global_step": 149768, "epoch": 3565} {"train_loss": -6.899044990539551, "global_step": 149769, "epoch": 3565} {"train_loss": -6.973460674285889, "global_step": 149770, "epoch": 3565} {"train_loss": -6.8572161084129695, "global_step": 149771, "epoch": 3565, "val_loss": 78988.7890625} {"train_loss": -6.868217468261719, "global_step": 149772, "epoch": 3566} {"train_loss": -6.948426246643066, "global_step": 149773, "epoch": 3566} {"train_loss": -6.91671085357666, "global_step": 149774, "epoch": 3566} {"train_loss": -6.724818706512451, "global_step": 149775, "epoch": 3566} {"train_loss": -6.859631061553955, "global_step": 149776, "epoch": 3566} {"train_loss": -6.755605697631836, "global_step": 149777, "epoch": 3566} {"train_loss": -6.643960952758789, "global_step": 149778, "epoch": 3566} {"train_loss": -6.913707256317139, "global_step": 149779, "epoch": 3566} {"train_loss": -6.841839790344238, "global_step": 149780, "epoch": 3566} {"train_loss": -6.856460094451904, "global_step": 149781, "epoch": 3566} {"train_loss": -6.815703868865967, "global_step": 149782, "epoch": 3566} {"train_loss": -6.651057243347168, "global_step": 149783, "epoch": 3566} {"train_loss": -6.795385837554932, "global_step": 149784, "epoch": 3566} {"train_loss": -6.882047653198242, "global_step": 149785, "epoch": 3566} {"train_loss": -6.8034467697143555, "global_step": 149786, "epoch": 3566} {"train_loss": -6.763262748718262, "global_step": 149787, "epoch": 3566} {"train_loss": -6.8696064949035645, "global_step": 149788, "epoch": 3566} {"train_loss": -6.83347225189209, "global_step": 149789, "epoch": 3566} {"train_loss": -6.936253547668457, "global_step": 149790, "epoch": 3566} {"train_loss": -6.8188982009887695, "global_step": 149791, "epoch": 3566} {"train_loss": -6.800901412963867, "global_step": 149792, "epoch": 3566} {"train_loss": -6.934505462646484, "global_step": 149793, "epoch": 3566} {"train_loss": -6.843210697174072, "global_step": 149794, "epoch": 3566} {"train_loss": -6.898420333862305, "global_step": 149795, "epoch": 3566} {"train_loss": -6.7499775886535645, "global_step": 149796, "epoch": 3566} {"train_loss": -6.545201778411865, "global_step": 149797, "epoch": 3566} {"train_loss": -6.829100608825684, "global_step": 149798, "epoch": 3566} {"train_loss": -6.715397834777832, "global_step": 149799, "epoch": 3566} {"train_loss": -6.80180549621582, "global_step": 149800, "epoch": 3566} {"train_loss": -6.841239929199219, "global_step": 149801, "epoch": 3566} {"train_loss": -6.684950351715088, "global_step": 149802, "epoch": 3566} {"train_loss": -6.976111888885498, "global_step": 149803, "epoch": 3566} {"train_loss": -6.709255695343018, "global_step": 149804, "epoch": 3566} {"train_loss": -6.796788692474365, "global_step": 149805, "epoch": 3566} {"train_loss": -6.704639434814453, "global_step": 149806, "epoch": 3566} {"train_loss": -6.680702209472656, "global_step": 149807, "epoch": 3566} {"train_loss": -6.912574291229248, "global_step": 149808, "epoch": 3566} {"train_loss": -6.84206485748291, "global_step": 149809, "epoch": 3566} {"train_loss": -6.836630344390869, "global_step": 149810, "epoch": 3566} {"train_loss": -6.807722091674805, "global_step": 149811, "epoch": 3566} {"train_loss": -6.869361877441406, "global_step": 149812, "epoch": 3566} {"train_loss": -6.8109902540842695, "global_step": 149813, "epoch": 3566, "val_loss": 78675.59375} {"train_loss": -6.878400802612305, "global_step": 149814, "epoch": 3567} {"train_loss": -6.873256206512451, "global_step": 149815, "epoch": 3567} {"train_loss": -6.962926864624023, "global_step": 149816, "epoch": 3567} {"train_loss": -6.9490814208984375, "global_step": 149817, "epoch": 3567} {"train_loss": -6.870288848876953, "global_step": 149818, "epoch": 3567} {"train_loss": -6.951586723327637, "global_step": 149819, "epoch": 3567} {"train_loss": -6.773407459259033, "global_step": 149820, "epoch": 3567} {"train_loss": -6.949728012084961, "global_step": 149821, "epoch": 3567} {"train_loss": -6.921233654022217, "global_step": 149822, "epoch": 3567} {"train_loss": -6.961348533630371, "global_step": 149823, "epoch": 3567} {"train_loss": -6.971097946166992, "global_step": 149824, "epoch": 3567} {"train_loss": -6.985034942626953, "global_step": 149825, "epoch": 3567} {"train_loss": -6.961791515350342, "global_step": 149826, "epoch": 3567} {"train_loss": -6.883898735046387, "global_step": 149827, "epoch": 3567} {"train_loss": -6.899639129638672, "global_step": 149828, "epoch": 3567} {"train_loss": -6.896231651306152, "global_step": 149829, "epoch": 3567} {"train_loss": -6.867554664611816, "global_step": 149830, "epoch": 3567} {"train_loss": -6.9434099197387695, "global_step": 149831, "epoch": 3567} {"train_loss": -6.7820725440979, "global_step": 149832, "epoch": 3567} {"train_loss": -6.804421424865723, "global_step": 149833, "epoch": 3567} {"train_loss": -6.891297817230225, "global_step": 149834, "epoch": 3567} {"train_loss": -6.773015975952148, "global_step": 149835, "epoch": 3567} {"train_loss": -6.773725986480713, "global_step": 149836, "epoch": 3567} {"train_loss": -6.77750301361084, "global_step": 149837, "epoch": 3567} {"train_loss": -6.438965320587158, "global_step": 149838, "epoch": 3567} {"train_loss": -6.802983283996582, "global_step": 149839, "epoch": 3567} {"train_loss": -6.741499900817871, "global_step": 149840, "epoch": 3567} {"train_loss": -6.563209533691406, "global_step": 149841, "epoch": 3567} {"train_loss": -6.9590935707092285, "global_step": 149842, "epoch": 3567} {"train_loss": -6.803011894226074, "global_step": 149843, "epoch": 3567} {"train_loss": -6.766955375671387, "global_step": 149844, "epoch": 3567} {"train_loss": -6.836045742034912, "global_step": 149845, "epoch": 3567} {"train_loss": -6.771800994873047, "global_step": 149846, "epoch": 3567} {"train_loss": -6.8009161949157715, "global_step": 149847, "epoch": 3567} {"train_loss": -6.756300449371338, "global_step": 149848, "epoch": 3567} {"train_loss": -6.796826362609863, "global_step": 149849, "epoch": 3567} {"train_loss": -6.658105850219727, "global_step": 149850, "epoch": 3567} {"train_loss": -6.804556846618652, "global_step": 149851, "epoch": 3567} {"train_loss": -6.7872185707092285, "global_step": 149852, "epoch": 3567} {"train_loss": -6.774227142333984, "global_step": 149853, "epoch": 3567} {"train_loss": -6.766340255737305, "global_step": 149854, "epoch": 3567} {"train_loss": -6.8324913410913375, "global_step": 149855, "epoch": 3567, "val_loss": 78621.1484375} {"train_loss": -6.774106502532959, "global_step": 149856, "epoch": 3568} {"train_loss": -6.851241111755371, "global_step": 149857, "epoch": 3568} {"train_loss": -6.8282575607299805, "global_step": 149858, "epoch": 3568} {"train_loss": -6.775113582611084, "global_step": 149859, "epoch": 3568} {"train_loss": -6.905130863189697, "global_step": 149860, "epoch": 3568} {"train_loss": -6.71504020690918, "global_step": 149861, "epoch": 3568} {"train_loss": -6.8677978515625, "global_step": 149862, "epoch": 3568} {"train_loss": -6.862140655517578, "global_step": 149863, "epoch": 3568} {"train_loss": -6.801732063293457, "global_step": 149864, "epoch": 3568} {"train_loss": -6.832241058349609, "global_step": 149865, "epoch": 3568} {"train_loss": -6.792342185974121, "global_step": 149866, "epoch": 3568} {"train_loss": -6.82963752746582, "global_step": 149867, "epoch": 3568} {"train_loss": -6.797585487365723, "global_step": 149868, "epoch": 3568} {"train_loss": -6.808725357055664, "global_step": 149869, "epoch": 3568} {"train_loss": -6.808321952819824, "global_step": 149870, "epoch": 3568} {"train_loss": -6.817203998565674, "global_step": 149871, "epoch": 3568} {"train_loss": -6.855442047119141, "global_step": 149872, "epoch": 3568} {"train_loss": -6.895233154296875, "global_step": 149873, "epoch": 3568} {"train_loss": -6.91119384765625, "global_step": 149874, "epoch": 3568} {"train_loss": -6.758545398712158, "global_step": 149875, "epoch": 3568} {"train_loss": -6.884712219238281, "global_step": 149876, "epoch": 3568} {"train_loss": -6.924890518188477, "global_step": 149877, "epoch": 3568} {"train_loss": -6.737907409667969, "global_step": 149878, "epoch": 3568} {"train_loss": -6.84775447845459, "global_step": 149879, "epoch": 3568} {"train_loss": -6.872067451477051, "global_step": 149880, "epoch": 3568} {"train_loss": -6.798468589782715, "global_step": 149881, "epoch": 3568} {"train_loss": -6.855552673339844, "global_step": 149882, "epoch": 3568} {"train_loss": -6.815600395202637, "global_step": 149883, "epoch": 3568} {"train_loss": -6.927577018737793, "global_step": 149884, "epoch": 3568} {"train_loss": -6.82733154296875, "global_step": 149885, "epoch": 3568} {"train_loss": -6.774943828582764, "global_step": 149886, "epoch": 3568} {"train_loss": -6.891760349273682, "global_step": 149887, "epoch": 3568} {"train_loss": -6.922576427459717, "global_step": 149888, "epoch": 3568} {"train_loss": -6.8203277587890625, "global_step": 149889, "epoch": 3568} {"train_loss": -6.8224663734436035, "global_step": 149890, "epoch": 3568} {"train_loss": -6.937530994415283, "global_step": 149891, "epoch": 3568} {"train_loss": -6.887540817260742, "global_step": 149892, "epoch": 3568} {"train_loss": -6.928720474243164, "global_step": 149893, "epoch": 3568} {"train_loss": -7.103274345397949, "global_step": 149894, "epoch": 3568} {"train_loss": -6.853636741638184, "global_step": 149895, "epoch": 3568} {"train_loss": -6.883504867553711, "global_step": 149896, "epoch": 3568} {"train_loss": -6.850843486331758, "global_step": 149897, "epoch": 3568, "val_loss": 78630.359375} {"train_loss": -6.87106990814209, "global_step": 149898, "epoch": 3569} {"train_loss": -6.878763198852539, "global_step": 149899, "epoch": 3569} {"train_loss": -6.964722633361816, "global_step": 149900, "epoch": 3569} {"train_loss": -6.861416816711426, "global_step": 149901, "epoch": 3569} {"train_loss": -6.901776313781738, "global_step": 149902, "epoch": 3569} {"train_loss": -6.943055152893066, "global_step": 149903, "epoch": 3569} {"train_loss": -6.883426666259766, "global_step": 149904, "epoch": 3569} {"train_loss": -6.833641052246094, "global_step": 149905, "epoch": 3569} {"train_loss": -6.80472993850708, "global_step": 149906, "epoch": 3569} {"train_loss": -6.904749870300293, "global_step": 149907, "epoch": 3569} {"train_loss": -6.697608470916748, "global_step": 149908, "epoch": 3569} {"train_loss": -6.8380842208862305, "global_step": 149909, "epoch": 3569} {"train_loss": -6.826888561248779, "global_step": 149910, "epoch": 3569} {"train_loss": -6.893246650695801, "global_step": 149911, "epoch": 3569} {"train_loss": -6.8628435134887695, "global_step": 149912, "epoch": 3569} {"train_loss": -6.860211372375488, "global_step": 149913, "epoch": 3569} {"train_loss": -6.870067596435547, "global_step": 149914, "epoch": 3569} {"train_loss": -6.707578659057617, "global_step": 149915, "epoch": 3569} {"train_loss": -6.859570503234863, "global_step": 149916, "epoch": 3569} {"train_loss": -6.864629745483398, "global_step": 149917, "epoch": 3569} {"train_loss": -6.887697219848633, "global_step": 149918, "epoch": 3569} {"train_loss": -6.853081226348877, "global_step": 149919, "epoch": 3569} {"train_loss": -6.829736709594727, "global_step": 149920, "epoch": 3569} {"train_loss": -6.818280220031738, "global_step": 149921, "epoch": 3569} {"train_loss": -6.817544937133789, "global_step": 149922, "epoch": 3569} {"train_loss": -6.849368095397949, "global_step": 149923, "epoch": 3569} {"train_loss": -6.806293964385986, "global_step": 149924, "epoch": 3569} {"train_loss": -6.83392333984375, "global_step": 149925, "epoch": 3569} {"train_loss": -6.755620956420898, "global_step": 149926, "epoch": 3569} {"train_loss": -6.849632740020752, "global_step": 149927, "epoch": 3569} {"train_loss": -6.893000602722168, "global_step": 149928, "epoch": 3569} {"train_loss": -6.826939582824707, "global_step": 149929, "epoch": 3569} {"train_loss": -6.837695121765137, "global_step": 149930, "epoch": 3569} {"train_loss": -6.882299423217773, "global_step": 149931, "epoch": 3569} {"train_loss": -6.819828510284424, "global_step": 149932, "epoch": 3569} {"train_loss": -6.846352577209473, "global_step": 149933, "epoch": 3569} {"train_loss": -6.831612586975098, "global_step": 149934, "epoch": 3569} {"train_loss": -6.905352592468262, "global_step": 149935, "epoch": 3569} {"train_loss": -7.012051105499268, "global_step": 149936, "epoch": 3569} {"train_loss": -7.0038838386535645, "global_step": 149937, "epoch": 3569} {"train_loss": -6.7779107093811035, "global_step": 149938, "epoch": 3569} {"train_loss": -6.8553675810496015, "global_step": 149939, "epoch": 3569, "val_loss": 78642.6171875} {"train_loss": -6.971945285797119, "global_step": 149940, "epoch": 3570} {"train_loss": -6.84473991394043, "global_step": 149941, "epoch": 3570} {"train_loss": -6.939792633056641, "global_step": 149942, "epoch": 3570} {"train_loss": -6.94527006149292, "global_step": 149943, "epoch": 3570} {"train_loss": -6.821990489959717, "global_step": 149944, "epoch": 3570} {"train_loss": -6.850287437438965, "global_step": 149945, "epoch": 3570} {"train_loss": -6.931687831878662, "global_step": 149946, "epoch": 3570} {"train_loss": -6.727395534515381, "global_step": 149947, "epoch": 3570} {"train_loss": -6.873006820678711, "global_step": 149948, "epoch": 3570} {"train_loss": -6.805790901184082, "global_step": 149949, "epoch": 3570} {"train_loss": -6.8563737869262695, "global_step": 149950, "epoch": 3570} {"train_loss": -6.8319597244262695, "global_step": 149951, "epoch": 3570} {"train_loss": -6.827564239501953, "global_step": 149952, "epoch": 3570} {"train_loss": -6.729070663452148, "global_step": 149953, "epoch": 3570} {"train_loss": -6.615861415863037, "global_step": 149954, "epoch": 3570} {"train_loss": -6.80626106262207, "global_step": 149955, "epoch": 3570} {"train_loss": -6.731742858886719, "global_step": 149956, "epoch": 3570} {"train_loss": -6.851099491119385, "global_step": 149957, "epoch": 3570} {"train_loss": -6.79098653793335, "global_step": 149958, "epoch": 3570} {"train_loss": -6.75947380065918, "global_step": 149959, "epoch": 3570} {"train_loss": -6.804501533508301, "global_step": 149960, "epoch": 3570} {"train_loss": -6.7242631912231445, "global_step": 149961, "epoch": 3570} {"train_loss": -6.734743118286133, "global_step": 149962, "epoch": 3570} {"train_loss": -6.741714000701904, "global_step": 149963, "epoch": 3570} {"train_loss": -6.747940540313721, "global_step": 149964, "epoch": 3570} {"train_loss": -6.7018537521362305, "global_step": 149965, "epoch": 3570} {"train_loss": -6.713242053985596, "global_step": 149966, "epoch": 3570} {"train_loss": -6.927279472351074, "global_step": 149967, "epoch": 3570} {"train_loss": -6.673301696777344, "global_step": 149968, "epoch": 3570} {"train_loss": -6.785546779632568, "global_step": 149969, "epoch": 3570} {"train_loss": -6.795253753662109, "global_step": 149970, "epoch": 3570} {"train_loss": -6.831374645233154, "global_step": 149971, "epoch": 3570} {"train_loss": -6.907799243927002, "global_step": 149972, "epoch": 3570} {"train_loss": -6.816001892089844, "global_step": 149973, "epoch": 3570} {"train_loss": -6.848208904266357, "global_step": 149974, "epoch": 3570} {"train_loss": -6.854014873504639, "global_step": 149975, "epoch": 3570} {"train_loss": -6.925685405731201, "global_step": 149976, "epoch": 3570} {"train_loss": -6.64522647857666, "global_step": 149977, "epoch": 3570} {"train_loss": -6.794587135314941, "global_step": 149978, "epoch": 3570} {"train_loss": -6.879690647125244, "global_step": 149979, "epoch": 3570} {"train_loss": -6.625505447387695, "global_step": 149980, "epoch": 3570} {"train_loss": -6.8024673121316095, "global_step": 149981, "epoch": 3570, "val_loss": 78798.859375} {"train_loss": -6.914897918701172, "global_step": 149982, "epoch": 3571} {"train_loss": -6.915447235107422, "global_step": 149983, "epoch": 3571} {"train_loss": -6.932920932769775, "global_step": 149984, "epoch": 3571} {"train_loss": -6.800287246704102, "global_step": 149985, "epoch": 3571} {"train_loss": -6.975560188293457, "global_step": 149986, "epoch": 3571} {"train_loss": -6.869290351867676, "global_step": 149987, "epoch": 3571} {"train_loss": -6.88486385345459, "global_step": 149988, "epoch": 3571} {"train_loss": -6.8481669425964355, "global_step": 149989, "epoch": 3571} {"train_loss": -6.807334899902344, "global_step": 149990, "epoch": 3571} {"train_loss": -6.755997657775879, "global_step": 149991, "epoch": 3571} {"train_loss": -6.6474409103393555, "global_step": 149992, "epoch": 3571} {"train_loss": -6.84225606918335, "global_step": 149993, "epoch": 3571} {"train_loss": -6.712538719177246, "global_step": 149994, "epoch": 3571} {"train_loss": -6.708080291748047, "global_step": 149995, "epoch": 3571} {"train_loss": -6.9220781326293945, "global_step": 149996, "epoch": 3571} {"train_loss": -6.64259672164917, "global_step": 149997, "epoch": 3571} {"train_loss": -6.925070762634277, "global_step": 149998, "epoch": 3571} {"train_loss": -6.862760543823242, "global_step": 149999, "epoch": 3571} {"train_loss": -6.719075679779053, "global_step": 150000, "epoch": 3571} {"train_loss": -6.808719635009766, "global_step": 150001, "epoch": 3571} {"train_loss": -6.664169788360596, "global_step": 150002, "epoch": 3571} {"train_loss": -6.767523288726807, "global_step": 150003, "epoch": 3571} {"train_loss": -6.842070579528809, "global_step": 150004, "epoch": 3571} {"train_loss": -6.943292140960693, "global_step": 150005, "epoch": 3571} {"train_loss": -6.852280616760254, "global_step": 150006, "epoch": 3571} {"train_loss": -6.889098167419434, "global_step": 150007, "epoch": 3571} {"train_loss": -6.797219276428223, "global_step": 150008, "epoch": 3571} {"train_loss": -6.8444318771362305, "global_step": 150009, "epoch": 3571} {"train_loss": -6.882628440856934, "global_step": 150010, "epoch": 3571} {"train_loss": -6.854729652404785, "global_step": 150011, "epoch": 3571} {"train_loss": -6.916412353515625, "global_step": 150012, "epoch": 3571} {"train_loss": -6.939920425415039, "global_step": 150013, "epoch": 3571} {"train_loss": -6.873795509338379, "global_step": 150014, "epoch": 3571} {"train_loss": -6.859103679656982, "global_step": 150015, "epoch": 3571} {"train_loss": -6.856405258178711, "global_step": 150016, "epoch": 3571} {"train_loss": -6.92337703704834, "global_step": 150017, "epoch": 3571} {"train_loss": -6.8642354011535645, "global_step": 150018, "epoch": 3571} {"train_loss": -6.882438659667969, "global_step": 150019, "epoch": 3571} {"train_loss": -6.85589075088501, "global_step": 150020, "epoch": 3571} {"train_loss": -6.84450101852417, "global_step": 150021, "epoch": 3571} {"train_loss": -6.735930442810059, "global_step": 150022, "epoch": 3571} {"train_loss": -6.840966622034709, "global_step": 150023, "epoch": 3571, "val_loss": 78699.4921875} {"train_loss": -6.838866233825684, "global_step": 150024, "epoch": 3572} {"train_loss": -6.833584785461426, "global_step": 150025, "epoch": 3572} {"train_loss": -6.938967704772949, "global_step": 150026, "epoch": 3572} {"train_loss": -6.849296569824219, "global_step": 150027, "epoch": 3572} {"train_loss": -6.90087890625, "global_step": 150028, "epoch": 3572} {"train_loss": -6.817877769470215, "global_step": 150029, "epoch": 3572} {"train_loss": -6.926704406738281, "global_step": 150030, "epoch": 3572} {"train_loss": -6.894335746765137, "global_step": 150031, "epoch": 3572} {"train_loss": -6.967276096343994, "global_step": 150032, "epoch": 3572} {"train_loss": -6.751675605773926, "global_step": 150033, "epoch": 3572} {"train_loss": -6.854132652282715, "global_step": 150034, "epoch": 3572} {"train_loss": -6.859337329864502, "global_step": 150035, "epoch": 3572} {"train_loss": -6.875768661499023, "global_step": 150036, "epoch": 3572} {"train_loss": -6.803332805633545, "global_step": 150037, "epoch": 3572} {"train_loss": -6.864002704620361, "global_step": 150038, "epoch": 3572} {"train_loss": -6.86623477935791, "global_step": 150039, "epoch": 3572} {"train_loss": -6.83193826675415, "global_step": 150040, "epoch": 3572} {"train_loss": -6.782296657562256, "global_step": 150041, "epoch": 3572} {"train_loss": -6.907862186431885, "global_step": 150042, "epoch": 3572} {"train_loss": -6.881656169891357, "global_step": 150043, "epoch": 3572} {"train_loss": -6.819543838500977, "global_step": 150044, "epoch": 3572} {"train_loss": -6.873898983001709, "global_step": 150045, "epoch": 3572} {"train_loss": -6.892622470855713, "global_step": 150046, "epoch": 3572} {"train_loss": -6.937519073486328, "global_step": 150047, "epoch": 3572} {"train_loss": -6.859297752380371, "global_step": 150048, "epoch": 3572} {"train_loss": -6.883420944213867, "global_step": 150049, "epoch": 3572} {"train_loss": -6.934566497802734, "global_step": 150050, "epoch": 3572} {"train_loss": -6.7870283126831055, "global_step": 150051, "epoch": 3572} {"train_loss": -6.915844917297363, "global_step": 150052, "epoch": 3572} {"train_loss": -6.892524719238281, "global_step": 150053, "epoch": 3572} {"train_loss": -6.868228912353516, "global_step": 150054, "epoch": 3572} {"train_loss": -6.947107315063477, "global_step": 150055, "epoch": 3572} {"train_loss": -6.947094917297363, "global_step": 150056, "epoch": 3572} {"train_loss": -6.895132064819336, "global_step": 150057, "epoch": 3572} {"train_loss": -6.811130046844482, "global_step": 150058, "epoch": 3572} {"train_loss": -6.783489227294922, "global_step": 150059, "epoch": 3572} {"train_loss": -6.7523603439331055, "global_step": 150060, "epoch": 3572} {"train_loss": -6.739215850830078, "global_step": 150061, "epoch": 3572} {"train_loss": -6.9173407554626465, "global_step": 150062, "epoch": 3572} {"train_loss": -6.9191694259643555, "global_step": 150063, "epoch": 3572} {"train_loss": -6.931673049926758, "global_step": 150064, "epoch": 3572} {"train_loss": -6.866650411060879, "global_step": 150065, "epoch": 3572, "val_loss": 79048.359375} {"train_loss": -6.756486892700195, "global_step": 150066, "epoch": 3573} {"train_loss": -6.831554412841797, "global_step": 150067, "epoch": 3573} {"train_loss": -6.894797325134277, "global_step": 150068, "epoch": 3573} {"train_loss": -6.8569817543029785, "global_step": 150069, "epoch": 3573} {"train_loss": -6.8169355392456055, "global_step": 150070, "epoch": 3573} {"train_loss": -6.7206339836120605, "global_step": 150071, "epoch": 3573} {"train_loss": -6.833710670471191, "global_step": 150072, "epoch": 3573} {"train_loss": -6.811546802520752, "global_step": 150073, "epoch": 3573} {"train_loss": -6.693469047546387, "global_step": 150074, "epoch": 3573} {"train_loss": -6.784562587738037, "global_step": 150075, "epoch": 3573} {"train_loss": -6.750399589538574, "global_step": 150076, "epoch": 3573} {"train_loss": -6.864592552185059, "global_step": 150077, "epoch": 3573} {"train_loss": -6.857979774475098, "global_step": 150078, "epoch": 3573} {"train_loss": -6.65775203704834, "global_step": 150079, "epoch": 3573} {"train_loss": -6.662524223327637, "global_step": 150080, "epoch": 3573} {"train_loss": -6.761855125427246, "global_step": 150081, "epoch": 3573} {"train_loss": -6.684572219848633, "global_step": 150082, "epoch": 3573} {"train_loss": -6.786230564117432, "global_step": 150083, "epoch": 3573} {"train_loss": -6.711331844329834, "global_step": 150084, "epoch": 3573} {"train_loss": -6.820562839508057, "global_step": 150085, "epoch": 3573} {"train_loss": -6.8403239250183105, "global_step": 150086, "epoch": 3573} {"train_loss": -6.685586452484131, "global_step": 150087, "epoch": 3573} {"train_loss": -6.809456825256348, "global_step": 150088, "epoch": 3573} {"train_loss": -6.660919189453125, "global_step": 150089, "epoch": 3573} {"train_loss": -6.831838130950928, "global_step": 150090, "epoch": 3573} {"train_loss": -6.805500030517578, "global_step": 150091, "epoch": 3573} {"train_loss": -6.783098220825195, "global_step": 150092, "epoch": 3573} {"train_loss": -6.886804580688477, "global_step": 150093, "epoch": 3573} {"train_loss": -6.815986156463623, "global_step": 150094, "epoch": 3573} {"train_loss": -6.904654502868652, "global_step": 150095, "epoch": 3573} {"train_loss": -6.919090747833252, "global_step": 150096, "epoch": 3573} {"train_loss": -6.915618896484375, "global_step": 150097, "epoch": 3573} {"train_loss": -6.859767436981201, "global_step": 150098, "epoch": 3573} {"train_loss": -6.868624687194824, "global_step": 150099, "epoch": 3573} {"train_loss": -6.906075954437256, "global_step": 150100, "epoch": 3573} {"train_loss": -6.791922092437744, "global_step": 150101, "epoch": 3573} {"train_loss": -6.894591331481934, "global_step": 150102, "epoch": 3573} {"train_loss": -6.793037414550781, "global_step": 150103, "epoch": 3573} {"train_loss": -6.928309440612793, "global_step": 150104, "epoch": 3573} {"train_loss": -6.859745025634766, "global_step": 150105, "epoch": 3573} {"train_loss": -6.831859588623047, "global_step": 150106, "epoch": 3573} {"train_loss": -6.810230221067156, "global_step": 150107, "epoch": 3573, "val_loss": 78526.828125} {"train_loss": -6.896042823791504, "global_step": 150108, "epoch": 3574} {"train_loss": -6.83212947845459, "global_step": 150109, "epoch": 3574} {"train_loss": -6.978634834289551, "global_step": 150110, "epoch": 3574} {"train_loss": -6.887263298034668, "global_step": 150111, "epoch": 3574} {"train_loss": -6.7811408042907715, "global_step": 150112, "epoch": 3574} {"train_loss": -6.840654373168945, "global_step": 150113, "epoch": 3574} {"train_loss": -6.777360916137695, "global_step": 150114, "epoch": 3574} {"train_loss": -6.851597785949707, "global_step": 150115, "epoch": 3574} {"train_loss": -6.7251739501953125, "global_step": 150116, "epoch": 3574} {"train_loss": -6.892189025878906, "global_step": 150117, "epoch": 3574} {"train_loss": -6.739171504974365, "global_step": 150118, "epoch": 3574} {"train_loss": -6.813467025756836, "global_step": 150119, "epoch": 3574} {"train_loss": -6.906445503234863, "global_step": 150120, "epoch": 3574} {"train_loss": -6.854867935180664, "global_step": 150121, "epoch": 3574} {"train_loss": -6.857465744018555, "global_step": 150122, "epoch": 3574} {"train_loss": -6.816985130310059, "global_step": 150123, "epoch": 3574} {"train_loss": -6.7877349853515625, "global_step": 150124, "epoch": 3574} {"train_loss": -6.839923858642578, "global_step": 150125, "epoch": 3574} {"train_loss": -6.774055480957031, "global_step": 150126, "epoch": 3574} {"train_loss": -6.909759521484375, "global_step": 150127, "epoch": 3574} {"train_loss": -6.781558990478516, "global_step": 150128, "epoch": 3574} {"train_loss": -6.944843769073486, "global_step": 150129, "epoch": 3574} {"train_loss": -6.8418192863464355, "global_step": 150130, "epoch": 3574} {"train_loss": -6.8780975341796875, "global_step": 150131, "epoch": 3574} {"train_loss": -6.953424453735352, "global_step": 150132, "epoch": 3574} {"train_loss": -6.750258445739746, "global_step": 150133, "epoch": 3574} {"train_loss": -6.899879455566406, "global_step": 150134, "epoch": 3574} {"train_loss": -6.707662105560303, "global_step": 150135, "epoch": 3574} {"train_loss": -6.90983247756958, "global_step": 150136, "epoch": 3574} {"train_loss": -6.825665473937988, "global_step": 150137, "epoch": 3574} {"train_loss": -6.941425323486328, "global_step": 150138, "epoch": 3574} {"train_loss": -6.891407012939453, "global_step": 150139, "epoch": 3574} {"train_loss": -6.934741497039795, "global_step": 150140, "epoch": 3574} {"train_loss": -6.86182975769043, "global_step": 150141, "epoch": 3574} {"train_loss": -6.909823417663574, "global_step": 150142, "epoch": 3574} {"train_loss": -6.9050397872924805, "global_step": 150143, "epoch": 3574} {"train_loss": -6.910886764526367, "global_step": 150144, "epoch": 3574} {"train_loss": -7.020447731018066, "global_step": 150145, "epoch": 3574} {"train_loss": -6.806215286254883, "global_step": 150146, "epoch": 3574} {"train_loss": -6.841541767120361, "global_step": 150147, "epoch": 3574} {"train_loss": -6.7888689041137695, "global_step": 150148, "epoch": 3574} {"train_loss": -6.857707523164295, "global_step": 150149, "epoch": 3574, "val_loss": 79036.625} {"train_loss": -6.926821708679199, "global_step": 150150, "epoch": 3575} {"train_loss": -6.91234016418457, "global_step": 150151, "epoch": 3575} {"train_loss": -6.830509662628174, "global_step": 150152, "epoch": 3575} {"train_loss": -6.9494709968566895, "global_step": 150153, "epoch": 3575} {"train_loss": -6.91949462890625, "global_step": 150154, "epoch": 3575} {"train_loss": -7.030956268310547, "global_step": 150155, "epoch": 3575} {"train_loss": -6.847784996032715, "global_step": 150156, "epoch": 3575} {"train_loss": -6.896189212799072, "global_step": 150157, "epoch": 3575} {"train_loss": -6.773185729980469, "global_step": 150158, "epoch": 3575} {"train_loss": -6.906946182250977, "global_step": 150159, "epoch": 3575} {"train_loss": -6.785942077636719, "global_step": 150160, "epoch": 3575} {"train_loss": -6.802059173583984, "global_step": 150161, "epoch": 3575} {"train_loss": -6.821303367614746, "global_step": 150162, "epoch": 3575} {"train_loss": -6.714700698852539, "global_step": 150163, "epoch": 3575} {"train_loss": -6.8895978927612305, "global_step": 150164, "epoch": 3575} {"train_loss": -6.811522483825684, "global_step": 150165, "epoch": 3575} {"train_loss": -6.839026927947998, "global_step": 150166, "epoch": 3575} {"train_loss": -6.819762229919434, "global_step": 150167, "epoch": 3575} {"train_loss": -6.768232822418213, "global_step": 150168, "epoch": 3575} {"train_loss": -6.7379608154296875, "global_step": 150169, "epoch": 3575} {"train_loss": -6.872942924499512, "global_step": 150170, "epoch": 3575} {"train_loss": -6.866326332092285, "global_step": 150171, "epoch": 3575} {"train_loss": -6.901759147644043, "global_step": 150172, "epoch": 3575} {"train_loss": -6.924135208129883, "global_step": 150173, "epoch": 3575} {"train_loss": -6.856218338012695, "global_step": 150174, "epoch": 3575} {"train_loss": -6.870800971984863, "global_step": 150175, "epoch": 3575} {"train_loss": -6.888605117797852, "global_step": 150176, "epoch": 3575} {"train_loss": -6.863691329956055, "global_step": 150177, "epoch": 3575} {"train_loss": -6.936298847198486, "global_step": 150178, "epoch": 3575} {"train_loss": -6.842360019683838, "global_step": 150179, "epoch": 3575} {"train_loss": -6.90340518951416, "global_step": 150180, "epoch": 3575} {"train_loss": -6.867950916290283, "global_step": 150181, "epoch": 3575} {"train_loss": -6.789587497711182, "global_step": 150182, "epoch": 3575} {"train_loss": -6.943655490875244, "global_step": 150183, "epoch": 3575} {"train_loss": -6.864559173583984, "global_step": 150184, "epoch": 3575} {"train_loss": -6.735006332397461, "global_step": 150185, "epoch": 3575} {"train_loss": -6.953795433044434, "global_step": 150186, "epoch": 3575} {"train_loss": -6.864936351776123, "global_step": 150187, "epoch": 3575} {"train_loss": -6.801644802093506, "global_step": 150188, "epoch": 3575} {"train_loss": -6.947501182556152, "global_step": 150189, "epoch": 3575} {"train_loss": -7.025237083435059, "global_step": 150190, "epoch": 3575} {"train_loss": -6.8702795051393055, "global_step": 150191, "epoch": 3575, "val_loss": 78655.1484375} {"train_loss": -6.951663017272949, "global_step": 150192, "epoch": 3576} {"train_loss": -6.894277572631836, "global_step": 150193, "epoch": 3576} {"train_loss": -6.93442440032959, "global_step": 150194, "epoch": 3576} {"train_loss": -6.927552223205566, "global_step": 150195, "epoch": 3576} {"train_loss": -6.95919132232666, "global_step": 150196, "epoch": 3576} {"train_loss": -6.927244186401367, "global_step": 150197, "epoch": 3576} {"train_loss": -6.967484474182129, "global_step": 150198, "epoch": 3576} {"train_loss": -6.994409084320068, "global_step": 150199, "epoch": 3576} {"train_loss": -6.946006774902344, "global_step": 150200, "epoch": 3576} {"train_loss": -6.851451873779297, "global_step": 150201, "epoch": 3576} {"train_loss": -6.8606157302856445, "global_step": 150202, "epoch": 3576} {"train_loss": -6.901618003845215, "global_step": 150203, "epoch": 3576} {"train_loss": -6.91793155670166, "global_step": 150204, "epoch": 3576} {"train_loss": -6.833249092102051, "global_step": 150205, "epoch": 3576} {"train_loss": -6.969771385192871, "global_step": 150206, "epoch": 3576} {"train_loss": -6.815052032470703, "global_step": 150207, "epoch": 3576} {"train_loss": -6.826932430267334, "global_step": 150208, "epoch": 3576} {"train_loss": -6.849268436431885, "global_step": 150209, "epoch": 3576} {"train_loss": -6.8771796226501465, "global_step": 150210, "epoch": 3576} {"train_loss": -7.001565456390381, "global_step": 150211, "epoch": 3576} {"train_loss": -6.839521408081055, "global_step": 150212, "epoch": 3576} {"train_loss": -6.817812919616699, "global_step": 150213, "epoch": 3576} {"train_loss": -6.863895416259766, "global_step": 150214, "epoch": 3576} {"train_loss": -6.900582313537598, "global_step": 150215, "epoch": 3576} {"train_loss": -6.978431701660156, "global_step": 150216, "epoch": 3576} {"train_loss": -6.943880081176758, "global_step": 150217, "epoch": 3576} {"train_loss": -6.877899169921875, "global_step": 150218, "epoch": 3576} {"train_loss": -6.906428337097168, "global_step": 150219, "epoch": 3576} {"train_loss": -6.785536766052246, "global_step": 150220, "epoch": 3576} {"train_loss": -6.741158485412598, "global_step": 150221, "epoch": 3576} {"train_loss": -6.730920791625977, "global_step": 150222, "epoch": 3576} {"train_loss": -6.814055919647217, "global_step": 150223, "epoch": 3576} {"train_loss": -6.652680397033691, "global_step": 150224, "epoch": 3576} {"train_loss": -6.739131450653076, "global_step": 150225, "epoch": 3576} {"train_loss": -6.993861198425293, "global_step": 150226, "epoch": 3576} {"train_loss": -6.564067363739014, "global_step": 150227, "epoch": 3576} {"train_loss": -6.670543670654297, "global_step": 150228, "epoch": 3576} {"train_loss": -6.852145195007324, "global_step": 150229, "epoch": 3576} {"train_loss": -6.759228706359863, "global_step": 150230, "epoch": 3576} {"train_loss": -6.765356063842773, "global_step": 150231, "epoch": 3576} {"train_loss": -6.880346775054932, "global_step": 150232, "epoch": 3576} {"train_loss": -6.857674927938552, "global_step": 150233, "epoch": 3576, "val_loss": 78666.0234375} {"train_loss": -6.807351589202881, "global_step": 150234, "epoch": 3577} {"train_loss": -6.879988193511963, "global_step": 150235, "epoch": 3577} {"train_loss": -6.7897868156433105, "global_step": 150236, "epoch": 3577} {"train_loss": -6.833799362182617, "global_step": 150237, "epoch": 3577} {"train_loss": -6.784022331237793, "global_step": 150238, "epoch": 3577} {"train_loss": -6.914937973022461, "global_step": 150239, "epoch": 3577} {"train_loss": -6.77249813079834, "global_step": 150240, "epoch": 3577} {"train_loss": -6.749690055847168, "global_step": 150241, "epoch": 3577} {"train_loss": -6.7811994552612305, "global_step": 150242, "epoch": 3577} {"train_loss": -6.759960174560547, "global_step": 150243, "epoch": 3577} {"train_loss": -6.906452655792236, "global_step": 150244, "epoch": 3577} {"train_loss": -6.904430389404297, "global_step": 150245, "epoch": 3577} {"train_loss": -6.831188678741455, "global_step": 150246, "epoch": 3577} {"train_loss": -6.816655158996582, "global_step": 150247, "epoch": 3577} {"train_loss": -6.847446441650391, "global_step": 150248, "epoch": 3577} {"train_loss": -6.667356967926025, "global_step": 150249, "epoch": 3577} {"train_loss": -6.953621864318848, "global_step": 150250, "epoch": 3577} {"train_loss": -6.950913429260254, "global_step": 150251, "epoch": 3577} {"train_loss": -6.865684986114502, "global_step": 150252, "epoch": 3577} {"train_loss": -6.811702728271484, "global_step": 150253, "epoch": 3577} {"train_loss": -6.896462440490723, "global_step": 150254, "epoch": 3577} {"train_loss": -6.7863922119140625, "global_step": 150255, "epoch": 3577} {"train_loss": -6.949129581451416, "global_step": 150256, "epoch": 3577} {"train_loss": -6.893537521362305, "global_step": 150257, "epoch": 3577} {"train_loss": -6.916092872619629, "global_step": 150258, "epoch": 3577} {"train_loss": -6.841787338256836, "global_step": 150259, "epoch": 3577} {"train_loss": -6.8456711769104, "global_step": 150260, "epoch": 3577} {"train_loss": -6.886891841888428, "global_step": 150261, "epoch": 3577} {"train_loss": -6.817829132080078, "global_step": 150262, "epoch": 3577} {"train_loss": -6.873473167419434, "global_step": 150263, "epoch": 3577} {"train_loss": -6.844392776489258, "global_step": 150264, "epoch": 3577} {"train_loss": -6.961069583892822, "global_step": 150265, "epoch": 3577} {"train_loss": -6.913079738616943, "global_step": 150266, "epoch": 3577} {"train_loss": -6.823906898498535, "global_step": 150267, "epoch": 3577} {"train_loss": -6.921323299407959, "global_step": 150268, "epoch": 3577} {"train_loss": -7.061089515686035, "global_step": 150269, "epoch": 3577} {"train_loss": -6.852231979370117, "global_step": 150270, "epoch": 3577} {"train_loss": -7.017271041870117, "global_step": 150271, "epoch": 3577} {"train_loss": -6.840363502502441, "global_step": 150272, "epoch": 3577} {"train_loss": -6.851972579956055, "global_step": 150273, "epoch": 3577} {"train_loss": -6.682859420776367, "global_step": 150274, "epoch": 3577} {"train_loss": -6.854332821709769, "global_step": 150275, "epoch": 3577, "val_loss": 78577.2265625} {"train_loss": -6.777670860290527, "global_step": 150276, "epoch": 3578} {"train_loss": -6.834545135498047, "global_step": 150277, "epoch": 3578} {"train_loss": -6.874171257019043, "global_step": 150278, "epoch": 3578} {"train_loss": -6.874041557312012, "global_step": 150279, "epoch": 3578} {"train_loss": -6.815741539001465, "global_step": 150280, "epoch": 3578} {"train_loss": -6.825980186462402, "global_step": 150281, "epoch": 3578} {"train_loss": -6.842199325561523, "global_step": 150282, "epoch": 3578} {"train_loss": -6.8764142990112305, "global_step": 150283, "epoch": 3578} {"train_loss": -6.836838722229004, "global_step": 150284, "epoch": 3578} {"train_loss": -6.776277542114258, "global_step": 150285, "epoch": 3578} {"train_loss": -6.853874683380127, "global_step": 150286, "epoch": 3578} {"train_loss": -6.749342918395996, "global_step": 150287, "epoch": 3578} {"train_loss": -6.773044586181641, "global_step": 150288, "epoch": 3578} {"train_loss": -6.909024238586426, "global_step": 150289, "epoch": 3578} {"train_loss": -6.8128790855407715, "global_step": 150290, "epoch": 3578} {"train_loss": -6.9466657638549805, "global_step": 150291, "epoch": 3578} {"train_loss": -6.797717571258545, "global_step": 150292, "epoch": 3578} {"train_loss": -6.923550605773926, "global_step": 150293, "epoch": 3578} {"train_loss": -6.818282604217529, "global_step": 150294, "epoch": 3578} {"train_loss": -6.763419151306152, "global_step": 150295, "epoch": 3578} {"train_loss": -6.819877624511719, "global_step": 150296, "epoch": 3578} {"train_loss": -6.778339385986328, "global_step": 150297, "epoch": 3578} {"train_loss": -6.929187774658203, "global_step": 150298, "epoch": 3578} {"train_loss": -6.772219657897949, "global_step": 150299, "epoch": 3578} {"train_loss": -6.8167033195495605, "global_step": 150300, "epoch": 3578} {"train_loss": -6.847070217132568, "global_step": 150301, "epoch": 3578} {"train_loss": -6.83524227142334, "global_step": 150302, "epoch": 3578} {"train_loss": -7.011066436767578, "global_step": 150303, "epoch": 3578} {"train_loss": -6.7937493324279785, "global_step": 150304, "epoch": 3578} {"train_loss": -6.939239978790283, "global_step": 150305, "epoch": 3578} {"train_loss": -6.787845611572266, "global_step": 150306, "epoch": 3578} {"train_loss": -6.894670486450195, "global_step": 150307, "epoch": 3578} {"train_loss": -6.789809226989746, "global_step": 150308, "epoch": 3578} {"train_loss": -6.841787338256836, "global_step": 150309, "epoch": 3578} {"train_loss": -6.9781389236450195, "global_step": 150310, "epoch": 3578} {"train_loss": -6.8659281730651855, "global_step": 150311, "epoch": 3578} {"train_loss": -6.8598713874816895, "global_step": 150312, "epoch": 3578} {"train_loss": -6.983314514160156, "global_step": 150313, "epoch": 3578} {"train_loss": -6.801715850830078, "global_step": 150314, "epoch": 3578} {"train_loss": -6.895511627197266, "global_step": 150315, "epoch": 3578} {"train_loss": -6.761922359466553, "global_step": 150316, "epoch": 3578} {"train_loss": -6.846309832164219, "global_step": 150317, "epoch": 3578, "val_loss": 78652.921875} {"train_loss": -6.962563991546631, "global_step": 150318, "epoch": 3579} {"train_loss": -6.827872276306152, "global_step": 150319, "epoch": 3579} {"train_loss": -6.8236188888549805, "global_step": 150320, "epoch": 3579} {"train_loss": -6.867437362670898, "global_step": 150321, "epoch": 3579} {"train_loss": -6.912288665771484, "global_step": 150322, "epoch": 3579} {"train_loss": -6.849466323852539, "global_step": 150323, "epoch": 3579} {"train_loss": -6.811681747436523, "global_step": 150324, "epoch": 3579} {"train_loss": -6.881814002990723, "global_step": 150325, "epoch": 3579} {"train_loss": -6.928971767425537, "global_step": 150326, "epoch": 3579} {"train_loss": -6.947444915771484, "global_step": 150327, "epoch": 3579} {"train_loss": -6.94017219543457, "global_step": 150328, "epoch": 3579} {"train_loss": -6.8202643394470215, "global_step": 150329, "epoch": 3579} {"train_loss": -6.852177619934082, "global_step": 150330, "epoch": 3579} {"train_loss": -6.941491603851318, "global_step": 150331, "epoch": 3579} {"train_loss": -6.994485855102539, "global_step": 150332, "epoch": 3579} {"train_loss": -6.896501541137695, "global_step": 150333, "epoch": 3579} {"train_loss": -6.900442123413086, "global_step": 150334, "epoch": 3579} {"train_loss": -6.9181013107299805, "global_step": 150335, "epoch": 3579} {"train_loss": -6.844066619873047, "global_step": 150336, "epoch": 3579} {"train_loss": -6.806958198547363, "global_step": 150337, "epoch": 3579} {"train_loss": -6.872716903686523, "global_step": 150338, "epoch": 3579} {"train_loss": -6.828121185302734, "global_step": 150339, "epoch": 3579} {"train_loss": -6.87235689163208, "global_step": 150340, "epoch": 3579} {"train_loss": -6.833214282989502, "global_step": 150341, "epoch": 3579} {"train_loss": -6.814404487609863, "global_step": 150342, "epoch": 3579} {"train_loss": -6.835740089416504, "global_step": 150343, "epoch": 3579} {"train_loss": -6.761592388153076, "global_step": 150344, "epoch": 3579} {"train_loss": -6.833493232727051, "global_step": 150345, "epoch": 3579} {"train_loss": -6.7567620277404785, "global_step": 150346, "epoch": 3579} {"train_loss": -6.911587715148926, "global_step": 150347, "epoch": 3579} {"train_loss": -6.939184188842773, "global_step": 150348, "epoch": 3579} {"train_loss": -6.844171047210693, "global_step": 150349, "epoch": 3579} {"train_loss": -6.805323600769043, "global_step": 150350, "epoch": 3579} {"train_loss": -6.914274215698242, "global_step": 150351, "epoch": 3579} {"train_loss": -6.935389518737793, "global_step": 150352, "epoch": 3579} {"train_loss": -6.826852798461914, "global_step": 150353, "epoch": 3579} {"train_loss": -6.882422924041748, "global_step": 150354, "epoch": 3579} {"train_loss": -6.9312849044799805, "global_step": 150355, "epoch": 3579} {"train_loss": -6.833309173583984, "global_step": 150356, "epoch": 3579} {"train_loss": -6.950155258178711, "global_step": 150357, "epoch": 3579} {"train_loss": -6.839012145996094, "global_step": 150358, "epoch": 3579} {"train_loss": -6.870236283256894, "global_step": 150359, "epoch": 3579, "val_loss": 78830.3984375} {"train_loss": -6.9612531661987305, "global_step": 150360, "epoch": 3580} {"train_loss": -6.742515563964844, "global_step": 150361, "epoch": 3580} {"train_loss": -6.87440299987793, "global_step": 150362, "epoch": 3580} {"train_loss": -6.910885810852051, "global_step": 150363, "epoch": 3580} {"train_loss": -6.918872356414795, "global_step": 150364, "epoch": 3580} {"train_loss": -6.842951774597168, "global_step": 150365, "epoch": 3580} {"train_loss": -6.885258674621582, "global_step": 150366, "epoch": 3580} {"train_loss": -6.940620422363281, "global_step": 150367, "epoch": 3580} {"train_loss": -6.927748680114746, "global_step": 150368, "epoch": 3580} {"train_loss": -6.842226982116699, "global_step": 150369, "epoch": 3580} {"train_loss": -6.8899006843566895, "global_step": 150370, "epoch": 3580} {"train_loss": -6.9056501388549805, "global_step": 150371, "epoch": 3580} {"train_loss": -6.90562629699707, "global_step": 150372, "epoch": 3580} {"train_loss": -6.718605041503906, "global_step": 150373, "epoch": 3580} {"train_loss": -6.758164405822754, "global_step": 150374, "epoch": 3580} {"train_loss": -6.819499969482422, "global_step": 150375, "epoch": 3580} {"train_loss": -6.828929901123047, "global_step": 150376, "epoch": 3580} {"train_loss": -6.839486122131348, "global_step": 150377, "epoch": 3580} {"train_loss": -6.875837802886963, "global_step": 150378, "epoch": 3580} {"train_loss": -6.987696170806885, "global_step": 150379, "epoch": 3580} {"train_loss": -6.828514099121094, "global_step": 150380, "epoch": 3580} {"train_loss": -6.783336639404297, "global_step": 150381, "epoch": 3580} {"train_loss": -6.816528797149658, "global_step": 150382, "epoch": 3580} {"train_loss": -6.802373886108398, "global_step": 150383, "epoch": 3580} {"train_loss": -6.850058078765869, "global_step": 150384, "epoch": 3580} {"train_loss": -6.9130754470825195, "global_step": 150385, "epoch": 3580} {"train_loss": -6.864545822143555, "global_step": 150386, "epoch": 3580} {"train_loss": -6.856901168823242, "global_step": 150387, "epoch": 3580} {"train_loss": -6.841330051422119, "global_step": 150388, "epoch": 3580} {"train_loss": -6.808813095092773, "global_step": 150389, "epoch": 3580} {"train_loss": -6.853806972503662, "global_step": 150390, "epoch": 3580} {"train_loss": -6.933075904846191, "global_step": 150391, "epoch": 3580} {"train_loss": -6.848818302154541, "global_step": 150392, "epoch": 3580} {"train_loss": -6.96550178527832, "global_step": 150393, "epoch": 3580} {"train_loss": -6.93044376373291, "global_step": 150394, "epoch": 3580} {"train_loss": -6.874677658081055, "global_step": 150395, "epoch": 3580} {"train_loss": -6.9265289306640625, "global_step": 150396, "epoch": 3580} {"train_loss": -6.973709583282471, "global_step": 150397, "epoch": 3580} {"train_loss": -6.8233184814453125, "global_step": 150398, "epoch": 3580} {"train_loss": -6.8492536544799805, "global_step": 150399, "epoch": 3580} {"train_loss": -6.902604579925537, "global_step": 150400, "epoch": 3580} {"train_loss": -6.868721360252017, "global_step": 150401, "epoch": 3580, "val_loss": 78848.2421875} {"train_loss": -6.919155597686768, "global_step": 150402, "epoch": 3581} {"train_loss": -6.957574844360352, "global_step": 150403, "epoch": 3581} {"train_loss": -6.819022178649902, "global_step": 150404, "epoch": 3581} {"train_loss": -6.958474159240723, "global_step": 150405, "epoch": 3581} {"train_loss": -6.959933280944824, "global_step": 150406, "epoch": 3581} {"train_loss": -6.9364824295043945, "global_step": 150407, "epoch": 3581} {"train_loss": -6.816478729248047, "global_step": 150408, "epoch": 3581} {"train_loss": -6.944224834442139, "global_step": 150409, "epoch": 3581} {"train_loss": -6.959456920623779, "global_step": 150410, "epoch": 3581} {"train_loss": -6.84316349029541, "global_step": 150411, "epoch": 3581} {"train_loss": -6.845341682434082, "global_step": 150412, "epoch": 3581} {"train_loss": -6.902769565582275, "global_step": 150413, "epoch": 3581} {"train_loss": -6.854341506958008, "global_step": 150414, "epoch": 3581} {"train_loss": -6.929684162139893, "global_step": 150415, "epoch": 3581} {"train_loss": -6.728320598602295, "global_step": 150416, "epoch": 3581} {"train_loss": -6.894176006317139, "global_step": 150417, "epoch": 3581} {"train_loss": -6.81862735748291, "global_step": 150418, "epoch": 3581} {"train_loss": -6.890193939208984, "global_step": 150419, "epoch": 3581} {"train_loss": -6.848620414733887, "global_step": 150420, "epoch": 3581} {"train_loss": -6.8705573081970215, "global_step": 150421, "epoch": 3581} {"train_loss": -6.748039245605469, "global_step": 150422, "epoch": 3581} {"train_loss": -6.866849422454834, "global_step": 150423, "epoch": 3581} {"train_loss": -6.851422309875488, "global_step": 150424, "epoch": 3581} {"train_loss": -6.9009108543396, "global_step": 150425, "epoch": 3581} {"train_loss": -6.8840460777282715, "global_step": 150426, "epoch": 3581} {"train_loss": -6.909229755401611, "global_step": 150427, "epoch": 3581} {"train_loss": -6.898645877838135, "global_step": 150428, "epoch": 3581} {"train_loss": -6.958441734313965, "global_step": 150429, "epoch": 3581} {"train_loss": -6.800875663757324, "global_step": 150430, "epoch": 3581} {"train_loss": -6.896592617034912, "global_step": 150431, "epoch": 3581} {"train_loss": -6.950058937072754, "global_step": 150432, "epoch": 3581} {"train_loss": -6.799342632293701, "global_step": 150433, "epoch": 3581} {"train_loss": -6.942139148712158, "global_step": 150434, "epoch": 3581} {"train_loss": -6.806150436401367, "global_step": 150435, "epoch": 3581} {"train_loss": -6.834048271179199, "global_step": 150436, "epoch": 3581} {"train_loss": -6.879762649536133, "global_step": 150437, "epoch": 3581} {"train_loss": -6.80803108215332, "global_step": 150438, "epoch": 3581} {"train_loss": -6.895428657531738, "global_step": 150439, "epoch": 3581} {"train_loss": -6.936474800109863, "global_step": 150440, "epoch": 3581} {"train_loss": -6.891993522644043, "global_step": 150441, "epoch": 3581} {"train_loss": -6.851332187652588, "global_step": 150442, "epoch": 3581} {"train_loss": -6.8797943365006216, "global_step": 150443, "epoch": 3581, "val_loss": 78494.0390625} {"train_loss": -6.940888404846191, "global_step": 150444, "epoch": 3582} {"train_loss": -6.9117021560668945, "global_step": 150445, "epoch": 3582} {"train_loss": -6.966054439544678, "global_step": 150446, "epoch": 3582} {"train_loss": -6.8323163986206055, "global_step": 150447, "epoch": 3582} {"train_loss": -6.805743217468262, "global_step": 150448, "epoch": 3582} {"train_loss": -7.036478042602539, "global_step": 150449, "epoch": 3582} {"train_loss": -6.986188888549805, "global_step": 150450, "epoch": 3582} {"train_loss": -6.889056205749512, "global_step": 150451, "epoch": 3582} {"train_loss": -6.906249523162842, "global_step": 150452, "epoch": 3582} {"train_loss": -7.013772964477539, "global_step": 150453, "epoch": 3582} {"train_loss": -7.021084785461426, "global_step": 150454, "epoch": 3582} {"train_loss": -6.940561771392822, "global_step": 150455, "epoch": 3582} {"train_loss": -6.926822662353516, "global_step": 150456, "epoch": 3582} {"train_loss": -6.8433685302734375, "global_step": 150457, "epoch": 3582} {"train_loss": -6.8836774826049805, "global_step": 150458, "epoch": 3582} {"train_loss": -6.84635591506958, "global_step": 150459, "epoch": 3582} {"train_loss": -6.942111968994141, "global_step": 150460, "epoch": 3582} {"train_loss": -6.95869255065918, "global_step": 150461, "epoch": 3582} {"train_loss": -6.721728324890137, "global_step": 150462, "epoch": 3582} {"train_loss": -6.761706829071045, "global_step": 150463, "epoch": 3582} {"train_loss": -6.891998291015625, "global_step": 150464, "epoch": 3582} {"train_loss": -6.920897006988525, "global_step": 150465, "epoch": 3582} {"train_loss": -6.825279235839844, "global_step": 150466, "epoch": 3582} {"train_loss": -6.883276462554932, "global_step": 150467, "epoch": 3582} {"train_loss": -6.83079719543457, "global_step": 150468, "epoch": 3582} {"train_loss": -6.852298736572266, "global_step": 150469, "epoch": 3582} {"train_loss": -6.8763017654418945, "global_step": 150470, "epoch": 3582} {"train_loss": -6.795975685119629, "global_step": 150471, "epoch": 3582} {"train_loss": -6.990775108337402, "global_step": 150472, "epoch": 3582} {"train_loss": -6.951350212097168, "global_step": 150473, "epoch": 3582} {"train_loss": -6.874248504638672, "global_step": 150474, "epoch": 3582} {"train_loss": -6.957953453063965, "global_step": 150475, "epoch": 3582} {"train_loss": -6.910574913024902, "global_step": 150476, "epoch": 3582} {"train_loss": -6.8347578048706055, "global_step": 150477, "epoch": 3582} {"train_loss": -6.872541904449463, "global_step": 150478, "epoch": 3582} {"train_loss": -6.946529388427734, "global_step": 150479, "epoch": 3582} {"train_loss": -6.999444007873535, "global_step": 150480, "epoch": 3582} {"train_loss": -6.867216110229492, "global_step": 150481, "epoch": 3582} {"train_loss": -6.977723121643066, "global_step": 150482, "epoch": 3582} {"train_loss": -6.942640781402588, "global_step": 150483, "epoch": 3582} {"train_loss": -6.978457927703857, "global_step": 150484, "epoch": 3582} {"train_loss": -6.902784313474383, "global_step": 150485, "epoch": 3582, "val_loss": 78726.671875} {"train_loss": -6.995848655700684, "global_step": 150486, "epoch": 3583} {"train_loss": -6.891046524047852, "global_step": 150487, "epoch": 3583} {"train_loss": -7.037486553192139, "global_step": 150488, "epoch": 3583} {"train_loss": -6.873213291168213, "global_step": 150489, "epoch": 3583} {"train_loss": -6.916533470153809, "global_step": 150490, "epoch": 3583} {"train_loss": -6.95521879196167, "global_step": 150491, "epoch": 3583} {"train_loss": -6.925322532653809, "global_step": 150492, "epoch": 3583} {"train_loss": -6.928979873657227, "global_step": 150493, "epoch": 3583} {"train_loss": -6.940664291381836, "global_step": 150494, "epoch": 3583} {"train_loss": -6.840705394744873, "global_step": 150495, "epoch": 3583} {"train_loss": -6.867438793182373, "global_step": 150496, "epoch": 3583} {"train_loss": -6.934000492095947, "global_step": 150497, "epoch": 3583} {"train_loss": -6.942108154296875, "global_step": 150498, "epoch": 3583} {"train_loss": -6.899763107299805, "global_step": 150499, "epoch": 3583} {"train_loss": -6.864238262176514, "global_step": 150500, "epoch": 3583} {"train_loss": -6.9954962730407715, "global_step": 150501, "epoch": 3583} {"train_loss": -6.851504802703857, "global_step": 150502, "epoch": 3583} {"train_loss": -6.912138938903809, "global_step": 150503, "epoch": 3583} {"train_loss": -7.018503665924072, "global_step": 150504, "epoch": 3583} {"train_loss": -6.778476238250732, "global_step": 150505, "epoch": 3583} {"train_loss": -6.611830711364746, "global_step": 150506, "epoch": 3583} {"train_loss": -6.727424144744873, "global_step": 150507, "epoch": 3583} {"train_loss": -6.855713844299316, "global_step": 150508, "epoch": 3583} {"train_loss": -6.96455192565918, "global_step": 150509, "epoch": 3583} {"train_loss": -6.713564395904541, "global_step": 150510, "epoch": 3583} {"train_loss": -6.848810195922852, "global_step": 150511, "epoch": 3583} {"train_loss": -6.880575180053711, "global_step": 150512, "epoch": 3583} {"train_loss": -6.841186046600342, "global_step": 150513, "epoch": 3583} {"train_loss": -6.7728986740112305, "global_step": 150514, "epoch": 3583} {"train_loss": -6.9246602058410645, "global_step": 150515, "epoch": 3583} {"train_loss": -6.7932329177856445, "global_step": 150516, "epoch": 3583} {"train_loss": -6.980087757110596, "global_step": 150517, "epoch": 3583} {"train_loss": -6.854033946990967, "global_step": 150518, "epoch": 3583} {"train_loss": -6.855803489685059, "global_step": 150519, "epoch": 3583} {"train_loss": -6.8689775466918945, "global_step": 150520, "epoch": 3583} {"train_loss": -6.759500503540039, "global_step": 150521, "epoch": 3583} {"train_loss": -6.9290337562561035, "global_step": 150522, "epoch": 3583} {"train_loss": -6.8719940185546875, "global_step": 150523, "epoch": 3583} {"train_loss": -6.881796360015869, "global_step": 150524, "epoch": 3583} {"train_loss": -6.837119102478027, "global_step": 150525, "epoch": 3583} {"train_loss": -6.844220161437988, "global_step": 150526, "epoch": 3583} {"train_loss": -6.87657752491179, "global_step": 150527, "epoch": 3583, "val_loss": 78937.3125} {"train_loss": -6.937774658203125, "global_step": 150528, "epoch": 3584} {"train_loss": -6.857241630554199, "global_step": 150529, "epoch": 3584} {"train_loss": -6.844263076782227, "global_step": 150530, "epoch": 3584} {"train_loss": -6.894918918609619, "global_step": 150531, "epoch": 3584} {"train_loss": -6.981757164001465, "global_step": 150532, "epoch": 3584} {"train_loss": -6.832034111022949, "global_step": 150533, "epoch": 3584} {"train_loss": -6.918628692626953, "global_step": 150534, "epoch": 3584} {"train_loss": -6.947998046875, "global_step": 150535, "epoch": 3584} {"train_loss": -6.784559726715088, "global_step": 150536, "epoch": 3584} {"train_loss": -6.9844970703125, "global_step": 150537, "epoch": 3584} {"train_loss": -6.779426097869873, "global_step": 150538, "epoch": 3584} {"train_loss": -6.819991111755371, "global_step": 150539, "epoch": 3584} {"train_loss": -6.897553443908691, "global_step": 150540, "epoch": 3584} {"train_loss": -6.772791385650635, "global_step": 150541, "epoch": 3584} {"train_loss": -6.792518615722656, "global_step": 150542, "epoch": 3584} {"train_loss": -6.883383750915527, "global_step": 150543, "epoch": 3584} {"train_loss": -6.849602222442627, "global_step": 150544, "epoch": 3584} {"train_loss": -6.895830154418945, "global_step": 150545, "epoch": 3584} {"train_loss": -6.818702697753906, "global_step": 150546, "epoch": 3584} {"train_loss": -6.957093238830566, "global_step": 150547, "epoch": 3584} {"train_loss": -6.848294258117676, "global_step": 150548, "epoch": 3584} {"train_loss": -6.95572566986084, "global_step": 150549, "epoch": 3584} {"train_loss": -6.806663513183594, "global_step": 150550, "epoch": 3584} {"train_loss": -6.843768119812012, "global_step": 150551, "epoch": 3584} {"train_loss": -6.838037014007568, "global_step": 150552, "epoch": 3584} {"train_loss": -6.9411187171936035, "global_step": 150553, "epoch": 3584} {"train_loss": -6.783353328704834, "global_step": 150554, "epoch": 3584} {"train_loss": -6.992975234985352, "global_step": 150555, "epoch": 3584} {"train_loss": -6.886532783508301, "global_step": 150556, "epoch": 3584} {"train_loss": -6.740181922912598, "global_step": 150557, "epoch": 3584} {"train_loss": -6.866341590881348, "global_step": 150558, "epoch": 3584} {"train_loss": -6.7889299392700195, "global_step": 150559, "epoch": 3584} {"train_loss": -6.861534118652344, "global_step": 150560, "epoch": 3584} {"train_loss": -6.831071853637695, "global_step": 150561, "epoch": 3584} {"train_loss": -6.949350357055664, "global_step": 150562, "epoch": 3584} {"train_loss": -6.816096305847168, "global_step": 150563, "epoch": 3584} {"train_loss": -6.883602619171143, "global_step": 150564, "epoch": 3584} {"train_loss": -6.898787498474121, "global_step": 150565, "epoch": 3584} {"train_loss": -6.9234161376953125, "global_step": 150566, "epoch": 3584} {"train_loss": -6.943423271179199, "global_step": 150567, "epoch": 3584} {"train_loss": -6.86151123046875, "global_step": 150568, "epoch": 3584} {"train_loss": -6.872398455937703, "global_step": 150569, "epoch": 3584, "val_loss": 78354.015625} {"train_loss": -6.721715927124023, "global_step": 150570, "epoch": 3585} {"train_loss": -6.930685997009277, "global_step": 150571, "epoch": 3585} {"train_loss": -6.844099044799805, "global_step": 150572, "epoch": 3585} {"train_loss": -6.920607089996338, "global_step": 150573, "epoch": 3585} {"train_loss": -6.846323013305664, "global_step": 150574, "epoch": 3585} {"train_loss": -6.833780765533447, "global_step": 150575, "epoch": 3585} {"train_loss": -6.868247032165527, "global_step": 150576, "epoch": 3585} {"train_loss": -6.727909088134766, "global_step": 150577, "epoch": 3585} {"train_loss": -6.886471271514893, "global_step": 150578, "epoch": 3585} {"train_loss": -6.884661674499512, "global_step": 150579, "epoch": 3585} {"train_loss": -6.921054840087891, "global_step": 150580, "epoch": 3585} {"train_loss": -6.811817169189453, "global_step": 150581, "epoch": 3585} {"train_loss": -6.860184669494629, "global_step": 150582, "epoch": 3585} {"train_loss": -6.829164028167725, "global_step": 150583, "epoch": 3585} {"train_loss": -6.760453701019287, "global_step": 150584, "epoch": 3585} {"train_loss": -6.841742992401123, "global_step": 150585, "epoch": 3585} {"train_loss": -6.928534507751465, "global_step": 150586, "epoch": 3585} {"train_loss": -6.8682122230529785, "global_step": 150587, "epoch": 3585} {"train_loss": -6.829509258270264, "global_step": 150588, "epoch": 3585} {"train_loss": -6.82649040222168, "global_step": 150589, "epoch": 3585} {"train_loss": -6.849623680114746, "global_step": 150590, "epoch": 3585} {"train_loss": -6.861069202423096, "global_step": 150591, "epoch": 3585} {"train_loss": -6.76131534576416, "global_step": 150592, "epoch": 3585} {"train_loss": -6.725368499755859, "global_step": 150593, "epoch": 3585} {"train_loss": -6.929544925689697, "global_step": 150594, "epoch": 3585} {"train_loss": -6.69029426574707, "global_step": 150595, "epoch": 3585} {"train_loss": -6.812161445617676, "global_step": 150596, "epoch": 3585} {"train_loss": -6.8076372146606445, "global_step": 150597, "epoch": 3585} {"train_loss": -6.790424346923828, "global_step": 150598, "epoch": 3585} {"train_loss": -6.823379993438721, "global_step": 150599, "epoch": 3585} {"train_loss": -6.766963005065918, "global_step": 150600, "epoch": 3585} {"train_loss": -6.9104766845703125, "global_step": 150601, "epoch": 3585} {"train_loss": -6.86943244934082, "global_step": 150602, "epoch": 3585} {"train_loss": -6.843733787536621, "global_step": 150603, "epoch": 3585} {"train_loss": -6.933547019958496, "global_step": 150604, "epoch": 3585} {"train_loss": -6.918519020080566, "global_step": 150605, "epoch": 3585} {"train_loss": -6.876288414001465, "global_step": 150606, "epoch": 3585} {"train_loss": -6.843294620513916, "global_step": 150607, "epoch": 3585} {"train_loss": -6.842900276184082, "global_step": 150608, "epoch": 3585} {"train_loss": -6.942700386047363, "global_step": 150609, "epoch": 3585} {"train_loss": -6.7305908203125, "global_step": 150610, "epoch": 3585} {"train_loss": -6.84251518476577, "global_step": 150611, "epoch": 3585, "val_loss": 78747.59375} {"train_loss": -6.848895072937012, "global_step": 150612, "epoch": 3586} {"train_loss": -6.93203067779541, "global_step": 150613, "epoch": 3586} {"train_loss": -6.7937235832214355, "global_step": 150614, "epoch": 3586} {"train_loss": -6.8097758293151855, "global_step": 150615, "epoch": 3586} {"train_loss": -6.822972297668457, "global_step": 150616, "epoch": 3586} {"train_loss": -6.808175086975098, "global_step": 150617, "epoch": 3586} {"train_loss": -6.83512020111084, "global_step": 150618, "epoch": 3586} {"train_loss": -6.774465560913086, "global_step": 150619, "epoch": 3586} {"train_loss": -6.860203742980957, "global_step": 150620, "epoch": 3586} {"train_loss": -6.876618385314941, "global_step": 150621, "epoch": 3586} {"train_loss": -6.895842552185059, "global_step": 150622, "epoch": 3586} {"train_loss": -6.856149673461914, "global_step": 150623, "epoch": 3586} {"train_loss": -6.926405906677246, "global_step": 150624, "epoch": 3586} {"train_loss": -6.868022918701172, "global_step": 150625, "epoch": 3586} {"train_loss": -6.859267234802246, "global_step": 150626, "epoch": 3586} {"train_loss": -6.854059219360352, "global_step": 150627, "epoch": 3586} {"train_loss": -6.898224353790283, "global_step": 150628, "epoch": 3586} {"train_loss": -6.835171699523926, "global_step": 150629, "epoch": 3586} {"train_loss": -6.861573219299316, "global_step": 150630, "epoch": 3586} {"train_loss": -6.8293137550354, "global_step": 150631, "epoch": 3586} {"train_loss": -6.92816686630249, "global_step": 150632, "epoch": 3586} {"train_loss": -6.744529724121094, "global_step": 150633, "epoch": 3586} {"train_loss": -6.770907878875732, "global_step": 150634, "epoch": 3586} {"train_loss": -6.84263801574707, "global_step": 150635, "epoch": 3586} {"train_loss": -6.754687786102295, "global_step": 150636, "epoch": 3586} {"train_loss": -6.900216102600098, "global_step": 150637, "epoch": 3586} {"train_loss": -6.869932174682617, "global_step": 150638, "epoch": 3586} {"train_loss": -6.6632537841796875, "global_step": 150639, "epoch": 3586} {"train_loss": -6.747773170471191, "global_step": 150640, "epoch": 3586} {"train_loss": -6.812647819519043, "global_step": 150641, "epoch": 3586} {"train_loss": -6.911334991455078, "global_step": 150642, "epoch": 3586} {"train_loss": -6.79127311706543, "global_step": 150643, "epoch": 3586} {"train_loss": -6.834133148193359, "global_step": 150644, "epoch": 3586} {"train_loss": -6.923919677734375, "global_step": 150645, "epoch": 3586} {"train_loss": -6.720663547515869, "global_step": 150646, "epoch": 3586} {"train_loss": -6.778262138366699, "global_step": 150647, "epoch": 3586} {"train_loss": -6.638113975524902, "global_step": 150648, "epoch": 3586} {"train_loss": -6.796708106994629, "global_step": 150649, "epoch": 3586} {"train_loss": -6.656408309936523, "global_step": 150650, "epoch": 3586} {"train_loss": -6.627674102783203, "global_step": 150651, "epoch": 3586} {"train_loss": -6.807986736297607, "global_step": 150652, "epoch": 3586} {"train_loss": -6.816515218643915, "global_step": 150653, "epoch": 3586, "val_loss": 78733.5625} {"train_loss": -6.771697998046875, "global_step": 150654, "epoch": 3587} {"train_loss": -6.772292137145996, "global_step": 150655, "epoch": 3587} {"train_loss": -6.827652454376221, "global_step": 150656, "epoch": 3587} {"train_loss": -6.82951021194458, "global_step": 150657, "epoch": 3587} {"train_loss": -6.787766933441162, "global_step": 150658, "epoch": 3587} {"train_loss": -6.76767110824585, "global_step": 150659, "epoch": 3587} {"train_loss": -6.773007392883301, "global_step": 150660, "epoch": 3587} {"train_loss": -6.761115550994873, "global_step": 150661, "epoch": 3587} {"train_loss": -6.820011138916016, "global_step": 150662, "epoch": 3587} {"train_loss": -6.884049892425537, "global_step": 150663, "epoch": 3587} {"train_loss": -6.837377548217773, "global_step": 150664, "epoch": 3587} {"train_loss": -6.708982467651367, "global_step": 150665, "epoch": 3587} {"train_loss": -6.776355743408203, "global_step": 150666, "epoch": 3587} {"train_loss": -6.897593975067139, "global_step": 150667, "epoch": 3587} {"train_loss": -6.806145668029785, "global_step": 150668, "epoch": 3587} {"train_loss": -6.755204200744629, "global_step": 150669, "epoch": 3587} {"train_loss": -6.898250579833984, "global_step": 150670, "epoch": 3587} {"train_loss": -6.897122383117676, "global_step": 150671, "epoch": 3587} {"train_loss": -6.871410369873047, "global_step": 150672, "epoch": 3587} {"train_loss": -6.940119743347168, "global_step": 150673, "epoch": 3587} {"train_loss": -6.852147102355957, "global_step": 150674, "epoch": 3587} {"train_loss": -6.952331066131592, "global_step": 150675, "epoch": 3587} {"train_loss": -6.875522136688232, "global_step": 150676, "epoch": 3587} {"train_loss": -6.802562713623047, "global_step": 150677, "epoch": 3587} {"train_loss": -6.827193737030029, "global_step": 150678, "epoch": 3587} {"train_loss": -6.919671058654785, "global_step": 150679, "epoch": 3587} {"train_loss": -6.915440559387207, "global_step": 150680, "epoch": 3587} {"train_loss": -6.895911693572998, "global_step": 150681, "epoch": 3587} {"train_loss": -6.769120216369629, "global_step": 150682, "epoch": 3587} {"train_loss": -6.918049335479736, "global_step": 150683, "epoch": 3587} {"train_loss": -6.845421314239502, "global_step": 150684, "epoch": 3587} {"train_loss": -6.815067291259766, "global_step": 150685, "epoch": 3587} {"train_loss": -6.947482585906982, "global_step": 150686, "epoch": 3587} {"train_loss": -6.877092361450195, "global_step": 150687, "epoch": 3587} {"train_loss": -6.898096084594727, "global_step": 150688, "epoch": 3587} {"train_loss": -7.026634216308594, "global_step": 150689, "epoch": 3587} {"train_loss": -6.9890618324279785, "global_step": 150690, "epoch": 3587} {"train_loss": -6.856269836425781, "global_step": 150691, "epoch": 3587} {"train_loss": -6.752885341644287, "global_step": 150692, "epoch": 3587} {"train_loss": -6.765406131744385, "global_step": 150693, "epoch": 3587} {"train_loss": -6.898370742797852, "global_step": 150694, "epoch": 3587} {"train_loss": -6.846911543891544, "global_step": 150695, "epoch": 3587, "val_loss": 78791.0390625} {"train_loss": -6.917248249053955, "global_step": 150696, "epoch": 3588} {"train_loss": -7.030235290527344, "global_step": 150697, "epoch": 3588} {"train_loss": -6.917590618133545, "global_step": 150698, "epoch": 3588} {"train_loss": -6.908347129821777, "global_step": 150699, "epoch": 3588} {"train_loss": -6.85484504699707, "global_step": 150700, "epoch": 3588} {"train_loss": -6.89629602432251, "global_step": 150701, "epoch": 3588} {"train_loss": -6.959664821624756, "global_step": 150702, "epoch": 3588} {"train_loss": -6.7992963790893555, "global_step": 150703, "epoch": 3588} {"train_loss": -6.947062969207764, "global_step": 150704, "epoch": 3588} {"train_loss": -6.798793792724609, "global_step": 150705, "epoch": 3588} {"train_loss": -6.844773292541504, "global_step": 150706, "epoch": 3588} {"train_loss": -6.92254638671875, "global_step": 150707, "epoch": 3588} {"train_loss": -6.95921516418457, "global_step": 150708, "epoch": 3588} {"train_loss": -6.914921760559082, "global_step": 150709, "epoch": 3588} {"train_loss": -6.808869361877441, "global_step": 150710, "epoch": 3588} {"train_loss": -6.953563213348389, "global_step": 150711, "epoch": 3588} {"train_loss": -6.95020866394043, "global_step": 150712, "epoch": 3588} {"train_loss": -6.815676212310791, "global_step": 150713, "epoch": 3588} {"train_loss": -6.888281345367432, "global_step": 150714, "epoch": 3588} {"train_loss": -7.010248184204102, "global_step": 150715, "epoch": 3588} {"train_loss": -6.793634414672852, "global_step": 150716, "epoch": 3588} {"train_loss": -6.854254722595215, "global_step": 150717, "epoch": 3588} {"train_loss": -6.966864585876465, "global_step": 150718, "epoch": 3588} {"train_loss": -6.928329944610596, "global_step": 150719, "epoch": 3588} {"train_loss": -6.822601318359375, "global_step": 150720, "epoch": 3588} {"train_loss": -6.80238151550293, "global_step": 150721, "epoch": 3588} {"train_loss": -6.7929911613464355, "global_step": 150722, "epoch": 3588} {"train_loss": -6.883225440979004, "global_step": 150723, "epoch": 3588} {"train_loss": -6.878704071044922, "global_step": 150724, "epoch": 3588} {"train_loss": -6.894273281097412, "global_step": 150725, "epoch": 3588} {"train_loss": -6.880444526672363, "global_step": 150726, "epoch": 3588} {"train_loss": -6.865437984466553, "global_step": 150727, "epoch": 3588} {"train_loss": -6.97053337097168, "global_step": 150728, "epoch": 3588} {"train_loss": -6.921092987060547, "global_step": 150729, "epoch": 3588} {"train_loss": -6.931018829345703, "global_step": 150730, "epoch": 3588} {"train_loss": -6.930541515350342, "global_step": 150731, "epoch": 3588} {"train_loss": -7.024507522583008, "global_step": 150732, "epoch": 3588} {"train_loss": -6.857083797454834, "global_step": 150733, "epoch": 3588} {"train_loss": -6.801570892333984, "global_step": 150734, "epoch": 3588} {"train_loss": -6.853925704956055, "global_step": 150735, "epoch": 3588} {"train_loss": -6.855010986328125, "global_step": 150736, "epoch": 3588} {"train_loss": -6.891013860702515, "global_step": 150737, "epoch": 3588, "val_loss": 78793.4375} {"train_loss": -6.92716646194458, "global_step": 150738, "epoch": 3589} {"train_loss": -7.04477596282959, "global_step": 150739, "epoch": 3589} {"train_loss": -6.925656318664551, "global_step": 150740, "epoch": 3589} {"train_loss": -6.870919704437256, "global_step": 150741, "epoch": 3589} {"train_loss": -6.880114555358887, "global_step": 150742, "epoch": 3589} {"train_loss": -7.000117301940918, "global_step": 150743, "epoch": 3589} {"train_loss": -7.029754161834717, "global_step": 150744, "epoch": 3589} {"train_loss": -6.918788909912109, "global_step": 150745, "epoch": 3589} {"train_loss": -6.880646705627441, "global_step": 150746, "epoch": 3589} {"train_loss": -6.952787399291992, "global_step": 150747, "epoch": 3589} {"train_loss": -6.919258117675781, "global_step": 150748, "epoch": 3589} {"train_loss": -6.976861000061035, "global_step": 150749, "epoch": 3589} {"train_loss": -6.887092590332031, "global_step": 150750, "epoch": 3589} {"train_loss": -6.90360164642334, "global_step": 150751, "epoch": 3589} {"train_loss": -7.073474407196045, "global_step": 150752, "epoch": 3589} {"train_loss": -6.833772659301758, "global_step": 150753, "epoch": 3589} {"train_loss": -6.851358413696289, "global_step": 150754, "epoch": 3589} {"train_loss": -6.889992713928223, "global_step": 150755, "epoch": 3589} {"train_loss": -6.884530067443848, "global_step": 150756, "epoch": 3589} {"train_loss": -6.815657615661621, "global_step": 150757, "epoch": 3589} {"train_loss": -6.826379776000977, "global_step": 150758, "epoch": 3589} {"train_loss": -6.873041152954102, "global_step": 150759, "epoch": 3589} {"train_loss": -6.8968119621276855, "global_step": 150760, "epoch": 3589} {"train_loss": -6.726894378662109, "global_step": 150761, "epoch": 3589} {"train_loss": -6.933993816375732, "global_step": 150762, "epoch": 3589} {"train_loss": -6.944298267364502, "global_step": 150763, "epoch": 3589} {"train_loss": -6.8584442138671875, "global_step": 150764, "epoch": 3589} {"train_loss": -6.900373458862305, "global_step": 150765, "epoch": 3589} {"train_loss": -6.970335483551025, "global_step": 150766, "epoch": 3589} {"train_loss": -6.899936199188232, "global_step": 150767, "epoch": 3589} {"train_loss": -6.816745281219482, "global_step": 150768, "epoch": 3589} {"train_loss": -6.823281764984131, "global_step": 150769, "epoch": 3589} {"train_loss": -6.925201416015625, "global_step": 150770, "epoch": 3589} {"train_loss": -6.8090314865112305, "global_step": 150771, "epoch": 3589} {"train_loss": -6.85383415222168, "global_step": 150772, "epoch": 3589} {"train_loss": -6.8470354080200195, "global_step": 150773, "epoch": 3589} {"train_loss": -6.898342132568359, "global_step": 150774, "epoch": 3589} {"train_loss": -6.92487096786499, "global_step": 150775, "epoch": 3589} {"train_loss": -6.999441623687744, "global_step": 150776, "epoch": 3589} {"train_loss": -6.849992752075195, "global_step": 150777, "epoch": 3589} {"train_loss": -6.8978424072265625, "global_step": 150778, "epoch": 3589} {"train_loss": -6.899006412142799, "global_step": 150779, "epoch": 3589, "val_loss": 78853.453125} {"train_loss": -6.906355857849121, "global_step": 150780, "epoch": 3590} {"train_loss": -6.893318176269531, "global_step": 150781, "epoch": 3590} {"train_loss": -6.845000267028809, "global_step": 150782, "epoch": 3590} {"train_loss": -6.860612869262695, "global_step": 150783, "epoch": 3590} {"train_loss": -6.856173038482666, "global_step": 150784, "epoch": 3590} {"train_loss": -6.989442825317383, "global_step": 150785, "epoch": 3590} {"train_loss": -6.9562554359436035, "global_step": 150786, "epoch": 3590} {"train_loss": -6.756165027618408, "global_step": 150787, "epoch": 3590} {"train_loss": -6.95909309387207, "global_step": 150788, "epoch": 3590} {"train_loss": -6.953122138977051, "global_step": 150789, "epoch": 3590} {"train_loss": -6.916337490081787, "global_step": 150790, "epoch": 3590} {"train_loss": -6.881137371063232, "global_step": 150791, "epoch": 3590} {"train_loss": -6.925268650054932, "global_step": 150792, "epoch": 3590} {"train_loss": -6.881499767303467, "global_step": 150793, "epoch": 3590} {"train_loss": -6.841065883636475, "global_step": 150794, "epoch": 3590} {"train_loss": -6.956629753112793, "global_step": 150795, "epoch": 3590} {"train_loss": -6.922137260437012, "global_step": 150796, "epoch": 3590} {"train_loss": -6.911484718322754, "global_step": 150797, "epoch": 3590} {"train_loss": -6.962459564208984, "global_step": 150798, "epoch": 3590} {"train_loss": -6.97114372253418, "global_step": 150799, "epoch": 3590} {"train_loss": -6.909918785095215, "global_step": 150800, "epoch": 3590} {"train_loss": -6.916913986206055, "global_step": 150801, "epoch": 3590} {"train_loss": -6.961038112640381, "global_step": 150802, "epoch": 3590} {"train_loss": -6.864724636077881, "global_step": 150803, "epoch": 3590} {"train_loss": -7.003763198852539, "global_step": 150804, "epoch": 3590} {"train_loss": -6.854275226593018, "global_step": 150805, "epoch": 3590} {"train_loss": -6.809322357177734, "global_step": 150806, "epoch": 3590} {"train_loss": -6.906411170959473, "global_step": 150807, "epoch": 3590} {"train_loss": -6.823469161987305, "global_step": 150808, "epoch": 3590} {"train_loss": -6.784383773803711, "global_step": 150809, "epoch": 3590} {"train_loss": -6.728785991668701, "global_step": 150810, "epoch": 3590} {"train_loss": -6.830911159515381, "global_step": 150811, "epoch": 3590} {"train_loss": -6.883953094482422, "global_step": 150812, "epoch": 3590} {"train_loss": -6.681576728820801, "global_step": 150813, "epoch": 3590} {"train_loss": -6.800234794616699, "global_step": 150814, "epoch": 3590} {"train_loss": -6.801426887512207, "global_step": 150815, "epoch": 3590} {"train_loss": -6.7844085693359375, "global_step": 150816, "epoch": 3590} {"train_loss": -6.905358791351318, "global_step": 150817, "epoch": 3590} {"train_loss": -6.950342655181885, "global_step": 150818, "epoch": 3590} {"train_loss": -6.830480575561523, "global_step": 150819, "epoch": 3590} {"train_loss": -6.755438327789307, "global_step": 150820, "epoch": 3590} {"train_loss": -6.877291463670277, "global_step": 150821, "epoch": 3590, "val_loss": 78626.0390625} {"train_loss": -6.900574684143066, "global_step": 150822, "epoch": 3591} {"train_loss": -6.797739028930664, "global_step": 150823, "epoch": 3591} {"train_loss": -6.882453918457031, "global_step": 150824, "epoch": 3591} {"train_loss": -6.871244430541992, "global_step": 150825, "epoch": 3591} {"train_loss": -6.94711971282959, "global_step": 150826, "epoch": 3591} {"train_loss": -6.830561637878418, "global_step": 150827, "epoch": 3591} {"train_loss": -7.004631042480469, "global_step": 150828, "epoch": 3591} {"train_loss": -6.860335350036621, "global_step": 150829, "epoch": 3591} {"train_loss": -6.920094013214111, "global_step": 150830, "epoch": 3591} {"train_loss": -7.016674041748047, "global_step": 150831, "epoch": 3591} {"train_loss": -6.769888877868652, "global_step": 150832, "epoch": 3591} {"train_loss": -6.970989227294922, "global_step": 150833, "epoch": 3591} {"train_loss": -6.921696662902832, "global_step": 150834, "epoch": 3591} {"train_loss": -7.043649673461914, "global_step": 150835, "epoch": 3591} {"train_loss": -6.852158546447754, "global_step": 150836, "epoch": 3591} {"train_loss": -6.865830421447754, "global_step": 150837, "epoch": 3591} {"train_loss": -7.078127861022949, "global_step": 150838, "epoch": 3591} {"train_loss": -6.883934497833252, "global_step": 150839, "epoch": 3591} {"train_loss": -6.964760780334473, "global_step": 150840, "epoch": 3591} {"train_loss": -6.97005558013916, "global_step": 150841, "epoch": 3591} {"train_loss": -6.985134124755859, "global_step": 150842, "epoch": 3591} {"train_loss": -6.857846736907959, "global_step": 150843, "epoch": 3591} {"train_loss": -6.932724475860596, "global_step": 150844, "epoch": 3591} {"train_loss": -6.864074230194092, "global_step": 150845, "epoch": 3591} {"train_loss": -6.984589576721191, "global_step": 150846, "epoch": 3591} {"train_loss": -6.8295159339904785, "global_step": 150847, "epoch": 3591} {"train_loss": -6.85130500793457, "global_step": 150848, "epoch": 3591} {"train_loss": -6.869256973266602, "global_step": 150849, "epoch": 3591} {"train_loss": -6.86489200592041, "global_step": 150850, "epoch": 3591} {"train_loss": -6.801329135894775, "global_step": 150851, "epoch": 3591} {"train_loss": -6.8707780838012695, "global_step": 150852, "epoch": 3591} {"train_loss": -6.760804176330566, "global_step": 150853, "epoch": 3591} {"train_loss": -6.83704948425293, "global_step": 150854, "epoch": 3591} {"train_loss": -6.95725154876709, "global_step": 150855, "epoch": 3591} {"train_loss": -6.840323448181152, "global_step": 150856, "epoch": 3591} {"train_loss": -6.965003967285156, "global_step": 150857, "epoch": 3591} {"train_loss": -6.934210300445557, "global_step": 150858, "epoch": 3591} {"train_loss": -6.869619846343994, "global_step": 150859, "epoch": 3591} {"train_loss": -6.874855041503906, "global_step": 150860, "epoch": 3591} {"train_loss": -6.944056034088135, "global_step": 150861, "epoch": 3591} {"train_loss": -6.880249500274658, "global_step": 150862, "epoch": 3591} {"train_loss": -6.8997840994880315, "global_step": 150863, "epoch": 3591, "val_loss": 78667.0859375} {"train_loss": -6.844895362854004, "global_step": 150864, "epoch": 3592} {"train_loss": -6.929638862609863, "global_step": 150865, "epoch": 3592} {"train_loss": -6.834402084350586, "global_step": 150866, "epoch": 3592} {"train_loss": -6.824151039123535, "global_step": 150867, "epoch": 3592} {"train_loss": -6.869362831115723, "global_step": 150868, "epoch": 3592} {"train_loss": -6.911309719085693, "global_step": 150869, "epoch": 3592} {"train_loss": -6.860339164733887, "global_step": 150870, "epoch": 3592} {"train_loss": -6.9163384437561035, "global_step": 150871, "epoch": 3592} {"train_loss": -6.765880107879639, "global_step": 150872, "epoch": 3592} {"train_loss": -6.753287315368652, "global_step": 150873, "epoch": 3592} {"train_loss": -6.845152854919434, "global_step": 150874, "epoch": 3592} {"train_loss": -6.669894218444824, "global_step": 150875, "epoch": 3592} {"train_loss": -6.730876922607422, "global_step": 150876, "epoch": 3592} {"train_loss": -6.904440402984619, "global_step": 150877, "epoch": 3592} {"train_loss": -6.798892498016357, "global_step": 150878, "epoch": 3592} {"train_loss": -6.794562339782715, "global_step": 150879, "epoch": 3592} {"train_loss": -6.8479108810424805, "global_step": 150880, "epoch": 3592} {"train_loss": -6.803292274475098, "global_step": 150881, "epoch": 3592} {"train_loss": -6.781095504760742, "global_step": 150882, "epoch": 3592} {"train_loss": -6.882601737976074, "global_step": 150883, "epoch": 3592} {"train_loss": -6.877833843231201, "global_step": 150884, "epoch": 3592} {"train_loss": -6.7726030349731445, "global_step": 150885, "epoch": 3592} {"train_loss": -6.794003963470459, "global_step": 150886, "epoch": 3592} {"train_loss": -6.81453800201416, "global_step": 150887, "epoch": 3592} {"train_loss": -6.848363876342773, "global_step": 150888, "epoch": 3592} {"train_loss": -6.795407295227051, "global_step": 150889, "epoch": 3592} {"train_loss": -6.7031965255737305, "global_step": 150890, "epoch": 3592} {"train_loss": -6.821839332580566, "global_step": 150891, "epoch": 3592} {"train_loss": -6.830496788024902, "global_step": 150892, "epoch": 3592} {"train_loss": -6.916371822357178, "global_step": 150893, "epoch": 3592} {"train_loss": -6.849979400634766, "global_step": 150894, "epoch": 3592} {"train_loss": -6.809908866882324, "global_step": 150895, "epoch": 3592} {"train_loss": -6.719867706298828, "global_step": 150896, "epoch": 3592} {"train_loss": -6.826506614685059, "global_step": 150897, "epoch": 3592} {"train_loss": -6.906277656555176, "global_step": 150898, "epoch": 3592} {"train_loss": -6.86160945892334, "global_step": 150899, "epoch": 3592} {"train_loss": -6.857007026672363, "global_step": 150900, "epoch": 3592} {"train_loss": -6.8031816482543945, "global_step": 150901, "epoch": 3592} {"train_loss": -6.69879150390625, "global_step": 150902, "epoch": 3592} {"train_loss": -6.742763042449951, "global_step": 150903, "epoch": 3592} {"train_loss": -6.8917555809021, "global_step": 150904, "epoch": 3592} {"train_loss": -6.822397515887306, "global_step": 150905, "epoch": 3592, "val_loss": 78475.875} {"train_loss": -6.760436058044434, "global_step": 150906, "epoch": 3593} {"train_loss": -6.904664993286133, "global_step": 150907, "epoch": 3593} {"train_loss": -6.87264347076416, "global_step": 150908, "epoch": 3593} {"train_loss": -6.7259931564331055, "global_step": 150909, "epoch": 3593} {"train_loss": -6.825002193450928, "global_step": 150910, "epoch": 3593} {"train_loss": -6.590867519378662, "global_step": 150911, "epoch": 3593} {"train_loss": -6.768093109130859, "global_step": 150912, "epoch": 3593} {"train_loss": -6.854516983032227, "global_step": 150913, "epoch": 3593} {"train_loss": -6.813342094421387, "global_step": 150914, "epoch": 3593} {"train_loss": -6.77915096282959, "global_step": 150915, "epoch": 3593} {"train_loss": -6.862323760986328, "global_step": 150916, "epoch": 3593} {"train_loss": -6.840431213378906, "global_step": 150917, "epoch": 3593} {"train_loss": -6.928976058959961, "global_step": 150918, "epoch": 3593} {"train_loss": -6.908051490783691, "global_step": 150919, "epoch": 3593} {"train_loss": -6.834585189819336, "global_step": 150920, "epoch": 3593} {"train_loss": -6.891674995422363, "global_step": 150921, "epoch": 3593} {"train_loss": -6.850040435791016, "global_step": 150922, "epoch": 3593} {"train_loss": -6.900883674621582, "global_step": 150923, "epoch": 3593} {"train_loss": -6.745501518249512, "global_step": 150924, "epoch": 3593} {"train_loss": -6.792677879333496, "global_step": 150925, "epoch": 3593} {"train_loss": -6.964201927185059, "global_step": 150926, "epoch": 3593} {"train_loss": -6.943981170654297, "global_step": 150927, "epoch": 3593} {"train_loss": -6.934399604797363, "global_step": 150928, "epoch": 3593} {"train_loss": -6.850692272186279, "global_step": 150929, "epoch": 3593} {"train_loss": -6.918415546417236, "global_step": 150930, "epoch": 3593} {"train_loss": -6.878252983093262, "global_step": 150931, "epoch": 3593} {"train_loss": -6.798521995544434, "global_step": 150932, "epoch": 3593} {"train_loss": -6.8380045890808105, "global_step": 150933, "epoch": 3593} {"train_loss": -6.784401893615723, "global_step": 150934, "epoch": 3593} {"train_loss": -6.914520263671875, "global_step": 150935, "epoch": 3593} {"train_loss": -6.92112922668457, "global_step": 150936, "epoch": 3593} {"train_loss": -6.819585800170898, "global_step": 150937, "epoch": 3593} {"train_loss": -6.716269016265869, "global_step": 150938, "epoch": 3593} {"train_loss": -6.88811731338501, "global_step": 150939, "epoch": 3593} {"train_loss": -6.789319038391113, "global_step": 150940, "epoch": 3593} {"train_loss": -6.663902282714844, "global_step": 150941, "epoch": 3593} {"train_loss": -6.846619606018066, "global_step": 150942, "epoch": 3593} {"train_loss": -6.849532604217529, "global_step": 150943, "epoch": 3593} {"train_loss": -6.918254375457764, "global_step": 150944, "epoch": 3593} {"train_loss": -6.758622169494629, "global_step": 150945, "epoch": 3593} {"train_loss": -6.850558757781982, "global_step": 150946, "epoch": 3593} {"train_loss": -6.835751022611346, "global_step": 150947, "epoch": 3593, "val_loss": 78815.5546875} {"train_loss": -6.889277458190918, "global_step": 150948, "epoch": 3594} {"train_loss": -6.79820442199707, "global_step": 150949, "epoch": 3594} {"train_loss": -6.9106035232543945, "global_step": 150950, "epoch": 3594} {"train_loss": -6.861739158630371, "global_step": 150951, "epoch": 3594} {"train_loss": -6.892899513244629, "global_step": 150952, "epoch": 3594} {"train_loss": -6.866635322570801, "global_step": 150953, "epoch": 3594} {"train_loss": -6.887086868286133, "global_step": 150954, "epoch": 3594} {"train_loss": -6.799537658691406, "global_step": 150955, "epoch": 3594} {"train_loss": -6.8434343338012695, "global_step": 150956, "epoch": 3594} {"train_loss": -6.84967041015625, "global_step": 150957, "epoch": 3594} {"train_loss": -6.776692867279053, "global_step": 150958, "epoch": 3594} {"train_loss": -6.783476829528809, "global_step": 150959, "epoch": 3594} {"train_loss": -6.807811737060547, "global_step": 150960, "epoch": 3594} {"train_loss": -6.90390157699585, "global_step": 150961, "epoch": 3594} {"train_loss": -6.741175174713135, "global_step": 150962, "epoch": 3594} {"train_loss": -6.775913238525391, "global_step": 150963, "epoch": 3594} {"train_loss": -6.833148002624512, "global_step": 150964, "epoch": 3594} {"train_loss": -6.70713996887207, "global_step": 150965, "epoch": 3594} {"train_loss": -6.892419815063477, "global_step": 150966, "epoch": 3594} {"train_loss": -6.660514831542969, "global_step": 150967, "epoch": 3594} {"train_loss": -6.74178409576416, "global_step": 150968, "epoch": 3594} {"train_loss": -6.908600807189941, "global_step": 150969, "epoch": 3594} {"train_loss": -6.689190864562988, "global_step": 150970, "epoch": 3594} {"train_loss": -6.922035217285156, "global_step": 150971, "epoch": 3594} {"train_loss": -6.76104211807251, "global_step": 150972, "epoch": 3594} {"train_loss": -6.8546295166015625, "global_step": 150973, "epoch": 3594} {"train_loss": -6.7741241455078125, "global_step": 150974, "epoch": 3594} {"train_loss": -6.791601657867432, "global_step": 150975, "epoch": 3594} {"train_loss": -6.656301498413086, "global_step": 150976, "epoch": 3594} {"train_loss": -6.739545822143555, "global_step": 150977, "epoch": 3594} {"train_loss": -6.877693176269531, "global_step": 150978, "epoch": 3594} {"train_loss": -6.842865943908691, "global_step": 150979, "epoch": 3594} {"train_loss": -6.6529221534729, "global_step": 150980, "epoch": 3594} {"train_loss": -6.7905473709106445, "global_step": 150981, "epoch": 3594} {"train_loss": -6.693507194519043, "global_step": 150982, "epoch": 3594} {"train_loss": -6.813193321228027, "global_step": 150983, "epoch": 3594} {"train_loss": -6.711278438568115, "global_step": 150984, "epoch": 3594} {"train_loss": -6.710326194763184, "global_step": 150985, "epoch": 3594} {"train_loss": -6.750807762145996, "global_step": 150986, "epoch": 3594} {"train_loss": -6.8367719650268555, "global_step": 150987, "epoch": 3594} {"train_loss": -6.837371826171875, "global_step": 150988, "epoch": 3594} {"train_loss": -6.803731452851069, "global_step": 150989, "epoch": 3594, "val_loss": 78745.0625} {"train_loss": -6.887424468994141, "global_step": 150990, "epoch": 3595} {"train_loss": -6.726987361907959, "global_step": 150991, "epoch": 3595} {"train_loss": -6.877872467041016, "global_step": 150992, "epoch": 3595} {"train_loss": -6.799300193786621, "global_step": 150993, "epoch": 3595} {"train_loss": -6.704206943511963, "global_step": 150994, "epoch": 3595} {"train_loss": -6.867304801940918, "global_step": 150995, "epoch": 3595} {"train_loss": -6.870237350463867, "global_step": 150996, "epoch": 3595} {"train_loss": -6.842361927032471, "global_step": 150997, "epoch": 3595} {"train_loss": -6.812984466552734, "global_step": 150998, "epoch": 3595} {"train_loss": -6.789648532867432, "global_step": 150999, "epoch": 3595} {"train_loss": -6.9067606925964355, "global_step": 151000, "epoch": 3595} {"train_loss": -6.818978309631348, "global_step": 151001, "epoch": 3595} {"train_loss": -6.931209564208984, "global_step": 151002, "epoch": 3595} {"train_loss": -6.952911853790283, "global_step": 151003, "epoch": 3595} {"train_loss": -6.7981648445129395, "global_step": 151004, "epoch": 3595} {"train_loss": -6.908994197845459, "global_step": 151005, "epoch": 3595} {"train_loss": -6.650949954986572, "global_step": 151006, "epoch": 3595} {"train_loss": -6.888993263244629, "global_step": 151007, "epoch": 3595} {"train_loss": -6.95780611038208, "global_step": 151008, "epoch": 3595} {"train_loss": -6.779400825500488, "global_step": 151009, "epoch": 3595} {"train_loss": -6.8938517570495605, "global_step": 151010, "epoch": 3595} {"train_loss": -6.986324787139893, "global_step": 151011, "epoch": 3595} {"train_loss": -6.898241996765137, "global_step": 151012, "epoch": 3595} {"train_loss": -6.943412780761719, "global_step": 151013, "epoch": 3595} {"train_loss": -6.978750228881836, "global_step": 151014, "epoch": 3595} {"train_loss": -6.884171009063721, "global_step": 151015, "epoch": 3595} {"train_loss": -6.770691871643066, "global_step": 151016, "epoch": 3595} {"train_loss": -6.95258903503418, "global_step": 151017, "epoch": 3595} {"train_loss": -6.88551139831543, "global_step": 151018, "epoch": 3595} {"train_loss": -7.012237548828125, "global_step": 151019, "epoch": 3595} {"train_loss": -6.920920372009277, "global_step": 151020, "epoch": 3595} {"train_loss": -6.933911323547363, "global_step": 151021, "epoch": 3595} {"train_loss": -6.912784576416016, "global_step": 151022, "epoch": 3595} {"train_loss": -6.914035797119141, "global_step": 151023, "epoch": 3595} {"train_loss": -7.0046892166137695, "global_step": 151024, "epoch": 3595} {"train_loss": -6.889244556427002, "global_step": 151025, "epoch": 3595} {"train_loss": -6.801487922668457, "global_step": 151026, "epoch": 3595} {"train_loss": -6.892284393310547, "global_step": 151027, "epoch": 3595} {"train_loss": -6.915816307067871, "global_step": 151028, "epoch": 3595} {"train_loss": -6.791265487670898, "global_step": 151029, "epoch": 3595} {"train_loss": -6.911954879760742, "global_step": 151030, "epoch": 3595} {"train_loss": -6.871101765405564, "global_step": 151031, "epoch": 3595, "val_loss": 78570.1875} {"train_loss": -6.736056327819824, "global_step": 151032, "epoch": 3596} {"train_loss": -6.977723121643066, "global_step": 151033, "epoch": 3596} {"train_loss": -6.832070350646973, "global_step": 151034, "epoch": 3596} {"train_loss": -6.863804817199707, "global_step": 151035, "epoch": 3596} {"train_loss": -6.914062976837158, "global_step": 151036, "epoch": 3596} {"train_loss": -6.915020942687988, "global_step": 151037, "epoch": 3596} {"train_loss": -6.924365520477295, "global_step": 151038, "epoch": 3596} {"train_loss": -6.833623886108398, "global_step": 151039, "epoch": 3596} {"train_loss": -6.783644199371338, "global_step": 151040, "epoch": 3596} {"train_loss": -6.803275108337402, "global_step": 151041, "epoch": 3596} {"train_loss": -6.824549674987793, "global_step": 151042, "epoch": 3596} {"train_loss": -6.942419052124023, "global_step": 151043, "epoch": 3596} {"train_loss": -6.810177326202393, "global_step": 151044, "epoch": 3596} {"train_loss": -6.882142066955566, "global_step": 151045, "epoch": 3596} {"train_loss": -6.8551483154296875, "global_step": 151046, "epoch": 3596} {"train_loss": -6.922560691833496, "global_step": 151047, "epoch": 3596} {"train_loss": -6.853899955749512, "global_step": 151048, "epoch": 3596} {"train_loss": -6.89090633392334, "global_step": 151049, "epoch": 3596} {"train_loss": -6.787219524383545, "global_step": 151050, "epoch": 3596} {"train_loss": -6.745194435119629, "global_step": 151051, "epoch": 3596} {"train_loss": -6.70394229888916, "global_step": 151052, "epoch": 3596} {"train_loss": -6.882072448730469, "global_step": 151053, "epoch": 3596} {"train_loss": -6.805775165557861, "global_step": 151054, "epoch": 3596} {"train_loss": -6.843954563140869, "global_step": 151055, "epoch": 3596} {"train_loss": -6.917657852172852, "global_step": 151056, "epoch": 3596} {"train_loss": -6.8355207443237305, "global_step": 151057, "epoch": 3596} {"train_loss": -6.921968460083008, "global_step": 151058, "epoch": 3596} {"train_loss": -6.792277812957764, "global_step": 151059, "epoch": 3596} {"train_loss": -6.800348281860352, "global_step": 151060, "epoch": 3596} {"train_loss": -6.909177780151367, "global_step": 151061, "epoch": 3596} {"train_loss": -6.834280490875244, "global_step": 151062, "epoch": 3596} {"train_loss": -6.791094779968262, "global_step": 151063, "epoch": 3596} {"train_loss": -6.943163871765137, "global_step": 151064, "epoch": 3596} {"train_loss": -6.861193656921387, "global_step": 151065, "epoch": 3596} {"train_loss": -6.907461643218994, "global_step": 151066, "epoch": 3596} {"train_loss": -6.926138877868652, "global_step": 151067, "epoch": 3596} {"train_loss": -6.85902214050293, "global_step": 151068, "epoch": 3596} {"train_loss": -6.938431262969971, "global_step": 151069, "epoch": 3596} {"train_loss": -6.842522621154785, "global_step": 151070, "epoch": 3596} {"train_loss": -6.868407726287842, "global_step": 151071, "epoch": 3596} {"train_loss": -6.955450057983398, "global_step": 151072, "epoch": 3596} {"train_loss": -6.859066202527001, "global_step": 151073, "epoch": 3596, "val_loss": 78777.0859375} {"train_loss": -6.827426910400391, "global_step": 151074, "epoch": 3597} {"train_loss": -6.844516754150391, "global_step": 151075, "epoch": 3597} {"train_loss": -6.843510627746582, "global_step": 151076, "epoch": 3597} {"train_loss": -6.829923629760742, "global_step": 151077, "epoch": 3597} {"train_loss": -7.133641719818115, "global_step": 151078, "epoch": 3597} {"train_loss": -7.012990474700928, "global_step": 151079, "epoch": 3597} {"train_loss": -6.728318214416504, "global_step": 151080, "epoch": 3597} {"train_loss": -6.841787815093994, "global_step": 151081, "epoch": 3597} {"train_loss": -6.911250114440918, "global_step": 151082, "epoch": 3597} {"train_loss": -6.739768981933594, "global_step": 151083, "epoch": 3597} {"train_loss": -6.807037830352783, "global_step": 151084, "epoch": 3597} {"train_loss": -6.921054840087891, "global_step": 151085, "epoch": 3597} {"train_loss": -6.825037002563477, "global_step": 151086, "epoch": 3597} {"train_loss": -6.826358795166016, "global_step": 151087, "epoch": 3597} {"train_loss": -6.907554626464844, "global_step": 151088, "epoch": 3597} {"train_loss": -6.875809192657471, "global_step": 151089, "epoch": 3597} {"train_loss": -6.869770050048828, "global_step": 151090, "epoch": 3597} {"train_loss": -6.909921646118164, "global_step": 151091, "epoch": 3597} {"train_loss": -6.8223557472229, "global_step": 151092, "epoch": 3597} {"train_loss": -6.839533805847168, "global_step": 151093, "epoch": 3597} {"train_loss": -6.995737075805664, "global_step": 151094, "epoch": 3597} {"train_loss": -6.810173034667969, "global_step": 151095, "epoch": 3597} {"train_loss": -6.9909467697143555, "global_step": 151096, "epoch": 3597} {"train_loss": -6.668251037597656, "global_step": 151097, "epoch": 3597} {"train_loss": -6.832470417022705, "global_step": 151098, "epoch": 3597} {"train_loss": -6.924481391906738, "global_step": 151099, "epoch": 3597} {"train_loss": -6.7077860832214355, "global_step": 151100, "epoch": 3597} {"train_loss": -6.795446872711182, "global_step": 151101, "epoch": 3597} {"train_loss": -6.828102111816406, "global_step": 151102, "epoch": 3597} {"train_loss": -6.824375152587891, "global_step": 151103, "epoch": 3597} {"train_loss": -6.887691974639893, "global_step": 151104, "epoch": 3597} {"train_loss": -6.821107864379883, "global_step": 151105, "epoch": 3597} {"train_loss": -6.856110095977783, "global_step": 151106, "epoch": 3597} {"train_loss": -6.873538970947266, "global_step": 151107, "epoch": 3597} {"train_loss": -6.888497352600098, "global_step": 151108, "epoch": 3597} {"train_loss": -6.786031723022461, "global_step": 151109, "epoch": 3597} {"train_loss": -6.904942512512207, "global_step": 151110, "epoch": 3597} {"train_loss": -6.985323905944824, "global_step": 151111, "epoch": 3597} {"train_loss": -6.870642185211182, "global_step": 151112, "epoch": 3597} {"train_loss": -6.893932342529297, "global_step": 151113, "epoch": 3597} {"train_loss": -6.891523361206055, "global_step": 151114, "epoch": 3597} {"train_loss": -6.8597465356191, "global_step": 151115, "epoch": 3597, "val_loss": 78887.9140625} {"train_loss": -6.887368679046631, "global_step": 151116, "epoch": 3598} {"train_loss": -6.841410160064697, "global_step": 151117, "epoch": 3598} {"train_loss": -6.7878522872924805, "global_step": 151118, "epoch": 3598} {"train_loss": -6.908796310424805, "global_step": 151119, "epoch": 3598} {"train_loss": -6.78037166595459, "global_step": 151120, "epoch": 3598} {"train_loss": -6.856454849243164, "global_step": 151121, "epoch": 3598} {"train_loss": -6.831147193908691, "global_step": 151122, "epoch": 3598} {"train_loss": -6.789546966552734, "global_step": 151123, "epoch": 3598} {"train_loss": -6.815457344055176, "global_step": 151124, "epoch": 3598} {"train_loss": -6.918914794921875, "global_step": 151125, "epoch": 3598} {"train_loss": -6.873877048492432, "global_step": 151126, "epoch": 3598} {"train_loss": -6.770061492919922, "global_step": 151127, "epoch": 3598} {"train_loss": -6.827668190002441, "global_step": 151128, "epoch": 3598} {"train_loss": -6.942662239074707, "global_step": 151129, "epoch": 3598} {"train_loss": -6.896409511566162, "global_step": 151130, "epoch": 3598} {"train_loss": -6.910636901855469, "global_step": 151131, "epoch": 3598} {"train_loss": -6.97620153427124, "global_step": 151132, "epoch": 3598} {"train_loss": -6.8582940101623535, "global_step": 151133, "epoch": 3598} {"train_loss": -6.846288681030273, "global_step": 151134, "epoch": 3598} {"train_loss": -6.829346656799316, "global_step": 151135, "epoch": 3598} {"train_loss": -6.925034523010254, "global_step": 151136, "epoch": 3598} {"train_loss": -6.871156215667725, "global_step": 151137, "epoch": 3598} {"train_loss": -6.930854797363281, "global_step": 151138, "epoch": 3598} {"train_loss": -6.961069107055664, "global_step": 151139, "epoch": 3598} {"train_loss": -6.753750801086426, "global_step": 151140, "epoch": 3598} {"train_loss": -6.929950714111328, "global_step": 151141, "epoch": 3598} {"train_loss": -6.869495391845703, "global_step": 151142, "epoch": 3598} {"train_loss": -6.921962738037109, "global_step": 151143, "epoch": 3598} {"train_loss": -6.844310760498047, "global_step": 151144, "epoch": 3598} {"train_loss": -6.9406256675720215, "global_step": 151145, "epoch": 3598} {"train_loss": -6.761171340942383, "global_step": 151146, "epoch": 3598} {"train_loss": -6.919354438781738, "global_step": 151147, "epoch": 3598} {"train_loss": -6.663557052612305, "global_step": 151148, "epoch": 3598} {"train_loss": -6.6908955574035645, "global_step": 151149, "epoch": 3598} {"train_loss": -6.864765167236328, "global_step": 151150, "epoch": 3598} {"train_loss": -6.917972564697266, "global_step": 151151, "epoch": 3598} {"train_loss": -6.799126148223877, "global_step": 151152, "epoch": 3598} {"train_loss": -6.733645439147949, "global_step": 151153, "epoch": 3598} {"train_loss": -6.813576698303223, "global_step": 151154, "epoch": 3598} {"train_loss": -6.891082763671875, "global_step": 151155, "epoch": 3598} {"train_loss": -6.863880634307861, "global_step": 151156, "epoch": 3598} {"train_loss": -6.850248768216088, "global_step": 151157, "epoch": 3598, "val_loss": 78664.7109375} {"train_loss": -6.932936191558838, "global_step": 151158, "epoch": 3599} {"train_loss": -6.805910110473633, "global_step": 151159, "epoch": 3599} {"train_loss": -6.850057125091553, "global_step": 151160, "epoch": 3599} {"train_loss": -6.798641204833984, "global_step": 151161, "epoch": 3599} {"train_loss": -6.852941513061523, "global_step": 151162, "epoch": 3599} {"train_loss": -6.802329063415527, "global_step": 151163, "epoch": 3599} {"train_loss": -6.840607643127441, "global_step": 151164, "epoch": 3599} {"train_loss": -6.838411808013916, "global_step": 151165, "epoch": 3599} {"train_loss": -6.974754333496094, "global_step": 151166, "epoch": 3599} {"train_loss": -6.955212593078613, "global_step": 151167, "epoch": 3599} {"train_loss": -6.949619293212891, "global_step": 151168, "epoch": 3599} {"train_loss": -6.861247539520264, "global_step": 151169, "epoch": 3599} {"train_loss": -6.851576805114746, "global_step": 151170, "epoch": 3599} {"train_loss": -6.935431957244873, "global_step": 151171, "epoch": 3599} {"train_loss": -6.931029796600342, "global_step": 151172, "epoch": 3599} {"train_loss": -7.02448844909668, "global_step": 151173, "epoch": 3599} {"train_loss": -6.828453063964844, "global_step": 151174, "epoch": 3599} {"train_loss": -6.864241600036621, "global_step": 151175, "epoch": 3599} {"train_loss": -6.94807243347168, "global_step": 151176, "epoch": 3599} {"train_loss": -6.834296226501465, "global_step": 151177, "epoch": 3599} {"train_loss": -6.922901153564453, "global_step": 151178, "epoch": 3599} {"train_loss": -6.916346549987793, "global_step": 151179, "epoch": 3599} {"train_loss": -6.959181785583496, "global_step": 151180, "epoch": 3599} {"train_loss": -6.778119087219238, "global_step": 151181, "epoch": 3599} {"train_loss": -6.902804374694824, "global_step": 151182, "epoch": 3599} {"train_loss": -7.025485992431641, "global_step": 151183, "epoch": 3599} {"train_loss": -6.787677764892578, "global_step": 151184, "epoch": 3599} {"train_loss": -6.892452239990234, "global_step": 151185, "epoch": 3599} {"train_loss": -6.860226154327393, "global_step": 151186, "epoch": 3599} {"train_loss": -6.959564208984375, "global_step": 151187, "epoch": 3599} {"train_loss": -6.884259223937988, "global_step": 151188, "epoch": 3599} {"train_loss": -6.941850662231445, "global_step": 151189, "epoch": 3599} {"train_loss": -6.813870429992676, "global_step": 151190, "epoch": 3599} {"train_loss": -6.855571746826172, "global_step": 151191, "epoch": 3599} {"train_loss": -6.81243896484375, "global_step": 151192, "epoch": 3599} {"train_loss": -6.955326080322266, "global_step": 151193, "epoch": 3599} {"train_loss": -6.801526069641113, "global_step": 151194, "epoch": 3599} {"train_loss": -6.822848796844482, "global_step": 151195, "epoch": 3599} {"train_loss": -6.884975433349609, "global_step": 151196, "epoch": 3599} {"train_loss": -6.750953674316406, "global_step": 151197, "epoch": 3599} {"train_loss": -6.889062404632568, "global_step": 151198, "epoch": 3599} {"train_loss": -6.879269395555768, "global_step": 151199, "epoch": 3599, "val_loss": 78799.8515625} {"train_loss": -6.8982648849487305, "global_step": 151200, "epoch": 3600} {"train_loss": -6.815036296844482, "global_step": 151201, "epoch": 3600} {"train_loss": -6.870047092437744, "global_step": 151202, "epoch": 3600} {"train_loss": -6.835367202758789, "global_step": 151203, "epoch": 3600} {"train_loss": -6.891753196716309, "global_step": 151204, "epoch": 3600} {"train_loss": -6.919960975646973, "global_step": 151205, "epoch": 3600} {"train_loss": -6.888998985290527, "global_step": 151206, "epoch": 3600} {"train_loss": -6.869561672210693, "global_step": 151207, "epoch": 3600} {"train_loss": -6.842120170593262, "global_step": 151208, "epoch": 3600} {"train_loss": -6.840109825134277, "global_step": 151209, "epoch": 3600} {"train_loss": -6.718408584594727, "global_step": 151210, "epoch": 3600} {"train_loss": -6.757373332977295, "global_step": 151211, "epoch": 3600} {"train_loss": -6.821233749389648, "global_step": 151212, "epoch": 3600} {"train_loss": -6.7592573165893555, "global_step": 151213, "epoch": 3600} {"train_loss": -6.888708114624023, "global_step": 151214, "epoch": 3600} {"train_loss": -6.836713790893555, "global_step": 151215, "epoch": 3600} {"train_loss": -6.957769393920898, "global_step": 151216, "epoch": 3600} {"train_loss": -6.759941101074219, "global_step": 151217, "epoch": 3600} {"train_loss": -6.957912445068359, "global_step": 151218, "epoch": 3600} {"train_loss": -6.850966453552246, "global_step": 151219, "epoch": 3600} {"train_loss": -6.8950958251953125, "global_step": 151220, "epoch": 3600} {"train_loss": -6.879339218139648, "global_step": 151221, "epoch": 3600} {"train_loss": -6.8403401374816895, "global_step": 151222, "epoch": 3600} {"train_loss": -6.900964736938477, "global_step": 151223, "epoch": 3600} {"train_loss": -6.906371116638184, "global_step": 151224, "epoch": 3600} {"train_loss": -6.821815013885498, "global_step": 151225, "epoch": 3600} {"train_loss": -6.834755897521973, "global_step": 151226, "epoch": 3600} {"train_loss": -6.8050432205200195, "global_step": 151227, "epoch": 3600} {"train_loss": -6.7200727462768555, "global_step": 151228, "epoch": 3600} {"train_loss": -6.770403861999512, "global_step": 151229, "epoch": 3600} {"train_loss": -6.794398307800293, "global_step": 151230, "epoch": 3600} {"train_loss": -6.831132411956787, "global_step": 151231, "epoch": 3600} {"train_loss": -6.752280235290527, "global_step": 151232, "epoch": 3600} {"train_loss": -6.913186073303223, "global_step": 151233, "epoch": 3600} {"train_loss": -6.793307304382324, "global_step": 151234, "epoch": 3600} {"train_loss": -6.824211120605469, "global_step": 151235, "epoch": 3600} {"train_loss": -6.75585412979126, "global_step": 151236, "epoch": 3600} {"train_loss": -6.746964454650879, "global_step": 151237, "epoch": 3600} {"train_loss": -6.862337112426758, "global_step": 151238, "epoch": 3600} {"train_loss": -6.702610015869141, "global_step": 151239, "epoch": 3600} {"train_loss": -6.748387336730957, "global_step": 151240, "epoch": 3600} {"train_loss": -6.829016821725028, "global_step": 151241, "epoch": 3600, "train/sim_max_reward_0": 0.8715772146840582, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.5587287605524341, "train/sim_max_reward_3": 0.1344281208043714, "train/sim_max_reward_4": 0.9745485140218424, "train/sim_max_reward_5": 0.5791553663289083, "test/sim_max_reward_4500000": 0.9678762397528282, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9600554087171179, "test/sim_max_reward_4500003": 0.5031277786194065, "test/sim_max_reward_4500004": 0.14992410760208896, "test/sim_max_reward_4500005": 0.9434903088453179, "test/sim_max_reward_4500006": 0.9591463900462219, "test/sim_max_reward_4500007": 0.9918279577878086, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 0.05353387953145978, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9686701655694475, "test/sim_max_reward_4500012": 0.8209159070996582, "test/sim_max_reward_4500013": 0.004337725040095588, "test/sim_max_reward_4500014": 0.9989631716183262, "test/sim_max_reward_4500015": 0.8850668608951103, "test/sim_max_reward_4500016": 0.01746389330523892, "test/sim_max_reward_4500017": 0.14259306382311623, "test/sim_max_reward_4500018": 0.8673853280495304, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8222274918517399, "test/sim_max_reward_4500022": 0.9926185924058378, "test/sim_max_reward_4500023": 0.9413882231042828, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.7689726653632744, "test/sim_max_reward_4500026": 0.874093417827245, "test/sim_max_reward_4500027": 0.9117854454496964, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.07253341663098875, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9298533088687665, "test/sim_max_reward_4500034": 0.8798270566133164, "test/sim_max_reward_4500035": 0.8138628313086197, "test/sim_max_reward_4500036": 0.9944771392038816, "test/sim_max_reward_4500037": 0.8186294480435998, "test/sim_max_reward_4500038": 0.3658158513448205, "test/sim_max_reward_4500039": 0.8139683555072316, "test/sim_max_reward_4500040": 0.9127060802011873, "test/sim_max_reward_4500041": 0.9084030389439177, "test/sim_max_reward_4500042": 0.031129619197738764, "test/sim_max_reward_4500043": 0.25085443829210763, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.7575450026084876, "test/sim_max_reward_4500046": 0.20256570637868454, "test/sim_max_reward_4500047": 0.8214030981452801, "test/sim_max_reward_4500048": 0.9466419769732626, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6864063293986025, "test/mean_score": 0.5864561397920331, "val_loss": 78622.7890625} {"train_loss": -6.852543354034424, "global_step": 151242, "epoch": 3601} {"train_loss": -6.848405838012695, "global_step": 151243, "epoch": 3601} {"train_loss": -6.723918914794922, "global_step": 151244, "epoch": 3601} {"train_loss": -6.819381237030029, "global_step": 151245, "epoch": 3601} {"train_loss": -6.749787330627441, "global_step": 151246, "epoch": 3601} {"train_loss": -6.8552327156066895, "global_step": 151247, "epoch": 3601} {"train_loss": -6.9359893798828125, "global_step": 151248, "epoch": 3601} {"train_loss": -6.688526153564453, "global_step": 151249, "epoch": 3601} {"train_loss": -6.885077476501465, "global_step": 151250, "epoch": 3601} {"train_loss": -6.784688949584961, "global_step": 151251, "epoch": 3601} {"train_loss": -6.915416240692139, "global_step": 151252, "epoch": 3601} {"train_loss": -6.850893974304199, "global_step": 151253, "epoch": 3601} {"train_loss": -6.847291946411133, "global_step": 151254, "epoch": 3601} {"train_loss": -6.843810081481934, "global_step": 151255, "epoch": 3601} {"train_loss": -6.754386901855469, "global_step": 151256, "epoch": 3601} {"train_loss": -6.69502067565918, "global_step": 151257, "epoch": 3601} {"train_loss": -6.953046798706055, "global_step": 151258, "epoch": 3601} {"train_loss": -6.803561687469482, "global_step": 151259, "epoch": 3601} {"train_loss": -6.676664352416992, "global_step": 151260, "epoch": 3601} {"train_loss": -6.801525115966797, "global_step": 151261, "epoch": 3601} {"train_loss": -6.852731227874756, "global_step": 151262, "epoch": 3601} {"train_loss": -6.852441787719727, "global_step": 151263, "epoch": 3601} {"train_loss": -6.893747329711914, "global_step": 151264, "epoch": 3601} {"train_loss": -6.73544979095459, "global_step": 151265, "epoch": 3601} {"train_loss": -6.82324743270874, "global_step": 151266, "epoch": 3601} {"train_loss": -6.7472429275512695, "global_step": 151267, "epoch": 3601} {"train_loss": -6.800841331481934, "global_step": 151268, "epoch": 3601} {"train_loss": -6.7156901359558105, "global_step": 151269, "epoch": 3601} {"train_loss": -6.902799606323242, "global_step": 151270, "epoch": 3601} {"train_loss": -6.787538528442383, "global_step": 151271, "epoch": 3601} {"train_loss": -6.805986404418945, "global_step": 151272, "epoch": 3601} {"train_loss": -6.730966567993164, "global_step": 151273, "epoch": 3601} {"train_loss": -6.797320365905762, "global_step": 151274, "epoch": 3601} {"train_loss": -6.693019866943359, "global_step": 151275, "epoch": 3601} {"train_loss": -6.657896995544434, "global_step": 151276, "epoch": 3601} {"train_loss": -6.73518705368042, "global_step": 151277, "epoch": 3601} {"train_loss": -6.824713706970215, "global_step": 151278, "epoch": 3601} {"train_loss": -6.638008117675781, "global_step": 151279, "epoch": 3601} {"train_loss": -6.796382904052734, "global_step": 151280, "epoch": 3601} {"train_loss": -6.6298418045043945, "global_step": 151281, "epoch": 3601} {"train_loss": -6.899026870727539, "global_step": 151282, "epoch": 3601} {"train_loss": -6.793699537004743, "global_step": 151283, "epoch": 3601, "val_loss": 78810.65625} {"train_loss": -6.774126052856445, "global_step": 151284, "epoch": 3602} {"train_loss": -6.845643043518066, "global_step": 151285, "epoch": 3602} {"train_loss": -6.706142425537109, "global_step": 151286, "epoch": 3602} {"train_loss": -6.846349716186523, "global_step": 151287, "epoch": 3602} {"train_loss": -6.839262962341309, "global_step": 151288, "epoch": 3602} {"train_loss": -6.768091201782227, "global_step": 151289, "epoch": 3602} {"train_loss": -6.911231994628906, "global_step": 151290, "epoch": 3602} {"train_loss": -6.834270000457764, "global_step": 151291, "epoch": 3602} {"train_loss": -6.820181846618652, "global_step": 151292, "epoch": 3602} {"train_loss": -6.8324360847473145, "global_step": 151293, "epoch": 3602} {"train_loss": -6.944979667663574, "global_step": 151294, "epoch": 3602} {"train_loss": -6.853860855102539, "global_step": 151295, "epoch": 3602} {"train_loss": -6.89422607421875, "global_step": 151296, "epoch": 3602} {"train_loss": -6.868067741394043, "global_step": 151297, "epoch": 3602} {"train_loss": -6.853332042694092, "global_step": 151298, "epoch": 3602} {"train_loss": -6.928122520446777, "global_step": 151299, "epoch": 3602} {"train_loss": -6.942678451538086, "global_step": 151300, "epoch": 3602} {"train_loss": -6.866706848144531, "global_step": 151301, "epoch": 3602} {"train_loss": -6.926063537597656, "global_step": 151302, "epoch": 3602} {"train_loss": -6.808501720428467, "global_step": 151303, "epoch": 3602} {"train_loss": -6.898325443267822, "global_step": 151304, "epoch": 3602} {"train_loss": -6.798794269561768, "global_step": 151305, "epoch": 3602} {"train_loss": -6.858811855316162, "global_step": 151306, "epoch": 3602} {"train_loss": -6.812980651855469, "global_step": 151307, "epoch": 3602} {"train_loss": -6.874993324279785, "global_step": 151308, "epoch": 3602} {"train_loss": -6.855050086975098, "global_step": 151309, "epoch": 3602} {"train_loss": -6.908415794372559, "global_step": 151310, "epoch": 3602} {"train_loss": -6.9400248527526855, "global_step": 151311, "epoch": 3602} {"train_loss": -6.81369686126709, "global_step": 151312, "epoch": 3602} {"train_loss": -6.907390594482422, "global_step": 151313, "epoch": 3602} {"train_loss": -6.909574508666992, "global_step": 151314, "epoch": 3602} {"train_loss": -6.843343734741211, "global_step": 151315, "epoch": 3602} {"train_loss": -6.821435928344727, "global_step": 151316, "epoch": 3602} {"train_loss": -7.008029937744141, "global_step": 151317, "epoch": 3602} {"train_loss": -6.981069087982178, "global_step": 151318, "epoch": 3602} {"train_loss": -6.7521514892578125, "global_step": 151319, "epoch": 3602} {"train_loss": -6.917487621307373, "global_step": 151320, "epoch": 3602} {"train_loss": -7.01225471496582, "global_step": 151321, "epoch": 3602} {"train_loss": -6.824772834777832, "global_step": 151322, "epoch": 3602} {"train_loss": -6.927455902099609, "global_step": 151323, "epoch": 3602} {"train_loss": -6.906222820281982, "global_step": 151324, "epoch": 3602} {"train_loss": -6.869680223010835, "global_step": 151325, "epoch": 3602, "val_loss": 78793.9453125} {"train_loss": -6.96279239654541, "global_step": 151326, "epoch": 3603} {"train_loss": -6.861747741699219, "global_step": 151327, "epoch": 3603} {"train_loss": -6.928497791290283, "global_step": 151328, "epoch": 3603} {"train_loss": -6.84718132019043, "global_step": 151329, "epoch": 3603} {"train_loss": -6.947663307189941, "global_step": 151330, "epoch": 3603} {"train_loss": -6.868114948272705, "global_step": 151331, "epoch": 3603} {"train_loss": -6.919520378112793, "global_step": 151332, "epoch": 3603} {"train_loss": -6.846582412719727, "global_step": 151333, "epoch": 3603} {"train_loss": -6.8564348220825195, "global_step": 151334, "epoch": 3603} {"train_loss": -6.818785190582275, "global_step": 151335, "epoch": 3603} {"train_loss": -6.976223468780518, "global_step": 151336, "epoch": 3603} {"train_loss": -6.7280426025390625, "global_step": 151337, "epoch": 3603} {"train_loss": -6.958776473999023, "global_step": 151338, "epoch": 3603} {"train_loss": -6.799314498901367, "global_step": 151339, "epoch": 3603} {"train_loss": -6.752917766571045, "global_step": 151340, "epoch": 3603} {"train_loss": -6.84832239151001, "global_step": 151341, "epoch": 3603} {"train_loss": -6.882059574127197, "global_step": 151342, "epoch": 3603} {"train_loss": -6.8480329513549805, "global_step": 151343, "epoch": 3603} {"train_loss": -6.854349613189697, "global_step": 151344, "epoch": 3603} {"train_loss": -6.873183727264404, "global_step": 151345, "epoch": 3603} {"train_loss": -6.916916847229004, "global_step": 151346, "epoch": 3603} {"train_loss": -6.946460723876953, "global_step": 151347, "epoch": 3603} {"train_loss": -6.898542404174805, "global_step": 151348, "epoch": 3603} {"train_loss": -6.883083343505859, "global_step": 151349, "epoch": 3603} {"train_loss": -6.8309173583984375, "global_step": 151350, "epoch": 3603} {"train_loss": -6.893905162811279, "global_step": 151351, "epoch": 3603} {"train_loss": -7.104691028594971, "global_step": 151352, "epoch": 3603} {"train_loss": -6.886171340942383, "global_step": 151353, "epoch": 3603} {"train_loss": -6.904324531555176, "global_step": 151354, "epoch": 3603} {"train_loss": -6.893380641937256, "global_step": 151355, "epoch": 3603} {"train_loss": -6.936764717102051, "global_step": 151356, "epoch": 3603} {"train_loss": -6.895191669464111, "global_step": 151357, "epoch": 3603} {"train_loss": -6.84221076965332, "global_step": 151358, "epoch": 3603} {"train_loss": -6.879201889038086, "global_step": 151359, "epoch": 3603} {"train_loss": -6.885101318359375, "global_step": 151360, "epoch": 3603} {"train_loss": -6.872236251831055, "global_step": 151361, "epoch": 3603} {"train_loss": -6.8593950271606445, "global_step": 151362, "epoch": 3603} {"train_loss": -6.858702659606934, "global_step": 151363, "epoch": 3603} {"train_loss": -6.858211994171143, "global_step": 151364, "epoch": 3603} {"train_loss": -6.839022159576416, "global_step": 151365, "epoch": 3603} {"train_loss": -6.830353736877441, "global_step": 151366, "epoch": 3603} {"train_loss": -6.880179291679745, "global_step": 151367, "epoch": 3603, "val_loss": 78720.640625} {"train_loss": -6.886465072631836, "global_step": 151368, "epoch": 3604} {"train_loss": -6.907851696014404, "global_step": 151369, "epoch": 3604} {"train_loss": -6.953678131103516, "global_step": 151370, "epoch": 3604} {"train_loss": -6.912193298339844, "global_step": 151371, "epoch": 3604} {"train_loss": -6.840516090393066, "global_step": 151372, "epoch": 3604} {"train_loss": -7.022218704223633, "global_step": 151373, "epoch": 3604} {"train_loss": -6.8374457359313965, "global_step": 151374, "epoch": 3604} {"train_loss": -6.874145984649658, "global_step": 151375, "epoch": 3604} {"train_loss": -6.838608264923096, "global_step": 151376, "epoch": 3604} {"train_loss": -6.930574417114258, "global_step": 151377, "epoch": 3604} {"train_loss": -6.93265962600708, "global_step": 151378, "epoch": 3604} {"train_loss": -6.955394268035889, "global_step": 151379, "epoch": 3604} {"train_loss": -6.8944501876831055, "global_step": 151380, "epoch": 3604} {"train_loss": -6.987314701080322, "global_step": 151381, "epoch": 3604} {"train_loss": -6.905247211456299, "global_step": 151382, "epoch": 3604} {"train_loss": -7.035330772399902, "global_step": 151383, "epoch": 3604} {"train_loss": -6.791808128356934, "global_step": 151384, "epoch": 3604} {"train_loss": -7.030882835388184, "global_step": 151385, "epoch": 3604} {"train_loss": -6.9484758377075195, "global_step": 151386, "epoch": 3604} {"train_loss": -6.865956783294678, "global_step": 151387, "epoch": 3604} {"train_loss": -7.02381706237793, "global_step": 151388, "epoch": 3604} {"train_loss": -6.894968509674072, "global_step": 151389, "epoch": 3604} {"train_loss": -6.990525245666504, "global_step": 151390, "epoch": 3604} {"train_loss": -6.946853160858154, "global_step": 151391, "epoch": 3604} {"train_loss": -7.025925636291504, "global_step": 151392, "epoch": 3604} {"train_loss": -6.9200592041015625, "global_step": 151393, "epoch": 3604} {"train_loss": -6.963028430938721, "global_step": 151394, "epoch": 3604} {"train_loss": -6.878426551818848, "global_step": 151395, "epoch": 3604} {"train_loss": -6.826757431030273, "global_step": 151396, "epoch": 3604} {"train_loss": -6.830643653869629, "global_step": 151397, "epoch": 3604} {"train_loss": -6.906650543212891, "global_step": 151398, "epoch": 3604} {"train_loss": -6.739229202270508, "global_step": 151399, "epoch": 3604} {"train_loss": -6.953055381774902, "global_step": 151400, "epoch": 3604} {"train_loss": -6.970346927642822, "global_step": 151401, "epoch": 3604} {"train_loss": -6.909902572631836, "global_step": 151402, "epoch": 3604} {"train_loss": -6.914923667907715, "global_step": 151403, "epoch": 3604} {"train_loss": -6.778014183044434, "global_step": 151404, "epoch": 3604} {"train_loss": -6.780941009521484, "global_step": 151405, "epoch": 3604} {"train_loss": -6.940112113952637, "global_step": 151406, "epoch": 3604} {"train_loss": -6.907055854797363, "global_step": 151407, "epoch": 3604} {"train_loss": -6.833494186401367, "global_step": 151408, "epoch": 3604} {"train_loss": -6.909659544626872, "global_step": 151409, "epoch": 3604, "val_loss": 78779.484375} {"train_loss": -6.896994590759277, "global_step": 151410, "epoch": 3605} {"train_loss": -6.93827486038208, "global_step": 151411, "epoch": 3605} {"train_loss": -6.865133285522461, "global_step": 151412, "epoch": 3605} {"train_loss": -6.859699726104736, "global_step": 151413, "epoch": 3605} {"train_loss": -6.891928195953369, "global_step": 151414, "epoch": 3605} {"train_loss": -6.711101531982422, "global_step": 151415, "epoch": 3605} {"train_loss": -6.834892272949219, "global_step": 151416, "epoch": 3605} {"train_loss": -6.88348913192749, "global_step": 151417, "epoch": 3605} {"train_loss": -6.9426703453063965, "global_step": 151418, "epoch": 3605} {"train_loss": -6.899155616760254, "global_step": 151419, "epoch": 3605} {"train_loss": -6.888570785522461, "global_step": 151420, "epoch": 3605} {"train_loss": -6.947279930114746, "global_step": 151421, "epoch": 3605} {"train_loss": -6.803284645080566, "global_step": 151422, "epoch": 3605} {"train_loss": -6.911559104919434, "global_step": 151423, "epoch": 3605} {"train_loss": -6.874935150146484, "global_step": 151424, "epoch": 3605} {"train_loss": -6.883404731750488, "global_step": 151425, "epoch": 3605} {"train_loss": -6.911179065704346, "global_step": 151426, "epoch": 3605} {"train_loss": -6.885603904724121, "global_step": 151427, "epoch": 3605} {"train_loss": -6.925158977508545, "global_step": 151428, "epoch": 3605} {"train_loss": -6.908909320831299, "global_step": 151429, "epoch": 3605} {"train_loss": -6.933901309967041, "global_step": 151430, "epoch": 3605} {"train_loss": -6.910001754760742, "global_step": 151431, "epoch": 3605} {"train_loss": -6.84644889831543, "global_step": 151432, "epoch": 3605} {"train_loss": -6.934859752655029, "global_step": 151433, "epoch": 3605} {"train_loss": -6.891021728515625, "global_step": 151434, "epoch": 3605} {"train_loss": -6.872087478637695, "global_step": 151435, "epoch": 3605} {"train_loss": -6.9498066902160645, "global_step": 151436, "epoch": 3605} {"train_loss": -6.959080696105957, "global_step": 151437, "epoch": 3605} {"train_loss": -6.781678676605225, "global_step": 151438, "epoch": 3605} {"train_loss": -6.803469657897949, "global_step": 151439, "epoch": 3605} {"train_loss": -6.819272994995117, "global_step": 151440, "epoch": 3605} {"train_loss": -6.924649238586426, "global_step": 151441, "epoch": 3605} {"train_loss": -6.842647552490234, "global_step": 151442, "epoch": 3605} {"train_loss": -6.804612159729004, "global_step": 151443, "epoch": 3605} {"train_loss": -6.913522720336914, "global_step": 151444, "epoch": 3605} {"train_loss": -6.736394882202148, "global_step": 151445, "epoch": 3605} {"train_loss": -6.873961448669434, "global_step": 151446, "epoch": 3605} {"train_loss": -6.889881134033203, "global_step": 151447, "epoch": 3605} {"train_loss": -6.860051155090332, "global_step": 151448, "epoch": 3605} {"train_loss": -6.814812660217285, "global_step": 151449, "epoch": 3605} {"train_loss": -6.874697685241699, "global_step": 151450, "epoch": 3605} {"train_loss": -6.876452491396949, "global_step": 151451, "epoch": 3605, "val_loss": 78769.921875} {"train_loss": -6.871169567108154, "global_step": 151452, "epoch": 3606} {"train_loss": -6.953767776489258, "global_step": 151453, "epoch": 3606} {"train_loss": -6.87542200088501, "global_step": 151454, "epoch": 3606} {"train_loss": -6.896177291870117, "global_step": 151455, "epoch": 3606} {"train_loss": -6.943466663360596, "global_step": 151456, "epoch": 3606} {"train_loss": -6.904224395751953, "global_step": 151457, "epoch": 3606} {"train_loss": -6.910895824432373, "global_step": 151458, "epoch": 3606} {"train_loss": -6.9297356605529785, "global_step": 151459, "epoch": 3606} {"train_loss": -6.928565979003906, "global_step": 151460, "epoch": 3606} {"train_loss": -6.96530818939209, "global_step": 151461, "epoch": 3606} {"train_loss": -6.905696868896484, "global_step": 151462, "epoch": 3606} {"train_loss": -6.862267971038818, "global_step": 151463, "epoch": 3606} {"train_loss": -6.931520462036133, "global_step": 151464, "epoch": 3606} {"train_loss": -6.810244560241699, "global_step": 151465, "epoch": 3606} {"train_loss": -6.966486930847168, "global_step": 151466, "epoch": 3606} {"train_loss": -6.9853363037109375, "global_step": 151467, "epoch": 3606} {"train_loss": -6.847570896148682, "global_step": 151468, "epoch": 3606} {"train_loss": -6.962673187255859, "global_step": 151469, "epoch": 3606} {"train_loss": -7.01343297958374, "global_step": 151470, "epoch": 3606} {"train_loss": -6.847286224365234, "global_step": 151471, "epoch": 3606} {"train_loss": -6.745615482330322, "global_step": 151472, "epoch": 3606} {"train_loss": -6.859505653381348, "global_step": 151473, "epoch": 3606} {"train_loss": -6.924924373626709, "global_step": 151474, "epoch": 3606} {"train_loss": -7.006526947021484, "global_step": 151475, "epoch": 3606} {"train_loss": -6.771492958068848, "global_step": 151476, "epoch": 3606} {"train_loss": -6.896452903747559, "global_step": 151477, "epoch": 3606} {"train_loss": -6.804112434387207, "global_step": 151478, "epoch": 3606} {"train_loss": -6.916867256164551, "global_step": 151479, "epoch": 3606} {"train_loss": -6.935577392578125, "global_step": 151480, "epoch": 3606} {"train_loss": -7.008918762207031, "global_step": 151481, "epoch": 3606} {"train_loss": -7.011216640472412, "global_step": 151482, "epoch": 3606} {"train_loss": -6.84230375289917, "global_step": 151483, "epoch": 3606} {"train_loss": -6.85725212097168, "global_step": 151484, "epoch": 3606} {"train_loss": -7.004321098327637, "global_step": 151485, "epoch": 3606} {"train_loss": -6.942419528961182, "global_step": 151486, "epoch": 3606} {"train_loss": -6.932559967041016, "global_step": 151487, "epoch": 3606} {"train_loss": -6.962206840515137, "global_step": 151488, "epoch": 3606} {"train_loss": -6.897875785827637, "global_step": 151489, "epoch": 3606} {"train_loss": -6.989543914794922, "global_step": 151490, "epoch": 3606} {"train_loss": -6.983814716339111, "global_step": 151491, "epoch": 3606} {"train_loss": -6.892935276031494, "global_step": 151492, "epoch": 3606} {"train_loss": -6.910587674095517, "global_step": 151493, "epoch": 3606, "val_loss": 78884.421875} {"train_loss": -6.74242639541626, "global_step": 151494, "epoch": 3607} {"train_loss": -6.902827739715576, "global_step": 151495, "epoch": 3607} {"train_loss": -6.847846984863281, "global_step": 151496, "epoch": 3607} {"train_loss": -6.914400577545166, "global_step": 151497, "epoch": 3607} {"train_loss": -6.911753177642822, "global_step": 151498, "epoch": 3607} {"train_loss": -6.895387172698975, "global_step": 151499, "epoch": 3607} {"train_loss": -6.844511032104492, "global_step": 151500, "epoch": 3607} {"train_loss": -6.949496746063232, "global_step": 151501, "epoch": 3607} {"train_loss": -6.825951099395752, "global_step": 151502, "epoch": 3607} {"train_loss": -6.921734809875488, "global_step": 151503, "epoch": 3607} {"train_loss": -6.815567970275879, "global_step": 151504, "epoch": 3607} {"train_loss": -6.855016708374023, "global_step": 151505, "epoch": 3607} {"train_loss": -6.831487655639648, "global_step": 151506, "epoch": 3607} {"train_loss": -6.838094711303711, "global_step": 151507, "epoch": 3607} {"train_loss": -6.711570739746094, "global_step": 151508, "epoch": 3607} {"train_loss": -6.849762916564941, "global_step": 151509, "epoch": 3607} {"train_loss": -6.9207658767700195, "global_step": 151510, "epoch": 3607} {"train_loss": -6.880213737487793, "global_step": 151511, "epoch": 3607} {"train_loss": -6.891500473022461, "global_step": 151512, "epoch": 3607} {"train_loss": -6.909696578979492, "global_step": 151513, "epoch": 3607} {"train_loss": -6.867006301879883, "global_step": 151514, "epoch": 3607} {"train_loss": -7.0034990310668945, "global_step": 151515, "epoch": 3607} {"train_loss": -6.905097484588623, "global_step": 151516, "epoch": 3607} {"train_loss": -6.977388858795166, "global_step": 151517, "epoch": 3607} {"train_loss": -6.674585342407227, "global_step": 151518, "epoch": 3607} {"train_loss": -6.858697414398193, "global_step": 151519, "epoch": 3607} {"train_loss": -6.9308576583862305, "global_step": 151520, "epoch": 3607} {"train_loss": -6.965648174285889, "global_step": 151521, "epoch": 3607} {"train_loss": -6.884346008300781, "global_step": 151522, "epoch": 3607} {"train_loss": -6.771615982055664, "global_step": 151523, "epoch": 3607} {"train_loss": -6.931735038757324, "global_step": 151524, "epoch": 3607} {"train_loss": -6.810075759887695, "global_step": 151525, "epoch": 3607} {"train_loss": -6.907286643981934, "global_step": 151526, "epoch": 3607} {"train_loss": -6.821926593780518, "global_step": 151527, "epoch": 3607} {"train_loss": -6.8116607666015625, "global_step": 151528, "epoch": 3607} {"train_loss": -6.679203033447266, "global_step": 151529, "epoch": 3607} {"train_loss": -6.882547855377197, "global_step": 151530, "epoch": 3607} {"train_loss": -6.860717296600342, "global_step": 151531, "epoch": 3607} {"train_loss": -6.939448356628418, "global_step": 151532, "epoch": 3607} {"train_loss": -6.879856586456299, "global_step": 151533, "epoch": 3607} {"train_loss": -6.859326362609863, "global_step": 151534, "epoch": 3607} {"train_loss": -6.862440052486601, "global_step": 151535, "epoch": 3607, "val_loss": 78812.3984375} {"train_loss": -6.770536422729492, "global_step": 151536, "epoch": 3608} {"train_loss": -6.781898021697998, "global_step": 151537, "epoch": 3608} {"train_loss": -6.87107515335083, "global_step": 151538, "epoch": 3608} {"train_loss": -6.80164909362793, "global_step": 151539, "epoch": 3608} {"train_loss": -6.792463779449463, "global_step": 151540, "epoch": 3608} {"train_loss": -6.986893653869629, "global_step": 151541, "epoch": 3608} {"train_loss": -6.969562530517578, "global_step": 151542, "epoch": 3608} {"train_loss": -6.904178142547607, "global_step": 151543, "epoch": 3608} {"train_loss": -6.768172264099121, "global_step": 151544, "epoch": 3608} {"train_loss": -6.835101127624512, "global_step": 151545, "epoch": 3608} {"train_loss": -6.8531036376953125, "global_step": 151546, "epoch": 3608} {"train_loss": -6.820146560668945, "global_step": 151547, "epoch": 3608} {"train_loss": -6.8594231605529785, "global_step": 151548, "epoch": 3608} {"train_loss": -6.791460990905762, "global_step": 151549, "epoch": 3608} {"train_loss": -6.844992637634277, "global_step": 151550, "epoch": 3608} {"train_loss": -6.854981422424316, "global_step": 151551, "epoch": 3608} {"train_loss": -6.691328525543213, "global_step": 151552, "epoch": 3608} {"train_loss": -6.916007995605469, "global_step": 151553, "epoch": 3608} {"train_loss": -6.792211532592773, "global_step": 151554, "epoch": 3608} {"train_loss": -6.860931396484375, "global_step": 151555, "epoch": 3608} {"train_loss": -6.752254962921143, "global_step": 151556, "epoch": 3608} {"train_loss": -6.87548828125, "global_step": 151557, "epoch": 3608} {"train_loss": -6.852268695831299, "global_step": 151558, "epoch": 3608} {"train_loss": -6.669121742248535, "global_step": 151559, "epoch": 3608} {"train_loss": -6.857524394989014, "global_step": 151560, "epoch": 3608} {"train_loss": -6.771782875061035, "global_step": 151561, "epoch": 3608} {"train_loss": -6.660175323486328, "global_step": 151562, "epoch": 3608} {"train_loss": -6.759677410125732, "global_step": 151563, "epoch": 3608} {"train_loss": -6.749184608459473, "global_step": 151564, "epoch": 3608} {"train_loss": -6.89406681060791, "global_step": 151565, "epoch": 3608} {"train_loss": -6.815125465393066, "global_step": 151566, "epoch": 3608} {"train_loss": -6.8703155517578125, "global_step": 151567, "epoch": 3608} {"train_loss": -6.892518043518066, "global_step": 151568, "epoch": 3608} {"train_loss": -6.825186729431152, "global_step": 151569, "epoch": 3608} {"train_loss": -6.785177230834961, "global_step": 151570, "epoch": 3608} {"train_loss": -6.7396440505981445, "global_step": 151571, "epoch": 3608} {"train_loss": -6.858540058135986, "global_step": 151572, "epoch": 3608} {"train_loss": -6.762480735778809, "global_step": 151573, "epoch": 3608} {"train_loss": -6.845524787902832, "global_step": 151574, "epoch": 3608} {"train_loss": -6.7981390953063965, "global_step": 151575, "epoch": 3608} {"train_loss": -6.885782718658447, "global_step": 151576, "epoch": 3608} {"train_loss": -6.822113922664097, "global_step": 151577, "epoch": 3608, "val_loss": 78813.5859375} {"train_loss": -6.844344615936279, "global_step": 151578, "epoch": 3609} {"train_loss": -6.803323268890381, "global_step": 151579, "epoch": 3609} {"train_loss": -6.758174896240234, "global_step": 151580, "epoch": 3609} {"train_loss": -6.964292526245117, "global_step": 151581, "epoch": 3609} {"train_loss": -6.788433074951172, "global_step": 151582, "epoch": 3609} {"train_loss": -6.805188179016113, "global_step": 151583, "epoch": 3609} {"train_loss": -6.938013076782227, "global_step": 151584, "epoch": 3609} {"train_loss": -6.81839656829834, "global_step": 151585, "epoch": 3609} {"train_loss": -6.879148006439209, "global_step": 151586, "epoch": 3609} {"train_loss": -6.926301956176758, "global_step": 151587, "epoch": 3609} {"train_loss": -6.739757537841797, "global_step": 151588, "epoch": 3609} {"train_loss": -6.789974212646484, "global_step": 151589, "epoch": 3609} {"train_loss": -6.704920291900635, "global_step": 151590, "epoch": 3609} {"train_loss": -6.901313781738281, "global_step": 151591, "epoch": 3609} {"train_loss": -6.935854911804199, "global_step": 151592, "epoch": 3609} {"train_loss": -6.905900001525879, "global_step": 151593, "epoch": 3609} {"train_loss": -6.77908182144165, "global_step": 151594, "epoch": 3609} {"train_loss": -6.767714500427246, "global_step": 151595, "epoch": 3609} {"train_loss": -6.901208877563477, "global_step": 151596, "epoch": 3609} {"train_loss": -6.858376979827881, "global_step": 151597, "epoch": 3609} {"train_loss": -6.624722480773926, "global_step": 151598, "epoch": 3609} {"train_loss": -6.706454277038574, "global_step": 151599, "epoch": 3609} {"train_loss": -6.908957481384277, "global_step": 151600, "epoch": 3609} {"train_loss": -6.806736469268799, "global_step": 151601, "epoch": 3609} {"train_loss": -6.914595603942871, "global_step": 151602, "epoch": 3609} {"train_loss": -6.827297687530518, "global_step": 151603, "epoch": 3609} {"train_loss": -6.92891263961792, "global_step": 151604, "epoch": 3609} {"train_loss": -6.920445442199707, "global_step": 151605, "epoch": 3609} {"train_loss": -6.894467353820801, "global_step": 151606, "epoch": 3609} {"train_loss": -6.886415958404541, "global_step": 151607, "epoch": 3609} {"train_loss": -6.828318119049072, "global_step": 151608, "epoch": 3609} {"train_loss": -6.9114580154418945, "global_step": 151609, "epoch": 3609} {"train_loss": -6.8566389083862305, "global_step": 151610, "epoch": 3609} {"train_loss": -6.890840530395508, "global_step": 151611, "epoch": 3609} {"train_loss": -6.8912129402160645, "global_step": 151612, "epoch": 3609} {"train_loss": -6.915659427642822, "global_step": 151613, "epoch": 3609} {"train_loss": -6.917545318603516, "global_step": 151614, "epoch": 3609} {"train_loss": -6.911981582641602, "global_step": 151615, "epoch": 3609} {"train_loss": -6.921332359313965, "global_step": 151616, "epoch": 3609} {"train_loss": -6.8861494064331055, "global_step": 151617, "epoch": 3609} {"train_loss": -6.975907325744629, "global_step": 151618, "epoch": 3609} {"train_loss": -6.860963367280506, "global_step": 151619, "epoch": 3609, "val_loss": 78933.390625} {"train_loss": -6.9319353103637695, "global_step": 151620, "epoch": 3610} {"train_loss": -6.869649887084961, "global_step": 151621, "epoch": 3610} {"train_loss": -6.771857738494873, "global_step": 151622, "epoch": 3610} {"train_loss": -6.901841163635254, "global_step": 151623, "epoch": 3610} {"train_loss": -6.940092086791992, "global_step": 151624, "epoch": 3610} {"train_loss": -6.9791717529296875, "global_step": 151625, "epoch": 3610} {"train_loss": -6.974327087402344, "global_step": 151626, "epoch": 3610} {"train_loss": -6.890830993652344, "global_step": 151627, "epoch": 3610} {"train_loss": -6.910805702209473, "global_step": 151628, "epoch": 3610} {"train_loss": -6.893699645996094, "global_step": 151629, "epoch": 3610} {"train_loss": -6.707449436187744, "global_step": 151630, "epoch": 3610} {"train_loss": -7.041351318359375, "global_step": 151631, "epoch": 3610} {"train_loss": -6.705682277679443, "global_step": 151632, "epoch": 3610} {"train_loss": -6.6890764236450195, "global_step": 151633, "epoch": 3610} {"train_loss": -6.835381507873535, "global_step": 151634, "epoch": 3610} {"train_loss": -6.712745666503906, "global_step": 151635, "epoch": 3610} {"train_loss": -6.779329299926758, "global_step": 151636, "epoch": 3610} {"train_loss": -6.986972808837891, "global_step": 151637, "epoch": 3610} {"train_loss": -6.737157821655273, "global_step": 151638, "epoch": 3610} {"train_loss": -6.812870025634766, "global_step": 151639, "epoch": 3610} {"train_loss": -6.7670135498046875, "global_step": 151640, "epoch": 3610} {"train_loss": -6.887502193450928, "global_step": 151641, "epoch": 3610} {"train_loss": -6.914831161499023, "global_step": 151642, "epoch": 3610} {"train_loss": -6.688255786895752, "global_step": 151643, "epoch": 3610} {"train_loss": -6.849557876586914, "global_step": 151644, "epoch": 3610} {"train_loss": -6.674323558807373, "global_step": 151645, "epoch": 3610} {"train_loss": -6.941928863525391, "global_step": 151646, "epoch": 3610} {"train_loss": -6.749585151672363, "global_step": 151647, "epoch": 3610} {"train_loss": -6.693534851074219, "global_step": 151648, "epoch": 3610} {"train_loss": -6.731836795806885, "global_step": 151649, "epoch": 3610} {"train_loss": -6.758731842041016, "global_step": 151650, "epoch": 3610} {"train_loss": -6.7522077560424805, "global_step": 151651, "epoch": 3610} {"train_loss": -6.707867622375488, "global_step": 151652, "epoch": 3610} {"train_loss": -6.848331451416016, "global_step": 151653, "epoch": 3610} {"train_loss": -6.854300498962402, "global_step": 151654, "epoch": 3610} {"train_loss": -6.844254970550537, "global_step": 151655, "epoch": 3610} {"train_loss": -6.75022029876709, "global_step": 151656, "epoch": 3610} {"train_loss": -6.929023265838623, "global_step": 151657, "epoch": 3610} {"train_loss": -6.852558612823486, "global_step": 151658, "epoch": 3610} {"train_loss": -6.838301181793213, "global_step": 151659, "epoch": 3610} {"train_loss": -6.7498979568481445, "global_step": 151660, "epoch": 3610} {"train_loss": -6.8289431390308195, "global_step": 151661, "epoch": 3610, "val_loss": 78803.3125} {"train_loss": -6.898247718811035, "global_step": 151662, "epoch": 3611} {"train_loss": -6.9734697341918945, "global_step": 151663, "epoch": 3611} {"train_loss": -6.883172988891602, "global_step": 151664, "epoch": 3611} {"train_loss": -6.945920944213867, "global_step": 151665, "epoch": 3611} {"train_loss": -6.887326240539551, "global_step": 151666, "epoch": 3611} {"train_loss": -6.978465557098389, "global_step": 151667, "epoch": 3611} {"train_loss": -6.7605671882629395, "global_step": 151668, "epoch": 3611} {"train_loss": -6.874446868896484, "global_step": 151669, "epoch": 3611} {"train_loss": -6.841291427612305, "global_step": 151670, "epoch": 3611} {"train_loss": -6.920656204223633, "global_step": 151671, "epoch": 3611} {"train_loss": -6.896224498748779, "global_step": 151672, "epoch": 3611} {"train_loss": -6.985966682434082, "global_step": 151673, "epoch": 3611} {"train_loss": -6.969952583312988, "global_step": 151674, "epoch": 3611} {"train_loss": -6.95564603805542, "global_step": 151675, "epoch": 3611} {"train_loss": -6.952789306640625, "global_step": 151676, "epoch": 3611} {"train_loss": -6.895764350891113, "global_step": 151677, "epoch": 3611} {"train_loss": -6.8744378089904785, "global_step": 151678, "epoch": 3611} {"train_loss": -6.873612880706787, "global_step": 151679, "epoch": 3611} {"train_loss": -6.982749938964844, "global_step": 151680, "epoch": 3611} {"train_loss": -6.875515460968018, "global_step": 151681, "epoch": 3611} {"train_loss": -6.866533279418945, "global_step": 151682, "epoch": 3611} {"train_loss": -6.822832107543945, "global_step": 151683, "epoch": 3611} {"train_loss": -6.874622344970703, "global_step": 151684, "epoch": 3611} {"train_loss": -6.8711934089660645, "global_step": 151685, "epoch": 3611} {"train_loss": -6.807019233703613, "global_step": 151686, "epoch": 3611} {"train_loss": -6.797550201416016, "global_step": 151687, "epoch": 3611} {"train_loss": -6.786155700683594, "global_step": 151688, "epoch": 3611} {"train_loss": -6.77824068069458, "global_step": 151689, "epoch": 3611} {"train_loss": -6.589868068695068, "global_step": 151690, "epoch": 3611} {"train_loss": -6.710364818572998, "global_step": 151691, "epoch": 3611} {"train_loss": -6.63334846496582, "global_step": 151692, "epoch": 3611} {"train_loss": -6.687190055847168, "global_step": 151693, "epoch": 3611} {"train_loss": -6.671055316925049, "global_step": 151694, "epoch": 3611} {"train_loss": -6.788604259490967, "global_step": 151695, "epoch": 3611} {"train_loss": -6.8284406661987305, "global_step": 151696, "epoch": 3611} {"train_loss": -6.67751407623291, "global_step": 151697, "epoch": 3611} {"train_loss": -6.6829915046691895, "global_step": 151698, "epoch": 3611} {"train_loss": -6.67226505279541, "global_step": 151699, "epoch": 3611} {"train_loss": -6.665019989013672, "global_step": 151700, "epoch": 3611} {"train_loss": -6.807629585266113, "global_step": 151701, "epoch": 3611} {"train_loss": -6.633497714996338, "global_step": 151702, "epoch": 3611} {"train_loss": -6.826272578466506, "global_step": 151703, "epoch": 3611, "val_loss": 78986.296875} {"train_loss": -6.805844306945801, "global_step": 151704, "epoch": 3612} {"train_loss": -6.877867221832275, "global_step": 151705, "epoch": 3612} {"train_loss": -6.692370414733887, "global_step": 151706, "epoch": 3612} {"train_loss": -6.925684928894043, "global_step": 151707, "epoch": 3612} {"train_loss": -6.892541408538818, "global_step": 151708, "epoch": 3612} {"train_loss": -6.7780585289001465, "global_step": 151709, "epoch": 3612} {"train_loss": -6.788121700286865, "global_step": 151710, "epoch": 3612} {"train_loss": -6.926042556762695, "global_step": 151711, "epoch": 3612} {"train_loss": -6.896685600280762, "global_step": 151712, "epoch": 3612} {"train_loss": -6.889122009277344, "global_step": 151713, "epoch": 3612} {"train_loss": -6.895348072052002, "global_step": 151714, "epoch": 3612} {"train_loss": -6.882696151733398, "global_step": 151715, "epoch": 3612} {"train_loss": -6.822321891784668, "global_step": 151716, "epoch": 3612} {"train_loss": -6.862302303314209, "global_step": 151717, "epoch": 3612} {"train_loss": -6.888662815093994, "global_step": 151718, "epoch": 3612} {"train_loss": -6.926601409912109, "global_step": 151719, "epoch": 3612} {"train_loss": -6.992218017578125, "global_step": 151720, "epoch": 3612} {"train_loss": -6.965521812438965, "global_step": 151721, "epoch": 3612} {"train_loss": -6.892147541046143, "global_step": 151722, "epoch": 3612} {"train_loss": -6.889370918273926, "global_step": 151723, "epoch": 3612} {"train_loss": -6.924105167388916, "global_step": 151724, "epoch": 3612} {"train_loss": -6.857161521911621, "global_step": 151725, "epoch": 3612} {"train_loss": -6.8973283767700195, "global_step": 151726, "epoch": 3612} {"train_loss": -6.8672637939453125, "global_step": 151727, "epoch": 3612} {"train_loss": -6.873073577880859, "global_step": 151728, "epoch": 3612} {"train_loss": -6.8677849769592285, "global_step": 151729, "epoch": 3612} {"train_loss": -6.801650524139404, "global_step": 151730, "epoch": 3612} {"train_loss": -6.969574451446533, "global_step": 151731, "epoch": 3612} {"train_loss": -6.82755184173584, "global_step": 151732, "epoch": 3612} {"train_loss": -6.879484176635742, "global_step": 151733, "epoch": 3612} {"train_loss": -6.914676666259766, "global_step": 151734, "epoch": 3612} {"train_loss": -6.865989685058594, "global_step": 151735, "epoch": 3612} {"train_loss": -6.840723991394043, "global_step": 151736, "epoch": 3612} {"train_loss": -6.934281349182129, "global_step": 151737, "epoch": 3612} {"train_loss": -6.908816337585449, "global_step": 151738, "epoch": 3612} {"train_loss": -6.904518127441406, "global_step": 151739, "epoch": 3612} {"train_loss": -6.909505367279053, "global_step": 151740, "epoch": 3612} {"train_loss": -6.863364219665527, "global_step": 151741, "epoch": 3612} {"train_loss": -6.916585445404053, "global_step": 151742, "epoch": 3612} {"train_loss": -6.928603649139404, "global_step": 151743, "epoch": 3612} {"train_loss": -6.829416275024414, "global_step": 151744, "epoch": 3612} {"train_loss": -6.880987428483509, "global_step": 151745, "epoch": 3612, "val_loss": 78922.0546875} {"train_loss": -6.8606181144714355, "global_step": 151746, "epoch": 3613} {"train_loss": -6.879987716674805, "global_step": 151747, "epoch": 3613} {"train_loss": -7.038148880004883, "global_step": 151748, "epoch": 3613} {"train_loss": -6.920057773590088, "global_step": 151749, "epoch": 3613} {"train_loss": -6.949100017547607, "global_step": 151750, "epoch": 3613} {"train_loss": -6.905491828918457, "global_step": 151751, "epoch": 3613} {"train_loss": -6.92378044128418, "global_step": 151752, "epoch": 3613} {"train_loss": -6.874104976654053, "global_step": 151753, "epoch": 3613} {"train_loss": -6.913735389709473, "global_step": 151754, "epoch": 3613} {"train_loss": -6.938353538513184, "global_step": 151755, "epoch": 3613} {"train_loss": -6.741485595703125, "global_step": 151756, "epoch": 3613} {"train_loss": -6.916179180145264, "global_step": 151757, "epoch": 3613} {"train_loss": -6.8173651695251465, "global_step": 151758, "epoch": 3613} {"train_loss": -6.767229080200195, "global_step": 151759, "epoch": 3613} {"train_loss": -6.736127853393555, "global_step": 151760, "epoch": 3613} {"train_loss": -6.891840934753418, "global_step": 151761, "epoch": 3613} {"train_loss": -6.754048824310303, "global_step": 151762, "epoch": 3613} {"train_loss": -6.812578201293945, "global_step": 151763, "epoch": 3613} {"train_loss": -6.7025604248046875, "global_step": 151764, "epoch": 3613} {"train_loss": -6.643060684204102, "global_step": 151765, "epoch": 3613} {"train_loss": -6.871047019958496, "global_step": 151766, "epoch": 3613} {"train_loss": -6.729328632354736, "global_step": 151767, "epoch": 3613} {"train_loss": -6.826292991638184, "global_step": 151768, "epoch": 3613} {"train_loss": -6.852739334106445, "global_step": 151769, "epoch": 3613} {"train_loss": -6.972010612487793, "global_step": 151770, "epoch": 3613} {"train_loss": -6.820244789123535, "global_step": 151771, "epoch": 3613} {"train_loss": -6.89794397354126, "global_step": 151772, "epoch": 3613} {"train_loss": -6.914007186889648, "global_step": 151773, "epoch": 3613} {"train_loss": -6.8547749519348145, "global_step": 151774, "epoch": 3613} {"train_loss": -6.747817039489746, "global_step": 151775, "epoch": 3613} {"train_loss": -6.8900346755981445, "global_step": 151776, "epoch": 3613} {"train_loss": -6.88741397857666, "global_step": 151777, "epoch": 3613} {"train_loss": -6.934689521789551, "global_step": 151778, "epoch": 3613} {"train_loss": -6.91615104675293, "global_step": 151779, "epoch": 3613} {"train_loss": -6.870519638061523, "global_step": 151780, "epoch": 3613} {"train_loss": -6.919003486633301, "global_step": 151781, "epoch": 3613} {"train_loss": -6.871673583984375, "global_step": 151782, "epoch": 3613} {"train_loss": -6.907093524932861, "global_step": 151783, "epoch": 3613} {"train_loss": -6.929161548614502, "global_step": 151784, "epoch": 3613} {"train_loss": -7.05122709274292, "global_step": 151785, "epoch": 3613} {"train_loss": -6.984044075012207, "global_step": 151786, "epoch": 3613} {"train_loss": -6.870304732095628, "global_step": 151787, "epoch": 3613, "val_loss": 78501.8046875} {"train_loss": -6.923105716705322, "global_step": 151788, "epoch": 3614} {"train_loss": -6.958247184753418, "global_step": 151789, "epoch": 3614} {"train_loss": -6.823202610015869, "global_step": 151790, "epoch": 3614} {"train_loss": -6.890694618225098, "global_step": 151791, "epoch": 3614} {"train_loss": -6.972175598144531, "global_step": 151792, "epoch": 3614} {"train_loss": -6.662805080413818, "global_step": 151793, "epoch": 3614} {"train_loss": -6.791271209716797, "global_step": 151794, "epoch": 3614} {"train_loss": -6.791999816894531, "global_step": 151795, "epoch": 3614} {"train_loss": -6.666572570800781, "global_step": 151796, "epoch": 3614} {"train_loss": -6.8442158699035645, "global_step": 151797, "epoch": 3614} {"train_loss": -6.821920394897461, "global_step": 151798, "epoch": 3614} {"train_loss": -6.889161109924316, "global_step": 151799, "epoch": 3614} {"train_loss": -6.922172546386719, "global_step": 151800, "epoch": 3614} {"train_loss": -6.85009765625, "global_step": 151801, "epoch": 3614} {"train_loss": -6.837011814117432, "global_step": 151802, "epoch": 3614} {"train_loss": -6.78224515914917, "global_step": 151803, "epoch": 3614} {"train_loss": -6.973262786865234, "global_step": 151804, "epoch": 3614} {"train_loss": -6.940132141113281, "global_step": 151805, "epoch": 3614} {"train_loss": -6.872403144836426, "global_step": 151806, "epoch": 3614} {"train_loss": -6.8619303703308105, "global_step": 151807, "epoch": 3614} {"train_loss": -6.876320838928223, "global_step": 151808, "epoch": 3614} {"train_loss": -6.88937520980835, "global_step": 151809, "epoch": 3614} {"train_loss": -6.892064094543457, "global_step": 151810, "epoch": 3614} {"train_loss": -6.927063941955566, "global_step": 151811, "epoch": 3614} {"train_loss": -6.932509422302246, "global_step": 151812, "epoch": 3614} {"train_loss": -6.790586948394775, "global_step": 151813, "epoch": 3614} {"train_loss": -6.975006103515625, "global_step": 151814, "epoch": 3614} {"train_loss": -6.878668308258057, "global_step": 151815, "epoch": 3614} {"train_loss": -6.978404521942139, "global_step": 151816, "epoch": 3614} {"train_loss": -6.981637001037598, "global_step": 151817, "epoch": 3614} {"train_loss": -6.86977481842041, "global_step": 151818, "epoch": 3614} {"train_loss": -6.957174301147461, "global_step": 151819, "epoch": 3614} {"train_loss": -6.871257781982422, "global_step": 151820, "epoch": 3614} {"train_loss": -6.872160911560059, "global_step": 151821, "epoch": 3614} {"train_loss": -6.896549701690674, "global_step": 151822, "epoch": 3614} {"train_loss": -6.854451656341553, "global_step": 151823, "epoch": 3614} {"train_loss": -6.896995544433594, "global_step": 151824, "epoch": 3614} {"train_loss": -6.878185749053955, "global_step": 151825, "epoch": 3614} {"train_loss": -6.834383487701416, "global_step": 151826, "epoch": 3614} {"train_loss": -6.964024066925049, "global_step": 151827, "epoch": 3614} {"train_loss": -6.917541980743408, "global_step": 151828, "epoch": 3614} {"train_loss": -6.878257433573405, "global_step": 151829, "epoch": 3614, "val_loss": 79046.6953125} {"train_loss": -6.775207042694092, "global_step": 151830, "epoch": 3615} {"train_loss": -6.751944541931152, "global_step": 151831, "epoch": 3615} {"train_loss": -6.731783866882324, "global_step": 151832, "epoch": 3615} {"train_loss": -6.931191444396973, "global_step": 151833, "epoch": 3615} {"train_loss": -6.839642524719238, "global_step": 151834, "epoch": 3615} {"train_loss": -6.933420181274414, "global_step": 151835, "epoch": 3615} {"train_loss": -6.845831394195557, "global_step": 151836, "epoch": 3615} {"train_loss": -6.7517194747924805, "global_step": 151837, "epoch": 3615} {"train_loss": -6.9657697677612305, "global_step": 151838, "epoch": 3615} {"train_loss": -6.699470520019531, "global_step": 151839, "epoch": 3615} {"train_loss": -6.935177803039551, "global_step": 151840, "epoch": 3615} {"train_loss": -6.886661529541016, "global_step": 151841, "epoch": 3615} {"train_loss": -6.74771785736084, "global_step": 151842, "epoch": 3615} {"train_loss": -6.962126731872559, "global_step": 151843, "epoch": 3615} {"train_loss": -6.777338027954102, "global_step": 151844, "epoch": 3615} {"train_loss": -6.895981788635254, "global_step": 151845, "epoch": 3615} {"train_loss": -6.896720886230469, "global_step": 151846, "epoch": 3615} {"train_loss": -6.883506774902344, "global_step": 151847, "epoch": 3615} {"train_loss": -6.804745674133301, "global_step": 151848, "epoch": 3615} {"train_loss": -6.82404899597168, "global_step": 151849, "epoch": 3615} {"train_loss": -6.933672904968262, "global_step": 151850, "epoch": 3615} {"train_loss": -6.852462291717529, "global_step": 151851, "epoch": 3615} {"train_loss": -7.035145282745361, "global_step": 151852, "epoch": 3615} {"train_loss": -7.002084732055664, "global_step": 151853, "epoch": 3615} {"train_loss": -6.940793991088867, "global_step": 151854, "epoch": 3615} {"train_loss": -6.8885393142700195, "global_step": 151855, "epoch": 3615} {"train_loss": -6.916335105895996, "global_step": 151856, "epoch": 3615} {"train_loss": -6.910935401916504, "global_step": 151857, "epoch": 3615} {"train_loss": -6.874794960021973, "global_step": 151858, "epoch": 3615} {"train_loss": -6.802840709686279, "global_step": 151859, "epoch": 3615} {"train_loss": -6.869976043701172, "global_step": 151860, "epoch": 3615} {"train_loss": -6.873727798461914, "global_step": 151861, "epoch": 3615} {"train_loss": -6.672983169555664, "global_step": 151862, "epoch": 3615} {"train_loss": -6.815119743347168, "global_step": 151863, "epoch": 3615} {"train_loss": -6.873249530792236, "global_step": 151864, "epoch": 3615} {"train_loss": -6.817825794219971, "global_step": 151865, "epoch": 3615} {"train_loss": -6.768243789672852, "global_step": 151866, "epoch": 3615} {"train_loss": -6.949621677398682, "global_step": 151867, "epoch": 3615} {"train_loss": -6.895175457000732, "global_step": 151868, "epoch": 3615} {"train_loss": -6.860198020935059, "global_step": 151869, "epoch": 3615} {"train_loss": -6.830466270446777, "global_step": 151870, "epoch": 3615} {"train_loss": -6.860713743028187, "global_step": 151871, "epoch": 3615, "val_loss": 78729.75} {"train_loss": -6.942739486694336, "global_step": 151872, "epoch": 3616} {"train_loss": -6.948119163513184, "global_step": 151873, "epoch": 3616} {"train_loss": -6.956648349761963, "global_step": 151874, "epoch": 3616} {"train_loss": -6.852324485778809, "global_step": 151875, "epoch": 3616} {"train_loss": -6.94632625579834, "global_step": 151876, "epoch": 3616} {"train_loss": -6.77325439453125, "global_step": 151877, "epoch": 3616} {"train_loss": -6.9347991943359375, "global_step": 151878, "epoch": 3616} {"train_loss": -6.904621124267578, "global_step": 151879, "epoch": 3616} {"train_loss": -6.881045818328857, "global_step": 151880, "epoch": 3616} {"train_loss": -6.778651714324951, "global_step": 151881, "epoch": 3616} {"train_loss": -6.923837661743164, "global_step": 151882, "epoch": 3616} {"train_loss": -6.949625015258789, "global_step": 151883, "epoch": 3616} {"train_loss": -6.971471309661865, "global_step": 151884, "epoch": 3616} {"train_loss": -6.893678665161133, "global_step": 151885, "epoch": 3616} {"train_loss": -6.854327201843262, "global_step": 151886, "epoch": 3616} {"train_loss": -6.763597011566162, "global_step": 151887, "epoch": 3616} {"train_loss": -6.830066204071045, "global_step": 151888, "epoch": 3616} {"train_loss": -6.834716796875, "global_step": 151889, "epoch": 3616} {"train_loss": -6.963901042938232, "global_step": 151890, "epoch": 3616} {"train_loss": -6.7604522705078125, "global_step": 151891, "epoch": 3616} {"train_loss": -6.813757419586182, "global_step": 151892, "epoch": 3616} {"train_loss": -6.809526443481445, "global_step": 151893, "epoch": 3616} {"train_loss": -6.891186714172363, "global_step": 151894, "epoch": 3616} {"train_loss": -6.792213439941406, "global_step": 151895, "epoch": 3616} {"train_loss": -6.971654891967773, "global_step": 151896, "epoch": 3616} {"train_loss": -6.732604503631592, "global_step": 151897, "epoch": 3616} {"train_loss": -6.82890510559082, "global_step": 151898, "epoch": 3616} {"train_loss": -6.883326530456543, "global_step": 151899, "epoch": 3616} {"train_loss": -6.921108245849609, "global_step": 151900, "epoch": 3616} {"train_loss": -6.77814245223999, "global_step": 151901, "epoch": 3616} {"train_loss": -6.96689510345459, "global_step": 151902, "epoch": 3616} {"train_loss": -6.89579963684082, "global_step": 151903, "epoch": 3616} {"train_loss": -6.888436794281006, "global_step": 151904, "epoch": 3616} {"train_loss": -6.841898441314697, "global_step": 151905, "epoch": 3616} {"train_loss": -6.813377380371094, "global_step": 151906, "epoch": 3616} {"train_loss": -6.873236179351807, "global_step": 151907, "epoch": 3616} {"train_loss": -6.768009662628174, "global_step": 151908, "epoch": 3616} {"train_loss": -6.814495086669922, "global_step": 151909, "epoch": 3616} {"train_loss": -6.974459648132324, "global_step": 151910, "epoch": 3616} {"train_loss": -6.830010890960693, "global_step": 151911, "epoch": 3616} {"train_loss": -6.892606735229492, "global_step": 151912, "epoch": 3616} {"train_loss": -6.870722305207026, "global_step": 151913, "epoch": 3616, "val_loss": 79136.078125} {"train_loss": -6.78544282913208, "global_step": 151914, "epoch": 3617} {"train_loss": -6.918089866638184, "global_step": 151915, "epoch": 3617} {"train_loss": -7.066597938537598, "global_step": 151916, "epoch": 3617} {"train_loss": -6.807927131652832, "global_step": 151917, "epoch": 3617} {"train_loss": -6.934497356414795, "global_step": 151918, "epoch": 3617} {"train_loss": -6.916614532470703, "global_step": 151919, "epoch": 3617} {"train_loss": -6.996705055236816, "global_step": 151920, "epoch": 3617} {"train_loss": -6.918744087219238, "global_step": 151921, "epoch": 3617} {"train_loss": -6.998469352722168, "global_step": 151922, "epoch": 3617} {"train_loss": -6.943141460418701, "global_step": 151923, "epoch": 3617} {"train_loss": -6.812900543212891, "global_step": 151924, "epoch": 3617} {"train_loss": -6.938201904296875, "global_step": 151925, "epoch": 3617} {"train_loss": -6.960101127624512, "global_step": 151926, "epoch": 3617} {"train_loss": -6.8901777267456055, "global_step": 151927, "epoch": 3617} {"train_loss": -6.985712051391602, "global_step": 151928, "epoch": 3617} {"train_loss": -6.775432586669922, "global_step": 151929, "epoch": 3617} {"train_loss": -6.9572038650512695, "global_step": 151930, "epoch": 3617} {"train_loss": -6.959146976470947, "global_step": 151931, "epoch": 3617} {"train_loss": -6.893510341644287, "global_step": 151932, "epoch": 3617} {"train_loss": -6.955253601074219, "global_step": 151933, "epoch": 3617} {"train_loss": -6.910784721374512, "global_step": 151934, "epoch": 3617} {"train_loss": -6.9114155769348145, "global_step": 151935, "epoch": 3617} {"train_loss": -6.977458953857422, "global_step": 151936, "epoch": 3617} {"train_loss": -6.934484481811523, "global_step": 151937, "epoch": 3617} {"train_loss": -6.937810897827148, "global_step": 151938, "epoch": 3617} {"train_loss": -6.942972660064697, "global_step": 151939, "epoch": 3617} {"train_loss": -6.879010200500488, "global_step": 151940, "epoch": 3617} {"train_loss": -7.01033878326416, "global_step": 151941, "epoch": 3617} {"train_loss": -6.8966898918151855, "global_step": 151942, "epoch": 3617} {"train_loss": -6.810464859008789, "global_step": 151943, "epoch": 3617} {"train_loss": -7.007900714874268, "global_step": 151944, "epoch": 3617} {"train_loss": -6.850248336791992, "global_step": 151945, "epoch": 3617} {"train_loss": -6.81495475769043, "global_step": 151946, "epoch": 3617} {"train_loss": -6.78997802734375, "global_step": 151947, "epoch": 3617} {"train_loss": -6.900701522827148, "global_step": 151948, "epoch": 3617} {"train_loss": -6.815893173217773, "global_step": 151949, "epoch": 3617} {"train_loss": -6.8867387771606445, "global_step": 151950, "epoch": 3617} {"train_loss": -6.810530662536621, "global_step": 151951, "epoch": 3617} {"train_loss": -6.885066986083984, "global_step": 151952, "epoch": 3617} {"train_loss": -7.018365383148193, "global_step": 151953, "epoch": 3617} {"train_loss": -6.916770935058594, "global_step": 151954, "epoch": 3617} {"train_loss": -6.909454561415172, "global_step": 151955, "epoch": 3617, "val_loss": 78782.109375} {"train_loss": -6.879015922546387, "global_step": 151956, "epoch": 3618} {"train_loss": -6.994481563568115, "global_step": 151957, "epoch": 3618} {"train_loss": -6.905360698699951, "global_step": 151958, "epoch": 3618} {"train_loss": -6.91676139831543, "global_step": 151959, "epoch": 3618} {"train_loss": -6.811901092529297, "global_step": 151960, "epoch": 3618} {"train_loss": -6.760526657104492, "global_step": 151961, "epoch": 3618} {"train_loss": -6.963581085205078, "global_step": 151962, "epoch": 3618} {"train_loss": -6.904791831970215, "global_step": 151963, "epoch": 3618} {"train_loss": -6.81108283996582, "global_step": 151964, "epoch": 3618} {"train_loss": -6.836548805236816, "global_step": 151965, "epoch": 3618} {"train_loss": -6.61699914932251, "global_step": 151966, "epoch": 3618} {"train_loss": -6.882111072540283, "global_step": 151967, "epoch": 3618} {"train_loss": -6.916546821594238, "global_step": 151968, "epoch": 3618} {"train_loss": -6.929004669189453, "global_step": 151969, "epoch": 3618} {"train_loss": -6.923222541809082, "global_step": 151970, "epoch": 3618} {"train_loss": -6.764307022094727, "global_step": 151971, "epoch": 3618} {"train_loss": -6.82215690612793, "global_step": 151972, "epoch": 3618} {"train_loss": -6.795368194580078, "global_step": 151973, "epoch": 3618} {"train_loss": -6.940851211547852, "global_step": 151974, "epoch": 3618} {"train_loss": -6.725033760070801, "global_step": 151975, "epoch": 3618} {"train_loss": -6.67526912689209, "global_step": 151976, "epoch": 3618} {"train_loss": -6.913507461547852, "global_step": 151977, "epoch": 3618} {"train_loss": -6.81439733505249, "global_step": 151978, "epoch": 3618} {"train_loss": -6.799709796905518, "global_step": 151979, "epoch": 3618} {"train_loss": -6.840992450714111, "global_step": 151980, "epoch": 3618} {"train_loss": -6.695508003234863, "global_step": 151981, "epoch": 3618} {"train_loss": -6.74061918258667, "global_step": 151982, "epoch": 3618} {"train_loss": -6.708548545837402, "global_step": 151983, "epoch": 3618} {"train_loss": -6.819400787353516, "global_step": 151984, "epoch": 3618} {"train_loss": -6.809240341186523, "global_step": 151985, "epoch": 3618} {"train_loss": -6.822021484375, "global_step": 151986, "epoch": 3618} {"train_loss": -6.8745436668396, "global_step": 151987, "epoch": 3618} {"train_loss": -6.72332763671875, "global_step": 151988, "epoch": 3618} {"train_loss": -6.915145397186279, "global_step": 151989, "epoch": 3618} {"train_loss": -6.803799629211426, "global_step": 151990, "epoch": 3618} {"train_loss": -6.878454208374023, "global_step": 151991, "epoch": 3618} {"train_loss": -6.907988548278809, "global_step": 151992, "epoch": 3618} {"train_loss": -6.804368495941162, "global_step": 151993, "epoch": 3618} {"train_loss": -6.749650001525879, "global_step": 151994, "epoch": 3618} {"train_loss": -6.779026985168457, "global_step": 151995, "epoch": 3618} {"train_loss": -6.957446575164795, "global_step": 151996, "epoch": 3618} {"train_loss": -6.835578623272124, "global_step": 151997, "epoch": 3618, "val_loss": 78696.1953125} {"train_loss": -6.7974042892456055, "global_step": 151998, "epoch": 3619} {"train_loss": -6.963320732116699, "global_step": 151999, "epoch": 3619} {"train_loss": -6.929370880126953, "global_step": 152000, "epoch": 3619} {"train_loss": -6.9563069343566895, "global_step": 152001, "epoch": 3619} {"train_loss": -6.867114067077637, "global_step": 152002, "epoch": 3619} {"train_loss": -6.969958305358887, "global_step": 152003, "epoch": 3619} {"train_loss": -6.781364440917969, "global_step": 152004, "epoch": 3619} {"train_loss": -6.929778099060059, "global_step": 152005, "epoch": 3619} {"train_loss": -6.968435764312744, "global_step": 152006, "epoch": 3619} {"train_loss": -6.714942932128906, "global_step": 152007, "epoch": 3619} {"train_loss": -6.686698913574219, "global_step": 152008, "epoch": 3619} {"train_loss": -6.779581546783447, "global_step": 152009, "epoch": 3619} {"train_loss": -6.858075141906738, "global_step": 152010, "epoch": 3619} {"train_loss": -6.785697937011719, "global_step": 152011, "epoch": 3619} {"train_loss": -6.887251853942871, "global_step": 152012, "epoch": 3619} {"train_loss": -6.737229824066162, "global_step": 152013, "epoch": 3619} {"train_loss": -6.888751029968262, "global_step": 152014, "epoch": 3619} {"train_loss": -6.845440864562988, "global_step": 152015, "epoch": 3619} {"train_loss": -6.941502094268799, "global_step": 152016, "epoch": 3619} {"train_loss": -6.7888383865356445, "global_step": 152017, "epoch": 3619} {"train_loss": -6.8155694007873535, "global_step": 152018, "epoch": 3619} {"train_loss": -6.733906269073486, "global_step": 152019, "epoch": 3619} {"train_loss": -6.913558483123779, "global_step": 152020, "epoch": 3619} {"train_loss": -6.934078216552734, "global_step": 152021, "epoch": 3619} {"train_loss": -6.851815223693848, "global_step": 152022, "epoch": 3619} {"train_loss": -6.7868781089782715, "global_step": 152023, "epoch": 3619} {"train_loss": -6.775618553161621, "global_step": 152024, "epoch": 3619} {"train_loss": -6.8941779136657715, "global_step": 152025, "epoch": 3619} {"train_loss": -6.841927528381348, "global_step": 152026, "epoch": 3619} {"train_loss": -6.8735432624816895, "global_step": 152027, "epoch": 3619} {"train_loss": -6.797555923461914, "global_step": 152028, "epoch": 3619} {"train_loss": -6.960707187652588, "global_step": 152029, "epoch": 3619} {"train_loss": -6.910191535949707, "global_step": 152030, "epoch": 3619} {"train_loss": -6.851699352264404, "global_step": 152031, "epoch": 3619} {"train_loss": -6.7962164878845215, "global_step": 152032, "epoch": 3619} {"train_loss": -6.855908393859863, "global_step": 152033, "epoch": 3619} {"train_loss": -6.936964988708496, "global_step": 152034, "epoch": 3619} {"train_loss": -6.921796798706055, "global_step": 152035, "epoch": 3619} {"train_loss": -6.901654243469238, "global_step": 152036, "epoch": 3619} {"train_loss": -6.8357744216918945, "global_step": 152037, "epoch": 3619} {"train_loss": -6.925465106964111, "global_step": 152038, "epoch": 3619} {"train_loss": -6.860434872763498, "global_step": 152039, "epoch": 3619, "val_loss": 78865.8984375} {"train_loss": -6.85495662689209, "global_step": 152040, "epoch": 3620} {"train_loss": -6.935086250305176, "global_step": 152041, "epoch": 3620} {"train_loss": -6.850849151611328, "global_step": 152042, "epoch": 3620} {"train_loss": -6.943861484527588, "global_step": 152043, "epoch": 3620} {"train_loss": -6.8998308181762695, "global_step": 152044, "epoch": 3620} {"train_loss": -6.956989288330078, "global_step": 152045, "epoch": 3620} {"train_loss": -6.99362325668335, "global_step": 152046, "epoch": 3620} {"train_loss": -7.013895034790039, "global_step": 152047, "epoch": 3620} {"train_loss": -6.939851760864258, "global_step": 152048, "epoch": 3620} {"train_loss": -6.968717098236084, "global_step": 152049, "epoch": 3620} {"train_loss": -6.920572280883789, "global_step": 152050, "epoch": 3620} {"train_loss": -6.947484970092773, "global_step": 152051, "epoch": 3620} {"train_loss": -6.991551876068115, "global_step": 152052, "epoch": 3620} {"train_loss": -6.922128677368164, "global_step": 152053, "epoch": 3620} {"train_loss": -6.763397216796875, "global_step": 152054, "epoch": 3620} {"train_loss": -6.898415565490723, "global_step": 152055, "epoch": 3620} {"train_loss": -6.920101642608643, "global_step": 152056, "epoch": 3620} {"train_loss": -6.864267349243164, "global_step": 152057, "epoch": 3620} {"train_loss": -6.932980537414551, "global_step": 152058, "epoch": 3620} {"train_loss": -6.923890113830566, "global_step": 152059, "epoch": 3620} {"train_loss": -6.837128162384033, "global_step": 152060, "epoch": 3620} {"train_loss": -6.826827526092529, "global_step": 152061, "epoch": 3620} {"train_loss": -6.744307518005371, "global_step": 152062, "epoch": 3620} {"train_loss": -6.773452281951904, "global_step": 152063, "epoch": 3620} {"train_loss": -6.857318878173828, "global_step": 152064, "epoch": 3620} {"train_loss": -6.793199062347412, "global_step": 152065, "epoch": 3620} {"train_loss": -6.95133113861084, "global_step": 152066, "epoch": 3620} {"train_loss": -6.827069282531738, "global_step": 152067, "epoch": 3620} {"train_loss": -6.812565803527832, "global_step": 152068, "epoch": 3620} {"train_loss": -6.829104423522949, "global_step": 152069, "epoch": 3620} {"train_loss": -6.712108612060547, "global_step": 152070, "epoch": 3620} {"train_loss": -6.791593074798584, "global_step": 152071, "epoch": 3620} {"train_loss": -6.71840238571167, "global_step": 152072, "epoch": 3620} {"train_loss": -6.829643726348877, "global_step": 152073, "epoch": 3620} {"train_loss": -6.857583045959473, "global_step": 152074, "epoch": 3620} {"train_loss": -6.760249137878418, "global_step": 152075, "epoch": 3620} {"train_loss": -6.924185276031494, "global_step": 152076, "epoch": 3620} {"train_loss": -6.856540679931641, "global_step": 152077, "epoch": 3620} {"train_loss": -6.885693550109863, "global_step": 152078, "epoch": 3620} {"train_loss": -6.8862152099609375, "global_step": 152079, "epoch": 3620} {"train_loss": -6.79325008392334, "global_step": 152080, "epoch": 3620} {"train_loss": -6.870403062729609, "global_step": 152081, "epoch": 3620, "val_loss": 78859.8515625} {"train_loss": -6.835667133331299, "global_step": 152082, "epoch": 3621} {"train_loss": -6.78548526763916, "global_step": 152083, "epoch": 3621} {"train_loss": -6.863812446594238, "global_step": 152084, "epoch": 3621} {"train_loss": -6.8288068771362305, "global_step": 152085, "epoch": 3621} {"train_loss": -6.865267753601074, "global_step": 152086, "epoch": 3621} {"train_loss": -6.912275314331055, "global_step": 152087, "epoch": 3621} {"train_loss": -6.691806793212891, "global_step": 152088, "epoch": 3621} {"train_loss": -6.863760948181152, "global_step": 152089, "epoch": 3621} {"train_loss": -6.73552942276001, "global_step": 152090, "epoch": 3621} {"train_loss": -6.8898186683654785, "global_step": 152091, "epoch": 3621} {"train_loss": -6.985011100769043, "global_step": 152092, "epoch": 3621} {"train_loss": -6.78559684753418, "global_step": 152093, "epoch": 3621} {"train_loss": -6.9406418800354, "global_step": 152094, "epoch": 3621} {"train_loss": -6.896844387054443, "global_step": 152095, "epoch": 3621} {"train_loss": -6.808679103851318, "global_step": 152096, "epoch": 3621} {"train_loss": -6.873486042022705, "global_step": 152097, "epoch": 3621} {"train_loss": -6.830822467803955, "global_step": 152098, "epoch": 3621} {"train_loss": -6.949347496032715, "global_step": 152099, "epoch": 3621} {"train_loss": -6.928106784820557, "global_step": 152100, "epoch": 3621} {"train_loss": -6.801831245422363, "global_step": 152101, "epoch": 3621} {"train_loss": -6.798614025115967, "global_step": 152102, "epoch": 3621} {"train_loss": -6.842292308807373, "global_step": 152103, "epoch": 3621} {"train_loss": -6.88378381729126, "global_step": 152104, "epoch": 3621} {"train_loss": -6.777985095977783, "global_step": 152105, "epoch": 3621} {"train_loss": -6.924101829528809, "global_step": 152106, "epoch": 3621} {"train_loss": -6.789392471313477, "global_step": 152107, "epoch": 3621} {"train_loss": -6.825387477874756, "global_step": 152108, "epoch": 3621} {"train_loss": -6.816278457641602, "global_step": 152109, "epoch": 3621} {"train_loss": -6.84627103805542, "global_step": 152110, "epoch": 3621} {"train_loss": -6.768587112426758, "global_step": 152111, "epoch": 3621} {"train_loss": -6.946843147277832, "global_step": 152112, "epoch": 3621} {"train_loss": -6.920838356018066, "global_step": 152113, "epoch": 3621} {"train_loss": -6.804786682128906, "global_step": 152114, "epoch": 3621} {"train_loss": -6.802617073059082, "global_step": 152115, "epoch": 3621} {"train_loss": -6.8082098960876465, "global_step": 152116, "epoch": 3621} {"train_loss": -6.774225234985352, "global_step": 152117, "epoch": 3621} {"train_loss": -6.904401779174805, "global_step": 152118, "epoch": 3621} {"train_loss": -6.839615821838379, "global_step": 152119, "epoch": 3621} {"train_loss": -6.970584869384766, "global_step": 152120, "epoch": 3621} {"train_loss": -6.872074127197266, "global_step": 152121, "epoch": 3621} {"train_loss": -6.833379745483398, "global_step": 152122, "epoch": 3621} {"train_loss": -6.848479475293841, "global_step": 152123, "epoch": 3621, "val_loss": 78645.9140625} {"train_loss": -6.76844596862793, "global_step": 152124, "epoch": 3622} {"train_loss": -6.891376972198486, "global_step": 152125, "epoch": 3622} {"train_loss": -6.768804550170898, "global_step": 152126, "epoch": 3622} {"train_loss": -6.91910457611084, "global_step": 152127, "epoch": 3622} {"train_loss": -6.919563293457031, "global_step": 152128, "epoch": 3622} {"train_loss": -6.814583778381348, "global_step": 152129, "epoch": 3622} {"train_loss": -6.935871124267578, "global_step": 152130, "epoch": 3622} {"train_loss": -6.88736629486084, "global_step": 152131, "epoch": 3622} {"train_loss": -6.894009590148926, "global_step": 152132, "epoch": 3622} {"train_loss": -6.856257438659668, "global_step": 152133, "epoch": 3622} {"train_loss": -6.896617889404297, "global_step": 152134, "epoch": 3622} {"train_loss": -6.881608009338379, "global_step": 152135, "epoch": 3622} {"train_loss": -6.839158058166504, "global_step": 152136, "epoch": 3622} {"train_loss": -6.765565395355225, "global_step": 152137, "epoch": 3622} {"train_loss": -6.904651641845703, "global_step": 152138, "epoch": 3622} {"train_loss": -6.948992729187012, "global_step": 152139, "epoch": 3622} {"train_loss": -6.815206050872803, "global_step": 152140, "epoch": 3622} {"train_loss": -6.781572341918945, "global_step": 152141, "epoch": 3622} {"train_loss": -6.896317005157471, "global_step": 152142, "epoch": 3622} {"train_loss": -6.9524455070495605, "global_step": 152143, "epoch": 3622} {"train_loss": -6.916766166687012, "global_step": 152144, "epoch": 3622} {"train_loss": -6.983091354370117, "global_step": 152145, "epoch": 3622} {"train_loss": -6.941481113433838, "global_step": 152146, "epoch": 3622} {"train_loss": -7.028759956359863, "global_step": 152147, "epoch": 3622} {"train_loss": -6.9088969230651855, "global_step": 152148, "epoch": 3622} {"train_loss": -6.885712146759033, "global_step": 152149, "epoch": 3622} {"train_loss": -6.85931396484375, "global_step": 152150, "epoch": 3622} {"train_loss": -6.868126392364502, "global_step": 152151, "epoch": 3622} {"train_loss": -7.079846382141113, "global_step": 152152, "epoch": 3622} {"train_loss": -7.004085540771484, "global_step": 152153, "epoch": 3622} {"train_loss": -6.881902694702148, "global_step": 152154, "epoch": 3622} {"train_loss": -6.885138511657715, "global_step": 152155, "epoch": 3622} {"train_loss": -6.888802528381348, "global_step": 152156, "epoch": 3622} {"train_loss": -6.835165977478027, "global_step": 152157, "epoch": 3622} {"train_loss": -6.783414363861084, "global_step": 152158, "epoch": 3622} {"train_loss": -6.921239852905273, "global_step": 152159, "epoch": 3622} {"train_loss": -6.836055755615234, "global_step": 152160, "epoch": 3622} {"train_loss": -6.905357360839844, "global_step": 152161, "epoch": 3622} {"train_loss": -6.854552745819092, "global_step": 152162, "epoch": 3622} {"train_loss": -6.881091594696045, "global_step": 152163, "epoch": 3622} {"train_loss": -6.8888325691223145, "global_step": 152164, "epoch": 3622} {"train_loss": -6.88989215805417, "global_step": 152165, "epoch": 3622, "val_loss": 78927.484375} {"train_loss": -6.9001970291137695, "global_step": 152166, "epoch": 3623} {"train_loss": -6.894338607788086, "global_step": 152167, "epoch": 3623} {"train_loss": -6.799042224884033, "global_step": 152168, "epoch": 3623} {"train_loss": -6.8115010261535645, "global_step": 152169, "epoch": 3623} {"train_loss": -6.706162452697754, "global_step": 152170, "epoch": 3623} {"train_loss": -6.827657699584961, "global_step": 152171, "epoch": 3623} {"train_loss": -6.830521583557129, "global_step": 152172, "epoch": 3623} {"train_loss": -6.86258602142334, "global_step": 152173, "epoch": 3623} {"train_loss": -6.845987796783447, "global_step": 152174, "epoch": 3623} {"train_loss": -6.844128131866455, "global_step": 152175, "epoch": 3623} {"train_loss": -6.875543594360352, "global_step": 152176, "epoch": 3623} {"train_loss": -6.835046768188477, "global_step": 152177, "epoch": 3623} {"train_loss": -6.8152360916137695, "global_step": 152178, "epoch": 3623} {"train_loss": -6.895623207092285, "global_step": 152179, "epoch": 3623} {"train_loss": -6.760906219482422, "global_step": 152180, "epoch": 3623} {"train_loss": -6.895802021026611, "global_step": 152181, "epoch": 3623} {"train_loss": -6.927867889404297, "global_step": 152182, "epoch": 3623} {"train_loss": -6.841675758361816, "global_step": 152183, "epoch": 3623} {"train_loss": -6.897364616394043, "global_step": 152184, "epoch": 3623} {"train_loss": -6.934209823608398, "global_step": 152185, "epoch": 3623} {"train_loss": -6.899792671203613, "global_step": 152186, "epoch": 3623} {"train_loss": -6.969671726226807, "global_step": 152187, "epoch": 3623} {"train_loss": -6.989031791687012, "global_step": 152188, "epoch": 3623} {"train_loss": -7.013084411621094, "global_step": 152189, "epoch": 3623} {"train_loss": -6.955765724182129, "global_step": 152190, "epoch": 3623} {"train_loss": -6.968377113342285, "global_step": 152191, "epoch": 3623} {"train_loss": -6.909849643707275, "global_step": 152192, "epoch": 3623} {"train_loss": -6.9334330558776855, "global_step": 152193, "epoch": 3623} {"train_loss": -6.950671195983887, "global_step": 152194, "epoch": 3623} {"train_loss": -7.0287041664123535, "global_step": 152195, "epoch": 3623} {"train_loss": -6.963499546051025, "global_step": 152196, "epoch": 3623} {"train_loss": -6.942059516906738, "global_step": 152197, "epoch": 3623} {"train_loss": -6.836758136749268, "global_step": 152198, "epoch": 3623} {"train_loss": -7.031534194946289, "global_step": 152199, "epoch": 3623} {"train_loss": -7.115630626678467, "global_step": 152200, "epoch": 3623} {"train_loss": -6.929619789123535, "global_step": 152201, "epoch": 3623} {"train_loss": -6.922183990478516, "global_step": 152202, "epoch": 3623} {"train_loss": -7.069022178649902, "global_step": 152203, "epoch": 3623} {"train_loss": -6.930069923400879, "global_step": 152204, "epoch": 3623} {"train_loss": -6.7640790939331055, "global_step": 152205, "epoch": 3623} {"train_loss": -6.88295841217041, "global_step": 152206, "epoch": 3623} {"train_loss": -6.903137876873925, "global_step": 152207, "epoch": 3623, "val_loss": 78807.5859375} {"train_loss": -6.899247169494629, "global_step": 152208, "epoch": 3624} {"train_loss": -6.946043491363525, "global_step": 152209, "epoch": 3624} {"train_loss": -6.976187705993652, "global_step": 152210, "epoch": 3624} {"train_loss": -6.972936630249023, "global_step": 152211, "epoch": 3624} {"train_loss": -6.950048446655273, "global_step": 152212, "epoch": 3624} {"train_loss": -6.873064041137695, "global_step": 152213, "epoch": 3624} {"train_loss": -7.0688252449035645, "global_step": 152214, "epoch": 3624} {"train_loss": -6.836447715759277, "global_step": 152215, "epoch": 3624} {"train_loss": -6.726922988891602, "global_step": 152216, "epoch": 3624} {"train_loss": -6.864725112915039, "global_step": 152217, "epoch": 3624} {"train_loss": -6.888433456420898, "global_step": 152218, "epoch": 3624} {"train_loss": -6.7752580642700195, "global_step": 152219, "epoch": 3624} {"train_loss": -6.595441818237305, "global_step": 152220, "epoch": 3624} {"train_loss": -6.945156097412109, "global_step": 152221, "epoch": 3624} {"train_loss": -6.854150772094727, "global_step": 152222, "epoch": 3624} {"train_loss": -6.678229331970215, "global_step": 152223, "epoch": 3624} {"train_loss": -6.716448783874512, "global_step": 152224, "epoch": 3624} {"train_loss": -6.808087348937988, "global_step": 152225, "epoch": 3624} {"train_loss": -6.660445213317871, "global_step": 152226, "epoch": 3624} {"train_loss": -6.882978439331055, "global_step": 152227, "epoch": 3624} {"train_loss": -6.810630798339844, "global_step": 152228, "epoch": 3624} {"train_loss": -6.867402076721191, "global_step": 152229, "epoch": 3624} {"train_loss": -6.797938823699951, "global_step": 152230, "epoch": 3624} {"train_loss": -6.708497047424316, "global_step": 152231, "epoch": 3624} {"train_loss": -6.81156587600708, "global_step": 152232, "epoch": 3624} {"train_loss": -6.7382893562316895, "global_step": 152233, "epoch": 3624} {"train_loss": -6.873863220214844, "global_step": 152234, "epoch": 3624} {"train_loss": -6.964079856872559, "global_step": 152235, "epoch": 3624} {"train_loss": -6.667445182800293, "global_step": 152236, "epoch": 3624} {"train_loss": -6.855898857116699, "global_step": 152237, "epoch": 3624} {"train_loss": -6.81453800201416, "global_step": 152238, "epoch": 3624} {"train_loss": -6.879217147827148, "global_step": 152239, "epoch": 3624} {"train_loss": -6.909762382507324, "global_step": 152240, "epoch": 3624} {"train_loss": -6.7444281578063965, "global_step": 152241, "epoch": 3624} {"train_loss": -6.819006443023682, "global_step": 152242, "epoch": 3624} {"train_loss": -6.8473944664001465, "global_step": 152243, "epoch": 3624} {"train_loss": -6.999762535095215, "global_step": 152244, "epoch": 3624} {"train_loss": -6.7725701332092285, "global_step": 152245, "epoch": 3624} {"train_loss": -6.899800777435303, "global_step": 152246, "epoch": 3624} {"train_loss": -6.810242652893066, "global_step": 152247, "epoch": 3624} {"train_loss": -6.806310653686523, "global_step": 152248, "epoch": 3624} {"train_loss": -6.8412300405048185, "global_step": 152249, "epoch": 3624, "val_loss": 78689.6328125} {"train_loss": -7.001936912536621, "global_step": 152250, "epoch": 3625} {"train_loss": -6.889852523803711, "global_step": 152251, "epoch": 3625} {"train_loss": -6.966283321380615, "global_step": 152252, "epoch": 3625} {"train_loss": -6.909730911254883, "global_step": 152253, "epoch": 3625} {"train_loss": -6.998483180999756, "global_step": 152254, "epoch": 3625} {"train_loss": -6.8822832107543945, "global_step": 152255, "epoch": 3625} {"train_loss": -6.880718231201172, "global_step": 152256, "epoch": 3625} {"train_loss": -6.888859748840332, "global_step": 152257, "epoch": 3625} {"train_loss": -6.850963592529297, "global_step": 152258, "epoch": 3625} {"train_loss": -6.812826156616211, "global_step": 152259, "epoch": 3625} {"train_loss": -6.852791786193848, "global_step": 152260, "epoch": 3625} {"train_loss": -6.921294212341309, "global_step": 152261, "epoch": 3625} {"train_loss": -6.888702392578125, "global_step": 152262, "epoch": 3625} {"train_loss": -6.746974945068359, "global_step": 152263, "epoch": 3625} {"train_loss": -6.81663703918457, "global_step": 152264, "epoch": 3625} {"train_loss": -6.813828468322754, "global_step": 152265, "epoch": 3625} {"train_loss": -6.6674604415893555, "global_step": 152266, "epoch": 3625} {"train_loss": -6.737575054168701, "global_step": 152267, "epoch": 3625} {"train_loss": -6.934412002563477, "global_step": 152268, "epoch": 3625} {"train_loss": -6.865704536437988, "global_step": 152269, "epoch": 3625} {"train_loss": -6.774700164794922, "global_step": 152270, "epoch": 3625} {"train_loss": -6.734448432922363, "global_step": 152271, "epoch": 3625} {"train_loss": -6.7349700927734375, "global_step": 152272, "epoch": 3625} {"train_loss": -6.902477264404297, "global_step": 152273, "epoch": 3625} {"train_loss": -6.779218673706055, "global_step": 152274, "epoch": 3625} {"train_loss": -6.695751190185547, "global_step": 152275, "epoch": 3625} {"train_loss": -6.680335521697998, "global_step": 152276, "epoch": 3625} {"train_loss": -6.60750675201416, "global_step": 152277, "epoch": 3625} {"train_loss": -6.800519943237305, "global_step": 152278, "epoch": 3625} {"train_loss": -6.504683494567871, "global_step": 152279, "epoch": 3625} {"train_loss": -6.849260330200195, "global_step": 152280, "epoch": 3625} {"train_loss": -6.577851295471191, "global_step": 152281, "epoch": 3625} {"train_loss": -6.6747822761535645, "global_step": 152282, "epoch": 3625} {"train_loss": -6.483095169067383, "global_step": 152283, "epoch": 3625} {"train_loss": -6.6868414878845215, "global_step": 152284, "epoch": 3625} {"train_loss": -6.717685222625732, "global_step": 152285, "epoch": 3625} {"train_loss": -6.754969596862793, "global_step": 152286, "epoch": 3625} {"train_loss": -6.589502334594727, "global_step": 152287, "epoch": 3625} {"train_loss": -6.655248641967773, "global_step": 152288, "epoch": 3625} {"train_loss": -6.664078712463379, "global_step": 152289, "epoch": 3625} {"train_loss": -6.697379112243652, "global_step": 152290, "epoch": 3625} {"train_loss": -6.776719729105632, "global_step": 152291, "epoch": 3625, "val_loss": 79469.3359375} {"train_loss": -6.658324241638184, "global_step": 152292, "epoch": 3626} {"train_loss": -6.77398681640625, "global_step": 152293, "epoch": 3626} {"train_loss": -6.62644624710083, "global_step": 152294, "epoch": 3626} {"train_loss": -6.920604705810547, "global_step": 152295, "epoch": 3626} {"train_loss": -6.857602119445801, "global_step": 152296, "epoch": 3626} {"train_loss": -6.854213714599609, "global_step": 152297, "epoch": 3626} {"train_loss": -6.78617000579834, "global_step": 152298, "epoch": 3626} {"train_loss": -6.84100341796875, "global_step": 152299, "epoch": 3626} {"train_loss": -6.826681137084961, "global_step": 152300, "epoch": 3626} {"train_loss": -6.692627429962158, "global_step": 152301, "epoch": 3626} {"train_loss": -6.943638801574707, "global_step": 152302, "epoch": 3626} {"train_loss": -6.7880377769470215, "global_step": 152303, "epoch": 3626} {"train_loss": -6.785696983337402, "global_step": 152304, "epoch": 3626} {"train_loss": -6.76842737197876, "global_step": 152305, "epoch": 3626} {"train_loss": -6.8454461097717285, "global_step": 152306, "epoch": 3626} {"train_loss": -6.733592987060547, "global_step": 152307, "epoch": 3626} {"train_loss": -6.905269622802734, "global_step": 152308, "epoch": 3626} {"train_loss": -6.8752336502075195, "global_step": 152309, "epoch": 3626} {"train_loss": -6.835333824157715, "global_step": 152310, "epoch": 3626} {"train_loss": -6.731451988220215, "global_step": 152311, "epoch": 3626} {"train_loss": -6.913034439086914, "global_step": 152312, "epoch": 3626} {"train_loss": -6.725097179412842, "global_step": 152313, "epoch": 3626} {"train_loss": -6.96418571472168, "global_step": 152314, "epoch": 3626} {"train_loss": -6.761168956756592, "global_step": 152315, "epoch": 3626} {"train_loss": -6.96533203125, "global_step": 152316, "epoch": 3626} {"train_loss": -6.815392971038818, "global_step": 152317, "epoch": 3626} {"train_loss": -6.814601898193359, "global_step": 152318, "epoch": 3626} {"train_loss": -6.850766658782959, "global_step": 152319, "epoch": 3626} {"train_loss": -6.887265205383301, "global_step": 152320, "epoch": 3626} {"train_loss": -6.801804542541504, "global_step": 152321, "epoch": 3626} {"train_loss": -6.938451766967773, "global_step": 152322, "epoch": 3626} {"train_loss": -7.029017448425293, "global_step": 152323, "epoch": 3626} {"train_loss": -6.887135982513428, "global_step": 152324, "epoch": 3626} {"train_loss": -7.048091411590576, "global_step": 152325, "epoch": 3626} {"train_loss": -6.88682746887207, "global_step": 152326, "epoch": 3626} {"train_loss": -6.954252243041992, "global_step": 152327, "epoch": 3626} {"train_loss": -6.873332977294922, "global_step": 152328, "epoch": 3626} {"train_loss": -7.016368389129639, "global_step": 152329, "epoch": 3626} {"train_loss": -6.984587669372559, "global_step": 152330, "epoch": 3626} {"train_loss": -6.861043930053711, "global_step": 152331, "epoch": 3626} {"train_loss": -6.906647682189941, "global_step": 152332, "epoch": 3626} {"train_loss": -6.854906797409058, "global_step": 152333, "epoch": 3626, "val_loss": 78695.2109375} {"train_loss": -6.8227105140686035, "global_step": 152334, "epoch": 3627} {"train_loss": -7.001313209533691, "global_step": 152335, "epoch": 3627} {"train_loss": -7.0611114501953125, "global_step": 152336, "epoch": 3627} {"train_loss": -6.985660552978516, "global_step": 152337, "epoch": 3627} {"train_loss": -6.9487152099609375, "global_step": 152338, "epoch": 3627} {"train_loss": -7.003059387207031, "global_step": 152339, "epoch": 3627} {"train_loss": -6.861403465270996, "global_step": 152340, "epoch": 3627} {"train_loss": -6.980410575866699, "global_step": 152341, "epoch": 3627} {"train_loss": -6.993820667266846, "global_step": 152342, "epoch": 3627} {"train_loss": -6.853365898132324, "global_step": 152343, "epoch": 3627} {"train_loss": -6.82869815826416, "global_step": 152344, "epoch": 3627} {"train_loss": -6.828130722045898, "global_step": 152345, "epoch": 3627} {"train_loss": -6.826662063598633, "global_step": 152346, "epoch": 3627} {"train_loss": -6.912032604217529, "global_step": 152347, "epoch": 3627} {"train_loss": -6.815437316894531, "global_step": 152348, "epoch": 3627} {"train_loss": -6.938139915466309, "global_step": 152349, "epoch": 3627} {"train_loss": -6.927495956420898, "global_step": 152350, "epoch": 3627} {"train_loss": -6.891949653625488, "global_step": 152351, "epoch": 3627} {"train_loss": -6.959892272949219, "global_step": 152352, "epoch": 3627} {"train_loss": -6.803318977355957, "global_step": 152353, "epoch": 3627} {"train_loss": -6.8463311195373535, "global_step": 152354, "epoch": 3627} {"train_loss": -6.7083964347839355, "global_step": 152355, "epoch": 3627} {"train_loss": -6.83150577545166, "global_step": 152356, "epoch": 3627} {"train_loss": -6.777997016906738, "global_step": 152357, "epoch": 3627} {"train_loss": -6.931715965270996, "global_step": 152358, "epoch": 3627} {"train_loss": -6.821624755859375, "global_step": 152359, "epoch": 3627} {"train_loss": -6.740068435668945, "global_step": 152360, "epoch": 3627} {"train_loss": -6.79500675201416, "global_step": 152361, "epoch": 3627} {"train_loss": -6.803929328918457, "global_step": 152362, "epoch": 3627} {"train_loss": -6.870166778564453, "global_step": 152363, "epoch": 3627} {"train_loss": -6.734442234039307, "global_step": 152364, "epoch": 3627} {"train_loss": -6.860324859619141, "global_step": 152365, "epoch": 3627} {"train_loss": -6.81733512878418, "global_step": 152366, "epoch": 3627} {"train_loss": -6.868537902832031, "global_step": 152367, "epoch": 3627} {"train_loss": -6.808266639709473, "global_step": 152368, "epoch": 3627} {"train_loss": -6.82540225982666, "global_step": 152369, "epoch": 3627} {"train_loss": -6.859942436218262, "global_step": 152370, "epoch": 3627} {"train_loss": -6.818456172943115, "global_step": 152371, "epoch": 3627} {"train_loss": -6.9355573654174805, "global_step": 152372, "epoch": 3627} {"train_loss": -6.991212844848633, "global_step": 152373, "epoch": 3627} {"train_loss": -6.987590789794922, "global_step": 152374, "epoch": 3627} {"train_loss": -6.87511894816444, "global_step": 152375, "epoch": 3627, "val_loss": 78629.5859375} {"train_loss": -6.909920692443848, "global_step": 152376, "epoch": 3628} {"train_loss": -6.95851469039917, "global_step": 152377, "epoch": 3628} {"train_loss": -6.907266616821289, "global_step": 152378, "epoch": 3628} {"train_loss": -6.879727363586426, "global_step": 152379, "epoch": 3628} {"train_loss": -6.887613296508789, "global_step": 152380, "epoch": 3628} {"train_loss": -6.886155128479004, "global_step": 152381, "epoch": 3628} {"train_loss": -6.882957935333252, "global_step": 152382, "epoch": 3628} {"train_loss": -6.848132133483887, "global_step": 152383, "epoch": 3628} {"train_loss": -6.893824577331543, "global_step": 152384, "epoch": 3628} {"train_loss": -6.886773109436035, "global_step": 152385, "epoch": 3628} {"train_loss": -6.678945541381836, "global_step": 152386, "epoch": 3628} {"train_loss": -6.947292327880859, "global_step": 152387, "epoch": 3628} {"train_loss": -6.861136436462402, "global_step": 152388, "epoch": 3628} {"train_loss": -6.8184990882873535, "global_step": 152389, "epoch": 3628} {"train_loss": -6.8259358406066895, "global_step": 152390, "epoch": 3628} {"train_loss": -6.77092981338501, "global_step": 152391, "epoch": 3628} {"train_loss": -6.764806747436523, "global_step": 152392, "epoch": 3628} {"train_loss": -6.807005882263184, "global_step": 152393, "epoch": 3628} {"train_loss": -6.8425984382629395, "global_step": 152394, "epoch": 3628} {"train_loss": -6.877586841583252, "global_step": 152395, "epoch": 3628} {"train_loss": -6.833744049072266, "global_step": 152396, "epoch": 3628} {"train_loss": -6.8215436935424805, "global_step": 152397, "epoch": 3628} {"train_loss": -6.801061153411865, "global_step": 152398, "epoch": 3628} {"train_loss": -6.901532173156738, "global_step": 152399, "epoch": 3628} {"train_loss": -6.791152000427246, "global_step": 152400, "epoch": 3628} {"train_loss": -6.811829090118408, "global_step": 152401, "epoch": 3628} {"train_loss": -6.784316062927246, "global_step": 152402, "epoch": 3628} {"train_loss": -6.779227256774902, "global_step": 152403, "epoch": 3628} {"train_loss": -6.77969217300415, "global_step": 152404, "epoch": 3628} {"train_loss": -6.734515190124512, "global_step": 152405, "epoch": 3628} {"train_loss": -6.802512168884277, "global_step": 152406, "epoch": 3628} {"train_loss": -6.813206672668457, "global_step": 152407, "epoch": 3628} {"train_loss": -6.858270645141602, "global_step": 152408, "epoch": 3628} {"train_loss": -6.832534313201904, "global_step": 152409, "epoch": 3628} {"train_loss": -6.856378555297852, "global_step": 152410, "epoch": 3628} {"train_loss": -6.766091346740723, "global_step": 152411, "epoch": 3628} {"train_loss": -6.969664573669434, "global_step": 152412, "epoch": 3628} {"train_loss": -6.826781272888184, "global_step": 152413, "epoch": 3628} {"train_loss": -6.855000019073486, "global_step": 152414, "epoch": 3628} {"train_loss": -6.848418235778809, "global_step": 152415, "epoch": 3628} {"train_loss": -6.861687660217285, "global_step": 152416, "epoch": 3628} {"train_loss": -6.843422571818034, "global_step": 152417, "epoch": 3628, "val_loss": 78791.5078125} {"train_loss": -6.891335487365723, "global_step": 152418, "epoch": 3629} {"train_loss": -6.961603164672852, "global_step": 152419, "epoch": 3629} {"train_loss": -6.930325984954834, "global_step": 152420, "epoch": 3629} {"train_loss": -6.886075973510742, "global_step": 152421, "epoch": 3629} {"train_loss": -6.897582530975342, "global_step": 152422, "epoch": 3629} {"train_loss": -6.86374568939209, "global_step": 152423, "epoch": 3629} {"train_loss": -6.814960956573486, "global_step": 152424, "epoch": 3629} {"train_loss": -6.821422100067139, "global_step": 152425, "epoch": 3629} {"train_loss": -6.902325630187988, "global_step": 152426, "epoch": 3629} {"train_loss": -6.951828956604004, "global_step": 152427, "epoch": 3629} {"train_loss": -6.96702766418457, "global_step": 152428, "epoch": 3629} {"train_loss": -7.012619972229004, "global_step": 152429, "epoch": 3629} {"train_loss": -6.850758075714111, "global_step": 152430, "epoch": 3629} {"train_loss": -6.877199172973633, "global_step": 152431, "epoch": 3629} {"train_loss": -6.943751335144043, "global_step": 152432, "epoch": 3629} {"train_loss": -6.914802551269531, "global_step": 152433, "epoch": 3629} {"train_loss": -6.925919532775879, "global_step": 152434, "epoch": 3629} {"train_loss": -6.97106409072876, "global_step": 152435, "epoch": 3629} {"train_loss": -7.057956218719482, "global_step": 152436, "epoch": 3629} {"train_loss": -6.994490146636963, "global_step": 152437, "epoch": 3629} {"train_loss": -6.962144374847412, "global_step": 152438, "epoch": 3629} {"train_loss": -6.852824687957764, "global_step": 152439, "epoch": 3629} {"train_loss": -6.9227800369262695, "global_step": 152440, "epoch": 3629} {"train_loss": -6.878353118896484, "global_step": 152441, "epoch": 3629} {"train_loss": -7.046158790588379, "global_step": 152442, "epoch": 3629} {"train_loss": -6.827534198760986, "global_step": 152443, "epoch": 3629} {"train_loss": -7.01031494140625, "global_step": 152444, "epoch": 3629} {"train_loss": -6.895759105682373, "global_step": 152445, "epoch": 3629} {"train_loss": -6.940279960632324, "global_step": 152446, "epoch": 3629} {"train_loss": -6.909490585327148, "global_step": 152447, "epoch": 3629} {"train_loss": -6.97015905380249, "global_step": 152448, "epoch": 3629} {"train_loss": -6.956127166748047, "global_step": 152449, "epoch": 3629} {"train_loss": -6.88953161239624, "global_step": 152450, "epoch": 3629} {"train_loss": -6.937027931213379, "global_step": 152451, "epoch": 3629} {"train_loss": -6.91736364364624, "global_step": 152452, "epoch": 3629} {"train_loss": -6.99545431137085, "global_step": 152453, "epoch": 3629} {"train_loss": -6.83920955657959, "global_step": 152454, "epoch": 3629} {"train_loss": -6.873532295227051, "global_step": 152455, "epoch": 3629} {"train_loss": -6.871022701263428, "global_step": 152456, "epoch": 3629} {"train_loss": -6.852844715118408, "global_step": 152457, "epoch": 3629} {"train_loss": -6.785988807678223, "global_step": 152458, "epoch": 3629} {"train_loss": -6.914440404801142, "global_step": 152459, "epoch": 3629, "val_loss": 78824.828125} {"train_loss": -6.916257381439209, "global_step": 152460, "epoch": 3630} {"train_loss": -6.8497161865234375, "global_step": 152461, "epoch": 3630} {"train_loss": -7.0390119552612305, "global_step": 152462, "epoch": 3630} {"train_loss": -7.009000778198242, "global_step": 152463, "epoch": 3630} {"train_loss": -6.997970104217529, "global_step": 152464, "epoch": 3630} {"train_loss": -6.865325927734375, "global_step": 152465, "epoch": 3630} {"train_loss": -7.006494998931885, "global_step": 152466, "epoch": 3630} {"train_loss": -6.967581748962402, "global_step": 152467, "epoch": 3630} {"train_loss": -6.908023834228516, "global_step": 152468, "epoch": 3630} {"train_loss": -6.841127395629883, "global_step": 152469, "epoch": 3630} {"train_loss": -6.9461140632629395, "global_step": 152470, "epoch": 3630} {"train_loss": -6.935025215148926, "global_step": 152471, "epoch": 3630} {"train_loss": -6.927041530609131, "global_step": 152472, "epoch": 3630} {"train_loss": -6.819990158081055, "global_step": 152473, "epoch": 3630} {"train_loss": -6.892587184906006, "global_step": 152474, "epoch": 3630} {"train_loss": -6.847665786743164, "global_step": 152475, "epoch": 3630} {"train_loss": -6.844364166259766, "global_step": 152476, "epoch": 3630} {"train_loss": -6.845339775085449, "global_step": 152477, "epoch": 3630} {"train_loss": -6.941804885864258, "global_step": 152478, "epoch": 3630} {"train_loss": -6.950600624084473, "global_step": 152479, "epoch": 3630} {"train_loss": -6.874112129211426, "global_step": 152480, "epoch": 3630} {"train_loss": -6.981241226196289, "global_step": 152481, "epoch": 3630} {"train_loss": -6.906850814819336, "global_step": 152482, "epoch": 3630} {"train_loss": -6.850505828857422, "global_step": 152483, "epoch": 3630} {"train_loss": -6.863978862762451, "global_step": 152484, "epoch": 3630} {"train_loss": -6.900360584259033, "global_step": 152485, "epoch": 3630} {"train_loss": -6.861748695373535, "global_step": 152486, "epoch": 3630} {"train_loss": -6.924717903137207, "global_step": 152487, "epoch": 3630} {"train_loss": -6.878449440002441, "global_step": 152488, "epoch": 3630} {"train_loss": -6.981044769287109, "global_step": 152489, "epoch": 3630} {"train_loss": -6.928315162658691, "global_step": 152490, "epoch": 3630} {"train_loss": -6.942655563354492, "global_step": 152491, "epoch": 3630} {"train_loss": -6.9207024574279785, "global_step": 152492, "epoch": 3630} {"train_loss": -6.726107120513916, "global_step": 152493, "epoch": 3630} {"train_loss": -6.987456321716309, "global_step": 152494, "epoch": 3630} {"train_loss": -6.734064102172852, "global_step": 152495, "epoch": 3630} {"train_loss": -6.874366283416748, "global_step": 152496, "epoch": 3630} {"train_loss": -6.941882610321045, "global_step": 152497, "epoch": 3630} {"train_loss": -6.965902328491211, "global_step": 152498, "epoch": 3630} {"train_loss": -6.907253265380859, "global_step": 152499, "epoch": 3630} {"train_loss": -6.8471245765686035, "global_step": 152500, "epoch": 3630} {"train_loss": -6.903786511648269, "global_step": 152501, "epoch": 3630, "val_loss": 79042.2578125} {"train_loss": -6.755024433135986, "global_step": 152502, "epoch": 3631} {"train_loss": -6.935590744018555, "global_step": 152503, "epoch": 3631} {"train_loss": -6.8211164474487305, "global_step": 152504, "epoch": 3631} {"train_loss": -6.796399116516113, "global_step": 152505, "epoch": 3631} {"train_loss": -6.9534149169921875, "global_step": 152506, "epoch": 3631} {"train_loss": -6.8674774169921875, "global_step": 152507, "epoch": 3631} {"train_loss": -6.989290714263916, "global_step": 152508, "epoch": 3631} {"train_loss": -6.82804012298584, "global_step": 152509, "epoch": 3631} {"train_loss": -6.910049915313721, "global_step": 152510, "epoch": 3631} {"train_loss": -6.932236671447754, "global_step": 152511, "epoch": 3631} {"train_loss": -6.981655597686768, "global_step": 152512, "epoch": 3631} {"train_loss": -6.896063804626465, "global_step": 152513, "epoch": 3631} {"train_loss": -6.864828586578369, "global_step": 152514, "epoch": 3631} {"train_loss": -6.95599365234375, "global_step": 152515, "epoch": 3631} {"train_loss": -6.886563777923584, "global_step": 152516, "epoch": 3631} {"train_loss": -6.898534774780273, "global_step": 152517, "epoch": 3631} {"train_loss": -6.872654914855957, "global_step": 152518, "epoch": 3631} {"train_loss": -6.877555847167969, "global_step": 152519, "epoch": 3631} {"train_loss": -6.797385215759277, "global_step": 152520, "epoch": 3631} {"train_loss": -6.815227508544922, "global_step": 152521, "epoch": 3631} {"train_loss": -6.957469940185547, "global_step": 152522, "epoch": 3631} {"train_loss": -6.75725793838501, "global_step": 152523, "epoch": 3631} {"train_loss": -6.897404670715332, "global_step": 152524, "epoch": 3631} {"train_loss": -6.861842155456543, "global_step": 152525, "epoch": 3631} {"train_loss": -6.853609561920166, "global_step": 152526, "epoch": 3631} {"train_loss": -6.8415069580078125, "global_step": 152527, "epoch": 3631} {"train_loss": -6.91960334777832, "global_step": 152528, "epoch": 3631} {"train_loss": -6.795629978179932, "global_step": 152529, "epoch": 3631} {"train_loss": -6.819097518920898, "global_step": 152530, "epoch": 3631} {"train_loss": -6.9051594734191895, "global_step": 152531, "epoch": 3631} {"train_loss": -6.947208404541016, "global_step": 152532, "epoch": 3631} {"train_loss": -6.777666091918945, "global_step": 152533, "epoch": 3631} {"train_loss": -6.950778007507324, "global_step": 152534, "epoch": 3631} {"train_loss": -6.82974910736084, "global_step": 152535, "epoch": 3631} {"train_loss": -6.900350570678711, "global_step": 152536, "epoch": 3631} {"train_loss": -6.855154037475586, "global_step": 152537, "epoch": 3631} {"train_loss": -6.92661190032959, "global_step": 152538, "epoch": 3631} {"train_loss": -6.868313789367676, "global_step": 152539, "epoch": 3631} {"train_loss": -6.831936359405518, "global_step": 152540, "epoch": 3631} {"train_loss": -6.773157119750977, "global_step": 152541, "epoch": 3631} {"train_loss": -6.853736877441406, "global_step": 152542, "epoch": 3631} {"train_loss": -6.868928114573161, "global_step": 152543, "epoch": 3631, "val_loss": 79052.2109375} {"train_loss": -6.828945159912109, "global_step": 152544, "epoch": 3632} {"train_loss": -6.908561706542969, "global_step": 152545, "epoch": 3632} {"train_loss": -6.923945426940918, "global_step": 152546, "epoch": 3632} {"train_loss": -6.975893974304199, "global_step": 152547, "epoch": 3632} {"train_loss": -6.845424652099609, "global_step": 152548, "epoch": 3632} {"train_loss": -6.838869571685791, "global_step": 152549, "epoch": 3632} {"train_loss": -6.934215068817139, "global_step": 152550, "epoch": 3632} {"train_loss": -6.9428863525390625, "global_step": 152551, "epoch": 3632} {"train_loss": -6.852199554443359, "global_step": 152552, "epoch": 3632} {"train_loss": -6.858368396759033, "global_step": 152553, "epoch": 3632} {"train_loss": -6.968992233276367, "global_step": 152554, "epoch": 3632} {"train_loss": -6.832644462585449, "global_step": 152555, "epoch": 3632} {"train_loss": -6.913125991821289, "global_step": 152556, "epoch": 3632} {"train_loss": -7.036370277404785, "global_step": 152557, "epoch": 3632} {"train_loss": -7.051041603088379, "global_step": 152558, "epoch": 3632} {"train_loss": -6.884187698364258, "global_step": 152559, "epoch": 3632} {"train_loss": -6.908364295959473, "global_step": 152560, "epoch": 3632} {"train_loss": -7.000255584716797, "global_step": 152561, "epoch": 3632} {"train_loss": -6.899526596069336, "global_step": 152562, "epoch": 3632} {"train_loss": -6.858676910400391, "global_step": 152563, "epoch": 3632} {"train_loss": -6.94740104675293, "global_step": 152564, "epoch": 3632} {"train_loss": -6.909550666809082, "global_step": 152565, "epoch": 3632} {"train_loss": -6.811708450317383, "global_step": 152566, "epoch": 3632} {"train_loss": -6.88682746887207, "global_step": 152567, "epoch": 3632} {"train_loss": -6.718721389770508, "global_step": 152568, "epoch": 3632} {"train_loss": -6.789182662963867, "global_step": 152569, "epoch": 3632} {"train_loss": -6.856696128845215, "global_step": 152570, "epoch": 3632} {"train_loss": -6.925797939300537, "global_step": 152571, "epoch": 3632} {"train_loss": -6.730964660644531, "global_step": 152572, "epoch": 3632} {"train_loss": -6.859877586364746, "global_step": 152573, "epoch": 3632} {"train_loss": -6.842944145202637, "global_step": 152574, "epoch": 3632} {"train_loss": -6.899649620056152, "global_step": 152575, "epoch": 3632} {"train_loss": -6.838146686553955, "global_step": 152576, "epoch": 3632} {"train_loss": -6.824947834014893, "global_step": 152577, "epoch": 3632} {"train_loss": -6.704476356506348, "global_step": 152578, "epoch": 3632} {"train_loss": -6.87800407409668, "global_step": 152579, "epoch": 3632} {"train_loss": -6.962739944458008, "global_step": 152580, "epoch": 3632} {"train_loss": -6.877124786376953, "global_step": 152581, "epoch": 3632} {"train_loss": -6.911773681640625, "global_step": 152582, "epoch": 3632} {"train_loss": -6.99313497543335, "global_step": 152583, "epoch": 3632} {"train_loss": -6.855610370635986, "global_step": 152584, "epoch": 3632} {"train_loss": -6.886183602469308, "global_step": 152585, "epoch": 3632, "val_loss": 79083.5} {"train_loss": -6.906579971313477, "global_step": 152586, "epoch": 3633} {"train_loss": -6.866751670837402, "global_step": 152587, "epoch": 3633} {"train_loss": -6.826717376708984, "global_step": 152588, "epoch": 3633} {"train_loss": -6.906916618347168, "global_step": 152589, "epoch": 3633} {"train_loss": -7.008379936218262, "global_step": 152590, "epoch": 3633} {"train_loss": -6.914154529571533, "global_step": 152591, "epoch": 3633} {"train_loss": -6.957553863525391, "global_step": 152592, "epoch": 3633} {"train_loss": -6.809967994689941, "global_step": 152593, "epoch": 3633} {"train_loss": -6.880014419555664, "global_step": 152594, "epoch": 3633} {"train_loss": -6.910060882568359, "global_step": 152595, "epoch": 3633} {"train_loss": -6.890192031860352, "global_step": 152596, "epoch": 3633} {"train_loss": -6.892110347747803, "global_step": 152597, "epoch": 3633} {"train_loss": -7.025284767150879, "global_step": 152598, "epoch": 3633} {"train_loss": -6.9033026695251465, "global_step": 152599, "epoch": 3633} {"train_loss": -6.845326900482178, "global_step": 152600, "epoch": 3633} {"train_loss": -6.880696773529053, "global_step": 152601, "epoch": 3633} {"train_loss": -6.923956394195557, "global_step": 152602, "epoch": 3633} {"train_loss": -6.805493354797363, "global_step": 152603, "epoch": 3633} {"train_loss": -6.767603874206543, "global_step": 152604, "epoch": 3633} {"train_loss": -6.88327693939209, "global_step": 152605, "epoch": 3633} {"train_loss": -6.869410514831543, "global_step": 152606, "epoch": 3633} {"train_loss": -6.93106746673584, "global_step": 152607, "epoch": 3633} {"train_loss": -6.787470817565918, "global_step": 152608, "epoch": 3633} {"train_loss": -6.837058067321777, "global_step": 152609, "epoch": 3633} {"train_loss": -6.7562150955200195, "global_step": 152610, "epoch": 3633} {"train_loss": -6.710545539855957, "global_step": 152611, "epoch": 3633} {"train_loss": -6.744148254394531, "global_step": 152612, "epoch": 3633} {"train_loss": -6.799139022827148, "global_step": 152613, "epoch": 3633} {"train_loss": -6.832131385803223, "global_step": 152614, "epoch": 3633} {"train_loss": -6.776180744171143, "global_step": 152615, "epoch": 3633} {"train_loss": -6.956151485443115, "global_step": 152616, "epoch": 3633} {"train_loss": -7.015697479248047, "global_step": 152617, "epoch": 3633} {"train_loss": -6.888273239135742, "global_step": 152618, "epoch": 3633} {"train_loss": -6.916531085968018, "global_step": 152619, "epoch": 3633} {"train_loss": -6.898407936096191, "global_step": 152620, "epoch": 3633} {"train_loss": -6.804344654083252, "global_step": 152621, "epoch": 3633} {"train_loss": -6.817590713500977, "global_step": 152622, "epoch": 3633} {"train_loss": -6.959123611450195, "global_step": 152623, "epoch": 3633} {"train_loss": -6.840789794921875, "global_step": 152624, "epoch": 3633} {"train_loss": -6.981806755065918, "global_step": 152625, "epoch": 3633} {"train_loss": -6.853808403015137, "global_step": 152626, "epoch": 3633} {"train_loss": -6.8752647922152565, "global_step": 152627, "epoch": 3633, "val_loss": 79053.6484375} {"train_loss": -6.828803539276123, "global_step": 152628, "epoch": 3634} {"train_loss": -7.036060810089111, "global_step": 152629, "epoch": 3634} {"train_loss": -6.895472526550293, "global_step": 152630, "epoch": 3634} {"train_loss": -7.024646759033203, "global_step": 152631, "epoch": 3634} {"train_loss": -6.957403182983398, "global_step": 152632, "epoch": 3634} {"train_loss": -7.005031585693359, "global_step": 152633, "epoch": 3634} {"train_loss": -6.928220748901367, "global_step": 152634, "epoch": 3634} {"train_loss": -6.945951461791992, "global_step": 152635, "epoch": 3634} {"train_loss": -6.974830150604248, "global_step": 152636, "epoch": 3634} {"train_loss": -6.937028884887695, "global_step": 152637, "epoch": 3634} {"train_loss": -6.824316024780273, "global_step": 152638, "epoch": 3634} {"train_loss": -6.8322978019714355, "global_step": 152639, "epoch": 3634} {"train_loss": -6.9108428955078125, "global_step": 152640, "epoch": 3634} {"train_loss": -6.959321975708008, "global_step": 152641, "epoch": 3634} {"train_loss": -6.7625732421875, "global_step": 152642, "epoch": 3634} {"train_loss": -6.832418918609619, "global_step": 152643, "epoch": 3634} {"train_loss": -6.995725154876709, "global_step": 152644, "epoch": 3634} {"train_loss": -6.873743057250977, "global_step": 152645, "epoch": 3634} {"train_loss": -6.859617233276367, "global_step": 152646, "epoch": 3634} {"train_loss": -6.947174072265625, "global_step": 152647, "epoch": 3634} {"train_loss": -6.972546577453613, "global_step": 152648, "epoch": 3634} {"train_loss": -6.92249870300293, "global_step": 152649, "epoch": 3634} {"train_loss": -6.9155473709106445, "global_step": 152650, "epoch": 3634} {"train_loss": -6.917981147766113, "global_step": 152651, "epoch": 3634} {"train_loss": -6.712467670440674, "global_step": 152652, "epoch": 3634} {"train_loss": -6.825403213500977, "global_step": 152653, "epoch": 3634} {"train_loss": -6.991812229156494, "global_step": 152654, "epoch": 3634} {"train_loss": -6.768756866455078, "global_step": 152655, "epoch": 3634} {"train_loss": -6.777315139770508, "global_step": 152656, "epoch": 3634} {"train_loss": -6.8641157150268555, "global_step": 152657, "epoch": 3634} {"train_loss": -6.742449760437012, "global_step": 152658, "epoch": 3634} {"train_loss": -6.811712741851807, "global_step": 152659, "epoch": 3634} {"train_loss": -6.818778038024902, "global_step": 152660, "epoch": 3634} {"train_loss": -6.81738805770874, "global_step": 152661, "epoch": 3634} {"train_loss": -6.999673366546631, "global_step": 152662, "epoch": 3634} {"train_loss": -6.789113998413086, "global_step": 152663, "epoch": 3634} {"train_loss": -6.794466972351074, "global_step": 152664, "epoch": 3634} {"train_loss": -6.839776992797852, "global_step": 152665, "epoch": 3634} {"train_loss": -6.8767499923706055, "global_step": 152666, "epoch": 3634} {"train_loss": -6.937723159790039, "global_step": 152667, "epoch": 3634} {"train_loss": -6.821115016937256, "global_step": 152668, "epoch": 3634} {"train_loss": -6.884863308497837, "global_step": 152669, "epoch": 3634, "val_loss": 78933.4375} {"train_loss": -6.773536205291748, "global_step": 152670, "epoch": 3635} {"train_loss": -6.85614538192749, "global_step": 152671, "epoch": 3635} {"train_loss": -6.947343826293945, "global_step": 152672, "epoch": 3635} {"train_loss": -6.889033317565918, "global_step": 152673, "epoch": 3635} {"train_loss": -6.767420291900635, "global_step": 152674, "epoch": 3635} {"train_loss": -6.782344341278076, "global_step": 152675, "epoch": 3635} {"train_loss": -6.850866317749023, "global_step": 152676, "epoch": 3635} {"train_loss": -6.8254594802856445, "global_step": 152677, "epoch": 3635} {"train_loss": -6.835674285888672, "global_step": 152678, "epoch": 3635} {"train_loss": -6.972402095794678, "global_step": 152679, "epoch": 3635} {"train_loss": -6.830451488494873, "global_step": 152680, "epoch": 3635} {"train_loss": -7.023443222045898, "global_step": 152681, "epoch": 3635} {"train_loss": -6.954669952392578, "global_step": 152682, "epoch": 3635} {"train_loss": -6.929644584655762, "global_step": 152683, "epoch": 3635} {"train_loss": -6.815825462341309, "global_step": 152684, "epoch": 3635} {"train_loss": -6.994548797607422, "global_step": 152685, "epoch": 3635} {"train_loss": -6.831923484802246, "global_step": 152686, "epoch": 3635} {"train_loss": -6.956845760345459, "global_step": 152687, "epoch": 3635} {"train_loss": -6.888257026672363, "global_step": 152688, "epoch": 3635} {"train_loss": -7.010012626647949, "global_step": 152689, "epoch": 3635} {"train_loss": -6.8955488204956055, "global_step": 152690, "epoch": 3635} {"train_loss": -6.924039840698242, "global_step": 152691, "epoch": 3635} {"train_loss": -6.807751655578613, "global_step": 152692, "epoch": 3635} {"train_loss": -6.9275007247924805, "global_step": 152693, "epoch": 3635} {"train_loss": -6.977088928222656, "global_step": 152694, "epoch": 3635} {"train_loss": -6.989259719848633, "global_step": 152695, "epoch": 3635} {"train_loss": -6.892617225646973, "global_step": 152696, "epoch": 3635} {"train_loss": -6.884941577911377, "global_step": 152697, "epoch": 3635} {"train_loss": -6.725587368011475, "global_step": 152698, "epoch": 3635} {"train_loss": -6.895738124847412, "global_step": 152699, "epoch": 3635} {"train_loss": -6.671286582946777, "global_step": 152700, "epoch": 3635} {"train_loss": -6.448240280151367, "global_step": 152701, "epoch": 3635} {"train_loss": -6.786592483520508, "global_step": 152702, "epoch": 3635} {"train_loss": -6.722526550292969, "global_step": 152703, "epoch": 3635} {"train_loss": -6.603659629821777, "global_step": 152704, "epoch": 3635} {"train_loss": -6.815990447998047, "global_step": 152705, "epoch": 3635} {"train_loss": -6.562830924987793, "global_step": 152706, "epoch": 3635} {"train_loss": -6.878156661987305, "global_step": 152707, "epoch": 3635} {"train_loss": -6.725685119628906, "global_step": 152708, "epoch": 3635} {"train_loss": -6.80974006652832, "global_step": 152709, "epoch": 3635} {"train_loss": -6.67110013961792, "global_step": 152710, "epoch": 3635} {"train_loss": -6.840868336813791, "global_step": 152711, "epoch": 3635, "val_loss": 79203.9921875} {"train_loss": -6.796580791473389, "global_step": 152712, "epoch": 3636} {"train_loss": -6.800907135009766, "global_step": 152713, "epoch": 3636} {"train_loss": -6.8396687507629395, "global_step": 152714, "epoch": 3636} {"train_loss": -6.72518253326416, "global_step": 152715, "epoch": 3636} {"train_loss": -6.884227275848389, "global_step": 152716, "epoch": 3636} {"train_loss": -6.928228378295898, "global_step": 152717, "epoch": 3636} {"train_loss": -6.921727180480957, "global_step": 152718, "epoch": 3636} {"train_loss": -6.775136470794678, "global_step": 152719, "epoch": 3636} {"train_loss": -6.878076553344727, "global_step": 152720, "epoch": 3636} {"train_loss": -6.813854217529297, "global_step": 152721, "epoch": 3636} {"train_loss": -6.898562431335449, "global_step": 152722, "epoch": 3636} {"train_loss": -6.735629081726074, "global_step": 152723, "epoch": 3636} {"train_loss": -6.820123672485352, "global_step": 152724, "epoch": 3636} {"train_loss": -6.903063774108887, "global_step": 152725, "epoch": 3636} {"train_loss": -6.768346786499023, "global_step": 152726, "epoch": 3636} {"train_loss": -6.948644638061523, "global_step": 152727, "epoch": 3636} {"train_loss": -6.754223823547363, "global_step": 152728, "epoch": 3636} {"train_loss": -6.880451679229736, "global_step": 152729, "epoch": 3636} {"train_loss": -6.850414276123047, "global_step": 152730, "epoch": 3636} {"train_loss": -6.802274703979492, "global_step": 152731, "epoch": 3636} {"train_loss": -6.853824138641357, "global_step": 152732, "epoch": 3636} {"train_loss": -6.908059597015381, "global_step": 152733, "epoch": 3636} {"train_loss": -6.831059455871582, "global_step": 152734, "epoch": 3636} {"train_loss": -6.853335857391357, "global_step": 152735, "epoch": 3636} {"train_loss": -6.9222588539123535, "global_step": 152736, "epoch": 3636} {"train_loss": -6.807464599609375, "global_step": 152737, "epoch": 3636} {"train_loss": -6.9180755615234375, "global_step": 152738, "epoch": 3636} {"train_loss": -6.961001873016357, "global_step": 152739, "epoch": 3636} {"train_loss": -6.962998390197754, "global_step": 152740, "epoch": 3636} {"train_loss": -6.911691665649414, "global_step": 152741, "epoch": 3636} {"train_loss": -6.904794692993164, "global_step": 152742, "epoch": 3636} {"train_loss": -6.839297294616699, "global_step": 152743, "epoch": 3636} {"train_loss": -6.793882369995117, "global_step": 152744, "epoch": 3636} {"train_loss": -6.947053909301758, "global_step": 152745, "epoch": 3636} {"train_loss": -6.85581111907959, "global_step": 152746, "epoch": 3636} {"train_loss": -6.914539337158203, "global_step": 152747, "epoch": 3636} {"train_loss": -7.024744987487793, "global_step": 152748, "epoch": 3636} {"train_loss": -6.906630039215088, "global_step": 152749, "epoch": 3636} {"train_loss": -6.872713088989258, "global_step": 152750, "epoch": 3636} {"train_loss": -7.052826404571533, "global_step": 152751, "epoch": 3636} {"train_loss": -6.833818435668945, "global_step": 152752, "epoch": 3636} {"train_loss": -6.8667812915075395, "global_step": 152753, "epoch": 3636, "val_loss": 78999.828125} {"train_loss": -6.801507949829102, "global_step": 152754, "epoch": 3637} {"train_loss": -6.869328498840332, "global_step": 152755, "epoch": 3637} {"train_loss": -6.9756317138671875, "global_step": 152756, "epoch": 3637} {"train_loss": -6.865082263946533, "global_step": 152757, "epoch": 3637} {"train_loss": -6.899163246154785, "global_step": 152758, "epoch": 3637} {"train_loss": -6.839434623718262, "global_step": 152759, "epoch": 3637} {"train_loss": -6.9896931648254395, "global_step": 152760, "epoch": 3637} {"train_loss": -6.839797019958496, "global_step": 152761, "epoch": 3637} {"train_loss": -6.923959732055664, "global_step": 152762, "epoch": 3637} {"train_loss": -6.9842729568481445, "global_step": 152763, "epoch": 3637} {"train_loss": -6.93031644821167, "global_step": 152764, "epoch": 3637} {"train_loss": -6.891371250152588, "global_step": 152765, "epoch": 3637} {"train_loss": -6.784877777099609, "global_step": 152766, "epoch": 3637} {"train_loss": -6.906293869018555, "global_step": 152767, "epoch": 3637} {"train_loss": -6.907597064971924, "global_step": 152768, "epoch": 3637} {"train_loss": -6.957618236541748, "global_step": 152769, "epoch": 3637} {"train_loss": -6.821848392486572, "global_step": 152770, "epoch": 3637} {"train_loss": -6.945963382720947, "global_step": 152771, "epoch": 3637} {"train_loss": -6.876951217651367, "global_step": 152772, "epoch": 3637} {"train_loss": -6.858280181884766, "global_step": 152773, "epoch": 3637} {"train_loss": -6.964925765991211, "global_step": 152774, "epoch": 3637} {"train_loss": -6.9894280433654785, "global_step": 152775, "epoch": 3637} {"train_loss": -6.825170516967773, "global_step": 152776, "epoch": 3637} {"train_loss": -6.844338893890381, "global_step": 152777, "epoch": 3637} {"train_loss": -6.870090484619141, "global_step": 152778, "epoch": 3637} {"train_loss": -6.965496063232422, "global_step": 152779, "epoch": 3637} {"train_loss": -6.888794422149658, "global_step": 152780, "epoch": 3637} {"train_loss": -6.979044437408447, "global_step": 152781, "epoch": 3637} {"train_loss": -6.83029842376709, "global_step": 152782, "epoch": 3637} {"train_loss": -6.787367343902588, "global_step": 152783, "epoch": 3637} {"train_loss": -6.892768859863281, "global_step": 152784, "epoch": 3637} {"train_loss": -6.7949652671813965, "global_step": 152785, "epoch": 3637} {"train_loss": -6.890458106994629, "global_step": 152786, "epoch": 3637} {"train_loss": -6.953927040100098, "global_step": 152787, "epoch": 3637} {"train_loss": -6.904412269592285, "global_step": 152788, "epoch": 3637} {"train_loss": -6.966990947723389, "global_step": 152789, "epoch": 3637} {"train_loss": -6.927990913391113, "global_step": 152790, "epoch": 3637} {"train_loss": -6.959850311279297, "global_step": 152791, "epoch": 3637} {"train_loss": -6.881329536437988, "global_step": 152792, "epoch": 3637} {"train_loss": -6.922435760498047, "global_step": 152793, "epoch": 3637} {"train_loss": -6.999835968017578, "global_step": 152794, "epoch": 3637} {"train_loss": -6.8989151772998625, "global_step": 152795, "epoch": 3637, "val_loss": 78727.7734375} {"train_loss": -6.849836349487305, "global_step": 152796, "epoch": 3638} {"train_loss": -6.951730728149414, "global_step": 152797, "epoch": 3638} {"train_loss": -6.977705955505371, "global_step": 152798, "epoch": 3638} {"train_loss": -6.958049297332764, "global_step": 152799, "epoch": 3638} {"train_loss": -6.844775199890137, "global_step": 152800, "epoch": 3638} {"train_loss": -7.046737194061279, "global_step": 152801, "epoch": 3638} {"train_loss": -6.904742240905762, "global_step": 152802, "epoch": 3638} {"train_loss": -6.897787094116211, "global_step": 152803, "epoch": 3638} {"train_loss": -6.961458683013916, "global_step": 152804, "epoch": 3638} {"train_loss": -6.845956325531006, "global_step": 152805, "epoch": 3638} {"train_loss": -6.9294114112854, "global_step": 152806, "epoch": 3638} {"train_loss": -6.942304611206055, "global_step": 152807, "epoch": 3638} {"train_loss": -6.900791168212891, "global_step": 152808, "epoch": 3638} {"train_loss": -6.937205791473389, "global_step": 152809, "epoch": 3638} {"train_loss": -6.943541526794434, "global_step": 152810, "epoch": 3638} {"train_loss": -6.8038740158081055, "global_step": 152811, "epoch": 3638} {"train_loss": -6.996556758880615, "global_step": 152812, "epoch": 3638} {"train_loss": -6.967668533325195, "global_step": 152813, "epoch": 3638} {"train_loss": -6.856642246246338, "global_step": 152814, "epoch": 3638} {"train_loss": -6.78787088394165, "global_step": 152815, "epoch": 3638} {"train_loss": -6.911779880523682, "global_step": 152816, "epoch": 3638} {"train_loss": -7.064334869384766, "global_step": 152817, "epoch": 3638} {"train_loss": -6.972841262817383, "global_step": 152818, "epoch": 3638} {"train_loss": -6.864710807800293, "global_step": 152819, "epoch": 3638} {"train_loss": -6.8995513916015625, "global_step": 152820, "epoch": 3638} {"train_loss": -6.864099025726318, "global_step": 152821, "epoch": 3638} {"train_loss": -6.850567817687988, "global_step": 152822, "epoch": 3638} {"train_loss": -6.884954452514648, "global_step": 152823, "epoch": 3638} {"train_loss": -6.800130844116211, "global_step": 152824, "epoch": 3638} {"train_loss": -6.778702735900879, "global_step": 152825, "epoch": 3638} {"train_loss": -6.932068824768066, "global_step": 152826, "epoch": 3638} {"train_loss": -6.815499305725098, "global_step": 152827, "epoch": 3638} {"train_loss": -6.9223198890686035, "global_step": 152828, "epoch": 3638} {"train_loss": -7.000460624694824, "global_step": 152829, "epoch": 3638} {"train_loss": -6.859981060028076, "global_step": 152830, "epoch": 3638} {"train_loss": -7.019284248352051, "global_step": 152831, "epoch": 3638} {"train_loss": -6.810398101806641, "global_step": 152832, "epoch": 3638} {"train_loss": -6.834237575531006, "global_step": 152833, "epoch": 3638} {"train_loss": -6.9026384353637695, "global_step": 152834, "epoch": 3638} {"train_loss": -6.9898576736450195, "global_step": 152835, "epoch": 3638} {"train_loss": -6.849748134613037, "global_step": 152836, "epoch": 3638} {"train_loss": -6.905459596997216, "global_step": 152837, "epoch": 3638, "val_loss": 79050.234375} {"train_loss": -6.760196208953857, "global_step": 152838, "epoch": 3639} {"train_loss": -6.897885322570801, "global_step": 152839, "epoch": 3639} {"train_loss": -6.786458969116211, "global_step": 152840, "epoch": 3639} {"train_loss": -6.833937644958496, "global_step": 152841, "epoch": 3639} {"train_loss": -6.852808475494385, "global_step": 152842, "epoch": 3639} {"train_loss": -6.898116588592529, "global_step": 152843, "epoch": 3639} {"train_loss": -6.906933784484863, "global_step": 152844, "epoch": 3639} {"train_loss": -6.829768180847168, "global_step": 152845, "epoch": 3639} {"train_loss": -7.038382530212402, "global_step": 152846, "epoch": 3639} {"train_loss": -6.815862655639648, "global_step": 152847, "epoch": 3639} {"train_loss": -6.864097595214844, "global_step": 152848, "epoch": 3639} {"train_loss": -6.963308334350586, "global_step": 152849, "epoch": 3639} {"train_loss": -6.965909004211426, "global_step": 152850, "epoch": 3639} {"train_loss": -6.801856994628906, "global_step": 152851, "epoch": 3639} {"train_loss": -6.851738929748535, "global_step": 152852, "epoch": 3639} {"train_loss": -6.954434394836426, "global_step": 152853, "epoch": 3639} {"train_loss": -6.893111228942871, "global_step": 152854, "epoch": 3639} {"train_loss": -6.89560604095459, "global_step": 152855, "epoch": 3639} {"train_loss": -6.909639835357666, "global_step": 152856, "epoch": 3639} {"train_loss": -6.940424919128418, "global_step": 152857, "epoch": 3639} {"train_loss": -6.923056602478027, "global_step": 152858, "epoch": 3639} {"train_loss": -6.973714828491211, "global_step": 152859, "epoch": 3639} {"train_loss": -6.860690116882324, "global_step": 152860, "epoch": 3639} {"train_loss": -7.00069522857666, "global_step": 152861, "epoch": 3639} {"train_loss": -6.890982627868652, "global_step": 152862, "epoch": 3639} {"train_loss": -6.975205898284912, "global_step": 152863, "epoch": 3639} {"train_loss": -6.885933876037598, "global_step": 152864, "epoch": 3639} {"train_loss": -7.015249729156494, "global_step": 152865, "epoch": 3639} {"train_loss": -6.959934234619141, "global_step": 152866, "epoch": 3639} {"train_loss": -6.9547271728515625, "global_step": 152867, "epoch": 3639} {"train_loss": -6.947229385375977, "global_step": 152868, "epoch": 3639} {"train_loss": -6.829143047332764, "global_step": 152869, "epoch": 3639} {"train_loss": -6.865324974060059, "global_step": 152870, "epoch": 3639} {"train_loss": -6.818580627441406, "global_step": 152871, "epoch": 3639} {"train_loss": -6.752194881439209, "global_step": 152872, "epoch": 3639} {"train_loss": -6.896905899047852, "global_step": 152873, "epoch": 3639} {"train_loss": -6.845746994018555, "global_step": 152874, "epoch": 3639} {"train_loss": -6.833762168884277, "global_step": 152875, "epoch": 3639} {"train_loss": -6.891372203826904, "global_step": 152876, "epoch": 3639} {"train_loss": -6.921061992645264, "global_step": 152877, "epoch": 3639} {"train_loss": -6.805431365966797, "global_step": 152878, "epoch": 3639} {"train_loss": -6.886366174334571, "global_step": 152879, "epoch": 3639, "val_loss": 78946.5} {"train_loss": -6.8949875831604, "global_step": 152880, "epoch": 3640} {"train_loss": -6.766518592834473, "global_step": 152881, "epoch": 3640} {"train_loss": -6.767309188842773, "global_step": 152882, "epoch": 3640} {"train_loss": -6.880772113800049, "global_step": 152883, "epoch": 3640} {"train_loss": -6.798602104187012, "global_step": 152884, "epoch": 3640} {"train_loss": -6.9188551902771, "global_step": 152885, "epoch": 3640} {"train_loss": -6.774726867675781, "global_step": 152886, "epoch": 3640} {"train_loss": -6.819673538208008, "global_step": 152887, "epoch": 3640} {"train_loss": -6.816247940063477, "global_step": 152888, "epoch": 3640} {"train_loss": -6.854646682739258, "global_step": 152889, "epoch": 3640} {"train_loss": -6.823186874389648, "global_step": 152890, "epoch": 3640} {"train_loss": -6.824680805206299, "global_step": 152891, "epoch": 3640} {"train_loss": -6.885646820068359, "global_step": 152892, "epoch": 3640} {"train_loss": -6.871296405792236, "global_step": 152893, "epoch": 3640} {"train_loss": -6.699850082397461, "global_step": 152894, "epoch": 3640} {"train_loss": -6.914366722106934, "global_step": 152895, "epoch": 3640} {"train_loss": -6.811801433563232, "global_step": 152896, "epoch": 3640} {"train_loss": -6.954668998718262, "global_step": 152897, "epoch": 3640} {"train_loss": -6.832597732543945, "global_step": 152898, "epoch": 3640} {"train_loss": -6.907011032104492, "global_step": 152899, "epoch": 3640} {"train_loss": -6.859773635864258, "global_step": 152900, "epoch": 3640} {"train_loss": -6.81788444519043, "global_step": 152901, "epoch": 3640} {"train_loss": -6.854692459106445, "global_step": 152902, "epoch": 3640} {"train_loss": -6.921178817749023, "global_step": 152903, "epoch": 3640} {"train_loss": -6.980136871337891, "global_step": 152904, "epoch": 3640} {"train_loss": -6.789940357208252, "global_step": 152905, "epoch": 3640} {"train_loss": -6.950925827026367, "global_step": 152906, "epoch": 3640} {"train_loss": -6.878515243530273, "global_step": 152907, "epoch": 3640} {"train_loss": -6.810829162597656, "global_step": 152908, "epoch": 3640} {"train_loss": -6.939565658569336, "global_step": 152909, "epoch": 3640} {"train_loss": -6.833982944488525, "global_step": 152910, "epoch": 3640} {"train_loss": -6.91618537902832, "global_step": 152911, "epoch": 3640} {"train_loss": -6.970322608947754, "global_step": 152912, "epoch": 3640} {"train_loss": -6.852090358734131, "global_step": 152913, "epoch": 3640} {"train_loss": -7.053442001342773, "global_step": 152914, "epoch": 3640} {"train_loss": -6.818133354187012, "global_step": 152915, "epoch": 3640} {"train_loss": -6.977978229522705, "global_step": 152916, "epoch": 3640} {"train_loss": -6.861824989318848, "global_step": 152917, "epoch": 3640} {"train_loss": -6.866525173187256, "global_step": 152918, "epoch": 3640} {"train_loss": -6.944637775421143, "global_step": 152919, "epoch": 3640} {"train_loss": -6.859058380126953, "global_step": 152920, "epoch": 3640} {"train_loss": -6.86757230758667, "global_step": 152921, "epoch": 3640, "val_loss": 78771.40625} {"train_loss": -6.827229022979736, "global_step": 152922, "epoch": 3641} {"train_loss": -6.914341449737549, "global_step": 152923, "epoch": 3641} {"train_loss": -6.923064231872559, "global_step": 152924, "epoch": 3641} {"train_loss": -6.816288471221924, "global_step": 152925, "epoch": 3641} {"train_loss": -6.8342204093933105, "global_step": 152926, "epoch": 3641} {"train_loss": -6.959076881408691, "global_step": 152927, "epoch": 3641} {"train_loss": -6.794088363647461, "global_step": 152928, "epoch": 3641} {"train_loss": -6.804734230041504, "global_step": 152929, "epoch": 3641} {"train_loss": -6.77595329284668, "global_step": 152930, "epoch": 3641} {"train_loss": -6.89317512512207, "global_step": 152931, "epoch": 3641} {"train_loss": -6.881131172180176, "global_step": 152932, "epoch": 3641} {"train_loss": -6.91065788269043, "global_step": 152933, "epoch": 3641} {"train_loss": -6.793575763702393, "global_step": 152934, "epoch": 3641} {"train_loss": -6.830979347229004, "global_step": 152935, "epoch": 3641} {"train_loss": -6.8231096267700195, "global_step": 152936, "epoch": 3641} {"train_loss": -6.7812886238098145, "global_step": 152937, "epoch": 3641} {"train_loss": -6.7215375900268555, "global_step": 152938, "epoch": 3641} {"train_loss": -6.820150375366211, "global_step": 152939, "epoch": 3641} {"train_loss": -6.748497009277344, "global_step": 152940, "epoch": 3641} {"train_loss": -6.727219581604004, "global_step": 152941, "epoch": 3641} {"train_loss": -6.829922676086426, "global_step": 152942, "epoch": 3641} {"train_loss": -6.824945449829102, "global_step": 152943, "epoch": 3641} {"train_loss": -6.6921305656433105, "global_step": 152944, "epoch": 3641} {"train_loss": -6.803293228149414, "global_step": 152945, "epoch": 3641} {"train_loss": -6.664597988128662, "global_step": 152946, "epoch": 3641} {"train_loss": -6.689085960388184, "global_step": 152947, "epoch": 3641} {"train_loss": -6.8211894035339355, "global_step": 152948, "epoch": 3641} {"train_loss": -6.661245346069336, "global_step": 152949, "epoch": 3641} {"train_loss": -6.767621994018555, "global_step": 152950, "epoch": 3641} {"train_loss": -6.780915260314941, "global_step": 152951, "epoch": 3641} {"train_loss": -6.6821088790893555, "global_step": 152952, "epoch": 3641} {"train_loss": -6.732003688812256, "global_step": 152953, "epoch": 3641} {"train_loss": -6.780000686645508, "global_step": 152954, "epoch": 3641} {"train_loss": -6.725958824157715, "global_step": 152955, "epoch": 3641} {"train_loss": -6.761043548583984, "global_step": 152956, "epoch": 3641} {"train_loss": -6.774595737457275, "global_step": 152957, "epoch": 3641} {"train_loss": -6.7909932136535645, "global_step": 152958, "epoch": 3641} {"train_loss": -6.8887529373168945, "global_step": 152959, "epoch": 3641} {"train_loss": -6.822856903076172, "global_step": 152960, "epoch": 3641} {"train_loss": -6.830845355987549, "global_step": 152961, "epoch": 3641} {"train_loss": -6.952258110046387, "global_step": 152962, "epoch": 3641} {"train_loss": -6.803129922775995, "global_step": 152963, "epoch": 3641, "val_loss": 78633.7421875} {"train_loss": -6.852500915527344, "global_step": 152964, "epoch": 3642} {"train_loss": -6.739014625549316, "global_step": 152965, "epoch": 3642} {"train_loss": -6.845455169677734, "global_step": 152966, "epoch": 3642} {"train_loss": -6.910325050354004, "global_step": 152967, "epoch": 3642} {"train_loss": -6.81831169128418, "global_step": 152968, "epoch": 3642} {"train_loss": -6.850051403045654, "global_step": 152969, "epoch": 3642} {"train_loss": -6.906503677368164, "global_step": 152970, "epoch": 3642} {"train_loss": -6.773372650146484, "global_step": 152971, "epoch": 3642} {"train_loss": -6.867339134216309, "global_step": 152972, "epoch": 3642} {"train_loss": -6.807520866394043, "global_step": 152973, "epoch": 3642} {"train_loss": -6.874089241027832, "global_step": 152974, "epoch": 3642} {"train_loss": -6.928652286529541, "global_step": 152975, "epoch": 3642} {"train_loss": -6.824173927307129, "global_step": 152976, "epoch": 3642} {"train_loss": -6.869735240936279, "global_step": 152977, "epoch": 3642} {"train_loss": -6.75602388381958, "global_step": 152978, "epoch": 3642} {"train_loss": -6.761654853820801, "global_step": 152979, "epoch": 3642} {"train_loss": -6.847160339355469, "global_step": 152980, "epoch": 3642} {"train_loss": -6.8099260330200195, "global_step": 152981, "epoch": 3642} {"train_loss": -6.8335113525390625, "global_step": 152982, "epoch": 3642} {"train_loss": -6.876533031463623, "global_step": 152983, "epoch": 3642} {"train_loss": -6.763557434082031, "global_step": 152984, "epoch": 3642} {"train_loss": -6.835145950317383, "global_step": 152985, "epoch": 3642} {"train_loss": -6.901316165924072, "global_step": 152986, "epoch": 3642} {"train_loss": -6.809618949890137, "global_step": 152987, "epoch": 3642} {"train_loss": -6.993405818939209, "global_step": 152988, "epoch": 3642} {"train_loss": -6.7248687744140625, "global_step": 152989, "epoch": 3642} {"train_loss": -6.975177764892578, "global_step": 152990, "epoch": 3642} {"train_loss": -6.901279449462891, "global_step": 152991, "epoch": 3642} {"train_loss": -6.85599946975708, "global_step": 152992, "epoch": 3642} {"train_loss": -6.890255928039551, "global_step": 152993, "epoch": 3642} {"train_loss": -6.890648365020752, "global_step": 152994, "epoch": 3642} {"train_loss": -6.900015830993652, "global_step": 152995, "epoch": 3642} {"train_loss": -6.971100807189941, "global_step": 152996, "epoch": 3642} {"train_loss": -6.796708583831787, "global_step": 152997, "epoch": 3642} {"train_loss": -6.931027412414551, "global_step": 152998, "epoch": 3642} {"train_loss": -6.777373313903809, "global_step": 152999, "epoch": 3642} {"train_loss": -6.865736484527588, "global_step": 153000, "epoch": 3642} {"train_loss": -6.835751056671143, "global_step": 153001, "epoch": 3642} {"train_loss": -6.736588478088379, "global_step": 153002, "epoch": 3642} {"train_loss": -6.9132890701293945, "global_step": 153003, "epoch": 3642} {"train_loss": -6.797082424163818, "global_step": 153004, "epoch": 3642} {"train_loss": -6.850582259041922, "global_step": 153005, "epoch": 3642, "val_loss": 79000.4296875} {"train_loss": -6.855852127075195, "global_step": 153006, "epoch": 3643} {"train_loss": -6.857056140899658, "global_step": 153007, "epoch": 3643} {"train_loss": -6.938006401062012, "global_step": 153008, "epoch": 3643} {"train_loss": -6.801330089569092, "global_step": 153009, "epoch": 3643} {"train_loss": -6.913141250610352, "global_step": 153010, "epoch": 3643} {"train_loss": -6.804271697998047, "global_step": 153011, "epoch": 3643} {"train_loss": -6.909700870513916, "global_step": 153012, "epoch": 3643} {"train_loss": -6.953832149505615, "global_step": 153013, "epoch": 3643} {"train_loss": -6.95404052734375, "global_step": 153014, "epoch": 3643} {"train_loss": -6.940217971801758, "global_step": 153015, "epoch": 3643} {"train_loss": -6.806515693664551, "global_step": 153016, "epoch": 3643} {"train_loss": -6.952891826629639, "global_step": 153017, "epoch": 3643} {"train_loss": -6.846374988555908, "global_step": 153018, "epoch": 3643} {"train_loss": -6.896294593811035, "global_step": 153019, "epoch": 3643} {"train_loss": -6.801502227783203, "global_step": 153020, "epoch": 3643} {"train_loss": -6.805482864379883, "global_step": 153021, "epoch": 3643} {"train_loss": -6.828820705413818, "global_step": 153022, "epoch": 3643} {"train_loss": -6.806768417358398, "global_step": 153023, "epoch": 3643} {"train_loss": -6.878692626953125, "global_step": 153024, "epoch": 3643} {"train_loss": -6.876389503479004, "global_step": 153025, "epoch": 3643} {"train_loss": -6.805373668670654, "global_step": 153026, "epoch": 3643} {"train_loss": -6.810919761657715, "global_step": 153027, "epoch": 3643} {"train_loss": -6.790480613708496, "global_step": 153028, "epoch": 3643} {"train_loss": -6.929042816162109, "global_step": 153029, "epoch": 3643} {"train_loss": -6.939646244049072, "global_step": 153030, "epoch": 3643} {"train_loss": -6.905866622924805, "global_step": 153031, "epoch": 3643} {"train_loss": -6.7427263259887695, "global_step": 153032, "epoch": 3643} {"train_loss": -6.970907211303711, "global_step": 153033, "epoch": 3643} {"train_loss": -6.809633731842041, "global_step": 153034, "epoch": 3643} {"train_loss": -6.938126087188721, "global_step": 153035, "epoch": 3643} {"train_loss": -6.891010284423828, "global_step": 153036, "epoch": 3643} {"train_loss": -6.773079872131348, "global_step": 153037, "epoch": 3643} {"train_loss": -6.870073318481445, "global_step": 153038, "epoch": 3643} {"train_loss": -6.868867874145508, "global_step": 153039, "epoch": 3643} {"train_loss": -6.83120059967041, "global_step": 153040, "epoch": 3643} {"train_loss": -6.870100021362305, "global_step": 153041, "epoch": 3643} {"train_loss": -6.8174238204956055, "global_step": 153042, "epoch": 3643} {"train_loss": -6.978890895843506, "global_step": 153043, "epoch": 3643} {"train_loss": -6.992758750915527, "global_step": 153044, "epoch": 3643} {"train_loss": -6.671354293823242, "global_step": 153045, "epoch": 3643} {"train_loss": -6.8524088859558105, "global_step": 153046, "epoch": 3643} {"train_loss": -6.866938170932588, "global_step": 153047, "epoch": 3643, "val_loss": 78932.1484375} {"train_loss": -6.78904914855957, "global_step": 153048, "epoch": 3644} {"train_loss": -6.879598617553711, "global_step": 153049, "epoch": 3644} {"train_loss": -6.85844087600708, "global_step": 153050, "epoch": 3644} {"train_loss": -6.801793098449707, "global_step": 153051, "epoch": 3644} {"train_loss": -6.818940162658691, "global_step": 153052, "epoch": 3644} {"train_loss": -6.867064476013184, "global_step": 153053, "epoch": 3644} {"train_loss": -6.863243579864502, "global_step": 153054, "epoch": 3644} {"train_loss": -6.8414998054504395, "global_step": 153055, "epoch": 3644} {"train_loss": -6.81925106048584, "global_step": 153056, "epoch": 3644} {"train_loss": -6.903512001037598, "global_step": 153057, "epoch": 3644} {"train_loss": -6.800137996673584, "global_step": 153058, "epoch": 3644} {"train_loss": -6.860187530517578, "global_step": 153059, "epoch": 3644} {"train_loss": -6.913544654846191, "global_step": 153060, "epoch": 3644} {"train_loss": -6.884208679199219, "global_step": 153061, "epoch": 3644} {"train_loss": -6.851874351501465, "global_step": 153062, "epoch": 3644} {"train_loss": -6.910937309265137, "global_step": 153063, "epoch": 3644} {"train_loss": -6.864798545837402, "global_step": 153064, "epoch": 3644} {"train_loss": -6.888889312744141, "global_step": 153065, "epoch": 3644} {"train_loss": -6.748807907104492, "global_step": 153066, "epoch": 3644} {"train_loss": -6.793521881103516, "global_step": 153067, "epoch": 3644} {"train_loss": -6.774165153503418, "global_step": 153068, "epoch": 3644} {"train_loss": -6.766136169433594, "global_step": 153069, "epoch": 3644} {"train_loss": -7.023586273193359, "global_step": 153070, "epoch": 3644} {"train_loss": -6.741143703460693, "global_step": 153071, "epoch": 3644} {"train_loss": -6.857674598693848, "global_step": 153072, "epoch": 3644} {"train_loss": -6.807358264923096, "global_step": 153073, "epoch": 3644} {"train_loss": -6.802665710449219, "global_step": 153074, "epoch": 3644} {"train_loss": -6.948212146759033, "global_step": 153075, "epoch": 3644} {"train_loss": -6.837095260620117, "global_step": 153076, "epoch": 3644} {"train_loss": -6.912178993225098, "global_step": 153077, "epoch": 3644} {"train_loss": -6.966433525085449, "global_step": 153078, "epoch": 3644} {"train_loss": -6.851374626159668, "global_step": 153079, "epoch": 3644} {"train_loss": -6.845928192138672, "global_step": 153080, "epoch": 3644} {"train_loss": -6.96822452545166, "global_step": 153081, "epoch": 3644} {"train_loss": -7.020773410797119, "global_step": 153082, "epoch": 3644} {"train_loss": -6.936553955078125, "global_step": 153083, "epoch": 3644} {"train_loss": -6.963129997253418, "global_step": 153084, "epoch": 3644} {"train_loss": -7.040457725524902, "global_step": 153085, "epoch": 3644} {"train_loss": -6.846978187561035, "global_step": 153086, "epoch": 3644} {"train_loss": -6.874667644500732, "global_step": 153087, "epoch": 3644} {"train_loss": -6.872347831726074, "global_step": 153088, "epoch": 3644} {"train_loss": -6.869241146814256, "global_step": 153089, "epoch": 3644, "val_loss": 78645.140625} {"train_loss": -7.0266618728637695, "global_step": 153090, "epoch": 3645} {"train_loss": -6.943366050720215, "global_step": 153091, "epoch": 3645} {"train_loss": -6.879705429077148, "global_step": 153092, "epoch": 3645} {"train_loss": -6.882054328918457, "global_step": 153093, "epoch": 3645} {"train_loss": -6.944810390472412, "global_step": 153094, "epoch": 3645} {"train_loss": -7.050393104553223, "global_step": 153095, "epoch": 3645} {"train_loss": -6.867384910583496, "global_step": 153096, "epoch": 3645} {"train_loss": -6.965817451477051, "global_step": 153097, "epoch": 3645} {"train_loss": -6.92933988571167, "global_step": 153098, "epoch": 3645} {"train_loss": -6.8339738845825195, "global_step": 153099, "epoch": 3645} {"train_loss": -6.870774745941162, "global_step": 153100, "epoch": 3645} {"train_loss": -6.8586273193359375, "global_step": 153101, "epoch": 3645} {"train_loss": -7.026219844818115, "global_step": 153102, "epoch": 3645} {"train_loss": -6.814775466918945, "global_step": 153103, "epoch": 3645} {"train_loss": -6.846380710601807, "global_step": 153104, "epoch": 3645} {"train_loss": -6.843194484710693, "global_step": 153105, "epoch": 3645} {"train_loss": -6.991546154022217, "global_step": 153106, "epoch": 3645} {"train_loss": -7.006115913391113, "global_step": 153107, "epoch": 3645} {"train_loss": -6.94766092300415, "global_step": 153108, "epoch": 3645} {"train_loss": -6.947118759155273, "global_step": 153109, "epoch": 3645} {"train_loss": -6.845344543457031, "global_step": 153110, "epoch": 3645} {"train_loss": -6.842950820922852, "global_step": 153111, "epoch": 3645} {"train_loss": -6.837026596069336, "global_step": 153112, "epoch": 3645} {"train_loss": -6.854538917541504, "global_step": 153113, "epoch": 3645} {"train_loss": -7.041858196258545, "global_step": 153114, "epoch": 3645} {"train_loss": -6.8286452293396, "global_step": 153115, "epoch": 3645} {"train_loss": -6.8644914627075195, "global_step": 153116, "epoch": 3645} {"train_loss": -6.881228446960449, "global_step": 153117, "epoch": 3645} {"train_loss": -6.801826477050781, "global_step": 153118, "epoch": 3645} {"train_loss": -6.844579219818115, "global_step": 153119, "epoch": 3645} {"train_loss": -6.806657791137695, "global_step": 153120, "epoch": 3645} {"train_loss": -6.846540451049805, "global_step": 153121, "epoch": 3645} {"train_loss": -6.949231147766113, "global_step": 153122, "epoch": 3645} {"train_loss": -6.84998893737793, "global_step": 153123, "epoch": 3645} {"train_loss": -6.84794807434082, "global_step": 153124, "epoch": 3645} {"train_loss": -6.906840801239014, "global_step": 153125, "epoch": 3645} {"train_loss": -6.844001770019531, "global_step": 153126, "epoch": 3645} {"train_loss": -6.782037734985352, "global_step": 153127, "epoch": 3645} {"train_loss": -6.930119514465332, "global_step": 153128, "epoch": 3645} {"train_loss": -6.75683069229126, "global_step": 153129, "epoch": 3645} {"train_loss": -6.878596305847168, "global_step": 153130, "epoch": 3645} {"train_loss": -6.890783264523461, "global_step": 153131, "epoch": 3645, "val_loss": 79115.21875} {"train_loss": -6.838239669799805, "global_step": 153132, "epoch": 3646} {"train_loss": -6.908915042877197, "global_step": 153133, "epoch": 3646} {"train_loss": -6.931842803955078, "global_step": 153134, "epoch": 3646} {"train_loss": -6.99554967880249, "global_step": 153135, "epoch": 3646} {"train_loss": -7.017327308654785, "global_step": 153136, "epoch": 3646} {"train_loss": -6.943244457244873, "global_step": 153137, "epoch": 3646} {"train_loss": -6.861058235168457, "global_step": 153138, "epoch": 3646} {"train_loss": -7.029474258422852, "global_step": 153139, "epoch": 3646} {"train_loss": -6.887062072753906, "global_step": 153140, "epoch": 3646} {"train_loss": -6.931148529052734, "global_step": 153141, "epoch": 3646} {"train_loss": -6.911694049835205, "global_step": 153142, "epoch": 3646} {"train_loss": -6.887187957763672, "global_step": 153143, "epoch": 3646} {"train_loss": -7.030428409576416, "global_step": 153144, "epoch": 3646} {"train_loss": -6.8775787353515625, "global_step": 153145, "epoch": 3646} {"train_loss": -6.854374885559082, "global_step": 153146, "epoch": 3646} {"train_loss": -6.812605857849121, "global_step": 153147, "epoch": 3646} {"train_loss": -6.86339807510376, "global_step": 153148, "epoch": 3646} {"train_loss": -6.912043571472168, "global_step": 153149, "epoch": 3646} {"train_loss": -6.862783432006836, "global_step": 153150, "epoch": 3646} {"train_loss": -6.89615535736084, "global_step": 153151, "epoch": 3646} {"train_loss": -7.005414962768555, "global_step": 153152, "epoch": 3646} {"train_loss": -6.897627830505371, "global_step": 153153, "epoch": 3646} {"train_loss": -7.005582809448242, "global_step": 153154, "epoch": 3646} {"train_loss": -6.907066822052002, "global_step": 153155, "epoch": 3646} {"train_loss": -6.9175496101379395, "global_step": 153156, "epoch": 3646} {"train_loss": -6.910882949829102, "global_step": 153157, "epoch": 3646} {"train_loss": -6.994455814361572, "global_step": 153158, "epoch": 3646} {"train_loss": -6.949670314788818, "global_step": 153159, "epoch": 3646} {"train_loss": -6.908545970916748, "global_step": 153160, "epoch": 3646} {"train_loss": -6.84885311126709, "global_step": 153161, "epoch": 3646} {"train_loss": -6.912576675415039, "global_step": 153162, "epoch": 3646} {"train_loss": -6.958410739898682, "global_step": 153163, "epoch": 3646} {"train_loss": -6.883059024810791, "global_step": 153164, "epoch": 3646} {"train_loss": -6.93354606628418, "global_step": 153165, "epoch": 3646} {"train_loss": -6.910805702209473, "global_step": 153166, "epoch": 3646} {"train_loss": -6.908028602600098, "global_step": 153167, "epoch": 3646} {"train_loss": -6.901401996612549, "global_step": 153168, "epoch": 3646} {"train_loss": -6.895258903503418, "global_step": 153169, "epoch": 3646} {"train_loss": -6.919992446899414, "global_step": 153170, "epoch": 3646} {"train_loss": -6.955029487609863, "global_step": 153171, "epoch": 3646} {"train_loss": -6.853761672973633, "global_step": 153172, "epoch": 3646} {"train_loss": -6.917890332994007, "global_step": 153173, "epoch": 3646, "val_loss": 78989.03125} {"train_loss": -6.8585615158081055, "global_step": 153174, "epoch": 3647} {"train_loss": -7.022652626037598, "global_step": 153175, "epoch": 3647} {"train_loss": -6.851146221160889, "global_step": 153176, "epoch": 3647} {"train_loss": -6.8265581130981445, "global_step": 153177, "epoch": 3647} {"train_loss": -6.831789970397949, "global_step": 153178, "epoch": 3647} {"train_loss": -6.646992206573486, "global_step": 153179, "epoch": 3647} {"train_loss": -6.837497711181641, "global_step": 153180, "epoch": 3647} {"train_loss": -6.937301158905029, "global_step": 153181, "epoch": 3647} {"train_loss": -6.771544456481934, "global_step": 153182, "epoch": 3647} {"train_loss": -6.773334503173828, "global_step": 153183, "epoch": 3647} {"train_loss": -6.859312057495117, "global_step": 153184, "epoch": 3647} {"train_loss": -6.957035541534424, "global_step": 153185, "epoch": 3647} {"train_loss": -6.8093414306640625, "global_step": 153186, "epoch": 3647} {"train_loss": -6.7589263916015625, "global_step": 153187, "epoch": 3647} {"train_loss": -6.838996887207031, "global_step": 153188, "epoch": 3647} {"train_loss": -6.7734761238098145, "global_step": 153189, "epoch": 3647} {"train_loss": -6.836833953857422, "global_step": 153190, "epoch": 3647} {"train_loss": -6.9165520668029785, "global_step": 153191, "epoch": 3647} {"train_loss": -6.805253982543945, "global_step": 153192, "epoch": 3647} {"train_loss": -6.78317403793335, "global_step": 153193, "epoch": 3647} {"train_loss": -6.907547950744629, "global_step": 153194, "epoch": 3647} {"train_loss": -6.88339900970459, "global_step": 153195, "epoch": 3647} {"train_loss": -7.017569541931152, "global_step": 153196, "epoch": 3647} {"train_loss": -6.967916965484619, "global_step": 153197, "epoch": 3647} {"train_loss": -6.9083757400512695, "global_step": 153198, "epoch": 3647} {"train_loss": -6.989712715148926, "global_step": 153199, "epoch": 3647} {"train_loss": -6.8942413330078125, "global_step": 153200, "epoch": 3647} {"train_loss": -6.924126148223877, "global_step": 153201, "epoch": 3647} {"train_loss": -6.90757417678833, "global_step": 153202, "epoch": 3647} {"train_loss": -6.969803810119629, "global_step": 153203, "epoch": 3647} {"train_loss": -6.960418701171875, "global_step": 153204, "epoch": 3647} {"train_loss": -6.8762288093566895, "global_step": 153205, "epoch": 3647} {"train_loss": -6.932089805603027, "global_step": 153206, "epoch": 3647} {"train_loss": -6.941439628601074, "global_step": 153207, "epoch": 3647} {"train_loss": -6.8940229415893555, "global_step": 153208, "epoch": 3647} {"train_loss": -6.802775859832764, "global_step": 153209, "epoch": 3647} {"train_loss": -6.940058708190918, "global_step": 153210, "epoch": 3647} {"train_loss": -6.925069808959961, "global_step": 153211, "epoch": 3647} {"train_loss": -7.013932228088379, "global_step": 153212, "epoch": 3647} {"train_loss": -6.879818439483643, "global_step": 153213, "epoch": 3647} {"train_loss": -6.803550720214844, "global_step": 153214, "epoch": 3647} {"train_loss": -6.881540411994571, "global_step": 153215, "epoch": 3647, "val_loss": 79020.0} {"train_loss": -6.9225029945373535, "global_step": 153216, "epoch": 3648} {"train_loss": -6.988203048706055, "global_step": 153217, "epoch": 3648} {"train_loss": -6.96392297744751, "global_step": 153218, "epoch": 3648} {"train_loss": -6.821935653686523, "global_step": 153219, "epoch": 3648} {"train_loss": -6.937185287475586, "global_step": 153220, "epoch": 3648} {"train_loss": -6.8814473152160645, "global_step": 153221, "epoch": 3648} {"train_loss": -6.928682327270508, "global_step": 153222, "epoch": 3648} {"train_loss": -6.866517543792725, "global_step": 153223, "epoch": 3648} {"train_loss": -6.977901458740234, "global_step": 153224, "epoch": 3648} {"train_loss": -6.963860511779785, "global_step": 153225, "epoch": 3648} {"train_loss": -6.808846473693848, "global_step": 153226, "epoch": 3648} {"train_loss": -6.960791110992432, "global_step": 153227, "epoch": 3648} {"train_loss": -6.9403486251831055, "global_step": 153228, "epoch": 3648} {"train_loss": -6.808956623077393, "global_step": 153229, "epoch": 3648} {"train_loss": -6.94517183303833, "global_step": 153230, "epoch": 3648} {"train_loss": -6.824450492858887, "global_step": 153231, "epoch": 3648} {"train_loss": -6.930034160614014, "global_step": 153232, "epoch": 3648} {"train_loss": -6.896148681640625, "global_step": 153233, "epoch": 3648} {"train_loss": -6.775964736938477, "global_step": 153234, "epoch": 3648} {"train_loss": -6.883650779724121, "global_step": 153235, "epoch": 3648} {"train_loss": -6.882776737213135, "global_step": 153236, "epoch": 3648} {"train_loss": -6.840028285980225, "global_step": 153237, "epoch": 3648} {"train_loss": -6.887118339538574, "global_step": 153238, "epoch": 3648} {"train_loss": -6.7936906814575195, "global_step": 153239, "epoch": 3648} {"train_loss": -6.913113594055176, "global_step": 153240, "epoch": 3648} {"train_loss": -6.8748016357421875, "global_step": 153241, "epoch": 3648} {"train_loss": -6.963976860046387, "global_step": 153242, "epoch": 3648} {"train_loss": -6.849662780761719, "global_step": 153243, "epoch": 3648} {"train_loss": -6.8673295974731445, "global_step": 153244, "epoch": 3648} {"train_loss": -6.845178604125977, "global_step": 153245, "epoch": 3648} {"train_loss": -6.813154697418213, "global_step": 153246, "epoch": 3648} {"train_loss": -6.865413665771484, "global_step": 153247, "epoch": 3648} {"train_loss": -6.8967437744140625, "global_step": 153248, "epoch": 3648} {"train_loss": -6.8720622062683105, "global_step": 153249, "epoch": 3648} {"train_loss": -6.735271453857422, "global_step": 153250, "epoch": 3648} {"train_loss": -6.84246826171875, "global_step": 153251, "epoch": 3648} {"train_loss": -6.920419692993164, "global_step": 153252, "epoch": 3648} {"train_loss": -6.87119722366333, "global_step": 153253, "epoch": 3648} {"train_loss": -6.911914348602295, "global_step": 153254, "epoch": 3648} {"train_loss": -6.871206283569336, "global_step": 153255, "epoch": 3648} {"train_loss": -6.914478302001953, "global_step": 153256, "epoch": 3648} {"train_loss": -6.880250522068569, "global_step": 153257, "epoch": 3648, "val_loss": 78989.7578125} {"train_loss": -6.918487071990967, "global_step": 153258, "epoch": 3649} {"train_loss": -6.920717239379883, "global_step": 153259, "epoch": 3649} {"train_loss": -6.902190208435059, "global_step": 153260, "epoch": 3649} {"train_loss": -6.914283752441406, "global_step": 153261, "epoch": 3649} {"train_loss": -6.960198879241943, "global_step": 153262, "epoch": 3649} {"train_loss": -7.042891502380371, "global_step": 153263, "epoch": 3649} {"train_loss": -6.835446357727051, "global_step": 153264, "epoch": 3649} {"train_loss": -6.962770938873291, "global_step": 153265, "epoch": 3649} {"train_loss": -6.966207981109619, "global_step": 153266, "epoch": 3649} {"train_loss": -6.841744422912598, "global_step": 153267, "epoch": 3649} {"train_loss": -6.957664966583252, "global_step": 153268, "epoch": 3649} {"train_loss": -6.848015308380127, "global_step": 153269, "epoch": 3649} {"train_loss": -6.990257263183594, "global_step": 153270, "epoch": 3649} {"train_loss": -6.89540433883667, "global_step": 153271, "epoch": 3649} {"train_loss": -6.7947797775268555, "global_step": 153272, "epoch": 3649} {"train_loss": -6.852758884429932, "global_step": 153273, "epoch": 3649} {"train_loss": -6.902231693267822, "global_step": 153274, "epoch": 3649} {"train_loss": -6.9495038986206055, "global_step": 153275, "epoch": 3649} {"train_loss": -6.837158203125, "global_step": 153276, "epoch": 3649} {"train_loss": -6.871006965637207, "global_step": 153277, "epoch": 3649} {"train_loss": -6.938099384307861, "global_step": 153278, "epoch": 3649} {"train_loss": -6.982320785522461, "global_step": 153279, "epoch": 3649} {"train_loss": -6.821035861968994, "global_step": 153280, "epoch": 3649} {"train_loss": -6.867792129516602, "global_step": 153281, "epoch": 3649} {"train_loss": -6.89506721496582, "global_step": 153282, "epoch": 3649} {"train_loss": -6.904314994812012, "global_step": 153283, "epoch": 3649} {"train_loss": -6.918315887451172, "global_step": 153284, "epoch": 3649} {"train_loss": -6.844344139099121, "global_step": 153285, "epoch": 3649} {"train_loss": -6.860339641571045, "global_step": 153286, "epoch": 3649} {"train_loss": -6.726762294769287, "global_step": 153287, "epoch": 3649} {"train_loss": -6.777989387512207, "global_step": 153288, "epoch": 3649} {"train_loss": -6.823360443115234, "global_step": 153289, "epoch": 3649} {"train_loss": -6.7960100173950195, "global_step": 153290, "epoch": 3649} {"train_loss": -6.754246234893799, "global_step": 153291, "epoch": 3649} {"train_loss": -6.823243141174316, "global_step": 153292, "epoch": 3649} {"train_loss": -6.914731025695801, "global_step": 153293, "epoch": 3649} {"train_loss": -6.836266040802002, "global_step": 153294, "epoch": 3649} {"train_loss": -6.8286004066467285, "global_step": 153295, "epoch": 3649} {"train_loss": -6.846057891845703, "global_step": 153296, "epoch": 3649} {"train_loss": -6.872077941894531, "global_step": 153297, "epoch": 3649} {"train_loss": -6.891545295715332, "global_step": 153298, "epoch": 3649} {"train_loss": -6.8818423975081675, "global_step": 153299, "epoch": 3649, "val_loss": 79135.3359375} {"train_loss": -6.7194390296936035, "global_step": 153300, "epoch": 3650} {"train_loss": -6.913671970367432, "global_step": 153301, "epoch": 3650} {"train_loss": -6.854508399963379, "global_step": 153302, "epoch": 3650} {"train_loss": -6.927661895751953, "global_step": 153303, "epoch": 3650} {"train_loss": -6.813469409942627, "global_step": 153304, "epoch": 3650} {"train_loss": -6.880029678344727, "global_step": 153305, "epoch": 3650} {"train_loss": -6.778572082519531, "global_step": 153306, "epoch": 3650} {"train_loss": -6.702240467071533, "global_step": 153307, "epoch": 3650} {"train_loss": -6.7811713218688965, "global_step": 153308, "epoch": 3650} {"train_loss": -6.707737922668457, "global_step": 153309, "epoch": 3650} {"train_loss": -6.846022605895996, "global_step": 153310, "epoch": 3650} {"train_loss": -6.782159805297852, "global_step": 153311, "epoch": 3650} {"train_loss": -6.908838272094727, "global_step": 153312, "epoch": 3650} {"train_loss": -6.937582969665527, "global_step": 153313, "epoch": 3650} {"train_loss": -6.777851104736328, "global_step": 153314, "epoch": 3650} {"train_loss": -6.7823567390441895, "global_step": 153315, "epoch": 3650} {"train_loss": -6.847428321838379, "global_step": 153316, "epoch": 3650} {"train_loss": -6.904702186584473, "global_step": 153317, "epoch": 3650} {"train_loss": -6.891663551330566, "global_step": 153318, "epoch": 3650} {"train_loss": -6.815899848937988, "global_step": 153319, "epoch": 3650} {"train_loss": -6.862054347991943, "global_step": 153320, "epoch": 3650} {"train_loss": -6.868196487426758, "global_step": 153321, "epoch": 3650} {"train_loss": -6.761242866516113, "global_step": 153322, "epoch": 3650} {"train_loss": -6.836392879486084, "global_step": 153323, "epoch": 3650} {"train_loss": -6.972714424133301, "global_step": 153324, "epoch": 3650} {"train_loss": -6.961991786956787, "global_step": 153325, "epoch": 3650} {"train_loss": -6.825804710388184, "global_step": 153326, "epoch": 3650} {"train_loss": -6.9055376052856445, "global_step": 153327, "epoch": 3650} {"train_loss": -6.908931732177734, "global_step": 153328, "epoch": 3650} {"train_loss": -6.821494102478027, "global_step": 153329, "epoch": 3650} {"train_loss": -6.758646488189697, "global_step": 153330, "epoch": 3650} {"train_loss": -6.838713645935059, "global_step": 153331, "epoch": 3650} {"train_loss": -6.9154558181762695, "global_step": 153332, "epoch": 3650} {"train_loss": -6.769993782043457, "global_step": 153333, "epoch": 3650} {"train_loss": -6.909334182739258, "global_step": 153334, "epoch": 3650} {"train_loss": -6.8394083976745605, "global_step": 153335, "epoch": 3650} {"train_loss": -6.875822067260742, "global_step": 153336, "epoch": 3650} {"train_loss": -6.89945125579834, "global_step": 153337, "epoch": 3650} {"train_loss": -6.804482460021973, "global_step": 153338, "epoch": 3650} {"train_loss": -6.866147041320801, "global_step": 153339, "epoch": 3650} {"train_loss": -6.836478233337402, "global_step": 153340, "epoch": 3650} {"train_loss": -6.84359259832473, "global_step": 153341, "epoch": 3650, "train/sim_max_reward_0": 0.9101069308982744, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.4429729140595867, "train/sim_max_reward_3": 0.16353836883572262, "train/sim_max_reward_4": 0.9925595430684263, "train/sim_max_reward_5": 0.5720870570230563, "test/sim_max_reward_4500000": 0.9280996454996158, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9971291691499795, "test/sim_max_reward_4500003": 1.0, "test/sim_max_reward_4500004": 0.10146167233984504, "test/sim_max_reward_4500005": 0.8681656459542415, "test/sim_max_reward_4500006": 0.9385514662096561, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.9279602884512823, "test/sim_max_reward_4500009": 0.05338886244506898, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9805148950516943, "test/sim_max_reward_4500012": 0.8971333263398065, "test/sim_max_reward_4500013": 0.003887954713421722, "test/sim_max_reward_4500014": 0.4233860366342443, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.2662043657961781, "test/sim_max_reward_4500018": 0.4902565457329739, "test/sim_max_reward_4500019": 0.8566530770482169, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.7971479599214463, "test/sim_max_reward_4500022": 0.46464249911401384, "test/sim_max_reward_4500023": 0.5534352706784939, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8742861252553209, "test/sim_max_reward_4500026": 0.9288856717603766, "test/sim_max_reward_4500027": 0.9344935334734935, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.05001327984708833, "test/sim_max_reward_4500030": 0.8182019351787142, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.7343873197459613, "test/sim_max_reward_4500035": 0.9687981668701614, "test/sim_max_reward_4500036": 1.0, "test/sim_max_reward_4500037": 0.829183738429664, "test/sim_max_reward_4500038": 0.31709969931654486, "test/sim_max_reward_4500039": 0.9361456914536302, "test/sim_max_reward_4500040": 0.9977945076530758, "test/sim_max_reward_4500041": 0.7198634868538206, "test/sim_max_reward_4500042": 0.021334721715024974, "test/sim_max_reward_4500043": 0.33849825151144547, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9168133299213367, "test/sim_max_reward_4500046": 0.28947743437019435, "test/sim_max_reward_4500047": 0.9295727119644388, "test/sim_max_reward_4500048": 0.9823444735033795, "test/sim_max_reward_4500049": 0.9605843726769518, "train/mean_score": 0.6802108023141779, "test/mean_score": 0.5669630273309495, "val_loss": 78983.28125} {"train_loss": -6.952720642089844, "global_step": 153342, "epoch": 3651} {"train_loss": -6.833627700805664, "global_step": 153343, "epoch": 3651} {"train_loss": -6.89729118347168, "global_step": 153344, "epoch": 3651} {"train_loss": -6.886085033416748, "global_step": 153345, "epoch": 3651} {"train_loss": -6.7711920738220215, "global_step": 153346, "epoch": 3651} {"train_loss": -6.858841896057129, "global_step": 153347, "epoch": 3651} {"train_loss": -6.878316879272461, "global_step": 153348, "epoch": 3651} {"train_loss": -6.9277191162109375, "global_step": 153349, "epoch": 3651} {"train_loss": -6.8458251953125, "global_step": 153350, "epoch": 3651} {"train_loss": -6.883101940155029, "global_step": 153351, "epoch": 3651} {"train_loss": -6.930758476257324, "global_step": 153352, "epoch": 3651} {"train_loss": -6.8252692222595215, "global_step": 153353, "epoch": 3651} {"train_loss": -6.914628982543945, "global_step": 153354, "epoch": 3651} {"train_loss": -6.759922027587891, "global_step": 153355, "epoch": 3651} {"train_loss": -6.882349967956543, "global_step": 153356, "epoch": 3651} {"train_loss": -6.924447536468506, "global_step": 153357, "epoch": 3651} {"train_loss": -6.818681716918945, "global_step": 153358, "epoch": 3651} {"train_loss": -6.929776668548584, "global_step": 153359, "epoch": 3651} {"train_loss": -6.8643693923950195, "global_step": 153360, "epoch": 3651} {"train_loss": -6.963229179382324, "global_step": 153361, "epoch": 3651} {"train_loss": -6.8587446212768555, "global_step": 153362, "epoch": 3651} {"train_loss": -6.9018754959106445, "global_step": 153363, "epoch": 3651} {"train_loss": -6.854257106781006, "global_step": 153364, "epoch": 3651} {"train_loss": -6.884160041809082, "global_step": 153365, "epoch": 3651} {"train_loss": -6.799014568328857, "global_step": 153366, "epoch": 3651} {"train_loss": -6.880161285400391, "global_step": 153367, "epoch": 3651} {"train_loss": -6.829985618591309, "global_step": 153368, "epoch": 3651} {"train_loss": -6.828742027282715, "global_step": 153369, "epoch": 3651} {"train_loss": -6.845974445343018, "global_step": 153370, "epoch": 3651} {"train_loss": -6.819166660308838, "global_step": 153371, "epoch": 3651} {"train_loss": -6.830870628356934, "global_step": 153372, "epoch": 3651} {"train_loss": -6.8357930183410645, "global_step": 153373, "epoch": 3651} {"train_loss": -6.752846717834473, "global_step": 153374, "epoch": 3651} {"train_loss": -6.957854747772217, "global_step": 153375, "epoch": 3651} {"train_loss": -6.864571571350098, "global_step": 153376, "epoch": 3651} {"train_loss": -6.882034778594971, "global_step": 153377, "epoch": 3651} {"train_loss": -6.873725414276123, "global_step": 153378, "epoch": 3651} {"train_loss": -6.9094696044921875, "global_step": 153379, "epoch": 3651} {"train_loss": -6.909313678741455, "global_step": 153380, "epoch": 3651} {"train_loss": -6.771397113800049, "global_step": 153381, "epoch": 3651} {"train_loss": -6.915266513824463, "global_step": 153382, "epoch": 3651} {"train_loss": -6.8646023614065985, "global_step": 153383, "epoch": 3651, "val_loss": 78928.2734375} {"train_loss": -6.901902198791504, "global_step": 153384, "epoch": 3652} {"train_loss": -6.844449043273926, "global_step": 153385, "epoch": 3652} {"train_loss": -6.883851051330566, "global_step": 153386, "epoch": 3652} {"train_loss": -6.829015254974365, "global_step": 153387, "epoch": 3652} {"train_loss": -6.809229850769043, "global_step": 153388, "epoch": 3652} {"train_loss": -6.886928558349609, "global_step": 153389, "epoch": 3652} {"train_loss": -6.899857521057129, "global_step": 153390, "epoch": 3652} {"train_loss": -6.823760509490967, "global_step": 153391, "epoch": 3652} {"train_loss": -6.922854900360107, "global_step": 153392, "epoch": 3652} {"train_loss": -6.935089111328125, "global_step": 153393, "epoch": 3652} {"train_loss": -6.869887351989746, "global_step": 153394, "epoch": 3652} {"train_loss": -6.929216384887695, "global_step": 153395, "epoch": 3652} {"train_loss": -6.938650131225586, "global_step": 153396, "epoch": 3652} {"train_loss": -6.926165580749512, "global_step": 153397, "epoch": 3652} {"train_loss": -6.895607948303223, "global_step": 153398, "epoch": 3652} {"train_loss": -6.965124607086182, "global_step": 153399, "epoch": 3652} {"train_loss": -6.923440933227539, "global_step": 153400, "epoch": 3652} {"train_loss": -6.896714210510254, "global_step": 153401, "epoch": 3652} {"train_loss": -6.944685935974121, "global_step": 153402, "epoch": 3652} {"train_loss": -7.043401718139648, "global_step": 153403, "epoch": 3652} {"train_loss": -6.8982343673706055, "global_step": 153404, "epoch": 3652} {"train_loss": -6.909055233001709, "global_step": 153405, "epoch": 3652} {"train_loss": -6.931752681732178, "global_step": 153406, "epoch": 3652} {"train_loss": -6.982569694519043, "global_step": 153407, "epoch": 3652} {"train_loss": -6.9461517333984375, "global_step": 153408, "epoch": 3652} {"train_loss": -6.966625213623047, "global_step": 153409, "epoch": 3652} {"train_loss": -7.007720470428467, "global_step": 153410, "epoch": 3652} {"train_loss": -7.05804443359375, "global_step": 153411, "epoch": 3652} {"train_loss": -6.892943382263184, "global_step": 153412, "epoch": 3652} {"train_loss": -6.856621265411377, "global_step": 153413, "epoch": 3652} {"train_loss": -6.932894706726074, "global_step": 153414, "epoch": 3652} {"train_loss": -6.930911064147949, "global_step": 153415, "epoch": 3652} {"train_loss": -6.928903579711914, "global_step": 153416, "epoch": 3652} {"train_loss": -6.897249221801758, "global_step": 153417, "epoch": 3652} {"train_loss": -7.012731552124023, "global_step": 153418, "epoch": 3652} {"train_loss": -6.964048862457275, "global_step": 153419, "epoch": 3652} {"train_loss": -6.929803848266602, "global_step": 153420, "epoch": 3652} {"train_loss": -6.98729944229126, "global_step": 153421, "epoch": 3652} {"train_loss": -6.965914726257324, "global_step": 153422, "epoch": 3652} {"train_loss": -6.9417924880981445, "global_step": 153423, "epoch": 3652} {"train_loss": -6.899013519287109, "global_step": 153424, "epoch": 3652} {"train_loss": -6.922565834862845, "global_step": 153425, "epoch": 3652, "val_loss": 78819.3359375} {"train_loss": -7.0182671546936035, "global_step": 153426, "epoch": 3653} {"train_loss": -7.003600120544434, "global_step": 153427, "epoch": 3653} {"train_loss": -6.97532844543457, "global_step": 153428, "epoch": 3653} {"train_loss": -6.947630882263184, "global_step": 153429, "epoch": 3653} {"train_loss": -7.017649173736572, "global_step": 153430, "epoch": 3653} {"train_loss": -6.9126996994018555, "global_step": 153431, "epoch": 3653} {"train_loss": -7.010445594787598, "global_step": 153432, "epoch": 3653} {"train_loss": -6.845296382904053, "global_step": 153433, "epoch": 3653} {"train_loss": -6.883151054382324, "global_step": 153434, "epoch": 3653} {"train_loss": -6.913493633270264, "global_step": 153435, "epoch": 3653} {"train_loss": -6.927386283874512, "global_step": 153436, "epoch": 3653} {"train_loss": -6.753392696380615, "global_step": 153437, "epoch": 3653} {"train_loss": -6.870885848999023, "global_step": 153438, "epoch": 3653} {"train_loss": -6.973875045776367, "global_step": 153439, "epoch": 3653} {"train_loss": -6.833965301513672, "global_step": 153440, "epoch": 3653} {"train_loss": -6.970686435699463, "global_step": 153441, "epoch": 3653} {"train_loss": -7.0145463943481445, "global_step": 153442, "epoch": 3653} {"train_loss": -6.768324375152588, "global_step": 153443, "epoch": 3653} {"train_loss": -6.906071662902832, "global_step": 153444, "epoch": 3653} {"train_loss": -6.959830284118652, "global_step": 153445, "epoch": 3653} {"train_loss": -6.883749008178711, "global_step": 153446, "epoch": 3653} {"train_loss": -6.887817859649658, "global_step": 153447, "epoch": 3653} {"train_loss": -6.825927734375, "global_step": 153448, "epoch": 3653} {"train_loss": -6.827251434326172, "global_step": 153449, "epoch": 3653} {"train_loss": -6.9359354972839355, "global_step": 153450, "epoch": 3653} {"train_loss": -6.889551162719727, "global_step": 153451, "epoch": 3653} {"train_loss": -6.987937927246094, "global_step": 153452, "epoch": 3653} {"train_loss": -6.923666477203369, "global_step": 153453, "epoch": 3653} {"train_loss": -7.006042003631592, "global_step": 153454, "epoch": 3653} {"train_loss": -6.988345146179199, "global_step": 153455, "epoch": 3653} {"train_loss": -6.927579879760742, "global_step": 153456, "epoch": 3653} {"train_loss": -6.94273042678833, "global_step": 153457, "epoch": 3653} {"train_loss": -6.927539825439453, "global_step": 153458, "epoch": 3653} {"train_loss": -6.946299076080322, "global_step": 153459, "epoch": 3653} {"train_loss": -7.0000505447387695, "global_step": 153460, "epoch": 3653} {"train_loss": -6.898578643798828, "global_step": 153461, "epoch": 3653} {"train_loss": -6.888673782348633, "global_step": 153462, "epoch": 3653} {"train_loss": -6.96525764465332, "global_step": 153463, "epoch": 3653} {"train_loss": -6.886720657348633, "global_step": 153464, "epoch": 3653} {"train_loss": -6.751591682434082, "global_step": 153465, "epoch": 3653} {"train_loss": -6.911447525024414, "global_step": 153466, "epoch": 3653} {"train_loss": -6.917585509163993, "global_step": 153467, "epoch": 3653, "val_loss": 78845.40625} {"train_loss": -6.874370574951172, "global_step": 153468, "epoch": 3654} {"train_loss": -6.964580535888672, "global_step": 153469, "epoch": 3654} {"train_loss": -6.935880661010742, "global_step": 153470, "epoch": 3654} {"train_loss": -6.890408515930176, "global_step": 153471, "epoch": 3654} {"train_loss": -6.844740867614746, "global_step": 153472, "epoch": 3654} {"train_loss": -7.037657737731934, "global_step": 153473, "epoch": 3654} {"train_loss": -6.854010581970215, "global_step": 153474, "epoch": 3654} {"train_loss": -6.843768119812012, "global_step": 153475, "epoch": 3654} {"train_loss": -7.016953468322754, "global_step": 153476, "epoch": 3654} {"train_loss": -6.797693252563477, "global_step": 153477, "epoch": 3654} {"train_loss": -6.874597549438477, "global_step": 153478, "epoch": 3654} {"train_loss": -6.859443664550781, "global_step": 153479, "epoch": 3654} {"train_loss": -6.887082099914551, "global_step": 153480, "epoch": 3654} {"train_loss": -6.962708473205566, "global_step": 153481, "epoch": 3654} {"train_loss": -6.869436740875244, "global_step": 153482, "epoch": 3654} {"train_loss": -6.97182559967041, "global_step": 153483, "epoch": 3654} {"train_loss": -6.954057216644287, "global_step": 153484, "epoch": 3654} {"train_loss": -6.936344146728516, "global_step": 153485, "epoch": 3654} {"train_loss": -7.007486820220947, "global_step": 153486, "epoch": 3654} {"train_loss": -6.829470634460449, "global_step": 153487, "epoch": 3654} {"train_loss": -6.867809295654297, "global_step": 153488, "epoch": 3654} {"train_loss": -6.9268798828125, "global_step": 153489, "epoch": 3654} {"train_loss": -6.83116340637207, "global_step": 153490, "epoch": 3654} {"train_loss": -7.053295135498047, "global_step": 153491, "epoch": 3654} {"train_loss": -6.857357025146484, "global_step": 153492, "epoch": 3654} {"train_loss": -7.009172439575195, "global_step": 153493, "epoch": 3654} {"train_loss": -7.033724308013916, "global_step": 153494, "epoch": 3654} {"train_loss": -6.797007083892822, "global_step": 153495, "epoch": 3654} {"train_loss": -6.99384880065918, "global_step": 153496, "epoch": 3654} {"train_loss": -6.943960666656494, "global_step": 153497, "epoch": 3654} {"train_loss": -7.0036211013793945, "global_step": 153498, "epoch": 3654} {"train_loss": -6.974290370941162, "global_step": 153499, "epoch": 3654} {"train_loss": -6.831235408782959, "global_step": 153500, "epoch": 3654} {"train_loss": -6.924410820007324, "global_step": 153501, "epoch": 3654} {"train_loss": -6.859649658203125, "global_step": 153502, "epoch": 3654} {"train_loss": -6.841309547424316, "global_step": 153503, "epoch": 3654} {"train_loss": -6.888739585876465, "global_step": 153504, "epoch": 3654} {"train_loss": -7.00630521774292, "global_step": 153505, "epoch": 3654} {"train_loss": -6.919638633728027, "global_step": 153506, "epoch": 3654} {"train_loss": -6.874094009399414, "global_step": 153507, "epoch": 3654} {"train_loss": -6.918336868286133, "global_step": 153508, "epoch": 3654} {"train_loss": -6.913784038452875, "global_step": 153509, "epoch": 3654, "val_loss": 78758.6484375} {"train_loss": -6.957469940185547, "global_step": 153510, "epoch": 3655} {"train_loss": -7.025669097900391, "global_step": 153511, "epoch": 3655} {"train_loss": -6.921682357788086, "global_step": 153512, "epoch": 3655} {"train_loss": -7.0298566818237305, "global_step": 153513, "epoch": 3655} {"train_loss": -6.900620460510254, "global_step": 153514, "epoch": 3655} {"train_loss": -6.7878899574279785, "global_step": 153515, "epoch": 3655} {"train_loss": -6.905765533447266, "global_step": 153516, "epoch": 3655} {"train_loss": -6.943624496459961, "global_step": 153517, "epoch": 3655} {"train_loss": -6.832736492156982, "global_step": 153518, "epoch": 3655} {"train_loss": -6.859367847442627, "global_step": 153519, "epoch": 3655} {"train_loss": -6.885573387145996, "global_step": 153520, "epoch": 3655} {"train_loss": -6.895627021789551, "global_step": 153521, "epoch": 3655} {"train_loss": -6.794160842895508, "global_step": 153522, "epoch": 3655} {"train_loss": -6.781678199768066, "global_step": 153523, "epoch": 3655} {"train_loss": -6.821796894073486, "global_step": 153524, "epoch": 3655} {"train_loss": -6.6768693923950195, "global_step": 153525, "epoch": 3655} {"train_loss": -6.827642917633057, "global_step": 153526, "epoch": 3655} {"train_loss": -6.854660987854004, "global_step": 153527, "epoch": 3655} {"train_loss": -6.961519718170166, "global_step": 153528, "epoch": 3655} {"train_loss": -6.885228157043457, "global_step": 153529, "epoch": 3655} {"train_loss": -6.869090557098389, "global_step": 153530, "epoch": 3655} {"train_loss": -6.842742443084717, "global_step": 153531, "epoch": 3655} {"train_loss": -6.86529016494751, "global_step": 153532, "epoch": 3655} {"train_loss": -6.806715965270996, "global_step": 153533, "epoch": 3655} {"train_loss": -6.842231750488281, "global_step": 153534, "epoch": 3655} {"train_loss": -6.828709602355957, "global_step": 153535, "epoch": 3655} {"train_loss": -6.882052421569824, "global_step": 153536, "epoch": 3655} {"train_loss": -6.804683208465576, "global_step": 153537, "epoch": 3655} {"train_loss": -6.649735450744629, "global_step": 153538, "epoch": 3655} {"train_loss": -6.921334266662598, "global_step": 153539, "epoch": 3655} {"train_loss": -6.758022308349609, "global_step": 153540, "epoch": 3655} {"train_loss": -6.920633792877197, "global_step": 153541, "epoch": 3655} {"train_loss": -6.879430294036865, "global_step": 153542, "epoch": 3655} {"train_loss": -6.702874660491943, "global_step": 153543, "epoch": 3655} {"train_loss": -6.806809425354004, "global_step": 153544, "epoch": 3655} {"train_loss": -6.827123165130615, "global_step": 153545, "epoch": 3655} {"train_loss": -6.940361022949219, "global_step": 153546, "epoch": 3655} {"train_loss": -6.803510665893555, "global_step": 153547, "epoch": 3655} {"train_loss": -6.843360900878906, "global_step": 153548, "epoch": 3655} {"train_loss": -6.83795690536499, "global_step": 153549, "epoch": 3655} {"train_loss": -6.790156364440918, "global_step": 153550, "epoch": 3655} {"train_loss": -6.853854406447637, "global_step": 153551, "epoch": 3655, "val_loss": 79002.6953125} {"train_loss": -6.730011940002441, "global_step": 153552, "epoch": 3656} {"train_loss": -6.984928131103516, "global_step": 153553, "epoch": 3656} {"train_loss": -6.8811187744140625, "global_step": 153554, "epoch": 3656} {"train_loss": -6.815406322479248, "global_step": 153555, "epoch": 3656} {"train_loss": -6.867853164672852, "global_step": 153556, "epoch": 3656} {"train_loss": -6.909599304199219, "global_step": 153557, "epoch": 3656} {"train_loss": -6.873284339904785, "global_step": 153558, "epoch": 3656} {"train_loss": -6.941782474517822, "global_step": 153559, "epoch": 3656} {"train_loss": -6.8922858238220215, "global_step": 153560, "epoch": 3656} {"train_loss": -6.847106456756592, "global_step": 153561, "epoch": 3656} {"train_loss": -6.926884651184082, "global_step": 153562, "epoch": 3656} {"train_loss": -6.905259132385254, "global_step": 153563, "epoch": 3656} {"train_loss": -6.890793323516846, "global_step": 153564, "epoch": 3656} {"train_loss": -6.868043899536133, "global_step": 153565, "epoch": 3656} {"train_loss": -6.89096736907959, "global_step": 153566, "epoch": 3656} {"train_loss": -6.9442033767700195, "global_step": 153567, "epoch": 3656} {"train_loss": -7.008876323699951, "global_step": 153568, "epoch": 3656} {"train_loss": -6.86201286315918, "global_step": 153569, "epoch": 3656} {"train_loss": -6.954735279083252, "global_step": 153570, "epoch": 3656} {"train_loss": -6.846879959106445, "global_step": 153571, "epoch": 3656} {"train_loss": -6.883256912231445, "global_step": 153572, "epoch": 3656} {"train_loss": -6.934206008911133, "global_step": 153573, "epoch": 3656} {"train_loss": -6.8394341468811035, "global_step": 153574, "epoch": 3656} {"train_loss": -6.898077011108398, "global_step": 153575, "epoch": 3656} {"train_loss": -6.961803436279297, "global_step": 153576, "epoch": 3656} {"train_loss": -6.961427211761475, "global_step": 153577, "epoch": 3656} {"train_loss": -6.896334171295166, "global_step": 153578, "epoch": 3656} {"train_loss": -7.063478946685791, "global_step": 153579, "epoch": 3656} {"train_loss": -6.960110187530518, "global_step": 153580, "epoch": 3656} {"train_loss": -6.967347621917725, "global_step": 153581, "epoch": 3656} {"train_loss": -6.898750305175781, "global_step": 153582, "epoch": 3656} {"train_loss": -6.95759391784668, "global_step": 153583, "epoch": 3656} {"train_loss": -6.983658790588379, "global_step": 153584, "epoch": 3656} {"train_loss": -6.952867031097412, "global_step": 153585, "epoch": 3656} {"train_loss": -6.922420501708984, "global_step": 153586, "epoch": 3656} {"train_loss": -6.783074378967285, "global_step": 153587, "epoch": 3656} {"train_loss": -6.884812355041504, "global_step": 153588, "epoch": 3656} {"train_loss": -6.6717329025268555, "global_step": 153589, "epoch": 3656} {"train_loss": -6.929879188537598, "global_step": 153590, "epoch": 3656} {"train_loss": -6.868096351623535, "global_step": 153591, "epoch": 3656} {"train_loss": -6.839459419250488, "global_step": 153592, "epoch": 3656} {"train_loss": -6.8960597060975575, "global_step": 153593, "epoch": 3656, "val_loss": 79135.4765625} {"train_loss": -6.982598304748535, "global_step": 153594, "epoch": 3657} {"train_loss": -6.910512447357178, "global_step": 153595, "epoch": 3657} {"train_loss": -6.789133071899414, "global_step": 153596, "epoch": 3657} {"train_loss": -6.870685577392578, "global_step": 153597, "epoch": 3657} {"train_loss": -6.809686660766602, "global_step": 153598, "epoch": 3657} {"train_loss": -6.735821723937988, "global_step": 153599, "epoch": 3657} {"train_loss": -6.927422046661377, "global_step": 153600, "epoch": 3657} {"train_loss": -6.589995384216309, "global_step": 153601, "epoch": 3657} {"train_loss": -6.757992744445801, "global_step": 153602, "epoch": 3657} {"train_loss": -6.861029624938965, "global_step": 153603, "epoch": 3657} {"train_loss": -6.757359504699707, "global_step": 153604, "epoch": 3657} {"train_loss": -6.782007694244385, "global_step": 153605, "epoch": 3657} {"train_loss": -6.738784313201904, "global_step": 153606, "epoch": 3657} {"train_loss": -6.6404924392700195, "global_step": 153607, "epoch": 3657} {"train_loss": -6.728200435638428, "global_step": 153608, "epoch": 3657} {"train_loss": -6.748628616333008, "global_step": 153609, "epoch": 3657} {"train_loss": -6.744270324707031, "global_step": 153610, "epoch": 3657} {"train_loss": -6.856170177459717, "global_step": 153611, "epoch": 3657} {"train_loss": -6.8082499504089355, "global_step": 153612, "epoch": 3657} {"train_loss": -6.8979268074035645, "global_step": 153613, "epoch": 3657} {"train_loss": -6.7714738845825195, "global_step": 153614, "epoch": 3657} {"train_loss": -6.857526779174805, "global_step": 153615, "epoch": 3657} {"train_loss": -6.809144020080566, "global_step": 153616, "epoch": 3657} {"train_loss": -6.963818550109863, "global_step": 153617, "epoch": 3657} {"train_loss": -6.856797218322754, "global_step": 153618, "epoch": 3657} {"train_loss": -6.988382339477539, "global_step": 153619, "epoch": 3657} {"train_loss": -6.951808929443359, "global_step": 153620, "epoch": 3657} {"train_loss": -6.8975725173950195, "global_step": 153621, "epoch": 3657} {"train_loss": -6.937060356140137, "global_step": 153622, "epoch": 3657} {"train_loss": -6.988433837890625, "global_step": 153623, "epoch": 3657} {"train_loss": -6.9545979499816895, "global_step": 153624, "epoch": 3657} {"train_loss": -6.965087890625, "global_step": 153625, "epoch": 3657} {"train_loss": -6.962006568908691, "global_step": 153626, "epoch": 3657} {"train_loss": -6.828778266906738, "global_step": 153627, "epoch": 3657} {"train_loss": -6.893352508544922, "global_step": 153628, "epoch": 3657} {"train_loss": -7.0071120262146, "global_step": 153629, "epoch": 3657} {"train_loss": -6.8460187911987305, "global_step": 153630, "epoch": 3657} {"train_loss": -6.835904121398926, "global_step": 153631, "epoch": 3657} {"train_loss": -6.717907428741455, "global_step": 153632, "epoch": 3657} {"train_loss": -6.862833023071289, "global_step": 153633, "epoch": 3657} {"train_loss": -6.7884721755981445, "global_step": 153634, "epoch": 3657} {"train_loss": -6.845831848326183, "global_step": 153635, "epoch": 3657, "val_loss": 78854.6328125} {"train_loss": -6.809654712677002, "global_step": 153636, "epoch": 3658} {"train_loss": -6.829028129577637, "global_step": 153637, "epoch": 3658} {"train_loss": -6.831225872039795, "global_step": 153638, "epoch": 3658} {"train_loss": -6.865300178527832, "global_step": 153639, "epoch": 3658} {"train_loss": -6.786403656005859, "global_step": 153640, "epoch": 3658} {"train_loss": -6.8097124099731445, "global_step": 153641, "epoch": 3658} {"train_loss": -6.996182441711426, "global_step": 153642, "epoch": 3658} {"train_loss": -6.893153190612793, "global_step": 153643, "epoch": 3658} {"train_loss": -6.840208053588867, "global_step": 153644, "epoch": 3658} {"train_loss": -6.870508193969727, "global_step": 153645, "epoch": 3658} {"train_loss": -6.954130172729492, "global_step": 153646, "epoch": 3658} {"train_loss": -6.778185844421387, "global_step": 153647, "epoch": 3658} {"train_loss": -6.828470230102539, "global_step": 153648, "epoch": 3658} {"train_loss": -6.914412498474121, "global_step": 153649, "epoch": 3658} {"train_loss": -6.807687759399414, "global_step": 153650, "epoch": 3658} {"train_loss": -6.907380104064941, "global_step": 153651, "epoch": 3658} {"train_loss": -6.933766841888428, "global_step": 153652, "epoch": 3658} {"train_loss": -6.9111175537109375, "global_step": 153653, "epoch": 3658} {"train_loss": -6.855621337890625, "global_step": 153654, "epoch": 3658} {"train_loss": -6.927346229553223, "global_step": 153655, "epoch": 3658} {"train_loss": -6.9515509605407715, "global_step": 153656, "epoch": 3658} {"train_loss": -6.937341690063477, "global_step": 153657, "epoch": 3658} {"train_loss": -7.00811767578125, "global_step": 153658, "epoch": 3658} {"train_loss": -7.003103256225586, "global_step": 153659, "epoch": 3658} {"train_loss": -6.849247932434082, "global_step": 153660, "epoch": 3658} {"train_loss": -6.972506523132324, "global_step": 153661, "epoch": 3658} {"train_loss": -6.914364337921143, "global_step": 153662, "epoch": 3658} {"train_loss": -6.917482376098633, "global_step": 153663, "epoch": 3658} {"train_loss": -6.944950103759766, "global_step": 153664, "epoch": 3658} {"train_loss": -6.953197479248047, "global_step": 153665, "epoch": 3658} {"train_loss": -6.91953182220459, "global_step": 153666, "epoch": 3658} {"train_loss": -7.0231404304504395, "global_step": 153667, "epoch": 3658} {"train_loss": -6.971056938171387, "global_step": 153668, "epoch": 3658} {"train_loss": -6.954089164733887, "global_step": 153669, "epoch": 3658} {"train_loss": -6.984713554382324, "global_step": 153670, "epoch": 3658} {"train_loss": -6.905139923095703, "global_step": 153671, "epoch": 3658} {"train_loss": -6.8901262283325195, "global_step": 153672, "epoch": 3658} {"train_loss": -6.839359283447266, "global_step": 153673, "epoch": 3658} {"train_loss": -6.882848739624023, "global_step": 153674, "epoch": 3658} {"train_loss": -6.985264301300049, "global_step": 153675, "epoch": 3658} {"train_loss": -6.930887222290039, "global_step": 153676, "epoch": 3658} {"train_loss": -6.904135965165638, "global_step": 153677, "epoch": 3658, "val_loss": 78887.3515625} {"train_loss": -6.971662521362305, "global_step": 153678, "epoch": 3659} {"train_loss": -6.858587265014648, "global_step": 153679, "epoch": 3659} {"train_loss": -6.821199893951416, "global_step": 153680, "epoch": 3659} {"train_loss": -6.8615922927856445, "global_step": 153681, "epoch": 3659} {"train_loss": -6.851813316345215, "global_step": 153682, "epoch": 3659} {"train_loss": -6.818657875061035, "global_step": 153683, "epoch": 3659} {"train_loss": -6.852790832519531, "global_step": 153684, "epoch": 3659} {"train_loss": -6.940483093261719, "global_step": 153685, "epoch": 3659} {"train_loss": -6.883023262023926, "global_step": 153686, "epoch": 3659} {"train_loss": -7.001248836517334, "global_step": 153687, "epoch": 3659} {"train_loss": -6.914252281188965, "global_step": 153688, "epoch": 3659} {"train_loss": -6.952771186828613, "global_step": 153689, "epoch": 3659} {"train_loss": -6.935066223144531, "global_step": 153690, "epoch": 3659} {"train_loss": -6.955122470855713, "global_step": 153691, "epoch": 3659} {"train_loss": -6.997531414031982, "global_step": 153692, "epoch": 3659} {"train_loss": -6.958272933959961, "global_step": 153693, "epoch": 3659} {"train_loss": -6.991397380828857, "global_step": 153694, "epoch": 3659} {"train_loss": -6.976095199584961, "global_step": 153695, "epoch": 3659} {"train_loss": -6.936182022094727, "global_step": 153696, "epoch": 3659} {"train_loss": -6.979115009307861, "global_step": 153697, "epoch": 3659} {"train_loss": -6.955873966217041, "global_step": 153698, "epoch": 3659} {"train_loss": -6.97637939453125, "global_step": 153699, "epoch": 3659} {"train_loss": -6.779190540313721, "global_step": 153700, "epoch": 3659} {"train_loss": -6.793461799621582, "global_step": 153701, "epoch": 3659} {"train_loss": -6.869052410125732, "global_step": 153702, "epoch": 3659} {"train_loss": -6.991176128387451, "global_step": 153703, "epoch": 3659} {"train_loss": -6.658324241638184, "global_step": 153704, "epoch": 3659} {"train_loss": -7.027310371398926, "global_step": 153705, "epoch": 3659} {"train_loss": -6.714971542358398, "global_step": 153706, "epoch": 3659} {"train_loss": -6.801981449127197, "global_step": 153707, "epoch": 3659} {"train_loss": -6.899654865264893, "global_step": 153708, "epoch": 3659} {"train_loss": -6.938048362731934, "global_step": 153709, "epoch": 3659} {"train_loss": -6.8299407958984375, "global_step": 153710, "epoch": 3659} {"train_loss": -6.9042439460754395, "global_step": 153711, "epoch": 3659} {"train_loss": -6.803987979888916, "global_step": 153712, "epoch": 3659} {"train_loss": -6.912611961364746, "global_step": 153713, "epoch": 3659} {"train_loss": -6.943381309509277, "global_step": 153714, "epoch": 3659} {"train_loss": -6.715285301208496, "global_step": 153715, "epoch": 3659} {"train_loss": -6.771397590637207, "global_step": 153716, "epoch": 3659} {"train_loss": -6.7403740882873535, "global_step": 153717, "epoch": 3659} {"train_loss": -6.927931785583496, "global_step": 153718, "epoch": 3659} {"train_loss": -6.886269921348209, "global_step": 153719, "epoch": 3659, "val_loss": 79237.3515625} {"train_loss": -6.923411846160889, "global_step": 153720, "epoch": 3660} {"train_loss": -6.894979953765869, "global_step": 153721, "epoch": 3660} {"train_loss": -6.9016523361206055, "global_step": 153722, "epoch": 3660} {"train_loss": -6.883025169372559, "global_step": 153723, "epoch": 3660} {"train_loss": -6.992345809936523, "global_step": 153724, "epoch": 3660} {"train_loss": -6.906650543212891, "global_step": 153725, "epoch": 3660} {"train_loss": -6.950566291809082, "global_step": 153726, "epoch": 3660} {"train_loss": -6.892516613006592, "global_step": 153727, "epoch": 3660} {"train_loss": -6.985747337341309, "global_step": 153728, "epoch": 3660} {"train_loss": -6.872377872467041, "global_step": 153729, "epoch": 3660} {"train_loss": -6.931510925292969, "global_step": 153730, "epoch": 3660} {"train_loss": -6.910694122314453, "global_step": 153731, "epoch": 3660} {"train_loss": -6.891462326049805, "global_step": 153732, "epoch": 3660} {"train_loss": -6.977310657501221, "global_step": 153733, "epoch": 3660} {"train_loss": -6.858428001403809, "global_step": 153734, "epoch": 3660} {"train_loss": -6.946037292480469, "global_step": 153735, "epoch": 3660} {"train_loss": -6.944599628448486, "global_step": 153736, "epoch": 3660} {"train_loss": -6.799748420715332, "global_step": 153737, "epoch": 3660} {"train_loss": -6.927574157714844, "global_step": 153738, "epoch": 3660} {"train_loss": -6.894840240478516, "global_step": 153739, "epoch": 3660} {"train_loss": -6.901195526123047, "global_step": 153740, "epoch": 3660} {"train_loss": -6.825479030609131, "global_step": 153741, "epoch": 3660} {"train_loss": -6.892816543579102, "global_step": 153742, "epoch": 3660} {"train_loss": -6.9041948318481445, "global_step": 153743, "epoch": 3660} {"train_loss": -6.886267185211182, "global_step": 153744, "epoch": 3660} {"train_loss": -6.946303844451904, "global_step": 153745, "epoch": 3660} {"train_loss": -6.771545886993408, "global_step": 153746, "epoch": 3660} {"train_loss": -7.005911827087402, "global_step": 153747, "epoch": 3660} {"train_loss": -6.962881088256836, "global_step": 153748, "epoch": 3660} {"train_loss": -6.977300643920898, "global_step": 153749, "epoch": 3660} {"train_loss": -6.880541801452637, "global_step": 153750, "epoch": 3660} {"train_loss": -6.84425163269043, "global_step": 153751, "epoch": 3660} {"train_loss": -6.983184814453125, "global_step": 153752, "epoch": 3660} {"train_loss": -6.994089126586914, "global_step": 153753, "epoch": 3660} {"train_loss": -6.9774675369262695, "global_step": 153754, "epoch": 3660} {"train_loss": -6.872312545776367, "global_step": 153755, "epoch": 3660} {"train_loss": -6.908416748046875, "global_step": 153756, "epoch": 3660} {"train_loss": -6.933506011962891, "global_step": 153757, "epoch": 3660} {"train_loss": -6.948112487792969, "global_step": 153758, "epoch": 3660} {"train_loss": -6.896589756011963, "global_step": 153759, "epoch": 3660} {"train_loss": -6.972775936126709, "global_step": 153760, "epoch": 3660} {"train_loss": -6.917173192614601, "global_step": 153761, "epoch": 3660, "val_loss": 78883.3046875} {"train_loss": -7.043827533721924, "global_step": 153762, "epoch": 3661} {"train_loss": -7.0034332275390625, "global_step": 153763, "epoch": 3661} {"train_loss": -6.932009696960449, "global_step": 153764, "epoch": 3661} {"train_loss": -6.9128923416137695, "global_step": 153765, "epoch": 3661} {"train_loss": -7.0396728515625, "global_step": 153766, "epoch": 3661} {"train_loss": -6.7914958000183105, "global_step": 153767, "epoch": 3661} {"train_loss": -6.82947301864624, "global_step": 153768, "epoch": 3661} {"train_loss": -7.0251946449279785, "global_step": 153769, "epoch": 3661} {"train_loss": -6.965695381164551, "global_step": 153770, "epoch": 3661} {"train_loss": -6.9780778884887695, "global_step": 153771, "epoch": 3661} {"train_loss": -6.884268760681152, "global_step": 153772, "epoch": 3661} {"train_loss": -6.944683074951172, "global_step": 153773, "epoch": 3661} {"train_loss": -6.849300384521484, "global_step": 153774, "epoch": 3661} {"train_loss": -7.020010471343994, "global_step": 153775, "epoch": 3661} {"train_loss": -6.695673942565918, "global_step": 153776, "epoch": 3661} {"train_loss": -6.807656288146973, "global_step": 153777, "epoch": 3661} {"train_loss": -7.055948734283447, "global_step": 153778, "epoch": 3661} {"train_loss": -6.807110786437988, "global_step": 153779, "epoch": 3661} {"train_loss": -6.80982780456543, "global_step": 153780, "epoch": 3661} {"train_loss": -6.9063615798950195, "global_step": 153781, "epoch": 3661} {"train_loss": -6.697390079498291, "global_step": 153782, "epoch": 3661} {"train_loss": -6.875003814697266, "global_step": 153783, "epoch": 3661} {"train_loss": -6.813469409942627, "global_step": 153784, "epoch": 3661} {"train_loss": -6.876123428344727, "global_step": 153785, "epoch": 3661} {"train_loss": -6.794747352600098, "global_step": 153786, "epoch": 3661} {"train_loss": -6.889250755310059, "global_step": 153787, "epoch": 3661} {"train_loss": -6.730518341064453, "global_step": 153788, "epoch": 3661} {"train_loss": -6.859513282775879, "global_step": 153789, "epoch": 3661} {"train_loss": -6.84243106842041, "global_step": 153790, "epoch": 3661} {"train_loss": -6.8479461669921875, "global_step": 153791, "epoch": 3661} {"train_loss": -6.858648300170898, "global_step": 153792, "epoch": 3661} {"train_loss": -6.714700222015381, "global_step": 153793, "epoch": 3661} {"train_loss": -6.787724018096924, "global_step": 153794, "epoch": 3661} {"train_loss": -6.8169050216674805, "global_step": 153795, "epoch": 3661} {"train_loss": -6.755976676940918, "global_step": 153796, "epoch": 3661} {"train_loss": -6.889281749725342, "global_step": 153797, "epoch": 3661} {"train_loss": -6.842724800109863, "global_step": 153798, "epoch": 3661} {"train_loss": -6.834433555603027, "global_step": 153799, "epoch": 3661} {"train_loss": -6.776371002197266, "global_step": 153800, "epoch": 3661} {"train_loss": -6.833188533782959, "global_step": 153801, "epoch": 3661} {"train_loss": -6.95574426651001, "global_step": 153802, "epoch": 3661} {"train_loss": -6.867473227637155, "global_step": 153803, "epoch": 3661, "val_loss": 78880.4765625} {"train_loss": -6.855811595916748, "global_step": 153804, "epoch": 3662} {"train_loss": -6.883513450622559, "global_step": 153805, "epoch": 3662} {"train_loss": -6.919822692871094, "global_step": 153806, "epoch": 3662} {"train_loss": -6.753944396972656, "global_step": 153807, "epoch": 3662} {"train_loss": -6.907753944396973, "global_step": 153808, "epoch": 3662} {"train_loss": -6.887284755706787, "global_step": 153809, "epoch": 3662} {"train_loss": -6.866016387939453, "global_step": 153810, "epoch": 3662} {"train_loss": -6.845861434936523, "global_step": 153811, "epoch": 3662} {"train_loss": -6.930922985076904, "global_step": 153812, "epoch": 3662} {"train_loss": -6.807768821716309, "global_step": 153813, "epoch": 3662} {"train_loss": -6.834554672241211, "global_step": 153814, "epoch": 3662} {"train_loss": -6.874262809753418, "global_step": 153815, "epoch": 3662} {"train_loss": -6.896238327026367, "global_step": 153816, "epoch": 3662} {"train_loss": -6.736159324645996, "global_step": 153817, "epoch": 3662} {"train_loss": -7.010425090789795, "global_step": 153818, "epoch": 3662} {"train_loss": -6.890045642852783, "global_step": 153819, "epoch": 3662} {"train_loss": -6.920439720153809, "global_step": 153820, "epoch": 3662} {"train_loss": -6.911378860473633, "global_step": 153821, "epoch": 3662} {"train_loss": -6.892127990722656, "global_step": 153822, "epoch": 3662} {"train_loss": -6.844371318817139, "global_step": 153823, "epoch": 3662} {"train_loss": -6.872373580932617, "global_step": 153824, "epoch": 3662} {"train_loss": -6.964396953582764, "global_step": 153825, "epoch": 3662} {"train_loss": -6.911489009857178, "global_step": 153826, "epoch": 3662} {"train_loss": -6.962285995483398, "global_step": 153827, "epoch": 3662} {"train_loss": -6.856769561767578, "global_step": 153828, "epoch": 3662} {"train_loss": -6.887917518615723, "global_step": 153829, "epoch": 3662} {"train_loss": -6.886496543884277, "global_step": 153830, "epoch": 3662} {"train_loss": -6.9489641189575195, "global_step": 153831, "epoch": 3662} {"train_loss": -6.944687843322754, "global_step": 153832, "epoch": 3662} {"train_loss": -6.851956367492676, "global_step": 153833, "epoch": 3662} {"train_loss": -6.903640270233154, "global_step": 153834, "epoch": 3662} {"train_loss": -6.978425025939941, "global_step": 153835, "epoch": 3662} {"train_loss": -6.875916481018066, "global_step": 153836, "epoch": 3662} {"train_loss": -6.9111738204956055, "global_step": 153837, "epoch": 3662} {"train_loss": -6.927154541015625, "global_step": 153838, "epoch": 3662} {"train_loss": -6.889396667480469, "global_step": 153839, "epoch": 3662} {"train_loss": -6.931550979614258, "global_step": 153840, "epoch": 3662} {"train_loss": -6.863312244415283, "global_step": 153841, "epoch": 3662} {"train_loss": -6.841166019439697, "global_step": 153842, "epoch": 3662} {"train_loss": -6.939576625823975, "global_step": 153843, "epoch": 3662} {"train_loss": -6.946011543273926, "global_step": 153844, "epoch": 3662} {"train_loss": -6.889744917551677, "global_step": 153845, "epoch": 3662, "val_loss": 79138.078125} {"train_loss": -6.857725143432617, "global_step": 153846, "epoch": 3663} {"train_loss": -6.807890892028809, "global_step": 153847, "epoch": 3663} {"train_loss": -6.964932918548584, "global_step": 153848, "epoch": 3663} {"train_loss": -6.862273216247559, "global_step": 153849, "epoch": 3663} {"train_loss": -6.963602066040039, "global_step": 153850, "epoch": 3663} {"train_loss": -6.919715881347656, "global_step": 153851, "epoch": 3663} {"train_loss": -6.861516952514648, "global_step": 153852, "epoch": 3663} {"train_loss": -6.932910919189453, "global_step": 153853, "epoch": 3663} {"train_loss": -6.946779251098633, "global_step": 153854, "epoch": 3663} {"train_loss": -6.9371843338012695, "global_step": 153855, "epoch": 3663} {"train_loss": -6.8746843338012695, "global_step": 153856, "epoch": 3663} {"train_loss": -6.854503631591797, "global_step": 153857, "epoch": 3663} {"train_loss": -6.868041515350342, "global_step": 153858, "epoch": 3663} {"train_loss": -6.902688503265381, "global_step": 153859, "epoch": 3663} {"train_loss": -7.020435810089111, "global_step": 153860, "epoch": 3663} {"train_loss": -6.937472343444824, "global_step": 153861, "epoch": 3663} {"train_loss": -6.9667253494262695, "global_step": 153862, "epoch": 3663} {"train_loss": -6.797798156738281, "global_step": 153863, "epoch": 3663} {"train_loss": -6.916919708251953, "global_step": 153864, "epoch": 3663} {"train_loss": -6.833661079406738, "global_step": 153865, "epoch": 3663} {"train_loss": -6.873391151428223, "global_step": 153866, "epoch": 3663} {"train_loss": -6.886773109436035, "global_step": 153867, "epoch": 3663} {"train_loss": -6.984813690185547, "global_step": 153868, "epoch": 3663} {"train_loss": -6.989840507507324, "global_step": 153869, "epoch": 3663} {"train_loss": -6.904902458190918, "global_step": 153870, "epoch": 3663} {"train_loss": -6.992583274841309, "global_step": 153871, "epoch": 3663} {"train_loss": -6.864005088806152, "global_step": 153872, "epoch": 3663} {"train_loss": -6.873344421386719, "global_step": 153873, "epoch": 3663} {"train_loss": -6.8298797607421875, "global_step": 153874, "epoch": 3663} {"train_loss": -6.896892547607422, "global_step": 153875, "epoch": 3663} {"train_loss": -6.9037065505981445, "global_step": 153876, "epoch": 3663} {"train_loss": -6.967334747314453, "global_step": 153877, "epoch": 3663} {"train_loss": -6.822841167449951, "global_step": 153878, "epoch": 3663} {"train_loss": -6.9718475341796875, "global_step": 153879, "epoch": 3663} {"train_loss": -6.9029717445373535, "global_step": 153880, "epoch": 3663} {"train_loss": -6.999392509460449, "global_step": 153881, "epoch": 3663} {"train_loss": -6.865367412567139, "global_step": 153882, "epoch": 3663} {"train_loss": -6.891422271728516, "global_step": 153883, "epoch": 3663} {"train_loss": -6.991456031799316, "global_step": 153884, "epoch": 3663} {"train_loss": -6.831194877624512, "global_step": 153885, "epoch": 3663} {"train_loss": -6.848766326904297, "global_step": 153886, "epoch": 3663} {"train_loss": -6.903841609046573, "global_step": 153887, "epoch": 3663, "val_loss": 78870.4453125} {"train_loss": -6.953709602355957, "global_step": 153888, "epoch": 3664} {"train_loss": -6.9365997314453125, "global_step": 153889, "epoch": 3664} {"train_loss": -6.9758148193359375, "global_step": 153890, "epoch": 3664} {"train_loss": -6.925519943237305, "global_step": 153891, "epoch": 3664} {"train_loss": -6.907011032104492, "global_step": 153892, "epoch": 3664} {"train_loss": -6.989443302154541, "global_step": 153893, "epoch": 3664} {"train_loss": -6.841096878051758, "global_step": 153894, "epoch": 3664} {"train_loss": -6.950377464294434, "global_step": 153895, "epoch": 3664} {"train_loss": -6.962275505065918, "global_step": 153896, "epoch": 3664} {"train_loss": -6.981609344482422, "global_step": 153897, "epoch": 3664} {"train_loss": -6.858161449432373, "global_step": 153898, "epoch": 3664} {"train_loss": -6.9084038734436035, "global_step": 153899, "epoch": 3664} {"train_loss": -6.970837116241455, "global_step": 153900, "epoch": 3664} {"train_loss": -6.921080112457275, "global_step": 153901, "epoch": 3664} {"train_loss": -6.704540252685547, "global_step": 153902, "epoch": 3664} {"train_loss": -6.847817420959473, "global_step": 153903, "epoch": 3664} {"train_loss": -6.9414286613464355, "global_step": 153904, "epoch": 3664} {"train_loss": -6.978065490722656, "global_step": 153905, "epoch": 3664} {"train_loss": -6.768568992614746, "global_step": 153906, "epoch": 3664} {"train_loss": -7.002746105194092, "global_step": 153907, "epoch": 3664} {"train_loss": -6.794515609741211, "global_step": 153908, "epoch": 3664} {"train_loss": -6.8925700187683105, "global_step": 153909, "epoch": 3664} {"train_loss": -6.767725944519043, "global_step": 153910, "epoch": 3664} {"train_loss": -6.981487274169922, "global_step": 153911, "epoch": 3664} {"train_loss": -6.641534805297852, "global_step": 153912, "epoch": 3664} {"train_loss": -6.851517677307129, "global_step": 153913, "epoch": 3664} {"train_loss": -6.706416130065918, "global_step": 153914, "epoch": 3664} {"train_loss": -6.829343795776367, "global_step": 153915, "epoch": 3664} {"train_loss": -6.756406784057617, "global_step": 153916, "epoch": 3664} {"train_loss": -6.755391597747803, "global_step": 153917, "epoch": 3664} {"train_loss": -6.704105377197266, "global_step": 153918, "epoch": 3664} {"train_loss": -6.784191608428955, "global_step": 153919, "epoch": 3664} {"train_loss": -6.654036045074463, "global_step": 153920, "epoch": 3664} {"train_loss": -6.855931758880615, "global_step": 153921, "epoch": 3664} {"train_loss": -6.750967979431152, "global_step": 153922, "epoch": 3664} {"train_loss": -6.877340316772461, "global_step": 153923, "epoch": 3664} {"train_loss": -6.713798999786377, "global_step": 153924, "epoch": 3664} {"train_loss": -6.758803367614746, "global_step": 153925, "epoch": 3664} {"train_loss": -6.6568732261657715, "global_step": 153926, "epoch": 3664} {"train_loss": -6.857784271240234, "global_step": 153927, "epoch": 3664} {"train_loss": -6.777920722961426, "global_step": 153928, "epoch": 3664} {"train_loss": -6.8453269345419745, "global_step": 153929, "epoch": 3664, "val_loss": 78809.3359375} {"train_loss": -6.795775890350342, "global_step": 153930, "epoch": 3665} {"train_loss": -6.880519866943359, "global_step": 153931, "epoch": 3665} {"train_loss": -6.892421722412109, "global_step": 153932, "epoch": 3665} {"train_loss": -6.6744384765625, "global_step": 153933, "epoch": 3665} {"train_loss": -6.827291488647461, "global_step": 153934, "epoch": 3665} {"train_loss": -6.750848293304443, "global_step": 153935, "epoch": 3665} {"train_loss": -6.918642044067383, "global_step": 153936, "epoch": 3665} {"train_loss": -6.898241996765137, "global_step": 153937, "epoch": 3665} {"train_loss": -6.696290493011475, "global_step": 153938, "epoch": 3665} {"train_loss": -6.872982025146484, "global_step": 153939, "epoch": 3665} {"train_loss": -7.03352165222168, "global_step": 153940, "epoch": 3665} {"train_loss": -6.854245185852051, "global_step": 153941, "epoch": 3665} {"train_loss": -6.956545829772949, "global_step": 153942, "epoch": 3665} {"train_loss": -6.909843444824219, "global_step": 153943, "epoch": 3665} {"train_loss": -6.865633010864258, "global_step": 153944, "epoch": 3665} {"train_loss": -6.764297008514404, "global_step": 153945, "epoch": 3665} {"train_loss": -6.871271133422852, "global_step": 153946, "epoch": 3665} {"train_loss": -6.899514675140381, "global_step": 153947, "epoch": 3665} {"train_loss": -6.862398624420166, "global_step": 153948, "epoch": 3665} {"train_loss": -6.955084800720215, "global_step": 153949, "epoch": 3665} {"train_loss": -7.055622577667236, "global_step": 153950, "epoch": 3665} {"train_loss": -6.84412956237793, "global_step": 153951, "epoch": 3665} {"train_loss": -6.890574932098389, "global_step": 153952, "epoch": 3665} {"train_loss": -6.916959285736084, "global_step": 153953, "epoch": 3665} {"train_loss": -7.05067253112793, "global_step": 153954, "epoch": 3665} {"train_loss": -6.9321465492248535, "global_step": 153955, "epoch": 3665} {"train_loss": -7.032279968261719, "global_step": 153956, "epoch": 3665} {"train_loss": -6.969402313232422, "global_step": 153957, "epoch": 3665} {"train_loss": -6.917569637298584, "global_step": 153958, "epoch": 3665} {"train_loss": -7.037257194519043, "global_step": 153959, "epoch": 3665} {"train_loss": -6.912254333496094, "global_step": 153960, "epoch": 3665} {"train_loss": -7.066617965698242, "global_step": 153961, "epoch": 3665} {"train_loss": -6.832634925842285, "global_step": 153962, "epoch": 3665} {"train_loss": -6.97715425491333, "global_step": 153963, "epoch": 3665} {"train_loss": -6.868073463439941, "global_step": 153964, "epoch": 3665} {"train_loss": -6.855490684509277, "global_step": 153965, "epoch": 3665} {"train_loss": -6.722312927246094, "global_step": 153966, "epoch": 3665} {"train_loss": -6.858914852142334, "global_step": 153967, "epoch": 3665} {"train_loss": -6.911091327667236, "global_step": 153968, "epoch": 3665} {"train_loss": -6.801248550415039, "global_step": 153969, "epoch": 3665} {"train_loss": -6.828487396240234, "global_step": 153970, "epoch": 3665} {"train_loss": -6.889047406968617, "global_step": 153971, "epoch": 3665, "val_loss": 78830.640625} {"train_loss": -6.897374153137207, "global_step": 153972, "epoch": 3666} {"train_loss": -6.893122673034668, "global_step": 153973, "epoch": 3666} {"train_loss": -6.8808441162109375, "global_step": 153974, "epoch": 3666} {"train_loss": -6.925661087036133, "global_step": 153975, "epoch": 3666} {"train_loss": -6.954113006591797, "global_step": 153976, "epoch": 3666} {"train_loss": -6.991327285766602, "global_step": 153977, "epoch": 3666} {"train_loss": -6.969985485076904, "global_step": 153978, "epoch": 3666} {"train_loss": -6.939520359039307, "global_step": 153979, "epoch": 3666} {"train_loss": -7.012331485748291, "global_step": 153980, "epoch": 3666} {"train_loss": -6.834537029266357, "global_step": 153981, "epoch": 3666} {"train_loss": -6.885677814483643, "global_step": 153982, "epoch": 3666} {"train_loss": -6.912090301513672, "global_step": 153983, "epoch": 3666} {"train_loss": -7.012897491455078, "global_step": 153984, "epoch": 3666} {"train_loss": -7.014509201049805, "global_step": 153985, "epoch": 3666} {"train_loss": -6.936556816101074, "global_step": 153986, "epoch": 3666} {"train_loss": -7.101146697998047, "global_step": 153987, "epoch": 3666} {"train_loss": -6.8012003898620605, "global_step": 153988, "epoch": 3666} {"train_loss": -6.983050346374512, "global_step": 153989, "epoch": 3666} {"train_loss": -6.903171062469482, "global_step": 153990, "epoch": 3666} {"train_loss": -7.030471324920654, "global_step": 153991, "epoch": 3666} {"train_loss": -6.874861717224121, "global_step": 153992, "epoch": 3666} {"train_loss": -6.949863910675049, "global_step": 153993, "epoch": 3666} {"train_loss": -6.932030200958252, "global_step": 153994, "epoch": 3666} {"train_loss": -6.921076774597168, "global_step": 153995, "epoch": 3666} {"train_loss": -6.863696098327637, "global_step": 153996, "epoch": 3666} {"train_loss": -7.024900436401367, "global_step": 153997, "epoch": 3666} {"train_loss": -6.919561386108398, "global_step": 153998, "epoch": 3666} {"train_loss": -6.985189437866211, "global_step": 153999, "epoch": 3666} {"train_loss": -6.935663223266602, "global_step": 154000, "epoch": 3666} {"train_loss": -6.964045524597168, "global_step": 154001, "epoch": 3666} {"train_loss": -6.898386001586914, "global_step": 154002, "epoch": 3666} {"train_loss": -6.771263599395752, "global_step": 154003, "epoch": 3666} {"train_loss": -6.924589157104492, "global_step": 154004, "epoch": 3666} {"train_loss": -6.983183860778809, "global_step": 154005, "epoch": 3666} {"train_loss": -6.9127960205078125, "global_step": 154006, "epoch": 3666} {"train_loss": -6.888425350189209, "global_step": 154007, "epoch": 3666} {"train_loss": -6.930768966674805, "global_step": 154008, "epoch": 3666} {"train_loss": -6.906993865966797, "global_step": 154009, "epoch": 3666} {"train_loss": -6.987256050109863, "global_step": 154010, "epoch": 3666} {"train_loss": -6.873037338256836, "global_step": 154011, "epoch": 3666} {"train_loss": -6.569473743438721, "global_step": 154012, "epoch": 3666} {"train_loss": -6.92191431635902, "global_step": 154013, "epoch": 3666, "val_loss": 79268.875} {"train_loss": -6.851545333862305, "global_step": 154014, "epoch": 3667} {"train_loss": -6.70603084564209, "global_step": 154015, "epoch": 3667} {"train_loss": -6.832184314727783, "global_step": 154016, "epoch": 3667} {"train_loss": -6.84920597076416, "global_step": 154017, "epoch": 3667} {"train_loss": -6.73729944229126, "global_step": 154018, "epoch": 3667} {"train_loss": -6.856922626495361, "global_step": 154019, "epoch": 3667} {"train_loss": -6.880618095397949, "global_step": 154020, "epoch": 3667} {"train_loss": -6.770692825317383, "global_step": 154021, "epoch": 3667} {"train_loss": -6.8865132331848145, "global_step": 154022, "epoch": 3667} {"train_loss": -6.946609020233154, "global_step": 154023, "epoch": 3667} {"train_loss": -6.780424118041992, "global_step": 154024, "epoch": 3667} {"train_loss": -6.889307022094727, "global_step": 154025, "epoch": 3667} {"train_loss": -6.647991180419922, "global_step": 154026, "epoch": 3667} {"train_loss": -6.949047565460205, "global_step": 154027, "epoch": 3667} {"train_loss": -6.773739814758301, "global_step": 154028, "epoch": 3667} {"train_loss": -6.919924259185791, "global_step": 154029, "epoch": 3667} {"train_loss": -6.846388816833496, "global_step": 154030, "epoch": 3667} {"train_loss": -6.785857200622559, "global_step": 154031, "epoch": 3667} {"train_loss": -6.848552703857422, "global_step": 154032, "epoch": 3667} {"train_loss": -6.716828346252441, "global_step": 154033, "epoch": 3667} {"train_loss": -6.838674545288086, "global_step": 154034, "epoch": 3667} {"train_loss": -6.855708122253418, "global_step": 154035, "epoch": 3667} {"train_loss": -7.028667449951172, "global_step": 154036, "epoch": 3667} {"train_loss": -6.840455055236816, "global_step": 154037, "epoch": 3667} {"train_loss": -6.860182762145996, "global_step": 154038, "epoch": 3667} {"train_loss": -6.931586265563965, "global_step": 154039, "epoch": 3667} {"train_loss": -6.863999843597412, "global_step": 154040, "epoch": 3667} {"train_loss": -7.019455909729004, "global_step": 154041, "epoch": 3667} {"train_loss": -6.872123718261719, "global_step": 154042, "epoch": 3667} {"train_loss": -6.931962490081787, "global_step": 154043, "epoch": 3667} {"train_loss": -6.942084312438965, "global_step": 154044, "epoch": 3667} {"train_loss": -6.944943428039551, "global_step": 154045, "epoch": 3667} {"train_loss": -6.924801826477051, "global_step": 154046, "epoch": 3667} {"train_loss": -6.963104724884033, "global_step": 154047, "epoch": 3667} {"train_loss": -6.864292621612549, "global_step": 154048, "epoch": 3667} {"train_loss": -7.009037971496582, "global_step": 154049, "epoch": 3667} {"train_loss": -6.977241039276123, "global_step": 154050, "epoch": 3667} {"train_loss": -6.909299373626709, "global_step": 154051, "epoch": 3667} {"train_loss": -6.86480712890625, "global_step": 154052, "epoch": 3667} {"train_loss": -6.801468372344971, "global_step": 154053, "epoch": 3667} {"train_loss": -6.8995256423950195, "global_step": 154054, "epoch": 3667} {"train_loss": -6.870017744245983, "global_step": 154055, "epoch": 3667, "val_loss": 78940.7578125} {"train_loss": -6.969820022583008, "global_step": 154056, "epoch": 3668} {"train_loss": -6.898560523986816, "global_step": 154057, "epoch": 3668} {"train_loss": -6.878601551055908, "global_step": 154058, "epoch": 3668} {"train_loss": -6.803564071655273, "global_step": 154059, "epoch": 3668} {"train_loss": -6.9703216552734375, "global_step": 154060, "epoch": 3668} {"train_loss": -6.954183578491211, "global_step": 154061, "epoch": 3668} {"train_loss": -6.885834693908691, "global_step": 154062, "epoch": 3668} {"train_loss": -6.888962745666504, "global_step": 154063, "epoch": 3668} {"train_loss": -6.855125427246094, "global_step": 154064, "epoch": 3668} {"train_loss": -6.8590803146362305, "global_step": 154065, "epoch": 3668} {"train_loss": -6.810308456420898, "global_step": 154066, "epoch": 3668} {"train_loss": -6.898443222045898, "global_step": 154067, "epoch": 3668} {"train_loss": -6.9311017990112305, "global_step": 154068, "epoch": 3668} {"train_loss": -6.930344104766846, "global_step": 154069, "epoch": 3668} {"train_loss": -6.940694808959961, "global_step": 154070, "epoch": 3668} {"train_loss": -6.983692646026611, "global_step": 154071, "epoch": 3668} {"train_loss": -6.899325370788574, "global_step": 154072, "epoch": 3668} {"train_loss": -6.859110355377197, "global_step": 154073, "epoch": 3668} {"train_loss": -6.870744705200195, "global_step": 154074, "epoch": 3668} {"train_loss": -6.973690032958984, "global_step": 154075, "epoch": 3668} {"train_loss": -6.8674774169921875, "global_step": 154076, "epoch": 3668} {"train_loss": -6.903648853302002, "global_step": 154077, "epoch": 3668} {"train_loss": -6.823520660400391, "global_step": 154078, "epoch": 3668} {"train_loss": -6.829362392425537, "global_step": 154079, "epoch": 3668} {"train_loss": -6.9067182540893555, "global_step": 154080, "epoch": 3668} {"train_loss": -6.838311195373535, "global_step": 154081, "epoch": 3668} {"train_loss": -6.801177978515625, "global_step": 154082, "epoch": 3668} {"train_loss": -6.901474952697754, "global_step": 154083, "epoch": 3668} {"train_loss": -6.740694999694824, "global_step": 154084, "epoch": 3668} {"train_loss": -6.915033340454102, "global_step": 154085, "epoch": 3668} {"train_loss": -6.734189033508301, "global_step": 154086, "epoch": 3668} {"train_loss": -6.951426982879639, "global_step": 154087, "epoch": 3668} {"train_loss": -6.891185283660889, "global_step": 154088, "epoch": 3668} {"train_loss": -6.861560344696045, "global_step": 154089, "epoch": 3668} {"train_loss": -6.839365005493164, "global_step": 154090, "epoch": 3668} {"train_loss": -6.869394302368164, "global_step": 154091, "epoch": 3668} {"train_loss": -6.846923828125, "global_step": 154092, "epoch": 3668} {"train_loss": -6.816434860229492, "global_step": 154093, "epoch": 3668} {"train_loss": -6.852142810821533, "global_step": 154094, "epoch": 3668} {"train_loss": -6.885027885437012, "global_step": 154095, "epoch": 3668} {"train_loss": -6.848845481872559, "global_step": 154096, "epoch": 3668} {"train_loss": -6.879758255822318, "global_step": 154097, "epoch": 3668, "val_loss": 78889.9140625} {"train_loss": -6.864206790924072, "global_step": 154098, "epoch": 3669} {"train_loss": -6.848265171051025, "global_step": 154099, "epoch": 3669} {"train_loss": -6.851944923400879, "global_step": 154100, "epoch": 3669} {"train_loss": -6.899142265319824, "global_step": 154101, "epoch": 3669} {"train_loss": -6.891050815582275, "global_step": 154102, "epoch": 3669} {"train_loss": -6.911696434020996, "global_step": 154103, "epoch": 3669} {"train_loss": -6.983842372894287, "global_step": 154104, "epoch": 3669} {"train_loss": -6.8521013259887695, "global_step": 154105, "epoch": 3669} {"train_loss": -6.839861869812012, "global_step": 154106, "epoch": 3669} {"train_loss": -6.885599136352539, "global_step": 154107, "epoch": 3669} {"train_loss": -6.801702976226807, "global_step": 154108, "epoch": 3669} {"train_loss": -6.859848499298096, "global_step": 154109, "epoch": 3669} {"train_loss": -6.9146728515625, "global_step": 154110, "epoch": 3669} {"train_loss": -6.9052205085754395, "global_step": 154111, "epoch": 3669} {"train_loss": -6.843557357788086, "global_step": 154112, "epoch": 3669} {"train_loss": -6.8101396560668945, "global_step": 154113, "epoch": 3669} {"train_loss": -6.810750961303711, "global_step": 154114, "epoch": 3669} {"train_loss": -6.891691207885742, "global_step": 154115, "epoch": 3669} {"train_loss": -6.870904922485352, "global_step": 154116, "epoch": 3669} {"train_loss": -6.782136917114258, "global_step": 154117, "epoch": 3669} {"train_loss": -7.016322612762451, "global_step": 154118, "epoch": 3669} {"train_loss": -6.84880256652832, "global_step": 154119, "epoch": 3669} {"train_loss": -6.922053337097168, "global_step": 154120, "epoch": 3669} {"train_loss": -6.827826499938965, "global_step": 154121, "epoch": 3669} {"train_loss": -6.934296131134033, "global_step": 154122, "epoch": 3669} {"train_loss": -6.8095784187316895, "global_step": 154123, "epoch": 3669} {"train_loss": -6.827119827270508, "global_step": 154124, "epoch": 3669} {"train_loss": -6.757021903991699, "global_step": 154125, "epoch": 3669} {"train_loss": -6.7251129150390625, "global_step": 154126, "epoch": 3669} {"train_loss": -6.812103271484375, "global_step": 154127, "epoch": 3669} {"train_loss": -6.602290630340576, "global_step": 154128, "epoch": 3669} {"train_loss": -6.913150787353516, "global_step": 154129, "epoch": 3669} {"train_loss": -6.670896530151367, "global_step": 154130, "epoch": 3669} {"train_loss": -6.777981758117676, "global_step": 154131, "epoch": 3669} {"train_loss": -6.856929302215576, "global_step": 154132, "epoch": 3669} {"train_loss": -6.620731830596924, "global_step": 154133, "epoch": 3669} {"train_loss": -6.868254661560059, "global_step": 154134, "epoch": 3669} {"train_loss": -6.758244514465332, "global_step": 154135, "epoch": 3669} {"train_loss": -6.7782135009765625, "global_step": 154136, "epoch": 3669} {"train_loss": -6.684376239776611, "global_step": 154137, "epoch": 3669} {"train_loss": -6.8382978439331055, "global_step": 154138, "epoch": 3669} {"train_loss": -6.831888550803775, "global_step": 154139, "epoch": 3669, "val_loss": 78922.6875} {"train_loss": -6.716599941253662, "global_step": 154140, "epoch": 3670} {"train_loss": -6.665482521057129, "global_step": 154141, "epoch": 3670} {"train_loss": -6.881941795349121, "global_step": 154142, "epoch": 3670} {"train_loss": -6.858546733856201, "global_step": 154143, "epoch": 3670} {"train_loss": -6.915972709655762, "global_step": 154144, "epoch": 3670} {"train_loss": -6.829216957092285, "global_step": 154145, "epoch": 3670} {"train_loss": -6.854855537414551, "global_step": 154146, "epoch": 3670} {"train_loss": -6.938767910003662, "global_step": 154147, "epoch": 3670} {"train_loss": -6.965306758880615, "global_step": 154148, "epoch": 3670} {"train_loss": -6.917940139770508, "global_step": 154149, "epoch": 3670} {"train_loss": -6.956133842468262, "global_step": 154150, "epoch": 3670} {"train_loss": -6.8884735107421875, "global_step": 154151, "epoch": 3670} {"train_loss": -6.910427570343018, "global_step": 154152, "epoch": 3670} {"train_loss": -6.9553937911987305, "global_step": 154153, "epoch": 3670} {"train_loss": -6.896157741546631, "global_step": 154154, "epoch": 3670} {"train_loss": -7.032179355621338, "global_step": 154155, "epoch": 3670} {"train_loss": -6.883079528808594, "global_step": 154156, "epoch": 3670} {"train_loss": -6.7957963943481445, "global_step": 154157, "epoch": 3670} {"train_loss": -6.680024147033691, "global_step": 154158, "epoch": 3670} {"train_loss": -6.919395446777344, "global_step": 154159, "epoch": 3670} {"train_loss": -6.713774681091309, "global_step": 154160, "epoch": 3670} {"train_loss": -6.617088317871094, "global_step": 154161, "epoch": 3670} {"train_loss": -6.84386682510376, "global_step": 154162, "epoch": 3670} {"train_loss": -6.466099739074707, "global_step": 154163, "epoch": 3670} {"train_loss": -6.732338905334473, "global_step": 154164, "epoch": 3670} {"train_loss": -6.710873603820801, "global_step": 154165, "epoch": 3670} {"train_loss": -6.618685722351074, "global_step": 154166, "epoch": 3670} {"train_loss": -6.800851345062256, "global_step": 154167, "epoch": 3670} {"train_loss": -6.632444381713867, "global_step": 154168, "epoch": 3670} {"train_loss": -6.730681419372559, "global_step": 154169, "epoch": 3670} {"train_loss": -6.754380226135254, "global_step": 154170, "epoch": 3670} {"train_loss": -6.639738082885742, "global_step": 154171, "epoch": 3670} {"train_loss": -6.776833534240723, "global_step": 154172, "epoch": 3670} {"train_loss": -6.737285614013672, "global_step": 154173, "epoch": 3670} {"train_loss": -6.88622522354126, "global_step": 154174, "epoch": 3670} {"train_loss": -6.771899223327637, "global_step": 154175, "epoch": 3670} {"train_loss": -6.703322887420654, "global_step": 154176, "epoch": 3670} {"train_loss": -6.714029312133789, "global_step": 154177, "epoch": 3670} {"train_loss": -6.755260467529297, "global_step": 154178, "epoch": 3670} {"train_loss": -6.68712854385376, "global_step": 154179, "epoch": 3670} {"train_loss": -6.844276428222656, "global_step": 154180, "epoch": 3670} {"train_loss": -6.796571856453305, "global_step": 154181, "epoch": 3670, "val_loss": 78860.2109375} {"train_loss": -6.71304178237915, "global_step": 154182, "epoch": 3671} {"train_loss": -6.920088291168213, "global_step": 154183, "epoch": 3671} {"train_loss": -6.81821346282959, "global_step": 154184, "epoch": 3671} {"train_loss": -6.92631196975708, "global_step": 154185, "epoch": 3671} {"train_loss": -6.8861260414123535, "global_step": 154186, "epoch": 3671} {"train_loss": -6.889822006225586, "global_step": 154187, "epoch": 3671} {"train_loss": -6.771017074584961, "global_step": 154188, "epoch": 3671} {"train_loss": -6.845736503601074, "global_step": 154189, "epoch": 3671} {"train_loss": -6.808588027954102, "global_step": 154190, "epoch": 3671} {"train_loss": -6.883289337158203, "global_step": 154191, "epoch": 3671} {"train_loss": -6.9776153564453125, "global_step": 154192, "epoch": 3671} {"train_loss": -6.743168354034424, "global_step": 154193, "epoch": 3671} {"train_loss": -7.032114505767822, "global_step": 154194, "epoch": 3671} {"train_loss": -6.906933784484863, "global_step": 154195, "epoch": 3671} {"train_loss": -6.925217628479004, "global_step": 154196, "epoch": 3671} {"train_loss": -7.006885528564453, "global_step": 154197, "epoch": 3671} {"train_loss": -6.9728217124938965, "global_step": 154198, "epoch": 3671} {"train_loss": -6.820840835571289, "global_step": 154199, "epoch": 3671} {"train_loss": -6.785601615905762, "global_step": 154200, "epoch": 3671} {"train_loss": -6.922867774963379, "global_step": 154201, "epoch": 3671} {"train_loss": -6.845429420471191, "global_step": 154202, "epoch": 3671} {"train_loss": -6.737382888793945, "global_step": 154203, "epoch": 3671} {"train_loss": -6.970279216766357, "global_step": 154204, "epoch": 3671} {"train_loss": -6.90255069732666, "global_step": 154205, "epoch": 3671} {"train_loss": -6.9338250160217285, "global_step": 154206, "epoch": 3671} {"train_loss": -6.86659574508667, "global_step": 154207, "epoch": 3671} {"train_loss": -6.81452751159668, "global_step": 154208, "epoch": 3671} {"train_loss": -6.948968887329102, "global_step": 154209, "epoch": 3671} {"train_loss": -6.957571029663086, "global_step": 154210, "epoch": 3671} {"train_loss": -6.7923479080200195, "global_step": 154211, "epoch": 3671} {"train_loss": -6.899998188018799, "global_step": 154212, "epoch": 3671} {"train_loss": -6.88092565536499, "global_step": 154213, "epoch": 3671} {"train_loss": -6.917956352233887, "global_step": 154214, "epoch": 3671} {"train_loss": -6.805184364318848, "global_step": 154215, "epoch": 3671} {"train_loss": -6.970781326293945, "global_step": 154216, "epoch": 3671} {"train_loss": -6.900774002075195, "global_step": 154217, "epoch": 3671} {"train_loss": -6.807400703430176, "global_step": 154218, "epoch": 3671} {"train_loss": -6.917802810668945, "global_step": 154219, "epoch": 3671} {"train_loss": -6.808521270751953, "global_step": 154220, "epoch": 3671} {"train_loss": -6.922250747680664, "global_step": 154221, "epoch": 3671} {"train_loss": -6.981568336486816, "global_step": 154222, "epoch": 3671} {"train_loss": -6.878654128029233, "global_step": 154223, "epoch": 3671, "val_loss": 79115.484375} {"train_loss": -7.044955730438232, "global_step": 154224, "epoch": 3672} {"train_loss": -7.032282829284668, "global_step": 154225, "epoch": 3672} {"train_loss": -6.947620391845703, "global_step": 154226, "epoch": 3672} {"train_loss": -6.888317108154297, "global_step": 154227, "epoch": 3672} {"train_loss": -6.872190952301025, "global_step": 154228, "epoch": 3672} {"train_loss": -7.017465114593506, "global_step": 154229, "epoch": 3672} {"train_loss": -6.918977737426758, "global_step": 154230, "epoch": 3672} {"train_loss": -6.9566450119018555, "global_step": 154231, "epoch": 3672} {"train_loss": -6.898608207702637, "global_step": 154232, "epoch": 3672} {"train_loss": -6.860528945922852, "global_step": 154233, "epoch": 3672} {"train_loss": -6.873145580291748, "global_step": 154234, "epoch": 3672} {"train_loss": -6.880475997924805, "global_step": 154235, "epoch": 3672} {"train_loss": -7.005426406860352, "global_step": 154236, "epoch": 3672} {"train_loss": -6.828547477722168, "global_step": 154237, "epoch": 3672} {"train_loss": -6.9552507400512695, "global_step": 154238, "epoch": 3672} {"train_loss": -6.892429351806641, "global_step": 154239, "epoch": 3672} {"train_loss": -6.9337053298950195, "global_step": 154240, "epoch": 3672} {"train_loss": -6.968036651611328, "global_step": 154241, "epoch": 3672} {"train_loss": -6.949896812438965, "global_step": 154242, "epoch": 3672} {"train_loss": -6.923890113830566, "global_step": 154243, "epoch": 3672} {"train_loss": -6.870973110198975, "global_step": 154244, "epoch": 3672} {"train_loss": -6.9585113525390625, "global_step": 154245, "epoch": 3672} {"train_loss": -6.9153242111206055, "global_step": 154246, "epoch": 3672} {"train_loss": -6.924700736999512, "global_step": 154247, "epoch": 3672} {"train_loss": -7.014650344848633, "global_step": 154248, "epoch": 3672} {"train_loss": -6.991049766540527, "global_step": 154249, "epoch": 3672} {"train_loss": -6.991086959838867, "global_step": 154250, "epoch": 3672} {"train_loss": -6.871010780334473, "global_step": 154251, "epoch": 3672} {"train_loss": -6.928885459899902, "global_step": 154252, "epoch": 3672} {"train_loss": -6.854916572570801, "global_step": 154253, "epoch": 3672} {"train_loss": -6.960198402404785, "global_step": 154254, "epoch": 3672} {"train_loss": -6.909538269042969, "global_step": 154255, "epoch": 3672} {"train_loss": -6.975277900695801, "global_step": 154256, "epoch": 3672} {"train_loss": -6.883378028869629, "global_step": 154257, "epoch": 3672} {"train_loss": -6.902953147888184, "global_step": 154258, "epoch": 3672} {"train_loss": -6.916522979736328, "global_step": 154259, "epoch": 3672} {"train_loss": -6.96074914932251, "global_step": 154260, "epoch": 3672} {"train_loss": -6.951906681060791, "global_step": 154261, "epoch": 3672} {"train_loss": -6.966922760009766, "global_step": 154262, "epoch": 3672} {"train_loss": -6.851370811462402, "global_step": 154263, "epoch": 3672} {"train_loss": -6.852558135986328, "global_step": 154264, "epoch": 3672} {"train_loss": -6.926989067168463, "global_step": 154265, "epoch": 3672, "val_loss": 78974.0078125} {"train_loss": -6.8035149574279785, "global_step": 154266, "epoch": 3673} {"train_loss": -6.8017988204956055, "global_step": 154267, "epoch": 3673} {"train_loss": -6.801918029785156, "global_step": 154268, "epoch": 3673} {"train_loss": -6.596926689147949, "global_step": 154269, "epoch": 3673} {"train_loss": -6.720691204071045, "global_step": 154270, "epoch": 3673} {"train_loss": -6.835489273071289, "global_step": 154271, "epoch": 3673} {"train_loss": -6.622183799743652, "global_step": 154272, "epoch": 3673} {"train_loss": -6.608000755310059, "global_step": 154273, "epoch": 3673} {"train_loss": -6.561579704284668, "global_step": 154274, "epoch": 3673} {"train_loss": -6.758179187774658, "global_step": 154275, "epoch": 3673} {"train_loss": -6.617718696594238, "global_step": 154276, "epoch": 3673} {"train_loss": -6.875286102294922, "global_step": 154277, "epoch": 3673} {"train_loss": -6.637458801269531, "global_step": 154278, "epoch": 3673} {"train_loss": -6.81633996963501, "global_step": 154279, "epoch": 3673} {"train_loss": -6.628544330596924, "global_step": 154280, "epoch": 3673} {"train_loss": -6.846423149108887, "global_step": 154281, "epoch": 3673} {"train_loss": -6.786512851715088, "global_step": 154282, "epoch": 3673} {"train_loss": -6.730463027954102, "global_step": 154283, "epoch": 3673} {"train_loss": -6.732836723327637, "global_step": 154284, "epoch": 3673} {"train_loss": -6.69342041015625, "global_step": 154285, "epoch": 3673} {"train_loss": -6.750674247741699, "global_step": 154286, "epoch": 3673} {"train_loss": -6.777588844299316, "global_step": 154287, "epoch": 3673} {"train_loss": -6.786681175231934, "global_step": 154288, "epoch": 3673} {"train_loss": -6.743968963623047, "global_step": 154289, "epoch": 3673} {"train_loss": -6.877387046813965, "global_step": 154290, "epoch": 3673} {"train_loss": -6.719241619110107, "global_step": 154291, "epoch": 3673} {"train_loss": -6.782425880432129, "global_step": 154292, "epoch": 3673} {"train_loss": -6.691668510437012, "global_step": 154293, "epoch": 3673} {"train_loss": -6.7768096923828125, "global_step": 154294, "epoch": 3673} {"train_loss": -6.707161903381348, "global_step": 154295, "epoch": 3673} {"train_loss": -6.864222049713135, "global_step": 154296, "epoch": 3673} {"train_loss": -6.830404281616211, "global_step": 154297, "epoch": 3673} {"train_loss": -6.85292911529541, "global_step": 154298, "epoch": 3673} {"train_loss": -6.724411964416504, "global_step": 154299, "epoch": 3673} {"train_loss": -6.7846527099609375, "global_step": 154300, "epoch": 3673} {"train_loss": -6.75308895111084, "global_step": 154301, "epoch": 3673} {"train_loss": -6.804798603057861, "global_step": 154302, "epoch": 3673} {"train_loss": -6.76750373840332, "global_step": 154303, "epoch": 3673} {"train_loss": -6.808170318603516, "global_step": 154304, "epoch": 3673} {"train_loss": -6.883674144744873, "global_step": 154305, "epoch": 3673} {"train_loss": -6.8494696617126465, "global_step": 154306, "epoch": 3673} {"train_loss": -6.758917025157383, "global_step": 154307, "epoch": 3673, "val_loss": 79246.328125} {"train_loss": -6.854475021362305, "global_step": 154308, "epoch": 3674} {"train_loss": -6.866452693939209, "global_step": 154309, "epoch": 3674} {"train_loss": -6.929525852203369, "global_step": 154310, "epoch": 3674} {"train_loss": -6.934220314025879, "global_step": 154311, "epoch": 3674} {"train_loss": -6.788107872009277, "global_step": 154312, "epoch": 3674} {"train_loss": -6.9309186935424805, "global_step": 154313, "epoch": 3674} {"train_loss": -6.919071197509766, "global_step": 154314, "epoch": 3674} {"train_loss": -6.9058942794799805, "global_step": 154315, "epoch": 3674} {"train_loss": -6.896319389343262, "global_step": 154316, "epoch": 3674} {"train_loss": -6.844451904296875, "global_step": 154317, "epoch": 3674} {"train_loss": -6.922699928283691, "global_step": 154318, "epoch": 3674} {"train_loss": -6.926967620849609, "global_step": 154319, "epoch": 3674} {"train_loss": -6.928073883056641, "global_step": 154320, "epoch": 3674} {"train_loss": -6.956772327423096, "global_step": 154321, "epoch": 3674} {"train_loss": -6.916386604309082, "global_step": 154322, "epoch": 3674} {"train_loss": -6.874207019805908, "global_step": 154323, "epoch": 3674} {"train_loss": -6.768284797668457, "global_step": 154324, "epoch": 3674} {"train_loss": -6.897016525268555, "global_step": 154325, "epoch": 3674} {"train_loss": -6.809142112731934, "global_step": 154326, "epoch": 3674} {"train_loss": -6.942953586578369, "global_step": 154327, "epoch": 3674} {"train_loss": -6.9711809158325195, "global_step": 154328, "epoch": 3674} {"train_loss": -7.0748138427734375, "global_step": 154329, "epoch": 3674} {"train_loss": -6.941802978515625, "global_step": 154330, "epoch": 3674} {"train_loss": -6.8907880783081055, "global_step": 154331, "epoch": 3674} {"train_loss": -6.950335502624512, "global_step": 154332, "epoch": 3674} {"train_loss": -6.877518653869629, "global_step": 154333, "epoch": 3674} {"train_loss": -6.971959114074707, "global_step": 154334, "epoch": 3674} {"train_loss": -6.998325347900391, "global_step": 154335, "epoch": 3674} {"train_loss": -6.948326587677002, "global_step": 154336, "epoch": 3674} {"train_loss": -6.979393005371094, "global_step": 154337, "epoch": 3674} {"train_loss": -6.964987754821777, "global_step": 154338, "epoch": 3674} {"train_loss": -6.865418434143066, "global_step": 154339, "epoch": 3674} {"train_loss": -6.982695579528809, "global_step": 154340, "epoch": 3674} {"train_loss": -6.74172830581665, "global_step": 154341, "epoch": 3674} {"train_loss": -6.960301399230957, "global_step": 154342, "epoch": 3674} {"train_loss": -6.940962791442871, "global_step": 154343, "epoch": 3674} {"train_loss": -6.944125175476074, "global_step": 154344, "epoch": 3674} {"train_loss": -7.019638538360596, "global_step": 154345, "epoch": 3674} {"train_loss": -6.77089262008667, "global_step": 154346, "epoch": 3674} {"train_loss": -6.825353622436523, "global_step": 154347, "epoch": 3674} {"train_loss": -6.889389991760254, "global_step": 154348, "epoch": 3674} {"train_loss": -6.910957098007202, "global_step": 154349, "epoch": 3674, "val_loss": 78939.421875} {"train_loss": -6.837008476257324, "global_step": 154350, "epoch": 3675} {"train_loss": -6.898306369781494, "global_step": 154351, "epoch": 3675} {"train_loss": -6.976597785949707, "global_step": 154352, "epoch": 3675} {"train_loss": -6.935734748840332, "global_step": 154353, "epoch": 3675} {"train_loss": -6.846142292022705, "global_step": 154354, "epoch": 3675} {"train_loss": -7.028820514678955, "global_step": 154355, "epoch": 3675} {"train_loss": -6.888862609863281, "global_step": 154356, "epoch": 3675} {"train_loss": -6.980469703674316, "global_step": 154357, "epoch": 3675} {"train_loss": -6.904866695404053, "global_step": 154358, "epoch": 3675} {"train_loss": -6.868149757385254, "global_step": 154359, "epoch": 3675} {"train_loss": -6.943906307220459, "global_step": 154360, "epoch": 3675} {"train_loss": -6.963841915130615, "global_step": 154361, "epoch": 3675} {"train_loss": -6.823996543884277, "global_step": 154362, "epoch": 3675} {"train_loss": -6.89088773727417, "global_step": 154363, "epoch": 3675} {"train_loss": -6.833279609680176, "global_step": 154364, "epoch": 3675} {"train_loss": -6.880889892578125, "global_step": 154365, "epoch": 3675} {"train_loss": -6.849776268005371, "global_step": 154366, "epoch": 3675} {"train_loss": -6.631258010864258, "global_step": 154367, "epoch": 3675} {"train_loss": -6.8962860107421875, "global_step": 154368, "epoch": 3675} {"train_loss": -6.821093559265137, "global_step": 154369, "epoch": 3675} {"train_loss": -6.908867359161377, "global_step": 154370, "epoch": 3675} {"train_loss": -6.988689422607422, "global_step": 154371, "epoch": 3675} {"train_loss": -6.8433332443237305, "global_step": 154372, "epoch": 3675} {"train_loss": -6.867252349853516, "global_step": 154373, "epoch": 3675} {"train_loss": -6.98584508895874, "global_step": 154374, "epoch": 3675} {"train_loss": -6.913147926330566, "global_step": 154375, "epoch": 3675} {"train_loss": -6.942973613739014, "global_step": 154376, "epoch": 3675} {"train_loss": -6.948814392089844, "global_step": 154377, "epoch": 3675} {"train_loss": -6.9194560050964355, "global_step": 154378, "epoch": 3675} {"train_loss": -6.936461448669434, "global_step": 154379, "epoch": 3675} {"train_loss": -7.051203727722168, "global_step": 154380, "epoch": 3675} {"train_loss": -6.786521911621094, "global_step": 154381, "epoch": 3675} {"train_loss": -6.94826602935791, "global_step": 154382, "epoch": 3675} {"train_loss": -6.827906608581543, "global_step": 154383, "epoch": 3675} {"train_loss": -7.04828405380249, "global_step": 154384, "epoch": 3675} {"train_loss": -6.935211181640625, "global_step": 154385, "epoch": 3675} {"train_loss": -6.9822797775268555, "global_step": 154386, "epoch": 3675} {"train_loss": -6.938828468322754, "global_step": 154387, "epoch": 3675} {"train_loss": -6.937673568725586, "global_step": 154388, "epoch": 3675} {"train_loss": -6.956840515136719, "global_step": 154389, "epoch": 3675} {"train_loss": -6.856599807739258, "global_step": 154390, "epoch": 3675} {"train_loss": -6.9098503930228095, "global_step": 154391, "epoch": 3675, "val_loss": 78877.078125} {"train_loss": -6.898715972900391, "global_step": 154392, "epoch": 3676} {"train_loss": -6.994307041168213, "global_step": 154393, "epoch": 3676} {"train_loss": -6.958645343780518, "global_step": 154394, "epoch": 3676} {"train_loss": -6.890425682067871, "global_step": 154395, "epoch": 3676} {"train_loss": -6.9950270652771, "global_step": 154396, "epoch": 3676} {"train_loss": -7.008911609649658, "global_step": 154397, "epoch": 3676} {"train_loss": -6.878444194793701, "global_step": 154398, "epoch": 3676} {"train_loss": -6.976285934448242, "global_step": 154399, "epoch": 3676} {"train_loss": -7.069065093994141, "global_step": 154400, "epoch": 3676} {"train_loss": -6.959889888763428, "global_step": 154401, "epoch": 3676} {"train_loss": -6.94608736038208, "global_step": 154402, "epoch": 3676} {"train_loss": -7.035976409912109, "global_step": 154403, "epoch": 3676} {"train_loss": -6.908121109008789, "global_step": 154404, "epoch": 3676} {"train_loss": -6.956981658935547, "global_step": 154405, "epoch": 3676} {"train_loss": -6.854581832885742, "global_step": 154406, "epoch": 3676} {"train_loss": -6.92922306060791, "global_step": 154407, "epoch": 3676} {"train_loss": -6.977240562438965, "global_step": 154408, "epoch": 3676} {"train_loss": -6.889370441436768, "global_step": 154409, "epoch": 3676} {"train_loss": -6.904496192932129, "global_step": 154410, "epoch": 3676} {"train_loss": -6.938410758972168, "global_step": 154411, "epoch": 3676} {"train_loss": -6.789019584655762, "global_step": 154412, "epoch": 3676} {"train_loss": -6.801088809967041, "global_step": 154413, "epoch": 3676} {"train_loss": -6.8990864753723145, "global_step": 154414, "epoch": 3676} {"train_loss": -6.863809585571289, "global_step": 154415, "epoch": 3676} {"train_loss": -6.778700351715088, "global_step": 154416, "epoch": 3676} {"train_loss": -6.90950870513916, "global_step": 154417, "epoch": 3676} {"train_loss": -6.826037406921387, "global_step": 154418, "epoch": 3676} {"train_loss": -6.743440628051758, "global_step": 154419, "epoch": 3676} {"train_loss": -6.920926570892334, "global_step": 154420, "epoch": 3676} {"train_loss": -6.784324645996094, "global_step": 154421, "epoch": 3676} {"train_loss": -6.862817764282227, "global_step": 154422, "epoch": 3676} {"train_loss": -6.729612827301025, "global_step": 154423, "epoch": 3676} {"train_loss": -6.679903984069824, "global_step": 154424, "epoch": 3676} {"train_loss": -6.8779802322387695, "global_step": 154425, "epoch": 3676} {"train_loss": -6.740151405334473, "global_step": 154426, "epoch": 3676} {"train_loss": -6.857561111450195, "global_step": 154427, "epoch": 3676} {"train_loss": -6.65914249420166, "global_step": 154428, "epoch": 3676} {"train_loss": -6.766395568847656, "global_step": 154429, "epoch": 3676} {"train_loss": -6.790684223175049, "global_step": 154430, "epoch": 3676} {"train_loss": -6.766139984130859, "global_step": 154431, "epoch": 3676} {"train_loss": -6.849262237548828, "global_step": 154432, "epoch": 3676} {"train_loss": -6.86893215633574, "global_step": 154433, "epoch": 3676, "val_loss": 78939.4453125} {"train_loss": -6.704667568206787, "global_step": 154434, "epoch": 3677} {"train_loss": -6.72252082824707, "global_step": 154435, "epoch": 3677} {"train_loss": -6.769779205322266, "global_step": 154436, "epoch": 3677} {"train_loss": -6.787839889526367, "global_step": 154437, "epoch": 3677} {"train_loss": -6.659324645996094, "global_step": 154438, "epoch": 3677} {"train_loss": -6.94386100769043, "global_step": 154439, "epoch": 3677} {"train_loss": -6.804502487182617, "global_step": 154440, "epoch": 3677} {"train_loss": -6.83195161819458, "global_step": 154441, "epoch": 3677} {"train_loss": -6.859854698181152, "global_step": 154442, "epoch": 3677} {"train_loss": -6.730461597442627, "global_step": 154443, "epoch": 3677} {"train_loss": -6.811474800109863, "global_step": 154444, "epoch": 3677} {"train_loss": -6.811899185180664, "global_step": 154445, "epoch": 3677} {"train_loss": -6.729365348815918, "global_step": 154446, "epoch": 3677} {"train_loss": -6.901071548461914, "global_step": 154447, "epoch": 3677} {"train_loss": -6.6548991203308105, "global_step": 154448, "epoch": 3677} {"train_loss": -6.8379716873168945, "global_step": 154449, "epoch": 3677} {"train_loss": -6.611921310424805, "global_step": 154450, "epoch": 3677} {"train_loss": -6.8556108474731445, "global_step": 154451, "epoch": 3677} {"train_loss": -6.8831892013549805, "global_step": 154452, "epoch": 3677} {"train_loss": -6.839656829833984, "global_step": 154453, "epoch": 3677} {"train_loss": -6.808998107910156, "global_step": 154454, "epoch": 3677} {"train_loss": -6.841443061828613, "global_step": 154455, "epoch": 3677} {"train_loss": -6.860019683837891, "global_step": 154456, "epoch": 3677} {"train_loss": -6.772215843200684, "global_step": 154457, "epoch": 3677} {"train_loss": -6.9711127281188965, "global_step": 154458, "epoch": 3677} {"train_loss": -6.889936447143555, "global_step": 154459, "epoch": 3677} {"train_loss": -6.891536712646484, "global_step": 154460, "epoch": 3677} {"train_loss": -6.715244293212891, "global_step": 154461, "epoch": 3677} {"train_loss": -6.9187912940979, "global_step": 154462, "epoch": 3677} {"train_loss": -6.730175971984863, "global_step": 154463, "epoch": 3677} {"train_loss": -6.909270286560059, "global_step": 154464, "epoch": 3677} {"train_loss": -6.8024797439575195, "global_step": 154465, "epoch": 3677} {"train_loss": -6.94399881362915, "global_step": 154466, "epoch": 3677} {"train_loss": -6.877358913421631, "global_step": 154467, "epoch": 3677} {"train_loss": -6.917242527008057, "global_step": 154468, "epoch": 3677} {"train_loss": -6.887822151184082, "global_step": 154469, "epoch": 3677} {"train_loss": -6.847060680389404, "global_step": 154470, "epoch": 3677} {"train_loss": -6.937348365783691, "global_step": 154471, "epoch": 3677} {"train_loss": -6.816367149353027, "global_step": 154472, "epoch": 3677} {"train_loss": -6.821624279022217, "global_step": 154473, "epoch": 3677} {"train_loss": -6.802107810974121, "global_step": 154474, "epoch": 3677} {"train_loss": -6.8226170880453925, "global_step": 154475, "epoch": 3677, "val_loss": 78841.640625} {"train_loss": -6.791179656982422, "global_step": 154476, "epoch": 3678} {"train_loss": -6.743729591369629, "global_step": 154477, "epoch": 3678} {"train_loss": -6.9678802490234375, "global_step": 154478, "epoch": 3678} {"train_loss": -6.800910949707031, "global_step": 154479, "epoch": 3678} {"train_loss": -6.9629411697387695, "global_step": 154480, "epoch": 3678} {"train_loss": -6.930263996124268, "global_step": 154481, "epoch": 3678} {"train_loss": -6.909798622131348, "global_step": 154482, "epoch": 3678} {"train_loss": -6.975228309631348, "global_step": 154483, "epoch": 3678} {"train_loss": -6.947848320007324, "global_step": 154484, "epoch": 3678} {"train_loss": -6.815371513366699, "global_step": 154485, "epoch": 3678} {"train_loss": -6.926959991455078, "global_step": 154486, "epoch": 3678} {"train_loss": -6.957317352294922, "global_step": 154487, "epoch": 3678} {"train_loss": -6.880598068237305, "global_step": 154488, "epoch": 3678} {"train_loss": -6.900394439697266, "global_step": 154489, "epoch": 3678} {"train_loss": -6.936487197875977, "global_step": 154490, "epoch": 3678} {"train_loss": -6.839223384857178, "global_step": 154491, "epoch": 3678} {"train_loss": -6.87789249420166, "global_step": 154492, "epoch": 3678} {"train_loss": -6.931818962097168, "global_step": 154493, "epoch": 3678} {"train_loss": -6.951366424560547, "global_step": 154494, "epoch": 3678} {"train_loss": -6.847239017486572, "global_step": 154495, "epoch": 3678} {"train_loss": -6.936188697814941, "global_step": 154496, "epoch": 3678} {"train_loss": -6.853395462036133, "global_step": 154497, "epoch": 3678} {"train_loss": -6.876082897186279, "global_step": 154498, "epoch": 3678} {"train_loss": -6.9317240715026855, "global_step": 154499, "epoch": 3678} {"train_loss": -6.967655658721924, "global_step": 154500, "epoch": 3678} {"train_loss": -6.803742408752441, "global_step": 154501, "epoch": 3678} {"train_loss": -6.842315673828125, "global_step": 154502, "epoch": 3678} {"train_loss": -6.905324935913086, "global_step": 154503, "epoch": 3678} {"train_loss": -6.812559127807617, "global_step": 154504, "epoch": 3678} {"train_loss": -6.947232723236084, "global_step": 154505, "epoch": 3678} {"train_loss": -6.971757411956787, "global_step": 154506, "epoch": 3678} {"train_loss": -6.922759056091309, "global_step": 154507, "epoch": 3678} {"train_loss": -6.9166717529296875, "global_step": 154508, "epoch": 3678} {"train_loss": -6.892688751220703, "global_step": 154509, "epoch": 3678} {"train_loss": -6.908955097198486, "global_step": 154510, "epoch": 3678} {"train_loss": -6.875622749328613, "global_step": 154511, "epoch": 3678} {"train_loss": -6.792169570922852, "global_step": 154512, "epoch": 3678} {"train_loss": -6.809291839599609, "global_step": 154513, "epoch": 3678} {"train_loss": -6.850417613983154, "global_step": 154514, "epoch": 3678} {"train_loss": -6.8192219734191895, "global_step": 154515, "epoch": 3678} {"train_loss": -6.936357498168945, "global_step": 154516, "epoch": 3678} {"train_loss": -6.886153073537917, "global_step": 154517, "epoch": 3678, "val_loss": 78990.34375} {"train_loss": -6.915844440460205, "global_step": 154518, "epoch": 3679} {"train_loss": -6.840865135192871, "global_step": 154519, "epoch": 3679} {"train_loss": -6.880016326904297, "global_step": 154520, "epoch": 3679} {"train_loss": -7.055899143218994, "global_step": 154521, "epoch": 3679} {"train_loss": -6.886465549468994, "global_step": 154522, "epoch": 3679} {"train_loss": -6.975640296936035, "global_step": 154523, "epoch": 3679} {"train_loss": -6.908971309661865, "global_step": 154524, "epoch": 3679} {"train_loss": -6.9442644119262695, "global_step": 154525, "epoch": 3679} {"train_loss": -7.081705093383789, "global_step": 154526, "epoch": 3679} {"train_loss": -6.958568572998047, "global_step": 154527, "epoch": 3679} {"train_loss": -7.0013251304626465, "global_step": 154528, "epoch": 3679} {"train_loss": -7.005369186401367, "global_step": 154529, "epoch": 3679} {"train_loss": -6.87907075881958, "global_step": 154530, "epoch": 3679} {"train_loss": -6.824955940246582, "global_step": 154531, "epoch": 3679} {"train_loss": -6.899036884307861, "global_step": 154532, "epoch": 3679} {"train_loss": -7.056168556213379, "global_step": 154533, "epoch": 3679} {"train_loss": -6.896805763244629, "global_step": 154534, "epoch": 3679} {"train_loss": -6.924197196960449, "global_step": 154535, "epoch": 3679} {"train_loss": -6.883646011352539, "global_step": 154536, "epoch": 3679} {"train_loss": -6.797963619232178, "global_step": 154537, "epoch": 3679} {"train_loss": -6.912728309631348, "global_step": 154538, "epoch": 3679} {"train_loss": -6.844420433044434, "global_step": 154539, "epoch": 3679} {"train_loss": -6.928757667541504, "global_step": 154540, "epoch": 3679} {"train_loss": -6.890573978424072, "global_step": 154541, "epoch": 3679} {"train_loss": -6.92686128616333, "global_step": 154542, "epoch": 3679} {"train_loss": -6.998154640197754, "global_step": 154543, "epoch": 3679} {"train_loss": -6.9285807609558105, "global_step": 154544, "epoch": 3679} {"train_loss": -6.9655232429504395, "global_step": 154545, "epoch": 3679} {"train_loss": -6.815164089202881, "global_step": 154546, "epoch": 3679} {"train_loss": -6.9565510749816895, "global_step": 154547, "epoch": 3679} {"train_loss": -6.8759026527404785, "global_step": 154548, "epoch": 3679} {"train_loss": -6.923252105712891, "global_step": 154549, "epoch": 3679} {"train_loss": -6.994636058807373, "global_step": 154550, "epoch": 3679} {"train_loss": -6.937732696533203, "global_step": 154551, "epoch": 3679} {"train_loss": -6.839624881744385, "global_step": 154552, "epoch": 3679} {"train_loss": -6.904848575592041, "global_step": 154553, "epoch": 3679} {"train_loss": -6.971778869628906, "global_step": 154554, "epoch": 3679} {"train_loss": -7.004616737365723, "global_step": 154555, "epoch": 3679} {"train_loss": -6.945878505706787, "global_step": 154556, "epoch": 3679} {"train_loss": -6.9164509773254395, "global_step": 154557, "epoch": 3679} {"train_loss": -6.904451370239258, "global_step": 154558, "epoch": 3679} {"train_loss": -6.926742792129517, "global_step": 154559, "epoch": 3679, "val_loss": 79042.671875} {"train_loss": -6.88210391998291, "global_step": 154560, "epoch": 3680} {"train_loss": -6.9309821128845215, "global_step": 154561, "epoch": 3680} {"train_loss": -6.760312080383301, "global_step": 154562, "epoch": 3680} {"train_loss": -6.829126834869385, "global_step": 154563, "epoch": 3680} {"train_loss": -6.929409027099609, "global_step": 154564, "epoch": 3680} {"train_loss": -6.880060195922852, "global_step": 154565, "epoch": 3680} {"train_loss": -7.0068817138671875, "global_step": 154566, "epoch": 3680} {"train_loss": -6.891658782958984, "global_step": 154567, "epoch": 3680} {"train_loss": -6.9845967292785645, "global_step": 154568, "epoch": 3680} {"train_loss": -6.9142656326293945, "global_step": 154569, "epoch": 3680} {"train_loss": -6.909387588500977, "global_step": 154570, "epoch": 3680} {"train_loss": -6.872224807739258, "global_step": 154571, "epoch": 3680} {"train_loss": -6.832779884338379, "global_step": 154572, "epoch": 3680} {"train_loss": -6.9872050285339355, "global_step": 154573, "epoch": 3680} {"train_loss": -7.00014591217041, "global_step": 154574, "epoch": 3680} {"train_loss": -6.9725236892700195, "global_step": 154575, "epoch": 3680} {"train_loss": -6.961389064788818, "global_step": 154576, "epoch": 3680} {"train_loss": -6.8666276931762695, "global_step": 154577, "epoch": 3680} {"train_loss": -6.977736473083496, "global_step": 154578, "epoch": 3680} {"train_loss": -6.9636688232421875, "global_step": 154579, "epoch": 3680} {"train_loss": -6.97591495513916, "global_step": 154580, "epoch": 3680} {"train_loss": -6.963383674621582, "global_step": 154581, "epoch": 3680} {"train_loss": -6.82794189453125, "global_step": 154582, "epoch": 3680} {"train_loss": -6.910162925720215, "global_step": 154583, "epoch": 3680} {"train_loss": -6.958411693572998, "global_step": 154584, "epoch": 3680} {"train_loss": -6.901215076446533, "global_step": 154585, "epoch": 3680} {"train_loss": -6.946922779083252, "global_step": 154586, "epoch": 3680} {"train_loss": -6.865161895751953, "global_step": 154587, "epoch": 3680} {"train_loss": -6.888006210327148, "global_step": 154588, "epoch": 3680} {"train_loss": -6.92893648147583, "global_step": 154589, "epoch": 3680} {"train_loss": -6.963420867919922, "global_step": 154590, "epoch": 3680} {"train_loss": -6.921714782714844, "global_step": 154591, "epoch": 3680} {"train_loss": -6.85190486907959, "global_step": 154592, "epoch": 3680} {"train_loss": -6.900903701782227, "global_step": 154593, "epoch": 3680} {"train_loss": -6.773961544036865, "global_step": 154594, "epoch": 3680} {"train_loss": -6.847256660461426, "global_step": 154595, "epoch": 3680} {"train_loss": -6.895994186401367, "global_step": 154596, "epoch": 3680} {"train_loss": -6.883131980895996, "global_step": 154597, "epoch": 3680} {"train_loss": -6.901849746704102, "global_step": 154598, "epoch": 3680} {"train_loss": -6.967049598693848, "global_step": 154599, "epoch": 3680} {"train_loss": -6.868874549865723, "global_step": 154600, "epoch": 3680} {"train_loss": -6.909192028499785, "global_step": 154601, "epoch": 3680, "val_loss": 78929.4140625} {"train_loss": -7.08126163482666, "global_step": 154602, "epoch": 3681} {"train_loss": -6.9881486892700195, "global_step": 154603, "epoch": 3681} {"train_loss": -6.982975959777832, "global_step": 154604, "epoch": 3681} {"train_loss": -6.905464172363281, "global_step": 154605, "epoch": 3681} {"train_loss": -6.781371593475342, "global_step": 154606, "epoch": 3681} {"train_loss": -6.949518203735352, "global_step": 154607, "epoch": 3681} {"train_loss": -6.830804347991943, "global_step": 154608, "epoch": 3681} {"train_loss": -6.914287567138672, "global_step": 154609, "epoch": 3681} {"train_loss": -6.99458646774292, "global_step": 154610, "epoch": 3681} {"train_loss": -6.990886211395264, "global_step": 154611, "epoch": 3681} {"train_loss": -6.933678150177002, "global_step": 154612, "epoch": 3681} {"train_loss": -6.749245643615723, "global_step": 154613, "epoch": 3681} {"train_loss": -6.919966697692871, "global_step": 154614, "epoch": 3681} {"train_loss": -6.990514755249023, "global_step": 154615, "epoch": 3681} {"train_loss": -7.008845806121826, "global_step": 154616, "epoch": 3681} {"train_loss": -6.898926734924316, "global_step": 154617, "epoch": 3681} {"train_loss": -6.896435737609863, "global_step": 154618, "epoch": 3681} {"train_loss": -6.80013370513916, "global_step": 154619, "epoch": 3681} {"train_loss": -6.949265956878662, "global_step": 154620, "epoch": 3681} {"train_loss": -7.075289726257324, "global_step": 154621, "epoch": 3681} {"train_loss": -6.901529312133789, "global_step": 154622, "epoch": 3681} {"train_loss": -6.861412048339844, "global_step": 154623, "epoch": 3681} {"train_loss": -6.851351737976074, "global_step": 154624, "epoch": 3681} {"train_loss": -6.801578521728516, "global_step": 154625, "epoch": 3681} {"train_loss": -7.001914978027344, "global_step": 154626, "epoch": 3681} {"train_loss": -6.9821085929870605, "global_step": 154627, "epoch": 3681} {"train_loss": -6.8083391189575195, "global_step": 154628, "epoch": 3681} {"train_loss": -6.853883743286133, "global_step": 154629, "epoch": 3681} {"train_loss": -6.873348236083984, "global_step": 154630, "epoch": 3681} {"train_loss": -6.849853992462158, "global_step": 154631, "epoch": 3681} {"train_loss": -6.967930316925049, "global_step": 154632, "epoch": 3681} {"train_loss": -6.903082370758057, "global_step": 154633, "epoch": 3681} {"train_loss": -6.992252826690674, "global_step": 154634, "epoch": 3681} {"train_loss": -7.054990768432617, "global_step": 154635, "epoch": 3681} {"train_loss": -6.858942985534668, "global_step": 154636, "epoch": 3681} {"train_loss": -6.978992462158203, "global_step": 154637, "epoch": 3681} {"train_loss": -6.877297401428223, "global_step": 154638, "epoch": 3681} {"train_loss": -6.8490400314331055, "global_step": 154639, "epoch": 3681} {"train_loss": -7.017400741577148, "global_step": 154640, "epoch": 3681} {"train_loss": -7.055156230926514, "global_step": 154641, "epoch": 3681} {"train_loss": -6.97249174118042, "global_step": 154642, "epoch": 3681} {"train_loss": -6.9253663789658315, "global_step": 154643, "epoch": 3681, "val_loss": 79060.1640625} {"train_loss": -6.863076686859131, "global_step": 154644, "epoch": 3682} {"train_loss": -6.892592906951904, "global_step": 154645, "epoch": 3682} {"train_loss": -6.8634419441223145, "global_step": 154646, "epoch": 3682} {"train_loss": -6.893571853637695, "global_step": 154647, "epoch": 3682} {"train_loss": -6.838136672973633, "global_step": 154648, "epoch": 3682} {"train_loss": -6.950545310974121, "global_step": 154649, "epoch": 3682} {"train_loss": -6.998305320739746, "global_step": 154650, "epoch": 3682} {"train_loss": -6.933291435241699, "global_step": 154651, "epoch": 3682} {"train_loss": -6.888645172119141, "global_step": 154652, "epoch": 3682} {"train_loss": -6.971274375915527, "global_step": 154653, "epoch": 3682} {"train_loss": -6.915569305419922, "global_step": 154654, "epoch": 3682} {"train_loss": -6.917761325836182, "global_step": 154655, "epoch": 3682} {"train_loss": -6.87318229675293, "global_step": 154656, "epoch": 3682} {"train_loss": -6.937480449676514, "global_step": 154657, "epoch": 3682} {"train_loss": -6.975923538208008, "global_step": 154658, "epoch": 3682} {"train_loss": -6.883974075317383, "global_step": 154659, "epoch": 3682} {"train_loss": -6.752450466156006, "global_step": 154660, "epoch": 3682} {"train_loss": -7.035970687866211, "global_step": 154661, "epoch": 3682} {"train_loss": -6.871708869934082, "global_step": 154662, "epoch": 3682} {"train_loss": -6.955268383026123, "global_step": 154663, "epoch": 3682} {"train_loss": -6.95481538772583, "global_step": 154664, "epoch": 3682} {"train_loss": -6.942470550537109, "global_step": 154665, "epoch": 3682} {"train_loss": -6.948562145233154, "global_step": 154666, "epoch": 3682} {"train_loss": -6.880246162414551, "global_step": 154667, "epoch": 3682} {"train_loss": -6.879486083984375, "global_step": 154668, "epoch": 3682} {"train_loss": -6.815616607666016, "global_step": 154669, "epoch": 3682} {"train_loss": -6.882500648498535, "global_step": 154670, "epoch": 3682} {"train_loss": -6.823446273803711, "global_step": 154671, "epoch": 3682} {"train_loss": -6.934578895568848, "global_step": 154672, "epoch": 3682} {"train_loss": -6.787596225738525, "global_step": 154673, "epoch": 3682} {"train_loss": -6.922147750854492, "global_step": 154674, "epoch": 3682} {"train_loss": -6.942523956298828, "global_step": 154675, "epoch": 3682} {"train_loss": -6.879676818847656, "global_step": 154676, "epoch": 3682} {"train_loss": -6.766679763793945, "global_step": 154677, "epoch": 3682} {"train_loss": -6.8051371574401855, "global_step": 154678, "epoch": 3682} {"train_loss": -6.679946422576904, "global_step": 154679, "epoch": 3682} {"train_loss": -6.844676971435547, "global_step": 154680, "epoch": 3682} {"train_loss": -6.917456150054932, "global_step": 154681, "epoch": 3682} {"train_loss": -6.743978500366211, "global_step": 154682, "epoch": 3682} {"train_loss": -6.913155555725098, "global_step": 154683, "epoch": 3682} {"train_loss": -6.836213111877441, "global_step": 154684, "epoch": 3682} {"train_loss": -6.887152194976807, "global_step": 154685, "epoch": 3682, "val_loss": 78888.125} {"train_loss": -6.957406044006348, "global_step": 154686, "epoch": 3683} {"train_loss": -6.914969444274902, "global_step": 154687, "epoch": 3683} {"train_loss": -6.759089469909668, "global_step": 154688, "epoch": 3683} {"train_loss": -6.787732124328613, "global_step": 154689, "epoch": 3683} {"train_loss": -6.922290802001953, "global_step": 154690, "epoch": 3683} {"train_loss": -6.888159275054932, "global_step": 154691, "epoch": 3683} {"train_loss": -6.936131477355957, "global_step": 154692, "epoch": 3683} {"train_loss": -6.826297283172607, "global_step": 154693, "epoch": 3683} {"train_loss": -6.787111282348633, "global_step": 154694, "epoch": 3683} {"train_loss": -6.915226936340332, "global_step": 154695, "epoch": 3683} {"train_loss": -6.867493629455566, "global_step": 154696, "epoch": 3683} {"train_loss": -6.9156599044799805, "global_step": 154697, "epoch": 3683} {"train_loss": -6.986472129821777, "global_step": 154698, "epoch": 3683} {"train_loss": -6.90988302230835, "global_step": 154699, "epoch": 3683} {"train_loss": -6.877017974853516, "global_step": 154700, "epoch": 3683} {"train_loss": -6.86940336227417, "global_step": 154701, "epoch": 3683} {"train_loss": -6.9176025390625, "global_step": 154702, "epoch": 3683} {"train_loss": -6.905385971069336, "global_step": 154703, "epoch": 3683} {"train_loss": -6.901235580444336, "global_step": 154704, "epoch": 3683} {"train_loss": -6.852382659912109, "global_step": 154705, "epoch": 3683} {"train_loss": -6.754098415374756, "global_step": 154706, "epoch": 3683} {"train_loss": -6.966962814331055, "global_step": 154707, "epoch": 3683} {"train_loss": -6.872345924377441, "global_step": 154708, "epoch": 3683} {"train_loss": -6.835318565368652, "global_step": 154709, "epoch": 3683} {"train_loss": -6.894704818725586, "global_step": 154710, "epoch": 3683} {"train_loss": -6.877475738525391, "global_step": 154711, "epoch": 3683} {"train_loss": -6.88878059387207, "global_step": 154712, "epoch": 3683} {"train_loss": -6.8388495445251465, "global_step": 154713, "epoch": 3683} {"train_loss": -6.850998878479004, "global_step": 154714, "epoch": 3683} {"train_loss": -6.995734214782715, "global_step": 154715, "epoch": 3683} {"train_loss": -6.8937458992004395, "global_step": 154716, "epoch": 3683} {"train_loss": -7.014373779296875, "global_step": 154717, "epoch": 3683} {"train_loss": -6.974505424499512, "global_step": 154718, "epoch": 3683} {"train_loss": -6.859650611877441, "global_step": 154719, "epoch": 3683} {"train_loss": -6.915769100189209, "global_step": 154720, "epoch": 3683} {"train_loss": -6.925651550292969, "global_step": 154721, "epoch": 3683} {"train_loss": -7.011070728302002, "global_step": 154722, "epoch": 3683} {"train_loss": -6.914320945739746, "global_step": 154723, "epoch": 3683} {"train_loss": -6.884331703186035, "global_step": 154724, "epoch": 3683} {"train_loss": -6.975268363952637, "global_step": 154725, "epoch": 3683} {"train_loss": -7.010922908782959, "global_step": 154726, "epoch": 3683} {"train_loss": -6.8980114459991455, "global_step": 154727, "epoch": 3683, "val_loss": 79006.328125} {"train_loss": -6.882087707519531, "global_step": 154728, "epoch": 3684} {"train_loss": -6.93583869934082, "global_step": 154729, "epoch": 3684} {"train_loss": -6.875087738037109, "global_step": 154730, "epoch": 3684} {"train_loss": -7.082265853881836, "global_step": 154731, "epoch": 3684} {"train_loss": -6.887313365936279, "global_step": 154732, "epoch": 3684} {"train_loss": -6.898834228515625, "global_step": 154733, "epoch": 3684} {"train_loss": -6.94865608215332, "global_step": 154734, "epoch": 3684} {"train_loss": -6.934799671173096, "global_step": 154735, "epoch": 3684} {"train_loss": -6.848232269287109, "global_step": 154736, "epoch": 3684} {"train_loss": -6.979353427886963, "global_step": 154737, "epoch": 3684} {"train_loss": -6.866077423095703, "global_step": 154738, "epoch": 3684} {"train_loss": -6.840117454528809, "global_step": 154739, "epoch": 3684} {"train_loss": -6.915195465087891, "global_step": 154740, "epoch": 3684} {"train_loss": -6.86727237701416, "global_step": 154741, "epoch": 3684} {"train_loss": -6.966691017150879, "global_step": 154742, "epoch": 3684} {"train_loss": -7.057090759277344, "global_step": 154743, "epoch": 3684} {"train_loss": -6.917333602905273, "global_step": 154744, "epoch": 3684} {"train_loss": -6.9482197761535645, "global_step": 154745, "epoch": 3684} {"train_loss": -7.076122283935547, "global_step": 154746, "epoch": 3684} {"train_loss": -6.88835334777832, "global_step": 154747, "epoch": 3684} {"train_loss": -6.887361526489258, "global_step": 154748, "epoch": 3684} {"train_loss": -6.933872222900391, "global_step": 154749, "epoch": 3684} {"train_loss": -6.7809062004089355, "global_step": 154750, "epoch": 3684} {"train_loss": -6.988677501678467, "global_step": 154751, "epoch": 3684} {"train_loss": -6.887944221496582, "global_step": 154752, "epoch": 3684} {"train_loss": -6.774288177490234, "global_step": 154753, "epoch": 3684} {"train_loss": -6.945572853088379, "global_step": 154754, "epoch": 3684} {"train_loss": -6.988001823425293, "global_step": 154755, "epoch": 3684} {"train_loss": -6.838815689086914, "global_step": 154756, "epoch": 3684} {"train_loss": -6.867279052734375, "global_step": 154757, "epoch": 3684} {"train_loss": -6.887681484222412, "global_step": 154758, "epoch": 3684} {"train_loss": -6.761029243469238, "global_step": 154759, "epoch": 3684} {"train_loss": -6.937031269073486, "global_step": 154760, "epoch": 3684} {"train_loss": -6.8344316482543945, "global_step": 154761, "epoch": 3684} {"train_loss": -6.782073020935059, "global_step": 154762, "epoch": 3684} {"train_loss": -6.921308517456055, "global_step": 154763, "epoch": 3684} {"train_loss": -6.82988166809082, "global_step": 154764, "epoch": 3684} {"train_loss": -6.907111167907715, "global_step": 154765, "epoch": 3684} {"train_loss": -6.894968032836914, "global_step": 154766, "epoch": 3684} {"train_loss": -6.844479560852051, "global_step": 154767, "epoch": 3684} {"train_loss": -6.950990676879883, "global_step": 154768, "epoch": 3684} {"train_loss": -6.902547234580631, "global_step": 154769, "epoch": 3684, "val_loss": 79166.4453125} {"train_loss": -6.975747108459473, "global_step": 154770, "epoch": 3685} {"train_loss": -6.894032001495361, "global_step": 154771, "epoch": 3685} {"train_loss": -6.975255966186523, "global_step": 154772, "epoch": 3685} {"train_loss": -6.972508430480957, "global_step": 154773, "epoch": 3685} {"train_loss": -6.8837080001831055, "global_step": 154774, "epoch": 3685} {"train_loss": -6.894449234008789, "global_step": 154775, "epoch": 3685} {"train_loss": -6.968039512634277, "global_step": 154776, "epoch": 3685} {"train_loss": -6.984767913818359, "global_step": 154777, "epoch": 3685} {"train_loss": -6.925919532775879, "global_step": 154778, "epoch": 3685} {"train_loss": -6.685274124145508, "global_step": 154779, "epoch": 3685} {"train_loss": -6.971737861633301, "global_step": 154780, "epoch": 3685} {"train_loss": -6.677842140197754, "global_step": 154781, "epoch": 3685} {"train_loss": -6.749076843261719, "global_step": 154782, "epoch": 3685} {"train_loss": -6.830050945281982, "global_step": 154783, "epoch": 3685} {"train_loss": -6.959803104400635, "global_step": 154784, "epoch": 3685} {"train_loss": -6.882634162902832, "global_step": 154785, "epoch": 3685} {"train_loss": -6.930384635925293, "global_step": 154786, "epoch": 3685} {"train_loss": -6.967450141906738, "global_step": 154787, "epoch": 3685} {"train_loss": -6.878639221191406, "global_step": 154788, "epoch": 3685} {"train_loss": -6.808894157409668, "global_step": 154789, "epoch": 3685} {"train_loss": -6.790839195251465, "global_step": 154790, "epoch": 3685} {"train_loss": -6.9184160232543945, "global_step": 154791, "epoch": 3685} {"train_loss": -6.891716957092285, "global_step": 154792, "epoch": 3685} {"train_loss": -6.908308982849121, "global_step": 154793, "epoch": 3685} {"train_loss": -6.8256072998046875, "global_step": 154794, "epoch": 3685} {"train_loss": -6.906578063964844, "global_step": 154795, "epoch": 3685} {"train_loss": -6.938868522644043, "global_step": 154796, "epoch": 3685} {"train_loss": -6.895051002502441, "global_step": 154797, "epoch": 3685} {"train_loss": -6.742302894592285, "global_step": 154798, "epoch": 3685} {"train_loss": -6.854639053344727, "global_step": 154799, "epoch": 3685} {"train_loss": -6.966770648956299, "global_step": 154800, "epoch": 3685} {"train_loss": -6.821358680725098, "global_step": 154801, "epoch": 3685} {"train_loss": -6.767397880554199, "global_step": 154802, "epoch": 3685} {"train_loss": -6.849127292633057, "global_step": 154803, "epoch": 3685} {"train_loss": -6.929436683654785, "global_step": 154804, "epoch": 3685} {"train_loss": -6.894672870635986, "global_step": 154805, "epoch": 3685} {"train_loss": -6.919938087463379, "global_step": 154806, "epoch": 3685} {"train_loss": -6.871319770812988, "global_step": 154807, "epoch": 3685} {"train_loss": -6.824872016906738, "global_step": 154808, "epoch": 3685} {"train_loss": -6.918164253234863, "global_step": 154809, "epoch": 3685} {"train_loss": -6.732767581939697, "global_step": 154810, "epoch": 3685} {"train_loss": -6.87735256694612, "global_step": 154811, "epoch": 3685, "val_loss": 78949.0078125} {"train_loss": -6.818027496337891, "global_step": 154812, "epoch": 3686} {"train_loss": -6.752763748168945, "global_step": 154813, "epoch": 3686} {"train_loss": -6.87500524520874, "global_step": 154814, "epoch": 3686} {"train_loss": -6.745719909667969, "global_step": 154815, "epoch": 3686} {"train_loss": -6.982556343078613, "global_step": 154816, "epoch": 3686} {"train_loss": -6.870824813842773, "global_step": 154817, "epoch": 3686} {"train_loss": -6.919816493988037, "global_step": 154818, "epoch": 3686} {"train_loss": -6.927021503448486, "global_step": 154819, "epoch": 3686} {"train_loss": -6.961958885192871, "global_step": 154820, "epoch": 3686} {"train_loss": -6.930893898010254, "global_step": 154821, "epoch": 3686} {"train_loss": -6.946989059448242, "global_step": 154822, "epoch": 3686} {"train_loss": -6.9665446281433105, "global_step": 154823, "epoch": 3686} {"train_loss": -6.917755126953125, "global_step": 154824, "epoch": 3686} {"train_loss": -6.899048805236816, "global_step": 154825, "epoch": 3686} {"train_loss": -6.896695137023926, "global_step": 154826, "epoch": 3686} {"train_loss": -6.899258613586426, "global_step": 154827, "epoch": 3686} {"train_loss": -6.788318634033203, "global_step": 154828, "epoch": 3686} {"train_loss": -6.872231960296631, "global_step": 154829, "epoch": 3686} {"train_loss": -6.906420707702637, "global_step": 154830, "epoch": 3686} {"train_loss": -6.781728267669678, "global_step": 154831, "epoch": 3686} {"train_loss": -6.895809173583984, "global_step": 154832, "epoch": 3686} {"train_loss": -6.911546230316162, "global_step": 154833, "epoch": 3686} {"train_loss": -6.750896453857422, "global_step": 154834, "epoch": 3686} {"train_loss": -6.873211860656738, "global_step": 154835, "epoch": 3686} {"train_loss": -6.786089897155762, "global_step": 154836, "epoch": 3686} {"train_loss": -6.909099102020264, "global_step": 154837, "epoch": 3686} {"train_loss": -6.907345771789551, "global_step": 154838, "epoch": 3686} {"train_loss": -6.874387741088867, "global_step": 154839, "epoch": 3686} {"train_loss": -6.906540870666504, "global_step": 154840, "epoch": 3686} {"train_loss": -6.957715034484863, "global_step": 154841, "epoch": 3686} {"train_loss": -6.851156711578369, "global_step": 154842, "epoch": 3686} {"train_loss": -6.987904071807861, "global_step": 154843, "epoch": 3686} {"train_loss": -6.919809341430664, "global_step": 154844, "epoch": 3686} {"train_loss": -6.852541446685791, "global_step": 154845, "epoch": 3686} {"train_loss": -6.743046283721924, "global_step": 154846, "epoch": 3686} {"train_loss": -6.90015983581543, "global_step": 154847, "epoch": 3686} {"train_loss": -6.824344158172607, "global_step": 154848, "epoch": 3686} {"train_loss": -6.907564163208008, "global_step": 154849, "epoch": 3686} {"train_loss": -6.8582916259765625, "global_step": 154850, "epoch": 3686} {"train_loss": -6.730472564697266, "global_step": 154851, "epoch": 3686} {"train_loss": -6.851069450378418, "global_step": 154852, "epoch": 3686} {"train_loss": -6.872466246287028, "global_step": 154853, "epoch": 3686, "val_loss": 79138.640625} {"train_loss": -6.9000773429870605, "global_step": 154854, "epoch": 3687} {"train_loss": -6.900778770446777, "global_step": 154855, "epoch": 3687} {"train_loss": -6.906585216522217, "global_step": 154856, "epoch": 3687} {"train_loss": -6.84147310256958, "global_step": 154857, "epoch": 3687} {"train_loss": -6.837333679199219, "global_step": 154858, "epoch": 3687} {"train_loss": -6.882571220397949, "global_step": 154859, "epoch": 3687} {"train_loss": -6.909650802612305, "global_step": 154860, "epoch": 3687} {"train_loss": -6.7501912117004395, "global_step": 154861, "epoch": 3687} {"train_loss": -6.90359354019165, "global_step": 154862, "epoch": 3687} {"train_loss": -6.817575454711914, "global_step": 154863, "epoch": 3687} {"train_loss": -6.835616588592529, "global_step": 154864, "epoch": 3687} {"train_loss": -6.939937591552734, "global_step": 154865, "epoch": 3687} {"train_loss": -6.8414530754089355, "global_step": 154866, "epoch": 3687} {"train_loss": -6.957557678222656, "global_step": 154867, "epoch": 3687} {"train_loss": -6.948569297790527, "global_step": 154868, "epoch": 3687} {"train_loss": -6.98370361328125, "global_step": 154869, "epoch": 3687} {"train_loss": -6.8984222412109375, "global_step": 154870, "epoch": 3687} {"train_loss": -6.896278381347656, "global_step": 154871, "epoch": 3687} {"train_loss": -6.962047576904297, "global_step": 154872, "epoch": 3687} {"train_loss": -6.959908485412598, "global_step": 154873, "epoch": 3687} {"train_loss": -6.860176086425781, "global_step": 154874, "epoch": 3687} {"train_loss": -6.991511344909668, "global_step": 154875, "epoch": 3687} {"train_loss": -6.788971900939941, "global_step": 154876, "epoch": 3687} {"train_loss": -7.02052116394043, "global_step": 154877, "epoch": 3687} {"train_loss": -6.94710636138916, "global_step": 154878, "epoch": 3687} {"train_loss": -6.915209770202637, "global_step": 154879, "epoch": 3687} {"train_loss": -6.941084384918213, "global_step": 154880, "epoch": 3687} {"train_loss": -6.93869686126709, "global_step": 154881, "epoch": 3687} {"train_loss": -6.9007568359375, "global_step": 154882, "epoch": 3687} {"train_loss": -6.972917556762695, "global_step": 154883, "epoch": 3687} {"train_loss": -6.887258529663086, "global_step": 154884, "epoch": 3687} {"train_loss": -7.05502986907959, "global_step": 154885, "epoch": 3687} {"train_loss": -6.962307929992676, "global_step": 154886, "epoch": 3687} {"train_loss": -6.906743049621582, "global_step": 154887, "epoch": 3687} {"train_loss": -6.891983509063721, "global_step": 154888, "epoch": 3687} {"train_loss": -7.043852806091309, "global_step": 154889, "epoch": 3687} {"train_loss": -6.792967796325684, "global_step": 154890, "epoch": 3687} {"train_loss": -6.9417924880981445, "global_step": 154891, "epoch": 3687} {"train_loss": -6.934232711791992, "global_step": 154892, "epoch": 3687} {"train_loss": -7.075558185577393, "global_step": 154893, "epoch": 3687} {"train_loss": -6.981044292449951, "global_step": 154894, "epoch": 3687} {"train_loss": -6.919101170131138, "global_step": 154895, "epoch": 3687, "val_loss": 78987.140625} {"train_loss": -7.038534164428711, "global_step": 154896, "epoch": 3688} {"train_loss": -6.975990295410156, "global_step": 154897, "epoch": 3688} {"train_loss": -7.001055717468262, "global_step": 154898, "epoch": 3688} {"train_loss": -6.961645126342773, "global_step": 154899, "epoch": 3688} {"train_loss": -6.980325698852539, "global_step": 154900, "epoch": 3688} {"train_loss": -6.955142021179199, "global_step": 154901, "epoch": 3688} {"train_loss": -6.976907730102539, "global_step": 154902, "epoch": 3688} {"train_loss": -6.852446556091309, "global_step": 154903, "epoch": 3688} {"train_loss": -6.98137092590332, "global_step": 154904, "epoch": 3688} {"train_loss": -6.9199934005737305, "global_step": 154905, "epoch": 3688} {"train_loss": -7.042600631713867, "global_step": 154906, "epoch": 3688} {"train_loss": -6.868588447570801, "global_step": 154907, "epoch": 3688} {"train_loss": -6.892512321472168, "global_step": 154908, "epoch": 3688} {"train_loss": -6.8906450271606445, "global_step": 154909, "epoch": 3688} {"train_loss": -6.854825973510742, "global_step": 154910, "epoch": 3688} {"train_loss": -6.830677509307861, "global_step": 154911, "epoch": 3688} {"train_loss": -6.831109046936035, "global_step": 154912, "epoch": 3688} {"train_loss": -6.872251510620117, "global_step": 154913, "epoch": 3688} {"train_loss": -6.8790764808654785, "global_step": 154914, "epoch": 3688} {"train_loss": -6.857438087463379, "global_step": 154915, "epoch": 3688} {"train_loss": -6.9138994216918945, "global_step": 154916, "epoch": 3688} {"train_loss": -6.857292652130127, "global_step": 154917, "epoch": 3688} {"train_loss": -6.838808059692383, "global_step": 154918, "epoch": 3688} {"train_loss": -6.967914581298828, "global_step": 154919, "epoch": 3688} {"train_loss": -6.929516792297363, "global_step": 154920, "epoch": 3688} {"train_loss": -6.929128646850586, "global_step": 154921, "epoch": 3688} {"train_loss": -7.096120357513428, "global_step": 154922, "epoch": 3688} {"train_loss": -6.963109970092773, "global_step": 154923, "epoch": 3688} {"train_loss": -6.994513511657715, "global_step": 154924, "epoch": 3688} {"train_loss": -6.910438060760498, "global_step": 154925, "epoch": 3688} {"train_loss": -6.9774580001831055, "global_step": 154926, "epoch": 3688} {"train_loss": -7.040396213531494, "global_step": 154927, "epoch": 3688} {"train_loss": -6.7864885330200195, "global_step": 154928, "epoch": 3688} {"train_loss": -6.9584431648254395, "global_step": 154929, "epoch": 3688} {"train_loss": -7.0191473960876465, "global_step": 154930, "epoch": 3688} {"train_loss": -6.933675289154053, "global_step": 154931, "epoch": 3688} {"train_loss": -6.992081165313721, "global_step": 154932, "epoch": 3688} {"train_loss": -7.028130531311035, "global_step": 154933, "epoch": 3688} {"train_loss": -6.970242023468018, "global_step": 154934, "epoch": 3688} {"train_loss": -6.877801895141602, "global_step": 154935, "epoch": 3688} {"train_loss": -6.961757659912109, "global_step": 154936, "epoch": 3688} {"train_loss": -6.937545685541062, "global_step": 154937, "epoch": 3688, "val_loss": 79019.03125} {"train_loss": -6.960331916809082, "global_step": 154938, "epoch": 3689} {"train_loss": -6.9458537101745605, "global_step": 154939, "epoch": 3689} {"train_loss": -6.922959327697754, "global_step": 154940, "epoch": 3689} {"train_loss": -6.976320266723633, "global_step": 154941, "epoch": 3689} {"train_loss": -6.894652843475342, "global_step": 154942, "epoch": 3689} {"train_loss": -6.934893608093262, "global_step": 154943, "epoch": 3689} {"train_loss": -7.015148162841797, "global_step": 154944, "epoch": 3689} {"train_loss": -6.975096702575684, "global_step": 154945, "epoch": 3689} {"train_loss": -7.0320587158203125, "global_step": 154946, "epoch": 3689} {"train_loss": -6.986424446105957, "global_step": 154947, "epoch": 3689} {"train_loss": -6.943798542022705, "global_step": 154948, "epoch": 3689} {"train_loss": -7.015666484832764, "global_step": 154949, "epoch": 3689} {"train_loss": -6.9906721115112305, "global_step": 154950, "epoch": 3689} {"train_loss": -7.013424396514893, "global_step": 154951, "epoch": 3689} {"train_loss": -6.954233169555664, "global_step": 154952, "epoch": 3689} {"train_loss": -6.9245524406433105, "global_step": 154953, "epoch": 3689} {"train_loss": -6.876708030700684, "global_step": 154954, "epoch": 3689} {"train_loss": -7.029621601104736, "global_step": 154955, "epoch": 3689} {"train_loss": -6.8610124588012695, "global_step": 154956, "epoch": 3689} {"train_loss": -7.014325141906738, "global_step": 154957, "epoch": 3689} {"train_loss": -6.9296555519104, "global_step": 154958, "epoch": 3689} {"train_loss": -6.861019134521484, "global_step": 154959, "epoch": 3689} {"train_loss": -7.009742259979248, "global_step": 154960, "epoch": 3689} {"train_loss": -6.901101112365723, "global_step": 154961, "epoch": 3689} {"train_loss": -6.955019950866699, "global_step": 154962, "epoch": 3689} {"train_loss": -6.903100967407227, "global_step": 154963, "epoch": 3689} {"train_loss": -6.9434099197387695, "global_step": 154964, "epoch": 3689} {"train_loss": -7.0267014503479, "global_step": 154965, "epoch": 3689} {"train_loss": -7.026487350463867, "global_step": 154966, "epoch": 3689} {"train_loss": -7.036033630371094, "global_step": 154967, "epoch": 3689} {"train_loss": -6.939722061157227, "global_step": 154968, "epoch": 3689} {"train_loss": -6.980866432189941, "global_step": 154969, "epoch": 3689} {"train_loss": -6.974676132202148, "global_step": 154970, "epoch": 3689} {"train_loss": -6.914438247680664, "global_step": 154971, "epoch": 3689} {"train_loss": -6.889158725738525, "global_step": 154972, "epoch": 3689} {"train_loss": -6.892196178436279, "global_step": 154973, "epoch": 3689} {"train_loss": -7.0219807624816895, "global_step": 154974, "epoch": 3689} {"train_loss": -6.871545791625977, "global_step": 154975, "epoch": 3689} {"train_loss": -6.902285099029541, "global_step": 154976, "epoch": 3689} {"train_loss": -6.940718650817871, "global_step": 154977, "epoch": 3689} {"train_loss": -6.989007472991943, "global_step": 154978, "epoch": 3689} {"train_loss": -6.953368402662731, "global_step": 154979, "epoch": 3689, "val_loss": 78868.6875} {"train_loss": -6.933783531188965, "global_step": 154980, "epoch": 3690} {"train_loss": -6.9872612953186035, "global_step": 154981, "epoch": 3690} {"train_loss": -6.848997592926025, "global_step": 154982, "epoch": 3690} {"train_loss": -6.994326591491699, "global_step": 154983, "epoch": 3690} {"train_loss": -6.949178218841553, "global_step": 154984, "epoch": 3690} {"train_loss": -6.912526607513428, "global_step": 154985, "epoch": 3690} {"train_loss": -6.919898986816406, "global_step": 154986, "epoch": 3690} {"train_loss": -6.972515106201172, "global_step": 154987, "epoch": 3690} {"train_loss": -7.018242359161377, "global_step": 154988, "epoch": 3690} {"train_loss": -6.981985569000244, "global_step": 154989, "epoch": 3690} {"train_loss": -6.910403728485107, "global_step": 154990, "epoch": 3690} {"train_loss": -6.794501304626465, "global_step": 154991, "epoch": 3690} {"train_loss": -6.939665794372559, "global_step": 154992, "epoch": 3690} {"train_loss": -6.749983787536621, "global_step": 154993, "epoch": 3690} {"train_loss": -6.914000511169434, "global_step": 154994, "epoch": 3690} {"train_loss": -6.8739752769470215, "global_step": 154995, "epoch": 3690} {"train_loss": -6.872125625610352, "global_step": 154996, "epoch": 3690} {"train_loss": -6.990977764129639, "global_step": 154997, "epoch": 3690} {"train_loss": -6.843428134918213, "global_step": 154998, "epoch": 3690} {"train_loss": -6.832492351531982, "global_step": 154999, "epoch": 3690} {"train_loss": -6.98390007019043, "global_step": 155000, "epoch": 3690} {"train_loss": -6.938290596008301, "global_step": 155001, "epoch": 3690} {"train_loss": -7.002936363220215, "global_step": 155002, "epoch": 3690} {"train_loss": -6.814389705657959, "global_step": 155003, "epoch": 3690} {"train_loss": -6.837328910827637, "global_step": 155004, "epoch": 3690} {"train_loss": -6.898982048034668, "global_step": 155005, "epoch": 3690} {"train_loss": -7.0165276527404785, "global_step": 155006, "epoch": 3690} {"train_loss": -6.827254295349121, "global_step": 155007, "epoch": 3690} {"train_loss": -6.843811988830566, "global_step": 155008, "epoch": 3690} {"train_loss": -6.842931747436523, "global_step": 155009, "epoch": 3690} {"train_loss": -6.732181549072266, "global_step": 155010, "epoch": 3690} {"train_loss": -6.973931312561035, "global_step": 155011, "epoch": 3690} {"train_loss": -6.892435550689697, "global_step": 155012, "epoch": 3690} {"train_loss": -6.963994979858398, "global_step": 155013, "epoch": 3690} {"train_loss": -6.950803756713867, "global_step": 155014, "epoch": 3690} {"train_loss": -6.90391731262207, "global_step": 155015, "epoch": 3690} {"train_loss": -6.920385360717773, "global_step": 155016, "epoch": 3690} {"train_loss": -6.927770137786865, "global_step": 155017, "epoch": 3690} {"train_loss": -6.840291976928711, "global_step": 155018, "epoch": 3690} {"train_loss": -6.9065752029418945, "global_step": 155019, "epoch": 3690} {"train_loss": -6.662206172943115, "global_step": 155020, "epoch": 3690} {"train_loss": -6.90035917645409, "global_step": 155021, "epoch": 3690, "val_loss": 78984.5625} {"train_loss": -6.9346699714660645, "global_step": 155022, "epoch": 3691} {"train_loss": -6.871732234954834, "global_step": 155023, "epoch": 3691} {"train_loss": -6.915987968444824, "global_step": 155024, "epoch": 3691} {"train_loss": -6.924403190612793, "global_step": 155025, "epoch": 3691} {"train_loss": -6.876934051513672, "global_step": 155026, "epoch": 3691} {"train_loss": -7.042348861694336, "global_step": 155027, "epoch": 3691} {"train_loss": -6.983948707580566, "global_step": 155028, "epoch": 3691} {"train_loss": -6.893237113952637, "global_step": 155029, "epoch": 3691} {"train_loss": -6.781881809234619, "global_step": 155030, "epoch": 3691} {"train_loss": -6.959764003753662, "global_step": 155031, "epoch": 3691} {"train_loss": -6.943739891052246, "global_step": 155032, "epoch": 3691} {"train_loss": -6.962733268737793, "global_step": 155033, "epoch": 3691} {"train_loss": -6.904840469360352, "global_step": 155034, "epoch": 3691} {"train_loss": -6.869997024536133, "global_step": 155035, "epoch": 3691} {"train_loss": -6.901623725891113, "global_step": 155036, "epoch": 3691} {"train_loss": -6.895848274230957, "global_step": 155037, "epoch": 3691} {"train_loss": -6.817408084869385, "global_step": 155038, "epoch": 3691} {"train_loss": -6.895139694213867, "global_step": 155039, "epoch": 3691} {"train_loss": -6.8964385986328125, "global_step": 155040, "epoch": 3691} {"train_loss": -6.986148357391357, "global_step": 155041, "epoch": 3691} {"train_loss": -6.873589038848877, "global_step": 155042, "epoch": 3691} {"train_loss": -6.8326334953308105, "global_step": 155043, "epoch": 3691} {"train_loss": -6.909470558166504, "global_step": 155044, "epoch": 3691} {"train_loss": -6.903690338134766, "global_step": 155045, "epoch": 3691} {"train_loss": -6.92474365234375, "global_step": 155046, "epoch": 3691} {"train_loss": -6.923755645751953, "global_step": 155047, "epoch": 3691} {"train_loss": -6.934701919555664, "global_step": 155048, "epoch": 3691} {"train_loss": -6.940825462341309, "global_step": 155049, "epoch": 3691} {"train_loss": -6.947562217712402, "global_step": 155050, "epoch": 3691} {"train_loss": -6.816423416137695, "global_step": 155051, "epoch": 3691} {"train_loss": -6.950325965881348, "global_step": 155052, "epoch": 3691} {"train_loss": -6.805405139923096, "global_step": 155053, "epoch": 3691} {"train_loss": -6.9409379959106445, "global_step": 155054, "epoch": 3691} {"train_loss": -6.833836555480957, "global_step": 155055, "epoch": 3691} {"train_loss": -6.852109909057617, "global_step": 155056, "epoch": 3691} {"train_loss": -6.774664878845215, "global_step": 155057, "epoch": 3691} {"train_loss": -6.873600959777832, "global_step": 155058, "epoch": 3691} {"train_loss": -6.799780368804932, "global_step": 155059, "epoch": 3691} {"train_loss": -6.812664031982422, "global_step": 155060, "epoch": 3691} {"train_loss": -6.766195297241211, "global_step": 155061, "epoch": 3691} {"train_loss": -6.654674530029297, "global_step": 155062, "epoch": 3691} {"train_loss": -6.888350872766404, "global_step": 155063, "epoch": 3691, "val_loss": 78835.78125} {"train_loss": -6.689704895019531, "global_step": 155064, "epoch": 3692} {"train_loss": -6.827056884765625, "global_step": 155065, "epoch": 3692} {"train_loss": -6.864153861999512, "global_step": 155066, "epoch": 3692} {"train_loss": -6.8209381103515625, "global_step": 155067, "epoch": 3692} {"train_loss": -6.813685894012451, "global_step": 155068, "epoch": 3692} {"train_loss": -6.809138298034668, "global_step": 155069, "epoch": 3692} {"train_loss": -6.879389762878418, "global_step": 155070, "epoch": 3692} {"train_loss": -6.800900459289551, "global_step": 155071, "epoch": 3692} {"train_loss": -6.8858489990234375, "global_step": 155072, "epoch": 3692} {"train_loss": -6.77886962890625, "global_step": 155073, "epoch": 3692} {"train_loss": -6.915415287017822, "global_step": 155074, "epoch": 3692} {"train_loss": -6.971343040466309, "global_step": 155075, "epoch": 3692} {"train_loss": -6.811398506164551, "global_step": 155076, "epoch": 3692} {"train_loss": -6.855607509613037, "global_step": 155077, "epoch": 3692} {"train_loss": -6.707202434539795, "global_step": 155078, "epoch": 3692} {"train_loss": -6.7609734535217285, "global_step": 155079, "epoch": 3692} {"train_loss": -6.78702449798584, "global_step": 155080, "epoch": 3692} {"train_loss": -6.886205196380615, "global_step": 155081, "epoch": 3692} {"train_loss": -6.752407073974609, "global_step": 155082, "epoch": 3692} {"train_loss": -6.795581817626953, "global_step": 155083, "epoch": 3692} {"train_loss": -6.978738784790039, "global_step": 155084, "epoch": 3692} {"train_loss": -6.7116618156433105, "global_step": 155085, "epoch": 3692} {"train_loss": -6.869034290313721, "global_step": 155086, "epoch": 3692} {"train_loss": -6.75990104675293, "global_step": 155087, "epoch": 3692} {"train_loss": -6.79586124420166, "global_step": 155088, "epoch": 3692} {"train_loss": -6.798347473144531, "global_step": 155089, "epoch": 3692} {"train_loss": -6.845533847808838, "global_step": 155090, "epoch": 3692} {"train_loss": -6.7689738273620605, "global_step": 155091, "epoch": 3692} {"train_loss": -6.77059268951416, "global_step": 155092, "epoch": 3692} {"train_loss": -6.873287200927734, "global_step": 155093, "epoch": 3692} {"train_loss": -6.8592987060546875, "global_step": 155094, "epoch": 3692} {"train_loss": -6.833402633666992, "global_step": 155095, "epoch": 3692} {"train_loss": -6.831384658813477, "global_step": 155096, "epoch": 3692} {"train_loss": -6.888726234436035, "global_step": 155097, "epoch": 3692} {"train_loss": -6.917728900909424, "global_step": 155098, "epoch": 3692} {"train_loss": -6.9343109130859375, "global_step": 155099, "epoch": 3692} {"train_loss": -6.9759931564331055, "global_step": 155100, "epoch": 3692} {"train_loss": -6.961186408996582, "global_step": 155101, "epoch": 3692} {"train_loss": -6.948585510253906, "global_step": 155102, "epoch": 3692} {"train_loss": -6.911569595336914, "global_step": 155103, "epoch": 3692} {"train_loss": -6.933320045471191, "global_step": 155104, "epoch": 3692} {"train_loss": -6.84366496404012, "global_step": 155105, "epoch": 3692, "val_loss": 79043.1015625} {"train_loss": -6.8675031661987305, "global_step": 155106, "epoch": 3693} {"train_loss": -6.9416279792785645, "global_step": 155107, "epoch": 3693} {"train_loss": -6.930140495300293, "global_step": 155108, "epoch": 3693} {"train_loss": -6.958728790283203, "global_step": 155109, "epoch": 3693} {"train_loss": -6.894309997558594, "global_step": 155110, "epoch": 3693} {"train_loss": -6.9512810707092285, "global_step": 155111, "epoch": 3693} {"train_loss": -6.883554458618164, "global_step": 155112, "epoch": 3693} {"train_loss": -6.923887252807617, "global_step": 155113, "epoch": 3693} {"train_loss": -6.902451992034912, "global_step": 155114, "epoch": 3693} {"train_loss": -6.955953598022461, "global_step": 155115, "epoch": 3693} {"train_loss": -6.934778213500977, "global_step": 155116, "epoch": 3693} {"train_loss": -6.980253219604492, "global_step": 155117, "epoch": 3693} {"train_loss": -7.060197353363037, "global_step": 155118, "epoch": 3693} {"train_loss": -6.819549560546875, "global_step": 155119, "epoch": 3693} {"train_loss": -6.939189910888672, "global_step": 155120, "epoch": 3693} {"train_loss": -7.004934310913086, "global_step": 155121, "epoch": 3693} {"train_loss": -6.894414901733398, "global_step": 155122, "epoch": 3693} {"train_loss": -6.933985710144043, "global_step": 155123, "epoch": 3693} {"train_loss": -6.918483257293701, "global_step": 155124, "epoch": 3693} {"train_loss": -6.975678443908691, "global_step": 155125, "epoch": 3693} {"train_loss": -7.014966011047363, "global_step": 155126, "epoch": 3693} {"train_loss": -6.960343837738037, "global_step": 155127, "epoch": 3693} {"train_loss": -6.886076927185059, "global_step": 155128, "epoch": 3693} {"train_loss": -6.888952255249023, "global_step": 155129, "epoch": 3693} {"train_loss": -6.863222599029541, "global_step": 155130, "epoch": 3693} {"train_loss": -7.023344039916992, "global_step": 155131, "epoch": 3693} {"train_loss": -7.011242866516113, "global_step": 155132, "epoch": 3693} {"train_loss": -6.825610637664795, "global_step": 155133, "epoch": 3693} {"train_loss": -6.886090278625488, "global_step": 155134, "epoch": 3693} {"train_loss": -6.936400890350342, "global_step": 155135, "epoch": 3693} {"train_loss": -7.03531551361084, "global_step": 155136, "epoch": 3693} {"train_loss": -6.971287727355957, "global_step": 155137, "epoch": 3693} {"train_loss": -6.921908855438232, "global_step": 155138, "epoch": 3693} {"train_loss": -6.837002277374268, "global_step": 155139, "epoch": 3693} {"train_loss": -6.979023456573486, "global_step": 155140, "epoch": 3693} {"train_loss": -6.835221290588379, "global_step": 155141, "epoch": 3693} {"train_loss": -6.975213050842285, "global_step": 155142, "epoch": 3693} {"train_loss": -6.9765777587890625, "global_step": 155143, "epoch": 3693} {"train_loss": -6.888564586639404, "global_step": 155144, "epoch": 3693} {"train_loss": -6.9842209815979, "global_step": 155145, "epoch": 3693} {"train_loss": -6.9067792892456055, "global_step": 155146, "epoch": 3693} {"train_loss": -6.931227298009963, "global_step": 155147, "epoch": 3693, "val_loss": 79172.9609375} {"train_loss": -6.93086051940918, "global_step": 155148, "epoch": 3694} {"train_loss": -6.834856033325195, "global_step": 155149, "epoch": 3694} {"train_loss": -6.9557294845581055, "global_step": 155150, "epoch": 3694} {"train_loss": -6.830245018005371, "global_step": 155151, "epoch": 3694} {"train_loss": -7.051787376403809, "global_step": 155152, "epoch": 3694} {"train_loss": -6.808072090148926, "global_step": 155153, "epoch": 3694} {"train_loss": -6.731441497802734, "global_step": 155154, "epoch": 3694} {"train_loss": -6.865738868713379, "global_step": 155155, "epoch": 3694} {"train_loss": -6.753146648406982, "global_step": 155156, "epoch": 3694} {"train_loss": -6.954761028289795, "global_step": 155157, "epoch": 3694} {"train_loss": -6.829493999481201, "global_step": 155158, "epoch": 3694} {"train_loss": -6.76427698135376, "global_step": 155159, "epoch": 3694} {"train_loss": -6.87657356262207, "global_step": 155160, "epoch": 3694} {"train_loss": -6.841325283050537, "global_step": 155161, "epoch": 3694} {"train_loss": -6.959734916687012, "global_step": 155162, "epoch": 3694} {"train_loss": -6.94264030456543, "global_step": 155163, "epoch": 3694} {"train_loss": -6.717633247375488, "global_step": 155164, "epoch": 3694} {"train_loss": -6.853599548339844, "global_step": 155165, "epoch": 3694} {"train_loss": -6.680224418640137, "global_step": 155166, "epoch": 3694} {"train_loss": -6.853414535522461, "global_step": 155167, "epoch": 3694} {"train_loss": -6.650589942932129, "global_step": 155168, "epoch": 3694} {"train_loss": -6.765350341796875, "global_step": 155169, "epoch": 3694} {"train_loss": -6.847647190093994, "global_step": 155170, "epoch": 3694} {"train_loss": -6.703713417053223, "global_step": 155171, "epoch": 3694} {"train_loss": -6.916182518005371, "global_step": 155172, "epoch": 3694} {"train_loss": -6.863986968994141, "global_step": 155173, "epoch": 3694} {"train_loss": -6.753729343414307, "global_step": 155174, "epoch": 3694} {"train_loss": -6.86128568649292, "global_step": 155175, "epoch": 3694} {"train_loss": -6.747896671295166, "global_step": 155176, "epoch": 3694} {"train_loss": -6.949969291687012, "global_step": 155177, "epoch": 3694} {"train_loss": -6.6916656494140625, "global_step": 155178, "epoch": 3694} {"train_loss": -6.887548923492432, "global_step": 155179, "epoch": 3694} {"train_loss": -6.735518455505371, "global_step": 155180, "epoch": 3694} {"train_loss": -6.90679931640625, "global_step": 155181, "epoch": 3694} {"train_loss": -6.933880805969238, "global_step": 155182, "epoch": 3694} {"train_loss": -6.904067516326904, "global_step": 155183, "epoch": 3694} {"train_loss": -6.888110160827637, "global_step": 155184, "epoch": 3694} {"train_loss": -6.919559478759766, "global_step": 155185, "epoch": 3694} {"train_loss": -6.846540451049805, "global_step": 155186, "epoch": 3694} {"train_loss": -6.89461612701416, "global_step": 155187, "epoch": 3694} {"train_loss": -6.835536003112793, "global_step": 155188, "epoch": 3694} {"train_loss": -6.845678386234102, "global_step": 155189, "epoch": 3694, "val_loss": 79116.890625} {"train_loss": -7.012935161590576, "global_step": 155190, "epoch": 3695} {"train_loss": -6.899332523345947, "global_step": 155191, "epoch": 3695} {"train_loss": -6.980674743652344, "global_step": 155192, "epoch": 3695} {"train_loss": -6.768618106842041, "global_step": 155193, "epoch": 3695} {"train_loss": -6.905442237854004, "global_step": 155194, "epoch": 3695} {"train_loss": -6.951790809631348, "global_step": 155195, "epoch": 3695} {"train_loss": -6.830209732055664, "global_step": 155196, "epoch": 3695} {"train_loss": -6.951790809631348, "global_step": 155197, "epoch": 3695} {"train_loss": -6.958673477172852, "global_step": 155198, "epoch": 3695} {"train_loss": -6.903772830963135, "global_step": 155199, "epoch": 3695} {"train_loss": -6.996781349182129, "global_step": 155200, "epoch": 3695} {"train_loss": -6.896684646606445, "global_step": 155201, "epoch": 3695} {"train_loss": -6.86811637878418, "global_step": 155202, "epoch": 3695} {"train_loss": -7.041556358337402, "global_step": 155203, "epoch": 3695} {"train_loss": -6.954738616943359, "global_step": 155204, "epoch": 3695} {"train_loss": -6.874960899353027, "global_step": 155205, "epoch": 3695} {"train_loss": -6.96066951751709, "global_step": 155206, "epoch": 3695} {"train_loss": -6.933494567871094, "global_step": 155207, "epoch": 3695} {"train_loss": -6.919909477233887, "global_step": 155208, "epoch": 3695} {"train_loss": -6.834073066711426, "global_step": 155209, "epoch": 3695} {"train_loss": -6.845006942749023, "global_step": 155210, "epoch": 3695} {"train_loss": -6.789072036743164, "global_step": 155211, "epoch": 3695} {"train_loss": -6.902611255645752, "global_step": 155212, "epoch": 3695} {"train_loss": -6.974282264709473, "global_step": 155213, "epoch": 3695} {"train_loss": -6.96470832824707, "global_step": 155214, "epoch": 3695} {"train_loss": -6.871054172515869, "global_step": 155215, "epoch": 3695} {"train_loss": -6.8297247886657715, "global_step": 155216, "epoch": 3695} {"train_loss": -6.674353122711182, "global_step": 155217, "epoch": 3695} {"train_loss": -6.978302955627441, "global_step": 155218, "epoch": 3695} {"train_loss": -6.90334415435791, "global_step": 155219, "epoch": 3695} {"train_loss": -6.9493584632873535, "global_step": 155220, "epoch": 3695} {"train_loss": -6.840593338012695, "global_step": 155221, "epoch": 3695} {"train_loss": -6.794665336608887, "global_step": 155222, "epoch": 3695} {"train_loss": -6.937651634216309, "global_step": 155223, "epoch": 3695} {"train_loss": -6.816515922546387, "global_step": 155224, "epoch": 3695} {"train_loss": -6.90413236618042, "global_step": 155225, "epoch": 3695} {"train_loss": -6.805512428283691, "global_step": 155226, "epoch": 3695} {"train_loss": -6.812493324279785, "global_step": 155227, "epoch": 3695} {"train_loss": -6.885275840759277, "global_step": 155228, "epoch": 3695} {"train_loss": -6.630300521850586, "global_step": 155229, "epoch": 3695} {"train_loss": -6.6844282150268555, "global_step": 155230, "epoch": 3695} {"train_loss": -6.883313701266334, "global_step": 155231, "epoch": 3695, "val_loss": 79125.2109375} {"train_loss": -6.625585556030273, "global_step": 155232, "epoch": 3696} {"train_loss": -6.8790435791015625, "global_step": 155233, "epoch": 3696} {"train_loss": -6.782317161560059, "global_step": 155234, "epoch": 3696} {"train_loss": -6.827009677886963, "global_step": 155235, "epoch": 3696} {"train_loss": -6.79482364654541, "global_step": 155236, "epoch": 3696} {"train_loss": -6.831650733947754, "global_step": 155237, "epoch": 3696} {"train_loss": -6.850554466247559, "global_step": 155238, "epoch": 3696} {"train_loss": -6.8104472160339355, "global_step": 155239, "epoch": 3696} {"train_loss": -6.8436737060546875, "global_step": 155240, "epoch": 3696} {"train_loss": -6.833076477050781, "global_step": 155241, "epoch": 3696} {"train_loss": -6.762399673461914, "global_step": 155242, "epoch": 3696} {"train_loss": -6.876664161682129, "global_step": 155243, "epoch": 3696} {"train_loss": -6.826669692993164, "global_step": 155244, "epoch": 3696} {"train_loss": -6.812606334686279, "global_step": 155245, "epoch": 3696} {"train_loss": -6.881614685058594, "global_step": 155246, "epoch": 3696} {"train_loss": -7.061386585235596, "global_step": 155247, "epoch": 3696} {"train_loss": -6.845854759216309, "global_step": 155248, "epoch": 3696} {"train_loss": -6.836682319641113, "global_step": 155249, "epoch": 3696} {"train_loss": -6.906319618225098, "global_step": 155250, "epoch": 3696} {"train_loss": -6.872608661651611, "global_step": 155251, "epoch": 3696} {"train_loss": -7.007391929626465, "global_step": 155252, "epoch": 3696} {"train_loss": -6.911571979522705, "global_step": 155253, "epoch": 3696} {"train_loss": -6.893467903137207, "global_step": 155254, "epoch": 3696} {"train_loss": -6.9300456047058105, "global_step": 155255, "epoch": 3696} {"train_loss": -6.95474100112915, "global_step": 155256, "epoch": 3696} {"train_loss": -6.914968013763428, "global_step": 155257, "epoch": 3696} {"train_loss": -7.03019905090332, "global_step": 155258, "epoch": 3696} {"train_loss": -6.800930500030518, "global_step": 155259, "epoch": 3696} {"train_loss": -6.976086616516113, "global_step": 155260, "epoch": 3696} {"train_loss": -6.8891167640686035, "global_step": 155261, "epoch": 3696} {"train_loss": -6.831414222717285, "global_step": 155262, "epoch": 3696} {"train_loss": -6.841400146484375, "global_step": 155263, "epoch": 3696} {"train_loss": -6.850987434387207, "global_step": 155264, "epoch": 3696} {"train_loss": -6.8787055015563965, "global_step": 155265, "epoch": 3696} {"train_loss": -7.058306694030762, "global_step": 155266, "epoch": 3696} {"train_loss": -6.864017486572266, "global_step": 155267, "epoch": 3696} {"train_loss": -6.962954521179199, "global_step": 155268, "epoch": 3696} {"train_loss": -7.029052734375, "global_step": 155269, "epoch": 3696} {"train_loss": -6.835931777954102, "global_step": 155270, "epoch": 3696} {"train_loss": -6.876769542694092, "global_step": 155271, "epoch": 3696} {"train_loss": -6.728255271911621, "global_step": 155272, "epoch": 3696} {"train_loss": -6.872039942514329, "global_step": 155273, "epoch": 3696, "val_loss": 78979.78125} {"train_loss": -6.905468940734863, "global_step": 155274, "epoch": 3697} {"train_loss": -6.7858757972717285, "global_step": 155275, "epoch": 3697} {"train_loss": -7.009076118469238, "global_step": 155276, "epoch": 3697} {"train_loss": -6.891750812530518, "global_step": 155277, "epoch": 3697} {"train_loss": -6.860476493835449, "global_step": 155278, "epoch": 3697} {"train_loss": -6.950336456298828, "global_step": 155279, "epoch": 3697} {"train_loss": -6.712209224700928, "global_step": 155280, "epoch": 3697} {"train_loss": -6.899809837341309, "global_step": 155281, "epoch": 3697} {"train_loss": -6.634819984436035, "global_step": 155282, "epoch": 3697} {"train_loss": -6.994718551635742, "global_step": 155283, "epoch": 3697} {"train_loss": -6.755908966064453, "global_step": 155284, "epoch": 3697} {"train_loss": -6.949671745300293, "global_step": 155285, "epoch": 3697} {"train_loss": -6.8633575439453125, "global_step": 155286, "epoch": 3697} {"train_loss": -6.82070255279541, "global_step": 155287, "epoch": 3697} {"train_loss": -6.848281383514404, "global_step": 155288, "epoch": 3697} {"train_loss": -6.866259574890137, "global_step": 155289, "epoch": 3697} {"train_loss": -6.8583502769470215, "global_step": 155290, "epoch": 3697} {"train_loss": -6.903932571411133, "global_step": 155291, "epoch": 3697} {"train_loss": -6.96979284286499, "global_step": 155292, "epoch": 3697} {"train_loss": -6.937544822692871, "global_step": 155293, "epoch": 3697} {"train_loss": -6.859897136688232, "global_step": 155294, "epoch": 3697} {"train_loss": -6.88882303237915, "global_step": 155295, "epoch": 3697} {"train_loss": -6.895181655883789, "global_step": 155296, "epoch": 3697} {"train_loss": -6.853949546813965, "global_step": 155297, "epoch": 3697} {"train_loss": -6.9057297706604, "global_step": 155298, "epoch": 3697} {"train_loss": -6.963711738586426, "global_step": 155299, "epoch": 3697} {"train_loss": -7.068875312805176, "global_step": 155300, "epoch": 3697} {"train_loss": -6.930129051208496, "global_step": 155301, "epoch": 3697} {"train_loss": -6.9635419845581055, "global_step": 155302, "epoch": 3697} {"train_loss": -6.961202144622803, "global_step": 155303, "epoch": 3697} {"train_loss": -6.960665225982666, "global_step": 155304, "epoch": 3697} {"train_loss": -6.911032199859619, "global_step": 155305, "epoch": 3697} {"train_loss": -7.04945182800293, "global_step": 155306, "epoch": 3697} {"train_loss": -6.939700603485107, "global_step": 155307, "epoch": 3697} {"train_loss": -6.866929054260254, "global_step": 155308, "epoch": 3697} {"train_loss": -6.832538604736328, "global_step": 155309, "epoch": 3697} {"train_loss": -6.891134262084961, "global_step": 155310, "epoch": 3697} {"train_loss": -6.862151622772217, "global_step": 155311, "epoch": 3697} {"train_loss": -6.90254020690918, "global_step": 155312, "epoch": 3697} {"train_loss": -7.001081466674805, "global_step": 155313, "epoch": 3697} {"train_loss": -6.788244247436523, "global_step": 155314, "epoch": 3697} {"train_loss": -6.893086739948818, "global_step": 155315, "epoch": 3697, "val_loss": 78992.8125} {"train_loss": -6.971015930175781, "global_step": 155316, "epoch": 3698} {"train_loss": -6.617590427398682, "global_step": 155317, "epoch": 3698} {"train_loss": -6.859133243560791, "global_step": 155318, "epoch": 3698} {"train_loss": -6.829082489013672, "global_step": 155319, "epoch": 3698} {"train_loss": -6.802548885345459, "global_step": 155320, "epoch": 3698} {"train_loss": -6.862082004547119, "global_step": 155321, "epoch": 3698} {"train_loss": -6.920090198516846, "global_step": 155322, "epoch": 3698} {"train_loss": -6.833281517028809, "global_step": 155323, "epoch": 3698} {"train_loss": -6.942047595977783, "global_step": 155324, "epoch": 3698} {"train_loss": -6.785152435302734, "global_step": 155325, "epoch": 3698} {"train_loss": -6.810083866119385, "global_step": 155326, "epoch": 3698} {"train_loss": -6.8479156494140625, "global_step": 155327, "epoch": 3698} {"train_loss": -6.778862953186035, "global_step": 155328, "epoch": 3698} {"train_loss": -7.006437301635742, "global_step": 155329, "epoch": 3698} {"train_loss": -6.765303611755371, "global_step": 155330, "epoch": 3698} {"train_loss": -6.852412700653076, "global_step": 155331, "epoch": 3698} {"train_loss": -6.781063556671143, "global_step": 155332, "epoch": 3698} {"train_loss": -6.864325523376465, "global_step": 155333, "epoch": 3698} {"train_loss": -6.864295482635498, "global_step": 155334, "epoch": 3698} {"train_loss": -6.890876770019531, "global_step": 155335, "epoch": 3698} {"train_loss": -6.961976051330566, "global_step": 155336, "epoch": 3698} {"train_loss": -6.977110862731934, "global_step": 155337, "epoch": 3698} {"train_loss": -6.967142105102539, "global_step": 155338, "epoch": 3698} {"train_loss": -6.870020866394043, "global_step": 155339, "epoch": 3698} {"train_loss": -6.882264137268066, "global_step": 155340, "epoch": 3698} {"train_loss": -6.78336238861084, "global_step": 155341, "epoch": 3698} {"train_loss": -6.95721960067749, "global_step": 155342, "epoch": 3698} {"train_loss": -6.918572425842285, "global_step": 155343, "epoch": 3698} {"train_loss": -6.948911666870117, "global_step": 155344, "epoch": 3698} {"train_loss": -6.915971279144287, "global_step": 155345, "epoch": 3698} {"train_loss": -6.992772102355957, "global_step": 155346, "epoch": 3698} {"train_loss": -6.85632848739624, "global_step": 155347, "epoch": 3698} {"train_loss": -7.003674507141113, "global_step": 155348, "epoch": 3698} {"train_loss": -6.97483491897583, "global_step": 155349, "epoch": 3698} {"train_loss": -6.934974670410156, "global_step": 155350, "epoch": 3698} {"train_loss": -6.895720481872559, "global_step": 155351, "epoch": 3698} {"train_loss": -6.885817527770996, "global_step": 155352, "epoch": 3698} {"train_loss": -7.057884216308594, "global_step": 155353, "epoch": 3698} {"train_loss": -6.89617395401001, "global_step": 155354, "epoch": 3698} {"train_loss": -6.869661808013916, "global_step": 155355, "epoch": 3698} {"train_loss": -6.967595100402832, "global_step": 155356, "epoch": 3698} {"train_loss": -6.8868418988727385, "global_step": 155357, "epoch": 3698, "val_loss": 78878.15625} {"train_loss": -6.865103721618652, "global_step": 155358, "epoch": 3699} {"train_loss": -7.045571804046631, "global_step": 155359, "epoch": 3699} {"train_loss": -6.951685905456543, "global_step": 155360, "epoch": 3699} {"train_loss": -6.894283294677734, "global_step": 155361, "epoch": 3699} {"train_loss": -6.963052749633789, "global_step": 155362, "epoch": 3699} {"train_loss": -7.011360168457031, "global_step": 155363, "epoch": 3699} {"train_loss": -7.018188953399658, "global_step": 155364, "epoch": 3699} {"train_loss": -6.93219518661499, "global_step": 155365, "epoch": 3699} {"train_loss": -7.087275505065918, "global_step": 155366, "epoch": 3699} {"train_loss": -6.931403160095215, "global_step": 155367, "epoch": 3699} {"train_loss": -7.066301345825195, "global_step": 155368, "epoch": 3699} {"train_loss": -6.9512434005737305, "global_step": 155369, "epoch": 3699} {"train_loss": -6.794163703918457, "global_step": 155370, "epoch": 3699} {"train_loss": -6.900581359863281, "global_step": 155371, "epoch": 3699} {"train_loss": -6.954306602478027, "global_step": 155372, "epoch": 3699} {"train_loss": -6.883345603942871, "global_step": 155373, "epoch": 3699} {"train_loss": -6.866484642028809, "global_step": 155374, "epoch": 3699} {"train_loss": -6.927516937255859, "global_step": 155375, "epoch": 3699} {"train_loss": -6.900484085083008, "global_step": 155376, "epoch": 3699} {"train_loss": -7.024896621704102, "global_step": 155377, "epoch": 3699} {"train_loss": -6.942692756652832, "global_step": 155378, "epoch": 3699} {"train_loss": -6.944146156311035, "global_step": 155379, "epoch": 3699} {"train_loss": -6.847797393798828, "global_step": 155380, "epoch": 3699} {"train_loss": -6.955972194671631, "global_step": 155381, "epoch": 3699} {"train_loss": -6.937621593475342, "global_step": 155382, "epoch": 3699} {"train_loss": -6.8099284172058105, "global_step": 155383, "epoch": 3699} {"train_loss": -6.855037689208984, "global_step": 155384, "epoch": 3699} {"train_loss": -6.8720245361328125, "global_step": 155385, "epoch": 3699} {"train_loss": -6.93624210357666, "global_step": 155386, "epoch": 3699} {"train_loss": -6.939658164978027, "global_step": 155387, "epoch": 3699} {"train_loss": -7.042909622192383, "global_step": 155388, "epoch": 3699} {"train_loss": -6.953963756561279, "global_step": 155389, "epoch": 3699} {"train_loss": -6.839733600616455, "global_step": 155390, "epoch": 3699} {"train_loss": -6.966823577880859, "global_step": 155391, "epoch": 3699} {"train_loss": -6.972653388977051, "global_step": 155392, "epoch": 3699} {"train_loss": -6.8171892166137695, "global_step": 155393, "epoch": 3699} {"train_loss": -6.867147922515869, "global_step": 155394, "epoch": 3699} {"train_loss": -6.903756141662598, "global_step": 155395, "epoch": 3699} {"train_loss": -6.841318130493164, "global_step": 155396, "epoch": 3699} {"train_loss": -6.840253829956055, "global_step": 155397, "epoch": 3699} {"train_loss": -7.012014865875244, "global_step": 155398, "epoch": 3699} {"train_loss": -6.924375897362118, "global_step": 155399, "epoch": 3699, "val_loss": 79123.171875} {"train_loss": -6.9775590896606445, "global_step": 155400, "epoch": 3700} {"train_loss": -6.846473217010498, "global_step": 155401, "epoch": 3700} {"train_loss": -6.814397811889648, "global_step": 155402, "epoch": 3700} {"train_loss": -6.990392208099365, "global_step": 155403, "epoch": 3700} {"train_loss": -6.929114818572998, "global_step": 155404, "epoch": 3700} {"train_loss": -6.961583614349365, "global_step": 155405, "epoch": 3700} {"train_loss": -6.848536491394043, "global_step": 155406, "epoch": 3700} {"train_loss": -6.822266578674316, "global_step": 155407, "epoch": 3700} {"train_loss": -6.96732759475708, "global_step": 155408, "epoch": 3700} {"train_loss": -6.82867431640625, "global_step": 155409, "epoch": 3700} {"train_loss": -6.796869277954102, "global_step": 155410, "epoch": 3700} {"train_loss": -6.90619421005249, "global_step": 155411, "epoch": 3700} {"train_loss": -6.930805206298828, "global_step": 155412, "epoch": 3700} {"train_loss": -7.05183744430542, "global_step": 155413, "epoch": 3700} {"train_loss": -6.924112319946289, "global_step": 155414, "epoch": 3700} {"train_loss": -6.86168098449707, "global_step": 155415, "epoch": 3700} {"train_loss": -6.967829704284668, "global_step": 155416, "epoch": 3700} {"train_loss": -6.853452682495117, "global_step": 155417, "epoch": 3700} {"train_loss": -6.946990013122559, "global_step": 155418, "epoch": 3700} {"train_loss": -6.914237976074219, "global_step": 155419, "epoch": 3700} {"train_loss": -6.894891262054443, "global_step": 155420, "epoch": 3700} {"train_loss": -6.890567779541016, "global_step": 155421, "epoch": 3700} {"train_loss": -6.884245872497559, "global_step": 155422, "epoch": 3700} {"train_loss": -6.907355308532715, "global_step": 155423, "epoch": 3700} {"train_loss": -6.938220977783203, "global_step": 155424, "epoch": 3700} {"train_loss": -6.9877610206604, "global_step": 155425, "epoch": 3700} {"train_loss": -7.001593589782715, "global_step": 155426, "epoch": 3700} {"train_loss": -6.939159393310547, "global_step": 155427, "epoch": 3700} {"train_loss": -6.856903076171875, "global_step": 155428, "epoch": 3700} {"train_loss": -6.8247575759887695, "global_step": 155429, "epoch": 3700} {"train_loss": -6.985261917114258, "global_step": 155430, "epoch": 3700} {"train_loss": -6.660847187042236, "global_step": 155431, "epoch": 3700} {"train_loss": -6.936770439147949, "global_step": 155432, "epoch": 3700} {"train_loss": -6.870510101318359, "global_step": 155433, "epoch": 3700} {"train_loss": -6.937657833099365, "global_step": 155434, "epoch": 3700} {"train_loss": -6.822351932525635, "global_step": 155435, "epoch": 3700} {"train_loss": -6.90044641494751, "global_step": 155436, "epoch": 3700} {"train_loss": -6.835428237915039, "global_step": 155437, "epoch": 3700} {"train_loss": -6.902059555053711, "global_step": 155438, "epoch": 3700} {"train_loss": -6.869016647338867, "global_step": 155439, "epoch": 3700} {"train_loss": -7.031198024749756, "global_step": 155440, "epoch": 3700} {"train_loss": -6.902713219324748, "global_step": 155441, "epoch": 3700, "train/sim_max_reward_0": 1.0, "train/sim_max_reward_1": 0.9226052142659521, "train/sim_max_reward_2": 0.3888092688609717, "train/sim_max_reward_3": 0.13753565361461273, "train/sim_max_reward_4": 0.23671744167086442, "train/sim_max_reward_5": 0.559918611732619, "test/sim_max_reward_4500000": 0.9268656345325879, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.47823474945607464, "test/sim_max_reward_4500003": 0.8579362762064028, "test/sim_max_reward_4500004": 0.19478155186552581, "test/sim_max_reward_4500005": 0.931277208991413, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.9103679007617822, "test/sim_max_reward_4500008": 0.012991240740145701, "test/sim_max_reward_4500009": 0.05340172294464145, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 0.800855475481829, "test/sim_max_reward_4500013": 0.0034051138917877365, "test/sim_max_reward_4500014": 0.9634448794354468, "test/sim_max_reward_4500015": 0.9500372090326884, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.06112330546217465, "test/sim_max_reward_4500018": 0.4599065161731219, "test/sim_max_reward_4500019": 0.882645887196851, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.881170261057358, "test/sim_max_reward_4500022": 0.9608150353084606, "test/sim_max_reward_4500023": 0.9781963091985562, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.7645330259488348, "test/sim_max_reward_4500026": 0.8699660073396751, "test/sim_max_reward_4500027": 0.9261316147297763, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.07919054834280721, "test/sim_max_reward_4500030": 0.9434970170358852, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04965027341874408, "test/sim_max_reward_4500033": 0.9763363693459182, "test/sim_max_reward_4500034": 0.9541880540721204, "test/sim_max_reward_4500035": 0.9520882882334545, "test/sim_max_reward_4500036": 0.5505085073730365, "test/sim_max_reward_4500037": 1.0, "test/sim_max_reward_4500038": 0.9216025296430796, "test/sim_max_reward_4500039": 1.0, "test/sim_max_reward_4500040": 0.991801289828972, "test/sim_max_reward_4500041": 0.9438285993039127, "test/sim_max_reward_4500042": 0.03304341064645425, "test/sim_max_reward_4500043": 0.6770394732088738, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.8863536709203415, "test/sim_max_reward_4500046": 0.17157999717633315, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9075239641370728, "test/sim_max_reward_4500049": 0.917754247032957, "train/mean_score": 0.5409310316908367, "test/mean_score": 0.580595895658327, "val_loss": 79005.234375} {"train_loss": -6.9239115715026855, "global_step": 155442, "epoch": 3701} {"train_loss": -6.852924346923828, "global_step": 155443, "epoch": 3701} {"train_loss": -6.94964075088501, "global_step": 155444, "epoch": 3701} {"train_loss": -6.906625270843506, "global_step": 155445, "epoch": 3701} {"train_loss": -6.912306308746338, "global_step": 155446, "epoch": 3701} {"train_loss": -6.989305019378662, "global_step": 155447, "epoch": 3701} {"train_loss": -6.9552459716796875, "global_step": 155448, "epoch": 3701} {"train_loss": -6.831655502319336, "global_step": 155449, "epoch": 3701} {"train_loss": -6.995819091796875, "global_step": 155450, "epoch": 3701} {"train_loss": -6.850315570831299, "global_step": 155451, "epoch": 3701} {"train_loss": -6.993533134460449, "global_step": 155452, "epoch": 3701} {"train_loss": -6.975761890411377, "global_step": 155453, "epoch": 3701} {"train_loss": -6.816606044769287, "global_step": 155454, "epoch": 3701} {"train_loss": -6.908560752868652, "global_step": 155455, "epoch": 3701} {"train_loss": -6.837701797485352, "global_step": 155456, "epoch": 3701} {"train_loss": -6.8818254470825195, "global_step": 155457, "epoch": 3701} {"train_loss": -6.970263957977295, "global_step": 155458, "epoch": 3701} {"train_loss": -6.905980110168457, "global_step": 155459, "epoch": 3701} {"train_loss": -6.867941856384277, "global_step": 155460, "epoch": 3701} {"train_loss": -6.879443645477295, "global_step": 155461, "epoch": 3701} {"train_loss": -6.8846964836120605, "global_step": 155462, "epoch": 3701} {"train_loss": -6.958630561828613, "global_step": 155463, "epoch": 3701} {"train_loss": -6.797257423400879, "global_step": 155464, "epoch": 3701} {"train_loss": -6.773672103881836, "global_step": 155465, "epoch": 3701} {"train_loss": -6.977175712585449, "global_step": 155466, "epoch": 3701} {"train_loss": -6.848750114440918, "global_step": 155467, "epoch": 3701} {"train_loss": -6.917757511138916, "global_step": 155468, "epoch": 3701} {"train_loss": -6.89855432510376, "global_step": 155469, "epoch": 3701} {"train_loss": -6.841005802154541, "global_step": 155470, "epoch": 3701} {"train_loss": -6.886324882507324, "global_step": 155471, "epoch": 3701} {"train_loss": -7.023484230041504, "global_step": 155472, "epoch": 3701} {"train_loss": -6.939395904541016, "global_step": 155473, "epoch": 3701} {"train_loss": -6.939484596252441, "global_step": 155474, "epoch": 3701} {"train_loss": -6.759914875030518, "global_step": 155475, "epoch": 3701} {"train_loss": -6.9621429443359375, "global_step": 155476, "epoch": 3701} {"train_loss": -6.87265682220459, "global_step": 155477, "epoch": 3701} {"train_loss": -7.005369186401367, "global_step": 155478, "epoch": 3701} {"train_loss": -6.9699554443359375, "global_step": 155479, "epoch": 3701} {"train_loss": -6.753488063812256, "global_step": 155480, "epoch": 3701} {"train_loss": -6.920337677001953, "global_step": 155481, "epoch": 3701} {"train_loss": -6.794987201690674, "global_step": 155482, "epoch": 3701} {"train_loss": -6.903307199478149, "global_step": 155483, "epoch": 3701, "val_loss": 79267.96875} {"train_loss": -6.860677719116211, "global_step": 155484, "epoch": 3702} {"train_loss": -6.8202972412109375, "global_step": 155485, "epoch": 3702} {"train_loss": -6.878870010375977, "global_step": 155486, "epoch": 3702} {"train_loss": -6.918145656585693, "global_step": 155487, "epoch": 3702} {"train_loss": -6.944730758666992, "global_step": 155488, "epoch": 3702} {"train_loss": -6.872720718383789, "global_step": 155489, "epoch": 3702} {"train_loss": -6.842218399047852, "global_step": 155490, "epoch": 3702} {"train_loss": -6.911517143249512, "global_step": 155491, "epoch": 3702} {"train_loss": -6.805689811706543, "global_step": 155492, "epoch": 3702} {"train_loss": -6.895824432373047, "global_step": 155493, "epoch": 3702} {"train_loss": -6.934327602386475, "global_step": 155494, "epoch": 3702} {"train_loss": -6.738574028015137, "global_step": 155495, "epoch": 3702} {"train_loss": -6.886494159698486, "global_step": 155496, "epoch": 3702} {"train_loss": -6.856307029724121, "global_step": 155497, "epoch": 3702} {"train_loss": -6.898104667663574, "global_step": 155498, "epoch": 3702} {"train_loss": -6.907538414001465, "global_step": 155499, "epoch": 3702} {"train_loss": -6.878774642944336, "global_step": 155500, "epoch": 3702} {"train_loss": -6.892064094543457, "global_step": 155501, "epoch": 3702} {"train_loss": -6.8337602615356445, "global_step": 155502, "epoch": 3702} {"train_loss": -6.840226173400879, "global_step": 155503, "epoch": 3702} {"train_loss": -6.917843818664551, "global_step": 155504, "epoch": 3702} {"train_loss": -6.851164817810059, "global_step": 155505, "epoch": 3702} {"train_loss": -6.752486228942871, "global_step": 155506, "epoch": 3702} {"train_loss": -6.916962623596191, "global_step": 155507, "epoch": 3702} {"train_loss": -6.831273078918457, "global_step": 155508, "epoch": 3702} {"train_loss": -7.031977653503418, "global_step": 155509, "epoch": 3702} {"train_loss": -6.981372833251953, "global_step": 155510, "epoch": 3702} {"train_loss": -6.886849403381348, "global_step": 155511, "epoch": 3702} {"train_loss": -6.928842067718506, "global_step": 155512, "epoch": 3702} {"train_loss": -6.859800338745117, "global_step": 155513, "epoch": 3702} {"train_loss": -6.853899002075195, "global_step": 155514, "epoch": 3702} {"train_loss": -6.853412628173828, "global_step": 155515, "epoch": 3702} {"train_loss": -6.90045690536499, "global_step": 155516, "epoch": 3702} {"train_loss": -6.973897933959961, "global_step": 155517, "epoch": 3702} {"train_loss": -6.911080360412598, "global_step": 155518, "epoch": 3702} {"train_loss": -6.928029537200928, "global_step": 155519, "epoch": 3702} {"train_loss": -6.889488220214844, "global_step": 155520, "epoch": 3702} {"train_loss": -6.784850120544434, "global_step": 155521, "epoch": 3702} {"train_loss": -6.993318557739258, "global_step": 155522, "epoch": 3702} {"train_loss": -6.926381587982178, "global_step": 155523, "epoch": 3702} {"train_loss": -7.000735282897949, "global_step": 155524, "epoch": 3702} {"train_loss": -6.888300907044184, "global_step": 155525, "epoch": 3702, "val_loss": 79110.0} {"train_loss": -6.97592306137085, "global_step": 155526, "epoch": 3703} {"train_loss": -6.974888324737549, "global_step": 155527, "epoch": 3703} {"train_loss": -6.955813407897949, "global_step": 155528, "epoch": 3703} {"train_loss": -6.797983169555664, "global_step": 155529, "epoch": 3703} {"train_loss": -6.965906143188477, "global_step": 155530, "epoch": 3703} {"train_loss": -6.901357173919678, "global_step": 155531, "epoch": 3703} {"train_loss": -6.904200077056885, "global_step": 155532, "epoch": 3703} {"train_loss": -6.886017799377441, "global_step": 155533, "epoch": 3703} {"train_loss": -6.785374164581299, "global_step": 155534, "epoch": 3703} {"train_loss": -6.974504470825195, "global_step": 155535, "epoch": 3703} {"train_loss": -6.93034029006958, "global_step": 155536, "epoch": 3703} {"train_loss": -6.906813621520996, "global_step": 155537, "epoch": 3703} {"train_loss": -6.980931758880615, "global_step": 155538, "epoch": 3703} {"train_loss": -6.943241596221924, "global_step": 155539, "epoch": 3703} {"train_loss": -6.986089706420898, "global_step": 155540, "epoch": 3703} {"train_loss": -7.013655662536621, "global_step": 155541, "epoch": 3703} {"train_loss": -6.947254180908203, "global_step": 155542, "epoch": 3703} {"train_loss": -7.043455123901367, "global_step": 155543, "epoch": 3703} {"train_loss": -6.976673126220703, "global_step": 155544, "epoch": 3703} {"train_loss": -6.907863616943359, "global_step": 155545, "epoch": 3703} {"train_loss": -6.95399284362793, "global_step": 155546, "epoch": 3703} {"train_loss": -7.01014518737793, "global_step": 155547, "epoch": 3703} {"train_loss": -6.866868019104004, "global_step": 155548, "epoch": 3703} {"train_loss": -7.054126739501953, "global_step": 155549, "epoch": 3703} {"train_loss": -7.001495838165283, "global_step": 155550, "epoch": 3703} {"train_loss": -6.906273365020752, "global_step": 155551, "epoch": 3703} {"train_loss": -7.055913925170898, "global_step": 155552, "epoch": 3703} {"train_loss": -6.884432315826416, "global_step": 155553, "epoch": 3703} {"train_loss": -7.0734405517578125, "global_step": 155554, "epoch": 3703} {"train_loss": -6.846003532409668, "global_step": 155555, "epoch": 3703} {"train_loss": -6.987287521362305, "global_step": 155556, "epoch": 3703} {"train_loss": -6.976181507110596, "global_step": 155557, "epoch": 3703} {"train_loss": -6.972282409667969, "global_step": 155558, "epoch": 3703} {"train_loss": -6.900161266326904, "global_step": 155559, "epoch": 3703} {"train_loss": -6.947066307067871, "global_step": 155560, "epoch": 3703} {"train_loss": -6.890103340148926, "global_step": 155561, "epoch": 3703} {"train_loss": -6.863711833953857, "global_step": 155562, "epoch": 3703} {"train_loss": -6.935991287231445, "global_step": 155563, "epoch": 3703} {"train_loss": -6.838096618652344, "global_step": 155564, "epoch": 3703} {"train_loss": -6.857585906982422, "global_step": 155565, "epoch": 3703} {"train_loss": -6.929341793060303, "global_step": 155566, "epoch": 3703} {"train_loss": -6.938663425899687, "global_step": 155567, "epoch": 3703, "val_loss": 78769.390625} {"train_loss": -6.886537075042725, "global_step": 155568, "epoch": 3704} {"train_loss": -6.9316606521606445, "global_step": 155569, "epoch": 3704} {"train_loss": -6.934927940368652, "global_step": 155570, "epoch": 3704} {"train_loss": -6.8680853843688965, "global_step": 155571, "epoch": 3704} {"train_loss": -6.940041542053223, "global_step": 155572, "epoch": 3704} {"train_loss": -6.963950157165527, "global_step": 155573, "epoch": 3704} {"train_loss": -6.833447456359863, "global_step": 155574, "epoch": 3704} {"train_loss": -6.859096527099609, "global_step": 155575, "epoch": 3704} {"train_loss": -6.916660785675049, "global_step": 155576, "epoch": 3704} {"train_loss": -6.926987648010254, "global_step": 155577, "epoch": 3704} {"train_loss": -6.979502201080322, "global_step": 155578, "epoch": 3704} {"train_loss": -6.911257266998291, "global_step": 155579, "epoch": 3704} {"train_loss": -6.887823104858398, "global_step": 155580, "epoch": 3704} {"train_loss": -6.854294776916504, "global_step": 155581, "epoch": 3704} {"train_loss": -6.850264549255371, "global_step": 155582, "epoch": 3704} {"train_loss": -6.9192094802856445, "global_step": 155583, "epoch": 3704} {"train_loss": -6.898680686950684, "global_step": 155584, "epoch": 3704} {"train_loss": -6.980353355407715, "global_step": 155585, "epoch": 3704} {"train_loss": -7.066317081451416, "global_step": 155586, "epoch": 3704} {"train_loss": -6.938355922698975, "global_step": 155587, "epoch": 3704} {"train_loss": -6.958763122558594, "global_step": 155588, "epoch": 3704} {"train_loss": -7.0164690017700195, "global_step": 155589, "epoch": 3704} {"train_loss": -6.901495933532715, "global_step": 155590, "epoch": 3704} {"train_loss": -7.083197593688965, "global_step": 155591, "epoch": 3704} {"train_loss": -6.907781600952148, "global_step": 155592, "epoch": 3704} {"train_loss": -6.8992815017700195, "global_step": 155593, "epoch": 3704} {"train_loss": -6.940976142883301, "global_step": 155594, "epoch": 3704} {"train_loss": -6.804775714874268, "global_step": 155595, "epoch": 3704} {"train_loss": -6.938544273376465, "global_step": 155596, "epoch": 3704} {"train_loss": -7.001828193664551, "global_step": 155597, "epoch": 3704} {"train_loss": -6.930601119995117, "global_step": 155598, "epoch": 3704} {"train_loss": -6.9314374923706055, "global_step": 155599, "epoch": 3704} {"train_loss": -6.993516445159912, "global_step": 155600, "epoch": 3704} {"train_loss": -6.815953254699707, "global_step": 155601, "epoch": 3704} {"train_loss": -6.808864593505859, "global_step": 155602, "epoch": 3704} {"train_loss": -6.914350509643555, "global_step": 155603, "epoch": 3704} {"train_loss": -6.851243495941162, "global_step": 155604, "epoch": 3704} {"train_loss": -6.963412761688232, "global_step": 155605, "epoch": 3704} {"train_loss": -6.942743301391602, "global_step": 155606, "epoch": 3704} {"train_loss": -7.076172828674316, "global_step": 155607, "epoch": 3704} {"train_loss": -6.921660423278809, "global_step": 155608, "epoch": 3704} {"train_loss": -6.928774572554088, "global_step": 155609, "epoch": 3704, "val_loss": 78935.7109375} {"train_loss": -7.002964973449707, "global_step": 155610, "epoch": 3705} {"train_loss": -7.028913497924805, "global_step": 155611, "epoch": 3705} {"train_loss": -7.061297416687012, "global_step": 155612, "epoch": 3705} {"train_loss": -7.018091201782227, "global_step": 155613, "epoch": 3705} {"train_loss": -6.8668365478515625, "global_step": 155614, "epoch": 3705} {"train_loss": -6.970151901245117, "global_step": 155615, "epoch": 3705} {"train_loss": -6.909526824951172, "global_step": 155616, "epoch": 3705} {"train_loss": -6.828695297241211, "global_step": 155617, "epoch": 3705} {"train_loss": -6.930069446563721, "global_step": 155618, "epoch": 3705} {"train_loss": -6.881446361541748, "global_step": 155619, "epoch": 3705} {"train_loss": -6.820173263549805, "global_step": 155620, "epoch": 3705} {"train_loss": -6.875198841094971, "global_step": 155621, "epoch": 3705} {"train_loss": -6.771529674530029, "global_step": 155622, "epoch": 3705} {"train_loss": -6.850030422210693, "global_step": 155623, "epoch": 3705} {"train_loss": -6.885395526885986, "global_step": 155624, "epoch": 3705} {"train_loss": -7.010556697845459, "global_step": 155625, "epoch": 3705} {"train_loss": -6.910252571105957, "global_step": 155626, "epoch": 3705} {"train_loss": -6.852446556091309, "global_step": 155627, "epoch": 3705} {"train_loss": -6.990407943725586, "global_step": 155628, "epoch": 3705} {"train_loss": -6.911191463470459, "global_step": 155629, "epoch": 3705} {"train_loss": -6.965975761413574, "global_step": 155630, "epoch": 3705} {"train_loss": -6.804924964904785, "global_step": 155631, "epoch": 3705} {"train_loss": -6.878408432006836, "global_step": 155632, "epoch": 3705} {"train_loss": -6.987454414367676, "global_step": 155633, "epoch": 3705} {"train_loss": -6.878450393676758, "global_step": 155634, "epoch": 3705} {"train_loss": -6.902527332305908, "global_step": 155635, "epoch": 3705} {"train_loss": -6.9175519943237305, "global_step": 155636, "epoch": 3705} {"train_loss": -6.959451675415039, "global_step": 155637, "epoch": 3705} {"train_loss": -6.995408058166504, "global_step": 155638, "epoch": 3705} {"train_loss": -7.0378828048706055, "global_step": 155639, "epoch": 3705} {"train_loss": -7.072043418884277, "global_step": 155640, "epoch": 3705} {"train_loss": -6.916308403015137, "global_step": 155641, "epoch": 3705} {"train_loss": -6.918377876281738, "global_step": 155642, "epoch": 3705} {"train_loss": -6.953002452850342, "global_step": 155643, "epoch": 3705} {"train_loss": -6.8558030128479, "global_step": 155644, "epoch": 3705} {"train_loss": -7.031623840332031, "global_step": 155645, "epoch": 3705} {"train_loss": -6.950435638427734, "global_step": 155646, "epoch": 3705} {"train_loss": -6.825446128845215, "global_step": 155647, "epoch": 3705} {"train_loss": -6.817124366760254, "global_step": 155648, "epoch": 3705} {"train_loss": -6.871768474578857, "global_step": 155649, "epoch": 3705} {"train_loss": -6.9224066734313965, "global_step": 155650, "epoch": 3705} {"train_loss": -6.924068053563436, "global_step": 155651, "epoch": 3705, "val_loss": 79052.921875} {"train_loss": -6.786881446838379, "global_step": 155652, "epoch": 3706} {"train_loss": -6.821247100830078, "global_step": 155653, "epoch": 3706} {"train_loss": -6.767879486083984, "global_step": 155654, "epoch": 3706} {"train_loss": -6.826420783996582, "global_step": 155655, "epoch": 3706} {"train_loss": -6.916375160217285, "global_step": 155656, "epoch": 3706} {"train_loss": -7.005343914031982, "global_step": 155657, "epoch": 3706} {"train_loss": -6.9342546463012695, "global_step": 155658, "epoch": 3706} {"train_loss": -6.9491472244262695, "global_step": 155659, "epoch": 3706} {"train_loss": -6.91283655166626, "global_step": 155660, "epoch": 3706} {"train_loss": -6.913442611694336, "global_step": 155661, "epoch": 3706} {"train_loss": -6.776561737060547, "global_step": 155662, "epoch": 3706} {"train_loss": -6.895207405090332, "global_step": 155663, "epoch": 3706} {"train_loss": -6.967491149902344, "global_step": 155664, "epoch": 3706} {"train_loss": -6.960170745849609, "global_step": 155665, "epoch": 3706} {"train_loss": -6.935500621795654, "global_step": 155666, "epoch": 3706} {"train_loss": -6.9843831062316895, "global_step": 155667, "epoch": 3706} {"train_loss": -6.957781791687012, "global_step": 155668, "epoch": 3706} {"train_loss": -6.940356731414795, "global_step": 155669, "epoch": 3706} {"train_loss": -6.934969902038574, "global_step": 155670, "epoch": 3706} {"train_loss": -6.899206161499023, "global_step": 155671, "epoch": 3706} {"train_loss": -6.985040664672852, "global_step": 155672, "epoch": 3706} {"train_loss": -6.9075775146484375, "global_step": 155673, "epoch": 3706} {"train_loss": -6.926273822784424, "global_step": 155674, "epoch": 3706} {"train_loss": -6.828345775604248, "global_step": 155675, "epoch": 3706} {"train_loss": -6.885249137878418, "global_step": 155676, "epoch": 3706} {"train_loss": -6.90804386138916, "global_step": 155677, "epoch": 3706} {"train_loss": -7.050045013427734, "global_step": 155678, "epoch": 3706} {"train_loss": -6.678874969482422, "global_step": 155679, "epoch": 3706} {"train_loss": -6.93635368347168, "global_step": 155680, "epoch": 3706} {"train_loss": -6.933043479919434, "global_step": 155681, "epoch": 3706} {"train_loss": -6.747476100921631, "global_step": 155682, "epoch": 3706} {"train_loss": -6.901336669921875, "global_step": 155683, "epoch": 3706} {"train_loss": -6.83124303817749, "global_step": 155684, "epoch": 3706} {"train_loss": -6.7898101806640625, "global_step": 155685, "epoch": 3706} {"train_loss": -6.942622184753418, "global_step": 155686, "epoch": 3706} {"train_loss": -6.865272045135498, "global_step": 155687, "epoch": 3706} {"train_loss": -6.775972366333008, "global_step": 155688, "epoch": 3706} {"train_loss": -6.909493446350098, "global_step": 155689, "epoch": 3706} {"train_loss": -6.905995845794678, "global_step": 155690, "epoch": 3706} {"train_loss": -6.927881240844727, "global_step": 155691, "epoch": 3706} {"train_loss": -6.822641372680664, "global_step": 155692, "epoch": 3706} {"train_loss": -6.891099850336711, "global_step": 155693, "epoch": 3706, "val_loss": 79332.4609375} {"train_loss": -6.9656219482421875, "global_step": 155694, "epoch": 3707} {"train_loss": -6.900542736053467, "global_step": 155695, "epoch": 3707} {"train_loss": -6.89755916595459, "global_step": 155696, "epoch": 3707} {"train_loss": -6.973681926727295, "global_step": 155697, "epoch": 3707} {"train_loss": -6.8844757080078125, "global_step": 155698, "epoch": 3707} {"train_loss": -6.936420440673828, "global_step": 155699, "epoch": 3707} {"train_loss": -6.955840110778809, "global_step": 155700, "epoch": 3707} {"train_loss": -6.981442451477051, "global_step": 155701, "epoch": 3707} {"train_loss": -6.851731300354004, "global_step": 155702, "epoch": 3707} {"train_loss": -6.838468551635742, "global_step": 155703, "epoch": 3707} {"train_loss": -6.8628716468811035, "global_step": 155704, "epoch": 3707} {"train_loss": -6.964008331298828, "global_step": 155705, "epoch": 3707} {"train_loss": -7.064558982849121, "global_step": 155706, "epoch": 3707} {"train_loss": -6.884709358215332, "global_step": 155707, "epoch": 3707} {"train_loss": -7.066246032714844, "global_step": 155708, "epoch": 3707} {"train_loss": -6.960941314697266, "global_step": 155709, "epoch": 3707} {"train_loss": -6.882009506225586, "global_step": 155710, "epoch": 3707} {"train_loss": -6.951297283172607, "global_step": 155711, "epoch": 3707} {"train_loss": -7.0201263427734375, "global_step": 155712, "epoch": 3707} {"train_loss": -6.957294464111328, "global_step": 155713, "epoch": 3707} {"train_loss": -7.008700370788574, "global_step": 155714, "epoch": 3707} {"train_loss": -7.01537561416626, "global_step": 155715, "epoch": 3707} {"train_loss": -7.106881141662598, "global_step": 155716, "epoch": 3707} {"train_loss": -7.049452304840088, "global_step": 155717, "epoch": 3707} {"train_loss": -6.972815036773682, "global_step": 155718, "epoch": 3707} {"train_loss": -6.975788116455078, "global_step": 155719, "epoch": 3707} {"train_loss": -6.920237064361572, "global_step": 155720, "epoch": 3707} {"train_loss": -6.883831024169922, "global_step": 155721, "epoch": 3707} {"train_loss": -6.922397136688232, "global_step": 155722, "epoch": 3707} {"train_loss": -6.8704447746276855, "global_step": 155723, "epoch": 3707} {"train_loss": -6.784076690673828, "global_step": 155724, "epoch": 3707} {"train_loss": -6.881683826446533, "global_step": 155725, "epoch": 3707} {"train_loss": -6.865410327911377, "global_step": 155726, "epoch": 3707} {"train_loss": -6.8819122314453125, "global_step": 155727, "epoch": 3707} {"train_loss": -6.715353012084961, "global_step": 155728, "epoch": 3707} {"train_loss": -6.891441822052002, "global_step": 155729, "epoch": 3707} {"train_loss": -6.8406877517700195, "global_step": 155730, "epoch": 3707} {"train_loss": -6.756830215454102, "global_step": 155731, "epoch": 3707} {"train_loss": -6.802581310272217, "global_step": 155732, "epoch": 3707} {"train_loss": -6.802386283874512, "global_step": 155733, "epoch": 3707} {"train_loss": -6.869688034057617, "global_step": 155734, "epoch": 3707} {"train_loss": -6.918082055591402, "global_step": 155735, "epoch": 3707, "val_loss": 78867.984375} {"train_loss": -6.796168327331543, "global_step": 155736, "epoch": 3708} {"train_loss": -6.7502264976501465, "global_step": 155737, "epoch": 3708} {"train_loss": -6.852759838104248, "global_step": 155738, "epoch": 3708} {"train_loss": -6.912801742553711, "global_step": 155739, "epoch": 3708} {"train_loss": -6.815298080444336, "global_step": 155740, "epoch": 3708} {"train_loss": -6.8347649574279785, "global_step": 155741, "epoch": 3708} {"train_loss": -6.952415466308594, "global_step": 155742, "epoch": 3708} {"train_loss": -6.854653358459473, "global_step": 155743, "epoch": 3708} {"train_loss": -6.7599077224731445, "global_step": 155744, "epoch": 3708} {"train_loss": -6.787158012390137, "global_step": 155745, "epoch": 3708} {"train_loss": -6.812504291534424, "global_step": 155746, "epoch": 3708} {"train_loss": -6.764303207397461, "global_step": 155747, "epoch": 3708} {"train_loss": -6.984610557556152, "global_step": 155748, "epoch": 3708} {"train_loss": -6.809122085571289, "global_step": 155749, "epoch": 3708} {"train_loss": -6.886200904846191, "global_step": 155750, "epoch": 3708} {"train_loss": -6.817967414855957, "global_step": 155751, "epoch": 3708} {"train_loss": -6.857895851135254, "global_step": 155752, "epoch": 3708} {"train_loss": -6.908143520355225, "global_step": 155753, "epoch": 3708} {"train_loss": -6.886099815368652, "global_step": 155754, "epoch": 3708} {"train_loss": -6.844287872314453, "global_step": 155755, "epoch": 3708} {"train_loss": -6.76390266418457, "global_step": 155756, "epoch": 3708} {"train_loss": -6.8859100341796875, "global_step": 155757, "epoch": 3708} {"train_loss": -6.845089912414551, "global_step": 155758, "epoch": 3708} {"train_loss": -6.877510070800781, "global_step": 155759, "epoch": 3708} {"train_loss": -6.855224132537842, "global_step": 155760, "epoch": 3708} {"train_loss": -6.962160110473633, "global_step": 155761, "epoch": 3708} {"train_loss": -6.988630771636963, "global_step": 155762, "epoch": 3708} {"train_loss": -6.858105659484863, "global_step": 155763, "epoch": 3708} {"train_loss": -6.9166975021362305, "global_step": 155764, "epoch": 3708} {"train_loss": -6.997945308685303, "global_step": 155765, "epoch": 3708} {"train_loss": -6.936459541320801, "global_step": 155766, "epoch": 3708} {"train_loss": -6.848676681518555, "global_step": 155767, "epoch": 3708} {"train_loss": -6.871350288391113, "global_step": 155768, "epoch": 3708} {"train_loss": -6.852705955505371, "global_step": 155769, "epoch": 3708} {"train_loss": -6.905986785888672, "global_step": 155770, "epoch": 3708} {"train_loss": -6.861220359802246, "global_step": 155771, "epoch": 3708} {"train_loss": -6.9827423095703125, "global_step": 155772, "epoch": 3708} {"train_loss": -6.848505020141602, "global_step": 155773, "epoch": 3708} {"train_loss": -6.95785665512085, "global_step": 155774, "epoch": 3708} {"train_loss": -7.045055389404297, "global_step": 155775, "epoch": 3708} {"train_loss": -6.943859100341797, "global_step": 155776, "epoch": 3708} {"train_loss": -6.875312930061703, "global_step": 155777, "epoch": 3708, "val_loss": 78807.53125} {"train_loss": -6.958925247192383, "global_step": 155778, "epoch": 3709} {"train_loss": -6.929251670837402, "global_step": 155779, "epoch": 3709} {"train_loss": -6.895756721496582, "global_step": 155780, "epoch": 3709} {"train_loss": -6.958163261413574, "global_step": 155781, "epoch": 3709} {"train_loss": -6.9436187744140625, "global_step": 155782, "epoch": 3709} {"train_loss": -6.950242042541504, "global_step": 155783, "epoch": 3709} {"train_loss": -6.951473236083984, "global_step": 155784, "epoch": 3709} {"train_loss": -6.93805456161499, "global_step": 155785, "epoch": 3709} {"train_loss": -6.88817834854126, "global_step": 155786, "epoch": 3709} {"train_loss": -6.877459526062012, "global_step": 155787, "epoch": 3709} {"train_loss": -6.809613227844238, "global_step": 155788, "epoch": 3709} {"train_loss": -7.024747371673584, "global_step": 155789, "epoch": 3709} {"train_loss": -6.885272026062012, "global_step": 155790, "epoch": 3709} {"train_loss": -6.709691524505615, "global_step": 155791, "epoch": 3709} {"train_loss": -6.92159366607666, "global_step": 155792, "epoch": 3709} {"train_loss": -7.07463264465332, "global_step": 155793, "epoch": 3709} {"train_loss": -6.839892864227295, "global_step": 155794, "epoch": 3709} {"train_loss": -6.941773414611816, "global_step": 155795, "epoch": 3709} {"train_loss": -6.878208160400391, "global_step": 155796, "epoch": 3709} {"train_loss": -6.851295471191406, "global_step": 155797, "epoch": 3709} {"train_loss": -6.9670209884643555, "global_step": 155798, "epoch": 3709} {"train_loss": -6.88301944732666, "global_step": 155799, "epoch": 3709} {"train_loss": -6.795979976654053, "global_step": 155800, "epoch": 3709} {"train_loss": -6.807056427001953, "global_step": 155801, "epoch": 3709} {"train_loss": -6.808200836181641, "global_step": 155802, "epoch": 3709} {"train_loss": -6.82310676574707, "global_step": 155803, "epoch": 3709} {"train_loss": -6.908012866973877, "global_step": 155804, "epoch": 3709} {"train_loss": -7.012025833129883, "global_step": 155805, "epoch": 3709} {"train_loss": -6.894870281219482, "global_step": 155806, "epoch": 3709} {"train_loss": -6.884279251098633, "global_step": 155807, "epoch": 3709} {"train_loss": -6.923492431640625, "global_step": 155808, "epoch": 3709} {"train_loss": -6.928353309631348, "global_step": 155809, "epoch": 3709} {"train_loss": -6.915700912475586, "global_step": 155810, "epoch": 3709} {"train_loss": -6.930248260498047, "global_step": 155811, "epoch": 3709} {"train_loss": -6.978267192840576, "global_step": 155812, "epoch": 3709} {"train_loss": -6.842496871948242, "global_step": 155813, "epoch": 3709} {"train_loss": -6.993072509765625, "global_step": 155814, "epoch": 3709} {"train_loss": -6.8695783615112305, "global_step": 155815, "epoch": 3709} {"train_loss": -6.895934104919434, "global_step": 155816, "epoch": 3709} {"train_loss": -6.841458320617676, "global_step": 155817, "epoch": 3709} {"train_loss": -7.009194850921631, "global_step": 155818, "epoch": 3709} {"train_loss": -6.90377384140378, "global_step": 155819, "epoch": 3709, "val_loss": 78944.0078125} {"train_loss": -6.897027015686035, "global_step": 155820, "epoch": 3710} {"train_loss": -6.7698588371276855, "global_step": 155821, "epoch": 3710} {"train_loss": -6.939996242523193, "global_step": 155822, "epoch": 3710} {"train_loss": -6.960615158081055, "global_step": 155823, "epoch": 3710} {"train_loss": -6.922564506530762, "global_step": 155824, "epoch": 3710} {"train_loss": -6.8314971923828125, "global_step": 155825, "epoch": 3710} {"train_loss": -6.850947380065918, "global_step": 155826, "epoch": 3710} {"train_loss": -6.884265899658203, "global_step": 155827, "epoch": 3710} {"train_loss": -6.925089359283447, "global_step": 155828, "epoch": 3710} {"train_loss": -7.007357597351074, "global_step": 155829, "epoch": 3710} {"train_loss": -6.909632682800293, "global_step": 155830, "epoch": 3710} {"train_loss": -6.9432196617126465, "global_step": 155831, "epoch": 3710} {"train_loss": -6.873865127563477, "global_step": 155832, "epoch": 3710} {"train_loss": -6.948984622955322, "global_step": 155833, "epoch": 3710} {"train_loss": -6.95555305480957, "global_step": 155834, "epoch": 3710} {"train_loss": -6.957518100738525, "global_step": 155835, "epoch": 3710} {"train_loss": -6.879418849945068, "global_step": 155836, "epoch": 3710} {"train_loss": -6.923272132873535, "global_step": 155837, "epoch": 3710} {"train_loss": -7.030864238739014, "global_step": 155838, "epoch": 3710} {"train_loss": -6.852047443389893, "global_step": 155839, "epoch": 3710} {"train_loss": -6.927842140197754, "global_step": 155840, "epoch": 3710} {"train_loss": -6.966477870941162, "global_step": 155841, "epoch": 3710} {"train_loss": -6.8675713539123535, "global_step": 155842, "epoch": 3710} {"train_loss": -6.956600189208984, "global_step": 155843, "epoch": 3710} {"train_loss": -6.911454200744629, "global_step": 155844, "epoch": 3710} {"train_loss": -6.910813331604004, "global_step": 155845, "epoch": 3710} {"train_loss": -6.710636615753174, "global_step": 155846, "epoch": 3710} {"train_loss": -6.859255313873291, "global_step": 155847, "epoch": 3710} {"train_loss": -6.951960563659668, "global_step": 155848, "epoch": 3710} {"train_loss": -6.867769241333008, "global_step": 155849, "epoch": 3710} {"train_loss": -7.013334274291992, "global_step": 155850, "epoch": 3710} {"train_loss": -6.957550048828125, "global_step": 155851, "epoch": 3710} {"train_loss": -6.922473907470703, "global_step": 155852, "epoch": 3710} {"train_loss": -7.029173374176025, "global_step": 155853, "epoch": 3710} {"train_loss": -6.806690216064453, "global_step": 155854, "epoch": 3710} {"train_loss": -6.9475579261779785, "global_step": 155855, "epoch": 3710} {"train_loss": -6.854128837585449, "global_step": 155856, "epoch": 3710} {"train_loss": -6.921175956726074, "global_step": 155857, "epoch": 3710} {"train_loss": -6.997316837310791, "global_step": 155858, "epoch": 3710} {"train_loss": -6.928361892700195, "global_step": 155859, "epoch": 3710} {"train_loss": -6.93228816986084, "global_step": 155860, "epoch": 3710} {"train_loss": -6.915896699542091, "global_step": 155861, "epoch": 3710, "val_loss": 79122.578125} {"train_loss": -6.865135192871094, "global_step": 155862, "epoch": 3711} {"train_loss": -7.021047592163086, "global_step": 155863, "epoch": 3711} {"train_loss": -7.022908687591553, "global_step": 155864, "epoch": 3711} {"train_loss": -6.986385345458984, "global_step": 155865, "epoch": 3711} {"train_loss": -7.018675804138184, "global_step": 155866, "epoch": 3711} {"train_loss": -6.95107364654541, "global_step": 155867, "epoch": 3711} {"train_loss": -6.951865196228027, "global_step": 155868, "epoch": 3711} {"train_loss": -6.926845550537109, "global_step": 155869, "epoch": 3711} {"train_loss": -6.987320423126221, "global_step": 155870, "epoch": 3711} {"train_loss": -7.081565856933594, "global_step": 155871, "epoch": 3711} {"train_loss": -7.060217380523682, "global_step": 155872, "epoch": 3711} {"train_loss": -7.008623123168945, "global_step": 155873, "epoch": 3711} {"train_loss": -7.054381847381592, "global_step": 155874, "epoch": 3711} {"train_loss": -6.941920280456543, "global_step": 155875, "epoch": 3711} {"train_loss": -6.973876476287842, "global_step": 155876, "epoch": 3711} {"train_loss": -6.848115921020508, "global_step": 155877, "epoch": 3711} {"train_loss": -6.879774570465088, "global_step": 155878, "epoch": 3711} {"train_loss": -6.873022079467773, "global_step": 155879, "epoch": 3711} {"train_loss": -6.870588302612305, "global_step": 155880, "epoch": 3711} {"train_loss": -6.880711555480957, "global_step": 155881, "epoch": 3711} {"train_loss": -6.891223907470703, "global_step": 155882, "epoch": 3711} {"train_loss": -6.752749443054199, "global_step": 155883, "epoch": 3711} {"train_loss": -6.954963684082031, "global_step": 155884, "epoch": 3711} {"train_loss": -6.852845191955566, "global_step": 155885, "epoch": 3711} {"train_loss": -6.911186218261719, "global_step": 155886, "epoch": 3711} {"train_loss": -6.9856133460998535, "global_step": 155887, "epoch": 3711} {"train_loss": -6.997689247131348, "global_step": 155888, "epoch": 3711} {"train_loss": -6.834053993225098, "global_step": 155889, "epoch": 3711} {"train_loss": -6.913235187530518, "global_step": 155890, "epoch": 3711} {"train_loss": -6.979190826416016, "global_step": 155891, "epoch": 3711} {"train_loss": -6.925839900970459, "global_step": 155892, "epoch": 3711} {"train_loss": -6.878086566925049, "global_step": 155893, "epoch": 3711} {"train_loss": -6.891082763671875, "global_step": 155894, "epoch": 3711} {"train_loss": -6.856396198272705, "global_step": 155895, "epoch": 3711} {"train_loss": -6.932980537414551, "global_step": 155896, "epoch": 3711} {"train_loss": -6.806741714477539, "global_step": 155897, "epoch": 3711} {"train_loss": -6.950597286224365, "global_step": 155898, "epoch": 3711} {"train_loss": -6.8104047775268555, "global_step": 155899, "epoch": 3711} {"train_loss": -6.974399566650391, "global_step": 155900, "epoch": 3711} {"train_loss": -6.893547534942627, "global_step": 155901, "epoch": 3711} {"train_loss": -6.877110481262207, "global_step": 155902, "epoch": 3711} {"train_loss": -6.92772558757237, "global_step": 155903, "epoch": 3711, "val_loss": 78971.0390625} {"train_loss": -6.915850639343262, "global_step": 155904, "epoch": 3712} {"train_loss": -6.886816501617432, "global_step": 155905, "epoch": 3712} {"train_loss": -6.765684127807617, "global_step": 155906, "epoch": 3712} {"train_loss": -6.808208465576172, "global_step": 155907, "epoch": 3712} {"train_loss": -6.905941486358643, "global_step": 155908, "epoch": 3712} {"train_loss": -6.779455184936523, "global_step": 155909, "epoch": 3712} {"train_loss": -6.87961483001709, "global_step": 155910, "epoch": 3712} {"train_loss": -6.989030838012695, "global_step": 155911, "epoch": 3712} {"train_loss": -6.779971599578857, "global_step": 155912, "epoch": 3712} {"train_loss": -6.885144233703613, "global_step": 155913, "epoch": 3712} {"train_loss": -6.962791442871094, "global_step": 155914, "epoch": 3712} {"train_loss": -6.919002532958984, "global_step": 155915, "epoch": 3712} {"train_loss": -6.86886739730835, "global_step": 155916, "epoch": 3712} {"train_loss": -6.879568099975586, "global_step": 155917, "epoch": 3712} {"train_loss": -6.7349443435668945, "global_step": 155918, "epoch": 3712} {"train_loss": -6.9098968505859375, "global_step": 155919, "epoch": 3712} {"train_loss": -6.951250076293945, "global_step": 155920, "epoch": 3712} {"train_loss": -6.830471992492676, "global_step": 155921, "epoch": 3712} {"train_loss": -6.886618614196777, "global_step": 155922, "epoch": 3712} {"train_loss": -6.805668830871582, "global_step": 155923, "epoch": 3712} {"train_loss": -7.005863189697266, "global_step": 155924, "epoch": 3712} {"train_loss": -7.025609970092773, "global_step": 155925, "epoch": 3712} {"train_loss": -7.041817665100098, "global_step": 155926, "epoch": 3712} {"train_loss": -6.976162910461426, "global_step": 155927, "epoch": 3712} {"train_loss": -6.891799449920654, "global_step": 155928, "epoch": 3712} {"train_loss": -7.012683868408203, "global_step": 155929, "epoch": 3712} {"train_loss": -6.9242095947265625, "global_step": 155930, "epoch": 3712} {"train_loss": -6.9440813064575195, "global_step": 155931, "epoch": 3712} {"train_loss": -6.920620441436768, "global_step": 155932, "epoch": 3712} {"train_loss": -6.9099555015563965, "global_step": 155933, "epoch": 3712} {"train_loss": -6.969993591308594, "global_step": 155934, "epoch": 3712} {"train_loss": -6.8955559730529785, "global_step": 155935, "epoch": 3712} {"train_loss": -6.937946796417236, "global_step": 155936, "epoch": 3712} {"train_loss": -7.038392066955566, "global_step": 155937, "epoch": 3712} {"train_loss": -6.856395721435547, "global_step": 155938, "epoch": 3712} {"train_loss": -6.785316467285156, "global_step": 155939, "epoch": 3712} {"train_loss": -6.794957160949707, "global_step": 155940, "epoch": 3712} {"train_loss": -6.944821357727051, "global_step": 155941, "epoch": 3712} {"train_loss": -6.771065711975098, "global_step": 155942, "epoch": 3712} {"train_loss": -6.848118305206299, "global_step": 155943, "epoch": 3712} {"train_loss": -6.925769329071045, "global_step": 155944, "epoch": 3712} {"train_loss": -6.894629240036011, "global_step": 155945, "epoch": 3712, "val_loss": 79288.265625} {"train_loss": -6.84649658203125, "global_step": 155946, "epoch": 3713} {"train_loss": -6.998952388763428, "global_step": 155947, "epoch": 3713} {"train_loss": -6.9174299240112305, "global_step": 155948, "epoch": 3713} {"train_loss": -6.927305221557617, "global_step": 155949, "epoch": 3713} {"train_loss": -6.832130432128906, "global_step": 155950, "epoch": 3713} {"train_loss": -6.883800983428955, "global_step": 155951, "epoch": 3713} {"train_loss": -6.81143856048584, "global_step": 155952, "epoch": 3713} {"train_loss": -6.9323930740356445, "global_step": 155953, "epoch": 3713} {"train_loss": -6.918424129486084, "global_step": 155954, "epoch": 3713} {"train_loss": -6.8385467529296875, "global_step": 155955, "epoch": 3713} {"train_loss": -6.846203804016113, "global_step": 155956, "epoch": 3713} {"train_loss": -6.929948806762695, "global_step": 155957, "epoch": 3713} {"train_loss": -6.860262870788574, "global_step": 155958, "epoch": 3713} {"train_loss": -7.000017166137695, "global_step": 155959, "epoch": 3713} {"train_loss": -6.895935535430908, "global_step": 155960, "epoch": 3713} {"train_loss": -6.983225345611572, "global_step": 155961, "epoch": 3713} {"train_loss": -6.8880109786987305, "global_step": 155962, "epoch": 3713} {"train_loss": -6.875370979309082, "global_step": 155963, "epoch": 3713} {"train_loss": -6.871604919433594, "global_step": 155964, "epoch": 3713} {"train_loss": -6.859619140625, "global_step": 155965, "epoch": 3713} {"train_loss": -6.910033702850342, "global_step": 155966, "epoch": 3713} {"train_loss": -6.701266288757324, "global_step": 155967, "epoch": 3713} {"train_loss": -6.781459808349609, "global_step": 155968, "epoch": 3713} {"train_loss": -6.89077091217041, "global_step": 155969, "epoch": 3713} {"train_loss": -6.735783576965332, "global_step": 155970, "epoch": 3713} {"train_loss": -6.981430530548096, "global_step": 155971, "epoch": 3713} {"train_loss": -6.709750175476074, "global_step": 155972, "epoch": 3713} {"train_loss": -6.7241106033325195, "global_step": 155973, "epoch": 3713} {"train_loss": -6.891395568847656, "global_step": 155974, "epoch": 3713} {"train_loss": -6.9307122230529785, "global_step": 155975, "epoch": 3713} {"train_loss": -6.770920753479004, "global_step": 155976, "epoch": 3713} {"train_loss": -6.761408805847168, "global_step": 155977, "epoch": 3713} {"train_loss": -6.82517671585083, "global_step": 155978, "epoch": 3713} {"train_loss": -6.876439571380615, "global_step": 155979, "epoch": 3713} {"train_loss": -6.904722213745117, "global_step": 155980, "epoch": 3713} {"train_loss": -6.825283050537109, "global_step": 155981, "epoch": 3713} {"train_loss": -6.790626525878906, "global_step": 155982, "epoch": 3713} {"train_loss": -6.872790813446045, "global_step": 155983, "epoch": 3713} {"train_loss": -6.741533279418945, "global_step": 155984, "epoch": 3713} {"train_loss": -6.896938323974609, "global_step": 155985, "epoch": 3713} {"train_loss": -6.880112648010254, "global_step": 155986, "epoch": 3713} {"train_loss": -6.861102524257841, "global_step": 155987, "epoch": 3713, "val_loss": 79311.5546875} {"train_loss": -6.822992324829102, "global_step": 155988, "epoch": 3714} {"train_loss": -6.954030990600586, "global_step": 155989, "epoch": 3714} {"train_loss": -6.876432418823242, "global_step": 155990, "epoch": 3714} {"train_loss": -6.904510498046875, "global_step": 155991, "epoch": 3714} {"train_loss": -6.904651641845703, "global_step": 155992, "epoch": 3714} {"train_loss": -6.806667327880859, "global_step": 155993, "epoch": 3714} {"train_loss": -7.00139045715332, "global_step": 155994, "epoch": 3714} {"train_loss": -6.892662048339844, "global_step": 155995, "epoch": 3714} {"train_loss": -6.8520731925964355, "global_step": 155996, "epoch": 3714} {"train_loss": -6.9790802001953125, "global_step": 155997, "epoch": 3714} {"train_loss": -7.005609512329102, "global_step": 155998, "epoch": 3714} {"train_loss": -6.8631744384765625, "global_step": 155999, "epoch": 3714} {"train_loss": -6.899412631988525, "global_step": 156000, "epoch": 3714} {"train_loss": -6.982752799987793, "global_step": 156001, "epoch": 3714} {"train_loss": -6.8374810218811035, "global_step": 156002, "epoch": 3714} {"train_loss": -7.024844169616699, "global_step": 156003, "epoch": 3714} {"train_loss": -6.879537582397461, "global_step": 156004, "epoch": 3714} {"train_loss": -6.867834568023682, "global_step": 156005, "epoch": 3714} {"train_loss": -6.751540184020996, "global_step": 156006, "epoch": 3714} {"train_loss": -6.768430709838867, "global_step": 156007, "epoch": 3714} {"train_loss": -6.87123441696167, "global_step": 156008, "epoch": 3714} {"train_loss": -6.946540832519531, "global_step": 156009, "epoch": 3714} {"train_loss": -6.856941223144531, "global_step": 156010, "epoch": 3714} {"train_loss": -6.751500129699707, "global_step": 156011, "epoch": 3714} {"train_loss": -6.888721942901611, "global_step": 156012, "epoch": 3714} {"train_loss": -6.6641845703125, "global_step": 156013, "epoch": 3714} {"train_loss": -6.807028770446777, "global_step": 156014, "epoch": 3714} {"train_loss": -6.8804450035095215, "global_step": 156015, "epoch": 3714} {"train_loss": -6.8939127922058105, "global_step": 156016, "epoch": 3714} {"train_loss": -6.724789619445801, "global_step": 156017, "epoch": 3714} {"train_loss": -6.782623291015625, "global_step": 156018, "epoch": 3714} {"train_loss": -6.829577922821045, "global_step": 156019, "epoch": 3714} {"train_loss": -6.733578681945801, "global_step": 156020, "epoch": 3714} {"train_loss": -6.789473533630371, "global_step": 156021, "epoch": 3714} {"train_loss": -6.868973731994629, "global_step": 156022, "epoch": 3714} {"train_loss": -6.835843086242676, "global_step": 156023, "epoch": 3714} {"train_loss": -6.831984519958496, "global_step": 156024, "epoch": 3714} {"train_loss": -6.802389144897461, "global_step": 156025, "epoch": 3714} {"train_loss": -6.807364463806152, "global_step": 156026, "epoch": 3714} {"train_loss": -6.9049577713012695, "global_step": 156027, "epoch": 3714} {"train_loss": -6.793858051300049, "global_step": 156028, "epoch": 3714} {"train_loss": -6.856478305090041, "global_step": 156029, "epoch": 3714, "val_loss": 78880.984375} {"train_loss": -6.956391334533691, "global_step": 156030, "epoch": 3715} {"train_loss": -6.887988567352295, "global_step": 156031, "epoch": 3715} {"train_loss": -6.861719131469727, "global_step": 156032, "epoch": 3715} {"train_loss": -6.864162445068359, "global_step": 156033, "epoch": 3715} {"train_loss": -6.760037422180176, "global_step": 156034, "epoch": 3715} {"train_loss": -6.885557651519775, "global_step": 156035, "epoch": 3715} {"train_loss": -6.976371765136719, "global_step": 156036, "epoch": 3715} {"train_loss": -6.862573623657227, "global_step": 156037, "epoch": 3715} {"train_loss": -6.928745269775391, "global_step": 156038, "epoch": 3715} {"train_loss": -6.9068193435668945, "global_step": 156039, "epoch": 3715} {"train_loss": -6.8800859451293945, "global_step": 156040, "epoch": 3715} {"train_loss": -6.979244232177734, "global_step": 156041, "epoch": 3715} {"train_loss": -6.963858604431152, "global_step": 156042, "epoch": 3715} {"train_loss": -6.999820709228516, "global_step": 156043, "epoch": 3715} {"train_loss": -6.933486461639404, "global_step": 156044, "epoch": 3715} {"train_loss": -6.948326110839844, "global_step": 156045, "epoch": 3715} {"train_loss": -6.94493293762207, "global_step": 156046, "epoch": 3715} {"train_loss": -7.079491138458252, "global_step": 156047, "epoch": 3715} {"train_loss": -6.923288345336914, "global_step": 156048, "epoch": 3715} {"train_loss": -6.949853897094727, "global_step": 156049, "epoch": 3715} {"train_loss": -6.968270301818848, "global_step": 156050, "epoch": 3715} {"train_loss": -6.913349628448486, "global_step": 156051, "epoch": 3715} {"train_loss": -6.9615678787231445, "global_step": 156052, "epoch": 3715} {"train_loss": -7.0093231201171875, "global_step": 156053, "epoch": 3715} {"train_loss": -6.927539825439453, "global_step": 156054, "epoch": 3715} {"train_loss": -6.89784049987793, "global_step": 156055, "epoch": 3715} {"train_loss": -7.033030986785889, "global_step": 156056, "epoch": 3715} {"train_loss": -6.871923446655273, "global_step": 156057, "epoch": 3715} {"train_loss": -6.885886192321777, "global_step": 156058, "epoch": 3715} {"train_loss": -6.946881294250488, "global_step": 156059, "epoch": 3715} {"train_loss": -6.931103229522705, "global_step": 156060, "epoch": 3715} {"train_loss": -7.0139899253845215, "global_step": 156061, "epoch": 3715} {"train_loss": -6.894265174865723, "global_step": 156062, "epoch": 3715} {"train_loss": -6.909814357757568, "global_step": 156063, "epoch": 3715} {"train_loss": -6.987639904022217, "global_step": 156064, "epoch": 3715} {"train_loss": -6.922661781311035, "global_step": 156065, "epoch": 3715} {"train_loss": -6.921187877655029, "global_step": 156066, "epoch": 3715} {"train_loss": -6.942745208740234, "global_step": 156067, "epoch": 3715} {"train_loss": -6.768582344055176, "global_step": 156068, "epoch": 3715} {"train_loss": -7.018017768859863, "global_step": 156069, "epoch": 3715} {"train_loss": -6.924890518188477, "global_step": 156070, "epoch": 3715} {"train_loss": -6.930393684478033, "global_step": 156071, "epoch": 3715, "val_loss": 79165.6640625} {"train_loss": -6.985008716583252, "global_step": 156072, "epoch": 3716} {"train_loss": -6.866023063659668, "global_step": 156073, "epoch": 3716} {"train_loss": -6.8517656326293945, "global_step": 156074, "epoch": 3716} {"train_loss": -7.0289154052734375, "global_step": 156075, "epoch": 3716} {"train_loss": -6.918048858642578, "global_step": 156076, "epoch": 3716} {"train_loss": -6.9425153732299805, "global_step": 156077, "epoch": 3716} {"train_loss": -6.910185813903809, "global_step": 156078, "epoch": 3716} {"train_loss": -6.960184097290039, "global_step": 156079, "epoch": 3716} {"train_loss": -7.045722961425781, "global_step": 156080, "epoch": 3716} {"train_loss": -6.92808723449707, "global_step": 156081, "epoch": 3716} {"train_loss": -6.9216461181640625, "global_step": 156082, "epoch": 3716} {"train_loss": -6.9097065925598145, "global_step": 156083, "epoch": 3716} {"train_loss": -6.930979251861572, "global_step": 156084, "epoch": 3716} {"train_loss": -6.910641670227051, "global_step": 156085, "epoch": 3716} {"train_loss": -6.895285129547119, "global_step": 156086, "epoch": 3716} {"train_loss": -6.953773498535156, "global_step": 156087, "epoch": 3716} {"train_loss": -6.916217803955078, "global_step": 156088, "epoch": 3716} {"train_loss": -6.897541522979736, "global_step": 156089, "epoch": 3716} {"train_loss": -7.046401500701904, "global_step": 156090, "epoch": 3716} {"train_loss": -6.8975419998168945, "global_step": 156091, "epoch": 3716} {"train_loss": -7.0201239585876465, "global_step": 156092, "epoch": 3716} {"train_loss": -6.885082244873047, "global_step": 156093, "epoch": 3716} {"train_loss": -6.89902925491333, "global_step": 156094, "epoch": 3716} {"train_loss": -6.869699954986572, "global_step": 156095, "epoch": 3716} {"train_loss": -6.928213596343994, "global_step": 156096, "epoch": 3716} {"train_loss": -6.867861747741699, "global_step": 156097, "epoch": 3716} {"train_loss": -6.891226291656494, "global_step": 156098, "epoch": 3716} {"train_loss": -6.943257808685303, "global_step": 156099, "epoch": 3716} {"train_loss": -6.814810752868652, "global_step": 156100, "epoch": 3716} {"train_loss": -7.015008926391602, "global_step": 156101, "epoch": 3716} {"train_loss": -6.78907585144043, "global_step": 156102, "epoch": 3716} {"train_loss": -6.942897796630859, "global_step": 156103, "epoch": 3716} {"train_loss": -6.9123640060424805, "global_step": 156104, "epoch": 3716} {"train_loss": -6.84055233001709, "global_step": 156105, "epoch": 3716} {"train_loss": -6.888484001159668, "global_step": 156106, "epoch": 3716} {"train_loss": -6.854128837585449, "global_step": 156107, "epoch": 3716} {"train_loss": -6.804225921630859, "global_step": 156108, "epoch": 3716} {"train_loss": -6.997997283935547, "global_step": 156109, "epoch": 3716} {"train_loss": -6.877862930297852, "global_step": 156110, "epoch": 3716} {"train_loss": -6.876860618591309, "global_step": 156111, "epoch": 3716} {"train_loss": -6.893298149108887, "global_step": 156112, "epoch": 3716} {"train_loss": -6.914344537825811, "global_step": 156113, "epoch": 3716, "val_loss": 79145.8984375} {"train_loss": -6.9131669998168945, "global_step": 156114, "epoch": 3717} {"train_loss": -6.829258918762207, "global_step": 156115, "epoch": 3717} {"train_loss": -6.974371433258057, "global_step": 156116, "epoch": 3717} {"train_loss": -7.138896942138672, "global_step": 156117, "epoch": 3717} {"train_loss": -6.8540849685668945, "global_step": 156118, "epoch": 3717} {"train_loss": -6.879085540771484, "global_step": 156119, "epoch": 3717} {"train_loss": -6.835076332092285, "global_step": 156120, "epoch": 3717} {"train_loss": -6.984810829162598, "global_step": 156121, "epoch": 3717} {"train_loss": -6.82595157623291, "global_step": 156122, "epoch": 3717} {"train_loss": -6.923836708068848, "global_step": 156123, "epoch": 3717} {"train_loss": -6.884964942932129, "global_step": 156124, "epoch": 3717} {"train_loss": -6.97659969329834, "global_step": 156125, "epoch": 3717} {"train_loss": -6.958979606628418, "global_step": 156126, "epoch": 3717} {"train_loss": -6.966765880584717, "global_step": 156127, "epoch": 3717} {"train_loss": -6.91526985168457, "global_step": 156128, "epoch": 3717} {"train_loss": -6.968628883361816, "global_step": 156129, "epoch": 3717} {"train_loss": -6.989311218261719, "global_step": 156130, "epoch": 3717} {"train_loss": -6.9243268966674805, "global_step": 156131, "epoch": 3717} {"train_loss": -6.863019943237305, "global_step": 156132, "epoch": 3717} {"train_loss": -7.019584655761719, "global_step": 156133, "epoch": 3717} {"train_loss": -6.904111862182617, "global_step": 156134, "epoch": 3717} {"train_loss": -6.978342056274414, "global_step": 156135, "epoch": 3717} {"train_loss": -6.996146202087402, "global_step": 156136, "epoch": 3717} {"train_loss": -6.788414001464844, "global_step": 156137, "epoch": 3717} {"train_loss": -6.786123752593994, "global_step": 156138, "epoch": 3717} {"train_loss": -7.006379127502441, "global_step": 156139, "epoch": 3717} {"train_loss": -6.821813583374023, "global_step": 156140, "epoch": 3717} {"train_loss": -7.004937171936035, "global_step": 156141, "epoch": 3717} {"train_loss": -6.860391616821289, "global_step": 156142, "epoch": 3717} {"train_loss": -6.878425121307373, "global_step": 156143, "epoch": 3717} {"train_loss": -6.998083591461182, "global_step": 156144, "epoch": 3717} {"train_loss": -6.859805583953857, "global_step": 156145, "epoch": 3717} {"train_loss": -6.948540687561035, "global_step": 156146, "epoch": 3717} {"train_loss": -6.935729503631592, "global_step": 156147, "epoch": 3717} {"train_loss": -6.824365139007568, "global_step": 156148, "epoch": 3717} {"train_loss": -6.907590389251709, "global_step": 156149, "epoch": 3717} {"train_loss": -6.889840126037598, "global_step": 156150, "epoch": 3717} {"train_loss": -6.93416690826416, "global_step": 156151, "epoch": 3717} {"train_loss": -7.017837047576904, "global_step": 156152, "epoch": 3717} {"train_loss": -6.859448432922363, "global_step": 156153, "epoch": 3717} {"train_loss": -6.8889031410217285, "global_step": 156154, "epoch": 3717} {"train_loss": -6.921443802969796, "global_step": 156155, "epoch": 3717, "val_loss": 79223.8203125} {"train_loss": -6.9740095138549805, "global_step": 156156, "epoch": 3718} {"train_loss": -6.914412498474121, "global_step": 156157, "epoch": 3718} {"train_loss": -6.977063179016113, "global_step": 156158, "epoch": 3718} {"train_loss": -6.966824054718018, "global_step": 156159, "epoch": 3718} {"train_loss": -6.916896820068359, "global_step": 156160, "epoch": 3718} {"train_loss": -6.962944030761719, "global_step": 156161, "epoch": 3718} {"train_loss": -6.954707145690918, "global_step": 156162, "epoch": 3718} {"train_loss": -7.055637359619141, "global_step": 156163, "epoch": 3718} {"train_loss": -6.871018409729004, "global_step": 156164, "epoch": 3718} {"train_loss": -7.0091729164123535, "global_step": 156165, "epoch": 3718} {"train_loss": -6.947330951690674, "global_step": 156166, "epoch": 3718} {"train_loss": -6.874543190002441, "global_step": 156167, "epoch": 3718} {"train_loss": -6.998754501342773, "global_step": 156168, "epoch": 3718} {"train_loss": -6.827831268310547, "global_step": 156169, "epoch": 3718} {"train_loss": -6.8507080078125, "global_step": 156170, "epoch": 3718} {"train_loss": -6.985743522644043, "global_step": 156171, "epoch": 3718} {"train_loss": -6.952425003051758, "global_step": 156172, "epoch": 3718} {"train_loss": -6.94831657409668, "global_step": 156173, "epoch": 3718} {"train_loss": -6.899589538574219, "global_step": 156174, "epoch": 3718} {"train_loss": -6.884905815124512, "global_step": 156175, "epoch": 3718} {"train_loss": -6.819643974304199, "global_step": 156176, "epoch": 3718} {"train_loss": -6.83379602432251, "global_step": 156177, "epoch": 3718} {"train_loss": -6.987154960632324, "global_step": 156178, "epoch": 3718} {"train_loss": -6.837553977966309, "global_step": 156179, "epoch": 3718} {"train_loss": -6.880721092224121, "global_step": 156180, "epoch": 3718} {"train_loss": -6.926056861877441, "global_step": 156181, "epoch": 3718} {"train_loss": -6.927351951599121, "global_step": 156182, "epoch": 3718} {"train_loss": -6.930815696716309, "global_step": 156183, "epoch": 3718} {"train_loss": -6.915503025054932, "global_step": 156184, "epoch": 3718} {"train_loss": -6.940274238586426, "global_step": 156185, "epoch": 3718} {"train_loss": -7.010300159454346, "global_step": 156186, "epoch": 3718} {"train_loss": -6.907073020935059, "global_step": 156187, "epoch": 3718} {"train_loss": -6.897817611694336, "global_step": 156188, "epoch": 3718} {"train_loss": -6.92899227142334, "global_step": 156189, "epoch": 3718} {"train_loss": -6.944960594177246, "global_step": 156190, "epoch": 3718} {"train_loss": -6.9937639236450195, "global_step": 156191, "epoch": 3718} {"train_loss": -6.885743141174316, "global_step": 156192, "epoch": 3718} {"train_loss": -6.967143535614014, "global_step": 156193, "epoch": 3718} {"train_loss": -7.099588394165039, "global_step": 156194, "epoch": 3718} {"train_loss": -6.990041255950928, "global_step": 156195, "epoch": 3718} {"train_loss": -6.9956583976745605, "global_step": 156196, "epoch": 3718} {"train_loss": -6.938495488393874, "global_step": 156197, "epoch": 3718, "val_loss": 79117.8359375} {"train_loss": -7.109583854675293, "global_step": 156198, "epoch": 3719} {"train_loss": -6.993231296539307, "global_step": 156199, "epoch": 3719} {"train_loss": -7.028338432312012, "global_step": 156200, "epoch": 3719} {"train_loss": -7.044319152832031, "global_step": 156201, "epoch": 3719} {"train_loss": -7.071341514587402, "global_step": 156202, "epoch": 3719} {"train_loss": -6.974268913269043, "global_step": 156203, "epoch": 3719} {"train_loss": -6.9944939613342285, "global_step": 156204, "epoch": 3719} {"train_loss": -6.8942999839782715, "global_step": 156205, "epoch": 3719} {"train_loss": -6.977303504943848, "global_step": 156206, "epoch": 3719} {"train_loss": -7.026874542236328, "global_step": 156207, "epoch": 3719} {"train_loss": -6.868375778198242, "global_step": 156208, "epoch": 3719} {"train_loss": -6.915258407592773, "global_step": 156209, "epoch": 3719} {"train_loss": -6.925268173217773, "global_step": 156210, "epoch": 3719} {"train_loss": -7.004666328430176, "global_step": 156211, "epoch": 3719} {"train_loss": -6.930278778076172, "global_step": 156212, "epoch": 3719} {"train_loss": -6.9885029792785645, "global_step": 156213, "epoch": 3719} {"train_loss": -6.964574813842773, "global_step": 156214, "epoch": 3719} {"train_loss": -6.769732475280762, "global_step": 156215, "epoch": 3719} {"train_loss": -6.913945198059082, "global_step": 156216, "epoch": 3719} {"train_loss": -6.84304141998291, "global_step": 156217, "epoch": 3719} {"train_loss": -6.837610244750977, "global_step": 156218, "epoch": 3719} {"train_loss": -6.863263130187988, "global_step": 156219, "epoch": 3719} {"train_loss": -6.872285842895508, "global_step": 156220, "epoch": 3719} {"train_loss": -6.7683916091918945, "global_step": 156221, "epoch": 3719} {"train_loss": -6.864799976348877, "global_step": 156222, "epoch": 3719} {"train_loss": -6.850306510925293, "global_step": 156223, "epoch": 3719} {"train_loss": -6.647353172302246, "global_step": 156224, "epoch": 3719} {"train_loss": -6.913352966308594, "global_step": 156225, "epoch": 3719} {"train_loss": -6.719721794128418, "global_step": 156226, "epoch": 3719} {"train_loss": -6.679004192352295, "global_step": 156227, "epoch": 3719} {"train_loss": -6.811621189117432, "global_step": 156228, "epoch": 3719} {"train_loss": -6.795655250549316, "global_step": 156229, "epoch": 3719} {"train_loss": -6.688129425048828, "global_step": 156230, "epoch": 3719} {"train_loss": -6.677619934082031, "global_step": 156231, "epoch": 3719} {"train_loss": -6.783440589904785, "global_step": 156232, "epoch": 3719} {"train_loss": -6.6847124099731445, "global_step": 156233, "epoch": 3719} {"train_loss": -6.917975425720215, "global_step": 156234, "epoch": 3719} {"train_loss": -6.768048286437988, "global_step": 156235, "epoch": 3719} {"train_loss": -6.7520432472229, "global_step": 156236, "epoch": 3719} {"train_loss": -6.917386054992676, "global_step": 156237, "epoch": 3719} {"train_loss": -6.832193851470947, "global_step": 156238, "epoch": 3719} {"train_loss": -6.874767428352719, "global_step": 156239, "epoch": 3719, "val_loss": 79165.953125} {"train_loss": -6.822854042053223, "global_step": 156240, "epoch": 3720} {"train_loss": -7.042998790740967, "global_step": 156241, "epoch": 3720} {"train_loss": -6.900503635406494, "global_step": 156242, "epoch": 3720} {"train_loss": -6.818107604980469, "global_step": 156243, "epoch": 3720} {"train_loss": -6.894707679748535, "global_step": 156244, "epoch": 3720} {"train_loss": -6.893377304077148, "global_step": 156245, "epoch": 3720} {"train_loss": -6.875736236572266, "global_step": 156246, "epoch": 3720} {"train_loss": -6.882549285888672, "global_step": 156247, "epoch": 3720} {"train_loss": -6.845170021057129, "global_step": 156248, "epoch": 3720} {"train_loss": -6.925172805786133, "global_step": 156249, "epoch": 3720} {"train_loss": -6.849597930908203, "global_step": 156250, "epoch": 3720} {"train_loss": -6.805599212646484, "global_step": 156251, "epoch": 3720} {"train_loss": -6.899593353271484, "global_step": 156252, "epoch": 3720} {"train_loss": -6.751648426055908, "global_step": 156253, "epoch": 3720} {"train_loss": -6.922364711761475, "global_step": 156254, "epoch": 3720} {"train_loss": -6.770044326782227, "global_step": 156255, "epoch": 3720} {"train_loss": -6.937360763549805, "global_step": 156256, "epoch": 3720} {"train_loss": -6.919243812561035, "global_step": 156257, "epoch": 3720} {"train_loss": -6.918182373046875, "global_step": 156258, "epoch": 3720} {"train_loss": -6.800167560577393, "global_step": 156259, "epoch": 3720} {"train_loss": -6.7696943283081055, "global_step": 156260, "epoch": 3720} {"train_loss": -6.983077526092529, "global_step": 156261, "epoch": 3720} {"train_loss": -6.839711666107178, "global_step": 156262, "epoch": 3720} {"train_loss": -6.977497577667236, "global_step": 156263, "epoch": 3720} {"train_loss": -6.832001686096191, "global_step": 156264, "epoch": 3720} {"train_loss": -6.917082786560059, "global_step": 156265, "epoch": 3720} {"train_loss": -6.8779191970825195, "global_step": 156266, "epoch": 3720} {"train_loss": -6.813638687133789, "global_step": 156267, "epoch": 3720} {"train_loss": -6.911170959472656, "global_step": 156268, "epoch": 3720} {"train_loss": -6.9056806564331055, "global_step": 156269, "epoch": 3720} {"train_loss": -7.001605987548828, "global_step": 156270, "epoch": 3720} {"train_loss": -6.97476863861084, "global_step": 156271, "epoch": 3720} {"train_loss": -6.898451805114746, "global_step": 156272, "epoch": 3720} {"train_loss": -6.839694976806641, "global_step": 156273, "epoch": 3720} {"train_loss": -6.9064531326293945, "global_step": 156274, "epoch": 3720} {"train_loss": -6.918503284454346, "global_step": 156275, "epoch": 3720} {"train_loss": -6.91053581237793, "global_step": 156276, "epoch": 3720} {"train_loss": -7.006362438201904, "global_step": 156277, "epoch": 3720} {"train_loss": -6.898262977600098, "global_step": 156278, "epoch": 3720} {"train_loss": -6.974160194396973, "global_step": 156279, "epoch": 3720} {"train_loss": -6.971238136291504, "global_step": 156280, "epoch": 3720} {"train_loss": -6.890571037928264, "global_step": 156281, "epoch": 3720, "val_loss": 79036.1328125} {"train_loss": -6.911786079406738, "global_step": 156282, "epoch": 3721} {"train_loss": -6.938468933105469, "global_step": 156283, "epoch": 3721} {"train_loss": -6.9668498039245605, "global_step": 156284, "epoch": 3721} {"train_loss": -6.8466386795043945, "global_step": 156285, "epoch": 3721} {"train_loss": -6.987839698791504, "global_step": 156286, "epoch": 3721} {"train_loss": -6.7852325439453125, "global_step": 156287, "epoch": 3721} {"train_loss": -6.899712562561035, "global_step": 156288, "epoch": 3721} {"train_loss": -6.953851699829102, "global_step": 156289, "epoch": 3721} {"train_loss": -6.9107279777526855, "global_step": 156290, "epoch": 3721} {"train_loss": -6.847272872924805, "global_step": 156291, "epoch": 3721} {"train_loss": -7.006719589233398, "global_step": 156292, "epoch": 3721} {"train_loss": -7.019474506378174, "global_step": 156293, "epoch": 3721} {"train_loss": -6.830350875854492, "global_step": 156294, "epoch": 3721} {"train_loss": -7.081766605377197, "global_step": 156295, "epoch": 3721} {"train_loss": -7.113775253295898, "global_step": 156296, "epoch": 3721} {"train_loss": -6.929778099060059, "global_step": 156297, "epoch": 3721} {"train_loss": -7.068948745727539, "global_step": 156298, "epoch": 3721} {"train_loss": -6.985230445861816, "global_step": 156299, "epoch": 3721} {"train_loss": -6.839077949523926, "global_step": 156300, "epoch": 3721} {"train_loss": -6.966935157775879, "global_step": 156301, "epoch": 3721} {"train_loss": -7.033486366271973, "global_step": 156302, "epoch": 3721} {"train_loss": -6.924692153930664, "global_step": 156303, "epoch": 3721} {"train_loss": -6.946300506591797, "global_step": 156304, "epoch": 3721} {"train_loss": -6.890827655792236, "global_step": 156305, "epoch": 3721} {"train_loss": -6.980188369750977, "global_step": 156306, "epoch": 3721} {"train_loss": -7.05206823348999, "global_step": 156307, "epoch": 3721} {"train_loss": -6.826787948608398, "global_step": 156308, "epoch": 3721} {"train_loss": -6.909208297729492, "global_step": 156309, "epoch": 3721} {"train_loss": -6.996071815490723, "global_step": 156310, "epoch": 3721} {"train_loss": -7.061427116394043, "global_step": 156311, "epoch": 3721} {"train_loss": -6.969064235687256, "global_step": 156312, "epoch": 3721} {"train_loss": -6.862347602844238, "global_step": 156313, "epoch": 3721} {"train_loss": -7.102928161621094, "global_step": 156314, "epoch": 3721} {"train_loss": -6.970717906951904, "global_step": 156315, "epoch": 3721} {"train_loss": -7.016670227050781, "global_step": 156316, "epoch": 3721} {"train_loss": -6.998758316040039, "global_step": 156317, "epoch": 3721} {"train_loss": -6.984753608703613, "global_step": 156318, "epoch": 3721} {"train_loss": -7.011099815368652, "global_step": 156319, "epoch": 3721} {"train_loss": -6.937346935272217, "global_step": 156320, "epoch": 3721} {"train_loss": -6.939777374267578, "global_step": 156321, "epoch": 3721} {"train_loss": -6.998651504516602, "global_step": 156322, "epoch": 3721} {"train_loss": -6.960845788319905, "global_step": 156323, "epoch": 3721, "val_loss": 79456.0546875} {"train_loss": -6.925117492675781, "global_step": 156324, "epoch": 3722} {"train_loss": -7.046814918518066, "global_step": 156325, "epoch": 3722} {"train_loss": -6.891280174255371, "global_step": 156326, "epoch": 3722} {"train_loss": -6.946030139923096, "global_step": 156327, "epoch": 3722} {"train_loss": -6.968850612640381, "global_step": 156328, "epoch": 3722} {"train_loss": -7.037847518920898, "global_step": 156329, "epoch": 3722} {"train_loss": -6.849093437194824, "global_step": 156330, "epoch": 3722} {"train_loss": -6.9998064041137695, "global_step": 156331, "epoch": 3722} {"train_loss": -6.961032867431641, "global_step": 156332, "epoch": 3722} {"train_loss": -6.916537284851074, "global_step": 156333, "epoch": 3722} {"train_loss": -6.946784019470215, "global_step": 156334, "epoch": 3722} {"train_loss": -6.995779037475586, "global_step": 156335, "epoch": 3722} {"train_loss": -6.860135078430176, "global_step": 156336, "epoch": 3722} {"train_loss": -6.88832426071167, "global_step": 156337, "epoch": 3722} {"train_loss": -6.9552693367004395, "global_step": 156338, "epoch": 3722} {"train_loss": -6.869650363922119, "global_step": 156339, "epoch": 3722} {"train_loss": -7.000446319580078, "global_step": 156340, "epoch": 3722} {"train_loss": -6.930639266967773, "global_step": 156341, "epoch": 3722} {"train_loss": -6.993694305419922, "global_step": 156342, "epoch": 3722} {"train_loss": -6.92722225189209, "global_step": 156343, "epoch": 3722} {"train_loss": -6.9860382080078125, "global_step": 156344, "epoch": 3722} {"train_loss": -6.893847465515137, "global_step": 156345, "epoch": 3722} {"train_loss": -6.842007637023926, "global_step": 156346, "epoch": 3722} {"train_loss": -6.922375679016113, "global_step": 156347, "epoch": 3722} {"train_loss": -6.887081146240234, "global_step": 156348, "epoch": 3722} {"train_loss": -7.066860675811768, "global_step": 156349, "epoch": 3722} {"train_loss": -6.819195747375488, "global_step": 156350, "epoch": 3722} {"train_loss": -6.910797119140625, "global_step": 156351, "epoch": 3722} {"train_loss": -6.878278732299805, "global_step": 156352, "epoch": 3722} {"train_loss": -6.868034362792969, "global_step": 156353, "epoch": 3722} {"train_loss": -6.914000034332275, "global_step": 156354, "epoch": 3722} {"train_loss": -6.866272926330566, "global_step": 156355, "epoch": 3722} {"train_loss": -7.000774383544922, "global_step": 156356, "epoch": 3722} {"train_loss": -6.88286018371582, "global_step": 156357, "epoch": 3722} {"train_loss": -6.8328752517700195, "global_step": 156358, "epoch": 3722} {"train_loss": -6.957707405090332, "global_step": 156359, "epoch": 3722} {"train_loss": -6.854213237762451, "global_step": 156360, "epoch": 3722} {"train_loss": -6.827375411987305, "global_step": 156361, "epoch": 3722} {"train_loss": -6.90113639831543, "global_step": 156362, "epoch": 3722} {"train_loss": -6.755173206329346, "global_step": 156363, "epoch": 3722} {"train_loss": -6.846856117248535, "global_step": 156364, "epoch": 3722} {"train_loss": -6.914964551017398, "global_step": 156365, "epoch": 3722, "val_loss": 78977.5390625} {"train_loss": -6.863252639770508, "global_step": 156366, "epoch": 3723} {"train_loss": -6.7797346115112305, "global_step": 156367, "epoch": 3723} {"train_loss": -6.789028167724609, "global_step": 156368, "epoch": 3723} {"train_loss": -6.878145217895508, "global_step": 156369, "epoch": 3723} {"train_loss": -6.770787239074707, "global_step": 156370, "epoch": 3723} {"train_loss": -6.91732120513916, "global_step": 156371, "epoch": 3723} {"train_loss": -6.9296112060546875, "global_step": 156372, "epoch": 3723} {"train_loss": -6.729769706726074, "global_step": 156373, "epoch": 3723} {"train_loss": -6.745340824127197, "global_step": 156374, "epoch": 3723} {"train_loss": -6.877361297607422, "global_step": 156375, "epoch": 3723} {"train_loss": -6.83034610748291, "global_step": 156376, "epoch": 3723} {"train_loss": -6.718756675720215, "global_step": 156377, "epoch": 3723} {"train_loss": -6.770975112915039, "global_step": 156378, "epoch": 3723} {"train_loss": -6.918776988983154, "global_step": 156379, "epoch": 3723} {"train_loss": -6.804008483886719, "global_step": 156380, "epoch": 3723} {"train_loss": -6.733760356903076, "global_step": 156381, "epoch": 3723} {"train_loss": -6.935970306396484, "global_step": 156382, "epoch": 3723} {"train_loss": -6.882704734802246, "global_step": 156383, "epoch": 3723} {"train_loss": -6.834464073181152, "global_step": 156384, "epoch": 3723} {"train_loss": -6.831977844238281, "global_step": 156385, "epoch": 3723} {"train_loss": -6.785676002502441, "global_step": 156386, "epoch": 3723} {"train_loss": -6.749070644378662, "global_step": 156387, "epoch": 3723} {"train_loss": -6.917654991149902, "global_step": 156388, "epoch": 3723} {"train_loss": -6.797906875610352, "global_step": 156389, "epoch": 3723} {"train_loss": -6.907649040222168, "global_step": 156390, "epoch": 3723} {"train_loss": -6.742213249206543, "global_step": 156391, "epoch": 3723} {"train_loss": -6.879375457763672, "global_step": 156392, "epoch": 3723} {"train_loss": -6.882152557373047, "global_step": 156393, "epoch": 3723} {"train_loss": -6.849498748779297, "global_step": 156394, "epoch": 3723} {"train_loss": -6.902288913726807, "global_step": 156395, "epoch": 3723} {"train_loss": -6.898952960968018, "global_step": 156396, "epoch": 3723} {"train_loss": -6.873933792114258, "global_step": 156397, "epoch": 3723} {"train_loss": -6.981854438781738, "global_step": 156398, "epoch": 3723} {"train_loss": -7.010788917541504, "global_step": 156399, "epoch": 3723} {"train_loss": -6.966732978820801, "global_step": 156400, "epoch": 3723} {"train_loss": -6.930567741394043, "global_step": 156401, "epoch": 3723} {"train_loss": -6.886782169342041, "global_step": 156402, "epoch": 3723} {"train_loss": -6.967281341552734, "global_step": 156403, "epoch": 3723} {"train_loss": -7.031525135040283, "global_step": 156404, "epoch": 3723} {"train_loss": -6.89830207824707, "global_step": 156405, "epoch": 3723} {"train_loss": -6.901473045349121, "global_step": 156406, "epoch": 3723} {"train_loss": -6.864181484494891, "global_step": 156407, "epoch": 3723, "val_loss": 79176.5546875} {"train_loss": -6.86415958404541, "global_step": 156408, "epoch": 3724} {"train_loss": -6.931061744689941, "global_step": 156409, "epoch": 3724} {"train_loss": -6.857562065124512, "global_step": 156410, "epoch": 3724} {"train_loss": -6.912090301513672, "global_step": 156411, "epoch": 3724} {"train_loss": -6.854214668273926, "global_step": 156412, "epoch": 3724} {"train_loss": -6.95274543762207, "global_step": 156413, "epoch": 3724} {"train_loss": -6.987471580505371, "global_step": 156414, "epoch": 3724} {"train_loss": -6.851906776428223, "global_step": 156415, "epoch": 3724} {"train_loss": -6.919028282165527, "global_step": 156416, "epoch": 3724} {"train_loss": -6.880661964416504, "global_step": 156417, "epoch": 3724} {"train_loss": -6.952446937561035, "global_step": 156418, "epoch": 3724} {"train_loss": -6.912813186645508, "global_step": 156419, "epoch": 3724} {"train_loss": -6.983259677886963, "global_step": 156420, "epoch": 3724} {"train_loss": -6.859539031982422, "global_step": 156421, "epoch": 3724} {"train_loss": -6.730068683624268, "global_step": 156422, "epoch": 3724} {"train_loss": -6.839688301086426, "global_step": 156423, "epoch": 3724} {"train_loss": -6.997570037841797, "global_step": 156424, "epoch": 3724} {"train_loss": -6.897252082824707, "global_step": 156425, "epoch": 3724} {"train_loss": -6.931332588195801, "global_step": 156426, "epoch": 3724} {"train_loss": -6.837491035461426, "global_step": 156427, "epoch": 3724} {"train_loss": -6.9920220375061035, "global_step": 156428, "epoch": 3724} {"train_loss": -6.984683036804199, "global_step": 156429, "epoch": 3724} {"train_loss": -6.830371379852295, "global_step": 156430, "epoch": 3724} {"train_loss": -6.972480297088623, "global_step": 156431, "epoch": 3724} {"train_loss": -6.978267192840576, "global_step": 156432, "epoch": 3724} {"train_loss": -6.8499956130981445, "global_step": 156433, "epoch": 3724} {"train_loss": -6.878396034240723, "global_step": 156434, "epoch": 3724} {"train_loss": -6.9642534255981445, "global_step": 156435, "epoch": 3724} {"train_loss": -6.866458892822266, "global_step": 156436, "epoch": 3724} {"train_loss": -6.975009918212891, "global_step": 156437, "epoch": 3724} {"train_loss": -7.00612735748291, "global_step": 156438, "epoch": 3724} {"train_loss": -6.945524215698242, "global_step": 156439, "epoch": 3724} {"train_loss": -6.99904727935791, "global_step": 156440, "epoch": 3724} {"train_loss": -6.843699932098389, "global_step": 156441, "epoch": 3724} {"train_loss": -7.044435501098633, "global_step": 156442, "epoch": 3724} {"train_loss": -7.039909362792969, "global_step": 156443, "epoch": 3724} {"train_loss": -6.915303707122803, "global_step": 156444, "epoch": 3724} {"train_loss": -6.938764572143555, "global_step": 156445, "epoch": 3724} {"train_loss": -6.960317611694336, "global_step": 156446, "epoch": 3724} {"train_loss": -6.933791160583496, "global_step": 156447, "epoch": 3724} {"train_loss": -6.943048477172852, "global_step": 156448, "epoch": 3724} {"train_loss": -6.920614651271275, "global_step": 156449, "epoch": 3724, "val_loss": 79315.6015625} {"train_loss": -6.977734088897705, "global_step": 156450, "epoch": 3725} {"train_loss": -6.993023872375488, "global_step": 156451, "epoch": 3725} {"train_loss": -6.875028610229492, "global_step": 156452, "epoch": 3725} {"train_loss": -6.898523330688477, "global_step": 156453, "epoch": 3725} {"train_loss": -6.876678943634033, "global_step": 156454, "epoch": 3725} {"train_loss": -6.844454765319824, "global_step": 156455, "epoch": 3725} {"train_loss": -6.8745436668396, "global_step": 156456, "epoch": 3725} {"train_loss": -6.931008338928223, "global_step": 156457, "epoch": 3725} {"train_loss": -6.999675750732422, "global_step": 156458, "epoch": 3725} {"train_loss": -6.952469825744629, "global_step": 156459, "epoch": 3725} {"train_loss": -6.857264518737793, "global_step": 156460, "epoch": 3725} {"train_loss": -6.88160514831543, "global_step": 156461, "epoch": 3725} {"train_loss": -6.90150785446167, "global_step": 156462, "epoch": 3725} {"train_loss": -6.921663284301758, "global_step": 156463, "epoch": 3725} {"train_loss": -6.9409990310668945, "global_step": 156464, "epoch": 3725} {"train_loss": -6.853640556335449, "global_step": 156465, "epoch": 3725} {"train_loss": -6.949641227722168, "global_step": 156466, "epoch": 3725} {"train_loss": -6.953544616699219, "global_step": 156467, "epoch": 3725} {"train_loss": -7.05573844909668, "global_step": 156468, "epoch": 3725} {"train_loss": -7.005934715270996, "global_step": 156469, "epoch": 3725} {"train_loss": -6.948389053344727, "global_step": 156470, "epoch": 3725} {"train_loss": -6.90949821472168, "global_step": 156471, "epoch": 3725} {"train_loss": -6.977200031280518, "global_step": 156472, "epoch": 3725} {"train_loss": -6.951717376708984, "global_step": 156473, "epoch": 3725} {"train_loss": -6.984457015991211, "global_step": 156474, "epoch": 3725} {"train_loss": -6.927231311798096, "global_step": 156475, "epoch": 3725} {"train_loss": -7.01341438293457, "global_step": 156476, "epoch": 3725} {"train_loss": -7.0649824142456055, "global_step": 156477, "epoch": 3725} {"train_loss": -6.988448143005371, "global_step": 156478, "epoch": 3725} {"train_loss": -6.911841869354248, "global_step": 156479, "epoch": 3725} {"train_loss": -7.0404863357543945, "global_step": 156480, "epoch": 3725} {"train_loss": -7.020316123962402, "global_step": 156481, "epoch": 3725} {"train_loss": -6.993809700012207, "global_step": 156482, "epoch": 3725} {"train_loss": -6.8732099533081055, "global_step": 156483, "epoch": 3725} {"train_loss": -6.947647571563721, "global_step": 156484, "epoch": 3725} {"train_loss": -6.912789344787598, "global_step": 156485, "epoch": 3725} {"train_loss": -6.901370048522949, "global_step": 156486, "epoch": 3725} {"train_loss": -7.001532077789307, "global_step": 156487, "epoch": 3725} {"train_loss": -6.943030834197998, "global_step": 156488, "epoch": 3725} {"train_loss": -6.888421535491943, "global_step": 156489, "epoch": 3725} {"train_loss": -6.909980297088623, "global_step": 156490, "epoch": 3725} {"train_loss": -6.9432839552561445, "global_step": 156491, "epoch": 3725, "val_loss": 79255.3359375} {"train_loss": -6.850329399108887, "global_step": 156492, "epoch": 3726} {"train_loss": -6.822771072387695, "global_step": 156493, "epoch": 3726} {"train_loss": -6.827816009521484, "global_step": 156494, "epoch": 3726} {"train_loss": -6.983531951904297, "global_step": 156495, "epoch": 3726} {"train_loss": -6.994421005249023, "global_step": 156496, "epoch": 3726} {"train_loss": -7.033394813537598, "global_step": 156497, "epoch": 3726} {"train_loss": -6.876643180847168, "global_step": 156498, "epoch": 3726} {"train_loss": -6.765763282775879, "global_step": 156499, "epoch": 3726} {"train_loss": -6.7835493087768555, "global_step": 156500, "epoch": 3726} {"train_loss": -6.943657875061035, "global_step": 156501, "epoch": 3726} {"train_loss": -6.874139785766602, "global_step": 156502, "epoch": 3726} {"train_loss": -6.8693742752075195, "global_step": 156503, "epoch": 3726} {"train_loss": -6.930842399597168, "global_step": 156504, "epoch": 3726} {"train_loss": -6.842782974243164, "global_step": 156505, "epoch": 3726} {"train_loss": -6.981849670410156, "global_step": 156506, "epoch": 3726} {"train_loss": -6.849478244781494, "global_step": 156507, "epoch": 3726} {"train_loss": -6.919613838195801, "global_step": 156508, "epoch": 3726} {"train_loss": -6.976803779602051, "global_step": 156509, "epoch": 3726} {"train_loss": -6.790745735168457, "global_step": 156510, "epoch": 3726} {"train_loss": -6.990503787994385, "global_step": 156511, "epoch": 3726} {"train_loss": -6.895403861999512, "global_step": 156512, "epoch": 3726} {"train_loss": -6.904009819030762, "global_step": 156513, "epoch": 3726} {"train_loss": -6.955286026000977, "global_step": 156514, "epoch": 3726} {"train_loss": -6.892325401306152, "global_step": 156515, "epoch": 3726} {"train_loss": -6.926445007324219, "global_step": 156516, "epoch": 3726} {"train_loss": -7.01689338684082, "global_step": 156517, "epoch": 3726} {"train_loss": -6.953166484832764, "global_step": 156518, "epoch": 3726} {"train_loss": -6.756970405578613, "global_step": 156519, "epoch": 3726} {"train_loss": -6.889223575592041, "global_step": 156520, "epoch": 3726} {"train_loss": -6.825406074523926, "global_step": 156521, "epoch": 3726} {"train_loss": -6.863106727600098, "global_step": 156522, "epoch": 3726} {"train_loss": -6.9542646408081055, "global_step": 156523, "epoch": 3726} {"train_loss": -6.960166931152344, "global_step": 156524, "epoch": 3726} {"train_loss": -6.8586931228637695, "global_step": 156525, "epoch": 3726} {"train_loss": -6.933152198791504, "global_step": 156526, "epoch": 3726} {"train_loss": -6.943735122680664, "global_step": 156527, "epoch": 3726} {"train_loss": -6.953884124755859, "global_step": 156528, "epoch": 3726} {"train_loss": -6.707200527191162, "global_step": 156529, "epoch": 3726} {"train_loss": -6.917145252227783, "global_step": 156530, "epoch": 3726} {"train_loss": -6.874645233154297, "global_step": 156531, "epoch": 3726} {"train_loss": -6.834925651550293, "global_step": 156532, "epoch": 3726} {"train_loss": -6.897024892625355, "global_step": 156533, "epoch": 3726, "val_loss": 79292.4453125} {"train_loss": -6.890926837921143, "global_step": 156534, "epoch": 3727} {"train_loss": -6.929682731628418, "global_step": 156535, "epoch": 3727} {"train_loss": -6.838990211486816, "global_step": 156536, "epoch": 3727} {"train_loss": -6.836452484130859, "global_step": 156537, "epoch": 3727} {"train_loss": -6.9542412757873535, "global_step": 156538, "epoch": 3727} {"train_loss": -6.810920238494873, "global_step": 156539, "epoch": 3727} {"train_loss": -6.939653396606445, "global_step": 156540, "epoch": 3727} {"train_loss": -6.953608512878418, "global_step": 156541, "epoch": 3727} {"train_loss": -6.947029113769531, "global_step": 156542, "epoch": 3727} {"train_loss": -6.95455265045166, "global_step": 156543, "epoch": 3727} {"train_loss": -6.90582275390625, "global_step": 156544, "epoch": 3727} {"train_loss": -6.919118404388428, "global_step": 156545, "epoch": 3727} {"train_loss": -6.89127254486084, "global_step": 156546, "epoch": 3727} {"train_loss": -6.922482967376709, "global_step": 156547, "epoch": 3727} {"train_loss": -6.975612640380859, "global_step": 156548, "epoch": 3727} {"train_loss": -7.000014781951904, "global_step": 156549, "epoch": 3727} {"train_loss": -6.861968994140625, "global_step": 156550, "epoch": 3727} {"train_loss": -6.933631896972656, "global_step": 156551, "epoch": 3727} {"train_loss": -7.008624076843262, "global_step": 156552, "epoch": 3727} {"train_loss": -7.087222099304199, "global_step": 156553, "epoch": 3727} {"train_loss": -7.025606632232666, "global_step": 156554, "epoch": 3727} {"train_loss": -6.996829986572266, "global_step": 156555, "epoch": 3727} {"train_loss": -6.904050827026367, "global_step": 156556, "epoch": 3727} {"train_loss": -6.872389793395996, "global_step": 156557, "epoch": 3727} {"train_loss": -6.973840236663818, "global_step": 156558, "epoch": 3727} {"train_loss": -7.0279693603515625, "global_step": 156559, "epoch": 3727} {"train_loss": -6.9151930809021, "global_step": 156560, "epoch": 3727} {"train_loss": -6.904310703277588, "global_step": 156561, "epoch": 3727} {"train_loss": -6.958585262298584, "global_step": 156562, "epoch": 3727} {"train_loss": -6.971156597137451, "global_step": 156563, "epoch": 3727} {"train_loss": -7.047540664672852, "global_step": 156564, "epoch": 3727} {"train_loss": -6.954360008239746, "global_step": 156565, "epoch": 3727} {"train_loss": -6.924465179443359, "global_step": 156566, "epoch": 3727} {"train_loss": -6.934852123260498, "global_step": 156567, "epoch": 3727} {"train_loss": -7.023186683654785, "global_step": 156568, "epoch": 3727} {"train_loss": -6.792309761047363, "global_step": 156569, "epoch": 3727} {"train_loss": -6.988510608673096, "global_step": 156570, "epoch": 3727} {"train_loss": -6.933661937713623, "global_step": 156571, "epoch": 3727} {"train_loss": -6.9676408767700195, "global_step": 156572, "epoch": 3727} {"train_loss": -7.00836181640625, "global_step": 156573, "epoch": 3727} {"train_loss": -6.8937273025512695, "global_step": 156574, "epoch": 3727} {"train_loss": -6.939054012298584, "global_step": 156575, "epoch": 3727, "val_loss": 79025.921875} {"train_loss": -6.89860725402832, "global_step": 156576, "epoch": 3728} {"train_loss": -6.938342094421387, "global_step": 156577, "epoch": 3728} {"train_loss": -6.9757819175720215, "global_step": 156578, "epoch": 3728} {"train_loss": -6.917891025543213, "global_step": 156579, "epoch": 3728} {"train_loss": -6.897326946258545, "global_step": 156580, "epoch": 3728} {"train_loss": -6.862570762634277, "global_step": 156581, "epoch": 3728} {"train_loss": -6.872097969055176, "global_step": 156582, "epoch": 3728} {"train_loss": -6.9034271240234375, "global_step": 156583, "epoch": 3728} {"train_loss": -7.024049758911133, "global_step": 156584, "epoch": 3728} {"train_loss": -6.908748626708984, "global_step": 156585, "epoch": 3728} {"train_loss": -6.9113850593566895, "global_step": 156586, "epoch": 3728} {"train_loss": -6.967202186584473, "global_step": 156587, "epoch": 3728} {"train_loss": -6.859272003173828, "global_step": 156588, "epoch": 3728} {"train_loss": -6.894158840179443, "global_step": 156589, "epoch": 3728} {"train_loss": -7.043120384216309, "global_step": 156590, "epoch": 3728} {"train_loss": -6.9411725997924805, "global_step": 156591, "epoch": 3728} {"train_loss": -6.994217872619629, "global_step": 156592, "epoch": 3728} {"train_loss": -6.863791465759277, "global_step": 156593, "epoch": 3728} {"train_loss": -6.907381534576416, "global_step": 156594, "epoch": 3728} {"train_loss": -7.031503677368164, "global_step": 156595, "epoch": 3728} {"train_loss": -6.938366413116455, "global_step": 156596, "epoch": 3728} {"train_loss": -6.876794338226318, "global_step": 156597, "epoch": 3728} {"train_loss": -6.985300540924072, "global_step": 156598, "epoch": 3728} {"train_loss": -6.927703857421875, "global_step": 156599, "epoch": 3728} {"train_loss": -6.98687744140625, "global_step": 156600, "epoch": 3728} {"train_loss": -6.749183177947998, "global_step": 156601, "epoch": 3728} {"train_loss": -6.88507080078125, "global_step": 156602, "epoch": 3728} {"train_loss": -6.957391738891602, "global_step": 156603, "epoch": 3728} {"train_loss": -7.017365455627441, "global_step": 156604, "epoch": 3728} {"train_loss": -6.974911212921143, "global_step": 156605, "epoch": 3728} {"train_loss": -6.985579490661621, "global_step": 156606, "epoch": 3728} {"train_loss": -6.914717197418213, "global_step": 156607, "epoch": 3728} {"train_loss": -6.940927028656006, "global_step": 156608, "epoch": 3728} {"train_loss": -7.049868583679199, "global_step": 156609, "epoch": 3728} {"train_loss": -6.95454216003418, "global_step": 156610, "epoch": 3728} {"train_loss": -6.99814510345459, "global_step": 156611, "epoch": 3728} {"train_loss": -7.005995750427246, "global_step": 156612, "epoch": 3728} {"train_loss": -6.856006622314453, "global_step": 156613, "epoch": 3728} {"train_loss": -6.935972213745117, "global_step": 156614, "epoch": 3728} {"train_loss": -6.882411956787109, "global_step": 156615, "epoch": 3728} {"train_loss": -7.0648884773254395, "global_step": 156616, "epoch": 3728} {"train_loss": -6.938496998378208, "global_step": 156617, "epoch": 3728, "val_loss": 79109.703125} {"train_loss": -6.9325480461120605, "global_step": 156618, "epoch": 3729} {"train_loss": -6.953017234802246, "global_step": 156619, "epoch": 3729} {"train_loss": -7.002105236053467, "global_step": 156620, "epoch": 3729} {"train_loss": -7.008000373840332, "global_step": 156621, "epoch": 3729} {"train_loss": -7.088226318359375, "global_step": 156622, "epoch": 3729} {"train_loss": -6.993382930755615, "global_step": 156623, "epoch": 3729} {"train_loss": -6.968891143798828, "global_step": 156624, "epoch": 3729} {"train_loss": -6.959912300109863, "global_step": 156625, "epoch": 3729} {"train_loss": -6.910991668701172, "global_step": 156626, "epoch": 3729} {"train_loss": -6.9870710372924805, "global_step": 156627, "epoch": 3729} {"train_loss": -6.961083889007568, "global_step": 156628, "epoch": 3729} {"train_loss": -7.059885501861572, "global_step": 156629, "epoch": 3729} {"train_loss": -6.9524641036987305, "global_step": 156630, "epoch": 3729} {"train_loss": -6.898517608642578, "global_step": 156631, "epoch": 3729} {"train_loss": -6.867505073547363, "global_step": 156632, "epoch": 3729} {"train_loss": -7.012528896331787, "global_step": 156633, "epoch": 3729} {"train_loss": -7.013108253479004, "global_step": 156634, "epoch": 3729} {"train_loss": -6.964380264282227, "global_step": 156635, "epoch": 3729} {"train_loss": -7.062592506408691, "global_step": 156636, "epoch": 3729} {"train_loss": -6.848812103271484, "global_step": 156637, "epoch": 3729} {"train_loss": -6.999058723449707, "global_step": 156638, "epoch": 3729} {"train_loss": -7.014359474182129, "global_step": 156639, "epoch": 3729} {"train_loss": -6.920993804931641, "global_step": 156640, "epoch": 3729} {"train_loss": -6.895081996917725, "global_step": 156641, "epoch": 3729} {"train_loss": -7.005209922790527, "global_step": 156642, "epoch": 3729} {"train_loss": -6.939209461212158, "global_step": 156643, "epoch": 3729} {"train_loss": -6.944828987121582, "global_step": 156644, "epoch": 3729} {"train_loss": -6.939823627471924, "global_step": 156645, "epoch": 3729} {"train_loss": -6.830414772033691, "global_step": 156646, "epoch": 3729} {"train_loss": -6.808055877685547, "global_step": 156647, "epoch": 3729} {"train_loss": -6.912856101989746, "global_step": 156648, "epoch": 3729} {"train_loss": -6.938900470733643, "global_step": 156649, "epoch": 3729} {"train_loss": -6.762639999389648, "global_step": 156650, "epoch": 3729} {"train_loss": -6.722675323486328, "global_step": 156651, "epoch": 3729} {"train_loss": -6.851678848266602, "global_step": 156652, "epoch": 3729} {"train_loss": -6.823395729064941, "global_step": 156653, "epoch": 3729} {"train_loss": -6.889780521392822, "global_step": 156654, "epoch": 3729} {"train_loss": -6.928805351257324, "global_step": 156655, "epoch": 3729} {"train_loss": -6.7659406661987305, "global_step": 156656, "epoch": 3729} {"train_loss": -6.922918796539307, "global_step": 156657, "epoch": 3729} {"train_loss": -6.955423355102539, "global_step": 156658, "epoch": 3729} {"train_loss": -6.9321837311699275, "global_step": 156659, "epoch": 3729, "val_loss": 79215.9375} {"train_loss": -6.945221424102783, "global_step": 156660, "epoch": 3730} {"train_loss": -6.805269241333008, "global_step": 156661, "epoch": 3730} {"train_loss": -6.908328056335449, "global_step": 156662, "epoch": 3730} {"train_loss": -6.895505905151367, "global_step": 156663, "epoch": 3730} {"train_loss": -6.868381023406982, "global_step": 156664, "epoch": 3730} {"train_loss": -7.013089656829834, "global_step": 156665, "epoch": 3730} {"train_loss": -6.861176490783691, "global_step": 156666, "epoch": 3730} {"train_loss": -6.799646854400635, "global_step": 156667, "epoch": 3730} {"train_loss": -6.963175296783447, "global_step": 156668, "epoch": 3730} {"train_loss": -6.891415119171143, "global_step": 156669, "epoch": 3730} {"train_loss": -6.902727127075195, "global_step": 156670, "epoch": 3730} {"train_loss": -6.863860130310059, "global_step": 156671, "epoch": 3730} {"train_loss": -6.987667083740234, "global_step": 156672, "epoch": 3730} {"train_loss": -6.948349952697754, "global_step": 156673, "epoch": 3730} {"train_loss": -6.944624900817871, "global_step": 156674, "epoch": 3730} {"train_loss": -7.034746170043945, "global_step": 156675, "epoch": 3730} {"train_loss": -6.840951919555664, "global_step": 156676, "epoch": 3730} {"train_loss": -6.995649814605713, "global_step": 156677, "epoch": 3730} {"train_loss": -6.901425361633301, "global_step": 156678, "epoch": 3730} {"train_loss": -6.992781639099121, "global_step": 156679, "epoch": 3730} {"train_loss": -6.935906887054443, "global_step": 156680, "epoch": 3730} {"train_loss": -6.976142883300781, "global_step": 156681, "epoch": 3730} {"train_loss": -6.955507278442383, "global_step": 156682, "epoch": 3730} {"train_loss": -6.983753681182861, "global_step": 156683, "epoch": 3730} {"train_loss": -6.941171169281006, "global_step": 156684, "epoch": 3730} {"train_loss": -6.922738552093506, "global_step": 156685, "epoch": 3730} {"train_loss": -6.928329944610596, "global_step": 156686, "epoch": 3730} {"train_loss": -6.879202842712402, "global_step": 156687, "epoch": 3730} {"train_loss": -6.8333740234375, "global_step": 156688, "epoch": 3730} {"train_loss": -6.84269380569458, "global_step": 156689, "epoch": 3730} {"train_loss": -6.79464054107666, "global_step": 156690, "epoch": 3730} {"train_loss": -6.816699981689453, "global_step": 156691, "epoch": 3730} {"train_loss": -6.953391075134277, "global_step": 156692, "epoch": 3730} {"train_loss": -6.888698101043701, "global_step": 156693, "epoch": 3730} {"train_loss": -6.87500524520874, "global_step": 156694, "epoch": 3730} {"train_loss": -6.86757755279541, "global_step": 156695, "epoch": 3730} {"train_loss": -6.900223731994629, "global_step": 156696, "epoch": 3730} {"train_loss": -6.858936309814453, "global_step": 156697, "epoch": 3730} {"train_loss": -6.829558372497559, "global_step": 156698, "epoch": 3730} {"train_loss": -6.862200736999512, "global_step": 156699, "epoch": 3730} {"train_loss": -6.897405624389648, "global_step": 156700, "epoch": 3730} {"train_loss": -6.902933325086321, "global_step": 156701, "epoch": 3730, "val_loss": 79071.7421875} {"train_loss": -6.985470294952393, "global_step": 156702, "epoch": 3731} {"train_loss": -6.905605316162109, "global_step": 156703, "epoch": 3731} {"train_loss": -6.861225605010986, "global_step": 156704, "epoch": 3731} {"train_loss": -6.882510185241699, "global_step": 156705, "epoch": 3731} {"train_loss": -6.892403602600098, "global_step": 156706, "epoch": 3731} {"train_loss": -6.782163619995117, "global_step": 156707, "epoch": 3731} {"train_loss": -6.798990249633789, "global_step": 156708, "epoch": 3731} {"train_loss": -6.7063751220703125, "global_step": 156709, "epoch": 3731} {"train_loss": -6.98192024230957, "global_step": 156710, "epoch": 3731} {"train_loss": -6.808663368225098, "global_step": 156711, "epoch": 3731} {"train_loss": -6.851365089416504, "global_step": 156712, "epoch": 3731} {"train_loss": -6.855144500732422, "global_step": 156713, "epoch": 3731} {"train_loss": -6.73932409286499, "global_step": 156714, "epoch": 3731} {"train_loss": -6.787945747375488, "global_step": 156715, "epoch": 3731} {"train_loss": -6.759588241577148, "global_step": 156716, "epoch": 3731} {"train_loss": -6.925772666931152, "global_step": 156717, "epoch": 3731} {"train_loss": -6.696971893310547, "global_step": 156718, "epoch": 3731} {"train_loss": -6.774828910827637, "global_step": 156719, "epoch": 3731} {"train_loss": -6.659074783325195, "global_step": 156720, "epoch": 3731} {"train_loss": -6.8221893310546875, "global_step": 156721, "epoch": 3731} {"train_loss": -6.707531929016113, "global_step": 156722, "epoch": 3731} {"train_loss": -6.918468475341797, "global_step": 156723, "epoch": 3731} {"train_loss": -6.7964067459106445, "global_step": 156724, "epoch": 3731} {"train_loss": -6.838469505310059, "global_step": 156725, "epoch": 3731} {"train_loss": -6.818399429321289, "global_step": 156726, "epoch": 3731} {"train_loss": -6.766258239746094, "global_step": 156727, "epoch": 3731} {"train_loss": -6.814820289611816, "global_step": 156728, "epoch": 3731} {"train_loss": -6.797933101654053, "global_step": 156729, "epoch": 3731} {"train_loss": -6.8344855308532715, "global_step": 156730, "epoch": 3731} {"train_loss": -6.844512462615967, "global_step": 156731, "epoch": 3731} {"train_loss": -6.978153228759766, "global_step": 156732, "epoch": 3731} {"train_loss": -6.839426040649414, "global_step": 156733, "epoch": 3731} {"train_loss": -6.862090110778809, "global_step": 156734, "epoch": 3731} {"train_loss": -6.8581037521362305, "global_step": 156735, "epoch": 3731} {"train_loss": -6.798670768737793, "global_step": 156736, "epoch": 3731} {"train_loss": -6.932908058166504, "global_step": 156737, "epoch": 3731} {"train_loss": -6.969206809997559, "global_step": 156738, "epoch": 3731} {"train_loss": -6.925042629241943, "global_step": 156739, "epoch": 3731} {"train_loss": -6.853410243988037, "global_step": 156740, "epoch": 3731} {"train_loss": -6.943478584289551, "global_step": 156741, "epoch": 3731} {"train_loss": -7.018150329589844, "global_step": 156742, "epoch": 3731} {"train_loss": -6.843963577633812, "global_step": 156743, "epoch": 3731, "val_loss": 79088.5859375} {"train_loss": -6.97132682800293, "global_step": 156744, "epoch": 3732} {"train_loss": -6.935678005218506, "global_step": 156745, "epoch": 3732} {"train_loss": -6.9965715408325195, "global_step": 156746, "epoch": 3732} {"train_loss": -6.9846649169921875, "global_step": 156747, "epoch": 3732} {"train_loss": -6.833920478820801, "global_step": 156748, "epoch": 3732} {"train_loss": -7.016760349273682, "global_step": 156749, "epoch": 3732} {"train_loss": -6.900666236877441, "global_step": 156750, "epoch": 3732} {"train_loss": -6.9154744148254395, "global_step": 156751, "epoch": 3732} {"train_loss": -6.984528541564941, "global_step": 156752, "epoch": 3732} {"train_loss": -6.985237121582031, "global_step": 156753, "epoch": 3732} {"train_loss": -7.072389602661133, "global_step": 156754, "epoch": 3732} {"train_loss": -6.826995372772217, "global_step": 156755, "epoch": 3732} {"train_loss": -7.012054920196533, "global_step": 156756, "epoch": 3732} {"train_loss": -6.954529285430908, "global_step": 156757, "epoch": 3732} {"train_loss": -6.93109130859375, "global_step": 156758, "epoch": 3732} {"train_loss": -6.750320911407471, "global_step": 156759, "epoch": 3732} {"train_loss": -6.829326629638672, "global_step": 156760, "epoch": 3732} {"train_loss": -6.950423717498779, "global_step": 156761, "epoch": 3732} {"train_loss": -6.997997283935547, "global_step": 156762, "epoch": 3732} {"train_loss": -7.016349792480469, "global_step": 156763, "epoch": 3732} {"train_loss": -6.89786958694458, "global_step": 156764, "epoch": 3732} {"train_loss": -6.814474105834961, "global_step": 156765, "epoch": 3732} {"train_loss": -6.866235733032227, "global_step": 156766, "epoch": 3732} {"train_loss": -6.937664031982422, "global_step": 156767, "epoch": 3732} {"train_loss": -6.883333206176758, "global_step": 156768, "epoch": 3732} {"train_loss": -6.962430953979492, "global_step": 156769, "epoch": 3732} {"train_loss": -6.847273826599121, "global_step": 156770, "epoch": 3732} {"train_loss": -6.922063827514648, "global_step": 156771, "epoch": 3732} {"train_loss": -6.965268135070801, "global_step": 156772, "epoch": 3732} {"train_loss": -6.899055004119873, "global_step": 156773, "epoch": 3732} {"train_loss": -6.9857401847839355, "global_step": 156774, "epoch": 3732} {"train_loss": -6.897124290466309, "global_step": 156775, "epoch": 3732} {"train_loss": -6.9534711837768555, "global_step": 156776, "epoch": 3732} {"train_loss": -6.941993713378906, "global_step": 156777, "epoch": 3732} {"train_loss": -6.908203125, "global_step": 156778, "epoch": 3732} {"train_loss": -6.897780418395996, "global_step": 156779, "epoch": 3732} {"train_loss": -6.998429298400879, "global_step": 156780, "epoch": 3732} {"train_loss": -6.904086112976074, "global_step": 156781, "epoch": 3732} {"train_loss": -6.928428649902344, "global_step": 156782, "epoch": 3732} {"train_loss": -6.944319725036621, "global_step": 156783, "epoch": 3732} {"train_loss": -7.00450325012207, "global_step": 156784, "epoch": 3732} {"train_loss": -6.935518821080525, "global_step": 156785, "epoch": 3732, "val_loss": 79161.859375} {"train_loss": -7.062723159790039, "global_step": 156786, "epoch": 3733} {"train_loss": -6.923423767089844, "global_step": 156787, "epoch": 3733} {"train_loss": -6.95255184173584, "global_step": 156788, "epoch": 3733} {"train_loss": -7.051093101501465, "global_step": 156789, "epoch": 3733} {"train_loss": -7.059591293334961, "global_step": 156790, "epoch": 3733} {"train_loss": -7.0772905349731445, "global_step": 156791, "epoch": 3733} {"train_loss": -7.06468391418457, "global_step": 156792, "epoch": 3733} {"train_loss": -6.958436489105225, "global_step": 156793, "epoch": 3733} {"train_loss": -6.908595085144043, "global_step": 156794, "epoch": 3733} {"train_loss": -7.002076148986816, "global_step": 156795, "epoch": 3733} {"train_loss": -7.034544944763184, "global_step": 156796, "epoch": 3733} {"train_loss": -7.00642204284668, "global_step": 156797, "epoch": 3733} {"train_loss": -6.93596076965332, "global_step": 156798, "epoch": 3733} {"train_loss": -6.865166664123535, "global_step": 156799, "epoch": 3733} {"train_loss": -6.866539001464844, "global_step": 156800, "epoch": 3733} {"train_loss": -6.95646858215332, "global_step": 156801, "epoch": 3733} {"train_loss": -6.902487277984619, "global_step": 156802, "epoch": 3733} {"train_loss": -6.911224842071533, "global_step": 156803, "epoch": 3733} {"train_loss": -6.811468124389648, "global_step": 156804, "epoch": 3733} {"train_loss": -6.90962028503418, "global_step": 156805, "epoch": 3733} {"train_loss": -6.738936424255371, "global_step": 156806, "epoch": 3733} {"train_loss": -6.667477607727051, "global_step": 156807, "epoch": 3733} {"train_loss": -6.9562883377075195, "global_step": 156808, "epoch": 3733} {"train_loss": -6.823825359344482, "global_step": 156809, "epoch": 3733} {"train_loss": -6.790842533111572, "global_step": 156810, "epoch": 3733} {"train_loss": -6.9420599937438965, "global_step": 156811, "epoch": 3733} {"train_loss": -6.721945285797119, "global_step": 156812, "epoch": 3733} {"train_loss": -6.917325496673584, "global_step": 156813, "epoch": 3733} {"train_loss": -6.875400543212891, "global_step": 156814, "epoch": 3733} {"train_loss": -6.909832000732422, "global_step": 156815, "epoch": 3733} {"train_loss": -6.973869323730469, "global_step": 156816, "epoch": 3733} {"train_loss": -6.863952159881592, "global_step": 156817, "epoch": 3733} {"train_loss": -6.942487716674805, "global_step": 156818, "epoch": 3733} {"train_loss": -6.91066312789917, "global_step": 156819, "epoch": 3733} {"train_loss": -6.971470355987549, "global_step": 156820, "epoch": 3733} {"train_loss": -6.988773822784424, "global_step": 156821, "epoch": 3733} {"train_loss": -6.96897029876709, "global_step": 156822, "epoch": 3733} {"train_loss": -6.952145576477051, "global_step": 156823, "epoch": 3733} {"train_loss": -6.935266494750977, "global_step": 156824, "epoch": 3733} {"train_loss": -6.879734992980957, "global_step": 156825, "epoch": 3733} {"train_loss": -7.014455795288086, "global_step": 156826, "epoch": 3733} {"train_loss": -6.928787503923688, "global_step": 156827, "epoch": 3733, "val_loss": 79117.6875} {"train_loss": -7.008639335632324, "global_step": 156828, "epoch": 3734} {"train_loss": -6.930758476257324, "global_step": 156829, "epoch": 3734} {"train_loss": -6.98190450668335, "global_step": 156830, "epoch": 3734} {"train_loss": -6.937696933746338, "global_step": 156831, "epoch": 3734} {"train_loss": -6.980385780334473, "global_step": 156832, "epoch": 3734} {"train_loss": -7.009103775024414, "global_step": 156833, "epoch": 3734} {"train_loss": -6.937939167022705, "global_step": 156834, "epoch": 3734} {"train_loss": -6.9744720458984375, "global_step": 156835, "epoch": 3734} {"train_loss": -6.945418357849121, "global_step": 156836, "epoch": 3734} {"train_loss": -7.011375427246094, "global_step": 156837, "epoch": 3734} {"train_loss": -6.960249423980713, "global_step": 156838, "epoch": 3734} {"train_loss": -6.916587829589844, "global_step": 156839, "epoch": 3734} {"train_loss": -6.835238456726074, "global_step": 156840, "epoch": 3734} {"train_loss": -6.992621421813965, "global_step": 156841, "epoch": 3734} {"train_loss": -7.072590351104736, "global_step": 156842, "epoch": 3734} {"train_loss": -6.980348110198975, "global_step": 156843, "epoch": 3734} {"train_loss": -6.880270481109619, "global_step": 156844, "epoch": 3734} {"train_loss": -6.965520858764648, "global_step": 156845, "epoch": 3734} {"train_loss": -6.990617752075195, "global_step": 156846, "epoch": 3734} {"train_loss": -7.015669822692871, "global_step": 156847, "epoch": 3734} {"train_loss": -7.015470504760742, "global_step": 156848, "epoch": 3734} {"train_loss": -6.921625137329102, "global_step": 156849, "epoch": 3734} {"train_loss": -7.0318098068237305, "global_step": 156850, "epoch": 3734} {"train_loss": -7.067407131195068, "global_step": 156851, "epoch": 3734} {"train_loss": -6.900994300842285, "global_step": 156852, "epoch": 3734} {"train_loss": -6.920289039611816, "global_step": 156853, "epoch": 3734} {"train_loss": -7.013576507568359, "global_step": 156854, "epoch": 3734} {"train_loss": -7.117849349975586, "global_step": 156855, "epoch": 3734} {"train_loss": -6.902775287628174, "global_step": 156856, "epoch": 3734} {"train_loss": -7.018622875213623, "global_step": 156857, "epoch": 3734} {"train_loss": -6.968494415283203, "global_step": 156858, "epoch": 3734} {"train_loss": -6.863051891326904, "global_step": 156859, "epoch": 3734} {"train_loss": -6.910625457763672, "global_step": 156860, "epoch": 3734} {"train_loss": -6.949124336242676, "global_step": 156861, "epoch": 3734} {"train_loss": -6.74269962310791, "global_step": 156862, "epoch": 3734} {"train_loss": -6.8459553718566895, "global_step": 156863, "epoch": 3734} {"train_loss": -6.968997955322266, "global_step": 156864, "epoch": 3734} {"train_loss": -6.801375389099121, "global_step": 156865, "epoch": 3734} {"train_loss": -6.750395774841309, "global_step": 156866, "epoch": 3734} {"train_loss": -7.010526657104492, "global_step": 156867, "epoch": 3734} {"train_loss": -6.879763603210449, "global_step": 156868, "epoch": 3734} {"train_loss": -6.946219955171857, "global_step": 156869, "epoch": 3734, "val_loss": 79013.9609375} {"train_loss": -6.903439044952393, "global_step": 156870, "epoch": 3735} {"train_loss": -6.837493896484375, "global_step": 156871, "epoch": 3735} {"train_loss": -6.944537162780762, "global_step": 156872, "epoch": 3735} {"train_loss": -6.8270978927612305, "global_step": 156873, "epoch": 3735} {"train_loss": -6.959394454956055, "global_step": 156874, "epoch": 3735} {"train_loss": -6.903526306152344, "global_step": 156875, "epoch": 3735} {"train_loss": -6.900453090667725, "global_step": 156876, "epoch": 3735} {"train_loss": -6.982925891876221, "global_step": 156877, "epoch": 3735} {"train_loss": -6.958063125610352, "global_step": 156878, "epoch": 3735} {"train_loss": -6.889505386352539, "global_step": 156879, "epoch": 3735} {"train_loss": -6.936769485473633, "global_step": 156880, "epoch": 3735} {"train_loss": -6.893404006958008, "global_step": 156881, "epoch": 3735} {"train_loss": -6.850350379943848, "global_step": 156882, "epoch": 3735} {"train_loss": -7.001038074493408, "global_step": 156883, "epoch": 3735} {"train_loss": -6.94611930847168, "global_step": 156884, "epoch": 3735} {"train_loss": -6.857152462005615, "global_step": 156885, "epoch": 3735} {"train_loss": -6.907359600067139, "global_step": 156886, "epoch": 3735} {"train_loss": -7.020041465759277, "global_step": 156887, "epoch": 3735} {"train_loss": -6.879524230957031, "global_step": 156888, "epoch": 3735} {"train_loss": -6.932595729827881, "global_step": 156889, "epoch": 3735} {"train_loss": -7.022320747375488, "global_step": 156890, "epoch": 3735} {"train_loss": -6.903224945068359, "global_step": 156891, "epoch": 3735} {"train_loss": -6.919938087463379, "global_step": 156892, "epoch": 3735} {"train_loss": -6.884601593017578, "global_step": 156893, "epoch": 3735} {"train_loss": -6.816676139831543, "global_step": 156894, "epoch": 3735} {"train_loss": -6.885847091674805, "global_step": 156895, "epoch": 3735} {"train_loss": -6.964485168457031, "global_step": 156896, "epoch": 3735} {"train_loss": -6.925868988037109, "global_step": 156897, "epoch": 3735} {"train_loss": -6.907237529754639, "global_step": 156898, "epoch": 3735} {"train_loss": -6.839810371398926, "global_step": 156899, "epoch": 3735} {"train_loss": -6.856867790222168, "global_step": 156900, "epoch": 3735} {"train_loss": -6.891907691955566, "global_step": 156901, "epoch": 3735} {"train_loss": -7.001451015472412, "global_step": 156902, "epoch": 3735} {"train_loss": -6.957859992980957, "global_step": 156903, "epoch": 3735} {"train_loss": -7.040069103240967, "global_step": 156904, "epoch": 3735} {"train_loss": -6.779102802276611, "global_step": 156905, "epoch": 3735} {"train_loss": -6.862068176269531, "global_step": 156906, "epoch": 3735} {"train_loss": -6.9768524169921875, "global_step": 156907, "epoch": 3735} {"train_loss": -6.834277153015137, "global_step": 156908, "epoch": 3735} {"train_loss": -6.9086151123046875, "global_step": 156909, "epoch": 3735} {"train_loss": -6.908759117126465, "global_step": 156910, "epoch": 3735} {"train_loss": -6.910221985408238, "global_step": 156911, "epoch": 3735, "val_loss": 79220.765625} {"train_loss": -6.898153781890869, "global_step": 156912, "epoch": 3736} {"train_loss": -6.882754325866699, "global_step": 156913, "epoch": 3736} {"train_loss": -6.910397052764893, "global_step": 156914, "epoch": 3736} {"train_loss": -7.016674995422363, "global_step": 156915, "epoch": 3736} {"train_loss": -6.917654991149902, "global_step": 156916, "epoch": 3736} {"train_loss": -6.852636337280273, "global_step": 156917, "epoch": 3736} {"train_loss": -6.934025764465332, "global_step": 156918, "epoch": 3736} {"train_loss": -6.989565849304199, "global_step": 156919, "epoch": 3736} {"train_loss": -6.963193893432617, "global_step": 156920, "epoch": 3736} {"train_loss": -6.8550004959106445, "global_step": 156921, "epoch": 3736} {"train_loss": -7.074479579925537, "global_step": 156922, "epoch": 3736} {"train_loss": -7.003020286560059, "global_step": 156923, "epoch": 3736} {"train_loss": -6.934206485748291, "global_step": 156924, "epoch": 3736} {"train_loss": -6.969522476196289, "global_step": 156925, "epoch": 3736} {"train_loss": -7.007452487945557, "global_step": 156926, "epoch": 3736} {"train_loss": -7.0091962814331055, "global_step": 156927, "epoch": 3736} {"train_loss": -6.98649787902832, "global_step": 156928, "epoch": 3736} {"train_loss": -6.977763652801514, "global_step": 156929, "epoch": 3736} {"train_loss": -6.9185357093811035, "global_step": 156930, "epoch": 3736} {"train_loss": -6.93652868270874, "global_step": 156931, "epoch": 3736} {"train_loss": -6.9674458503723145, "global_step": 156932, "epoch": 3736} {"train_loss": -6.897188186645508, "global_step": 156933, "epoch": 3736} {"train_loss": -6.967970848083496, "global_step": 156934, "epoch": 3736} {"train_loss": -7.003591537475586, "global_step": 156935, "epoch": 3736} {"train_loss": -6.958558082580566, "global_step": 156936, "epoch": 3736} {"train_loss": -6.9482221603393555, "global_step": 156937, "epoch": 3736} {"train_loss": -6.92856502532959, "global_step": 156938, "epoch": 3736} {"train_loss": -6.990870475769043, "global_step": 156939, "epoch": 3736} {"train_loss": -6.934709548950195, "global_step": 156940, "epoch": 3736} {"train_loss": -7.0086669921875, "global_step": 156941, "epoch": 3736} {"train_loss": -7.0085673332214355, "global_step": 156942, "epoch": 3736} {"train_loss": -6.825039863586426, "global_step": 156943, "epoch": 3736} {"train_loss": -6.993897914886475, "global_step": 156944, "epoch": 3736} {"train_loss": -6.856719970703125, "global_step": 156945, "epoch": 3736} {"train_loss": -6.867462158203125, "global_step": 156946, "epoch": 3736} {"train_loss": -6.87192440032959, "global_step": 156947, "epoch": 3736} {"train_loss": -6.794833183288574, "global_step": 156948, "epoch": 3736} {"train_loss": -6.802700519561768, "global_step": 156949, "epoch": 3736} {"train_loss": -6.885721683502197, "global_step": 156950, "epoch": 3736} {"train_loss": -6.876188278198242, "global_step": 156951, "epoch": 3736} {"train_loss": -6.791781425476074, "global_step": 156952, "epoch": 3736} {"train_loss": -6.931203342619396, "global_step": 156953, "epoch": 3736, "val_loss": 79168.78125} {"train_loss": -6.807764053344727, "global_step": 156954, "epoch": 3737} {"train_loss": -6.824106216430664, "global_step": 156955, "epoch": 3737} {"train_loss": -6.849274635314941, "global_step": 156956, "epoch": 3737} {"train_loss": -6.911437034606934, "global_step": 156957, "epoch": 3737} {"train_loss": -6.9611077308654785, "global_step": 156958, "epoch": 3737} {"train_loss": -6.7443952560424805, "global_step": 156959, "epoch": 3737} {"train_loss": -6.907597064971924, "global_step": 156960, "epoch": 3737} {"train_loss": -6.94943904876709, "global_step": 156961, "epoch": 3737} {"train_loss": -6.848419189453125, "global_step": 156962, "epoch": 3737} {"train_loss": -6.892404556274414, "global_step": 156963, "epoch": 3737} {"train_loss": -6.915818214416504, "global_step": 156964, "epoch": 3737} {"train_loss": -6.878120422363281, "global_step": 156965, "epoch": 3737} {"train_loss": -6.98691463470459, "global_step": 156966, "epoch": 3737} {"train_loss": -6.977634906768799, "global_step": 156967, "epoch": 3737} {"train_loss": -6.998512268066406, "global_step": 156968, "epoch": 3737} {"train_loss": -7.021301746368408, "global_step": 156969, "epoch": 3737} {"train_loss": -6.823463439941406, "global_step": 156970, "epoch": 3737} {"train_loss": -6.89340353012085, "global_step": 156971, "epoch": 3737} {"train_loss": -7.039575576782227, "global_step": 156972, "epoch": 3737} {"train_loss": -6.827396392822266, "global_step": 156973, "epoch": 3737} {"train_loss": -6.979060173034668, "global_step": 156974, "epoch": 3737} {"train_loss": -7.008942604064941, "global_step": 156975, "epoch": 3737} {"train_loss": -6.932818412780762, "global_step": 156976, "epoch": 3737} {"train_loss": -6.9641218185424805, "global_step": 156977, "epoch": 3737} {"train_loss": -6.910507678985596, "global_step": 156978, "epoch": 3737} {"train_loss": -6.8105292320251465, "global_step": 156979, "epoch": 3737} {"train_loss": -6.941503524780273, "global_step": 156980, "epoch": 3737} {"train_loss": -7.003486633300781, "global_step": 156981, "epoch": 3737} {"train_loss": -6.785346508026123, "global_step": 156982, "epoch": 3737} {"train_loss": -6.922861099243164, "global_step": 156983, "epoch": 3737} {"train_loss": -6.968520641326904, "global_step": 156984, "epoch": 3737} {"train_loss": -6.862799644470215, "global_step": 156985, "epoch": 3737} {"train_loss": -6.973496437072754, "global_step": 156986, "epoch": 3737} {"train_loss": -6.975687503814697, "global_step": 156987, "epoch": 3737} {"train_loss": -6.888995170593262, "global_step": 156988, "epoch": 3737} {"train_loss": -6.900426864624023, "global_step": 156989, "epoch": 3737} {"train_loss": -7.025450706481934, "global_step": 156990, "epoch": 3737} {"train_loss": -6.898631572723389, "global_step": 156991, "epoch": 3737} {"train_loss": -7.076178550720215, "global_step": 156992, "epoch": 3737} {"train_loss": -6.801401138305664, "global_step": 156993, "epoch": 3737} {"train_loss": -6.95634651184082, "global_step": 156994, "epoch": 3737} {"train_loss": -6.923117444628761, "global_step": 156995, "epoch": 3737, "val_loss": 78970.5390625} {"train_loss": -7.117734909057617, "global_step": 156996, "epoch": 3738} {"train_loss": -6.928229808807373, "global_step": 156997, "epoch": 3738} {"train_loss": -6.901522636413574, "global_step": 156998, "epoch": 3738} {"train_loss": -7.016334533691406, "global_step": 156999, "epoch": 3738} {"train_loss": -6.863115310668945, "global_step": 157000, "epoch": 3738} {"train_loss": -6.980228900909424, "global_step": 157001, "epoch": 3738} {"train_loss": -6.887866020202637, "global_step": 157002, "epoch": 3738} {"train_loss": -7.095422744750977, "global_step": 157003, "epoch": 3738} {"train_loss": -6.967975616455078, "global_step": 157004, "epoch": 3738} {"train_loss": -6.937034606933594, "global_step": 157005, "epoch": 3738} {"train_loss": -7.081932544708252, "global_step": 157006, "epoch": 3738} {"train_loss": -6.794561386108398, "global_step": 157007, "epoch": 3738} {"train_loss": -6.988103866577148, "global_step": 157008, "epoch": 3738} {"train_loss": -7.010876655578613, "global_step": 157009, "epoch": 3738} {"train_loss": -7.02711296081543, "global_step": 157010, "epoch": 3738} {"train_loss": -6.805216312408447, "global_step": 157011, "epoch": 3738} {"train_loss": -6.966170310974121, "global_step": 157012, "epoch": 3738} {"train_loss": -6.946150779724121, "global_step": 157013, "epoch": 3738} {"train_loss": -6.91976261138916, "global_step": 157014, "epoch": 3738} {"train_loss": -6.849093437194824, "global_step": 157015, "epoch": 3738} {"train_loss": -6.783872604370117, "global_step": 157016, "epoch": 3738} {"train_loss": -6.804694652557373, "global_step": 157017, "epoch": 3738} {"train_loss": -6.9362945556640625, "global_step": 157018, "epoch": 3738} {"train_loss": -6.853058815002441, "global_step": 157019, "epoch": 3738} {"train_loss": -6.5855841636657715, "global_step": 157020, "epoch": 3738} {"train_loss": -6.665679931640625, "global_step": 157021, "epoch": 3738} {"train_loss": -6.641745567321777, "global_step": 157022, "epoch": 3738} {"train_loss": -6.731609344482422, "global_step": 157023, "epoch": 3738} {"train_loss": -6.843378067016602, "global_step": 157024, "epoch": 3738} {"train_loss": -6.547666072845459, "global_step": 157025, "epoch": 3738} {"train_loss": -6.869375705718994, "global_step": 157026, "epoch": 3738} {"train_loss": -6.655797004699707, "global_step": 157027, "epoch": 3738} {"train_loss": -6.70413875579834, "global_step": 157028, "epoch": 3738} {"train_loss": -6.598482131958008, "global_step": 157029, "epoch": 3738} {"train_loss": -6.887535572052002, "global_step": 157030, "epoch": 3738} {"train_loss": -6.771510124206543, "global_step": 157031, "epoch": 3738} {"train_loss": -6.731417655944824, "global_step": 157032, "epoch": 3738} {"train_loss": -6.768894195556641, "global_step": 157033, "epoch": 3738} {"train_loss": -6.706441879272461, "global_step": 157034, "epoch": 3738} {"train_loss": -6.792071342468262, "global_step": 157035, "epoch": 3738} {"train_loss": -6.703216552734375, "global_step": 157036, "epoch": 3738} {"train_loss": -6.844023250398182, "global_step": 157037, "epoch": 3738, "val_loss": 79004.265625} {"train_loss": -6.752976417541504, "global_step": 157038, "epoch": 3739} {"train_loss": -6.869367599487305, "global_step": 157039, "epoch": 3739} {"train_loss": -6.872464179992676, "global_step": 157040, "epoch": 3739} {"train_loss": -6.781310081481934, "global_step": 157041, "epoch": 3739} {"train_loss": -6.950723648071289, "global_step": 157042, "epoch": 3739} {"train_loss": -6.818872451782227, "global_step": 157043, "epoch": 3739} {"train_loss": -6.876270294189453, "global_step": 157044, "epoch": 3739} {"train_loss": -6.891228199005127, "global_step": 157045, "epoch": 3739} {"train_loss": -6.792240142822266, "global_step": 157046, "epoch": 3739} {"train_loss": -6.902606010437012, "global_step": 157047, "epoch": 3739} {"train_loss": -6.854513168334961, "global_step": 157048, "epoch": 3739} {"train_loss": -6.903743743896484, "global_step": 157049, "epoch": 3739} {"train_loss": -7.01182746887207, "global_step": 157050, "epoch": 3739} {"train_loss": -6.832115173339844, "global_step": 157051, "epoch": 3739} {"train_loss": -6.883973121643066, "global_step": 157052, "epoch": 3739} {"train_loss": -6.927350044250488, "global_step": 157053, "epoch": 3739} {"train_loss": -6.8516316413879395, "global_step": 157054, "epoch": 3739} {"train_loss": -6.97569465637207, "global_step": 157055, "epoch": 3739} {"train_loss": -7.062539100646973, "global_step": 157056, "epoch": 3739} {"train_loss": -6.914403438568115, "global_step": 157057, "epoch": 3739} {"train_loss": -6.839437007904053, "global_step": 157058, "epoch": 3739} {"train_loss": -6.997593402862549, "global_step": 157059, "epoch": 3739} {"train_loss": -6.951783180236816, "global_step": 157060, "epoch": 3739} {"train_loss": -6.821698188781738, "global_step": 157061, "epoch": 3739} {"train_loss": -6.883430004119873, "global_step": 157062, "epoch": 3739} {"train_loss": -6.762801170349121, "global_step": 157063, "epoch": 3739} {"train_loss": -6.9235944747924805, "global_step": 157064, "epoch": 3739} {"train_loss": -6.888235569000244, "global_step": 157065, "epoch": 3739} {"train_loss": -6.900575160980225, "global_step": 157066, "epoch": 3739} {"train_loss": -6.72266960144043, "global_step": 157067, "epoch": 3739} {"train_loss": -6.905519485473633, "global_step": 157068, "epoch": 3739} {"train_loss": -6.918508529663086, "global_step": 157069, "epoch": 3739} {"train_loss": -6.947867393493652, "global_step": 157070, "epoch": 3739} {"train_loss": -6.956035137176514, "global_step": 157071, "epoch": 3739} {"train_loss": -6.853374481201172, "global_step": 157072, "epoch": 3739} {"train_loss": -6.923337936401367, "global_step": 157073, "epoch": 3739} {"train_loss": -6.889507293701172, "global_step": 157074, "epoch": 3739} {"train_loss": -6.895124912261963, "global_step": 157075, "epoch": 3739} {"train_loss": -6.800440311431885, "global_step": 157076, "epoch": 3739} {"train_loss": -6.900535583496094, "global_step": 157077, "epoch": 3739} {"train_loss": -6.848158836364746, "global_step": 157078, "epoch": 3739} {"train_loss": -6.884675695782616, "global_step": 157079, "epoch": 3739, "val_loss": 78869.5546875} {"train_loss": -6.873638153076172, "global_step": 157080, "epoch": 3740} {"train_loss": -6.9813337326049805, "global_step": 157081, "epoch": 3740} {"train_loss": -6.927369117736816, "global_step": 157082, "epoch": 3740} {"train_loss": -6.87076473236084, "global_step": 157083, "epoch": 3740} {"train_loss": -6.988525867462158, "global_step": 157084, "epoch": 3740} {"train_loss": -7.010124206542969, "global_step": 157085, "epoch": 3740} {"train_loss": -6.781589508056641, "global_step": 157086, "epoch": 3740} {"train_loss": -6.8424272537231445, "global_step": 157087, "epoch": 3740} {"train_loss": -6.78521728515625, "global_step": 157088, "epoch": 3740} {"train_loss": -6.902768611907959, "global_step": 157089, "epoch": 3740} {"train_loss": -6.768782615661621, "global_step": 157090, "epoch": 3740} {"train_loss": -6.792755603790283, "global_step": 157091, "epoch": 3740} {"train_loss": -6.89523983001709, "global_step": 157092, "epoch": 3740} {"train_loss": -6.7572712898254395, "global_step": 157093, "epoch": 3740} {"train_loss": -6.903061866760254, "global_step": 157094, "epoch": 3740} {"train_loss": -6.651745319366455, "global_step": 157095, "epoch": 3740} {"train_loss": -6.91890811920166, "global_step": 157096, "epoch": 3740} {"train_loss": -6.935959815979004, "global_step": 157097, "epoch": 3740} {"train_loss": -6.948330879211426, "global_step": 157098, "epoch": 3740} {"train_loss": -6.895691394805908, "global_step": 157099, "epoch": 3740} {"train_loss": -6.840412139892578, "global_step": 157100, "epoch": 3740} {"train_loss": -6.931799411773682, "global_step": 157101, "epoch": 3740} {"train_loss": -6.842277526855469, "global_step": 157102, "epoch": 3740} {"train_loss": -6.96060848236084, "global_step": 157103, "epoch": 3740} {"train_loss": -6.932919502258301, "global_step": 157104, "epoch": 3740} {"train_loss": -6.816984176635742, "global_step": 157105, "epoch": 3740} {"train_loss": -6.968325614929199, "global_step": 157106, "epoch": 3740} {"train_loss": -6.904760360717773, "global_step": 157107, "epoch": 3740} {"train_loss": -6.900720119476318, "global_step": 157108, "epoch": 3740} {"train_loss": -6.890288829803467, "global_step": 157109, "epoch": 3740} {"train_loss": -6.846363544464111, "global_step": 157110, "epoch": 3740} {"train_loss": -6.965368270874023, "global_step": 157111, "epoch": 3740} {"train_loss": -6.930141925811768, "global_step": 157112, "epoch": 3740} {"train_loss": -6.983514785766602, "global_step": 157113, "epoch": 3740} {"train_loss": -6.815177917480469, "global_step": 157114, "epoch": 3740} {"train_loss": -6.889538288116455, "global_step": 157115, "epoch": 3740} {"train_loss": -6.879730224609375, "global_step": 157116, "epoch": 3740} {"train_loss": -6.881879806518555, "global_step": 157117, "epoch": 3740} {"train_loss": -7.014487266540527, "global_step": 157118, "epoch": 3740} {"train_loss": -6.976727485656738, "global_step": 157119, "epoch": 3740} {"train_loss": -6.975754261016846, "global_step": 157120, "epoch": 3740} {"train_loss": -6.892559267225719, "global_step": 157121, "epoch": 3740, "val_loss": 79111.75} {"train_loss": -6.886554718017578, "global_step": 157122, "epoch": 3741} {"train_loss": -6.907984733581543, "global_step": 157123, "epoch": 3741} {"train_loss": -6.8842315673828125, "global_step": 157124, "epoch": 3741} {"train_loss": -6.897980213165283, "global_step": 157125, "epoch": 3741} {"train_loss": -7.025101661682129, "global_step": 157126, "epoch": 3741} {"train_loss": -6.835684776306152, "global_step": 157127, "epoch": 3741} {"train_loss": -7.001460075378418, "global_step": 157128, "epoch": 3741} {"train_loss": -6.972900867462158, "global_step": 157129, "epoch": 3741} {"train_loss": -6.894387245178223, "global_step": 157130, "epoch": 3741} {"train_loss": -7.034690856933594, "global_step": 157131, "epoch": 3741} {"train_loss": -6.8211774826049805, "global_step": 157132, "epoch": 3741} {"train_loss": -6.838980674743652, "global_step": 157133, "epoch": 3741} {"train_loss": -6.9749956130981445, "global_step": 157134, "epoch": 3741} {"train_loss": -6.974699020385742, "global_step": 157135, "epoch": 3741} {"train_loss": -7.004406929016113, "global_step": 157136, "epoch": 3741} {"train_loss": -7.0288777351379395, "global_step": 157137, "epoch": 3741} {"train_loss": -6.937352180480957, "global_step": 157138, "epoch": 3741} {"train_loss": -7.067124366760254, "global_step": 157139, "epoch": 3741} {"train_loss": -6.84714937210083, "global_step": 157140, "epoch": 3741} {"train_loss": -6.872700214385986, "global_step": 157141, "epoch": 3741} {"train_loss": -7.046597480773926, "global_step": 157142, "epoch": 3741} {"train_loss": -6.914495468139648, "global_step": 157143, "epoch": 3741} {"train_loss": -6.968390464782715, "global_step": 157144, "epoch": 3741} {"train_loss": -6.994713306427002, "global_step": 157145, "epoch": 3741} {"train_loss": -6.915257453918457, "global_step": 157146, "epoch": 3741} {"train_loss": -7.001440048217773, "global_step": 157147, "epoch": 3741} {"train_loss": -6.922738075256348, "global_step": 157148, "epoch": 3741} {"train_loss": -6.879277229309082, "global_step": 157149, "epoch": 3741} {"train_loss": -7.029813766479492, "global_step": 157150, "epoch": 3741} {"train_loss": -6.973110675811768, "global_step": 157151, "epoch": 3741} {"train_loss": -6.968818187713623, "global_step": 157152, "epoch": 3741} {"train_loss": -6.911167621612549, "global_step": 157153, "epoch": 3741} {"train_loss": -6.9831085205078125, "global_step": 157154, "epoch": 3741} {"train_loss": -6.915360927581787, "global_step": 157155, "epoch": 3741} {"train_loss": -6.9376630783081055, "global_step": 157156, "epoch": 3741} {"train_loss": -6.922804832458496, "global_step": 157157, "epoch": 3741} {"train_loss": -6.975386142730713, "global_step": 157158, "epoch": 3741} {"train_loss": -6.936509132385254, "global_step": 157159, "epoch": 3741} {"train_loss": -6.912128448486328, "global_step": 157160, "epoch": 3741} {"train_loss": -6.904699325561523, "global_step": 157161, "epoch": 3741} {"train_loss": -6.9357075691223145, "global_step": 157162, "epoch": 3741} {"train_loss": -6.942620504470098, "global_step": 157163, "epoch": 3741, "val_loss": 79278.6875} {"train_loss": -6.939910888671875, "global_step": 157164, "epoch": 3742} {"train_loss": -6.9082932472229, "global_step": 157165, "epoch": 3742} {"train_loss": -6.8866071701049805, "global_step": 157166, "epoch": 3742} {"train_loss": -6.949820518493652, "global_step": 157167, "epoch": 3742} {"train_loss": -6.935605049133301, "global_step": 157168, "epoch": 3742} {"train_loss": -6.983483791351318, "global_step": 157169, "epoch": 3742} {"train_loss": -6.980331897735596, "global_step": 157170, "epoch": 3742} {"train_loss": -6.958779811859131, "global_step": 157171, "epoch": 3742} {"train_loss": -6.944741249084473, "global_step": 157172, "epoch": 3742} {"train_loss": -6.849951267242432, "global_step": 157173, "epoch": 3742} {"train_loss": -6.91007661819458, "global_step": 157174, "epoch": 3742} {"train_loss": -6.719791412353516, "global_step": 157175, "epoch": 3742} {"train_loss": -7.055178642272949, "global_step": 157176, "epoch": 3742} {"train_loss": -6.947171688079834, "global_step": 157177, "epoch": 3742} {"train_loss": -6.789799690246582, "global_step": 157178, "epoch": 3742} {"train_loss": -6.8270111083984375, "global_step": 157179, "epoch": 3742} {"train_loss": -6.833600997924805, "global_step": 157180, "epoch": 3742} {"train_loss": -6.83133602142334, "global_step": 157181, "epoch": 3742} {"train_loss": -6.84604549407959, "global_step": 157182, "epoch": 3742} {"train_loss": -6.886784553527832, "global_step": 157183, "epoch": 3742} {"train_loss": -6.9123382568359375, "global_step": 157184, "epoch": 3742} {"train_loss": -6.840890407562256, "global_step": 157185, "epoch": 3742} {"train_loss": -6.953423976898193, "global_step": 157186, "epoch": 3742} {"train_loss": -7.015011310577393, "global_step": 157187, "epoch": 3742} {"train_loss": -6.82247257232666, "global_step": 157188, "epoch": 3742} {"train_loss": -6.918595314025879, "global_step": 157189, "epoch": 3742} {"train_loss": -6.900272846221924, "global_step": 157190, "epoch": 3742} {"train_loss": -6.919370651245117, "global_step": 157191, "epoch": 3742} {"train_loss": -7.052639007568359, "global_step": 157192, "epoch": 3742} {"train_loss": -6.9271769523620605, "global_step": 157193, "epoch": 3742} {"train_loss": -6.873812198638916, "global_step": 157194, "epoch": 3742} {"train_loss": -6.9095869064331055, "global_step": 157195, "epoch": 3742} {"train_loss": -6.92820405960083, "global_step": 157196, "epoch": 3742} {"train_loss": -6.841555118560791, "global_step": 157197, "epoch": 3742} {"train_loss": -7.002658367156982, "global_step": 157198, "epoch": 3742} {"train_loss": -6.844085693359375, "global_step": 157199, "epoch": 3742} {"train_loss": -6.8948516845703125, "global_step": 157200, "epoch": 3742} {"train_loss": -7.051485538482666, "global_step": 157201, "epoch": 3742} {"train_loss": -6.9825005531311035, "global_step": 157202, "epoch": 3742} {"train_loss": -6.973609924316406, "global_step": 157203, "epoch": 3742} {"train_loss": -6.967885971069336, "global_step": 157204, "epoch": 3742} {"train_loss": -6.91330835932777, "global_step": 157205, "epoch": 3742, "val_loss": 79024.0546875} {"train_loss": -7.069716453552246, "global_step": 157206, "epoch": 3743} {"train_loss": -6.9391350746154785, "global_step": 157207, "epoch": 3743} {"train_loss": -6.93195915222168, "global_step": 157208, "epoch": 3743} {"train_loss": -6.946694374084473, "global_step": 157209, "epoch": 3743} {"train_loss": -6.883060932159424, "global_step": 157210, "epoch": 3743} {"train_loss": -6.942988395690918, "global_step": 157211, "epoch": 3743} {"train_loss": -7.05167293548584, "global_step": 157212, "epoch": 3743} {"train_loss": -6.915042877197266, "global_step": 157213, "epoch": 3743} {"train_loss": -6.935713291168213, "global_step": 157214, "epoch": 3743} {"train_loss": -6.923035621643066, "global_step": 157215, "epoch": 3743} {"train_loss": -6.842431545257568, "global_step": 157216, "epoch": 3743} {"train_loss": -6.90927791595459, "global_step": 157217, "epoch": 3743} {"train_loss": -7.050541877746582, "global_step": 157218, "epoch": 3743} {"train_loss": -6.985478401184082, "global_step": 157219, "epoch": 3743} {"train_loss": -6.820057392120361, "global_step": 157220, "epoch": 3743} {"train_loss": -6.920932769775391, "global_step": 157221, "epoch": 3743} {"train_loss": -6.995597839355469, "global_step": 157222, "epoch": 3743} {"train_loss": -6.938417434692383, "global_step": 157223, "epoch": 3743} {"train_loss": -6.989880561828613, "global_step": 157224, "epoch": 3743} {"train_loss": -7.034107208251953, "global_step": 157225, "epoch": 3743} {"train_loss": -7.036016464233398, "global_step": 157226, "epoch": 3743} {"train_loss": -6.9442830085754395, "global_step": 157227, "epoch": 3743} {"train_loss": -6.992508888244629, "global_step": 157228, "epoch": 3743} {"train_loss": -6.884623050689697, "global_step": 157229, "epoch": 3743} {"train_loss": -7.022982597351074, "global_step": 157230, "epoch": 3743} {"train_loss": -6.980517387390137, "global_step": 157231, "epoch": 3743} {"train_loss": -7.013354301452637, "global_step": 157232, "epoch": 3743} {"train_loss": -6.903061866760254, "global_step": 157233, "epoch": 3743} {"train_loss": -7.007475852966309, "global_step": 157234, "epoch": 3743} {"train_loss": -7.046683311462402, "global_step": 157235, "epoch": 3743} {"train_loss": -6.905298709869385, "global_step": 157236, "epoch": 3743} {"train_loss": -6.938072204589844, "global_step": 157237, "epoch": 3743} {"train_loss": -6.935602188110352, "global_step": 157238, "epoch": 3743} {"train_loss": -6.865062713623047, "global_step": 157239, "epoch": 3743} {"train_loss": -7.075843811035156, "global_step": 157240, "epoch": 3743} {"train_loss": -7.045232772827148, "global_step": 157241, "epoch": 3743} {"train_loss": -6.902063846588135, "global_step": 157242, "epoch": 3743} {"train_loss": -7.002238750457764, "global_step": 157243, "epoch": 3743} {"train_loss": -6.964387893676758, "global_step": 157244, "epoch": 3743} {"train_loss": -6.956071853637695, "global_step": 157245, "epoch": 3743} {"train_loss": -6.957828521728516, "global_step": 157246, "epoch": 3743} {"train_loss": -6.963217156273978, "global_step": 157247, "epoch": 3743, "val_loss": 78938.453125} {"train_loss": -6.900494575500488, "global_step": 157248, "epoch": 3744} {"train_loss": -6.982968807220459, "global_step": 157249, "epoch": 3744} {"train_loss": -7.024750709533691, "global_step": 157250, "epoch": 3744} {"train_loss": -6.823732852935791, "global_step": 157251, "epoch": 3744} {"train_loss": -6.881783485412598, "global_step": 157252, "epoch": 3744} {"train_loss": -6.975628852844238, "global_step": 157253, "epoch": 3744} {"train_loss": -6.846146583557129, "global_step": 157254, "epoch": 3744} {"train_loss": -6.949461460113525, "global_step": 157255, "epoch": 3744} {"train_loss": -6.758279800415039, "global_step": 157256, "epoch": 3744} {"train_loss": -6.83229923248291, "global_step": 157257, "epoch": 3744} {"train_loss": -6.952532768249512, "global_step": 157258, "epoch": 3744} {"train_loss": -6.937897205352783, "global_step": 157259, "epoch": 3744} {"train_loss": -6.859423637390137, "global_step": 157260, "epoch": 3744} {"train_loss": -6.921195030212402, "global_step": 157261, "epoch": 3744} {"train_loss": -6.8709821701049805, "global_step": 157262, "epoch": 3744} {"train_loss": -6.952086448669434, "global_step": 157263, "epoch": 3744} {"train_loss": -6.931526184082031, "global_step": 157264, "epoch": 3744} {"train_loss": -6.864298343658447, "global_step": 157265, "epoch": 3744} {"train_loss": -6.8552961349487305, "global_step": 157266, "epoch": 3744} {"train_loss": -6.79373836517334, "global_step": 157267, "epoch": 3744} {"train_loss": -6.9557600021362305, "global_step": 157268, "epoch": 3744} {"train_loss": -6.871364593505859, "global_step": 157269, "epoch": 3744} {"train_loss": -6.911219596862793, "global_step": 157270, "epoch": 3744} {"train_loss": -6.912257194519043, "global_step": 157271, "epoch": 3744} {"train_loss": -7.012961387634277, "global_step": 157272, "epoch": 3744} {"train_loss": -6.940136909484863, "global_step": 157273, "epoch": 3744} {"train_loss": -7.041093349456787, "global_step": 157274, "epoch": 3744} {"train_loss": -6.9850664138793945, "global_step": 157275, "epoch": 3744} {"train_loss": -6.96359920501709, "global_step": 157276, "epoch": 3744} {"train_loss": -6.944578170776367, "global_step": 157277, "epoch": 3744} {"train_loss": -7.049193382263184, "global_step": 157278, "epoch": 3744} {"train_loss": -6.894385814666748, "global_step": 157279, "epoch": 3744} {"train_loss": -6.838217258453369, "global_step": 157280, "epoch": 3744} {"train_loss": -6.937411785125732, "global_step": 157281, "epoch": 3744} {"train_loss": -6.894718647003174, "global_step": 157282, "epoch": 3744} {"train_loss": -6.886913299560547, "global_step": 157283, "epoch": 3744} {"train_loss": -6.91771125793457, "global_step": 157284, "epoch": 3744} {"train_loss": -6.795940399169922, "global_step": 157285, "epoch": 3744} {"train_loss": -6.815468788146973, "global_step": 157286, "epoch": 3744} {"train_loss": -6.830108642578125, "global_step": 157287, "epoch": 3744} {"train_loss": -6.850005149841309, "global_step": 157288, "epoch": 3744} {"train_loss": -6.908673127492269, "global_step": 157289, "epoch": 3744, "val_loss": 79168.6796875} {"train_loss": -6.972886085510254, "global_step": 157290, "epoch": 3745} {"train_loss": -6.965744495391846, "global_step": 157291, "epoch": 3745} {"train_loss": -6.931497097015381, "global_step": 157292, "epoch": 3745} {"train_loss": -6.908220291137695, "global_step": 157293, "epoch": 3745} {"train_loss": -6.944537162780762, "global_step": 157294, "epoch": 3745} {"train_loss": -6.921874523162842, "global_step": 157295, "epoch": 3745} {"train_loss": -6.932153701782227, "global_step": 157296, "epoch": 3745} {"train_loss": -6.943298816680908, "global_step": 157297, "epoch": 3745} {"train_loss": -7.0055623054504395, "global_step": 157298, "epoch": 3745} {"train_loss": -6.937929630279541, "global_step": 157299, "epoch": 3745} {"train_loss": -6.888443946838379, "global_step": 157300, "epoch": 3745} {"train_loss": -6.874505043029785, "global_step": 157301, "epoch": 3745} {"train_loss": -6.956306457519531, "global_step": 157302, "epoch": 3745} {"train_loss": -6.9471635818481445, "global_step": 157303, "epoch": 3745} {"train_loss": -6.866067886352539, "global_step": 157304, "epoch": 3745} {"train_loss": -6.890101909637451, "global_step": 157305, "epoch": 3745} {"train_loss": -7.045029640197754, "global_step": 157306, "epoch": 3745} {"train_loss": -6.876500129699707, "global_step": 157307, "epoch": 3745} {"train_loss": -6.8888654708862305, "global_step": 157308, "epoch": 3745} {"train_loss": -6.776386260986328, "global_step": 157309, "epoch": 3745} {"train_loss": -6.8677568435668945, "global_step": 157310, "epoch": 3745} {"train_loss": -6.883464813232422, "global_step": 157311, "epoch": 3745} {"train_loss": -6.892791748046875, "global_step": 157312, "epoch": 3745} {"train_loss": -6.9637274742126465, "global_step": 157313, "epoch": 3745} {"train_loss": -6.990325450897217, "global_step": 157314, "epoch": 3745} {"train_loss": -7.014822483062744, "global_step": 157315, "epoch": 3745} {"train_loss": -6.91878080368042, "global_step": 157316, "epoch": 3745} {"train_loss": -7.025330543518066, "global_step": 157317, "epoch": 3745} {"train_loss": -6.941709995269775, "global_step": 157318, "epoch": 3745} {"train_loss": -6.8236894607543945, "global_step": 157319, "epoch": 3745} {"train_loss": -6.835575103759766, "global_step": 157320, "epoch": 3745} {"train_loss": -6.810811519622803, "global_step": 157321, "epoch": 3745} {"train_loss": -6.803066730499268, "global_step": 157322, "epoch": 3745} {"train_loss": -6.940995216369629, "global_step": 157323, "epoch": 3745} {"train_loss": -6.952572822570801, "global_step": 157324, "epoch": 3745} {"train_loss": -6.810422897338867, "global_step": 157325, "epoch": 3745} {"train_loss": -6.827094554901123, "global_step": 157326, "epoch": 3745} {"train_loss": -6.827066898345947, "global_step": 157327, "epoch": 3745} {"train_loss": -6.899811744689941, "global_step": 157328, "epoch": 3745} {"train_loss": -6.935320854187012, "global_step": 157329, "epoch": 3745} {"train_loss": -6.857563018798828, "global_step": 157330, "epoch": 3745} {"train_loss": -6.911642699014573, "global_step": 157331, "epoch": 3745, "val_loss": 79173.234375} {"train_loss": -6.7371392250061035, "global_step": 157332, "epoch": 3746} {"train_loss": -6.878106117248535, "global_step": 157333, "epoch": 3746} {"train_loss": -6.981678009033203, "global_step": 157334, "epoch": 3746} {"train_loss": -6.857243537902832, "global_step": 157335, "epoch": 3746} {"train_loss": -6.943745136260986, "global_step": 157336, "epoch": 3746} {"train_loss": -6.988922595977783, "global_step": 157337, "epoch": 3746} {"train_loss": -7.038136959075928, "global_step": 157338, "epoch": 3746} {"train_loss": -6.981114387512207, "global_step": 157339, "epoch": 3746} {"train_loss": -7.0152387619018555, "global_step": 157340, "epoch": 3746} {"train_loss": -6.9067702293396, "global_step": 157341, "epoch": 3746} {"train_loss": -7.069466590881348, "global_step": 157342, "epoch": 3746} {"train_loss": -6.797328948974609, "global_step": 157343, "epoch": 3746} {"train_loss": -7.0988874435424805, "global_step": 157344, "epoch": 3746} {"train_loss": -6.9962477684021, "global_step": 157345, "epoch": 3746} {"train_loss": -6.99793815612793, "global_step": 157346, "epoch": 3746} {"train_loss": -7.046060085296631, "global_step": 157347, "epoch": 3746} {"train_loss": -6.964375019073486, "global_step": 157348, "epoch": 3746} {"train_loss": -7.064887046813965, "global_step": 157349, "epoch": 3746} {"train_loss": -6.996676445007324, "global_step": 157350, "epoch": 3746} {"train_loss": -7.001071929931641, "global_step": 157351, "epoch": 3746} {"train_loss": -6.935718059539795, "global_step": 157352, "epoch": 3746} {"train_loss": -6.968703746795654, "global_step": 157353, "epoch": 3746} {"train_loss": -6.8716630935668945, "global_step": 157354, "epoch": 3746} {"train_loss": -6.9109392166137695, "global_step": 157355, "epoch": 3746} {"train_loss": -6.902576923370361, "global_step": 157356, "epoch": 3746} {"train_loss": -6.8269548416137695, "global_step": 157357, "epoch": 3746} {"train_loss": -6.942503929138184, "global_step": 157358, "epoch": 3746} {"train_loss": -6.965422630310059, "global_step": 157359, "epoch": 3746} {"train_loss": -6.90856409072876, "global_step": 157360, "epoch": 3746} {"train_loss": -6.855658531188965, "global_step": 157361, "epoch": 3746} {"train_loss": -6.65071964263916, "global_step": 157362, "epoch": 3746} {"train_loss": -6.929287433624268, "global_step": 157363, "epoch": 3746} {"train_loss": -6.674197673797607, "global_step": 157364, "epoch": 3746} {"train_loss": -6.846834659576416, "global_step": 157365, "epoch": 3746} {"train_loss": -6.822521209716797, "global_step": 157366, "epoch": 3746} {"train_loss": -6.733889579772949, "global_step": 157367, "epoch": 3746} {"train_loss": -6.742283821105957, "global_step": 157368, "epoch": 3746} {"train_loss": -6.871247291564941, "global_step": 157369, "epoch": 3746} {"train_loss": -6.898796558380127, "global_step": 157370, "epoch": 3746} {"train_loss": -6.838464260101318, "global_step": 157371, "epoch": 3746} {"train_loss": -6.840428829193115, "global_step": 157372, "epoch": 3746} {"train_loss": -6.909682114919026, "global_step": 157373, "epoch": 3746, "val_loss": 79063.0625} {"train_loss": -6.771570205688477, "global_step": 157374, "epoch": 3747} {"train_loss": -6.969005584716797, "global_step": 157375, "epoch": 3747} {"train_loss": -6.913947105407715, "global_step": 157376, "epoch": 3747} {"train_loss": -6.679028511047363, "global_step": 157377, "epoch": 3747} {"train_loss": -6.772810935974121, "global_step": 157378, "epoch": 3747} {"train_loss": -6.84929895401001, "global_step": 157379, "epoch": 3747} {"train_loss": -6.784574031829834, "global_step": 157380, "epoch": 3747} {"train_loss": -6.849067687988281, "global_step": 157381, "epoch": 3747} {"train_loss": -6.799612998962402, "global_step": 157382, "epoch": 3747} {"train_loss": -6.804503917694092, "global_step": 157383, "epoch": 3747} {"train_loss": -6.879359245300293, "global_step": 157384, "epoch": 3747} {"train_loss": -6.90673828125, "global_step": 157385, "epoch": 3747} {"train_loss": -6.712059020996094, "global_step": 157386, "epoch": 3747} {"train_loss": -6.990193843841553, "global_step": 157387, "epoch": 3747} {"train_loss": -6.8154473304748535, "global_step": 157388, "epoch": 3747} {"train_loss": -6.640092849731445, "global_step": 157389, "epoch": 3747} {"train_loss": -6.973608016967773, "global_step": 157390, "epoch": 3747} {"train_loss": -6.764815807342529, "global_step": 157391, "epoch": 3747} {"train_loss": -6.79939079284668, "global_step": 157392, "epoch": 3747} {"train_loss": -6.9772562980651855, "global_step": 157393, "epoch": 3747} {"train_loss": -6.836696624755859, "global_step": 157394, "epoch": 3747} {"train_loss": -7.009407043457031, "global_step": 157395, "epoch": 3747} {"train_loss": -6.84316349029541, "global_step": 157396, "epoch": 3747} {"train_loss": -6.749386787414551, "global_step": 157397, "epoch": 3747} {"train_loss": -6.803081512451172, "global_step": 157398, "epoch": 3747} {"train_loss": -6.857384204864502, "global_step": 157399, "epoch": 3747} {"train_loss": -6.815907955169678, "global_step": 157400, "epoch": 3747} {"train_loss": -6.873751163482666, "global_step": 157401, "epoch": 3747} {"train_loss": -6.828653812408447, "global_step": 157402, "epoch": 3747} {"train_loss": -6.822979927062988, "global_step": 157403, "epoch": 3747} {"train_loss": -6.9645891189575195, "global_step": 157404, "epoch": 3747} {"train_loss": -6.800173759460449, "global_step": 157405, "epoch": 3747} {"train_loss": -7.013666152954102, "global_step": 157406, "epoch": 3747} {"train_loss": -6.928375720977783, "global_step": 157407, "epoch": 3747} {"train_loss": -6.854424953460693, "global_step": 157408, "epoch": 3747} {"train_loss": -6.944704055786133, "global_step": 157409, "epoch": 3747} {"train_loss": -6.933568954467773, "global_step": 157410, "epoch": 3747} {"train_loss": -6.967073917388916, "global_step": 157411, "epoch": 3747} {"train_loss": -6.86468505859375, "global_step": 157412, "epoch": 3747} {"train_loss": -6.926910400390625, "global_step": 157413, "epoch": 3747} {"train_loss": -7.013866424560547, "global_step": 157414, "epoch": 3747} {"train_loss": -6.862188850130353, "global_step": 157415, "epoch": 3747, "val_loss": 79271.8515625} {"train_loss": -6.933536529541016, "global_step": 157416, "epoch": 3748} {"train_loss": -6.960291385650635, "global_step": 157417, "epoch": 3748} {"train_loss": -6.950418949127197, "global_step": 157418, "epoch": 3748} {"train_loss": -7.039209365844727, "global_step": 157419, "epoch": 3748} {"train_loss": -6.869165897369385, "global_step": 157420, "epoch": 3748} {"train_loss": -6.930526256561279, "global_step": 157421, "epoch": 3748} {"train_loss": -7.003241539001465, "global_step": 157422, "epoch": 3748} {"train_loss": -6.943495750427246, "global_step": 157423, "epoch": 3748} {"train_loss": -6.966603755950928, "global_step": 157424, "epoch": 3748} {"train_loss": -6.962170600891113, "global_step": 157425, "epoch": 3748} {"train_loss": -6.937932968139648, "global_step": 157426, "epoch": 3748} {"train_loss": -6.927044868469238, "global_step": 157427, "epoch": 3748} {"train_loss": -7.004639625549316, "global_step": 157428, "epoch": 3748} {"train_loss": -6.996655464172363, "global_step": 157429, "epoch": 3748} {"train_loss": -6.9167561531066895, "global_step": 157430, "epoch": 3748} {"train_loss": -7.150629997253418, "global_step": 157431, "epoch": 3748} {"train_loss": -7.104753017425537, "global_step": 157432, "epoch": 3748} {"train_loss": -6.948738098144531, "global_step": 157433, "epoch": 3748} {"train_loss": -6.891161918640137, "global_step": 157434, "epoch": 3748} {"train_loss": -7.053729057312012, "global_step": 157435, "epoch": 3748} {"train_loss": -7.027285575866699, "global_step": 157436, "epoch": 3748} {"train_loss": -6.982605457305908, "global_step": 157437, "epoch": 3748} {"train_loss": -6.975856304168701, "global_step": 157438, "epoch": 3748} {"train_loss": -7.010503768920898, "global_step": 157439, "epoch": 3748} {"train_loss": -6.8564348220825195, "global_step": 157440, "epoch": 3748} {"train_loss": -6.905562400817871, "global_step": 157441, "epoch": 3748} {"train_loss": -6.896636009216309, "global_step": 157442, "epoch": 3748} {"train_loss": -6.9882378578186035, "global_step": 157443, "epoch": 3748} {"train_loss": -6.966155052185059, "global_step": 157444, "epoch": 3748} {"train_loss": -6.957669734954834, "global_step": 157445, "epoch": 3748} {"train_loss": -6.9897613525390625, "global_step": 157446, "epoch": 3748} {"train_loss": -7.001519203186035, "global_step": 157447, "epoch": 3748} {"train_loss": -7.02829647064209, "global_step": 157448, "epoch": 3748} {"train_loss": -7.012970924377441, "global_step": 157449, "epoch": 3748} {"train_loss": -6.96689510345459, "global_step": 157450, "epoch": 3748} {"train_loss": -6.973012924194336, "global_step": 157451, "epoch": 3748} {"train_loss": -6.880990982055664, "global_step": 157452, "epoch": 3748} {"train_loss": -7.018850326538086, "global_step": 157453, "epoch": 3748} {"train_loss": -6.9511637687683105, "global_step": 157454, "epoch": 3748} {"train_loss": -6.850734710693359, "global_step": 157455, "epoch": 3748} {"train_loss": -6.931831359863281, "global_step": 157456, "epoch": 3748} {"train_loss": -6.9687601044064476, "global_step": 157457, "epoch": 3748, "val_loss": 79341.0546875} {"train_loss": -7.020421981811523, "global_step": 157458, "epoch": 3749} {"train_loss": -6.847761154174805, "global_step": 157459, "epoch": 3749} {"train_loss": -6.976894378662109, "global_step": 157460, "epoch": 3749} {"train_loss": -7.000082969665527, "global_step": 157461, "epoch": 3749} {"train_loss": -6.934300422668457, "global_step": 157462, "epoch": 3749} {"train_loss": -6.9340105056762695, "global_step": 157463, "epoch": 3749} {"train_loss": -6.953261852264404, "global_step": 157464, "epoch": 3749} {"train_loss": -6.98953914642334, "global_step": 157465, "epoch": 3749} {"train_loss": -6.901300430297852, "global_step": 157466, "epoch": 3749} {"train_loss": -6.999368667602539, "global_step": 157467, "epoch": 3749} {"train_loss": -6.99302864074707, "global_step": 157468, "epoch": 3749} {"train_loss": -6.847672462463379, "global_step": 157469, "epoch": 3749} {"train_loss": -6.960695266723633, "global_step": 157470, "epoch": 3749} {"train_loss": -6.800893783569336, "global_step": 157471, "epoch": 3749} {"train_loss": -6.941042423248291, "global_step": 157472, "epoch": 3749} {"train_loss": -6.921944618225098, "global_step": 157473, "epoch": 3749} {"train_loss": -6.891391754150391, "global_step": 157474, "epoch": 3749} {"train_loss": -7.018980026245117, "global_step": 157475, "epoch": 3749} {"train_loss": -6.925807952880859, "global_step": 157476, "epoch": 3749} {"train_loss": -6.99130916595459, "global_step": 157477, "epoch": 3749} {"train_loss": -6.996551513671875, "global_step": 157478, "epoch": 3749} {"train_loss": -6.916201591491699, "global_step": 157479, "epoch": 3749} {"train_loss": -6.965723514556885, "global_step": 157480, "epoch": 3749} {"train_loss": -6.9217987060546875, "global_step": 157481, "epoch": 3749} {"train_loss": -6.928215980529785, "global_step": 157482, "epoch": 3749} {"train_loss": -6.872852325439453, "global_step": 157483, "epoch": 3749} {"train_loss": -7.041975021362305, "global_step": 157484, "epoch": 3749} {"train_loss": -7.097536087036133, "global_step": 157485, "epoch": 3749} {"train_loss": -6.985359191894531, "global_step": 157486, "epoch": 3749} {"train_loss": -6.9125776290893555, "global_step": 157487, "epoch": 3749} {"train_loss": -6.930791854858398, "global_step": 157488, "epoch": 3749} {"train_loss": -6.941595077514648, "global_step": 157489, "epoch": 3749} {"train_loss": -6.94513463973999, "global_step": 157490, "epoch": 3749} {"train_loss": -6.921273708343506, "global_step": 157491, "epoch": 3749} {"train_loss": -6.847747802734375, "global_step": 157492, "epoch": 3749} {"train_loss": -6.8562726974487305, "global_step": 157493, "epoch": 3749} {"train_loss": -6.974653244018555, "global_step": 157494, "epoch": 3749} {"train_loss": -7.039989471435547, "global_step": 157495, "epoch": 3749} {"train_loss": -6.903467655181885, "global_step": 157496, "epoch": 3749} {"train_loss": -7.004603385925293, "global_step": 157497, "epoch": 3749} {"train_loss": -6.955296993255615, "global_step": 157498, "epoch": 3749} {"train_loss": -6.947731199718657, "global_step": 157499, "epoch": 3749, "val_loss": 79431.859375} {"train_loss": -6.925054550170898, "global_step": 157500, "epoch": 3750} {"train_loss": -6.920375823974609, "global_step": 157501, "epoch": 3750} {"train_loss": -6.914361476898193, "global_step": 157502, "epoch": 3750} {"train_loss": -6.911327362060547, "global_step": 157503, "epoch": 3750} {"train_loss": -6.912765026092529, "global_step": 157504, "epoch": 3750} {"train_loss": -6.938357830047607, "global_step": 157505, "epoch": 3750} {"train_loss": -6.945115089416504, "global_step": 157506, "epoch": 3750} {"train_loss": -6.848804473876953, "global_step": 157507, "epoch": 3750} {"train_loss": -6.883147239685059, "global_step": 157508, "epoch": 3750} {"train_loss": -6.767088890075684, "global_step": 157509, "epoch": 3750} {"train_loss": -6.980590343475342, "global_step": 157510, "epoch": 3750} {"train_loss": -6.732633590698242, "global_step": 157511, "epoch": 3750} {"train_loss": -6.843425750732422, "global_step": 157512, "epoch": 3750} {"train_loss": -6.938381195068359, "global_step": 157513, "epoch": 3750} {"train_loss": -6.8107805252075195, "global_step": 157514, "epoch": 3750} {"train_loss": -6.826981067657471, "global_step": 157515, "epoch": 3750} {"train_loss": -6.912076950073242, "global_step": 157516, "epoch": 3750} {"train_loss": -6.836484909057617, "global_step": 157517, "epoch": 3750} {"train_loss": -6.893733978271484, "global_step": 157518, "epoch": 3750} {"train_loss": -6.917331695556641, "global_step": 157519, "epoch": 3750} {"train_loss": -6.857139587402344, "global_step": 157520, "epoch": 3750} {"train_loss": -6.797656059265137, "global_step": 157521, "epoch": 3750} {"train_loss": -6.94173002243042, "global_step": 157522, "epoch": 3750} {"train_loss": -6.801894187927246, "global_step": 157523, "epoch": 3750} {"train_loss": -6.7474517822265625, "global_step": 157524, "epoch": 3750} {"train_loss": -6.880091667175293, "global_step": 157525, "epoch": 3750} {"train_loss": -6.785950183868408, "global_step": 157526, "epoch": 3750} {"train_loss": -6.969293594360352, "global_step": 157527, "epoch": 3750} {"train_loss": -6.812982082366943, "global_step": 157528, "epoch": 3750} {"train_loss": -6.927785873413086, "global_step": 157529, "epoch": 3750} {"train_loss": -7.017210006713867, "global_step": 157530, "epoch": 3750} {"train_loss": -6.9842634201049805, "global_step": 157531, "epoch": 3750} {"train_loss": -6.8566365242004395, "global_step": 157532, "epoch": 3750} {"train_loss": -6.83980655670166, "global_step": 157533, "epoch": 3750} {"train_loss": -6.956265926361084, "global_step": 157534, "epoch": 3750} {"train_loss": -6.873639106750488, "global_step": 157535, "epoch": 3750} {"train_loss": -6.9421820640563965, "global_step": 157536, "epoch": 3750} {"train_loss": -7.019057273864746, "global_step": 157537, "epoch": 3750} {"train_loss": -6.963900566101074, "global_step": 157538, "epoch": 3750} {"train_loss": -6.8667120933532715, "global_step": 157539, "epoch": 3750} {"train_loss": -6.996547698974609, "global_step": 157540, "epoch": 3750} {"train_loss": -6.891791559401012, "global_step": 157541, "epoch": 3750, "train/sim_max_reward_0": 0.9004945418503182, "train/sim_max_reward_1": 0.88135258407441, "train/sim_max_reward_2": 0.5122510209298349, "train/sim_max_reward_3": 0.1271177118886611, "train/sim_max_reward_4": 0.30421820591606563, "train/sim_max_reward_5": 0.5615294522913116, "test/sim_max_reward_4500000": 0.8446619655267237, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9797719853567547, "test/sim_max_reward_4500003": 0.9922387357194741, "test/sim_max_reward_4500004": 0.1604553240669574, "test/sim_max_reward_4500005": 0.5445656324707092, "test/sim_max_reward_4500006": 0.915658112245788, "test/sim_max_reward_4500007": 0.994808003127845, "test/sim_max_reward_4500008": 0.3985716490083401, "test/sim_max_reward_4500009": 0.05332849793594213, "test/sim_max_reward_4500010": 0.05545401490636288, "test/sim_max_reward_4500011": 0.9730291292755361, "test/sim_max_reward_4500012": 0.9931295588687817, "test/sim_max_reward_4500013": 0.004521832131012125, "test/sim_max_reward_4500014": 0.9970495206223243, "test/sim_max_reward_4500015": 0.8535008736628085, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.05508209145558441, "test/sim_max_reward_4500018": 0.32526663263210026, "test/sim_max_reward_4500019": 0.9547207957863574, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.5520634787036366, "test/sim_max_reward_4500022": 0.999356444902266, "test/sim_max_reward_4500023": 0.8695050328486486, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.7300479143127028, "test/sim_max_reward_4500026": 0.9659112195640298, "test/sim_max_reward_4500027": 0.9610395988301746, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.06262892401150706, "test/sim_max_reward_4500030": 0.9810068316091294, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.7875370789012636, "test/sim_max_reward_4500034": 0.907409984889934, "test/sim_max_reward_4500035": 0.852801391607866, "test/sim_max_reward_4500036": 0.4067101713470536, "test/sim_max_reward_4500037": 0.9261433224420057, "test/sim_max_reward_4500038": 0.9669276885258206, "test/sim_max_reward_4500039": 0.867066504141787, "test/sim_max_reward_4500040": 0.9639773656947802, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.028506561700876575, "test/sim_max_reward_4500043": 0.9739620801964842, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.8568894810896565, "test/sim_max_reward_4500046": 0.1203116053124875, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5478272528251003, "test/mean_score": 0.5430057558506204, "val_loss": 79053.03125} {"train_loss": -6.914981365203857, "global_step": 157542, "epoch": 3751} {"train_loss": -6.916440963745117, "global_step": 157543, "epoch": 3751} {"train_loss": -7.0248212814331055, "global_step": 157544, "epoch": 3751} {"train_loss": -6.878549575805664, "global_step": 157545, "epoch": 3751} {"train_loss": -6.947441101074219, "global_step": 157546, "epoch": 3751} {"train_loss": -7.005005836486816, "global_step": 157547, "epoch": 3751} {"train_loss": -6.937561988830566, "global_step": 157548, "epoch": 3751} {"train_loss": -6.91148042678833, "global_step": 157549, "epoch": 3751} {"train_loss": -6.989428520202637, "global_step": 157550, "epoch": 3751} {"train_loss": -6.747620582580566, "global_step": 157551, "epoch": 3751} {"train_loss": -6.947696208953857, "global_step": 157552, "epoch": 3751} {"train_loss": -6.928008079528809, "global_step": 157553, "epoch": 3751} {"train_loss": -6.906983375549316, "global_step": 157554, "epoch": 3751} {"train_loss": -6.877923011779785, "global_step": 157555, "epoch": 3751} {"train_loss": -6.913390636444092, "global_step": 157556, "epoch": 3751} {"train_loss": -6.99738883972168, "global_step": 157557, "epoch": 3751} {"train_loss": -6.942795276641846, "global_step": 157558, "epoch": 3751} {"train_loss": -7.008811950683594, "global_step": 157559, "epoch": 3751} {"train_loss": -6.935476779937744, "global_step": 157560, "epoch": 3751} {"train_loss": -6.934622764587402, "global_step": 157561, "epoch": 3751} {"train_loss": -6.908625602722168, "global_step": 157562, "epoch": 3751} {"train_loss": -6.947323799133301, "global_step": 157563, "epoch": 3751} {"train_loss": -6.939981460571289, "global_step": 157564, "epoch": 3751} {"train_loss": -6.979308605194092, "global_step": 157565, "epoch": 3751} {"train_loss": -6.780168533325195, "global_step": 157566, "epoch": 3751} {"train_loss": -7.053720474243164, "global_step": 157567, "epoch": 3751} {"train_loss": -6.93626070022583, "global_step": 157568, "epoch": 3751} {"train_loss": -6.832046985626221, "global_step": 157569, "epoch": 3751} {"train_loss": -7.006179332733154, "global_step": 157570, "epoch": 3751} {"train_loss": -6.961160659790039, "global_step": 157571, "epoch": 3751} {"train_loss": -6.981800079345703, "global_step": 157572, "epoch": 3751} {"train_loss": -6.728316783905029, "global_step": 157573, "epoch": 3751} {"train_loss": -6.989077568054199, "global_step": 157574, "epoch": 3751} {"train_loss": -6.924571514129639, "global_step": 157575, "epoch": 3751} {"train_loss": -7.024904727935791, "global_step": 157576, "epoch": 3751} {"train_loss": -6.873249053955078, "global_step": 157577, "epoch": 3751} {"train_loss": -6.8871965408325195, "global_step": 157578, "epoch": 3751} {"train_loss": -7.002777099609375, "global_step": 157579, "epoch": 3751} {"train_loss": -7.017441749572754, "global_step": 157580, "epoch": 3751} {"train_loss": -6.848804950714111, "global_step": 157581, "epoch": 3751} {"train_loss": -6.881969451904297, "global_step": 157582, "epoch": 3751} {"train_loss": -6.930936722528367, "global_step": 157583, "epoch": 3751, "val_loss": 78904.90625} {"train_loss": -6.940845489501953, "global_step": 157584, "epoch": 3752} {"train_loss": -6.956911087036133, "global_step": 157585, "epoch": 3752} {"train_loss": -6.859058856964111, "global_step": 157586, "epoch": 3752} {"train_loss": -6.878328800201416, "global_step": 157587, "epoch": 3752} {"train_loss": -6.8993635177612305, "global_step": 157588, "epoch": 3752} {"train_loss": -6.880303859710693, "global_step": 157589, "epoch": 3752} {"train_loss": -6.8912353515625, "global_step": 157590, "epoch": 3752} {"train_loss": -6.955524444580078, "global_step": 157591, "epoch": 3752} {"train_loss": -7.042400360107422, "global_step": 157592, "epoch": 3752} {"train_loss": -6.937784671783447, "global_step": 157593, "epoch": 3752} {"train_loss": -7.033422470092773, "global_step": 157594, "epoch": 3752} {"train_loss": -6.993517875671387, "global_step": 157595, "epoch": 3752} {"train_loss": -6.985160827636719, "global_step": 157596, "epoch": 3752} {"train_loss": -6.944641590118408, "global_step": 157597, "epoch": 3752} {"train_loss": -6.908236503601074, "global_step": 157598, "epoch": 3752} {"train_loss": -6.983715534210205, "global_step": 157599, "epoch": 3752} {"train_loss": -6.910191535949707, "global_step": 157600, "epoch": 3752} {"train_loss": -6.988773345947266, "global_step": 157601, "epoch": 3752} {"train_loss": -6.9576826095581055, "global_step": 157602, "epoch": 3752} {"train_loss": -7.056568622589111, "global_step": 157603, "epoch": 3752} {"train_loss": -7.020216941833496, "global_step": 157604, "epoch": 3752} {"train_loss": -6.965040683746338, "global_step": 157605, "epoch": 3752} {"train_loss": -7.009324073791504, "global_step": 157606, "epoch": 3752} {"train_loss": -6.952201843261719, "global_step": 157607, "epoch": 3752} {"train_loss": -6.942522048950195, "global_step": 157608, "epoch": 3752} {"train_loss": -6.983029365539551, "global_step": 157609, "epoch": 3752} {"train_loss": -6.879110336303711, "global_step": 157610, "epoch": 3752} {"train_loss": -6.880542755126953, "global_step": 157611, "epoch": 3752} {"train_loss": -7.072345733642578, "global_step": 157612, "epoch": 3752} {"train_loss": -6.976102352142334, "global_step": 157613, "epoch": 3752} {"train_loss": -6.906635284423828, "global_step": 157614, "epoch": 3752} {"train_loss": -6.94965124130249, "global_step": 157615, "epoch": 3752} {"train_loss": -6.962240219116211, "global_step": 157616, "epoch": 3752} {"train_loss": -6.928275108337402, "global_step": 157617, "epoch": 3752} {"train_loss": -6.92902135848999, "global_step": 157618, "epoch": 3752} {"train_loss": -6.798661231994629, "global_step": 157619, "epoch": 3752} {"train_loss": -6.909050941467285, "global_step": 157620, "epoch": 3752} {"train_loss": -6.916380882263184, "global_step": 157621, "epoch": 3752} {"train_loss": -6.934447288513184, "global_step": 157622, "epoch": 3752} {"train_loss": -6.8403778076171875, "global_step": 157623, "epoch": 3752} {"train_loss": -6.994596481323242, "global_step": 157624, "epoch": 3752} {"train_loss": -6.947552192778814, "global_step": 157625, "epoch": 3752, "val_loss": 79085.1328125} {"train_loss": -6.943978309631348, "global_step": 157626, "epoch": 3753} {"train_loss": -7.021401405334473, "global_step": 157627, "epoch": 3753} {"train_loss": -6.888761520385742, "global_step": 157628, "epoch": 3753} {"train_loss": -6.885760307312012, "global_step": 157629, "epoch": 3753} {"train_loss": -6.923998832702637, "global_step": 157630, "epoch": 3753} {"train_loss": -6.897016525268555, "global_step": 157631, "epoch": 3753} {"train_loss": -6.958544731140137, "global_step": 157632, "epoch": 3753} {"train_loss": -7.020543575286865, "global_step": 157633, "epoch": 3753} {"train_loss": -6.979457855224609, "global_step": 157634, "epoch": 3753} {"train_loss": -6.876073837280273, "global_step": 157635, "epoch": 3753} {"train_loss": -6.979634761810303, "global_step": 157636, "epoch": 3753} {"train_loss": -6.909687042236328, "global_step": 157637, "epoch": 3753} {"train_loss": -6.868484973907471, "global_step": 157638, "epoch": 3753} {"train_loss": -7.001709461212158, "global_step": 157639, "epoch": 3753} {"train_loss": -7.031713485717773, "global_step": 157640, "epoch": 3753} {"train_loss": -7.085859298706055, "global_step": 157641, "epoch": 3753} {"train_loss": -6.882226943969727, "global_step": 157642, "epoch": 3753} {"train_loss": -7.071311950683594, "global_step": 157643, "epoch": 3753} {"train_loss": -6.8307318687438965, "global_step": 157644, "epoch": 3753} {"train_loss": -6.867656707763672, "global_step": 157645, "epoch": 3753} {"train_loss": -6.987941741943359, "global_step": 157646, "epoch": 3753} {"train_loss": -6.9069623947143555, "global_step": 157647, "epoch": 3753} {"train_loss": -7.0778398513793945, "global_step": 157648, "epoch": 3753} {"train_loss": -6.8990020751953125, "global_step": 157649, "epoch": 3753} {"train_loss": -6.8955769538879395, "global_step": 157650, "epoch": 3753} {"train_loss": -6.9384260177612305, "global_step": 157651, "epoch": 3753} {"train_loss": -6.871016025543213, "global_step": 157652, "epoch": 3753} {"train_loss": -6.9173736572265625, "global_step": 157653, "epoch": 3753} {"train_loss": -6.875572204589844, "global_step": 157654, "epoch": 3753} {"train_loss": -6.860655307769775, "global_step": 157655, "epoch": 3753} {"train_loss": -6.912893295288086, "global_step": 157656, "epoch": 3753} {"train_loss": -6.771457672119141, "global_step": 157657, "epoch": 3753} {"train_loss": -6.807582855224609, "global_step": 157658, "epoch": 3753} {"train_loss": -6.7908501625061035, "global_step": 157659, "epoch": 3753} {"train_loss": -6.926814079284668, "global_step": 157660, "epoch": 3753} {"train_loss": -6.919439315795898, "global_step": 157661, "epoch": 3753} {"train_loss": -6.946193695068359, "global_step": 157662, "epoch": 3753} {"train_loss": -6.962437629699707, "global_step": 157663, "epoch": 3753} {"train_loss": -6.9084367752075195, "global_step": 157664, "epoch": 3753} {"train_loss": -7.039412021636963, "global_step": 157665, "epoch": 3753} {"train_loss": -6.888288497924805, "global_step": 157666, "epoch": 3753} {"train_loss": -6.925153652826945, "global_step": 157667, "epoch": 3753, "val_loss": 78969.6953125} {"train_loss": -6.7838358879089355, "global_step": 157668, "epoch": 3754} {"train_loss": -6.857337951660156, "global_step": 157669, "epoch": 3754} {"train_loss": -6.917305946350098, "global_step": 157670, "epoch": 3754} {"train_loss": -6.95645809173584, "global_step": 157671, "epoch": 3754} {"train_loss": -6.790220260620117, "global_step": 157672, "epoch": 3754} {"train_loss": -6.811955451965332, "global_step": 157673, "epoch": 3754} {"train_loss": -6.902230262756348, "global_step": 157674, "epoch": 3754} {"train_loss": -6.785357475280762, "global_step": 157675, "epoch": 3754} {"train_loss": -6.767513275146484, "global_step": 157676, "epoch": 3754} {"train_loss": -6.874420642852783, "global_step": 157677, "epoch": 3754} {"train_loss": -6.908425331115723, "global_step": 157678, "epoch": 3754} {"train_loss": -6.8866286277771, "global_step": 157679, "epoch": 3754} {"train_loss": -6.947747230529785, "global_step": 157680, "epoch": 3754} {"train_loss": -6.906613826751709, "global_step": 157681, "epoch": 3754} {"train_loss": -6.8700971603393555, "global_step": 157682, "epoch": 3754} {"train_loss": -6.944345474243164, "global_step": 157683, "epoch": 3754} {"train_loss": -6.984865188598633, "global_step": 157684, "epoch": 3754} {"train_loss": -6.911904335021973, "global_step": 157685, "epoch": 3754} {"train_loss": -6.904029846191406, "global_step": 157686, "epoch": 3754} {"train_loss": -6.998706817626953, "global_step": 157687, "epoch": 3754} {"train_loss": -7.002536296844482, "global_step": 157688, "epoch": 3754} {"train_loss": -6.950501918792725, "global_step": 157689, "epoch": 3754} {"train_loss": -7.062390327453613, "global_step": 157690, "epoch": 3754} {"train_loss": -6.9456400871276855, "global_step": 157691, "epoch": 3754} {"train_loss": -6.860861778259277, "global_step": 157692, "epoch": 3754} {"train_loss": -6.958573818206787, "global_step": 157693, "epoch": 3754} {"train_loss": -6.688785552978516, "global_step": 157694, "epoch": 3754} {"train_loss": -6.817188739776611, "global_step": 157695, "epoch": 3754} {"train_loss": -6.953627109527588, "global_step": 157696, "epoch": 3754} {"train_loss": -6.667176246643066, "global_step": 157697, "epoch": 3754} {"train_loss": -6.892361640930176, "global_step": 157698, "epoch": 3754} {"train_loss": -6.850009918212891, "global_step": 157699, "epoch": 3754} {"train_loss": -6.806074619293213, "global_step": 157700, "epoch": 3754} {"train_loss": -6.897112846374512, "global_step": 157701, "epoch": 3754} {"train_loss": -6.784891128540039, "global_step": 157702, "epoch": 3754} {"train_loss": -6.884257793426514, "global_step": 157703, "epoch": 3754} {"train_loss": -6.842988014221191, "global_step": 157704, "epoch": 3754} {"train_loss": -6.951269149780273, "global_step": 157705, "epoch": 3754} {"train_loss": -6.930564880371094, "global_step": 157706, "epoch": 3754} {"train_loss": -6.895685195922852, "global_step": 157707, "epoch": 3754} {"train_loss": -7.0740227699279785, "global_step": 157708, "epoch": 3754} {"train_loss": -6.889547734033494, "global_step": 157709, "epoch": 3754, "val_loss": 79064.8984375} {"train_loss": -6.938093185424805, "global_step": 157710, "epoch": 3755} {"train_loss": -6.813284397125244, "global_step": 157711, "epoch": 3755} {"train_loss": -6.891798496246338, "global_step": 157712, "epoch": 3755} {"train_loss": -6.925322532653809, "global_step": 157713, "epoch": 3755} {"train_loss": -6.824372291564941, "global_step": 157714, "epoch": 3755} {"train_loss": -6.948667526245117, "global_step": 157715, "epoch": 3755} {"train_loss": -6.9057159423828125, "global_step": 157716, "epoch": 3755} {"train_loss": -6.920205116271973, "global_step": 157717, "epoch": 3755} {"train_loss": -6.907251358032227, "global_step": 157718, "epoch": 3755} {"train_loss": -6.801119327545166, "global_step": 157719, "epoch": 3755} {"train_loss": -7.041762828826904, "global_step": 157720, "epoch": 3755} {"train_loss": -6.889710903167725, "global_step": 157721, "epoch": 3755} {"train_loss": -6.939037322998047, "global_step": 157722, "epoch": 3755} {"train_loss": -6.827764511108398, "global_step": 157723, "epoch": 3755} {"train_loss": -6.89940071105957, "global_step": 157724, "epoch": 3755} {"train_loss": -6.984233856201172, "global_step": 157725, "epoch": 3755} {"train_loss": -6.916158676147461, "global_step": 157726, "epoch": 3755} {"train_loss": -6.911252498626709, "global_step": 157727, "epoch": 3755} {"train_loss": -6.848992824554443, "global_step": 157728, "epoch": 3755} {"train_loss": -6.901206970214844, "global_step": 157729, "epoch": 3755} {"train_loss": -6.818810939788818, "global_step": 157730, "epoch": 3755} {"train_loss": -6.900210857391357, "global_step": 157731, "epoch": 3755} {"train_loss": -6.892572402954102, "global_step": 157732, "epoch": 3755} {"train_loss": -6.989459991455078, "global_step": 157733, "epoch": 3755} {"train_loss": -6.732847213745117, "global_step": 157734, "epoch": 3755} {"train_loss": -6.959677696228027, "global_step": 157735, "epoch": 3755} {"train_loss": -6.83504056930542, "global_step": 157736, "epoch": 3755} {"train_loss": -6.829642295837402, "global_step": 157737, "epoch": 3755} {"train_loss": -7.004861831665039, "global_step": 157738, "epoch": 3755} {"train_loss": -6.934833526611328, "global_step": 157739, "epoch": 3755} {"train_loss": -6.915433883666992, "global_step": 157740, "epoch": 3755} {"train_loss": -6.878270149230957, "global_step": 157741, "epoch": 3755} {"train_loss": -6.898212909698486, "global_step": 157742, "epoch": 3755} {"train_loss": -6.911043167114258, "global_step": 157743, "epoch": 3755} {"train_loss": -6.930108547210693, "global_step": 157744, "epoch": 3755} {"train_loss": -6.983720779418945, "global_step": 157745, "epoch": 3755} {"train_loss": -6.906698226928711, "global_step": 157746, "epoch": 3755} {"train_loss": -6.958225250244141, "global_step": 157747, "epoch": 3755} {"train_loss": -6.745969295501709, "global_step": 157748, "epoch": 3755} {"train_loss": -6.999128341674805, "global_step": 157749, "epoch": 3755} {"train_loss": -6.860361576080322, "global_step": 157750, "epoch": 3755} {"train_loss": -6.903097005117507, "global_step": 157751, "epoch": 3755, "val_loss": 79179.8203125} {"train_loss": -6.999172210693359, "global_step": 157752, "epoch": 3756} {"train_loss": -6.915639400482178, "global_step": 157753, "epoch": 3756} {"train_loss": -6.888715744018555, "global_step": 157754, "epoch": 3756} {"train_loss": -7.036174297332764, "global_step": 157755, "epoch": 3756} {"train_loss": -6.921623706817627, "global_step": 157756, "epoch": 3756} {"train_loss": -7.064276218414307, "global_step": 157757, "epoch": 3756} {"train_loss": -6.883213043212891, "global_step": 157758, "epoch": 3756} {"train_loss": -6.893213272094727, "global_step": 157759, "epoch": 3756} {"train_loss": -6.972280502319336, "global_step": 157760, "epoch": 3756} {"train_loss": -6.944221019744873, "global_step": 157761, "epoch": 3756} {"train_loss": -6.8236284255981445, "global_step": 157762, "epoch": 3756} {"train_loss": -7.031682968139648, "global_step": 157763, "epoch": 3756} {"train_loss": -6.983131408691406, "global_step": 157764, "epoch": 3756} {"train_loss": -6.874157428741455, "global_step": 157765, "epoch": 3756} {"train_loss": -6.982591152191162, "global_step": 157766, "epoch": 3756} {"train_loss": -7.107453346252441, "global_step": 157767, "epoch": 3756} {"train_loss": -6.912337303161621, "global_step": 157768, "epoch": 3756} {"train_loss": -7.028677463531494, "global_step": 157769, "epoch": 3756} {"train_loss": -7.037136077880859, "global_step": 157770, "epoch": 3756} {"train_loss": -6.913504123687744, "global_step": 157771, "epoch": 3756} {"train_loss": -6.96203088760376, "global_step": 157772, "epoch": 3756} {"train_loss": -6.9504499435424805, "global_step": 157773, "epoch": 3756} {"train_loss": -6.909152984619141, "global_step": 157774, "epoch": 3756} {"train_loss": -6.937254905700684, "global_step": 157775, "epoch": 3756} {"train_loss": -6.839350700378418, "global_step": 157776, "epoch": 3756} {"train_loss": -6.766966819763184, "global_step": 157777, "epoch": 3756} {"train_loss": -6.8946356773376465, "global_step": 157778, "epoch": 3756} {"train_loss": -6.758942604064941, "global_step": 157779, "epoch": 3756} {"train_loss": -6.889298915863037, "global_step": 157780, "epoch": 3756} {"train_loss": -6.814770698547363, "global_step": 157781, "epoch": 3756} {"train_loss": -6.964038372039795, "global_step": 157782, "epoch": 3756} {"train_loss": -6.95505952835083, "global_step": 157783, "epoch": 3756} {"train_loss": -6.981476783752441, "global_step": 157784, "epoch": 3756} {"train_loss": -6.7759857177734375, "global_step": 157785, "epoch": 3756} {"train_loss": -6.946348190307617, "global_step": 157786, "epoch": 3756} {"train_loss": -6.872450828552246, "global_step": 157787, "epoch": 3756} {"train_loss": -6.878127098083496, "global_step": 157788, "epoch": 3756} {"train_loss": -7.0686259269714355, "global_step": 157789, "epoch": 3756} {"train_loss": -6.8561859130859375, "global_step": 157790, "epoch": 3756} {"train_loss": -6.984188079833984, "global_step": 157791, "epoch": 3756} {"train_loss": -6.86774206161499, "global_step": 157792, "epoch": 3756} {"train_loss": -6.92840119770595, "global_step": 157793, "epoch": 3756, "val_loss": 79188.8046875} {"train_loss": -6.756309986114502, "global_step": 157794, "epoch": 3757} {"train_loss": -6.91996955871582, "global_step": 157795, "epoch": 3757} {"train_loss": -6.787544250488281, "global_step": 157796, "epoch": 3757} {"train_loss": -6.975824356079102, "global_step": 157797, "epoch": 3757} {"train_loss": -6.863987922668457, "global_step": 157798, "epoch": 3757} {"train_loss": -6.687172889709473, "global_step": 157799, "epoch": 3757} {"train_loss": -6.996628284454346, "global_step": 157800, "epoch": 3757} {"train_loss": -6.924799919128418, "global_step": 157801, "epoch": 3757} {"train_loss": -6.823935508728027, "global_step": 157802, "epoch": 3757} {"train_loss": -6.885960578918457, "global_step": 157803, "epoch": 3757} {"train_loss": -6.84193754196167, "global_step": 157804, "epoch": 3757} {"train_loss": -6.892851829528809, "global_step": 157805, "epoch": 3757} {"train_loss": -6.944958209991455, "global_step": 157806, "epoch": 3757} {"train_loss": -6.716343402862549, "global_step": 157807, "epoch": 3757} {"train_loss": -7.044974327087402, "global_step": 157808, "epoch": 3757} {"train_loss": -6.890263557434082, "global_step": 157809, "epoch": 3757} {"train_loss": -6.915527820587158, "global_step": 157810, "epoch": 3757} {"train_loss": -6.8461222648620605, "global_step": 157811, "epoch": 3757} {"train_loss": -6.850866317749023, "global_step": 157812, "epoch": 3757} {"train_loss": -7.010821342468262, "global_step": 157813, "epoch": 3757} {"train_loss": -6.799074649810791, "global_step": 157814, "epoch": 3757} {"train_loss": -6.857170581817627, "global_step": 157815, "epoch": 3757} {"train_loss": -6.819321632385254, "global_step": 157816, "epoch": 3757} {"train_loss": -6.819668769836426, "global_step": 157817, "epoch": 3757} {"train_loss": -6.8774518966674805, "global_step": 157818, "epoch": 3757} {"train_loss": -6.819797992706299, "global_step": 157819, "epoch": 3757} {"train_loss": -6.898155212402344, "global_step": 157820, "epoch": 3757} {"train_loss": -6.7549238204956055, "global_step": 157821, "epoch": 3757} {"train_loss": -7.018110275268555, "global_step": 157822, "epoch": 3757} {"train_loss": -6.8571577072143555, "global_step": 157823, "epoch": 3757} {"train_loss": -6.816615104675293, "global_step": 157824, "epoch": 3757} {"train_loss": -6.902671813964844, "global_step": 157825, "epoch": 3757} {"train_loss": -6.927066802978516, "global_step": 157826, "epoch": 3757} {"train_loss": -6.919072151184082, "global_step": 157827, "epoch": 3757} {"train_loss": -7.003026962280273, "global_step": 157828, "epoch": 3757} {"train_loss": -6.817164897918701, "global_step": 157829, "epoch": 3757} {"train_loss": -7.021859169006348, "global_step": 157830, "epoch": 3757} {"train_loss": -6.9663286209106445, "global_step": 157831, "epoch": 3757} {"train_loss": -7.045202255249023, "global_step": 157832, "epoch": 3757} {"train_loss": -6.8787617683410645, "global_step": 157833, "epoch": 3757} {"train_loss": -6.8533935546875, "global_step": 157834, "epoch": 3757} {"train_loss": -6.883378244581676, "global_step": 157835, "epoch": 3757, "val_loss": 79119.65625} {"train_loss": -6.907182693481445, "global_step": 157836, "epoch": 3758} {"train_loss": -6.979635238647461, "global_step": 157837, "epoch": 3758} {"train_loss": -7.03431510925293, "global_step": 157838, "epoch": 3758} {"train_loss": -6.891408920288086, "global_step": 157839, "epoch": 3758} {"train_loss": -6.957827091217041, "global_step": 157840, "epoch": 3758} {"train_loss": -6.82879638671875, "global_step": 157841, "epoch": 3758} {"train_loss": -6.765999794006348, "global_step": 157842, "epoch": 3758} {"train_loss": -6.870109558105469, "global_step": 157843, "epoch": 3758} {"train_loss": -6.983787536621094, "global_step": 157844, "epoch": 3758} {"train_loss": -6.7577338218688965, "global_step": 157845, "epoch": 3758} {"train_loss": -6.830938339233398, "global_step": 157846, "epoch": 3758} {"train_loss": -6.904965400695801, "global_step": 157847, "epoch": 3758} {"train_loss": -6.785382270812988, "global_step": 157848, "epoch": 3758} {"train_loss": -6.934370994567871, "global_step": 157849, "epoch": 3758} {"train_loss": -6.802687644958496, "global_step": 157850, "epoch": 3758} {"train_loss": -6.984135627746582, "global_step": 157851, "epoch": 3758} {"train_loss": -6.862813949584961, "global_step": 157852, "epoch": 3758} {"train_loss": -6.839358329772949, "global_step": 157853, "epoch": 3758} {"train_loss": -6.939499855041504, "global_step": 157854, "epoch": 3758} {"train_loss": -7.011763572692871, "global_step": 157855, "epoch": 3758} {"train_loss": -6.907258987426758, "global_step": 157856, "epoch": 3758} {"train_loss": -6.879141330718994, "global_step": 157857, "epoch": 3758} {"train_loss": -6.888937950134277, "global_step": 157858, "epoch": 3758} {"train_loss": -6.894723892211914, "global_step": 157859, "epoch": 3758} {"train_loss": -6.8049092292785645, "global_step": 157860, "epoch": 3758} {"train_loss": -7.034244537353516, "global_step": 157861, "epoch": 3758} {"train_loss": -6.871105194091797, "global_step": 157862, "epoch": 3758} {"train_loss": -6.866999626159668, "global_step": 157863, "epoch": 3758} {"train_loss": -6.945523738861084, "global_step": 157864, "epoch": 3758} {"train_loss": -6.8248467445373535, "global_step": 157865, "epoch": 3758} {"train_loss": -6.92935037612915, "global_step": 157866, "epoch": 3758} {"train_loss": -6.985631942749023, "global_step": 157867, "epoch": 3758} {"train_loss": -6.950726509094238, "global_step": 157868, "epoch": 3758} {"train_loss": -6.822346210479736, "global_step": 157869, "epoch": 3758} {"train_loss": -6.899859428405762, "global_step": 157870, "epoch": 3758} {"train_loss": -6.733359336853027, "global_step": 157871, "epoch": 3758} {"train_loss": -6.83555269241333, "global_step": 157872, "epoch": 3758} {"train_loss": -6.824592590332031, "global_step": 157873, "epoch": 3758} {"train_loss": -6.930623531341553, "global_step": 157874, "epoch": 3758} {"train_loss": -6.941039085388184, "global_step": 157875, "epoch": 3758} {"train_loss": -6.967268943786621, "global_step": 157876, "epoch": 3758} {"train_loss": -6.892645938055856, "global_step": 157877, "epoch": 3758, "val_loss": 79048.2890625} {"train_loss": -7.021556854248047, "global_step": 157878, "epoch": 3759} {"train_loss": -6.9200439453125, "global_step": 157879, "epoch": 3759} {"train_loss": -6.941523551940918, "global_step": 157880, "epoch": 3759} {"train_loss": -6.805912971496582, "global_step": 157881, "epoch": 3759} {"train_loss": -6.903293132781982, "global_step": 157882, "epoch": 3759} {"train_loss": -6.913924217224121, "global_step": 157883, "epoch": 3759} {"train_loss": -6.935938835144043, "global_step": 157884, "epoch": 3759} {"train_loss": -7.030306339263916, "global_step": 157885, "epoch": 3759} {"train_loss": -7.011070728302002, "global_step": 157886, "epoch": 3759} {"train_loss": -7.033389568328857, "global_step": 157887, "epoch": 3759} {"train_loss": -6.969106674194336, "global_step": 157888, "epoch": 3759} {"train_loss": -6.861109733581543, "global_step": 157889, "epoch": 3759} {"train_loss": -6.9162797927856445, "global_step": 157890, "epoch": 3759} {"train_loss": -7.018742561340332, "global_step": 157891, "epoch": 3759} {"train_loss": -6.921914577484131, "global_step": 157892, "epoch": 3759} {"train_loss": -6.99436092376709, "global_step": 157893, "epoch": 3759} {"train_loss": -6.868032455444336, "global_step": 157894, "epoch": 3759} {"train_loss": -7.016927242279053, "global_step": 157895, "epoch": 3759} {"train_loss": -6.997647285461426, "global_step": 157896, "epoch": 3759} {"train_loss": -6.951882362365723, "global_step": 157897, "epoch": 3759} {"train_loss": -7.011155605316162, "global_step": 157898, "epoch": 3759} {"train_loss": -6.941006660461426, "global_step": 157899, "epoch": 3759} {"train_loss": -7.053658485412598, "global_step": 157900, "epoch": 3759} {"train_loss": -6.967835426330566, "global_step": 157901, "epoch": 3759} {"train_loss": -6.946192741394043, "global_step": 157902, "epoch": 3759} {"train_loss": -7.042148590087891, "global_step": 157903, "epoch": 3759} {"train_loss": -7.0273942947387695, "global_step": 157904, "epoch": 3759} {"train_loss": -6.94744873046875, "global_step": 157905, "epoch": 3759} {"train_loss": -6.894093990325928, "global_step": 157906, "epoch": 3759} {"train_loss": -6.923471450805664, "global_step": 157907, "epoch": 3759} {"train_loss": -6.945979118347168, "global_step": 157908, "epoch": 3759} {"train_loss": -6.909497261047363, "global_step": 157909, "epoch": 3759} {"train_loss": -6.957180500030518, "global_step": 157910, "epoch": 3759} {"train_loss": -7.006994247436523, "global_step": 157911, "epoch": 3759} {"train_loss": -7.016487121582031, "global_step": 157912, "epoch": 3759} {"train_loss": -6.966797828674316, "global_step": 157913, "epoch": 3759} {"train_loss": -7.014830112457275, "global_step": 157914, "epoch": 3759} {"train_loss": -6.959819316864014, "global_step": 157915, "epoch": 3759} {"train_loss": -7.105536460876465, "global_step": 157916, "epoch": 3759} {"train_loss": -7.016310691833496, "global_step": 157917, "epoch": 3759} {"train_loss": -6.928524971008301, "global_step": 157918, "epoch": 3759} {"train_loss": -6.96562139193217, "global_step": 157919, "epoch": 3759, "val_loss": 79267.4140625} {"train_loss": -6.888904571533203, "global_step": 157920, "epoch": 3760} {"train_loss": -6.8819260597229, "global_step": 157921, "epoch": 3760} {"train_loss": -7.021512031555176, "global_step": 157922, "epoch": 3760} {"train_loss": -6.924530506134033, "global_step": 157923, "epoch": 3760} {"train_loss": -6.9989542961120605, "global_step": 157924, "epoch": 3760} {"train_loss": -6.9654221534729, "global_step": 157925, "epoch": 3760} {"train_loss": -7.008820056915283, "global_step": 157926, "epoch": 3760} {"train_loss": -6.987155914306641, "global_step": 157927, "epoch": 3760} {"train_loss": -6.948350429534912, "global_step": 157928, "epoch": 3760} {"train_loss": -7.110302925109863, "global_step": 157929, "epoch": 3760} {"train_loss": -7.051107406616211, "global_step": 157930, "epoch": 3760} {"train_loss": -7.123330116271973, "global_step": 157931, "epoch": 3760} {"train_loss": -6.998898029327393, "global_step": 157932, "epoch": 3760} {"train_loss": -6.988897800445557, "global_step": 157933, "epoch": 3760} {"train_loss": -6.884260177612305, "global_step": 157934, "epoch": 3760} {"train_loss": -6.970339298248291, "global_step": 157935, "epoch": 3760} {"train_loss": -6.88060998916626, "global_step": 157936, "epoch": 3760} {"train_loss": -6.849602222442627, "global_step": 157937, "epoch": 3760} {"train_loss": -6.967489719390869, "global_step": 157938, "epoch": 3760} {"train_loss": -6.923410415649414, "global_step": 157939, "epoch": 3760} {"train_loss": -6.831181526184082, "global_step": 157940, "epoch": 3760} {"train_loss": -6.96220064163208, "global_step": 157941, "epoch": 3760} {"train_loss": -6.97995662689209, "global_step": 157942, "epoch": 3760} {"train_loss": -6.879632472991943, "global_step": 157943, "epoch": 3760} {"train_loss": -6.876717567443848, "global_step": 157944, "epoch": 3760} {"train_loss": -7.014216899871826, "global_step": 157945, "epoch": 3760} {"train_loss": -6.943840026855469, "global_step": 157946, "epoch": 3760} {"train_loss": -6.944803237915039, "global_step": 157947, "epoch": 3760} {"train_loss": -6.984129905700684, "global_step": 157948, "epoch": 3760} {"train_loss": -6.9709153175354, "global_step": 157949, "epoch": 3760} {"train_loss": -6.923798561096191, "global_step": 157950, "epoch": 3760} {"train_loss": -6.9130353927612305, "global_step": 157951, "epoch": 3760} {"train_loss": -7.01563835144043, "global_step": 157952, "epoch": 3760} {"train_loss": -6.989429473876953, "global_step": 157953, "epoch": 3760} {"train_loss": -6.9593071937561035, "global_step": 157954, "epoch": 3760} {"train_loss": -6.9182963371276855, "global_step": 157955, "epoch": 3760} {"train_loss": -7.021132469177246, "global_step": 157956, "epoch": 3760} {"train_loss": -7.041687965393066, "global_step": 157957, "epoch": 3760} {"train_loss": -6.9350810050964355, "global_step": 157958, "epoch": 3760} {"train_loss": -6.966935634613037, "global_step": 157959, "epoch": 3760} {"train_loss": -6.840994834899902, "global_step": 157960, "epoch": 3760} {"train_loss": -6.9584863640013195, "global_step": 157961, "epoch": 3760, "val_loss": 79397.28125} {"train_loss": -6.874344825744629, "global_step": 157962, "epoch": 3761} {"train_loss": -6.945741653442383, "global_step": 157963, "epoch": 3761} {"train_loss": -6.845831871032715, "global_step": 157964, "epoch": 3761} {"train_loss": -6.998036861419678, "global_step": 157965, "epoch": 3761} {"train_loss": -6.90797233581543, "global_step": 157966, "epoch": 3761} {"train_loss": -6.970034599304199, "global_step": 157967, "epoch": 3761} {"train_loss": -6.85409688949585, "global_step": 157968, "epoch": 3761} {"train_loss": -6.871192932128906, "global_step": 157969, "epoch": 3761} {"train_loss": -7.048468589782715, "global_step": 157970, "epoch": 3761} {"train_loss": -6.970255374908447, "global_step": 157971, "epoch": 3761} {"train_loss": -6.9301910400390625, "global_step": 157972, "epoch": 3761} {"train_loss": -6.953611373901367, "global_step": 157973, "epoch": 3761} {"train_loss": -6.948782920837402, "global_step": 157974, "epoch": 3761} {"train_loss": -6.9679365158081055, "global_step": 157975, "epoch": 3761} {"train_loss": -7.046175956726074, "global_step": 157976, "epoch": 3761} {"train_loss": -6.921791076660156, "global_step": 157977, "epoch": 3761} {"train_loss": -7.0663299560546875, "global_step": 157978, "epoch": 3761} {"train_loss": -6.980437278747559, "global_step": 157979, "epoch": 3761} {"train_loss": -6.861101150512695, "global_step": 157980, "epoch": 3761} {"train_loss": -7.05929708480835, "global_step": 157981, "epoch": 3761} {"train_loss": -6.999789237976074, "global_step": 157982, "epoch": 3761} {"train_loss": -6.883174419403076, "global_step": 157983, "epoch": 3761} {"train_loss": -7.092232704162598, "global_step": 157984, "epoch": 3761} {"train_loss": -6.998371124267578, "global_step": 157985, "epoch": 3761} {"train_loss": -6.9016804695129395, "global_step": 157986, "epoch": 3761} {"train_loss": -7.034487724304199, "global_step": 157987, "epoch": 3761} {"train_loss": -6.914650917053223, "global_step": 157988, "epoch": 3761} {"train_loss": -6.915401458740234, "global_step": 157989, "epoch": 3761} {"train_loss": -6.856385231018066, "global_step": 157990, "epoch": 3761} {"train_loss": -7.037964820861816, "global_step": 157991, "epoch": 3761} {"train_loss": -6.874578952789307, "global_step": 157992, "epoch": 3761} {"train_loss": -6.883391380310059, "global_step": 157993, "epoch": 3761} {"train_loss": -6.952800750732422, "global_step": 157994, "epoch": 3761} {"train_loss": -6.924343585968018, "global_step": 157995, "epoch": 3761} {"train_loss": -6.747465133666992, "global_step": 157996, "epoch": 3761} {"train_loss": -6.749444007873535, "global_step": 157997, "epoch": 3761} {"train_loss": -6.971621513366699, "global_step": 157998, "epoch": 3761} {"train_loss": -6.910226821899414, "global_step": 157999, "epoch": 3761} {"train_loss": -6.868936061859131, "global_step": 158000, "epoch": 3761} {"train_loss": -6.980498313903809, "global_step": 158001, "epoch": 3761} {"train_loss": -6.878299236297607, "global_step": 158002, "epoch": 3761} {"train_loss": -6.9349415983472555, "global_step": 158003, "epoch": 3761, "val_loss": 79118.0390625} {"train_loss": -6.995145320892334, "global_step": 158004, "epoch": 3762} {"train_loss": -6.967870712280273, "global_step": 158005, "epoch": 3762} {"train_loss": -7.013463973999023, "global_step": 158006, "epoch": 3762} {"train_loss": -6.96483850479126, "global_step": 158007, "epoch": 3762} {"train_loss": -7.04631233215332, "global_step": 158008, "epoch": 3762} {"train_loss": -6.949403762817383, "global_step": 158009, "epoch": 3762} {"train_loss": -6.9610595703125, "global_step": 158010, "epoch": 3762} {"train_loss": -7.1086883544921875, "global_step": 158011, "epoch": 3762} {"train_loss": -6.974531650543213, "global_step": 158012, "epoch": 3762} {"train_loss": -6.984244346618652, "global_step": 158013, "epoch": 3762} {"train_loss": -6.952633857727051, "global_step": 158014, "epoch": 3762} {"train_loss": -7.093748569488525, "global_step": 158015, "epoch": 3762} {"train_loss": -6.977595806121826, "global_step": 158016, "epoch": 3762} {"train_loss": -6.790483474731445, "global_step": 158017, "epoch": 3762} {"train_loss": -7.0263543128967285, "global_step": 158018, "epoch": 3762} {"train_loss": -6.689046382904053, "global_step": 158019, "epoch": 3762} {"train_loss": -6.885676383972168, "global_step": 158020, "epoch": 3762} {"train_loss": -6.719386100769043, "global_step": 158021, "epoch": 3762} {"train_loss": -6.731338024139404, "global_step": 158022, "epoch": 3762} {"train_loss": -6.93541145324707, "global_step": 158023, "epoch": 3762} {"train_loss": -6.73774528503418, "global_step": 158024, "epoch": 3762} {"train_loss": -6.871715068817139, "global_step": 158025, "epoch": 3762} {"train_loss": -6.800537586212158, "global_step": 158026, "epoch": 3762} {"train_loss": -6.812295436859131, "global_step": 158027, "epoch": 3762} {"train_loss": -6.8076324462890625, "global_step": 158028, "epoch": 3762} {"train_loss": -6.738840579986572, "global_step": 158029, "epoch": 3762} {"train_loss": -6.776463031768799, "global_step": 158030, "epoch": 3762} {"train_loss": -6.762384414672852, "global_step": 158031, "epoch": 3762} {"train_loss": -7.007445812225342, "global_step": 158032, "epoch": 3762} {"train_loss": -6.834477424621582, "global_step": 158033, "epoch": 3762} {"train_loss": -6.850471019744873, "global_step": 158034, "epoch": 3762} {"train_loss": -6.837213039398193, "global_step": 158035, "epoch": 3762} {"train_loss": -6.978156566619873, "global_step": 158036, "epoch": 3762} {"train_loss": -6.8687028884887695, "global_step": 158037, "epoch": 3762} {"train_loss": -6.924662113189697, "global_step": 158038, "epoch": 3762} {"train_loss": -6.851691722869873, "global_step": 158039, "epoch": 3762} {"train_loss": -6.897587776184082, "global_step": 158040, "epoch": 3762} {"train_loss": -6.874204158782959, "global_step": 158041, "epoch": 3762} {"train_loss": -6.736186504364014, "global_step": 158042, "epoch": 3762} {"train_loss": -6.861396789550781, "global_step": 158043, "epoch": 3762} {"train_loss": -6.852227210998535, "global_step": 158044, "epoch": 3762} {"train_loss": -6.890250978015718, "global_step": 158045, "epoch": 3762, "val_loss": 79207.3359375} {"train_loss": -6.947925090789795, "global_step": 158046, "epoch": 3763} {"train_loss": -6.992781162261963, "global_step": 158047, "epoch": 3763} {"train_loss": -6.962489128112793, "global_step": 158048, "epoch": 3763} {"train_loss": -7.032182693481445, "global_step": 158049, "epoch": 3763} {"train_loss": -6.9296441078186035, "global_step": 158050, "epoch": 3763} {"train_loss": -6.9228386878967285, "global_step": 158051, "epoch": 3763} {"train_loss": -6.923943042755127, "global_step": 158052, "epoch": 3763} {"train_loss": -6.880274295806885, "global_step": 158053, "epoch": 3763} {"train_loss": -6.76438045501709, "global_step": 158054, "epoch": 3763} {"train_loss": -7.0403594970703125, "global_step": 158055, "epoch": 3763} {"train_loss": -6.875058174133301, "global_step": 158056, "epoch": 3763} {"train_loss": -7.0252909660339355, "global_step": 158057, "epoch": 3763} {"train_loss": -6.800753593444824, "global_step": 158058, "epoch": 3763} {"train_loss": -6.9174604415893555, "global_step": 158059, "epoch": 3763} {"train_loss": -6.915487289428711, "global_step": 158060, "epoch": 3763} {"train_loss": -6.835030555725098, "global_step": 158061, "epoch": 3763} {"train_loss": -7.026608943939209, "global_step": 158062, "epoch": 3763} {"train_loss": -6.912051200866699, "global_step": 158063, "epoch": 3763} {"train_loss": -6.934480667114258, "global_step": 158064, "epoch": 3763} {"train_loss": -6.949214935302734, "global_step": 158065, "epoch": 3763} {"train_loss": -6.8902363777160645, "global_step": 158066, "epoch": 3763} {"train_loss": -6.923403263092041, "global_step": 158067, "epoch": 3763} {"train_loss": -6.931612014770508, "global_step": 158068, "epoch": 3763} {"train_loss": -6.872581481933594, "global_step": 158069, "epoch": 3763} {"train_loss": -6.795044898986816, "global_step": 158070, "epoch": 3763} {"train_loss": -6.848291873931885, "global_step": 158071, "epoch": 3763} {"train_loss": -7.001041412353516, "global_step": 158072, "epoch": 3763} {"train_loss": -6.949833393096924, "global_step": 158073, "epoch": 3763} {"train_loss": -6.997896194458008, "global_step": 158074, "epoch": 3763} {"train_loss": -6.922372817993164, "global_step": 158075, "epoch": 3763} {"train_loss": -6.917218208312988, "global_step": 158076, "epoch": 3763} {"train_loss": -6.989167213439941, "global_step": 158077, "epoch": 3763} {"train_loss": -6.841518402099609, "global_step": 158078, "epoch": 3763} {"train_loss": -6.929919242858887, "global_step": 158079, "epoch": 3763} {"train_loss": -7.005495548248291, "global_step": 158080, "epoch": 3763} {"train_loss": -6.987058162689209, "global_step": 158081, "epoch": 3763} {"train_loss": -6.898393154144287, "global_step": 158082, "epoch": 3763} {"train_loss": -6.9997453689575195, "global_step": 158083, "epoch": 3763} {"train_loss": -6.95979642868042, "global_step": 158084, "epoch": 3763} {"train_loss": -6.847761154174805, "global_step": 158085, "epoch": 3763} {"train_loss": -6.896786212921143, "global_step": 158086, "epoch": 3763} {"train_loss": -6.925067822138469, "global_step": 158087, "epoch": 3763, "val_loss": 79128.3515625} {"train_loss": -7.028223991394043, "global_step": 158088, "epoch": 3764} {"train_loss": -6.670943260192871, "global_step": 158089, "epoch": 3764} {"train_loss": -6.744927406311035, "global_step": 158090, "epoch": 3764} {"train_loss": -6.83351993560791, "global_step": 158091, "epoch": 3764} {"train_loss": -6.878352642059326, "global_step": 158092, "epoch": 3764} {"train_loss": -6.794833183288574, "global_step": 158093, "epoch": 3764} {"train_loss": -7.026244163513184, "global_step": 158094, "epoch": 3764} {"train_loss": -6.870925426483154, "global_step": 158095, "epoch": 3764} {"train_loss": -6.919024467468262, "global_step": 158096, "epoch": 3764} {"train_loss": -6.943185329437256, "global_step": 158097, "epoch": 3764} {"train_loss": -6.968567848205566, "global_step": 158098, "epoch": 3764} {"train_loss": -6.985012054443359, "global_step": 158099, "epoch": 3764} {"train_loss": -6.899283409118652, "global_step": 158100, "epoch": 3764} {"train_loss": -6.866141319274902, "global_step": 158101, "epoch": 3764} {"train_loss": -6.911479473114014, "global_step": 158102, "epoch": 3764} {"train_loss": -7.038701057434082, "global_step": 158103, "epoch": 3764} {"train_loss": -6.953515529632568, "global_step": 158104, "epoch": 3764} {"train_loss": -7.043287754058838, "global_step": 158105, "epoch": 3764} {"train_loss": -7.052769660949707, "global_step": 158106, "epoch": 3764} {"train_loss": -6.925371170043945, "global_step": 158107, "epoch": 3764} {"train_loss": -6.974870204925537, "global_step": 158108, "epoch": 3764} {"train_loss": -6.967839241027832, "global_step": 158109, "epoch": 3764} {"train_loss": -6.860410213470459, "global_step": 158110, "epoch": 3764} {"train_loss": -7.036456108093262, "global_step": 158111, "epoch": 3764} {"train_loss": -6.95737886428833, "global_step": 158112, "epoch": 3764} {"train_loss": -6.967569828033447, "global_step": 158113, "epoch": 3764} {"train_loss": -6.878800392150879, "global_step": 158114, "epoch": 3764} {"train_loss": -7.0362372398376465, "global_step": 158115, "epoch": 3764} {"train_loss": -6.893448829650879, "global_step": 158116, "epoch": 3764} {"train_loss": -6.908032417297363, "global_step": 158117, "epoch": 3764} {"train_loss": -6.93623161315918, "global_step": 158118, "epoch": 3764} {"train_loss": -6.917852401733398, "global_step": 158119, "epoch": 3764} {"train_loss": -6.886335372924805, "global_step": 158120, "epoch": 3764} {"train_loss": -6.994626045227051, "global_step": 158121, "epoch": 3764} {"train_loss": -6.841352462768555, "global_step": 158122, "epoch": 3764} {"train_loss": -6.980669975280762, "global_step": 158123, "epoch": 3764} {"train_loss": -6.925370693206787, "global_step": 158124, "epoch": 3764} {"train_loss": -7.0674028396606445, "global_step": 158125, "epoch": 3764} {"train_loss": -7.034789085388184, "global_step": 158126, "epoch": 3764} {"train_loss": -6.9136505126953125, "global_step": 158127, "epoch": 3764} {"train_loss": -6.957357883453369, "global_step": 158128, "epoch": 3764} {"train_loss": -6.93468807992481, "global_step": 158129, "epoch": 3764, "val_loss": 79051.9921875} {"train_loss": -7.05872106552124, "global_step": 158130, "epoch": 3765} {"train_loss": -6.828303337097168, "global_step": 158131, "epoch": 3765} {"train_loss": -6.893357753753662, "global_step": 158132, "epoch": 3765} {"train_loss": -6.974287509918213, "global_step": 158133, "epoch": 3765} {"train_loss": -6.610713481903076, "global_step": 158134, "epoch": 3765} {"train_loss": -6.835566520690918, "global_step": 158135, "epoch": 3765} {"train_loss": -6.983543872833252, "global_step": 158136, "epoch": 3765} {"train_loss": -6.918761253356934, "global_step": 158137, "epoch": 3765} {"train_loss": -6.885953903198242, "global_step": 158138, "epoch": 3765} {"train_loss": -6.918235778808594, "global_step": 158139, "epoch": 3765} {"train_loss": -6.987845420837402, "global_step": 158140, "epoch": 3765} {"train_loss": -6.744726181030273, "global_step": 158141, "epoch": 3765} {"train_loss": -6.945079803466797, "global_step": 158142, "epoch": 3765} {"train_loss": -6.96663236618042, "global_step": 158143, "epoch": 3765} {"train_loss": -6.877727508544922, "global_step": 158144, "epoch": 3765} {"train_loss": -6.913314342498779, "global_step": 158145, "epoch": 3765} {"train_loss": -6.890949726104736, "global_step": 158146, "epoch": 3765} {"train_loss": -6.926840782165527, "global_step": 158147, "epoch": 3765} {"train_loss": -7.0040602684021, "global_step": 158148, "epoch": 3765} {"train_loss": -6.877173900604248, "global_step": 158149, "epoch": 3765} {"train_loss": -6.909372329711914, "global_step": 158150, "epoch": 3765} {"train_loss": -6.923272609710693, "global_step": 158151, "epoch": 3765} {"train_loss": -6.964949607849121, "global_step": 158152, "epoch": 3765} {"train_loss": -6.8932390213012695, "global_step": 158153, "epoch": 3765} {"train_loss": -6.962418556213379, "global_step": 158154, "epoch": 3765} {"train_loss": -6.975751876831055, "global_step": 158155, "epoch": 3765} {"train_loss": -6.898873329162598, "global_step": 158156, "epoch": 3765} {"train_loss": -6.886577606201172, "global_step": 158157, "epoch": 3765} {"train_loss": -6.749117851257324, "global_step": 158158, "epoch": 3765} {"train_loss": -6.8860273361206055, "global_step": 158159, "epoch": 3765} {"train_loss": -6.78648567199707, "global_step": 158160, "epoch": 3765} {"train_loss": -6.922477722167969, "global_step": 158161, "epoch": 3765} {"train_loss": -6.905412197113037, "global_step": 158162, "epoch": 3765} {"train_loss": -6.820645809173584, "global_step": 158163, "epoch": 3765} {"train_loss": -6.937370300292969, "global_step": 158164, "epoch": 3765} {"train_loss": -6.890951156616211, "global_step": 158165, "epoch": 3765} {"train_loss": -6.864853858947754, "global_step": 158166, "epoch": 3765} {"train_loss": -6.922956466674805, "global_step": 158167, "epoch": 3765} {"train_loss": -6.8772478103637695, "global_step": 158168, "epoch": 3765} {"train_loss": -6.891540050506592, "global_step": 158169, "epoch": 3765} {"train_loss": -6.935697555541992, "global_step": 158170, "epoch": 3765} {"train_loss": -6.898692585173107, "global_step": 158171, "epoch": 3765, "val_loss": 79232.140625} {"train_loss": -7.000498294830322, "global_step": 158172, "epoch": 3766} {"train_loss": -6.666347026824951, "global_step": 158173, "epoch": 3766} {"train_loss": -6.885053634643555, "global_step": 158174, "epoch": 3766} {"train_loss": -6.7120361328125, "global_step": 158175, "epoch": 3766} {"train_loss": -6.940792083740234, "global_step": 158176, "epoch": 3766} {"train_loss": -6.797101974487305, "global_step": 158177, "epoch": 3766} {"train_loss": -6.935776710510254, "global_step": 158178, "epoch": 3766} {"train_loss": -6.780272483825684, "global_step": 158179, "epoch": 3766} {"train_loss": -6.867196083068848, "global_step": 158180, "epoch": 3766} {"train_loss": -6.941362380981445, "global_step": 158181, "epoch": 3766} {"train_loss": -6.839899063110352, "global_step": 158182, "epoch": 3766} {"train_loss": -6.8432841300964355, "global_step": 158183, "epoch": 3766} {"train_loss": -6.86566162109375, "global_step": 158184, "epoch": 3766} {"train_loss": -6.910852432250977, "global_step": 158185, "epoch": 3766} {"train_loss": -6.7582831382751465, "global_step": 158186, "epoch": 3766} {"train_loss": -6.947645664215088, "global_step": 158187, "epoch": 3766} {"train_loss": -6.917550086975098, "global_step": 158188, "epoch": 3766} {"train_loss": -6.929197311401367, "global_step": 158189, "epoch": 3766} {"train_loss": -6.864418983459473, "global_step": 158190, "epoch": 3766} {"train_loss": -6.917105674743652, "global_step": 158191, "epoch": 3766} {"train_loss": -6.831111907958984, "global_step": 158192, "epoch": 3766} {"train_loss": -6.905251502990723, "global_step": 158193, "epoch": 3766} {"train_loss": -6.945422172546387, "global_step": 158194, "epoch": 3766} {"train_loss": -6.850020408630371, "global_step": 158195, "epoch": 3766} {"train_loss": -6.935520648956299, "global_step": 158196, "epoch": 3766} {"train_loss": -6.9548211097717285, "global_step": 158197, "epoch": 3766} {"train_loss": -6.892642021179199, "global_step": 158198, "epoch": 3766} {"train_loss": -6.837558746337891, "global_step": 158199, "epoch": 3766} {"train_loss": -6.702182769775391, "global_step": 158200, "epoch": 3766} {"train_loss": -6.773838996887207, "global_step": 158201, "epoch": 3766} {"train_loss": -6.833794593811035, "global_step": 158202, "epoch": 3766} {"train_loss": -6.895591735839844, "global_step": 158203, "epoch": 3766} {"train_loss": -6.9376983642578125, "global_step": 158204, "epoch": 3766} {"train_loss": -6.878175735473633, "global_step": 158205, "epoch": 3766} {"train_loss": -6.914913177490234, "global_step": 158206, "epoch": 3766} {"train_loss": -6.912883281707764, "global_step": 158207, "epoch": 3766} {"train_loss": -7.005928039550781, "global_step": 158208, "epoch": 3766} {"train_loss": -7.028700351715088, "global_step": 158209, "epoch": 3766} {"train_loss": -6.9082746505737305, "global_step": 158210, "epoch": 3766} {"train_loss": -6.889949798583984, "global_step": 158211, "epoch": 3766} {"train_loss": -6.881418228149414, "global_step": 158212, "epoch": 3766} {"train_loss": -6.879290501276652, "global_step": 158213, "epoch": 3766, "val_loss": 79475.8046875} {"train_loss": -6.9910569190979, "global_step": 158214, "epoch": 3767} {"train_loss": -6.9078474044799805, "global_step": 158215, "epoch": 3767} {"train_loss": -6.927464485168457, "global_step": 158216, "epoch": 3767} {"train_loss": -6.949365139007568, "global_step": 158217, "epoch": 3767} {"train_loss": -6.955833435058594, "global_step": 158218, "epoch": 3767} {"train_loss": -6.931488990783691, "global_step": 158219, "epoch": 3767} {"train_loss": -6.987608909606934, "global_step": 158220, "epoch": 3767} {"train_loss": -6.895628929138184, "global_step": 158221, "epoch": 3767} {"train_loss": -7.03983211517334, "global_step": 158222, "epoch": 3767} {"train_loss": -6.975771903991699, "global_step": 158223, "epoch": 3767} {"train_loss": -6.912047386169434, "global_step": 158224, "epoch": 3767} {"train_loss": -7.038473129272461, "global_step": 158225, "epoch": 3767} {"train_loss": -6.9812188148498535, "global_step": 158226, "epoch": 3767} {"train_loss": -6.99589204788208, "global_step": 158227, "epoch": 3767} {"train_loss": -6.999284267425537, "global_step": 158228, "epoch": 3767} {"train_loss": -6.996250152587891, "global_step": 158229, "epoch": 3767} {"train_loss": -6.980295658111572, "global_step": 158230, "epoch": 3767} {"train_loss": -7.0197319984436035, "global_step": 158231, "epoch": 3767} {"train_loss": -6.894601821899414, "global_step": 158232, "epoch": 3767} {"train_loss": -6.832942485809326, "global_step": 158233, "epoch": 3767} {"train_loss": -6.997518062591553, "global_step": 158234, "epoch": 3767} {"train_loss": -7.028617858886719, "global_step": 158235, "epoch": 3767} {"train_loss": -7.048197269439697, "global_step": 158236, "epoch": 3767} {"train_loss": -6.969886779785156, "global_step": 158237, "epoch": 3767} {"train_loss": -6.894697189331055, "global_step": 158238, "epoch": 3767} {"train_loss": -6.825900077819824, "global_step": 158239, "epoch": 3767} {"train_loss": -6.863385200500488, "global_step": 158240, "epoch": 3767} {"train_loss": -6.723000526428223, "global_step": 158241, "epoch": 3767} {"train_loss": -6.97797966003418, "global_step": 158242, "epoch": 3767} {"train_loss": -6.742373466491699, "global_step": 158243, "epoch": 3767} {"train_loss": -6.848108291625977, "global_step": 158244, "epoch": 3767} {"train_loss": -6.895315170288086, "global_step": 158245, "epoch": 3767} {"train_loss": -6.807255268096924, "global_step": 158246, "epoch": 3767} {"train_loss": -6.978604316711426, "global_step": 158247, "epoch": 3767} {"train_loss": -6.8172607421875, "global_step": 158248, "epoch": 3767} {"train_loss": -6.8715691566467285, "global_step": 158249, "epoch": 3767} {"train_loss": -6.850963592529297, "global_step": 158250, "epoch": 3767} {"train_loss": -6.946201324462891, "global_step": 158251, "epoch": 3767} {"train_loss": -6.922834873199463, "global_step": 158252, "epoch": 3767} {"train_loss": -7.037990570068359, "global_step": 158253, "epoch": 3767} {"train_loss": -6.997156143188477, "global_step": 158254, "epoch": 3767} {"train_loss": -6.934171347391038, "global_step": 158255, "epoch": 3767, "val_loss": 79142.6640625} {"train_loss": -7.009280681610107, "global_step": 158256, "epoch": 3768} {"train_loss": -7.017721652984619, "global_step": 158257, "epoch": 3768} {"train_loss": -6.988663673400879, "global_step": 158258, "epoch": 3768} {"train_loss": -6.971842288970947, "global_step": 158259, "epoch": 3768} {"train_loss": -6.9474616050720215, "global_step": 158260, "epoch": 3768} {"train_loss": -7.135571479797363, "global_step": 158261, "epoch": 3768} {"train_loss": -6.963898658752441, "global_step": 158262, "epoch": 3768} {"train_loss": -6.975381851196289, "global_step": 158263, "epoch": 3768} {"train_loss": -7.028441905975342, "global_step": 158264, "epoch": 3768} {"train_loss": -6.935510635375977, "global_step": 158265, "epoch": 3768} {"train_loss": -7.021985054016113, "global_step": 158266, "epoch": 3768} {"train_loss": -7.00661563873291, "global_step": 158267, "epoch": 3768} {"train_loss": -7.03116512298584, "global_step": 158268, "epoch": 3768} {"train_loss": -6.969779014587402, "global_step": 158269, "epoch": 3768} {"train_loss": -7.013313293457031, "global_step": 158270, "epoch": 3768} {"train_loss": -6.956427097320557, "global_step": 158271, "epoch": 3768} {"train_loss": -6.9964118003845215, "global_step": 158272, "epoch": 3768} {"train_loss": -6.917079925537109, "global_step": 158273, "epoch": 3768} {"train_loss": -6.997981071472168, "global_step": 158274, "epoch": 3768} {"train_loss": -7.064509868621826, "global_step": 158275, "epoch": 3768} {"train_loss": -6.971986770629883, "global_step": 158276, "epoch": 3768} {"train_loss": -6.976425647735596, "global_step": 158277, "epoch": 3768} {"train_loss": -6.976326942443848, "global_step": 158278, "epoch": 3768} {"train_loss": -7.04110050201416, "global_step": 158279, "epoch": 3768} {"train_loss": -6.8302106857299805, "global_step": 158280, "epoch": 3768} {"train_loss": -6.87676477432251, "global_step": 158281, "epoch": 3768} {"train_loss": -7.0025634765625, "global_step": 158282, "epoch": 3768} {"train_loss": -6.853695869445801, "global_step": 158283, "epoch": 3768} {"train_loss": -6.951925277709961, "global_step": 158284, "epoch": 3768} {"train_loss": -7.024857997894287, "global_step": 158285, "epoch": 3768} {"train_loss": -6.794383525848389, "global_step": 158286, "epoch": 3768} {"train_loss": -6.926176071166992, "global_step": 158287, "epoch": 3768} {"train_loss": -6.947939872741699, "global_step": 158288, "epoch": 3768} {"train_loss": -6.912325859069824, "global_step": 158289, "epoch": 3768} {"train_loss": -6.956979274749756, "global_step": 158290, "epoch": 3768} {"train_loss": -6.891036033630371, "global_step": 158291, "epoch": 3768} {"train_loss": -6.812429904937744, "global_step": 158292, "epoch": 3768} {"train_loss": -6.818446159362793, "global_step": 158293, "epoch": 3768} {"train_loss": -6.839173316955566, "global_step": 158294, "epoch": 3768} {"train_loss": -6.739753246307373, "global_step": 158295, "epoch": 3768} {"train_loss": -6.9584808349609375, "global_step": 158296, "epoch": 3768} {"train_loss": -6.951122624533517, "global_step": 158297, "epoch": 3768, "val_loss": 79224.484375} {"train_loss": -6.963469505310059, "global_step": 158298, "epoch": 3769} {"train_loss": -6.803750038146973, "global_step": 158299, "epoch": 3769} {"train_loss": -6.819733142852783, "global_step": 158300, "epoch": 3769} {"train_loss": -6.90424919128418, "global_step": 158301, "epoch": 3769} {"train_loss": -6.923603534698486, "global_step": 158302, "epoch": 3769} {"train_loss": -6.821463584899902, "global_step": 158303, "epoch": 3769} {"train_loss": -6.768367767333984, "global_step": 158304, "epoch": 3769} {"train_loss": -6.8844451904296875, "global_step": 158305, "epoch": 3769} {"train_loss": -6.884823799133301, "global_step": 158306, "epoch": 3769} {"train_loss": -6.946148872375488, "global_step": 158307, "epoch": 3769} {"train_loss": -7.026531219482422, "global_step": 158308, "epoch": 3769} {"train_loss": -6.806146144866943, "global_step": 158309, "epoch": 3769} {"train_loss": -7.016977310180664, "global_step": 158310, "epoch": 3769} {"train_loss": -6.946019172668457, "global_step": 158311, "epoch": 3769} {"train_loss": -6.822272300720215, "global_step": 158312, "epoch": 3769} {"train_loss": -7.037856101989746, "global_step": 158313, "epoch": 3769} {"train_loss": -6.7690958976745605, "global_step": 158314, "epoch": 3769} {"train_loss": -6.948902606964111, "global_step": 158315, "epoch": 3769} {"train_loss": -6.867387771606445, "global_step": 158316, "epoch": 3769} {"train_loss": -6.853976249694824, "global_step": 158317, "epoch": 3769} {"train_loss": -6.986968994140625, "global_step": 158318, "epoch": 3769} {"train_loss": -6.880037307739258, "global_step": 158319, "epoch": 3769} {"train_loss": -6.820596694946289, "global_step": 158320, "epoch": 3769} {"train_loss": -6.867607116699219, "global_step": 158321, "epoch": 3769} {"train_loss": -6.8375325202941895, "global_step": 158322, "epoch": 3769} {"train_loss": -6.9138383865356445, "global_step": 158323, "epoch": 3769} {"train_loss": -6.768421173095703, "global_step": 158324, "epoch": 3769} {"train_loss": -6.9073166847229, "global_step": 158325, "epoch": 3769} {"train_loss": -6.89374303817749, "global_step": 158326, "epoch": 3769} {"train_loss": -6.74355936050415, "global_step": 158327, "epoch": 3769} {"train_loss": -6.795499324798584, "global_step": 158328, "epoch": 3769} {"train_loss": -6.804567337036133, "global_step": 158329, "epoch": 3769} {"train_loss": -6.754932403564453, "global_step": 158330, "epoch": 3769} {"train_loss": -6.842251777648926, "global_step": 158331, "epoch": 3769} {"train_loss": -6.926351070404053, "global_step": 158332, "epoch": 3769} {"train_loss": -6.719120979309082, "global_step": 158333, "epoch": 3769} {"train_loss": -6.9252424240112305, "global_step": 158334, "epoch": 3769} {"train_loss": -6.756010055541992, "global_step": 158335, "epoch": 3769} {"train_loss": -6.77134895324707, "global_step": 158336, "epoch": 3769} {"train_loss": -6.9077606201171875, "global_step": 158337, "epoch": 3769} {"train_loss": -6.807990074157715, "global_step": 158338, "epoch": 3769} {"train_loss": -6.862689199901762, "global_step": 158339, "epoch": 3769, "val_loss": 79202.9921875} {"train_loss": -6.961142539978027, "global_step": 158340, "epoch": 3770} {"train_loss": -6.750773906707764, "global_step": 158341, "epoch": 3770} {"train_loss": -6.895689964294434, "global_step": 158342, "epoch": 3770} {"train_loss": -6.822017192840576, "global_step": 158343, "epoch": 3770} {"train_loss": -6.786087989807129, "global_step": 158344, "epoch": 3770} {"train_loss": -6.935479164123535, "global_step": 158345, "epoch": 3770} {"train_loss": -6.87224006652832, "global_step": 158346, "epoch": 3770} {"train_loss": -6.850217342376709, "global_step": 158347, "epoch": 3770} {"train_loss": -6.775408744812012, "global_step": 158348, "epoch": 3770} {"train_loss": -6.857154369354248, "global_step": 158349, "epoch": 3770} {"train_loss": -6.8665876388549805, "global_step": 158350, "epoch": 3770} {"train_loss": -6.837227821350098, "global_step": 158351, "epoch": 3770} {"train_loss": -6.909449577331543, "global_step": 158352, "epoch": 3770} {"train_loss": -6.947116851806641, "global_step": 158353, "epoch": 3770} {"train_loss": -6.927001953125, "global_step": 158354, "epoch": 3770} {"train_loss": -6.9965434074401855, "global_step": 158355, "epoch": 3770} {"train_loss": -6.971151828765869, "global_step": 158356, "epoch": 3770} {"train_loss": -6.905028343200684, "global_step": 158357, "epoch": 3770} {"train_loss": -6.952997207641602, "global_step": 158358, "epoch": 3770} {"train_loss": -6.99074649810791, "global_step": 158359, "epoch": 3770} {"train_loss": -6.9002604484558105, "global_step": 158360, "epoch": 3770} {"train_loss": -6.876943588256836, "global_step": 158361, "epoch": 3770} {"train_loss": -7.037784576416016, "global_step": 158362, "epoch": 3770} {"train_loss": -6.9835405349731445, "global_step": 158363, "epoch": 3770} {"train_loss": -7.0305938720703125, "global_step": 158364, "epoch": 3770} {"train_loss": -6.973109722137451, "global_step": 158365, "epoch": 3770} {"train_loss": -6.853918075561523, "global_step": 158366, "epoch": 3770} {"train_loss": -6.929614543914795, "global_step": 158367, "epoch": 3770} {"train_loss": -6.800975322723389, "global_step": 158368, "epoch": 3770} {"train_loss": -7.019974708557129, "global_step": 158369, "epoch": 3770} {"train_loss": -6.973357200622559, "global_step": 158370, "epoch": 3770} {"train_loss": -6.937719821929932, "global_step": 158371, "epoch": 3770} {"train_loss": -6.944100379943848, "global_step": 158372, "epoch": 3770} {"train_loss": -6.942306995391846, "global_step": 158373, "epoch": 3770} {"train_loss": -6.941033840179443, "global_step": 158374, "epoch": 3770} {"train_loss": -6.990365028381348, "global_step": 158375, "epoch": 3770} {"train_loss": -6.932306289672852, "global_step": 158376, "epoch": 3770} {"train_loss": -7.004932403564453, "global_step": 158377, "epoch": 3770} {"train_loss": -7.020798206329346, "global_step": 158378, "epoch": 3770} {"train_loss": -7.037195205688477, "global_step": 158379, "epoch": 3770} {"train_loss": -6.956517696380615, "global_step": 158380, "epoch": 3770} {"train_loss": -6.922783794857207, "global_step": 158381, "epoch": 3770, "val_loss": 79036.015625} {"train_loss": -6.90471076965332, "global_step": 158382, "epoch": 3771} {"train_loss": -7.072238445281982, "global_step": 158383, "epoch": 3771} {"train_loss": -6.950870513916016, "global_step": 158384, "epoch": 3771} {"train_loss": -6.969180107116699, "global_step": 158385, "epoch": 3771} {"train_loss": -7.001569747924805, "global_step": 158386, "epoch": 3771} {"train_loss": -6.971053123474121, "global_step": 158387, "epoch": 3771} {"train_loss": -6.859391212463379, "global_step": 158388, "epoch": 3771} {"train_loss": -6.934544563293457, "global_step": 158389, "epoch": 3771} {"train_loss": -6.758637428283691, "global_step": 158390, "epoch": 3771} {"train_loss": -6.830639839172363, "global_step": 158391, "epoch": 3771} {"train_loss": -6.887643337249756, "global_step": 158392, "epoch": 3771} {"train_loss": -6.9349517822265625, "global_step": 158393, "epoch": 3771} {"train_loss": -6.840742588043213, "global_step": 158394, "epoch": 3771} {"train_loss": -6.81894588470459, "global_step": 158395, "epoch": 3771} {"train_loss": -6.994208812713623, "global_step": 158396, "epoch": 3771} {"train_loss": -6.846616744995117, "global_step": 158397, "epoch": 3771} {"train_loss": -6.943018913269043, "global_step": 158398, "epoch": 3771} {"train_loss": -6.9764556884765625, "global_step": 158399, "epoch": 3771} {"train_loss": -6.916016578674316, "global_step": 158400, "epoch": 3771} {"train_loss": -6.931491374969482, "global_step": 158401, "epoch": 3771} {"train_loss": -6.921905517578125, "global_step": 158402, "epoch": 3771} {"train_loss": -7.047375679016113, "global_step": 158403, "epoch": 3771} {"train_loss": -6.817371368408203, "global_step": 158404, "epoch": 3771} {"train_loss": -6.960623741149902, "global_step": 158405, "epoch": 3771} {"train_loss": -6.97276496887207, "global_step": 158406, "epoch": 3771} {"train_loss": -6.9462971687316895, "global_step": 158407, "epoch": 3771} {"train_loss": -7.03105354309082, "global_step": 158408, "epoch": 3771} {"train_loss": -6.87914514541626, "global_step": 158409, "epoch": 3771} {"train_loss": -6.998249053955078, "global_step": 158410, "epoch": 3771} {"train_loss": -6.993329048156738, "global_step": 158411, "epoch": 3771} {"train_loss": -6.982043266296387, "global_step": 158412, "epoch": 3771} {"train_loss": -6.973980903625488, "global_step": 158413, "epoch": 3771} {"train_loss": -7.173083305358887, "global_step": 158414, "epoch": 3771} {"train_loss": -7.054627418518066, "global_step": 158415, "epoch": 3771} {"train_loss": -6.9220733642578125, "global_step": 158416, "epoch": 3771} {"train_loss": -6.985225677490234, "global_step": 158417, "epoch": 3771} {"train_loss": -6.964240074157715, "global_step": 158418, "epoch": 3771} {"train_loss": -7.014185905456543, "global_step": 158419, "epoch": 3771} {"train_loss": -6.974555969238281, "global_step": 158420, "epoch": 3771} {"train_loss": -6.901049613952637, "global_step": 158421, "epoch": 3771} {"train_loss": -6.929417610168457, "global_step": 158422, "epoch": 3771} {"train_loss": -6.946824573335194, "global_step": 158423, "epoch": 3771, "val_loss": 79189.0546875} {"train_loss": -7.045621871948242, "global_step": 158424, "epoch": 3772} {"train_loss": -7.004387378692627, "global_step": 158425, "epoch": 3772} {"train_loss": -6.982576847076416, "global_step": 158426, "epoch": 3772} {"train_loss": -7.039366722106934, "global_step": 158427, "epoch": 3772} {"train_loss": -7.047756195068359, "global_step": 158428, "epoch": 3772} {"train_loss": -7.1118364334106445, "global_step": 158429, "epoch": 3772} {"train_loss": -7.0029706954956055, "global_step": 158430, "epoch": 3772} {"train_loss": -6.929684638977051, "global_step": 158431, "epoch": 3772} {"train_loss": -6.832790851593018, "global_step": 158432, "epoch": 3772} {"train_loss": -7.06816291809082, "global_step": 158433, "epoch": 3772} {"train_loss": -6.990624904632568, "global_step": 158434, "epoch": 3772} {"train_loss": -6.832632064819336, "global_step": 158435, "epoch": 3772} {"train_loss": -6.950740814208984, "global_step": 158436, "epoch": 3772} {"train_loss": -6.960275650024414, "global_step": 158437, "epoch": 3772} {"train_loss": -6.975576400756836, "global_step": 158438, "epoch": 3772} {"train_loss": -6.99604606628418, "global_step": 158439, "epoch": 3772} {"train_loss": -6.830901145935059, "global_step": 158440, "epoch": 3772} {"train_loss": -6.882821083068848, "global_step": 158441, "epoch": 3772} {"train_loss": -6.8304266929626465, "global_step": 158442, "epoch": 3772} {"train_loss": -6.796327590942383, "global_step": 158443, "epoch": 3772} {"train_loss": -6.925485134124756, "global_step": 158444, "epoch": 3772} {"train_loss": -6.850459098815918, "global_step": 158445, "epoch": 3772} {"train_loss": -6.814277648925781, "global_step": 158446, "epoch": 3772} {"train_loss": -7.034731864929199, "global_step": 158447, "epoch": 3772} {"train_loss": -6.802946090698242, "global_step": 158448, "epoch": 3772} {"train_loss": -6.867800235748291, "global_step": 158449, "epoch": 3772} {"train_loss": -6.859523773193359, "global_step": 158450, "epoch": 3772} {"train_loss": -6.924010276794434, "global_step": 158451, "epoch": 3772} {"train_loss": -6.804841041564941, "global_step": 158452, "epoch": 3772} {"train_loss": -6.865862846374512, "global_step": 158453, "epoch": 3772} {"train_loss": -6.829146862030029, "global_step": 158454, "epoch": 3772} {"train_loss": -6.848505973815918, "global_step": 158455, "epoch": 3772} {"train_loss": -6.804329872131348, "global_step": 158456, "epoch": 3772} {"train_loss": -6.832074165344238, "global_step": 158457, "epoch": 3772} {"train_loss": -6.882339954376221, "global_step": 158458, "epoch": 3772} {"train_loss": -6.876185894012451, "global_step": 158459, "epoch": 3772} {"train_loss": -6.789251327514648, "global_step": 158460, "epoch": 3772} {"train_loss": -7.009540557861328, "global_step": 158461, "epoch": 3772} {"train_loss": -6.793890953063965, "global_step": 158462, "epoch": 3772} {"train_loss": -6.980157852172852, "global_step": 158463, "epoch": 3772} {"train_loss": -6.727115154266357, "global_step": 158464, "epoch": 3772} {"train_loss": -6.906989915030343, "global_step": 158465, "epoch": 3772, "val_loss": 79193.9921875} {"train_loss": -6.984955787658691, "global_step": 158466, "epoch": 3773} {"train_loss": -6.801311492919922, "global_step": 158467, "epoch": 3773} {"train_loss": -6.9494428634643555, "global_step": 158468, "epoch": 3773} {"train_loss": -6.868963241577148, "global_step": 158469, "epoch": 3773} {"train_loss": -6.923873424530029, "global_step": 158470, "epoch": 3773} {"train_loss": -7.00905704498291, "global_step": 158471, "epoch": 3773} {"train_loss": -7.019685745239258, "global_step": 158472, "epoch": 3773} {"train_loss": -7.016852855682373, "global_step": 158473, "epoch": 3773} {"train_loss": -7.046536445617676, "global_step": 158474, "epoch": 3773} {"train_loss": -6.898193359375, "global_step": 158475, "epoch": 3773} {"train_loss": -6.9900288581848145, "global_step": 158476, "epoch": 3773} {"train_loss": -6.962078094482422, "global_step": 158477, "epoch": 3773} {"train_loss": -6.968446731567383, "global_step": 158478, "epoch": 3773} {"train_loss": -6.912215709686279, "global_step": 158479, "epoch": 3773} {"train_loss": -6.9703216552734375, "global_step": 158480, "epoch": 3773} {"train_loss": -6.818889617919922, "global_step": 158481, "epoch": 3773} {"train_loss": -6.971173286437988, "global_step": 158482, "epoch": 3773} {"train_loss": -6.841657638549805, "global_step": 158483, "epoch": 3773} {"train_loss": -6.917288780212402, "global_step": 158484, "epoch": 3773} {"train_loss": -6.921078681945801, "global_step": 158485, "epoch": 3773} {"train_loss": -7.017604827880859, "global_step": 158486, "epoch": 3773} {"train_loss": -6.940683841705322, "global_step": 158487, "epoch": 3773} {"train_loss": -6.838322639465332, "global_step": 158488, "epoch": 3773} {"train_loss": -6.982588768005371, "global_step": 158489, "epoch": 3773} {"train_loss": -6.9712018966674805, "global_step": 158490, "epoch": 3773} {"train_loss": -7.0446906089782715, "global_step": 158491, "epoch": 3773} {"train_loss": -7.050001621246338, "global_step": 158492, "epoch": 3773} {"train_loss": -7.027787208557129, "global_step": 158493, "epoch": 3773} {"train_loss": -6.973940372467041, "global_step": 158494, "epoch": 3773} {"train_loss": -6.917562484741211, "global_step": 158495, "epoch": 3773} {"train_loss": -6.919523239135742, "global_step": 158496, "epoch": 3773} {"train_loss": -6.976940631866455, "global_step": 158497, "epoch": 3773} {"train_loss": -6.916682243347168, "global_step": 158498, "epoch": 3773} {"train_loss": -6.820141792297363, "global_step": 158499, "epoch": 3773} {"train_loss": -7.061975479125977, "global_step": 158500, "epoch": 3773} {"train_loss": -6.978514671325684, "global_step": 158501, "epoch": 3773} {"train_loss": -6.912709712982178, "global_step": 158502, "epoch": 3773} {"train_loss": -6.94155740737915, "global_step": 158503, "epoch": 3773} {"train_loss": -6.965394973754883, "global_step": 158504, "epoch": 3773} {"train_loss": -7.113893508911133, "global_step": 158505, "epoch": 3773} {"train_loss": -6.956620216369629, "global_step": 158506, "epoch": 3773} {"train_loss": -6.953226827439808, "global_step": 158507, "epoch": 3773, "val_loss": 79375.640625} {"train_loss": -6.892505168914795, "global_step": 158508, "epoch": 3774} {"train_loss": -6.969106674194336, "global_step": 158509, "epoch": 3774} {"train_loss": -6.891897678375244, "global_step": 158510, "epoch": 3774} {"train_loss": -6.8301520347595215, "global_step": 158511, "epoch": 3774} {"train_loss": -6.855256080627441, "global_step": 158512, "epoch": 3774} {"train_loss": -6.799525737762451, "global_step": 158513, "epoch": 3774} {"train_loss": -6.819096565246582, "global_step": 158514, "epoch": 3774} {"train_loss": -6.935091972351074, "global_step": 158515, "epoch": 3774} {"train_loss": -6.811456203460693, "global_step": 158516, "epoch": 3774} {"train_loss": -6.823251724243164, "global_step": 158517, "epoch": 3774} {"train_loss": -7.111484527587891, "global_step": 158518, "epoch": 3774} {"train_loss": -6.780026912689209, "global_step": 158519, "epoch": 3774} {"train_loss": -6.84764289855957, "global_step": 158520, "epoch": 3774} {"train_loss": -6.9048357009887695, "global_step": 158521, "epoch": 3774} {"train_loss": -6.848728656768799, "global_step": 158522, "epoch": 3774} {"train_loss": -6.9174041748046875, "global_step": 158523, "epoch": 3774} {"train_loss": -6.90646505355835, "global_step": 158524, "epoch": 3774} {"train_loss": -6.775444507598877, "global_step": 158525, "epoch": 3774} {"train_loss": -6.981656074523926, "global_step": 158526, "epoch": 3774} {"train_loss": -6.905242443084717, "global_step": 158527, "epoch": 3774} {"train_loss": -6.791173458099365, "global_step": 158528, "epoch": 3774} {"train_loss": -6.994414329528809, "global_step": 158529, "epoch": 3774} {"train_loss": -6.983218669891357, "global_step": 158530, "epoch": 3774} {"train_loss": -6.952419281005859, "global_step": 158531, "epoch": 3774} {"train_loss": -6.856557369232178, "global_step": 158532, "epoch": 3774} {"train_loss": -7.010656356811523, "global_step": 158533, "epoch": 3774} {"train_loss": -6.994675636291504, "global_step": 158534, "epoch": 3774} {"train_loss": -6.872066020965576, "global_step": 158535, "epoch": 3774} {"train_loss": -7.06574821472168, "global_step": 158536, "epoch": 3774} {"train_loss": -6.904808521270752, "global_step": 158537, "epoch": 3774} {"train_loss": -7.044978141784668, "global_step": 158538, "epoch": 3774} {"train_loss": -7.045963287353516, "global_step": 158539, "epoch": 3774} {"train_loss": -6.9007978439331055, "global_step": 158540, "epoch": 3774} {"train_loss": -6.995844841003418, "global_step": 158541, "epoch": 3774} {"train_loss": -6.982901573181152, "global_step": 158542, "epoch": 3774} {"train_loss": -6.886521339416504, "global_step": 158543, "epoch": 3774} {"train_loss": -6.830321311950684, "global_step": 158544, "epoch": 3774} {"train_loss": -6.943744659423828, "global_step": 158545, "epoch": 3774} {"train_loss": -6.752957344055176, "global_step": 158546, "epoch": 3774} {"train_loss": -6.988734245300293, "global_step": 158547, "epoch": 3774} {"train_loss": -6.842899799346924, "global_step": 158548, "epoch": 3774} {"train_loss": -6.909168493180048, "global_step": 158549, "epoch": 3774, "val_loss": 79270.5859375} {"train_loss": -6.786713123321533, "global_step": 158550, "epoch": 3775} {"train_loss": -6.907796859741211, "global_step": 158551, "epoch": 3775} {"train_loss": -6.933114051818848, "global_step": 158552, "epoch": 3775} {"train_loss": -6.818114280700684, "global_step": 158553, "epoch": 3775} {"train_loss": -6.939330577850342, "global_step": 158554, "epoch": 3775} {"train_loss": -7.024658679962158, "global_step": 158555, "epoch": 3775} {"train_loss": -6.8223557472229, "global_step": 158556, "epoch": 3775} {"train_loss": -6.969172477722168, "global_step": 158557, "epoch": 3775} {"train_loss": -7.013480186462402, "global_step": 158558, "epoch": 3775} {"train_loss": -6.967838287353516, "global_step": 158559, "epoch": 3775} {"train_loss": -6.983386039733887, "global_step": 158560, "epoch": 3775} {"train_loss": -6.895144939422607, "global_step": 158561, "epoch": 3775} {"train_loss": -7.005363941192627, "global_step": 158562, "epoch": 3775} {"train_loss": -7.036842346191406, "global_step": 158563, "epoch": 3775} {"train_loss": -6.911922454833984, "global_step": 158564, "epoch": 3775} {"train_loss": -7.035804748535156, "global_step": 158565, "epoch": 3775} {"train_loss": -7.002011299133301, "global_step": 158566, "epoch": 3775} {"train_loss": -6.869990825653076, "global_step": 158567, "epoch": 3775} {"train_loss": -7.008155822753906, "global_step": 158568, "epoch": 3775} {"train_loss": -6.867244720458984, "global_step": 158569, "epoch": 3775} {"train_loss": -6.948179244995117, "global_step": 158570, "epoch": 3775} {"train_loss": -6.822022914886475, "global_step": 158571, "epoch": 3775} {"train_loss": -6.834603309631348, "global_step": 158572, "epoch": 3775} {"train_loss": -7.066405296325684, "global_step": 158573, "epoch": 3775} {"train_loss": -6.981243133544922, "global_step": 158574, "epoch": 3775} {"train_loss": -7.021402359008789, "global_step": 158575, "epoch": 3775} {"train_loss": -6.931576728820801, "global_step": 158576, "epoch": 3775} {"train_loss": -6.956015586853027, "global_step": 158577, "epoch": 3775} {"train_loss": -6.9607038497924805, "global_step": 158578, "epoch": 3775} {"train_loss": -6.937385559082031, "global_step": 158579, "epoch": 3775} {"train_loss": -6.920864105224609, "global_step": 158580, "epoch": 3775} {"train_loss": -6.947547435760498, "global_step": 158581, "epoch": 3775} {"train_loss": -7.0038042068481445, "global_step": 158582, "epoch": 3775} {"train_loss": -7.081803321838379, "global_step": 158583, "epoch": 3775} {"train_loss": -6.913843154907227, "global_step": 158584, "epoch": 3775} {"train_loss": -6.940239429473877, "global_step": 158585, "epoch": 3775} {"train_loss": -6.998318672180176, "global_step": 158586, "epoch": 3775} {"train_loss": -6.990760803222656, "global_step": 158587, "epoch": 3775} {"train_loss": -7.070382595062256, "global_step": 158588, "epoch": 3775} {"train_loss": -7.0139312744140625, "global_step": 158589, "epoch": 3775} {"train_loss": -6.932803153991699, "global_step": 158590, "epoch": 3775} {"train_loss": -6.951071421305339, "global_step": 158591, "epoch": 3775, "val_loss": 79236.734375} {"train_loss": -6.978414535522461, "global_step": 158592, "epoch": 3776} {"train_loss": -6.886789798736572, "global_step": 158593, "epoch": 3776} {"train_loss": -6.9889936447143555, "global_step": 158594, "epoch": 3776} {"train_loss": -6.954991340637207, "global_step": 158595, "epoch": 3776} {"train_loss": -6.949389457702637, "global_step": 158596, "epoch": 3776} {"train_loss": -6.992574691772461, "global_step": 158597, "epoch": 3776} {"train_loss": -6.984392166137695, "global_step": 158598, "epoch": 3776} {"train_loss": -6.9386396408081055, "global_step": 158599, "epoch": 3776} {"train_loss": -6.821815013885498, "global_step": 158600, "epoch": 3776} {"train_loss": -7.0533366203308105, "global_step": 158601, "epoch": 3776} {"train_loss": -6.9313063621521, "global_step": 158602, "epoch": 3776} {"train_loss": -6.897822380065918, "global_step": 158603, "epoch": 3776} {"train_loss": -7.0154218673706055, "global_step": 158604, "epoch": 3776} {"train_loss": -6.9570207595825195, "global_step": 158605, "epoch": 3776} {"train_loss": -6.956897735595703, "global_step": 158606, "epoch": 3776} {"train_loss": -6.819850444793701, "global_step": 158607, "epoch": 3776} {"train_loss": -6.940351486206055, "global_step": 158608, "epoch": 3776} {"train_loss": -6.850203037261963, "global_step": 158609, "epoch": 3776} {"train_loss": -6.922032833099365, "global_step": 158610, "epoch": 3776} {"train_loss": -6.9328155517578125, "global_step": 158611, "epoch": 3776} {"train_loss": -6.88702392578125, "global_step": 158612, "epoch": 3776} {"train_loss": -6.967989921569824, "global_step": 158613, "epoch": 3776} {"train_loss": -6.9196672439575195, "global_step": 158614, "epoch": 3776} {"train_loss": -7.084619522094727, "global_step": 158615, "epoch": 3776} {"train_loss": -6.952639102935791, "global_step": 158616, "epoch": 3776} {"train_loss": -6.949865341186523, "global_step": 158617, "epoch": 3776} {"train_loss": -7.00429630279541, "global_step": 158618, "epoch": 3776} {"train_loss": -6.921281814575195, "global_step": 158619, "epoch": 3776} {"train_loss": -6.961968421936035, "global_step": 158620, "epoch": 3776} {"train_loss": -6.988184928894043, "global_step": 158621, "epoch": 3776} {"train_loss": -7.000405311584473, "global_step": 158622, "epoch": 3776} {"train_loss": -6.928632736206055, "global_step": 158623, "epoch": 3776} {"train_loss": -6.903020858764648, "global_step": 158624, "epoch": 3776} {"train_loss": -7.0010294914245605, "global_step": 158625, "epoch": 3776} {"train_loss": -6.987208366394043, "global_step": 158626, "epoch": 3776} {"train_loss": -7.013753414154053, "global_step": 158627, "epoch": 3776} {"train_loss": -6.988686561584473, "global_step": 158628, "epoch": 3776} {"train_loss": -6.928343772888184, "global_step": 158629, "epoch": 3776} {"train_loss": -6.881470680236816, "global_step": 158630, "epoch": 3776} {"train_loss": -6.971731662750244, "global_step": 158631, "epoch": 3776} {"train_loss": -6.922811031341553, "global_step": 158632, "epoch": 3776} {"train_loss": -6.949945938019526, "global_step": 158633, "epoch": 3776, "val_loss": 79563.7421875} {"train_loss": -6.796980381011963, "global_step": 158634, "epoch": 3777} {"train_loss": -7.028573989868164, "global_step": 158635, "epoch": 3777} {"train_loss": -6.749758243560791, "global_step": 158636, "epoch": 3777} {"train_loss": -6.747664928436279, "global_step": 158637, "epoch": 3777} {"train_loss": -6.899127960205078, "global_step": 158638, "epoch": 3777} {"train_loss": -6.890835762023926, "global_step": 158639, "epoch": 3777} {"train_loss": -6.9436564445495605, "global_step": 158640, "epoch": 3777} {"train_loss": -6.968929767608643, "global_step": 158641, "epoch": 3777} {"train_loss": -6.8806843757629395, "global_step": 158642, "epoch": 3777} {"train_loss": -7.006487846374512, "global_step": 158643, "epoch": 3777} {"train_loss": -6.837096214294434, "global_step": 158644, "epoch": 3777} {"train_loss": -6.902112007141113, "global_step": 158645, "epoch": 3777} {"train_loss": -6.8936262130737305, "global_step": 158646, "epoch": 3777} {"train_loss": -6.865373134613037, "global_step": 158647, "epoch": 3777} {"train_loss": -6.826268196105957, "global_step": 158648, "epoch": 3777} {"train_loss": -6.841457366943359, "global_step": 158649, "epoch": 3777} {"train_loss": -6.948596954345703, "global_step": 158650, "epoch": 3777} {"train_loss": -6.982548236846924, "global_step": 158651, "epoch": 3777} {"train_loss": -6.929075241088867, "global_step": 158652, "epoch": 3777} {"train_loss": -6.871140480041504, "global_step": 158653, "epoch": 3777} {"train_loss": -7.0007452964782715, "global_step": 158654, "epoch": 3777} {"train_loss": -6.826861381530762, "global_step": 158655, "epoch": 3777} {"train_loss": -7.033199310302734, "global_step": 158656, "epoch": 3777} {"train_loss": -6.88084602355957, "global_step": 158657, "epoch": 3777} {"train_loss": -6.9093146324157715, "global_step": 158658, "epoch": 3777} {"train_loss": -7.015089988708496, "global_step": 158659, "epoch": 3777} {"train_loss": -6.859219551086426, "global_step": 158660, "epoch": 3777} {"train_loss": -6.939413070678711, "global_step": 158661, "epoch": 3777} {"train_loss": -6.910358428955078, "global_step": 158662, "epoch": 3777} {"train_loss": -6.927093505859375, "global_step": 158663, "epoch": 3777} {"train_loss": -6.892664432525635, "global_step": 158664, "epoch": 3777} {"train_loss": -6.9317121505737305, "global_step": 158665, "epoch": 3777} {"train_loss": -6.90768575668335, "global_step": 158666, "epoch": 3777} {"train_loss": -6.861919403076172, "global_step": 158667, "epoch": 3777} {"train_loss": -6.7888569831848145, "global_step": 158668, "epoch": 3777} {"train_loss": -6.986109256744385, "global_step": 158669, "epoch": 3777} {"train_loss": -6.898621559143066, "global_step": 158670, "epoch": 3777} {"train_loss": -6.891449451446533, "global_step": 158671, "epoch": 3777} {"train_loss": -6.880197525024414, "global_step": 158672, "epoch": 3777} {"train_loss": -6.876446723937988, "global_step": 158673, "epoch": 3777} {"train_loss": -6.833797454833984, "global_step": 158674, "epoch": 3777} {"train_loss": -6.898873204276676, "global_step": 158675, "epoch": 3777, "val_loss": 79068.3125} {"train_loss": -6.9721879959106445, "global_step": 158676, "epoch": 3778} {"train_loss": -6.907429218292236, "global_step": 158677, "epoch": 3778} {"train_loss": -6.933514595031738, "global_step": 158678, "epoch": 3778} {"train_loss": -6.818109035491943, "global_step": 158679, "epoch": 3778} {"train_loss": -6.910399436950684, "global_step": 158680, "epoch": 3778} {"train_loss": -7.042279243469238, "global_step": 158681, "epoch": 3778} {"train_loss": -6.826874256134033, "global_step": 158682, "epoch": 3778} {"train_loss": -6.9197187423706055, "global_step": 158683, "epoch": 3778} {"train_loss": -7.003719329833984, "global_step": 158684, "epoch": 3778} {"train_loss": -6.933009147644043, "global_step": 158685, "epoch": 3778} {"train_loss": -6.92540168762207, "global_step": 158686, "epoch": 3778} {"train_loss": -6.793003082275391, "global_step": 158687, "epoch": 3778} {"train_loss": -6.890190601348877, "global_step": 158688, "epoch": 3778} {"train_loss": -6.877839088439941, "global_step": 158689, "epoch": 3778} {"train_loss": -7.014553070068359, "global_step": 158690, "epoch": 3778} {"train_loss": -6.768315315246582, "global_step": 158691, "epoch": 3778} {"train_loss": -7.014366149902344, "global_step": 158692, "epoch": 3778} {"train_loss": -6.85024356842041, "global_step": 158693, "epoch": 3778} {"train_loss": -6.798788547515869, "global_step": 158694, "epoch": 3778} {"train_loss": -6.971321105957031, "global_step": 158695, "epoch": 3778} {"train_loss": -6.7658281326293945, "global_step": 158696, "epoch": 3778} {"train_loss": -7.027359962463379, "global_step": 158697, "epoch": 3778} {"train_loss": -6.8977742195129395, "global_step": 158698, "epoch": 3778} {"train_loss": -6.8909454345703125, "global_step": 158699, "epoch": 3778} {"train_loss": -6.9782257080078125, "global_step": 158700, "epoch": 3778} {"train_loss": -6.890735626220703, "global_step": 158701, "epoch": 3778} {"train_loss": -6.974078178405762, "global_step": 158702, "epoch": 3778} {"train_loss": -7.008414268493652, "global_step": 158703, "epoch": 3778} {"train_loss": -6.929068565368652, "global_step": 158704, "epoch": 3778} {"train_loss": -6.890978813171387, "global_step": 158705, "epoch": 3778} {"train_loss": -6.952879905700684, "global_step": 158706, "epoch": 3778} {"train_loss": -6.863189220428467, "global_step": 158707, "epoch": 3778} {"train_loss": -6.926822662353516, "global_step": 158708, "epoch": 3778} {"train_loss": -6.870099067687988, "global_step": 158709, "epoch": 3778} {"train_loss": -6.966762065887451, "global_step": 158710, "epoch": 3778} {"train_loss": -6.9171953201293945, "global_step": 158711, "epoch": 3778} {"train_loss": -6.857914447784424, "global_step": 158712, "epoch": 3778} {"train_loss": -6.8558807373046875, "global_step": 158713, "epoch": 3778} {"train_loss": -6.984352111816406, "global_step": 158714, "epoch": 3778} {"train_loss": -6.892032623291016, "global_step": 158715, "epoch": 3778} {"train_loss": -6.942749977111816, "global_step": 158716, "epoch": 3778} {"train_loss": -6.912778366179693, "global_step": 158717, "epoch": 3778, "val_loss": 79132.1328125} {"train_loss": -6.963791847229004, "global_step": 158718, "epoch": 3779} {"train_loss": -6.908902645111084, "global_step": 158719, "epoch": 3779} {"train_loss": -6.809138298034668, "global_step": 158720, "epoch": 3779} {"train_loss": -6.96796989440918, "global_step": 158721, "epoch": 3779} {"train_loss": -6.911137580871582, "global_step": 158722, "epoch": 3779} {"train_loss": -6.944877624511719, "global_step": 158723, "epoch": 3779} {"train_loss": -6.897615432739258, "global_step": 158724, "epoch": 3779} {"train_loss": -6.959370136260986, "global_step": 158725, "epoch": 3779} {"train_loss": -6.879022598266602, "global_step": 158726, "epoch": 3779} {"train_loss": -6.857448577880859, "global_step": 158727, "epoch": 3779} {"train_loss": -6.983010292053223, "global_step": 158728, "epoch": 3779} {"train_loss": -6.933246612548828, "global_step": 158729, "epoch": 3779} {"train_loss": -6.993200302124023, "global_step": 158730, "epoch": 3779} {"train_loss": -6.957009792327881, "global_step": 158731, "epoch": 3779} {"train_loss": -6.991266250610352, "global_step": 158732, "epoch": 3779} {"train_loss": -6.960057258605957, "global_step": 158733, "epoch": 3779} {"train_loss": -7.076677322387695, "global_step": 158734, "epoch": 3779} {"train_loss": -6.896819114685059, "global_step": 158735, "epoch": 3779} {"train_loss": -6.973198890686035, "global_step": 158736, "epoch": 3779} {"train_loss": -6.847473621368408, "global_step": 158737, "epoch": 3779} {"train_loss": -6.92707633972168, "global_step": 158738, "epoch": 3779} {"train_loss": -6.985179901123047, "global_step": 158739, "epoch": 3779} {"train_loss": -6.930359840393066, "global_step": 158740, "epoch": 3779} {"train_loss": -6.878981590270996, "global_step": 158741, "epoch": 3779} {"train_loss": -6.922335624694824, "global_step": 158742, "epoch": 3779} {"train_loss": -6.995131492614746, "global_step": 158743, "epoch": 3779} {"train_loss": -6.921288967132568, "global_step": 158744, "epoch": 3779} {"train_loss": -6.98966121673584, "global_step": 158745, "epoch": 3779} {"train_loss": -6.921469688415527, "global_step": 158746, "epoch": 3779} {"train_loss": -6.850892066955566, "global_step": 158747, "epoch": 3779} {"train_loss": -6.86900520324707, "global_step": 158748, "epoch": 3779} {"train_loss": -6.900653839111328, "global_step": 158749, "epoch": 3779} {"train_loss": -6.879524230957031, "global_step": 158750, "epoch": 3779} {"train_loss": -6.957549571990967, "global_step": 158751, "epoch": 3779} {"train_loss": -6.957317352294922, "global_step": 158752, "epoch": 3779} {"train_loss": -6.892513275146484, "global_step": 158753, "epoch": 3779} {"train_loss": -6.91187047958374, "global_step": 158754, "epoch": 3779} {"train_loss": -6.935421466827393, "global_step": 158755, "epoch": 3779} {"train_loss": -6.87782621383667, "global_step": 158756, "epoch": 3779} {"train_loss": -7.062139511108398, "global_step": 158757, "epoch": 3779} {"train_loss": -6.996993064880371, "global_step": 158758, "epoch": 3779} {"train_loss": -6.932985578264509, "global_step": 158759, "epoch": 3779, "val_loss": 79242.5390625} {"train_loss": -7.003634452819824, "global_step": 158760, "epoch": 3780} {"train_loss": -6.922451019287109, "global_step": 158761, "epoch": 3780} {"train_loss": -6.998283386230469, "global_step": 158762, "epoch": 3780} {"train_loss": -6.997906684875488, "global_step": 158763, "epoch": 3780} {"train_loss": -7.028903484344482, "global_step": 158764, "epoch": 3780} {"train_loss": -7.0065083503723145, "global_step": 158765, "epoch": 3780} {"train_loss": -7.008899688720703, "global_step": 158766, "epoch": 3780} {"train_loss": -6.924127578735352, "global_step": 158767, "epoch": 3780} {"train_loss": -6.932125568389893, "global_step": 158768, "epoch": 3780} {"train_loss": -7.093042373657227, "global_step": 158769, "epoch": 3780} {"train_loss": -6.986655235290527, "global_step": 158770, "epoch": 3780} {"train_loss": -6.970337390899658, "global_step": 158771, "epoch": 3780} {"train_loss": -6.880800247192383, "global_step": 158772, "epoch": 3780} {"train_loss": -6.911740303039551, "global_step": 158773, "epoch": 3780} {"train_loss": -7.03516960144043, "global_step": 158774, "epoch": 3780} {"train_loss": -7.0452470779418945, "global_step": 158775, "epoch": 3780} {"train_loss": -7.005393981933594, "global_step": 158776, "epoch": 3780} {"train_loss": -6.98369836807251, "global_step": 158777, "epoch": 3780} {"train_loss": -6.951653957366943, "global_step": 158778, "epoch": 3780} {"train_loss": -6.87080192565918, "global_step": 158779, "epoch": 3780} {"train_loss": -6.920896530151367, "global_step": 158780, "epoch": 3780} {"train_loss": -6.865114688873291, "global_step": 158781, "epoch": 3780} {"train_loss": -6.908036708831787, "global_step": 158782, "epoch": 3780} {"train_loss": -6.915127277374268, "global_step": 158783, "epoch": 3780} {"train_loss": -6.87443733215332, "global_step": 158784, "epoch": 3780} {"train_loss": -6.953423500061035, "global_step": 158785, "epoch": 3780} {"train_loss": -6.877384662628174, "global_step": 158786, "epoch": 3780} {"train_loss": -6.79168701171875, "global_step": 158787, "epoch": 3780} {"train_loss": -6.937199592590332, "global_step": 158788, "epoch": 3780} {"train_loss": -6.976433753967285, "global_step": 158789, "epoch": 3780} {"train_loss": -6.894097805023193, "global_step": 158790, "epoch": 3780} {"train_loss": -6.852506637573242, "global_step": 158791, "epoch": 3780} {"train_loss": -6.837378025054932, "global_step": 158792, "epoch": 3780} {"train_loss": -6.922738075256348, "global_step": 158793, "epoch": 3780} {"train_loss": -6.81833553314209, "global_step": 158794, "epoch": 3780} {"train_loss": -6.639537334442139, "global_step": 158795, "epoch": 3780} {"train_loss": -6.997563362121582, "global_step": 158796, "epoch": 3780} {"train_loss": -6.7233099937438965, "global_step": 158797, "epoch": 3780} {"train_loss": -6.759592056274414, "global_step": 158798, "epoch": 3780} {"train_loss": -6.9301252365112305, "global_step": 158799, "epoch": 3780} {"train_loss": -6.818471908569336, "global_step": 158800, "epoch": 3780} {"train_loss": -6.9194771108173185, "global_step": 158801, "epoch": 3780, "val_loss": 79017.1484375} {"train_loss": -6.754456520080566, "global_step": 158802, "epoch": 3781} {"train_loss": -6.901116371154785, "global_step": 158803, "epoch": 3781} {"train_loss": -6.713696479797363, "global_step": 158804, "epoch": 3781} {"train_loss": -6.789095878601074, "global_step": 158805, "epoch": 3781} {"train_loss": -6.846142768859863, "global_step": 158806, "epoch": 3781} {"train_loss": -6.7227044105529785, "global_step": 158807, "epoch": 3781} {"train_loss": -6.967932224273682, "global_step": 158808, "epoch": 3781} {"train_loss": -6.779172420501709, "global_step": 158809, "epoch": 3781} {"train_loss": -6.933071136474609, "global_step": 158810, "epoch": 3781} {"train_loss": -6.932959079742432, "global_step": 158811, "epoch": 3781} {"train_loss": -6.92773962020874, "global_step": 158812, "epoch": 3781} {"train_loss": -6.82187557220459, "global_step": 158813, "epoch": 3781} {"train_loss": -6.873817443847656, "global_step": 158814, "epoch": 3781} {"train_loss": -6.865616798400879, "global_step": 158815, "epoch": 3781} {"train_loss": -6.95517635345459, "global_step": 158816, "epoch": 3781} {"train_loss": -6.792642593383789, "global_step": 158817, "epoch": 3781} {"train_loss": -6.935946464538574, "global_step": 158818, "epoch": 3781} {"train_loss": -6.9339141845703125, "global_step": 158819, "epoch": 3781} {"train_loss": -6.7964019775390625, "global_step": 158820, "epoch": 3781} {"train_loss": -7.027998924255371, "global_step": 158821, "epoch": 3781} {"train_loss": -6.963766098022461, "global_step": 158822, "epoch": 3781} {"train_loss": -7.058807373046875, "global_step": 158823, "epoch": 3781} {"train_loss": -6.865521430969238, "global_step": 158824, "epoch": 3781} {"train_loss": -7.1005144119262695, "global_step": 158825, "epoch": 3781} {"train_loss": -6.984318733215332, "global_step": 158826, "epoch": 3781} {"train_loss": -6.9711198806762695, "global_step": 158827, "epoch": 3781} {"train_loss": -7.00993537902832, "global_step": 158828, "epoch": 3781} {"train_loss": -6.945608139038086, "global_step": 158829, "epoch": 3781} {"train_loss": -7.060340404510498, "global_step": 158830, "epoch": 3781} {"train_loss": -7.109092712402344, "global_step": 158831, "epoch": 3781} {"train_loss": -7.010339736938477, "global_step": 158832, "epoch": 3781} {"train_loss": -6.972641468048096, "global_step": 158833, "epoch": 3781} {"train_loss": -6.909543991088867, "global_step": 158834, "epoch": 3781} {"train_loss": -7.012221813201904, "global_step": 158835, "epoch": 3781} {"train_loss": -6.941952705383301, "global_step": 158836, "epoch": 3781} {"train_loss": -6.954686164855957, "global_step": 158837, "epoch": 3781} {"train_loss": -6.968448638916016, "global_step": 158838, "epoch": 3781} {"train_loss": -7.0791826248168945, "global_step": 158839, "epoch": 3781} {"train_loss": -6.883679389953613, "global_step": 158840, "epoch": 3781} {"train_loss": -7.005895614624023, "global_step": 158841, "epoch": 3781} {"train_loss": -6.898253917694092, "global_step": 158842, "epoch": 3781} {"train_loss": -6.926632120495751, "global_step": 158843, "epoch": 3781, "val_loss": 79400.21875} {"train_loss": -6.980007648468018, "global_step": 158844, "epoch": 3782} {"train_loss": -7.030701160430908, "global_step": 158845, "epoch": 3782} {"train_loss": -6.82606315612793, "global_step": 158846, "epoch": 3782} {"train_loss": -6.931542873382568, "global_step": 158847, "epoch": 3782} {"train_loss": -6.9434614181518555, "global_step": 158848, "epoch": 3782} {"train_loss": -6.866127967834473, "global_step": 158849, "epoch": 3782} {"train_loss": -6.9722137451171875, "global_step": 158850, "epoch": 3782} {"train_loss": -6.931051254272461, "global_step": 158851, "epoch": 3782} {"train_loss": -6.913951873779297, "global_step": 158852, "epoch": 3782} {"train_loss": -6.862825393676758, "global_step": 158853, "epoch": 3782} {"train_loss": -6.909307956695557, "global_step": 158854, "epoch": 3782} {"train_loss": -6.997201442718506, "global_step": 158855, "epoch": 3782} {"train_loss": -6.809162139892578, "global_step": 158856, "epoch": 3782} {"train_loss": -6.959824085235596, "global_step": 158857, "epoch": 3782} {"train_loss": -6.8338189125061035, "global_step": 158858, "epoch": 3782} {"train_loss": -7.000064849853516, "global_step": 158859, "epoch": 3782} {"train_loss": -6.901310920715332, "global_step": 158860, "epoch": 3782} {"train_loss": -6.906764030456543, "global_step": 158861, "epoch": 3782} {"train_loss": -7.032323837280273, "global_step": 158862, "epoch": 3782} {"train_loss": -6.944729804992676, "global_step": 158863, "epoch": 3782} {"train_loss": -6.981069564819336, "global_step": 158864, "epoch": 3782} {"train_loss": -6.9055986404418945, "global_step": 158865, "epoch": 3782} {"train_loss": -7.10056209564209, "global_step": 158866, "epoch": 3782} {"train_loss": -6.901242256164551, "global_step": 158867, "epoch": 3782} {"train_loss": -6.905686378479004, "global_step": 158868, "epoch": 3782} {"train_loss": -7.081775665283203, "global_step": 158869, "epoch": 3782} {"train_loss": -6.87501335144043, "global_step": 158870, "epoch": 3782} {"train_loss": -7.076136589050293, "global_step": 158871, "epoch": 3782} {"train_loss": -6.971435546875, "global_step": 158872, "epoch": 3782} {"train_loss": -7.004487037658691, "global_step": 158873, "epoch": 3782} {"train_loss": -6.950993061065674, "global_step": 158874, "epoch": 3782} {"train_loss": -7.006249904632568, "global_step": 158875, "epoch": 3782} {"train_loss": -6.880248069763184, "global_step": 158876, "epoch": 3782} {"train_loss": -6.927695274353027, "global_step": 158877, "epoch": 3782} {"train_loss": -7.0310468673706055, "global_step": 158878, "epoch": 3782} {"train_loss": -6.956758499145508, "global_step": 158879, "epoch": 3782} {"train_loss": -7.007928848266602, "global_step": 158880, "epoch": 3782} {"train_loss": -7.006263732910156, "global_step": 158881, "epoch": 3782} {"train_loss": -7.016364574432373, "global_step": 158882, "epoch": 3782} {"train_loss": -6.93755578994751, "global_step": 158883, "epoch": 3782} {"train_loss": -6.91115665435791, "global_step": 158884, "epoch": 3782} {"train_loss": -6.950158357620239, "global_step": 158885, "epoch": 3782, "val_loss": 79175.078125} {"train_loss": -7.0190629959106445, "global_step": 158886, "epoch": 3783} {"train_loss": -7.007309913635254, "global_step": 158887, "epoch": 3783} {"train_loss": -6.997811794281006, "global_step": 158888, "epoch": 3783} {"train_loss": -6.986774444580078, "global_step": 158889, "epoch": 3783} {"train_loss": -6.946798324584961, "global_step": 158890, "epoch": 3783} {"train_loss": -6.885756969451904, "global_step": 158891, "epoch": 3783} {"train_loss": -6.969280242919922, "global_step": 158892, "epoch": 3783} {"train_loss": -6.868926048278809, "global_step": 158893, "epoch": 3783} {"train_loss": -6.990875244140625, "global_step": 158894, "epoch": 3783} {"train_loss": -7.009279251098633, "global_step": 158895, "epoch": 3783} {"train_loss": -6.95655632019043, "global_step": 158896, "epoch": 3783} {"train_loss": -7.01621150970459, "global_step": 158897, "epoch": 3783} {"train_loss": -6.94638729095459, "global_step": 158898, "epoch": 3783} {"train_loss": -6.805995941162109, "global_step": 158899, "epoch": 3783} {"train_loss": -6.983829498291016, "global_step": 158900, "epoch": 3783} {"train_loss": -6.96111536026001, "global_step": 158901, "epoch": 3783} {"train_loss": -6.954094886779785, "global_step": 158902, "epoch": 3783} {"train_loss": -6.950127601623535, "global_step": 158903, "epoch": 3783} {"train_loss": -6.968509674072266, "global_step": 158904, "epoch": 3783} {"train_loss": -7.034788608551025, "global_step": 158905, "epoch": 3783} {"train_loss": -6.907434463500977, "global_step": 158906, "epoch": 3783} {"train_loss": -7.025907516479492, "global_step": 158907, "epoch": 3783} {"train_loss": -6.900905132293701, "global_step": 158908, "epoch": 3783} {"train_loss": -6.906447410583496, "global_step": 158909, "epoch": 3783} {"train_loss": -7.11734676361084, "global_step": 158910, "epoch": 3783} {"train_loss": -6.979000091552734, "global_step": 158911, "epoch": 3783} {"train_loss": -6.894609451293945, "global_step": 158912, "epoch": 3783} {"train_loss": -6.925385475158691, "global_step": 158913, "epoch": 3783} {"train_loss": -6.984487533569336, "global_step": 158914, "epoch": 3783} {"train_loss": -6.9216837882995605, "global_step": 158915, "epoch": 3783} {"train_loss": -6.9303364753723145, "global_step": 158916, "epoch": 3783} {"train_loss": -6.996450424194336, "global_step": 158917, "epoch": 3783} {"train_loss": -6.956437110900879, "global_step": 158918, "epoch": 3783} {"train_loss": -6.9045820236206055, "global_step": 158919, "epoch": 3783} {"train_loss": -6.884228706359863, "global_step": 158920, "epoch": 3783} {"train_loss": -6.970917224884033, "global_step": 158921, "epoch": 3783} {"train_loss": -6.866052627563477, "global_step": 158922, "epoch": 3783} {"train_loss": -6.801845073699951, "global_step": 158923, "epoch": 3783} {"train_loss": -6.841516017913818, "global_step": 158924, "epoch": 3783} {"train_loss": -7.006483554840088, "global_step": 158925, "epoch": 3783} {"train_loss": -6.909534454345703, "global_step": 158926, "epoch": 3783} {"train_loss": -6.949808018548148, "global_step": 158927, "epoch": 3783, "val_loss": 79256.1328125} {"train_loss": -6.885168552398682, "global_step": 158928, "epoch": 3784} {"train_loss": -6.870797157287598, "global_step": 158929, "epoch": 3784} {"train_loss": -6.859820365905762, "global_step": 158930, "epoch": 3784} {"train_loss": -6.975379467010498, "global_step": 158931, "epoch": 3784} {"train_loss": -6.898883819580078, "global_step": 158932, "epoch": 3784} {"train_loss": -6.780427932739258, "global_step": 158933, "epoch": 3784} {"train_loss": -6.987654209136963, "global_step": 158934, "epoch": 3784} {"train_loss": -6.8579864501953125, "global_step": 158935, "epoch": 3784} {"train_loss": -6.930507659912109, "global_step": 158936, "epoch": 3784} {"train_loss": -6.9182610511779785, "global_step": 158937, "epoch": 3784} {"train_loss": -6.830209732055664, "global_step": 158938, "epoch": 3784} {"train_loss": -6.8996453285217285, "global_step": 158939, "epoch": 3784} {"train_loss": -6.960506439208984, "global_step": 158940, "epoch": 3784} {"train_loss": -6.880965232849121, "global_step": 158941, "epoch": 3784} {"train_loss": -6.810632228851318, "global_step": 158942, "epoch": 3784} {"train_loss": -7.075241565704346, "global_step": 158943, "epoch": 3784} {"train_loss": -6.847439765930176, "global_step": 158944, "epoch": 3784} {"train_loss": -6.9959001541137695, "global_step": 158945, "epoch": 3784} {"train_loss": -6.913125038146973, "global_step": 158946, "epoch": 3784} {"train_loss": -6.977681636810303, "global_step": 158947, "epoch": 3784} {"train_loss": -6.852782249450684, "global_step": 158948, "epoch": 3784} {"train_loss": -6.889172554016113, "global_step": 158949, "epoch": 3784} {"train_loss": -6.877504348754883, "global_step": 158950, "epoch": 3784} {"train_loss": -7.028752326965332, "global_step": 158951, "epoch": 3784} {"train_loss": -6.970806121826172, "global_step": 158952, "epoch": 3784} {"train_loss": -6.950090408325195, "global_step": 158953, "epoch": 3784} {"train_loss": -6.958856582641602, "global_step": 158954, "epoch": 3784} {"train_loss": -6.860610008239746, "global_step": 158955, "epoch": 3784} {"train_loss": -6.926896095275879, "global_step": 158956, "epoch": 3784} {"train_loss": -6.8635663986206055, "global_step": 158957, "epoch": 3784} {"train_loss": -6.851016044616699, "global_step": 158958, "epoch": 3784} {"train_loss": -6.940384864807129, "global_step": 158959, "epoch": 3784} {"train_loss": -6.809475898742676, "global_step": 158960, "epoch": 3784} {"train_loss": -6.887397289276123, "global_step": 158961, "epoch": 3784} {"train_loss": -6.984010696411133, "global_step": 158962, "epoch": 3784} {"train_loss": -6.831210613250732, "global_step": 158963, "epoch": 3784} {"train_loss": -7.020175933837891, "global_step": 158964, "epoch": 3784} {"train_loss": -6.944647312164307, "global_step": 158965, "epoch": 3784} {"train_loss": -6.923774242401123, "global_step": 158966, "epoch": 3784} {"train_loss": -6.911479949951172, "global_step": 158967, "epoch": 3784} {"train_loss": -6.950837135314941, "global_step": 158968, "epoch": 3784} {"train_loss": -6.913762058530535, "global_step": 158969, "epoch": 3784, "val_loss": 79140.046875} {"train_loss": -6.986459732055664, "global_step": 158970, "epoch": 3785} {"train_loss": -6.880068302154541, "global_step": 158971, "epoch": 3785} {"train_loss": -6.989184856414795, "global_step": 158972, "epoch": 3785} {"train_loss": -7.015453338623047, "global_step": 158973, "epoch": 3785} {"train_loss": -6.997247695922852, "global_step": 158974, "epoch": 3785} {"train_loss": -6.908912658691406, "global_step": 158975, "epoch": 3785} {"train_loss": -6.870950222015381, "global_step": 158976, "epoch": 3785} {"train_loss": -6.958645820617676, "global_step": 158977, "epoch": 3785} {"train_loss": -6.929975509643555, "global_step": 158978, "epoch": 3785} {"train_loss": -6.974296569824219, "global_step": 158979, "epoch": 3785} {"train_loss": -7.040771484375, "global_step": 158980, "epoch": 3785} {"train_loss": -6.912200450897217, "global_step": 158981, "epoch": 3785} {"train_loss": -7.010712623596191, "global_step": 158982, "epoch": 3785} {"train_loss": -7.042088031768799, "global_step": 158983, "epoch": 3785} {"train_loss": -7.015018463134766, "global_step": 158984, "epoch": 3785} {"train_loss": -7.02764892578125, "global_step": 158985, "epoch": 3785} {"train_loss": -7.03501033782959, "global_step": 158986, "epoch": 3785} {"train_loss": -7.016634941101074, "global_step": 158987, "epoch": 3785} {"train_loss": -6.990218162536621, "global_step": 158988, "epoch": 3785} {"train_loss": -6.9951171875, "global_step": 158989, "epoch": 3785} {"train_loss": -6.984294891357422, "global_step": 158990, "epoch": 3785} {"train_loss": -7.04465389251709, "global_step": 158991, "epoch": 3785} {"train_loss": -6.979213714599609, "global_step": 158992, "epoch": 3785} {"train_loss": -6.909491539001465, "global_step": 158993, "epoch": 3785} {"train_loss": -6.980722427368164, "global_step": 158994, "epoch": 3785} {"train_loss": -7.0614013671875, "global_step": 158995, "epoch": 3785} {"train_loss": -7.0452375411987305, "global_step": 158996, "epoch": 3785} {"train_loss": -7.060703277587891, "global_step": 158997, "epoch": 3785} {"train_loss": -7.0236663818359375, "global_step": 158998, "epoch": 3785} {"train_loss": -7.064081192016602, "global_step": 158999, "epoch": 3785} {"train_loss": -6.950292110443115, "global_step": 159000, "epoch": 3785} {"train_loss": -6.995855331420898, "global_step": 159001, "epoch": 3785} {"train_loss": -6.949807643890381, "global_step": 159002, "epoch": 3785} {"train_loss": -6.9398040771484375, "global_step": 159003, "epoch": 3785} {"train_loss": -7.118113040924072, "global_step": 159004, "epoch": 3785} {"train_loss": -7.060516357421875, "global_step": 159005, "epoch": 3785} {"train_loss": -7.075115203857422, "global_step": 159006, "epoch": 3785} {"train_loss": -7.0005388259887695, "global_step": 159007, "epoch": 3785} {"train_loss": -7.101054668426514, "global_step": 159008, "epoch": 3785} {"train_loss": -6.968549728393555, "global_step": 159009, "epoch": 3785} {"train_loss": -6.908507823944092, "global_step": 159010, "epoch": 3785} {"train_loss": -6.9933860301971436, "global_step": 159011, "epoch": 3785, "val_loss": 79117.3359375} {"train_loss": -7.241080284118652, "global_step": 159012, "epoch": 3786} {"train_loss": -6.975808143615723, "global_step": 159013, "epoch": 3786} {"train_loss": -6.921413421630859, "global_step": 159014, "epoch": 3786} {"train_loss": -7.081177711486816, "global_step": 159015, "epoch": 3786} {"train_loss": -6.920924186706543, "global_step": 159016, "epoch": 3786} {"train_loss": -7.019881248474121, "global_step": 159017, "epoch": 3786} {"train_loss": -7.045436382293701, "global_step": 159018, "epoch": 3786} {"train_loss": -7.030529022216797, "global_step": 159019, "epoch": 3786} {"train_loss": -6.899926662445068, "global_step": 159020, "epoch": 3786} {"train_loss": -7.001316070556641, "global_step": 159021, "epoch": 3786} {"train_loss": -6.979361057281494, "global_step": 159022, "epoch": 3786} {"train_loss": -7.001519203186035, "global_step": 159023, "epoch": 3786} {"train_loss": -6.956275939941406, "global_step": 159024, "epoch": 3786} {"train_loss": -6.953585624694824, "global_step": 159025, "epoch": 3786} {"train_loss": -6.951557159423828, "global_step": 159026, "epoch": 3786} {"train_loss": -6.879019737243652, "global_step": 159027, "epoch": 3786} {"train_loss": -6.9398298263549805, "global_step": 159028, "epoch": 3786} {"train_loss": -6.916412353515625, "global_step": 159029, "epoch": 3786} {"train_loss": -6.92112922668457, "global_step": 159030, "epoch": 3786} {"train_loss": -7.005753040313721, "global_step": 159031, "epoch": 3786} {"train_loss": -6.829427719116211, "global_step": 159032, "epoch": 3786} {"train_loss": -6.89475154876709, "global_step": 159033, "epoch": 3786} {"train_loss": -6.8389573097229, "global_step": 159034, "epoch": 3786} {"train_loss": -6.841223239898682, "global_step": 159035, "epoch": 3786} {"train_loss": -6.880769729614258, "global_step": 159036, "epoch": 3786} {"train_loss": -6.902449607849121, "global_step": 159037, "epoch": 3786} {"train_loss": -6.89508056640625, "global_step": 159038, "epoch": 3786} {"train_loss": -6.855396270751953, "global_step": 159039, "epoch": 3786} {"train_loss": -6.898818492889404, "global_step": 159040, "epoch": 3786} {"train_loss": -6.7988996505737305, "global_step": 159041, "epoch": 3786} {"train_loss": -6.901490688323975, "global_step": 159042, "epoch": 3786} {"train_loss": -6.910440921783447, "global_step": 159043, "epoch": 3786} {"train_loss": -6.843073844909668, "global_step": 159044, "epoch": 3786} {"train_loss": -6.841817855834961, "global_step": 159045, "epoch": 3786} {"train_loss": -6.922834396362305, "global_step": 159046, "epoch": 3786} {"train_loss": -6.902196884155273, "global_step": 159047, "epoch": 3786} {"train_loss": -6.772495269775391, "global_step": 159048, "epoch": 3786} {"train_loss": -6.871232032775879, "global_step": 159049, "epoch": 3786} {"train_loss": -6.9244184494018555, "global_step": 159050, "epoch": 3786} {"train_loss": -6.7843780517578125, "global_step": 159051, "epoch": 3786} {"train_loss": -6.879657745361328, "global_step": 159052, "epoch": 3786} {"train_loss": -6.922879593712943, "global_step": 159053, "epoch": 3786, "val_loss": 79188.0078125} {"train_loss": -6.9430646896362305, "global_step": 159054, "epoch": 3787} {"train_loss": -6.925609588623047, "global_step": 159055, "epoch": 3787} {"train_loss": -6.960597991943359, "global_step": 159056, "epoch": 3787} {"train_loss": -6.90641975402832, "global_step": 159057, "epoch": 3787} {"train_loss": -6.959746837615967, "global_step": 159058, "epoch": 3787} {"train_loss": -6.896822929382324, "global_step": 159059, "epoch": 3787} {"train_loss": -6.996707439422607, "global_step": 159060, "epoch": 3787} {"train_loss": -7.069498062133789, "global_step": 159061, "epoch": 3787} {"train_loss": -6.949517250061035, "global_step": 159062, "epoch": 3787} {"train_loss": -6.9127092361450195, "global_step": 159063, "epoch": 3787} {"train_loss": -7.029574394226074, "global_step": 159064, "epoch": 3787} {"train_loss": -6.900215148925781, "global_step": 159065, "epoch": 3787} {"train_loss": -6.919422149658203, "global_step": 159066, "epoch": 3787} {"train_loss": -7.040281772613525, "global_step": 159067, "epoch": 3787} {"train_loss": -7.046761512756348, "global_step": 159068, "epoch": 3787} {"train_loss": -6.950831413269043, "global_step": 159069, "epoch": 3787} {"train_loss": -6.95783805847168, "global_step": 159070, "epoch": 3787} {"train_loss": -6.972204685211182, "global_step": 159071, "epoch": 3787} {"train_loss": -6.920263767242432, "global_step": 159072, "epoch": 3787} {"train_loss": -6.913799285888672, "global_step": 159073, "epoch": 3787} {"train_loss": -6.9546403884887695, "global_step": 159074, "epoch": 3787} {"train_loss": -6.853227615356445, "global_step": 159075, "epoch": 3787} {"train_loss": -6.744808197021484, "global_step": 159076, "epoch": 3787} {"train_loss": -6.86641788482666, "global_step": 159077, "epoch": 3787} {"train_loss": -7.023840427398682, "global_step": 159078, "epoch": 3787} {"train_loss": -6.879404067993164, "global_step": 159079, "epoch": 3787} {"train_loss": -7.030298233032227, "global_step": 159080, "epoch": 3787} {"train_loss": -6.870757102966309, "global_step": 159081, "epoch": 3787} {"train_loss": -6.850582122802734, "global_step": 159082, "epoch": 3787} {"train_loss": -6.914772987365723, "global_step": 159083, "epoch": 3787} {"train_loss": -6.893112659454346, "global_step": 159084, "epoch": 3787} {"train_loss": -6.806006908416748, "global_step": 159085, "epoch": 3787} {"train_loss": -6.912035942077637, "global_step": 159086, "epoch": 3787} {"train_loss": -6.920970439910889, "global_step": 159087, "epoch": 3787} {"train_loss": -6.857497215270996, "global_step": 159088, "epoch": 3787} {"train_loss": -6.9231157302856445, "global_step": 159089, "epoch": 3787} {"train_loss": -6.961939811706543, "global_step": 159090, "epoch": 3787} {"train_loss": -6.905569076538086, "global_step": 159091, "epoch": 3787} {"train_loss": -6.995547294616699, "global_step": 159092, "epoch": 3787} {"train_loss": -6.966719627380371, "global_step": 159093, "epoch": 3787} {"train_loss": -6.9272308349609375, "global_step": 159094, "epoch": 3787} {"train_loss": -6.932329768226261, "global_step": 159095, "epoch": 3787, "val_loss": 79288.0546875} {"train_loss": -6.842354774475098, "global_step": 159096, "epoch": 3788} {"train_loss": -7.034585952758789, "global_step": 159097, "epoch": 3788} {"train_loss": -6.979466915130615, "global_step": 159098, "epoch": 3788} {"train_loss": -7.014473915100098, "global_step": 159099, "epoch": 3788} {"train_loss": -6.977590560913086, "global_step": 159100, "epoch": 3788} {"train_loss": -7.0480170249938965, "global_step": 159101, "epoch": 3788} {"train_loss": -6.882678031921387, "global_step": 159102, "epoch": 3788} {"train_loss": -6.938800811767578, "global_step": 159103, "epoch": 3788} {"train_loss": -6.9044904708862305, "global_step": 159104, "epoch": 3788} {"train_loss": -6.862307548522949, "global_step": 159105, "epoch": 3788} {"train_loss": -6.953500747680664, "global_step": 159106, "epoch": 3788} {"train_loss": -6.896244525909424, "global_step": 159107, "epoch": 3788} {"train_loss": -7.025393486022949, "global_step": 159108, "epoch": 3788} {"train_loss": -6.972921371459961, "global_step": 159109, "epoch": 3788} {"train_loss": -6.887337684631348, "global_step": 159110, "epoch": 3788} {"train_loss": -6.804045677185059, "global_step": 159111, "epoch": 3788} {"train_loss": -6.563551902770996, "global_step": 159112, "epoch": 3788} {"train_loss": -6.683438301086426, "global_step": 159113, "epoch": 3788} {"train_loss": -6.915170192718506, "global_step": 159114, "epoch": 3788} {"train_loss": -6.688943386077881, "global_step": 159115, "epoch": 3788} {"train_loss": -6.717671871185303, "global_step": 159116, "epoch": 3788} {"train_loss": -6.691995620727539, "global_step": 159117, "epoch": 3788} {"train_loss": -6.74531364440918, "global_step": 159118, "epoch": 3788} {"train_loss": -6.80939245223999, "global_step": 159119, "epoch": 3788} {"train_loss": -6.814474105834961, "global_step": 159120, "epoch": 3788} {"train_loss": -6.69924259185791, "global_step": 159121, "epoch": 3788} {"train_loss": -6.942868232727051, "global_step": 159122, "epoch": 3788} {"train_loss": -6.851409912109375, "global_step": 159123, "epoch": 3788} {"train_loss": -6.835984230041504, "global_step": 159124, "epoch": 3788} {"train_loss": -6.894622802734375, "global_step": 159125, "epoch": 3788} {"train_loss": -6.705362319946289, "global_step": 159126, "epoch": 3788} {"train_loss": -6.930232048034668, "global_step": 159127, "epoch": 3788} {"train_loss": -6.853911399841309, "global_step": 159128, "epoch": 3788} {"train_loss": -6.880200386047363, "global_step": 159129, "epoch": 3788} {"train_loss": -6.847333908081055, "global_step": 159130, "epoch": 3788} {"train_loss": -6.946538925170898, "global_step": 159131, "epoch": 3788} {"train_loss": -6.752109527587891, "global_step": 159132, "epoch": 3788} {"train_loss": -6.977089881896973, "global_step": 159133, "epoch": 3788} {"train_loss": -6.828464508056641, "global_step": 159134, "epoch": 3788} {"train_loss": -6.717679500579834, "global_step": 159135, "epoch": 3788} {"train_loss": -6.966333866119385, "global_step": 159136, "epoch": 3788} {"train_loss": -6.86026178087507, "global_step": 159137, "epoch": 3788, "val_loss": 79262.3671875} {"train_loss": -6.7213969230651855, "global_step": 159138, "epoch": 3789} {"train_loss": -6.961145877838135, "global_step": 159139, "epoch": 3789} {"train_loss": -6.9221696853637695, "global_step": 159140, "epoch": 3789} {"train_loss": -6.906054496765137, "global_step": 159141, "epoch": 3789} {"train_loss": -6.919852256774902, "global_step": 159142, "epoch": 3789} {"train_loss": -6.966639995574951, "global_step": 159143, "epoch": 3789} {"train_loss": -6.9319987297058105, "global_step": 159144, "epoch": 3789} {"train_loss": -6.903653621673584, "global_step": 159145, "epoch": 3789} {"train_loss": -6.90045166015625, "global_step": 159146, "epoch": 3789} {"train_loss": -6.70306921005249, "global_step": 159147, "epoch": 3789} {"train_loss": -6.903500080108643, "global_step": 159148, "epoch": 3789} {"train_loss": -6.941995143890381, "global_step": 159149, "epoch": 3789} {"train_loss": -6.879258155822754, "global_step": 159150, "epoch": 3789} {"train_loss": -6.994105815887451, "global_step": 159151, "epoch": 3789} {"train_loss": -6.793255805969238, "global_step": 159152, "epoch": 3789} {"train_loss": -6.9974365234375, "global_step": 159153, "epoch": 3789} {"train_loss": -6.894866943359375, "global_step": 159154, "epoch": 3789} {"train_loss": -6.817408561706543, "global_step": 159155, "epoch": 3789} {"train_loss": -6.899630069732666, "global_step": 159156, "epoch": 3789} {"train_loss": -6.963720321655273, "global_step": 159157, "epoch": 3789} {"train_loss": -6.985294818878174, "global_step": 159158, "epoch": 3789} {"train_loss": -6.842714309692383, "global_step": 159159, "epoch": 3789} {"train_loss": -7.000061511993408, "global_step": 159160, "epoch": 3789} {"train_loss": -6.982013702392578, "global_step": 159161, "epoch": 3789} {"train_loss": -7.009946823120117, "global_step": 159162, "epoch": 3789} {"train_loss": -6.952333927154541, "global_step": 159163, "epoch": 3789} {"train_loss": -6.9567975997924805, "global_step": 159164, "epoch": 3789} {"train_loss": -6.926496982574463, "global_step": 159165, "epoch": 3789} {"train_loss": -7.0378241539001465, "global_step": 159166, "epoch": 3789} {"train_loss": -6.968147277832031, "global_step": 159167, "epoch": 3789} {"train_loss": -7.010660648345947, "global_step": 159168, "epoch": 3789} {"train_loss": -7.112802982330322, "global_step": 159169, "epoch": 3789} {"train_loss": -6.985359191894531, "global_step": 159170, "epoch": 3789} {"train_loss": -6.993729591369629, "global_step": 159171, "epoch": 3789} {"train_loss": -6.995166778564453, "global_step": 159172, "epoch": 3789} {"train_loss": -7.042897701263428, "global_step": 159173, "epoch": 3789} {"train_loss": -6.9757537841796875, "global_step": 159174, "epoch": 3789} {"train_loss": -6.937048435211182, "global_step": 159175, "epoch": 3789} {"train_loss": -6.953530788421631, "global_step": 159176, "epoch": 3789} {"train_loss": -6.974276542663574, "global_step": 159177, "epoch": 3789} {"train_loss": -7.032426834106445, "global_step": 159178, "epoch": 3789} {"train_loss": -6.940429653440203, "global_step": 159179, "epoch": 3789, "val_loss": 79283.9375} {"train_loss": -6.977242469787598, "global_step": 159180, "epoch": 3790} {"train_loss": -6.9551286697387695, "global_step": 159181, "epoch": 3790} {"train_loss": -6.989505767822266, "global_step": 159182, "epoch": 3790} {"train_loss": -6.99623441696167, "global_step": 159183, "epoch": 3790} {"train_loss": -7.0353474617004395, "global_step": 159184, "epoch": 3790} {"train_loss": -6.868785858154297, "global_step": 159185, "epoch": 3790} {"train_loss": -6.990755081176758, "global_step": 159186, "epoch": 3790} {"train_loss": -7.12824821472168, "global_step": 159187, "epoch": 3790} {"train_loss": -6.881867408752441, "global_step": 159188, "epoch": 3790} {"train_loss": -6.954778671264648, "global_step": 159189, "epoch": 3790} {"train_loss": -6.857334613800049, "global_step": 159190, "epoch": 3790} {"train_loss": -6.912325859069824, "global_step": 159191, "epoch": 3790} {"train_loss": -6.966879367828369, "global_step": 159192, "epoch": 3790} {"train_loss": -6.99483585357666, "global_step": 159193, "epoch": 3790} {"train_loss": -6.964582443237305, "global_step": 159194, "epoch": 3790} {"train_loss": -6.918244361877441, "global_step": 159195, "epoch": 3790} {"train_loss": -7.02577018737793, "global_step": 159196, "epoch": 3790} {"train_loss": -7.019855499267578, "global_step": 159197, "epoch": 3790} {"train_loss": -6.930597305297852, "global_step": 159198, "epoch": 3790} {"train_loss": -6.979756832122803, "global_step": 159199, "epoch": 3790} {"train_loss": -6.878406524658203, "global_step": 159200, "epoch": 3790} {"train_loss": -7.069568157196045, "global_step": 159201, "epoch": 3790} {"train_loss": -6.9429931640625, "global_step": 159202, "epoch": 3790} {"train_loss": -6.9535231590271, "global_step": 159203, "epoch": 3790} {"train_loss": -6.886812210083008, "global_step": 159204, "epoch": 3790} {"train_loss": -6.827340602874756, "global_step": 159205, "epoch": 3790} {"train_loss": -6.93992805480957, "global_step": 159206, "epoch": 3790} {"train_loss": -6.910693168640137, "global_step": 159207, "epoch": 3790} {"train_loss": -6.993074417114258, "global_step": 159208, "epoch": 3790} {"train_loss": -7.01692008972168, "global_step": 159209, "epoch": 3790} {"train_loss": -7.012779712677002, "global_step": 159210, "epoch": 3790} {"train_loss": -6.903341770172119, "global_step": 159211, "epoch": 3790} {"train_loss": -6.892184257507324, "global_step": 159212, "epoch": 3790} {"train_loss": -6.9552507400512695, "global_step": 159213, "epoch": 3790} {"train_loss": -6.808465480804443, "global_step": 159214, "epoch": 3790} {"train_loss": -6.916089057922363, "global_step": 159215, "epoch": 3790} {"train_loss": -6.936159133911133, "global_step": 159216, "epoch": 3790} {"train_loss": -6.977304935455322, "global_step": 159217, "epoch": 3790} {"train_loss": -6.994152069091797, "global_step": 159218, "epoch": 3790} {"train_loss": -6.789831161499023, "global_step": 159219, "epoch": 3790} {"train_loss": -6.9200921058654785, "global_step": 159220, "epoch": 3790} {"train_loss": -6.947745186941964, "global_step": 159221, "epoch": 3790, "val_loss": 78834.109375} {"train_loss": -6.744513988494873, "global_step": 159222, "epoch": 3791} {"train_loss": -6.803422927856445, "global_step": 159223, "epoch": 3791} {"train_loss": -6.919281959533691, "global_step": 159224, "epoch": 3791} {"train_loss": -6.747211933135986, "global_step": 159225, "epoch": 3791} {"train_loss": -6.863344192504883, "global_step": 159226, "epoch": 3791} {"train_loss": -6.994599342346191, "global_step": 159227, "epoch": 3791} {"train_loss": -6.87413215637207, "global_step": 159228, "epoch": 3791} {"train_loss": -6.89137077331543, "global_step": 159229, "epoch": 3791} {"train_loss": -6.830434799194336, "global_step": 159230, "epoch": 3791} {"train_loss": -6.8971452713012695, "global_step": 159231, "epoch": 3791} {"train_loss": -6.914056777954102, "global_step": 159232, "epoch": 3791} {"train_loss": -6.867201805114746, "global_step": 159233, "epoch": 3791} {"train_loss": -6.944310188293457, "global_step": 159234, "epoch": 3791} {"train_loss": -7.020298480987549, "global_step": 159235, "epoch": 3791} {"train_loss": -6.934316635131836, "global_step": 159236, "epoch": 3791} {"train_loss": -6.8770833015441895, "global_step": 159237, "epoch": 3791} {"train_loss": -6.961302757263184, "global_step": 159238, "epoch": 3791} {"train_loss": -6.887283802032471, "global_step": 159239, "epoch": 3791} {"train_loss": -6.926997184753418, "global_step": 159240, "epoch": 3791} {"train_loss": -7.028278350830078, "global_step": 159241, "epoch": 3791} {"train_loss": -6.869438171386719, "global_step": 159242, "epoch": 3791} {"train_loss": -6.924827575683594, "global_step": 159243, "epoch": 3791} {"train_loss": -6.91097354888916, "global_step": 159244, "epoch": 3791} {"train_loss": -6.833327293395996, "global_step": 159245, "epoch": 3791} {"train_loss": -6.911983489990234, "global_step": 159246, "epoch": 3791} {"train_loss": -6.956186294555664, "global_step": 159247, "epoch": 3791} {"train_loss": -6.895944118499756, "global_step": 159248, "epoch": 3791} {"train_loss": -6.88292121887207, "global_step": 159249, "epoch": 3791} {"train_loss": -6.818775177001953, "global_step": 159250, "epoch": 3791} {"train_loss": -6.965051651000977, "global_step": 159251, "epoch": 3791} {"train_loss": -6.859089374542236, "global_step": 159252, "epoch": 3791} {"train_loss": -6.797399997711182, "global_step": 159253, "epoch": 3791} {"train_loss": -6.968135833740234, "global_step": 159254, "epoch": 3791} {"train_loss": -6.8338704109191895, "global_step": 159255, "epoch": 3791} {"train_loss": -6.917191505432129, "global_step": 159256, "epoch": 3791} {"train_loss": -6.910444736480713, "global_step": 159257, "epoch": 3791} {"train_loss": -6.8891119956970215, "global_step": 159258, "epoch": 3791} {"train_loss": -6.866977691650391, "global_step": 159259, "epoch": 3791} {"train_loss": -6.929346084594727, "global_step": 159260, "epoch": 3791} {"train_loss": -6.956811428070068, "global_step": 159261, "epoch": 3791} {"train_loss": -6.857345104217529, "global_step": 159262, "epoch": 3791} {"train_loss": -6.8945998918442495, "global_step": 159263, "epoch": 3791, "val_loss": 79551.90625} {"train_loss": -6.908068656921387, "global_step": 159264, "epoch": 3792} {"train_loss": -6.939600944519043, "global_step": 159265, "epoch": 3792} {"train_loss": -6.8910088539123535, "global_step": 159266, "epoch": 3792} {"train_loss": -6.968707084655762, "global_step": 159267, "epoch": 3792} {"train_loss": -6.933525562286377, "global_step": 159268, "epoch": 3792} {"train_loss": -6.940238952636719, "global_step": 159269, "epoch": 3792} {"train_loss": -6.92681360244751, "global_step": 159270, "epoch": 3792} {"train_loss": -6.957667350769043, "global_step": 159271, "epoch": 3792} {"train_loss": -6.9314374923706055, "global_step": 159272, "epoch": 3792} {"train_loss": -7.014759540557861, "global_step": 159273, "epoch": 3792} {"train_loss": -6.956841468811035, "global_step": 159274, "epoch": 3792} {"train_loss": -6.880084037780762, "global_step": 159275, "epoch": 3792} {"train_loss": -6.911502838134766, "global_step": 159276, "epoch": 3792} {"train_loss": -6.832515716552734, "global_step": 159277, "epoch": 3792} {"train_loss": -6.976565361022949, "global_step": 159278, "epoch": 3792} {"train_loss": -6.860177993774414, "global_step": 159279, "epoch": 3792} {"train_loss": -6.768787384033203, "global_step": 159280, "epoch": 3792} {"train_loss": -6.925737380981445, "global_step": 159281, "epoch": 3792} {"train_loss": -6.928025245666504, "global_step": 159282, "epoch": 3792} {"train_loss": -6.8503336906433105, "global_step": 159283, "epoch": 3792} {"train_loss": -6.940168380737305, "global_step": 159284, "epoch": 3792} {"train_loss": -6.91005277633667, "global_step": 159285, "epoch": 3792} {"train_loss": -6.956146240234375, "global_step": 159286, "epoch": 3792} {"train_loss": -6.906235694885254, "global_step": 159287, "epoch": 3792} {"train_loss": -6.835790157318115, "global_step": 159288, "epoch": 3792} {"train_loss": -6.978199481964111, "global_step": 159289, "epoch": 3792} {"train_loss": -6.906637191772461, "global_step": 159290, "epoch": 3792} {"train_loss": -6.850450038909912, "global_step": 159291, "epoch": 3792} {"train_loss": -6.960936546325684, "global_step": 159292, "epoch": 3792} {"train_loss": -6.980159759521484, "global_step": 159293, "epoch": 3792} {"train_loss": -6.788940906524658, "global_step": 159294, "epoch": 3792} {"train_loss": -6.939824104309082, "global_step": 159295, "epoch": 3792} {"train_loss": -6.940647125244141, "global_step": 159296, "epoch": 3792} {"train_loss": -6.923211097717285, "global_step": 159297, "epoch": 3792} {"train_loss": -6.906582832336426, "global_step": 159298, "epoch": 3792} {"train_loss": -6.911073684692383, "global_step": 159299, "epoch": 3792} {"train_loss": -6.994518756866455, "global_step": 159300, "epoch": 3792} {"train_loss": -6.977851867675781, "global_step": 159301, "epoch": 3792} {"train_loss": -6.919687271118164, "global_step": 159302, "epoch": 3792} {"train_loss": -6.951803684234619, "global_step": 159303, "epoch": 3792} {"train_loss": -6.970785140991211, "global_step": 159304, "epoch": 3792} {"train_loss": -6.923637662615095, "global_step": 159305, "epoch": 3792, "val_loss": 79382.21875} {"train_loss": -6.981436252593994, "global_step": 159306, "epoch": 3793} {"train_loss": -7.099414825439453, "global_step": 159307, "epoch": 3793} {"train_loss": -6.913372039794922, "global_step": 159308, "epoch": 3793} {"train_loss": -6.953145980834961, "global_step": 159309, "epoch": 3793} {"train_loss": -6.894927024841309, "global_step": 159310, "epoch": 3793} {"train_loss": -6.867396354675293, "global_step": 159311, "epoch": 3793} {"train_loss": -6.893497467041016, "global_step": 159312, "epoch": 3793} {"train_loss": -7.075418472290039, "global_step": 159313, "epoch": 3793} {"train_loss": -6.981781005859375, "global_step": 159314, "epoch": 3793} {"train_loss": -6.934467315673828, "global_step": 159315, "epoch": 3793} {"train_loss": -6.977859020233154, "global_step": 159316, "epoch": 3793} {"train_loss": -6.853065490722656, "global_step": 159317, "epoch": 3793} {"train_loss": -6.93125057220459, "global_step": 159318, "epoch": 3793} {"train_loss": -7.056118488311768, "global_step": 159319, "epoch": 3793} {"train_loss": -6.942083358764648, "global_step": 159320, "epoch": 3793} {"train_loss": -7.014678478240967, "global_step": 159321, "epoch": 3793} {"train_loss": -6.95311975479126, "global_step": 159322, "epoch": 3793} {"train_loss": -6.803658962249756, "global_step": 159323, "epoch": 3793} {"train_loss": -6.914085388183594, "global_step": 159324, "epoch": 3793} {"train_loss": -6.818171501159668, "global_step": 159325, "epoch": 3793} {"train_loss": -6.998431205749512, "global_step": 159326, "epoch": 3793} {"train_loss": -7.036648750305176, "global_step": 159327, "epoch": 3793} {"train_loss": -6.964452743530273, "global_step": 159328, "epoch": 3793} {"train_loss": -6.942967414855957, "global_step": 159329, "epoch": 3793} {"train_loss": -6.983598232269287, "global_step": 159330, "epoch": 3793} {"train_loss": -7.027153968811035, "global_step": 159331, "epoch": 3793} {"train_loss": -6.9319539070129395, "global_step": 159332, "epoch": 3793} {"train_loss": -6.85479736328125, "global_step": 159333, "epoch": 3793} {"train_loss": -7.006161689758301, "global_step": 159334, "epoch": 3793} {"train_loss": -6.952183723449707, "global_step": 159335, "epoch": 3793} {"train_loss": -7.054417610168457, "global_step": 159336, "epoch": 3793} {"train_loss": -6.993549346923828, "global_step": 159337, "epoch": 3793} {"train_loss": -6.85658597946167, "global_step": 159338, "epoch": 3793} {"train_loss": -6.9200639724731445, "global_step": 159339, "epoch": 3793} {"train_loss": -7.043473243713379, "global_step": 159340, "epoch": 3793} {"train_loss": -6.962350845336914, "global_step": 159341, "epoch": 3793} {"train_loss": -7.015157699584961, "global_step": 159342, "epoch": 3793} {"train_loss": -7.027969837188721, "global_step": 159343, "epoch": 3793} {"train_loss": -6.925656795501709, "global_step": 159344, "epoch": 3793} {"train_loss": -7.050987243652344, "global_step": 159345, "epoch": 3793} {"train_loss": -6.989388465881348, "global_step": 159346, "epoch": 3793} {"train_loss": -6.962142524265108, "global_step": 159347, "epoch": 3793, "val_loss": 79339.21875} {"train_loss": -7.116511344909668, "global_step": 159348, "epoch": 3794} {"train_loss": -7.0391845703125, "global_step": 159349, "epoch": 3794} {"train_loss": -6.9513092041015625, "global_step": 159350, "epoch": 3794} {"train_loss": -6.980088710784912, "global_step": 159351, "epoch": 3794} {"train_loss": -6.960355281829834, "global_step": 159352, "epoch": 3794} {"train_loss": -7.0298309326171875, "global_step": 159353, "epoch": 3794} {"train_loss": -6.898101806640625, "global_step": 159354, "epoch": 3794} {"train_loss": -7.115974426269531, "global_step": 159355, "epoch": 3794} {"train_loss": -7.0548200607299805, "global_step": 159356, "epoch": 3794} {"train_loss": -7.003057956695557, "global_step": 159357, "epoch": 3794} {"train_loss": -7.046202659606934, "global_step": 159358, "epoch": 3794} {"train_loss": -6.9775261878967285, "global_step": 159359, "epoch": 3794} {"train_loss": -6.897489547729492, "global_step": 159360, "epoch": 3794} {"train_loss": -6.963602542877197, "global_step": 159361, "epoch": 3794} {"train_loss": -6.951264381408691, "global_step": 159362, "epoch": 3794} {"train_loss": -6.762677192687988, "global_step": 159363, "epoch": 3794} {"train_loss": -6.959381580352783, "global_step": 159364, "epoch": 3794} {"train_loss": -7.024462699890137, "global_step": 159365, "epoch": 3794} {"train_loss": -6.845520496368408, "global_step": 159366, "epoch": 3794} {"train_loss": -6.950620651245117, "global_step": 159367, "epoch": 3794} {"train_loss": -6.950895309448242, "global_step": 159368, "epoch": 3794} {"train_loss": -6.943177223205566, "global_step": 159369, "epoch": 3794} {"train_loss": -6.862435340881348, "global_step": 159370, "epoch": 3794} {"train_loss": -6.81862735748291, "global_step": 159371, "epoch": 3794} {"train_loss": -6.919274806976318, "global_step": 159372, "epoch": 3794} {"train_loss": -6.855799198150635, "global_step": 159373, "epoch": 3794} {"train_loss": -6.83775520324707, "global_step": 159374, "epoch": 3794} {"train_loss": -6.852547645568848, "global_step": 159375, "epoch": 3794} {"train_loss": -6.811050891876221, "global_step": 159376, "epoch": 3794} {"train_loss": -6.946489334106445, "global_step": 159377, "epoch": 3794} {"train_loss": -6.93575382232666, "global_step": 159378, "epoch": 3794} {"train_loss": -6.908707618713379, "global_step": 159379, "epoch": 3794} {"train_loss": -6.863816738128662, "global_step": 159380, "epoch": 3794} {"train_loss": -6.96190071105957, "global_step": 159381, "epoch": 3794} {"train_loss": -6.892117500305176, "global_step": 159382, "epoch": 3794} {"train_loss": -6.959738731384277, "global_step": 159383, "epoch": 3794} {"train_loss": -6.891317367553711, "global_step": 159384, "epoch": 3794} {"train_loss": -6.868099689483643, "global_step": 159385, "epoch": 3794} {"train_loss": -6.875373840332031, "global_step": 159386, "epoch": 3794} {"train_loss": -6.76144552230835, "global_step": 159387, "epoch": 3794} {"train_loss": -7.015712738037109, "global_step": 159388, "epoch": 3794} {"train_loss": -6.92856054078965, "global_step": 159389, "epoch": 3794, "val_loss": 79318.390625} {"train_loss": -6.8195648193359375, "global_step": 159390, "epoch": 3795} {"train_loss": -6.870944976806641, "global_step": 159391, "epoch": 3795} {"train_loss": -6.911874771118164, "global_step": 159392, "epoch": 3795} {"train_loss": -6.945919990539551, "global_step": 159393, "epoch": 3795} {"train_loss": -6.942831993103027, "global_step": 159394, "epoch": 3795} {"train_loss": -6.896456718444824, "global_step": 159395, "epoch": 3795} {"train_loss": -6.973755836486816, "global_step": 159396, "epoch": 3795} {"train_loss": -6.831431865692139, "global_step": 159397, "epoch": 3795} {"train_loss": -6.947353363037109, "global_step": 159398, "epoch": 3795} {"train_loss": -6.908168315887451, "global_step": 159399, "epoch": 3795} {"train_loss": -6.8523969650268555, "global_step": 159400, "epoch": 3795} {"train_loss": -6.983438491821289, "global_step": 159401, "epoch": 3795} {"train_loss": -6.8431620597839355, "global_step": 159402, "epoch": 3795} {"train_loss": -7.042814254760742, "global_step": 159403, "epoch": 3795} {"train_loss": -6.99748420715332, "global_step": 159404, "epoch": 3795} {"train_loss": -6.906156539916992, "global_step": 159405, "epoch": 3795} {"train_loss": -7.056169509887695, "global_step": 159406, "epoch": 3795} {"train_loss": -6.958998680114746, "global_step": 159407, "epoch": 3795} {"train_loss": -7.066726207733154, "global_step": 159408, "epoch": 3795} {"train_loss": -6.883057594299316, "global_step": 159409, "epoch": 3795} {"train_loss": -7.032840251922607, "global_step": 159410, "epoch": 3795} {"train_loss": -6.8854851722717285, "global_step": 159411, "epoch": 3795} {"train_loss": -6.90342903137207, "global_step": 159412, "epoch": 3795} {"train_loss": -6.942577838897705, "global_step": 159413, "epoch": 3795} {"train_loss": -6.936959743499756, "global_step": 159414, "epoch": 3795} {"train_loss": -6.9528398513793945, "global_step": 159415, "epoch": 3795} {"train_loss": -7.033646106719971, "global_step": 159416, "epoch": 3795} {"train_loss": -6.9573564529418945, "global_step": 159417, "epoch": 3795} {"train_loss": -6.913591384887695, "global_step": 159418, "epoch": 3795} {"train_loss": -6.962395668029785, "global_step": 159419, "epoch": 3795} {"train_loss": -6.7870965003967285, "global_step": 159420, "epoch": 3795} {"train_loss": -7.07051944732666, "global_step": 159421, "epoch": 3795} {"train_loss": -6.936074733734131, "global_step": 159422, "epoch": 3795} {"train_loss": -6.612757205963135, "global_step": 159423, "epoch": 3795} {"train_loss": -6.802412986755371, "global_step": 159424, "epoch": 3795} {"train_loss": -6.852271556854248, "global_step": 159425, "epoch": 3795} {"train_loss": -6.883881568908691, "global_step": 159426, "epoch": 3795} {"train_loss": -6.972641944885254, "global_step": 159427, "epoch": 3795} {"train_loss": -6.884058475494385, "global_step": 159428, "epoch": 3795} {"train_loss": -6.82367467880249, "global_step": 159429, "epoch": 3795} {"train_loss": -6.790680885314941, "global_step": 159430, "epoch": 3795} {"train_loss": -6.912563448860531, "global_step": 159431, "epoch": 3795, "val_loss": 79414.71875} {"train_loss": -6.923325538635254, "global_step": 159432, "epoch": 3796} {"train_loss": -6.911463737487793, "global_step": 159433, "epoch": 3796} {"train_loss": -6.90875244140625, "global_step": 159434, "epoch": 3796} {"train_loss": -6.926260471343994, "global_step": 159435, "epoch": 3796} {"train_loss": -6.87863826751709, "global_step": 159436, "epoch": 3796} {"train_loss": -6.892031669616699, "global_step": 159437, "epoch": 3796} {"train_loss": -6.874386787414551, "global_step": 159438, "epoch": 3796} {"train_loss": -6.993128776550293, "global_step": 159439, "epoch": 3796} {"train_loss": -6.881753444671631, "global_step": 159440, "epoch": 3796} {"train_loss": -6.997932434082031, "global_step": 159441, "epoch": 3796} {"train_loss": -6.930944442749023, "global_step": 159442, "epoch": 3796} {"train_loss": -6.960883617401123, "global_step": 159443, "epoch": 3796} {"train_loss": -6.979355812072754, "global_step": 159444, "epoch": 3796} {"train_loss": -6.866025924682617, "global_step": 159445, "epoch": 3796} {"train_loss": -6.945921897888184, "global_step": 159446, "epoch": 3796} {"train_loss": -6.952291488647461, "global_step": 159447, "epoch": 3796} {"train_loss": -6.9719157218933105, "global_step": 159448, "epoch": 3796} {"train_loss": -6.9327073097229, "global_step": 159449, "epoch": 3796} {"train_loss": -6.886702537536621, "global_step": 159450, "epoch": 3796} {"train_loss": -7.05185604095459, "global_step": 159451, "epoch": 3796} {"train_loss": -6.918784141540527, "global_step": 159452, "epoch": 3796} {"train_loss": -6.964902400970459, "global_step": 159453, "epoch": 3796} {"train_loss": -6.921589374542236, "global_step": 159454, "epoch": 3796} {"train_loss": -6.889366149902344, "global_step": 159455, "epoch": 3796} {"train_loss": -6.978010177612305, "global_step": 159456, "epoch": 3796} {"train_loss": -6.934131622314453, "global_step": 159457, "epoch": 3796} {"train_loss": -6.888998508453369, "global_step": 159458, "epoch": 3796} {"train_loss": -6.961025714874268, "global_step": 159459, "epoch": 3796} {"train_loss": -6.901648044586182, "global_step": 159460, "epoch": 3796} {"train_loss": -6.894628524780273, "global_step": 159461, "epoch": 3796} {"train_loss": -7.0514349937438965, "global_step": 159462, "epoch": 3796} {"train_loss": -6.910787105560303, "global_step": 159463, "epoch": 3796} {"train_loss": -6.774600028991699, "global_step": 159464, "epoch": 3796} {"train_loss": -6.872262954711914, "global_step": 159465, "epoch": 3796} {"train_loss": -6.669158935546875, "global_step": 159466, "epoch": 3796} {"train_loss": -6.853353500366211, "global_step": 159467, "epoch": 3796} {"train_loss": -6.766964912414551, "global_step": 159468, "epoch": 3796} {"train_loss": -6.831989288330078, "global_step": 159469, "epoch": 3796} {"train_loss": -6.991977691650391, "global_step": 159470, "epoch": 3796} {"train_loss": -6.8188676834106445, "global_step": 159471, "epoch": 3796} {"train_loss": -6.884313583374023, "global_step": 159472, "epoch": 3796} {"train_loss": -6.910227026258196, "global_step": 159473, "epoch": 3796, "val_loss": 79233.9921875} {"train_loss": -6.897212982177734, "global_step": 159474, "epoch": 3797} {"train_loss": -6.88210916519165, "global_step": 159475, "epoch": 3797} {"train_loss": -6.89167594909668, "global_step": 159476, "epoch": 3797} {"train_loss": -6.98161506652832, "global_step": 159477, "epoch": 3797} {"train_loss": -6.853967666625977, "global_step": 159478, "epoch": 3797} {"train_loss": -6.8850860595703125, "global_step": 159479, "epoch": 3797} {"train_loss": -6.854711532592773, "global_step": 159480, "epoch": 3797} {"train_loss": -6.868464469909668, "global_step": 159481, "epoch": 3797} {"train_loss": -7.003908157348633, "global_step": 159482, "epoch": 3797} {"train_loss": -7.018154144287109, "global_step": 159483, "epoch": 3797} {"train_loss": -7.059321880340576, "global_step": 159484, "epoch": 3797} {"train_loss": -6.843502044677734, "global_step": 159485, "epoch": 3797} {"train_loss": -6.908450603485107, "global_step": 159486, "epoch": 3797} {"train_loss": -6.997523307800293, "global_step": 159487, "epoch": 3797} {"train_loss": -6.970461368560791, "global_step": 159488, "epoch": 3797} {"train_loss": -7.036188125610352, "global_step": 159489, "epoch": 3797} {"train_loss": -6.941255569458008, "global_step": 159490, "epoch": 3797} {"train_loss": -6.946910858154297, "global_step": 159491, "epoch": 3797} {"train_loss": -7.0183491706848145, "global_step": 159492, "epoch": 3797} {"train_loss": -7.0725226402282715, "global_step": 159493, "epoch": 3797} {"train_loss": -6.96134090423584, "global_step": 159494, "epoch": 3797} {"train_loss": -6.925365447998047, "global_step": 159495, "epoch": 3797} {"train_loss": -6.937860012054443, "global_step": 159496, "epoch": 3797} {"train_loss": -6.997339248657227, "global_step": 159497, "epoch": 3797} {"train_loss": -6.872723579406738, "global_step": 159498, "epoch": 3797} {"train_loss": -6.916584014892578, "global_step": 159499, "epoch": 3797} {"train_loss": -6.82144832611084, "global_step": 159500, "epoch": 3797} {"train_loss": -6.903067588806152, "global_step": 159501, "epoch": 3797} {"train_loss": -6.938738822937012, "global_step": 159502, "epoch": 3797} {"train_loss": -6.817973613739014, "global_step": 159503, "epoch": 3797} {"train_loss": -7.015935897827148, "global_step": 159504, "epoch": 3797} {"train_loss": -6.960781097412109, "global_step": 159505, "epoch": 3797} {"train_loss": -6.876068592071533, "global_step": 159506, "epoch": 3797} {"train_loss": -6.95298957824707, "global_step": 159507, "epoch": 3797} {"train_loss": -7.088583946228027, "global_step": 159508, "epoch": 3797} {"train_loss": -6.920590877532959, "global_step": 159509, "epoch": 3797} {"train_loss": -7.0111823081970215, "global_step": 159510, "epoch": 3797} {"train_loss": -6.997786045074463, "global_step": 159511, "epoch": 3797} {"train_loss": -7.017261505126953, "global_step": 159512, "epoch": 3797} {"train_loss": -6.939878463745117, "global_step": 159513, "epoch": 3797} {"train_loss": -6.80621337890625, "global_step": 159514, "epoch": 3797} {"train_loss": -6.942942687443325, "global_step": 159515, "epoch": 3797, "val_loss": 79565.6484375} {"train_loss": -6.926224708557129, "global_step": 159516, "epoch": 3798} {"train_loss": -6.935521125793457, "global_step": 159517, "epoch": 3798} {"train_loss": -6.964796543121338, "global_step": 159518, "epoch": 3798} {"train_loss": -7.0504913330078125, "global_step": 159519, "epoch": 3798} {"train_loss": -6.937513828277588, "global_step": 159520, "epoch": 3798} {"train_loss": -6.967800140380859, "global_step": 159521, "epoch": 3798} {"train_loss": -6.984394073486328, "global_step": 159522, "epoch": 3798} {"train_loss": -6.955120086669922, "global_step": 159523, "epoch": 3798} {"train_loss": -6.988149642944336, "global_step": 159524, "epoch": 3798} {"train_loss": -6.914514064788818, "global_step": 159525, "epoch": 3798} {"train_loss": -6.874266147613525, "global_step": 159526, "epoch": 3798} {"train_loss": -7.102628707885742, "global_step": 159527, "epoch": 3798} {"train_loss": -6.857731819152832, "global_step": 159528, "epoch": 3798} {"train_loss": -6.966915607452393, "global_step": 159529, "epoch": 3798} {"train_loss": -6.974906921386719, "global_step": 159530, "epoch": 3798} {"train_loss": -7.011849403381348, "global_step": 159531, "epoch": 3798} {"train_loss": -6.87952995300293, "global_step": 159532, "epoch": 3798} {"train_loss": -6.990045547485352, "global_step": 159533, "epoch": 3798} {"train_loss": -6.971756458282471, "global_step": 159534, "epoch": 3798} {"train_loss": -7.005423069000244, "global_step": 159535, "epoch": 3798} {"train_loss": -6.983826637268066, "global_step": 159536, "epoch": 3798} {"train_loss": -6.8953728675842285, "global_step": 159537, "epoch": 3798} {"train_loss": -6.991790771484375, "global_step": 159538, "epoch": 3798} {"train_loss": -6.969888687133789, "global_step": 159539, "epoch": 3798} {"train_loss": -6.977179527282715, "global_step": 159540, "epoch": 3798} {"train_loss": -6.980738639831543, "global_step": 159541, "epoch": 3798} {"train_loss": -6.956956386566162, "global_step": 159542, "epoch": 3798} {"train_loss": -6.943523406982422, "global_step": 159543, "epoch": 3798} {"train_loss": -7.029250144958496, "global_step": 159544, "epoch": 3798} {"train_loss": -6.773420333862305, "global_step": 159545, "epoch": 3798} {"train_loss": -6.9229960441589355, "global_step": 159546, "epoch": 3798} {"train_loss": -6.85036563873291, "global_step": 159547, "epoch": 3798} {"train_loss": -6.877994537353516, "global_step": 159548, "epoch": 3798} {"train_loss": -6.945488929748535, "global_step": 159549, "epoch": 3798} {"train_loss": -6.887103080749512, "global_step": 159550, "epoch": 3798} {"train_loss": -6.9887495040893555, "global_step": 159551, "epoch": 3798} {"train_loss": -7.013124942779541, "global_step": 159552, "epoch": 3798} {"train_loss": -7.015552520751953, "global_step": 159553, "epoch": 3798} {"train_loss": -6.9799981117248535, "global_step": 159554, "epoch": 3798} {"train_loss": -6.830313205718994, "global_step": 159555, "epoch": 3798} {"train_loss": -6.842437744140625, "global_step": 159556, "epoch": 3798} {"train_loss": -6.949909891401019, "global_step": 159557, "epoch": 3798, "val_loss": 79248.9375} {"train_loss": -6.981402397155762, "global_step": 159558, "epoch": 3799} {"train_loss": -6.9570817947387695, "global_step": 159559, "epoch": 3799} {"train_loss": -7.049871444702148, "global_step": 159560, "epoch": 3799} {"train_loss": -6.919882297515869, "global_step": 159561, "epoch": 3799} {"train_loss": -6.9853057861328125, "global_step": 159562, "epoch": 3799} {"train_loss": -6.980116844177246, "global_step": 159563, "epoch": 3799} {"train_loss": -6.9120378494262695, "global_step": 159564, "epoch": 3799} {"train_loss": -6.932619094848633, "global_step": 159565, "epoch": 3799} {"train_loss": -6.976200103759766, "global_step": 159566, "epoch": 3799} {"train_loss": -6.903324604034424, "global_step": 159567, "epoch": 3799} {"train_loss": -6.94080924987793, "global_step": 159568, "epoch": 3799} {"train_loss": -6.987162113189697, "global_step": 159569, "epoch": 3799} {"train_loss": -6.884621620178223, "global_step": 159570, "epoch": 3799} {"train_loss": -6.873263359069824, "global_step": 159571, "epoch": 3799} {"train_loss": -6.820572853088379, "global_step": 159572, "epoch": 3799} {"train_loss": -6.957271575927734, "global_step": 159573, "epoch": 3799} {"train_loss": -6.928014755249023, "global_step": 159574, "epoch": 3799} {"train_loss": -6.966300964355469, "global_step": 159575, "epoch": 3799} {"train_loss": -6.936661720275879, "global_step": 159576, "epoch": 3799} {"train_loss": -6.922483444213867, "global_step": 159577, "epoch": 3799} {"train_loss": -6.912925720214844, "global_step": 159578, "epoch": 3799} {"train_loss": -6.968341827392578, "global_step": 159579, "epoch": 3799} {"train_loss": -6.879192352294922, "global_step": 159580, "epoch": 3799} {"train_loss": -6.9315185546875, "global_step": 159581, "epoch": 3799} {"train_loss": -6.925081253051758, "global_step": 159582, "epoch": 3799} {"train_loss": -7.014120101928711, "global_step": 159583, "epoch": 3799} {"train_loss": -7.0265913009643555, "global_step": 159584, "epoch": 3799} {"train_loss": -7.002435684204102, "global_step": 159585, "epoch": 3799} {"train_loss": -6.956769943237305, "global_step": 159586, "epoch": 3799} {"train_loss": -6.958442687988281, "global_step": 159587, "epoch": 3799} {"train_loss": -6.973933219909668, "global_step": 159588, "epoch": 3799} {"train_loss": -6.919150352478027, "global_step": 159589, "epoch": 3799} {"train_loss": -6.896631240844727, "global_step": 159590, "epoch": 3799} {"train_loss": -6.923938751220703, "global_step": 159591, "epoch": 3799} {"train_loss": -6.921772003173828, "global_step": 159592, "epoch": 3799} {"train_loss": -7.005890369415283, "global_step": 159593, "epoch": 3799} {"train_loss": -6.915614128112793, "global_step": 159594, "epoch": 3799} {"train_loss": -6.986830711364746, "global_step": 159595, "epoch": 3799} {"train_loss": -6.998663902282715, "global_step": 159596, "epoch": 3799} {"train_loss": -6.957571029663086, "global_step": 159597, "epoch": 3799} {"train_loss": -6.842286109924316, "global_step": 159598, "epoch": 3799} {"train_loss": -6.943684736887614, "global_step": 159599, "epoch": 3799, "val_loss": 79182.03125} {"train_loss": -6.86923885345459, "global_step": 159600, "epoch": 3800} {"train_loss": -6.778652667999268, "global_step": 159601, "epoch": 3800} {"train_loss": -6.876367568969727, "global_step": 159602, "epoch": 3800} {"train_loss": -6.9620842933654785, "global_step": 159603, "epoch": 3800} {"train_loss": -6.8551788330078125, "global_step": 159604, "epoch": 3800} {"train_loss": -6.87331485748291, "global_step": 159605, "epoch": 3800} {"train_loss": -6.764681816101074, "global_step": 159606, "epoch": 3800} {"train_loss": -6.875423908233643, "global_step": 159607, "epoch": 3800} {"train_loss": -7.033817291259766, "global_step": 159608, "epoch": 3800} {"train_loss": -6.974580764770508, "global_step": 159609, "epoch": 3800} {"train_loss": -6.844820022583008, "global_step": 159610, "epoch": 3800} {"train_loss": -6.916049957275391, "global_step": 159611, "epoch": 3800} {"train_loss": -6.865351676940918, "global_step": 159612, "epoch": 3800} {"train_loss": -6.987337112426758, "global_step": 159613, "epoch": 3800} {"train_loss": -6.982132434844971, "global_step": 159614, "epoch": 3800} {"train_loss": -6.778654098510742, "global_step": 159615, "epoch": 3800} {"train_loss": -6.837894916534424, "global_step": 159616, "epoch": 3800} {"train_loss": -6.889370918273926, "global_step": 159617, "epoch": 3800} {"train_loss": -6.807547569274902, "global_step": 159618, "epoch": 3800} {"train_loss": -6.812183856964111, "global_step": 159619, "epoch": 3800} {"train_loss": -6.909162521362305, "global_step": 159620, "epoch": 3800} {"train_loss": -6.878775596618652, "global_step": 159621, "epoch": 3800} {"train_loss": -6.920088291168213, "global_step": 159622, "epoch": 3800} {"train_loss": -7.013045787811279, "global_step": 159623, "epoch": 3800} {"train_loss": -6.927506446838379, "global_step": 159624, "epoch": 3800} {"train_loss": -6.9150543212890625, "global_step": 159625, "epoch": 3800} {"train_loss": -6.88122034072876, "global_step": 159626, "epoch": 3800} {"train_loss": -6.79266357421875, "global_step": 159627, "epoch": 3800} {"train_loss": -6.8864665031433105, "global_step": 159628, "epoch": 3800} {"train_loss": -6.951079368591309, "global_step": 159629, "epoch": 3800} {"train_loss": -6.865427494049072, "global_step": 159630, "epoch": 3800} {"train_loss": -7.011581897735596, "global_step": 159631, "epoch": 3800} {"train_loss": -6.972362518310547, "global_step": 159632, "epoch": 3800} {"train_loss": -6.935441017150879, "global_step": 159633, "epoch": 3800} {"train_loss": -6.883875846862793, "global_step": 159634, "epoch": 3800} {"train_loss": -7.000434875488281, "global_step": 159635, "epoch": 3800} {"train_loss": -6.886335849761963, "global_step": 159636, "epoch": 3800} {"train_loss": -7.019546031951904, "global_step": 159637, "epoch": 3800} {"train_loss": -6.990774154663086, "global_step": 159638, "epoch": 3800} {"train_loss": -6.936624050140381, "global_step": 159639, "epoch": 3800} {"train_loss": -6.921602725982666, "global_step": 159640, "epoch": 3800} {"train_loss": -6.903616803033011, "global_step": 159641, "epoch": 3800, "train/sim_max_reward_0": 0.19534120869181754, "train/sim_max_reward_1": 0.9045295855875659, "train/sim_max_reward_2": 0.3854225715423504, "train/sim_max_reward_3": 0.15547932846030388, "train/sim_max_reward_4": 0.29798140715827925, "train/sim_max_reward_5": 0.9973698047903884, "test/sim_max_reward_4500000": 0.9206887842287794, "test/sim_max_reward_4500001": 0.9842924258858563, "test/sim_max_reward_4500002": 0.9583339465605498, "test/sim_max_reward_4500003": 0.9554551792433459, "test/sim_max_reward_4500004": 0.11790108553853296, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 0.865197943366603, "test/sim_max_reward_4500007": 0.9793254554299566, "test/sim_max_reward_4500008": 0.019765620363342944, "test/sim_max_reward_4500009": 0.05341364021203863, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.5350365099759505, "test/sim_max_reward_4500012": 0.5701270898887443, "test/sim_max_reward_4500013": 0.008435462241949923, "test/sim_max_reward_4500014": 0.8984466199379397, "test/sim_max_reward_4500015": 0.9624217811279391, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0874709148434452, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.9887935003697983, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9854017303999957, "test/sim_max_reward_4500022": 0.9745091984684029, "test/sim_max_reward_4500023": 0.674118601613486, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9433179923259883, "test/sim_max_reward_4500026": 0.913181725567623, "test/sim_max_reward_4500027": 0.9588192371118919, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.0455110263472825, "test/sim_max_reward_4500030": 0.9990926874172038, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04657564472436191, "test/sim_max_reward_4500033": 1.0, "test/sim_max_reward_4500034": 0.9439353292354581, "test/sim_max_reward_4500035": 0.9819572348920739, "test/sim_max_reward_4500036": 0.41559203469666556, "test/sim_max_reward_4500037": 0.9998590105385646, "test/sim_max_reward_4500038": 0.9621170366631192, "test/sim_max_reward_4500039": 0.9795016936907436, "test/sim_max_reward_4500040": 0.9613233030170697, "test/sim_max_reward_4500041": 0.7803371914456508, "test/sim_max_reward_4500042": 0.007061909733813467, "test/sim_max_reward_4500043": 0.9997955911453713, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.39325888992275954, "test/sim_max_reward_4500046": 0.22929347620977067, "test/sim_max_reward_4500047": 0.9015185065922066, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.48935398437178423, "test/mean_score": 0.5845869255385124, "val_loss": 79774.9375} {"train_loss": -6.830767631530762, "global_step": 159642, "epoch": 3801} {"train_loss": -6.911953926086426, "global_step": 159643, "epoch": 3801} {"train_loss": -6.948252201080322, "global_step": 159644, "epoch": 3801} {"train_loss": -6.923084735870361, "global_step": 159645, "epoch": 3801} {"train_loss": -6.8560791015625, "global_step": 159646, "epoch": 3801} {"train_loss": -6.963732719421387, "global_step": 159647, "epoch": 3801} {"train_loss": -6.874278545379639, "global_step": 159648, "epoch": 3801} {"train_loss": -7.000141620635986, "global_step": 159649, "epoch": 3801} {"train_loss": -6.968867301940918, "global_step": 159650, "epoch": 3801} {"train_loss": -6.97579288482666, "global_step": 159651, "epoch": 3801} {"train_loss": -6.949115753173828, "global_step": 159652, "epoch": 3801} {"train_loss": -7.0348920822143555, "global_step": 159653, "epoch": 3801} {"train_loss": -6.9405059814453125, "global_step": 159654, "epoch": 3801} {"train_loss": -7.06295108795166, "global_step": 159655, "epoch": 3801} {"train_loss": -6.923277854919434, "global_step": 159656, "epoch": 3801} {"train_loss": -7.0164289474487305, "global_step": 159657, "epoch": 3801} {"train_loss": -7.041550636291504, "global_step": 159658, "epoch": 3801} {"train_loss": -7.0275068283081055, "global_step": 159659, "epoch": 3801} {"train_loss": -6.902863502502441, "global_step": 159660, "epoch": 3801} {"train_loss": -7.046666145324707, "global_step": 159661, "epoch": 3801} {"train_loss": -6.895301342010498, "global_step": 159662, "epoch": 3801} {"train_loss": -6.8973283767700195, "global_step": 159663, "epoch": 3801} {"train_loss": -7.0528411865234375, "global_step": 159664, "epoch": 3801} {"train_loss": -6.942996501922607, "global_step": 159665, "epoch": 3801} {"train_loss": -6.8902363777160645, "global_step": 159666, "epoch": 3801} {"train_loss": -6.853207588195801, "global_step": 159667, "epoch": 3801} {"train_loss": -6.92227840423584, "global_step": 159668, "epoch": 3801} {"train_loss": -6.95944356918335, "global_step": 159669, "epoch": 3801} {"train_loss": -7.046868324279785, "global_step": 159670, "epoch": 3801} {"train_loss": -7.0495524406433105, "global_step": 159671, "epoch": 3801} {"train_loss": -6.90668249130249, "global_step": 159672, "epoch": 3801} {"train_loss": -6.958852291107178, "global_step": 159673, "epoch": 3801} {"train_loss": -6.913233757019043, "global_step": 159674, "epoch": 3801} {"train_loss": -7.038056373596191, "global_step": 159675, "epoch": 3801} {"train_loss": -6.958919525146484, "global_step": 159676, "epoch": 3801} {"train_loss": -6.996947765350342, "global_step": 159677, "epoch": 3801} {"train_loss": -6.961438179016113, "global_step": 159678, "epoch": 3801} {"train_loss": -6.933969497680664, "global_step": 159679, "epoch": 3801} {"train_loss": -6.9772210121154785, "global_step": 159680, "epoch": 3801} {"train_loss": -6.835379123687744, "global_step": 159681, "epoch": 3801} {"train_loss": -6.9334001541137695, "global_step": 159682, "epoch": 3801} {"train_loss": -6.952322959899902, "global_step": 159683, "epoch": 3801, "val_loss": 79482.3125} {"train_loss": -6.9527692794799805, "global_step": 159684, "epoch": 3802} {"train_loss": -7.073426246643066, "global_step": 159685, "epoch": 3802} {"train_loss": -6.910831451416016, "global_step": 159686, "epoch": 3802} {"train_loss": -6.881947040557861, "global_step": 159687, "epoch": 3802} {"train_loss": -6.96645450592041, "global_step": 159688, "epoch": 3802} {"train_loss": -6.876689434051514, "global_step": 159689, "epoch": 3802} {"train_loss": -6.952876091003418, "global_step": 159690, "epoch": 3802} {"train_loss": -7.067761421203613, "global_step": 159691, "epoch": 3802} {"train_loss": -6.97976016998291, "global_step": 159692, "epoch": 3802} {"train_loss": -6.899315357208252, "global_step": 159693, "epoch": 3802} {"train_loss": -6.9369330406188965, "global_step": 159694, "epoch": 3802} {"train_loss": -6.9506120681762695, "global_step": 159695, "epoch": 3802} {"train_loss": -6.956315517425537, "global_step": 159696, "epoch": 3802} {"train_loss": -7.024247169494629, "global_step": 159697, "epoch": 3802} {"train_loss": -6.91300630569458, "global_step": 159698, "epoch": 3802} {"train_loss": -7.01832389831543, "global_step": 159699, "epoch": 3802} {"train_loss": -6.968626022338867, "global_step": 159700, "epoch": 3802} {"train_loss": -6.88731575012207, "global_step": 159701, "epoch": 3802} {"train_loss": -6.879078388214111, "global_step": 159702, "epoch": 3802} {"train_loss": -6.989212989807129, "global_step": 159703, "epoch": 3802} {"train_loss": -7.036632537841797, "global_step": 159704, "epoch": 3802} {"train_loss": -6.901968955993652, "global_step": 159705, "epoch": 3802} {"train_loss": -7.107680320739746, "global_step": 159706, "epoch": 3802} {"train_loss": -7.050631523132324, "global_step": 159707, "epoch": 3802} {"train_loss": -6.92683219909668, "global_step": 159708, "epoch": 3802} {"train_loss": -6.9597063064575195, "global_step": 159709, "epoch": 3802} {"train_loss": -6.899479866027832, "global_step": 159710, "epoch": 3802} {"train_loss": -6.994791030883789, "global_step": 159711, "epoch": 3802} {"train_loss": -6.982297897338867, "global_step": 159712, "epoch": 3802} {"train_loss": -6.891360759735107, "global_step": 159713, "epoch": 3802} {"train_loss": -6.83018684387207, "global_step": 159714, "epoch": 3802} {"train_loss": -6.828037261962891, "global_step": 159715, "epoch": 3802} {"train_loss": -6.892031669616699, "global_step": 159716, "epoch": 3802} {"train_loss": -6.749934196472168, "global_step": 159717, "epoch": 3802} {"train_loss": -6.710538864135742, "global_step": 159718, "epoch": 3802} {"train_loss": -6.945284366607666, "global_step": 159719, "epoch": 3802} {"train_loss": -6.7701873779296875, "global_step": 159720, "epoch": 3802} {"train_loss": -6.8011250495910645, "global_step": 159721, "epoch": 3802} {"train_loss": -6.784889221191406, "global_step": 159722, "epoch": 3802} {"train_loss": -6.786336421966553, "global_step": 159723, "epoch": 3802} {"train_loss": -6.650774955749512, "global_step": 159724, "epoch": 3802} {"train_loss": -6.913733709426153, "global_step": 159725, "epoch": 3802, "val_loss": 79413.125} {"train_loss": -6.833187580108643, "global_step": 159726, "epoch": 3803} {"train_loss": -6.771223068237305, "global_step": 159727, "epoch": 3803} {"train_loss": -6.771231651306152, "global_step": 159728, "epoch": 3803} {"train_loss": -6.653432846069336, "global_step": 159729, "epoch": 3803} {"train_loss": -6.835355281829834, "global_step": 159730, "epoch": 3803} {"train_loss": -6.786132335662842, "global_step": 159731, "epoch": 3803} {"train_loss": -6.721903324127197, "global_step": 159732, "epoch": 3803} {"train_loss": -6.888308048248291, "global_step": 159733, "epoch": 3803} {"train_loss": -6.710657119750977, "global_step": 159734, "epoch": 3803} {"train_loss": -6.808945655822754, "global_step": 159735, "epoch": 3803} {"train_loss": -6.728329658508301, "global_step": 159736, "epoch": 3803} {"train_loss": -6.910667419433594, "global_step": 159737, "epoch": 3803} {"train_loss": -6.861618995666504, "global_step": 159738, "epoch": 3803} {"train_loss": -6.911635398864746, "global_step": 159739, "epoch": 3803} {"train_loss": -6.846926212310791, "global_step": 159740, "epoch": 3803} {"train_loss": -6.858781337738037, "global_step": 159741, "epoch": 3803} {"train_loss": -6.830108642578125, "global_step": 159742, "epoch": 3803} {"train_loss": -6.876972675323486, "global_step": 159743, "epoch": 3803} {"train_loss": -6.881269454956055, "global_step": 159744, "epoch": 3803} {"train_loss": -6.9051971435546875, "global_step": 159745, "epoch": 3803} {"train_loss": -6.960805892944336, "global_step": 159746, "epoch": 3803} {"train_loss": -7.011188507080078, "global_step": 159747, "epoch": 3803} {"train_loss": -6.955295562744141, "global_step": 159748, "epoch": 3803} {"train_loss": -6.994037628173828, "global_step": 159749, "epoch": 3803} {"train_loss": -6.9188642501831055, "global_step": 159750, "epoch": 3803} {"train_loss": -6.874789237976074, "global_step": 159751, "epoch": 3803} {"train_loss": -6.998038291931152, "global_step": 159752, "epoch": 3803} {"train_loss": -6.878461837768555, "global_step": 159753, "epoch": 3803} {"train_loss": -7.009990692138672, "global_step": 159754, "epoch": 3803} {"train_loss": -7.019339561462402, "global_step": 159755, "epoch": 3803} {"train_loss": -6.975161075592041, "global_step": 159756, "epoch": 3803} {"train_loss": -7.008609294891357, "global_step": 159757, "epoch": 3803} {"train_loss": -7.010534286499023, "global_step": 159758, "epoch": 3803} {"train_loss": -7.160987854003906, "global_step": 159759, "epoch": 3803} {"train_loss": -6.898888111114502, "global_step": 159760, "epoch": 3803} {"train_loss": -7.00771427154541, "global_step": 159761, "epoch": 3803} {"train_loss": -6.991306304931641, "global_step": 159762, "epoch": 3803} {"train_loss": -6.827506065368652, "global_step": 159763, "epoch": 3803} {"train_loss": -6.993956565856934, "global_step": 159764, "epoch": 3803} {"train_loss": -7.157944679260254, "global_step": 159765, "epoch": 3803} {"train_loss": -6.868720054626465, "global_step": 159766, "epoch": 3803} {"train_loss": -6.900267623719715, "global_step": 159767, "epoch": 3803, "val_loss": 79307.375} {"train_loss": -7.107278823852539, "global_step": 159768, "epoch": 3804} {"train_loss": -7.055990219116211, "global_step": 159769, "epoch": 3804} {"train_loss": -7.0557861328125, "global_step": 159770, "epoch": 3804} {"train_loss": -6.938170433044434, "global_step": 159771, "epoch": 3804} {"train_loss": -7.058561325073242, "global_step": 159772, "epoch": 3804} {"train_loss": -7.025046348571777, "global_step": 159773, "epoch": 3804} {"train_loss": -6.930414199829102, "global_step": 159774, "epoch": 3804} {"train_loss": -6.975761413574219, "global_step": 159775, "epoch": 3804} {"train_loss": -6.947428226470947, "global_step": 159776, "epoch": 3804} {"train_loss": -7.072974681854248, "global_step": 159777, "epoch": 3804} {"train_loss": -7.024955749511719, "global_step": 159778, "epoch": 3804} {"train_loss": -7.008705139160156, "global_step": 159779, "epoch": 3804} {"train_loss": -7.058150291442871, "global_step": 159780, "epoch": 3804} {"train_loss": -6.941633224487305, "global_step": 159781, "epoch": 3804} {"train_loss": -6.9756340980529785, "global_step": 159782, "epoch": 3804} {"train_loss": -7.076818466186523, "global_step": 159783, "epoch": 3804} {"train_loss": -7.001089572906494, "global_step": 159784, "epoch": 3804} {"train_loss": -7.005228042602539, "global_step": 159785, "epoch": 3804} {"train_loss": -7.1298017501831055, "global_step": 159786, "epoch": 3804} {"train_loss": -7.099890232086182, "global_step": 159787, "epoch": 3804} {"train_loss": -6.993747711181641, "global_step": 159788, "epoch": 3804} {"train_loss": -7.021381378173828, "global_step": 159789, "epoch": 3804} {"train_loss": -6.936797142028809, "global_step": 159790, "epoch": 3804} {"train_loss": -6.933904647827148, "global_step": 159791, "epoch": 3804} {"train_loss": -7.018910884857178, "global_step": 159792, "epoch": 3804} {"train_loss": -6.998284339904785, "global_step": 159793, "epoch": 3804} {"train_loss": -6.9893999099731445, "global_step": 159794, "epoch": 3804} {"train_loss": -7.019888877868652, "global_step": 159795, "epoch": 3804} {"train_loss": -6.962369441986084, "global_step": 159796, "epoch": 3804} {"train_loss": -6.901839256286621, "global_step": 159797, "epoch": 3804} {"train_loss": -6.993588924407959, "global_step": 159798, "epoch": 3804} {"train_loss": -6.898434638977051, "global_step": 159799, "epoch": 3804} {"train_loss": -6.932496070861816, "global_step": 159800, "epoch": 3804} {"train_loss": -6.897339344024658, "global_step": 159801, "epoch": 3804} {"train_loss": -7.064109802246094, "global_step": 159802, "epoch": 3804} {"train_loss": -6.884608268737793, "global_step": 159803, "epoch": 3804} {"train_loss": -6.933964729309082, "global_step": 159804, "epoch": 3804} {"train_loss": -6.954195976257324, "global_step": 159805, "epoch": 3804} {"train_loss": -6.9593729972839355, "global_step": 159806, "epoch": 3804} {"train_loss": -6.993358612060547, "global_step": 159807, "epoch": 3804} {"train_loss": -6.983422756195068, "global_step": 159808, "epoch": 3804} {"train_loss": -6.992148036048526, "global_step": 159809, "epoch": 3804, "val_loss": 79027.875} {"train_loss": -6.861313343048096, "global_step": 159810, "epoch": 3805} {"train_loss": -6.8976850509643555, "global_step": 159811, "epoch": 3805} {"train_loss": -6.915475845336914, "global_step": 159812, "epoch": 3805} {"train_loss": -6.887701988220215, "global_step": 159813, "epoch": 3805} {"train_loss": -6.998110771179199, "global_step": 159814, "epoch": 3805} {"train_loss": -6.954958915710449, "global_step": 159815, "epoch": 3805} {"train_loss": -6.940564155578613, "global_step": 159816, "epoch": 3805} {"train_loss": -7.061169624328613, "global_step": 159817, "epoch": 3805} {"train_loss": -6.890488147735596, "global_step": 159818, "epoch": 3805} {"train_loss": -7.002754211425781, "global_step": 159819, "epoch": 3805} {"train_loss": -7.025051116943359, "global_step": 159820, "epoch": 3805} {"train_loss": -6.94363260269165, "global_step": 159821, "epoch": 3805} {"train_loss": -6.849628448486328, "global_step": 159822, "epoch": 3805} {"train_loss": -6.892439842224121, "global_step": 159823, "epoch": 3805} {"train_loss": -6.923051834106445, "global_step": 159824, "epoch": 3805} {"train_loss": -6.99784517288208, "global_step": 159825, "epoch": 3805} {"train_loss": -6.870114803314209, "global_step": 159826, "epoch": 3805} {"train_loss": -6.886233329772949, "global_step": 159827, "epoch": 3805} {"train_loss": -6.8654327392578125, "global_step": 159828, "epoch": 3805} {"train_loss": -7.053642272949219, "global_step": 159829, "epoch": 3805} {"train_loss": -6.88740348815918, "global_step": 159830, "epoch": 3805} {"train_loss": -6.875370979309082, "global_step": 159831, "epoch": 3805} {"train_loss": -7.09523868560791, "global_step": 159832, "epoch": 3805} {"train_loss": -7.012028694152832, "global_step": 159833, "epoch": 3805} {"train_loss": -6.888949394226074, "global_step": 159834, "epoch": 3805} {"train_loss": -6.98356819152832, "global_step": 159835, "epoch": 3805} {"train_loss": -6.967324256896973, "global_step": 159836, "epoch": 3805} {"train_loss": -6.951286315917969, "global_step": 159837, "epoch": 3805} {"train_loss": -6.9055376052856445, "global_step": 159838, "epoch": 3805} {"train_loss": -6.832018852233887, "global_step": 159839, "epoch": 3805} {"train_loss": -6.970508575439453, "global_step": 159840, "epoch": 3805} {"train_loss": -7.001773357391357, "global_step": 159841, "epoch": 3805} {"train_loss": -6.912725448608398, "global_step": 159842, "epoch": 3805} {"train_loss": -6.978728771209717, "global_step": 159843, "epoch": 3805} {"train_loss": -6.887395858764648, "global_step": 159844, "epoch": 3805} {"train_loss": -6.861701011657715, "global_step": 159845, "epoch": 3805} {"train_loss": -6.977839469909668, "global_step": 159846, "epoch": 3805} {"train_loss": -6.823052406311035, "global_step": 159847, "epoch": 3805} {"train_loss": -6.81372594833374, "global_step": 159848, "epoch": 3805} {"train_loss": -7.000262260437012, "global_step": 159849, "epoch": 3805} {"train_loss": -6.768583297729492, "global_step": 159850, "epoch": 3805} {"train_loss": -6.933652752921695, "global_step": 159851, "epoch": 3805, "val_loss": 79634.3515625} {"train_loss": -6.902820110321045, "global_step": 159852, "epoch": 3806} {"train_loss": -6.952552318572998, "global_step": 159853, "epoch": 3806} {"train_loss": -6.9492082595825195, "global_step": 159854, "epoch": 3806} {"train_loss": -6.7286224365234375, "global_step": 159855, "epoch": 3806} {"train_loss": -6.837491989135742, "global_step": 159856, "epoch": 3806} {"train_loss": -6.8094682693481445, "global_step": 159857, "epoch": 3806} {"train_loss": -6.936366081237793, "global_step": 159858, "epoch": 3806} {"train_loss": -6.960591793060303, "global_step": 159859, "epoch": 3806} {"train_loss": -6.804142951965332, "global_step": 159860, "epoch": 3806} {"train_loss": -6.88822078704834, "global_step": 159861, "epoch": 3806} {"train_loss": -6.838257312774658, "global_step": 159862, "epoch": 3806} {"train_loss": -6.872067928314209, "global_step": 159863, "epoch": 3806} {"train_loss": -6.889540672302246, "global_step": 159864, "epoch": 3806} {"train_loss": -6.858233451843262, "global_step": 159865, "epoch": 3806} {"train_loss": -7.000051021575928, "global_step": 159866, "epoch": 3806} {"train_loss": -6.880545616149902, "global_step": 159867, "epoch": 3806} {"train_loss": -6.937437057495117, "global_step": 159868, "epoch": 3806} {"train_loss": -6.979975700378418, "global_step": 159869, "epoch": 3806} {"train_loss": -6.866483688354492, "global_step": 159870, "epoch": 3806} {"train_loss": -7.004261016845703, "global_step": 159871, "epoch": 3806} {"train_loss": -6.984033584594727, "global_step": 159872, "epoch": 3806} {"train_loss": -6.928620338439941, "global_step": 159873, "epoch": 3806} {"train_loss": -6.980151176452637, "global_step": 159874, "epoch": 3806} {"train_loss": -6.842026710510254, "global_step": 159875, "epoch": 3806} {"train_loss": -7.028302192687988, "global_step": 159876, "epoch": 3806} {"train_loss": -6.901617527008057, "global_step": 159877, "epoch": 3806} {"train_loss": -6.8871355056762695, "global_step": 159878, "epoch": 3806} {"train_loss": -6.999275207519531, "global_step": 159879, "epoch": 3806} {"train_loss": -6.8650617599487305, "global_step": 159880, "epoch": 3806} {"train_loss": -6.9222002029418945, "global_step": 159881, "epoch": 3806} {"train_loss": -6.954072952270508, "global_step": 159882, "epoch": 3806} {"train_loss": -6.90664005279541, "global_step": 159883, "epoch": 3806} {"train_loss": -7.043374538421631, "global_step": 159884, "epoch": 3806} {"train_loss": -6.945398330688477, "global_step": 159885, "epoch": 3806} {"train_loss": -6.927980422973633, "global_step": 159886, "epoch": 3806} {"train_loss": -6.876913070678711, "global_step": 159887, "epoch": 3806} {"train_loss": -6.940664291381836, "global_step": 159888, "epoch": 3806} {"train_loss": -6.8675079345703125, "global_step": 159889, "epoch": 3806} {"train_loss": -6.959817886352539, "global_step": 159890, "epoch": 3806} {"train_loss": -6.933643341064453, "global_step": 159891, "epoch": 3806} {"train_loss": -7.072481155395508, "global_step": 159892, "epoch": 3806} {"train_loss": -6.922721113477435, "global_step": 159893, "epoch": 3806, "val_loss": 79222.0859375} {"train_loss": -7.021819114685059, "global_step": 159894, "epoch": 3807} {"train_loss": -6.967596054077148, "global_step": 159895, "epoch": 3807} {"train_loss": -6.993026256561279, "global_step": 159896, "epoch": 3807} {"train_loss": -7.006817817687988, "global_step": 159897, "epoch": 3807} {"train_loss": -7.031297206878662, "global_step": 159898, "epoch": 3807} {"train_loss": -7.020017623901367, "global_step": 159899, "epoch": 3807} {"train_loss": -7.069921016693115, "global_step": 159900, "epoch": 3807} {"train_loss": -7.095532417297363, "global_step": 159901, "epoch": 3807} {"train_loss": -6.9214911460876465, "global_step": 159902, "epoch": 3807} {"train_loss": -6.914514541625977, "global_step": 159903, "epoch": 3807} {"train_loss": -7.054973125457764, "global_step": 159904, "epoch": 3807} {"train_loss": -7.016563415527344, "global_step": 159905, "epoch": 3807} {"train_loss": -7.03418493270874, "global_step": 159906, "epoch": 3807} {"train_loss": -7.0703935623168945, "global_step": 159907, "epoch": 3807} {"train_loss": -6.971170425415039, "global_step": 159908, "epoch": 3807} {"train_loss": -6.978680610656738, "global_step": 159909, "epoch": 3807} {"train_loss": -6.997736930847168, "global_step": 159910, "epoch": 3807} {"train_loss": -6.96103572845459, "global_step": 159911, "epoch": 3807} {"train_loss": -6.997296333312988, "global_step": 159912, "epoch": 3807} {"train_loss": -7.045638084411621, "global_step": 159913, "epoch": 3807} {"train_loss": -6.992544174194336, "global_step": 159914, "epoch": 3807} {"train_loss": -6.96613883972168, "global_step": 159915, "epoch": 3807} {"train_loss": -7.099729537963867, "global_step": 159916, "epoch": 3807} {"train_loss": -7.08342981338501, "global_step": 159917, "epoch": 3807} {"train_loss": -7.007874488830566, "global_step": 159918, "epoch": 3807} {"train_loss": -7.113546371459961, "global_step": 159919, "epoch": 3807} {"train_loss": -7.033389091491699, "global_step": 159920, "epoch": 3807} {"train_loss": -7.1312689781188965, "global_step": 159921, "epoch": 3807} {"train_loss": -6.942086219787598, "global_step": 159922, "epoch": 3807} {"train_loss": -6.980096817016602, "global_step": 159923, "epoch": 3807} {"train_loss": -6.999571323394775, "global_step": 159924, "epoch": 3807} {"train_loss": -6.965526580810547, "global_step": 159925, "epoch": 3807} {"train_loss": -7.070530891418457, "global_step": 159926, "epoch": 3807} {"train_loss": -6.997617721557617, "global_step": 159927, "epoch": 3807} {"train_loss": -7.011667251586914, "global_step": 159928, "epoch": 3807} {"train_loss": -6.934027194976807, "global_step": 159929, "epoch": 3807} {"train_loss": -6.9897308349609375, "global_step": 159930, "epoch": 3807} {"train_loss": -6.896181106567383, "global_step": 159931, "epoch": 3807} {"train_loss": -6.961453437805176, "global_step": 159932, "epoch": 3807} {"train_loss": -7.018039226531982, "global_step": 159933, "epoch": 3807} {"train_loss": -6.919348239898682, "global_step": 159934, "epoch": 3807} {"train_loss": -7.005121934981573, "global_step": 159935, "epoch": 3807, "val_loss": 79329.1484375} {"train_loss": -6.955549716949463, "global_step": 159936, "epoch": 3808} {"train_loss": -6.931631088256836, "global_step": 159937, "epoch": 3808} {"train_loss": -7.049295425415039, "global_step": 159938, "epoch": 3808} {"train_loss": -6.9504241943359375, "global_step": 159939, "epoch": 3808} {"train_loss": -6.963418960571289, "global_step": 159940, "epoch": 3808} {"train_loss": -6.907771110534668, "global_step": 159941, "epoch": 3808} {"train_loss": -6.983067512512207, "global_step": 159942, "epoch": 3808} {"train_loss": -7.076066970825195, "global_step": 159943, "epoch": 3808} {"train_loss": -6.941699981689453, "global_step": 159944, "epoch": 3808} {"train_loss": -6.894594192504883, "global_step": 159945, "epoch": 3808} {"train_loss": -6.91779899597168, "global_step": 159946, "epoch": 3808} {"train_loss": -6.963339328765869, "global_step": 159947, "epoch": 3808} {"train_loss": -6.917198181152344, "global_step": 159948, "epoch": 3808} {"train_loss": -6.881459712982178, "global_step": 159949, "epoch": 3808} {"train_loss": -7.044810771942139, "global_step": 159950, "epoch": 3808} {"train_loss": -6.864269256591797, "global_step": 159951, "epoch": 3808} {"train_loss": -6.962428092956543, "global_step": 159952, "epoch": 3808} {"train_loss": -7.052572250366211, "global_step": 159953, "epoch": 3808} {"train_loss": -6.805485248565674, "global_step": 159954, "epoch": 3808} {"train_loss": -6.85842227935791, "global_step": 159955, "epoch": 3808} {"train_loss": -6.888763427734375, "global_step": 159956, "epoch": 3808} {"train_loss": -6.816766738891602, "global_step": 159957, "epoch": 3808} {"train_loss": -7.066511154174805, "global_step": 159958, "epoch": 3808} {"train_loss": -6.798312664031982, "global_step": 159959, "epoch": 3808} {"train_loss": -6.760486602783203, "global_step": 159960, "epoch": 3808} {"train_loss": -6.801609516143799, "global_step": 159961, "epoch": 3808} {"train_loss": -6.836012840270996, "global_step": 159962, "epoch": 3808} {"train_loss": -6.88264274597168, "global_step": 159963, "epoch": 3808} {"train_loss": -6.812272071838379, "global_step": 159964, "epoch": 3808} {"train_loss": -7.01481819152832, "global_step": 159965, "epoch": 3808} {"train_loss": -6.780523300170898, "global_step": 159966, "epoch": 3808} {"train_loss": -6.866008281707764, "global_step": 159967, "epoch": 3808} {"train_loss": -6.936844825744629, "global_step": 159968, "epoch": 3808} {"train_loss": -6.795125961303711, "global_step": 159969, "epoch": 3808} {"train_loss": -6.92466926574707, "global_step": 159970, "epoch": 3808} {"train_loss": -6.798995018005371, "global_step": 159971, "epoch": 3808} {"train_loss": -7.027621269226074, "global_step": 159972, "epoch": 3808} {"train_loss": -6.8341217041015625, "global_step": 159973, "epoch": 3808} {"train_loss": -6.970357418060303, "global_step": 159974, "epoch": 3808} {"train_loss": -6.832058906555176, "global_step": 159975, "epoch": 3808} {"train_loss": -6.949894428253174, "global_step": 159976, "epoch": 3808} {"train_loss": -6.911326805750529, "global_step": 159977, "epoch": 3808, "val_loss": 79314.984375} {"train_loss": -6.999617576599121, "global_step": 159978, "epoch": 3809} {"train_loss": -7.024697303771973, "global_step": 159979, "epoch": 3809} {"train_loss": -6.865203380584717, "global_step": 159980, "epoch": 3809} {"train_loss": -6.941458702087402, "global_step": 159981, "epoch": 3809} {"train_loss": -6.807292938232422, "global_step": 159982, "epoch": 3809} {"train_loss": -6.996545314788818, "global_step": 159983, "epoch": 3809} {"train_loss": -7.005008697509766, "global_step": 159984, "epoch": 3809} {"train_loss": -7.050555229187012, "global_step": 159985, "epoch": 3809} {"train_loss": -6.966958999633789, "global_step": 159986, "epoch": 3809} {"train_loss": -6.960373878479004, "global_step": 159987, "epoch": 3809} {"train_loss": -7.036150932312012, "global_step": 159988, "epoch": 3809} {"train_loss": -7.047199249267578, "global_step": 159989, "epoch": 3809} {"train_loss": -6.9491376876831055, "global_step": 159990, "epoch": 3809} {"train_loss": -6.967672348022461, "global_step": 159991, "epoch": 3809} {"train_loss": -7.014431953430176, "global_step": 159992, "epoch": 3809} {"train_loss": -6.975411415100098, "global_step": 159993, "epoch": 3809} {"train_loss": -7.028935432434082, "global_step": 159994, "epoch": 3809} {"train_loss": -6.977313041687012, "global_step": 159995, "epoch": 3809} {"train_loss": -7.06537389755249, "global_step": 159996, "epoch": 3809} {"train_loss": -7.0077033042907715, "global_step": 159997, "epoch": 3809} {"train_loss": -7.2087507247924805, "global_step": 159998, "epoch": 3809} {"train_loss": -6.96071195602417, "global_step": 159999, "epoch": 3809} {"train_loss": -6.931571960449219, "global_step": 160000, "epoch": 3809} {"train_loss": -6.974836349487305, "global_step": 160001, "epoch": 3809} {"train_loss": -6.995519161224365, "global_step": 160002, "epoch": 3809} {"train_loss": -6.876464366912842, "global_step": 160003, "epoch": 3809} {"train_loss": -6.972332000732422, "global_step": 160004, "epoch": 3809} {"train_loss": -7.024502754211426, "global_step": 160005, "epoch": 3809} {"train_loss": -6.9468302726745605, "global_step": 160006, "epoch": 3809} {"train_loss": -7.018314361572266, "global_step": 160007, "epoch": 3809} {"train_loss": -6.898178577423096, "global_step": 160008, "epoch": 3809} {"train_loss": -6.903387069702148, "global_step": 160009, "epoch": 3809} {"train_loss": -6.962623596191406, "global_step": 160010, "epoch": 3809} {"train_loss": -6.8366379737854, "global_step": 160011, "epoch": 3809} {"train_loss": -6.812829494476318, "global_step": 160012, "epoch": 3809} {"train_loss": -6.9500627517700195, "global_step": 160013, "epoch": 3809} {"train_loss": -6.850589752197266, "global_step": 160014, "epoch": 3809} {"train_loss": -7.0172905921936035, "global_step": 160015, "epoch": 3809} {"train_loss": -6.865126609802246, "global_step": 160016, "epoch": 3809} {"train_loss": -6.878549575805664, "global_step": 160017, "epoch": 3809} {"train_loss": -6.950352668762207, "global_step": 160018, "epoch": 3809} {"train_loss": -6.964985586348034, "global_step": 160019, "epoch": 3809, "val_loss": 79241.6484375} {"train_loss": -6.849116802215576, "global_step": 160020, "epoch": 3810} {"train_loss": -7.030059814453125, "global_step": 160021, "epoch": 3810} {"train_loss": -6.944283485412598, "global_step": 160022, "epoch": 3810} {"train_loss": -6.957667350769043, "global_step": 160023, "epoch": 3810} {"train_loss": -6.773829936981201, "global_step": 160024, "epoch": 3810} {"train_loss": -6.952937126159668, "global_step": 160025, "epoch": 3810} {"train_loss": -6.798089027404785, "global_step": 160026, "epoch": 3810} {"train_loss": -6.816564083099365, "global_step": 160027, "epoch": 3810} {"train_loss": -7.034229278564453, "global_step": 160028, "epoch": 3810} {"train_loss": -6.857555389404297, "global_step": 160029, "epoch": 3810} {"train_loss": -6.8792619705200195, "global_step": 160030, "epoch": 3810} {"train_loss": -6.870770454406738, "global_step": 160031, "epoch": 3810} {"train_loss": -6.90676212310791, "global_step": 160032, "epoch": 3810} {"train_loss": -6.929110050201416, "global_step": 160033, "epoch": 3810} {"train_loss": -6.846273899078369, "global_step": 160034, "epoch": 3810} {"train_loss": -7.008004188537598, "global_step": 160035, "epoch": 3810} {"train_loss": -6.9332356452941895, "global_step": 160036, "epoch": 3810} {"train_loss": -6.956109046936035, "global_step": 160037, "epoch": 3810} {"train_loss": -6.883026599884033, "global_step": 160038, "epoch": 3810} {"train_loss": -6.890355110168457, "global_step": 160039, "epoch": 3810} {"train_loss": -6.974085807800293, "global_step": 160040, "epoch": 3810} {"train_loss": -7.039216041564941, "global_step": 160041, "epoch": 3810} {"train_loss": -6.980870246887207, "global_step": 160042, "epoch": 3810} {"train_loss": -6.98626708984375, "global_step": 160043, "epoch": 3810} {"train_loss": -6.905598163604736, "global_step": 160044, "epoch": 3810} {"train_loss": -6.89015007019043, "global_step": 160045, "epoch": 3810} {"train_loss": -6.889730453491211, "global_step": 160046, "epoch": 3810} {"train_loss": -6.851764678955078, "global_step": 160047, "epoch": 3810} {"train_loss": -6.88569450378418, "global_step": 160048, "epoch": 3810} {"train_loss": -6.938653469085693, "global_step": 160049, "epoch": 3810} {"train_loss": -6.964080810546875, "global_step": 160050, "epoch": 3810} {"train_loss": -6.961846351623535, "global_step": 160051, "epoch": 3810} {"train_loss": -6.957061767578125, "global_step": 160052, "epoch": 3810} {"train_loss": -6.900223731994629, "global_step": 160053, "epoch": 3810} {"train_loss": -6.923234939575195, "global_step": 160054, "epoch": 3810} {"train_loss": -6.936026096343994, "global_step": 160055, "epoch": 3810} {"train_loss": -6.885591506958008, "global_step": 160056, "epoch": 3810} {"train_loss": -6.9052934646606445, "global_step": 160057, "epoch": 3810} {"train_loss": -6.885006904602051, "global_step": 160058, "epoch": 3810} {"train_loss": -6.845772743225098, "global_step": 160059, "epoch": 3810} {"train_loss": -6.890777587890625, "global_step": 160060, "epoch": 3810} {"train_loss": -6.915855634780157, "global_step": 160061, "epoch": 3810, "val_loss": 79544.8046875} {"train_loss": -6.90498161315918, "global_step": 160062, "epoch": 3811} {"train_loss": -6.916120529174805, "global_step": 160063, "epoch": 3811} {"train_loss": -6.945205211639404, "global_step": 160064, "epoch": 3811} {"train_loss": -6.850083351135254, "global_step": 160065, "epoch": 3811} {"train_loss": -6.918515205383301, "global_step": 160066, "epoch": 3811} {"train_loss": -7.002418518066406, "global_step": 160067, "epoch": 3811} {"train_loss": -6.950193881988525, "global_step": 160068, "epoch": 3811} {"train_loss": -6.957573890686035, "global_step": 160069, "epoch": 3811} {"train_loss": -6.891173362731934, "global_step": 160070, "epoch": 3811} {"train_loss": -6.97811222076416, "global_step": 160071, "epoch": 3811} {"train_loss": -6.869207382202148, "global_step": 160072, "epoch": 3811} {"train_loss": -7.055893898010254, "global_step": 160073, "epoch": 3811} {"train_loss": -6.945323944091797, "global_step": 160074, "epoch": 3811} {"train_loss": -7.009818077087402, "global_step": 160075, "epoch": 3811} {"train_loss": -6.932294845581055, "global_step": 160076, "epoch": 3811} {"train_loss": -7.065758228302002, "global_step": 160077, "epoch": 3811} {"train_loss": -7.079346656799316, "global_step": 160078, "epoch": 3811} {"train_loss": -6.836864471435547, "global_step": 160079, "epoch": 3811} {"train_loss": -6.9883317947387695, "global_step": 160080, "epoch": 3811} {"train_loss": -6.968166351318359, "global_step": 160081, "epoch": 3811} {"train_loss": -6.864820957183838, "global_step": 160082, "epoch": 3811} {"train_loss": -6.945680618286133, "global_step": 160083, "epoch": 3811} {"train_loss": -6.80443000793457, "global_step": 160084, "epoch": 3811} {"train_loss": -6.875237464904785, "global_step": 160085, "epoch": 3811} {"train_loss": -7.0130767822265625, "global_step": 160086, "epoch": 3811} {"train_loss": -6.775884628295898, "global_step": 160087, "epoch": 3811} {"train_loss": -6.994590759277344, "global_step": 160088, "epoch": 3811} {"train_loss": -6.842716693878174, "global_step": 160089, "epoch": 3811} {"train_loss": -6.814323425292969, "global_step": 160090, "epoch": 3811} {"train_loss": -6.976770877838135, "global_step": 160091, "epoch": 3811} {"train_loss": -6.950049877166748, "global_step": 160092, "epoch": 3811} {"train_loss": -6.974725723266602, "global_step": 160093, "epoch": 3811} {"train_loss": -6.923543453216553, "global_step": 160094, "epoch": 3811} {"train_loss": -6.968467712402344, "global_step": 160095, "epoch": 3811} {"train_loss": -6.948143482208252, "global_step": 160096, "epoch": 3811} {"train_loss": -6.944408416748047, "global_step": 160097, "epoch": 3811} {"train_loss": -7.01436710357666, "global_step": 160098, "epoch": 3811} {"train_loss": -7.025261878967285, "global_step": 160099, "epoch": 3811} {"train_loss": -6.838529586791992, "global_step": 160100, "epoch": 3811} {"train_loss": -6.93363618850708, "global_step": 160101, "epoch": 3811} {"train_loss": -6.949573516845703, "global_step": 160102, "epoch": 3811} {"train_loss": -6.935983691896711, "global_step": 160103, "epoch": 3811, "val_loss": 79096.3203125} {"train_loss": -7.102716445922852, "global_step": 160104, "epoch": 3812} {"train_loss": -6.855658531188965, "global_step": 160105, "epoch": 3812} {"train_loss": -6.8657450675964355, "global_step": 160106, "epoch": 3812} {"train_loss": -6.928444862365723, "global_step": 160107, "epoch": 3812} {"train_loss": -6.982393264770508, "global_step": 160108, "epoch": 3812} {"train_loss": -6.812343597412109, "global_step": 160109, "epoch": 3812} {"train_loss": -6.973630905151367, "global_step": 160110, "epoch": 3812} {"train_loss": -6.9177937507629395, "global_step": 160111, "epoch": 3812} {"train_loss": -7.006342887878418, "global_step": 160112, "epoch": 3812} {"train_loss": -6.849621295928955, "global_step": 160113, "epoch": 3812} {"train_loss": -6.84660530090332, "global_step": 160114, "epoch": 3812} {"train_loss": -6.832666397094727, "global_step": 160115, "epoch": 3812} {"train_loss": -6.7775702476501465, "global_step": 160116, "epoch": 3812} {"train_loss": -6.9082112312316895, "global_step": 160117, "epoch": 3812} {"train_loss": -6.718935966491699, "global_step": 160118, "epoch": 3812} {"train_loss": -6.834390640258789, "global_step": 160119, "epoch": 3812} {"train_loss": -6.776876449584961, "global_step": 160120, "epoch": 3812} {"train_loss": -6.853961944580078, "global_step": 160121, "epoch": 3812} {"train_loss": -6.728110313415527, "global_step": 160122, "epoch": 3812} {"train_loss": -6.8790788650512695, "global_step": 160123, "epoch": 3812} {"train_loss": -6.927020072937012, "global_step": 160124, "epoch": 3812} {"train_loss": -6.765438079833984, "global_step": 160125, "epoch": 3812} {"train_loss": -6.796839714050293, "global_step": 160126, "epoch": 3812} {"train_loss": -6.911338806152344, "global_step": 160127, "epoch": 3812} {"train_loss": -6.928847789764404, "global_step": 160128, "epoch": 3812} {"train_loss": -6.871011734008789, "global_step": 160129, "epoch": 3812} {"train_loss": -6.8519744873046875, "global_step": 160130, "epoch": 3812} {"train_loss": -6.946073055267334, "global_step": 160131, "epoch": 3812} {"train_loss": -6.809235095977783, "global_step": 160132, "epoch": 3812} {"train_loss": -6.784233093261719, "global_step": 160133, "epoch": 3812} {"train_loss": -6.966118335723877, "global_step": 160134, "epoch": 3812} {"train_loss": -6.981332778930664, "global_step": 160135, "epoch": 3812} {"train_loss": -6.862592697143555, "global_step": 160136, "epoch": 3812} {"train_loss": -6.835095405578613, "global_step": 160137, "epoch": 3812} {"train_loss": -6.799807548522949, "global_step": 160138, "epoch": 3812} {"train_loss": -6.890313148498535, "global_step": 160139, "epoch": 3812} {"train_loss": -6.948314666748047, "global_step": 160140, "epoch": 3812} {"train_loss": -6.8261237144470215, "global_step": 160141, "epoch": 3812} {"train_loss": -6.897462844848633, "global_step": 160142, "epoch": 3812} {"train_loss": -6.84637451171875, "global_step": 160143, "epoch": 3812} {"train_loss": -7.015149116516113, "global_step": 160144, "epoch": 3812} {"train_loss": -6.879575638543992, "global_step": 160145, "epoch": 3812, "val_loss": 79451.234375} {"train_loss": -6.955989360809326, "global_step": 160146, "epoch": 3813} {"train_loss": -6.964581489562988, "global_step": 160147, "epoch": 3813} {"train_loss": -7.048831939697266, "global_step": 160148, "epoch": 3813} {"train_loss": -6.9366841316223145, "global_step": 160149, "epoch": 3813} {"train_loss": -6.846743583679199, "global_step": 160150, "epoch": 3813} {"train_loss": -6.979887962341309, "global_step": 160151, "epoch": 3813} {"train_loss": -6.946683883666992, "global_step": 160152, "epoch": 3813} {"train_loss": -6.964503288269043, "global_step": 160153, "epoch": 3813} {"train_loss": -6.803759574890137, "global_step": 160154, "epoch": 3813} {"train_loss": -7.03712797164917, "global_step": 160155, "epoch": 3813} {"train_loss": -7.057737827301025, "global_step": 160156, "epoch": 3813} {"train_loss": -7.00681734085083, "global_step": 160157, "epoch": 3813} {"train_loss": -7.1239118576049805, "global_step": 160158, "epoch": 3813} {"train_loss": -7.045742034912109, "global_step": 160159, "epoch": 3813} {"train_loss": -7.047574996948242, "global_step": 160160, "epoch": 3813} {"train_loss": -6.945023536682129, "global_step": 160161, "epoch": 3813} {"train_loss": -6.947737693786621, "global_step": 160162, "epoch": 3813} {"train_loss": -6.986485481262207, "global_step": 160163, "epoch": 3813} {"train_loss": -6.983386993408203, "global_step": 160164, "epoch": 3813} {"train_loss": -6.950983047485352, "global_step": 160165, "epoch": 3813} {"train_loss": -6.919610023498535, "global_step": 160166, "epoch": 3813} {"train_loss": -6.897627830505371, "global_step": 160167, "epoch": 3813} {"train_loss": -6.890252590179443, "global_step": 160168, "epoch": 3813} {"train_loss": -6.897753715515137, "global_step": 160169, "epoch": 3813} {"train_loss": -6.865467071533203, "global_step": 160170, "epoch": 3813} {"train_loss": -6.802487373352051, "global_step": 160171, "epoch": 3813} {"train_loss": -6.8799920082092285, "global_step": 160172, "epoch": 3813} {"train_loss": -6.795706748962402, "global_step": 160173, "epoch": 3813} {"train_loss": -7.001276016235352, "global_step": 160174, "epoch": 3813} {"train_loss": -6.910072326660156, "global_step": 160175, "epoch": 3813} {"train_loss": -6.7920122146606445, "global_step": 160176, "epoch": 3813} {"train_loss": -7.055492401123047, "global_step": 160177, "epoch": 3813} {"train_loss": -6.955129623413086, "global_step": 160178, "epoch": 3813} {"train_loss": -7.035235404968262, "global_step": 160179, "epoch": 3813} {"train_loss": -6.954944133758545, "global_step": 160180, "epoch": 3813} {"train_loss": -6.906516075134277, "global_step": 160181, "epoch": 3813} {"train_loss": -6.866462707519531, "global_step": 160182, "epoch": 3813} {"train_loss": -6.879420280456543, "global_step": 160183, "epoch": 3813} {"train_loss": -6.978077411651611, "global_step": 160184, "epoch": 3813} {"train_loss": -6.87587833404541, "global_step": 160185, "epoch": 3813} {"train_loss": -6.967114448547363, "global_step": 160186, "epoch": 3813} {"train_loss": -6.944461481911795, "global_step": 160187, "epoch": 3813, "val_loss": 79226.2890625} {"train_loss": -6.965407371520996, "global_step": 160188, "epoch": 3814} {"train_loss": -6.966414451599121, "global_step": 160189, "epoch": 3814} {"train_loss": -6.940828800201416, "global_step": 160190, "epoch": 3814} {"train_loss": -6.797022819519043, "global_step": 160191, "epoch": 3814} {"train_loss": -6.999578475952148, "global_step": 160192, "epoch": 3814} {"train_loss": -6.765576362609863, "global_step": 160193, "epoch": 3814} {"train_loss": -6.872014045715332, "global_step": 160194, "epoch": 3814} {"train_loss": -6.928645133972168, "global_step": 160195, "epoch": 3814} {"train_loss": -6.813112735748291, "global_step": 160196, "epoch": 3814} {"train_loss": -6.916049957275391, "global_step": 160197, "epoch": 3814} {"train_loss": -6.63650369644165, "global_step": 160198, "epoch": 3814} {"train_loss": -6.750612258911133, "global_step": 160199, "epoch": 3814} {"train_loss": -6.825407981872559, "global_step": 160200, "epoch": 3814} {"train_loss": -6.759042739868164, "global_step": 160201, "epoch": 3814} {"train_loss": -6.882782936096191, "global_step": 160202, "epoch": 3814} {"train_loss": -6.811434268951416, "global_step": 160203, "epoch": 3814} {"train_loss": -6.926920413970947, "global_step": 160204, "epoch": 3814} {"train_loss": -6.830680847167969, "global_step": 160205, "epoch": 3814} {"train_loss": -6.8976545333862305, "global_step": 160206, "epoch": 3814} {"train_loss": -6.840908050537109, "global_step": 160207, "epoch": 3814} {"train_loss": -6.807661056518555, "global_step": 160208, "epoch": 3814} {"train_loss": -6.876287460327148, "global_step": 160209, "epoch": 3814} {"train_loss": -6.888931751251221, "global_step": 160210, "epoch": 3814} {"train_loss": -6.947038650512695, "global_step": 160211, "epoch": 3814} {"train_loss": -6.712162971496582, "global_step": 160212, "epoch": 3814} {"train_loss": -6.927695274353027, "global_step": 160213, "epoch": 3814} {"train_loss": -6.923228740692139, "global_step": 160214, "epoch": 3814} {"train_loss": -7.049139976501465, "global_step": 160215, "epoch": 3814} {"train_loss": -7.044066905975342, "global_step": 160216, "epoch": 3814} {"train_loss": -6.948822021484375, "global_step": 160217, "epoch": 3814} {"train_loss": -6.891595363616943, "global_step": 160218, "epoch": 3814} {"train_loss": -6.983616828918457, "global_step": 160219, "epoch": 3814} {"train_loss": -6.9129180908203125, "global_step": 160220, "epoch": 3814} {"train_loss": -6.875367641448975, "global_step": 160221, "epoch": 3814} {"train_loss": -6.97110652923584, "global_step": 160222, "epoch": 3814} {"train_loss": -6.924224376678467, "global_step": 160223, "epoch": 3814} {"train_loss": -6.8611249923706055, "global_step": 160224, "epoch": 3814} {"train_loss": -6.922055244445801, "global_step": 160225, "epoch": 3814} {"train_loss": -7.011141777038574, "global_step": 160226, "epoch": 3814} {"train_loss": -7.093595504760742, "global_step": 160227, "epoch": 3814} {"train_loss": -6.9756269454956055, "global_step": 160228, "epoch": 3814} {"train_loss": -6.897785436539423, "global_step": 160229, "epoch": 3814, "val_loss": 79172.3203125} {"train_loss": -6.995444297790527, "global_step": 160230, "epoch": 3815} {"train_loss": -7.071573257446289, "global_step": 160231, "epoch": 3815} {"train_loss": -7.056239128112793, "global_step": 160232, "epoch": 3815} {"train_loss": -7.047868728637695, "global_step": 160233, "epoch": 3815} {"train_loss": -6.987918853759766, "global_step": 160234, "epoch": 3815} {"train_loss": -7.050930976867676, "global_step": 160235, "epoch": 3815} {"train_loss": -6.982791900634766, "global_step": 160236, "epoch": 3815} {"train_loss": -7.103127479553223, "global_step": 160237, "epoch": 3815} {"train_loss": -7.005908012390137, "global_step": 160238, "epoch": 3815} {"train_loss": -6.888883113861084, "global_step": 160239, "epoch": 3815} {"train_loss": -7.053404808044434, "global_step": 160240, "epoch": 3815} {"train_loss": -6.992074966430664, "global_step": 160241, "epoch": 3815} {"train_loss": -6.924065589904785, "global_step": 160242, "epoch": 3815} {"train_loss": -6.971500873565674, "global_step": 160243, "epoch": 3815} {"train_loss": -7.0237250328063965, "global_step": 160244, "epoch": 3815} {"train_loss": -7.002288818359375, "global_step": 160245, "epoch": 3815} {"train_loss": -6.98813533782959, "global_step": 160246, "epoch": 3815} {"train_loss": -7.060585021972656, "global_step": 160247, "epoch": 3815} {"train_loss": -6.992404937744141, "global_step": 160248, "epoch": 3815} {"train_loss": -6.782572269439697, "global_step": 160249, "epoch": 3815} {"train_loss": -7.052516937255859, "global_step": 160250, "epoch": 3815} {"train_loss": -6.982733249664307, "global_step": 160251, "epoch": 3815} {"train_loss": -6.879293441772461, "global_step": 160252, "epoch": 3815} {"train_loss": -6.917308330535889, "global_step": 160253, "epoch": 3815} {"train_loss": -6.8553266525268555, "global_step": 160254, "epoch": 3815} {"train_loss": -6.966256141662598, "global_step": 160255, "epoch": 3815} {"train_loss": -6.953592300415039, "global_step": 160256, "epoch": 3815} {"train_loss": -6.912679672241211, "global_step": 160257, "epoch": 3815} {"train_loss": -6.883473873138428, "global_step": 160258, "epoch": 3815} {"train_loss": -6.97044563293457, "global_step": 160259, "epoch": 3815} {"train_loss": -7.008387565612793, "global_step": 160260, "epoch": 3815} {"train_loss": -6.938989162445068, "global_step": 160261, "epoch": 3815} {"train_loss": -6.916669845581055, "global_step": 160262, "epoch": 3815} {"train_loss": -6.966697692871094, "global_step": 160263, "epoch": 3815} {"train_loss": -6.891912937164307, "global_step": 160264, "epoch": 3815} {"train_loss": -7.024524688720703, "global_step": 160265, "epoch": 3815} {"train_loss": -6.972166538238525, "global_step": 160266, "epoch": 3815} {"train_loss": -6.852336406707764, "global_step": 160267, "epoch": 3815} {"train_loss": -6.954891681671143, "global_step": 160268, "epoch": 3815} {"train_loss": -6.869298934936523, "global_step": 160269, "epoch": 3815} {"train_loss": -6.921388149261475, "global_step": 160270, "epoch": 3815} {"train_loss": -6.9664813450404575, "global_step": 160271, "epoch": 3815, "val_loss": 79296.4375} {"train_loss": -6.90306282043457, "global_step": 160272, "epoch": 3816} {"train_loss": -6.936106204986572, "global_step": 160273, "epoch": 3816} {"train_loss": -6.884273529052734, "global_step": 160274, "epoch": 3816} {"train_loss": -6.956606864929199, "global_step": 160275, "epoch": 3816} {"train_loss": -6.917719841003418, "global_step": 160276, "epoch": 3816} {"train_loss": -6.828180313110352, "global_step": 160277, "epoch": 3816} {"train_loss": -6.995585918426514, "global_step": 160278, "epoch": 3816} {"train_loss": -6.9646525382995605, "global_step": 160279, "epoch": 3816} {"train_loss": -6.86097526550293, "global_step": 160280, "epoch": 3816} {"train_loss": -6.956733703613281, "global_step": 160281, "epoch": 3816} {"train_loss": -6.9459028244018555, "global_step": 160282, "epoch": 3816} {"train_loss": -6.919589042663574, "global_step": 160283, "epoch": 3816} {"train_loss": -7.004059791564941, "global_step": 160284, "epoch": 3816} {"train_loss": -6.987920761108398, "global_step": 160285, "epoch": 3816} {"train_loss": -7.010847091674805, "global_step": 160286, "epoch": 3816} {"train_loss": -6.984292984008789, "global_step": 160287, "epoch": 3816} {"train_loss": -7.015918731689453, "global_step": 160288, "epoch": 3816} {"train_loss": -7.010044097900391, "global_step": 160289, "epoch": 3816} {"train_loss": -6.954627513885498, "global_step": 160290, "epoch": 3816} {"train_loss": -7.092379093170166, "global_step": 160291, "epoch": 3816} {"train_loss": -6.899569034576416, "global_step": 160292, "epoch": 3816} {"train_loss": -6.943002700805664, "global_step": 160293, "epoch": 3816} {"train_loss": -6.950161457061768, "global_step": 160294, "epoch": 3816} {"train_loss": -6.800042152404785, "global_step": 160295, "epoch": 3816} {"train_loss": -7.004678726196289, "global_step": 160296, "epoch": 3816} {"train_loss": -6.951045036315918, "global_step": 160297, "epoch": 3816} {"train_loss": -6.942922592163086, "global_step": 160298, "epoch": 3816} {"train_loss": -7.048528671264648, "global_step": 160299, "epoch": 3816} {"train_loss": -7.008745193481445, "global_step": 160300, "epoch": 3816} {"train_loss": -6.840005874633789, "global_step": 160301, "epoch": 3816} {"train_loss": -7.094066143035889, "global_step": 160302, "epoch": 3816} {"train_loss": -6.938912391662598, "global_step": 160303, "epoch": 3816} {"train_loss": -6.794466018676758, "global_step": 160304, "epoch": 3816} {"train_loss": -7.049537658691406, "global_step": 160305, "epoch": 3816} {"train_loss": -7.065788269042969, "global_step": 160306, "epoch": 3816} {"train_loss": -6.88470458984375, "global_step": 160307, "epoch": 3816} {"train_loss": -6.971704959869385, "global_step": 160308, "epoch": 3816} {"train_loss": -6.860925674438477, "global_step": 160309, "epoch": 3816} {"train_loss": -7.015504837036133, "global_step": 160310, "epoch": 3816} {"train_loss": -6.994353294372559, "global_step": 160311, "epoch": 3816} {"train_loss": -6.967742919921875, "global_step": 160312, "epoch": 3816} {"train_loss": -6.9580564839499335, "global_step": 160313, "epoch": 3816, "val_loss": 79286.8125} {"train_loss": -7.058608055114746, "global_step": 160314, "epoch": 3817} {"train_loss": -6.951756000518799, "global_step": 160315, "epoch": 3817} {"train_loss": -6.996792793273926, "global_step": 160316, "epoch": 3817} {"train_loss": -6.947567939758301, "global_step": 160317, "epoch": 3817} {"train_loss": -6.924684524536133, "global_step": 160318, "epoch": 3817} {"train_loss": -6.960283279418945, "global_step": 160319, "epoch": 3817} {"train_loss": -6.957535743713379, "global_step": 160320, "epoch": 3817} {"train_loss": -7.072267055511475, "global_step": 160321, "epoch": 3817} {"train_loss": -6.951632976531982, "global_step": 160322, "epoch": 3817} {"train_loss": -6.769373893737793, "global_step": 160323, "epoch": 3817} {"train_loss": -6.794517517089844, "global_step": 160324, "epoch": 3817} {"train_loss": -6.873894691467285, "global_step": 160325, "epoch": 3817} {"train_loss": -7.010522842407227, "global_step": 160326, "epoch": 3817} {"train_loss": -6.994330883026123, "global_step": 160327, "epoch": 3817} {"train_loss": -7.001007080078125, "global_step": 160328, "epoch": 3817} {"train_loss": -6.900623321533203, "global_step": 160329, "epoch": 3817} {"train_loss": -6.908902168273926, "global_step": 160330, "epoch": 3817} {"train_loss": -7.055643081665039, "global_step": 160331, "epoch": 3817} {"train_loss": -6.981790065765381, "global_step": 160332, "epoch": 3817} {"train_loss": -7.002626895904541, "global_step": 160333, "epoch": 3817} {"train_loss": -6.960914611816406, "global_step": 160334, "epoch": 3817} {"train_loss": -7.044488430023193, "global_step": 160335, "epoch": 3817} {"train_loss": -6.958554744720459, "global_step": 160336, "epoch": 3817} {"train_loss": -6.881616592407227, "global_step": 160337, "epoch": 3817} {"train_loss": -7.017574310302734, "global_step": 160338, "epoch": 3817} {"train_loss": -6.996225357055664, "global_step": 160339, "epoch": 3817} {"train_loss": -7.010278701782227, "global_step": 160340, "epoch": 3817} {"train_loss": -7.102656364440918, "global_step": 160341, "epoch": 3817} {"train_loss": -7.085394859313965, "global_step": 160342, "epoch": 3817} {"train_loss": -7.024857044219971, "global_step": 160343, "epoch": 3817} {"train_loss": -7.033658027648926, "global_step": 160344, "epoch": 3817} {"train_loss": -7.012821197509766, "global_step": 160345, "epoch": 3817} {"train_loss": -7.063522815704346, "global_step": 160346, "epoch": 3817} {"train_loss": -7.046694278717041, "global_step": 160347, "epoch": 3817} {"train_loss": -7.038995265960693, "global_step": 160348, "epoch": 3817} {"train_loss": -7.050693511962891, "global_step": 160349, "epoch": 3817} {"train_loss": -6.955678939819336, "global_step": 160350, "epoch": 3817} {"train_loss": -7.051344871520996, "global_step": 160351, "epoch": 3817} {"train_loss": -7.127814292907715, "global_step": 160352, "epoch": 3817} {"train_loss": -7.099780082702637, "global_step": 160353, "epoch": 3817} {"train_loss": -7.004319190979004, "global_step": 160354, "epoch": 3817} {"train_loss": -6.993402481079102, "global_step": 160355, "epoch": 3817, "val_loss": 79290.140625} {"train_loss": -7.033649921417236, "global_step": 160356, "epoch": 3818} {"train_loss": -6.971101760864258, "global_step": 160357, "epoch": 3818} {"train_loss": -6.890599250793457, "global_step": 160358, "epoch": 3818} {"train_loss": -6.9919328689575195, "global_step": 160359, "epoch": 3818} {"train_loss": -6.842564582824707, "global_step": 160360, "epoch": 3818} {"train_loss": -6.983365058898926, "global_step": 160361, "epoch": 3818} {"train_loss": -6.937731742858887, "global_step": 160362, "epoch": 3818} {"train_loss": -7.064058780670166, "global_step": 160363, "epoch": 3818} {"train_loss": -6.885207176208496, "global_step": 160364, "epoch": 3818} {"train_loss": -6.966021537780762, "global_step": 160365, "epoch": 3818} {"train_loss": -7.050130844116211, "global_step": 160366, "epoch": 3818} {"train_loss": -6.962852954864502, "global_step": 160367, "epoch": 3818} {"train_loss": -7.002016544342041, "global_step": 160368, "epoch": 3818} {"train_loss": -6.889437675476074, "global_step": 160369, "epoch": 3818} {"train_loss": -6.923666000366211, "global_step": 160370, "epoch": 3818} {"train_loss": -7.002810478210449, "global_step": 160371, "epoch": 3818} {"train_loss": -6.99970006942749, "global_step": 160372, "epoch": 3818} {"train_loss": -7.064249038696289, "global_step": 160373, "epoch": 3818} {"train_loss": -6.958042621612549, "global_step": 160374, "epoch": 3818} {"train_loss": -7.06397819519043, "global_step": 160375, "epoch": 3818} {"train_loss": -7.033128261566162, "global_step": 160376, "epoch": 3818} {"train_loss": -7.146417617797852, "global_step": 160377, "epoch": 3818} {"train_loss": -7.041960716247559, "global_step": 160378, "epoch": 3818} {"train_loss": -7.0570502281188965, "global_step": 160379, "epoch": 3818} {"train_loss": -7.005413055419922, "global_step": 160380, "epoch": 3818} {"train_loss": -7.061790466308594, "global_step": 160381, "epoch": 3818} {"train_loss": -7.030787467956543, "global_step": 160382, "epoch": 3818} {"train_loss": -7.129373550415039, "global_step": 160383, "epoch": 3818} {"train_loss": -6.975184440612793, "global_step": 160384, "epoch": 3818} {"train_loss": -7.024199485778809, "global_step": 160385, "epoch": 3818} {"train_loss": -6.889077663421631, "global_step": 160386, "epoch": 3818} {"train_loss": -6.921525955200195, "global_step": 160387, "epoch": 3818} {"train_loss": -6.9843902587890625, "global_step": 160388, "epoch": 3818} {"train_loss": -6.981207847595215, "global_step": 160389, "epoch": 3818} {"train_loss": -7.00419807434082, "global_step": 160390, "epoch": 3818} {"train_loss": -6.989376068115234, "global_step": 160391, "epoch": 3818} {"train_loss": -6.9829487800598145, "global_step": 160392, "epoch": 3818} {"train_loss": -6.981355667114258, "global_step": 160393, "epoch": 3818} {"train_loss": -6.887913227081299, "global_step": 160394, "epoch": 3818} {"train_loss": -7.068978786468506, "global_step": 160395, "epoch": 3818} {"train_loss": -6.84658145904541, "global_step": 160396, "epoch": 3818} {"train_loss": -6.987462214061192, "global_step": 160397, "epoch": 3818, "val_loss": 79304.8125} {"train_loss": -7.093780040740967, "global_step": 160398, "epoch": 3819} {"train_loss": -6.911751747131348, "global_step": 160399, "epoch": 3819} {"train_loss": -6.8382720947265625, "global_step": 160400, "epoch": 3819} {"train_loss": -7.014183044433594, "global_step": 160401, "epoch": 3819} {"train_loss": -6.847842216491699, "global_step": 160402, "epoch": 3819} {"train_loss": -6.938601493835449, "global_step": 160403, "epoch": 3819} {"train_loss": -7.026976585388184, "global_step": 160404, "epoch": 3819} {"train_loss": -6.89909553527832, "global_step": 160405, "epoch": 3819} {"train_loss": -6.7736101150512695, "global_step": 160406, "epoch": 3819} {"train_loss": -6.915604591369629, "global_step": 160407, "epoch": 3819} {"train_loss": -6.845578193664551, "global_step": 160408, "epoch": 3819} {"train_loss": -6.918431758880615, "global_step": 160409, "epoch": 3819} {"train_loss": -6.841577529907227, "global_step": 160410, "epoch": 3819} {"train_loss": -6.943236351013184, "global_step": 160411, "epoch": 3819} {"train_loss": -7.017217636108398, "global_step": 160412, "epoch": 3819} {"train_loss": -6.9786248207092285, "global_step": 160413, "epoch": 3819} {"train_loss": -6.942975044250488, "global_step": 160414, "epoch": 3819} {"train_loss": -6.825788497924805, "global_step": 160415, "epoch": 3819} {"train_loss": -6.94695520401001, "global_step": 160416, "epoch": 3819} {"train_loss": -6.997187614440918, "global_step": 160417, "epoch": 3819} {"train_loss": -6.805596351623535, "global_step": 160418, "epoch": 3819} {"train_loss": -6.913633346557617, "global_step": 160419, "epoch": 3819} {"train_loss": -6.937741279602051, "global_step": 160420, "epoch": 3819} {"train_loss": -6.916858673095703, "global_step": 160421, "epoch": 3819} {"train_loss": -6.879241466522217, "global_step": 160422, "epoch": 3819} {"train_loss": -6.89495325088501, "global_step": 160423, "epoch": 3819} {"train_loss": -6.8651814460754395, "global_step": 160424, "epoch": 3819} {"train_loss": -6.912652015686035, "global_step": 160425, "epoch": 3819} {"train_loss": -6.836010932922363, "global_step": 160426, "epoch": 3819} {"train_loss": -6.871402263641357, "global_step": 160427, "epoch": 3819} {"train_loss": -6.957961082458496, "global_step": 160428, "epoch": 3819} {"train_loss": -6.9792680740356445, "global_step": 160429, "epoch": 3819} {"train_loss": -6.9370269775390625, "global_step": 160430, "epoch": 3819} {"train_loss": -6.966799736022949, "global_step": 160431, "epoch": 3819} {"train_loss": -6.934240818023682, "global_step": 160432, "epoch": 3819} {"train_loss": -6.8242387771606445, "global_step": 160433, "epoch": 3819} {"train_loss": -6.932252883911133, "global_step": 160434, "epoch": 3819} {"train_loss": -7.029453754425049, "global_step": 160435, "epoch": 3819} {"train_loss": -7.052646636962891, "global_step": 160436, "epoch": 3819} {"train_loss": -6.885418891906738, "global_step": 160437, "epoch": 3819} {"train_loss": -6.941370010375977, "global_step": 160438, "epoch": 3819} {"train_loss": -6.924456267129807, "global_step": 160439, "epoch": 3819, "val_loss": 79136.375} {"train_loss": -6.971709251403809, "global_step": 160440, "epoch": 3820} {"train_loss": -6.929697036743164, "global_step": 160441, "epoch": 3820} {"train_loss": -6.968323707580566, "global_step": 160442, "epoch": 3820} {"train_loss": -6.9608869552612305, "global_step": 160443, "epoch": 3820} {"train_loss": -6.9165544509887695, "global_step": 160444, "epoch": 3820} {"train_loss": -6.9163312911987305, "global_step": 160445, "epoch": 3820} {"train_loss": -6.926373481750488, "global_step": 160446, "epoch": 3820} {"train_loss": -7.061952590942383, "global_step": 160447, "epoch": 3820} {"train_loss": -6.955333709716797, "global_step": 160448, "epoch": 3820} {"train_loss": -6.991513252258301, "global_step": 160449, "epoch": 3820} {"train_loss": -7.0654191970825195, "global_step": 160450, "epoch": 3820} {"train_loss": -6.941556453704834, "global_step": 160451, "epoch": 3820} {"train_loss": -6.971077919006348, "global_step": 160452, "epoch": 3820} {"train_loss": -6.895263671875, "global_step": 160453, "epoch": 3820} {"train_loss": -6.959994316101074, "global_step": 160454, "epoch": 3820} {"train_loss": -6.919349670410156, "global_step": 160455, "epoch": 3820} {"train_loss": -7.016077518463135, "global_step": 160456, "epoch": 3820} {"train_loss": -7.026841163635254, "global_step": 160457, "epoch": 3820} {"train_loss": -6.859834671020508, "global_step": 160458, "epoch": 3820} {"train_loss": -6.942364692687988, "global_step": 160459, "epoch": 3820} {"train_loss": -6.7516961097717285, "global_step": 160460, "epoch": 3820} {"train_loss": -6.996825218200684, "global_step": 160461, "epoch": 3820} {"train_loss": -6.867593765258789, "global_step": 160462, "epoch": 3820} {"train_loss": -6.981254577636719, "global_step": 160463, "epoch": 3820} {"train_loss": -7.048670768737793, "global_step": 160464, "epoch": 3820} {"train_loss": -6.966194152832031, "global_step": 160465, "epoch": 3820} {"train_loss": -7.017188549041748, "global_step": 160466, "epoch": 3820} {"train_loss": -6.9859113693237305, "global_step": 160467, "epoch": 3820} {"train_loss": -6.945789337158203, "global_step": 160468, "epoch": 3820} {"train_loss": -6.986278533935547, "global_step": 160469, "epoch": 3820} {"train_loss": -7.0721354484558105, "global_step": 160470, "epoch": 3820} {"train_loss": -7.011418342590332, "global_step": 160471, "epoch": 3820} {"train_loss": -6.900410175323486, "global_step": 160472, "epoch": 3820} {"train_loss": -6.947720527648926, "global_step": 160473, "epoch": 3820} {"train_loss": -7.086438179016113, "global_step": 160474, "epoch": 3820} {"train_loss": -7.020186424255371, "global_step": 160475, "epoch": 3820} {"train_loss": -6.931828498840332, "global_step": 160476, "epoch": 3820} {"train_loss": -7.001653671264648, "global_step": 160477, "epoch": 3820} {"train_loss": -6.997520446777344, "global_step": 160478, "epoch": 3820} {"train_loss": -6.949424743652344, "global_step": 160479, "epoch": 3820} {"train_loss": -6.901731491088867, "global_step": 160480, "epoch": 3820} {"train_loss": -6.964035692669096, "global_step": 160481, "epoch": 3820, "val_loss": 79272.640625} {"train_loss": -6.926047325134277, "global_step": 160482, "epoch": 3821} {"train_loss": -6.972817420959473, "global_step": 160483, "epoch": 3821} {"train_loss": -6.984746932983398, "global_step": 160484, "epoch": 3821} {"train_loss": -6.971856117248535, "global_step": 160485, "epoch": 3821} {"train_loss": -6.918609619140625, "global_step": 160486, "epoch": 3821} {"train_loss": -7.071036338806152, "global_step": 160487, "epoch": 3821} {"train_loss": -6.933147430419922, "global_step": 160488, "epoch": 3821} {"train_loss": -6.986597061157227, "global_step": 160489, "epoch": 3821} {"train_loss": -6.946369647979736, "global_step": 160490, "epoch": 3821} {"train_loss": -6.956411361694336, "global_step": 160491, "epoch": 3821} {"train_loss": -6.995998382568359, "global_step": 160492, "epoch": 3821} {"train_loss": -6.991786479949951, "global_step": 160493, "epoch": 3821} {"train_loss": -7.013658046722412, "global_step": 160494, "epoch": 3821} {"train_loss": -6.953404903411865, "global_step": 160495, "epoch": 3821} {"train_loss": -6.8350911140441895, "global_step": 160496, "epoch": 3821} {"train_loss": -7.0919976234436035, "global_step": 160497, "epoch": 3821} {"train_loss": -6.9680328369140625, "global_step": 160498, "epoch": 3821} {"train_loss": -6.969155311584473, "global_step": 160499, "epoch": 3821} {"train_loss": -6.884317874908447, "global_step": 160500, "epoch": 3821} {"train_loss": -7.0273637771606445, "global_step": 160501, "epoch": 3821} {"train_loss": -7.050415992736816, "global_step": 160502, "epoch": 3821} {"train_loss": -6.781951427459717, "global_step": 160503, "epoch": 3821} {"train_loss": -6.952578544616699, "global_step": 160504, "epoch": 3821} {"train_loss": -6.859927177429199, "global_step": 160505, "epoch": 3821} {"train_loss": -6.975454807281494, "global_step": 160506, "epoch": 3821} {"train_loss": -6.810459136962891, "global_step": 160507, "epoch": 3821} {"train_loss": -6.905733585357666, "global_step": 160508, "epoch": 3821} {"train_loss": -6.8663225173950195, "global_step": 160509, "epoch": 3821} {"train_loss": -6.921591281890869, "global_step": 160510, "epoch": 3821} {"train_loss": -6.900677680969238, "global_step": 160511, "epoch": 3821} {"train_loss": -6.9578776359558105, "global_step": 160512, "epoch": 3821} {"train_loss": -6.850891590118408, "global_step": 160513, "epoch": 3821} {"train_loss": -6.907286643981934, "global_step": 160514, "epoch": 3821} {"train_loss": -7.029698371887207, "global_step": 160515, "epoch": 3821} {"train_loss": -6.889217853546143, "global_step": 160516, "epoch": 3821} {"train_loss": -7.027179718017578, "global_step": 160517, "epoch": 3821} {"train_loss": -6.907907962799072, "global_step": 160518, "epoch": 3821} {"train_loss": -6.949496746063232, "global_step": 160519, "epoch": 3821} {"train_loss": -7.073468208312988, "global_step": 160520, "epoch": 3821} {"train_loss": -6.886260032653809, "global_step": 160521, "epoch": 3821} {"train_loss": -6.871152877807617, "global_step": 160522, "epoch": 3821} {"train_loss": -6.946765320641654, "global_step": 160523, "epoch": 3821, "val_loss": 79511.1328125} {"train_loss": -6.840181350708008, "global_step": 160524, "epoch": 3822} {"train_loss": -6.881904602050781, "global_step": 160525, "epoch": 3822} {"train_loss": -6.924049377441406, "global_step": 160526, "epoch": 3822} {"train_loss": -6.903975486755371, "global_step": 160527, "epoch": 3822} {"train_loss": -6.836994171142578, "global_step": 160528, "epoch": 3822} {"train_loss": -6.965475082397461, "global_step": 160529, "epoch": 3822} {"train_loss": -6.894695281982422, "global_step": 160530, "epoch": 3822} {"train_loss": -7.0231499671936035, "global_step": 160531, "epoch": 3822} {"train_loss": -6.771358489990234, "global_step": 160532, "epoch": 3822} {"train_loss": -6.921078681945801, "global_step": 160533, "epoch": 3822} {"train_loss": -6.809869289398193, "global_step": 160534, "epoch": 3822} {"train_loss": -6.837803363800049, "global_step": 160535, "epoch": 3822} {"train_loss": -6.883379936218262, "global_step": 160536, "epoch": 3822} {"train_loss": -6.989558219909668, "global_step": 160537, "epoch": 3822} {"train_loss": -6.98478889465332, "global_step": 160538, "epoch": 3822} {"train_loss": -6.9560933113098145, "global_step": 160539, "epoch": 3822} {"train_loss": -7.008561134338379, "global_step": 160540, "epoch": 3822} {"train_loss": -6.915332794189453, "global_step": 160541, "epoch": 3822} {"train_loss": -6.9104180335998535, "global_step": 160542, "epoch": 3822} {"train_loss": -7.05686092376709, "global_step": 160543, "epoch": 3822} {"train_loss": -6.865715503692627, "global_step": 160544, "epoch": 3822} {"train_loss": -6.919804573059082, "global_step": 160545, "epoch": 3822} {"train_loss": -6.962018013000488, "global_step": 160546, "epoch": 3822} {"train_loss": -6.968196392059326, "global_step": 160547, "epoch": 3822} {"train_loss": -6.9295549392700195, "global_step": 160548, "epoch": 3822} {"train_loss": -7.00229024887085, "global_step": 160549, "epoch": 3822} {"train_loss": -7.041409969329834, "global_step": 160550, "epoch": 3822} {"train_loss": -6.862507343292236, "global_step": 160551, "epoch": 3822} {"train_loss": -7.05246639251709, "global_step": 160552, "epoch": 3822} {"train_loss": -7.084901809692383, "global_step": 160553, "epoch": 3822} {"train_loss": -7.120728492736816, "global_step": 160554, "epoch": 3822} {"train_loss": -6.900021076202393, "global_step": 160555, "epoch": 3822} {"train_loss": -6.932051658630371, "global_step": 160556, "epoch": 3822} {"train_loss": -7.009477615356445, "global_step": 160557, "epoch": 3822} {"train_loss": -6.93827486038208, "global_step": 160558, "epoch": 3822} {"train_loss": -6.999421119689941, "global_step": 160559, "epoch": 3822} {"train_loss": -6.879781723022461, "global_step": 160560, "epoch": 3822} {"train_loss": -7.0642242431640625, "global_step": 160561, "epoch": 3822} {"train_loss": -6.88701868057251, "global_step": 160562, "epoch": 3822} {"train_loss": -6.688811302185059, "global_step": 160563, "epoch": 3822} {"train_loss": -7.03397274017334, "global_step": 160564, "epoch": 3822} {"train_loss": -6.934980505988712, "global_step": 160565, "epoch": 3822, "val_loss": 79293.6484375} {"train_loss": -6.874953269958496, "global_step": 160566, "epoch": 3823} {"train_loss": -6.942522048950195, "global_step": 160567, "epoch": 3823} {"train_loss": -6.882918357849121, "global_step": 160568, "epoch": 3823} {"train_loss": -6.970118045806885, "global_step": 160569, "epoch": 3823} {"train_loss": -6.922513961791992, "global_step": 160570, "epoch": 3823} {"train_loss": -6.888591766357422, "global_step": 160571, "epoch": 3823} {"train_loss": -6.935310363769531, "global_step": 160572, "epoch": 3823} {"train_loss": -6.965592384338379, "global_step": 160573, "epoch": 3823} {"train_loss": -6.89838981628418, "global_step": 160574, "epoch": 3823} {"train_loss": -6.8349409103393555, "global_step": 160575, "epoch": 3823} {"train_loss": -6.8416523933410645, "global_step": 160576, "epoch": 3823} {"train_loss": -6.966762542724609, "global_step": 160577, "epoch": 3823} {"train_loss": -6.835379600524902, "global_step": 160578, "epoch": 3823} {"train_loss": -6.875753879547119, "global_step": 160579, "epoch": 3823} {"train_loss": -6.925083160400391, "global_step": 160580, "epoch": 3823} {"train_loss": -6.9237141609191895, "global_step": 160581, "epoch": 3823} {"train_loss": -6.9463067054748535, "global_step": 160582, "epoch": 3823} {"train_loss": -6.924369812011719, "global_step": 160583, "epoch": 3823} {"train_loss": -7.090953350067139, "global_step": 160584, "epoch": 3823} {"train_loss": -7.0499467849731445, "global_step": 160585, "epoch": 3823} {"train_loss": -7.082125186920166, "global_step": 160586, "epoch": 3823} {"train_loss": -6.9673261642456055, "global_step": 160587, "epoch": 3823} {"train_loss": -7.021551132202148, "global_step": 160588, "epoch": 3823} {"train_loss": -6.930398464202881, "global_step": 160589, "epoch": 3823} {"train_loss": -6.926446914672852, "global_step": 160590, "epoch": 3823} {"train_loss": -6.9420037269592285, "global_step": 160591, "epoch": 3823} {"train_loss": -6.914971351623535, "global_step": 160592, "epoch": 3823} {"train_loss": -6.981837272644043, "global_step": 160593, "epoch": 3823} {"train_loss": -6.9588212966918945, "global_step": 160594, "epoch": 3823} {"train_loss": -7.023517608642578, "global_step": 160595, "epoch": 3823} {"train_loss": -7.019299507141113, "global_step": 160596, "epoch": 3823} {"train_loss": -6.953284740447998, "global_step": 160597, "epoch": 3823} {"train_loss": -6.9864501953125, "global_step": 160598, "epoch": 3823} {"train_loss": -6.966814994812012, "global_step": 160599, "epoch": 3823} {"train_loss": -6.940122604370117, "global_step": 160600, "epoch": 3823} {"train_loss": -6.947921276092529, "global_step": 160601, "epoch": 3823} {"train_loss": -6.895349025726318, "global_step": 160602, "epoch": 3823} {"train_loss": -6.949199676513672, "global_step": 160603, "epoch": 3823} {"train_loss": -6.96117639541626, "global_step": 160604, "epoch": 3823} {"train_loss": -6.944782257080078, "global_step": 160605, "epoch": 3823} {"train_loss": -6.956777572631836, "global_step": 160606, "epoch": 3823} {"train_loss": -6.946172362282162, "global_step": 160607, "epoch": 3823, "val_loss": 79519.2421875} {"train_loss": -6.972009181976318, "global_step": 160608, "epoch": 3824} {"train_loss": -6.9776177406311035, "global_step": 160609, "epoch": 3824} {"train_loss": -6.9246826171875, "global_step": 160610, "epoch": 3824} {"train_loss": -7.01780891418457, "global_step": 160611, "epoch": 3824} {"train_loss": -7.045136451721191, "global_step": 160612, "epoch": 3824} {"train_loss": -6.914384365081787, "global_step": 160613, "epoch": 3824} {"train_loss": -6.8846330642700195, "global_step": 160614, "epoch": 3824} {"train_loss": -7.100722312927246, "global_step": 160615, "epoch": 3824} {"train_loss": -7.020815849304199, "global_step": 160616, "epoch": 3824} {"train_loss": -6.91365909576416, "global_step": 160617, "epoch": 3824} {"train_loss": -7.022041320800781, "global_step": 160618, "epoch": 3824} {"train_loss": -7.007006645202637, "global_step": 160619, "epoch": 3824} {"train_loss": -7.019913196563721, "global_step": 160620, "epoch": 3824} {"train_loss": -7.028139114379883, "global_step": 160621, "epoch": 3824} {"train_loss": -6.902941703796387, "global_step": 160622, "epoch": 3824} {"train_loss": -6.885815620422363, "global_step": 160623, "epoch": 3824} {"train_loss": -6.9933695793151855, "global_step": 160624, "epoch": 3824} {"train_loss": -6.981802940368652, "global_step": 160625, "epoch": 3824} {"train_loss": -7.0769944190979, "global_step": 160626, "epoch": 3824} {"train_loss": -6.893301963806152, "global_step": 160627, "epoch": 3824} {"train_loss": -7.091554641723633, "global_step": 160628, "epoch": 3824} {"train_loss": -6.9486565589904785, "global_step": 160629, "epoch": 3824} {"train_loss": -6.891486644744873, "global_step": 160630, "epoch": 3824} {"train_loss": -7.052793502807617, "global_step": 160631, "epoch": 3824} {"train_loss": -6.875338554382324, "global_step": 160632, "epoch": 3824} {"train_loss": -6.989858627319336, "global_step": 160633, "epoch": 3824} {"train_loss": -6.944269180297852, "global_step": 160634, "epoch": 3824} {"train_loss": -6.853595733642578, "global_step": 160635, "epoch": 3824} {"train_loss": -6.960468292236328, "global_step": 160636, "epoch": 3824} {"train_loss": -7.055892467498779, "global_step": 160637, "epoch": 3824} {"train_loss": -6.852721214294434, "global_step": 160638, "epoch": 3824} {"train_loss": -6.953077793121338, "global_step": 160639, "epoch": 3824} {"train_loss": -6.98077917098999, "global_step": 160640, "epoch": 3824} {"train_loss": -7.1229987144470215, "global_step": 160641, "epoch": 3824} {"train_loss": -6.984555244445801, "global_step": 160642, "epoch": 3824} {"train_loss": -6.874493598937988, "global_step": 160643, "epoch": 3824} {"train_loss": -7.0812225341796875, "global_step": 160644, "epoch": 3824} {"train_loss": -6.857341289520264, "global_step": 160645, "epoch": 3824} {"train_loss": -6.91013240814209, "global_step": 160646, "epoch": 3824} {"train_loss": -6.970219612121582, "global_step": 160647, "epoch": 3824} {"train_loss": -6.95625114440918, "global_step": 160648, "epoch": 3824} {"train_loss": -6.968877622059414, "global_step": 160649, "epoch": 3824, "val_loss": 79404.859375} {"train_loss": -7.067686557769775, "global_step": 160650, "epoch": 3825} {"train_loss": -7.031822681427002, "global_step": 160651, "epoch": 3825} {"train_loss": -6.875125885009766, "global_step": 160652, "epoch": 3825} {"train_loss": -7.038434982299805, "global_step": 160653, "epoch": 3825} {"train_loss": -7.024697303771973, "global_step": 160654, "epoch": 3825} {"train_loss": -6.955677032470703, "global_step": 160655, "epoch": 3825} {"train_loss": -6.961722373962402, "global_step": 160656, "epoch": 3825} {"train_loss": -7.051504135131836, "global_step": 160657, "epoch": 3825} {"train_loss": -6.991137504577637, "global_step": 160658, "epoch": 3825} {"train_loss": -6.952367305755615, "global_step": 160659, "epoch": 3825} {"train_loss": -7.036540508270264, "global_step": 160660, "epoch": 3825} {"train_loss": -6.8239946365356445, "global_step": 160661, "epoch": 3825} {"train_loss": -6.9631733894348145, "global_step": 160662, "epoch": 3825} {"train_loss": -7.032858371734619, "global_step": 160663, "epoch": 3825} {"train_loss": -6.912935733795166, "global_step": 160664, "epoch": 3825} {"train_loss": -6.893861770629883, "global_step": 160665, "epoch": 3825} {"train_loss": -6.951630115509033, "global_step": 160666, "epoch": 3825} {"train_loss": -6.9212141036987305, "global_step": 160667, "epoch": 3825} {"train_loss": -6.952982425689697, "global_step": 160668, "epoch": 3825} {"train_loss": -6.898471355438232, "global_step": 160669, "epoch": 3825} {"train_loss": -6.954743385314941, "global_step": 160670, "epoch": 3825} {"train_loss": -6.829662322998047, "global_step": 160671, "epoch": 3825} {"train_loss": -6.999338150024414, "global_step": 160672, "epoch": 3825} {"train_loss": -6.859424591064453, "global_step": 160673, "epoch": 3825} {"train_loss": -6.857988357543945, "global_step": 160674, "epoch": 3825} {"train_loss": -6.95998477935791, "global_step": 160675, "epoch": 3825} {"train_loss": -6.944319248199463, "global_step": 160676, "epoch": 3825} {"train_loss": -6.887535095214844, "global_step": 160677, "epoch": 3825} {"train_loss": -7.057984352111816, "global_step": 160678, "epoch": 3825} {"train_loss": -6.956982135772705, "global_step": 160679, "epoch": 3825} {"train_loss": -6.9968342781066895, "global_step": 160680, "epoch": 3825} {"train_loss": -6.885268688201904, "global_step": 160681, "epoch": 3825} {"train_loss": -6.899749279022217, "global_step": 160682, "epoch": 3825} {"train_loss": -6.9648332595825195, "global_step": 160683, "epoch": 3825} {"train_loss": -7.011292457580566, "global_step": 160684, "epoch": 3825} {"train_loss": -7.025417804718018, "global_step": 160685, "epoch": 3825} {"train_loss": -6.932555198669434, "global_step": 160686, "epoch": 3825} {"train_loss": -7.070213317871094, "global_step": 160687, "epoch": 3825} {"train_loss": -6.96011209487915, "global_step": 160688, "epoch": 3825} {"train_loss": -7.018784046173096, "global_step": 160689, "epoch": 3825} {"train_loss": -7.065112590789795, "global_step": 160690, "epoch": 3825} {"train_loss": -6.96125146320888, "global_step": 160691, "epoch": 3825, "val_loss": 79274.140625} {"train_loss": -7.110908508300781, "global_step": 160692, "epoch": 3826} {"train_loss": -7.0883283615112305, "global_step": 160693, "epoch": 3826} {"train_loss": -6.967909812927246, "global_step": 160694, "epoch": 3826} {"train_loss": -7.130870342254639, "global_step": 160695, "epoch": 3826} {"train_loss": -7.027795791625977, "global_step": 160696, "epoch": 3826} {"train_loss": -7.066577911376953, "global_step": 160697, "epoch": 3826} {"train_loss": -7.130925178527832, "global_step": 160698, "epoch": 3826} {"train_loss": -7.061518669128418, "global_step": 160699, "epoch": 3826} {"train_loss": -7.092514991760254, "global_step": 160700, "epoch": 3826} {"train_loss": -7.042387962341309, "global_step": 160701, "epoch": 3826} {"train_loss": -6.911761283874512, "global_step": 160702, "epoch": 3826} {"train_loss": -7.068512916564941, "global_step": 160703, "epoch": 3826} {"train_loss": -6.9897074699401855, "global_step": 160704, "epoch": 3826} {"train_loss": -6.9899797439575195, "global_step": 160705, "epoch": 3826} {"train_loss": -7.070585250854492, "global_step": 160706, "epoch": 3826} {"train_loss": -6.950926303863525, "global_step": 160707, "epoch": 3826} {"train_loss": -6.958483695983887, "global_step": 160708, "epoch": 3826} {"train_loss": -7.026006698608398, "global_step": 160709, "epoch": 3826} {"train_loss": -6.990423202514648, "global_step": 160710, "epoch": 3826} {"train_loss": -7.108298301696777, "global_step": 160711, "epoch": 3826} {"train_loss": -6.944778919219971, "global_step": 160712, "epoch": 3826} {"train_loss": -6.9367265701293945, "global_step": 160713, "epoch": 3826} {"train_loss": -6.901031017303467, "global_step": 160714, "epoch": 3826} {"train_loss": -7.066628456115723, "global_step": 160715, "epoch": 3826} {"train_loss": -6.905439376831055, "global_step": 160716, "epoch": 3826} {"train_loss": -6.997531890869141, "global_step": 160717, "epoch": 3826} {"train_loss": -6.8970112800598145, "global_step": 160718, "epoch": 3826} {"train_loss": -6.890867233276367, "global_step": 160719, "epoch": 3826} {"train_loss": -6.908094882965088, "global_step": 160720, "epoch": 3826} {"train_loss": -6.971989154815674, "global_step": 160721, "epoch": 3826} {"train_loss": -6.92473840713501, "global_step": 160722, "epoch": 3826} {"train_loss": -6.883098125457764, "global_step": 160723, "epoch": 3826} {"train_loss": -6.865370750427246, "global_step": 160724, "epoch": 3826} {"train_loss": -6.869044303894043, "global_step": 160725, "epoch": 3826} {"train_loss": -6.943347454071045, "global_step": 160726, "epoch": 3826} {"train_loss": -7.004204750061035, "global_step": 160727, "epoch": 3826} {"train_loss": -6.967453956604004, "global_step": 160728, "epoch": 3826} {"train_loss": -6.984226226806641, "global_step": 160729, "epoch": 3826} {"train_loss": -6.9520158767700195, "global_step": 160730, "epoch": 3826} {"train_loss": -6.91325569152832, "global_step": 160731, "epoch": 3826} {"train_loss": -7.008092403411865, "global_step": 160732, "epoch": 3826} {"train_loss": -6.989204077493577, "global_step": 160733, "epoch": 3826, "val_loss": 79367.734375} {"train_loss": -7.022520542144775, "global_step": 160734, "epoch": 3827} {"train_loss": -6.985268592834473, "global_step": 160735, "epoch": 3827} {"train_loss": -7.063619613647461, "global_step": 160736, "epoch": 3827} {"train_loss": -7.008706569671631, "global_step": 160737, "epoch": 3827} {"train_loss": -7.02329158782959, "global_step": 160738, "epoch": 3827} {"train_loss": -7.002152919769287, "global_step": 160739, "epoch": 3827} {"train_loss": -6.975469589233398, "global_step": 160740, "epoch": 3827} {"train_loss": -6.944178581237793, "global_step": 160741, "epoch": 3827} {"train_loss": -6.988088130950928, "global_step": 160742, "epoch": 3827} {"train_loss": -6.955868721008301, "global_step": 160743, "epoch": 3827} {"train_loss": -6.8614959716796875, "global_step": 160744, "epoch": 3827} {"train_loss": -6.880825042724609, "global_step": 160745, "epoch": 3827} {"train_loss": -6.682738780975342, "global_step": 160746, "epoch": 3827} {"train_loss": -6.829730987548828, "global_step": 160747, "epoch": 3827} {"train_loss": -7.000092506408691, "global_step": 160748, "epoch": 3827} {"train_loss": -6.873204231262207, "global_step": 160749, "epoch": 3827} {"train_loss": -7.026949882507324, "global_step": 160750, "epoch": 3827} {"train_loss": -6.922040939331055, "global_step": 160751, "epoch": 3827} {"train_loss": -6.88580846786499, "global_step": 160752, "epoch": 3827} {"train_loss": -6.861507415771484, "global_step": 160753, "epoch": 3827} {"train_loss": -6.9125847816467285, "global_step": 160754, "epoch": 3827} {"train_loss": -6.816223621368408, "global_step": 160755, "epoch": 3827} {"train_loss": -6.952948093414307, "global_step": 160756, "epoch": 3827} {"train_loss": -6.860687732696533, "global_step": 160757, "epoch": 3827} {"train_loss": -6.91176700592041, "global_step": 160758, "epoch": 3827} {"train_loss": -6.941946029663086, "global_step": 160759, "epoch": 3827} {"train_loss": -6.798318862915039, "global_step": 160760, "epoch": 3827} {"train_loss": -6.910560607910156, "global_step": 160761, "epoch": 3827} {"train_loss": -6.973530292510986, "global_step": 160762, "epoch": 3827} {"train_loss": -6.881761074066162, "global_step": 160763, "epoch": 3827} {"train_loss": -7.006609916687012, "global_step": 160764, "epoch": 3827} {"train_loss": -6.869480133056641, "global_step": 160765, "epoch": 3827} {"train_loss": -7.00205135345459, "global_step": 160766, "epoch": 3827} {"train_loss": -6.94425630569458, "global_step": 160767, "epoch": 3827} {"train_loss": -6.981753826141357, "global_step": 160768, "epoch": 3827} {"train_loss": -6.877538681030273, "global_step": 160769, "epoch": 3827} {"train_loss": -7.089735507965088, "global_step": 160770, "epoch": 3827} {"train_loss": -6.940622806549072, "global_step": 160771, "epoch": 3827} {"train_loss": -7.005283355712891, "global_step": 160772, "epoch": 3827} {"train_loss": -7.110354423522949, "global_step": 160773, "epoch": 3827} {"train_loss": -6.922780990600586, "global_step": 160774, "epoch": 3827} {"train_loss": -6.942754041580927, "global_step": 160775, "epoch": 3827, "val_loss": 79194.625} {"train_loss": -7.063695907592773, "global_step": 160776, "epoch": 3828} {"train_loss": -7.057539939880371, "global_step": 160777, "epoch": 3828} {"train_loss": -6.840185165405273, "global_step": 160778, "epoch": 3828} {"train_loss": -7.06657600402832, "global_step": 160779, "epoch": 3828} {"train_loss": -7.054480075836182, "global_step": 160780, "epoch": 3828} {"train_loss": -7.008263111114502, "global_step": 160781, "epoch": 3828} {"train_loss": -6.941824913024902, "global_step": 160782, "epoch": 3828} {"train_loss": -6.978723526000977, "global_step": 160783, "epoch": 3828} {"train_loss": -7.066054821014404, "global_step": 160784, "epoch": 3828} {"train_loss": -7.074614524841309, "global_step": 160785, "epoch": 3828} {"train_loss": -6.897672176361084, "global_step": 160786, "epoch": 3828} {"train_loss": -7.104040145874023, "global_step": 160787, "epoch": 3828} {"train_loss": -6.982857704162598, "global_step": 160788, "epoch": 3828} {"train_loss": -6.9310832023620605, "global_step": 160789, "epoch": 3828} {"train_loss": -7.06476354598999, "global_step": 160790, "epoch": 3828} {"train_loss": -7.000701904296875, "global_step": 160791, "epoch": 3828} {"train_loss": -7.019098281860352, "global_step": 160792, "epoch": 3828} {"train_loss": -7.084059715270996, "global_step": 160793, "epoch": 3828} {"train_loss": -6.985608100891113, "global_step": 160794, "epoch": 3828} {"train_loss": -6.999621868133545, "global_step": 160795, "epoch": 3828} {"train_loss": -7.1359100341796875, "global_step": 160796, "epoch": 3828} {"train_loss": -7.112802028656006, "global_step": 160797, "epoch": 3828} {"train_loss": -6.96915864944458, "global_step": 160798, "epoch": 3828} {"train_loss": -7.1047468185424805, "global_step": 160799, "epoch": 3828} {"train_loss": -7.019037246704102, "global_step": 160800, "epoch": 3828} {"train_loss": -6.992003440856934, "global_step": 160801, "epoch": 3828} {"train_loss": -6.950095176696777, "global_step": 160802, "epoch": 3828} {"train_loss": -6.973733901977539, "global_step": 160803, "epoch": 3828} {"train_loss": -6.9113664627075195, "global_step": 160804, "epoch": 3828} {"train_loss": -6.922433376312256, "global_step": 160805, "epoch": 3828} {"train_loss": -7.012599468231201, "global_step": 160806, "epoch": 3828} {"train_loss": -7.093533992767334, "global_step": 160807, "epoch": 3828} {"train_loss": -6.972197532653809, "global_step": 160808, "epoch": 3828} {"train_loss": -7.015903949737549, "global_step": 160809, "epoch": 3828} {"train_loss": -7.182580947875977, "global_step": 160810, "epoch": 3828} {"train_loss": -6.914592742919922, "global_step": 160811, "epoch": 3828} {"train_loss": -7.128305912017822, "global_step": 160812, "epoch": 3828} {"train_loss": -6.9523491859436035, "global_step": 160813, "epoch": 3828} {"train_loss": -7.000057220458984, "global_step": 160814, "epoch": 3828} {"train_loss": -6.962981224060059, "global_step": 160815, "epoch": 3828} {"train_loss": -6.923250198364258, "global_step": 160816, "epoch": 3828} {"train_loss": -7.009418283190046, "global_step": 160817, "epoch": 3828, "val_loss": 79286.1328125} {"train_loss": -7.009252071380615, "global_step": 160818, "epoch": 3829} {"train_loss": -7.021109580993652, "global_step": 160819, "epoch": 3829} {"train_loss": -7.025958061218262, "global_step": 160820, "epoch": 3829} {"train_loss": -7.006667613983154, "global_step": 160821, "epoch": 3829} {"train_loss": -7.002239227294922, "global_step": 160822, "epoch": 3829} {"train_loss": -7.0057053565979, "global_step": 160823, "epoch": 3829} {"train_loss": -6.999734878540039, "global_step": 160824, "epoch": 3829} {"train_loss": -6.92915153503418, "global_step": 160825, "epoch": 3829} {"train_loss": -6.872574806213379, "global_step": 160826, "epoch": 3829} {"train_loss": -7.044826030731201, "global_step": 160827, "epoch": 3829} {"train_loss": -7.0327935218811035, "global_step": 160828, "epoch": 3829} {"train_loss": -6.934715747833252, "global_step": 160829, "epoch": 3829} {"train_loss": -7.082539081573486, "global_step": 160830, "epoch": 3829} {"train_loss": -6.917490005493164, "global_step": 160831, "epoch": 3829} {"train_loss": -6.880341529846191, "global_step": 160832, "epoch": 3829} {"train_loss": -6.83744478225708, "global_step": 160833, "epoch": 3829} {"train_loss": -6.958384037017822, "global_step": 160834, "epoch": 3829} {"train_loss": -6.942486763000488, "global_step": 160835, "epoch": 3829} {"train_loss": -6.856513977050781, "global_step": 160836, "epoch": 3829} {"train_loss": -6.905939102172852, "global_step": 160837, "epoch": 3829} {"train_loss": -6.777029037475586, "global_step": 160838, "epoch": 3829} {"train_loss": -6.8924560546875, "global_step": 160839, "epoch": 3829} {"train_loss": -6.837847709655762, "global_step": 160840, "epoch": 3829} {"train_loss": -6.813773155212402, "global_step": 160841, "epoch": 3829} {"train_loss": -7.014222145080566, "global_step": 160842, "epoch": 3829} {"train_loss": -6.845201015472412, "global_step": 160843, "epoch": 3829} {"train_loss": -6.889756202697754, "global_step": 160844, "epoch": 3829} {"train_loss": -6.920754432678223, "global_step": 160845, "epoch": 3829} {"train_loss": -6.829790115356445, "global_step": 160846, "epoch": 3829} {"train_loss": -6.939260482788086, "global_step": 160847, "epoch": 3829} {"train_loss": -6.998076438903809, "global_step": 160848, "epoch": 3829} {"train_loss": -6.731770038604736, "global_step": 160849, "epoch": 3829} {"train_loss": -6.926169395446777, "global_step": 160850, "epoch": 3829} {"train_loss": -6.876265048980713, "global_step": 160851, "epoch": 3829} {"train_loss": -6.857389450073242, "global_step": 160852, "epoch": 3829} {"train_loss": -6.818355083465576, "global_step": 160853, "epoch": 3829} {"train_loss": -6.8764824867248535, "global_step": 160854, "epoch": 3829} {"train_loss": -6.895647048950195, "global_step": 160855, "epoch": 3829} {"train_loss": -6.878149032592773, "global_step": 160856, "epoch": 3829} {"train_loss": -7.0049824714660645, "global_step": 160857, "epoch": 3829} {"train_loss": -6.918760776519775, "global_step": 160858, "epoch": 3829} {"train_loss": -6.921191056569417, "global_step": 160859, "epoch": 3829, "val_loss": 79655.21875} {"train_loss": -6.905531883239746, "global_step": 160860, "epoch": 3830} {"train_loss": -6.98345422744751, "global_step": 160861, "epoch": 3830} {"train_loss": -6.788283348083496, "global_step": 160862, "epoch": 3830} {"train_loss": -6.913130760192871, "global_step": 160863, "epoch": 3830} {"train_loss": -6.938403129577637, "global_step": 160864, "epoch": 3830} {"train_loss": -7.066849708557129, "global_step": 160865, "epoch": 3830} {"train_loss": -6.847806930541992, "global_step": 160866, "epoch": 3830} {"train_loss": -6.915663719177246, "global_step": 160867, "epoch": 3830} {"train_loss": -6.74793815612793, "global_step": 160868, "epoch": 3830} {"train_loss": -6.955924987792969, "global_step": 160869, "epoch": 3830} {"train_loss": -6.740531921386719, "global_step": 160870, "epoch": 3830} {"train_loss": -6.886672019958496, "global_step": 160871, "epoch": 3830} {"train_loss": -6.789085388183594, "global_step": 160872, "epoch": 3830} {"train_loss": -6.750683784484863, "global_step": 160873, "epoch": 3830} {"train_loss": -6.941130638122559, "global_step": 160874, "epoch": 3830} {"train_loss": -6.773571968078613, "global_step": 160875, "epoch": 3830} {"train_loss": -6.980644226074219, "global_step": 160876, "epoch": 3830} {"train_loss": -6.862222671508789, "global_step": 160877, "epoch": 3830} {"train_loss": -6.942438125610352, "global_step": 160878, "epoch": 3830} {"train_loss": -6.805685043334961, "global_step": 160879, "epoch": 3830} {"train_loss": -6.803225517272949, "global_step": 160880, "epoch": 3830} {"train_loss": -6.8582305908203125, "global_step": 160881, "epoch": 3830} {"train_loss": -6.950168132781982, "global_step": 160882, "epoch": 3830} {"train_loss": -7.058642387390137, "global_step": 160883, "epoch": 3830} {"train_loss": -7.000160217285156, "global_step": 160884, "epoch": 3830} {"train_loss": -6.963899612426758, "global_step": 160885, "epoch": 3830} {"train_loss": -6.913541793823242, "global_step": 160886, "epoch": 3830} {"train_loss": -6.924144268035889, "global_step": 160887, "epoch": 3830} {"train_loss": -6.840997695922852, "global_step": 160888, "epoch": 3830} {"train_loss": -6.880898475646973, "global_step": 160889, "epoch": 3830} {"train_loss": -6.973378658294678, "global_step": 160890, "epoch": 3830} {"train_loss": -6.92207145690918, "global_step": 160891, "epoch": 3830} {"train_loss": -6.955181121826172, "global_step": 160892, "epoch": 3830} {"train_loss": -7.033902168273926, "global_step": 160893, "epoch": 3830} {"train_loss": -6.952399253845215, "global_step": 160894, "epoch": 3830} {"train_loss": -6.930057525634766, "global_step": 160895, "epoch": 3830} {"train_loss": -6.943357467651367, "global_step": 160896, "epoch": 3830} {"train_loss": -7.012765884399414, "global_step": 160897, "epoch": 3830} {"train_loss": -6.912901878356934, "global_step": 160898, "epoch": 3830} {"train_loss": -6.997750759124756, "global_step": 160899, "epoch": 3830} {"train_loss": -6.992727279663086, "global_step": 160900, "epoch": 3830} {"train_loss": -6.91448400134132, "global_step": 160901, "epoch": 3830, "val_loss": 79367.3984375} {"train_loss": -7.040406227111816, "global_step": 160902, "epoch": 3831} {"train_loss": -7.048692226409912, "global_step": 160903, "epoch": 3831} {"train_loss": -6.942741394042969, "global_step": 160904, "epoch": 3831} {"train_loss": -7.018627166748047, "global_step": 160905, "epoch": 3831} {"train_loss": -6.9656219482421875, "global_step": 160906, "epoch": 3831} {"train_loss": -7.011733531951904, "global_step": 160907, "epoch": 3831} {"train_loss": -7.023073196411133, "global_step": 160908, "epoch": 3831} {"train_loss": -6.961949825286865, "global_step": 160909, "epoch": 3831} {"train_loss": -7.021060943603516, "global_step": 160910, "epoch": 3831} {"train_loss": -7.023654937744141, "global_step": 160911, "epoch": 3831} {"train_loss": -6.958187103271484, "global_step": 160912, "epoch": 3831} {"train_loss": -6.965871810913086, "global_step": 160913, "epoch": 3831} {"train_loss": -7.0693159103393555, "global_step": 160914, "epoch": 3831} {"train_loss": -7.072754859924316, "global_step": 160915, "epoch": 3831} {"train_loss": -6.965488910675049, "global_step": 160916, "epoch": 3831} {"train_loss": -7.079814434051514, "global_step": 160917, "epoch": 3831} {"train_loss": -6.975184440612793, "global_step": 160918, "epoch": 3831} {"train_loss": -6.964599132537842, "global_step": 160919, "epoch": 3831} {"train_loss": -7.0073957443237305, "global_step": 160920, "epoch": 3831} {"train_loss": -7.024270057678223, "global_step": 160921, "epoch": 3831} {"train_loss": -7.049515247344971, "global_step": 160922, "epoch": 3831} {"train_loss": -7.049883842468262, "global_step": 160923, "epoch": 3831} {"train_loss": -6.952550888061523, "global_step": 160924, "epoch": 3831} {"train_loss": -6.9635419845581055, "global_step": 160925, "epoch": 3831} {"train_loss": -6.97823429107666, "global_step": 160926, "epoch": 3831} {"train_loss": -7.002679824829102, "global_step": 160927, "epoch": 3831} {"train_loss": -6.908849239349365, "global_step": 160928, "epoch": 3831} {"train_loss": -6.9024858474731445, "global_step": 160929, "epoch": 3831} {"train_loss": -6.842192649841309, "global_step": 160930, "epoch": 3831} {"train_loss": -6.9576849937438965, "global_step": 160931, "epoch": 3831} {"train_loss": -6.917644500732422, "global_step": 160932, "epoch": 3831} {"train_loss": -6.893807888031006, "global_step": 160933, "epoch": 3831} {"train_loss": -7.0110321044921875, "global_step": 160934, "epoch": 3831} {"train_loss": -6.770648002624512, "global_step": 160935, "epoch": 3831} {"train_loss": -6.9353132247924805, "global_step": 160936, "epoch": 3831} {"train_loss": -6.8518476486206055, "global_step": 160937, "epoch": 3831} {"train_loss": -6.895781517028809, "global_step": 160938, "epoch": 3831} {"train_loss": -6.929737567901611, "global_step": 160939, "epoch": 3831} {"train_loss": -6.896981239318848, "global_step": 160940, "epoch": 3831} {"train_loss": -6.890926361083984, "global_step": 160941, "epoch": 3831} {"train_loss": -6.87905216217041, "global_step": 160942, "epoch": 3831} {"train_loss": -6.966211739040556, "global_step": 160943, "epoch": 3831, "val_loss": 79314.53125} {"train_loss": -6.9883222579956055, "global_step": 160944, "epoch": 3832} {"train_loss": -6.914690971374512, "global_step": 160945, "epoch": 3832} {"train_loss": -6.94174861907959, "global_step": 160946, "epoch": 3832} {"train_loss": -6.881383895874023, "global_step": 160947, "epoch": 3832} {"train_loss": -6.901044845581055, "global_step": 160948, "epoch": 3832} {"train_loss": -7.020853519439697, "global_step": 160949, "epoch": 3832} {"train_loss": -6.910306453704834, "global_step": 160950, "epoch": 3832} {"train_loss": -6.945982933044434, "global_step": 160951, "epoch": 3832} {"train_loss": -7.05201530456543, "global_step": 160952, "epoch": 3832} {"train_loss": -6.949615478515625, "global_step": 160953, "epoch": 3832} {"train_loss": -6.953555107116699, "global_step": 160954, "epoch": 3832} {"train_loss": -6.991826057434082, "global_step": 160955, "epoch": 3832} {"train_loss": -6.95835018157959, "global_step": 160956, "epoch": 3832} {"train_loss": -6.954606056213379, "global_step": 160957, "epoch": 3832} {"train_loss": -6.90435266494751, "global_step": 160958, "epoch": 3832} {"train_loss": -6.980329513549805, "global_step": 160959, "epoch": 3832} {"train_loss": -6.8588032722473145, "global_step": 160960, "epoch": 3832} {"train_loss": -6.957674980163574, "global_step": 160961, "epoch": 3832} {"train_loss": -6.848793029785156, "global_step": 160962, "epoch": 3832} {"train_loss": -6.986111164093018, "global_step": 160963, "epoch": 3832} {"train_loss": -6.90445613861084, "global_step": 160964, "epoch": 3832} {"train_loss": -6.9906816482543945, "global_step": 160965, "epoch": 3832} {"train_loss": -6.994015693664551, "global_step": 160966, "epoch": 3832} {"train_loss": -6.984601020812988, "global_step": 160967, "epoch": 3832} {"train_loss": -6.7489423751831055, "global_step": 160968, "epoch": 3832} {"train_loss": -6.949771881103516, "global_step": 160969, "epoch": 3832} {"train_loss": -6.9135212898254395, "global_step": 160970, "epoch": 3832} {"train_loss": -6.918966293334961, "global_step": 160971, "epoch": 3832} {"train_loss": -6.969398021697998, "global_step": 160972, "epoch": 3832} {"train_loss": -6.943571090698242, "global_step": 160973, "epoch": 3832} {"train_loss": -6.947453498840332, "global_step": 160974, "epoch": 3832} {"train_loss": -6.955789566040039, "global_step": 160975, "epoch": 3832} {"train_loss": -6.988426208496094, "global_step": 160976, "epoch": 3832} {"train_loss": -6.837708473205566, "global_step": 160977, "epoch": 3832} {"train_loss": -6.980193138122559, "global_step": 160978, "epoch": 3832} {"train_loss": -6.999155044555664, "global_step": 160979, "epoch": 3832} {"train_loss": -7.021170616149902, "global_step": 160980, "epoch": 3832} {"train_loss": -7.035891532897949, "global_step": 160981, "epoch": 3832} {"train_loss": -6.952016830444336, "global_step": 160982, "epoch": 3832} {"train_loss": -6.980069160461426, "global_step": 160983, "epoch": 3832} {"train_loss": -6.966423988342285, "global_step": 160984, "epoch": 3832} {"train_loss": -6.949453217642648, "global_step": 160985, "epoch": 3832, "val_loss": 79234.1796875} {"train_loss": -7.068277359008789, "global_step": 160986, "epoch": 3833} {"train_loss": -7.05629825592041, "global_step": 160987, "epoch": 3833} {"train_loss": -6.927575588226318, "global_step": 160988, "epoch": 3833} {"train_loss": -7.019418716430664, "global_step": 160989, "epoch": 3833} {"train_loss": -7.051794528961182, "global_step": 160990, "epoch": 3833} {"train_loss": -6.990426540374756, "global_step": 160991, "epoch": 3833} {"train_loss": -7.05502986907959, "global_step": 160992, "epoch": 3833} {"train_loss": -7.050626754760742, "global_step": 160993, "epoch": 3833} {"train_loss": -6.835967063903809, "global_step": 160994, "epoch": 3833} {"train_loss": -6.913507461547852, "global_step": 160995, "epoch": 3833} {"train_loss": -6.986464500427246, "global_step": 160996, "epoch": 3833} {"train_loss": -7.011733055114746, "global_step": 160997, "epoch": 3833} {"train_loss": -6.953490257263184, "global_step": 160998, "epoch": 3833} {"train_loss": -6.9614763259887695, "global_step": 160999, "epoch": 3833} {"train_loss": -7.04509162902832, "global_step": 161000, "epoch": 3833} {"train_loss": -7.084704875946045, "global_step": 161001, "epoch": 3833} {"train_loss": -6.985711097717285, "global_step": 161002, "epoch": 3833} {"train_loss": -6.9329514503479, "global_step": 161003, "epoch": 3833} {"train_loss": -7.063084602355957, "global_step": 161004, "epoch": 3833} {"train_loss": -7.018438816070557, "global_step": 161005, "epoch": 3833} {"train_loss": -6.982155799865723, "global_step": 161006, "epoch": 3833} {"train_loss": -6.966305255889893, "global_step": 161007, "epoch": 3833} {"train_loss": -7.0857768058776855, "global_step": 161008, "epoch": 3833} {"train_loss": -7.096234321594238, "global_step": 161009, "epoch": 3833} {"train_loss": -7.066017150878906, "global_step": 161010, "epoch": 3833} {"train_loss": -6.99085807800293, "global_step": 161011, "epoch": 3833} {"train_loss": -7.016872882843018, "global_step": 161012, "epoch": 3833} {"train_loss": -6.940590858459473, "global_step": 161013, "epoch": 3833} {"train_loss": -7.092597961425781, "global_step": 161014, "epoch": 3833} {"train_loss": -7.055253982543945, "global_step": 161015, "epoch": 3833} {"train_loss": -6.912049770355225, "global_step": 161016, "epoch": 3833} {"train_loss": -7.071946144104004, "global_step": 161017, "epoch": 3833} {"train_loss": -7.115267753601074, "global_step": 161018, "epoch": 3833} {"train_loss": -6.999074459075928, "global_step": 161019, "epoch": 3833} {"train_loss": -6.88939094543457, "global_step": 161020, "epoch": 3833} {"train_loss": -6.991837024688721, "global_step": 161021, "epoch": 3833} {"train_loss": -6.995452880859375, "global_step": 161022, "epoch": 3833} {"train_loss": -6.897340297698975, "global_step": 161023, "epoch": 3833} {"train_loss": -7.058104991912842, "global_step": 161024, "epoch": 3833} {"train_loss": -6.966133117675781, "global_step": 161025, "epoch": 3833} {"train_loss": -6.79524040222168, "global_step": 161026, "epoch": 3833} {"train_loss": -6.993470555260068, "global_step": 161027, "epoch": 3833, "val_loss": 79405.3671875} {"train_loss": -7.011285781860352, "global_step": 161028, "epoch": 3834} {"train_loss": -6.852269172668457, "global_step": 161029, "epoch": 3834} {"train_loss": -6.8872480392456055, "global_step": 161030, "epoch": 3834} {"train_loss": -7.068575382232666, "global_step": 161031, "epoch": 3834} {"train_loss": -6.9941277503967285, "global_step": 161032, "epoch": 3834} {"train_loss": -7.004752159118652, "global_step": 161033, "epoch": 3834} {"train_loss": -6.825251579284668, "global_step": 161034, "epoch": 3834} {"train_loss": -6.93494987487793, "global_step": 161035, "epoch": 3834} {"train_loss": -6.902288436889648, "global_step": 161036, "epoch": 3834} {"train_loss": -6.787487030029297, "global_step": 161037, "epoch": 3834} {"train_loss": -6.924490451812744, "global_step": 161038, "epoch": 3834} {"train_loss": -6.855615615844727, "global_step": 161039, "epoch": 3834} {"train_loss": -6.887218475341797, "global_step": 161040, "epoch": 3834} {"train_loss": -6.845118045806885, "global_step": 161041, "epoch": 3834} {"train_loss": -6.805853366851807, "global_step": 161042, "epoch": 3834} {"train_loss": -6.760915756225586, "global_step": 161043, "epoch": 3834} {"train_loss": -6.728370666503906, "global_step": 161044, "epoch": 3834} {"train_loss": -6.937431335449219, "global_step": 161045, "epoch": 3834} {"train_loss": -6.825737953186035, "global_step": 161046, "epoch": 3834} {"train_loss": -6.965580463409424, "global_step": 161047, "epoch": 3834} {"train_loss": -6.701773643493652, "global_step": 161048, "epoch": 3834} {"train_loss": -6.945855140686035, "global_step": 161049, "epoch": 3834} {"train_loss": -6.712289333343506, "global_step": 161050, "epoch": 3834} {"train_loss": -6.8428497314453125, "global_step": 161051, "epoch": 3834} {"train_loss": -6.906047821044922, "global_step": 161052, "epoch": 3834} {"train_loss": -6.858707427978516, "global_step": 161053, "epoch": 3834} {"train_loss": -6.8255767822265625, "global_step": 161054, "epoch": 3834} {"train_loss": -6.693471908569336, "global_step": 161055, "epoch": 3834} {"train_loss": -6.883548736572266, "global_step": 161056, "epoch": 3834} {"train_loss": -6.834230422973633, "global_step": 161057, "epoch": 3834} {"train_loss": -6.88247013092041, "global_step": 161058, "epoch": 3834} {"train_loss": -6.897617816925049, "global_step": 161059, "epoch": 3834} {"train_loss": -6.881025314331055, "global_step": 161060, "epoch": 3834} {"train_loss": -6.921157360076904, "global_step": 161061, "epoch": 3834} {"train_loss": -6.862165451049805, "global_step": 161062, "epoch": 3834} {"train_loss": -6.957802772521973, "global_step": 161063, "epoch": 3834} {"train_loss": -6.888858795166016, "global_step": 161064, "epoch": 3834} {"train_loss": -7.000100135803223, "global_step": 161065, "epoch": 3834} {"train_loss": -6.957118988037109, "global_step": 161066, "epoch": 3834} {"train_loss": -6.96369743347168, "global_step": 161067, "epoch": 3834} {"train_loss": -6.924813270568848, "global_step": 161068, "epoch": 3834} {"train_loss": -6.882456665947323, "global_step": 161069, "epoch": 3834, "val_loss": 79479.9375} {"train_loss": -6.965664863586426, "global_step": 161070, "epoch": 3835} {"train_loss": -7.018692970275879, "global_step": 161071, "epoch": 3835} {"train_loss": -7.002323150634766, "global_step": 161072, "epoch": 3835} {"train_loss": -6.889711856842041, "global_step": 161073, "epoch": 3835} {"train_loss": -6.8928070068359375, "global_step": 161074, "epoch": 3835} {"train_loss": -6.893617153167725, "global_step": 161075, "epoch": 3835} {"train_loss": -6.940533638000488, "global_step": 161076, "epoch": 3835} {"train_loss": -6.882114410400391, "global_step": 161077, "epoch": 3835} {"train_loss": -7.034468650817871, "global_step": 161078, "epoch": 3835} {"train_loss": -6.917807102203369, "global_step": 161079, "epoch": 3835} {"train_loss": -6.873603820800781, "global_step": 161080, "epoch": 3835} {"train_loss": -6.9921441078186035, "global_step": 161081, "epoch": 3835} {"train_loss": -6.947825908660889, "global_step": 161082, "epoch": 3835} {"train_loss": -6.91341495513916, "global_step": 161083, "epoch": 3835} {"train_loss": -7.051715850830078, "global_step": 161084, "epoch": 3835} {"train_loss": -7.074954032897949, "global_step": 161085, "epoch": 3835} {"train_loss": -7.030679702758789, "global_step": 161086, "epoch": 3835} {"train_loss": -7.056212425231934, "global_step": 161087, "epoch": 3835} {"train_loss": -7.073819160461426, "global_step": 161088, "epoch": 3835} {"train_loss": -6.862088203430176, "global_step": 161089, "epoch": 3835} {"train_loss": -6.97477912902832, "global_step": 161090, "epoch": 3835} {"train_loss": -7.0103044509887695, "global_step": 161091, "epoch": 3835} {"train_loss": -7.023499011993408, "global_step": 161092, "epoch": 3835} {"train_loss": -6.968485355377197, "global_step": 161093, "epoch": 3835} {"train_loss": -6.903267860412598, "global_step": 161094, "epoch": 3835} {"train_loss": -6.995936393737793, "global_step": 161095, "epoch": 3835} {"train_loss": -6.851736068725586, "global_step": 161096, "epoch": 3835} {"train_loss": -6.84699010848999, "global_step": 161097, "epoch": 3835} {"train_loss": -7.079209804534912, "global_step": 161098, "epoch": 3835} {"train_loss": -6.91450309753418, "global_step": 161099, "epoch": 3835} {"train_loss": -6.936073303222656, "global_step": 161100, "epoch": 3835} {"train_loss": -7.015180587768555, "global_step": 161101, "epoch": 3835} {"train_loss": -6.972184181213379, "global_step": 161102, "epoch": 3835} {"train_loss": -7.046003341674805, "global_step": 161103, "epoch": 3835} {"train_loss": -7.098897457122803, "global_step": 161104, "epoch": 3835} {"train_loss": -6.7760539054870605, "global_step": 161105, "epoch": 3835} {"train_loss": -6.8189311027526855, "global_step": 161106, "epoch": 3835} {"train_loss": -6.934469699859619, "global_step": 161107, "epoch": 3835} {"train_loss": -6.8495588302612305, "global_step": 161108, "epoch": 3835} {"train_loss": -6.966121673583984, "global_step": 161109, "epoch": 3835} {"train_loss": -7.061695098876953, "global_step": 161110, "epoch": 3835} {"train_loss": -6.958693799518404, "global_step": 161111, "epoch": 3835, "val_loss": 79375.1640625} {"train_loss": -7.051853656768799, "global_step": 161112, "epoch": 3836} {"train_loss": -6.96209192276001, "global_step": 161113, "epoch": 3836} {"train_loss": -6.9708757400512695, "global_step": 161114, "epoch": 3836} {"train_loss": -6.904623985290527, "global_step": 161115, "epoch": 3836} {"train_loss": -6.978799819946289, "global_step": 161116, "epoch": 3836} {"train_loss": -6.906610488891602, "global_step": 161117, "epoch": 3836} {"train_loss": -7.094904899597168, "global_step": 161118, "epoch": 3836} {"train_loss": -6.8966803550720215, "global_step": 161119, "epoch": 3836} {"train_loss": -6.971785545349121, "global_step": 161120, "epoch": 3836} {"train_loss": -6.936906814575195, "global_step": 161121, "epoch": 3836} {"train_loss": -7.01136589050293, "global_step": 161122, "epoch": 3836} {"train_loss": -6.941006660461426, "global_step": 161123, "epoch": 3836} {"train_loss": -6.9741106033325195, "global_step": 161124, "epoch": 3836} {"train_loss": -7.037583351135254, "global_step": 161125, "epoch": 3836} {"train_loss": -7.055680274963379, "global_step": 161126, "epoch": 3836} {"train_loss": -7.0512285232543945, "global_step": 161127, "epoch": 3836} {"train_loss": -7.07887077331543, "global_step": 161128, "epoch": 3836} {"train_loss": -7.022779941558838, "global_step": 161129, "epoch": 3836} {"train_loss": -6.982883453369141, "global_step": 161130, "epoch": 3836} {"train_loss": -7.049055099487305, "global_step": 161131, "epoch": 3836} {"train_loss": -7.079122543334961, "global_step": 161132, "epoch": 3836} {"train_loss": -6.946009635925293, "global_step": 161133, "epoch": 3836} {"train_loss": -7.062514305114746, "global_step": 161134, "epoch": 3836} {"train_loss": -7.03492546081543, "global_step": 161135, "epoch": 3836} {"train_loss": -7.10662841796875, "global_step": 161136, "epoch": 3836} {"train_loss": -6.982858657836914, "global_step": 161137, "epoch": 3836} {"train_loss": -6.867422103881836, "global_step": 161138, "epoch": 3836} {"train_loss": -7.144587516784668, "global_step": 161139, "epoch": 3836} {"train_loss": -6.889364242553711, "global_step": 161140, "epoch": 3836} {"train_loss": -7.068930149078369, "global_step": 161141, "epoch": 3836} {"train_loss": -6.880867004394531, "global_step": 161142, "epoch": 3836} {"train_loss": -6.950098991394043, "global_step": 161143, "epoch": 3836} {"train_loss": -6.892265319824219, "global_step": 161144, "epoch": 3836} {"train_loss": -6.8947553634643555, "global_step": 161145, "epoch": 3836} {"train_loss": -6.9063591957092285, "global_step": 161146, "epoch": 3836} {"train_loss": -6.999483585357666, "global_step": 161147, "epoch": 3836} {"train_loss": -7.042583465576172, "global_step": 161148, "epoch": 3836} {"train_loss": -7.076574325561523, "global_step": 161149, "epoch": 3836} {"train_loss": -6.820891857147217, "global_step": 161150, "epoch": 3836} {"train_loss": -7.0258588790893555, "global_step": 161151, "epoch": 3836} {"train_loss": -6.857915878295898, "global_step": 161152, "epoch": 3836} {"train_loss": -6.982903911953881, "global_step": 161153, "epoch": 3836, "val_loss": 79185.3203125} {"train_loss": -6.936986923217773, "global_step": 161154, "epoch": 3837} {"train_loss": -7.1540679931640625, "global_step": 161155, "epoch": 3837} {"train_loss": -7.1374053955078125, "global_step": 161156, "epoch": 3837} {"train_loss": -6.965100288391113, "global_step": 161157, "epoch": 3837} {"train_loss": -6.90803337097168, "global_step": 161158, "epoch": 3837} {"train_loss": -6.944927215576172, "global_step": 161159, "epoch": 3837} {"train_loss": -6.934299468994141, "global_step": 161160, "epoch": 3837} {"train_loss": -7.002301216125488, "global_step": 161161, "epoch": 3837} {"train_loss": -6.88616418838501, "global_step": 161162, "epoch": 3837} {"train_loss": -7.018683910369873, "global_step": 161163, "epoch": 3837} {"train_loss": -6.938810348510742, "global_step": 161164, "epoch": 3837} {"train_loss": -7.005964279174805, "global_step": 161165, "epoch": 3837} {"train_loss": -7.020471096038818, "global_step": 161166, "epoch": 3837} {"train_loss": -6.951127052307129, "global_step": 161167, "epoch": 3837} {"train_loss": -7.034926414489746, "global_step": 161168, "epoch": 3837} {"train_loss": -6.982555389404297, "global_step": 161169, "epoch": 3837} {"train_loss": -6.9904584884643555, "global_step": 161170, "epoch": 3837} {"train_loss": -6.882228851318359, "global_step": 161171, "epoch": 3837} {"train_loss": -6.96159553527832, "global_step": 161172, "epoch": 3837} {"train_loss": -6.969335556030273, "global_step": 161173, "epoch": 3837} {"train_loss": -6.812997817993164, "global_step": 161174, "epoch": 3837} {"train_loss": -6.872062683105469, "global_step": 161175, "epoch": 3837} {"train_loss": -6.925190448760986, "global_step": 161176, "epoch": 3837} {"train_loss": -6.821579933166504, "global_step": 161177, "epoch": 3837} {"train_loss": -6.921703815460205, "global_step": 161178, "epoch": 3837} {"train_loss": -6.8017425537109375, "global_step": 161179, "epoch": 3837} {"train_loss": -6.914420127868652, "global_step": 161180, "epoch": 3837} {"train_loss": -6.943105697631836, "global_step": 161181, "epoch": 3837} {"train_loss": -6.961569309234619, "global_step": 161182, "epoch": 3837} {"train_loss": -6.9340715408325195, "global_step": 161183, "epoch": 3837} {"train_loss": -6.918318748474121, "global_step": 161184, "epoch": 3837} {"train_loss": -7.0024871826171875, "global_step": 161185, "epoch": 3837} {"train_loss": -6.989758491516113, "global_step": 161186, "epoch": 3837} {"train_loss": -6.872873306274414, "global_step": 161187, "epoch": 3837} {"train_loss": -6.926613807678223, "global_step": 161188, "epoch": 3837} {"train_loss": -7.016561985015869, "global_step": 161189, "epoch": 3837} {"train_loss": -6.96658182144165, "global_step": 161190, "epoch": 3837} {"train_loss": -6.942440032958984, "global_step": 161191, "epoch": 3837} {"train_loss": -6.975508689880371, "global_step": 161192, "epoch": 3837} {"train_loss": -6.972814559936523, "global_step": 161193, "epoch": 3837} {"train_loss": -6.8655853271484375, "global_step": 161194, "epoch": 3837} {"train_loss": -6.952625796908424, "global_step": 161195, "epoch": 3837, "val_loss": 79394.2578125} {"train_loss": -7.052934169769287, "global_step": 161196, "epoch": 3838} {"train_loss": -6.935024261474609, "global_step": 161197, "epoch": 3838} {"train_loss": -6.873695373535156, "global_step": 161198, "epoch": 3838} {"train_loss": -6.865434169769287, "global_step": 161199, "epoch": 3838} {"train_loss": -6.940718650817871, "global_step": 161200, "epoch": 3838} {"train_loss": -6.738994121551514, "global_step": 161201, "epoch": 3838} {"train_loss": -6.949907302856445, "global_step": 161202, "epoch": 3838} {"train_loss": -6.971864223480225, "global_step": 161203, "epoch": 3838} {"train_loss": -6.853740692138672, "global_step": 161204, "epoch": 3838} {"train_loss": -7.079554557800293, "global_step": 161205, "epoch": 3838} {"train_loss": -6.8777875900268555, "global_step": 161206, "epoch": 3838} {"train_loss": -7.047120094299316, "global_step": 161207, "epoch": 3838} {"train_loss": -6.941415309906006, "global_step": 161208, "epoch": 3838} {"train_loss": -6.827507972717285, "global_step": 161209, "epoch": 3838} {"train_loss": -6.9823198318481445, "global_step": 161210, "epoch": 3838} {"train_loss": -6.949549198150635, "global_step": 161211, "epoch": 3838} {"train_loss": -6.9220991134643555, "global_step": 161212, "epoch": 3838} {"train_loss": -6.910704135894775, "global_step": 161213, "epoch": 3838} {"train_loss": -6.831640720367432, "global_step": 161214, "epoch": 3838} {"train_loss": -6.794464111328125, "global_step": 161215, "epoch": 3838} {"train_loss": -6.965391159057617, "global_step": 161216, "epoch": 3838} {"train_loss": -6.984487533569336, "global_step": 161217, "epoch": 3838} {"train_loss": -6.8710527420043945, "global_step": 161218, "epoch": 3838} {"train_loss": -6.913400173187256, "global_step": 161219, "epoch": 3838} {"train_loss": -6.990147590637207, "global_step": 161220, "epoch": 3838} {"train_loss": -6.93533182144165, "global_step": 161221, "epoch": 3838} {"train_loss": -6.873773574829102, "global_step": 161222, "epoch": 3838} {"train_loss": -6.967959403991699, "global_step": 161223, "epoch": 3838} {"train_loss": -6.924416542053223, "global_step": 161224, "epoch": 3838} {"train_loss": -6.927776336669922, "global_step": 161225, "epoch": 3838} {"train_loss": -6.854625701904297, "global_step": 161226, "epoch": 3838} {"train_loss": -6.8942108154296875, "global_step": 161227, "epoch": 3838} {"train_loss": -7.063651084899902, "global_step": 161228, "epoch": 3838} {"train_loss": -6.9347076416015625, "global_step": 161229, "epoch": 3838} {"train_loss": -6.8863205909729, "global_step": 161230, "epoch": 3838} {"train_loss": -7.041199207305908, "global_step": 161231, "epoch": 3838} {"train_loss": -6.927014350891113, "global_step": 161232, "epoch": 3838} {"train_loss": -6.953068733215332, "global_step": 161233, "epoch": 3838} {"train_loss": -6.8766889572143555, "global_step": 161234, "epoch": 3838} {"train_loss": -6.884591102600098, "global_step": 161235, "epoch": 3838} {"train_loss": -6.980799674987793, "global_step": 161236, "epoch": 3838} {"train_loss": -6.92677134559268, "global_step": 161237, "epoch": 3838, "val_loss": 79546.40625} {"train_loss": -6.94841194152832, "global_step": 161238, "epoch": 3839} {"train_loss": -6.9341840744018555, "global_step": 161239, "epoch": 3839} {"train_loss": -6.910240650177002, "global_step": 161240, "epoch": 3839} {"train_loss": -6.917941093444824, "global_step": 161241, "epoch": 3839} {"train_loss": -6.998629570007324, "global_step": 161242, "epoch": 3839} {"train_loss": -7.0137481689453125, "global_step": 161243, "epoch": 3839} {"train_loss": -7.131587028503418, "global_step": 161244, "epoch": 3839} {"train_loss": -7.0275397300720215, "global_step": 161245, "epoch": 3839} {"train_loss": -7.072844982147217, "global_step": 161246, "epoch": 3839} {"train_loss": -7.065418243408203, "global_step": 161247, "epoch": 3839} {"train_loss": -7.101978302001953, "global_step": 161248, "epoch": 3839} {"train_loss": -7.035076141357422, "global_step": 161249, "epoch": 3839} {"train_loss": -6.999260425567627, "global_step": 161250, "epoch": 3839} {"train_loss": -6.913200378417969, "global_step": 161251, "epoch": 3839} {"train_loss": -7.0303802490234375, "global_step": 161252, "epoch": 3839} {"train_loss": -6.953428745269775, "global_step": 161253, "epoch": 3839} {"train_loss": -6.9285888671875, "global_step": 161254, "epoch": 3839} {"train_loss": -6.808145523071289, "global_step": 161255, "epoch": 3839} {"train_loss": -6.922799110412598, "global_step": 161256, "epoch": 3839} {"train_loss": -6.904991149902344, "global_step": 161257, "epoch": 3839} {"train_loss": -6.9969000816345215, "global_step": 161258, "epoch": 3839} {"train_loss": -6.981749534606934, "global_step": 161259, "epoch": 3839} {"train_loss": -6.9667253494262695, "global_step": 161260, "epoch": 3839} {"train_loss": -6.969390869140625, "global_step": 161261, "epoch": 3839} {"train_loss": -7.015960693359375, "global_step": 161262, "epoch": 3839} {"train_loss": -6.932126522064209, "global_step": 161263, "epoch": 3839} {"train_loss": -6.89473819732666, "global_step": 161264, "epoch": 3839} {"train_loss": -6.988517761230469, "global_step": 161265, "epoch": 3839} {"train_loss": -6.999970436096191, "global_step": 161266, "epoch": 3839} {"train_loss": -6.986429214477539, "global_step": 161267, "epoch": 3839} {"train_loss": -6.959530353546143, "global_step": 161268, "epoch": 3839} {"train_loss": -7.057638168334961, "global_step": 161269, "epoch": 3839} {"train_loss": -6.9341936111450195, "global_step": 161270, "epoch": 3839} {"train_loss": -6.952154636383057, "global_step": 161271, "epoch": 3839} {"train_loss": -7.115536689758301, "global_step": 161272, "epoch": 3839} {"train_loss": -6.838233947753906, "global_step": 161273, "epoch": 3839} {"train_loss": -7.064554691314697, "global_step": 161274, "epoch": 3839} {"train_loss": -7.0491838455200195, "global_step": 161275, "epoch": 3839} {"train_loss": -7.002214431762695, "global_step": 161276, "epoch": 3839} {"train_loss": -7.103744029998779, "global_step": 161277, "epoch": 3839} {"train_loss": -6.962904930114746, "global_step": 161278, "epoch": 3839} {"train_loss": -6.983976216543288, "global_step": 161279, "epoch": 3839, "val_loss": 79482.2421875} {"train_loss": -7.075504302978516, "global_step": 161280, "epoch": 3840} {"train_loss": -7.0260186195373535, "global_step": 161281, "epoch": 3840} {"train_loss": -6.933785438537598, "global_step": 161282, "epoch": 3840} {"train_loss": -7.038772106170654, "global_step": 161283, "epoch": 3840} {"train_loss": -7.105788230895996, "global_step": 161284, "epoch": 3840} {"train_loss": -6.913430213928223, "global_step": 161285, "epoch": 3840} {"train_loss": -7.057199478149414, "global_step": 161286, "epoch": 3840} {"train_loss": -6.990366458892822, "global_step": 161287, "epoch": 3840} {"train_loss": -6.833390235900879, "global_step": 161288, "epoch": 3840} {"train_loss": -6.985784530639648, "global_step": 161289, "epoch": 3840} {"train_loss": -6.910131454467773, "global_step": 161290, "epoch": 3840} {"train_loss": -6.909049987792969, "global_step": 161291, "epoch": 3840} {"train_loss": -6.961180686950684, "global_step": 161292, "epoch": 3840} {"train_loss": -6.906065464019775, "global_step": 161293, "epoch": 3840} {"train_loss": -6.8602399826049805, "global_step": 161294, "epoch": 3840} {"train_loss": -6.9131011962890625, "global_step": 161295, "epoch": 3840} {"train_loss": -7.069007873535156, "global_step": 161296, "epoch": 3840} {"train_loss": -6.983315467834473, "global_step": 161297, "epoch": 3840} {"train_loss": -6.9537153244018555, "global_step": 161298, "epoch": 3840} {"train_loss": -6.978096961975098, "global_step": 161299, "epoch": 3840} {"train_loss": -6.983973979949951, "global_step": 161300, "epoch": 3840} {"train_loss": -6.971169948577881, "global_step": 161301, "epoch": 3840} {"train_loss": -7.065478801727295, "global_step": 161302, "epoch": 3840} {"train_loss": -6.9947943687438965, "global_step": 161303, "epoch": 3840} {"train_loss": -6.948860168457031, "global_step": 161304, "epoch": 3840} {"train_loss": -6.924431324005127, "global_step": 161305, "epoch": 3840} {"train_loss": -6.957729339599609, "global_step": 161306, "epoch": 3840} {"train_loss": -6.957857131958008, "global_step": 161307, "epoch": 3840} {"train_loss": -7.031656265258789, "global_step": 161308, "epoch": 3840} {"train_loss": -7.072834491729736, "global_step": 161309, "epoch": 3840} {"train_loss": -7.049600601196289, "global_step": 161310, "epoch": 3840} {"train_loss": -7.027897834777832, "global_step": 161311, "epoch": 3840} {"train_loss": -7.032963752746582, "global_step": 161312, "epoch": 3840} {"train_loss": -7.077385902404785, "global_step": 161313, "epoch": 3840} {"train_loss": -7.07834005355835, "global_step": 161314, "epoch": 3840} {"train_loss": -6.988726615905762, "global_step": 161315, "epoch": 3840} {"train_loss": -6.924565315246582, "global_step": 161316, "epoch": 3840} {"train_loss": -6.9238200187683105, "global_step": 161317, "epoch": 3840} {"train_loss": -7.049144268035889, "global_step": 161318, "epoch": 3840} {"train_loss": -6.969959259033203, "global_step": 161319, "epoch": 3840} {"train_loss": -6.924437522888184, "global_step": 161320, "epoch": 3840} {"train_loss": -6.986502545220511, "global_step": 161321, "epoch": 3840, "val_loss": 79516.265625} {"train_loss": -7.120804786682129, "global_step": 161322, "epoch": 3841} {"train_loss": -7.054510116577148, "global_step": 161323, "epoch": 3841} {"train_loss": -6.920194149017334, "global_step": 161324, "epoch": 3841} {"train_loss": -7.0282769203186035, "global_step": 161325, "epoch": 3841} {"train_loss": -6.918259620666504, "global_step": 161326, "epoch": 3841} {"train_loss": -7.082253456115723, "global_step": 161327, "epoch": 3841} {"train_loss": -6.9903883934021, "global_step": 161328, "epoch": 3841} {"train_loss": -7.061516284942627, "global_step": 161329, "epoch": 3841} {"train_loss": -7.159414291381836, "global_step": 161330, "epoch": 3841} {"train_loss": -6.963232040405273, "global_step": 161331, "epoch": 3841} {"train_loss": -7.04378604888916, "global_step": 161332, "epoch": 3841} {"train_loss": -6.946643352508545, "global_step": 161333, "epoch": 3841} {"train_loss": -7.028797149658203, "global_step": 161334, "epoch": 3841} {"train_loss": -6.977730751037598, "global_step": 161335, "epoch": 3841} {"train_loss": -7.047139644622803, "global_step": 161336, "epoch": 3841} {"train_loss": -6.9835405349731445, "global_step": 161337, "epoch": 3841} {"train_loss": -7.004841327667236, "global_step": 161338, "epoch": 3841} {"train_loss": -6.999980449676514, "global_step": 161339, "epoch": 3841} {"train_loss": -6.9488067626953125, "global_step": 161340, "epoch": 3841} {"train_loss": -7.013338088989258, "global_step": 161341, "epoch": 3841} {"train_loss": -7.018095016479492, "global_step": 161342, "epoch": 3841} {"train_loss": -7.072536468505859, "global_step": 161343, "epoch": 3841} {"train_loss": -6.884686470031738, "global_step": 161344, "epoch": 3841} {"train_loss": -7.018151760101318, "global_step": 161345, "epoch": 3841} {"train_loss": -6.956331253051758, "global_step": 161346, "epoch": 3841} {"train_loss": -6.956433296203613, "global_step": 161347, "epoch": 3841} {"train_loss": -6.992897033691406, "global_step": 161348, "epoch": 3841} {"train_loss": -7.0313873291015625, "global_step": 161349, "epoch": 3841} {"train_loss": -7.132822513580322, "global_step": 161350, "epoch": 3841} {"train_loss": -7.047414779663086, "global_step": 161351, "epoch": 3841} {"train_loss": -7.007968425750732, "global_step": 161352, "epoch": 3841} {"train_loss": -6.954972267150879, "global_step": 161353, "epoch": 3841} {"train_loss": -6.963726997375488, "global_step": 161354, "epoch": 3841} {"train_loss": -6.956896781921387, "global_step": 161355, "epoch": 3841} {"train_loss": -6.95963716506958, "global_step": 161356, "epoch": 3841} {"train_loss": -7.038222789764404, "global_step": 161357, "epoch": 3841} {"train_loss": -7.0088090896606445, "global_step": 161358, "epoch": 3841} {"train_loss": -6.987539291381836, "global_step": 161359, "epoch": 3841} {"train_loss": -6.943480491638184, "global_step": 161360, "epoch": 3841} {"train_loss": -7.022865295410156, "global_step": 161361, "epoch": 3841} {"train_loss": -6.931692123413086, "global_step": 161362, "epoch": 3841} {"train_loss": -7.000641130265736, "global_step": 161363, "epoch": 3841, "val_loss": 79484.2109375} {"train_loss": -7.024561882019043, "global_step": 161364, "epoch": 3842} {"train_loss": -6.973077774047852, "global_step": 161365, "epoch": 3842} {"train_loss": -6.985579013824463, "global_step": 161366, "epoch": 3842} {"train_loss": -7.042437553405762, "global_step": 161367, "epoch": 3842} {"train_loss": -6.899796962738037, "global_step": 161368, "epoch": 3842} {"train_loss": -7.05596399307251, "global_step": 161369, "epoch": 3842} {"train_loss": -7.012592792510986, "global_step": 161370, "epoch": 3842} {"train_loss": -6.811654090881348, "global_step": 161371, "epoch": 3842} {"train_loss": -6.837193489074707, "global_step": 161372, "epoch": 3842} {"train_loss": -6.923057556152344, "global_step": 161373, "epoch": 3842} {"train_loss": -6.788001537322998, "global_step": 161374, "epoch": 3842} {"train_loss": -6.981435775756836, "global_step": 161375, "epoch": 3842} {"train_loss": -6.915143966674805, "global_step": 161376, "epoch": 3842} {"train_loss": -6.988466262817383, "global_step": 161377, "epoch": 3842} {"train_loss": -6.93546199798584, "global_step": 161378, "epoch": 3842} {"train_loss": -6.882966041564941, "global_step": 161379, "epoch": 3842} {"train_loss": -6.914872169494629, "global_step": 161380, "epoch": 3842} {"train_loss": -6.879909992218018, "global_step": 161381, "epoch": 3842} {"train_loss": -6.8606462478637695, "global_step": 161382, "epoch": 3842} {"train_loss": -6.899542808532715, "global_step": 161383, "epoch": 3842} {"train_loss": -6.893474578857422, "global_step": 161384, "epoch": 3842} {"train_loss": -6.78898811340332, "global_step": 161385, "epoch": 3842} {"train_loss": -6.803439140319824, "global_step": 161386, "epoch": 3842} {"train_loss": -6.810555458068848, "global_step": 161387, "epoch": 3842} {"train_loss": -6.812719821929932, "global_step": 161388, "epoch": 3842} {"train_loss": -6.8387651443481445, "global_step": 161389, "epoch": 3842} {"train_loss": -6.969779014587402, "global_step": 161390, "epoch": 3842} {"train_loss": -6.768951416015625, "global_step": 161391, "epoch": 3842} {"train_loss": -6.993582725524902, "global_step": 161392, "epoch": 3842} {"train_loss": -6.833490371704102, "global_step": 161393, "epoch": 3842} {"train_loss": -6.962780952453613, "global_step": 161394, "epoch": 3842} {"train_loss": -6.893184661865234, "global_step": 161395, "epoch": 3842} {"train_loss": -6.942539691925049, "global_step": 161396, "epoch": 3842} {"train_loss": -6.884173393249512, "global_step": 161397, "epoch": 3842} {"train_loss": -6.959830284118652, "global_step": 161398, "epoch": 3842} {"train_loss": -6.92343282699585, "global_step": 161399, "epoch": 3842} {"train_loss": -6.974177360534668, "global_step": 161400, "epoch": 3842} {"train_loss": -6.982318878173828, "global_step": 161401, "epoch": 3842} {"train_loss": -6.859750747680664, "global_step": 161402, "epoch": 3842} {"train_loss": -6.923272132873535, "global_step": 161403, "epoch": 3842} {"train_loss": -7.055132865905762, "global_step": 161404, "epoch": 3842} {"train_loss": -6.911324444271269, "global_step": 161405, "epoch": 3842, "val_loss": 79142.8359375} {"train_loss": -6.884909629821777, "global_step": 161406, "epoch": 3843} {"train_loss": -7.068310737609863, "global_step": 161407, "epoch": 3843} {"train_loss": -6.876962661743164, "global_step": 161408, "epoch": 3843} {"train_loss": -6.988383769989014, "global_step": 161409, "epoch": 3843} {"train_loss": -6.928154945373535, "global_step": 161410, "epoch": 3843} {"train_loss": -6.937841892242432, "global_step": 161411, "epoch": 3843} {"train_loss": -6.848200798034668, "global_step": 161412, "epoch": 3843} {"train_loss": -6.998239040374756, "global_step": 161413, "epoch": 3843} {"train_loss": -6.884801864624023, "global_step": 161414, "epoch": 3843} {"train_loss": -6.811785697937012, "global_step": 161415, "epoch": 3843} {"train_loss": -6.936031818389893, "global_step": 161416, "epoch": 3843} {"train_loss": -6.849625587463379, "global_step": 161417, "epoch": 3843} {"train_loss": -6.907609462738037, "global_step": 161418, "epoch": 3843} {"train_loss": -6.929400444030762, "global_step": 161419, "epoch": 3843} {"train_loss": -6.9321393966674805, "global_step": 161420, "epoch": 3843} {"train_loss": -6.84169864654541, "global_step": 161421, "epoch": 3843} {"train_loss": -6.846470355987549, "global_step": 161422, "epoch": 3843} {"train_loss": -6.968581199645996, "global_step": 161423, "epoch": 3843} {"train_loss": -6.871770858764648, "global_step": 161424, "epoch": 3843} {"train_loss": -6.910712242126465, "global_step": 161425, "epoch": 3843} {"train_loss": -6.923740386962891, "global_step": 161426, "epoch": 3843} {"train_loss": -6.992362976074219, "global_step": 161427, "epoch": 3843} {"train_loss": -7.016997337341309, "global_step": 161428, "epoch": 3843} {"train_loss": -6.956876277923584, "global_step": 161429, "epoch": 3843} {"train_loss": -7.000115394592285, "global_step": 161430, "epoch": 3843} {"train_loss": -6.947029113769531, "global_step": 161431, "epoch": 3843} {"train_loss": -6.963521957397461, "global_step": 161432, "epoch": 3843} {"train_loss": -7.057635307312012, "global_step": 161433, "epoch": 3843} {"train_loss": -7.0866312980651855, "global_step": 161434, "epoch": 3843} {"train_loss": -6.964349746704102, "global_step": 161435, "epoch": 3843} {"train_loss": -6.981703758239746, "global_step": 161436, "epoch": 3843} {"train_loss": -6.947241306304932, "global_step": 161437, "epoch": 3843} {"train_loss": -7.028700351715088, "global_step": 161438, "epoch": 3843} {"train_loss": -6.886433124542236, "global_step": 161439, "epoch": 3843} {"train_loss": -7.015903472900391, "global_step": 161440, "epoch": 3843} {"train_loss": -7.044920921325684, "global_step": 161441, "epoch": 3843} {"train_loss": -6.917159080505371, "global_step": 161442, "epoch": 3843} {"train_loss": -7.068924903869629, "global_step": 161443, "epoch": 3843} {"train_loss": -6.964228630065918, "global_step": 161444, "epoch": 3843} {"train_loss": -6.96146297454834, "global_step": 161445, "epoch": 3843} {"train_loss": -7.057945251464844, "global_step": 161446, "epoch": 3843} {"train_loss": -6.952084484554472, "global_step": 161447, "epoch": 3843, "val_loss": 79296.3671875} {"train_loss": -6.950284957885742, "global_step": 161448, "epoch": 3844} {"train_loss": -7.123458385467529, "global_step": 161449, "epoch": 3844} {"train_loss": -6.957538604736328, "global_step": 161450, "epoch": 3844} {"train_loss": -6.969326972961426, "global_step": 161451, "epoch": 3844} {"train_loss": -6.922222137451172, "global_step": 161452, "epoch": 3844} {"train_loss": -6.989933013916016, "global_step": 161453, "epoch": 3844} {"train_loss": -7.041140556335449, "global_step": 161454, "epoch": 3844} {"train_loss": -6.8693695068359375, "global_step": 161455, "epoch": 3844} {"train_loss": -6.996726036071777, "global_step": 161456, "epoch": 3844} {"train_loss": -7.013226509094238, "global_step": 161457, "epoch": 3844} {"train_loss": -6.9326348304748535, "global_step": 161458, "epoch": 3844} {"train_loss": -7.088868141174316, "global_step": 161459, "epoch": 3844} {"train_loss": -7.054244041442871, "global_step": 161460, "epoch": 3844} {"train_loss": -6.906994342803955, "global_step": 161461, "epoch": 3844} {"train_loss": -7.040480613708496, "global_step": 161462, "epoch": 3844} {"train_loss": -6.990723609924316, "global_step": 161463, "epoch": 3844} {"train_loss": -6.9484639167785645, "global_step": 161464, "epoch": 3844} {"train_loss": -6.779996871948242, "global_step": 161465, "epoch": 3844} {"train_loss": -6.978247165679932, "global_step": 161466, "epoch": 3844} {"train_loss": -6.896222114562988, "global_step": 161467, "epoch": 3844} {"train_loss": -6.962242126464844, "global_step": 161468, "epoch": 3844} {"train_loss": -7.019975662231445, "global_step": 161469, "epoch": 3844} {"train_loss": -6.97369909286499, "global_step": 161470, "epoch": 3844} {"train_loss": -7.000885963439941, "global_step": 161471, "epoch": 3844} {"train_loss": -6.8905181884765625, "global_step": 161472, "epoch": 3844} {"train_loss": -7.06734037399292, "global_step": 161473, "epoch": 3844} {"train_loss": -6.890902519226074, "global_step": 161474, "epoch": 3844} {"train_loss": -7.000002861022949, "global_step": 161475, "epoch": 3844} {"train_loss": -6.895461082458496, "global_step": 161476, "epoch": 3844} {"train_loss": -7.00372314453125, "global_step": 161477, "epoch": 3844} {"train_loss": -6.977339744567871, "global_step": 161478, "epoch": 3844} {"train_loss": -6.864831924438477, "global_step": 161479, "epoch": 3844} {"train_loss": -6.7916436195373535, "global_step": 161480, "epoch": 3844} {"train_loss": -6.852395057678223, "global_step": 161481, "epoch": 3844} {"train_loss": -6.886729717254639, "global_step": 161482, "epoch": 3844} {"train_loss": -7.05847692489624, "global_step": 161483, "epoch": 3844} {"train_loss": -6.8724684715271, "global_step": 161484, "epoch": 3844} {"train_loss": -7.042774200439453, "global_step": 161485, "epoch": 3844} {"train_loss": -7.040290832519531, "global_step": 161486, "epoch": 3844} {"train_loss": -6.985921859741211, "global_step": 161487, "epoch": 3844} {"train_loss": -6.9363250732421875, "global_step": 161488, "epoch": 3844} {"train_loss": -6.963186309451149, "global_step": 161489, "epoch": 3844, "val_loss": 79268.8671875} {"train_loss": -7.103425025939941, "global_step": 161490, "epoch": 3845} {"train_loss": -6.974490165710449, "global_step": 161491, "epoch": 3845} {"train_loss": -7.049614906311035, "global_step": 161492, "epoch": 3845} {"train_loss": -6.938629150390625, "global_step": 161493, "epoch": 3845} {"train_loss": -7.025691032409668, "global_step": 161494, "epoch": 3845} {"train_loss": -7.058350563049316, "global_step": 161495, "epoch": 3845} {"train_loss": -7.052153587341309, "global_step": 161496, "epoch": 3845} {"train_loss": -7.0651960372924805, "global_step": 161497, "epoch": 3845} {"train_loss": -7.046436786651611, "global_step": 161498, "epoch": 3845} {"train_loss": -7.005084991455078, "global_step": 161499, "epoch": 3845} {"train_loss": -6.967514991760254, "global_step": 161500, "epoch": 3845} {"train_loss": -7.023697376251221, "global_step": 161501, "epoch": 3845} {"train_loss": -6.9611406326293945, "global_step": 161502, "epoch": 3845} {"train_loss": -7.005418300628662, "global_step": 161503, "epoch": 3845} {"train_loss": -6.919623374938965, "global_step": 161504, "epoch": 3845} {"train_loss": -6.8717522621154785, "global_step": 161505, "epoch": 3845} {"train_loss": -7.028535842895508, "global_step": 161506, "epoch": 3845} {"train_loss": -6.972116947174072, "global_step": 161507, "epoch": 3845} {"train_loss": -7.121366500854492, "global_step": 161508, "epoch": 3845} {"train_loss": -7.001121997833252, "global_step": 161509, "epoch": 3845} {"train_loss": -6.8951921463012695, "global_step": 161510, "epoch": 3845} {"train_loss": -7.007139682769775, "global_step": 161511, "epoch": 3845} {"train_loss": -6.986769676208496, "global_step": 161512, "epoch": 3845} {"train_loss": -6.8835930824279785, "global_step": 161513, "epoch": 3845} {"train_loss": -7.082766056060791, "global_step": 161514, "epoch": 3845} {"train_loss": -6.952986717224121, "global_step": 161515, "epoch": 3845} {"train_loss": -6.97801399230957, "global_step": 161516, "epoch": 3845} {"train_loss": -7.031408309936523, "global_step": 161517, "epoch": 3845} {"train_loss": -6.955312728881836, "global_step": 161518, "epoch": 3845} {"train_loss": -6.893222808837891, "global_step": 161519, "epoch": 3845} {"train_loss": -6.948558807373047, "global_step": 161520, "epoch": 3845} {"train_loss": -6.933667182922363, "global_step": 161521, "epoch": 3845} {"train_loss": -6.8952836990356445, "global_step": 161522, "epoch": 3845} {"train_loss": -7.063446044921875, "global_step": 161523, "epoch": 3845} {"train_loss": -6.937641620635986, "global_step": 161524, "epoch": 3845} {"train_loss": -6.9533233642578125, "global_step": 161525, "epoch": 3845} {"train_loss": -6.908375263214111, "global_step": 161526, "epoch": 3845} {"train_loss": -6.9456562995910645, "global_step": 161527, "epoch": 3845} {"train_loss": -6.84649658203125, "global_step": 161528, "epoch": 3845} {"train_loss": -6.842907905578613, "global_step": 161529, "epoch": 3845} {"train_loss": -7.065112590789795, "global_step": 161530, "epoch": 3845} {"train_loss": -6.976433765320551, "global_step": 161531, "epoch": 3845, "val_loss": 79400.4140625} {"train_loss": -6.951162815093994, "global_step": 161532, "epoch": 3846} {"train_loss": -7.06065559387207, "global_step": 161533, "epoch": 3846} {"train_loss": -6.857501029968262, "global_step": 161534, "epoch": 3846} {"train_loss": -6.916099548339844, "global_step": 161535, "epoch": 3846} {"train_loss": -6.8488969802856445, "global_step": 161536, "epoch": 3846} {"train_loss": -6.952795028686523, "global_step": 161537, "epoch": 3846} {"train_loss": -6.860018253326416, "global_step": 161538, "epoch": 3846} {"train_loss": -7.0179595947265625, "global_step": 161539, "epoch": 3846} {"train_loss": -6.879584312438965, "global_step": 161540, "epoch": 3846} {"train_loss": -6.968099594116211, "global_step": 161541, "epoch": 3846} {"train_loss": -6.998145580291748, "global_step": 161542, "epoch": 3846} {"train_loss": -7.050355911254883, "global_step": 161543, "epoch": 3846} {"train_loss": -6.911218643188477, "global_step": 161544, "epoch": 3846} {"train_loss": -6.888147354125977, "global_step": 161545, "epoch": 3846} {"train_loss": -6.960461616516113, "global_step": 161546, "epoch": 3846} {"train_loss": -6.87607479095459, "global_step": 161547, "epoch": 3846} {"train_loss": -7.03790283203125, "global_step": 161548, "epoch": 3846} {"train_loss": -7.104833602905273, "global_step": 161549, "epoch": 3846} {"train_loss": -7.09638786315918, "global_step": 161550, "epoch": 3846} {"train_loss": -6.914495468139648, "global_step": 161551, "epoch": 3846} {"train_loss": -6.945137977600098, "global_step": 161552, "epoch": 3846} {"train_loss": -6.9639201164245605, "global_step": 161553, "epoch": 3846} {"train_loss": -6.9474406242370605, "global_step": 161554, "epoch": 3846} {"train_loss": -6.8614182472229, "global_step": 161555, "epoch": 3846} {"train_loss": -6.861690998077393, "global_step": 161556, "epoch": 3846} {"train_loss": -6.975108623504639, "global_step": 161557, "epoch": 3846} {"train_loss": -6.999091625213623, "global_step": 161558, "epoch": 3846} {"train_loss": -6.984308242797852, "global_step": 161559, "epoch": 3846} {"train_loss": -7.017556190490723, "global_step": 161560, "epoch": 3846} {"train_loss": -7.006865978240967, "global_step": 161561, "epoch": 3846} {"train_loss": -6.969771862030029, "global_step": 161562, "epoch": 3846} {"train_loss": -7.0645976066589355, "global_step": 161563, "epoch": 3846} {"train_loss": -6.993027687072754, "global_step": 161564, "epoch": 3846} {"train_loss": -6.969204902648926, "global_step": 161565, "epoch": 3846} {"train_loss": -6.979849815368652, "global_step": 161566, "epoch": 3846} {"train_loss": -7.100888252258301, "global_step": 161567, "epoch": 3846} {"train_loss": -7.000155448913574, "global_step": 161568, "epoch": 3846} {"train_loss": -7.068996906280518, "global_step": 161569, "epoch": 3846} {"train_loss": -7.010563373565674, "global_step": 161570, "epoch": 3846} {"train_loss": -7.070751667022705, "global_step": 161571, "epoch": 3846} {"train_loss": -7.021663188934326, "global_step": 161572, "epoch": 3846} {"train_loss": -6.975725616727557, "global_step": 161573, "epoch": 3846, "val_loss": 79330.2578125} {"train_loss": -6.932053565979004, "global_step": 161574, "epoch": 3847} {"train_loss": -6.976126194000244, "global_step": 161575, "epoch": 3847} {"train_loss": -7.082719802856445, "global_step": 161576, "epoch": 3847} {"train_loss": -7.064621448516846, "global_step": 161577, "epoch": 3847} {"train_loss": -6.923583030700684, "global_step": 161578, "epoch": 3847} {"train_loss": -6.980181694030762, "global_step": 161579, "epoch": 3847} {"train_loss": -7.0726799964904785, "global_step": 161580, "epoch": 3847} {"train_loss": -7.030167579650879, "global_step": 161581, "epoch": 3847} {"train_loss": -6.9143476486206055, "global_step": 161582, "epoch": 3847} {"train_loss": -6.963566780090332, "global_step": 161583, "epoch": 3847} {"train_loss": -7.057065010070801, "global_step": 161584, "epoch": 3847} {"train_loss": -6.962320804595947, "global_step": 161585, "epoch": 3847} {"train_loss": -7.096433639526367, "global_step": 161586, "epoch": 3847} {"train_loss": -7.074957847595215, "global_step": 161587, "epoch": 3847} {"train_loss": -6.914254188537598, "global_step": 161588, "epoch": 3847} {"train_loss": -7.044284820556641, "global_step": 161589, "epoch": 3847} {"train_loss": -6.970273494720459, "global_step": 161590, "epoch": 3847} {"train_loss": -6.972179412841797, "global_step": 161591, "epoch": 3847} {"train_loss": -7.070643424987793, "global_step": 161592, "epoch": 3847} {"train_loss": -6.992702007293701, "global_step": 161593, "epoch": 3847} {"train_loss": -7.010311126708984, "global_step": 161594, "epoch": 3847} {"train_loss": -7.050829887390137, "global_step": 161595, "epoch": 3847} {"train_loss": -6.925488471984863, "global_step": 161596, "epoch": 3847} {"train_loss": -6.953745365142822, "global_step": 161597, "epoch": 3847} {"train_loss": -7.019474029541016, "global_step": 161598, "epoch": 3847} {"train_loss": -7.071577072143555, "global_step": 161599, "epoch": 3847} {"train_loss": -6.954682350158691, "global_step": 161600, "epoch": 3847} {"train_loss": -6.972299575805664, "global_step": 161601, "epoch": 3847} {"train_loss": -7.177835464477539, "global_step": 161602, "epoch": 3847} {"train_loss": -6.84147310256958, "global_step": 161603, "epoch": 3847} {"train_loss": -6.949005126953125, "global_step": 161604, "epoch": 3847} {"train_loss": -6.861723899841309, "global_step": 161605, "epoch": 3847} {"train_loss": -6.937786102294922, "global_step": 161606, "epoch": 3847} {"train_loss": -6.94409704208374, "global_step": 161607, "epoch": 3847} {"train_loss": -6.9544243812561035, "global_step": 161608, "epoch": 3847} {"train_loss": -6.8539533615112305, "global_step": 161609, "epoch": 3847} {"train_loss": -6.8826398849487305, "global_step": 161610, "epoch": 3847} {"train_loss": -6.9652323722839355, "global_step": 161611, "epoch": 3847} {"train_loss": -6.867077350616455, "global_step": 161612, "epoch": 3847} {"train_loss": -6.901004314422607, "global_step": 161613, "epoch": 3847} {"train_loss": -6.915279388427734, "global_step": 161614, "epoch": 3847} {"train_loss": -6.977068605877104, "global_step": 161615, "epoch": 3847, "val_loss": 79478.5078125} {"train_loss": -6.984118938446045, "global_step": 161616, "epoch": 3848} {"train_loss": -6.9683837890625, "global_step": 161617, "epoch": 3848} {"train_loss": -6.941332817077637, "global_step": 161618, "epoch": 3848} {"train_loss": -7.045586109161377, "global_step": 161619, "epoch": 3848} {"train_loss": -7.016587257385254, "global_step": 161620, "epoch": 3848} {"train_loss": -6.88987398147583, "global_step": 161621, "epoch": 3848} {"train_loss": -6.990547180175781, "global_step": 161622, "epoch": 3848} {"train_loss": -6.941736221313477, "global_step": 161623, "epoch": 3848} {"train_loss": -6.914060592651367, "global_step": 161624, "epoch": 3848} {"train_loss": -6.865151405334473, "global_step": 161625, "epoch": 3848} {"train_loss": -6.973779678344727, "global_step": 161626, "epoch": 3848} {"train_loss": -6.87052059173584, "global_step": 161627, "epoch": 3848} {"train_loss": -6.884946823120117, "global_step": 161628, "epoch": 3848} {"train_loss": -6.989436626434326, "global_step": 161629, "epoch": 3848} {"train_loss": -6.974372863769531, "global_step": 161630, "epoch": 3848} {"train_loss": -6.935247898101807, "global_step": 161631, "epoch": 3848} {"train_loss": -6.838408470153809, "global_step": 161632, "epoch": 3848} {"train_loss": -6.883883476257324, "global_step": 161633, "epoch": 3848} {"train_loss": -6.918644905090332, "global_step": 161634, "epoch": 3848} {"train_loss": -6.836568355560303, "global_step": 161635, "epoch": 3848} {"train_loss": -6.964815139770508, "global_step": 161636, "epoch": 3848} {"train_loss": -6.874261856079102, "global_step": 161637, "epoch": 3848} {"train_loss": -6.954277038574219, "global_step": 161638, "epoch": 3848} {"train_loss": -6.990677833557129, "global_step": 161639, "epoch": 3848} {"train_loss": -6.9129638671875, "global_step": 161640, "epoch": 3848} {"train_loss": -6.871547222137451, "global_step": 161641, "epoch": 3848} {"train_loss": -6.889504909515381, "global_step": 161642, "epoch": 3848} {"train_loss": -6.812137603759766, "global_step": 161643, "epoch": 3848} {"train_loss": -6.90609884262085, "global_step": 161644, "epoch": 3848} {"train_loss": -6.819318771362305, "global_step": 161645, "epoch": 3848} {"train_loss": -6.930002212524414, "global_step": 161646, "epoch": 3848} {"train_loss": -6.881521224975586, "global_step": 161647, "epoch": 3848} {"train_loss": -6.877327919006348, "global_step": 161648, "epoch": 3848} {"train_loss": -6.880636215209961, "global_step": 161649, "epoch": 3848} {"train_loss": -6.858391761779785, "global_step": 161650, "epoch": 3848} {"train_loss": -6.892910480499268, "global_step": 161651, "epoch": 3848} {"train_loss": -6.793793678283691, "global_step": 161652, "epoch": 3848} {"train_loss": -6.927189826965332, "global_step": 161653, "epoch": 3848} {"train_loss": -6.769033432006836, "global_step": 161654, "epoch": 3848} {"train_loss": -6.948920249938965, "global_step": 161655, "epoch": 3848} {"train_loss": -6.746923923492432, "global_step": 161656, "epoch": 3848} {"train_loss": -6.9079232556479315, "global_step": 161657, "epoch": 3848, "val_loss": 79220.59375} {"train_loss": -6.930785179138184, "global_step": 161658, "epoch": 3849} {"train_loss": -6.8355607986450195, "global_step": 161659, "epoch": 3849} {"train_loss": -7.050279140472412, "global_step": 161660, "epoch": 3849} {"train_loss": -6.928852081298828, "global_step": 161661, "epoch": 3849} {"train_loss": -6.908450603485107, "global_step": 161662, "epoch": 3849} {"train_loss": -7.010193824768066, "global_step": 161663, "epoch": 3849} {"train_loss": -6.975743770599365, "global_step": 161664, "epoch": 3849} {"train_loss": -7.004840850830078, "global_step": 161665, "epoch": 3849} {"train_loss": -6.854639053344727, "global_step": 161666, "epoch": 3849} {"train_loss": -6.981453895568848, "global_step": 161667, "epoch": 3849} {"train_loss": -6.942444324493408, "global_step": 161668, "epoch": 3849} {"train_loss": -7.02885627746582, "global_step": 161669, "epoch": 3849} {"train_loss": -6.845511436462402, "global_step": 161670, "epoch": 3849} {"train_loss": -6.942683219909668, "global_step": 161671, "epoch": 3849} {"train_loss": -6.896465301513672, "global_step": 161672, "epoch": 3849} {"train_loss": -6.904413223266602, "global_step": 161673, "epoch": 3849} {"train_loss": -6.815489768981934, "global_step": 161674, "epoch": 3849} {"train_loss": -6.900698661804199, "global_step": 161675, "epoch": 3849} {"train_loss": -6.954611778259277, "global_step": 161676, "epoch": 3849} {"train_loss": -6.937379837036133, "global_step": 161677, "epoch": 3849} {"train_loss": -6.8547139167785645, "global_step": 161678, "epoch": 3849} {"train_loss": -6.9162116050720215, "global_step": 161679, "epoch": 3849} {"train_loss": -6.853060245513916, "global_step": 161680, "epoch": 3849} {"train_loss": -6.96970272064209, "global_step": 161681, "epoch": 3849} {"train_loss": -7.018118858337402, "global_step": 161682, "epoch": 3849} {"train_loss": -6.836639404296875, "global_step": 161683, "epoch": 3849} {"train_loss": -6.910081386566162, "global_step": 161684, "epoch": 3849} {"train_loss": -6.953056335449219, "global_step": 161685, "epoch": 3849} {"train_loss": -6.980922222137451, "global_step": 161686, "epoch": 3849} {"train_loss": -7.06109094619751, "global_step": 161687, "epoch": 3849} {"train_loss": -6.9027581214904785, "global_step": 161688, "epoch": 3849} {"train_loss": -6.854941368103027, "global_step": 161689, "epoch": 3849} {"train_loss": -6.965201377868652, "global_step": 161690, "epoch": 3849} {"train_loss": -6.8996429443359375, "global_step": 161691, "epoch": 3849} {"train_loss": -6.957989692687988, "global_step": 161692, "epoch": 3849} {"train_loss": -6.929214954376221, "global_step": 161693, "epoch": 3849} {"train_loss": -6.930488586425781, "global_step": 161694, "epoch": 3849} {"train_loss": -6.925619125366211, "global_step": 161695, "epoch": 3849} {"train_loss": -6.9645609855651855, "global_step": 161696, "epoch": 3849} {"train_loss": -6.961703300476074, "global_step": 161697, "epoch": 3849} {"train_loss": -6.9973649978637695, "global_step": 161698, "epoch": 3849} {"train_loss": -6.933511892954509, "global_step": 161699, "epoch": 3849, "val_loss": 79252.1875} {"train_loss": -7.020184516906738, "global_step": 161700, "epoch": 3850} {"train_loss": -6.954482078552246, "global_step": 161701, "epoch": 3850} {"train_loss": -6.93123197555542, "global_step": 161702, "epoch": 3850} {"train_loss": -7.037631988525391, "global_step": 161703, "epoch": 3850} {"train_loss": -6.936642646789551, "global_step": 161704, "epoch": 3850} {"train_loss": -6.884747505187988, "global_step": 161705, "epoch": 3850} {"train_loss": -6.855955123901367, "global_step": 161706, "epoch": 3850} {"train_loss": -7.00827693939209, "global_step": 161707, "epoch": 3850} {"train_loss": -6.971037864685059, "global_step": 161708, "epoch": 3850} {"train_loss": -6.969288349151611, "global_step": 161709, "epoch": 3850} {"train_loss": -6.932671546936035, "global_step": 161710, "epoch": 3850} {"train_loss": -7.051924705505371, "global_step": 161711, "epoch": 3850} {"train_loss": -6.972304344177246, "global_step": 161712, "epoch": 3850} {"train_loss": -7.0398030281066895, "global_step": 161713, "epoch": 3850} {"train_loss": -6.934503555297852, "global_step": 161714, "epoch": 3850} {"train_loss": -6.946094989776611, "global_step": 161715, "epoch": 3850} {"train_loss": -7.0068464279174805, "global_step": 161716, "epoch": 3850} {"train_loss": -6.906933784484863, "global_step": 161717, "epoch": 3850} {"train_loss": -7.058249473571777, "global_step": 161718, "epoch": 3850} {"train_loss": -7.0003461837768555, "global_step": 161719, "epoch": 3850} {"train_loss": -6.921426773071289, "global_step": 161720, "epoch": 3850} {"train_loss": -6.974240303039551, "global_step": 161721, "epoch": 3850} {"train_loss": -7.038849353790283, "global_step": 161722, "epoch": 3850} {"train_loss": -6.909597396850586, "global_step": 161723, "epoch": 3850} {"train_loss": -6.988802909851074, "global_step": 161724, "epoch": 3850} {"train_loss": -6.894987106323242, "global_step": 161725, "epoch": 3850} {"train_loss": -6.8549604415893555, "global_step": 161726, "epoch": 3850} {"train_loss": -6.943414211273193, "global_step": 161727, "epoch": 3850} {"train_loss": -6.958559036254883, "global_step": 161728, "epoch": 3850} {"train_loss": -6.859428882598877, "global_step": 161729, "epoch": 3850} {"train_loss": -6.910571575164795, "global_step": 161730, "epoch": 3850} {"train_loss": -6.907994747161865, "global_step": 161731, "epoch": 3850} {"train_loss": -6.84014892578125, "global_step": 161732, "epoch": 3850} {"train_loss": -6.920090198516846, "global_step": 161733, "epoch": 3850} {"train_loss": -6.880617141723633, "global_step": 161734, "epoch": 3850} {"train_loss": -6.9370317459106445, "global_step": 161735, "epoch": 3850} {"train_loss": -6.959095001220703, "global_step": 161736, "epoch": 3850} {"train_loss": -7.023405075073242, "global_step": 161737, "epoch": 3850} {"train_loss": -6.9891157150268555, "global_step": 161738, "epoch": 3850} {"train_loss": -7.097865104675293, "global_step": 161739, "epoch": 3850} {"train_loss": -7.012309551239014, "global_step": 161740, "epoch": 3850} {"train_loss": -6.95489562125433, "global_step": 161741, "epoch": 3850, "train/sim_max_reward_0": 0.4078970218477655, "train/sim_max_reward_1": 0.9699221473043624, "train/sim_max_reward_2": 0.5384050295007899, "train/sim_max_reward_3": 0.15361547105939824, "train/sim_max_reward_4": 0.3184619969574493, "train/sim_max_reward_5": 0.5792720327455746, "test/sim_max_reward_4500000": 0.9819407992550673, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9460281475638386, "test/sim_max_reward_4500004": 0.1468642756712525, "test/sim_max_reward_4500005": 0.9541129925792373, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 0.8999191892348654, "test/sim_max_reward_4500008": 0.0008846114692284502, "test/sim_max_reward_4500009": 0.053444552973318696, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.8558018079969015, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.0009390847302207314, "test/sim_max_reward_4500014": 0.7885050041439333, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.10162635425711616, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.967958283338903, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9779604055688802, "test/sim_max_reward_4500022": 0.9362448109927747, "test/sim_max_reward_4500023": 0.8984013984253917, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8691530484585128, "test/sim_max_reward_4500026": 0.9164959698020511, "test/sim_max_reward_4500027": 0.9809680101481019, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.07780876403964575, "test/sim_max_reward_4500030": 0.8145160716879339, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.9839038129799934, "test/sim_max_reward_4500035": 0.8932023158299427, "test/sim_max_reward_4500036": 0.997067883087418, "test/sim_max_reward_4500037": 0.914569955456481, "test/sim_max_reward_4500038": 0.7391708149064203, "test/sim_max_reward_4500039": 0.9088567896746993, "test/sim_max_reward_4500040": 0.995979495927247, "test/sim_max_reward_4500041": 0.9905195366104049, "test/sim_max_reward_4500042": 0.03642962924406983, "test/sim_max_reward_4500043": 0.22388041115639234, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.4203964527739667, "test/sim_max_reward_4500046": 0.9659495852225635, "test/sim_max_reward_4500047": 0.9636839025903176, "test/sim_max_reward_4500048": 0.9803610938886144, "test/sim_max_reward_4500049": 1.0, "train/mean_score": 0.49459561656922335, "test/mean_score": 0.6087179899130476, "val_loss": 79438.6796875} {"train_loss": -6.985535621643066, "global_step": 161742, "epoch": 3851} {"train_loss": -6.876002311706543, "global_step": 161743, "epoch": 3851} {"train_loss": -7.024334907531738, "global_step": 161744, "epoch": 3851} {"train_loss": -6.995610237121582, "global_step": 161745, "epoch": 3851} {"train_loss": -6.843231201171875, "global_step": 161746, "epoch": 3851} {"train_loss": -7.068036079406738, "global_step": 161747, "epoch": 3851} {"train_loss": -6.885066032409668, "global_step": 161748, "epoch": 3851} {"train_loss": -6.923266887664795, "global_step": 161749, "epoch": 3851} {"train_loss": -6.905256271362305, "global_step": 161750, "epoch": 3851} {"train_loss": -6.901423931121826, "global_step": 161751, "epoch": 3851} {"train_loss": -6.879188537597656, "global_step": 161752, "epoch": 3851} {"train_loss": -6.926087856292725, "global_step": 161753, "epoch": 3851} {"train_loss": -6.85922908782959, "global_step": 161754, "epoch": 3851} {"train_loss": -7.024228572845459, "global_step": 161755, "epoch": 3851} {"train_loss": -6.971463203430176, "global_step": 161756, "epoch": 3851} {"train_loss": -6.855533599853516, "global_step": 161757, "epoch": 3851} {"train_loss": -6.8270978927612305, "global_step": 161758, "epoch": 3851} {"train_loss": -6.856279373168945, "global_step": 161759, "epoch": 3851} {"train_loss": -6.867071151733398, "global_step": 161760, "epoch": 3851} {"train_loss": -6.98811149597168, "global_step": 161761, "epoch": 3851} {"train_loss": -6.822100639343262, "global_step": 161762, "epoch": 3851} {"train_loss": -6.911808490753174, "global_step": 161763, "epoch": 3851} {"train_loss": -6.948837757110596, "global_step": 161764, "epoch": 3851} {"train_loss": -6.769071578979492, "global_step": 161765, "epoch": 3851} {"train_loss": -6.8940205574035645, "global_step": 161766, "epoch": 3851} {"train_loss": -6.869584560394287, "global_step": 161767, "epoch": 3851} {"train_loss": -6.824217319488525, "global_step": 161768, "epoch": 3851} {"train_loss": -6.910341262817383, "global_step": 161769, "epoch": 3851} {"train_loss": -6.86962890625, "global_step": 161770, "epoch": 3851} {"train_loss": -6.835882186889648, "global_step": 161771, "epoch": 3851} {"train_loss": -6.979546546936035, "global_step": 161772, "epoch": 3851} {"train_loss": -6.8566741943359375, "global_step": 161773, "epoch": 3851} {"train_loss": -6.911110877990723, "global_step": 161774, "epoch": 3851} {"train_loss": -6.855716705322266, "global_step": 161775, "epoch": 3851} {"train_loss": -6.998264312744141, "global_step": 161776, "epoch": 3851} {"train_loss": -6.84478759765625, "global_step": 161777, "epoch": 3851} {"train_loss": -6.925132751464844, "global_step": 161778, "epoch": 3851} {"train_loss": -6.9472761154174805, "global_step": 161779, "epoch": 3851} {"train_loss": -6.988029479980469, "global_step": 161780, "epoch": 3851} {"train_loss": -6.993795871734619, "global_step": 161781, "epoch": 3851} {"train_loss": -6.895015239715576, "global_step": 161782, "epoch": 3851} {"train_loss": -6.910013425917852, "global_step": 161783, "epoch": 3851, "val_loss": 79198.109375} {"train_loss": -7.015318870544434, "global_step": 161784, "epoch": 3852} {"train_loss": -6.957310676574707, "global_step": 161785, "epoch": 3852} {"train_loss": -6.928993225097656, "global_step": 161786, "epoch": 3852} {"train_loss": -6.921102046966553, "global_step": 161787, "epoch": 3852} {"train_loss": -6.891593933105469, "global_step": 161788, "epoch": 3852} {"train_loss": -6.943911552429199, "global_step": 161789, "epoch": 3852} {"train_loss": -6.864975452423096, "global_step": 161790, "epoch": 3852} {"train_loss": -6.956330299377441, "global_step": 161791, "epoch": 3852} {"train_loss": -6.888269901275635, "global_step": 161792, "epoch": 3852} {"train_loss": -6.834399700164795, "global_step": 161793, "epoch": 3852} {"train_loss": -6.949002265930176, "global_step": 161794, "epoch": 3852} {"train_loss": -6.883477210998535, "global_step": 161795, "epoch": 3852} {"train_loss": -7.086672782897949, "global_step": 161796, "epoch": 3852} {"train_loss": -6.88246488571167, "global_step": 161797, "epoch": 3852} {"train_loss": -6.975020885467529, "global_step": 161798, "epoch": 3852} {"train_loss": -6.896512508392334, "global_step": 161799, "epoch": 3852} {"train_loss": -7.00056266784668, "global_step": 161800, "epoch": 3852} {"train_loss": -7.047393798828125, "global_step": 161801, "epoch": 3852} {"train_loss": -7.020374298095703, "global_step": 161802, "epoch": 3852} {"train_loss": -6.96763277053833, "global_step": 161803, "epoch": 3852} {"train_loss": -6.909192085266113, "global_step": 161804, "epoch": 3852} {"train_loss": -6.952780723571777, "global_step": 161805, "epoch": 3852} {"train_loss": -6.924904823303223, "global_step": 161806, "epoch": 3852} {"train_loss": -6.947892189025879, "global_step": 161807, "epoch": 3852} {"train_loss": -6.994909286499023, "global_step": 161808, "epoch": 3852} {"train_loss": -7.019100666046143, "global_step": 161809, "epoch": 3852} {"train_loss": -7.009701728820801, "global_step": 161810, "epoch": 3852} {"train_loss": -7.021076202392578, "global_step": 161811, "epoch": 3852} {"train_loss": -7.051506519317627, "global_step": 161812, "epoch": 3852} {"train_loss": -6.944882392883301, "global_step": 161813, "epoch": 3852} {"train_loss": -6.892251014709473, "global_step": 161814, "epoch": 3852} {"train_loss": -6.887825012207031, "global_step": 161815, "epoch": 3852} {"train_loss": -7.005671501159668, "global_step": 161816, "epoch": 3852} {"train_loss": -7.043491840362549, "global_step": 161817, "epoch": 3852} {"train_loss": -6.975844860076904, "global_step": 161818, "epoch": 3852} {"train_loss": -7.031688213348389, "global_step": 161819, "epoch": 3852} {"train_loss": -6.938204765319824, "global_step": 161820, "epoch": 3852} {"train_loss": -6.942572116851807, "global_step": 161821, "epoch": 3852} {"train_loss": -6.841742515563965, "global_step": 161822, "epoch": 3852} {"train_loss": -6.958990097045898, "global_step": 161823, "epoch": 3852} {"train_loss": -7.012942314147949, "global_step": 161824, "epoch": 3852} {"train_loss": -6.954777320226033, "global_step": 161825, "epoch": 3852, "val_loss": 79379.8515625} {"train_loss": -6.915763854980469, "global_step": 161826, "epoch": 3853} {"train_loss": -6.977933883666992, "global_step": 161827, "epoch": 3853} {"train_loss": -6.972115516662598, "global_step": 161828, "epoch": 3853} {"train_loss": -6.946001052856445, "global_step": 161829, "epoch": 3853} {"train_loss": -6.997118949890137, "global_step": 161830, "epoch": 3853} {"train_loss": -6.9691267013549805, "global_step": 161831, "epoch": 3853} {"train_loss": -7.060279846191406, "global_step": 161832, "epoch": 3853} {"train_loss": -6.950865268707275, "global_step": 161833, "epoch": 3853} {"train_loss": -7.028249740600586, "global_step": 161834, "epoch": 3853} {"train_loss": -6.96780252456665, "global_step": 161835, "epoch": 3853} {"train_loss": -6.991335391998291, "global_step": 161836, "epoch": 3853} {"train_loss": -7.003953456878662, "global_step": 161837, "epoch": 3853} {"train_loss": -7.057477951049805, "global_step": 161838, "epoch": 3853} {"train_loss": -7.06004524230957, "global_step": 161839, "epoch": 3853} {"train_loss": -7.095920085906982, "global_step": 161840, "epoch": 3853} {"train_loss": -7.024312973022461, "global_step": 161841, "epoch": 3853} {"train_loss": -6.922610759735107, "global_step": 161842, "epoch": 3853} {"train_loss": -7.040475368499756, "global_step": 161843, "epoch": 3853} {"train_loss": -6.973729133605957, "global_step": 161844, "epoch": 3853} {"train_loss": -6.997098922729492, "global_step": 161845, "epoch": 3853} {"train_loss": -6.958391189575195, "global_step": 161846, "epoch": 3853} {"train_loss": -7.129584312438965, "global_step": 161847, "epoch": 3853} {"train_loss": -6.876106262207031, "global_step": 161848, "epoch": 3853} {"train_loss": -7.019347190856934, "global_step": 161849, "epoch": 3853} {"train_loss": -6.845312595367432, "global_step": 161850, "epoch": 3853} {"train_loss": -6.975818634033203, "global_step": 161851, "epoch": 3853} {"train_loss": -6.840264320373535, "global_step": 161852, "epoch": 3853} {"train_loss": -6.8108673095703125, "global_step": 161853, "epoch": 3853} {"train_loss": -6.972907066345215, "global_step": 161854, "epoch": 3853} {"train_loss": -7.025643348693848, "global_step": 161855, "epoch": 3853} {"train_loss": -6.974453926086426, "global_step": 161856, "epoch": 3853} {"train_loss": -6.859471321105957, "global_step": 161857, "epoch": 3853} {"train_loss": -6.864233016967773, "global_step": 161858, "epoch": 3853} {"train_loss": -6.945623397827148, "global_step": 161859, "epoch": 3853} {"train_loss": -6.88584041595459, "global_step": 161860, "epoch": 3853} {"train_loss": -6.912789344787598, "global_step": 161861, "epoch": 3853} {"train_loss": -6.880681037902832, "global_step": 161862, "epoch": 3853} {"train_loss": -6.820549964904785, "global_step": 161863, "epoch": 3853} {"train_loss": -6.900107383728027, "global_step": 161864, "epoch": 3853} {"train_loss": -6.888431072235107, "global_step": 161865, "epoch": 3853} {"train_loss": -6.8960394859313965, "global_step": 161866, "epoch": 3853} {"train_loss": -6.958449193409511, "global_step": 161867, "epoch": 3853, "val_loss": 79499.875} {"train_loss": -6.8357648849487305, "global_step": 161868, "epoch": 3854} {"train_loss": -6.872583389282227, "global_step": 161869, "epoch": 3854} {"train_loss": -6.88264274597168, "global_step": 161870, "epoch": 3854} {"train_loss": -6.9600324630737305, "global_step": 161871, "epoch": 3854} {"train_loss": -6.984698295593262, "global_step": 161872, "epoch": 3854} {"train_loss": -7.050320148468018, "global_step": 161873, "epoch": 3854} {"train_loss": -7.008993625640869, "global_step": 161874, "epoch": 3854} {"train_loss": -6.8498687744140625, "global_step": 161875, "epoch": 3854} {"train_loss": -7.00748348236084, "global_step": 161876, "epoch": 3854} {"train_loss": -6.991822719573975, "global_step": 161877, "epoch": 3854} {"train_loss": -6.970768928527832, "global_step": 161878, "epoch": 3854} {"train_loss": -6.996265888214111, "global_step": 161879, "epoch": 3854} {"train_loss": -6.974909782409668, "global_step": 161880, "epoch": 3854} {"train_loss": -6.922292232513428, "global_step": 161881, "epoch": 3854} {"train_loss": -6.947813034057617, "global_step": 161882, "epoch": 3854} {"train_loss": -6.950469017028809, "global_step": 161883, "epoch": 3854} {"train_loss": -7.003498554229736, "global_step": 161884, "epoch": 3854} {"train_loss": -6.978355407714844, "global_step": 161885, "epoch": 3854} {"train_loss": -6.961179256439209, "global_step": 161886, "epoch": 3854} {"train_loss": -7.005633354187012, "global_step": 161887, "epoch": 3854} {"train_loss": -6.993222236633301, "global_step": 161888, "epoch": 3854} {"train_loss": -6.948406219482422, "global_step": 161889, "epoch": 3854} {"train_loss": -6.840359687805176, "global_step": 161890, "epoch": 3854} {"train_loss": -7.013307571411133, "global_step": 161891, "epoch": 3854} {"train_loss": -7.022356033325195, "global_step": 161892, "epoch": 3854} {"train_loss": -7.001240253448486, "global_step": 161893, "epoch": 3854} {"train_loss": -6.900385856628418, "global_step": 161894, "epoch": 3854} {"train_loss": -6.96923828125, "global_step": 161895, "epoch": 3854} {"train_loss": -6.943119049072266, "global_step": 161896, "epoch": 3854} {"train_loss": -6.999676704406738, "global_step": 161897, "epoch": 3854} {"train_loss": -7.118719100952148, "global_step": 161898, "epoch": 3854} {"train_loss": -6.924295902252197, "global_step": 161899, "epoch": 3854} {"train_loss": -6.979926109313965, "global_step": 161900, "epoch": 3854} {"train_loss": -7.038848876953125, "global_step": 161901, "epoch": 3854} {"train_loss": -6.968057155609131, "global_step": 161902, "epoch": 3854} {"train_loss": -6.967578887939453, "global_step": 161903, "epoch": 3854} {"train_loss": -6.966157913208008, "global_step": 161904, "epoch": 3854} {"train_loss": -6.828529357910156, "global_step": 161905, "epoch": 3854} {"train_loss": -6.987464904785156, "global_step": 161906, "epoch": 3854} {"train_loss": -6.959309101104736, "global_step": 161907, "epoch": 3854} {"train_loss": -6.939613342285156, "global_step": 161908, "epoch": 3854} {"train_loss": -6.961686622528803, "global_step": 161909, "epoch": 3854, "val_loss": 79464.6875} {"train_loss": -6.920711517333984, "global_step": 161910, "epoch": 3855} {"train_loss": -6.862843036651611, "global_step": 161911, "epoch": 3855} {"train_loss": -6.9188642501831055, "global_step": 161912, "epoch": 3855} {"train_loss": -6.922225475311279, "global_step": 161913, "epoch": 3855} {"train_loss": -6.955428600311279, "global_step": 161914, "epoch": 3855} {"train_loss": -6.846549987792969, "global_step": 161915, "epoch": 3855} {"train_loss": -6.874624252319336, "global_step": 161916, "epoch": 3855} {"train_loss": -6.849401473999023, "global_step": 161917, "epoch": 3855} {"train_loss": -7.060370445251465, "global_step": 161918, "epoch": 3855} {"train_loss": -6.7449750900268555, "global_step": 161919, "epoch": 3855} {"train_loss": -6.974586486816406, "global_step": 161920, "epoch": 3855} {"train_loss": -6.961472511291504, "global_step": 161921, "epoch": 3855} {"train_loss": -6.877241611480713, "global_step": 161922, "epoch": 3855} {"train_loss": -6.796328067779541, "global_step": 161923, "epoch": 3855} {"train_loss": -6.808149814605713, "global_step": 161924, "epoch": 3855} {"train_loss": -6.927184104919434, "global_step": 161925, "epoch": 3855} {"train_loss": -6.864471912384033, "global_step": 161926, "epoch": 3855} {"train_loss": -6.941740989685059, "global_step": 161927, "epoch": 3855} {"train_loss": -6.950334548950195, "global_step": 161928, "epoch": 3855} {"train_loss": -6.809964179992676, "global_step": 161929, "epoch": 3855} {"train_loss": -6.8643341064453125, "global_step": 161930, "epoch": 3855} {"train_loss": -6.976398468017578, "global_step": 161931, "epoch": 3855} {"train_loss": -6.784071445465088, "global_step": 161932, "epoch": 3855} {"train_loss": -6.810690879821777, "global_step": 161933, "epoch": 3855} {"train_loss": -6.9139204025268555, "global_step": 161934, "epoch": 3855} {"train_loss": -6.903573036193848, "global_step": 161935, "epoch": 3855} {"train_loss": -6.890079498291016, "global_step": 161936, "epoch": 3855} {"train_loss": -6.889141082763672, "global_step": 161937, "epoch": 3855} {"train_loss": -6.981152534484863, "global_step": 161938, "epoch": 3855} {"train_loss": -6.893673419952393, "global_step": 161939, "epoch": 3855} {"train_loss": -6.9879302978515625, "global_step": 161940, "epoch": 3855} {"train_loss": -6.768303394317627, "global_step": 161941, "epoch": 3855} {"train_loss": -6.958301544189453, "global_step": 161942, "epoch": 3855} {"train_loss": -6.865447521209717, "global_step": 161943, "epoch": 3855} {"train_loss": -6.908530235290527, "global_step": 161944, "epoch": 3855} {"train_loss": -6.909492015838623, "global_step": 161945, "epoch": 3855} {"train_loss": -6.857461452484131, "global_step": 161946, "epoch": 3855} {"train_loss": -6.930356025695801, "global_step": 161947, "epoch": 3855} {"train_loss": -6.730853080749512, "global_step": 161948, "epoch": 3855} {"train_loss": -6.906338691711426, "global_step": 161949, "epoch": 3855} {"train_loss": -6.927258014678955, "global_step": 161950, "epoch": 3855} {"train_loss": -6.8927999791644865, "global_step": 161951, "epoch": 3855, "val_loss": 79912.6796875} {"train_loss": -6.867326736450195, "global_step": 161952, "epoch": 3856} {"train_loss": -6.888856887817383, "global_step": 161953, "epoch": 3856} {"train_loss": -6.843182563781738, "global_step": 161954, "epoch": 3856} {"train_loss": -6.908531665802002, "global_step": 161955, "epoch": 3856} {"train_loss": -6.9401140213012695, "global_step": 161956, "epoch": 3856} {"train_loss": -6.915472030639648, "global_step": 161957, "epoch": 3856} {"train_loss": -6.961102485656738, "global_step": 161958, "epoch": 3856} {"train_loss": -6.919922828674316, "global_step": 161959, "epoch": 3856} {"train_loss": -6.925431251525879, "global_step": 161960, "epoch": 3856} {"train_loss": -6.857163429260254, "global_step": 161961, "epoch": 3856} {"train_loss": -6.896317481994629, "global_step": 161962, "epoch": 3856} {"train_loss": -6.889129161834717, "global_step": 161963, "epoch": 3856} {"train_loss": -6.870109558105469, "global_step": 161964, "epoch": 3856} {"train_loss": -6.98330545425415, "global_step": 161965, "epoch": 3856} {"train_loss": -6.806844711303711, "global_step": 161966, "epoch": 3856} {"train_loss": -6.9043498039245605, "global_step": 161967, "epoch": 3856} {"train_loss": -6.895294666290283, "global_step": 161968, "epoch": 3856} {"train_loss": -6.833038330078125, "global_step": 161969, "epoch": 3856} {"train_loss": -7.0099945068359375, "global_step": 161970, "epoch": 3856} {"train_loss": -6.9871721267700195, "global_step": 161971, "epoch": 3856} {"train_loss": -6.972151279449463, "global_step": 161972, "epoch": 3856} {"train_loss": -7.05198860168457, "global_step": 161973, "epoch": 3856} {"train_loss": -6.787071228027344, "global_step": 161974, "epoch": 3856} {"train_loss": -7.041333198547363, "global_step": 161975, "epoch": 3856} {"train_loss": -6.92788028717041, "global_step": 161976, "epoch": 3856} {"train_loss": -6.828825950622559, "global_step": 161977, "epoch": 3856} {"train_loss": -7.024751663208008, "global_step": 161978, "epoch": 3856} {"train_loss": -6.871119022369385, "global_step": 161979, "epoch": 3856} {"train_loss": -7.042136192321777, "global_step": 161980, "epoch": 3856} {"train_loss": -6.946991920471191, "global_step": 161981, "epoch": 3856} {"train_loss": -6.843212127685547, "global_step": 161982, "epoch": 3856} {"train_loss": -7.025291442871094, "global_step": 161983, "epoch": 3856} {"train_loss": -6.895049571990967, "global_step": 161984, "epoch": 3856} {"train_loss": -6.970912933349609, "global_step": 161985, "epoch": 3856} {"train_loss": -6.947540760040283, "global_step": 161986, "epoch": 3856} {"train_loss": -6.933722496032715, "global_step": 161987, "epoch": 3856} {"train_loss": -7.059382438659668, "global_step": 161988, "epoch": 3856} {"train_loss": -7.09359884262085, "global_step": 161989, "epoch": 3856} {"train_loss": -7.020542144775391, "global_step": 161990, "epoch": 3856} {"train_loss": -7.032590389251709, "global_step": 161991, "epoch": 3856} {"train_loss": -7.061167240142822, "global_step": 161992, "epoch": 3856} {"train_loss": -6.938076098759969, "global_step": 161993, "epoch": 3856, "val_loss": 79404.953125} {"train_loss": -6.947340488433838, "global_step": 161994, "epoch": 3857} {"train_loss": -7.0334367752075195, "global_step": 161995, "epoch": 3857} {"train_loss": -7.095083236694336, "global_step": 161996, "epoch": 3857} {"train_loss": -6.93389892578125, "global_step": 161997, "epoch": 3857} {"train_loss": -7.071046829223633, "global_step": 161998, "epoch": 3857} {"train_loss": -6.968992233276367, "global_step": 161999, "epoch": 3857} {"train_loss": -7.012167930603027, "global_step": 162000, "epoch": 3857} {"train_loss": -7.009345531463623, "global_step": 162001, "epoch": 3857} {"train_loss": -6.994824409484863, "global_step": 162002, "epoch": 3857} {"train_loss": -6.974095344543457, "global_step": 162003, "epoch": 3857} {"train_loss": -6.988977909088135, "global_step": 162004, "epoch": 3857} {"train_loss": -6.9138641357421875, "global_step": 162005, "epoch": 3857} {"train_loss": -7.0809526443481445, "global_step": 162006, "epoch": 3857} {"train_loss": -7.031911849975586, "global_step": 162007, "epoch": 3857} {"train_loss": -6.885725021362305, "global_step": 162008, "epoch": 3857} {"train_loss": -6.944611549377441, "global_step": 162009, "epoch": 3857} {"train_loss": -7.008004665374756, "global_step": 162010, "epoch": 3857} {"train_loss": -6.839455604553223, "global_step": 162011, "epoch": 3857} {"train_loss": -6.913281440734863, "global_step": 162012, "epoch": 3857} {"train_loss": -6.938556671142578, "global_step": 162013, "epoch": 3857} {"train_loss": -6.698539733886719, "global_step": 162014, "epoch": 3857} {"train_loss": -7.076452255249023, "global_step": 162015, "epoch": 3857} {"train_loss": -7.031547546386719, "global_step": 162016, "epoch": 3857} {"train_loss": -6.906963348388672, "global_step": 162017, "epoch": 3857} {"train_loss": -6.915800094604492, "global_step": 162018, "epoch": 3857} {"train_loss": -6.779698371887207, "global_step": 162019, "epoch": 3857} {"train_loss": -6.821888446807861, "global_step": 162020, "epoch": 3857} {"train_loss": -6.801766395568848, "global_step": 162021, "epoch": 3857} {"train_loss": -6.909623146057129, "global_step": 162022, "epoch": 3857} {"train_loss": -6.996074199676514, "global_step": 162023, "epoch": 3857} {"train_loss": -6.915987968444824, "global_step": 162024, "epoch": 3857} {"train_loss": -6.946638107299805, "global_step": 162025, "epoch": 3857} {"train_loss": -6.90273904800415, "global_step": 162026, "epoch": 3857} {"train_loss": -6.888213157653809, "global_step": 162027, "epoch": 3857} {"train_loss": -7.008125305175781, "global_step": 162028, "epoch": 3857} {"train_loss": -6.838010787963867, "global_step": 162029, "epoch": 3857} {"train_loss": -6.9078803062438965, "global_step": 162030, "epoch": 3857} {"train_loss": -6.847109317779541, "global_step": 162031, "epoch": 3857} {"train_loss": -6.977662086486816, "global_step": 162032, "epoch": 3857} {"train_loss": -7.158528804779053, "global_step": 162033, "epoch": 3857} {"train_loss": -6.918950080871582, "global_step": 162034, "epoch": 3857} {"train_loss": -6.9465963159288675, "global_step": 162035, "epoch": 3857, "val_loss": 79688.875} {"train_loss": -7.024208068847656, "global_step": 162036, "epoch": 3858} {"train_loss": -6.934309005737305, "global_step": 162037, "epoch": 3858} {"train_loss": -6.864546775817871, "global_step": 162038, "epoch": 3858} {"train_loss": -6.9438629150390625, "global_step": 162039, "epoch": 3858} {"train_loss": -6.976070404052734, "global_step": 162040, "epoch": 3858} {"train_loss": -6.863284111022949, "global_step": 162041, "epoch": 3858} {"train_loss": -6.863640785217285, "global_step": 162042, "epoch": 3858} {"train_loss": -6.895932197570801, "global_step": 162043, "epoch": 3858} {"train_loss": -6.8253326416015625, "global_step": 162044, "epoch": 3858} {"train_loss": -6.771329879760742, "global_step": 162045, "epoch": 3858} {"train_loss": -7.011446952819824, "global_step": 162046, "epoch": 3858} {"train_loss": -6.659139633178711, "global_step": 162047, "epoch": 3858} {"train_loss": -6.981741428375244, "global_step": 162048, "epoch": 3858} {"train_loss": -6.828415870666504, "global_step": 162049, "epoch": 3858} {"train_loss": -6.953379154205322, "global_step": 162050, "epoch": 3858} {"train_loss": -6.847958087921143, "global_step": 162051, "epoch": 3858} {"train_loss": -6.8741655349731445, "global_step": 162052, "epoch": 3858} {"train_loss": -7.085688591003418, "global_step": 162053, "epoch": 3858} {"train_loss": -6.869467735290527, "global_step": 162054, "epoch": 3858} {"train_loss": -6.960922718048096, "global_step": 162055, "epoch": 3858} {"train_loss": -6.936304092407227, "global_step": 162056, "epoch": 3858} {"train_loss": -6.934554100036621, "global_step": 162057, "epoch": 3858} {"train_loss": -6.904577255249023, "global_step": 162058, "epoch": 3858} {"train_loss": -6.9151201248168945, "global_step": 162059, "epoch": 3858} {"train_loss": -6.923532485961914, "global_step": 162060, "epoch": 3858} {"train_loss": -6.939201354980469, "global_step": 162061, "epoch": 3858} {"train_loss": -7.060695171356201, "global_step": 162062, "epoch": 3858} {"train_loss": -7.040803909301758, "global_step": 162063, "epoch": 3858} {"train_loss": -7.016901969909668, "global_step": 162064, "epoch": 3858} {"train_loss": -6.999451637268066, "global_step": 162065, "epoch": 3858} {"train_loss": -7.088887691497803, "global_step": 162066, "epoch": 3858} {"train_loss": -7.043088912963867, "global_step": 162067, "epoch": 3858} {"train_loss": -7.010568618774414, "global_step": 162068, "epoch": 3858} {"train_loss": -7.034212589263916, "global_step": 162069, "epoch": 3858} {"train_loss": -7.007025241851807, "global_step": 162070, "epoch": 3858} {"train_loss": -7.02301025390625, "global_step": 162071, "epoch": 3858} {"train_loss": -7.028949737548828, "global_step": 162072, "epoch": 3858} {"train_loss": -7.037132263183594, "global_step": 162073, "epoch": 3858} {"train_loss": -6.950476169586182, "global_step": 162074, "epoch": 3858} {"train_loss": -7.093874931335449, "global_step": 162075, "epoch": 3858} {"train_loss": -7.024101257324219, "global_step": 162076, "epoch": 3858} {"train_loss": -6.951567275183542, "global_step": 162077, "epoch": 3858, "val_loss": 79500.7421875} {"train_loss": -7.081371307373047, "global_step": 162078, "epoch": 3859} {"train_loss": -7.045871734619141, "global_step": 162079, "epoch": 3859} {"train_loss": -7.145898818969727, "global_step": 162080, "epoch": 3859} {"train_loss": -6.969494342803955, "global_step": 162081, "epoch": 3859} {"train_loss": -7.040287017822266, "global_step": 162082, "epoch": 3859} {"train_loss": -7.04306697845459, "global_step": 162083, "epoch": 3859} {"train_loss": -7.050806045532227, "global_step": 162084, "epoch": 3859} {"train_loss": -7.090442657470703, "global_step": 162085, "epoch": 3859} {"train_loss": -7.107253074645996, "global_step": 162086, "epoch": 3859} {"train_loss": -7.01217794418335, "global_step": 162087, "epoch": 3859} {"train_loss": -7.022028923034668, "global_step": 162088, "epoch": 3859} {"train_loss": -7.112578392028809, "global_step": 162089, "epoch": 3859} {"train_loss": -7.016688346862793, "global_step": 162090, "epoch": 3859} {"train_loss": -7.077784538269043, "global_step": 162091, "epoch": 3859} {"train_loss": -7.075399398803711, "global_step": 162092, "epoch": 3859} {"train_loss": -7.087508678436279, "global_step": 162093, "epoch": 3859} {"train_loss": -7.026649475097656, "global_step": 162094, "epoch": 3859} {"train_loss": -7.004790782928467, "global_step": 162095, "epoch": 3859} {"train_loss": -7.022042274475098, "global_step": 162096, "epoch": 3859} {"train_loss": -7.0547943115234375, "global_step": 162097, "epoch": 3859} {"train_loss": -6.879120826721191, "global_step": 162098, "epoch": 3859} {"train_loss": -7.035661697387695, "global_step": 162099, "epoch": 3859} {"train_loss": -6.952001571655273, "global_step": 162100, "epoch": 3859} {"train_loss": -6.847060680389404, "global_step": 162101, "epoch": 3859} {"train_loss": -7.0430121421813965, "global_step": 162102, "epoch": 3859} {"train_loss": -6.9736433029174805, "global_step": 162103, "epoch": 3859} {"train_loss": -6.992920875549316, "global_step": 162104, "epoch": 3859} {"train_loss": -7.050609111785889, "global_step": 162105, "epoch": 3859} {"train_loss": -6.969254970550537, "global_step": 162106, "epoch": 3859} {"train_loss": -6.889240741729736, "global_step": 162107, "epoch": 3859} {"train_loss": -6.972296714782715, "global_step": 162108, "epoch": 3859} {"train_loss": -6.910374641418457, "global_step": 162109, "epoch": 3859} {"train_loss": -6.959048271179199, "global_step": 162110, "epoch": 3859} {"train_loss": -6.927935600280762, "global_step": 162111, "epoch": 3859} {"train_loss": -6.931382656097412, "global_step": 162112, "epoch": 3859} {"train_loss": -6.971733093261719, "global_step": 162113, "epoch": 3859} {"train_loss": -6.967349529266357, "global_step": 162114, "epoch": 3859} {"train_loss": -6.995566368103027, "global_step": 162115, "epoch": 3859} {"train_loss": -6.942625522613525, "global_step": 162116, "epoch": 3859} {"train_loss": -7.07352352142334, "global_step": 162117, "epoch": 3859} {"train_loss": -7.038077354431152, "global_step": 162118, "epoch": 3859} {"train_loss": -7.008616163617089, "global_step": 162119, "epoch": 3859, "val_loss": 79138.4921875} {"train_loss": -7.04055118560791, "global_step": 162120, "epoch": 3860} {"train_loss": -6.965826511383057, "global_step": 162121, "epoch": 3860} {"train_loss": -7.0173234939575195, "global_step": 162122, "epoch": 3860} {"train_loss": -7.035297393798828, "global_step": 162123, "epoch": 3860} {"train_loss": -6.871974468231201, "global_step": 162124, "epoch": 3860} {"train_loss": -6.948511123657227, "global_step": 162125, "epoch": 3860} {"train_loss": -6.949390411376953, "global_step": 162126, "epoch": 3860} {"train_loss": -6.919873237609863, "global_step": 162127, "epoch": 3860} {"train_loss": -6.916949272155762, "global_step": 162128, "epoch": 3860} {"train_loss": -6.835063934326172, "global_step": 162129, "epoch": 3860} {"train_loss": -6.959784507751465, "global_step": 162130, "epoch": 3860} {"train_loss": -7.098374366760254, "global_step": 162131, "epoch": 3860} {"train_loss": -6.92852783203125, "global_step": 162132, "epoch": 3860} {"train_loss": -6.888370990753174, "global_step": 162133, "epoch": 3860} {"train_loss": -7.069884777069092, "global_step": 162134, "epoch": 3860} {"train_loss": -7.033652305603027, "global_step": 162135, "epoch": 3860} {"train_loss": -7.0030436515808105, "global_step": 162136, "epoch": 3860} {"train_loss": -6.9552001953125, "global_step": 162137, "epoch": 3860} {"train_loss": -6.938735008239746, "global_step": 162138, "epoch": 3860} {"train_loss": -6.846248626708984, "global_step": 162139, "epoch": 3860} {"train_loss": -6.844902515411377, "global_step": 162140, "epoch": 3860} {"train_loss": -6.872321128845215, "global_step": 162141, "epoch": 3860} {"train_loss": -7.0038862228393555, "global_step": 162142, "epoch": 3860} {"train_loss": -6.955295562744141, "global_step": 162143, "epoch": 3860} {"train_loss": -6.874730110168457, "global_step": 162144, "epoch": 3860} {"train_loss": -6.98194694519043, "global_step": 162145, "epoch": 3860} {"train_loss": -6.926613807678223, "global_step": 162146, "epoch": 3860} {"train_loss": -7.058529853820801, "global_step": 162147, "epoch": 3860} {"train_loss": -6.956501007080078, "global_step": 162148, "epoch": 3860} {"train_loss": -6.971889495849609, "global_step": 162149, "epoch": 3860} {"train_loss": -7.090935707092285, "global_step": 162150, "epoch": 3860} {"train_loss": -6.856825351715088, "global_step": 162151, "epoch": 3860} {"train_loss": -6.972580432891846, "global_step": 162152, "epoch": 3860} {"train_loss": -6.872885227203369, "global_step": 162153, "epoch": 3860} {"train_loss": -6.8835015296936035, "global_step": 162154, "epoch": 3860} {"train_loss": -6.918949127197266, "global_step": 162155, "epoch": 3860} {"train_loss": -6.9331769943237305, "global_step": 162156, "epoch": 3860} {"train_loss": -6.938735008239746, "global_step": 162157, "epoch": 3860} {"train_loss": -6.979648590087891, "global_step": 162158, "epoch": 3860} {"train_loss": -6.844905853271484, "global_step": 162159, "epoch": 3860} {"train_loss": -6.9257659912109375, "global_step": 162160, "epoch": 3860} {"train_loss": -6.946809904915946, "global_step": 162161, "epoch": 3860, "val_loss": 79162.8359375} {"train_loss": -6.958357334136963, "global_step": 162162, "epoch": 3861} {"train_loss": -6.9054999351501465, "global_step": 162163, "epoch": 3861} {"train_loss": -6.967906475067139, "global_step": 162164, "epoch": 3861} {"train_loss": -6.974338531494141, "global_step": 162165, "epoch": 3861} {"train_loss": -6.9426069259643555, "global_step": 162166, "epoch": 3861} {"train_loss": -7.0414838790893555, "global_step": 162167, "epoch": 3861} {"train_loss": -6.869664669036865, "global_step": 162168, "epoch": 3861} {"train_loss": -6.96214485168457, "global_step": 162169, "epoch": 3861} {"train_loss": -7.005209922790527, "global_step": 162170, "epoch": 3861} {"train_loss": -6.973997592926025, "global_step": 162171, "epoch": 3861} {"train_loss": -6.867588520050049, "global_step": 162172, "epoch": 3861} {"train_loss": -6.956216812133789, "global_step": 162173, "epoch": 3861} {"train_loss": -6.975018501281738, "global_step": 162174, "epoch": 3861} {"train_loss": -7.032605171203613, "global_step": 162175, "epoch": 3861} {"train_loss": -6.989715576171875, "global_step": 162176, "epoch": 3861} {"train_loss": -7.045564651489258, "global_step": 162177, "epoch": 3861} {"train_loss": -6.919612884521484, "global_step": 162178, "epoch": 3861} {"train_loss": -6.9589033126831055, "global_step": 162179, "epoch": 3861} {"train_loss": -6.995923042297363, "global_step": 162180, "epoch": 3861} {"train_loss": -6.91319465637207, "global_step": 162181, "epoch": 3861} {"train_loss": -6.960910797119141, "global_step": 162182, "epoch": 3861} {"train_loss": -6.989788055419922, "global_step": 162183, "epoch": 3861} {"train_loss": -6.919605731964111, "global_step": 162184, "epoch": 3861} {"train_loss": -6.903351783752441, "global_step": 162185, "epoch": 3861} {"train_loss": -6.9149909019470215, "global_step": 162186, "epoch": 3861} {"train_loss": -6.947287559509277, "global_step": 162187, "epoch": 3861} {"train_loss": -6.899781227111816, "global_step": 162188, "epoch": 3861} {"train_loss": -6.963102340698242, "global_step": 162189, "epoch": 3861} {"train_loss": -7.005536079406738, "global_step": 162190, "epoch": 3861} {"train_loss": -6.967104911804199, "global_step": 162191, "epoch": 3861} {"train_loss": -6.9644880294799805, "global_step": 162192, "epoch": 3861} {"train_loss": -6.859264850616455, "global_step": 162193, "epoch": 3861} {"train_loss": -6.913002014160156, "global_step": 162194, "epoch": 3861} {"train_loss": -6.949177265167236, "global_step": 162195, "epoch": 3861} {"train_loss": -7.026683807373047, "global_step": 162196, "epoch": 3861} {"train_loss": -6.874602317810059, "global_step": 162197, "epoch": 3861} {"train_loss": -6.9242167472839355, "global_step": 162198, "epoch": 3861} {"train_loss": -7.050353050231934, "global_step": 162199, "epoch": 3861} {"train_loss": -6.843538761138916, "global_step": 162200, "epoch": 3861} {"train_loss": -6.994982719421387, "global_step": 162201, "epoch": 3861} {"train_loss": -6.981660842895508, "global_step": 162202, "epoch": 3861} {"train_loss": -6.9554929960341685, "global_step": 162203, "epoch": 3861, "val_loss": 79444.90625} {"train_loss": -6.977396488189697, "global_step": 162204, "epoch": 3862} {"train_loss": -7.035977840423584, "global_step": 162205, "epoch": 3862} {"train_loss": -7.056600570678711, "global_step": 162206, "epoch": 3862} {"train_loss": -7.021852016448975, "global_step": 162207, "epoch": 3862} {"train_loss": -7.051759719848633, "global_step": 162208, "epoch": 3862} {"train_loss": -7.007124900817871, "global_step": 162209, "epoch": 3862} {"train_loss": -7.040951728820801, "global_step": 162210, "epoch": 3862} {"train_loss": -7.096273422241211, "global_step": 162211, "epoch": 3862} {"train_loss": -6.95828914642334, "global_step": 162212, "epoch": 3862} {"train_loss": -6.897783279418945, "global_step": 162213, "epoch": 3862} {"train_loss": -7.002917289733887, "global_step": 162214, "epoch": 3862} {"train_loss": -7.041036128997803, "global_step": 162215, "epoch": 3862} {"train_loss": -6.966609954833984, "global_step": 162216, "epoch": 3862} {"train_loss": -7.032533645629883, "global_step": 162217, "epoch": 3862} {"train_loss": -6.990009307861328, "global_step": 162218, "epoch": 3862} {"train_loss": -7.0936079025268555, "global_step": 162219, "epoch": 3862} {"train_loss": -7.120750904083252, "global_step": 162220, "epoch": 3862} {"train_loss": -7.014740467071533, "global_step": 162221, "epoch": 3862} {"train_loss": -7.106381416320801, "global_step": 162222, "epoch": 3862} {"train_loss": -6.896615982055664, "global_step": 162223, "epoch": 3862} {"train_loss": -6.9582977294921875, "global_step": 162224, "epoch": 3862} {"train_loss": -7.024590492248535, "global_step": 162225, "epoch": 3862} {"train_loss": -6.924891948699951, "global_step": 162226, "epoch": 3862} {"train_loss": -6.946463584899902, "global_step": 162227, "epoch": 3862} {"train_loss": -6.980462551116943, "global_step": 162228, "epoch": 3862} {"train_loss": -7.085803508758545, "global_step": 162229, "epoch": 3862} {"train_loss": -7.0850725173950195, "global_step": 162230, "epoch": 3862} {"train_loss": -7.017159461975098, "global_step": 162231, "epoch": 3862} {"train_loss": -7.049439430236816, "global_step": 162232, "epoch": 3862} {"train_loss": -6.9661993980407715, "global_step": 162233, "epoch": 3862} {"train_loss": -7.129411220550537, "global_step": 162234, "epoch": 3862} {"train_loss": -7.016329765319824, "global_step": 162235, "epoch": 3862} {"train_loss": -7.07644510269165, "global_step": 162236, "epoch": 3862} {"train_loss": -7.030320167541504, "global_step": 162237, "epoch": 3862} {"train_loss": -7.066479682922363, "global_step": 162238, "epoch": 3862} {"train_loss": -7.005261421203613, "global_step": 162239, "epoch": 3862} {"train_loss": -7.128212928771973, "global_step": 162240, "epoch": 3862} {"train_loss": -6.978140354156494, "global_step": 162241, "epoch": 3862} {"train_loss": -7.052700519561768, "global_step": 162242, "epoch": 3862} {"train_loss": -6.994255542755127, "global_step": 162243, "epoch": 3862} {"train_loss": -6.996791839599609, "global_step": 162244, "epoch": 3862} {"train_loss": -7.021238190787179, "global_step": 162245, "epoch": 3862, "val_loss": 79352.4609375} {"train_loss": -7.087672710418701, "global_step": 162246, "epoch": 3863} {"train_loss": -6.993480205535889, "global_step": 162247, "epoch": 3863} {"train_loss": -6.943767547607422, "global_step": 162248, "epoch": 3863} {"train_loss": -6.93815803527832, "global_step": 162249, "epoch": 3863} {"train_loss": -6.969351768493652, "global_step": 162250, "epoch": 3863} {"train_loss": -6.977886199951172, "global_step": 162251, "epoch": 3863} {"train_loss": -6.890896797180176, "global_step": 162252, "epoch": 3863} {"train_loss": -7.002993583679199, "global_step": 162253, "epoch": 3863} {"train_loss": -6.999987602233887, "global_step": 162254, "epoch": 3863} {"train_loss": -7.00551176071167, "global_step": 162255, "epoch": 3863} {"train_loss": -7.107853889465332, "global_step": 162256, "epoch": 3863} {"train_loss": -6.960023880004883, "global_step": 162257, "epoch": 3863} {"train_loss": -7.022294998168945, "global_step": 162258, "epoch": 3863} {"train_loss": -6.973577499389648, "global_step": 162259, "epoch": 3863} {"train_loss": -6.998551368713379, "global_step": 162260, "epoch": 3863} {"train_loss": -6.9340314865112305, "global_step": 162261, "epoch": 3863} {"train_loss": -6.837610721588135, "global_step": 162262, "epoch": 3863} {"train_loss": -6.901256561279297, "global_step": 162263, "epoch": 3863} {"train_loss": -7.015420913696289, "global_step": 162264, "epoch": 3863} {"train_loss": -7.0784807205200195, "global_step": 162265, "epoch": 3863} {"train_loss": -6.962092399597168, "global_step": 162266, "epoch": 3863} {"train_loss": -6.98834228515625, "global_step": 162267, "epoch": 3863} {"train_loss": -6.98576545715332, "global_step": 162268, "epoch": 3863} {"train_loss": -7.043194770812988, "global_step": 162269, "epoch": 3863} {"train_loss": -7.049920082092285, "global_step": 162270, "epoch": 3863} {"train_loss": -6.918335437774658, "global_step": 162271, "epoch": 3863} {"train_loss": -6.972012519836426, "global_step": 162272, "epoch": 3863} {"train_loss": -6.894350051879883, "global_step": 162273, "epoch": 3863} {"train_loss": -7.026973724365234, "global_step": 162274, "epoch": 3863} {"train_loss": -7.039716720581055, "global_step": 162275, "epoch": 3863} {"train_loss": -7.008440017700195, "global_step": 162276, "epoch": 3863} {"train_loss": -7.054035186767578, "global_step": 162277, "epoch": 3863} {"train_loss": -6.951198577880859, "global_step": 162278, "epoch": 3863} {"train_loss": -6.884471416473389, "global_step": 162279, "epoch": 3863} {"train_loss": -6.9580183029174805, "global_step": 162280, "epoch": 3863} {"train_loss": -6.944799423217773, "global_step": 162281, "epoch": 3863} {"train_loss": -6.916953086853027, "global_step": 162282, "epoch": 3863} {"train_loss": -6.990765571594238, "global_step": 162283, "epoch": 3863} {"train_loss": -6.9952850341796875, "global_step": 162284, "epoch": 3863} {"train_loss": -7.064700126647949, "global_step": 162285, "epoch": 3863} {"train_loss": -7.045363426208496, "global_step": 162286, "epoch": 3863} {"train_loss": -6.986287434895833, "global_step": 162287, "epoch": 3863, "val_loss": 79620.9140625} {"train_loss": -7.029390811920166, "global_step": 162288, "epoch": 3864} {"train_loss": -6.952278137207031, "global_step": 162289, "epoch": 3864} {"train_loss": -7.000465393066406, "global_step": 162290, "epoch": 3864} {"train_loss": -6.98109245300293, "global_step": 162291, "epoch": 3864} {"train_loss": -7.165648937225342, "global_step": 162292, "epoch": 3864} {"train_loss": -7.0360870361328125, "global_step": 162293, "epoch": 3864} {"train_loss": -6.993203163146973, "global_step": 162294, "epoch": 3864} {"train_loss": -7.061262607574463, "global_step": 162295, "epoch": 3864} {"train_loss": -7.090865135192871, "global_step": 162296, "epoch": 3864} {"train_loss": -7.031838893890381, "global_step": 162297, "epoch": 3864} {"train_loss": -7.041607856750488, "global_step": 162298, "epoch": 3864} {"train_loss": -7.062556266784668, "global_step": 162299, "epoch": 3864} {"train_loss": -6.987161159515381, "global_step": 162300, "epoch": 3864} {"train_loss": -6.963540077209473, "global_step": 162301, "epoch": 3864} {"train_loss": -7.037130355834961, "global_step": 162302, "epoch": 3864} {"train_loss": -7.078552722930908, "global_step": 162303, "epoch": 3864} {"train_loss": -6.82791805267334, "global_step": 162304, "epoch": 3864} {"train_loss": -6.925721645355225, "global_step": 162305, "epoch": 3864} {"train_loss": -6.933347225189209, "global_step": 162306, "epoch": 3864} {"train_loss": -6.995982646942139, "global_step": 162307, "epoch": 3864} {"train_loss": -6.926163673400879, "global_step": 162308, "epoch": 3864} {"train_loss": -6.891721725463867, "global_step": 162309, "epoch": 3864} {"train_loss": -7.029237747192383, "global_step": 162310, "epoch": 3864} {"train_loss": -7.009674549102783, "global_step": 162311, "epoch": 3864} {"train_loss": -6.980676651000977, "global_step": 162312, "epoch": 3864} {"train_loss": -6.969032287597656, "global_step": 162313, "epoch": 3864} {"train_loss": -6.923639297485352, "global_step": 162314, "epoch": 3864} {"train_loss": -6.990123271942139, "global_step": 162315, "epoch": 3864} {"train_loss": -6.886472702026367, "global_step": 162316, "epoch": 3864} {"train_loss": -6.923151969909668, "global_step": 162317, "epoch": 3864} {"train_loss": -6.95930814743042, "global_step": 162318, "epoch": 3864} {"train_loss": -7.015617847442627, "global_step": 162319, "epoch": 3864} {"train_loss": -6.798877716064453, "global_step": 162320, "epoch": 3864} {"train_loss": -6.962645053863525, "global_step": 162321, "epoch": 3864} {"train_loss": -6.94120979309082, "global_step": 162322, "epoch": 3864} {"train_loss": -6.942541599273682, "global_step": 162323, "epoch": 3864} {"train_loss": -6.885555744171143, "global_step": 162324, "epoch": 3864} {"train_loss": -6.911396026611328, "global_step": 162325, "epoch": 3864} {"train_loss": -6.94918966293335, "global_step": 162326, "epoch": 3864} {"train_loss": -6.806116104125977, "global_step": 162327, "epoch": 3864} {"train_loss": -7.047430038452148, "global_step": 162328, "epoch": 3864} {"train_loss": -6.9723695913950605, "global_step": 162329, "epoch": 3864, "val_loss": 79443.03125} {"train_loss": -6.926700592041016, "global_step": 162330, "epoch": 3865} {"train_loss": -6.921030044555664, "global_step": 162331, "epoch": 3865} {"train_loss": -7.040761947631836, "global_step": 162332, "epoch": 3865} {"train_loss": -7.01253604888916, "global_step": 162333, "epoch": 3865} {"train_loss": -6.929342269897461, "global_step": 162334, "epoch": 3865} {"train_loss": -7.050495624542236, "global_step": 162335, "epoch": 3865} {"train_loss": -6.936803340911865, "global_step": 162336, "epoch": 3865} {"train_loss": -7.067523002624512, "global_step": 162337, "epoch": 3865} {"train_loss": -6.949213981628418, "global_step": 162338, "epoch": 3865} {"train_loss": -7.0539350509643555, "global_step": 162339, "epoch": 3865} {"train_loss": -6.957187175750732, "global_step": 162340, "epoch": 3865} {"train_loss": -7.005756855010986, "global_step": 162341, "epoch": 3865} {"train_loss": -6.945302963256836, "global_step": 162342, "epoch": 3865} {"train_loss": -6.996363639831543, "global_step": 162343, "epoch": 3865} {"train_loss": -6.945186138153076, "global_step": 162344, "epoch": 3865} {"train_loss": -6.921700477600098, "global_step": 162345, "epoch": 3865} {"train_loss": -6.943175315856934, "global_step": 162346, "epoch": 3865} {"train_loss": -6.955075740814209, "global_step": 162347, "epoch": 3865} {"train_loss": -7.078235149383545, "global_step": 162348, "epoch": 3865} {"train_loss": -6.9703145027160645, "global_step": 162349, "epoch": 3865} {"train_loss": -7.053227424621582, "global_step": 162350, "epoch": 3865} {"train_loss": -6.909330368041992, "global_step": 162351, "epoch": 3865} {"train_loss": -6.980813026428223, "global_step": 162352, "epoch": 3865} {"train_loss": -6.868634223937988, "global_step": 162353, "epoch": 3865} {"train_loss": -6.955299377441406, "global_step": 162354, "epoch": 3865} {"train_loss": -6.959781169891357, "global_step": 162355, "epoch": 3865} {"train_loss": -7.0353007316589355, "global_step": 162356, "epoch": 3865} {"train_loss": -6.950490951538086, "global_step": 162357, "epoch": 3865} {"train_loss": -6.987042427062988, "global_step": 162358, "epoch": 3865} {"train_loss": -6.949793338775635, "global_step": 162359, "epoch": 3865} {"train_loss": -6.798176288604736, "global_step": 162360, "epoch": 3865} {"train_loss": -6.783111095428467, "global_step": 162361, "epoch": 3865} {"train_loss": -6.8657450675964355, "global_step": 162362, "epoch": 3865} {"train_loss": -6.845297813415527, "global_step": 162363, "epoch": 3865} {"train_loss": -6.895730018615723, "global_step": 162364, "epoch": 3865} {"train_loss": -6.810587406158447, "global_step": 162365, "epoch": 3865} {"train_loss": -6.9094462394714355, "global_step": 162366, "epoch": 3865} {"train_loss": -6.828545570373535, "global_step": 162367, "epoch": 3865} {"train_loss": -6.841036796569824, "global_step": 162368, "epoch": 3865} {"train_loss": -6.901379585266113, "global_step": 162369, "epoch": 3865} {"train_loss": -6.878371238708496, "global_step": 162370, "epoch": 3865} {"train_loss": -6.941957371575492, "global_step": 162371, "epoch": 3865, "val_loss": 79715.78125} {"train_loss": -6.954791069030762, "global_step": 162372, "epoch": 3866} {"train_loss": -6.96999979019165, "global_step": 162373, "epoch": 3866} {"train_loss": -6.8790178298950195, "global_step": 162374, "epoch": 3866} {"train_loss": -6.914029121398926, "global_step": 162375, "epoch": 3866} {"train_loss": -7.057339191436768, "global_step": 162376, "epoch": 3866} {"train_loss": -6.92063045501709, "global_step": 162377, "epoch": 3866} {"train_loss": -6.922307014465332, "global_step": 162378, "epoch": 3866} {"train_loss": -6.9942145347595215, "global_step": 162379, "epoch": 3866} {"train_loss": -7.012945652008057, "global_step": 162380, "epoch": 3866} {"train_loss": -6.932712554931641, "global_step": 162381, "epoch": 3866} {"train_loss": -6.992490768432617, "global_step": 162382, "epoch": 3866} {"train_loss": -6.997939109802246, "global_step": 162383, "epoch": 3866} {"train_loss": -6.855219841003418, "global_step": 162384, "epoch": 3866} {"train_loss": -6.888717174530029, "global_step": 162385, "epoch": 3866} {"train_loss": -6.920121192932129, "global_step": 162386, "epoch": 3866} {"train_loss": -7.0326995849609375, "global_step": 162387, "epoch": 3866} {"train_loss": -6.91960334777832, "global_step": 162388, "epoch": 3866} {"train_loss": -6.9222259521484375, "global_step": 162389, "epoch": 3866} {"train_loss": -7.073197364807129, "global_step": 162390, "epoch": 3866} {"train_loss": -7.115516662597656, "global_step": 162391, "epoch": 3866} {"train_loss": -7.114310264587402, "global_step": 162392, "epoch": 3866} {"train_loss": -6.9184064865112305, "global_step": 162393, "epoch": 3866} {"train_loss": -7.001708984375, "global_step": 162394, "epoch": 3866} {"train_loss": -7.080461502075195, "global_step": 162395, "epoch": 3866} {"train_loss": -7.052817344665527, "global_step": 162396, "epoch": 3866} {"train_loss": -6.977838516235352, "global_step": 162397, "epoch": 3866} {"train_loss": -7.046357154846191, "global_step": 162398, "epoch": 3866} {"train_loss": -7.0157928466796875, "global_step": 162399, "epoch": 3866} {"train_loss": -7.048040390014648, "global_step": 162400, "epoch": 3866} {"train_loss": -6.962754249572754, "global_step": 162401, "epoch": 3866} {"train_loss": -6.968793869018555, "global_step": 162402, "epoch": 3866} {"train_loss": -6.969852924346924, "global_step": 162403, "epoch": 3866} {"train_loss": -7.0878376960754395, "global_step": 162404, "epoch": 3866} {"train_loss": -7.012928009033203, "global_step": 162405, "epoch": 3866} {"train_loss": -7.040009021759033, "global_step": 162406, "epoch": 3866} {"train_loss": -7.064576148986816, "global_step": 162407, "epoch": 3866} {"train_loss": -6.987896919250488, "global_step": 162408, "epoch": 3866} {"train_loss": -7.0059919357299805, "global_step": 162409, "epoch": 3866} {"train_loss": -6.947293281555176, "global_step": 162410, "epoch": 3866} {"train_loss": -6.937333106994629, "global_step": 162411, "epoch": 3866} {"train_loss": -6.955204963684082, "global_step": 162412, "epoch": 3866} {"train_loss": -6.98718093690418, "global_step": 162413, "epoch": 3866, "val_loss": 79497.53125} {"train_loss": -7.04378604888916, "global_step": 162414, "epoch": 3867} {"train_loss": -6.9710822105407715, "global_step": 162415, "epoch": 3867} {"train_loss": -7.010369300842285, "global_step": 162416, "epoch": 3867} {"train_loss": -7.071200370788574, "global_step": 162417, "epoch": 3867} {"train_loss": -6.985165596008301, "global_step": 162418, "epoch": 3867} {"train_loss": -6.996218681335449, "global_step": 162419, "epoch": 3867} {"train_loss": -6.986454486846924, "global_step": 162420, "epoch": 3867} {"train_loss": -7.03580904006958, "global_step": 162421, "epoch": 3867} {"train_loss": -6.921721458435059, "global_step": 162422, "epoch": 3867} {"train_loss": -7.030027389526367, "global_step": 162423, "epoch": 3867} {"train_loss": -7.004576206207275, "global_step": 162424, "epoch": 3867} {"train_loss": -6.911015510559082, "global_step": 162425, "epoch": 3867} {"train_loss": -7.141664505004883, "global_step": 162426, "epoch": 3867} {"train_loss": -6.933400630950928, "global_step": 162427, "epoch": 3867} {"train_loss": -6.938282489776611, "global_step": 162428, "epoch": 3867} {"train_loss": -7.081343173980713, "global_step": 162429, "epoch": 3867} {"train_loss": -6.942545413970947, "global_step": 162430, "epoch": 3867} {"train_loss": -6.965219497680664, "global_step": 162431, "epoch": 3867} {"train_loss": -7.111088752746582, "global_step": 162432, "epoch": 3867} {"train_loss": -7.016345024108887, "global_step": 162433, "epoch": 3867} {"train_loss": -6.847139358520508, "global_step": 162434, "epoch": 3867} {"train_loss": -7.057553291320801, "global_step": 162435, "epoch": 3867} {"train_loss": -6.886717319488525, "global_step": 162436, "epoch": 3867} {"train_loss": -6.936890602111816, "global_step": 162437, "epoch": 3867} {"train_loss": -6.980951309204102, "global_step": 162438, "epoch": 3867} {"train_loss": -6.912744998931885, "global_step": 162439, "epoch": 3867} {"train_loss": -6.855678558349609, "global_step": 162440, "epoch": 3867} {"train_loss": -6.862224102020264, "global_step": 162441, "epoch": 3867} {"train_loss": -6.712087631225586, "global_step": 162442, "epoch": 3867} {"train_loss": -6.81732177734375, "global_step": 162443, "epoch": 3867} {"train_loss": -6.949517250061035, "global_step": 162444, "epoch": 3867} {"train_loss": -6.675054550170898, "global_step": 162445, "epoch": 3867} {"train_loss": -6.931424140930176, "global_step": 162446, "epoch": 3867} {"train_loss": -6.834259986877441, "global_step": 162447, "epoch": 3867} {"train_loss": -6.72303581237793, "global_step": 162448, "epoch": 3867} {"train_loss": -6.857202529907227, "global_step": 162449, "epoch": 3867} {"train_loss": -6.691980361938477, "global_step": 162450, "epoch": 3867} {"train_loss": -6.9844560623168945, "global_step": 162451, "epoch": 3867} {"train_loss": -6.728658199310303, "global_step": 162452, "epoch": 3867} {"train_loss": -6.988361358642578, "global_step": 162453, "epoch": 3867} {"train_loss": -6.784176349639893, "global_step": 162454, "epoch": 3867} {"train_loss": -6.929590645290556, "global_step": 162455, "epoch": 3867, "val_loss": 79560.2734375} {"train_loss": -6.873832702636719, "global_step": 162456, "epoch": 3868} {"train_loss": -6.91574239730835, "global_step": 162457, "epoch": 3868} {"train_loss": -6.8155412673950195, "global_step": 162458, "epoch": 3868} {"train_loss": -6.819496154785156, "global_step": 162459, "epoch": 3868} {"train_loss": -6.805869102478027, "global_step": 162460, "epoch": 3868} {"train_loss": -6.910899639129639, "global_step": 162461, "epoch": 3868} {"train_loss": -6.9041748046875, "global_step": 162462, "epoch": 3868} {"train_loss": -6.9276885986328125, "global_step": 162463, "epoch": 3868} {"train_loss": -6.795083999633789, "global_step": 162464, "epoch": 3868} {"train_loss": -6.840597152709961, "global_step": 162465, "epoch": 3868} {"train_loss": -6.916328430175781, "global_step": 162466, "epoch": 3868} {"train_loss": -6.849280834197998, "global_step": 162467, "epoch": 3868} {"train_loss": -6.921200752258301, "global_step": 162468, "epoch": 3868} {"train_loss": -6.784549713134766, "global_step": 162469, "epoch": 3868} {"train_loss": -6.9676971435546875, "global_step": 162470, "epoch": 3868} {"train_loss": -6.961574554443359, "global_step": 162471, "epoch": 3868} {"train_loss": -6.900073051452637, "global_step": 162472, "epoch": 3868} {"train_loss": -6.9015889167785645, "global_step": 162473, "epoch": 3868} {"train_loss": -6.810308933258057, "global_step": 162474, "epoch": 3868} {"train_loss": -6.853216171264648, "global_step": 162475, "epoch": 3868} {"train_loss": -6.845566272735596, "global_step": 162476, "epoch": 3868} {"train_loss": -6.921005725860596, "global_step": 162477, "epoch": 3868} {"train_loss": -6.936394691467285, "global_step": 162478, "epoch": 3868} {"train_loss": -6.863077640533447, "global_step": 162479, "epoch": 3868} {"train_loss": -6.889255523681641, "global_step": 162480, "epoch": 3868} {"train_loss": -6.805500507354736, "global_step": 162481, "epoch": 3868} {"train_loss": -6.896431922912598, "global_step": 162482, "epoch": 3868} {"train_loss": -6.857494354248047, "global_step": 162483, "epoch": 3868} {"train_loss": -6.99700403213501, "global_step": 162484, "epoch": 3868} {"train_loss": -6.992546081542969, "global_step": 162485, "epoch": 3868} {"train_loss": -6.930380821228027, "global_step": 162486, "epoch": 3868} {"train_loss": -7.071952819824219, "global_step": 162487, "epoch": 3868} {"train_loss": -6.986684799194336, "global_step": 162488, "epoch": 3868} {"train_loss": -6.982893943786621, "global_step": 162489, "epoch": 3868} {"train_loss": -6.876837730407715, "global_step": 162490, "epoch": 3868} {"train_loss": -6.953571796417236, "global_step": 162491, "epoch": 3868} {"train_loss": -6.905590057373047, "global_step": 162492, "epoch": 3868} {"train_loss": -6.8767595291137695, "global_step": 162493, "epoch": 3868} {"train_loss": -7.085152626037598, "global_step": 162494, "epoch": 3868} {"train_loss": -6.95681095123291, "global_step": 162495, "epoch": 3868} {"train_loss": -7.116594314575195, "global_step": 162496, "epoch": 3868} {"train_loss": -6.9105657168797086, "global_step": 162497, "epoch": 3868, "val_loss": 79569.5859375} {"train_loss": -7.035589218139648, "global_step": 162498, "epoch": 3869} {"train_loss": -6.979578495025635, "global_step": 162499, "epoch": 3869} {"train_loss": -7.067613124847412, "global_step": 162500, "epoch": 3869} {"train_loss": -7.062026500701904, "global_step": 162501, "epoch": 3869} {"train_loss": -7.002047061920166, "global_step": 162502, "epoch": 3869} {"train_loss": -6.978841781616211, "global_step": 162503, "epoch": 3869} {"train_loss": -7.031354904174805, "global_step": 162504, "epoch": 3869} {"train_loss": -7.062195301055908, "global_step": 162505, "epoch": 3869} {"train_loss": -6.977514266967773, "global_step": 162506, "epoch": 3869} {"train_loss": -7.046702861785889, "global_step": 162507, "epoch": 3869} {"train_loss": -6.861998558044434, "global_step": 162508, "epoch": 3869} {"train_loss": -7.056850433349609, "global_step": 162509, "epoch": 3869} {"train_loss": -7.120532512664795, "global_step": 162510, "epoch": 3869} {"train_loss": -7.032234191894531, "global_step": 162511, "epoch": 3869} {"train_loss": -7.07761287689209, "global_step": 162512, "epoch": 3869} {"train_loss": -6.9952592849731445, "global_step": 162513, "epoch": 3869} {"train_loss": -6.9651007652282715, "global_step": 162514, "epoch": 3869} {"train_loss": -6.95778751373291, "global_step": 162515, "epoch": 3869} {"train_loss": -7.040663719177246, "global_step": 162516, "epoch": 3869} {"train_loss": -6.994256496429443, "global_step": 162517, "epoch": 3869} {"train_loss": -6.963398456573486, "global_step": 162518, "epoch": 3869} {"train_loss": -7.026050567626953, "global_step": 162519, "epoch": 3869} {"train_loss": -6.996660232543945, "global_step": 162520, "epoch": 3869} {"train_loss": -7.1194562911987305, "global_step": 162521, "epoch": 3869} {"train_loss": -7.06809139251709, "global_step": 162522, "epoch": 3869} {"train_loss": -6.9968581199646, "global_step": 162523, "epoch": 3869} {"train_loss": -6.998911380767822, "global_step": 162524, "epoch": 3869} {"train_loss": -6.927107810974121, "global_step": 162525, "epoch": 3869} {"train_loss": -7.061680316925049, "global_step": 162526, "epoch": 3869} {"train_loss": -6.923354148864746, "global_step": 162527, "epoch": 3869} {"train_loss": -6.993797779083252, "global_step": 162528, "epoch": 3869} {"train_loss": -7.06186580657959, "global_step": 162529, "epoch": 3869} {"train_loss": -7.090365886688232, "global_step": 162530, "epoch": 3869} {"train_loss": -6.916414260864258, "global_step": 162531, "epoch": 3869} {"train_loss": -7.074936866760254, "global_step": 162532, "epoch": 3869} {"train_loss": -6.998776435852051, "global_step": 162533, "epoch": 3869} {"train_loss": -7.050472259521484, "global_step": 162534, "epoch": 3869} {"train_loss": -7.1212921142578125, "global_step": 162535, "epoch": 3869} {"train_loss": -6.9014892578125, "global_step": 162536, "epoch": 3869} {"train_loss": -7.028965950012207, "global_step": 162537, "epoch": 3869} {"train_loss": -7.120667457580566, "global_step": 162538, "epoch": 3869} {"train_loss": -7.016886552174886, "global_step": 162539, "epoch": 3869, "val_loss": 79446.453125} {"train_loss": -7.127202987670898, "global_step": 162540, "epoch": 3870} {"train_loss": -7.018701553344727, "global_step": 162541, "epoch": 3870} {"train_loss": -6.962371826171875, "global_step": 162542, "epoch": 3870} {"train_loss": -6.993936538696289, "global_step": 162543, "epoch": 3870} {"train_loss": -7.055345058441162, "global_step": 162544, "epoch": 3870} {"train_loss": -6.835761070251465, "global_step": 162545, "epoch": 3870} {"train_loss": -6.992102146148682, "global_step": 162546, "epoch": 3870} {"train_loss": -6.9667649269104, "global_step": 162547, "epoch": 3870} {"train_loss": -6.868954658508301, "global_step": 162548, "epoch": 3870} {"train_loss": -7.077121734619141, "global_step": 162549, "epoch": 3870} {"train_loss": -6.897796630859375, "global_step": 162550, "epoch": 3870} {"train_loss": -6.883033752441406, "global_step": 162551, "epoch": 3870} {"train_loss": -7.05828332901001, "global_step": 162552, "epoch": 3870} {"train_loss": -6.869123458862305, "global_step": 162553, "epoch": 3870} {"train_loss": -7.060680866241455, "global_step": 162554, "epoch": 3870} {"train_loss": -6.890689849853516, "global_step": 162555, "epoch": 3870} {"train_loss": -6.889288902282715, "global_step": 162556, "epoch": 3870} {"train_loss": -6.98672342300415, "global_step": 162557, "epoch": 3870} {"train_loss": -6.849255084991455, "global_step": 162558, "epoch": 3870} {"train_loss": -6.94559907913208, "global_step": 162559, "epoch": 3870} {"train_loss": -6.919838905334473, "global_step": 162560, "epoch": 3870} {"train_loss": -6.881537914276123, "global_step": 162561, "epoch": 3870} {"train_loss": -6.927556037902832, "global_step": 162562, "epoch": 3870} {"train_loss": -6.991164207458496, "global_step": 162563, "epoch": 3870} {"train_loss": -6.916509628295898, "global_step": 162564, "epoch": 3870} {"train_loss": -6.968106269836426, "global_step": 162565, "epoch": 3870} {"train_loss": -6.946883678436279, "global_step": 162566, "epoch": 3870} {"train_loss": -6.99463415145874, "global_step": 162567, "epoch": 3870} {"train_loss": -7.002072334289551, "global_step": 162568, "epoch": 3870} {"train_loss": -7.026433944702148, "global_step": 162569, "epoch": 3870} {"train_loss": -6.8900299072265625, "global_step": 162570, "epoch": 3870} {"train_loss": -7.03543758392334, "global_step": 162571, "epoch": 3870} {"train_loss": -6.958242416381836, "global_step": 162572, "epoch": 3870} {"train_loss": -6.987213134765625, "global_step": 162573, "epoch": 3870} {"train_loss": -7.022150993347168, "global_step": 162574, "epoch": 3870} {"train_loss": -6.936853408813477, "global_step": 162575, "epoch": 3870} {"train_loss": -7.008645057678223, "global_step": 162576, "epoch": 3870} {"train_loss": -7.016805648803711, "global_step": 162577, "epoch": 3870} {"train_loss": -7.25907564163208, "global_step": 162578, "epoch": 3870} {"train_loss": -7.003262519836426, "global_step": 162579, "epoch": 3870} {"train_loss": -7.022201061248779, "global_step": 162580, "epoch": 3870} {"train_loss": -6.975628648485456, "global_step": 162581, "epoch": 3870, "val_loss": 79390.578125} {"train_loss": -6.980792045593262, "global_step": 162582, "epoch": 3871} {"train_loss": -6.969574928283691, "global_step": 162583, "epoch": 3871} {"train_loss": -7.086205005645752, "global_step": 162584, "epoch": 3871} {"train_loss": -7.072935104370117, "global_step": 162585, "epoch": 3871} {"train_loss": -7.0107622146606445, "global_step": 162586, "epoch": 3871} {"train_loss": -7.0247673988342285, "global_step": 162587, "epoch": 3871} {"train_loss": -6.901852607727051, "global_step": 162588, "epoch": 3871} {"train_loss": -7.096145153045654, "global_step": 162589, "epoch": 3871} {"train_loss": -6.989402770996094, "global_step": 162590, "epoch": 3871} {"train_loss": -6.993393898010254, "global_step": 162591, "epoch": 3871} {"train_loss": -6.935122489929199, "global_step": 162592, "epoch": 3871} {"train_loss": -7.089057922363281, "global_step": 162593, "epoch": 3871} {"train_loss": -7.002029895782471, "global_step": 162594, "epoch": 3871} {"train_loss": -6.930431365966797, "global_step": 162595, "epoch": 3871} {"train_loss": -6.923041820526123, "global_step": 162596, "epoch": 3871} {"train_loss": -6.965095520019531, "global_step": 162597, "epoch": 3871} {"train_loss": -6.9627156257629395, "global_step": 162598, "epoch": 3871} {"train_loss": -7.032195091247559, "global_step": 162599, "epoch": 3871} {"train_loss": -6.972078323364258, "global_step": 162600, "epoch": 3871} {"train_loss": -6.879398345947266, "global_step": 162601, "epoch": 3871} {"train_loss": -7.042990207672119, "global_step": 162602, "epoch": 3871} {"train_loss": -7.116452693939209, "global_step": 162603, "epoch": 3871} {"train_loss": -6.9311065673828125, "global_step": 162604, "epoch": 3871} {"train_loss": -6.948004245758057, "global_step": 162605, "epoch": 3871} {"train_loss": -7.052629470825195, "global_step": 162606, "epoch": 3871} {"train_loss": -7.015255451202393, "global_step": 162607, "epoch": 3871} {"train_loss": -6.997523307800293, "global_step": 162608, "epoch": 3871} {"train_loss": -6.986074447631836, "global_step": 162609, "epoch": 3871} {"train_loss": -7.027281761169434, "global_step": 162610, "epoch": 3871} {"train_loss": -7.082895278930664, "global_step": 162611, "epoch": 3871} {"train_loss": -6.947173118591309, "global_step": 162612, "epoch": 3871} {"train_loss": -7.0080156326293945, "global_step": 162613, "epoch": 3871} {"train_loss": -6.94716739654541, "global_step": 162614, "epoch": 3871} {"train_loss": -6.995271682739258, "global_step": 162615, "epoch": 3871} {"train_loss": -6.969799995422363, "global_step": 162616, "epoch": 3871} {"train_loss": -6.991243362426758, "global_step": 162617, "epoch": 3871} {"train_loss": -7.009123802185059, "global_step": 162618, "epoch": 3871} {"train_loss": -7.044867515563965, "global_step": 162619, "epoch": 3871} {"train_loss": -6.951265811920166, "global_step": 162620, "epoch": 3871} {"train_loss": -6.966315269470215, "global_step": 162621, "epoch": 3871} {"train_loss": -6.980005264282227, "global_step": 162622, "epoch": 3871} {"train_loss": -6.998088575544811, "global_step": 162623, "epoch": 3871, "val_loss": 79573.421875} {"train_loss": -7.0258073806762695, "global_step": 162624, "epoch": 3872} {"train_loss": -7.077602863311768, "global_step": 162625, "epoch": 3872} {"train_loss": -7.084438323974609, "global_step": 162626, "epoch": 3872} {"train_loss": -7.010871887207031, "global_step": 162627, "epoch": 3872} {"train_loss": -6.95987606048584, "global_step": 162628, "epoch": 3872} {"train_loss": -7.0476908683776855, "global_step": 162629, "epoch": 3872} {"train_loss": -6.915875434875488, "global_step": 162630, "epoch": 3872} {"train_loss": -6.75166654586792, "global_step": 162631, "epoch": 3872} {"train_loss": -6.999215126037598, "global_step": 162632, "epoch": 3872} {"train_loss": -6.98744010925293, "global_step": 162633, "epoch": 3872} {"train_loss": -6.88137149810791, "global_step": 162634, "epoch": 3872} {"train_loss": -7.053907871246338, "global_step": 162635, "epoch": 3872} {"train_loss": -6.994314193725586, "global_step": 162636, "epoch": 3872} {"train_loss": -6.977664470672607, "global_step": 162637, "epoch": 3872} {"train_loss": -7.027835845947266, "global_step": 162638, "epoch": 3872} {"train_loss": -6.957287311553955, "global_step": 162639, "epoch": 3872} {"train_loss": -6.8959245681762695, "global_step": 162640, "epoch": 3872} {"train_loss": -6.903354167938232, "global_step": 162641, "epoch": 3872} {"train_loss": -6.988373756408691, "global_step": 162642, "epoch": 3872} {"train_loss": -7.029393196105957, "global_step": 162643, "epoch": 3872} {"train_loss": -6.974949836730957, "global_step": 162644, "epoch": 3872} {"train_loss": -7.017306804656982, "global_step": 162645, "epoch": 3872} {"train_loss": -6.896191596984863, "global_step": 162646, "epoch": 3872} {"train_loss": -6.950441837310791, "global_step": 162647, "epoch": 3872} {"train_loss": -7.061028003692627, "global_step": 162648, "epoch": 3872} {"train_loss": -7.0111470222473145, "global_step": 162649, "epoch": 3872} {"train_loss": -6.997062683105469, "global_step": 162650, "epoch": 3872} {"train_loss": -7.010551452636719, "global_step": 162651, "epoch": 3872} {"train_loss": -7.0414581298828125, "global_step": 162652, "epoch": 3872} {"train_loss": -6.95896577835083, "global_step": 162653, "epoch": 3872} {"train_loss": -6.916158676147461, "global_step": 162654, "epoch": 3872} {"train_loss": -6.821173667907715, "global_step": 162655, "epoch": 3872} {"train_loss": -6.726601600646973, "global_step": 162656, "epoch": 3872} {"train_loss": -7.111528396606445, "global_step": 162657, "epoch": 3872} {"train_loss": -6.962888717651367, "global_step": 162658, "epoch": 3872} {"train_loss": -6.828945159912109, "global_step": 162659, "epoch": 3872} {"train_loss": -6.949810028076172, "global_step": 162660, "epoch": 3872} {"train_loss": -6.906729698181152, "global_step": 162661, "epoch": 3872} {"train_loss": -6.7726640701293945, "global_step": 162662, "epoch": 3872} {"train_loss": -6.9421281814575195, "global_step": 162663, "epoch": 3872} {"train_loss": -6.920537948608398, "global_step": 162664, "epoch": 3872} {"train_loss": -6.961251974105835, "global_step": 162665, "epoch": 3872, "val_loss": 79298.7578125} {"train_loss": -6.9826202392578125, "global_step": 162666, "epoch": 3873} {"train_loss": -6.966879844665527, "global_step": 162667, "epoch": 3873} {"train_loss": -6.955211639404297, "global_step": 162668, "epoch": 3873} {"train_loss": -7.044057369232178, "global_step": 162669, "epoch": 3873} {"train_loss": -7.008339881896973, "global_step": 162670, "epoch": 3873} {"train_loss": -6.8481950759887695, "global_step": 162671, "epoch": 3873} {"train_loss": -6.965859889984131, "global_step": 162672, "epoch": 3873} {"train_loss": -7.019763469696045, "global_step": 162673, "epoch": 3873} {"train_loss": -7.063289642333984, "global_step": 162674, "epoch": 3873} {"train_loss": -7.023221015930176, "global_step": 162675, "epoch": 3873} {"train_loss": -7.152327537536621, "global_step": 162676, "epoch": 3873} {"train_loss": -7.020617485046387, "global_step": 162677, "epoch": 3873} {"train_loss": -6.871317386627197, "global_step": 162678, "epoch": 3873} {"train_loss": -6.831080436706543, "global_step": 162679, "epoch": 3873} {"train_loss": -7.019312381744385, "global_step": 162680, "epoch": 3873} {"train_loss": -6.891866683959961, "global_step": 162681, "epoch": 3873} {"train_loss": -7.014509201049805, "global_step": 162682, "epoch": 3873} {"train_loss": -6.847503662109375, "global_step": 162683, "epoch": 3873} {"train_loss": -6.835760593414307, "global_step": 162684, "epoch": 3873} {"train_loss": -6.966217994689941, "global_step": 162685, "epoch": 3873} {"train_loss": -7.039054870605469, "global_step": 162686, "epoch": 3873} {"train_loss": -6.949193954467773, "global_step": 162687, "epoch": 3873} {"train_loss": -6.970523357391357, "global_step": 162688, "epoch": 3873} {"train_loss": -7.042160511016846, "global_step": 162689, "epoch": 3873} {"train_loss": -7.002630710601807, "global_step": 162690, "epoch": 3873} {"train_loss": -6.888706207275391, "global_step": 162691, "epoch": 3873} {"train_loss": -7.044606685638428, "global_step": 162692, "epoch": 3873} {"train_loss": -6.879841327667236, "global_step": 162693, "epoch": 3873} {"train_loss": -7.044793605804443, "global_step": 162694, "epoch": 3873} {"train_loss": -7.02193021774292, "global_step": 162695, "epoch": 3873} {"train_loss": -6.946223258972168, "global_step": 162696, "epoch": 3873} {"train_loss": -6.861790657043457, "global_step": 162697, "epoch": 3873} {"train_loss": -6.943137168884277, "global_step": 162698, "epoch": 3873} {"train_loss": -6.867425918579102, "global_step": 162699, "epoch": 3873} {"train_loss": -7.004231929779053, "global_step": 162700, "epoch": 3873} {"train_loss": -6.896859169006348, "global_step": 162701, "epoch": 3873} {"train_loss": -6.928084373474121, "global_step": 162702, "epoch": 3873} {"train_loss": -6.878626823425293, "global_step": 162703, "epoch": 3873} {"train_loss": -6.997944355010986, "global_step": 162704, "epoch": 3873} {"train_loss": -7.062837600708008, "global_step": 162705, "epoch": 3873} {"train_loss": -7.070060729980469, "global_step": 162706, "epoch": 3873} {"train_loss": -6.969794591267903, "global_step": 162707, "epoch": 3873, "val_loss": 79449.1640625} {"train_loss": -6.9915032386779785, "global_step": 162708, "epoch": 3874} {"train_loss": -7.089792251586914, "global_step": 162709, "epoch": 3874} {"train_loss": -6.917200088500977, "global_step": 162710, "epoch": 3874} {"train_loss": -7.02138614654541, "global_step": 162711, "epoch": 3874} {"train_loss": -7.066692352294922, "global_step": 162712, "epoch": 3874} {"train_loss": -7.002497673034668, "global_step": 162713, "epoch": 3874} {"train_loss": -6.927700996398926, "global_step": 162714, "epoch": 3874} {"train_loss": -7.052037239074707, "global_step": 162715, "epoch": 3874} {"train_loss": -7.036212921142578, "global_step": 162716, "epoch": 3874} {"train_loss": -7.052950859069824, "global_step": 162717, "epoch": 3874} {"train_loss": -6.978898048400879, "global_step": 162718, "epoch": 3874} {"train_loss": -7.013007164001465, "global_step": 162719, "epoch": 3874} {"train_loss": -7.047220230102539, "global_step": 162720, "epoch": 3874} {"train_loss": -6.8730902671813965, "global_step": 162721, "epoch": 3874} {"train_loss": -6.990329742431641, "global_step": 162722, "epoch": 3874} {"train_loss": -7.0028886795043945, "global_step": 162723, "epoch": 3874} {"train_loss": -7.088632583618164, "global_step": 162724, "epoch": 3874} {"train_loss": -7.013766288757324, "global_step": 162725, "epoch": 3874} {"train_loss": -7.003002643585205, "global_step": 162726, "epoch": 3874} {"train_loss": -6.971275806427002, "global_step": 162727, "epoch": 3874} {"train_loss": -7.025822639465332, "global_step": 162728, "epoch": 3874} {"train_loss": -6.749119281768799, "global_step": 162729, "epoch": 3874} {"train_loss": -6.9566121101379395, "global_step": 162730, "epoch": 3874} {"train_loss": -6.937701225280762, "global_step": 162731, "epoch": 3874} {"train_loss": -6.872005939483643, "global_step": 162732, "epoch": 3874} {"train_loss": -7.030231952667236, "global_step": 162733, "epoch": 3874} {"train_loss": -6.915609359741211, "global_step": 162734, "epoch": 3874} {"train_loss": -7.0071210861206055, "global_step": 162735, "epoch": 3874} {"train_loss": -7.089344501495361, "global_step": 162736, "epoch": 3874} {"train_loss": -7.064507007598877, "global_step": 162737, "epoch": 3874} {"train_loss": -7.04296875, "global_step": 162738, "epoch": 3874} {"train_loss": -7.008950233459473, "global_step": 162739, "epoch": 3874} {"train_loss": -6.943830490112305, "global_step": 162740, "epoch": 3874} {"train_loss": -7.002803802490234, "global_step": 162741, "epoch": 3874} {"train_loss": -6.970308303833008, "global_step": 162742, "epoch": 3874} {"train_loss": -7.010325908660889, "global_step": 162743, "epoch": 3874} {"train_loss": -7.015886306762695, "global_step": 162744, "epoch": 3874} {"train_loss": -6.91811466217041, "global_step": 162745, "epoch": 3874} {"train_loss": -7.029231071472168, "global_step": 162746, "epoch": 3874} {"train_loss": -6.954903602600098, "global_step": 162747, "epoch": 3874} {"train_loss": -7.025405406951904, "global_step": 162748, "epoch": 3874} {"train_loss": -6.992394254321144, "global_step": 162749, "epoch": 3874, "val_loss": 79423.7109375} {"train_loss": -6.922957420349121, "global_step": 162750, "epoch": 3875} {"train_loss": -6.969172477722168, "global_step": 162751, "epoch": 3875} {"train_loss": -6.952578544616699, "global_step": 162752, "epoch": 3875} {"train_loss": -7.000417232513428, "global_step": 162753, "epoch": 3875} {"train_loss": -7.010623455047607, "global_step": 162754, "epoch": 3875} {"train_loss": -7.022764682769775, "global_step": 162755, "epoch": 3875} {"train_loss": -7.160231590270996, "global_step": 162756, "epoch": 3875} {"train_loss": -7.015141010284424, "global_step": 162757, "epoch": 3875} {"train_loss": -6.999194622039795, "global_step": 162758, "epoch": 3875} {"train_loss": -7.044604778289795, "global_step": 162759, "epoch": 3875} {"train_loss": -7.0039167404174805, "global_step": 162760, "epoch": 3875} {"train_loss": -6.977270126342773, "global_step": 162761, "epoch": 3875} {"train_loss": -6.930492401123047, "global_step": 162762, "epoch": 3875} {"train_loss": -6.892411231994629, "global_step": 162763, "epoch": 3875} {"train_loss": -7.0655622482299805, "global_step": 162764, "epoch": 3875} {"train_loss": -6.860035419464111, "global_step": 162765, "epoch": 3875} {"train_loss": -6.939512252807617, "global_step": 162766, "epoch": 3875} {"train_loss": -7.134372234344482, "global_step": 162767, "epoch": 3875} {"train_loss": -6.928655624389648, "global_step": 162768, "epoch": 3875} {"train_loss": -7.00852632522583, "global_step": 162769, "epoch": 3875} {"train_loss": -6.909877777099609, "global_step": 162770, "epoch": 3875} {"train_loss": -7.071815490722656, "global_step": 162771, "epoch": 3875} {"train_loss": -6.970247268676758, "global_step": 162772, "epoch": 3875} {"train_loss": -7.008852481842041, "global_step": 162773, "epoch": 3875} {"train_loss": -7.0501813888549805, "global_step": 162774, "epoch": 3875} {"train_loss": -6.975808143615723, "global_step": 162775, "epoch": 3875} {"train_loss": -6.969268321990967, "global_step": 162776, "epoch": 3875} {"train_loss": -7.036792755126953, "global_step": 162777, "epoch": 3875} {"train_loss": -6.986244201660156, "global_step": 162778, "epoch": 3875} {"train_loss": -7.1405229568481445, "global_step": 162779, "epoch": 3875} {"train_loss": -7.044551849365234, "global_step": 162780, "epoch": 3875} {"train_loss": -6.969552993774414, "global_step": 162781, "epoch": 3875} {"train_loss": -7.056334495544434, "global_step": 162782, "epoch": 3875} {"train_loss": -7.031259536743164, "global_step": 162783, "epoch": 3875} {"train_loss": -7.051971912384033, "global_step": 162784, "epoch": 3875} {"train_loss": -7.032537460327148, "global_step": 162785, "epoch": 3875} {"train_loss": -6.948014736175537, "global_step": 162786, "epoch": 3875} {"train_loss": -6.953669548034668, "global_step": 162787, "epoch": 3875} {"train_loss": -7.0098876953125, "global_step": 162788, "epoch": 3875} {"train_loss": -7.015924453735352, "global_step": 162789, "epoch": 3875} {"train_loss": -6.884576797485352, "global_step": 162790, "epoch": 3875} {"train_loss": -6.997639213289533, "global_step": 162791, "epoch": 3875, "val_loss": 79500.9375} {"train_loss": -6.911062717437744, "global_step": 162792, "epoch": 3876} {"train_loss": -6.827107906341553, "global_step": 162793, "epoch": 3876} {"train_loss": -6.977974891662598, "global_step": 162794, "epoch": 3876} {"train_loss": -6.8677754402160645, "global_step": 162795, "epoch": 3876} {"train_loss": -6.693999290466309, "global_step": 162796, "epoch": 3876} {"train_loss": -6.957921504974365, "global_step": 162797, "epoch": 3876} {"train_loss": -6.695427417755127, "global_step": 162798, "epoch": 3876} {"train_loss": -6.940251350402832, "global_step": 162799, "epoch": 3876} {"train_loss": -7.010831832885742, "global_step": 162800, "epoch": 3876} {"train_loss": -6.802244663238525, "global_step": 162801, "epoch": 3876} {"train_loss": -7.061169147491455, "global_step": 162802, "epoch": 3876} {"train_loss": -6.826196670532227, "global_step": 162803, "epoch": 3876} {"train_loss": -6.995607852935791, "global_step": 162804, "epoch": 3876} {"train_loss": -6.855879783630371, "global_step": 162805, "epoch": 3876} {"train_loss": -6.952390670776367, "global_step": 162806, "epoch": 3876} {"train_loss": -6.954705238342285, "global_step": 162807, "epoch": 3876} {"train_loss": -7.0614142417907715, "global_step": 162808, "epoch": 3876} {"train_loss": -7.027838706970215, "global_step": 162809, "epoch": 3876} {"train_loss": -7.06780481338501, "global_step": 162810, "epoch": 3876} {"train_loss": -7.011703014373779, "global_step": 162811, "epoch": 3876} {"train_loss": -6.996122360229492, "global_step": 162812, "epoch": 3876} {"train_loss": -6.992931842803955, "global_step": 162813, "epoch": 3876} {"train_loss": -7.064748287200928, "global_step": 162814, "epoch": 3876} {"train_loss": -6.920036315917969, "global_step": 162815, "epoch": 3876} {"train_loss": -7.0037946701049805, "global_step": 162816, "epoch": 3876} {"train_loss": -7.0155744552612305, "global_step": 162817, "epoch": 3876} {"train_loss": -6.958793640136719, "global_step": 162818, "epoch": 3876} {"train_loss": -6.947187900543213, "global_step": 162819, "epoch": 3876} {"train_loss": -7.0165863037109375, "global_step": 162820, "epoch": 3876} {"train_loss": -7.071335792541504, "global_step": 162821, "epoch": 3876} {"train_loss": -7.040345191955566, "global_step": 162822, "epoch": 3876} {"train_loss": -7.069940567016602, "global_step": 162823, "epoch": 3876} {"train_loss": -7.081110954284668, "global_step": 162824, "epoch": 3876} {"train_loss": -7.049127101898193, "global_step": 162825, "epoch": 3876} {"train_loss": -6.999658584594727, "global_step": 162826, "epoch": 3876} {"train_loss": -6.912386894226074, "global_step": 162827, "epoch": 3876} {"train_loss": -6.991213798522949, "global_step": 162828, "epoch": 3876} {"train_loss": -7.03779411315918, "global_step": 162829, "epoch": 3876} {"train_loss": -6.949804782867432, "global_step": 162830, "epoch": 3876} {"train_loss": -7.086870193481445, "global_step": 162831, "epoch": 3876} {"train_loss": -7.150883674621582, "global_step": 162832, "epoch": 3876} {"train_loss": -6.973431019555955, "global_step": 162833, "epoch": 3876, "val_loss": 79425.7578125} {"train_loss": -7.011552333831787, "global_step": 162834, "epoch": 3877} {"train_loss": -6.964957237243652, "global_step": 162835, "epoch": 3877} {"train_loss": -7.054695129394531, "global_step": 162836, "epoch": 3877} {"train_loss": -6.859461307525635, "global_step": 162837, "epoch": 3877} {"train_loss": -7.057915687561035, "global_step": 162838, "epoch": 3877} {"train_loss": -7.016804218292236, "global_step": 162839, "epoch": 3877} {"train_loss": -6.996567726135254, "global_step": 162840, "epoch": 3877} {"train_loss": -7.024259090423584, "global_step": 162841, "epoch": 3877} {"train_loss": -7.137779712677002, "global_step": 162842, "epoch": 3877} {"train_loss": -6.924920082092285, "global_step": 162843, "epoch": 3877} {"train_loss": -6.9827494621276855, "global_step": 162844, "epoch": 3877} {"train_loss": -7.042715072631836, "global_step": 162845, "epoch": 3877} {"train_loss": -7.0701751708984375, "global_step": 162846, "epoch": 3877} {"train_loss": -7.0712738037109375, "global_step": 162847, "epoch": 3877} {"train_loss": -7.08100700378418, "global_step": 162848, "epoch": 3877} {"train_loss": -7.017876148223877, "global_step": 162849, "epoch": 3877} {"train_loss": -7.021667957305908, "global_step": 162850, "epoch": 3877} {"train_loss": -6.976868629455566, "global_step": 162851, "epoch": 3877} {"train_loss": -7.072163105010986, "global_step": 162852, "epoch": 3877} {"train_loss": -7.055253028869629, "global_step": 162853, "epoch": 3877} {"train_loss": -7.017880439758301, "global_step": 162854, "epoch": 3877} {"train_loss": -6.967525482177734, "global_step": 162855, "epoch": 3877} {"train_loss": -6.9659423828125, "global_step": 162856, "epoch": 3877} {"train_loss": -6.937376022338867, "global_step": 162857, "epoch": 3877} {"train_loss": -6.889456748962402, "global_step": 162858, "epoch": 3877} {"train_loss": -6.90304708480835, "global_step": 162859, "epoch": 3877} {"train_loss": -7.044577121734619, "global_step": 162860, "epoch": 3877} {"train_loss": -7.048983097076416, "global_step": 162861, "epoch": 3877} {"train_loss": -6.998495101928711, "global_step": 162862, "epoch": 3877} {"train_loss": -7.035154819488525, "global_step": 162863, "epoch": 3877} {"train_loss": -7.082638740539551, "global_step": 162864, "epoch": 3877} {"train_loss": -6.912134170532227, "global_step": 162865, "epoch": 3877} {"train_loss": -6.904780864715576, "global_step": 162866, "epoch": 3877} {"train_loss": -6.894564628601074, "global_step": 162867, "epoch": 3877} {"train_loss": -6.908801078796387, "global_step": 162868, "epoch": 3877} {"train_loss": -6.9488325119018555, "global_step": 162869, "epoch": 3877} {"train_loss": -6.939356803894043, "global_step": 162870, "epoch": 3877} {"train_loss": -7.017653942108154, "global_step": 162871, "epoch": 3877} {"train_loss": -7.021631717681885, "global_step": 162872, "epoch": 3877} {"train_loss": -7.076117515563965, "global_step": 162873, "epoch": 3877} {"train_loss": -7.048318862915039, "global_step": 162874, "epoch": 3877} {"train_loss": -6.9997534184228805, "global_step": 162875, "epoch": 3877, "val_loss": 79361.6875} {"train_loss": -6.976688385009766, "global_step": 162876, "epoch": 3878} {"train_loss": -6.9765777587890625, "global_step": 162877, "epoch": 3878} {"train_loss": -7.13694953918457, "global_step": 162878, "epoch": 3878} {"train_loss": -7.014763832092285, "global_step": 162879, "epoch": 3878} {"train_loss": -6.987598419189453, "global_step": 162880, "epoch": 3878} {"train_loss": -6.986026763916016, "global_step": 162881, "epoch": 3878} {"train_loss": -6.934953689575195, "global_step": 162882, "epoch": 3878} {"train_loss": -6.986568450927734, "global_step": 162883, "epoch": 3878} {"train_loss": -6.947170734405518, "global_step": 162884, "epoch": 3878} {"train_loss": -7.014892578125, "global_step": 162885, "epoch": 3878} {"train_loss": -6.931758880615234, "global_step": 162886, "epoch": 3878} {"train_loss": -6.9952392578125, "global_step": 162887, "epoch": 3878} {"train_loss": -6.8904876708984375, "global_step": 162888, "epoch": 3878} {"train_loss": -6.957736015319824, "global_step": 162889, "epoch": 3878} {"train_loss": -7.051581382751465, "global_step": 162890, "epoch": 3878} {"train_loss": -6.944253921508789, "global_step": 162891, "epoch": 3878} {"train_loss": -6.997535705566406, "global_step": 162892, "epoch": 3878} {"train_loss": -6.870227813720703, "global_step": 162893, "epoch": 3878} {"train_loss": -6.927145481109619, "global_step": 162894, "epoch": 3878} {"train_loss": -6.978082656860352, "global_step": 162895, "epoch": 3878} {"train_loss": -7.030498504638672, "global_step": 162896, "epoch": 3878} {"train_loss": -6.915534496307373, "global_step": 162897, "epoch": 3878} {"train_loss": -7.0343217849731445, "global_step": 162898, "epoch": 3878} {"train_loss": -6.995101451873779, "global_step": 162899, "epoch": 3878} {"train_loss": -7.055329322814941, "global_step": 162900, "epoch": 3878} {"train_loss": -6.981032371520996, "global_step": 162901, "epoch": 3878} {"train_loss": -6.996095657348633, "global_step": 162902, "epoch": 3878} {"train_loss": -7.069917678833008, "global_step": 162903, "epoch": 3878} {"train_loss": -6.854251861572266, "global_step": 162904, "epoch": 3878} {"train_loss": -6.997574806213379, "global_step": 162905, "epoch": 3878} {"train_loss": -6.951870918273926, "global_step": 162906, "epoch": 3878} {"train_loss": -7.062535762786865, "global_step": 162907, "epoch": 3878} {"train_loss": -7.013873100280762, "global_step": 162908, "epoch": 3878} {"train_loss": -7.065834045410156, "global_step": 162909, "epoch": 3878} {"train_loss": -7.027886867523193, "global_step": 162910, "epoch": 3878} {"train_loss": -6.874295234680176, "global_step": 162911, "epoch": 3878} {"train_loss": -7.025263786315918, "global_step": 162912, "epoch": 3878} {"train_loss": -7.096530437469482, "global_step": 162913, "epoch": 3878} {"train_loss": -6.885217189788818, "global_step": 162914, "epoch": 3878} {"train_loss": -7.033671855926514, "global_step": 162915, "epoch": 3878} {"train_loss": -7.073718547821045, "global_step": 162916, "epoch": 3878} {"train_loss": -6.987831274668376, "global_step": 162917, "epoch": 3878, "val_loss": 79404.953125} {"train_loss": -7.130894660949707, "global_step": 162918, "epoch": 3879} {"train_loss": -6.977707386016846, "global_step": 162919, "epoch": 3879} {"train_loss": -6.990529537200928, "global_step": 162920, "epoch": 3879} {"train_loss": -7.105232238769531, "global_step": 162921, "epoch": 3879} {"train_loss": -7.073531150817871, "global_step": 162922, "epoch": 3879} {"train_loss": -6.972146987915039, "global_step": 162923, "epoch": 3879} {"train_loss": -7.112922668457031, "global_step": 162924, "epoch": 3879} {"train_loss": -6.909555435180664, "global_step": 162925, "epoch": 3879} {"train_loss": -6.984213829040527, "global_step": 162926, "epoch": 3879} {"train_loss": -6.93223237991333, "global_step": 162927, "epoch": 3879} {"train_loss": -7.017890930175781, "global_step": 162928, "epoch": 3879} {"train_loss": -7.006186485290527, "global_step": 162929, "epoch": 3879} {"train_loss": -6.951395034790039, "global_step": 162930, "epoch": 3879} {"train_loss": -7.05975866317749, "global_step": 162931, "epoch": 3879} {"train_loss": -6.921624183654785, "global_step": 162932, "epoch": 3879} {"train_loss": -6.966031551361084, "global_step": 162933, "epoch": 3879} {"train_loss": -6.982928276062012, "global_step": 162934, "epoch": 3879} {"train_loss": -7.124145984649658, "global_step": 162935, "epoch": 3879} {"train_loss": -7.073339462280273, "global_step": 162936, "epoch": 3879} {"train_loss": -7.044669151306152, "global_step": 162937, "epoch": 3879} {"train_loss": -6.944070816040039, "global_step": 162938, "epoch": 3879} {"train_loss": -7.008395195007324, "global_step": 162939, "epoch": 3879} {"train_loss": -6.986335754394531, "global_step": 162940, "epoch": 3879} {"train_loss": -7.011034965515137, "global_step": 162941, "epoch": 3879} {"train_loss": -7.075813293457031, "global_step": 162942, "epoch": 3879} {"train_loss": -7.095538139343262, "global_step": 162943, "epoch": 3879} {"train_loss": -7.0439958572387695, "global_step": 162944, "epoch": 3879} {"train_loss": -7.027885437011719, "global_step": 162945, "epoch": 3879} {"train_loss": -6.976180553436279, "global_step": 162946, "epoch": 3879} {"train_loss": -6.933728218078613, "global_step": 162947, "epoch": 3879} {"train_loss": -6.863234519958496, "global_step": 162948, "epoch": 3879} {"train_loss": -6.959656238555908, "global_step": 162949, "epoch": 3879} {"train_loss": -6.926399230957031, "global_step": 162950, "epoch": 3879} {"train_loss": -6.919399261474609, "global_step": 162951, "epoch": 3879} {"train_loss": -6.9573073387146, "global_step": 162952, "epoch": 3879} {"train_loss": -6.884922027587891, "global_step": 162953, "epoch": 3879} {"train_loss": -7.038071155548096, "global_step": 162954, "epoch": 3879} {"train_loss": -6.947779655456543, "global_step": 162955, "epoch": 3879} {"train_loss": -6.8797407150268555, "global_step": 162956, "epoch": 3879} {"train_loss": -6.947031497955322, "global_step": 162957, "epoch": 3879} {"train_loss": -6.946537494659424, "global_step": 162958, "epoch": 3879} {"train_loss": -6.992156108220418, "global_step": 162959, "epoch": 3879, "val_loss": 79371.4140625} {"train_loss": -7.041930198669434, "global_step": 162960, "epoch": 3880} {"train_loss": -6.787942886352539, "global_step": 162961, "epoch": 3880} {"train_loss": -6.700471878051758, "global_step": 162962, "epoch": 3880} {"train_loss": -7.05802583694458, "global_step": 162963, "epoch": 3880} {"train_loss": -7.018546104431152, "global_step": 162964, "epoch": 3880} {"train_loss": -7.036957263946533, "global_step": 162965, "epoch": 3880} {"train_loss": -7.073725700378418, "global_step": 162966, "epoch": 3880} {"train_loss": -7.004049301147461, "global_step": 162967, "epoch": 3880} {"train_loss": -6.882630348205566, "global_step": 162968, "epoch": 3880} {"train_loss": -6.919361114501953, "global_step": 162969, "epoch": 3880} {"train_loss": -7.0685834884643555, "global_step": 162970, "epoch": 3880} {"train_loss": -6.9449920654296875, "global_step": 162971, "epoch": 3880} {"train_loss": -6.899770736694336, "global_step": 162972, "epoch": 3880} {"train_loss": -6.8797607421875, "global_step": 162973, "epoch": 3880} {"train_loss": -6.893097877502441, "global_step": 162974, "epoch": 3880} {"train_loss": -6.953216552734375, "global_step": 162975, "epoch": 3880} {"train_loss": -6.927290916442871, "global_step": 162976, "epoch": 3880} {"train_loss": -6.987380504608154, "global_step": 162977, "epoch": 3880} {"train_loss": -6.9915032386779785, "global_step": 162978, "epoch": 3880} {"train_loss": -6.914958477020264, "global_step": 162979, "epoch": 3880} {"train_loss": -6.874147415161133, "global_step": 162980, "epoch": 3880} {"train_loss": -7.045297145843506, "global_step": 162981, "epoch": 3880} {"train_loss": -6.967962741851807, "global_step": 162982, "epoch": 3880} {"train_loss": -7.039560794830322, "global_step": 162983, "epoch": 3880} {"train_loss": -6.967663764953613, "global_step": 162984, "epoch": 3880} {"train_loss": -7.031210899353027, "global_step": 162985, "epoch": 3880} {"train_loss": -6.935298919677734, "global_step": 162986, "epoch": 3880} {"train_loss": -7.020207405090332, "global_step": 162987, "epoch": 3880} {"train_loss": -7.0003886222839355, "global_step": 162988, "epoch": 3880} {"train_loss": -7.10189151763916, "global_step": 162989, "epoch": 3880} {"train_loss": -6.9855756759643555, "global_step": 162990, "epoch": 3880} {"train_loss": -6.904898643493652, "global_step": 162991, "epoch": 3880} {"train_loss": -7.0288238525390625, "global_step": 162992, "epoch": 3880} {"train_loss": -7.046788692474365, "global_step": 162993, "epoch": 3880} {"train_loss": -7.048644065856934, "global_step": 162994, "epoch": 3880} {"train_loss": -7.080338478088379, "global_step": 162995, "epoch": 3880} {"train_loss": -7.11079216003418, "global_step": 162996, "epoch": 3880} {"train_loss": -6.99825382232666, "global_step": 162997, "epoch": 3880} {"train_loss": -6.942712783813477, "global_step": 162998, "epoch": 3880} {"train_loss": -6.951560974121094, "global_step": 162999, "epoch": 3880} {"train_loss": -6.949211120605469, "global_step": 163000, "epoch": 3880} {"train_loss": -6.975206783839634, "global_step": 163001, "epoch": 3880, "val_loss": 79739.03125} {"train_loss": -6.985744476318359, "global_step": 163002, "epoch": 3881} {"train_loss": -7.042316913604736, "global_step": 163003, "epoch": 3881} {"train_loss": -7.0760979652404785, "global_step": 163004, "epoch": 3881} {"train_loss": -7.075527191162109, "global_step": 163005, "epoch": 3881} {"train_loss": -6.918242454528809, "global_step": 163006, "epoch": 3881} {"train_loss": -6.940248489379883, "global_step": 163007, "epoch": 3881} {"train_loss": -6.9838995933532715, "global_step": 163008, "epoch": 3881} {"train_loss": -6.850398063659668, "global_step": 163009, "epoch": 3881} {"train_loss": -7.080561637878418, "global_step": 163010, "epoch": 3881} {"train_loss": -7.031009197235107, "global_step": 163011, "epoch": 3881} {"train_loss": -7.020425796508789, "global_step": 163012, "epoch": 3881} {"train_loss": -6.986305236816406, "global_step": 163013, "epoch": 3881} {"train_loss": -7.139446258544922, "global_step": 163014, "epoch": 3881} {"train_loss": -7.082417011260986, "global_step": 163015, "epoch": 3881} {"train_loss": -7.024997234344482, "global_step": 163016, "epoch": 3881} {"train_loss": -7.031672954559326, "global_step": 163017, "epoch": 3881} {"train_loss": -7.038138389587402, "global_step": 163018, "epoch": 3881} {"train_loss": -7.1013102531433105, "global_step": 163019, "epoch": 3881} {"train_loss": -6.996997833251953, "global_step": 163020, "epoch": 3881} {"train_loss": -7.199045181274414, "global_step": 163021, "epoch": 3881} {"train_loss": -6.982610702514648, "global_step": 163022, "epoch": 3881} {"train_loss": -7.008139610290527, "global_step": 163023, "epoch": 3881} {"train_loss": -7.013941764831543, "global_step": 163024, "epoch": 3881} {"train_loss": -6.97865104675293, "global_step": 163025, "epoch": 3881} {"train_loss": -7.100107192993164, "global_step": 163026, "epoch": 3881} {"train_loss": -6.960605621337891, "global_step": 163027, "epoch": 3881} {"train_loss": -6.984189033508301, "global_step": 163028, "epoch": 3881} {"train_loss": -7.009126663208008, "global_step": 163029, "epoch": 3881} {"train_loss": -6.865114212036133, "global_step": 163030, "epoch": 3881} {"train_loss": -6.906497001647949, "global_step": 163031, "epoch": 3881} {"train_loss": -6.956502914428711, "global_step": 163032, "epoch": 3881} {"train_loss": -7.03053092956543, "global_step": 163033, "epoch": 3881} {"train_loss": -6.981860637664795, "global_step": 163034, "epoch": 3881} {"train_loss": -6.978260517120361, "global_step": 163035, "epoch": 3881} {"train_loss": -6.919196128845215, "global_step": 163036, "epoch": 3881} {"train_loss": -6.957917213439941, "global_step": 163037, "epoch": 3881} {"train_loss": -6.914545059204102, "global_step": 163038, "epoch": 3881} {"train_loss": -6.76509952545166, "global_step": 163039, "epoch": 3881} {"train_loss": -6.755444526672363, "global_step": 163040, "epoch": 3881} {"train_loss": -6.916543006896973, "global_step": 163041, "epoch": 3881} {"train_loss": -7.00443172454834, "global_step": 163042, "epoch": 3881} {"train_loss": -6.985366412571499, "global_step": 163043, "epoch": 3881, "val_loss": 79203.953125} {"train_loss": -6.970451831817627, "global_step": 163044, "epoch": 3882} {"train_loss": -6.963075637817383, "global_step": 163045, "epoch": 3882} {"train_loss": -6.799564361572266, "global_step": 163046, "epoch": 3882} {"train_loss": -6.970882892608643, "global_step": 163047, "epoch": 3882} {"train_loss": -6.966235160827637, "global_step": 163048, "epoch": 3882} {"train_loss": -6.882906436920166, "global_step": 163049, "epoch": 3882} {"train_loss": -6.852151393890381, "global_step": 163050, "epoch": 3882} {"train_loss": -6.91780424118042, "global_step": 163051, "epoch": 3882} {"train_loss": -7.008618354797363, "global_step": 163052, "epoch": 3882} {"train_loss": -6.915617942810059, "global_step": 163053, "epoch": 3882} {"train_loss": -6.866457462310791, "global_step": 163054, "epoch": 3882} {"train_loss": -6.989924430847168, "global_step": 163055, "epoch": 3882} {"train_loss": -6.904767990112305, "global_step": 163056, "epoch": 3882} {"train_loss": -6.910080909729004, "global_step": 163057, "epoch": 3882} {"train_loss": -6.941296577453613, "global_step": 163058, "epoch": 3882} {"train_loss": -6.903867721557617, "global_step": 163059, "epoch": 3882} {"train_loss": -7.048840522766113, "global_step": 163060, "epoch": 3882} {"train_loss": -6.936374187469482, "global_step": 163061, "epoch": 3882} {"train_loss": -6.994747161865234, "global_step": 163062, "epoch": 3882} {"train_loss": -6.948848247528076, "global_step": 163063, "epoch": 3882} {"train_loss": -6.857810974121094, "global_step": 163064, "epoch": 3882} {"train_loss": -6.877781391143799, "global_step": 163065, "epoch": 3882} {"train_loss": -7.010932922363281, "global_step": 163066, "epoch": 3882} {"train_loss": -6.752255916595459, "global_step": 163067, "epoch": 3882} {"train_loss": -6.865317344665527, "global_step": 163068, "epoch": 3882} {"train_loss": -6.946651935577393, "global_step": 163069, "epoch": 3882} {"train_loss": -6.80599308013916, "global_step": 163070, "epoch": 3882} {"train_loss": -6.927087783813477, "global_step": 163071, "epoch": 3882} {"train_loss": -6.891096591949463, "global_step": 163072, "epoch": 3882} {"train_loss": -6.8193864822387695, "global_step": 163073, "epoch": 3882} {"train_loss": -7.0346999168396, "global_step": 163074, "epoch": 3882} {"train_loss": -6.746891975402832, "global_step": 163075, "epoch": 3882} {"train_loss": -6.989622592926025, "global_step": 163076, "epoch": 3882} {"train_loss": -6.952000617980957, "global_step": 163077, "epoch": 3882} {"train_loss": -6.962729454040527, "global_step": 163078, "epoch": 3882} {"train_loss": -6.963877201080322, "global_step": 163079, "epoch": 3882} {"train_loss": -6.944042682647705, "global_step": 163080, "epoch": 3882} {"train_loss": -6.8262128829956055, "global_step": 163081, "epoch": 3882} {"train_loss": -6.956235885620117, "global_step": 163082, "epoch": 3882} {"train_loss": -6.8394999504089355, "global_step": 163083, "epoch": 3882} {"train_loss": -7.01092529296875, "global_step": 163084, "epoch": 3882} {"train_loss": -6.918941338857015, "global_step": 163085, "epoch": 3882, "val_loss": 79614.453125} {"train_loss": -6.8725128173828125, "global_step": 163086, "epoch": 3883} {"train_loss": -6.967971324920654, "global_step": 163087, "epoch": 3883} {"train_loss": -6.854857921600342, "global_step": 163088, "epoch": 3883} {"train_loss": -6.898158073425293, "global_step": 163089, "epoch": 3883} {"train_loss": -6.9813666343688965, "global_step": 163090, "epoch": 3883} {"train_loss": -6.850381851196289, "global_step": 163091, "epoch": 3883} {"train_loss": -6.921296119689941, "global_step": 163092, "epoch": 3883} {"train_loss": -6.887249946594238, "global_step": 163093, "epoch": 3883} {"train_loss": -7.027951240539551, "global_step": 163094, "epoch": 3883} {"train_loss": -7.022635459899902, "global_step": 163095, "epoch": 3883} {"train_loss": -7.031181335449219, "global_step": 163096, "epoch": 3883} {"train_loss": -6.997819900512695, "global_step": 163097, "epoch": 3883} {"train_loss": -6.959113597869873, "global_step": 163098, "epoch": 3883} {"train_loss": -6.911550998687744, "global_step": 163099, "epoch": 3883} {"train_loss": -6.9147772789001465, "global_step": 163100, "epoch": 3883} {"train_loss": -6.999942302703857, "global_step": 163101, "epoch": 3883} {"train_loss": -6.899648666381836, "global_step": 163102, "epoch": 3883} {"train_loss": -6.907015323638916, "global_step": 163103, "epoch": 3883} {"train_loss": -6.9130778312683105, "global_step": 163104, "epoch": 3883} {"train_loss": -6.945534706115723, "global_step": 163105, "epoch": 3883} {"train_loss": -7.002083778381348, "global_step": 163106, "epoch": 3883} {"train_loss": -6.861811637878418, "global_step": 163107, "epoch": 3883} {"train_loss": -6.982266426086426, "global_step": 163108, "epoch": 3883} {"train_loss": -7.028040409088135, "global_step": 163109, "epoch": 3883} {"train_loss": -6.96532678604126, "global_step": 163110, "epoch": 3883} {"train_loss": -6.944991111755371, "global_step": 163111, "epoch": 3883} {"train_loss": -6.864815711975098, "global_step": 163112, "epoch": 3883} {"train_loss": -6.9254326820373535, "global_step": 163113, "epoch": 3883} {"train_loss": -7.00754451751709, "global_step": 163114, "epoch": 3883} {"train_loss": -6.971127033233643, "global_step": 163115, "epoch": 3883} {"train_loss": -6.917267322540283, "global_step": 163116, "epoch": 3883} {"train_loss": -7.057950973510742, "global_step": 163117, "epoch": 3883} {"train_loss": -7.022577285766602, "global_step": 163118, "epoch": 3883} {"train_loss": -6.995445251464844, "global_step": 163119, "epoch": 3883} {"train_loss": -6.981401443481445, "global_step": 163120, "epoch": 3883} {"train_loss": -6.865542888641357, "global_step": 163121, "epoch": 3883} {"train_loss": -6.99028205871582, "global_step": 163122, "epoch": 3883} {"train_loss": -6.973092555999756, "global_step": 163123, "epoch": 3883} {"train_loss": -6.861939907073975, "global_step": 163124, "epoch": 3883} {"train_loss": -6.9817047119140625, "global_step": 163125, "epoch": 3883} {"train_loss": -6.987297058105469, "global_step": 163126, "epoch": 3883} {"train_loss": -6.951331467855544, "global_step": 163127, "epoch": 3883, "val_loss": 79420.828125} {"train_loss": -7.036795616149902, "global_step": 163128, "epoch": 3884} {"train_loss": -7.047332763671875, "global_step": 163129, "epoch": 3884} {"train_loss": -6.941067695617676, "global_step": 163130, "epoch": 3884} {"train_loss": -7.0571513175964355, "global_step": 163131, "epoch": 3884} {"train_loss": -7.036725997924805, "global_step": 163132, "epoch": 3884} {"train_loss": -6.980481147766113, "global_step": 163133, "epoch": 3884} {"train_loss": -6.97444486618042, "global_step": 163134, "epoch": 3884} {"train_loss": -6.873401641845703, "global_step": 163135, "epoch": 3884} {"train_loss": -7.078001976013184, "global_step": 163136, "epoch": 3884} {"train_loss": -6.913304328918457, "global_step": 163137, "epoch": 3884} {"train_loss": -6.995701789855957, "global_step": 163138, "epoch": 3884} {"train_loss": -6.971245765686035, "global_step": 163139, "epoch": 3884} {"train_loss": -6.945576190948486, "global_step": 163140, "epoch": 3884} {"train_loss": -6.985673427581787, "global_step": 163141, "epoch": 3884} {"train_loss": -6.979551792144775, "global_step": 163142, "epoch": 3884} {"train_loss": -6.816156387329102, "global_step": 163143, "epoch": 3884} {"train_loss": -6.931292533874512, "global_step": 163144, "epoch": 3884} {"train_loss": -6.9126973152160645, "global_step": 163145, "epoch": 3884} {"train_loss": -7.030092239379883, "global_step": 163146, "epoch": 3884} {"train_loss": -6.904607772827148, "global_step": 163147, "epoch": 3884} {"train_loss": -6.87989616394043, "global_step": 163148, "epoch": 3884} {"train_loss": -6.984228134155273, "global_step": 163149, "epoch": 3884} {"train_loss": -6.926620006561279, "global_step": 163150, "epoch": 3884} {"train_loss": -6.963088035583496, "global_step": 163151, "epoch": 3884} {"train_loss": -7.024265289306641, "global_step": 163152, "epoch": 3884} {"train_loss": -6.916672229766846, "global_step": 163153, "epoch": 3884} {"train_loss": -7.04927921295166, "global_step": 163154, "epoch": 3884} {"train_loss": -7.0309739112854, "global_step": 163155, "epoch": 3884} {"train_loss": -7.128606796264648, "global_step": 163156, "epoch": 3884} {"train_loss": -6.946168422698975, "global_step": 163157, "epoch": 3884} {"train_loss": -6.959729194641113, "global_step": 163158, "epoch": 3884} {"train_loss": -6.887992858886719, "global_step": 163159, "epoch": 3884} {"train_loss": -6.991969108581543, "global_step": 163160, "epoch": 3884} {"train_loss": -6.89979362487793, "global_step": 163161, "epoch": 3884} {"train_loss": -6.938995361328125, "global_step": 163162, "epoch": 3884} {"train_loss": -6.853012561798096, "global_step": 163163, "epoch": 3884} {"train_loss": -7.033858299255371, "global_step": 163164, "epoch": 3884} {"train_loss": -6.820556640625, "global_step": 163165, "epoch": 3884} {"train_loss": -6.86464786529541, "global_step": 163166, "epoch": 3884} {"train_loss": -6.884993076324463, "global_step": 163167, "epoch": 3884} {"train_loss": -6.9759931564331055, "global_step": 163168, "epoch": 3884} {"train_loss": -6.961461282911754, "global_step": 163169, "epoch": 3884, "val_loss": 79280.0390625} {"train_loss": -7.0401787757873535, "global_step": 163170, "epoch": 3885} {"train_loss": -7.015942573547363, "global_step": 163171, "epoch": 3885} {"train_loss": -7.07008695602417, "global_step": 163172, "epoch": 3885} {"train_loss": -6.858066558837891, "global_step": 163173, "epoch": 3885} {"train_loss": -6.8544511795043945, "global_step": 163174, "epoch": 3885} {"train_loss": -6.946490287780762, "global_step": 163175, "epoch": 3885} {"train_loss": -6.838258743286133, "global_step": 163176, "epoch": 3885} {"train_loss": -6.848221302032471, "global_step": 163177, "epoch": 3885} {"train_loss": -6.967020034790039, "global_step": 163178, "epoch": 3885} {"train_loss": -6.826796054840088, "global_step": 163179, "epoch": 3885} {"train_loss": -7.006202697753906, "global_step": 163180, "epoch": 3885} {"train_loss": -7.027902126312256, "global_step": 163181, "epoch": 3885} {"train_loss": -6.796904563903809, "global_step": 163182, "epoch": 3885} {"train_loss": -6.977447986602783, "global_step": 163183, "epoch": 3885} {"train_loss": -6.885074138641357, "global_step": 163184, "epoch": 3885} {"train_loss": -6.972996711730957, "global_step": 163185, "epoch": 3885} {"train_loss": -6.9553985595703125, "global_step": 163186, "epoch": 3885} {"train_loss": -6.923270225524902, "global_step": 163187, "epoch": 3885} {"train_loss": -7.016411781311035, "global_step": 163188, "epoch": 3885} {"train_loss": -6.932251930236816, "global_step": 163189, "epoch": 3885} {"train_loss": -6.969033718109131, "global_step": 163190, "epoch": 3885} {"train_loss": -7.0106353759765625, "global_step": 163191, "epoch": 3885} {"train_loss": -6.9842119216918945, "global_step": 163192, "epoch": 3885} {"train_loss": -6.958214282989502, "global_step": 163193, "epoch": 3885} {"train_loss": -7.016455173492432, "global_step": 163194, "epoch": 3885} {"train_loss": -7.014728546142578, "global_step": 163195, "epoch": 3885} {"train_loss": -7.01355504989624, "global_step": 163196, "epoch": 3885} {"train_loss": -6.949288368225098, "global_step": 163197, "epoch": 3885} {"train_loss": -6.9370293617248535, "global_step": 163198, "epoch": 3885} {"train_loss": -6.994852066040039, "global_step": 163199, "epoch": 3885} {"train_loss": -6.989520072937012, "global_step": 163200, "epoch": 3885} {"train_loss": -6.884035110473633, "global_step": 163201, "epoch": 3885} {"train_loss": -6.97929573059082, "global_step": 163202, "epoch": 3885} {"train_loss": -6.951507091522217, "global_step": 163203, "epoch": 3885} {"train_loss": -6.855940341949463, "global_step": 163204, "epoch": 3885} {"train_loss": -7.062402725219727, "global_step": 163205, "epoch": 3885} {"train_loss": -6.984087944030762, "global_step": 163206, "epoch": 3885} {"train_loss": -6.988981246948242, "global_step": 163207, "epoch": 3885} {"train_loss": -7.13446044921875, "global_step": 163208, "epoch": 3885} {"train_loss": -6.977015495300293, "global_step": 163209, "epoch": 3885} {"train_loss": -6.92787504196167, "global_step": 163210, "epoch": 3885} {"train_loss": -6.960633811496553, "global_step": 163211, "epoch": 3885, "val_loss": 79416.0} {"train_loss": -6.985300540924072, "global_step": 163212, "epoch": 3886} {"train_loss": -7.025893211364746, "global_step": 163213, "epoch": 3886} {"train_loss": -6.937239170074463, "global_step": 163214, "epoch": 3886} {"train_loss": -7.027729511260986, "global_step": 163215, "epoch": 3886} {"train_loss": -6.885563850402832, "global_step": 163216, "epoch": 3886} {"train_loss": -6.8573455810546875, "global_step": 163217, "epoch": 3886} {"train_loss": -7.039857864379883, "global_step": 163218, "epoch": 3886} {"train_loss": -6.994492053985596, "global_step": 163219, "epoch": 3886} {"train_loss": -7.0289764404296875, "global_step": 163220, "epoch": 3886} {"train_loss": -7.082220554351807, "global_step": 163221, "epoch": 3886} {"train_loss": -6.9827799797058105, "global_step": 163222, "epoch": 3886} {"train_loss": -7.043404579162598, "global_step": 163223, "epoch": 3886} {"train_loss": -7.057160377502441, "global_step": 163224, "epoch": 3886} {"train_loss": -6.952470302581787, "global_step": 163225, "epoch": 3886} {"train_loss": -7.044111251831055, "global_step": 163226, "epoch": 3886} {"train_loss": -6.971957683563232, "global_step": 163227, "epoch": 3886} {"train_loss": -6.955139636993408, "global_step": 163228, "epoch": 3886} {"train_loss": -7.01212215423584, "global_step": 163229, "epoch": 3886} {"train_loss": -6.959577560424805, "global_step": 163230, "epoch": 3886} {"train_loss": -6.963295936584473, "global_step": 163231, "epoch": 3886} {"train_loss": -6.921078205108643, "global_step": 163232, "epoch": 3886} {"train_loss": -6.790229797363281, "global_step": 163233, "epoch": 3886} {"train_loss": -6.9599151611328125, "global_step": 163234, "epoch": 3886} {"train_loss": -6.929076671600342, "global_step": 163235, "epoch": 3886} {"train_loss": -7.056621551513672, "global_step": 163236, "epoch": 3886} {"train_loss": -6.8422956466674805, "global_step": 163237, "epoch": 3886} {"train_loss": -6.921999454498291, "global_step": 163238, "epoch": 3886} {"train_loss": -6.911700248718262, "global_step": 163239, "epoch": 3886} {"train_loss": -6.808119773864746, "global_step": 163240, "epoch": 3886} {"train_loss": -6.956910133361816, "global_step": 163241, "epoch": 3886} {"train_loss": -6.870434761047363, "global_step": 163242, "epoch": 3886} {"train_loss": -6.90770149230957, "global_step": 163243, "epoch": 3886} {"train_loss": -6.900180816650391, "global_step": 163244, "epoch": 3886} {"train_loss": -6.96145486831665, "global_step": 163245, "epoch": 3886} {"train_loss": -6.934600830078125, "global_step": 163246, "epoch": 3886} {"train_loss": -6.97899866104126, "global_step": 163247, "epoch": 3886} {"train_loss": -6.964449405670166, "global_step": 163248, "epoch": 3886} {"train_loss": -6.857751846313477, "global_step": 163249, "epoch": 3886} {"train_loss": -7.040567398071289, "global_step": 163250, "epoch": 3886} {"train_loss": -7.001276969909668, "global_step": 163251, "epoch": 3886} {"train_loss": -7.005823135375977, "global_step": 163252, "epoch": 3886} {"train_loss": -6.961334864298503, "global_step": 163253, "epoch": 3886, "val_loss": 79309.46875} {"train_loss": -6.938497543334961, "global_step": 163254, "epoch": 3887} {"train_loss": -7.104776382446289, "global_step": 163255, "epoch": 3887} {"train_loss": -7.111335754394531, "global_step": 163256, "epoch": 3887} {"train_loss": -7.051506996154785, "global_step": 163257, "epoch": 3887} {"train_loss": -6.9922566413879395, "global_step": 163258, "epoch": 3887} {"train_loss": -7.068941593170166, "global_step": 163259, "epoch": 3887} {"train_loss": -7.006922245025635, "global_step": 163260, "epoch": 3887} {"train_loss": -7.022822380065918, "global_step": 163261, "epoch": 3887} {"train_loss": -6.93552303314209, "global_step": 163262, "epoch": 3887} {"train_loss": -7.156504154205322, "global_step": 163263, "epoch": 3887} {"train_loss": -7.01866340637207, "global_step": 163264, "epoch": 3887} {"train_loss": -6.998331546783447, "global_step": 163265, "epoch": 3887} {"train_loss": -7.088198184967041, "global_step": 163266, "epoch": 3887} {"train_loss": -7.0770769119262695, "global_step": 163267, "epoch": 3887} {"train_loss": -7.066906929016113, "global_step": 163268, "epoch": 3887} {"train_loss": -7.143161296844482, "global_step": 163269, "epoch": 3887} {"train_loss": -7.046344757080078, "global_step": 163270, "epoch": 3887} {"train_loss": -7.059845924377441, "global_step": 163271, "epoch": 3887} {"train_loss": -6.942802429199219, "global_step": 163272, "epoch": 3887} {"train_loss": -7.147209644317627, "global_step": 163273, "epoch": 3887} {"train_loss": -7.105717658996582, "global_step": 163274, "epoch": 3887} {"train_loss": -7.074947357177734, "global_step": 163275, "epoch": 3887} {"train_loss": -7.046982765197754, "global_step": 163276, "epoch": 3887} {"train_loss": -7.045524597167969, "global_step": 163277, "epoch": 3887} {"train_loss": -7.078800678253174, "global_step": 163278, "epoch": 3887} {"train_loss": -7.006158828735352, "global_step": 163279, "epoch": 3887} {"train_loss": -6.987419605255127, "global_step": 163280, "epoch": 3887} {"train_loss": -6.972569465637207, "global_step": 163281, "epoch": 3887} {"train_loss": -6.937275409698486, "global_step": 163282, "epoch": 3887} {"train_loss": -6.810087203979492, "global_step": 163283, "epoch": 3887} {"train_loss": -6.974925994873047, "global_step": 163284, "epoch": 3887} {"train_loss": -6.975017547607422, "global_step": 163285, "epoch": 3887} {"train_loss": -7.013160705566406, "global_step": 163286, "epoch": 3887} {"train_loss": -6.876316070556641, "global_step": 163287, "epoch": 3887} {"train_loss": -6.966825008392334, "global_step": 163288, "epoch": 3887} {"train_loss": -6.882484436035156, "global_step": 163289, "epoch": 3887} {"train_loss": -6.970232963562012, "global_step": 163290, "epoch": 3887} {"train_loss": -6.926911354064941, "global_step": 163291, "epoch": 3887} {"train_loss": -6.931393623352051, "global_step": 163292, "epoch": 3887} {"train_loss": -7.054946422576904, "global_step": 163293, "epoch": 3887} {"train_loss": -6.982522487640381, "global_step": 163294, "epoch": 3887} {"train_loss": -7.012493712561471, "global_step": 163295, "epoch": 3887, "val_loss": 79533.3984375} {"train_loss": -6.960926532745361, "global_step": 163296, "epoch": 3888} {"train_loss": -6.962980270385742, "global_step": 163297, "epoch": 3888} {"train_loss": -6.911533355712891, "global_step": 163298, "epoch": 3888} {"train_loss": -6.908067226409912, "global_step": 163299, "epoch": 3888} {"train_loss": -6.991698741912842, "global_step": 163300, "epoch": 3888} {"train_loss": -6.95242166519165, "global_step": 163301, "epoch": 3888} {"train_loss": -6.857295989990234, "global_step": 163302, "epoch": 3888} {"train_loss": -6.9690046310424805, "global_step": 163303, "epoch": 3888} {"train_loss": -7.015097141265869, "global_step": 163304, "epoch": 3888} {"train_loss": -6.822333335876465, "global_step": 163305, "epoch": 3888} {"train_loss": -7.013731956481934, "global_step": 163306, "epoch": 3888} {"train_loss": -6.875296115875244, "global_step": 163307, "epoch": 3888} {"train_loss": -6.799509525299072, "global_step": 163308, "epoch": 3888} {"train_loss": -6.876253128051758, "global_step": 163309, "epoch": 3888} {"train_loss": -6.949927806854248, "global_step": 163310, "epoch": 3888} {"train_loss": -6.712224006652832, "global_step": 163311, "epoch": 3888} {"train_loss": -7.026874542236328, "global_step": 163312, "epoch": 3888} {"train_loss": -6.88701057434082, "global_step": 163313, "epoch": 3888} {"train_loss": -6.883108615875244, "global_step": 163314, "epoch": 3888} {"train_loss": -6.909610748291016, "global_step": 163315, "epoch": 3888} {"train_loss": -6.679543972015381, "global_step": 163316, "epoch": 3888} {"train_loss": -6.96990966796875, "global_step": 163317, "epoch": 3888} {"train_loss": -6.875530242919922, "global_step": 163318, "epoch": 3888} {"train_loss": -6.895560264587402, "global_step": 163319, "epoch": 3888} {"train_loss": -6.93424129486084, "global_step": 163320, "epoch": 3888} {"train_loss": -6.96904182434082, "global_step": 163321, "epoch": 3888} {"train_loss": -6.953680992126465, "global_step": 163322, "epoch": 3888} {"train_loss": -6.920113563537598, "global_step": 163323, "epoch": 3888} {"train_loss": -7.016283988952637, "global_step": 163324, "epoch": 3888} {"train_loss": -6.981193542480469, "global_step": 163325, "epoch": 3888} {"train_loss": -6.987221717834473, "global_step": 163326, "epoch": 3888} {"train_loss": -6.99936580657959, "global_step": 163327, "epoch": 3888} {"train_loss": -6.895953178405762, "global_step": 163328, "epoch": 3888} {"train_loss": -7.09361457824707, "global_step": 163329, "epoch": 3888} {"train_loss": -7.023553848266602, "global_step": 163330, "epoch": 3888} {"train_loss": -6.930511474609375, "global_step": 163331, "epoch": 3888} {"train_loss": -6.917620658874512, "global_step": 163332, "epoch": 3888} {"train_loss": -6.987015724182129, "global_step": 163333, "epoch": 3888} {"train_loss": -6.874046325683594, "global_step": 163334, "epoch": 3888} {"train_loss": -7.053765296936035, "global_step": 163335, "epoch": 3888} {"train_loss": -6.990461826324463, "global_step": 163336, "epoch": 3888} {"train_loss": -6.933293989726475, "global_step": 163337, "epoch": 3888, "val_loss": 79623.7421875} {"train_loss": -6.950582504272461, "global_step": 163338, "epoch": 3889} {"train_loss": -6.954367637634277, "global_step": 163339, "epoch": 3889} {"train_loss": -7.040801048278809, "global_step": 163340, "epoch": 3889} {"train_loss": -7.041560649871826, "global_step": 163341, "epoch": 3889} {"train_loss": -7.017242431640625, "global_step": 163342, "epoch": 3889} {"train_loss": -6.9449663162231445, "global_step": 163343, "epoch": 3889} {"train_loss": -7.048481464385986, "global_step": 163344, "epoch": 3889} {"train_loss": -7.011093616485596, "global_step": 163345, "epoch": 3889} {"train_loss": -6.93726110458374, "global_step": 163346, "epoch": 3889} {"train_loss": -7.017699718475342, "global_step": 163347, "epoch": 3889} {"train_loss": -7.131587982177734, "global_step": 163348, "epoch": 3889} {"train_loss": -6.953850746154785, "global_step": 163349, "epoch": 3889} {"train_loss": -7.038006782531738, "global_step": 163350, "epoch": 3889} {"train_loss": -7.144261360168457, "global_step": 163351, "epoch": 3889} {"train_loss": -6.887535572052002, "global_step": 163352, "epoch": 3889} {"train_loss": -6.989249229431152, "global_step": 163353, "epoch": 3889} {"train_loss": -6.990357398986816, "global_step": 163354, "epoch": 3889} {"train_loss": -6.962146282196045, "global_step": 163355, "epoch": 3889} {"train_loss": -6.980416297912598, "global_step": 163356, "epoch": 3889} {"train_loss": -7.070018291473389, "global_step": 163357, "epoch": 3889} {"train_loss": -6.977451324462891, "global_step": 163358, "epoch": 3889} {"train_loss": -7.015300273895264, "global_step": 163359, "epoch": 3889} {"train_loss": -7.037372589111328, "global_step": 163360, "epoch": 3889} {"train_loss": -6.93575382232666, "global_step": 163361, "epoch": 3889} {"train_loss": -7.065247535705566, "global_step": 163362, "epoch": 3889} {"train_loss": -6.991959571838379, "global_step": 163363, "epoch": 3889} {"train_loss": -7.053290367126465, "global_step": 163364, "epoch": 3889} {"train_loss": -7.039607048034668, "global_step": 163365, "epoch": 3889} {"train_loss": -6.8781023025512695, "global_step": 163366, "epoch": 3889} {"train_loss": -6.958000659942627, "global_step": 163367, "epoch": 3889} {"train_loss": -7.049485206604004, "global_step": 163368, "epoch": 3889} {"train_loss": -7.099323272705078, "global_step": 163369, "epoch": 3889} {"train_loss": -7.0069732666015625, "global_step": 163370, "epoch": 3889} {"train_loss": -7.045104026794434, "global_step": 163371, "epoch": 3889} {"train_loss": -7.021640777587891, "global_step": 163372, "epoch": 3889} {"train_loss": -7.005610466003418, "global_step": 163373, "epoch": 3889} {"train_loss": -6.830832481384277, "global_step": 163374, "epoch": 3889} {"train_loss": -6.9465227127075195, "global_step": 163375, "epoch": 3889} {"train_loss": -6.965280532836914, "global_step": 163376, "epoch": 3889} {"train_loss": -6.932589530944824, "global_step": 163377, "epoch": 3889} {"train_loss": -6.972841262817383, "global_step": 163378, "epoch": 3889} {"train_loss": -6.997141088758196, "global_step": 163379, "epoch": 3889, "val_loss": 79555.6953125} {"train_loss": -7.012194633483887, "global_step": 163380, "epoch": 3890} {"train_loss": -6.876802444458008, "global_step": 163381, "epoch": 3890} {"train_loss": -7.006951332092285, "global_step": 163382, "epoch": 3890} {"train_loss": -6.955350875854492, "global_step": 163383, "epoch": 3890} {"train_loss": -7.008883476257324, "global_step": 163384, "epoch": 3890} {"train_loss": -6.9732770919799805, "global_step": 163385, "epoch": 3890} {"train_loss": -6.966663360595703, "global_step": 163386, "epoch": 3890} {"train_loss": -6.9196085929870605, "global_step": 163387, "epoch": 3890} {"train_loss": -7.011277675628662, "global_step": 163388, "epoch": 3890} {"train_loss": -7.053215026855469, "global_step": 163389, "epoch": 3890} {"train_loss": -7.012308120727539, "global_step": 163390, "epoch": 3890} {"train_loss": -6.891221523284912, "global_step": 163391, "epoch": 3890} {"train_loss": -7.007576942443848, "global_step": 163392, "epoch": 3890} {"train_loss": -6.953301429748535, "global_step": 163393, "epoch": 3890} {"train_loss": -6.970643520355225, "global_step": 163394, "epoch": 3890} {"train_loss": -6.92889404296875, "global_step": 163395, "epoch": 3890} {"train_loss": -7.086042881011963, "global_step": 163396, "epoch": 3890} {"train_loss": -6.840531826019287, "global_step": 163397, "epoch": 3890} {"train_loss": -7.055063724517822, "global_step": 163398, "epoch": 3890} {"train_loss": -6.99251651763916, "global_step": 163399, "epoch": 3890} {"train_loss": -6.955418109893799, "global_step": 163400, "epoch": 3890} {"train_loss": -6.909907817840576, "global_step": 163401, "epoch": 3890} {"train_loss": -6.898956298828125, "global_step": 163402, "epoch": 3890} {"train_loss": -7.053671836853027, "global_step": 163403, "epoch": 3890} {"train_loss": -6.962401390075684, "global_step": 163404, "epoch": 3890} {"train_loss": -6.941201210021973, "global_step": 163405, "epoch": 3890} {"train_loss": -6.859175682067871, "global_step": 163406, "epoch": 3890} {"train_loss": -7.075508117675781, "global_step": 163407, "epoch": 3890} {"train_loss": -6.979834079742432, "global_step": 163408, "epoch": 3890} {"train_loss": -6.859147071838379, "global_step": 163409, "epoch": 3890} {"train_loss": -6.967171669006348, "global_step": 163410, "epoch": 3890} {"train_loss": -6.907876968383789, "global_step": 163411, "epoch": 3890} {"train_loss": -6.968170166015625, "global_step": 163412, "epoch": 3890} {"train_loss": -6.8786163330078125, "global_step": 163413, "epoch": 3890} {"train_loss": -6.879748344421387, "global_step": 163414, "epoch": 3890} {"train_loss": -7.010276794433594, "global_step": 163415, "epoch": 3890} {"train_loss": -6.880399703979492, "global_step": 163416, "epoch": 3890} {"train_loss": -7.0965800285339355, "global_step": 163417, "epoch": 3890} {"train_loss": -6.900951385498047, "global_step": 163418, "epoch": 3890} {"train_loss": -6.923175811767578, "global_step": 163419, "epoch": 3890} {"train_loss": -6.82705020904541, "global_step": 163420, "epoch": 3890} {"train_loss": -6.956658840179443, "global_step": 163421, "epoch": 3890, "val_loss": 79428.234375} {"train_loss": -6.955577850341797, "global_step": 163422, "epoch": 3891} {"train_loss": -6.938278675079346, "global_step": 163423, "epoch": 3891} {"train_loss": -6.9357452392578125, "global_step": 163424, "epoch": 3891} {"train_loss": -6.834131240844727, "global_step": 163425, "epoch": 3891} {"train_loss": -6.9915618896484375, "global_step": 163426, "epoch": 3891} {"train_loss": -6.973204135894775, "global_step": 163427, "epoch": 3891} {"train_loss": -6.958049297332764, "global_step": 163428, "epoch": 3891} {"train_loss": -6.993320465087891, "global_step": 163429, "epoch": 3891} {"train_loss": -7.094953536987305, "global_step": 163430, "epoch": 3891} {"train_loss": -7.004215240478516, "global_step": 163431, "epoch": 3891} {"train_loss": -6.914048194885254, "global_step": 163432, "epoch": 3891} {"train_loss": -7.022193908691406, "global_step": 163433, "epoch": 3891} {"train_loss": -7.026966094970703, "global_step": 163434, "epoch": 3891} {"train_loss": -6.929142951965332, "global_step": 163435, "epoch": 3891} {"train_loss": -7.024090766906738, "global_step": 163436, "epoch": 3891} {"train_loss": -7.004703521728516, "global_step": 163437, "epoch": 3891} {"train_loss": -6.932225227355957, "global_step": 163438, "epoch": 3891} {"train_loss": -6.989620208740234, "global_step": 163439, "epoch": 3891} {"train_loss": -7.062559127807617, "global_step": 163440, "epoch": 3891} {"train_loss": -6.990822792053223, "global_step": 163441, "epoch": 3891} {"train_loss": -7.06754207611084, "global_step": 163442, "epoch": 3891} {"train_loss": -7.041626930236816, "global_step": 163443, "epoch": 3891} {"train_loss": -7.050549030303955, "global_step": 163444, "epoch": 3891} {"train_loss": -6.921656608581543, "global_step": 163445, "epoch": 3891} {"train_loss": -7.0886640548706055, "global_step": 163446, "epoch": 3891} {"train_loss": -6.939150810241699, "global_step": 163447, "epoch": 3891} {"train_loss": -6.927028656005859, "global_step": 163448, "epoch": 3891} {"train_loss": -6.927264213562012, "global_step": 163449, "epoch": 3891} {"train_loss": -6.908266067504883, "global_step": 163450, "epoch": 3891} {"train_loss": -6.920028209686279, "global_step": 163451, "epoch": 3891} {"train_loss": -6.991349220275879, "global_step": 163452, "epoch": 3891} {"train_loss": -6.999137878417969, "global_step": 163453, "epoch": 3891} {"train_loss": -7.054333686828613, "global_step": 163454, "epoch": 3891} {"train_loss": -6.953985691070557, "global_step": 163455, "epoch": 3891} {"train_loss": -7.037670135498047, "global_step": 163456, "epoch": 3891} {"train_loss": -7.135322570800781, "global_step": 163457, "epoch": 3891} {"train_loss": -7.030706405639648, "global_step": 163458, "epoch": 3891} {"train_loss": -7.018908500671387, "global_step": 163459, "epoch": 3891} {"train_loss": -7.065812587738037, "global_step": 163460, "epoch": 3891} {"train_loss": -7.011563301086426, "global_step": 163461, "epoch": 3891} {"train_loss": -6.885287761688232, "global_step": 163462, "epoch": 3891} {"train_loss": -6.991100265866234, "global_step": 163463, "epoch": 3891, "val_loss": 79372.109375} {"train_loss": -6.998366355895996, "global_step": 163464, "epoch": 3892} {"train_loss": -6.99542236328125, "global_step": 163465, "epoch": 3892} {"train_loss": -6.9651713371276855, "global_step": 163466, "epoch": 3892} {"train_loss": -6.926297664642334, "global_step": 163467, "epoch": 3892} {"train_loss": -7.00206995010376, "global_step": 163468, "epoch": 3892} {"train_loss": -7.033685684204102, "global_step": 163469, "epoch": 3892} {"train_loss": -6.952991485595703, "global_step": 163470, "epoch": 3892} {"train_loss": -7.067378044128418, "global_step": 163471, "epoch": 3892} {"train_loss": -7.107942581176758, "global_step": 163472, "epoch": 3892} {"train_loss": -7.049726963043213, "global_step": 163473, "epoch": 3892} {"train_loss": -7.174388885498047, "global_step": 163474, "epoch": 3892} {"train_loss": -6.90311336517334, "global_step": 163475, "epoch": 3892} {"train_loss": -7.054603576660156, "global_step": 163476, "epoch": 3892} {"train_loss": -7.012563705444336, "global_step": 163477, "epoch": 3892} {"train_loss": -6.915893077850342, "global_step": 163478, "epoch": 3892} {"train_loss": -7.008831024169922, "global_step": 163479, "epoch": 3892} {"train_loss": -7.124232292175293, "global_step": 163480, "epoch": 3892} {"train_loss": -6.8540849685668945, "global_step": 163481, "epoch": 3892} {"train_loss": -6.845398902893066, "global_step": 163482, "epoch": 3892} {"train_loss": -6.943568229675293, "global_step": 163483, "epoch": 3892} {"train_loss": -6.781124114990234, "global_step": 163484, "epoch": 3892} {"train_loss": -6.544703960418701, "global_step": 163485, "epoch": 3892} {"train_loss": -6.895252227783203, "global_step": 163486, "epoch": 3892} {"train_loss": -6.602832317352295, "global_step": 163487, "epoch": 3892} {"train_loss": -6.758044242858887, "global_step": 163488, "epoch": 3892} {"train_loss": -6.848942279815674, "global_step": 163489, "epoch": 3892} {"train_loss": -6.924020767211914, "global_step": 163490, "epoch": 3892} {"train_loss": -6.715605735778809, "global_step": 163491, "epoch": 3892} {"train_loss": -6.86591911315918, "global_step": 163492, "epoch": 3892} {"train_loss": -6.813121795654297, "global_step": 163493, "epoch": 3892} {"train_loss": -6.893776893615723, "global_step": 163494, "epoch": 3892} {"train_loss": -6.8757643699646, "global_step": 163495, "epoch": 3892} {"train_loss": -6.834619045257568, "global_step": 163496, "epoch": 3892} {"train_loss": -6.723485946655273, "global_step": 163497, "epoch": 3892} {"train_loss": -6.890783309936523, "global_step": 163498, "epoch": 3892} {"train_loss": -6.838644981384277, "global_step": 163499, "epoch": 3892} {"train_loss": -6.90994930267334, "global_step": 163500, "epoch": 3892} {"train_loss": -6.920740127563477, "global_step": 163501, "epoch": 3892} {"train_loss": -6.801225662231445, "global_step": 163502, "epoch": 3892} {"train_loss": -6.8399810791015625, "global_step": 163503, "epoch": 3892} {"train_loss": -6.879910469055176, "global_step": 163504, "epoch": 3892} {"train_loss": -6.905059632800874, "global_step": 163505, "epoch": 3892, "val_loss": 79455.2890625} {"train_loss": -7.032755374908447, "global_step": 163506, "epoch": 3893} {"train_loss": -6.9041852951049805, "global_step": 163507, "epoch": 3893} {"train_loss": -7.003743648529053, "global_step": 163508, "epoch": 3893} {"train_loss": -6.976385593414307, "global_step": 163509, "epoch": 3893} {"train_loss": -6.969801902770996, "global_step": 163510, "epoch": 3893} {"train_loss": -7.053140640258789, "global_step": 163511, "epoch": 3893} {"train_loss": -6.8608880043029785, "global_step": 163512, "epoch": 3893} {"train_loss": -7.157870292663574, "global_step": 163513, "epoch": 3893} {"train_loss": -7.020887851715088, "global_step": 163514, "epoch": 3893} {"train_loss": -7.020920753479004, "global_step": 163515, "epoch": 3893} {"train_loss": -6.832118988037109, "global_step": 163516, "epoch": 3893} {"train_loss": -6.960404396057129, "global_step": 163517, "epoch": 3893} {"train_loss": -6.958024024963379, "global_step": 163518, "epoch": 3893} {"train_loss": -6.951972484588623, "global_step": 163519, "epoch": 3893} {"train_loss": -7.082143783569336, "global_step": 163520, "epoch": 3893} {"train_loss": -6.918976306915283, "global_step": 163521, "epoch": 3893} {"train_loss": -6.990584373474121, "global_step": 163522, "epoch": 3893} {"train_loss": -6.974011421203613, "global_step": 163523, "epoch": 3893} {"train_loss": -6.956797122955322, "global_step": 163524, "epoch": 3893} {"train_loss": -7.1002302169799805, "global_step": 163525, "epoch": 3893} {"train_loss": -6.967548370361328, "global_step": 163526, "epoch": 3893} {"train_loss": -6.860906600952148, "global_step": 163527, "epoch": 3893} {"train_loss": -6.9416728019714355, "global_step": 163528, "epoch": 3893} {"train_loss": -6.927133560180664, "global_step": 163529, "epoch": 3893} {"train_loss": -6.948040008544922, "global_step": 163530, "epoch": 3893} {"train_loss": -7.019164085388184, "global_step": 163531, "epoch": 3893} {"train_loss": -6.984389305114746, "global_step": 163532, "epoch": 3893} {"train_loss": -7.136377811431885, "global_step": 163533, "epoch": 3893} {"train_loss": -7.0116119384765625, "global_step": 163534, "epoch": 3893} {"train_loss": -6.89398193359375, "global_step": 163535, "epoch": 3893} {"train_loss": -6.885882377624512, "global_step": 163536, "epoch": 3893} {"train_loss": -6.964172840118408, "global_step": 163537, "epoch": 3893} {"train_loss": -6.758752822875977, "global_step": 163538, "epoch": 3893} {"train_loss": -6.848371505737305, "global_step": 163539, "epoch": 3893} {"train_loss": -6.920289039611816, "global_step": 163540, "epoch": 3893} {"train_loss": -6.926932334899902, "global_step": 163541, "epoch": 3893} {"train_loss": -6.859284400939941, "global_step": 163542, "epoch": 3893} {"train_loss": -6.96183443069458, "global_step": 163543, "epoch": 3893} {"train_loss": -6.865732192993164, "global_step": 163544, "epoch": 3893} {"train_loss": -6.832080841064453, "global_step": 163545, "epoch": 3893} {"train_loss": -6.935257911682129, "global_step": 163546, "epoch": 3893} {"train_loss": -6.954104650588262, "global_step": 163547, "epoch": 3893, "val_loss": 79607.515625} {"train_loss": -6.927421569824219, "global_step": 163548, "epoch": 3894} {"train_loss": -7.040126800537109, "global_step": 163549, "epoch": 3894} {"train_loss": -6.7918701171875, "global_step": 163550, "epoch": 3894} {"train_loss": -7.00495719909668, "global_step": 163551, "epoch": 3894} {"train_loss": -6.790353775024414, "global_step": 163552, "epoch": 3894} {"train_loss": -6.904012203216553, "global_step": 163553, "epoch": 3894} {"train_loss": -6.825994491577148, "global_step": 163554, "epoch": 3894} {"train_loss": -6.895116806030273, "global_step": 163555, "epoch": 3894} {"train_loss": -6.939654350280762, "global_step": 163556, "epoch": 3894} {"train_loss": -7.027061462402344, "global_step": 163557, "epoch": 3894} {"train_loss": -6.9975457191467285, "global_step": 163558, "epoch": 3894} {"train_loss": -6.905971050262451, "global_step": 163559, "epoch": 3894} {"train_loss": -6.937241554260254, "global_step": 163560, "epoch": 3894} {"train_loss": -7.034762382507324, "global_step": 163561, "epoch": 3894} {"train_loss": -7.038424015045166, "global_step": 163562, "epoch": 3894} {"train_loss": -6.895951747894287, "global_step": 163563, "epoch": 3894} {"train_loss": -6.990457534790039, "global_step": 163564, "epoch": 3894} {"train_loss": -6.91217041015625, "global_step": 163565, "epoch": 3894} {"train_loss": -7.050472736358643, "global_step": 163566, "epoch": 3894} {"train_loss": -6.896395683288574, "global_step": 163567, "epoch": 3894} {"train_loss": -6.917888164520264, "global_step": 163568, "epoch": 3894} {"train_loss": -7.102246284484863, "global_step": 163569, "epoch": 3894} {"train_loss": -6.981688022613525, "global_step": 163570, "epoch": 3894} {"train_loss": -7.126124382019043, "global_step": 163571, "epoch": 3894} {"train_loss": -7.087983131408691, "global_step": 163572, "epoch": 3894} {"train_loss": -6.914409637451172, "global_step": 163573, "epoch": 3894} {"train_loss": -6.897895812988281, "global_step": 163574, "epoch": 3894} {"train_loss": -6.980645179748535, "global_step": 163575, "epoch": 3894} {"train_loss": -7.064419746398926, "global_step": 163576, "epoch": 3894} {"train_loss": -7.030150413513184, "global_step": 163577, "epoch": 3894} {"train_loss": -6.952603816986084, "global_step": 163578, "epoch": 3894} {"train_loss": -6.944631576538086, "global_step": 163579, "epoch": 3894} {"train_loss": -7.028747081756592, "global_step": 163580, "epoch": 3894} {"train_loss": -7.0311384201049805, "global_step": 163581, "epoch": 3894} {"train_loss": -6.941845893859863, "global_step": 163582, "epoch": 3894} {"train_loss": -7.005616188049316, "global_step": 163583, "epoch": 3894} {"train_loss": -6.949179649353027, "global_step": 163584, "epoch": 3894} {"train_loss": -6.95805549621582, "global_step": 163585, "epoch": 3894} {"train_loss": -7.0963592529296875, "global_step": 163586, "epoch": 3894} {"train_loss": -6.996227264404297, "global_step": 163587, "epoch": 3894} {"train_loss": -7.0628838539123535, "global_step": 163588, "epoch": 3894} {"train_loss": -6.970783846718924, "global_step": 163589, "epoch": 3894, "val_loss": 79180.2578125} {"train_loss": -6.981656551361084, "global_step": 163590, "epoch": 3895} {"train_loss": -7.021579742431641, "global_step": 163591, "epoch": 3895} {"train_loss": -7.0333380699157715, "global_step": 163592, "epoch": 3895} {"train_loss": -6.946069717407227, "global_step": 163593, "epoch": 3895} {"train_loss": -6.9748687744140625, "global_step": 163594, "epoch": 3895} {"train_loss": -7.083974838256836, "global_step": 163595, "epoch": 3895} {"train_loss": -6.980847358703613, "global_step": 163596, "epoch": 3895} {"train_loss": -6.996294975280762, "global_step": 163597, "epoch": 3895} {"train_loss": -6.966361999511719, "global_step": 163598, "epoch": 3895} {"train_loss": -7.0610151290893555, "global_step": 163599, "epoch": 3895} {"train_loss": -7.100887298583984, "global_step": 163600, "epoch": 3895} {"train_loss": -7.09779167175293, "global_step": 163601, "epoch": 3895} {"train_loss": -7.066529750823975, "global_step": 163602, "epoch": 3895} {"train_loss": -6.979128837585449, "global_step": 163603, "epoch": 3895} {"train_loss": -7.132165908813477, "global_step": 163604, "epoch": 3895} {"train_loss": -6.963829040527344, "global_step": 163605, "epoch": 3895} {"train_loss": -7.090667724609375, "global_step": 163606, "epoch": 3895} {"train_loss": -7.0098371505737305, "global_step": 163607, "epoch": 3895} {"train_loss": -7.131505012512207, "global_step": 163608, "epoch": 3895} {"train_loss": -7.119084358215332, "global_step": 163609, "epoch": 3895} {"train_loss": -6.971892833709717, "global_step": 163610, "epoch": 3895} {"train_loss": -7.0450286865234375, "global_step": 163611, "epoch": 3895} {"train_loss": -7.074892997741699, "global_step": 163612, "epoch": 3895} {"train_loss": -6.971656799316406, "global_step": 163613, "epoch": 3895} {"train_loss": -7.031586647033691, "global_step": 163614, "epoch": 3895} {"train_loss": -7.0586628913879395, "global_step": 163615, "epoch": 3895} {"train_loss": -7.053104877471924, "global_step": 163616, "epoch": 3895} {"train_loss": -7.033503532409668, "global_step": 163617, "epoch": 3895} {"train_loss": -7.006954669952393, "global_step": 163618, "epoch": 3895} {"train_loss": -7.161219120025635, "global_step": 163619, "epoch": 3895} {"train_loss": -7.047843933105469, "global_step": 163620, "epoch": 3895} {"train_loss": -7.052823543548584, "global_step": 163621, "epoch": 3895} {"train_loss": -7.025181770324707, "global_step": 163622, "epoch": 3895} {"train_loss": -6.9980058670043945, "global_step": 163623, "epoch": 3895} {"train_loss": -7.036113262176514, "global_step": 163624, "epoch": 3895} {"train_loss": -6.923915863037109, "global_step": 163625, "epoch": 3895} {"train_loss": -7.069583892822266, "global_step": 163626, "epoch": 3895} {"train_loss": -7.034547805786133, "global_step": 163627, "epoch": 3895} {"train_loss": -7.0084099769592285, "global_step": 163628, "epoch": 3895} {"train_loss": -7.193887710571289, "global_step": 163629, "epoch": 3895} {"train_loss": -7.045209884643555, "global_step": 163630, "epoch": 3895} {"train_loss": -7.038617009208316, "global_step": 163631, "epoch": 3895, "val_loss": 79444.453125} {"train_loss": -7.0868048667907715, "global_step": 163632, "epoch": 3896} {"train_loss": -6.976611614227295, "global_step": 163633, "epoch": 3896} {"train_loss": -7.1186113357543945, "global_step": 163634, "epoch": 3896} {"train_loss": -7.094893455505371, "global_step": 163635, "epoch": 3896} {"train_loss": -7.218116760253906, "global_step": 163636, "epoch": 3896} {"train_loss": -7.126989364624023, "global_step": 163637, "epoch": 3896} {"train_loss": -7.102411270141602, "global_step": 163638, "epoch": 3896} {"train_loss": -7.074286937713623, "global_step": 163639, "epoch": 3896} {"train_loss": -7.093605995178223, "global_step": 163640, "epoch": 3896} {"train_loss": -7.1736602783203125, "global_step": 163641, "epoch": 3896} {"train_loss": -7.040045261383057, "global_step": 163642, "epoch": 3896} {"train_loss": -7.038730144500732, "global_step": 163643, "epoch": 3896} {"train_loss": -6.997711181640625, "global_step": 163644, "epoch": 3896} {"train_loss": -7.06266450881958, "global_step": 163645, "epoch": 3896} {"train_loss": -7.031604766845703, "global_step": 163646, "epoch": 3896} {"train_loss": -7.018559455871582, "global_step": 163647, "epoch": 3896} {"train_loss": -7.148735046386719, "global_step": 163648, "epoch": 3896} {"train_loss": -7.055044174194336, "global_step": 163649, "epoch": 3896} {"train_loss": -7.078886032104492, "global_step": 163650, "epoch": 3896} {"train_loss": -7.03574800491333, "global_step": 163651, "epoch": 3896} {"train_loss": -6.93833065032959, "global_step": 163652, "epoch": 3896} {"train_loss": -6.912541389465332, "global_step": 163653, "epoch": 3896} {"train_loss": -6.897693634033203, "global_step": 163654, "epoch": 3896} {"train_loss": -7.015758037567139, "global_step": 163655, "epoch": 3896} {"train_loss": -6.97513484954834, "global_step": 163656, "epoch": 3896} {"train_loss": -7.053415298461914, "global_step": 163657, "epoch": 3896} {"train_loss": -7.019286155700684, "global_step": 163658, "epoch": 3896} {"train_loss": -7.144451141357422, "global_step": 163659, "epoch": 3896} {"train_loss": -7.038586616516113, "global_step": 163660, "epoch": 3896} {"train_loss": -7.010325908660889, "global_step": 163661, "epoch": 3896} {"train_loss": -6.970724105834961, "global_step": 163662, "epoch": 3896} {"train_loss": -7.061637878417969, "global_step": 163663, "epoch": 3896} {"train_loss": -6.891611099243164, "global_step": 163664, "epoch": 3896} {"train_loss": -6.9449872970581055, "global_step": 163665, "epoch": 3896} {"train_loss": -6.92006778717041, "global_step": 163666, "epoch": 3896} {"train_loss": -6.912172317504883, "global_step": 163667, "epoch": 3896} {"train_loss": -7.000443458557129, "global_step": 163668, "epoch": 3896} {"train_loss": -6.931496620178223, "global_step": 163669, "epoch": 3896} {"train_loss": -6.986638069152832, "global_step": 163670, "epoch": 3896} {"train_loss": -7.024706840515137, "global_step": 163671, "epoch": 3896} {"train_loss": -7.10569953918457, "global_step": 163672, "epoch": 3896} {"train_loss": -7.029422612417312, "global_step": 163673, "epoch": 3896, "val_loss": 79619.6953125} {"train_loss": -7.020590305328369, "global_step": 163674, "epoch": 3897} {"train_loss": -7.020846366882324, "global_step": 163675, "epoch": 3897} {"train_loss": -6.937981605529785, "global_step": 163676, "epoch": 3897} {"train_loss": -6.949626445770264, "global_step": 163677, "epoch": 3897} {"train_loss": -7.077536106109619, "global_step": 163678, "epoch": 3897} {"train_loss": -7.0318121910095215, "global_step": 163679, "epoch": 3897} {"train_loss": -6.939495086669922, "global_step": 163680, "epoch": 3897} {"train_loss": -7.038156986236572, "global_step": 163681, "epoch": 3897} {"train_loss": -6.815560817718506, "global_step": 163682, "epoch": 3897} {"train_loss": -6.95505428314209, "global_step": 163683, "epoch": 3897} {"train_loss": -7.079855918884277, "global_step": 163684, "epoch": 3897} {"train_loss": -6.905158996582031, "global_step": 163685, "epoch": 3897} {"train_loss": -6.967044353485107, "global_step": 163686, "epoch": 3897} {"train_loss": -6.9073567390441895, "global_step": 163687, "epoch": 3897} {"train_loss": -6.950384140014648, "global_step": 163688, "epoch": 3897} {"train_loss": -6.9564361572265625, "global_step": 163689, "epoch": 3897} {"train_loss": -6.96298360824585, "global_step": 163690, "epoch": 3897} {"train_loss": -7.029585838317871, "global_step": 163691, "epoch": 3897} {"train_loss": -6.980372428894043, "global_step": 163692, "epoch": 3897} {"train_loss": -6.965219974517822, "global_step": 163693, "epoch": 3897} {"train_loss": -6.912714004516602, "global_step": 163694, "epoch": 3897} {"train_loss": -7.021932601928711, "global_step": 163695, "epoch": 3897} {"train_loss": -6.98601770401001, "global_step": 163696, "epoch": 3897} {"train_loss": -6.977601051330566, "global_step": 163697, "epoch": 3897} {"train_loss": -7.006914138793945, "global_step": 163698, "epoch": 3897} {"train_loss": -6.965394973754883, "global_step": 163699, "epoch": 3897} {"train_loss": -7.005865573883057, "global_step": 163700, "epoch": 3897} {"train_loss": -6.840683460235596, "global_step": 163701, "epoch": 3897} {"train_loss": -6.83120059967041, "global_step": 163702, "epoch": 3897} {"train_loss": -7.032916069030762, "global_step": 163703, "epoch": 3897} {"train_loss": -6.922449111938477, "global_step": 163704, "epoch": 3897} {"train_loss": -6.90844202041626, "global_step": 163705, "epoch": 3897} {"train_loss": -6.846529483795166, "global_step": 163706, "epoch": 3897} {"train_loss": -7.001342296600342, "global_step": 163707, "epoch": 3897} {"train_loss": -7.058940887451172, "global_step": 163708, "epoch": 3897} {"train_loss": -6.904621124267578, "global_step": 163709, "epoch": 3897} {"train_loss": -6.926074504852295, "global_step": 163710, "epoch": 3897} {"train_loss": -6.858762741088867, "global_step": 163711, "epoch": 3897} {"train_loss": -6.9579315185546875, "global_step": 163712, "epoch": 3897} {"train_loss": -6.972966194152832, "global_step": 163713, "epoch": 3897} {"train_loss": -6.872107028961182, "global_step": 163714, "epoch": 3897} {"train_loss": -6.960941632588704, "global_step": 163715, "epoch": 3897, "val_loss": 79535.4453125} {"train_loss": -7.079194068908691, "global_step": 163716, "epoch": 3898} {"train_loss": -6.978906631469727, "global_step": 163717, "epoch": 3898} {"train_loss": -7.000499725341797, "global_step": 163718, "epoch": 3898} {"train_loss": -7.069851398468018, "global_step": 163719, "epoch": 3898} {"train_loss": -6.9451751708984375, "global_step": 163720, "epoch": 3898} {"train_loss": -6.950595855712891, "global_step": 163721, "epoch": 3898} {"train_loss": -6.826691627502441, "global_step": 163722, "epoch": 3898} {"train_loss": -6.899345397949219, "global_step": 163723, "epoch": 3898} {"train_loss": -6.978766918182373, "global_step": 163724, "epoch": 3898} {"train_loss": -6.943642616271973, "global_step": 163725, "epoch": 3898} {"train_loss": -6.908725738525391, "global_step": 163726, "epoch": 3898} {"train_loss": -7.023992538452148, "global_step": 163727, "epoch": 3898} {"train_loss": -6.97988224029541, "global_step": 163728, "epoch": 3898} {"train_loss": -7.015902519226074, "global_step": 163729, "epoch": 3898} {"train_loss": -7.048388957977295, "global_step": 163730, "epoch": 3898} {"train_loss": -6.931756019592285, "global_step": 163731, "epoch": 3898} {"train_loss": -7.02449893951416, "global_step": 163732, "epoch": 3898} {"train_loss": -6.855340003967285, "global_step": 163733, "epoch": 3898} {"train_loss": -7.066429615020752, "global_step": 163734, "epoch": 3898} {"train_loss": -6.8919291496276855, "global_step": 163735, "epoch": 3898} {"train_loss": -6.994555473327637, "global_step": 163736, "epoch": 3898} {"train_loss": -6.887772083282471, "global_step": 163737, "epoch": 3898} {"train_loss": -6.939140796661377, "global_step": 163738, "epoch": 3898} {"train_loss": -6.87362003326416, "global_step": 163739, "epoch": 3898} {"train_loss": -6.881659507751465, "global_step": 163740, "epoch": 3898} {"train_loss": -6.9772844314575195, "global_step": 163741, "epoch": 3898} {"train_loss": -6.809957027435303, "global_step": 163742, "epoch": 3898} {"train_loss": -6.998556137084961, "global_step": 163743, "epoch": 3898} {"train_loss": -6.850949764251709, "global_step": 163744, "epoch": 3898} {"train_loss": -6.815178871154785, "global_step": 163745, "epoch": 3898} {"train_loss": -7.023848056793213, "global_step": 163746, "epoch": 3898} {"train_loss": -6.930013656616211, "global_step": 163747, "epoch": 3898} {"train_loss": -7.066788196563721, "global_step": 163748, "epoch": 3898} {"train_loss": -7.079964637756348, "global_step": 163749, "epoch": 3898} {"train_loss": -6.970754623413086, "global_step": 163750, "epoch": 3898} {"train_loss": -6.777149200439453, "global_step": 163751, "epoch": 3898} {"train_loss": -6.8267292976379395, "global_step": 163752, "epoch": 3898} {"train_loss": -6.9336137771606445, "global_step": 163753, "epoch": 3898} {"train_loss": -6.852499961853027, "global_step": 163754, "epoch": 3898} {"train_loss": -7.084212303161621, "global_step": 163755, "epoch": 3898} {"train_loss": -6.908164024353027, "global_step": 163756, "epoch": 3898} {"train_loss": -6.947958367211478, "global_step": 163757, "epoch": 3898, "val_loss": 79460.0} {"train_loss": -6.914750099182129, "global_step": 163758, "epoch": 3899} {"train_loss": -6.955936431884766, "global_step": 163759, "epoch": 3899} {"train_loss": -6.912783622741699, "global_step": 163760, "epoch": 3899} {"train_loss": -6.999921798706055, "global_step": 163761, "epoch": 3899} {"train_loss": -7.026758193969727, "global_step": 163762, "epoch": 3899} {"train_loss": -7.056550979614258, "global_step": 163763, "epoch": 3899} {"train_loss": -6.947922706604004, "global_step": 163764, "epoch": 3899} {"train_loss": -6.964746475219727, "global_step": 163765, "epoch": 3899} {"train_loss": -6.977130889892578, "global_step": 163766, "epoch": 3899} {"train_loss": -7.050911903381348, "global_step": 163767, "epoch": 3899} {"train_loss": -6.97033166885376, "global_step": 163768, "epoch": 3899} {"train_loss": -7.016775131225586, "global_step": 163769, "epoch": 3899} {"train_loss": -6.971179008483887, "global_step": 163770, "epoch": 3899} {"train_loss": -6.980013847351074, "global_step": 163771, "epoch": 3899} {"train_loss": -7.013516902923584, "global_step": 163772, "epoch": 3899} {"train_loss": -7.045437812805176, "global_step": 163773, "epoch": 3899} {"train_loss": -6.969918727874756, "global_step": 163774, "epoch": 3899} {"train_loss": -7.040095329284668, "global_step": 163775, "epoch": 3899} {"train_loss": -6.977696895599365, "global_step": 163776, "epoch": 3899} {"train_loss": -7.148653030395508, "global_step": 163777, "epoch": 3899} {"train_loss": -7.17587947845459, "global_step": 163778, "epoch": 3899} {"train_loss": -7.039800643920898, "global_step": 163779, "epoch": 3899} {"train_loss": -7.009795188903809, "global_step": 163780, "epoch": 3899} {"train_loss": -7.11489200592041, "global_step": 163781, "epoch": 3899} {"train_loss": -7.014837265014648, "global_step": 163782, "epoch": 3899} {"train_loss": -7.048634052276611, "global_step": 163783, "epoch": 3899} {"train_loss": -7.030872821807861, "global_step": 163784, "epoch": 3899} {"train_loss": -7.023260593414307, "global_step": 163785, "epoch": 3899} {"train_loss": -7.040485382080078, "global_step": 163786, "epoch": 3899} {"train_loss": -6.930644989013672, "global_step": 163787, "epoch": 3899} {"train_loss": -7.053835868835449, "global_step": 163788, "epoch": 3899} {"train_loss": -6.9682512283325195, "global_step": 163789, "epoch": 3899} {"train_loss": -6.844272136688232, "global_step": 163790, "epoch": 3899} {"train_loss": -7.016956329345703, "global_step": 163791, "epoch": 3899} {"train_loss": -6.864231109619141, "global_step": 163792, "epoch": 3899} {"train_loss": -6.942361354827881, "global_step": 163793, "epoch": 3899} {"train_loss": -6.979207992553711, "global_step": 163794, "epoch": 3899} {"train_loss": -6.796871185302734, "global_step": 163795, "epoch": 3899} {"train_loss": -6.917107582092285, "global_step": 163796, "epoch": 3899} {"train_loss": -7.045759201049805, "global_step": 163797, "epoch": 3899} {"train_loss": -6.871212482452393, "global_step": 163798, "epoch": 3899} {"train_loss": -6.99336450440543, "global_step": 163799, "epoch": 3899, "val_loss": 79719.015625} {"train_loss": -6.96087646484375, "global_step": 163800, "epoch": 3900} {"train_loss": -6.968569755554199, "global_step": 163801, "epoch": 3900} {"train_loss": -7.037581443786621, "global_step": 163802, "epoch": 3900} {"train_loss": -7.0937395095825195, "global_step": 163803, "epoch": 3900} {"train_loss": -6.985452651977539, "global_step": 163804, "epoch": 3900} {"train_loss": -7.0070109367370605, "global_step": 163805, "epoch": 3900} {"train_loss": -6.858126640319824, "global_step": 163806, "epoch": 3900} {"train_loss": -7.040721893310547, "global_step": 163807, "epoch": 3900} {"train_loss": -7.0723876953125, "global_step": 163808, "epoch": 3900} {"train_loss": -6.917044639587402, "global_step": 163809, "epoch": 3900} {"train_loss": -6.976418972015381, "global_step": 163810, "epoch": 3900} {"train_loss": -6.9763383865356445, "global_step": 163811, "epoch": 3900} {"train_loss": -6.792516708374023, "global_step": 163812, "epoch": 3900} {"train_loss": -7.03548526763916, "global_step": 163813, "epoch": 3900} {"train_loss": -6.832042694091797, "global_step": 163814, "epoch": 3900} {"train_loss": -6.716093063354492, "global_step": 163815, "epoch": 3900} {"train_loss": -6.972202301025391, "global_step": 163816, "epoch": 3900} {"train_loss": -6.830240249633789, "global_step": 163817, "epoch": 3900} {"train_loss": -6.966913223266602, "global_step": 163818, "epoch": 3900} {"train_loss": -6.878865718841553, "global_step": 163819, "epoch": 3900} {"train_loss": -6.780320167541504, "global_step": 163820, "epoch": 3900} {"train_loss": -6.902570724487305, "global_step": 163821, "epoch": 3900} {"train_loss": -6.886700630187988, "global_step": 163822, "epoch": 3900} {"train_loss": -7.018958568572998, "global_step": 163823, "epoch": 3900} {"train_loss": -6.957266807556152, "global_step": 163824, "epoch": 3900} {"train_loss": -7.018362045288086, "global_step": 163825, "epoch": 3900} {"train_loss": -6.904007911682129, "global_step": 163826, "epoch": 3900} {"train_loss": -6.858763217926025, "global_step": 163827, "epoch": 3900} {"train_loss": -6.953860282897949, "global_step": 163828, "epoch": 3900} {"train_loss": -6.917436599731445, "global_step": 163829, "epoch": 3900} {"train_loss": -7.017673492431641, "global_step": 163830, "epoch": 3900} {"train_loss": -6.982405662536621, "global_step": 163831, "epoch": 3900} {"train_loss": -6.967491149902344, "global_step": 163832, "epoch": 3900} {"train_loss": -6.977368354797363, "global_step": 163833, "epoch": 3900} {"train_loss": -6.915576934814453, "global_step": 163834, "epoch": 3900} {"train_loss": -6.9829301834106445, "global_step": 163835, "epoch": 3900} {"train_loss": -6.95184326171875, "global_step": 163836, "epoch": 3900} {"train_loss": -6.903252601623535, "global_step": 163837, "epoch": 3900} {"train_loss": -7.033736228942871, "global_step": 163838, "epoch": 3900} {"train_loss": -6.970715522766113, "global_step": 163839, "epoch": 3900} {"train_loss": -6.956504821777344, "global_step": 163840, "epoch": 3900} {"train_loss": -6.945732321058001, "global_step": 163841, "epoch": 3900, "train/sim_max_reward_0": 0.7172141894118552, "train/sim_max_reward_1": 0.39928625953905184, "train/sim_max_reward_2": 0.5412171276525591, "train/sim_max_reward_3": 0.14766306619577196, "train/sim_max_reward_4": 0.8500471443594416, "train/sim_max_reward_5": 0.5662440338286685, "test/sim_max_reward_4500000": 0.9905294708930882, "test/sim_max_reward_4500001": 0.9059980209250642, "test/sim_max_reward_4500002": 0.8783487099474604, "test/sim_max_reward_4500003": 0.9624175728380508, "test/sim_max_reward_4500004": 0.1475477152573036, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 0.9209865458204626, "test/sim_max_reward_4500007": 0.8650190469435175, "test/sim_max_reward_4500008": 0.8035714780958769, "test/sim_max_reward_4500009": 0.05327496591758841, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.7816354998795417, "test/sim_max_reward_4500012": 0.8430391902899179, "test/sim_max_reward_4500013": 0.0031490295126387303, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.9515625278352057, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.14719007882396706, "test/sim_max_reward_4500018": 0.9657138986330293, "test/sim_max_reward_4500019": 0.9361490115097446, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8597255616970417, "test/sim_max_reward_4500022": 0.9290521071307773, "test/sim_max_reward_4500023": 0.5237368682595397, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9319749321177747, "test/sim_max_reward_4500026": 1.0, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.18998208045993598, "test/sim_max_reward_4500029": 0.060995347434674156, "test/sim_max_reward_4500030": 0.9840889410642704, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9720959067389806, "test/sim_max_reward_4500034": 0.9873070851898075, "test/sim_max_reward_4500035": 0.7452389002787917, "test/sim_max_reward_4500036": 0.5745684533801342, "test/sim_max_reward_4500037": 1.0, "test/sim_max_reward_4500038": 0.9588892221966662, "test/sim_max_reward_4500039": 0.9319347785878632, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.7955495685031001, "test/sim_max_reward_4500042": 0.03317160542874225, "test/sim_max_reward_4500043": 0.26586396446580607, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 1.0, "test/sim_max_reward_4500046": 0.919651175374691, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5369453034978914, "test/mean_score": 0.6381290511830778, "val_loss": 79429.0546875} {"train_loss": -6.975484848022461, "global_step": 163842, "epoch": 3901} {"train_loss": -6.952632904052734, "global_step": 163843, "epoch": 3901} {"train_loss": -7.025101184844971, "global_step": 163844, "epoch": 3901} {"train_loss": -6.930750846862793, "global_step": 163845, "epoch": 3901} {"train_loss": -6.88505744934082, "global_step": 163846, "epoch": 3901} {"train_loss": -6.971885681152344, "global_step": 163847, "epoch": 3901} {"train_loss": -6.960870742797852, "global_step": 163848, "epoch": 3901} {"train_loss": -6.88360595703125, "global_step": 163849, "epoch": 3901} {"train_loss": -6.900226593017578, "global_step": 163850, "epoch": 3901} {"train_loss": -6.7712202072143555, "global_step": 163851, "epoch": 3901} {"train_loss": -6.969236373901367, "global_step": 163852, "epoch": 3901} {"train_loss": -6.999190807342529, "global_step": 163853, "epoch": 3901} {"train_loss": -7.004354000091553, "global_step": 163854, "epoch": 3901} {"train_loss": -6.816648483276367, "global_step": 163855, "epoch": 3901} {"train_loss": -7.047337532043457, "global_step": 163856, "epoch": 3901} {"train_loss": -7.01541805267334, "global_step": 163857, "epoch": 3901} {"train_loss": -6.962183475494385, "global_step": 163858, "epoch": 3901} {"train_loss": -6.997805595397949, "global_step": 163859, "epoch": 3901} {"train_loss": -6.999103546142578, "global_step": 163860, "epoch": 3901} {"train_loss": -6.914726257324219, "global_step": 163861, "epoch": 3901} {"train_loss": -7.041627407073975, "global_step": 163862, "epoch": 3901} {"train_loss": -6.870294094085693, "global_step": 163863, "epoch": 3901} {"train_loss": -6.9435954093933105, "global_step": 163864, "epoch": 3901} {"train_loss": -6.986710548400879, "global_step": 163865, "epoch": 3901} {"train_loss": -6.874438285827637, "global_step": 163866, "epoch": 3901} {"train_loss": -6.971558094024658, "global_step": 163867, "epoch": 3901} {"train_loss": -6.90017032623291, "global_step": 163868, "epoch": 3901} {"train_loss": -6.990240573883057, "global_step": 163869, "epoch": 3901} {"train_loss": -6.944929122924805, "global_step": 163870, "epoch": 3901} {"train_loss": -6.9269304275512695, "global_step": 163871, "epoch": 3901} {"train_loss": -7.032997131347656, "global_step": 163872, "epoch": 3901} {"train_loss": -6.976494789123535, "global_step": 163873, "epoch": 3901} {"train_loss": -7.0243988037109375, "global_step": 163874, "epoch": 3901} {"train_loss": -7.03536319732666, "global_step": 163875, "epoch": 3901} {"train_loss": -6.975068092346191, "global_step": 163876, "epoch": 3901} {"train_loss": -7.081957817077637, "global_step": 163877, "epoch": 3901} {"train_loss": -6.954384803771973, "global_step": 163878, "epoch": 3901} {"train_loss": -6.974259853363037, "global_step": 163879, "epoch": 3901} {"train_loss": -6.949401378631592, "global_step": 163880, "epoch": 3901} {"train_loss": -6.929318428039551, "global_step": 163881, "epoch": 3901} {"train_loss": -7.071387767791748, "global_step": 163882, "epoch": 3901} {"train_loss": -6.959639674141293, "global_step": 163883, "epoch": 3901, "val_loss": 79266.4609375} {"train_loss": -6.973228454589844, "global_step": 163884, "epoch": 3902} {"train_loss": -6.975869655609131, "global_step": 163885, "epoch": 3902} {"train_loss": -6.8954315185546875, "global_step": 163886, "epoch": 3902} {"train_loss": -7.011036396026611, "global_step": 163887, "epoch": 3902} {"train_loss": -6.999868869781494, "global_step": 163888, "epoch": 3902} {"train_loss": -7.037229061126709, "global_step": 163889, "epoch": 3902} {"train_loss": -7.0150885581970215, "global_step": 163890, "epoch": 3902} {"train_loss": -6.987217903137207, "global_step": 163891, "epoch": 3902} {"train_loss": -6.955502510070801, "global_step": 163892, "epoch": 3902} {"train_loss": -6.985621452331543, "global_step": 163893, "epoch": 3902} {"train_loss": -6.973069190979004, "global_step": 163894, "epoch": 3902} {"train_loss": -7.045711517333984, "global_step": 163895, "epoch": 3902} {"train_loss": -6.921804428100586, "global_step": 163896, "epoch": 3902} {"train_loss": -7.107011318206787, "global_step": 163897, "epoch": 3902} {"train_loss": -7.009895324707031, "global_step": 163898, "epoch": 3902} {"train_loss": -7.016182899475098, "global_step": 163899, "epoch": 3902} {"train_loss": -7.025223731994629, "global_step": 163900, "epoch": 3902} {"train_loss": -6.956347465515137, "global_step": 163901, "epoch": 3902} {"train_loss": -7.05652379989624, "global_step": 163902, "epoch": 3902} {"train_loss": -7.063478469848633, "global_step": 163903, "epoch": 3902} {"train_loss": -7.054863929748535, "global_step": 163904, "epoch": 3902} {"train_loss": -6.933263301849365, "global_step": 163905, "epoch": 3902} {"train_loss": -7.082708358764648, "global_step": 163906, "epoch": 3902} {"train_loss": -6.952996253967285, "global_step": 163907, "epoch": 3902} {"train_loss": -6.949784755706787, "global_step": 163908, "epoch": 3902} {"train_loss": -7.037364482879639, "global_step": 163909, "epoch": 3902} {"train_loss": -6.88185453414917, "global_step": 163910, "epoch": 3902} {"train_loss": -6.922860622406006, "global_step": 163911, "epoch": 3902} {"train_loss": -7.0283966064453125, "global_step": 163912, "epoch": 3902} {"train_loss": -6.937291145324707, "global_step": 163913, "epoch": 3902} {"train_loss": -6.988408088684082, "global_step": 163914, "epoch": 3902} {"train_loss": -6.893945693969727, "global_step": 163915, "epoch": 3902} {"train_loss": -6.912684917449951, "global_step": 163916, "epoch": 3902} {"train_loss": -7.005428314208984, "global_step": 163917, "epoch": 3902} {"train_loss": -6.894623279571533, "global_step": 163918, "epoch": 3902} {"train_loss": -7.037410259246826, "global_step": 163919, "epoch": 3902} {"train_loss": -7.043156147003174, "global_step": 163920, "epoch": 3902} {"train_loss": -6.987558364868164, "global_step": 163921, "epoch": 3902} {"train_loss": -6.982642650604248, "global_step": 163922, "epoch": 3902} {"train_loss": -6.917242527008057, "global_step": 163923, "epoch": 3902} {"train_loss": -6.874795913696289, "global_step": 163924, "epoch": 3902} {"train_loss": -6.981748603639149, "global_step": 163925, "epoch": 3902, "val_loss": 79684.9453125} {"train_loss": -6.864907741546631, "global_step": 163926, "epoch": 3903} {"train_loss": -6.967018127441406, "global_step": 163927, "epoch": 3903} {"train_loss": -6.901004314422607, "global_step": 163928, "epoch": 3903} {"train_loss": -6.941409111022949, "global_step": 163929, "epoch": 3903} {"train_loss": -6.97528076171875, "global_step": 163930, "epoch": 3903} {"train_loss": -6.856115341186523, "global_step": 163931, "epoch": 3903} {"train_loss": -6.852016925811768, "global_step": 163932, "epoch": 3903} {"train_loss": -7.0584564208984375, "global_step": 163933, "epoch": 3903} {"train_loss": -6.853342533111572, "global_step": 163934, "epoch": 3903} {"train_loss": -6.946677207946777, "global_step": 163935, "epoch": 3903} {"train_loss": -6.861927032470703, "global_step": 163936, "epoch": 3903} {"train_loss": -6.866587162017822, "global_step": 163937, "epoch": 3903} {"train_loss": -6.976284980773926, "global_step": 163938, "epoch": 3903} {"train_loss": -6.986483097076416, "global_step": 163939, "epoch": 3903} {"train_loss": -6.792853832244873, "global_step": 163940, "epoch": 3903} {"train_loss": -6.860163688659668, "global_step": 163941, "epoch": 3903} {"train_loss": -6.961427211761475, "global_step": 163942, "epoch": 3903} {"train_loss": -6.752899646759033, "global_step": 163943, "epoch": 3903} {"train_loss": -6.803616523742676, "global_step": 163944, "epoch": 3903} {"train_loss": -6.878293037414551, "global_step": 163945, "epoch": 3903} {"train_loss": -6.893630027770996, "global_step": 163946, "epoch": 3903} {"train_loss": -7.055351257324219, "global_step": 163947, "epoch": 3903} {"train_loss": -6.790312767028809, "global_step": 163948, "epoch": 3903} {"train_loss": -6.915602207183838, "global_step": 163949, "epoch": 3903} {"train_loss": -6.952304840087891, "global_step": 163950, "epoch": 3903} {"train_loss": -7.060179710388184, "global_step": 163951, "epoch": 3903} {"train_loss": -6.882838249206543, "global_step": 163952, "epoch": 3903} {"train_loss": -6.958189964294434, "global_step": 163953, "epoch": 3903} {"train_loss": -7.060210227966309, "global_step": 163954, "epoch": 3903} {"train_loss": -6.764463424682617, "global_step": 163955, "epoch": 3903} {"train_loss": -7.010008335113525, "global_step": 163956, "epoch": 3903} {"train_loss": -6.895172119140625, "global_step": 163957, "epoch": 3903} {"train_loss": -7.031992435455322, "global_step": 163958, "epoch": 3903} {"train_loss": -6.92686128616333, "global_step": 163959, "epoch": 3903} {"train_loss": -6.908170700073242, "global_step": 163960, "epoch": 3903} {"train_loss": -6.942700386047363, "global_step": 163961, "epoch": 3903} {"train_loss": -6.959197521209717, "global_step": 163962, "epoch": 3903} {"train_loss": -6.953612327575684, "global_step": 163963, "epoch": 3903} {"train_loss": -6.968114852905273, "global_step": 163964, "epoch": 3903} {"train_loss": -6.9735918045043945, "global_step": 163965, "epoch": 3903} {"train_loss": -6.89639949798584, "global_step": 163966, "epoch": 3903} {"train_loss": -6.922021207355318, "global_step": 163967, "epoch": 3903, "val_loss": 79378.03125} {"train_loss": -7.010785102844238, "global_step": 163968, "epoch": 3904} {"train_loss": -6.934663772583008, "global_step": 163969, "epoch": 3904} {"train_loss": -6.824253082275391, "global_step": 163970, "epoch": 3904} {"train_loss": -7.00175666809082, "global_step": 163971, "epoch": 3904} {"train_loss": -6.875357627868652, "global_step": 163972, "epoch": 3904} {"train_loss": -6.991510391235352, "global_step": 163973, "epoch": 3904} {"train_loss": -7.084091663360596, "global_step": 163974, "epoch": 3904} {"train_loss": -7.056125164031982, "global_step": 163975, "epoch": 3904} {"train_loss": -6.924958229064941, "global_step": 163976, "epoch": 3904} {"train_loss": -6.9278998374938965, "global_step": 163977, "epoch": 3904} {"train_loss": -6.949770450592041, "global_step": 163978, "epoch": 3904} {"train_loss": -6.915099143981934, "global_step": 163979, "epoch": 3904} {"train_loss": -6.924822807312012, "global_step": 163980, "epoch": 3904} {"train_loss": -6.883545398712158, "global_step": 163981, "epoch": 3904} {"train_loss": -6.982066631317139, "global_step": 163982, "epoch": 3904} {"train_loss": -6.9786176681518555, "global_step": 163983, "epoch": 3904} {"train_loss": -6.836719989776611, "global_step": 163984, "epoch": 3904} {"train_loss": -6.912560939788818, "global_step": 163985, "epoch": 3904} {"train_loss": -6.9035539627075195, "global_step": 163986, "epoch": 3904} {"train_loss": -7.000980377197266, "global_step": 163987, "epoch": 3904} {"train_loss": -6.897761821746826, "global_step": 163988, "epoch": 3904} {"train_loss": -6.879367828369141, "global_step": 163989, "epoch": 3904} {"train_loss": -7.042196750640869, "global_step": 163990, "epoch": 3904} {"train_loss": -6.803597450256348, "global_step": 163991, "epoch": 3904} {"train_loss": -6.968928337097168, "global_step": 163992, "epoch": 3904} {"train_loss": -6.98264217376709, "global_step": 163993, "epoch": 3904} {"train_loss": -6.836556434631348, "global_step": 163994, "epoch": 3904} {"train_loss": -6.990900993347168, "global_step": 163995, "epoch": 3904} {"train_loss": -6.904995918273926, "global_step": 163996, "epoch": 3904} {"train_loss": -6.819108009338379, "global_step": 163997, "epoch": 3904} {"train_loss": -6.933516025543213, "global_step": 163998, "epoch": 3904} {"train_loss": -6.684247016906738, "global_step": 163999, "epoch": 3904} {"train_loss": -6.898025989532471, "global_step": 164000, "epoch": 3904} {"train_loss": -6.8798418045043945, "global_step": 164001, "epoch": 3904} {"train_loss": -6.877520561218262, "global_step": 164002, "epoch": 3904} {"train_loss": -6.889897346496582, "global_step": 164003, "epoch": 3904} {"train_loss": -6.90673828125, "global_step": 164004, "epoch": 3904} {"train_loss": -6.965632438659668, "global_step": 164005, "epoch": 3904} {"train_loss": -6.822870254516602, "global_step": 164006, "epoch": 3904} {"train_loss": -7.061049461364746, "global_step": 164007, "epoch": 3904} {"train_loss": -6.875619411468506, "global_step": 164008, "epoch": 3904} {"train_loss": -6.923777761913481, "global_step": 164009, "epoch": 3904, "val_loss": 79644.625} {"train_loss": -6.967623710632324, "global_step": 164010, "epoch": 3905} {"train_loss": -6.961244583129883, "global_step": 164011, "epoch": 3905} {"train_loss": -7.001501083374023, "global_step": 164012, "epoch": 3905} {"train_loss": -6.9141340255737305, "global_step": 164013, "epoch": 3905} {"train_loss": -7.0973663330078125, "global_step": 164014, "epoch": 3905} {"train_loss": -7.022763729095459, "global_step": 164015, "epoch": 3905} {"train_loss": -6.952061653137207, "global_step": 164016, "epoch": 3905} {"train_loss": -6.995484352111816, "global_step": 164017, "epoch": 3905} {"train_loss": -7.000784873962402, "global_step": 164018, "epoch": 3905} {"train_loss": -6.952053070068359, "global_step": 164019, "epoch": 3905} {"train_loss": -6.881927013397217, "global_step": 164020, "epoch": 3905} {"train_loss": -6.941322326660156, "global_step": 164021, "epoch": 3905} {"train_loss": -7.036559104919434, "global_step": 164022, "epoch": 3905} {"train_loss": -6.845429420471191, "global_step": 164023, "epoch": 3905} {"train_loss": -6.981116771697998, "global_step": 164024, "epoch": 3905} {"train_loss": -6.821563720703125, "global_step": 164025, "epoch": 3905} {"train_loss": -6.9645185470581055, "global_step": 164026, "epoch": 3905} {"train_loss": -6.984047889709473, "global_step": 164027, "epoch": 3905} {"train_loss": -6.923370361328125, "global_step": 164028, "epoch": 3905} {"train_loss": -6.932018280029297, "global_step": 164029, "epoch": 3905} {"train_loss": -6.946111679077148, "global_step": 164030, "epoch": 3905} {"train_loss": -6.911616325378418, "global_step": 164031, "epoch": 3905} {"train_loss": -6.918719291687012, "global_step": 164032, "epoch": 3905} {"train_loss": -6.874248504638672, "global_step": 164033, "epoch": 3905} {"train_loss": -6.874204635620117, "global_step": 164034, "epoch": 3905} {"train_loss": -6.924991607666016, "global_step": 164035, "epoch": 3905} {"train_loss": -7.056380271911621, "global_step": 164036, "epoch": 3905} {"train_loss": -6.9810919761657715, "global_step": 164037, "epoch": 3905} {"train_loss": -6.990760803222656, "global_step": 164038, "epoch": 3905} {"train_loss": -7.025193214416504, "global_step": 164039, "epoch": 3905} {"train_loss": -6.898926734924316, "global_step": 164040, "epoch": 3905} {"train_loss": -6.989556312561035, "global_step": 164041, "epoch": 3905} {"train_loss": -6.972675323486328, "global_step": 164042, "epoch": 3905} {"train_loss": -7.069127082824707, "global_step": 164043, "epoch": 3905} {"train_loss": -7.018740177154541, "global_step": 164044, "epoch": 3905} {"train_loss": -6.966989994049072, "global_step": 164045, "epoch": 3905} {"train_loss": -7.092014312744141, "global_step": 164046, "epoch": 3905} {"train_loss": -6.960386276245117, "global_step": 164047, "epoch": 3905} {"train_loss": -6.955120086669922, "global_step": 164048, "epoch": 3905} {"train_loss": -7.057339668273926, "global_step": 164049, "epoch": 3905} {"train_loss": -7.037143230438232, "global_step": 164050, "epoch": 3905} {"train_loss": -6.972128958929153, "global_step": 164051, "epoch": 3905, "val_loss": 79440.171875} {"train_loss": -7.053805351257324, "global_step": 164052, "epoch": 3906} {"train_loss": -7.003777503967285, "global_step": 164053, "epoch": 3906} {"train_loss": -7.010857105255127, "global_step": 164054, "epoch": 3906} {"train_loss": -6.897112846374512, "global_step": 164055, "epoch": 3906} {"train_loss": -7.069938659667969, "global_step": 164056, "epoch": 3906} {"train_loss": -7.008824348449707, "global_step": 164057, "epoch": 3906} {"train_loss": -7.0799479484558105, "global_step": 164058, "epoch": 3906} {"train_loss": -7.015679359436035, "global_step": 164059, "epoch": 3906} {"train_loss": -6.952265739440918, "global_step": 164060, "epoch": 3906} {"train_loss": -7.058832168579102, "global_step": 164061, "epoch": 3906} {"train_loss": -6.968648910522461, "global_step": 164062, "epoch": 3906} {"train_loss": -7.0332560539245605, "global_step": 164063, "epoch": 3906} {"train_loss": -7.015143871307373, "global_step": 164064, "epoch": 3906} {"train_loss": -6.933320999145508, "global_step": 164065, "epoch": 3906} {"train_loss": -7.086278915405273, "global_step": 164066, "epoch": 3906} {"train_loss": -6.955318450927734, "global_step": 164067, "epoch": 3906} {"train_loss": -6.987972259521484, "global_step": 164068, "epoch": 3906} {"train_loss": -7.095012664794922, "global_step": 164069, "epoch": 3906} {"train_loss": -6.906039237976074, "global_step": 164070, "epoch": 3906} {"train_loss": -6.9417266845703125, "global_step": 164071, "epoch": 3906} {"train_loss": -7.0035858154296875, "global_step": 164072, "epoch": 3906} {"train_loss": -6.982515811920166, "global_step": 164073, "epoch": 3906} {"train_loss": -6.968013763427734, "global_step": 164074, "epoch": 3906} {"train_loss": -7.063200950622559, "global_step": 164075, "epoch": 3906} {"train_loss": -7.033320426940918, "global_step": 164076, "epoch": 3906} {"train_loss": -7.034974575042725, "global_step": 164077, "epoch": 3906} {"train_loss": -7.006260395050049, "global_step": 164078, "epoch": 3906} {"train_loss": -7.099702835083008, "global_step": 164079, "epoch": 3906} {"train_loss": -6.985620498657227, "global_step": 164080, "epoch": 3906} {"train_loss": -7.038425445556641, "global_step": 164081, "epoch": 3906} {"train_loss": -7.079855918884277, "global_step": 164082, "epoch": 3906} {"train_loss": -6.993991374969482, "global_step": 164083, "epoch": 3906} {"train_loss": -7.112006187438965, "global_step": 164084, "epoch": 3906} {"train_loss": -6.965653419494629, "global_step": 164085, "epoch": 3906} {"train_loss": -7.1610565185546875, "global_step": 164086, "epoch": 3906} {"train_loss": -6.944894313812256, "global_step": 164087, "epoch": 3906} {"train_loss": -7.0259108543396, "global_step": 164088, "epoch": 3906} {"train_loss": -6.979106903076172, "global_step": 164089, "epoch": 3906} {"train_loss": -7.10673189163208, "global_step": 164090, "epoch": 3906} {"train_loss": -7.051117897033691, "global_step": 164091, "epoch": 3906} {"train_loss": -7.02468204498291, "global_step": 164092, "epoch": 3906} {"train_loss": -7.016740605944679, "global_step": 164093, "epoch": 3906, "val_loss": 79742.578125} {"train_loss": -6.984650611877441, "global_step": 164094, "epoch": 3907} {"train_loss": -7.037824630737305, "global_step": 164095, "epoch": 3907} {"train_loss": -6.968906402587891, "global_step": 164096, "epoch": 3907} {"train_loss": -7.037811279296875, "global_step": 164097, "epoch": 3907} {"train_loss": -6.999052047729492, "global_step": 164098, "epoch": 3907} {"train_loss": -7.083313465118408, "global_step": 164099, "epoch": 3907} {"train_loss": -7.018721580505371, "global_step": 164100, "epoch": 3907} {"train_loss": -7.0033488273620605, "global_step": 164101, "epoch": 3907} {"train_loss": -7.0164103507995605, "global_step": 164102, "epoch": 3907} {"train_loss": -7.021155834197998, "global_step": 164103, "epoch": 3907} {"train_loss": -7.004364967346191, "global_step": 164104, "epoch": 3907} {"train_loss": -6.991504669189453, "global_step": 164105, "epoch": 3907} {"train_loss": -6.982186317443848, "global_step": 164106, "epoch": 3907} {"train_loss": -7.00636100769043, "global_step": 164107, "epoch": 3907} {"train_loss": -6.831608772277832, "global_step": 164108, "epoch": 3907} {"train_loss": -7.043117523193359, "global_step": 164109, "epoch": 3907} {"train_loss": -7.133553504943848, "global_step": 164110, "epoch": 3907} {"train_loss": -7.0043439865112305, "global_step": 164111, "epoch": 3907} {"train_loss": -6.995813846588135, "global_step": 164112, "epoch": 3907} {"train_loss": -7.0586419105529785, "global_step": 164113, "epoch": 3907} {"train_loss": -6.948004722595215, "global_step": 164114, "epoch": 3907} {"train_loss": -6.9549150466918945, "global_step": 164115, "epoch": 3907} {"train_loss": -7.001142501831055, "global_step": 164116, "epoch": 3907} {"train_loss": -7.031269073486328, "global_step": 164117, "epoch": 3907} {"train_loss": -6.971138954162598, "global_step": 164118, "epoch": 3907} {"train_loss": -7.002387046813965, "global_step": 164119, "epoch": 3907} {"train_loss": -7.026938438415527, "global_step": 164120, "epoch": 3907} {"train_loss": -7.043038368225098, "global_step": 164121, "epoch": 3907} {"train_loss": -6.986177921295166, "global_step": 164122, "epoch": 3907} {"train_loss": -7.011814117431641, "global_step": 164123, "epoch": 3907} {"train_loss": -6.9946370124816895, "global_step": 164124, "epoch": 3907} {"train_loss": -6.954532623291016, "global_step": 164125, "epoch": 3907} {"train_loss": -6.929495811462402, "global_step": 164126, "epoch": 3907} {"train_loss": -6.973504066467285, "global_step": 164127, "epoch": 3907} {"train_loss": -7.098423004150391, "global_step": 164128, "epoch": 3907} {"train_loss": -7.099418640136719, "global_step": 164129, "epoch": 3907} {"train_loss": -6.969389915466309, "global_step": 164130, "epoch": 3907} {"train_loss": -7.044096946716309, "global_step": 164131, "epoch": 3907} {"train_loss": -6.97189998626709, "global_step": 164132, "epoch": 3907} {"train_loss": -7.052186489105225, "global_step": 164133, "epoch": 3907} {"train_loss": -7.137599945068359, "global_step": 164134, "epoch": 3907} {"train_loss": -7.009980928330195, "global_step": 164135, "epoch": 3907, "val_loss": 79532.421875} {"train_loss": -7.045653343200684, "global_step": 164136, "epoch": 3908} {"train_loss": -7.0157976150512695, "global_step": 164137, "epoch": 3908} {"train_loss": -7.041345596313477, "global_step": 164138, "epoch": 3908} {"train_loss": -6.921763896942139, "global_step": 164139, "epoch": 3908} {"train_loss": -6.991342544555664, "global_step": 164140, "epoch": 3908} {"train_loss": -6.966241359710693, "global_step": 164141, "epoch": 3908} {"train_loss": -6.9681525230407715, "global_step": 164142, "epoch": 3908} {"train_loss": -7.113023281097412, "global_step": 164143, "epoch": 3908} {"train_loss": -6.933232307434082, "global_step": 164144, "epoch": 3908} {"train_loss": -7.030592918395996, "global_step": 164145, "epoch": 3908} {"train_loss": -6.965034484863281, "global_step": 164146, "epoch": 3908} {"train_loss": -7.0201544761657715, "global_step": 164147, "epoch": 3908} {"train_loss": -6.974601745605469, "global_step": 164148, "epoch": 3908} {"train_loss": -6.977177143096924, "global_step": 164149, "epoch": 3908} {"train_loss": -7.010659217834473, "global_step": 164150, "epoch": 3908} {"train_loss": -6.927231788635254, "global_step": 164151, "epoch": 3908} {"train_loss": -7.001924991607666, "global_step": 164152, "epoch": 3908} {"train_loss": -6.964406967163086, "global_step": 164153, "epoch": 3908} {"train_loss": -6.904890060424805, "global_step": 164154, "epoch": 3908} {"train_loss": -7.010149955749512, "global_step": 164155, "epoch": 3908} {"train_loss": -6.959628105163574, "global_step": 164156, "epoch": 3908} {"train_loss": -6.966303825378418, "global_step": 164157, "epoch": 3908} {"train_loss": -7.154679298400879, "global_step": 164158, "epoch": 3908} {"train_loss": -7.076323509216309, "global_step": 164159, "epoch": 3908} {"train_loss": -7.005487442016602, "global_step": 164160, "epoch": 3908} {"train_loss": -7.041640281677246, "global_step": 164161, "epoch": 3908} {"train_loss": -7.067119121551514, "global_step": 164162, "epoch": 3908} {"train_loss": -6.960399627685547, "global_step": 164163, "epoch": 3908} {"train_loss": -7.016879081726074, "global_step": 164164, "epoch": 3908} {"train_loss": -7.036031723022461, "global_step": 164165, "epoch": 3908} {"train_loss": -7.129598140716553, "global_step": 164166, "epoch": 3908} {"train_loss": -7.076444625854492, "global_step": 164167, "epoch": 3908} {"train_loss": -7.037410736083984, "global_step": 164168, "epoch": 3908} {"train_loss": -7.026488304138184, "global_step": 164169, "epoch": 3908} {"train_loss": -7.02390193939209, "global_step": 164170, "epoch": 3908} {"train_loss": -7.03394889831543, "global_step": 164171, "epoch": 3908} {"train_loss": -7.102863311767578, "global_step": 164172, "epoch": 3908} {"train_loss": -7.035398483276367, "global_step": 164173, "epoch": 3908} {"train_loss": -7.103934288024902, "global_step": 164174, "epoch": 3908} {"train_loss": -6.979500770568848, "global_step": 164175, "epoch": 3908} {"train_loss": -7.060196399688721, "global_step": 164176, "epoch": 3908} {"train_loss": -7.01456930523827, "global_step": 164177, "epoch": 3908, "val_loss": 79298.734375} {"train_loss": -6.96523380279541, "global_step": 164178, "epoch": 3909} {"train_loss": -6.8988752365112305, "global_step": 164179, "epoch": 3909} {"train_loss": -6.999512195587158, "global_step": 164180, "epoch": 3909} {"train_loss": -6.99415397644043, "global_step": 164181, "epoch": 3909} {"train_loss": -6.9217424392700195, "global_step": 164182, "epoch": 3909} {"train_loss": -6.862344741821289, "global_step": 164183, "epoch": 3909} {"train_loss": -6.7644219398498535, "global_step": 164184, "epoch": 3909} {"train_loss": -6.897989749908447, "global_step": 164185, "epoch": 3909} {"train_loss": -6.930769443511963, "global_step": 164186, "epoch": 3909} {"train_loss": -6.85154914855957, "global_step": 164187, "epoch": 3909} {"train_loss": -6.853247165679932, "global_step": 164188, "epoch": 3909} {"train_loss": -6.779065132141113, "global_step": 164189, "epoch": 3909} {"train_loss": -6.853340148925781, "global_step": 164190, "epoch": 3909} {"train_loss": -6.859285354614258, "global_step": 164191, "epoch": 3909} {"train_loss": -6.982781410217285, "global_step": 164192, "epoch": 3909} {"train_loss": -6.925972938537598, "global_step": 164193, "epoch": 3909} {"train_loss": -7.0865912437438965, "global_step": 164194, "epoch": 3909} {"train_loss": -6.97999382019043, "global_step": 164195, "epoch": 3909} {"train_loss": -7.018179893493652, "global_step": 164196, "epoch": 3909} {"train_loss": -7.0319623947143555, "global_step": 164197, "epoch": 3909} {"train_loss": -6.981118202209473, "global_step": 164198, "epoch": 3909} {"train_loss": -7.036447525024414, "global_step": 164199, "epoch": 3909} {"train_loss": -7.035622596740723, "global_step": 164200, "epoch": 3909} {"train_loss": -6.96246337890625, "global_step": 164201, "epoch": 3909} {"train_loss": -6.967084884643555, "global_step": 164202, "epoch": 3909} {"train_loss": -7.091646194458008, "global_step": 164203, "epoch": 3909} {"train_loss": -7.054210186004639, "global_step": 164204, "epoch": 3909} {"train_loss": -7.0125885009765625, "global_step": 164205, "epoch": 3909} {"train_loss": -7.0045342445373535, "global_step": 164206, "epoch": 3909} {"train_loss": -7.063370704650879, "global_step": 164207, "epoch": 3909} {"train_loss": -7.002333164215088, "global_step": 164208, "epoch": 3909} {"train_loss": -6.921210289001465, "global_step": 164209, "epoch": 3909} {"train_loss": -7.009771823883057, "global_step": 164210, "epoch": 3909} {"train_loss": -7.026031494140625, "global_step": 164211, "epoch": 3909} {"train_loss": -6.989452362060547, "global_step": 164212, "epoch": 3909} {"train_loss": -6.968008041381836, "global_step": 164213, "epoch": 3909} {"train_loss": -7.048983573913574, "global_step": 164214, "epoch": 3909} {"train_loss": -6.937931060791016, "global_step": 164215, "epoch": 3909} {"train_loss": -6.83330774307251, "global_step": 164216, "epoch": 3909} {"train_loss": -7.004907608032227, "global_step": 164217, "epoch": 3909} {"train_loss": -7.005532741546631, "global_step": 164218, "epoch": 3909} {"train_loss": -6.964673099063692, "global_step": 164219, "epoch": 3909, "val_loss": 79410.8046875} {"train_loss": -6.970973968505859, "global_step": 164220, "epoch": 3910} {"train_loss": -7.024383544921875, "global_step": 164221, "epoch": 3910} {"train_loss": -7.092137336730957, "global_step": 164222, "epoch": 3910} {"train_loss": -7.002893447875977, "global_step": 164223, "epoch": 3910} {"train_loss": -7.110269546508789, "global_step": 164224, "epoch": 3910} {"train_loss": -6.904801368713379, "global_step": 164225, "epoch": 3910} {"train_loss": -6.971417427062988, "global_step": 164226, "epoch": 3910} {"train_loss": -7.00853157043457, "global_step": 164227, "epoch": 3910} {"train_loss": -6.8688578605651855, "global_step": 164228, "epoch": 3910} {"train_loss": -7.0669965744018555, "global_step": 164229, "epoch": 3910} {"train_loss": -7.019845962524414, "global_step": 164230, "epoch": 3910} {"train_loss": -6.9834885597229, "global_step": 164231, "epoch": 3910} {"train_loss": -7.027099132537842, "global_step": 164232, "epoch": 3910} {"train_loss": -7.034854888916016, "global_step": 164233, "epoch": 3910} {"train_loss": -7.000270843505859, "global_step": 164234, "epoch": 3910} {"train_loss": -7.045764923095703, "global_step": 164235, "epoch": 3910} {"train_loss": -7.001027584075928, "global_step": 164236, "epoch": 3910} {"train_loss": -6.9798383712768555, "global_step": 164237, "epoch": 3910} {"train_loss": -7.004500389099121, "global_step": 164238, "epoch": 3910} {"train_loss": -7.0473432540893555, "global_step": 164239, "epoch": 3910} {"train_loss": -7.071346759796143, "global_step": 164240, "epoch": 3910} {"train_loss": -6.998492240905762, "global_step": 164241, "epoch": 3910} {"train_loss": -7.0738043785095215, "global_step": 164242, "epoch": 3910} {"train_loss": -7.016491889953613, "global_step": 164243, "epoch": 3910} {"train_loss": -6.946077346801758, "global_step": 164244, "epoch": 3910} {"train_loss": -7.012105464935303, "global_step": 164245, "epoch": 3910} {"train_loss": -7.084829330444336, "global_step": 164246, "epoch": 3910} {"train_loss": -7.046432971954346, "global_step": 164247, "epoch": 3910} {"train_loss": -6.970340251922607, "global_step": 164248, "epoch": 3910} {"train_loss": -7.002882957458496, "global_step": 164249, "epoch": 3910} {"train_loss": -7.056617736816406, "global_step": 164250, "epoch": 3910} {"train_loss": -7.0007710456848145, "global_step": 164251, "epoch": 3910} {"train_loss": -6.8788557052612305, "global_step": 164252, "epoch": 3910} {"train_loss": -6.986273288726807, "global_step": 164253, "epoch": 3910} {"train_loss": -7.062001705169678, "global_step": 164254, "epoch": 3910} {"train_loss": -6.97216796875, "global_step": 164255, "epoch": 3910} {"train_loss": -6.9077863693237305, "global_step": 164256, "epoch": 3910} {"train_loss": -6.942255973815918, "global_step": 164257, "epoch": 3910} {"train_loss": -6.994354724884033, "global_step": 164258, "epoch": 3910} {"train_loss": -6.964704990386963, "global_step": 164259, "epoch": 3910} {"train_loss": -7.001420974731445, "global_step": 164260, "epoch": 3910} {"train_loss": -7.001457112176078, "global_step": 164261, "epoch": 3910, "val_loss": 79690.4609375} {"train_loss": -7.009243488311768, "global_step": 164262, "epoch": 3911} {"train_loss": -7.0723724365234375, "global_step": 164263, "epoch": 3911} {"train_loss": -7.069075584411621, "global_step": 164264, "epoch": 3911} {"train_loss": -6.955860614776611, "global_step": 164265, "epoch": 3911} {"train_loss": -6.9552083015441895, "global_step": 164266, "epoch": 3911} {"train_loss": -6.864534378051758, "global_step": 164267, "epoch": 3911} {"train_loss": -6.946687698364258, "global_step": 164268, "epoch": 3911} {"train_loss": -6.990800857543945, "global_step": 164269, "epoch": 3911} {"train_loss": -6.868730545043945, "global_step": 164270, "epoch": 3911} {"train_loss": -7.005553245544434, "global_step": 164271, "epoch": 3911} {"train_loss": -7.03870964050293, "global_step": 164272, "epoch": 3911} {"train_loss": -7.034209251403809, "global_step": 164273, "epoch": 3911} {"train_loss": -7.029514312744141, "global_step": 164274, "epoch": 3911} {"train_loss": -7.030659198760986, "global_step": 164275, "epoch": 3911} {"train_loss": -6.994232177734375, "global_step": 164276, "epoch": 3911} {"train_loss": -6.870814323425293, "global_step": 164277, "epoch": 3911} {"train_loss": -6.989336013793945, "global_step": 164278, "epoch": 3911} {"train_loss": -6.8422770500183105, "global_step": 164279, "epoch": 3911} {"train_loss": -6.915312767028809, "global_step": 164280, "epoch": 3911} {"train_loss": -6.907751560211182, "global_step": 164281, "epoch": 3911} {"train_loss": -6.852164268493652, "global_step": 164282, "epoch": 3911} {"train_loss": -6.964747428894043, "global_step": 164283, "epoch": 3911} {"train_loss": -6.821693420410156, "global_step": 164284, "epoch": 3911} {"train_loss": -7.007923126220703, "global_step": 164285, "epoch": 3911} {"train_loss": -6.9545087814331055, "global_step": 164286, "epoch": 3911} {"train_loss": -6.951678276062012, "global_step": 164287, "epoch": 3911} {"train_loss": -7.019899368286133, "global_step": 164288, "epoch": 3911} {"train_loss": -6.950114727020264, "global_step": 164289, "epoch": 3911} {"train_loss": -6.962409019470215, "global_step": 164290, "epoch": 3911} {"train_loss": -7.0446271896362305, "global_step": 164291, "epoch": 3911} {"train_loss": -6.976769924163818, "global_step": 164292, "epoch": 3911} {"train_loss": -6.887811660766602, "global_step": 164293, "epoch": 3911} {"train_loss": -6.9705939292907715, "global_step": 164294, "epoch": 3911} {"train_loss": -6.9053802490234375, "global_step": 164295, "epoch": 3911} {"train_loss": -6.992095947265625, "global_step": 164296, "epoch": 3911} {"train_loss": -7.096840858459473, "global_step": 164297, "epoch": 3911} {"train_loss": -6.906282901763916, "global_step": 164298, "epoch": 3911} {"train_loss": -7.0461883544921875, "global_step": 164299, "epoch": 3911} {"train_loss": -6.819360256195068, "global_step": 164300, "epoch": 3911} {"train_loss": -6.912006855010986, "global_step": 164301, "epoch": 3911} {"train_loss": -7.037650108337402, "global_step": 164302, "epoch": 3911} {"train_loss": -6.959075008119855, "global_step": 164303, "epoch": 3911, "val_loss": 79512.7734375} {"train_loss": -6.944424152374268, "global_step": 164304, "epoch": 3912} {"train_loss": -7.0392327308654785, "global_step": 164305, "epoch": 3912} {"train_loss": -6.907630920410156, "global_step": 164306, "epoch": 3912} {"train_loss": -7.030285835266113, "global_step": 164307, "epoch": 3912} {"train_loss": -7.018695831298828, "global_step": 164308, "epoch": 3912} {"train_loss": -6.871426582336426, "global_step": 164309, "epoch": 3912} {"train_loss": -6.793267250061035, "global_step": 164310, "epoch": 3912} {"train_loss": -6.996721267700195, "global_step": 164311, "epoch": 3912} {"train_loss": -6.918605804443359, "global_step": 164312, "epoch": 3912} {"train_loss": -6.913949489593506, "global_step": 164313, "epoch": 3912} {"train_loss": -6.8687591552734375, "global_step": 164314, "epoch": 3912} {"train_loss": -6.802862167358398, "global_step": 164315, "epoch": 3912} {"train_loss": -6.978944778442383, "global_step": 164316, "epoch": 3912} {"train_loss": -6.871857643127441, "global_step": 164317, "epoch": 3912} {"train_loss": -6.938784599304199, "global_step": 164318, "epoch": 3912} {"train_loss": -6.987719535827637, "global_step": 164319, "epoch": 3912} {"train_loss": -7.0267720222473145, "global_step": 164320, "epoch": 3912} {"train_loss": -6.8737473487854, "global_step": 164321, "epoch": 3912} {"train_loss": -6.881682395935059, "global_step": 164322, "epoch": 3912} {"train_loss": -6.972985744476318, "global_step": 164323, "epoch": 3912} {"train_loss": -6.938882827758789, "global_step": 164324, "epoch": 3912} {"train_loss": -6.868342399597168, "global_step": 164325, "epoch": 3912} {"train_loss": -7.012380599975586, "global_step": 164326, "epoch": 3912} {"train_loss": -7.106744766235352, "global_step": 164327, "epoch": 3912} {"train_loss": -7.038668632507324, "global_step": 164328, "epoch": 3912} {"train_loss": -7.032361030578613, "global_step": 164329, "epoch": 3912} {"train_loss": -6.907320976257324, "global_step": 164330, "epoch": 3912} {"train_loss": -6.975183486938477, "global_step": 164331, "epoch": 3912} {"train_loss": -7.001343727111816, "global_step": 164332, "epoch": 3912} {"train_loss": -6.963085174560547, "global_step": 164333, "epoch": 3912} {"train_loss": -7.023369789123535, "global_step": 164334, "epoch": 3912} {"train_loss": -6.88800048828125, "global_step": 164335, "epoch": 3912} {"train_loss": -6.941545009613037, "global_step": 164336, "epoch": 3912} {"train_loss": -6.933058738708496, "global_step": 164337, "epoch": 3912} {"train_loss": -6.942756652832031, "global_step": 164338, "epoch": 3912} {"train_loss": -6.982260227203369, "global_step": 164339, "epoch": 3912} {"train_loss": -7.025073051452637, "global_step": 164340, "epoch": 3912} {"train_loss": -7.040643215179443, "global_step": 164341, "epoch": 3912} {"train_loss": -6.979248523712158, "global_step": 164342, "epoch": 3912} {"train_loss": -6.871822357177734, "global_step": 164343, "epoch": 3912} {"train_loss": -6.990863800048828, "global_step": 164344, "epoch": 3912} {"train_loss": -6.955350024359567, "global_step": 164345, "epoch": 3912, "val_loss": 79525.5078125} {"train_loss": -6.977588176727295, "global_step": 164346, "epoch": 3913} {"train_loss": -7.077651023864746, "global_step": 164347, "epoch": 3913} {"train_loss": -7.176726341247559, "global_step": 164348, "epoch": 3913} {"train_loss": -6.982635498046875, "global_step": 164349, "epoch": 3913} {"train_loss": -6.890235900878906, "global_step": 164350, "epoch": 3913} {"train_loss": -7.012660026550293, "global_step": 164351, "epoch": 3913} {"train_loss": -6.937201499938965, "global_step": 164352, "epoch": 3913} {"train_loss": -7.070751190185547, "global_step": 164353, "epoch": 3913} {"train_loss": -7.0210957527160645, "global_step": 164354, "epoch": 3913} {"train_loss": -6.945834636688232, "global_step": 164355, "epoch": 3913} {"train_loss": -6.89818811416626, "global_step": 164356, "epoch": 3913} {"train_loss": -7.049568176269531, "global_step": 164357, "epoch": 3913} {"train_loss": -6.978420257568359, "global_step": 164358, "epoch": 3913} {"train_loss": -6.9257612228393555, "global_step": 164359, "epoch": 3913} {"train_loss": -6.916607856750488, "global_step": 164360, "epoch": 3913} {"train_loss": -6.898858070373535, "global_step": 164361, "epoch": 3913} {"train_loss": -6.764002799987793, "global_step": 164362, "epoch": 3913} {"train_loss": -6.963952541351318, "global_step": 164363, "epoch": 3913} {"train_loss": -7.088260650634766, "global_step": 164364, "epoch": 3913} {"train_loss": -7.007033348083496, "global_step": 164365, "epoch": 3913} {"train_loss": -6.920982360839844, "global_step": 164366, "epoch": 3913} {"train_loss": -6.943173408508301, "global_step": 164367, "epoch": 3913} {"train_loss": -6.9666595458984375, "global_step": 164368, "epoch": 3913} {"train_loss": -6.994502067565918, "global_step": 164369, "epoch": 3913} {"train_loss": -7.028077125549316, "global_step": 164370, "epoch": 3913} {"train_loss": -7.024088382720947, "global_step": 164371, "epoch": 3913} {"train_loss": -6.8235883712768555, "global_step": 164372, "epoch": 3913} {"train_loss": -6.992715835571289, "global_step": 164373, "epoch": 3913} {"train_loss": -6.9630961418151855, "global_step": 164374, "epoch": 3913} {"train_loss": -6.713051795959473, "global_step": 164375, "epoch": 3913} {"train_loss": -6.976413726806641, "global_step": 164376, "epoch": 3913} {"train_loss": -6.666216850280762, "global_step": 164377, "epoch": 3913} {"train_loss": -6.836493492126465, "global_step": 164378, "epoch": 3913} {"train_loss": -6.928596496582031, "global_step": 164379, "epoch": 3913} {"train_loss": -6.777876853942871, "global_step": 164380, "epoch": 3913} {"train_loss": -6.981873035430908, "global_step": 164381, "epoch": 3913} {"train_loss": -6.796484470367432, "global_step": 164382, "epoch": 3913} {"train_loss": -6.976471424102783, "global_step": 164383, "epoch": 3913} {"train_loss": -6.854734420776367, "global_step": 164384, "epoch": 3913} {"train_loss": -6.822202205657959, "global_step": 164385, "epoch": 3913} {"train_loss": -6.812256813049316, "global_step": 164386, "epoch": 3913} {"train_loss": -6.933573666073027, "global_step": 164387, "epoch": 3913, "val_loss": 79843.09375} {"train_loss": -6.866045951843262, "global_step": 164388, "epoch": 3914} {"train_loss": -6.996960639953613, "global_step": 164389, "epoch": 3914} {"train_loss": -6.741093635559082, "global_step": 164390, "epoch": 3914} {"train_loss": -7.026056289672852, "global_step": 164391, "epoch": 3914} {"train_loss": -6.943212509155273, "global_step": 164392, "epoch": 3914} {"train_loss": -6.912992477416992, "global_step": 164393, "epoch": 3914} {"train_loss": -6.935110092163086, "global_step": 164394, "epoch": 3914} {"train_loss": -6.9495463371276855, "global_step": 164395, "epoch": 3914} {"train_loss": -6.966860771179199, "global_step": 164396, "epoch": 3914} {"train_loss": -7.063655853271484, "global_step": 164397, "epoch": 3914} {"train_loss": -7.018423557281494, "global_step": 164398, "epoch": 3914} {"train_loss": -7.042446136474609, "global_step": 164399, "epoch": 3914} {"train_loss": -7.055213451385498, "global_step": 164400, "epoch": 3914} {"train_loss": -6.972534656524658, "global_step": 164401, "epoch": 3914} {"train_loss": -7.045111656188965, "global_step": 164402, "epoch": 3914} {"train_loss": -7.045269966125488, "global_step": 164403, "epoch": 3914} {"train_loss": -7.001816272735596, "global_step": 164404, "epoch": 3914} {"train_loss": -7.089888572692871, "global_step": 164405, "epoch": 3914} {"train_loss": -7.067041397094727, "global_step": 164406, "epoch": 3914} {"train_loss": -7.018925189971924, "global_step": 164407, "epoch": 3914} {"train_loss": -6.908702850341797, "global_step": 164408, "epoch": 3914} {"train_loss": -7.054479122161865, "global_step": 164409, "epoch": 3914} {"train_loss": -7.02603006362915, "global_step": 164410, "epoch": 3914} {"train_loss": -7.098536491394043, "global_step": 164411, "epoch": 3914} {"train_loss": -6.94882869720459, "global_step": 164412, "epoch": 3914} {"train_loss": -7.023382186889648, "global_step": 164413, "epoch": 3914} {"train_loss": -7.040817737579346, "global_step": 164414, "epoch": 3914} {"train_loss": -7.077062129974365, "global_step": 164415, "epoch": 3914} {"train_loss": -7.0943450927734375, "global_step": 164416, "epoch": 3914} {"train_loss": -6.932132244110107, "global_step": 164417, "epoch": 3914} {"train_loss": -7.106963157653809, "global_step": 164418, "epoch": 3914} {"train_loss": -6.998787879943848, "global_step": 164419, "epoch": 3914} {"train_loss": -7.078357696533203, "global_step": 164420, "epoch": 3914} {"train_loss": -7.001481056213379, "global_step": 164421, "epoch": 3914} {"train_loss": -6.956223487854004, "global_step": 164422, "epoch": 3914} {"train_loss": -7.033568859100342, "global_step": 164423, "epoch": 3914} {"train_loss": -6.920857906341553, "global_step": 164424, "epoch": 3914} {"train_loss": -6.9957051277160645, "global_step": 164425, "epoch": 3914} {"train_loss": -7.0626726150512695, "global_step": 164426, "epoch": 3914} {"train_loss": -7.0564985275268555, "global_step": 164427, "epoch": 3914} {"train_loss": -7.087097644805908, "global_step": 164428, "epoch": 3914} {"train_loss": -7.00560128121149, "global_step": 164429, "epoch": 3914, "val_loss": 79447.265625} {"train_loss": -7.084383010864258, "global_step": 164430, "epoch": 3915} {"train_loss": -6.896505355834961, "global_step": 164431, "epoch": 3915} {"train_loss": -7.091303825378418, "global_step": 164432, "epoch": 3915} {"train_loss": -7.012507915496826, "global_step": 164433, "epoch": 3915} {"train_loss": -7.049542427062988, "global_step": 164434, "epoch": 3915} {"train_loss": -7.054614543914795, "global_step": 164435, "epoch": 3915} {"train_loss": -7.13234806060791, "global_step": 164436, "epoch": 3915} {"train_loss": -7.001400947570801, "global_step": 164437, "epoch": 3915} {"train_loss": -7.089225769042969, "global_step": 164438, "epoch": 3915} {"train_loss": -6.989797592163086, "global_step": 164439, "epoch": 3915} {"train_loss": -7.029942035675049, "global_step": 164440, "epoch": 3915} {"train_loss": -6.954039573669434, "global_step": 164441, "epoch": 3915} {"train_loss": -7.057950019836426, "global_step": 164442, "epoch": 3915} {"train_loss": -6.9315385818481445, "global_step": 164443, "epoch": 3915} {"train_loss": -6.98793888092041, "global_step": 164444, "epoch": 3915} {"train_loss": -7.0303449630737305, "global_step": 164445, "epoch": 3915} {"train_loss": -6.996625900268555, "global_step": 164446, "epoch": 3915} {"train_loss": -6.960116386413574, "global_step": 164447, "epoch": 3915} {"train_loss": -7.048940658569336, "global_step": 164448, "epoch": 3915} {"train_loss": -7.099430084228516, "global_step": 164449, "epoch": 3915} {"train_loss": -7.078462600708008, "global_step": 164450, "epoch": 3915} {"train_loss": -7.052961349487305, "global_step": 164451, "epoch": 3915} {"train_loss": -7.136390686035156, "global_step": 164452, "epoch": 3915} {"train_loss": -7.076272964477539, "global_step": 164453, "epoch": 3915} {"train_loss": -6.998617172241211, "global_step": 164454, "epoch": 3915} {"train_loss": -6.976082801818848, "global_step": 164455, "epoch": 3915} {"train_loss": -6.960606575012207, "global_step": 164456, "epoch": 3915} {"train_loss": -7.093280792236328, "global_step": 164457, "epoch": 3915} {"train_loss": -7.008455276489258, "global_step": 164458, "epoch": 3915} {"train_loss": -7.101064682006836, "global_step": 164459, "epoch": 3915} {"train_loss": -7.031073093414307, "global_step": 164460, "epoch": 3915} {"train_loss": -7.046082019805908, "global_step": 164461, "epoch": 3915} {"train_loss": -7.074680328369141, "global_step": 164462, "epoch": 3915} {"train_loss": -6.934369087219238, "global_step": 164463, "epoch": 3915} {"train_loss": -6.998255729675293, "global_step": 164464, "epoch": 3915} {"train_loss": -6.9611592292785645, "global_step": 164465, "epoch": 3915} {"train_loss": -7.019779205322266, "global_step": 164466, "epoch": 3915} {"train_loss": -7.028217792510986, "global_step": 164467, "epoch": 3915} {"train_loss": -6.974423408508301, "global_step": 164468, "epoch": 3915} {"train_loss": -7.060986518859863, "global_step": 164469, "epoch": 3915} {"train_loss": -6.992722511291504, "global_step": 164470, "epoch": 3915} {"train_loss": -7.024574643089657, "global_step": 164471, "epoch": 3915, "val_loss": 79589.046875} {"train_loss": -7.001247406005859, "global_step": 164472, "epoch": 3916} {"train_loss": -7.031375408172607, "global_step": 164473, "epoch": 3916} {"train_loss": -6.912342548370361, "global_step": 164474, "epoch": 3916} {"train_loss": -7.003917217254639, "global_step": 164475, "epoch": 3916} {"train_loss": -7.080334186553955, "global_step": 164476, "epoch": 3916} {"train_loss": -6.986271858215332, "global_step": 164477, "epoch": 3916} {"train_loss": -6.882004737854004, "global_step": 164478, "epoch": 3916} {"train_loss": -6.87265157699585, "global_step": 164479, "epoch": 3916} {"train_loss": -6.98458194732666, "global_step": 164480, "epoch": 3916} {"train_loss": -6.8776655197143555, "global_step": 164481, "epoch": 3916} {"train_loss": -6.892607688903809, "global_step": 164482, "epoch": 3916} {"train_loss": -7.016730308532715, "global_step": 164483, "epoch": 3916} {"train_loss": -6.9207868576049805, "global_step": 164484, "epoch": 3916} {"train_loss": -7.029566764831543, "global_step": 164485, "epoch": 3916} {"train_loss": -6.9720048904418945, "global_step": 164486, "epoch": 3916} {"train_loss": -6.881384372711182, "global_step": 164487, "epoch": 3916} {"train_loss": -6.862098693847656, "global_step": 164488, "epoch": 3916} {"train_loss": -6.937475204467773, "global_step": 164489, "epoch": 3916} {"train_loss": -6.96558952331543, "global_step": 164490, "epoch": 3916} {"train_loss": -6.913644790649414, "global_step": 164491, "epoch": 3916} {"train_loss": -6.979047775268555, "global_step": 164492, "epoch": 3916} {"train_loss": -6.924601078033447, "global_step": 164493, "epoch": 3916} {"train_loss": -6.828500270843506, "global_step": 164494, "epoch": 3916} {"train_loss": -6.971608638763428, "global_step": 164495, "epoch": 3916} {"train_loss": -6.945408821105957, "global_step": 164496, "epoch": 3916} {"train_loss": -6.973769187927246, "global_step": 164497, "epoch": 3916} {"train_loss": -7.012037754058838, "global_step": 164498, "epoch": 3916} {"train_loss": -6.991639137268066, "global_step": 164499, "epoch": 3916} {"train_loss": -6.959855556488037, "global_step": 164500, "epoch": 3916} {"train_loss": -6.990030288696289, "global_step": 164501, "epoch": 3916} {"train_loss": -6.97457218170166, "global_step": 164502, "epoch": 3916} {"train_loss": -7.031987190246582, "global_step": 164503, "epoch": 3916} {"train_loss": -7.013769149780273, "global_step": 164504, "epoch": 3916} {"train_loss": -7.005046367645264, "global_step": 164505, "epoch": 3916} {"train_loss": -6.962002277374268, "global_step": 164506, "epoch": 3916} {"train_loss": -7.018620491027832, "global_step": 164507, "epoch": 3916} {"train_loss": -7.082550048828125, "global_step": 164508, "epoch": 3916} {"train_loss": -6.972217559814453, "global_step": 164509, "epoch": 3916} {"train_loss": -7.021383285522461, "global_step": 164510, "epoch": 3916} {"train_loss": -7.013134956359863, "global_step": 164511, "epoch": 3916} {"train_loss": -6.984001159667969, "global_step": 164512, "epoch": 3916} {"train_loss": -6.972306387765067, "global_step": 164513, "epoch": 3916, "val_loss": 79507.9609375} {"train_loss": -7.051285743713379, "global_step": 164514, "epoch": 3917} {"train_loss": -7.037754058837891, "global_step": 164515, "epoch": 3917} {"train_loss": -7.053114414215088, "global_step": 164516, "epoch": 3917} {"train_loss": -6.959634780883789, "global_step": 164517, "epoch": 3917} {"train_loss": -6.9815874099731445, "global_step": 164518, "epoch": 3917} {"train_loss": -7.074769973754883, "global_step": 164519, "epoch": 3917} {"train_loss": -7.068106174468994, "global_step": 164520, "epoch": 3917} {"train_loss": -7.060676574707031, "global_step": 164521, "epoch": 3917} {"train_loss": -7.105632305145264, "global_step": 164522, "epoch": 3917} {"train_loss": -7.024491310119629, "global_step": 164523, "epoch": 3917} {"train_loss": -7.030959606170654, "global_step": 164524, "epoch": 3917} {"train_loss": -7.152182579040527, "global_step": 164525, "epoch": 3917} {"train_loss": -7.0972795486450195, "global_step": 164526, "epoch": 3917} {"train_loss": -6.979239463806152, "global_step": 164527, "epoch": 3917} {"train_loss": -7.122583389282227, "global_step": 164528, "epoch": 3917} {"train_loss": -7.08989953994751, "global_step": 164529, "epoch": 3917} {"train_loss": -7.080442428588867, "global_step": 164530, "epoch": 3917} {"train_loss": -7.017512321472168, "global_step": 164531, "epoch": 3917} {"train_loss": -7.184364318847656, "global_step": 164532, "epoch": 3917} {"train_loss": -7.05516242980957, "global_step": 164533, "epoch": 3917} {"train_loss": -7.020261764526367, "global_step": 164534, "epoch": 3917} {"train_loss": -6.972963333129883, "global_step": 164535, "epoch": 3917} {"train_loss": -6.9091796875, "global_step": 164536, "epoch": 3917} {"train_loss": -6.97703218460083, "global_step": 164537, "epoch": 3917} {"train_loss": -7.089085102081299, "global_step": 164538, "epoch": 3917} {"train_loss": -7.044315814971924, "global_step": 164539, "epoch": 3917} {"train_loss": -6.93911075592041, "global_step": 164540, "epoch": 3917} {"train_loss": -6.926726341247559, "global_step": 164541, "epoch": 3917} {"train_loss": -7.046078205108643, "global_step": 164542, "epoch": 3917} {"train_loss": -6.938449859619141, "global_step": 164543, "epoch": 3917} {"train_loss": -6.971978187561035, "global_step": 164544, "epoch": 3917} {"train_loss": -6.967864036560059, "global_step": 164545, "epoch": 3917} {"train_loss": -6.993710517883301, "global_step": 164546, "epoch": 3917} {"train_loss": -6.950442314147949, "global_step": 164547, "epoch": 3917} {"train_loss": -6.820791244506836, "global_step": 164548, "epoch": 3917} {"train_loss": -6.9681196212768555, "global_step": 164549, "epoch": 3917} {"train_loss": -6.939117431640625, "global_step": 164550, "epoch": 3917} {"train_loss": -6.865461826324463, "global_step": 164551, "epoch": 3917} {"train_loss": -6.921123027801514, "global_step": 164552, "epoch": 3917} {"train_loss": -6.911802291870117, "global_step": 164553, "epoch": 3917} {"train_loss": -7.048172950744629, "global_step": 164554, "epoch": 3917} {"train_loss": -7.009097894032796, "global_step": 164555, "epoch": 3917, "val_loss": 79844.1015625} {"train_loss": -6.887531280517578, "global_step": 164556, "epoch": 3918} {"train_loss": -6.957210063934326, "global_step": 164557, "epoch": 3918} {"train_loss": -6.891764163970947, "global_step": 164558, "epoch": 3918} {"train_loss": -7.09332275390625, "global_step": 164559, "epoch": 3918} {"train_loss": -7.027109146118164, "global_step": 164560, "epoch": 3918} {"train_loss": -7.016806125640869, "global_step": 164561, "epoch": 3918} {"train_loss": -6.856704235076904, "global_step": 164562, "epoch": 3918} {"train_loss": -7.063847541809082, "global_step": 164563, "epoch": 3918} {"train_loss": -7.019699573516846, "global_step": 164564, "epoch": 3918} {"train_loss": -7.0229082107543945, "global_step": 164565, "epoch": 3918} {"train_loss": -7.04925537109375, "global_step": 164566, "epoch": 3918} {"train_loss": -7.107892990112305, "global_step": 164567, "epoch": 3918} {"train_loss": -7.092947483062744, "global_step": 164568, "epoch": 3918} {"train_loss": -7.077483654022217, "global_step": 164569, "epoch": 3918} {"train_loss": -7.056807518005371, "global_step": 164570, "epoch": 3918} {"train_loss": -7.070034980773926, "global_step": 164571, "epoch": 3918} {"train_loss": -7.050238132476807, "global_step": 164572, "epoch": 3918} {"train_loss": -7.067795753479004, "global_step": 164573, "epoch": 3918} {"train_loss": -6.894180774688721, "global_step": 164574, "epoch": 3918} {"train_loss": -6.931795597076416, "global_step": 164575, "epoch": 3918} {"train_loss": -7.008760452270508, "global_step": 164576, "epoch": 3918} {"train_loss": -7.034773826599121, "global_step": 164577, "epoch": 3918} {"train_loss": -6.9340314865112305, "global_step": 164578, "epoch": 3918} {"train_loss": -7.024013519287109, "global_step": 164579, "epoch": 3918} {"train_loss": -6.956724643707275, "global_step": 164580, "epoch": 3918} {"train_loss": -7.027083396911621, "global_step": 164581, "epoch": 3918} {"train_loss": -6.941709518432617, "global_step": 164582, "epoch": 3918} {"train_loss": -7.123992919921875, "global_step": 164583, "epoch": 3918} {"train_loss": -6.9981303215026855, "global_step": 164584, "epoch": 3918} {"train_loss": -7.028525352478027, "global_step": 164585, "epoch": 3918} {"train_loss": -6.9778032302856445, "global_step": 164586, "epoch": 3918} {"train_loss": -7.027753829956055, "global_step": 164587, "epoch": 3918} {"train_loss": -7.021910667419434, "global_step": 164588, "epoch": 3918} {"train_loss": -7.039638996124268, "global_step": 164589, "epoch": 3918} {"train_loss": -7.061956405639648, "global_step": 164590, "epoch": 3918} {"train_loss": -7.052393436431885, "global_step": 164591, "epoch": 3918} {"train_loss": -6.9977898597717285, "global_step": 164592, "epoch": 3918} {"train_loss": -7.028205871582031, "global_step": 164593, "epoch": 3918} {"train_loss": -7.0321760177612305, "global_step": 164594, "epoch": 3918} {"train_loss": -7.022170066833496, "global_step": 164595, "epoch": 3918} {"train_loss": -6.966489315032959, "global_step": 164596, "epoch": 3918} {"train_loss": -7.013788211913336, "global_step": 164597, "epoch": 3918, "val_loss": 79365.5390625} {"train_loss": -7.01145601272583, "global_step": 164598, "epoch": 3919} {"train_loss": -6.87255859375, "global_step": 164599, "epoch": 3919} {"train_loss": -7.112786293029785, "global_step": 164600, "epoch": 3919} {"train_loss": -6.844325542449951, "global_step": 164601, "epoch": 3919} {"train_loss": -6.971508502960205, "global_step": 164602, "epoch": 3919} {"train_loss": -7.073293685913086, "global_step": 164603, "epoch": 3919} {"train_loss": -6.8804473876953125, "global_step": 164604, "epoch": 3919} {"train_loss": -7.038431167602539, "global_step": 164605, "epoch": 3919} {"train_loss": -6.839054107666016, "global_step": 164606, "epoch": 3919} {"train_loss": -6.965644836425781, "global_step": 164607, "epoch": 3919} {"train_loss": -6.966242790222168, "global_step": 164608, "epoch": 3919} {"train_loss": -6.938045501708984, "global_step": 164609, "epoch": 3919} {"train_loss": -7.032909870147705, "global_step": 164610, "epoch": 3919} {"train_loss": -7.113508224487305, "global_step": 164611, "epoch": 3919} {"train_loss": -6.894186973571777, "global_step": 164612, "epoch": 3919} {"train_loss": -6.990668296813965, "global_step": 164613, "epoch": 3919} {"train_loss": -7.003791809082031, "global_step": 164614, "epoch": 3919} {"train_loss": -7.069583892822266, "global_step": 164615, "epoch": 3919} {"train_loss": -6.941204071044922, "global_step": 164616, "epoch": 3919} {"train_loss": -7.034979820251465, "global_step": 164617, "epoch": 3919} {"train_loss": -6.930482864379883, "global_step": 164618, "epoch": 3919} {"train_loss": -7.044150352478027, "global_step": 164619, "epoch": 3919} {"train_loss": -6.936147212982178, "global_step": 164620, "epoch": 3919} {"train_loss": -7.046628952026367, "global_step": 164621, "epoch": 3919} {"train_loss": -6.945315361022949, "global_step": 164622, "epoch": 3919} {"train_loss": -6.884554862976074, "global_step": 164623, "epoch": 3919} {"train_loss": -6.94925594329834, "global_step": 164624, "epoch": 3919} {"train_loss": -7.00760555267334, "global_step": 164625, "epoch": 3919} {"train_loss": -6.802330493927002, "global_step": 164626, "epoch": 3919} {"train_loss": -7.143259048461914, "global_step": 164627, "epoch": 3919} {"train_loss": -7.003971099853516, "global_step": 164628, "epoch": 3919} {"train_loss": -6.811695098876953, "global_step": 164629, "epoch": 3919} {"train_loss": -6.968605995178223, "global_step": 164630, "epoch": 3919} {"train_loss": -6.879122257232666, "global_step": 164631, "epoch": 3919} {"train_loss": -6.908927917480469, "global_step": 164632, "epoch": 3919} {"train_loss": -6.821880340576172, "global_step": 164633, "epoch": 3919} {"train_loss": -6.918943405151367, "global_step": 164634, "epoch": 3919} {"train_loss": -6.726748466491699, "global_step": 164635, "epoch": 3919} {"train_loss": -6.9059529304504395, "global_step": 164636, "epoch": 3919} {"train_loss": -6.931449890136719, "global_step": 164637, "epoch": 3919} {"train_loss": -6.836009979248047, "global_step": 164638, "epoch": 3919} {"train_loss": -6.948067824045817, "global_step": 164639, "epoch": 3919, "val_loss": 79506.2578125} {"train_loss": -6.968223571777344, "global_step": 164640, "epoch": 3920} {"train_loss": -6.891479969024658, "global_step": 164641, "epoch": 3920} {"train_loss": -6.955879211425781, "global_step": 164642, "epoch": 3920} {"train_loss": -6.834040641784668, "global_step": 164643, "epoch": 3920} {"train_loss": -6.925796031951904, "global_step": 164644, "epoch": 3920} {"train_loss": -6.816155433654785, "global_step": 164645, "epoch": 3920} {"train_loss": -6.987188339233398, "global_step": 164646, "epoch": 3920} {"train_loss": -6.920494556427002, "global_step": 164647, "epoch": 3920} {"train_loss": -7.041511058807373, "global_step": 164648, "epoch": 3920} {"train_loss": -6.8647685050964355, "global_step": 164649, "epoch": 3920} {"train_loss": -6.91357421875, "global_step": 164650, "epoch": 3920} {"train_loss": -7.090628623962402, "global_step": 164651, "epoch": 3920} {"train_loss": -7.053236961364746, "global_step": 164652, "epoch": 3920} {"train_loss": -6.938307762145996, "global_step": 164653, "epoch": 3920} {"train_loss": -6.989886283874512, "global_step": 164654, "epoch": 3920} {"train_loss": -7.036730766296387, "global_step": 164655, "epoch": 3920} {"train_loss": -7.058521747589111, "global_step": 164656, "epoch": 3920} {"train_loss": -7.040902614593506, "global_step": 164657, "epoch": 3920} {"train_loss": -7.07397985458374, "global_step": 164658, "epoch": 3920} {"train_loss": -6.836127281188965, "global_step": 164659, "epoch": 3920} {"train_loss": -7.142271518707275, "global_step": 164660, "epoch": 3920} {"train_loss": -7.018159866333008, "global_step": 164661, "epoch": 3920} {"train_loss": -6.882570266723633, "global_step": 164662, "epoch": 3920} {"train_loss": -6.983530521392822, "global_step": 164663, "epoch": 3920} {"train_loss": -7.038928508758545, "global_step": 164664, "epoch": 3920} {"train_loss": -7.055318355560303, "global_step": 164665, "epoch": 3920} {"train_loss": -7.140859127044678, "global_step": 164666, "epoch": 3920} {"train_loss": -7.149410724639893, "global_step": 164667, "epoch": 3920} {"train_loss": -7.168553829193115, "global_step": 164668, "epoch": 3920} {"train_loss": -6.974801063537598, "global_step": 164669, "epoch": 3920} {"train_loss": -7.004091262817383, "global_step": 164670, "epoch": 3920} {"train_loss": -6.971854209899902, "global_step": 164671, "epoch": 3920} {"train_loss": -6.957620620727539, "global_step": 164672, "epoch": 3920} {"train_loss": -6.841324806213379, "global_step": 164673, "epoch": 3920} {"train_loss": -7.0293869972229, "global_step": 164674, "epoch": 3920} {"train_loss": -6.936461925506592, "global_step": 164675, "epoch": 3920} {"train_loss": -7.00349235534668, "global_step": 164676, "epoch": 3920} {"train_loss": -6.92697811126709, "global_step": 164677, "epoch": 3920} {"train_loss": -7.053798675537109, "global_step": 164678, "epoch": 3920} {"train_loss": -6.983942031860352, "global_step": 164679, "epoch": 3920} {"train_loss": -6.913861274719238, "global_step": 164680, "epoch": 3920} {"train_loss": -6.984851519266765, "global_step": 164681, "epoch": 3920, "val_loss": 79395.875} {"train_loss": -7.043390274047852, "global_step": 164682, "epoch": 3921} {"train_loss": -7.003690242767334, "global_step": 164683, "epoch": 3921} {"train_loss": -7.055576324462891, "global_step": 164684, "epoch": 3921} {"train_loss": -6.939337730407715, "global_step": 164685, "epoch": 3921} {"train_loss": -7.07364559173584, "global_step": 164686, "epoch": 3921} {"train_loss": -7.061923980712891, "global_step": 164687, "epoch": 3921} {"train_loss": -7.012882232666016, "global_step": 164688, "epoch": 3921} {"train_loss": -7.029242515563965, "global_step": 164689, "epoch": 3921} {"train_loss": -7.089413642883301, "global_step": 164690, "epoch": 3921} {"train_loss": -7.043764114379883, "global_step": 164691, "epoch": 3921} {"train_loss": -6.99276065826416, "global_step": 164692, "epoch": 3921} {"train_loss": -6.917007923126221, "global_step": 164693, "epoch": 3921} {"train_loss": -7.003691673278809, "global_step": 164694, "epoch": 3921} {"train_loss": -6.998233795166016, "global_step": 164695, "epoch": 3921} {"train_loss": -7.0201416015625, "global_step": 164696, "epoch": 3921} {"train_loss": -6.985201358795166, "global_step": 164697, "epoch": 3921} {"train_loss": -7.108652114868164, "global_step": 164698, "epoch": 3921} {"train_loss": -7.064946174621582, "global_step": 164699, "epoch": 3921} {"train_loss": -6.9031572341918945, "global_step": 164700, "epoch": 3921} {"train_loss": -7.063458442687988, "global_step": 164701, "epoch": 3921} {"train_loss": -7.099015712738037, "global_step": 164702, "epoch": 3921} {"train_loss": -6.925568580627441, "global_step": 164703, "epoch": 3921} {"train_loss": -6.998952388763428, "global_step": 164704, "epoch": 3921} {"train_loss": -7.077678680419922, "global_step": 164705, "epoch": 3921} {"train_loss": -7.011102199554443, "global_step": 164706, "epoch": 3921} {"train_loss": -6.942324638366699, "global_step": 164707, "epoch": 3921} {"train_loss": -7.0397233963012695, "global_step": 164708, "epoch": 3921} {"train_loss": -7.059247016906738, "global_step": 164709, "epoch": 3921} {"train_loss": -7.017147064208984, "global_step": 164710, "epoch": 3921} {"train_loss": -7.030752658843994, "global_step": 164711, "epoch": 3921} {"train_loss": -6.964670181274414, "global_step": 164712, "epoch": 3921} {"train_loss": -6.995889663696289, "global_step": 164713, "epoch": 3921} {"train_loss": -7.038150310516357, "global_step": 164714, "epoch": 3921} {"train_loss": -6.994455814361572, "global_step": 164715, "epoch": 3921} {"train_loss": -6.993833541870117, "global_step": 164716, "epoch": 3921} {"train_loss": -7.120849609375, "global_step": 164717, "epoch": 3921} {"train_loss": -7.001802444458008, "global_step": 164718, "epoch": 3921} {"train_loss": -6.9774580001831055, "global_step": 164719, "epoch": 3921} {"train_loss": -6.968511581420898, "global_step": 164720, "epoch": 3921} {"train_loss": -6.949052810668945, "global_step": 164721, "epoch": 3921} {"train_loss": -7.063904285430908, "global_step": 164722, "epoch": 3921} {"train_loss": -7.015661568868728, "global_step": 164723, "epoch": 3921, "val_loss": 79728.3359375} {"train_loss": -7.178676605224609, "global_step": 164724, "epoch": 3922} {"train_loss": -6.8332977294921875, "global_step": 164725, "epoch": 3922} {"train_loss": -6.95784854888916, "global_step": 164726, "epoch": 3922} {"train_loss": -6.969757556915283, "global_step": 164727, "epoch": 3922} {"train_loss": -6.995467185974121, "global_step": 164728, "epoch": 3922} {"train_loss": -6.946638584136963, "global_step": 164729, "epoch": 3922} {"train_loss": -6.875080108642578, "global_step": 164730, "epoch": 3922} {"train_loss": -7.015588760375977, "global_step": 164731, "epoch": 3922} {"train_loss": -7.086023330688477, "global_step": 164732, "epoch": 3922} {"train_loss": -6.97086238861084, "global_step": 164733, "epoch": 3922} {"train_loss": -6.927842617034912, "global_step": 164734, "epoch": 3922} {"train_loss": -7.124604225158691, "global_step": 164735, "epoch": 3922} {"train_loss": -6.982254981994629, "global_step": 164736, "epoch": 3922} {"train_loss": -6.905758857727051, "global_step": 164737, "epoch": 3922} {"train_loss": -7.036544322967529, "global_step": 164738, "epoch": 3922} {"train_loss": -6.897345542907715, "global_step": 164739, "epoch": 3922} {"train_loss": -7.196615219116211, "global_step": 164740, "epoch": 3922} {"train_loss": -6.965332984924316, "global_step": 164741, "epoch": 3922} {"train_loss": -7.066013336181641, "global_step": 164742, "epoch": 3922} {"train_loss": -6.950273513793945, "global_step": 164743, "epoch": 3922} {"train_loss": -6.857276439666748, "global_step": 164744, "epoch": 3922} {"train_loss": -7.009876251220703, "global_step": 164745, "epoch": 3922} {"train_loss": -7.0015411376953125, "global_step": 164746, "epoch": 3922} {"train_loss": -6.949798583984375, "global_step": 164747, "epoch": 3922} {"train_loss": -6.971606731414795, "global_step": 164748, "epoch": 3922} {"train_loss": -7.010161399841309, "global_step": 164749, "epoch": 3922} {"train_loss": -6.935243129730225, "global_step": 164750, "epoch": 3922} {"train_loss": -7.004278182983398, "global_step": 164751, "epoch": 3922} {"train_loss": -6.992378234863281, "global_step": 164752, "epoch": 3922} {"train_loss": -6.901269912719727, "global_step": 164753, "epoch": 3922} {"train_loss": -7.046794414520264, "global_step": 164754, "epoch": 3922} {"train_loss": -6.993525505065918, "global_step": 164755, "epoch": 3922} {"train_loss": -6.901003360748291, "global_step": 164756, "epoch": 3922} {"train_loss": -7.078885555267334, "global_step": 164757, "epoch": 3922} {"train_loss": -7.02204704284668, "global_step": 164758, "epoch": 3922} {"train_loss": -6.985881328582764, "global_step": 164759, "epoch": 3922} {"train_loss": -7.015805244445801, "global_step": 164760, "epoch": 3922} {"train_loss": -7.021193504333496, "global_step": 164761, "epoch": 3922} {"train_loss": -7.040374755859375, "global_step": 164762, "epoch": 3922} {"train_loss": -7.029890060424805, "global_step": 164763, "epoch": 3922} {"train_loss": -7.044425964355469, "global_step": 164764, "epoch": 3922} {"train_loss": -6.992941549846104, "global_step": 164765, "epoch": 3922, "val_loss": 79721.640625} {"train_loss": -7.004047870635986, "global_step": 164766, "epoch": 3923} {"train_loss": -7.087512969970703, "global_step": 164767, "epoch": 3923} {"train_loss": -7.108876705169678, "global_step": 164768, "epoch": 3923} {"train_loss": -6.952106952667236, "global_step": 164769, "epoch": 3923} {"train_loss": -6.969733238220215, "global_step": 164770, "epoch": 3923} {"train_loss": -7.040112495422363, "global_step": 164771, "epoch": 3923} {"train_loss": -6.990861892700195, "global_step": 164772, "epoch": 3923} {"train_loss": -6.9398393630981445, "global_step": 164773, "epoch": 3923} {"train_loss": -6.940669059753418, "global_step": 164774, "epoch": 3923} {"train_loss": -6.9724040031433105, "global_step": 164775, "epoch": 3923} {"train_loss": -6.940415382385254, "global_step": 164776, "epoch": 3923} {"train_loss": -7.045598030090332, "global_step": 164777, "epoch": 3923} {"train_loss": -7.024474620819092, "global_step": 164778, "epoch": 3923} {"train_loss": -6.946447372436523, "global_step": 164779, "epoch": 3923} {"train_loss": -6.943532943725586, "global_step": 164780, "epoch": 3923} {"train_loss": -6.991655349731445, "global_step": 164781, "epoch": 3923} {"train_loss": -7.007105827331543, "global_step": 164782, "epoch": 3923} {"train_loss": -6.8785719871521, "global_step": 164783, "epoch": 3923} {"train_loss": -6.9291181564331055, "global_step": 164784, "epoch": 3923} {"train_loss": -7.0421857833862305, "global_step": 164785, "epoch": 3923} {"train_loss": -7.050662040710449, "global_step": 164786, "epoch": 3923} {"train_loss": -7.027010917663574, "global_step": 164787, "epoch": 3923} {"train_loss": -7.084632396697998, "global_step": 164788, "epoch": 3923} {"train_loss": -7.003304481506348, "global_step": 164789, "epoch": 3923} {"train_loss": -7.0473222732543945, "global_step": 164790, "epoch": 3923} {"train_loss": -6.991621017456055, "global_step": 164791, "epoch": 3923} {"train_loss": -7.093639373779297, "global_step": 164792, "epoch": 3923} {"train_loss": -6.9807939529418945, "global_step": 164793, "epoch": 3923} {"train_loss": -7.098282814025879, "global_step": 164794, "epoch": 3923} {"train_loss": -6.922127723693848, "global_step": 164795, "epoch": 3923} {"train_loss": -7.051905632019043, "global_step": 164796, "epoch": 3923} {"train_loss": -7.027364730834961, "global_step": 164797, "epoch": 3923} {"train_loss": -6.9817705154418945, "global_step": 164798, "epoch": 3923} {"train_loss": -7.005456924438477, "global_step": 164799, "epoch": 3923} {"train_loss": -7.097022533416748, "global_step": 164800, "epoch": 3923} {"train_loss": -6.983463287353516, "global_step": 164801, "epoch": 3923} {"train_loss": -7.199520111083984, "global_step": 164802, "epoch": 3923} {"train_loss": -6.938940048217773, "global_step": 164803, "epoch": 3923} {"train_loss": -7.059330940246582, "global_step": 164804, "epoch": 3923} {"train_loss": -7.059673309326172, "global_step": 164805, "epoch": 3923} {"train_loss": -7.019894599914551, "global_step": 164806, "epoch": 3923} {"train_loss": -7.011458692096529, "global_step": 164807, "epoch": 3923, "val_loss": 79795.8984375} {"train_loss": -7.048266887664795, "global_step": 164808, "epoch": 3924} {"train_loss": -7.1071906089782715, "global_step": 164809, "epoch": 3924} {"train_loss": -7.078733444213867, "global_step": 164810, "epoch": 3924} {"train_loss": -7.138993263244629, "global_step": 164811, "epoch": 3924} {"train_loss": -6.9723429679870605, "global_step": 164812, "epoch": 3924} {"train_loss": -7.064459800720215, "global_step": 164813, "epoch": 3924} {"train_loss": -7.1084136962890625, "global_step": 164814, "epoch": 3924} {"train_loss": -7.108506202697754, "global_step": 164815, "epoch": 3924} {"train_loss": -7.077399253845215, "global_step": 164816, "epoch": 3924} {"train_loss": -7.0220136642456055, "global_step": 164817, "epoch": 3924} {"train_loss": -6.898599147796631, "global_step": 164818, "epoch": 3924} {"train_loss": -6.965019226074219, "global_step": 164819, "epoch": 3924} {"train_loss": -6.93778133392334, "global_step": 164820, "epoch": 3924} {"train_loss": -6.9743523597717285, "global_step": 164821, "epoch": 3924} {"train_loss": -6.921759605407715, "global_step": 164822, "epoch": 3924} {"train_loss": -7.033603668212891, "global_step": 164823, "epoch": 3924} {"train_loss": -6.946504592895508, "global_step": 164824, "epoch": 3924} {"train_loss": -7.003147602081299, "global_step": 164825, "epoch": 3924} {"train_loss": -6.936975479125977, "global_step": 164826, "epoch": 3924} {"train_loss": -7.037892818450928, "global_step": 164827, "epoch": 3924} {"train_loss": -6.869483947753906, "global_step": 164828, "epoch": 3924} {"train_loss": -7.112950325012207, "global_step": 164829, "epoch": 3924} {"train_loss": -6.9849443435668945, "global_step": 164830, "epoch": 3924} {"train_loss": -7.035135269165039, "global_step": 164831, "epoch": 3924} {"train_loss": -6.999454498291016, "global_step": 164832, "epoch": 3924} {"train_loss": -7.088226318359375, "global_step": 164833, "epoch": 3924} {"train_loss": -6.932506561279297, "global_step": 164834, "epoch": 3924} {"train_loss": -7.121179580688477, "global_step": 164835, "epoch": 3924} {"train_loss": -6.916726112365723, "global_step": 164836, "epoch": 3924} {"train_loss": -6.946401596069336, "global_step": 164837, "epoch": 3924} {"train_loss": -6.949729919433594, "global_step": 164838, "epoch": 3924} {"train_loss": -7.056153774261475, "global_step": 164839, "epoch": 3924} {"train_loss": -7.052065849304199, "global_step": 164840, "epoch": 3924} {"train_loss": -7.029819011688232, "global_step": 164841, "epoch": 3924} {"train_loss": -7.043285369873047, "global_step": 164842, "epoch": 3924} {"train_loss": -6.974616050720215, "global_step": 164843, "epoch": 3924} {"train_loss": -7.024322032928467, "global_step": 164844, "epoch": 3924} {"train_loss": -7.168452739715576, "global_step": 164845, "epoch": 3924} {"train_loss": -7.030385494232178, "global_step": 164846, "epoch": 3924} {"train_loss": -7.144137382507324, "global_step": 164847, "epoch": 3924} {"train_loss": -7.028265953063965, "global_step": 164848, "epoch": 3924} {"train_loss": -7.019237109592983, "global_step": 164849, "epoch": 3924, "val_loss": 79510.453125} {"train_loss": -7.009009838104248, "global_step": 164850, "epoch": 3925} {"train_loss": -7.079960823059082, "global_step": 164851, "epoch": 3925} {"train_loss": -7.013502597808838, "global_step": 164852, "epoch": 3925} {"train_loss": -7.056539058685303, "global_step": 164853, "epoch": 3925} {"train_loss": -6.980591773986816, "global_step": 164854, "epoch": 3925} {"train_loss": -7.193081378936768, "global_step": 164855, "epoch": 3925} {"train_loss": -6.974128723144531, "global_step": 164856, "epoch": 3925} {"train_loss": -7.016328811645508, "global_step": 164857, "epoch": 3925} {"train_loss": -6.869625091552734, "global_step": 164858, "epoch": 3925} {"train_loss": -7.086276054382324, "global_step": 164859, "epoch": 3925} {"train_loss": -6.858428955078125, "global_step": 164860, "epoch": 3925} {"train_loss": -7.042608261108398, "global_step": 164861, "epoch": 3925} {"train_loss": -6.940478324890137, "global_step": 164862, "epoch": 3925} {"train_loss": -7.088997840881348, "global_step": 164863, "epoch": 3925} {"train_loss": -6.98856782913208, "global_step": 164864, "epoch": 3925} {"train_loss": -7.002442359924316, "global_step": 164865, "epoch": 3925} {"train_loss": -6.997995376586914, "global_step": 164866, "epoch": 3925} {"train_loss": -6.918516159057617, "global_step": 164867, "epoch": 3925} {"train_loss": -6.962452411651611, "global_step": 164868, "epoch": 3925} {"train_loss": -7.002718448638916, "global_step": 164869, "epoch": 3925} {"train_loss": -7.064789772033691, "global_step": 164870, "epoch": 3925} {"train_loss": -7.006896018981934, "global_step": 164871, "epoch": 3925} {"train_loss": -6.890387535095215, "global_step": 164872, "epoch": 3925} {"train_loss": -6.995659828186035, "global_step": 164873, "epoch": 3925} {"train_loss": -7.054820537567139, "global_step": 164874, "epoch": 3925} {"train_loss": -6.9848313331604, "global_step": 164875, "epoch": 3925} {"train_loss": -6.984969139099121, "global_step": 164876, "epoch": 3925} {"train_loss": -7.032834529876709, "global_step": 164877, "epoch": 3925} {"train_loss": -6.964504241943359, "global_step": 164878, "epoch": 3925} {"train_loss": -6.950562477111816, "global_step": 164879, "epoch": 3925} {"train_loss": -6.801945686340332, "global_step": 164880, "epoch": 3925} {"train_loss": -7.019018173217773, "global_step": 164881, "epoch": 3925} {"train_loss": -6.972294807434082, "global_step": 164882, "epoch": 3925} {"train_loss": -6.86195182800293, "global_step": 164883, "epoch": 3925} {"train_loss": -6.922059059143066, "global_step": 164884, "epoch": 3925} {"train_loss": -6.864947319030762, "global_step": 164885, "epoch": 3925} {"train_loss": -6.847141742706299, "global_step": 164886, "epoch": 3925} {"train_loss": -6.883133888244629, "global_step": 164887, "epoch": 3925} {"train_loss": -6.927986145019531, "global_step": 164888, "epoch": 3925} {"train_loss": -6.920570373535156, "global_step": 164889, "epoch": 3925} {"train_loss": -6.992361068725586, "global_step": 164890, "epoch": 3925} {"train_loss": -6.972183931441534, "global_step": 164891, "epoch": 3925, "val_loss": 79555.1875} {"train_loss": -7.0313944816589355, "global_step": 164892, "epoch": 3926} {"train_loss": -6.952447414398193, "global_step": 164893, "epoch": 3926} {"train_loss": -7.03956413269043, "global_step": 164894, "epoch": 3926} {"train_loss": -6.976493835449219, "global_step": 164895, "epoch": 3926} {"train_loss": -6.940610885620117, "global_step": 164896, "epoch": 3926} {"train_loss": -7.02855110168457, "global_step": 164897, "epoch": 3926} {"train_loss": -6.825991630554199, "global_step": 164898, "epoch": 3926} {"train_loss": -6.939489841461182, "global_step": 164899, "epoch": 3926} {"train_loss": -7.039172172546387, "global_step": 164900, "epoch": 3926} {"train_loss": -6.974647521972656, "global_step": 164901, "epoch": 3926} {"train_loss": -7.072502136230469, "global_step": 164902, "epoch": 3926} {"train_loss": -6.949282646179199, "global_step": 164903, "epoch": 3926} {"train_loss": -6.9123945236206055, "global_step": 164904, "epoch": 3926} {"train_loss": -6.983705520629883, "global_step": 164905, "epoch": 3926} {"train_loss": -6.926021099090576, "global_step": 164906, "epoch": 3926} {"train_loss": -7.014500141143799, "global_step": 164907, "epoch": 3926} {"train_loss": -7.083859443664551, "global_step": 164908, "epoch": 3926} {"train_loss": -7.021080017089844, "global_step": 164909, "epoch": 3926} {"train_loss": -6.930094242095947, "global_step": 164910, "epoch": 3926} {"train_loss": -6.951693534851074, "global_step": 164911, "epoch": 3926} {"train_loss": -7.087708473205566, "global_step": 164912, "epoch": 3926} {"train_loss": -6.950020790100098, "global_step": 164913, "epoch": 3926} {"train_loss": -7.063699722290039, "global_step": 164914, "epoch": 3926} {"train_loss": -6.960984230041504, "global_step": 164915, "epoch": 3926} {"train_loss": -7.038978576660156, "global_step": 164916, "epoch": 3926} {"train_loss": -7.12394905090332, "global_step": 164917, "epoch": 3926} {"train_loss": -7.044406890869141, "global_step": 164918, "epoch": 3926} {"train_loss": -7.0210442543029785, "global_step": 164919, "epoch": 3926} {"train_loss": -6.986686706542969, "global_step": 164920, "epoch": 3926} {"train_loss": -6.938449859619141, "global_step": 164921, "epoch": 3926} {"train_loss": -7.098748207092285, "global_step": 164922, "epoch": 3926} {"train_loss": -7.01513671875, "global_step": 164923, "epoch": 3926} {"train_loss": -6.974640846252441, "global_step": 164924, "epoch": 3926} {"train_loss": -6.988502502441406, "global_step": 164925, "epoch": 3926} {"train_loss": -7.063582420349121, "global_step": 164926, "epoch": 3926} {"train_loss": -7.02419376373291, "global_step": 164927, "epoch": 3926} {"train_loss": -6.872807502746582, "global_step": 164928, "epoch": 3926} {"train_loss": -7.076282501220703, "global_step": 164929, "epoch": 3926} {"train_loss": -6.951532363891602, "global_step": 164930, "epoch": 3926} {"train_loss": -7.045496940612793, "global_step": 164931, "epoch": 3926} {"train_loss": -7.07177734375, "global_step": 164932, "epoch": 3926} {"train_loss": -6.998676652000064, "global_step": 164933, "epoch": 3926, "val_loss": 79684.421875} {"train_loss": -7.036025047302246, "global_step": 164934, "epoch": 3927} {"train_loss": -7.0471086502075195, "global_step": 164935, "epoch": 3927} {"train_loss": -6.897205352783203, "global_step": 164936, "epoch": 3927} {"train_loss": -6.982930660247803, "global_step": 164937, "epoch": 3927} {"train_loss": -7.05064582824707, "global_step": 164938, "epoch": 3927} {"train_loss": -6.925787925720215, "global_step": 164939, "epoch": 3927} {"train_loss": -7.004664421081543, "global_step": 164940, "epoch": 3927} {"train_loss": -7.0165605545043945, "global_step": 164941, "epoch": 3927} {"train_loss": -6.971940517425537, "global_step": 164942, "epoch": 3927} {"train_loss": -6.986295700073242, "global_step": 164943, "epoch": 3927} {"train_loss": -7.03463077545166, "global_step": 164944, "epoch": 3927} {"train_loss": -7.045505523681641, "global_step": 164945, "epoch": 3927} {"train_loss": -7.02443790435791, "global_step": 164946, "epoch": 3927} {"train_loss": -7.0701904296875, "global_step": 164947, "epoch": 3927} {"train_loss": -6.970790863037109, "global_step": 164948, "epoch": 3927} {"train_loss": -6.855562210083008, "global_step": 164949, "epoch": 3927} {"train_loss": -7.025564670562744, "global_step": 164950, "epoch": 3927} {"train_loss": -6.9267706871032715, "global_step": 164951, "epoch": 3927} {"train_loss": -6.828922271728516, "global_step": 164952, "epoch": 3927} {"train_loss": -7.039773941040039, "global_step": 164953, "epoch": 3927} {"train_loss": -6.874372482299805, "global_step": 164954, "epoch": 3927} {"train_loss": -6.8398942947387695, "global_step": 164955, "epoch": 3927} {"train_loss": -6.941043853759766, "global_step": 164956, "epoch": 3927} {"train_loss": -6.920241355895996, "global_step": 164957, "epoch": 3927} {"train_loss": -6.941641330718994, "global_step": 164958, "epoch": 3927} {"train_loss": -6.932256698608398, "global_step": 164959, "epoch": 3927} {"train_loss": -6.881674766540527, "global_step": 164960, "epoch": 3927} {"train_loss": -6.895310878753662, "global_step": 164961, "epoch": 3927} {"train_loss": -6.936700344085693, "global_step": 164962, "epoch": 3927} {"train_loss": -6.956732749938965, "global_step": 164963, "epoch": 3927} {"train_loss": -7.0263261795043945, "global_step": 164964, "epoch": 3927} {"train_loss": -7.082405090332031, "global_step": 164965, "epoch": 3927} {"train_loss": -7.060935020446777, "global_step": 164966, "epoch": 3927} {"train_loss": -6.9180097579956055, "global_step": 164967, "epoch": 3927} {"train_loss": -7.135384559631348, "global_step": 164968, "epoch": 3927} {"train_loss": -7.002601623535156, "global_step": 164969, "epoch": 3927} {"train_loss": -6.959963798522949, "global_step": 164970, "epoch": 3927} {"train_loss": -6.947068214416504, "global_step": 164971, "epoch": 3927} {"train_loss": -7.096624374389648, "global_step": 164972, "epoch": 3927} {"train_loss": -7.060513973236084, "global_step": 164973, "epoch": 3927} {"train_loss": -7.0799713134765625, "global_step": 164974, "epoch": 3927} {"train_loss": -6.980290458315895, "global_step": 164975, "epoch": 3927, "val_loss": 79618.1953125} {"train_loss": -7.1080522537231445, "global_step": 164976, "epoch": 3928} {"train_loss": -7.064211368560791, "global_step": 164977, "epoch": 3928} {"train_loss": -7.035188674926758, "global_step": 164978, "epoch": 3928} {"train_loss": -6.9913811683654785, "global_step": 164979, "epoch": 3928} {"train_loss": -7.101727485656738, "global_step": 164980, "epoch": 3928} {"train_loss": -7.056922912597656, "global_step": 164981, "epoch": 3928} {"train_loss": -7.059088706970215, "global_step": 164982, "epoch": 3928} {"train_loss": -6.959733963012695, "global_step": 164983, "epoch": 3928} {"train_loss": -7.035213470458984, "global_step": 164984, "epoch": 3928} {"train_loss": -7.061641693115234, "global_step": 164985, "epoch": 3928} {"train_loss": -7.025848388671875, "global_step": 164986, "epoch": 3928} {"train_loss": -6.882763862609863, "global_step": 164987, "epoch": 3928} {"train_loss": -6.878466606140137, "global_step": 164988, "epoch": 3928} {"train_loss": -7.012284755706787, "global_step": 164989, "epoch": 3928} {"train_loss": -7.043715953826904, "global_step": 164990, "epoch": 3928} {"train_loss": -6.922444820404053, "global_step": 164991, "epoch": 3928} {"train_loss": -6.99383544921875, "global_step": 164992, "epoch": 3928} {"train_loss": -6.9112372398376465, "global_step": 164993, "epoch": 3928} {"train_loss": -6.942267417907715, "global_step": 164994, "epoch": 3928} {"train_loss": -6.965221881866455, "global_step": 164995, "epoch": 3928} {"train_loss": -6.797675609588623, "global_step": 164996, "epoch": 3928} {"train_loss": -6.906937599182129, "global_step": 164997, "epoch": 3928} {"train_loss": -6.899139404296875, "global_step": 164998, "epoch": 3928} {"train_loss": -6.853307723999023, "global_step": 164999, "epoch": 3928} {"train_loss": -7.016533851623535, "global_step": 165000, "epoch": 3928} {"train_loss": -6.8458251953125, "global_step": 165001, "epoch": 3928} {"train_loss": -6.938994407653809, "global_step": 165002, "epoch": 3928} {"train_loss": -6.758172035217285, "global_step": 165003, "epoch": 3928} {"train_loss": -7.032676696777344, "global_step": 165004, "epoch": 3928} {"train_loss": -6.907112121582031, "global_step": 165005, "epoch": 3928} {"train_loss": -6.912986755371094, "global_step": 165006, "epoch": 3928} {"train_loss": -6.922878265380859, "global_step": 165007, "epoch": 3928} {"train_loss": -6.79611873626709, "global_step": 165008, "epoch": 3928} {"train_loss": -6.965465068817139, "global_step": 165009, "epoch": 3928} {"train_loss": -7.039447784423828, "global_step": 165010, "epoch": 3928} {"train_loss": -6.92579984664917, "global_step": 165011, "epoch": 3928} {"train_loss": -6.9874725341796875, "global_step": 165012, "epoch": 3928} {"train_loss": -6.970268249511719, "global_step": 165013, "epoch": 3928} {"train_loss": -6.922719955444336, "global_step": 165014, "epoch": 3928} {"train_loss": -7.005097389221191, "global_step": 165015, "epoch": 3928} {"train_loss": -6.990600109100342, "global_step": 165016, "epoch": 3928} {"train_loss": -6.960246063414074, "global_step": 165017, "epoch": 3928, "val_loss": 79511.984375} {"train_loss": -6.991380214691162, "global_step": 165018, "epoch": 3929} {"train_loss": -6.955085277557373, "global_step": 165019, "epoch": 3929} {"train_loss": -7.019789695739746, "global_step": 165020, "epoch": 3929} {"train_loss": -6.915408134460449, "global_step": 165021, "epoch": 3929} {"train_loss": -6.884939193725586, "global_step": 165022, "epoch": 3929} {"train_loss": -6.917544841766357, "global_step": 165023, "epoch": 3929} {"train_loss": -6.943799018859863, "global_step": 165024, "epoch": 3929} {"train_loss": -7.027123928070068, "global_step": 165025, "epoch": 3929} {"train_loss": -7.00394344329834, "global_step": 165026, "epoch": 3929} {"train_loss": -6.910175800323486, "global_step": 165027, "epoch": 3929} {"train_loss": -7.013101100921631, "global_step": 165028, "epoch": 3929} {"train_loss": -6.954910755157471, "global_step": 165029, "epoch": 3929} {"train_loss": -7.02099084854126, "global_step": 165030, "epoch": 3929} {"train_loss": -7.092507839202881, "global_step": 165031, "epoch": 3929} {"train_loss": -7.006997108459473, "global_step": 165032, "epoch": 3929} {"train_loss": -6.954920768737793, "global_step": 165033, "epoch": 3929} {"train_loss": -7.023522853851318, "global_step": 165034, "epoch": 3929} {"train_loss": -6.907223701477051, "global_step": 165035, "epoch": 3929} {"train_loss": -7.005678176879883, "global_step": 165036, "epoch": 3929} {"train_loss": -7.077925682067871, "global_step": 165037, "epoch": 3929} {"train_loss": -7.051337718963623, "global_step": 165038, "epoch": 3929} {"train_loss": -7.001657485961914, "global_step": 165039, "epoch": 3929} {"train_loss": -7.015765190124512, "global_step": 165040, "epoch": 3929} {"train_loss": -7.026918888092041, "global_step": 165041, "epoch": 3929} {"train_loss": -7.1009135246276855, "global_step": 165042, "epoch": 3929} {"train_loss": -6.968293190002441, "global_step": 165043, "epoch": 3929} {"train_loss": -7.060401439666748, "global_step": 165044, "epoch": 3929} {"train_loss": -7.006185531616211, "global_step": 165045, "epoch": 3929} {"train_loss": -7.101062774658203, "global_step": 165046, "epoch": 3929} {"train_loss": -7.021772384643555, "global_step": 165047, "epoch": 3929} {"train_loss": -6.950664043426514, "global_step": 165048, "epoch": 3929} {"train_loss": -6.867515563964844, "global_step": 165049, "epoch": 3929} {"train_loss": -6.951046943664551, "global_step": 165050, "epoch": 3929} {"train_loss": -7.039430141448975, "global_step": 165051, "epoch": 3929} {"train_loss": -6.710956573486328, "global_step": 165052, "epoch": 3929} {"train_loss": -6.731196403503418, "global_step": 165053, "epoch": 3929} {"train_loss": -6.825203895568848, "global_step": 165054, "epoch": 3929} {"train_loss": -6.931365489959717, "global_step": 165055, "epoch": 3929} {"train_loss": -6.867345809936523, "global_step": 165056, "epoch": 3929} {"train_loss": -6.971339225769043, "global_step": 165057, "epoch": 3929} {"train_loss": -6.8860626220703125, "global_step": 165058, "epoch": 3929} {"train_loss": -6.967010168802171, "global_step": 165059, "epoch": 3929, "val_loss": 79312.953125} {"train_loss": -7.073095798492432, "global_step": 165060, "epoch": 3930} {"train_loss": -6.984851837158203, "global_step": 165061, "epoch": 3930} {"train_loss": -6.947277069091797, "global_step": 165062, "epoch": 3930} {"train_loss": -6.981882095336914, "global_step": 165063, "epoch": 3930} {"train_loss": -6.884318828582764, "global_step": 165064, "epoch": 3930} {"train_loss": -7.001872539520264, "global_step": 165065, "epoch": 3930} {"train_loss": -7.049460411071777, "global_step": 165066, "epoch": 3930} {"train_loss": -6.855461120605469, "global_step": 165067, "epoch": 3930} {"train_loss": -6.860321521759033, "global_step": 165068, "epoch": 3930} {"train_loss": -6.844147205352783, "global_step": 165069, "epoch": 3930} {"train_loss": -7.050266742706299, "global_step": 165070, "epoch": 3930} {"train_loss": -6.973997116088867, "global_step": 165071, "epoch": 3930} {"train_loss": -6.981607437133789, "global_step": 165072, "epoch": 3930} {"train_loss": -7.00630521774292, "global_step": 165073, "epoch": 3930} {"train_loss": -6.939619064331055, "global_step": 165074, "epoch": 3930} {"train_loss": -6.927812099456787, "global_step": 165075, "epoch": 3930} {"train_loss": -7.03824520111084, "global_step": 165076, "epoch": 3930} {"train_loss": -7.124207019805908, "global_step": 165077, "epoch": 3930} {"train_loss": -7.048473358154297, "global_step": 165078, "epoch": 3930} {"train_loss": -7.123325347900391, "global_step": 165079, "epoch": 3930} {"train_loss": -7.002674102783203, "global_step": 165080, "epoch": 3930} {"train_loss": -7.0077738761901855, "global_step": 165081, "epoch": 3930} {"train_loss": -7.002774715423584, "global_step": 165082, "epoch": 3930} {"train_loss": -7.028407096862793, "global_step": 165083, "epoch": 3930} {"train_loss": -7.01719331741333, "global_step": 165084, "epoch": 3930} {"train_loss": -6.851740837097168, "global_step": 165085, "epoch": 3930} {"train_loss": -6.880457878112793, "global_step": 165086, "epoch": 3930} {"train_loss": -7.1408233642578125, "global_step": 165087, "epoch": 3930} {"train_loss": -7.0588531494140625, "global_step": 165088, "epoch": 3930} {"train_loss": -6.97711706161499, "global_step": 165089, "epoch": 3930} {"train_loss": -6.9668731689453125, "global_step": 165090, "epoch": 3930} {"train_loss": -6.968747138977051, "global_step": 165091, "epoch": 3930} {"train_loss": -6.820533752441406, "global_step": 165092, "epoch": 3930} {"train_loss": -7.065865993499756, "global_step": 165093, "epoch": 3930} {"train_loss": -7.031704902648926, "global_step": 165094, "epoch": 3930} {"train_loss": -7.021255016326904, "global_step": 165095, "epoch": 3930} {"train_loss": -6.9582200050354, "global_step": 165096, "epoch": 3930} {"train_loss": -7.083735466003418, "global_step": 165097, "epoch": 3930} {"train_loss": -7.029271125793457, "global_step": 165098, "epoch": 3930} {"train_loss": -6.893166542053223, "global_step": 165099, "epoch": 3930} {"train_loss": -6.952970504760742, "global_step": 165100, "epoch": 3930} {"train_loss": -6.986378499439785, "global_step": 165101, "epoch": 3930, "val_loss": 79520.1953125} {"train_loss": -6.923440933227539, "global_step": 165102, "epoch": 3931} {"train_loss": -6.963997840881348, "global_step": 165103, "epoch": 3931} {"train_loss": -6.857594013214111, "global_step": 165104, "epoch": 3931} {"train_loss": -7.062409400939941, "global_step": 165105, "epoch": 3931} {"train_loss": -6.935428142547607, "global_step": 165106, "epoch": 3931} {"train_loss": -6.998061180114746, "global_step": 165107, "epoch": 3931} {"train_loss": -6.93533992767334, "global_step": 165108, "epoch": 3931} {"train_loss": -6.925484657287598, "global_step": 165109, "epoch": 3931} {"train_loss": -6.7850751876831055, "global_step": 165110, "epoch": 3931} {"train_loss": -6.781233310699463, "global_step": 165111, "epoch": 3931} {"train_loss": -6.83304500579834, "global_step": 165112, "epoch": 3931} {"train_loss": -7.070068359375, "global_step": 165113, "epoch": 3931} {"train_loss": -6.949772834777832, "global_step": 165114, "epoch": 3931} {"train_loss": -6.841311931610107, "global_step": 165115, "epoch": 3931} {"train_loss": -6.881746292114258, "global_step": 165116, "epoch": 3931} {"train_loss": -6.875388145446777, "global_step": 165117, "epoch": 3931} {"train_loss": -6.891404151916504, "global_step": 165118, "epoch": 3931} {"train_loss": -7.044171333312988, "global_step": 165119, "epoch": 3931} {"train_loss": -6.931534767150879, "global_step": 165120, "epoch": 3931} {"train_loss": -6.967729568481445, "global_step": 165121, "epoch": 3931} {"train_loss": -7.036926746368408, "global_step": 165122, "epoch": 3931} {"train_loss": -6.868429660797119, "global_step": 165123, "epoch": 3931} {"train_loss": -6.882394790649414, "global_step": 165124, "epoch": 3931} {"train_loss": -6.895380973815918, "global_step": 165125, "epoch": 3931} {"train_loss": -6.907430648803711, "global_step": 165126, "epoch": 3931} {"train_loss": -6.9186553955078125, "global_step": 165127, "epoch": 3931} {"train_loss": -6.744454383850098, "global_step": 165128, "epoch": 3931} {"train_loss": -7.00955867767334, "global_step": 165129, "epoch": 3931} {"train_loss": -6.9382805824279785, "global_step": 165130, "epoch": 3931} {"train_loss": -7.0506696701049805, "global_step": 165131, "epoch": 3931} {"train_loss": -6.975576400756836, "global_step": 165132, "epoch": 3931} {"train_loss": -6.8764495849609375, "global_step": 165133, "epoch": 3931} {"train_loss": -6.943995475769043, "global_step": 165134, "epoch": 3931} {"train_loss": -7.078591346740723, "global_step": 165135, "epoch": 3931} {"train_loss": -6.955413818359375, "global_step": 165136, "epoch": 3931} {"train_loss": -7.078866004943848, "global_step": 165137, "epoch": 3931} {"train_loss": -6.952328681945801, "global_step": 165138, "epoch": 3931} {"train_loss": -6.838440895080566, "global_step": 165139, "epoch": 3931} {"train_loss": -7.005638122558594, "global_step": 165140, "epoch": 3931} {"train_loss": -6.952160835266113, "global_step": 165141, "epoch": 3931} {"train_loss": -6.97264289855957, "global_step": 165142, "epoch": 3931} {"train_loss": -6.936090548833211, "global_step": 165143, "epoch": 3931, "val_loss": 79616.6953125} {"train_loss": -6.95762300491333, "global_step": 165144, "epoch": 3932} {"train_loss": -7.120665550231934, "global_step": 165145, "epoch": 3932} {"train_loss": -7.005322456359863, "global_step": 165146, "epoch": 3932} {"train_loss": -7.0326385498046875, "global_step": 165147, "epoch": 3932} {"train_loss": -7.016043186187744, "global_step": 165148, "epoch": 3932} {"train_loss": -6.930000305175781, "global_step": 165149, "epoch": 3932} {"train_loss": -7.057497024536133, "global_step": 165150, "epoch": 3932} {"train_loss": -7.084653854370117, "global_step": 165151, "epoch": 3932} {"train_loss": -7.051390647888184, "global_step": 165152, "epoch": 3932} {"train_loss": -7.025468826293945, "global_step": 165153, "epoch": 3932} {"train_loss": -7.096778869628906, "global_step": 165154, "epoch": 3932} {"train_loss": -6.878348350524902, "global_step": 165155, "epoch": 3932} {"train_loss": -7.032863616943359, "global_step": 165156, "epoch": 3932} {"train_loss": -7.132734775543213, "global_step": 165157, "epoch": 3932} {"train_loss": -6.987705230712891, "global_step": 165158, "epoch": 3932} {"train_loss": -6.956532001495361, "global_step": 165159, "epoch": 3932} {"train_loss": -6.953582763671875, "global_step": 165160, "epoch": 3932} {"train_loss": -6.991267204284668, "global_step": 165161, "epoch": 3932} {"train_loss": -6.967957973480225, "global_step": 165162, "epoch": 3932} {"train_loss": -7.007724761962891, "global_step": 165163, "epoch": 3932} {"train_loss": -6.990449905395508, "global_step": 165164, "epoch": 3932} {"train_loss": -7.01162052154541, "global_step": 165165, "epoch": 3932} {"train_loss": -7.017980575561523, "global_step": 165166, "epoch": 3932} {"train_loss": -7.048016548156738, "global_step": 165167, "epoch": 3932} {"train_loss": -7.083939075469971, "global_step": 165168, "epoch": 3932} {"train_loss": -7.057065963745117, "global_step": 165169, "epoch": 3932} {"train_loss": -6.941289901733398, "global_step": 165170, "epoch": 3932} {"train_loss": -6.944186210632324, "global_step": 165171, "epoch": 3932} {"train_loss": -6.902472972869873, "global_step": 165172, "epoch": 3932} {"train_loss": -7.001772880554199, "global_step": 165173, "epoch": 3932} {"train_loss": -7.103844165802002, "global_step": 165174, "epoch": 3932} {"train_loss": -7.091961860656738, "global_step": 165175, "epoch": 3932} {"train_loss": -7.08067512512207, "global_step": 165176, "epoch": 3932} {"train_loss": -7.070279598236084, "global_step": 165177, "epoch": 3932} {"train_loss": -6.973226070404053, "global_step": 165178, "epoch": 3932} {"train_loss": -7.001775741577148, "global_step": 165179, "epoch": 3932} {"train_loss": -6.954817771911621, "global_step": 165180, "epoch": 3932} {"train_loss": -6.97755241394043, "global_step": 165181, "epoch": 3932} {"train_loss": -7.010041236877441, "global_step": 165182, "epoch": 3932} {"train_loss": -7.044040679931641, "global_step": 165183, "epoch": 3932} {"train_loss": -6.977779388427734, "global_step": 165184, "epoch": 3932} {"train_loss": -7.014226141430083, "global_step": 165185, "epoch": 3932, "val_loss": 79530.1015625} {"train_loss": -7.1360182762146, "global_step": 165186, "epoch": 3933} {"train_loss": -6.996115684509277, "global_step": 165187, "epoch": 3933} {"train_loss": -7.021800994873047, "global_step": 165188, "epoch": 3933} {"train_loss": -6.879843235015869, "global_step": 165189, "epoch": 3933} {"train_loss": -6.789520263671875, "global_step": 165190, "epoch": 3933} {"train_loss": -7.10053825378418, "global_step": 165191, "epoch": 3933} {"train_loss": -6.857892990112305, "global_step": 165192, "epoch": 3933} {"train_loss": -7.080915451049805, "global_step": 165193, "epoch": 3933} {"train_loss": -6.975090026855469, "global_step": 165194, "epoch": 3933} {"train_loss": -6.948501110076904, "global_step": 165195, "epoch": 3933} {"train_loss": -7.110995292663574, "global_step": 165196, "epoch": 3933} {"train_loss": -7.017671585083008, "global_step": 165197, "epoch": 3933} {"train_loss": -6.895678520202637, "global_step": 165198, "epoch": 3933} {"train_loss": -6.889751434326172, "global_step": 165199, "epoch": 3933} {"train_loss": -7.073483943939209, "global_step": 165200, "epoch": 3933} {"train_loss": -7.007390022277832, "global_step": 165201, "epoch": 3933} {"train_loss": -6.9241180419921875, "global_step": 165202, "epoch": 3933} {"train_loss": -7.016299247741699, "global_step": 165203, "epoch": 3933} {"train_loss": -7.048840045928955, "global_step": 165204, "epoch": 3933} {"train_loss": -6.999871253967285, "global_step": 165205, "epoch": 3933} {"train_loss": -6.970531463623047, "global_step": 165206, "epoch": 3933} {"train_loss": -7.003404140472412, "global_step": 165207, "epoch": 3933} {"train_loss": -6.998101234436035, "global_step": 165208, "epoch": 3933} {"train_loss": -6.9963202476501465, "global_step": 165209, "epoch": 3933} {"train_loss": -7.06171989440918, "global_step": 165210, "epoch": 3933} {"train_loss": -7.071327209472656, "global_step": 165211, "epoch": 3933} {"train_loss": -6.910359859466553, "global_step": 165212, "epoch": 3933} {"train_loss": -6.981895446777344, "global_step": 165213, "epoch": 3933} {"train_loss": -7.00071382522583, "global_step": 165214, "epoch": 3933} {"train_loss": -6.914821624755859, "global_step": 165215, "epoch": 3933} {"train_loss": -7.001157760620117, "global_step": 165216, "epoch": 3933} {"train_loss": -6.861033916473389, "global_step": 165217, "epoch": 3933} {"train_loss": -6.91450834274292, "global_step": 165218, "epoch": 3933} {"train_loss": -6.896206855773926, "global_step": 165219, "epoch": 3933} {"train_loss": -7.074398994445801, "global_step": 165220, "epoch": 3933} {"train_loss": -7.0128679275512695, "global_step": 165221, "epoch": 3933} {"train_loss": -6.914695739746094, "global_step": 165222, "epoch": 3933} {"train_loss": -7.053074836730957, "global_step": 165223, "epoch": 3933} {"train_loss": -6.932804107666016, "global_step": 165224, "epoch": 3933} {"train_loss": -6.919802665710449, "global_step": 165225, "epoch": 3933} {"train_loss": -6.8502936363220215, "global_step": 165226, "epoch": 3933} {"train_loss": -6.9787924743834, "global_step": 165227, "epoch": 3933, "val_loss": 79784.9375} {"train_loss": -6.989784240722656, "global_step": 165228, "epoch": 3934} {"train_loss": -6.994724273681641, "global_step": 165229, "epoch": 3934} {"train_loss": -6.980549335479736, "global_step": 165230, "epoch": 3934} {"train_loss": -7.02653169631958, "global_step": 165231, "epoch": 3934} {"train_loss": -7.017051696777344, "global_step": 165232, "epoch": 3934} {"train_loss": -6.944309234619141, "global_step": 165233, "epoch": 3934} {"train_loss": -7.07339334487915, "global_step": 165234, "epoch": 3934} {"train_loss": -6.955879211425781, "global_step": 165235, "epoch": 3934} {"train_loss": -7.034165382385254, "global_step": 165236, "epoch": 3934} {"train_loss": -7.015083312988281, "global_step": 165237, "epoch": 3934} {"train_loss": -7.069969177246094, "global_step": 165238, "epoch": 3934} {"train_loss": -7.034229278564453, "global_step": 165239, "epoch": 3934} {"train_loss": -7.0589280128479, "global_step": 165240, "epoch": 3934} {"train_loss": -6.990956783294678, "global_step": 165241, "epoch": 3934} {"train_loss": -7.080159664154053, "global_step": 165242, "epoch": 3934} {"train_loss": -6.9816999435424805, "global_step": 165243, "epoch": 3934} {"train_loss": -6.954867362976074, "global_step": 165244, "epoch": 3934} {"train_loss": -6.952838897705078, "global_step": 165245, "epoch": 3934} {"train_loss": -6.853012561798096, "global_step": 165246, "epoch": 3934} {"train_loss": -6.909937381744385, "global_step": 165247, "epoch": 3934} {"train_loss": -7.00460147857666, "global_step": 165248, "epoch": 3934} {"train_loss": -6.983518123626709, "global_step": 165249, "epoch": 3934} {"train_loss": -6.970690727233887, "global_step": 165250, "epoch": 3934} {"train_loss": -7.003462314605713, "global_step": 165251, "epoch": 3934} {"train_loss": -6.861854076385498, "global_step": 165252, "epoch": 3934} {"train_loss": -7.010809898376465, "global_step": 165253, "epoch": 3934} {"train_loss": -7.021742820739746, "global_step": 165254, "epoch": 3934} {"train_loss": -6.891376972198486, "global_step": 165255, "epoch": 3934} {"train_loss": -7.07584810256958, "global_step": 165256, "epoch": 3934} {"train_loss": -6.927342414855957, "global_step": 165257, "epoch": 3934} {"train_loss": -7.158066749572754, "global_step": 165258, "epoch": 3934} {"train_loss": -6.956135272979736, "global_step": 165259, "epoch": 3934} {"train_loss": -7.102524280548096, "global_step": 165260, "epoch": 3934} {"train_loss": -7.072335243225098, "global_step": 165261, "epoch": 3934} {"train_loss": -7.01387882232666, "global_step": 165262, "epoch": 3934} {"train_loss": -7.034043312072754, "global_step": 165263, "epoch": 3934} {"train_loss": -6.874561309814453, "global_step": 165264, "epoch": 3934} {"train_loss": -7.033564567565918, "global_step": 165265, "epoch": 3934} {"train_loss": -6.821732521057129, "global_step": 165266, "epoch": 3934} {"train_loss": -6.9919915199279785, "global_step": 165267, "epoch": 3934} {"train_loss": -6.978405952453613, "global_step": 165268, "epoch": 3934} {"train_loss": -6.992310875938053, "global_step": 165269, "epoch": 3934, "val_loss": 79646.3671875} {"train_loss": -7.030927658081055, "global_step": 165270, "epoch": 3935} {"train_loss": -6.872939586639404, "global_step": 165271, "epoch": 3935} {"train_loss": -6.93589973449707, "global_step": 165272, "epoch": 3935} {"train_loss": -6.87885856628418, "global_step": 165273, "epoch": 3935} {"train_loss": -7.107048034667969, "global_step": 165274, "epoch": 3935} {"train_loss": -7.000240325927734, "global_step": 165275, "epoch": 3935} {"train_loss": -7.044190406799316, "global_step": 165276, "epoch": 3935} {"train_loss": -6.995968341827393, "global_step": 165277, "epoch": 3935} {"train_loss": -6.90610408782959, "global_step": 165278, "epoch": 3935} {"train_loss": -7.061176776885986, "global_step": 165279, "epoch": 3935} {"train_loss": -6.9735283851623535, "global_step": 165280, "epoch": 3935} {"train_loss": -6.989398002624512, "global_step": 165281, "epoch": 3935} {"train_loss": -6.967493057250977, "global_step": 165282, "epoch": 3935} {"train_loss": -6.818516254425049, "global_step": 165283, "epoch": 3935} {"train_loss": -6.96518087387085, "global_step": 165284, "epoch": 3935} {"train_loss": -6.928444862365723, "global_step": 165285, "epoch": 3935} {"train_loss": -7.009976387023926, "global_step": 165286, "epoch": 3935} {"train_loss": -6.977814674377441, "global_step": 165287, "epoch": 3935} {"train_loss": -6.993743419647217, "global_step": 165288, "epoch": 3935} {"train_loss": -7.107057094573975, "global_step": 165289, "epoch": 3935} {"train_loss": -7.028074741363525, "global_step": 165290, "epoch": 3935} {"train_loss": -7.026397228240967, "global_step": 165291, "epoch": 3935} {"train_loss": -7.033412933349609, "global_step": 165292, "epoch": 3935} {"train_loss": -7.011731147766113, "global_step": 165293, "epoch": 3935} {"train_loss": -7.0353827476501465, "global_step": 165294, "epoch": 3935} {"train_loss": -7.045360565185547, "global_step": 165295, "epoch": 3935} {"train_loss": -7.087707996368408, "global_step": 165296, "epoch": 3935} {"train_loss": -7.058908939361572, "global_step": 165297, "epoch": 3935} {"train_loss": -7.022035121917725, "global_step": 165298, "epoch": 3935} {"train_loss": -6.9355573654174805, "global_step": 165299, "epoch": 3935} {"train_loss": -7.037117004394531, "global_step": 165300, "epoch": 3935} {"train_loss": -6.884467124938965, "global_step": 165301, "epoch": 3935} {"train_loss": -7.062627792358398, "global_step": 165302, "epoch": 3935} {"train_loss": -7.036233425140381, "global_step": 165303, "epoch": 3935} {"train_loss": -6.9574360847473145, "global_step": 165304, "epoch": 3935} {"train_loss": -7.106131076812744, "global_step": 165305, "epoch": 3935} {"train_loss": -7.196446418762207, "global_step": 165306, "epoch": 3935} {"train_loss": -6.996890068054199, "global_step": 165307, "epoch": 3935} {"train_loss": -7.075806140899658, "global_step": 165308, "epoch": 3935} {"train_loss": -7.105615615844727, "global_step": 165309, "epoch": 3935} {"train_loss": -7.028679847717285, "global_step": 165310, "epoch": 3935} {"train_loss": -7.0076643625895185, "global_step": 165311, "epoch": 3935, "val_loss": 79289.375} {"train_loss": -6.945847034454346, "global_step": 165312, "epoch": 3936} {"train_loss": -6.950325012207031, "global_step": 165313, "epoch": 3936} {"train_loss": -7.002412796020508, "global_step": 165314, "epoch": 3936} {"train_loss": -6.954416275024414, "global_step": 165315, "epoch": 3936} {"train_loss": -6.858455657958984, "global_step": 165316, "epoch": 3936} {"train_loss": -7.115004539489746, "global_step": 165317, "epoch": 3936} {"train_loss": -7.08524227142334, "global_step": 165318, "epoch": 3936} {"train_loss": -7.105986595153809, "global_step": 165319, "epoch": 3936} {"train_loss": -7.071361541748047, "global_step": 165320, "epoch": 3936} {"train_loss": -7.058100700378418, "global_step": 165321, "epoch": 3936} {"train_loss": -6.953085899353027, "global_step": 165322, "epoch": 3936} {"train_loss": -6.92974328994751, "global_step": 165323, "epoch": 3936} {"train_loss": -6.9767255783081055, "global_step": 165324, "epoch": 3936} {"train_loss": -6.920392036437988, "global_step": 165325, "epoch": 3936} {"train_loss": -6.890286445617676, "global_step": 165326, "epoch": 3936} {"train_loss": -6.902862548828125, "global_step": 165327, "epoch": 3936} {"train_loss": -6.970029830932617, "global_step": 165328, "epoch": 3936} {"train_loss": -6.938365936279297, "global_step": 165329, "epoch": 3936} {"train_loss": -6.894320964813232, "global_step": 165330, "epoch": 3936} {"train_loss": -6.948704719543457, "global_step": 165331, "epoch": 3936} {"train_loss": -6.94003438949585, "global_step": 165332, "epoch": 3936} {"train_loss": -6.994612693786621, "global_step": 165333, "epoch": 3936} {"train_loss": -6.917050361633301, "global_step": 165334, "epoch": 3936} {"train_loss": -7.0058441162109375, "global_step": 165335, "epoch": 3936} {"train_loss": -6.9214582443237305, "global_step": 165336, "epoch": 3936} {"train_loss": -7.033807754516602, "global_step": 165337, "epoch": 3936} {"train_loss": -6.922266006469727, "global_step": 165338, "epoch": 3936} {"train_loss": -6.9958391189575195, "global_step": 165339, "epoch": 3936} {"train_loss": -6.902787685394287, "global_step": 165340, "epoch": 3936} {"train_loss": -7.028453350067139, "global_step": 165341, "epoch": 3936} {"train_loss": -6.968441963195801, "global_step": 165342, "epoch": 3936} {"train_loss": -6.981021881103516, "global_step": 165343, "epoch": 3936} {"train_loss": -6.980378150939941, "global_step": 165344, "epoch": 3936} {"train_loss": -7.059628963470459, "global_step": 165345, "epoch": 3936} {"train_loss": -6.928659439086914, "global_step": 165346, "epoch": 3936} {"train_loss": -6.9825029373168945, "global_step": 165347, "epoch": 3936} {"train_loss": -7.02957820892334, "global_step": 165348, "epoch": 3936} {"train_loss": -6.998293399810791, "global_step": 165349, "epoch": 3936} {"train_loss": -6.921923637390137, "global_step": 165350, "epoch": 3936} {"train_loss": -7.1100287437438965, "global_step": 165351, "epoch": 3936} {"train_loss": -7.006547451019287, "global_step": 165352, "epoch": 3936} {"train_loss": -6.977526721500215, "global_step": 165353, "epoch": 3936, "val_loss": 79756.53125} {"train_loss": -6.961918830871582, "global_step": 165354, "epoch": 3937} {"train_loss": -6.974293231964111, "global_step": 165355, "epoch": 3937} {"train_loss": -7.0174479484558105, "global_step": 165356, "epoch": 3937} {"train_loss": -6.910897254943848, "global_step": 165357, "epoch": 3937} {"train_loss": -7.015913963317871, "global_step": 165358, "epoch": 3937} {"train_loss": -6.867603302001953, "global_step": 165359, "epoch": 3937} {"train_loss": -6.863574028015137, "global_step": 165360, "epoch": 3937} {"train_loss": -6.931715965270996, "global_step": 165361, "epoch": 3937} {"train_loss": -7.008599281311035, "global_step": 165362, "epoch": 3937} {"train_loss": -6.925548076629639, "global_step": 165363, "epoch": 3937} {"train_loss": -7.063070297241211, "global_step": 165364, "epoch": 3937} {"train_loss": -6.924655914306641, "global_step": 165365, "epoch": 3937} {"train_loss": -7.070592403411865, "global_step": 165366, "epoch": 3937} {"train_loss": -7.022684574127197, "global_step": 165367, "epoch": 3937} {"train_loss": -6.917191505432129, "global_step": 165368, "epoch": 3937} {"train_loss": -6.968242645263672, "global_step": 165369, "epoch": 3937} {"train_loss": -6.803544044494629, "global_step": 165370, "epoch": 3937} {"train_loss": -7.005698204040527, "global_step": 165371, "epoch": 3937} {"train_loss": -6.981257438659668, "global_step": 165372, "epoch": 3937} {"train_loss": -6.941232204437256, "global_step": 165373, "epoch": 3937} {"train_loss": -6.9512763023376465, "global_step": 165374, "epoch": 3937} {"train_loss": -6.853102207183838, "global_step": 165375, "epoch": 3937} {"train_loss": -6.936324119567871, "global_step": 165376, "epoch": 3937} {"train_loss": -6.944623947143555, "global_step": 165377, "epoch": 3937} {"train_loss": -6.838315010070801, "global_step": 165378, "epoch": 3937} {"train_loss": -6.876107215881348, "global_step": 165379, "epoch": 3937} {"train_loss": -6.929594993591309, "global_step": 165380, "epoch": 3937} {"train_loss": -6.962231636047363, "global_step": 165381, "epoch": 3937} {"train_loss": -6.908337116241455, "global_step": 165382, "epoch": 3937} {"train_loss": -6.991468906402588, "global_step": 165383, "epoch": 3937} {"train_loss": -6.9092559814453125, "global_step": 165384, "epoch": 3937} {"train_loss": -6.965150356292725, "global_step": 165385, "epoch": 3937} {"train_loss": -7.018763542175293, "global_step": 165386, "epoch": 3937} {"train_loss": -6.864345550537109, "global_step": 165387, "epoch": 3937} {"train_loss": -6.960916519165039, "global_step": 165388, "epoch": 3937} {"train_loss": -6.959674835205078, "global_step": 165389, "epoch": 3937} {"train_loss": -6.936531066894531, "global_step": 165390, "epoch": 3937} {"train_loss": -7.009564399719238, "global_step": 165391, "epoch": 3937} {"train_loss": -6.999090671539307, "global_step": 165392, "epoch": 3937} {"train_loss": -7.047867298126221, "global_step": 165393, "epoch": 3937} {"train_loss": -6.981698989868164, "global_step": 165394, "epoch": 3937} {"train_loss": -6.952783925192697, "global_step": 165395, "epoch": 3937, "val_loss": 79633.2109375} {"train_loss": -7.02797794342041, "global_step": 165396, "epoch": 3938} {"train_loss": -7.033206939697266, "global_step": 165397, "epoch": 3938} {"train_loss": -7.077023506164551, "global_step": 165398, "epoch": 3938} {"train_loss": -6.970455169677734, "global_step": 165399, "epoch": 3938} {"train_loss": -6.972869396209717, "global_step": 165400, "epoch": 3938} {"train_loss": -6.901800632476807, "global_step": 165401, "epoch": 3938} {"train_loss": -7.040408611297607, "global_step": 165402, "epoch": 3938} {"train_loss": -7.053155899047852, "global_step": 165403, "epoch": 3938} {"train_loss": -7.040428161621094, "global_step": 165404, "epoch": 3938} {"train_loss": -6.946347236633301, "global_step": 165405, "epoch": 3938} {"train_loss": -7.077194690704346, "global_step": 165406, "epoch": 3938} {"train_loss": -7.085024833679199, "global_step": 165407, "epoch": 3938} {"train_loss": -6.846805572509766, "global_step": 165408, "epoch": 3938} {"train_loss": -6.901373386383057, "global_step": 165409, "epoch": 3938} {"train_loss": -6.950686454772949, "global_step": 165410, "epoch": 3938} {"train_loss": -6.800760746002197, "global_step": 165411, "epoch": 3938} {"train_loss": -6.966500282287598, "global_step": 165412, "epoch": 3938} {"train_loss": -6.981078147888184, "global_step": 165413, "epoch": 3938} {"train_loss": -7.02046012878418, "global_step": 165414, "epoch": 3938} {"train_loss": -6.896185874938965, "global_step": 165415, "epoch": 3938} {"train_loss": -6.966762542724609, "global_step": 165416, "epoch": 3938} {"train_loss": -6.986424922943115, "global_step": 165417, "epoch": 3938} {"train_loss": -6.950587272644043, "global_step": 165418, "epoch": 3938} {"train_loss": -6.934185981750488, "global_step": 165419, "epoch": 3938} {"train_loss": -6.9930419921875, "global_step": 165420, "epoch": 3938} {"train_loss": -6.995525360107422, "global_step": 165421, "epoch": 3938} {"train_loss": -6.989413261413574, "global_step": 165422, "epoch": 3938} {"train_loss": -7.0204877853393555, "global_step": 165423, "epoch": 3938} {"train_loss": -6.966638565063477, "global_step": 165424, "epoch": 3938} {"train_loss": -6.976635932922363, "global_step": 165425, "epoch": 3938} {"train_loss": -7.004667282104492, "global_step": 165426, "epoch": 3938} {"train_loss": -6.9184770584106445, "global_step": 165427, "epoch": 3938} {"train_loss": -7.1068315505981445, "global_step": 165428, "epoch": 3938} {"train_loss": -6.757900238037109, "global_step": 165429, "epoch": 3938} {"train_loss": -6.948436260223389, "global_step": 165430, "epoch": 3938} {"train_loss": -6.974628448486328, "global_step": 165431, "epoch": 3938} {"train_loss": -6.979630470275879, "global_step": 165432, "epoch": 3938} {"train_loss": -7.009190559387207, "global_step": 165433, "epoch": 3938} {"train_loss": -7.003444671630859, "global_step": 165434, "epoch": 3938} {"train_loss": -6.995940208435059, "global_step": 165435, "epoch": 3938} {"train_loss": -6.960038661956787, "global_step": 165436, "epoch": 3938} {"train_loss": -6.975365752265567, "global_step": 165437, "epoch": 3938, "val_loss": 79667.1015625} {"train_loss": -6.994553565979004, "global_step": 165438, "epoch": 3939} {"train_loss": -6.921331405639648, "global_step": 165439, "epoch": 3939} {"train_loss": -6.933564186096191, "global_step": 165440, "epoch": 3939} {"train_loss": -6.857457637786865, "global_step": 165441, "epoch": 3939} {"train_loss": -7.0201005935668945, "global_step": 165442, "epoch": 3939} {"train_loss": -7.024096965789795, "global_step": 165443, "epoch": 3939} {"train_loss": -6.922245979309082, "global_step": 165444, "epoch": 3939} {"train_loss": -6.952159404754639, "global_step": 165445, "epoch": 3939} {"train_loss": -6.96193790435791, "global_step": 165446, "epoch": 3939} {"train_loss": -6.883151054382324, "global_step": 165447, "epoch": 3939} {"train_loss": -6.971835136413574, "global_step": 165448, "epoch": 3939} {"train_loss": -7.026510238647461, "global_step": 165449, "epoch": 3939} {"train_loss": -6.80045223236084, "global_step": 165450, "epoch": 3939} {"train_loss": -7.058803558349609, "global_step": 165451, "epoch": 3939} {"train_loss": -7.024435043334961, "global_step": 165452, "epoch": 3939} {"train_loss": -7.05763578414917, "global_step": 165453, "epoch": 3939} {"train_loss": -6.964828014373779, "global_step": 165454, "epoch": 3939} {"train_loss": -7.137887477874756, "global_step": 165455, "epoch": 3939} {"train_loss": -6.987105369567871, "global_step": 165456, "epoch": 3939} {"train_loss": -7.001535415649414, "global_step": 165457, "epoch": 3939} {"train_loss": -7.059575080871582, "global_step": 165458, "epoch": 3939} {"train_loss": -6.927592754364014, "global_step": 165459, "epoch": 3939} {"train_loss": -7.008332252502441, "global_step": 165460, "epoch": 3939} {"train_loss": -7.096737384796143, "global_step": 165461, "epoch": 3939} {"train_loss": -7.085020542144775, "global_step": 165462, "epoch": 3939} {"train_loss": -6.97474479675293, "global_step": 165463, "epoch": 3939} {"train_loss": -7.041327476501465, "global_step": 165464, "epoch": 3939} {"train_loss": -7.13908576965332, "global_step": 165465, "epoch": 3939} {"train_loss": -6.905678749084473, "global_step": 165466, "epoch": 3939} {"train_loss": -6.925716400146484, "global_step": 165467, "epoch": 3939} {"train_loss": -6.961733341217041, "global_step": 165468, "epoch": 3939} {"train_loss": -7.035894393920898, "global_step": 165469, "epoch": 3939} {"train_loss": -6.995782852172852, "global_step": 165470, "epoch": 3939} {"train_loss": -6.891521453857422, "global_step": 165471, "epoch": 3939} {"train_loss": -7.009578704833984, "global_step": 165472, "epoch": 3939} {"train_loss": -6.915440082550049, "global_step": 165473, "epoch": 3939} {"train_loss": -6.944703102111816, "global_step": 165474, "epoch": 3939} {"train_loss": -6.956852912902832, "global_step": 165475, "epoch": 3939} {"train_loss": -6.963526725769043, "global_step": 165476, "epoch": 3939} {"train_loss": -6.873380661010742, "global_step": 165477, "epoch": 3939} {"train_loss": -6.94694185256958, "global_step": 165478, "epoch": 3939} {"train_loss": -6.980392013277326, "global_step": 165479, "epoch": 3939, "val_loss": 79428.46875} {"train_loss": -7.063826084136963, "global_step": 165480, "epoch": 3940} {"train_loss": -6.884514808654785, "global_step": 165481, "epoch": 3940} {"train_loss": -6.940594673156738, "global_step": 165482, "epoch": 3940} {"train_loss": -7.081375598907471, "global_step": 165483, "epoch": 3940} {"train_loss": -6.981550216674805, "global_step": 165484, "epoch": 3940} {"train_loss": -7.069098472595215, "global_step": 165485, "epoch": 3940} {"train_loss": -7.102005958557129, "global_step": 165486, "epoch": 3940} {"train_loss": -7.133265495300293, "global_step": 165487, "epoch": 3940} {"train_loss": -7.087793350219727, "global_step": 165488, "epoch": 3940} {"train_loss": -7.085941314697266, "global_step": 165489, "epoch": 3940} {"train_loss": -7.095259666442871, "global_step": 165490, "epoch": 3940} {"train_loss": -7.007000923156738, "global_step": 165491, "epoch": 3940} {"train_loss": -7.02138614654541, "global_step": 165492, "epoch": 3940} {"train_loss": -7.170520782470703, "global_step": 165493, "epoch": 3940} {"train_loss": -7.061878681182861, "global_step": 165494, "epoch": 3940} {"train_loss": -7.156227111816406, "global_step": 165495, "epoch": 3940} {"train_loss": -7.033024787902832, "global_step": 165496, "epoch": 3940} {"train_loss": -7.021182060241699, "global_step": 165497, "epoch": 3940} {"train_loss": -7.103511810302734, "global_step": 165498, "epoch": 3940} {"train_loss": -7.056970596313477, "global_step": 165499, "epoch": 3940} {"train_loss": -7.025848865509033, "global_step": 165500, "epoch": 3940} {"train_loss": -7.0332112312316895, "global_step": 165501, "epoch": 3940} {"train_loss": -6.971212863922119, "global_step": 165502, "epoch": 3940} {"train_loss": -6.9799652099609375, "global_step": 165503, "epoch": 3940} {"train_loss": -6.899120330810547, "global_step": 165504, "epoch": 3940} {"train_loss": -6.996194362640381, "global_step": 165505, "epoch": 3940} {"train_loss": -7.057171821594238, "global_step": 165506, "epoch": 3940} {"train_loss": -7.03355598449707, "global_step": 165507, "epoch": 3940} {"train_loss": -6.9425506591796875, "global_step": 165508, "epoch": 3940} {"train_loss": -7.090608596801758, "global_step": 165509, "epoch": 3940} {"train_loss": -7.02446174621582, "global_step": 165510, "epoch": 3940} {"train_loss": -6.967423439025879, "global_step": 165511, "epoch": 3940} {"train_loss": -7.066338539123535, "global_step": 165512, "epoch": 3940} {"train_loss": -7.050201416015625, "global_step": 165513, "epoch": 3940} {"train_loss": -7.12068510055542, "global_step": 165514, "epoch": 3940} {"train_loss": -7.061263084411621, "global_step": 165515, "epoch": 3940} {"train_loss": -6.970587730407715, "global_step": 165516, "epoch": 3940} {"train_loss": -6.987668037414551, "global_step": 165517, "epoch": 3940} {"train_loss": -7.0683441162109375, "global_step": 165518, "epoch": 3940} {"train_loss": -6.957686901092529, "global_step": 165519, "epoch": 3940} {"train_loss": -6.911503314971924, "global_step": 165520, "epoch": 3940} {"train_loss": -7.03235141436259, "global_step": 165521, "epoch": 3940, "val_loss": 79542.4921875} {"train_loss": -6.969974517822266, "global_step": 165522, "epoch": 3941} {"train_loss": -6.983216762542725, "global_step": 165523, "epoch": 3941} {"train_loss": -7.039828300476074, "global_step": 165524, "epoch": 3941} {"train_loss": -7.011712074279785, "global_step": 165525, "epoch": 3941} {"train_loss": -7.124701499938965, "global_step": 165526, "epoch": 3941} {"train_loss": -7.01467227935791, "global_step": 165527, "epoch": 3941} {"train_loss": -6.982037544250488, "global_step": 165528, "epoch": 3941} {"train_loss": -7.056763648986816, "global_step": 165529, "epoch": 3941} {"train_loss": -7.040328502655029, "global_step": 165530, "epoch": 3941} {"train_loss": -7.0381364822387695, "global_step": 165531, "epoch": 3941} {"train_loss": -7.007004737854004, "global_step": 165532, "epoch": 3941} {"train_loss": -7.059515476226807, "global_step": 165533, "epoch": 3941} {"train_loss": -6.994279384613037, "global_step": 165534, "epoch": 3941} {"train_loss": -6.815785884857178, "global_step": 165535, "epoch": 3941} {"train_loss": -6.980298042297363, "global_step": 165536, "epoch": 3941} {"train_loss": -6.9943132400512695, "global_step": 165537, "epoch": 3941} {"train_loss": -6.924924850463867, "global_step": 165538, "epoch": 3941} {"train_loss": -7.034392356872559, "global_step": 165539, "epoch": 3941} {"train_loss": -7.017550468444824, "global_step": 165540, "epoch": 3941} {"train_loss": -6.801339626312256, "global_step": 165541, "epoch": 3941} {"train_loss": -6.969062805175781, "global_step": 165542, "epoch": 3941} {"train_loss": -6.914559841156006, "global_step": 165543, "epoch": 3941} {"train_loss": -7.038527965545654, "global_step": 165544, "epoch": 3941} {"train_loss": -6.988601207733154, "global_step": 165545, "epoch": 3941} {"train_loss": -6.882060527801514, "global_step": 165546, "epoch": 3941} {"train_loss": -6.986213684082031, "global_step": 165547, "epoch": 3941} {"train_loss": -6.995065689086914, "global_step": 165548, "epoch": 3941} {"train_loss": -6.935962677001953, "global_step": 165549, "epoch": 3941} {"train_loss": -6.976508617401123, "global_step": 165550, "epoch": 3941} {"train_loss": -6.882294654846191, "global_step": 165551, "epoch": 3941} {"train_loss": -7.053981781005859, "global_step": 165552, "epoch": 3941} {"train_loss": -6.9380059242248535, "global_step": 165553, "epoch": 3941} {"train_loss": -7.0689191818237305, "global_step": 165554, "epoch": 3941} {"train_loss": -6.940736770629883, "global_step": 165555, "epoch": 3941} {"train_loss": -6.997170925140381, "global_step": 165556, "epoch": 3941} {"train_loss": -6.977096080780029, "global_step": 165557, "epoch": 3941} {"train_loss": -7.128505706787109, "global_step": 165558, "epoch": 3941} {"train_loss": -6.923701763153076, "global_step": 165559, "epoch": 3941} {"train_loss": -6.978734016418457, "global_step": 165560, "epoch": 3941} {"train_loss": -7.133127212524414, "global_step": 165561, "epoch": 3941} {"train_loss": -6.907283782958984, "global_step": 165562, "epoch": 3941} {"train_loss": -6.9892528511229015, "global_step": 165563, "epoch": 3941, "val_loss": 79632.0625} {"train_loss": -7.092680931091309, "global_step": 165564, "epoch": 3942} {"train_loss": -7.0364532470703125, "global_step": 165565, "epoch": 3942} {"train_loss": -7.07858943939209, "global_step": 165566, "epoch": 3942} {"train_loss": -7.05203104019165, "global_step": 165567, "epoch": 3942} {"train_loss": -7.097858428955078, "global_step": 165568, "epoch": 3942} {"train_loss": -7.015174865722656, "global_step": 165569, "epoch": 3942} {"train_loss": -6.999826431274414, "global_step": 165570, "epoch": 3942} {"train_loss": -7.11974573135376, "global_step": 165571, "epoch": 3942} {"train_loss": -6.915473461151123, "global_step": 165572, "epoch": 3942} {"train_loss": -6.980414390563965, "global_step": 165573, "epoch": 3942} {"train_loss": -6.971520900726318, "global_step": 165574, "epoch": 3942} {"train_loss": -6.985568046569824, "global_step": 165575, "epoch": 3942} {"train_loss": -7.0011091232299805, "global_step": 165576, "epoch": 3942} {"train_loss": -6.912530899047852, "global_step": 165577, "epoch": 3942} {"train_loss": -6.910306930541992, "global_step": 165578, "epoch": 3942} {"train_loss": -6.992483139038086, "global_step": 165579, "epoch": 3942} {"train_loss": -6.986697196960449, "global_step": 165580, "epoch": 3942} {"train_loss": -7.057577610015869, "global_step": 165581, "epoch": 3942} {"train_loss": -6.964365005493164, "global_step": 165582, "epoch": 3942} {"train_loss": -7.053003311157227, "global_step": 165583, "epoch": 3942} {"train_loss": -6.8783674240112305, "global_step": 165584, "epoch": 3942} {"train_loss": -6.982064723968506, "global_step": 165585, "epoch": 3942} {"train_loss": -6.936409950256348, "global_step": 165586, "epoch": 3942} {"train_loss": -6.906486511230469, "global_step": 165587, "epoch": 3942} {"train_loss": -6.9248151779174805, "global_step": 165588, "epoch": 3942} {"train_loss": -6.953548908233643, "global_step": 165589, "epoch": 3942} {"train_loss": -6.976372241973877, "global_step": 165590, "epoch": 3942} {"train_loss": -7.024264812469482, "global_step": 165591, "epoch": 3942} {"train_loss": -6.891758918762207, "global_step": 165592, "epoch": 3942} {"train_loss": -6.851675033569336, "global_step": 165593, "epoch": 3942} {"train_loss": -7.02205753326416, "global_step": 165594, "epoch": 3942} {"train_loss": -6.929723262786865, "global_step": 165595, "epoch": 3942} {"train_loss": -6.9371867179870605, "global_step": 165596, "epoch": 3942} {"train_loss": -6.965855598449707, "global_step": 165597, "epoch": 3942} {"train_loss": -6.8993635177612305, "global_step": 165598, "epoch": 3942} {"train_loss": -6.93675422668457, "global_step": 165599, "epoch": 3942} {"train_loss": -7.025989055633545, "global_step": 165600, "epoch": 3942} {"train_loss": -6.8711371421813965, "global_step": 165601, "epoch": 3942} {"train_loss": -7.018063545227051, "global_step": 165602, "epoch": 3942} {"train_loss": -6.939695835113525, "global_step": 165603, "epoch": 3942} {"train_loss": -7.006335258483887, "global_step": 165604, "epoch": 3942} {"train_loss": -6.974459091822307, "global_step": 165605, "epoch": 3942, "val_loss": 79905.7734375} {"train_loss": -6.930015563964844, "global_step": 165606, "epoch": 3943} {"train_loss": -6.940118312835693, "global_step": 165607, "epoch": 3943} {"train_loss": -6.896300315856934, "global_step": 165608, "epoch": 3943} {"train_loss": -6.975833892822266, "global_step": 165609, "epoch": 3943} {"train_loss": -6.972535133361816, "global_step": 165610, "epoch": 3943} {"train_loss": -7.126129150390625, "global_step": 165611, "epoch": 3943} {"train_loss": -7.053799629211426, "global_step": 165612, "epoch": 3943} {"train_loss": -6.978032112121582, "global_step": 165613, "epoch": 3943} {"train_loss": -7.030983924865723, "global_step": 165614, "epoch": 3943} {"train_loss": -7.096269607543945, "global_step": 165615, "epoch": 3943} {"train_loss": -7.001434326171875, "global_step": 165616, "epoch": 3943} {"train_loss": -6.953536033630371, "global_step": 165617, "epoch": 3943} {"train_loss": -6.9649457931518555, "global_step": 165618, "epoch": 3943} {"train_loss": -6.995792388916016, "global_step": 165619, "epoch": 3943} {"train_loss": -7.009833335876465, "global_step": 165620, "epoch": 3943} {"train_loss": -6.847622394561768, "global_step": 165621, "epoch": 3943} {"train_loss": -6.969281196594238, "global_step": 165622, "epoch": 3943} {"train_loss": -7.12455940246582, "global_step": 165623, "epoch": 3943} {"train_loss": -7.062513828277588, "global_step": 165624, "epoch": 3943} {"train_loss": -6.996959209442139, "global_step": 165625, "epoch": 3943} {"train_loss": -6.990650177001953, "global_step": 165626, "epoch": 3943} {"train_loss": -7.027948379516602, "global_step": 165627, "epoch": 3943} {"train_loss": -6.932497978210449, "global_step": 165628, "epoch": 3943} {"train_loss": -7.001712799072266, "global_step": 165629, "epoch": 3943} {"train_loss": -6.95939826965332, "global_step": 165630, "epoch": 3943} {"train_loss": -7.01898193359375, "global_step": 165631, "epoch": 3943} {"train_loss": -7.024188041687012, "global_step": 165632, "epoch": 3943} {"train_loss": -7.079273223876953, "global_step": 165633, "epoch": 3943} {"train_loss": -6.987179279327393, "global_step": 165634, "epoch": 3943} {"train_loss": -7.0225982666015625, "global_step": 165635, "epoch": 3943} {"train_loss": -7.035598278045654, "global_step": 165636, "epoch": 3943} {"train_loss": -6.913266181945801, "global_step": 165637, "epoch": 3943} {"train_loss": -6.788421630859375, "global_step": 165638, "epoch": 3943} {"train_loss": -6.930845737457275, "global_step": 165639, "epoch": 3943} {"train_loss": -7.09519100189209, "global_step": 165640, "epoch": 3943} {"train_loss": -6.947148323059082, "global_step": 165641, "epoch": 3943} {"train_loss": -6.9558258056640625, "global_step": 165642, "epoch": 3943} {"train_loss": -6.982949256896973, "global_step": 165643, "epoch": 3943} {"train_loss": -6.939108848571777, "global_step": 165644, "epoch": 3943} {"train_loss": -6.967016220092773, "global_step": 165645, "epoch": 3943} {"train_loss": -6.942609786987305, "global_step": 165646, "epoch": 3943} {"train_loss": -6.982710815611339, "global_step": 165647, "epoch": 3943, "val_loss": 79690.2265625} {"train_loss": -7.0111188888549805, "global_step": 165648, "epoch": 3944} {"train_loss": -7.009188652038574, "global_step": 165649, "epoch": 3944} {"train_loss": -6.930662155151367, "global_step": 165650, "epoch": 3944} {"train_loss": -7.157046794891357, "global_step": 165651, "epoch": 3944} {"train_loss": -7.0510573387146, "global_step": 165652, "epoch": 3944} {"train_loss": -7.023163795471191, "global_step": 165653, "epoch": 3944} {"train_loss": -7.016680717468262, "global_step": 165654, "epoch": 3944} {"train_loss": -6.995599746704102, "global_step": 165655, "epoch": 3944} {"train_loss": -6.994162559509277, "global_step": 165656, "epoch": 3944} {"train_loss": -6.963565826416016, "global_step": 165657, "epoch": 3944} {"train_loss": -7.107495307922363, "global_step": 165658, "epoch": 3944} {"train_loss": -6.973054885864258, "global_step": 165659, "epoch": 3944} {"train_loss": -6.9040446281433105, "global_step": 165660, "epoch": 3944} {"train_loss": -6.97783088684082, "global_step": 165661, "epoch": 3944} {"train_loss": -6.972859859466553, "global_step": 165662, "epoch": 3944} {"train_loss": -6.905263423919678, "global_step": 165663, "epoch": 3944} {"train_loss": -6.850982666015625, "global_step": 165664, "epoch": 3944} {"train_loss": -6.765921115875244, "global_step": 165665, "epoch": 3944} {"train_loss": -6.929691314697266, "global_step": 165666, "epoch": 3944} {"train_loss": -6.912898063659668, "global_step": 165667, "epoch": 3944} {"train_loss": -6.9629974365234375, "global_step": 165668, "epoch": 3944} {"train_loss": -7.029370307922363, "global_step": 165669, "epoch": 3944} {"train_loss": -7.041678428649902, "global_step": 165670, "epoch": 3944} {"train_loss": -6.938352584838867, "global_step": 165671, "epoch": 3944} {"train_loss": -7.012307643890381, "global_step": 165672, "epoch": 3944} {"train_loss": -6.894735336303711, "global_step": 165673, "epoch": 3944} {"train_loss": -6.976311683654785, "global_step": 165674, "epoch": 3944} {"train_loss": -6.932221412658691, "global_step": 165675, "epoch": 3944} {"train_loss": -6.901366710662842, "global_step": 165676, "epoch": 3944} {"train_loss": -6.836724281311035, "global_step": 165677, "epoch": 3944} {"train_loss": -6.8395538330078125, "global_step": 165678, "epoch": 3944} {"train_loss": -7.0614118576049805, "global_step": 165679, "epoch": 3944} {"train_loss": -6.9776530265808105, "global_step": 165680, "epoch": 3944} {"train_loss": -6.973898887634277, "global_step": 165681, "epoch": 3944} {"train_loss": -6.935506820678711, "global_step": 165682, "epoch": 3944} {"train_loss": -6.945392608642578, "global_step": 165683, "epoch": 3944} {"train_loss": -6.978310585021973, "global_step": 165684, "epoch": 3944} {"train_loss": -7.103028297424316, "global_step": 165685, "epoch": 3944} {"train_loss": -7.105646133422852, "global_step": 165686, "epoch": 3944} {"train_loss": -6.963942050933838, "global_step": 165687, "epoch": 3944} {"train_loss": -7.016982078552246, "global_step": 165688, "epoch": 3944} {"train_loss": -6.973107701256161, "global_step": 165689, "epoch": 3944, "val_loss": 79615.578125} {"train_loss": -6.970426082611084, "global_step": 165690, "epoch": 3945} {"train_loss": -6.948263168334961, "global_step": 165691, "epoch": 3945} {"train_loss": -7.038211345672607, "global_step": 165692, "epoch": 3945} {"train_loss": -6.971811294555664, "global_step": 165693, "epoch": 3945} {"train_loss": -7.083742141723633, "global_step": 165694, "epoch": 3945} {"train_loss": -6.925926685333252, "global_step": 165695, "epoch": 3945} {"train_loss": -7.070769309997559, "global_step": 165696, "epoch": 3945} {"train_loss": -7.010085582733154, "global_step": 165697, "epoch": 3945} {"train_loss": -6.878835201263428, "global_step": 165698, "epoch": 3945} {"train_loss": -7.13868522644043, "global_step": 165699, "epoch": 3945} {"train_loss": -6.922798156738281, "global_step": 165700, "epoch": 3945} {"train_loss": -7.083539009094238, "global_step": 165701, "epoch": 3945} {"train_loss": -6.9309234619140625, "global_step": 165702, "epoch": 3945} {"train_loss": -6.934803485870361, "global_step": 165703, "epoch": 3945} {"train_loss": -7.0867791175842285, "global_step": 165704, "epoch": 3945} {"train_loss": -6.97656774520874, "global_step": 165705, "epoch": 3945} {"train_loss": -6.973283767700195, "global_step": 165706, "epoch": 3945} {"train_loss": -7.067419052124023, "global_step": 165707, "epoch": 3945} {"train_loss": -6.945882320404053, "global_step": 165708, "epoch": 3945} {"train_loss": -7.073709487915039, "global_step": 165709, "epoch": 3945} {"train_loss": -6.988546848297119, "global_step": 165710, "epoch": 3945} {"train_loss": -7.0624799728393555, "global_step": 165711, "epoch": 3945} {"train_loss": -6.948045253753662, "global_step": 165712, "epoch": 3945} {"train_loss": -6.982714653015137, "global_step": 165713, "epoch": 3945} {"train_loss": -7.008030891418457, "global_step": 165714, "epoch": 3945} {"train_loss": -7.049066543579102, "global_step": 165715, "epoch": 3945} {"train_loss": -7.03939151763916, "global_step": 165716, "epoch": 3945} {"train_loss": -7.0572285652160645, "global_step": 165717, "epoch": 3945} {"train_loss": -6.955117702484131, "global_step": 165718, "epoch": 3945} {"train_loss": -6.991765022277832, "global_step": 165719, "epoch": 3945} {"train_loss": -7.0626220703125, "global_step": 165720, "epoch": 3945} {"train_loss": -6.994923114776611, "global_step": 165721, "epoch": 3945} {"train_loss": -6.965985298156738, "global_step": 165722, "epoch": 3945} {"train_loss": -7.05502462387085, "global_step": 165723, "epoch": 3945} {"train_loss": -6.975869655609131, "global_step": 165724, "epoch": 3945} {"train_loss": -6.986934661865234, "global_step": 165725, "epoch": 3945} {"train_loss": -6.840114593505859, "global_step": 165726, "epoch": 3945} {"train_loss": -7.054733753204346, "global_step": 165727, "epoch": 3945} {"train_loss": -6.944161415100098, "global_step": 165728, "epoch": 3945} {"train_loss": -7.067840576171875, "global_step": 165729, "epoch": 3945} {"train_loss": -7.003199577331543, "global_step": 165730, "epoch": 3945} {"train_loss": -6.99939006850833, "global_step": 165731, "epoch": 3945, "val_loss": 79663.8671875} {"train_loss": -6.930218696594238, "global_step": 165732, "epoch": 3946} {"train_loss": -6.918307304382324, "global_step": 165733, "epoch": 3946} {"train_loss": -7.0473408699035645, "global_step": 165734, "epoch": 3946} {"train_loss": -7.037020683288574, "global_step": 165735, "epoch": 3946} {"train_loss": -7.09664249420166, "global_step": 165736, "epoch": 3946} {"train_loss": -7.0139007568359375, "global_step": 165737, "epoch": 3946} {"train_loss": -6.94793176651001, "global_step": 165738, "epoch": 3946} {"train_loss": -7.024797439575195, "global_step": 165739, "epoch": 3946} {"train_loss": -6.980597972869873, "global_step": 165740, "epoch": 3946} {"train_loss": -7.12221097946167, "global_step": 165741, "epoch": 3946} {"train_loss": -7.014187812805176, "global_step": 165742, "epoch": 3946} {"train_loss": -6.984378337860107, "global_step": 165743, "epoch": 3946} {"train_loss": -6.973423957824707, "global_step": 165744, "epoch": 3946} {"train_loss": -6.999666690826416, "global_step": 165745, "epoch": 3946} {"train_loss": -7.079517364501953, "global_step": 165746, "epoch": 3946} {"train_loss": -7.05637788772583, "global_step": 165747, "epoch": 3946} {"train_loss": -7.082416534423828, "global_step": 165748, "epoch": 3946} {"train_loss": -7.060779571533203, "global_step": 165749, "epoch": 3946} {"train_loss": -7.144543170928955, "global_step": 165750, "epoch": 3946} {"train_loss": -7.14007568359375, "global_step": 165751, "epoch": 3946} {"train_loss": -7.135125637054443, "global_step": 165752, "epoch": 3946} {"train_loss": -7.037322044372559, "global_step": 165753, "epoch": 3946} {"train_loss": -6.965298175811768, "global_step": 165754, "epoch": 3946} {"train_loss": -7.016367435455322, "global_step": 165755, "epoch": 3946} {"train_loss": -7.027543544769287, "global_step": 165756, "epoch": 3946} {"train_loss": -7.104667663574219, "global_step": 165757, "epoch": 3946} {"train_loss": -6.971846580505371, "global_step": 165758, "epoch": 3946} {"train_loss": -7.0044989585876465, "global_step": 165759, "epoch": 3946} {"train_loss": -7.037809371948242, "global_step": 165760, "epoch": 3946} {"train_loss": -6.907484531402588, "global_step": 165761, "epoch": 3946} {"train_loss": -6.84531307220459, "global_step": 165762, "epoch": 3946} {"train_loss": -6.967507362365723, "global_step": 165763, "epoch": 3946} {"train_loss": -7.004581451416016, "global_step": 165764, "epoch": 3946} {"train_loss": -6.929588794708252, "global_step": 165765, "epoch": 3946} {"train_loss": -7.018742561340332, "global_step": 165766, "epoch": 3946} {"train_loss": -6.917757034301758, "global_step": 165767, "epoch": 3946} {"train_loss": -7.003719329833984, "global_step": 165768, "epoch": 3946} {"train_loss": -7.014349937438965, "global_step": 165769, "epoch": 3946} {"train_loss": -6.997812271118164, "global_step": 165770, "epoch": 3946} {"train_loss": -6.933961868286133, "global_step": 165771, "epoch": 3946} {"train_loss": -7.077746391296387, "global_step": 165772, "epoch": 3946} {"train_loss": -7.010978948502314, "global_step": 165773, "epoch": 3946, "val_loss": 79573.984375} {"train_loss": -6.99315071105957, "global_step": 165774, "epoch": 3947} {"train_loss": -6.999042510986328, "global_step": 165775, "epoch": 3947} {"train_loss": -7.002004623413086, "global_step": 165776, "epoch": 3947} {"train_loss": -7.081897735595703, "global_step": 165777, "epoch": 3947} {"train_loss": -7.047547340393066, "global_step": 165778, "epoch": 3947} {"train_loss": -6.950439929962158, "global_step": 165779, "epoch": 3947} {"train_loss": -7.091598033905029, "global_step": 165780, "epoch": 3947} {"train_loss": -7.043451309204102, "global_step": 165781, "epoch": 3947} {"train_loss": -7.003777027130127, "global_step": 165782, "epoch": 3947} {"train_loss": -7.046492576599121, "global_step": 165783, "epoch": 3947} {"train_loss": -6.971468925476074, "global_step": 165784, "epoch": 3947} {"train_loss": -7.150707244873047, "global_step": 165785, "epoch": 3947} {"train_loss": -7.066258430480957, "global_step": 165786, "epoch": 3947} {"train_loss": -7.095423221588135, "global_step": 165787, "epoch": 3947} {"train_loss": -7.009010314941406, "global_step": 165788, "epoch": 3947} {"train_loss": -7.079493522644043, "global_step": 165789, "epoch": 3947} {"train_loss": -7.005190372467041, "global_step": 165790, "epoch": 3947} {"train_loss": -7.074872970581055, "global_step": 165791, "epoch": 3947} {"train_loss": -7.078283786773682, "global_step": 165792, "epoch": 3947} {"train_loss": -6.996404647827148, "global_step": 165793, "epoch": 3947} {"train_loss": -6.967155456542969, "global_step": 165794, "epoch": 3947} {"train_loss": -7.011922836303711, "global_step": 165795, "epoch": 3947} {"train_loss": -6.944581508636475, "global_step": 165796, "epoch": 3947} {"train_loss": -6.924300670623779, "global_step": 165797, "epoch": 3947} {"train_loss": -6.898902416229248, "global_step": 165798, "epoch": 3947} {"train_loss": -6.92781925201416, "global_step": 165799, "epoch": 3947} {"train_loss": -7.041708946228027, "global_step": 165800, "epoch": 3947} {"train_loss": -6.913488388061523, "global_step": 165801, "epoch": 3947} {"train_loss": -7.0201921463012695, "global_step": 165802, "epoch": 3947} {"train_loss": -6.983033180236816, "global_step": 165803, "epoch": 3947} {"train_loss": -7.007059574127197, "global_step": 165804, "epoch": 3947} {"train_loss": -6.924755096435547, "global_step": 165805, "epoch": 3947} {"train_loss": -6.816102027893066, "global_step": 165806, "epoch": 3947} {"train_loss": -6.9268927574157715, "global_step": 165807, "epoch": 3947} {"train_loss": -7.005270481109619, "global_step": 165808, "epoch": 3947} {"train_loss": -7.0478386878967285, "global_step": 165809, "epoch": 3947} {"train_loss": -6.994274139404297, "global_step": 165810, "epoch": 3947} {"train_loss": -6.788682460784912, "global_step": 165811, "epoch": 3947} {"train_loss": -7.019428253173828, "global_step": 165812, "epoch": 3947} {"train_loss": -6.815016746520996, "global_step": 165813, "epoch": 3947} {"train_loss": -6.957614898681641, "global_step": 165814, "epoch": 3947} {"train_loss": -6.992523602076939, "global_step": 165815, "epoch": 3947, "val_loss": 79666.234375} {"train_loss": -6.8809638023376465, "global_step": 165816, "epoch": 3948} {"train_loss": -6.9751434326171875, "global_step": 165817, "epoch": 3948} {"train_loss": -6.953969955444336, "global_step": 165818, "epoch": 3948} {"train_loss": -7.006565093994141, "global_step": 165819, "epoch": 3948} {"train_loss": -6.909277439117432, "global_step": 165820, "epoch": 3948} {"train_loss": -7.004349708557129, "global_step": 165821, "epoch": 3948} {"train_loss": -6.903545379638672, "global_step": 165822, "epoch": 3948} {"train_loss": -7.056171417236328, "global_step": 165823, "epoch": 3948} {"train_loss": -6.9724440574646, "global_step": 165824, "epoch": 3948} {"train_loss": -6.923856258392334, "global_step": 165825, "epoch": 3948} {"train_loss": -7.0370001792907715, "global_step": 165826, "epoch": 3948} {"train_loss": -6.849676609039307, "global_step": 165827, "epoch": 3948} {"train_loss": -6.968645095825195, "global_step": 165828, "epoch": 3948} {"train_loss": -6.93036413192749, "global_step": 165829, "epoch": 3948} {"train_loss": -7.009119033813477, "global_step": 165830, "epoch": 3948} {"train_loss": -6.936281681060791, "global_step": 165831, "epoch": 3948} {"train_loss": -7.009222030639648, "global_step": 165832, "epoch": 3948} {"train_loss": -7.049623012542725, "global_step": 165833, "epoch": 3948} {"train_loss": -6.876522541046143, "global_step": 165834, "epoch": 3948} {"train_loss": -6.912849426269531, "global_step": 165835, "epoch": 3948} {"train_loss": -6.85511589050293, "global_step": 165836, "epoch": 3948} {"train_loss": -7.014344692230225, "global_step": 165837, "epoch": 3948} {"train_loss": -7.089596271514893, "global_step": 165838, "epoch": 3948} {"train_loss": -6.983839511871338, "global_step": 165839, "epoch": 3948} {"train_loss": -7.084778785705566, "global_step": 165840, "epoch": 3948} {"train_loss": -7.01478385925293, "global_step": 165841, "epoch": 3948} {"train_loss": -7.050702095031738, "global_step": 165842, "epoch": 3948} {"train_loss": -6.935260772705078, "global_step": 165843, "epoch": 3948} {"train_loss": -6.835668563842773, "global_step": 165844, "epoch": 3948} {"train_loss": -6.993679046630859, "global_step": 165845, "epoch": 3948} {"train_loss": -7.1601948738098145, "global_step": 165846, "epoch": 3948} {"train_loss": -6.990421772003174, "global_step": 165847, "epoch": 3948} {"train_loss": -6.985570907592773, "global_step": 165848, "epoch": 3948} {"train_loss": -7.104122161865234, "global_step": 165849, "epoch": 3948} {"train_loss": -7.0774922370910645, "global_step": 165850, "epoch": 3948} {"train_loss": -6.999939918518066, "global_step": 165851, "epoch": 3948} {"train_loss": -6.899515628814697, "global_step": 165852, "epoch": 3948} {"train_loss": -6.9406609535217285, "global_step": 165853, "epoch": 3948} {"train_loss": -7.115827560424805, "global_step": 165854, "epoch": 3948} {"train_loss": -7.032426834106445, "global_step": 165855, "epoch": 3948} {"train_loss": -7.0887908935546875, "global_step": 165856, "epoch": 3948} {"train_loss": -6.987528483072917, "global_step": 165857, "epoch": 3948, "val_loss": 79524.6015625} {"train_loss": -7.0180206298828125, "global_step": 165858, "epoch": 3949} {"train_loss": -7.002219200134277, "global_step": 165859, "epoch": 3949} {"train_loss": -7.021920204162598, "global_step": 165860, "epoch": 3949} {"train_loss": -7.0056071281433105, "global_step": 165861, "epoch": 3949} {"train_loss": -6.978688716888428, "global_step": 165862, "epoch": 3949} {"train_loss": -7.111123085021973, "global_step": 165863, "epoch": 3949} {"train_loss": -6.9196624755859375, "global_step": 165864, "epoch": 3949} {"train_loss": -6.978520393371582, "global_step": 165865, "epoch": 3949} {"train_loss": -6.965228080749512, "global_step": 165866, "epoch": 3949} {"train_loss": -6.9890851974487305, "global_step": 165867, "epoch": 3949} {"train_loss": -6.890491485595703, "global_step": 165868, "epoch": 3949} {"train_loss": -6.978891849517822, "global_step": 165869, "epoch": 3949} {"train_loss": -6.9363837242126465, "global_step": 165870, "epoch": 3949} {"train_loss": -6.9853034019470215, "global_step": 165871, "epoch": 3949} {"train_loss": -6.949556827545166, "global_step": 165872, "epoch": 3949} {"train_loss": -7.0058159828186035, "global_step": 165873, "epoch": 3949} {"train_loss": -6.858892917633057, "global_step": 165874, "epoch": 3949} {"train_loss": -6.963318824768066, "global_step": 165875, "epoch": 3949} {"train_loss": -6.8486762046813965, "global_step": 165876, "epoch": 3949} {"train_loss": -6.9520416259765625, "global_step": 165877, "epoch": 3949} {"train_loss": -7.047401428222656, "global_step": 165878, "epoch": 3949} {"train_loss": -6.885388374328613, "global_step": 165879, "epoch": 3949} {"train_loss": -6.890011310577393, "global_step": 165880, "epoch": 3949} {"train_loss": -6.896478652954102, "global_step": 165881, "epoch": 3949} {"train_loss": -7.0520339012146, "global_step": 165882, "epoch": 3949} {"train_loss": -6.9425129890441895, "global_step": 165883, "epoch": 3949} {"train_loss": -6.822724342346191, "global_step": 165884, "epoch": 3949} {"train_loss": -6.772970199584961, "global_step": 165885, "epoch": 3949} {"train_loss": -6.980469226837158, "global_step": 165886, "epoch": 3949} {"train_loss": -6.9785966873168945, "global_step": 165887, "epoch": 3949} {"train_loss": -6.87994909286499, "global_step": 165888, "epoch": 3949} {"train_loss": -6.921821594238281, "global_step": 165889, "epoch": 3949} {"train_loss": -6.87166690826416, "global_step": 165890, "epoch": 3949} {"train_loss": -6.956121444702148, "global_step": 165891, "epoch": 3949} {"train_loss": -6.874654769897461, "global_step": 165892, "epoch": 3949} {"train_loss": -6.979942321777344, "global_step": 165893, "epoch": 3949} {"train_loss": -6.992692470550537, "global_step": 165894, "epoch": 3949} {"train_loss": -7.00107479095459, "global_step": 165895, "epoch": 3949} {"train_loss": -7.008493423461914, "global_step": 165896, "epoch": 3949} {"train_loss": -7.02138090133667, "global_step": 165897, "epoch": 3949} {"train_loss": -7.1310930252075195, "global_step": 165898, "epoch": 3949} {"train_loss": -6.960145007996332, "global_step": 165899, "epoch": 3949, "val_loss": 79850.984375} {"train_loss": -7.034087181091309, "global_step": 165900, "epoch": 3950} {"train_loss": -7.040949821472168, "global_step": 165901, "epoch": 3950} {"train_loss": -7.111678600311279, "global_step": 165902, "epoch": 3950} {"train_loss": -7.098651885986328, "global_step": 165903, "epoch": 3950} {"train_loss": -7.074591636657715, "global_step": 165904, "epoch": 3950} {"train_loss": -7.041419982910156, "global_step": 165905, "epoch": 3950} {"train_loss": -6.923792362213135, "global_step": 165906, "epoch": 3950} {"train_loss": -7.109715461730957, "global_step": 165907, "epoch": 3950} {"train_loss": -7.10772705078125, "global_step": 165908, "epoch": 3950} {"train_loss": -7.114742279052734, "global_step": 165909, "epoch": 3950} {"train_loss": -6.994112491607666, "global_step": 165910, "epoch": 3950} {"train_loss": -7.0684003829956055, "global_step": 165911, "epoch": 3950} {"train_loss": -6.990257263183594, "global_step": 165912, "epoch": 3950} {"train_loss": -6.97236967086792, "global_step": 165913, "epoch": 3950} {"train_loss": -7.04345703125, "global_step": 165914, "epoch": 3950} {"train_loss": -6.994471549987793, "global_step": 165915, "epoch": 3950} {"train_loss": -7.067952632904053, "global_step": 165916, "epoch": 3950} {"train_loss": -6.966983795166016, "global_step": 165917, "epoch": 3950} {"train_loss": -7.045895576477051, "global_step": 165918, "epoch": 3950} {"train_loss": -7.012744903564453, "global_step": 165919, "epoch": 3950} {"train_loss": -6.997095108032227, "global_step": 165920, "epoch": 3950} {"train_loss": -7.115781784057617, "global_step": 165921, "epoch": 3950} {"train_loss": -7.029650688171387, "global_step": 165922, "epoch": 3950} {"train_loss": -7.089480400085449, "global_step": 165923, "epoch": 3950} {"train_loss": -7.076993465423584, "global_step": 165924, "epoch": 3950} {"train_loss": -6.997495651245117, "global_step": 165925, "epoch": 3950} {"train_loss": -6.9773268699646, "global_step": 165926, "epoch": 3950} {"train_loss": -7.051116943359375, "global_step": 165927, "epoch": 3950} {"train_loss": -7.050842761993408, "global_step": 165928, "epoch": 3950} {"train_loss": -7.155888557434082, "global_step": 165929, "epoch": 3950} {"train_loss": -7.094837188720703, "global_step": 165930, "epoch": 3950} {"train_loss": -6.877018928527832, "global_step": 165931, "epoch": 3950} {"train_loss": -6.976071357727051, "global_step": 165932, "epoch": 3950} {"train_loss": -7.043519020080566, "global_step": 165933, "epoch": 3950} {"train_loss": -7.163743019104004, "global_step": 165934, "epoch": 3950} {"train_loss": -7.119937419891357, "global_step": 165935, "epoch": 3950} {"train_loss": -6.980621337890625, "global_step": 165936, "epoch": 3950} {"train_loss": -7.1255106925964355, "global_step": 165937, "epoch": 3950} {"train_loss": -7.089298248291016, "global_step": 165938, "epoch": 3950} {"train_loss": -7.056464672088623, "global_step": 165939, "epoch": 3950} {"train_loss": -6.8496246337890625, "global_step": 165940, "epoch": 3950} {"train_loss": -7.041997648420788, "global_step": 165941, "epoch": 3950, "train/sim_max_reward_0": 0.6633007801094285, "train/sim_max_reward_1": 0.914027831262128, "train/sim_max_reward_2": 0.4252743029357105, "train/sim_max_reward_3": 0.14882883122479107, "train/sim_max_reward_4": 0.984294390369888, "train/sim_max_reward_5": 0.60238354900669, "test/sim_max_reward_4500000": 0.9788230252529256, "test/sim_max_reward_4500001": 0.9505568328855517, "test/sim_max_reward_4500002": 0.9749424310907332, "test/sim_max_reward_4500003": 0.49585682642773726, "test/sim_max_reward_4500004": 0.14410793590648663, "test/sim_max_reward_4500005": 0.38528726782216044, "test/sim_max_reward_4500006": 0.9384885533071564, "test/sim_max_reward_4500007": 0.9984774921293613, "test/sim_max_reward_4500008": 0.9223066732696321, "test/sim_max_reward_4500009": 0.0532816262417305, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9551030732173466, "test/sim_max_reward_4500012": 0.7432702702088076, "test/sim_max_reward_4500013": 0.003886635414656073, "test/sim_max_reward_4500014": 0.6264460901678269, "test/sim_max_reward_4500015": 0.9821952560388554, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.06188906480840297, "test/sim_max_reward_4500018": 0.5147313075589276, "test/sim_max_reward_4500019": 0.9903301533681551, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8945901852707103, "test/sim_max_reward_4500022": 0.9117203386524191, "test/sim_max_reward_4500023": 1.0, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9156248492727743, "test/sim_max_reward_4500026": 1.0, "test/sim_max_reward_4500027": 0.9697012987869662, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.09340789287013174, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9854291433820416, "test/sim_max_reward_4500034": 0.9795436662615153, "test/sim_max_reward_4500035": 0.8884633446618113, "test/sim_max_reward_4500036": 0.4744875637246707, "test/sim_max_reward_4500037": 0.9046307539086931, "test/sim_max_reward_4500038": 0.3261441770821716, "test/sim_max_reward_4500039": 1.0, "test/sim_max_reward_4500040": 0.951390587422256, "test/sim_max_reward_4500041": 0.9529646973363401, "test/sim_max_reward_4500042": 0.02204939404417752, "test/sim_max_reward_4500043": 0.6188128255458346, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9518984342460964, "test/sim_max_reward_4500046": 0.23272769599540719, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9585330830227812, "test/sim_max_reward_4500049": 0.8349575396081054, "train/mean_score": 0.6230182808181061, "test/mean_score": 0.5967857818960155, "val_loss": 79602.4609375} {"train_loss": -7.016942977905273, "global_step": 165942, "epoch": 3951} {"train_loss": -6.946043968200684, "global_step": 165943, "epoch": 3951} {"train_loss": -7.044192314147949, "global_step": 165944, "epoch": 3951} {"train_loss": -7.09906005859375, "global_step": 165945, "epoch": 3951} {"train_loss": -7.01185417175293, "global_step": 165946, "epoch": 3951} {"train_loss": -6.9309492111206055, "global_step": 165947, "epoch": 3951} {"train_loss": -7.027569770812988, "global_step": 165948, "epoch": 3951} {"train_loss": -6.965570449829102, "global_step": 165949, "epoch": 3951} {"train_loss": -6.935148239135742, "global_step": 165950, "epoch": 3951} {"train_loss": -7.129034042358398, "global_step": 165951, "epoch": 3951} {"train_loss": -6.979797840118408, "global_step": 165952, "epoch": 3951} {"train_loss": -6.94658088684082, "global_step": 165953, "epoch": 3951} {"train_loss": -7.01546573638916, "global_step": 165954, "epoch": 3951} {"train_loss": -6.9144744873046875, "global_step": 165955, "epoch": 3951} {"train_loss": -6.955016613006592, "global_step": 165956, "epoch": 3951} {"train_loss": -6.94682502746582, "global_step": 165957, "epoch": 3951} {"train_loss": -6.974721908569336, "global_step": 165958, "epoch": 3951} {"train_loss": -7.039289474487305, "global_step": 165959, "epoch": 3951} {"train_loss": -6.906792640686035, "global_step": 165960, "epoch": 3951} {"train_loss": -6.998876094818115, "global_step": 165961, "epoch": 3951} {"train_loss": -6.9294753074646, "global_step": 165962, "epoch": 3951} {"train_loss": -6.974320411682129, "global_step": 165963, "epoch": 3951} {"train_loss": -7.155277729034424, "global_step": 165964, "epoch": 3951} {"train_loss": -7.05419397354126, "global_step": 165965, "epoch": 3951} {"train_loss": -7.043863296508789, "global_step": 165966, "epoch": 3951} {"train_loss": -7.0462541580200195, "global_step": 165967, "epoch": 3951} {"train_loss": -7.031976699829102, "global_step": 165968, "epoch": 3951} {"train_loss": -7.097189903259277, "global_step": 165969, "epoch": 3951} {"train_loss": -6.982730865478516, "global_step": 165970, "epoch": 3951} {"train_loss": -7.086112022399902, "global_step": 165971, "epoch": 3951} {"train_loss": -7.110655307769775, "global_step": 165972, "epoch": 3951} {"train_loss": -6.937650680541992, "global_step": 165973, "epoch": 3951} {"train_loss": -7.021222114562988, "global_step": 165974, "epoch": 3951} {"train_loss": -7.008753776550293, "global_step": 165975, "epoch": 3951} {"train_loss": -6.96964168548584, "global_step": 165976, "epoch": 3951} {"train_loss": -7.100076675415039, "global_step": 165977, "epoch": 3951} {"train_loss": -6.933088302612305, "global_step": 165978, "epoch": 3951} {"train_loss": -6.959648609161377, "global_step": 165979, "epoch": 3951} {"train_loss": -7.12161111831665, "global_step": 165980, "epoch": 3951} {"train_loss": -6.906580924987793, "global_step": 165981, "epoch": 3951} {"train_loss": -7.200438976287842, "global_step": 165982, "epoch": 3951} {"train_loss": -7.008552755628314, "global_step": 165983, "epoch": 3951, "val_loss": 80049.1796875} {"train_loss": -6.848605632781982, "global_step": 165984, "epoch": 3952} {"train_loss": -7.037777900695801, "global_step": 165985, "epoch": 3952} {"train_loss": -7.07568883895874, "global_step": 165986, "epoch": 3952} {"train_loss": -6.989773750305176, "global_step": 165987, "epoch": 3952} {"train_loss": -6.9604997634887695, "global_step": 165988, "epoch": 3952} {"train_loss": -6.959120750427246, "global_step": 165989, "epoch": 3952} {"train_loss": -7.010171890258789, "global_step": 165990, "epoch": 3952} {"train_loss": -7.021567344665527, "global_step": 165991, "epoch": 3952} {"train_loss": -6.9290900230407715, "global_step": 165992, "epoch": 3952} {"train_loss": -6.906294345855713, "global_step": 165993, "epoch": 3952} {"train_loss": -6.8699951171875, "global_step": 165994, "epoch": 3952} {"train_loss": -6.919971466064453, "global_step": 165995, "epoch": 3952} {"train_loss": -6.979681968688965, "global_step": 165996, "epoch": 3952} {"train_loss": -7.082054138183594, "global_step": 165997, "epoch": 3952} {"train_loss": -7.004494667053223, "global_step": 165998, "epoch": 3952} {"train_loss": -7.006906509399414, "global_step": 165999, "epoch": 3952} {"train_loss": -7.08027458190918, "global_step": 166000, "epoch": 3952} {"train_loss": -6.964447975158691, "global_step": 166001, "epoch": 3952} {"train_loss": -7.044001579284668, "global_step": 166002, "epoch": 3952} {"train_loss": -7.052116394042969, "global_step": 166003, "epoch": 3952} {"train_loss": -6.98500394821167, "global_step": 166004, "epoch": 3952} {"train_loss": -7.020731449127197, "global_step": 166005, "epoch": 3952} {"train_loss": -6.9815568923950195, "global_step": 166006, "epoch": 3952} {"train_loss": -6.947587966918945, "global_step": 166007, "epoch": 3952} {"train_loss": -6.984210968017578, "global_step": 166008, "epoch": 3952} {"train_loss": -7.022067546844482, "global_step": 166009, "epoch": 3952} {"train_loss": -7.153307914733887, "global_step": 166010, "epoch": 3952} {"train_loss": -6.968929767608643, "global_step": 166011, "epoch": 3952} {"train_loss": -7.060980796813965, "global_step": 166012, "epoch": 3952} {"train_loss": -7.041502952575684, "global_step": 166013, "epoch": 3952} {"train_loss": -6.853397369384766, "global_step": 166014, "epoch": 3952} {"train_loss": -7.014059066772461, "global_step": 166015, "epoch": 3952} {"train_loss": -6.970868110656738, "global_step": 166016, "epoch": 3952} {"train_loss": -6.829211235046387, "global_step": 166017, "epoch": 3952} {"train_loss": -6.981050491333008, "global_step": 166018, "epoch": 3952} {"train_loss": -6.969234466552734, "global_step": 166019, "epoch": 3952} {"train_loss": -6.883139610290527, "global_step": 166020, "epoch": 3952} {"train_loss": -7.019026279449463, "global_step": 166021, "epoch": 3952} {"train_loss": -7.060539722442627, "global_step": 166022, "epoch": 3952} {"train_loss": -7.030317306518555, "global_step": 166023, "epoch": 3952} {"train_loss": -7.024219036102295, "global_step": 166024, "epoch": 3952} {"train_loss": -6.991014616830008, "global_step": 166025, "epoch": 3952, "val_loss": 79510.0859375} {"train_loss": -7.0705084800720215, "global_step": 166026, "epoch": 3953} {"train_loss": -7.018772602081299, "global_step": 166027, "epoch": 3953} {"train_loss": -7.0868144035339355, "global_step": 166028, "epoch": 3953} {"train_loss": -6.916102409362793, "global_step": 166029, "epoch": 3953} {"train_loss": -6.980404376983643, "global_step": 166030, "epoch": 3953} {"train_loss": -7.101224422454834, "global_step": 166031, "epoch": 3953} {"train_loss": -6.954834938049316, "global_step": 166032, "epoch": 3953} {"train_loss": -6.9390764236450195, "global_step": 166033, "epoch": 3953} {"train_loss": -7.182468414306641, "global_step": 166034, "epoch": 3953} {"train_loss": -7.047911167144775, "global_step": 166035, "epoch": 3953} {"train_loss": -6.949540615081787, "global_step": 166036, "epoch": 3953} {"train_loss": -7.062283039093018, "global_step": 166037, "epoch": 3953} {"train_loss": -7.211651802062988, "global_step": 166038, "epoch": 3953} {"train_loss": -7.173183441162109, "global_step": 166039, "epoch": 3953} {"train_loss": -6.994268417358398, "global_step": 166040, "epoch": 3953} {"train_loss": -6.987555503845215, "global_step": 166041, "epoch": 3953} {"train_loss": -6.987637519836426, "global_step": 166042, "epoch": 3953} {"train_loss": -6.95841121673584, "global_step": 166043, "epoch": 3953} {"train_loss": -7.143118858337402, "global_step": 166044, "epoch": 3953} {"train_loss": -7.130496025085449, "global_step": 166045, "epoch": 3953} {"train_loss": -7.044645309448242, "global_step": 166046, "epoch": 3953} {"train_loss": -7.0388994216918945, "global_step": 166047, "epoch": 3953} {"train_loss": -6.9536824226379395, "global_step": 166048, "epoch": 3953} {"train_loss": -7.053226470947266, "global_step": 166049, "epoch": 3953} {"train_loss": -6.918346881866455, "global_step": 166050, "epoch": 3953} {"train_loss": -6.9850664138793945, "global_step": 166051, "epoch": 3953} {"train_loss": -7.0013017654418945, "global_step": 166052, "epoch": 3953} {"train_loss": -7.012595176696777, "global_step": 166053, "epoch": 3953} {"train_loss": -6.932346820831299, "global_step": 166054, "epoch": 3953} {"train_loss": -7.054468154907227, "global_step": 166055, "epoch": 3953} {"train_loss": -6.904771327972412, "global_step": 166056, "epoch": 3953} {"train_loss": -6.861833572387695, "global_step": 166057, "epoch": 3953} {"train_loss": -6.936228275299072, "global_step": 166058, "epoch": 3953} {"train_loss": -6.9080119132995605, "global_step": 166059, "epoch": 3953} {"train_loss": -7.036043167114258, "global_step": 166060, "epoch": 3953} {"train_loss": -6.971020698547363, "global_step": 166061, "epoch": 3953} {"train_loss": -7.030985355377197, "global_step": 166062, "epoch": 3953} {"train_loss": -7.0476484298706055, "global_step": 166063, "epoch": 3953} {"train_loss": -6.866785049438477, "global_step": 166064, "epoch": 3953} {"train_loss": -7.002693176269531, "global_step": 166065, "epoch": 3953} {"train_loss": -6.9730424880981445, "global_step": 166066, "epoch": 3953} {"train_loss": -7.011535474232265, "global_step": 166067, "epoch": 3953, "val_loss": 79588.046875} {"train_loss": -7.028902053833008, "global_step": 166068, "epoch": 3954} {"train_loss": -7.081303596496582, "global_step": 166069, "epoch": 3954} {"train_loss": -6.943778038024902, "global_step": 166070, "epoch": 3954} {"train_loss": -7.07357120513916, "global_step": 166071, "epoch": 3954} {"train_loss": -7.05062198638916, "global_step": 166072, "epoch": 3954} {"train_loss": -7.029651641845703, "global_step": 166073, "epoch": 3954} {"train_loss": -6.939684867858887, "global_step": 166074, "epoch": 3954} {"train_loss": -7.094179153442383, "global_step": 166075, "epoch": 3954} {"train_loss": -7.051224231719971, "global_step": 166076, "epoch": 3954} {"train_loss": -6.899932384490967, "global_step": 166077, "epoch": 3954} {"train_loss": -6.901416301727295, "global_step": 166078, "epoch": 3954} {"train_loss": -7.05096435546875, "global_step": 166079, "epoch": 3954} {"train_loss": -6.993349075317383, "global_step": 166080, "epoch": 3954} {"train_loss": -7.122478485107422, "global_step": 166081, "epoch": 3954} {"train_loss": -6.998526573181152, "global_step": 166082, "epoch": 3954} {"train_loss": -7.040278911590576, "global_step": 166083, "epoch": 3954} {"train_loss": -7.041769981384277, "global_step": 166084, "epoch": 3954} {"train_loss": -7.031064033508301, "global_step": 166085, "epoch": 3954} {"train_loss": -7.016051769256592, "global_step": 166086, "epoch": 3954} {"train_loss": -7.04124641418457, "global_step": 166087, "epoch": 3954} {"train_loss": -6.944200038909912, "global_step": 166088, "epoch": 3954} {"train_loss": -7.053288459777832, "global_step": 166089, "epoch": 3954} {"train_loss": -7.041447639465332, "global_step": 166090, "epoch": 3954} {"train_loss": -7.032517433166504, "global_step": 166091, "epoch": 3954} {"train_loss": -7.011231422424316, "global_step": 166092, "epoch": 3954} {"train_loss": -7.136110305786133, "global_step": 166093, "epoch": 3954} {"train_loss": -7.029488563537598, "global_step": 166094, "epoch": 3954} {"train_loss": -7.1043314933776855, "global_step": 166095, "epoch": 3954} {"train_loss": -7.145196914672852, "global_step": 166096, "epoch": 3954} {"train_loss": -7.043606281280518, "global_step": 166097, "epoch": 3954} {"train_loss": -7.114917755126953, "global_step": 166098, "epoch": 3954} {"train_loss": -6.982239723205566, "global_step": 166099, "epoch": 3954} {"train_loss": -6.898382186889648, "global_step": 166100, "epoch": 3954} {"train_loss": -7.008476734161377, "global_step": 166101, "epoch": 3954} {"train_loss": -7.13472843170166, "global_step": 166102, "epoch": 3954} {"train_loss": -6.939206600189209, "global_step": 166103, "epoch": 3954} {"train_loss": -7.069790363311768, "global_step": 166104, "epoch": 3954} {"train_loss": -7.003957271575928, "global_step": 166105, "epoch": 3954} {"train_loss": -6.996991157531738, "global_step": 166106, "epoch": 3954} {"train_loss": -7.028707504272461, "global_step": 166107, "epoch": 3954} {"train_loss": -7.095367431640625, "global_step": 166108, "epoch": 3954} {"train_loss": -7.031478416352045, "global_step": 166109, "epoch": 3954, "val_loss": 79425.2578125} {"train_loss": -7.045807838439941, "global_step": 166110, "epoch": 3955} {"train_loss": -6.938488006591797, "global_step": 166111, "epoch": 3955} {"train_loss": -7.019247055053711, "global_step": 166112, "epoch": 3955} {"train_loss": -7.132341384887695, "global_step": 166113, "epoch": 3955} {"train_loss": -7.06264066696167, "global_step": 166114, "epoch": 3955} {"train_loss": -6.942890167236328, "global_step": 166115, "epoch": 3955} {"train_loss": -6.910880088806152, "global_step": 166116, "epoch": 3955} {"train_loss": -6.998408317565918, "global_step": 166117, "epoch": 3955} {"train_loss": -7.016363620758057, "global_step": 166118, "epoch": 3955} {"train_loss": -7.027677536010742, "global_step": 166119, "epoch": 3955} {"train_loss": -6.928912162780762, "global_step": 166120, "epoch": 3955} {"train_loss": -6.980607986450195, "global_step": 166121, "epoch": 3955} {"train_loss": -7.018967151641846, "global_step": 166122, "epoch": 3955} {"train_loss": -7.1528239250183105, "global_step": 166123, "epoch": 3955} {"train_loss": -7.015048027038574, "global_step": 166124, "epoch": 3955} {"train_loss": -7.022041320800781, "global_step": 166125, "epoch": 3955} {"train_loss": -7.143664360046387, "global_step": 166126, "epoch": 3955} {"train_loss": -7.004235744476318, "global_step": 166127, "epoch": 3955} {"train_loss": -6.962251663208008, "global_step": 166128, "epoch": 3955} {"train_loss": -6.941311836242676, "global_step": 166129, "epoch": 3955} {"train_loss": -7.076401710510254, "global_step": 166130, "epoch": 3955} {"train_loss": -7.099369049072266, "global_step": 166131, "epoch": 3955} {"train_loss": -7.045411109924316, "global_step": 166132, "epoch": 3955} {"train_loss": -7.016369819641113, "global_step": 166133, "epoch": 3955} {"train_loss": -6.973767280578613, "global_step": 166134, "epoch": 3955} {"train_loss": -6.934893608093262, "global_step": 166135, "epoch": 3955} {"train_loss": -6.990314483642578, "global_step": 166136, "epoch": 3955} {"train_loss": -6.90542459487915, "global_step": 166137, "epoch": 3955} {"train_loss": -7.053956031799316, "global_step": 166138, "epoch": 3955} {"train_loss": -6.989365100860596, "global_step": 166139, "epoch": 3955} {"train_loss": -6.903040885925293, "global_step": 166140, "epoch": 3955} {"train_loss": -7.194674491882324, "global_step": 166141, "epoch": 3955} {"train_loss": -6.971540451049805, "global_step": 166142, "epoch": 3955} {"train_loss": -6.922699928283691, "global_step": 166143, "epoch": 3955} {"train_loss": -7.026293754577637, "global_step": 166144, "epoch": 3955} {"train_loss": -7.055332183837891, "global_step": 166145, "epoch": 3955} {"train_loss": -6.934430122375488, "global_step": 166146, "epoch": 3955} {"train_loss": -7.044369220733643, "global_step": 166147, "epoch": 3955} {"train_loss": -6.965028762817383, "global_step": 166148, "epoch": 3955} {"train_loss": -7.01511287689209, "global_step": 166149, "epoch": 3955} {"train_loss": -6.959847450256348, "global_step": 166150, "epoch": 3955} {"train_loss": -7.009958868934994, "global_step": 166151, "epoch": 3955, "val_loss": 79764.109375} {"train_loss": -6.965604782104492, "global_step": 166152, "epoch": 3956} {"train_loss": -7.002748966217041, "global_step": 166153, "epoch": 3956} {"train_loss": -6.990601539611816, "global_step": 166154, "epoch": 3956} {"train_loss": -6.915379524230957, "global_step": 166155, "epoch": 3956} {"train_loss": -6.958728790283203, "global_step": 166156, "epoch": 3956} {"train_loss": -6.967726707458496, "global_step": 166157, "epoch": 3956} {"train_loss": -6.931089878082275, "global_step": 166158, "epoch": 3956} {"train_loss": -6.832948207855225, "global_step": 166159, "epoch": 3956} {"train_loss": -6.957432270050049, "global_step": 166160, "epoch": 3956} {"train_loss": -7.034501075744629, "global_step": 166161, "epoch": 3956} {"train_loss": -6.830633640289307, "global_step": 166162, "epoch": 3956} {"train_loss": -6.957249641418457, "global_step": 166163, "epoch": 3956} {"train_loss": -6.976868629455566, "global_step": 166164, "epoch": 3956} {"train_loss": -6.852248668670654, "global_step": 166165, "epoch": 3956} {"train_loss": -6.9808149337768555, "global_step": 166166, "epoch": 3956} {"train_loss": -6.9950079917907715, "global_step": 166167, "epoch": 3956} {"train_loss": -6.925812721252441, "global_step": 166168, "epoch": 3956} {"train_loss": -6.984460830688477, "global_step": 166169, "epoch": 3956} {"train_loss": -6.82857608795166, "global_step": 166170, "epoch": 3956} {"train_loss": -7.035828590393066, "global_step": 166171, "epoch": 3956} {"train_loss": -6.939802169799805, "global_step": 166172, "epoch": 3956} {"train_loss": -7.0069098472595215, "global_step": 166173, "epoch": 3956} {"train_loss": -6.980212688446045, "global_step": 166174, "epoch": 3956} {"train_loss": -7.008159637451172, "global_step": 166175, "epoch": 3956} {"train_loss": -6.919346332550049, "global_step": 166176, "epoch": 3956} {"train_loss": -7.0199737548828125, "global_step": 166177, "epoch": 3956} {"train_loss": -6.926967144012451, "global_step": 166178, "epoch": 3956} {"train_loss": -6.958391189575195, "global_step": 166179, "epoch": 3956} {"train_loss": -6.942328929901123, "global_step": 166180, "epoch": 3956} {"train_loss": -7.076460838317871, "global_step": 166181, "epoch": 3956} {"train_loss": -7.067937850952148, "global_step": 166182, "epoch": 3956} {"train_loss": -6.921246528625488, "global_step": 166183, "epoch": 3956} {"train_loss": -6.9374308586120605, "global_step": 166184, "epoch": 3956} {"train_loss": -7.101550102233887, "global_step": 166185, "epoch": 3956} {"train_loss": -7.0520782470703125, "global_step": 166186, "epoch": 3956} {"train_loss": -7.042529582977295, "global_step": 166187, "epoch": 3956} {"train_loss": -6.977855682373047, "global_step": 166188, "epoch": 3956} {"train_loss": -6.941629409790039, "global_step": 166189, "epoch": 3956} {"train_loss": -7.0083208084106445, "global_step": 166190, "epoch": 3956} {"train_loss": -6.945380210876465, "global_step": 166191, "epoch": 3956} {"train_loss": -6.7774658203125, "global_step": 166192, "epoch": 3956} {"train_loss": -6.963829210826328, "global_step": 166193, "epoch": 3956, "val_loss": 79686.1875} {"train_loss": -6.9410881996154785, "global_step": 166194, "epoch": 3957} {"train_loss": -6.839734077453613, "global_step": 166195, "epoch": 3957} {"train_loss": -6.949703216552734, "global_step": 166196, "epoch": 3957} {"train_loss": -7.015193939208984, "global_step": 166197, "epoch": 3957} {"train_loss": -6.957897186279297, "global_step": 166198, "epoch": 3957} {"train_loss": -7.038958549499512, "global_step": 166199, "epoch": 3957} {"train_loss": -6.862697124481201, "global_step": 166200, "epoch": 3957} {"train_loss": -7.062549591064453, "global_step": 166201, "epoch": 3957} {"train_loss": -6.990181922912598, "global_step": 166202, "epoch": 3957} {"train_loss": -6.97697639465332, "global_step": 166203, "epoch": 3957} {"train_loss": -6.913618087768555, "global_step": 166204, "epoch": 3957} {"train_loss": -6.911953926086426, "global_step": 166205, "epoch": 3957} {"train_loss": -7.015951633453369, "global_step": 166206, "epoch": 3957} {"train_loss": -6.964058876037598, "global_step": 166207, "epoch": 3957} {"train_loss": -6.94204044342041, "global_step": 166208, "epoch": 3957} {"train_loss": -6.975894927978516, "global_step": 166209, "epoch": 3957} {"train_loss": -6.853732585906982, "global_step": 166210, "epoch": 3957} {"train_loss": -7.174981117248535, "global_step": 166211, "epoch": 3957} {"train_loss": -6.862288951873779, "global_step": 166212, "epoch": 3957} {"train_loss": -6.995510101318359, "global_step": 166213, "epoch": 3957} {"train_loss": -7.121044158935547, "global_step": 166214, "epoch": 3957} {"train_loss": -6.929812908172607, "global_step": 166215, "epoch": 3957} {"train_loss": -7.082671642303467, "global_step": 166216, "epoch": 3957} {"train_loss": -6.9209489822387695, "global_step": 166217, "epoch": 3957} {"train_loss": -6.947447776794434, "global_step": 166218, "epoch": 3957} {"train_loss": -7.001779556274414, "global_step": 166219, "epoch": 3957} {"train_loss": -7.049199104309082, "global_step": 166220, "epoch": 3957} {"train_loss": -7.147119522094727, "global_step": 166221, "epoch": 3957} {"train_loss": -6.989993572235107, "global_step": 166222, "epoch": 3957} {"train_loss": -6.957327365875244, "global_step": 166223, "epoch": 3957} {"train_loss": -6.960396766662598, "global_step": 166224, "epoch": 3957} {"train_loss": -7.026879787445068, "global_step": 166225, "epoch": 3957} {"train_loss": -6.97895622253418, "global_step": 166226, "epoch": 3957} {"train_loss": -7.2045183181762695, "global_step": 166227, "epoch": 3957} {"train_loss": -6.966137886047363, "global_step": 166228, "epoch": 3957} {"train_loss": -6.94407844543457, "global_step": 166229, "epoch": 3957} {"train_loss": -6.909976959228516, "global_step": 166230, "epoch": 3957} {"train_loss": -6.708187103271484, "global_step": 166231, "epoch": 3957} {"train_loss": -6.933518409729004, "global_step": 166232, "epoch": 3957} {"train_loss": -6.756004810333252, "global_step": 166233, "epoch": 3957} {"train_loss": -6.866921424865723, "global_step": 166234, "epoch": 3957} {"train_loss": -6.969379981358846, "global_step": 166235, "epoch": 3957, "val_loss": 79632.171875} {"train_loss": -6.9401469230651855, "global_step": 166236, "epoch": 3958} {"train_loss": -6.950196266174316, "global_step": 166237, "epoch": 3958} {"train_loss": -6.8577680587768555, "global_step": 166238, "epoch": 3958} {"train_loss": -7.071957111358643, "global_step": 166239, "epoch": 3958} {"train_loss": -7.076613903045654, "global_step": 166240, "epoch": 3958} {"train_loss": -6.931042671203613, "global_step": 166241, "epoch": 3958} {"train_loss": -6.966013431549072, "global_step": 166242, "epoch": 3958} {"train_loss": -6.876821517944336, "global_step": 166243, "epoch": 3958} {"train_loss": -6.892181396484375, "global_step": 166244, "epoch": 3958} {"train_loss": -7.041330814361572, "global_step": 166245, "epoch": 3958} {"train_loss": -6.999391555786133, "global_step": 166246, "epoch": 3958} {"train_loss": -6.986532688140869, "global_step": 166247, "epoch": 3958} {"train_loss": -6.979620933532715, "global_step": 166248, "epoch": 3958} {"train_loss": -6.982231140136719, "global_step": 166249, "epoch": 3958} {"train_loss": -7.051495552062988, "global_step": 166250, "epoch": 3958} {"train_loss": -6.982518196105957, "global_step": 166251, "epoch": 3958} {"train_loss": -7.1655731201171875, "global_step": 166252, "epoch": 3958} {"train_loss": -7.054623603820801, "global_step": 166253, "epoch": 3958} {"train_loss": -7.0030412673950195, "global_step": 166254, "epoch": 3958} {"train_loss": -7.037167549133301, "global_step": 166255, "epoch": 3958} {"train_loss": -7.014922618865967, "global_step": 166256, "epoch": 3958} {"train_loss": -6.973665714263916, "global_step": 166257, "epoch": 3958} {"train_loss": -6.948566436767578, "global_step": 166258, "epoch": 3958} {"train_loss": -7.046679496765137, "global_step": 166259, "epoch": 3958} {"train_loss": -7.021059036254883, "global_step": 166260, "epoch": 3958} {"train_loss": -7.102075576782227, "global_step": 166261, "epoch": 3958} {"train_loss": -7.0738911628723145, "global_step": 166262, "epoch": 3958} {"train_loss": -7.0076398849487305, "global_step": 166263, "epoch": 3958} {"train_loss": -7.046429634094238, "global_step": 166264, "epoch": 3958} {"train_loss": -6.888408660888672, "global_step": 166265, "epoch": 3958} {"train_loss": -6.976198196411133, "global_step": 166266, "epoch": 3958} {"train_loss": -7.009222984313965, "global_step": 166267, "epoch": 3958} {"train_loss": -6.956517219543457, "global_step": 166268, "epoch": 3958} {"train_loss": -7.053483486175537, "global_step": 166269, "epoch": 3958} {"train_loss": -7.013180732727051, "global_step": 166270, "epoch": 3958} {"train_loss": -6.8275604248046875, "global_step": 166271, "epoch": 3958} {"train_loss": -7.029120445251465, "global_step": 166272, "epoch": 3958} {"train_loss": -7.025632381439209, "global_step": 166273, "epoch": 3958} {"train_loss": -6.856484413146973, "global_step": 166274, "epoch": 3958} {"train_loss": -7.11031436920166, "global_step": 166275, "epoch": 3958} {"train_loss": -6.934475898742676, "global_step": 166276, "epoch": 3958} {"train_loss": -6.99589805375962, "global_step": 166277, "epoch": 3958, "val_loss": 79796.375} {"train_loss": -7.1643147468566895, "global_step": 166278, "epoch": 3959} {"train_loss": -6.948419570922852, "global_step": 166279, "epoch": 3959} {"train_loss": -7.027131080627441, "global_step": 166280, "epoch": 3959} {"train_loss": -6.816287040710449, "global_step": 166281, "epoch": 3959} {"train_loss": -6.907189846038818, "global_step": 166282, "epoch": 3959} {"train_loss": -6.968776702880859, "global_step": 166283, "epoch": 3959} {"train_loss": -6.695443630218506, "global_step": 166284, "epoch": 3959} {"train_loss": -7.003987789154053, "global_step": 166285, "epoch": 3959} {"train_loss": -6.834601402282715, "global_step": 166286, "epoch": 3959} {"train_loss": -6.795188903808594, "global_step": 166287, "epoch": 3959} {"train_loss": -6.8967390060424805, "global_step": 166288, "epoch": 3959} {"train_loss": -6.892656326293945, "global_step": 166289, "epoch": 3959} {"train_loss": -6.875761032104492, "global_step": 166290, "epoch": 3959} {"train_loss": -6.8549628257751465, "global_step": 166291, "epoch": 3959} {"train_loss": -7.01559591293335, "global_step": 166292, "epoch": 3959} {"train_loss": -6.824506759643555, "global_step": 166293, "epoch": 3959} {"train_loss": -6.9148077964782715, "global_step": 166294, "epoch": 3959} {"train_loss": -6.986212730407715, "global_step": 166295, "epoch": 3959} {"train_loss": -6.900598049163818, "global_step": 166296, "epoch": 3959} {"train_loss": -6.859355926513672, "global_step": 166297, "epoch": 3959} {"train_loss": -7.080868721008301, "global_step": 166298, "epoch": 3959} {"train_loss": -6.8810601234436035, "global_step": 166299, "epoch": 3959} {"train_loss": -6.934353828430176, "global_step": 166300, "epoch": 3959} {"train_loss": -7.025435447692871, "global_step": 166301, "epoch": 3959} {"train_loss": -6.86691427230835, "global_step": 166302, "epoch": 3959} {"train_loss": -7.070034980773926, "global_step": 166303, "epoch": 3959} {"train_loss": -7.007876396179199, "global_step": 166304, "epoch": 3959} {"train_loss": -6.90219783782959, "global_step": 166305, "epoch": 3959} {"train_loss": -6.938502311706543, "global_step": 166306, "epoch": 3959} {"train_loss": -7.016366004943848, "global_step": 166307, "epoch": 3959} {"train_loss": -6.961490631103516, "global_step": 166308, "epoch": 3959} {"train_loss": -6.955842018127441, "global_step": 166309, "epoch": 3959} {"train_loss": -7.0455827713012695, "global_step": 166310, "epoch": 3959} {"train_loss": -6.916212558746338, "global_step": 166311, "epoch": 3959} {"train_loss": -6.979335308074951, "global_step": 166312, "epoch": 3959} {"train_loss": -6.973860263824463, "global_step": 166313, "epoch": 3959} {"train_loss": -7.023900985717773, "global_step": 166314, "epoch": 3959} {"train_loss": -6.985806941986084, "global_step": 166315, "epoch": 3959} {"train_loss": -6.938957214355469, "global_step": 166316, "epoch": 3959} {"train_loss": -6.833556175231934, "global_step": 166317, "epoch": 3959} {"train_loss": -7.091651916503906, "global_step": 166318, "epoch": 3959} {"train_loss": -6.942197527204241, "global_step": 166319, "epoch": 3959, "val_loss": 79498.1484375} {"train_loss": -7.004809379577637, "global_step": 166320, "epoch": 3960} {"train_loss": -7.03494930267334, "global_step": 166321, "epoch": 3960} {"train_loss": -6.989368915557861, "global_step": 166322, "epoch": 3960} {"train_loss": -6.958632469177246, "global_step": 166323, "epoch": 3960} {"train_loss": -6.96406364440918, "global_step": 166324, "epoch": 3960} {"train_loss": -7.070463180541992, "global_step": 166325, "epoch": 3960} {"train_loss": -6.891400337219238, "global_step": 166326, "epoch": 3960} {"train_loss": -6.9348297119140625, "global_step": 166327, "epoch": 3960} {"train_loss": -7.0585737228393555, "global_step": 166328, "epoch": 3960} {"train_loss": -7.035699844360352, "global_step": 166329, "epoch": 3960} {"train_loss": -6.998993873596191, "global_step": 166330, "epoch": 3960} {"train_loss": -7.051480293273926, "global_step": 166331, "epoch": 3960} {"train_loss": -7.059092044830322, "global_step": 166332, "epoch": 3960} {"train_loss": -7.187702178955078, "global_step": 166333, "epoch": 3960} {"train_loss": -7.010788917541504, "global_step": 166334, "epoch": 3960} {"train_loss": -7.0909833908081055, "global_step": 166335, "epoch": 3960} {"train_loss": -7.036894798278809, "global_step": 166336, "epoch": 3960} {"train_loss": -7.0278167724609375, "global_step": 166337, "epoch": 3960} {"train_loss": -7.046636581420898, "global_step": 166338, "epoch": 3960} {"train_loss": -6.991843223571777, "global_step": 166339, "epoch": 3960} {"train_loss": -6.981552600860596, "global_step": 166340, "epoch": 3960} {"train_loss": -7.145792007446289, "global_step": 166341, "epoch": 3960} {"train_loss": -7.073699474334717, "global_step": 166342, "epoch": 3960} {"train_loss": -7.065268516540527, "global_step": 166343, "epoch": 3960} {"train_loss": -6.967301368713379, "global_step": 166344, "epoch": 3960} {"train_loss": -7.033441543579102, "global_step": 166345, "epoch": 3960} {"train_loss": -6.980319023132324, "global_step": 166346, "epoch": 3960} {"train_loss": -7.023819923400879, "global_step": 166347, "epoch": 3960} {"train_loss": -7.032289028167725, "global_step": 166348, "epoch": 3960} {"train_loss": -6.962064743041992, "global_step": 166349, "epoch": 3960} {"train_loss": -6.988195419311523, "global_step": 166350, "epoch": 3960} {"train_loss": -7.033334732055664, "global_step": 166351, "epoch": 3960} {"train_loss": -6.920779228210449, "global_step": 166352, "epoch": 3960} {"train_loss": -7.070958137512207, "global_step": 166353, "epoch": 3960} {"train_loss": -6.942863464355469, "global_step": 166354, "epoch": 3960} {"train_loss": -7.102052688598633, "global_step": 166355, "epoch": 3960} {"train_loss": -6.948883056640625, "global_step": 166356, "epoch": 3960} {"train_loss": -6.994573593139648, "global_step": 166357, "epoch": 3960} {"train_loss": -6.983502388000488, "global_step": 166358, "epoch": 3960} {"train_loss": -7.031084060668945, "global_step": 166359, "epoch": 3960} {"train_loss": -7.080817222595215, "global_step": 166360, "epoch": 3960} {"train_loss": -7.01960775965736, "global_step": 166361, "epoch": 3960, "val_loss": 79645.8515625} {"train_loss": -7.022988319396973, "global_step": 166362, "epoch": 3961} {"train_loss": -6.91682243347168, "global_step": 166363, "epoch": 3961} {"train_loss": -7.101555347442627, "global_step": 166364, "epoch": 3961} {"train_loss": -7.071346282958984, "global_step": 166365, "epoch": 3961} {"train_loss": -7.219259262084961, "global_step": 166366, "epoch": 3961} {"train_loss": -7.019233703613281, "global_step": 166367, "epoch": 3961} {"train_loss": -7.03795051574707, "global_step": 166368, "epoch": 3961} {"train_loss": -6.9454216957092285, "global_step": 166369, "epoch": 3961} {"train_loss": -7.042909622192383, "global_step": 166370, "epoch": 3961} {"train_loss": -7.009479522705078, "global_step": 166371, "epoch": 3961} {"train_loss": -7.214999198913574, "global_step": 166372, "epoch": 3961} {"train_loss": -7.014053821563721, "global_step": 166373, "epoch": 3961} {"train_loss": -7.057434558868408, "global_step": 166374, "epoch": 3961} {"train_loss": -7.025415420532227, "global_step": 166375, "epoch": 3961} {"train_loss": -7.069476127624512, "global_step": 166376, "epoch": 3961} {"train_loss": -7.007078170776367, "global_step": 166377, "epoch": 3961} {"train_loss": -6.934911727905273, "global_step": 166378, "epoch": 3961} {"train_loss": -7.01260232925415, "global_step": 166379, "epoch": 3961} {"train_loss": -6.8883891105651855, "global_step": 166380, "epoch": 3961} {"train_loss": -6.995542526245117, "global_step": 166381, "epoch": 3961} {"train_loss": -7.0212907791137695, "global_step": 166382, "epoch": 3961} {"train_loss": -6.986273765563965, "global_step": 166383, "epoch": 3961} {"train_loss": -7.094419002532959, "global_step": 166384, "epoch": 3961} {"train_loss": -7.0060954093933105, "global_step": 166385, "epoch": 3961} {"train_loss": -6.92317533493042, "global_step": 166386, "epoch": 3961} {"train_loss": -6.952692031860352, "global_step": 166387, "epoch": 3961} {"train_loss": -6.956815719604492, "global_step": 166388, "epoch": 3961} {"train_loss": -7.208168983459473, "global_step": 166389, "epoch": 3961} {"train_loss": -7.063765525817871, "global_step": 166390, "epoch": 3961} {"train_loss": -7.074916839599609, "global_step": 166391, "epoch": 3961} {"train_loss": -6.9792327880859375, "global_step": 166392, "epoch": 3961} {"train_loss": -6.980530738830566, "global_step": 166393, "epoch": 3961} {"train_loss": -7.04676628112793, "global_step": 166394, "epoch": 3961} {"train_loss": -6.981197834014893, "global_step": 166395, "epoch": 3961} {"train_loss": -7.162935256958008, "global_step": 166396, "epoch": 3961} {"train_loss": -7.076746940612793, "global_step": 166397, "epoch": 3961} {"train_loss": -7.099666595458984, "global_step": 166398, "epoch": 3961} {"train_loss": -6.977967739105225, "global_step": 166399, "epoch": 3961} {"train_loss": -7.085573673248291, "global_step": 166400, "epoch": 3961} {"train_loss": -6.92144775390625, "global_step": 166401, "epoch": 3961} {"train_loss": -7.052462577819824, "global_step": 166402, "epoch": 3961} {"train_loss": -7.029856568291073, "global_step": 166403, "epoch": 3961, "val_loss": 79468.109375} {"train_loss": -6.995492935180664, "global_step": 166404, "epoch": 3962} {"train_loss": -7.097005844116211, "global_step": 166405, "epoch": 3962} {"train_loss": -7.007992744445801, "global_step": 166406, "epoch": 3962} {"train_loss": -7.071691513061523, "global_step": 166407, "epoch": 3962} {"train_loss": -6.933084011077881, "global_step": 166408, "epoch": 3962} {"train_loss": -6.9736433029174805, "global_step": 166409, "epoch": 3962} {"train_loss": -6.9409966468811035, "global_step": 166410, "epoch": 3962} {"train_loss": -7.021354675292969, "global_step": 166411, "epoch": 3962} {"train_loss": -6.964792251586914, "global_step": 166412, "epoch": 3962} {"train_loss": -7.027986526489258, "global_step": 166413, "epoch": 3962} {"train_loss": -7.075640678405762, "global_step": 166414, "epoch": 3962} {"train_loss": -7.0522003173828125, "global_step": 166415, "epoch": 3962} {"train_loss": -7.077178955078125, "global_step": 166416, "epoch": 3962} {"train_loss": -7.069875717163086, "global_step": 166417, "epoch": 3962} {"train_loss": -7.022801876068115, "global_step": 166418, "epoch": 3962} {"train_loss": -7.00377082824707, "global_step": 166419, "epoch": 3962} {"train_loss": -6.9691314697265625, "global_step": 166420, "epoch": 3962} {"train_loss": -6.899906158447266, "global_step": 166421, "epoch": 3962} {"train_loss": -7.0496954917907715, "global_step": 166422, "epoch": 3962} {"train_loss": -7.064393043518066, "global_step": 166423, "epoch": 3962} {"train_loss": -6.925753593444824, "global_step": 166424, "epoch": 3962} {"train_loss": -7.032717704772949, "global_step": 166425, "epoch": 3962} {"train_loss": -7.05556058883667, "global_step": 166426, "epoch": 3962} {"train_loss": -6.946878433227539, "global_step": 166427, "epoch": 3962} {"train_loss": -6.957950592041016, "global_step": 166428, "epoch": 3962} {"train_loss": -6.895992279052734, "global_step": 166429, "epoch": 3962} {"train_loss": -7.0853657722473145, "global_step": 166430, "epoch": 3962} {"train_loss": -7.072105407714844, "global_step": 166431, "epoch": 3962} {"train_loss": -7.000194072723389, "global_step": 166432, "epoch": 3962} {"train_loss": -7.0298261642456055, "global_step": 166433, "epoch": 3962} {"train_loss": -7.060333251953125, "global_step": 166434, "epoch": 3962} {"train_loss": -6.992773056030273, "global_step": 166435, "epoch": 3962} {"train_loss": -7.018345832824707, "global_step": 166436, "epoch": 3962} {"train_loss": -6.973665237426758, "global_step": 166437, "epoch": 3962} {"train_loss": -7.039467811584473, "global_step": 166438, "epoch": 3962} {"train_loss": -6.965313911437988, "global_step": 166439, "epoch": 3962} {"train_loss": -6.868274211883545, "global_step": 166440, "epoch": 3962} {"train_loss": -7.019169807434082, "global_step": 166441, "epoch": 3962} {"train_loss": -7.069784164428711, "global_step": 166442, "epoch": 3962} {"train_loss": -6.8508992195129395, "global_step": 166443, "epoch": 3962} {"train_loss": -7.021035194396973, "global_step": 166444, "epoch": 3962} {"train_loss": -7.003724722635178, "global_step": 166445, "epoch": 3962, "val_loss": 79624.0390625} {"train_loss": -7.0657854080200195, "global_step": 166446, "epoch": 3963} {"train_loss": -6.937765121459961, "global_step": 166447, "epoch": 3963} {"train_loss": -6.964972496032715, "global_step": 166448, "epoch": 3963} {"train_loss": -6.815903663635254, "global_step": 166449, "epoch": 3963} {"train_loss": -6.919572830200195, "global_step": 166450, "epoch": 3963} {"train_loss": -6.951398849487305, "global_step": 166451, "epoch": 3963} {"train_loss": -6.8634352684021, "global_step": 166452, "epoch": 3963} {"train_loss": -7.021862030029297, "global_step": 166453, "epoch": 3963} {"train_loss": -6.998446464538574, "global_step": 166454, "epoch": 3963} {"train_loss": -6.828057765960693, "global_step": 166455, "epoch": 3963} {"train_loss": -7.1744608879089355, "global_step": 166456, "epoch": 3963} {"train_loss": -6.930913925170898, "global_step": 166457, "epoch": 3963} {"train_loss": -7.010113716125488, "global_step": 166458, "epoch": 3963} {"train_loss": -6.963197231292725, "global_step": 166459, "epoch": 3963} {"train_loss": -6.973390579223633, "global_step": 166460, "epoch": 3963} {"train_loss": -6.97330379486084, "global_step": 166461, "epoch": 3963} {"train_loss": -6.982851505279541, "global_step": 166462, "epoch": 3963} {"train_loss": -6.951023101806641, "global_step": 166463, "epoch": 3963} {"train_loss": -6.939916610717773, "global_step": 166464, "epoch": 3963} {"train_loss": -6.979947090148926, "global_step": 166465, "epoch": 3963} {"train_loss": -6.9598588943481445, "global_step": 166466, "epoch": 3963} {"train_loss": -6.85720157623291, "global_step": 166467, "epoch": 3963} {"train_loss": -6.882915496826172, "global_step": 166468, "epoch": 3963} {"train_loss": -7.059253692626953, "global_step": 166469, "epoch": 3963} {"train_loss": -7.022710800170898, "global_step": 166470, "epoch": 3963} {"train_loss": -6.958950996398926, "global_step": 166471, "epoch": 3963} {"train_loss": -6.977597236633301, "global_step": 166472, "epoch": 3963} {"train_loss": -6.972212791442871, "global_step": 166473, "epoch": 3963} {"train_loss": -6.962517738342285, "global_step": 166474, "epoch": 3963} {"train_loss": -7.022469520568848, "global_step": 166475, "epoch": 3963} {"train_loss": -6.911153316497803, "global_step": 166476, "epoch": 3963} {"train_loss": -7.057900428771973, "global_step": 166477, "epoch": 3963} {"train_loss": -7.0517120361328125, "global_step": 166478, "epoch": 3963} {"train_loss": -7.010099411010742, "global_step": 166479, "epoch": 3963} {"train_loss": -6.969595909118652, "global_step": 166480, "epoch": 3963} {"train_loss": -6.9847002029418945, "global_step": 166481, "epoch": 3963} {"train_loss": -6.957769393920898, "global_step": 166482, "epoch": 3963} {"train_loss": -6.974585056304932, "global_step": 166483, "epoch": 3963} {"train_loss": -6.863044261932373, "global_step": 166484, "epoch": 3963} {"train_loss": -6.982395172119141, "global_step": 166485, "epoch": 3963} {"train_loss": -6.916522979736328, "global_step": 166486, "epoch": 3963} {"train_loss": -6.96458625793457, "global_step": 166487, "epoch": 3963, "val_loss": 79965.28125} {"train_loss": -6.91024112701416, "global_step": 166488, "epoch": 3964} {"train_loss": -6.910823822021484, "global_step": 166489, "epoch": 3964} {"train_loss": -6.96258544921875, "global_step": 166490, "epoch": 3964} {"train_loss": -6.988924026489258, "global_step": 166491, "epoch": 3964} {"train_loss": -7.09765100479126, "global_step": 166492, "epoch": 3964} {"train_loss": -6.993189811706543, "global_step": 166493, "epoch": 3964} {"train_loss": -7.040945053100586, "global_step": 166494, "epoch": 3964} {"train_loss": -6.942659378051758, "global_step": 166495, "epoch": 3964} {"train_loss": -7.007255554199219, "global_step": 166496, "epoch": 3964} {"train_loss": -6.990556240081787, "global_step": 166497, "epoch": 3964} {"train_loss": -7.038686275482178, "global_step": 166498, "epoch": 3964} {"train_loss": -6.929640293121338, "global_step": 166499, "epoch": 3964} {"train_loss": -6.96152400970459, "global_step": 166500, "epoch": 3964} {"train_loss": -7.015661239624023, "global_step": 166501, "epoch": 3964} {"train_loss": -6.99098539352417, "global_step": 166502, "epoch": 3964} {"train_loss": -7.024219036102295, "global_step": 166503, "epoch": 3964} {"train_loss": -6.981947898864746, "global_step": 166504, "epoch": 3964} {"train_loss": -6.969277381896973, "global_step": 166505, "epoch": 3964} {"train_loss": -6.998597621917725, "global_step": 166506, "epoch": 3964} {"train_loss": -7.029259204864502, "global_step": 166507, "epoch": 3964} {"train_loss": -7.07615327835083, "global_step": 166508, "epoch": 3964} {"train_loss": -7.018607139587402, "global_step": 166509, "epoch": 3964} {"train_loss": -7.11667537689209, "global_step": 166510, "epoch": 3964} {"train_loss": -6.93229866027832, "global_step": 166511, "epoch": 3964} {"train_loss": -7.004752159118652, "global_step": 166512, "epoch": 3964} {"train_loss": -7.018621444702148, "global_step": 166513, "epoch": 3964} {"train_loss": -6.9432806968688965, "global_step": 166514, "epoch": 3964} {"train_loss": -7.023458480834961, "global_step": 166515, "epoch": 3964} {"train_loss": -7.187623977661133, "global_step": 166516, "epoch": 3964} {"train_loss": -7.0010857582092285, "global_step": 166517, "epoch": 3964} {"train_loss": -6.978273391723633, "global_step": 166518, "epoch": 3964} {"train_loss": -7.055336952209473, "global_step": 166519, "epoch": 3964} {"train_loss": -6.877688407897949, "global_step": 166520, "epoch": 3964} {"train_loss": -6.9933366775512695, "global_step": 166521, "epoch": 3964} {"train_loss": -7.01193904876709, "global_step": 166522, "epoch": 3964} {"train_loss": -7.080571174621582, "global_step": 166523, "epoch": 3964} {"train_loss": -7.018106460571289, "global_step": 166524, "epoch": 3964} {"train_loss": -7.054569244384766, "global_step": 166525, "epoch": 3964} {"train_loss": -6.9702043533325195, "global_step": 166526, "epoch": 3964} {"train_loss": -6.895262718200684, "global_step": 166527, "epoch": 3964} {"train_loss": -6.963198661804199, "global_step": 166528, "epoch": 3964} {"train_loss": -6.999347164517357, "global_step": 166529, "epoch": 3964, "val_loss": 79446.53125} {"train_loss": -7.047759056091309, "global_step": 166530, "epoch": 3965} {"train_loss": -7.0704827308654785, "global_step": 166531, "epoch": 3965} {"train_loss": -6.8991498947143555, "global_step": 166532, "epoch": 3965} {"train_loss": -6.938620090484619, "global_step": 166533, "epoch": 3965} {"train_loss": -6.943515777587891, "global_step": 166534, "epoch": 3965} {"train_loss": -7.054559707641602, "global_step": 166535, "epoch": 3965} {"train_loss": -6.932448387145996, "global_step": 166536, "epoch": 3965} {"train_loss": -6.9508748054504395, "global_step": 166537, "epoch": 3965} {"train_loss": -6.967721462249756, "global_step": 166538, "epoch": 3965} {"train_loss": -6.958536624908447, "global_step": 166539, "epoch": 3965} {"train_loss": -7.021600723266602, "global_step": 166540, "epoch": 3965} {"train_loss": -6.852365016937256, "global_step": 166541, "epoch": 3965} {"train_loss": -6.965367317199707, "global_step": 166542, "epoch": 3965} {"train_loss": -6.925197601318359, "global_step": 166543, "epoch": 3965} {"train_loss": -6.844914436340332, "global_step": 166544, "epoch": 3965} {"train_loss": -6.833497524261475, "global_step": 166545, "epoch": 3965} {"train_loss": -6.902310371398926, "global_step": 166546, "epoch": 3965} {"train_loss": -6.835505485534668, "global_step": 166547, "epoch": 3965} {"train_loss": -6.862321853637695, "global_step": 166548, "epoch": 3965} {"train_loss": -6.86838960647583, "global_step": 166549, "epoch": 3965} {"train_loss": -7.002078056335449, "global_step": 166550, "epoch": 3965} {"train_loss": -6.995190620422363, "global_step": 166551, "epoch": 3965} {"train_loss": -7.016009330749512, "global_step": 166552, "epoch": 3965} {"train_loss": -6.958560943603516, "global_step": 166553, "epoch": 3965} {"train_loss": -7.093432903289795, "global_step": 166554, "epoch": 3965} {"train_loss": -6.843169689178467, "global_step": 166555, "epoch": 3965} {"train_loss": -6.982169151306152, "global_step": 166556, "epoch": 3965} {"train_loss": -6.980774402618408, "global_step": 166557, "epoch": 3965} {"train_loss": -6.970250129699707, "global_step": 166558, "epoch": 3965} {"train_loss": -6.961819648742676, "global_step": 166559, "epoch": 3965} {"train_loss": -7.027559757232666, "global_step": 166560, "epoch": 3965} {"train_loss": -6.961575984954834, "global_step": 166561, "epoch": 3965} {"train_loss": -7.044400215148926, "global_step": 166562, "epoch": 3965} {"train_loss": -7.0606231689453125, "global_step": 166563, "epoch": 3965} {"train_loss": -6.9868669509887695, "global_step": 166564, "epoch": 3965} {"train_loss": -6.987957000732422, "global_step": 166565, "epoch": 3965} {"train_loss": -7.080242156982422, "global_step": 166566, "epoch": 3965} {"train_loss": -7.024313926696777, "global_step": 166567, "epoch": 3965} {"train_loss": -7.10075044631958, "global_step": 166568, "epoch": 3965} {"train_loss": -7.123667240142822, "global_step": 166569, "epoch": 3965} {"train_loss": -7.0354509353637695, "global_step": 166570, "epoch": 3965} {"train_loss": -6.977145728610811, "global_step": 166571, "epoch": 3965, "val_loss": 79760.875} {"train_loss": -7.08126163482666, "global_step": 166572, "epoch": 3966} {"train_loss": -6.992119789123535, "global_step": 166573, "epoch": 3966} {"train_loss": -7.010035037994385, "global_step": 166574, "epoch": 3966} {"train_loss": -7.099749565124512, "global_step": 166575, "epoch": 3966} {"train_loss": -7.082402229309082, "global_step": 166576, "epoch": 3966} {"train_loss": -6.981352806091309, "global_step": 166577, "epoch": 3966} {"train_loss": -7.034013748168945, "global_step": 166578, "epoch": 3966} {"train_loss": -7.144153594970703, "global_step": 166579, "epoch": 3966} {"train_loss": -7.092715263366699, "global_step": 166580, "epoch": 3966} {"train_loss": -7.054906845092773, "global_step": 166581, "epoch": 3966} {"train_loss": -7.050902843475342, "global_step": 166582, "epoch": 3966} {"train_loss": -7.096302032470703, "global_step": 166583, "epoch": 3966} {"train_loss": -7.109037399291992, "global_step": 166584, "epoch": 3966} {"train_loss": -7.231879234313965, "global_step": 166585, "epoch": 3966} {"train_loss": -7.088788032531738, "global_step": 166586, "epoch": 3966} {"train_loss": -7.002964973449707, "global_step": 166587, "epoch": 3966} {"train_loss": -7.085555076599121, "global_step": 166588, "epoch": 3966} {"train_loss": -7.099769592285156, "global_step": 166589, "epoch": 3966} {"train_loss": -7.075520992279053, "global_step": 166590, "epoch": 3966} {"train_loss": -7.063558578491211, "global_step": 166591, "epoch": 3966} {"train_loss": -7.039639949798584, "global_step": 166592, "epoch": 3966} {"train_loss": -6.986228942871094, "global_step": 166593, "epoch": 3966} {"train_loss": -7.228968143463135, "global_step": 166594, "epoch": 3966} {"train_loss": -6.896129608154297, "global_step": 166595, "epoch": 3966} {"train_loss": -7.11378288269043, "global_step": 166596, "epoch": 3966} {"train_loss": -7.101685523986816, "global_step": 166597, "epoch": 3966} {"train_loss": -6.965544700622559, "global_step": 166598, "epoch": 3966} {"train_loss": -7.003527641296387, "global_step": 166599, "epoch": 3966} {"train_loss": -7.037446975708008, "global_step": 166600, "epoch": 3966} {"train_loss": -6.926491737365723, "global_step": 166601, "epoch": 3966} {"train_loss": -6.971330642700195, "global_step": 166602, "epoch": 3966} {"train_loss": -7.032681465148926, "global_step": 166603, "epoch": 3966} {"train_loss": -6.913774490356445, "global_step": 166604, "epoch": 3966} {"train_loss": -7.040497779846191, "global_step": 166605, "epoch": 3966} {"train_loss": -6.93402099609375, "global_step": 166606, "epoch": 3966} {"train_loss": -6.926388740539551, "global_step": 166607, "epoch": 3966} {"train_loss": -7.054477691650391, "global_step": 166608, "epoch": 3966} {"train_loss": -7.074295997619629, "global_step": 166609, "epoch": 3966} {"train_loss": -6.984096527099609, "global_step": 166610, "epoch": 3966} {"train_loss": -6.988976001739502, "global_step": 166611, "epoch": 3966} {"train_loss": -7.0120954513549805, "global_step": 166612, "epoch": 3966} {"train_loss": -7.0396989186604815, "global_step": 166613, "epoch": 3966, "val_loss": 79657.765625} {"train_loss": -6.970603942871094, "global_step": 166614, "epoch": 3967} {"train_loss": -7.113521575927734, "global_step": 166615, "epoch": 3967} {"train_loss": -6.964715957641602, "global_step": 166616, "epoch": 3967} {"train_loss": -7.040518283843994, "global_step": 166617, "epoch": 3967} {"train_loss": -7.067314147949219, "global_step": 166618, "epoch": 3967} {"train_loss": -7.008742332458496, "global_step": 166619, "epoch": 3967} {"train_loss": -6.944051742553711, "global_step": 166620, "epoch": 3967} {"train_loss": -6.987329483032227, "global_step": 166621, "epoch": 3967} {"train_loss": -7.109993934631348, "global_step": 166622, "epoch": 3967} {"train_loss": -6.9455766677856445, "global_step": 166623, "epoch": 3967} {"train_loss": -6.94976282119751, "global_step": 166624, "epoch": 3967} {"train_loss": -7.016568660736084, "global_step": 166625, "epoch": 3967} {"train_loss": -6.991156578063965, "global_step": 166626, "epoch": 3967} {"train_loss": -6.842802047729492, "global_step": 166627, "epoch": 3967} {"train_loss": -6.932765960693359, "global_step": 166628, "epoch": 3967} {"train_loss": -7.038816452026367, "global_step": 166629, "epoch": 3967} {"train_loss": -6.942343711853027, "global_step": 166630, "epoch": 3967} {"train_loss": -6.9600677490234375, "global_step": 166631, "epoch": 3967} {"train_loss": -7.039134502410889, "global_step": 166632, "epoch": 3967} {"train_loss": -7.0891547203063965, "global_step": 166633, "epoch": 3967} {"train_loss": -6.935490131378174, "global_step": 166634, "epoch": 3967} {"train_loss": -6.958371162414551, "global_step": 166635, "epoch": 3967} {"train_loss": -7.03090763092041, "global_step": 166636, "epoch": 3967} {"train_loss": -7.00364351272583, "global_step": 166637, "epoch": 3967} {"train_loss": -6.971090316772461, "global_step": 166638, "epoch": 3967} {"train_loss": -7.068799018859863, "global_step": 166639, "epoch": 3967} {"train_loss": -6.961379528045654, "global_step": 166640, "epoch": 3967} {"train_loss": -6.972549915313721, "global_step": 166641, "epoch": 3967} {"train_loss": -7.021958351135254, "global_step": 166642, "epoch": 3967} {"train_loss": -7.099897861480713, "global_step": 166643, "epoch": 3967} {"train_loss": -6.964890956878662, "global_step": 166644, "epoch": 3967} {"train_loss": -6.894320487976074, "global_step": 166645, "epoch": 3967} {"train_loss": -7.155577659606934, "global_step": 166646, "epoch": 3967} {"train_loss": -7.009781837463379, "global_step": 166647, "epoch": 3967} {"train_loss": -7.113034248352051, "global_step": 166648, "epoch": 3967} {"train_loss": -7.1078290939331055, "global_step": 166649, "epoch": 3967} {"train_loss": -7.030094146728516, "global_step": 166650, "epoch": 3967} {"train_loss": -7.003453254699707, "global_step": 166651, "epoch": 3967} {"train_loss": -6.972748756408691, "global_step": 166652, "epoch": 3967} {"train_loss": -7.098038673400879, "global_step": 166653, "epoch": 3967} {"train_loss": -7.065552711486816, "global_step": 166654, "epoch": 3967} {"train_loss": -7.010948010853359, "global_step": 166655, "epoch": 3967, "val_loss": 79363.390625} {"train_loss": -7.00602912902832, "global_step": 166656, "epoch": 3968} {"train_loss": -7.06696891784668, "global_step": 166657, "epoch": 3968} {"train_loss": -7.028210639953613, "global_step": 166658, "epoch": 3968} {"train_loss": -7.025630950927734, "global_step": 166659, "epoch": 3968} {"train_loss": -7.121899127960205, "global_step": 166660, "epoch": 3968} {"train_loss": -7.054255485534668, "global_step": 166661, "epoch": 3968} {"train_loss": -7.0168843269348145, "global_step": 166662, "epoch": 3968} {"train_loss": -6.995980262756348, "global_step": 166663, "epoch": 3968} {"train_loss": -6.983046531677246, "global_step": 166664, "epoch": 3968} {"train_loss": -6.964204788208008, "global_step": 166665, "epoch": 3968} {"train_loss": -7.0275115966796875, "global_step": 166666, "epoch": 3968} {"train_loss": -7.063836097717285, "global_step": 166667, "epoch": 3968} {"train_loss": -7.194941520690918, "global_step": 166668, "epoch": 3968} {"train_loss": -6.986504554748535, "global_step": 166669, "epoch": 3968} {"train_loss": -7.103758335113525, "global_step": 166670, "epoch": 3968} {"train_loss": -6.993083953857422, "global_step": 166671, "epoch": 3968} {"train_loss": -7.010114669799805, "global_step": 166672, "epoch": 3968} {"train_loss": -7.055238246917725, "global_step": 166673, "epoch": 3968} {"train_loss": -7.166159629821777, "global_step": 166674, "epoch": 3968} {"train_loss": -7.088004112243652, "global_step": 166675, "epoch": 3968} {"train_loss": -7.026236534118652, "global_step": 166676, "epoch": 3968} {"train_loss": -7.087489128112793, "global_step": 166677, "epoch": 3968} {"train_loss": -7.009769916534424, "global_step": 166678, "epoch": 3968} {"train_loss": -7.001971244812012, "global_step": 166679, "epoch": 3968} {"train_loss": -7.068138122558594, "global_step": 166680, "epoch": 3968} {"train_loss": -6.921583652496338, "global_step": 166681, "epoch": 3968} {"train_loss": -6.915850639343262, "global_step": 166682, "epoch": 3968} {"train_loss": -7.0632476806640625, "global_step": 166683, "epoch": 3968} {"train_loss": -6.936977863311768, "global_step": 166684, "epoch": 3968} {"train_loss": -6.960179328918457, "global_step": 166685, "epoch": 3968} {"train_loss": -6.943352699279785, "global_step": 166686, "epoch": 3968} {"train_loss": -6.900766849517822, "global_step": 166687, "epoch": 3968} {"train_loss": -7.090735912322998, "global_step": 166688, "epoch": 3968} {"train_loss": -6.785914421081543, "global_step": 166689, "epoch": 3968} {"train_loss": -6.837032318115234, "global_step": 166690, "epoch": 3968} {"train_loss": -6.950772285461426, "global_step": 166691, "epoch": 3968} {"train_loss": -6.881341457366943, "global_step": 166692, "epoch": 3968} {"train_loss": -6.7943010330200195, "global_step": 166693, "epoch": 3968} {"train_loss": -7.044661521911621, "global_step": 166694, "epoch": 3968} {"train_loss": -6.803733825683594, "global_step": 166695, "epoch": 3968} {"train_loss": -6.861973762512207, "global_step": 166696, "epoch": 3968} {"train_loss": -6.995067244484311, "global_step": 166697, "epoch": 3968, "val_loss": 79463.59375} {"train_loss": -6.8168745040893555, "global_step": 166698, "epoch": 3969} {"train_loss": -6.9013519287109375, "global_step": 166699, "epoch": 3969} {"train_loss": -6.9252119064331055, "global_step": 166700, "epoch": 3969} {"train_loss": -6.991998672485352, "global_step": 166701, "epoch": 3969} {"train_loss": -6.908542633056641, "global_step": 166702, "epoch": 3969} {"train_loss": -7.025639533996582, "global_step": 166703, "epoch": 3969} {"train_loss": -6.8423051834106445, "global_step": 166704, "epoch": 3969} {"train_loss": -7.013435363769531, "global_step": 166705, "epoch": 3969} {"train_loss": -6.893678665161133, "global_step": 166706, "epoch": 3969} {"train_loss": -6.969810485839844, "global_step": 166707, "epoch": 3969} {"train_loss": -6.839840888977051, "global_step": 166708, "epoch": 3969} {"train_loss": -6.974550247192383, "global_step": 166709, "epoch": 3969} {"train_loss": -7.007937431335449, "global_step": 166710, "epoch": 3969} {"train_loss": -7.097806930541992, "global_step": 166711, "epoch": 3969} {"train_loss": -7.007926940917969, "global_step": 166712, "epoch": 3969} {"train_loss": -6.990304470062256, "global_step": 166713, "epoch": 3969} {"train_loss": -6.949054718017578, "global_step": 166714, "epoch": 3969} {"train_loss": -6.907458782196045, "global_step": 166715, "epoch": 3969} {"train_loss": -7.017889976501465, "global_step": 166716, "epoch": 3969} {"train_loss": -7.008424758911133, "global_step": 166717, "epoch": 3969} {"train_loss": -6.94231653213501, "global_step": 166718, "epoch": 3969} {"train_loss": -6.901289463043213, "global_step": 166719, "epoch": 3969} {"train_loss": -6.9533796310424805, "global_step": 166720, "epoch": 3969} {"train_loss": -7.061203479766846, "global_step": 166721, "epoch": 3969} {"train_loss": -7.079679489135742, "global_step": 166722, "epoch": 3969} {"train_loss": -6.9962663650512695, "global_step": 166723, "epoch": 3969} {"train_loss": -7.0060319900512695, "global_step": 166724, "epoch": 3969} {"train_loss": -6.960333824157715, "global_step": 166725, "epoch": 3969} {"train_loss": -6.927645683288574, "global_step": 166726, "epoch": 3969} {"train_loss": -6.974738121032715, "global_step": 166727, "epoch": 3969} {"train_loss": -7.068243026733398, "global_step": 166728, "epoch": 3969} {"train_loss": -6.937904357910156, "global_step": 166729, "epoch": 3969} {"train_loss": -6.99627685546875, "global_step": 166730, "epoch": 3969} {"train_loss": -7.001705169677734, "global_step": 166731, "epoch": 3969} {"train_loss": -7.045654773712158, "global_step": 166732, "epoch": 3969} {"train_loss": -7.056015968322754, "global_step": 166733, "epoch": 3969} {"train_loss": -6.941608428955078, "global_step": 166734, "epoch": 3969} {"train_loss": -7.035831451416016, "global_step": 166735, "epoch": 3969} {"train_loss": -7.008498191833496, "global_step": 166736, "epoch": 3969} {"train_loss": -6.978407859802246, "global_step": 166737, "epoch": 3969} {"train_loss": -7.093238830566406, "global_step": 166738, "epoch": 3969} {"train_loss": -6.97839187440418, "global_step": 166739, "epoch": 3969, "val_loss": 79710.265625} {"train_loss": -7.007085800170898, "global_step": 166740, "epoch": 3970} {"train_loss": -6.960156440734863, "global_step": 166741, "epoch": 3970} {"train_loss": -7.0615386962890625, "global_step": 166742, "epoch": 3970} {"train_loss": -7.116053581237793, "global_step": 166743, "epoch": 3970} {"train_loss": -7.065812110900879, "global_step": 166744, "epoch": 3970} {"train_loss": -7.060552597045898, "global_step": 166745, "epoch": 3970} {"train_loss": -7.031825065612793, "global_step": 166746, "epoch": 3970} {"train_loss": -7.137473106384277, "global_step": 166747, "epoch": 3970} {"train_loss": -7.001319885253906, "global_step": 166748, "epoch": 3970} {"train_loss": -7.0762038230896, "global_step": 166749, "epoch": 3970} {"train_loss": -7.008106708526611, "global_step": 166750, "epoch": 3970} {"train_loss": -7.058820724487305, "global_step": 166751, "epoch": 3970} {"train_loss": -6.985777378082275, "global_step": 166752, "epoch": 3970} {"train_loss": -6.912587642669678, "global_step": 166753, "epoch": 3970} {"train_loss": -7.024447917938232, "global_step": 166754, "epoch": 3970} {"train_loss": -6.898492813110352, "global_step": 166755, "epoch": 3970} {"train_loss": -7.0688276290893555, "global_step": 166756, "epoch": 3970} {"train_loss": -7.045727729797363, "global_step": 166757, "epoch": 3970} {"train_loss": -6.850394248962402, "global_step": 166758, "epoch": 3970} {"train_loss": -7.086536884307861, "global_step": 166759, "epoch": 3970} {"train_loss": -7.009335994720459, "global_step": 166760, "epoch": 3970} {"train_loss": -6.99254035949707, "global_step": 166761, "epoch": 3970} {"train_loss": -7.059515476226807, "global_step": 166762, "epoch": 3970} {"train_loss": -6.954300880432129, "global_step": 166763, "epoch": 3970} {"train_loss": -7.020009994506836, "global_step": 166764, "epoch": 3970} {"train_loss": -6.937040328979492, "global_step": 166765, "epoch": 3970} {"train_loss": -7.010074138641357, "global_step": 166766, "epoch": 3970} {"train_loss": -6.91093111038208, "global_step": 166767, "epoch": 3970} {"train_loss": -6.919764518737793, "global_step": 166768, "epoch": 3970} {"train_loss": -6.944910049438477, "global_step": 166769, "epoch": 3970} {"train_loss": -6.812527179718018, "global_step": 166770, "epoch": 3970} {"train_loss": -6.869763374328613, "global_step": 166771, "epoch": 3970} {"train_loss": -6.835799217224121, "global_step": 166772, "epoch": 3970} {"train_loss": -7.000931739807129, "global_step": 166773, "epoch": 3970} {"train_loss": -6.8631978034973145, "global_step": 166774, "epoch": 3970} {"train_loss": -6.900554656982422, "global_step": 166775, "epoch": 3970} {"train_loss": -7.044466018676758, "global_step": 166776, "epoch": 3970} {"train_loss": -6.932736396789551, "global_step": 166777, "epoch": 3970} {"train_loss": -7.056440353393555, "global_step": 166778, "epoch": 3970} {"train_loss": -6.853786468505859, "global_step": 166779, "epoch": 3970} {"train_loss": -6.859151363372803, "global_step": 166780, "epoch": 3970} {"train_loss": -6.982355855760121, "global_step": 166781, "epoch": 3970, "val_loss": 79825.5625} {"train_loss": -6.889095306396484, "global_step": 166782, "epoch": 3971} {"train_loss": -6.971078872680664, "global_step": 166783, "epoch": 3971} {"train_loss": -6.88831901550293, "global_step": 166784, "epoch": 3971} {"train_loss": -6.956635475158691, "global_step": 166785, "epoch": 3971} {"train_loss": -6.9350385665893555, "global_step": 166786, "epoch": 3971} {"train_loss": -6.903092861175537, "global_step": 166787, "epoch": 3971} {"train_loss": -6.996183395385742, "global_step": 166788, "epoch": 3971} {"train_loss": -7.0528717041015625, "global_step": 166789, "epoch": 3971} {"train_loss": -6.998907089233398, "global_step": 166790, "epoch": 3971} {"train_loss": -6.949686050415039, "global_step": 166791, "epoch": 3971} {"train_loss": -6.924270153045654, "global_step": 166792, "epoch": 3971} {"train_loss": -7.051631450653076, "global_step": 166793, "epoch": 3971} {"train_loss": -7.029029846191406, "global_step": 166794, "epoch": 3971} {"train_loss": -6.852011680603027, "global_step": 166795, "epoch": 3971} {"train_loss": -7.148558139801025, "global_step": 166796, "epoch": 3971} {"train_loss": -7.0300726890563965, "global_step": 166797, "epoch": 3971} {"train_loss": -6.970473289489746, "global_step": 166798, "epoch": 3971} {"train_loss": -7.022093772888184, "global_step": 166799, "epoch": 3971} {"train_loss": -6.9906182289123535, "global_step": 166800, "epoch": 3971} {"train_loss": -7.003912448883057, "global_step": 166801, "epoch": 3971} {"train_loss": -6.925117492675781, "global_step": 166802, "epoch": 3971} {"train_loss": -6.994563102722168, "global_step": 166803, "epoch": 3971} {"train_loss": -6.886803150177002, "global_step": 166804, "epoch": 3971} {"train_loss": -7.01374626159668, "global_step": 166805, "epoch": 3971} {"train_loss": -7.044305324554443, "global_step": 166806, "epoch": 3971} {"train_loss": -7.058354377746582, "global_step": 166807, "epoch": 3971} {"train_loss": -7.12631368637085, "global_step": 166808, "epoch": 3971} {"train_loss": -6.989100456237793, "global_step": 166809, "epoch": 3971} {"train_loss": -6.91365909576416, "global_step": 166810, "epoch": 3971} {"train_loss": -7.092891693115234, "global_step": 166811, "epoch": 3971} {"train_loss": -6.983320236206055, "global_step": 166812, "epoch": 3971} {"train_loss": -7.063911437988281, "global_step": 166813, "epoch": 3971} {"train_loss": -6.940018653869629, "global_step": 166814, "epoch": 3971} {"train_loss": -7.098715782165527, "global_step": 166815, "epoch": 3971} {"train_loss": -7.128190994262695, "global_step": 166816, "epoch": 3971} {"train_loss": -7.111530780792236, "global_step": 166817, "epoch": 3971} {"train_loss": -7.07399845123291, "global_step": 166818, "epoch": 3971} {"train_loss": -6.98580265045166, "global_step": 166819, "epoch": 3971} {"train_loss": -6.958189964294434, "global_step": 166820, "epoch": 3971} {"train_loss": -7.060482025146484, "global_step": 166821, "epoch": 3971} {"train_loss": -7.056427955627441, "global_step": 166822, "epoch": 3971} {"train_loss": -7.001398041134789, "global_step": 166823, "epoch": 3971, "val_loss": 79621.7421875} {"train_loss": -7.087172985076904, "global_step": 166824, "epoch": 3972} {"train_loss": -7.027665615081787, "global_step": 166825, "epoch": 3972} {"train_loss": -6.932924747467041, "global_step": 166826, "epoch": 3972} {"train_loss": -6.9432692527771, "global_step": 166827, "epoch": 3972} {"train_loss": -6.983309268951416, "global_step": 166828, "epoch": 3972} {"train_loss": -6.966579437255859, "global_step": 166829, "epoch": 3972} {"train_loss": -7.014530181884766, "global_step": 166830, "epoch": 3972} {"train_loss": -6.990445137023926, "global_step": 166831, "epoch": 3972} {"train_loss": -7.055187702178955, "global_step": 166832, "epoch": 3972} {"train_loss": -7.120085716247559, "global_step": 166833, "epoch": 3972} {"train_loss": -7.056004524230957, "global_step": 166834, "epoch": 3972} {"train_loss": -7.172238349914551, "global_step": 166835, "epoch": 3972} {"train_loss": -7.102191925048828, "global_step": 166836, "epoch": 3972} {"train_loss": -6.992225170135498, "global_step": 166837, "epoch": 3972} {"train_loss": -7.034841537475586, "global_step": 166838, "epoch": 3972} {"train_loss": -7.052856922149658, "global_step": 166839, "epoch": 3972} {"train_loss": -7.008271217346191, "global_step": 166840, "epoch": 3972} {"train_loss": -7.018561363220215, "global_step": 166841, "epoch": 3972} {"train_loss": -6.970163822174072, "global_step": 166842, "epoch": 3972} {"train_loss": -7.023778915405273, "global_step": 166843, "epoch": 3972} {"train_loss": -6.971148490905762, "global_step": 166844, "epoch": 3972} {"train_loss": -7.043239116668701, "global_step": 166845, "epoch": 3972} {"train_loss": -6.904869079589844, "global_step": 166846, "epoch": 3972} {"train_loss": -7.012335777282715, "global_step": 166847, "epoch": 3972} {"train_loss": -7.099837303161621, "global_step": 166848, "epoch": 3972} {"train_loss": -7.036986351013184, "global_step": 166849, "epoch": 3972} {"train_loss": -6.912468910217285, "global_step": 166850, "epoch": 3972} {"train_loss": -7.031565189361572, "global_step": 166851, "epoch": 3972} {"train_loss": -7.063518047332764, "global_step": 166852, "epoch": 3972} {"train_loss": -6.995512008666992, "global_step": 166853, "epoch": 3972} {"train_loss": -7.077179908752441, "global_step": 166854, "epoch": 3972} {"train_loss": -7.108777046203613, "global_step": 166855, "epoch": 3972} {"train_loss": -6.967500686645508, "global_step": 166856, "epoch": 3972} {"train_loss": -7.056121826171875, "global_step": 166857, "epoch": 3972} {"train_loss": -7.071351528167725, "global_step": 166858, "epoch": 3972} {"train_loss": -6.936317443847656, "global_step": 166859, "epoch": 3972} {"train_loss": -6.998047828674316, "global_step": 166860, "epoch": 3972} {"train_loss": -6.948056221008301, "global_step": 166861, "epoch": 3972} {"train_loss": -7.0168304443359375, "global_step": 166862, "epoch": 3972} {"train_loss": -6.911694526672363, "global_step": 166863, "epoch": 3972} {"train_loss": -7.0427703857421875, "global_step": 166864, "epoch": 3972} {"train_loss": -7.01643849554516, "global_step": 166865, "epoch": 3972, "val_loss": 79761.09375} {"train_loss": -7.03456974029541, "global_step": 166866, "epoch": 3973} {"train_loss": -6.9987382888793945, "global_step": 166867, "epoch": 3973} {"train_loss": -6.899078369140625, "global_step": 166868, "epoch": 3973} {"train_loss": -7.043399810791016, "global_step": 166869, "epoch": 3973} {"train_loss": -7.028234481811523, "global_step": 166870, "epoch": 3973} {"train_loss": -7.018951416015625, "global_step": 166871, "epoch": 3973} {"train_loss": -6.929193496704102, "global_step": 166872, "epoch": 3973} {"train_loss": -6.909351348876953, "global_step": 166873, "epoch": 3973} {"train_loss": -6.9760942459106445, "global_step": 166874, "epoch": 3973} {"train_loss": -7.056431770324707, "global_step": 166875, "epoch": 3973} {"train_loss": -6.895223617553711, "global_step": 166876, "epoch": 3973} {"train_loss": -6.9653215408325195, "global_step": 166877, "epoch": 3973} {"train_loss": -6.980248928070068, "global_step": 166878, "epoch": 3973} {"train_loss": -6.88142204284668, "global_step": 166879, "epoch": 3973} {"train_loss": -6.9930901527404785, "global_step": 166880, "epoch": 3973} {"train_loss": -6.9688005447387695, "global_step": 166881, "epoch": 3973} {"train_loss": -6.898434162139893, "global_step": 166882, "epoch": 3973} {"train_loss": -6.855643272399902, "global_step": 166883, "epoch": 3973} {"train_loss": -6.893312454223633, "global_step": 166884, "epoch": 3973} {"train_loss": -6.938843250274658, "global_step": 166885, "epoch": 3973} {"train_loss": -6.957642555236816, "global_step": 166886, "epoch": 3973} {"train_loss": -6.879146099090576, "global_step": 166887, "epoch": 3973} {"train_loss": -6.982119560241699, "global_step": 166888, "epoch": 3973} {"train_loss": -7.077014923095703, "global_step": 166889, "epoch": 3973} {"train_loss": -6.916152000427246, "global_step": 166890, "epoch": 3973} {"train_loss": -7.107343673706055, "global_step": 166891, "epoch": 3973} {"train_loss": -6.940551280975342, "global_step": 166892, "epoch": 3973} {"train_loss": -6.921247482299805, "global_step": 166893, "epoch": 3973} {"train_loss": -6.896244049072266, "global_step": 166894, "epoch": 3973} {"train_loss": -7.022560119628906, "global_step": 166895, "epoch": 3973} {"train_loss": -7.001161575317383, "global_step": 166896, "epoch": 3973} {"train_loss": -6.800046920776367, "global_step": 166897, "epoch": 3973} {"train_loss": -6.91527795791626, "global_step": 166898, "epoch": 3973} {"train_loss": -6.95255184173584, "global_step": 166899, "epoch": 3973} {"train_loss": -6.940046310424805, "global_step": 166900, "epoch": 3973} {"train_loss": -6.942731857299805, "global_step": 166901, "epoch": 3973} {"train_loss": -7.043562412261963, "global_step": 166902, "epoch": 3973} {"train_loss": -7.04567813873291, "global_step": 166903, "epoch": 3973} {"train_loss": -6.933894157409668, "global_step": 166904, "epoch": 3973} {"train_loss": -7.093776702880859, "global_step": 166905, "epoch": 3973} {"train_loss": -6.980062484741211, "global_step": 166906, "epoch": 3973} {"train_loss": -6.964001224154518, "global_step": 166907, "epoch": 3973, "val_loss": 79856.4375} {"train_loss": -7.047039985656738, "global_step": 166908, "epoch": 3974} {"train_loss": -7.033440113067627, "global_step": 166909, "epoch": 3974} {"train_loss": -7.072793006896973, "global_step": 166910, "epoch": 3974} {"train_loss": -6.975505352020264, "global_step": 166911, "epoch": 3974} {"train_loss": -7.033090591430664, "global_step": 166912, "epoch": 3974} {"train_loss": -7.025759696960449, "global_step": 166913, "epoch": 3974} {"train_loss": -6.9343390464782715, "global_step": 166914, "epoch": 3974} {"train_loss": -7.089514255523682, "global_step": 166915, "epoch": 3974} {"train_loss": -6.865012168884277, "global_step": 166916, "epoch": 3974} {"train_loss": -7.007059097290039, "global_step": 166917, "epoch": 3974} {"train_loss": -6.973426342010498, "global_step": 166918, "epoch": 3974} {"train_loss": -7.097383499145508, "global_step": 166919, "epoch": 3974} {"train_loss": -7.0193986892700195, "global_step": 166920, "epoch": 3974} {"train_loss": -7.0126423835754395, "global_step": 166921, "epoch": 3974} {"train_loss": -7.1179633140563965, "global_step": 166922, "epoch": 3974} {"train_loss": -7.12061071395874, "global_step": 166923, "epoch": 3974} {"train_loss": -7.027660369873047, "global_step": 166924, "epoch": 3974} {"train_loss": -7.11916446685791, "global_step": 166925, "epoch": 3974} {"train_loss": -7.02443265914917, "global_step": 166926, "epoch": 3974} {"train_loss": -7.02531099319458, "global_step": 166927, "epoch": 3974} {"train_loss": -7.083919525146484, "global_step": 166928, "epoch": 3974} {"train_loss": -7.064356803894043, "global_step": 166929, "epoch": 3974} {"train_loss": -7.018064498901367, "global_step": 166930, "epoch": 3974} {"train_loss": -7.075394630432129, "global_step": 166931, "epoch": 3974} {"train_loss": -7.09737491607666, "global_step": 166932, "epoch": 3974} {"train_loss": -7.005793571472168, "global_step": 166933, "epoch": 3974} {"train_loss": -7.027169227600098, "global_step": 166934, "epoch": 3974} {"train_loss": -6.959227561950684, "global_step": 166935, "epoch": 3974} {"train_loss": -7.09630012512207, "global_step": 166936, "epoch": 3974} {"train_loss": -7.006329536437988, "global_step": 166937, "epoch": 3974} {"train_loss": -7.12519645690918, "global_step": 166938, "epoch": 3974} {"train_loss": -7.138849258422852, "global_step": 166939, "epoch": 3974} {"train_loss": -7.088393688201904, "global_step": 166940, "epoch": 3974} {"train_loss": -7.062572002410889, "global_step": 166941, "epoch": 3974} {"train_loss": -7.044831275939941, "global_step": 166942, "epoch": 3974} {"train_loss": -6.992729187011719, "global_step": 166943, "epoch": 3974} {"train_loss": -7.04466438293457, "global_step": 166944, "epoch": 3974} {"train_loss": -7.064231872558594, "global_step": 166945, "epoch": 3974} {"train_loss": -7.028001308441162, "global_step": 166946, "epoch": 3974} {"train_loss": -7.106675148010254, "global_step": 166947, "epoch": 3974} {"train_loss": -7.106029987335205, "global_step": 166948, "epoch": 3974} {"train_loss": -7.046030441919963, "global_step": 166949, "epoch": 3974, "val_loss": 79433.640625} {"train_loss": -7.110661506652832, "global_step": 166950, "epoch": 3975} {"train_loss": -7.039658069610596, "global_step": 166951, "epoch": 3975} {"train_loss": -7.069098472595215, "global_step": 166952, "epoch": 3975} {"train_loss": -7.104884147644043, "global_step": 166953, "epoch": 3975} {"train_loss": -7.009181022644043, "global_step": 166954, "epoch": 3975} {"train_loss": -7.139386177062988, "global_step": 166955, "epoch": 3975} {"train_loss": -6.923581123352051, "global_step": 166956, "epoch": 3975} {"train_loss": -7.129070281982422, "global_step": 166957, "epoch": 3975} {"train_loss": -7.024374485015869, "global_step": 166958, "epoch": 3975} {"train_loss": -7.000430583953857, "global_step": 166959, "epoch": 3975} {"train_loss": -7.070696830749512, "global_step": 166960, "epoch": 3975} {"train_loss": -7.0964555740356445, "global_step": 166961, "epoch": 3975} {"train_loss": -7.069877624511719, "global_step": 166962, "epoch": 3975} {"train_loss": -7.065691947937012, "global_step": 166963, "epoch": 3975} {"train_loss": -7.046457290649414, "global_step": 166964, "epoch": 3975} {"train_loss": -7.095628261566162, "global_step": 166965, "epoch": 3975} {"train_loss": -7.022677421569824, "global_step": 166966, "epoch": 3975} {"train_loss": -6.948042869567871, "global_step": 166967, "epoch": 3975} {"train_loss": -6.971529006958008, "global_step": 166968, "epoch": 3975} {"train_loss": -7.017032146453857, "global_step": 166969, "epoch": 3975} {"train_loss": -6.933645248413086, "global_step": 166970, "epoch": 3975} {"train_loss": -6.851017951965332, "global_step": 166971, "epoch": 3975} {"train_loss": -6.976436138153076, "global_step": 166972, "epoch": 3975} {"train_loss": -6.929169654846191, "global_step": 166973, "epoch": 3975} {"train_loss": -7.009716033935547, "global_step": 166974, "epoch": 3975} {"train_loss": -7.023504257202148, "global_step": 166975, "epoch": 3975} {"train_loss": -7.023188591003418, "global_step": 166976, "epoch": 3975} {"train_loss": -7.018582820892334, "global_step": 166977, "epoch": 3975} {"train_loss": -7.029643535614014, "global_step": 166978, "epoch": 3975} {"train_loss": -6.936553001403809, "global_step": 166979, "epoch": 3975} {"train_loss": -6.910257339477539, "global_step": 166980, "epoch": 3975} {"train_loss": -6.951339244842529, "global_step": 166981, "epoch": 3975} {"train_loss": -7.027961254119873, "global_step": 166982, "epoch": 3975} {"train_loss": -7.004458427429199, "global_step": 166983, "epoch": 3975} {"train_loss": -6.895802974700928, "global_step": 166984, "epoch": 3975} {"train_loss": -7.056878089904785, "global_step": 166985, "epoch": 3975} {"train_loss": -6.972002029418945, "global_step": 166986, "epoch": 3975} {"train_loss": -7.077149391174316, "global_step": 166987, "epoch": 3975} {"train_loss": -6.949605464935303, "global_step": 166988, "epoch": 3975} {"train_loss": -6.977039337158203, "global_step": 166989, "epoch": 3975} {"train_loss": -7.004435062408447, "global_step": 166990, "epoch": 3975} {"train_loss": -7.011502231870379, "global_step": 166991, "epoch": 3975, "val_loss": 79597.609375} {"train_loss": -7.004044532775879, "global_step": 166992, "epoch": 3976} {"train_loss": -7.0615949630737305, "global_step": 166993, "epoch": 3976} {"train_loss": -7.1201982498168945, "global_step": 166994, "epoch": 3976} {"train_loss": -6.9971418380737305, "global_step": 166995, "epoch": 3976} {"train_loss": -7.104857444763184, "global_step": 166996, "epoch": 3976} {"train_loss": -7.157487869262695, "global_step": 166997, "epoch": 3976} {"train_loss": -7.070713043212891, "global_step": 166998, "epoch": 3976} {"train_loss": -7.0596208572387695, "global_step": 166999, "epoch": 3976} {"train_loss": -6.938377380371094, "global_step": 167000, "epoch": 3976} {"train_loss": -7.136122226715088, "global_step": 167001, "epoch": 3976} {"train_loss": -7.081507682800293, "global_step": 167002, "epoch": 3976} {"train_loss": -6.9717206954956055, "global_step": 167003, "epoch": 3976} {"train_loss": -7.074353218078613, "global_step": 167004, "epoch": 3976} {"train_loss": -6.921652793884277, "global_step": 167005, "epoch": 3976} {"train_loss": -6.980053901672363, "global_step": 167006, "epoch": 3976} {"train_loss": -6.947544097900391, "global_step": 167007, "epoch": 3976} {"train_loss": -6.946413040161133, "global_step": 167008, "epoch": 3976} {"train_loss": -6.9798903465271, "global_step": 167009, "epoch": 3976} {"train_loss": -7.038774013519287, "global_step": 167010, "epoch": 3976} {"train_loss": -6.95210075378418, "global_step": 167011, "epoch": 3976} {"train_loss": -6.891819000244141, "global_step": 167012, "epoch": 3976} {"train_loss": -6.996595859527588, "global_step": 167013, "epoch": 3976} {"train_loss": -6.953073024749756, "global_step": 167014, "epoch": 3976} {"train_loss": -6.60888671875, "global_step": 167015, "epoch": 3976} {"train_loss": -6.883606433868408, "global_step": 167016, "epoch": 3976} {"train_loss": -7.009342670440674, "global_step": 167017, "epoch": 3976} {"train_loss": -6.680368423461914, "global_step": 167018, "epoch": 3976} {"train_loss": -6.986554145812988, "global_step": 167019, "epoch": 3976} {"train_loss": -6.665796279907227, "global_step": 167020, "epoch": 3976} {"train_loss": -6.853724479675293, "global_step": 167021, "epoch": 3976} {"train_loss": -6.812540054321289, "global_step": 167022, "epoch": 3976} {"train_loss": -6.790138244628906, "global_step": 167023, "epoch": 3976} {"train_loss": -6.7690277099609375, "global_step": 167024, "epoch": 3976} {"train_loss": -6.664511680603027, "global_step": 167025, "epoch": 3976} {"train_loss": -6.833260536193848, "global_step": 167026, "epoch": 3976} {"train_loss": -6.765321731567383, "global_step": 167027, "epoch": 3976} {"train_loss": -6.872385025024414, "global_step": 167028, "epoch": 3976} {"train_loss": -6.885868072509766, "global_step": 167029, "epoch": 3976} {"train_loss": -6.941656112670898, "global_step": 167030, "epoch": 3976} {"train_loss": -6.89493465423584, "global_step": 167031, "epoch": 3976} {"train_loss": -6.7572784423828125, "global_step": 167032, "epoch": 3976} {"train_loss": -6.926718087423415, "global_step": 167033, "epoch": 3976, "val_loss": 79764.0859375} {"train_loss": -6.8804121017456055, "global_step": 167034, "epoch": 3977} {"train_loss": -6.875038146972656, "global_step": 167035, "epoch": 3977} {"train_loss": -6.928962230682373, "global_step": 167036, "epoch": 3977} {"train_loss": -6.950467109680176, "global_step": 167037, "epoch": 3977} {"train_loss": -7.067841529846191, "global_step": 167038, "epoch": 3977} {"train_loss": -6.858244895935059, "global_step": 167039, "epoch": 3977} {"train_loss": -6.945080280303955, "global_step": 167040, "epoch": 3977} {"train_loss": -7.013490676879883, "global_step": 167041, "epoch": 3977} {"train_loss": -6.856145858764648, "global_step": 167042, "epoch": 3977} {"train_loss": -6.952901840209961, "global_step": 167043, "epoch": 3977} {"train_loss": -6.928159236907959, "global_step": 167044, "epoch": 3977} {"train_loss": -7.0467376708984375, "global_step": 167045, "epoch": 3977} {"train_loss": -7.025516510009766, "global_step": 167046, "epoch": 3977} {"train_loss": -7.038214683532715, "global_step": 167047, "epoch": 3977} {"train_loss": -6.968911170959473, "global_step": 167048, "epoch": 3977} {"train_loss": -7.072042465209961, "global_step": 167049, "epoch": 3977} {"train_loss": -6.927936553955078, "global_step": 167050, "epoch": 3977} {"train_loss": -6.999614715576172, "global_step": 167051, "epoch": 3977} {"train_loss": -6.9441704750061035, "global_step": 167052, "epoch": 3977} {"train_loss": -7.061551570892334, "global_step": 167053, "epoch": 3977} {"train_loss": -7.02169942855835, "global_step": 167054, "epoch": 3977} {"train_loss": -7.037662982940674, "global_step": 167055, "epoch": 3977} {"train_loss": -7.049984931945801, "global_step": 167056, "epoch": 3977} {"train_loss": -6.950193405151367, "global_step": 167057, "epoch": 3977} {"train_loss": -7.105775833129883, "global_step": 167058, "epoch": 3977} {"train_loss": -7.067289352416992, "global_step": 167059, "epoch": 3977} {"train_loss": -7.119080543518066, "global_step": 167060, "epoch": 3977} {"train_loss": -7.045077323913574, "global_step": 167061, "epoch": 3977} {"train_loss": -6.968869209289551, "global_step": 167062, "epoch": 3977} {"train_loss": -7.084484100341797, "global_step": 167063, "epoch": 3977} {"train_loss": -7.091221809387207, "global_step": 167064, "epoch": 3977} {"train_loss": -7.006845474243164, "global_step": 167065, "epoch": 3977} {"train_loss": -7.028505802154541, "global_step": 167066, "epoch": 3977} {"train_loss": -7.118551254272461, "global_step": 167067, "epoch": 3977} {"train_loss": -6.994894027709961, "global_step": 167068, "epoch": 3977} {"train_loss": -7.002546310424805, "global_step": 167069, "epoch": 3977} {"train_loss": -7.077608585357666, "global_step": 167070, "epoch": 3977} {"train_loss": -7.056457042694092, "global_step": 167071, "epoch": 3977} {"train_loss": -6.970022201538086, "global_step": 167072, "epoch": 3977} {"train_loss": -7.002727508544922, "global_step": 167073, "epoch": 3977} {"train_loss": -6.980132102966309, "global_step": 167074, "epoch": 3977} {"train_loss": -7.003855092184884, "global_step": 167075, "epoch": 3977, "val_loss": 79834.53125} {"train_loss": -6.990162372589111, "global_step": 167076, "epoch": 3978} {"train_loss": -6.942692756652832, "global_step": 167077, "epoch": 3978} {"train_loss": -7.198996543884277, "global_step": 167078, "epoch": 3978} {"train_loss": -7.097909927368164, "global_step": 167079, "epoch": 3978} {"train_loss": -6.915206432342529, "global_step": 167080, "epoch": 3978} {"train_loss": -7.073896884918213, "global_step": 167081, "epoch": 3978} {"train_loss": -7.032045364379883, "global_step": 167082, "epoch": 3978} {"train_loss": -6.999173641204834, "global_step": 167083, "epoch": 3978} {"train_loss": -7.080129146575928, "global_step": 167084, "epoch": 3978} {"train_loss": -7.01508903503418, "global_step": 167085, "epoch": 3978} {"train_loss": -6.945911407470703, "global_step": 167086, "epoch": 3978} {"train_loss": -7.002346038818359, "global_step": 167087, "epoch": 3978} {"train_loss": -7.067812919616699, "global_step": 167088, "epoch": 3978} {"train_loss": -6.964128494262695, "global_step": 167089, "epoch": 3978} {"train_loss": -7.0954389572143555, "global_step": 167090, "epoch": 3978} {"train_loss": -6.985901832580566, "global_step": 167091, "epoch": 3978} {"train_loss": -7.063328266143799, "global_step": 167092, "epoch": 3978} {"train_loss": -6.945133209228516, "global_step": 167093, "epoch": 3978} {"train_loss": -7.092780113220215, "global_step": 167094, "epoch": 3978} {"train_loss": -7.170919418334961, "global_step": 167095, "epoch": 3978} {"train_loss": -6.9385762214660645, "global_step": 167096, "epoch": 3978} {"train_loss": -7.08299446105957, "global_step": 167097, "epoch": 3978} {"train_loss": -7.049241542816162, "global_step": 167098, "epoch": 3978} {"train_loss": -7.123849868774414, "global_step": 167099, "epoch": 3978} {"train_loss": -7.051276206970215, "global_step": 167100, "epoch": 3978} {"train_loss": -6.944121837615967, "global_step": 167101, "epoch": 3978} {"train_loss": -6.956882476806641, "global_step": 167102, "epoch": 3978} {"train_loss": -7.025812149047852, "global_step": 167103, "epoch": 3978} {"train_loss": -6.9101715087890625, "global_step": 167104, "epoch": 3978} {"train_loss": -7.03990364074707, "global_step": 167105, "epoch": 3978} {"train_loss": -6.969686508178711, "global_step": 167106, "epoch": 3978} {"train_loss": -6.848001480102539, "global_step": 167107, "epoch": 3978} {"train_loss": -6.945130825042725, "global_step": 167108, "epoch": 3978} {"train_loss": -6.830051898956299, "global_step": 167109, "epoch": 3978} {"train_loss": -6.9563446044921875, "global_step": 167110, "epoch": 3978} {"train_loss": -6.93658447265625, "global_step": 167111, "epoch": 3978} {"train_loss": -6.965027809143066, "global_step": 167112, "epoch": 3978} {"train_loss": -6.929891586303711, "global_step": 167113, "epoch": 3978} {"train_loss": -6.947356224060059, "global_step": 167114, "epoch": 3978} {"train_loss": -7.067606449127197, "global_step": 167115, "epoch": 3978} {"train_loss": -6.991192817687988, "global_step": 167116, "epoch": 3978} {"train_loss": -7.004191693805513, "global_step": 167117, "epoch": 3978, "val_loss": 79691.3203125} {"train_loss": -6.95247220993042, "global_step": 167118, "epoch": 3979} {"train_loss": -7.042881011962891, "global_step": 167119, "epoch": 3979} {"train_loss": -7.05075740814209, "global_step": 167120, "epoch": 3979} {"train_loss": -6.992706298828125, "global_step": 167121, "epoch": 3979} {"train_loss": -6.99787712097168, "global_step": 167122, "epoch": 3979} {"train_loss": -7.069127082824707, "global_step": 167123, "epoch": 3979} {"train_loss": -7.147214889526367, "global_step": 167124, "epoch": 3979} {"train_loss": -7.000117301940918, "global_step": 167125, "epoch": 3979} {"train_loss": -6.981563568115234, "global_step": 167126, "epoch": 3979} {"train_loss": -7.011658668518066, "global_step": 167127, "epoch": 3979} {"train_loss": -7.0323166847229, "global_step": 167128, "epoch": 3979} {"train_loss": -7.0121612548828125, "global_step": 167129, "epoch": 3979} {"train_loss": -6.997649192810059, "global_step": 167130, "epoch": 3979} {"train_loss": -7.001196384429932, "global_step": 167131, "epoch": 3979} {"train_loss": -7.0698137283325195, "global_step": 167132, "epoch": 3979} {"train_loss": -7.151511192321777, "global_step": 167133, "epoch": 3979} {"train_loss": -7.061460494995117, "global_step": 167134, "epoch": 3979} {"train_loss": -6.999597072601318, "global_step": 167135, "epoch": 3979} {"train_loss": -6.956727027893066, "global_step": 167136, "epoch": 3979} {"train_loss": -7.085253715515137, "global_step": 167137, "epoch": 3979} {"train_loss": -6.909384727478027, "global_step": 167138, "epoch": 3979} {"train_loss": -6.998517990112305, "global_step": 167139, "epoch": 3979} {"train_loss": -7.094964504241943, "global_step": 167140, "epoch": 3979} {"train_loss": -7.043182373046875, "global_step": 167141, "epoch": 3979} {"train_loss": -7.101670742034912, "global_step": 167142, "epoch": 3979} {"train_loss": -7.00065803527832, "global_step": 167143, "epoch": 3979} {"train_loss": -7.010585784912109, "global_step": 167144, "epoch": 3979} {"train_loss": -7.091769218444824, "global_step": 167145, "epoch": 3979} {"train_loss": -6.951904773712158, "global_step": 167146, "epoch": 3979} {"train_loss": -7.010972023010254, "global_step": 167147, "epoch": 3979} {"train_loss": -7.031676292419434, "global_step": 167148, "epoch": 3979} {"train_loss": -6.907953262329102, "global_step": 167149, "epoch": 3979} {"train_loss": -7.014307022094727, "global_step": 167150, "epoch": 3979} {"train_loss": -7.064866065979004, "global_step": 167151, "epoch": 3979} {"train_loss": -6.888596534729004, "global_step": 167152, "epoch": 3979} {"train_loss": -7.147356986999512, "global_step": 167153, "epoch": 3979} {"train_loss": -6.919018745422363, "global_step": 167154, "epoch": 3979} {"train_loss": -6.877449989318848, "global_step": 167155, "epoch": 3979} {"train_loss": -6.951081275939941, "global_step": 167156, "epoch": 3979} {"train_loss": -6.916691303253174, "global_step": 167157, "epoch": 3979} {"train_loss": -7.012508869171143, "global_step": 167158, "epoch": 3979} {"train_loss": -7.01661813826788, "global_step": 167159, "epoch": 3979, "val_loss": 79639.6015625} {"train_loss": -7.003439426422119, "global_step": 167160, "epoch": 3980} {"train_loss": -6.946905136108398, "global_step": 167161, "epoch": 3980} {"train_loss": -7.008373260498047, "global_step": 167162, "epoch": 3980} {"train_loss": -6.973677635192871, "global_step": 167163, "epoch": 3980} {"train_loss": -7.106841087341309, "global_step": 167164, "epoch": 3980} {"train_loss": -7.042593002319336, "global_step": 167165, "epoch": 3980} {"train_loss": -7.035539627075195, "global_step": 167166, "epoch": 3980} {"train_loss": -7.030667304992676, "global_step": 167167, "epoch": 3980} {"train_loss": -7.007017135620117, "global_step": 167168, "epoch": 3980} {"train_loss": -7.041681289672852, "global_step": 167169, "epoch": 3980} {"train_loss": -7.043260097503662, "global_step": 167170, "epoch": 3980} {"train_loss": -7.1392364501953125, "global_step": 167171, "epoch": 3980} {"train_loss": -6.982970714569092, "global_step": 167172, "epoch": 3980} {"train_loss": -7.199178695678711, "global_step": 167173, "epoch": 3980} {"train_loss": -7.163486957550049, "global_step": 167174, "epoch": 3980} {"train_loss": -6.958307266235352, "global_step": 167175, "epoch": 3980} {"train_loss": -7.051572322845459, "global_step": 167176, "epoch": 3980} {"train_loss": -7.1382341384887695, "global_step": 167177, "epoch": 3980} {"train_loss": -6.999326705932617, "global_step": 167178, "epoch": 3980} {"train_loss": -7.04925012588501, "global_step": 167179, "epoch": 3980} {"train_loss": -7.077491760253906, "global_step": 167180, "epoch": 3980} {"train_loss": -7.098012447357178, "global_step": 167181, "epoch": 3980} {"train_loss": -7.041840553283691, "global_step": 167182, "epoch": 3980} {"train_loss": -7.1368865966796875, "global_step": 167183, "epoch": 3980} {"train_loss": -7.057333469390869, "global_step": 167184, "epoch": 3980} {"train_loss": -7.213631629943848, "global_step": 167185, "epoch": 3980} {"train_loss": -7.089378356933594, "global_step": 167186, "epoch": 3980} {"train_loss": -7.169524192810059, "global_step": 167187, "epoch": 3980} {"train_loss": -7.0979108810424805, "global_step": 167188, "epoch": 3980} {"train_loss": -7.181440353393555, "global_step": 167189, "epoch": 3980} {"train_loss": -7.026589870452881, "global_step": 167190, "epoch": 3980} {"train_loss": -6.873641490936279, "global_step": 167191, "epoch": 3980} {"train_loss": -7.050111293792725, "global_step": 167192, "epoch": 3980} {"train_loss": -7.085000514984131, "global_step": 167193, "epoch": 3980} {"train_loss": -7.07032585144043, "global_step": 167194, "epoch": 3980} {"train_loss": -7.050849914550781, "global_step": 167195, "epoch": 3980} {"train_loss": -7.076066970825195, "global_step": 167196, "epoch": 3980} {"train_loss": -6.953533172607422, "global_step": 167197, "epoch": 3980} {"train_loss": -7.095654487609863, "global_step": 167198, "epoch": 3980} {"train_loss": -7.097504615783691, "global_step": 167199, "epoch": 3980} {"train_loss": -7.041067123413086, "global_step": 167200, "epoch": 3980} {"train_loss": -7.061657269795735, "global_step": 167201, "epoch": 3980, "val_loss": 79744.6640625} {"train_loss": -7.156968116760254, "global_step": 167202, "epoch": 3981} {"train_loss": -7.1612749099731445, "global_step": 167203, "epoch": 3981} {"train_loss": -7.058389186859131, "global_step": 167204, "epoch": 3981} {"train_loss": -7.055414199829102, "global_step": 167205, "epoch": 3981} {"train_loss": -7.01733922958374, "global_step": 167206, "epoch": 3981} {"train_loss": -7.106608867645264, "global_step": 167207, "epoch": 3981} {"train_loss": -7.172179222106934, "global_step": 167208, "epoch": 3981} {"train_loss": -7.01564359664917, "global_step": 167209, "epoch": 3981} {"train_loss": -7.140636444091797, "global_step": 167210, "epoch": 3981} {"train_loss": -7.16776704788208, "global_step": 167211, "epoch": 3981} {"train_loss": -7.043913841247559, "global_step": 167212, "epoch": 3981} {"train_loss": -7.169476509094238, "global_step": 167213, "epoch": 3981} {"train_loss": -7.097052574157715, "global_step": 167214, "epoch": 3981} {"train_loss": -7.099415302276611, "global_step": 167215, "epoch": 3981} {"train_loss": -7.021272659301758, "global_step": 167216, "epoch": 3981} {"train_loss": -7.16035270690918, "global_step": 167217, "epoch": 3981} {"train_loss": -7.098100662231445, "global_step": 167218, "epoch": 3981} {"train_loss": -7.079811096191406, "global_step": 167219, "epoch": 3981} {"train_loss": -6.932184219360352, "global_step": 167220, "epoch": 3981} {"train_loss": -7.012497901916504, "global_step": 167221, "epoch": 3981} {"train_loss": -7.078946590423584, "global_step": 167222, "epoch": 3981} {"train_loss": -6.935857772827148, "global_step": 167223, "epoch": 3981} {"train_loss": -7.033079147338867, "global_step": 167224, "epoch": 3981} {"train_loss": -7.059758186340332, "global_step": 167225, "epoch": 3981} {"train_loss": -6.90830135345459, "global_step": 167226, "epoch": 3981} {"train_loss": -6.831186771392822, "global_step": 167227, "epoch": 3981} {"train_loss": -6.918638229370117, "global_step": 167228, "epoch": 3981} {"train_loss": -6.955397605895996, "global_step": 167229, "epoch": 3981} {"train_loss": -7.024893760681152, "global_step": 167230, "epoch": 3981} {"train_loss": -7.0380473136901855, "global_step": 167231, "epoch": 3981} {"train_loss": -7.027379512786865, "global_step": 167232, "epoch": 3981} {"train_loss": -6.994939804077148, "global_step": 167233, "epoch": 3981} {"train_loss": -6.993450164794922, "global_step": 167234, "epoch": 3981} {"train_loss": -7.024811267852783, "global_step": 167235, "epoch": 3981} {"train_loss": -6.897500991821289, "global_step": 167236, "epoch": 3981} {"train_loss": -7.01968240737915, "global_step": 167237, "epoch": 3981} {"train_loss": -6.90576171875, "global_step": 167238, "epoch": 3981} {"train_loss": -6.990422248840332, "global_step": 167239, "epoch": 3981} {"train_loss": -6.978111267089844, "global_step": 167240, "epoch": 3981} {"train_loss": -7.083148002624512, "global_step": 167241, "epoch": 3981} {"train_loss": -6.944497108459473, "global_step": 167242, "epoch": 3981} {"train_loss": -7.0343621004195445, "global_step": 167243, "epoch": 3981, "val_loss": 79490.453125} {"train_loss": -6.84173583984375, "global_step": 167244, "epoch": 3982} {"train_loss": -6.984708309173584, "global_step": 167245, "epoch": 3982} {"train_loss": -7.1075897216796875, "global_step": 167246, "epoch": 3982} {"train_loss": -6.89283561706543, "global_step": 167247, "epoch": 3982} {"train_loss": -6.881060600280762, "global_step": 167248, "epoch": 3982} {"train_loss": -7.038722991943359, "global_step": 167249, "epoch": 3982} {"train_loss": -7.163516521453857, "global_step": 167250, "epoch": 3982} {"train_loss": -6.9501729011535645, "global_step": 167251, "epoch": 3982} {"train_loss": -6.985450267791748, "global_step": 167252, "epoch": 3982} {"train_loss": -6.976665496826172, "global_step": 167253, "epoch": 3982} {"train_loss": -6.991034507751465, "global_step": 167254, "epoch": 3982} {"train_loss": -6.840641021728516, "global_step": 167255, "epoch": 3982} {"train_loss": -6.872464179992676, "global_step": 167256, "epoch": 3982} {"train_loss": -7.153835296630859, "global_step": 167257, "epoch": 3982} {"train_loss": -6.959441184997559, "global_step": 167258, "epoch": 3982} {"train_loss": -6.973423480987549, "global_step": 167259, "epoch": 3982} {"train_loss": -6.987372875213623, "global_step": 167260, "epoch": 3982} {"train_loss": -6.852031707763672, "global_step": 167261, "epoch": 3982} {"train_loss": -6.960187911987305, "global_step": 167262, "epoch": 3982} {"train_loss": -6.917428016662598, "global_step": 167263, "epoch": 3982} {"train_loss": -6.841281890869141, "global_step": 167264, "epoch": 3982} {"train_loss": -6.958131790161133, "global_step": 167265, "epoch": 3982} {"train_loss": -6.887328624725342, "global_step": 167266, "epoch": 3982} {"train_loss": -6.864780426025391, "global_step": 167267, "epoch": 3982} {"train_loss": -6.965404033660889, "global_step": 167268, "epoch": 3982} {"train_loss": -6.749439239501953, "global_step": 167269, "epoch": 3982} {"train_loss": -6.973932266235352, "global_step": 167270, "epoch": 3982} {"train_loss": -6.791956901550293, "global_step": 167271, "epoch": 3982} {"train_loss": -6.76898193359375, "global_step": 167272, "epoch": 3982} {"train_loss": -7.082831859588623, "global_step": 167273, "epoch": 3982} {"train_loss": -6.8609185218811035, "global_step": 167274, "epoch": 3982} {"train_loss": -6.8986077308654785, "global_step": 167275, "epoch": 3982} {"train_loss": -6.880352020263672, "global_step": 167276, "epoch": 3982} {"train_loss": -6.790003776550293, "global_step": 167277, "epoch": 3982} {"train_loss": -6.999943733215332, "global_step": 167278, "epoch": 3982} {"train_loss": -6.847375869750977, "global_step": 167279, "epoch": 3982} {"train_loss": -6.977810859680176, "global_step": 167280, "epoch": 3982} {"train_loss": -6.918848514556885, "global_step": 167281, "epoch": 3982} {"train_loss": -6.946903228759766, "global_step": 167282, "epoch": 3982} {"train_loss": -6.931362152099609, "global_step": 167283, "epoch": 3982} {"train_loss": -6.929174423217773, "global_step": 167284, "epoch": 3982} {"train_loss": -6.931575559434437, "global_step": 167285, "epoch": 3982, "val_loss": 79729.875} {"train_loss": -7.079678535461426, "global_step": 167286, "epoch": 3983} {"train_loss": -7.067300796508789, "global_step": 167287, "epoch": 3983} {"train_loss": -6.940515041351318, "global_step": 167288, "epoch": 3983} {"train_loss": -6.916103363037109, "global_step": 167289, "epoch": 3983} {"train_loss": -7.055310249328613, "global_step": 167290, "epoch": 3983} {"train_loss": -7.042758941650391, "global_step": 167291, "epoch": 3983} {"train_loss": -6.925770282745361, "global_step": 167292, "epoch": 3983} {"train_loss": -7.034232139587402, "global_step": 167293, "epoch": 3983} {"train_loss": -7.080333709716797, "global_step": 167294, "epoch": 3983} {"train_loss": -7.0552449226379395, "global_step": 167295, "epoch": 3983} {"train_loss": -6.931952953338623, "global_step": 167296, "epoch": 3983} {"train_loss": -6.981051445007324, "global_step": 167297, "epoch": 3983} {"train_loss": -6.975552558898926, "global_step": 167298, "epoch": 3983} {"train_loss": -6.942883491516113, "global_step": 167299, "epoch": 3983} {"train_loss": -6.9434685707092285, "global_step": 167300, "epoch": 3983} {"train_loss": -7.018955230712891, "global_step": 167301, "epoch": 3983} {"train_loss": -6.9163594245910645, "global_step": 167302, "epoch": 3983} {"train_loss": -6.869634628295898, "global_step": 167303, "epoch": 3983} {"train_loss": -6.879246234893799, "global_step": 167304, "epoch": 3983} {"train_loss": -7.035419464111328, "global_step": 167305, "epoch": 3983} {"train_loss": -7.0110182762146, "global_step": 167306, "epoch": 3983} {"train_loss": -6.94086217880249, "global_step": 167307, "epoch": 3983} {"train_loss": -6.996628761291504, "global_step": 167308, "epoch": 3983} {"train_loss": -6.928150177001953, "global_step": 167309, "epoch": 3983} {"train_loss": -6.943525791168213, "global_step": 167310, "epoch": 3983} {"train_loss": -7.02341365814209, "global_step": 167311, "epoch": 3983} {"train_loss": -6.93147087097168, "global_step": 167312, "epoch": 3983} {"train_loss": -7.075173854827881, "global_step": 167313, "epoch": 3983} {"train_loss": -7.051829814910889, "global_step": 167314, "epoch": 3983} {"train_loss": -7.125171661376953, "global_step": 167315, "epoch": 3983} {"train_loss": -7.121076583862305, "global_step": 167316, "epoch": 3983} {"train_loss": -7.182234764099121, "global_step": 167317, "epoch": 3983} {"train_loss": -7.052676677703857, "global_step": 167318, "epoch": 3983} {"train_loss": -7.0945963859558105, "global_step": 167319, "epoch": 3983} {"train_loss": -6.978259086608887, "global_step": 167320, "epoch": 3983} {"train_loss": -7.114093780517578, "global_step": 167321, "epoch": 3983} {"train_loss": -7.100647449493408, "global_step": 167322, "epoch": 3983} {"train_loss": -7.011209487915039, "global_step": 167323, "epoch": 3983} {"train_loss": -6.990004062652588, "global_step": 167324, "epoch": 3983} {"train_loss": -6.980445861816406, "global_step": 167325, "epoch": 3983} {"train_loss": -7.007750511169434, "global_step": 167326, "epoch": 3983} {"train_loss": -7.009060212544033, "global_step": 167327, "epoch": 3983, "val_loss": 79644.4453125} {"train_loss": -7.167119026184082, "global_step": 167328, "epoch": 3984} {"train_loss": -6.954887866973877, "global_step": 167329, "epoch": 3984} {"train_loss": -7.098749160766602, "global_step": 167330, "epoch": 3984} {"train_loss": -6.99074649810791, "global_step": 167331, "epoch": 3984} {"train_loss": -6.899078369140625, "global_step": 167332, "epoch": 3984} {"train_loss": -7.02055549621582, "global_step": 167333, "epoch": 3984} {"train_loss": -6.984831809997559, "global_step": 167334, "epoch": 3984} {"train_loss": -6.9672956466674805, "global_step": 167335, "epoch": 3984} {"train_loss": -7.008928298950195, "global_step": 167336, "epoch": 3984} {"train_loss": -6.99882173538208, "global_step": 167337, "epoch": 3984} {"train_loss": -7.0078349113464355, "global_step": 167338, "epoch": 3984} {"train_loss": -7.00616979598999, "global_step": 167339, "epoch": 3984} {"train_loss": -6.937358856201172, "global_step": 167340, "epoch": 3984} {"train_loss": -6.948894500732422, "global_step": 167341, "epoch": 3984} {"train_loss": -7.016457557678223, "global_step": 167342, "epoch": 3984} {"train_loss": -6.93865966796875, "global_step": 167343, "epoch": 3984} {"train_loss": -6.871754169464111, "global_step": 167344, "epoch": 3984} {"train_loss": -6.83013916015625, "global_step": 167345, "epoch": 3984} {"train_loss": -6.946533203125, "global_step": 167346, "epoch": 3984} {"train_loss": -6.841425895690918, "global_step": 167347, "epoch": 3984} {"train_loss": -6.923006057739258, "global_step": 167348, "epoch": 3984} {"train_loss": -6.873771667480469, "global_step": 167349, "epoch": 3984} {"train_loss": -6.831134796142578, "global_step": 167350, "epoch": 3984} {"train_loss": -7.026078224182129, "global_step": 167351, "epoch": 3984} {"train_loss": -6.931540489196777, "global_step": 167352, "epoch": 3984} {"train_loss": -6.967475891113281, "global_step": 167353, "epoch": 3984} {"train_loss": -6.963975429534912, "global_step": 167354, "epoch": 3984} {"train_loss": -6.874695777893066, "global_step": 167355, "epoch": 3984} {"train_loss": -6.995883941650391, "global_step": 167356, "epoch": 3984} {"train_loss": -6.873968124389648, "global_step": 167357, "epoch": 3984} {"train_loss": -6.976470947265625, "global_step": 167358, "epoch": 3984} {"train_loss": -6.945130825042725, "global_step": 167359, "epoch": 3984} {"train_loss": -7.031482696533203, "global_step": 167360, "epoch": 3984} {"train_loss": -6.968737602233887, "global_step": 167361, "epoch": 3984} {"train_loss": -6.903840065002441, "global_step": 167362, "epoch": 3984} {"train_loss": -7.025744438171387, "global_step": 167363, "epoch": 3984} {"train_loss": -6.964224815368652, "global_step": 167364, "epoch": 3984} {"train_loss": -7.057537078857422, "global_step": 167365, "epoch": 3984} {"train_loss": -6.899397850036621, "global_step": 167366, "epoch": 3984} {"train_loss": -7.050439834594727, "global_step": 167367, "epoch": 3984} {"train_loss": -7.025641441345215, "global_step": 167368, "epoch": 3984} {"train_loss": -6.964076541718983, "global_step": 167369, "epoch": 3984, "val_loss": 79831.9921875} {"train_loss": -6.936756134033203, "global_step": 167370, "epoch": 3985} {"train_loss": -7.07808780670166, "global_step": 167371, "epoch": 3985} {"train_loss": -6.966536521911621, "global_step": 167372, "epoch": 3985} {"train_loss": -7.004434585571289, "global_step": 167373, "epoch": 3985} {"train_loss": -6.95194673538208, "global_step": 167374, "epoch": 3985} {"train_loss": -6.948984146118164, "global_step": 167375, "epoch": 3985} {"train_loss": -7.144484519958496, "global_step": 167376, "epoch": 3985} {"train_loss": -7.024942398071289, "global_step": 167377, "epoch": 3985} {"train_loss": -7.0528340339660645, "global_step": 167378, "epoch": 3985} {"train_loss": -7.057854652404785, "global_step": 167379, "epoch": 3985} {"train_loss": -6.917959690093994, "global_step": 167380, "epoch": 3985} {"train_loss": -6.938450813293457, "global_step": 167381, "epoch": 3985} {"train_loss": -6.993839263916016, "global_step": 167382, "epoch": 3985} {"train_loss": -6.905912399291992, "global_step": 167383, "epoch": 3985} {"train_loss": -6.981645584106445, "global_step": 167384, "epoch": 3985} {"train_loss": -7.0671539306640625, "global_step": 167385, "epoch": 3985} {"train_loss": -7.09895133972168, "global_step": 167386, "epoch": 3985} {"train_loss": -7.0787763595581055, "global_step": 167387, "epoch": 3985} {"train_loss": -7.096338748931885, "global_step": 167388, "epoch": 3985} {"train_loss": -6.903587341308594, "global_step": 167389, "epoch": 3985} {"train_loss": -7.041429042816162, "global_step": 167390, "epoch": 3985} {"train_loss": -7.082021236419678, "global_step": 167391, "epoch": 3985} {"train_loss": -7.000853061676025, "global_step": 167392, "epoch": 3985} {"train_loss": -7.095668792724609, "global_step": 167393, "epoch": 3985} {"train_loss": -7.027932167053223, "global_step": 167394, "epoch": 3985} {"train_loss": -6.982419967651367, "global_step": 167395, "epoch": 3985} {"train_loss": -6.972533226013184, "global_step": 167396, "epoch": 3985} {"train_loss": -6.908638954162598, "global_step": 167397, "epoch": 3985} {"train_loss": -6.888497352600098, "global_step": 167398, "epoch": 3985} {"train_loss": -7.009566307067871, "global_step": 167399, "epoch": 3985} {"train_loss": -6.950437545776367, "global_step": 167400, "epoch": 3985} {"train_loss": -7.099038600921631, "global_step": 167401, "epoch": 3985} {"train_loss": -6.989609241485596, "global_step": 167402, "epoch": 3985} {"train_loss": -7.0570969581604, "global_step": 167403, "epoch": 3985} {"train_loss": -7.0219573974609375, "global_step": 167404, "epoch": 3985} {"train_loss": -7.046473503112793, "global_step": 167405, "epoch": 3985} {"train_loss": -7.118800163269043, "global_step": 167406, "epoch": 3985} {"train_loss": -6.943568229675293, "global_step": 167407, "epoch": 3985} {"train_loss": -6.912761688232422, "global_step": 167408, "epoch": 3985} {"train_loss": -7.1046671867370605, "global_step": 167409, "epoch": 3985} {"train_loss": -6.894598960876465, "global_step": 167410, "epoch": 3985} {"train_loss": -7.006878682545254, "global_step": 167411, "epoch": 3985, "val_loss": 79752.390625} {"train_loss": -7.050836086273193, "global_step": 167412, "epoch": 3986} {"train_loss": -7.026239395141602, "global_step": 167413, "epoch": 3986} {"train_loss": -7.036495208740234, "global_step": 167414, "epoch": 3986} {"train_loss": -7.121408462524414, "global_step": 167415, "epoch": 3986} {"train_loss": -6.977174758911133, "global_step": 167416, "epoch": 3986} {"train_loss": -7.07798957824707, "global_step": 167417, "epoch": 3986} {"train_loss": -7.0472283363342285, "global_step": 167418, "epoch": 3986} {"train_loss": -7.005286693572998, "global_step": 167419, "epoch": 3986} {"train_loss": -7.053794860839844, "global_step": 167420, "epoch": 3986} {"train_loss": -7.035388946533203, "global_step": 167421, "epoch": 3986} {"train_loss": -7.06284236907959, "global_step": 167422, "epoch": 3986} {"train_loss": -7.115165710449219, "global_step": 167423, "epoch": 3986} {"train_loss": -7.11003303527832, "global_step": 167424, "epoch": 3986} {"train_loss": -7.063085079193115, "global_step": 167425, "epoch": 3986} {"train_loss": -6.965553283691406, "global_step": 167426, "epoch": 3986} {"train_loss": -6.861611366271973, "global_step": 167427, "epoch": 3986} {"train_loss": -7.0093584060668945, "global_step": 167428, "epoch": 3986} {"train_loss": -7.113407135009766, "global_step": 167429, "epoch": 3986} {"train_loss": -7.20772647857666, "global_step": 167430, "epoch": 3986} {"train_loss": -7.117138862609863, "global_step": 167431, "epoch": 3986} {"train_loss": -7.101861476898193, "global_step": 167432, "epoch": 3986} {"train_loss": -7.021472930908203, "global_step": 167433, "epoch": 3986} {"train_loss": -7.120458602905273, "global_step": 167434, "epoch": 3986} {"train_loss": -7.156274795532227, "global_step": 167435, "epoch": 3986} {"train_loss": -7.0824432373046875, "global_step": 167436, "epoch": 3986} {"train_loss": -7.093563079833984, "global_step": 167437, "epoch": 3986} {"train_loss": -7.028048038482666, "global_step": 167438, "epoch": 3986} {"train_loss": -6.998135089874268, "global_step": 167439, "epoch": 3986} {"train_loss": -7.049732208251953, "global_step": 167440, "epoch": 3986} {"train_loss": -7.057395935058594, "global_step": 167441, "epoch": 3986} {"train_loss": -7.072705268859863, "global_step": 167442, "epoch": 3986} {"train_loss": -7.119161605834961, "global_step": 167443, "epoch": 3986} {"train_loss": -7.046806335449219, "global_step": 167444, "epoch": 3986} {"train_loss": -6.969721794128418, "global_step": 167445, "epoch": 3986} {"train_loss": -6.976282596588135, "global_step": 167446, "epoch": 3986} {"train_loss": -6.983218193054199, "global_step": 167447, "epoch": 3986} {"train_loss": -7.101476669311523, "global_step": 167448, "epoch": 3986} {"train_loss": -7.062252044677734, "global_step": 167449, "epoch": 3986} {"train_loss": -7.052397727966309, "global_step": 167450, "epoch": 3986} {"train_loss": -7.03665828704834, "global_step": 167451, "epoch": 3986} {"train_loss": -7.135259628295898, "global_step": 167452, "epoch": 3986} {"train_loss": -7.052830820991879, "global_step": 167453, "epoch": 3986, "val_loss": 79698.8203125} {"train_loss": -7.033634185791016, "global_step": 167454, "epoch": 3987} {"train_loss": -7.1345534324646, "global_step": 167455, "epoch": 3987} {"train_loss": -7.132308006286621, "global_step": 167456, "epoch": 3987} {"train_loss": -7.148555278778076, "global_step": 167457, "epoch": 3987} {"train_loss": -6.996241569519043, "global_step": 167458, "epoch": 3987} {"train_loss": -7.085699558258057, "global_step": 167459, "epoch": 3987} {"train_loss": -7.1624579429626465, "global_step": 167460, "epoch": 3987} {"train_loss": -7.0826616287231445, "global_step": 167461, "epoch": 3987} {"train_loss": -7.090963840484619, "global_step": 167462, "epoch": 3987} {"train_loss": -7.156124114990234, "global_step": 167463, "epoch": 3987} {"train_loss": -7.1312384605407715, "global_step": 167464, "epoch": 3987} {"train_loss": -7.108312129974365, "global_step": 167465, "epoch": 3987} {"train_loss": -7.055681228637695, "global_step": 167466, "epoch": 3987} {"train_loss": -7.118681907653809, "global_step": 167467, "epoch": 3987} {"train_loss": -7.043378829956055, "global_step": 167468, "epoch": 3987} {"train_loss": -7.089064598083496, "global_step": 167469, "epoch": 3987} {"train_loss": -7.012091636657715, "global_step": 167470, "epoch": 3987} {"train_loss": -7.162053108215332, "global_step": 167471, "epoch": 3987} {"train_loss": -7.00479793548584, "global_step": 167472, "epoch": 3987} {"train_loss": -7.02656888961792, "global_step": 167473, "epoch": 3987} {"train_loss": -7.0918169021606445, "global_step": 167474, "epoch": 3987} {"train_loss": -6.913531303405762, "global_step": 167475, "epoch": 3987} {"train_loss": -7.040566921234131, "global_step": 167476, "epoch": 3987} {"train_loss": -7.021903991699219, "global_step": 167477, "epoch": 3987} {"train_loss": -6.9697465896606445, "global_step": 167478, "epoch": 3987} {"train_loss": -7.006515979766846, "global_step": 167479, "epoch": 3987} {"train_loss": -6.901754856109619, "global_step": 167480, "epoch": 3987} {"train_loss": -6.990034103393555, "global_step": 167481, "epoch": 3987} {"train_loss": -7.10243034362793, "global_step": 167482, "epoch": 3987} {"train_loss": -6.947768211364746, "global_step": 167483, "epoch": 3987} {"train_loss": -6.894066333770752, "global_step": 167484, "epoch": 3987} {"train_loss": -6.989758491516113, "global_step": 167485, "epoch": 3987} {"train_loss": -6.98362922668457, "global_step": 167486, "epoch": 3987} {"train_loss": -6.95761775970459, "global_step": 167487, "epoch": 3987} {"train_loss": -6.82802677154541, "global_step": 167488, "epoch": 3987} {"train_loss": -6.981016159057617, "global_step": 167489, "epoch": 3987} {"train_loss": -6.956005573272705, "global_step": 167490, "epoch": 3987} {"train_loss": -6.952866077423096, "global_step": 167491, "epoch": 3987} {"train_loss": -6.907625198364258, "global_step": 167492, "epoch": 3987} {"train_loss": -7.028714656829834, "global_step": 167493, "epoch": 3987} {"train_loss": -7.079581260681152, "global_step": 167494, "epoch": 3987} {"train_loss": -7.031349102656047, "global_step": 167495, "epoch": 3987, "val_loss": 79671.7734375} {"train_loss": -7.037886619567871, "global_step": 167496, "epoch": 3988} {"train_loss": -7.04533052444458, "global_step": 167497, "epoch": 3988} {"train_loss": -7.1068572998046875, "global_step": 167498, "epoch": 3988} {"train_loss": -7.0628662109375, "global_step": 167499, "epoch": 3988} {"train_loss": -7.095498085021973, "global_step": 167500, "epoch": 3988} {"train_loss": -7.062811851501465, "global_step": 167501, "epoch": 3988} {"train_loss": -7.076930046081543, "global_step": 167502, "epoch": 3988} {"train_loss": -7.051413536071777, "global_step": 167503, "epoch": 3988} {"train_loss": -7.051627159118652, "global_step": 167504, "epoch": 3988} {"train_loss": -7.069609642028809, "global_step": 167505, "epoch": 3988} {"train_loss": -6.9919023513793945, "global_step": 167506, "epoch": 3988} {"train_loss": -7.063645362854004, "global_step": 167507, "epoch": 3988} {"train_loss": -7.036762714385986, "global_step": 167508, "epoch": 3988} {"train_loss": -7.084907531738281, "global_step": 167509, "epoch": 3988} {"train_loss": -7.075798511505127, "global_step": 167510, "epoch": 3988} {"train_loss": -6.9843597412109375, "global_step": 167511, "epoch": 3988} {"train_loss": -6.94509220123291, "global_step": 167512, "epoch": 3988} {"train_loss": -7.067811012268066, "global_step": 167513, "epoch": 3988} {"train_loss": -7.0114850997924805, "global_step": 167514, "epoch": 3988} {"train_loss": -7.053765773773193, "global_step": 167515, "epoch": 3988} {"train_loss": -7.086104393005371, "global_step": 167516, "epoch": 3988} {"train_loss": -7.117162704467773, "global_step": 167517, "epoch": 3988} {"train_loss": -7.067774772644043, "global_step": 167518, "epoch": 3988} {"train_loss": -7.124129772186279, "global_step": 167519, "epoch": 3988} {"train_loss": -7.002278804779053, "global_step": 167520, "epoch": 3988} {"train_loss": -7.016365051269531, "global_step": 167521, "epoch": 3988} {"train_loss": -7.105093955993652, "global_step": 167522, "epoch": 3988} {"train_loss": -7.021903038024902, "global_step": 167523, "epoch": 3988} {"train_loss": -7.082518577575684, "global_step": 167524, "epoch": 3988} {"train_loss": -6.906394958496094, "global_step": 167525, "epoch": 3988} {"train_loss": -7.017216682434082, "global_step": 167526, "epoch": 3988} {"train_loss": -7.012059211730957, "global_step": 167527, "epoch": 3988} {"train_loss": -7.088907241821289, "global_step": 167528, "epoch": 3988} {"train_loss": -7.048398971557617, "global_step": 167529, "epoch": 3988} {"train_loss": -7.032185077667236, "global_step": 167530, "epoch": 3988} {"train_loss": -6.962429046630859, "global_step": 167531, "epoch": 3988} {"train_loss": -7.085935592651367, "global_step": 167532, "epoch": 3988} {"train_loss": -7.00297737121582, "global_step": 167533, "epoch": 3988} {"train_loss": -6.8330254554748535, "global_step": 167534, "epoch": 3988} {"train_loss": -6.99810791015625, "global_step": 167535, "epoch": 3988} {"train_loss": -6.963573932647705, "global_step": 167536, "epoch": 3988} {"train_loss": -7.0359885692596436, "global_step": 167537, "epoch": 3988, "val_loss": 79505.2890625} {"train_loss": -7.053247451782227, "global_step": 167538, "epoch": 3989} {"train_loss": -6.923404693603516, "global_step": 167539, "epoch": 3989} {"train_loss": -6.956174373626709, "global_step": 167540, "epoch": 3989} {"train_loss": -6.929971694946289, "global_step": 167541, "epoch": 3989} {"train_loss": -6.925786018371582, "global_step": 167542, "epoch": 3989} {"train_loss": -6.904513835906982, "global_step": 167543, "epoch": 3989} {"train_loss": -6.986136436462402, "global_step": 167544, "epoch": 3989} {"train_loss": -6.989415168762207, "global_step": 167545, "epoch": 3989} {"train_loss": -6.97330379486084, "global_step": 167546, "epoch": 3989} {"train_loss": -6.985776901245117, "global_step": 167547, "epoch": 3989} {"train_loss": -7.043669700622559, "global_step": 167548, "epoch": 3989} {"train_loss": -7.022031784057617, "global_step": 167549, "epoch": 3989} {"train_loss": -6.916909694671631, "global_step": 167550, "epoch": 3989} {"train_loss": -7.042363166809082, "global_step": 167551, "epoch": 3989} {"train_loss": -6.896875858306885, "global_step": 167552, "epoch": 3989} {"train_loss": -6.9191412925720215, "global_step": 167553, "epoch": 3989} {"train_loss": -7.0314555168151855, "global_step": 167554, "epoch": 3989} {"train_loss": -6.8606367111206055, "global_step": 167555, "epoch": 3989} {"train_loss": -6.97529411315918, "global_step": 167556, "epoch": 3989} {"train_loss": -6.814123153686523, "global_step": 167557, "epoch": 3989} {"train_loss": -6.981139183044434, "global_step": 167558, "epoch": 3989} {"train_loss": -6.865251541137695, "global_step": 167559, "epoch": 3989} {"train_loss": -6.8165435791015625, "global_step": 167560, "epoch": 3989} {"train_loss": -6.999168872833252, "global_step": 167561, "epoch": 3989} {"train_loss": -6.740490436553955, "global_step": 167562, "epoch": 3989} {"train_loss": -6.828181743621826, "global_step": 167563, "epoch": 3989} {"train_loss": -6.624634742736816, "global_step": 167564, "epoch": 3989} {"train_loss": -6.937012195587158, "global_step": 167565, "epoch": 3989} {"train_loss": -6.79849910736084, "global_step": 167566, "epoch": 3989} {"train_loss": -6.892519474029541, "global_step": 167567, "epoch": 3989} {"train_loss": -6.963613986968994, "global_step": 167568, "epoch": 3989} {"train_loss": -6.834861755371094, "global_step": 167569, "epoch": 3989} {"train_loss": -6.969980239868164, "global_step": 167570, "epoch": 3989} {"train_loss": -6.879169464111328, "global_step": 167571, "epoch": 3989} {"train_loss": -6.987174987792969, "global_step": 167572, "epoch": 3989} {"train_loss": -6.8399505615234375, "global_step": 167573, "epoch": 3989} {"train_loss": -6.886120796203613, "global_step": 167574, "epoch": 3989} {"train_loss": -6.935140609741211, "global_step": 167575, "epoch": 3989} {"train_loss": -6.944789886474609, "global_step": 167576, "epoch": 3989} {"train_loss": -6.87431526184082, "global_step": 167577, "epoch": 3989} {"train_loss": -7.062837600708008, "global_step": 167578, "epoch": 3989} {"train_loss": -6.922780456997099, "global_step": 167579, "epoch": 3989, "val_loss": 79739.3359375} {"train_loss": -6.866196632385254, "global_step": 167580, "epoch": 3990} {"train_loss": -6.992893218994141, "global_step": 167581, "epoch": 3990} {"train_loss": -6.8914618492126465, "global_step": 167582, "epoch": 3990} {"train_loss": -7.03684139251709, "global_step": 167583, "epoch": 3990} {"train_loss": -6.974409580230713, "global_step": 167584, "epoch": 3990} {"train_loss": -6.9581451416015625, "global_step": 167585, "epoch": 3990} {"train_loss": -7.023448944091797, "global_step": 167586, "epoch": 3990} {"train_loss": -6.927037715911865, "global_step": 167587, "epoch": 3990} {"train_loss": -6.992721080780029, "global_step": 167588, "epoch": 3990} {"train_loss": -7.040477752685547, "global_step": 167589, "epoch": 3990} {"train_loss": -7.067948818206787, "global_step": 167590, "epoch": 3990} {"train_loss": -6.927608966827393, "global_step": 167591, "epoch": 3990} {"train_loss": -6.896151542663574, "global_step": 167592, "epoch": 3990} {"train_loss": -7.081562042236328, "global_step": 167593, "epoch": 3990} {"train_loss": -6.962977409362793, "global_step": 167594, "epoch": 3990} {"train_loss": -7.078538417816162, "global_step": 167595, "epoch": 3990} {"train_loss": -7.054347991943359, "global_step": 167596, "epoch": 3990} {"train_loss": -6.919560432434082, "global_step": 167597, "epoch": 3990} {"train_loss": -6.971288681030273, "global_step": 167598, "epoch": 3990} {"train_loss": -6.9576096534729, "global_step": 167599, "epoch": 3990} {"train_loss": -6.844994068145752, "global_step": 167600, "epoch": 3990} {"train_loss": -6.83949089050293, "global_step": 167601, "epoch": 3990} {"train_loss": -6.947230815887451, "global_step": 167602, "epoch": 3990} {"train_loss": -6.905115127563477, "global_step": 167603, "epoch": 3990} {"train_loss": -7.039098739624023, "global_step": 167604, "epoch": 3990} {"train_loss": -7.088048934936523, "global_step": 167605, "epoch": 3990} {"train_loss": -6.914132118225098, "global_step": 167606, "epoch": 3990} {"train_loss": -6.8535356521606445, "global_step": 167607, "epoch": 3990} {"train_loss": -6.996393203735352, "global_step": 167608, "epoch": 3990} {"train_loss": -6.988565444946289, "global_step": 167609, "epoch": 3990} {"train_loss": -7.01876163482666, "global_step": 167610, "epoch": 3990} {"train_loss": -6.911457538604736, "global_step": 167611, "epoch": 3990} {"train_loss": -6.986523628234863, "global_step": 167612, "epoch": 3990} {"train_loss": -6.8134002685546875, "global_step": 167613, "epoch": 3990} {"train_loss": -7.043879508972168, "global_step": 167614, "epoch": 3990} {"train_loss": -6.968580722808838, "global_step": 167615, "epoch": 3990} {"train_loss": -7.01220703125, "global_step": 167616, "epoch": 3990} {"train_loss": -6.992222785949707, "global_step": 167617, "epoch": 3990} {"train_loss": -6.910339832305908, "global_step": 167618, "epoch": 3990} {"train_loss": -6.908499240875244, "global_step": 167619, "epoch": 3990} {"train_loss": -6.877932071685791, "global_step": 167620, "epoch": 3990} {"train_loss": -6.965617236636934, "global_step": 167621, "epoch": 3990, "val_loss": 79946.234375} {"train_loss": -7.113182544708252, "global_step": 167622, "epoch": 3991} {"train_loss": -6.978740692138672, "global_step": 167623, "epoch": 3991} {"train_loss": -6.918055534362793, "global_step": 167624, "epoch": 3991} {"train_loss": -7.033376216888428, "global_step": 167625, "epoch": 3991} {"train_loss": -6.959773063659668, "global_step": 167626, "epoch": 3991} {"train_loss": -6.914813995361328, "global_step": 167627, "epoch": 3991} {"train_loss": -7.098516941070557, "global_step": 167628, "epoch": 3991} {"train_loss": -7.057453155517578, "global_step": 167629, "epoch": 3991} {"train_loss": -7.069698333740234, "global_step": 167630, "epoch": 3991} {"train_loss": -6.919285774230957, "global_step": 167631, "epoch": 3991} {"train_loss": -7.109841346740723, "global_step": 167632, "epoch": 3991} {"train_loss": -7.089749336242676, "global_step": 167633, "epoch": 3991} {"train_loss": -7.099216461181641, "global_step": 167634, "epoch": 3991} {"train_loss": -7.014081001281738, "global_step": 167635, "epoch": 3991} {"train_loss": -7.070876121520996, "global_step": 167636, "epoch": 3991} {"train_loss": -7.103915214538574, "global_step": 167637, "epoch": 3991} {"train_loss": -7.067468166351318, "global_step": 167638, "epoch": 3991} {"train_loss": -7.021437168121338, "global_step": 167639, "epoch": 3991} {"train_loss": -7.07658576965332, "global_step": 167640, "epoch": 3991} {"train_loss": -7.146603107452393, "global_step": 167641, "epoch": 3991} {"train_loss": -6.964405059814453, "global_step": 167642, "epoch": 3991} {"train_loss": -7.071744918823242, "global_step": 167643, "epoch": 3991} {"train_loss": -7.078791618347168, "global_step": 167644, "epoch": 3991} {"train_loss": -7.069674491882324, "global_step": 167645, "epoch": 3991} {"train_loss": -7.016575813293457, "global_step": 167646, "epoch": 3991} {"train_loss": -7.0669450759887695, "global_step": 167647, "epoch": 3991} {"train_loss": -6.987449645996094, "global_step": 167648, "epoch": 3991} {"train_loss": -7.140767574310303, "global_step": 167649, "epoch": 3991} {"train_loss": -6.953092575073242, "global_step": 167650, "epoch": 3991} {"train_loss": -6.9128193855285645, "global_step": 167651, "epoch": 3991} {"train_loss": -7.051763534545898, "global_step": 167652, "epoch": 3991} {"train_loss": -7.027695655822754, "global_step": 167653, "epoch": 3991} {"train_loss": -7.1357808113098145, "global_step": 167654, "epoch": 3991} {"train_loss": -7.019845962524414, "global_step": 167655, "epoch": 3991} {"train_loss": -6.916330337524414, "global_step": 167656, "epoch": 3991} {"train_loss": -7.051025390625, "global_step": 167657, "epoch": 3991} {"train_loss": -6.964256763458252, "global_step": 167658, "epoch": 3991} {"train_loss": -7.024948596954346, "global_step": 167659, "epoch": 3991} {"train_loss": -7.081755638122559, "global_step": 167660, "epoch": 3991} {"train_loss": -6.990653038024902, "global_step": 167661, "epoch": 3991} {"train_loss": -7.061701774597168, "global_step": 167662, "epoch": 3991} {"train_loss": -7.03374813851856, "global_step": 167663, "epoch": 3991, "val_loss": 79704.875} {"train_loss": -7.0667405128479, "global_step": 167664, "epoch": 3992} {"train_loss": -7.073939323425293, "global_step": 167665, "epoch": 3992} {"train_loss": -7.055248260498047, "global_step": 167666, "epoch": 3992} {"train_loss": -7.030351638793945, "global_step": 167667, "epoch": 3992} {"train_loss": -7.040342807769775, "global_step": 167668, "epoch": 3992} {"train_loss": -7.030750274658203, "global_step": 167669, "epoch": 3992} {"train_loss": -7.063912391662598, "global_step": 167670, "epoch": 3992} {"train_loss": -7.036993026733398, "global_step": 167671, "epoch": 3992} {"train_loss": -7.053164482116699, "global_step": 167672, "epoch": 3992} {"train_loss": -6.9914326667785645, "global_step": 167673, "epoch": 3992} {"train_loss": -7.107839107513428, "global_step": 167674, "epoch": 3992} {"train_loss": -7.051337242126465, "global_step": 167675, "epoch": 3992} {"train_loss": -7.077888488769531, "global_step": 167676, "epoch": 3992} {"train_loss": -7.014239311218262, "global_step": 167677, "epoch": 3992} {"train_loss": -6.936892032623291, "global_step": 167678, "epoch": 3992} {"train_loss": -7.161487579345703, "global_step": 167679, "epoch": 3992} {"train_loss": -7.072595596313477, "global_step": 167680, "epoch": 3992} {"train_loss": -6.981876373291016, "global_step": 167681, "epoch": 3992} {"train_loss": -7.065737724304199, "global_step": 167682, "epoch": 3992} {"train_loss": -7.084080696105957, "global_step": 167683, "epoch": 3992} {"train_loss": -7.016443729400635, "global_step": 167684, "epoch": 3992} {"train_loss": -6.903936386108398, "global_step": 167685, "epoch": 3992} {"train_loss": -7.089590072631836, "global_step": 167686, "epoch": 3992} {"train_loss": -6.966041088104248, "global_step": 167687, "epoch": 3992} {"train_loss": -6.913994312286377, "global_step": 167688, "epoch": 3992} {"train_loss": -6.952781677246094, "global_step": 167689, "epoch": 3992} {"train_loss": -7.0071702003479, "global_step": 167690, "epoch": 3992} {"train_loss": -7.0821638107299805, "global_step": 167691, "epoch": 3992} {"train_loss": -6.913466453552246, "global_step": 167692, "epoch": 3992} {"train_loss": -7.034610748291016, "global_step": 167693, "epoch": 3992} {"train_loss": -7.075296401977539, "global_step": 167694, "epoch": 3992} {"train_loss": -6.982349872589111, "global_step": 167695, "epoch": 3992} {"train_loss": -6.886882781982422, "global_step": 167696, "epoch": 3992} {"train_loss": -6.859529495239258, "global_step": 167697, "epoch": 3992} {"train_loss": -7.09384822845459, "global_step": 167698, "epoch": 3992} {"train_loss": -6.9824347496032715, "global_step": 167699, "epoch": 3992} {"train_loss": -7.067406177520752, "global_step": 167700, "epoch": 3992} {"train_loss": -6.9066619873046875, "global_step": 167701, "epoch": 3992} {"train_loss": -7.079507827758789, "global_step": 167702, "epoch": 3992} {"train_loss": -6.985199928283691, "global_step": 167703, "epoch": 3992} {"train_loss": -7.1387200355529785, "global_step": 167704, "epoch": 3992} {"train_loss": -7.022636663346064, "global_step": 167705, "epoch": 3992, "val_loss": 79524.171875} {"train_loss": -6.964798927307129, "global_step": 167706, "epoch": 3993} {"train_loss": -7.002089500427246, "global_step": 167707, "epoch": 3993} {"train_loss": -7.197262287139893, "global_step": 167708, "epoch": 3993} {"train_loss": -7.026413917541504, "global_step": 167709, "epoch": 3993} {"train_loss": -7.02357292175293, "global_step": 167710, "epoch": 3993} {"train_loss": -7.0086870193481445, "global_step": 167711, "epoch": 3993} {"train_loss": -6.984533309936523, "global_step": 167712, "epoch": 3993} {"train_loss": -6.995068550109863, "global_step": 167713, "epoch": 3993} {"train_loss": -7.0371856689453125, "global_step": 167714, "epoch": 3993} {"train_loss": -6.975797653198242, "global_step": 167715, "epoch": 3993} {"train_loss": -7.050589561462402, "global_step": 167716, "epoch": 3993} {"train_loss": -7.023914813995361, "global_step": 167717, "epoch": 3993} {"train_loss": -6.902140140533447, "global_step": 167718, "epoch": 3993} {"train_loss": -7.098235130310059, "global_step": 167719, "epoch": 3993} {"train_loss": -6.94956111907959, "global_step": 167720, "epoch": 3993} {"train_loss": -7.082823753356934, "global_step": 167721, "epoch": 3993} {"train_loss": -7.008217811584473, "global_step": 167722, "epoch": 3993} {"train_loss": -6.952005863189697, "global_step": 167723, "epoch": 3993} {"train_loss": -7.0508317947387695, "global_step": 167724, "epoch": 3993} {"train_loss": -6.98286247253418, "global_step": 167725, "epoch": 3993} {"train_loss": -7.043627738952637, "global_step": 167726, "epoch": 3993} {"train_loss": -7.050027847290039, "global_step": 167727, "epoch": 3993} {"train_loss": -6.962591171264648, "global_step": 167728, "epoch": 3993} {"train_loss": -7.000165939331055, "global_step": 167729, "epoch": 3993} {"train_loss": -7.10546350479126, "global_step": 167730, "epoch": 3993} {"train_loss": -6.9840545654296875, "global_step": 167731, "epoch": 3993} {"train_loss": -7.0576372146606445, "global_step": 167732, "epoch": 3993} {"train_loss": -7.1112470626831055, "global_step": 167733, "epoch": 3993} {"train_loss": -7.097395420074463, "global_step": 167734, "epoch": 3993} {"train_loss": -6.993587493896484, "global_step": 167735, "epoch": 3993} {"train_loss": -6.996250152587891, "global_step": 167736, "epoch": 3993} {"train_loss": -7.1419806480407715, "global_step": 167737, "epoch": 3993} {"train_loss": -7.144474506378174, "global_step": 167738, "epoch": 3993} {"train_loss": -7.163471698760986, "global_step": 167739, "epoch": 3993} {"train_loss": -7.081436634063721, "global_step": 167740, "epoch": 3993} {"train_loss": -7.0609846115112305, "global_step": 167741, "epoch": 3993} {"train_loss": -6.983619689941406, "global_step": 167742, "epoch": 3993} {"train_loss": -7.0986809730529785, "global_step": 167743, "epoch": 3993} {"train_loss": -7.051797866821289, "global_step": 167744, "epoch": 3993} {"train_loss": -7.040284633636475, "global_step": 167745, "epoch": 3993} {"train_loss": -6.997098922729492, "global_step": 167746, "epoch": 3993} {"train_loss": -7.034609851383028, "global_step": 167747, "epoch": 3993, "val_loss": 79644.8359375} {"train_loss": -7.116543292999268, "global_step": 167748, "epoch": 3994} {"train_loss": -7.013276100158691, "global_step": 167749, "epoch": 3994} {"train_loss": -7.0740509033203125, "global_step": 167750, "epoch": 3994} {"train_loss": -7.0687031745910645, "global_step": 167751, "epoch": 3994} {"train_loss": -7.209296226501465, "global_step": 167752, "epoch": 3994} {"train_loss": -7.09572696685791, "global_step": 167753, "epoch": 3994} {"train_loss": -7.084036827087402, "global_step": 167754, "epoch": 3994} {"train_loss": -7.004751682281494, "global_step": 167755, "epoch": 3994} {"train_loss": -7.032235145568848, "global_step": 167756, "epoch": 3994} {"train_loss": -6.953478813171387, "global_step": 167757, "epoch": 3994} {"train_loss": -7.161517143249512, "global_step": 167758, "epoch": 3994} {"train_loss": -6.962918281555176, "global_step": 167759, "epoch": 3994} {"train_loss": -6.9104509353637695, "global_step": 167760, "epoch": 3994} {"train_loss": -7.096714496612549, "global_step": 167761, "epoch": 3994} {"train_loss": -6.959378242492676, "global_step": 167762, "epoch": 3994} {"train_loss": -6.999562740325928, "global_step": 167763, "epoch": 3994} {"train_loss": -6.850471496582031, "global_step": 167764, "epoch": 3994} {"train_loss": -6.949212074279785, "global_step": 167765, "epoch": 3994} {"train_loss": -6.878460884094238, "global_step": 167766, "epoch": 3994} {"train_loss": -6.992602348327637, "global_step": 167767, "epoch": 3994} {"train_loss": -6.859767436981201, "global_step": 167768, "epoch": 3994} {"train_loss": -6.965747833251953, "global_step": 167769, "epoch": 3994} {"train_loss": -7.017665386199951, "global_step": 167770, "epoch": 3994} {"train_loss": -6.876583576202393, "global_step": 167771, "epoch": 3994} {"train_loss": -6.998234272003174, "global_step": 167772, "epoch": 3994} {"train_loss": -6.933370590209961, "global_step": 167773, "epoch": 3994} {"train_loss": -7.017940998077393, "global_step": 167774, "epoch": 3994} {"train_loss": -6.957880020141602, "global_step": 167775, "epoch": 3994} {"train_loss": -6.978680610656738, "global_step": 167776, "epoch": 3994} {"train_loss": -7.106204986572266, "global_step": 167777, "epoch": 3994} {"train_loss": -7.002715587615967, "global_step": 167778, "epoch": 3994} {"train_loss": -6.913845062255859, "global_step": 167779, "epoch": 3994} {"train_loss": -6.944955825805664, "global_step": 167780, "epoch": 3994} {"train_loss": -7.02302360534668, "global_step": 167781, "epoch": 3994} {"train_loss": -6.991480827331543, "global_step": 167782, "epoch": 3994} {"train_loss": -6.9069037437438965, "global_step": 167783, "epoch": 3994} {"train_loss": -7.066035270690918, "global_step": 167784, "epoch": 3994} {"train_loss": -6.921931743621826, "global_step": 167785, "epoch": 3994} {"train_loss": -6.933069229125977, "global_step": 167786, "epoch": 3994} {"train_loss": -6.938043117523193, "global_step": 167787, "epoch": 3994} {"train_loss": -7.000777244567871, "global_step": 167788, "epoch": 3994} {"train_loss": -6.994061208906627, "global_step": 167789, "epoch": 3994, "val_loss": 79465.3203125} {"train_loss": -6.958401203155518, "global_step": 167790, "epoch": 3995} {"train_loss": -7.071023464202881, "global_step": 167791, "epoch": 3995} {"train_loss": -7.056118965148926, "global_step": 167792, "epoch": 3995} {"train_loss": -7.0430169105529785, "global_step": 167793, "epoch": 3995} {"train_loss": -7.115171432495117, "global_step": 167794, "epoch": 3995} {"train_loss": -6.985969543457031, "global_step": 167795, "epoch": 3995} {"train_loss": -7.047738075256348, "global_step": 167796, "epoch": 3995} {"train_loss": -6.873229503631592, "global_step": 167797, "epoch": 3995} {"train_loss": -6.9728288650512695, "global_step": 167798, "epoch": 3995} {"train_loss": -6.9926438331604, "global_step": 167799, "epoch": 3995} {"train_loss": -7.034955978393555, "global_step": 167800, "epoch": 3995} {"train_loss": -7.068058013916016, "global_step": 167801, "epoch": 3995} {"train_loss": -7.078194618225098, "global_step": 167802, "epoch": 3995} {"train_loss": -7.004268646240234, "global_step": 167803, "epoch": 3995} {"train_loss": -6.987346649169922, "global_step": 167804, "epoch": 3995} {"train_loss": -7.08293342590332, "global_step": 167805, "epoch": 3995} {"train_loss": -7.207999229431152, "global_step": 167806, "epoch": 3995} {"train_loss": -7.075355529785156, "global_step": 167807, "epoch": 3995} {"train_loss": -7.056215286254883, "global_step": 167808, "epoch": 3995} {"train_loss": -7.01969575881958, "global_step": 167809, "epoch": 3995} {"train_loss": -7.04646110534668, "global_step": 167810, "epoch": 3995} {"train_loss": -7.001384735107422, "global_step": 167811, "epoch": 3995} {"train_loss": -7.075872421264648, "global_step": 167812, "epoch": 3995} {"train_loss": -7.103856086730957, "global_step": 167813, "epoch": 3995} {"train_loss": -6.8198652267456055, "global_step": 167814, "epoch": 3995} {"train_loss": -6.992267608642578, "global_step": 167815, "epoch": 3995} {"train_loss": -7.037618160247803, "global_step": 167816, "epoch": 3995} {"train_loss": -7.056123733520508, "global_step": 167817, "epoch": 3995} {"train_loss": -6.8526201248168945, "global_step": 167818, "epoch": 3995} {"train_loss": -6.984786033630371, "global_step": 167819, "epoch": 3995} {"train_loss": -6.850157260894775, "global_step": 167820, "epoch": 3995} {"train_loss": -7.012090682983398, "global_step": 167821, "epoch": 3995} {"train_loss": -6.787229537963867, "global_step": 167822, "epoch": 3995} {"train_loss": -6.9994964599609375, "global_step": 167823, "epoch": 3995} {"train_loss": -6.974446773529053, "global_step": 167824, "epoch": 3995} {"train_loss": -6.902497291564941, "global_step": 167825, "epoch": 3995} {"train_loss": -7.026020050048828, "global_step": 167826, "epoch": 3995} {"train_loss": -6.865390300750732, "global_step": 167827, "epoch": 3995} {"train_loss": -6.944799423217773, "global_step": 167828, "epoch": 3995} {"train_loss": -7.003576278686523, "global_step": 167829, "epoch": 3995} {"train_loss": -6.987894535064697, "global_step": 167830, "epoch": 3995} {"train_loss": -7.000604493277414, "global_step": 167831, "epoch": 3995, "val_loss": 79797.1875} {"train_loss": -6.976463317871094, "global_step": 167832, "epoch": 3996} {"train_loss": -7.009870529174805, "global_step": 167833, "epoch": 3996} {"train_loss": -7.029585361480713, "global_step": 167834, "epoch": 3996} {"train_loss": -7.011265754699707, "global_step": 167835, "epoch": 3996} {"train_loss": -6.98231315612793, "global_step": 167836, "epoch": 3996} {"train_loss": -6.987593650817871, "global_step": 167837, "epoch": 3996} {"train_loss": -7.1640305519104, "global_step": 167838, "epoch": 3996} {"train_loss": -7.109135627746582, "global_step": 167839, "epoch": 3996} {"train_loss": -7.185708999633789, "global_step": 167840, "epoch": 3996} {"train_loss": -7.067021369934082, "global_step": 167841, "epoch": 3996} {"train_loss": -7.014895439147949, "global_step": 167842, "epoch": 3996} {"train_loss": -7.079500198364258, "global_step": 167843, "epoch": 3996} {"train_loss": -6.92771053314209, "global_step": 167844, "epoch": 3996} {"train_loss": -7.067747116088867, "global_step": 167845, "epoch": 3996} {"train_loss": -7.066276550292969, "global_step": 167846, "epoch": 3996} {"train_loss": -7.107980251312256, "global_step": 167847, "epoch": 3996} {"train_loss": -7.040980815887451, "global_step": 167848, "epoch": 3996} {"train_loss": -7.07005500793457, "global_step": 167849, "epoch": 3996} {"train_loss": -6.962102890014648, "global_step": 167850, "epoch": 3996} {"train_loss": -7.097892761230469, "global_step": 167851, "epoch": 3996} {"train_loss": -7.042809963226318, "global_step": 167852, "epoch": 3996} {"train_loss": -7.027340888977051, "global_step": 167853, "epoch": 3996} {"train_loss": -7.049843788146973, "global_step": 167854, "epoch": 3996} {"train_loss": -7.0243144035339355, "global_step": 167855, "epoch": 3996} {"train_loss": -7.004378318786621, "global_step": 167856, "epoch": 3996} {"train_loss": -7.021203517913818, "global_step": 167857, "epoch": 3996} {"train_loss": -7.004061698913574, "global_step": 167858, "epoch": 3996} {"train_loss": -7.158410549163818, "global_step": 167859, "epoch": 3996} {"train_loss": -7.026292324066162, "global_step": 167860, "epoch": 3996} {"train_loss": -7.067466735839844, "global_step": 167861, "epoch": 3996} {"train_loss": -7.0475006103515625, "global_step": 167862, "epoch": 3996} {"train_loss": -7.095709800720215, "global_step": 167863, "epoch": 3996} {"train_loss": -6.959596633911133, "global_step": 167864, "epoch": 3996} {"train_loss": -7.090034484863281, "global_step": 167865, "epoch": 3996} {"train_loss": -7.116196155548096, "global_step": 167866, "epoch": 3996} {"train_loss": -7.085648536682129, "global_step": 167867, "epoch": 3996} {"train_loss": -7.020398139953613, "global_step": 167868, "epoch": 3996} {"train_loss": -7.05106258392334, "global_step": 167869, "epoch": 3996} {"train_loss": -7.063708305358887, "global_step": 167870, "epoch": 3996} {"train_loss": -7.022035121917725, "global_step": 167871, "epoch": 3996} {"train_loss": -6.990538597106934, "global_step": 167872, "epoch": 3996} {"train_loss": -7.04750809215364, "global_step": 167873, "epoch": 3996, "val_loss": 79559.859375} {"train_loss": -6.905016899108887, "global_step": 167874, "epoch": 3997} {"train_loss": -7.03873872756958, "global_step": 167875, "epoch": 3997} {"train_loss": -6.9673967361450195, "global_step": 167876, "epoch": 3997} {"train_loss": -7.054461479187012, "global_step": 167877, "epoch": 3997} {"train_loss": -7.07038688659668, "global_step": 167878, "epoch": 3997} {"train_loss": -7.128535270690918, "global_step": 167879, "epoch": 3997} {"train_loss": -7.003116607666016, "global_step": 167880, "epoch": 3997} {"train_loss": -7.000189781188965, "global_step": 167881, "epoch": 3997} {"train_loss": -7.057480812072754, "global_step": 167882, "epoch": 3997} {"train_loss": -7.0344462394714355, "global_step": 167883, "epoch": 3997} {"train_loss": -7.06903600692749, "global_step": 167884, "epoch": 3997} {"train_loss": -7.007143020629883, "global_step": 167885, "epoch": 3997} {"train_loss": -7.123876571655273, "global_step": 167886, "epoch": 3997} {"train_loss": -7.029638767242432, "global_step": 167887, "epoch": 3997} {"train_loss": -6.987016677856445, "global_step": 167888, "epoch": 3997} {"train_loss": -6.998220443725586, "global_step": 167889, "epoch": 3997} {"train_loss": -7.020079612731934, "global_step": 167890, "epoch": 3997} {"train_loss": -7.052964687347412, "global_step": 167891, "epoch": 3997} {"train_loss": -7.163334369659424, "global_step": 167892, "epoch": 3997} {"train_loss": -6.992406845092773, "global_step": 167893, "epoch": 3997} {"train_loss": -7.067544937133789, "global_step": 167894, "epoch": 3997} {"train_loss": -6.9816765785217285, "global_step": 167895, "epoch": 3997} {"train_loss": -6.962807655334473, "global_step": 167896, "epoch": 3997} {"train_loss": -7.090996742248535, "global_step": 167897, "epoch": 3997} {"train_loss": -7.009966850280762, "global_step": 167898, "epoch": 3997} {"train_loss": -6.976507186889648, "global_step": 167899, "epoch": 3997} {"train_loss": -6.997815132141113, "global_step": 167900, "epoch": 3997} {"train_loss": -6.8683905601501465, "global_step": 167901, "epoch": 3997} {"train_loss": -6.954107761383057, "global_step": 167902, "epoch": 3997} {"train_loss": -6.980503082275391, "global_step": 167903, "epoch": 3997} {"train_loss": -6.756222724914551, "global_step": 167904, "epoch": 3997} {"train_loss": -6.406576156616211, "global_step": 167905, "epoch": 3997} {"train_loss": -6.960366249084473, "global_step": 167906, "epoch": 3997} {"train_loss": -6.565730571746826, "global_step": 167907, "epoch": 3997} {"train_loss": -6.728450775146484, "global_step": 167908, "epoch": 3997} {"train_loss": -6.685057640075684, "global_step": 167909, "epoch": 3997} {"train_loss": -6.760015964508057, "global_step": 167910, "epoch": 3997} {"train_loss": -6.556803226470947, "global_step": 167911, "epoch": 3997} {"train_loss": -6.744052886962891, "global_step": 167912, "epoch": 3997} {"train_loss": -6.6853718757629395, "global_step": 167913, "epoch": 3997} {"train_loss": -6.696344375610352, "global_step": 167914, "epoch": 3997} {"train_loss": -6.924144347508748, "global_step": 167915, "epoch": 3997, "val_loss": 79828.4375} {"train_loss": -6.849235534667969, "global_step": 167916, "epoch": 3998} {"train_loss": -6.571110725402832, "global_step": 167917, "epoch": 3998} {"train_loss": -6.872018814086914, "global_step": 167918, "epoch": 3998} {"train_loss": -6.7950053215026855, "global_step": 167919, "epoch": 3998} {"train_loss": -6.726974010467529, "global_step": 167920, "epoch": 3998} {"train_loss": -6.773494720458984, "global_step": 167921, "epoch": 3998} {"train_loss": -6.765697479248047, "global_step": 167922, "epoch": 3998} {"train_loss": -6.827683448791504, "global_step": 167923, "epoch": 3998} {"train_loss": -6.938478469848633, "global_step": 167924, "epoch": 3998} {"train_loss": -6.793118000030518, "global_step": 167925, "epoch": 3998} {"train_loss": -6.750901699066162, "global_step": 167926, "epoch": 3998} {"train_loss": -6.927701473236084, "global_step": 167927, "epoch": 3998} {"train_loss": -6.792727470397949, "global_step": 167928, "epoch": 3998} {"train_loss": -6.87492561340332, "global_step": 167929, "epoch": 3998} {"train_loss": -6.895590782165527, "global_step": 167930, "epoch": 3998} {"train_loss": -6.803353309631348, "global_step": 167931, "epoch": 3998} {"train_loss": -6.814723968505859, "global_step": 167932, "epoch": 3998} {"train_loss": -7.00367546081543, "global_step": 167933, "epoch": 3998} {"train_loss": -6.899798393249512, "global_step": 167934, "epoch": 3998} {"train_loss": -6.912700176239014, "global_step": 167935, "epoch": 3998} {"train_loss": -6.950098037719727, "global_step": 167936, "epoch": 3998} {"train_loss": -6.916138648986816, "global_step": 167937, "epoch": 3998} {"train_loss": -6.961692810058594, "global_step": 167938, "epoch": 3998} {"train_loss": -6.957934856414795, "global_step": 167939, "epoch": 3998} {"train_loss": -6.93074893951416, "global_step": 167940, "epoch": 3998} {"train_loss": -6.974442005157471, "global_step": 167941, "epoch": 3998} {"train_loss": -7.164786338806152, "global_step": 167942, "epoch": 3998} {"train_loss": -6.953656196594238, "global_step": 167943, "epoch": 3998} {"train_loss": -6.999507904052734, "global_step": 167944, "epoch": 3998} {"train_loss": -6.9104156494140625, "global_step": 167945, "epoch": 3998} {"train_loss": -7.090166091918945, "global_step": 167946, "epoch": 3998} {"train_loss": -6.969773292541504, "global_step": 167947, "epoch": 3998} {"train_loss": -6.9891767501831055, "global_step": 167948, "epoch": 3998} {"train_loss": -7.079357624053955, "global_step": 167949, "epoch": 3998} {"train_loss": -7.041630744934082, "global_step": 167950, "epoch": 3998} {"train_loss": -6.987955093383789, "global_step": 167951, "epoch": 3998} {"train_loss": -7.0043110847473145, "global_step": 167952, "epoch": 3998} {"train_loss": -7.035539627075195, "global_step": 167953, "epoch": 3998} {"train_loss": -7.02128791809082, "global_step": 167954, "epoch": 3998} {"train_loss": -7.004948616027832, "global_step": 167955, "epoch": 3998} {"train_loss": -7.150847911834717, "global_step": 167956, "epoch": 3998} {"train_loss": -6.920115879603794, "global_step": 167957, "epoch": 3998, "val_loss": 79680.3984375} {"train_loss": -7.0782365798950195, "global_step": 167958, "epoch": 3999} {"train_loss": -7.145902633666992, "global_step": 167959, "epoch": 3999} {"train_loss": -7.039261817932129, "global_step": 167960, "epoch": 3999} {"train_loss": -7.05546760559082, "global_step": 167961, "epoch": 3999} {"train_loss": -6.925251007080078, "global_step": 167962, "epoch": 3999} {"train_loss": -7.0928730964660645, "global_step": 167963, "epoch": 3999} {"train_loss": -6.9970526695251465, "global_step": 167964, "epoch": 3999} {"train_loss": -6.876430988311768, "global_step": 167965, "epoch": 3999} {"train_loss": -6.98765754699707, "global_step": 167966, "epoch": 3999} {"train_loss": -6.907435417175293, "global_step": 167967, "epoch": 3999} {"train_loss": -7.079432487487793, "global_step": 167968, "epoch": 3999} {"train_loss": -7.056413650512695, "global_step": 167969, "epoch": 3999} {"train_loss": -7.002813339233398, "global_step": 167970, "epoch": 3999} {"train_loss": -7.146073341369629, "global_step": 167971, "epoch": 3999} {"train_loss": -6.988125324249268, "global_step": 167972, "epoch": 3999} {"train_loss": -7.060937881469727, "global_step": 167973, "epoch": 3999} {"train_loss": -7.055665016174316, "global_step": 167974, "epoch": 3999} {"train_loss": -6.940195560455322, "global_step": 167975, "epoch": 3999} {"train_loss": -6.993978023529053, "global_step": 167976, "epoch": 3999} {"train_loss": -6.881359577178955, "global_step": 167977, "epoch": 3999} {"train_loss": -6.995913505554199, "global_step": 167978, "epoch": 3999} {"train_loss": -6.94703483581543, "global_step": 167979, "epoch": 3999} {"train_loss": -6.954240322113037, "global_step": 167980, "epoch": 3999} {"train_loss": -6.8276567459106445, "global_step": 167981, "epoch": 3999} {"train_loss": -7.047457695007324, "global_step": 167982, "epoch": 3999} {"train_loss": -7.001589775085449, "global_step": 167983, "epoch": 3999} {"train_loss": -7.037797451019287, "global_step": 167984, "epoch": 3999} {"train_loss": -6.9849653244018555, "global_step": 167985, "epoch": 3999} {"train_loss": -7.032642841339111, "global_step": 167986, "epoch": 3999} {"train_loss": -6.952660083770752, "global_step": 167987, "epoch": 3999} {"train_loss": -7.00978946685791, "global_step": 167988, "epoch": 3999} {"train_loss": -6.922698974609375, "global_step": 167989, "epoch": 3999} {"train_loss": -7.01484489440918, "global_step": 167990, "epoch": 3999} {"train_loss": -6.9461259841918945, "global_step": 167991, "epoch": 3999} {"train_loss": -7.0561604499816895, "global_step": 167992, "epoch": 3999} {"train_loss": -7.052554607391357, "global_step": 167993, "epoch": 3999} {"train_loss": -7.001406669616699, "global_step": 167994, "epoch": 3999} {"train_loss": -6.962898254394531, "global_step": 167995, "epoch": 3999} {"train_loss": -7.102975368499756, "global_step": 167996, "epoch": 3999} {"train_loss": -7.0841288566589355, "global_step": 167997, "epoch": 3999} {"train_loss": -7.118090629577637, "global_step": 167998, "epoch": 3999} {"train_loss": -7.012115739640736, "global_step": 167999, "epoch": 3999, "val_loss": 79654.625} {"train_loss": -7.119492053985596, "global_step": 168000, "epoch": 4000} {"train_loss": -7.003360748291016, "global_step": 168001, "epoch": 4000} {"train_loss": -7.029903888702393, "global_step": 168002, "epoch": 4000} {"train_loss": -7.06027364730835, "global_step": 168003, "epoch": 4000} {"train_loss": -7.104719161987305, "global_step": 168004, "epoch": 4000} {"train_loss": -7.071933746337891, "global_step": 168005, "epoch": 4000} {"train_loss": -6.9667887687683105, "global_step": 168006, "epoch": 4000} {"train_loss": -6.976544380187988, "global_step": 168007, "epoch": 4000} {"train_loss": -6.991650581359863, "global_step": 168008, "epoch": 4000} {"train_loss": -7.0319719314575195, "global_step": 168009, "epoch": 4000} {"train_loss": -7.041448593139648, "global_step": 168010, "epoch": 4000} {"train_loss": -7.149127960205078, "global_step": 168011, "epoch": 4000} {"train_loss": -7.016660690307617, "global_step": 168012, "epoch": 4000} {"train_loss": -7.08558464050293, "global_step": 168013, "epoch": 4000} {"train_loss": -7.028061389923096, "global_step": 168014, "epoch": 4000} {"train_loss": -7.09744930267334, "global_step": 168015, "epoch": 4000} {"train_loss": -7.080287933349609, "global_step": 168016, "epoch": 4000} {"train_loss": -7.049054145812988, "global_step": 168017, "epoch": 4000} {"train_loss": -7.028450965881348, "global_step": 168018, "epoch": 4000} {"train_loss": -7.043716907501221, "global_step": 168019, "epoch": 4000} {"train_loss": -7.0078325271606445, "global_step": 168020, "epoch": 4000} {"train_loss": -6.9682297706604, "global_step": 168021, "epoch": 4000} {"train_loss": -6.980481147766113, "global_step": 168022, "epoch": 4000} {"train_loss": -6.94715690612793, "global_step": 168023, "epoch": 4000} {"train_loss": -6.906960487365723, "global_step": 168024, "epoch": 4000} {"train_loss": -7.102484226226807, "global_step": 168025, "epoch": 4000} {"train_loss": -7.088070392608643, "global_step": 168026, "epoch": 4000} {"train_loss": -7.046427249908447, "global_step": 168027, "epoch": 4000} {"train_loss": -7.049257278442383, "global_step": 168028, "epoch": 4000} {"train_loss": -7.090954780578613, "global_step": 168029, "epoch": 4000} {"train_loss": -7.045350074768066, "global_step": 168030, "epoch": 4000} {"train_loss": -7.069423675537109, "global_step": 168031, "epoch": 4000} {"train_loss": -7.124114036560059, "global_step": 168032, "epoch": 4000} {"train_loss": -7.0804009437561035, "global_step": 168033, "epoch": 4000} {"train_loss": -7.032162666320801, "global_step": 168034, "epoch": 4000} {"train_loss": -6.991433143615723, "global_step": 168035, "epoch": 4000} {"train_loss": -7.019985198974609, "global_step": 168036, "epoch": 4000} {"train_loss": -7.179184913635254, "global_step": 168037, "epoch": 4000} {"train_loss": -7.101815223693848, "global_step": 168038, "epoch": 4000} {"train_loss": -6.936158657073975, "global_step": 168039, "epoch": 4000} {"train_loss": -7.152685165405273, "global_step": 168040, "epoch": 4000} {"train_loss": -7.048636561348324, "global_step": 168041, "epoch": 4000, "train/sim_max_reward_0": 0.3961307312125305, "train/sim_max_reward_1": 0.9439048433130983, "train/sim_max_reward_2": 0.41623208607127365, "train/sim_max_reward_3": 0.5303169891355571, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.8941006958573476, "test/sim_max_reward_4500000": 0.6640224039830582, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9988810499662244, "test/sim_max_reward_4500003": 0.9022705083594038, "test/sim_max_reward_4500004": 0.1244492139989713, "test/sim_max_reward_4500005": 1.0, "test/sim_max_reward_4500006": 0.9179703894475423, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 1.0, "test/sim_max_reward_4500009": 0.05334389036714201, "test/sim_max_reward_4500010": 0.12224035418496132, "test/sim_max_reward_4500011": 0.42320626363194697, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.008300628030789712, "test/sim_max_reward_4500014": 0.7420159452668426, "test/sim_max_reward_4500015": 0.9849160233112145, "test/sim_max_reward_4500016": 0.02165391508935015, "test/sim_max_reward_4500017": 0.06855578208478284, "test/sim_max_reward_4500018": 0.4685720525245237, "test/sim_max_reward_4500019": 0.9133390152679542, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8924354305283796, "test/sim_max_reward_4500022": 0.9815301890866391, "test/sim_max_reward_4500023": 0.9163260116473186, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9024905811974416, "test/sim_max_reward_4500026": 0.8251432976454993, "test/sim_max_reward_4500027": 0.939932751331585, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.04799640771220801, "test/sim_max_reward_4500030": 0.9422494241398244, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.11469011921293591, "test/sim_max_reward_4500034": 0.9848119143947353, "test/sim_max_reward_4500035": 0.9936809666276069, "test/sim_max_reward_4500036": 0.37736964792625055, "test/sim_max_reward_4500037": 0.920207177711389, "test/sim_max_reward_4500038": 1.0, "test/sim_max_reward_4500039": 0.9778953190182003, "test/sim_max_reward_4500040": 0.9832694137486443, "test/sim_max_reward_4500041": 0.973652175119387, "test/sim_max_reward_4500042": 0.03225243493432692, "test/sim_max_reward_4500043": 0.9686884807869882, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.16879325736787462, "test/sim_max_reward_4500046": 0.1573878117485854, "test/sim_max_reward_4500047": 0.8868531182180451, "test/sim_max_reward_4500048": 0.9660155073661286, "test/sim_max_reward_4500049": 0.9107812479750251, "train/mean_score": 0.6967808909316345, "test/mean_score": 0.5902575414296911, "val_loss": 79696.7734375} {"train_loss": -7.193964958190918, "global_step": 168042, "epoch": 4001} {"train_loss": -6.893557548522949, "global_step": 168043, "epoch": 4001} {"train_loss": -7.0910210609436035, "global_step": 168044, "epoch": 4001} {"train_loss": -7.005796909332275, "global_step": 168045, "epoch": 4001} {"train_loss": -6.9805908203125, "global_step": 168046, "epoch": 4001} {"train_loss": -7.001101493835449, "global_step": 168047, "epoch": 4001} {"train_loss": -7.1491241455078125, "global_step": 168048, "epoch": 4001} {"train_loss": -7.076758861541748, "global_step": 168049, "epoch": 4001} {"train_loss": -7.118324279785156, "global_step": 168050, "epoch": 4001} {"train_loss": -7.206112861633301, "global_step": 168051, "epoch": 4001} {"train_loss": -7.148446083068848, "global_step": 168052, "epoch": 4001} {"train_loss": -7.010051727294922, "global_step": 168053, "epoch": 4001} {"train_loss": -6.979450702667236, "global_step": 168054, "epoch": 4001} {"train_loss": -7.107607841491699, "global_step": 168055, "epoch": 4001} {"train_loss": -7.047946929931641, "global_step": 168056, "epoch": 4001} {"train_loss": -7.079242706298828, "global_step": 168057, "epoch": 4001} {"train_loss": -7.0883917808532715, "global_step": 168058, "epoch": 4001} {"train_loss": -6.952949523925781, "global_step": 168059, "epoch": 4001} {"train_loss": -7.126346588134766, "global_step": 168060, "epoch": 4001} {"train_loss": -7.106054306030273, "global_step": 168061, "epoch": 4001} {"train_loss": -7.070636749267578, "global_step": 168062, "epoch": 4001} {"train_loss": -7.135835647583008, "global_step": 168063, "epoch": 4001} {"train_loss": -7.0941925048828125, "global_step": 168064, "epoch": 4001} {"train_loss": -7.046760082244873, "global_step": 168065, "epoch": 4001} {"train_loss": -7.181638717651367, "global_step": 168066, "epoch": 4001} {"train_loss": -7.267965793609619, "global_step": 168067, "epoch": 4001} {"train_loss": -6.964975357055664, "global_step": 168068, "epoch": 4001} {"train_loss": -6.996891975402832, "global_step": 168069, "epoch": 4001} {"train_loss": -7.020920753479004, "global_step": 168070, "epoch": 4001} {"train_loss": -7.020391464233398, "global_step": 168071, "epoch": 4001} {"train_loss": -6.848377704620361, "global_step": 168072, "epoch": 4001} {"train_loss": -7.02416467666626, "global_step": 168073, "epoch": 4001} {"train_loss": -6.920130252838135, "global_step": 168074, "epoch": 4001} {"train_loss": -6.9320831298828125, "global_step": 168075, "epoch": 4001} {"train_loss": -6.960812568664551, "global_step": 168076, "epoch": 4001} {"train_loss": -6.977059841156006, "global_step": 168077, "epoch": 4001} {"train_loss": -6.93314790725708, "global_step": 168078, "epoch": 4001} {"train_loss": -6.924356460571289, "global_step": 168079, "epoch": 4001} {"train_loss": -6.9401421546936035, "global_step": 168080, "epoch": 4001} {"train_loss": -7.001825332641602, "global_step": 168081, "epoch": 4001} {"train_loss": -6.9145588874816895, "global_step": 168082, "epoch": 4001} {"train_loss": -7.0374505406334285, "global_step": 168083, "epoch": 4001, "val_loss": 79602.5546875} {"train_loss": -6.93264102935791, "global_step": 168084, "epoch": 4002} {"train_loss": -7.0079345703125, "global_step": 168085, "epoch": 4002} {"train_loss": -6.976499557495117, "global_step": 168086, "epoch": 4002} {"train_loss": -7.117870330810547, "global_step": 168087, "epoch": 4002} {"train_loss": -6.916851997375488, "global_step": 168088, "epoch": 4002} {"train_loss": -6.970746994018555, "global_step": 168089, "epoch": 4002} {"train_loss": -7.039093017578125, "global_step": 168090, "epoch": 4002} {"train_loss": -7.054530143737793, "global_step": 168091, "epoch": 4002} {"train_loss": -7.068779468536377, "global_step": 168092, "epoch": 4002} {"train_loss": -6.931024074554443, "global_step": 168093, "epoch": 4002} {"train_loss": -6.998722076416016, "global_step": 168094, "epoch": 4002} {"train_loss": -7.023512840270996, "global_step": 168095, "epoch": 4002} {"train_loss": -6.9346723556518555, "global_step": 168096, "epoch": 4002} {"train_loss": -7.067811012268066, "global_step": 168097, "epoch": 4002} {"train_loss": -7.0725812911987305, "global_step": 168098, "epoch": 4002} {"train_loss": -7.035283088684082, "global_step": 168099, "epoch": 4002} {"train_loss": -6.900247573852539, "global_step": 168100, "epoch": 4002} {"train_loss": -7.194282531738281, "global_step": 168101, "epoch": 4002} {"train_loss": -7.1025309562683105, "global_step": 168102, "epoch": 4002} {"train_loss": -7.061203956604004, "global_step": 168103, "epoch": 4002} {"train_loss": -7.049839973449707, "global_step": 168104, "epoch": 4002} {"train_loss": -7.077306270599365, "global_step": 168105, "epoch": 4002} {"train_loss": -6.925933361053467, "global_step": 168106, "epoch": 4002} {"train_loss": -7.036834239959717, "global_step": 168107, "epoch": 4002} {"train_loss": -7.0790605545043945, "global_step": 168108, "epoch": 4002} {"train_loss": -7.114947319030762, "global_step": 168109, "epoch": 4002} {"train_loss": -6.960988521575928, "global_step": 168110, "epoch": 4002} {"train_loss": -6.999482154846191, "global_step": 168111, "epoch": 4002} {"train_loss": -6.941415786743164, "global_step": 168112, "epoch": 4002} {"train_loss": -6.9980998039245605, "global_step": 168113, "epoch": 4002} {"train_loss": -6.927568435668945, "global_step": 168114, "epoch": 4002} {"train_loss": -7.200695514678955, "global_step": 168115, "epoch": 4002} {"train_loss": -7.095310211181641, "global_step": 168116, "epoch": 4002} {"train_loss": -7.200741767883301, "global_step": 168117, "epoch": 4002} {"train_loss": -7.001387596130371, "global_step": 168118, "epoch": 4002} {"train_loss": -7.054376602172852, "global_step": 168119, "epoch": 4002} {"train_loss": -7.081798553466797, "global_step": 168120, "epoch": 4002} {"train_loss": -7.159190654754639, "global_step": 168121, "epoch": 4002} {"train_loss": -6.991738796234131, "global_step": 168122, "epoch": 4002} {"train_loss": -7.017620086669922, "global_step": 168123, "epoch": 4002} {"train_loss": -7.042416572570801, "global_step": 168124, "epoch": 4002} {"train_loss": -7.0314874194917225, "global_step": 168125, "epoch": 4002, "val_loss": 79623.0} {"train_loss": -7.043221473693848, "global_step": 168126, "epoch": 4003} {"train_loss": -7.080123424530029, "global_step": 168127, "epoch": 4003} {"train_loss": -7.027544021606445, "global_step": 168128, "epoch": 4003} {"train_loss": -7.0576910972595215, "global_step": 168129, "epoch": 4003} {"train_loss": -7.080977916717529, "global_step": 168130, "epoch": 4003} {"train_loss": -7.069433212280273, "global_step": 168131, "epoch": 4003} {"train_loss": -7.108390808105469, "global_step": 168132, "epoch": 4003} {"train_loss": -7.044259071350098, "global_step": 168133, "epoch": 4003} {"train_loss": -7.183995246887207, "global_step": 168134, "epoch": 4003} {"train_loss": -7.143084526062012, "global_step": 168135, "epoch": 4003} {"train_loss": -7.198681831359863, "global_step": 168136, "epoch": 4003} {"train_loss": -7.064393997192383, "global_step": 168137, "epoch": 4003} {"train_loss": -7.043436527252197, "global_step": 168138, "epoch": 4003} {"train_loss": -7.144561290740967, "global_step": 168139, "epoch": 4003} {"train_loss": -7.091416835784912, "global_step": 168140, "epoch": 4003} {"train_loss": -7.0926618576049805, "global_step": 168141, "epoch": 4003} {"train_loss": -7.097495079040527, "global_step": 168142, "epoch": 4003} {"train_loss": -7.104190349578857, "global_step": 168143, "epoch": 4003} {"train_loss": -7.076937675476074, "global_step": 168144, "epoch": 4003} {"train_loss": -7.134634494781494, "global_step": 168145, "epoch": 4003} {"train_loss": -7.117702007293701, "global_step": 168146, "epoch": 4003} {"train_loss": -7.00203800201416, "global_step": 168147, "epoch": 4003} {"train_loss": -7.045189380645752, "global_step": 168148, "epoch": 4003} {"train_loss": -7.024621486663818, "global_step": 168149, "epoch": 4003} {"train_loss": -7.033568382263184, "global_step": 168150, "epoch": 4003} {"train_loss": -7.119166374206543, "global_step": 168151, "epoch": 4003} {"train_loss": -7.104329586029053, "global_step": 168152, "epoch": 4003} {"train_loss": -7.020146369934082, "global_step": 168153, "epoch": 4003} {"train_loss": -7.014739036560059, "global_step": 168154, "epoch": 4003} {"train_loss": -7.045398712158203, "global_step": 168155, "epoch": 4003} {"train_loss": -7.007296562194824, "global_step": 168156, "epoch": 4003} {"train_loss": -7.103672981262207, "global_step": 168157, "epoch": 4003} {"train_loss": -7.136386871337891, "global_step": 168158, "epoch": 4003} {"train_loss": -7.090600967407227, "global_step": 168159, "epoch": 4003} {"train_loss": -6.9628190994262695, "global_step": 168160, "epoch": 4003} {"train_loss": -7.004240036010742, "global_step": 168161, "epoch": 4003} {"train_loss": -6.971944808959961, "global_step": 168162, "epoch": 4003} {"train_loss": -7.143299102783203, "global_step": 168163, "epoch": 4003} {"train_loss": -7.009650230407715, "global_step": 168164, "epoch": 4003} {"train_loss": -7.054670810699463, "global_step": 168165, "epoch": 4003} {"train_loss": -7.0472235679626465, "global_step": 168166, "epoch": 4003} {"train_loss": -7.071181149709792, "global_step": 168167, "epoch": 4003, "val_loss": 79997.2421875} {"train_loss": -7.072964668273926, "global_step": 168168, "epoch": 4004} {"train_loss": -7.040180206298828, "global_step": 168169, "epoch": 4004} {"train_loss": -7.1236572265625, "global_step": 168170, "epoch": 4004} {"train_loss": -6.998777389526367, "global_step": 168171, "epoch": 4004} {"train_loss": -7.049616813659668, "global_step": 168172, "epoch": 4004} {"train_loss": -7.004608154296875, "global_step": 168173, "epoch": 4004} {"train_loss": -7.1238603591918945, "global_step": 168174, "epoch": 4004} {"train_loss": -7.1285576820373535, "global_step": 168175, "epoch": 4004} {"train_loss": -7.050176620483398, "global_step": 168176, "epoch": 4004} {"train_loss": -7.047271728515625, "global_step": 168177, "epoch": 4004} {"train_loss": -6.956002235412598, "global_step": 168178, "epoch": 4004} {"train_loss": -7.004212379455566, "global_step": 168179, "epoch": 4004} {"train_loss": -7.085840225219727, "global_step": 168180, "epoch": 4004} {"train_loss": -7.047379493713379, "global_step": 168181, "epoch": 4004} {"train_loss": -7.086764335632324, "global_step": 168182, "epoch": 4004} {"train_loss": -7.117895603179932, "global_step": 168183, "epoch": 4004} {"train_loss": -7.132238388061523, "global_step": 168184, "epoch": 4004} {"train_loss": -7.1320061683654785, "global_step": 168185, "epoch": 4004} {"train_loss": -7.111325263977051, "global_step": 168186, "epoch": 4004} {"train_loss": -7.0882463455200195, "global_step": 168187, "epoch": 4004} {"train_loss": -7.0143890380859375, "global_step": 168188, "epoch": 4004} {"train_loss": -6.950763702392578, "global_step": 168189, "epoch": 4004} {"train_loss": -7.036444664001465, "global_step": 168190, "epoch": 4004} {"train_loss": -6.948611259460449, "global_step": 168191, "epoch": 4004} {"train_loss": -6.952635288238525, "global_step": 168192, "epoch": 4004} {"train_loss": -6.948999404907227, "global_step": 168193, "epoch": 4004} {"train_loss": -6.984655380249023, "global_step": 168194, "epoch": 4004} {"train_loss": -7.056558609008789, "global_step": 168195, "epoch": 4004} {"train_loss": -7.026794910430908, "global_step": 168196, "epoch": 4004} {"train_loss": -6.962474346160889, "global_step": 168197, "epoch": 4004} {"train_loss": -7.003073692321777, "global_step": 168198, "epoch": 4004} {"train_loss": -7.036711692810059, "global_step": 168199, "epoch": 4004} {"train_loss": -7.066744804382324, "global_step": 168200, "epoch": 4004} {"train_loss": -7.046130657196045, "global_step": 168201, "epoch": 4004} {"train_loss": -7.061805725097656, "global_step": 168202, "epoch": 4004} {"train_loss": -7.065589904785156, "global_step": 168203, "epoch": 4004} {"train_loss": -7.066171646118164, "global_step": 168204, "epoch": 4004} {"train_loss": -6.951376914978027, "global_step": 168205, "epoch": 4004} {"train_loss": -7.072229862213135, "global_step": 168206, "epoch": 4004} {"train_loss": -6.9726338386535645, "global_step": 168207, "epoch": 4004} {"train_loss": -6.994316577911377, "global_step": 168208, "epoch": 4004} {"train_loss": -7.041314511072068, "global_step": 168209, "epoch": 4004, "val_loss": 79692.859375} {"train_loss": -7.107905864715576, "global_step": 168210, "epoch": 4005} {"train_loss": -7.103967666625977, "global_step": 168211, "epoch": 4005} {"train_loss": -6.933015823364258, "global_step": 168212, "epoch": 4005} {"train_loss": -7.1419878005981445, "global_step": 168213, "epoch": 4005} {"train_loss": -7.0368170738220215, "global_step": 168214, "epoch": 4005} {"train_loss": -6.927633285522461, "global_step": 168215, "epoch": 4005} {"train_loss": -7.109496593475342, "global_step": 168216, "epoch": 4005} {"train_loss": -6.992236614227295, "global_step": 168217, "epoch": 4005} {"train_loss": -6.935238361358643, "global_step": 168218, "epoch": 4005} {"train_loss": -6.989531517028809, "global_step": 168219, "epoch": 4005} {"train_loss": -6.955903053283691, "global_step": 168220, "epoch": 4005} {"train_loss": -6.957966327667236, "global_step": 168221, "epoch": 4005} {"train_loss": -6.741553783416748, "global_step": 168222, "epoch": 4005} {"train_loss": -6.9307074546813965, "global_step": 168223, "epoch": 4005} {"train_loss": -7.068958282470703, "global_step": 168224, "epoch": 4005} {"train_loss": -6.914330959320068, "global_step": 168225, "epoch": 4005} {"train_loss": -6.98353910446167, "global_step": 168226, "epoch": 4005} {"train_loss": -7.042202949523926, "global_step": 168227, "epoch": 4005} {"train_loss": -7.026760101318359, "global_step": 168228, "epoch": 4005} {"train_loss": -6.992694854736328, "global_step": 168229, "epoch": 4005} {"train_loss": -7.0526838302612305, "global_step": 168230, "epoch": 4005} {"train_loss": -6.977699279785156, "global_step": 168231, "epoch": 4005} {"train_loss": -6.910020351409912, "global_step": 168232, "epoch": 4005} {"train_loss": -7.047234535217285, "global_step": 168233, "epoch": 4005} {"train_loss": -7.027710914611816, "global_step": 168234, "epoch": 4005} {"train_loss": -6.966598987579346, "global_step": 168235, "epoch": 4005} {"train_loss": -7.020711421966553, "global_step": 168236, "epoch": 4005} {"train_loss": -7.025283336639404, "global_step": 168237, "epoch": 4005} {"train_loss": -7.120977401733398, "global_step": 168238, "epoch": 4005} {"train_loss": -7.098464012145996, "global_step": 168239, "epoch": 4005} {"train_loss": -6.995447635650635, "global_step": 168240, "epoch": 4005} {"train_loss": -7.036556243896484, "global_step": 168241, "epoch": 4005} {"train_loss": -6.98171329498291, "global_step": 168242, "epoch": 4005} {"train_loss": -7.030706405639648, "global_step": 168243, "epoch": 4005} {"train_loss": -7.156726360321045, "global_step": 168244, "epoch": 4005} {"train_loss": -7.16757345199585, "global_step": 168245, "epoch": 4005} {"train_loss": -6.997196197509766, "global_step": 168246, "epoch": 4005} {"train_loss": -7.0572662353515625, "global_step": 168247, "epoch": 4005} {"train_loss": -6.98258113861084, "global_step": 168248, "epoch": 4005} {"train_loss": -7.050482749938965, "global_step": 168249, "epoch": 4005} {"train_loss": -7.089221954345703, "global_step": 168250, "epoch": 4005} {"train_loss": -7.017986036482311, "global_step": 168251, "epoch": 4005, "val_loss": 79885.265625} {"train_loss": -7.038008689880371, "global_step": 168252, "epoch": 4006} {"train_loss": -7.114929676055908, "global_step": 168253, "epoch": 4006} {"train_loss": -7.066812515258789, "global_step": 168254, "epoch": 4006} {"train_loss": -6.964543342590332, "global_step": 168255, "epoch": 4006} {"train_loss": -6.949685096740723, "global_step": 168256, "epoch": 4006} {"train_loss": -7.047740936279297, "global_step": 168257, "epoch": 4006} {"train_loss": -7.040658473968506, "global_step": 168258, "epoch": 4006} {"train_loss": -7.037567615509033, "global_step": 168259, "epoch": 4006} {"train_loss": -7.071157455444336, "global_step": 168260, "epoch": 4006} {"train_loss": -7.044805526733398, "global_step": 168261, "epoch": 4006} {"train_loss": -6.9799699783325195, "global_step": 168262, "epoch": 4006} {"train_loss": -7.017764091491699, "global_step": 168263, "epoch": 4006} {"train_loss": -7.077244281768799, "global_step": 168264, "epoch": 4006} {"train_loss": -7.0779619216918945, "global_step": 168265, "epoch": 4006} {"train_loss": -7.112747669219971, "global_step": 168266, "epoch": 4006} {"train_loss": -7.036190509796143, "global_step": 168267, "epoch": 4006} {"train_loss": -7.079383850097656, "global_step": 168268, "epoch": 4006} {"train_loss": -6.957197189331055, "global_step": 168269, "epoch": 4006} {"train_loss": -7.046734809875488, "global_step": 168270, "epoch": 4006} {"train_loss": -7.139023780822754, "global_step": 168271, "epoch": 4006} {"train_loss": -7.044624328613281, "global_step": 168272, "epoch": 4006} {"train_loss": -7.036382675170898, "global_step": 168273, "epoch": 4006} {"train_loss": -6.963983535766602, "global_step": 168274, "epoch": 4006} {"train_loss": -7.116625785827637, "global_step": 168275, "epoch": 4006} {"train_loss": -7.104726791381836, "global_step": 168276, "epoch": 4006} {"train_loss": -7.087791919708252, "global_step": 168277, "epoch": 4006} {"train_loss": -7.034029960632324, "global_step": 168278, "epoch": 4006} {"train_loss": -6.977262496948242, "global_step": 168279, "epoch": 4006} {"train_loss": -6.939639091491699, "global_step": 168280, "epoch": 4006} {"train_loss": -6.991987705230713, "global_step": 168281, "epoch": 4006} {"train_loss": -7.045437335968018, "global_step": 168282, "epoch": 4006} {"train_loss": -7.170920372009277, "global_step": 168283, "epoch": 4006} {"train_loss": -7.049818992614746, "global_step": 168284, "epoch": 4006} {"train_loss": -7.099211692810059, "global_step": 168285, "epoch": 4006} {"train_loss": -7.07586669921875, "global_step": 168286, "epoch": 4006} {"train_loss": -7.175451278686523, "global_step": 168287, "epoch": 4006} {"train_loss": -7.066545486450195, "global_step": 168288, "epoch": 4006} {"train_loss": -7.028347015380859, "global_step": 168289, "epoch": 4006} {"train_loss": -7.205560684204102, "global_step": 168290, "epoch": 4006} {"train_loss": -7.0798444747924805, "global_step": 168291, "epoch": 4006} {"train_loss": -7.093188762664795, "global_step": 168292, "epoch": 4006} {"train_loss": -7.057901280266898, "global_step": 168293, "epoch": 4006, "val_loss": 79799.640625} {"train_loss": -7.054620742797852, "global_step": 168294, "epoch": 4007} {"train_loss": -7.063591957092285, "global_step": 168295, "epoch": 4007} {"train_loss": -7.001762390136719, "global_step": 168296, "epoch": 4007} {"train_loss": -7.096165657043457, "global_step": 168297, "epoch": 4007} {"train_loss": -7.025650978088379, "global_step": 168298, "epoch": 4007} {"train_loss": -7.12945556640625, "global_step": 168299, "epoch": 4007} {"train_loss": -7.0206146240234375, "global_step": 168300, "epoch": 4007} {"train_loss": -7.063959121704102, "global_step": 168301, "epoch": 4007} {"train_loss": -7.010893821716309, "global_step": 168302, "epoch": 4007} {"train_loss": -7.004566192626953, "global_step": 168303, "epoch": 4007} {"train_loss": -7.051039695739746, "global_step": 168304, "epoch": 4007} {"train_loss": -7.003507614135742, "global_step": 168305, "epoch": 4007} {"train_loss": -6.943151473999023, "global_step": 168306, "epoch": 4007} {"train_loss": -6.995774269104004, "global_step": 168307, "epoch": 4007} {"train_loss": -7.007429122924805, "global_step": 168308, "epoch": 4007} {"train_loss": -7.033181190490723, "global_step": 168309, "epoch": 4007} {"train_loss": -6.805239677429199, "global_step": 168310, "epoch": 4007} {"train_loss": -6.940847873687744, "global_step": 168311, "epoch": 4007} {"train_loss": -7.062752723693848, "global_step": 168312, "epoch": 4007} {"train_loss": -6.953230381011963, "global_step": 168313, "epoch": 4007} {"train_loss": -6.897797584533691, "global_step": 168314, "epoch": 4007} {"train_loss": -6.959450721740723, "global_step": 168315, "epoch": 4007} {"train_loss": -7.010051727294922, "global_step": 168316, "epoch": 4007} {"train_loss": -6.965121269226074, "global_step": 168317, "epoch": 4007} {"train_loss": -6.862526893615723, "global_step": 168318, "epoch": 4007} {"train_loss": -6.919412136077881, "global_step": 168319, "epoch": 4007} {"train_loss": -6.998553276062012, "global_step": 168320, "epoch": 4007} {"train_loss": -6.943136692047119, "global_step": 168321, "epoch": 4007} {"train_loss": -6.883893966674805, "global_step": 168322, "epoch": 4007} {"train_loss": -6.938675880432129, "global_step": 168323, "epoch": 4007} {"train_loss": -7.028459548950195, "global_step": 168324, "epoch": 4007} {"train_loss": -6.986957550048828, "global_step": 168325, "epoch": 4007} {"train_loss": -6.893594264984131, "global_step": 168326, "epoch": 4007} {"train_loss": -6.925409317016602, "global_step": 168327, "epoch": 4007} {"train_loss": -6.952365875244141, "global_step": 168328, "epoch": 4007} {"train_loss": -6.952270030975342, "global_step": 168329, "epoch": 4007} {"train_loss": -6.9217119216918945, "global_step": 168330, "epoch": 4007} {"train_loss": -6.911365509033203, "global_step": 168331, "epoch": 4007} {"train_loss": -7.053717613220215, "global_step": 168332, "epoch": 4007} {"train_loss": -6.885749816894531, "global_step": 168333, "epoch": 4007} {"train_loss": -6.955351829528809, "global_step": 168334, "epoch": 4007} {"train_loss": -6.977300802866618, "global_step": 168335, "epoch": 4007, "val_loss": 80017.6015625} {"train_loss": -6.932356834411621, "global_step": 168336, "epoch": 4008} {"train_loss": -7.037750244140625, "global_step": 168337, "epoch": 4008} {"train_loss": -7.016807556152344, "global_step": 168338, "epoch": 4008} {"train_loss": -6.835882186889648, "global_step": 168339, "epoch": 4008} {"train_loss": -7.0027618408203125, "global_step": 168340, "epoch": 4008} {"train_loss": -6.9385271072387695, "global_step": 168341, "epoch": 4008} {"train_loss": -7.047370433807373, "global_step": 168342, "epoch": 4008} {"train_loss": -7.082719802856445, "global_step": 168343, "epoch": 4008} {"train_loss": -6.983314037322998, "global_step": 168344, "epoch": 4008} {"train_loss": -7.027020454406738, "global_step": 168345, "epoch": 4008} {"train_loss": -7.065141677856445, "global_step": 168346, "epoch": 4008} {"train_loss": -7.094821929931641, "global_step": 168347, "epoch": 4008} {"train_loss": -7.051264762878418, "global_step": 168348, "epoch": 4008} {"train_loss": -7.058897018432617, "global_step": 168349, "epoch": 4008} {"train_loss": -7.03746223449707, "global_step": 168350, "epoch": 4008} {"train_loss": -7.023277282714844, "global_step": 168351, "epoch": 4008} {"train_loss": -6.969165802001953, "global_step": 168352, "epoch": 4008} {"train_loss": -6.96450662612915, "global_step": 168353, "epoch": 4008} {"train_loss": -7.097894668579102, "global_step": 168354, "epoch": 4008} {"train_loss": -7.0108537673950195, "global_step": 168355, "epoch": 4008} {"train_loss": -7.060417175292969, "global_step": 168356, "epoch": 4008} {"train_loss": -7.004968643188477, "global_step": 168357, "epoch": 4008} {"train_loss": -7.087255477905273, "global_step": 168358, "epoch": 4008} {"train_loss": -7.083409786224365, "global_step": 168359, "epoch": 4008} {"train_loss": -7.051076889038086, "global_step": 168360, "epoch": 4008} {"train_loss": -7.203217506408691, "global_step": 168361, "epoch": 4008} {"train_loss": -7.064445495605469, "global_step": 168362, "epoch": 4008} {"train_loss": -6.95171594619751, "global_step": 168363, "epoch": 4008} {"train_loss": -7.046570301055908, "global_step": 168364, "epoch": 4008} {"train_loss": -7.061635971069336, "global_step": 168365, "epoch": 4008} {"train_loss": -6.979083061218262, "global_step": 168366, "epoch": 4008} {"train_loss": -7.030336380004883, "global_step": 168367, "epoch": 4008} {"train_loss": -7.0091094970703125, "global_step": 168368, "epoch": 4008} {"train_loss": -7.035104274749756, "global_step": 168369, "epoch": 4008} {"train_loss": -7.023072719573975, "global_step": 168370, "epoch": 4008} {"train_loss": -7.021527290344238, "global_step": 168371, "epoch": 4008} {"train_loss": -6.931974411010742, "global_step": 168372, "epoch": 4008} {"train_loss": -6.987562656402588, "global_step": 168373, "epoch": 4008} {"train_loss": -6.959493637084961, "global_step": 168374, "epoch": 4008} {"train_loss": -6.9976983070373535, "global_step": 168375, "epoch": 4008} {"train_loss": -6.961262226104736, "global_step": 168376, "epoch": 4008} {"train_loss": -7.018572614306495, "global_step": 168377, "epoch": 4008, "val_loss": 79712.984375} {"train_loss": -6.961777687072754, "global_step": 168378, "epoch": 4009} {"train_loss": -6.925775527954102, "global_step": 168379, "epoch": 4009} {"train_loss": -7.023038387298584, "global_step": 168380, "epoch": 4009} {"train_loss": -6.922787666320801, "global_step": 168381, "epoch": 4009} {"train_loss": -6.960179328918457, "global_step": 168382, "epoch": 4009} {"train_loss": -7.129117012023926, "global_step": 168383, "epoch": 4009} {"train_loss": -6.886258125305176, "global_step": 168384, "epoch": 4009} {"train_loss": -6.974734783172607, "global_step": 168385, "epoch": 4009} {"train_loss": -6.960855484008789, "global_step": 168386, "epoch": 4009} {"train_loss": -7.040651321411133, "global_step": 168387, "epoch": 4009} {"train_loss": -7.023900985717773, "global_step": 168388, "epoch": 4009} {"train_loss": -6.965497016906738, "global_step": 168389, "epoch": 4009} {"train_loss": -7.032806873321533, "global_step": 168390, "epoch": 4009} {"train_loss": -7.018853664398193, "global_step": 168391, "epoch": 4009} {"train_loss": -7.101744651794434, "global_step": 168392, "epoch": 4009} {"train_loss": -6.904461860656738, "global_step": 168393, "epoch": 4009} {"train_loss": -7.05312442779541, "global_step": 168394, "epoch": 4009} {"train_loss": -6.866461277008057, "global_step": 168395, "epoch": 4009} {"train_loss": -7.011838912963867, "global_step": 168396, "epoch": 4009} {"train_loss": -6.946963310241699, "global_step": 168397, "epoch": 4009} {"train_loss": -6.9349260330200195, "global_step": 168398, "epoch": 4009} {"train_loss": -6.981566905975342, "global_step": 168399, "epoch": 4009} {"train_loss": -6.905662536621094, "global_step": 168400, "epoch": 4009} {"train_loss": -6.953309535980225, "global_step": 168401, "epoch": 4009} {"train_loss": -7.0853590965271, "global_step": 168402, "epoch": 4009} {"train_loss": -6.928152084350586, "global_step": 168403, "epoch": 4009} {"train_loss": -7.014298439025879, "global_step": 168404, "epoch": 4009} {"train_loss": -6.971891403198242, "global_step": 168405, "epoch": 4009} {"train_loss": -7.054327964782715, "global_step": 168406, "epoch": 4009} {"train_loss": -7.007694244384766, "global_step": 168407, "epoch": 4009} {"train_loss": -6.997318267822266, "global_step": 168408, "epoch": 4009} {"train_loss": -6.986126899719238, "global_step": 168409, "epoch": 4009} {"train_loss": -7.035139083862305, "global_step": 168410, "epoch": 4009} {"train_loss": -7.039621353149414, "global_step": 168411, "epoch": 4009} {"train_loss": -7.116282939910889, "global_step": 168412, "epoch": 4009} {"train_loss": -7.018780708312988, "global_step": 168413, "epoch": 4009} {"train_loss": -7.056568145751953, "global_step": 168414, "epoch": 4009} {"train_loss": -6.934388160705566, "global_step": 168415, "epoch": 4009} {"train_loss": -7.075904369354248, "global_step": 168416, "epoch": 4009} {"train_loss": -7.051768779754639, "global_step": 168417, "epoch": 4009} {"train_loss": -7.043530464172363, "global_step": 168418, "epoch": 4009} {"train_loss": -6.9993843124026345, "global_step": 168419, "epoch": 4009, "val_loss": 79572.5} {"train_loss": -7.116613388061523, "global_step": 168420, "epoch": 4010} {"train_loss": -7.0934906005859375, "global_step": 168421, "epoch": 4010} {"train_loss": -7.046965599060059, "global_step": 168422, "epoch": 4010} {"train_loss": -6.948530197143555, "global_step": 168423, "epoch": 4010} {"train_loss": -7.040977954864502, "global_step": 168424, "epoch": 4010} {"train_loss": -7.073269367218018, "global_step": 168425, "epoch": 4010} {"train_loss": -7.056046485900879, "global_step": 168426, "epoch": 4010} {"train_loss": -7.050215721130371, "global_step": 168427, "epoch": 4010} {"train_loss": -6.976367950439453, "global_step": 168428, "epoch": 4010} {"train_loss": -7.090005397796631, "global_step": 168429, "epoch": 4010} {"train_loss": -7.131665229797363, "global_step": 168430, "epoch": 4010} {"train_loss": -7.120827674865723, "global_step": 168431, "epoch": 4010} {"train_loss": -7.129081726074219, "global_step": 168432, "epoch": 4010} {"train_loss": -6.961152076721191, "global_step": 168433, "epoch": 4010} {"train_loss": -6.979619026184082, "global_step": 168434, "epoch": 4010} {"train_loss": -7.054130554199219, "global_step": 168435, "epoch": 4010} {"train_loss": -6.965142250061035, "global_step": 168436, "epoch": 4010} {"train_loss": -6.956400394439697, "global_step": 168437, "epoch": 4010} {"train_loss": -7.188933372497559, "global_step": 168438, "epoch": 4010} {"train_loss": -7.017748832702637, "global_step": 168439, "epoch": 4010} {"train_loss": -6.978143692016602, "global_step": 168440, "epoch": 4010} {"train_loss": -7.013798236846924, "global_step": 168441, "epoch": 4010} {"train_loss": -7.150689125061035, "global_step": 168442, "epoch": 4010} {"train_loss": -6.908883094787598, "global_step": 168443, "epoch": 4010} {"train_loss": -7.022603988647461, "global_step": 168444, "epoch": 4010} {"train_loss": -6.883382797241211, "global_step": 168445, "epoch": 4010} {"train_loss": -7.1304216384887695, "global_step": 168446, "epoch": 4010} {"train_loss": -7.146915435791016, "global_step": 168447, "epoch": 4010} {"train_loss": -7.022666931152344, "global_step": 168448, "epoch": 4010} {"train_loss": -6.962192535400391, "global_step": 168449, "epoch": 4010} {"train_loss": -7.055061340332031, "global_step": 168450, "epoch": 4010} {"train_loss": -7.096487998962402, "global_step": 168451, "epoch": 4010} {"train_loss": -6.969866752624512, "global_step": 168452, "epoch": 4010} {"train_loss": -6.989511013031006, "global_step": 168453, "epoch": 4010} {"train_loss": -6.931790828704834, "global_step": 168454, "epoch": 4010} {"train_loss": -6.870139122009277, "global_step": 168455, "epoch": 4010} {"train_loss": -7.0464324951171875, "global_step": 168456, "epoch": 4010} {"train_loss": -6.836902141571045, "global_step": 168457, "epoch": 4010} {"train_loss": -6.9190897941589355, "global_step": 168458, "epoch": 4010} {"train_loss": -6.984510898590088, "global_step": 168459, "epoch": 4010} {"train_loss": -6.929649353027344, "global_step": 168460, "epoch": 4010} {"train_loss": -7.022963637397403, "global_step": 168461, "epoch": 4010, "val_loss": 79922.0625} {"train_loss": -6.802104473114014, "global_step": 168462, "epoch": 4011} {"train_loss": -6.945047378540039, "global_step": 168463, "epoch": 4011} {"train_loss": -6.837555885314941, "global_step": 168464, "epoch": 4011} {"train_loss": -6.98979377746582, "global_step": 168465, "epoch": 4011} {"train_loss": -6.951862812042236, "global_step": 168466, "epoch": 4011} {"train_loss": -6.975625038146973, "global_step": 168467, "epoch": 4011} {"train_loss": -6.850372314453125, "global_step": 168468, "epoch": 4011} {"train_loss": -6.979610443115234, "global_step": 168469, "epoch": 4011} {"train_loss": -6.956605911254883, "global_step": 168470, "epoch": 4011} {"train_loss": -7.14211368560791, "global_step": 168471, "epoch": 4011} {"train_loss": -7.066514492034912, "global_step": 168472, "epoch": 4011} {"train_loss": -7.073600769042969, "global_step": 168473, "epoch": 4011} {"train_loss": -7.082902908325195, "global_step": 168474, "epoch": 4011} {"train_loss": -7.0738725662231445, "global_step": 168475, "epoch": 4011} {"train_loss": -7.0428466796875, "global_step": 168476, "epoch": 4011} {"train_loss": -7.11733865737915, "global_step": 168477, "epoch": 4011} {"train_loss": -7.0299835205078125, "global_step": 168478, "epoch": 4011} {"train_loss": -7.074584007263184, "global_step": 168479, "epoch": 4011} {"train_loss": -7.0672221183776855, "global_step": 168480, "epoch": 4011} {"train_loss": -7.030330657958984, "global_step": 168481, "epoch": 4011} {"train_loss": -7.055564880371094, "global_step": 168482, "epoch": 4011} {"train_loss": -7.057442665100098, "global_step": 168483, "epoch": 4011} {"train_loss": -7.118829250335693, "global_step": 168484, "epoch": 4011} {"train_loss": -7.120152473449707, "global_step": 168485, "epoch": 4011} {"train_loss": -7.061708927154541, "global_step": 168486, "epoch": 4011} {"train_loss": -6.921512126922607, "global_step": 168487, "epoch": 4011} {"train_loss": -7.018534183502197, "global_step": 168488, "epoch": 4011} {"train_loss": -7.1546478271484375, "global_step": 168489, "epoch": 4011} {"train_loss": -7.04121208190918, "global_step": 168490, "epoch": 4011} {"train_loss": -7.073458671569824, "global_step": 168491, "epoch": 4011} {"train_loss": -7.050882339477539, "global_step": 168492, "epoch": 4011} {"train_loss": -7.156574249267578, "global_step": 168493, "epoch": 4011} {"train_loss": -7.033511161804199, "global_step": 168494, "epoch": 4011} {"train_loss": -7.029060363769531, "global_step": 168495, "epoch": 4011} {"train_loss": -7.018649578094482, "global_step": 168496, "epoch": 4011} {"train_loss": -7.012711048126221, "global_step": 168497, "epoch": 4011} {"train_loss": -6.916022300720215, "global_step": 168498, "epoch": 4011} {"train_loss": -6.750451564788818, "global_step": 168499, "epoch": 4011} {"train_loss": -7.0525221824646, "global_step": 168500, "epoch": 4011} {"train_loss": -7.0601606369018555, "global_step": 168501, "epoch": 4011} {"train_loss": -6.954941272735596, "global_step": 168502, "epoch": 4011} {"train_loss": -7.018136058534894, "global_step": 168503, "epoch": 4011, "val_loss": 79897.4140625} {"train_loss": -7.028069019317627, "global_step": 168504, "epoch": 4012} {"train_loss": -7.013033866882324, "global_step": 168505, "epoch": 4012} {"train_loss": -7.062968730926514, "global_step": 168506, "epoch": 4012} {"train_loss": -7.007004261016846, "global_step": 168507, "epoch": 4012} {"train_loss": -7.072776794433594, "global_step": 168508, "epoch": 4012} {"train_loss": -7.028485298156738, "global_step": 168509, "epoch": 4012} {"train_loss": -7.029303550720215, "global_step": 168510, "epoch": 4012} {"train_loss": -7.081812858581543, "global_step": 168511, "epoch": 4012} {"train_loss": -7.015751838684082, "global_step": 168512, "epoch": 4012} {"train_loss": -7.039256572723389, "global_step": 168513, "epoch": 4012} {"train_loss": -7.015542030334473, "global_step": 168514, "epoch": 4012} {"train_loss": -7.0513176918029785, "global_step": 168515, "epoch": 4012} {"train_loss": -7.145663261413574, "global_step": 168516, "epoch": 4012} {"train_loss": -7.041271686553955, "global_step": 168517, "epoch": 4012} {"train_loss": -7.1140031814575195, "global_step": 168518, "epoch": 4012} {"train_loss": -7.057259559631348, "global_step": 168519, "epoch": 4012} {"train_loss": -6.966200828552246, "global_step": 168520, "epoch": 4012} {"train_loss": -6.919556617736816, "global_step": 168521, "epoch": 4012} {"train_loss": -7.025651931762695, "global_step": 168522, "epoch": 4012} {"train_loss": -7.087968826293945, "global_step": 168523, "epoch": 4012} {"train_loss": -6.881016731262207, "global_step": 168524, "epoch": 4012} {"train_loss": -7.0495500564575195, "global_step": 168525, "epoch": 4012} {"train_loss": -7.0340352058410645, "global_step": 168526, "epoch": 4012} {"train_loss": -7.043403625488281, "global_step": 168527, "epoch": 4012} {"train_loss": -6.9954657554626465, "global_step": 168528, "epoch": 4012} {"train_loss": -7.0671796798706055, "global_step": 168529, "epoch": 4012} {"train_loss": -7.043848037719727, "global_step": 168530, "epoch": 4012} {"train_loss": -7.070297718048096, "global_step": 168531, "epoch": 4012} {"train_loss": -6.935484409332275, "global_step": 168532, "epoch": 4012} {"train_loss": -6.976523399353027, "global_step": 168533, "epoch": 4012} {"train_loss": -7.1053314208984375, "global_step": 168534, "epoch": 4012} {"train_loss": -6.905640602111816, "global_step": 168535, "epoch": 4012} {"train_loss": -6.918837547302246, "global_step": 168536, "epoch": 4012} {"train_loss": -7.015864372253418, "global_step": 168537, "epoch": 4012} {"train_loss": -6.982333183288574, "global_step": 168538, "epoch": 4012} {"train_loss": -7.056861877441406, "global_step": 168539, "epoch": 4012} {"train_loss": -6.932977676391602, "global_step": 168540, "epoch": 4012} {"train_loss": -7.0403523445129395, "global_step": 168541, "epoch": 4012} {"train_loss": -7.209114074707031, "global_step": 168542, "epoch": 4012} {"train_loss": -7.013420104980469, "global_step": 168543, "epoch": 4012} {"train_loss": -7.1517438888549805, "global_step": 168544, "epoch": 4012} {"train_loss": -7.030826489130656, "global_step": 168545, "epoch": 4012, "val_loss": 79809.4453125} {"train_loss": -7.115771293640137, "global_step": 168546, "epoch": 4013} {"train_loss": -7.048497200012207, "global_step": 168547, "epoch": 4013} {"train_loss": -7.062507629394531, "global_step": 168548, "epoch": 4013} {"train_loss": -7.122289657592773, "global_step": 168549, "epoch": 4013} {"train_loss": -7.146716117858887, "global_step": 168550, "epoch": 4013} {"train_loss": -7.117673873901367, "global_step": 168551, "epoch": 4013} {"train_loss": -7.119751930236816, "global_step": 168552, "epoch": 4013} {"train_loss": -7.045340538024902, "global_step": 168553, "epoch": 4013} {"train_loss": -7.094061851501465, "global_step": 168554, "epoch": 4013} {"train_loss": -6.972275733947754, "global_step": 168555, "epoch": 4013} {"train_loss": -7.143733024597168, "global_step": 168556, "epoch": 4013} {"train_loss": -7.080446243286133, "global_step": 168557, "epoch": 4013} {"train_loss": -7.123456954956055, "global_step": 168558, "epoch": 4013} {"train_loss": -7.04034423828125, "global_step": 168559, "epoch": 4013} {"train_loss": -7.189996719360352, "global_step": 168560, "epoch": 4013} {"train_loss": -7.157681465148926, "global_step": 168561, "epoch": 4013} {"train_loss": -7.130189418792725, "global_step": 168562, "epoch": 4013} {"train_loss": -6.940892219543457, "global_step": 168563, "epoch": 4013} {"train_loss": -7.101563453674316, "global_step": 168564, "epoch": 4013} {"train_loss": -6.971499919891357, "global_step": 168565, "epoch": 4013} {"train_loss": -6.904261589050293, "global_step": 168566, "epoch": 4013} {"train_loss": -7.081099033355713, "global_step": 168567, "epoch": 4013} {"train_loss": -7.0735368728637695, "global_step": 168568, "epoch": 4013} {"train_loss": -7.026419162750244, "global_step": 168569, "epoch": 4013} {"train_loss": -7.150125503540039, "global_step": 168570, "epoch": 4013} {"train_loss": -7.085555076599121, "global_step": 168571, "epoch": 4013} {"train_loss": -7.0398430824279785, "global_step": 168572, "epoch": 4013} {"train_loss": -7.043282985687256, "global_step": 168573, "epoch": 4013} {"train_loss": -7.016386032104492, "global_step": 168574, "epoch": 4013} {"train_loss": -7.012845993041992, "global_step": 168575, "epoch": 4013} {"train_loss": -7.121711254119873, "global_step": 168576, "epoch": 4013} {"train_loss": -7.049892902374268, "global_step": 168577, "epoch": 4013} {"train_loss": -7.086602210998535, "global_step": 168578, "epoch": 4013} {"train_loss": -7.009083271026611, "global_step": 168579, "epoch": 4013} {"train_loss": -7.1702880859375, "global_step": 168580, "epoch": 4013} {"train_loss": -7.0703935623168945, "global_step": 168581, "epoch": 4013} {"train_loss": -7.136817932128906, "global_step": 168582, "epoch": 4013} {"train_loss": -7.090545654296875, "global_step": 168583, "epoch": 4013} {"train_loss": -7.019813537597656, "global_step": 168584, "epoch": 4013} {"train_loss": -6.9597625732421875, "global_step": 168585, "epoch": 4013} {"train_loss": -7.090729713439941, "global_step": 168586, "epoch": 4013} {"train_loss": -7.072628963561285, "global_step": 168587, "epoch": 4013, "val_loss": 79851.28125} {"train_loss": -7.025419235229492, "global_step": 168588, "epoch": 4014} {"train_loss": -6.959921360015869, "global_step": 168589, "epoch": 4014} {"train_loss": -7.048346042633057, "global_step": 168590, "epoch": 4014} {"train_loss": -7.019598960876465, "global_step": 168591, "epoch": 4014} {"train_loss": -7.06997013092041, "global_step": 168592, "epoch": 4014} {"train_loss": -7.030362129211426, "global_step": 168593, "epoch": 4014} {"train_loss": -7.030254364013672, "global_step": 168594, "epoch": 4014} {"train_loss": -6.963543891906738, "global_step": 168595, "epoch": 4014} {"train_loss": -6.903985977172852, "global_step": 168596, "epoch": 4014} {"train_loss": -6.976540565490723, "global_step": 168597, "epoch": 4014} {"train_loss": -6.854138374328613, "global_step": 168598, "epoch": 4014} {"train_loss": -6.9249725341796875, "global_step": 168599, "epoch": 4014} {"train_loss": -6.947724342346191, "global_step": 168600, "epoch": 4014} {"train_loss": -6.985543251037598, "global_step": 168601, "epoch": 4014} {"train_loss": -6.9993181228637695, "global_step": 168602, "epoch": 4014} {"train_loss": -7.0409321784973145, "global_step": 168603, "epoch": 4014} {"train_loss": -7.045679092407227, "global_step": 168604, "epoch": 4014} {"train_loss": -7.011185646057129, "global_step": 168605, "epoch": 4014} {"train_loss": -6.973504066467285, "global_step": 168606, "epoch": 4014} {"train_loss": -7.002808570861816, "global_step": 168607, "epoch": 4014} {"train_loss": -7.021886825561523, "global_step": 168608, "epoch": 4014} {"train_loss": -6.998684406280518, "global_step": 168609, "epoch": 4014} {"train_loss": -7.047733306884766, "global_step": 168610, "epoch": 4014} {"train_loss": -7.090549468994141, "global_step": 168611, "epoch": 4014} {"train_loss": -6.966303825378418, "global_step": 168612, "epoch": 4014} {"train_loss": -7.08432149887085, "global_step": 168613, "epoch": 4014} {"train_loss": -7.058681488037109, "global_step": 168614, "epoch": 4014} {"train_loss": -7.087484359741211, "global_step": 168615, "epoch": 4014} {"train_loss": -6.94435977935791, "global_step": 168616, "epoch": 4014} {"train_loss": -7.0117998123168945, "global_step": 168617, "epoch": 4014} {"train_loss": -7.03460693359375, "global_step": 168618, "epoch": 4014} {"train_loss": -7.005265712738037, "global_step": 168619, "epoch": 4014} {"train_loss": -7.118420124053955, "global_step": 168620, "epoch": 4014} {"train_loss": -7.010279655456543, "global_step": 168621, "epoch": 4014} {"train_loss": -6.941229820251465, "global_step": 168622, "epoch": 4014} {"train_loss": -7.0694451332092285, "global_step": 168623, "epoch": 4014} {"train_loss": -7.014857292175293, "global_step": 168624, "epoch": 4014} {"train_loss": -7.065957069396973, "global_step": 168625, "epoch": 4014} {"train_loss": -6.992010593414307, "global_step": 168626, "epoch": 4014} {"train_loss": -7.067077159881592, "global_step": 168627, "epoch": 4014} {"train_loss": -7.156582832336426, "global_step": 168628, "epoch": 4014} {"train_loss": -7.015624443689982, "global_step": 168629, "epoch": 4014, "val_loss": 79607.4375} {"train_loss": -6.983034610748291, "global_step": 168630, "epoch": 4015} {"train_loss": -7.112526893615723, "global_step": 168631, "epoch": 4015} {"train_loss": -7.055180549621582, "global_step": 168632, "epoch": 4015} {"train_loss": -7.043040752410889, "global_step": 168633, "epoch": 4015} {"train_loss": -7.031552791595459, "global_step": 168634, "epoch": 4015} {"train_loss": -6.981541633605957, "global_step": 168635, "epoch": 4015} {"train_loss": -7.03167724609375, "global_step": 168636, "epoch": 4015} {"train_loss": -7.05660343170166, "global_step": 168637, "epoch": 4015} {"train_loss": -7.04466438293457, "global_step": 168638, "epoch": 4015} {"train_loss": -7.060325622558594, "global_step": 168639, "epoch": 4015} {"train_loss": -6.967153549194336, "global_step": 168640, "epoch": 4015} {"train_loss": -7.008705139160156, "global_step": 168641, "epoch": 4015} {"train_loss": -6.906591415405273, "global_step": 168642, "epoch": 4015} {"train_loss": -6.869543075561523, "global_step": 168643, "epoch": 4015} {"train_loss": -7.034399032592773, "global_step": 168644, "epoch": 4015} {"train_loss": -6.906682014465332, "global_step": 168645, "epoch": 4015} {"train_loss": -7.12590217590332, "global_step": 168646, "epoch": 4015} {"train_loss": -7.021500587463379, "global_step": 168647, "epoch": 4015} {"train_loss": -6.849167823791504, "global_step": 168648, "epoch": 4015} {"train_loss": -7.007065773010254, "global_step": 168649, "epoch": 4015} {"train_loss": -6.797816276550293, "global_step": 168650, "epoch": 4015} {"train_loss": -6.933496475219727, "global_step": 168651, "epoch": 4015} {"train_loss": -7.001369476318359, "global_step": 168652, "epoch": 4015} {"train_loss": -6.85982608795166, "global_step": 168653, "epoch": 4015} {"train_loss": -7.04367208480835, "global_step": 168654, "epoch": 4015} {"train_loss": -6.92588996887207, "global_step": 168655, "epoch": 4015} {"train_loss": -6.964015007019043, "global_step": 168656, "epoch": 4015} {"train_loss": -6.88488245010376, "global_step": 168657, "epoch": 4015} {"train_loss": -7.004185676574707, "global_step": 168658, "epoch": 4015} {"train_loss": -7.081658363342285, "global_step": 168659, "epoch": 4015} {"train_loss": -6.995593070983887, "global_step": 168660, "epoch": 4015} {"train_loss": -7.158353805541992, "global_step": 168661, "epoch": 4015} {"train_loss": -7.120393753051758, "global_step": 168662, "epoch": 4015} {"train_loss": -6.938602447509766, "global_step": 168663, "epoch": 4015} {"train_loss": -6.964319705963135, "global_step": 168664, "epoch": 4015} {"train_loss": -6.969392776489258, "global_step": 168665, "epoch": 4015} {"train_loss": -6.991641521453857, "global_step": 168666, "epoch": 4015} {"train_loss": -7.05008602142334, "global_step": 168667, "epoch": 4015} {"train_loss": -7.01603889465332, "global_step": 168668, "epoch": 4015} {"train_loss": -7.001084804534912, "global_step": 168669, "epoch": 4015} {"train_loss": -6.916374683380127, "global_step": 168670, "epoch": 4015} {"train_loss": -6.994343042373657, "global_step": 168671, "epoch": 4015, "val_loss": 79967.7734375} {"train_loss": -7.091253280639648, "global_step": 168672, "epoch": 4016} {"train_loss": -6.9433088302612305, "global_step": 168673, "epoch": 4016} {"train_loss": -7.189813137054443, "global_step": 168674, "epoch": 4016} {"train_loss": -6.9847822189331055, "global_step": 168675, "epoch": 4016} {"train_loss": -6.893110752105713, "global_step": 168676, "epoch": 4016} {"train_loss": -7.05947208404541, "global_step": 168677, "epoch": 4016} {"train_loss": -6.796714782714844, "global_step": 168678, "epoch": 4016} {"train_loss": -7.087724685668945, "global_step": 168679, "epoch": 4016} {"train_loss": -6.979006767272949, "global_step": 168680, "epoch": 4016} {"train_loss": -6.974047660827637, "global_step": 168681, "epoch": 4016} {"train_loss": -7.1114912033081055, "global_step": 168682, "epoch": 4016} {"train_loss": -7.084689140319824, "global_step": 168683, "epoch": 4016} {"train_loss": -6.969998359680176, "global_step": 168684, "epoch": 4016} {"train_loss": -7.0766401290893555, "global_step": 168685, "epoch": 4016} {"train_loss": -7.041365623474121, "global_step": 168686, "epoch": 4016} {"train_loss": -7.004149436950684, "global_step": 168687, "epoch": 4016} {"train_loss": -7.056536674499512, "global_step": 168688, "epoch": 4016} {"train_loss": -6.966607093811035, "global_step": 168689, "epoch": 4016} {"train_loss": -6.997870445251465, "global_step": 168690, "epoch": 4016} {"train_loss": -7.131829261779785, "global_step": 168691, "epoch": 4016} {"train_loss": -6.995152473449707, "global_step": 168692, "epoch": 4016} {"train_loss": -7.121657371520996, "global_step": 168693, "epoch": 4016} {"train_loss": -7.036685943603516, "global_step": 168694, "epoch": 4016} {"train_loss": -7.061487197875977, "global_step": 168695, "epoch": 4016} {"train_loss": -7.024298667907715, "global_step": 168696, "epoch": 4016} {"train_loss": -6.983449935913086, "global_step": 168697, "epoch": 4016} {"train_loss": -7.029445648193359, "global_step": 168698, "epoch": 4016} {"train_loss": -7.0840911865234375, "global_step": 168699, "epoch": 4016} {"train_loss": -7.114637851715088, "global_step": 168700, "epoch": 4016} {"train_loss": -7.074979782104492, "global_step": 168701, "epoch": 4016} {"train_loss": -7.082947731018066, "global_step": 168702, "epoch": 4016} {"train_loss": -7.120489120483398, "global_step": 168703, "epoch": 4016} {"train_loss": -7.08511209487915, "global_step": 168704, "epoch": 4016} {"train_loss": -7.082517623901367, "global_step": 168705, "epoch": 4016} {"train_loss": -7.115685939788818, "global_step": 168706, "epoch": 4016} {"train_loss": -7.0402116775512695, "global_step": 168707, "epoch": 4016} {"train_loss": -7.073864936828613, "global_step": 168708, "epoch": 4016} {"train_loss": -7.161550521850586, "global_step": 168709, "epoch": 4016} {"train_loss": -7.0245256423950195, "global_step": 168710, "epoch": 4016} {"train_loss": -7.0568389892578125, "global_step": 168711, "epoch": 4016} {"train_loss": -7.184436798095703, "global_step": 168712, "epoch": 4016} {"train_loss": -7.0482456002916605, "global_step": 168713, "epoch": 4016, "val_loss": 79896.90625} {"train_loss": -7.03787088394165, "global_step": 168714, "epoch": 4017} {"train_loss": -7.074349880218506, "global_step": 168715, "epoch": 4017} {"train_loss": -7.016725063323975, "global_step": 168716, "epoch": 4017} {"train_loss": -7.0291948318481445, "global_step": 168717, "epoch": 4017} {"train_loss": -7.0107879638671875, "global_step": 168718, "epoch": 4017} {"train_loss": -6.947482109069824, "global_step": 168719, "epoch": 4017} {"train_loss": -7.026021957397461, "global_step": 168720, "epoch": 4017} {"train_loss": -6.992792129516602, "global_step": 168721, "epoch": 4017} {"train_loss": -7.064174175262451, "global_step": 168722, "epoch": 4017} {"train_loss": -7.107939720153809, "global_step": 168723, "epoch": 4017} {"train_loss": -7.028202056884766, "global_step": 168724, "epoch": 4017} {"train_loss": -7.061836242675781, "global_step": 168725, "epoch": 4017} {"train_loss": -7.081954479217529, "global_step": 168726, "epoch": 4017} {"train_loss": -6.989647388458252, "global_step": 168727, "epoch": 4017} {"train_loss": -7.162479877471924, "global_step": 168728, "epoch": 4017} {"train_loss": -7.062784194946289, "global_step": 168729, "epoch": 4017} {"train_loss": -7.036818027496338, "global_step": 168730, "epoch": 4017} {"train_loss": -7.10274600982666, "global_step": 168731, "epoch": 4017} {"train_loss": -7.006261825561523, "global_step": 168732, "epoch": 4017} {"train_loss": -7.056033134460449, "global_step": 168733, "epoch": 4017} {"train_loss": -7.088499069213867, "global_step": 168734, "epoch": 4017} {"train_loss": -7.08341646194458, "global_step": 168735, "epoch": 4017} {"train_loss": -6.99847936630249, "global_step": 168736, "epoch": 4017} {"train_loss": -7.069558143615723, "global_step": 168737, "epoch": 4017} {"train_loss": -7.117676258087158, "global_step": 168738, "epoch": 4017} {"train_loss": -6.991881370544434, "global_step": 168739, "epoch": 4017} {"train_loss": -6.975058078765869, "global_step": 168740, "epoch": 4017} {"train_loss": -6.984235763549805, "global_step": 168741, "epoch": 4017} {"train_loss": -6.983613967895508, "global_step": 168742, "epoch": 4017} {"train_loss": -6.93638801574707, "global_step": 168743, "epoch": 4017} {"train_loss": -7.11952018737793, "global_step": 168744, "epoch": 4017} {"train_loss": -7.011582374572754, "global_step": 168745, "epoch": 4017} {"train_loss": -7.128707408905029, "global_step": 168746, "epoch": 4017} {"train_loss": -7.0180344581604, "global_step": 168747, "epoch": 4017} {"train_loss": -6.905428886413574, "global_step": 168748, "epoch": 4017} {"train_loss": -7.00084924697876, "global_step": 168749, "epoch": 4017} {"train_loss": -7.082823753356934, "global_step": 168750, "epoch": 4017} {"train_loss": -7.072895050048828, "global_step": 168751, "epoch": 4017} {"train_loss": -7.026165962219238, "global_step": 168752, "epoch": 4017} {"train_loss": -7.159397125244141, "global_step": 168753, "epoch": 4017} {"train_loss": -7.110415458679199, "global_step": 168754, "epoch": 4017} {"train_loss": -7.046661422366188, "global_step": 168755, "epoch": 4017, "val_loss": 79667.1953125} {"train_loss": -6.931989669799805, "global_step": 168756, "epoch": 4018} {"train_loss": -7.206949234008789, "global_step": 168757, "epoch": 4018} {"train_loss": -6.937281608581543, "global_step": 168758, "epoch": 4018} {"train_loss": -6.982760429382324, "global_step": 168759, "epoch": 4018} {"train_loss": -7.045077800750732, "global_step": 168760, "epoch": 4018} {"train_loss": -6.969839096069336, "global_step": 168761, "epoch": 4018} {"train_loss": -6.7360310554504395, "global_step": 168762, "epoch": 4018} {"train_loss": -6.8430562019348145, "global_step": 168763, "epoch": 4018} {"train_loss": -6.822425365447998, "global_step": 168764, "epoch": 4018} {"train_loss": -6.9196696281433105, "global_step": 168765, "epoch": 4018} {"train_loss": -6.87375545501709, "global_step": 168766, "epoch": 4018} {"train_loss": -6.912057399749756, "global_step": 168767, "epoch": 4018} {"train_loss": -6.795403480529785, "global_step": 168768, "epoch": 4018} {"train_loss": -6.758572578430176, "global_step": 168769, "epoch": 4018} {"train_loss": -6.914615631103516, "global_step": 168770, "epoch": 4018} {"train_loss": -6.827412128448486, "global_step": 168771, "epoch": 4018} {"train_loss": -6.680254936218262, "global_step": 168772, "epoch": 4018} {"train_loss": -6.657487869262695, "global_step": 168773, "epoch": 4018} {"train_loss": -6.8822832107543945, "global_step": 168774, "epoch": 4018} {"train_loss": -6.683231353759766, "global_step": 168775, "epoch": 4018} {"train_loss": -6.7612690925598145, "global_step": 168776, "epoch": 4018} {"train_loss": -6.795091152191162, "global_step": 168777, "epoch": 4018} {"train_loss": -6.9442596435546875, "global_step": 168778, "epoch": 4018} {"train_loss": -6.8757734298706055, "global_step": 168779, "epoch": 4018} {"train_loss": -6.867975234985352, "global_step": 168780, "epoch": 4018} {"train_loss": -6.849015235900879, "global_step": 168781, "epoch": 4018} {"train_loss": -6.789121150970459, "global_step": 168782, "epoch": 4018} {"train_loss": -6.8674468994140625, "global_step": 168783, "epoch": 4018} {"train_loss": -6.825813293457031, "global_step": 168784, "epoch": 4018} {"train_loss": -7.06010627746582, "global_step": 168785, "epoch": 4018} {"train_loss": -6.852330684661865, "global_step": 168786, "epoch": 4018} {"train_loss": -6.901340484619141, "global_step": 168787, "epoch": 4018} {"train_loss": -6.990817070007324, "global_step": 168788, "epoch": 4018} {"train_loss": -6.934928894042969, "global_step": 168789, "epoch": 4018} {"train_loss": -7.039480209350586, "global_step": 168790, "epoch": 4018} {"train_loss": -6.953180313110352, "global_step": 168791, "epoch": 4018} {"train_loss": -6.907281875610352, "global_step": 168792, "epoch": 4018} {"train_loss": -6.997177600860596, "global_step": 168793, "epoch": 4018} {"train_loss": -7.015228271484375, "global_step": 168794, "epoch": 4018} {"train_loss": -7.019309997558594, "global_step": 168795, "epoch": 4018} {"train_loss": -6.994180679321289, "global_step": 168796, "epoch": 4018} {"train_loss": -6.8969298884982155, "global_step": 168797, "epoch": 4018, "val_loss": 79745.453125} {"train_loss": -7.028519630432129, "global_step": 168798, "epoch": 4019} {"train_loss": -6.974823951721191, "global_step": 168799, "epoch": 4019} {"train_loss": -7.004998207092285, "global_step": 168800, "epoch": 4019} {"train_loss": -7.001377582550049, "global_step": 168801, "epoch": 4019} {"train_loss": -6.950862407684326, "global_step": 168802, "epoch": 4019} {"train_loss": -7.088953495025635, "global_step": 168803, "epoch": 4019} {"train_loss": -7.142409801483154, "global_step": 168804, "epoch": 4019} {"train_loss": -7.020928382873535, "global_step": 168805, "epoch": 4019} {"train_loss": -6.925359725952148, "global_step": 168806, "epoch": 4019} {"train_loss": -7.0229902267456055, "global_step": 168807, "epoch": 4019} {"train_loss": -7.036876678466797, "global_step": 168808, "epoch": 4019} {"train_loss": -7.071061611175537, "global_step": 168809, "epoch": 4019} {"train_loss": -7.138779163360596, "global_step": 168810, "epoch": 4019} {"train_loss": -6.986287593841553, "global_step": 168811, "epoch": 4019} {"train_loss": -7.1020002365112305, "global_step": 168812, "epoch": 4019} {"train_loss": -7.106108665466309, "global_step": 168813, "epoch": 4019} {"train_loss": -7.143631935119629, "global_step": 168814, "epoch": 4019} {"train_loss": -7.100973606109619, "global_step": 168815, "epoch": 4019} {"train_loss": -6.978873252868652, "global_step": 168816, "epoch": 4019} {"train_loss": -7.166500568389893, "global_step": 168817, "epoch": 4019} {"train_loss": -7.07212495803833, "global_step": 168818, "epoch": 4019} {"train_loss": -7.110396385192871, "global_step": 168819, "epoch": 4019} {"train_loss": -7.17039680480957, "global_step": 168820, "epoch": 4019} {"train_loss": -7.070586681365967, "global_step": 168821, "epoch": 4019} {"train_loss": -7.086858749389648, "global_step": 168822, "epoch": 4019} {"train_loss": -7.046932697296143, "global_step": 168823, "epoch": 4019} {"train_loss": -7.06709098815918, "global_step": 168824, "epoch": 4019} {"train_loss": -7.126649856567383, "global_step": 168825, "epoch": 4019} {"train_loss": -7.084229469299316, "global_step": 168826, "epoch": 4019} {"train_loss": -7.077345371246338, "global_step": 168827, "epoch": 4019} {"train_loss": -7.047368049621582, "global_step": 168828, "epoch": 4019} {"train_loss": -7.060360431671143, "global_step": 168829, "epoch": 4019} {"train_loss": -7.159368991851807, "global_step": 168830, "epoch": 4019} {"train_loss": -7.024718284606934, "global_step": 168831, "epoch": 4019} {"train_loss": -6.962466239929199, "global_step": 168832, "epoch": 4019} {"train_loss": -6.963122844696045, "global_step": 168833, "epoch": 4019} {"train_loss": -7.018576622009277, "global_step": 168834, "epoch": 4019} {"train_loss": -7.106358528137207, "global_step": 168835, "epoch": 4019} {"train_loss": -7.013556480407715, "global_step": 168836, "epoch": 4019} {"train_loss": -7.118895530700684, "global_step": 168837, "epoch": 4019} {"train_loss": -6.919592380523682, "global_step": 168838, "epoch": 4019} {"train_loss": -7.0565113226572675, "global_step": 168839, "epoch": 4019, "val_loss": 79768.9140625} {"train_loss": -7.05372953414917, "global_step": 168840, "epoch": 4020} {"train_loss": -7.003411293029785, "global_step": 168841, "epoch": 4020} {"train_loss": -7.053147315979004, "global_step": 168842, "epoch": 4020} {"train_loss": -6.955361366271973, "global_step": 168843, "epoch": 4020} {"train_loss": -6.895787239074707, "global_step": 168844, "epoch": 4020} {"train_loss": -7.03590202331543, "global_step": 168845, "epoch": 4020} {"train_loss": -6.854123115539551, "global_step": 168846, "epoch": 4020} {"train_loss": -6.8329620361328125, "global_step": 168847, "epoch": 4020} {"train_loss": -7.153814315795898, "global_step": 168848, "epoch": 4020} {"train_loss": -7.083054065704346, "global_step": 168849, "epoch": 4020} {"train_loss": -7.0073041915893555, "global_step": 168850, "epoch": 4020} {"train_loss": -7.022172451019287, "global_step": 168851, "epoch": 4020} {"train_loss": -6.994753837585449, "global_step": 168852, "epoch": 4020} {"train_loss": -6.918999671936035, "global_step": 168853, "epoch": 4020} {"train_loss": -7.089015007019043, "global_step": 168854, "epoch": 4020} {"train_loss": -6.96424674987793, "global_step": 168855, "epoch": 4020} {"train_loss": -6.929198265075684, "global_step": 168856, "epoch": 4020} {"train_loss": -7.01662540435791, "global_step": 168857, "epoch": 4020} {"train_loss": -7.070642471313477, "global_step": 168858, "epoch": 4020} {"train_loss": -7.123711585998535, "global_step": 168859, "epoch": 4020} {"train_loss": -6.990922451019287, "global_step": 168860, "epoch": 4020} {"train_loss": -7.039273262023926, "global_step": 168861, "epoch": 4020} {"train_loss": -6.930356979370117, "global_step": 168862, "epoch": 4020} {"train_loss": -7.045947074890137, "global_step": 168863, "epoch": 4020} {"train_loss": -6.974367618560791, "global_step": 168864, "epoch": 4020} {"train_loss": -7.002745151519775, "global_step": 168865, "epoch": 4020} {"train_loss": -7.015862941741943, "global_step": 168866, "epoch": 4020} {"train_loss": -6.903736114501953, "global_step": 168867, "epoch": 4020} {"train_loss": -7.0854082107543945, "global_step": 168868, "epoch": 4020} {"train_loss": -6.922581195831299, "global_step": 168869, "epoch": 4020} {"train_loss": -6.730287551879883, "global_step": 168870, "epoch": 4020} {"train_loss": -6.99826717376709, "global_step": 168871, "epoch": 4020} {"train_loss": -6.880792617797852, "global_step": 168872, "epoch": 4020} {"train_loss": -6.852703094482422, "global_step": 168873, "epoch": 4020} {"train_loss": -7.034661769866943, "global_step": 168874, "epoch": 4020} {"train_loss": -6.765151500701904, "global_step": 168875, "epoch": 4020} {"train_loss": -6.947961330413818, "global_step": 168876, "epoch": 4020} {"train_loss": -6.876960754394531, "global_step": 168877, "epoch": 4020} {"train_loss": -6.978394985198975, "global_step": 168878, "epoch": 4020} {"train_loss": -6.991044998168945, "global_step": 168879, "epoch": 4020} {"train_loss": -6.869041442871094, "global_step": 168880, "epoch": 4020} {"train_loss": -6.972107455843971, "global_step": 168881, "epoch": 4020, "val_loss": 79732.6640625} {"train_loss": -6.981196403503418, "global_step": 168882, "epoch": 4021} {"train_loss": -6.898561000823975, "global_step": 168883, "epoch": 4021} {"train_loss": -7.025535583496094, "global_step": 168884, "epoch": 4021} {"train_loss": -6.952760219573975, "global_step": 168885, "epoch": 4021} {"train_loss": -6.970355033874512, "global_step": 168886, "epoch": 4021} {"train_loss": -7.0355963706970215, "global_step": 168887, "epoch": 4021} {"train_loss": -7.020496368408203, "global_step": 168888, "epoch": 4021} {"train_loss": -7.0242414474487305, "global_step": 168889, "epoch": 4021} {"train_loss": -7.068188190460205, "global_step": 168890, "epoch": 4021} {"train_loss": -6.999113082885742, "global_step": 168891, "epoch": 4021} {"train_loss": -7.0100226402282715, "global_step": 168892, "epoch": 4021} {"train_loss": -7.043444633483887, "global_step": 168893, "epoch": 4021} {"train_loss": -6.894184112548828, "global_step": 168894, "epoch": 4021} {"train_loss": -7.034305572509766, "global_step": 168895, "epoch": 4021} {"train_loss": -6.976275444030762, "global_step": 168896, "epoch": 4021} {"train_loss": -6.9251837730407715, "global_step": 168897, "epoch": 4021} {"train_loss": -7.061666011810303, "global_step": 168898, "epoch": 4021} {"train_loss": -7.021773338317871, "global_step": 168899, "epoch": 4021} {"train_loss": -6.979283332824707, "global_step": 168900, "epoch": 4021} {"train_loss": -6.936282634735107, "global_step": 168901, "epoch": 4021} {"train_loss": -7.073939323425293, "global_step": 168902, "epoch": 4021} {"train_loss": -6.945587158203125, "global_step": 168903, "epoch": 4021} {"train_loss": -6.917166709899902, "global_step": 168904, "epoch": 4021} {"train_loss": -7.046195983886719, "global_step": 168905, "epoch": 4021} {"train_loss": -6.940412521362305, "global_step": 168906, "epoch": 4021} {"train_loss": -7.073065757751465, "global_step": 168907, "epoch": 4021} {"train_loss": -6.975724220275879, "global_step": 168908, "epoch": 4021} {"train_loss": -7.0739336013793945, "global_step": 168909, "epoch": 4021} {"train_loss": -7.0584187507629395, "global_step": 168910, "epoch": 4021} {"train_loss": -6.955115795135498, "global_step": 168911, "epoch": 4021} {"train_loss": -6.938826084136963, "global_step": 168912, "epoch": 4021} {"train_loss": -6.968865394592285, "global_step": 168913, "epoch": 4021} {"train_loss": -6.880406856536865, "global_step": 168914, "epoch": 4021} {"train_loss": -6.985210418701172, "global_step": 168915, "epoch": 4021} {"train_loss": -7.099581241607666, "global_step": 168916, "epoch": 4021} {"train_loss": -6.925830841064453, "global_step": 168917, "epoch": 4021} {"train_loss": -7.060399532318115, "global_step": 168918, "epoch": 4021} {"train_loss": -6.914844036102295, "global_step": 168919, "epoch": 4021} {"train_loss": -6.8631672859191895, "global_step": 168920, "epoch": 4021} {"train_loss": -7.051068305969238, "global_step": 168921, "epoch": 4021} {"train_loss": -6.940526962280273, "global_step": 168922, "epoch": 4021} {"train_loss": -6.988899730500721, "global_step": 168923, "epoch": 4021, "val_loss": 79755.2890625} {"train_loss": -7.085017204284668, "global_step": 168924, "epoch": 4022} {"train_loss": -7.0496826171875, "global_step": 168925, "epoch": 4022} {"train_loss": -6.98756217956543, "global_step": 168926, "epoch": 4022} {"train_loss": -7.1056318283081055, "global_step": 168927, "epoch": 4022} {"train_loss": -6.996986389160156, "global_step": 168928, "epoch": 4022} {"train_loss": -7.062345504760742, "global_step": 168929, "epoch": 4022} {"train_loss": -7.057992458343506, "global_step": 168930, "epoch": 4022} {"train_loss": -7.11842679977417, "global_step": 168931, "epoch": 4022} {"train_loss": -7.107612609863281, "global_step": 168932, "epoch": 4022} {"train_loss": -7.13557243347168, "global_step": 168933, "epoch": 4022} {"train_loss": -6.959552764892578, "global_step": 168934, "epoch": 4022} {"train_loss": -6.975395202636719, "global_step": 168935, "epoch": 4022} {"train_loss": -7.07119083404541, "global_step": 168936, "epoch": 4022} {"train_loss": -7.037969589233398, "global_step": 168937, "epoch": 4022} {"train_loss": -7.055279731750488, "global_step": 168938, "epoch": 4022} {"train_loss": -6.996079921722412, "global_step": 168939, "epoch": 4022} {"train_loss": -7.026283264160156, "global_step": 168940, "epoch": 4022} {"train_loss": -7.026169300079346, "global_step": 168941, "epoch": 4022} {"train_loss": -7.066414833068848, "global_step": 168942, "epoch": 4022} {"train_loss": -7.161162376403809, "global_step": 168943, "epoch": 4022} {"train_loss": -7.114331245422363, "global_step": 168944, "epoch": 4022} {"train_loss": -6.989120006561279, "global_step": 168945, "epoch": 4022} {"train_loss": -7.046632766723633, "global_step": 168946, "epoch": 4022} {"train_loss": -6.998635292053223, "global_step": 168947, "epoch": 4022} {"train_loss": -7.0583038330078125, "global_step": 168948, "epoch": 4022} {"train_loss": -7.0315680503845215, "global_step": 168949, "epoch": 4022} {"train_loss": -6.925084590911865, "global_step": 168950, "epoch": 4022} {"train_loss": -6.98957633972168, "global_step": 168951, "epoch": 4022} {"train_loss": -6.942032337188721, "global_step": 168952, "epoch": 4022} {"train_loss": -7.1025390625, "global_step": 168953, "epoch": 4022} {"train_loss": -7.051793098449707, "global_step": 168954, "epoch": 4022} {"train_loss": -6.971296310424805, "global_step": 168955, "epoch": 4022} {"train_loss": -7.158205032348633, "global_step": 168956, "epoch": 4022} {"train_loss": -7.026072978973389, "global_step": 168957, "epoch": 4022} {"train_loss": -6.944609642028809, "global_step": 168958, "epoch": 4022} {"train_loss": -7.085306167602539, "global_step": 168959, "epoch": 4022} {"train_loss": -7.0629987716674805, "global_step": 168960, "epoch": 4022} {"train_loss": -7.122152328491211, "global_step": 168961, "epoch": 4022} {"train_loss": -7.05757999420166, "global_step": 168962, "epoch": 4022} {"train_loss": -7.168089866638184, "global_step": 168963, "epoch": 4022} {"train_loss": -7.072854995727539, "global_step": 168964, "epoch": 4022} {"train_loss": -7.047784850710914, "global_step": 168965, "epoch": 4022, "val_loss": 79895.4921875} {"train_loss": -7.0325775146484375, "global_step": 168966, "epoch": 4023} {"train_loss": -7.013491153717041, "global_step": 168967, "epoch": 4023} {"train_loss": -7.017760276794434, "global_step": 168968, "epoch": 4023} {"train_loss": -7.082427501678467, "global_step": 168969, "epoch": 4023} {"train_loss": -7.0883283615112305, "global_step": 168970, "epoch": 4023} {"train_loss": -7.0397820472717285, "global_step": 168971, "epoch": 4023} {"train_loss": -7.110926628112793, "global_step": 168972, "epoch": 4023} {"train_loss": -6.9842352867126465, "global_step": 168973, "epoch": 4023} {"train_loss": -7.025490760803223, "global_step": 168974, "epoch": 4023} {"train_loss": -7.014029502868652, "global_step": 168975, "epoch": 4023} {"train_loss": -7.0888848304748535, "global_step": 168976, "epoch": 4023} {"train_loss": -7.069320201873779, "global_step": 168977, "epoch": 4023} {"train_loss": -7.0196123123168945, "global_step": 168978, "epoch": 4023} {"train_loss": -6.957004547119141, "global_step": 168979, "epoch": 4023} {"train_loss": -7.1891350746154785, "global_step": 168980, "epoch": 4023} {"train_loss": -7.017343997955322, "global_step": 168981, "epoch": 4023} {"train_loss": -7.09887170791626, "global_step": 168982, "epoch": 4023} {"train_loss": -7.1468915939331055, "global_step": 168983, "epoch": 4023} {"train_loss": -7.055039405822754, "global_step": 168984, "epoch": 4023} {"train_loss": -7.2054643630981445, "global_step": 168985, "epoch": 4023} {"train_loss": -7.072601318359375, "global_step": 168986, "epoch": 4023} {"train_loss": -7.170116424560547, "global_step": 168987, "epoch": 4023} {"train_loss": -6.993516445159912, "global_step": 168988, "epoch": 4023} {"train_loss": -7.091187477111816, "global_step": 168989, "epoch": 4023} {"train_loss": -7.124465465545654, "global_step": 168990, "epoch": 4023} {"train_loss": -7.1107354164123535, "global_step": 168991, "epoch": 4023} {"train_loss": -7.0136613845825195, "global_step": 168992, "epoch": 4023} {"train_loss": -7.104920864105225, "global_step": 168993, "epoch": 4023} {"train_loss": -7.1569390296936035, "global_step": 168994, "epoch": 4023} {"train_loss": -7.088613033294678, "global_step": 168995, "epoch": 4023} {"train_loss": -6.963676452636719, "global_step": 168996, "epoch": 4023} {"train_loss": -7.068355560302734, "global_step": 168997, "epoch": 4023} {"train_loss": -7.052777290344238, "global_step": 168998, "epoch": 4023} {"train_loss": -7.049186706542969, "global_step": 168999, "epoch": 4023} {"train_loss": -7.0146331787109375, "global_step": 169000, "epoch": 4023} {"train_loss": -6.874242782592773, "global_step": 169001, "epoch": 4023} {"train_loss": -7.136754989624023, "global_step": 169002, "epoch": 4023} {"train_loss": -7.183344841003418, "global_step": 169003, "epoch": 4023} {"train_loss": -6.931373596191406, "global_step": 169004, "epoch": 4023} {"train_loss": -7.059035778045654, "global_step": 169005, "epoch": 4023} {"train_loss": -6.997995376586914, "global_step": 169006, "epoch": 4023} {"train_loss": -7.059445506050473, "global_step": 169007, "epoch": 4023, "val_loss": 79841.4140625} {"train_loss": -7.030868053436279, "global_step": 169008, "epoch": 4024} {"train_loss": -7.010092258453369, "global_step": 169009, "epoch": 4024} {"train_loss": -7.051830291748047, "global_step": 169010, "epoch": 4024} {"train_loss": -7.022871494293213, "global_step": 169011, "epoch": 4024} {"train_loss": -7.017815589904785, "global_step": 169012, "epoch": 4024} {"train_loss": -7.001564025878906, "global_step": 169013, "epoch": 4024} {"train_loss": -7.054206848144531, "global_step": 169014, "epoch": 4024} {"train_loss": -6.982037544250488, "global_step": 169015, "epoch": 4024} {"train_loss": -6.943893909454346, "global_step": 169016, "epoch": 4024} {"train_loss": -7.161511421203613, "global_step": 169017, "epoch": 4024} {"train_loss": -7.037644863128662, "global_step": 169018, "epoch": 4024} {"train_loss": -6.989989757537842, "global_step": 169019, "epoch": 4024} {"train_loss": -7.046599864959717, "global_step": 169020, "epoch": 4024} {"train_loss": -7.018135070800781, "global_step": 169021, "epoch": 4024} {"train_loss": -6.94895601272583, "global_step": 169022, "epoch": 4024} {"train_loss": -7.0569963455200195, "global_step": 169023, "epoch": 4024} {"train_loss": -7.021671772003174, "global_step": 169024, "epoch": 4024} {"train_loss": -7.041591644287109, "global_step": 169025, "epoch": 4024} {"train_loss": -7.029443740844727, "global_step": 169026, "epoch": 4024} {"train_loss": -7.155357360839844, "global_step": 169027, "epoch": 4024} {"train_loss": -6.984004974365234, "global_step": 169028, "epoch": 4024} {"train_loss": -7.069357872009277, "global_step": 169029, "epoch": 4024} {"train_loss": -7.012104511260986, "global_step": 169030, "epoch": 4024} {"train_loss": -6.986517429351807, "global_step": 169031, "epoch": 4024} {"train_loss": -7.0345659255981445, "global_step": 169032, "epoch": 4024} {"train_loss": -6.874862194061279, "global_step": 169033, "epoch": 4024} {"train_loss": -7.095180511474609, "global_step": 169034, "epoch": 4024} {"train_loss": -7.013962745666504, "global_step": 169035, "epoch": 4024} {"train_loss": -7.120328903198242, "global_step": 169036, "epoch": 4024} {"train_loss": -7.062135696411133, "global_step": 169037, "epoch": 4024} {"train_loss": -7.0222554206848145, "global_step": 169038, "epoch": 4024} {"train_loss": -7.044186115264893, "global_step": 169039, "epoch": 4024} {"train_loss": -7.045690059661865, "global_step": 169040, "epoch": 4024} {"train_loss": -7.053879261016846, "global_step": 169041, "epoch": 4024} {"train_loss": -7.063005447387695, "global_step": 169042, "epoch": 4024} {"train_loss": -7.195769309997559, "global_step": 169043, "epoch": 4024} {"train_loss": -7.1389875411987305, "global_step": 169044, "epoch": 4024} {"train_loss": -7.044084072113037, "global_step": 169045, "epoch": 4024} {"train_loss": -7.019587516784668, "global_step": 169046, "epoch": 4024} {"train_loss": -7.142044544219971, "global_step": 169047, "epoch": 4024} {"train_loss": -7.099745273590088, "global_step": 169048, "epoch": 4024} {"train_loss": -7.042835360481625, "global_step": 169049, "epoch": 4024, "val_loss": 79880.234375} {"train_loss": -7.03029727935791, "global_step": 169050, "epoch": 4025} {"train_loss": -7.120026588439941, "global_step": 169051, "epoch": 4025} {"train_loss": -7.009554862976074, "global_step": 169052, "epoch": 4025} {"train_loss": -7.0007219314575195, "global_step": 169053, "epoch": 4025} {"train_loss": -7.128604412078857, "global_step": 169054, "epoch": 4025} {"train_loss": -7.066577911376953, "global_step": 169055, "epoch": 4025} {"train_loss": -7.132416725158691, "global_step": 169056, "epoch": 4025} {"train_loss": -7.06057071685791, "global_step": 169057, "epoch": 4025} {"train_loss": -7.151845455169678, "global_step": 169058, "epoch": 4025} {"train_loss": -7.158411502838135, "global_step": 169059, "epoch": 4025} {"train_loss": -7.01689338684082, "global_step": 169060, "epoch": 4025} {"train_loss": -7.051144599914551, "global_step": 169061, "epoch": 4025} {"train_loss": -6.994340896606445, "global_step": 169062, "epoch": 4025} {"train_loss": -6.979827880859375, "global_step": 169063, "epoch": 4025} {"train_loss": -7.162346839904785, "global_step": 169064, "epoch": 4025} {"train_loss": -7.0665178298950195, "global_step": 169065, "epoch": 4025} {"train_loss": -7.01535177230835, "global_step": 169066, "epoch": 4025} {"train_loss": -7.0369553565979, "global_step": 169067, "epoch": 4025} {"train_loss": -7.0183515548706055, "global_step": 169068, "epoch": 4025} {"train_loss": -6.990979194641113, "global_step": 169069, "epoch": 4025} {"train_loss": -7.123712539672852, "global_step": 169070, "epoch": 4025} {"train_loss": -7.095741271972656, "global_step": 169071, "epoch": 4025} {"train_loss": -7.191549301147461, "global_step": 169072, "epoch": 4025} {"train_loss": -6.94035005569458, "global_step": 169073, "epoch": 4025} {"train_loss": -7.029993534088135, "global_step": 169074, "epoch": 4025} {"train_loss": -7.0148820877075195, "global_step": 169075, "epoch": 4025} {"train_loss": -6.986370086669922, "global_step": 169076, "epoch": 4025} {"train_loss": -7.1382670402526855, "global_step": 169077, "epoch": 4025} {"train_loss": -7.076778411865234, "global_step": 169078, "epoch": 4025} {"train_loss": -7.078714370727539, "global_step": 169079, "epoch": 4025} {"train_loss": -7.0283074378967285, "global_step": 169080, "epoch": 4025} {"train_loss": -7.044371604919434, "global_step": 169081, "epoch": 4025} {"train_loss": -7.0517258644104, "global_step": 169082, "epoch": 4025} {"train_loss": -7.021485328674316, "global_step": 169083, "epoch": 4025} {"train_loss": -7.070216178894043, "global_step": 169084, "epoch": 4025} {"train_loss": -6.962533473968506, "global_step": 169085, "epoch": 4025} {"train_loss": -7.062103271484375, "global_step": 169086, "epoch": 4025} {"train_loss": -7.031520843505859, "global_step": 169087, "epoch": 4025} {"train_loss": -6.911562919616699, "global_step": 169088, "epoch": 4025} {"train_loss": -7.0236430168151855, "global_step": 169089, "epoch": 4025} {"train_loss": -7.0366315841674805, "global_step": 169090, "epoch": 4025} {"train_loss": -7.051271495364961, "global_step": 169091, "epoch": 4025, "val_loss": 79915.5390625} {"train_loss": -6.965963363647461, "global_step": 169092, "epoch": 4026} {"train_loss": -7.058750152587891, "global_step": 169093, "epoch": 4026} {"train_loss": -7.025650501251221, "global_step": 169094, "epoch": 4026} {"train_loss": -6.969461917877197, "global_step": 169095, "epoch": 4026} {"train_loss": -7.14521598815918, "global_step": 169096, "epoch": 4026} {"train_loss": -6.929645538330078, "global_step": 169097, "epoch": 4026} {"train_loss": -6.948838233947754, "global_step": 169098, "epoch": 4026} {"train_loss": -7.104803562164307, "global_step": 169099, "epoch": 4026} {"train_loss": -6.925200462341309, "global_step": 169100, "epoch": 4026} {"train_loss": -7.027198791503906, "global_step": 169101, "epoch": 4026} {"train_loss": -6.956650733947754, "global_step": 169102, "epoch": 4026} {"train_loss": -6.848973751068115, "global_step": 169103, "epoch": 4026} {"train_loss": -7.051547050476074, "global_step": 169104, "epoch": 4026} {"train_loss": -6.933913230895996, "global_step": 169105, "epoch": 4026} {"train_loss": -6.826139450073242, "global_step": 169106, "epoch": 4026} {"train_loss": -7.024694442749023, "global_step": 169107, "epoch": 4026} {"train_loss": -6.817163467407227, "global_step": 169108, "epoch": 4026} {"train_loss": -6.86988639831543, "global_step": 169109, "epoch": 4026} {"train_loss": -7.014171123504639, "global_step": 169110, "epoch": 4026} {"train_loss": -6.796515941619873, "global_step": 169111, "epoch": 4026} {"train_loss": -6.905914306640625, "global_step": 169112, "epoch": 4026} {"train_loss": -6.855042457580566, "global_step": 169113, "epoch": 4026} {"train_loss": -6.9131317138671875, "global_step": 169114, "epoch": 4026} {"train_loss": -6.812980651855469, "global_step": 169115, "epoch": 4026} {"train_loss": -6.833459854125977, "global_step": 169116, "epoch": 4026} {"train_loss": -6.987361907958984, "global_step": 169117, "epoch": 4026} {"train_loss": -6.821125030517578, "global_step": 169118, "epoch": 4026} {"train_loss": -7.019575119018555, "global_step": 169119, "epoch": 4026} {"train_loss": -6.868182182312012, "global_step": 169120, "epoch": 4026} {"train_loss": -6.892582893371582, "global_step": 169121, "epoch": 4026} {"train_loss": -6.8948283195495605, "global_step": 169122, "epoch": 4026} {"train_loss": -6.695125579833984, "global_step": 169123, "epoch": 4026} {"train_loss": -6.991668224334717, "global_step": 169124, "epoch": 4026} {"train_loss": -6.837071895599365, "global_step": 169125, "epoch": 4026} {"train_loss": -6.843229293823242, "global_step": 169126, "epoch": 4026} {"train_loss": -7.005701541900635, "global_step": 169127, "epoch": 4026} {"train_loss": -6.868071556091309, "global_step": 169128, "epoch": 4026} {"train_loss": -6.904483795166016, "global_step": 169129, "epoch": 4026} {"train_loss": -6.888854503631592, "global_step": 169130, "epoch": 4026} {"train_loss": -7.007594108581543, "global_step": 169131, "epoch": 4026} {"train_loss": -6.849733352661133, "global_step": 169132, "epoch": 4026} {"train_loss": -6.925982055209932, "global_step": 169133, "epoch": 4026, "val_loss": 80140.7265625} {"train_loss": -6.979516983032227, "global_step": 169134, "epoch": 4027} {"train_loss": -7.0358171463012695, "global_step": 169135, "epoch": 4027} {"train_loss": -6.905348300933838, "global_step": 169136, "epoch": 4027} {"train_loss": -6.863322734832764, "global_step": 169137, "epoch": 4027} {"train_loss": -7.029295921325684, "global_step": 169138, "epoch": 4027} {"train_loss": -6.986032485961914, "global_step": 169139, "epoch": 4027} {"train_loss": -7.079108715057373, "global_step": 169140, "epoch": 4027} {"train_loss": -6.989887237548828, "global_step": 169141, "epoch": 4027} {"train_loss": -6.985998630523682, "global_step": 169142, "epoch": 4027} {"train_loss": -7.092424392700195, "global_step": 169143, "epoch": 4027} {"train_loss": -6.9671478271484375, "global_step": 169144, "epoch": 4027} {"train_loss": -6.983299255371094, "global_step": 169145, "epoch": 4027} {"train_loss": -7.00732421875, "global_step": 169146, "epoch": 4027} {"train_loss": -7.079522132873535, "global_step": 169147, "epoch": 4027} {"train_loss": -7.100043296813965, "global_step": 169148, "epoch": 4027} {"train_loss": -7.057383060455322, "global_step": 169149, "epoch": 4027} {"train_loss": -7.037383079528809, "global_step": 169150, "epoch": 4027} {"train_loss": -6.9239020347595215, "global_step": 169151, "epoch": 4027} {"train_loss": -6.977888107299805, "global_step": 169152, "epoch": 4027} {"train_loss": -7.052949905395508, "global_step": 169153, "epoch": 4027} {"train_loss": -7.103648662567139, "global_step": 169154, "epoch": 4027} {"train_loss": -6.968283653259277, "global_step": 169155, "epoch": 4027} {"train_loss": -6.971210479736328, "global_step": 169156, "epoch": 4027} {"train_loss": -7.017731666564941, "global_step": 169157, "epoch": 4027} {"train_loss": -7.062040328979492, "global_step": 169158, "epoch": 4027} {"train_loss": -6.966670989990234, "global_step": 169159, "epoch": 4027} {"train_loss": -6.90179967880249, "global_step": 169160, "epoch": 4027} {"train_loss": -6.962861061096191, "global_step": 169161, "epoch": 4027} {"train_loss": -6.913188934326172, "global_step": 169162, "epoch": 4027} {"train_loss": -6.936083793640137, "global_step": 169163, "epoch": 4027} {"train_loss": -7.044877052307129, "global_step": 169164, "epoch": 4027} {"train_loss": -6.974700927734375, "global_step": 169165, "epoch": 4027} {"train_loss": -6.789340496063232, "global_step": 169166, "epoch": 4027} {"train_loss": -7.043880462646484, "global_step": 169167, "epoch": 4027} {"train_loss": -6.828925132751465, "global_step": 169168, "epoch": 4027} {"train_loss": -7.047571182250977, "global_step": 169169, "epoch": 4027} {"train_loss": -7.083694934844971, "global_step": 169170, "epoch": 4027} {"train_loss": -6.960416793823242, "global_step": 169171, "epoch": 4027} {"train_loss": -7.0279974937438965, "global_step": 169172, "epoch": 4027} {"train_loss": -6.824069499969482, "global_step": 169173, "epoch": 4027} {"train_loss": -6.909337043762207, "global_step": 169174, "epoch": 4027} {"train_loss": -6.987379244395664, "global_step": 169175, "epoch": 4027, "val_loss": 79848.0} {"train_loss": -6.7810468673706055, "global_step": 169176, "epoch": 4028} {"train_loss": -6.913496494293213, "global_step": 169177, "epoch": 4028} {"train_loss": -6.969454765319824, "global_step": 169178, "epoch": 4028} {"train_loss": -6.9830780029296875, "global_step": 169179, "epoch": 4028} {"train_loss": -7.096439361572266, "global_step": 169180, "epoch": 4028} {"train_loss": -7.064731597900391, "global_step": 169181, "epoch": 4028} {"train_loss": -6.9788384437561035, "global_step": 169182, "epoch": 4028} {"train_loss": -7.072216510772705, "global_step": 169183, "epoch": 4028} {"train_loss": -7.119126319885254, "global_step": 169184, "epoch": 4028} {"train_loss": -7.005311012268066, "global_step": 169185, "epoch": 4028} {"train_loss": -7.0814433097839355, "global_step": 169186, "epoch": 4028} {"train_loss": -7.0041279792785645, "global_step": 169187, "epoch": 4028} {"train_loss": -7.058119297027588, "global_step": 169188, "epoch": 4028} {"train_loss": -7.063423156738281, "global_step": 169189, "epoch": 4028} {"train_loss": -7.156642913818359, "global_step": 169190, "epoch": 4028} {"train_loss": -6.967395782470703, "global_step": 169191, "epoch": 4028} {"train_loss": -6.974053859710693, "global_step": 169192, "epoch": 4028} {"train_loss": -7.066238880157471, "global_step": 169193, "epoch": 4028} {"train_loss": -7.023255348205566, "global_step": 169194, "epoch": 4028} {"train_loss": -7.086849212646484, "global_step": 169195, "epoch": 4028} {"train_loss": -7.1002044677734375, "global_step": 169196, "epoch": 4028} {"train_loss": -7.071050643920898, "global_step": 169197, "epoch": 4028} {"train_loss": -7.132988929748535, "global_step": 169198, "epoch": 4028} {"train_loss": -6.9909868240356445, "global_step": 169199, "epoch": 4028} {"train_loss": -7.043485641479492, "global_step": 169200, "epoch": 4028} {"train_loss": -6.981839179992676, "global_step": 169201, "epoch": 4028} {"train_loss": -6.892369270324707, "global_step": 169202, "epoch": 4028} {"train_loss": -6.9885149002075195, "global_step": 169203, "epoch": 4028} {"train_loss": -7.081358909606934, "global_step": 169204, "epoch": 4028} {"train_loss": -7.0140180587768555, "global_step": 169205, "epoch": 4028} {"train_loss": -7.14818000793457, "global_step": 169206, "epoch": 4028} {"train_loss": -7.041661262512207, "global_step": 169207, "epoch": 4028} {"train_loss": -7.005573272705078, "global_step": 169208, "epoch": 4028} {"train_loss": -7.095365524291992, "global_step": 169209, "epoch": 4028} {"train_loss": -7.108974456787109, "global_step": 169210, "epoch": 4028} {"train_loss": -7.012674331665039, "global_step": 169211, "epoch": 4028} {"train_loss": -7.031545639038086, "global_step": 169212, "epoch": 4028} {"train_loss": -7.085826396942139, "global_step": 169213, "epoch": 4028} {"train_loss": -6.984508514404297, "global_step": 169214, "epoch": 4028} {"train_loss": -7.02051305770874, "global_step": 169215, "epoch": 4028} {"train_loss": -6.962131500244141, "global_step": 169216, "epoch": 4028} {"train_loss": -7.029637359437489, "global_step": 169217, "epoch": 4028, "val_loss": 79668.4921875} {"train_loss": -7.14694356918335, "global_step": 169218, "epoch": 4029} {"train_loss": -7.100004196166992, "global_step": 169219, "epoch": 4029} {"train_loss": -7.07931661605835, "global_step": 169220, "epoch": 4029} {"train_loss": -7.15662145614624, "global_step": 169221, "epoch": 4029} {"train_loss": -7.067819595336914, "global_step": 169222, "epoch": 4029} {"train_loss": -7.040957927703857, "global_step": 169223, "epoch": 4029} {"train_loss": -7.040637016296387, "global_step": 169224, "epoch": 4029} {"train_loss": -6.95943546295166, "global_step": 169225, "epoch": 4029} {"train_loss": -7.025772571563721, "global_step": 169226, "epoch": 4029} {"train_loss": -6.987829208374023, "global_step": 169227, "epoch": 4029} {"train_loss": -7.1338419914245605, "global_step": 169228, "epoch": 4029} {"train_loss": -7.15117073059082, "global_step": 169229, "epoch": 4029} {"train_loss": -7.131198883056641, "global_step": 169230, "epoch": 4029} {"train_loss": -7.076269149780273, "global_step": 169231, "epoch": 4029} {"train_loss": -7.066885948181152, "global_step": 169232, "epoch": 4029} {"train_loss": -7.028360843658447, "global_step": 169233, "epoch": 4029} {"train_loss": -7.151749610900879, "global_step": 169234, "epoch": 4029} {"train_loss": -7.030785083770752, "global_step": 169235, "epoch": 4029} {"train_loss": -7.105050086975098, "global_step": 169236, "epoch": 4029} {"train_loss": -7.101799964904785, "global_step": 169237, "epoch": 4029} {"train_loss": -7.025206089019775, "global_step": 169238, "epoch": 4029} {"train_loss": -7.075272560119629, "global_step": 169239, "epoch": 4029} {"train_loss": -7.045900821685791, "global_step": 169240, "epoch": 4029} {"train_loss": -7.00770378112793, "global_step": 169241, "epoch": 4029} {"train_loss": -7.007474422454834, "global_step": 169242, "epoch": 4029} {"train_loss": -7.112636566162109, "global_step": 169243, "epoch": 4029} {"train_loss": -7.051350116729736, "global_step": 169244, "epoch": 4029} {"train_loss": -7.147503852844238, "global_step": 169245, "epoch": 4029} {"train_loss": -7.023446083068848, "global_step": 169246, "epoch": 4029} {"train_loss": -7.138172149658203, "global_step": 169247, "epoch": 4029} {"train_loss": -7.167474269866943, "global_step": 169248, "epoch": 4029} {"train_loss": -7.093741416931152, "global_step": 169249, "epoch": 4029} {"train_loss": -7.083719253540039, "global_step": 169250, "epoch": 4029} {"train_loss": -7.081089019775391, "global_step": 169251, "epoch": 4029} {"train_loss": -7.082903861999512, "global_step": 169252, "epoch": 4029} {"train_loss": -7.033977508544922, "global_step": 169253, "epoch": 4029} {"train_loss": -6.971444606781006, "global_step": 169254, "epoch": 4029} {"train_loss": -7.102235794067383, "global_step": 169255, "epoch": 4029} {"train_loss": -7.025922775268555, "global_step": 169256, "epoch": 4029} {"train_loss": -7.0759172439575195, "global_step": 169257, "epoch": 4029} {"train_loss": -6.956516265869141, "global_step": 169258, "epoch": 4029} {"train_loss": -7.0705447764623734, "global_step": 169259, "epoch": 4029, "val_loss": 79686.8203125} {"train_loss": -7.085516452789307, "global_step": 169260, "epoch": 4030} {"train_loss": -7.0258941650390625, "global_step": 169261, "epoch": 4030} {"train_loss": -7.11623477935791, "global_step": 169262, "epoch": 4030} {"train_loss": -7.052252769470215, "global_step": 169263, "epoch": 4030} {"train_loss": -7.036377906799316, "global_step": 169264, "epoch": 4030} {"train_loss": -7.0654168128967285, "global_step": 169265, "epoch": 4030} {"train_loss": -6.967432498931885, "global_step": 169266, "epoch": 4030} {"train_loss": -7.029031753540039, "global_step": 169267, "epoch": 4030} {"train_loss": -7.0518975257873535, "global_step": 169268, "epoch": 4030} {"train_loss": -7.064731597900391, "global_step": 169269, "epoch": 4030} {"train_loss": -7.095882892608643, "global_step": 169270, "epoch": 4030} {"train_loss": -7.105559825897217, "global_step": 169271, "epoch": 4030} {"train_loss": -6.9744672775268555, "global_step": 169272, "epoch": 4030} {"train_loss": -6.985000133514404, "global_step": 169273, "epoch": 4030} {"train_loss": -7.086825370788574, "global_step": 169274, "epoch": 4030} {"train_loss": -6.961742401123047, "global_step": 169275, "epoch": 4030} {"train_loss": -7.031769275665283, "global_step": 169276, "epoch": 4030} {"train_loss": -7.037675380706787, "global_step": 169277, "epoch": 4030} {"train_loss": -7.003827095031738, "global_step": 169278, "epoch": 4030} {"train_loss": -7.064970016479492, "global_step": 169279, "epoch": 4030} {"train_loss": -7.041498184204102, "global_step": 169280, "epoch": 4030} {"train_loss": -6.936450004577637, "global_step": 169281, "epoch": 4030} {"train_loss": -7.085158348083496, "global_step": 169282, "epoch": 4030} {"train_loss": -7.044649600982666, "global_step": 169283, "epoch": 4030} {"train_loss": -7.033705234527588, "global_step": 169284, "epoch": 4030} {"train_loss": -7.062294006347656, "global_step": 169285, "epoch": 4030} {"train_loss": -6.9961066246032715, "global_step": 169286, "epoch": 4030} {"train_loss": -7.073123931884766, "global_step": 169287, "epoch": 4030} {"train_loss": -7.106037139892578, "global_step": 169288, "epoch": 4030} {"train_loss": -7.141944408416748, "global_step": 169289, "epoch": 4030} {"train_loss": -7.160696983337402, "global_step": 169290, "epoch": 4030} {"train_loss": -7.03879451751709, "global_step": 169291, "epoch": 4030} {"train_loss": -6.982970714569092, "global_step": 169292, "epoch": 4030} {"train_loss": -7.039246559143066, "global_step": 169293, "epoch": 4030} {"train_loss": -7.051442623138428, "global_step": 169294, "epoch": 4030} {"train_loss": -7.175385475158691, "global_step": 169295, "epoch": 4030} {"train_loss": -7.011922836303711, "global_step": 169296, "epoch": 4030} {"train_loss": -7.086413383483887, "global_step": 169297, "epoch": 4030} {"train_loss": -6.998337745666504, "global_step": 169298, "epoch": 4030} {"train_loss": -7.131118297576904, "global_step": 169299, "epoch": 4030} {"train_loss": -7.051213264465332, "global_step": 169300, "epoch": 4030} {"train_loss": -7.050619261605399, "global_step": 169301, "epoch": 4030, "val_loss": 79939.6796875} {"train_loss": -7.079453468322754, "global_step": 169302, "epoch": 4031} {"train_loss": -6.973395824432373, "global_step": 169303, "epoch": 4031} {"train_loss": -7.137497901916504, "global_step": 169304, "epoch": 4031} {"train_loss": -7.026590347290039, "global_step": 169305, "epoch": 4031} {"train_loss": -7.009646415710449, "global_step": 169306, "epoch": 4031} {"train_loss": -7.019824028015137, "global_step": 169307, "epoch": 4031} {"train_loss": -7.06380558013916, "global_step": 169308, "epoch": 4031} {"train_loss": -6.9455084800720215, "global_step": 169309, "epoch": 4031} {"train_loss": -6.990394592285156, "global_step": 169310, "epoch": 4031} {"train_loss": -6.992597579956055, "global_step": 169311, "epoch": 4031} {"train_loss": -7.020105361938477, "global_step": 169312, "epoch": 4031} {"train_loss": -6.950202941894531, "global_step": 169313, "epoch": 4031} {"train_loss": -6.954133033752441, "global_step": 169314, "epoch": 4031} {"train_loss": -7.0839128494262695, "global_step": 169315, "epoch": 4031} {"train_loss": -6.983590126037598, "global_step": 169316, "epoch": 4031} {"train_loss": -7.078243732452393, "global_step": 169317, "epoch": 4031} {"train_loss": -6.98196268081665, "global_step": 169318, "epoch": 4031} {"train_loss": -7.017974853515625, "global_step": 169319, "epoch": 4031} {"train_loss": -6.996088027954102, "global_step": 169320, "epoch": 4031} {"train_loss": -7.035881996154785, "global_step": 169321, "epoch": 4031} {"train_loss": -6.925580024719238, "global_step": 169322, "epoch": 4031} {"train_loss": -7.050667762756348, "global_step": 169323, "epoch": 4031} {"train_loss": -7.027813911437988, "global_step": 169324, "epoch": 4031} {"train_loss": -6.938756942749023, "global_step": 169325, "epoch": 4031} {"train_loss": -7.036121368408203, "global_step": 169326, "epoch": 4031} {"train_loss": -6.910334587097168, "global_step": 169327, "epoch": 4031} {"train_loss": -6.922327518463135, "global_step": 169328, "epoch": 4031} {"train_loss": -7.000481605529785, "global_step": 169329, "epoch": 4031} {"train_loss": -7.040778160095215, "global_step": 169330, "epoch": 4031} {"train_loss": -7.02512264251709, "global_step": 169331, "epoch": 4031} {"train_loss": -6.966349124908447, "global_step": 169332, "epoch": 4031} {"train_loss": -7.13568639755249, "global_step": 169333, "epoch": 4031} {"train_loss": -6.957232475280762, "global_step": 169334, "epoch": 4031} {"train_loss": -6.972354888916016, "global_step": 169335, "epoch": 4031} {"train_loss": -7.032876014709473, "global_step": 169336, "epoch": 4031} {"train_loss": -6.867794990539551, "global_step": 169337, "epoch": 4031} {"train_loss": -7.009208679199219, "global_step": 169338, "epoch": 4031} {"train_loss": -6.944673538208008, "global_step": 169339, "epoch": 4031} {"train_loss": -6.975552558898926, "global_step": 169340, "epoch": 4031} {"train_loss": -6.985748291015625, "global_step": 169341, "epoch": 4031} {"train_loss": -6.901239395141602, "global_step": 169342, "epoch": 4031} {"train_loss": -7.0005565484364825, "global_step": 169343, "epoch": 4031, "val_loss": 79698.625} {"train_loss": -6.840747356414795, "global_step": 169344, "epoch": 4032} {"train_loss": -6.935145378112793, "global_step": 169345, "epoch": 4032} {"train_loss": -7.105449199676514, "global_step": 169346, "epoch": 4032} {"train_loss": -6.8532209396362305, "global_step": 169347, "epoch": 4032} {"train_loss": -7.096454620361328, "global_step": 169348, "epoch": 4032} {"train_loss": -6.880068778991699, "global_step": 169349, "epoch": 4032} {"train_loss": -6.949471473693848, "global_step": 169350, "epoch": 4032} {"train_loss": -7.083498001098633, "global_step": 169351, "epoch": 4032} {"train_loss": -7.01279354095459, "global_step": 169352, "epoch": 4032} {"train_loss": -7.082919597625732, "global_step": 169353, "epoch": 4032} {"train_loss": -7.031669616699219, "global_step": 169354, "epoch": 4032} {"train_loss": -6.936413288116455, "global_step": 169355, "epoch": 4032} {"train_loss": -6.932738304138184, "global_step": 169356, "epoch": 4032} {"train_loss": -7.07332706451416, "global_step": 169357, "epoch": 4032} {"train_loss": -7.136386871337891, "global_step": 169358, "epoch": 4032} {"train_loss": -6.889095306396484, "global_step": 169359, "epoch": 4032} {"train_loss": -7.092185020446777, "global_step": 169360, "epoch": 4032} {"train_loss": -7.0462751388549805, "global_step": 169361, "epoch": 4032} {"train_loss": -7.018763065338135, "global_step": 169362, "epoch": 4032} {"train_loss": -7.037771701812744, "global_step": 169363, "epoch": 4032} {"train_loss": -7.1336445808410645, "global_step": 169364, "epoch": 4032} {"train_loss": -7.085996150970459, "global_step": 169365, "epoch": 4032} {"train_loss": -6.993893146514893, "global_step": 169366, "epoch": 4032} {"train_loss": -7.088819980621338, "global_step": 169367, "epoch": 4032} {"train_loss": -7.091576099395752, "global_step": 169368, "epoch": 4032} {"train_loss": -7.064409255981445, "global_step": 169369, "epoch": 4032} {"train_loss": -7.169869422912598, "global_step": 169370, "epoch": 4032} {"train_loss": -7.047911643981934, "global_step": 169371, "epoch": 4032} {"train_loss": -7.034526824951172, "global_step": 169372, "epoch": 4032} {"train_loss": -7.021365165710449, "global_step": 169373, "epoch": 4032} {"train_loss": -7.114278793334961, "global_step": 169374, "epoch": 4032} {"train_loss": -7.139184951782227, "global_step": 169375, "epoch": 4032} {"train_loss": -7.123275279998779, "global_step": 169376, "epoch": 4032} {"train_loss": -7.060781955718994, "global_step": 169377, "epoch": 4032} {"train_loss": -7.1126298904418945, "global_step": 169378, "epoch": 4032} {"train_loss": -7.09409761428833, "global_step": 169379, "epoch": 4032} {"train_loss": -7.08211612701416, "global_step": 169380, "epoch": 4032} {"train_loss": -7.164078712463379, "global_step": 169381, "epoch": 4032} {"train_loss": -7.152679443359375, "global_step": 169382, "epoch": 4032} {"train_loss": -7.105806827545166, "global_step": 169383, "epoch": 4032} {"train_loss": -7.110452175140381, "global_step": 169384, "epoch": 4032} {"train_loss": -7.049702803293864, "global_step": 169385, "epoch": 4032, "val_loss": 79913.5078125} {"train_loss": -7.12733793258667, "global_step": 169386, "epoch": 4033} {"train_loss": -7.100534915924072, "global_step": 169387, "epoch": 4033} {"train_loss": -7.122030258178711, "global_step": 169388, "epoch": 4033} {"train_loss": -7.124483108520508, "global_step": 169389, "epoch": 4033} {"train_loss": -7.099794387817383, "global_step": 169390, "epoch": 4033} {"train_loss": -7.113051891326904, "global_step": 169391, "epoch": 4033} {"train_loss": -7.000421524047852, "global_step": 169392, "epoch": 4033} {"train_loss": -7.190993309020996, "global_step": 169393, "epoch": 4033} {"train_loss": -7.077504634857178, "global_step": 169394, "epoch": 4033} {"train_loss": -7.0898542404174805, "global_step": 169395, "epoch": 4033} {"train_loss": -6.9122209548950195, "global_step": 169396, "epoch": 4033} {"train_loss": -7.121649265289307, "global_step": 169397, "epoch": 4033} {"train_loss": -7.054882526397705, "global_step": 169398, "epoch": 4033} {"train_loss": -6.93697452545166, "global_step": 169399, "epoch": 4033} {"train_loss": -7.158485412597656, "global_step": 169400, "epoch": 4033} {"train_loss": -7.090768814086914, "global_step": 169401, "epoch": 4033} {"train_loss": -7.092754364013672, "global_step": 169402, "epoch": 4033} {"train_loss": -7.095968246459961, "global_step": 169403, "epoch": 4033} {"train_loss": -7.051342010498047, "global_step": 169404, "epoch": 4033} {"train_loss": -7.098873138427734, "global_step": 169405, "epoch": 4033} {"train_loss": -7.112493515014648, "global_step": 169406, "epoch": 4033} {"train_loss": -7.076335906982422, "global_step": 169407, "epoch": 4033} {"train_loss": -7.184755325317383, "global_step": 169408, "epoch": 4033} {"train_loss": -7.066678524017334, "global_step": 169409, "epoch": 4033} {"train_loss": -7.067019462585449, "global_step": 169410, "epoch": 4033} {"train_loss": -7.112512588500977, "global_step": 169411, "epoch": 4033} {"train_loss": -7.1137166023254395, "global_step": 169412, "epoch": 4033} {"train_loss": -6.996692657470703, "global_step": 169413, "epoch": 4033} {"train_loss": -7.147197723388672, "global_step": 169414, "epoch": 4033} {"train_loss": -7.012598514556885, "global_step": 169415, "epoch": 4033} {"train_loss": -7.087337017059326, "global_step": 169416, "epoch": 4033} {"train_loss": -7.117072582244873, "global_step": 169417, "epoch": 4033} {"train_loss": -6.990318298339844, "global_step": 169418, "epoch": 4033} {"train_loss": -7.025138854980469, "global_step": 169419, "epoch": 4033} {"train_loss": -7.134340286254883, "global_step": 169420, "epoch": 4033} {"train_loss": -7.022221565246582, "global_step": 169421, "epoch": 4033} {"train_loss": -6.983243942260742, "global_step": 169422, "epoch": 4033} {"train_loss": -6.810072898864746, "global_step": 169423, "epoch": 4033} {"train_loss": -7.095797538757324, "global_step": 169424, "epoch": 4033} {"train_loss": -6.948895454406738, "global_step": 169425, "epoch": 4033} {"train_loss": -6.956878662109375, "global_step": 169426, "epoch": 4033} {"train_loss": -7.064329181398664, "global_step": 169427, "epoch": 4033, "val_loss": 79887.390625} {"train_loss": -6.946242809295654, "global_step": 169428, "epoch": 4034} {"train_loss": -6.974546432495117, "global_step": 169429, "epoch": 4034} {"train_loss": -6.94491720199585, "global_step": 169430, "epoch": 4034} {"train_loss": -6.930990695953369, "global_step": 169431, "epoch": 4034} {"train_loss": -6.930075168609619, "global_step": 169432, "epoch": 4034} {"train_loss": -7.018105506896973, "global_step": 169433, "epoch": 4034} {"train_loss": -7.083982467651367, "global_step": 169434, "epoch": 4034} {"train_loss": -7.125502109527588, "global_step": 169435, "epoch": 4034} {"train_loss": -7.01312255859375, "global_step": 169436, "epoch": 4034} {"train_loss": -6.99021053314209, "global_step": 169437, "epoch": 4034} {"train_loss": -7.110690116882324, "global_step": 169438, "epoch": 4034} {"train_loss": -7.082458972930908, "global_step": 169439, "epoch": 4034} {"train_loss": -7.031027793884277, "global_step": 169440, "epoch": 4034} {"train_loss": -6.946015357971191, "global_step": 169441, "epoch": 4034} {"train_loss": -7.043522834777832, "global_step": 169442, "epoch": 4034} {"train_loss": -7.065887451171875, "global_step": 169443, "epoch": 4034} {"train_loss": -6.998756408691406, "global_step": 169444, "epoch": 4034} {"train_loss": -6.987873077392578, "global_step": 169445, "epoch": 4034} {"train_loss": -7.099666118621826, "global_step": 169446, "epoch": 4034} {"train_loss": -7.0632405281066895, "global_step": 169447, "epoch": 4034} {"train_loss": -7.071784019470215, "global_step": 169448, "epoch": 4034} {"train_loss": -7.130141258239746, "global_step": 169449, "epoch": 4034} {"train_loss": -6.9431352615356445, "global_step": 169450, "epoch": 4034} {"train_loss": -7.130643844604492, "global_step": 169451, "epoch": 4034} {"train_loss": -7.043133735656738, "global_step": 169452, "epoch": 4034} {"train_loss": -7.010626316070557, "global_step": 169453, "epoch": 4034} {"train_loss": -7.033140182495117, "global_step": 169454, "epoch": 4034} {"train_loss": -6.985770225524902, "global_step": 169455, "epoch": 4034} {"train_loss": -7.1007256507873535, "global_step": 169456, "epoch": 4034} {"train_loss": -7.1665449142456055, "global_step": 169457, "epoch": 4034} {"train_loss": -7.030697822570801, "global_step": 169458, "epoch": 4034} {"train_loss": -7.061105728149414, "global_step": 169459, "epoch": 4034} {"train_loss": -7.204917907714844, "global_step": 169460, "epoch": 4034} {"train_loss": -7.110755920410156, "global_step": 169461, "epoch": 4034} {"train_loss": -7.14631462097168, "global_step": 169462, "epoch": 4034} {"train_loss": -6.9794158935546875, "global_step": 169463, "epoch": 4034} {"train_loss": -7.075895309448242, "global_step": 169464, "epoch": 4034} {"train_loss": -6.996374607086182, "global_step": 169465, "epoch": 4034} {"train_loss": -7.086116790771484, "global_step": 169466, "epoch": 4034} {"train_loss": -6.983016014099121, "global_step": 169467, "epoch": 4034} {"train_loss": -7.088014125823975, "global_step": 169468, "epoch": 4034} {"train_loss": -7.044762656802223, "global_step": 169469, "epoch": 4034, "val_loss": 79960.625} {"train_loss": -7.005584716796875, "global_step": 169470, "epoch": 4035} {"train_loss": -6.974425792694092, "global_step": 169471, "epoch": 4035} {"train_loss": -7.04809045791626, "global_step": 169472, "epoch": 4035} {"train_loss": -6.97471809387207, "global_step": 169473, "epoch": 4035} {"train_loss": -7.05889892578125, "global_step": 169474, "epoch": 4035} {"train_loss": -7.02079439163208, "global_step": 169475, "epoch": 4035} {"train_loss": -7.0954790115356445, "global_step": 169476, "epoch": 4035} {"train_loss": -7.033934116363525, "global_step": 169477, "epoch": 4035} {"train_loss": -6.935575485229492, "global_step": 169478, "epoch": 4035} {"train_loss": -6.953739643096924, "global_step": 169479, "epoch": 4035} {"train_loss": -6.944446563720703, "global_step": 169480, "epoch": 4035} {"train_loss": -7.063570976257324, "global_step": 169481, "epoch": 4035} {"train_loss": -7.051210880279541, "global_step": 169482, "epoch": 4035} {"train_loss": -6.8657660484313965, "global_step": 169483, "epoch": 4035} {"train_loss": -7.101656436920166, "global_step": 169484, "epoch": 4035} {"train_loss": -7.038886070251465, "global_step": 169485, "epoch": 4035} {"train_loss": -7.057904243469238, "global_step": 169486, "epoch": 4035} {"train_loss": -7.0583977699279785, "global_step": 169487, "epoch": 4035} {"train_loss": -6.922604560852051, "global_step": 169488, "epoch": 4035} {"train_loss": -7.059786796569824, "global_step": 169489, "epoch": 4035} {"train_loss": -7.055664539337158, "global_step": 169490, "epoch": 4035} {"train_loss": -7.04884672164917, "global_step": 169491, "epoch": 4035} {"train_loss": -7.157565116882324, "global_step": 169492, "epoch": 4035} {"train_loss": -6.949483871459961, "global_step": 169493, "epoch": 4035} {"train_loss": -6.980441093444824, "global_step": 169494, "epoch": 4035} {"train_loss": -7.117270469665527, "global_step": 169495, "epoch": 4035} {"train_loss": -7.060751438140869, "global_step": 169496, "epoch": 4035} {"train_loss": -7.149888515472412, "global_step": 169497, "epoch": 4035} {"train_loss": -6.961348533630371, "global_step": 169498, "epoch": 4035} {"train_loss": -7.098606109619141, "global_step": 169499, "epoch": 4035} {"train_loss": -7.117711544036865, "global_step": 169500, "epoch": 4035} {"train_loss": -7.065742492675781, "global_step": 169501, "epoch": 4035} {"train_loss": -7.048358917236328, "global_step": 169502, "epoch": 4035} {"train_loss": -7.049552917480469, "global_step": 169503, "epoch": 4035} {"train_loss": -7.073019504547119, "global_step": 169504, "epoch": 4035} {"train_loss": -7.087265968322754, "global_step": 169505, "epoch": 4035} {"train_loss": -7.103118419647217, "global_step": 169506, "epoch": 4035} {"train_loss": -7.041089057922363, "global_step": 169507, "epoch": 4035} {"train_loss": -6.943460464477539, "global_step": 169508, "epoch": 4035} {"train_loss": -6.917625427246094, "global_step": 169509, "epoch": 4035} {"train_loss": -6.952226161956787, "global_step": 169510, "epoch": 4035} {"train_loss": -7.029725835436866, "global_step": 169511, "epoch": 4035, "val_loss": 79612.21875} {"train_loss": -6.932326316833496, "global_step": 169512, "epoch": 4036} {"train_loss": -7.004749774932861, "global_step": 169513, "epoch": 4036} {"train_loss": -7.050365447998047, "global_step": 169514, "epoch": 4036} {"train_loss": -6.940515518188477, "global_step": 169515, "epoch": 4036} {"train_loss": -7.029062271118164, "global_step": 169516, "epoch": 4036} {"train_loss": -6.968278408050537, "global_step": 169517, "epoch": 4036} {"train_loss": -6.957073211669922, "global_step": 169518, "epoch": 4036} {"train_loss": -7.073214530944824, "global_step": 169519, "epoch": 4036} {"train_loss": -6.955780982971191, "global_step": 169520, "epoch": 4036} {"train_loss": -6.995682239532471, "global_step": 169521, "epoch": 4036} {"train_loss": -7.081939697265625, "global_step": 169522, "epoch": 4036} {"train_loss": -7.099362373352051, "global_step": 169523, "epoch": 4036} {"train_loss": -7.028051376342773, "global_step": 169524, "epoch": 4036} {"train_loss": -7.068525314331055, "global_step": 169525, "epoch": 4036} {"train_loss": -7.063541889190674, "global_step": 169526, "epoch": 4036} {"train_loss": -7.0079345703125, "global_step": 169527, "epoch": 4036} {"train_loss": -7.008490562438965, "global_step": 169528, "epoch": 4036} {"train_loss": -7.049069404602051, "global_step": 169529, "epoch": 4036} {"train_loss": -7.2273149490356445, "global_step": 169530, "epoch": 4036} {"train_loss": -6.972128868103027, "global_step": 169531, "epoch": 4036} {"train_loss": -7.113349914550781, "global_step": 169532, "epoch": 4036} {"train_loss": -7.069907188415527, "global_step": 169533, "epoch": 4036} {"train_loss": -7.040308952331543, "global_step": 169534, "epoch": 4036} {"train_loss": -6.993952751159668, "global_step": 169535, "epoch": 4036} {"train_loss": -7.095198631286621, "global_step": 169536, "epoch": 4036} {"train_loss": -7.0001935958862305, "global_step": 169537, "epoch": 4036} {"train_loss": -7.089746952056885, "global_step": 169538, "epoch": 4036} {"train_loss": -7.0073981285095215, "global_step": 169539, "epoch": 4036} {"train_loss": -7.044875144958496, "global_step": 169540, "epoch": 4036} {"train_loss": -6.965762615203857, "global_step": 169541, "epoch": 4036} {"train_loss": -7.02200984954834, "global_step": 169542, "epoch": 4036} {"train_loss": -6.928977966308594, "global_step": 169543, "epoch": 4036} {"train_loss": -7.061025619506836, "global_step": 169544, "epoch": 4036} {"train_loss": -7.063222408294678, "global_step": 169545, "epoch": 4036} {"train_loss": -7.056494235992432, "global_step": 169546, "epoch": 4036} {"train_loss": -7.018710136413574, "global_step": 169547, "epoch": 4036} {"train_loss": -7.047952651977539, "global_step": 169548, "epoch": 4036} {"train_loss": -7.138879776000977, "global_step": 169549, "epoch": 4036} {"train_loss": -7.204651832580566, "global_step": 169550, "epoch": 4036} {"train_loss": -7.109492301940918, "global_step": 169551, "epoch": 4036} {"train_loss": -7.048025608062744, "global_step": 169552, "epoch": 4036} {"train_loss": -7.040462130591983, "global_step": 169553, "epoch": 4036, "val_loss": 79814.7421875} {"train_loss": -7.146113872528076, "global_step": 169554, "epoch": 4037} {"train_loss": -7.073694229125977, "global_step": 169555, "epoch": 4037} {"train_loss": -6.968991279602051, "global_step": 169556, "epoch": 4037} {"train_loss": -6.932840347290039, "global_step": 169557, "epoch": 4037} {"train_loss": -6.921414375305176, "global_step": 169558, "epoch": 4037} {"train_loss": -7.055960655212402, "global_step": 169559, "epoch": 4037} {"train_loss": -7.033876419067383, "global_step": 169560, "epoch": 4037} {"train_loss": -7.100111484527588, "global_step": 169561, "epoch": 4037} {"train_loss": -7.050819396972656, "global_step": 169562, "epoch": 4037} {"train_loss": -7.0328240394592285, "global_step": 169563, "epoch": 4037} {"train_loss": -7.002889633178711, "global_step": 169564, "epoch": 4037} {"train_loss": -7.0924882888793945, "global_step": 169565, "epoch": 4037} {"train_loss": -7.066995620727539, "global_step": 169566, "epoch": 4037} {"train_loss": -7.140108108520508, "global_step": 169567, "epoch": 4037} {"train_loss": -7.0341572761535645, "global_step": 169568, "epoch": 4037} {"train_loss": -7.0500407218933105, "global_step": 169569, "epoch": 4037} {"train_loss": -7.120309829711914, "global_step": 169570, "epoch": 4037} {"train_loss": -7.121510982513428, "global_step": 169571, "epoch": 4037} {"train_loss": -7.028963088989258, "global_step": 169572, "epoch": 4037} {"train_loss": -7.046623229980469, "global_step": 169573, "epoch": 4037} {"train_loss": -7.07148551940918, "global_step": 169574, "epoch": 4037} {"train_loss": -7.084775924682617, "global_step": 169575, "epoch": 4037} {"train_loss": -7.177663803100586, "global_step": 169576, "epoch": 4037} {"train_loss": -7.090793609619141, "global_step": 169577, "epoch": 4037} {"train_loss": -6.961549758911133, "global_step": 169578, "epoch": 4037} {"train_loss": -7.123948097229004, "global_step": 169579, "epoch": 4037} {"train_loss": -7.094048500061035, "global_step": 169580, "epoch": 4037} {"train_loss": -7.129865646362305, "global_step": 169581, "epoch": 4037} {"train_loss": -7.044881820678711, "global_step": 169582, "epoch": 4037} {"train_loss": -7.058086395263672, "global_step": 169583, "epoch": 4037} {"train_loss": -7.040966033935547, "global_step": 169584, "epoch": 4037} {"train_loss": -7.027517318725586, "global_step": 169585, "epoch": 4037} {"train_loss": -7.023898601531982, "global_step": 169586, "epoch": 4037} {"train_loss": -6.901189804077148, "global_step": 169587, "epoch": 4037} {"train_loss": -6.941469669342041, "global_step": 169588, "epoch": 4037} {"train_loss": -6.9608564376831055, "global_step": 169589, "epoch": 4037} {"train_loss": -6.910916805267334, "global_step": 169590, "epoch": 4037} {"train_loss": -6.940589904785156, "global_step": 169591, "epoch": 4037} {"train_loss": -7.059076309204102, "global_step": 169592, "epoch": 4037} {"train_loss": -7.096742630004883, "global_step": 169593, "epoch": 4037} {"train_loss": -6.930377006530762, "global_step": 169594, "epoch": 4037} {"train_loss": -7.039399237859817, "global_step": 169595, "epoch": 4037, "val_loss": 79825.0} {"train_loss": -7.061300277709961, "global_step": 169596, "epoch": 4038} {"train_loss": -6.956980228424072, "global_step": 169597, "epoch": 4038} {"train_loss": -7.04086971282959, "global_step": 169598, "epoch": 4038} {"train_loss": -7.079259872436523, "global_step": 169599, "epoch": 4038} {"train_loss": -7.068676471710205, "global_step": 169600, "epoch": 4038} {"train_loss": -7.013934135437012, "global_step": 169601, "epoch": 4038} {"train_loss": -6.853943824768066, "global_step": 169602, "epoch": 4038} {"train_loss": -7.108987331390381, "global_step": 169603, "epoch": 4038} {"train_loss": -6.953848838806152, "global_step": 169604, "epoch": 4038} {"train_loss": -7.074373245239258, "global_step": 169605, "epoch": 4038} {"train_loss": -7.064914703369141, "global_step": 169606, "epoch": 4038} {"train_loss": -7.0083770751953125, "global_step": 169607, "epoch": 4038} {"train_loss": -6.915919303894043, "global_step": 169608, "epoch": 4038} {"train_loss": -7.055290222167969, "global_step": 169609, "epoch": 4038} {"train_loss": -6.917356967926025, "global_step": 169610, "epoch": 4038} {"train_loss": -7.0959062576293945, "global_step": 169611, "epoch": 4038} {"train_loss": -6.927781105041504, "global_step": 169612, "epoch": 4038} {"train_loss": -6.971156120300293, "global_step": 169613, "epoch": 4038} {"train_loss": -6.991306781768799, "global_step": 169614, "epoch": 4038} {"train_loss": -7.100758075714111, "global_step": 169615, "epoch": 4038} {"train_loss": -6.986886978149414, "global_step": 169616, "epoch": 4038} {"train_loss": -7.037891864776611, "global_step": 169617, "epoch": 4038} {"train_loss": -6.969177722930908, "global_step": 169618, "epoch": 4038} {"train_loss": -6.9652099609375, "global_step": 169619, "epoch": 4038} {"train_loss": -7.168430328369141, "global_step": 169620, "epoch": 4038} {"train_loss": -7.05791711807251, "global_step": 169621, "epoch": 4038} {"train_loss": -6.876534938812256, "global_step": 169622, "epoch": 4038} {"train_loss": -7.021132469177246, "global_step": 169623, "epoch": 4038} {"train_loss": -7.102631568908691, "global_step": 169624, "epoch": 4038} {"train_loss": -7.0298004150390625, "global_step": 169625, "epoch": 4038} {"train_loss": -7.016507148742676, "global_step": 169626, "epoch": 4038} {"train_loss": -6.962259769439697, "global_step": 169627, "epoch": 4038} {"train_loss": -7.013981819152832, "global_step": 169628, "epoch": 4038} {"train_loss": -6.985502243041992, "global_step": 169629, "epoch": 4038} {"train_loss": -6.985065460205078, "global_step": 169630, "epoch": 4038} {"train_loss": -6.885433197021484, "global_step": 169631, "epoch": 4038} {"train_loss": -7.067890167236328, "global_step": 169632, "epoch": 4038} {"train_loss": -6.96948766708374, "global_step": 169633, "epoch": 4038} {"train_loss": -7.0412774085998535, "global_step": 169634, "epoch": 4038} {"train_loss": -7.034265995025635, "global_step": 169635, "epoch": 4038} {"train_loss": -7.084567070007324, "global_step": 169636, "epoch": 4038} {"train_loss": -7.0129549616859075, "global_step": 169637, "epoch": 4038, "val_loss": 79977.609375} {"train_loss": -7.125205039978027, "global_step": 169638, "epoch": 4039} {"train_loss": -7.079853534698486, "global_step": 169639, "epoch": 4039} {"train_loss": -6.997861862182617, "global_step": 169640, "epoch": 4039} {"train_loss": -7.079087257385254, "global_step": 169641, "epoch": 4039} {"train_loss": -7.185256481170654, "global_step": 169642, "epoch": 4039} {"train_loss": -7.001372337341309, "global_step": 169643, "epoch": 4039} {"train_loss": -7.03169059753418, "global_step": 169644, "epoch": 4039} {"train_loss": -7.059573173522949, "global_step": 169645, "epoch": 4039} {"train_loss": -7.025435447692871, "global_step": 169646, "epoch": 4039} {"train_loss": -7.099401950836182, "global_step": 169647, "epoch": 4039} {"train_loss": -7.080379962921143, "global_step": 169648, "epoch": 4039} {"train_loss": -7.106215000152588, "global_step": 169649, "epoch": 4039} {"train_loss": -7.130285263061523, "global_step": 169650, "epoch": 4039} {"train_loss": -7.014482021331787, "global_step": 169651, "epoch": 4039} {"train_loss": -7.05755615234375, "global_step": 169652, "epoch": 4039} {"train_loss": -7.064234733581543, "global_step": 169653, "epoch": 4039} {"train_loss": -7.0957207679748535, "global_step": 169654, "epoch": 4039} {"train_loss": -7.058966159820557, "global_step": 169655, "epoch": 4039} {"train_loss": -7.1049346923828125, "global_step": 169656, "epoch": 4039} {"train_loss": -7.13226842880249, "global_step": 169657, "epoch": 4039} {"train_loss": -7.109518051147461, "global_step": 169658, "epoch": 4039} {"train_loss": -7.1094970703125, "global_step": 169659, "epoch": 4039} {"train_loss": -6.958277702331543, "global_step": 169660, "epoch": 4039} {"train_loss": -7.068704128265381, "global_step": 169661, "epoch": 4039} {"train_loss": -7.155903339385986, "global_step": 169662, "epoch": 4039} {"train_loss": -7.073634147644043, "global_step": 169663, "epoch": 4039} {"train_loss": -7.12700080871582, "global_step": 169664, "epoch": 4039} {"train_loss": -7.12336540222168, "global_step": 169665, "epoch": 4039} {"train_loss": -7.096902370452881, "global_step": 169666, "epoch": 4039} {"train_loss": -7.004457473754883, "global_step": 169667, "epoch": 4039} {"train_loss": -7.253483772277832, "global_step": 169668, "epoch": 4039} {"train_loss": -7.072185516357422, "global_step": 169669, "epoch": 4039} {"train_loss": -6.989306449890137, "global_step": 169670, "epoch": 4039} {"train_loss": -7.0519537925720215, "global_step": 169671, "epoch": 4039} {"train_loss": -6.957130432128906, "global_step": 169672, "epoch": 4039} {"train_loss": -7.137950897216797, "global_step": 169673, "epoch": 4039} {"train_loss": -7.057612419128418, "global_step": 169674, "epoch": 4039} {"train_loss": -7.09423828125, "global_step": 169675, "epoch": 4039} {"train_loss": -7.035816192626953, "global_step": 169676, "epoch": 4039} {"train_loss": -7.212636470794678, "global_step": 169677, "epoch": 4039} {"train_loss": -7.0700602531433105, "global_step": 169678, "epoch": 4039} {"train_loss": -7.0791396867661245, "global_step": 169679, "epoch": 4039, "val_loss": 79914.3671875} {"train_loss": -7.001550674438477, "global_step": 169680, "epoch": 4040} {"train_loss": -7.126775741577148, "global_step": 169681, "epoch": 4040} {"train_loss": -7.147938251495361, "global_step": 169682, "epoch": 4040} {"train_loss": -7.0841522216796875, "global_step": 169683, "epoch": 4040} {"train_loss": -7.079644680023193, "global_step": 169684, "epoch": 4040} {"train_loss": -7.147439002990723, "global_step": 169685, "epoch": 4040} {"train_loss": -6.9828009605407715, "global_step": 169686, "epoch": 4040} {"train_loss": -7.046459197998047, "global_step": 169687, "epoch": 4040} {"train_loss": -7.009565353393555, "global_step": 169688, "epoch": 4040} {"train_loss": -7.041045188903809, "global_step": 169689, "epoch": 4040} {"train_loss": -7.016922950744629, "global_step": 169690, "epoch": 4040} {"train_loss": -7.109128952026367, "global_step": 169691, "epoch": 4040} {"train_loss": -6.906041145324707, "global_step": 169692, "epoch": 4040} {"train_loss": -6.788322448730469, "global_step": 169693, "epoch": 4040} {"train_loss": -7.03505277633667, "global_step": 169694, "epoch": 4040} {"train_loss": -6.945202827453613, "global_step": 169695, "epoch": 4040} {"train_loss": -6.806277751922607, "global_step": 169696, "epoch": 4040} {"train_loss": -6.990406036376953, "global_step": 169697, "epoch": 4040} {"train_loss": -6.722766876220703, "global_step": 169698, "epoch": 4040} {"train_loss": -6.992729663848877, "global_step": 169699, "epoch": 4040} {"train_loss": -6.980018615722656, "global_step": 169700, "epoch": 4040} {"train_loss": -6.927280902862549, "global_step": 169701, "epoch": 4040} {"train_loss": -7.041586399078369, "global_step": 169702, "epoch": 4040} {"train_loss": -6.902807712554932, "global_step": 169703, "epoch": 4040} {"train_loss": -6.8904218673706055, "global_step": 169704, "epoch": 4040} {"train_loss": -6.858009338378906, "global_step": 169705, "epoch": 4040} {"train_loss": -6.888948440551758, "global_step": 169706, "epoch": 4040} {"train_loss": -6.924064636230469, "global_step": 169707, "epoch": 4040} {"train_loss": -6.968163013458252, "global_step": 169708, "epoch": 4040} {"train_loss": -6.871911525726318, "global_step": 169709, "epoch": 4040} {"train_loss": -6.90627384185791, "global_step": 169710, "epoch": 4040} {"train_loss": -7.087260723114014, "global_step": 169711, "epoch": 4040} {"train_loss": -6.927338600158691, "global_step": 169712, "epoch": 4040} {"train_loss": -6.989480018615723, "global_step": 169713, "epoch": 4040} {"train_loss": -6.951631546020508, "global_step": 169714, "epoch": 4040} {"train_loss": -6.9412407875061035, "global_step": 169715, "epoch": 4040} {"train_loss": -7.013895511627197, "global_step": 169716, "epoch": 4040} {"train_loss": -6.999682426452637, "global_step": 169717, "epoch": 4040} {"train_loss": -6.988968849182129, "global_step": 169718, "epoch": 4040} {"train_loss": -7.164303779602051, "global_step": 169719, "epoch": 4040} {"train_loss": -7.043516159057617, "global_step": 169720, "epoch": 4040} {"train_loss": -6.9838914303552535, "global_step": 169721, "epoch": 4040, "val_loss": 79910.0078125} {"train_loss": -7.074172019958496, "global_step": 169722, "epoch": 4041} {"train_loss": -7.050262451171875, "global_step": 169723, "epoch": 4041} {"train_loss": -7.07139778137207, "global_step": 169724, "epoch": 4041} {"train_loss": -7.159944534301758, "global_step": 169725, "epoch": 4041} {"train_loss": -7.14512825012207, "global_step": 169726, "epoch": 4041} {"train_loss": -7.002431869506836, "global_step": 169727, "epoch": 4041} {"train_loss": -7.138594150543213, "global_step": 169728, "epoch": 4041} {"train_loss": -7.148869514465332, "global_step": 169729, "epoch": 4041} {"train_loss": -7.055049419403076, "global_step": 169730, "epoch": 4041} {"train_loss": -7.045384883880615, "global_step": 169731, "epoch": 4041} {"train_loss": -7.112915992736816, "global_step": 169732, "epoch": 4041} {"train_loss": -7.022817611694336, "global_step": 169733, "epoch": 4041} {"train_loss": -7.042752742767334, "global_step": 169734, "epoch": 4041} {"train_loss": -7.040614128112793, "global_step": 169735, "epoch": 4041} {"train_loss": -6.874706268310547, "global_step": 169736, "epoch": 4041} {"train_loss": -7.06507682800293, "global_step": 169737, "epoch": 4041} {"train_loss": -7.063314437866211, "global_step": 169738, "epoch": 4041} {"train_loss": -6.976682186126709, "global_step": 169739, "epoch": 4041} {"train_loss": -7.009690761566162, "global_step": 169740, "epoch": 4041} {"train_loss": -7.0458245277404785, "global_step": 169741, "epoch": 4041} {"train_loss": -7.005992889404297, "global_step": 169742, "epoch": 4041} {"train_loss": -7.051159858703613, "global_step": 169743, "epoch": 4041} {"train_loss": -7.033683776855469, "global_step": 169744, "epoch": 4041} {"train_loss": -6.963010311126709, "global_step": 169745, "epoch": 4041} {"train_loss": -7.057509899139404, "global_step": 169746, "epoch": 4041} {"train_loss": -7.076043605804443, "global_step": 169747, "epoch": 4041} {"train_loss": -6.9547014236450195, "global_step": 169748, "epoch": 4041} {"train_loss": -7.005242347717285, "global_step": 169749, "epoch": 4041} {"train_loss": -7.09657096862793, "global_step": 169750, "epoch": 4041} {"train_loss": -6.947611331939697, "global_step": 169751, "epoch": 4041} {"train_loss": -7.079843521118164, "global_step": 169752, "epoch": 4041} {"train_loss": -7.07267951965332, "global_step": 169753, "epoch": 4041} {"train_loss": -7.034538269042969, "global_step": 169754, "epoch": 4041} {"train_loss": -6.986273765563965, "global_step": 169755, "epoch": 4041} {"train_loss": -7.099696159362793, "global_step": 169756, "epoch": 4041} {"train_loss": -6.944638729095459, "global_step": 169757, "epoch": 4041} {"train_loss": -7.128868579864502, "global_step": 169758, "epoch": 4041} {"train_loss": -6.996829032897949, "global_step": 169759, "epoch": 4041} {"train_loss": -7.091867923736572, "global_step": 169760, "epoch": 4041} {"train_loss": -7.007130146026611, "global_step": 169761, "epoch": 4041} {"train_loss": -7.005875587463379, "global_step": 169762, "epoch": 4041} {"train_loss": -7.045043423062279, "global_step": 169763, "epoch": 4041, "val_loss": 79804.4453125} {"train_loss": -6.945282459259033, "global_step": 169764, "epoch": 4042} {"train_loss": -7.064138412475586, "global_step": 169765, "epoch": 4042} {"train_loss": -7.093279838562012, "global_step": 169766, "epoch": 4042} {"train_loss": -7.053554534912109, "global_step": 169767, "epoch": 4042} {"train_loss": -6.985492706298828, "global_step": 169768, "epoch": 4042} {"train_loss": -7.125334739685059, "global_step": 169769, "epoch": 4042} {"train_loss": -7.181833267211914, "global_step": 169770, "epoch": 4042} {"train_loss": -7.028601169586182, "global_step": 169771, "epoch": 4042} {"train_loss": -7.181341171264648, "global_step": 169772, "epoch": 4042} {"train_loss": -7.113640785217285, "global_step": 169773, "epoch": 4042} {"train_loss": -7.028873920440674, "global_step": 169774, "epoch": 4042} {"train_loss": -7.1179046630859375, "global_step": 169775, "epoch": 4042} {"train_loss": -7.147216320037842, "global_step": 169776, "epoch": 4042} {"train_loss": -7.058955192565918, "global_step": 169777, "epoch": 4042} {"train_loss": -7.127622604370117, "global_step": 169778, "epoch": 4042} {"train_loss": -7.064509391784668, "global_step": 169779, "epoch": 4042} {"train_loss": -7.149974822998047, "global_step": 169780, "epoch": 4042} {"train_loss": -7.015475749969482, "global_step": 169781, "epoch": 4042} {"train_loss": -7.133095741271973, "global_step": 169782, "epoch": 4042} {"train_loss": -7.134557723999023, "global_step": 169783, "epoch": 4042} {"train_loss": -7.087087631225586, "global_step": 169784, "epoch": 4042} {"train_loss": -7.005847930908203, "global_step": 169785, "epoch": 4042} {"train_loss": -6.965712547302246, "global_step": 169786, "epoch": 4042} {"train_loss": -7.072675704956055, "global_step": 169787, "epoch": 4042} {"train_loss": -6.958743095397949, "global_step": 169788, "epoch": 4042} {"train_loss": -7.110414028167725, "global_step": 169789, "epoch": 4042} {"train_loss": -6.9937825202941895, "global_step": 169790, "epoch": 4042} {"train_loss": -7.020906448364258, "global_step": 169791, "epoch": 4042} {"train_loss": -7.0868916511535645, "global_step": 169792, "epoch": 4042} {"train_loss": -7.023403167724609, "global_step": 169793, "epoch": 4042} {"train_loss": -6.916861057281494, "global_step": 169794, "epoch": 4042} {"train_loss": -7.035543918609619, "global_step": 169795, "epoch": 4042} {"train_loss": -7.157194137573242, "global_step": 169796, "epoch": 4042} {"train_loss": -6.984713077545166, "global_step": 169797, "epoch": 4042} {"train_loss": -7.080264091491699, "global_step": 169798, "epoch": 4042} {"train_loss": -6.921293258666992, "global_step": 169799, "epoch": 4042} {"train_loss": -7.063194274902344, "global_step": 169800, "epoch": 4042} {"train_loss": -7.084499359130859, "global_step": 169801, "epoch": 4042} {"train_loss": -7.205069541931152, "global_step": 169802, "epoch": 4042} {"train_loss": -6.984598159790039, "global_step": 169803, "epoch": 4042} {"train_loss": -7.065338611602783, "global_step": 169804, "epoch": 4042} {"train_loss": -7.063888220559983, "global_step": 169805, "epoch": 4042, "val_loss": 79985.078125} {"train_loss": -6.9547858238220215, "global_step": 169806, "epoch": 4043} {"train_loss": -7.047423362731934, "global_step": 169807, "epoch": 4043} {"train_loss": -7.050967216491699, "global_step": 169808, "epoch": 4043} {"train_loss": -7.03907585144043, "global_step": 169809, "epoch": 4043} {"train_loss": -7.059413909912109, "global_step": 169810, "epoch": 4043} {"train_loss": -6.873384475708008, "global_step": 169811, "epoch": 4043} {"train_loss": -6.950871467590332, "global_step": 169812, "epoch": 4043} {"train_loss": -7.098799705505371, "global_step": 169813, "epoch": 4043} {"train_loss": -7.031784534454346, "global_step": 169814, "epoch": 4043} {"train_loss": -6.965332508087158, "global_step": 169815, "epoch": 4043} {"train_loss": -7.1110382080078125, "global_step": 169816, "epoch": 4043} {"train_loss": -6.944387912750244, "global_step": 169817, "epoch": 4043} {"train_loss": -7.014304161071777, "global_step": 169818, "epoch": 4043} {"train_loss": -7.073759078979492, "global_step": 169819, "epoch": 4043} {"train_loss": -7.1474385261535645, "global_step": 169820, "epoch": 4043} {"train_loss": -6.998166084289551, "global_step": 169821, "epoch": 4043} {"train_loss": -7.127056121826172, "global_step": 169822, "epoch": 4043} {"train_loss": -7.0540690422058105, "global_step": 169823, "epoch": 4043} {"train_loss": -6.966372966766357, "global_step": 169824, "epoch": 4043} {"train_loss": -7.147851943969727, "global_step": 169825, "epoch": 4043} {"train_loss": -7.058531761169434, "global_step": 169826, "epoch": 4043} {"train_loss": -7.046726703643799, "global_step": 169827, "epoch": 4043} {"train_loss": -7.063547134399414, "global_step": 169828, "epoch": 4043} {"train_loss": -7.062875270843506, "global_step": 169829, "epoch": 4043} {"train_loss": -7.203638076782227, "global_step": 169830, "epoch": 4043} {"train_loss": -7.001679420471191, "global_step": 169831, "epoch": 4043} {"train_loss": -7.052582740783691, "global_step": 169832, "epoch": 4043} {"train_loss": -6.992152214050293, "global_step": 169833, "epoch": 4043} {"train_loss": -7.19951057434082, "global_step": 169834, "epoch": 4043} {"train_loss": -7.071437358856201, "global_step": 169835, "epoch": 4043} {"train_loss": -7.042195796966553, "global_step": 169836, "epoch": 4043} {"train_loss": -6.921159267425537, "global_step": 169837, "epoch": 4043} {"train_loss": -6.980965614318848, "global_step": 169838, "epoch": 4043} {"train_loss": -7.1086883544921875, "global_step": 169839, "epoch": 4043} {"train_loss": -6.971915245056152, "global_step": 169840, "epoch": 4043} {"train_loss": -7.092467784881592, "global_step": 169841, "epoch": 4043} {"train_loss": -7.07954216003418, "global_step": 169842, "epoch": 4043} {"train_loss": -7.045161247253418, "global_step": 169843, "epoch": 4043} {"train_loss": -7.09816312789917, "global_step": 169844, "epoch": 4043} {"train_loss": -7.151330947875977, "global_step": 169845, "epoch": 4043} {"train_loss": -7.084877014160156, "global_step": 169846, "epoch": 4043} {"train_loss": -7.050843522662208, "global_step": 169847, "epoch": 4043, "val_loss": 79738.484375} {"train_loss": -7.136691093444824, "global_step": 169848, "epoch": 4044} {"train_loss": -6.988837242126465, "global_step": 169849, "epoch": 4044} {"train_loss": -7.108783721923828, "global_step": 169850, "epoch": 4044} {"train_loss": -7.056266784667969, "global_step": 169851, "epoch": 4044} {"train_loss": -6.96519660949707, "global_step": 169852, "epoch": 4044} {"train_loss": -7.133029937744141, "global_step": 169853, "epoch": 4044} {"train_loss": -7.132926940917969, "global_step": 169854, "epoch": 4044} {"train_loss": -7.149873733520508, "global_step": 169855, "epoch": 4044} {"train_loss": -6.991031646728516, "global_step": 169856, "epoch": 4044} {"train_loss": -7.114016532897949, "global_step": 169857, "epoch": 4044} {"train_loss": -7.122533798217773, "global_step": 169858, "epoch": 4044} {"train_loss": -7.119210243225098, "global_step": 169859, "epoch": 4044} {"train_loss": -7.097707748413086, "global_step": 169860, "epoch": 4044} {"train_loss": -7.085422515869141, "global_step": 169861, "epoch": 4044} {"train_loss": -7.148230075836182, "global_step": 169862, "epoch": 4044} {"train_loss": -7.034543514251709, "global_step": 169863, "epoch": 4044} {"train_loss": -7.120587348937988, "global_step": 169864, "epoch": 4044} {"train_loss": -7.127574920654297, "global_step": 169865, "epoch": 4044} {"train_loss": -7.126025199890137, "global_step": 169866, "epoch": 4044} {"train_loss": -7.13119649887085, "global_step": 169867, "epoch": 4044} {"train_loss": -7.089948654174805, "global_step": 169868, "epoch": 4044} {"train_loss": -7.110613822937012, "global_step": 169869, "epoch": 4044} {"train_loss": -7.021699905395508, "global_step": 169870, "epoch": 4044} {"train_loss": -6.969589710235596, "global_step": 169871, "epoch": 4044} {"train_loss": -7.043176651000977, "global_step": 169872, "epoch": 4044} {"train_loss": -7.021411895751953, "global_step": 169873, "epoch": 4044} {"train_loss": -6.844295978546143, "global_step": 169874, "epoch": 4044} {"train_loss": -6.986111164093018, "global_step": 169875, "epoch": 4044} {"train_loss": -7.065154075622559, "global_step": 169876, "epoch": 4044} {"train_loss": -6.763265132904053, "global_step": 169877, "epoch": 4044} {"train_loss": -6.921438694000244, "global_step": 169878, "epoch": 4044} {"train_loss": -7.0415496826171875, "global_step": 169879, "epoch": 4044} {"train_loss": -6.912877559661865, "global_step": 169880, "epoch": 4044} {"train_loss": -7.091301441192627, "global_step": 169881, "epoch": 4044} {"train_loss": -7.059025287628174, "global_step": 169882, "epoch": 4044} {"train_loss": -7.090323448181152, "global_step": 169883, "epoch": 4044} {"train_loss": -6.9039812088012695, "global_step": 169884, "epoch": 4044} {"train_loss": -7.075737476348877, "global_step": 169885, "epoch": 4044} {"train_loss": -6.9361491203308105, "global_step": 169886, "epoch": 4044} {"train_loss": -6.975511074066162, "global_step": 169887, "epoch": 4044} {"train_loss": -6.946934700012207, "global_step": 169888, "epoch": 4044} {"train_loss": -7.040150313150315, "global_step": 169889, "epoch": 4044, "val_loss": 79908.7421875} {"train_loss": -7.058387279510498, "global_step": 169890, "epoch": 4045} {"train_loss": -6.916973114013672, "global_step": 169891, "epoch": 4045} {"train_loss": -7.095192909240723, "global_step": 169892, "epoch": 4045} {"train_loss": -6.736610412597656, "global_step": 169893, "epoch": 4045} {"train_loss": -6.8576884269714355, "global_step": 169894, "epoch": 4045} {"train_loss": -6.936220169067383, "global_step": 169895, "epoch": 4045} {"train_loss": -6.870347499847412, "global_step": 169896, "epoch": 4045} {"train_loss": -7.038204669952393, "global_step": 169897, "epoch": 4045} {"train_loss": -6.915299415588379, "global_step": 169898, "epoch": 4045} {"train_loss": -6.964664459228516, "global_step": 169899, "epoch": 4045} {"train_loss": -6.892269134521484, "global_step": 169900, "epoch": 4045} {"train_loss": -6.9200639724731445, "global_step": 169901, "epoch": 4045} {"train_loss": -6.946256637573242, "global_step": 169902, "epoch": 4045} {"train_loss": -6.983855724334717, "global_step": 169903, "epoch": 4045} {"train_loss": -6.927539825439453, "global_step": 169904, "epoch": 4045} {"train_loss": -7.035704612731934, "global_step": 169905, "epoch": 4045} {"train_loss": -6.992642402648926, "global_step": 169906, "epoch": 4045} {"train_loss": -7.056707859039307, "global_step": 169907, "epoch": 4045} {"train_loss": -6.949959754943848, "global_step": 169908, "epoch": 4045} {"train_loss": -7.008542537689209, "global_step": 169909, "epoch": 4045} {"train_loss": -7.036467552185059, "global_step": 169910, "epoch": 4045} {"train_loss": -6.965821266174316, "global_step": 169911, "epoch": 4045} {"train_loss": -6.968441963195801, "global_step": 169912, "epoch": 4045} {"train_loss": -7.040138244628906, "global_step": 169913, "epoch": 4045} {"train_loss": -6.793888092041016, "global_step": 169914, "epoch": 4045} {"train_loss": -6.950779914855957, "global_step": 169915, "epoch": 4045} {"train_loss": -6.840691566467285, "global_step": 169916, "epoch": 4045} {"train_loss": -6.825314521789551, "global_step": 169917, "epoch": 4045} {"train_loss": -7.063448905944824, "global_step": 169918, "epoch": 4045} {"train_loss": -6.829388618469238, "global_step": 169919, "epoch": 4045} {"train_loss": -6.907929420471191, "global_step": 169920, "epoch": 4045} {"train_loss": -6.92034912109375, "global_step": 169921, "epoch": 4045} {"train_loss": -6.882360935211182, "global_step": 169922, "epoch": 4045} {"train_loss": -6.977591514587402, "global_step": 169923, "epoch": 4045} {"train_loss": -6.975946426391602, "global_step": 169924, "epoch": 4045} {"train_loss": -6.963683128356934, "global_step": 169925, "epoch": 4045} {"train_loss": -6.9296183586120605, "global_step": 169926, "epoch": 4045} {"train_loss": -7.075741767883301, "global_step": 169927, "epoch": 4045} {"train_loss": -6.930702209472656, "global_step": 169928, "epoch": 4045} {"train_loss": -6.956270217895508, "global_step": 169929, "epoch": 4045} {"train_loss": -7.037342548370361, "global_step": 169930, "epoch": 4045} {"train_loss": -6.953443493161883, "global_step": 169931, "epoch": 4045, "val_loss": 79936.8515625} {"train_loss": -6.952241897583008, "global_step": 169932, "epoch": 4046} {"train_loss": -6.980000972747803, "global_step": 169933, "epoch": 4046} {"train_loss": -7.088042259216309, "global_step": 169934, "epoch": 4046} {"train_loss": -7.106795310974121, "global_step": 169935, "epoch": 4046} {"train_loss": -7.034038543701172, "global_step": 169936, "epoch": 4046} {"train_loss": -7.069416046142578, "global_step": 169937, "epoch": 4046} {"train_loss": -7.017793655395508, "global_step": 169938, "epoch": 4046} {"train_loss": -7.058932304382324, "global_step": 169939, "epoch": 4046} {"train_loss": -7.056753158569336, "global_step": 169940, "epoch": 4046} {"train_loss": -7.180089473724365, "global_step": 169941, "epoch": 4046} {"train_loss": -6.964776992797852, "global_step": 169942, "epoch": 4046} {"train_loss": -7.0863237380981445, "global_step": 169943, "epoch": 4046} {"train_loss": -6.914055824279785, "global_step": 169944, "epoch": 4046} {"train_loss": -6.91596794128418, "global_step": 169945, "epoch": 4046} {"train_loss": -7.069946765899658, "global_step": 169946, "epoch": 4046} {"train_loss": -6.93570613861084, "global_step": 169947, "epoch": 4046} {"train_loss": -6.906874179840088, "global_step": 169948, "epoch": 4046} {"train_loss": -7.144138336181641, "global_step": 169949, "epoch": 4046} {"train_loss": -7.104503631591797, "global_step": 169950, "epoch": 4046} {"train_loss": -7.038322448730469, "global_step": 169951, "epoch": 4046} {"train_loss": -7.132277011871338, "global_step": 169952, "epoch": 4046} {"train_loss": -7.293809413909912, "global_step": 169953, "epoch": 4046} {"train_loss": -6.987462997436523, "global_step": 169954, "epoch": 4046} {"train_loss": -7.057806491851807, "global_step": 169955, "epoch": 4046} {"train_loss": -6.948999404907227, "global_step": 169956, "epoch": 4046} {"train_loss": -7.061473846435547, "global_step": 169957, "epoch": 4046} {"train_loss": -7.103752136230469, "global_step": 169958, "epoch": 4046} {"train_loss": -6.887750625610352, "global_step": 169959, "epoch": 4046} {"train_loss": -7.115267276763916, "global_step": 169960, "epoch": 4046} {"train_loss": -6.901597023010254, "global_step": 169961, "epoch": 4046} {"train_loss": -6.793727874755859, "global_step": 169962, "epoch": 4046} {"train_loss": -6.9463372230529785, "global_step": 169963, "epoch": 4046} {"train_loss": -6.942845344543457, "global_step": 169964, "epoch": 4046} {"train_loss": -6.892303466796875, "global_step": 169965, "epoch": 4046} {"train_loss": -6.92350435256958, "global_step": 169966, "epoch": 4046} {"train_loss": -7.028444766998291, "global_step": 169967, "epoch": 4046} {"train_loss": -6.931710243225098, "global_step": 169968, "epoch": 4046} {"train_loss": -7.085855484008789, "global_step": 169969, "epoch": 4046} {"train_loss": -6.937140464782715, "global_step": 169970, "epoch": 4046} {"train_loss": -6.936261177062988, "global_step": 169971, "epoch": 4046} {"train_loss": -7.024658203125, "global_step": 169972, "epoch": 4046} {"train_loss": -7.011409146445138, "global_step": 169973, "epoch": 4046, "val_loss": 79750.7578125} {"train_loss": -7.100307464599609, "global_step": 169974, "epoch": 4047} {"train_loss": -6.998588562011719, "global_step": 169975, "epoch": 4047} {"train_loss": -7.022672653198242, "global_step": 169976, "epoch": 4047} {"train_loss": -7.089679718017578, "global_step": 169977, "epoch": 4047} {"train_loss": -7.0647783279418945, "global_step": 169978, "epoch": 4047} {"train_loss": -7.055415630340576, "global_step": 169979, "epoch": 4047} {"train_loss": -7.099053382873535, "global_step": 169980, "epoch": 4047} {"train_loss": -7.060907363891602, "global_step": 169981, "epoch": 4047} {"train_loss": -7.062915325164795, "global_step": 169982, "epoch": 4047} {"train_loss": -7.046759605407715, "global_step": 169983, "epoch": 4047} {"train_loss": -6.981348514556885, "global_step": 169984, "epoch": 4047} {"train_loss": -7.087488174438477, "global_step": 169985, "epoch": 4047} {"train_loss": -6.935688018798828, "global_step": 169986, "epoch": 4047} {"train_loss": -7.097949981689453, "global_step": 169987, "epoch": 4047} {"train_loss": -7.176305770874023, "global_step": 169988, "epoch": 4047} {"train_loss": -6.998870849609375, "global_step": 169989, "epoch": 4047} {"train_loss": -7.083178520202637, "global_step": 169990, "epoch": 4047} {"train_loss": -7.092148303985596, "global_step": 169991, "epoch": 4047} {"train_loss": -7.057960510253906, "global_step": 169992, "epoch": 4047} {"train_loss": -7.127262115478516, "global_step": 169993, "epoch": 4047} {"train_loss": -7.067440032958984, "global_step": 169994, "epoch": 4047} {"train_loss": -7.036435127258301, "global_step": 169995, "epoch": 4047} {"train_loss": -7.007206439971924, "global_step": 169996, "epoch": 4047} {"train_loss": -7.016363143920898, "global_step": 169997, "epoch": 4047} {"train_loss": -6.9791388511657715, "global_step": 169998, "epoch": 4047} {"train_loss": -6.979432106018066, "global_step": 169999, "epoch": 4047} {"train_loss": -7.064970016479492, "global_step": 170000, "epoch": 4047} {"train_loss": -6.906203269958496, "global_step": 170001, "epoch": 4047} {"train_loss": -7.063830852508545, "global_step": 170002, "epoch": 4047} {"train_loss": -6.962623596191406, "global_step": 170003, "epoch": 4047} {"train_loss": -7.067605972290039, "global_step": 170004, "epoch": 4047} {"train_loss": -7.058438301086426, "global_step": 170005, "epoch": 4047} {"train_loss": -6.928106307983398, "global_step": 170006, "epoch": 4047} {"train_loss": -7.017412185668945, "global_step": 170007, "epoch": 4047} {"train_loss": -7.063030242919922, "global_step": 170008, "epoch": 4047} {"train_loss": -7.157473087310791, "global_step": 170009, "epoch": 4047} {"train_loss": -7.076169013977051, "global_step": 170010, "epoch": 4047} {"train_loss": -7.188959121704102, "global_step": 170011, "epoch": 4047} {"train_loss": -6.990824222564697, "global_step": 170012, "epoch": 4047} {"train_loss": -6.977060794830322, "global_step": 170013, "epoch": 4047} {"train_loss": -7.061537742614746, "global_step": 170014, "epoch": 4047} {"train_loss": -7.047753765469506, "global_step": 170015, "epoch": 4047, "val_loss": 79900.1875} {"train_loss": -7.018900394439697, "global_step": 170016, "epoch": 4048} {"train_loss": -7.076359272003174, "global_step": 170017, "epoch": 4048} {"train_loss": -7.091715335845947, "global_step": 170018, "epoch": 4048} {"train_loss": -6.999587059020996, "global_step": 170019, "epoch": 4048} {"train_loss": -7.015792369842529, "global_step": 170020, "epoch": 4048} {"train_loss": -6.9417314529418945, "global_step": 170021, "epoch": 4048} {"train_loss": -7.0969953536987305, "global_step": 170022, "epoch": 4048} {"train_loss": -6.956076622009277, "global_step": 170023, "epoch": 4048} {"train_loss": -7.043676376342773, "global_step": 170024, "epoch": 4048} {"train_loss": -7.061903476715088, "global_step": 170025, "epoch": 4048} {"train_loss": -6.967036724090576, "global_step": 170026, "epoch": 4048} {"train_loss": -7.043371677398682, "global_step": 170027, "epoch": 4048} {"train_loss": -6.957685947418213, "global_step": 170028, "epoch": 4048} {"train_loss": -7.0471296310424805, "global_step": 170029, "epoch": 4048} {"train_loss": -6.9615864753723145, "global_step": 170030, "epoch": 4048} {"train_loss": -6.960604190826416, "global_step": 170031, "epoch": 4048} {"train_loss": -6.915613174438477, "global_step": 170032, "epoch": 4048} {"train_loss": -6.862232685089111, "global_step": 170033, "epoch": 4048} {"train_loss": -7.072505950927734, "global_step": 170034, "epoch": 4048} {"train_loss": -7.014013290405273, "global_step": 170035, "epoch": 4048} {"train_loss": -7.115426540374756, "global_step": 170036, "epoch": 4048} {"train_loss": -7.045903205871582, "global_step": 170037, "epoch": 4048} {"train_loss": -7.017547130584717, "global_step": 170038, "epoch": 4048} {"train_loss": -6.973855018615723, "global_step": 170039, "epoch": 4048} {"train_loss": -7.057172775268555, "global_step": 170040, "epoch": 4048} {"train_loss": -7.149631977081299, "global_step": 170041, "epoch": 4048} {"train_loss": -7.056155204772949, "global_step": 170042, "epoch": 4048} {"train_loss": -7.101958274841309, "global_step": 170043, "epoch": 4048} {"train_loss": -7.099120140075684, "global_step": 170044, "epoch": 4048} {"train_loss": -7.045727252960205, "global_step": 170045, "epoch": 4048} {"train_loss": -6.988953113555908, "global_step": 170046, "epoch": 4048} {"train_loss": -7.041757583618164, "global_step": 170047, "epoch": 4048} {"train_loss": -7.094535827636719, "global_step": 170048, "epoch": 4048} {"train_loss": -6.978821277618408, "global_step": 170049, "epoch": 4048} {"train_loss": -7.036406517028809, "global_step": 170050, "epoch": 4048} {"train_loss": -7.122511863708496, "global_step": 170051, "epoch": 4048} {"train_loss": -7.052298545837402, "global_step": 170052, "epoch": 4048} {"train_loss": -6.934250831604004, "global_step": 170053, "epoch": 4048} {"train_loss": -6.845115661621094, "global_step": 170054, "epoch": 4048} {"train_loss": -7.046926021575928, "global_step": 170055, "epoch": 4048} {"train_loss": -7.028763771057129, "global_step": 170056, "epoch": 4048} {"train_loss": -7.019377867380778, "global_step": 170057, "epoch": 4048, "val_loss": 79798.6015625} {"train_loss": -7.007036209106445, "global_step": 170058, "epoch": 4049} {"train_loss": -6.974631309509277, "global_step": 170059, "epoch": 4049} {"train_loss": -7.065306663513184, "global_step": 170060, "epoch": 4049} {"train_loss": -6.961372375488281, "global_step": 170061, "epoch": 4049} {"train_loss": -6.865509986877441, "global_step": 170062, "epoch": 4049} {"train_loss": -6.919905662536621, "global_step": 170063, "epoch": 4049} {"train_loss": -6.742010116577148, "global_step": 170064, "epoch": 4049} {"train_loss": -6.91227912902832, "global_step": 170065, "epoch": 4049} {"train_loss": -6.841937065124512, "global_step": 170066, "epoch": 4049} {"train_loss": -6.862966537475586, "global_step": 170067, "epoch": 4049} {"train_loss": -6.876733303070068, "global_step": 170068, "epoch": 4049} {"train_loss": -6.95695686340332, "global_step": 170069, "epoch": 4049} {"train_loss": -7.042385578155518, "global_step": 170070, "epoch": 4049} {"train_loss": -6.921274185180664, "global_step": 170071, "epoch": 4049} {"train_loss": -6.829707145690918, "global_step": 170072, "epoch": 4049} {"train_loss": -6.912153244018555, "global_step": 170073, "epoch": 4049} {"train_loss": -6.9722747802734375, "global_step": 170074, "epoch": 4049} {"train_loss": -6.817385196685791, "global_step": 170075, "epoch": 4049} {"train_loss": -7.001160621643066, "global_step": 170076, "epoch": 4049} {"train_loss": -6.975538730621338, "global_step": 170077, "epoch": 4049} {"train_loss": -7.086551189422607, "global_step": 170078, "epoch": 4049} {"train_loss": -6.921730995178223, "global_step": 170079, "epoch": 4049} {"train_loss": -7.119235992431641, "global_step": 170080, "epoch": 4049} {"train_loss": -7.101525783538818, "global_step": 170081, "epoch": 4049} {"train_loss": -7.067839622497559, "global_step": 170082, "epoch": 4049} {"train_loss": -6.941934108734131, "global_step": 170083, "epoch": 4049} {"train_loss": -7.043317794799805, "global_step": 170084, "epoch": 4049} {"train_loss": -7.1453094482421875, "global_step": 170085, "epoch": 4049} {"train_loss": -6.945841312408447, "global_step": 170086, "epoch": 4049} {"train_loss": -7.06984806060791, "global_step": 170087, "epoch": 4049} {"train_loss": -6.98063850402832, "global_step": 170088, "epoch": 4049} {"train_loss": -7.087539196014404, "global_step": 170089, "epoch": 4049} {"train_loss": -7.0873260498046875, "global_step": 170090, "epoch": 4049} {"train_loss": -6.784660339355469, "global_step": 170091, "epoch": 4049} {"train_loss": -7.083837509155273, "global_step": 170092, "epoch": 4049} {"train_loss": -6.988941192626953, "global_step": 170093, "epoch": 4049} {"train_loss": -7.015031814575195, "global_step": 170094, "epoch": 4049} {"train_loss": -7.038930416107178, "global_step": 170095, "epoch": 4049} {"train_loss": -6.906822204589844, "global_step": 170096, "epoch": 4049} {"train_loss": -7.053957939147949, "global_step": 170097, "epoch": 4049} {"train_loss": -6.948243618011475, "global_step": 170098, "epoch": 4049} {"train_loss": -6.9756339845203215, "global_step": 170099, "epoch": 4049, "val_loss": 79842.734375} {"train_loss": -7.017322540283203, "global_step": 170100, "epoch": 4050} {"train_loss": -7.0248003005981445, "global_step": 170101, "epoch": 4050} {"train_loss": -7.04094934463501, "global_step": 170102, "epoch": 4050} {"train_loss": -6.96665620803833, "global_step": 170103, "epoch": 4050} {"train_loss": -7.013120174407959, "global_step": 170104, "epoch": 4050} {"train_loss": -6.966946601867676, "global_step": 170105, "epoch": 4050} {"train_loss": -6.960033416748047, "global_step": 170106, "epoch": 4050} {"train_loss": -6.9998979568481445, "global_step": 170107, "epoch": 4050} {"train_loss": -7.03101921081543, "global_step": 170108, "epoch": 4050} {"train_loss": -6.908520698547363, "global_step": 170109, "epoch": 4050} {"train_loss": -6.7833051681518555, "global_step": 170110, "epoch": 4050} {"train_loss": -7.146608829498291, "global_step": 170111, "epoch": 4050} {"train_loss": -7.060650825500488, "global_step": 170112, "epoch": 4050} {"train_loss": -6.9137678146362305, "global_step": 170113, "epoch": 4050} {"train_loss": -6.98223876953125, "global_step": 170114, "epoch": 4050} {"train_loss": -6.993851661682129, "global_step": 170115, "epoch": 4050} {"train_loss": -7.002260208129883, "global_step": 170116, "epoch": 4050} {"train_loss": -7.026468276977539, "global_step": 170117, "epoch": 4050} {"train_loss": -6.9738006591796875, "global_step": 170118, "epoch": 4050} {"train_loss": -7.130531311035156, "global_step": 170119, "epoch": 4050} {"train_loss": -6.960737228393555, "global_step": 170120, "epoch": 4050} {"train_loss": -7.079860687255859, "global_step": 170121, "epoch": 4050} {"train_loss": -6.9929962158203125, "global_step": 170122, "epoch": 4050} {"train_loss": -7.139989852905273, "global_step": 170123, "epoch": 4050} {"train_loss": -7.027405738830566, "global_step": 170124, "epoch": 4050} {"train_loss": -7.087995529174805, "global_step": 170125, "epoch": 4050} {"train_loss": -7.007610321044922, "global_step": 170126, "epoch": 4050} {"train_loss": -7.03814697265625, "global_step": 170127, "epoch": 4050} {"train_loss": -7.099084854125977, "global_step": 170128, "epoch": 4050} {"train_loss": -7.053503036499023, "global_step": 170129, "epoch": 4050} {"train_loss": -7.118427276611328, "global_step": 170130, "epoch": 4050} {"train_loss": -7.133941173553467, "global_step": 170131, "epoch": 4050} {"train_loss": -6.995967864990234, "global_step": 170132, "epoch": 4050} {"train_loss": -7.103575706481934, "global_step": 170133, "epoch": 4050} {"train_loss": -7.037930011749268, "global_step": 170134, "epoch": 4050} {"train_loss": -7.053600311279297, "global_step": 170135, "epoch": 4050} {"train_loss": -7.126823425292969, "global_step": 170136, "epoch": 4050} {"train_loss": -7.151950836181641, "global_step": 170137, "epoch": 4050} {"train_loss": -7.092860221862793, "global_step": 170138, "epoch": 4050} {"train_loss": -6.994773864746094, "global_step": 170139, "epoch": 4050} {"train_loss": -7.1176042556762695, "global_step": 170140, "epoch": 4050} {"train_loss": -7.03662017413548, "global_step": 170141, "epoch": 4050, "train/sim_max_reward_0": 0.4623619524723968, "train/sim_max_reward_1": 0.7972755485046662, "train/sim_max_reward_2": 0.5501389742061065, "train/sim_max_reward_3": 0.143569494867885, "train/sim_max_reward_4": 0.9093605023354475, "train/sim_max_reward_5": 0.7279259844356408, "test/sim_max_reward_4500000": 1.0, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9811966942185933, "test/sim_max_reward_4500003": 0.9561148443254961, "test/sim_max_reward_4500004": 0.8552987551004411, "test/sim_max_reward_4500005": 0.5180007613494468, "test/sim_max_reward_4500006": 0.8978017799922018, "test/sim_max_reward_4500007": 0.9876800825940762, "test/sim_max_reward_4500008": 0.9203550996623997, "test/sim_max_reward_4500009": 0.05318499480768012, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.916353061135083, "test/sim_max_reward_4500012": 0.9508824333173488, "test/sim_max_reward_4500013": 0.0035315080165541236, "test/sim_max_reward_4500014": 0.9575999158572746, "test/sim_max_reward_4500015": 0.9938510508845618, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0484064109931706, "test/sim_max_reward_4500018": 0.9850149424851558, "test/sim_max_reward_4500019": 0.9856467841179923, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9673451079021101, "test/sim_max_reward_4500022": 0.9776584550186102, "test/sim_max_reward_4500023": 0.9418035976960838, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9175506878861278, "test/sim_max_reward_4500026": 0.0, "test/sim_max_reward_4500027": 0.982855014483285, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.11154608551477876, "test/sim_max_reward_4500030": 0.9791121977724215, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9242968351030713, "test/sim_max_reward_4500034": 0.8865339877101294, "test/sim_max_reward_4500035": 0.996248155015528, "test/sim_max_reward_4500036": 0.934266323107952, "test/sim_max_reward_4500037": 0.8249100421392537, "test/sim_max_reward_4500038": 0.34959685725220424, "test/sim_max_reward_4500039": 0.9852120103587517, "test/sim_max_reward_4500040": 0.9821395756244252, "test/sim_max_reward_4500041": 0.964055205776908, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.9078737486248782, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.5813282493547125, "test/sim_max_reward_4500046": 0.9587314010291766, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.5984387428036905, "test/mean_score": 0.5891730682665478, "val_loss": 79639.109375} {"train_loss": -7.085296154022217, "global_step": 170142, "epoch": 4051} {"train_loss": -7.128356456756592, "global_step": 170143, "epoch": 4051} {"train_loss": -6.909951210021973, "global_step": 170144, "epoch": 4051} {"train_loss": -7.036557197570801, "global_step": 170145, "epoch": 4051} {"train_loss": -6.955455303192139, "global_step": 170146, "epoch": 4051} {"train_loss": -6.921162128448486, "global_step": 170147, "epoch": 4051} {"train_loss": -6.912784576416016, "global_step": 170148, "epoch": 4051} {"train_loss": -7.0849385261535645, "global_step": 170149, "epoch": 4051} {"train_loss": -6.8974432945251465, "global_step": 170150, "epoch": 4051} {"train_loss": -7.083323955535889, "global_step": 170151, "epoch": 4051} {"train_loss": -7.0962371826171875, "global_step": 170152, "epoch": 4051} {"train_loss": -7.126044750213623, "global_step": 170153, "epoch": 4051} {"train_loss": -7.001593589782715, "global_step": 170154, "epoch": 4051} {"train_loss": -7.0874223709106445, "global_step": 170155, "epoch": 4051} {"train_loss": -7.111536026000977, "global_step": 170156, "epoch": 4051} {"train_loss": -7.078719139099121, "global_step": 170157, "epoch": 4051} {"train_loss": -7.114178657531738, "global_step": 170158, "epoch": 4051} {"train_loss": -7.159407138824463, "global_step": 170159, "epoch": 4051} {"train_loss": -7.029701232910156, "global_step": 170160, "epoch": 4051} {"train_loss": -7.132213592529297, "global_step": 170161, "epoch": 4051} {"train_loss": -7.010863304138184, "global_step": 170162, "epoch": 4051} {"train_loss": -7.136961936950684, "global_step": 170163, "epoch": 4051} {"train_loss": -7.055070877075195, "global_step": 170164, "epoch": 4051} {"train_loss": -6.96844482421875, "global_step": 170165, "epoch": 4051} {"train_loss": -7.1658172607421875, "global_step": 170166, "epoch": 4051} {"train_loss": -7.164766311645508, "global_step": 170167, "epoch": 4051} {"train_loss": -7.165760040283203, "global_step": 170168, "epoch": 4051} {"train_loss": -7.006357192993164, "global_step": 170169, "epoch": 4051} {"train_loss": -7.084227085113525, "global_step": 170170, "epoch": 4051} {"train_loss": -7.0880022048950195, "global_step": 170171, "epoch": 4051} {"train_loss": -6.898757457733154, "global_step": 170172, "epoch": 4051} {"train_loss": -7.096261024475098, "global_step": 170173, "epoch": 4051} {"train_loss": -7.098871231079102, "global_step": 170174, "epoch": 4051} {"train_loss": -7.119243621826172, "global_step": 170175, "epoch": 4051} {"train_loss": -7.108360290527344, "global_step": 170176, "epoch": 4051} {"train_loss": -7.1431403160095215, "global_step": 170177, "epoch": 4051} {"train_loss": -7.082991123199463, "global_step": 170178, "epoch": 4051} {"train_loss": -7.065738677978516, "global_step": 170179, "epoch": 4051} {"train_loss": -6.929012775421143, "global_step": 170180, "epoch": 4051} {"train_loss": -7.083011150360107, "global_step": 170181, "epoch": 4051} {"train_loss": -7.228439807891846, "global_step": 170182, "epoch": 4051} {"train_loss": -7.066657327470326, "global_step": 170183, "epoch": 4051, "val_loss": 79798.125} {"train_loss": -7.178328037261963, "global_step": 170184, "epoch": 4052} {"train_loss": -7.20270299911499, "global_step": 170185, "epoch": 4052} {"train_loss": -7.087601184844971, "global_step": 170186, "epoch": 4052} {"train_loss": -7.185295104980469, "global_step": 170187, "epoch": 4052} {"train_loss": -7.001993656158447, "global_step": 170188, "epoch": 4052} {"train_loss": -7.033429145812988, "global_step": 170189, "epoch": 4052} {"train_loss": -7.135108947753906, "global_step": 170190, "epoch": 4052} {"train_loss": -7.060622692108154, "global_step": 170191, "epoch": 4052} {"train_loss": -7.024135589599609, "global_step": 170192, "epoch": 4052} {"train_loss": -7.022645473480225, "global_step": 170193, "epoch": 4052} {"train_loss": -7.126448631286621, "global_step": 170194, "epoch": 4052} {"train_loss": -7.122864723205566, "global_step": 170195, "epoch": 4052} {"train_loss": -6.987157344818115, "global_step": 170196, "epoch": 4052} {"train_loss": -7.148979663848877, "global_step": 170197, "epoch": 4052} {"train_loss": -7.101431369781494, "global_step": 170198, "epoch": 4052} {"train_loss": -7.191927909851074, "global_step": 170199, "epoch": 4052} {"train_loss": -7.090970993041992, "global_step": 170200, "epoch": 4052} {"train_loss": -7.192024230957031, "global_step": 170201, "epoch": 4052} {"train_loss": -7.130847454071045, "global_step": 170202, "epoch": 4052} {"train_loss": -7.1463212966918945, "global_step": 170203, "epoch": 4052} {"train_loss": -7.193900108337402, "global_step": 170204, "epoch": 4052} {"train_loss": -7.113558769226074, "global_step": 170205, "epoch": 4052} {"train_loss": -7.117144584655762, "global_step": 170206, "epoch": 4052} {"train_loss": -7.1885271072387695, "global_step": 170207, "epoch": 4052} {"train_loss": -7.183060646057129, "global_step": 170208, "epoch": 4052} {"train_loss": -7.147595405578613, "global_step": 170209, "epoch": 4052} {"train_loss": -7.208689212799072, "global_step": 170210, "epoch": 4052} {"train_loss": -7.074029922485352, "global_step": 170211, "epoch": 4052} {"train_loss": -7.235235691070557, "global_step": 170212, "epoch": 4052} {"train_loss": -7.057376861572266, "global_step": 170213, "epoch": 4052} {"train_loss": -7.072349548339844, "global_step": 170214, "epoch": 4052} {"train_loss": -7.090993881225586, "global_step": 170215, "epoch": 4052} {"train_loss": -7.180953025817871, "global_step": 170216, "epoch": 4052} {"train_loss": -7.169147491455078, "global_step": 170217, "epoch": 4052} {"train_loss": -7.073402404785156, "global_step": 170218, "epoch": 4052} {"train_loss": -7.034599304199219, "global_step": 170219, "epoch": 4052} {"train_loss": -7.093536376953125, "global_step": 170220, "epoch": 4052} {"train_loss": -7.090038299560547, "global_step": 170221, "epoch": 4052} {"train_loss": -7.082345008850098, "global_step": 170222, "epoch": 4052} {"train_loss": -7.052066802978516, "global_step": 170223, "epoch": 4052} {"train_loss": -6.9681267738342285, "global_step": 170224, "epoch": 4052} {"train_loss": -7.112138396217709, "global_step": 170225, "epoch": 4052, "val_loss": 79824.7421875} {"train_loss": -7.045104026794434, "global_step": 170226, "epoch": 4053} {"train_loss": -7.037548065185547, "global_step": 170227, "epoch": 4053} {"train_loss": -7.032537937164307, "global_step": 170228, "epoch": 4053} {"train_loss": -7.058412551879883, "global_step": 170229, "epoch": 4053} {"train_loss": -6.966554641723633, "global_step": 170230, "epoch": 4053} {"train_loss": -7.142716407775879, "global_step": 170231, "epoch": 4053} {"train_loss": -7.123777866363525, "global_step": 170232, "epoch": 4053} {"train_loss": -7.010640621185303, "global_step": 170233, "epoch": 4053} {"train_loss": -6.992101669311523, "global_step": 170234, "epoch": 4053} {"train_loss": -6.987612724304199, "global_step": 170235, "epoch": 4053} {"train_loss": -7.075033664703369, "global_step": 170236, "epoch": 4053} {"train_loss": -7.117588043212891, "global_step": 170237, "epoch": 4053} {"train_loss": -7.058811187744141, "global_step": 170238, "epoch": 4053} {"train_loss": -7.0663251876831055, "global_step": 170239, "epoch": 4053} {"train_loss": -7.10310173034668, "global_step": 170240, "epoch": 4053} {"train_loss": -7.060349941253662, "global_step": 170241, "epoch": 4053} {"train_loss": -6.879232406616211, "global_step": 170242, "epoch": 4053} {"train_loss": -6.84741735458374, "global_step": 170243, "epoch": 4053} {"train_loss": -7.107415676116943, "global_step": 170244, "epoch": 4053} {"train_loss": -6.710309028625488, "global_step": 170245, "epoch": 4053} {"train_loss": -6.89566707611084, "global_step": 170246, "epoch": 4053} {"train_loss": -6.973122596740723, "global_step": 170247, "epoch": 4053} {"train_loss": -6.78033447265625, "global_step": 170248, "epoch": 4053} {"train_loss": -6.974184989929199, "global_step": 170249, "epoch": 4053} {"train_loss": -6.879619598388672, "global_step": 170250, "epoch": 4053} {"train_loss": -6.868700981140137, "global_step": 170251, "epoch": 4053} {"train_loss": -6.87304162979126, "global_step": 170252, "epoch": 4053} {"train_loss": -6.992401123046875, "global_step": 170253, "epoch": 4053} {"train_loss": -6.967321395874023, "global_step": 170254, "epoch": 4053} {"train_loss": -6.915448188781738, "global_step": 170255, "epoch": 4053} {"train_loss": -6.814816474914551, "global_step": 170256, "epoch": 4053} {"train_loss": -6.901724338531494, "global_step": 170257, "epoch": 4053} {"train_loss": -6.917332649230957, "global_step": 170258, "epoch": 4053} {"train_loss": -6.941188335418701, "global_step": 170259, "epoch": 4053} {"train_loss": -6.931823253631592, "global_step": 170260, "epoch": 4053} {"train_loss": -6.8967084884643555, "global_step": 170261, "epoch": 4053} {"train_loss": -6.8653411865234375, "global_step": 170262, "epoch": 4053} {"train_loss": -6.982378005981445, "global_step": 170263, "epoch": 4053} {"train_loss": -6.949525356292725, "global_step": 170264, "epoch": 4053} {"train_loss": -7.011889457702637, "global_step": 170265, "epoch": 4053} {"train_loss": -6.798417568206787, "global_step": 170266, "epoch": 4053} {"train_loss": -6.966431515557425, "global_step": 170267, "epoch": 4053, "val_loss": 79921.2421875} {"train_loss": -7.038974285125732, "global_step": 170268, "epoch": 4054} {"train_loss": -6.961607456207275, "global_step": 170269, "epoch": 4054} {"train_loss": -6.984962463378906, "global_step": 170270, "epoch": 4054} {"train_loss": -7.04340124130249, "global_step": 170271, "epoch": 4054} {"train_loss": -6.945801734924316, "global_step": 170272, "epoch": 4054} {"train_loss": -6.968345642089844, "global_step": 170273, "epoch": 4054} {"train_loss": -6.940257549285889, "global_step": 170274, "epoch": 4054} {"train_loss": -6.956373691558838, "global_step": 170275, "epoch": 4054} {"train_loss": -7.0547685623168945, "global_step": 170276, "epoch": 4054} {"train_loss": -6.965827941894531, "global_step": 170277, "epoch": 4054} {"train_loss": -7.026644706726074, "global_step": 170278, "epoch": 4054} {"train_loss": -7.228647232055664, "global_step": 170279, "epoch": 4054} {"train_loss": -7.063703536987305, "global_step": 170280, "epoch": 4054} {"train_loss": -6.975874900817871, "global_step": 170281, "epoch": 4054} {"train_loss": -7.13327693939209, "global_step": 170282, "epoch": 4054} {"train_loss": -7.089781761169434, "global_step": 170283, "epoch": 4054} {"train_loss": -7.101106643676758, "global_step": 170284, "epoch": 4054} {"train_loss": -7.01992130279541, "global_step": 170285, "epoch": 4054} {"train_loss": -7.22412633895874, "global_step": 170286, "epoch": 4054} {"train_loss": -7.052733421325684, "global_step": 170287, "epoch": 4054} {"train_loss": -7.054259300231934, "global_step": 170288, "epoch": 4054} {"train_loss": -7.122651100158691, "global_step": 170289, "epoch": 4054} {"train_loss": -7.097736358642578, "global_step": 170290, "epoch": 4054} {"train_loss": -7.098952770233154, "global_step": 170291, "epoch": 4054} {"train_loss": -6.987415313720703, "global_step": 170292, "epoch": 4054} {"train_loss": -6.941383361816406, "global_step": 170293, "epoch": 4054} {"train_loss": -7.040653705596924, "global_step": 170294, "epoch": 4054} {"train_loss": -7.0789265632629395, "global_step": 170295, "epoch": 4054} {"train_loss": -7.166462421417236, "global_step": 170296, "epoch": 4054} {"train_loss": -7.080598831176758, "global_step": 170297, "epoch": 4054} {"train_loss": -7.000181198120117, "global_step": 170298, "epoch": 4054} {"train_loss": -6.972411632537842, "global_step": 170299, "epoch": 4054} {"train_loss": -7.143922328948975, "global_step": 170300, "epoch": 4054} {"train_loss": -7.069367408752441, "global_step": 170301, "epoch": 4054} {"train_loss": -7.0711259841918945, "global_step": 170302, "epoch": 4054} {"train_loss": -7.183109760284424, "global_step": 170303, "epoch": 4054} {"train_loss": -7.086790084838867, "global_step": 170304, "epoch": 4054} {"train_loss": -6.9846720695495605, "global_step": 170305, "epoch": 4054} {"train_loss": -7.057746887207031, "global_step": 170306, "epoch": 4054} {"train_loss": -7.132675647735596, "global_step": 170307, "epoch": 4054} {"train_loss": -6.980282306671143, "global_step": 170308, "epoch": 4054} {"train_loss": -7.050522895086379, "global_step": 170309, "epoch": 4054, "val_loss": 79757.6015625} {"train_loss": -7.14698600769043, "global_step": 170310, "epoch": 4055} {"train_loss": -7.1180267333984375, "global_step": 170311, "epoch": 4055} {"train_loss": -7.090542793273926, "global_step": 170312, "epoch": 4055} {"train_loss": -7.151851177215576, "global_step": 170313, "epoch": 4055} {"train_loss": -7.151361465454102, "global_step": 170314, "epoch": 4055} {"train_loss": -7.139362335205078, "global_step": 170315, "epoch": 4055} {"train_loss": -7.136968612670898, "global_step": 170316, "epoch": 4055} {"train_loss": -7.146640777587891, "global_step": 170317, "epoch": 4055} {"train_loss": -7.16295051574707, "global_step": 170318, "epoch": 4055} {"train_loss": -7.110805988311768, "global_step": 170319, "epoch": 4055} {"train_loss": -7.07826566696167, "global_step": 170320, "epoch": 4055} {"train_loss": -7.014155387878418, "global_step": 170321, "epoch": 4055} {"train_loss": -7.079168319702148, "global_step": 170322, "epoch": 4055} {"train_loss": -7.0744123458862305, "global_step": 170323, "epoch": 4055} {"train_loss": -7.027867317199707, "global_step": 170324, "epoch": 4055} {"train_loss": -7.057211875915527, "global_step": 170325, "epoch": 4055} {"train_loss": -6.998504161834717, "global_step": 170326, "epoch": 4055} {"train_loss": -6.869136810302734, "global_step": 170327, "epoch": 4055} {"train_loss": -6.968141555786133, "global_step": 170328, "epoch": 4055} {"train_loss": -7.152923107147217, "global_step": 170329, "epoch": 4055} {"train_loss": -6.928196907043457, "global_step": 170330, "epoch": 4055} {"train_loss": -7.021339416503906, "global_step": 170331, "epoch": 4055} {"train_loss": -6.971313953399658, "global_step": 170332, "epoch": 4055} {"train_loss": -6.996053695678711, "global_step": 170333, "epoch": 4055} {"train_loss": -7.076955795288086, "global_step": 170334, "epoch": 4055} {"train_loss": -6.843507766723633, "global_step": 170335, "epoch": 4055} {"train_loss": -7.027227878570557, "global_step": 170336, "epoch": 4055} {"train_loss": -7.013099193572998, "global_step": 170337, "epoch": 4055} {"train_loss": -6.92728328704834, "global_step": 170338, "epoch": 4055} {"train_loss": -6.919155120849609, "global_step": 170339, "epoch": 4055} {"train_loss": -6.913575172424316, "global_step": 170340, "epoch": 4055} {"train_loss": -7.0286736488342285, "global_step": 170341, "epoch": 4055} {"train_loss": -6.983766078948975, "global_step": 170342, "epoch": 4055} {"train_loss": -6.956384181976318, "global_step": 170343, "epoch": 4055} {"train_loss": -6.962007522583008, "global_step": 170344, "epoch": 4055} {"train_loss": -7.055646896362305, "global_step": 170345, "epoch": 4055} {"train_loss": -6.97817850112915, "global_step": 170346, "epoch": 4055} {"train_loss": -7.026982307434082, "global_step": 170347, "epoch": 4055} {"train_loss": -7.09761905670166, "global_step": 170348, "epoch": 4055} {"train_loss": -7.057724952697754, "global_step": 170349, "epoch": 4055} {"train_loss": -7.091156005859375, "global_step": 170350, "epoch": 4055} {"train_loss": -7.038100253968012, "global_step": 170351, "epoch": 4055, "val_loss": 79893.640625} {"train_loss": -7.061500549316406, "global_step": 170352, "epoch": 4056} {"train_loss": -7.0000762939453125, "global_step": 170353, "epoch": 4056} {"train_loss": -7.1013031005859375, "global_step": 170354, "epoch": 4056} {"train_loss": -7.104053974151611, "global_step": 170355, "epoch": 4056} {"train_loss": -6.997949600219727, "global_step": 170356, "epoch": 4056} {"train_loss": -6.944986343383789, "global_step": 170357, "epoch": 4056} {"train_loss": -6.989048957824707, "global_step": 170358, "epoch": 4056} {"train_loss": -7.070427417755127, "global_step": 170359, "epoch": 4056} {"train_loss": -7.023855209350586, "global_step": 170360, "epoch": 4056} {"train_loss": -7.058126449584961, "global_step": 170361, "epoch": 4056} {"train_loss": -7.11525821685791, "global_step": 170362, "epoch": 4056} {"train_loss": -7.1681108474731445, "global_step": 170363, "epoch": 4056} {"train_loss": -7.041179656982422, "global_step": 170364, "epoch": 4056} {"train_loss": -7.025681495666504, "global_step": 170365, "epoch": 4056} {"train_loss": -6.896290302276611, "global_step": 170366, "epoch": 4056} {"train_loss": -7.063164234161377, "global_step": 170367, "epoch": 4056} {"train_loss": -6.999699592590332, "global_step": 170368, "epoch": 4056} {"train_loss": -6.9330153465271, "global_step": 170369, "epoch": 4056} {"train_loss": -7.104530334472656, "global_step": 170370, "epoch": 4056} {"train_loss": -6.939464092254639, "global_step": 170371, "epoch": 4056} {"train_loss": -7.046570777893066, "global_step": 170372, "epoch": 4056} {"train_loss": -6.9826154708862305, "global_step": 170373, "epoch": 4056} {"train_loss": -7.015988826751709, "global_step": 170374, "epoch": 4056} {"train_loss": -7.033027648925781, "global_step": 170375, "epoch": 4056} {"train_loss": -7.14150333404541, "global_step": 170376, "epoch": 4056} {"train_loss": -6.9313225746154785, "global_step": 170377, "epoch": 4056} {"train_loss": -7.039554595947266, "global_step": 170378, "epoch": 4056} {"train_loss": -7.009801387786865, "global_step": 170379, "epoch": 4056} {"train_loss": -7.039564609527588, "global_step": 170380, "epoch": 4056} {"train_loss": -7.014150142669678, "global_step": 170381, "epoch": 4056} {"train_loss": -7.00079345703125, "global_step": 170382, "epoch": 4056} {"train_loss": -7.118587493896484, "global_step": 170383, "epoch": 4056} {"train_loss": -7.070856094360352, "global_step": 170384, "epoch": 4056} {"train_loss": -7.144456386566162, "global_step": 170385, "epoch": 4056} {"train_loss": -7.052177429199219, "global_step": 170386, "epoch": 4056} {"train_loss": -6.943231582641602, "global_step": 170387, "epoch": 4056} {"train_loss": -7.129280090332031, "global_step": 170388, "epoch": 4056} {"train_loss": -6.9681220054626465, "global_step": 170389, "epoch": 4056} {"train_loss": -7.133195877075195, "global_step": 170390, "epoch": 4056} {"train_loss": -7.05712890625, "global_step": 170391, "epoch": 4056} {"train_loss": -7.131658554077148, "global_step": 170392, "epoch": 4056} {"train_loss": -7.040427650724139, "global_step": 170393, "epoch": 4056, "val_loss": 79722.8359375} {"train_loss": -6.992593765258789, "global_step": 170394, "epoch": 4057} {"train_loss": -7.102477550506592, "global_step": 170395, "epoch": 4057} {"train_loss": -7.070396423339844, "global_step": 170396, "epoch": 4057} {"train_loss": -7.01302433013916, "global_step": 170397, "epoch": 4057} {"train_loss": -7.102982521057129, "global_step": 170398, "epoch": 4057} {"train_loss": -7.093684196472168, "global_step": 170399, "epoch": 4057} {"train_loss": -7.050349235534668, "global_step": 170400, "epoch": 4057} {"train_loss": -7.053471565246582, "global_step": 170401, "epoch": 4057} {"train_loss": -7.0429182052612305, "global_step": 170402, "epoch": 4057} {"train_loss": -7.012787818908691, "global_step": 170403, "epoch": 4057} {"train_loss": -7.04195499420166, "global_step": 170404, "epoch": 4057} {"train_loss": -7.074199676513672, "global_step": 170405, "epoch": 4057} {"train_loss": -7.05299186706543, "global_step": 170406, "epoch": 4057} {"train_loss": -7.072098731994629, "global_step": 170407, "epoch": 4057} {"train_loss": -7.13170051574707, "global_step": 170408, "epoch": 4057} {"train_loss": -7.053190231323242, "global_step": 170409, "epoch": 4057} {"train_loss": -6.987351417541504, "global_step": 170410, "epoch": 4057} {"train_loss": -7.115107536315918, "global_step": 170411, "epoch": 4057} {"train_loss": -7.012850284576416, "global_step": 170412, "epoch": 4057} {"train_loss": -7.044424057006836, "global_step": 170413, "epoch": 4057} {"train_loss": -7.073904037475586, "global_step": 170414, "epoch": 4057} {"train_loss": -6.9633588790893555, "global_step": 170415, "epoch": 4057} {"train_loss": -7.06124210357666, "global_step": 170416, "epoch": 4057} {"train_loss": -6.9274821281433105, "global_step": 170417, "epoch": 4057} {"train_loss": -7.044423580169678, "global_step": 170418, "epoch": 4057} {"train_loss": -6.881226539611816, "global_step": 170419, "epoch": 4057} {"train_loss": -6.861824989318848, "global_step": 170420, "epoch": 4057} {"train_loss": -7.0752272605896, "global_step": 170421, "epoch": 4057} {"train_loss": -6.943660736083984, "global_step": 170422, "epoch": 4057} {"train_loss": -7.141629219055176, "global_step": 170423, "epoch": 4057} {"train_loss": -6.99250602722168, "global_step": 170424, "epoch": 4057} {"train_loss": -6.956138610839844, "global_step": 170425, "epoch": 4057} {"train_loss": -6.988754749298096, "global_step": 170426, "epoch": 4057} {"train_loss": -6.966368675231934, "global_step": 170427, "epoch": 4057} {"train_loss": -6.996752738952637, "global_step": 170428, "epoch": 4057} {"train_loss": -6.902978420257568, "global_step": 170429, "epoch": 4057} {"train_loss": -6.9910454750061035, "global_step": 170430, "epoch": 4057} {"train_loss": -7.011053085327148, "global_step": 170431, "epoch": 4057} {"train_loss": -7.021185398101807, "global_step": 170432, "epoch": 4057} {"train_loss": -7.014400005340576, "global_step": 170433, "epoch": 4057} {"train_loss": -7.005902290344238, "global_step": 170434, "epoch": 4057} {"train_loss": -7.023202578226726, "global_step": 170435, "epoch": 4057, "val_loss": 79838.1875} {"train_loss": -7.155004024505615, "global_step": 170436, "epoch": 4058} {"train_loss": -7.04238224029541, "global_step": 170437, "epoch": 4058} {"train_loss": -6.999326229095459, "global_step": 170438, "epoch": 4058} {"train_loss": -7.012059688568115, "global_step": 170439, "epoch": 4058} {"train_loss": -7.073760986328125, "global_step": 170440, "epoch": 4058} {"train_loss": -7.042585372924805, "global_step": 170441, "epoch": 4058} {"train_loss": -7.10349178314209, "global_step": 170442, "epoch": 4058} {"train_loss": -7.003303050994873, "global_step": 170443, "epoch": 4058} {"train_loss": -7.151643753051758, "global_step": 170444, "epoch": 4058} {"train_loss": -7.097196102142334, "global_step": 170445, "epoch": 4058} {"train_loss": -7.117592811584473, "global_step": 170446, "epoch": 4058} {"train_loss": -7.048481464385986, "global_step": 170447, "epoch": 4058} {"train_loss": -7.048494815826416, "global_step": 170448, "epoch": 4058} {"train_loss": -7.07927942276001, "global_step": 170449, "epoch": 4058} {"train_loss": -7.007739067077637, "global_step": 170450, "epoch": 4058} {"train_loss": -7.065386772155762, "global_step": 170451, "epoch": 4058} {"train_loss": -6.9314165115356445, "global_step": 170452, "epoch": 4058} {"train_loss": -7.107665061950684, "global_step": 170453, "epoch": 4058} {"train_loss": -7.013730525970459, "global_step": 170454, "epoch": 4058} {"train_loss": -7.037372589111328, "global_step": 170455, "epoch": 4058} {"train_loss": -7.029193878173828, "global_step": 170456, "epoch": 4058} {"train_loss": -7.0564188957214355, "global_step": 170457, "epoch": 4058} {"train_loss": -7.106483459472656, "global_step": 170458, "epoch": 4058} {"train_loss": -7.006717205047607, "global_step": 170459, "epoch": 4058} {"train_loss": -6.92997407913208, "global_step": 170460, "epoch": 4058} {"train_loss": -7.051200866699219, "global_step": 170461, "epoch": 4058} {"train_loss": -6.933770656585693, "global_step": 170462, "epoch": 4058} {"train_loss": -7.036145210266113, "global_step": 170463, "epoch": 4058} {"train_loss": -7.05918025970459, "global_step": 170464, "epoch": 4058} {"train_loss": -7.032365798950195, "global_step": 170465, "epoch": 4058} {"train_loss": -6.984563827514648, "global_step": 170466, "epoch": 4058} {"train_loss": -7.049874305725098, "global_step": 170467, "epoch": 4058} {"train_loss": -7.062191009521484, "global_step": 170468, "epoch": 4058} {"train_loss": -6.9393415451049805, "global_step": 170469, "epoch": 4058} {"train_loss": -7.0550312995910645, "global_step": 170470, "epoch": 4058} {"train_loss": -6.958477020263672, "global_step": 170471, "epoch": 4058} {"train_loss": -6.9998979568481445, "global_step": 170472, "epoch": 4058} {"train_loss": -6.896035194396973, "global_step": 170473, "epoch": 4058} {"train_loss": -6.942567348480225, "global_step": 170474, "epoch": 4058} {"train_loss": -6.949763298034668, "global_step": 170475, "epoch": 4058} {"train_loss": -7.062342643737793, "global_step": 170476, "epoch": 4058} {"train_loss": -7.030621153967721, "global_step": 170477, "epoch": 4058, "val_loss": 79866.2421875} {"train_loss": -7.035273551940918, "global_step": 170478, "epoch": 4059} {"train_loss": -7.112137794494629, "global_step": 170479, "epoch": 4059} {"train_loss": -7.192493915557861, "global_step": 170480, "epoch": 4059} {"train_loss": -7.059508323669434, "global_step": 170481, "epoch": 4059} {"train_loss": -7.020280838012695, "global_step": 170482, "epoch": 4059} {"train_loss": -7.0758819580078125, "global_step": 170483, "epoch": 4059} {"train_loss": -7.130593299865723, "global_step": 170484, "epoch": 4059} {"train_loss": -7.043581485748291, "global_step": 170485, "epoch": 4059} {"train_loss": -7.05962610244751, "global_step": 170486, "epoch": 4059} {"train_loss": -7.009404182434082, "global_step": 170487, "epoch": 4059} {"train_loss": -7.066032886505127, "global_step": 170488, "epoch": 4059} {"train_loss": -6.983244895935059, "global_step": 170489, "epoch": 4059} {"train_loss": -7.009683609008789, "global_step": 170490, "epoch": 4059} {"train_loss": -7.030981063842773, "global_step": 170491, "epoch": 4059} {"train_loss": -6.997769355773926, "global_step": 170492, "epoch": 4059} {"train_loss": -7.000467300415039, "global_step": 170493, "epoch": 4059} {"train_loss": -7.111769676208496, "global_step": 170494, "epoch": 4059} {"train_loss": -6.998358726501465, "global_step": 170495, "epoch": 4059} {"train_loss": -7.098721981048584, "global_step": 170496, "epoch": 4059} {"train_loss": -7.169849395751953, "global_step": 170497, "epoch": 4059} {"train_loss": -7.023789405822754, "global_step": 170498, "epoch": 4059} {"train_loss": -7.098397254943848, "global_step": 170499, "epoch": 4059} {"train_loss": -7.050978660583496, "global_step": 170500, "epoch": 4059} {"train_loss": -7.090880393981934, "global_step": 170501, "epoch": 4059} {"train_loss": -7.117031097412109, "global_step": 170502, "epoch": 4059} {"train_loss": -6.897705078125, "global_step": 170503, "epoch": 4059} {"train_loss": -7.136290550231934, "global_step": 170504, "epoch": 4059} {"train_loss": -7.055082321166992, "global_step": 170505, "epoch": 4059} {"train_loss": -6.976742744445801, "global_step": 170506, "epoch": 4059} {"train_loss": -7.090878963470459, "global_step": 170507, "epoch": 4059} {"train_loss": -7.124897003173828, "global_step": 170508, "epoch": 4059} {"train_loss": -7.035508632659912, "global_step": 170509, "epoch": 4059} {"train_loss": -7.073139190673828, "global_step": 170510, "epoch": 4059} {"train_loss": -7.084535598754883, "global_step": 170511, "epoch": 4059} {"train_loss": -6.949667930603027, "global_step": 170512, "epoch": 4059} {"train_loss": -7.026375770568848, "global_step": 170513, "epoch": 4059} {"train_loss": -6.972487449645996, "global_step": 170514, "epoch": 4059} {"train_loss": -7.009180068969727, "global_step": 170515, "epoch": 4059} {"train_loss": -7.0621771812438965, "global_step": 170516, "epoch": 4059} {"train_loss": -6.9773969650268555, "global_step": 170517, "epoch": 4059} {"train_loss": -6.993264198303223, "global_step": 170518, "epoch": 4059} {"train_loss": -7.05249411719186, "global_step": 170519, "epoch": 4059, "val_loss": 80068.8515625} {"train_loss": -7.129538536071777, "global_step": 170520, "epoch": 4060} {"train_loss": -7.062985420227051, "global_step": 170521, "epoch": 4060} {"train_loss": -7.172301769256592, "global_step": 170522, "epoch": 4060} {"train_loss": -7.093504905700684, "global_step": 170523, "epoch": 4060} {"train_loss": -7.062833786010742, "global_step": 170524, "epoch": 4060} {"train_loss": -7.151954650878906, "global_step": 170525, "epoch": 4060} {"train_loss": -7.130247116088867, "global_step": 170526, "epoch": 4060} {"train_loss": -7.044846534729004, "global_step": 170527, "epoch": 4060} {"train_loss": -7.177179336547852, "global_step": 170528, "epoch": 4060} {"train_loss": -6.983436584472656, "global_step": 170529, "epoch": 4060} {"train_loss": -6.9703688621521, "global_step": 170530, "epoch": 4060} {"train_loss": -7.175638675689697, "global_step": 170531, "epoch": 4060} {"train_loss": -7.081418037414551, "global_step": 170532, "epoch": 4060} {"train_loss": -6.969851493835449, "global_step": 170533, "epoch": 4060} {"train_loss": -7.132943630218506, "global_step": 170534, "epoch": 4060} {"train_loss": -7.089644432067871, "global_step": 170535, "epoch": 4060} {"train_loss": -6.982516765594482, "global_step": 170536, "epoch": 4060} {"train_loss": -6.99497652053833, "global_step": 170537, "epoch": 4060} {"train_loss": -7.063638687133789, "global_step": 170538, "epoch": 4060} {"train_loss": -6.852419376373291, "global_step": 170539, "epoch": 4060} {"train_loss": -7.047357559204102, "global_step": 170540, "epoch": 4060} {"train_loss": -6.935376167297363, "global_step": 170541, "epoch": 4060} {"train_loss": -6.899267673492432, "global_step": 170542, "epoch": 4060} {"train_loss": -6.992197036743164, "global_step": 170543, "epoch": 4060} {"train_loss": -6.907365322113037, "global_step": 170544, "epoch": 4060} {"train_loss": -6.963420867919922, "global_step": 170545, "epoch": 4060} {"train_loss": -6.905203819274902, "global_step": 170546, "epoch": 4060} {"train_loss": -6.981278896331787, "global_step": 170547, "epoch": 4060} {"train_loss": -7.127127647399902, "global_step": 170548, "epoch": 4060} {"train_loss": -6.940960884094238, "global_step": 170549, "epoch": 4060} {"train_loss": -6.926579475402832, "global_step": 170550, "epoch": 4060} {"train_loss": -6.95142936706543, "global_step": 170551, "epoch": 4060} {"train_loss": -6.830569744110107, "global_step": 170552, "epoch": 4060} {"train_loss": -6.9960618019104, "global_step": 170553, "epoch": 4060} {"train_loss": -6.965323448181152, "global_step": 170554, "epoch": 4060} {"train_loss": -6.90806770324707, "global_step": 170555, "epoch": 4060} {"train_loss": -6.829931259155273, "global_step": 170556, "epoch": 4060} {"train_loss": -6.804584503173828, "global_step": 170557, "epoch": 4060} {"train_loss": -6.997395038604736, "global_step": 170558, "epoch": 4060} {"train_loss": -6.922854900360107, "global_step": 170559, "epoch": 4060} {"train_loss": -6.98588228225708, "global_step": 170560, "epoch": 4060} {"train_loss": -7.002846808660598, "global_step": 170561, "epoch": 4060, "val_loss": 79921.59375} {"train_loss": -6.992696762084961, "global_step": 170562, "epoch": 4061} {"train_loss": -7.00042200088501, "global_step": 170563, "epoch": 4061} {"train_loss": -6.861234664916992, "global_step": 170564, "epoch": 4061} {"train_loss": -6.992465972900391, "global_step": 170565, "epoch": 4061} {"train_loss": -6.953694820404053, "global_step": 170566, "epoch": 4061} {"train_loss": -6.99880313873291, "global_step": 170567, "epoch": 4061} {"train_loss": -6.974349021911621, "global_step": 170568, "epoch": 4061} {"train_loss": -6.9288010597229, "global_step": 170569, "epoch": 4061} {"train_loss": -6.920172691345215, "global_step": 170570, "epoch": 4061} {"train_loss": -6.99813175201416, "global_step": 170571, "epoch": 4061} {"train_loss": -6.9543657302856445, "global_step": 170572, "epoch": 4061} {"train_loss": -7.0279998779296875, "global_step": 170573, "epoch": 4061} {"train_loss": -7.038487911224365, "global_step": 170574, "epoch": 4061} {"train_loss": -7.074215888977051, "global_step": 170575, "epoch": 4061} {"train_loss": -7.002229690551758, "global_step": 170576, "epoch": 4061} {"train_loss": -7.052408218383789, "global_step": 170577, "epoch": 4061} {"train_loss": -7.042503833770752, "global_step": 170578, "epoch": 4061} {"train_loss": -6.925384521484375, "global_step": 170579, "epoch": 4061} {"train_loss": -6.919581890106201, "global_step": 170580, "epoch": 4061} {"train_loss": -7.127098083496094, "global_step": 170581, "epoch": 4061} {"train_loss": -7.0774664878845215, "global_step": 170582, "epoch": 4061} {"train_loss": -6.9053263664245605, "global_step": 170583, "epoch": 4061} {"train_loss": -7.034475803375244, "global_step": 170584, "epoch": 4061} {"train_loss": -6.985729217529297, "global_step": 170585, "epoch": 4061} {"train_loss": -6.996138095855713, "global_step": 170586, "epoch": 4061} {"train_loss": -7.009122848510742, "global_step": 170587, "epoch": 4061} {"train_loss": -6.950168609619141, "global_step": 170588, "epoch": 4061} {"train_loss": -7.038382053375244, "global_step": 170589, "epoch": 4061} {"train_loss": -6.995247840881348, "global_step": 170590, "epoch": 4061} {"train_loss": -6.955925464630127, "global_step": 170591, "epoch": 4061} {"train_loss": -7.023541450500488, "global_step": 170592, "epoch": 4061} {"train_loss": -6.933835983276367, "global_step": 170593, "epoch": 4061} {"train_loss": -7.028226375579834, "global_step": 170594, "epoch": 4061} {"train_loss": -7.098944664001465, "global_step": 170595, "epoch": 4061} {"train_loss": -6.994723320007324, "global_step": 170596, "epoch": 4061} {"train_loss": -7.075589179992676, "global_step": 170597, "epoch": 4061} {"train_loss": -7.048795700073242, "global_step": 170598, "epoch": 4061} {"train_loss": -6.958730697631836, "global_step": 170599, "epoch": 4061} {"train_loss": -7.024521827697754, "global_step": 170600, "epoch": 4061} {"train_loss": -7.022604942321777, "global_step": 170601, "epoch": 4061} {"train_loss": -6.964461326599121, "global_step": 170602, "epoch": 4061} {"train_loss": -6.999454373405094, "global_step": 170603, "epoch": 4061, "val_loss": 79790.109375} {"train_loss": -6.893991470336914, "global_step": 170604, "epoch": 4062} {"train_loss": -7.02539587020874, "global_step": 170605, "epoch": 4062} {"train_loss": -6.918222904205322, "global_step": 170606, "epoch": 4062} {"train_loss": -7.049664497375488, "global_step": 170607, "epoch": 4062} {"train_loss": -7.048966407775879, "global_step": 170608, "epoch": 4062} {"train_loss": -6.915258884429932, "global_step": 170609, "epoch": 4062} {"train_loss": -6.927350997924805, "global_step": 170610, "epoch": 4062} {"train_loss": -7.160878658294678, "global_step": 170611, "epoch": 4062} {"train_loss": -6.884579181671143, "global_step": 170612, "epoch": 4062} {"train_loss": -6.98900032043457, "global_step": 170613, "epoch": 4062} {"train_loss": -7.0473856925964355, "global_step": 170614, "epoch": 4062} {"train_loss": -7.009977340698242, "global_step": 170615, "epoch": 4062} {"train_loss": -7.055115222930908, "global_step": 170616, "epoch": 4062} {"train_loss": -6.986391067504883, "global_step": 170617, "epoch": 4062} {"train_loss": -6.987492561340332, "global_step": 170618, "epoch": 4062} {"train_loss": -7.145411968231201, "global_step": 170619, "epoch": 4062} {"train_loss": -7.069745063781738, "global_step": 170620, "epoch": 4062} {"train_loss": -7.13253927230835, "global_step": 170621, "epoch": 4062} {"train_loss": -7.091224670410156, "global_step": 170622, "epoch": 4062} {"train_loss": -7.111393928527832, "global_step": 170623, "epoch": 4062} {"train_loss": -6.9300737380981445, "global_step": 170624, "epoch": 4062} {"train_loss": -7.126011371612549, "global_step": 170625, "epoch": 4062} {"train_loss": -7.170464515686035, "global_step": 170626, "epoch": 4062} {"train_loss": -7.094498634338379, "global_step": 170627, "epoch": 4062} {"train_loss": -7.04534387588501, "global_step": 170628, "epoch": 4062} {"train_loss": -7.0577921867370605, "global_step": 170629, "epoch": 4062} {"train_loss": -7.043408393859863, "global_step": 170630, "epoch": 4062} {"train_loss": -6.932434558868408, "global_step": 170631, "epoch": 4062} {"train_loss": -7.03023624420166, "global_step": 170632, "epoch": 4062} {"train_loss": -7.134543418884277, "global_step": 170633, "epoch": 4062} {"train_loss": -7.0637922286987305, "global_step": 170634, "epoch": 4062} {"train_loss": -7.090517997741699, "global_step": 170635, "epoch": 4062} {"train_loss": -7.051321506500244, "global_step": 170636, "epoch": 4062} {"train_loss": -7.205692291259766, "global_step": 170637, "epoch": 4062} {"train_loss": -6.978361129760742, "global_step": 170638, "epoch": 4062} {"train_loss": -7.07667875289917, "global_step": 170639, "epoch": 4062} {"train_loss": -7.137095928192139, "global_step": 170640, "epoch": 4062} {"train_loss": -7.1199750900268555, "global_step": 170641, "epoch": 4062} {"train_loss": -7.142932415008545, "global_step": 170642, "epoch": 4062} {"train_loss": -7.229723930358887, "global_step": 170643, "epoch": 4062} {"train_loss": -7.001872539520264, "global_step": 170644, "epoch": 4062} {"train_loss": -7.049663941065471, "global_step": 170645, "epoch": 4062, "val_loss": 79715.5546875} {"train_loss": -6.949446678161621, "global_step": 170646, "epoch": 4063} {"train_loss": -7.192988395690918, "global_step": 170647, "epoch": 4063} {"train_loss": -7.03448486328125, "global_step": 170648, "epoch": 4063} {"train_loss": -7.191829681396484, "global_step": 170649, "epoch": 4063} {"train_loss": -7.109474182128906, "global_step": 170650, "epoch": 4063} {"train_loss": -7.052367210388184, "global_step": 170651, "epoch": 4063} {"train_loss": -7.131988525390625, "global_step": 170652, "epoch": 4063} {"train_loss": -7.153073310852051, "global_step": 170653, "epoch": 4063} {"train_loss": -6.9778337478637695, "global_step": 170654, "epoch": 4063} {"train_loss": -7.110172271728516, "global_step": 170655, "epoch": 4063} {"train_loss": -7.115487575531006, "global_step": 170656, "epoch": 4063} {"train_loss": -7.0537824630737305, "global_step": 170657, "epoch": 4063} {"train_loss": -7.032042026519775, "global_step": 170658, "epoch": 4063} {"train_loss": -6.989226341247559, "global_step": 170659, "epoch": 4063} {"train_loss": -7.07075834274292, "global_step": 170660, "epoch": 4063} {"train_loss": -7.072177886962891, "global_step": 170661, "epoch": 4063} {"train_loss": -7.0173749923706055, "global_step": 170662, "epoch": 4063} {"train_loss": -7.065530776977539, "global_step": 170663, "epoch": 4063} {"train_loss": -6.976006984710693, "global_step": 170664, "epoch": 4063} {"train_loss": -7.0330095291137695, "global_step": 170665, "epoch": 4063} {"train_loss": -6.979273796081543, "global_step": 170666, "epoch": 4063} {"train_loss": -7.039196968078613, "global_step": 170667, "epoch": 4063} {"train_loss": -6.998769283294678, "global_step": 170668, "epoch": 4063} {"train_loss": -7.066228866577148, "global_step": 170669, "epoch": 4063} {"train_loss": -7.064203262329102, "global_step": 170670, "epoch": 4063} {"train_loss": -7.175829887390137, "global_step": 170671, "epoch": 4063} {"train_loss": -7.062065124511719, "global_step": 170672, "epoch": 4063} {"train_loss": -7.143789291381836, "global_step": 170673, "epoch": 4063} {"train_loss": -7.078651428222656, "global_step": 170674, "epoch": 4063} {"train_loss": -7.118649959564209, "global_step": 170675, "epoch": 4063} {"train_loss": -7.014604568481445, "global_step": 170676, "epoch": 4063} {"train_loss": -7.1726884841918945, "global_step": 170677, "epoch": 4063} {"train_loss": -7.041569232940674, "global_step": 170678, "epoch": 4063} {"train_loss": -7.10764741897583, "global_step": 170679, "epoch": 4063} {"train_loss": -7.049597263336182, "global_step": 170680, "epoch": 4063} {"train_loss": -6.951378345489502, "global_step": 170681, "epoch": 4063} {"train_loss": -6.937804222106934, "global_step": 170682, "epoch": 4063} {"train_loss": -7.06088924407959, "global_step": 170683, "epoch": 4063} {"train_loss": -7.027536869049072, "global_step": 170684, "epoch": 4063} {"train_loss": -6.929705619812012, "global_step": 170685, "epoch": 4063} {"train_loss": -7.184641361236572, "global_step": 170686, "epoch": 4063} {"train_loss": -7.062364907491775, "global_step": 170687, "epoch": 4063, "val_loss": 80149.2109375} {"train_loss": -7.049337387084961, "global_step": 170688, "epoch": 4064} {"train_loss": -7.055507659912109, "global_step": 170689, "epoch": 4064} {"train_loss": -7.007165908813477, "global_step": 170690, "epoch": 4064} {"train_loss": -7.068784713745117, "global_step": 170691, "epoch": 4064} {"train_loss": -7.150582790374756, "global_step": 170692, "epoch": 4064} {"train_loss": -7.301531791687012, "global_step": 170693, "epoch": 4064} {"train_loss": -6.932864189147949, "global_step": 170694, "epoch": 4064} {"train_loss": -7.184405326843262, "global_step": 170695, "epoch": 4064} {"train_loss": -7.161097049713135, "global_step": 170696, "epoch": 4064} {"train_loss": -7.130248546600342, "global_step": 170697, "epoch": 4064} {"train_loss": -7.116665840148926, "global_step": 170698, "epoch": 4064} {"train_loss": -7.114575386047363, "global_step": 170699, "epoch": 4064} {"train_loss": -7.113237380981445, "global_step": 170700, "epoch": 4064} {"train_loss": -7.156033515930176, "global_step": 170701, "epoch": 4064} {"train_loss": -7.082386493682861, "global_step": 170702, "epoch": 4064} {"train_loss": -7.0394134521484375, "global_step": 170703, "epoch": 4064} {"train_loss": -7.1241350173950195, "global_step": 170704, "epoch": 4064} {"train_loss": -7.12406063079834, "global_step": 170705, "epoch": 4064} {"train_loss": -7.166024684906006, "global_step": 170706, "epoch": 4064} {"train_loss": -7.041188716888428, "global_step": 170707, "epoch": 4064} {"train_loss": -7.09572696685791, "global_step": 170708, "epoch": 4064} {"train_loss": -7.065131664276123, "global_step": 170709, "epoch": 4064} {"train_loss": -7.127830505371094, "global_step": 170710, "epoch": 4064} {"train_loss": -7.138683795928955, "global_step": 170711, "epoch": 4064} {"train_loss": -7.042004585266113, "global_step": 170712, "epoch": 4064} {"train_loss": -7.198990821838379, "global_step": 170713, "epoch": 4064} {"train_loss": -6.900868892669678, "global_step": 170714, "epoch": 4064} {"train_loss": -7.109612464904785, "global_step": 170715, "epoch": 4064} {"train_loss": -7.010865211486816, "global_step": 170716, "epoch": 4064} {"train_loss": -7.0223388671875, "global_step": 170717, "epoch": 4064} {"train_loss": -6.9297308921813965, "global_step": 170718, "epoch": 4064} {"train_loss": -6.929340362548828, "global_step": 170719, "epoch": 4064} {"train_loss": -7.147575378417969, "global_step": 170720, "epoch": 4064} {"train_loss": -6.982356071472168, "global_step": 170721, "epoch": 4064} {"train_loss": -7.131959915161133, "global_step": 170722, "epoch": 4064} {"train_loss": -7.014329433441162, "global_step": 170723, "epoch": 4064} {"train_loss": -7.107982635498047, "global_step": 170724, "epoch": 4064} {"train_loss": -7.172738075256348, "global_step": 170725, "epoch": 4064} {"train_loss": -7.114821434020996, "global_step": 170726, "epoch": 4064} {"train_loss": -7.128798484802246, "global_step": 170727, "epoch": 4064} {"train_loss": -6.98077917098999, "global_step": 170728, "epoch": 4064} {"train_loss": -7.084408317293439, "global_step": 170729, "epoch": 4064, "val_loss": 80073.734375} {"train_loss": -7.1305742263793945, "global_step": 170730, "epoch": 4065} {"train_loss": -7.137938499450684, "global_step": 170731, "epoch": 4065} {"train_loss": -7.095155239105225, "global_step": 170732, "epoch": 4065} {"train_loss": -7.119390487670898, "global_step": 170733, "epoch": 4065} {"train_loss": -6.996722221374512, "global_step": 170734, "epoch": 4065} {"train_loss": -7.042688369750977, "global_step": 170735, "epoch": 4065} {"train_loss": -6.9839630126953125, "global_step": 170736, "epoch": 4065} {"train_loss": -6.973443031311035, "global_step": 170737, "epoch": 4065} {"train_loss": -7.115904808044434, "global_step": 170738, "epoch": 4065} {"train_loss": -7.075789451599121, "global_step": 170739, "epoch": 4065} {"train_loss": -7.121811866760254, "global_step": 170740, "epoch": 4065} {"train_loss": -7.020426273345947, "global_step": 170741, "epoch": 4065} {"train_loss": -7.08186149597168, "global_step": 170742, "epoch": 4065} {"train_loss": -7.086219310760498, "global_step": 170743, "epoch": 4065} {"train_loss": -7.13181209564209, "global_step": 170744, "epoch": 4065} {"train_loss": -7.099721908569336, "global_step": 170745, "epoch": 4065} {"train_loss": -7.1079301834106445, "global_step": 170746, "epoch": 4065} {"train_loss": -7.066953182220459, "global_step": 170747, "epoch": 4065} {"train_loss": -7.055953025817871, "global_step": 170748, "epoch": 4065} {"train_loss": -7.112309455871582, "global_step": 170749, "epoch": 4065} {"train_loss": -7.166440010070801, "global_step": 170750, "epoch": 4065} {"train_loss": -6.996135711669922, "global_step": 170751, "epoch": 4065} {"train_loss": -7.087383270263672, "global_step": 170752, "epoch": 4065} {"train_loss": -7.084234714508057, "global_step": 170753, "epoch": 4065} {"train_loss": -7.080842971801758, "global_step": 170754, "epoch": 4065} {"train_loss": -7.127620220184326, "global_step": 170755, "epoch": 4065} {"train_loss": -7.076357364654541, "global_step": 170756, "epoch": 4065} {"train_loss": -6.9589715003967285, "global_step": 170757, "epoch": 4065} {"train_loss": -7.065764904022217, "global_step": 170758, "epoch": 4065} {"train_loss": -7.113519191741943, "global_step": 170759, "epoch": 4065} {"train_loss": -7.020776271820068, "global_step": 170760, "epoch": 4065} {"train_loss": -7.114449501037598, "global_step": 170761, "epoch": 4065} {"train_loss": -6.951101779937744, "global_step": 170762, "epoch": 4065} {"train_loss": -7.033236503601074, "global_step": 170763, "epoch": 4065} {"train_loss": -7.039190292358398, "global_step": 170764, "epoch": 4065} {"train_loss": -7.012637138366699, "global_step": 170765, "epoch": 4065} {"train_loss": -6.99753475189209, "global_step": 170766, "epoch": 4065} {"train_loss": -6.8792009353637695, "global_step": 170767, "epoch": 4065} {"train_loss": -7.108258247375488, "global_step": 170768, "epoch": 4065} {"train_loss": -7.038552284240723, "global_step": 170769, "epoch": 4065} {"train_loss": -6.969754219055176, "global_step": 170770, "epoch": 4065} {"train_loss": -7.061328422455561, "global_step": 170771, "epoch": 4065, "val_loss": 79889.515625} {"train_loss": -6.944109916687012, "global_step": 170772, "epoch": 4066} {"train_loss": -7.0569047927856445, "global_step": 170773, "epoch": 4066} {"train_loss": -6.971627235412598, "global_step": 170774, "epoch": 4066} {"train_loss": -7.069048881530762, "global_step": 170775, "epoch": 4066} {"train_loss": -7.055533409118652, "global_step": 170776, "epoch": 4066} {"train_loss": -7.2314958572387695, "global_step": 170777, "epoch": 4066} {"train_loss": -6.995161056518555, "global_step": 170778, "epoch": 4066} {"train_loss": -7.071444988250732, "global_step": 170779, "epoch": 4066} {"train_loss": -7.054568290710449, "global_step": 170780, "epoch": 4066} {"train_loss": -6.946955680847168, "global_step": 170781, "epoch": 4066} {"train_loss": -7.1445817947387695, "global_step": 170782, "epoch": 4066} {"train_loss": -6.913401126861572, "global_step": 170783, "epoch": 4066} {"train_loss": -7.053348541259766, "global_step": 170784, "epoch": 4066} {"train_loss": -6.988602638244629, "global_step": 170785, "epoch": 4066} {"train_loss": -7.026259422302246, "global_step": 170786, "epoch": 4066} {"train_loss": -6.95449686050415, "global_step": 170787, "epoch": 4066} {"train_loss": -7.033119201660156, "global_step": 170788, "epoch": 4066} {"train_loss": -7.1220879554748535, "global_step": 170789, "epoch": 4066} {"train_loss": -6.972599029541016, "global_step": 170790, "epoch": 4066} {"train_loss": -6.994656562805176, "global_step": 170791, "epoch": 4066} {"train_loss": -7.007208347320557, "global_step": 170792, "epoch": 4066} {"train_loss": -6.920563220977783, "global_step": 170793, "epoch": 4066} {"train_loss": -6.926469802856445, "global_step": 170794, "epoch": 4066} {"train_loss": -7.021202564239502, "global_step": 170795, "epoch": 4066} {"train_loss": -7.1551666259765625, "global_step": 170796, "epoch": 4066} {"train_loss": -6.831737518310547, "global_step": 170797, "epoch": 4066} {"train_loss": -7.062129020690918, "global_step": 170798, "epoch": 4066} {"train_loss": -6.980654239654541, "global_step": 170799, "epoch": 4066} {"train_loss": -6.938333034515381, "global_step": 170800, "epoch": 4066} {"train_loss": -7.047142028808594, "global_step": 170801, "epoch": 4066} {"train_loss": -6.986583232879639, "global_step": 170802, "epoch": 4066} {"train_loss": -7.016570091247559, "global_step": 170803, "epoch": 4066} {"train_loss": -6.9587554931640625, "global_step": 170804, "epoch": 4066} {"train_loss": -6.946936130523682, "global_step": 170805, "epoch": 4066} {"train_loss": -6.9989542961120605, "global_step": 170806, "epoch": 4066} {"train_loss": -6.989484786987305, "global_step": 170807, "epoch": 4066} {"train_loss": -6.90263557434082, "global_step": 170808, "epoch": 4066} {"train_loss": -6.955718994140625, "global_step": 170809, "epoch": 4066} {"train_loss": -7.025282859802246, "global_step": 170810, "epoch": 4066} {"train_loss": -6.95463228225708, "global_step": 170811, "epoch": 4066} {"train_loss": -7.0470733642578125, "global_step": 170812, "epoch": 4066} {"train_loss": -7.00731551079523, "global_step": 170813, "epoch": 4066, "val_loss": 80128.015625} {"train_loss": -7.013209342956543, "global_step": 170814, "epoch": 4067} {"train_loss": -6.919422626495361, "global_step": 170815, "epoch": 4067} {"train_loss": -6.945103645324707, "global_step": 170816, "epoch": 4067} {"train_loss": -7.073972702026367, "global_step": 170817, "epoch": 4067} {"train_loss": -7.101764678955078, "global_step": 170818, "epoch": 4067} {"train_loss": -7.087956428527832, "global_step": 170819, "epoch": 4067} {"train_loss": -7.114956855773926, "global_step": 170820, "epoch": 4067} {"train_loss": -7.108205795288086, "global_step": 170821, "epoch": 4067} {"train_loss": -7.071497917175293, "global_step": 170822, "epoch": 4067} {"train_loss": -7.046219825744629, "global_step": 170823, "epoch": 4067} {"train_loss": -7.208024978637695, "global_step": 170824, "epoch": 4067} {"train_loss": -6.976487159729004, "global_step": 170825, "epoch": 4067} {"train_loss": -7.114113807678223, "global_step": 170826, "epoch": 4067} {"train_loss": -7.020805835723877, "global_step": 170827, "epoch": 4067} {"train_loss": -7.149219512939453, "global_step": 170828, "epoch": 4067} {"train_loss": -7.120812892913818, "global_step": 170829, "epoch": 4067} {"train_loss": -7.127756595611572, "global_step": 170830, "epoch": 4067} {"train_loss": -7.037780284881592, "global_step": 170831, "epoch": 4067} {"train_loss": -7.033163070678711, "global_step": 170832, "epoch": 4067} {"train_loss": -7.071981430053711, "global_step": 170833, "epoch": 4067} {"train_loss": -7.138485908508301, "global_step": 170834, "epoch": 4067} {"train_loss": -6.978707313537598, "global_step": 170835, "epoch": 4067} {"train_loss": -7.079917907714844, "global_step": 170836, "epoch": 4067} {"train_loss": -7.060961723327637, "global_step": 170837, "epoch": 4067} {"train_loss": -6.915117263793945, "global_step": 170838, "epoch": 4067} {"train_loss": -7.020643711090088, "global_step": 170839, "epoch": 4067} {"train_loss": -6.9828667640686035, "global_step": 170840, "epoch": 4067} {"train_loss": -7.021812438964844, "global_step": 170841, "epoch": 4067} {"train_loss": -6.804539203643799, "global_step": 170842, "epoch": 4067} {"train_loss": -7.110300064086914, "global_step": 170843, "epoch": 4067} {"train_loss": -6.991961479187012, "global_step": 170844, "epoch": 4067} {"train_loss": -7.000388145446777, "global_step": 170845, "epoch": 4067} {"train_loss": -7.001753807067871, "global_step": 170846, "epoch": 4067} {"train_loss": -6.918113708496094, "global_step": 170847, "epoch": 4067} {"train_loss": -6.89312744140625, "global_step": 170848, "epoch": 4067} {"train_loss": -7.044007301330566, "global_step": 170849, "epoch": 4067} {"train_loss": -6.914153099060059, "global_step": 170850, "epoch": 4067} {"train_loss": -6.979088306427002, "global_step": 170851, "epoch": 4067} {"train_loss": -6.9927449226379395, "global_step": 170852, "epoch": 4067} {"train_loss": -7.059413433074951, "global_step": 170853, "epoch": 4067} {"train_loss": -6.929690837860107, "global_step": 170854, "epoch": 4067} {"train_loss": -7.03070676894415, "global_step": 170855, "epoch": 4067, "val_loss": 80082.46875} {"train_loss": -6.998082160949707, "global_step": 170856, "epoch": 4068} {"train_loss": -7.149575233459473, "global_step": 170857, "epoch": 4068} {"train_loss": -6.936854362487793, "global_step": 170858, "epoch": 4068} {"train_loss": -7.0418243408203125, "global_step": 170859, "epoch": 4068} {"train_loss": -7.143611431121826, "global_step": 170860, "epoch": 4068} {"train_loss": -7.036325454711914, "global_step": 170861, "epoch": 4068} {"train_loss": -6.935575485229492, "global_step": 170862, "epoch": 4068} {"train_loss": -7.0595903396606445, "global_step": 170863, "epoch": 4068} {"train_loss": -7.048137664794922, "global_step": 170864, "epoch": 4068} {"train_loss": -7.072598457336426, "global_step": 170865, "epoch": 4068} {"train_loss": -7.152339458465576, "global_step": 170866, "epoch": 4068} {"train_loss": -7.17605447769165, "global_step": 170867, "epoch": 4068} {"train_loss": -7.084238052368164, "global_step": 170868, "epoch": 4068} {"train_loss": -6.969381809234619, "global_step": 170869, "epoch": 4068} {"train_loss": -7.085262298583984, "global_step": 170870, "epoch": 4068} {"train_loss": -7.086341857910156, "global_step": 170871, "epoch": 4068} {"train_loss": -7.083622932434082, "global_step": 170872, "epoch": 4068} {"train_loss": -7.147966384887695, "global_step": 170873, "epoch": 4068} {"train_loss": -7.143818378448486, "global_step": 170874, "epoch": 4068} {"train_loss": -7.1715497970581055, "global_step": 170875, "epoch": 4068} {"train_loss": -7.205975532531738, "global_step": 170876, "epoch": 4068} {"train_loss": -7.06735897064209, "global_step": 170877, "epoch": 4068} {"train_loss": -7.059866905212402, "global_step": 170878, "epoch": 4068} {"train_loss": -7.0033135414123535, "global_step": 170879, "epoch": 4068} {"train_loss": -6.949148178100586, "global_step": 170880, "epoch": 4068} {"train_loss": -7.175519943237305, "global_step": 170881, "epoch": 4068} {"train_loss": -7.132177829742432, "global_step": 170882, "epoch": 4068} {"train_loss": -7.0672688484191895, "global_step": 170883, "epoch": 4068} {"train_loss": -7.039608001708984, "global_step": 170884, "epoch": 4068} {"train_loss": -7.088681221008301, "global_step": 170885, "epoch": 4068} {"train_loss": -7.0375165939331055, "global_step": 170886, "epoch": 4068} {"train_loss": -7.071403503417969, "global_step": 170887, "epoch": 4068} {"train_loss": -7.097599983215332, "global_step": 170888, "epoch": 4068} {"train_loss": -7.16963005065918, "global_step": 170889, "epoch": 4068} {"train_loss": -6.858614444732666, "global_step": 170890, "epoch": 4068} {"train_loss": -6.9538750648498535, "global_step": 170891, "epoch": 4068} {"train_loss": -7.028292655944824, "global_step": 170892, "epoch": 4068} {"train_loss": -6.965871334075928, "global_step": 170893, "epoch": 4068} {"train_loss": -6.954387664794922, "global_step": 170894, "epoch": 4068} {"train_loss": -6.99996280670166, "global_step": 170895, "epoch": 4068} {"train_loss": -6.845970153808594, "global_step": 170896, "epoch": 4068} {"train_loss": -7.053502378009615, "global_step": 170897, "epoch": 4068, "val_loss": 79864.171875} {"train_loss": -7.089133262634277, "global_step": 170898, "epoch": 4069} {"train_loss": -6.888466835021973, "global_step": 170899, "epoch": 4069} {"train_loss": -7.052657127380371, "global_step": 170900, "epoch": 4069} {"train_loss": -6.962556838989258, "global_step": 170901, "epoch": 4069} {"train_loss": -7.016955375671387, "global_step": 170902, "epoch": 4069} {"train_loss": -6.934299468994141, "global_step": 170903, "epoch": 4069} {"train_loss": -7.00625467300415, "global_step": 170904, "epoch": 4069} {"train_loss": -7.0548295974731445, "global_step": 170905, "epoch": 4069} {"train_loss": -6.951611518859863, "global_step": 170906, "epoch": 4069} {"train_loss": -7.05653190612793, "global_step": 170907, "epoch": 4069} {"train_loss": -7.166783332824707, "global_step": 170908, "epoch": 4069} {"train_loss": -7.019301414489746, "global_step": 170909, "epoch": 4069} {"train_loss": -7.039117336273193, "global_step": 170910, "epoch": 4069} {"train_loss": -7.030463218688965, "global_step": 170911, "epoch": 4069} {"train_loss": -7.073947429656982, "global_step": 170912, "epoch": 4069} {"train_loss": -7.023840427398682, "global_step": 170913, "epoch": 4069} {"train_loss": -7.091041088104248, "global_step": 170914, "epoch": 4069} {"train_loss": -7.078972816467285, "global_step": 170915, "epoch": 4069} {"train_loss": -7.015213966369629, "global_step": 170916, "epoch": 4069} {"train_loss": -7.028650283813477, "global_step": 170917, "epoch": 4069} {"train_loss": -6.990304946899414, "global_step": 170918, "epoch": 4069} {"train_loss": -7.112953186035156, "global_step": 170919, "epoch": 4069} {"train_loss": -7.185362815856934, "global_step": 170920, "epoch": 4069} {"train_loss": -6.885550022125244, "global_step": 170921, "epoch": 4069} {"train_loss": -7.056051731109619, "global_step": 170922, "epoch": 4069} {"train_loss": -7.15757942199707, "global_step": 170923, "epoch": 4069} {"train_loss": -7.120811462402344, "global_step": 170924, "epoch": 4069} {"train_loss": -7.128705978393555, "global_step": 170925, "epoch": 4069} {"train_loss": -7.10984992980957, "global_step": 170926, "epoch": 4069} {"train_loss": -7.039103984832764, "global_step": 170927, "epoch": 4069} {"train_loss": -7.0447492599487305, "global_step": 170928, "epoch": 4069} {"train_loss": -7.072197437286377, "global_step": 170929, "epoch": 4069} {"train_loss": -6.969475746154785, "global_step": 170930, "epoch": 4069} {"train_loss": -7.151725769042969, "global_step": 170931, "epoch": 4069} {"train_loss": -7.132109642028809, "global_step": 170932, "epoch": 4069} {"train_loss": -7.116180896759033, "global_step": 170933, "epoch": 4069} {"train_loss": -6.9537672996521, "global_step": 170934, "epoch": 4069} {"train_loss": -7.124532699584961, "global_step": 170935, "epoch": 4069} {"train_loss": -7.032370090484619, "global_step": 170936, "epoch": 4069} {"train_loss": -6.998323917388916, "global_step": 170937, "epoch": 4069} {"train_loss": -7.107970237731934, "global_step": 170938, "epoch": 4069} {"train_loss": -7.053248507635934, "global_step": 170939, "epoch": 4069, "val_loss": 80023.875} {"train_loss": -7.096460342407227, "global_step": 170940, "epoch": 4070} {"train_loss": -7.083833694458008, "global_step": 170941, "epoch": 4070} {"train_loss": -7.04378604888916, "global_step": 170942, "epoch": 4070} {"train_loss": -7.003809452056885, "global_step": 170943, "epoch": 4070} {"train_loss": -6.948940277099609, "global_step": 170944, "epoch": 4070} {"train_loss": -6.947279453277588, "global_step": 170945, "epoch": 4070} {"train_loss": -7.051031112670898, "global_step": 170946, "epoch": 4070} {"train_loss": -7.0141706466674805, "global_step": 170947, "epoch": 4070} {"train_loss": -7.033305644989014, "global_step": 170948, "epoch": 4070} {"train_loss": -7.007589340209961, "global_step": 170949, "epoch": 4070} {"train_loss": -7.022754669189453, "global_step": 170950, "epoch": 4070} {"train_loss": -7.12788200378418, "global_step": 170951, "epoch": 4070} {"train_loss": -6.926568508148193, "global_step": 170952, "epoch": 4070} {"train_loss": -6.894247055053711, "global_step": 170953, "epoch": 4070} {"train_loss": -7.032726287841797, "global_step": 170954, "epoch": 4070} {"train_loss": -7.006155490875244, "global_step": 170955, "epoch": 4070} {"train_loss": -7.101572513580322, "global_step": 170956, "epoch": 4070} {"train_loss": -7.002890110015869, "global_step": 170957, "epoch": 4070} {"train_loss": -7.137662410736084, "global_step": 170958, "epoch": 4070} {"train_loss": -7.088891983032227, "global_step": 170959, "epoch": 4070} {"train_loss": -7.0346293449401855, "global_step": 170960, "epoch": 4070} {"train_loss": -6.96303129196167, "global_step": 170961, "epoch": 4070} {"train_loss": -6.977960109710693, "global_step": 170962, "epoch": 4070} {"train_loss": -7.104111671447754, "global_step": 170963, "epoch": 4070} {"train_loss": -7.0547261238098145, "global_step": 170964, "epoch": 4070} {"train_loss": -6.966546535491943, "global_step": 170965, "epoch": 4070} {"train_loss": -6.928136348724365, "global_step": 170966, "epoch": 4070} {"train_loss": -6.923179626464844, "global_step": 170967, "epoch": 4070} {"train_loss": -6.989566802978516, "global_step": 170968, "epoch": 4070} {"train_loss": -6.986665725708008, "global_step": 170969, "epoch": 4070} {"train_loss": -6.931346893310547, "global_step": 170970, "epoch": 4070} {"train_loss": -6.9969258308410645, "global_step": 170971, "epoch": 4070} {"train_loss": -6.910904884338379, "global_step": 170972, "epoch": 4070} {"train_loss": -6.961518287658691, "global_step": 170973, "epoch": 4070} {"train_loss": -7.0023627281188965, "global_step": 170974, "epoch": 4070} {"train_loss": -7.089203834533691, "global_step": 170975, "epoch": 4070} {"train_loss": -7.014452934265137, "global_step": 170976, "epoch": 4070} {"train_loss": -6.9881062507629395, "global_step": 170977, "epoch": 4070} {"train_loss": -7.149809837341309, "global_step": 170978, "epoch": 4070} {"train_loss": -7.082935333251953, "global_step": 170979, "epoch": 4070} {"train_loss": -7.033760070800781, "global_step": 170980, "epoch": 4070} {"train_loss": -7.017567532403128, "global_step": 170981, "epoch": 4070, "val_loss": 79974.0859375} {"train_loss": -7.033822059631348, "global_step": 170982, "epoch": 4071} {"train_loss": -6.969010353088379, "global_step": 170983, "epoch": 4071} {"train_loss": -6.940523147583008, "global_step": 170984, "epoch": 4071} {"train_loss": -7.158748626708984, "global_step": 170985, "epoch": 4071} {"train_loss": -6.991628646850586, "global_step": 170986, "epoch": 4071} {"train_loss": -6.962546348571777, "global_step": 170987, "epoch": 4071} {"train_loss": -7.078806400299072, "global_step": 170988, "epoch": 4071} {"train_loss": -7.033700942993164, "global_step": 170989, "epoch": 4071} {"train_loss": -7.004350662231445, "global_step": 170990, "epoch": 4071} {"train_loss": -7.125854969024658, "global_step": 170991, "epoch": 4071} {"train_loss": -6.981435775756836, "global_step": 170992, "epoch": 4071} {"train_loss": -7.071911811828613, "global_step": 170993, "epoch": 4071} {"train_loss": -7.171243667602539, "global_step": 170994, "epoch": 4071} {"train_loss": -7.12044620513916, "global_step": 170995, "epoch": 4071} {"train_loss": -7.191363334655762, "global_step": 170996, "epoch": 4071} {"train_loss": -7.2255706787109375, "global_step": 170997, "epoch": 4071} {"train_loss": -7.189166069030762, "global_step": 170998, "epoch": 4071} {"train_loss": -7.146230697631836, "global_step": 170999, "epoch": 4071} {"train_loss": -7.1543965339660645, "global_step": 171000, "epoch": 4071} {"train_loss": -7.054773330688477, "global_step": 171001, "epoch": 4071} {"train_loss": -6.9971208572387695, "global_step": 171002, "epoch": 4071} {"train_loss": -7.058474540710449, "global_step": 171003, "epoch": 4071} {"train_loss": -7.0431108474731445, "global_step": 171004, "epoch": 4071} {"train_loss": -7.104118347167969, "global_step": 171005, "epoch": 4071} {"train_loss": -6.991722106933594, "global_step": 171006, "epoch": 4071} {"train_loss": -6.939596176147461, "global_step": 171007, "epoch": 4071} {"train_loss": -7.119324684143066, "global_step": 171008, "epoch": 4071} {"train_loss": -7.104982376098633, "global_step": 171009, "epoch": 4071} {"train_loss": -7.157474517822266, "global_step": 171010, "epoch": 4071} {"train_loss": -7.145114898681641, "global_step": 171011, "epoch": 4071} {"train_loss": -7.0440473556518555, "global_step": 171012, "epoch": 4071} {"train_loss": -7.027344703674316, "global_step": 171013, "epoch": 4071} {"train_loss": -7.00222110748291, "global_step": 171014, "epoch": 4071} {"train_loss": -7.14752721786499, "global_step": 171015, "epoch": 4071} {"train_loss": -7.020053863525391, "global_step": 171016, "epoch": 4071} {"train_loss": -7.045881271362305, "global_step": 171017, "epoch": 4071} {"train_loss": -6.956215858459473, "global_step": 171018, "epoch": 4071} {"train_loss": -6.936694145202637, "global_step": 171019, "epoch": 4071} {"train_loss": -7.082143306732178, "global_step": 171020, "epoch": 4071} {"train_loss": -6.958012580871582, "global_step": 171021, "epoch": 4071} {"train_loss": -6.749012470245361, "global_step": 171022, "epoch": 4071} {"train_loss": -7.053174779528663, "global_step": 171023, "epoch": 4071, "val_loss": 79849.46875} {"train_loss": -6.916177749633789, "global_step": 171024, "epoch": 4072} {"train_loss": -6.86013126373291, "global_step": 171025, "epoch": 4072} {"train_loss": -7.026649475097656, "global_step": 171026, "epoch": 4072} {"train_loss": -6.822976112365723, "global_step": 171027, "epoch": 4072} {"train_loss": -6.977546691894531, "global_step": 171028, "epoch": 4072} {"train_loss": -6.965299606323242, "global_step": 171029, "epoch": 4072} {"train_loss": -6.887395858764648, "global_step": 171030, "epoch": 4072} {"train_loss": -7.128286361694336, "global_step": 171031, "epoch": 4072} {"train_loss": -6.961237907409668, "global_step": 171032, "epoch": 4072} {"train_loss": -6.924175262451172, "global_step": 171033, "epoch": 4072} {"train_loss": -6.945402145385742, "global_step": 171034, "epoch": 4072} {"train_loss": -7.041085243225098, "global_step": 171035, "epoch": 4072} {"train_loss": -7.017665863037109, "global_step": 171036, "epoch": 4072} {"train_loss": -6.980367660522461, "global_step": 171037, "epoch": 4072} {"train_loss": -7.065562725067139, "global_step": 171038, "epoch": 4072} {"train_loss": -6.904563903808594, "global_step": 171039, "epoch": 4072} {"train_loss": -7.082549095153809, "global_step": 171040, "epoch": 4072} {"train_loss": -7.048947334289551, "global_step": 171041, "epoch": 4072} {"train_loss": -7.002717018127441, "global_step": 171042, "epoch": 4072} {"train_loss": -6.9769415855407715, "global_step": 171043, "epoch": 4072} {"train_loss": -6.969163417816162, "global_step": 171044, "epoch": 4072} {"train_loss": -7.0784592628479, "global_step": 171045, "epoch": 4072} {"train_loss": -6.966946125030518, "global_step": 171046, "epoch": 4072} {"train_loss": -7.031300067901611, "global_step": 171047, "epoch": 4072} {"train_loss": -7.094381332397461, "global_step": 171048, "epoch": 4072} {"train_loss": -6.974766731262207, "global_step": 171049, "epoch": 4072} {"train_loss": -7.099214553833008, "global_step": 171050, "epoch": 4072} {"train_loss": -7.041496276855469, "global_step": 171051, "epoch": 4072} {"train_loss": -7.140769958496094, "global_step": 171052, "epoch": 4072} {"train_loss": -7.145514488220215, "global_step": 171053, "epoch": 4072} {"train_loss": -7.042441368103027, "global_step": 171054, "epoch": 4072} {"train_loss": -7.131697654724121, "global_step": 171055, "epoch": 4072} {"train_loss": -6.896010398864746, "global_step": 171056, "epoch": 4072} {"train_loss": -7.067173957824707, "global_step": 171057, "epoch": 4072} {"train_loss": -7.138619422912598, "global_step": 171058, "epoch": 4072} {"train_loss": -6.984359264373779, "global_step": 171059, "epoch": 4072} {"train_loss": -6.957167625427246, "global_step": 171060, "epoch": 4072} {"train_loss": -7.042357444763184, "global_step": 171061, "epoch": 4072} {"train_loss": -6.976289749145508, "global_step": 171062, "epoch": 4072} {"train_loss": -6.995096683502197, "global_step": 171063, "epoch": 4072} {"train_loss": -7.067787170410156, "global_step": 171064, "epoch": 4072} {"train_loss": -7.006648018246605, "global_step": 171065, "epoch": 4072, "val_loss": 79821.3359375} {"train_loss": -7.0316925048828125, "global_step": 171066, "epoch": 4073} {"train_loss": -7.091268539428711, "global_step": 171067, "epoch": 4073} {"train_loss": -7.041194915771484, "global_step": 171068, "epoch": 4073} {"train_loss": -6.996771812438965, "global_step": 171069, "epoch": 4073} {"train_loss": -6.960253715515137, "global_step": 171070, "epoch": 4073} {"train_loss": -7.052306652069092, "global_step": 171071, "epoch": 4073} {"train_loss": -7.0666680335998535, "global_step": 171072, "epoch": 4073} {"train_loss": -6.9220709800720215, "global_step": 171073, "epoch": 4073} {"train_loss": -6.995813846588135, "global_step": 171074, "epoch": 4073} {"train_loss": -7.060293197631836, "global_step": 171075, "epoch": 4073} {"train_loss": -7.014529228210449, "global_step": 171076, "epoch": 4073} {"train_loss": -7.033267974853516, "global_step": 171077, "epoch": 4073} {"train_loss": -6.960986137390137, "global_step": 171078, "epoch": 4073} {"train_loss": -6.91888427734375, "global_step": 171079, "epoch": 4073} {"train_loss": -7.17111349105835, "global_step": 171080, "epoch": 4073} {"train_loss": -6.812882423400879, "global_step": 171081, "epoch": 4073} {"train_loss": -6.934618949890137, "global_step": 171082, "epoch": 4073} {"train_loss": -6.9202046394348145, "global_step": 171083, "epoch": 4073} {"train_loss": -6.9601850509643555, "global_step": 171084, "epoch": 4073} {"train_loss": -7.115239143371582, "global_step": 171085, "epoch": 4073} {"train_loss": -6.971941947937012, "global_step": 171086, "epoch": 4073} {"train_loss": -7.073117256164551, "global_step": 171087, "epoch": 4073} {"train_loss": -6.917575836181641, "global_step": 171088, "epoch": 4073} {"train_loss": -7.02386474609375, "global_step": 171089, "epoch": 4073} {"train_loss": -7.039843559265137, "global_step": 171090, "epoch": 4073} {"train_loss": -6.981328964233398, "global_step": 171091, "epoch": 4073} {"train_loss": -7.072841644287109, "global_step": 171092, "epoch": 4073} {"train_loss": -6.959621429443359, "global_step": 171093, "epoch": 4073} {"train_loss": -6.931090831756592, "global_step": 171094, "epoch": 4073} {"train_loss": -7.001349925994873, "global_step": 171095, "epoch": 4073} {"train_loss": -7.004149913787842, "global_step": 171096, "epoch": 4073} {"train_loss": -6.954030990600586, "global_step": 171097, "epoch": 4073} {"train_loss": -6.929934501647949, "global_step": 171098, "epoch": 4073} {"train_loss": -6.993515968322754, "global_step": 171099, "epoch": 4073} {"train_loss": -6.8182692527771, "global_step": 171100, "epoch": 4073} {"train_loss": -6.936669826507568, "global_step": 171101, "epoch": 4073} {"train_loss": -6.807788848876953, "global_step": 171102, "epoch": 4073} {"train_loss": -6.9595794677734375, "global_step": 171103, "epoch": 4073} {"train_loss": -6.829636573791504, "global_step": 171104, "epoch": 4073} {"train_loss": -6.9438042640686035, "global_step": 171105, "epoch": 4073} {"train_loss": -6.943361759185791, "global_step": 171106, "epoch": 4073} {"train_loss": -6.975805203119914, "global_step": 171107, "epoch": 4073, "val_loss": 79950.859375} {"train_loss": -7.043264389038086, "global_step": 171108, "epoch": 4074} {"train_loss": -6.965196132659912, "global_step": 171109, "epoch": 4074} {"train_loss": -6.936822414398193, "global_step": 171110, "epoch": 4074} {"train_loss": -6.904858112335205, "global_step": 171111, "epoch": 4074} {"train_loss": -7.109445095062256, "global_step": 171112, "epoch": 4074} {"train_loss": -6.996776580810547, "global_step": 171113, "epoch": 4074} {"train_loss": -7.044224262237549, "global_step": 171114, "epoch": 4074} {"train_loss": -6.988722324371338, "global_step": 171115, "epoch": 4074} {"train_loss": -6.9075846672058105, "global_step": 171116, "epoch": 4074} {"train_loss": -7.031500339508057, "global_step": 171117, "epoch": 4074} {"train_loss": -7.060670852661133, "global_step": 171118, "epoch": 4074} {"train_loss": -7.0745038986206055, "global_step": 171119, "epoch": 4074} {"train_loss": -6.91947078704834, "global_step": 171120, "epoch": 4074} {"train_loss": -7.019322872161865, "global_step": 171121, "epoch": 4074} {"train_loss": -7.146294593811035, "global_step": 171122, "epoch": 4074} {"train_loss": -7.096906661987305, "global_step": 171123, "epoch": 4074} {"train_loss": -7.073812961578369, "global_step": 171124, "epoch": 4074} {"train_loss": -7.04250955581665, "global_step": 171125, "epoch": 4074} {"train_loss": -7.0063371658325195, "global_step": 171126, "epoch": 4074} {"train_loss": -7.109355926513672, "global_step": 171127, "epoch": 4074} {"train_loss": -7.010861873626709, "global_step": 171128, "epoch": 4074} {"train_loss": -7.043362617492676, "global_step": 171129, "epoch": 4074} {"train_loss": -6.9326252937316895, "global_step": 171130, "epoch": 4074} {"train_loss": -7.088709831237793, "global_step": 171131, "epoch": 4074} {"train_loss": -6.969886779785156, "global_step": 171132, "epoch": 4074} {"train_loss": -7.038006782531738, "global_step": 171133, "epoch": 4074} {"train_loss": -7.039088249206543, "global_step": 171134, "epoch": 4074} {"train_loss": -7.050313472747803, "global_step": 171135, "epoch": 4074} {"train_loss": -7.166047096252441, "global_step": 171136, "epoch": 4074} {"train_loss": -7.115908145904541, "global_step": 171137, "epoch": 4074} {"train_loss": -7.021346092224121, "global_step": 171138, "epoch": 4074} {"train_loss": -7.058974266052246, "global_step": 171139, "epoch": 4074} {"train_loss": -7.099541187286377, "global_step": 171140, "epoch": 4074} {"train_loss": -7.068819046020508, "global_step": 171141, "epoch": 4074} {"train_loss": -7.113705158233643, "global_step": 171142, "epoch": 4074} {"train_loss": -7.055469512939453, "global_step": 171143, "epoch": 4074} {"train_loss": -7.160025596618652, "global_step": 171144, "epoch": 4074} {"train_loss": -7.188458442687988, "global_step": 171145, "epoch": 4074} {"train_loss": -7.166743278503418, "global_step": 171146, "epoch": 4074} {"train_loss": -7.083582878112793, "global_step": 171147, "epoch": 4074} {"train_loss": -7.094995021820068, "global_step": 171148, "epoch": 4074} {"train_loss": -7.051901181538899, "global_step": 171149, "epoch": 4074, "val_loss": 79779.4609375} {"train_loss": -7.014227867126465, "global_step": 171150, "epoch": 4075} {"train_loss": -7.15622615814209, "global_step": 171151, "epoch": 4075} {"train_loss": -7.161338806152344, "global_step": 171152, "epoch": 4075} {"train_loss": -7.093353271484375, "global_step": 171153, "epoch": 4075} {"train_loss": -7.097005844116211, "global_step": 171154, "epoch": 4075} {"train_loss": -7.0137939453125, "global_step": 171155, "epoch": 4075} {"train_loss": -7.138497352600098, "global_step": 171156, "epoch": 4075} {"train_loss": -7.150447845458984, "global_step": 171157, "epoch": 4075} {"train_loss": -7.102189540863037, "global_step": 171158, "epoch": 4075} {"train_loss": -7.0950093269348145, "global_step": 171159, "epoch": 4075} {"train_loss": -7.152395248413086, "global_step": 171160, "epoch": 4075} {"train_loss": -7.049089431762695, "global_step": 171161, "epoch": 4075} {"train_loss": -7.031790256500244, "global_step": 171162, "epoch": 4075} {"train_loss": -7.061370372772217, "global_step": 171163, "epoch": 4075} {"train_loss": -7.045344829559326, "global_step": 171164, "epoch": 4075} {"train_loss": -7.067150592803955, "global_step": 171165, "epoch": 4075} {"train_loss": -6.941995620727539, "global_step": 171166, "epoch": 4075} {"train_loss": -7.038052558898926, "global_step": 171167, "epoch": 4075} {"train_loss": -7.102482795715332, "global_step": 171168, "epoch": 4075} {"train_loss": -7.082276344299316, "global_step": 171169, "epoch": 4075} {"train_loss": -7.033833980560303, "global_step": 171170, "epoch": 4075} {"train_loss": -7.027929782867432, "global_step": 171171, "epoch": 4075} {"train_loss": -7.006799221038818, "global_step": 171172, "epoch": 4075} {"train_loss": -7.026047706604004, "global_step": 171173, "epoch": 4075} {"train_loss": -7.056324005126953, "global_step": 171174, "epoch": 4075} {"train_loss": -7.057950973510742, "global_step": 171175, "epoch": 4075} {"train_loss": -7.101449012756348, "global_step": 171176, "epoch": 4075} {"train_loss": -7.089789867401123, "global_step": 171177, "epoch": 4075} {"train_loss": -7.130324363708496, "global_step": 171178, "epoch": 4075} {"train_loss": -7.088688850402832, "global_step": 171179, "epoch": 4075} {"train_loss": -7.055485725402832, "global_step": 171180, "epoch": 4075} {"train_loss": -7.105107307434082, "global_step": 171181, "epoch": 4075} {"train_loss": -7.088794708251953, "global_step": 171182, "epoch": 4075} {"train_loss": -7.099979400634766, "global_step": 171183, "epoch": 4075} {"train_loss": -7.197906017303467, "global_step": 171184, "epoch": 4075} {"train_loss": -7.185336589813232, "global_step": 171185, "epoch": 4075} {"train_loss": -7.102175712585449, "global_step": 171186, "epoch": 4075} {"train_loss": -7.111676216125488, "global_step": 171187, "epoch": 4075} {"train_loss": -7.181783676147461, "global_step": 171188, "epoch": 4075} {"train_loss": -7.234136581420898, "global_step": 171189, "epoch": 4075} {"train_loss": -7.111833572387695, "global_step": 171190, "epoch": 4075} {"train_loss": -7.091458422797067, "global_step": 171191, "epoch": 4075, "val_loss": 79852.1640625} {"train_loss": -7.241930961608887, "global_step": 171192, "epoch": 4076} {"train_loss": -7.1897406578063965, "global_step": 171193, "epoch": 4076} {"train_loss": -7.168851852416992, "global_step": 171194, "epoch": 4076} {"train_loss": -7.131342887878418, "global_step": 171195, "epoch": 4076} {"train_loss": -7.12077522277832, "global_step": 171196, "epoch": 4076} {"train_loss": -7.150947570800781, "global_step": 171197, "epoch": 4076} {"train_loss": -7.062288761138916, "global_step": 171198, "epoch": 4076} {"train_loss": -7.087653160095215, "global_step": 171199, "epoch": 4076} {"train_loss": -7.073049545288086, "global_step": 171200, "epoch": 4076} {"train_loss": -7.204151153564453, "global_step": 171201, "epoch": 4076} {"train_loss": -7.026528358459473, "global_step": 171202, "epoch": 4076} {"train_loss": -7.085683822631836, "global_step": 171203, "epoch": 4076} {"train_loss": -7.249203681945801, "global_step": 171204, "epoch": 4076} {"train_loss": -7.0420122146606445, "global_step": 171205, "epoch": 4076} {"train_loss": -7.009148597717285, "global_step": 171206, "epoch": 4076} {"train_loss": -7.057868480682373, "global_step": 171207, "epoch": 4076} {"train_loss": -6.933377265930176, "global_step": 171208, "epoch": 4076} {"train_loss": -6.980461597442627, "global_step": 171209, "epoch": 4076} {"train_loss": -7.025393486022949, "global_step": 171210, "epoch": 4076} {"train_loss": -7.020710468292236, "global_step": 171211, "epoch": 4076} {"train_loss": -6.993639945983887, "global_step": 171212, "epoch": 4076} {"train_loss": -7.049344062805176, "global_step": 171213, "epoch": 4076} {"train_loss": -7.09805154800415, "global_step": 171214, "epoch": 4076} {"train_loss": -7.134487152099609, "global_step": 171215, "epoch": 4076} {"train_loss": -7.010527610778809, "global_step": 171216, "epoch": 4076} {"train_loss": -7.06496000289917, "global_step": 171217, "epoch": 4076} {"train_loss": -7.170918941497803, "global_step": 171218, "epoch": 4076} {"train_loss": -6.996059894561768, "global_step": 171219, "epoch": 4076} {"train_loss": -6.978784561157227, "global_step": 171220, "epoch": 4076} {"train_loss": -7.046657085418701, "global_step": 171221, "epoch": 4076} {"train_loss": -7.072770118713379, "global_step": 171222, "epoch": 4076} {"train_loss": -7.075492858886719, "global_step": 171223, "epoch": 4076} {"train_loss": -7.032225131988525, "global_step": 171224, "epoch": 4076} {"train_loss": -7.034187316894531, "global_step": 171225, "epoch": 4076} {"train_loss": -7.0246124267578125, "global_step": 171226, "epoch": 4076} {"train_loss": -6.976790428161621, "global_step": 171227, "epoch": 4076} {"train_loss": -7.057157516479492, "global_step": 171228, "epoch": 4076} {"train_loss": -6.976961612701416, "global_step": 171229, "epoch": 4076} {"train_loss": -7.064830780029297, "global_step": 171230, "epoch": 4076} {"train_loss": -7.072885036468506, "global_step": 171231, "epoch": 4076} {"train_loss": -6.949732780456543, "global_step": 171232, "epoch": 4076} {"train_loss": -7.067993266241891, "global_step": 171233, "epoch": 4076, "val_loss": 79880.546875} {"train_loss": -7.018769264221191, "global_step": 171234, "epoch": 4077} {"train_loss": -7.085529804229736, "global_step": 171235, "epoch": 4077} {"train_loss": -7.125286102294922, "global_step": 171236, "epoch": 4077} {"train_loss": -7.0642828941345215, "global_step": 171237, "epoch": 4077} {"train_loss": -7.021592617034912, "global_step": 171238, "epoch": 4077} {"train_loss": -7.041241645812988, "global_step": 171239, "epoch": 4077} {"train_loss": -6.976909160614014, "global_step": 171240, "epoch": 4077} {"train_loss": -7.1262993812561035, "global_step": 171241, "epoch": 4077} {"train_loss": -6.906249046325684, "global_step": 171242, "epoch": 4077} {"train_loss": -6.9633073806762695, "global_step": 171243, "epoch": 4077} {"train_loss": -7.008938789367676, "global_step": 171244, "epoch": 4077} {"train_loss": -6.870427131652832, "global_step": 171245, "epoch": 4077} {"train_loss": -6.964205741882324, "global_step": 171246, "epoch": 4077} {"train_loss": -7.027218818664551, "global_step": 171247, "epoch": 4077} {"train_loss": -6.947051048278809, "global_step": 171248, "epoch": 4077} {"train_loss": -6.927870750427246, "global_step": 171249, "epoch": 4077} {"train_loss": -6.990111351013184, "global_step": 171250, "epoch": 4077} {"train_loss": -6.855208396911621, "global_step": 171251, "epoch": 4077} {"train_loss": -7.083601951599121, "global_step": 171252, "epoch": 4077} {"train_loss": -6.9628472328186035, "global_step": 171253, "epoch": 4077} {"train_loss": -7.024541854858398, "global_step": 171254, "epoch": 4077} {"train_loss": -7.1071672439575195, "global_step": 171255, "epoch": 4077} {"train_loss": -7.012607574462891, "global_step": 171256, "epoch": 4077} {"train_loss": -7.112762451171875, "global_step": 171257, "epoch": 4077} {"train_loss": -7.108026504516602, "global_step": 171258, "epoch": 4077} {"train_loss": -7.032500267028809, "global_step": 171259, "epoch": 4077} {"train_loss": -6.94914436340332, "global_step": 171260, "epoch": 4077} {"train_loss": -7.086324214935303, "global_step": 171261, "epoch": 4077} {"train_loss": -6.9366912841796875, "global_step": 171262, "epoch": 4077} {"train_loss": -7.123088359832764, "global_step": 171263, "epoch": 4077} {"train_loss": -6.971738815307617, "global_step": 171264, "epoch": 4077} {"train_loss": -7.10981559753418, "global_step": 171265, "epoch": 4077} {"train_loss": -7.069270610809326, "global_step": 171266, "epoch": 4077} {"train_loss": -7.081537246704102, "global_step": 171267, "epoch": 4077} {"train_loss": -7.095577239990234, "global_step": 171268, "epoch": 4077} {"train_loss": -7.023035526275635, "global_step": 171269, "epoch": 4077} {"train_loss": -7.050081253051758, "global_step": 171270, "epoch": 4077} {"train_loss": -7.178713798522949, "global_step": 171271, "epoch": 4077} {"train_loss": -7.022937774658203, "global_step": 171272, "epoch": 4077} {"train_loss": -7.0820722579956055, "global_step": 171273, "epoch": 4077} {"train_loss": -7.05349063873291, "global_step": 171274, "epoch": 4077} {"train_loss": -7.032869736353557, "global_step": 171275, "epoch": 4077, "val_loss": 79894.6015625} {"train_loss": -7.118297576904297, "global_step": 171276, "epoch": 4078} {"train_loss": -7.019979476928711, "global_step": 171277, "epoch": 4078} {"train_loss": -7.158276557922363, "global_step": 171278, "epoch": 4078} {"train_loss": -7.150847434997559, "global_step": 171279, "epoch": 4078} {"train_loss": -7.142366409301758, "global_step": 171280, "epoch": 4078} {"train_loss": -7.178990364074707, "global_step": 171281, "epoch": 4078} {"train_loss": -7.046933174133301, "global_step": 171282, "epoch": 4078} {"train_loss": -7.096240043640137, "global_step": 171283, "epoch": 4078} {"train_loss": -7.019084453582764, "global_step": 171284, "epoch": 4078} {"train_loss": -7.1211347579956055, "global_step": 171285, "epoch": 4078} {"train_loss": -6.932623863220215, "global_step": 171286, "epoch": 4078} {"train_loss": -7.0345683097839355, "global_step": 171287, "epoch": 4078} {"train_loss": -7.045793533325195, "global_step": 171288, "epoch": 4078} {"train_loss": -7.057822227478027, "global_step": 171289, "epoch": 4078} {"train_loss": -7.032804489135742, "global_step": 171290, "epoch": 4078} {"train_loss": -7.038697242736816, "global_step": 171291, "epoch": 4078} {"train_loss": -7.030496120452881, "global_step": 171292, "epoch": 4078} {"train_loss": -7.06092643737793, "global_step": 171293, "epoch": 4078} {"train_loss": -7.0292816162109375, "global_step": 171294, "epoch": 4078} {"train_loss": -6.914271354675293, "global_step": 171295, "epoch": 4078} {"train_loss": -7.126307487487793, "global_step": 171296, "epoch": 4078} {"train_loss": -7.075387954711914, "global_step": 171297, "epoch": 4078} {"train_loss": -7.049938201904297, "global_step": 171298, "epoch": 4078} {"train_loss": -7.0312347412109375, "global_step": 171299, "epoch": 4078} {"train_loss": -6.979989051818848, "global_step": 171300, "epoch": 4078} {"train_loss": -7.166073322296143, "global_step": 171301, "epoch": 4078} {"train_loss": -7.122957706451416, "global_step": 171302, "epoch": 4078} {"train_loss": -7.03892183303833, "global_step": 171303, "epoch": 4078} {"train_loss": -7.097322463989258, "global_step": 171304, "epoch": 4078} {"train_loss": -7.002516746520996, "global_step": 171305, "epoch": 4078} {"train_loss": -7.189897537231445, "global_step": 171306, "epoch": 4078} {"train_loss": -7.043150901794434, "global_step": 171307, "epoch": 4078} {"train_loss": -7.016683578491211, "global_step": 171308, "epoch": 4078} {"train_loss": -7.027856349945068, "global_step": 171309, "epoch": 4078} {"train_loss": -7.097369194030762, "global_step": 171310, "epoch": 4078} {"train_loss": -7.096248626708984, "global_step": 171311, "epoch": 4078} {"train_loss": -7.093497276306152, "global_step": 171312, "epoch": 4078} {"train_loss": -7.099436283111572, "global_step": 171313, "epoch": 4078} {"train_loss": -7.084855079650879, "global_step": 171314, "epoch": 4078} {"train_loss": -7.092002868652344, "global_step": 171315, "epoch": 4078} {"train_loss": -7.103854656219482, "global_step": 171316, "epoch": 4078} {"train_loss": -7.071272123427618, "global_step": 171317, "epoch": 4078, "val_loss": 79893.0625} {"train_loss": -7.10310173034668, "global_step": 171318, "epoch": 4079} {"train_loss": -7.2223005294799805, "global_step": 171319, "epoch": 4079} {"train_loss": -7.07626485824585, "global_step": 171320, "epoch": 4079} {"train_loss": -7.127704620361328, "global_step": 171321, "epoch": 4079} {"train_loss": -7.1279826164245605, "global_step": 171322, "epoch": 4079} {"train_loss": -7.077507972717285, "global_step": 171323, "epoch": 4079} {"train_loss": -7.205684661865234, "global_step": 171324, "epoch": 4079} {"train_loss": -7.04216194152832, "global_step": 171325, "epoch": 4079} {"train_loss": -7.171975135803223, "global_step": 171326, "epoch": 4079} {"train_loss": -7.175499439239502, "global_step": 171327, "epoch": 4079} {"train_loss": -7.235376834869385, "global_step": 171328, "epoch": 4079} {"train_loss": -7.071592330932617, "global_step": 171329, "epoch": 4079} {"train_loss": -7.100338935852051, "global_step": 171330, "epoch": 4079} {"train_loss": -7.0765485763549805, "global_step": 171331, "epoch": 4079} {"train_loss": -7.104637145996094, "global_step": 171332, "epoch": 4079} {"train_loss": -7.092103004455566, "global_step": 171333, "epoch": 4079} {"train_loss": -7.043111801147461, "global_step": 171334, "epoch": 4079} {"train_loss": -7.230215072631836, "global_step": 171335, "epoch": 4079} {"train_loss": -7.055988311767578, "global_step": 171336, "epoch": 4079} {"train_loss": -7.0053839683532715, "global_step": 171337, "epoch": 4079} {"train_loss": -7.028043746948242, "global_step": 171338, "epoch": 4079} {"train_loss": -6.990560531616211, "global_step": 171339, "epoch": 4079} {"train_loss": -6.909392356872559, "global_step": 171340, "epoch": 4079} {"train_loss": -7.127485752105713, "global_step": 171341, "epoch": 4079} {"train_loss": -6.912421703338623, "global_step": 171342, "epoch": 4079} {"train_loss": -6.9246826171875, "global_step": 171343, "epoch": 4079} {"train_loss": -6.997215747833252, "global_step": 171344, "epoch": 4079} {"train_loss": -6.884128570556641, "global_step": 171345, "epoch": 4079} {"train_loss": -6.982659339904785, "global_step": 171346, "epoch": 4079} {"train_loss": -7.019415855407715, "global_step": 171347, "epoch": 4079} {"train_loss": -6.959338665008545, "global_step": 171348, "epoch": 4079} {"train_loss": -6.978520393371582, "global_step": 171349, "epoch": 4079} {"train_loss": -6.940853595733643, "global_step": 171350, "epoch": 4079} {"train_loss": -7.039178848266602, "global_step": 171351, "epoch": 4079} {"train_loss": -6.857094764709473, "global_step": 171352, "epoch": 4079} {"train_loss": -7.012859344482422, "global_step": 171353, "epoch": 4079} {"train_loss": -6.975599765777588, "global_step": 171354, "epoch": 4079} {"train_loss": -6.980103015899658, "global_step": 171355, "epoch": 4079} {"train_loss": -6.9603962898254395, "global_step": 171356, "epoch": 4079} {"train_loss": -6.958345890045166, "global_step": 171357, "epoch": 4079} {"train_loss": -6.951424598693848, "global_step": 171358, "epoch": 4079} {"train_loss": -7.042821066720145, "global_step": 171359, "epoch": 4079, "val_loss": 80014.40625} {"train_loss": -7.070804595947266, "global_step": 171360, "epoch": 4080} {"train_loss": -7.054477691650391, "global_step": 171361, "epoch": 4080} {"train_loss": -7.116095542907715, "global_step": 171362, "epoch": 4080} {"train_loss": -7.070108890533447, "global_step": 171363, "epoch": 4080} {"train_loss": -7.125837326049805, "global_step": 171364, "epoch": 4080} {"train_loss": -7.09303092956543, "global_step": 171365, "epoch": 4080} {"train_loss": -7.0375165939331055, "global_step": 171366, "epoch": 4080} {"train_loss": -7.056703567504883, "global_step": 171367, "epoch": 4080} {"train_loss": -7.129219055175781, "global_step": 171368, "epoch": 4080} {"train_loss": -7.231835842132568, "global_step": 171369, "epoch": 4080} {"train_loss": -7.113398551940918, "global_step": 171370, "epoch": 4080} {"train_loss": -7.206079483032227, "global_step": 171371, "epoch": 4080} {"train_loss": -7.166399002075195, "global_step": 171372, "epoch": 4080} {"train_loss": -7.053627014160156, "global_step": 171373, "epoch": 4080} {"train_loss": -7.032740116119385, "global_step": 171374, "epoch": 4080} {"train_loss": -7.1668596267700195, "global_step": 171375, "epoch": 4080} {"train_loss": -6.943346977233887, "global_step": 171376, "epoch": 4080} {"train_loss": -7.04187536239624, "global_step": 171377, "epoch": 4080} {"train_loss": -7.094646453857422, "global_step": 171378, "epoch": 4080} {"train_loss": -7.150531768798828, "global_step": 171379, "epoch": 4080} {"train_loss": -7.046726226806641, "global_step": 171380, "epoch": 4080} {"train_loss": -7.051255702972412, "global_step": 171381, "epoch": 4080} {"train_loss": -7.079766750335693, "global_step": 171382, "epoch": 4080} {"train_loss": -6.876101016998291, "global_step": 171383, "epoch": 4080} {"train_loss": -7.021876335144043, "global_step": 171384, "epoch": 4080} {"train_loss": -7.163844585418701, "global_step": 171385, "epoch": 4080} {"train_loss": -7.005209922790527, "global_step": 171386, "epoch": 4080} {"train_loss": -7.030159950256348, "global_step": 171387, "epoch": 4080} {"train_loss": -7.107089996337891, "global_step": 171388, "epoch": 4080} {"train_loss": -6.97829532623291, "global_step": 171389, "epoch": 4080} {"train_loss": -7.110753536224365, "global_step": 171390, "epoch": 4080} {"train_loss": -7.040759086608887, "global_step": 171391, "epoch": 4080} {"train_loss": -6.94868278503418, "global_step": 171392, "epoch": 4080} {"train_loss": -6.903207778930664, "global_step": 171393, "epoch": 4080} {"train_loss": -7.078817367553711, "global_step": 171394, "epoch": 4080} {"train_loss": -7.084654808044434, "global_step": 171395, "epoch": 4080} {"train_loss": -7.04311990737915, "global_step": 171396, "epoch": 4080} {"train_loss": -7.080450057983398, "global_step": 171397, "epoch": 4080} {"train_loss": -6.928064346313477, "global_step": 171398, "epoch": 4080} {"train_loss": -7.106895446777344, "global_step": 171399, "epoch": 4080} {"train_loss": -7.100059509277344, "global_step": 171400, "epoch": 4080} {"train_loss": -7.069542226337251, "global_step": 171401, "epoch": 4080, "val_loss": 79693.5} {"train_loss": -7.016249656677246, "global_step": 171402, "epoch": 4081} {"train_loss": -7.131380558013916, "global_step": 171403, "epoch": 4081} {"train_loss": -7.18364143371582, "global_step": 171404, "epoch": 4081} {"train_loss": -7.049027442932129, "global_step": 171405, "epoch": 4081} {"train_loss": -6.999567985534668, "global_step": 171406, "epoch": 4081} {"train_loss": -6.934479236602783, "global_step": 171407, "epoch": 4081} {"train_loss": -7.07033634185791, "global_step": 171408, "epoch": 4081} {"train_loss": -6.995624542236328, "global_step": 171409, "epoch": 4081} {"train_loss": -6.993058204650879, "global_step": 171410, "epoch": 4081} {"train_loss": -7.067903518676758, "global_step": 171411, "epoch": 4081} {"train_loss": -6.986132621765137, "global_step": 171412, "epoch": 4081} {"train_loss": -7.114254474639893, "global_step": 171413, "epoch": 4081} {"train_loss": -7.051329612731934, "global_step": 171414, "epoch": 4081} {"train_loss": -7.072673797607422, "global_step": 171415, "epoch": 4081} {"train_loss": -7.076483726501465, "global_step": 171416, "epoch": 4081} {"train_loss": -7.069759368896484, "global_step": 171417, "epoch": 4081} {"train_loss": -7.075544834136963, "global_step": 171418, "epoch": 4081} {"train_loss": -6.937898635864258, "global_step": 171419, "epoch": 4081} {"train_loss": -6.9444966316223145, "global_step": 171420, "epoch": 4081} {"train_loss": -6.951506614685059, "global_step": 171421, "epoch": 4081} {"train_loss": -7.099566459655762, "global_step": 171422, "epoch": 4081} {"train_loss": -7.068037509918213, "global_step": 171423, "epoch": 4081} {"train_loss": -7.039700984954834, "global_step": 171424, "epoch": 4081} {"train_loss": -7.007946968078613, "global_step": 171425, "epoch": 4081} {"train_loss": -7.060448169708252, "global_step": 171426, "epoch": 4081} {"train_loss": -7.038233757019043, "global_step": 171427, "epoch": 4081} {"train_loss": -6.967273712158203, "global_step": 171428, "epoch": 4081} {"train_loss": -7.060695648193359, "global_step": 171429, "epoch": 4081} {"train_loss": -7.079816818237305, "global_step": 171430, "epoch": 4081} {"train_loss": -7.07535457611084, "global_step": 171431, "epoch": 4081} {"train_loss": -7.125328063964844, "global_step": 171432, "epoch": 4081} {"train_loss": -7.035614967346191, "global_step": 171433, "epoch": 4081} {"train_loss": -7.002086162567139, "global_step": 171434, "epoch": 4081} {"train_loss": -7.109390735626221, "global_step": 171435, "epoch": 4081} {"train_loss": -7.014158725738525, "global_step": 171436, "epoch": 4081} {"train_loss": -7.002987384796143, "global_step": 171437, "epoch": 4081} {"train_loss": -7.004563808441162, "global_step": 171438, "epoch": 4081} {"train_loss": -7.073757171630859, "global_step": 171439, "epoch": 4081} {"train_loss": -6.971138954162598, "global_step": 171440, "epoch": 4081} {"train_loss": -7.004970550537109, "global_step": 171441, "epoch": 4081} {"train_loss": -7.065125942230225, "global_step": 171442, "epoch": 4081} {"train_loss": -7.0414272376469205, "global_step": 171443, "epoch": 4081, "val_loss": 80106.140625} {"train_loss": -7.121698379516602, "global_step": 171444, "epoch": 4082} {"train_loss": -7.00612735748291, "global_step": 171445, "epoch": 4082} {"train_loss": -6.979776859283447, "global_step": 171446, "epoch": 4082} {"train_loss": -6.968414306640625, "global_step": 171447, "epoch": 4082} {"train_loss": -7.121380805969238, "global_step": 171448, "epoch": 4082} {"train_loss": -7.002948760986328, "global_step": 171449, "epoch": 4082} {"train_loss": -6.938945770263672, "global_step": 171450, "epoch": 4082} {"train_loss": -7.126437187194824, "global_step": 171451, "epoch": 4082} {"train_loss": -7.060567855834961, "global_step": 171452, "epoch": 4082} {"train_loss": -7.037066459655762, "global_step": 171453, "epoch": 4082} {"train_loss": -6.986207485198975, "global_step": 171454, "epoch": 4082} {"train_loss": -7.007118225097656, "global_step": 171455, "epoch": 4082} {"train_loss": -7.046191692352295, "global_step": 171456, "epoch": 4082} {"train_loss": -7.135344505310059, "global_step": 171457, "epoch": 4082} {"train_loss": -6.814881324768066, "global_step": 171458, "epoch": 4082} {"train_loss": -7.078527450561523, "global_step": 171459, "epoch": 4082} {"train_loss": -7.005764007568359, "global_step": 171460, "epoch": 4082} {"train_loss": -6.944085121154785, "global_step": 171461, "epoch": 4082} {"train_loss": -7.034396171569824, "global_step": 171462, "epoch": 4082} {"train_loss": -6.9975762367248535, "global_step": 171463, "epoch": 4082} {"train_loss": -6.941928863525391, "global_step": 171464, "epoch": 4082} {"train_loss": -7.0268683433532715, "global_step": 171465, "epoch": 4082} {"train_loss": -6.853781700134277, "global_step": 171466, "epoch": 4082} {"train_loss": -6.91160249710083, "global_step": 171467, "epoch": 4082} {"train_loss": -7.037901401519775, "global_step": 171468, "epoch": 4082} {"train_loss": -6.911256790161133, "global_step": 171469, "epoch": 4082} {"train_loss": -6.955753803253174, "global_step": 171470, "epoch": 4082} {"train_loss": -6.960695743560791, "global_step": 171471, "epoch": 4082} {"train_loss": -6.967315673828125, "global_step": 171472, "epoch": 4082} {"train_loss": -7.050405979156494, "global_step": 171473, "epoch": 4082} {"train_loss": -6.982669353485107, "global_step": 171474, "epoch": 4082} {"train_loss": -7.0360846519470215, "global_step": 171475, "epoch": 4082} {"train_loss": -6.9299774169921875, "global_step": 171476, "epoch": 4082} {"train_loss": -7.08106803894043, "global_step": 171477, "epoch": 4082} {"train_loss": -7.092153549194336, "global_step": 171478, "epoch": 4082} {"train_loss": -6.956118583679199, "global_step": 171479, "epoch": 4082} {"train_loss": -6.951062202453613, "global_step": 171480, "epoch": 4082} {"train_loss": -7.065617561340332, "global_step": 171481, "epoch": 4082} {"train_loss": -6.959367752075195, "global_step": 171482, "epoch": 4082} {"train_loss": -7.005707263946533, "global_step": 171483, "epoch": 4082} {"train_loss": -6.989799499511719, "global_step": 171484, "epoch": 4082} {"train_loss": -6.998776163373675, "global_step": 171485, "epoch": 4082, "val_loss": 79851.265625} {"train_loss": -7.017291069030762, "global_step": 171486, "epoch": 4083} {"train_loss": -6.833877086639404, "global_step": 171487, "epoch": 4083} {"train_loss": -7.078365325927734, "global_step": 171488, "epoch": 4083} {"train_loss": -6.935595989227295, "global_step": 171489, "epoch": 4083} {"train_loss": -7.05729341506958, "global_step": 171490, "epoch": 4083} {"train_loss": -6.950355052947998, "global_step": 171491, "epoch": 4083} {"train_loss": -6.957718849182129, "global_step": 171492, "epoch": 4083} {"train_loss": -6.9844279289245605, "global_step": 171493, "epoch": 4083} {"train_loss": -7.032823085784912, "global_step": 171494, "epoch": 4083} {"train_loss": -7.053524971008301, "global_step": 171495, "epoch": 4083} {"train_loss": -6.911525249481201, "global_step": 171496, "epoch": 4083} {"train_loss": -6.966491222381592, "global_step": 171497, "epoch": 4083} {"train_loss": -7.0583696365356445, "global_step": 171498, "epoch": 4083} {"train_loss": -7.032557487487793, "global_step": 171499, "epoch": 4083} {"train_loss": -7.049561500549316, "global_step": 171500, "epoch": 4083} {"train_loss": -6.987539291381836, "global_step": 171501, "epoch": 4083} {"train_loss": -7.121130466461182, "global_step": 171502, "epoch": 4083} {"train_loss": -7.039253234863281, "global_step": 171503, "epoch": 4083} {"train_loss": -7.032681465148926, "global_step": 171504, "epoch": 4083} {"train_loss": -6.955844879150391, "global_step": 171505, "epoch": 4083} {"train_loss": -6.994258880615234, "global_step": 171506, "epoch": 4083} {"train_loss": -7.08944034576416, "global_step": 171507, "epoch": 4083} {"train_loss": -7.111323833465576, "global_step": 171508, "epoch": 4083} {"train_loss": -7.137739181518555, "global_step": 171509, "epoch": 4083} {"train_loss": -7.019679546356201, "global_step": 171510, "epoch": 4083} {"train_loss": -7.024180889129639, "global_step": 171511, "epoch": 4083} {"train_loss": -7.165064811706543, "global_step": 171512, "epoch": 4083} {"train_loss": -7.166220664978027, "global_step": 171513, "epoch": 4083} {"train_loss": -7.089290618896484, "global_step": 171514, "epoch": 4083} {"train_loss": -7.17835807800293, "global_step": 171515, "epoch": 4083} {"train_loss": -7.1206159591674805, "global_step": 171516, "epoch": 4083} {"train_loss": -7.147208213806152, "global_step": 171517, "epoch": 4083} {"train_loss": -7.08603572845459, "global_step": 171518, "epoch": 4083} {"train_loss": -7.005626678466797, "global_step": 171519, "epoch": 4083} {"train_loss": -7.083796977996826, "global_step": 171520, "epoch": 4083} {"train_loss": -7.015624046325684, "global_step": 171521, "epoch": 4083} {"train_loss": -7.048794746398926, "global_step": 171522, "epoch": 4083} {"train_loss": -7.033476829528809, "global_step": 171523, "epoch": 4083} {"train_loss": -7.147418975830078, "global_step": 171524, "epoch": 4083} {"train_loss": -7.08748722076416, "global_step": 171525, "epoch": 4083} {"train_loss": -7.03258752822876, "global_step": 171526, "epoch": 4083} {"train_loss": -7.047222568875267, "global_step": 171527, "epoch": 4083, "val_loss": 79932.7109375} {"train_loss": -7.084672927856445, "global_step": 171528, "epoch": 4084} {"train_loss": -6.968774795532227, "global_step": 171529, "epoch": 4084} {"train_loss": -7.089287757873535, "global_step": 171530, "epoch": 4084} {"train_loss": -7.067750453948975, "global_step": 171531, "epoch": 4084} {"train_loss": -7.026725769042969, "global_step": 171532, "epoch": 4084} {"train_loss": -6.940263748168945, "global_step": 171533, "epoch": 4084} {"train_loss": -7.0875139236450195, "global_step": 171534, "epoch": 4084} {"train_loss": -7.05731201171875, "global_step": 171535, "epoch": 4084} {"train_loss": -7.050829887390137, "global_step": 171536, "epoch": 4084} {"train_loss": -6.9978861808776855, "global_step": 171537, "epoch": 4084} {"train_loss": -7.093772888183594, "global_step": 171538, "epoch": 4084} {"train_loss": -7.069324016571045, "global_step": 171539, "epoch": 4084} {"train_loss": -7.066174507141113, "global_step": 171540, "epoch": 4084} {"train_loss": -7.097048759460449, "global_step": 171541, "epoch": 4084} {"train_loss": -7.068246364593506, "global_step": 171542, "epoch": 4084} {"train_loss": -7.148366928100586, "global_step": 171543, "epoch": 4084} {"train_loss": -7.064104080200195, "global_step": 171544, "epoch": 4084} {"train_loss": -7.08211612701416, "global_step": 171545, "epoch": 4084} {"train_loss": -7.0964202880859375, "global_step": 171546, "epoch": 4084} {"train_loss": -7.069155216217041, "global_step": 171547, "epoch": 4084} {"train_loss": -6.9956817626953125, "global_step": 171548, "epoch": 4084} {"train_loss": -7.016664505004883, "global_step": 171549, "epoch": 4084} {"train_loss": -7.142183303833008, "global_step": 171550, "epoch": 4084} {"train_loss": -6.96568489074707, "global_step": 171551, "epoch": 4084} {"train_loss": -7.150639533996582, "global_step": 171552, "epoch": 4084} {"train_loss": -7.08405876159668, "global_step": 171553, "epoch": 4084} {"train_loss": -7.022358417510986, "global_step": 171554, "epoch": 4084} {"train_loss": -7.093642234802246, "global_step": 171555, "epoch": 4084} {"train_loss": -7.043848514556885, "global_step": 171556, "epoch": 4084} {"train_loss": -7.081089973449707, "global_step": 171557, "epoch": 4084} {"train_loss": -7.10753059387207, "global_step": 171558, "epoch": 4084} {"train_loss": -7.087471008300781, "global_step": 171559, "epoch": 4084} {"train_loss": -7.0742106437683105, "global_step": 171560, "epoch": 4084} {"train_loss": -7.0641632080078125, "global_step": 171561, "epoch": 4084} {"train_loss": -6.958209991455078, "global_step": 171562, "epoch": 4084} {"train_loss": -7.006309509277344, "global_step": 171563, "epoch": 4084} {"train_loss": -7.026391506195068, "global_step": 171564, "epoch": 4084} {"train_loss": -7.118438720703125, "global_step": 171565, "epoch": 4084} {"train_loss": -6.890107154846191, "global_step": 171566, "epoch": 4084} {"train_loss": -6.996037483215332, "global_step": 171567, "epoch": 4084} {"train_loss": -6.896686553955078, "global_step": 171568, "epoch": 4084} {"train_loss": -7.0478089650472, "global_step": 171569, "epoch": 4084, "val_loss": 80208.734375} {"train_loss": -6.948061943054199, "global_step": 171570, "epoch": 4085} {"train_loss": -7.006465435028076, "global_step": 171571, "epoch": 4085} {"train_loss": -7.0077714920043945, "global_step": 171572, "epoch": 4085} {"train_loss": -6.977378845214844, "global_step": 171573, "epoch": 4085} {"train_loss": -7.153853416442871, "global_step": 171574, "epoch": 4085} {"train_loss": -6.964878559112549, "global_step": 171575, "epoch": 4085} {"train_loss": -7.158504486083984, "global_step": 171576, "epoch": 4085} {"train_loss": -7.042448997497559, "global_step": 171577, "epoch": 4085} {"train_loss": -7.112878799438477, "global_step": 171578, "epoch": 4085} {"train_loss": -7.063760757446289, "global_step": 171579, "epoch": 4085} {"train_loss": -7.140158176422119, "global_step": 171580, "epoch": 4085} {"train_loss": -7.0725603103637695, "global_step": 171581, "epoch": 4085} {"train_loss": -7.135269641876221, "global_step": 171582, "epoch": 4085} {"train_loss": -7.031467437744141, "global_step": 171583, "epoch": 4085} {"train_loss": -6.991600513458252, "global_step": 171584, "epoch": 4085} {"train_loss": -7.116859436035156, "global_step": 171585, "epoch": 4085} {"train_loss": -7.047950744628906, "global_step": 171586, "epoch": 4085} {"train_loss": -6.973948955535889, "global_step": 171587, "epoch": 4085} {"train_loss": -7.1202802658081055, "global_step": 171588, "epoch": 4085} {"train_loss": -7.087810039520264, "global_step": 171589, "epoch": 4085} {"train_loss": -7.0781097412109375, "global_step": 171590, "epoch": 4085} {"train_loss": -7.037309646606445, "global_step": 171591, "epoch": 4085} {"train_loss": -7.04866886138916, "global_step": 171592, "epoch": 4085} {"train_loss": -6.936213493347168, "global_step": 171593, "epoch": 4085} {"train_loss": -7.0763840675354, "global_step": 171594, "epoch": 4085} {"train_loss": -7.101587295532227, "global_step": 171595, "epoch": 4085} {"train_loss": -7.010960578918457, "global_step": 171596, "epoch": 4085} {"train_loss": -7.1337480545043945, "global_step": 171597, "epoch": 4085} {"train_loss": -7.120517730712891, "global_step": 171598, "epoch": 4085} {"train_loss": -7.105452060699463, "global_step": 171599, "epoch": 4085} {"train_loss": -7.142472743988037, "global_step": 171600, "epoch": 4085} {"train_loss": -7.103144645690918, "global_step": 171601, "epoch": 4085} {"train_loss": -7.0539774894714355, "global_step": 171602, "epoch": 4085} {"train_loss": -7.080638885498047, "global_step": 171603, "epoch": 4085} {"train_loss": -7.081472396850586, "global_step": 171604, "epoch": 4085} {"train_loss": -7.074873924255371, "global_step": 171605, "epoch": 4085} {"train_loss": -7.098837375640869, "global_step": 171606, "epoch": 4085} {"train_loss": -7.039002895355225, "global_step": 171607, "epoch": 4085} {"train_loss": -7.084812164306641, "global_step": 171608, "epoch": 4085} {"train_loss": -7.039210319519043, "global_step": 171609, "epoch": 4085} {"train_loss": -7.050851821899414, "global_step": 171610, "epoch": 4085} {"train_loss": -7.062767244520641, "global_step": 171611, "epoch": 4085, "val_loss": 80147.1484375} {"train_loss": -7.07996940612793, "global_step": 171612, "epoch": 4086} {"train_loss": -7.061375617980957, "global_step": 171613, "epoch": 4086} {"train_loss": -6.917062759399414, "global_step": 171614, "epoch": 4086} {"train_loss": -7.07716703414917, "global_step": 171615, "epoch": 4086} {"train_loss": -6.96712589263916, "global_step": 171616, "epoch": 4086} {"train_loss": -6.939901351928711, "global_step": 171617, "epoch": 4086} {"train_loss": -6.922521591186523, "global_step": 171618, "epoch": 4086} {"train_loss": -7.069305419921875, "global_step": 171619, "epoch": 4086} {"train_loss": -7.046535968780518, "global_step": 171620, "epoch": 4086} {"train_loss": -7.073859214782715, "global_step": 171621, "epoch": 4086} {"train_loss": -6.98256778717041, "global_step": 171622, "epoch": 4086} {"train_loss": -7.043236255645752, "global_step": 171623, "epoch": 4086} {"train_loss": -6.980807781219482, "global_step": 171624, "epoch": 4086} {"train_loss": -6.8293352127075195, "global_step": 171625, "epoch": 4086} {"train_loss": -7.035024642944336, "global_step": 171626, "epoch": 4086} {"train_loss": -7.035897254943848, "global_step": 171627, "epoch": 4086} {"train_loss": -6.95592737197876, "global_step": 171628, "epoch": 4086} {"train_loss": -7.005592346191406, "global_step": 171629, "epoch": 4086} {"train_loss": -7.1621599197387695, "global_step": 171630, "epoch": 4086} {"train_loss": -6.968725681304932, "global_step": 171631, "epoch": 4086} {"train_loss": -7.090362071990967, "global_step": 171632, "epoch": 4086} {"train_loss": -7.109250068664551, "global_step": 171633, "epoch": 4086} {"train_loss": -6.994966983795166, "global_step": 171634, "epoch": 4086} {"train_loss": -7.035248756408691, "global_step": 171635, "epoch": 4086} {"train_loss": -7.128695964813232, "global_step": 171636, "epoch": 4086} {"train_loss": -7.113430976867676, "global_step": 171637, "epoch": 4086} {"train_loss": -6.995497703552246, "global_step": 171638, "epoch": 4086} {"train_loss": -7.063082218170166, "global_step": 171639, "epoch": 4086} {"train_loss": -7.121249198913574, "global_step": 171640, "epoch": 4086} {"train_loss": -7.088057994842529, "global_step": 171641, "epoch": 4086} {"train_loss": -7.126434326171875, "global_step": 171642, "epoch": 4086} {"train_loss": -7.0973405838012695, "global_step": 171643, "epoch": 4086} {"train_loss": -7.16416597366333, "global_step": 171644, "epoch": 4086} {"train_loss": -7.1532440185546875, "global_step": 171645, "epoch": 4086} {"train_loss": -6.933121204376221, "global_step": 171646, "epoch": 4086} {"train_loss": -7.010513782501221, "global_step": 171647, "epoch": 4086} {"train_loss": -7.120429992675781, "global_step": 171648, "epoch": 4086} {"train_loss": -7.042901039123535, "global_step": 171649, "epoch": 4086} {"train_loss": -7.067086219787598, "global_step": 171650, "epoch": 4086} {"train_loss": -7.082591533660889, "global_step": 171651, "epoch": 4086} {"train_loss": -7.060792922973633, "global_step": 171652, "epoch": 4086} {"train_loss": -7.043943961461385, "global_step": 171653, "epoch": 4086, "val_loss": 80008.2578125} {"train_loss": -7.097763538360596, "global_step": 171654, "epoch": 4087} {"train_loss": -7.136692523956299, "global_step": 171655, "epoch": 4087} {"train_loss": -7.107091903686523, "global_step": 171656, "epoch": 4087} {"train_loss": -7.163552284240723, "global_step": 171657, "epoch": 4087} {"train_loss": -7.1175031661987305, "global_step": 171658, "epoch": 4087} {"train_loss": -7.158041000366211, "global_step": 171659, "epoch": 4087} {"train_loss": -7.036139488220215, "global_step": 171660, "epoch": 4087} {"train_loss": -7.035622596740723, "global_step": 171661, "epoch": 4087} {"train_loss": -7.138369083404541, "global_step": 171662, "epoch": 4087} {"train_loss": -7.026113510131836, "global_step": 171663, "epoch": 4087} {"train_loss": -7.125444412231445, "global_step": 171664, "epoch": 4087} {"train_loss": -7.153729438781738, "global_step": 171665, "epoch": 4087} {"train_loss": -7.117452621459961, "global_step": 171666, "epoch": 4087} {"train_loss": -6.954453468322754, "global_step": 171667, "epoch": 4087} {"train_loss": -7.024687767028809, "global_step": 171668, "epoch": 4087} {"train_loss": -7.1178436279296875, "global_step": 171669, "epoch": 4087} {"train_loss": -6.8612165451049805, "global_step": 171670, "epoch": 4087} {"train_loss": -7.221309661865234, "global_step": 171671, "epoch": 4087} {"train_loss": -7.1166791915893555, "global_step": 171672, "epoch": 4087} {"train_loss": -6.916828155517578, "global_step": 171673, "epoch": 4087} {"train_loss": -6.963339805603027, "global_step": 171674, "epoch": 4087} {"train_loss": -7.100201606750488, "global_step": 171675, "epoch": 4087} {"train_loss": -7.007735252380371, "global_step": 171676, "epoch": 4087} {"train_loss": -7.032066345214844, "global_step": 171677, "epoch": 4087} {"train_loss": -6.984249114990234, "global_step": 171678, "epoch": 4087} {"train_loss": -6.9458770751953125, "global_step": 171679, "epoch": 4087} {"train_loss": -6.98965311050415, "global_step": 171680, "epoch": 4087} {"train_loss": -6.993793487548828, "global_step": 171681, "epoch": 4087} {"train_loss": -7.004134654998779, "global_step": 171682, "epoch": 4087} {"train_loss": -6.991240978240967, "global_step": 171683, "epoch": 4087} {"train_loss": -6.810982704162598, "global_step": 171684, "epoch": 4087} {"train_loss": -6.963639259338379, "global_step": 171685, "epoch": 4087} {"train_loss": -6.960651397705078, "global_step": 171686, "epoch": 4087} {"train_loss": -7.121255874633789, "global_step": 171687, "epoch": 4087} {"train_loss": -6.9039201736450195, "global_step": 171688, "epoch": 4087} {"train_loss": -7.072398662567139, "global_step": 171689, "epoch": 4087} {"train_loss": -6.978325843811035, "global_step": 171690, "epoch": 4087} {"train_loss": -6.89003849029541, "global_step": 171691, "epoch": 4087} {"train_loss": -7.037339210510254, "global_step": 171692, "epoch": 4087} {"train_loss": -7.015636444091797, "global_step": 171693, "epoch": 4087} {"train_loss": -6.95366096496582, "global_step": 171694, "epoch": 4087} {"train_loss": -7.035428989501226, "global_step": 171695, "epoch": 4087, "val_loss": 79967.28125} {"train_loss": -7.1234517097473145, "global_step": 171696, "epoch": 4088} {"train_loss": -7.103643894195557, "global_step": 171697, "epoch": 4088} {"train_loss": -6.987592697143555, "global_step": 171698, "epoch": 4088} {"train_loss": -6.99545955657959, "global_step": 171699, "epoch": 4088} {"train_loss": -7.1448259353637695, "global_step": 171700, "epoch": 4088} {"train_loss": -6.995925426483154, "global_step": 171701, "epoch": 4088} {"train_loss": -7.1339521408081055, "global_step": 171702, "epoch": 4088} {"train_loss": -7.1611199378967285, "global_step": 171703, "epoch": 4088} {"train_loss": -7.177763938903809, "global_step": 171704, "epoch": 4088} {"train_loss": -7.065006256103516, "global_step": 171705, "epoch": 4088} {"train_loss": -7.127696990966797, "global_step": 171706, "epoch": 4088} {"train_loss": -6.976458549499512, "global_step": 171707, "epoch": 4088} {"train_loss": -7.161036491394043, "global_step": 171708, "epoch": 4088} {"train_loss": -7.1513800621032715, "global_step": 171709, "epoch": 4088} {"train_loss": -7.1005048751831055, "global_step": 171710, "epoch": 4088} {"train_loss": -7.058291435241699, "global_step": 171711, "epoch": 4088} {"train_loss": -7.121467590332031, "global_step": 171712, "epoch": 4088} {"train_loss": -7.060218811035156, "global_step": 171713, "epoch": 4088} {"train_loss": -7.070220947265625, "global_step": 171714, "epoch": 4088} {"train_loss": -7.027676582336426, "global_step": 171715, "epoch": 4088} {"train_loss": -7.094444751739502, "global_step": 171716, "epoch": 4088} {"train_loss": -6.970830917358398, "global_step": 171717, "epoch": 4088} {"train_loss": -7.23694372177124, "global_step": 171718, "epoch": 4088} {"train_loss": -7.022917747497559, "global_step": 171719, "epoch": 4088} {"train_loss": -6.901635646820068, "global_step": 171720, "epoch": 4088} {"train_loss": -6.947816848754883, "global_step": 171721, "epoch": 4088} {"train_loss": -6.981149196624756, "global_step": 171722, "epoch": 4088} {"train_loss": -7.06895112991333, "global_step": 171723, "epoch": 4088} {"train_loss": -6.844604015350342, "global_step": 171724, "epoch": 4088} {"train_loss": -6.946535110473633, "global_step": 171725, "epoch": 4088} {"train_loss": -6.9642815589904785, "global_step": 171726, "epoch": 4088} {"train_loss": -6.842897415161133, "global_step": 171727, "epoch": 4088} {"train_loss": -7.06837797164917, "global_step": 171728, "epoch": 4088} {"train_loss": -6.817139148712158, "global_step": 171729, "epoch": 4088} {"train_loss": -6.86027717590332, "global_step": 171730, "epoch": 4088} {"train_loss": -7.007900238037109, "global_step": 171731, "epoch": 4088} {"train_loss": -6.953592777252197, "global_step": 171732, "epoch": 4088} {"train_loss": -7.015982627868652, "global_step": 171733, "epoch": 4088} {"train_loss": -6.924430847167969, "global_step": 171734, "epoch": 4088} {"train_loss": -6.973398208618164, "global_step": 171735, "epoch": 4088} {"train_loss": -6.997807025909424, "global_step": 171736, "epoch": 4088} {"train_loss": -7.029034659976051, "global_step": 171737, "epoch": 4088, "val_loss": 79807.0859375} {"train_loss": -7.038819313049316, "global_step": 171738, "epoch": 4089} {"train_loss": -6.921903610229492, "global_step": 171739, "epoch": 4089} {"train_loss": -6.911235332489014, "global_step": 171740, "epoch": 4089} {"train_loss": -7.012257099151611, "global_step": 171741, "epoch": 4089} {"train_loss": -6.842919826507568, "global_step": 171742, "epoch": 4089} {"train_loss": -7.048117637634277, "global_step": 171743, "epoch": 4089} {"train_loss": -7.001336097717285, "global_step": 171744, "epoch": 4089} {"train_loss": -7.05767822265625, "global_step": 171745, "epoch": 4089} {"train_loss": -7.062755584716797, "global_step": 171746, "epoch": 4089} {"train_loss": -6.923767566680908, "global_step": 171747, "epoch": 4089} {"train_loss": -7.023279666900635, "global_step": 171748, "epoch": 4089} {"train_loss": -7.103879928588867, "global_step": 171749, "epoch": 4089} {"train_loss": -7.099813461303711, "global_step": 171750, "epoch": 4089} {"train_loss": -7.038513660430908, "global_step": 171751, "epoch": 4089} {"train_loss": -7.036278247833252, "global_step": 171752, "epoch": 4089} {"train_loss": -7.029244422912598, "global_step": 171753, "epoch": 4089} {"train_loss": -6.984402656555176, "global_step": 171754, "epoch": 4089} {"train_loss": -7.107903003692627, "global_step": 171755, "epoch": 4089} {"train_loss": -6.972204208374023, "global_step": 171756, "epoch": 4089} {"train_loss": -7.049473762512207, "global_step": 171757, "epoch": 4089} {"train_loss": -7.027239799499512, "global_step": 171758, "epoch": 4089} {"train_loss": -7.025321960449219, "global_step": 171759, "epoch": 4089} {"train_loss": -6.941799163818359, "global_step": 171760, "epoch": 4089} {"train_loss": -7.03557014465332, "global_step": 171761, "epoch": 4089} {"train_loss": -7.060681343078613, "global_step": 171762, "epoch": 4089} {"train_loss": -6.919317245483398, "global_step": 171763, "epoch": 4089} {"train_loss": -7.122402667999268, "global_step": 171764, "epoch": 4089} {"train_loss": -6.963773727416992, "global_step": 171765, "epoch": 4089} {"train_loss": -6.963863372802734, "global_step": 171766, "epoch": 4089} {"train_loss": -7.01983642578125, "global_step": 171767, "epoch": 4089} {"train_loss": -6.946376800537109, "global_step": 171768, "epoch": 4089} {"train_loss": -7.118464946746826, "global_step": 171769, "epoch": 4089} {"train_loss": -6.986481666564941, "global_step": 171770, "epoch": 4089} {"train_loss": -7.032406330108643, "global_step": 171771, "epoch": 4089} {"train_loss": -7.039957523345947, "global_step": 171772, "epoch": 4089} {"train_loss": -6.959311485290527, "global_step": 171773, "epoch": 4089} {"train_loss": -7.132500648498535, "global_step": 171774, "epoch": 4089} {"train_loss": -7.078883647918701, "global_step": 171775, "epoch": 4089} {"train_loss": -7.118062496185303, "global_step": 171776, "epoch": 4089} {"train_loss": -7.1360321044921875, "global_step": 171777, "epoch": 4089} {"train_loss": -7.047011852264404, "global_step": 171778, "epoch": 4089} {"train_loss": -7.024540356227329, "global_step": 171779, "epoch": 4089, "val_loss": 79834.03125} {"train_loss": -7.111905097961426, "global_step": 171780, "epoch": 4090} {"train_loss": -7.054361343383789, "global_step": 171781, "epoch": 4090} {"train_loss": -7.174781799316406, "global_step": 171782, "epoch": 4090} {"train_loss": -7.0953288078308105, "global_step": 171783, "epoch": 4090} {"train_loss": -7.0688395500183105, "global_step": 171784, "epoch": 4090} {"train_loss": -7.092954158782959, "global_step": 171785, "epoch": 4090} {"train_loss": -7.046601295471191, "global_step": 171786, "epoch": 4090} {"train_loss": -7.0813822746276855, "global_step": 171787, "epoch": 4090} {"train_loss": -7.061067581176758, "global_step": 171788, "epoch": 4090} {"train_loss": -6.997196197509766, "global_step": 171789, "epoch": 4090} {"train_loss": -6.922482967376709, "global_step": 171790, "epoch": 4090} {"train_loss": -6.956273078918457, "global_step": 171791, "epoch": 4090} {"train_loss": -6.994404315948486, "global_step": 171792, "epoch": 4090} {"train_loss": -7.034348487854004, "global_step": 171793, "epoch": 4090} {"train_loss": -7.0566558837890625, "global_step": 171794, "epoch": 4090} {"train_loss": -7.115167617797852, "global_step": 171795, "epoch": 4090} {"train_loss": -7.037003040313721, "global_step": 171796, "epoch": 4090} {"train_loss": -7.226871490478516, "global_step": 171797, "epoch": 4090} {"train_loss": -7.048156261444092, "global_step": 171798, "epoch": 4090} {"train_loss": -7.065956115722656, "global_step": 171799, "epoch": 4090} {"train_loss": -6.996820449829102, "global_step": 171800, "epoch": 4090} {"train_loss": -7.102578163146973, "global_step": 171801, "epoch": 4090} {"train_loss": -7.001943588256836, "global_step": 171802, "epoch": 4090} {"train_loss": -6.987865447998047, "global_step": 171803, "epoch": 4090} {"train_loss": -7.060635089874268, "global_step": 171804, "epoch": 4090} {"train_loss": -7.003933906555176, "global_step": 171805, "epoch": 4090} {"train_loss": -6.999574661254883, "global_step": 171806, "epoch": 4090} {"train_loss": -7.063112258911133, "global_step": 171807, "epoch": 4090} {"train_loss": -7.014569282531738, "global_step": 171808, "epoch": 4090} {"train_loss": -7.132084846496582, "global_step": 171809, "epoch": 4090} {"train_loss": -7.019968032836914, "global_step": 171810, "epoch": 4090} {"train_loss": -6.926616191864014, "global_step": 171811, "epoch": 4090} {"train_loss": -7.031384468078613, "global_step": 171812, "epoch": 4090} {"train_loss": -6.854369163513184, "global_step": 171813, "epoch": 4090} {"train_loss": -6.977297306060791, "global_step": 171814, "epoch": 4090} {"train_loss": -7.107285499572754, "global_step": 171815, "epoch": 4090} {"train_loss": -6.928704738616943, "global_step": 171816, "epoch": 4090} {"train_loss": -7.205236434936523, "global_step": 171817, "epoch": 4090} {"train_loss": -7.015109062194824, "global_step": 171818, "epoch": 4090} {"train_loss": -7.109590530395508, "global_step": 171819, "epoch": 4090} {"train_loss": -7.061340808868408, "global_step": 171820, "epoch": 4090} {"train_loss": -7.044254904701596, "global_step": 171821, "epoch": 4090, "val_loss": 80147.2578125} {"train_loss": -6.974207878112793, "global_step": 171822, "epoch": 4091} {"train_loss": -7.1127729415893555, "global_step": 171823, "epoch": 4091} {"train_loss": -7.15293025970459, "global_step": 171824, "epoch": 4091} {"train_loss": -7.118030548095703, "global_step": 171825, "epoch": 4091} {"train_loss": -7.094536781311035, "global_step": 171826, "epoch": 4091} {"train_loss": -7.0647783279418945, "global_step": 171827, "epoch": 4091} {"train_loss": -7.079833507537842, "global_step": 171828, "epoch": 4091} {"train_loss": -7.12603759765625, "global_step": 171829, "epoch": 4091} {"train_loss": -7.100620269775391, "global_step": 171830, "epoch": 4091} {"train_loss": -7.170375823974609, "global_step": 171831, "epoch": 4091} {"train_loss": -7.036123275756836, "global_step": 171832, "epoch": 4091} {"train_loss": -7.0665388107299805, "global_step": 171833, "epoch": 4091} {"train_loss": -6.942590236663818, "global_step": 171834, "epoch": 4091} {"train_loss": -7.099989891052246, "global_step": 171835, "epoch": 4091} {"train_loss": -7.084321975708008, "global_step": 171836, "epoch": 4091} {"train_loss": -7.013911724090576, "global_step": 171837, "epoch": 4091} {"train_loss": -7.054558753967285, "global_step": 171838, "epoch": 4091} {"train_loss": -7.069775581359863, "global_step": 171839, "epoch": 4091} {"train_loss": -7.214841842651367, "global_step": 171840, "epoch": 4091} {"train_loss": -7.018239974975586, "global_step": 171841, "epoch": 4091} {"train_loss": -6.916980743408203, "global_step": 171842, "epoch": 4091} {"train_loss": -7.05418586730957, "global_step": 171843, "epoch": 4091} {"train_loss": -6.944697380065918, "global_step": 171844, "epoch": 4091} {"train_loss": -6.980887413024902, "global_step": 171845, "epoch": 4091} {"train_loss": -7.023991584777832, "global_step": 171846, "epoch": 4091} {"train_loss": -7.114165306091309, "global_step": 171847, "epoch": 4091} {"train_loss": -7.1150617599487305, "global_step": 171848, "epoch": 4091} {"train_loss": -7.097978591918945, "global_step": 171849, "epoch": 4091} {"train_loss": -7.113689422607422, "global_step": 171850, "epoch": 4091} {"train_loss": -7.095109462738037, "global_step": 171851, "epoch": 4091} {"train_loss": -7.133500099182129, "global_step": 171852, "epoch": 4091} {"train_loss": -6.985359191894531, "global_step": 171853, "epoch": 4091} {"train_loss": -7.025968551635742, "global_step": 171854, "epoch": 4091} {"train_loss": -7.084775924682617, "global_step": 171855, "epoch": 4091} {"train_loss": -7.046187877655029, "global_step": 171856, "epoch": 4091} {"train_loss": -7.115012168884277, "global_step": 171857, "epoch": 4091} {"train_loss": -6.929211616516113, "global_step": 171858, "epoch": 4091} {"train_loss": -7.106233596801758, "global_step": 171859, "epoch": 4091} {"train_loss": -6.886954307556152, "global_step": 171860, "epoch": 4091} {"train_loss": -6.962628364562988, "global_step": 171861, "epoch": 4091} {"train_loss": -7.083951950073242, "global_step": 171862, "epoch": 4091} {"train_loss": -7.051422357559204, "global_step": 171863, "epoch": 4091, "val_loss": 79717.2890625} {"train_loss": -6.8788862228393555, "global_step": 171864, "epoch": 4092} {"train_loss": -7.073020935058594, "global_step": 171865, "epoch": 4092} {"train_loss": -6.890341281890869, "global_step": 171866, "epoch": 4092} {"train_loss": -6.97813606262207, "global_step": 171867, "epoch": 4092} {"train_loss": -6.85680627822876, "global_step": 171868, "epoch": 4092} {"train_loss": -6.92598819732666, "global_step": 171869, "epoch": 4092} {"train_loss": -6.900555610656738, "global_step": 171870, "epoch": 4092} {"train_loss": -6.954525947570801, "global_step": 171871, "epoch": 4092} {"train_loss": -6.986732482910156, "global_step": 171872, "epoch": 4092} {"train_loss": -6.960085868835449, "global_step": 171873, "epoch": 4092} {"train_loss": -7.080813407897949, "global_step": 171874, "epoch": 4092} {"train_loss": -6.997768402099609, "global_step": 171875, "epoch": 4092} {"train_loss": -6.951966762542725, "global_step": 171876, "epoch": 4092} {"train_loss": -7.058586120605469, "global_step": 171877, "epoch": 4092} {"train_loss": -7.077619552612305, "global_step": 171878, "epoch": 4092} {"train_loss": -7.029366970062256, "global_step": 171879, "epoch": 4092} {"train_loss": -6.952965259552002, "global_step": 171880, "epoch": 4092} {"train_loss": -7.060429573059082, "global_step": 171881, "epoch": 4092} {"train_loss": -7.040104866027832, "global_step": 171882, "epoch": 4092} {"train_loss": -7.092369079589844, "global_step": 171883, "epoch": 4092} {"train_loss": -7.047691345214844, "global_step": 171884, "epoch": 4092} {"train_loss": -7.1510910987854, "global_step": 171885, "epoch": 4092} {"train_loss": -7.054361820220947, "global_step": 171886, "epoch": 4092} {"train_loss": -7.097021102905273, "global_step": 171887, "epoch": 4092} {"train_loss": -7.007771968841553, "global_step": 171888, "epoch": 4092} {"train_loss": -7.034989356994629, "global_step": 171889, "epoch": 4092} {"train_loss": -7.170356750488281, "global_step": 171890, "epoch": 4092} {"train_loss": -6.9840850830078125, "global_step": 171891, "epoch": 4092} {"train_loss": -7.103067398071289, "global_step": 171892, "epoch": 4092} {"train_loss": -7.049341678619385, "global_step": 171893, "epoch": 4092} {"train_loss": -7.089367389678955, "global_step": 171894, "epoch": 4092} {"train_loss": -7.134100914001465, "global_step": 171895, "epoch": 4092} {"train_loss": -7.068422317504883, "global_step": 171896, "epoch": 4092} {"train_loss": -7.119963645935059, "global_step": 171897, "epoch": 4092} {"train_loss": -7.160556793212891, "global_step": 171898, "epoch": 4092} {"train_loss": -7.069489479064941, "global_step": 171899, "epoch": 4092} {"train_loss": -6.954221248626709, "global_step": 171900, "epoch": 4092} {"train_loss": -7.040670871734619, "global_step": 171901, "epoch": 4092} {"train_loss": -7.138450622558594, "global_step": 171902, "epoch": 4092} {"train_loss": -6.932376861572266, "global_step": 171903, "epoch": 4092} {"train_loss": -6.999921798706055, "global_step": 171904, "epoch": 4092} {"train_loss": -7.028937941505795, "global_step": 171905, "epoch": 4092, "val_loss": 79786.484375} {"train_loss": -7.114358901977539, "global_step": 171906, "epoch": 4093} {"train_loss": -6.931967735290527, "global_step": 171907, "epoch": 4093} {"train_loss": -7.096801280975342, "global_step": 171908, "epoch": 4093} {"train_loss": -7.065414905548096, "global_step": 171909, "epoch": 4093} {"train_loss": -6.950088977813721, "global_step": 171910, "epoch": 4093} {"train_loss": -7.058882236480713, "global_step": 171911, "epoch": 4093} {"train_loss": -7.035428524017334, "global_step": 171912, "epoch": 4093} {"train_loss": -6.9649763107299805, "global_step": 171913, "epoch": 4093} {"train_loss": -6.995359420776367, "global_step": 171914, "epoch": 4093} {"train_loss": -6.839201927185059, "global_step": 171915, "epoch": 4093} {"train_loss": -6.958157539367676, "global_step": 171916, "epoch": 4093} {"train_loss": -6.959835052490234, "global_step": 171917, "epoch": 4093} {"train_loss": -7.143232822418213, "global_step": 171918, "epoch": 4093} {"train_loss": -6.938211441040039, "global_step": 171919, "epoch": 4093} {"train_loss": -6.996254920959473, "global_step": 171920, "epoch": 4093} {"train_loss": -6.99006462097168, "global_step": 171921, "epoch": 4093} {"train_loss": -7.065593242645264, "global_step": 171922, "epoch": 4093} {"train_loss": -6.952086448669434, "global_step": 171923, "epoch": 4093} {"train_loss": -6.8510308265686035, "global_step": 171924, "epoch": 4093} {"train_loss": -7.009420394897461, "global_step": 171925, "epoch": 4093} {"train_loss": -7.005304336547852, "global_step": 171926, "epoch": 4093} {"train_loss": -6.973470211029053, "global_step": 171927, "epoch": 4093} {"train_loss": -6.959412574768066, "global_step": 171928, "epoch": 4093} {"train_loss": -6.926969528198242, "global_step": 171929, "epoch": 4093} {"train_loss": -6.994068145751953, "global_step": 171930, "epoch": 4093} {"train_loss": -6.956445693969727, "global_step": 171931, "epoch": 4093} {"train_loss": -6.9559783935546875, "global_step": 171932, "epoch": 4093} {"train_loss": -6.977917194366455, "global_step": 171933, "epoch": 4093} {"train_loss": -6.918482780456543, "global_step": 171934, "epoch": 4093} {"train_loss": -7.012561321258545, "global_step": 171935, "epoch": 4093} {"train_loss": -7.018489360809326, "global_step": 171936, "epoch": 4093} {"train_loss": -7.043830871582031, "global_step": 171937, "epoch": 4093} {"train_loss": -6.959828853607178, "global_step": 171938, "epoch": 4093} {"train_loss": -7.0736541748046875, "global_step": 171939, "epoch": 4093} {"train_loss": -6.9054155349731445, "global_step": 171940, "epoch": 4093} {"train_loss": -7.074582576751709, "global_step": 171941, "epoch": 4093} {"train_loss": -7.109828948974609, "global_step": 171942, "epoch": 4093} {"train_loss": -7.032651424407959, "global_step": 171943, "epoch": 4093} {"train_loss": -6.9300384521484375, "global_step": 171944, "epoch": 4093} {"train_loss": -6.9903564453125, "global_step": 171945, "epoch": 4093} {"train_loss": -6.999011993408203, "global_step": 171946, "epoch": 4093} {"train_loss": -6.995483602796282, "global_step": 171947, "epoch": 4093, "val_loss": 79924.453125} {"train_loss": -7.130699157714844, "global_step": 171948, "epoch": 4094} {"train_loss": -7.094768524169922, "global_step": 171949, "epoch": 4094} {"train_loss": -7.152261257171631, "global_step": 171950, "epoch": 4094} {"train_loss": -6.994920253753662, "global_step": 171951, "epoch": 4094} {"train_loss": -7.08546781539917, "global_step": 171952, "epoch": 4094} {"train_loss": -7.053544998168945, "global_step": 171953, "epoch": 4094} {"train_loss": -7.073543548583984, "global_step": 171954, "epoch": 4094} {"train_loss": -7.077402114868164, "global_step": 171955, "epoch": 4094} {"train_loss": -7.014720916748047, "global_step": 171956, "epoch": 4094} {"train_loss": -7.009890556335449, "global_step": 171957, "epoch": 4094} {"train_loss": -7.086567401885986, "global_step": 171958, "epoch": 4094} {"train_loss": -7.080234527587891, "global_step": 171959, "epoch": 4094} {"train_loss": -7.0975751876831055, "global_step": 171960, "epoch": 4094} {"train_loss": -7.05634069442749, "global_step": 171961, "epoch": 4094} {"train_loss": -6.956258773803711, "global_step": 171962, "epoch": 4094} {"train_loss": -7.101130485534668, "global_step": 171963, "epoch": 4094} {"train_loss": -7.103004455566406, "global_step": 171964, "epoch": 4094} {"train_loss": -7.104758262634277, "global_step": 171965, "epoch": 4094} {"train_loss": -7.044289588928223, "global_step": 171966, "epoch": 4094} {"train_loss": -7.163098335266113, "global_step": 171967, "epoch": 4094} {"train_loss": -7.0260210037231445, "global_step": 171968, "epoch": 4094} {"train_loss": -7.090198993682861, "global_step": 171969, "epoch": 4094} {"train_loss": -6.923276901245117, "global_step": 171970, "epoch": 4094} {"train_loss": -7.10275411605835, "global_step": 171971, "epoch": 4094} {"train_loss": -7.055489540100098, "global_step": 171972, "epoch": 4094} {"train_loss": -7.094249248504639, "global_step": 171973, "epoch": 4094} {"train_loss": -7.104504585266113, "global_step": 171974, "epoch": 4094} {"train_loss": -7.087446689605713, "global_step": 171975, "epoch": 4094} {"train_loss": -7.037198543548584, "global_step": 171976, "epoch": 4094} {"train_loss": -7.065210819244385, "global_step": 171977, "epoch": 4094} {"train_loss": -6.993776321411133, "global_step": 171978, "epoch": 4094} {"train_loss": -7.116247653961182, "global_step": 171979, "epoch": 4094} {"train_loss": -7.013766288757324, "global_step": 171980, "epoch": 4094} {"train_loss": -6.995974540710449, "global_step": 171981, "epoch": 4094} {"train_loss": -7.003375053405762, "global_step": 171982, "epoch": 4094} {"train_loss": -7.078761577606201, "global_step": 171983, "epoch": 4094} {"train_loss": -7.175994873046875, "global_step": 171984, "epoch": 4094} {"train_loss": -7.026062965393066, "global_step": 171985, "epoch": 4094} {"train_loss": -7.074954032897949, "global_step": 171986, "epoch": 4094} {"train_loss": -7.041101932525635, "global_step": 171987, "epoch": 4094} {"train_loss": -7.0064191818237305, "global_step": 171988, "epoch": 4094} {"train_loss": -7.060403619493757, "global_step": 171989, "epoch": 4094, "val_loss": 79877.2890625} {"train_loss": -7.149417877197266, "global_step": 171990, "epoch": 4095} {"train_loss": -7.185118675231934, "global_step": 171991, "epoch": 4095} {"train_loss": -7.096826553344727, "global_step": 171992, "epoch": 4095} {"train_loss": -7.027482986450195, "global_step": 171993, "epoch": 4095} {"train_loss": -7.077929973602295, "global_step": 171994, "epoch": 4095} {"train_loss": -7.109889984130859, "global_step": 171995, "epoch": 4095} {"train_loss": -7.076581001281738, "global_step": 171996, "epoch": 4095} {"train_loss": -7.057352066040039, "global_step": 171997, "epoch": 4095} {"train_loss": -7.057456970214844, "global_step": 171998, "epoch": 4095} {"train_loss": -7.136593818664551, "global_step": 171999, "epoch": 4095} {"train_loss": -7.014358043670654, "global_step": 172000, "epoch": 4095} {"train_loss": -7.050469875335693, "global_step": 172001, "epoch": 4095} {"train_loss": -7.165571212768555, "global_step": 172002, "epoch": 4095} {"train_loss": -6.973023414611816, "global_step": 172003, "epoch": 4095} {"train_loss": -7.0079264640808105, "global_step": 172004, "epoch": 4095} {"train_loss": -7.157173156738281, "global_step": 172005, "epoch": 4095} {"train_loss": -7.096526145935059, "global_step": 172006, "epoch": 4095} {"train_loss": -7.103490829467773, "global_step": 172007, "epoch": 4095} {"train_loss": -6.9956464767456055, "global_step": 172008, "epoch": 4095} {"train_loss": -7.030396461486816, "global_step": 172009, "epoch": 4095} {"train_loss": -7.110203742980957, "global_step": 172010, "epoch": 4095} {"train_loss": -7.072018623352051, "global_step": 172011, "epoch": 4095} {"train_loss": -6.975785255432129, "global_step": 172012, "epoch": 4095} {"train_loss": -7.141562461853027, "global_step": 172013, "epoch": 4095} {"train_loss": -7.1179280281066895, "global_step": 172014, "epoch": 4095} {"train_loss": -6.998438835144043, "global_step": 172015, "epoch": 4095} {"train_loss": -7.135795593261719, "global_step": 172016, "epoch": 4095} {"train_loss": -7.039257049560547, "global_step": 172017, "epoch": 4095} {"train_loss": -7.06668758392334, "global_step": 172018, "epoch": 4095} {"train_loss": -7.083927631378174, "global_step": 172019, "epoch": 4095} {"train_loss": -7.060238361358643, "global_step": 172020, "epoch": 4095} {"train_loss": -7.131669998168945, "global_step": 172021, "epoch": 4095} {"train_loss": -7.033755779266357, "global_step": 172022, "epoch": 4095} {"train_loss": -7.064536094665527, "global_step": 172023, "epoch": 4095} {"train_loss": -6.977999687194824, "global_step": 172024, "epoch": 4095} {"train_loss": -7.146470069885254, "global_step": 172025, "epoch": 4095} {"train_loss": -7.178918838500977, "global_step": 172026, "epoch": 4095} {"train_loss": -7.130987167358398, "global_step": 172027, "epoch": 4095} {"train_loss": -7.0535125732421875, "global_step": 172028, "epoch": 4095} {"train_loss": -7.066771984100342, "global_step": 172029, "epoch": 4095} {"train_loss": -6.94642448425293, "global_step": 172030, "epoch": 4095} {"train_loss": -7.072241226832072, "global_step": 172031, "epoch": 4095, "val_loss": 79743.546875} {"train_loss": -7.050925254821777, "global_step": 172032, "epoch": 4096} {"train_loss": -6.986390113830566, "global_step": 172033, "epoch": 4096} {"train_loss": -7.050025939941406, "global_step": 172034, "epoch": 4096} {"train_loss": -7.054001808166504, "global_step": 172035, "epoch": 4096} {"train_loss": -6.961238861083984, "global_step": 172036, "epoch": 4096} {"train_loss": -7.018423080444336, "global_step": 172037, "epoch": 4096} {"train_loss": -6.9595046043396, "global_step": 172038, "epoch": 4096} {"train_loss": -7.066741466522217, "global_step": 172039, "epoch": 4096} {"train_loss": -7.032235145568848, "global_step": 172040, "epoch": 4096} {"train_loss": -6.996526718139648, "global_step": 172041, "epoch": 4096} {"train_loss": -7.0571136474609375, "global_step": 172042, "epoch": 4096} {"train_loss": -7.087642669677734, "global_step": 172043, "epoch": 4096} {"train_loss": -7.037519454956055, "global_step": 172044, "epoch": 4096} {"train_loss": -7.091890811920166, "global_step": 172045, "epoch": 4096} {"train_loss": -7.087255001068115, "global_step": 172046, "epoch": 4096} {"train_loss": -7.036646842956543, "global_step": 172047, "epoch": 4096} {"train_loss": -6.945764064788818, "global_step": 172048, "epoch": 4096} {"train_loss": -6.919150352478027, "global_step": 172049, "epoch": 4096} {"train_loss": -7.013396263122559, "global_step": 172050, "epoch": 4096} {"train_loss": -7.028525352478027, "global_step": 172051, "epoch": 4096} {"train_loss": -7.034595012664795, "global_step": 172052, "epoch": 4096} {"train_loss": -7.041611194610596, "global_step": 172053, "epoch": 4096} {"train_loss": -7.138371467590332, "global_step": 172054, "epoch": 4096} {"train_loss": -7.027575492858887, "global_step": 172055, "epoch": 4096} {"train_loss": -7.010861396789551, "global_step": 172056, "epoch": 4096} {"train_loss": -7.064388275146484, "global_step": 172057, "epoch": 4096} {"train_loss": -7.1154632568359375, "global_step": 172058, "epoch": 4096} {"train_loss": -7.081852912902832, "global_step": 172059, "epoch": 4096} {"train_loss": -7.092434883117676, "global_step": 172060, "epoch": 4096} {"train_loss": -7.038259983062744, "global_step": 172061, "epoch": 4096} {"train_loss": -7.190440654754639, "global_step": 172062, "epoch": 4096} {"train_loss": -7.146585464477539, "global_step": 172063, "epoch": 4096} {"train_loss": -7.122711181640625, "global_step": 172064, "epoch": 4096} {"train_loss": -7.210310459136963, "global_step": 172065, "epoch": 4096} {"train_loss": -7.04611873626709, "global_step": 172066, "epoch": 4096} {"train_loss": -7.101951599121094, "global_step": 172067, "epoch": 4096} {"train_loss": -7.190074920654297, "global_step": 172068, "epoch": 4096} {"train_loss": -7.114568710327148, "global_step": 172069, "epoch": 4096} {"train_loss": -7.090108871459961, "global_step": 172070, "epoch": 4096} {"train_loss": -7.059556484222412, "global_step": 172071, "epoch": 4096} {"train_loss": -7.150463104248047, "global_step": 172072, "epoch": 4096} {"train_loss": -7.063225428263347, "global_step": 172073, "epoch": 4096, "val_loss": 80029.390625} {"train_loss": -7.113707542419434, "global_step": 172074, "epoch": 4097} {"train_loss": -7.10166072845459, "global_step": 172075, "epoch": 4097} {"train_loss": -7.158022880554199, "global_step": 172076, "epoch": 4097} {"train_loss": -7.1386799812316895, "global_step": 172077, "epoch": 4097} {"train_loss": -7.004725933074951, "global_step": 172078, "epoch": 4097} {"train_loss": -7.029524326324463, "global_step": 172079, "epoch": 4097} {"train_loss": -7.212124824523926, "global_step": 172080, "epoch": 4097} {"train_loss": -6.9861063957214355, "global_step": 172081, "epoch": 4097} {"train_loss": -7.012737274169922, "global_step": 172082, "epoch": 4097} {"train_loss": -7.210318565368652, "global_step": 172083, "epoch": 4097} {"train_loss": -7.023838520050049, "global_step": 172084, "epoch": 4097} {"train_loss": -7.086913108825684, "global_step": 172085, "epoch": 4097} {"train_loss": -7.060672760009766, "global_step": 172086, "epoch": 4097} {"train_loss": -7.148791313171387, "global_step": 172087, "epoch": 4097} {"train_loss": -7.040937423706055, "global_step": 172088, "epoch": 4097} {"train_loss": -7.093885898590088, "global_step": 172089, "epoch": 4097} {"train_loss": -6.8539018630981445, "global_step": 172090, "epoch": 4097} {"train_loss": -6.966727256774902, "global_step": 172091, "epoch": 4097} {"train_loss": -7.158913612365723, "global_step": 172092, "epoch": 4097} {"train_loss": -6.966102600097656, "global_step": 172093, "epoch": 4097} {"train_loss": -7.039620399475098, "global_step": 172094, "epoch": 4097} {"train_loss": -7.065400123596191, "global_step": 172095, "epoch": 4097} {"train_loss": -7.102989196777344, "global_step": 172096, "epoch": 4097} {"train_loss": -7.171265602111816, "global_step": 172097, "epoch": 4097} {"train_loss": -7.036501884460449, "global_step": 172098, "epoch": 4097} {"train_loss": -7.011775016784668, "global_step": 172099, "epoch": 4097} {"train_loss": -7.087423324584961, "global_step": 172100, "epoch": 4097} {"train_loss": -7.02744197845459, "global_step": 172101, "epoch": 4097} {"train_loss": -7.079527854919434, "global_step": 172102, "epoch": 4097} {"train_loss": -6.960747718811035, "global_step": 172103, "epoch": 4097} {"train_loss": -7.198925018310547, "global_step": 172104, "epoch": 4097} {"train_loss": -7.1212263107299805, "global_step": 172105, "epoch": 4097} {"train_loss": -7.0825910568237305, "global_step": 172106, "epoch": 4097} {"train_loss": -7.118626117706299, "global_step": 172107, "epoch": 4097} {"train_loss": -7.158596038818359, "global_step": 172108, "epoch": 4097} {"train_loss": -7.0721435546875, "global_step": 172109, "epoch": 4097} {"train_loss": -7.090398788452148, "global_step": 172110, "epoch": 4097} {"train_loss": -7.038471221923828, "global_step": 172111, "epoch": 4097} {"train_loss": -7.013450622558594, "global_step": 172112, "epoch": 4097} {"train_loss": -7.048956871032715, "global_step": 172113, "epoch": 4097} {"train_loss": -7.059645175933838, "global_step": 172114, "epoch": 4097} {"train_loss": -7.071128777095249, "global_step": 172115, "epoch": 4097, "val_loss": 79978.484375} {"train_loss": -7.129329681396484, "global_step": 172116, "epoch": 4098} {"train_loss": -7.161143779754639, "global_step": 172117, "epoch": 4098} {"train_loss": -7.011613845825195, "global_step": 172118, "epoch": 4098} {"train_loss": -7.143704414367676, "global_step": 172119, "epoch": 4098} {"train_loss": -7.097022533416748, "global_step": 172120, "epoch": 4098} {"train_loss": -7.0731940269470215, "global_step": 172121, "epoch": 4098} {"train_loss": -7.163125038146973, "global_step": 172122, "epoch": 4098} {"train_loss": -7.1446533203125, "global_step": 172123, "epoch": 4098} {"train_loss": -7.090765476226807, "global_step": 172124, "epoch": 4098} {"train_loss": -7.096969127655029, "global_step": 172125, "epoch": 4098} {"train_loss": -7.117640495300293, "global_step": 172126, "epoch": 4098} {"train_loss": -7.048050403594971, "global_step": 172127, "epoch": 4098} {"train_loss": -7.08525276184082, "global_step": 172128, "epoch": 4098} {"train_loss": -7.025985240936279, "global_step": 172129, "epoch": 4098} {"train_loss": -7.100964546203613, "global_step": 172130, "epoch": 4098} {"train_loss": -7.063870429992676, "global_step": 172131, "epoch": 4098} {"train_loss": -6.982488632202148, "global_step": 172132, "epoch": 4098} {"train_loss": -6.966052055358887, "global_step": 172133, "epoch": 4098} {"train_loss": -7.078973770141602, "global_step": 172134, "epoch": 4098} {"train_loss": -7.037599086761475, "global_step": 172135, "epoch": 4098} {"train_loss": -7.1077117919921875, "global_step": 172136, "epoch": 4098} {"train_loss": -7.1261677742004395, "global_step": 172137, "epoch": 4098} {"train_loss": -7.083848476409912, "global_step": 172138, "epoch": 4098} {"train_loss": -7.057016372680664, "global_step": 172139, "epoch": 4098} {"train_loss": -7.053544521331787, "global_step": 172140, "epoch": 4098} {"train_loss": -7.002370834350586, "global_step": 172141, "epoch": 4098} {"train_loss": -7.105313301086426, "global_step": 172142, "epoch": 4098} {"train_loss": -6.9612250328063965, "global_step": 172143, "epoch": 4098} {"train_loss": -6.9028754234313965, "global_step": 172144, "epoch": 4098} {"train_loss": -6.966975212097168, "global_step": 172145, "epoch": 4098} {"train_loss": -7.0115790367126465, "global_step": 172146, "epoch": 4098} {"train_loss": -7.061566352844238, "global_step": 172147, "epoch": 4098} {"train_loss": -7.037822246551514, "global_step": 172148, "epoch": 4098} {"train_loss": -6.837224960327148, "global_step": 172149, "epoch": 4098} {"train_loss": -7.0113325119018555, "global_step": 172150, "epoch": 4098} {"train_loss": -6.996291160583496, "global_step": 172151, "epoch": 4098} {"train_loss": -7.0360307693481445, "global_step": 172152, "epoch": 4098} {"train_loss": -7.00715970993042, "global_step": 172153, "epoch": 4098} {"train_loss": -6.994038105010986, "global_step": 172154, "epoch": 4098} {"train_loss": -6.981420040130615, "global_step": 172155, "epoch": 4098} {"train_loss": -7.0088043212890625, "global_step": 172156, "epoch": 4098} {"train_loss": -7.047060319355556, "global_step": 172157, "epoch": 4098, "val_loss": 80180.1484375} {"train_loss": -7.010117530822754, "global_step": 172158, "epoch": 4099} {"train_loss": -6.982058525085449, "global_step": 172159, "epoch": 4099} {"train_loss": -6.989527225494385, "global_step": 172160, "epoch": 4099} {"train_loss": -6.924015045166016, "global_step": 172161, "epoch": 4099} {"train_loss": -7.04984712600708, "global_step": 172162, "epoch": 4099} {"train_loss": -7.0540900230407715, "global_step": 172163, "epoch": 4099} {"train_loss": -6.958101272583008, "global_step": 172164, "epoch": 4099} {"train_loss": -7.05607795715332, "global_step": 172165, "epoch": 4099} {"train_loss": -6.940645217895508, "global_step": 172166, "epoch": 4099} {"train_loss": -7.027941703796387, "global_step": 172167, "epoch": 4099} {"train_loss": -7.011438369750977, "global_step": 172168, "epoch": 4099} {"train_loss": -7.10280179977417, "global_step": 172169, "epoch": 4099} {"train_loss": -6.884571075439453, "global_step": 172170, "epoch": 4099} {"train_loss": -7.018217086791992, "global_step": 172171, "epoch": 4099} {"train_loss": -6.947633266448975, "global_step": 172172, "epoch": 4099} {"train_loss": -7.054910659790039, "global_step": 172173, "epoch": 4099} {"train_loss": -6.997646808624268, "global_step": 172174, "epoch": 4099} {"train_loss": -7.041265487670898, "global_step": 172175, "epoch": 4099} {"train_loss": -6.9904069900512695, "global_step": 172176, "epoch": 4099} {"train_loss": -7.014288425445557, "global_step": 172177, "epoch": 4099} {"train_loss": -7.091338634490967, "global_step": 172178, "epoch": 4099} {"train_loss": -6.933775424957275, "global_step": 172179, "epoch": 4099} {"train_loss": -7.120039939880371, "global_step": 172180, "epoch": 4099} {"train_loss": -7.070404052734375, "global_step": 172181, "epoch": 4099} {"train_loss": -7.082526206970215, "global_step": 172182, "epoch": 4099} {"train_loss": -6.968996524810791, "global_step": 172183, "epoch": 4099} {"train_loss": -7.038640022277832, "global_step": 172184, "epoch": 4099} {"train_loss": -7.117869853973389, "global_step": 172185, "epoch": 4099} {"train_loss": -7.067300796508789, "global_step": 172186, "epoch": 4099} {"train_loss": -7.127013206481934, "global_step": 172187, "epoch": 4099} {"train_loss": -6.959481239318848, "global_step": 172188, "epoch": 4099} {"train_loss": -7.1537628173828125, "global_step": 172189, "epoch": 4099} {"train_loss": -7.126631259918213, "global_step": 172190, "epoch": 4099} {"train_loss": -7.044675827026367, "global_step": 172191, "epoch": 4099} {"train_loss": -7.073160171508789, "global_step": 172192, "epoch": 4099} {"train_loss": -7.1646270751953125, "global_step": 172193, "epoch": 4099} {"train_loss": -7.107942581176758, "global_step": 172194, "epoch": 4099} {"train_loss": -7.091721057891846, "global_step": 172195, "epoch": 4099} {"train_loss": -7.068044185638428, "global_step": 172196, "epoch": 4099} {"train_loss": -7.048858642578125, "global_step": 172197, "epoch": 4099} {"train_loss": -7.084501266479492, "global_step": 172198, "epoch": 4099} {"train_loss": -7.039149522781372, "global_step": 172199, "epoch": 4099, "val_loss": 79973.859375} {"train_loss": -7.084375381469727, "global_step": 172200, "epoch": 4100} {"train_loss": -7.155054092407227, "global_step": 172201, "epoch": 4100} {"train_loss": -7.008391380310059, "global_step": 172202, "epoch": 4100} {"train_loss": -7.083190441131592, "global_step": 172203, "epoch": 4100} {"train_loss": -7.08964729309082, "global_step": 172204, "epoch": 4100} {"train_loss": -6.995419025421143, "global_step": 172205, "epoch": 4100} {"train_loss": -7.053203582763672, "global_step": 172206, "epoch": 4100} {"train_loss": -7.003939628601074, "global_step": 172207, "epoch": 4100} {"train_loss": -7.122237682342529, "global_step": 172208, "epoch": 4100} {"train_loss": -7.024656295776367, "global_step": 172209, "epoch": 4100} {"train_loss": -6.927728652954102, "global_step": 172210, "epoch": 4100} {"train_loss": -6.942789077758789, "global_step": 172211, "epoch": 4100} {"train_loss": -6.868517875671387, "global_step": 172212, "epoch": 4100} {"train_loss": -7.013454914093018, "global_step": 172213, "epoch": 4100} {"train_loss": -6.86254358291626, "global_step": 172214, "epoch": 4100} {"train_loss": -7.177273750305176, "global_step": 172215, "epoch": 4100} {"train_loss": -7.090754985809326, "global_step": 172216, "epoch": 4100} {"train_loss": -6.964387893676758, "global_step": 172217, "epoch": 4100} {"train_loss": -7.0707244873046875, "global_step": 172218, "epoch": 4100} {"train_loss": -7.080132484436035, "global_step": 172219, "epoch": 4100} {"train_loss": -7.0882954597473145, "global_step": 172220, "epoch": 4100} {"train_loss": -7.055366516113281, "global_step": 172221, "epoch": 4100} {"train_loss": -7.054793834686279, "global_step": 172222, "epoch": 4100} {"train_loss": -7.038912296295166, "global_step": 172223, "epoch": 4100} {"train_loss": -7.0216193199157715, "global_step": 172224, "epoch": 4100} {"train_loss": -7.003036975860596, "global_step": 172225, "epoch": 4100} {"train_loss": -7.092979907989502, "global_step": 172226, "epoch": 4100} {"train_loss": -7.040506362915039, "global_step": 172227, "epoch": 4100} {"train_loss": -7.010858058929443, "global_step": 172228, "epoch": 4100} {"train_loss": -7.085901737213135, "global_step": 172229, "epoch": 4100} {"train_loss": -7.085357666015625, "global_step": 172230, "epoch": 4100} {"train_loss": -7.068461894989014, "global_step": 172231, "epoch": 4100} {"train_loss": -6.992217063903809, "global_step": 172232, "epoch": 4100} {"train_loss": -7.037818908691406, "global_step": 172233, "epoch": 4100} {"train_loss": -7.123300552368164, "global_step": 172234, "epoch": 4100} {"train_loss": -7.092090129852295, "global_step": 172235, "epoch": 4100} {"train_loss": -7.188015937805176, "global_step": 172236, "epoch": 4100} {"train_loss": -7.1354289054870605, "global_step": 172237, "epoch": 4100} {"train_loss": -7.135870933532715, "global_step": 172238, "epoch": 4100} {"train_loss": -7.141502380371094, "global_step": 172239, "epoch": 4100} {"train_loss": -7.169721603393555, "global_step": 172240, "epoch": 4100} {"train_loss": -7.05374162537711, "global_step": 172241, "epoch": 4100, "train/sim_max_reward_0": 0.19832928115799314, "train/sim_max_reward_1": 0.8918402105605646, "train/sim_max_reward_2": 0.3636473465368283, "train/sim_max_reward_3": 0.1364212790310955, "train/sim_max_reward_4": 0.32355509657049714, "train/sim_max_reward_5": 0.5672263481341414, "test/sim_max_reward_4500000": 0.9585494899825665, "test/sim_max_reward_4500001": 0.9614670804256003, "test/sim_max_reward_4500002": 0.995786240312368, "test/sim_max_reward_4500003": 0.9583534030775877, "test/sim_max_reward_4500004": 0.24571829765754613, "test/sim_max_reward_4500005": 0.9893566986953569, "test/sim_max_reward_4500006": 0.9525120621410885, "test/sim_max_reward_4500007": 0.9945583771403794, "test/sim_max_reward_4500008": 0.42041398661990625, "test/sim_max_reward_4500009": 0.05318760850326925, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9970700932977774, "test/sim_max_reward_4500012": 0.9824892985580764, "test/sim_max_reward_4500013": 0.0028357732037462605, "test/sim_max_reward_4500014": 0.7448660731869695, "test/sim_max_reward_4500015": 0.9710025525673863, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.09937181038695485, "test/sim_max_reward_4500018": 0.9891202340816374, "test/sim_max_reward_4500019": 0.956261399405966, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8620399972477901, "test/sim_max_reward_4500022": 0.9962385418148857, "test/sim_max_reward_4500023": 0.8621960679830106, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9404017835481757, "test/sim_max_reward_4500026": 0.9220083358589597, "test/sim_max_reward_4500027": 0.9872826668957295, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.11364525477199777, "test/sim_max_reward_4500030": 0.8892191663051823, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.04670993405069667, "test/sim_max_reward_4500033": 0.9532003034292791, "test/sim_max_reward_4500034": 0.8980417644163786, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 0.9763043903355746, "test/sim_max_reward_4500037": 0.905588747239501, "test/sim_max_reward_4500038": 0.3254403693392803, "test/sim_max_reward_4500039": 1.0, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.9782283185681734, "test/sim_max_reward_4500042": 0.061575802235446966, "test/sim_max_reward_4500043": 0.9425300216906539, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9021227090216346, "test/sim_max_reward_4500046": 0.23449537791406352, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9317774210481868, "test/sim_max_reward_4500049": 0.87285255731563, "train/mean_score": 0.41350326033185336, "test/mean_score": 0.6416108325543135, "val_loss": 79918.3125} {"train_loss": -7.155179977416992, "global_step": 172242, "epoch": 4101} {"train_loss": -7.180384159088135, "global_step": 172243, "epoch": 4101} {"train_loss": -7.116691589355469, "global_step": 172244, "epoch": 4101} {"train_loss": -7.1237897872924805, "global_step": 172245, "epoch": 4101} {"train_loss": -7.06403923034668, "global_step": 172246, "epoch": 4101} {"train_loss": -7.084444999694824, "global_step": 172247, "epoch": 4101} {"train_loss": -7.126235008239746, "global_step": 172248, "epoch": 4101} {"train_loss": -6.974515914916992, "global_step": 172249, "epoch": 4101} {"train_loss": -7.024540901184082, "global_step": 172250, "epoch": 4101} {"train_loss": -7.0606184005737305, "global_step": 172251, "epoch": 4101} {"train_loss": -7.053625106811523, "global_step": 172252, "epoch": 4101} {"train_loss": -7.061208248138428, "global_step": 172253, "epoch": 4101} {"train_loss": -7.035050392150879, "global_step": 172254, "epoch": 4101} {"train_loss": -7.112825870513916, "global_step": 172255, "epoch": 4101} {"train_loss": -7.082840919494629, "global_step": 172256, "epoch": 4101} {"train_loss": -6.957951545715332, "global_step": 172257, "epoch": 4101} {"train_loss": -7.070443153381348, "global_step": 172258, "epoch": 4101} {"train_loss": -7.008411407470703, "global_step": 172259, "epoch": 4101} {"train_loss": -6.907873153686523, "global_step": 172260, "epoch": 4101} {"train_loss": -7.128993034362793, "global_step": 172261, "epoch": 4101} {"train_loss": -6.942407131195068, "global_step": 172262, "epoch": 4101} {"train_loss": -6.902618885040283, "global_step": 172263, "epoch": 4101} {"train_loss": -6.9804229736328125, "global_step": 172264, "epoch": 4101} {"train_loss": -6.968235015869141, "global_step": 172265, "epoch": 4101} {"train_loss": -7.109805107116699, "global_step": 172266, "epoch": 4101} {"train_loss": -6.891472816467285, "global_step": 172267, "epoch": 4101} {"train_loss": -7.0458598136901855, "global_step": 172268, "epoch": 4101} {"train_loss": -7.129498481750488, "global_step": 172269, "epoch": 4101} {"train_loss": -7.054601669311523, "global_step": 172270, "epoch": 4101} {"train_loss": -7.156363010406494, "global_step": 172271, "epoch": 4101} {"train_loss": -7.099327087402344, "global_step": 172272, "epoch": 4101} {"train_loss": -6.986014366149902, "global_step": 172273, "epoch": 4101} {"train_loss": -6.919330596923828, "global_step": 172274, "epoch": 4101} {"train_loss": -7.019512176513672, "global_step": 172275, "epoch": 4101} {"train_loss": -7.097418785095215, "global_step": 172276, "epoch": 4101} {"train_loss": -6.992810249328613, "global_step": 172277, "epoch": 4101} {"train_loss": -7.108388900756836, "global_step": 172278, "epoch": 4101} {"train_loss": -7.121933460235596, "global_step": 172279, "epoch": 4101} {"train_loss": -7.066979885101318, "global_step": 172280, "epoch": 4101} {"train_loss": -7.013659477233887, "global_step": 172281, "epoch": 4101} {"train_loss": -7.051381587982178, "global_step": 172282, "epoch": 4101} {"train_loss": -7.049243824822562, "global_step": 172283, "epoch": 4101, "val_loss": 79832.4375} {"train_loss": -7.1480607986450195, "global_step": 172284, "epoch": 4102} {"train_loss": -7.097311973571777, "global_step": 172285, "epoch": 4102} {"train_loss": -7.106055736541748, "global_step": 172286, "epoch": 4102} {"train_loss": -7.206053256988525, "global_step": 172287, "epoch": 4102} {"train_loss": -7.0474629402160645, "global_step": 172288, "epoch": 4102} {"train_loss": -7.050795555114746, "global_step": 172289, "epoch": 4102} {"train_loss": -7.047667026519775, "global_step": 172290, "epoch": 4102} {"train_loss": -7.194700241088867, "global_step": 172291, "epoch": 4102} {"train_loss": -7.162347316741943, "global_step": 172292, "epoch": 4102} {"train_loss": -7.106777191162109, "global_step": 172293, "epoch": 4102} {"train_loss": -7.095947742462158, "global_step": 172294, "epoch": 4102} {"train_loss": -7.135771751403809, "global_step": 172295, "epoch": 4102} {"train_loss": -7.138858795166016, "global_step": 172296, "epoch": 4102} {"train_loss": -7.043654918670654, "global_step": 172297, "epoch": 4102} {"train_loss": -7.010204315185547, "global_step": 172298, "epoch": 4102} {"train_loss": -7.062780380249023, "global_step": 172299, "epoch": 4102} {"train_loss": -7.12625789642334, "global_step": 172300, "epoch": 4102} {"train_loss": -6.9928483963012695, "global_step": 172301, "epoch": 4102} {"train_loss": -7.094298839569092, "global_step": 172302, "epoch": 4102} {"train_loss": -7.0448198318481445, "global_step": 172303, "epoch": 4102} {"train_loss": -7.008024215698242, "global_step": 172304, "epoch": 4102} {"train_loss": -7.1251444816589355, "global_step": 172305, "epoch": 4102} {"train_loss": -7.150062084197998, "global_step": 172306, "epoch": 4102} {"train_loss": -7.1233601570129395, "global_step": 172307, "epoch": 4102} {"train_loss": -6.8712968826293945, "global_step": 172308, "epoch": 4102} {"train_loss": -7.11357307434082, "global_step": 172309, "epoch": 4102} {"train_loss": -7.028544902801514, "global_step": 172310, "epoch": 4102} {"train_loss": -6.963334560394287, "global_step": 172311, "epoch": 4102} {"train_loss": -7.224096775054932, "global_step": 172312, "epoch": 4102} {"train_loss": -7.0706634521484375, "global_step": 172313, "epoch": 4102} {"train_loss": -7.051896095275879, "global_step": 172314, "epoch": 4102} {"train_loss": -7.097759246826172, "global_step": 172315, "epoch": 4102} {"train_loss": -7.166407108306885, "global_step": 172316, "epoch": 4102} {"train_loss": -7.03162145614624, "global_step": 172317, "epoch": 4102} {"train_loss": -7.103389739990234, "global_step": 172318, "epoch": 4102} {"train_loss": -7.036728858947754, "global_step": 172319, "epoch": 4102} {"train_loss": -6.973109245300293, "global_step": 172320, "epoch": 4102} {"train_loss": -7.022157669067383, "global_step": 172321, "epoch": 4102} {"train_loss": -7.104377746582031, "global_step": 172322, "epoch": 4102} {"train_loss": -7.0540618896484375, "global_step": 172323, "epoch": 4102} {"train_loss": -7.079024791717529, "global_step": 172324, "epoch": 4102} {"train_loss": -7.078915800367083, "global_step": 172325, "epoch": 4102, "val_loss": 79938.6953125} {"train_loss": -7.0294084548950195, "global_step": 172326, "epoch": 4103} {"train_loss": -6.954866886138916, "global_step": 172327, "epoch": 4103} {"train_loss": -7.017067909240723, "global_step": 172328, "epoch": 4103} {"train_loss": -7.065446853637695, "global_step": 172329, "epoch": 4103} {"train_loss": -7.039523124694824, "global_step": 172330, "epoch": 4103} {"train_loss": -7.0102667808532715, "global_step": 172331, "epoch": 4103} {"train_loss": -7.011251449584961, "global_step": 172332, "epoch": 4103} {"train_loss": -7.132221221923828, "global_step": 172333, "epoch": 4103} {"train_loss": -7.073591232299805, "global_step": 172334, "epoch": 4103} {"train_loss": -7.1053314208984375, "global_step": 172335, "epoch": 4103} {"train_loss": -7.075592041015625, "global_step": 172336, "epoch": 4103} {"train_loss": -7.121281623840332, "global_step": 172337, "epoch": 4103} {"train_loss": -7.061141490936279, "global_step": 172338, "epoch": 4103} {"train_loss": -7.069797515869141, "global_step": 172339, "epoch": 4103} {"train_loss": -7.09725284576416, "global_step": 172340, "epoch": 4103} {"train_loss": -7.160225868225098, "global_step": 172341, "epoch": 4103} {"train_loss": -7.013132572174072, "global_step": 172342, "epoch": 4103} {"train_loss": -7.150373458862305, "global_step": 172343, "epoch": 4103} {"train_loss": -7.032114505767822, "global_step": 172344, "epoch": 4103} {"train_loss": -7.028301239013672, "global_step": 172345, "epoch": 4103} {"train_loss": -7.055302619934082, "global_step": 172346, "epoch": 4103} {"train_loss": -7.146103858947754, "global_step": 172347, "epoch": 4103} {"train_loss": -7.042690277099609, "global_step": 172348, "epoch": 4103} {"train_loss": -7.1166582107543945, "global_step": 172349, "epoch": 4103} {"train_loss": -7.070164680480957, "global_step": 172350, "epoch": 4103} {"train_loss": -7.078384876251221, "global_step": 172351, "epoch": 4103} {"train_loss": -7.202126979827881, "global_step": 172352, "epoch": 4103} {"train_loss": -7.208617210388184, "global_step": 172353, "epoch": 4103} {"train_loss": -7.115819931030273, "global_step": 172354, "epoch": 4103} {"train_loss": -7.0508623123168945, "global_step": 172355, "epoch": 4103} {"train_loss": -7.10141134262085, "global_step": 172356, "epoch": 4103} {"train_loss": -7.064367294311523, "global_step": 172357, "epoch": 4103} {"train_loss": -7.0148162841796875, "global_step": 172358, "epoch": 4103} {"train_loss": -6.980365753173828, "global_step": 172359, "epoch": 4103} {"train_loss": -7.092291831970215, "global_step": 172360, "epoch": 4103} {"train_loss": -7.07640266418457, "global_step": 172361, "epoch": 4103} {"train_loss": -7.055645942687988, "global_step": 172362, "epoch": 4103} {"train_loss": -6.910656929016113, "global_step": 172363, "epoch": 4103} {"train_loss": -7.019277095794678, "global_step": 172364, "epoch": 4103} {"train_loss": -7.098859786987305, "global_step": 172365, "epoch": 4103} {"train_loss": -6.95159912109375, "global_step": 172366, "epoch": 4103} {"train_loss": -7.064967291695731, "global_step": 172367, "epoch": 4103, "val_loss": 79968.484375} {"train_loss": -7.009869575500488, "global_step": 172368, "epoch": 4104} {"train_loss": -6.921270847320557, "global_step": 172369, "epoch": 4104} {"train_loss": -7.0812530517578125, "global_step": 172370, "epoch": 4104} {"train_loss": -6.960472106933594, "global_step": 172371, "epoch": 4104} {"train_loss": -7.075758934020996, "global_step": 172372, "epoch": 4104} {"train_loss": -6.910491943359375, "global_step": 172373, "epoch": 4104} {"train_loss": -7.10198974609375, "global_step": 172374, "epoch": 4104} {"train_loss": -7.011922359466553, "global_step": 172375, "epoch": 4104} {"train_loss": -7.043632507324219, "global_step": 172376, "epoch": 4104} {"train_loss": -7.025633811950684, "global_step": 172377, "epoch": 4104} {"train_loss": -7.007707595825195, "global_step": 172378, "epoch": 4104} {"train_loss": -7.106024742126465, "global_step": 172379, "epoch": 4104} {"train_loss": -6.917295455932617, "global_step": 172380, "epoch": 4104} {"train_loss": -7.062544822692871, "global_step": 172381, "epoch": 4104} {"train_loss": -7.0457000732421875, "global_step": 172382, "epoch": 4104} {"train_loss": -6.945761680603027, "global_step": 172383, "epoch": 4104} {"train_loss": -7.1237640380859375, "global_step": 172384, "epoch": 4104} {"train_loss": -6.893489837646484, "global_step": 172385, "epoch": 4104} {"train_loss": -7.073569297790527, "global_step": 172386, "epoch": 4104} {"train_loss": -6.933416843414307, "global_step": 172387, "epoch": 4104} {"train_loss": -7.104677200317383, "global_step": 172388, "epoch": 4104} {"train_loss": -7.093461990356445, "global_step": 172389, "epoch": 4104} {"train_loss": -7.032108306884766, "global_step": 172390, "epoch": 4104} {"train_loss": -7.200516223907471, "global_step": 172391, "epoch": 4104} {"train_loss": -7.049488067626953, "global_step": 172392, "epoch": 4104} {"train_loss": -7.076852798461914, "global_step": 172393, "epoch": 4104} {"train_loss": -7.162527561187744, "global_step": 172394, "epoch": 4104} {"train_loss": -7.003596305847168, "global_step": 172395, "epoch": 4104} {"train_loss": -7.119016647338867, "global_step": 172396, "epoch": 4104} {"train_loss": -6.988657474517822, "global_step": 172397, "epoch": 4104} {"train_loss": -7.069483757019043, "global_step": 172398, "epoch": 4104} {"train_loss": -7.125676155090332, "global_step": 172399, "epoch": 4104} {"train_loss": -7.1044087409973145, "global_step": 172400, "epoch": 4104} {"train_loss": -7.063766956329346, "global_step": 172401, "epoch": 4104} {"train_loss": -7.06384801864624, "global_step": 172402, "epoch": 4104} {"train_loss": -7.126554012298584, "global_step": 172403, "epoch": 4104} {"train_loss": -7.040672779083252, "global_step": 172404, "epoch": 4104} {"train_loss": -7.0152506828308105, "global_step": 172405, "epoch": 4104} {"train_loss": -7.082510948181152, "global_step": 172406, "epoch": 4104} {"train_loss": -7.1041340827941895, "global_step": 172407, "epoch": 4104} {"train_loss": -7.04534912109375, "global_step": 172408, "epoch": 4104} {"train_loss": -7.044079598926363, "global_step": 172409, "epoch": 4104, "val_loss": 80137.4140625} {"train_loss": -7.144600868225098, "global_step": 172410, "epoch": 4105} {"train_loss": -7.100201606750488, "global_step": 172411, "epoch": 4105} {"train_loss": -7.004299640655518, "global_step": 172412, "epoch": 4105} {"train_loss": -7.058417320251465, "global_step": 172413, "epoch": 4105} {"train_loss": -7.121599197387695, "global_step": 172414, "epoch": 4105} {"train_loss": -7.0420026779174805, "global_step": 172415, "epoch": 4105} {"train_loss": -7.104872703552246, "global_step": 172416, "epoch": 4105} {"train_loss": -7.021266937255859, "global_step": 172417, "epoch": 4105} {"train_loss": -7.021757125854492, "global_step": 172418, "epoch": 4105} {"train_loss": -7.082545280456543, "global_step": 172419, "epoch": 4105} {"train_loss": -7.160520553588867, "global_step": 172420, "epoch": 4105} {"train_loss": -7.043462753295898, "global_step": 172421, "epoch": 4105} {"train_loss": -7.105152130126953, "global_step": 172422, "epoch": 4105} {"train_loss": -7.134169578552246, "global_step": 172423, "epoch": 4105} {"train_loss": -7.059981346130371, "global_step": 172424, "epoch": 4105} {"train_loss": -7.140182018280029, "global_step": 172425, "epoch": 4105} {"train_loss": -7.085813522338867, "global_step": 172426, "epoch": 4105} {"train_loss": -7.135005950927734, "global_step": 172427, "epoch": 4105} {"train_loss": -7.07496976852417, "global_step": 172428, "epoch": 4105} {"train_loss": -7.077793598175049, "global_step": 172429, "epoch": 4105} {"train_loss": -7.125263214111328, "global_step": 172430, "epoch": 4105} {"train_loss": -7.120724678039551, "global_step": 172431, "epoch": 4105} {"train_loss": -7.0845441818237305, "global_step": 172432, "epoch": 4105} {"train_loss": -7.124176502227783, "global_step": 172433, "epoch": 4105} {"train_loss": -7.109219551086426, "global_step": 172434, "epoch": 4105} {"train_loss": -7.107244491577148, "global_step": 172435, "epoch": 4105} {"train_loss": -7.037848472595215, "global_step": 172436, "epoch": 4105} {"train_loss": -6.96549129486084, "global_step": 172437, "epoch": 4105} {"train_loss": -7.058097839355469, "global_step": 172438, "epoch": 4105} {"train_loss": -7.050709247589111, "global_step": 172439, "epoch": 4105} {"train_loss": -7.150252342224121, "global_step": 172440, "epoch": 4105} {"train_loss": -7.195086479187012, "global_step": 172441, "epoch": 4105} {"train_loss": -7.079007625579834, "global_step": 172442, "epoch": 4105} {"train_loss": -7.100315570831299, "global_step": 172443, "epoch": 4105} {"train_loss": -7.1226725578308105, "global_step": 172444, "epoch": 4105} {"train_loss": -7.155898094177246, "global_step": 172445, "epoch": 4105} {"train_loss": -7.035557746887207, "global_step": 172446, "epoch": 4105} {"train_loss": -7.159193992614746, "global_step": 172447, "epoch": 4105} {"train_loss": -6.996527194976807, "global_step": 172448, "epoch": 4105} {"train_loss": -7.0871686935424805, "global_step": 172449, "epoch": 4105} {"train_loss": -7.245803356170654, "global_step": 172450, "epoch": 4105} {"train_loss": -7.090509119487944, "global_step": 172451, "epoch": 4105, "val_loss": 79946.9140625} {"train_loss": -7.095592498779297, "global_step": 172452, "epoch": 4106} {"train_loss": -7.063982963562012, "global_step": 172453, "epoch": 4106} {"train_loss": -6.935457229614258, "global_step": 172454, "epoch": 4106} {"train_loss": -7.0744428634643555, "global_step": 172455, "epoch": 4106} {"train_loss": -7.205024719238281, "global_step": 172456, "epoch": 4106} {"train_loss": -7.071617126464844, "global_step": 172457, "epoch": 4106} {"train_loss": -7.145971775054932, "global_step": 172458, "epoch": 4106} {"train_loss": -7.100918292999268, "global_step": 172459, "epoch": 4106} {"train_loss": -7.1285223960876465, "global_step": 172460, "epoch": 4106} {"train_loss": -6.924449920654297, "global_step": 172461, "epoch": 4106} {"train_loss": -7.069582939147949, "global_step": 172462, "epoch": 4106} {"train_loss": -7.148268699645996, "global_step": 172463, "epoch": 4106} {"train_loss": -7.029504776000977, "global_step": 172464, "epoch": 4106} {"train_loss": -6.956989765167236, "global_step": 172465, "epoch": 4106} {"train_loss": -7.051894187927246, "global_step": 172466, "epoch": 4106} {"train_loss": -7.197136878967285, "global_step": 172467, "epoch": 4106} {"train_loss": -7.076478481292725, "global_step": 172468, "epoch": 4106} {"train_loss": -7.026847839355469, "global_step": 172469, "epoch": 4106} {"train_loss": -7.083335876464844, "global_step": 172470, "epoch": 4106} {"train_loss": -7.128533363342285, "global_step": 172471, "epoch": 4106} {"train_loss": -7.15291690826416, "global_step": 172472, "epoch": 4106} {"train_loss": -7.079684734344482, "global_step": 172473, "epoch": 4106} {"train_loss": -7.09018611907959, "global_step": 172474, "epoch": 4106} {"train_loss": -7.086756706237793, "global_step": 172475, "epoch": 4106} {"train_loss": -6.938836574554443, "global_step": 172476, "epoch": 4106} {"train_loss": -7.0758056640625, "global_step": 172477, "epoch": 4106} {"train_loss": -7.05858850479126, "global_step": 172478, "epoch": 4106} {"train_loss": -6.935430526733398, "global_step": 172479, "epoch": 4106} {"train_loss": -7.079198837280273, "global_step": 172480, "epoch": 4106} {"train_loss": -7.080517768859863, "global_step": 172481, "epoch": 4106} {"train_loss": -7.055737495422363, "global_step": 172482, "epoch": 4106} {"train_loss": -7.1438679695129395, "global_step": 172483, "epoch": 4106} {"train_loss": -7.057762622833252, "global_step": 172484, "epoch": 4106} {"train_loss": -7.074024677276611, "global_step": 172485, "epoch": 4106} {"train_loss": -7.041731357574463, "global_step": 172486, "epoch": 4106} {"train_loss": -7.024202346801758, "global_step": 172487, "epoch": 4106} {"train_loss": -7.003556251525879, "global_step": 172488, "epoch": 4106} {"train_loss": -7.079979419708252, "global_step": 172489, "epoch": 4106} {"train_loss": -7.143348693847656, "global_step": 172490, "epoch": 4106} {"train_loss": -6.9549055099487305, "global_step": 172491, "epoch": 4106} {"train_loss": -7.043519020080566, "global_step": 172492, "epoch": 4106} {"train_loss": -7.065873111997332, "global_step": 172493, "epoch": 4106, "val_loss": 79939.1015625} {"train_loss": -7.056314468383789, "global_step": 172494, "epoch": 4107} {"train_loss": -7.093379020690918, "global_step": 172495, "epoch": 4107} {"train_loss": -7.006827354431152, "global_step": 172496, "epoch": 4107} {"train_loss": -7.011963844299316, "global_step": 172497, "epoch": 4107} {"train_loss": -6.862636089324951, "global_step": 172498, "epoch": 4107} {"train_loss": -7.058075428009033, "global_step": 172499, "epoch": 4107} {"train_loss": -7.0416412353515625, "global_step": 172500, "epoch": 4107} {"train_loss": -6.817755699157715, "global_step": 172501, "epoch": 4107} {"train_loss": -7.011821746826172, "global_step": 172502, "epoch": 4107} {"train_loss": -6.972322463989258, "global_step": 172503, "epoch": 4107} {"train_loss": -6.991157531738281, "global_step": 172504, "epoch": 4107} {"train_loss": -6.881661415100098, "global_step": 172505, "epoch": 4107} {"train_loss": -7.046778678894043, "global_step": 172506, "epoch": 4107} {"train_loss": -7.01003885269165, "global_step": 172507, "epoch": 4107} {"train_loss": -7.0803608894348145, "global_step": 172508, "epoch": 4107} {"train_loss": -7.012648105621338, "global_step": 172509, "epoch": 4107} {"train_loss": -6.917733192443848, "global_step": 172510, "epoch": 4107} {"train_loss": -7.028824806213379, "global_step": 172511, "epoch": 4107} {"train_loss": -7.021976470947266, "global_step": 172512, "epoch": 4107} {"train_loss": -7.0347442626953125, "global_step": 172513, "epoch": 4107} {"train_loss": -7.087183952331543, "global_step": 172514, "epoch": 4107} {"train_loss": -7.043673038482666, "global_step": 172515, "epoch": 4107} {"train_loss": -6.979709148406982, "global_step": 172516, "epoch": 4107} {"train_loss": -7.132318496704102, "global_step": 172517, "epoch": 4107} {"train_loss": -6.918880462646484, "global_step": 172518, "epoch": 4107} {"train_loss": -7.084906101226807, "global_step": 172519, "epoch": 4107} {"train_loss": -7.109356880187988, "global_step": 172520, "epoch": 4107} {"train_loss": -7.004605770111084, "global_step": 172521, "epoch": 4107} {"train_loss": -7.148993015289307, "global_step": 172522, "epoch": 4107} {"train_loss": -6.927783966064453, "global_step": 172523, "epoch": 4107} {"train_loss": -7.135408401489258, "global_step": 172524, "epoch": 4107} {"train_loss": -7.097378730773926, "global_step": 172525, "epoch": 4107} {"train_loss": -6.911401748657227, "global_step": 172526, "epoch": 4107} {"train_loss": -7.0740485191345215, "global_step": 172527, "epoch": 4107} {"train_loss": -7.022933006286621, "global_step": 172528, "epoch": 4107} {"train_loss": -7.040467262268066, "global_step": 172529, "epoch": 4107} {"train_loss": -7.125011444091797, "global_step": 172530, "epoch": 4107} {"train_loss": -6.966802597045898, "global_step": 172531, "epoch": 4107} {"train_loss": -7.023613452911377, "global_step": 172532, "epoch": 4107} {"train_loss": -6.975353717803955, "global_step": 172533, "epoch": 4107} {"train_loss": -7.094871520996094, "global_step": 172534, "epoch": 4107} {"train_loss": -7.022324823197865, "global_step": 172535, "epoch": 4107, "val_loss": 79767.640625} {"train_loss": -7.053829669952393, "global_step": 172536, "epoch": 4108} {"train_loss": -7.058968544006348, "global_step": 172537, "epoch": 4108} {"train_loss": -7.1173095703125, "global_step": 172538, "epoch": 4108} {"train_loss": -6.968610763549805, "global_step": 172539, "epoch": 4108} {"train_loss": -6.978829383850098, "global_step": 172540, "epoch": 4108} {"train_loss": -7.0026116371154785, "global_step": 172541, "epoch": 4108} {"train_loss": -7.087497711181641, "global_step": 172542, "epoch": 4108} {"train_loss": -6.995516777038574, "global_step": 172543, "epoch": 4108} {"train_loss": -7.1372761726379395, "global_step": 172544, "epoch": 4108} {"train_loss": -7.037901401519775, "global_step": 172545, "epoch": 4108} {"train_loss": -7.084020614624023, "global_step": 172546, "epoch": 4108} {"train_loss": -6.823540687561035, "global_step": 172547, "epoch": 4108} {"train_loss": -7.078275680541992, "global_step": 172548, "epoch": 4108} {"train_loss": -6.951331615447998, "global_step": 172549, "epoch": 4108} {"train_loss": -7.058783531188965, "global_step": 172550, "epoch": 4108} {"train_loss": -7.008414268493652, "global_step": 172551, "epoch": 4108} {"train_loss": -6.998040199279785, "global_step": 172552, "epoch": 4108} {"train_loss": -6.899064064025879, "global_step": 172553, "epoch": 4108} {"train_loss": -6.965134620666504, "global_step": 172554, "epoch": 4108} {"train_loss": -6.943077087402344, "global_step": 172555, "epoch": 4108} {"train_loss": -6.934843063354492, "global_step": 172556, "epoch": 4108} {"train_loss": -7.041628837585449, "global_step": 172557, "epoch": 4108} {"train_loss": -7.00870943069458, "global_step": 172558, "epoch": 4108} {"train_loss": -7.137327194213867, "global_step": 172559, "epoch": 4108} {"train_loss": -7.056475639343262, "global_step": 172560, "epoch": 4108} {"train_loss": -6.950346946716309, "global_step": 172561, "epoch": 4108} {"train_loss": -7.04388427734375, "global_step": 172562, "epoch": 4108} {"train_loss": -7.0539326667785645, "global_step": 172563, "epoch": 4108} {"train_loss": -7.002012729644775, "global_step": 172564, "epoch": 4108} {"train_loss": -7.077119827270508, "global_step": 172565, "epoch": 4108} {"train_loss": -6.930667877197266, "global_step": 172566, "epoch": 4108} {"train_loss": -6.971103191375732, "global_step": 172567, "epoch": 4108} {"train_loss": -6.797005653381348, "global_step": 172568, "epoch": 4108} {"train_loss": -6.876345634460449, "global_step": 172569, "epoch": 4108} {"train_loss": -6.907580375671387, "global_step": 172570, "epoch": 4108} {"train_loss": -6.884852409362793, "global_step": 172571, "epoch": 4108} {"train_loss": -6.95501708984375, "global_step": 172572, "epoch": 4108} {"train_loss": -6.925148010253906, "global_step": 172573, "epoch": 4108} {"train_loss": -7.005219459533691, "global_step": 172574, "epoch": 4108} {"train_loss": -7.025938987731934, "global_step": 172575, "epoch": 4108} {"train_loss": -7.122322082519531, "global_step": 172576, "epoch": 4108} {"train_loss": -6.997185377847581, "global_step": 172577, "epoch": 4108, "val_loss": 80030.1328125} {"train_loss": -7.011571884155273, "global_step": 172578, "epoch": 4109} {"train_loss": -7.095920562744141, "global_step": 172579, "epoch": 4109} {"train_loss": -7.118656635284424, "global_step": 172580, "epoch": 4109} {"train_loss": -7.1119794845581055, "global_step": 172581, "epoch": 4109} {"train_loss": -6.904022693634033, "global_step": 172582, "epoch": 4109} {"train_loss": -7.064640998840332, "global_step": 172583, "epoch": 4109} {"train_loss": -7.068207740783691, "global_step": 172584, "epoch": 4109} {"train_loss": -7.06640625, "global_step": 172585, "epoch": 4109} {"train_loss": -6.975996971130371, "global_step": 172586, "epoch": 4109} {"train_loss": -6.962705612182617, "global_step": 172587, "epoch": 4109} {"train_loss": -6.8749918937683105, "global_step": 172588, "epoch": 4109} {"train_loss": -7.027532577514648, "global_step": 172589, "epoch": 4109} {"train_loss": -7.120361804962158, "global_step": 172590, "epoch": 4109} {"train_loss": -7.052690505981445, "global_step": 172591, "epoch": 4109} {"train_loss": -7.090557098388672, "global_step": 172592, "epoch": 4109} {"train_loss": -7.1286725997924805, "global_step": 172593, "epoch": 4109} {"train_loss": -6.999871253967285, "global_step": 172594, "epoch": 4109} {"train_loss": -7.122307777404785, "global_step": 172595, "epoch": 4109} {"train_loss": -7.040566444396973, "global_step": 172596, "epoch": 4109} {"train_loss": -6.968967914581299, "global_step": 172597, "epoch": 4109} {"train_loss": -7.017541885375977, "global_step": 172598, "epoch": 4109} {"train_loss": -7.063901901245117, "global_step": 172599, "epoch": 4109} {"train_loss": -6.9288835525512695, "global_step": 172600, "epoch": 4109} {"train_loss": -7.125749588012695, "global_step": 172601, "epoch": 4109} {"train_loss": -7.053744792938232, "global_step": 172602, "epoch": 4109} {"train_loss": -6.93436336517334, "global_step": 172603, "epoch": 4109} {"train_loss": -7.0395050048828125, "global_step": 172604, "epoch": 4109} {"train_loss": -6.869948387145996, "global_step": 172605, "epoch": 4109} {"train_loss": -7.055811882019043, "global_step": 172606, "epoch": 4109} {"train_loss": -6.977112770080566, "global_step": 172607, "epoch": 4109} {"train_loss": -7.0173659324646, "global_step": 172608, "epoch": 4109} {"train_loss": -7.041826248168945, "global_step": 172609, "epoch": 4109} {"train_loss": -7.036283493041992, "global_step": 172610, "epoch": 4109} {"train_loss": -6.986243724822998, "global_step": 172611, "epoch": 4109} {"train_loss": -7.042923927307129, "global_step": 172612, "epoch": 4109} {"train_loss": -7.1062517166137695, "global_step": 172613, "epoch": 4109} {"train_loss": -6.810731410980225, "global_step": 172614, "epoch": 4109} {"train_loss": -7.073819160461426, "global_step": 172615, "epoch": 4109} {"train_loss": -6.980887413024902, "global_step": 172616, "epoch": 4109} {"train_loss": -6.9884138107299805, "global_step": 172617, "epoch": 4109} {"train_loss": -6.903693675994873, "global_step": 172618, "epoch": 4109} {"train_loss": -7.0205716859726675, "global_step": 172619, "epoch": 4109, "val_loss": 80130.234375} {"train_loss": -7.052126884460449, "global_step": 172620, "epoch": 4110} {"train_loss": -6.9606523513793945, "global_step": 172621, "epoch": 4110} {"train_loss": -6.996685981750488, "global_step": 172622, "epoch": 4110} {"train_loss": -7.043863296508789, "global_step": 172623, "epoch": 4110} {"train_loss": -7.030583381652832, "global_step": 172624, "epoch": 4110} {"train_loss": -7.100457668304443, "global_step": 172625, "epoch": 4110} {"train_loss": -6.943058967590332, "global_step": 172626, "epoch": 4110} {"train_loss": -7.10814905166626, "global_step": 172627, "epoch": 4110} {"train_loss": -6.835582733154297, "global_step": 172628, "epoch": 4110} {"train_loss": -7.050650596618652, "global_step": 172629, "epoch": 4110} {"train_loss": -7.061234951019287, "global_step": 172630, "epoch": 4110} {"train_loss": -6.997469902038574, "global_step": 172631, "epoch": 4110} {"train_loss": -7.041424751281738, "global_step": 172632, "epoch": 4110} {"train_loss": -7.101541519165039, "global_step": 172633, "epoch": 4110} {"train_loss": -7.081745147705078, "global_step": 172634, "epoch": 4110} {"train_loss": -7.124475479125977, "global_step": 172635, "epoch": 4110} {"train_loss": -7.054062843322754, "global_step": 172636, "epoch": 4110} {"train_loss": -7.1091485023498535, "global_step": 172637, "epoch": 4110} {"train_loss": -7.079201698303223, "global_step": 172638, "epoch": 4110} {"train_loss": -7.099930763244629, "global_step": 172639, "epoch": 4110} {"train_loss": -7.154361724853516, "global_step": 172640, "epoch": 4110} {"train_loss": -7.1022562980651855, "global_step": 172641, "epoch": 4110} {"train_loss": -7.061017990112305, "global_step": 172642, "epoch": 4110} {"train_loss": -7.05810546875, "global_step": 172643, "epoch": 4110} {"train_loss": -7.069394111633301, "global_step": 172644, "epoch": 4110} {"train_loss": -7.046291828155518, "global_step": 172645, "epoch": 4110} {"train_loss": -7.119498252868652, "global_step": 172646, "epoch": 4110} {"train_loss": -7.161408424377441, "global_step": 172647, "epoch": 4110} {"train_loss": -7.176485061645508, "global_step": 172648, "epoch": 4110} {"train_loss": -7.189259052276611, "global_step": 172649, "epoch": 4110} {"train_loss": -7.137351036071777, "global_step": 172650, "epoch": 4110} {"train_loss": -7.060173034667969, "global_step": 172651, "epoch": 4110} {"train_loss": -7.224783897399902, "global_step": 172652, "epoch": 4110} {"train_loss": -7.172038555145264, "global_step": 172653, "epoch": 4110} {"train_loss": -7.204719543457031, "global_step": 172654, "epoch": 4110} {"train_loss": -7.152090072631836, "global_step": 172655, "epoch": 4110} {"train_loss": -7.043968200683594, "global_step": 172656, "epoch": 4110} {"train_loss": -7.13801383972168, "global_step": 172657, "epoch": 4110} {"train_loss": -7.000035762786865, "global_step": 172658, "epoch": 4110} {"train_loss": -7.002627372741699, "global_step": 172659, "epoch": 4110} {"train_loss": -7.041557312011719, "global_step": 172660, "epoch": 4110} {"train_loss": -7.076124406996227, "global_step": 172661, "epoch": 4110, "val_loss": 80052.46875} {"train_loss": -7.125080585479736, "global_step": 172662, "epoch": 4111} {"train_loss": -7.1581854820251465, "global_step": 172663, "epoch": 4111} {"train_loss": -7.13446569442749, "global_step": 172664, "epoch": 4111} {"train_loss": -7.141095161437988, "global_step": 172665, "epoch": 4111} {"train_loss": -7.037639617919922, "global_step": 172666, "epoch": 4111} {"train_loss": -7.048508644104004, "global_step": 172667, "epoch": 4111} {"train_loss": -7.040448188781738, "global_step": 172668, "epoch": 4111} {"train_loss": -7.017587184906006, "global_step": 172669, "epoch": 4111} {"train_loss": -7.095377445220947, "global_step": 172670, "epoch": 4111} {"train_loss": -6.958197116851807, "global_step": 172671, "epoch": 4111} {"train_loss": -7.062185287475586, "global_step": 172672, "epoch": 4111} {"train_loss": -7.166059494018555, "global_step": 172673, "epoch": 4111} {"train_loss": -7.1332011222839355, "global_step": 172674, "epoch": 4111} {"train_loss": -7.097201347351074, "global_step": 172675, "epoch": 4111} {"train_loss": -6.96345329284668, "global_step": 172676, "epoch": 4111} {"train_loss": -7.12384033203125, "global_step": 172677, "epoch": 4111} {"train_loss": -6.995746612548828, "global_step": 172678, "epoch": 4111} {"train_loss": -7.036471366882324, "global_step": 172679, "epoch": 4111} {"train_loss": -7.0862627029418945, "global_step": 172680, "epoch": 4111} {"train_loss": -7.15986442565918, "global_step": 172681, "epoch": 4111} {"train_loss": -7.001554489135742, "global_step": 172682, "epoch": 4111} {"train_loss": -6.977144718170166, "global_step": 172683, "epoch": 4111} {"train_loss": -7.013855934143066, "global_step": 172684, "epoch": 4111} {"train_loss": -6.9991607666015625, "global_step": 172685, "epoch": 4111} {"train_loss": -7.155921936035156, "global_step": 172686, "epoch": 4111} {"train_loss": -7.124100208282471, "global_step": 172687, "epoch": 4111} {"train_loss": -7.052469730377197, "global_step": 172688, "epoch": 4111} {"train_loss": -6.9872283935546875, "global_step": 172689, "epoch": 4111} {"train_loss": -7.000428199768066, "global_step": 172690, "epoch": 4111} {"train_loss": -6.994973182678223, "global_step": 172691, "epoch": 4111} {"train_loss": -7.132484436035156, "global_step": 172692, "epoch": 4111} {"train_loss": -6.997010707855225, "global_step": 172693, "epoch": 4111} {"train_loss": -7.032240867614746, "global_step": 172694, "epoch": 4111} {"train_loss": -6.949172496795654, "global_step": 172695, "epoch": 4111} {"train_loss": -7.037707805633545, "global_step": 172696, "epoch": 4111} {"train_loss": -7.139881134033203, "global_step": 172697, "epoch": 4111} {"train_loss": -7.118893623352051, "global_step": 172698, "epoch": 4111} {"train_loss": -6.959357261657715, "global_step": 172699, "epoch": 4111} {"train_loss": -7.106022834777832, "global_step": 172700, "epoch": 4111} {"train_loss": -7.037114143371582, "global_step": 172701, "epoch": 4111} {"train_loss": -7.111005783081055, "global_step": 172702, "epoch": 4111} {"train_loss": -7.062020017987206, "global_step": 172703, "epoch": 4111, "val_loss": 79965.6328125} {"train_loss": -7.1536970138549805, "global_step": 172704, "epoch": 4112} {"train_loss": -7.070337295532227, "global_step": 172705, "epoch": 4112} {"train_loss": -7.118664741516113, "global_step": 172706, "epoch": 4112} {"train_loss": -7.020540237426758, "global_step": 172707, "epoch": 4112} {"train_loss": -7.148671627044678, "global_step": 172708, "epoch": 4112} {"train_loss": -6.997349739074707, "global_step": 172709, "epoch": 4112} {"train_loss": -7.207110404968262, "global_step": 172710, "epoch": 4112} {"train_loss": -7.06188440322876, "global_step": 172711, "epoch": 4112} {"train_loss": -7.111639499664307, "global_step": 172712, "epoch": 4112} {"train_loss": -6.971200942993164, "global_step": 172713, "epoch": 4112} {"train_loss": -7.102305889129639, "global_step": 172714, "epoch": 4112} {"train_loss": -7.06784725189209, "global_step": 172715, "epoch": 4112} {"train_loss": -6.883888244628906, "global_step": 172716, "epoch": 4112} {"train_loss": -7.0068464279174805, "global_step": 172717, "epoch": 4112} {"train_loss": -7.0869550704956055, "global_step": 172718, "epoch": 4112} {"train_loss": -7.129411697387695, "global_step": 172719, "epoch": 4112} {"train_loss": -6.926644325256348, "global_step": 172720, "epoch": 4112} {"train_loss": -7.089420318603516, "global_step": 172721, "epoch": 4112} {"train_loss": -6.950216293334961, "global_step": 172722, "epoch": 4112} {"train_loss": -7.071221351623535, "global_step": 172723, "epoch": 4112} {"train_loss": -7.1907267570495605, "global_step": 172724, "epoch": 4112} {"train_loss": -7.137137413024902, "global_step": 172725, "epoch": 4112} {"train_loss": -7.050084590911865, "global_step": 172726, "epoch": 4112} {"train_loss": -7.103930473327637, "global_step": 172727, "epoch": 4112} {"train_loss": -7.056037425994873, "global_step": 172728, "epoch": 4112} {"train_loss": -7.210988521575928, "global_step": 172729, "epoch": 4112} {"train_loss": -6.945436477661133, "global_step": 172730, "epoch": 4112} {"train_loss": -7.167449951171875, "global_step": 172731, "epoch": 4112} {"train_loss": -7.131342887878418, "global_step": 172732, "epoch": 4112} {"train_loss": -6.988260269165039, "global_step": 172733, "epoch": 4112} {"train_loss": -7.065272331237793, "global_step": 172734, "epoch": 4112} {"train_loss": -7.057792663574219, "global_step": 172735, "epoch": 4112} {"train_loss": -7.033288478851318, "global_step": 172736, "epoch": 4112} {"train_loss": -7.073539733886719, "global_step": 172737, "epoch": 4112} {"train_loss": -7.086623191833496, "global_step": 172738, "epoch": 4112} {"train_loss": -7.135111331939697, "global_step": 172739, "epoch": 4112} {"train_loss": -7.1003522872924805, "global_step": 172740, "epoch": 4112} {"train_loss": -7.226500988006592, "global_step": 172741, "epoch": 4112} {"train_loss": -7.121151924133301, "global_step": 172742, "epoch": 4112} {"train_loss": -7.0472893714904785, "global_step": 172743, "epoch": 4112} {"train_loss": -7.053579330444336, "global_step": 172744, "epoch": 4112} {"train_loss": -7.075758525303432, "global_step": 172745, "epoch": 4112, "val_loss": 80160.140625} {"train_loss": -7.072297096252441, "global_step": 172746, "epoch": 4113} {"train_loss": -7.1132307052612305, "global_step": 172747, "epoch": 4113} {"train_loss": -6.971393585205078, "global_step": 172748, "epoch": 4113} {"train_loss": -6.9807329177856445, "global_step": 172749, "epoch": 4113} {"train_loss": -6.846802234649658, "global_step": 172750, "epoch": 4113} {"train_loss": -7.029573917388916, "global_step": 172751, "epoch": 4113} {"train_loss": -6.767301082611084, "global_step": 172752, "epoch": 4113} {"train_loss": -7.059974670410156, "global_step": 172753, "epoch": 4113} {"train_loss": -6.778408050537109, "global_step": 172754, "epoch": 4113} {"train_loss": -6.824380874633789, "global_step": 172755, "epoch": 4113} {"train_loss": -7.0694804191589355, "global_step": 172756, "epoch": 4113} {"train_loss": -6.894224166870117, "global_step": 172757, "epoch": 4113} {"train_loss": -7.027335166931152, "global_step": 172758, "epoch": 4113} {"train_loss": -7.037627696990967, "global_step": 172759, "epoch": 4113} {"train_loss": -6.9596357345581055, "global_step": 172760, "epoch": 4113} {"train_loss": -6.983753204345703, "global_step": 172761, "epoch": 4113} {"train_loss": -7.048467636108398, "global_step": 172762, "epoch": 4113} {"train_loss": -6.9184064865112305, "global_step": 172763, "epoch": 4113} {"train_loss": -6.91323709487915, "global_step": 172764, "epoch": 4113} {"train_loss": -6.872140884399414, "global_step": 172765, "epoch": 4113} {"train_loss": -6.999354839324951, "global_step": 172766, "epoch": 4113} {"train_loss": -6.846145153045654, "global_step": 172767, "epoch": 4113} {"train_loss": -7.018138408660889, "global_step": 172768, "epoch": 4113} {"train_loss": -6.914819717407227, "global_step": 172769, "epoch": 4113} {"train_loss": -6.932497024536133, "global_step": 172770, "epoch": 4113} {"train_loss": -6.789615631103516, "global_step": 172771, "epoch": 4113} {"train_loss": -6.927556991577148, "global_step": 172772, "epoch": 4113} {"train_loss": -7.117569923400879, "global_step": 172773, "epoch": 4113} {"train_loss": -7.056303977966309, "global_step": 172774, "epoch": 4113} {"train_loss": -6.894746780395508, "global_step": 172775, "epoch": 4113} {"train_loss": -7.029781341552734, "global_step": 172776, "epoch": 4113} {"train_loss": -6.956061363220215, "global_step": 172777, "epoch": 4113} {"train_loss": -7.052443504333496, "global_step": 172778, "epoch": 4113} {"train_loss": -7.104209899902344, "global_step": 172779, "epoch": 4113} {"train_loss": -7.076021671295166, "global_step": 172780, "epoch": 4113} {"train_loss": -7.119565010070801, "global_step": 172781, "epoch": 4113} {"train_loss": -7.132850646972656, "global_step": 172782, "epoch": 4113} {"train_loss": -6.978854179382324, "global_step": 172783, "epoch": 4113} {"train_loss": -7.110115051269531, "global_step": 172784, "epoch": 4113} {"train_loss": -7.013680458068848, "global_step": 172785, "epoch": 4113} {"train_loss": -7.018498420715332, "global_step": 172786, "epoch": 4113} {"train_loss": -6.985290357044765, "global_step": 172787, "epoch": 4113, "val_loss": 79869.9921875} {"train_loss": -7.115022659301758, "global_step": 172788, "epoch": 4114} {"train_loss": -7.049515724182129, "global_step": 172789, "epoch": 4114} {"train_loss": -7.105989933013916, "global_step": 172790, "epoch": 4114} {"train_loss": -7.152443885803223, "global_step": 172791, "epoch": 4114} {"train_loss": -7.2209367752075195, "global_step": 172792, "epoch": 4114} {"train_loss": -7.11744499206543, "global_step": 172793, "epoch": 4114} {"train_loss": -7.021422386169434, "global_step": 172794, "epoch": 4114} {"train_loss": -7.029217720031738, "global_step": 172795, "epoch": 4114} {"train_loss": -7.044933319091797, "global_step": 172796, "epoch": 4114} {"train_loss": -6.975582122802734, "global_step": 172797, "epoch": 4114} {"train_loss": -7.083953380584717, "global_step": 172798, "epoch": 4114} {"train_loss": -7.131557464599609, "global_step": 172799, "epoch": 4114} {"train_loss": -7.095658302307129, "global_step": 172800, "epoch": 4114} {"train_loss": -7.238070487976074, "global_step": 172801, "epoch": 4114} {"train_loss": -7.138724327087402, "global_step": 172802, "epoch": 4114} {"train_loss": -7.20539665222168, "global_step": 172803, "epoch": 4114} {"train_loss": -7.102133274078369, "global_step": 172804, "epoch": 4114} {"train_loss": -7.08646821975708, "global_step": 172805, "epoch": 4114} {"train_loss": -7.15366792678833, "global_step": 172806, "epoch": 4114} {"train_loss": -7.007872581481934, "global_step": 172807, "epoch": 4114} {"train_loss": -7.067496299743652, "global_step": 172808, "epoch": 4114} {"train_loss": -6.994544982910156, "global_step": 172809, "epoch": 4114} {"train_loss": -7.039682388305664, "global_step": 172810, "epoch": 4114} {"train_loss": -7.14438533782959, "global_step": 172811, "epoch": 4114} {"train_loss": -7.00788688659668, "global_step": 172812, "epoch": 4114} {"train_loss": -7.087210655212402, "global_step": 172813, "epoch": 4114} {"train_loss": -7.121855735778809, "global_step": 172814, "epoch": 4114} {"train_loss": -7.072539806365967, "global_step": 172815, "epoch": 4114} {"train_loss": -6.963100910186768, "global_step": 172816, "epoch": 4114} {"train_loss": -7.040518283843994, "global_step": 172817, "epoch": 4114} {"train_loss": -7.13344144821167, "global_step": 172818, "epoch": 4114} {"train_loss": -6.93326997756958, "global_step": 172819, "epoch": 4114} {"train_loss": -7.093980312347412, "global_step": 172820, "epoch": 4114} {"train_loss": -7.02224588394165, "global_step": 172821, "epoch": 4114} {"train_loss": -7.147540092468262, "global_step": 172822, "epoch": 4114} {"train_loss": -6.963172435760498, "global_step": 172823, "epoch": 4114} {"train_loss": -6.828788757324219, "global_step": 172824, "epoch": 4114} {"train_loss": -7.028990268707275, "global_step": 172825, "epoch": 4114} {"train_loss": -6.8965373039245605, "global_step": 172826, "epoch": 4114} {"train_loss": -6.910616397857666, "global_step": 172827, "epoch": 4114} {"train_loss": -7.075675964355469, "global_step": 172828, "epoch": 4114} {"train_loss": -7.063107320240566, "global_step": 172829, "epoch": 4114, "val_loss": 80176.7265625} {"train_loss": -6.879627227783203, "global_step": 172830, "epoch": 4115} {"train_loss": -7.025040149688721, "global_step": 172831, "epoch": 4115} {"train_loss": -7.009415626525879, "global_step": 172832, "epoch": 4115} {"train_loss": -6.874242782592773, "global_step": 172833, "epoch": 4115} {"train_loss": -7.028850555419922, "global_step": 172834, "epoch": 4115} {"train_loss": -6.900310516357422, "global_step": 172835, "epoch": 4115} {"train_loss": -6.91324520111084, "global_step": 172836, "epoch": 4115} {"train_loss": -6.843856334686279, "global_step": 172837, "epoch": 4115} {"train_loss": -7.018801689147949, "global_step": 172838, "epoch": 4115} {"train_loss": -7.030145168304443, "global_step": 172839, "epoch": 4115} {"train_loss": -6.978946685791016, "global_step": 172840, "epoch": 4115} {"train_loss": -7.05344820022583, "global_step": 172841, "epoch": 4115} {"train_loss": -6.97926139831543, "global_step": 172842, "epoch": 4115} {"train_loss": -6.915707588195801, "global_step": 172843, "epoch": 4115} {"train_loss": -7.040053367614746, "global_step": 172844, "epoch": 4115} {"train_loss": -6.900882720947266, "global_step": 172845, "epoch": 4115} {"train_loss": -6.962615013122559, "global_step": 172846, "epoch": 4115} {"train_loss": -7.08851432800293, "global_step": 172847, "epoch": 4115} {"train_loss": -6.96235466003418, "global_step": 172848, "epoch": 4115} {"train_loss": -6.934799671173096, "global_step": 172849, "epoch": 4115} {"train_loss": -7.041749477386475, "global_step": 172850, "epoch": 4115} {"train_loss": -6.980224609375, "global_step": 172851, "epoch": 4115} {"train_loss": -6.972046852111816, "global_step": 172852, "epoch": 4115} {"train_loss": -7.042386531829834, "global_step": 172853, "epoch": 4115} {"train_loss": -6.918552398681641, "global_step": 172854, "epoch": 4115} {"train_loss": -7.113433837890625, "global_step": 172855, "epoch": 4115} {"train_loss": -7.035623550415039, "global_step": 172856, "epoch": 4115} {"train_loss": -7.145828723907471, "global_step": 172857, "epoch": 4115} {"train_loss": -7.0232954025268555, "global_step": 172858, "epoch": 4115} {"train_loss": -7.075641632080078, "global_step": 172859, "epoch": 4115} {"train_loss": -7.146608352661133, "global_step": 172860, "epoch": 4115} {"train_loss": -7.088508605957031, "global_step": 172861, "epoch": 4115} {"train_loss": -7.288611888885498, "global_step": 172862, "epoch": 4115} {"train_loss": -7.029728412628174, "global_step": 172863, "epoch": 4115} {"train_loss": -7.1665849685668945, "global_step": 172864, "epoch": 4115} {"train_loss": -7.208456039428711, "global_step": 172865, "epoch": 4115} {"train_loss": -7.1690216064453125, "global_step": 172866, "epoch": 4115} {"train_loss": -7.237180709838867, "global_step": 172867, "epoch": 4115} {"train_loss": -7.146116256713867, "global_step": 172868, "epoch": 4115} {"train_loss": -7.155782699584961, "global_step": 172869, "epoch": 4115} {"train_loss": -7.2031660079956055, "global_step": 172870, "epoch": 4115} {"train_loss": -7.038422368821644, "global_step": 172871, "epoch": 4115, "val_loss": 80043.953125} {"train_loss": -7.232909202575684, "global_step": 172872, "epoch": 4116} {"train_loss": -7.040962219238281, "global_step": 172873, "epoch": 4116} {"train_loss": -7.112939834594727, "global_step": 172874, "epoch": 4116} {"train_loss": -7.129610538482666, "global_step": 172875, "epoch": 4116} {"train_loss": -6.988450050354004, "global_step": 172876, "epoch": 4116} {"train_loss": -7.083441734313965, "global_step": 172877, "epoch": 4116} {"train_loss": -7.161177635192871, "global_step": 172878, "epoch": 4116} {"train_loss": -7.098759651184082, "global_step": 172879, "epoch": 4116} {"train_loss": -6.7518157958984375, "global_step": 172880, "epoch": 4116} {"train_loss": -6.9685869216918945, "global_step": 172881, "epoch": 4116} {"train_loss": -7.0060529708862305, "global_step": 172882, "epoch": 4116} {"train_loss": -6.921599388122559, "global_step": 172883, "epoch": 4116} {"train_loss": -6.914445400238037, "global_step": 172884, "epoch": 4116} {"train_loss": -7.080082893371582, "global_step": 172885, "epoch": 4116} {"train_loss": -6.891343116760254, "global_step": 172886, "epoch": 4116} {"train_loss": -6.879952907562256, "global_step": 172887, "epoch": 4116} {"train_loss": -7.005064964294434, "global_step": 172888, "epoch": 4116} {"train_loss": -6.799734115600586, "global_step": 172889, "epoch": 4116} {"train_loss": -6.892023086547852, "global_step": 172890, "epoch": 4116} {"train_loss": -6.937777519226074, "global_step": 172891, "epoch": 4116} {"train_loss": -7.004825592041016, "global_step": 172892, "epoch": 4116} {"train_loss": -6.796661376953125, "global_step": 172893, "epoch": 4116} {"train_loss": -6.966571807861328, "global_step": 172894, "epoch": 4116} {"train_loss": -6.899510860443115, "global_step": 172895, "epoch": 4116} {"train_loss": -6.946435928344727, "global_step": 172896, "epoch": 4116} {"train_loss": -6.859340667724609, "global_step": 172897, "epoch": 4116} {"train_loss": -7.027747631072998, "global_step": 172898, "epoch": 4116} {"train_loss": -6.925981521606445, "global_step": 172899, "epoch": 4116} {"train_loss": -6.90245246887207, "global_step": 172900, "epoch": 4116} {"train_loss": -6.882229804992676, "global_step": 172901, "epoch": 4116} {"train_loss": -7.083454132080078, "global_step": 172902, "epoch": 4116} {"train_loss": -7.017328262329102, "global_step": 172903, "epoch": 4116} {"train_loss": -7.118941783905029, "global_step": 172904, "epoch": 4116} {"train_loss": -7.032450199127197, "global_step": 172905, "epoch": 4116} {"train_loss": -6.9780144691467285, "global_step": 172906, "epoch": 4116} {"train_loss": -6.985097885131836, "global_step": 172907, "epoch": 4116} {"train_loss": -7.0181708335876465, "global_step": 172908, "epoch": 4116} {"train_loss": -7.003528118133545, "global_step": 172909, "epoch": 4116} {"train_loss": -7.0275983810424805, "global_step": 172910, "epoch": 4116} {"train_loss": -6.908542633056641, "global_step": 172911, "epoch": 4116} {"train_loss": -6.974562168121338, "global_step": 172912, "epoch": 4116} {"train_loss": -6.979563168116978, "global_step": 172913, "epoch": 4116, "val_loss": 79797.8984375} {"train_loss": -6.93309211730957, "global_step": 172914, "epoch": 4117} {"train_loss": -7.030511856079102, "global_step": 172915, "epoch": 4117} {"train_loss": -7.056434631347656, "global_step": 172916, "epoch": 4117} {"train_loss": -6.997710227966309, "global_step": 172917, "epoch": 4117} {"train_loss": -6.96745491027832, "global_step": 172918, "epoch": 4117} {"train_loss": -7.017582416534424, "global_step": 172919, "epoch": 4117} {"train_loss": -7.001640796661377, "global_step": 172920, "epoch": 4117} {"train_loss": -7.088086128234863, "global_step": 172921, "epoch": 4117} {"train_loss": -7.025871276855469, "global_step": 172922, "epoch": 4117} {"train_loss": -7.031457901000977, "global_step": 172923, "epoch": 4117} {"train_loss": -7.009303092956543, "global_step": 172924, "epoch": 4117} {"train_loss": -7.097611427307129, "global_step": 172925, "epoch": 4117} {"train_loss": -7.090489387512207, "global_step": 172926, "epoch": 4117} {"train_loss": -7.065506935119629, "global_step": 172927, "epoch": 4117} {"train_loss": -7.069180488586426, "global_step": 172928, "epoch": 4117} {"train_loss": -7.068194389343262, "global_step": 172929, "epoch": 4117} {"train_loss": -7.166705131530762, "global_step": 172930, "epoch": 4117} {"train_loss": -7.032536029815674, "global_step": 172931, "epoch": 4117} {"train_loss": -7.114924430847168, "global_step": 172932, "epoch": 4117} {"train_loss": -7.1882734298706055, "global_step": 172933, "epoch": 4117} {"train_loss": -7.130148410797119, "global_step": 172934, "epoch": 4117} {"train_loss": -7.129734992980957, "global_step": 172935, "epoch": 4117} {"train_loss": -7.083208084106445, "global_step": 172936, "epoch": 4117} {"train_loss": -7.116386413574219, "global_step": 172937, "epoch": 4117} {"train_loss": -7.14784574508667, "global_step": 172938, "epoch": 4117} {"train_loss": -7.0575947761535645, "global_step": 172939, "epoch": 4117} {"train_loss": -6.9950971603393555, "global_step": 172940, "epoch": 4117} {"train_loss": -7.122563362121582, "global_step": 172941, "epoch": 4117} {"train_loss": -6.963885307312012, "global_step": 172942, "epoch": 4117} {"train_loss": -7.131217002868652, "global_step": 172943, "epoch": 4117} {"train_loss": -7.174495220184326, "global_step": 172944, "epoch": 4117} {"train_loss": -7.0016770362854, "global_step": 172945, "epoch": 4117} {"train_loss": -7.088427543640137, "global_step": 172946, "epoch": 4117} {"train_loss": -6.911368370056152, "global_step": 172947, "epoch": 4117} {"train_loss": -7.048616409301758, "global_step": 172948, "epoch": 4117} {"train_loss": -7.056797981262207, "global_step": 172949, "epoch": 4117} {"train_loss": -6.964387893676758, "global_step": 172950, "epoch": 4117} {"train_loss": -7.108129978179932, "global_step": 172951, "epoch": 4117} {"train_loss": -7.109230041503906, "global_step": 172952, "epoch": 4117} {"train_loss": -6.980868339538574, "global_step": 172953, "epoch": 4117} {"train_loss": -7.11604118347168, "global_step": 172954, "epoch": 4117} {"train_loss": -7.058052925836472, "global_step": 172955, "epoch": 4117, "val_loss": 80095.9609375} {"train_loss": -6.9570817947387695, "global_step": 172956, "epoch": 4118} {"train_loss": -7.145120620727539, "global_step": 172957, "epoch": 4118} {"train_loss": -6.939217567443848, "global_step": 172958, "epoch": 4118} {"train_loss": -7.113683223724365, "global_step": 172959, "epoch": 4118} {"train_loss": -7.051177024841309, "global_step": 172960, "epoch": 4118} {"train_loss": -7.058018684387207, "global_step": 172961, "epoch": 4118} {"train_loss": -7.069496154785156, "global_step": 172962, "epoch": 4118} {"train_loss": -6.955904483795166, "global_step": 172963, "epoch": 4118} {"train_loss": -7.054965972900391, "global_step": 172964, "epoch": 4118} {"train_loss": -7.053498268127441, "global_step": 172965, "epoch": 4118} {"train_loss": -7.053829193115234, "global_step": 172966, "epoch": 4118} {"train_loss": -7.073879241943359, "global_step": 172967, "epoch": 4118} {"train_loss": -7.111556529998779, "global_step": 172968, "epoch": 4118} {"train_loss": -7.104692459106445, "global_step": 172969, "epoch": 4118} {"train_loss": -7.1265177726745605, "global_step": 172970, "epoch": 4118} {"train_loss": -7.13800048828125, "global_step": 172971, "epoch": 4118} {"train_loss": -7.157470703125, "global_step": 172972, "epoch": 4118} {"train_loss": -7.090911865234375, "global_step": 172973, "epoch": 4118} {"train_loss": -7.014219284057617, "global_step": 172974, "epoch": 4118} {"train_loss": -7.173545837402344, "global_step": 172975, "epoch": 4118} {"train_loss": -7.085563659667969, "global_step": 172976, "epoch": 4118} {"train_loss": -7.042599678039551, "global_step": 172977, "epoch": 4118} {"train_loss": -7.042646408081055, "global_step": 172978, "epoch": 4118} {"train_loss": -7.160711765289307, "global_step": 172979, "epoch": 4118} {"train_loss": -7.07142972946167, "global_step": 172980, "epoch": 4118} {"train_loss": -7.146399021148682, "global_step": 172981, "epoch": 4118} {"train_loss": -7.117000102996826, "global_step": 172982, "epoch": 4118} {"train_loss": -7.119749546051025, "global_step": 172983, "epoch": 4118} {"train_loss": -7.119563102722168, "global_step": 172984, "epoch": 4118} {"train_loss": -7.097253799438477, "global_step": 172985, "epoch": 4118} {"train_loss": -7.298287868499756, "global_step": 172986, "epoch": 4118} {"train_loss": -7.026966094970703, "global_step": 172987, "epoch": 4118} {"train_loss": -7.1761016845703125, "global_step": 172988, "epoch": 4118} {"train_loss": -7.153799057006836, "global_step": 172989, "epoch": 4118} {"train_loss": -7.022245407104492, "global_step": 172990, "epoch": 4118} {"train_loss": -7.134984016418457, "global_step": 172991, "epoch": 4118} {"train_loss": -7.151030540466309, "global_step": 172992, "epoch": 4118} {"train_loss": -6.9956817626953125, "global_step": 172993, "epoch": 4118} {"train_loss": -7.064968109130859, "global_step": 172994, "epoch": 4118} {"train_loss": -7.222128391265869, "global_step": 172995, "epoch": 4118} {"train_loss": -7.2190351486206055, "global_step": 172996, "epoch": 4118} {"train_loss": -7.096184844062442, "global_step": 172997, "epoch": 4118, "val_loss": 79938.3046875} {"train_loss": -7.072481155395508, "global_step": 172998, "epoch": 4119} {"train_loss": -6.949678421020508, "global_step": 172999, "epoch": 4119} {"train_loss": -7.046645164489746, "global_step": 173000, "epoch": 4119} {"train_loss": -7.067714691162109, "global_step": 173001, "epoch": 4119} {"train_loss": -7.095916748046875, "global_step": 173002, "epoch": 4119} {"train_loss": -7.074174880981445, "global_step": 173003, "epoch": 4119} {"train_loss": -7.056903839111328, "global_step": 173004, "epoch": 4119} {"train_loss": -7.0035080909729, "global_step": 173005, "epoch": 4119} {"train_loss": -6.937253475189209, "global_step": 173006, "epoch": 4119} {"train_loss": -7.039211273193359, "global_step": 173007, "epoch": 4119} {"train_loss": -7.071854591369629, "global_step": 173008, "epoch": 4119} {"train_loss": -7.041810989379883, "global_step": 173009, "epoch": 4119} {"train_loss": -7.063765525817871, "global_step": 173010, "epoch": 4119} {"train_loss": -7.12320613861084, "global_step": 173011, "epoch": 4119} {"train_loss": -7.079620361328125, "global_step": 173012, "epoch": 4119} {"train_loss": -7.154264450073242, "global_step": 173013, "epoch": 4119} {"train_loss": -7.074824810028076, "global_step": 173014, "epoch": 4119} {"train_loss": -7.037839889526367, "global_step": 173015, "epoch": 4119} {"train_loss": -6.9958295822143555, "global_step": 173016, "epoch": 4119} {"train_loss": -7.103254318237305, "global_step": 173017, "epoch": 4119} {"train_loss": -7.0391998291015625, "global_step": 173018, "epoch": 4119} {"train_loss": -7.015252113342285, "global_step": 173019, "epoch": 4119} {"train_loss": -6.996655464172363, "global_step": 173020, "epoch": 4119} {"train_loss": -7.11965799331665, "global_step": 173021, "epoch": 4119} {"train_loss": -6.982656002044678, "global_step": 173022, "epoch": 4119} {"train_loss": -6.981712341308594, "global_step": 173023, "epoch": 4119} {"train_loss": -7.001820087432861, "global_step": 173024, "epoch": 4119} {"train_loss": -6.865377426147461, "global_step": 173025, "epoch": 4119} {"train_loss": -7.014865875244141, "global_step": 173026, "epoch": 4119} {"train_loss": -7.105096817016602, "global_step": 173027, "epoch": 4119} {"train_loss": -7.015340805053711, "global_step": 173028, "epoch": 4119} {"train_loss": -7.050492286682129, "global_step": 173029, "epoch": 4119} {"train_loss": -7.047921180725098, "global_step": 173030, "epoch": 4119} {"train_loss": -7.08740234375, "global_step": 173031, "epoch": 4119} {"train_loss": -7.054337501525879, "global_step": 173032, "epoch": 4119} {"train_loss": -6.994675636291504, "global_step": 173033, "epoch": 4119} {"train_loss": -7.112739086151123, "global_step": 173034, "epoch": 4119} {"train_loss": -7.046771049499512, "global_step": 173035, "epoch": 4119} {"train_loss": -6.948412895202637, "global_step": 173036, "epoch": 4119} {"train_loss": -7.133739471435547, "global_step": 173037, "epoch": 4119} {"train_loss": -7.068993091583252, "global_step": 173038, "epoch": 4119} {"train_loss": -7.044718083881197, "global_step": 173039, "epoch": 4119, "val_loss": 80098.0859375} {"train_loss": -7.134003639221191, "global_step": 173040, "epoch": 4120} {"train_loss": -7.071479797363281, "global_step": 173041, "epoch": 4120} {"train_loss": -7.110838413238525, "global_step": 173042, "epoch": 4120} {"train_loss": -7.107508659362793, "global_step": 173043, "epoch": 4120} {"train_loss": -7.003479957580566, "global_step": 173044, "epoch": 4120} {"train_loss": -6.9871039390563965, "global_step": 173045, "epoch": 4120} {"train_loss": -7.009631156921387, "global_step": 173046, "epoch": 4120} {"train_loss": -7.0975117683410645, "global_step": 173047, "epoch": 4120} {"train_loss": -7.044043064117432, "global_step": 173048, "epoch": 4120} {"train_loss": -7.032677173614502, "global_step": 173049, "epoch": 4120} {"train_loss": -7.026345252990723, "global_step": 173050, "epoch": 4120} {"train_loss": -6.999971389770508, "global_step": 173051, "epoch": 4120} {"train_loss": -7.031918525695801, "global_step": 173052, "epoch": 4120} {"train_loss": -7.047393321990967, "global_step": 173053, "epoch": 4120} {"train_loss": -6.948091506958008, "global_step": 173054, "epoch": 4120} {"train_loss": -7.07451057434082, "global_step": 173055, "epoch": 4120} {"train_loss": -7.040447235107422, "global_step": 173056, "epoch": 4120} {"train_loss": -7.019276142120361, "global_step": 173057, "epoch": 4120} {"train_loss": -7.045644760131836, "global_step": 173058, "epoch": 4120} {"train_loss": -6.971048355102539, "global_step": 173059, "epoch": 4120} {"train_loss": -7.026991844177246, "global_step": 173060, "epoch": 4120} {"train_loss": -7.1304097175598145, "global_step": 173061, "epoch": 4120} {"train_loss": -7.150088787078857, "global_step": 173062, "epoch": 4120} {"train_loss": -7.094061851501465, "global_step": 173063, "epoch": 4120} {"train_loss": -7.076534271240234, "global_step": 173064, "epoch": 4120} {"train_loss": -6.992726802825928, "global_step": 173065, "epoch": 4120} {"train_loss": -7.114925384521484, "global_step": 173066, "epoch": 4120} {"train_loss": -6.940865516662598, "global_step": 173067, "epoch": 4120} {"train_loss": -7.112014293670654, "global_step": 173068, "epoch": 4120} {"train_loss": -6.801239013671875, "global_step": 173069, "epoch": 4120} {"train_loss": -7.096133232116699, "global_step": 173070, "epoch": 4120} {"train_loss": -6.988855361938477, "global_step": 173071, "epoch": 4120} {"train_loss": -7.118224620819092, "global_step": 173072, "epoch": 4120} {"train_loss": -7.10505485534668, "global_step": 173073, "epoch": 4120} {"train_loss": -6.983713150024414, "global_step": 173074, "epoch": 4120} {"train_loss": -7.020481109619141, "global_step": 173075, "epoch": 4120} {"train_loss": -6.939718723297119, "global_step": 173076, "epoch": 4120} {"train_loss": -7.0424089431762695, "global_step": 173077, "epoch": 4120} {"train_loss": -7.0845112800598145, "global_step": 173078, "epoch": 4120} {"train_loss": -6.889077186584473, "global_step": 173079, "epoch": 4120} {"train_loss": -6.980381488800049, "global_step": 173080, "epoch": 4120} {"train_loss": -7.035783131917317, "global_step": 173081, "epoch": 4120, "val_loss": 80061.234375} {"train_loss": -6.9784674644470215, "global_step": 173082, "epoch": 4121} {"train_loss": -7.038936614990234, "global_step": 173083, "epoch": 4121} {"train_loss": -6.935421943664551, "global_step": 173084, "epoch": 4121} {"train_loss": -7.050652980804443, "global_step": 173085, "epoch": 4121} {"train_loss": -6.993823051452637, "global_step": 173086, "epoch": 4121} {"train_loss": -6.9639692306518555, "global_step": 173087, "epoch": 4121} {"train_loss": -7.0174384117126465, "global_step": 173088, "epoch": 4121} {"train_loss": -6.894402027130127, "global_step": 173089, "epoch": 4121} {"train_loss": -7.0328264236450195, "global_step": 173090, "epoch": 4121} {"train_loss": -6.912980556488037, "global_step": 173091, "epoch": 4121} {"train_loss": -7.068905830383301, "global_step": 173092, "epoch": 4121} {"train_loss": -7.005786895751953, "global_step": 173093, "epoch": 4121} {"train_loss": -6.962680339813232, "global_step": 173094, "epoch": 4121} {"train_loss": -7.108926773071289, "global_step": 173095, "epoch": 4121} {"train_loss": -6.9073076248168945, "global_step": 173096, "epoch": 4121} {"train_loss": -7.059210777282715, "global_step": 173097, "epoch": 4121} {"train_loss": -6.958615303039551, "global_step": 173098, "epoch": 4121} {"train_loss": -7.022004127502441, "global_step": 173099, "epoch": 4121} {"train_loss": -6.889833450317383, "global_step": 173100, "epoch": 4121} {"train_loss": -6.931558132171631, "global_step": 173101, "epoch": 4121} {"train_loss": -6.996926784515381, "global_step": 173102, "epoch": 4121} {"train_loss": -6.992683410644531, "global_step": 173103, "epoch": 4121} {"train_loss": -7.007162094116211, "global_step": 173104, "epoch": 4121} {"train_loss": -6.967157363891602, "global_step": 173105, "epoch": 4121} {"train_loss": -6.995746612548828, "global_step": 173106, "epoch": 4121} {"train_loss": -6.990164756774902, "global_step": 173107, "epoch": 4121} {"train_loss": -7.107057094573975, "global_step": 173108, "epoch": 4121} {"train_loss": -7.035600662231445, "global_step": 173109, "epoch": 4121} {"train_loss": -7.002556800842285, "global_step": 173110, "epoch": 4121} {"train_loss": -7.124777793884277, "global_step": 173111, "epoch": 4121} {"train_loss": -7.14218282699585, "global_step": 173112, "epoch": 4121} {"train_loss": -7.071404457092285, "global_step": 173113, "epoch": 4121} {"train_loss": -7.106419086456299, "global_step": 173114, "epoch": 4121} {"train_loss": -7.02938175201416, "global_step": 173115, "epoch": 4121} {"train_loss": -7.029970645904541, "global_step": 173116, "epoch": 4121} {"train_loss": -7.057499408721924, "global_step": 173117, "epoch": 4121} {"train_loss": -7.176573276519775, "global_step": 173118, "epoch": 4121} {"train_loss": -7.102980136871338, "global_step": 173119, "epoch": 4121} {"train_loss": -7.117161750793457, "global_step": 173120, "epoch": 4121} {"train_loss": -7.155829906463623, "global_step": 173121, "epoch": 4121} {"train_loss": -7.097716331481934, "global_step": 173122, "epoch": 4121} {"train_loss": -7.028662250155494, "global_step": 173123, "epoch": 4121, "val_loss": 79873.9921875} {"train_loss": -7.213832855224609, "global_step": 173124, "epoch": 4122} {"train_loss": -7.162777900695801, "global_step": 173125, "epoch": 4122} {"train_loss": -7.166340351104736, "global_step": 173126, "epoch": 4122} {"train_loss": -7.185878753662109, "global_step": 173127, "epoch": 4122} {"train_loss": -7.114875316619873, "global_step": 173128, "epoch": 4122} {"train_loss": -7.141911029815674, "global_step": 173129, "epoch": 4122} {"train_loss": -7.018816947937012, "global_step": 173130, "epoch": 4122} {"train_loss": -6.952470302581787, "global_step": 173131, "epoch": 4122} {"train_loss": -7.060467720031738, "global_step": 173132, "epoch": 4122} {"train_loss": -7.030014991760254, "global_step": 173133, "epoch": 4122} {"train_loss": -6.95128059387207, "global_step": 173134, "epoch": 4122} {"train_loss": -7.041937828063965, "global_step": 173135, "epoch": 4122} {"train_loss": -6.984684467315674, "global_step": 173136, "epoch": 4122} {"train_loss": -7.1131720542907715, "global_step": 173137, "epoch": 4122} {"train_loss": -7.010953903198242, "global_step": 173138, "epoch": 4122} {"train_loss": -7.071006774902344, "global_step": 173139, "epoch": 4122} {"train_loss": -7.113869667053223, "global_step": 173140, "epoch": 4122} {"train_loss": -7.09305477142334, "global_step": 173141, "epoch": 4122} {"train_loss": -7.038569450378418, "global_step": 173142, "epoch": 4122} {"train_loss": -7.090023040771484, "global_step": 173143, "epoch": 4122} {"train_loss": -7.075511932373047, "global_step": 173144, "epoch": 4122} {"train_loss": -7.156483173370361, "global_step": 173145, "epoch": 4122} {"train_loss": -7.059915542602539, "global_step": 173146, "epoch": 4122} {"train_loss": -7.156428337097168, "global_step": 173147, "epoch": 4122} {"train_loss": -7.073071002960205, "global_step": 173148, "epoch": 4122} {"train_loss": -7.062036991119385, "global_step": 173149, "epoch": 4122} {"train_loss": -7.12696647644043, "global_step": 173150, "epoch": 4122} {"train_loss": -7.188251495361328, "global_step": 173151, "epoch": 4122} {"train_loss": -7.044290542602539, "global_step": 173152, "epoch": 4122} {"train_loss": -7.269750595092773, "global_step": 173153, "epoch": 4122} {"train_loss": -7.09010648727417, "global_step": 173154, "epoch": 4122} {"train_loss": -7.003107070922852, "global_step": 173155, "epoch": 4122} {"train_loss": -7.091089248657227, "global_step": 173156, "epoch": 4122} {"train_loss": -7.092871189117432, "global_step": 173157, "epoch": 4122} {"train_loss": -7.018218517303467, "global_step": 173158, "epoch": 4122} {"train_loss": -7.165232181549072, "global_step": 173159, "epoch": 4122} {"train_loss": -7.149845123291016, "global_step": 173160, "epoch": 4122} {"train_loss": -7.167051315307617, "global_step": 173161, "epoch": 4122} {"train_loss": -7.062327861785889, "global_step": 173162, "epoch": 4122} {"train_loss": -7.082277297973633, "global_step": 173163, "epoch": 4122} {"train_loss": -7.1310200691223145, "global_step": 173164, "epoch": 4122} {"train_loss": -7.093727270762126, "global_step": 173165, "epoch": 4122, "val_loss": 79942.265625} {"train_loss": -7.027040481567383, "global_step": 173166, "epoch": 4123} {"train_loss": -7.190086364746094, "global_step": 173167, "epoch": 4123} {"train_loss": -7.061838626861572, "global_step": 173168, "epoch": 4123} {"train_loss": -7.206545829772949, "global_step": 173169, "epoch": 4123} {"train_loss": -7.154234886169434, "global_step": 173170, "epoch": 4123} {"train_loss": -7.129303932189941, "global_step": 173171, "epoch": 4123} {"train_loss": -7.0736775398254395, "global_step": 173172, "epoch": 4123} {"train_loss": -7.152066230773926, "global_step": 173173, "epoch": 4123} {"train_loss": -7.181462287902832, "global_step": 173174, "epoch": 4123} {"train_loss": -7.027064800262451, "global_step": 173175, "epoch": 4123} {"train_loss": -7.144986629486084, "global_step": 173176, "epoch": 4123} {"train_loss": -7.142242431640625, "global_step": 173177, "epoch": 4123} {"train_loss": -7.180757999420166, "global_step": 173178, "epoch": 4123} {"train_loss": -7.191366195678711, "global_step": 173179, "epoch": 4123} {"train_loss": -7.186826229095459, "global_step": 173180, "epoch": 4123} {"train_loss": -7.137791633605957, "global_step": 173181, "epoch": 4123} {"train_loss": -7.132457256317139, "global_step": 173182, "epoch": 4123} {"train_loss": -7.132014274597168, "global_step": 173183, "epoch": 4123} {"train_loss": -7.1524505615234375, "global_step": 173184, "epoch": 4123} {"train_loss": -7.175057411193848, "global_step": 173185, "epoch": 4123} {"train_loss": -7.205549716949463, "global_step": 173186, "epoch": 4123} {"train_loss": -7.08209228515625, "global_step": 173187, "epoch": 4123} {"train_loss": -7.084873199462891, "global_step": 173188, "epoch": 4123} {"train_loss": -7.236208915710449, "global_step": 173189, "epoch": 4123} {"train_loss": -7.0980119705200195, "global_step": 173190, "epoch": 4123} {"train_loss": -6.996678829193115, "global_step": 173191, "epoch": 4123} {"train_loss": -7.073496341705322, "global_step": 173192, "epoch": 4123} {"train_loss": -6.970483303070068, "global_step": 173193, "epoch": 4123} {"train_loss": -7.110410690307617, "global_step": 173194, "epoch": 4123} {"train_loss": -7.058786869049072, "global_step": 173195, "epoch": 4123} {"train_loss": -7.1524763107299805, "global_step": 173196, "epoch": 4123} {"train_loss": -6.98582649230957, "global_step": 173197, "epoch": 4123} {"train_loss": -7.183737754821777, "global_step": 173198, "epoch": 4123} {"train_loss": -6.985965728759766, "global_step": 173199, "epoch": 4123} {"train_loss": -7.0756964683532715, "global_step": 173200, "epoch": 4123} {"train_loss": -7.039587020874023, "global_step": 173201, "epoch": 4123} {"train_loss": -7.165702819824219, "global_step": 173202, "epoch": 4123} {"train_loss": -7.149386405944824, "global_step": 173203, "epoch": 4123} {"train_loss": -7.015510559082031, "global_step": 173204, "epoch": 4123} {"train_loss": -6.862856388092041, "global_step": 173205, "epoch": 4123} {"train_loss": -7.066946983337402, "global_step": 173206, "epoch": 4123} {"train_loss": -7.104511499404907, "global_step": 173207, "epoch": 4123, "val_loss": 80008.453125} {"train_loss": -7.079924583435059, "global_step": 173208, "epoch": 4124} {"train_loss": -7.1286773681640625, "global_step": 173209, "epoch": 4124} {"train_loss": -6.96116304397583, "global_step": 173210, "epoch": 4124} {"train_loss": -7.073092460632324, "global_step": 173211, "epoch": 4124} {"train_loss": -6.985751152038574, "global_step": 173212, "epoch": 4124} {"train_loss": -6.98386287689209, "global_step": 173213, "epoch": 4124} {"train_loss": -7.1059699058532715, "global_step": 173214, "epoch": 4124} {"train_loss": -7.018790245056152, "global_step": 173215, "epoch": 4124} {"train_loss": -7.10879373550415, "global_step": 173216, "epoch": 4124} {"train_loss": -7.073302745819092, "global_step": 173217, "epoch": 4124} {"train_loss": -6.9864702224731445, "global_step": 173218, "epoch": 4124} {"train_loss": -7.054507732391357, "global_step": 173219, "epoch": 4124} {"train_loss": -7.109115123748779, "global_step": 173220, "epoch": 4124} {"train_loss": -7.014286994934082, "global_step": 173221, "epoch": 4124} {"train_loss": -6.973241329193115, "global_step": 173222, "epoch": 4124} {"train_loss": -7.044736862182617, "global_step": 173223, "epoch": 4124} {"train_loss": -7.179512023925781, "global_step": 173224, "epoch": 4124} {"train_loss": -7.125340938568115, "global_step": 173225, "epoch": 4124} {"train_loss": -7.077579498291016, "global_step": 173226, "epoch": 4124} {"train_loss": -7.03938627243042, "global_step": 173227, "epoch": 4124} {"train_loss": -7.178413391113281, "global_step": 173228, "epoch": 4124} {"train_loss": -7.122544288635254, "global_step": 173229, "epoch": 4124} {"train_loss": -7.1551313400268555, "global_step": 173230, "epoch": 4124} {"train_loss": -7.1255598068237305, "global_step": 173231, "epoch": 4124} {"train_loss": -7.094422340393066, "global_step": 173232, "epoch": 4124} {"train_loss": -7.057433128356934, "global_step": 173233, "epoch": 4124} {"train_loss": -7.047279357910156, "global_step": 173234, "epoch": 4124} {"train_loss": -7.145739555358887, "global_step": 173235, "epoch": 4124} {"train_loss": -7.133284091949463, "global_step": 173236, "epoch": 4124} {"train_loss": -7.053380489349365, "global_step": 173237, "epoch": 4124} {"train_loss": -7.119910717010498, "global_step": 173238, "epoch": 4124} {"train_loss": -7.087136268615723, "global_step": 173239, "epoch": 4124} {"train_loss": -6.98280143737793, "global_step": 173240, "epoch": 4124} {"train_loss": -7.155175685882568, "global_step": 173241, "epoch": 4124} {"train_loss": -7.1287689208984375, "global_step": 173242, "epoch": 4124} {"train_loss": -7.048806190490723, "global_step": 173243, "epoch": 4124} {"train_loss": -7.0978312492370605, "global_step": 173244, "epoch": 4124} {"train_loss": -7.143967628479004, "global_step": 173245, "epoch": 4124} {"train_loss": -7.139965057373047, "global_step": 173246, "epoch": 4124} {"train_loss": -7.089660167694092, "global_step": 173247, "epoch": 4124} {"train_loss": -7.050894737243652, "global_step": 173248, "epoch": 4124} {"train_loss": -7.077722765150524, "global_step": 173249, "epoch": 4124, "val_loss": 79944.2734375} {"train_loss": -7.244425296783447, "global_step": 173250, "epoch": 4125} {"train_loss": -7.1404595375061035, "global_step": 173251, "epoch": 4125} {"train_loss": -7.207392692565918, "global_step": 173252, "epoch": 4125} {"train_loss": -7.164065837860107, "global_step": 173253, "epoch": 4125} {"train_loss": -7.141234397888184, "global_step": 173254, "epoch": 4125} {"train_loss": -7.158431053161621, "global_step": 173255, "epoch": 4125} {"train_loss": -7.1308393478393555, "global_step": 173256, "epoch": 4125} {"train_loss": -7.022580146789551, "global_step": 173257, "epoch": 4125} {"train_loss": -7.180590629577637, "global_step": 173258, "epoch": 4125} {"train_loss": -7.117702484130859, "global_step": 173259, "epoch": 4125} {"train_loss": -7.024572372436523, "global_step": 173260, "epoch": 4125} {"train_loss": -7.195096969604492, "global_step": 173261, "epoch": 4125} {"train_loss": -7.021982192993164, "global_step": 173262, "epoch": 4125} {"train_loss": -7.125947952270508, "global_step": 173263, "epoch": 4125} {"train_loss": -7.082868576049805, "global_step": 173264, "epoch": 4125} {"train_loss": -7.056853294372559, "global_step": 173265, "epoch": 4125} {"train_loss": -7.064359664916992, "global_step": 173266, "epoch": 4125} {"train_loss": -7.090048313140869, "global_step": 173267, "epoch": 4125} {"train_loss": -7.22430419921875, "global_step": 173268, "epoch": 4125} {"train_loss": -7.152993202209473, "global_step": 173269, "epoch": 4125} {"train_loss": -7.012782096862793, "global_step": 173270, "epoch": 4125} {"train_loss": -7.146759033203125, "global_step": 173271, "epoch": 4125} {"train_loss": -7.214426040649414, "global_step": 173272, "epoch": 4125} {"train_loss": -7.0384416580200195, "global_step": 173273, "epoch": 4125} {"train_loss": -7.115897178649902, "global_step": 173274, "epoch": 4125} {"train_loss": -7.108049392700195, "global_step": 173275, "epoch": 4125} {"train_loss": -7.166741371154785, "global_step": 173276, "epoch": 4125} {"train_loss": -7.060632705688477, "global_step": 173277, "epoch": 4125} {"train_loss": -7.092797756195068, "global_step": 173278, "epoch": 4125} {"train_loss": -7.1264801025390625, "global_step": 173279, "epoch": 4125} {"train_loss": -7.130817890167236, "global_step": 173280, "epoch": 4125} {"train_loss": -7.186227321624756, "global_step": 173281, "epoch": 4125} {"train_loss": -7.237049579620361, "global_step": 173282, "epoch": 4125} {"train_loss": -7.1597442626953125, "global_step": 173283, "epoch": 4125} {"train_loss": -7.082398414611816, "global_step": 173284, "epoch": 4125} {"train_loss": -7.089130401611328, "global_step": 173285, "epoch": 4125} {"train_loss": -7.090286731719971, "global_step": 173286, "epoch": 4125} {"train_loss": -7.2307329177856445, "global_step": 173287, "epoch": 4125} {"train_loss": -7.152286529541016, "global_step": 173288, "epoch": 4125} {"train_loss": -7.107731819152832, "global_step": 173289, "epoch": 4125} {"train_loss": -7.031669616699219, "global_step": 173290, "epoch": 4125} {"train_loss": -7.124287162508283, "global_step": 173291, "epoch": 4125, "val_loss": 80056.53125} {"train_loss": -7.013750076293945, "global_step": 173292, "epoch": 4126} {"train_loss": -7.087398052215576, "global_step": 173293, "epoch": 4126} {"train_loss": -7.125854969024658, "global_step": 173294, "epoch": 4126} {"train_loss": -7.2330403327941895, "global_step": 173295, "epoch": 4126} {"train_loss": -7.106996059417725, "global_step": 173296, "epoch": 4126} {"train_loss": -7.108737945556641, "global_step": 173297, "epoch": 4126} {"train_loss": -7.101251602172852, "global_step": 173298, "epoch": 4126} {"train_loss": -7.032293319702148, "global_step": 173299, "epoch": 4126} {"train_loss": -7.0106730461120605, "global_step": 173300, "epoch": 4126} {"train_loss": -7.066049098968506, "global_step": 173301, "epoch": 4126} {"train_loss": -7.067869186401367, "global_step": 173302, "epoch": 4126} {"train_loss": -7.034658432006836, "global_step": 173303, "epoch": 4126} {"train_loss": -7.132776260375977, "global_step": 173304, "epoch": 4126} {"train_loss": -7.019559860229492, "global_step": 173305, "epoch": 4126} {"train_loss": -7.042845726013184, "global_step": 173306, "epoch": 4126} {"train_loss": -7.078958034515381, "global_step": 173307, "epoch": 4126} {"train_loss": -7.12460470199585, "global_step": 173308, "epoch": 4126} {"train_loss": -7.034988880157471, "global_step": 173309, "epoch": 4126} {"train_loss": -7.036710739135742, "global_step": 173310, "epoch": 4126} {"train_loss": -7.103910446166992, "global_step": 173311, "epoch": 4126} {"train_loss": -7.035434722900391, "global_step": 173312, "epoch": 4126} {"train_loss": -7.080775260925293, "global_step": 173313, "epoch": 4126} {"train_loss": -7.012417316436768, "global_step": 173314, "epoch": 4126} {"train_loss": -7.215169429779053, "global_step": 173315, "epoch": 4126} {"train_loss": -7.157723903656006, "global_step": 173316, "epoch": 4126} {"train_loss": -7.281720161437988, "global_step": 173317, "epoch": 4126} {"train_loss": -7.102207183837891, "global_step": 173318, "epoch": 4126} {"train_loss": -7.066339015960693, "global_step": 173319, "epoch": 4126} {"train_loss": -7.179872512817383, "global_step": 173320, "epoch": 4126} {"train_loss": -6.926310062408447, "global_step": 173321, "epoch": 4126} {"train_loss": -7.017590522766113, "global_step": 173322, "epoch": 4126} {"train_loss": -7.118135929107666, "global_step": 173323, "epoch": 4126} {"train_loss": -7.064810752868652, "global_step": 173324, "epoch": 4126} {"train_loss": -6.976068496704102, "global_step": 173325, "epoch": 4126} {"train_loss": -7.122358322143555, "global_step": 173326, "epoch": 4126} {"train_loss": -6.95508337020874, "global_step": 173327, "epoch": 4126} {"train_loss": -6.937451362609863, "global_step": 173328, "epoch": 4126} {"train_loss": -6.979912757873535, "global_step": 173329, "epoch": 4126} {"train_loss": -7.033240795135498, "global_step": 173330, "epoch": 4126} {"train_loss": -6.946226119995117, "global_step": 173331, "epoch": 4126} {"train_loss": -6.899749279022217, "global_step": 173332, "epoch": 4126} {"train_loss": -7.06630726087661, "global_step": 173333, "epoch": 4126, "val_loss": 79917.9140625} {"train_loss": -6.8283514976501465, "global_step": 173334, "epoch": 4127} {"train_loss": -7.0004754066467285, "global_step": 173335, "epoch": 4127} {"train_loss": -7.077842712402344, "global_step": 173336, "epoch": 4127} {"train_loss": -7.106990814208984, "global_step": 173337, "epoch": 4127} {"train_loss": -7.083279609680176, "global_step": 173338, "epoch": 4127} {"train_loss": -6.9332475662231445, "global_step": 173339, "epoch": 4127} {"train_loss": -7.094342231750488, "global_step": 173340, "epoch": 4127} {"train_loss": -7.064940452575684, "global_step": 173341, "epoch": 4127} {"train_loss": -7.116035461425781, "global_step": 173342, "epoch": 4127} {"train_loss": -7.055312156677246, "global_step": 173343, "epoch": 4127} {"train_loss": -7.080595016479492, "global_step": 173344, "epoch": 4127} {"train_loss": -7.085331439971924, "global_step": 173345, "epoch": 4127} {"train_loss": -7.108473777770996, "global_step": 173346, "epoch": 4127} {"train_loss": -7.07341194152832, "global_step": 173347, "epoch": 4127} {"train_loss": -7.100239276885986, "global_step": 173348, "epoch": 4127} {"train_loss": -7.013867378234863, "global_step": 173349, "epoch": 4127} {"train_loss": -7.153717041015625, "global_step": 173350, "epoch": 4127} {"train_loss": -7.098170757293701, "global_step": 173351, "epoch": 4127} {"train_loss": -7.136996746063232, "global_step": 173352, "epoch": 4127} {"train_loss": -7.141543388366699, "global_step": 173353, "epoch": 4127} {"train_loss": -6.977118492126465, "global_step": 173354, "epoch": 4127} {"train_loss": -7.146963596343994, "global_step": 173355, "epoch": 4127} {"train_loss": -7.088213920593262, "global_step": 173356, "epoch": 4127} {"train_loss": -7.000470161437988, "global_step": 173357, "epoch": 4127} {"train_loss": -7.008793830871582, "global_step": 173358, "epoch": 4127} {"train_loss": -7.082047462463379, "global_step": 173359, "epoch": 4127} {"train_loss": -6.997923851013184, "global_step": 173360, "epoch": 4127} {"train_loss": -6.960290431976318, "global_step": 173361, "epoch": 4127} {"train_loss": -7.110747337341309, "global_step": 173362, "epoch": 4127} {"train_loss": -7.09465217590332, "global_step": 173363, "epoch": 4127} {"train_loss": -7.193403244018555, "global_step": 173364, "epoch": 4127} {"train_loss": -7.0922088623046875, "global_step": 173365, "epoch": 4127} {"train_loss": -7.113774299621582, "global_step": 173366, "epoch": 4127} {"train_loss": -7.047275543212891, "global_step": 173367, "epoch": 4127} {"train_loss": -7.048360824584961, "global_step": 173368, "epoch": 4127} {"train_loss": -7.123639106750488, "global_step": 173369, "epoch": 4127} {"train_loss": -7.124265193939209, "global_step": 173370, "epoch": 4127} {"train_loss": -7.014439582824707, "global_step": 173371, "epoch": 4127} {"train_loss": -7.144301414489746, "global_step": 173372, "epoch": 4127} {"train_loss": -7.134003639221191, "global_step": 173373, "epoch": 4127} {"train_loss": -7.1742448806762695, "global_step": 173374, "epoch": 4127} {"train_loss": -7.071935835338774, "global_step": 173375, "epoch": 4127, "val_loss": 79803.4609375} {"train_loss": -6.984695911407471, "global_step": 173376, "epoch": 4128} {"train_loss": -7.003155708312988, "global_step": 173377, "epoch": 4128} {"train_loss": -7.091843128204346, "global_step": 173378, "epoch": 4128} {"train_loss": -7.053305625915527, "global_step": 173379, "epoch": 4128} {"train_loss": -7.047926902770996, "global_step": 173380, "epoch": 4128} {"train_loss": -7.1102070808410645, "global_step": 173381, "epoch": 4128} {"train_loss": -7.067061424255371, "global_step": 173382, "epoch": 4128} {"train_loss": -7.043091773986816, "global_step": 173383, "epoch": 4128} {"train_loss": -6.9756574630737305, "global_step": 173384, "epoch": 4128} {"train_loss": -7.03656530380249, "global_step": 173385, "epoch": 4128} {"train_loss": -7.057734489440918, "global_step": 173386, "epoch": 4128} {"train_loss": -6.949585437774658, "global_step": 173387, "epoch": 4128} {"train_loss": -7.076324939727783, "global_step": 173388, "epoch": 4128} {"train_loss": -6.92820930480957, "global_step": 173389, "epoch": 4128} {"train_loss": -6.889698505401611, "global_step": 173390, "epoch": 4128} {"train_loss": -6.990838050842285, "global_step": 173391, "epoch": 4128} {"train_loss": -6.987142562866211, "global_step": 173392, "epoch": 4128} {"train_loss": -6.82730770111084, "global_step": 173393, "epoch": 4128} {"train_loss": -7.024514198303223, "global_step": 173394, "epoch": 4128} {"train_loss": -6.911831378936768, "global_step": 173395, "epoch": 4128} {"train_loss": -6.990065097808838, "global_step": 173396, "epoch": 4128} {"train_loss": -7.092477798461914, "global_step": 173397, "epoch": 4128} {"train_loss": -6.930698394775391, "global_step": 173398, "epoch": 4128} {"train_loss": -7.029478549957275, "global_step": 173399, "epoch": 4128} {"train_loss": -6.976553916931152, "global_step": 173400, "epoch": 4128} {"train_loss": -6.978792667388916, "global_step": 173401, "epoch": 4128} {"train_loss": -7.032707691192627, "global_step": 173402, "epoch": 4128} {"train_loss": -6.9464263916015625, "global_step": 173403, "epoch": 4128} {"train_loss": -6.924333572387695, "global_step": 173404, "epoch": 4128} {"train_loss": -7.037389755249023, "global_step": 173405, "epoch": 4128} {"train_loss": -6.936293601989746, "global_step": 173406, "epoch": 4128} {"train_loss": -7.024923801422119, "global_step": 173407, "epoch": 4128} {"train_loss": -6.99528169631958, "global_step": 173408, "epoch": 4128} {"train_loss": -6.875613689422607, "global_step": 173409, "epoch": 4128} {"train_loss": -7.004970550537109, "global_step": 173410, "epoch": 4128} {"train_loss": -7.016391754150391, "global_step": 173411, "epoch": 4128} {"train_loss": -7.080315589904785, "global_step": 173412, "epoch": 4128} {"train_loss": -6.9836883544921875, "global_step": 173413, "epoch": 4128} {"train_loss": -6.951496601104736, "global_step": 173414, "epoch": 4128} {"train_loss": -7.0163774490356445, "global_step": 173415, "epoch": 4128} {"train_loss": -7.109642028808594, "global_step": 173416, "epoch": 4128} {"train_loss": -7.001012223107474, "global_step": 173417, "epoch": 4128, "val_loss": 80060.125} {"train_loss": -7.0583086013793945, "global_step": 173418, "epoch": 4129} {"train_loss": -7.047609806060791, "global_step": 173419, "epoch": 4129} {"train_loss": -7.03179931640625, "global_step": 173420, "epoch": 4129} {"train_loss": -7.115604400634766, "global_step": 173421, "epoch": 4129} {"train_loss": -7.017149925231934, "global_step": 173422, "epoch": 4129} {"train_loss": -7.110418319702148, "global_step": 173423, "epoch": 4129} {"train_loss": -7.097501754760742, "global_step": 173424, "epoch": 4129} {"train_loss": -6.9855241775512695, "global_step": 173425, "epoch": 4129} {"train_loss": -7.090852737426758, "global_step": 173426, "epoch": 4129} {"train_loss": -7.015301704406738, "global_step": 173427, "epoch": 4129} {"train_loss": -7.036886215209961, "global_step": 173428, "epoch": 4129} {"train_loss": -7.137629508972168, "global_step": 173429, "epoch": 4129} {"train_loss": -6.994956016540527, "global_step": 173430, "epoch": 4129} {"train_loss": -7.107730865478516, "global_step": 173431, "epoch": 4129} {"train_loss": -7.064037322998047, "global_step": 173432, "epoch": 4129} {"train_loss": -7.0839338302612305, "global_step": 173433, "epoch": 4129} {"train_loss": -7.129324913024902, "global_step": 173434, "epoch": 4129} {"train_loss": -7.113170623779297, "global_step": 173435, "epoch": 4129} {"train_loss": -6.995659351348877, "global_step": 173436, "epoch": 4129} {"train_loss": -7.150421142578125, "global_step": 173437, "epoch": 4129} {"train_loss": -7.118330478668213, "global_step": 173438, "epoch": 4129} {"train_loss": -7.077537536621094, "global_step": 173439, "epoch": 4129} {"train_loss": -7.125292778015137, "global_step": 173440, "epoch": 4129} {"train_loss": -7.156162261962891, "global_step": 173441, "epoch": 4129} {"train_loss": -7.126303195953369, "global_step": 173442, "epoch": 4129} {"train_loss": -7.18413782119751, "global_step": 173443, "epoch": 4129} {"train_loss": -7.110478401184082, "global_step": 173444, "epoch": 4129} {"train_loss": -7.066446304321289, "global_step": 173445, "epoch": 4129} {"train_loss": -7.107752799987793, "global_step": 173446, "epoch": 4129} {"train_loss": -7.066263198852539, "global_step": 173447, "epoch": 4129} {"train_loss": -6.967827320098877, "global_step": 173448, "epoch": 4129} {"train_loss": -7.135371685028076, "global_step": 173449, "epoch": 4129} {"train_loss": -7.112113952636719, "global_step": 173450, "epoch": 4129} {"train_loss": -7.048988342285156, "global_step": 173451, "epoch": 4129} {"train_loss": -7.009889125823975, "global_step": 173452, "epoch": 4129} {"train_loss": -7.007915496826172, "global_step": 173453, "epoch": 4129} {"train_loss": -6.902130603790283, "global_step": 173454, "epoch": 4129} {"train_loss": -6.9987592697143555, "global_step": 173455, "epoch": 4129} {"train_loss": -6.998230934143066, "global_step": 173456, "epoch": 4129} {"train_loss": -6.932994842529297, "global_step": 173457, "epoch": 4129} {"train_loss": -7.007366180419922, "global_step": 173458, "epoch": 4129} {"train_loss": -7.062747399012248, "global_step": 173459, "epoch": 4129, "val_loss": 80083.03125} {"train_loss": -6.898355484008789, "global_step": 173460, "epoch": 4130} {"train_loss": -7.0771989822387695, "global_step": 173461, "epoch": 4130} {"train_loss": -6.895461559295654, "global_step": 173462, "epoch": 4130} {"train_loss": -6.98549747467041, "global_step": 173463, "epoch": 4130} {"train_loss": -7.073326110839844, "global_step": 173464, "epoch": 4130} {"train_loss": -7.127679824829102, "global_step": 173465, "epoch": 4130} {"train_loss": -7.024366855621338, "global_step": 173466, "epoch": 4130} {"train_loss": -7.09819221496582, "global_step": 173467, "epoch": 4130} {"train_loss": -7.142024040222168, "global_step": 173468, "epoch": 4130} {"train_loss": -6.989065647125244, "global_step": 173469, "epoch": 4130} {"train_loss": -7.1223835945129395, "global_step": 173470, "epoch": 4130} {"train_loss": -6.842119216918945, "global_step": 173471, "epoch": 4130} {"train_loss": -7.166755676269531, "global_step": 173472, "epoch": 4130} {"train_loss": -7.064779281616211, "global_step": 173473, "epoch": 4130} {"train_loss": -7.132848262786865, "global_step": 173474, "epoch": 4130} {"train_loss": -6.967517852783203, "global_step": 173475, "epoch": 4130} {"train_loss": -7.048811912536621, "global_step": 173476, "epoch": 4130} {"train_loss": -7.010225296020508, "global_step": 173477, "epoch": 4130} {"train_loss": -7.012732982635498, "global_step": 173478, "epoch": 4130} {"train_loss": -7.043967247009277, "global_step": 173479, "epoch": 4130} {"train_loss": -7.04208517074585, "global_step": 173480, "epoch": 4130} {"train_loss": -7.085264205932617, "global_step": 173481, "epoch": 4130} {"train_loss": -7.017157077789307, "global_step": 173482, "epoch": 4130} {"train_loss": -7.0367279052734375, "global_step": 173483, "epoch": 4130} {"train_loss": -7.114238739013672, "global_step": 173484, "epoch": 4130} {"train_loss": -7.117775917053223, "global_step": 173485, "epoch": 4130} {"train_loss": -7.176326751708984, "global_step": 173486, "epoch": 4130} {"train_loss": -7.149805068969727, "global_step": 173487, "epoch": 4130} {"train_loss": -7.147442817687988, "global_step": 173488, "epoch": 4130} {"train_loss": -7.027067184448242, "global_step": 173489, "epoch": 4130} {"train_loss": -7.1542863845825195, "global_step": 173490, "epoch": 4130} {"train_loss": -7.17894172668457, "global_step": 173491, "epoch": 4130} {"train_loss": -7.021243572235107, "global_step": 173492, "epoch": 4130} {"train_loss": -7.070509910583496, "global_step": 173493, "epoch": 4130} {"train_loss": -7.1624603271484375, "global_step": 173494, "epoch": 4130} {"train_loss": -7.113759517669678, "global_step": 173495, "epoch": 4130} {"train_loss": -7.039816856384277, "global_step": 173496, "epoch": 4130} {"train_loss": -7.0915961265563965, "global_step": 173497, "epoch": 4130} {"train_loss": -7.031374454498291, "global_step": 173498, "epoch": 4130} {"train_loss": -7.087274551391602, "global_step": 173499, "epoch": 4130} {"train_loss": -7.062773704528809, "global_step": 173500, "epoch": 4130} {"train_loss": -7.064696243831089, "global_step": 173501, "epoch": 4130, "val_loss": 80096.0390625} {"train_loss": -7.034012794494629, "global_step": 173502, "epoch": 4131} {"train_loss": -7.13309383392334, "global_step": 173503, "epoch": 4131} {"train_loss": -7.134638786315918, "global_step": 173504, "epoch": 4131} {"train_loss": -7.149225234985352, "global_step": 173505, "epoch": 4131} {"train_loss": -7.159485816955566, "global_step": 173506, "epoch": 4131} {"train_loss": -7.0575151443481445, "global_step": 173507, "epoch": 4131} {"train_loss": -7.187535762786865, "global_step": 173508, "epoch": 4131} {"train_loss": -7.17879581451416, "global_step": 173509, "epoch": 4131} {"train_loss": -7.123639106750488, "global_step": 173510, "epoch": 4131} {"train_loss": -7.1468000411987305, "global_step": 173511, "epoch": 4131} {"train_loss": -7.199037551879883, "global_step": 173512, "epoch": 4131} {"train_loss": -6.9809160232543945, "global_step": 173513, "epoch": 4131} {"train_loss": -7.058712959289551, "global_step": 173514, "epoch": 4131} {"train_loss": -7.12674617767334, "global_step": 173515, "epoch": 4131} {"train_loss": -7.065885543823242, "global_step": 173516, "epoch": 4131} {"train_loss": -7.098557472229004, "global_step": 173517, "epoch": 4131} {"train_loss": -7.128593444824219, "global_step": 173518, "epoch": 4131} {"train_loss": -7.09990119934082, "global_step": 173519, "epoch": 4131} {"train_loss": -7.023258209228516, "global_step": 173520, "epoch": 4131} {"train_loss": -7.120842933654785, "global_step": 173521, "epoch": 4131} {"train_loss": -7.190225601196289, "global_step": 173522, "epoch": 4131} {"train_loss": -7.1048479080200195, "global_step": 173523, "epoch": 4131} {"train_loss": -7.118077278137207, "global_step": 173524, "epoch": 4131} {"train_loss": -7.0592451095581055, "global_step": 173525, "epoch": 4131} {"train_loss": -7.074760437011719, "global_step": 173526, "epoch": 4131} {"train_loss": -7.049344539642334, "global_step": 173527, "epoch": 4131} {"train_loss": -7.070947647094727, "global_step": 173528, "epoch": 4131} {"train_loss": -7.111067295074463, "global_step": 173529, "epoch": 4131} {"train_loss": -7.167316436767578, "global_step": 173530, "epoch": 4131} {"train_loss": -6.893195152282715, "global_step": 173531, "epoch": 4131} {"train_loss": -7.250536918640137, "global_step": 173532, "epoch": 4131} {"train_loss": -7.118544101715088, "global_step": 173533, "epoch": 4131} {"train_loss": -6.959123611450195, "global_step": 173534, "epoch": 4131} {"train_loss": -7.12415885925293, "global_step": 173535, "epoch": 4131} {"train_loss": -6.988790512084961, "global_step": 173536, "epoch": 4131} {"train_loss": -7.060105800628662, "global_step": 173537, "epoch": 4131} {"train_loss": -7.1987104415893555, "global_step": 173538, "epoch": 4131} {"train_loss": -6.924843788146973, "global_step": 173539, "epoch": 4131} {"train_loss": -6.8500823974609375, "global_step": 173540, "epoch": 4131} {"train_loss": -7.172415733337402, "global_step": 173541, "epoch": 4131} {"train_loss": -6.886788845062256, "global_step": 173542, "epoch": 4131} {"train_loss": -7.087774208613804, "global_step": 173543, "epoch": 4131, "val_loss": 79964.0859375} {"train_loss": -6.948880195617676, "global_step": 173544, "epoch": 4132} {"train_loss": -6.788304328918457, "global_step": 173545, "epoch": 4132} {"train_loss": -7.124339580535889, "global_step": 173546, "epoch": 4132} {"train_loss": -6.9462385177612305, "global_step": 173547, "epoch": 4132} {"train_loss": -6.900352478027344, "global_step": 173548, "epoch": 4132} {"train_loss": -7.001826286315918, "global_step": 173549, "epoch": 4132} {"train_loss": -6.934035301208496, "global_step": 173550, "epoch": 4132} {"train_loss": -7.0239386558532715, "global_step": 173551, "epoch": 4132} {"train_loss": -6.937049865722656, "global_step": 173552, "epoch": 4132} {"train_loss": -7.010872840881348, "global_step": 173553, "epoch": 4132} {"train_loss": -7.021656036376953, "global_step": 173554, "epoch": 4132} {"train_loss": -7.0036187171936035, "global_step": 173555, "epoch": 4132} {"train_loss": -6.868953227996826, "global_step": 173556, "epoch": 4132} {"train_loss": -7.110252380371094, "global_step": 173557, "epoch": 4132} {"train_loss": -6.941027641296387, "global_step": 173558, "epoch": 4132} {"train_loss": -6.9409379959106445, "global_step": 173559, "epoch": 4132} {"train_loss": -7.084450721740723, "global_step": 173560, "epoch": 4132} {"train_loss": -6.904863357543945, "global_step": 173561, "epoch": 4132} {"train_loss": -7.077444076538086, "global_step": 173562, "epoch": 4132} {"train_loss": -7.092187404632568, "global_step": 173563, "epoch": 4132} {"train_loss": -7.017974853515625, "global_step": 173564, "epoch": 4132} {"train_loss": -7.031412124633789, "global_step": 173565, "epoch": 4132} {"train_loss": -6.925113677978516, "global_step": 173566, "epoch": 4132} {"train_loss": -6.993762969970703, "global_step": 173567, "epoch": 4132} {"train_loss": -7.085823059082031, "global_step": 173568, "epoch": 4132} {"train_loss": -7.068469047546387, "global_step": 173569, "epoch": 4132} {"train_loss": -6.803238391876221, "global_step": 173570, "epoch": 4132} {"train_loss": -7.061175346374512, "global_step": 173571, "epoch": 4132} {"train_loss": -6.882654666900635, "global_step": 173572, "epoch": 4132} {"train_loss": -6.833634853363037, "global_step": 173573, "epoch": 4132} {"train_loss": -7.003990173339844, "global_step": 173574, "epoch": 4132} {"train_loss": -6.831912994384766, "global_step": 173575, "epoch": 4132} {"train_loss": -7.0098676681518555, "global_step": 173576, "epoch": 4132} {"train_loss": -6.8427324295043945, "global_step": 173577, "epoch": 4132} {"train_loss": -6.824533462524414, "global_step": 173578, "epoch": 4132} {"train_loss": -6.8816962242126465, "global_step": 173579, "epoch": 4132} {"train_loss": -6.889485836029053, "global_step": 173580, "epoch": 4132} {"train_loss": -7.005841255187988, "global_step": 173581, "epoch": 4132} {"train_loss": -6.820889472961426, "global_step": 173582, "epoch": 4132} {"train_loss": -6.999013900756836, "global_step": 173583, "epoch": 4132} {"train_loss": -6.953537940979004, "global_step": 173584, "epoch": 4132} {"train_loss": -6.962330432165237, "global_step": 173585, "epoch": 4132, "val_loss": 79940.390625} {"train_loss": -6.9583282470703125, "global_step": 173586, "epoch": 4133} {"train_loss": -6.973320007324219, "global_step": 173587, "epoch": 4133} {"train_loss": -6.983798980712891, "global_step": 173588, "epoch": 4133} {"train_loss": -7.010658264160156, "global_step": 173589, "epoch": 4133} {"train_loss": -6.970870018005371, "global_step": 173590, "epoch": 4133} {"train_loss": -7.038732528686523, "global_step": 173591, "epoch": 4133} {"train_loss": -7.029106140136719, "global_step": 173592, "epoch": 4133} {"train_loss": -7.089426040649414, "global_step": 173593, "epoch": 4133} {"train_loss": -6.895802974700928, "global_step": 173594, "epoch": 4133} {"train_loss": -6.979229927062988, "global_step": 173595, "epoch": 4133} {"train_loss": -7.054807662963867, "global_step": 173596, "epoch": 4133} {"train_loss": -7.025233268737793, "global_step": 173597, "epoch": 4133} {"train_loss": -6.937708854675293, "global_step": 173598, "epoch": 4133} {"train_loss": -7.149969100952148, "global_step": 173599, "epoch": 4133} {"train_loss": -7.044728755950928, "global_step": 173600, "epoch": 4133} {"train_loss": -7.151913166046143, "global_step": 173601, "epoch": 4133} {"train_loss": -6.9240241050720215, "global_step": 173602, "epoch": 4133} {"train_loss": -7.117932319641113, "global_step": 173603, "epoch": 4133} {"train_loss": -7.060802459716797, "global_step": 173604, "epoch": 4133} {"train_loss": -7.033097743988037, "global_step": 173605, "epoch": 4133} {"train_loss": -7.107377052307129, "global_step": 173606, "epoch": 4133} {"train_loss": -7.134997367858887, "global_step": 173607, "epoch": 4133} {"train_loss": -7.1041975021362305, "global_step": 173608, "epoch": 4133} {"train_loss": -7.069862365722656, "global_step": 173609, "epoch": 4133} {"train_loss": -7.08293342590332, "global_step": 173610, "epoch": 4133} {"train_loss": -7.063792705535889, "global_step": 173611, "epoch": 4133} {"train_loss": -7.075924396514893, "global_step": 173612, "epoch": 4133} {"train_loss": -6.969069004058838, "global_step": 173613, "epoch": 4133} {"train_loss": -7.154750347137451, "global_step": 173614, "epoch": 4133} {"train_loss": -7.12685489654541, "global_step": 173615, "epoch": 4133} {"train_loss": -7.045488357543945, "global_step": 173616, "epoch": 4133} {"train_loss": -6.975470542907715, "global_step": 173617, "epoch": 4133} {"train_loss": -7.195529937744141, "global_step": 173618, "epoch": 4133} {"train_loss": -7.097866058349609, "global_step": 173619, "epoch": 4133} {"train_loss": -7.146299362182617, "global_step": 173620, "epoch": 4133} {"train_loss": -7.141120910644531, "global_step": 173621, "epoch": 4133} {"train_loss": -7.03375244140625, "global_step": 173622, "epoch": 4133} {"train_loss": -7.095828056335449, "global_step": 173623, "epoch": 4133} {"train_loss": -6.9965105056762695, "global_step": 173624, "epoch": 4133} {"train_loss": -7.087553024291992, "global_step": 173625, "epoch": 4133} {"train_loss": -7.164724349975586, "global_step": 173626, "epoch": 4133} {"train_loss": -7.05483113016401, "global_step": 173627, "epoch": 4133, "val_loss": 80167.578125} {"train_loss": -7.133284568786621, "global_step": 173628, "epoch": 4134} {"train_loss": -7.053797721862793, "global_step": 173629, "epoch": 4134} {"train_loss": -7.049439907073975, "global_step": 173630, "epoch": 4134} {"train_loss": -6.806519508361816, "global_step": 173631, "epoch": 4134} {"train_loss": -7.110391139984131, "global_step": 173632, "epoch": 4134} {"train_loss": -6.9894795417785645, "global_step": 173633, "epoch": 4134} {"train_loss": -6.884570121765137, "global_step": 173634, "epoch": 4134} {"train_loss": -7.126411437988281, "global_step": 173635, "epoch": 4134} {"train_loss": -7.0049896240234375, "global_step": 173636, "epoch": 4134} {"train_loss": -7.081101894378662, "global_step": 173637, "epoch": 4134} {"train_loss": -7.089751720428467, "global_step": 173638, "epoch": 4134} {"train_loss": -6.851449489593506, "global_step": 173639, "epoch": 4134} {"train_loss": -7.130707263946533, "global_step": 173640, "epoch": 4134} {"train_loss": -6.939828872680664, "global_step": 173641, "epoch": 4134} {"train_loss": -7.0582594871521, "global_step": 173642, "epoch": 4134} {"train_loss": -7.025732040405273, "global_step": 173643, "epoch": 4134} {"train_loss": -7.129654407501221, "global_step": 173644, "epoch": 4134} {"train_loss": -7.153783321380615, "global_step": 173645, "epoch": 4134} {"train_loss": -7.086210250854492, "global_step": 173646, "epoch": 4134} {"train_loss": -7.088433265686035, "global_step": 173647, "epoch": 4134} {"train_loss": -7.043203353881836, "global_step": 173648, "epoch": 4134} {"train_loss": -7.103231430053711, "global_step": 173649, "epoch": 4134} {"train_loss": -7.006438255310059, "global_step": 173650, "epoch": 4134} {"train_loss": -7.098781108856201, "global_step": 173651, "epoch": 4134} {"train_loss": -7.060487747192383, "global_step": 173652, "epoch": 4134} {"train_loss": -7.085507392883301, "global_step": 173653, "epoch": 4134} {"train_loss": -7.059297561645508, "global_step": 173654, "epoch": 4134} {"train_loss": -7.142609596252441, "global_step": 173655, "epoch": 4134} {"train_loss": -7.089106559753418, "global_step": 173656, "epoch": 4134} {"train_loss": -7.091555595397949, "global_step": 173657, "epoch": 4134} {"train_loss": -7.164923667907715, "global_step": 173658, "epoch": 4134} {"train_loss": -6.9739789962768555, "global_step": 173659, "epoch": 4134} {"train_loss": -7.074528217315674, "global_step": 173660, "epoch": 4134} {"train_loss": -6.970663547515869, "global_step": 173661, "epoch": 4134} {"train_loss": -6.98053503036499, "global_step": 173662, "epoch": 4134} {"train_loss": -7.023674488067627, "global_step": 173663, "epoch": 4134} {"train_loss": -6.948808670043945, "global_step": 173664, "epoch": 4134} {"train_loss": -6.8848419189453125, "global_step": 173665, "epoch": 4134} {"train_loss": -7.201404094696045, "global_step": 173666, "epoch": 4134} {"train_loss": -7.042366981506348, "global_step": 173667, "epoch": 4134} {"train_loss": -7.143428802490234, "global_step": 173668, "epoch": 4134} {"train_loss": -7.049410161517915, "global_step": 173669, "epoch": 4134, "val_loss": 80056.7421875} {"train_loss": -7.050737380981445, "global_step": 173670, "epoch": 4135} {"train_loss": -7.136760711669922, "global_step": 173671, "epoch": 4135} {"train_loss": -7.046301364898682, "global_step": 173672, "epoch": 4135} {"train_loss": -7.06313943862915, "global_step": 173673, "epoch": 4135} {"train_loss": -7.107706069946289, "global_step": 173674, "epoch": 4135} {"train_loss": -7.109333038330078, "global_step": 173675, "epoch": 4135} {"train_loss": -7.037759780883789, "global_step": 173676, "epoch": 4135} {"train_loss": -7.016077995300293, "global_step": 173677, "epoch": 4135} {"train_loss": -7.058884143829346, "global_step": 173678, "epoch": 4135} {"train_loss": -7.1201863288879395, "global_step": 173679, "epoch": 4135} {"train_loss": -6.852092266082764, "global_step": 173680, "epoch": 4135} {"train_loss": -7.090625762939453, "global_step": 173681, "epoch": 4135} {"train_loss": -7.024774551391602, "global_step": 173682, "epoch": 4135} {"train_loss": -7.043187141418457, "global_step": 173683, "epoch": 4135} {"train_loss": -7.085172653198242, "global_step": 173684, "epoch": 4135} {"train_loss": -7.03974723815918, "global_step": 173685, "epoch": 4135} {"train_loss": -6.972619533538818, "global_step": 173686, "epoch": 4135} {"train_loss": -7.010017395019531, "global_step": 173687, "epoch": 4135} {"train_loss": -7.000887870788574, "global_step": 173688, "epoch": 4135} {"train_loss": -7.020875930786133, "global_step": 173689, "epoch": 4135} {"train_loss": -6.969581604003906, "global_step": 173690, "epoch": 4135} {"train_loss": -6.969931125640869, "global_step": 173691, "epoch": 4135} {"train_loss": -7.042316436767578, "global_step": 173692, "epoch": 4135} {"train_loss": -6.96877384185791, "global_step": 173693, "epoch": 4135} {"train_loss": -6.9900898933410645, "global_step": 173694, "epoch": 4135} {"train_loss": -6.903403282165527, "global_step": 173695, "epoch": 4135} {"train_loss": -6.952353477478027, "global_step": 173696, "epoch": 4135} {"train_loss": -6.933191299438477, "global_step": 173697, "epoch": 4135} {"train_loss": -7.081371784210205, "global_step": 173698, "epoch": 4135} {"train_loss": -7.018594741821289, "global_step": 173699, "epoch": 4135} {"train_loss": -7.079937934875488, "global_step": 173700, "epoch": 4135} {"train_loss": -7.051264762878418, "global_step": 173701, "epoch": 4135} {"train_loss": -7.055050373077393, "global_step": 173702, "epoch": 4135} {"train_loss": -7.071575164794922, "global_step": 173703, "epoch": 4135} {"train_loss": -7.058041572570801, "global_step": 173704, "epoch": 4135} {"train_loss": -6.922340393066406, "global_step": 173705, "epoch": 4135} {"train_loss": -7.055527210235596, "global_step": 173706, "epoch": 4135} {"train_loss": -6.944245338439941, "global_step": 173707, "epoch": 4135} {"train_loss": -6.927798271179199, "global_step": 173708, "epoch": 4135} {"train_loss": -7.040267467498779, "global_step": 173709, "epoch": 4135} {"train_loss": -6.961205005645752, "global_step": 173710, "epoch": 4135} {"train_loss": -7.021352291107178, "global_step": 173711, "epoch": 4135, "val_loss": 79965.53125} {"train_loss": -7.01625919342041, "global_step": 173712, "epoch": 4136} {"train_loss": -6.999564170837402, "global_step": 173713, "epoch": 4136} {"train_loss": -6.968196868896484, "global_step": 173714, "epoch": 4136} {"train_loss": -6.870849132537842, "global_step": 173715, "epoch": 4136} {"train_loss": -6.997096061706543, "global_step": 173716, "epoch": 4136} {"train_loss": -6.938842296600342, "global_step": 173717, "epoch": 4136} {"train_loss": -7.136284828186035, "global_step": 173718, "epoch": 4136} {"train_loss": -6.970452785491943, "global_step": 173719, "epoch": 4136} {"train_loss": -7.019029140472412, "global_step": 173720, "epoch": 4136} {"train_loss": -7.063169002532959, "global_step": 173721, "epoch": 4136} {"train_loss": -6.979469299316406, "global_step": 173722, "epoch": 4136} {"train_loss": -6.990666389465332, "global_step": 173723, "epoch": 4136} {"train_loss": -6.9856133460998535, "global_step": 173724, "epoch": 4136} {"train_loss": -6.954761505126953, "global_step": 173725, "epoch": 4136} {"train_loss": -6.831483840942383, "global_step": 173726, "epoch": 4136} {"train_loss": -7.07615852355957, "global_step": 173727, "epoch": 4136} {"train_loss": -6.921725273132324, "global_step": 173728, "epoch": 4136} {"train_loss": -7.042544364929199, "global_step": 173729, "epoch": 4136} {"train_loss": -6.8939409255981445, "global_step": 173730, "epoch": 4136} {"train_loss": -7.001489162445068, "global_step": 173731, "epoch": 4136} {"train_loss": -7.001293659210205, "global_step": 173732, "epoch": 4136} {"train_loss": -6.944370269775391, "global_step": 173733, "epoch": 4136} {"train_loss": -6.920138359069824, "global_step": 173734, "epoch": 4136} {"train_loss": -7.063982009887695, "global_step": 173735, "epoch": 4136} {"train_loss": -6.997415542602539, "global_step": 173736, "epoch": 4136} {"train_loss": -7.030231475830078, "global_step": 173737, "epoch": 4136} {"train_loss": -7.147222518920898, "global_step": 173738, "epoch": 4136} {"train_loss": -6.931162357330322, "global_step": 173739, "epoch": 4136} {"train_loss": -7.0317182540893555, "global_step": 173740, "epoch": 4136} {"train_loss": -7.074010848999023, "global_step": 173741, "epoch": 4136} {"train_loss": -7.091798782348633, "global_step": 173742, "epoch": 4136} {"train_loss": -7.039394378662109, "global_step": 173743, "epoch": 4136} {"train_loss": -7.02501106262207, "global_step": 173744, "epoch": 4136} {"train_loss": -6.978878021240234, "global_step": 173745, "epoch": 4136} {"train_loss": -7.091891288757324, "global_step": 173746, "epoch": 4136} {"train_loss": -7.076972007751465, "global_step": 173747, "epoch": 4136} {"train_loss": -6.987631797790527, "global_step": 173748, "epoch": 4136} {"train_loss": -7.121978759765625, "global_step": 173749, "epoch": 4136} {"train_loss": -7.052090644836426, "global_step": 173750, "epoch": 4136} {"train_loss": -7.076587677001953, "global_step": 173751, "epoch": 4136} {"train_loss": -7.180923938751221, "global_step": 173752, "epoch": 4136} {"train_loss": -7.015559559776669, "global_step": 173753, "epoch": 4136, "val_loss": 79938.734375} {"train_loss": -7.0370330810546875, "global_step": 173754, "epoch": 4137} {"train_loss": -7.027060508728027, "global_step": 173755, "epoch": 4137} {"train_loss": -7.0616044998168945, "global_step": 173756, "epoch": 4137} {"train_loss": -7.196918964385986, "global_step": 173757, "epoch": 4137} {"train_loss": -6.896509170532227, "global_step": 173758, "epoch": 4137} {"train_loss": -7.1169633865356445, "global_step": 173759, "epoch": 4137} {"train_loss": -7.113523960113525, "global_step": 173760, "epoch": 4137} {"train_loss": -7.130998611450195, "global_step": 173761, "epoch": 4137} {"train_loss": -7.246098518371582, "global_step": 173762, "epoch": 4137} {"train_loss": -7.062286376953125, "global_step": 173763, "epoch": 4137} {"train_loss": -7.192766189575195, "global_step": 173764, "epoch": 4137} {"train_loss": -7.141904354095459, "global_step": 173765, "epoch": 4137} {"train_loss": -7.0629072189331055, "global_step": 173766, "epoch": 4137} {"train_loss": -7.0674967765808105, "global_step": 173767, "epoch": 4137} {"train_loss": -7.120392799377441, "global_step": 173768, "epoch": 4137} {"train_loss": -7.0494866371154785, "global_step": 173769, "epoch": 4137} {"train_loss": -7.125988483428955, "global_step": 173770, "epoch": 4137} {"train_loss": -7.0628662109375, "global_step": 173771, "epoch": 4137} {"train_loss": -7.170737266540527, "global_step": 173772, "epoch": 4137} {"train_loss": -7.128134727478027, "global_step": 173773, "epoch": 4137} {"train_loss": -7.044457912445068, "global_step": 173774, "epoch": 4137} {"train_loss": -7.0931854248046875, "global_step": 173775, "epoch": 4137} {"train_loss": -7.042278289794922, "global_step": 173776, "epoch": 4137} {"train_loss": -7.062248229980469, "global_step": 173777, "epoch": 4137} {"train_loss": -7.10086727142334, "global_step": 173778, "epoch": 4137} {"train_loss": -7.1010212898254395, "global_step": 173779, "epoch": 4137} {"train_loss": -7.1182942390441895, "global_step": 173780, "epoch": 4137} {"train_loss": -7.178874492645264, "global_step": 173781, "epoch": 4137} {"train_loss": -6.965289115905762, "global_step": 173782, "epoch": 4137} {"train_loss": -7.039196014404297, "global_step": 173783, "epoch": 4137} {"train_loss": -7.142692565917969, "global_step": 173784, "epoch": 4137} {"train_loss": -7.031081199645996, "global_step": 173785, "epoch": 4137} {"train_loss": -7.1401214599609375, "global_step": 173786, "epoch": 4137} {"train_loss": -6.9628400802612305, "global_step": 173787, "epoch": 4137} {"train_loss": -7.211647033691406, "global_step": 173788, "epoch": 4137} {"train_loss": -7.122221946716309, "global_step": 173789, "epoch": 4137} {"train_loss": -7.0709757804870605, "global_step": 173790, "epoch": 4137} {"train_loss": -7.12830924987793, "global_step": 173791, "epoch": 4137} {"train_loss": -7.021286964416504, "global_step": 173792, "epoch": 4137} {"train_loss": -7.077523708343506, "global_step": 173793, "epoch": 4137} {"train_loss": -6.9601593017578125, "global_step": 173794, "epoch": 4137} {"train_loss": -7.08931777590797, "global_step": 173795, "epoch": 4137, "val_loss": 80057.1953125} {"train_loss": -6.985909461975098, "global_step": 173796, "epoch": 4138} {"train_loss": -7.071998596191406, "global_step": 173797, "epoch": 4138} {"train_loss": -7.058319091796875, "global_step": 173798, "epoch": 4138} {"train_loss": -7.11100959777832, "global_step": 173799, "epoch": 4138} {"train_loss": -6.9641337394714355, "global_step": 173800, "epoch": 4138} {"train_loss": -7.089084625244141, "global_step": 173801, "epoch": 4138} {"train_loss": -7.09299373626709, "global_step": 173802, "epoch": 4138} {"train_loss": -6.947513103485107, "global_step": 173803, "epoch": 4138} {"train_loss": -6.988015174865723, "global_step": 173804, "epoch": 4138} {"train_loss": -7.135275840759277, "global_step": 173805, "epoch": 4138} {"train_loss": -7.004290580749512, "global_step": 173806, "epoch": 4138} {"train_loss": -7.043001174926758, "global_step": 173807, "epoch": 4138} {"train_loss": -7.16471529006958, "global_step": 173808, "epoch": 4138} {"train_loss": -6.9570722579956055, "global_step": 173809, "epoch": 4138} {"train_loss": -7.145965099334717, "global_step": 173810, "epoch": 4138} {"train_loss": -7.15948486328125, "global_step": 173811, "epoch": 4138} {"train_loss": -7.0182785987854, "global_step": 173812, "epoch": 4138} {"train_loss": -7.032135009765625, "global_step": 173813, "epoch": 4138} {"train_loss": -7.089560031890869, "global_step": 173814, "epoch": 4138} {"train_loss": -7.027530193328857, "global_step": 173815, "epoch": 4138} {"train_loss": -7.01215934753418, "global_step": 173816, "epoch": 4138} {"train_loss": -6.9870686531066895, "global_step": 173817, "epoch": 4138} {"train_loss": -7.161545753479004, "global_step": 173818, "epoch": 4138} {"train_loss": -7.222190856933594, "global_step": 173819, "epoch": 4138} {"train_loss": -6.958378314971924, "global_step": 173820, "epoch": 4138} {"train_loss": -7.009950160980225, "global_step": 173821, "epoch": 4138} {"train_loss": -7.050327301025391, "global_step": 173822, "epoch": 4138} {"train_loss": -7.1287841796875, "global_step": 173823, "epoch": 4138} {"train_loss": -7.086273193359375, "global_step": 173824, "epoch": 4138} {"train_loss": -7.150695323944092, "global_step": 173825, "epoch": 4138} {"train_loss": -7.048232078552246, "global_step": 173826, "epoch": 4138} {"train_loss": -6.899423599243164, "global_step": 173827, "epoch": 4138} {"train_loss": -7.237951278686523, "global_step": 173828, "epoch": 4138} {"train_loss": -7.131700038909912, "global_step": 173829, "epoch": 4138} {"train_loss": -7.030370712280273, "global_step": 173830, "epoch": 4138} {"train_loss": -7.155450820922852, "global_step": 173831, "epoch": 4138} {"train_loss": -7.184395790100098, "global_step": 173832, "epoch": 4138} {"train_loss": -7.131795883178711, "global_step": 173833, "epoch": 4138} {"train_loss": -7.120977401733398, "global_step": 173834, "epoch": 4138} {"train_loss": -7.105550765991211, "global_step": 173835, "epoch": 4138} {"train_loss": -7.076330184936523, "global_step": 173836, "epoch": 4138} {"train_loss": -7.074346122287569, "global_step": 173837, "epoch": 4138, "val_loss": 80157.2890625} {"train_loss": -7.163525104522705, "global_step": 173838, "epoch": 4139} {"train_loss": -7.176470756530762, "global_step": 173839, "epoch": 4139} {"train_loss": -7.164371013641357, "global_step": 173840, "epoch": 4139} {"train_loss": -7.152312278747559, "global_step": 173841, "epoch": 4139} {"train_loss": -6.988861560821533, "global_step": 173842, "epoch": 4139} {"train_loss": -7.074216842651367, "global_step": 173843, "epoch": 4139} {"train_loss": -7.033752918243408, "global_step": 173844, "epoch": 4139} {"train_loss": -7.090883255004883, "global_step": 173845, "epoch": 4139} {"train_loss": -7.011629104614258, "global_step": 173846, "epoch": 4139} {"train_loss": -7.087460994720459, "global_step": 173847, "epoch": 4139} {"train_loss": -7.0910420417785645, "global_step": 173848, "epoch": 4139} {"train_loss": -7.161710739135742, "global_step": 173849, "epoch": 4139} {"train_loss": -7.135989189147949, "global_step": 173850, "epoch": 4139} {"train_loss": -7.09737491607666, "global_step": 173851, "epoch": 4139} {"train_loss": -7.030890464782715, "global_step": 173852, "epoch": 4139} {"train_loss": -7.137697219848633, "global_step": 173853, "epoch": 4139} {"train_loss": -6.971878528594971, "global_step": 173854, "epoch": 4139} {"train_loss": -7.07047176361084, "global_step": 173855, "epoch": 4139} {"train_loss": -7.160154819488525, "global_step": 173856, "epoch": 4139} {"train_loss": -7.027492523193359, "global_step": 173857, "epoch": 4139} {"train_loss": -7.057391166687012, "global_step": 173858, "epoch": 4139} {"train_loss": -7.027825355529785, "global_step": 173859, "epoch": 4139} {"train_loss": -7.027815341949463, "global_step": 173860, "epoch": 4139} {"train_loss": -7.048127174377441, "global_step": 173861, "epoch": 4139} {"train_loss": -6.969804763793945, "global_step": 173862, "epoch": 4139} {"train_loss": -7.2850189208984375, "global_step": 173863, "epoch": 4139} {"train_loss": -7.054710388183594, "global_step": 173864, "epoch": 4139} {"train_loss": -7.026004791259766, "global_step": 173865, "epoch": 4139} {"train_loss": -7.076560974121094, "global_step": 173866, "epoch": 4139} {"train_loss": -7.066842079162598, "global_step": 173867, "epoch": 4139} {"train_loss": -7.167315483093262, "global_step": 173868, "epoch": 4139} {"train_loss": -7.101198196411133, "global_step": 173869, "epoch": 4139} {"train_loss": -6.976548194885254, "global_step": 173870, "epoch": 4139} {"train_loss": -7.167360305786133, "global_step": 173871, "epoch": 4139} {"train_loss": -7.119297027587891, "global_step": 173872, "epoch": 4139} {"train_loss": -7.108699798583984, "global_step": 173873, "epoch": 4139} {"train_loss": -7.059537887573242, "global_step": 173874, "epoch": 4139} {"train_loss": -7.165884971618652, "global_step": 173875, "epoch": 4139} {"train_loss": -7.075931072235107, "global_step": 173876, "epoch": 4139} {"train_loss": -7.062216281890869, "global_step": 173877, "epoch": 4139} {"train_loss": -6.970118522644043, "global_step": 173878, "epoch": 4139} {"train_loss": -7.083299511954898, "global_step": 173879, "epoch": 4139, "val_loss": 80214.6484375} {"train_loss": -7.053719520568848, "global_step": 173880, "epoch": 4140} {"train_loss": -7.094709396362305, "global_step": 173881, "epoch": 4140} {"train_loss": -7.117290496826172, "global_step": 173882, "epoch": 4140} {"train_loss": -7.041543006896973, "global_step": 173883, "epoch": 4140} {"train_loss": -7.034794330596924, "global_step": 173884, "epoch": 4140} {"train_loss": -7.05152702331543, "global_step": 173885, "epoch": 4140} {"train_loss": -7.073458671569824, "global_step": 173886, "epoch": 4140} {"train_loss": -7.154714584350586, "global_step": 173887, "epoch": 4140} {"train_loss": -7.119407653808594, "global_step": 173888, "epoch": 4140} {"train_loss": -7.004060745239258, "global_step": 173889, "epoch": 4140} {"train_loss": -7.168635368347168, "global_step": 173890, "epoch": 4140} {"train_loss": -7.014324188232422, "global_step": 173891, "epoch": 4140} {"train_loss": -6.984124183654785, "global_step": 173892, "epoch": 4140} {"train_loss": -7.055080413818359, "global_step": 173893, "epoch": 4140} {"train_loss": -7.085954189300537, "global_step": 173894, "epoch": 4140} {"train_loss": -7.133493423461914, "global_step": 173895, "epoch": 4140} {"train_loss": -7.151113033294678, "global_step": 173896, "epoch": 4140} {"train_loss": -7.107049942016602, "global_step": 173897, "epoch": 4140} {"train_loss": -7.134247779846191, "global_step": 173898, "epoch": 4140} {"train_loss": -7.070556163787842, "global_step": 173899, "epoch": 4140} {"train_loss": -7.087978363037109, "global_step": 173900, "epoch": 4140} {"train_loss": -7.050934791564941, "global_step": 173901, "epoch": 4140} {"train_loss": -7.034536361694336, "global_step": 173902, "epoch": 4140} {"train_loss": -6.972173690795898, "global_step": 173903, "epoch": 4140} {"train_loss": -6.979165077209473, "global_step": 173904, "epoch": 4140} {"train_loss": -7.114123344421387, "global_step": 173905, "epoch": 4140} {"train_loss": -7.0036444664001465, "global_step": 173906, "epoch": 4140} {"train_loss": -6.952546119689941, "global_step": 173907, "epoch": 4140} {"train_loss": -7.111830711364746, "global_step": 173908, "epoch": 4140} {"train_loss": -6.923322677612305, "global_step": 173909, "epoch": 4140} {"train_loss": -6.931375503540039, "global_step": 173910, "epoch": 4140} {"train_loss": -6.980266571044922, "global_step": 173911, "epoch": 4140} {"train_loss": -6.8583784103393555, "global_step": 173912, "epoch": 4140} {"train_loss": -7.07408332824707, "global_step": 173913, "epoch": 4140} {"train_loss": -6.967043399810791, "global_step": 173914, "epoch": 4140} {"train_loss": -6.952885150909424, "global_step": 173915, "epoch": 4140} {"train_loss": -7.074527263641357, "global_step": 173916, "epoch": 4140} {"train_loss": -6.93599271774292, "global_step": 173917, "epoch": 4140} {"train_loss": -6.96959114074707, "global_step": 173918, "epoch": 4140} {"train_loss": -7.023272514343262, "global_step": 173919, "epoch": 4140} {"train_loss": -6.997776985168457, "global_step": 173920, "epoch": 4140} {"train_loss": -7.040964603424072, "global_step": 173921, "epoch": 4140, "val_loss": 79988.453125} {"train_loss": -7.052090167999268, "global_step": 173922, "epoch": 4141} {"train_loss": -6.950536727905273, "global_step": 173923, "epoch": 4141} {"train_loss": -7.082146644592285, "global_step": 173924, "epoch": 4141} {"train_loss": -6.9951934814453125, "global_step": 173925, "epoch": 4141} {"train_loss": -6.98042106628418, "global_step": 173926, "epoch": 4141} {"train_loss": -7.062389373779297, "global_step": 173927, "epoch": 4141} {"train_loss": -7.1146392822265625, "global_step": 173928, "epoch": 4141} {"train_loss": -6.918707370758057, "global_step": 173929, "epoch": 4141} {"train_loss": -6.918540954589844, "global_step": 173930, "epoch": 4141} {"train_loss": -7.051469326019287, "global_step": 173931, "epoch": 4141} {"train_loss": -6.933492660522461, "global_step": 173932, "epoch": 4141} {"train_loss": -6.894296646118164, "global_step": 173933, "epoch": 4141} {"train_loss": -6.9811506271362305, "global_step": 173934, "epoch": 4141} {"train_loss": -7.028724670410156, "global_step": 173935, "epoch": 4141} {"train_loss": -6.972149848937988, "global_step": 173936, "epoch": 4141} {"train_loss": -7.024724960327148, "global_step": 173937, "epoch": 4141} {"train_loss": -7.031805038452148, "global_step": 173938, "epoch": 4141} {"train_loss": -7.109870910644531, "global_step": 173939, "epoch": 4141} {"train_loss": -7.040306091308594, "global_step": 173940, "epoch": 4141} {"train_loss": -7.160490989685059, "global_step": 173941, "epoch": 4141} {"train_loss": -7.082048416137695, "global_step": 173942, "epoch": 4141} {"train_loss": -6.989343166351318, "global_step": 173943, "epoch": 4141} {"train_loss": -6.96166467666626, "global_step": 173944, "epoch": 4141} {"train_loss": -7.060814380645752, "global_step": 173945, "epoch": 4141} {"train_loss": -7.0790581703186035, "global_step": 173946, "epoch": 4141} {"train_loss": -7.1302690505981445, "global_step": 173947, "epoch": 4141} {"train_loss": -7.158152103424072, "global_step": 173948, "epoch": 4141} {"train_loss": -7.0527520179748535, "global_step": 173949, "epoch": 4141} {"train_loss": -7.119447708129883, "global_step": 173950, "epoch": 4141} {"train_loss": -6.962100982666016, "global_step": 173951, "epoch": 4141} {"train_loss": -7.141422271728516, "global_step": 173952, "epoch": 4141} {"train_loss": -7.11972713470459, "global_step": 173953, "epoch": 4141} {"train_loss": -7.062124252319336, "global_step": 173954, "epoch": 4141} {"train_loss": -7.046561241149902, "global_step": 173955, "epoch": 4141} {"train_loss": -7.127197742462158, "global_step": 173956, "epoch": 4141} {"train_loss": -7.050213813781738, "global_step": 173957, "epoch": 4141} {"train_loss": -7.180556774139404, "global_step": 173958, "epoch": 4141} {"train_loss": -7.0070672035217285, "global_step": 173959, "epoch": 4141} {"train_loss": -7.108783721923828, "global_step": 173960, "epoch": 4141} {"train_loss": -7.111774921417236, "global_step": 173961, "epoch": 4141} {"train_loss": -7.050051689147949, "global_step": 173962, "epoch": 4141} {"train_loss": -7.047046309425717, "global_step": 173963, "epoch": 4141, "val_loss": 80277.28125} {"train_loss": -7.033501148223877, "global_step": 173964, "epoch": 4142} {"train_loss": -7.16758918762207, "global_step": 173965, "epoch": 4142} {"train_loss": -7.165761947631836, "global_step": 173966, "epoch": 4142} {"train_loss": -7.155919075012207, "global_step": 173967, "epoch": 4142} {"train_loss": -7.092807769775391, "global_step": 173968, "epoch": 4142} {"train_loss": -6.958698749542236, "global_step": 173969, "epoch": 4142} {"train_loss": -7.008049964904785, "global_step": 173970, "epoch": 4142} {"train_loss": -6.999362945556641, "global_step": 173971, "epoch": 4142} {"train_loss": -7.109933853149414, "global_step": 173972, "epoch": 4142} {"train_loss": -7.011509418487549, "global_step": 173973, "epoch": 4142} {"train_loss": -7.034459114074707, "global_step": 173974, "epoch": 4142} {"train_loss": -7.104856491088867, "global_step": 173975, "epoch": 4142} {"train_loss": -7.0774407386779785, "global_step": 173976, "epoch": 4142} {"train_loss": -7.027501583099365, "global_step": 173977, "epoch": 4142} {"train_loss": -7.07166862487793, "global_step": 173978, "epoch": 4142} {"train_loss": -7.0911455154418945, "global_step": 173979, "epoch": 4142} {"train_loss": -7.025881767272949, "global_step": 173980, "epoch": 4142} {"train_loss": -7.087417125701904, "global_step": 173981, "epoch": 4142} {"train_loss": -6.95297384262085, "global_step": 173982, "epoch": 4142} {"train_loss": -7.2084174156188965, "global_step": 173983, "epoch": 4142} {"train_loss": -7.068550109863281, "global_step": 173984, "epoch": 4142} {"train_loss": -7.172732353210449, "global_step": 173985, "epoch": 4142} {"train_loss": -7.129977226257324, "global_step": 173986, "epoch": 4142} {"train_loss": -7.113818645477295, "global_step": 173987, "epoch": 4142} {"train_loss": -7.175609111785889, "global_step": 173988, "epoch": 4142} {"train_loss": -7.0844621658325195, "global_step": 173989, "epoch": 4142} {"train_loss": -7.029205322265625, "global_step": 173990, "epoch": 4142} {"train_loss": -7.145352363586426, "global_step": 173991, "epoch": 4142} {"train_loss": -7.11572265625, "global_step": 173992, "epoch": 4142} {"train_loss": -6.985269069671631, "global_step": 173993, "epoch": 4142} {"train_loss": -7.173161029815674, "global_step": 173994, "epoch": 4142} {"train_loss": -7.094529628753662, "global_step": 173995, "epoch": 4142} {"train_loss": -7.083981513977051, "global_step": 173996, "epoch": 4142} {"train_loss": -7.145630836486816, "global_step": 173997, "epoch": 4142} {"train_loss": -7.029083728790283, "global_step": 173998, "epoch": 4142} {"train_loss": -7.115596771240234, "global_step": 173999, "epoch": 4142} {"train_loss": -7.236083984375, "global_step": 174000, "epoch": 4142} {"train_loss": -7.0596113204956055, "global_step": 174001, "epoch": 4142} {"train_loss": -7.090105056762695, "global_step": 174002, "epoch": 4142} {"train_loss": -6.9607768058776855, "global_step": 174003, "epoch": 4142} {"train_loss": -6.995652198791504, "global_step": 174004, "epoch": 4142} {"train_loss": -7.084247157687233, "global_step": 174005, "epoch": 4142, "val_loss": 80218.6015625} {"train_loss": -7.131576061248779, "global_step": 174006, "epoch": 4143} {"train_loss": -7.154917240142822, "global_step": 174007, "epoch": 4143} {"train_loss": -6.943881988525391, "global_step": 174008, "epoch": 4143} {"train_loss": -7.02718448638916, "global_step": 174009, "epoch": 4143} {"train_loss": -7.077244758605957, "global_step": 174010, "epoch": 4143} {"train_loss": -7.128767490386963, "global_step": 174011, "epoch": 4143} {"train_loss": -7.217131614685059, "global_step": 174012, "epoch": 4143} {"train_loss": -7.029150485992432, "global_step": 174013, "epoch": 4143} {"train_loss": -7.138317108154297, "global_step": 174014, "epoch": 4143} {"train_loss": -7.039769172668457, "global_step": 174015, "epoch": 4143} {"train_loss": -7.079670429229736, "global_step": 174016, "epoch": 4143} {"train_loss": -7.114169597625732, "global_step": 174017, "epoch": 4143} {"train_loss": -7.078609466552734, "global_step": 174018, "epoch": 4143} {"train_loss": -7.103738307952881, "global_step": 174019, "epoch": 4143} {"train_loss": -7.124212741851807, "global_step": 174020, "epoch": 4143} {"train_loss": -7.073328495025635, "global_step": 174021, "epoch": 4143} {"train_loss": -7.098387718200684, "global_step": 174022, "epoch": 4143} {"train_loss": -7.051544666290283, "global_step": 174023, "epoch": 4143} {"train_loss": -7.131443023681641, "global_step": 174024, "epoch": 4143} {"train_loss": -7.198699951171875, "global_step": 174025, "epoch": 4143} {"train_loss": -7.1389594078063965, "global_step": 174026, "epoch": 4143} {"train_loss": -7.091065406799316, "global_step": 174027, "epoch": 4143} {"train_loss": -7.104384422302246, "global_step": 174028, "epoch": 4143} {"train_loss": -7.041807174682617, "global_step": 174029, "epoch": 4143} {"train_loss": -7.186717987060547, "global_step": 174030, "epoch": 4143} {"train_loss": -7.111392021179199, "global_step": 174031, "epoch": 4143} {"train_loss": -7.076430320739746, "global_step": 174032, "epoch": 4143} {"train_loss": -7.110353946685791, "global_step": 174033, "epoch": 4143} {"train_loss": -7.1185784339904785, "global_step": 174034, "epoch": 4143} {"train_loss": -6.905751705169678, "global_step": 174035, "epoch": 4143} {"train_loss": -7.09929084777832, "global_step": 174036, "epoch": 4143} {"train_loss": -7.1429548263549805, "global_step": 174037, "epoch": 4143} {"train_loss": -7.0876312255859375, "global_step": 174038, "epoch": 4143} {"train_loss": -7.082037925720215, "global_step": 174039, "epoch": 4143} {"train_loss": -7.106723785400391, "global_step": 174040, "epoch": 4143} {"train_loss": -7.111099720001221, "global_step": 174041, "epoch": 4143} {"train_loss": -7.1378912925720215, "global_step": 174042, "epoch": 4143} {"train_loss": -7.119650840759277, "global_step": 174043, "epoch": 4143} {"train_loss": -7.221523761749268, "global_step": 174044, "epoch": 4143} {"train_loss": -7.189846992492676, "global_step": 174045, "epoch": 4143} {"train_loss": -7.08723258972168, "global_step": 174046, "epoch": 4143} {"train_loss": -7.103114718482608, "global_step": 174047, "epoch": 4143, "val_loss": 79951.328125} {"train_loss": -7.118009567260742, "global_step": 174048, "epoch": 4144} {"train_loss": -7.2362775802612305, "global_step": 174049, "epoch": 4144} {"train_loss": -7.095047950744629, "global_step": 174050, "epoch": 4144} {"train_loss": -7.093957424163818, "global_step": 174051, "epoch": 4144} {"train_loss": -7.13109016418457, "global_step": 174052, "epoch": 4144} {"train_loss": -7.107397556304932, "global_step": 174053, "epoch": 4144} {"train_loss": -7.03874397277832, "global_step": 174054, "epoch": 4144} {"train_loss": -7.156707763671875, "global_step": 174055, "epoch": 4144} {"train_loss": -7.072137832641602, "global_step": 174056, "epoch": 4144} {"train_loss": -6.927179336547852, "global_step": 174057, "epoch": 4144} {"train_loss": -6.924694538116455, "global_step": 174058, "epoch": 4144} {"train_loss": -7.0728759765625, "global_step": 174059, "epoch": 4144} {"train_loss": -6.988555431365967, "global_step": 174060, "epoch": 4144} {"train_loss": -7.041998863220215, "global_step": 174061, "epoch": 4144} {"train_loss": -7.206954002380371, "global_step": 174062, "epoch": 4144} {"train_loss": -7.034144401550293, "global_step": 174063, "epoch": 4144} {"train_loss": -7.071135520935059, "global_step": 174064, "epoch": 4144} {"train_loss": -7.05924129486084, "global_step": 174065, "epoch": 4144} {"train_loss": -7.031898498535156, "global_step": 174066, "epoch": 4144} {"train_loss": -7.033354759216309, "global_step": 174067, "epoch": 4144} {"train_loss": -7.07303524017334, "global_step": 174068, "epoch": 4144} {"train_loss": -6.943031311035156, "global_step": 174069, "epoch": 4144} {"train_loss": -7.09364652633667, "global_step": 174070, "epoch": 4144} {"train_loss": -7.069413185119629, "global_step": 174071, "epoch": 4144} {"train_loss": -7.035436630249023, "global_step": 174072, "epoch": 4144} {"train_loss": -7.130641937255859, "global_step": 174073, "epoch": 4144} {"train_loss": -7.045255184173584, "global_step": 174074, "epoch": 4144} {"train_loss": -7.062635898590088, "global_step": 174075, "epoch": 4144} {"train_loss": -6.903392791748047, "global_step": 174076, "epoch": 4144} {"train_loss": -7.0975022315979, "global_step": 174077, "epoch": 4144} {"train_loss": -7.217564582824707, "global_step": 174078, "epoch": 4144} {"train_loss": -7.192842483520508, "global_step": 174079, "epoch": 4144} {"train_loss": -6.996776580810547, "global_step": 174080, "epoch": 4144} {"train_loss": -7.144028186798096, "global_step": 174081, "epoch": 4144} {"train_loss": -7.0871663093566895, "global_step": 174082, "epoch": 4144} {"train_loss": -7.126667499542236, "global_step": 174083, "epoch": 4144} {"train_loss": -7.105992794036865, "global_step": 174084, "epoch": 4144} {"train_loss": -7.041868209838867, "global_step": 174085, "epoch": 4144} {"train_loss": -6.995217323303223, "global_step": 174086, "epoch": 4144} {"train_loss": -7.0563788414001465, "global_step": 174087, "epoch": 4144} {"train_loss": -7.070328712463379, "global_step": 174088, "epoch": 4144} {"train_loss": -7.068178017934163, "global_step": 174089, "epoch": 4144, "val_loss": 80145.7734375} {"train_loss": -7.161210536956787, "global_step": 174090, "epoch": 4145} {"train_loss": -7.126847267150879, "global_step": 174091, "epoch": 4145} {"train_loss": -7.074704170227051, "global_step": 174092, "epoch": 4145} {"train_loss": -7.063257217407227, "global_step": 174093, "epoch": 4145} {"train_loss": -7.136358261108398, "global_step": 174094, "epoch": 4145} {"train_loss": -7.028221130371094, "global_step": 174095, "epoch": 4145} {"train_loss": -7.017345428466797, "global_step": 174096, "epoch": 4145} {"train_loss": -7.044127464294434, "global_step": 174097, "epoch": 4145} {"train_loss": -6.929526329040527, "global_step": 174098, "epoch": 4145} {"train_loss": -7.001159191131592, "global_step": 174099, "epoch": 4145} {"train_loss": -6.994129180908203, "global_step": 174100, "epoch": 4145} {"train_loss": -7.130285263061523, "global_step": 174101, "epoch": 4145} {"train_loss": -7.054986476898193, "global_step": 174102, "epoch": 4145} {"train_loss": -7.0617570877075195, "global_step": 174103, "epoch": 4145} {"train_loss": -6.958603858947754, "global_step": 174104, "epoch": 4145} {"train_loss": -7.082912445068359, "global_step": 174105, "epoch": 4145} {"train_loss": -7.022357940673828, "global_step": 174106, "epoch": 4145} {"train_loss": -6.926573753356934, "global_step": 174107, "epoch": 4145} {"train_loss": -7.1342549324035645, "global_step": 174108, "epoch": 4145} {"train_loss": -7.136599540710449, "global_step": 174109, "epoch": 4145} {"train_loss": -7.168757438659668, "global_step": 174110, "epoch": 4145} {"train_loss": -7.163933277130127, "global_step": 174111, "epoch": 4145} {"train_loss": -7.17003870010376, "global_step": 174112, "epoch": 4145} {"train_loss": -7.156394004821777, "global_step": 174113, "epoch": 4145} {"train_loss": -7.009225845336914, "global_step": 174114, "epoch": 4145} {"train_loss": -7.137227535247803, "global_step": 174115, "epoch": 4145} {"train_loss": -7.0702104568481445, "global_step": 174116, "epoch": 4145} {"train_loss": -7.087126731872559, "global_step": 174117, "epoch": 4145} {"train_loss": -7.026938438415527, "global_step": 174118, "epoch": 4145} {"train_loss": -7.027973175048828, "global_step": 174119, "epoch": 4145} {"train_loss": -7.129072189331055, "global_step": 174120, "epoch": 4145} {"train_loss": -6.958880424499512, "global_step": 174121, "epoch": 4145} {"train_loss": -7.053796291351318, "global_step": 174122, "epoch": 4145} {"train_loss": -7.081699371337891, "global_step": 174123, "epoch": 4145} {"train_loss": -7.135903358459473, "global_step": 174124, "epoch": 4145} {"train_loss": -7.0109381675720215, "global_step": 174125, "epoch": 4145} {"train_loss": -7.022332191467285, "global_step": 174126, "epoch": 4145} {"train_loss": -7.020660877227783, "global_step": 174127, "epoch": 4145} {"train_loss": -7.073432922363281, "global_step": 174128, "epoch": 4145} {"train_loss": -7.063207626342773, "global_step": 174129, "epoch": 4145} {"train_loss": -7.211337089538574, "global_step": 174130, "epoch": 4145} {"train_loss": -7.070057460239956, "global_step": 174131, "epoch": 4145, "val_loss": 80122.2578125} {"train_loss": -7.09785270690918, "global_step": 174132, "epoch": 4146} {"train_loss": -7.188693046569824, "global_step": 174133, "epoch": 4146} {"train_loss": -6.953851699829102, "global_step": 174134, "epoch": 4146} {"train_loss": -6.933545112609863, "global_step": 174135, "epoch": 4146} {"train_loss": -7.07882022857666, "global_step": 174136, "epoch": 4146} {"train_loss": -7.081209182739258, "global_step": 174137, "epoch": 4146} {"train_loss": -6.928174018859863, "global_step": 174138, "epoch": 4146} {"train_loss": -7.177638053894043, "global_step": 174139, "epoch": 4146} {"train_loss": -7.179060935974121, "global_step": 174140, "epoch": 4146} {"train_loss": -6.971158027648926, "global_step": 174141, "epoch": 4146} {"train_loss": -7.052677154541016, "global_step": 174142, "epoch": 4146} {"train_loss": -7.105488300323486, "global_step": 174143, "epoch": 4146} {"train_loss": -7.109897613525391, "global_step": 174144, "epoch": 4146} {"train_loss": -7.08049201965332, "global_step": 174145, "epoch": 4146} {"train_loss": -6.934107780456543, "global_step": 174146, "epoch": 4146} {"train_loss": -7.023028373718262, "global_step": 174147, "epoch": 4146} {"train_loss": -6.994420528411865, "global_step": 174148, "epoch": 4146} {"train_loss": -7.034799575805664, "global_step": 174149, "epoch": 4146} {"train_loss": -7.054848670959473, "global_step": 174150, "epoch": 4146} {"train_loss": -6.875957489013672, "global_step": 174151, "epoch": 4146} {"train_loss": -7.152222633361816, "global_step": 174152, "epoch": 4146} {"train_loss": -7.0551910400390625, "global_step": 174153, "epoch": 4146} {"train_loss": -7.146936893463135, "global_step": 174154, "epoch": 4146} {"train_loss": -7.146128177642822, "global_step": 174155, "epoch": 4146} {"train_loss": -7.1089935302734375, "global_step": 174156, "epoch": 4146} {"train_loss": -7.079323768615723, "global_step": 174157, "epoch": 4146} {"train_loss": -7.113914489746094, "global_step": 174158, "epoch": 4146} {"train_loss": -7.0012102127075195, "global_step": 174159, "epoch": 4146} {"train_loss": -7.192404747009277, "global_step": 174160, "epoch": 4146} {"train_loss": -7.17407751083374, "global_step": 174161, "epoch": 4146} {"train_loss": -7.174578666687012, "global_step": 174162, "epoch": 4146} {"train_loss": -6.999297142028809, "global_step": 174163, "epoch": 4146} {"train_loss": -7.0722126960754395, "global_step": 174164, "epoch": 4146} {"train_loss": -7.196421146392822, "global_step": 174165, "epoch": 4146} {"train_loss": -7.138601303100586, "global_step": 174166, "epoch": 4146} {"train_loss": -7.108432769775391, "global_step": 174167, "epoch": 4146} {"train_loss": -7.151142120361328, "global_step": 174168, "epoch": 4146} {"train_loss": -7.051105499267578, "global_step": 174169, "epoch": 4146} {"train_loss": -7.074368476867676, "global_step": 174170, "epoch": 4146} {"train_loss": -7.03949499130249, "global_step": 174171, "epoch": 4146} {"train_loss": -7.0640363693237305, "global_step": 174172, "epoch": 4146} {"train_loss": -7.073356185640607, "global_step": 174173, "epoch": 4146, "val_loss": 80027.3125} {"train_loss": -7.032696723937988, "global_step": 174174, "epoch": 4147} {"train_loss": -7.175562381744385, "global_step": 174175, "epoch": 4147} {"train_loss": -7.150202751159668, "global_step": 174176, "epoch": 4147} {"train_loss": -7.073823928833008, "global_step": 174177, "epoch": 4147} {"train_loss": -7.199014663696289, "global_step": 174178, "epoch": 4147} {"train_loss": -7.126972198486328, "global_step": 174179, "epoch": 4147} {"train_loss": -7.199322700500488, "global_step": 174180, "epoch": 4147} {"train_loss": -7.105849742889404, "global_step": 174181, "epoch": 4147} {"train_loss": -7.057858467102051, "global_step": 174182, "epoch": 4147} {"train_loss": -7.219264507293701, "global_step": 174183, "epoch": 4147} {"train_loss": -7.172223091125488, "global_step": 174184, "epoch": 4147} {"train_loss": -7.145346641540527, "global_step": 174185, "epoch": 4147} {"train_loss": -7.114614963531494, "global_step": 174186, "epoch": 4147} {"train_loss": -7.075713157653809, "global_step": 174187, "epoch": 4147} {"train_loss": -7.084929943084717, "global_step": 174188, "epoch": 4147} {"train_loss": -7.069436073303223, "global_step": 174189, "epoch": 4147} {"train_loss": -7.1439738273620605, "global_step": 174190, "epoch": 4147} {"train_loss": -7.130096912384033, "global_step": 174191, "epoch": 4147} {"train_loss": -7.211201190948486, "global_step": 174192, "epoch": 4147} {"train_loss": -7.197259426116943, "global_step": 174193, "epoch": 4147} {"train_loss": -7.077650547027588, "global_step": 174194, "epoch": 4147} {"train_loss": -7.181793212890625, "global_step": 174195, "epoch": 4147} {"train_loss": -7.106353759765625, "global_step": 174196, "epoch": 4147} {"train_loss": -7.1254191398620605, "global_step": 174197, "epoch": 4147} {"train_loss": -7.156791687011719, "global_step": 174198, "epoch": 4147} {"train_loss": -7.110807418823242, "global_step": 174199, "epoch": 4147} {"train_loss": -7.059473514556885, "global_step": 174200, "epoch": 4147} {"train_loss": -6.999326705932617, "global_step": 174201, "epoch": 4147} {"train_loss": -7.052429676055908, "global_step": 174202, "epoch": 4147} {"train_loss": -6.973148345947266, "global_step": 174203, "epoch": 4147} {"train_loss": -7.064465045928955, "global_step": 174204, "epoch": 4147} {"train_loss": -7.015466690063477, "global_step": 174205, "epoch": 4147} {"train_loss": -7.153738975524902, "global_step": 174206, "epoch": 4147} {"train_loss": -7.020909309387207, "global_step": 174207, "epoch": 4147} {"train_loss": -7.088715553283691, "global_step": 174208, "epoch": 4147} {"train_loss": -7.099645614624023, "global_step": 174209, "epoch": 4147} {"train_loss": -7.017648696899414, "global_step": 174210, "epoch": 4147} {"train_loss": -7.067285537719727, "global_step": 174211, "epoch": 4147} {"train_loss": -7.036494255065918, "global_step": 174212, "epoch": 4147} {"train_loss": -7.0787811279296875, "global_step": 174213, "epoch": 4147} {"train_loss": -6.974066734313965, "global_step": 174214, "epoch": 4147} {"train_loss": -7.100125063033331, "global_step": 174215, "epoch": 4147, "val_loss": 80033.984375} {"train_loss": -7.110658168792725, "global_step": 174216, "epoch": 4148} {"train_loss": -6.952056884765625, "global_step": 174217, "epoch": 4148} {"train_loss": -7.172420024871826, "global_step": 174218, "epoch": 4148} {"train_loss": -7.110182285308838, "global_step": 174219, "epoch": 4148} {"train_loss": -7.014232635498047, "global_step": 174220, "epoch": 4148} {"train_loss": -7.057796478271484, "global_step": 174221, "epoch": 4148} {"train_loss": -7.091996192932129, "global_step": 174222, "epoch": 4148} {"train_loss": -7.068626880645752, "global_step": 174223, "epoch": 4148} {"train_loss": -7.121482849121094, "global_step": 174224, "epoch": 4148} {"train_loss": -7.0147247314453125, "global_step": 174225, "epoch": 4148} {"train_loss": -7.092803001403809, "global_step": 174226, "epoch": 4148} {"train_loss": -7.1619462966918945, "global_step": 174227, "epoch": 4148} {"train_loss": -7.057140350341797, "global_step": 174228, "epoch": 4148} {"train_loss": -7.127978801727295, "global_step": 174229, "epoch": 4148} {"train_loss": -6.967035293579102, "global_step": 174230, "epoch": 4148} {"train_loss": -7.049602508544922, "global_step": 174231, "epoch": 4148} {"train_loss": -7.118562698364258, "global_step": 174232, "epoch": 4148} {"train_loss": -6.9818878173828125, "global_step": 174233, "epoch": 4148} {"train_loss": -7.034970283508301, "global_step": 174234, "epoch": 4148} {"train_loss": -7.018132209777832, "global_step": 174235, "epoch": 4148} {"train_loss": -7.0709757804870605, "global_step": 174236, "epoch": 4148} {"train_loss": -7.020937919616699, "global_step": 174237, "epoch": 4148} {"train_loss": -7.070908546447754, "global_step": 174238, "epoch": 4148} {"train_loss": -7.185774803161621, "global_step": 174239, "epoch": 4148} {"train_loss": -6.992517948150635, "global_step": 174240, "epoch": 4148} {"train_loss": -7.017685413360596, "global_step": 174241, "epoch": 4148} {"train_loss": -7.229579925537109, "global_step": 174242, "epoch": 4148} {"train_loss": -7.151364326477051, "global_step": 174243, "epoch": 4148} {"train_loss": -7.0102643966674805, "global_step": 174244, "epoch": 4148} {"train_loss": -7.016076564788818, "global_step": 174245, "epoch": 4148} {"train_loss": -7.110433578491211, "global_step": 174246, "epoch": 4148} {"train_loss": -7.152910232543945, "global_step": 174247, "epoch": 4148} {"train_loss": -7.136414051055908, "global_step": 174248, "epoch": 4148} {"train_loss": -7.103782653808594, "global_step": 174249, "epoch": 4148} {"train_loss": -7.005801200866699, "global_step": 174250, "epoch": 4148} {"train_loss": -7.161317348480225, "global_step": 174251, "epoch": 4148} {"train_loss": -7.0187249183654785, "global_step": 174252, "epoch": 4148} {"train_loss": -7.059023857116699, "global_step": 174253, "epoch": 4148} {"train_loss": -7.193222999572754, "global_step": 174254, "epoch": 4148} {"train_loss": -7.056884288787842, "global_step": 174255, "epoch": 4148} {"train_loss": -7.003897190093994, "global_step": 174256, "epoch": 4148} {"train_loss": -7.071986028126308, "global_step": 174257, "epoch": 4148, "val_loss": 80150.921875} {"train_loss": -7.048853874206543, "global_step": 174258, "epoch": 4149} {"train_loss": -7.141026973724365, "global_step": 174259, "epoch": 4149} {"train_loss": -6.970433235168457, "global_step": 174260, "epoch": 4149} {"train_loss": -7.128086090087891, "global_step": 174261, "epoch": 4149} {"train_loss": -7.114811897277832, "global_step": 174262, "epoch": 4149} {"train_loss": -7.042595863342285, "global_step": 174263, "epoch": 4149} {"train_loss": -7.0693206787109375, "global_step": 174264, "epoch": 4149} {"train_loss": -7.125539779663086, "global_step": 174265, "epoch": 4149} {"train_loss": -7.012505531311035, "global_step": 174266, "epoch": 4149} {"train_loss": -7.223083972930908, "global_step": 174267, "epoch": 4149} {"train_loss": -7.231829643249512, "global_step": 174268, "epoch": 4149} {"train_loss": -7.231191158294678, "global_step": 174269, "epoch": 4149} {"train_loss": -7.247550964355469, "global_step": 174270, "epoch": 4149} {"train_loss": -7.142189025878906, "global_step": 174271, "epoch": 4149} {"train_loss": -7.17718505859375, "global_step": 174272, "epoch": 4149} {"train_loss": -7.062700271606445, "global_step": 174273, "epoch": 4149} {"train_loss": -7.104891777038574, "global_step": 174274, "epoch": 4149} {"train_loss": -7.168006420135498, "global_step": 174275, "epoch": 4149} {"train_loss": -7.089079856872559, "global_step": 174276, "epoch": 4149} {"train_loss": -7.090295791625977, "global_step": 174277, "epoch": 4149} {"train_loss": -7.121102809906006, "global_step": 174278, "epoch": 4149} {"train_loss": -7.157321929931641, "global_step": 174279, "epoch": 4149} {"train_loss": -7.15419340133667, "global_step": 174280, "epoch": 4149} {"train_loss": -7.069751739501953, "global_step": 174281, "epoch": 4149} {"train_loss": -7.052229881286621, "global_step": 174282, "epoch": 4149} {"train_loss": -7.085351943969727, "global_step": 174283, "epoch": 4149} {"train_loss": -7.066943645477295, "global_step": 174284, "epoch": 4149} {"train_loss": -7.149497032165527, "global_step": 174285, "epoch": 4149} {"train_loss": -7.145263671875, "global_step": 174286, "epoch": 4149} {"train_loss": -7.0696492195129395, "global_step": 174287, "epoch": 4149} {"train_loss": -7.035669326782227, "global_step": 174288, "epoch": 4149} {"train_loss": -7.137606143951416, "global_step": 174289, "epoch": 4149} {"train_loss": -7.132162570953369, "global_step": 174290, "epoch": 4149} {"train_loss": -6.996039867401123, "global_step": 174291, "epoch": 4149} {"train_loss": -7.095664024353027, "global_step": 174292, "epoch": 4149} {"train_loss": -7.019294738769531, "global_step": 174293, "epoch": 4149} {"train_loss": -7.087462425231934, "global_step": 174294, "epoch": 4149} {"train_loss": -7.040177345275879, "global_step": 174295, "epoch": 4149} {"train_loss": -7.175318717956543, "global_step": 174296, "epoch": 4149} {"train_loss": -7.1359944343566895, "global_step": 174297, "epoch": 4149} {"train_loss": -6.95003080368042, "global_step": 174298, "epoch": 4149} {"train_loss": -7.104727041153681, "global_step": 174299, "epoch": 4149, "val_loss": 80249.6328125} {"train_loss": -7.115102291107178, "global_step": 174300, "epoch": 4150} {"train_loss": -7.0779218673706055, "global_step": 174301, "epoch": 4150} {"train_loss": -7.044198989868164, "global_step": 174302, "epoch": 4150} {"train_loss": -7.155758857727051, "global_step": 174303, "epoch": 4150} {"train_loss": -7.145340919494629, "global_step": 174304, "epoch": 4150} {"train_loss": -7.0545654296875, "global_step": 174305, "epoch": 4150} {"train_loss": -7.058891296386719, "global_step": 174306, "epoch": 4150} {"train_loss": -6.974893093109131, "global_step": 174307, "epoch": 4150} {"train_loss": -7.0897722244262695, "global_step": 174308, "epoch": 4150} {"train_loss": -7.034772872924805, "global_step": 174309, "epoch": 4150} {"train_loss": -7.150139808654785, "global_step": 174310, "epoch": 4150} {"train_loss": -7.034549236297607, "global_step": 174311, "epoch": 4150} {"train_loss": -7.077358245849609, "global_step": 174312, "epoch": 4150} {"train_loss": -7.138425827026367, "global_step": 174313, "epoch": 4150} {"train_loss": -7.026129722595215, "global_step": 174314, "epoch": 4150} {"train_loss": -7.161677360534668, "global_step": 174315, "epoch": 4150} {"train_loss": -7.159687519073486, "global_step": 174316, "epoch": 4150} {"train_loss": -7.000844955444336, "global_step": 174317, "epoch": 4150} {"train_loss": -7.034303665161133, "global_step": 174318, "epoch": 4150} {"train_loss": -7.096474647521973, "global_step": 174319, "epoch": 4150} {"train_loss": -7.045468807220459, "global_step": 174320, "epoch": 4150} {"train_loss": -7.081496715545654, "global_step": 174321, "epoch": 4150} {"train_loss": -6.999288558959961, "global_step": 174322, "epoch": 4150} {"train_loss": -7.111562728881836, "global_step": 174323, "epoch": 4150} {"train_loss": -7.178106784820557, "global_step": 174324, "epoch": 4150} {"train_loss": -7.069803714752197, "global_step": 174325, "epoch": 4150} {"train_loss": -7.103745460510254, "global_step": 174326, "epoch": 4150} {"train_loss": -7.027523040771484, "global_step": 174327, "epoch": 4150} {"train_loss": -7.068255424499512, "global_step": 174328, "epoch": 4150} {"train_loss": -7.094635009765625, "global_step": 174329, "epoch": 4150} {"train_loss": -7.087571144104004, "global_step": 174330, "epoch": 4150} {"train_loss": -6.980381011962891, "global_step": 174331, "epoch": 4150} {"train_loss": -7.172610282897949, "global_step": 174332, "epoch": 4150} {"train_loss": -7.148780345916748, "global_step": 174333, "epoch": 4150} {"train_loss": -7.114955902099609, "global_step": 174334, "epoch": 4150} {"train_loss": -7.067238807678223, "global_step": 174335, "epoch": 4150} {"train_loss": -7.081501483917236, "global_step": 174336, "epoch": 4150} {"train_loss": -7.126603603363037, "global_step": 174337, "epoch": 4150} {"train_loss": -7.1141462326049805, "global_step": 174338, "epoch": 4150} {"train_loss": -7.099287986755371, "global_step": 174339, "epoch": 4150} {"train_loss": -7.051713943481445, "global_step": 174340, "epoch": 4150} {"train_loss": -7.085806403841291, "global_step": 174341, "epoch": 4150, "train/sim_max_reward_0": 0.19683335853847353, "train/sim_max_reward_1": 0.9271751163626182, "train/sim_max_reward_2": 0.4861174066584397, "train/sim_max_reward_3": 1.0, "train/sim_max_reward_4": 0.9676646594577716, "train/sim_max_reward_5": 0.935699114053431, "test/sim_max_reward_4500000": 0.9117417993829081, "test/sim_max_reward_4500001": 0.3201447913089219, "test/sim_max_reward_4500002": 0.9482958974108141, "test/sim_max_reward_4500003": 0.7664349619576628, "test/sim_max_reward_4500004": 0.23313114076654418, "test/sim_max_reward_4500005": 0.8443045141857882, "test/sim_max_reward_4500006": 0.9094197453439518, "test/sim_max_reward_4500007": 0.9354412159852733, "test/sim_max_reward_4500008": 0.9281979508663711, "test/sim_max_reward_4500009": 0.0531996532868105, "test/sim_max_reward_4500010": 0.005450436644204359, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 0.8591100705155819, "test/sim_max_reward_4500013": 0.0034759328969964014, "test/sim_max_reward_4500014": 0.9404795627877883, "test/sim_max_reward_4500015": 0.9763106191697639, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.09361956204647462, "test/sim_max_reward_4500018": 0.995135901831888, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9688032539708015, "test/sim_max_reward_4500022": 0.9196746703848937, "test/sim_max_reward_4500023": 0.9841035079661652, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.858598959903245, "test/sim_max_reward_4500026": 0.8756248119532969, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.13836885338729218, "test/sim_max_reward_4500030": 0.9438071244009903, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.7973220688617848, "test/sim_max_reward_4500034": 0.9530093154974963, "test/sim_max_reward_4500035": 0.8364816746871032, "test/sim_max_reward_4500036": 0.9864283784187948, "test/sim_max_reward_4500037": 0.8898063657913634, "test/sim_max_reward_4500038": 0.34797897479305206, "test/sim_max_reward_4500039": 0.7386701710239982, "test/sim_max_reward_4500040": 0.9819812352477661, "test/sim_max_reward_4500041": 0.9255964536505834, "test/sim_max_reward_4500042": 0.04929865283095395, "test/sim_max_reward_4500043": 0.3559601526910766, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.958779678621933, "test/sim_max_reward_4500046": 0.23468396196205432, "test/sim_max_reward_4500047": 0.9312252993200443, "test/sim_max_reward_4500048": 0.977075923591101, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.7522482758451222, "test/mean_score": 0.6130368800488608, "val_loss": 79707.625} {"train_loss": -6.958594799041748, "global_step": 174342, "epoch": 4151} {"train_loss": -6.9751715660095215, "global_step": 174343, "epoch": 4151} {"train_loss": -6.882720947265625, "global_step": 174344, "epoch": 4151} {"train_loss": -7.095097541809082, "global_step": 174345, "epoch": 4151} {"train_loss": -7.041298866271973, "global_step": 174346, "epoch": 4151} {"train_loss": -7.11065149307251, "global_step": 174347, "epoch": 4151} {"train_loss": -6.997348785400391, "global_step": 174348, "epoch": 4151} {"train_loss": -6.924283027648926, "global_step": 174349, "epoch": 4151} {"train_loss": -6.956745624542236, "global_step": 174350, "epoch": 4151} {"train_loss": -6.898846626281738, "global_step": 174351, "epoch": 4151} {"train_loss": -7.100329399108887, "global_step": 174352, "epoch": 4151} {"train_loss": -6.80994176864624, "global_step": 174353, "epoch": 4151} {"train_loss": -6.921485900878906, "global_step": 174354, "epoch": 4151} {"train_loss": -6.950000286102295, "global_step": 174355, "epoch": 4151} {"train_loss": -6.9874396324157715, "global_step": 174356, "epoch": 4151} {"train_loss": -6.907031536102295, "global_step": 174357, "epoch": 4151} {"train_loss": -6.917978286743164, "global_step": 174358, "epoch": 4151} {"train_loss": -6.991048336029053, "global_step": 174359, "epoch": 4151} {"train_loss": -6.911284923553467, "global_step": 174360, "epoch": 4151} {"train_loss": -7.093411445617676, "global_step": 174361, "epoch": 4151} {"train_loss": -6.929546356201172, "global_step": 174362, "epoch": 4151} {"train_loss": -6.994478225708008, "global_step": 174363, "epoch": 4151} {"train_loss": -7.02536678314209, "global_step": 174364, "epoch": 4151} {"train_loss": -7.007055759429932, "global_step": 174365, "epoch": 4151} {"train_loss": -6.944077491760254, "global_step": 174366, "epoch": 4151} {"train_loss": -7.031059265136719, "global_step": 174367, "epoch": 4151} {"train_loss": -7.130519390106201, "global_step": 174368, "epoch": 4151} {"train_loss": -6.862540245056152, "global_step": 174369, "epoch": 4151} {"train_loss": -7.008116245269775, "global_step": 174370, "epoch": 4151} {"train_loss": -7.07286262512207, "global_step": 174371, "epoch": 4151} {"train_loss": -6.994302749633789, "global_step": 174372, "epoch": 4151} {"train_loss": -7.130880355834961, "global_step": 174373, "epoch": 4151} {"train_loss": -7.106133460998535, "global_step": 174374, "epoch": 4151} {"train_loss": -7.047924041748047, "global_step": 174375, "epoch": 4151} {"train_loss": -7.029131889343262, "global_step": 174376, "epoch": 4151} {"train_loss": -7.029460430145264, "global_step": 174377, "epoch": 4151} {"train_loss": -7.085707664489746, "global_step": 174378, "epoch": 4151} {"train_loss": -7.150717258453369, "global_step": 174379, "epoch": 4151} {"train_loss": -6.940673828125, "global_step": 174380, "epoch": 4151} {"train_loss": -7.230896949768066, "global_step": 174381, "epoch": 4151} {"train_loss": -7.012689590454102, "global_step": 174382, "epoch": 4151} {"train_loss": -7.006322031929379, "global_step": 174383, "epoch": 4151, "val_loss": 79936.8046875} {"train_loss": -7.086068153381348, "global_step": 174384, "epoch": 4152} {"train_loss": -7.114833831787109, "global_step": 174385, "epoch": 4152} {"train_loss": -7.007434844970703, "global_step": 174386, "epoch": 4152} {"train_loss": -7.091527462005615, "global_step": 174387, "epoch": 4152} {"train_loss": -7.174674987792969, "global_step": 174388, "epoch": 4152} {"train_loss": -7.117824554443359, "global_step": 174389, "epoch": 4152} {"train_loss": -7.226161003112793, "global_step": 174390, "epoch": 4152} {"train_loss": -7.219173431396484, "global_step": 174391, "epoch": 4152} {"train_loss": -7.036616325378418, "global_step": 174392, "epoch": 4152} {"train_loss": -7.143492698669434, "global_step": 174393, "epoch": 4152} {"train_loss": -7.19305944442749, "global_step": 174394, "epoch": 4152} {"train_loss": -6.9121317863464355, "global_step": 174395, "epoch": 4152} {"train_loss": -7.010427474975586, "global_step": 174396, "epoch": 4152} {"train_loss": -7.007828712463379, "global_step": 174397, "epoch": 4152} {"train_loss": -7.009190559387207, "global_step": 174398, "epoch": 4152} {"train_loss": -7.144085884094238, "global_step": 174399, "epoch": 4152} {"train_loss": -6.916575908660889, "global_step": 174400, "epoch": 4152} {"train_loss": -7.027587413787842, "global_step": 174401, "epoch": 4152} {"train_loss": -7.0233001708984375, "global_step": 174402, "epoch": 4152} {"train_loss": -6.984797954559326, "global_step": 174403, "epoch": 4152} {"train_loss": -7.122080326080322, "global_step": 174404, "epoch": 4152} {"train_loss": -6.988476753234863, "global_step": 174405, "epoch": 4152} {"train_loss": -6.985936164855957, "global_step": 174406, "epoch": 4152} {"train_loss": -7.096518516540527, "global_step": 174407, "epoch": 4152} {"train_loss": -7.093597888946533, "global_step": 174408, "epoch": 4152} {"train_loss": -7.130667209625244, "global_step": 174409, "epoch": 4152} {"train_loss": -7.05092716217041, "global_step": 174410, "epoch": 4152} {"train_loss": -7.015951156616211, "global_step": 174411, "epoch": 4152} {"train_loss": -7.088754177093506, "global_step": 174412, "epoch": 4152} {"train_loss": -7.154289722442627, "global_step": 174413, "epoch": 4152} {"train_loss": -7.180689811706543, "global_step": 174414, "epoch": 4152} {"train_loss": -7.15103816986084, "global_step": 174415, "epoch": 4152} {"train_loss": -7.040037155151367, "global_step": 174416, "epoch": 4152} {"train_loss": -7.093883514404297, "global_step": 174417, "epoch": 4152} {"train_loss": -7.002862453460693, "global_step": 174418, "epoch": 4152} {"train_loss": -6.999060153961182, "global_step": 174419, "epoch": 4152} {"train_loss": -7.158397197723389, "global_step": 174420, "epoch": 4152} {"train_loss": -7.131227493286133, "global_step": 174421, "epoch": 4152} {"train_loss": -7.070795059204102, "global_step": 174422, "epoch": 4152} {"train_loss": -7.083049774169922, "global_step": 174423, "epoch": 4152} {"train_loss": -6.986325263977051, "global_step": 174424, "epoch": 4152} {"train_loss": -7.074920245579311, "global_step": 174425, "epoch": 4152, "val_loss": 80274.3359375} {"train_loss": -7.164922714233398, "global_step": 174426, "epoch": 4153} {"train_loss": -7.058732986450195, "global_step": 174427, "epoch": 4153} {"train_loss": -7.156774997711182, "global_step": 174428, "epoch": 4153} {"train_loss": -7.146361351013184, "global_step": 174429, "epoch": 4153} {"train_loss": -7.14755916595459, "global_step": 174430, "epoch": 4153} {"train_loss": -7.182343006134033, "global_step": 174431, "epoch": 4153} {"train_loss": -7.064424514770508, "global_step": 174432, "epoch": 4153} {"train_loss": -7.071989059448242, "global_step": 174433, "epoch": 4153} {"train_loss": -7.134086608886719, "global_step": 174434, "epoch": 4153} {"train_loss": -7.029559135437012, "global_step": 174435, "epoch": 4153} {"train_loss": -7.107415676116943, "global_step": 174436, "epoch": 4153} {"train_loss": -7.169486999511719, "global_step": 174437, "epoch": 4153} {"train_loss": -7.076438903808594, "global_step": 174438, "epoch": 4153} {"train_loss": -6.960781097412109, "global_step": 174439, "epoch": 4153} {"train_loss": -7.172296047210693, "global_step": 174440, "epoch": 4153} {"train_loss": -7.021730422973633, "global_step": 174441, "epoch": 4153} {"train_loss": -7.058956146240234, "global_step": 174442, "epoch": 4153} {"train_loss": -7.132382392883301, "global_step": 174443, "epoch": 4153} {"train_loss": -7.006019115447998, "global_step": 174444, "epoch": 4153} {"train_loss": -6.9205217361450195, "global_step": 174445, "epoch": 4153} {"train_loss": -7.074896812438965, "global_step": 174446, "epoch": 4153} {"train_loss": -7.121763229370117, "global_step": 174447, "epoch": 4153} {"train_loss": -7.003604888916016, "global_step": 174448, "epoch": 4153} {"train_loss": -7.207637786865234, "global_step": 174449, "epoch": 4153} {"train_loss": -6.94984245300293, "global_step": 174450, "epoch": 4153} {"train_loss": -7.076407432556152, "global_step": 174451, "epoch": 4153} {"train_loss": -7.03367805480957, "global_step": 174452, "epoch": 4153} {"train_loss": -7.125218868255615, "global_step": 174453, "epoch": 4153} {"train_loss": -6.98343563079834, "global_step": 174454, "epoch": 4153} {"train_loss": -7.1787214279174805, "global_step": 174455, "epoch": 4153} {"train_loss": -7.139240264892578, "global_step": 174456, "epoch": 4153} {"train_loss": -7.164287090301514, "global_step": 174457, "epoch": 4153} {"train_loss": -7.064882278442383, "global_step": 174458, "epoch": 4153} {"train_loss": -7.139651298522949, "global_step": 174459, "epoch": 4153} {"train_loss": -7.007412910461426, "global_step": 174460, "epoch": 4153} {"train_loss": -7.037449836730957, "global_step": 174461, "epoch": 4153} {"train_loss": -7.133528709411621, "global_step": 174462, "epoch": 4153} {"train_loss": -7.132030963897705, "global_step": 174463, "epoch": 4153} {"train_loss": -7.151424407958984, "global_step": 174464, "epoch": 4153} {"train_loss": -7.18726921081543, "global_step": 174465, "epoch": 4153} {"train_loss": -7.080740451812744, "global_step": 174466, "epoch": 4153} {"train_loss": -7.091221934273129, "global_step": 174467, "epoch": 4153, "val_loss": 80099.6953125} {"train_loss": -7.131330490112305, "global_step": 174468, "epoch": 4154} {"train_loss": -7.1522932052612305, "global_step": 174469, "epoch": 4154} {"train_loss": -7.142958164215088, "global_step": 174470, "epoch": 4154} {"train_loss": -7.063902378082275, "global_step": 174471, "epoch": 4154} {"train_loss": -7.139996528625488, "global_step": 174472, "epoch": 4154} {"train_loss": -7.040624141693115, "global_step": 174473, "epoch": 4154} {"train_loss": -7.055942535400391, "global_step": 174474, "epoch": 4154} {"train_loss": -7.1437225341796875, "global_step": 174475, "epoch": 4154} {"train_loss": -7.032994270324707, "global_step": 174476, "epoch": 4154} {"train_loss": -7.1303791999816895, "global_step": 174477, "epoch": 4154} {"train_loss": -7.0766777992248535, "global_step": 174478, "epoch": 4154} {"train_loss": -7.122699737548828, "global_step": 174479, "epoch": 4154} {"train_loss": -7.006014347076416, "global_step": 174480, "epoch": 4154} {"train_loss": -7.1131367683410645, "global_step": 174481, "epoch": 4154} {"train_loss": -7.0976996421813965, "global_step": 174482, "epoch": 4154} {"train_loss": -7.030647277832031, "global_step": 174483, "epoch": 4154} {"train_loss": -7.143326759338379, "global_step": 174484, "epoch": 4154} {"train_loss": -7.08541202545166, "global_step": 174485, "epoch": 4154} {"train_loss": -6.978838920593262, "global_step": 174486, "epoch": 4154} {"train_loss": -7.181271553039551, "global_step": 174487, "epoch": 4154} {"train_loss": -7.030061721801758, "global_step": 174488, "epoch": 4154} {"train_loss": -7.034869194030762, "global_step": 174489, "epoch": 4154} {"train_loss": -7.13484001159668, "global_step": 174490, "epoch": 4154} {"train_loss": -7.152507305145264, "global_step": 174491, "epoch": 4154} {"train_loss": -7.158000469207764, "global_step": 174492, "epoch": 4154} {"train_loss": -7.033430099487305, "global_step": 174493, "epoch": 4154} {"train_loss": -7.122356414794922, "global_step": 174494, "epoch": 4154} {"train_loss": -7.018429756164551, "global_step": 174495, "epoch": 4154} {"train_loss": -7.111815929412842, "global_step": 174496, "epoch": 4154} {"train_loss": -7.144032001495361, "global_step": 174497, "epoch": 4154} {"train_loss": -7.103330612182617, "global_step": 174498, "epoch": 4154} {"train_loss": -7.064378261566162, "global_step": 174499, "epoch": 4154} {"train_loss": -7.234192371368408, "global_step": 174500, "epoch": 4154} {"train_loss": -6.977529525756836, "global_step": 174501, "epoch": 4154} {"train_loss": -7.016366481781006, "global_step": 174502, "epoch": 4154} {"train_loss": -7.089428901672363, "global_step": 174503, "epoch": 4154} {"train_loss": -7.1874470710754395, "global_step": 174504, "epoch": 4154} {"train_loss": -7.110187530517578, "global_step": 174505, "epoch": 4154} {"train_loss": -7.184936046600342, "global_step": 174506, "epoch": 4154} {"train_loss": -7.070891857147217, "global_step": 174507, "epoch": 4154} {"train_loss": -7.063692092895508, "global_step": 174508, "epoch": 4154} {"train_loss": -7.094535248620169, "global_step": 174509, "epoch": 4154, "val_loss": 80262.7734375} {"train_loss": -7.1097869873046875, "global_step": 174510, "epoch": 4155} {"train_loss": -7.115520477294922, "global_step": 174511, "epoch": 4155} {"train_loss": -7.164080619812012, "global_step": 174512, "epoch": 4155} {"train_loss": -7.183670997619629, "global_step": 174513, "epoch": 4155} {"train_loss": -7.216716766357422, "global_step": 174514, "epoch": 4155} {"train_loss": -7.162607192993164, "global_step": 174515, "epoch": 4155} {"train_loss": -7.187132358551025, "global_step": 174516, "epoch": 4155} {"train_loss": -7.150395393371582, "global_step": 174517, "epoch": 4155} {"train_loss": -7.207558631896973, "global_step": 174518, "epoch": 4155} {"train_loss": -6.918522834777832, "global_step": 174519, "epoch": 4155} {"train_loss": -7.076290130615234, "global_step": 174520, "epoch": 4155} {"train_loss": -7.049652576446533, "global_step": 174521, "epoch": 4155} {"train_loss": -7.034127235412598, "global_step": 174522, "epoch": 4155} {"train_loss": -7.026290416717529, "global_step": 174523, "epoch": 4155} {"train_loss": -7.107172012329102, "global_step": 174524, "epoch": 4155} {"train_loss": -7.057199478149414, "global_step": 174525, "epoch": 4155} {"train_loss": -6.978470802307129, "global_step": 174526, "epoch": 4155} {"train_loss": -7.061301231384277, "global_step": 174527, "epoch": 4155} {"train_loss": -7.046320915222168, "global_step": 174528, "epoch": 4155} {"train_loss": -6.985626220703125, "global_step": 174529, "epoch": 4155} {"train_loss": -6.941163063049316, "global_step": 174530, "epoch": 4155} {"train_loss": -7.039474964141846, "global_step": 174531, "epoch": 4155} {"train_loss": -7.107556343078613, "global_step": 174532, "epoch": 4155} {"train_loss": -6.921954154968262, "global_step": 174533, "epoch": 4155} {"train_loss": -7.005141258239746, "global_step": 174534, "epoch": 4155} {"train_loss": -6.8704514503479, "global_step": 174535, "epoch": 4155} {"train_loss": -7.015486717224121, "global_step": 174536, "epoch": 4155} {"train_loss": -7.037553787231445, "global_step": 174537, "epoch": 4155} {"train_loss": -6.967673301696777, "global_step": 174538, "epoch": 4155} {"train_loss": -7.036547660827637, "global_step": 174539, "epoch": 4155} {"train_loss": -6.948704719543457, "global_step": 174540, "epoch": 4155} {"train_loss": -6.982405662536621, "global_step": 174541, "epoch": 4155} {"train_loss": -6.986445426940918, "global_step": 174542, "epoch": 4155} {"train_loss": -7.099167346954346, "global_step": 174543, "epoch": 4155} {"train_loss": -6.912237167358398, "global_step": 174544, "epoch": 4155} {"train_loss": -6.9805521965026855, "global_step": 174545, "epoch": 4155} {"train_loss": -7.095666885375977, "global_step": 174546, "epoch": 4155} {"train_loss": -6.989806652069092, "global_step": 174547, "epoch": 4155} {"train_loss": -7.111267566680908, "global_step": 174548, "epoch": 4155} {"train_loss": -6.988272190093994, "global_step": 174549, "epoch": 4155} {"train_loss": -7.134980201721191, "global_step": 174550, "epoch": 4155} {"train_loss": -7.04785882859003, "global_step": 174551, "epoch": 4155, "val_loss": 80145.5859375} {"train_loss": -6.98861026763916, "global_step": 174552, "epoch": 4156} {"train_loss": -6.984292030334473, "global_step": 174553, "epoch": 4156} {"train_loss": -6.970654487609863, "global_step": 174554, "epoch": 4156} {"train_loss": -7.09683895111084, "global_step": 174555, "epoch": 4156} {"train_loss": -7.047693729400635, "global_step": 174556, "epoch": 4156} {"train_loss": -7.12600040435791, "global_step": 174557, "epoch": 4156} {"train_loss": -6.989676475524902, "global_step": 174558, "epoch": 4156} {"train_loss": -7.020133972167969, "global_step": 174559, "epoch": 4156} {"train_loss": -7.024747848510742, "global_step": 174560, "epoch": 4156} {"train_loss": -6.980725288391113, "global_step": 174561, "epoch": 4156} {"train_loss": -7.116436958312988, "global_step": 174562, "epoch": 4156} {"train_loss": -7.08193302154541, "global_step": 174563, "epoch": 4156} {"train_loss": -7.032498359680176, "global_step": 174564, "epoch": 4156} {"train_loss": -7.081026554107666, "global_step": 174565, "epoch": 4156} {"train_loss": -6.97850227355957, "global_step": 174566, "epoch": 4156} {"train_loss": -7.048788070678711, "global_step": 174567, "epoch": 4156} {"train_loss": -7.0903639793396, "global_step": 174568, "epoch": 4156} {"train_loss": -7.051731109619141, "global_step": 174569, "epoch": 4156} {"train_loss": -7.058451175689697, "global_step": 174570, "epoch": 4156} {"train_loss": -7.128902435302734, "global_step": 174571, "epoch": 4156} {"train_loss": -7.117936134338379, "global_step": 174572, "epoch": 4156} {"train_loss": -7.050909996032715, "global_step": 174573, "epoch": 4156} {"train_loss": -7.084894180297852, "global_step": 174574, "epoch": 4156} {"train_loss": -7.080731391906738, "global_step": 174575, "epoch": 4156} {"train_loss": -7.110996246337891, "global_step": 174576, "epoch": 4156} {"train_loss": -7.0186285972595215, "global_step": 174577, "epoch": 4156} {"train_loss": -7.083437442779541, "global_step": 174578, "epoch": 4156} {"train_loss": -7.104235649108887, "global_step": 174579, "epoch": 4156} {"train_loss": -7.092467308044434, "global_step": 174580, "epoch": 4156} {"train_loss": -7.046966075897217, "global_step": 174581, "epoch": 4156} {"train_loss": -7.057641506195068, "global_step": 174582, "epoch": 4156} {"train_loss": -6.963616371154785, "global_step": 174583, "epoch": 4156} {"train_loss": -7.08860969543457, "global_step": 174584, "epoch": 4156} {"train_loss": -7.103450298309326, "global_step": 174585, "epoch": 4156} {"train_loss": -7.077347755432129, "global_step": 174586, "epoch": 4156} {"train_loss": -7.082034111022949, "global_step": 174587, "epoch": 4156} {"train_loss": -7.083579063415527, "global_step": 174588, "epoch": 4156} {"train_loss": -7.137878894805908, "global_step": 174589, "epoch": 4156} {"train_loss": -7.150643825531006, "global_step": 174590, "epoch": 4156} {"train_loss": -6.878073692321777, "global_step": 174591, "epoch": 4156} {"train_loss": -7.058037757873535, "global_step": 174592, "epoch": 4156} {"train_loss": -7.060530424118042, "global_step": 174593, "epoch": 4156, "val_loss": 80137.3984375} {"train_loss": -7.145719528198242, "global_step": 174594, "epoch": 4157} {"train_loss": -7.117393493652344, "global_step": 174595, "epoch": 4157} {"train_loss": -7.1604766845703125, "global_step": 174596, "epoch": 4157} {"train_loss": -7.091728210449219, "global_step": 174597, "epoch": 4157} {"train_loss": -7.0998053550720215, "global_step": 174598, "epoch": 4157} {"train_loss": -7.214694976806641, "global_step": 174599, "epoch": 4157} {"train_loss": -7.103251934051514, "global_step": 174600, "epoch": 4157} {"train_loss": -7.079400539398193, "global_step": 174601, "epoch": 4157} {"train_loss": -7.0896100997924805, "global_step": 174602, "epoch": 4157} {"train_loss": -7.185808181762695, "global_step": 174603, "epoch": 4157} {"train_loss": -7.157994270324707, "global_step": 174604, "epoch": 4157} {"train_loss": -7.038278102874756, "global_step": 174605, "epoch": 4157} {"train_loss": -7.109029769897461, "global_step": 174606, "epoch": 4157} {"train_loss": -7.045421600341797, "global_step": 174607, "epoch": 4157} {"train_loss": -7.087993144989014, "global_step": 174608, "epoch": 4157} {"train_loss": -7.074214935302734, "global_step": 174609, "epoch": 4157} {"train_loss": -7.008559226989746, "global_step": 174610, "epoch": 4157} {"train_loss": -7.00554084777832, "global_step": 174611, "epoch": 4157} {"train_loss": -7.181524276733398, "global_step": 174612, "epoch": 4157} {"train_loss": -6.958611488342285, "global_step": 174613, "epoch": 4157} {"train_loss": -7.138619422912598, "global_step": 174614, "epoch": 4157} {"train_loss": -6.971840858459473, "global_step": 174615, "epoch": 4157} {"train_loss": -7.047468185424805, "global_step": 174616, "epoch": 4157} {"train_loss": -7.028912544250488, "global_step": 174617, "epoch": 4157} {"train_loss": -6.980293273925781, "global_step": 174618, "epoch": 4157} {"train_loss": -6.951001167297363, "global_step": 174619, "epoch": 4157} {"train_loss": -7.061492919921875, "global_step": 174620, "epoch": 4157} {"train_loss": -7.071966171264648, "global_step": 174621, "epoch": 4157} {"train_loss": -7.11616325378418, "global_step": 174622, "epoch": 4157} {"train_loss": -7.039841651916504, "global_step": 174623, "epoch": 4157} {"train_loss": -7.044732093811035, "global_step": 174624, "epoch": 4157} {"train_loss": -7.152138710021973, "global_step": 174625, "epoch": 4157} {"train_loss": -7.077452659606934, "global_step": 174626, "epoch": 4157} {"train_loss": -7.062412738800049, "global_step": 174627, "epoch": 4157} {"train_loss": -6.990440845489502, "global_step": 174628, "epoch": 4157} {"train_loss": -7.124873638153076, "global_step": 174629, "epoch": 4157} {"train_loss": -6.9791460037231445, "global_step": 174630, "epoch": 4157} {"train_loss": -7.042647838592529, "global_step": 174631, "epoch": 4157} {"train_loss": -7.066482067108154, "global_step": 174632, "epoch": 4157} {"train_loss": -6.99215030670166, "global_step": 174633, "epoch": 4157} {"train_loss": -7.1204915046691895, "global_step": 174634, "epoch": 4157} {"train_loss": -7.071314119157337, "global_step": 174635, "epoch": 4157, "val_loss": 79869.421875} {"train_loss": -7.08298397064209, "global_step": 174636, "epoch": 4158} {"train_loss": -7.024073600769043, "global_step": 174637, "epoch": 4158} {"train_loss": -7.220327377319336, "global_step": 174638, "epoch": 4158} {"train_loss": -7.1153106689453125, "global_step": 174639, "epoch": 4158} {"train_loss": -7.105779647827148, "global_step": 174640, "epoch": 4158} {"train_loss": -7.0264058113098145, "global_step": 174641, "epoch": 4158} {"train_loss": -7.06492280960083, "global_step": 174642, "epoch": 4158} {"train_loss": -7.074078559875488, "global_step": 174643, "epoch": 4158} {"train_loss": -7.1512346267700195, "global_step": 174644, "epoch": 4158} {"train_loss": -7.106254577636719, "global_step": 174645, "epoch": 4158} {"train_loss": -7.078402996063232, "global_step": 174646, "epoch": 4158} {"train_loss": -7.084224700927734, "global_step": 174647, "epoch": 4158} {"train_loss": -7.095952987670898, "global_step": 174648, "epoch": 4158} {"train_loss": -7.064508438110352, "global_step": 174649, "epoch": 4158} {"train_loss": -7.046241760253906, "global_step": 174650, "epoch": 4158} {"train_loss": -6.974170207977295, "global_step": 174651, "epoch": 4158} {"train_loss": -7.109247207641602, "global_step": 174652, "epoch": 4158} {"train_loss": -6.97951602935791, "global_step": 174653, "epoch": 4158} {"train_loss": -7.129766941070557, "global_step": 174654, "epoch": 4158} {"train_loss": -7.087860107421875, "global_step": 174655, "epoch": 4158} {"train_loss": -6.991696357727051, "global_step": 174656, "epoch": 4158} {"train_loss": -6.970192909240723, "global_step": 174657, "epoch": 4158} {"train_loss": -7.135171890258789, "global_step": 174658, "epoch": 4158} {"train_loss": -7.057793140411377, "global_step": 174659, "epoch": 4158} {"train_loss": -7.165030479431152, "global_step": 174660, "epoch": 4158} {"train_loss": -7.080131530761719, "global_step": 174661, "epoch": 4158} {"train_loss": -6.982762336730957, "global_step": 174662, "epoch": 4158} {"train_loss": -7.115941047668457, "global_step": 174663, "epoch": 4158} {"train_loss": -7.1071038246154785, "global_step": 174664, "epoch": 4158} {"train_loss": -7.089089870452881, "global_step": 174665, "epoch": 4158} {"train_loss": -7.052128791809082, "global_step": 174666, "epoch": 4158} {"train_loss": -7.090850830078125, "global_step": 174667, "epoch": 4158} {"train_loss": -6.943779468536377, "global_step": 174668, "epoch": 4158} {"train_loss": -7.069247245788574, "global_step": 174669, "epoch": 4158} {"train_loss": -7.191464900970459, "global_step": 174670, "epoch": 4158} {"train_loss": -7.1478095054626465, "global_step": 174671, "epoch": 4158} {"train_loss": -7.083468437194824, "global_step": 174672, "epoch": 4158} {"train_loss": -7.144737243652344, "global_step": 174673, "epoch": 4158} {"train_loss": -7.141780853271484, "global_step": 174674, "epoch": 4158} {"train_loss": -7.206443786621094, "global_step": 174675, "epoch": 4158} {"train_loss": -7.109408378601074, "global_step": 174676, "epoch": 4158} {"train_loss": -7.08600774265471, "global_step": 174677, "epoch": 4158, "val_loss": 80354.1875} {"train_loss": -7.048230171203613, "global_step": 174678, "epoch": 4159} {"train_loss": -7.116277694702148, "global_step": 174679, "epoch": 4159} {"train_loss": -7.1286091804504395, "global_step": 174680, "epoch": 4159} {"train_loss": -7.13211727142334, "global_step": 174681, "epoch": 4159} {"train_loss": -7.145897388458252, "global_step": 174682, "epoch": 4159} {"train_loss": -7.18939733505249, "global_step": 174683, "epoch": 4159} {"train_loss": -7.099752902984619, "global_step": 174684, "epoch": 4159} {"train_loss": -6.963905334472656, "global_step": 174685, "epoch": 4159} {"train_loss": -7.184731483459473, "global_step": 174686, "epoch": 4159} {"train_loss": -7.115749835968018, "global_step": 174687, "epoch": 4159} {"train_loss": -7.109956741333008, "global_step": 174688, "epoch": 4159} {"train_loss": -7.138728141784668, "global_step": 174689, "epoch": 4159} {"train_loss": -7.1538405418396, "global_step": 174690, "epoch": 4159} {"train_loss": -6.998448371887207, "global_step": 174691, "epoch": 4159} {"train_loss": -7.098271369934082, "global_step": 174692, "epoch": 4159} {"train_loss": -7.188530921936035, "global_step": 174693, "epoch": 4159} {"train_loss": -7.196662902832031, "global_step": 174694, "epoch": 4159} {"train_loss": -7.180500507354736, "global_step": 174695, "epoch": 4159} {"train_loss": -7.133761405944824, "global_step": 174696, "epoch": 4159} {"train_loss": -7.091828346252441, "global_step": 174697, "epoch": 4159} {"train_loss": -7.058060646057129, "global_step": 174698, "epoch": 4159} {"train_loss": -7.14286994934082, "global_step": 174699, "epoch": 4159} {"train_loss": -7.06643009185791, "global_step": 174700, "epoch": 4159} {"train_loss": -7.259401798248291, "global_step": 174701, "epoch": 4159} {"train_loss": -7.003851890563965, "global_step": 174702, "epoch": 4159} {"train_loss": -7.210699558258057, "global_step": 174703, "epoch": 4159} {"train_loss": -7.076571464538574, "global_step": 174704, "epoch": 4159} {"train_loss": -7.1281328201293945, "global_step": 174705, "epoch": 4159} {"train_loss": -7.103941917419434, "global_step": 174706, "epoch": 4159} {"train_loss": -7.157810211181641, "global_step": 174707, "epoch": 4159} {"train_loss": -7.162317752838135, "global_step": 174708, "epoch": 4159} {"train_loss": -7.187898635864258, "global_step": 174709, "epoch": 4159} {"train_loss": -7.151422500610352, "global_step": 174710, "epoch": 4159} {"train_loss": -7.048657417297363, "global_step": 174711, "epoch": 4159} {"train_loss": -7.108381748199463, "global_step": 174712, "epoch": 4159} {"train_loss": -7.079617023468018, "global_step": 174713, "epoch": 4159} {"train_loss": -7.074151039123535, "global_step": 174714, "epoch": 4159} {"train_loss": -7.105735778808594, "global_step": 174715, "epoch": 4159} {"train_loss": -7.183471202850342, "global_step": 174716, "epoch": 4159} {"train_loss": -7.254390239715576, "global_step": 174717, "epoch": 4159} {"train_loss": -7.119653701782227, "global_step": 174718, "epoch": 4159} {"train_loss": -7.12666992914109, "global_step": 174719, "epoch": 4159, "val_loss": 80161.59375} {"train_loss": -7.1512956619262695, "global_step": 174720, "epoch": 4160} {"train_loss": -7.169138431549072, "global_step": 174721, "epoch": 4160} {"train_loss": -7.1717023849487305, "global_step": 174722, "epoch": 4160} {"train_loss": -7.219671249389648, "global_step": 174723, "epoch": 4160} {"train_loss": -7.261037826538086, "global_step": 174724, "epoch": 4160} {"train_loss": -7.120095252990723, "global_step": 174725, "epoch": 4160} {"train_loss": -6.989225387573242, "global_step": 174726, "epoch": 4160} {"train_loss": -7.238297462463379, "global_step": 174727, "epoch": 4160} {"train_loss": -7.106400489807129, "global_step": 174728, "epoch": 4160} {"train_loss": -7.187376022338867, "global_step": 174729, "epoch": 4160} {"train_loss": -6.930286407470703, "global_step": 174730, "epoch": 4160} {"train_loss": -7.154986381530762, "global_step": 174731, "epoch": 4160} {"train_loss": -7.151725769042969, "global_step": 174732, "epoch": 4160} {"train_loss": -7.160530090332031, "global_step": 174733, "epoch": 4160} {"train_loss": -7.159899711608887, "global_step": 174734, "epoch": 4160} {"train_loss": -7.095120906829834, "global_step": 174735, "epoch": 4160} {"train_loss": -7.177240371704102, "global_step": 174736, "epoch": 4160} {"train_loss": -7.102759838104248, "global_step": 174737, "epoch": 4160} {"train_loss": -7.018791198730469, "global_step": 174738, "epoch": 4160} {"train_loss": -7.026843070983887, "global_step": 174739, "epoch": 4160} {"train_loss": -7.195411682128906, "global_step": 174740, "epoch": 4160} {"train_loss": -7.07832145690918, "global_step": 174741, "epoch": 4160} {"train_loss": -6.965566158294678, "global_step": 174742, "epoch": 4160} {"train_loss": -6.988436222076416, "global_step": 174743, "epoch": 4160} {"train_loss": -7.123329162597656, "global_step": 174744, "epoch": 4160} {"train_loss": -7.120176792144775, "global_step": 174745, "epoch": 4160} {"train_loss": -6.95620059967041, "global_step": 174746, "epoch": 4160} {"train_loss": -7.001640319824219, "global_step": 174747, "epoch": 4160} {"train_loss": -7.022182941436768, "global_step": 174748, "epoch": 4160} {"train_loss": -7.1030707359313965, "global_step": 174749, "epoch": 4160} {"train_loss": -7.020424842834473, "global_step": 174750, "epoch": 4160} {"train_loss": -6.9231743812561035, "global_step": 174751, "epoch": 4160} {"train_loss": -6.910041809082031, "global_step": 174752, "epoch": 4160} {"train_loss": -7.030491352081299, "global_step": 174753, "epoch": 4160} {"train_loss": -6.994910717010498, "global_step": 174754, "epoch": 4160} {"train_loss": -7.21079158782959, "global_step": 174755, "epoch": 4160} {"train_loss": -6.888525009155273, "global_step": 174756, "epoch": 4160} {"train_loss": -7.052119255065918, "global_step": 174757, "epoch": 4160} {"train_loss": -7.03090763092041, "global_step": 174758, "epoch": 4160} {"train_loss": -6.755525588989258, "global_step": 174759, "epoch": 4160} {"train_loss": -7.047345161437988, "global_step": 174760, "epoch": 4160} {"train_loss": -7.070768958046322, "global_step": 174761, "epoch": 4160, "val_loss": 80136.9453125} {"train_loss": -6.947158336639404, "global_step": 174762, "epoch": 4161} {"train_loss": -7.014691352844238, "global_step": 174763, "epoch": 4161} {"train_loss": -6.978547096252441, "global_step": 174764, "epoch": 4161} {"train_loss": -7.056421756744385, "global_step": 174765, "epoch": 4161} {"train_loss": -7.006718635559082, "global_step": 174766, "epoch": 4161} {"train_loss": -6.956887245178223, "global_step": 174767, "epoch": 4161} {"train_loss": -6.976966857910156, "global_step": 174768, "epoch": 4161} {"train_loss": -7.067381858825684, "global_step": 174769, "epoch": 4161} {"train_loss": -7.102443695068359, "global_step": 174770, "epoch": 4161} {"train_loss": -7.137049198150635, "global_step": 174771, "epoch": 4161} {"train_loss": -7.05099630355835, "global_step": 174772, "epoch": 4161} {"train_loss": -6.9523515701293945, "global_step": 174773, "epoch": 4161} {"train_loss": -7.137121677398682, "global_step": 174774, "epoch": 4161} {"train_loss": -7.0156168937683105, "global_step": 174775, "epoch": 4161} {"train_loss": -7.1156182289123535, "global_step": 174776, "epoch": 4161} {"train_loss": -7.118515968322754, "global_step": 174777, "epoch": 4161} {"train_loss": -7.041415214538574, "global_step": 174778, "epoch": 4161} {"train_loss": -7.184178829193115, "global_step": 174779, "epoch": 4161} {"train_loss": -7.138910293579102, "global_step": 174780, "epoch": 4161} {"train_loss": -7.060338973999023, "global_step": 174781, "epoch": 4161} {"train_loss": -7.059863567352295, "global_step": 174782, "epoch": 4161} {"train_loss": -7.135727405548096, "global_step": 174783, "epoch": 4161} {"train_loss": -7.036791801452637, "global_step": 174784, "epoch": 4161} {"train_loss": -7.029418468475342, "global_step": 174785, "epoch": 4161} {"train_loss": -7.123863220214844, "global_step": 174786, "epoch": 4161} {"train_loss": -7.107705593109131, "global_step": 174787, "epoch": 4161} {"train_loss": -7.097784996032715, "global_step": 174788, "epoch": 4161} {"train_loss": -6.965521812438965, "global_step": 174789, "epoch": 4161} {"train_loss": -7.027093887329102, "global_step": 174790, "epoch": 4161} {"train_loss": -7.145578384399414, "global_step": 174791, "epoch": 4161} {"train_loss": -6.938691139221191, "global_step": 174792, "epoch": 4161} {"train_loss": -7.086301803588867, "global_step": 174793, "epoch": 4161} {"train_loss": -7.145385265350342, "global_step": 174794, "epoch": 4161} {"train_loss": -6.981328010559082, "global_step": 174795, "epoch": 4161} {"train_loss": -7.151772975921631, "global_step": 174796, "epoch": 4161} {"train_loss": -7.138366222381592, "global_step": 174797, "epoch": 4161} {"train_loss": -7.043998718261719, "global_step": 174798, "epoch": 4161} {"train_loss": -6.995135307312012, "global_step": 174799, "epoch": 4161} {"train_loss": -6.9643635749816895, "global_step": 174800, "epoch": 4161} {"train_loss": -7.067953109741211, "global_step": 174801, "epoch": 4161} {"train_loss": -7.136007308959961, "global_step": 174802, "epoch": 4161} {"train_loss": -7.058148054849534, "global_step": 174803, "epoch": 4161, "val_loss": 80227.078125} {"train_loss": -7.042024612426758, "global_step": 174804, "epoch": 4162} {"train_loss": -7.172323226928711, "global_step": 174805, "epoch": 4162} {"train_loss": -7.124970436096191, "global_step": 174806, "epoch": 4162} {"train_loss": -7.046327114105225, "global_step": 174807, "epoch": 4162} {"train_loss": -7.047191143035889, "global_step": 174808, "epoch": 4162} {"train_loss": -7.156654357910156, "global_step": 174809, "epoch": 4162} {"train_loss": -7.173048496246338, "global_step": 174810, "epoch": 4162} {"train_loss": -7.16331672668457, "global_step": 174811, "epoch": 4162} {"train_loss": -7.098670482635498, "global_step": 174812, "epoch": 4162} {"train_loss": -7.01171875, "global_step": 174813, "epoch": 4162} {"train_loss": -7.086625099182129, "global_step": 174814, "epoch": 4162} {"train_loss": -7.134824752807617, "global_step": 174815, "epoch": 4162} {"train_loss": -7.205840110778809, "global_step": 174816, "epoch": 4162} {"train_loss": -7.0742340087890625, "global_step": 174817, "epoch": 4162} {"train_loss": -7.109275817871094, "global_step": 174818, "epoch": 4162} {"train_loss": -7.197238922119141, "global_step": 174819, "epoch": 4162} {"train_loss": -7.13877010345459, "global_step": 174820, "epoch": 4162} {"train_loss": -7.131072044372559, "global_step": 174821, "epoch": 4162} {"train_loss": -7.049372673034668, "global_step": 174822, "epoch": 4162} {"train_loss": -7.255637168884277, "global_step": 174823, "epoch": 4162} {"train_loss": -7.023217678070068, "global_step": 174824, "epoch": 4162} {"train_loss": -7.075784683227539, "global_step": 174825, "epoch": 4162} {"train_loss": -7.092095375061035, "global_step": 174826, "epoch": 4162} {"train_loss": -7.059464931488037, "global_step": 174827, "epoch": 4162} {"train_loss": -7.091620445251465, "global_step": 174828, "epoch": 4162} {"train_loss": -7.055158615112305, "global_step": 174829, "epoch": 4162} {"train_loss": -7.068061828613281, "global_step": 174830, "epoch": 4162} {"train_loss": -6.856410980224609, "global_step": 174831, "epoch": 4162} {"train_loss": -7.168123245239258, "global_step": 174832, "epoch": 4162} {"train_loss": -7.056026458740234, "global_step": 174833, "epoch": 4162} {"train_loss": -7.087620258331299, "global_step": 174834, "epoch": 4162} {"train_loss": -7.019197463989258, "global_step": 174835, "epoch": 4162} {"train_loss": -6.947274208068848, "global_step": 174836, "epoch": 4162} {"train_loss": -6.940248966217041, "global_step": 174837, "epoch": 4162} {"train_loss": -7.07110595703125, "global_step": 174838, "epoch": 4162} {"train_loss": -7.01812744140625, "global_step": 174839, "epoch": 4162} {"train_loss": -7.142190933227539, "global_step": 174840, "epoch": 4162} {"train_loss": -7.0344085693359375, "global_step": 174841, "epoch": 4162} {"train_loss": -7.046238422393799, "global_step": 174842, "epoch": 4162} {"train_loss": -7.086091041564941, "global_step": 174843, "epoch": 4162} {"train_loss": -7.115447998046875, "global_step": 174844, "epoch": 4162} {"train_loss": -7.087610948653448, "global_step": 174845, "epoch": 4162, "val_loss": 80209.984375} {"train_loss": -7.064556121826172, "global_step": 174846, "epoch": 4163} {"train_loss": -7.173246383666992, "global_step": 174847, "epoch": 4163} {"train_loss": -7.142679691314697, "global_step": 174848, "epoch": 4163} {"train_loss": -7.170721530914307, "global_step": 174849, "epoch": 4163} {"train_loss": -7.061038017272949, "global_step": 174850, "epoch": 4163} {"train_loss": -7.158334255218506, "global_step": 174851, "epoch": 4163} {"train_loss": -7.187713623046875, "global_step": 174852, "epoch": 4163} {"train_loss": -7.196022987365723, "global_step": 174853, "epoch": 4163} {"train_loss": -7.217263698577881, "global_step": 174854, "epoch": 4163} {"train_loss": -7.134249210357666, "global_step": 174855, "epoch": 4163} {"train_loss": -7.110633373260498, "global_step": 174856, "epoch": 4163} {"train_loss": -7.048505783081055, "global_step": 174857, "epoch": 4163} {"train_loss": -7.101778984069824, "global_step": 174858, "epoch": 4163} {"train_loss": -6.945738792419434, "global_step": 174859, "epoch": 4163} {"train_loss": -7.125016212463379, "global_step": 174860, "epoch": 4163} {"train_loss": -7.114825248718262, "global_step": 174861, "epoch": 4163} {"train_loss": -7.003742218017578, "global_step": 174862, "epoch": 4163} {"train_loss": -6.920938491821289, "global_step": 174863, "epoch": 4163} {"train_loss": -7.08144474029541, "global_step": 174864, "epoch": 4163} {"train_loss": -7.070311546325684, "global_step": 174865, "epoch": 4163} {"train_loss": -7.063093662261963, "global_step": 174866, "epoch": 4163} {"train_loss": -7.181827545166016, "global_step": 174867, "epoch": 4163} {"train_loss": -7.099189758300781, "global_step": 174868, "epoch": 4163} {"train_loss": -6.990485191345215, "global_step": 174869, "epoch": 4163} {"train_loss": -7.188713073730469, "global_step": 174870, "epoch": 4163} {"train_loss": -6.903006553649902, "global_step": 174871, "epoch": 4163} {"train_loss": -7.112924575805664, "global_step": 174872, "epoch": 4163} {"train_loss": -6.981024742126465, "global_step": 174873, "epoch": 4163} {"train_loss": -7.065091609954834, "global_step": 174874, "epoch": 4163} {"train_loss": -7.006598472595215, "global_step": 174875, "epoch": 4163} {"train_loss": -7.103743553161621, "global_step": 174876, "epoch": 4163} {"train_loss": -7.037903785705566, "global_step": 174877, "epoch": 4163} {"train_loss": -6.96273136138916, "global_step": 174878, "epoch": 4163} {"train_loss": -7.140664100646973, "global_step": 174879, "epoch": 4163} {"train_loss": -7.077741622924805, "global_step": 174880, "epoch": 4163} {"train_loss": -7.1620073318481445, "global_step": 174881, "epoch": 4163} {"train_loss": -7.093326568603516, "global_step": 174882, "epoch": 4163} {"train_loss": -7.069701671600342, "global_step": 174883, "epoch": 4163} {"train_loss": -7.056060791015625, "global_step": 174884, "epoch": 4163} {"train_loss": -7.133223533630371, "global_step": 174885, "epoch": 4163} {"train_loss": -6.9389801025390625, "global_step": 174886, "epoch": 4163} {"train_loss": -7.081110102789743, "global_step": 174887, "epoch": 4163, "val_loss": 80122.9375} {"train_loss": -7.16723108291626, "global_step": 174888, "epoch": 4164} {"train_loss": -7.047837257385254, "global_step": 174889, "epoch": 4164} {"train_loss": -7.115832328796387, "global_step": 174890, "epoch": 4164} {"train_loss": -7.199097156524658, "global_step": 174891, "epoch": 4164} {"train_loss": -7.161591529846191, "global_step": 174892, "epoch": 4164} {"train_loss": -7.076122760772705, "global_step": 174893, "epoch": 4164} {"train_loss": -7.1386919021606445, "global_step": 174894, "epoch": 4164} {"train_loss": -7.1780219078063965, "global_step": 174895, "epoch": 4164} {"train_loss": -7.0905232429504395, "global_step": 174896, "epoch": 4164} {"train_loss": -7.187436580657959, "global_step": 174897, "epoch": 4164} {"train_loss": -7.234270095825195, "global_step": 174898, "epoch": 4164} {"train_loss": -7.159855365753174, "global_step": 174899, "epoch": 4164} {"train_loss": -7.00501823425293, "global_step": 174900, "epoch": 4164} {"train_loss": -7.017629623413086, "global_step": 174901, "epoch": 4164} {"train_loss": -7.192346572875977, "global_step": 174902, "epoch": 4164} {"train_loss": -7.062668800354004, "global_step": 174903, "epoch": 4164} {"train_loss": -7.0551276206970215, "global_step": 174904, "epoch": 4164} {"train_loss": -7.05429744720459, "global_step": 174905, "epoch": 4164} {"train_loss": -7.162143707275391, "global_step": 174906, "epoch": 4164} {"train_loss": -7.147542476654053, "global_step": 174907, "epoch": 4164} {"train_loss": -7.102412223815918, "global_step": 174908, "epoch": 4164} {"train_loss": -7.202001571655273, "global_step": 174909, "epoch": 4164} {"train_loss": -7.126109600067139, "global_step": 174910, "epoch": 4164} {"train_loss": -7.185484886169434, "global_step": 174911, "epoch": 4164} {"train_loss": -7.090512752532959, "global_step": 174912, "epoch": 4164} {"train_loss": -7.06582498550415, "global_step": 174913, "epoch": 4164} {"train_loss": -7.085049152374268, "global_step": 174914, "epoch": 4164} {"train_loss": -7.142928600311279, "global_step": 174915, "epoch": 4164} {"train_loss": -7.054547309875488, "global_step": 174916, "epoch": 4164} {"train_loss": -7.116148948669434, "global_step": 174917, "epoch": 4164} {"train_loss": -7.081634044647217, "global_step": 174918, "epoch": 4164} {"train_loss": -7.12811279296875, "global_step": 174919, "epoch": 4164} {"train_loss": -7.073877334594727, "global_step": 174920, "epoch": 4164} {"train_loss": -7.0773491859436035, "global_step": 174921, "epoch": 4164} {"train_loss": -7.175075531005859, "global_step": 174922, "epoch": 4164} {"train_loss": -7.076196670532227, "global_step": 174923, "epoch": 4164} {"train_loss": -6.962406635284424, "global_step": 174924, "epoch": 4164} {"train_loss": -7.074231147766113, "global_step": 174925, "epoch": 4164} {"train_loss": -7.0001220703125, "global_step": 174926, "epoch": 4164} {"train_loss": -7.235639572143555, "global_step": 174927, "epoch": 4164} {"train_loss": -7.2246832847595215, "global_step": 174928, "epoch": 4164} {"train_loss": -7.117033016114008, "global_step": 174929, "epoch": 4164, "val_loss": 79937.0390625} {"train_loss": -7.142980575561523, "global_step": 174930, "epoch": 4165} {"train_loss": -7.164044380187988, "global_step": 174931, "epoch": 4165} {"train_loss": -7.205587387084961, "global_step": 174932, "epoch": 4165} {"train_loss": -7.146999835968018, "global_step": 174933, "epoch": 4165} {"train_loss": -7.112892150878906, "global_step": 174934, "epoch": 4165} {"train_loss": -7.112971305847168, "global_step": 174935, "epoch": 4165} {"train_loss": -7.047919750213623, "global_step": 174936, "epoch": 4165} {"train_loss": -7.201406955718994, "global_step": 174937, "epoch": 4165} {"train_loss": -7.009325981140137, "global_step": 174938, "epoch": 4165} {"train_loss": -7.07696008682251, "global_step": 174939, "epoch": 4165} {"train_loss": -7.142121315002441, "global_step": 174940, "epoch": 4165} {"train_loss": -7.0586700439453125, "global_step": 174941, "epoch": 4165} {"train_loss": -7.189006805419922, "global_step": 174942, "epoch": 4165} {"train_loss": -7.0830535888671875, "global_step": 174943, "epoch": 4165} {"train_loss": -7.0534515380859375, "global_step": 174944, "epoch": 4165} {"train_loss": -7.10142183303833, "global_step": 174945, "epoch": 4165} {"train_loss": -7.070330619812012, "global_step": 174946, "epoch": 4165} {"train_loss": -7.128697395324707, "global_step": 174947, "epoch": 4165} {"train_loss": -7.028815269470215, "global_step": 174948, "epoch": 4165} {"train_loss": -7.096094608306885, "global_step": 174949, "epoch": 4165} {"train_loss": -7.04191780090332, "global_step": 174950, "epoch": 4165} {"train_loss": -7.128942966461182, "global_step": 174951, "epoch": 4165} {"train_loss": -7.180676460266113, "global_step": 174952, "epoch": 4165} {"train_loss": -7.161455154418945, "global_step": 174953, "epoch": 4165} {"train_loss": -7.04535436630249, "global_step": 174954, "epoch": 4165} {"train_loss": -7.009984970092773, "global_step": 174955, "epoch": 4165} {"train_loss": -7.013083457946777, "global_step": 174956, "epoch": 4165} {"train_loss": -7.08008337020874, "global_step": 174957, "epoch": 4165} {"train_loss": -7.067626476287842, "global_step": 174958, "epoch": 4165} {"train_loss": -7.088076591491699, "global_step": 174959, "epoch": 4165} {"train_loss": -7.077487945556641, "global_step": 174960, "epoch": 4165} {"train_loss": -7.047499656677246, "global_step": 174961, "epoch": 4165} {"train_loss": -7.036811828613281, "global_step": 174962, "epoch": 4165} {"train_loss": -6.99525785446167, "global_step": 174963, "epoch": 4165} {"train_loss": -7.0355329513549805, "global_step": 174964, "epoch": 4165} {"train_loss": -7.035614013671875, "global_step": 174965, "epoch": 4165} {"train_loss": -7.056027889251709, "global_step": 174966, "epoch": 4165} {"train_loss": -6.954784393310547, "global_step": 174967, "epoch": 4165} {"train_loss": -7.03370475769043, "global_step": 174968, "epoch": 4165} {"train_loss": -6.921823501586914, "global_step": 174969, "epoch": 4165} {"train_loss": -7.0121331214904785, "global_step": 174970, "epoch": 4165} {"train_loss": -7.078180267697289, "global_step": 174971, "epoch": 4165, "val_loss": 80396.6328125} {"train_loss": -7.001884937286377, "global_step": 174972, "epoch": 4166} {"train_loss": -7.150768756866455, "global_step": 174973, "epoch": 4166} {"train_loss": -7.102155685424805, "global_step": 174974, "epoch": 4166} {"train_loss": -6.980315208435059, "global_step": 174975, "epoch": 4166} {"train_loss": -6.93494987487793, "global_step": 174976, "epoch": 4166} {"train_loss": -6.9191741943359375, "global_step": 174977, "epoch": 4166} {"train_loss": -6.87026309967041, "global_step": 174978, "epoch": 4166} {"train_loss": -7.017406463623047, "global_step": 174979, "epoch": 4166} {"train_loss": -7.0402021408081055, "global_step": 174980, "epoch": 4166} {"train_loss": -6.969745635986328, "global_step": 174981, "epoch": 4166} {"train_loss": -7.133034706115723, "global_step": 174982, "epoch": 4166} {"train_loss": -6.970712184906006, "global_step": 174983, "epoch": 4166} {"train_loss": -7.117554664611816, "global_step": 174984, "epoch": 4166} {"train_loss": -7.0676116943359375, "global_step": 174985, "epoch": 4166} {"train_loss": -6.980879783630371, "global_step": 174986, "epoch": 4166} {"train_loss": -6.999324321746826, "global_step": 174987, "epoch": 4166} {"train_loss": -6.96517276763916, "global_step": 174988, "epoch": 4166} {"train_loss": -7.161927223205566, "global_step": 174989, "epoch": 4166} {"train_loss": -6.958929061889648, "global_step": 174990, "epoch": 4166} {"train_loss": -7.12145471572876, "global_step": 174991, "epoch": 4166} {"train_loss": -7.016354560852051, "global_step": 174992, "epoch": 4166} {"train_loss": -7.148399353027344, "global_step": 174993, "epoch": 4166} {"train_loss": -7.065247058868408, "global_step": 174994, "epoch": 4166} {"train_loss": -7.083442687988281, "global_step": 174995, "epoch": 4166} {"train_loss": -7.2206034660339355, "global_step": 174996, "epoch": 4166} {"train_loss": -7.154962539672852, "global_step": 174997, "epoch": 4166} {"train_loss": -7.147767066955566, "global_step": 174998, "epoch": 4166} {"train_loss": -7.062963962554932, "global_step": 174999, "epoch": 4166} {"train_loss": -7.115534782409668, "global_step": 175000, "epoch": 4166} {"train_loss": -7.099164962768555, "global_step": 175001, "epoch": 4166} {"train_loss": -7.028106689453125, "global_step": 175002, "epoch": 4166} {"train_loss": -7.06976318359375, "global_step": 175003, "epoch": 4166} {"train_loss": -7.112713813781738, "global_step": 175004, "epoch": 4166} {"train_loss": -6.906434535980225, "global_step": 175005, "epoch": 4166} {"train_loss": -6.8851776123046875, "global_step": 175006, "epoch": 4166} {"train_loss": -7.096390247344971, "global_step": 175007, "epoch": 4166} {"train_loss": -6.899136543273926, "global_step": 175008, "epoch": 4166} {"train_loss": -7.003820419311523, "global_step": 175009, "epoch": 4166} {"train_loss": -7.057361125946045, "global_step": 175010, "epoch": 4166} {"train_loss": -6.973987579345703, "global_step": 175011, "epoch": 4166} {"train_loss": -6.9854888916015625, "global_step": 175012, "epoch": 4166} {"train_loss": -7.038769347327096, "global_step": 175013, "epoch": 4166, "val_loss": 80041.5} {"train_loss": -6.992861747741699, "global_step": 175014, "epoch": 4167} {"train_loss": -6.953736305236816, "global_step": 175015, "epoch": 4167} {"train_loss": -7.02004861831665, "global_step": 175016, "epoch": 4167} {"train_loss": -7.008223533630371, "global_step": 175017, "epoch": 4167} {"train_loss": -6.988495349884033, "global_step": 175018, "epoch": 4167} {"train_loss": -7.037024021148682, "global_step": 175019, "epoch": 4167} {"train_loss": -7.033621311187744, "global_step": 175020, "epoch": 4167} {"train_loss": -6.997376441955566, "global_step": 175021, "epoch": 4167} {"train_loss": -7.0648274421691895, "global_step": 175022, "epoch": 4167} {"train_loss": -6.951475143432617, "global_step": 175023, "epoch": 4167} {"train_loss": -6.946131706237793, "global_step": 175024, "epoch": 4167} {"train_loss": -7.0243072509765625, "global_step": 175025, "epoch": 4167} {"train_loss": -6.985299587249756, "global_step": 175026, "epoch": 4167} {"train_loss": -7.055477142333984, "global_step": 175027, "epoch": 4167} {"train_loss": -6.955883502960205, "global_step": 175028, "epoch": 4167} {"train_loss": -7.064353942871094, "global_step": 175029, "epoch": 4167} {"train_loss": -7.190672397613525, "global_step": 175030, "epoch": 4167} {"train_loss": -7.07241153717041, "global_step": 175031, "epoch": 4167} {"train_loss": -7.145489692687988, "global_step": 175032, "epoch": 4167} {"train_loss": -7.07598876953125, "global_step": 175033, "epoch": 4167} {"train_loss": -7.066812515258789, "global_step": 175034, "epoch": 4167} {"train_loss": -7.157805442810059, "global_step": 175035, "epoch": 4167} {"train_loss": -7.094788551330566, "global_step": 175036, "epoch": 4167} {"train_loss": -7.136194229125977, "global_step": 175037, "epoch": 4167} {"train_loss": -7.157703399658203, "global_step": 175038, "epoch": 4167} {"train_loss": -7.122800350189209, "global_step": 175039, "epoch": 4167} {"train_loss": -7.232596397399902, "global_step": 175040, "epoch": 4167} {"train_loss": -7.0215678215026855, "global_step": 175041, "epoch": 4167} {"train_loss": -7.241925239562988, "global_step": 175042, "epoch": 4167} {"train_loss": -7.037277698516846, "global_step": 175043, "epoch": 4167} {"train_loss": -7.041749477386475, "global_step": 175044, "epoch": 4167} {"train_loss": -6.971919059753418, "global_step": 175045, "epoch": 4167} {"train_loss": -7.030782699584961, "global_step": 175046, "epoch": 4167} {"train_loss": -6.991454124450684, "global_step": 175047, "epoch": 4167} {"train_loss": -6.946645259857178, "global_step": 175048, "epoch": 4167} {"train_loss": -7.10797119140625, "global_step": 175049, "epoch": 4167} {"train_loss": -7.166285514831543, "global_step": 175050, "epoch": 4167} {"train_loss": -7.036542892456055, "global_step": 175051, "epoch": 4167} {"train_loss": -7.124758720397949, "global_step": 175052, "epoch": 4167} {"train_loss": -7.1113433837890625, "global_step": 175053, "epoch": 4167} {"train_loss": -6.901500701904297, "global_step": 175054, "epoch": 4167} {"train_loss": -7.057620718365624, "global_step": 175055, "epoch": 4167, "val_loss": 79949.8515625} {"train_loss": -6.904787063598633, "global_step": 175056, "epoch": 4168} {"train_loss": -7.124181747436523, "global_step": 175057, "epoch": 4168} {"train_loss": -6.98951530456543, "global_step": 175058, "epoch": 4168} {"train_loss": -7.034710884094238, "global_step": 175059, "epoch": 4168} {"train_loss": -7.045937538146973, "global_step": 175060, "epoch": 4168} {"train_loss": -6.9583635330200195, "global_step": 175061, "epoch": 4168} {"train_loss": -7.236413478851318, "global_step": 175062, "epoch": 4168} {"train_loss": -7.080840587615967, "global_step": 175063, "epoch": 4168} {"train_loss": -7.10300874710083, "global_step": 175064, "epoch": 4168} {"train_loss": -7.162112712860107, "global_step": 175065, "epoch": 4168} {"train_loss": -7.095629692077637, "global_step": 175066, "epoch": 4168} {"train_loss": -7.161494255065918, "global_step": 175067, "epoch": 4168} {"train_loss": -6.97990608215332, "global_step": 175068, "epoch": 4168} {"train_loss": -7.094538688659668, "global_step": 175069, "epoch": 4168} {"train_loss": -7.067343711853027, "global_step": 175070, "epoch": 4168} {"train_loss": -7.124288558959961, "global_step": 175071, "epoch": 4168} {"train_loss": -7.17348051071167, "global_step": 175072, "epoch": 4168} {"train_loss": -7.073863506317139, "global_step": 175073, "epoch": 4168} {"train_loss": -7.065249919891357, "global_step": 175074, "epoch": 4168} {"train_loss": -6.957572937011719, "global_step": 175075, "epoch": 4168} {"train_loss": -7.110562801361084, "global_step": 175076, "epoch": 4168} {"train_loss": -7.092496871948242, "global_step": 175077, "epoch": 4168} {"train_loss": -7.1024627685546875, "global_step": 175078, "epoch": 4168} {"train_loss": -7.187780380249023, "global_step": 175079, "epoch": 4168} {"train_loss": -7.023432731628418, "global_step": 175080, "epoch": 4168} {"train_loss": -7.101222991943359, "global_step": 175081, "epoch": 4168} {"train_loss": -7.153726100921631, "global_step": 175082, "epoch": 4168} {"train_loss": -6.992494106292725, "global_step": 175083, "epoch": 4168} {"train_loss": -7.171678066253662, "global_step": 175084, "epoch": 4168} {"train_loss": -7.015743255615234, "global_step": 175085, "epoch": 4168} {"train_loss": -7.066137790679932, "global_step": 175086, "epoch": 4168} {"train_loss": -7.064128875732422, "global_step": 175087, "epoch": 4168} {"train_loss": -6.967128753662109, "global_step": 175088, "epoch": 4168} {"train_loss": -6.96730899810791, "global_step": 175089, "epoch": 4168} {"train_loss": -6.998574256896973, "global_step": 175090, "epoch": 4168} {"train_loss": -7.112481117248535, "global_step": 175091, "epoch": 4168} {"train_loss": -7.132301330566406, "global_step": 175092, "epoch": 4168} {"train_loss": -7.1022539138793945, "global_step": 175093, "epoch": 4168} {"train_loss": -7.156923294067383, "global_step": 175094, "epoch": 4168} {"train_loss": -7.063680648803711, "global_step": 175095, "epoch": 4168} {"train_loss": -7.111872673034668, "global_step": 175096, "epoch": 4168} {"train_loss": -7.078976994469052, "global_step": 175097, "epoch": 4168, "val_loss": 80025.640625} {"train_loss": -7.136298656463623, "global_step": 175098, "epoch": 4169} {"train_loss": -7.159320831298828, "global_step": 175099, "epoch": 4169} {"train_loss": -7.116687774658203, "global_step": 175100, "epoch": 4169} {"train_loss": -7.167320251464844, "global_step": 175101, "epoch": 4169} {"train_loss": -7.1876044273376465, "global_step": 175102, "epoch": 4169} {"train_loss": -7.065098762512207, "global_step": 175103, "epoch": 4169} {"train_loss": -7.1695356369018555, "global_step": 175104, "epoch": 4169} {"train_loss": -7.172784805297852, "global_step": 175105, "epoch": 4169} {"train_loss": -7.026360511779785, "global_step": 175106, "epoch": 4169} {"train_loss": -7.098031520843506, "global_step": 175107, "epoch": 4169} {"train_loss": -7.186075687408447, "global_step": 175108, "epoch": 4169} {"train_loss": -7.104753494262695, "global_step": 175109, "epoch": 4169} {"train_loss": -7.075064659118652, "global_step": 175110, "epoch": 4169} {"train_loss": -7.196178436279297, "global_step": 175111, "epoch": 4169} {"train_loss": -7.132706165313721, "global_step": 175112, "epoch": 4169} {"train_loss": -7.068571090698242, "global_step": 175113, "epoch": 4169} {"train_loss": -7.231551170349121, "global_step": 175114, "epoch": 4169} {"train_loss": -7.206828594207764, "global_step": 175115, "epoch": 4169} {"train_loss": -7.205985069274902, "global_step": 175116, "epoch": 4169} {"train_loss": -7.076432228088379, "global_step": 175117, "epoch": 4169} {"train_loss": -7.135784149169922, "global_step": 175118, "epoch": 4169} {"train_loss": -7.244046211242676, "global_step": 175119, "epoch": 4169} {"train_loss": -7.227238655090332, "global_step": 175120, "epoch": 4169} {"train_loss": -7.088137626647949, "global_step": 175121, "epoch": 4169} {"train_loss": -7.010283946990967, "global_step": 175122, "epoch": 4169} {"train_loss": -7.079196929931641, "global_step": 175123, "epoch": 4169} {"train_loss": -7.084587097167969, "global_step": 175124, "epoch": 4169} {"train_loss": -7.075422286987305, "global_step": 175125, "epoch": 4169} {"train_loss": -7.1065545082092285, "global_step": 175126, "epoch": 4169} {"train_loss": -6.977446556091309, "global_step": 175127, "epoch": 4169} {"train_loss": -7.123712062835693, "global_step": 175128, "epoch": 4169} {"train_loss": -7.078416347503662, "global_step": 175129, "epoch": 4169} {"train_loss": -7.060084819793701, "global_step": 175130, "epoch": 4169} {"train_loss": -7.001630783081055, "global_step": 175131, "epoch": 4169} {"train_loss": -7.172481060028076, "global_step": 175132, "epoch": 4169} {"train_loss": -6.973751068115234, "global_step": 175133, "epoch": 4169} {"train_loss": -7.1916680335998535, "global_step": 175134, "epoch": 4169} {"train_loss": -6.959964752197266, "global_step": 175135, "epoch": 4169} {"train_loss": -6.890497207641602, "global_step": 175136, "epoch": 4169} {"train_loss": -7.014348030090332, "global_step": 175137, "epoch": 4169} {"train_loss": -6.912170886993408, "global_step": 175138, "epoch": 4169} {"train_loss": -7.092640354519799, "global_step": 175139, "epoch": 4169, "val_loss": 80134.71875} {"train_loss": -7.090975761413574, "global_step": 175140, "epoch": 4170} {"train_loss": -6.850886344909668, "global_step": 175141, "epoch": 4170} {"train_loss": -6.861725330352783, "global_step": 175142, "epoch": 4170} {"train_loss": -6.9757280349731445, "global_step": 175143, "epoch": 4170} {"train_loss": -6.818968296051025, "global_step": 175144, "epoch": 4170} {"train_loss": -7.017435073852539, "global_step": 175145, "epoch": 4170} {"train_loss": -6.850439071655273, "global_step": 175146, "epoch": 4170} {"train_loss": -6.872283458709717, "global_step": 175147, "epoch": 4170} {"train_loss": -7.026876926422119, "global_step": 175148, "epoch": 4170} {"train_loss": -6.903293609619141, "global_step": 175149, "epoch": 4170} {"train_loss": -7.022393703460693, "global_step": 175150, "epoch": 4170} {"train_loss": -6.904096603393555, "global_step": 175151, "epoch": 4170} {"train_loss": -6.868321895599365, "global_step": 175152, "epoch": 4170} {"train_loss": -6.873617172241211, "global_step": 175153, "epoch": 4170} {"train_loss": -6.902222633361816, "global_step": 175154, "epoch": 4170} {"train_loss": -7.076892375946045, "global_step": 175155, "epoch": 4170} {"train_loss": -6.8473711013793945, "global_step": 175156, "epoch": 4170} {"train_loss": -7.049803733825684, "global_step": 175157, "epoch": 4170} {"train_loss": -6.963599681854248, "global_step": 175158, "epoch": 4170} {"train_loss": -6.8731842041015625, "global_step": 175159, "epoch": 4170} {"train_loss": -7.00433349609375, "global_step": 175160, "epoch": 4170} {"train_loss": -7.064907073974609, "global_step": 175161, "epoch": 4170} {"train_loss": -7.120995044708252, "global_step": 175162, "epoch": 4170} {"train_loss": -7.043148040771484, "global_step": 175163, "epoch": 4170} {"train_loss": -7.063474655151367, "global_step": 175164, "epoch": 4170} {"train_loss": -7.148648262023926, "global_step": 175165, "epoch": 4170} {"train_loss": -7.055450916290283, "global_step": 175166, "epoch": 4170} {"train_loss": -7.024447441101074, "global_step": 175167, "epoch": 4170} {"train_loss": -7.118898391723633, "global_step": 175168, "epoch": 4170} {"train_loss": -7.058989524841309, "global_step": 175169, "epoch": 4170} {"train_loss": -7.085024356842041, "global_step": 175170, "epoch": 4170} {"train_loss": -7.067737579345703, "global_step": 175171, "epoch": 4170} {"train_loss": -7.144944190979004, "global_step": 175172, "epoch": 4170} {"train_loss": -7.129162788391113, "global_step": 175173, "epoch": 4170} {"train_loss": -7.12396240234375, "global_step": 175174, "epoch": 4170} {"train_loss": -7.134530067443848, "global_step": 175175, "epoch": 4170} {"train_loss": -7.051571846008301, "global_step": 175176, "epoch": 4170} {"train_loss": -7.065074920654297, "global_step": 175177, "epoch": 4170} {"train_loss": -7.225376129150391, "global_step": 175178, "epoch": 4170} {"train_loss": -7.0418901443481445, "global_step": 175179, "epoch": 4170} {"train_loss": -7.0210700035095215, "global_step": 175180, "epoch": 4170} {"train_loss": -7.013332014992123, "global_step": 175181, "epoch": 4170, "val_loss": 80030.3203125} {"train_loss": -7.062690734863281, "global_step": 175182, "epoch": 4171} {"train_loss": -7.074861526489258, "global_step": 175183, "epoch": 4171} {"train_loss": -7.117107391357422, "global_step": 175184, "epoch": 4171} {"train_loss": -6.97982120513916, "global_step": 175185, "epoch": 4171} {"train_loss": -7.055373191833496, "global_step": 175186, "epoch": 4171} {"train_loss": -7.209563255310059, "global_step": 175187, "epoch": 4171} {"train_loss": -7.212674617767334, "global_step": 175188, "epoch": 4171} {"train_loss": -7.104833602905273, "global_step": 175189, "epoch": 4171} {"train_loss": -7.083971977233887, "global_step": 175190, "epoch": 4171} {"train_loss": -7.135820388793945, "global_step": 175191, "epoch": 4171} {"train_loss": -7.11013126373291, "global_step": 175192, "epoch": 4171} {"train_loss": -7.182244777679443, "global_step": 175193, "epoch": 4171} {"train_loss": -7.231232643127441, "global_step": 175194, "epoch": 4171} {"train_loss": -7.036534309387207, "global_step": 175195, "epoch": 4171} {"train_loss": -7.074332237243652, "global_step": 175196, "epoch": 4171} {"train_loss": -7.117247104644775, "global_step": 175197, "epoch": 4171} {"train_loss": -7.106297492980957, "global_step": 175198, "epoch": 4171} {"train_loss": -7.1889448165893555, "global_step": 175199, "epoch": 4171} {"train_loss": -7.165477752685547, "global_step": 175200, "epoch": 4171} {"train_loss": -7.162668228149414, "global_step": 175201, "epoch": 4171} {"train_loss": -7.067998886108398, "global_step": 175202, "epoch": 4171} {"train_loss": -7.138019561767578, "global_step": 175203, "epoch": 4171} {"train_loss": -7.114129066467285, "global_step": 175204, "epoch": 4171} {"train_loss": -7.100456237792969, "global_step": 175205, "epoch": 4171} {"train_loss": -7.149640083312988, "global_step": 175206, "epoch": 4171} {"train_loss": -6.994805812835693, "global_step": 175207, "epoch": 4171} {"train_loss": -7.143465042114258, "global_step": 175208, "epoch": 4171} {"train_loss": -7.179192543029785, "global_step": 175209, "epoch": 4171} {"train_loss": -7.0804033279418945, "global_step": 175210, "epoch": 4171} {"train_loss": -7.1122822761535645, "global_step": 175211, "epoch": 4171} {"train_loss": -7.042049407958984, "global_step": 175212, "epoch": 4171} {"train_loss": -7.039774417877197, "global_step": 175213, "epoch": 4171} {"train_loss": -7.078188896179199, "global_step": 175214, "epoch": 4171} {"train_loss": -6.974888324737549, "global_step": 175215, "epoch": 4171} {"train_loss": -7.0518083572387695, "global_step": 175216, "epoch": 4171} {"train_loss": -7.119976997375488, "global_step": 175217, "epoch": 4171} {"train_loss": -7.104447841644287, "global_step": 175218, "epoch": 4171} {"train_loss": -6.972539901733398, "global_step": 175219, "epoch": 4171} {"train_loss": -7.112949371337891, "global_step": 175220, "epoch": 4171} {"train_loss": -7.005701065063477, "global_step": 175221, "epoch": 4171} {"train_loss": -6.949967861175537, "global_step": 175222, "epoch": 4171} {"train_loss": -7.096084742319016, "global_step": 175223, "epoch": 4171, "val_loss": 80174.90625} {"train_loss": -7.031573295593262, "global_step": 175224, "epoch": 4172} {"train_loss": -7.005824565887451, "global_step": 175225, "epoch": 4172} {"train_loss": -7.08935546875, "global_step": 175226, "epoch": 4172} {"train_loss": -6.882033348083496, "global_step": 175227, "epoch": 4172} {"train_loss": -7.105644226074219, "global_step": 175228, "epoch": 4172} {"train_loss": -7.135278701782227, "global_step": 175229, "epoch": 4172} {"train_loss": -7.106388568878174, "global_step": 175230, "epoch": 4172} {"train_loss": -7.158849716186523, "global_step": 175231, "epoch": 4172} {"train_loss": -7.074085235595703, "global_step": 175232, "epoch": 4172} {"train_loss": -7.191831588745117, "global_step": 175233, "epoch": 4172} {"train_loss": -7.1710734367370605, "global_step": 175234, "epoch": 4172} {"train_loss": -7.10820198059082, "global_step": 175235, "epoch": 4172} {"train_loss": -7.179134368896484, "global_step": 175236, "epoch": 4172} {"train_loss": -7.152425765991211, "global_step": 175237, "epoch": 4172} {"train_loss": -7.08543062210083, "global_step": 175238, "epoch": 4172} {"train_loss": -7.129509925842285, "global_step": 175239, "epoch": 4172} {"train_loss": -7.10324764251709, "global_step": 175240, "epoch": 4172} {"train_loss": -7.146146774291992, "global_step": 175241, "epoch": 4172} {"train_loss": -7.059032440185547, "global_step": 175242, "epoch": 4172} {"train_loss": -7.157724380493164, "global_step": 175243, "epoch": 4172} {"train_loss": -7.086851119995117, "global_step": 175244, "epoch": 4172} {"train_loss": -7.028306007385254, "global_step": 175245, "epoch": 4172} {"train_loss": -7.109461784362793, "global_step": 175246, "epoch": 4172} {"train_loss": -7.099632740020752, "global_step": 175247, "epoch": 4172} {"train_loss": -7.139246940612793, "global_step": 175248, "epoch": 4172} {"train_loss": -7.120476722717285, "global_step": 175249, "epoch": 4172} {"train_loss": -6.881159782409668, "global_step": 175250, "epoch": 4172} {"train_loss": -7.115623950958252, "global_step": 175251, "epoch": 4172} {"train_loss": -7.0951313972473145, "global_step": 175252, "epoch": 4172} {"train_loss": -7.036746025085449, "global_step": 175253, "epoch": 4172} {"train_loss": -7.105203628540039, "global_step": 175254, "epoch": 4172} {"train_loss": -7.072813034057617, "global_step": 175255, "epoch": 4172} {"train_loss": -7.155812740325928, "global_step": 175256, "epoch": 4172} {"train_loss": -7.113926410675049, "global_step": 175257, "epoch": 4172} {"train_loss": -7.1511993408203125, "global_step": 175258, "epoch": 4172} {"train_loss": -7.088255882263184, "global_step": 175259, "epoch": 4172} {"train_loss": -7.040707111358643, "global_step": 175260, "epoch": 4172} {"train_loss": -7.137224197387695, "global_step": 175261, "epoch": 4172} {"train_loss": -7.07684326171875, "global_step": 175262, "epoch": 4172} {"train_loss": -6.926264762878418, "global_step": 175263, "epoch": 4172} {"train_loss": -7.0829315185546875, "global_step": 175264, "epoch": 4172} {"train_loss": -7.092861572901408, "global_step": 175265, "epoch": 4172, "val_loss": 80213.4609375} {"train_loss": -6.928614139556885, "global_step": 175266, "epoch": 4173} {"train_loss": -7.08139705657959, "global_step": 175267, "epoch": 4173} {"train_loss": -7.0761566162109375, "global_step": 175268, "epoch": 4173} {"train_loss": -6.938977241516113, "global_step": 175269, "epoch": 4173} {"train_loss": -6.883566856384277, "global_step": 175270, "epoch": 4173} {"train_loss": -7.010784149169922, "global_step": 175271, "epoch": 4173} {"train_loss": -7.106949806213379, "global_step": 175272, "epoch": 4173} {"train_loss": -6.958120822906494, "global_step": 175273, "epoch": 4173} {"train_loss": -7.125000953674316, "global_step": 175274, "epoch": 4173} {"train_loss": -6.90875244140625, "global_step": 175275, "epoch": 4173} {"train_loss": -6.848146438598633, "global_step": 175276, "epoch": 4173} {"train_loss": -6.948586463928223, "global_step": 175277, "epoch": 4173} {"train_loss": -6.973982334136963, "global_step": 175278, "epoch": 4173} {"train_loss": -7.000842094421387, "global_step": 175279, "epoch": 4173} {"train_loss": -6.920109748840332, "global_step": 175280, "epoch": 4173} {"train_loss": -6.961417198181152, "global_step": 175281, "epoch": 4173} {"train_loss": -7.008222579956055, "global_step": 175282, "epoch": 4173} {"train_loss": -7.079531669616699, "global_step": 175283, "epoch": 4173} {"train_loss": -7.021184921264648, "global_step": 175284, "epoch": 4173} {"train_loss": -7.024646759033203, "global_step": 175285, "epoch": 4173} {"train_loss": -6.9923858642578125, "global_step": 175286, "epoch": 4173} {"train_loss": -7.060239791870117, "global_step": 175287, "epoch": 4173} {"train_loss": -7.057004928588867, "global_step": 175288, "epoch": 4173} {"train_loss": -6.925705909729004, "global_step": 175289, "epoch": 4173} {"train_loss": -7.011094093322754, "global_step": 175290, "epoch": 4173} {"train_loss": -7.090798854827881, "global_step": 175291, "epoch": 4173} {"train_loss": -7.063354969024658, "global_step": 175292, "epoch": 4173} {"train_loss": -7.048453330993652, "global_step": 175293, "epoch": 4173} {"train_loss": -7.01703405380249, "global_step": 175294, "epoch": 4173} {"train_loss": -6.993826389312744, "global_step": 175295, "epoch": 4173} {"train_loss": -7.082560062408447, "global_step": 175296, "epoch": 4173} {"train_loss": -6.955597400665283, "global_step": 175297, "epoch": 4173} {"train_loss": -7.091333389282227, "global_step": 175298, "epoch": 4173} {"train_loss": -6.997641563415527, "global_step": 175299, "epoch": 4173} {"train_loss": -7.0540008544921875, "global_step": 175300, "epoch": 4173} {"train_loss": -7.125652313232422, "global_step": 175301, "epoch": 4173} {"train_loss": -6.9860639572143555, "global_step": 175302, "epoch": 4173} {"train_loss": -7.196727275848389, "global_step": 175303, "epoch": 4173} {"train_loss": -6.917596340179443, "global_step": 175304, "epoch": 4173} {"train_loss": -6.9295830726623535, "global_step": 175305, "epoch": 4173} {"train_loss": -7.104138374328613, "global_step": 175306, "epoch": 4173} {"train_loss": -7.011248406909761, "global_step": 175307, "epoch": 4173, "val_loss": 80124.8125} {"train_loss": -7.108170509338379, "global_step": 175308, "epoch": 4174} {"train_loss": -7.039542198181152, "global_step": 175309, "epoch": 4174} {"train_loss": -6.894624710083008, "global_step": 175310, "epoch": 4174} {"train_loss": -6.994142055511475, "global_step": 175311, "epoch": 4174} {"train_loss": -7.102056503295898, "global_step": 175312, "epoch": 4174} {"train_loss": -7.034355640411377, "global_step": 175313, "epoch": 4174} {"train_loss": -6.961580753326416, "global_step": 175314, "epoch": 4174} {"train_loss": -7.155965328216553, "global_step": 175315, "epoch": 4174} {"train_loss": -7.063507080078125, "global_step": 175316, "epoch": 4174} {"train_loss": -7.082834243774414, "global_step": 175317, "epoch": 4174} {"train_loss": -7.079806327819824, "global_step": 175318, "epoch": 4174} {"train_loss": -7.192440032958984, "global_step": 175319, "epoch": 4174} {"train_loss": -7.033581256866455, "global_step": 175320, "epoch": 4174} {"train_loss": -7.147223472595215, "global_step": 175321, "epoch": 4174} {"train_loss": -7.128493309020996, "global_step": 175322, "epoch": 4174} {"train_loss": -7.065033912658691, "global_step": 175323, "epoch": 4174} {"train_loss": -7.008003234863281, "global_step": 175324, "epoch": 4174} {"train_loss": -7.075196266174316, "global_step": 175325, "epoch": 4174} {"train_loss": -7.104517936706543, "global_step": 175326, "epoch": 4174} {"train_loss": -7.096330642700195, "global_step": 175327, "epoch": 4174} {"train_loss": -6.982504844665527, "global_step": 175328, "epoch": 4174} {"train_loss": -7.184427261352539, "global_step": 175329, "epoch": 4174} {"train_loss": -7.080209732055664, "global_step": 175330, "epoch": 4174} {"train_loss": -7.0855560302734375, "global_step": 175331, "epoch": 4174} {"train_loss": -7.098702907562256, "global_step": 175332, "epoch": 4174} {"train_loss": -7.174559116363525, "global_step": 175333, "epoch": 4174} {"train_loss": -7.076192855834961, "global_step": 175334, "epoch": 4174} {"train_loss": -7.091334342956543, "global_step": 175335, "epoch": 4174} {"train_loss": -6.946453094482422, "global_step": 175336, "epoch": 4174} {"train_loss": -6.985498905181885, "global_step": 175337, "epoch": 4174} {"train_loss": -7.101525783538818, "global_step": 175338, "epoch": 4174} {"train_loss": -7.000248432159424, "global_step": 175339, "epoch": 4174} {"train_loss": -7.149417400360107, "global_step": 175340, "epoch": 4174} {"train_loss": -7.018918991088867, "global_step": 175341, "epoch": 4174} {"train_loss": -7.228825569152832, "global_step": 175342, "epoch": 4174} {"train_loss": -6.967957019805908, "global_step": 175343, "epoch": 4174} {"train_loss": -7.1521477699279785, "global_step": 175344, "epoch": 4174} {"train_loss": -7.087801933288574, "global_step": 175345, "epoch": 4174} {"train_loss": -7.153461456298828, "global_step": 175346, "epoch": 4174} {"train_loss": -7.002936363220215, "global_step": 175347, "epoch": 4174} {"train_loss": -7.0010666847229, "global_step": 175348, "epoch": 4174} {"train_loss": -7.072052955627441, "global_step": 175349, "epoch": 4174, "val_loss": 80118.4921875} {"train_loss": -7.147472381591797, "global_step": 175350, "epoch": 4175} {"train_loss": -7.005838394165039, "global_step": 175351, "epoch": 4175} {"train_loss": -7.065685272216797, "global_step": 175352, "epoch": 4175} {"train_loss": -7.01741886138916, "global_step": 175353, "epoch": 4175} {"train_loss": -7.014520645141602, "global_step": 175354, "epoch": 4175} {"train_loss": -7.060768127441406, "global_step": 175355, "epoch": 4175} {"train_loss": -7.056004524230957, "global_step": 175356, "epoch": 4175} {"train_loss": -7.168932914733887, "global_step": 175357, "epoch": 4175} {"train_loss": -7.017604351043701, "global_step": 175358, "epoch": 4175} {"train_loss": -7.10605525970459, "global_step": 175359, "epoch": 4175} {"train_loss": -7.106505393981934, "global_step": 175360, "epoch": 4175} {"train_loss": -7.123400688171387, "global_step": 175361, "epoch": 4175} {"train_loss": -7.053299903869629, "global_step": 175362, "epoch": 4175} {"train_loss": -7.142332077026367, "global_step": 175363, "epoch": 4175} {"train_loss": -7.100153923034668, "global_step": 175364, "epoch": 4175} {"train_loss": -7.123937606811523, "global_step": 175365, "epoch": 4175} {"train_loss": -7.110300064086914, "global_step": 175366, "epoch": 4175} {"train_loss": -7.164937496185303, "global_step": 175367, "epoch": 4175} {"train_loss": -7.023862361907959, "global_step": 175368, "epoch": 4175} {"train_loss": -6.943637847900391, "global_step": 175369, "epoch": 4175} {"train_loss": -7.091672897338867, "global_step": 175370, "epoch": 4175} {"train_loss": -7.131016731262207, "global_step": 175371, "epoch": 4175} {"train_loss": -7.197182655334473, "global_step": 175372, "epoch": 4175} {"train_loss": -7.142792701721191, "global_step": 175373, "epoch": 4175} {"train_loss": -7.171950817108154, "global_step": 175374, "epoch": 4175} {"train_loss": -7.111136436462402, "global_step": 175375, "epoch": 4175} {"train_loss": -7.25844669342041, "global_step": 175376, "epoch": 4175} {"train_loss": -7.0463056564331055, "global_step": 175377, "epoch": 4175} {"train_loss": -7.140774250030518, "global_step": 175378, "epoch": 4175} {"train_loss": -7.072666168212891, "global_step": 175379, "epoch": 4175} {"train_loss": -7.017329216003418, "global_step": 175380, "epoch": 4175} {"train_loss": -7.033298492431641, "global_step": 175381, "epoch": 4175} {"train_loss": -7.155030250549316, "global_step": 175382, "epoch": 4175} {"train_loss": -7.125768661499023, "global_step": 175383, "epoch": 4175} {"train_loss": -7.146111488342285, "global_step": 175384, "epoch": 4175} {"train_loss": -7.1287994384765625, "global_step": 175385, "epoch": 4175} {"train_loss": -7.138359546661377, "global_step": 175386, "epoch": 4175} {"train_loss": -7.075879096984863, "global_step": 175387, "epoch": 4175} {"train_loss": -7.196104049682617, "global_step": 175388, "epoch": 4175} {"train_loss": -7.173609733581543, "global_step": 175389, "epoch": 4175} {"train_loss": -7.086832046508789, "global_step": 175390, "epoch": 4175} {"train_loss": -7.100680124192011, "global_step": 175391, "epoch": 4175, "val_loss": 79867.8984375} {"train_loss": -7.07575798034668, "global_step": 175392, "epoch": 4176} {"train_loss": -7.082627296447754, "global_step": 175393, "epoch": 4176} {"train_loss": -7.174954414367676, "global_step": 175394, "epoch": 4176} {"train_loss": -7.032111167907715, "global_step": 175395, "epoch": 4176} {"train_loss": -7.0826416015625, "global_step": 175396, "epoch": 4176} {"train_loss": -7.015545845031738, "global_step": 175397, "epoch": 4176} {"train_loss": -7.00835657119751, "global_step": 175398, "epoch": 4176} {"train_loss": -7.037179946899414, "global_step": 175399, "epoch": 4176} {"train_loss": -7.090584754943848, "global_step": 175400, "epoch": 4176} {"train_loss": -7.0582685470581055, "global_step": 175401, "epoch": 4176} {"train_loss": -6.929895401000977, "global_step": 175402, "epoch": 4176} {"train_loss": -6.949969291687012, "global_step": 175403, "epoch": 4176} {"train_loss": -6.9272661209106445, "global_step": 175404, "epoch": 4176} {"train_loss": -7.088254928588867, "global_step": 175405, "epoch": 4176} {"train_loss": -6.947593688964844, "global_step": 175406, "epoch": 4176} {"train_loss": -7.092457294464111, "global_step": 175407, "epoch": 4176} {"train_loss": -6.73582649230957, "global_step": 175408, "epoch": 4176} {"train_loss": -6.987381935119629, "global_step": 175409, "epoch": 4176} {"train_loss": -7.0336456298828125, "global_step": 175410, "epoch": 4176} {"train_loss": -6.852084159851074, "global_step": 175411, "epoch": 4176} {"train_loss": -7.044938087463379, "global_step": 175412, "epoch": 4176} {"train_loss": -6.877873420715332, "global_step": 175413, "epoch": 4176} {"train_loss": -7.036823272705078, "global_step": 175414, "epoch": 4176} {"train_loss": -6.862305641174316, "global_step": 175415, "epoch": 4176} {"train_loss": -6.928974151611328, "global_step": 175416, "epoch": 4176} {"train_loss": -6.958869934082031, "global_step": 175417, "epoch": 4176} {"train_loss": -6.97990608215332, "global_step": 175418, "epoch": 4176} {"train_loss": -7.085597038269043, "global_step": 175419, "epoch": 4176} {"train_loss": -7.044157981872559, "global_step": 175420, "epoch": 4176} {"train_loss": -7.047539234161377, "global_step": 175421, "epoch": 4176} {"train_loss": -7.005640506744385, "global_step": 175422, "epoch": 4176} {"train_loss": -6.91644287109375, "global_step": 175423, "epoch": 4176} {"train_loss": -7.036220550537109, "global_step": 175424, "epoch": 4176} {"train_loss": -6.997633934020996, "global_step": 175425, "epoch": 4176} {"train_loss": -6.98244571685791, "global_step": 175426, "epoch": 4176} {"train_loss": -7.135631561279297, "global_step": 175427, "epoch": 4176} {"train_loss": -7.070642948150635, "global_step": 175428, "epoch": 4176} {"train_loss": -7.0944061279296875, "global_step": 175429, "epoch": 4176} {"train_loss": -7.052443027496338, "global_step": 175430, "epoch": 4176} {"train_loss": -7.03443717956543, "global_step": 175431, "epoch": 4176} {"train_loss": -6.940202713012695, "global_step": 175432, "epoch": 4176} {"train_loss": -7.010259605589367, "global_step": 175433, "epoch": 4176, "val_loss": 80135.234375} {"train_loss": -6.9757795333862305, "global_step": 175434, "epoch": 4177} {"train_loss": -6.958054065704346, "global_step": 175435, "epoch": 4177} {"train_loss": -7.103236198425293, "global_step": 175436, "epoch": 4177} {"train_loss": -7.1308488845825195, "global_step": 175437, "epoch": 4177} {"train_loss": -7.050030708312988, "global_step": 175438, "epoch": 4177} {"train_loss": -7.118856430053711, "global_step": 175439, "epoch": 4177} {"train_loss": -7.103551864624023, "global_step": 175440, "epoch": 4177} {"train_loss": -7.071081638336182, "global_step": 175441, "epoch": 4177} {"train_loss": -7.069805145263672, "global_step": 175442, "epoch": 4177} {"train_loss": -7.261956214904785, "global_step": 175443, "epoch": 4177} {"train_loss": -7.175358772277832, "global_step": 175444, "epoch": 4177} {"train_loss": -7.094024181365967, "global_step": 175445, "epoch": 4177} {"train_loss": -7.052254676818848, "global_step": 175446, "epoch": 4177} {"train_loss": -7.100569248199463, "global_step": 175447, "epoch": 4177} {"train_loss": -7.121548652648926, "global_step": 175448, "epoch": 4177} {"train_loss": -7.204516410827637, "global_step": 175449, "epoch": 4177} {"train_loss": -7.167169570922852, "global_step": 175450, "epoch": 4177} {"train_loss": -7.206587791442871, "global_step": 175451, "epoch": 4177} {"train_loss": -7.071406364440918, "global_step": 175452, "epoch": 4177} {"train_loss": -7.126310348510742, "global_step": 175453, "epoch": 4177} {"train_loss": -7.147421836853027, "global_step": 175454, "epoch": 4177} {"train_loss": -7.156018257141113, "global_step": 175455, "epoch": 4177} {"train_loss": -7.214353561401367, "global_step": 175456, "epoch": 4177} {"train_loss": -7.080702304840088, "global_step": 175457, "epoch": 4177} {"train_loss": -7.073705673217773, "global_step": 175458, "epoch": 4177} {"train_loss": -7.1113715171813965, "global_step": 175459, "epoch": 4177} {"train_loss": -7.091348171234131, "global_step": 175460, "epoch": 4177} {"train_loss": -7.11033296585083, "global_step": 175461, "epoch": 4177} {"train_loss": -6.985952854156494, "global_step": 175462, "epoch": 4177} {"train_loss": -7.015830993652344, "global_step": 175463, "epoch": 4177} {"train_loss": -7.093776226043701, "global_step": 175464, "epoch": 4177} {"train_loss": -6.958853721618652, "global_step": 175465, "epoch": 4177} {"train_loss": -7.034666061401367, "global_step": 175466, "epoch": 4177} {"train_loss": -7.069941520690918, "global_step": 175467, "epoch": 4177} {"train_loss": -7.196152687072754, "global_step": 175468, "epoch": 4177} {"train_loss": -6.950777530670166, "global_step": 175469, "epoch": 4177} {"train_loss": -7.080374240875244, "global_step": 175470, "epoch": 4177} {"train_loss": -7.063843727111816, "global_step": 175471, "epoch": 4177} {"train_loss": -7.095765113830566, "global_step": 175472, "epoch": 4177} {"train_loss": -7.019957065582275, "global_step": 175473, "epoch": 4177} {"train_loss": -7.128463268280029, "global_step": 175474, "epoch": 4177} {"train_loss": -7.094506377265567, "global_step": 175475, "epoch": 4177, "val_loss": 80103.390625} {"train_loss": -7.00064754486084, "global_step": 175476, "epoch": 4178} {"train_loss": -7.022128582000732, "global_step": 175477, "epoch": 4178} {"train_loss": -7.158358097076416, "global_step": 175478, "epoch": 4178} {"train_loss": -7.102283477783203, "global_step": 175479, "epoch": 4178} {"train_loss": -7.167999267578125, "global_step": 175480, "epoch": 4178} {"train_loss": -7.063275337219238, "global_step": 175481, "epoch": 4178} {"train_loss": -7.215723037719727, "global_step": 175482, "epoch": 4178} {"train_loss": -7.096132755279541, "global_step": 175483, "epoch": 4178} {"train_loss": -7.094690322875977, "global_step": 175484, "epoch": 4178} {"train_loss": -7.017999649047852, "global_step": 175485, "epoch": 4178} {"train_loss": -7.141838550567627, "global_step": 175486, "epoch": 4178} {"train_loss": -7.119390487670898, "global_step": 175487, "epoch": 4178} {"train_loss": -7.096486568450928, "global_step": 175488, "epoch": 4178} {"train_loss": -7.168796539306641, "global_step": 175489, "epoch": 4178} {"train_loss": -7.207742691040039, "global_step": 175490, "epoch": 4178} {"train_loss": -7.12070369720459, "global_step": 175491, "epoch": 4178} {"train_loss": -7.108050346374512, "global_step": 175492, "epoch": 4178} {"train_loss": -7.142694473266602, "global_step": 175493, "epoch": 4178} {"train_loss": -7.031896114349365, "global_step": 175494, "epoch": 4178} {"train_loss": -7.06923770904541, "global_step": 175495, "epoch": 4178} {"train_loss": -7.100866794586182, "global_step": 175496, "epoch": 4178} {"train_loss": -7.259867191314697, "global_step": 175497, "epoch": 4178} {"train_loss": -7.113620758056641, "global_step": 175498, "epoch": 4178} {"train_loss": -7.125836372375488, "global_step": 175499, "epoch": 4178} {"train_loss": -7.143642425537109, "global_step": 175500, "epoch": 4178} {"train_loss": -7.180599212646484, "global_step": 175501, "epoch": 4178} {"train_loss": -6.937664985656738, "global_step": 175502, "epoch": 4178} {"train_loss": -7.101417541503906, "global_step": 175503, "epoch": 4178} {"train_loss": -7.054531097412109, "global_step": 175504, "epoch": 4178} {"train_loss": -7.076757907867432, "global_step": 175505, "epoch": 4178} {"train_loss": -7.095522880554199, "global_step": 175506, "epoch": 4178} {"train_loss": -7.041311264038086, "global_step": 175507, "epoch": 4178} {"train_loss": -7.031015396118164, "global_step": 175508, "epoch": 4178} {"train_loss": -7.05474853515625, "global_step": 175509, "epoch": 4178} {"train_loss": -7.139038562774658, "global_step": 175510, "epoch": 4178} {"train_loss": -7.074557304382324, "global_step": 175511, "epoch": 4178} {"train_loss": -7.142193794250488, "global_step": 175512, "epoch": 4178} {"train_loss": -7.2342915534973145, "global_step": 175513, "epoch": 4178} {"train_loss": -7.09982442855835, "global_step": 175514, "epoch": 4178} {"train_loss": -7.145750045776367, "global_step": 175515, "epoch": 4178} {"train_loss": -7.180352210998535, "global_step": 175516, "epoch": 4178} {"train_loss": -7.1088102885655, "global_step": 175517, "epoch": 4178, "val_loss": 80141.0859375} {"train_loss": -7.133408069610596, "global_step": 175518, "epoch": 4179} {"train_loss": -7.049293518066406, "global_step": 175519, "epoch": 4179} {"train_loss": -6.968886375427246, "global_step": 175520, "epoch": 4179} {"train_loss": -7.087486267089844, "global_step": 175521, "epoch": 4179} {"train_loss": -6.996244430541992, "global_step": 175522, "epoch": 4179} {"train_loss": -7.115113258361816, "global_step": 175523, "epoch": 4179} {"train_loss": -7.055933952331543, "global_step": 175524, "epoch": 4179} {"train_loss": -7.0789289474487305, "global_step": 175525, "epoch": 4179} {"train_loss": -7.04667329788208, "global_step": 175526, "epoch": 4179} {"train_loss": -7.163607597351074, "global_step": 175527, "epoch": 4179} {"train_loss": -7.088589668273926, "global_step": 175528, "epoch": 4179} {"train_loss": -7.1881608963012695, "global_step": 175529, "epoch": 4179} {"train_loss": -7.057493686676025, "global_step": 175530, "epoch": 4179} {"train_loss": -7.147555351257324, "global_step": 175531, "epoch": 4179} {"train_loss": -6.974596977233887, "global_step": 175532, "epoch": 4179} {"train_loss": -7.076051712036133, "global_step": 175533, "epoch": 4179} {"train_loss": -7.114803791046143, "global_step": 175534, "epoch": 4179} {"train_loss": -7.019620895385742, "global_step": 175535, "epoch": 4179} {"train_loss": -7.246189594268799, "global_step": 175536, "epoch": 4179} {"train_loss": -6.984770774841309, "global_step": 175537, "epoch": 4179} {"train_loss": -6.976357460021973, "global_step": 175538, "epoch": 4179} {"train_loss": -7.0218048095703125, "global_step": 175539, "epoch": 4179} {"train_loss": -7.095284461975098, "global_step": 175540, "epoch": 4179} {"train_loss": -7.107929229736328, "global_step": 175541, "epoch": 4179} {"train_loss": -7.145376205444336, "global_step": 175542, "epoch": 4179} {"train_loss": -7.164217948913574, "global_step": 175543, "epoch": 4179} {"train_loss": -7.089527606964111, "global_step": 175544, "epoch": 4179} {"train_loss": -7.177482604980469, "global_step": 175545, "epoch": 4179} {"train_loss": -7.1818952560424805, "global_step": 175546, "epoch": 4179} {"train_loss": -7.166929244995117, "global_step": 175547, "epoch": 4179} {"train_loss": -7.019979476928711, "global_step": 175548, "epoch": 4179} {"train_loss": -7.182736873626709, "global_step": 175549, "epoch": 4179} {"train_loss": -7.1296000480651855, "global_step": 175550, "epoch": 4179} {"train_loss": -7.126394271850586, "global_step": 175551, "epoch": 4179} {"train_loss": -7.042068958282471, "global_step": 175552, "epoch": 4179} {"train_loss": -7.1448187828063965, "global_step": 175553, "epoch": 4179} {"train_loss": -7.175466060638428, "global_step": 175554, "epoch": 4179} {"train_loss": -7.152044296264648, "global_step": 175555, "epoch": 4179} {"train_loss": -7.118487358093262, "global_step": 175556, "epoch": 4179} {"train_loss": -7.188262462615967, "global_step": 175557, "epoch": 4179} {"train_loss": -7.1408233642578125, "global_step": 175558, "epoch": 4179} {"train_loss": -7.104056074505761, "global_step": 175559, "epoch": 4179, "val_loss": 80152.5} {"train_loss": -7.141847133636475, "global_step": 175560, "epoch": 4180} {"train_loss": -7.178088188171387, "global_step": 175561, "epoch": 4180} {"train_loss": -7.221047401428223, "global_step": 175562, "epoch": 4180} {"train_loss": -7.236580848693848, "global_step": 175563, "epoch": 4180} {"train_loss": -7.189788818359375, "global_step": 175564, "epoch": 4180} {"train_loss": -7.143866539001465, "global_step": 175565, "epoch": 4180} {"train_loss": -7.17250919342041, "global_step": 175566, "epoch": 4180} {"train_loss": -7.094794273376465, "global_step": 175567, "epoch": 4180} {"train_loss": -6.991238594055176, "global_step": 175568, "epoch": 4180} {"train_loss": -7.128091335296631, "global_step": 175569, "epoch": 4180} {"train_loss": -7.233846187591553, "global_step": 175570, "epoch": 4180} {"train_loss": -7.125277519226074, "global_step": 175571, "epoch": 4180} {"train_loss": -7.188735008239746, "global_step": 175572, "epoch": 4180} {"train_loss": -7.037391662597656, "global_step": 175573, "epoch": 4180} {"train_loss": -7.089877128601074, "global_step": 175574, "epoch": 4180} {"train_loss": -6.971355438232422, "global_step": 175575, "epoch": 4180} {"train_loss": -7.1779937744140625, "global_step": 175576, "epoch": 4180} {"train_loss": -7.059257507324219, "global_step": 175577, "epoch": 4180} {"train_loss": -6.98306941986084, "global_step": 175578, "epoch": 4180} {"train_loss": -7.085525989532471, "global_step": 175579, "epoch": 4180} {"train_loss": -7.098212718963623, "global_step": 175580, "epoch": 4180} {"train_loss": -7.112631797790527, "global_step": 175581, "epoch": 4180} {"train_loss": -7.102974891662598, "global_step": 175582, "epoch": 4180} {"train_loss": -7.085269927978516, "global_step": 175583, "epoch": 4180} {"train_loss": -7.025810241699219, "global_step": 175584, "epoch": 4180} {"train_loss": -7.024178504943848, "global_step": 175585, "epoch": 4180} {"train_loss": -7.072085380554199, "global_step": 175586, "epoch": 4180} {"train_loss": -7.119144439697266, "global_step": 175587, "epoch": 4180} {"train_loss": -7.100901126861572, "global_step": 175588, "epoch": 4180} {"train_loss": -6.9778947830200195, "global_step": 175589, "epoch": 4180} {"train_loss": -7.101616382598877, "global_step": 175590, "epoch": 4180} {"train_loss": -6.949965476989746, "global_step": 175591, "epoch": 4180} {"train_loss": -6.921230316162109, "global_step": 175592, "epoch": 4180} {"train_loss": -6.8814191818237305, "global_step": 175593, "epoch": 4180} {"train_loss": -6.8161211013793945, "global_step": 175594, "epoch": 4180} {"train_loss": -6.931902885437012, "global_step": 175595, "epoch": 4180} {"train_loss": -6.960636138916016, "global_step": 175596, "epoch": 4180} {"train_loss": -6.945550918579102, "global_step": 175597, "epoch": 4180} {"train_loss": -7.074696063995361, "global_step": 175598, "epoch": 4180} {"train_loss": -7.040028095245361, "global_step": 175599, "epoch": 4180} {"train_loss": -7.0531005859375, "global_step": 175600, "epoch": 4180} {"train_loss": -7.063265357698713, "global_step": 175601, "epoch": 4180, "val_loss": 80139.3984375} {"train_loss": -7.130135536193848, "global_step": 175602, "epoch": 4181} {"train_loss": -7.069579601287842, "global_step": 175603, "epoch": 4181} {"train_loss": -6.885879039764404, "global_step": 175604, "epoch": 4181} {"train_loss": -7.100879192352295, "global_step": 175605, "epoch": 4181} {"train_loss": -6.98206901550293, "global_step": 175606, "epoch": 4181} {"train_loss": -7.008726119995117, "global_step": 175607, "epoch": 4181} {"train_loss": -7.08892297744751, "global_step": 175608, "epoch": 4181} {"train_loss": -7.114951133728027, "global_step": 175609, "epoch": 4181} {"train_loss": -7.037117004394531, "global_step": 175610, "epoch": 4181} {"train_loss": -7.061560153961182, "global_step": 175611, "epoch": 4181} {"train_loss": -7.072074890136719, "global_step": 175612, "epoch": 4181} {"train_loss": -7.121084213256836, "global_step": 175613, "epoch": 4181} {"train_loss": -7.077479362487793, "global_step": 175614, "epoch": 4181} {"train_loss": -7.0944719314575195, "global_step": 175615, "epoch": 4181} {"train_loss": -7.132043361663818, "global_step": 175616, "epoch": 4181} {"train_loss": -7.165863037109375, "global_step": 175617, "epoch": 4181} {"train_loss": -7.047637939453125, "global_step": 175618, "epoch": 4181} {"train_loss": -7.005738735198975, "global_step": 175619, "epoch": 4181} {"train_loss": -7.129559516906738, "global_step": 175620, "epoch": 4181} {"train_loss": -7.043293476104736, "global_step": 175621, "epoch": 4181} {"train_loss": -7.130331516265869, "global_step": 175622, "epoch": 4181} {"train_loss": -7.1817827224731445, "global_step": 175623, "epoch": 4181} {"train_loss": -7.0500807762146, "global_step": 175624, "epoch": 4181} {"train_loss": -7.108521938323975, "global_step": 175625, "epoch": 4181} {"train_loss": -7.1542158126831055, "global_step": 175626, "epoch": 4181} {"train_loss": -7.037025451660156, "global_step": 175627, "epoch": 4181} {"train_loss": -7.105499267578125, "global_step": 175628, "epoch": 4181} {"train_loss": -7.051870822906494, "global_step": 175629, "epoch": 4181} {"train_loss": -7.089956283569336, "global_step": 175630, "epoch": 4181} {"train_loss": -7.169617652893066, "global_step": 175631, "epoch": 4181} {"train_loss": -7.113006591796875, "global_step": 175632, "epoch": 4181} {"train_loss": -7.0038299560546875, "global_step": 175633, "epoch": 4181} {"train_loss": -7.07374906539917, "global_step": 175634, "epoch": 4181} {"train_loss": -6.99453067779541, "global_step": 175635, "epoch": 4181} {"train_loss": -7.027716636657715, "global_step": 175636, "epoch": 4181} {"train_loss": -7.038384437561035, "global_step": 175637, "epoch": 4181} {"train_loss": -6.919447898864746, "global_step": 175638, "epoch": 4181} {"train_loss": -7.176067352294922, "global_step": 175639, "epoch": 4181} {"train_loss": -7.067836761474609, "global_step": 175640, "epoch": 4181} {"train_loss": -7.084847450256348, "global_step": 175641, "epoch": 4181} {"train_loss": -7.161983489990234, "global_step": 175642, "epoch": 4181} {"train_loss": -7.0755563009352915, "global_step": 175643, "epoch": 4181, "val_loss": 80062.7578125} {"train_loss": -7.094578742980957, "global_step": 175644, "epoch": 4182} {"train_loss": -7.222814559936523, "global_step": 175645, "epoch": 4182} {"train_loss": -7.169784069061279, "global_step": 175646, "epoch": 4182} {"train_loss": -7.034367561340332, "global_step": 175647, "epoch": 4182} {"train_loss": -7.1690568923950195, "global_step": 175648, "epoch": 4182} {"train_loss": -7.147090911865234, "global_step": 175649, "epoch": 4182} {"train_loss": -7.144059658050537, "global_step": 175650, "epoch": 4182} {"train_loss": -7.133606910705566, "global_step": 175651, "epoch": 4182} {"train_loss": -7.136126518249512, "global_step": 175652, "epoch": 4182} {"train_loss": -7.095179080963135, "global_step": 175653, "epoch": 4182} {"train_loss": -7.179500579833984, "global_step": 175654, "epoch": 4182} {"train_loss": -7.1582465171813965, "global_step": 175655, "epoch": 4182} {"train_loss": -7.1577677726745605, "global_step": 175656, "epoch": 4182} {"train_loss": -7.149865627288818, "global_step": 175657, "epoch": 4182} {"train_loss": -7.1950836181640625, "global_step": 175658, "epoch": 4182} {"train_loss": -7.142465591430664, "global_step": 175659, "epoch": 4182} {"train_loss": -7.117117404937744, "global_step": 175660, "epoch": 4182} {"train_loss": -7.119668960571289, "global_step": 175661, "epoch": 4182} {"train_loss": -7.029519557952881, "global_step": 175662, "epoch": 4182} {"train_loss": -7.205204963684082, "global_step": 175663, "epoch": 4182} {"train_loss": -7.215638160705566, "global_step": 175664, "epoch": 4182} {"train_loss": -7.1465535163879395, "global_step": 175665, "epoch": 4182} {"train_loss": -7.115575313568115, "global_step": 175666, "epoch": 4182} {"train_loss": -7.075847625732422, "global_step": 175667, "epoch": 4182} {"train_loss": -7.097894191741943, "global_step": 175668, "epoch": 4182} {"train_loss": -7.086535453796387, "global_step": 175669, "epoch": 4182} {"train_loss": -7.088076591491699, "global_step": 175670, "epoch": 4182} {"train_loss": -7.106110572814941, "global_step": 175671, "epoch": 4182} {"train_loss": -7.18869686126709, "global_step": 175672, "epoch": 4182} {"train_loss": -7.111164569854736, "global_step": 175673, "epoch": 4182} {"train_loss": -7.129622936248779, "global_step": 175674, "epoch": 4182} {"train_loss": -7.059032440185547, "global_step": 175675, "epoch": 4182} {"train_loss": -7.058753967285156, "global_step": 175676, "epoch": 4182} {"train_loss": -7.037295341491699, "global_step": 175677, "epoch": 4182} {"train_loss": -7.138830184936523, "global_step": 175678, "epoch": 4182} {"train_loss": -7.149883270263672, "global_step": 175679, "epoch": 4182} {"train_loss": -7.114316940307617, "global_step": 175680, "epoch": 4182} {"train_loss": -7.108430862426758, "global_step": 175681, "epoch": 4182} {"train_loss": -7.137383460998535, "global_step": 175682, "epoch": 4182} {"train_loss": -7.208252906799316, "global_step": 175683, "epoch": 4182} {"train_loss": -7.0620245933532715, "global_step": 175684, "epoch": 4182} {"train_loss": -7.1286494845435735, "global_step": 175685, "epoch": 4182, "val_loss": 80281.1796875} {"train_loss": -7.184967994689941, "global_step": 175686, "epoch": 4183} {"train_loss": -7.086024284362793, "global_step": 175687, "epoch": 4183} {"train_loss": -7.1927080154418945, "global_step": 175688, "epoch": 4183} {"train_loss": -7.209980010986328, "global_step": 175689, "epoch": 4183} {"train_loss": -7.141024589538574, "global_step": 175690, "epoch": 4183} {"train_loss": -7.10940408706665, "global_step": 175691, "epoch": 4183} {"train_loss": -7.176211357116699, "global_step": 175692, "epoch": 4183} {"train_loss": -7.155702590942383, "global_step": 175693, "epoch": 4183} {"train_loss": -7.101658821105957, "global_step": 175694, "epoch": 4183} {"train_loss": -7.105774402618408, "global_step": 175695, "epoch": 4183} {"train_loss": -7.131647109985352, "global_step": 175696, "epoch": 4183} {"train_loss": -7.197380065917969, "global_step": 175697, "epoch": 4183} {"train_loss": -7.072772026062012, "global_step": 175698, "epoch": 4183} {"train_loss": -7.213414192199707, "global_step": 175699, "epoch": 4183} {"train_loss": -7.057826995849609, "global_step": 175700, "epoch": 4183} {"train_loss": -7.189587593078613, "global_step": 175701, "epoch": 4183} {"train_loss": -7.053022384643555, "global_step": 175702, "epoch": 4183} {"train_loss": -6.9831132888793945, "global_step": 175703, "epoch": 4183} {"train_loss": -7.042083263397217, "global_step": 175704, "epoch": 4183} {"train_loss": -7.003684997558594, "global_step": 175705, "epoch": 4183} {"train_loss": -6.999940872192383, "global_step": 175706, "epoch": 4183} {"train_loss": -7.023744583129883, "global_step": 175707, "epoch": 4183} {"train_loss": -7.1335954666137695, "global_step": 175708, "epoch": 4183} {"train_loss": -7.081182479858398, "global_step": 175709, "epoch": 4183} {"train_loss": -7.004260063171387, "global_step": 175710, "epoch": 4183} {"train_loss": -7.032279014587402, "global_step": 175711, "epoch": 4183} {"train_loss": -7.0575408935546875, "global_step": 175712, "epoch": 4183} {"train_loss": -7.071490287780762, "global_step": 175713, "epoch": 4183} {"train_loss": -7.0536298751831055, "global_step": 175714, "epoch": 4183} {"train_loss": -6.991401672363281, "global_step": 175715, "epoch": 4183} {"train_loss": -7.069512844085693, "global_step": 175716, "epoch": 4183} {"train_loss": -7.081634044647217, "global_step": 175717, "epoch": 4183} {"train_loss": -7.035148620605469, "global_step": 175718, "epoch": 4183} {"train_loss": -7.150262832641602, "global_step": 175719, "epoch": 4183} {"train_loss": -6.898310661315918, "global_step": 175720, "epoch": 4183} {"train_loss": -7.122419357299805, "global_step": 175721, "epoch": 4183} {"train_loss": -7.062615394592285, "global_step": 175722, "epoch": 4183} {"train_loss": -6.92938232421875, "global_step": 175723, "epoch": 4183} {"train_loss": -7.090368270874023, "global_step": 175724, "epoch": 4183} {"train_loss": -7.187885284423828, "global_step": 175725, "epoch": 4183} {"train_loss": -7.006841659545898, "global_step": 175726, "epoch": 4183} {"train_loss": -7.086181175141108, "global_step": 175727, "epoch": 4183, "val_loss": 80256.5390625} {"train_loss": -6.900879859924316, "global_step": 175728, "epoch": 4184} {"train_loss": -7.071039199829102, "global_step": 175729, "epoch": 4184} {"train_loss": -7.0167236328125, "global_step": 175730, "epoch": 4184} {"train_loss": -6.938056945800781, "global_step": 175731, "epoch": 4184} {"train_loss": -7.0247087478637695, "global_step": 175732, "epoch": 4184} {"train_loss": -6.957856178283691, "global_step": 175733, "epoch": 4184} {"train_loss": -7.021026611328125, "global_step": 175734, "epoch": 4184} {"train_loss": -7.076931953430176, "global_step": 175735, "epoch": 4184} {"train_loss": -7.060758113861084, "global_step": 175736, "epoch": 4184} {"train_loss": -6.930322647094727, "global_step": 175737, "epoch": 4184} {"train_loss": -6.993005752563477, "global_step": 175738, "epoch": 4184} {"train_loss": -6.943475723266602, "global_step": 175739, "epoch": 4184} {"train_loss": -7.039617538452148, "global_step": 175740, "epoch": 4184} {"train_loss": -7.094085216522217, "global_step": 175741, "epoch": 4184} {"train_loss": -7.115600109100342, "global_step": 175742, "epoch": 4184} {"train_loss": -7.084792137145996, "global_step": 175743, "epoch": 4184} {"train_loss": -7.002172946929932, "global_step": 175744, "epoch": 4184} {"train_loss": -6.99123477935791, "global_step": 175745, "epoch": 4184} {"train_loss": -7.011896133422852, "global_step": 175746, "epoch": 4184} {"train_loss": -7.1100873947143555, "global_step": 175747, "epoch": 4184} {"train_loss": -7.002635955810547, "global_step": 175748, "epoch": 4184} {"train_loss": -7.031794548034668, "global_step": 175749, "epoch": 4184} {"train_loss": -7.038297653198242, "global_step": 175750, "epoch": 4184} {"train_loss": -7.044950485229492, "global_step": 175751, "epoch": 4184} {"train_loss": -7.103394031524658, "global_step": 175752, "epoch": 4184} {"train_loss": -7.196223258972168, "global_step": 175753, "epoch": 4184} {"train_loss": -7.076626777648926, "global_step": 175754, "epoch": 4184} {"train_loss": -7.208303451538086, "global_step": 175755, "epoch": 4184} {"train_loss": -7.050805568695068, "global_step": 175756, "epoch": 4184} {"train_loss": -7.161848068237305, "global_step": 175757, "epoch": 4184} {"train_loss": -7.158342361450195, "global_step": 175758, "epoch": 4184} {"train_loss": -7.029687881469727, "global_step": 175759, "epoch": 4184} {"train_loss": -7.156349182128906, "global_step": 175760, "epoch": 4184} {"train_loss": -7.057299613952637, "global_step": 175761, "epoch": 4184} {"train_loss": -6.978042125701904, "global_step": 175762, "epoch": 4184} {"train_loss": -7.11527681350708, "global_step": 175763, "epoch": 4184} {"train_loss": -7.117815017700195, "global_step": 175764, "epoch": 4184} {"train_loss": -7.046000957489014, "global_step": 175765, "epoch": 4184} {"train_loss": -7.121979713439941, "global_step": 175766, "epoch": 4184} {"train_loss": -7.065438270568848, "global_step": 175767, "epoch": 4184} {"train_loss": -7.103237152099609, "global_step": 175768, "epoch": 4184} {"train_loss": -7.055242458979289, "global_step": 175769, "epoch": 4184, "val_loss": 80163.0546875} {"train_loss": -7.056194305419922, "global_step": 175770, "epoch": 4185} {"train_loss": -7.079881191253662, "global_step": 175771, "epoch": 4185} {"train_loss": -7.1113972663879395, "global_step": 175772, "epoch": 4185} {"train_loss": -6.987125396728516, "global_step": 175773, "epoch": 4185} {"train_loss": -7.039546012878418, "global_step": 175774, "epoch": 4185} {"train_loss": -7.062999725341797, "global_step": 175775, "epoch": 4185} {"train_loss": -7.06130838394165, "global_step": 175776, "epoch": 4185} {"train_loss": -7.038100242614746, "global_step": 175777, "epoch": 4185} {"train_loss": -7.110090732574463, "global_step": 175778, "epoch": 4185} {"train_loss": -7.068812847137451, "global_step": 175779, "epoch": 4185} {"train_loss": -7.06920051574707, "global_step": 175780, "epoch": 4185} {"train_loss": -7.067480087280273, "global_step": 175781, "epoch": 4185} {"train_loss": -7.087730884552002, "global_step": 175782, "epoch": 4185} {"train_loss": -7.0829033851623535, "global_step": 175783, "epoch": 4185} {"train_loss": -7.091708183288574, "global_step": 175784, "epoch": 4185} {"train_loss": -7.142343521118164, "global_step": 175785, "epoch": 4185} {"train_loss": -7.006036281585693, "global_step": 175786, "epoch": 4185} {"train_loss": -7.173918724060059, "global_step": 175787, "epoch": 4185} {"train_loss": -7.21766471862793, "global_step": 175788, "epoch": 4185} {"train_loss": -7.238426208496094, "global_step": 175789, "epoch": 4185} {"train_loss": -7.071080207824707, "global_step": 175790, "epoch": 4185} {"train_loss": -7.127568244934082, "global_step": 175791, "epoch": 4185} {"train_loss": -7.123684883117676, "global_step": 175792, "epoch": 4185} {"train_loss": -7.097273349761963, "global_step": 175793, "epoch": 4185} {"train_loss": -7.17235803604126, "global_step": 175794, "epoch": 4185} {"train_loss": -7.10073184967041, "global_step": 175795, "epoch": 4185} {"train_loss": -7.020693778991699, "global_step": 175796, "epoch": 4185} {"train_loss": -7.0023040771484375, "global_step": 175797, "epoch": 4185} {"train_loss": -7.188666343688965, "global_step": 175798, "epoch": 4185} {"train_loss": -7.051673889160156, "global_step": 175799, "epoch": 4185} {"train_loss": -7.0824432373046875, "global_step": 175800, "epoch": 4185} {"train_loss": -7.143280982971191, "global_step": 175801, "epoch": 4185} {"train_loss": -7.084486961364746, "global_step": 175802, "epoch": 4185} {"train_loss": -7.023358345031738, "global_step": 175803, "epoch": 4185} {"train_loss": -7.05569314956665, "global_step": 175804, "epoch": 4185} {"train_loss": -7.062539577484131, "global_step": 175805, "epoch": 4185} {"train_loss": -7.07602071762085, "global_step": 175806, "epoch": 4185} {"train_loss": -7.1201677322387695, "global_step": 175807, "epoch": 4185} {"train_loss": -7.126639366149902, "global_step": 175808, "epoch": 4185} {"train_loss": -6.988984107971191, "global_step": 175809, "epoch": 4185} {"train_loss": -7.0845866203308105, "global_step": 175810, "epoch": 4185} {"train_loss": -7.087782825742449, "global_step": 175811, "epoch": 4185, "val_loss": 80155.484375} {"train_loss": -7.153109550476074, "global_step": 175812, "epoch": 4186} {"train_loss": -7.26207160949707, "global_step": 175813, "epoch": 4186} {"train_loss": -7.124088764190674, "global_step": 175814, "epoch": 4186} {"train_loss": -7.162606239318848, "global_step": 175815, "epoch": 4186} {"train_loss": -7.106212615966797, "global_step": 175816, "epoch": 4186} {"train_loss": -7.220938205718994, "global_step": 175817, "epoch": 4186} {"train_loss": -7.075259208679199, "global_step": 175818, "epoch": 4186} {"train_loss": -7.197736740112305, "global_step": 175819, "epoch": 4186} {"train_loss": -7.007097244262695, "global_step": 175820, "epoch": 4186} {"train_loss": -7.201208591461182, "global_step": 175821, "epoch": 4186} {"train_loss": -7.137603282928467, "global_step": 175822, "epoch": 4186} {"train_loss": -7.09576416015625, "global_step": 175823, "epoch": 4186} {"train_loss": -7.177940368652344, "global_step": 175824, "epoch": 4186} {"train_loss": -7.097009658813477, "global_step": 175825, "epoch": 4186} {"train_loss": -7.083280563354492, "global_step": 175826, "epoch": 4186} {"train_loss": -7.138152122497559, "global_step": 175827, "epoch": 4186} {"train_loss": -7.002301216125488, "global_step": 175828, "epoch": 4186} {"train_loss": -7.063085556030273, "global_step": 175829, "epoch": 4186} {"train_loss": -7.055488109588623, "global_step": 175830, "epoch": 4186} {"train_loss": -7.156682014465332, "global_step": 175831, "epoch": 4186} {"train_loss": -7.10239839553833, "global_step": 175832, "epoch": 4186} {"train_loss": -7.107455253601074, "global_step": 175833, "epoch": 4186} {"train_loss": -7.171353816986084, "global_step": 175834, "epoch": 4186} {"train_loss": -7.003016948699951, "global_step": 175835, "epoch": 4186} {"train_loss": -7.184081077575684, "global_step": 175836, "epoch": 4186} {"train_loss": -7.179742813110352, "global_step": 175837, "epoch": 4186} {"train_loss": -7.0985002517700195, "global_step": 175838, "epoch": 4186} {"train_loss": -7.013347625732422, "global_step": 175839, "epoch": 4186} {"train_loss": -7.146827697753906, "global_step": 175840, "epoch": 4186} {"train_loss": -7.113151550292969, "global_step": 175841, "epoch": 4186} {"train_loss": -7.064774513244629, "global_step": 175842, "epoch": 4186} {"train_loss": -7.165896415710449, "global_step": 175843, "epoch": 4186} {"train_loss": -7.06568717956543, "global_step": 175844, "epoch": 4186} {"train_loss": -7.118752956390381, "global_step": 175845, "epoch": 4186} {"train_loss": -7.161749839782715, "global_step": 175846, "epoch": 4186} {"train_loss": -7.112770080566406, "global_step": 175847, "epoch": 4186} {"train_loss": -7.016366004943848, "global_step": 175848, "epoch": 4186} {"train_loss": -7.070265769958496, "global_step": 175849, "epoch": 4186} {"train_loss": -7.129044055938721, "global_step": 175850, "epoch": 4186} {"train_loss": -7.003511428833008, "global_step": 175851, "epoch": 4186} {"train_loss": -7.097805976867676, "global_step": 175852, "epoch": 4186} {"train_loss": -7.112170310247512, "global_step": 175853, "epoch": 4186, "val_loss": 80138.6953125} {"train_loss": -7.07509183883667, "global_step": 175854, "epoch": 4187} {"train_loss": -7.130302429199219, "global_step": 175855, "epoch": 4187} {"train_loss": -7.136425971984863, "global_step": 175856, "epoch": 4187} {"train_loss": -7.023044586181641, "global_step": 175857, "epoch": 4187} {"train_loss": -7.1608734130859375, "global_step": 175858, "epoch": 4187} {"train_loss": -7.1487860679626465, "global_step": 175859, "epoch": 4187} {"train_loss": -7.074256896972656, "global_step": 175860, "epoch": 4187} {"train_loss": -7.048513412475586, "global_step": 175861, "epoch": 4187} {"train_loss": -6.982634544372559, "global_step": 175862, "epoch": 4187} {"train_loss": -7.121698379516602, "global_step": 175863, "epoch": 4187} {"train_loss": -7.009354114532471, "global_step": 175864, "epoch": 4187} {"train_loss": -7.164874076843262, "global_step": 175865, "epoch": 4187} {"train_loss": -7.174272060394287, "global_step": 175866, "epoch": 4187} {"train_loss": -7.124723434448242, "global_step": 175867, "epoch": 4187} {"train_loss": -7.160195350646973, "global_step": 175868, "epoch": 4187} {"train_loss": -6.980595588684082, "global_step": 175869, "epoch": 4187} {"train_loss": -7.122684001922607, "global_step": 175870, "epoch": 4187} {"train_loss": -7.097525596618652, "global_step": 175871, "epoch": 4187} {"train_loss": -7.059121131896973, "global_step": 175872, "epoch": 4187} {"train_loss": -7.114683628082275, "global_step": 175873, "epoch": 4187} {"train_loss": -7.08064603805542, "global_step": 175874, "epoch": 4187} {"train_loss": -6.998873233795166, "global_step": 175875, "epoch": 4187} {"train_loss": -7.054078578948975, "global_step": 175876, "epoch": 4187} {"train_loss": -7.18182897567749, "global_step": 175877, "epoch": 4187} {"train_loss": -7.096108436584473, "global_step": 175878, "epoch": 4187} {"train_loss": -7.116486549377441, "global_step": 175879, "epoch": 4187} {"train_loss": -7.064156532287598, "global_step": 175880, "epoch": 4187} {"train_loss": -7.099667549133301, "global_step": 175881, "epoch": 4187} {"train_loss": -7.19258975982666, "global_step": 175882, "epoch": 4187} {"train_loss": -7.082093238830566, "global_step": 175883, "epoch": 4187} {"train_loss": -7.0984649658203125, "global_step": 175884, "epoch": 4187} {"train_loss": -7.063975811004639, "global_step": 175885, "epoch": 4187} {"train_loss": -7.038520812988281, "global_step": 175886, "epoch": 4187} {"train_loss": -7.115704536437988, "global_step": 175887, "epoch": 4187} {"train_loss": -7.098184585571289, "global_step": 175888, "epoch": 4187} {"train_loss": -7.07090425491333, "global_step": 175889, "epoch": 4187} {"train_loss": -7.083191871643066, "global_step": 175890, "epoch": 4187} {"train_loss": -7.134958267211914, "global_step": 175891, "epoch": 4187} {"train_loss": -7.046536922454834, "global_step": 175892, "epoch": 4187} {"train_loss": -7.042807579040527, "global_step": 175893, "epoch": 4187} {"train_loss": -7.163092613220215, "global_step": 175894, "epoch": 4187} {"train_loss": -7.091443765731085, "global_step": 175895, "epoch": 4187, "val_loss": 80097.4453125} {"train_loss": -6.939937591552734, "global_step": 175896, "epoch": 4188} {"train_loss": -7.135313987731934, "global_step": 175897, "epoch": 4188} {"train_loss": -7.185941696166992, "global_step": 175898, "epoch": 4188} {"train_loss": -7.09164571762085, "global_step": 175899, "epoch": 4188} {"train_loss": -7.122267723083496, "global_step": 175900, "epoch": 4188} {"train_loss": -7.06732177734375, "global_step": 175901, "epoch": 4188} {"train_loss": -7.086265563964844, "global_step": 175902, "epoch": 4188} {"train_loss": -7.14493465423584, "global_step": 175903, "epoch": 4188} {"train_loss": -7.087499618530273, "global_step": 175904, "epoch": 4188} {"train_loss": -7.145910263061523, "global_step": 175905, "epoch": 4188} {"train_loss": -7.190313339233398, "global_step": 175906, "epoch": 4188} {"train_loss": -7.011023998260498, "global_step": 175907, "epoch": 4188} {"train_loss": -7.089264869689941, "global_step": 175908, "epoch": 4188} {"train_loss": -7.1728434562683105, "global_step": 175909, "epoch": 4188} {"train_loss": -7.10014533996582, "global_step": 175910, "epoch": 4188} {"train_loss": -7.179325103759766, "global_step": 175911, "epoch": 4188} {"train_loss": -7.020616054534912, "global_step": 175912, "epoch": 4188} {"train_loss": -7.035707950592041, "global_step": 175913, "epoch": 4188} {"train_loss": -7.221891403198242, "global_step": 175914, "epoch": 4188} {"train_loss": -6.976283073425293, "global_step": 175915, "epoch": 4188} {"train_loss": -7.2184553146362305, "global_step": 175916, "epoch": 4188} {"train_loss": -6.9526214599609375, "global_step": 175917, "epoch": 4188} {"train_loss": -6.982760906219482, "global_step": 175918, "epoch": 4188} {"train_loss": -7.09877872467041, "global_step": 175919, "epoch": 4188} {"train_loss": -7.061633110046387, "global_step": 175920, "epoch": 4188} {"train_loss": -7.084549903869629, "global_step": 175921, "epoch": 4188} {"train_loss": -7.139857292175293, "global_step": 175922, "epoch": 4188} {"train_loss": -7.100979804992676, "global_step": 175923, "epoch": 4188} {"train_loss": -7.050029277801514, "global_step": 175924, "epoch": 4188} {"train_loss": -6.975177764892578, "global_step": 175925, "epoch": 4188} {"train_loss": -7.025653839111328, "global_step": 175926, "epoch": 4188} {"train_loss": -6.952489376068115, "global_step": 175927, "epoch": 4188} {"train_loss": -7.064251899719238, "global_step": 175928, "epoch": 4188} {"train_loss": -7.167614459991455, "global_step": 175929, "epoch": 4188} {"train_loss": -7.041867256164551, "global_step": 175930, "epoch": 4188} {"train_loss": -7.070734977722168, "global_step": 175931, "epoch": 4188} {"train_loss": -7.099381446838379, "global_step": 175932, "epoch": 4188} {"train_loss": -7.106006622314453, "global_step": 175933, "epoch": 4188} {"train_loss": -7.1002702713012695, "global_step": 175934, "epoch": 4188} {"train_loss": -6.9745588302612305, "global_step": 175935, "epoch": 4188} {"train_loss": -7.083049297332764, "global_step": 175936, "epoch": 4188} {"train_loss": -7.081799404961722, "global_step": 175937, "epoch": 4188, "val_loss": 80374.3125} {"train_loss": -7.043731212615967, "global_step": 175938, "epoch": 4189} {"train_loss": -7.214837074279785, "global_step": 175939, "epoch": 4189} {"train_loss": -7.102582931518555, "global_step": 175940, "epoch": 4189} {"train_loss": -7.136181831359863, "global_step": 175941, "epoch": 4189} {"train_loss": -7.151012420654297, "global_step": 175942, "epoch": 4189} {"train_loss": -7.116840839385986, "global_step": 175943, "epoch": 4189} {"train_loss": -7.077646255493164, "global_step": 175944, "epoch": 4189} {"train_loss": -7.087161064147949, "global_step": 175945, "epoch": 4189} {"train_loss": -7.057401657104492, "global_step": 175946, "epoch": 4189} {"train_loss": -7.180824279785156, "global_step": 175947, "epoch": 4189} {"train_loss": -7.106812953948975, "global_step": 175948, "epoch": 4189} {"train_loss": -7.08054256439209, "global_step": 175949, "epoch": 4189} {"train_loss": -7.110882759094238, "global_step": 175950, "epoch": 4189} {"train_loss": -6.968951225280762, "global_step": 175951, "epoch": 4189} {"train_loss": -6.937647819519043, "global_step": 175952, "epoch": 4189} {"train_loss": -7.118007659912109, "global_step": 175953, "epoch": 4189} {"train_loss": -7.149061679840088, "global_step": 175954, "epoch": 4189} {"train_loss": -6.947775840759277, "global_step": 175955, "epoch": 4189} {"train_loss": -7.116547584533691, "global_step": 175956, "epoch": 4189} {"train_loss": -7.004703998565674, "global_step": 175957, "epoch": 4189} {"train_loss": -7.051828384399414, "global_step": 175958, "epoch": 4189} {"train_loss": -7.226265907287598, "global_step": 175959, "epoch": 4189} {"train_loss": -6.977004051208496, "global_step": 175960, "epoch": 4189} {"train_loss": -7.216166973114014, "global_step": 175961, "epoch": 4189} {"train_loss": -7.093405246734619, "global_step": 175962, "epoch": 4189} {"train_loss": -6.967999458312988, "global_step": 175963, "epoch": 4189} {"train_loss": -7.034749984741211, "global_step": 175964, "epoch": 4189} {"train_loss": -7.109335422515869, "global_step": 175965, "epoch": 4189} {"train_loss": -7.064027309417725, "global_step": 175966, "epoch": 4189} {"train_loss": -7.020367622375488, "global_step": 175967, "epoch": 4189} {"train_loss": -7.041351318359375, "global_step": 175968, "epoch": 4189} {"train_loss": -7.056522846221924, "global_step": 175969, "epoch": 4189} {"train_loss": -7.034605503082275, "global_step": 175970, "epoch": 4189} {"train_loss": -7.107203483581543, "global_step": 175971, "epoch": 4189} {"train_loss": -7.175874710083008, "global_step": 175972, "epoch": 4189} {"train_loss": -6.948306560516357, "global_step": 175973, "epoch": 4189} {"train_loss": -7.061406135559082, "global_step": 175974, "epoch": 4189} {"train_loss": -7.08026123046875, "global_step": 175975, "epoch": 4189} {"train_loss": -7.0202717781066895, "global_step": 175976, "epoch": 4189} {"train_loss": -7.018992900848389, "global_step": 175977, "epoch": 4189} {"train_loss": -7.10251522064209, "global_step": 175978, "epoch": 4189} {"train_loss": -7.0780885219573975, "global_step": 175979, "epoch": 4189, "val_loss": 80386.2890625} {"train_loss": -7.260610580444336, "global_step": 175980, "epoch": 4190} {"train_loss": -7.250860214233398, "global_step": 175981, "epoch": 4190} {"train_loss": -7.149312973022461, "global_step": 175982, "epoch": 4190} {"train_loss": -7.100240707397461, "global_step": 175983, "epoch": 4190} {"train_loss": -7.163364410400391, "global_step": 175984, "epoch": 4190} {"train_loss": -7.0805158615112305, "global_step": 175985, "epoch": 4190} {"train_loss": -7.204356670379639, "global_step": 175986, "epoch": 4190} {"train_loss": -7.219108581542969, "global_step": 175987, "epoch": 4190} {"train_loss": -7.121671199798584, "global_step": 175988, "epoch": 4190} {"train_loss": -7.172239303588867, "global_step": 175989, "epoch": 4190} {"train_loss": -7.109525680541992, "global_step": 175990, "epoch": 4190} {"train_loss": -7.301867961883545, "global_step": 175991, "epoch": 4190} {"train_loss": -7.204622268676758, "global_step": 175992, "epoch": 4190} {"train_loss": -7.211668014526367, "global_step": 175993, "epoch": 4190} {"train_loss": -7.166848182678223, "global_step": 175994, "epoch": 4190} {"train_loss": -7.156927108764648, "global_step": 175995, "epoch": 4190} {"train_loss": -7.13551139831543, "global_step": 175996, "epoch": 4190} {"train_loss": -7.123133182525635, "global_step": 175997, "epoch": 4190} {"train_loss": -7.048948764801025, "global_step": 175998, "epoch": 4190} {"train_loss": -7.026200294494629, "global_step": 175999, "epoch": 4190} {"train_loss": -7.114701271057129, "global_step": 176000, "epoch": 4190} {"train_loss": -6.9236602783203125, "global_step": 176001, "epoch": 4190} {"train_loss": -6.778003692626953, "global_step": 176002, "epoch": 4190} {"train_loss": -6.9442853927612305, "global_step": 176003, "epoch": 4190} {"train_loss": -6.9208574295043945, "global_step": 176004, "epoch": 4190} {"train_loss": -6.855863571166992, "global_step": 176005, "epoch": 4190} {"train_loss": -7.019108295440674, "global_step": 176006, "epoch": 4190} {"train_loss": -7.024641036987305, "global_step": 176007, "epoch": 4190} {"train_loss": -7.060281753540039, "global_step": 176008, "epoch": 4190} {"train_loss": -6.9774394035339355, "global_step": 176009, "epoch": 4190} {"train_loss": -7.112619876861572, "global_step": 176010, "epoch": 4190} {"train_loss": -7.10187292098999, "global_step": 176011, "epoch": 4190} {"train_loss": -7.003266334533691, "global_step": 176012, "epoch": 4190} {"train_loss": -7.1016340255737305, "global_step": 176013, "epoch": 4190} {"train_loss": -6.906942844390869, "global_step": 176014, "epoch": 4190} {"train_loss": -7.052956581115723, "global_step": 176015, "epoch": 4190} {"train_loss": -7.002995014190674, "global_step": 176016, "epoch": 4190} {"train_loss": -7.117721080780029, "global_step": 176017, "epoch": 4190} {"train_loss": -6.993515968322754, "global_step": 176018, "epoch": 4190} {"train_loss": -7.050459861755371, "global_step": 176019, "epoch": 4190} {"train_loss": -7.034987449645996, "global_step": 176020, "epoch": 4190} {"train_loss": -7.08373296828497, "global_step": 176021, "epoch": 4190, "val_loss": 80181.265625} {"train_loss": -7.276015281677246, "global_step": 176022, "epoch": 4191} {"train_loss": -7.026121139526367, "global_step": 176023, "epoch": 4191} {"train_loss": -7.096285820007324, "global_step": 176024, "epoch": 4191} {"train_loss": -7.049984931945801, "global_step": 176025, "epoch": 4191} {"train_loss": -7.122551918029785, "global_step": 176026, "epoch": 4191} {"train_loss": -7.085884094238281, "global_step": 176027, "epoch": 4191} {"train_loss": -7.188141345977783, "global_step": 176028, "epoch": 4191} {"train_loss": -7.086294174194336, "global_step": 176029, "epoch": 4191} {"train_loss": -7.199798583984375, "global_step": 176030, "epoch": 4191} {"train_loss": -7.200394630432129, "global_step": 176031, "epoch": 4191} {"train_loss": -7.161140441894531, "global_step": 176032, "epoch": 4191} {"train_loss": -7.096310138702393, "global_step": 176033, "epoch": 4191} {"train_loss": -7.094754219055176, "global_step": 176034, "epoch": 4191} {"train_loss": -7.11005163192749, "global_step": 176035, "epoch": 4191} {"train_loss": -7.0815277099609375, "global_step": 176036, "epoch": 4191} {"train_loss": -7.162411212921143, "global_step": 176037, "epoch": 4191} {"train_loss": -7.199329853057861, "global_step": 176038, "epoch": 4191} {"train_loss": -7.140987873077393, "global_step": 176039, "epoch": 4191} {"train_loss": -7.05794620513916, "global_step": 176040, "epoch": 4191} {"train_loss": -7.238306999206543, "global_step": 176041, "epoch": 4191} {"train_loss": -7.037024974822998, "global_step": 176042, "epoch": 4191} {"train_loss": -7.09807014465332, "global_step": 176043, "epoch": 4191} {"train_loss": -7.14909553527832, "global_step": 176044, "epoch": 4191} {"train_loss": -7.0193915367126465, "global_step": 176045, "epoch": 4191} {"train_loss": -6.975277900695801, "global_step": 176046, "epoch": 4191} {"train_loss": -7.116453170776367, "global_step": 176047, "epoch": 4191} {"train_loss": -7.078008651733398, "global_step": 176048, "epoch": 4191} {"train_loss": -7.1598052978515625, "global_step": 176049, "epoch": 4191} {"train_loss": -7.095887660980225, "global_step": 176050, "epoch": 4191} {"train_loss": -7.100915431976318, "global_step": 176051, "epoch": 4191} {"train_loss": -7.093529224395752, "global_step": 176052, "epoch": 4191} {"train_loss": -6.984587669372559, "global_step": 176053, "epoch": 4191} {"train_loss": -7.107039451599121, "global_step": 176054, "epoch": 4191} {"train_loss": -6.936783790588379, "global_step": 176055, "epoch": 4191} {"train_loss": -7.0504279136657715, "global_step": 176056, "epoch": 4191} {"train_loss": -6.909043312072754, "global_step": 176057, "epoch": 4191} {"train_loss": -6.786876678466797, "global_step": 176058, "epoch": 4191} {"train_loss": -6.994786262512207, "global_step": 176059, "epoch": 4191} {"train_loss": -6.638337135314941, "global_step": 176060, "epoch": 4191} {"train_loss": -7.001649856567383, "global_step": 176061, "epoch": 4191} {"train_loss": -6.787029266357422, "global_step": 176062, "epoch": 4191} {"train_loss": -7.063463199706304, "global_step": 176063, "epoch": 4191, "val_loss": 80459.9453125} {"train_loss": -6.828197956085205, "global_step": 176064, "epoch": 4192} {"train_loss": -6.766746520996094, "global_step": 176065, "epoch": 4192} {"train_loss": -6.992107391357422, "global_step": 176066, "epoch": 4192} {"train_loss": -6.818033218383789, "global_step": 176067, "epoch": 4192} {"train_loss": -6.8826799392700195, "global_step": 176068, "epoch": 4192} {"train_loss": -6.725973606109619, "global_step": 176069, "epoch": 4192} {"train_loss": -7.046146869659424, "global_step": 176070, "epoch": 4192} {"train_loss": -6.878359317779541, "global_step": 176071, "epoch": 4192} {"train_loss": -6.9924821853637695, "global_step": 176072, "epoch": 4192} {"train_loss": -6.873080730438232, "global_step": 176073, "epoch": 4192} {"train_loss": -6.856760025024414, "global_step": 176074, "epoch": 4192} {"train_loss": -7.0020833015441895, "global_step": 176075, "epoch": 4192} {"train_loss": -6.983241081237793, "global_step": 176076, "epoch": 4192} {"train_loss": -6.975419044494629, "global_step": 176077, "epoch": 4192} {"train_loss": -6.998320579528809, "global_step": 176078, "epoch": 4192} {"train_loss": -6.989989280700684, "global_step": 176079, "epoch": 4192} {"train_loss": -7.066405296325684, "global_step": 176080, "epoch": 4192} {"train_loss": -7.018294334411621, "global_step": 176081, "epoch": 4192} {"train_loss": -7.182684421539307, "global_step": 176082, "epoch": 4192} {"train_loss": -7.094385147094727, "global_step": 176083, "epoch": 4192} {"train_loss": -7.151405334472656, "global_step": 176084, "epoch": 4192} {"train_loss": -6.965662956237793, "global_step": 176085, "epoch": 4192} {"train_loss": -7.070844650268555, "global_step": 176086, "epoch": 4192} {"train_loss": -7.111357688903809, "global_step": 176087, "epoch": 4192} {"train_loss": -7.132246017456055, "global_step": 176088, "epoch": 4192} {"train_loss": -7.0585150718688965, "global_step": 176089, "epoch": 4192} {"train_loss": -7.1550703048706055, "global_step": 176090, "epoch": 4192} {"train_loss": -7.078309059143066, "global_step": 176091, "epoch": 4192} {"train_loss": -6.944670677185059, "global_step": 176092, "epoch": 4192} {"train_loss": -7.115419387817383, "global_step": 176093, "epoch": 4192} {"train_loss": -7.1394243240356445, "global_step": 176094, "epoch": 4192} {"train_loss": -7.208486557006836, "global_step": 176095, "epoch": 4192} {"train_loss": -7.0850067138671875, "global_step": 176096, "epoch": 4192} {"train_loss": -7.201019287109375, "global_step": 176097, "epoch": 4192} {"train_loss": -7.129339694976807, "global_step": 176098, "epoch": 4192} {"train_loss": -7.178130149841309, "global_step": 176099, "epoch": 4192} {"train_loss": -7.179430961608887, "global_step": 176100, "epoch": 4192} {"train_loss": -7.040158748626709, "global_step": 176101, "epoch": 4192} {"train_loss": -7.110904216766357, "global_step": 176102, "epoch": 4192} {"train_loss": -7.110262870788574, "global_step": 176103, "epoch": 4192} {"train_loss": -7.013365268707275, "global_step": 176104, "epoch": 4192} {"train_loss": -7.030821402867635, "global_step": 176105, "epoch": 4192, "val_loss": 79997.7421875} {"train_loss": -7.073036193847656, "global_step": 176106, "epoch": 4193} {"train_loss": -7.0350518226623535, "global_step": 176107, "epoch": 4193} {"train_loss": -7.155106544494629, "global_step": 176108, "epoch": 4193} {"train_loss": -7.092672824859619, "global_step": 176109, "epoch": 4193} {"train_loss": -7.09880256652832, "global_step": 176110, "epoch": 4193} {"train_loss": -7.070718765258789, "global_step": 176111, "epoch": 4193} {"train_loss": -7.137016296386719, "global_step": 176112, "epoch": 4193} {"train_loss": -7.188971519470215, "global_step": 176113, "epoch": 4193} {"train_loss": -7.102412223815918, "global_step": 176114, "epoch": 4193} {"train_loss": -7.1519975662231445, "global_step": 176115, "epoch": 4193} {"train_loss": -7.118376731872559, "global_step": 176116, "epoch": 4193} {"train_loss": -7.133095741271973, "global_step": 176117, "epoch": 4193} {"train_loss": -7.06271505355835, "global_step": 176118, "epoch": 4193} {"train_loss": -7.133907318115234, "global_step": 176119, "epoch": 4193} {"train_loss": -7.160599231719971, "global_step": 176120, "epoch": 4193} {"train_loss": -7.063807010650635, "global_step": 176121, "epoch": 4193} {"train_loss": -7.172589302062988, "global_step": 176122, "epoch": 4193} {"train_loss": -7.19748067855835, "global_step": 176123, "epoch": 4193} {"train_loss": -7.107771873474121, "global_step": 176124, "epoch": 4193} {"train_loss": -7.23153018951416, "global_step": 176125, "epoch": 4193} {"train_loss": -7.19288444519043, "global_step": 176126, "epoch": 4193} {"train_loss": -6.997961521148682, "global_step": 176127, "epoch": 4193} {"train_loss": -7.255373001098633, "global_step": 176128, "epoch": 4193} {"train_loss": -7.191411018371582, "global_step": 176129, "epoch": 4193} {"train_loss": -7.209833145141602, "global_step": 176130, "epoch": 4193} {"train_loss": -7.220101356506348, "global_step": 176131, "epoch": 4193} {"train_loss": -7.104736804962158, "global_step": 176132, "epoch": 4193} {"train_loss": -7.204069137573242, "global_step": 176133, "epoch": 4193} {"train_loss": -7.027999401092529, "global_step": 176134, "epoch": 4193} {"train_loss": -7.173791885375977, "global_step": 176135, "epoch": 4193} {"train_loss": -7.084190368652344, "global_step": 176136, "epoch": 4193} {"train_loss": -7.16560697555542, "global_step": 176137, "epoch": 4193} {"train_loss": -7.13189697265625, "global_step": 176138, "epoch": 4193} {"train_loss": -7.0199151039123535, "global_step": 176139, "epoch": 4193} {"train_loss": -7.174467086791992, "global_step": 176140, "epoch": 4193} {"train_loss": -7.117657661437988, "global_step": 176141, "epoch": 4193} {"train_loss": -7.0068230628967285, "global_step": 176142, "epoch": 4193} {"train_loss": -7.084284782409668, "global_step": 176143, "epoch": 4193} {"train_loss": -7.011007785797119, "global_step": 176144, "epoch": 4193} {"train_loss": -7.1067962646484375, "global_step": 176145, "epoch": 4193} {"train_loss": -7.054051399230957, "global_step": 176146, "epoch": 4193} {"train_loss": -7.122891471499488, "global_step": 176147, "epoch": 4193, "val_loss": 80321.96875} {"train_loss": -7.049223899841309, "global_step": 176148, "epoch": 4194} {"train_loss": -7.009607791900635, "global_step": 176149, "epoch": 4194} {"train_loss": -7.0767741203308105, "global_step": 176150, "epoch": 4194} {"train_loss": -7.118546485900879, "global_step": 176151, "epoch": 4194} {"train_loss": -7.08723258972168, "global_step": 176152, "epoch": 4194} {"train_loss": -7.066768169403076, "global_step": 176153, "epoch": 4194} {"train_loss": -7.00745964050293, "global_step": 176154, "epoch": 4194} {"train_loss": -7.029005527496338, "global_step": 176155, "epoch": 4194} {"train_loss": -6.990514755249023, "global_step": 176156, "epoch": 4194} {"train_loss": -7.08086633682251, "global_step": 176157, "epoch": 4194} {"train_loss": -7.08512020111084, "global_step": 176158, "epoch": 4194} {"train_loss": -7.159265518188477, "global_step": 176159, "epoch": 4194} {"train_loss": -7.110177993774414, "global_step": 176160, "epoch": 4194} {"train_loss": -6.980708122253418, "global_step": 176161, "epoch": 4194} {"train_loss": -7.095881938934326, "global_step": 176162, "epoch": 4194} {"train_loss": -7.03339958190918, "global_step": 176163, "epoch": 4194} {"train_loss": -7.136402130126953, "global_step": 176164, "epoch": 4194} {"train_loss": -7.138249397277832, "global_step": 176165, "epoch": 4194} {"train_loss": -6.905725002288818, "global_step": 176166, "epoch": 4194} {"train_loss": -7.030242919921875, "global_step": 176167, "epoch": 4194} {"train_loss": -7.116659641265869, "global_step": 176168, "epoch": 4194} {"train_loss": -7.00389289855957, "global_step": 176169, "epoch": 4194} {"train_loss": -7.103763580322266, "global_step": 176170, "epoch": 4194} {"train_loss": -7.113865852355957, "global_step": 176171, "epoch": 4194} {"train_loss": -7.073430061340332, "global_step": 176172, "epoch": 4194} {"train_loss": -7.090822219848633, "global_step": 176173, "epoch": 4194} {"train_loss": -7.030241966247559, "global_step": 176174, "epoch": 4194} {"train_loss": -7.064146518707275, "global_step": 176175, "epoch": 4194} {"train_loss": -6.949143886566162, "global_step": 176176, "epoch": 4194} {"train_loss": -7.040724754333496, "global_step": 176177, "epoch": 4194} {"train_loss": -7.032622337341309, "global_step": 176178, "epoch": 4194} {"train_loss": -7.118371963500977, "global_step": 176179, "epoch": 4194} {"train_loss": -6.82426118850708, "global_step": 176180, "epoch": 4194} {"train_loss": -7.093279838562012, "global_step": 176181, "epoch": 4194} {"train_loss": -7.014868259429932, "global_step": 176182, "epoch": 4194} {"train_loss": -7.176240921020508, "global_step": 176183, "epoch": 4194} {"train_loss": -7.175820350646973, "global_step": 176184, "epoch": 4194} {"train_loss": -7.053956985473633, "global_step": 176185, "epoch": 4194} {"train_loss": -7.035093307495117, "global_step": 176186, "epoch": 4194} {"train_loss": -7.062017440795898, "global_step": 176187, "epoch": 4194} {"train_loss": -7.135909080505371, "global_step": 176188, "epoch": 4194} {"train_loss": -7.060282343909854, "global_step": 176189, "epoch": 4194, "val_loss": 80136.09375} {"train_loss": -7.092864990234375, "global_step": 176190, "epoch": 4195} {"train_loss": -7.07712984085083, "global_step": 176191, "epoch": 4195} {"train_loss": -7.152266502380371, "global_step": 176192, "epoch": 4195} {"train_loss": -6.951245307922363, "global_step": 176193, "epoch": 4195} {"train_loss": -6.96451997756958, "global_step": 176194, "epoch": 4195} {"train_loss": -7.065830230712891, "global_step": 176195, "epoch": 4195} {"train_loss": -6.982004165649414, "global_step": 176196, "epoch": 4195} {"train_loss": -7.097150802612305, "global_step": 176197, "epoch": 4195} {"train_loss": -7.01508092880249, "global_step": 176198, "epoch": 4195} {"train_loss": -7.029682159423828, "global_step": 176199, "epoch": 4195} {"train_loss": -7.036651611328125, "global_step": 176200, "epoch": 4195} {"train_loss": -6.97821044921875, "global_step": 176201, "epoch": 4195} {"train_loss": -6.9171319007873535, "global_step": 176202, "epoch": 4195} {"train_loss": -7.056031703948975, "global_step": 176203, "epoch": 4195} {"train_loss": -7.093991279602051, "global_step": 176204, "epoch": 4195} {"train_loss": -6.935791969299316, "global_step": 176205, "epoch": 4195} {"train_loss": -7.083295822143555, "global_step": 176206, "epoch": 4195} {"train_loss": -7.121064186096191, "global_step": 176207, "epoch": 4195} {"train_loss": -6.9660820960998535, "global_step": 176208, "epoch": 4195} {"train_loss": -7.012444972991943, "global_step": 176209, "epoch": 4195} {"train_loss": -6.993810653686523, "global_step": 176210, "epoch": 4195} {"train_loss": -7.238253593444824, "global_step": 176211, "epoch": 4195} {"train_loss": -7.031590461730957, "global_step": 176212, "epoch": 4195} {"train_loss": -7.134710311889648, "global_step": 176213, "epoch": 4195} {"train_loss": -7.169613361358643, "global_step": 176214, "epoch": 4195} {"train_loss": -6.949129104614258, "global_step": 176215, "epoch": 4195} {"train_loss": -7.106089115142822, "global_step": 176216, "epoch": 4195} {"train_loss": -7.135554313659668, "global_step": 176217, "epoch": 4195} {"train_loss": -7.110714435577393, "global_step": 176218, "epoch": 4195} {"train_loss": -7.029550075531006, "global_step": 176219, "epoch": 4195} {"train_loss": -7.056889533996582, "global_step": 176220, "epoch": 4195} {"train_loss": -7.169678688049316, "global_step": 176221, "epoch": 4195} {"train_loss": -7.062736988067627, "global_step": 176222, "epoch": 4195} {"train_loss": -7.017409324645996, "global_step": 176223, "epoch": 4195} {"train_loss": -7.086390495300293, "global_step": 176224, "epoch": 4195} {"train_loss": -7.0131120681762695, "global_step": 176225, "epoch": 4195} {"train_loss": -7.059606552124023, "global_step": 176226, "epoch": 4195} {"train_loss": -6.957810401916504, "global_step": 176227, "epoch": 4195} {"train_loss": -7.053670406341553, "global_step": 176228, "epoch": 4195} {"train_loss": -6.9735541343688965, "global_step": 176229, "epoch": 4195} {"train_loss": -7.094509601593018, "global_step": 176230, "epoch": 4195} {"train_loss": -7.049653859365554, "global_step": 176231, "epoch": 4195, "val_loss": 80355.609375} {"train_loss": -7.123745441436768, "global_step": 176232, "epoch": 4196} {"train_loss": -7.043087005615234, "global_step": 176233, "epoch": 4196} {"train_loss": -7.079750061035156, "global_step": 176234, "epoch": 4196} {"train_loss": -7.032655239105225, "global_step": 176235, "epoch": 4196} {"train_loss": -7.207880020141602, "global_step": 176236, "epoch": 4196} {"train_loss": -6.955619812011719, "global_step": 176237, "epoch": 4196} {"train_loss": -7.088646411895752, "global_step": 176238, "epoch": 4196} {"train_loss": -7.131495475769043, "global_step": 176239, "epoch": 4196} {"train_loss": -7.099725723266602, "global_step": 176240, "epoch": 4196} {"train_loss": -7.1183247566223145, "global_step": 176241, "epoch": 4196} {"train_loss": -7.049201965332031, "global_step": 176242, "epoch": 4196} {"train_loss": -7.097156524658203, "global_step": 176243, "epoch": 4196} {"train_loss": -7.059234619140625, "global_step": 176244, "epoch": 4196} {"train_loss": -7.179036617279053, "global_step": 176245, "epoch": 4196} {"train_loss": -7.068145751953125, "global_step": 176246, "epoch": 4196} {"train_loss": -7.060921669006348, "global_step": 176247, "epoch": 4196} {"train_loss": -6.885571479797363, "global_step": 176248, "epoch": 4196} {"train_loss": -7.093703746795654, "global_step": 176249, "epoch": 4196} {"train_loss": -7.032357215881348, "global_step": 176250, "epoch": 4196} {"train_loss": -6.959689140319824, "global_step": 176251, "epoch": 4196} {"train_loss": -7.04599666595459, "global_step": 176252, "epoch": 4196} {"train_loss": -7.159344673156738, "global_step": 176253, "epoch": 4196} {"train_loss": -7.007162570953369, "global_step": 176254, "epoch": 4196} {"train_loss": -7.163784980773926, "global_step": 176255, "epoch": 4196} {"train_loss": -7.176207542419434, "global_step": 176256, "epoch": 4196} {"train_loss": -7.152610778808594, "global_step": 176257, "epoch": 4196} {"train_loss": -7.162979602813721, "global_step": 176258, "epoch": 4196} {"train_loss": -7.166738033294678, "global_step": 176259, "epoch": 4196} {"train_loss": -7.089259147644043, "global_step": 176260, "epoch": 4196} {"train_loss": -7.187692642211914, "global_step": 176261, "epoch": 4196} {"train_loss": -7.001939296722412, "global_step": 176262, "epoch": 4196} {"train_loss": -7.198878765106201, "global_step": 176263, "epoch": 4196} {"train_loss": -7.164122104644775, "global_step": 176264, "epoch": 4196} {"train_loss": -7.116723537445068, "global_step": 176265, "epoch": 4196} {"train_loss": -7.14717960357666, "global_step": 176266, "epoch": 4196} {"train_loss": -7.221975326538086, "global_step": 176267, "epoch": 4196} {"train_loss": -7.074587821960449, "global_step": 176268, "epoch": 4196} {"train_loss": -6.993940353393555, "global_step": 176269, "epoch": 4196} {"train_loss": -7.083307266235352, "global_step": 176270, "epoch": 4196} {"train_loss": -7.120652198791504, "global_step": 176271, "epoch": 4196} {"train_loss": -7.086784839630127, "global_step": 176272, "epoch": 4196} {"train_loss": -7.095799616404942, "global_step": 176273, "epoch": 4196, "val_loss": 80236.4140625} {"train_loss": -7.108412742614746, "global_step": 176274, "epoch": 4197} {"train_loss": -7.080394744873047, "global_step": 176275, "epoch": 4197} {"train_loss": -7.19627571105957, "global_step": 176276, "epoch": 4197} {"train_loss": -7.078202247619629, "global_step": 176277, "epoch": 4197} {"train_loss": -7.049069404602051, "global_step": 176278, "epoch": 4197} {"train_loss": -7.150084018707275, "global_step": 176279, "epoch": 4197} {"train_loss": -7.1237077713012695, "global_step": 176280, "epoch": 4197} {"train_loss": -7.073091983795166, "global_step": 176281, "epoch": 4197} {"train_loss": -7.121532440185547, "global_step": 176282, "epoch": 4197} {"train_loss": -7.1419291496276855, "global_step": 176283, "epoch": 4197} {"train_loss": -7.132912635803223, "global_step": 176284, "epoch": 4197} {"train_loss": -7.241211414337158, "global_step": 176285, "epoch": 4197} {"train_loss": -7.094130516052246, "global_step": 176286, "epoch": 4197} {"train_loss": -7.097470283508301, "global_step": 176287, "epoch": 4197} {"train_loss": -7.193848609924316, "global_step": 176288, "epoch": 4197} {"train_loss": -7.071290016174316, "global_step": 176289, "epoch": 4197} {"train_loss": -7.10553503036499, "global_step": 176290, "epoch": 4197} {"train_loss": -7.044641494750977, "global_step": 176291, "epoch": 4197} {"train_loss": -7.253902435302734, "global_step": 176292, "epoch": 4197} {"train_loss": -7.1518449783325195, "global_step": 176293, "epoch": 4197} {"train_loss": -7.106388568878174, "global_step": 176294, "epoch": 4197} {"train_loss": -7.119670867919922, "global_step": 176295, "epoch": 4197} {"train_loss": -7.304938316345215, "global_step": 176296, "epoch": 4197} {"train_loss": -7.20253849029541, "global_step": 176297, "epoch": 4197} {"train_loss": -7.194140434265137, "global_step": 176298, "epoch": 4197} {"train_loss": -7.14188814163208, "global_step": 176299, "epoch": 4197} {"train_loss": -7.156996726989746, "global_step": 176300, "epoch": 4197} {"train_loss": -7.146754741668701, "global_step": 176301, "epoch": 4197} {"train_loss": -7.232993125915527, "global_step": 176302, "epoch": 4197} {"train_loss": -7.160120964050293, "global_step": 176303, "epoch": 4197} {"train_loss": -7.151289463043213, "global_step": 176304, "epoch": 4197} {"train_loss": -7.117922782897949, "global_step": 176305, "epoch": 4197} {"train_loss": -7.099067211151123, "global_step": 176306, "epoch": 4197} {"train_loss": -7.077383995056152, "global_step": 176307, "epoch": 4197} {"train_loss": -7.074958801269531, "global_step": 176308, "epoch": 4197} {"train_loss": -7.088865280151367, "global_step": 176309, "epoch": 4197} {"train_loss": -7.023516654968262, "global_step": 176310, "epoch": 4197} {"train_loss": -7.022904396057129, "global_step": 176311, "epoch": 4197} {"train_loss": -6.845379829406738, "global_step": 176312, "epoch": 4197} {"train_loss": -7.091559410095215, "global_step": 176313, "epoch": 4197} {"train_loss": -7.025887489318848, "global_step": 176314, "epoch": 4197} {"train_loss": -7.116679747899373, "global_step": 176315, "epoch": 4197, "val_loss": 80147.921875} {"train_loss": -7.063384532928467, "global_step": 176316, "epoch": 4198} {"train_loss": -7.111806869506836, "global_step": 176317, "epoch": 4198} {"train_loss": -7.11149787902832, "global_step": 176318, "epoch": 4198} {"train_loss": -7.1481781005859375, "global_step": 176319, "epoch": 4198} {"train_loss": -6.88022518157959, "global_step": 176320, "epoch": 4198} {"train_loss": -6.943346977233887, "global_step": 176321, "epoch": 4198} {"train_loss": -6.892035961151123, "global_step": 176322, "epoch": 4198} {"train_loss": -7.118764400482178, "global_step": 176323, "epoch": 4198} {"train_loss": -7.033297061920166, "global_step": 176324, "epoch": 4198} {"train_loss": -6.972151279449463, "global_step": 176325, "epoch": 4198} {"train_loss": -7.008563041687012, "global_step": 176326, "epoch": 4198} {"train_loss": -6.998435020446777, "global_step": 176327, "epoch": 4198} {"train_loss": -7.122835159301758, "global_step": 176328, "epoch": 4198} {"train_loss": -7.039298057556152, "global_step": 176329, "epoch": 4198} {"train_loss": -7.112515449523926, "global_step": 176330, "epoch": 4198} {"train_loss": -7.045559406280518, "global_step": 176331, "epoch": 4198} {"train_loss": -7.179815292358398, "global_step": 176332, "epoch": 4198} {"train_loss": -7.099983215332031, "global_step": 176333, "epoch": 4198} {"train_loss": -7.054275035858154, "global_step": 176334, "epoch": 4198} {"train_loss": -7.03513240814209, "global_step": 176335, "epoch": 4198} {"train_loss": -7.111179351806641, "global_step": 176336, "epoch": 4198} {"train_loss": -7.120530605316162, "global_step": 176337, "epoch": 4198} {"train_loss": -7.139834403991699, "global_step": 176338, "epoch": 4198} {"train_loss": -7.161752700805664, "global_step": 176339, "epoch": 4198} {"train_loss": -7.139377593994141, "global_step": 176340, "epoch": 4198} {"train_loss": -7.055062294006348, "global_step": 176341, "epoch": 4198} {"train_loss": -7.213967323303223, "global_step": 176342, "epoch": 4198} {"train_loss": -7.049072265625, "global_step": 176343, "epoch": 4198} {"train_loss": -7.021197319030762, "global_step": 176344, "epoch": 4198} {"train_loss": -7.157950401306152, "global_step": 176345, "epoch": 4198} {"train_loss": -7.111804485321045, "global_step": 176346, "epoch": 4198} {"train_loss": -7.071311950683594, "global_step": 176347, "epoch": 4198} {"train_loss": -7.210517406463623, "global_step": 176348, "epoch": 4198} {"train_loss": -7.0576677322387695, "global_step": 176349, "epoch": 4198} {"train_loss": -7.112192153930664, "global_step": 176350, "epoch": 4198} {"train_loss": -7.086020469665527, "global_step": 176351, "epoch": 4198} {"train_loss": -7.185881614685059, "global_step": 176352, "epoch": 4198} {"train_loss": -7.121237754821777, "global_step": 176353, "epoch": 4198} {"train_loss": -7.107547760009766, "global_step": 176354, "epoch": 4198} {"train_loss": -7.093700408935547, "global_step": 176355, "epoch": 4198} {"train_loss": -7.043267726898193, "global_step": 176356, "epoch": 4198} {"train_loss": -7.080594312577021, "global_step": 176357, "epoch": 4198, "val_loss": 80111.5625} {"train_loss": -7.013129234313965, "global_step": 176358, "epoch": 4199} {"train_loss": -7.028751373291016, "global_step": 176359, "epoch": 4199} {"train_loss": -7.1317338943481445, "global_step": 176360, "epoch": 4199} {"train_loss": -7.057769298553467, "global_step": 176361, "epoch": 4199} {"train_loss": -7.063604354858398, "global_step": 176362, "epoch": 4199} {"train_loss": -7.091485977172852, "global_step": 176363, "epoch": 4199} {"train_loss": -7.112082004547119, "global_step": 176364, "epoch": 4199} {"train_loss": -7.0449018478393555, "global_step": 176365, "epoch": 4199} {"train_loss": -7.112854957580566, "global_step": 176366, "epoch": 4199} {"train_loss": -7.045321941375732, "global_step": 176367, "epoch": 4199} {"train_loss": -7.07172966003418, "global_step": 176368, "epoch": 4199} {"train_loss": -7.033548355102539, "global_step": 176369, "epoch": 4199} {"train_loss": -7.010368347167969, "global_step": 176370, "epoch": 4199} {"train_loss": -7.064059257507324, "global_step": 176371, "epoch": 4199} {"train_loss": -6.950677394866943, "global_step": 176372, "epoch": 4199} {"train_loss": -6.883843421936035, "global_step": 176373, "epoch": 4199} {"train_loss": -7.179646015167236, "global_step": 176374, "epoch": 4199} {"train_loss": -7.012350082397461, "global_step": 176375, "epoch": 4199} {"train_loss": -7.012939453125, "global_step": 176376, "epoch": 4199} {"train_loss": -7.086709022521973, "global_step": 176377, "epoch": 4199} {"train_loss": -7.180541515350342, "global_step": 176378, "epoch": 4199} {"train_loss": -7.169952869415283, "global_step": 176379, "epoch": 4199} {"train_loss": -7.0489583015441895, "global_step": 176380, "epoch": 4199} {"train_loss": -7.0408935546875, "global_step": 176381, "epoch": 4199} {"train_loss": -7.0731000900268555, "global_step": 176382, "epoch": 4199} {"train_loss": -7.171457290649414, "global_step": 176383, "epoch": 4199} {"train_loss": -7.136292457580566, "global_step": 176384, "epoch": 4199} {"train_loss": -7.077685356140137, "global_step": 176385, "epoch": 4199} {"train_loss": -7.048124313354492, "global_step": 176386, "epoch": 4199} {"train_loss": -7.05512809753418, "global_step": 176387, "epoch": 4199} {"train_loss": -6.965034484863281, "global_step": 176388, "epoch": 4199} {"train_loss": -7.0642547607421875, "global_step": 176389, "epoch": 4199} {"train_loss": -7.091457843780518, "global_step": 176390, "epoch": 4199} {"train_loss": -7.121103286743164, "global_step": 176391, "epoch": 4199} {"train_loss": -7.128252029418945, "global_step": 176392, "epoch": 4199} {"train_loss": -7.223409652709961, "global_step": 176393, "epoch": 4199} {"train_loss": -7.096332550048828, "global_step": 176394, "epoch": 4199} {"train_loss": -7.221488952636719, "global_step": 176395, "epoch": 4199} {"train_loss": -7.225394248962402, "global_step": 176396, "epoch": 4199} {"train_loss": -7.223247528076172, "global_step": 176397, "epoch": 4199} {"train_loss": -7.2198896408081055, "global_step": 176398, "epoch": 4199} {"train_loss": -7.085653657004947, "global_step": 176399, "epoch": 4199, "val_loss": 80195.6953125} {"train_loss": -7.031706809997559, "global_step": 176400, "epoch": 4200} {"train_loss": -7.287285804748535, "global_step": 176401, "epoch": 4200} {"train_loss": -7.18583869934082, "global_step": 176402, "epoch": 4200} {"train_loss": -7.091864585876465, "global_step": 176403, "epoch": 4200} {"train_loss": -7.231626510620117, "global_step": 176404, "epoch": 4200} {"train_loss": -7.054737567901611, "global_step": 176405, "epoch": 4200} {"train_loss": -7.092532634735107, "global_step": 176406, "epoch": 4200} {"train_loss": -7.171268939971924, "global_step": 176407, "epoch": 4200} {"train_loss": -7.2607622146606445, "global_step": 176408, "epoch": 4200} {"train_loss": -7.153838634490967, "global_step": 176409, "epoch": 4200} {"train_loss": -6.984750747680664, "global_step": 176410, "epoch": 4200} {"train_loss": -7.18051815032959, "global_step": 176411, "epoch": 4200} {"train_loss": -7.0219550132751465, "global_step": 176412, "epoch": 4200} {"train_loss": -7.144523620605469, "global_step": 176413, "epoch": 4200} {"train_loss": -7.258131980895996, "global_step": 176414, "epoch": 4200} {"train_loss": -7.14015531539917, "global_step": 176415, "epoch": 4200} {"train_loss": -7.1396484375, "global_step": 176416, "epoch": 4200} {"train_loss": -7.065585613250732, "global_step": 176417, "epoch": 4200} {"train_loss": -7.082853317260742, "global_step": 176418, "epoch": 4200} {"train_loss": -7.180621147155762, "global_step": 176419, "epoch": 4200} {"train_loss": -7.1325154304504395, "global_step": 176420, "epoch": 4200} {"train_loss": -7.088502883911133, "global_step": 176421, "epoch": 4200} {"train_loss": -7.172691345214844, "global_step": 176422, "epoch": 4200} {"train_loss": -7.042488098144531, "global_step": 176423, "epoch": 4200} {"train_loss": -7.077434539794922, "global_step": 176424, "epoch": 4200} {"train_loss": -7.134049892425537, "global_step": 176425, "epoch": 4200} {"train_loss": -7.152047157287598, "global_step": 176426, "epoch": 4200} {"train_loss": -7.16310977935791, "global_step": 176427, "epoch": 4200} {"train_loss": -7.068700790405273, "global_step": 176428, "epoch": 4200} {"train_loss": -7.049151420593262, "global_step": 176429, "epoch": 4200} {"train_loss": -7.207245826721191, "global_step": 176430, "epoch": 4200} {"train_loss": -7.152716159820557, "global_step": 176431, "epoch": 4200} {"train_loss": -7.102963447570801, "global_step": 176432, "epoch": 4200} {"train_loss": -7.134937763214111, "global_step": 176433, "epoch": 4200} {"train_loss": -7.116002082824707, "global_step": 176434, "epoch": 4200} {"train_loss": -7.2177414894104, "global_step": 176435, "epoch": 4200} {"train_loss": -6.985124111175537, "global_step": 176436, "epoch": 4200} {"train_loss": -7.127364158630371, "global_step": 176437, "epoch": 4200} {"train_loss": -7.123823165893555, "global_step": 176438, "epoch": 4200} {"train_loss": -7.11417818069458, "global_step": 176439, "epoch": 4200} {"train_loss": -6.953232288360596, "global_step": 176440, "epoch": 4200} {"train_loss": -7.123352822803316, "global_step": 176441, "epoch": 4200, "train/sim_max_reward_0": 0.9825650406068737, "train/sim_max_reward_1": 0.9282429624311228, "train/sim_max_reward_2": 0.8726718412186936, "train/sim_max_reward_3": 0.15204896644734528, "train/sim_max_reward_4": 0.47189244941488534, "train/sim_max_reward_5": 0.9170821473303075, "test/sim_max_reward_4500000": 0.5790008766145631, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.794648986059077, "test/sim_max_reward_4500004": 0.18568972104366013, "test/sim_max_reward_4500005": 0.9461577125830842, "test/sim_max_reward_4500006": 0.9102929013310468, "test/sim_max_reward_4500007": 0.9262483366184957, "test/sim_max_reward_4500008": 0.9678733147990999, "test/sim_max_reward_4500009": 0.05310937225605138, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 1.0, "test/sim_max_reward_4500012": 0.8427414674246145, "test/sim_max_reward_4500013": 0.006733193489289844, "test/sim_max_reward_4500014": 0.9765616160999264, "test/sim_max_reward_4500015": 0.8736902918244143, "test/sim_max_reward_4500016": 0.025897655305570127, "test/sim_max_reward_4500017": 0.08374188409047428, "test/sim_max_reward_4500018": 0.4011039256229228, "test/sim_max_reward_4500019": 0.9851624664867408, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9585159368311598, "test/sim_max_reward_4500022": 0.9594905483233171, "test/sim_max_reward_4500023": 0.9955230827198983, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.34183262194807934, "test/sim_max_reward_4500026": 0.976589052454253, "test/sim_max_reward_4500027": 0.9972284500545754, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.09995144765616996, "test/sim_max_reward_4500030": 0.8975250304533354, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.6601029455664336, "test/sim_max_reward_4500034": 0.9144232511625653, "test/sim_max_reward_4500035": 0.9779456063735699, "test/sim_max_reward_4500036": 0.7983586165484052, "test/sim_max_reward_4500037": 1.0, "test/sim_max_reward_4500038": 0.3254289839707665, "test/sim_max_reward_4500039": 0.0, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.8652442216238768, "test/sim_max_reward_4500042": 0.04451483534087922, "test/sim_max_reward_4500043": 0.5503076701175046, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9467415240037498, "test/sim_max_reward_4500046": 0.20504360262645416, "test/sim_max_reward_4500047": 0.9782933903687302, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 1.0, "train/mean_score": 0.7207505679082047, "test/mean_score": 0.5857280298063516, "val_loss": 80302.8359375} {"train_loss": -6.910864353179932, "global_step": 176442, "epoch": 4201} {"train_loss": -7.11719274520874, "global_step": 176443, "epoch": 4201} {"train_loss": -7.024009704589844, "global_step": 176444, "epoch": 4201} {"train_loss": -7.0911865234375, "global_step": 176445, "epoch": 4201} {"train_loss": -7.047674655914307, "global_step": 176446, "epoch": 4201} {"train_loss": -7.12138557434082, "global_step": 176447, "epoch": 4201} {"train_loss": -7.075273036956787, "global_step": 176448, "epoch": 4201} {"train_loss": -7.135441780090332, "global_step": 176449, "epoch": 4201} {"train_loss": -7.1246209144592285, "global_step": 176450, "epoch": 4201} {"train_loss": -7.1500701904296875, "global_step": 176451, "epoch": 4201} {"train_loss": -7.133659362792969, "global_step": 176452, "epoch": 4201} {"train_loss": -7.095373153686523, "global_step": 176453, "epoch": 4201} {"train_loss": -7.138759136199951, "global_step": 176454, "epoch": 4201} {"train_loss": -7.151176452636719, "global_step": 176455, "epoch": 4201} {"train_loss": -7.089723587036133, "global_step": 176456, "epoch": 4201} {"train_loss": -7.0731377601623535, "global_step": 176457, "epoch": 4201} {"train_loss": -7.184691429138184, "global_step": 176458, "epoch": 4201} {"train_loss": -7.088671684265137, "global_step": 176459, "epoch": 4201} {"train_loss": -7.153196334838867, "global_step": 176460, "epoch": 4201} {"train_loss": -7.123022556304932, "global_step": 176461, "epoch": 4201} {"train_loss": -7.093546390533447, "global_step": 176462, "epoch": 4201} {"train_loss": -7.039163112640381, "global_step": 176463, "epoch": 4201} {"train_loss": -7.147026062011719, "global_step": 176464, "epoch": 4201} {"train_loss": -7.059345722198486, "global_step": 176465, "epoch": 4201} {"train_loss": -7.053217887878418, "global_step": 176466, "epoch": 4201} {"train_loss": -7.095292091369629, "global_step": 176467, "epoch": 4201} {"train_loss": -7.012115478515625, "global_step": 176468, "epoch": 4201} {"train_loss": -7.251016616821289, "global_step": 176469, "epoch": 4201} {"train_loss": -7.01288366317749, "global_step": 176470, "epoch": 4201} {"train_loss": -7.017119407653809, "global_step": 176471, "epoch": 4201} {"train_loss": -7.009660243988037, "global_step": 176472, "epoch": 4201} {"train_loss": -6.980515003204346, "global_step": 176473, "epoch": 4201} {"train_loss": -7.107526779174805, "global_step": 176474, "epoch": 4201} {"train_loss": -7.006073951721191, "global_step": 176475, "epoch": 4201} {"train_loss": -7.117495536804199, "global_step": 176476, "epoch": 4201} {"train_loss": -7.164073944091797, "global_step": 176477, "epoch": 4201} {"train_loss": -7.0755486488342285, "global_step": 176478, "epoch": 4201} {"train_loss": -7.230751991271973, "global_step": 176479, "epoch": 4201} {"train_loss": -7.1461501121521, "global_step": 176480, "epoch": 4201} {"train_loss": -7.138888835906982, "global_step": 176481, "epoch": 4201} {"train_loss": -7.106647491455078, "global_step": 176482, "epoch": 4201} {"train_loss": -7.09398873647054, "global_step": 176483, "epoch": 4201, "val_loss": 80262.0390625} {"train_loss": -7.148276329040527, "global_step": 176484, "epoch": 4202} {"train_loss": -7.138591766357422, "global_step": 176485, "epoch": 4202} {"train_loss": -7.220911979675293, "global_step": 176486, "epoch": 4202} {"train_loss": -7.13948917388916, "global_step": 176487, "epoch": 4202} {"train_loss": -7.086188316345215, "global_step": 176488, "epoch": 4202} {"train_loss": -7.202306270599365, "global_step": 176489, "epoch": 4202} {"train_loss": -7.011899948120117, "global_step": 176490, "epoch": 4202} {"train_loss": -7.040656089782715, "global_step": 176491, "epoch": 4202} {"train_loss": -7.01493501663208, "global_step": 176492, "epoch": 4202} {"train_loss": -7.10521125793457, "global_step": 176493, "epoch": 4202} {"train_loss": -7.104465961456299, "global_step": 176494, "epoch": 4202} {"train_loss": -7.15822172164917, "global_step": 176495, "epoch": 4202} {"train_loss": -6.981759071350098, "global_step": 176496, "epoch": 4202} {"train_loss": -7.0371246337890625, "global_step": 176497, "epoch": 4202} {"train_loss": -7.099135398864746, "global_step": 176498, "epoch": 4202} {"train_loss": -7.122048377990723, "global_step": 176499, "epoch": 4202} {"train_loss": -7.14359188079834, "global_step": 176500, "epoch": 4202} {"train_loss": -7.07186222076416, "global_step": 176501, "epoch": 4202} {"train_loss": -7.055572509765625, "global_step": 176502, "epoch": 4202} {"train_loss": -7.123722076416016, "global_step": 176503, "epoch": 4202} {"train_loss": -7.065078258514404, "global_step": 176504, "epoch": 4202} {"train_loss": -6.947089195251465, "global_step": 176505, "epoch": 4202} {"train_loss": -7.058414936065674, "global_step": 176506, "epoch": 4202} {"train_loss": -7.148961067199707, "global_step": 176507, "epoch": 4202} {"train_loss": -7.091131210327148, "global_step": 176508, "epoch": 4202} {"train_loss": -7.013335704803467, "global_step": 176509, "epoch": 4202} {"train_loss": -7.057321071624756, "global_step": 176510, "epoch": 4202} {"train_loss": -7.03176212310791, "global_step": 176511, "epoch": 4202} {"train_loss": -7.026237487792969, "global_step": 176512, "epoch": 4202} {"train_loss": -7.070240020751953, "global_step": 176513, "epoch": 4202} {"train_loss": -7.125248432159424, "global_step": 176514, "epoch": 4202} {"train_loss": -7.126142501831055, "global_step": 176515, "epoch": 4202} {"train_loss": -7.070873737335205, "global_step": 176516, "epoch": 4202} {"train_loss": -7.057149887084961, "global_step": 176517, "epoch": 4202} {"train_loss": -7.050382137298584, "global_step": 176518, "epoch": 4202} {"train_loss": -7.065212249755859, "global_step": 176519, "epoch": 4202} {"train_loss": -7.137499809265137, "global_step": 176520, "epoch": 4202} {"train_loss": -7.087443828582764, "global_step": 176521, "epoch": 4202} {"train_loss": -7.060868263244629, "global_step": 176522, "epoch": 4202} {"train_loss": -7.124260425567627, "global_step": 176523, "epoch": 4202} {"train_loss": -7.040057182312012, "global_step": 176524, "epoch": 4202} {"train_loss": -7.084497065771194, "global_step": 176525, "epoch": 4202, "val_loss": 80285.921875} {"train_loss": -7.081390380859375, "global_step": 176526, "epoch": 4203} {"train_loss": -7.071142673492432, "global_step": 176527, "epoch": 4203} {"train_loss": -7.166749954223633, "global_step": 176528, "epoch": 4203} {"train_loss": -7.0331315994262695, "global_step": 176529, "epoch": 4203} {"train_loss": -7.090394973754883, "global_step": 176530, "epoch": 4203} {"train_loss": -7.241117477416992, "global_step": 176531, "epoch": 4203} {"train_loss": -7.118993282318115, "global_step": 176532, "epoch": 4203} {"train_loss": -7.118633270263672, "global_step": 176533, "epoch": 4203} {"train_loss": -7.030974388122559, "global_step": 176534, "epoch": 4203} {"train_loss": -7.228212356567383, "global_step": 176535, "epoch": 4203} {"train_loss": -7.238480567932129, "global_step": 176536, "epoch": 4203} {"train_loss": -7.034002304077148, "global_step": 176537, "epoch": 4203} {"train_loss": -7.1219964027404785, "global_step": 176538, "epoch": 4203} {"train_loss": -7.216732025146484, "global_step": 176539, "epoch": 4203} {"train_loss": -7.046363830566406, "global_step": 176540, "epoch": 4203} {"train_loss": -7.0548787117004395, "global_step": 176541, "epoch": 4203} {"train_loss": -7.133239269256592, "global_step": 176542, "epoch": 4203} {"train_loss": -7.14865779876709, "global_step": 176543, "epoch": 4203} {"train_loss": -7.042369842529297, "global_step": 176544, "epoch": 4203} {"train_loss": -7.168720245361328, "global_step": 176545, "epoch": 4203} {"train_loss": -7.077008247375488, "global_step": 176546, "epoch": 4203} {"train_loss": -7.117033004760742, "global_step": 176547, "epoch": 4203} {"train_loss": -6.985302448272705, "global_step": 176548, "epoch": 4203} {"train_loss": -7.019858360290527, "global_step": 176549, "epoch": 4203} {"train_loss": -7.184391975402832, "global_step": 176550, "epoch": 4203} {"train_loss": -6.968168258666992, "global_step": 176551, "epoch": 4203} {"train_loss": -7.053862571716309, "global_step": 176552, "epoch": 4203} {"train_loss": -7.117652416229248, "global_step": 176553, "epoch": 4203} {"train_loss": -6.9739861488342285, "global_step": 176554, "epoch": 4203} {"train_loss": -6.942391395568848, "global_step": 176555, "epoch": 4203} {"train_loss": -7.1153950691223145, "global_step": 176556, "epoch": 4203} {"train_loss": -7.07429313659668, "global_step": 176557, "epoch": 4203} {"train_loss": -6.92992639541626, "global_step": 176558, "epoch": 4203} {"train_loss": -7.082057476043701, "global_step": 176559, "epoch": 4203} {"train_loss": -6.93532657623291, "global_step": 176560, "epoch": 4203} {"train_loss": -7.120833396911621, "global_step": 176561, "epoch": 4203} {"train_loss": -7.202470302581787, "global_step": 176562, "epoch": 4203} {"train_loss": -7.1783881187438965, "global_step": 176563, "epoch": 4203} {"train_loss": -7.129556179046631, "global_step": 176564, "epoch": 4203} {"train_loss": -7.050520896911621, "global_step": 176565, "epoch": 4203} {"train_loss": -7.090630054473877, "global_step": 176566, "epoch": 4203} {"train_loss": -7.090019294193813, "global_step": 176567, "epoch": 4203, "val_loss": 80126.03125} {"train_loss": -7.015215873718262, "global_step": 176568, "epoch": 4204} {"train_loss": -7.142850875854492, "global_step": 176569, "epoch": 4204} {"train_loss": -7.146617889404297, "global_step": 176570, "epoch": 4204} {"train_loss": -7.134859561920166, "global_step": 176571, "epoch": 4204} {"train_loss": -7.137714385986328, "global_step": 176572, "epoch": 4204} {"train_loss": -7.092935562133789, "global_step": 176573, "epoch": 4204} {"train_loss": -7.159003257751465, "global_step": 176574, "epoch": 4204} {"train_loss": -7.06839656829834, "global_step": 176575, "epoch": 4204} {"train_loss": -7.1659698486328125, "global_step": 176576, "epoch": 4204} {"train_loss": -7.180548667907715, "global_step": 176577, "epoch": 4204} {"train_loss": -7.209172248840332, "global_step": 176578, "epoch": 4204} {"train_loss": -7.098883628845215, "global_step": 176579, "epoch": 4204} {"train_loss": -7.1438117027282715, "global_step": 176580, "epoch": 4204} {"train_loss": -7.138040542602539, "global_step": 176581, "epoch": 4204} {"train_loss": -7.100103378295898, "global_step": 176582, "epoch": 4204} {"train_loss": -7.200822830200195, "global_step": 176583, "epoch": 4204} {"train_loss": -7.057532787322998, "global_step": 176584, "epoch": 4204} {"train_loss": -6.897849082946777, "global_step": 176585, "epoch": 4204} {"train_loss": -7.176847457885742, "global_step": 176586, "epoch": 4204} {"train_loss": -6.929841995239258, "global_step": 176587, "epoch": 4204} {"train_loss": -6.9805521965026855, "global_step": 176588, "epoch": 4204} {"train_loss": -7.046600341796875, "global_step": 176589, "epoch": 4204} {"train_loss": -6.987421035766602, "global_step": 176590, "epoch": 4204} {"train_loss": -7.051024436950684, "global_step": 176591, "epoch": 4204} {"train_loss": -7.063610076904297, "global_step": 176592, "epoch": 4204} {"train_loss": -7.07373046875, "global_step": 176593, "epoch": 4204} {"train_loss": -7.121637344360352, "global_step": 176594, "epoch": 4204} {"train_loss": -7.14828634262085, "global_step": 176595, "epoch": 4204} {"train_loss": -7.079296112060547, "global_step": 176596, "epoch": 4204} {"train_loss": -7.18059778213501, "global_step": 176597, "epoch": 4204} {"train_loss": -7.052884578704834, "global_step": 176598, "epoch": 4204} {"train_loss": -7.079986095428467, "global_step": 176599, "epoch": 4204} {"train_loss": -7.006911277770996, "global_step": 176600, "epoch": 4204} {"train_loss": -7.149208068847656, "global_step": 176601, "epoch": 4204} {"train_loss": -7.113926887512207, "global_step": 176602, "epoch": 4204} {"train_loss": -6.976025581359863, "global_step": 176603, "epoch": 4204} {"train_loss": -7.013861656188965, "global_step": 176604, "epoch": 4204} {"train_loss": -6.955510139465332, "global_step": 176605, "epoch": 4204} {"train_loss": -7.024252891540527, "global_step": 176606, "epoch": 4204} {"train_loss": -7.129181861877441, "global_step": 176607, "epoch": 4204} {"train_loss": -7.067099571228027, "global_step": 176608, "epoch": 4204} {"train_loss": -7.082979020618257, "global_step": 176609, "epoch": 4204, "val_loss": 80203.640625} {"train_loss": -6.937285423278809, "global_step": 176610, "epoch": 4205} {"train_loss": -7.139212608337402, "global_step": 176611, "epoch": 4205} {"train_loss": -6.870866775512695, "global_step": 176612, "epoch": 4205} {"train_loss": -7.012474536895752, "global_step": 176613, "epoch": 4205} {"train_loss": -7.143739223480225, "global_step": 176614, "epoch": 4205} {"train_loss": -6.797000885009766, "global_step": 176615, "epoch": 4205} {"train_loss": -6.995705604553223, "global_step": 176616, "epoch": 4205} {"train_loss": -7.128811836242676, "global_step": 176617, "epoch": 4205} {"train_loss": -7.089024543762207, "global_step": 176618, "epoch": 4205} {"train_loss": -7.065390586853027, "global_step": 176619, "epoch": 4205} {"train_loss": -6.991654396057129, "global_step": 176620, "epoch": 4205} {"train_loss": -7.118894577026367, "global_step": 176621, "epoch": 4205} {"train_loss": -7.020577907562256, "global_step": 176622, "epoch": 4205} {"train_loss": -6.959902763366699, "global_step": 176623, "epoch": 4205} {"train_loss": -7.148259162902832, "global_step": 176624, "epoch": 4205} {"train_loss": -7.015537738800049, "global_step": 176625, "epoch": 4205} {"train_loss": -7.026177883148193, "global_step": 176626, "epoch": 4205} {"train_loss": -7.07819128036499, "global_step": 176627, "epoch": 4205} {"train_loss": -7.00982666015625, "global_step": 176628, "epoch": 4205} {"train_loss": -7.108003616333008, "global_step": 176629, "epoch": 4205} {"train_loss": -7.104787826538086, "global_step": 176630, "epoch": 4205} {"train_loss": -7.168431282043457, "global_step": 176631, "epoch": 4205} {"train_loss": -6.984708309173584, "global_step": 176632, "epoch": 4205} {"train_loss": -7.057268142700195, "global_step": 176633, "epoch": 4205} {"train_loss": -7.038187503814697, "global_step": 176634, "epoch": 4205} {"train_loss": -7.095237731933594, "global_step": 176635, "epoch": 4205} {"train_loss": -7.225527763366699, "global_step": 176636, "epoch": 4205} {"train_loss": -7.058528900146484, "global_step": 176637, "epoch": 4205} {"train_loss": -7.155920028686523, "global_step": 176638, "epoch": 4205} {"train_loss": -7.099664688110352, "global_step": 176639, "epoch": 4205} {"train_loss": -7.208915710449219, "global_step": 176640, "epoch": 4205} {"train_loss": -7.1353759765625, "global_step": 176641, "epoch": 4205} {"train_loss": -7.063778877258301, "global_step": 176642, "epoch": 4205} {"train_loss": -7.108087539672852, "global_step": 176643, "epoch": 4205} {"train_loss": -7.11700439453125, "global_step": 176644, "epoch": 4205} {"train_loss": -7.153102874755859, "global_step": 176645, "epoch": 4205} {"train_loss": -7.184291362762451, "global_step": 176646, "epoch": 4205} {"train_loss": -7.0894622802734375, "global_step": 176647, "epoch": 4205} {"train_loss": -7.154958724975586, "global_step": 176648, "epoch": 4205} {"train_loss": -7.260062217712402, "global_step": 176649, "epoch": 4205} {"train_loss": -7.197829723358154, "global_step": 176650, "epoch": 4205} {"train_loss": -7.083980776014782, "global_step": 176651, "epoch": 4205, "val_loss": 80000.765625} {"train_loss": -7.175714492797852, "global_step": 176652, "epoch": 4206} {"train_loss": -7.188704967498779, "global_step": 176653, "epoch": 4206} {"train_loss": -7.095038890838623, "global_step": 176654, "epoch": 4206} {"train_loss": -7.15079402923584, "global_step": 176655, "epoch": 4206} {"train_loss": -7.098435401916504, "global_step": 176656, "epoch": 4206} {"train_loss": -7.065362930297852, "global_step": 176657, "epoch": 4206} {"train_loss": -7.206318378448486, "global_step": 176658, "epoch": 4206} {"train_loss": -7.182436943054199, "global_step": 176659, "epoch": 4206} {"train_loss": -7.114114761352539, "global_step": 176660, "epoch": 4206} {"train_loss": -7.225996494293213, "global_step": 176661, "epoch": 4206} {"train_loss": -7.094362258911133, "global_step": 176662, "epoch": 4206} {"train_loss": -7.093647480010986, "global_step": 176663, "epoch": 4206} {"train_loss": -7.100460052490234, "global_step": 176664, "epoch": 4206} {"train_loss": -7.2772088050842285, "global_step": 176665, "epoch": 4206} {"train_loss": -7.117544174194336, "global_step": 176666, "epoch": 4206} {"train_loss": -7.1597394943237305, "global_step": 176667, "epoch": 4206} {"train_loss": -7.071017265319824, "global_step": 176668, "epoch": 4206} {"train_loss": -7.098930358886719, "global_step": 176669, "epoch": 4206} {"train_loss": -7.145139217376709, "global_step": 176670, "epoch": 4206} {"train_loss": -7.031214237213135, "global_step": 176671, "epoch": 4206} {"train_loss": -7.050661087036133, "global_step": 176672, "epoch": 4206} {"train_loss": -7.10411262512207, "global_step": 176673, "epoch": 4206} {"train_loss": -7.124733924865723, "global_step": 176674, "epoch": 4206} {"train_loss": -6.967104911804199, "global_step": 176675, "epoch": 4206} {"train_loss": -6.9281325340271, "global_step": 176676, "epoch": 4206} {"train_loss": -7.166780471801758, "global_step": 176677, "epoch": 4206} {"train_loss": -6.968010902404785, "global_step": 176678, "epoch": 4206} {"train_loss": -7.165704727172852, "global_step": 176679, "epoch": 4206} {"train_loss": -7.009238243103027, "global_step": 176680, "epoch": 4206} {"train_loss": -7.0163702964782715, "global_step": 176681, "epoch": 4206} {"train_loss": -7.089249134063721, "global_step": 176682, "epoch": 4206} {"train_loss": -7.039230823516846, "global_step": 176683, "epoch": 4206} {"train_loss": -6.976480007171631, "global_step": 176684, "epoch": 4206} {"train_loss": -7.015138149261475, "global_step": 176685, "epoch": 4206} {"train_loss": -7.0755615234375, "global_step": 176686, "epoch": 4206} {"train_loss": -7.083308219909668, "global_step": 176687, "epoch": 4206} {"train_loss": -6.976466178894043, "global_step": 176688, "epoch": 4206} {"train_loss": -7.06459903717041, "global_step": 176689, "epoch": 4206} {"train_loss": -7.111684799194336, "global_step": 176690, "epoch": 4206} {"train_loss": -7.03957986831665, "global_step": 176691, "epoch": 4206} {"train_loss": -6.992062568664551, "global_step": 176692, "epoch": 4206} {"train_loss": -7.088387171427409, "global_step": 176693, "epoch": 4206, "val_loss": 80137.6796875} {"train_loss": -7.1654558181762695, "global_step": 176694, "epoch": 4207} {"train_loss": -6.983729839324951, "global_step": 176695, "epoch": 4207} {"train_loss": -7.188302040100098, "global_step": 176696, "epoch": 4207} {"train_loss": -6.984158515930176, "global_step": 176697, "epoch": 4207} {"train_loss": -7.17972469329834, "global_step": 176698, "epoch": 4207} {"train_loss": -7.106112957000732, "global_step": 176699, "epoch": 4207} {"train_loss": -7.109485149383545, "global_step": 176700, "epoch": 4207} {"train_loss": -7.204854965209961, "global_step": 176701, "epoch": 4207} {"train_loss": -7.027063369750977, "global_step": 176702, "epoch": 4207} {"train_loss": -7.105266571044922, "global_step": 176703, "epoch": 4207} {"train_loss": -7.1204118728637695, "global_step": 176704, "epoch": 4207} {"train_loss": -7.008833408355713, "global_step": 176705, "epoch": 4207} {"train_loss": -7.18458890914917, "global_step": 176706, "epoch": 4207} {"train_loss": -7.1281585693359375, "global_step": 176707, "epoch": 4207} {"train_loss": -7.115725040435791, "global_step": 176708, "epoch": 4207} {"train_loss": -7.024123191833496, "global_step": 176709, "epoch": 4207} {"train_loss": -7.054376125335693, "global_step": 176710, "epoch": 4207} {"train_loss": -6.920773029327393, "global_step": 176711, "epoch": 4207} {"train_loss": -7.143978118896484, "global_step": 176712, "epoch": 4207} {"train_loss": -7.007907390594482, "global_step": 176713, "epoch": 4207} {"train_loss": -6.889822959899902, "global_step": 176714, "epoch": 4207} {"train_loss": -7.061976432800293, "global_step": 176715, "epoch": 4207} {"train_loss": -6.960827827453613, "global_step": 176716, "epoch": 4207} {"train_loss": -7.036330223083496, "global_step": 176717, "epoch": 4207} {"train_loss": -7.011191368103027, "global_step": 176718, "epoch": 4207} {"train_loss": -6.832491874694824, "global_step": 176719, "epoch": 4207} {"train_loss": -7.055816650390625, "global_step": 176720, "epoch": 4207} {"train_loss": -6.9673662185668945, "global_step": 176721, "epoch": 4207} {"train_loss": -6.925844192504883, "global_step": 176722, "epoch": 4207} {"train_loss": -7.099244594573975, "global_step": 176723, "epoch": 4207} {"train_loss": -6.992964744567871, "global_step": 176724, "epoch": 4207} {"train_loss": -7.117047309875488, "global_step": 176725, "epoch": 4207} {"train_loss": -6.915821075439453, "global_step": 176726, "epoch": 4207} {"train_loss": -7.037959575653076, "global_step": 176727, "epoch": 4207} {"train_loss": -7.175472259521484, "global_step": 176728, "epoch": 4207} {"train_loss": -6.984825611114502, "global_step": 176729, "epoch": 4207} {"train_loss": -7.009222030639648, "global_step": 176730, "epoch": 4207} {"train_loss": -7.12271785736084, "global_step": 176731, "epoch": 4207} {"train_loss": -6.9985151290893555, "global_step": 176732, "epoch": 4207} {"train_loss": -7.112404823303223, "global_step": 176733, "epoch": 4207} {"train_loss": -7.055899620056152, "global_step": 176734, "epoch": 4207} {"train_loss": -7.04966139793396, "global_step": 176735, "epoch": 4207, "val_loss": 80148.59375} {"train_loss": -7.085068702697754, "global_step": 176736, "epoch": 4208} {"train_loss": -7.052431106567383, "global_step": 176737, "epoch": 4208} {"train_loss": -6.999958515167236, "global_step": 176738, "epoch": 4208} {"train_loss": -7.146266937255859, "global_step": 176739, "epoch": 4208} {"train_loss": -6.896859645843506, "global_step": 176740, "epoch": 4208} {"train_loss": -6.958629608154297, "global_step": 176741, "epoch": 4208} {"train_loss": -6.865939617156982, "global_step": 176742, "epoch": 4208} {"train_loss": -6.91270637512207, "global_step": 176743, "epoch": 4208} {"train_loss": -7.049306869506836, "global_step": 176744, "epoch": 4208} {"train_loss": -6.948176383972168, "global_step": 176745, "epoch": 4208} {"train_loss": -6.845498561859131, "global_step": 176746, "epoch": 4208} {"train_loss": -7.023056983947754, "global_step": 176747, "epoch": 4208} {"train_loss": -6.939108848571777, "global_step": 176748, "epoch": 4208} {"train_loss": -7.04831075668335, "global_step": 176749, "epoch": 4208} {"train_loss": -6.996603965759277, "global_step": 176750, "epoch": 4208} {"train_loss": -7.027759552001953, "global_step": 176751, "epoch": 4208} {"train_loss": -7.110064506530762, "global_step": 176752, "epoch": 4208} {"train_loss": -7.131926536560059, "global_step": 176753, "epoch": 4208} {"train_loss": -7.087660789489746, "global_step": 176754, "epoch": 4208} {"train_loss": -6.973943710327148, "global_step": 176755, "epoch": 4208} {"train_loss": -7.059053421020508, "global_step": 176756, "epoch": 4208} {"train_loss": -7.048386573791504, "global_step": 176757, "epoch": 4208} {"train_loss": -7.1313862800598145, "global_step": 176758, "epoch": 4208} {"train_loss": -7.090967178344727, "global_step": 176759, "epoch": 4208} {"train_loss": -7.040581703186035, "global_step": 176760, "epoch": 4208} {"train_loss": -7.152801036834717, "global_step": 176761, "epoch": 4208} {"train_loss": -7.082695960998535, "global_step": 176762, "epoch": 4208} {"train_loss": -7.072380542755127, "global_step": 176763, "epoch": 4208} {"train_loss": -7.146097660064697, "global_step": 176764, "epoch": 4208} {"train_loss": -7.186180114746094, "global_step": 176765, "epoch": 4208} {"train_loss": -7.157017707824707, "global_step": 176766, "epoch": 4208} {"train_loss": -7.192763805389404, "global_step": 176767, "epoch": 4208} {"train_loss": -7.105273723602295, "global_step": 176768, "epoch": 4208} {"train_loss": -7.188196659088135, "global_step": 176769, "epoch": 4208} {"train_loss": -7.219728469848633, "global_step": 176770, "epoch": 4208} {"train_loss": -7.1938629150390625, "global_step": 176771, "epoch": 4208} {"train_loss": -7.08735466003418, "global_step": 176772, "epoch": 4208} {"train_loss": -7.159185886383057, "global_step": 176773, "epoch": 4208} {"train_loss": -7.137985706329346, "global_step": 176774, "epoch": 4208} {"train_loss": -7.179931640625, "global_step": 176775, "epoch": 4208} {"train_loss": -7.16225528717041, "global_step": 176776, "epoch": 4208} {"train_loss": -7.0744895821525935, "global_step": 176777, "epoch": 4208, "val_loss": 80168.2265625} {"train_loss": -7.173928260803223, "global_step": 176778, "epoch": 4209} {"train_loss": -7.048153400421143, "global_step": 176779, "epoch": 4209} {"train_loss": -6.964995384216309, "global_step": 176780, "epoch": 4209} {"train_loss": -7.070796012878418, "global_step": 176781, "epoch": 4209} {"train_loss": -7.1625776290893555, "global_step": 176782, "epoch": 4209} {"train_loss": -7.169399738311768, "global_step": 176783, "epoch": 4209} {"train_loss": -7.041835784912109, "global_step": 176784, "epoch": 4209} {"train_loss": -7.2348222732543945, "global_step": 176785, "epoch": 4209} {"train_loss": -6.917324066162109, "global_step": 176786, "epoch": 4209} {"train_loss": -6.966949939727783, "global_step": 176787, "epoch": 4209} {"train_loss": -7.121978759765625, "global_step": 176788, "epoch": 4209} {"train_loss": -7.046855926513672, "global_step": 176789, "epoch": 4209} {"train_loss": -7.142824172973633, "global_step": 176790, "epoch": 4209} {"train_loss": -7.1404829025268555, "global_step": 176791, "epoch": 4209} {"train_loss": -6.972794055938721, "global_step": 176792, "epoch": 4209} {"train_loss": -7.011223793029785, "global_step": 176793, "epoch": 4209} {"train_loss": -6.992282867431641, "global_step": 176794, "epoch": 4209} {"train_loss": -7.026500701904297, "global_step": 176795, "epoch": 4209} {"train_loss": -7.018311977386475, "global_step": 176796, "epoch": 4209} {"train_loss": -7.073849201202393, "global_step": 176797, "epoch": 4209} {"train_loss": -7.1203508377075195, "global_step": 176798, "epoch": 4209} {"train_loss": -6.95074462890625, "global_step": 176799, "epoch": 4209} {"train_loss": -7.021552085876465, "global_step": 176800, "epoch": 4209} {"train_loss": -7.077849864959717, "global_step": 176801, "epoch": 4209} {"train_loss": -7.030331134796143, "global_step": 176802, "epoch": 4209} {"train_loss": -7.115070343017578, "global_step": 176803, "epoch": 4209} {"train_loss": -7.0318779945373535, "global_step": 176804, "epoch": 4209} {"train_loss": -7.079993724822998, "global_step": 176805, "epoch": 4209} {"train_loss": -7.034587860107422, "global_step": 176806, "epoch": 4209} {"train_loss": -7.064563274383545, "global_step": 176807, "epoch": 4209} {"train_loss": -7.148716926574707, "global_step": 176808, "epoch": 4209} {"train_loss": -7.080706596374512, "global_step": 176809, "epoch": 4209} {"train_loss": -7.18070650100708, "global_step": 176810, "epoch": 4209} {"train_loss": -7.119561672210693, "global_step": 176811, "epoch": 4209} {"train_loss": -6.999724864959717, "global_step": 176812, "epoch": 4209} {"train_loss": -7.029163360595703, "global_step": 176813, "epoch": 4209} {"train_loss": -7.049963474273682, "global_step": 176814, "epoch": 4209} {"train_loss": -7.000925064086914, "global_step": 176815, "epoch": 4209} {"train_loss": -6.983001708984375, "global_step": 176816, "epoch": 4209} {"train_loss": -7.180343151092529, "global_step": 176817, "epoch": 4209} {"train_loss": -7.0304975509643555, "global_step": 176818, "epoch": 4209} {"train_loss": -7.066050370534261, "global_step": 176819, "epoch": 4209, "val_loss": 80205.734375} {"train_loss": -7.1272430419921875, "global_step": 176820, "epoch": 4210} {"train_loss": -7.079102516174316, "global_step": 176821, "epoch": 4210} {"train_loss": -7.044146537780762, "global_step": 176822, "epoch": 4210} {"train_loss": -7.018825054168701, "global_step": 176823, "epoch": 4210} {"train_loss": -7.065143585205078, "global_step": 176824, "epoch": 4210} {"train_loss": -7.0190229415893555, "global_step": 176825, "epoch": 4210} {"train_loss": -7.158421993255615, "global_step": 176826, "epoch": 4210} {"train_loss": -7.071402549743652, "global_step": 176827, "epoch": 4210} {"train_loss": -7.10756254196167, "global_step": 176828, "epoch": 4210} {"train_loss": -6.969886779785156, "global_step": 176829, "epoch": 4210} {"train_loss": -7.150278091430664, "global_step": 176830, "epoch": 4210} {"train_loss": -7.144756317138672, "global_step": 176831, "epoch": 4210} {"train_loss": -7.175055980682373, "global_step": 176832, "epoch": 4210} {"train_loss": -6.915285587310791, "global_step": 176833, "epoch": 4210} {"train_loss": -7.005403518676758, "global_step": 176834, "epoch": 4210} {"train_loss": -7.074037075042725, "global_step": 176835, "epoch": 4210} {"train_loss": -6.823830604553223, "global_step": 176836, "epoch": 4210} {"train_loss": -7.026021480560303, "global_step": 176837, "epoch": 4210} {"train_loss": -7.013372421264648, "global_step": 176838, "epoch": 4210} {"train_loss": -6.896433353424072, "global_step": 176839, "epoch": 4210} {"train_loss": -7.137922286987305, "global_step": 176840, "epoch": 4210} {"train_loss": -7.0345540046691895, "global_step": 176841, "epoch": 4210} {"train_loss": -7.0220947265625, "global_step": 176842, "epoch": 4210} {"train_loss": -6.981044292449951, "global_step": 176843, "epoch": 4210} {"train_loss": -7.029653549194336, "global_step": 176844, "epoch": 4210} {"train_loss": -7.005358695983887, "global_step": 176845, "epoch": 4210} {"train_loss": -6.980478286743164, "global_step": 176846, "epoch": 4210} {"train_loss": -7.1131591796875, "global_step": 176847, "epoch": 4210} {"train_loss": -7.01834774017334, "global_step": 176848, "epoch": 4210} {"train_loss": -7.037659645080566, "global_step": 176849, "epoch": 4210} {"train_loss": -7.005973815917969, "global_step": 176850, "epoch": 4210} {"train_loss": -7.03398323059082, "global_step": 176851, "epoch": 4210} {"train_loss": -7.005084991455078, "global_step": 176852, "epoch": 4210} {"train_loss": -7.128851890563965, "global_step": 176853, "epoch": 4210} {"train_loss": -7.059432029724121, "global_step": 176854, "epoch": 4210} {"train_loss": -7.051575183868408, "global_step": 176855, "epoch": 4210} {"train_loss": -7.094518661499023, "global_step": 176856, "epoch": 4210} {"train_loss": -7.1547112464904785, "global_step": 176857, "epoch": 4210} {"train_loss": -7.1643385887146, "global_step": 176858, "epoch": 4210} {"train_loss": -7.140321731567383, "global_step": 176859, "epoch": 4210} {"train_loss": -7.202540874481201, "global_step": 176860, "epoch": 4210} {"train_loss": -7.05648117973691, "global_step": 176861, "epoch": 4210, "val_loss": 80059.09375} {"train_loss": -7.252194404602051, "global_step": 176862, "epoch": 4211} {"train_loss": -7.055570125579834, "global_step": 176863, "epoch": 4211} {"train_loss": -7.062891960144043, "global_step": 176864, "epoch": 4211} {"train_loss": -7.082507133483887, "global_step": 176865, "epoch": 4211} {"train_loss": -7.010188102722168, "global_step": 176866, "epoch": 4211} {"train_loss": -7.196184158325195, "global_step": 176867, "epoch": 4211} {"train_loss": -7.16458797454834, "global_step": 176868, "epoch": 4211} {"train_loss": -7.088201522827148, "global_step": 176869, "epoch": 4211} {"train_loss": -7.134493827819824, "global_step": 176870, "epoch": 4211} {"train_loss": -7.215989589691162, "global_step": 176871, "epoch": 4211} {"train_loss": -7.204431533813477, "global_step": 176872, "epoch": 4211} {"train_loss": -7.243556499481201, "global_step": 176873, "epoch": 4211} {"train_loss": -7.031866073608398, "global_step": 176874, "epoch": 4211} {"train_loss": -7.062358856201172, "global_step": 176875, "epoch": 4211} {"train_loss": -7.188147068023682, "global_step": 176876, "epoch": 4211} {"train_loss": -7.10600471496582, "global_step": 176877, "epoch": 4211} {"train_loss": -7.121545791625977, "global_step": 176878, "epoch": 4211} {"train_loss": -7.028988838195801, "global_step": 176879, "epoch": 4211} {"train_loss": -7.128902435302734, "global_step": 176880, "epoch": 4211} {"train_loss": -7.05403995513916, "global_step": 176881, "epoch": 4211} {"train_loss": -7.064729690551758, "global_step": 176882, "epoch": 4211} {"train_loss": -7.05967903137207, "global_step": 176883, "epoch": 4211} {"train_loss": -7.234724998474121, "global_step": 176884, "epoch": 4211} {"train_loss": -7.219249248504639, "global_step": 176885, "epoch": 4211} {"train_loss": -7.104916572570801, "global_step": 176886, "epoch": 4211} {"train_loss": -7.049830913543701, "global_step": 176887, "epoch": 4211} {"train_loss": -7.128238677978516, "global_step": 176888, "epoch": 4211} {"train_loss": -7.034032821655273, "global_step": 176889, "epoch": 4211} {"train_loss": -7.142945766448975, "global_step": 176890, "epoch": 4211} {"train_loss": -7.115388870239258, "global_step": 176891, "epoch": 4211} {"train_loss": -7.130038261413574, "global_step": 176892, "epoch": 4211} {"train_loss": -7.058534622192383, "global_step": 176893, "epoch": 4211} {"train_loss": -7.076018333435059, "global_step": 176894, "epoch": 4211} {"train_loss": -7.199681282043457, "global_step": 176895, "epoch": 4211} {"train_loss": -7.138564109802246, "global_step": 176896, "epoch": 4211} {"train_loss": -7.02421236038208, "global_step": 176897, "epoch": 4211} {"train_loss": -7.146486282348633, "global_step": 176898, "epoch": 4211} {"train_loss": -7.080646514892578, "global_step": 176899, "epoch": 4211} {"train_loss": -7.162481784820557, "global_step": 176900, "epoch": 4211} {"train_loss": -7.13420295715332, "global_step": 176901, "epoch": 4211} {"train_loss": -7.155194282531738, "global_step": 176902, "epoch": 4211} {"train_loss": -7.119884343374343, "global_step": 176903, "epoch": 4211, "val_loss": 80017.5} {"train_loss": -6.929973125457764, "global_step": 176904, "epoch": 4212} {"train_loss": -7.187982559204102, "global_step": 176905, "epoch": 4212} {"train_loss": -7.046927452087402, "global_step": 176906, "epoch": 4212} {"train_loss": -6.928444862365723, "global_step": 176907, "epoch": 4212} {"train_loss": -7.166536331176758, "global_step": 176908, "epoch": 4212} {"train_loss": -6.95886754989624, "global_step": 176909, "epoch": 4212} {"train_loss": -7.197465419769287, "global_step": 176910, "epoch": 4212} {"train_loss": -7.219277381896973, "global_step": 176911, "epoch": 4212} {"train_loss": -7.105299949645996, "global_step": 176912, "epoch": 4212} {"train_loss": -7.157161712646484, "global_step": 176913, "epoch": 4212} {"train_loss": -7.05886173248291, "global_step": 176914, "epoch": 4212} {"train_loss": -7.156886100769043, "global_step": 176915, "epoch": 4212} {"train_loss": -7.007899284362793, "global_step": 176916, "epoch": 4212} {"train_loss": -7.266029357910156, "global_step": 176917, "epoch": 4212} {"train_loss": -7.026467800140381, "global_step": 176918, "epoch": 4212} {"train_loss": -6.981017112731934, "global_step": 176919, "epoch": 4212} {"train_loss": -7.097907543182373, "global_step": 176920, "epoch": 4212} {"train_loss": -7.176782608032227, "global_step": 176921, "epoch": 4212} {"train_loss": -7.148589611053467, "global_step": 176922, "epoch": 4212} {"train_loss": -7.200101852416992, "global_step": 176923, "epoch": 4212} {"train_loss": -7.034331321716309, "global_step": 176924, "epoch": 4212} {"train_loss": -7.054708480834961, "global_step": 176925, "epoch": 4212} {"train_loss": -7.1169891357421875, "global_step": 176926, "epoch": 4212} {"train_loss": -7.142831802368164, "global_step": 176927, "epoch": 4212} {"train_loss": -7.065483093261719, "global_step": 176928, "epoch": 4212} {"train_loss": -7.121193885803223, "global_step": 176929, "epoch": 4212} {"train_loss": -7.102153301239014, "global_step": 176930, "epoch": 4212} {"train_loss": -7.087799072265625, "global_step": 176931, "epoch": 4212} {"train_loss": -7.202460289001465, "global_step": 176932, "epoch": 4212} {"train_loss": -7.156601905822754, "global_step": 176933, "epoch": 4212} {"train_loss": -7.107309341430664, "global_step": 176934, "epoch": 4212} {"train_loss": -7.13486385345459, "global_step": 176935, "epoch": 4212} {"train_loss": -7.2535786628723145, "global_step": 176936, "epoch": 4212} {"train_loss": -7.067681312561035, "global_step": 176937, "epoch": 4212} {"train_loss": -7.241754531860352, "global_step": 176938, "epoch": 4212} {"train_loss": -7.193910598754883, "global_step": 176939, "epoch": 4212} {"train_loss": -7.174932479858398, "global_step": 176940, "epoch": 4212} {"train_loss": -7.161377906799316, "global_step": 176941, "epoch": 4212} {"train_loss": -7.316174507141113, "global_step": 176942, "epoch": 4212} {"train_loss": -7.267274856567383, "global_step": 176943, "epoch": 4212} {"train_loss": -7.210933685302734, "global_step": 176944, "epoch": 4212} {"train_loss": -7.12791429247175, "global_step": 176945, "epoch": 4212, "val_loss": 79974.453125} {"train_loss": -7.196510314941406, "global_step": 176946, "epoch": 4213} {"train_loss": -7.18655252456665, "global_step": 176947, "epoch": 4213} {"train_loss": -7.172511577606201, "global_step": 176948, "epoch": 4213} {"train_loss": -7.154584884643555, "global_step": 176949, "epoch": 4213} {"train_loss": -7.19697904586792, "global_step": 176950, "epoch": 4213} {"train_loss": -7.112546920776367, "global_step": 176951, "epoch": 4213} {"train_loss": -7.002169609069824, "global_step": 176952, "epoch": 4213} {"train_loss": -7.136667728424072, "global_step": 176953, "epoch": 4213} {"train_loss": -7.069882869720459, "global_step": 176954, "epoch": 4213} {"train_loss": -7.064716339111328, "global_step": 176955, "epoch": 4213} {"train_loss": -6.879748821258545, "global_step": 176956, "epoch": 4213} {"train_loss": -7.049638748168945, "global_step": 176957, "epoch": 4213} {"train_loss": -7.089078903198242, "global_step": 176958, "epoch": 4213} {"train_loss": -6.962793350219727, "global_step": 176959, "epoch": 4213} {"train_loss": -7.141546726226807, "global_step": 176960, "epoch": 4213} {"train_loss": -6.960325241088867, "global_step": 176961, "epoch": 4213} {"train_loss": -6.927734851837158, "global_step": 176962, "epoch": 4213} {"train_loss": -7.051799297332764, "global_step": 176963, "epoch": 4213} {"train_loss": -6.8200812339782715, "global_step": 176964, "epoch": 4213} {"train_loss": -7.023176193237305, "global_step": 176965, "epoch": 4213} {"train_loss": -6.589741230010986, "global_step": 176966, "epoch": 4213} {"train_loss": -7.0053558349609375, "global_step": 176967, "epoch": 4213} {"train_loss": -6.9057207107543945, "global_step": 176968, "epoch": 4213} {"train_loss": -6.834692001342773, "global_step": 176969, "epoch": 4213} {"train_loss": -6.845986366271973, "global_step": 176970, "epoch": 4213} {"train_loss": -6.894231796264648, "global_step": 176971, "epoch": 4213} {"train_loss": -6.887554168701172, "global_step": 176972, "epoch": 4213} {"train_loss": -6.855203628540039, "global_step": 176973, "epoch": 4213} {"train_loss": -6.927603721618652, "global_step": 176974, "epoch": 4213} {"train_loss": -6.9576802253723145, "global_step": 176975, "epoch": 4213} {"train_loss": -6.963582992553711, "global_step": 176976, "epoch": 4213} {"train_loss": -6.8654632568359375, "global_step": 176977, "epoch": 4213} {"train_loss": -7.0257978439331055, "global_step": 176978, "epoch": 4213} {"train_loss": -6.954242706298828, "global_step": 176979, "epoch": 4213} {"train_loss": -7.024219512939453, "global_step": 176980, "epoch": 4213} {"train_loss": -6.985996246337891, "global_step": 176981, "epoch": 4213} {"train_loss": -6.939631462097168, "global_step": 176982, "epoch": 4213} {"train_loss": -7.150529861450195, "global_step": 176983, "epoch": 4213} {"train_loss": -7.123368740081787, "global_step": 176984, "epoch": 4213} {"train_loss": -7.034343242645264, "global_step": 176985, "epoch": 4213} {"train_loss": -7.104253768920898, "global_step": 176986, "epoch": 4213} {"train_loss": -7.005212306976318, "global_step": 176987, "epoch": 4213, "val_loss": 80156.140625} {"train_loss": -7.179834365844727, "global_step": 176988, "epoch": 4214} {"train_loss": -7.132580757141113, "global_step": 176989, "epoch": 4214} {"train_loss": -7.037243366241455, "global_step": 176990, "epoch": 4214} {"train_loss": -7.114802837371826, "global_step": 176991, "epoch": 4214} {"train_loss": -7.0162882804870605, "global_step": 176992, "epoch": 4214} {"train_loss": -7.014629364013672, "global_step": 176993, "epoch": 4214} {"train_loss": -7.087629795074463, "global_step": 176994, "epoch": 4214} {"train_loss": -7.059993743896484, "global_step": 176995, "epoch": 4214} {"train_loss": -7.0935564041137695, "global_step": 176996, "epoch": 4214} {"train_loss": -7.190993309020996, "global_step": 176997, "epoch": 4214} {"train_loss": -7.071536064147949, "global_step": 176998, "epoch": 4214} {"train_loss": -7.244150638580322, "global_step": 176999, "epoch": 4214} {"train_loss": -7.230314254760742, "global_step": 177000, "epoch": 4214} {"train_loss": -7.194397926330566, "global_step": 177001, "epoch": 4214} {"train_loss": -7.218038558959961, "global_step": 177002, "epoch": 4214} {"train_loss": -7.196442127227783, "global_step": 177003, "epoch": 4214} {"train_loss": -7.285370826721191, "global_step": 177004, "epoch": 4214} {"train_loss": -7.161143779754639, "global_step": 177005, "epoch": 4214} {"train_loss": -7.050356388092041, "global_step": 177006, "epoch": 4214} {"train_loss": -7.266536712646484, "global_step": 177007, "epoch": 4214} {"train_loss": -7.133530616760254, "global_step": 177008, "epoch": 4214} {"train_loss": -7.25390100479126, "global_step": 177009, "epoch": 4214} {"train_loss": -7.125667572021484, "global_step": 177010, "epoch": 4214} {"train_loss": -7.153532981872559, "global_step": 177011, "epoch": 4214} {"train_loss": -7.185783386230469, "global_step": 177012, "epoch": 4214} {"train_loss": -7.188421249389648, "global_step": 177013, "epoch": 4214} {"train_loss": -7.10551643371582, "global_step": 177014, "epoch": 4214} {"train_loss": -7.270991325378418, "global_step": 177015, "epoch": 4214} {"train_loss": -7.1636061668396, "global_step": 177016, "epoch": 4214} {"train_loss": -7.1047468185424805, "global_step": 177017, "epoch": 4214} {"train_loss": -7.085415840148926, "global_step": 177018, "epoch": 4214} {"train_loss": -7.148151874542236, "global_step": 177019, "epoch": 4214} {"train_loss": -7.134105682373047, "global_step": 177020, "epoch": 4214} {"train_loss": -7.007156848907471, "global_step": 177021, "epoch": 4214} {"train_loss": -7.133586883544922, "global_step": 177022, "epoch": 4214} {"train_loss": -6.934866905212402, "global_step": 177023, "epoch": 4214} {"train_loss": -7.005878448486328, "global_step": 177024, "epoch": 4214} {"train_loss": -7.107269287109375, "global_step": 177025, "epoch": 4214} {"train_loss": -7.122297286987305, "global_step": 177026, "epoch": 4214} {"train_loss": -7.0253801345825195, "global_step": 177027, "epoch": 4214} {"train_loss": -7.213376998901367, "global_step": 177028, "epoch": 4214} {"train_loss": -7.127684740793137, "global_step": 177029, "epoch": 4214, "val_loss": 80306.8046875} {"train_loss": -7.085418701171875, "global_step": 177030, "epoch": 4215} {"train_loss": -7.202670574188232, "global_step": 177031, "epoch": 4215} {"train_loss": -7.195437431335449, "global_step": 177032, "epoch": 4215} {"train_loss": -7.120798587799072, "global_step": 177033, "epoch": 4215} {"train_loss": -7.214237213134766, "global_step": 177034, "epoch": 4215} {"train_loss": -7.136527061462402, "global_step": 177035, "epoch": 4215} {"train_loss": -7.0883283615112305, "global_step": 177036, "epoch": 4215} {"train_loss": -7.1127028465271, "global_step": 177037, "epoch": 4215} {"train_loss": -7.0846967697143555, "global_step": 177038, "epoch": 4215} {"train_loss": -7.152392864227295, "global_step": 177039, "epoch": 4215} {"train_loss": -7.169172286987305, "global_step": 177040, "epoch": 4215} {"train_loss": -7.204832077026367, "global_step": 177041, "epoch": 4215} {"train_loss": -7.187475681304932, "global_step": 177042, "epoch": 4215} {"train_loss": -7.080639839172363, "global_step": 177043, "epoch": 4215} {"train_loss": -7.120929718017578, "global_step": 177044, "epoch": 4215} {"train_loss": -7.23277473449707, "global_step": 177045, "epoch": 4215} {"train_loss": -7.258693218231201, "global_step": 177046, "epoch": 4215} {"train_loss": -7.259373664855957, "global_step": 177047, "epoch": 4215} {"train_loss": -7.240119934082031, "global_step": 177048, "epoch": 4215} {"train_loss": -7.102574825286865, "global_step": 177049, "epoch": 4215} {"train_loss": -7.106256008148193, "global_step": 177050, "epoch": 4215} {"train_loss": -7.187673568725586, "global_step": 177051, "epoch": 4215} {"train_loss": -7.04338264465332, "global_step": 177052, "epoch": 4215} {"train_loss": -7.1109619140625, "global_step": 177053, "epoch": 4215} {"train_loss": -7.115184783935547, "global_step": 177054, "epoch": 4215} {"train_loss": -7.172718524932861, "global_step": 177055, "epoch": 4215} {"train_loss": -7.221811771392822, "global_step": 177056, "epoch": 4215} {"train_loss": -7.150055885314941, "global_step": 177057, "epoch": 4215} {"train_loss": -7.073422908782959, "global_step": 177058, "epoch": 4215} {"train_loss": -7.127256393432617, "global_step": 177059, "epoch": 4215} {"train_loss": -7.128363609313965, "global_step": 177060, "epoch": 4215} {"train_loss": -7.1366448402404785, "global_step": 177061, "epoch": 4215} {"train_loss": -7.202605247497559, "global_step": 177062, "epoch": 4215} {"train_loss": -7.126633644104004, "global_step": 177063, "epoch": 4215} {"train_loss": -7.0997819900512695, "global_step": 177064, "epoch": 4215} {"train_loss": -7.187065124511719, "global_step": 177065, "epoch": 4215} {"train_loss": -7.119363784790039, "global_step": 177066, "epoch": 4215} {"train_loss": -7.086933135986328, "global_step": 177067, "epoch": 4215} {"train_loss": -7.077599048614502, "global_step": 177068, "epoch": 4215} {"train_loss": -7.10642147064209, "global_step": 177069, "epoch": 4215} {"train_loss": -7.1035356521606445, "global_step": 177070, "epoch": 4215} {"train_loss": -7.145678270430792, "global_step": 177071, "epoch": 4215, "val_loss": 80046.2265625} {"train_loss": -7.132828712463379, "global_step": 177072, "epoch": 4216} {"train_loss": -7.157466888427734, "global_step": 177073, "epoch": 4216} {"train_loss": -7.069351673126221, "global_step": 177074, "epoch": 4216} {"train_loss": -7.043688774108887, "global_step": 177075, "epoch": 4216} {"train_loss": -7.15614128112793, "global_step": 177076, "epoch": 4216} {"train_loss": -7.136395454406738, "global_step": 177077, "epoch": 4216} {"train_loss": -7.077239990234375, "global_step": 177078, "epoch": 4216} {"train_loss": -7.168248653411865, "global_step": 177079, "epoch": 4216} {"train_loss": -7.153537750244141, "global_step": 177080, "epoch": 4216} {"train_loss": -7.0978312492370605, "global_step": 177081, "epoch": 4216} {"train_loss": -7.168598175048828, "global_step": 177082, "epoch": 4216} {"train_loss": -7.209712982177734, "global_step": 177083, "epoch": 4216} {"train_loss": -7.184154987335205, "global_step": 177084, "epoch": 4216} {"train_loss": -7.015080451965332, "global_step": 177085, "epoch": 4216} {"train_loss": -7.049591064453125, "global_step": 177086, "epoch": 4216} {"train_loss": -7.255291938781738, "global_step": 177087, "epoch": 4216} {"train_loss": -7.219717502593994, "global_step": 177088, "epoch": 4216} {"train_loss": -7.166484355926514, "global_step": 177089, "epoch": 4216} {"train_loss": -7.184809684753418, "global_step": 177090, "epoch": 4216} {"train_loss": -7.138577461242676, "global_step": 177091, "epoch": 4216} {"train_loss": -7.088740348815918, "global_step": 177092, "epoch": 4216} {"train_loss": -7.246258735656738, "global_step": 177093, "epoch": 4216} {"train_loss": -7.081965446472168, "global_step": 177094, "epoch": 4216} {"train_loss": -7.08145809173584, "global_step": 177095, "epoch": 4216} {"train_loss": -7.18692684173584, "global_step": 177096, "epoch": 4216} {"train_loss": -7.154038906097412, "global_step": 177097, "epoch": 4216} {"train_loss": -7.094615936279297, "global_step": 177098, "epoch": 4216} {"train_loss": -7.096503734588623, "global_step": 177099, "epoch": 4216} {"train_loss": -7.019063949584961, "global_step": 177100, "epoch": 4216} {"train_loss": -7.083422660827637, "global_step": 177101, "epoch": 4216} {"train_loss": -7.174576282501221, "global_step": 177102, "epoch": 4216} {"train_loss": -7.190401077270508, "global_step": 177103, "epoch": 4216} {"train_loss": -7.165931701660156, "global_step": 177104, "epoch": 4216} {"train_loss": -7.1893310546875, "global_step": 177105, "epoch": 4216} {"train_loss": -7.037918567657471, "global_step": 177106, "epoch": 4216} {"train_loss": -7.2171125411987305, "global_step": 177107, "epoch": 4216} {"train_loss": -7.115167617797852, "global_step": 177108, "epoch": 4216} {"train_loss": -7.087708473205566, "global_step": 177109, "epoch": 4216} {"train_loss": -7.284040451049805, "global_step": 177110, "epoch": 4216} {"train_loss": -7.249077320098877, "global_step": 177111, "epoch": 4216} {"train_loss": -7.146465301513672, "global_step": 177112, "epoch": 4216} {"train_loss": -7.141371738343012, "global_step": 177113, "epoch": 4216, "val_loss": 80258.921875} {"train_loss": -7.186189651489258, "global_step": 177114, "epoch": 4217} {"train_loss": -7.268845558166504, "global_step": 177115, "epoch": 4217} {"train_loss": -7.083225250244141, "global_step": 177116, "epoch": 4217} {"train_loss": -7.107251167297363, "global_step": 177117, "epoch": 4217} {"train_loss": -7.053991794586182, "global_step": 177118, "epoch": 4217} {"train_loss": -7.167471885681152, "global_step": 177119, "epoch": 4217} {"train_loss": -7.172220230102539, "global_step": 177120, "epoch": 4217} {"train_loss": -6.9300618171691895, "global_step": 177121, "epoch": 4217} {"train_loss": -6.9066901206970215, "global_step": 177122, "epoch": 4217} {"train_loss": -7.2092485427856445, "global_step": 177123, "epoch": 4217} {"train_loss": -6.974238872528076, "global_step": 177124, "epoch": 4217} {"train_loss": -6.979001998901367, "global_step": 177125, "epoch": 4217} {"train_loss": -7.015998840332031, "global_step": 177126, "epoch": 4217} {"train_loss": -6.921548843383789, "global_step": 177127, "epoch": 4217} {"train_loss": -7.100432395935059, "global_step": 177128, "epoch": 4217} {"train_loss": -7.058910369873047, "global_step": 177129, "epoch": 4217} {"train_loss": -7.0602874755859375, "global_step": 177130, "epoch": 4217} {"train_loss": -7.12449312210083, "global_step": 177131, "epoch": 4217} {"train_loss": -6.942199230194092, "global_step": 177132, "epoch": 4217} {"train_loss": -7.0506367683410645, "global_step": 177133, "epoch": 4217} {"train_loss": -7.002261161804199, "global_step": 177134, "epoch": 4217} {"train_loss": -6.988391876220703, "global_step": 177135, "epoch": 4217} {"train_loss": -7.084103584289551, "global_step": 177136, "epoch": 4217} {"train_loss": -6.984221458435059, "global_step": 177137, "epoch": 4217} {"train_loss": -7.058187484741211, "global_step": 177138, "epoch": 4217} {"train_loss": -6.960750579833984, "global_step": 177139, "epoch": 4217} {"train_loss": -7.046860694885254, "global_step": 177140, "epoch": 4217} {"train_loss": -6.896663188934326, "global_step": 177141, "epoch": 4217} {"train_loss": -7.0777974128723145, "global_step": 177142, "epoch": 4217} {"train_loss": -7.089130401611328, "global_step": 177143, "epoch": 4217} {"train_loss": -6.9061665534973145, "global_step": 177144, "epoch": 4217} {"train_loss": -6.962466239929199, "global_step": 177145, "epoch": 4217} {"train_loss": -7.008941650390625, "global_step": 177146, "epoch": 4217} {"train_loss": -7.160650730133057, "global_step": 177147, "epoch": 4217} {"train_loss": -7.096637725830078, "global_step": 177148, "epoch": 4217} {"train_loss": -7.04149055480957, "global_step": 177149, "epoch": 4217} {"train_loss": -7.052485466003418, "global_step": 177150, "epoch": 4217} {"train_loss": -7.0525360107421875, "global_step": 177151, "epoch": 4217} {"train_loss": -7.10168981552124, "global_step": 177152, "epoch": 4217} {"train_loss": -7.074593544006348, "global_step": 177153, "epoch": 4217} {"train_loss": -7.097931861877441, "global_step": 177154, "epoch": 4217} {"train_loss": -7.052815096718924, "global_step": 177155, "epoch": 4217, "val_loss": 80328.484375} {"train_loss": -7.077178955078125, "global_step": 177156, "epoch": 4218} {"train_loss": -7.098145484924316, "global_step": 177157, "epoch": 4218} {"train_loss": -7.125225067138672, "global_step": 177158, "epoch": 4218} {"train_loss": -7.215723037719727, "global_step": 177159, "epoch": 4218} {"train_loss": -7.145279884338379, "global_step": 177160, "epoch": 4218} {"train_loss": -7.050835609436035, "global_step": 177161, "epoch": 4218} {"train_loss": -7.077768325805664, "global_step": 177162, "epoch": 4218} {"train_loss": -7.1214728355407715, "global_step": 177163, "epoch": 4218} {"train_loss": -6.943027973175049, "global_step": 177164, "epoch": 4218} {"train_loss": -7.160051345825195, "global_step": 177165, "epoch": 4218} {"train_loss": -7.123266220092773, "global_step": 177166, "epoch": 4218} {"train_loss": -7.116957187652588, "global_step": 177167, "epoch": 4218} {"train_loss": -7.130851745605469, "global_step": 177168, "epoch": 4218} {"train_loss": -7.129268646240234, "global_step": 177169, "epoch": 4218} {"train_loss": -7.152912616729736, "global_step": 177170, "epoch": 4218} {"train_loss": -6.999188423156738, "global_step": 177171, "epoch": 4218} {"train_loss": -7.0964508056640625, "global_step": 177172, "epoch": 4218} {"train_loss": -7.190686225891113, "global_step": 177173, "epoch": 4218} {"train_loss": -7.012768745422363, "global_step": 177174, "epoch": 4218} {"train_loss": -7.121517181396484, "global_step": 177175, "epoch": 4218} {"train_loss": -6.990630149841309, "global_step": 177176, "epoch": 4218} {"train_loss": -7.0347514152526855, "global_step": 177177, "epoch": 4218} {"train_loss": -7.175183296203613, "global_step": 177178, "epoch": 4218} {"train_loss": -7.092378616333008, "global_step": 177179, "epoch": 4218} {"train_loss": -7.128905296325684, "global_step": 177180, "epoch": 4218} {"train_loss": -6.9023118019104, "global_step": 177181, "epoch": 4218} {"train_loss": -7.045554161071777, "global_step": 177182, "epoch": 4218} {"train_loss": -7.1508588790893555, "global_step": 177183, "epoch": 4218} {"train_loss": -7.029376029968262, "global_step": 177184, "epoch": 4218} {"train_loss": -7.157428741455078, "global_step": 177185, "epoch": 4218} {"train_loss": -7.111368179321289, "global_step": 177186, "epoch": 4218} {"train_loss": -7.046348571777344, "global_step": 177187, "epoch": 4218} {"train_loss": -7.070817947387695, "global_step": 177188, "epoch": 4218} {"train_loss": -7.112810134887695, "global_step": 177189, "epoch": 4218} {"train_loss": -7.081013202667236, "global_step": 177190, "epoch": 4218} {"train_loss": -7.0300092697143555, "global_step": 177191, "epoch": 4218} {"train_loss": -7.166296005249023, "global_step": 177192, "epoch": 4218} {"train_loss": -7.137089252471924, "global_step": 177193, "epoch": 4218} {"train_loss": -7.0700483322143555, "global_step": 177194, "epoch": 4218} {"train_loss": -7.012325286865234, "global_step": 177195, "epoch": 4218} {"train_loss": -7.13286018371582, "global_step": 177196, "epoch": 4218} {"train_loss": -7.091169573011852, "global_step": 177197, "epoch": 4218, "val_loss": 80349.328125} {"train_loss": -7.08966064453125, "global_step": 177198, "epoch": 4219} {"train_loss": -7.119654178619385, "global_step": 177199, "epoch": 4219} {"train_loss": -7.099874019622803, "global_step": 177200, "epoch": 4219} {"train_loss": -7.263519287109375, "global_step": 177201, "epoch": 4219} {"train_loss": -7.082947731018066, "global_step": 177202, "epoch": 4219} {"train_loss": -7.145601272583008, "global_step": 177203, "epoch": 4219} {"train_loss": -7.166186332702637, "global_step": 177204, "epoch": 4219} {"train_loss": -6.991106986999512, "global_step": 177205, "epoch": 4219} {"train_loss": -7.141244888305664, "global_step": 177206, "epoch": 4219} {"train_loss": -7.138641357421875, "global_step": 177207, "epoch": 4219} {"train_loss": -7.109648704528809, "global_step": 177208, "epoch": 4219} {"train_loss": -7.127069473266602, "global_step": 177209, "epoch": 4219} {"train_loss": -7.201846122741699, "global_step": 177210, "epoch": 4219} {"train_loss": -7.144235134124756, "global_step": 177211, "epoch": 4219} {"train_loss": -7.075772762298584, "global_step": 177212, "epoch": 4219} {"train_loss": -7.060450553894043, "global_step": 177213, "epoch": 4219} {"train_loss": -7.053322792053223, "global_step": 177214, "epoch": 4219} {"train_loss": -6.989017963409424, "global_step": 177215, "epoch": 4219} {"train_loss": -7.153382778167725, "global_step": 177216, "epoch": 4219} {"train_loss": -7.018810272216797, "global_step": 177217, "epoch": 4219} {"train_loss": -6.972334861755371, "global_step": 177218, "epoch": 4219} {"train_loss": -7.086128234863281, "global_step": 177219, "epoch": 4219} {"train_loss": -7.027303695678711, "global_step": 177220, "epoch": 4219} {"train_loss": -7.162862300872803, "global_step": 177221, "epoch": 4219} {"train_loss": -6.980251312255859, "global_step": 177222, "epoch": 4219} {"train_loss": -6.8877339363098145, "global_step": 177223, "epoch": 4219} {"train_loss": -7.032785415649414, "global_step": 177224, "epoch": 4219} {"train_loss": -7.142453193664551, "global_step": 177225, "epoch": 4219} {"train_loss": -7.027041912078857, "global_step": 177226, "epoch": 4219} {"train_loss": -6.963588714599609, "global_step": 177227, "epoch": 4219} {"train_loss": -7.172118186950684, "global_step": 177228, "epoch": 4219} {"train_loss": -7.124449729919434, "global_step": 177229, "epoch": 4219} {"train_loss": -7.077364921569824, "global_step": 177230, "epoch": 4219} {"train_loss": -7.211581230163574, "global_step": 177231, "epoch": 4219} {"train_loss": -7.018229961395264, "global_step": 177232, "epoch": 4219} {"train_loss": -6.999770641326904, "global_step": 177233, "epoch": 4219} {"train_loss": -7.11256742477417, "global_step": 177234, "epoch": 4219} {"train_loss": -7.097750663757324, "global_step": 177235, "epoch": 4219} {"train_loss": -7.147001266479492, "global_step": 177236, "epoch": 4219} {"train_loss": -7.1418561935424805, "global_step": 177237, "epoch": 4219} {"train_loss": -7.10336971282959, "global_step": 177238, "epoch": 4219} {"train_loss": -7.087437958944411, "global_step": 177239, "epoch": 4219, "val_loss": 80241.3984375} {"train_loss": -7.156829357147217, "global_step": 177240, "epoch": 4220} {"train_loss": -7.113499641418457, "global_step": 177241, "epoch": 4220} {"train_loss": -7.065089225769043, "global_step": 177242, "epoch": 4220} {"train_loss": -7.056726932525635, "global_step": 177243, "epoch": 4220} {"train_loss": -7.192108631134033, "global_step": 177244, "epoch": 4220} {"train_loss": -7.1573486328125, "global_step": 177245, "epoch": 4220} {"train_loss": -7.151220321655273, "global_step": 177246, "epoch": 4220} {"train_loss": -7.175692558288574, "global_step": 177247, "epoch": 4220} {"train_loss": -7.112853050231934, "global_step": 177248, "epoch": 4220} {"train_loss": -7.112879753112793, "global_step": 177249, "epoch": 4220} {"train_loss": -7.121103286743164, "global_step": 177250, "epoch": 4220} {"train_loss": -7.011744499206543, "global_step": 177251, "epoch": 4220} {"train_loss": -7.0314226150512695, "global_step": 177252, "epoch": 4220} {"train_loss": -7.105551242828369, "global_step": 177253, "epoch": 4220} {"train_loss": -7.04661750793457, "global_step": 177254, "epoch": 4220} {"train_loss": -7.040836811065674, "global_step": 177255, "epoch": 4220} {"train_loss": -7.08585786819458, "global_step": 177256, "epoch": 4220} {"train_loss": -6.959270477294922, "global_step": 177257, "epoch": 4220} {"train_loss": -6.995819091796875, "global_step": 177258, "epoch": 4220} {"train_loss": -7.071750640869141, "global_step": 177259, "epoch": 4220} {"train_loss": -7.085237503051758, "global_step": 177260, "epoch": 4220} {"train_loss": -7.090470314025879, "global_step": 177261, "epoch": 4220} {"train_loss": -7.08212423324585, "global_step": 177262, "epoch": 4220} {"train_loss": -7.106568813323975, "global_step": 177263, "epoch": 4220} {"train_loss": -6.99130916595459, "global_step": 177264, "epoch": 4220} {"train_loss": -6.973804473876953, "global_step": 177265, "epoch": 4220} {"train_loss": -7.11274528503418, "global_step": 177266, "epoch": 4220} {"train_loss": -6.885589599609375, "global_step": 177267, "epoch": 4220} {"train_loss": -7.0356855392456055, "global_step": 177268, "epoch": 4220} {"train_loss": -7.082574844360352, "global_step": 177269, "epoch": 4220} {"train_loss": -7.086448669433594, "global_step": 177270, "epoch": 4220} {"train_loss": -7.198490142822266, "global_step": 177271, "epoch": 4220} {"train_loss": -7.010578155517578, "global_step": 177272, "epoch": 4220} {"train_loss": -7.075173377990723, "global_step": 177273, "epoch": 4220} {"train_loss": -7.018545150756836, "global_step": 177274, "epoch": 4220} {"train_loss": -7.112979888916016, "global_step": 177275, "epoch": 4220} {"train_loss": -7.037583351135254, "global_step": 177276, "epoch": 4220} {"train_loss": -7.136519432067871, "global_step": 177277, "epoch": 4220} {"train_loss": -7.070398330688477, "global_step": 177278, "epoch": 4220} {"train_loss": -7.0042829513549805, "global_step": 177279, "epoch": 4220} {"train_loss": -7.073653221130371, "global_step": 177280, "epoch": 4220} {"train_loss": -7.0743496645064585, "global_step": 177281, "epoch": 4220, "val_loss": 80427.2578125} {"train_loss": -7.092751502990723, "global_step": 177282, "epoch": 4221} {"train_loss": -7.135407447814941, "global_step": 177283, "epoch": 4221} {"train_loss": -7.090611457824707, "global_step": 177284, "epoch": 4221} {"train_loss": -7.137093544006348, "global_step": 177285, "epoch": 4221} {"train_loss": -7.249295711517334, "global_step": 177286, "epoch": 4221} {"train_loss": -7.072518348693848, "global_step": 177287, "epoch": 4221} {"train_loss": -7.123492240905762, "global_step": 177288, "epoch": 4221} {"train_loss": -7.102686882019043, "global_step": 177289, "epoch": 4221} {"train_loss": -7.201318264007568, "global_step": 177290, "epoch": 4221} {"train_loss": -7.121426582336426, "global_step": 177291, "epoch": 4221} {"train_loss": -7.030026912689209, "global_step": 177292, "epoch": 4221} {"train_loss": -7.069151878356934, "global_step": 177293, "epoch": 4221} {"train_loss": -7.049034118652344, "global_step": 177294, "epoch": 4221} {"train_loss": -7.185501575469971, "global_step": 177295, "epoch": 4221} {"train_loss": -6.994840621948242, "global_step": 177296, "epoch": 4221} {"train_loss": -7.107254981994629, "global_step": 177297, "epoch": 4221} {"train_loss": -7.109740257263184, "global_step": 177298, "epoch": 4221} {"train_loss": -7.133523941040039, "global_step": 177299, "epoch": 4221} {"train_loss": -7.126339912414551, "global_step": 177300, "epoch": 4221} {"train_loss": -7.085843086242676, "global_step": 177301, "epoch": 4221} {"train_loss": -7.039153099060059, "global_step": 177302, "epoch": 4221} {"train_loss": -7.002719879150391, "global_step": 177303, "epoch": 4221} {"train_loss": -7.140651702880859, "global_step": 177304, "epoch": 4221} {"train_loss": -7.173245429992676, "global_step": 177305, "epoch": 4221} {"train_loss": -7.224135398864746, "global_step": 177306, "epoch": 4221} {"train_loss": -7.157877445220947, "global_step": 177307, "epoch": 4221} {"train_loss": -7.188244819641113, "global_step": 177308, "epoch": 4221} {"train_loss": -7.213188171386719, "global_step": 177309, "epoch": 4221} {"train_loss": -7.14631462097168, "global_step": 177310, "epoch": 4221} {"train_loss": -7.211289405822754, "global_step": 177311, "epoch": 4221} {"train_loss": -7.058777332305908, "global_step": 177312, "epoch": 4221} {"train_loss": -7.16378927230835, "global_step": 177313, "epoch": 4221} {"train_loss": -7.202373027801514, "global_step": 177314, "epoch": 4221} {"train_loss": -7.0657758712768555, "global_step": 177315, "epoch": 4221} {"train_loss": -7.183465957641602, "global_step": 177316, "epoch": 4221} {"train_loss": -7.092461109161377, "global_step": 177317, "epoch": 4221} {"train_loss": -7.1392903327941895, "global_step": 177318, "epoch": 4221} {"train_loss": -7.01556921005249, "global_step": 177319, "epoch": 4221} {"train_loss": -6.981986045837402, "global_step": 177320, "epoch": 4221} {"train_loss": -7.111466407775879, "global_step": 177321, "epoch": 4221} {"train_loss": -6.9827470779418945, "global_step": 177322, "epoch": 4221} {"train_loss": -7.112394014994304, "global_step": 177323, "epoch": 4221, "val_loss": 79991.2578125} {"train_loss": -7.068442344665527, "global_step": 177324, "epoch": 4222} {"train_loss": -7.046265602111816, "global_step": 177325, "epoch": 4222} {"train_loss": -7.160155296325684, "global_step": 177326, "epoch": 4222} {"train_loss": -7.1426472663879395, "global_step": 177327, "epoch": 4222} {"train_loss": -6.9242424964904785, "global_step": 177328, "epoch": 4222} {"train_loss": -7.046887397766113, "global_step": 177329, "epoch": 4222} {"train_loss": -7.051616668701172, "global_step": 177330, "epoch": 4222} {"train_loss": -7.166073799133301, "global_step": 177331, "epoch": 4222} {"train_loss": -7.10087776184082, "global_step": 177332, "epoch": 4222} {"train_loss": -7.080265045166016, "global_step": 177333, "epoch": 4222} {"train_loss": -7.141202926635742, "global_step": 177334, "epoch": 4222} {"train_loss": -7.029634952545166, "global_step": 177335, "epoch": 4222} {"train_loss": -7.144054412841797, "global_step": 177336, "epoch": 4222} {"train_loss": -7.057710647583008, "global_step": 177337, "epoch": 4222} {"train_loss": -7.099033355712891, "global_step": 177338, "epoch": 4222} {"train_loss": -7.113582611083984, "global_step": 177339, "epoch": 4222} {"train_loss": -7.137019157409668, "global_step": 177340, "epoch": 4222} {"train_loss": -6.9844136238098145, "global_step": 177341, "epoch": 4222} {"train_loss": -7.134979248046875, "global_step": 177342, "epoch": 4222} {"train_loss": -6.9355597496032715, "global_step": 177343, "epoch": 4222} {"train_loss": -7.0058488845825195, "global_step": 177344, "epoch": 4222} {"train_loss": -7.035856246948242, "global_step": 177345, "epoch": 4222} {"train_loss": -6.932593822479248, "global_step": 177346, "epoch": 4222} {"train_loss": -6.828950881958008, "global_step": 177347, "epoch": 4222} {"train_loss": -6.89255952835083, "global_step": 177348, "epoch": 4222} {"train_loss": -6.95792293548584, "global_step": 177349, "epoch": 4222} {"train_loss": -7.019362449645996, "global_step": 177350, "epoch": 4222} {"train_loss": -7.034257888793945, "global_step": 177351, "epoch": 4222} {"train_loss": -6.932541847229004, "global_step": 177352, "epoch": 4222} {"train_loss": -6.999967575073242, "global_step": 177353, "epoch": 4222} {"train_loss": -6.956815242767334, "global_step": 177354, "epoch": 4222} {"train_loss": -7.016161918640137, "global_step": 177355, "epoch": 4222} {"train_loss": -7.07813835144043, "global_step": 177356, "epoch": 4222} {"train_loss": -6.980688095092773, "global_step": 177357, "epoch": 4222} {"train_loss": -7.112728118896484, "global_step": 177358, "epoch": 4222} {"train_loss": -7.008814811706543, "global_step": 177359, "epoch": 4222} {"train_loss": -7.030863285064697, "global_step": 177360, "epoch": 4222} {"train_loss": -7.017511367797852, "global_step": 177361, "epoch": 4222} {"train_loss": -7.003501892089844, "global_step": 177362, "epoch": 4222} {"train_loss": -7.0773420333862305, "global_step": 177363, "epoch": 4222} {"train_loss": -7.105130672454834, "global_step": 177364, "epoch": 4222} {"train_loss": -7.039142222631545, "global_step": 177365, "epoch": 4222, "val_loss": 80460.375} {"train_loss": -7.001668930053711, "global_step": 177366, "epoch": 4223} {"train_loss": -7.021570205688477, "global_step": 177367, "epoch": 4223} {"train_loss": -7.06508731842041, "global_step": 177368, "epoch": 4223} {"train_loss": -7.074272155761719, "global_step": 177369, "epoch": 4223} {"train_loss": -7.200073719024658, "global_step": 177370, "epoch": 4223} {"train_loss": -7.077880382537842, "global_step": 177371, "epoch": 4223} {"train_loss": -7.062845706939697, "global_step": 177372, "epoch": 4223} {"train_loss": -7.010898113250732, "global_step": 177373, "epoch": 4223} {"train_loss": -7.134856700897217, "global_step": 177374, "epoch": 4223} {"train_loss": -7.026579856872559, "global_step": 177375, "epoch": 4223} {"train_loss": -7.147516250610352, "global_step": 177376, "epoch": 4223} {"train_loss": -7.242530822753906, "global_step": 177377, "epoch": 4223} {"train_loss": -7.1676201820373535, "global_step": 177378, "epoch": 4223} {"train_loss": -7.097786903381348, "global_step": 177379, "epoch": 4223} {"train_loss": -7.255876541137695, "global_step": 177380, "epoch": 4223} {"train_loss": -7.145832061767578, "global_step": 177381, "epoch": 4223} {"train_loss": -7.2326579093933105, "global_step": 177382, "epoch": 4223} {"train_loss": -7.127189636230469, "global_step": 177383, "epoch": 4223} {"train_loss": -7.12088680267334, "global_step": 177384, "epoch": 4223} {"train_loss": -7.235097885131836, "global_step": 177385, "epoch": 4223} {"train_loss": -7.155115127563477, "global_step": 177386, "epoch": 4223} {"train_loss": -7.274299621582031, "global_step": 177387, "epoch": 4223} {"train_loss": -7.184330940246582, "global_step": 177388, "epoch": 4223} {"train_loss": -7.160671710968018, "global_step": 177389, "epoch": 4223} {"train_loss": -7.251067161560059, "global_step": 177390, "epoch": 4223} {"train_loss": -7.212930679321289, "global_step": 177391, "epoch": 4223} {"train_loss": -7.1701178550720215, "global_step": 177392, "epoch": 4223} {"train_loss": -7.25297737121582, "global_step": 177393, "epoch": 4223} {"train_loss": -7.104313850402832, "global_step": 177394, "epoch": 4223} {"train_loss": -7.075770854949951, "global_step": 177395, "epoch": 4223} {"train_loss": -7.063647270202637, "global_step": 177396, "epoch": 4223} {"train_loss": -7.154836654663086, "global_step": 177397, "epoch": 4223} {"train_loss": -7.059037208557129, "global_step": 177398, "epoch": 4223} {"train_loss": -7.037576675415039, "global_step": 177399, "epoch": 4223} {"train_loss": -7.061373710632324, "global_step": 177400, "epoch": 4223} {"train_loss": -7.141562461853027, "global_step": 177401, "epoch": 4223} {"train_loss": -7.051557540893555, "global_step": 177402, "epoch": 4223} {"train_loss": -6.941986083984375, "global_step": 177403, "epoch": 4223} {"train_loss": -7.042407035827637, "global_step": 177404, "epoch": 4223} {"train_loss": -7.151180267333984, "global_step": 177405, "epoch": 4223} {"train_loss": -6.940754413604736, "global_step": 177406, "epoch": 4223} {"train_loss": -7.1181039696648005, "global_step": 177407, "epoch": 4223, "val_loss": 80470.8125} {"train_loss": -7.022866249084473, "global_step": 177408, "epoch": 4224} {"train_loss": -7.09527587890625, "global_step": 177409, "epoch": 4224} {"train_loss": -7.090204238891602, "global_step": 177410, "epoch": 4224} {"train_loss": -7.006802082061768, "global_step": 177411, "epoch": 4224} {"train_loss": -7.055441856384277, "global_step": 177412, "epoch": 4224} {"train_loss": -7.0625200271606445, "global_step": 177413, "epoch": 4224} {"train_loss": -6.940862655639648, "global_step": 177414, "epoch": 4224} {"train_loss": -7.100224018096924, "global_step": 177415, "epoch": 4224} {"train_loss": -7.1570916175842285, "global_step": 177416, "epoch": 4224} {"train_loss": -7.168763637542725, "global_step": 177417, "epoch": 4224} {"train_loss": -7.035799026489258, "global_step": 177418, "epoch": 4224} {"train_loss": -7.1340837478637695, "global_step": 177419, "epoch": 4224} {"train_loss": -7.228417873382568, "global_step": 177420, "epoch": 4224} {"train_loss": -7.182256698608398, "global_step": 177421, "epoch": 4224} {"train_loss": -7.283361434936523, "global_step": 177422, "epoch": 4224} {"train_loss": -7.038516998291016, "global_step": 177423, "epoch": 4224} {"train_loss": -7.16103458404541, "global_step": 177424, "epoch": 4224} {"train_loss": -7.054987907409668, "global_step": 177425, "epoch": 4224} {"train_loss": -7.096861839294434, "global_step": 177426, "epoch": 4224} {"train_loss": -7.068403720855713, "global_step": 177427, "epoch": 4224} {"train_loss": -7.156279563903809, "global_step": 177428, "epoch": 4224} {"train_loss": -7.148279190063477, "global_step": 177429, "epoch": 4224} {"train_loss": -7.151740074157715, "global_step": 177430, "epoch": 4224} {"train_loss": -7.107600212097168, "global_step": 177431, "epoch": 4224} {"train_loss": -7.118109703063965, "global_step": 177432, "epoch": 4224} {"train_loss": -7.260799407958984, "global_step": 177433, "epoch": 4224} {"train_loss": -7.0696330070495605, "global_step": 177434, "epoch": 4224} {"train_loss": -6.965875625610352, "global_step": 177435, "epoch": 4224} {"train_loss": -7.116646766662598, "global_step": 177436, "epoch": 4224} {"train_loss": -7.06081485748291, "global_step": 177437, "epoch": 4224} {"train_loss": -7.128531455993652, "global_step": 177438, "epoch": 4224} {"train_loss": -7.178741455078125, "global_step": 177439, "epoch": 4224} {"train_loss": -7.022431373596191, "global_step": 177440, "epoch": 4224} {"train_loss": -6.9010772705078125, "global_step": 177441, "epoch": 4224} {"train_loss": -7.072328567504883, "global_step": 177442, "epoch": 4224} {"train_loss": -7.019946098327637, "global_step": 177443, "epoch": 4224} {"train_loss": -7.165909767150879, "global_step": 177444, "epoch": 4224} {"train_loss": -6.988961219787598, "global_step": 177445, "epoch": 4224} {"train_loss": -7.027896404266357, "global_step": 177446, "epoch": 4224} {"train_loss": -6.968329429626465, "global_step": 177447, "epoch": 4224} {"train_loss": -7.016842842102051, "global_step": 177448, "epoch": 4224} {"train_loss": -7.087121713729132, "global_step": 177449, "epoch": 4224, "val_loss": 80521.09375} {"train_loss": -7.009052276611328, "global_step": 177450, "epoch": 4225} {"train_loss": -7.12758207321167, "global_step": 177451, "epoch": 4225} {"train_loss": -7.220032691955566, "global_step": 177452, "epoch": 4225} {"train_loss": -7.089898109436035, "global_step": 177453, "epoch": 4225} {"train_loss": -7.111997604370117, "global_step": 177454, "epoch": 4225} {"train_loss": -7.051444053649902, "global_step": 177455, "epoch": 4225} {"train_loss": -6.99110221862793, "global_step": 177456, "epoch": 4225} {"train_loss": -7.072025299072266, "global_step": 177457, "epoch": 4225} {"train_loss": -7.150247097015381, "global_step": 177458, "epoch": 4225} {"train_loss": -7.118374347686768, "global_step": 177459, "epoch": 4225} {"train_loss": -7.083225727081299, "global_step": 177460, "epoch": 4225} {"train_loss": -7.082258701324463, "global_step": 177461, "epoch": 4225} {"train_loss": -7.188156604766846, "global_step": 177462, "epoch": 4225} {"train_loss": -7.1609907150268555, "global_step": 177463, "epoch": 4225} {"train_loss": -7.157519340515137, "global_step": 177464, "epoch": 4225} {"train_loss": -7.097108840942383, "global_step": 177465, "epoch": 4225} {"train_loss": -7.117901802062988, "global_step": 177466, "epoch": 4225} {"train_loss": -7.137049198150635, "global_step": 177467, "epoch": 4225} {"train_loss": -7.106024265289307, "global_step": 177468, "epoch": 4225} {"train_loss": -7.176494121551514, "global_step": 177469, "epoch": 4225} {"train_loss": -7.2401580810546875, "global_step": 177470, "epoch": 4225} {"train_loss": -7.16087007522583, "global_step": 177471, "epoch": 4225} {"train_loss": -7.210349082946777, "global_step": 177472, "epoch": 4225} {"train_loss": -7.061031818389893, "global_step": 177473, "epoch": 4225} {"train_loss": -7.029219627380371, "global_step": 177474, "epoch": 4225} {"train_loss": -7.196229934692383, "global_step": 177475, "epoch": 4225} {"train_loss": -7.1325273513793945, "global_step": 177476, "epoch": 4225} {"train_loss": -7.240396499633789, "global_step": 177477, "epoch": 4225} {"train_loss": -7.092860221862793, "global_step": 177478, "epoch": 4225} {"train_loss": -7.142417907714844, "global_step": 177479, "epoch": 4225} {"train_loss": -7.156970977783203, "global_step": 177480, "epoch": 4225} {"train_loss": -7.173566818237305, "global_step": 177481, "epoch": 4225} {"train_loss": -7.0511884689331055, "global_step": 177482, "epoch": 4225} {"train_loss": -7.153228282928467, "global_step": 177483, "epoch": 4225} {"train_loss": -7.090803146362305, "global_step": 177484, "epoch": 4225} {"train_loss": -7.111525058746338, "global_step": 177485, "epoch": 4225} {"train_loss": -7.221076011657715, "global_step": 177486, "epoch": 4225} {"train_loss": -6.988580226898193, "global_step": 177487, "epoch": 4225} {"train_loss": -7.1905198097229, "global_step": 177488, "epoch": 4225} {"train_loss": -7.076233386993408, "global_step": 177489, "epoch": 4225} {"train_loss": -7.186241149902344, "global_step": 177490, "epoch": 4225} {"train_loss": -7.125057197752453, "global_step": 177491, "epoch": 4225, "val_loss": 80377.734375} {"train_loss": -7.004748344421387, "global_step": 177492, "epoch": 4226} {"train_loss": -7.078632354736328, "global_step": 177493, "epoch": 4226} {"train_loss": -7.165027618408203, "global_step": 177494, "epoch": 4226} {"train_loss": -7.067363262176514, "global_step": 177495, "epoch": 4226} {"train_loss": -7.214885234832764, "global_step": 177496, "epoch": 4226} {"train_loss": -7.101465225219727, "global_step": 177497, "epoch": 4226} {"train_loss": -7.044579982757568, "global_step": 177498, "epoch": 4226} {"train_loss": -7.131413459777832, "global_step": 177499, "epoch": 4226} {"train_loss": -7.080092430114746, "global_step": 177500, "epoch": 4226} {"train_loss": -7.097318649291992, "global_step": 177501, "epoch": 4226} {"train_loss": -7.102688789367676, "global_step": 177502, "epoch": 4226} {"train_loss": -6.9910359382629395, "global_step": 177503, "epoch": 4226} {"train_loss": -7.147275924682617, "global_step": 177504, "epoch": 4226} {"train_loss": -7.04035758972168, "global_step": 177505, "epoch": 4226} {"train_loss": -7.06698751449585, "global_step": 177506, "epoch": 4226} {"train_loss": -7.0755815505981445, "global_step": 177507, "epoch": 4226} {"train_loss": -6.975985527038574, "global_step": 177508, "epoch": 4226} {"train_loss": -7.050488471984863, "global_step": 177509, "epoch": 4226} {"train_loss": -7.050093173980713, "global_step": 177510, "epoch": 4226} {"train_loss": -6.929891109466553, "global_step": 177511, "epoch": 4226} {"train_loss": -7.114128589630127, "global_step": 177512, "epoch": 4226} {"train_loss": -7.020029067993164, "global_step": 177513, "epoch": 4226} {"train_loss": -6.984560012817383, "global_step": 177514, "epoch": 4226} {"train_loss": -7.077875137329102, "global_step": 177515, "epoch": 4226} {"train_loss": -7.009465217590332, "global_step": 177516, "epoch": 4226} {"train_loss": -7.137552261352539, "global_step": 177517, "epoch": 4226} {"train_loss": -7.089804649353027, "global_step": 177518, "epoch": 4226} {"train_loss": -7.1852006912231445, "global_step": 177519, "epoch": 4226} {"train_loss": -7.02741003036499, "global_step": 177520, "epoch": 4226} {"train_loss": -7.059230804443359, "global_step": 177521, "epoch": 4226} {"train_loss": -7.076333999633789, "global_step": 177522, "epoch": 4226} {"train_loss": -7.17372989654541, "global_step": 177523, "epoch": 4226} {"train_loss": -7.010890007019043, "global_step": 177524, "epoch": 4226} {"train_loss": -7.161354064941406, "global_step": 177525, "epoch": 4226} {"train_loss": -7.034938812255859, "global_step": 177526, "epoch": 4226} {"train_loss": -7.084686279296875, "global_step": 177527, "epoch": 4226} {"train_loss": -7.190692901611328, "global_step": 177528, "epoch": 4226} {"train_loss": -7.076281547546387, "global_step": 177529, "epoch": 4226} {"train_loss": -7.089472770690918, "global_step": 177530, "epoch": 4226} {"train_loss": -7.046664237976074, "global_step": 177531, "epoch": 4226} {"train_loss": -7.13063907623291, "global_step": 177532, "epoch": 4226} {"train_loss": -7.076111975170317, "global_step": 177533, "epoch": 4226, "val_loss": 80275.6015625} {"train_loss": -6.816901206970215, "global_step": 177534, "epoch": 4227} {"train_loss": -7.073822975158691, "global_step": 177535, "epoch": 4227} {"train_loss": -6.996918678283691, "global_step": 177536, "epoch": 4227} {"train_loss": -7.009768009185791, "global_step": 177537, "epoch": 4227} {"train_loss": -7.055127143859863, "global_step": 177538, "epoch": 4227} {"train_loss": -6.899959564208984, "global_step": 177539, "epoch": 4227} {"train_loss": -7.050974369049072, "global_step": 177540, "epoch": 4227} {"train_loss": -6.733214378356934, "global_step": 177541, "epoch": 4227} {"train_loss": -7.102363586425781, "global_step": 177542, "epoch": 4227} {"train_loss": -6.900067329406738, "global_step": 177543, "epoch": 4227} {"train_loss": -6.952815055847168, "global_step": 177544, "epoch": 4227} {"train_loss": -6.919157028198242, "global_step": 177545, "epoch": 4227} {"train_loss": -7.022834777832031, "global_step": 177546, "epoch": 4227} {"train_loss": -7.015619277954102, "global_step": 177547, "epoch": 4227} {"train_loss": -7.068035125732422, "global_step": 177548, "epoch": 4227} {"train_loss": -6.592935085296631, "global_step": 177549, "epoch": 4227} {"train_loss": -7.01666784286499, "global_step": 177550, "epoch": 4227} {"train_loss": -6.710755825042725, "global_step": 177551, "epoch": 4227} {"train_loss": -6.969417572021484, "global_step": 177552, "epoch": 4227} {"train_loss": -6.993376731872559, "global_step": 177553, "epoch": 4227} {"train_loss": -6.8056721687316895, "global_step": 177554, "epoch": 4227} {"train_loss": -6.899734973907471, "global_step": 177555, "epoch": 4227} {"train_loss": -6.968348503112793, "global_step": 177556, "epoch": 4227} {"train_loss": -7.121233940124512, "global_step": 177557, "epoch": 4227} {"train_loss": -6.909612655639648, "global_step": 177558, "epoch": 4227} {"train_loss": -7.040922164916992, "global_step": 177559, "epoch": 4227} {"train_loss": -6.940222263336182, "global_step": 177560, "epoch": 4227} {"train_loss": -7.034202575683594, "global_step": 177561, "epoch": 4227} {"train_loss": -7.0751190185546875, "global_step": 177562, "epoch": 4227} {"train_loss": -7.123553276062012, "global_step": 177563, "epoch": 4227} {"train_loss": -7.044751167297363, "global_step": 177564, "epoch": 4227} {"train_loss": -7.125995635986328, "global_step": 177565, "epoch": 4227} {"train_loss": -7.082193374633789, "global_step": 177566, "epoch": 4227} {"train_loss": -7.173626899719238, "global_step": 177567, "epoch": 4227} {"train_loss": -7.1150431632995605, "global_step": 177568, "epoch": 4227} {"train_loss": -7.110433578491211, "global_step": 177569, "epoch": 4227} {"train_loss": -7.110185623168945, "global_step": 177570, "epoch": 4227} {"train_loss": -7.113397598266602, "global_step": 177571, "epoch": 4227} {"train_loss": -7.037041664123535, "global_step": 177572, "epoch": 4227} {"train_loss": -7.113162994384766, "global_step": 177573, "epoch": 4227} {"train_loss": -7.151186466217041, "global_step": 177574, "epoch": 4227} {"train_loss": -7.004625433967227, "global_step": 177575, "epoch": 4227, "val_loss": 80299.453125} {"train_loss": -7.195250511169434, "global_step": 177576, "epoch": 4228} {"train_loss": -7.214298248291016, "global_step": 177577, "epoch": 4228} {"train_loss": -7.152514457702637, "global_step": 177578, "epoch": 4228} {"train_loss": -7.152561187744141, "global_step": 177579, "epoch": 4228} {"train_loss": -7.167025089263916, "global_step": 177580, "epoch": 4228} {"train_loss": -7.063673973083496, "global_step": 177581, "epoch": 4228} {"train_loss": -7.165980339050293, "global_step": 177582, "epoch": 4228} {"train_loss": -7.147576808929443, "global_step": 177583, "epoch": 4228} {"train_loss": -7.120683193206787, "global_step": 177584, "epoch": 4228} {"train_loss": -7.050978660583496, "global_step": 177585, "epoch": 4228} {"train_loss": -7.211360931396484, "global_step": 177586, "epoch": 4228} {"train_loss": -7.250258922576904, "global_step": 177587, "epoch": 4228} {"train_loss": -6.902796745300293, "global_step": 177588, "epoch": 4228} {"train_loss": -7.089570999145508, "global_step": 177589, "epoch": 4228} {"train_loss": -7.179594993591309, "global_step": 177590, "epoch": 4228} {"train_loss": -7.043790817260742, "global_step": 177591, "epoch": 4228} {"train_loss": -6.963388442993164, "global_step": 177592, "epoch": 4228} {"train_loss": -7.165613174438477, "global_step": 177593, "epoch": 4228} {"train_loss": -7.174677848815918, "global_step": 177594, "epoch": 4228} {"train_loss": -7.212169647216797, "global_step": 177595, "epoch": 4228} {"train_loss": -7.128606796264648, "global_step": 177596, "epoch": 4228} {"train_loss": -7.189533233642578, "global_step": 177597, "epoch": 4228} {"train_loss": -7.141800880432129, "global_step": 177598, "epoch": 4228} {"train_loss": -7.1737847328186035, "global_step": 177599, "epoch": 4228} {"train_loss": -7.282217979431152, "global_step": 177600, "epoch": 4228} {"train_loss": -7.181999206542969, "global_step": 177601, "epoch": 4228} {"train_loss": -7.225133419036865, "global_step": 177602, "epoch": 4228} {"train_loss": -7.25697135925293, "global_step": 177603, "epoch": 4228} {"train_loss": -7.150667667388916, "global_step": 177604, "epoch": 4228} {"train_loss": -7.120932579040527, "global_step": 177605, "epoch": 4228} {"train_loss": -7.07170295715332, "global_step": 177606, "epoch": 4228} {"train_loss": -7.2110419273376465, "global_step": 177607, "epoch": 4228} {"train_loss": -7.247401237487793, "global_step": 177608, "epoch": 4228} {"train_loss": -7.141801357269287, "global_step": 177609, "epoch": 4228} {"train_loss": -7.111645698547363, "global_step": 177610, "epoch": 4228} {"train_loss": -7.157865524291992, "global_step": 177611, "epoch": 4228} {"train_loss": -7.121427536010742, "global_step": 177612, "epoch": 4228} {"train_loss": -7.255552291870117, "global_step": 177613, "epoch": 4228} {"train_loss": -7.198253631591797, "global_step": 177614, "epoch": 4228} {"train_loss": -7.2312164306640625, "global_step": 177615, "epoch": 4228} {"train_loss": -7.223712921142578, "global_step": 177616, "epoch": 4228} {"train_loss": -7.1569813546680265, "global_step": 177617, "epoch": 4228, "val_loss": 80264.9921875} {"train_loss": -7.233414649963379, "global_step": 177618, "epoch": 4229} {"train_loss": -7.145247459411621, "global_step": 177619, "epoch": 4229} {"train_loss": -7.208460807800293, "global_step": 177620, "epoch": 4229} {"train_loss": -7.182765007019043, "global_step": 177621, "epoch": 4229} {"train_loss": -7.248236656188965, "global_step": 177622, "epoch": 4229} {"train_loss": -7.19733190536499, "global_step": 177623, "epoch": 4229} {"train_loss": -7.153543472290039, "global_step": 177624, "epoch": 4229} {"train_loss": -7.37345027923584, "global_step": 177625, "epoch": 4229} {"train_loss": -7.22850227355957, "global_step": 177626, "epoch": 4229} {"train_loss": -7.172062873840332, "global_step": 177627, "epoch": 4229} {"train_loss": -7.066608905792236, "global_step": 177628, "epoch": 4229} {"train_loss": -7.016911506652832, "global_step": 177629, "epoch": 4229} {"train_loss": -7.138730049133301, "global_step": 177630, "epoch": 4229} {"train_loss": -7.079809665679932, "global_step": 177631, "epoch": 4229} {"train_loss": -7.156987190246582, "global_step": 177632, "epoch": 4229} {"train_loss": -7.0048980712890625, "global_step": 177633, "epoch": 4229} {"train_loss": -7.200962543487549, "global_step": 177634, "epoch": 4229} {"train_loss": -6.992859840393066, "global_step": 177635, "epoch": 4229} {"train_loss": -7.096353530883789, "global_step": 177636, "epoch": 4229} {"train_loss": -7.117948532104492, "global_step": 177637, "epoch": 4229} {"train_loss": -7.042612075805664, "global_step": 177638, "epoch": 4229} {"train_loss": -7.185163974761963, "global_step": 177639, "epoch": 4229} {"train_loss": -7.089950084686279, "global_step": 177640, "epoch": 4229} {"train_loss": -7.06751823425293, "global_step": 177641, "epoch": 4229} {"train_loss": -7.083395004272461, "global_step": 177642, "epoch": 4229} {"train_loss": -7.047760963439941, "global_step": 177643, "epoch": 4229} {"train_loss": -7.063276290893555, "global_step": 177644, "epoch": 4229} {"train_loss": -7.113781929016113, "global_step": 177645, "epoch": 4229} {"train_loss": -6.969046592712402, "global_step": 177646, "epoch": 4229} {"train_loss": -6.978880882263184, "global_step": 177647, "epoch": 4229} {"train_loss": -7.119716644287109, "global_step": 177648, "epoch": 4229} {"train_loss": -7.062382698059082, "global_step": 177649, "epoch": 4229} {"train_loss": -7.100589752197266, "global_step": 177650, "epoch": 4229} {"train_loss": -7.029585361480713, "global_step": 177651, "epoch": 4229} {"train_loss": -7.102812767028809, "global_step": 177652, "epoch": 4229} {"train_loss": -7.009538650512695, "global_step": 177653, "epoch": 4229} {"train_loss": -6.974215030670166, "global_step": 177654, "epoch": 4229} {"train_loss": -7.025871276855469, "global_step": 177655, "epoch": 4229} {"train_loss": -7.128978729248047, "global_step": 177656, "epoch": 4229} {"train_loss": -7.024517059326172, "global_step": 177657, "epoch": 4229} {"train_loss": -7.1066179275512695, "global_step": 177658, "epoch": 4229} {"train_loss": -7.105230899084182, "global_step": 177659, "epoch": 4229, "val_loss": 80255.53125} {"train_loss": -7.057961940765381, "global_step": 177660, "epoch": 4230} {"train_loss": -7.171177864074707, "global_step": 177661, "epoch": 4230} {"train_loss": -7.050769805908203, "global_step": 177662, "epoch": 4230} {"train_loss": -7.077296257019043, "global_step": 177663, "epoch": 4230} {"train_loss": -7.192523002624512, "global_step": 177664, "epoch": 4230} {"train_loss": -7.197772026062012, "global_step": 177665, "epoch": 4230} {"train_loss": -7.100586891174316, "global_step": 177666, "epoch": 4230} {"train_loss": -7.096687316894531, "global_step": 177667, "epoch": 4230} {"train_loss": -7.134515285491943, "global_step": 177668, "epoch": 4230} {"train_loss": -7.141069412231445, "global_step": 177669, "epoch": 4230} {"train_loss": -7.119139671325684, "global_step": 177670, "epoch": 4230} {"train_loss": -7.008474826812744, "global_step": 177671, "epoch": 4230} {"train_loss": -7.175671100616455, "global_step": 177672, "epoch": 4230} {"train_loss": -7.135608196258545, "global_step": 177673, "epoch": 4230} {"train_loss": -7.013389587402344, "global_step": 177674, "epoch": 4230} {"train_loss": -7.110015869140625, "global_step": 177675, "epoch": 4230} {"train_loss": -7.092270374298096, "global_step": 177676, "epoch": 4230} {"train_loss": -6.938727378845215, "global_step": 177677, "epoch": 4230} {"train_loss": -7.049314498901367, "global_step": 177678, "epoch": 4230} {"train_loss": -6.93798828125, "global_step": 177679, "epoch": 4230} {"train_loss": -7.014492988586426, "global_step": 177680, "epoch": 4230} {"train_loss": -7.064391136169434, "global_step": 177681, "epoch": 4230} {"train_loss": -7.1774749755859375, "global_step": 177682, "epoch": 4230} {"train_loss": -7.116959571838379, "global_step": 177683, "epoch": 4230} {"train_loss": -6.986027717590332, "global_step": 177684, "epoch": 4230} {"train_loss": -6.940530776977539, "global_step": 177685, "epoch": 4230} {"train_loss": -7.008296012878418, "global_step": 177686, "epoch": 4230} {"train_loss": -6.979580402374268, "global_step": 177687, "epoch": 4230} {"train_loss": -6.828268051147461, "global_step": 177688, "epoch": 4230} {"train_loss": -7.073572158813477, "global_step": 177689, "epoch": 4230} {"train_loss": -7.0352091789245605, "global_step": 177690, "epoch": 4230} {"train_loss": -7.000729084014893, "global_step": 177691, "epoch": 4230} {"train_loss": -7.020695209503174, "global_step": 177692, "epoch": 4230} {"train_loss": -6.9875593185424805, "global_step": 177693, "epoch": 4230} {"train_loss": -7.079896926879883, "global_step": 177694, "epoch": 4230} {"train_loss": -7.044103622436523, "global_step": 177695, "epoch": 4230} {"train_loss": -7.203681468963623, "global_step": 177696, "epoch": 4230} {"train_loss": -7.058964729309082, "global_step": 177697, "epoch": 4230} {"train_loss": -7.15467643737793, "global_step": 177698, "epoch": 4230} {"train_loss": -6.925010681152344, "global_step": 177699, "epoch": 4230} {"train_loss": -7.002584457397461, "global_step": 177700, "epoch": 4230} {"train_loss": -7.061657485507784, "global_step": 177701, "epoch": 4230, "val_loss": 80595.015625} {"train_loss": -7.0576066970825195, "global_step": 177702, "epoch": 4231} {"train_loss": -7.106285095214844, "global_step": 177703, "epoch": 4231} {"train_loss": -7.057928085327148, "global_step": 177704, "epoch": 4231} {"train_loss": -7.033239364624023, "global_step": 177705, "epoch": 4231} {"train_loss": -7.094211578369141, "global_step": 177706, "epoch": 4231} {"train_loss": -6.943700790405273, "global_step": 177707, "epoch": 4231} {"train_loss": -7.083804607391357, "global_step": 177708, "epoch": 4231} {"train_loss": -7.102380752563477, "global_step": 177709, "epoch": 4231} {"train_loss": -6.967606544494629, "global_step": 177710, "epoch": 4231} {"train_loss": -7.010452747344971, "global_step": 177711, "epoch": 4231} {"train_loss": -6.9764299392700195, "global_step": 177712, "epoch": 4231} {"train_loss": -7.038122653961182, "global_step": 177713, "epoch": 4231} {"train_loss": -7.099097728729248, "global_step": 177714, "epoch": 4231} {"train_loss": -6.950714111328125, "global_step": 177715, "epoch": 4231} {"train_loss": -7.158718109130859, "global_step": 177716, "epoch": 4231} {"train_loss": -7.083416938781738, "global_step": 177717, "epoch": 4231} {"train_loss": -7.020695686340332, "global_step": 177718, "epoch": 4231} {"train_loss": -7.113298416137695, "global_step": 177719, "epoch": 4231} {"train_loss": -7.241324424743652, "global_step": 177720, "epoch": 4231} {"train_loss": -7.132165908813477, "global_step": 177721, "epoch": 4231} {"train_loss": -7.014359951019287, "global_step": 177722, "epoch": 4231} {"train_loss": -7.1152448654174805, "global_step": 177723, "epoch": 4231} {"train_loss": -7.141252040863037, "global_step": 177724, "epoch": 4231} {"train_loss": -7.06981086730957, "global_step": 177725, "epoch": 4231} {"train_loss": -7.037162780761719, "global_step": 177726, "epoch": 4231} {"train_loss": -7.028443813323975, "global_step": 177727, "epoch": 4231} {"train_loss": -7.126748085021973, "global_step": 177728, "epoch": 4231} {"train_loss": -6.923943996429443, "global_step": 177729, "epoch": 4231} {"train_loss": -7.057575702667236, "global_step": 177730, "epoch": 4231} {"train_loss": -7.052666187286377, "global_step": 177731, "epoch": 4231} {"train_loss": -6.920205116271973, "global_step": 177732, "epoch": 4231} {"train_loss": -7.162961483001709, "global_step": 177733, "epoch": 4231} {"train_loss": -6.8464555740356445, "global_step": 177734, "epoch": 4231} {"train_loss": -7.12650203704834, "global_step": 177735, "epoch": 4231} {"train_loss": -7.079279899597168, "global_step": 177736, "epoch": 4231} {"train_loss": -6.967332363128662, "global_step": 177737, "epoch": 4231} {"train_loss": -7.1446990966796875, "global_step": 177738, "epoch": 4231} {"train_loss": -6.886086940765381, "global_step": 177739, "epoch": 4231} {"train_loss": -7.133423328399658, "global_step": 177740, "epoch": 4231} {"train_loss": -6.938081741333008, "global_step": 177741, "epoch": 4231} {"train_loss": -6.953202247619629, "global_step": 177742, "epoch": 4231} {"train_loss": -7.044051601773217, "global_step": 177743, "epoch": 4231, "val_loss": 80238.3125} {"train_loss": -7.174261093139648, "global_step": 177744, "epoch": 4232} {"train_loss": -6.952640056610107, "global_step": 177745, "epoch": 4232} {"train_loss": -7.012326240539551, "global_step": 177746, "epoch": 4232} {"train_loss": -7.043420791625977, "global_step": 177747, "epoch": 4232} {"train_loss": -6.95372200012207, "global_step": 177748, "epoch": 4232} {"train_loss": -6.958184719085693, "global_step": 177749, "epoch": 4232} {"train_loss": -7.029092788696289, "global_step": 177750, "epoch": 4232} {"train_loss": -6.850975036621094, "global_step": 177751, "epoch": 4232} {"train_loss": -7.085999488830566, "global_step": 177752, "epoch": 4232} {"train_loss": -7.0352582931518555, "global_step": 177753, "epoch": 4232} {"train_loss": -7.121362209320068, "global_step": 177754, "epoch": 4232} {"train_loss": -7.099541187286377, "global_step": 177755, "epoch": 4232} {"train_loss": -7.085073471069336, "global_step": 177756, "epoch": 4232} {"train_loss": -7.11445426940918, "global_step": 177757, "epoch": 4232} {"train_loss": -7.051001071929932, "global_step": 177758, "epoch": 4232} {"train_loss": -7.000814437866211, "global_step": 177759, "epoch": 4232} {"train_loss": -6.906425476074219, "global_step": 177760, "epoch": 4232} {"train_loss": -7.112292289733887, "global_step": 177761, "epoch": 4232} {"train_loss": -7.004058837890625, "global_step": 177762, "epoch": 4232} {"train_loss": -7.088123321533203, "global_step": 177763, "epoch": 4232} {"train_loss": -7.009888648986816, "global_step": 177764, "epoch": 4232} {"train_loss": -7.153629302978516, "global_step": 177765, "epoch": 4232} {"train_loss": -7.002450466156006, "global_step": 177766, "epoch": 4232} {"train_loss": -7.030214309692383, "global_step": 177767, "epoch": 4232} {"train_loss": -7.0861101150512695, "global_step": 177768, "epoch": 4232} {"train_loss": -7.23000431060791, "global_step": 177769, "epoch": 4232} {"train_loss": -7.074715614318848, "global_step": 177770, "epoch": 4232} {"train_loss": -7.0362982749938965, "global_step": 177771, "epoch": 4232} {"train_loss": -7.066136360168457, "global_step": 177772, "epoch": 4232} {"train_loss": -7.190985202789307, "global_step": 177773, "epoch": 4232} {"train_loss": -7.125060558319092, "global_step": 177774, "epoch": 4232} {"train_loss": -7.249963760375977, "global_step": 177775, "epoch": 4232} {"train_loss": -7.205117225646973, "global_step": 177776, "epoch": 4232} {"train_loss": -7.14202880859375, "global_step": 177777, "epoch": 4232} {"train_loss": -7.1163530349731445, "global_step": 177778, "epoch": 4232} {"train_loss": -7.242886543273926, "global_step": 177779, "epoch": 4232} {"train_loss": -7.267271041870117, "global_step": 177780, "epoch": 4232} {"train_loss": -7.217881679534912, "global_step": 177781, "epoch": 4232} {"train_loss": -7.283134460449219, "global_step": 177782, "epoch": 4232} {"train_loss": -7.145753383636475, "global_step": 177783, "epoch": 4232} {"train_loss": -7.131845951080322, "global_step": 177784, "epoch": 4232} {"train_loss": -7.090159700030372, "global_step": 177785, "epoch": 4232, "val_loss": 80225.4921875} {"train_loss": -7.119564056396484, "global_step": 177786, "epoch": 4233} {"train_loss": -7.1549530029296875, "global_step": 177787, "epoch": 4233} {"train_loss": -7.206277847290039, "global_step": 177788, "epoch": 4233} {"train_loss": -7.268424034118652, "global_step": 177789, "epoch": 4233} {"train_loss": -7.1457085609436035, "global_step": 177790, "epoch": 4233} {"train_loss": -7.252368450164795, "global_step": 177791, "epoch": 4233} {"train_loss": -7.281503677368164, "global_step": 177792, "epoch": 4233} {"train_loss": -7.22659969329834, "global_step": 177793, "epoch": 4233} {"train_loss": -7.11213493347168, "global_step": 177794, "epoch": 4233} {"train_loss": -7.096467018127441, "global_step": 177795, "epoch": 4233} {"train_loss": -7.181180000305176, "global_step": 177796, "epoch": 4233} {"train_loss": -6.925053119659424, "global_step": 177797, "epoch": 4233} {"train_loss": -7.159276962280273, "global_step": 177798, "epoch": 4233} {"train_loss": -7.108619689941406, "global_step": 177799, "epoch": 4233} {"train_loss": -7.049140930175781, "global_step": 177800, "epoch": 4233} {"train_loss": -7.1215949058532715, "global_step": 177801, "epoch": 4233} {"train_loss": -7.050549030303955, "global_step": 177802, "epoch": 4233} {"train_loss": -7.05380916595459, "global_step": 177803, "epoch": 4233} {"train_loss": -7.097219944000244, "global_step": 177804, "epoch": 4233} {"train_loss": -7.114978790283203, "global_step": 177805, "epoch": 4233} {"train_loss": -7.173288822174072, "global_step": 177806, "epoch": 4233} {"train_loss": -6.959198951721191, "global_step": 177807, "epoch": 4233} {"train_loss": -7.050290107727051, "global_step": 177808, "epoch": 4233} {"train_loss": -7.198426246643066, "global_step": 177809, "epoch": 4233} {"train_loss": -7.181360244750977, "global_step": 177810, "epoch": 4233} {"train_loss": -7.172492504119873, "global_step": 177811, "epoch": 4233} {"train_loss": -7.133030891418457, "global_step": 177812, "epoch": 4233} {"train_loss": -7.1658782958984375, "global_step": 177813, "epoch": 4233} {"train_loss": -7.114450931549072, "global_step": 177814, "epoch": 4233} {"train_loss": -7.1512956619262695, "global_step": 177815, "epoch": 4233} {"train_loss": -7.142047882080078, "global_step": 177816, "epoch": 4233} {"train_loss": -7.197549819946289, "global_step": 177817, "epoch": 4233} {"train_loss": -7.197575569152832, "global_step": 177818, "epoch": 4233} {"train_loss": -7.222555160522461, "global_step": 177819, "epoch": 4233} {"train_loss": -7.182418346405029, "global_step": 177820, "epoch": 4233} {"train_loss": -7.1565752029418945, "global_step": 177821, "epoch": 4233} {"train_loss": -7.150161266326904, "global_step": 177822, "epoch": 4233} {"train_loss": -7.220380783081055, "global_step": 177823, "epoch": 4233} {"train_loss": -7.2666473388671875, "global_step": 177824, "epoch": 4233} {"train_loss": -7.14293098449707, "global_step": 177825, "epoch": 4233} {"train_loss": -7.135167598724365, "global_step": 177826, "epoch": 4233} {"train_loss": -7.147140934353783, "global_step": 177827, "epoch": 4233, "val_loss": 80042.6640625} {"train_loss": -7.018986225128174, "global_step": 177828, "epoch": 4234} {"train_loss": -7.014951705932617, "global_step": 177829, "epoch": 4234} {"train_loss": -6.986353397369385, "global_step": 177830, "epoch": 4234} {"train_loss": -7.072394371032715, "global_step": 177831, "epoch": 4234} {"train_loss": -7.108859539031982, "global_step": 177832, "epoch": 4234} {"train_loss": -6.948044300079346, "global_step": 177833, "epoch": 4234} {"train_loss": -6.936931133270264, "global_step": 177834, "epoch": 4234} {"train_loss": -7.151897430419922, "global_step": 177835, "epoch": 4234} {"train_loss": -6.9236674308776855, "global_step": 177836, "epoch": 4234} {"train_loss": -7.149163246154785, "global_step": 177837, "epoch": 4234} {"train_loss": -7.087391376495361, "global_step": 177838, "epoch": 4234} {"train_loss": -7.021844863891602, "global_step": 177839, "epoch": 4234} {"train_loss": -7.130077362060547, "global_step": 177840, "epoch": 4234} {"train_loss": -6.957606315612793, "global_step": 177841, "epoch": 4234} {"train_loss": -7.001762390136719, "global_step": 177842, "epoch": 4234} {"train_loss": -6.988071918487549, "global_step": 177843, "epoch": 4234} {"train_loss": -7.083706378936768, "global_step": 177844, "epoch": 4234} {"train_loss": -6.963710308074951, "global_step": 177845, "epoch": 4234} {"train_loss": -7.054823398590088, "global_step": 177846, "epoch": 4234} {"train_loss": -7.023595809936523, "global_step": 177847, "epoch": 4234} {"train_loss": -7.069779396057129, "global_step": 177848, "epoch": 4234} {"train_loss": -7.068195343017578, "global_step": 177849, "epoch": 4234} {"train_loss": -7.069394588470459, "global_step": 177850, "epoch": 4234} {"train_loss": -6.994951248168945, "global_step": 177851, "epoch": 4234} {"train_loss": -7.1167073249816895, "global_step": 177852, "epoch": 4234} {"train_loss": -7.155247211456299, "global_step": 177853, "epoch": 4234} {"train_loss": -7.138208866119385, "global_step": 177854, "epoch": 4234} {"train_loss": -7.0747599601745605, "global_step": 177855, "epoch": 4234} {"train_loss": -7.092470645904541, "global_step": 177856, "epoch": 4234} {"train_loss": -7.080325126647949, "global_step": 177857, "epoch": 4234} {"train_loss": -7.222146511077881, "global_step": 177858, "epoch": 4234} {"train_loss": -7.092767238616943, "global_step": 177859, "epoch": 4234} {"train_loss": -7.17854642868042, "global_step": 177860, "epoch": 4234} {"train_loss": -7.12101936340332, "global_step": 177861, "epoch": 4234} {"train_loss": -7.208055019378662, "global_step": 177862, "epoch": 4234} {"train_loss": -7.242513656616211, "global_step": 177863, "epoch": 4234} {"train_loss": -7.083632469177246, "global_step": 177864, "epoch": 4234} {"train_loss": -7.1683030128479, "global_step": 177865, "epoch": 4234} {"train_loss": -7.103584289550781, "global_step": 177866, "epoch": 4234} {"train_loss": -7.197946548461914, "global_step": 177867, "epoch": 4234} {"train_loss": -6.999641418457031, "global_step": 177868, "epoch": 4234} {"train_loss": -7.0768317722138905, "global_step": 177869, "epoch": 4234, "val_loss": 80186.53125} {"train_loss": -7.076590061187744, "global_step": 177870, "epoch": 4235} {"train_loss": -7.210386753082275, "global_step": 177871, "epoch": 4235} {"train_loss": -7.136234283447266, "global_step": 177872, "epoch": 4235} {"train_loss": -7.178933620452881, "global_step": 177873, "epoch": 4235} {"train_loss": -7.060091018676758, "global_step": 177874, "epoch": 4235} {"train_loss": -7.190459251403809, "global_step": 177875, "epoch": 4235} {"train_loss": -7.217670440673828, "global_step": 177876, "epoch": 4235} {"train_loss": -7.198214530944824, "global_step": 177877, "epoch": 4235} {"train_loss": -7.047765731811523, "global_step": 177878, "epoch": 4235} {"train_loss": -7.1144609451293945, "global_step": 177879, "epoch": 4235} {"train_loss": -7.204282760620117, "global_step": 177880, "epoch": 4235} {"train_loss": -7.2664289474487305, "global_step": 177881, "epoch": 4235} {"train_loss": -7.230649948120117, "global_step": 177882, "epoch": 4235} {"train_loss": -7.169794082641602, "global_step": 177883, "epoch": 4235} {"train_loss": -7.251620292663574, "global_step": 177884, "epoch": 4235} {"train_loss": -7.200080871582031, "global_step": 177885, "epoch": 4235} {"train_loss": -7.204914093017578, "global_step": 177886, "epoch": 4235} {"train_loss": -7.110445022583008, "global_step": 177887, "epoch": 4235} {"train_loss": -7.139642238616943, "global_step": 177888, "epoch": 4235} {"train_loss": -7.084507465362549, "global_step": 177889, "epoch": 4235} {"train_loss": -7.074326515197754, "global_step": 177890, "epoch": 4235} {"train_loss": -7.067449569702148, "global_step": 177891, "epoch": 4235} {"train_loss": -7.1302618980407715, "global_step": 177892, "epoch": 4235} {"train_loss": -7.1291093826293945, "global_step": 177893, "epoch": 4235} {"train_loss": -7.173093795776367, "global_step": 177894, "epoch": 4235} {"train_loss": -7.071332931518555, "global_step": 177895, "epoch": 4235} {"train_loss": -7.112499237060547, "global_step": 177896, "epoch": 4235} {"train_loss": -6.951615333557129, "global_step": 177897, "epoch": 4235} {"train_loss": -7.137248992919922, "global_step": 177898, "epoch": 4235} {"train_loss": -7.039511203765869, "global_step": 177899, "epoch": 4235} {"train_loss": -7.111510276794434, "global_step": 177900, "epoch": 4235} {"train_loss": -7.027362823486328, "global_step": 177901, "epoch": 4235} {"train_loss": -7.079800605773926, "global_step": 177902, "epoch": 4235} {"train_loss": -7.185815811157227, "global_step": 177903, "epoch": 4235} {"train_loss": -7.0339155197143555, "global_step": 177904, "epoch": 4235} {"train_loss": -7.083157062530518, "global_step": 177905, "epoch": 4235} {"train_loss": -7.155678749084473, "global_step": 177906, "epoch": 4235} {"train_loss": -7.083099842071533, "global_step": 177907, "epoch": 4235} {"train_loss": -7.19987154006958, "global_step": 177908, "epoch": 4235} {"train_loss": -7.016262054443359, "global_step": 177909, "epoch": 4235} {"train_loss": -6.991842269897461, "global_step": 177910, "epoch": 4235} {"train_loss": -7.12535235995338, "global_step": 177911, "epoch": 4235, "val_loss": 80318.109375} {"train_loss": -7.085794448852539, "global_step": 177912, "epoch": 4236} {"train_loss": -7.091546058654785, "global_step": 177913, "epoch": 4236} {"train_loss": -6.983002662658691, "global_step": 177914, "epoch": 4236} {"train_loss": -7.176409721374512, "global_step": 177915, "epoch": 4236} {"train_loss": -7.087583065032959, "global_step": 177916, "epoch": 4236} {"train_loss": -6.920953750610352, "global_step": 177917, "epoch": 4236} {"train_loss": -7.127182960510254, "global_step": 177918, "epoch": 4236} {"train_loss": -6.977085590362549, "global_step": 177919, "epoch": 4236} {"train_loss": -7.110736846923828, "global_step": 177920, "epoch": 4236} {"train_loss": -7.125247001647949, "global_step": 177921, "epoch": 4236} {"train_loss": -6.994839668273926, "global_step": 177922, "epoch": 4236} {"train_loss": -7.199649810791016, "global_step": 177923, "epoch": 4236} {"train_loss": -7.15410041809082, "global_step": 177924, "epoch": 4236} {"train_loss": -7.044000625610352, "global_step": 177925, "epoch": 4236} {"train_loss": -7.173996925354004, "global_step": 177926, "epoch": 4236} {"train_loss": -7.133150100708008, "global_step": 177927, "epoch": 4236} {"train_loss": -7.099903583526611, "global_step": 177928, "epoch": 4236} {"train_loss": -7.205711364746094, "global_step": 177929, "epoch": 4236} {"train_loss": -7.073137283325195, "global_step": 177930, "epoch": 4236} {"train_loss": -7.077156066894531, "global_step": 177931, "epoch": 4236} {"train_loss": -7.111008644104004, "global_step": 177932, "epoch": 4236} {"train_loss": -7.054560661315918, "global_step": 177933, "epoch": 4236} {"train_loss": -7.066238880157471, "global_step": 177934, "epoch": 4236} {"train_loss": -6.8967132568359375, "global_step": 177935, "epoch": 4236} {"train_loss": -7.092013359069824, "global_step": 177936, "epoch": 4236} {"train_loss": -7.103201866149902, "global_step": 177937, "epoch": 4236} {"train_loss": -7.047718524932861, "global_step": 177938, "epoch": 4236} {"train_loss": -7.092104434967041, "global_step": 177939, "epoch": 4236} {"train_loss": -6.993160247802734, "global_step": 177940, "epoch": 4236} {"train_loss": -7.150482177734375, "global_step": 177941, "epoch": 4236} {"train_loss": -7.061523914337158, "global_step": 177942, "epoch": 4236} {"train_loss": -7.111877918243408, "global_step": 177943, "epoch": 4236} {"train_loss": -7.0572404861450195, "global_step": 177944, "epoch": 4236} {"train_loss": -7.072464942932129, "global_step": 177945, "epoch": 4236} {"train_loss": -7.134740829467773, "global_step": 177946, "epoch": 4236} {"train_loss": -7.159173965454102, "global_step": 177947, "epoch": 4236} {"train_loss": -7.096199035644531, "global_step": 177948, "epoch": 4236} {"train_loss": -7.073838233947754, "global_step": 177949, "epoch": 4236} {"train_loss": -7.023674011230469, "global_step": 177950, "epoch": 4236} {"train_loss": -7.0752058029174805, "global_step": 177951, "epoch": 4236} {"train_loss": -7.223532676696777, "global_step": 177952, "epoch": 4236} {"train_loss": -7.08590274765378, "global_step": 177953, "epoch": 4236, "val_loss": 80172.4609375} {"train_loss": -7.25695276260376, "global_step": 177954, "epoch": 4237} {"train_loss": -7.099122047424316, "global_step": 177955, "epoch": 4237} {"train_loss": -7.195391654968262, "global_step": 177956, "epoch": 4237} {"train_loss": -7.127955436706543, "global_step": 177957, "epoch": 4237} {"train_loss": -7.19511079788208, "global_step": 177958, "epoch": 4237} {"train_loss": -7.123438835144043, "global_step": 177959, "epoch": 4237} {"train_loss": -6.940110206604004, "global_step": 177960, "epoch": 4237} {"train_loss": -7.153988838195801, "global_step": 177961, "epoch": 4237} {"train_loss": -7.190779685974121, "global_step": 177962, "epoch": 4237} {"train_loss": -7.007604598999023, "global_step": 177963, "epoch": 4237} {"train_loss": -6.985201358795166, "global_step": 177964, "epoch": 4237} {"train_loss": -7.115330696105957, "global_step": 177965, "epoch": 4237} {"train_loss": -7.040384769439697, "global_step": 177966, "epoch": 4237} {"train_loss": -7.198879241943359, "global_step": 177967, "epoch": 4237} {"train_loss": -7.08644962310791, "global_step": 177968, "epoch": 4237} {"train_loss": -7.158904075622559, "global_step": 177969, "epoch": 4237} {"train_loss": -7.302044868469238, "global_step": 177970, "epoch": 4237} {"train_loss": -7.100231170654297, "global_step": 177971, "epoch": 4237} {"train_loss": -7.107272624969482, "global_step": 177972, "epoch": 4237} {"train_loss": -7.065082550048828, "global_step": 177973, "epoch": 4237} {"train_loss": -7.1776275634765625, "global_step": 177974, "epoch": 4237} {"train_loss": -7.1574506759643555, "global_step": 177975, "epoch": 4237} {"train_loss": -7.18234920501709, "global_step": 177976, "epoch": 4237} {"train_loss": -7.172786712646484, "global_step": 177977, "epoch": 4237} {"train_loss": -7.07203483581543, "global_step": 177978, "epoch": 4237} {"train_loss": -7.24757194519043, "global_step": 177979, "epoch": 4237} {"train_loss": -7.072304725646973, "global_step": 177980, "epoch": 4237} {"train_loss": -7.157725811004639, "global_step": 177981, "epoch": 4237} {"train_loss": -7.162069320678711, "global_step": 177982, "epoch": 4237} {"train_loss": -7.205306053161621, "global_step": 177983, "epoch": 4237} {"train_loss": -7.3234758377075195, "global_step": 177984, "epoch": 4237} {"train_loss": -7.236183166503906, "global_step": 177985, "epoch": 4237} {"train_loss": -7.219392776489258, "global_step": 177986, "epoch": 4237} {"train_loss": -7.16526985168457, "global_step": 177987, "epoch": 4237} {"train_loss": -7.211600303649902, "global_step": 177988, "epoch": 4237} {"train_loss": -7.194300651550293, "global_step": 177989, "epoch": 4237} {"train_loss": -7.089428424835205, "global_step": 177990, "epoch": 4237} {"train_loss": -7.168346405029297, "global_step": 177991, "epoch": 4237} {"train_loss": -7.202568531036377, "global_step": 177992, "epoch": 4237} {"train_loss": -7.149641036987305, "global_step": 177993, "epoch": 4237} {"train_loss": -7.072696685791016, "global_step": 177994, "epoch": 4237} {"train_loss": -7.149433476584298, "global_step": 177995, "epoch": 4237, "val_loss": 80379.21875} {"train_loss": -7.128005504608154, "global_step": 177996, "epoch": 4238} {"train_loss": -7.028463840484619, "global_step": 177997, "epoch": 4238} {"train_loss": -7.023859024047852, "global_step": 177998, "epoch": 4238} {"train_loss": -7.2166643142700195, "global_step": 177999, "epoch": 4238} {"train_loss": -7.1231889724731445, "global_step": 178000, "epoch": 4238} {"train_loss": -6.939887046813965, "global_step": 178001, "epoch": 4238} {"train_loss": -7.0145487785339355, "global_step": 178002, "epoch": 4238} {"train_loss": -7.145221710205078, "global_step": 178003, "epoch": 4238} {"train_loss": -7.06361198425293, "global_step": 178004, "epoch": 4238} {"train_loss": -7.017270565032959, "global_step": 178005, "epoch": 4238} {"train_loss": -7.146452903747559, "global_step": 178006, "epoch": 4238} {"train_loss": -6.954843044281006, "global_step": 178007, "epoch": 4238} {"train_loss": -7.114399433135986, "global_step": 178008, "epoch": 4238} {"train_loss": -7.19551944732666, "global_step": 178009, "epoch": 4238} {"train_loss": -7.058196544647217, "global_step": 178010, "epoch": 4238} {"train_loss": -7.141872406005859, "global_step": 178011, "epoch": 4238} {"train_loss": -7.208595275878906, "global_step": 178012, "epoch": 4238} {"train_loss": -7.063014507293701, "global_step": 178013, "epoch": 4238} {"train_loss": -7.171781539916992, "global_step": 178014, "epoch": 4238} {"train_loss": -7.17750883102417, "global_step": 178015, "epoch": 4238} {"train_loss": -7.163912296295166, "global_step": 178016, "epoch": 4238} {"train_loss": -7.010784149169922, "global_step": 178017, "epoch": 4238} {"train_loss": -7.035917282104492, "global_step": 178018, "epoch": 4238} {"train_loss": -7.066778182983398, "global_step": 178019, "epoch": 4238} {"train_loss": -7.0980682373046875, "global_step": 178020, "epoch": 4238} {"train_loss": -7.168139457702637, "global_step": 178021, "epoch": 4238} {"train_loss": -7.044297695159912, "global_step": 178022, "epoch": 4238} {"train_loss": -7.2242841720581055, "global_step": 178023, "epoch": 4238} {"train_loss": -7.086359977722168, "global_step": 178024, "epoch": 4238} {"train_loss": -7.053316593170166, "global_step": 178025, "epoch": 4238} {"train_loss": -7.06502103805542, "global_step": 178026, "epoch": 4238} {"train_loss": -6.948940753936768, "global_step": 178027, "epoch": 4238} {"train_loss": -7.040417671203613, "global_step": 178028, "epoch": 4238} {"train_loss": -7.04628849029541, "global_step": 178029, "epoch": 4238} {"train_loss": -7.05971622467041, "global_step": 178030, "epoch": 4238} {"train_loss": -6.993126392364502, "global_step": 178031, "epoch": 4238} {"train_loss": -7.135720252990723, "global_step": 178032, "epoch": 4238} {"train_loss": -7.025514602661133, "global_step": 178033, "epoch": 4238} {"train_loss": -7.182703018188477, "global_step": 178034, "epoch": 4238} {"train_loss": -7.04099702835083, "global_step": 178035, "epoch": 4238} {"train_loss": -6.978236198425293, "global_step": 178036, "epoch": 4238} {"train_loss": -7.0866461254301525, "global_step": 178037, "epoch": 4238, "val_loss": 80167.0546875} {"train_loss": -7.092350006103516, "global_step": 178038, "epoch": 4239} {"train_loss": -7.132539749145508, "global_step": 178039, "epoch": 4239} {"train_loss": -7.068934917449951, "global_step": 178040, "epoch": 4239} {"train_loss": -7.078201770782471, "global_step": 178041, "epoch": 4239} {"train_loss": -7.074868679046631, "global_step": 178042, "epoch": 4239} {"train_loss": -7.070605278015137, "global_step": 178043, "epoch": 4239} {"train_loss": -7.096083641052246, "global_step": 178044, "epoch": 4239} {"train_loss": -7.024016380310059, "global_step": 178045, "epoch": 4239} {"train_loss": -7.087305545806885, "global_step": 178046, "epoch": 4239} {"train_loss": -7.033992767333984, "global_step": 178047, "epoch": 4239} {"train_loss": -7.1339335441589355, "global_step": 178048, "epoch": 4239} {"train_loss": -7.141511917114258, "global_step": 178049, "epoch": 4239} {"train_loss": -7.0226287841796875, "global_step": 178050, "epoch": 4239} {"train_loss": -7.234396934509277, "global_step": 178051, "epoch": 4239} {"train_loss": -7.108639717102051, "global_step": 178052, "epoch": 4239} {"train_loss": -7.222748279571533, "global_step": 178053, "epoch": 4239} {"train_loss": -7.14312744140625, "global_step": 178054, "epoch": 4239} {"train_loss": -7.117231369018555, "global_step": 178055, "epoch": 4239} {"train_loss": -7.101567268371582, "global_step": 178056, "epoch": 4239} {"train_loss": -7.160040378570557, "global_step": 178057, "epoch": 4239} {"train_loss": -7.086674213409424, "global_step": 178058, "epoch": 4239} {"train_loss": -7.226822376251221, "global_step": 178059, "epoch": 4239} {"train_loss": -7.110560417175293, "global_step": 178060, "epoch": 4239} {"train_loss": -7.185647487640381, "global_step": 178061, "epoch": 4239} {"train_loss": -7.129477500915527, "global_step": 178062, "epoch": 4239} {"train_loss": -7.0453972816467285, "global_step": 178063, "epoch": 4239} {"train_loss": -7.063744068145752, "global_step": 178064, "epoch": 4239} {"train_loss": -7.112896919250488, "global_step": 178065, "epoch": 4239} {"train_loss": -7.0542497634887695, "global_step": 178066, "epoch": 4239} {"train_loss": -7.109258651733398, "global_step": 178067, "epoch": 4239} {"train_loss": -6.913669586181641, "global_step": 178068, "epoch": 4239} {"train_loss": -7.075207233428955, "global_step": 178069, "epoch": 4239} {"train_loss": -6.964463710784912, "global_step": 178070, "epoch": 4239} {"train_loss": -7.141615867614746, "global_step": 178071, "epoch": 4239} {"train_loss": -7.083255767822266, "global_step": 178072, "epoch": 4239} {"train_loss": -6.938666343688965, "global_step": 178073, "epoch": 4239} {"train_loss": -7.14565372467041, "global_step": 178074, "epoch": 4239} {"train_loss": -6.95206356048584, "global_step": 178075, "epoch": 4239} {"train_loss": -7.007674217224121, "global_step": 178076, "epoch": 4239} {"train_loss": -7.007096290588379, "global_step": 178077, "epoch": 4239} {"train_loss": -7.030545711517334, "global_step": 178078, "epoch": 4239} {"train_loss": -7.084937458946591, "global_step": 178079, "epoch": 4239, "val_loss": 80269.109375} {"train_loss": -6.973764896392822, "global_step": 178080, "epoch": 4240} {"train_loss": -6.971400260925293, "global_step": 178081, "epoch": 4240} {"train_loss": -7.09928035736084, "global_step": 178082, "epoch": 4240} {"train_loss": -7.040998458862305, "global_step": 178083, "epoch": 4240} {"train_loss": -7.14703369140625, "global_step": 178084, "epoch": 4240} {"train_loss": -7.0439772605896, "global_step": 178085, "epoch": 4240} {"train_loss": -7.081835746765137, "global_step": 178086, "epoch": 4240} {"train_loss": -7.08978271484375, "global_step": 178087, "epoch": 4240} {"train_loss": -7.088656425476074, "global_step": 178088, "epoch": 4240} {"train_loss": -7.053743362426758, "global_step": 178089, "epoch": 4240} {"train_loss": -7.086451530456543, "global_step": 178090, "epoch": 4240} {"train_loss": -6.996583938598633, "global_step": 178091, "epoch": 4240} {"train_loss": -7.081884860992432, "global_step": 178092, "epoch": 4240} {"train_loss": -7.079351425170898, "global_step": 178093, "epoch": 4240} {"train_loss": -6.991389274597168, "global_step": 178094, "epoch": 4240} {"train_loss": -7.1773881912231445, "global_step": 178095, "epoch": 4240} {"train_loss": -7.266287803649902, "global_step": 178096, "epoch": 4240} {"train_loss": -7.117900848388672, "global_step": 178097, "epoch": 4240} {"train_loss": -7.010093688964844, "global_step": 178098, "epoch": 4240} {"train_loss": -7.109108924865723, "global_step": 178099, "epoch": 4240} {"train_loss": -7.085559368133545, "global_step": 178100, "epoch": 4240} {"train_loss": -6.970855236053467, "global_step": 178101, "epoch": 4240} {"train_loss": -6.9818878173828125, "global_step": 178102, "epoch": 4240} {"train_loss": -7.143704414367676, "global_step": 178103, "epoch": 4240} {"train_loss": -7.106815338134766, "global_step": 178104, "epoch": 4240} {"train_loss": -7.06334114074707, "global_step": 178105, "epoch": 4240} {"train_loss": -7.057397842407227, "global_step": 178106, "epoch": 4240} {"train_loss": -7.036789894104004, "global_step": 178107, "epoch": 4240} {"train_loss": -6.949919700622559, "global_step": 178108, "epoch": 4240} {"train_loss": -7.190507411956787, "global_step": 178109, "epoch": 4240} {"train_loss": -7.102934837341309, "global_step": 178110, "epoch": 4240} {"train_loss": -7.164648056030273, "global_step": 178111, "epoch": 4240} {"train_loss": -7.100334644317627, "global_step": 178112, "epoch": 4240} {"train_loss": -7.020447731018066, "global_step": 178113, "epoch": 4240} {"train_loss": -7.016533374786377, "global_step": 178114, "epoch": 4240} {"train_loss": -7.028389930725098, "global_step": 178115, "epoch": 4240} {"train_loss": -7.179654121398926, "global_step": 178116, "epoch": 4240} {"train_loss": -6.971807479858398, "global_step": 178117, "epoch": 4240} {"train_loss": -7.092596054077148, "global_step": 178118, "epoch": 4240} {"train_loss": -7.0670623779296875, "global_step": 178119, "epoch": 4240} {"train_loss": -6.97370719909668, "global_step": 178120, "epoch": 4240} {"train_loss": -7.071177005767822, "global_step": 178121, "epoch": 4240, "val_loss": 80327.9375} {"train_loss": -7.081799507141113, "global_step": 178122, "epoch": 4241} {"train_loss": -7.133140563964844, "global_step": 178123, "epoch": 4241} {"train_loss": -7.1273274421691895, "global_step": 178124, "epoch": 4241} {"train_loss": -7.03884744644165, "global_step": 178125, "epoch": 4241} {"train_loss": -7.158495903015137, "global_step": 178126, "epoch": 4241} {"train_loss": -7.038139820098877, "global_step": 178127, "epoch": 4241} {"train_loss": -7.141120910644531, "global_step": 178128, "epoch": 4241} {"train_loss": -7.169414520263672, "global_step": 178129, "epoch": 4241} {"train_loss": -7.061808109283447, "global_step": 178130, "epoch": 4241} {"train_loss": -7.198208808898926, "global_step": 178131, "epoch": 4241} {"train_loss": -7.040144920349121, "global_step": 178132, "epoch": 4241} {"train_loss": -7.148866653442383, "global_step": 178133, "epoch": 4241} {"train_loss": -7.158938407897949, "global_step": 178134, "epoch": 4241} {"train_loss": -7.046531677246094, "global_step": 178135, "epoch": 4241} {"train_loss": -7.063423156738281, "global_step": 178136, "epoch": 4241} {"train_loss": -7.035846710205078, "global_step": 178137, "epoch": 4241} {"train_loss": -6.995595932006836, "global_step": 178138, "epoch": 4241} {"train_loss": -7.297250747680664, "global_step": 178139, "epoch": 4241} {"train_loss": -7.043591499328613, "global_step": 178140, "epoch": 4241} {"train_loss": -7.098117351531982, "global_step": 178141, "epoch": 4241} {"train_loss": -7.150498390197754, "global_step": 178142, "epoch": 4241} {"train_loss": -7.126034736633301, "global_step": 178143, "epoch": 4241} {"train_loss": -7.100207328796387, "global_step": 178144, "epoch": 4241} {"train_loss": -7.185291290283203, "global_step": 178145, "epoch": 4241} {"train_loss": -7.190591812133789, "global_step": 178146, "epoch": 4241} {"train_loss": -7.139331817626953, "global_step": 178147, "epoch": 4241} {"train_loss": -7.113273620605469, "global_step": 178148, "epoch": 4241} {"train_loss": -7.059082508087158, "global_step": 178149, "epoch": 4241} {"train_loss": -7.067050933837891, "global_step": 178150, "epoch": 4241} {"train_loss": -7.129781723022461, "global_step": 178151, "epoch": 4241} {"train_loss": -7.032033920288086, "global_step": 178152, "epoch": 4241} {"train_loss": -7.105840682983398, "global_step": 178153, "epoch": 4241} {"train_loss": -7.03459358215332, "global_step": 178154, "epoch": 4241} {"train_loss": -7.050352573394775, "global_step": 178155, "epoch": 4241} {"train_loss": -7.225371837615967, "global_step": 178156, "epoch": 4241} {"train_loss": -7.081569671630859, "global_step": 178157, "epoch": 4241} {"train_loss": -7.075373649597168, "global_step": 178158, "epoch": 4241} {"train_loss": -6.955728530883789, "global_step": 178159, "epoch": 4241} {"train_loss": -7.114264011383057, "global_step": 178160, "epoch": 4241} {"train_loss": -7.203996181488037, "global_step": 178161, "epoch": 4241} {"train_loss": -7.089136123657227, "global_step": 178162, "epoch": 4241} {"train_loss": -7.104444117773147, "global_step": 178163, "epoch": 4241, "val_loss": 80234.46875} {"train_loss": -7.103653430938721, "global_step": 178164, "epoch": 4242} {"train_loss": -7.088329315185547, "global_step": 178165, "epoch": 4242} {"train_loss": -7.124739646911621, "global_step": 178166, "epoch": 4242} {"train_loss": -7.130393981933594, "global_step": 178167, "epoch": 4242} {"train_loss": -7.170598030090332, "global_step": 178168, "epoch": 4242} {"train_loss": -6.9910054206848145, "global_step": 178169, "epoch": 4242} {"train_loss": -7.114556312561035, "global_step": 178170, "epoch": 4242} {"train_loss": -7.231814861297607, "global_step": 178171, "epoch": 4242} {"train_loss": -7.134851455688477, "global_step": 178172, "epoch": 4242} {"train_loss": -7.118671417236328, "global_step": 178173, "epoch": 4242} {"train_loss": -7.1091766357421875, "global_step": 178174, "epoch": 4242} {"train_loss": -7.127826690673828, "global_step": 178175, "epoch": 4242} {"train_loss": -7.2063140869140625, "global_step": 178176, "epoch": 4242} {"train_loss": -7.028555870056152, "global_step": 178177, "epoch": 4242} {"train_loss": -7.12877893447876, "global_step": 178178, "epoch": 4242} {"train_loss": -7.138672828674316, "global_step": 178179, "epoch": 4242} {"train_loss": -7.166934490203857, "global_step": 178180, "epoch": 4242} {"train_loss": -7.179584980010986, "global_step": 178181, "epoch": 4242} {"train_loss": -7.140219211578369, "global_step": 178182, "epoch": 4242} {"train_loss": -7.200318336486816, "global_step": 178183, "epoch": 4242} {"train_loss": -7.124847412109375, "global_step": 178184, "epoch": 4242} {"train_loss": -7.107850074768066, "global_step": 178185, "epoch": 4242} {"train_loss": -7.101122856140137, "global_step": 178186, "epoch": 4242} {"train_loss": -7.092371463775635, "global_step": 178187, "epoch": 4242} {"train_loss": -7.042932510375977, "global_step": 178188, "epoch": 4242} {"train_loss": -7.112996578216553, "global_step": 178189, "epoch": 4242} {"train_loss": -7.0716705322265625, "global_step": 178190, "epoch": 4242} {"train_loss": -6.998711585998535, "global_step": 178191, "epoch": 4242} {"train_loss": -6.964393138885498, "global_step": 178192, "epoch": 4242} {"train_loss": -7.012231826782227, "global_step": 178193, "epoch": 4242} {"train_loss": -7.012842655181885, "global_step": 178194, "epoch": 4242} {"train_loss": -6.952397346496582, "global_step": 178195, "epoch": 4242} {"train_loss": -7.144330978393555, "global_step": 178196, "epoch": 4242} {"train_loss": -6.975257873535156, "global_step": 178197, "epoch": 4242} {"train_loss": -7.14277458190918, "global_step": 178198, "epoch": 4242} {"train_loss": -7.000917434692383, "global_step": 178199, "epoch": 4242} {"train_loss": -7.134468078613281, "global_step": 178200, "epoch": 4242} {"train_loss": -6.936956405639648, "global_step": 178201, "epoch": 4242} {"train_loss": -7.091463088989258, "global_step": 178202, "epoch": 4242} {"train_loss": -7.033846855163574, "global_step": 178203, "epoch": 4242} {"train_loss": -6.9443864822387695, "global_step": 178204, "epoch": 4242} {"train_loss": -7.089401835487003, "global_step": 178205, "epoch": 4242, "val_loss": 80372.3203125} {"train_loss": -7.08193826675415, "global_step": 178206, "epoch": 4243} {"train_loss": -7.157614707946777, "global_step": 178207, "epoch": 4243} {"train_loss": -6.98018741607666, "global_step": 178208, "epoch": 4243} {"train_loss": -6.846121788024902, "global_step": 178209, "epoch": 4243} {"train_loss": -6.928838729858398, "global_step": 178210, "epoch": 4243} {"train_loss": -7.004755020141602, "global_step": 178211, "epoch": 4243} {"train_loss": -7.042671203613281, "global_step": 178212, "epoch": 4243} {"train_loss": -7.123690605163574, "global_step": 178213, "epoch": 4243} {"train_loss": -6.94869327545166, "global_step": 178214, "epoch": 4243} {"train_loss": -7.157739639282227, "global_step": 178215, "epoch": 4243} {"train_loss": -7.024425506591797, "global_step": 178216, "epoch": 4243} {"train_loss": -7.0809454917907715, "global_step": 178217, "epoch": 4243} {"train_loss": -7.102400302886963, "global_step": 178218, "epoch": 4243} {"train_loss": -7.10060977935791, "global_step": 178219, "epoch": 4243} {"train_loss": -7.1511125564575195, "global_step": 178220, "epoch": 4243} {"train_loss": -7.133031368255615, "global_step": 178221, "epoch": 4243} {"train_loss": -7.153258323669434, "global_step": 178222, "epoch": 4243} {"train_loss": -7.062506198883057, "global_step": 178223, "epoch": 4243} {"train_loss": -7.076385498046875, "global_step": 178224, "epoch": 4243} {"train_loss": -7.080726146697998, "global_step": 178225, "epoch": 4243} {"train_loss": -7.155275821685791, "global_step": 178226, "epoch": 4243} {"train_loss": -7.054079055786133, "global_step": 178227, "epoch": 4243} {"train_loss": -7.172636032104492, "global_step": 178228, "epoch": 4243} {"train_loss": -7.139645576477051, "global_step": 178229, "epoch": 4243} {"train_loss": -7.2084150314331055, "global_step": 178230, "epoch": 4243} {"train_loss": -7.0709028244018555, "global_step": 178231, "epoch": 4243} {"train_loss": -7.071166038513184, "global_step": 178232, "epoch": 4243} {"train_loss": -7.124448776245117, "global_step": 178233, "epoch": 4243} {"train_loss": -7.12783145904541, "global_step": 178234, "epoch": 4243} {"train_loss": -6.960196495056152, "global_step": 178235, "epoch": 4243} {"train_loss": -7.127045154571533, "global_step": 178236, "epoch": 4243} {"train_loss": -7.126867294311523, "global_step": 178237, "epoch": 4243} {"train_loss": -7.108606338500977, "global_step": 178238, "epoch": 4243} {"train_loss": -7.183682441711426, "global_step": 178239, "epoch": 4243} {"train_loss": -7.158272743225098, "global_step": 178240, "epoch": 4243} {"train_loss": -7.205013275146484, "global_step": 178241, "epoch": 4243} {"train_loss": -7.114017486572266, "global_step": 178242, "epoch": 4243} {"train_loss": -7.188631057739258, "global_step": 178243, "epoch": 4243} {"train_loss": -7.163735389709473, "global_step": 178244, "epoch": 4243} {"train_loss": -7.233701705932617, "global_step": 178245, "epoch": 4243} {"train_loss": -7.064034461975098, "global_step": 178246, "epoch": 4243} {"train_loss": -7.097423190162296, "global_step": 178247, "epoch": 4243, "val_loss": 80192.8515625} {"train_loss": -7.219204902648926, "global_step": 178248, "epoch": 4244} {"train_loss": -7.227800369262695, "global_step": 178249, "epoch": 4244} {"train_loss": -7.1562957763671875, "global_step": 178250, "epoch": 4244} {"train_loss": -7.209590911865234, "global_step": 178251, "epoch": 4244} {"train_loss": -7.213184833526611, "global_step": 178252, "epoch": 4244} {"train_loss": -7.164842128753662, "global_step": 178253, "epoch": 4244} {"train_loss": -7.1204729080200195, "global_step": 178254, "epoch": 4244} {"train_loss": -7.102748870849609, "global_step": 178255, "epoch": 4244} {"train_loss": -7.218172073364258, "global_step": 178256, "epoch": 4244} {"train_loss": -7.203774452209473, "global_step": 178257, "epoch": 4244} {"train_loss": -7.022956848144531, "global_step": 178258, "epoch": 4244} {"train_loss": -7.212969779968262, "global_step": 178259, "epoch": 4244} {"train_loss": -7.2434916496276855, "global_step": 178260, "epoch": 4244} {"train_loss": -7.17877197265625, "global_step": 178261, "epoch": 4244} {"train_loss": -7.219676971435547, "global_step": 178262, "epoch": 4244} {"train_loss": -7.251206398010254, "global_step": 178263, "epoch": 4244} {"train_loss": -7.088918685913086, "global_step": 178264, "epoch": 4244} {"train_loss": -7.120771408081055, "global_step": 178265, "epoch": 4244} {"train_loss": -7.077458381652832, "global_step": 178266, "epoch": 4244} {"train_loss": -7.1557230949401855, "global_step": 178267, "epoch": 4244} {"train_loss": -7.083022117614746, "global_step": 178268, "epoch": 4244} {"train_loss": -7.1147308349609375, "global_step": 178269, "epoch": 4244} {"train_loss": -7.160713195800781, "global_step": 178270, "epoch": 4244} {"train_loss": -7.100341320037842, "global_step": 178271, "epoch": 4244} {"train_loss": -7.21428108215332, "global_step": 178272, "epoch": 4244} {"train_loss": -7.060657024383545, "global_step": 178273, "epoch": 4244} {"train_loss": -6.992717742919922, "global_step": 178274, "epoch": 4244} {"train_loss": -7.114005088806152, "global_step": 178275, "epoch": 4244} {"train_loss": -7.124875068664551, "global_step": 178276, "epoch": 4244} {"train_loss": -7.096452713012695, "global_step": 178277, "epoch": 4244} {"train_loss": -7.151325702667236, "global_step": 178278, "epoch": 4244} {"train_loss": -7.0114593505859375, "global_step": 178279, "epoch": 4244} {"train_loss": -7.194523811340332, "global_step": 178280, "epoch": 4244} {"train_loss": -6.99354362487793, "global_step": 178281, "epoch": 4244} {"train_loss": -6.924051761627197, "global_step": 178282, "epoch": 4244} {"train_loss": -7.172759056091309, "global_step": 178283, "epoch": 4244} {"train_loss": -7.0124897956848145, "global_step": 178284, "epoch": 4244} {"train_loss": -7.038300514221191, "global_step": 178285, "epoch": 4244} {"train_loss": -7.060251712799072, "global_step": 178286, "epoch": 4244} {"train_loss": -7.032020092010498, "global_step": 178287, "epoch": 4244} {"train_loss": -7.018261909484863, "global_step": 178288, "epoch": 4244} {"train_loss": -7.123299598693848, "global_step": 178289, "epoch": 4244, "val_loss": 80482.6484375} {"train_loss": -7.138970851898193, "global_step": 178290, "epoch": 4245} {"train_loss": -7.042167663574219, "global_step": 178291, "epoch": 4245} {"train_loss": -7.099764823913574, "global_step": 178292, "epoch": 4245} {"train_loss": -7.122945785522461, "global_step": 178293, "epoch": 4245} {"train_loss": -7.161291122436523, "global_step": 178294, "epoch": 4245} {"train_loss": -7.073678016662598, "global_step": 178295, "epoch": 4245} {"train_loss": -7.064249038696289, "global_step": 178296, "epoch": 4245} {"train_loss": -7.171079635620117, "global_step": 178297, "epoch": 4245} {"train_loss": -7.006932258605957, "global_step": 178298, "epoch": 4245} {"train_loss": -6.994848251342773, "global_step": 178299, "epoch": 4245} {"train_loss": -7.045477390289307, "global_step": 178300, "epoch": 4245} {"train_loss": -7.0705084800720215, "global_step": 178301, "epoch": 4245} {"train_loss": -7.1213788986206055, "global_step": 178302, "epoch": 4245} {"train_loss": -6.883007526397705, "global_step": 178303, "epoch": 4245} {"train_loss": -7.150114059448242, "global_step": 178304, "epoch": 4245} {"train_loss": -6.985821723937988, "global_step": 178305, "epoch": 4245} {"train_loss": -7.065730094909668, "global_step": 178306, "epoch": 4245} {"train_loss": -7.039251327514648, "global_step": 178307, "epoch": 4245} {"train_loss": -7.064306259155273, "global_step": 178308, "epoch": 4245} {"train_loss": -7.027965068817139, "global_step": 178309, "epoch": 4245} {"train_loss": -7.0129618644714355, "global_step": 178310, "epoch": 4245} {"train_loss": -6.956162452697754, "global_step": 178311, "epoch": 4245} {"train_loss": -7.076982021331787, "global_step": 178312, "epoch": 4245} {"train_loss": -6.826262474060059, "global_step": 178313, "epoch": 4245} {"train_loss": -6.894624710083008, "global_step": 178314, "epoch": 4245} {"train_loss": -7.068824291229248, "global_step": 178315, "epoch": 4245} {"train_loss": -6.900061130523682, "global_step": 178316, "epoch": 4245} {"train_loss": -6.956952095031738, "global_step": 178317, "epoch": 4245} {"train_loss": -6.979072570800781, "global_step": 178318, "epoch": 4245} {"train_loss": -6.820407867431641, "global_step": 178319, "epoch": 4245} {"train_loss": -7.022387981414795, "global_step": 178320, "epoch": 4245} {"train_loss": -6.672904014587402, "global_step": 178321, "epoch": 4245} {"train_loss": -6.877270698547363, "global_step": 178322, "epoch": 4245} {"train_loss": -6.941956996917725, "global_step": 178323, "epoch": 4245} {"train_loss": -6.972813606262207, "global_step": 178324, "epoch": 4245} {"train_loss": -6.97963285446167, "global_step": 178325, "epoch": 4245} {"train_loss": -6.995988845825195, "global_step": 178326, "epoch": 4245} {"train_loss": -7.053997039794922, "global_step": 178327, "epoch": 4245} {"train_loss": -6.934839248657227, "global_step": 178328, "epoch": 4245} {"train_loss": -7.004093170166016, "global_step": 178329, "epoch": 4245} {"train_loss": -7.010908603668213, "global_step": 178330, "epoch": 4245} {"train_loss": -7.008881137484596, "global_step": 178331, "epoch": 4245, "val_loss": 80191.6796875} {"train_loss": -7.005836009979248, "global_step": 178332, "epoch": 4246} {"train_loss": -7.100666046142578, "global_step": 178333, "epoch": 4246} {"train_loss": -7.065314292907715, "global_step": 178334, "epoch": 4246} {"train_loss": -7.03849983215332, "global_step": 178335, "epoch": 4246} {"train_loss": -7.164017677307129, "global_step": 178336, "epoch": 4246} {"train_loss": -7.103890419006348, "global_step": 178337, "epoch": 4246} {"train_loss": -7.010684967041016, "global_step": 178338, "epoch": 4246} {"train_loss": -7.099212646484375, "global_step": 178339, "epoch": 4246} {"train_loss": -7.11201810836792, "global_step": 178340, "epoch": 4246} {"train_loss": -7.044425964355469, "global_step": 178341, "epoch": 4246} {"train_loss": -7.006303787231445, "global_step": 178342, "epoch": 4246} {"train_loss": -7.076065540313721, "global_step": 178343, "epoch": 4246} {"train_loss": -7.177130699157715, "global_step": 178344, "epoch": 4246} {"train_loss": -7.072024345397949, "global_step": 178345, "epoch": 4246} {"train_loss": -7.0815629959106445, "global_step": 178346, "epoch": 4246} {"train_loss": -7.156398773193359, "global_step": 178347, "epoch": 4246} {"train_loss": -6.963469982147217, "global_step": 178348, "epoch": 4246} {"train_loss": -7.095409393310547, "global_step": 178349, "epoch": 4246} {"train_loss": -7.160381317138672, "global_step": 178350, "epoch": 4246} {"train_loss": -7.0778679847717285, "global_step": 178351, "epoch": 4246} {"train_loss": -7.192956447601318, "global_step": 178352, "epoch": 4246} {"train_loss": -7.094052314758301, "global_step": 178353, "epoch": 4246} {"train_loss": -7.068255424499512, "global_step": 178354, "epoch": 4246} {"train_loss": -7.177469253540039, "global_step": 178355, "epoch": 4246} {"train_loss": -7.205513000488281, "global_step": 178356, "epoch": 4246} {"train_loss": -7.180569648742676, "global_step": 178357, "epoch": 4246} {"train_loss": -7.207763671875, "global_step": 178358, "epoch": 4246} {"train_loss": -7.1690168380737305, "global_step": 178359, "epoch": 4246} {"train_loss": -7.153293132781982, "global_step": 178360, "epoch": 4246} {"train_loss": -7.179450988769531, "global_step": 178361, "epoch": 4246} {"train_loss": -7.1510419845581055, "global_step": 178362, "epoch": 4246} {"train_loss": -7.275638103485107, "global_step": 178363, "epoch": 4246} {"train_loss": -7.246258735656738, "global_step": 178364, "epoch": 4246} {"train_loss": -7.122759819030762, "global_step": 178365, "epoch": 4246} {"train_loss": -7.109007835388184, "global_step": 178366, "epoch": 4246} {"train_loss": -7.192039489746094, "global_step": 178367, "epoch": 4246} {"train_loss": -7.171955585479736, "global_step": 178368, "epoch": 4246} {"train_loss": -7.224019527435303, "global_step": 178369, "epoch": 4246} {"train_loss": -7.1488847732543945, "global_step": 178370, "epoch": 4246} {"train_loss": -7.21176815032959, "global_step": 178371, "epoch": 4246} {"train_loss": -7.161632061004639, "global_step": 178372, "epoch": 4246} {"train_loss": -7.131348746163504, "global_step": 178373, "epoch": 4246, "val_loss": 80105.53125} {"train_loss": -7.16948127746582, "global_step": 178374, "epoch": 4247} {"train_loss": -7.261211395263672, "global_step": 178375, "epoch": 4247} {"train_loss": -7.341761589050293, "global_step": 178376, "epoch": 4247} {"train_loss": -7.118200302124023, "global_step": 178377, "epoch": 4247} {"train_loss": -7.180520057678223, "global_step": 178378, "epoch": 4247} {"train_loss": -7.2670369148254395, "global_step": 178379, "epoch": 4247} {"train_loss": -7.126214981079102, "global_step": 178380, "epoch": 4247} {"train_loss": -7.120264053344727, "global_step": 178381, "epoch": 4247} {"train_loss": -7.145400047302246, "global_step": 178382, "epoch": 4247} {"train_loss": -7.245702743530273, "global_step": 178383, "epoch": 4247} {"train_loss": -7.086156845092773, "global_step": 178384, "epoch": 4247} {"train_loss": -7.164052963256836, "global_step": 178385, "epoch": 4247} {"train_loss": -7.287272930145264, "global_step": 178386, "epoch": 4247} {"train_loss": -7.227415084838867, "global_step": 178387, "epoch": 4247} {"train_loss": -7.233368873596191, "global_step": 178388, "epoch": 4247} {"train_loss": -7.122332572937012, "global_step": 178389, "epoch": 4247} {"train_loss": -7.300826549530029, "global_step": 178390, "epoch": 4247} {"train_loss": -7.129935264587402, "global_step": 178391, "epoch": 4247} {"train_loss": -7.213621139526367, "global_step": 178392, "epoch": 4247} {"train_loss": -7.198960304260254, "global_step": 178393, "epoch": 4247} {"train_loss": -7.077502727508545, "global_step": 178394, "epoch": 4247} {"train_loss": -7.2467217445373535, "global_step": 178395, "epoch": 4247} {"train_loss": -7.132099628448486, "global_step": 178396, "epoch": 4247} {"train_loss": -7.260301113128662, "global_step": 178397, "epoch": 4247} {"train_loss": -7.283188343048096, "global_step": 178398, "epoch": 4247} {"train_loss": -6.967327117919922, "global_step": 178399, "epoch": 4247} {"train_loss": -7.112336158752441, "global_step": 178400, "epoch": 4247} {"train_loss": -7.093698024749756, "global_step": 178401, "epoch": 4247} {"train_loss": -7.033575057983398, "global_step": 178402, "epoch": 4247} {"train_loss": -6.973536491394043, "global_step": 178403, "epoch": 4247} {"train_loss": -7.03746223449707, "global_step": 178404, "epoch": 4247} {"train_loss": -7.065066337585449, "global_step": 178405, "epoch": 4247} {"train_loss": -7.013577461242676, "global_step": 178406, "epoch": 4247} {"train_loss": -7.188058853149414, "global_step": 178407, "epoch": 4247} {"train_loss": -7.0941572189331055, "global_step": 178408, "epoch": 4247} {"train_loss": -7.144378662109375, "global_step": 178409, "epoch": 4247} {"train_loss": -7.081009864807129, "global_step": 178410, "epoch": 4247} {"train_loss": -7.139230728149414, "global_step": 178411, "epoch": 4247} {"train_loss": -6.999133110046387, "global_step": 178412, "epoch": 4247} {"train_loss": -6.97420597076416, "global_step": 178413, "epoch": 4247} {"train_loss": -7.100166320800781, "global_step": 178414, "epoch": 4247} {"train_loss": -7.1394993123554045, "global_step": 178415, "epoch": 4247, "val_loss": 80388.1796875} {"train_loss": -7.107031345367432, "global_step": 178416, "epoch": 4248} {"train_loss": -7.176393508911133, "global_step": 178417, "epoch": 4248} {"train_loss": -6.978737831115723, "global_step": 178418, "epoch": 4248} {"train_loss": -7.0588154792785645, "global_step": 178419, "epoch": 4248} {"train_loss": -6.951210021972656, "global_step": 178420, "epoch": 4248} {"train_loss": -7.076599597930908, "global_step": 178421, "epoch": 4248} {"train_loss": -6.947587966918945, "global_step": 178422, "epoch": 4248} {"train_loss": -7.0796284675598145, "global_step": 178423, "epoch": 4248} {"train_loss": -7.013106346130371, "global_step": 178424, "epoch": 4248} {"train_loss": -7.034965991973877, "global_step": 178425, "epoch": 4248} {"train_loss": -7.039965629577637, "global_step": 178426, "epoch": 4248} {"train_loss": -6.963006496429443, "global_step": 178427, "epoch": 4248} {"train_loss": -7.013736724853516, "global_step": 178428, "epoch": 4248} {"train_loss": -7.082635879516602, "global_step": 178429, "epoch": 4248} {"train_loss": -7.087053298950195, "global_step": 178430, "epoch": 4248} {"train_loss": -7.091618537902832, "global_step": 178431, "epoch": 4248} {"train_loss": -7.037787437438965, "global_step": 178432, "epoch": 4248} {"train_loss": -7.078317642211914, "global_step": 178433, "epoch": 4248} {"train_loss": -7.037969589233398, "global_step": 178434, "epoch": 4248} {"train_loss": -7.119332313537598, "global_step": 178435, "epoch": 4248} {"train_loss": -7.089040756225586, "global_step": 178436, "epoch": 4248} {"train_loss": -7.025732517242432, "global_step": 178437, "epoch": 4248} {"train_loss": -7.090864181518555, "global_step": 178438, "epoch": 4248} {"train_loss": -7.210328578948975, "global_step": 178439, "epoch": 4248} {"train_loss": -7.193847179412842, "global_step": 178440, "epoch": 4248} {"train_loss": -7.213101863861084, "global_step": 178441, "epoch": 4248} {"train_loss": -7.120662689208984, "global_step": 178442, "epoch": 4248} {"train_loss": -7.203522682189941, "global_step": 178443, "epoch": 4248} {"train_loss": -7.111867427825928, "global_step": 178444, "epoch": 4248} {"train_loss": -7.152281761169434, "global_step": 178445, "epoch": 4248} {"train_loss": -7.202550888061523, "global_step": 178446, "epoch": 4248} {"train_loss": -7.159677982330322, "global_step": 178447, "epoch": 4248} {"train_loss": -7.129731178283691, "global_step": 178448, "epoch": 4248} {"train_loss": -7.20382022857666, "global_step": 178449, "epoch": 4248} {"train_loss": -7.150851249694824, "global_step": 178450, "epoch": 4248} {"train_loss": -7.051136016845703, "global_step": 178451, "epoch": 4248} {"train_loss": -7.132651329040527, "global_step": 178452, "epoch": 4248} {"train_loss": -7.1686930656433105, "global_step": 178453, "epoch": 4248} {"train_loss": -7.027782440185547, "global_step": 178454, "epoch": 4248} {"train_loss": -7.158882141113281, "global_step": 178455, "epoch": 4248} {"train_loss": -7.075263977050781, "global_step": 178456, "epoch": 4248} {"train_loss": -7.095147110167003, "global_step": 178457, "epoch": 4248, "val_loss": 80239.1640625} {"train_loss": -7.125859260559082, "global_step": 178458, "epoch": 4249} {"train_loss": -7.189659118652344, "global_step": 178459, "epoch": 4249} {"train_loss": -7.105837821960449, "global_step": 178460, "epoch": 4249} {"train_loss": -7.147391319274902, "global_step": 178461, "epoch": 4249} {"train_loss": -7.214414596557617, "global_step": 178462, "epoch": 4249} {"train_loss": -7.085151672363281, "global_step": 178463, "epoch": 4249} {"train_loss": -7.1942291259765625, "global_step": 178464, "epoch": 4249} {"train_loss": -7.22268009185791, "global_step": 178465, "epoch": 4249} {"train_loss": -7.130695343017578, "global_step": 178466, "epoch": 4249} {"train_loss": -7.132403373718262, "global_step": 178467, "epoch": 4249} {"train_loss": -7.131847381591797, "global_step": 178468, "epoch": 4249} {"train_loss": -7.111023902893066, "global_step": 178469, "epoch": 4249} {"train_loss": -7.030668258666992, "global_step": 178470, "epoch": 4249} {"train_loss": -7.181802749633789, "global_step": 178471, "epoch": 4249} {"train_loss": -7.183716773986816, "global_step": 178472, "epoch": 4249} {"train_loss": -7.120754241943359, "global_step": 178473, "epoch": 4249} {"train_loss": -7.167696952819824, "global_step": 178474, "epoch": 4249} {"train_loss": -7.065767288208008, "global_step": 178475, "epoch": 4249} {"train_loss": -7.150296688079834, "global_step": 178476, "epoch": 4249} {"train_loss": -7.147760391235352, "global_step": 178477, "epoch": 4249} {"train_loss": -7.109745979309082, "global_step": 178478, "epoch": 4249} {"train_loss": -7.066697120666504, "global_step": 178479, "epoch": 4249} {"train_loss": -7.086373805999756, "global_step": 178480, "epoch": 4249} {"train_loss": -7.0421295166015625, "global_step": 178481, "epoch": 4249} {"train_loss": -7.1610307693481445, "global_step": 178482, "epoch": 4249} {"train_loss": -7.153731346130371, "global_step": 178483, "epoch": 4249} {"train_loss": -7.119603633880615, "global_step": 178484, "epoch": 4249} {"train_loss": -7.172242641448975, "global_step": 178485, "epoch": 4249} {"train_loss": -6.993998050689697, "global_step": 178486, "epoch": 4249} {"train_loss": -7.210204124450684, "global_step": 178487, "epoch": 4249} {"train_loss": -7.016305923461914, "global_step": 178488, "epoch": 4249} {"train_loss": -7.1471710205078125, "global_step": 178489, "epoch": 4249} {"train_loss": -7.118985176086426, "global_step": 178490, "epoch": 4249} {"train_loss": -7.088239669799805, "global_step": 178491, "epoch": 4249} {"train_loss": -7.065559387207031, "global_step": 178492, "epoch": 4249} {"train_loss": -7.200017929077148, "global_step": 178493, "epoch": 4249} {"train_loss": -6.937904357910156, "global_step": 178494, "epoch": 4249} {"train_loss": -7.103718280792236, "global_step": 178495, "epoch": 4249} {"train_loss": -7.124263763427734, "global_step": 178496, "epoch": 4249} {"train_loss": -7.161687850952148, "global_step": 178497, "epoch": 4249} {"train_loss": -6.966596603393555, "global_step": 178498, "epoch": 4249} {"train_loss": -7.117874452045986, "global_step": 178499, "epoch": 4249, "val_loss": 80288.0390625} {"train_loss": -7.1421709060668945, "global_step": 178500, "epoch": 4250} {"train_loss": -7.103130340576172, "global_step": 178501, "epoch": 4250} {"train_loss": -7.041098117828369, "global_step": 178502, "epoch": 4250} {"train_loss": -7.029783725738525, "global_step": 178503, "epoch": 4250} {"train_loss": -6.944892883300781, "global_step": 178504, "epoch": 4250} {"train_loss": -7.108760833740234, "global_step": 178505, "epoch": 4250} {"train_loss": -7.073870658874512, "global_step": 178506, "epoch": 4250} {"train_loss": -7.0149383544921875, "global_step": 178507, "epoch": 4250} {"train_loss": -7.0635576248168945, "global_step": 178508, "epoch": 4250} {"train_loss": -6.887404441833496, "global_step": 178509, "epoch": 4250} {"train_loss": -6.985482215881348, "global_step": 178510, "epoch": 4250} {"train_loss": -7.176312446594238, "global_step": 178511, "epoch": 4250} {"train_loss": -7.011645793914795, "global_step": 178512, "epoch": 4250} {"train_loss": -6.992711544036865, "global_step": 178513, "epoch": 4250} {"train_loss": -6.8903961181640625, "global_step": 178514, "epoch": 4250} {"train_loss": -6.997368335723877, "global_step": 178515, "epoch": 4250} {"train_loss": -7.001954078674316, "global_step": 178516, "epoch": 4250} {"train_loss": -7.00745153427124, "global_step": 178517, "epoch": 4250} {"train_loss": -7.013916015625, "global_step": 178518, "epoch": 4250} {"train_loss": -7.000347137451172, "global_step": 178519, "epoch": 4250} {"train_loss": -7.099061965942383, "global_step": 178520, "epoch": 4250} {"train_loss": -6.926539421081543, "global_step": 178521, "epoch": 4250} {"train_loss": -7.098239898681641, "global_step": 178522, "epoch": 4250} {"train_loss": -7.129990100860596, "global_step": 178523, "epoch": 4250} {"train_loss": -7.012816905975342, "global_step": 178524, "epoch": 4250} {"train_loss": -7.066869735717773, "global_step": 178525, "epoch": 4250} {"train_loss": -7.209039688110352, "global_step": 178526, "epoch": 4250} {"train_loss": -7.108359336853027, "global_step": 178527, "epoch": 4250} {"train_loss": -7.121350288391113, "global_step": 178528, "epoch": 4250} {"train_loss": -7.081766605377197, "global_step": 178529, "epoch": 4250} {"train_loss": -7.114495277404785, "global_step": 178530, "epoch": 4250} {"train_loss": -7.038705348968506, "global_step": 178531, "epoch": 4250} {"train_loss": -7.059048652648926, "global_step": 178532, "epoch": 4250} {"train_loss": -6.9735541343688965, "global_step": 178533, "epoch": 4250} {"train_loss": -6.956265449523926, "global_step": 178534, "epoch": 4250} {"train_loss": -7.097714424133301, "global_step": 178535, "epoch": 4250} {"train_loss": -7.0316314697265625, "global_step": 178536, "epoch": 4250} {"train_loss": -7.007136821746826, "global_step": 178537, "epoch": 4250} {"train_loss": -6.999309062957764, "global_step": 178538, "epoch": 4250} {"train_loss": -7.111483573913574, "global_step": 178539, "epoch": 4250} {"train_loss": -7.012340545654297, "global_step": 178540, "epoch": 4250} {"train_loss": -7.043768224262056, "global_step": 178541, "epoch": 4250, "train/sim_max_reward_0": 0.7573133431895358, "train/sim_max_reward_1": 1.0, "train/sim_max_reward_2": 0.37579671266681675, "train/sim_max_reward_3": 0.14250441426788035, "train/sim_max_reward_4": 0.8772051933294058, "train/sim_max_reward_5": 0.5573079883144144, "test/sim_max_reward_4500000": 0.9114734018672357, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9246466954036385, "test/sim_max_reward_4500003": 0.9319135198928943, "test/sim_max_reward_4500004": 0.1408855946102421, "test/sim_max_reward_4500005": 0.9767603500921124, "test/sim_max_reward_4500006": 0.9928572363923922, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.3144588168508254, "test/sim_max_reward_4500009": 0.05318638823313134, "test/sim_max_reward_4500010": 0.04603215611968801, "test/sim_max_reward_4500011": 0.4821843509490448, "test/sim_max_reward_4500012": 0.8623813694768221, "test/sim_max_reward_4500013": 0.007631603174749365, "test/sim_max_reward_4500014": 0.982921678361623, "test/sim_max_reward_4500015": 0.9566181661554382, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.07473589835439212, "test/sim_max_reward_4500018": 0.9666395294171599, "test/sim_max_reward_4500019": 0.8628219404356232, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8668713157488726, "test/sim_max_reward_4500022": 0.9342224044683984, "test/sim_max_reward_4500023": 0.9218777635420765, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9986850025511911, "test/sim_max_reward_4500026": 0.9345398911751909, "test/sim_max_reward_4500027": 0.9618148577873411, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.10833610304129816, "test/sim_max_reward_4500030": 0.9480387339281094, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.9246099610289709, "test/sim_max_reward_4500035": 0.9805461801440482, "test/sim_max_reward_4500036": 0.4261963842879168, "test/sim_max_reward_4500037": 0.9538727089878184, "test/sim_max_reward_4500038": 0.3393215556868878, "test/sim_max_reward_4500039": 1.0, "test/sim_max_reward_4500040": 0.9520448151675331, "test/sim_max_reward_4500041": 0.843909929476444, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.34483176012217714, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.8519558749113995, "test/sim_max_reward_4500046": 0.20591910157111762, "test/sim_max_reward_4500047": 0.899227224009129, "test/sim_max_reward_4500048": 0.9710605329743186, "test/sim_max_reward_4500049": 0.9598657759963103, "train/mean_score": 0.6183546086280088, "test/mean_score": 0.5813650161272047, "val_loss": 80478.9140625} {"train_loss": -6.9901580810546875, "global_step": 178542, "epoch": 4251} {"train_loss": -6.999652862548828, "global_step": 178543, "epoch": 4251} {"train_loss": -7.181985855102539, "global_step": 178544, "epoch": 4251} {"train_loss": -7.0171284675598145, "global_step": 178545, "epoch": 4251} {"train_loss": -7.16413688659668, "global_step": 178546, "epoch": 4251} {"train_loss": -7.027040481567383, "global_step": 178547, "epoch": 4251} {"train_loss": -7.058701992034912, "global_step": 178548, "epoch": 4251} {"train_loss": -7.017363548278809, "global_step": 178549, "epoch": 4251} {"train_loss": -7.028744697570801, "global_step": 178550, "epoch": 4251} {"train_loss": -7.044998645782471, "global_step": 178551, "epoch": 4251} {"train_loss": -7.172363758087158, "global_step": 178552, "epoch": 4251} {"train_loss": -7.121264457702637, "global_step": 178553, "epoch": 4251} {"train_loss": -7.149561882019043, "global_step": 178554, "epoch": 4251} {"train_loss": -7.1414947509765625, "global_step": 178555, "epoch": 4251} {"train_loss": -7.096391677856445, "global_step": 178556, "epoch": 4251} {"train_loss": -7.231821060180664, "global_step": 178557, "epoch": 4251} {"train_loss": -7.210794925689697, "global_step": 178558, "epoch": 4251} {"train_loss": -7.085053443908691, "global_step": 178559, "epoch": 4251} {"train_loss": -7.051551818847656, "global_step": 178560, "epoch": 4251} {"train_loss": -7.067309379577637, "global_step": 178561, "epoch": 4251} {"train_loss": -7.122413158416748, "global_step": 178562, "epoch": 4251} {"train_loss": -7.175885200500488, "global_step": 178563, "epoch": 4251} {"train_loss": -7.099514961242676, "global_step": 178564, "epoch": 4251} {"train_loss": -7.1556596755981445, "global_step": 178565, "epoch": 4251} {"train_loss": -7.09906530380249, "global_step": 178566, "epoch": 4251} {"train_loss": -7.119923114776611, "global_step": 178567, "epoch": 4251} {"train_loss": -7.163247108459473, "global_step": 178568, "epoch": 4251} {"train_loss": -7.108109474182129, "global_step": 178569, "epoch": 4251} {"train_loss": -7.127053737640381, "global_step": 178570, "epoch": 4251} {"train_loss": -7.120381832122803, "global_step": 178571, "epoch": 4251} {"train_loss": -7.197383880615234, "global_step": 178572, "epoch": 4251} {"train_loss": -7.1168084144592285, "global_step": 178573, "epoch": 4251} {"train_loss": -7.22677755355835, "global_step": 178574, "epoch": 4251} {"train_loss": -7.173169136047363, "global_step": 178575, "epoch": 4251} {"train_loss": -7.100922584533691, "global_step": 178576, "epoch": 4251} {"train_loss": -7.283724308013916, "global_step": 178577, "epoch": 4251} {"train_loss": -7.252119064331055, "global_step": 178578, "epoch": 4251} {"train_loss": -7.227550983428955, "global_step": 178579, "epoch": 4251} {"train_loss": -7.1304779052734375, "global_step": 178580, "epoch": 4251} {"train_loss": -7.076665878295898, "global_step": 178581, "epoch": 4251} {"train_loss": -7.077419281005859, "global_step": 178582, "epoch": 4251} {"train_loss": -7.124899171647572, "global_step": 178583, "epoch": 4251, "val_loss": 80400.59375} {"train_loss": -7.122757911682129, "global_step": 178584, "epoch": 4252} {"train_loss": -7.2861528396606445, "global_step": 178585, "epoch": 4252} {"train_loss": -7.237988471984863, "global_step": 178586, "epoch": 4252} {"train_loss": -7.074063301086426, "global_step": 178587, "epoch": 4252} {"train_loss": -7.173553466796875, "global_step": 178588, "epoch": 4252} {"train_loss": -7.127171516418457, "global_step": 178589, "epoch": 4252} {"train_loss": -7.1877360343933105, "global_step": 178590, "epoch": 4252} {"train_loss": -7.243988037109375, "global_step": 178591, "epoch": 4252} {"train_loss": -7.292624473571777, "global_step": 178592, "epoch": 4252} {"train_loss": -7.214977264404297, "global_step": 178593, "epoch": 4252} {"train_loss": -7.232977867126465, "global_step": 178594, "epoch": 4252} {"train_loss": -7.31558084487915, "global_step": 178595, "epoch": 4252} {"train_loss": -7.078454971313477, "global_step": 178596, "epoch": 4252} {"train_loss": -7.172143936157227, "global_step": 178597, "epoch": 4252} {"train_loss": -7.045228958129883, "global_step": 178598, "epoch": 4252} {"train_loss": -7.117860317230225, "global_step": 178599, "epoch": 4252} {"train_loss": -7.126153945922852, "global_step": 178600, "epoch": 4252} {"train_loss": -7.146447658538818, "global_step": 178601, "epoch": 4252} {"train_loss": -7.1495866775512695, "global_step": 178602, "epoch": 4252} {"train_loss": -7.242180824279785, "global_step": 178603, "epoch": 4252} {"train_loss": -7.250560283660889, "global_step": 178604, "epoch": 4252} {"train_loss": -6.9144182205200195, "global_step": 178605, "epoch": 4252} {"train_loss": -7.085890293121338, "global_step": 178606, "epoch": 4252} {"train_loss": -7.218159198760986, "global_step": 178607, "epoch": 4252} {"train_loss": -7.0052080154418945, "global_step": 178608, "epoch": 4252} {"train_loss": -7.19335412979126, "global_step": 178609, "epoch": 4252} {"train_loss": -7.173614501953125, "global_step": 178610, "epoch": 4252} {"train_loss": -7.043502330780029, "global_step": 178611, "epoch": 4252} {"train_loss": -7.078661918640137, "global_step": 178612, "epoch": 4252} {"train_loss": -7.211664199829102, "global_step": 178613, "epoch": 4252} {"train_loss": -6.9721221923828125, "global_step": 178614, "epoch": 4252} {"train_loss": -7.215173721313477, "global_step": 178615, "epoch": 4252} {"train_loss": -7.030667781829834, "global_step": 178616, "epoch": 4252} {"train_loss": -7.165121555328369, "global_step": 178617, "epoch": 4252} {"train_loss": -7.110450744628906, "global_step": 178618, "epoch": 4252} {"train_loss": -7.018337249755859, "global_step": 178619, "epoch": 4252} {"train_loss": -7.134021759033203, "global_step": 178620, "epoch": 4252} {"train_loss": -7.111090183258057, "global_step": 178621, "epoch": 4252} {"train_loss": -7.137886047363281, "global_step": 178622, "epoch": 4252} {"train_loss": -6.911996841430664, "global_step": 178623, "epoch": 4252} {"train_loss": -7.008946418762207, "global_step": 178624, "epoch": 4252} {"train_loss": -7.135659955796742, "global_step": 178625, "epoch": 4252, "val_loss": 80436.09375} {"train_loss": -7.057086944580078, "global_step": 178626, "epoch": 4253} {"train_loss": -7.189459800720215, "global_step": 178627, "epoch": 4253} {"train_loss": -7.075029373168945, "global_step": 178628, "epoch": 4253} {"train_loss": -7.0750532150268555, "global_step": 178629, "epoch": 4253} {"train_loss": -6.99288272857666, "global_step": 178630, "epoch": 4253} {"train_loss": -6.926506042480469, "global_step": 178631, "epoch": 4253} {"train_loss": -7.13953161239624, "global_step": 178632, "epoch": 4253} {"train_loss": -7.162345886230469, "global_step": 178633, "epoch": 4253} {"train_loss": -7.088352203369141, "global_step": 178634, "epoch": 4253} {"train_loss": -7.0496745109558105, "global_step": 178635, "epoch": 4253} {"train_loss": -7.010551452636719, "global_step": 178636, "epoch": 4253} {"train_loss": -7.208718299865723, "global_step": 178637, "epoch": 4253} {"train_loss": -7.04067325592041, "global_step": 178638, "epoch": 4253} {"train_loss": -7.125818252563477, "global_step": 178639, "epoch": 4253} {"train_loss": -7.156598091125488, "global_step": 178640, "epoch": 4253} {"train_loss": -7.148218154907227, "global_step": 178641, "epoch": 4253} {"train_loss": -7.075148582458496, "global_step": 178642, "epoch": 4253} {"train_loss": -7.245378494262695, "global_step": 178643, "epoch": 4253} {"train_loss": -7.009592056274414, "global_step": 178644, "epoch": 4253} {"train_loss": -7.171438217163086, "global_step": 178645, "epoch": 4253} {"train_loss": -7.186638832092285, "global_step": 178646, "epoch": 4253} {"train_loss": -7.02675724029541, "global_step": 178647, "epoch": 4253} {"train_loss": -7.101408958435059, "global_step": 178648, "epoch": 4253} {"train_loss": -7.242444038391113, "global_step": 178649, "epoch": 4253} {"train_loss": -7.078729629516602, "global_step": 178650, "epoch": 4253} {"train_loss": -7.179753303527832, "global_step": 178651, "epoch": 4253} {"train_loss": -7.164645195007324, "global_step": 178652, "epoch": 4253} {"train_loss": -7.162478923797607, "global_step": 178653, "epoch": 4253} {"train_loss": -7.11390495300293, "global_step": 178654, "epoch": 4253} {"train_loss": -7.1238555908203125, "global_step": 178655, "epoch": 4253} {"train_loss": -7.131261825561523, "global_step": 178656, "epoch": 4253} {"train_loss": -7.172298431396484, "global_step": 178657, "epoch": 4253} {"train_loss": -7.131405830383301, "global_step": 178658, "epoch": 4253} {"train_loss": -7.073946475982666, "global_step": 178659, "epoch": 4253} {"train_loss": -6.985688209533691, "global_step": 178660, "epoch": 4253} {"train_loss": -7.042791366577148, "global_step": 178661, "epoch": 4253} {"train_loss": -7.220802307128906, "global_step": 178662, "epoch": 4253} {"train_loss": -6.938788414001465, "global_step": 178663, "epoch": 4253} {"train_loss": -7.019700050354004, "global_step": 178664, "epoch": 4253} {"train_loss": -7.096460342407227, "global_step": 178665, "epoch": 4253} {"train_loss": -7.014472007751465, "global_step": 178666, "epoch": 4253} {"train_loss": -7.100666977110363, "global_step": 178667, "epoch": 4253, "val_loss": 80299.3515625} {"train_loss": -7.0471272468566895, "global_step": 178668, "epoch": 4254} {"train_loss": -7.125733375549316, "global_step": 178669, "epoch": 4254} {"train_loss": -7.130202770233154, "global_step": 178670, "epoch": 4254} {"train_loss": -7.0084733963012695, "global_step": 178671, "epoch": 4254} {"train_loss": -7.129311561584473, "global_step": 178672, "epoch": 4254} {"train_loss": -7.120372295379639, "global_step": 178673, "epoch": 4254} {"train_loss": -7.09373664855957, "global_step": 178674, "epoch": 4254} {"train_loss": -7.110301971435547, "global_step": 178675, "epoch": 4254} {"train_loss": -7.146357536315918, "global_step": 178676, "epoch": 4254} {"train_loss": -7.057079315185547, "global_step": 178677, "epoch": 4254} {"train_loss": -7.224152565002441, "global_step": 178678, "epoch": 4254} {"train_loss": -7.169033527374268, "global_step": 178679, "epoch": 4254} {"train_loss": -7.21016788482666, "global_step": 178680, "epoch": 4254} {"train_loss": -7.246708393096924, "global_step": 178681, "epoch": 4254} {"train_loss": -7.111630916595459, "global_step": 178682, "epoch": 4254} {"train_loss": -7.184761047363281, "global_step": 178683, "epoch": 4254} {"train_loss": -7.1899003982543945, "global_step": 178684, "epoch": 4254} {"train_loss": -7.069652080535889, "global_step": 178685, "epoch": 4254} {"train_loss": -7.038403511047363, "global_step": 178686, "epoch": 4254} {"train_loss": -7.1555070877075195, "global_step": 178687, "epoch": 4254} {"train_loss": -7.03399658203125, "global_step": 178688, "epoch": 4254} {"train_loss": -7.109763145446777, "global_step": 178689, "epoch": 4254} {"train_loss": -7.149151802062988, "global_step": 178690, "epoch": 4254} {"train_loss": -7.150740623474121, "global_step": 178691, "epoch": 4254} {"train_loss": -7.132311820983887, "global_step": 178692, "epoch": 4254} {"train_loss": -7.166226863861084, "global_step": 178693, "epoch": 4254} {"train_loss": -7.1122331619262695, "global_step": 178694, "epoch": 4254} {"train_loss": -7.138769149780273, "global_step": 178695, "epoch": 4254} {"train_loss": -7.101738929748535, "global_step": 178696, "epoch": 4254} {"train_loss": -7.201238632202148, "global_step": 178697, "epoch": 4254} {"train_loss": -7.242753028869629, "global_step": 178698, "epoch": 4254} {"train_loss": -7.205606937408447, "global_step": 178699, "epoch": 4254} {"train_loss": -7.077700138092041, "global_step": 178700, "epoch": 4254} {"train_loss": -7.036850929260254, "global_step": 178701, "epoch": 4254} {"train_loss": -7.175665855407715, "global_step": 178702, "epoch": 4254} {"train_loss": -6.8710222244262695, "global_step": 178703, "epoch": 4254} {"train_loss": -7.054416179656982, "global_step": 178704, "epoch": 4254} {"train_loss": -7.189255237579346, "global_step": 178705, "epoch": 4254} {"train_loss": -6.905783653259277, "global_step": 178706, "epoch": 4254} {"train_loss": -7.058531761169434, "global_step": 178707, "epoch": 4254} {"train_loss": -7.09688663482666, "global_step": 178708, "epoch": 4254} {"train_loss": -7.113465502148583, "global_step": 178709, "epoch": 4254, "val_loss": 80480.7109375} {"train_loss": -7.0535125732421875, "global_step": 178710, "epoch": 4255} {"train_loss": -7.045519828796387, "global_step": 178711, "epoch": 4255} {"train_loss": -7.085907936096191, "global_step": 178712, "epoch": 4255} {"train_loss": -6.831521034240723, "global_step": 178713, "epoch": 4255} {"train_loss": -7.001496315002441, "global_step": 178714, "epoch": 4255} {"train_loss": -7.038869857788086, "global_step": 178715, "epoch": 4255} {"train_loss": -7.028090000152588, "global_step": 178716, "epoch": 4255} {"train_loss": -7.1360368728637695, "global_step": 178717, "epoch": 4255} {"train_loss": -6.9524664878845215, "global_step": 178718, "epoch": 4255} {"train_loss": -7.136420726776123, "global_step": 178719, "epoch": 4255} {"train_loss": -7.181801795959473, "global_step": 178720, "epoch": 4255} {"train_loss": -7.088072776794434, "global_step": 178721, "epoch": 4255} {"train_loss": -6.931486129760742, "global_step": 178722, "epoch": 4255} {"train_loss": -7.1600494384765625, "global_step": 178723, "epoch": 4255} {"train_loss": -7.030156135559082, "global_step": 178724, "epoch": 4255} {"train_loss": -7.123647689819336, "global_step": 178725, "epoch": 4255} {"train_loss": -7.078025817871094, "global_step": 178726, "epoch": 4255} {"train_loss": -7.099358558654785, "global_step": 178727, "epoch": 4255} {"train_loss": -7.042236804962158, "global_step": 178728, "epoch": 4255} {"train_loss": -7.035475254058838, "global_step": 178729, "epoch": 4255} {"train_loss": -7.102171897888184, "global_step": 178730, "epoch": 4255} {"train_loss": -7.036712646484375, "global_step": 178731, "epoch": 4255} {"train_loss": -7.030647277832031, "global_step": 178732, "epoch": 4255} {"train_loss": -7.008172035217285, "global_step": 178733, "epoch": 4255} {"train_loss": -7.079270362854004, "global_step": 178734, "epoch": 4255} {"train_loss": -7.1200056076049805, "global_step": 178735, "epoch": 4255} {"train_loss": -7.095149040222168, "global_step": 178736, "epoch": 4255} {"train_loss": -7.029090881347656, "global_step": 178737, "epoch": 4255} {"train_loss": -7.100571632385254, "global_step": 178738, "epoch": 4255} {"train_loss": -7.0190300941467285, "global_step": 178739, "epoch": 4255} {"train_loss": -7.085981845855713, "global_step": 178740, "epoch": 4255} {"train_loss": -7.049923896789551, "global_step": 178741, "epoch": 4255} {"train_loss": -7.204669952392578, "global_step": 178742, "epoch": 4255} {"train_loss": -7.194953441619873, "global_step": 178743, "epoch": 4255} {"train_loss": -7.153235912322998, "global_step": 178744, "epoch": 4255} {"train_loss": -7.064615726470947, "global_step": 178745, "epoch": 4255} {"train_loss": -7.142821311950684, "global_step": 178746, "epoch": 4255} {"train_loss": -7.0273637771606445, "global_step": 178747, "epoch": 4255} {"train_loss": -6.989357948303223, "global_step": 178748, "epoch": 4255} {"train_loss": -7.131856441497803, "global_step": 178749, "epoch": 4255} {"train_loss": -7.141297340393066, "global_step": 178750, "epoch": 4255} {"train_loss": -7.070470730463664, "global_step": 178751, "epoch": 4255, "val_loss": 80348.6328125} {"train_loss": -7.1940016746521, "global_step": 178752, "epoch": 4256} {"train_loss": -6.975196838378906, "global_step": 178753, "epoch": 4256} {"train_loss": -7.168766975402832, "global_step": 178754, "epoch": 4256} {"train_loss": -7.195029258728027, "global_step": 178755, "epoch": 4256} {"train_loss": -7.118053436279297, "global_step": 178756, "epoch": 4256} {"train_loss": -7.129461288452148, "global_step": 178757, "epoch": 4256} {"train_loss": -7.088360786437988, "global_step": 178758, "epoch": 4256} {"train_loss": -7.068743705749512, "global_step": 178759, "epoch": 4256} {"train_loss": -7.184920787811279, "global_step": 178760, "epoch": 4256} {"train_loss": -7.059774398803711, "global_step": 178761, "epoch": 4256} {"train_loss": -7.1752214431762695, "global_step": 178762, "epoch": 4256} {"train_loss": -7.114937782287598, "global_step": 178763, "epoch": 4256} {"train_loss": -7.090186595916748, "global_step": 178764, "epoch": 4256} {"train_loss": -7.116501808166504, "global_step": 178765, "epoch": 4256} {"train_loss": -7.13470458984375, "global_step": 178766, "epoch": 4256} {"train_loss": -7.1438398361206055, "global_step": 178767, "epoch": 4256} {"train_loss": -7.135883331298828, "global_step": 178768, "epoch": 4256} {"train_loss": -7.086887359619141, "global_step": 178769, "epoch": 4256} {"train_loss": -7.048752784729004, "global_step": 178770, "epoch": 4256} {"train_loss": -7.223679542541504, "global_step": 178771, "epoch": 4256} {"train_loss": -6.985630989074707, "global_step": 178772, "epoch": 4256} {"train_loss": -7.169826984405518, "global_step": 178773, "epoch": 4256} {"train_loss": -7.1473565101623535, "global_step": 178774, "epoch": 4256} {"train_loss": -7.13768196105957, "global_step": 178775, "epoch": 4256} {"train_loss": -7.254971504211426, "global_step": 178776, "epoch": 4256} {"train_loss": -7.193161964416504, "global_step": 178777, "epoch": 4256} {"train_loss": -7.186936378479004, "global_step": 178778, "epoch": 4256} {"train_loss": -7.14995813369751, "global_step": 178779, "epoch": 4256} {"train_loss": -7.116426467895508, "global_step": 178780, "epoch": 4256} {"train_loss": -7.125235557556152, "global_step": 178781, "epoch": 4256} {"train_loss": -7.212525367736816, "global_step": 178782, "epoch": 4256} {"train_loss": -7.107021331787109, "global_step": 178783, "epoch": 4256} {"train_loss": -7.090965270996094, "global_step": 178784, "epoch": 4256} {"train_loss": -7.131890296936035, "global_step": 178785, "epoch": 4256} {"train_loss": -7.047988414764404, "global_step": 178786, "epoch": 4256} {"train_loss": -7.145377159118652, "global_step": 178787, "epoch": 4256} {"train_loss": -7.160101890563965, "global_step": 178788, "epoch": 4256} {"train_loss": -7.124858856201172, "global_step": 178789, "epoch": 4256} {"train_loss": -7.069915294647217, "global_step": 178790, "epoch": 4256} {"train_loss": -7.0201215744018555, "global_step": 178791, "epoch": 4256} {"train_loss": -7.166747093200684, "global_step": 178792, "epoch": 4256} {"train_loss": -7.128989912214733, "global_step": 178793, "epoch": 4256, "val_loss": 80537.3515625} {"train_loss": -7.155615329742432, "global_step": 178794, "epoch": 4257} {"train_loss": -7.163470268249512, "global_step": 178795, "epoch": 4257} {"train_loss": -7.0872344970703125, "global_step": 178796, "epoch": 4257} {"train_loss": -7.002107620239258, "global_step": 178797, "epoch": 4257} {"train_loss": -7.234921455383301, "global_step": 178798, "epoch": 4257} {"train_loss": -7.051369667053223, "global_step": 178799, "epoch": 4257} {"train_loss": -7.035611152648926, "global_step": 178800, "epoch": 4257} {"train_loss": -7.119359493255615, "global_step": 178801, "epoch": 4257} {"train_loss": -6.940892696380615, "global_step": 178802, "epoch": 4257} {"train_loss": -7.0629801750183105, "global_step": 178803, "epoch": 4257} {"train_loss": -7.14083194732666, "global_step": 178804, "epoch": 4257} {"train_loss": -7.062802791595459, "global_step": 178805, "epoch": 4257} {"train_loss": -7.154088020324707, "global_step": 178806, "epoch": 4257} {"train_loss": -7.0849409103393555, "global_step": 178807, "epoch": 4257} {"train_loss": -7.0261688232421875, "global_step": 178808, "epoch": 4257} {"train_loss": -6.902704238891602, "global_step": 178809, "epoch": 4257} {"train_loss": -7.052024841308594, "global_step": 178810, "epoch": 4257} {"train_loss": -7.02586555480957, "global_step": 178811, "epoch": 4257} {"train_loss": -7.055612564086914, "global_step": 178812, "epoch": 4257} {"train_loss": -7.103705883026123, "global_step": 178813, "epoch": 4257} {"train_loss": -7.0090718269348145, "global_step": 178814, "epoch": 4257} {"train_loss": -7.155794143676758, "global_step": 178815, "epoch": 4257} {"train_loss": -7.047216892242432, "global_step": 178816, "epoch": 4257} {"train_loss": -7.156230926513672, "global_step": 178817, "epoch": 4257} {"train_loss": -7.164109706878662, "global_step": 178818, "epoch": 4257} {"train_loss": -6.999874114990234, "global_step": 178819, "epoch": 4257} {"train_loss": -7.003590106964111, "global_step": 178820, "epoch": 4257} {"train_loss": -7.007338523864746, "global_step": 178821, "epoch": 4257} {"train_loss": -7.087541580200195, "global_step": 178822, "epoch": 4257} {"train_loss": -7.0434699058532715, "global_step": 178823, "epoch": 4257} {"train_loss": -7.139092445373535, "global_step": 178824, "epoch": 4257} {"train_loss": -7.118793487548828, "global_step": 178825, "epoch": 4257} {"train_loss": -7.05399227142334, "global_step": 178826, "epoch": 4257} {"train_loss": -7.113516330718994, "global_step": 178827, "epoch": 4257} {"train_loss": -7.0255327224731445, "global_step": 178828, "epoch": 4257} {"train_loss": -7.152338027954102, "global_step": 178829, "epoch": 4257} {"train_loss": -7.190167427062988, "global_step": 178830, "epoch": 4257} {"train_loss": -7.068233013153076, "global_step": 178831, "epoch": 4257} {"train_loss": -7.148608207702637, "global_step": 178832, "epoch": 4257} {"train_loss": -7.117551803588867, "global_step": 178833, "epoch": 4257} {"train_loss": -7.180706977844238, "global_step": 178834, "epoch": 4257} {"train_loss": -7.08566157023112, "global_step": 178835, "epoch": 4257, "val_loss": 80306.5078125} {"train_loss": -7.154088020324707, "global_step": 178836, "epoch": 4258} {"train_loss": -7.075954437255859, "global_step": 178837, "epoch": 4258} {"train_loss": -7.112049102783203, "global_step": 178838, "epoch": 4258} {"train_loss": -7.034438133239746, "global_step": 178839, "epoch": 4258} {"train_loss": -7.045831680297852, "global_step": 178840, "epoch": 4258} {"train_loss": -7.13444709777832, "global_step": 178841, "epoch": 4258} {"train_loss": -7.214260101318359, "global_step": 178842, "epoch": 4258} {"train_loss": -7.0999040603637695, "global_step": 178843, "epoch": 4258} {"train_loss": -7.108807563781738, "global_step": 178844, "epoch": 4258} {"train_loss": -7.061142921447754, "global_step": 178845, "epoch": 4258} {"train_loss": -7.031999588012695, "global_step": 178846, "epoch": 4258} {"train_loss": -7.184868812561035, "global_step": 178847, "epoch": 4258} {"train_loss": -6.993694305419922, "global_step": 178848, "epoch": 4258} {"train_loss": -7.057500839233398, "global_step": 178849, "epoch": 4258} {"train_loss": -7.1484293937683105, "global_step": 178850, "epoch": 4258} {"train_loss": -7.087453842163086, "global_step": 178851, "epoch": 4258} {"train_loss": -7.15422248840332, "global_step": 178852, "epoch": 4258} {"train_loss": -7.134358882904053, "global_step": 178853, "epoch": 4258} {"train_loss": -7.215394973754883, "global_step": 178854, "epoch": 4258} {"train_loss": -7.134193420410156, "global_step": 178855, "epoch": 4258} {"train_loss": -7.161230087280273, "global_step": 178856, "epoch": 4258} {"train_loss": -7.044683933258057, "global_step": 178857, "epoch": 4258} {"train_loss": -7.111278533935547, "global_step": 178858, "epoch": 4258} {"train_loss": -7.021085262298584, "global_step": 178859, "epoch": 4258} {"train_loss": -7.035385608673096, "global_step": 178860, "epoch": 4258} {"train_loss": -7.213220119476318, "global_step": 178861, "epoch": 4258} {"train_loss": -7.088101387023926, "global_step": 178862, "epoch": 4258} {"train_loss": -7.13625431060791, "global_step": 178863, "epoch": 4258} {"train_loss": -7.209173202514648, "global_step": 178864, "epoch": 4258} {"train_loss": -7.129786968231201, "global_step": 178865, "epoch": 4258} {"train_loss": -7.168479919433594, "global_step": 178866, "epoch": 4258} {"train_loss": -7.260324478149414, "global_step": 178867, "epoch": 4258} {"train_loss": -7.056626319885254, "global_step": 178868, "epoch": 4258} {"train_loss": -7.095516204833984, "global_step": 178869, "epoch": 4258} {"train_loss": -7.066658020019531, "global_step": 178870, "epoch": 4258} {"train_loss": -6.9795331954956055, "global_step": 178871, "epoch": 4258} {"train_loss": -7.1766462326049805, "global_step": 178872, "epoch": 4258} {"train_loss": -7.098995208740234, "global_step": 178873, "epoch": 4258} {"train_loss": -7.136775016784668, "global_step": 178874, "epoch": 4258} {"train_loss": -7.083684921264648, "global_step": 178875, "epoch": 4258} {"train_loss": -6.970037460327148, "global_step": 178876, "epoch": 4258} {"train_loss": -7.109845967519851, "global_step": 178877, "epoch": 4258, "val_loss": 80447.4453125} {"train_loss": -7.08366584777832, "global_step": 178878, "epoch": 4259} {"train_loss": -7.101558685302734, "global_step": 178879, "epoch": 4259} {"train_loss": -7.195737838745117, "global_step": 178880, "epoch": 4259} {"train_loss": -7.047800064086914, "global_step": 178881, "epoch": 4259} {"train_loss": -7.1393232345581055, "global_step": 178882, "epoch": 4259} {"train_loss": -7.036665439605713, "global_step": 178883, "epoch": 4259} {"train_loss": -7.191291332244873, "global_step": 178884, "epoch": 4259} {"train_loss": -7.237367630004883, "global_step": 178885, "epoch": 4259} {"train_loss": -7.170357704162598, "global_step": 178886, "epoch": 4259} {"train_loss": -7.106996059417725, "global_step": 178887, "epoch": 4259} {"train_loss": -7.067018985748291, "global_step": 178888, "epoch": 4259} {"train_loss": -7.191683769226074, "global_step": 178889, "epoch": 4259} {"train_loss": -7.081720352172852, "global_step": 178890, "epoch": 4259} {"train_loss": -7.038646221160889, "global_step": 178891, "epoch": 4259} {"train_loss": -7.09261417388916, "global_step": 178892, "epoch": 4259} {"train_loss": -7.036378860473633, "global_step": 178893, "epoch": 4259} {"train_loss": -7.124058246612549, "global_step": 178894, "epoch": 4259} {"train_loss": -7.184353828430176, "global_step": 178895, "epoch": 4259} {"train_loss": -7.183979511260986, "global_step": 178896, "epoch": 4259} {"train_loss": -7.233001708984375, "global_step": 178897, "epoch": 4259} {"train_loss": -7.044647216796875, "global_step": 178898, "epoch": 4259} {"train_loss": -7.177103042602539, "global_step": 178899, "epoch": 4259} {"train_loss": -7.133870601654053, "global_step": 178900, "epoch": 4259} {"train_loss": -7.182896614074707, "global_step": 178901, "epoch": 4259} {"train_loss": -7.104330062866211, "global_step": 178902, "epoch": 4259} {"train_loss": -7.124073028564453, "global_step": 178903, "epoch": 4259} {"train_loss": -7.031683921813965, "global_step": 178904, "epoch": 4259} {"train_loss": -7.076581001281738, "global_step": 178905, "epoch": 4259} {"train_loss": -7.136158466339111, "global_step": 178906, "epoch": 4259} {"train_loss": -7.124581813812256, "global_step": 178907, "epoch": 4259} {"train_loss": -7.238885402679443, "global_step": 178908, "epoch": 4259} {"train_loss": -7.03394889831543, "global_step": 178909, "epoch": 4259} {"train_loss": -7.169197082519531, "global_step": 178910, "epoch": 4259} {"train_loss": -7.098763465881348, "global_step": 178911, "epoch": 4259} {"train_loss": -7.189042568206787, "global_step": 178912, "epoch": 4259} {"train_loss": -7.169308662414551, "global_step": 178913, "epoch": 4259} {"train_loss": -7.159162521362305, "global_step": 178914, "epoch": 4259} {"train_loss": -7.194048881530762, "global_step": 178915, "epoch": 4259} {"train_loss": -7.1899261474609375, "global_step": 178916, "epoch": 4259} {"train_loss": -7.21696662902832, "global_step": 178917, "epoch": 4259} {"train_loss": -7.22540807723999, "global_step": 178918, "epoch": 4259} {"train_loss": -7.137783254895892, "global_step": 178919, "epoch": 4259, "val_loss": 80297.96875} {"train_loss": -7.154107570648193, "global_step": 178920, "epoch": 4260} {"train_loss": -7.135951042175293, "global_step": 178921, "epoch": 4260} {"train_loss": -7.21054744720459, "global_step": 178922, "epoch": 4260} {"train_loss": -7.333559989929199, "global_step": 178923, "epoch": 4260} {"train_loss": -7.1204514503479, "global_step": 178924, "epoch": 4260} {"train_loss": -7.124046325683594, "global_step": 178925, "epoch": 4260} {"train_loss": -7.040785789489746, "global_step": 178926, "epoch": 4260} {"train_loss": -7.22787618637085, "global_step": 178927, "epoch": 4260} {"train_loss": -7.298837661743164, "global_step": 178928, "epoch": 4260} {"train_loss": -7.194225311279297, "global_step": 178929, "epoch": 4260} {"train_loss": -7.144713878631592, "global_step": 178930, "epoch": 4260} {"train_loss": -7.112187385559082, "global_step": 178931, "epoch": 4260} {"train_loss": -7.144073009490967, "global_step": 178932, "epoch": 4260} {"train_loss": -7.23076057434082, "global_step": 178933, "epoch": 4260} {"train_loss": -7.264497756958008, "global_step": 178934, "epoch": 4260} {"train_loss": -7.203062534332275, "global_step": 178935, "epoch": 4260} {"train_loss": -7.232172966003418, "global_step": 178936, "epoch": 4260} {"train_loss": -7.21891450881958, "global_step": 178937, "epoch": 4260} {"train_loss": -7.318508148193359, "global_step": 178938, "epoch": 4260} {"train_loss": -7.283437728881836, "global_step": 178939, "epoch": 4260} {"train_loss": -7.237705707550049, "global_step": 178940, "epoch": 4260} {"train_loss": -7.210740566253662, "global_step": 178941, "epoch": 4260} {"train_loss": -7.077661037445068, "global_step": 178942, "epoch": 4260} {"train_loss": -7.124154090881348, "global_step": 178943, "epoch": 4260} {"train_loss": -7.144989967346191, "global_step": 178944, "epoch": 4260} {"train_loss": -7.2044548988342285, "global_step": 178945, "epoch": 4260} {"train_loss": -7.086487770080566, "global_step": 178946, "epoch": 4260} {"train_loss": -7.0145721435546875, "global_step": 178947, "epoch": 4260} {"train_loss": -7.194042205810547, "global_step": 178948, "epoch": 4260} {"train_loss": -7.06298828125, "global_step": 178949, "epoch": 4260} {"train_loss": -7.0566205978393555, "global_step": 178950, "epoch": 4260} {"train_loss": -7.19396448135376, "global_step": 178951, "epoch": 4260} {"train_loss": -7.146012306213379, "global_step": 178952, "epoch": 4260} {"train_loss": -7.124948978424072, "global_step": 178953, "epoch": 4260} {"train_loss": -7.11970853805542, "global_step": 178954, "epoch": 4260} {"train_loss": -7.160237789154053, "global_step": 178955, "epoch": 4260} {"train_loss": -7.031957626342773, "global_step": 178956, "epoch": 4260} {"train_loss": -7.10063362121582, "global_step": 178957, "epoch": 4260} {"train_loss": -7.006777763366699, "global_step": 178958, "epoch": 4260} {"train_loss": -7.0302734375, "global_step": 178959, "epoch": 4260} {"train_loss": -7.0790205001831055, "global_step": 178960, "epoch": 4260} {"train_loss": -7.155791101001558, "global_step": 178961, "epoch": 4260, "val_loss": 80525.390625} {"train_loss": -7.180464267730713, "global_step": 178962, "epoch": 4261} {"train_loss": -7.052324295043945, "global_step": 178963, "epoch": 4261} {"train_loss": -7.0492377281188965, "global_step": 178964, "epoch": 4261} {"train_loss": -7.054848670959473, "global_step": 178965, "epoch": 4261} {"train_loss": -7.1201395988464355, "global_step": 178966, "epoch": 4261} {"train_loss": -7.081271171569824, "global_step": 178967, "epoch": 4261} {"train_loss": -7.076086044311523, "global_step": 178968, "epoch": 4261} {"train_loss": -7.134368896484375, "global_step": 178969, "epoch": 4261} {"train_loss": -7.152806282043457, "global_step": 178970, "epoch": 4261} {"train_loss": -6.98585319519043, "global_step": 178971, "epoch": 4261} {"train_loss": -7.03182315826416, "global_step": 178972, "epoch": 4261} {"train_loss": -7.154873847961426, "global_step": 178973, "epoch": 4261} {"train_loss": -7.05340576171875, "global_step": 178974, "epoch": 4261} {"train_loss": -7.045869827270508, "global_step": 178975, "epoch": 4261} {"train_loss": -7.017657279968262, "global_step": 178976, "epoch": 4261} {"train_loss": -6.961587905883789, "global_step": 178977, "epoch": 4261} {"train_loss": -6.951089859008789, "global_step": 178978, "epoch": 4261} {"train_loss": -7.096621990203857, "global_step": 178979, "epoch": 4261} {"train_loss": -7.124704837799072, "global_step": 178980, "epoch": 4261} {"train_loss": -7.101737022399902, "global_step": 178981, "epoch": 4261} {"train_loss": -6.972526550292969, "global_step": 178982, "epoch": 4261} {"train_loss": -7.096632957458496, "global_step": 178983, "epoch": 4261} {"train_loss": -7.128049373626709, "global_step": 178984, "epoch": 4261} {"train_loss": -7.0154924392700195, "global_step": 178985, "epoch": 4261} {"train_loss": -7.131396293640137, "global_step": 178986, "epoch": 4261} {"train_loss": -7.055525779724121, "global_step": 178987, "epoch": 4261} {"train_loss": -7.057832717895508, "global_step": 178988, "epoch": 4261} {"train_loss": -7.108864784240723, "global_step": 178989, "epoch": 4261} {"train_loss": -7.073741912841797, "global_step": 178990, "epoch": 4261} {"train_loss": -7.102546691894531, "global_step": 178991, "epoch": 4261} {"train_loss": -7.162515163421631, "global_step": 178992, "epoch": 4261} {"train_loss": -7.042726993560791, "global_step": 178993, "epoch": 4261} {"train_loss": -7.08070182800293, "global_step": 178994, "epoch": 4261} {"train_loss": -7.017273426055908, "global_step": 178995, "epoch": 4261} {"train_loss": -7.172045707702637, "global_step": 178996, "epoch": 4261} {"train_loss": -7.070914268493652, "global_step": 178997, "epoch": 4261} {"train_loss": -7.136914253234863, "global_step": 178998, "epoch": 4261} {"train_loss": -7.066390514373779, "global_step": 178999, "epoch": 4261} {"train_loss": -7.080845355987549, "global_step": 179000, "epoch": 4261} {"train_loss": -7.157242774963379, "global_step": 179001, "epoch": 4261} {"train_loss": -7.045783996582031, "global_step": 179002, "epoch": 4261} {"train_loss": -7.080957730611165, "global_step": 179003, "epoch": 4261, "val_loss": 80272.9609375} {"train_loss": -7.011638164520264, "global_step": 179004, "epoch": 4262} {"train_loss": -7.121063232421875, "global_step": 179005, "epoch": 4262} {"train_loss": -7.121703624725342, "global_step": 179006, "epoch": 4262} {"train_loss": -7.0852556228637695, "global_step": 179007, "epoch": 4262} {"train_loss": -7.085341453552246, "global_step": 179008, "epoch": 4262} {"train_loss": -7.044244289398193, "global_step": 179009, "epoch": 4262} {"train_loss": -7.126360893249512, "global_step": 179010, "epoch": 4262} {"train_loss": -7.223845481872559, "global_step": 179011, "epoch": 4262} {"train_loss": -7.114866256713867, "global_step": 179012, "epoch": 4262} {"train_loss": -7.217779159545898, "global_step": 179013, "epoch": 4262} {"train_loss": -7.055227756500244, "global_step": 179014, "epoch": 4262} {"train_loss": -7.111446380615234, "global_step": 179015, "epoch": 4262} {"train_loss": -7.004220962524414, "global_step": 179016, "epoch": 4262} {"train_loss": -7.015725135803223, "global_step": 179017, "epoch": 4262} {"train_loss": -7.124380588531494, "global_step": 179018, "epoch": 4262} {"train_loss": -6.8470377922058105, "global_step": 179019, "epoch": 4262} {"train_loss": -7.126082420349121, "global_step": 179020, "epoch": 4262} {"train_loss": -7.077083587646484, "global_step": 179021, "epoch": 4262} {"train_loss": -7.274465560913086, "global_step": 179022, "epoch": 4262} {"train_loss": -7.04171085357666, "global_step": 179023, "epoch": 4262} {"train_loss": -7.065974712371826, "global_step": 179024, "epoch": 4262} {"train_loss": -7.0926666259765625, "global_step": 179025, "epoch": 4262} {"train_loss": -7.061216354370117, "global_step": 179026, "epoch": 4262} {"train_loss": -7.131425857543945, "global_step": 179027, "epoch": 4262} {"train_loss": -7.035496711730957, "global_step": 179028, "epoch": 4262} {"train_loss": -7.067481517791748, "global_step": 179029, "epoch": 4262} {"train_loss": -7.17498254776001, "global_step": 179030, "epoch": 4262} {"train_loss": -7.0586090087890625, "global_step": 179031, "epoch": 4262} {"train_loss": -7.046826362609863, "global_step": 179032, "epoch": 4262} {"train_loss": -7.129019737243652, "global_step": 179033, "epoch": 4262} {"train_loss": -7.051411151885986, "global_step": 179034, "epoch": 4262} {"train_loss": -7.213352680206299, "global_step": 179035, "epoch": 4262} {"train_loss": -7.161808013916016, "global_step": 179036, "epoch": 4262} {"train_loss": -7.034125328063965, "global_step": 179037, "epoch": 4262} {"train_loss": -6.938250541687012, "global_step": 179038, "epoch": 4262} {"train_loss": -7.085685729980469, "global_step": 179039, "epoch": 4262} {"train_loss": -7.012895107269287, "global_step": 179040, "epoch": 4262} {"train_loss": -7.055122375488281, "global_step": 179041, "epoch": 4262} {"train_loss": -7.050044536590576, "global_step": 179042, "epoch": 4262} {"train_loss": -7.0610151290893555, "global_step": 179043, "epoch": 4262} {"train_loss": -7.016138076782227, "global_step": 179044, "epoch": 4262} {"train_loss": -7.079064425967989, "global_step": 179045, "epoch": 4262, "val_loss": 80325.4375} {"train_loss": -7.116584777832031, "global_step": 179046, "epoch": 4263} {"train_loss": -7.008575439453125, "global_step": 179047, "epoch": 4263} {"train_loss": -7.126465797424316, "global_step": 179048, "epoch": 4263} {"train_loss": -7.1493611335754395, "global_step": 179049, "epoch": 4263} {"train_loss": -7.187674522399902, "global_step": 179050, "epoch": 4263} {"train_loss": -7.16970682144165, "global_step": 179051, "epoch": 4263} {"train_loss": -7.101323127746582, "global_step": 179052, "epoch": 4263} {"train_loss": -7.234454154968262, "global_step": 179053, "epoch": 4263} {"train_loss": -7.232515335083008, "global_step": 179054, "epoch": 4263} {"train_loss": -7.17661190032959, "global_step": 179055, "epoch": 4263} {"train_loss": -7.153590202331543, "global_step": 179056, "epoch": 4263} {"train_loss": -7.247674942016602, "global_step": 179057, "epoch": 4263} {"train_loss": -7.159603118896484, "global_step": 179058, "epoch": 4263} {"train_loss": -7.19165563583374, "global_step": 179059, "epoch": 4263} {"train_loss": -7.134797096252441, "global_step": 179060, "epoch": 4263} {"train_loss": -7.179132461547852, "global_step": 179061, "epoch": 4263} {"train_loss": -7.174959182739258, "global_step": 179062, "epoch": 4263} {"train_loss": -7.184706687927246, "global_step": 179063, "epoch": 4263} {"train_loss": -7.14313268661499, "global_step": 179064, "epoch": 4263} {"train_loss": -7.109255790710449, "global_step": 179065, "epoch": 4263} {"train_loss": -7.103118896484375, "global_step": 179066, "epoch": 4263} {"train_loss": -7.007458686828613, "global_step": 179067, "epoch": 4263} {"train_loss": -7.202823638916016, "global_step": 179068, "epoch": 4263} {"train_loss": -7.124258518218994, "global_step": 179069, "epoch": 4263} {"train_loss": -7.017635345458984, "global_step": 179070, "epoch": 4263} {"train_loss": -7.189813613891602, "global_step": 179071, "epoch": 4263} {"train_loss": -7.16810941696167, "global_step": 179072, "epoch": 4263} {"train_loss": -7.139422416687012, "global_step": 179073, "epoch": 4263} {"train_loss": -7.153496742248535, "global_step": 179074, "epoch": 4263} {"train_loss": -7.139312744140625, "global_step": 179075, "epoch": 4263} {"train_loss": -7.106172561645508, "global_step": 179076, "epoch": 4263} {"train_loss": -7.041088104248047, "global_step": 179077, "epoch": 4263} {"train_loss": -7.20753288269043, "global_step": 179078, "epoch": 4263} {"train_loss": -7.135643005371094, "global_step": 179079, "epoch": 4263} {"train_loss": -7.119149208068848, "global_step": 179080, "epoch": 4263} {"train_loss": -7.1793975830078125, "global_step": 179081, "epoch": 4263} {"train_loss": -7.21453857421875, "global_step": 179082, "epoch": 4263} {"train_loss": -7.142445087432861, "global_step": 179083, "epoch": 4263} {"train_loss": -7.032243251800537, "global_step": 179084, "epoch": 4263} {"train_loss": -7.186949729919434, "global_step": 179085, "epoch": 4263} {"train_loss": -7.171506881713867, "global_step": 179086, "epoch": 4263} {"train_loss": -7.145090988704136, "global_step": 179087, "epoch": 4263, "val_loss": 80229.4921875} {"train_loss": -7.316247940063477, "global_step": 179088, "epoch": 4264} {"train_loss": -7.21855354309082, "global_step": 179089, "epoch": 4264} {"train_loss": -7.163021564483643, "global_step": 179090, "epoch": 4264} {"train_loss": -7.20041561126709, "global_step": 179091, "epoch": 4264} {"train_loss": -7.045812129974365, "global_step": 179092, "epoch": 4264} {"train_loss": -6.982935428619385, "global_step": 179093, "epoch": 4264} {"train_loss": -7.092856407165527, "global_step": 179094, "epoch": 4264} {"train_loss": -7.054712295532227, "global_step": 179095, "epoch": 4264} {"train_loss": -7.118559837341309, "global_step": 179096, "epoch": 4264} {"train_loss": -7.068380355834961, "global_step": 179097, "epoch": 4264} {"train_loss": -6.98587703704834, "global_step": 179098, "epoch": 4264} {"train_loss": -7.010749816894531, "global_step": 179099, "epoch": 4264} {"train_loss": -6.976193428039551, "global_step": 179100, "epoch": 4264} {"train_loss": -6.976698398590088, "global_step": 179101, "epoch": 4264} {"train_loss": -6.996002197265625, "global_step": 179102, "epoch": 4264} {"train_loss": -7.006202220916748, "global_step": 179103, "epoch": 4264} {"train_loss": -7.078264236450195, "global_step": 179104, "epoch": 4264} {"train_loss": -7.139718055725098, "global_step": 179105, "epoch": 4264} {"train_loss": -6.857487678527832, "global_step": 179106, "epoch": 4264} {"train_loss": -7.027873992919922, "global_step": 179107, "epoch": 4264} {"train_loss": -7.006213665008545, "global_step": 179108, "epoch": 4264} {"train_loss": -7.0242156982421875, "global_step": 179109, "epoch": 4264} {"train_loss": -7.0117106437683105, "global_step": 179110, "epoch": 4264} {"train_loss": -6.8560991287231445, "global_step": 179111, "epoch": 4264} {"train_loss": -6.995635986328125, "global_step": 179112, "epoch": 4264} {"train_loss": -6.962517738342285, "global_step": 179113, "epoch": 4264} {"train_loss": -7.105609893798828, "global_step": 179114, "epoch": 4264} {"train_loss": -7.042893409729004, "global_step": 179115, "epoch": 4264} {"train_loss": -7.072974681854248, "global_step": 179116, "epoch": 4264} {"train_loss": -7.029107093811035, "global_step": 179117, "epoch": 4264} {"train_loss": -7.016867637634277, "global_step": 179118, "epoch": 4264} {"train_loss": -7.119401931762695, "global_step": 179119, "epoch": 4264} {"train_loss": -7.047461986541748, "global_step": 179120, "epoch": 4264} {"train_loss": -7.179880142211914, "global_step": 179121, "epoch": 4264} {"train_loss": -7.086812973022461, "global_step": 179122, "epoch": 4264} {"train_loss": -7.1554951667785645, "global_step": 179123, "epoch": 4264} {"train_loss": -7.083683967590332, "global_step": 179124, "epoch": 4264} {"train_loss": -7.093935012817383, "global_step": 179125, "epoch": 4264} {"train_loss": -7.152692794799805, "global_step": 179126, "epoch": 4264} {"train_loss": -7.207805633544922, "global_step": 179127, "epoch": 4264} {"train_loss": -7.1745452880859375, "global_step": 179128, "epoch": 4264} {"train_loss": -7.067681028729393, "global_step": 179129, "epoch": 4264, "val_loss": 80308.1484375} {"train_loss": -7.154648780822754, "global_step": 179130, "epoch": 4265} {"train_loss": -7.002765655517578, "global_step": 179131, "epoch": 4265} {"train_loss": -7.065598487854004, "global_step": 179132, "epoch": 4265} {"train_loss": -7.18176794052124, "global_step": 179133, "epoch": 4265} {"train_loss": -7.093812942504883, "global_step": 179134, "epoch": 4265} {"train_loss": -7.205425262451172, "global_step": 179135, "epoch": 4265} {"train_loss": -7.309979438781738, "global_step": 179136, "epoch": 4265} {"train_loss": -7.279632568359375, "global_step": 179137, "epoch": 4265} {"train_loss": -7.26255989074707, "global_step": 179138, "epoch": 4265} {"train_loss": -7.269186019897461, "global_step": 179139, "epoch": 4265} {"train_loss": -7.199372291564941, "global_step": 179140, "epoch": 4265} {"train_loss": -7.219825267791748, "global_step": 179141, "epoch": 4265} {"train_loss": -7.198404312133789, "global_step": 179142, "epoch": 4265} {"train_loss": -7.224286079406738, "global_step": 179143, "epoch": 4265} {"train_loss": -7.268925666809082, "global_step": 179144, "epoch": 4265} {"train_loss": -7.2732744216918945, "global_step": 179145, "epoch": 4265} {"train_loss": -7.163812637329102, "global_step": 179146, "epoch": 4265} {"train_loss": -6.980072021484375, "global_step": 179147, "epoch": 4265} {"train_loss": -7.125417709350586, "global_step": 179148, "epoch": 4265} {"train_loss": -7.128166198730469, "global_step": 179149, "epoch": 4265} {"train_loss": -7.101960182189941, "global_step": 179150, "epoch": 4265} {"train_loss": -7.072166919708252, "global_step": 179151, "epoch": 4265} {"train_loss": -7.086735248565674, "global_step": 179152, "epoch": 4265} {"train_loss": -7.184060096740723, "global_step": 179153, "epoch": 4265} {"train_loss": -7.169026851654053, "global_step": 179154, "epoch": 4265} {"train_loss": -7.206566333770752, "global_step": 179155, "epoch": 4265} {"train_loss": -7.244162082672119, "global_step": 179156, "epoch": 4265} {"train_loss": -7.196653842926025, "global_step": 179157, "epoch": 4265} {"train_loss": -7.14101505279541, "global_step": 179158, "epoch": 4265} {"train_loss": -7.201087951660156, "global_step": 179159, "epoch": 4265} {"train_loss": -7.231558799743652, "global_step": 179160, "epoch": 4265} {"train_loss": -7.14225435256958, "global_step": 179161, "epoch": 4265} {"train_loss": -7.175934791564941, "global_step": 179162, "epoch": 4265} {"train_loss": -7.071044921875, "global_step": 179163, "epoch": 4265} {"train_loss": -7.218717098236084, "global_step": 179164, "epoch": 4265} {"train_loss": -7.098581790924072, "global_step": 179165, "epoch": 4265} {"train_loss": -7.1650390625, "global_step": 179166, "epoch": 4265} {"train_loss": -7.2109551429748535, "global_step": 179167, "epoch": 4265} {"train_loss": -7.023492336273193, "global_step": 179168, "epoch": 4265} {"train_loss": -7.131547927856445, "global_step": 179169, "epoch": 4265} {"train_loss": -7.117603302001953, "global_step": 179170, "epoch": 4265} {"train_loss": -7.16480142729623, "global_step": 179171, "epoch": 4265, "val_loss": 80170.3984375} {"train_loss": -7.052579402923584, "global_step": 179172, "epoch": 4266} {"train_loss": -7.128231048583984, "global_step": 179173, "epoch": 4266} {"train_loss": -6.965209007263184, "global_step": 179174, "epoch": 4266} {"train_loss": -7.125632286071777, "global_step": 179175, "epoch": 4266} {"train_loss": -6.975301742553711, "global_step": 179176, "epoch": 4266} {"train_loss": -7.210827827453613, "global_step": 179177, "epoch": 4266} {"train_loss": -7.265636444091797, "global_step": 179178, "epoch": 4266} {"train_loss": -7.044279098510742, "global_step": 179179, "epoch": 4266} {"train_loss": -7.110109329223633, "global_step": 179180, "epoch": 4266} {"train_loss": -7.133268356323242, "global_step": 179181, "epoch": 4266} {"train_loss": -7.015006065368652, "global_step": 179182, "epoch": 4266} {"train_loss": -6.987489700317383, "global_step": 179183, "epoch": 4266} {"train_loss": -7.118518829345703, "global_step": 179184, "epoch": 4266} {"train_loss": -6.928807258605957, "global_step": 179185, "epoch": 4266} {"train_loss": -6.892534255981445, "global_step": 179186, "epoch": 4266} {"train_loss": -6.921164035797119, "global_step": 179187, "epoch": 4266} {"train_loss": -6.713346481323242, "global_step": 179188, "epoch": 4266} {"train_loss": -6.962400436401367, "global_step": 179189, "epoch": 4266} {"train_loss": -7.110684394836426, "global_step": 179190, "epoch": 4266} {"train_loss": -6.921341896057129, "global_step": 179191, "epoch": 4266} {"train_loss": -7.089287757873535, "global_step": 179192, "epoch": 4266} {"train_loss": -6.930064678192139, "global_step": 179193, "epoch": 4266} {"train_loss": -7.12466287612915, "global_step": 179194, "epoch": 4266} {"train_loss": -7.147401332855225, "global_step": 179195, "epoch": 4266} {"train_loss": -6.982120513916016, "global_step": 179196, "epoch": 4266} {"train_loss": -7.14893913269043, "global_step": 179197, "epoch": 4266} {"train_loss": -7.0892333984375, "global_step": 179198, "epoch": 4266} {"train_loss": -7.049925804138184, "global_step": 179199, "epoch": 4266} {"train_loss": -7.07327127456665, "global_step": 179200, "epoch": 4266} {"train_loss": -7.131735324859619, "global_step": 179201, "epoch": 4266} {"train_loss": -7.140368461608887, "global_step": 179202, "epoch": 4266} {"train_loss": -7.184309005737305, "global_step": 179203, "epoch": 4266} {"train_loss": -7.040251731872559, "global_step": 179204, "epoch": 4266} {"train_loss": -7.1620025634765625, "global_step": 179205, "epoch": 4266} {"train_loss": -7.257749557495117, "global_step": 179206, "epoch": 4266} {"train_loss": -7.254825115203857, "global_step": 179207, "epoch": 4266} {"train_loss": -7.084944248199463, "global_step": 179208, "epoch": 4266} {"train_loss": -7.258041858673096, "global_step": 179209, "epoch": 4266} {"train_loss": -7.058176040649414, "global_step": 179210, "epoch": 4266} {"train_loss": -7.172368049621582, "global_step": 179211, "epoch": 4266} {"train_loss": -7.147549629211426, "global_step": 179212, "epoch": 4266} {"train_loss": -7.078491086051578, "global_step": 179213, "epoch": 4266, "val_loss": 80370.8125} {"train_loss": -7.054300308227539, "global_step": 179214, "epoch": 4267} {"train_loss": -7.078998565673828, "global_step": 179215, "epoch": 4267} {"train_loss": -7.199118614196777, "global_step": 179216, "epoch": 4267} {"train_loss": -7.0493364334106445, "global_step": 179217, "epoch": 4267} {"train_loss": -7.17564582824707, "global_step": 179218, "epoch": 4267} {"train_loss": -7.135735511779785, "global_step": 179219, "epoch": 4267} {"train_loss": -7.176101207733154, "global_step": 179220, "epoch": 4267} {"train_loss": -7.155804634094238, "global_step": 179221, "epoch": 4267} {"train_loss": -7.17593240737915, "global_step": 179222, "epoch": 4267} {"train_loss": -7.057682514190674, "global_step": 179223, "epoch": 4267} {"train_loss": -7.229840278625488, "global_step": 179224, "epoch": 4267} {"train_loss": -7.120983600616455, "global_step": 179225, "epoch": 4267} {"train_loss": -6.956025123596191, "global_step": 179226, "epoch": 4267} {"train_loss": -7.198808670043945, "global_step": 179227, "epoch": 4267} {"train_loss": -7.178912162780762, "global_step": 179228, "epoch": 4267} {"train_loss": -7.075490951538086, "global_step": 179229, "epoch": 4267} {"train_loss": -7.0814924240112305, "global_step": 179230, "epoch": 4267} {"train_loss": -7.038207054138184, "global_step": 179231, "epoch": 4267} {"train_loss": -7.188841819763184, "global_step": 179232, "epoch": 4267} {"train_loss": -7.112651824951172, "global_step": 179233, "epoch": 4267} {"train_loss": -7.034168243408203, "global_step": 179234, "epoch": 4267} {"train_loss": -7.222422122955322, "global_step": 179235, "epoch": 4267} {"train_loss": -7.211520671844482, "global_step": 179236, "epoch": 4267} {"train_loss": -7.0288405418396, "global_step": 179237, "epoch": 4267} {"train_loss": -7.113900184631348, "global_step": 179238, "epoch": 4267} {"train_loss": -7.148192405700684, "global_step": 179239, "epoch": 4267} {"train_loss": -7.104302406311035, "global_step": 179240, "epoch": 4267} {"train_loss": -7.098928451538086, "global_step": 179241, "epoch": 4267} {"train_loss": -7.202775955200195, "global_step": 179242, "epoch": 4267} {"train_loss": -7.197882652282715, "global_step": 179243, "epoch": 4267} {"train_loss": -7.110058784484863, "global_step": 179244, "epoch": 4267} {"train_loss": -7.180855751037598, "global_step": 179245, "epoch": 4267} {"train_loss": -7.214973449707031, "global_step": 179246, "epoch": 4267} {"train_loss": -7.164533615112305, "global_step": 179247, "epoch": 4267} {"train_loss": -7.103304386138916, "global_step": 179248, "epoch": 4267} {"train_loss": -7.12667989730835, "global_step": 179249, "epoch": 4267} {"train_loss": -7.187291622161865, "global_step": 179250, "epoch": 4267} {"train_loss": -7.135404586791992, "global_step": 179251, "epoch": 4267} {"train_loss": -7.117710113525391, "global_step": 179252, "epoch": 4267} {"train_loss": -7.102724552154541, "global_step": 179253, "epoch": 4267} {"train_loss": -7.174569606781006, "global_step": 179254, "epoch": 4267} {"train_loss": -7.131190084275746, "global_step": 179255, "epoch": 4267, "val_loss": 80580.1484375} {"train_loss": -7.200743675231934, "global_step": 179256, "epoch": 4268} {"train_loss": -7.199753761291504, "global_step": 179257, "epoch": 4268} {"train_loss": -7.12766170501709, "global_step": 179258, "epoch": 4268} {"train_loss": -7.063436985015869, "global_step": 179259, "epoch": 4268} {"train_loss": -7.098483562469482, "global_step": 179260, "epoch": 4268} {"train_loss": -7.144057750701904, "global_step": 179261, "epoch": 4268} {"train_loss": -7.121105194091797, "global_step": 179262, "epoch": 4268} {"train_loss": -7.238911151885986, "global_step": 179263, "epoch": 4268} {"train_loss": -7.1378326416015625, "global_step": 179264, "epoch": 4268} {"train_loss": -7.198620796203613, "global_step": 179265, "epoch": 4268} {"train_loss": -7.146281719207764, "global_step": 179266, "epoch": 4268} {"train_loss": -7.187205791473389, "global_step": 179267, "epoch": 4268} {"train_loss": -7.219593048095703, "global_step": 179268, "epoch": 4268} {"train_loss": -7.041724681854248, "global_step": 179269, "epoch": 4268} {"train_loss": -7.104395866394043, "global_step": 179270, "epoch": 4268} {"train_loss": -7.079571723937988, "global_step": 179271, "epoch": 4268} {"train_loss": -7.216383934020996, "global_step": 179272, "epoch": 4268} {"train_loss": -7.0431671142578125, "global_step": 179273, "epoch": 4268} {"train_loss": -7.225183010101318, "global_step": 179274, "epoch": 4268} {"train_loss": -7.048829555511475, "global_step": 179275, "epoch": 4268} {"train_loss": -7.1355485916137695, "global_step": 179276, "epoch": 4268} {"train_loss": -7.077594757080078, "global_step": 179277, "epoch": 4268} {"train_loss": -7.1994123458862305, "global_step": 179278, "epoch": 4268} {"train_loss": -7.073094844818115, "global_step": 179279, "epoch": 4268} {"train_loss": -7.193776607513428, "global_step": 179280, "epoch": 4268} {"train_loss": -7.116143226623535, "global_step": 179281, "epoch": 4268} {"train_loss": -7.208517074584961, "global_step": 179282, "epoch": 4268} {"train_loss": -6.982677459716797, "global_step": 179283, "epoch": 4268} {"train_loss": -7.121874809265137, "global_step": 179284, "epoch": 4268} {"train_loss": -7.184820652008057, "global_step": 179285, "epoch": 4268} {"train_loss": -7.017972469329834, "global_step": 179286, "epoch": 4268} {"train_loss": -7.1300458908081055, "global_step": 179287, "epoch": 4268} {"train_loss": -7.077653884887695, "global_step": 179288, "epoch": 4268} {"train_loss": -7.071017265319824, "global_step": 179289, "epoch": 4268} {"train_loss": -7.035481929779053, "global_step": 179290, "epoch": 4268} {"train_loss": -7.0640082359313965, "global_step": 179291, "epoch": 4268} {"train_loss": -6.913419723510742, "global_step": 179292, "epoch": 4268} {"train_loss": -7.049838066101074, "global_step": 179293, "epoch": 4268} {"train_loss": -7.024074554443359, "global_step": 179294, "epoch": 4268} {"train_loss": -7.061214447021484, "global_step": 179295, "epoch": 4268} {"train_loss": -7.196215629577637, "global_step": 179296, "epoch": 4268} {"train_loss": -7.113908279509771, "global_step": 179297, "epoch": 4268, "val_loss": 80351.515625} {"train_loss": -7.036374092102051, "global_step": 179298, "epoch": 4269} {"train_loss": -7.0918989181518555, "global_step": 179299, "epoch": 4269} {"train_loss": -7.019363880157471, "global_step": 179300, "epoch": 4269} {"train_loss": -7.156208038330078, "global_step": 179301, "epoch": 4269} {"train_loss": -7.159614086151123, "global_step": 179302, "epoch": 4269} {"train_loss": -7.154711723327637, "global_step": 179303, "epoch": 4269} {"train_loss": -7.151352882385254, "global_step": 179304, "epoch": 4269} {"train_loss": -6.998538970947266, "global_step": 179305, "epoch": 4269} {"train_loss": -7.084356307983398, "global_step": 179306, "epoch": 4269} {"train_loss": -7.093308448791504, "global_step": 179307, "epoch": 4269} {"train_loss": -7.1426897048950195, "global_step": 179308, "epoch": 4269} {"train_loss": -7.085425853729248, "global_step": 179309, "epoch": 4269} {"train_loss": -7.151290416717529, "global_step": 179310, "epoch": 4269} {"train_loss": -7.158611297607422, "global_step": 179311, "epoch": 4269} {"train_loss": -7.10598087310791, "global_step": 179312, "epoch": 4269} {"train_loss": -7.093889236450195, "global_step": 179313, "epoch": 4269} {"train_loss": -7.197675704956055, "global_step": 179314, "epoch": 4269} {"train_loss": -7.169132709503174, "global_step": 179315, "epoch": 4269} {"train_loss": -7.122318267822266, "global_step": 179316, "epoch": 4269} {"train_loss": -7.149430274963379, "global_step": 179317, "epoch": 4269} {"train_loss": -7.122914791107178, "global_step": 179318, "epoch": 4269} {"train_loss": -7.104460716247559, "global_step": 179319, "epoch": 4269} {"train_loss": -7.185070514678955, "global_step": 179320, "epoch": 4269} {"train_loss": -7.218103408813477, "global_step": 179321, "epoch": 4269} {"train_loss": -7.0398125648498535, "global_step": 179322, "epoch": 4269} {"train_loss": -7.098961353302002, "global_step": 179323, "epoch": 4269} {"train_loss": -7.268767356872559, "global_step": 179324, "epoch": 4269} {"train_loss": -7.071585655212402, "global_step": 179325, "epoch": 4269} {"train_loss": -7.143726348876953, "global_step": 179326, "epoch": 4269} {"train_loss": -7.1752142906188965, "global_step": 179327, "epoch": 4269} {"train_loss": -7.228955268859863, "global_step": 179328, "epoch": 4269} {"train_loss": -7.18569803237915, "global_step": 179329, "epoch": 4269} {"train_loss": -7.233485221862793, "global_step": 179330, "epoch": 4269} {"train_loss": -7.223806858062744, "global_step": 179331, "epoch": 4269} {"train_loss": -7.049588203430176, "global_step": 179332, "epoch": 4269} {"train_loss": -7.08538818359375, "global_step": 179333, "epoch": 4269} {"train_loss": -7.007997989654541, "global_step": 179334, "epoch": 4269} {"train_loss": -7.061624526977539, "global_step": 179335, "epoch": 4269} {"train_loss": -6.923318862915039, "global_step": 179336, "epoch": 4269} {"train_loss": -7.106936454772949, "global_step": 179337, "epoch": 4269} {"train_loss": -7.112582683563232, "global_step": 179338, "epoch": 4269} {"train_loss": -7.118996824537005, "global_step": 179339, "epoch": 4269, "val_loss": 80385.984375} {"train_loss": -6.949957847595215, "global_step": 179340, "epoch": 4270} {"train_loss": -7.016836166381836, "global_step": 179341, "epoch": 4270} {"train_loss": -6.988171577453613, "global_step": 179342, "epoch": 4270} {"train_loss": -7.123318195343018, "global_step": 179343, "epoch": 4270} {"train_loss": -6.894106864929199, "global_step": 179344, "epoch": 4270} {"train_loss": -7.153226852416992, "global_step": 179345, "epoch": 4270} {"train_loss": -7.07466459274292, "global_step": 179346, "epoch": 4270} {"train_loss": -7.036916255950928, "global_step": 179347, "epoch": 4270} {"train_loss": -7.145290374755859, "global_step": 179348, "epoch": 4270} {"train_loss": -6.981936931610107, "global_step": 179349, "epoch": 4270} {"train_loss": -6.999954700469971, "global_step": 179350, "epoch": 4270} {"train_loss": -7.181743621826172, "global_step": 179351, "epoch": 4270} {"train_loss": -7.024382591247559, "global_step": 179352, "epoch": 4270} {"train_loss": -6.991997718811035, "global_step": 179353, "epoch": 4270} {"train_loss": -7.066091060638428, "global_step": 179354, "epoch": 4270} {"train_loss": -7.156510353088379, "global_step": 179355, "epoch": 4270} {"train_loss": -7.07060432434082, "global_step": 179356, "epoch": 4270} {"train_loss": -7.149367332458496, "global_step": 179357, "epoch": 4270} {"train_loss": -7.124127388000488, "global_step": 179358, "epoch": 4270} {"train_loss": -7.120408058166504, "global_step": 179359, "epoch": 4270} {"train_loss": -7.0568671226501465, "global_step": 179360, "epoch": 4270} {"train_loss": -7.038175106048584, "global_step": 179361, "epoch": 4270} {"train_loss": -7.1438398361206055, "global_step": 179362, "epoch": 4270} {"train_loss": -6.992534160614014, "global_step": 179363, "epoch": 4270} {"train_loss": -7.017293930053711, "global_step": 179364, "epoch": 4270} {"train_loss": -7.017595291137695, "global_step": 179365, "epoch": 4270} {"train_loss": -7.077018737792969, "global_step": 179366, "epoch": 4270} {"train_loss": -7.05197811126709, "global_step": 179367, "epoch": 4270} {"train_loss": -7.173257827758789, "global_step": 179368, "epoch": 4270} {"train_loss": -7.12571907043457, "global_step": 179369, "epoch": 4270} {"train_loss": -7.135550022125244, "global_step": 179370, "epoch": 4270} {"train_loss": -7.139571666717529, "global_step": 179371, "epoch": 4270} {"train_loss": -7.096185684204102, "global_step": 179372, "epoch": 4270} {"train_loss": -7.265505790710449, "global_step": 179373, "epoch": 4270} {"train_loss": -7.101236820220947, "global_step": 179374, "epoch": 4270} {"train_loss": -7.138328552246094, "global_step": 179375, "epoch": 4270} {"train_loss": -7.035769462585449, "global_step": 179376, "epoch": 4270} {"train_loss": -7.155198097229004, "global_step": 179377, "epoch": 4270} {"train_loss": -7.235485076904297, "global_step": 179378, "epoch": 4270} {"train_loss": -7.163674354553223, "global_step": 179379, "epoch": 4270} {"train_loss": -7.014374732971191, "global_step": 179380, "epoch": 4270} {"train_loss": -7.0852758430299305, "global_step": 179381, "epoch": 4270, "val_loss": 80349.5546875} {"train_loss": -7.229865074157715, "global_step": 179382, "epoch": 4271} {"train_loss": -7.117287635803223, "global_step": 179383, "epoch": 4271} {"train_loss": -7.1669230461120605, "global_step": 179384, "epoch": 4271} {"train_loss": -7.152318954467773, "global_step": 179385, "epoch": 4271} {"train_loss": -7.155422687530518, "global_step": 179386, "epoch": 4271} {"train_loss": -7.152340888977051, "global_step": 179387, "epoch": 4271} {"train_loss": -7.065403938293457, "global_step": 179388, "epoch": 4271} {"train_loss": -7.118905544281006, "global_step": 179389, "epoch": 4271} {"train_loss": -7.209524154663086, "global_step": 179390, "epoch": 4271} {"train_loss": -7.279290199279785, "global_step": 179391, "epoch": 4271} {"train_loss": -7.155506134033203, "global_step": 179392, "epoch": 4271} {"train_loss": -7.278235912322998, "global_step": 179393, "epoch": 4271} {"train_loss": -7.08527135848999, "global_step": 179394, "epoch": 4271} {"train_loss": -7.187692642211914, "global_step": 179395, "epoch": 4271} {"train_loss": -7.142600059509277, "global_step": 179396, "epoch": 4271} {"train_loss": -7.206864356994629, "global_step": 179397, "epoch": 4271} {"train_loss": -7.178468704223633, "global_step": 179398, "epoch": 4271} {"train_loss": -7.105199337005615, "global_step": 179399, "epoch": 4271} {"train_loss": -7.0990447998046875, "global_step": 179400, "epoch": 4271} {"train_loss": -7.119701385498047, "global_step": 179401, "epoch": 4271} {"train_loss": -7.102051258087158, "global_step": 179402, "epoch": 4271} {"train_loss": -7.155896186828613, "global_step": 179403, "epoch": 4271} {"train_loss": -7.115157604217529, "global_step": 179404, "epoch": 4271} {"train_loss": -7.125753402709961, "global_step": 179405, "epoch": 4271} {"train_loss": -7.106858253479004, "global_step": 179406, "epoch": 4271} {"train_loss": -7.3071489334106445, "global_step": 179407, "epoch": 4271} {"train_loss": -7.1654815673828125, "global_step": 179408, "epoch": 4271} {"train_loss": -7.242759704589844, "global_step": 179409, "epoch": 4271} {"train_loss": -7.19393253326416, "global_step": 179410, "epoch": 4271} {"train_loss": -7.145361423492432, "global_step": 179411, "epoch": 4271} {"train_loss": -7.204473495483398, "global_step": 179412, "epoch": 4271} {"train_loss": -7.121270656585693, "global_step": 179413, "epoch": 4271} {"train_loss": -7.071084022521973, "global_step": 179414, "epoch": 4271} {"train_loss": -7.2089738845825195, "global_step": 179415, "epoch": 4271} {"train_loss": -7.10509729385376, "global_step": 179416, "epoch": 4271} {"train_loss": -7.167453765869141, "global_step": 179417, "epoch": 4271} {"train_loss": -7.264649868011475, "global_step": 179418, "epoch": 4271} {"train_loss": -7.187407493591309, "global_step": 179419, "epoch": 4271} {"train_loss": -7.033527851104736, "global_step": 179420, "epoch": 4271} {"train_loss": -6.9844770431518555, "global_step": 179421, "epoch": 4271} {"train_loss": -7.141268730163574, "global_step": 179422, "epoch": 4271} {"train_loss": -7.155333768753779, "global_step": 179423, "epoch": 4271, "val_loss": 80288.890625} {"train_loss": -7.071159362792969, "global_step": 179424, "epoch": 4272} {"train_loss": -7.117575645446777, "global_step": 179425, "epoch": 4272} {"train_loss": -6.937836647033691, "global_step": 179426, "epoch": 4272} {"train_loss": -7.109842300415039, "global_step": 179427, "epoch": 4272} {"train_loss": -7.049335479736328, "global_step": 179428, "epoch": 4272} {"train_loss": -6.945295333862305, "global_step": 179429, "epoch": 4272} {"train_loss": -6.96835470199585, "global_step": 179430, "epoch": 4272} {"train_loss": -7.112707138061523, "global_step": 179431, "epoch": 4272} {"train_loss": -6.989378929138184, "global_step": 179432, "epoch": 4272} {"train_loss": -6.972220420837402, "global_step": 179433, "epoch": 4272} {"train_loss": -7.130712509155273, "global_step": 179434, "epoch": 4272} {"train_loss": -7.127824783325195, "global_step": 179435, "epoch": 4272} {"train_loss": -7.061100959777832, "global_step": 179436, "epoch": 4272} {"train_loss": -7.120037078857422, "global_step": 179437, "epoch": 4272} {"train_loss": -7.218808174133301, "global_step": 179438, "epoch": 4272} {"train_loss": -7.2344255447387695, "global_step": 179439, "epoch": 4272} {"train_loss": -7.144484519958496, "global_step": 179440, "epoch": 4272} {"train_loss": -7.078042030334473, "global_step": 179441, "epoch": 4272} {"train_loss": -7.131342887878418, "global_step": 179442, "epoch": 4272} {"train_loss": -7.0759477615356445, "global_step": 179443, "epoch": 4272} {"train_loss": -7.173300743103027, "global_step": 179444, "epoch": 4272} {"train_loss": -7.129659652709961, "global_step": 179445, "epoch": 4272} {"train_loss": -7.064878940582275, "global_step": 179446, "epoch": 4272} {"train_loss": -7.133769989013672, "global_step": 179447, "epoch": 4272} {"train_loss": -7.162222385406494, "global_step": 179448, "epoch": 4272} {"train_loss": -7.154448509216309, "global_step": 179449, "epoch": 4272} {"train_loss": -7.134056091308594, "global_step": 179450, "epoch": 4272} {"train_loss": -7.1303300857543945, "global_step": 179451, "epoch": 4272} {"train_loss": -7.220936298370361, "global_step": 179452, "epoch": 4272} {"train_loss": -7.145169258117676, "global_step": 179453, "epoch": 4272} {"train_loss": -7.086304187774658, "global_step": 179454, "epoch": 4272} {"train_loss": -7.149755954742432, "global_step": 179455, "epoch": 4272} {"train_loss": -7.159462928771973, "global_step": 179456, "epoch": 4272} {"train_loss": -6.9494547843933105, "global_step": 179457, "epoch": 4272} {"train_loss": -6.921034812927246, "global_step": 179458, "epoch": 4272} {"train_loss": -7.083413124084473, "global_step": 179459, "epoch": 4272} {"train_loss": -7.107061862945557, "global_step": 179460, "epoch": 4272} {"train_loss": -7.0426130294799805, "global_step": 179461, "epoch": 4272} {"train_loss": -7.106688976287842, "global_step": 179462, "epoch": 4272} {"train_loss": -7.142290115356445, "global_step": 179463, "epoch": 4272} {"train_loss": -7.064321517944336, "global_step": 179464, "epoch": 4272} {"train_loss": -7.09305495307559, "global_step": 179465, "epoch": 4272, "val_loss": 80496.109375} {"train_loss": -7.090567588806152, "global_step": 179466, "epoch": 4273} {"train_loss": -7.033680438995361, "global_step": 179467, "epoch": 4273} {"train_loss": -7.012956142425537, "global_step": 179468, "epoch": 4273} {"train_loss": -7.071978569030762, "global_step": 179469, "epoch": 4273} {"train_loss": -6.998053073883057, "global_step": 179470, "epoch": 4273} {"train_loss": -7.050013542175293, "global_step": 179471, "epoch": 4273} {"train_loss": -7.151700019836426, "global_step": 179472, "epoch": 4273} {"train_loss": -7.031198501586914, "global_step": 179473, "epoch": 4273} {"train_loss": -7.20943546295166, "global_step": 179474, "epoch": 4273} {"train_loss": -7.0958733558654785, "global_step": 179475, "epoch": 4273} {"train_loss": -7.0624680519104, "global_step": 179476, "epoch": 4273} {"train_loss": -7.126087188720703, "global_step": 179477, "epoch": 4273} {"train_loss": -7.0666680335998535, "global_step": 179478, "epoch": 4273} {"train_loss": -7.130489349365234, "global_step": 179479, "epoch": 4273} {"train_loss": -6.986851692199707, "global_step": 179480, "epoch": 4273} {"train_loss": -7.1845598220825195, "global_step": 179481, "epoch": 4273} {"train_loss": -7.003013610839844, "global_step": 179482, "epoch": 4273} {"train_loss": -7.107753753662109, "global_step": 179483, "epoch": 4273} {"train_loss": -7.144942283630371, "global_step": 179484, "epoch": 4273} {"train_loss": -6.868008136749268, "global_step": 179485, "epoch": 4273} {"train_loss": -7.173007011413574, "global_step": 179486, "epoch": 4273} {"train_loss": -7.010040283203125, "global_step": 179487, "epoch": 4273} {"train_loss": -7.138027191162109, "global_step": 179488, "epoch": 4273} {"train_loss": -7.146813869476318, "global_step": 179489, "epoch": 4273} {"train_loss": -7.052558422088623, "global_step": 179490, "epoch": 4273} {"train_loss": -7.08373498916626, "global_step": 179491, "epoch": 4273} {"train_loss": -7.020611763000488, "global_step": 179492, "epoch": 4273} {"train_loss": -7.068192481994629, "global_step": 179493, "epoch": 4273} {"train_loss": -7.080699443817139, "global_step": 179494, "epoch": 4273} {"train_loss": -7.203983306884766, "global_step": 179495, "epoch": 4273} {"train_loss": -7.186054706573486, "global_step": 179496, "epoch": 4273} {"train_loss": -7.051968574523926, "global_step": 179497, "epoch": 4273} {"train_loss": -7.164991855621338, "global_step": 179498, "epoch": 4273} {"train_loss": -7.110438346862793, "global_step": 179499, "epoch": 4273} {"train_loss": -7.1320295333862305, "global_step": 179500, "epoch": 4273} {"train_loss": -7.166133880615234, "global_step": 179501, "epoch": 4273} {"train_loss": -7.068650245666504, "global_step": 179502, "epoch": 4273} {"train_loss": -7.225241661071777, "global_step": 179503, "epoch": 4273} {"train_loss": -7.129335403442383, "global_step": 179504, "epoch": 4273} {"train_loss": -7.210568428039551, "global_step": 179505, "epoch": 4273} {"train_loss": -7.207495212554932, "global_step": 179506, "epoch": 4273} {"train_loss": -7.098384403047108, "global_step": 179507, "epoch": 4273, "val_loss": 80390.859375} {"train_loss": -7.195255756378174, "global_step": 179508, "epoch": 4274} {"train_loss": -7.211655616760254, "global_step": 179509, "epoch": 4274} {"train_loss": -7.2009663581848145, "global_step": 179510, "epoch": 4274} {"train_loss": -7.145218372344971, "global_step": 179511, "epoch": 4274} {"train_loss": -7.169651031494141, "global_step": 179512, "epoch": 4274} {"train_loss": -7.132883071899414, "global_step": 179513, "epoch": 4274} {"train_loss": -7.095675945281982, "global_step": 179514, "epoch": 4274} {"train_loss": -7.214184761047363, "global_step": 179515, "epoch": 4274} {"train_loss": -7.0980072021484375, "global_step": 179516, "epoch": 4274} {"train_loss": -7.264605522155762, "global_step": 179517, "epoch": 4274} {"train_loss": -7.09992790222168, "global_step": 179518, "epoch": 4274} {"train_loss": -7.220149040222168, "global_step": 179519, "epoch": 4274} {"train_loss": -7.167294502258301, "global_step": 179520, "epoch": 4274} {"train_loss": -7.099030494689941, "global_step": 179521, "epoch": 4274} {"train_loss": -7.222270488739014, "global_step": 179522, "epoch": 4274} {"train_loss": -7.154959201812744, "global_step": 179523, "epoch": 4274} {"train_loss": -7.11473274230957, "global_step": 179524, "epoch": 4274} {"train_loss": -7.212260723114014, "global_step": 179525, "epoch": 4274} {"train_loss": -7.318041801452637, "global_step": 179526, "epoch": 4274} {"train_loss": -7.12214469909668, "global_step": 179527, "epoch": 4274} {"train_loss": -7.087076187133789, "global_step": 179528, "epoch": 4274} {"train_loss": -7.154445648193359, "global_step": 179529, "epoch": 4274} {"train_loss": -7.113107204437256, "global_step": 179530, "epoch": 4274} {"train_loss": -7.183618545532227, "global_step": 179531, "epoch": 4274} {"train_loss": -7.141587734222412, "global_step": 179532, "epoch": 4274} {"train_loss": -7.131348609924316, "global_step": 179533, "epoch": 4274} {"train_loss": -7.2176947593688965, "global_step": 179534, "epoch": 4274} {"train_loss": -7.203958511352539, "global_step": 179535, "epoch": 4274} {"train_loss": -7.101821422576904, "global_step": 179536, "epoch": 4274} {"train_loss": -7.122203826904297, "global_step": 179537, "epoch": 4274} {"train_loss": -7.204649925231934, "global_step": 179538, "epoch": 4274} {"train_loss": -7.084908962249756, "global_step": 179539, "epoch": 4274} {"train_loss": -7.157689094543457, "global_step": 179540, "epoch": 4274} {"train_loss": -7.089650630950928, "global_step": 179541, "epoch": 4274} {"train_loss": -7.115514755249023, "global_step": 179542, "epoch": 4274} {"train_loss": -6.941936016082764, "global_step": 179543, "epoch": 4274} {"train_loss": -7.205592632293701, "global_step": 179544, "epoch": 4274} {"train_loss": -7.126897811889648, "global_step": 179545, "epoch": 4274} {"train_loss": -6.985415458679199, "global_step": 179546, "epoch": 4274} {"train_loss": -7.044590950012207, "global_step": 179547, "epoch": 4274} {"train_loss": -7.131635665893555, "global_step": 179548, "epoch": 4274} {"train_loss": -7.141951367968605, "global_step": 179549, "epoch": 4274, "val_loss": 80501.71875} {"train_loss": -7.17022705078125, "global_step": 179550, "epoch": 4275} {"train_loss": -6.971775054931641, "global_step": 179551, "epoch": 4275} {"train_loss": -7.033198356628418, "global_step": 179552, "epoch": 4275} {"train_loss": -7.107688903808594, "global_step": 179553, "epoch": 4275} {"train_loss": -7.067637920379639, "global_step": 179554, "epoch": 4275} {"train_loss": -7.052326679229736, "global_step": 179555, "epoch": 4275} {"train_loss": -7.101461410522461, "global_step": 179556, "epoch": 4275} {"train_loss": -7.162233829498291, "global_step": 179557, "epoch": 4275} {"train_loss": -7.072661876678467, "global_step": 179558, "epoch": 4275} {"train_loss": -7.14132833480835, "global_step": 179559, "epoch": 4275} {"train_loss": -7.053091049194336, "global_step": 179560, "epoch": 4275} {"train_loss": -7.022876262664795, "global_step": 179561, "epoch": 4275} {"train_loss": -7.130366325378418, "global_step": 179562, "epoch": 4275} {"train_loss": -7.065123081207275, "global_step": 179563, "epoch": 4275} {"train_loss": -7.1357574462890625, "global_step": 179564, "epoch": 4275} {"train_loss": -7.201286792755127, "global_step": 179565, "epoch": 4275} {"train_loss": -7.122996807098389, "global_step": 179566, "epoch": 4275} {"train_loss": -7.001992702484131, "global_step": 179567, "epoch": 4275} {"train_loss": -6.954232215881348, "global_step": 179568, "epoch": 4275} {"train_loss": -7.1419677734375, "global_step": 179569, "epoch": 4275} {"train_loss": -6.975863933563232, "global_step": 179570, "epoch": 4275} {"train_loss": -6.804291725158691, "global_step": 179571, "epoch": 4275} {"train_loss": -6.98440408706665, "global_step": 179572, "epoch": 4275} {"train_loss": -6.8249664306640625, "global_step": 179573, "epoch": 4275} {"train_loss": -7.151213645935059, "global_step": 179574, "epoch": 4275} {"train_loss": -7.1598687171936035, "global_step": 179575, "epoch": 4275} {"train_loss": -7.0361409187316895, "global_step": 179576, "epoch": 4275} {"train_loss": -7.004026412963867, "global_step": 179577, "epoch": 4275} {"train_loss": -7.106711387634277, "global_step": 179578, "epoch": 4275} {"train_loss": -7.1885247230529785, "global_step": 179579, "epoch": 4275} {"train_loss": -7.193861484527588, "global_step": 179580, "epoch": 4275} {"train_loss": -7.100068092346191, "global_step": 179581, "epoch": 4275} {"train_loss": -7.28150749206543, "global_step": 179582, "epoch": 4275} {"train_loss": -7.100752353668213, "global_step": 179583, "epoch": 4275} {"train_loss": -6.996122360229492, "global_step": 179584, "epoch": 4275} {"train_loss": -7.226169586181641, "global_step": 179585, "epoch": 4275} {"train_loss": -7.1454339027404785, "global_step": 179586, "epoch": 4275} {"train_loss": -7.147320747375488, "global_step": 179587, "epoch": 4275} {"train_loss": -7.208217620849609, "global_step": 179588, "epoch": 4275} {"train_loss": -6.928195476531982, "global_step": 179589, "epoch": 4275} {"train_loss": -7.041454792022705, "global_step": 179590, "epoch": 4275} {"train_loss": -7.0825656822749545, "global_step": 179591, "epoch": 4275, "val_loss": 80349.9609375} {"train_loss": -7.037843704223633, "global_step": 179592, "epoch": 4276} {"train_loss": -6.987253189086914, "global_step": 179593, "epoch": 4276} {"train_loss": -6.993730545043945, "global_step": 179594, "epoch": 4276} {"train_loss": -6.947214603424072, "global_step": 179595, "epoch": 4276} {"train_loss": -6.989162921905518, "global_step": 179596, "epoch": 4276} {"train_loss": -7.043543815612793, "global_step": 179597, "epoch": 4276} {"train_loss": -7.0769195556640625, "global_step": 179598, "epoch": 4276} {"train_loss": -7.070141792297363, "global_step": 179599, "epoch": 4276} {"train_loss": -7.0458269119262695, "global_step": 179600, "epoch": 4276} {"train_loss": -7.12776517868042, "global_step": 179601, "epoch": 4276} {"train_loss": -7.05078125, "global_step": 179602, "epoch": 4276} {"train_loss": -7.112583160400391, "global_step": 179603, "epoch": 4276} {"train_loss": -7.325369834899902, "global_step": 179604, "epoch": 4276} {"train_loss": -6.910038471221924, "global_step": 179605, "epoch": 4276} {"train_loss": -7.235677242279053, "global_step": 179606, "epoch": 4276} {"train_loss": -7.109267234802246, "global_step": 179607, "epoch": 4276} {"train_loss": -7.132345199584961, "global_step": 179608, "epoch": 4276} {"train_loss": -7.192054748535156, "global_step": 179609, "epoch": 4276} {"train_loss": -7.180290222167969, "global_step": 179610, "epoch": 4276} {"train_loss": -7.000727653503418, "global_step": 179611, "epoch": 4276} {"train_loss": -7.019257545471191, "global_step": 179612, "epoch": 4276} {"train_loss": -7.070833206176758, "global_step": 179613, "epoch": 4276} {"train_loss": -7.050699710845947, "global_step": 179614, "epoch": 4276} {"train_loss": -7.06655216217041, "global_step": 179615, "epoch": 4276} {"train_loss": -7.135014533996582, "global_step": 179616, "epoch": 4276} {"train_loss": -7.050872802734375, "global_step": 179617, "epoch": 4276} {"train_loss": -6.988809585571289, "global_step": 179618, "epoch": 4276} {"train_loss": -7.010737419128418, "global_step": 179619, "epoch": 4276} {"train_loss": -7.083630084991455, "global_step": 179620, "epoch": 4276} {"train_loss": -7.154348373413086, "global_step": 179621, "epoch": 4276} {"train_loss": -6.983250617980957, "global_step": 179622, "epoch": 4276} {"train_loss": -6.981175422668457, "global_step": 179623, "epoch": 4276} {"train_loss": -7.0220417976379395, "global_step": 179624, "epoch": 4276} {"train_loss": -7.194768905639648, "global_step": 179625, "epoch": 4276} {"train_loss": -7.106952667236328, "global_step": 179626, "epoch": 4276} {"train_loss": -7.1545515060424805, "global_step": 179627, "epoch": 4276} {"train_loss": -7.080611705780029, "global_step": 179628, "epoch": 4276} {"train_loss": -7.052606582641602, "global_step": 179629, "epoch": 4276} {"train_loss": -7.058633804321289, "global_step": 179630, "epoch": 4276} {"train_loss": -7.1690521240234375, "global_step": 179631, "epoch": 4276} {"train_loss": -7.039124011993408, "global_step": 179632, "epoch": 4276} {"train_loss": -7.0728533154442195, "global_step": 179633, "epoch": 4276, "val_loss": 80714.6640625} {"train_loss": -7.084267616271973, "global_step": 179634, "epoch": 4277} {"train_loss": -7.053016662597656, "global_step": 179635, "epoch": 4277} {"train_loss": -7.057415962219238, "global_step": 179636, "epoch": 4277} {"train_loss": -6.826714992523193, "global_step": 179637, "epoch": 4277} {"train_loss": -7.096070289611816, "global_step": 179638, "epoch": 4277} {"train_loss": -6.9594621658325195, "global_step": 179639, "epoch": 4277} {"train_loss": -6.90750789642334, "global_step": 179640, "epoch": 4277} {"train_loss": -7.0507707595825195, "global_step": 179641, "epoch": 4277} {"train_loss": -6.8547163009643555, "global_step": 179642, "epoch": 4277} {"train_loss": -7.020416259765625, "global_step": 179643, "epoch": 4277} {"train_loss": -6.84345817565918, "global_step": 179644, "epoch": 4277} {"train_loss": -7.0151214599609375, "global_step": 179645, "epoch": 4277} {"train_loss": -6.975822448730469, "global_step": 179646, "epoch": 4277} {"train_loss": -7.070708274841309, "global_step": 179647, "epoch": 4277} {"train_loss": -7.139895439147949, "global_step": 179648, "epoch": 4277} {"train_loss": -6.985586643218994, "global_step": 179649, "epoch": 4277} {"train_loss": -7.043292045593262, "global_step": 179650, "epoch": 4277} {"train_loss": -7.172965049743652, "global_step": 179651, "epoch": 4277} {"train_loss": -7.121773719787598, "global_step": 179652, "epoch": 4277} {"train_loss": -7.080641746520996, "global_step": 179653, "epoch": 4277} {"train_loss": -7.104403972625732, "global_step": 179654, "epoch": 4277} {"train_loss": -7.059111595153809, "global_step": 179655, "epoch": 4277} {"train_loss": -7.135034561157227, "global_step": 179656, "epoch": 4277} {"train_loss": -7.180856704711914, "global_step": 179657, "epoch": 4277} {"train_loss": -7.121743202209473, "global_step": 179658, "epoch": 4277} {"train_loss": -7.110533714294434, "global_step": 179659, "epoch": 4277} {"train_loss": -7.003471374511719, "global_step": 179660, "epoch": 4277} {"train_loss": -7.26023006439209, "global_step": 179661, "epoch": 4277} {"train_loss": -7.117270469665527, "global_step": 179662, "epoch": 4277} {"train_loss": -7.235998153686523, "global_step": 179663, "epoch": 4277} {"train_loss": -7.12084436416626, "global_step": 179664, "epoch": 4277} {"train_loss": -7.044759750366211, "global_step": 179665, "epoch": 4277} {"train_loss": -7.09340763092041, "global_step": 179666, "epoch": 4277} {"train_loss": -7.10366678237915, "global_step": 179667, "epoch": 4277} {"train_loss": -6.97562313079834, "global_step": 179668, "epoch": 4277} {"train_loss": -7.181504249572754, "global_step": 179669, "epoch": 4277} {"train_loss": -7.006154537200928, "global_step": 179670, "epoch": 4277} {"train_loss": -7.030455112457275, "global_step": 179671, "epoch": 4277} {"train_loss": -7.017496109008789, "global_step": 179672, "epoch": 4277} {"train_loss": -7.047373294830322, "global_step": 179673, "epoch": 4277} {"train_loss": -7.155078887939453, "global_step": 179674, "epoch": 4277} {"train_loss": -7.058396396182832, "global_step": 179675, "epoch": 4277, "val_loss": 80158.2109375} {"train_loss": -7.052253723144531, "global_step": 179676, "epoch": 4278} {"train_loss": -7.030962944030762, "global_step": 179677, "epoch": 4278} {"train_loss": -6.914985179901123, "global_step": 179678, "epoch": 4278} {"train_loss": -7.009233474731445, "global_step": 179679, "epoch": 4278} {"train_loss": -7.067363739013672, "global_step": 179680, "epoch": 4278} {"train_loss": -7.039407730102539, "global_step": 179681, "epoch": 4278} {"train_loss": -6.94351863861084, "global_step": 179682, "epoch": 4278} {"train_loss": -7.203925132751465, "global_step": 179683, "epoch": 4278} {"train_loss": -7.160058975219727, "global_step": 179684, "epoch": 4278} {"train_loss": -7.065007209777832, "global_step": 179685, "epoch": 4278} {"train_loss": -7.100123405456543, "global_step": 179686, "epoch": 4278} {"train_loss": -7.110762119293213, "global_step": 179687, "epoch": 4278} {"train_loss": -7.089322566986084, "global_step": 179688, "epoch": 4278} {"train_loss": -7.150671005249023, "global_step": 179689, "epoch": 4278} {"train_loss": -7.1060991287231445, "global_step": 179690, "epoch": 4278} {"train_loss": -7.084048748016357, "global_step": 179691, "epoch": 4278} {"train_loss": -7.069979667663574, "global_step": 179692, "epoch": 4278} {"train_loss": -7.061755180358887, "global_step": 179693, "epoch": 4278} {"train_loss": -7.1270647048950195, "global_step": 179694, "epoch": 4278} {"train_loss": -7.140878677368164, "global_step": 179695, "epoch": 4278} {"train_loss": -7.062276363372803, "global_step": 179696, "epoch": 4278} {"train_loss": -7.119462013244629, "global_step": 179697, "epoch": 4278} {"train_loss": -7.026541709899902, "global_step": 179698, "epoch": 4278} {"train_loss": -7.066062927246094, "global_step": 179699, "epoch": 4278} {"train_loss": -7.126503944396973, "global_step": 179700, "epoch": 4278} {"train_loss": -7.169934272766113, "global_step": 179701, "epoch": 4278} {"train_loss": -6.988883972167969, "global_step": 179702, "epoch": 4278} {"train_loss": -7.013484954833984, "global_step": 179703, "epoch": 4278} {"train_loss": -7.194380283355713, "global_step": 179704, "epoch": 4278} {"train_loss": -7.0148820877075195, "global_step": 179705, "epoch": 4278} {"train_loss": -7.0948262214660645, "global_step": 179706, "epoch": 4278} {"train_loss": -7.129508972167969, "global_step": 179707, "epoch": 4278} {"train_loss": -7.225729942321777, "global_step": 179708, "epoch": 4278} {"train_loss": -7.17833137512207, "global_step": 179709, "epoch": 4278} {"train_loss": -7.120257377624512, "global_step": 179710, "epoch": 4278} {"train_loss": -7.174740791320801, "global_step": 179711, "epoch": 4278} {"train_loss": -7.112290859222412, "global_step": 179712, "epoch": 4278} {"train_loss": -7.066283226013184, "global_step": 179713, "epoch": 4278} {"train_loss": -7.046110153198242, "global_step": 179714, "epoch": 4278} {"train_loss": -7.282073020935059, "global_step": 179715, "epoch": 4278} {"train_loss": -7.08006477355957, "global_step": 179716, "epoch": 4278} {"train_loss": -7.096875099908738, "global_step": 179717, "epoch": 4278, "val_loss": 80395.9375} {"train_loss": -7.098396301269531, "global_step": 179718, "epoch": 4279} {"train_loss": -7.097968101501465, "global_step": 179719, "epoch": 4279} {"train_loss": -7.186061382293701, "global_step": 179720, "epoch": 4279} {"train_loss": -7.140750885009766, "global_step": 179721, "epoch": 4279} {"train_loss": -7.059730529785156, "global_step": 179722, "epoch": 4279} {"train_loss": -7.023407936096191, "global_step": 179723, "epoch": 4279} {"train_loss": -7.233857154846191, "global_step": 179724, "epoch": 4279} {"train_loss": -7.094052314758301, "global_step": 179725, "epoch": 4279} {"train_loss": -7.191394805908203, "global_step": 179726, "epoch": 4279} {"train_loss": -7.106396675109863, "global_step": 179727, "epoch": 4279} {"train_loss": -7.091430187225342, "global_step": 179728, "epoch": 4279} {"train_loss": -7.247265815734863, "global_step": 179729, "epoch": 4279} {"train_loss": -7.105830192565918, "global_step": 179730, "epoch": 4279} {"train_loss": -7.256787300109863, "global_step": 179731, "epoch": 4279} {"train_loss": -7.016498565673828, "global_step": 179732, "epoch": 4279} {"train_loss": -7.0761332511901855, "global_step": 179733, "epoch": 4279} {"train_loss": -7.15700626373291, "global_step": 179734, "epoch": 4279} {"train_loss": -7.157263278961182, "global_step": 179735, "epoch": 4279} {"train_loss": -7.153789043426514, "global_step": 179736, "epoch": 4279} {"train_loss": -7.180264472961426, "global_step": 179737, "epoch": 4279} {"train_loss": -7.2245774269104, "global_step": 179738, "epoch": 4279} {"train_loss": -7.1991119384765625, "global_step": 179739, "epoch": 4279} {"train_loss": -7.188204765319824, "global_step": 179740, "epoch": 4279} {"train_loss": -7.192895412445068, "global_step": 179741, "epoch": 4279} {"train_loss": -7.03203010559082, "global_step": 179742, "epoch": 4279} {"train_loss": -7.2127366065979, "global_step": 179743, "epoch": 4279} {"train_loss": -7.071486949920654, "global_step": 179744, "epoch": 4279} {"train_loss": -7.046698093414307, "global_step": 179745, "epoch": 4279} {"train_loss": -7.092367172241211, "global_step": 179746, "epoch": 4279} {"train_loss": -7.196918487548828, "global_step": 179747, "epoch": 4279} {"train_loss": -7.085394382476807, "global_step": 179748, "epoch": 4279} {"train_loss": -7.086360454559326, "global_step": 179749, "epoch": 4279} {"train_loss": -7.1628947257995605, "global_step": 179750, "epoch": 4279} {"train_loss": -7.277205467224121, "global_step": 179751, "epoch": 4279} {"train_loss": -7.210670471191406, "global_step": 179752, "epoch": 4279} {"train_loss": -7.169013500213623, "global_step": 179753, "epoch": 4279} {"train_loss": -7.174628257751465, "global_step": 179754, "epoch": 4279} {"train_loss": -7.181291103363037, "global_step": 179755, "epoch": 4279} {"train_loss": -7.109363555908203, "global_step": 179756, "epoch": 4279} {"train_loss": -7.17404842376709, "global_step": 179757, "epoch": 4279} {"train_loss": -7.073359966278076, "global_step": 179758, "epoch": 4279} {"train_loss": -7.14300012588501, "global_step": 179759, "epoch": 4279, "val_loss": 80497.1484375} {"train_loss": -7.047732353210449, "global_step": 179760, "epoch": 4280} {"train_loss": -7.100284576416016, "global_step": 179761, "epoch": 4280} {"train_loss": -7.012672424316406, "global_step": 179762, "epoch": 4280} {"train_loss": -7.131559371948242, "global_step": 179763, "epoch": 4280} {"train_loss": -7.121884346008301, "global_step": 179764, "epoch": 4280} {"train_loss": -7.10529899597168, "global_step": 179765, "epoch": 4280} {"train_loss": -7.222148895263672, "global_step": 179766, "epoch": 4280} {"train_loss": -7.263344764709473, "global_step": 179767, "epoch": 4280} {"train_loss": -7.0796427726745605, "global_step": 179768, "epoch": 4280} {"train_loss": -7.104255199432373, "global_step": 179769, "epoch": 4280} {"train_loss": -7.259613513946533, "global_step": 179770, "epoch": 4280} {"train_loss": -6.973087310791016, "global_step": 179771, "epoch": 4280} {"train_loss": -7.011933326721191, "global_step": 179772, "epoch": 4280} {"train_loss": -7.105175018310547, "global_step": 179773, "epoch": 4280} {"train_loss": -7.135318756103516, "global_step": 179774, "epoch": 4280} {"train_loss": -6.994882583618164, "global_step": 179775, "epoch": 4280} {"train_loss": -7.144289493560791, "global_step": 179776, "epoch": 4280} {"train_loss": -6.807826042175293, "global_step": 179777, "epoch": 4280} {"train_loss": -7.113574981689453, "global_step": 179778, "epoch": 4280} {"train_loss": -7.081476211547852, "global_step": 179779, "epoch": 4280} {"train_loss": -6.910451889038086, "global_step": 179780, "epoch": 4280} {"train_loss": -7.041797637939453, "global_step": 179781, "epoch": 4280} {"train_loss": -6.813004493713379, "global_step": 179782, "epoch": 4280} {"train_loss": -6.9707136154174805, "global_step": 179783, "epoch": 4280} {"train_loss": -6.933859825134277, "global_step": 179784, "epoch": 4280} {"train_loss": -7.102388381958008, "global_step": 179785, "epoch": 4280} {"train_loss": -7.108748435974121, "global_step": 179786, "epoch": 4280} {"train_loss": -6.974271774291992, "global_step": 179787, "epoch": 4280} {"train_loss": -7.155844211578369, "global_step": 179788, "epoch": 4280} {"train_loss": -6.977530479431152, "global_step": 179789, "epoch": 4280} {"train_loss": -7.099799156188965, "global_step": 179790, "epoch": 4280} {"train_loss": -7.043498992919922, "global_step": 179791, "epoch": 4280} {"train_loss": -7.106882095336914, "global_step": 179792, "epoch": 4280} {"train_loss": -7.10679817199707, "global_step": 179793, "epoch": 4280} {"train_loss": -6.986915111541748, "global_step": 179794, "epoch": 4280} {"train_loss": -7.163933753967285, "global_step": 179795, "epoch": 4280} {"train_loss": -7.23432731628418, "global_step": 179796, "epoch": 4280} {"train_loss": -7.079418182373047, "global_step": 179797, "epoch": 4280} {"train_loss": -7.072703838348389, "global_step": 179798, "epoch": 4280} {"train_loss": -7.0960798263549805, "global_step": 179799, "epoch": 4280} {"train_loss": -7.054485321044922, "global_step": 179800, "epoch": 4280} {"train_loss": -7.072692314783732, "global_step": 179801, "epoch": 4280, "val_loss": 80109.6640625} {"train_loss": -6.977439880371094, "global_step": 179802, "epoch": 4281} {"train_loss": -7.0392045974731445, "global_step": 179803, "epoch": 4281} {"train_loss": -7.112587928771973, "global_step": 179804, "epoch": 4281} {"train_loss": -7.100661754608154, "global_step": 179805, "epoch": 4281} {"train_loss": -7.039775371551514, "global_step": 179806, "epoch": 4281} {"train_loss": -7.110129356384277, "global_step": 179807, "epoch": 4281} {"train_loss": -7.0802226066589355, "global_step": 179808, "epoch": 4281} {"train_loss": -6.971696853637695, "global_step": 179809, "epoch": 4281} {"train_loss": -7.099523544311523, "global_step": 179810, "epoch": 4281} {"train_loss": -6.974907875061035, "global_step": 179811, "epoch": 4281} {"train_loss": -7.078222274780273, "global_step": 179812, "epoch": 4281} {"train_loss": -7.056169509887695, "global_step": 179813, "epoch": 4281} {"train_loss": -7.040850639343262, "global_step": 179814, "epoch": 4281} {"train_loss": -7.151187896728516, "global_step": 179815, "epoch": 4281} {"train_loss": -7.002257823944092, "global_step": 179816, "epoch": 4281} {"train_loss": -7.06483268737793, "global_step": 179817, "epoch": 4281} {"train_loss": -7.032283782958984, "global_step": 179818, "epoch": 4281} {"train_loss": -7.10638427734375, "global_step": 179819, "epoch": 4281} {"train_loss": -7.120325088500977, "global_step": 179820, "epoch": 4281} {"train_loss": -7.042738914489746, "global_step": 179821, "epoch": 4281} {"train_loss": -7.0724687576293945, "global_step": 179822, "epoch": 4281} {"train_loss": -7.165175914764404, "global_step": 179823, "epoch": 4281} {"train_loss": -7.140468597412109, "global_step": 179824, "epoch": 4281} {"train_loss": -7.1500654220581055, "global_step": 179825, "epoch": 4281} {"train_loss": -7.231756210327148, "global_step": 179826, "epoch": 4281} {"train_loss": -7.263075828552246, "global_step": 179827, "epoch": 4281} {"train_loss": -7.133429527282715, "global_step": 179828, "epoch": 4281} {"train_loss": -7.183444499969482, "global_step": 179829, "epoch": 4281} {"train_loss": -7.186193466186523, "global_step": 179830, "epoch": 4281} {"train_loss": -7.235476016998291, "global_step": 179831, "epoch": 4281} {"train_loss": -7.109186172485352, "global_step": 179832, "epoch": 4281} {"train_loss": -7.173765182495117, "global_step": 179833, "epoch": 4281} {"train_loss": -7.227172374725342, "global_step": 179834, "epoch": 4281} {"train_loss": -7.128620624542236, "global_step": 179835, "epoch": 4281} {"train_loss": -7.090786933898926, "global_step": 179836, "epoch": 4281} {"train_loss": -7.186404228210449, "global_step": 179837, "epoch": 4281} {"train_loss": -7.204146862030029, "global_step": 179838, "epoch": 4281} {"train_loss": -7.186611175537109, "global_step": 179839, "epoch": 4281} {"train_loss": -7.108682632446289, "global_step": 179840, "epoch": 4281} {"train_loss": -7.066171646118164, "global_step": 179841, "epoch": 4281} {"train_loss": -7.12749719619751, "global_step": 179842, "epoch": 4281} {"train_loss": -7.111896832784017, "global_step": 179843, "epoch": 4281, "val_loss": 80345.0625} {"train_loss": -7.242356300354004, "global_step": 179844, "epoch": 4282} {"train_loss": -7.050544738769531, "global_step": 179845, "epoch": 4282} {"train_loss": -7.164670944213867, "global_step": 179846, "epoch": 4282} {"train_loss": -7.109631061553955, "global_step": 179847, "epoch": 4282} {"train_loss": -7.029014587402344, "global_step": 179848, "epoch": 4282} {"train_loss": -7.094160556793213, "global_step": 179849, "epoch": 4282} {"train_loss": -7.243259429931641, "global_step": 179850, "epoch": 4282} {"train_loss": -7.121234893798828, "global_step": 179851, "epoch": 4282} {"train_loss": -7.109033107757568, "global_step": 179852, "epoch": 4282} {"train_loss": -7.125576019287109, "global_step": 179853, "epoch": 4282} {"train_loss": -7.183454990386963, "global_step": 179854, "epoch": 4282} {"train_loss": -7.189798355102539, "global_step": 179855, "epoch": 4282} {"train_loss": -7.1736063957214355, "global_step": 179856, "epoch": 4282} {"train_loss": -7.204015254974365, "global_step": 179857, "epoch": 4282} {"train_loss": -7.128566741943359, "global_step": 179858, "epoch": 4282} {"train_loss": -7.072495460510254, "global_step": 179859, "epoch": 4282} {"train_loss": -7.16106653213501, "global_step": 179860, "epoch": 4282} {"train_loss": -7.155808925628662, "global_step": 179861, "epoch": 4282} {"train_loss": -7.13439416885376, "global_step": 179862, "epoch": 4282} {"train_loss": -7.092536926269531, "global_step": 179863, "epoch": 4282} {"train_loss": -7.100941181182861, "global_step": 179864, "epoch": 4282} {"train_loss": -7.017541408538818, "global_step": 179865, "epoch": 4282} {"train_loss": -7.137333869934082, "global_step": 179866, "epoch": 4282} {"train_loss": -7.2212233543396, "global_step": 179867, "epoch": 4282} {"train_loss": -7.124732971191406, "global_step": 179868, "epoch": 4282} {"train_loss": -7.1277875900268555, "global_step": 179869, "epoch": 4282} {"train_loss": -7.192137241363525, "global_step": 179870, "epoch": 4282} {"train_loss": -7.1872735023498535, "global_step": 179871, "epoch": 4282} {"train_loss": -7.216841697692871, "global_step": 179872, "epoch": 4282} {"train_loss": -7.13393497467041, "global_step": 179873, "epoch": 4282} {"train_loss": -7.174127101898193, "global_step": 179874, "epoch": 4282} {"train_loss": -7.139926910400391, "global_step": 179875, "epoch": 4282} {"train_loss": -7.1110944747924805, "global_step": 179876, "epoch": 4282} {"train_loss": -7.147353172302246, "global_step": 179877, "epoch": 4282} {"train_loss": -7.233212471008301, "global_step": 179878, "epoch": 4282} {"train_loss": -7.103338718414307, "global_step": 179879, "epoch": 4282} {"train_loss": -7.10055685043335, "global_step": 179880, "epoch": 4282} {"train_loss": -7.049845218658447, "global_step": 179881, "epoch": 4282} {"train_loss": -7.144556045532227, "global_step": 179882, "epoch": 4282} {"train_loss": -7.095651626586914, "global_step": 179883, "epoch": 4282} {"train_loss": -7.0244221687316895, "global_step": 179884, "epoch": 4282} {"train_loss": -7.135024581636701, "global_step": 179885, "epoch": 4282, "val_loss": 80418.578125} {"train_loss": -7.187357425689697, "global_step": 179886, "epoch": 4283} {"train_loss": -7.114587306976318, "global_step": 179887, "epoch": 4283} {"train_loss": -7.1055169105529785, "global_step": 179888, "epoch": 4283} {"train_loss": -7.133829116821289, "global_step": 179889, "epoch": 4283} {"train_loss": -7.033400058746338, "global_step": 179890, "epoch": 4283} {"train_loss": -6.959197998046875, "global_step": 179891, "epoch": 4283} {"train_loss": -7.0944600105285645, "global_step": 179892, "epoch": 4283} {"train_loss": -7.076991081237793, "global_step": 179893, "epoch": 4283} {"train_loss": -7.229175567626953, "global_step": 179894, "epoch": 4283} {"train_loss": -7.1695942878723145, "global_step": 179895, "epoch": 4283} {"train_loss": -7.071160316467285, "global_step": 179896, "epoch": 4283} {"train_loss": -7.032111644744873, "global_step": 179897, "epoch": 4283} {"train_loss": -7.215869426727295, "global_step": 179898, "epoch": 4283} {"train_loss": -7.062150001525879, "global_step": 179899, "epoch": 4283} {"train_loss": -7.095816612243652, "global_step": 179900, "epoch": 4283} {"train_loss": -6.986364841461182, "global_step": 179901, "epoch": 4283} {"train_loss": -7.069943428039551, "global_step": 179902, "epoch": 4283} {"train_loss": -7.068512916564941, "global_step": 179903, "epoch": 4283} {"train_loss": -7.10951042175293, "global_step": 179904, "epoch": 4283} {"train_loss": -7.133710861206055, "global_step": 179905, "epoch": 4283} {"train_loss": -7.025757789611816, "global_step": 179906, "epoch": 4283} {"train_loss": -7.077329635620117, "global_step": 179907, "epoch": 4283} {"train_loss": -7.1073408126831055, "global_step": 179908, "epoch": 4283} {"train_loss": -7.0550713539123535, "global_step": 179909, "epoch": 4283} {"train_loss": -7.036741256713867, "global_step": 179910, "epoch": 4283} {"train_loss": -7.124831676483154, "global_step": 179911, "epoch": 4283} {"train_loss": -6.9664812088012695, "global_step": 179912, "epoch": 4283} {"train_loss": -7.164651870727539, "global_step": 179913, "epoch": 4283} {"train_loss": -7.037832260131836, "global_step": 179914, "epoch": 4283} {"train_loss": -7.083443641662598, "global_step": 179915, "epoch": 4283} {"train_loss": -7.032699108123779, "global_step": 179916, "epoch": 4283} {"train_loss": -7.0460076332092285, "global_step": 179917, "epoch": 4283} {"train_loss": -7.0129852294921875, "global_step": 179918, "epoch": 4283} {"train_loss": -7.017308235168457, "global_step": 179919, "epoch": 4283} {"train_loss": -6.9103593826293945, "global_step": 179920, "epoch": 4283} {"train_loss": -7.067600727081299, "global_step": 179921, "epoch": 4283} {"train_loss": -7.031825065612793, "global_step": 179922, "epoch": 4283} {"train_loss": -6.951357841491699, "global_step": 179923, "epoch": 4283} {"train_loss": -7.10841178894043, "global_step": 179924, "epoch": 4283} {"train_loss": -6.9836530685424805, "global_step": 179925, "epoch": 4283} {"train_loss": -7.133845806121826, "global_step": 179926, "epoch": 4283} {"train_loss": -7.069352047783988, "global_step": 179927, "epoch": 4283, "val_loss": 80401.109375} {"train_loss": -6.988865852355957, "global_step": 179928, "epoch": 4284} {"train_loss": -7.066819190979004, "global_step": 179929, "epoch": 4284} {"train_loss": -7.097045421600342, "global_step": 179930, "epoch": 4284} {"train_loss": -6.981945991516113, "global_step": 179931, "epoch": 4284} {"train_loss": -6.943456172943115, "global_step": 179932, "epoch": 4284} {"train_loss": -7.060181617736816, "global_step": 179933, "epoch": 4284} {"train_loss": -7.237403869628906, "global_step": 179934, "epoch": 4284} {"train_loss": -7.0411882400512695, "global_step": 179935, "epoch": 4284} {"train_loss": -7.15051794052124, "global_step": 179936, "epoch": 4284} {"train_loss": -7.155969619750977, "global_step": 179937, "epoch": 4284} {"train_loss": -7.107940196990967, "global_step": 179938, "epoch": 4284} {"train_loss": -7.179114818572998, "global_step": 179939, "epoch": 4284} {"train_loss": -7.080705642700195, "global_step": 179940, "epoch": 4284} {"train_loss": -7.079365253448486, "global_step": 179941, "epoch": 4284} {"train_loss": -7.183517932891846, "global_step": 179942, "epoch": 4284} {"train_loss": -7.231523513793945, "global_step": 179943, "epoch": 4284} {"train_loss": -7.1695756912231445, "global_step": 179944, "epoch": 4284} {"train_loss": -7.247730255126953, "global_step": 179945, "epoch": 4284} {"train_loss": -7.1070404052734375, "global_step": 179946, "epoch": 4284} {"train_loss": -7.080777168273926, "global_step": 179947, "epoch": 4284} {"train_loss": -7.077290058135986, "global_step": 179948, "epoch": 4284} {"train_loss": -7.2247209548950195, "global_step": 179949, "epoch": 4284} {"train_loss": -7.160808563232422, "global_step": 179950, "epoch": 4284} {"train_loss": -7.120538711547852, "global_step": 179951, "epoch": 4284} {"train_loss": -7.193940162658691, "global_step": 179952, "epoch": 4284} {"train_loss": -7.1730217933654785, "global_step": 179953, "epoch": 4284} {"train_loss": -7.046660423278809, "global_step": 179954, "epoch": 4284} {"train_loss": -6.984503746032715, "global_step": 179955, "epoch": 4284} {"train_loss": -6.888586521148682, "global_step": 179956, "epoch": 4284} {"train_loss": -7.087761878967285, "global_step": 179957, "epoch": 4284} {"train_loss": -6.923081398010254, "global_step": 179958, "epoch": 4284} {"train_loss": -6.955224990844727, "global_step": 179959, "epoch": 4284} {"train_loss": -7.048350811004639, "global_step": 179960, "epoch": 4284} {"train_loss": -6.912500381469727, "global_step": 179961, "epoch": 4284} {"train_loss": -6.966238021850586, "global_step": 179962, "epoch": 4284} {"train_loss": -6.951674461364746, "global_step": 179963, "epoch": 4284} {"train_loss": -7.131331920623779, "global_step": 179964, "epoch": 4284} {"train_loss": -6.962042808532715, "global_step": 179965, "epoch": 4284} {"train_loss": -7.055171966552734, "global_step": 179966, "epoch": 4284} {"train_loss": -7.178328990936279, "global_step": 179967, "epoch": 4284} {"train_loss": -6.983940124511719, "global_step": 179968, "epoch": 4284} {"train_loss": -7.0778004214877175, "global_step": 179969, "epoch": 4284, "val_loss": 80484.1875} {"train_loss": -7.0506792068481445, "global_step": 179970, "epoch": 4285} {"train_loss": -7.0068678855896, "global_step": 179971, "epoch": 4285} {"train_loss": -7.004150390625, "global_step": 179972, "epoch": 4285} {"train_loss": -7.065422058105469, "global_step": 179973, "epoch": 4285} {"train_loss": -7.049499034881592, "global_step": 179974, "epoch": 4285} {"train_loss": -7.073463439941406, "global_step": 179975, "epoch": 4285} {"train_loss": -7.1029276847839355, "global_step": 179976, "epoch": 4285} {"train_loss": -7.1100263595581055, "global_step": 179977, "epoch": 4285} {"train_loss": -7.181123733520508, "global_step": 179978, "epoch": 4285} {"train_loss": -7.105098724365234, "global_step": 179979, "epoch": 4285} {"train_loss": -7.066834449768066, "global_step": 179980, "epoch": 4285} {"train_loss": -7.179232120513916, "global_step": 179981, "epoch": 4285} {"train_loss": -7.083130836486816, "global_step": 179982, "epoch": 4285} {"train_loss": -7.1216349601745605, "global_step": 179983, "epoch": 4285} {"train_loss": -7.191644668579102, "global_step": 179984, "epoch": 4285} {"train_loss": -7.115139007568359, "global_step": 179985, "epoch": 4285} {"train_loss": -7.115397930145264, "global_step": 179986, "epoch": 4285} {"train_loss": -7.1134514808654785, "global_step": 179987, "epoch": 4285} {"train_loss": -7.095219612121582, "global_step": 179988, "epoch": 4285} {"train_loss": -7.221306800842285, "global_step": 179989, "epoch": 4285} {"train_loss": -7.148615837097168, "global_step": 179990, "epoch": 4285} {"train_loss": -7.166916847229004, "global_step": 179991, "epoch": 4285} {"train_loss": -7.114583969116211, "global_step": 179992, "epoch": 4285} {"train_loss": -7.267234802246094, "global_step": 179993, "epoch": 4285} {"train_loss": -7.180059432983398, "global_step": 179994, "epoch": 4285} {"train_loss": -7.116205215454102, "global_step": 179995, "epoch": 4285} {"train_loss": -7.16011381149292, "global_step": 179996, "epoch": 4285} {"train_loss": -7.097267150878906, "global_step": 179997, "epoch": 4285} {"train_loss": -7.135442733764648, "global_step": 179998, "epoch": 4285} {"train_loss": -7.1595072746276855, "global_step": 179999, "epoch": 4285} {"train_loss": -7.250673770904541, "global_step": 180000, "epoch": 4285} {"train_loss": -7.152859687805176, "global_step": 180001, "epoch": 4285} {"train_loss": -7.129100799560547, "global_step": 180002, "epoch": 4285} {"train_loss": -7.120888710021973, "global_step": 180003, "epoch": 4285} {"train_loss": -7.190347671508789, "global_step": 180004, "epoch": 4285} {"train_loss": -7.227636337280273, "global_step": 180005, "epoch": 4285} {"train_loss": -7.159575462341309, "global_step": 180006, "epoch": 4285} {"train_loss": -6.926405906677246, "global_step": 180007, "epoch": 4285} {"train_loss": -7.070304870605469, "global_step": 180008, "epoch": 4285} {"train_loss": -7.1127800941467285, "global_step": 180009, "epoch": 4285} {"train_loss": -7.176963806152344, "global_step": 180010, "epoch": 4285} {"train_loss": -7.123698166438511, "global_step": 180011, "epoch": 4285, "val_loss": 80606.8984375} {"train_loss": -7.104981422424316, "global_step": 180012, "epoch": 4286} {"train_loss": -7.182662010192871, "global_step": 180013, "epoch": 4286} {"train_loss": -7.07621955871582, "global_step": 180014, "epoch": 4286} {"train_loss": -7.173440933227539, "global_step": 180015, "epoch": 4286} {"train_loss": -7.138195991516113, "global_step": 180016, "epoch": 4286} {"train_loss": -7.281215667724609, "global_step": 180017, "epoch": 4286} {"train_loss": -7.2350172996521, "global_step": 180018, "epoch": 4286} {"train_loss": -7.113041877746582, "global_step": 180019, "epoch": 4286} {"train_loss": -7.2750349044799805, "global_step": 180020, "epoch": 4286} {"train_loss": -7.187068939208984, "global_step": 180021, "epoch": 4286} {"train_loss": -7.0946044921875, "global_step": 180022, "epoch": 4286} {"train_loss": -7.153295516967773, "global_step": 180023, "epoch": 4286} {"train_loss": -7.107296466827393, "global_step": 180024, "epoch": 4286} {"train_loss": -7.2295403480529785, "global_step": 180025, "epoch": 4286} {"train_loss": -7.127091884613037, "global_step": 180026, "epoch": 4286} {"train_loss": -7.121933937072754, "global_step": 180027, "epoch": 4286} {"train_loss": -7.0418195724487305, "global_step": 180028, "epoch": 4286} {"train_loss": -7.0284810066223145, "global_step": 180029, "epoch": 4286} {"train_loss": -7.144208908081055, "global_step": 180030, "epoch": 4286} {"train_loss": -7.10361385345459, "global_step": 180031, "epoch": 4286} {"train_loss": -7.0113654136657715, "global_step": 180032, "epoch": 4286} {"train_loss": -7.221897125244141, "global_step": 180033, "epoch": 4286} {"train_loss": -7.161410331726074, "global_step": 180034, "epoch": 4286} {"train_loss": -7.1936187744140625, "global_step": 180035, "epoch": 4286} {"train_loss": -7.1865386962890625, "global_step": 180036, "epoch": 4286} {"train_loss": -7.136673927307129, "global_step": 180037, "epoch": 4286} {"train_loss": -7.200686454772949, "global_step": 180038, "epoch": 4286} {"train_loss": -7.1223626136779785, "global_step": 180039, "epoch": 4286} {"train_loss": -7.161138534545898, "global_step": 180040, "epoch": 4286} {"train_loss": -6.994956016540527, "global_step": 180041, "epoch": 4286} {"train_loss": -7.1479058265686035, "global_step": 180042, "epoch": 4286} {"train_loss": -7.124748229980469, "global_step": 180043, "epoch": 4286} {"train_loss": -7.078314781188965, "global_step": 180044, "epoch": 4286} {"train_loss": -7.068007469177246, "global_step": 180045, "epoch": 4286} {"train_loss": -7.163819313049316, "global_step": 180046, "epoch": 4286} {"train_loss": -7.086736679077148, "global_step": 180047, "epoch": 4286} {"train_loss": -7.179996013641357, "global_step": 180048, "epoch": 4286} {"train_loss": -7.081501007080078, "global_step": 180049, "epoch": 4286} {"train_loss": -7.016963005065918, "global_step": 180050, "epoch": 4286} {"train_loss": -7.082751750946045, "global_step": 180051, "epoch": 4286} {"train_loss": -6.949070453643799, "global_step": 180052, "epoch": 4286} {"train_loss": -7.12572455406189, "global_step": 180053, "epoch": 4286, "val_loss": 80420.6640625} {"train_loss": -7.114170551300049, "global_step": 180054, "epoch": 4287} {"train_loss": -7.031661033630371, "global_step": 180055, "epoch": 4287} {"train_loss": -7.091568946838379, "global_step": 180056, "epoch": 4287} {"train_loss": -7.098241806030273, "global_step": 180057, "epoch": 4287} {"train_loss": -7.123013973236084, "global_step": 180058, "epoch": 4287} {"train_loss": -7.0978593826293945, "global_step": 180059, "epoch": 4287} {"train_loss": -7.182991027832031, "global_step": 180060, "epoch": 4287} {"train_loss": -7.0534868240356445, "global_step": 180061, "epoch": 4287} {"train_loss": -7.144435405731201, "global_step": 180062, "epoch": 4287} {"train_loss": -7.173071384429932, "global_step": 180063, "epoch": 4287} {"train_loss": -7.093417167663574, "global_step": 180064, "epoch": 4287} {"train_loss": -7.1739115715026855, "global_step": 180065, "epoch": 4287} {"train_loss": -7.117033958435059, "global_step": 180066, "epoch": 4287} {"train_loss": -7.1770853996276855, "global_step": 180067, "epoch": 4287} {"train_loss": -7.140143394470215, "global_step": 180068, "epoch": 4287} {"train_loss": -7.213091850280762, "global_step": 180069, "epoch": 4287} {"train_loss": -7.165336608886719, "global_step": 180070, "epoch": 4287} {"train_loss": -7.177247047424316, "global_step": 180071, "epoch": 4287} {"train_loss": -7.165028095245361, "global_step": 180072, "epoch": 4287} {"train_loss": -7.219732284545898, "global_step": 180073, "epoch": 4287} {"train_loss": -7.160727500915527, "global_step": 180074, "epoch": 4287} {"train_loss": -7.101169109344482, "global_step": 180075, "epoch": 4287} {"train_loss": -7.087067127227783, "global_step": 180076, "epoch": 4287} {"train_loss": -7.199268341064453, "global_step": 180077, "epoch": 4287} {"train_loss": -7.159022331237793, "global_step": 180078, "epoch": 4287} {"train_loss": -7.104302406311035, "global_step": 180079, "epoch": 4287} {"train_loss": -7.172369480133057, "global_step": 180080, "epoch": 4287} {"train_loss": -7.182738304138184, "global_step": 180081, "epoch": 4287} {"train_loss": -7.032891273498535, "global_step": 180082, "epoch": 4287} {"train_loss": -7.096431255340576, "global_step": 180083, "epoch": 4287} {"train_loss": -7.12480354309082, "global_step": 180084, "epoch": 4287} {"train_loss": -7.2291975021362305, "global_step": 180085, "epoch": 4287} {"train_loss": -7.086874008178711, "global_step": 180086, "epoch": 4287} {"train_loss": -7.0302958488464355, "global_step": 180087, "epoch": 4287} {"train_loss": -7.15560245513916, "global_step": 180088, "epoch": 4287} {"train_loss": -7.0792765617370605, "global_step": 180089, "epoch": 4287} {"train_loss": -7.135390281677246, "global_step": 180090, "epoch": 4287} {"train_loss": -7.289572715759277, "global_step": 180091, "epoch": 4287} {"train_loss": -7.195481300354004, "global_step": 180092, "epoch": 4287} {"train_loss": -7.211702823638916, "global_step": 180093, "epoch": 4287} {"train_loss": -7.136904716491699, "global_step": 180094, "epoch": 4287} {"train_loss": -7.138083151408604, "global_step": 180095, "epoch": 4287, "val_loss": 80435.953125} {"train_loss": -7.19537353515625, "global_step": 180096, "epoch": 4288} {"train_loss": -7.052792072296143, "global_step": 180097, "epoch": 4288} {"train_loss": -7.212471961975098, "global_step": 180098, "epoch": 4288} {"train_loss": -7.2482147216796875, "global_step": 180099, "epoch": 4288} {"train_loss": -7.049627304077148, "global_step": 180100, "epoch": 4288} {"train_loss": -7.137908458709717, "global_step": 180101, "epoch": 4288} {"train_loss": -7.171545028686523, "global_step": 180102, "epoch": 4288} {"train_loss": -7.047914505004883, "global_step": 180103, "epoch": 4288} {"train_loss": -7.19869327545166, "global_step": 180104, "epoch": 4288} {"train_loss": -7.1638994216918945, "global_step": 180105, "epoch": 4288} {"train_loss": -7.224204063415527, "global_step": 180106, "epoch": 4288} {"train_loss": -7.1967363357543945, "global_step": 180107, "epoch": 4288} {"train_loss": -7.177164077758789, "global_step": 180108, "epoch": 4288} {"train_loss": -7.118227481842041, "global_step": 180109, "epoch": 4288} {"train_loss": -7.142304420471191, "global_step": 180110, "epoch": 4288} {"train_loss": -7.285492897033691, "global_step": 180111, "epoch": 4288} {"train_loss": -7.1151509284973145, "global_step": 180112, "epoch": 4288} {"train_loss": -7.22230339050293, "global_step": 180113, "epoch": 4288} {"train_loss": -7.106168746948242, "global_step": 180114, "epoch": 4288} {"train_loss": -7.248691558837891, "global_step": 180115, "epoch": 4288} {"train_loss": -7.157954692840576, "global_step": 180116, "epoch": 4288} {"train_loss": -7.1949849128723145, "global_step": 180117, "epoch": 4288} {"train_loss": -7.233030796051025, "global_step": 180118, "epoch": 4288} {"train_loss": -7.140354633331299, "global_step": 180119, "epoch": 4288} {"train_loss": -7.159870147705078, "global_step": 180120, "epoch": 4288} {"train_loss": -7.165313720703125, "global_step": 180121, "epoch": 4288} {"train_loss": -7.2710371017456055, "global_step": 180122, "epoch": 4288} {"train_loss": -7.2072906494140625, "global_step": 180123, "epoch": 4288} {"train_loss": -7.169915676116943, "global_step": 180124, "epoch": 4288} {"train_loss": -7.174987316131592, "global_step": 180125, "epoch": 4288} {"train_loss": -7.1371564865112305, "global_step": 180126, "epoch": 4288} {"train_loss": -7.215306758880615, "global_step": 180127, "epoch": 4288} {"train_loss": -7.236104965209961, "global_step": 180128, "epoch": 4288} {"train_loss": -7.144478797912598, "global_step": 180129, "epoch": 4288} {"train_loss": -7.161504745483398, "global_step": 180130, "epoch": 4288} {"train_loss": -7.131172180175781, "global_step": 180131, "epoch": 4288} {"train_loss": -7.088920593261719, "global_step": 180132, "epoch": 4288} {"train_loss": -7.12286901473999, "global_step": 180133, "epoch": 4288} {"train_loss": -7.303104400634766, "global_step": 180134, "epoch": 4288} {"train_loss": -7.225775718688965, "global_step": 180135, "epoch": 4288} {"train_loss": -7.060181617736816, "global_step": 180136, "epoch": 4288} {"train_loss": -7.168563195637295, "global_step": 180137, "epoch": 4288, "val_loss": 80331.8671875} {"train_loss": -7.198665618896484, "global_step": 180138, "epoch": 4289} {"train_loss": -7.114300727844238, "global_step": 180139, "epoch": 4289} {"train_loss": -7.19908332824707, "global_step": 180140, "epoch": 4289} {"train_loss": -7.118796348571777, "global_step": 180141, "epoch": 4289} {"train_loss": -7.238569259643555, "global_step": 180142, "epoch": 4289} {"train_loss": -7.168418884277344, "global_step": 180143, "epoch": 4289} {"train_loss": -7.234889984130859, "global_step": 180144, "epoch": 4289} {"train_loss": -7.213752746582031, "global_step": 180145, "epoch": 4289} {"train_loss": -7.101334571838379, "global_step": 180146, "epoch": 4289} {"train_loss": -7.0842604637146, "global_step": 180147, "epoch": 4289} {"train_loss": -7.173322677612305, "global_step": 180148, "epoch": 4289} {"train_loss": -7.138682842254639, "global_step": 180149, "epoch": 4289} {"train_loss": -7.209929943084717, "global_step": 180150, "epoch": 4289} {"train_loss": -7.3061747550964355, "global_step": 180151, "epoch": 4289} {"train_loss": -7.12411642074585, "global_step": 180152, "epoch": 4289} {"train_loss": -7.328068733215332, "global_step": 180153, "epoch": 4289} {"train_loss": -7.162018775939941, "global_step": 180154, "epoch": 4289} {"train_loss": -7.149996757507324, "global_step": 180155, "epoch": 4289} {"train_loss": -7.216760635375977, "global_step": 180156, "epoch": 4289} {"train_loss": -7.251711845397949, "global_step": 180157, "epoch": 4289} {"train_loss": -7.1058454513549805, "global_step": 180158, "epoch": 4289} {"train_loss": -7.038993835449219, "global_step": 180159, "epoch": 4289} {"train_loss": -7.074639797210693, "global_step": 180160, "epoch": 4289} {"train_loss": -7.240601539611816, "global_step": 180161, "epoch": 4289} {"train_loss": -7.193472385406494, "global_step": 180162, "epoch": 4289} {"train_loss": -7.148728370666504, "global_step": 180163, "epoch": 4289} {"train_loss": -7.102012634277344, "global_step": 180164, "epoch": 4289} {"train_loss": -7.220885276794434, "global_step": 180165, "epoch": 4289} {"train_loss": -7.205047607421875, "global_step": 180166, "epoch": 4289} {"train_loss": -7.2046356201171875, "global_step": 180167, "epoch": 4289} {"train_loss": -7.18695068359375, "global_step": 180168, "epoch": 4289} {"train_loss": -7.096697807312012, "global_step": 180169, "epoch": 4289} {"train_loss": -7.172497272491455, "global_step": 180170, "epoch": 4289} {"train_loss": -7.112848281860352, "global_step": 180171, "epoch": 4289} {"train_loss": -7.049378871917725, "global_step": 180172, "epoch": 4289} {"train_loss": -7.211291313171387, "global_step": 180173, "epoch": 4289} {"train_loss": -7.102117538452148, "global_step": 180174, "epoch": 4289} {"train_loss": -7.003447532653809, "global_step": 180175, "epoch": 4289} {"train_loss": -6.982940673828125, "global_step": 180176, "epoch": 4289} {"train_loss": -7.265451431274414, "global_step": 180177, "epoch": 4289} {"train_loss": -7.1098504066467285, "global_step": 180178, "epoch": 4289} {"train_loss": -7.1573454311915805, "global_step": 180179, "epoch": 4289, "val_loss": 80483.5625} {"train_loss": -7.16507625579834, "global_step": 180180, "epoch": 4290} {"train_loss": -6.94938325881958, "global_step": 180181, "epoch": 4290} {"train_loss": -7.15854549407959, "global_step": 180182, "epoch": 4290} {"train_loss": -7.047667980194092, "global_step": 180183, "epoch": 4290} {"train_loss": -6.9314751625061035, "global_step": 180184, "epoch": 4290} {"train_loss": -7.026557445526123, "global_step": 180185, "epoch": 4290} {"train_loss": -7.075937747955322, "global_step": 180186, "epoch": 4290} {"train_loss": -7.0488080978393555, "global_step": 180187, "epoch": 4290} {"train_loss": -7.032050609588623, "global_step": 180188, "epoch": 4290} {"train_loss": -7.06057071685791, "global_step": 180189, "epoch": 4290} {"train_loss": -7.089673042297363, "global_step": 180190, "epoch": 4290} {"train_loss": -6.9603729248046875, "global_step": 180191, "epoch": 4290} {"train_loss": -6.987344264984131, "global_step": 180192, "epoch": 4290} {"train_loss": -6.977772235870361, "global_step": 180193, "epoch": 4290} {"train_loss": -6.963338375091553, "global_step": 180194, "epoch": 4290} {"train_loss": -6.935770034790039, "global_step": 180195, "epoch": 4290} {"train_loss": -6.90217399597168, "global_step": 180196, "epoch": 4290} {"train_loss": -7.124178886413574, "global_step": 180197, "epoch": 4290} {"train_loss": -6.951646327972412, "global_step": 180198, "epoch": 4290} {"train_loss": -7.121740341186523, "global_step": 180199, "epoch": 4290} {"train_loss": -6.954659461975098, "global_step": 180200, "epoch": 4290} {"train_loss": -7.081021308898926, "global_step": 180201, "epoch": 4290} {"train_loss": -7.0079345703125, "global_step": 180202, "epoch": 4290} {"train_loss": -7.051107406616211, "global_step": 180203, "epoch": 4290} {"train_loss": -7.019384860992432, "global_step": 180204, "epoch": 4290} {"train_loss": -7.087607383728027, "global_step": 180205, "epoch": 4290} {"train_loss": -7.143723011016846, "global_step": 180206, "epoch": 4290} {"train_loss": -6.948694705963135, "global_step": 180207, "epoch": 4290} {"train_loss": -7.078240871429443, "global_step": 180208, "epoch": 4290} {"train_loss": -6.842532157897949, "global_step": 180209, "epoch": 4290} {"train_loss": -7.0978851318359375, "global_step": 180210, "epoch": 4290} {"train_loss": -7.05439567565918, "global_step": 180211, "epoch": 4290} {"train_loss": -7.247509479522705, "global_step": 180212, "epoch": 4290} {"train_loss": -7.212306022644043, "global_step": 180213, "epoch": 4290} {"train_loss": -7.17726993560791, "global_step": 180214, "epoch": 4290} {"train_loss": -7.120603561401367, "global_step": 180215, "epoch": 4290} {"train_loss": -7.091002941131592, "global_step": 180216, "epoch": 4290} {"train_loss": -7.108441352844238, "global_step": 180217, "epoch": 4290} {"train_loss": -7.128735542297363, "global_step": 180218, "epoch": 4290} {"train_loss": -7.203605651855469, "global_step": 180219, "epoch": 4290} {"train_loss": -7.035087585449219, "global_step": 180220, "epoch": 4290} {"train_loss": -7.056559233438401, "global_step": 180221, "epoch": 4290, "val_loss": 80149.1875} {"train_loss": -7.132421970367432, "global_step": 180222, "epoch": 4291} {"train_loss": -7.087460517883301, "global_step": 180223, "epoch": 4291} {"train_loss": -7.244311332702637, "global_step": 180224, "epoch": 4291} {"train_loss": -7.051021099090576, "global_step": 180225, "epoch": 4291} {"train_loss": -6.985498428344727, "global_step": 180226, "epoch": 4291} {"train_loss": -7.053151607513428, "global_step": 180227, "epoch": 4291} {"train_loss": -7.110072135925293, "global_step": 180228, "epoch": 4291} {"train_loss": -6.95574951171875, "global_step": 180229, "epoch": 4291} {"train_loss": -7.054889678955078, "global_step": 180230, "epoch": 4291} {"train_loss": -7.136552810668945, "global_step": 180231, "epoch": 4291} {"train_loss": -6.767571926116943, "global_step": 180232, "epoch": 4291} {"train_loss": -6.977447032928467, "global_step": 180233, "epoch": 4291} {"train_loss": -7.111992835998535, "global_step": 180234, "epoch": 4291} {"train_loss": -7.068341255187988, "global_step": 180235, "epoch": 4291} {"train_loss": -7.024277687072754, "global_step": 180236, "epoch": 4291} {"train_loss": -7.06671142578125, "global_step": 180237, "epoch": 4291} {"train_loss": -6.957446575164795, "global_step": 180238, "epoch": 4291} {"train_loss": -7.156007766723633, "global_step": 180239, "epoch": 4291} {"train_loss": -7.0331010818481445, "global_step": 180240, "epoch": 4291} {"train_loss": -7.099367618560791, "global_step": 180241, "epoch": 4291} {"train_loss": -7.109521865844727, "global_step": 180242, "epoch": 4291} {"train_loss": -7.119855880737305, "global_step": 180243, "epoch": 4291} {"train_loss": -7.1450324058532715, "global_step": 180244, "epoch": 4291} {"train_loss": -7.118142604827881, "global_step": 180245, "epoch": 4291} {"train_loss": -7.090502738952637, "global_step": 180246, "epoch": 4291} {"train_loss": -7.114392280578613, "global_step": 180247, "epoch": 4291} {"train_loss": -7.171397686004639, "global_step": 180248, "epoch": 4291} {"train_loss": -7.124972343444824, "global_step": 180249, "epoch": 4291} {"train_loss": -7.151801109313965, "global_step": 180250, "epoch": 4291} {"train_loss": -7.024623870849609, "global_step": 180251, "epoch": 4291} {"train_loss": -6.981853485107422, "global_step": 180252, "epoch": 4291} {"train_loss": -7.0352935791015625, "global_step": 180253, "epoch": 4291} {"train_loss": -7.227251052856445, "global_step": 180254, "epoch": 4291} {"train_loss": -7.3185272216796875, "global_step": 180255, "epoch": 4291} {"train_loss": -7.116720199584961, "global_step": 180256, "epoch": 4291} {"train_loss": -7.171875, "global_step": 180257, "epoch": 4291} {"train_loss": -7.168766975402832, "global_step": 180258, "epoch": 4291} {"train_loss": -7.159893989562988, "global_step": 180259, "epoch": 4291} {"train_loss": -7.135649681091309, "global_step": 180260, "epoch": 4291} {"train_loss": -7.0240254402160645, "global_step": 180261, "epoch": 4291} {"train_loss": -7.094875335693359, "global_step": 180262, "epoch": 4291} {"train_loss": -7.09058640116737, "global_step": 180263, "epoch": 4291, "val_loss": 80491.6953125} {"train_loss": -7.123818397521973, "global_step": 180264, "epoch": 4292} {"train_loss": -7.120128631591797, "global_step": 180265, "epoch": 4292} {"train_loss": -7.068447113037109, "global_step": 180266, "epoch": 4292} {"train_loss": -7.050436973571777, "global_step": 180267, "epoch": 4292} {"train_loss": -7.003255844116211, "global_step": 180268, "epoch": 4292} {"train_loss": -7.11219596862793, "global_step": 180269, "epoch": 4292} {"train_loss": -7.065534591674805, "global_step": 180270, "epoch": 4292} {"train_loss": -6.899738311767578, "global_step": 180271, "epoch": 4292} {"train_loss": -7.064845085144043, "global_step": 180272, "epoch": 4292} {"train_loss": -7.037785053253174, "global_step": 180273, "epoch": 4292} {"train_loss": -7.034355163574219, "global_step": 180274, "epoch": 4292} {"train_loss": -7.090394020080566, "global_step": 180275, "epoch": 4292} {"train_loss": -6.98670768737793, "global_step": 180276, "epoch": 4292} {"train_loss": -7.019015312194824, "global_step": 180277, "epoch": 4292} {"train_loss": -7.091015815734863, "global_step": 180278, "epoch": 4292} {"train_loss": -7.015111923217773, "global_step": 180279, "epoch": 4292} {"train_loss": -7.008176803588867, "global_step": 180280, "epoch": 4292} {"train_loss": -7.108299255371094, "global_step": 180281, "epoch": 4292} {"train_loss": -7.036075592041016, "global_step": 180282, "epoch": 4292} {"train_loss": -7.080848217010498, "global_step": 180283, "epoch": 4292} {"train_loss": -7.155338287353516, "global_step": 180284, "epoch": 4292} {"train_loss": -7.230452537536621, "global_step": 180285, "epoch": 4292} {"train_loss": -7.1644134521484375, "global_step": 180286, "epoch": 4292} {"train_loss": -7.029232025146484, "global_step": 180287, "epoch": 4292} {"train_loss": -7.153774738311768, "global_step": 180288, "epoch": 4292} {"train_loss": -7.1607890129089355, "global_step": 180289, "epoch": 4292} {"train_loss": -7.198418617248535, "global_step": 180290, "epoch": 4292} {"train_loss": -7.128628730773926, "global_step": 180291, "epoch": 4292} {"train_loss": -7.169628143310547, "global_step": 180292, "epoch": 4292} {"train_loss": -7.109066009521484, "global_step": 180293, "epoch": 4292} {"train_loss": -7.210290431976318, "global_step": 180294, "epoch": 4292} {"train_loss": -7.234369277954102, "global_step": 180295, "epoch": 4292} {"train_loss": -7.1546196937561035, "global_step": 180296, "epoch": 4292} {"train_loss": -7.044652938842773, "global_step": 180297, "epoch": 4292} {"train_loss": -7.140071868896484, "global_step": 180298, "epoch": 4292} {"train_loss": -7.178260803222656, "global_step": 180299, "epoch": 4292} {"train_loss": -7.160190105438232, "global_step": 180300, "epoch": 4292} {"train_loss": -7.123143196105957, "global_step": 180301, "epoch": 4292} {"train_loss": -7.160379886627197, "global_step": 180302, "epoch": 4292} {"train_loss": -7.004141807556152, "global_step": 180303, "epoch": 4292} {"train_loss": -7.155879020690918, "global_step": 180304, "epoch": 4292} {"train_loss": -7.101580619812012, "global_step": 180305, "epoch": 4292, "val_loss": 80471.53125} {"train_loss": -7.138643264770508, "global_step": 180306, "epoch": 4293} {"train_loss": -7.226287841796875, "global_step": 180307, "epoch": 4293} {"train_loss": -7.251398086547852, "global_step": 180308, "epoch": 4293} {"train_loss": -7.200061798095703, "global_step": 180309, "epoch": 4293} {"train_loss": -7.103950500488281, "global_step": 180310, "epoch": 4293} {"train_loss": -7.133166313171387, "global_step": 180311, "epoch": 4293} {"train_loss": -7.235894680023193, "global_step": 180312, "epoch": 4293} {"train_loss": -7.18887996673584, "global_step": 180313, "epoch": 4293} {"train_loss": -7.153644561767578, "global_step": 180314, "epoch": 4293} {"train_loss": -7.152307510375977, "global_step": 180315, "epoch": 4293} {"train_loss": -7.064754962921143, "global_step": 180316, "epoch": 4293} {"train_loss": -7.0357255935668945, "global_step": 180317, "epoch": 4293} {"train_loss": -7.069998741149902, "global_step": 180318, "epoch": 4293} {"train_loss": -7.0692243576049805, "global_step": 180319, "epoch": 4293} {"train_loss": -7.258057594299316, "global_step": 180320, "epoch": 4293} {"train_loss": -7.193984031677246, "global_step": 180321, "epoch": 4293} {"train_loss": -7.1941070556640625, "global_step": 180322, "epoch": 4293} {"train_loss": -7.203181266784668, "global_step": 180323, "epoch": 4293} {"train_loss": -7.122404098510742, "global_step": 180324, "epoch": 4293} {"train_loss": -7.186197280883789, "global_step": 180325, "epoch": 4293} {"train_loss": -7.068838119506836, "global_step": 180326, "epoch": 4293} {"train_loss": -7.252616882324219, "global_step": 180327, "epoch": 4293} {"train_loss": -7.041491985321045, "global_step": 180328, "epoch": 4293} {"train_loss": -7.117435455322266, "global_step": 180329, "epoch": 4293} {"train_loss": -7.1884765625, "global_step": 180330, "epoch": 4293} {"train_loss": -7.138517379760742, "global_step": 180331, "epoch": 4293} {"train_loss": -7.08659553527832, "global_step": 180332, "epoch": 4293} {"train_loss": -7.098489761352539, "global_step": 180333, "epoch": 4293} {"train_loss": -7.083404541015625, "global_step": 180334, "epoch": 4293} {"train_loss": -7.127840995788574, "global_step": 180335, "epoch": 4293} {"train_loss": -7.10379695892334, "global_step": 180336, "epoch": 4293} {"train_loss": -7.291736125946045, "global_step": 180337, "epoch": 4293} {"train_loss": -7.077743053436279, "global_step": 180338, "epoch": 4293} {"train_loss": -7.092529296875, "global_step": 180339, "epoch": 4293} {"train_loss": -7.1014509201049805, "global_step": 180340, "epoch": 4293} {"train_loss": -7.029424667358398, "global_step": 180341, "epoch": 4293} {"train_loss": -7.148872375488281, "global_step": 180342, "epoch": 4293} {"train_loss": -7.161576271057129, "global_step": 180343, "epoch": 4293} {"train_loss": -7.047188758850098, "global_step": 180344, "epoch": 4293} {"train_loss": -7.131863117218018, "global_step": 180345, "epoch": 4293} {"train_loss": -6.919084548950195, "global_step": 180346, "epoch": 4293} {"train_loss": -7.1315962473551435, "global_step": 180347, "epoch": 4293, "val_loss": 80706.6640625} {"train_loss": -7.074291229248047, "global_step": 180348, "epoch": 4294} {"train_loss": -6.985260963439941, "global_step": 180349, "epoch": 4294} {"train_loss": -7.127792835235596, "global_step": 180350, "epoch": 4294} {"train_loss": -7.143815517425537, "global_step": 180351, "epoch": 4294} {"train_loss": -7.02973747253418, "global_step": 180352, "epoch": 4294} {"train_loss": -7.115963459014893, "global_step": 180353, "epoch": 4294} {"train_loss": -7.040891170501709, "global_step": 180354, "epoch": 4294} {"train_loss": -7.1543755531311035, "global_step": 180355, "epoch": 4294} {"train_loss": -6.948262691497803, "global_step": 180356, "epoch": 4294} {"train_loss": -6.942392349243164, "global_step": 180357, "epoch": 4294} {"train_loss": -7.016984939575195, "global_step": 180358, "epoch": 4294} {"train_loss": -7.113927841186523, "global_step": 180359, "epoch": 4294} {"train_loss": -7.158454895019531, "global_step": 180360, "epoch": 4294} {"train_loss": -7.238786697387695, "global_step": 180361, "epoch": 4294} {"train_loss": -7.094948768615723, "global_step": 180362, "epoch": 4294} {"train_loss": -7.2186994552612305, "global_step": 180363, "epoch": 4294} {"train_loss": -7.126309394836426, "global_step": 180364, "epoch": 4294} {"train_loss": -7.150744438171387, "global_step": 180365, "epoch": 4294} {"train_loss": -7.097977638244629, "global_step": 180366, "epoch": 4294} {"train_loss": -7.020813941955566, "global_step": 180367, "epoch": 4294} {"train_loss": -7.190441131591797, "global_step": 180368, "epoch": 4294} {"train_loss": -7.030599594116211, "global_step": 180369, "epoch": 4294} {"train_loss": -7.2738213539123535, "global_step": 180370, "epoch": 4294} {"train_loss": -7.17424201965332, "global_step": 180371, "epoch": 4294} {"train_loss": -7.150371551513672, "global_step": 180372, "epoch": 4294} {"train_loss": -7.179871559143066, "global_step": 180373, "epoch": 4294} {"train_loss": -7.146028995513916, "global_step": 180374, "epoch": 4294} {"train_loss": -7.084455966949463, "global_step": 180375, "epoch": 4294} {"train_loss": -7.214244842529297, "global_step": 180376, "epoch": 4294} {"train_loss": -7.062097072601318, "global_step": 180377, "epoch": 4294} {"train_loss": -7.054111480712891, "global_step": 180378, "epoch": 4294} {"train_loss": -7.146793365478516, "global_step": 180379, "epoch": 4294} {"train_loss": -7.235771179199219, "global_step": 180380, "epoch": 4294} {"train_loss": -7.154047966003418, "global_step": 180381, "epoch": 4294} {"train_loss": -7.23149299621582, "global_step": 180382, "epoch": 4294} {"train_loss": -7.123011112213135, "global_step": 180383, "epoch": 4294} {"train_loss": -7.1708526611328125, "global_step": 180384, "epoch": 4294} {"train_loss": -7.170919418334961, "global_step": 180385, "epoch": 4294} {"train_loss": -7.191997528076172, "global_step": 180386, "epoch": 4294} {"train_loss": -7.164381504058838, "global_step": 180387, "epoch": 4294} {"train_loss": -6.999892234802246, "global_step": 180388, "epoch": 4294} {"train_loss": -7.122695570900326, "global_step": 180389, "epoch": 4294, "val_loss": 80254.9375} {"train_loss": -7.262861251831055, "global_step": 180390, "epoch": 4295} {"train_loss": -7.124363899230957, "global_step": 180391, "epoch": 4295} {"train_loss": -7.060733318328857, "global_step": 180392, "epoch": 4295} {"train_loss": -7.241427421569824, "global_step": 180393, "epoch": 4295} {"train_loss": -7.153526306152344, "global_step": 180394, "epoch": 4295} {"train_loss": -7.166159629821777, "global_step": 180395, "epoch": 4295} {"train_loss": -7.225438117980957, "global_step": 180396, "epoch": 4295} {"train_loss": -7.199085235595703, "global_step": 180397, "epoch": 4295} {"train_loss": -7.211920738220215, "global_step": 180398, "epoch": 4295} {"train_loss": -7.009585380554199, "global_step": 180399, "epoch": 4295} {"train_loss": -7.214921951293945, "global_step": 180400, "epoch": 4295} {"train_loss": -7.127120494842529, "global_step": 180401, "epoch": 4295} {"train_loss": -7.220403671264648, "global_step": 180402, "epoch": 4295} {"train_loss": -7.214201927185059, "global_step": 180403, "epoch": 4295} {"train_loss": -7.179678916931152, "global_step": 180404, "epoch": 4295} {"train_loss": -7.187617778778076, "global_step": 180405, "epoch": 4295} {"train_loss": -7.075791835784912, "global_step": 180406, "epoch": 4295} {"train_loss": -7.027535438537598, "global_step": 180407, "epoch": 4295} {"train_loss": -7.203199863433838, "global_step": 180408, "epoch": 4295} {"train_loss": -7.123563766479492, "global_step": 180409, "epoch": 4295} {"train_loss": -7.047773361206055, "global_step": 180410, "epoch": 4295} {"train_loss": -7.073753356933594, "global_step": 180411, "epoch": 4295} {"train_loss": -7.154749393463135, "global_step": 180412, "epoch": 4295} {"train_loss": -7.14768123626709, "global_step": 180413, "epoch": 4295} {"train_loss": -7.275673866271973, "global_step": 180414, "epoch": 4295} {"train_loss": -7.085515975952148, "global_step": 180415, "epoch": 4295} {"train_loss": -7.168854713439941, "global_step": 180416, "epoch": 4295} {"train_loss": -7.129528045654297, "global_step": 180417, "epoch": 4295} {"train_loss": -6.9349541664123535, "global_step": 180418, "epoch": 4295} {"train_loss": -7.133395195007324, "global_step": 180419, "epoch": 4295} {"train_loss": -7.130894184112549, "global_step": 180420, "epoch": 4295} {"train_loss": -7.3057169914245605, "global_step": 180421, "epoch": 4295} {"train_loss": -7.114819526672363, "global_step": 180422, "epoch": 4295} {"train_loss": -7.111165523529053, "global_step": 180423, "epoch": 4295} {"train_loss": -7.220308780670166, "global_step": 180424, "epoch": 4295} {"train_loss": -7.148475646972656, "global_step": 180425, "epoch": 4295} {"train_loss": -7.165602684020996, "global_step": 180426, "epoch": 4295} {"train_loss": -7.147372245788574, "global_step": 180427, "epoch": 4295} {"train_loss": -7.0834879875183105, "global_step": 180428, "epoch": 4295} {"train_loss": -7.042486667633057, "global_step": 180429, "epoch": 4295} {"train_loss": -7.0717315673828125, "global_step": 180430, "epoch": 4295} {"train_loss": -7.145269870758057, "global_step": 180431, "epoch": 4295, "val_loss": 80483.015625} {"train_loss": -7.1022515296936035, "global_step": 180432, "epoch": 4296} {"train_loss": -7.17022705078125, "global_step": 180433, "epoch": 4296} {"train_loss": -7.0446457862854, "global_step": 180434, "epoch": 4296} {"train_loss": -7.036633014678955, "global_step": 180435, "epoch": 4296} {"train_loss": -7.137843132019043, "global_step": 180436, "epoch": 4296} {"train_loss": -7.29184103012085, "global_step": 180437, "epoch": 4296} {"train_loss": -7.090261459350586, "global_step": 180438, "epoch": 4296} {"train_loss": -7.181343078613281, "global_step": 180439, "epoch": 4296} {"train_loss": -7.11391544342041, "global_step": 180440, "epoch": 4296} {"train_loss": -7.201798439025879, "global_step": 180441, "epoch": 4296} {"train_loss": -7.118839263916016, "global_step": 180442, "epoch": 4296} {"train_loss": -7.131209373474121, "global_step": 180443, "epoch": 4296} {"train_loss": -7.194063186645508, "global_step": 180444, "epoch": 4296} {"train_loss": -7.175002098083496, "global_step": 180445, "epoch": 4296} {"train_loss": -7.182614326477051, "global_step": 180446, "epoch": 4296} {"train_loss": -7.131935119628906, "global_step": 180447, "epoch": 4296} {"train_loss": -7.243890762329102, "global_step": 180448, "epoch": 4296} {"train_loss": -7.217206001281738, "global_step": 180449, "epoch": 4296} {"train_loss": -7.191218376159668, "global_step": 180450, "epoch": 4296} {"train_loss": -7.152287483215332, "global_step": 180451, "epoch": 4296} {"train_loss": -7.0706377029418945, "global_step": 180452, "epoch": 4296} {"train_loss": -7.185914993286133, "global_step": 180453, "epoch": 4296} {"train_loss": -7.002138137817383, "global_step": 180454, "epoch": 4296} {"train_loss": -7.019270420074463, "global_step": 180455, "epoch": 4296} {"train_loss": -7.112762928009033, "global_step": 180456, "epoch": 4296} {"train_loss": -7.0346879959106445, "global_step": 180457, "epoch": 4296} {"train_loss": -7.199489116668701, "global_step": 180458, "epoch": 4296} {"train_loss": -7.146306991577148, "global_step": 180459, "epoch": 4296} {"train_loss": -7.094892501831055, "global_step": 180460, "epoch": 4296} {"train_loss": -7.187502861022949, "global_step": 180461, "epoch": 4296} {"train_loss": -7.228878498077393, "global_step": 180462, "epoch": 4296} {"train_loss": -7.1286516189575195, "global_step": 180463, "epoch": 4296} {"train_loss": -7.121835231781006, "global_step": 180464, "epoch": 4296} {"train_loss": -7.176091194152832, "global_step": 180465, "epoch": 4296} {"train_loss": -7.091217994689941, "global_step": 180466, "epoch": 4296} {"train_loss": -7.049728870391846, "global_step": 180467, "epoch": 4296} {"train_loss": -7.129010200500488, "global_step": 180468, "epoch": 4296} {"train_loss": -6.884690284729004, "global_step": 180469, "epoch": 4296} {"train_loss": -7.160865783691406, "global_step": 180470, "epoch": 4296} {"train_loss": -7.035828113555908, "global_step": 180471, "epoch": 4296} {"train_loss": -6.872326850891113, "global_step": 180472, "epoch": 4296} {"train_loss": -7.120583204996018, "global_step": 180473, "epoch": 4296, "val_loss": 80499.828125} {"train_loss": -6.968565464019775, "global_step": 180474, "epoch": 4297} {"train_loss": -6.957210540771484, "global_step": 180475, "epoch": 4297} {"train_loss": -7.1211371421813965, "global_step": 180476, "epoch": 4297} {"train_loss": -7.0972747802734375, "global_step": 180477, "epoch": 4297} {"train_loss": -7.017850399017334, "global_step": 180478, "epoch": 4297} {"train_loss": -7.060234069824219, "global_step": 180479, "epoch": 4297} {"train_loss": -7.1581926345825195, "global_step": 180480, "epoch": 4297} {"train_loss": -7.034084796905518, "global_step": 180481, "epoch": 4297} {"train_loss": -7.246837615966797, "global_step": 180482, "epoch": 4297} {"train_loss": -7.131800651550293, "global_step": 180483, "epoch": 4297} {"train_loss": -7.1246867179870605, "global_step": 180484, "epoch": 4297} {"train_loss": -6.960272312164307, "global_step": 180485, "epoch": 4297} {"train_loss": -7.094992637634277, "global_step": 180486, "epoch": 4297} {"train_loss": -7.144168853759766, "global_step": 180487, "epoch": 4297} {"train_loss": -7.249082565307617, "global_step": 180488, "epoch": 4297} {"train_loss": -7.212757110595703, "global_step": 180489, "epoch": 4297} {"train_loss": -7.0985331535339355, "global_step": 180490, "epoch": 4297} {"train_loss": -7.189452171325684, "global_step": 180491, "epoch": 4297} {"train_loss": -7.064414024353027, "global_step": 180492, "epoch": 4297} {"train_loss": -7.193316459655762, "global_step": 180493, "epoch": 4297} {"train_loss": -7.161492824554443, "global_step": 180494, "epoch": 4297} {"train_loss": -7.182442665100098, "global_step": 180495, "epoch": 4297} {"train_loss": -7.099571228027344, "global_step": 180496, "epoch": 4297} {"train_loss": -7.130252361297607, "global_step": 180497, "epoch": 4297} {"train_loss": -7.283685684204102, "global_step": 180498, "epoch": 4297} {"train_loss": -7.151666164398193, "global_step": 180499, "epoch": 4297} {"train_loss": -7.180809020996094, "global_step": 180500, "epoch": 4297} {"train_loss": -7.228762149810791, "global_step": 180501, "epoch": 4297} {"train_loss": -7.2552971839904785, "global_step": 180502, "epoch": 4297} {"train_loss": -7.244505882263184, "global_step": 180503, "epoch": 4297} {"train_loss": -7.197079658508301, "global_step": 180504, "epoch": 4297} {"train_loss": -7.150671005249023, "global_step": 180505, "epoch": 4297} {"train_loss": -7.167829513549805, "global_step": 180506, "epoch": 4297} {"train_loss": -7.307117462158203, "global_step": 180507, "epoch": 4297} {"train_loss": -7.152866363525391, "global_step": 180508, "epoch": 4297} {"train_loss": -7.0905585289001465, "global_step": 180509, "epoch": 4297} {"train_loss": -7.038992881774902, "global_step": 180510, "epoch": 4297} {"train_loss": -7.1061015129089355, "global_step": 180511, "epoch": 4297} {"train_loss": -7.067305564880371, "global_step": 180512, "epoch": 4297} {"train_loss": -6.967659950256348, "global_step": 180513, "epoch": 4297} {"train_loss": -6.969532012939453, "global_step": 180514, "epoch": 4297} {"train_loss": -7.128844158990042, "global_step": 180515, "epoch": 4297, "val_loss": 80533.109375} {"train_loss": -7.036494255065918, "global_step": 180516, "epoch": 4298} {"train_loss": -7.129766464233398, "global_step": 180517, "epoch": 4298} {"train_loss": -7.101505279541016, "global_step": 180518, "epoch": 4298} {"train_loss": -7.050731182098389, "global_step": 180519, "epoch": 4298} {"train_loss": -7.0847063064575195, "global_step": 180520, "epoch": 4298} {"train_loss": -7.122663497924805, "global_step": 180521, "epoch": 4298} {"train_loss": -7.170768737792969, "global_step": 180522, "epoch": 4298} {"train_loss": -7.021430015563965, "global_step": 180523, "epoch": 4298} {"train_loss": -7.050166606903076, "global_step": 180524, "epoch": 4298} {"train_loss": -7.027335166931152, "global_step": 180525, "epoch": 4298} {"train_loss": -6.990159034729004, "global_step": 180526, "epoch": 4298} {"train_loss": -7.118025779724121, "global_step": 180527, "epoch": 4298} {"train_loss": -6.988624572753906, "global_step": 180528, "epoch": 4298} {"train_loss": -7.061796188354492, "global_step": 180529, "epoch": 4298} {"train_loss": -7.052628993988037, "global_step": 180530, "epoch": 4298} {"train_loss": -7.102768421173096, "global_step": 180531, "epoch": 4298} {"train_loss": -7.19156551361084, "global_step": 180532, "epoch": 4298} {"train_loss": -7.021697044372559, "global_step": 180533, "epoch": 4298} {"train_loss": -7.177913665771484, "global_step": 180534, "epoch": 4298} {"train_loss": -7.198505401611328, "global_step": 180535, "epoch": 4298} {"train_loss": -7.217032432556152, "global_step": 180536, "epoch": 4298} {"train_loss": -7.1162238121032715, "global_step": 180537, "epoch": 4298} {"train_loss": -6.820857524871826, "global_step": 180538, "epoch": 4298} {"train_loss": -7.185708045959473, "global_step": 180539, "epoch": 4298} {"train_loss": -7.0274577140808105, "global_step": 180540, "epoch": 4298} {"train_loss": -7.06472635269165, "global_step": 180541, "epoch": 4298} {"train_loss": -7.161218643188477, "global_step": 180542, "epoch": 4298} {"train_loss": -7.087615966796875, "global_step": 180543, "epoch": 4298} {"train_loss": -7.211201190948486, "global_step": 180544, "epoch": 4298} {"train_loss": -6.97286319732666, "global_step": 180545, "epoch": 4298} {"train_loss": -7.064001083374023, "global_step": 180546, "epoch": 4298} {"train_loss": -7.20491886138916, "global_step": 180547, "epoch": 4298} {"train_loss": -7.115974426269531, "global_step": 180548, "epoch": 4298} {"train_loss": -7.0349273681640625, "global_step": 180549, "epoch": 4298} {"train_loss": -7.055856704711914, "global_step": 180550, "epoch": 4298} {"train_loss": -7.168123245239258, "global_step": 180551, "epoch": 4298} {"train_loss": -7.118319511413574, "global_step": 180552, "epoch": 4298} {"train_loss": -7.143040657043457, "global_step": 180553, "epoch": 4298} {"train_loss": -7.16968297958374, "global_step": 180554, "epoch": 4298} {"train_loss": -7.214134216308594, "global_step": 180555, "epoch": 4298} {"train_loss": -7.036440849304199, "global_step": 180556, "epoch": 4298} {"train_loss": -7.098217805226644, "global_step": 180557, "epoch": 4298, "val_loss": 80409.4140625} {"train_loss": -7.060331344604492, "global_step": 180558, "epoch": 4299} {"train_loss": -7.190967559814453, "global_step": 180559, "epoch": 4299} {"train_loss": -7.296257972717285, "global_step": 180560, "epoch": 4299} {"train_loss": -7.0950798988342285, "global_step": 180561, "epoch": 4299} {"train_loss": -7.115771293640137, "global_step": 180562, "epoch": 4299} {"train_loss": -7.158162593841553, "global_step": 180563, "epoch": 4299} {"train_loss": -7.219263076782227, "global_step": 180564, "epoch": 4299} {"train_loss": -7.057151794433594, "global_step": 180565, "epoch": 4299} {"train_loss": -7.155991077423096, "global_step": 180566, "epoch": 4299} {"train_loss": -7.078885078430176, "global_step": 180567, "epoch": 4299} {"train_loss": -7.136031150817871, "global_step": 180568, "epoch": 4299} {"train_loss": -7.202972412109375, "global_step": 180569, "epoch": 4299} {"train_loss": -7.2284698486328125, "global_step": 180570, "epoch": 4299} {"train_loss": -7.237362861633301, "global_step": 180571, "epoch": 4299} {"train_loss": -7.214323043823242, "global_step": 180572, "epoch": 4299} {"train_loss": -7.129115104675293, "global_step": 180573, "epoch": 4299} {"train_loss": -7.11708402633667, "global_step": 180574, "epoch": 4299} {"train_loss": -7.120936393737793, "global_step": 180575, "epoch": 4299} {"train_loss": -7.093869209289551, "global_step": 180576, "epoch": 4299} {"train_loss": -7.21053409576416, "global_step": 180577, "epoch": 4299} {"train_loss": -7.020906448364258, "global_step": 180578, "epoch": 4299} {"train_loss": -7.093230247497559, "global_step": 180579, "epoch": 4299} {"train_loss": -7.131430149078369, "global_step": 180580, "epoch": 4299} {"train_loss": -7.030642032623291, "global_step": 180581, "epoch": 4299} {"train_loss": -7.0677595138549805, "global_step": 180582, "epoch": 4299} {"train_loss": -7.246781826019287, "global_step": 180583, "epoch": 4299} {"train_loss": -7.089962005615234, "global_step": 180584, "epoch": 4299} {"train_loss": -7.1959919929504395, "global_step": 180585, "epoch": 4299} {"train_loss": -7.1999006271362305, "global_step": 180586, "epoch": 4299} {"train_loss": -7.201579570770264, "global_step": 180587, "epoch": 4299} {"train_loss": -7.119936943054199, "global_step": 180588, "epoch": 4299} {"train_loss": -7.215207099914551, "global_step": 180589, "epoch": 4299} {"train_loss": -7.193143844604492, "global_step": 180590, "epoch": 4299} {"train_loss": -7.188438892364502, "global_step": 180591, "epoch": 4299} {"train_loss": -7.076561450958252, "global_step": 180592, "epoch": 4299} {"train_loss": -7.0925445556640625, "global_step": 180593, "epoch": 4299} {"train_loss": -7.141462326049805, "global_step": 180594, "epoch": 4299} {"train_loss": -7.088855266571045, "global_step": 180595, "epoch": 4299} {"train_loss": -7.112116813659668, "global_step": 180596, "epoch": 4299} {"train_loss": -7.056439399719238, "global_step": 180597, "epoch": 4299} {"train_loss": -7.141242980957031, "global_step": 180598, "epoch": 4299} {"train_loss": -7.1415544010344005, "global_step": 180599, "epoch": 4299, "val_loss": 80411.484375} {"train_loss": -7.1163506507873535, "global_step": 180600, "epoch": 4300} {"train_loss": -7.150376319885254, "global_step": 180601, "epoch": 4300} {"train_loss": -6.995903015136719, "global_step": 180602, "epoch": 4300} {"train_loss": -7.087861061096191, "global_step": 180603, "epoch": 4300} {"train_loss": -7.072900772094727, "global_step": 180604, "epoch": 4300} {"train_loss": -6.891700267791748, "global_step": 180605, "epoch": 4300} {"train_loss": -7.166717052459717, "global_step": 180606, "epoch": 4300} {"train_loss": -7.112429618835449, "global_step": 180607, "epoch": 4300} {"train_loss": -7.145051002502441, "global_step": 180608, "epoch": 4300} {"train_loss": -7.236547946929932, "global_step": 180609, "epoch": 4300} {"train_loss": -7.011590003967285, "global_step": 180610, "epoch": 4300} {"train_loss": -7.186129570007324, "global_step": 180611, "epoch": 4300} {"train_loss": -7.060392379760742, "global_step": 180612, "epoch": 4300} {"train_loss": -6.961070537567139, "global_step": 180613, "epoch": 4300} {"train_loss": -7.145449161529541, "global_step": 180614, "epoch": 4300} {"train_loss": -7.049713134765625, "global_step": 180615, "epoch": 4300} {"train_loss": -6.927949905395508, "global_step": 180616, "epoch": 4300} {"train_loss": -7.093020915985107, "global_step": 180617, "epoch": 4300} {"train_loss": -7.005475997924805, "global_step": 180618, "epoch": 4300} {"train_loss": -7.001120567321777, "global_step": 180619, "epoch": 4300} {"train_loss": -7.035305976867676, "global_step": 180620, "epoch": 4300} {"train_loss": -7.0661702156066895, "global_step": 180621, "epoch": 4300} {"train_loss": -6.946672439575195, "global_step": 180622, "epoch": 4300} {"train_loss": -6.984699249267578, "global_step": 180623, "epoch": 4300} {"train_loss": -7.113350868225098, "global_step": 180624, "epoch": 4300} {"train_loss": -6.947694778442383, "global_step": 180625, "epoch": 4300} {"train_loss": -7.0238237380981445, "global_step": 180626, "epoch": 4300} {"train_loss": -7.089317321777344, "global_step": 180627, "epoch": 4300} {"train_loss": -6.90012264251709, "global_step": 180628, "epoch": 4300} {"train_loss": -7.068282127380371, "global_step": 180629, "epoch": 4300} {"train_loss": -6.956465721130371, "global_step": 180630, "epoch": 4300} {"train_loss": -6.872671127319336, "global_step": 180631, "epoch": 4300} {"train_loss": -6.972667694091797, "global_step": 180632, "epoch": 4300} {"train_loss": -7.054974555969238, "global_step": 180633, "epoch": 4300} {"train_loss": -6.978884220123291, "global_step": 180634, "epoch": 4300} {"train_loss": -7.069587707519531, "global_step": 180635, "epoch": 4300} {"train_loss": -6.963326454162598, "global_step": 180636, "epoch": 4300} {"train_loss": -7.133862018585205, "global_step": 180637, "epoch": 4300} {"train_loss": -7.078727722167969, "global_step": 180638, "epoch": 4300} {"train_loss": -7.084268569946289, "global_step": 180639, "epoch": 4300} {"train_loss": -7.130054473876953, "global_step": 180640, "epoch": 4300} {"train_loss": -7.0467556317647295, "global_step": 180641, "epoch": 4300, "train/sim_max_reward_0": 0.8620060018813362, "train/sim_max_reward_1": 0.8254755597152246, "train/sim_max_reward_2": 0.37871427615760517, "train/sim_max_reward_3": 0.15014292398341514, "train/sim_max_reward_4": 0.9026899951714684, "train/sim_max_reward_5": 0.559023117314533, "test/sim_max_reward_4500000": 0.9197980430663499, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9378183821254977, "test/sim_max_reward_4500004": 0.23165638047032872, "test/sim_max_reward_4500005": 0.9359010653296063, "test/sim_max_reward_4500006": 0.933443099548527, "test/sim_max_reward_4500007": 0.9170737351960684, "test/sim_max_reward_4500008": 0.9160920238853041, "test/sim_max_reward_4500009": 0.05308651183519292, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9571712349674886, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.002491683096749649, "test/sim_max_reward_4500014": 0.9953071649262079, "test/sim_max_reward_4500015": 0.960874253497853, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.048162084216774044, "test/sim_max_reward_4500018": 0.6190028014236848, "test/sim_max_reward_4500019": 0.9575393166377589, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9620775539210191, "test/sim_max_reward_4500022": 0.45008685981780855, "test/sim_max_reward_4500023": 0.5442594204050626, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 1.0, "test/sim_max_reward_4500026": 0.9062820400733481, "test/sim_max_reward_4500027": 0.9903618958905962, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.09324678183729887, "test/sim_max_reward_4500030": 0.8261763487643912, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9670526401092042, "test/sim_max_reward_4500034": 1.0, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 0.9434968143466448, "test/sim_max_reward_4500037": 0.8071131079189447, "test/sim_max_reward_4500038": 0.3414481875757178, "test/sim_max_reward_4500039": 0.9265737894371882, "test/sim_max_reward_4500040": 0.9175442636233797, "test/sim_max_reward_4500041": 0.8887239188810198, "test/sim_max_reward_4500042": 0.03873049330744391, "test/sim_max_reward_4500043": 0.3671560161482282, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.405628309545732, "test/sim_max_reward_4500046": 0.20164839434517437, "test/sim_max_reward_4500047": 0.9731894302013551, "test/sim_max_reward_4500048": 0.0402897280100342, "test/sim_max_reward_4500049": 0.8862916296680406, "train/mean_score": 0.6130086457039304, "test/mean_score": 0.5823005302528087, "val_loss": 80462.4453125} {"train_loss": -7.058546543121338, "global_step": 180642, "epoch": 4301} {"train_loss": -7.020263671875, "global_step": 180643, "epoch": 4301} {"train_loss": -7.073451519012451, "global_step": 180644, "epoch": 4301} {"train_loss": -7.116314888000488, "global_step": 180645, "epoch": 4301} {"train_loss": -7.151542663574219, "global_step": 180646, "epoch": 4301} {"train_loss": -7.031444072723389, "global_step": 180647, "epoch": 4301} {"train_loss": -7.108784198760986, "global_step": 180648, "epoch": 4301} {"train_loss": -7.202200412750244, "global_step": 180649, "epoch": 4301} {"train_loss": -7.123360633850098, "global_step": 180650, "epoch": 4301} {"train_loss": -7.048839569091797, "global_step": 180651, "epoch": 4301} {"train_loss": -7.122821807861328, "global_step": 180652, "epoch": 4301} {"train_loss": -7.140329837799072, "global_step": 180653, "epoch": 4301} {"train_loss": -7.041378021240234, "global_step": 180654, "epoch": 4301} {"train_loss": -7.205173492431641, "global_step": 180655, "epoch": 4301} {"train_loss": -7.119339942932129, "global_step": 180656, "epoch": 4301} {"train_loss": -7.177745819091797, "global_step": 180657, "epoch": 4301} {"train_loss": -7.091838359832764, "global_step": 180658, "epoch": 4301} {"train_loss": -7.16835880279541, "global_step": 180659, "epoch": 4301} {"train_loss": -7.198534965515137, "global_step": 180660, "epoch": 4301} {"train_loss": -7.1654815673828125, "global_step": 180661, "epoch": 4301} {"train_loss": -7.2273101806640625, "global_step": 180662, "epoch": 4301} {"train_loss": -7.22579288482666, "global_step": 180663, "epoch": 4301} {"train_loss": -7.1539459228515625, "global_step": 180664, "epoch": 4301} {"train_loss": -7.2357330322265625, "global_step": 180665, "epoch": 4301} {"train_loss": -7.15771484375, "global_step": 180666, "epoch": 4301} {"train_loss": -7.125253677368164, "global_step": 180667, "epoch": 4301} {"train_loss": -7.182267189025879, "global_step": 180668, "epoch": 4301} {"train_loss": -7.150238037109375, "global_step": 180669, "epoch": 4301} {"train_loss": -7.061046600341797, "global_step": 180670, "epoch": 4301} {"train_loss": -7.243786811828613, "global_step": 180671, "epoch": 4301} {"train_loss": -7.2912373542785645, "global_step": 180672, "epoch": 4301} {"train_loss": -7.18428897857666, "global_step": 180673, "epoch": 4301} {"train_loss": -7.272228240966797, "global_step": 180674, "epoch": 4301} {"train_loss": -7.089943885803223, "global_step": 180675, "epoch": 4301} {"train_loss": -7.311715126037598, "global_step": 180676, "epoch": 4301} {"train_loss": -7.227000713348389, "global_step": 180677, "epoch": 4301} {"train_loss": -7.167032241821289, "global_step": 180678, "epoch": 4301} {"train_loss": -7.120038986206055, "global_step": 180679, "epoch": 4301} {"train_loss": -7.134555339813232, "global_step": 180680, "epoch": 4301} {"train_loss": -7.130458354949951, "global_step": 180681, "epoch": 4301} {"train_loss": -7.077937602996826, "global_step": 180682, "epoch": 4301} {"train_loss": -7.149826980772472, "global_step": 180683, "epoch": 4301, "val_loss": 80399.0} {"train_loss": -7.13212776184082, "global_step": 180684, "epoch": 4302} {"train_loss": -7.231316566467285, "global_step": 180685, "epoch": 4302} {"train_loss": -7.1716203689575195, "global_step": 180686, "epoch": 4302} {"train_loss": -7.082188606262207, "global_step": 180687, "epoch": 4302} {"train_loss": -7.138888359069824, "global_step": 180688, "epoch": 4302} {"train_loss": -7.155765533447266, "global_step": 180689, "epoch": 4302} {"train_loss": -7.067132949829102, "global_step": 180690, "epoch": 4302} {"train_loss": -7.1672773361206055, "global_step": 180691, "epoch": 4302} {"train_loss": -7.170426368713379, "global_step": 180692, "epoch": 4302} {"train_loss": -7.188415050506592, "global_step": 180693, "epoch": 4302} {"train_loss": -7.11906623840332, "global_step": 180694, "epoch": 4302} {"train_loss": -7.012152671813965, "global_step": 180695, "epoch": 4302} {"train_loss": -7.0660624504089355, "global_step": 180696, "epoch": 4302} {"train_loss": -7.167674541473389, "global_step": 180697, "epoch": 4302} {"train_loss": -7.121959209442139, "global_step": 180698, "epoch": 4302} {"train_loss": -7.1520586013793945, "global_step": 180699, "epoch": 4302} {"train_loss": -7.042573928833008, "global_step": 180700, "epoch": 4302} {"train_loss": -7.161291122436523, "global_step": 180701, "epoch": 4302} {"train_loss": -7.142202377319336, "global_step": 180702, "epoch": 4302} {"train_loss": -7.146551609039307, "global_step": 180703, "epoch": 4302} {"train_loss": -7.144239902496338, "global_step": 180704, "epoch": 4302} {"train_loss": -7.149146556854248, "global_step": 180705, "epoch": 4302} {"train_loss": -7.092164039611816, "global_step": 180706, "epoch": 4302} {"train_loss": -7.139412879943848, "global_step": 180707, "epoch": 4302} {"train_loss": -7.114872932434082, "global_step": 180708, "epoch": 4302} {"train_loss": -7.18341064453125, "global_step": 180709, "epoch": 4302} {"train_loss": -7.064380645751953, "global_step": 180710, "epoch": 4302} {"train_loss": -7.1757917404174805, "global_step": 180711, "epoch": 4302} {"train_loss": -7.13621711730957, "global_step": 180712, "epoch": 4302} {"train_loss": -7.017846584320068, "global_step": 180713, "epoch": 4302} {"train_loss": -6.975031852722168, "global_step": 180714, "epoch": 4302} {"train_loss": -7.126996994018555, "global_step": 180715, "epoch": 4302} {"train_loss": -7.152218341827393, "global_step": 180716, "epoch": 4302} {"train_loss": -7.101910591125488, "global_step": 180717, "epoch": 4302} {"train_loss": -7.118328094482422, "global_step": 180718, "epoch": 4302} {"train_loss": -7.132401943206787, "global_step": 180719, "epoch": 4302} {"train_loss": -7.135332107543945, "global_step": 180720, "epoch": 4302} {"train_loss": -7.089243412017822, "global_step": 180721, "epoch": 4302} {"train_loss": -6.9886369705200195, "global_step": 180722, "epoch": 4302} {"train_loss": -7.036761283874512, "global_step": 180723, "epoch": 4302} {"train_loss": -7.138116359710693, "global_step": 180724, "epoch": 4302} {"train_loss": -7.117088295164562, "global_step": 180725, "epoch": 4302, "val_loss": 80414.5859375} {"train_loss": -6.963174819946289, "global_step": 180726, "epoch": 4303} {"train_loss": -7.111847400665283, "global_step": 180727, "epoch": 4303} {"train_loss": -6.947547435760498, "global_step": 180728, "epoch": 4303} {"train_loss": -7.204178810119629, "global_step": 180729, "epoch": 4303} {"train_loss": -7.0833821296691895, "global_step": 180730, "epoch": 4303} {"train_loss": -7.110440254211426, "global_step": 180731, "epoch": 4303} {"train_loss": -7.175927639007568, "global_step": 180732, "epoch": 4303} {"train_loss": -7.138955116271973, "global_step": 180733, "epoch": 4303} {"train_loss": -7.0963897705078125, "global_step": 180734, "epoch": 4303} {"train_loss": -7.137985706329346, "global_step": 180735, "epoch": 4303} {"train_loss": -7.233064651489258, "global_step": 180736, "epoch": 4303} {"train_loss": -7.181911468505859, "global_step": 180737, "epoch": 4303} {"train_loss": -7.089820861816406, "global_step": 180738, "epoch": 4303} {"train_loss": -7.111787796020508, "global_step": 180739, "epoch": 4303} {"train_loss": -7.07563591003418, "global_step": 180740, "epoch": 4303} {"train_loss": -7.221054553985596, "global_step": 180741, "epoch": 4303} {"train_loss": -6.980678081512451, "global_step": 180742, "epoch": 4303} {"train_loss": -7.128808975219727, "global_step": 180743, "epoch": 4303} {"train_loss": -7.085019111633301, "global_step": 180744, "epoch": 4303} {"train_loss": -7.146535873413086, "global_step": 180745, "epoch": 4303} {"train_loss": -7.235182285308838, "global_step": 180746, "epoch": 4303} {"train_loss": -7.081661224365234, "global_step": 180747, "epoch": 4303} {"train_loss": -6.961523056030273, "global_step": 180748, "epoch": 4303} {"train_loss": -7.012042999267578, "global_step": 180749, "epoch": 4303} {"train_loss": -7.19701623916626, "global_step": 180750, "epoch": 4303} {"train_loss": -6.980884075164795, "global_step": 180751, "epoch": 4303} {"train_loss": -7.263079643249512, "global_step": 180752, "epoch": 4303} {"train_loss": -7.171905994415283, "global_step": 180753, "epoch": 4303} {"train_loss": -7.075930595397949, "global_step": 180754, "epoch": 4303} {"train_loss": -7.217092037200928, "global_step": 180755, "epoch": 4303} {"train_loss": -7.1575846672058105, "global_step": 180756, "epoch": 4303} {"train_loss": -7.016676425933838, "global_step": 180757, "epoch": 4303} {"train_loss": -7.081024646759033, "global_step": 180758, "epoch": 4303} {"train_loss": -7.017794609069824, "global_step": 180759, "epoch": 4303} {"train_loss": -6.995690822601318, "global_step": 180760, "epoch": 4303} {"train_loss": -7.184392929077148, "global_step": 180761, "epoch": 4303} {"train_loss": -7.1463799476623535, "global_step": 180762, "epoch": 4303} {"train_loss": -7.2193450927734375, "global_step": 180763, "epoch": 4303} {"train_loss": -7.111772537231445, "global_step": 180764, "epoch": 4303} {"train_loss": -7.197340965270996, "global_step": 180765, "epoch": 4303} {"train_loss": -7.214984893798828, "global_step": 180766, "epoch": 4303} {"train_loss": -7.116802647000267, "global_step": 180767, "epoch": 4303, "val_loss": 80591.875} {"train_loss": -7.214284420013428, "global_step": 180768, "epoch": 4304} {"train_loss": -7.148209571838379, "global_step": 180769, "epoch": 4304} {"train_loss": -7.210212707519531, "global_step": 180770, "epoch": 4304} {"train_loss": -7.197248458862305, "global_step": 180771, "epoch": 4304} {"train_loss": -7.153943061828613, "global_step": 180772, "epoch": 4304} {"train_loss": -7.247806549072266, "global_step": 180773, "epoch": 4304} {"train_loss": -7.246689796447754, "global_step": 180774, "epoch": 4304} {"train_loss": -7.050232887268066, "global_step": 180775, "epoch": 4304} {"train_loss": -7.154580593109131, "global_step": 180776, "epoch": 4304} {"train_loss": -7.197994232177734, "global_step": 180777, "epoch": 4304} {"train_loss": -7.108372688293457, "global_step": 180778, "epoch": 4304} {"train_loss": -7.212248802185059, "global_step": 180779, "epoch": 4304} {"train_loss": -7.177609443664551, "global_step": 180780, "epoch": 4304} {"train_loss": -7.216969966888428, "global_step": 180781, "epoch": 4304} {"train_loss": -7.0898542404174805, "global_step": 180782, "epoch": 4304} {"train_loss": -7.201571464538574, "global_step": 180783, "epoch": 4304} {"train_loss": -7.172307968139648, "global_step": 180784, "epoch": 4304} {"train_loss": -7.1714253425598145, "global_step": 180785, "epoch": 4304} {"train_loss": -7.097482681274414, "global_step": 180786, "epoch": 4304} {"train_loss": -7.080197334289551, "global_step": 180787, "epoch": 4304} {"train_loss": -7.144153118133545, "global_step": 180788, "epoch": 4304} {"train_loss": -7.003269195556641, "global_step": 180789, "epoch": 4304} {"train_loss": -7.109566688537598, "global_step": 180790, "epoch": 4304} {"train_loss": -7.177988529205322, "global_step": 180791, "epoch": 4304} {"train_loss": -7.17070198059082, "global_step": 180792, "epoch": 4304} {"train_loss": -7.2466607093811035, "global_step": 180793, "epoch": 4304} {"train_loss": -7.19239616394043, "global_step": 180794, "epoch": 4304} {"train_loss": -7.338497161865234, "global_step": 180795, "epoch": 4304} {"train_loss": -7.262540817260742, "global_step": 180796, "epoch": 4304} {"train_loss": -7.22133731842041, "global_step": 180797, "epoch": 4304} {"train_loss": -7.2684783935546875, "global_step": 180798, "epoch": 4304} {"train_loss": -7.230277061462402, "global_step": 180799, "epoch": 4304} {"train_loss": -7.169780254364014, "global_step": 180800, "epoch": 4304} {"train_loss": -7.266740798950195, "global_step": 180801, "epoch": 4304} {"train_loss": -7.146048545837402, "global_step": 180802, "epoch": 4304} {"train_loss": -7.09375, "global_step": 180803, "epoch": 4304} {"train_loss": -7.236043930053711, "global_step": 180804, "epoch": 4304} {"train_loss": -7.141811370849609, "global_step": 180805, "epoch": 4304} {"train_loss": -7.173796653747559, "global_step": 180806, "epoch": 4304} {"train_loss": -7.187591552734375, "global_step": 180807, "epoch": 4304} {"train_loss": -7.214648246765137, "global_step": 180808, "epoch": 4304} {"train_loss": -7.17850569316319, "global_step": 180809, "epoch": 4304, "val_loss": 80531.2890625} {"train_loss": -7.3220133781433105, "global_step": 180810, "epoch": 4305} {"train_loss": -7.260880947113037, "global_step": 180811, "epoch": 4305} {"train_loss": -7.154201507568359, "global_step": 180812, "epoch": 4305} {"train_loss": -7.145112991333008, "global_step": 180813, "epoch": 4305} {"train_loss": -7.261820316314697, "global_step": 180814, "epoch": 4305} {"train_loss": -7.1866455078125, "global_step": 180815, "epoch": 4305} {"train_loss": -7.214427947998047, "global_step": 180816, "epoch": 4305} {"train_loss": -7.212593078613281, "global_step": 180817, "epoch": 4305} {"train_loss": -7.232834815979004, "global_step": 180818, "epoch": 4305} {"train_loss": -7.029479026794434, "global_step": 180819, "epoch": 4305} {"train_loss": -7.062699794769287, "global_step": 180820, "epoch": 4305} {"train_loss": -7.158290863037109, "global_step": 180821, "epoch": 4305} {"train_loss": -7.14467191696167, "global_step": 180822, "epoch": 4305} {"train_loss": -7.071608543395996, "global_step": 180823, "epoch": 4305} {"train_loss": -7.152473449707031, "global_step": 180824, "epoch": 4305} {"train_loss": -7.164177417755127, "global_step": 180825, "epoch": 4305} {"train_loss": -7.063828468322754, "global_step": 180826, "epoch": 4305} {"train_loss": -7.036299705505371, "global_step": 180827, "epoch": 4305} {"train_loss": -7.119504928588867, "global_step": 180828, "epoch": 4305} {"train_loss": -7.0128679275512695, "global_step": 180829, "epoch": 4305} {"train_loss": -7.115910053253174, "global_step": 180830, "epoch": 4305} {"train_loss": -7.023840427398682, "global_step": 180831, "epoch": 4305} {"train_loss": -6.941826343536377, "global_step": 180832, "epoch": 4305} {"train_loss": -7.243147850036621, "global_step": 180833, "epoch": 4305} {"train_loss": -7.093093395233154, "global_step": 180834, "epoch": 4305} {"train_loss": -7.026505947113037, "global_step": 180835, "epoch": 4305} {"train_loss": -6.998410224914551, "global_step": 180836, "epoch": 4305} {"train_loss": -7.115800380706787, "global_step": 180837, "epoch": 4305} {"train_loss": -7.03732967376709, "global_step": 180838, "epoch": 4305} {"train_loss": -7.0572638511657715, "global_step": 180839, "epoch": 4305} {"train_loss": -7.045331954956055, "global_step": 180840, "epoch": 4305} {"train_loss": -7.112862586975098, "global_step": 180841, "epoch": 4305} {"train_loss": -7.205850601196289, "global_step": 180842, "epoch": 4305} {"train_loss": -7.114377021789551, "global_step": 180843, "epoch": 4305} {"train_loss": -7.052817344665527, "global_step": 180844, "epoch": 4305} {"train_loss": -7.157688140869141, "global_step": 180845, "epoch": 4305} {"train_loss": -7.018210411071777, "global_step": 180846, "epoch": 4305} {"train_loss": -7.2589921951293945, "global_step": 180847, "epoch": 4305} {"train_loss": -7.207527160644531, "global_step": 180848, "epoch": 4305} {"train_loss": -7.177591323852539, "global_step": 180849, "epoch": 4305} {"train_loss": -7.0711894035339355, "global_step": 180850, "epoch": 4305} {"train_loss": -7.123001041866484, "global_step": 180851, "epoch": 4305, "val_loss": 80535.4375} {"train_loss": -7.111819267272949, "global_step": 180852, "epoch": 4306} {"train_loss": -7.160748481750488, "global_step": 180853, "epoch": 4306} {"train_loss": -7.034000396728516, "global_step": 180854, "epoch": 4306} {"train_loss": -7.145255088806152, "global_step": 180855, "epoch": 4306} {"train_loss": -7.101316452026367, "global_step": 180856, "epoch": 4306} {"train_loss": -7.071659088134766, "global_step": 180857, "epoch": 4306} {"train_loss": -7.0564351081848145, "global_step": 180858, "epoch": 4306} {"train_loss": -6.996716499328613, "global_step": 180859, "epoch": 4306} {"train_loss": -7.053189754486084, "global_step": 180860, "epoch": 4306} {"train_loss": -7.039727687835693, "global_step": 180861, "epoch": 4306} {"train_loss": -7.06083869934082, "global_step": 180862, "epoch": 4306} {"train_loss": -7.073477745056152, "global_step": 180863, "epoch": 4306} {"train_loss": -7.183346748352051, "global_step": 180864, "epoch": 4306} {"train_loss": -7.009246349334717, "global_step": 180865, "epoch": 4306} {"train_loss": -7.128357887268066, "global_step": 180866, "epoch": 4306} {"train_loss": -7.05415153503418, "global_step": 180867, "epoch": 4306} {"train_loss": -7.1173176765441895, "global_step": 180868, "epoch": 4306} {"train_loss": -7.040469169616699, "global_step": 180869, "epoch": 4306} {"train_loss": -7.224353790283203, "global_step": 180870, "epoch": 4306} {"train_loss": -7.074515342712402, "global_step": 180871, "epoch": 4306} {"train_loss": -7.075131893157959, "global_step": 180872, "epoch": 4306} {"train_loss": -7.017941951751709, "global_step": 180873, "epoch": 4306} {"train_loss": -6.998961448669434, "global_step": 180874, "epoch": 4306} {"train_loss": -7.052680969238281, "global_step": 180875, "epoch": 4306} {"train_loss": -7.113930702209473, "global_step": 180876, "epoch": 4306} {"train_loss": -7.0965094566345215, "global_step": 180877, "epoch": 4306} {"train_loss": -7.000993251800537, "global_step": 180878, "epoch": 4306} {"train_loss": -7.007211208343506, "global_step": 180879, "epoch": 4306} {"train_loss": -7.093435287475586, "global_step": 180880, "epoch": 4306} {"train_loss": -7.085231781005859, "global_step": 180881, "epoch": 4306} {"train_loss": -6.983645915985107, "global_step": 180882, "epoch": 4306} {"train_loss": -7.193145275115967, "global_step": 180883, "epoch": 4306} {"train_loss": -7.005763053894043, "global_step": 180884, "epoch": 4306} {"train_loss": -7.105265140533447, "global_step": 180885, "epoch": 4306} {"train_loss": -6.962591171264648, "global_step": 180886, "epoch": 4306} {"train_loss": -7.055018424987793, "global_step": 180887, "epoch": 4306} {"train_loss": -7.028912544250488, "global_step": 180888, "epoch": 4306} {"train_loss": -6.956648349761963, "global_step": 180889, "epoch": 4306} {"train_loss": -7.079814910888672, "global_step": 180890, "epoch": 4306} {"train_loss": -7.087164878845215, "global_step": 180891, "epoch": 4306} {"train_loss": -7.112353801727295, "global_step": 180892, "epoch": 4306} {"train_loss": -7.067806743440174, "global_step": 180893, "epoch": 4306, "val_loss": 80309.71875} {"train_loss": -7.048689842224121, "global_step": 180894, "epoch": 4307} {"train_loss": -7.040626525878906, "global_step": 180895, "epoch": 4307} {"train_loss": -7.022185325622559, "global_step": 180896, "epoch": 4307} {"train_loss": -7.07250452041626, "global_step": 180897, "epoch": 4307} {"train_loss": -7.104743480682373, "global_step": 180898, "epoch": 4307} {"train_loss": -7.138513565063477, "global_step": 180899, "epoch": 4307} {"train_loss": -6.991800308227539, "global_step": 180900, "epoch": 4307} {"train_loss": -7.083344459533691, "global_step": 180901, "epoch": 4307} {"train_loss": -7.125896453857422, "global_step": 180902, "epoch": 4307} {"train_loss": -7.189648628234863, "global_step": 180903, "epoch": 4307} {"train_loss": -7.282691478729248, "global_step": 180904, "epoch": 4307} {"train_loss": -7.090970993041992, "global_step": 180905, "epoch": 4307} {"train_loss": -7.186703681945801, "global_step": 180906, "epoch": 4307} {"train_loss": -7.0580034255981445, "global_step": 180907, "epoch": 4307} {"train_loss": -7.171273708343506, "global_step": 180908, "epoch": 4307} {"train_loss": -7.083949089050293, "global_step": 180909, "epoch": 4307} {"train_loss": -7.200396537780762, "global_step": 180910, "epoch": 4307} {"train_loss": -7.119374752044678, "global_step": 180911, "epoch": 4307} {"train_loss": -7.0174055099487305, "global_step": 180912, "epoch": 4307} {"train_loss": -7.087182998657227, "global_step": 180913, "epoch": 4307} {"train_loss": -7.107237815856934, "global_step": 180914, "epoch": 4307} {"train_loss": -7.044130325317383, "global_step": 180915, "epoch": 4307} {"train_loss": -7.099337577819824, "global_step": 180916, "epoch": 4307} {"train_loss": -7.112829208374023, "global_step": 180917, "epoch": 4307} {"train_loss": -6.9920334815979, "global_step": 180918, "epoch": 4307} {"train_loss": -7.097846031188965, "global_step": 180919, "epoch": 4307} {"train_loss": -7.226998329162598, "global_step": 180920, "epoch": 4307} {"train_loss": -7.13102912902832, "global_step": 180921, "epoch": 4307} {"train_loss": -7.17323112487793, "global_step": 180922, "epoch": 4307} {"train_loss": -7.2483415603637695, "global_step": 180923, "epoch": 4307} {"train_loss": -7.026974678039551, "global_step": 180924, "epoch": 4307} {"train_loss": -7.2247772216796875, "global_step": 180925, "epoch": 4307} {"train_loss": -7.093059539794922, "global_step": 180926, "epoch": 4307} {"train_loss": -7.212996482849121, "global_step": 180927, "epoch": 4307} {"train_loss": -7.208995819091797, "global_step": 180928, "epoch": 4307} {"train_loss": -7.057978630065918, "global_step": 180929, "epoch": 4307} {"train_loss": -7.099049091339111, "global_step": 180930, "epoch": 4307} {"train_loss": -7.073122024536133, "global_step": 180931, "epoch": 4307} {"train_loss": -7.129515647888184, "global_step": 180932, "epoch": 4307} {"train_loss": -7.05064582824707, "global_step": 180933, "epoch": 4307} {"train_loss": -7.107773780822754, "global_step": 180934, "epoch": 4307} {"train_loss": -7.113218579973493, "global_step": 180935, "epoch": 4307, "val_loss": 80601.015625} {"train_loss": -7.0168633460998535, "global_step": 180936, "epoch": 4308} {"train_loss": -7.045704364776611, "global_step": 180937, "epoch": 4308} {"train_loss": -7.1146745681762695, "global_step": 180938, "epoch": 4308} {"train_loss": -6.9891228675842285, "global_step": 180939, "epoch": 4308} {"train_loss": -7.1247148513793945, "global_step": 180940, "epoch": 4308} {"train_loss": -7.009598731994629, "global_step": 180941, "epoch": 4308} {"train_loss": -6.9619526863098145, "global_step": 180942, "epoch": 4308} {"train_loss": -7.056640148162842, "global_step": 180943, "epoch": 4308} {"train_loss": -6.967535018920898, "global_step": 180944, "epoch": 4308} {"train_loss": -7.0129289627075195, "global_step": 180945, "epoch": 4308} {"train_loss": -6.979455471038818, "global_step": 180946, "epoch": 4308} {"train_loss": -7.0333685874938965, "global_step": 180947, "epoch": 4308} {"train_loss": -7.0626373291015625, "global_step": 180948, "epoch": 4308} {"train_loss": -7.004894733428955, "global_step": 180949, "epoch": 4308} {"train_loss": -6.988673210144043, "global_step": 180950, "epoch": 4308} {"train_loss": -7.123924732208252, "global_step": 180951, "epoch": 4308} {"train_loss": -6.933361053466797, "global_step": 180952, "epoch": 4308} {"train_loss": -7.100177764892578, "global_step": 180953, "epoch": 4308} {"train_loss": -6.971418380737305, "global_step": 180954, "epoch": 4308} {"train_loss": -7.0128679275512695, "global_step": 180955, "epoch": 4308} {"train_loss": -7.068255424499512, "global_step": 180956, "epoch": 4308} {"train_loss": -7.041582107543945, "global_step": 180957, "epoch": 4308} {"train_loss": -7.179421424865723, "global_step": 180958, "epoch": 4308} {"train_loss": -6.948603630065918, "global_step": 180959, "epoch": 4308} {"train_loss": -7.145388126373291, "global_step": 180960, "epoch": 4308} {"train_loss": -7.096724033355713, "global_step": 180961, "epoch": 4308} {"train_loss": -7.024402618408203, "global_step": 180962, "epoch": 4308} {"train_loss": -7.211023807525635, "global_step": 180963, "epoch": 4308} {"train_loss": -7.043895721435547, "global_step": 180964, "epoch": 4308} {"train_loss": -7.100451469421387, "global_step": 180965, "epoch": 4308} {"train_loss": -7.101702690124512, "global_step": 180966, "epoch": 4308} {"train_loss": -7.0649003982543945, "global_step": 180967, "epoch": 4308} {"train_loss": -7.1496758460998535, "global_step": 180968, "epoch": 4308} {"train_loss": -7.134513854980469, "global_step": 180969, "epoch": 4308} {"train_loss": -7.102502346038818, "global_step": 180970, "epoch": 4308} {"train_loss": -7.1783857345581055, "global_step": 180971, "epoch": 4308} {"train_loss": -7.176906585693359, "global_step": 180972, "epoch": 4308} {"train_loss": -7.187510967254639, "global_step": 180973, "epoch": 4308} {"train_loss": -7.092170715332031, "global_step": 180974, "epoch": 4308} {"train_loss": -7.152078628540039, "global_step": 180975, "epoch": 4308} {"train_loss": -7.151567459106445, "global_step": 180976, "epoch": 4308} {"train_loss": -7.072757255463373, "global_step": 180977, "epoch": 4308, "val_loss": 80534.640625} {"train_loss": -7.172443389892578, "global_step": 180978, "epoch": 4309} {"train_loss": -7.08236026763916, "global_step": 180979, "epoch": 4309} {"train_loss": -7.169302940368652, "global_step": 180980, "epoch": 4309} {"train_loss": -7.232060432434082, "global_step": 180981, "epoch": 4309} {"train_loss": -7.275115013122559, "global_step": 180982, "epoch": 4309} {"train_loss": -7.162553787231445, "global_step": 180983, "epoch": 4309} {"train_loss": -7.232171058654785, "global_step": 180984, "epoch": 4309} {"train_loss": -7.145829200744629, "global_step": 180985, "epoch": 4309} {"train_loss": -7.226552963256836, "global_step": 180986, "epoch": 4309} {"train_loss": -7.146234512329102, "global_step": 180987, "epoch": 4309} {"train_loss": -7.167543411254883, "global_step": 180988, "epoch": 4309} {"train_loss": -7.124456882476807, "global_step": 180989, "epoch": 4309} {"train_loss": -7.26713228225708, "global_step": 180990, "epoch": 4309} {"train_loss": -7.222715377807617, "global_step": 180991, "epoch": 4309} {"train_loss": -7.119969367980957, "global_step": 180992, "epoch": 4309} {"train_loss": -7.146881580352783, "global_step": 180993, "epoch": 4309} {"train_loss": -7.154326915740967, "global_step": 180994, "epoch": 4309} {"train_loss": -7.186380386352539, "global_step": 180995, "epoch": 4309} {"train_loss": -7.209683418273926, "global_step": 180996, "epoch": 4309} {"train_loss": -7.127376556396484, "global_step": 180997, "epoch": 4309} {"train_loss": -7.252677917480469, "global_step": 180998, "epoch": 4309} {"train_loss": -7.179098606109619, "global_step": 180999, "epoch": 4309} {"train_loss": -7.153776168823242, "global_step": 181000, "epoch": 4309} {"train_loss": -7.171911239624023, "global_step": 181001, "epoch": 4309} {"train_loss": -7.145390510559082, "global_step": 181002, "epoch": 4309} {"train_loss": -7.297341346740723, "global_step": 181003, "epoch": 4309} {"train_loss": -7.109767913818359, "global_step": 181004, "epoch": 4309} {"train_loss": -7.311637878417969, "global_step": 181005, "epoch": 4309} {"train_loss": -7.142380714416504, "global_step": 181006, "epoch": 4309} {"train_loss": -7.245458126068115, "global_step": 181007, "epoch": 4309} {"train_loss": -7.189346790313721, "global_step": 181008, "epoch": 4309} {"train_loss": -7.161062240600586, "global_step": 181009, "epoch": 4309} {"train_loss": -7.193831443786621, "global_step": 181010, "epoch": 4309} {"train_loss": -7.198963642120361, "global_step": 181011, "epoch": 4309} {"train_loss": -7.266965866088867, "global_step": 181012, "epoch": 4309} {"train_loss": -7.227117538452148, "global_step": 181013, "epoch": 4309} {"train_loss": -7.17668342590332, "global_step": 181014, "epoch": 4309} {"train_loss": -7.1714677810668945, "global_step": 181015, "epoch": 4309} {"train_loss": -7.2522478103637695, "global_step": 181016, "epoch": 4309} {"train_loss": -7.237780570983887, "global_step": 181017, "epoch": 4309} {"train_loss": -7.242918491363525, "global_step": 181018, "epoch": 4309} {"train_loss": -7.19492304892767, "global_step": 181019, "epoch": 4309, "val_loss": 80515.2578125} {"train_loss": -7.2442450523376465, "global_step": 181020, "epoch": 4310} {"train_loss": -7.266515731811523, "global_step": 181021, "epoch": 4310} {"train_loss": -7.169764518737793, "global_step": 181022, "epoch": 4310} {"train_loss": -7.11991548538208, "global_step": 181023, "epoch": 4310} {"train_loss": -7.0694899559021, "global_step": 181024, "epoch": 4310} {"train_loss": -7.143444538116455, "global_step": 181025, "epoch": 4310} {"train_loss": -7.187507629394531, "global_step": 181026, "epoch": 4310} {"train_loss": -7.196588039398193, "global_step": 181027, "epoch": 4310} {"train_loss": -7.242231369018555, "global_step": 181028, "epoch": 4310} {"train_loss": -7.3009843826293945, "global_step": 181029, "epoch": 4310} {"train_loss": -7.128536224365234, "global_step": 181030, "epoch": 4310} {"train_loss": -7.263607025146484, "global_step": 181031, "epoch": 4310} {"train_loss": -7.24362850189209, "global_step": 181032, "epoch": 4310} {"train_loss": -7.233607292175293, "global_step": 181033, "epoch": 4310} {"train_loss": -7.24542236328125, "global_step": 181034, "epoch": 4310} {"train_loss": -7.251259803771973, "global_step": 181035, "epoch": 4310} {"train_loss": -7.225954532623291, "global_step": 181036, "epoch": 4310} {"train_loss": -7.153320789337158, "global_step": 181037, "epoch": 4310} {"train_loss": -7.289504528045654, "global_step": 181038, "epoch": 4310} {"train_loss": -7.15584135055542, "global_step": 181039, "epoch": 4310} {"train_loss": -7.128946304321289, "global_step": 181040, "epoch": 4310} {"train_loss": -7.081240177154541, "global_step": 181041, "epoch": 4310} {"train_loss": -7.2061967849731445, "global_step": 181042, "epoch": 4310} {"train_loss": -7.151037216186523, "global_step": 181043, "epoch": 4310} {"train_loss": -7.199565887451172, "global_step": 181044, "epoch": 4310} {"train_loss": -7.234063148498535, "global_step": 181045, "epoch": 4310} {"train_loss": -7.107126235961914, "global_step": 181046, "epoch": 4310} {"train_loss": -7.118603229522705, "global_step": 181047, "epoch": 4310} {"train_loss": -7.196149826049805, "global_step": 181048, "epoch": 4310} {"train_loss": -7.036168575286865, "global_step": 181049, "epoch": 4310} {"train_loss": -7.118040084838867, "global_step": 181050, "epoch": 4310} {"train_loss": -7.114407539367676, "global_step": 181051, "epoch": 4310} {"train_loss": -7.1440277099609375, "global_step": 181052, "epoch": 4310} {"train_loss": -7.027498245239258, "global_step": 181053, "epoch": 4310} {"train_loss": -7.171957015991211, "global_step": 181054, "epoch": 4310} {"train_loss": -7.007990837097168, "global_step": 181055, "epoch": 4310} {"train_loss": -7.154825687408447, "global_step": 181056, "epoch": 4310} {"train_loss": -7.0910139083862305, "global_step": 181057, "epoch": 4310} {"train_loss": -7.010674953460693, "global_step": 181058, "epoch": 4310} {"train_loss": -7.154908657073975, "global_step": 181059, "epoch": 4310} {"train_loss": -7.203161239624023, "global_step": 181060, "epoch": 4310} {"train_loss": -7.162701913288662, "global_step": 181061, "epoch": 4310, "val_loss": 80456.2890625} {"train_loss": -7.134444236755371, "global_step": 181062, "epoch": 4311} {"train_loss": -7.110806465148926, "global_step": 181063, "epoch": 4311} {"train_loss": -7.126466751098633, "global_step": 181064, "epoch": 4311} {"train_loss": -7.2000412940979, "global_step": 181065, "epoch": 4311} {"train_loss": -7.143959045410156, "global_step": 181066, "epoch": 4311} {"train_loss": -7.221039295196533, "global_step": 181067, "epoch": 4311} {"train_loss": -7.023736476898193, "global_step": 181068, "epoch": 4311} {"train_loss": -7.256309509277344, "global_step": 181069, "epoch": 4311} {"train_loss": -7.167633056640625, "global_step": 181070, "epoch": 4311} {"train_loss": -7.219278335571289, "global_step": 181071, "epoch": 4311} {"train_loss": -7.262979984283447, "global_step": 181072, "epoch": 4311} {"train_loss": -7.209023952484131, "global_step": 181073, "epoch": 4311} {"train_loss": -7.172574043273926, "global_step": 181074, "epoch": 4311} {"train_loss": -7.070209503173828, "global_step": 181075, "epoch": 4311} {"train_loss": -7.078924179077148, "global_step": 181076, "epoch": 4311} {"train_loss": -7.113020420074463, "global_step": 181077, "epoch": 4311} {"train_loss": -7.122929573059082, "global_step": 181078, "epoch": 4311} {"train_loss": -7.066929817199707, "global_step": 181079, "epoch": 4311} {"train_loss": -7.150813102722168, "global_step": 181080, "epoch": 4311} {"train_loss": -7.149308681488037, "global_step": 181081, "epoch": 4311} {"train_loss": -7.163619518280029, "global_step": 181082, "epoch": 4311} {"train_loss": -7.166441440582275, "global_step": 181083, "epoch": 4311} {"train_loss": -7.154038906097412, "global_step": 181084, "epoch": 4311} {"train_loss": -7.079425811767578, "global_step": 181085, "epoch": 4311} {"train_loss": -7.15811014175415, "global_step": 181086, "epoch": 4311} {"train_loss": -7.180693626403809, "global_step": 181087, "epoch": 4311} {"train_loss": -7.163278102874756, "global_step": 181088, "epoch": 4311} {"train_loss": -7.171120643615723, "global_step": 181089, "epoch": 4311} {"train_loss": -7.155596733093262, "global_step": 181090, "epoch": 4311} {"train_loss": -7.106756210327148, "global_step": 181091, "epoch": 4311} {"train_loss": -7.08451509475708, "global_step": 181092, "epoch": 4311} {"train_loss": -7.073884010314941, "global_step": 181093, "epoch": 4311} {"train_loss": -7.084344387054443, "global_step": 181094, "epoch": 4311} {"train_loss": -7.143406391143799, "global_step": 181095, "epoch": 4311} {"train_loss": -7.164884567260742, "global_step": 181096, "epoch": 4311} {"train_loss": -7.103322982788086, "global_step": 181097, "epoch": 4311} {"train_loss": -7.0860595703125, "global_step": 181098, "epoch": 4311} {"train_loss": -7.179121971130371, "global_step": 181099, "epoch": 4311} {"train_loss": -7.043237686157227, "global_step": 181100, "epoch": 4311} {"train_loss": -7.104611396789551, "global_step": 181101, "epoch": 4311} {"train_loss": -7.014219284057617, "global_step": 181102, "epoch": 4311} {"train_loss": -7.134934868131365, "global_step": 181103, "epoch": 4311, "val_loss": 80766.8125} {"train_loss": -7.222485542297363, "global_step": 181104, "epoch": 4312} {"train_loss": -6.994373321533203, "global_step": 181105, "epoch": 4312} {"train_loss": -7.087726593017578, "global_step": 181106, "epoch": 4312} {"train_loss": -7.123023509979248, "global_step": 181107, "epoch": 4312} {"train_loss": -7.119880199432373, "global_step": 181108, "epoch": 4312} {"train_loss": -7.071276664733887, "global_step": 181109, "epoch": 4312} {"train_loss": -7.099523544311523, "global_step": 181110, "epoch": 4312} {"train_loss": -7.078179836273193, "global_step": 181111, "epoch": 4312} {"train_loss": -7.1196489334106445, "global_step": 181112, "epoch": 4312} {"train_loss": -7.16897439956665, "global_step": 181113, "epoch": 4312} {"train_loss": -7.0919508934021, "global_step": 181114, "epoch": 4312} {"train_loss": -7.096733093261719, "global_step": 181115, "epoch": 4312} {"train_loss": -6.9935503005981445, "global_step": 181116, "epoch": 4312} {"train_loss": -7.133144855499268, "global_step": 181117, "epoch": 4312} {"train_loss": -7.148653030395508, "global_step": 181118, "epoch": 4312} {"train_loss": -7.05820369720459, "global_step": 181119, "epoch": 4312} {"train_loss": -7.140897750854492, "global_step": 181120, "epoch": 4312} {"train_loss": -7.128476142883301, "global_step": 181121, "epoch": 4312} {"train_loss": -7.163329124450684, "global_step": 181122, "epoch": 4312} {"train_loss": -7.0957441329956055, "global_step": 181123, "epoch": 4312} {"train_loss": -7.092704772949219, "global_step": 181124, "epoch": 4312} {"train_loss": -7.258202075958252, "global_step": 181125, "epoch": 4312} {"train_loss": -7.190195083618164, "global_step": 181126, "epoch": 4312} {"train_loss": -7.070342063903809, "global_step": 181127, "epoch": 4312} {"train_loss": -7.235658645629883, "global_step": 181128, "epoch": 4312} {"train_loss": -7.168591499328613, "global_step": 181129, "epoch": 4312} {"train_loss": -7.156552314758301, "global_step": 181130, "epoch": 4312} {"train_loss": -7.118842124938965, "global_step": 181131, "epoch": 4312} {"train_loss": -7.091883182525635, "global_step": 181132, "epoch": 4312} {"train_loss": -7.10800838470459, "global_step": 181133, "epoch": 4312} {"train_loss": -7.117466926574707, "global_step": 181134, "epoch": 4312} {"train_loss": -7.109192848205566, "global_step": 181135, "epoch": 4312} {"train_loss": -6.878175735473633, "global_step": 181136, "epoch": 4312} {"train_loss": -6.937954425811768, "global_step": 181137, "epoch": 4312} {"train_loss": -6.924120903015137, "global_step": 181138, "epoch": 4312} {"train_loss": -6.884393215179443, "global_step": 181139, "epoch": 4312} {"train_loss": -7.088486671447754, "global_step": 181140, "epoch": 4312} {"train_loss": -6.823102951049805, "global_step": 181141, "epoch": 4312} {"train_loss": -7.019474029541016, "global_step": 181142, "epoch": 4312} {"train_loss": -6.987706661224365, "global_step": 181143, "epoch": 4312} {"train_loss": -7.051999092102051, "global_step": 181144, "epoch": 4312} {"train_loss": -7.085158972513108, "global_step": 181145, "epoch": 4312, "val_loss": 80658.4140625} {"train_loss": -7.05085563659668, "global_step": 181146, "epoch": 4313} {"train_loss": -7.1057353019714355, "global_step": 181147, "epoch": 4313} {"train_loss": -7.067788600921631, "global_step": 181148, "epoch": 4313} {"train_loss": -7.183929443359375, "global_step": 181149, "epoch": 4313} {"train_loss": -7.111084938049316, "global_step": 181150, "epoch": 4313} {"train_loss": -7.027815341949463, "global_step": 181151, "epoch": 4313} {"train_loss": -7.106869697570801, "global_step": 181152, "epoch": 4313} {"train_loss": -6.984633922576904, "global_step": 181153, "epoch": 4313} {"train_loss": -7.111105918884277, "global_step": 181154, "epoch": 4313} {"train_loss": -7.068911552429199, "global_step": 181155, "epoch": 4313} {"train_loss": -7.083902835845947, "global_step": 181156, "epoch": 4313} {"train_loss": -7.023571014404297, "global_step": 181157, "epoch": 4313} {"train_loss": -7.176558494567871, "global_step": 181158, "epoch": 4313} {"train_loss": -7.146280288696289, "global_step": 181159, "epoch": 4313} {"train_loss": -7.291263580322266, "global_step": 181160, "epoch": 4313} {"train_loss": -7.156608581542969, "global_step": 181161, "epoch": 4313} {"train_loss": -7.207435607910156, "global_step": 181162, "epoch": 4313} {"train_loss": -7.007868766784668, "global_step": 181163, "epoch": 4313} {"train_loss": -7.149064540863037, "global_step": 181164, "epoch": 4313} {"train_loss": -7.1490678787231445, "global_step": 181165, "epoch": 4313} {"train_loss": -7.155486106872559, "global_step": 181166, "epoch": 4313} {"train_loss": -7.153142929077148, "global_step": 181167, "epoch": 4313} {"train_loss": -7.118679046630859, "global_step": 181168, "epoch": 4313} {"train_loss": -7.185150146484375, "global_step": 181169, "epoch": 4313} {"train_loss": -7.224416732788086, "global_step": 181170, "epoch": 4313} {"train_loss": -7.159637928009033, "global_step": 181171, "epoch": 4313} {"train_loss": -7.164096355438232, "global_step": 181172, "epoch": 4313} {"train_loss": -7.113386631011963, "global_step": 181173, "epoch": 4313} {"train_loss": -7.0049285888671875, "global_step": 181174, "epoch": 4313} {"train_loss": -7.18699836730957, "global_step": 181175, "epoch": 4313} {"train_loss": -7.049700736999512, "global_step": 181176, "epoch": 4313} {"train_loss": -7.100991725921631, "global_step": 181177, "epoch": 4313} {"train_loss": -7.099856376647949, "global_step": 181178, "epoch": 4313} {"train_loss": -7.127948760986328, "global_step": 181179, "epoch": 4313} {"train_loss": -7.096789360046387, "global_step": 181180, "epoch": 4313} {"train_loss": -7.105073928833008, "global_step": 181181, "epoch": 4313} {"train_loss": -7.1791157722473145, "global_step": 181182, "epoch": 4313} {"train_loss": -7.147515773773193, "global_step": 181183, "epoch": 4313} {"train_loss": -7.216552734375, "global_step": 181184, "epoch": 4313} {"train_loss": -7.225004196166992, "global_step": 181185, "epoch": 4313} {"train_loss": -7.232124328613281, "global_step": 181186, "epoch": 4313} {"train_loss": -7.131373677934919, "global_step": 181187, "epoch": 4313, "val_loss": 80461.3515625} {"train_loss": -7.262402534484863, "global_step": 181188, "epoch": 4314} {"train_loss": -7.169002056121826, "global_step": 181189, "epoch": 4314} {"train_loss": -7.081275463104248, "global_step": 181190, "epoch": 4314} {"train_loss": -7.270439147949219, "global_step": 181191, "epoch": 4314} {"train_loss": -7.252799987792969, "global_step": 181192, "epoch": 4314} {"train_loss": -7.198055744171143, "global_step": 181193, "epoch": 4314} {"train_loss": -7.2404890060424805, "global_step": 181194, "epoch": 4314} {"train_loss": -7.186552047729492, "global_step": 181195, "epoch": 4314} {"train_loss": -7.054448127746582, "global_step": 181196, "epoch": 4314} {"train_loss": -7.160647392272949, "global_step": 181197, "epoch": 4314} {"train_loss": -7.129900932312012, "global_step": 181198, "epoch": 4314} {"train_loss": -7.165671348571777, "global_step": 181199, "epoch": 4314} {"train_loss": -7.059913635253906, "global_step": 181200, "epoch": 4314} {"train_loss": -7.256840705871582, "global_step": 181201, "epoch": 4314} {"train_loss": -7.134665489196777, "global_step": 181202, "epoch": 4314} {"train_loss": -7.170844078063965, "global_step": 181203, "epoch": 4314} {"train_loss": -7.191255569458008, "global_step": 181204, "epoch": 4314} {"train_loss": -7.118322372436523, "global_step": 181205, "epoch": 4314} {"train_loss": -7.238897800445557, "global_step": 181206, "epoch": 4314} {"train_loss": -7.226839065551758, "global_step": 181207, "epoch": 4314} {"train_loss": -7.144143581390381, "global_step": 181208, "epoch": 4314} {"train_loss": -7.181386947631836, "global_step": 181209, "epoch": 4314} {"train_loss": -7.158186912536621, "global_step": 181210, "epoch": 4314} {"train_loss": -7.153977394104004, "global_step": 181211, "epoch": 4314} {"train_loss": -7.212874412536621, "global_step": 181212, "epoch": 4314} {"train_loss": -7.17726993560791, "global_step": 181213, "epoch": 4314} {"train_loss": -7.154646396636963, "global_step": 181214, "epoch": 4314} {"train_loss": -7.227383613586426, "global_step": 181215, "epoch": 4314} {"train_loss": -7.107483863830566, "global_step": 181216, "epoch": 4314} {"train_loss": -7.116491317749023, "global_step": 181217, "epoch": 4314} {"train_loss": -7.227599620819092, "global_step": 181218, "epoch": 4314} {"train_loss": -7.093745708465576, "global_step": 181219, "epoch": 4314} {"train_loss": -7.028236389160156, "global_step": 181220, "epoch": 4314} {"train_loss": -7.03727388381958, "global_step": 181221, "epoch": 4314} {"train_loss": -7.092622756958008, "global_step": 181222, "epoch": 4314} {"train_loss": -6.996677398681641, "global_step": 181223, "epoch": 4314} {"train_loss": -7.053427696228027, "global_step": 181224, "epoch": 4314} {"train_loss": -6.884903907775879, "global_step": 181225, "epoch": 4314} {"train_loss": -6.995330810546875, "global_step": 181226, "epoch": 4314} {"train_loss": -6.993020057678223, "global_step": 181227, "epoch": 4314} {"train_loss": -6.95806884765625, "global_step": 181228, "epoch": 4314} {"train_loss": -7.134566976910546, "global_step": 181229, "epoch": 4314, "val_loss": 80765.9140625} {"train_loss": -6.802504539489746, "global_step": 181230, "epoch": 4315} {"train_loss": -7.020476341247559, "global_step": 181231, "epoch": 4315} {"train_loss": -7.0422797203063965, "global_step": 181232, "epoch": 4315} {"train_loss": -6.991281986236572, "global_step": 181233, "epoch": 4315} {"train_loss": -7.061271667480469, "global_step": 181234, "epoch": 4315} {"train_loss": -7.08756160736084, "global_step": 181235, "epoch": 4315} {"train_loss": -7.074119567871094, "global_step": 181236, "epoch": 4315} {"train_loss": -6.978155136108398, "global_step": 181237, "epoch": 4315} {"train_loss": -7.107065200805664, "global_step": 181238, "epoch": 4315} {"train_loss": -7.080908298492432, "global_step": 181239, "epoch": 4315} {"train_loss": -7.105475425720215, "global_step": 181240, "epoch": 4315} {"train_loss": -7.041675567626953, "global_step": 181241, "epoch": 4315} {"train_loss": -7.141069412231445, "global_step": 181242, "epoch": 4315} {"train_loss": -7.070566177368164, "global_step": 181243, "epoch": 4315} {"train_loss": -7.106369495391846, "global_step": 181244, "epoch": 4315} {"train_loss": -7.134408950805664, "global_step": 181245, "epoch": 4315} {"train_loss": -7.105484485626221, "global_step": 181246, "epoch": 4315} {"train_loss": -7.195093154907227, "global_step": 181247, "epoch": 4315} {"train_loss": -7.024555206298828, "global_step": 181248, "epoch": 4315} {"train_loss": -7.1063690185546875, "global_step": 181249, "epoch": 4315} {"train_loss": -7.085790634155273, "global_step": 181250, "epoch": 4315} {"train_loss": -7.165957450866699, "global_step": 181251, "epoch": 4315} {"train_loss": -7.178493976593018, "global_step": 181252, "epoch": 4315} {"train_loss": -7.1128764152526855, "global_step": 181253, "epoch": 4315} {"train_loss": -6.95088005065918, "global_step": 181254, "epoch": 4315} {"train_loss": -7.084792613983154, "global_step": 181255, "epoch": 4315} {"train_loss": -7.119449138641357, "global_step": 181256, "epoch": 4315} {"train_loss": -6.88565731048584, "global_step": 181257, "epoch": 4315} {"train_loss": -7.1891069412231445, "global_step": 181258, "epoch": 4315} {"train_loss": -7.024507522583008, "global_step": 181259, "epoch": 4315} {"train_loss": -7.002780914306641, "global_step": 181260, "epoch": 4315} {"train_loss": -7.1220316886901855, "global_step": 181261, "epoch": 4315} {"train_loss": -6.889871597290039, "global_step": 181262, "epoch": 4315} {"train_loss": -7.175354957580566, "global_step": 181263, "epoch": 4315} {"train_loss": -7.175463676452637, "global_step": 181264, "epoch": 4315} {"train_loss": -7.114096641540527, "global_step": 181265, "epoch": 4315} {"train_loss": -7.18351936340332, "global_step": 181266, "epoch": 4315} {"train_loss": -7.157573223114014, "global_step": 181267, "epoch": 4315} {"train_loss": -7.054060935974121, "global_step": 181268, "epoch": 4315} {"train_loss": -7.241566181182861, "global_step": 181269, "epoch": 4315} {"train_loss": -7.024834632873535, "global_step": 181270, "epoch": 4315} {"train_loss": -7.077807244800386, "global_step": 181271, "epoch": 4315, "val_loss": 80429.2109375} {"train_loss": -7.17101526260376, "global_step": 181272, "epoch": 4316} {"train_loss": -7.1020026206970215, "global_step": 181273, "epoch": 4316} {"train_loss": -7.043628692626953, "global_step": 181274, "epoch": 4316} {"train_loss": -7.096938133239746, "global_step": 181275, "epoch": 4316} {"train_loss": -7.173737525939941, "global_step": 181276, "epoch": 4316} {"train_loss": -7.243370056152344, "global_step": 181277, "epoch": 4316} {"train_loss": -7.117801666259766, "global_step": 181278, "epoch": 4316} {"train_loss": -7.154067039489746, "global_step": 181279, "epoch": 4316} {"train_loss": -7.194401741027832, "global_step": 181280, "epoch": 4316} {"train_loss": -7.0024027824401855, "global_step": 181281, "epoch": 4316} {"train_loss": -7.14841890335083, "global_step": 181282, "epoch": 4316} {"train_loss": -6.956964015960693, "global_step": 181283, "epoch": 4316} {"train_loss": -7.169188022613525, "global_step": 181284, "epoch": 4316} {"train_loss": -7.088253974914551, "global_step": 181285, "epoch": 4316} {"train_loss": -7.0658698081970215, "global_step": 181286, "epoch": 4316} {"train_loss": -7.119089126586914, "global_step": 181287, "epoch": 4316} {"train_loss": -6.941900253295898, "global_step": 181288, "epoch": 4316} {"train_loss": -7.161035060882568, "global_step": 181289, "epoch": 4316} {"train_loss": -6.925534248352051, "global_step": 181290, "epoch": 4316} {"train_loss": -6.975109577178955, "global_step": 181291, "epoch": 4316} {"train_loss": -7.123954772949219, "global_step": 181292, "epoch": 4316} {"train_loss": -7.121181011199951, "global_step": 181293, "epoch": 4316} {"train_loss": -7.079715251922607, "global_step": 181294, "epoch": 4316} {"train_loss": -7.036773681640625, "global_step": 181295, "epoch": 4316} {"train_loss": -6.85756254196167, "global_step": 181296, "epoch": 4316} {"train_loss": -7.065052509307861, "global_step": 181297, "epoch": 4316} {"train_loss": -6.929421901702881, "global_step": 181298, "epoch": 4316} {"train_loss": -7.040698051452637, "global_step": 181299, "epoch": 4316} {"train_loss": -7.120933532714844, "global_step": 181300, "epoch": 4316} {"train_loss": -7.095841407775879, "global_step": 181301, "epoch": 4316} {"train_loss": -7.008946418762207, "global_step": 181302, "epoch": 4316} {"train_loss": -7.168915748596191, "global_step": 181303, "epoch": 4316} {"train_loss": -7.088263988494873, "global_step": 181304, "epoch": 4316} {"train_loss": -7.104372024536133, "global_step": 181305, "epoch": 4316} {"train_loss": -7.107643127441406, "global_step": 181306, "epoch": 4316} {"train_loss": -7.105300426483154, "global_step": 181307, "epoch": 4316} {"train_loss": -7.006092548370361, "global_step": 181308, "epoch": 4316} {"train_loss": -7.2085771560668945, "global_step": 181309, "epoch": 4316} {"train_loss": -7.104279518127441, "global_step": 181310, "epoch": 4316} {"train_loss": -7.234430313110352, "global_step": 181311, "epoch": 4316} {"train_loss": -7.126727104187012, "global_step": 181312, "epoch": 4316} {"train_loss": -7.087188709349859, "global_step": 181313, "epoch": 4316, "val_loss": 80267.3515625} {"train_loss": -7.189599514007568, "global_step": 181314, "epoch": 4317} {"train_loss": -7.11583948135376, "global_step": 181315, "epoch": 4317} {"train_loss": -7.081265926361084, "global_step": 181316, "epoch": 4317} {"train_loss": -7.049663066864014, "global_step": 181317, "epoch": 4317} {"train_loss": -7.227528095245361, "global_step": 181318, "epoch": 4317} {"train_loss": -7.088260650634766, "global_step": 181319, "epoch": 4317} {"train_loss": -7.114524841308594, "global_step": 181320, "epoch": 4317} {"train_loss": -6.9675092697143555, "global_step": 181321, "epoch": 4317} {"train_loss": -7.066950798034668, "global_step": 181322, "epoch": 4317} {"train_loss": -7.237903594970703, "global_step": 181323, "epoch": 4317} {"train_loss": -7.242828369140625, "global_step": 181324, "epoch": 4317} {"train_loss": -7.051819801330566, "global_step": 181325, "epoch": 4317} {"train_loss": -7.117193222045898, "global_step": 181326, "epoch": 4317} {"train_loss": -7.101831436157227, "global_step": 181327, "epoch": 4317} {"train_loss": -7.092185974121094, "global_step": 181328, "epoch": 4317} {"train_loss": -7.061794757843018, "global_step": 181329, "epoch": 4317} {"train_loss": -7.155356407165527, "global_step": 181330, "epoch": 4317} {"train_loss": -7.172222137451172, "global_step": 181331, "epoch": 4317} {"train_loss": -7.220710754394531, "global_step": 181332, "epoch": 4317} {"train_loss": -7.0759992599487305, "global_step": 181333, "epoch": 4317} {"train_loss": -7.125506401062012, "global_step": 181334, "epoch": 4317} {"train_loss": -7.1120195388793945, "global_step": 181335, "epoch": 4317} {"train_loss": -7.129079341888428, "global_step": 181336, "epoch": 4317} {"train_loss": -7.148799896240234, "global_step": 181337, "epoch": 4317} {"train_loss": -6.955019474029541, "global_step": 181338, "epoch": 4317} {"train_loss": -7.19622802734375, "global_step": 181339, "epoch": 4317} {"train_loss": -7.112828731536865, "global_step": 181340, "epoch": 4317} {"train_loss": -7.105428218841553, "global_step": 181341, "epoch": 4317} {"train_loss": -7.135263442993164, "global_step": 181342, "epoch": 4317} {"train_loss": -7.071010112762451, "global_step": 181343, "epoch": 4317} {"train_loss": -7.213529586791992, "global_step": 181344, "epoch": 4317} {"train_loss": -7.125878810882568, "global_step": 181345, "epoch": 4317} {"train_loss": -7.185105800628662, "global_step": 181346, "epoch": 4317} {"train_loss": -7.246746063232422, "global_step": 181347, "epoch": 4317} {"train_loss": -7.1344146728515625, "global_step": 181348, "epoch": 4317} {"train_loss": -7.172724723815918, "global_step": 181349, "epoch": 4317} {"train_loss": -7.105046272277832, "global_step": 181350, "epoch": 4317} {"train_loss": -7.100257396697998, "global_step": 181351, "epoch": 4317} {"train_loss": -7.122640609741211, "global_step": 181352, "epoch": 4317} {"train_loss": -7.18696403503418, "global_step": 181353, "epoch": 4317} {"train_loss": -7.1864728927612305, "global_step": 181354, "epoch": 4317} {"train_loss": -7.13087272644043, "global_step": 181355, "epoch": 4317, "val_loss": 80455.078125} {"train_loss": -7.11741828918457, "global_step": 181356, "epoch": 4318} {"train_loss": -7.087580680847168, "global_step": 181357, "epoch": 4318} {"train_loss": -7.063918113708496, "global_step": 181358, "epoch": 4318} {"train_loss": -7.168342590332031, "global_step": 181359, "epoch": 4318} {"train_loss": -6.911921977996826, "global_step": 181360, "epoch": 4318} {"train_loss": -7.259164810180664, "global_step": 181361, "epoch": 4318} {"train_loss": -7.082474708557129, "global_step": 181362, "epoch": 4318} {"train_loss": -7.07938289642334, "global_step": 181363, "epoch": 4318} {"train_loss": -7.0685224533081055, "global_step": 181364, "epoch": 4318} {"train_loss": -7.058596611022949, "global_step": 181365, "epoch": 4318} {"train_loss": -7.132973670959473, "global_step": 181366, "epoch": 4318} {"train_loss": -7.023745536804199, "global_step": 181367, "epoch": 4318} {"train_loss": -7.31887149810791, "global_step": 181368, "epoch": 4318} {"train_loss": -7.087760925292969, "global_step": 181369, "epoch": 4318} {"train_loss": -7.120906829833984, "global_step": 181370, "epoch": 4318} {"train_loss": -7.2494683265686035, "global_step": 181371, "epoch": 4318} {"train_loss": -7.258123397827148, "global_step": 181372, "epoch": 4318} {"train_loss": -7.106492519378662, "global_step": 181373, "epoch": 4318} {"train_loss": -7.266919136047363, "global_step": 181374, "epoch": 4318} {"train_loss": -7.175511837005615, "global_step": 181375, "epoch": 4318} {"train_loss": -7.047876358032227, "global_step": 181376, "epoch": 4318} {"train_loss": -7.142348766326904, "global_step": 181377, "epoch": 4318} {"train_loss": -7.260209560394287, "global_step": 181378, "epoch": 4318} {"train_loss": -7.153573989868164, "global_step": 181379, "epoch": 4318} {"train_loss": -7.14095401763916, "global_step": 181380, "epoch": 4318} {"train_loss": -7.2685065269470215, "global_step": 181381, "epoch": 4318} {"train_loss": -7.175901412963867, "global_step": 181382, "epoch": 4318} {"train_loss": -7.181678295135498, "global_step": 181383, "epoch": 4318} {"train_loss": -7.258146286010742, "global_step": 181384, "epoch": 4318} {"train_loss": -7.193080425262451, "global_step": 181385, "epoch": 4318} {"train_loss": -7.074498176574707, "global_step": 181386, "epoch": 4318} {"train_loss": -7.135294437408447, "global_step": 181387, "epoch": 4318} {"train_loss": -7.182611465454102, "global_step": 181388, "epoch": 4318} {"train_loss": -7.236894607543945, "global_step": 181389, "epoch": 4318} {"train_loss": -7.233859062194824, "global_step": 181390, "epoch": 4318} {"train_loss": -7.179827690124512, "global_step": 181391, "epoch": 4318} {"train_loss": -7.208857536315918, "global_step": 181392, "epoch": 4318} {"train_loss": -7.24169921875, "global_step": 181393, "epoch": 4318} {"train_loss": -7.235381126403809, "global_step": 181394, "epoch": 4318} {"train_loss": -7.1320600509643555, "global_step": 181395, "epoch": 4318} {"train_loss": -7.11055850982666, "global_step": 181396, "epoch": 4318} {"train_loss": -7.157269262132191, "global_step": 181397, "epoch": 4318, "val_loss": 80459.5625} {"train_loss": -7.138444423675537, "global_step": 181398, "epoch": 4319} {"train_loss": -7.195605278015137, "global_step": 181399, "epoch": 4319} {"train_loss": -7.2822370529174805, "global_step": 181400, "epoch": 4319} {"train_loss": -7.191818714141846, "global_step": 181401, "epoch": 4319} {"train_loss": -7.197220802307129, "global_step": 181402, "epoch": 4319} {"train_loss": -7.220771789550781, "global_step": 181403, "epoch": 4319} {"train_loss": -7.113402366638184, "global_step": 181404, "epoch": 4319} {"train_loss": -7.2230424880981445, "global_step": 181405, "epoch": 4319} {"train_loss": -7.176524639129639, "global_step": 181406, "epoch": 4319} {"train_loss": -6.972017288208008, "global_step": 181407, "epoch": 4319} {"train_loss": -6.969298839569092, "global_step": 181408, "epoch": 4319} {"train_loss": -7.145479202270508, "global_step": 181409, "epoch": 4319} {"train_loss": -7.097211837768555, "global_step": 181410, "epoch": 4319} {"train_loss": -7.100648880004883, "global_step": 181411, "epoch": 4319} {"train_loss": -7.187897682189941, "global_step": 181412, "epoch": 4319} {"train_loss": -7.116973876953125, "global_step": 181413, "epoch": 4319} {"train_loss": -7.015439033508301, "global_step": 181414, "epoch": 4319} {"train_loss": -7.32179069519043, "global_step": 181415, "epoch": 4319} {"train_loss": -7.017076015472412, "global_step": 181416, "epoch": 4319} {"train_loss": -7.115283012390137, "global_step": 181417, "epoch": 4319} {"train_loss": -7.166343688964844, "global_step": 181418, "epoch": 4319} {"train_loss": -6.993634223937988, "global_step": 181419, "epoch": 4319} {"train_loss": -7.264094352722168, "global_step": 181420, "epoch": 4319} {"train_loss": -7.078930377960205, "global_step": 181421, "epoch": 4319} {"train_loss": -7.095408916473389, "global_step": 181422, "epoch": 4319} {"train_loss": -7.166051864624023, "global_step": 181423, "epoch": 4319} {"train_loss": -7.036327362060547, "global_step": 181424, "epoch": 4319} {"train_loss": -7.153536319732666, "global_step": 181425, "epoch": 4319} {"train_loss": -7.1259307861328125, "global_step": 181426, "epoch": 4319} {"train_loss": -7.036230087280273, "global_step": 181427, "epoch": 4319} {"train_loss": -7.1834869384765625, "global_step": 181428, "epoch": 4319} {"train_loss": -7.077474594116211, "global_step": 181429, "epoch": 4319} {"train_loss": -7.226865768432617, "global_step": 181430, "epoch": 4319} {"train_loss": -7.2221479415893555, "global_step": 181431, "epoch": 4319} {"train_loss": -7.185330390930176, "global_step": 181432, "epoch": 4319} {"train_loss": -7.104883193969727, "global_step": 181433, "epoch": 4319} {"train_loss": -7.083500862121582, "global_step": 181434, "epoch": 4319} {"train_loss": -7.285057067871094, "global_step": 181435, "epoch": 4319} {"train_loss": -7.197171688079834, "global_step": 181436, "epoch": 4319} {"train_loss": -7.220391273498535, "global_step": 181437, "epoch": 4319} {"train_loss": -7.1959943771362305, "global_step": 181438, "epoch": 4319} {"train_loss": -7.145127421333676, "global_step": 181439, "epoch": 4319, "val_loss": 80617.0625} {"train_loss": -7.237781047821045, "global_step": 181440, "epoch": 4320} {"train_loss": -7.20436954498291, "global_step": 181441, "epoch": 4320} {"train_loss": -7.306036949157715, "global_step": 181442, "epoch": 4320} {"train_loss": -7.185308933258057, "global_step": 181443, "epoch": 4320} {"train_loss": -7.138428688049316, "global_step": 181444, "epoch": 4320} {"train_loss": -7.160212516784668, "global_step": 181445, "epoch": 4320} {"train_loss": -7.222324848175049, "global_step": 181446, "epoch": 4320} {"train_loss": -7.1462225914001465, "global_step": 181447, "epoch": 4320} {"train_loss": -7.2540364265441895, "global_step": 181448, "epoch": 4320} {"train_loss": -7.219744682312012, "global_step": 181449, "epoch": 4320} {"train_loss": -7.184499740600586, "global_step": 181450, "epoch": 4320} {"train_loss": -7.124112129211426, "global_step": 181451, "epoch": 4320} {"train_loss": -7.12400484085083, "global_step": 181452, "epoch": 4320} {"train_loss": -7.22417688369751, "global_step": 181453, "epoch": 4320} {"train_loss": -7.1850385665893555, "global_step": 181454, "epoch": 4320} {"train_loss": -7.098446846008301, "global_step": 181455, "epoch": 4320} {"train_loss": -7.158487319946289, "global_step": 181456, "epoch": 4320} {"train_loss": -7.139029026031494, "global_step": 181457, "epoch": 4320} {"train_loss": -7.130170822143555, "global_step": 181458, "epoch": 4320} {"train_loss": -7.105107307434082, "global_step": 181459, "epoch": 4320} {"train_loss": -7.191810131072998, "global_step": 181460, "epoch": 4320} {"train_loss": -7.239405155181885, "global_step": 181461, "epoch": 4320} {"train_loss": -7.022177696228027, "global_step": 181462, "epoch": 4320} {"train_loss": -7.096490383148193, "global_step": 181463, "epoch": 4320} {"train_loss": -7.159714698791504, "global_step": 181464, "epoch": 4320} {"train_loss": -7.081051826477051, "global_step": 181465, "epoch": 4320} {"train_loss": -7.0996270179748535, "global_step": 181466, "epoch": 4320} {"train_loss": -7.160005569458008, "global_step": 181467, "epoch": 4320} {"train_loss": -7.148140907287598, "global_step": 181468, "epoch": 4320} {"train_loss": -7.351978778839111, "global_step": 181469, "epoch": 4320} {"train_loss": -7.01021671295166, "global_step": 181470, "epoch": 4320} {"train_loss": -7.1346235275268555, "global_step": 181471, "epoch": 4320} {"train_loss": -7.101680755615234, "global_step": 181472, "epoch": 4320} {"train_loss": -7.167844295501709, "global_step": 181473, "epoch": 4320} {"train_loss": -7.115139961242676, "global_step": 181474, "epoch": 4320} {"train_loss": -7.070586204528809, "global_step": 181475, "epoch": 4320} {"train_loss": -7.115342617034912, "global_step": 181476, "epoch": 4320} {"train_loss": -7.151115894317627, "global_step": 181477, "epoch": 4320} {"train_loss": -7.063990116119385, "global_step": 181478, "epoch": 4320} {"train_loss": -7.072910785675049, "global_step": 181479, "epoch": 4320} {"train_loss": -7.158034324645996, "global_step": 181480, "epoch": 4320} {"train_loss": -7.151396467572167, "global_step": 181481, "epoch": 4320, "val_loss": 80553.953125} {"train_loss": -7.180392265319824, "global_step": 181482, "epoch": 4321} {"train_loss": -7.130354881286621, "global_step": 181483, "epoch": 4321} {"train_loss": -7.148163795471191, "global_step": 181484, "epoch": 4321} {"train_loss": -7.09984016418457, "global_step": 181485, "epoch": 4321} {"train_loss": -7.079678535461426, "global_step": 181486, "epoch": 4321} {"train_loss": -7.156089782714844, "global_step": 181487, "epoch": 4321} {"train_loss": -7.148431777954102, "global_step": 181488, "epoch": 4321} {"train_loss": -7.1290130615234375, "global_step": 181489, "epoch": 4321} {"train_loss": -7.191727161407471, "global_step": 181490, "epoch": 4321} {"train_loss": -7.08732795715332, "global_step": 181491, "epoch": 4321} {"train_loss": -7.237292289733887, "global_step": 181492, "epoch": 4321} {"train_loss": -7.196828365325928, "global_step": 181493, "epoch": 4321} {"train_loss": -7.150979042053223, "global_step": 181494, "epoch": 4321} {"train_loss": -7.202142238616943, "global_step": 181495, "epoch": 4321} {"train_loss": -7.138363361358643, "global_step": 181496, "epoch": 4321} {"train_loss": -7.206838607788086, "global_step": 181497, "epoch": 4321} {"train_loss": -7.115255355834961, "global_step": 181498, "epoch": 4321} {"train_loss": -7.1124067306518555, "global_step": 181499, "epoch": 4321} {"train_loss": -7.154348850250244, "global_step": 181500, "epoch": 4321} {"train_loss": -7.204855918884277, "global_step": 181501, "epoch": 4321} {"train_loss": -7.185423374176025, "global_step": 181502, "epoch": 4321} {"train_loss": -7.169769287109375, "global_step": 181503, "epoch": 4321} {"train_loss": -7.151974678039551, "global_step": 181504, "epoch": 4321} {"train_loss": -7.093014717102051, "global_step": 181505, "epoch": 4321} {"train_loss": -7.204364776611328, "global_step": 181506, "epoch": 4321} {"train_loss": -7.1460466384887695, "global_step": 181507, "epoch": 4321} {"train_loss": -7.194241046905518, "global_step": 181508, "epoch": 4321} {"train_loss": -7.230437278747559, "global_step": 181509, "epoch": 4321} {"train_loss": -7.090965270996094, "global_step": 181510, "epoch": 4321} {"train_loss": -7.184140205383301, "global_step": 181511, "epoch": 4321} {"train_loss": -7.133755207061768, "global_step": 181512, "epoch": 4321} {"train_loss": -7.02346134185791, "global_step": 181513, "epoch": 4321} {"train_loss": -7.082278251647949, "global_step": 181514, "epoch": 4321} {"train_loss": -7.006923198699951, "global_step": 181515, "epoch": 4321} {"train_loss": -7.23253870010376, "global_step": 181516, "epoch": 4321} {"train_loss": -7.142302989959717, "global_step": 181517, "epoch": 4321} {"train_loss": -6.988783836364746, "global_step": 181518, "epoch": 4321} {"train_loss": -7.083866119384766, "global_step": 181519, "epoch": 4321} {"train_loss": -7.123801231384277, "global_step": 181520, "epoch": 4321} {"train_loss": -7.132097244262695, "global_step": 181521, "epoch": 4321} {"train_loss": -7.009779930114746, "global_step": 181522, "epoch": 4321} {"train_loss": -7.138443163463047, "global_step": 181523, "epoch": 4321, "val_loss": 80533.3046875} {"train_loss": -7.12306022644043, "global_step": 181524, "epoch": 4322} {"train_loss": -7.079296112060547, "global_step": 181525, "epoch": 4322} {"train_loss": -7.228296279907227, "global_step": 181526, "epoch": 4322} {"train_loss": -7.116116523742676, "global_step": 181527, "epoch": 4322} {"train_loss": -7.092273712158203, "global_step": 181528, "epoch": 4322} {"train_loss": -7.172468185424805, "global_step": 181529, "epoch": 4322} {"train_loss": -7.158249855041504, "global_step": 181530, "epoch": 4322} {"train_loss": -7.104021072387695, "global_step": 181531, "epoch": 4322} {"train_loss": -7.134526252746582, "global_step": 181532, "epoch": 4322} {"train_loss": -7.090204238891602, "global_step": 181533, "epoch": 4322} {"train_loss": -7.198737144470215, "global_step": 181534, "epoch": 4322} {"train_loss": -7.041504383087158, "global_step": 181535, "epoch": 4322} {"train_loss": -7.2314982414245605, "global_step": 181536, "epoch": 4322} {"train_loss": -7.228884696960449, "global_step": 181537, "epoch": 4322} {"train_loss": -7.15700101852417, "global_step": 181538, "epoch": 4322} {"train_loss": -7.145476341247559, "global_step": 181539, "epoch": 4322} {"train_loss": -7.164634704589844, "global_step": 181540, "epoch": 4322} {"train_loss": -7.255662441253662, "global_step": 181541, "epoch": 4322} {"train_loss": -7.222177028656006, "global_step": 181542, "epoch": 4322} {"train_loss": -7.337166786193848, "global_step": 181543, "epoch": 4322} {"train_loss": -7.209023475646973, "global_step": 181544, "epoch": 4322} {"train_loss": -7.286870956420898, "global_step": 181545, "epoch": 4322} {"train_loss": -7.130518913269043, "global_step": 181546, "epoch": 4322} {"train_loss": -7.181323051452637, "global_step": 181547, "epoch": 4322} {"train_loss": -7.160418510437012, "global_step": 181548, "epoch": 4322} {"train_loss": -7.261398792266846, "global_step": 181549, "epoch": 4322} {"train_loss": -7.12693977355957, "global_step": 181550, "epoch": 4322} {"train_loss": -7.083806991577148, "global_step": 181551, "epoch": 4322} {"train_loss": -7.170670032501221, "global_step": 181552, "epoch": 4322} {"train_loss": -7.062610626220703, "global_step": 181553, "epoch": 4322} {"train_loss": -7.103758811950684, "global_step": 181554, "epoch": 4322} {"train_loss": -7.058210372924805, "global_step": 181555, "epoch": 4322} {"train_loss": -7.273773670196533, "global_step": 181556, "epoch": 4322} {"train_loss": -7.188154220581055, "global_step": 181557, "epoch": 4322} {"train_loss": -7.136528968811035, "global_step": 181558, "epoch": 4322} {"train_loss": -7.116699695587158, "global_step": 181559, "epoch": 4322} {"train_loss": -7.147233009338379, "global_step": 181560, "epoch": 4322} {"train_loss": -7.055797576904297, "global_step": 181561, "epoch": 4322} {"train_loss": -7.150596618652344, "global_step": 181562, "epoch": 4322} {"train_loss": -7.090303421020508, "global_step": 181563, "epoch": 4322} {"train_loss": -7.12131929397583, "global_step": 181564, "epoch": 4322} {"train_loss": -7.152246497926258, "global_step": 181565, "epoch": 4322, "val_loss": 80743.8046875} {"train_loss": -7.186238765716553, "global_step": 181566, "epoch": 4323} {"train_loss": -7.0755615234375, "global_step": 181567, "epoch": 4323} {"train_loss": -7.060153007507324, "global_step": 181568, "epoch": 4323} {"train_loss": -7.1260504722595215, "global_step": 181569, "epoch": 4323} {"train_loss": -7.008130073547363, "global_step": 181570, "epoch": 4323} {"train_loss": -7.059248924255371, "global_step": 181571, "epoch": 4323} {"train_loss": -7.014064788818359, "global_step": 181572, "epoch": 4323} {"train_loss": -6.893341064453125, "global_step": 181573, "epoch": 4323} {"train_loss": -6.977524280548096, "global_step": 181574, "epoch": 4323} {"train_loss": -7.043819427490234, "global_step": 181575, "epoch": 4323} {"train_loss": -6.941226005554199, "global_step": 181576, "epoch": 4323} {"train_loss": -6.922465801239014, "global_step": 181577, "epoch": 4323} {"train_loss": -6.9113593101501465, "global_step": 181578, "epoch": 4323} {"train_loss": -7.00745964050293, "global_step": 181579, "epoch": 4323} {"train_loss": -7.011335372924805, "global_step": 181580, "epoch": 4323} {"train_loss": -7.144195556640625, "global_step": 181581, "epoch": 4323} {"train_loss": -6.91340446472168, "global_step": 181582, "epoch": 4323} {"train_loss": -6.900818824768066, "global_step": 181583, "epoch": 4323} {"train_loss": -6.970719337463379, "global_step": 181584, "epoch": 4323} {"train_loss": -7.019880771636963, "global_step": 181585, "epoch": 4323} {"train_loss": -7.011150360107422, "global_step": 181586, "epoch": 4323} {"train_loss": -7.129654884338379, "global_step": 181587, "epoch": 4323} {"train_loss": -7.043216705322266, "global_step": 181588, "epoch": 4323} {"train_loss": -7.059762001037598, "global_step": 181589, "epoch": 4323} {"train_loss": -7.121922492980957, "global_step": 181590, "epoch": 4323} {"train_loss": -7.012447834014893, "global_step": 181591, "epoch": 4323} {"train_loss": -7.030758857727051, "global_step": 181592, "epoch": 4323} {"train_loss": -6.9487714767456055, "global_step": 181593, "epoch": 4323} {"train_loss": -7.076699256896973, "global_step": 181594, "epoch": 4323} {"train_loss": -7.133358955383301, "global_step": 181595, "epoch": 4323} {"train_loss": -7.089745044708252, "global_step": 181596, "epoch": 4323} {"train_loss": -7.078889846801758, "global_step": 181597, "epoch": 4323} {"train_loss": -7.142688751220703, "global_step": 181598, "epoch": 4323} {"train_loss": -7.08839750289917, "global_step": 181599, "epoch": 4323} {"train_loss": -7.017180442810059, "global_step": 181600, "epoch": 4323} {"train_loss": -7.204501628875732, "global_step": 181601, "epoch": 4323} {"train_loss": -7.153008460998535, "global_step": 181602, "epoch": 4323} {"train_loss": -7.075963973999023, "global_step": 181603, "epoch": 4323} {"train_loss": -7.140015602111816, "global_step": 181604, "epoch": 4323} {"train_loss": -7.096733093261719, "global_step": 181605, "epoch": 4323} {"train_loss": -7.234857559204102, "global_step": 181606, "epoch": 4323} {"train_loss": -7.052344310851324, "global_step": 181607, "epoch": 4323, "val_loss": 80499.6015625} {"train_loss": -7.060239315032959, "global_step": 181608, "epoch": 4324} {"train_loss": -7.191110610961914, "global_step": 181609, "epoch": 4324} {"train_loss": -7.188097953796387, "global_step": 181610, "epoch": 4324} {"train_loss": -7.200553894042969, "global_step": 181611, "epoch": 4324} {"train_loss": -7.157679557800293, "global_step": 181612, "epoch": 4324} {"train_loss": -7.25342321395874, "global_step": 181613, "epoch": 4324} {"train_loss": -7.192265033721924, "global_step": 181614, "epoch": 4324} {"train_loss": -7.020001411437988, "global_step": 181615, "epoch": 4324} {"train_loss": -7.217803955078125, "global_step": 181616, "epoch": 4324} {"train_loss": -7.170503616333008, "global_step": 181617, "epoch": 4324} {"train_loss": -7.29016637802124, "global_step": 181618, "epoch": 4324} {"train_loss": -7.25545072555542, "global_step": 181619, "epoch": 4324} {"train_loss": -7.226375579833984, "global_step": 181620, "epoch": 4324} {"train_loss": -7.241182327270508, "global_step": 181621, "epoch": 4324} {"train_loss": -7.104294776916504, "global_step": 181622, "epoch": 4324} {"train_loss": -7.2096757888793945, "global_step": 181623, "epoch": 4324} {"train_loss": -7.221625328063965, "global_step": 181624, "epoch": 4324} {"train_loss": -7.126270294189453, "global_step": 181625, "epoch": 4324} {"train_loss": -7.149889945983887, "global_step": 181626, "epoch": 4324} {"train_loss": -7.213565826416016, "global_step": 181627, "epoch": 4324} {"train_loss": -7.250135898590088, "global_step": 181628, "epoch": 4324} {"train_loss": -7.223705768585205, "global_step": 181629, "epoch": 4324} {"train_loss": -7.117710113525391, "global_step": 181630, "epoch": 4324} {"train_loss": -7.3636088371276855, "global_step": 181631, "epoch": 4324} {"train_loss": -7.258065223693848, "global_step": 181632, "epoch": 4324} {"train_loss": -7.097173690795898, "global_step": 181633, "epoch": 4324} {"train_loss": -7.060060501098633, "global_step": 181634, "epoch": 4324} {"train_loss": -7.17014741897583, "global_step": 181635, "epoch": 4324} {"train_loss": -7.128066062927246, "global_step": 181636, "epoch": 4324} {"train_loss": -7.151883602142334, "global_step": 181637, "epoch": 4324} {"train_loss": -7.2534685134887695, "global_step": 181638, "epoch": 4324} {"train_loss": -7.194100379943848, "global_step": 181639, "epoch": 4324} {"train_loss": -7.185385227203369, "global_step": 181640, "epoch": 4324} {"train_loss": -7.230833053588867, "global_step": 181641, "epoch": 4324} {"train_loss": -7.154841423034668, "global_step": 181642, "epoch": 4324} {"train_loss": -7.197115421295166, "global_step": 181643, "epoch": 4324} {"train_loss": -7.037908554077148, "global_step": 181644, "epoch": 4324} {"train_loss": -7.1680474281311035, "global_step": 181645, "epoch": 4324} {"train_loss": -7.073535442352295, "global_step": 181646, "epoch": 4324} {"train_loss": -7.054150581359863, "global_step": 181647, "epoch": 4324} {"train_loss": -7.170804023742676, "global_step": 181648, "epoch": 4324} {"train_loss": -7.1757154691787, "global_step": 181649, "epoch": 4324, "val_loss": 80549.515625} {"train_loss": -7.171932220458984, "global_step": 181650, "epoch": 4325} {"train_loss": -7.204882621765137, "global_step": 181651, "epoch": 4325} {"train_loss": -7.158425331115723, "global_step": 181652, "epoch": 4325} {"train_loss": -7.194746971130371, "global_step": 181653, "epoch": 4325} {"train_loss": -7.101909160614014, "global_step": 181654, "epoch": 4325} {"train_loss": -7.191155910491943, "global_step": 181655, "epoch": 4325} {"train_loss": -7.107229232788086, "global_step": 181656, "epoch": 4325} {"train_loss": -7.204722881317139, "global_step": 181657, "epoch": 4325} {"train_loss": -7.126857757568359, "global_step": 181658, "epoch": 4325} {"train_loss": -7.223203182220459, "global_step": 181659, "epoch": 4325} {"train_loss": -7.097733974456787, "global_step": 181660, "epoch": 4325} {"train_loss": -7.221296310424805, "global_step": 181661, "epoch": 4325} {"train_loss": -7.223546981811523, "global_step": 181662, "epoch": 4325} {"train_loss": -7.080772876739502, "global_step": 181663, "epoch": 4325} {"train_loss": -7.184772491455078, "global_step": 181664, "epoch": 4325} {"train_loss": -7.1659626960754395, "global_step": 181665, "epoch": 4325} {"train_loss": -7.172966957092285, "global_step": 181666, "epoch": 4325} {"train_loss": -7.151518821716309, "global_step": 181667, "epoch": 4325} {"train_loss": -7.230902671813965, "global_step": 181668, "epoch": 4325} {"train_loss": -7.204008102416992, "global_step": 181669, "epoch": 4325} {"train_loss": -7.108643531799316, "global_step": 181670, "epoch": 4325} {"train_loss": -7.243981838226318, "global_step": 181671, "epoch": 4325} {"train_loss": -7.138399600982666, "global_step": 181672, "epoch": 4325} {"train_loss": -7.1756815910339355, "global_step": 181673, "epoch": 4325} {"train_loss": -7.015507698059082, "global_step": 181674, "epoch": 4325} {"train_loss": -7.149420261383057, "global_step": 181675, "epoch": 4325} {"train_loss": -7.07649040222168, "global_step": 181676, "epoch": 4325} {"train_loss": -7.0659565925598145, "global_step": 181677, "epoch": 4325} {"train_loss": -7.294973373413086, "global_step": 181678, "epoch": 4325} {"train_loss": -7.070078372955322, "global_step": 181679, "epoch": 4325} {"train_loss": -7.124199867248535, "global_step": 181680, "epoch": 4325} {"train_loss": -7.058271408081055, "global_step": 181681, "epoch": 4325} {"train_loss": -7.056900978088379, "global_step": 181682, "epoch": 4325} {"train_loss": -7.082552433013916, "global_step": 181683, "epoch": 4325} {"train_loss": -7.02447509765625, "global_step": 181684, "epoch": 4325} {"train_loss": -7.195173740386963, "global_step": 181685, "epoch": 4325} {"train_loss": -7.116809844970703, "global_step": 181686, "epoch": 4325} {"train_loss": -7.007009506225586, "global_step": 181687, "epoch": 4325} {"train_loss": -7.124756813049316, "global_step": 181688, "epoch": 4325} {"train_loss": -7.098906517028809, "global_step": 181689, "epoch": 4325} {"train_loss": -7.055804252624512, "global_step": 181690, "epoch": 4325} {"train_loss": -7.135975996653239, "global_step": 181691, "epoch": 4325, "val_loss": 80583.0} {"train_loss": -6.939064025878906, "global_step": 181692, "epoch": 4326} {"train_loss": -7.033474445343018, "global_step": 181693, "epoch": 4326} {"train_loss": -7.165027141571045, "global_step": 181694, "epoch": 4326} {"train_loss": -7.092884063720703, "global_step": 181695, "epoch": 4326} {"train_loss": -7.0621337890625, "global_step": 181696, "epoch": 4326} {"train_loss": -7.02232027053833, "global_step": 181697, "epoch": 4326} {"train_loss": -7.112628936767578, "global_step": 181698, "epoch": 4326} {"train_loss": -7.083259582519531, "global_step": 181699, "epoch": 4326} {"train_loss": -7.121553897857666, "global_step": 181700, "epoch": 4326} {"train_loss": -7.180598735809326, "global_step": 181701, "epoch": 4326} {"train_loss": -7.1521806716918945, "global_step": 181702, "epoch": 4326} {"train_loss": -7.166353225708008, "global_step": 181703, "epoch": 4326} {"train_loss": -7.120718002319336, "global_step": 181704, "epoch": 4326} {"train_loss": -7.260123252868652, "global_step": 181705, "epoch": 4326} {"train_loss": -7.167120933532715, "global_step": 181706, "epoch": 4326} {"train_loss": -7.131385803222656, "global_step": 181707, "epoch": 4326} {"train_loss": -7.206038475036621, "global_step": 181708, "epoch": 4326} {"train_loss": -7.233416557312012, "global_step": 181709, "epoch": 4326} {"train_loss": -7.151841163635254, "global_step": 181710, "epoch": 4326} {"train_loss": -7.161234378814697, "global_step": 181711, "epoch": 4326} {"train_loss": -7.128870010375977, "global_step": 181712, "epoch": 4326} {"train_loss": -7.2225494384765625, "global_step": 181713, "epoch": 4326} {"train_loss": -7.201839923858643, "global_step": 181714, "epoch": 4326} {"train_loss": -7.1564531326293945, "global_step": 181715, "epoch": 4326} {"train_loss": -7.174445629119873, "global_step": 181716, "epoch": 4326} {"train_loss": -7.1969146728515625, "global_step": 181717, "epoch": 4326} {"train_loss": -7.075465202331543, "global_step": 181718, "epoch": 4326} {"train_loss": -7.220146656036377, "global_step": 181719, "epoch": 4326} {"train_loss": -7.132279872894287, "global_step": 181720, "epoch": 4326} {"train_loss": -7.24563455581665, "global_step": 181721, "epoch": 4326} {"train_loss": -7.191256999969482, "global_step": 181722, "epoch": 4326} {"train_loss": -7.226683139801025, "global_step": 181723, "epoch": 4326} {"train_loss": -7.226675033569336, "global_step": 181724, "epoch": 4326} {"train_loss": -7.152846336364746, "global_step": 181725, "epoch": 4326} {"train_loss": -7.190503120422363, "global_step": 181726, "epoch": 4326} {"train_loss": -7.183446884155273, "global_step": 181727, "epoch": 4326} {"train_loss": -7.231887340545654, "global_step": 181728, "epoch": 4326} {"train_loss": -7.1881914138793945, "global_step": 181729, "epoch": 4326} {"train_loss": -6.978362560272217, "global_step": 181730, "epoch": 4326} {"train_loss": -7.138797760009766, "global_step": 181731, "epoch": 4326} {"train_loss": -7.161698341369629, "global_step": 181732, "epoch": 4326} {"train_loss": -7.146442504156203, "global_step": 181733, "epoch": 4326, "val_loss": 80526.375} {"train_loss": -7.117124080657959, "global_step": 181734, "epoch": 4327} {"train_loss": -7.205472946166992, "global_step": 181735, "epoch": 4327} {"train_loss": -6.893847465515137, "global_step": 181736, "epoch": 4327} {"train_loss": -7.144712924957275, "global_step": 181737, "epoch": 4327} {"train_loss": -7.120306015014648, "global_step": 181738, "epoch": 4327} {"train_loss": -6.895477294921875, "global_step": 181739, "epoch": 4327} {"train_loss": -7.217011451721191, "global_step": 181740, "epoch": 4327} {"train_loss": -6.976652145385742, "global_step": 181741, "epoch": 4327} {"train_loss": -7.184144020080566, "global_step": 181742, "epoch": 4327} {"train_loss": -6.952131748199463, "global_step": 181743, "epoch": 4327} {"train_loss": -6.958922386169434, "global_step": 181744, "epoch": 4327} {"train_loss": -7.090450763702393, "global_step": 181745, "epoch": 4327} {"train_loss": -7.021583080291748, "global_step": 181746, "epoch": 4327} {"train_loss": -7.217698097229004, "global_step": 181747, "epoch": 4327} {"train_loss": -6.992159843444824, "global_step": 181748, "epoch": 4327} {"train_loss": -7.158993721008301, "global_step": 181749, "epoch": 4327} {"train_loss": -6.982585906982422, "global_step": 181750, "epoch": 4327} {"train_loss": -7.065412521362305, "global_step": 181751, "epoch": 4327} {"train_loss": -7.035397529602051, "global_step": 181752, "epoch": 4327} {"train_loss": -7.082489013671875, "global_step": 181753, "epoch": 4327} {"train_loss": -7.093960762023926, "global_step": 181754, "epoch": 4327} {"train_loss": -7.211326599121094, "global_step": 181755, "epoch": 4327} {"train_loss": -7.090953826904297, "global_step": 181756, "epoch": 4327} {"train_loss": -7.046513080596924, "global_step": 181757, "epoch": 4327} {"train_loss": -7.157854080200195, "global_step": 181758, "epoch": 4327} {"train_loss": -7.132047653198242, "global_step": 181759, "epoch": 4327} {"train_loss": -7.042254447937012, "global_step": 181760, "epoch": 4327} {"train_loss": -6.951345443725586, "global_step": 181761, "epoch": 4327} {"train_loss": -7.093855381011963, "global_step": 181762, "epoch": 4327} {"train_loss": -7.21487283706665, "global_step": 181763, "epoch": 4327} {"train_loss": -6.995506763458252, "global_step": 181764, "epoch": 4327} {"train_loss": -6.981751441955566, "global_step": 181765, "epoch": 4327} {"train_loss": -7.133685111999512, "global_step": 181766, "epoch": 4327} {"train_loss": -7.070003032684326, "global_step": 181767, "epoch": 4327} {"train_loss": -7.140505790710449, "global_step": 181768, "epoch": 4327} {"train_loss": -7.111957550048828, "global_step": 181769, "epoch": 4327} {"train_loss": -7.043357849121094, "global_step": 181770, "epoch": 4327} {"train_loss": -6.994114398956299, "global_step": 181771, "epoch": 4327} {"train_loss": -7.121120452880859, "global_step": 181772, "epoch": 4327} {"train_loss": -7.044297218322754, "global_step": 181773, "epoch": 4327} {"train_loss": -7.133790969848633, "global_step": 181774, "epoch": 4327} {"train_loss": -7.07721437726702, "global_step": 181775, "epoch": 4327, "val_loss": 80570.1328125} {"train_loss": -6.934109687805176, "global_step": 181776, "epoch": 4328} {"train_loss": -7.079954624176025, "global_step": 181777, "epoch": 4328} {"train_loss": -7.028514385223389, "global_step": 181778, "epoch": 4328} {"train_loss": -7.156915664672852, "global_step": 181779, "epoch": 4328} {"train_loss": -7.185940742492676, "global_step": 181780, "epoch": 4328} {"train_loss": -7.110238552093506, "global_step": 181781, "epoch": 4328} {"train_loss": -7.130796432495117, "global_step": 181782, "epoch": 4328} {"train_loss": -7.032737731933594, "global_step": 181783, "epoch": 4328} {"train_loss": -7.235198497772217, "global_step": 181784, "epoch": 4328} {"train_loss": -7.064164161682129, "global_step": 181785, "epoch": 4328} {"train_loss": -7.184028148651123, "global_step": 181786, "epoch": 4328} {"train_loss": -7.202793121337891, "global_step": 181787, "epoch": 4328} {"train_loss": -7.006801605224609, "global_step": 181788, "epoch": 4328} {"train_loss": -7.085244178771973, "global_step": 181789, "epoch": 4328} {"train_loss": -7.01555061340332, "global_step": 181790, "epoch": 4328} {"train_loss": -7.217325210571289, "global_step": 181791, "epoch": 4328} {"train_loss": -6.99884557723999, "global_step": 181792, "epoch": 4328} {"train_loss": -7.168201923370361, "global_step": 181793, "epoch": 4328} {"train_loss": -7.035111427307129, "global_step": 181794, "epoch": 4328} {"train_loss": -7.117682456970215, "global_step": 181795, "epoch": 4328} {"train_loss": -7.043456077575684, "global_step": 181796, "epoch": 4328} {"train_loss": -7.097476005554199, "global_step": 181797, "epoch": 4328} {"train_loss": -7.025534629821777, "global_step": 181798, "epoch": 4328} {"train_loss": -7.2081146240234375, "global_step": 181799, "epoch": 4328} {"train_loss": -7.220668315887451, "global_step": 181800, "epoch": 4328} {"train_loss": -7.036210536956787, "global_step": 181801, "epoch": 4328} {"train_loss": -7.1142120361328125, "global_step": 181802, "epoch": 4328} {"train_loss": -6.999835968017578, "global_step": 181803, "epoch": 4328} {"train_loss": -7.165787696838379, "global_step": 181804, "epoch": 4328} {"train_loss": -7.0746307373046875, "global_step": 181805, "epoch": 4328} {"train_loss": -7.080102920532227, "global_step": 181806, "epoch": 4328} {"train_loss": -7.072616100311279, "global_step": 181807, "epoch": 4328} {"train_loss": -7.111617088317871, "global_step": 181808, "epoch": 4328} {"train_loss": -7.076834678649902, "global_step": 181809, "epoch": 4328} {"train_loss": -6.9553022384643555, "global_step": 181810, "epoch": 4328} {"train_loss": -7.132030487060547, "global_step": 181811, "epoch": 4328} {"train_loss": -7.049455165863037, "global_step": 181812, "epoch": 4328} {"train_loss": -7.166787147521973, "global_step": 181813, "epoch": 4328} {"train_loss": -7.142696380615234, "global_step": 181814, "epoch": 4328} {"train_loss": -7.232175827026367, "global_step": 181815, "epoch": 4328} {"train_loss": -7.176631927490234, "global_step": 181816, "epoch": 4328} {"train_loss": -7.1019944576990035, "global_step": 181817, "epoch": 4328, "val_loss": 80404.453125} {"train_loss": -7.237799167633057, "global_step": 181818, "epoch": 4329} {"train_loss": -7.131777286529541, "global_step": 181819, "epoch": 4329} {"train_loss": -7.145770072937012, "global_step": 181820, "epoch": 4329} {"train_loss": -7.261662006378174, "global_step": 181821, "epoch": 4329} {"train_loss": -7.1827850341796875, "global_step": 181822, "epoch": 4329} {"train_loss": -7.309807777404785, "global_step": 181823, "epoch": 4329} {"train_loss": -7.135384559631348, "global_step": 181824, "epoch": 4329} {"train_loss": -7.206153869628906, "global_step": 181825, "epoch": 4329} {"train_loss": -7.06491756439209, "global_step": 181826, "epoch": 4329} {"train_loss": -7.107089042663574, "global_step": 181827, "epoch": 4329} {"train_loss": -7.13443660736084, "global_step": 181828, "epoch": 4329} {"train_loss": -6.967536926269531, "global_step": 181829, "epoch": 4329} {"train_loss": -6.999191761016846, "global_step": 181830, "epoch": 4329} {"train_loss": -7.292001247406006, "global_step": 181831, "epoch": 4329} {"train_loss": -7.189580917358398, "global_step": 181832, "epoch": 4329} {"train_loss": -7.131255149841309, "global_step": 181833, "epoch": 4329} {"train_loss": -7.108189582824707, "global_step": 181834, "epoch": 4329} {"train_loss": -7.177186012268066, "global_step": 181835, "epoch": 4329} {"train_loss": -7.258297920227051, "global_step": 181836, "epoch": 4329} {"train_loss": -7.257213592529297, "global_step": 181837, "epoch": 4329} {"train_loss": -7.12807559967041, "global_step": 181838, "epoch": 4329} {"train_loss": -7.099839210510254, "global_step": 181839, "epoch": 4329} {"train_loss": -7.218891620635986, "global_step": 181840, "epoch": 4329} {"train_loss": -7.207073211669922, "global_step": 181841, "epoch": 4329} {"train_loss": -7.180747985839844, "global_step": 181842, "epoch": 4329} {"train_loss": -7.216681003570557, "global_step": 181843, "epoch": 4329} {"train_loss": -7.111457347869873, "global_step": 181844, "epoch": 4329} {"train_loss": -7.191091537475586, "global_step": 181845, "epoch": 4329} {"train_loss": -7.15247917175293, "global_step": 181846, "epoch": 4329} {"train_loss": -7.194960117340088, "global_step": 181847, "epoch": 4329} {"train_loss": -7.1831817626953125, "global_step": 181848, "epoch": 4329} {"train_loss": -7.0835676193237305, "global_step": 181849, "epoch": 4329} {"train_loss": -7.11326789855957, "global_step": 181850, "epoch": 4329} {"train_loss": -7.266574382781982, "global_step": 181851, "epoch": 4329} {"train_loss": -7.180515766143799, "global_step": 181852, "epoch": 4329} {"train_loss": -7.2448225021362305, "global_step": 181853, "epoch": 4329} {"train_loss": -7.204493045806885, "global_step": 181854, "epoch": 4329} {"train_loss": -7.199782371520996, "global_step": 181855, "epoch": 4329} {"train_loss": -7.152738094329834, "global_step": 181856, "epoch": 4329} {"train_loss": -7.191310882568359, "global_step": 181857, "epoch": 4329} {"train_loss": -6.985469818115234, "global_step": 181858, "epoch": 4329} {"train_loss": -7.161279769170852, "global_step": 181859, "epoch": 4329, "val_loss": 80641.3203125} {"train_loss": -7.133304119110107, "global_step": 181860, "epoch": 4330} {"train_loss": -6.949950695037842, "global_step": 181861, "epoch": 4330} {"train_loss": -7.131450653076172, "global_step": 181862, "epoch": 4330} {"train_loss": -7.185137748718262, "global_step": 181863, "epoch": 4330} {"train_loss": -7.094660758972168, "global_step": 181864, "epoch": 4330} {"train_loss": -7.172362327575684, "global_step": 181865, "epoch": 4330} {"train_loss": -7.123108863830566, "global_step": 181866, "epoch": 4330} {"train_loss": -7.082181453704834, "global_step": 181867, "epoch": 4330} {"train_loss": -7.085018157958984, "global_step": 181868, "epoch": 4330} {"train_loss": -7.16328239440918, "global_step": 181869, "epoch": 4330} {"train_loss": -7.151571273803711, "global_step": 181870, "epoch": 4330} {"train_loss": -7.121405601501465, "global_step": 181871, "epoch": 4330} {"train_loss": -7.081863880157471, "global_step": 181872, "epoch": 4330} {"train_loss": -7.105738162994385, "global_step": 181873, "epoch": 4330} {"train_loss": -7.117620944976807, "global_step": 181874, "epoch": 4330} {"train_loss": -7.029965400695801, "global_step": 181875, "epoch": 4330} {"train_loss": -7.147902488708496, "global_step": 181876, "epoch": 4330} {"train_loss": -7.085467338562012, "global_step": 181877, "epoch": 4330} {"train_loss": -7.031500816345215, "global_step": 181878, "epoch": 4330} {"train_loss": -7.164779186248779, "global_step": 181879, "epoch": 4330} {"train_loss": -7.033707141876221, "global_step": 181880, "epoch": 4330} {"train_loss": -7.073549270629883, "global_step": 181881, "epoch": 4330} {"train_loss": -7.0905561447143555, "global_step": 181882, "epoch": 4330} {"train_loss": -7.153460502624512, "global_step": 181883, "epoch": 4330} {"train_loss": -7.128432750701904, "global_step": 181884, "epoch": 4330} {"train_loss": -7.020479202270508, "global_step": 181885, "epoch": 4330} {"train_loss": -7.135806560516357, "global_step": 181886, "epoch": 4330} {"train_loss": -7.23772668838501, "global_step": 181887, "epoch": 4330} {"train_loss": -7.055263042449951, "global_step": 181888, "epoch": 4330} {"train_loss": -7.187312602996826, "global_step": 181889, "epoch": 4330} {"train_loss": -7.114285945892334, "global_step": 181890, "epoch": 4330} {"train_loss": -7.188051700592041, "global_step": 181891, "epoch": 4330} {"train_loss": -7.176643371582031, "global_step": 181892, "epoch": 4330} {"train_loss": -7.144176483154297, "global_step": 181893, "epoch": 4330} {"train_loss": -7.202430725097656, "global_step": 181894, "epoch": 4330} {"train_loss": -7.053830146789551, "global_step": 181895, "epoch": 4330} {"train_loss": -7.124815940856934, "global_step": 181896, "epoch": 4330} {"train_loss": -7.214358329772949, "global_step": 181897, "epoch": 4330} {"train_loss": -7.123291015625, "global_step": 181898, "epoch": 4330} {"train_loss": -7.050896644592285, "global_step": 181899, "epoch": 4330} {"train_loss": -7.157949447631836, "global_step": 181900, "epoch": 4330} {"train_loss": -7.118280740011306, "global_step": 181901, "epoch": 4330, "val_loss": 80605.359375} {"train_loss": -7.243225574493408, "global_step": 181902, "epoch": 4331} {"train_loss": -7.189125061035156, "global_step": 181903, "epoch": 4331} {"train_loss": -7.093743801116943, "global_step": 181904, "epoch": 4331} {"train_loss": -7.1925811767578125, "global_step": 181905, "epoch": 4331} {"train_loss": -7.165454387664795, "global_step": 181906, "epoch": 4331} {"train_loss": -7.206789016723633, "global_step": 181907, "epoch": 4331} {"train_loss": -7.1316914558410645, "global_step": 181908, "epoch": 4331} {"train_loss": -7.259574890136719, "global_step": 181909, "epoch": 4331} {"train_loss": -7.20327091217041, "global_step": 181910, "epoch": 4331} {"train_loss": -7.039550304412842, "global_step": 181911, "epoch": 4331} {"train_loss": -7.156778335571289, "global_step": 181912, "epoch": 4331} {"train_loss": -7.022774696350098, "global_step": 181913, "epoch": 4331} {"train_loss": -7.194300651550293, "global_step": 181914, "epoch": 4331} {"train_loss": -7.1868815422058105, "global_step": 181915, "epoch": 4331} {"train_loss": -7.058969974517822, "global_step": 181916, "epoch": 4331} {"train_loss": -7.079307556152344, "global_step": 181917, "epoch": 4331} {"train_loss": -7.152554512023926, "global_step": 181918, "epoch": 4331} {"train_loss": -7.060805320739746, "global_step": 181919, "epoch": 4331} {"train_loss": -7.052886962890625, "global_step": 181920, "epoch": 4331} {"train_loss": -7.138609886169434, "global_step": 181921, "epoch": 4331} {"train_loss": -7.209421157836914, "global_step": 181922, "epoch": 4331} {"train_loss": -7.127119541168213, "global_step": 181923, "epoch": 4331} {"train_loss": -7.124449253082275, "global_step": 181924, "epoch": 4331} {"train_loss": -7.1209306716918945, "global_step": 181925, "epoch": 4331} {"train_loss": -6.916231632232666, "global_step": 181926, "epoch": 4331} {"train_loss": -7.1211137771606445, "global_step": 181927, "epoch": 4331} {"train_loss": -6.863398551940918, "global_step": 181928, "epoch": 4331} {"train_loss": -6.931227684020996, "global_step": 181929, "epoch": 4331} {"train_loss": -7.090066432952881, "global_step": 181930, "epoch": 4331} {"train_loss": -6.782146453857422, "global_step": 181931, "epoch": 4331} {"train_loss": -7.155810832977295, "global_step": 181932, "epoch": 4331} {"train_loss": -6.977226257324219, "global_step": 181933, "epoch": 4331} {"train_loss": -7.14031982421875, "global_step": 181934, "epoch": 4331} {"train_loss": -7.11355447769165, "global_step": 181935, "epoch": 4331} {"train_loss": -7.112490177154541, "global_step": 181936, "epoch": 4331} {"train_loss": -7.153597354888916, "global_step": 181937, "epoch": 4331} {"train_loss": -7.039503574371338, "global_step": 181938, "epoch": 4331} {"train_loss": -7.195914268493652, "global_step": 181939, "epoch": 4331} {"train_loss": -7.113560676574707, "global_step": 181940, "epoch": 4331} {"train_loss": -7.114963531494141, "global_step": 181941, "epoch": 4331} {"train_loss": -7.108382225036621, "global_step": 181942, "epoch": 4331} {"train_loss": -7.107430968965803, "global_step": 181943, "epoch": 4331, "val_loss": 80641.890625} {"train_loss": -7.153561592102051, "global_step": 181944, "epoch": 4332} {"train_loss": -7.177141189575195, "global_step": 181945, "epoch": 4332} {"train_loss": -7.133853912353516, "global_step": 181946, "epoch": 4332} {"train_loss": -7.039813041687012, "global_step": 181947, "epoch": 4332} {"train_loss": -7.230392932891846, "global_step": 181948, "epoch": 4332} {"train_loss": -7.1204681396484375, "global_step": 181949, "epoch": 4332} {"train_loss": -7.154810905456543, "global_step": 181950, "epoch": 4332} {"train_loss": -7.217848777770996, "global_step": 181951, "epoch": 4332} {"train_loss": -7.173009872436523, "global_step": 181952, "epoch": 4332} {"train_loss": -7.218596458435059, "global_step": 181953, "epoch": 4332} {"train_loss": -7.282535076141357, "global_step": 181954, "epoch": 4332} {"train_loss": -7.113458633422852, "global_step": 181955, "epoch": 4332} {"train_loss": -7.237003326416016, "global_step": 181956, "epoch": 4332} {"train_loss": -7.1975789070129395, "global_step": 181957, "epoch": 4332} {"train_loss": -7.057745933532715, "global_step": 181958, "epoch": 4332} {"train_loss": -7.221795558929443, "global_step": 181959, "epoch": 4332} {"train_loss": -7.207047462463379, "global_step": 181960, "epoch": 4332} {"train_loss": -7.1526947021484375, "global_step": 181961, "epoch": 4332} {"train_loss": -7.196884632110596, "global_step": 181962, "epoch": 4332} {"train_loss": -7.174285888671875, "global_step": 181963, "epoch": 4332} {"train_loss": -7.172419548034668, "global_step": 181964, "epoch": 4332} {"train_loss": -7.210136413574219, "global_step": 181965, "epoch": 4332} {"train_loss": -7.14228630065918, "global_step": 181966, "epoch": 4332} {"train_loss": -7.254743576049805, "global_step": 181967, "epoch": 4332} {"train_loss": -7.311473846435547, "global_step": 181968, "epoch": 4332} {"train_loss": -7.271914958953857, "global_step": 181969, "epoch": 4332} {"train_loss": -7.175729751586914, "global_step": 181970, "epoch": 4332} {"train_loss": -7.089503765106201, "global_step": 181971, "epoch": 4332} {"train_loss": -7.096542835235596, "global_step": 181972, "epoch": 4332} {"train_loss": -7.228841781616211, "global_step": 181973, "epoch": 4332} {"train_loss": -7.089203357696533, "global_step": 181974, "epoch": 4332} {"train_loss": -7.086056709289551, "global_step": 181975, "epoch": 4332} {"train_loss": -7.024383544921875, "global_step": 181976, "epoch": 4332} {"train_loss": -6.973732948303223, "global_step": 181977, "epoch": 4332} {"train_loss": -7.182778358459473, "global_step": 181978, "epoch": 4332} {"train_loss": -7.059750556945801, "global_step": 181979, "epoch": 4332} {"train_loss": -7.06108283996582, "global_step": 181980, "epoch": 4332} {"train_loss": -7.225639343261719, "global_step": 181981, "epoch": 4332} {"train_loss": -7.078237533569336, "global_step": 181982, "epoch": 4332} {"train_loss": -7.021735191345215, "global_step": 181983, "epoch": 4332} {"train_loss": -7.049671649932861, "global_step": 181984, "epoch": 4332} {"train_loss": -7.153606766746158, "global_step": 181985, "epoch": 4332, "val_loss": 80969.609375} {"train_loss": -7.024921417236328, "global_step": 181986, "epoch": 4333} {"train_loss": -7.183651924133301, "global_step": 181987, "epoch": 4333} {"train_loss": -6.950358867645264, "global_step": 181988, "epoch": 4333} {"train_loss": -7.011723041534424, "global_step": 181989, "epoch": 4333} {"train_loss": -7.111340522766113, "global_step": 181990, "epoch": 4333} {"train_loss": -7.07835578918457, "global_step": 181991, "epoch": 4333} {"train_loss": -7.178761959075928, "global_step": 181992, "epoch": 4333} {"train_loss": -7.111645698547363, "global_step": 181993, "epoch": 4333} {"train_loss": -7.051704406738281, "global_step": 181994, "epoch": 4333} {"train_loss": -7.034653663635254, "global_step": 181995, "epoch": 4333} {"train_loss": -7.066206932067871, "global_step": 181996, "epoch": 4333} {"train_loss": -7.131333351135254, "global_step": 181997, "epoch": 4333} {"train_loss": -7.079050064086914, "global_step": 181998, "epoch": 4333} {"train_loss": -7.10288143157959, "global_step": 181999, "epoch": 4333} {"train_loss": -7.049386501312256, "global_step": 182000, "epoch": 4333} {"train_loss": -7.110274314880371, "global_step": 182001, "epoch": 4333} {"train_loss": -7.185695171356201, "global_step": 182002, "epoch": 4333} {"train_loss": -7.080618858337402, "global_step": 182003, "epoch": 4333} {"train_loss": -7.098845481872559, "global_step": 182004, "epoch": 4333} {"train_loss": -7.119332313537598, "global_step": 182005, "epoch": 4333} {"train_loss": -7.081071853637695, "global_step": 182006, "epoch": 4333} {"train_loss": -7.122801780700684, "global_step": 182007, "epoch": 4333} {"train_loss": -7.194948673248291, "global_step": 182008, "epoch": 4333} {"train_loss": -7.107804775238037, "global_step": 182009, "epoch": 4333} {"train_loss": -7.148224830627441, "global_step": 182010, "epoch": 4333} {"train_loss": -7.10629940032959, "global_step": 182011, "epoch": 4333} {"train_loss": -7.10711669921875, "global_step": 182012, "epoch": 4333} {"train_loss": -7.1412177085876465, "global_step": 182013, "epoch": 4333} {"train_loss": -7.230008125305176, "global_step": 182014, "epoch": 4333} {"train_loss": -7.127596855163574, "global_step": 182015, "epoch": 4333} {"train_loss": -7.088188648223877, "global_step": 182016, "epoch": 4333} {"train_loss": -7.176764488220215, "global_step": 182017, "epoch": 4333} {"train_loss": -7.077143669128418, "global_step": 182018, "epoch": 4333} {"train_loss": -7.098624229431152, "global_step": 182019, "epoch": 4333} {"train_loss": -7.152771949768066, "global_step": 182020, "epoch": 4333} {"train_loss": -7.199348449707031, "global_step": 182021, "epoch": 4333} {"train_loss": -7.2165913581848145, "global_step": 182022, "epoch": 4333} {"train_loss": -7.1670684814453125, "global_step": 182023, "epoch": 4333} {"train_loss": -7.230592727661133, "global_step": 182024, "epoch": 4333} {"train_loss": -7.228795528411865, "global_step": 182025, "epoch": 4333} {"train_loss": -7.22939395904541, "global_step": 182026, "epoch": 4333} {"train_loss": -7.123510247185116, "global_step": 182027, "epoch": 4333, "val_loss": 80549.078125} {"train_loss": -7.302073001861572, "global_step": 182028, "epoch": 4334} {"train_loss": -7.361750602722168, "global_step": 182029, "epoch": 4334} {"train_loss": -7.167015552520752, "global_step": 182030, "epoch": 4334} {"train_loss": -7.255795955657959, "global_step": 182031, "epoch": 4334} {"train_loss": -7.228079319000244, "global_step": 182032, "epoch": 4334} {"train_loss": -7.207653999328613, "global_step": 182033, "epoch": 4334} {"train_loss": -7.241083145141602, "global_step": 182034, "epoch": 4334} {"train_loss": -7.171156406402588, "global_step": 182035, "epoch": 4334} {"train_loss": -7.279915809631348, "global_step": 182036, "epoch": 4334} {"train_loss": -7.306911945343018, "global_step": 182037, "epoch": 4334} {"train_loss": -7.2745771408081055, "global_step": 182038, "epoch": 4334} {"train_loss": -7.24338436126709, "global_step": 182039, "epoch": 4334} {"train_loss": -7.162193775177002, "global_step": 182040, "epoch": 4334} {"train_loss": -7.186092376708984, "global_step": 182041, "epoch": 4334} {"train_loss": -7.2576446533203125, "global_step": 182042, "epoch": 4334} {"train_loss": -7.2332000732421875, "global_step": 182043, "epoch": 4334} {"train_loss": -7.184886932373047, "global_step": 182044, "epoch": 4334} {"train_loss": -7.221435070037842, "global_step": 182045, "epoch": 4334} {"train_loss": -7.180942535400391, "global_step": 182046, "epoch": 4334} {"train_loss": -7.3179473876953125, "global_step": 182047, "epoch": 4334} {"train_loss": -7.2179179191589355, "global_step": 182048, "epoch": 4334} {"train_loss": -7.173643112182617, "global_step": 182049, "epoch": 4334} {"train_loss": -7.316476821899414, "global_step": 182050, "epoch": 4334} {"train_loss": -7.238467216491699, "global_step": 182051, "epoch": 4334} {"train_loss": -7.213287830352783, "global_step": 182052, "epoch": 4334} {"train_loss": -7.294325828552246, "global_step": 182053, "epoch": 4334} {"train_loss": -7.161134719848633, "global_step": 182054, "epoch": 4334} {"train_loss": -7.096491813659668, "global_step": 182055, "epoch": 4334} {"train_loss": -7.185051441192627, "global_step": 182056, "epoch": 4334} {"train_loss": -7.0695390701293945, "global_step": 182057, "epoch": 4334} {"train_loss": -7.0154194831848145, "global_step": 182058, "epoch": 4334} {"train_loss": -7.208682060241699, "global_step": 182059, "epoch": 4334} {"train_loss": -7.1841559410095215, "global_step": 182060, "epoch": 4334} {"train_loss": -7.0136237144470215, "global_step": 182061, "epoch": 4334} {"train_loss": -6.999004364013672, "global_step": 182062, "epoch": 4334} {"train_loss": -7.246403217315674, "global_step": 182063, "epoch": 4334} {"train_loss": -7.144711494445801, "global_step": 182064, "epoch": 4334} {"train_loss": -7.055266857147217, "global_step": 182065, "epoch": 4334} {"train_loss": -7.277451038360596, "global_step": 182066, "epoch": 4334} {"train_loss": -7.083845138549805, "global_step": 182067, "epoch": 4334} {"train_loss": -7.074616432189941, "global_step": 182068, "epoch": 4334} {"train_loss": -7.194246791657948, "global_step": 182069, "epoch": 4334, "val_loss": 80900.6640625} {"train_loss": -7.15880012512207, "global_step": 182070, "epoch": 4335} {"train_loss": -7.1478471755981445, "global_step": 182071, "epoch": 4335} {"train_loss": -7.139225959777832, "global_step": 182072, "epoch": 4335} {"train_loss": -7.155857086181641, "global_step": 182073, "epoch": 4335} {"train_loss": -7.067073822021484, "global_step": 182074, "epoch": 4335} {"train_loss": -7.207520961761475, "global_step": 182075, "epoch": 4335} {"train_loss": -7.1013994216918945, "global_step": 182076, "epoch": 4335} {"train_loss": -7.130865573883057, "global_step": 182077, "epoch": 4335} {"train_loss": -7.1664958000183105, "global_step": 182078, "epoch": 4335} {"train_loss": -7.249390125274658, "global_step": 182079, "epoch": 4335} {"train_loss": -7.176032543182373, "global_step": 182080, "epoch": 4335} {"train_loss": -7.1887102127075195, "global_step": 182081, "epoch": 4335} {"train_loss": -7.215706825256348, "global_step": 182082, "epoch": 4335} {"train_loss": -7.1010966300964355, "global_step": 182083, "epoch": 4335} {"train_loss": -7.169417381286621, "global_step": 182084, "epoch": 4335} {"train_loss": -7.18897008895874, "global_step": 182085, "epoch": 4335} {"train_loss": -7.2265424728393555, "global_step": 182086, "epoch": 4335} {"train_loss": -7.046572685241699, "global_step": 182087, "epoch": 4335} {"train_loss": -7.126609802246094, "global_step": 182088, "epoch": 4335} {"train_loss": -7.160894393920898, "global_step": 182089, "epoch": 4335} {"train_loss": -7.004332065582275, "global_step": 182090, "epoch": 4335} {"train_loss": -7.204676151275635, "global_step": 182091, "epoch": 4335} {"train_loss": -7.042943477630615, "global_step": 182092, "epoch": 4335} {"train_loss": -6.9704742431640625, "global_step": 182093, "epoch": 4335} {"train_loss": -6.987795352935791, "global_step": 182094, "epoch": 4335} {"train_loss": -7.047035217285156, "global_step": 182095, "epoch": 4335} {"train_loss": -7.182244300842285, "global_step": 182096, "epoch": 4335} {"train_loss": -7.013703346252441, "global_step": 182097, "epoch": 4335} {"train_loss": -7.17787504196167, "global_step": 182098, "epoch": 4335} {"train_loss": -6.9524431228637695, "global_step": 182099, "epoch": 4335} {"train_loss": -6.961153030395508, "global_step": 182100, "epoch": 4335} {"train_loss": -7.0670013427734375, "global_step": 182101, "epoch": 4335} {"train_loss": -6.949647426605225, "global_step": 182102, "epoch": 4335} {"train_loss": -7.18828010559082, "global_step": 182103, "epoch": 4335} {"train_loss": -6.853523254394531, "global_step": 182104, "epoch": 4335} {"train_loss": -7.02976131439209, "global_step": 182105, "epoch": 4335} {"train_loss": -6.987421035766602, "global_step": 182106, "epoch": 4335} {"train_loss": -6.930764198303223, "global_step": 182107, "epoch": 4335} {"train_loss": -7.038081645965576, "global_step": 182108, "epoch": 4335} {"train_loss": -6.906021595001221, "global_step": 182109, "epoch": 4335} {"train_loss": -7.11773681640625, "global_step": 182110, "epoch": 4335} {"train_loss": -7.090196405138288, "global_step": 182111, "epoch": 4335, "val_loss": 80737.109375} {"train_loss": -7.086864471435547, "global_step": 182112, "epoch": 4336} {"train_loss": -7.093709945678711, "global_step": 182113, "epoch": 4336} {"train_loss": -7.129535675048828, "global_step": 182114, "epoch": 4336} {"train_loss": -7.070216655731201, "global_step": 182115, "epoch": 4336} {"train_loss": -7.082767486572266, "global_step": 182116, "epoch": 4336} {"train_loss": -7.0926513671875, "global_step": 182117, "epoch": 4336} {"train_loss": -7.044557571411133, "global_step": 182118, "epoch": 4336} {"train_loss": -7.015113830566406, "global_step": 182119, "epoch": 4336} {"train_loss": -7.0799760818481445, "global_step": 182120, "epoch": 4336} {"train_loss": -7.122374057769775, "global_step": 182121, "epoch": 4336} {"train_loss": -6.948134899139404, "global_step": 182122, "epoch": 4336} {"train_loss": -7.0009894371032715, "global_step": 182123, "epoch": 4336} {"train_loss": -7.071771621704102, "global_step": 182124, "epoch": 4336} {"train_loss": -7.114343643188477, "global_step": 182125, "epoch": 4336} {"train_loss": -7.089303016662598, "global_step": 182126, "epoch": 4336} {"train_loss": -7.203817367553711, "global_step": 182127, "epoch": 4336} {"train_loss": -7.138489723205566, "global_step": 182128, "epoch": 4336} {"train_loss": -7.048223495483398, "global_step": 182129, "epoch": 4336} {"train_loss": -7.100407123565674, "global_step": 182130, "epoch": 4336} {"train_loss": -7.11929988861084, "global_step": 182131, "epoch": 4336} {"train_loss": -7.112310409545898, "global_step": 182132, "epoch": 4336} {"train_loss": -7.16077995300293, "global_step": 182133, "epoch": 4336} {"train_loss": -7.231586456298828, "global_step": 182134, "epoch": 4336} {"train_loss": -6.99692440032959, "global_step": 182135, "epoch": 4336} {"train_loss": -7.102730751037598, "global_step": 182136, "epoch": 4336} {"train_loss": -7.050910949707031, "global_step": 182137, "epoch": 4336} {"train_loss": -7.025688648223877, "global_step": 182138, "epoch": 4336} {"train_loss": -7.104444980621338, "global_step": 182139, "epoch": 4336} {"train_loss": -6.947577953338623, "global_step": 182140, "epoch": 4336} {"train_loss": -6.9981369972229, "global_step": 182141, "epoch": 4336} {"train_loss": -7.210779190063477, "global_step": 182142, "epoch": 4336} {"train_loss": -7.0095930099487305, "global_step": 182143, "epoch": 4336} {"train_loss": -7.2031755447387695, "global_step": 182144, "epoch": 4336} {"train_loss": -6.8956298828125, "global_step": 182145, "epoch": 4336} {"train_loss": -7.036494255065918, "global_step": 182146, "epoch": 4336} {"train_loss": -7.115468978881836, "global_step": 182147, "epoch": 4336} {"train_loss": -7.026304721832275, "global_step": 182148, "epoch": 4336} {"train_loss": -7.098782539367676, "global_step": 182149, "epoch": 4336} {"train_loss": -7.1169753074646, "global_step": 182150, "epoch": 4336} {"train_loss": -7.0682244300842285, "global_step": 182151, "epoch": 4336} {"train_loss": -7.170709133148193, "global_step": 182152, "epoch": 4336} {"train_loss": -7.0814009961627775, "global_step": 182153, "epoch": 4336, "val_loss": 80543.625} {"train_loss": -7.087247371673584, "global_step": 182154, "epoch": 4337} {"train_loss": -7.144097805023193, "global_step": 182155, "epoch": 4337} {"train_loss": -7.21013879776001, "global_step": 182156, "epoch": 4337} {"train_loss": -7.162343978881836, "global_step": 182157, "epoch": 4337} {"train_loss": -7.130388259887695, "global_step": 182158, "epoch": 4337} {"train_loss": -7.170459747314453, "global_step": 182159, "epoch": 4337} {"train_loss": -7.099039077758789, "global_step": 182160, "epoch": 4337} {"train_loss": -7.180163383483887, "global_step": 182161, "epoch": 4337} {"train_loss": -7.109524726867676, "global_step": 182162, "epoch": 4337} {"train_loss": -7.209283351898193, "global_step": 182163, "epoch": 4337} {"train_loss": -7.269779205322266, "global_step": 182164, "epoch": 4337} {"train_loss": -7.14356803894043, "global_step": 182165, "epoch": 4337} {"train_loss": -7.151803970336914, "global_step": 182166, "epoch": 4337} {"train_loss": -7.176094055175781, "global_step": 182167, "epoch": 4337} {"train_loss": -7.15962028503418, "global_step": 182168, "epoch": 4337} {"train_loss": -7.164175987243652, "global_step": 182169, "epoch": 4337} {"train_loss": -7.110804557800293, "global_step": 182170, "epoch": 4337} {"train_loss": -7.147515296936035, "global_step": 182171, "epoch": 4337} {"train_loss": -7.130993843078613, "global_step": 182172, "epoch": 4337} {"train_loss": -7.158841609954834, "global_step": 182173, "epoch": 4337} {"train_loss": -7.178884506225586, "global_step": 182174, "epoch": 4337} {"train_loss": -7.118038177490234, "global_step": 182175, "epoch": 4337} {"train_loss": -7.135501861572266, "global_step": 182176, "epoch": 4337} {"train_loss": -7.124744415283203, "global_step": 182177, "epoch": 4337} {"train_loss": -7.164358615875244, "global_step": 182178, "epoch": 4337} {"train_loss": -6.979726791381836, "global_step": 182179, "epoch": 4337} {"train_loss": -7.109827995300293, "global_step": 182180, "epoch": 4337} {"train_loss": -7.274823188781738, "global_step": 182181, "epoch": 4337} {"train_loss": -7.087894439697266, "global_step": 182182, "epoch": 4337} {"train_loss": -7.092442512512207, "global_step": 182183, "epoch": 4337} {"train_loss": -7.202437400817871, "global_step": 182184, "epoch": 4337} {"train_loss": -7.148110389709473, "global_step": 182185, "epoch": 4337} {"train_loss": -7.207599639892578, "global_step": 182186, "epoch": 4337} {"train_loss": -7.041781425476074, "global_step": 182187, "epoch": 4337} {"train_loss": -7.070284843444824, "global_step": 182188, "epoch": 4337} {"train_loss": -6.89564847946167, "global_step": 182189, "epoch": 4337} {"train_loss": -7.204714775085449, "global_step": 182190, "epoch": 4337} {"train_loss": -6.952159404754639, "global_step": 182191, "epoch": 4337} {"train_loss": -7.004650115966797, "global_step": 182192, "epoch": 4337} {"train_loss": -7.167957305908203, "global_step": 182193, "epoch": 4337} {"train_loss": -7.045795440673828, "global_step": 182194, "epoch": 4337} {"train_loss": -7.132159823463077, "global_step": 182195, "epoch": 4337, "val_loss": 80892.0625} {"train_loss": -7.197514533996582, "global_step": 182196, "epoch": 4338} {"train_loss": -7.211240291595459, "global_step": 182197, "epoch": 4338} {"train_loss": -7.06573486328125, "global_step": 182198, "epoch": 4338} {"train_loss": -7.261316299438477, "global_step": 182199, "epoch": 4338} {"train_loss": -7.123480796813965, "global_step": 182200, "epoch": 4338} {"train_loss": -7.065067291259766, "global_step": 182201, "epoch": 4338} {"train_loss": -7.140746116638184, "global_step": 182202, "epoch": 4338} {"train_loss": -7.073673248291016, "global_step": 182203, "epoch": 4338} {"train_loss": -7.232216835021973, "global_step": 182204, "epoch": 4338} {"train_loss": -7.230731964111328, "global_step": 182205, "epoch": 4338} {"train_loss": -7.140813827514648, "global_step": 182206, "epoch": 4338} {"train_loss": -7.292222023010254, "global_step": 182207, "epoch": 4338} {"train_loss": -7.1630539894104, "global_step": 182208, "epoch": 4338} {"train_loss": -7.2140889167785645, "global_step": 182209, "epoch": 4338} {"train_loss": -7.134024620056152, "global_step": 182210, "epoch": 4338} {"train_loss": -7.309324264526367, "global_step": 182211, "epoch": 4338} {"train_loss": -7.222385406494141, "global_step": 182212, "epoch": 4338} {"train_loss": -7.206317901611328, "global_step": 182213, "epoch": 4338} {"train_loss": -7.182229042053223, "global_step": 182214, "epoch": 4338} {"train_loss": -7.143704414367676, "global_step": 182215, "epoch": 4338} {"train_loss": -7.308676719665527, "global_step": 182216, "epoch": 4338} {"train_loss": -7.148375511169434, "global_step": 182217, "epoch": 4338} {"train_loss": -7.300912857055664, "global_step": 182218, "epoch": 4338} {"train_loss": -7.152239799499512, "global_step": 182219, "epoch": 4338} {"train_loss": -7.23320198059082, "global_step": 182220, "epoch": 4338} {"train_loss": -7.166219711303711, "global_step": 182221, "epoch": 4338} {"train_loss": -7.041498184204102, "global_step": 182222, "epoch": 4338} {"train_loss": -7.172788619995117, "global_step": 182223, "epoch": 4338} {"train_loss": -7.066316604614258, "global_step": 182224, "epoch": 4338} {"train_loss": -7.157632827758789, "global_step": 182225, "epoch": 4338} {"train_loss": -6.865436553955078, "global_step": 182226, "epoch": 4338} {"train_loss": -6.959756851196289, "global_step": 182227, "epoch": 4338} {"train_loss": -7.078632831573486, "global_step": 182228, "epoch": 4338} {"train_loss": -7.031426906585693, "global_step": 182229, "epoch": 4338} {"train_loss": -6.976235389709473, "global_step": 182230, "epoch": 4338} {"train_loss": -7.077152252197266, "global_step": 182231, "epoch": 4338} {"train_loss": -7.087955474853516, "global_step": 182232, "epoch": 4338} {"train_loss": -7.020596981048584, "global_step": 182233, "epoch": 4338} {"train_loss": -6.967634201049805, "global_step": 182234, "epoch": 4338} {"train_loss": -6.8960113525390625, "global_step": 182235, "epoch": 4338} {"train_loss": -7.033977031707764, "global_step": 182236, "epoch": 4338} {"train_loss": -7.130880333128429, "global_step": 182237, "epoch": 4338, "val_loss": 80846.1484375} {"train_loss": -6.98884391784668, "global_step": 182238, "epoch": 4339} {"train_loss": -7.220034599304199, "global_step": 182239, "epoch": 4339} {"train_loss": -7.101583957672119, "global_step": 182240, "epoch": 4339} {"train_loss": -7.039440155029297, "global_step": 182241, "epoch": 4339} {"train_loss": -7.062823295593262, "global_step": 182242, "epoch": 4339} {"train_loss": -7.108354091644287, "global_step": 182243, "epoch": 4339} {"train_loss": -7.063168525695801, "global_step": 182244, "epoch": 4339} {"train_loss": -7.00835657119751, "global_step": 182245, "epoch": 4339} {"train_loss": -7.079850196838379, "global_step": 182246, "epoch": 4339} {"train_loss": -7.152617931365967, "global_step": 182247, "epoch": 4339} {"train_loss": -7.11630916595459, "global_step": 182248, "epoch": 4339} {"train_loss": -7.092800140380859, "global_step": 182249, "epoch": 4339} {"train_loss": -7.064070701599121, "global_step": 182250, "epoch": 4339} {"train_loss": -7.112919807434082, "global_step": 182251, "epoch": 4339} {"train_loss": -7.116646766662598, "global_step": 182252, "epoch": 4339} {"train_loss": -7.095309257507324, "global_step": 182253, "epoch": 4339} {"train_loss": -7.151104927062988, "global_step": 182254, "epoch": 4339} {"train_loss": -7.027981758117676, "global_step": 182255, "epoch": 4339} {"train_loss": -7.088497161865234, "global_step": 182256, "epoch": 4339} {"train_loss": -7.141417980194092, "global_step": 182257, "epoch": 4339} {"train_loss": -7.130829811096191, "global_step": 182258, "epoch": 4339} {"train_loss": -7.159826755523682, "global_step": 182259, "epoch": 4339} {"train_loss": -7.258801460266113, "global_step": 182260, "epoch": 4339} {"train_loss": -7.127981185913086, "global_step": 182261, "epoch": 4339} {"train_loss": -7.139043807983398, "global_step": 182262, "epoch": 4339} {"train_loss": -7.143188953399658, "global_step": 182263, "epoch": 4339} {"train_loss": -7.165346622467041, "global_step": 182264, "epoch": 4339} {"train_loss": -7.186493873596191, "global_step": 182265, "epoch": 4339} {"train_loss": -7.163232803344727, "global_step": 182266, "epoch": 4339} {"train_loss": -7.175243377685547, "global_step": 182267, "epoch": 4339} {"train_loss": -7.167342185974121, "global_step": 182268, "epoch": 4339} {"train_loss": -7.180742263793945, "global_step": 182269, "epoch": 4339} {"train_loss": -7.1221537590026855, "global_step": 182270, "epoch": 4339} {"train_loss": -7.064307689666748, "global_step": 182271, "epoch": 4339} {"train_loss": -7.1685791015625, "global_step": 182272, "epoch": 4339} {"train_loss": -7.18464469909668, "global_step": 182273, "epoch": 4339} {"train_loss": -7.110751152038574, "global_step": 182274, "epoch": 4339} {"train_loss": -7.2689056396484375, "global_step": 182275, "epoch": 4339} {"train_loss": -7.048535346984863, "global_step": 182276, "epoch": 4339} {"train_loss": -7.107389450073242, "global_step": 182277, "epoch": 4339} {"train_loss": -7.275391578674316, "global_step": 182278, "epoch": 4339} {"train_loss": -7.1281028020949595, "global_step": 182279, "epoch": 4339, "val_loss": 80628.09375} {"train_loss": -7.239045143127441, "global_step": 182280, "epoch": 4340} {"train_loss": -7.167934417724609, "global_step": 182281, "epoch": 4340} {"train_loss": -7.204185485839844, "global_step": 182282, "epoch": 4340} {"train_loss": -7.16045618057251, "global_step": 182283, "epoch": 4340} {"train_loss": -7.226498603820801, "global_step": 182284, "epoch": 4340} {"train_loss": -7.16213321685791, "global_step": 182285, "epoch": 4340} {"train_loss": -7.151960372924805, "global_step": 182286, "epoch": 4340} {"train_loss": -7.163928985595703, "global_step": 182287, "epoch": 4340} {"train_loss": -7.177310943603516, "global_step": 182288, "epoch": 4340} {"train_loss": -7.182551383972168, "global_step": 182289, "epoch": 4340} {"train_loss": -7.244359970092773, "global_step": 182290, "epoch": 4340} {"train_loss": -7.180215835571289, "global_step": 182291, "epoch": 4340} {"train_loss": -7.172853469848633, "global_step": 182292, "epoch": 4340} {"train_loss": -7.21567440032959, "global_step": 182293, "epoch": 4340} {"train_loss": -7.253114700317383, "global_step": 182294, "epoch": 4340} {"train_loss": -7.086782932281494, "global_step": 182295, "epoch": 4340} {"train_loss": -7.13060188293457, "global_step": 182296, "epoch": 4340} {"train_loss": -7.1081156730651855, "global_step": 182297, "epoch": 4340} {"train_loss": -7.049749851226807, "global_step": 182298, "epoch": 4340} {"train_loss": -7.053662300109863, "global_step": 182299, "epoch": 4340} {"train_loss": -7.098169326782227, "global_step": 182300, "epoch": 4340} {"train_loss": -6.98190975189209, "global_step": 182301, "epoch": 4340} {"train_loss": -7.106231689453125, "global_step": 182302, "epoch": 4340} {"train_loss": -7.1359639167785645, "global_step": 182303, "epoch": 4340} {"train_loss": -7.070666790008545, "global_step": 182304, "epoch": 4340} {"train_loss": -7.114995956420898, "global_step": 182305, "epoch": 4340} {"train_loss": -6.988125801086426, "global_step": 182306, "epoch": 4340} {"train_loss": -7.14970064163208, "global_step": 182307, "epoch": 4340} {"train_loss": -7.1762375831604, "global_step": 182308, "epoch": 4340} {"train_loss": -7.012509822845459, "global_step": 182309, "epoch": 4340} {"train_loss": -7.088099002838135, "global_step": 182310, "epoch": 4340} {"train_loss": -7.042484283447266, "global_step": 182311, "epoch": 4340} {"train_loss": -6.935967922210693, "global_step": 182312, "epoch": 4340} {"train_loss": -7.163645267486572, "global_step": 182313, "epoch": 4340} {"train_loss": -7.045205593109131, "global_step": 182314, "epoch": 4340} {"train_loss": -7.045154571533203, "global_step": 182315, "epoch": 4340} {"train_loss": -7.008699893951416, "global_step": 182316, "epoch": 4340} {"train_loss": -7.080160140991211, "global_step": 182317, "epoch": 4340} {"train_loss": -7.032759666442871, "global_step": 182318, "epoch": 4340} {"train_loss": -7.110472679138184, "global_step": 182319, "epoch": 4340} {"train_loss": -7.143198013305664, "global_step": 182320, "epoch": 4340} {"train_loss": -7.119497912270682, "global_step": 182321, "epoch": 4340, "val_loss": 80706.2734375} {"train_loss": -7.160864353179932, "global_step": 182322, "epoch": 4341} {"train_loss": -7.0885210037231445, "global_step": 182323, "epoch": 4341} {"train_loss": -7.103219509124756, "global_step": 182324, "epoch": 4341} {"train_loss": -7.027336120605469, "global_step": 182325, "epoch": 4341} {"train_loss": -7.120977401733398, "global_step": 182326, "epoch": 4341} {"train_loss": -7.034121513366699, "global_step": 182327, "epoch": 4341} {"train_loss": -7.175725936889648, "global_step": 182328, "epoch": 4341} {"train_loss": -7.156551361083984, "global_step": 182329, "epoch": 4341} {"train_loss": -7.138113975524902, "global_step": 182330, "epoch": 4341} {"train_loss": -7.074957847595215, "global_step": 182331, "epoch": 4341} {"train_loss": -7.106756210327148, "global_step": 182332, "epoch": 4341} {"train_loss": -7.101983070373535, "global_step": 182333, "epoch": 4341} {"train_loss": -7.173859596252441, "global_step": 182334, "epoch": 4341} {"train_loss": -7.100996494293213, "global_step": 182335, "epoch": 4341} {"train_loss": -7.110476970672607, "global_step": 182336, "epoch": 4341} {"train_loss": -7.026856422424316, "global_step": 182337, "epoch": 4341} {"train_loss": -7.245084762573242, "global_step": 182338, "epoch": 4341} {"train_loss": -7.040422439575195, "global_step": 182339, "epoch": 4341} {"train_loss": -7.082182884216309, "global_step": 182340, "epoch": 4341} {"train_loss": -7.150841236114502, "global_step": 182341, "epoch": 4341} {"train_loss": -7.168621063232422, "global_step": 182342, "epoch": 4341} {"train_loss": -7.14387321472168, "global_step": 182343, "epoch": 4341} {"train_loss": -6.983041286468506, "global_step": 182344, "epoch": 4341} {"train_loss": -7.083345413208008, "global_step": 182345, "epoch": 4341} {"train_loss": -7.093988418579102, "global_step": 182346, "epoch": 4341} {"train_loss": -7.186429977416992, "global_step": 182347, "epoch": 4341} {"train_loss": -7.209049224853516, "global_step": 182348, "epoch": 4341} {"train_loss": -7.100160598754883, "global_step": 182349, "epoch": 4341} {"train_loss": -7.095752716064453, "global_step": 182350, "epoch": 4341} {"train_loss": -7.126189231872559, "global_step": 182351, "epoch": 4341} {"train_loss": -7.20692253112793, "global_step": 182352, "epoch": 4341} {"train_loss": -7.2416300773620605, "global_step": 182353, "epoch": 4341} {"train_loss": -7.214072227478027, "global_step": 182354, "epoch": 4341} {"train_loss": -7.10386848449707, "global_step": 182355, "epoch": 4341} {"train_loss": -7.157369613647461, "global_step": 182356, "epoch": 4341} {"train_loss": -7.114616394042969, "global_step": 182357, "epoch": 4341} {"train_loss": -7.228207588195801, "global_step": 182358, "epoch": 4341} {"train_loss": -7.140456199645996, "global_step": 182359, "epoch": 4341} {"train_loss": -7.148370265960693, "global_step": 182360, "epoch": 4341} {"train_loss": -7.1620588302612305, "global_step": 182361, "epoch": 4341} {"train_loss": -6.914134979248047, "global_step": 182362, "epoch": 4341} {"train_loss": -7.121720938455491, "global_step": 182363, "epoch": 4341, "val_loss": 80483.3515625} {"train_loss": -7.137723445892334, "global_step": 182364, "epoch": 4342} {"train_loss": -7.221804141998291, "global_step": 182365, "epoch": 4342} {"train_loss": -7.160710334777832, "global_step": 182366, "epoch": 4342} {"train_loss": -7.132722854614258, "global_step": 182367, "epoch": 4342} {"train_loss": -7.05174446105957, "global_step": 182368, "epoch": 4342} {"train_loss": -7.080968856811523, "global_step": 182369, "epoch": 4342} {"train_loss": -6.9770002365112305, "global_step": 182370, "epoch": 4342} {"train_loss": -7.12374210357666, "global_step": 182371, "epoch": 4342} {"train_loss": -7.080187797546387, "global_step": 182372, "epoch": 4342} {"train_loss": -7.162938594818115, "global_step": 182373, "epoch": 4342} {"train_loss": -7.0247802734375, "global_step": 182374, "epoch": 4342} {"train_loss": -7.13250732421875, "global_step": 182375, "epoch": 4342} {"train_loss": -7.038841724395752, "global_step": 182376, "epoch": 4342} {"train_loss": -7.112689971923828, "global_step": 182377, "epoch": 4342} {"train_loss": -7.068745136260986, "global_step": 182378, "epoch": 4342} {"train_loss": -7.08271598815918, "global_step": 182379, "epoch": 4342} {"train_loss": -7.136504173278809, "global_step": 182380, "epoch": 4342} {"train_loss": -6.97399377822876, "global_step": 182381, "epoch": 4342} {"train_loss": -7.025835037231445, "global_step": 182382, "epoch": 4342} {"train_loss": -7.203200340270996, "global_step": 182383, "epoch": 4342} {"train_loss": -7.059680938720703, "global_step": 182384, "epoch": 4342} {"train_loss": -7.192765235900879, "global_step": 182385, "epoch": 4342} {"train_loss": -7.11700439453125, "global_step": 182386, "epoch": 4342} {"train_loss": -7.124183654785156, "global_step": 182387, "epoch": 4342} {"train_loss": -7.22585391998291, "global_step": 182388, "epoch": 4342} {"train_loss": -7.117054462432861, "global_step": 182389, "epoch": 4342} {"train_loss": -7.150305271148682, "global_step": 182390, "epoch": 4342} {"train_loss": -7.152037143707275, "global_step": 182391, "epoch": 4342} {"train_loss": -7.1353325843811035, "global_step": 182392, "epoch": 4342} {"train_loss": -7.198759078979492, "global_step": 182393, "epoch": 4342} {"train_loss": -7.351742744445801, "global_step": 182394, "epoch": 4342} {"train_loss": -7.231796741485596, "global_step": 182395, "epoch": 4342} {"train_loss": -7.201162338256836, "global_step": 182396, "epoch": 4342} {"train_loss": -7.114006042480469, "global_step": 182397, "epoch": 4342} {"train_loss": -7.168984889984131, "global_step": 182398, "epoch": 4342} {"train_loss": -7.20925760269165, "global_step": 182399, "epoch": 4342} {"train_loss": -7.140754699707031, "global_step": 182400, "epoch": 4342} {"train_loss": -7.284566879272461, "global_step": 182401, "epoch": 4342} {"train_loss": -7.256831169128418, "global_step": 182402, "epoch": 4342} {"train_loss": -7.207309722900391, "global_step": 182403, "epoch": 4342} {"train_loss": -7.29680061340332, "global_step": 182404, "epoch": 4342} {"train_loss": -7.14400205158052, "global_step": 182405, "epoch": 4342, "val_loss": 80711.0390625} {"train_loss": -7.297954082489014, "global_step": 182406, "epoch": 4343} {"train_loss": -7.168471336364746, "global_step": 182407, "epoch": 4343} {"train_loss": -7.207799911499023, "global_step": 182408, "epoch": 4343} {"train_loss": -7.202278137207031, "global_step": 182409, "epoch": 4343} {"train_loss": -7.1861653327941895, "global_step": 182410, "epoch": 4343} {"train_loss": -7.229896545410156, "global_step": 182411, "epoch": 4343} {"train_loss": -7.229031562805176, "global_step": 182412, "epoch": 4343} {"train_loss": -7.2177886962890625, "global_step": 182413, "epoch": 4343} {"train_loss": -7.211652755737305, "global_step": 182414, "epoch": 4343} {"train_loss": -7.140264511108398, "global_step": 182415, "epoch": 4343} {"train_loss": -7.327178955078125, "global_step": 182416, "epoch": 4343} {"train_loss": -7.217857837677002, "global_step": 182417, "epoch": 4343} {"train_loss": -7.34160041809082, "global_step": 182418, "epoch": 4343} {"train_loss": -7.230523109436035, "global_step": 182419, "epoch": 4343} {"train_loss": -7.260195255279541, "global_step": 182420, "epoch": 4343} {"train_loss": -7.275419235229492, "global_step": 182421, "epoch": 4343} {"train_loss": -7.3226399421691895, "global_step": 182422, "epoch": 4343} {"train_loss": -7.253814697265625, "global_step": 182423, "epoch": 4343} {"train_loss": -7.188094139099121, "global_step": 182424, "epoch": 4343} {"train_loss": -7.15028190612793, "global_step": 182425, "epoch": 4343} {"train_loss": -7.275969505310059, "global_step": 182426, "epoch": 4343} {"train_loss": -7.270755290985107, "global_step": 182427, "epoch": 4343} {"train_loss": -7.06132698059082, "global_step": 182428, "epoch": 4343} {"train_loss": -7.233329772949219, "global_step": 182429, "epoch": 4343} {"train_loss": -7.15619421005249, "global_step": 182430, "epoch": 4343} {"train_loss": -7.166065216064453, "global_step": 182431, "epoch": 4343} {"train_loss": -7.209003448486328, "global_step": 182432, "epoch": 4343} {"train_loss": -7.091621398925781, "global_step": 182433, "epoch": 4343} {"train_loss": -7.099917411804199, "global_step": 182434, "epoch": 4343} {"train_loss": -7.121390342712402, "global_step": 182435, "epoch": 4343} {"train_loss": -7.138803482055664, "global_step": 182436, "epoch": 4343} {"train_loss": -7.093559741973877, "global_step": 182437, "epoch": 4343} {"train_loss": -7.08748722076416, "global_step": 182438, "epoch": 4343} {"train_loss": -7.092296123504639, "global_step": 182439, "epoch": 4343} {"train_loss": -7.171582221984863, "global_step": 182440, "epoch": 4343} {"train_loss": -7.138631820678711, "global_step": 182441, "epoch": 4343} {"train_loss": -7.061764717102051, "global_step": 182442, "epoch": 4343} {"train_loss": -7.06299352645874, "global_step": 182443, "epoch": 4343} {"train_loss": -7.203670501708984, "global_step": 182444, "epoch": 4343} {"train_loss": -7.131866455078125, "global_step": 182445, "epoch": 4343} {"train_loss": -7.106805801391602, "global_step": 182446, "epoch": 4343} {"train_loss": -7.188127778825306, "global_step": 182447, "epoch": 4343, "val_loss": 80663.421875} {"train_loss": -7.077567100524902, "global_step": 182448, "epoch": 4344} {"train_loss": -6.969740867614746, "global_step": 182449, "epoch": 4344} {"train_loss": -7.187430381774902, "global_step": 182450, "epoch": 4344} {"train_loss": -7.219515800476074, "global_step": 182451, "epoch": 4344} {"train_loss": -7.0524797439575195, "global_step": 182452, "epoch": 4344} {"train_loss": -7.2028656005859375, "global_step": 182453, "epoch": 4344} {"train_loss": -7.103569030761719, "global_step": 182454, "epoch": 4344} {"train_loss": -7.177526473999023, "global_step": 182455, "epoch": 4344} {"train_loss": -7.122756004333496, "global_step": 182456, "epoch": 4344} {"train_loss": -7.069127082824707, "global_step": 182457, "epoch": 4344} {"train_loss": -7.069577217102051, "global_step": 182458, "epoch": 4344} {"train_loss": -7.038940906524658, "global_step": 182459, "epoch": 4344} {"train_loss": -7.060498237609863, "global_step": 182460, "epoch": 4344} {"train_loss": -7.178532123565674, "global_step": 182461, "epoch": 4344} {"train_loss": -7.089353561401367, "global_step": 182462, "epoch": 4344} {"train_loss": -7.155973434448242, "global_step": 182463, "epoch": 4344} {"train_loss": -7.1129679679870605, "global_step": 182464, "epoch": 4344} {"train_loss": -7.164885520935059, "global_step": 182465, "epoch": 4344} {"train_loss": -7.06661319732666, "global_step": 182466, "epoch": 4344} {"train_loss": -7.116763591766357, "global_step": 182467, "epoch": 4344} {"train_loss": -6.992207050323486, "global_step": 182468, "epoch": 4344} {"train_loss": -7.018237113952637, "global_step": 182469, "epoch": 4344} {"train_loss": -7.11517333984375, "global_step": 182470, "epoch": 4344} {"train_loss": -6.985278606414795, "global_step": 182471, "epoch": 4344} {"train_loss": -6.983427047729492, "global_step": 182472, "epoch": 4344} {"train_loss": -7.05086612701416, "global_step": 182473, "epoch": 4344} {"train_loss": -7.025324821472168, "global_step": 182474, "epoch": 4344} {"train_loss": -7.17078161239624, "global_step": 182475, "epoch": 4344} {"train_loss": -6.997402191162109, "global_step": 182476, "epoch": 4344} {"train_loss": -7.013877868652344, "global_step": 182477, "epoch": 4344} {"train_loss": -7.059123992919922, "global_step": 182478, "epoch": 4344} {"train_loss": -6.97891902923584, "global_step": 182479, "epoch": 4344} {"train_loss": -7.064518928527832, "global_step": 182480, "epoch": 4344} {"train_loss": -7.038971424102783, "global_step": 182481, "epoch": 4344} {"train_loss": -7.0198469161987305, "global_step": 182482, "epoch": 4344} {"train_loss": -7.058436870574951, "global_step": 182483, "epoch": 4344} {"train_loss": -7.112135887145996, "global_step": 182484, "epoch": 4344} {"train_loss": -6.903304100036621, "global_step": 182485, "epoch": 4344} {"train_loss": -7.175272464752197, "global_step": 182486, "epoch": 4344} {"train_loss": -6.98842716217041, "global_step": 182487, "epoch": 4344} {"train_loss": -7.053471565246582, "global_step": 182488, "epoch": 4344} {"train_loss": -7.0750816095443, "global_step": 182489, "epoch": 4344, "val_loss": 80576.28125} {"train_loss": -6.981704235076904, "global_step": 182490, "epoch": 4345} {"train_loss": -7.085848808288574, "global_step": 182491, "epoch": 4345} {"train_loss": -6.931079387664795, "global_step": 182492, "epoch": 4345} {"train_loss": -7.289853096008301, "global_step": 182493, "epoch": 4345} {"train_loss": -7.026780128479004, "global_step": 182494, "epoch": 4345} {"train_loss": -7.121584415435791, "global_step": 182495, "epoch": 4345} {"train_loss": -7.125434875488281, "global_step": 182496, "epoch": 4345} {"train_loss": -7.126276969909668, "global_step": 182497, "epoch": 4345} {"train_loss": -7.099002838134766, "global_step": 182498, "epoch": 4345} {"train_loss": -7.117864608764648, "global_step": 182499, "epoch": 4345} {"train_loss": -7.106834411621094, "global_step": 182500, "epoch": 4345} {"train_loss": -7.172550201416016, "global_step": 182501, "epoch": 4345} {"train_loss": -7.143481731414795, "global_step": 182502, "epoch": 4345} {"train_loss": -7.139009475708008, "global_step": 182503, "epoch": 4345} {"train_loss": -7.159210205078125, "global_step": 182504, "epoch": 4345} {"train_loss": -7.187962532043457, "global_step": 182505, "epoch": 4345} {"train_loss": -7.221122741699219, "global_step": 182506, "epoch": 4345} {"train_loss": -7.215516090393066, "global_step": 182507, "epoch": 4345} {"train_loss": -7.2206621170043945, "global_step": 182508, "epoch": 4345} {"train_loss": -7.081960678100586, "global_step": 182509, "epoch": 4345} {"train_loss": -7.023818016052246, "global_step": 182510, "epoch": 4345} {"train_loss": -7.216879844665527, "global_step": 182511, "epoch": 4345} {"train_loss": -7.132416248321533, "global_step": 182512, "epoch": 4345} {"train_loss": -7.1758270263671875, "global_step": 182513, "epoch": 4345} {"train_loss": -7.210024833679199, "global_step": 182514, "epoch": 4345} {"train_loss": -7.121211051940918, "global_step": 182515, "epoch": 4345} {"train_loss": -7.180054664611816, "global_step": 182516, "epoch": 4345} {"train_loss": -7.150749683380127, "global_step": 182517, "epoch": 4345} {"train_loss": -7.146605014801025, "global_step": 182518, "epoch": 4345} {"train_loss": -7.245811939239502, "global_step": 182519, "epoch": 4345} {"train_loss": -7.255925178527832, "global_step": 182520, "epoch": 4345} {"train_loss": -7.231466293334961, "global_step": 182521, "epoch": 4345} {"train_loss": -7.247445106506348, "global_step": 182522, "epoch": 4345} {"train_loss": -7.20579719543457, "global_step": 182523, "epoch": 4345} {"train_loss": -7.267818450927734, "global_step": 182524, "epoch": 4345} {"train_loss": -7.147335052490234, "global_step": 182525, "epoch": 4345} {"train_loss": -7.165862083435059, "global_step": 182526, "epoch": 4345} {"train_loss": -7.25937032699585, "global_step": 182527, "epoch": 4345} {"train_loss": -7.123291969299316, "global_step": 182528, "epoch": 4345} {"train_loss": -7.103816986083984, "global_step": 182529, "epoch": 4345} {"train_loss": -7.254692554473877, "global_step": 182530, "epoch": 4345} {"train_loss": -7.156220958346412, "global_step": 182531, "epoch": 4345, "val_loss": 80475.5078125} {"train_loss": -7.187068462371826, "global_step": 182532, "epoch": 4346} {"train_loss": -7.089598655700684, "global_step": 182533, "epoch": 4346} {"train_loss": -7.1894073486328125, "global_step": 182534, "epoch": 4346} {"train_loss": -7.241525650024414, "global_step": 182535, "epoch": 4346} {"train_loss": -7.227704048156738, "global_step": 182536, "epoch": 4346} {"train_loss": -7.136104583740234, "global_step": 182537, "epoch": 4346} {"train_loss": -7.1971282958984375, "global_step": 182538, "epoch": 4346} {"train_loss": -7.218560218811035, "global_step": 182539, "epoch": 4346} {"train_loss": -7.2579851150512695, "global_step": 182540, "epoch": 4346} {"train_loss": -7.286772727966309, "global_step": 182541, "epoch": 4346} {"train_loss": -7.256916046142578, "global_step": 182542, "epoch": 4346} {"train_loss": -7.115073204040527, "global_step": 182543, "epoch": 4346} {"train_loss": -7.244470119476318, "global_step": 182544, "epoch": 4346} {"train_loss": -7.138522148132324, "global_step": 182545, "epoch": 4346} {"train_loss": -7.042036533355713, "global_step": 182546, "epoch": 4346} {"train_loss": -7.126518249511719, "global_step": 182547, "epoch": 4346} {"train_loss": -7.201496601104736, "global_step": 182548, "epoch": 4346} {"train_loss": -7.234642028808594, "global_step": 182549, "epoch": 4346} {"train_loss": -7.148254871368408, "global_step": 182550, "epoch": 4346} {"train_loss": -7.191842079162598, "global_step": 182551, "epoch": 4346} {"train_loss": -7.1338887214660645, "global_step": 182552, "epoch": 4346} {"train_loss": -7.105481147766113, "global_step": 182553, "epoch": 4346} {"train_loss": -7.166778087615967, "global_step": 182554, "epoch": 4346} {"train_loss": -7.2110772132873535, "global_step": 182555, "epoch": 4346} {"train_loss": -7.143589019775391, "global_step": 182556, "epoch": 4346} {"train_loss": -7.066989898681641, "global_step": 182557, "epoch": 4346} {"train_loss": -7.23956823348999, "global_step": 182558, "epoch": 4346} {"train_loss": -7.120088577270508, "global_step": 182559, "epoch": 4346} {"train_loss": -7.218838691711426, "global_step": 182560, "epoch": 4346} {"train_loss": -7.193301200866699, "global_step": 182561, "epoch": 4346} {"train_loss": -7.2644734382629395, "global_step": 182562, "epoch": 4346} {"train_loss": -7.203923225402832, "global_step": 182563, "epoch": 4346} {"train_loss": -7.176529407501221, "global_step": 182564, "epoch": 4346} {"train_loss": -7.166184425354004, "global_step": 182565, "epoch": 4346} {"train_loss": -7.279213905334473, "global_step": 182566, "epoch": 4346} {"train_loss": -7.176961421966553, "global_step": 182567, "epoch": 4346} {"train_loss": -7.086928844451904, "global_step": 182568, "epoch": 4346} {"train_loss": -7.255252838134766, "global_step": 182569, "epoch": 4346} {"train_loss": -7.157249450683594, "global_step": 182570, "epoch": 4346} {"train_loss": -7.019972324371338, "global_step": 182571, "epoch": 4346} {"train_loss": -7.0743865966796875, "global_step": 182572, "epoch": 4346} {"train_loss": -7.172835440862746, "global_step": 182573, "epoch": 4346, "val_loss": 80685.359375} {"train_loss": -7.058013916015625, "global_step": 182574, "epoch": 4347} {"train_loss": -7.231254577636719, "global_step": 182575, "epoch": 4347} {"train_loss": -6.930975914001465, "global_step": 182576, "epoch": 4347} {"train_loss": -7.089847564697266, "global_step": 182577, "epoch": 4347} {"train_loss": -7.191374778747559, "global_step": 182578, "epoch": 4347} {"train_loss": -6.993897438049316, "global_step": 182579, "epoch": 4347} {"train_loss": -6.953476905822754, "global_step": 182580, "epoch": 4347} {"train_loss": -7.129649639129639, "global_step": 182581, "epoch": 4347} {"train_loss": -7.011275291442871, "global_step": 182582, "epoch": 4347} {"train_loss": -7.110592842102051, "global_step": 182583, "epoch": 4347} {"train_loss": -7.025589942932129, "global_step": 182584, "epoch": 4347} {"train_loss": -6.87905216217041, "global_step": 182585, "epoch": 4347} {"train_loss": -7.028217792510986, "global_step": 182586, "epoch": 4347} {"train_loss": -7.009951591491699, "global_step": 182587, "epoch": 4347} {"train_loss": -6.952237129211426, "global_step": 182588, "epoch": 4347} {"train_loss": -7.203754901885986, "global_step": 182589, "epoch": 4347} {"train_loss": -6.881335258483887, "global_step": 182590, "epoch": 4347} {"train_loss": -7.067364692687988, "global_step": 182591, "epoch": 4347} {"train_loss": -7.050561904907227, "global_step": 182592, "epoch": 4347} {"train_loss": -6.906750202178955, "global_step": 182593, "epoch": 4347} {"train_loss": -7.103869438171387, "global_step": 182594, "epoch": 4347} {"train_loss": -6.994036674499512, "global_step": 182595, "epoch": 4347} {"train_loss": -7.159917831420898, "global_step": 182596, "epoch": 4347} {"train_loss": -7.068206310272217, "global_step": 182597, "epoch": 4347} {"train_loss": -7.161078453063965, "global_step": 182598, "epoch": 4347} {"train_loss": -6.868973731994629, "global_step": 182599, "epoch": 4347} {"train_loss": -7.085793972015381, "global_step": 182600, "epoch": 4347} {"train_loss": -6.9846391677856445, "global_step": 182601, "epoch": 4347} {"train_loss": -7.189365386962891, "global_step": 182602, "epoch": 4347} {"train_loss": -7.095920085906982, "global_step": 182603, "epoch": 4347} {"train_loss": -7.107844352722168, "global_step": 182604, "epoch": 4347} {"train_loss": -6.977212905883789, "global_step": 182605, "epoch": 4347} {"train_loss": -7.138453006744385, "global_step": 182606, "epoch": 4347} {"train_loss": -7.031411170959473, "global_step": 182607, "epoch": 4347} {"train_loss": -7.142797470092773, "global_step": 182608, "epoch": 4347} {"train_loss": -7.15324592590332, "global_step": 182609, "epoch": 4347} {"train_loss": -7.1237335205078125, "global_step": 182610, "epoch": 4347} {"train_loss": -7.146834373474121, "global_step": 182611, "epoch": 4347} {"train_loss": -7.223628997802734, "global_step": 182612, "epoch": 4347} {"train_loss": -7.098151683807373, "global_step": 182613, "epoch": 4347} {"train_loss": -7.037710189819336, "global_step": 182614, "epoch": 4347} {"train_loss": -7.061377661568778, "global_step": 182615, "epoch": 4347, "val_loss": 80838.015625} {"train_loss": -7.1069793701171875, "global_step": 182616, "epoch": 4348} {"train_loss": -7.03731107711792, "global_step": 182617, "epoch": 4348} {"train_loss": -7.102834224700928, "global_step": 182618, "epoch": 4348} {"train_loss": -7.183095932006836, "global_step": 182619, "epoch": 4348} {"train_loss": -6.99533748626709, "global_step": 182620, "epoch": 4348} {"train_loss": -7.095755577087402, "global_step": 182621, "epoch": 4348} {"train_loss": -6.983710765838623, "global_step": 182622, "epoch": 4348} {"train_loss": -7.288021564483643, "global_step": 182623, "epoch": 4348} {"train_loss": -7.151397705078125, "global_step": 182624, "epoch": 4348} {"train_loss": -7.297667503356934, "global_step": 182625, "epoch": 4348} {"train_loss": -7.221272945404053, "global_step": 182626, "epoch": 4348} {"train_loss": -7.209883689880371, "global_step": 182627, "epoch": 4348} {"train_loss": -7.219202995300293, "global_step": 182628, "epoch": 4348} {"train_loss": -7.188907623291016, "global_step": 182629, "epoch": 4348} {"train_loss": -7.23444938659668, "global_step": 182630, "epoch": 4348} {"train_loss": -7.111443042755127, "global_step": 182631, "epoch": 4348} {"train_loss": -7.127778053283691, "global_step": 182632, "epoch": 4348} {"train_loss": -7.26110315322876, "global_step": 182633, "epoch": 4348} {"train_loss": -7.241236686706543, "global_step": 182634, "epoch": 4348} {"train_loss": -7.127719879150391, "global_step": 182635, "epoch": 4348} {"train_loss": -7.123668670654297, "global_step": 182636, "epoch": 4348} {"train_loss": -7.193835258483887, "global_step": 182637, "epoch": 4348} {"train_loss": -7.269972801208496, "global_step": 182638, "epoch": 4348} {"train_loss": -7.131308555603027, "global_step": 182639, "epoch": 4348} {"train_loss": -7.166909694671631, "global_step": 182640, "epoch": 4348} {"train_loss": -7.186408042907715, "global_step": 182641, "epoch": 4348} {"train_loss": -7.11761474609375, "global_step": 182642, "epoch": 4348} {"train_loss": -7.1559953689575195, "global_step": 182643, "epoch": 4348} {"train_loss": -7.246463775634766, "global_step": 182644, "epoch": 4348} {"train_loss": -7.171694755554199, "global_step": 182645, "epoch": 4348} {"train_loss": -7.118165493011475, "global_step": 182646, "epoch": 4348} {"train_loss": -7.31611442565918, "global_step": 182647, "epoch": 4348} {"train_loss": -7.1810503005981445, "global_step": 182648, "epoch": 4348} {"train_loss": -7.182173252105713, "global_step": 182649, "epoch": 4348} {"train_loss": -7.192323684692383, "global_step": 182650, "epoch": 4348} {"train_loss": -7.156912803649902, "global_step": 182651, "epoch": 4348} {"train_loss": -7.073183059692383, "global_step": 182652, "epoch": 4348} {"train_loss": -7.149718761444092, "global_step": 182653, "epoch": 4348} {"train_loss": -7.125974655151367, "global_step": 182654, "epoch": 4348} {"train_loss": -7.151833534240723, "global_step": 182655, "epoch": 4348} {"train_loss": -7.208273887634277, "global_step": 182656, "epoch": 4348} {"train_loss": -7.1648312750316805, "global_step": 182657, "epoch": 4348, "val_loss": 80596.53125} {"train_loss": -7.1484880447387695, "global_step": 182658, "epoch": 4349} {"train_loss": -7.178206443786621, "global_step": 182659, "epoch": 4349} {"train_loss": -7.114448547363281, "global_step": 182660, "epoch": 4349} {"train_loss": -7.116687774658203, "global_step": 182661, "epoch": 4349} {"train_loss": -7.22834587097168, "global_step": 182662, "epoch": 4349} {"train_loss": -7.261533737182617, "global_step": 182663, "epoch": 4349} {"train_loss": -7.228515625, "global_step": 182664, "epoch": 4349} {"train_loss": -7.11944580078125, "global_step": 182665, "epoch": 4349} {"train_loss": -7.158467769622803, "global_step": 182666, "epoch": 4349} {"train_loss": -7.21710729598999, "global_step": 182667, "epoch": 4349} {"train_loss": -7.155645370483398, "global_step": 182668, "epoch": 4349} {"train_loss": -7.179175853729248, "global_step": 182669, "epoch": 4349} {"train_loss": -7.190363883972168, "global_step": 182670, "epoch": 4349} {"train_loss": -7.183902740478516, "global_step": 182671, "epoch": 4349} {"train_loss": -7.221841335296631, "global_step": 182672, "epoch": 4349} {"train_loss": -7.026431083679199, "global_step": 182673, "epoch": 4349} {"train_loss": -7.229887008666992, "global_step": 182674, "epoch": 4349} {"train_loss": -7.1867876052856445, "global_step": 182675, "epoch": 4349} {"train_loss": -7.0692853927612305, "global_step": 182676, "epoch": 4349} {"train_loss": -7.20588493347168, "global_step": 182677, "epoch": 4349} {"train_loss": -7.183903694152832, "global_step": 182678, "epoch": 4349} {"train_loss": -7.173593521118164, "global_step": 182679, "epoch": 4349} {"train_loss": -7.1222686767578125, "global_step": 182680, "epoch": 4349} {"train_loss": -7.164671897888184, "global_step": 182681, "epoch": 4349} {"train_loss": -7.098219871520996, "global_step": 182682, "epoch": 4349} {"train_loss": -7.203057289123535, "global_step": 182683, "epoch": 4349} {"train_loss": -7.068417549133301, "global_step": 182684, "epoch": 4349} {"train_loss": -7.131860733032227, "global_step": 182685, "epoch": 4349} {"train_loss": -7.103632926940918, "global_step": 182686, "epoch": 4349} {"train_loss": -7.129084587097168, "global_step": 182687, "epoch": 4349} {"train_loss": -7.148797035217285, "global_step": 182688, "epoch": 4349} {"train_loss": -7.17950439453125, "global_step": 182689, "epoch": 4349} {"train_loss": -7.17832088470459, "global_step": 182690, "epoch": 4349} {"train_loss": -7.064567565917969, "global_step": 182691, "epoch": 4349} {"train_loss": -7.118021011352539, "global_step": 182692, "epoch": 4349} {"train_loss": -7.234948635101318, "global_step": 182693, "epoch": 4349} {"train_loss": -7.190488815307617, "global_step": 182694, "epoch": 4349} {"train_loss": -7.123715400695801, "global_step": 182695, "epoch": 4349} {"train_loss": -7.111895561218262, "global_step": 182696, "epoch": 4349} {"train_loss": -7.052637100219727, "global_step": 182697, "epoch": 4349} {"train_loss": -7.1190056800842285, "global_step": 182698, "epoch": 4349} {"train_loss": -7.153841995057606, "global_step": 182699, "epoch": 4349, "val_loss": 80674.71875} {"train_loss": -7.166651725769043, "global_step": 182700, "epoch": 4350} {"train_loss": -7.102664470672607, "global_step": 182701, "epoch": 4350} {"train_loss": -7.0641279220581055, "global_step": 182702, "epoch": 4350} {"train_loss": -7.310401916503906, "global_step": 182703, "epoch": 4350} {"train_loss": -7.1399688720703125, "global_step": 182704, "epoch": 4350} {"train_loss": -7.215478897094727, "global_step": 182705, "epoch": 4350} {"train_loss": -7.096879482269287, "global_step": 182706, "epoch": 4350} {"train_loss": -7.102045059204102, "global_step": 182707, "epoch": 4350} {"train_loss": -7.2186408042907715, "global_step": 182708, "epoch": 4350} {"train_loss": -7.1790056228637695, "global_step": 182709, "epoch": 4350} {"train_loss": -7.1241865158081055, "global_step": 182710, "epoch": 4350} {"train_loss": -7.0972418785095215, "global_step": 182711, "epoch": 4350} {"train_loss": -7.088074684143066, "global_step": 182712, "epoch": 4350} {"train_loss": -7.107297420501709, "global_step": 182713, "epoch": 4350} {"train_loss": -7.171302795410156, "global_step": 182714, "epoch": 4350} {"train_loss": -7.149875640869141, "global_step": 182715, "epoch": 4350} {"train_loss": -7.2729811668396, "global_step": 182716, "epoch": 4350} {"train_loss": -7.094389915466309, "global_step": 182717, "epoch": 4350} {"train_loss": -7.121186256408691, "global_step": 182718, "epoch": 4350} {"train_loss": -7.189608097076416, "global_step": 182719, "epoch": 4350} {"train_loss": -6.9715576171875, "global_step": 182720, "epoch": 4350} {"train_loss": -7.159412384033203, "global_step": 182721, "epoch": 4350} {"train_loss": -7.227897644042969, "global_step": 182722, "epoch": 4350} {"train_loss": -7.278188705444336, "global_step": 182723, "epoch": 4350} {"train_loss": -7.047205924987793, "global_step": 182724, "epoch": 4350} {"train_loss": -7.067975044250488, "global_step": 182725, "epoch": 4350} {"train_loss": -7.117679119110107, "global_step": 182726, "epoch": 4350} {"train_loss": -7.268550872802734, "global_step": 182727, "epoch": 4350} {"train_loss": -7.138493537902832, "global_step": 182728, "epoch": 4350} {"train_loss": -7.211524963378906, "global_step": 182729, "epoch": 4350} {"train_loss": -7.162988662719727, "global_step": 182730, "epoch": 4350} {"train_loss": -7.0711188316345215, "global_step": 182731, "epoch": 4350} {"train_loss": -7.203248500823975, "global_step": 182732, "epoch": 4350} {"train_loss": -7.101845741271973, "global_step": 182733, "epoch": 4350} {"train_loss": -7.186677932739258, "global_step": 182734, "epoch": 4350} {"train_loss": -7.143566131591797, "global_step": 182735, "epoch": 4350} {"train_loss": -7.1082987785339355, "global_step": 182736, "epoch": 4350} {"train_loss": -7.076617240905762, "global_step": 182737, "epoch": 4350} {"train_loss": -7.195725440979004, "global_step": 182738, "epoch": 4350} {"train_loss": -7.066174507141113, "global_step": 182739, "epoch": 4350} {"train_loss": -7.091671943664551, "global_step": 182740, "epoch": 4350} {"train_loss": -7.143804470698039, "global_step": 182741, "epoch": 4350, "train/sim_max_reward_0": 0.4079929737795392, "train/sim_max_reward_1": 0.957791005234654, "train/sim_max_reward_2": 0.5527054045482418, "train/sim_max_reward_3": 0.13376980475468203, "train/sim_max_reward_4": 0.2317521793012011, "train/sim_max_reward_5": 0.5675956029215968, "test/sim_max_reward_4500000": 0.9980567331085219, "test/sim_max_reward_4500001": 0.9503655418349682, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9790970709956841, "test/sim_max_reward_4500004": 0.14380599599983596, "test/sim_max_reward_4500005": 0.8392226005431188, "test/sim_max_reward_4500006": 0.9655853894822631, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.3418965852456021, "test/sim_max_reward_4500009": 0.9311223985567582, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.9006796948536824, "test/sim_max_reward_4500012": 0.9453535853795637, "test/sim_max_reward_4500013": 0.002835757249481858, "test/sim_max_reward_4500014": 0.38957988804951754, "test/sim_max_reward_4500015": 0.12697801389752286, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.05992571688709724, "test/sim_max_reward_4500018": 0.4666082544299352, "test/sim_max_reward_4500019": 0.9154919057275657, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.8893521156451839, "test/sim_max_reward_4500023": 0.8646433514086198, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 1.0, "test/sim_max_reward_4500026": 0.9661706978613778, "test/sim_max_reward_4500027": 0.9885120745622814, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.04163460642148004, "test/sim_max_reward_4500030": 0.9904259314557806, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.24634146586950323, "test/sim_max_reward_4500034": 0.8976306407464001, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 0.9966414209374815, "test/sim_max_reward_4500037": 1.0, "test/sim_max_reward_4500038": 0.36146749354584273, "test/sim_max_reward_4500039": 0.9273345468319245, "test/sim_max_reward_4500040": 0.9823120055266118, "test/sim_max_reward_4500041": 0.9808387629115162, "test/sim_max_reward_4500042": 0.04104758704238243, "test/sim_max_reward_4500043": 0.370188150771393, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.601080486734783, "test/sim_max_reward_4500046": 0.08914073810283256, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.986302154476007, "test/sim_max_reward_4500049": 0.945186189612682, "train/mean_score": 0.47526782842331916, "test/mean_score": 0.5875017332258924, "val_loss": 80798.4140625} {"train_loss": -7.106068134307861, "global_step": 182742, "epoch": 4351} {"train_loss": -7.037538528442383, "global_step": 182743, "epoch": 4351} {"train_loss": -7.1752424240112305, "global_step": 182744, "epoch": 4351} {"train_loss": -7.140316009521484, "global_step": 182745, "epoch": 4351} {"train_loss": -7.135153293609619, "global_step": 182746, "epoch": 4351} {"train_loss": -6.9322357177734375, "global_step": 182747, "epoch": 4351} {"train_loss": -7.220005989074707, "global_step": 182748, "epoch": 4351} {"train_loss": -7.07126522064209, "global_step": 182749, "epoch": 4351} {"train_loss": -7.126370429992676, "global_step": 182750, "epoch": 4351} {"train_loss": -7.02385139465332, "global_step": 182751, "epoch": 4351} {"train_loss": -7.07810115814209, "global_step": 182752, "epoch": 4351} {"train_loss": -7.164614200592041, "global_step": 182753, "epoch": 4351} {"train_loss": -7.099691867828369, "global_step": 182754, "epoch": 4351} {"train_loss": -7.109500885009766, "global_step": 182755, "epoch": 4351} {"train_loss": -7.060171604156494, "global_step": 182756, "epoch": 4351} {"train_loss": -7.159355640411377, "global_step": 182757, "epoch": 4351} {"train_loss": -7.124078273773193, "global_step": 182758, "epoch": 4351} {"train_loss": -7.054749488830566, "global_step": 182759, "epoch": 4351} {"train_loss": -7.2142133712768555, "global_step": 182760, "epoch": 4351} {"train_loss": -7.124695777893066, "global_step": 182761, "epoch": 4351} {"train_loss": -7.110791206359863, "global_step": 182762, "epoch": 4351} {"train_loss": -7.200623035430908, "global_step": 182763, "epoch": 4351} {"train_loss": -7.1649980545043945, "global_step": 182764, "epoch": 4351} {"train_loss": -7.299578666687012, "global_step": 182765, "epoch": 4351} {"train_loss": -7.149991989135742, "global_step": 182766, "epoch": 4351} {"train_loss": -7.207228660583496, "global_step": 182767, "epoch": 4351} {"train_loss": -7.224994659423828, "global_step": 182768, "epoch": 4351} {"train_loss": -7.0086469650268555, "global_step": 182769, "epoch": 4351} {"train_loss": -7.343610763549805, "global_step": 182770, "epoch": 4351} {"train_loss": -7.124892234802246, "global_step": 182771, "epoch": 4351} {"train_loss": -7.163722515106201, "global_step": 182772, "epoch": 4351} {"train_loss": -7.1425371170043945, "global_step": 182773, "epoch": 4351} {"train_loss": -7.221410751342773, "global_step": 182774, "epoch": 4351} {"train_loss": -7.169919013977051, "global_step": 182775, "epoch": 4351} {"train_loss": -7.151651382446289, "global_step": 182776, "epoch": 4351} {"train_loss": -7.12015438079834, "global_step": 182777, "epoch": 4351} {"train_loss": -7.127987861633301, "global_step": 182778, "epoch": 4351} {"train_loss": -7.180059432983398, "global_step": 182779, "epoch": 4351} {"train_loss": -7.090570449829102, "global_step": 182780, "epoch": 4351} {"train_loss": -7.048513889312744, "global_step": 182781, "epoch": 4351} {"train_loss": -7.213010787963867, "global_step": 182782, "epoch": 4351} {"train_loss": -7.136990445000785, "global_step": 182783, "epoch": 4351, "val_loss": 80594.3046875} {"train_loss": -7.171123027801514, "global_step": 182784, "epoch": 4352} {"train_loss": -7.2241106033325195, "global_step": 182785, "epoch": 4352} {"train_loss": -7.116018772125244, "global_step": 182786, "epoch": 4352} {"train_loss": -7.126211643218994, "global_step": 182787, "epoch": 4352} {"train_loss": -7.199824333190918, "global_step": 182788, "epoch": 4352} {"train_loss": -7.003263473510742, "global_step": 182789, "epoch": 4352} {"train_loss": -7.2012128829956055, "global_step": 182790, "epoch": 4352} {"train_loss": -7.142075538635254, "global_step": 182791, "epoch": 4352} {"train_loss": -7.040281772613525, "global_step": 182792, "epoch": 4352} {"train_loss": -7.134888172149658, "global_step": 182793, "epoch": 4352} {"train_loss": -6.9539899826049805, "global_step": 182794, "epoch": 4352} {"train_loss": -7.074795722961426, "global_step": 182795, "epoch": 4352} {"train_loss": -7.043076515197754, "global_step": 182796, "epoch": 4352} {"train_loss": -7.138284683227539, "global_step": 182797, "epoch": 4352} {"train_loss": -7.105348587036133, "global_step": 182798, "epoch": 4352} {"train_loss": -7.068159103393555, "global_step": 182799, "epoch": 4352} {"train_loss": -7.17665958404541, "global_step": 182800, "epoch": 4352} {"train_loss": -6.975827693939209, "global_step": 182801, "epoch": 4352} {"train_loss": -7.004045486450195, "global_step": 182802, "epoch": 4352} {"train_loss": -7.103796005249023, "global_step": 182803, "epoch": 4352} {"train_loss": -7.092994689941406, "global_step": 182804, "epoch": 4352} {"train_loss": -7.156429290771484, "global_step": 182805, "epoch": 4352} {"train_loss": -7.120278358459473, "global_step": 182806, "epoch": 4352} {"train_loss": -7.056731700897217, "global_step": 182807, "epoch": 4352} {"train_loss": -7.02926778793335, "global_step": 182808, "epoch": 4352} {"train_loss": -7.15182638168335, "global_step": 182809, "epoch": 4352} {"train_loss": -6.9506940841674805, "global_step": 182810, "epoch": 4352} {"train_loss": -7.109039783477783, "global_step": 182811, "epoch": 4352} {"train_loss": -7.020832538604736, "global_step": 182812, "epoch": 4352} {"train_loss": -7.102827548980713, "global_step": 182813, "epoch": 4352} {"train_loss": -7.156588554382324, "global_step": 182814, "epoch": 4352} {"train_loss": -6.956165313720703, "global_step": 182815, "epoch": 4352} {"train_loss": -7.210948944091797, "global_step": 182816, "epoch": 4352} {"train_loss": -7.174176216125488, "global_step": 182817, "epoch": 4352} {"train_loss": -7.128583908081055, "global_step": 182818, "epoch": 4352} {"train_loss": -7.201506614685059, "global_step": 182819, "epoch": 4352} {"train_loss": -6.997331142425537, "global_step": 182820, "epoch": 4352} {"train_loss": -7.082943916320801, "global_step": 182821, "epoch": 4352} {"train_loss": -7.119290351867676, "global_step": 182822, "epoch": 4352} {"train_loss": -7.206695556640625, "global_step": 182823, "epoch": 4352} {"train_loss": -7.194732189178467, "global_step": 182824, "epoch": 4352} {"train_loss": -7.10554930141994, "global_step": 182825, "epoch": 4352, "val_loss": 80684.4375} {"train_loss": -7.147339820861816, "global_step": 182826, "epoch": 4353} {"train_loss": -7.256504535675049, "global_step": 182827, "epoch": 4353} {"train_loss": -7.17354679107666, "global_step": 182828, "epoch": 4353} {"train_loss": -7.2330522537231445, "global_step": 182829, "epoch": 4353} {"train_loss": -7.325967788696289, "global_step": 182830, "epoch": 4353} {"train_loss": -7.1878156661987305, "global_step": 182831, "epoch": 4353} {"train_loss": -7.13388729095459, "global_step": 182832, "epoch": 4353} {"train_loss": -7.121617317199707, "global_step": 182833, "epoch": 4353} {"train_loss": -7.071792125701904, "global_step": 182834, "epoch": 4353} {"train_loss": -7.182263374328613, "global_step": 182835, "epoch": 4353} {"train_loss": -7.022124290466309, "global_step": 182836, "epoch": 4353} {"train_loss": -7.12939453125, "global_step": 182837, "epoch": 4353} {"train_loss": -7.155476093292236, "global_step": 182838, "epoch": 4353} {"train_loss": -7.185311317443848, "global_step": 182839, "epoch": 4353} {"train_loss": -7.145299911499023, "global_step": 182840, "epoch": 4353} {"train_loss": -7.080464839935303, "global_step": 182841, "epoch": 4353} {"train_loss": -7.146332740783691, "global_step": 182842, "epoch": 4353} {"train_loss": -7.194337844848633, "global_step": 182843, "epoch": 4353} {"train_loss": -7.127174377441406, "global_step": 182844, "epoch": 4353} {"train_loss": -7.104909896850586, "global_step": 182845, "epoch": 4353} {"train_loss": -7.209578514099121, "global_step": 182846, "epoch": 4353} {"train_loss": -7.01920223236084, "global_step": 182847, "epoch": 4353} {"train_loss": -7.129507064819336, "global_step": 182848, "epoch": 4353} {"train_loss": -7.240865707397461, "global_step": 182849, "epoch": 4353} {"train_loss": -7.240298271179199, "global_step": 182850, "epoch": 4353} {"train_loss": -7.11846923828125, "global_step": 182851, "epoch": 4353} {"train_loss": -7.27610445022583, "global_step": 182852, "epoch": 4353} {"train_loss": -7.12445068359375, "global_step": 182853, "epoch": 4353} {"train_loss": -7.314499378204346, "global_step": 182854, "epoch": 4353} {"train_loss": -7.121531963348389, "global_step": 182855, "epoch": 4353} {"train_loss": -7.1717848777771, "global_step": 182856, "epoch": 4353} {"train_loss": -7.087120056152344, "global_step": 182857, "epoch": 4353} {"train_loss": -7.100738525390625, "global_step": 182858, "epoch": 4353} {"train_loss": -7.100374698638916, "global_step": 182859, "epoch": 4353} {"train_loss": -7.269464492797852, "global_step": 182860, "epoch": 4353} {"train_loss": -7.181585311889648, "global_step": 182861, "epoch": 4353} {"train_loss": -7.0874552726745605, "global_step": 182862, "epoch": 4353} {"train_loss": -7.107109546661377, "global_step": 182863, "epoch": 4353} {"train_loss": -7.127559661865234, "global_step": 182864, "epoch": 4353} {"train_loss": -7.214814186096191, "global_step": 182865, "epoch": 4353} {"train_loss": -7.125909805297852, "global_step": 182866, "epoch": 4353} {"train_loss": -7.155991179602487, "global_step": 182867, "epoch": 4353, "val_loss": 80605.046875} {"train_loss": -7.232524394989014, "global_step": 182868, "epoch": 4354} {"train_loss": -7.1626787185668945, "global_step": 182869, "epoch": 4354} {"train_loss": -7.151062965393066, "global_step": 182870, "epoch": 4354} {"train_loss": -7.194069862365723, "global_step": 182871, "epoch": 4354} {"train_loss": -7.079093933105469, "global_step": 182872, "epoch": 4354} {"train_loss": -7.139962673187256, "global_step": 182873, "epoch": 4354} {"train_loss": -7.056736946105957, "global_step": 182874, "epoch": 4354} {"train_loss": -7.176285743713379, "global_step": 182875, "epoch": 4354} {"train_loss": -7.275720596313477, "global_step": 182876, "epoch": 4354} {"train_loss": -7.138523578643799, "global_step": 182877, "epoch": 4354} {"train_loss": -7.167882919311523, "global_step": 182878, "epoch": 4354} {"train_loss": -7.190454959869385, "global_step": 182879, "epoch": 4354} {"train_loss": -7.312344074249268, "global_step": 182880, "epoch": 4354} {"train_loss": -7.241131782531738, "global_step": 182881, "epoch": 4354} {"train_loss": -7.117039680480957, "global_step": 182882, "epoch": 4354} {"train_loss": -7.229091167449951, "global_step": 182883, "epoch": 4354} {"train_loss": -7.102499961853027, "global_step": 182884, "epoch": 4354} {"train_loss": -7.085033893585205, "global_step": 182885, "epoch": 4354} {"train_loss": -7.148867607116699, "global_step": 182886, "epoch": 4354} {"train_loss": -7.042186737060547, "global_step": 182887, "epoch": 4354} {"train_loss": -7.134493827819824, "global_step": 182888, "epoch": 4354} {"train_loss": -7.013967990875244, "global_step": 182889, "epoch": 4354} {"train_loss": -6.906623840332031, "global_step": 182890, "epoch": 4354} {"train_loss": -7.078540802001953, "global_step": 182891, "epoch": 4354} {"train_loss": -6.935530662536621, "global_step": 182892, "epoch": 4354} {"train_loss": -7.157251358032227, "global_step": 182893, "epoch": 4354} {"train_loss": -7.007970333099365, "global_step": 182894, "epoch": 4354} {"train_loss": -7.208856582641602, "global_step": 182895, "epoch": 4354} {"train_loss": -7.122410774230957, "global_step": 182896, "epoch": 4354} {"train_loss": -7.249075889587402, "global_step": 182897, "epoch": 4354} {"train_loss": -7.226845741271973, "global_step": 182898, "epoch": 4354} {"train_loss": -7.292141914367676, "global_step": 182899, "epoch": 4354} {"train_loss": -7.168249130249023, "global_step": 182900, "epoch": 4354} {"train_loss": -7.184917449951172, "global_step": 182901, "epoch": 4354} {"train_loss": -7.16902494430542, "global_step": 182902, "epoch": 4354} {"train_loss": -7.2677693367004395, "global_step": 182903, "epoch": 4354} {"train_loss": -7.190484046936035, "global_step": 182904, "epoch": 4354} {"train_loss": -7.148565769195557, "global_step": 182905, "epoch": 4354} {"train_loss": -7.144842147827148, "global_step": 182906, "epoch": 4354} {"train_loss": -7.161376953125, "global_step": 182907, "epoch": 4354} {"train_loss": -7.053203582763672, "global_step": 182908, "epoch": 4354} {"train_loss": -7.147321553457351, "global_step": 182909, "epoch": 4354, "val_loss": 80488.421875} {"train_loss": -6.968130111694336, "global_step": 182910, "epoch": 4355} {"train_loss": -7.079568386077881, "global_step": 182911, "epoch": 4355} {"train_loss": -7.188316822052002, "global_step": 182912, "epoch": 4355} {"train_loss": -7.259975433349609, "global_step": 182913, "epoch": 4355} {"train_loss": -7.128233909606934, "global_step": 182914, "epoch": 4355} {"train_loss": -7.098109722137451, "global_step": 182915, "epoch": 4355} {"train_loss": -7.209284782409668, "global_step": 182916, "epoch": 4355} {"train_loss": -7.162693023681641, "global_step": 182917, "epoch": 4355} {"train_loss": -7.234318733215332, "global_step": 182918, "epoch": 4355} {"train_loss": -7.013943672180176, "global_step": 182919, "epoch": 4355} {"train_loss": -7.197162628173828, "global_step": 182920, "epoch": 4355} {"train_loss": -7.080483436584473, "global_step": 182921, "epoch": 4355} {"train_loss": -7.1425604820251465, "global_step": 182922, "epoch": 4355} {"train_loss": -7.13522481918335, "global_step": 182923, "epoch": 4355} {"train_loss": -7.3157243728637695, "global_step": 182924, "epoch": 4355} {"train_loss": -6.96358585357666, "global_step": 182925, "epoch": 4355} {"train_loss": -6.952329635620117, "global_step": 182926, "epoch": 4355} {"train_loss": -7.210238933563232, "global_step": 182927, "epoch": 4355} {"train_loss": -7.08273458480835, "global_step": 182928, "epoch": 4355} {"train_loss": -7.152830600738525, "global_step": 182929, "epoch": 4355} {"train_loss": -7.144481658935547, "global_step": 182930, "epoch": 4355} {"train_loss": -7.014196872711182, "global_step": 182931, "epoch": 4355} {"train_loss": -7.052711486816406, "global_step": 182932, "epoch": 4355} {"train_loss": -6.938257694244385, "global_step": 182933, "epoch": 4355} {"train_loss": -7.049897193908691, "global_step": 182934, "epoch": 4355} {"train_loss": -7.028728008270264, "global_step": 182935, "epoch": 4355} {"train_loss": -7.019087791442871, "global_step": 182936, "epoch": 4355} {"train_loss": -6.963822364807129, "global_step": 182937, "epoch": 4355} {"train_loss": -7.007831573486328, "global_step": 182938, "epoch": 4355} {"train_loss": -7.083802223205566, "global_step": 182939, "epoch": 4355} {"train_loss": -7.034910678863525, "global_step": 182940, "epoch": 4355} {"train_loss": -7.036646842956543, "global_step": 182941, "epoch": 4355} {"train_loss": -7.0717291831970215, "global_step": 182942, "epoch": 4355} {"train_loss": -6.882925987243652, "global_step": 182943, "epoch": 4355} {"train_loss": -7.041247367858887, "global_step": 182944, "epoch": 4355} {"train_loss": -7.010478973388672, "global_step": 182945, "epoch": 4355} {"train_loss": -7.071319580078125, "global_step": 182946, "epoch": 4355} {"train_loss": -7.065798759460449, "global_step": 182947, "epoch": 4355} {"train_loss": -7.109378814697266, "global_step": 182948, "epoch": 4355} {"train_loss": -6.965300559997559, "global_step": 182949, "epoch": 4355} {"train_loss": -7.047897815704346, "global_step": 182950, "epoch": 4355} {"train_loss": -7.079060849689302, "global_step": 182951, "epoch": 4355, "val_loss": 80646.109375} {"train_loss": -7.043336868286133, "global_step": 182952, "epoch": 4356} {"train_loss": -7.089038848876953, "global_step": 182953, "epoch": 4356} {"train_loss": -7.081363677978516, "global_step": 182954, "epoch": 4356} {"train_loss": -7.135821342468262, "global_step": 182955, "epoch": 4356} {"train_loss": -7.0100202560424805, "global_step": 182956, "epoch": 4356} {"train_loss": -7.132569789886475, "global_step": 182957, "epoch": 4356} {"train_loss": -7.056131362915039, "global_step": 182958, "epoch": 4356} {"train_loss": -7.130246162414551, "global_step": 182959, "epoch": 4356} {"train_loss": -7.215803146362305, "global_step": 182960, "epoch": 4356} {"train_loss": -7.119545936584473, "global_step": 182961, "epoch": 4356} {"train_loss": -7.139758586883545, "global_step": 182962, "epoch": 4356} {"train_loss": -7.167239189147949, "global_step": 182963, "epoch": 4356} {"train_loss": -7.215659141540527, "global_step": 182964, "epoch": 4356} {"train_loss": -7.229190349578857, "global_step": 182965, "epoch": 4356} {"train_loss": -7.1290669441223145, "global_step": 182966, "epoch": 4356} {"train_loss": -7.254171848297119, "global_step": 182967, "epoch": 4356} {"train_loss": -7.164623737335205, "global_step": 182968, "epoch": 4356} {"train_loss": -7.091573715209961, "global_step": 182969, "epoch": 4356} {"train_loss": -7.128559112548828, "global_step": 182970, "epoch": 4356} {"train_loss": -7.15777063369751, "global_step": 182971, "epoch": 4356} {"train_loss": -7.229541778564453, "global_step": 182972, "epoch": 4356} {"train_loss": -7.240335464477539, "global_step": 182973, "epoch": 4356} {"train_loss": -7.122134208679199, "global_step": 182974, "epoch": 4356} {"train_loss": -7.11519193649292, "global_step": 182975, "epoch": 4356} {"train_loss": -7.223759651184082, "global_step": 182976, "epoch": 4356} {"train_loss": -7.035148620605469, "global_step": 182977, "epoch": 4356} {"train_loss": -7.27083683013916, "global_step": 182978, "epoch": 4356} {"train_loss": -7.148669242858887, "global_step": 182979, "epoch": 4356} {"train_loss": -7.241194248199463, "global_step": 182980, "epoch": 4356} {"train_loss": -7.124115943908691, "global_step": 182981, "epoch": 4356} {"train_loss": -7.295113563537598, "global_step": 182982, "epoch": 4356} {"train_loss": -7.168023586273193, "global_step": 182983, "epoch": 4356} {"train_loss": -7.271836280822754, "global_step": 182984, "epoch": 4356} {"train_loss": -7.164165019989014, "global_step": 182985, "epoch": 4356} {"train_loss": -7.151222229003906, "global_step": 182986, "epoch": 4356} {"train_loss": -7.152650356292725, "global_step": 182987, "epoch": 4356} {"train_loss": -7.328808307647705, "global_step": 182988, "epoch": 4356} {"train_loss": -7.172685623168945, "global_step": 182989, "epoch": 4356} {"train_loss": -7.330182075500488, "global_step": 182990, "epoch": 4356} {"train_loss": -7.1593828201293945, "global_step": 182991, "epoch": 4356} {"train_loss": -7.060328006744385, "global_step": 182992, "epoch": 4356} {"train_loss": -7.162021988914127, "global_step": 182993, "epoch": 4356, "val_loss": 80438.6640625} {"train_loss": -7.1833906173706055, "global_step": 182994, "epoch": 4357} {"train_loss": -7.117575645446777, "global_step": 182995, "epoch": 4357} {"train_loss": -7.176336288452148, "global_step": 182996, "epoch": 4357} {"train_loss": -7.112796306610107, "global_step": 182997, "epoch": 4357} {"train_loss": -7.101717948913574, "global_step": 182998, "epoch": 4357} {"train_loss": -7.148948669433594, "global_step": 182999, "epoch": 4357} {"train_loss": -7.21895694732666, "global_step": 183000, "epoch": 4357} {"train_loss": -7.241922378540039, "global_step": 183001, "epoch": 4357} {"train_loss": -7.247861385345459, "global_step": 183002, "epoch": 4357} {"train_loss": -7.364160537719727, "global_step": 183003, "epoch": 4357} {"train_loss": -7.106419086456299, "global_step": 183004, "epoch": 4357} {"train_loss": -7.275968074798584, "global_step": 183005, "epoch": 4357} {"train_loss": -7.136567115783691, "global_step": 183006, "epoch": 4357} {"train_loss": -7.078305244445801, "global_step": 183007, "epoch": 4357} {"train_loss": -7.216372489929199, "global_step": 183008, "epoch": 4357} {"train_loss": -7.105040550231934, "global_step": 183009, "epoch": 4357} {"train_loss": -7.188753128051758, "global_step": 183010, "epoch": 4357} {"train_loss": -7.178679466247559, "global_step": 183011, "epoch": 4357} {"train_loss": -7.18339729309082, "global_step": 183012, "epoch": 4357} {"train_loss": -7.0447516441345215, "global_step": 183013, "epoch": 4357} {"train_loss": -6.969455718994141, "global_step": 183014, "epoch": 4357} {"train_loss": -7.179518222808838, "global_step": 183015, "epoch": 4357} {"train_loss": -7.246213436126709, "global_step": 183016, "epoch": 4357} {"train_loss": -7.100363731384277, "global_step": 183017, "epoch": 4357} {"train_loss": -7.207849502563477, "global_step": 183018, "epoch": 4357} {"train_loss": -6.973352432250977, "global_step": 183019, "epoch": 4357} {"train_loss": -7.096249580383301, "global_step": 183020, "epoch": 4357} {"train_loss": -7.182337760925293, "global_step": 183021, "epoch": 4357} {"train_loss": -7.082483291625977, "global_step": 183022, "epoch": 4357} {"train_loss": -7.171575546264648, "global_step": 183023, "epoch": 4357} {"train_loss": -7.073546409606934, "global_step": 183024, "epoch": 4357} {"train_loss": -7.2727251052856445, "global_step": 183025, "epoch": 4357} {"train_loss": -7.1138811111450195, "global_step": 183026, "epoch": 4357} {"train_loss": -7.105759620666504, "global_step": 183027, "epoch": 4357} {"train_loss": -7.158242225646973, "global_step": 183028, "epoch": 4357} {"train_loss": -7.077641487121582, "global_step": 183029, "epoch": 4357} {"train_loss": -7.143136501312256, "global_step": 183030, "epoch": 4357} {"train_loss": -7.116521835327148, "global_step": 183031, "epoch": 4357} {"train_loss": -7.176948070526123, "global_step": 183032, "epoch": 4357} {"train_loss": -7.120574474334717, "global_step": 183033, "epoch": 4357} {"train_loss": -7.217580318450928, "global_step": 183034, "epoch": 4357} {"train_loss": -7.150694211324056, "global_step": 183035, "epoch": 4357, "val_loss": 80649.828125} {"train_loss": -7.196816444396973, "global_step": 183036, "epoch": 4358} {"train_loss": -7.124076843261719, "global_step": 183037, "epoch": 4358} {"train_loss": -7.116677284240723, "global_step": 183038, "epoch": 4358} {"train_loss": -7.2123799324035645, "global_step": 183039, "epoch": 4358} {"train_loss": -7.097321510314941, "global_step": 183040, "epoch": 4358} {"train_loss": -7.256556510925293, "global_step": 183041, "epoch": 4358} {"train_loss": -7.211399555206299, "global_step": 183042, "epoch": 4358} {"train_loss": -7.139268398284912, "global_step": 183043, "epoch": 4358} {"train_loss": -7.25090217590332, "global_step": 183044, "epoch": 4358} {"train_loss": -7.192621231079102, "global_step": 183045, "epoch": 4358} {"train_loss": -7.176843643188477, "global_step": 183046, "epoch": 4358} {"train_loss": -7.207006454467773, "global_step": 183047, "epoch": 4358} {"train_loss": -7.249509334564209, "global_step": 183048, "epoch": 4358} {"train_loss": -7.300580978393555, "global_step": 183049, "epoch": 4358} {"train_loss": -7.150134086608887, "global_step": 183050, "epoch": 4358} {"train_loss": -7.167204856872559, "global_step": 183051, "epoch": 4358} {"train_loss": -7.234803676605225, "global_step": 183052, "epoch": 4358} {"train_loss": -7.2161455154418945, "global_step": 183053, "epoch": 4358} {"train_loss": -7.296562194824219, "global_step": 183054, "epoch": 4358} {"train_loss": -7.29180383682251, "global_step": 183055, "epoch": 4358} {"train_loss": -7.36021614074707, "global_step": 183056, "epoch": 4358} {"train_loss": -7.196950912475586, "global_step": 183057, "epoch": 4358} {"train_loss": -7.161232948303223, "global_step": 183058, "epoch": 4358} {"train_loss": -7.233647346496582, "global_step": 183059, "epoch": 4358} {"train_loss": -7.238576412200928, "global_step": 183060, "epoch": 4358} {"train_loss": -7.221179008483887, "global_step": 183061, "epoch": 4358} {"train_loss": -7.126276969909668, "global_step": 183062, "epoch": 4358} {"train_loss": -7.22163724899292, "global_step": 183063, "epoch": 4358} {"train_loss": -7.216320037841797, "global_step": 183064, "epoch": 4358} {"train_loss": -7.264123916625977, "global_step": 183065, "epoch": 4358} {"train_loss": -7.119527816772461, "global_step": 183066, "epoch": 4358} {"train_loss": -7.137703895568848, "global_step": 183067, "epoch": 4358} {"train_loss": -7.125511169433594, "global_step": 183068, "epoch": 4358} {"train_loss": -7.272660732269287, "global_step": 183069, "epoch": 4358} {"train_loss": -7.1891679763793945, "global_step": 183070, "epoch": 4358} {"train_loss": -7.086636543273926, "global_step": 183071, "epoch": 4358} {"train_loss": -7.20796012878418, "global_step": 183072, "epoch": 4358} {"train_loss": -7.155155658721924, "global_step": 183073, "epoch": 4358} {"train_loss": -7.235516548156738, "global_step": 183074, "epoch": 4358} {"train_loss": -7.175951957702637, "global_step": 183075, "epoch": 4358} {"train_loss": -7.1220622062683105, "global_step": 183076, "epoch": 4358} {"train_loss": -7.195919695354643, "global_step": 183077, "epoch": 4358, "val_loss": 80498.3515625} {"train_loss": -6.83656644821167, "global_step": 183078, "epoch": 4359} {"train_loss": -6.91605281829834, "global_step": 183079, "epoch": 4359} {"train_loss": -7.126717567443848, "global_step": 183080, "epoch": 4359} {"train_loss": -6.678267478942871, "global_step": 183081, "epoch": 4359} {"train_loss": -6.965175628662109, "global_step": 183082, "epoch": 4359} {"train_loss": -7.00810432434082, "global_step": 183083, "epoch": 4359} {"train_loss": -6.660818099975586, "global_step": 183084, "epoch": 4359} {"train_loss": -7.078683853149414, "global_step": 183085, "epoch": 4359} {"train_loss": -6.897521018981934, "global_step": 183086, "epoch": 4359} {"train_loss": -7.035977363586426, "global_step": 183087, "epoch": 4359} {"train_loss": -6.89724063873291, "global_step": 183088, "epoch": 4359} {"train_loss": -6.8657989501953125, "global_step": 183089, "epoch": 4359} {"train_loss": -6.899075984954834, "global_step": 183090, "epoch": 4359} {"train_loss": -6.974760055541992, "global_step": 183091, "epoch": 4359} {"train_loss": -6.9891252517700195, "global_step": 183092, "epoch": 4359} {"train_loss": -6.999628067016602, "global_step": 183093, "epoch": 4359} {"train_loss": -7.079285144805908, "global_step": 183094, "epoch": 4359} {"train_loss": -6.887628555297852, "global_step": 183095, "epoch": 4359} {"train_loss": -7.066783905029297, "global_step": 183096, "epoch": 4359} {"train_loss": -7.115394592285156, "global_step": 183097, "epoch": 4359} {"train_loss": -7.081001281738281, "global_step": 183098, "epoch": 4359} {"train_loss": -7.0025529861450195, "global_step": 183099, "epoch": 4359} {"train_loss": -7.073432445526123, "global_step": 183100, "epoch": 4359} {"train_loss": -7.125096321105957, "global_step": 183101, "epoch": 4359} {"train_loss": -7.189872741699219, "global_step": 183102, "epoch": 4359} {"train_loss": -7.049506187438965, "global_step": 183103, "epoch": 4359} {"train_loss": -7.062870025634766, "global_step": 183104, "epoch": 4359} {"train_loss": -7.071112632751465, "global_step": 183105, "epoch": 4359} {"train_loss": -7.202198028564453, "global_step": 183106, "epoch": 4359} {"train_loss": -7.09503173828125, "global_step": 183107, "epoch": 4359} {"train_loss": -7.171361446380615, "global_step": 183108, "epoch": 4359} {"train_loss": -7.005128383636475, "global_step": 183109, "epoch": 4359} {"train_loss": -7.143925666809082, "global_step": 183110, "epoch": 4359} {"train_loss": -7.216846466064453, "global_step": 183111, "epoch": 4359} {"train_loss": -6.9799418449401855, "global_step": 183112, "epoch": 4359} {"train_loss": -7.126579761505127, "global_step": 183113, "epoch": 4359} {"train_loss": -7.166110038757324, "global_step": 183114, "epoch": 4359} {"train_loss": -7.1182637214660645, "global_step": 183115, "epoch": 4359} {"train_loss": -7.173417568206787, "global_step": 183116, "epoch": 4359} {"train_loss": -7.035676956176758, "global_step": 183117, "epoch": 4359} {"train_loss": -7.249934196472168, "global_step": 183118, "epoch": 4359} {"train_loss": -7.03226934160505, "global_step": 183119, "epoch": 4359, "val_loss": 80544.328125} {"train_loss": -7.106605052947998, "global_step": 183120, "epoch": 4360} {"train_loss": -7.187291622161865, "global_step": 183121, "epoch": 4360} {"train_loss": -7.121915340423584, "global_step": 183122, "epoch": 4360} {"train_loss": -7.306341171264648, "global_step": 183123, "epoch": 4360} {"train_loss": -7.173161506652832, "global_step": 183124, "epoch": 4360} {"train_loss": -7.147322654724121, "global_step": 183125, "epoch": 4360} {"train_loss": -7.176087379455566, "global_step": 183126, "epoch": 4360} {"train_loss": -7.119423866271973, "global_step": 183127, "epoch": 4360} {"train_loss": -7.151660919189453, "global_step": 183128, "epoch": 4360} {"train_loss": -7.119401931762695, "global_step": 183129, "epoch": 4360} {"train_loss": -7.270132064819336, "global_step": 183130, "epoch": 4360} {"train_loss": -7.230066299438477, "global_step": 183131, "epoch": 4360} {"train_loss": -7.098010063171387, "global_step": 183132, "epoch": 4360} {"train_loss": -7.173587799072266, "global_step": 183133, "epoch": 4360} {"train_loss": -7.076077461242676, "global_step": 183134, "epoch": 4360} {"train_loss": -7.268906593322754, "global_step": 183135, "epoch": 4360} {"train_loss": -7.077208518981934, "global_step": 183136, "epoch": 4360} {"train_loss": -7.172245025634766, "global_step": 183137, "epoch": 4360} {"train_loss": -7.122330665588379, "global_step": 183138, "epoch": 4360} {"train_loss": -7.1537628173828125, "global_step": 183139, "epoch": 4360} {"train_loss": -7.017179012298584, "global_step": 183140, "epoch": 4360} {"train_loss": -7.114828586578369, "global_step": 183141, "epoch": 4360} {"train_loss": -7.073010444641113, "global_step": 183142, "epoch": 4360} {"train_loss": -7.153687477111816, "global_step": 183143, "epoch": 4360} {"train_loss": -7.05933952331543, "global_step": 183144, "epoch": 4360} {"train_loss": -7.073308944702148, "global_step": 183145, "epoch": 4360} {"train_loss": -7.022256374359131, "global_step": 183146, "epoch": 4360} {"train_loss": -7.115548133850098, "global_step": 183147, "epoch": 4360} {"train_loss": -7.256992340087891, "global_step": 183148, "epoch": 4360} {"train_loss": -6.995545387268066, "global_step": 183149, "epoch": 4360} {"train_loss": -7.107691764831543, "global_step": 183150, "epoch": 4360} {"train_loss": -6.953375816345215, "global_step": 183151, "epoch": 4360} {"train_loss": -7.109158515930176, "global_step": 183152, "epoch": 4360} {"train_loss": -7.088047027587891, "global_step": 183153, "epoch": 4360} {"train_loss": -7.03431510925293, "global_step": 183154, "epoch": 4360} {"train_loss": -7.070631504058838, "global_step": 183155, "epoch": 4360} {"train_loss": -7.087186336517334, "global_step": 183156, "epoch": 4360} {"train_loss": -7.110608100891113, "global_step": 183157, "epoch": 4360} {"train_loss": -6.999696254730225, "global_step": 183158, "epoch": 4360} {"train_loss": -7.06257438659668, "global_step": 183159, "epoch": 4360} {"train_loss": -7.177700996398926, "global_step": 183160, "epoch": 4360} {"train_loss": -7.1165322689783, "global_step": 183161, "epoch": 4360, "val_loss": 80881.8046875} {"train_loss": -7.101356029510498, "global_step": 183162, "epoch": 4361} {"train_loss": -7.025066375732422, "global_step": 183163, "epoch": 4361} {"train_loss": -7.015657424926758, "global_step": 183164, "epoch": 4361} {"train_loss": -7.041109085083008, "global_step": 183165, "epoch": 4361} {"train_loss": -7.028400421142578, "global_step": 183166, "epoch": 4361} {"train_loss": -7.038782119750977, "global_step": 183167, "epoch": 4361} {"train_loss": -6.986600875854492, "global_step": 183168, "epoch": 4361} {"train_loss": -7.057583808898926, "global_step": 183169, "epoch": 4361} {"train_loss": -7.055513381958008, "global_step": 183170, "epoch": 4361} {"train_loss": -6.822782516479492, "global_step": 183171, "epoch": 4361} {"train_loss": -7.1966376304626465, "global_step": 183172, "epoch": 4361} {"train_loss": -7.001592636108398, "global_step": 183173, "epoch": 4361} {"train_loss": -7.2224440574646, "global_step": 183174, "epoch": 4361} {"train_loss": -7.0600385665893555, "global_step": 183175, "epoch": 4361} {"train_loss": -7.328110694885254, "global_step": 183176, "epoch": 4361} {"train_loss": -6.992111682891846, "global_step": 183177, "epoch": 4361} {"train_loss": -7.231164932250977, "global_step": 183178, "epoch": 4361} {"train_loss": -7.076157093048096, "global_step": 183179, "epoch": 4361} {"train_loss": -7.197561740875244, "global_step": 183180, "epoch": 4361} {"train_loss": -7.210662841796875, "global_step": 183181, "epoch": 4361} {"train_loss": -7.111755847930908, "global_step": 183182, "epoch": 4361} {"train_loss": -7.164503574371338, "global_step": 183183, "epoch": 4361} {"train_loss": -7.13913106918335, "global_step": 183184, "epoch": 4361} {"train_loss": -7.108058929443359, "global_step": 183185, "epoch": 4361} {"train_loss": -7.031777858734131, "global_step": 183186, "epoch": 4361} {"train_loss": -7.078473091125488, "global_step": 183187, "epoch": 4361} {"train_loss": -7.124044418334961, "global_step": 183188, "epoch": 4361} {"train_loss": -7.166985511779785, "global_step": 183189, "epoch": 4361} {"train_loss": -7.032817840576172, "global_step": 183190, "epoch": 4361} {"train_loss": -7.21237850189209, "global_step": 183191, "epoch": 4361} {"train_loss": -7.183384895324707, "global_step": 183192, "epoch": 4361} {"train_loss": -7.0954999923706055, "global_step": 183193, "epoch": 4361} {"train_loss": -7.075143814086914, "global_step": 183194, "epoch": 4361} {"train_loss": -7.269820690155029, "global_step": 183195, "epoch": 4361} {"train_loss": -7.249485492706299, "global_step": 183196, "epoch": 4361} {"train_loss": -7.135210037231445, "global_step": 183197, "epoch": 4361} {"train_loss": -7.170760154724121, "global_step": 183198, "epoch": 4361} {"train_loss": -7.1119585037231445, "global_step": 183199, "epoch": 4361} {"train_loss": -7.23779296875, "global_step": 183200, "epoch": 4361} {"train_loss": -7.18930721282959, "global_step": 183201, "epoch": 4361} {"train_loss": -7.146475791931152, "global_step": 183202, "epoch": 4361} {"train_loss": -7.113388458887736, "global_step": 183203, "epoch": 4361, "val_loss": 80310.765625} {"train_loss": -7.161226272583008, "global_step": 183204, "epoch": 4362} {"train_loss": -7.177011489868164, "global_step": 183205, "epoch": 4362} {"train_loss": -7.016948699951172, "global_step": 183206, "epoch": 4362} {"train_loss": -7.15870475769043, "global_step": 183207, "epoch": 4362} {"train_loss": -7.05517578125, "global_step": 183208, "epoch": 4362} {"train_loss": -7.145014762878418, "global_step": 183209, "epoch": 4362} {"train_loss": -7.225255012512207, "global_step": 183210, "epoch": 4362} {"train_loss": -7.09398889541626, "global_step": 183211, "epoch": 4362} {"train_loss": -7.068238258361816, "global_step": 183212, "epoch": 4362} {"train_loss": -6.995408535003662, "global_step": 183213, "epoch": 4362} {"train_loss": -7.134041786193848, "global_step": 183214, "epoch": 4362} {"train_loss": -7.114792823791504, "global_step": 183215, "epoch": 4362} {"train_loss": -7.1515398025512695, "global_step": 183216, "epoch": 4362} {"train_loss": -7.189857482910156, "global_step": 183217, "epoch": 4362} {"train_loss": -7.052247047424316, "global_step": 183218, "epoch": 4362} {"train_loss": -7.075106143951416, "global_step": 183219, "epoch": 4362} {"train_loss": -7.007253646850586, "global_step": 183220, "epoch": 4362} {"train_loss": -7.091643333435059, "global_step": 183221, "epoch": 4362} {"train_loss": -7.141689777374268, "global_step": 183222, "epoch": 4362} {"train_loss": -7.154156684875488, "global_step": 183223, "epoch": 4362} {"train_loss": -7.149130344390869, "global_step": 183224, "epoch": 4362} {"train_loss": -7.066616058349609, "global_step": 183225, "epoch": 4362} {"train_loss": -7.047303199768066, "global_step": 183226, "epoch": 4362} {"train_loss": -7.082851886749268, "global_step": 183227, "epoch": 4362} {"train_loss": -6.984210014343262, "global_step": 183228, "epoch": 4362} {"train_loss": -7.022339820861816, "global_step": 183229, "epoch": 4362} {"train_loss": -7.111145973205566, "global_step": 183230, "epoch": 4362} {"train_loss": -7.011434555053711, "global_step": 183231, "epoch": 4362} {"train_loss": -7.182982444763184, "global_step": 183232, "epoch": 4362} {"train_loss": -7.205570697784424, "global_step": 183233, "epoch": 4362} {"train_loss": -7.032313346862793, "global_step": 183234, "epoch": 4362} {"train_loss": -7.236769676208496, "global_step": 183235, "epoch": 4362} {"train_loss": -7.128928184509277, "global_step": 183236, "epoch": 4362} {"train_loss": -7.128755569458008, "global_step": 183237, "epoch": 4362} {"train_loss": -7.206306457519531, "global_step": 183238, "epoch": 4362} {"train_loss": -7.155815601348877, "global_step": 183239, "epoch": 4362} {"train_loss": -7.197998046875, "global_step": 183240, "epoch": 4362} {"train_loss": -7.148166179656982, "global_step": 183241, "epoch": 4362} {"train_loss": -7.162138938903809, "global_step": 183242, "epoch": 4362} {"train_loss": -7.2427802085876465, "global_step": 183243, "epoch": 4362} {"train_loss": -7.137155055999756, "global_step": 183244, "epoch": 4362} {"train_loss": -7.120241255987258, "global_step": 183245, "epoch": 4362, "val_loss": 80651.59375} {"train_loss": -7.269536018371582, "global_step": 183246, "epoch": 4363} {"train_loss": -7.216556072235107, "global_step": 183247, "epoch": 4363} {"train_loss": -7.141921043395996, "global_step": 183248, "epoch": 4363} {"train_loss": -7.118620872497559, "global_step": 183249, "epoch": 4363} {"train_loss": -7.138737678527832, "global_step": 183250, "epoch": 4363} {"train_loss": -7.258501052856445, "global_step": 183251, "epoch": 4363} {"train_loss": -7.242827892303467, "global_step": 183252, "epoch": 4363} {"train_loss": -7.236478805541992, "global_step": 183253, "epoch": 4363} {"train_loss": -7.186849594116211, "global_step": 183254, "epoch": 4363} {"train_loss": -7.1774444580078125, "global_step": 183255, "epoch": 4363} {"train_loss": -7.262361526489258, "global_step": 183256, "epoch": 4363} {"train_loss": -7.160493850708008, "global_step": 183257, "epoch": 4363} {"train_loss": -7.170217514038086, "global_step": 183258, "epoch": 4363} {"train_loss": -7.098236083984375, "global_step": 183259, "epoch": 4363} {"train_loss": -7.207756042480469, "global_step": 183260, "epoch": 4363} {"train_loss": -7.177310943603516, "global_step": 183261, "epoch": 4363} {"train_loss": -7.151607513427734, "global_step": 183262, "epoch": 4363} {"train_loss": -7.114313125610352, "global_step": 183263, "epoch": 4363} {"train_loss": -7.101874351501465, "global_step": 183264, "epoch": 4363} {"train_loss": -7.193920135498047, "global_step": 183265, "epoch": 4363} {"train_loss": -7.199746131896973, "global_step": 183266, "epoch": 4363} {"train_loss": -7.1124114990234375, "global_step": 183267, "epoch": 4363} {"train_loss": -7.151162147521973, "global_step": 183268, "epoch": 4363} {"train_loss": -7.092321395874023, "global_step": 183269, "epoch": 4363} {"train_loss": -7.208956718444824, "global_step": 183270, "epoch": 4363} {"train_loss": -7.3031110763549805, "global_step": 183271, "epoch": 4363} {"train_loss": -7.141294002532959, "global_step": 183272, "epoch": 4363} {"train_loss": -7.213300704956055, "global_step": 183273, "epoch": 4363} {"train_loss": -7.164595127105713, "global_step": 183274, "epoch": 4363} {"train_loss": -7.203418731689453, "global_step": 183275, "epoch": 4363} {"train_loss": -7.1361985206604, "global_step": 183276, "epoch": 4363} {"train_loss": -7.252276420593262, "global_step": 183277, "epoch": 4363} {"train_loss": -7.142241477966309, "global_step": 183278, "epoch": 4363} {"train_loss": -7.210761070251465, "global_step": 183279, "epoch": 4363} {"train_loss": -7.138848304748535, "global_step": 183280, "epoch": 4363} {"train_loss": -7.09052848815918, "global_step": 183281, "epoch": 4363} {"train_loss": -7.285826683044434, "global_step": 183282, "epoch": 4363} {"train_loss": -7.236445426940918, "global_step": 183283, "epoch": 4363} {"train_loss": -7.118846416473389, "global_step": 183284, "epoch": 4363} {"train_loss": -7.070995330810547, "global_step": 183285, "epoch": 4363} {"train_loss": -7.098472595214844, "global_step": 183286, "epoch": 4363} {"train_loss": -7.16978425071353, "global_step": 183287, "epoch": 4363, "val_loss": 80678.7890625} {"train_loss": -7.1635661125183105, "global_step": 183288, "epoch": 4364} {"train_loss": -7.140301704406738, "global_step": 183289, "epoch": 4364} {"train_loss": -6.987348556518555, "global_step": 183290, "epoch": 4364} {"train_loss": -7.134937286376953, "global_step": 183291, "epoch": 4364} {"train_loss": -7.058589935302734, "global_step": 183292, "epoch": 4364} {"train_loss": -7.03415584564209, "global_step": 183293, "epoch": 4364} {"train_loss": -7.039694786071777, "global_step": 183294, "epoch": 4364} {"train_loss": -7.128337860107422, "global_step": 183295, "epoch": 4364} {"train_loss": -7.164483547210693, "global_step": 183296, "epoch": 4364} {"train_loss": -7.157236576080322, "global_step": 183297, "epoch": 4364} {"train_loss": -7.167104721069336, "global_step": 183298, "epoch": 4364} {"train_loss": -7.248345375061035, "global_step": 183299, "epoch": 4364} {"train_loss": -7.115478515625, "global_step": 183300, "epoch": 4364} {"train_loss": -7.147670269012451, "global_step": 183301, "epoch": 4364} {"train_loss": -7.142025947570801, "global_step": 183302, "epoch": 4364} {"train_loss": -7.186275482177734, "global_step": 183303, "epoch": 4364} {"train_loss": -7.183782577514648, "global_step": 183304, "epoch": 4364} {"train_loss": -7.190679550170898, "global_step": 183305, "epoch": 4364} {"train_loss": -7.1402997970581055, "global_step": 183306, "epoch": 4364} {"train_loss": -7.248610496520996, "global_step": 183307, "epoch": 4364} {"train_loss": -7.166223526000977, "global_step": 183308, "epoch": 4364} {"train_loss": -7.218465805053711, "global_step": 183309, "epoch": 4364} {"train_loss": -7.213896751403809, "global_step": 183310, "epoch": 4364} {"train_loss": -7.155552864074707, "global_step": 183311, "epoch": 4364} {"train_loss": -7.1507344245910645, "global_step": 183312, "epoch": 4364} {"train_loss": -7.173414707183838, "global_step": 183313, "epoch": 4364} {"train_loss": -7.1721954345703125, "global_step": 183314, "epoch": 4364} {"train_loss": -7.010485649108887, "global_step": 183315, "epoch": 4364} {"train_loss": -7.250509262084961, "global_step": 183316, "epoch": 4364} {"train_loss": -7.221200466156006, "global_step": 183317, "epoch": 4364} {"train_loss": -7.156979560852051, "global_step": 183318, "epoch": 4364} {"train_loss": -7.191389560699463, "global_step": 183319, "epoch": 4364} {"train_loss": -7.246170997619629, "global_step": 183320, "epoch": 4364} {"train_loss": -7.168063163757324, "global_step": 183321, "epoch": 4364} {"train_loss": -7.113328456878662, "global_step": 183322, "epoch": 4364} {"train_loss": -7.126707077026367, "global_step": 183323, "epoch": 4364} {"train_loss": -7.042911529541016, "global_step": 183324, "epoch": 4364} {"train_loss": -7.141153335571289, "global_step": 183325, "epoch": 4364} {"train_loss": -7.218497276306152, "global_step": 183326, "epoch": 4364} {"train_loss": -7.174415588378906, "global_step": 183327, "epoch": 4364} {"train_loss": -7.0874104499816895, "global_step": 183328, "epoch": 4364} {"train_loss": -7.151994625727336, "global_step": 183329, "epoch": 4364, "val_loss": 80673.125} {"train_loss": -7.18193244934082, "global_step": 183330, "epoch": 4365} {"train_loss": -7.199859142303467, "global_step": 183331, "epoch": 4365} {"train_loss": -7.160700798034668, "global_step": 183332, "epoch": 4365} {"train_loss": -7.11142110824585, "global_step": 183333, "epoch": 4365} {"train_loss": -7.089590072631836, "global_step": 183334, "epoch": 4365} {"train_loss": -7.156111717224121, "global_step": 183335, "epoch": 4365} {"train_loss": -7.233928680419922, "global_step": 183336, "epoch": 4365} {"train_loss": -7.20662784576416, "global_step": 183337, "epoch": 4365} {"train_loss": -7.165891170501709, "global_step": 183338, "epoch": 4365} {"train_loss": -7.15521240234375, "global_step": 183339, "epoch": 4365} {"train_loss": -7.22045373916626, "global_step": 183340, "epoch": 4365} {"train_loss": -7.1171345710754395, "global_step": 183341, "epoch": 4365} {"train_loss": -7.117667198181152, "global_step": 183342, "epoch": 4365} {"train_loss": -7.181291580200195, "global_step": 183343, "epoch": 4365} {"train_loss": -7.192590236663818, "global_step": 183344, "epoch": 4365} {"train_loss": -7.205169677734375, "global_step": 183345, "epoch": 4365} {"train_loss": -7.129898548126221, "global_step": 183346, "epoch": 4365} {"train_loss": -7.170022010803223, "global_step": 183347, "epoch": 4365} {"train_loss": -7.119606971740723, "global_step": 183348, "epoch": 4365} {"train_loss": -7.180356025695801, "global_step": 183349, "epoch": 4365} {"train_loss": -7.176247596740723, "global_step": 183350, "epoch": 4365} {"train_loss": -7.180869102478027, "global_step": 183351, "epoch": 4365} {"train_loss": -7.035759925842285, "global_step": 183352, "epoch": 4365} {"train_loss": -7.169285774230957, "global_step": 183353, "epoch": 4365} {"train_loss": -7.178535461425781, "global_step": 183354, "epoch": 4365} {"train_loss": -7.212193489074707, "global_step": 183355, "epoch": 4365} {"train_loss": -7.282001972198486, "global_step": 183356, "epoch": 4365} {"train_loss": -7.289250373840332, "global_step": 183357, "epoch": 4365} {"train_loss": -7.226687431335449, "global_step": 183358, "epoch": 4365} {"train_loss": -7.258301258087158, "global_step": 183359, "epoch": 4365} {"train_loss": -7.198399543762207, "global_step": 183360, "epoch": 4365} {"train_loss": -7.026677131652832, "global_step": 183361, "epoch": 4365} {"train_loss": -7.179281234741211, "global_step": 183362, "epoch": 4365} {"train_loss": -7.194388389587402, "global_step": 183363, "epoch": 4365} {"train_loss": -7.221123695373535, "global_step": 183364, "epoch": 4365} {"train_loss": -7.164318084716797, "global_step": 183365, "epoch": 4365} {"train_loss": -7.139786720275879, "global_step": 183366, "epoch": 4365} {"train_loss": -7.098860740661621, "global_step": 183367, "epoch": 4365} {"train_loss": -7.2337141036987305, "global_step": 183368, "epoch": 4365} {"train_loss": -7.138681411743164, "global_step": 183369, "epoch": 4365} {"train_loss": -7.179969787597656, "global_step": 183370, "epoch": 4365} {"train_loss": -7.173612980615525, "global_step": 183371, "epoch": 4365, "val_loss": 80506.140625} {"train_loss": -7.042206764221191, "global_step": 183372, "epoch": 4366} {"train_loss": -7.080550670623779, "global_step": 183373, "epoch": 4366} {"train_loss": -7.152407646179199, "global_step": 183374, "epoch": 4366} {"train_loss": -7.200594902038574, "global_step": 183375, "epoch": 4366} {"train_loss": -7.1394147872924805, "global_step": 183376, "epoch": 4366} {"train_loss": -7.121380805969238, "global_step": 183377, "epoch": 4366} {"train_loss": -7.241448402404785, "global_step": 183378, "epoch": 4366} {"train_loss": -7.248924255371094, "global_step": 183379, "epoch": 4366} {"train_loss": -7.052051067352295, "global_step": 183380, "epoch": 4366} {"train_loss": -7.258130073547363, "global_step": 183381, "epoch": 4366} {"train_loss": -7.189532279968262, "global_step": 183382, "epoch": 4366} {"train_loss": -7.2169318199157715, "global_step": 183383, "epoch": 4366} {"train_loss": -7.258655548095703, "global_step": 183384, "epoch": 4366} {"train_loss": -7.1525654792785645, "global_step": 183385, "epoch": 4366} {"train_loss": -7.116044998168945, "global_step": 183386, "epoch": 4366} {"train_loss": -7.140913009643555, "global_step": 183387, "epoch": 4366} {"train_loss": -7.3151092529296875, "global_step": 183388, "epoch": 4366} {"train_loss": -7.131101608276367, "global_step": 183389, "epoch": 4366} {"train_loss": -7.167723655700684, "global_step": 183390, "epoch": 4366} {"train_loss": -7.142021179199219, "global_step": 183391, "epoch": 4366} {"train_loss": -7.067026615142822, "global_step": 183392, "epoch": 4366} {"train_loss": -7.152758598327637, "global_step": 183393, "epoch": 4366} {"train_loss": -7.193002700805664, "global_step": 183394, "epoch": 4366} {"train_loss": -7.213115692138672, "global_step": 183395, "epoch": 4366} {"train_loss": -7.152859687805176, "global_step": 183396, "epoch": 4366} {"train_loss": -7.237844467163086, "global_step": 183397, "epoch": 4366} {"train_loss": -7.127767562866211, "global_step": 183398, "epoch": 4366} {"train_loss": -7.253820419311523, "global_step": 183399, "epoch": 4366} {"train_loss": -7.235725402832031, "global_step": 183400, "epoch": 4366} {"train_loss": -7.305654048919678, "global_step": 183401, "epoch": 4366} {"train_loss": -7.150077819824219, "global_step": 183402, "epoch": 4366} {"train_loss": -7.071531295776367, "global_step": 183403, "epoch": 4366} {"train_loss": -7.177730560302734, "global_step": 183404, "epoch": 4366} {"train_loss": -7.211817741394043, "global_step": 183405, "epoch": 4366} {"train_loss": -7.07792854309082, "global_step": 183406, "epoch": 4366} {"train_loss": -6.998045444488525, "global_step": 183407, "epoch": 4366} {"train_loss": -7.142451286315918, "global_step": 183408, "epoch": 4366} {"train_loss": -7.100202560424805, "global_step": 183409, "epoch": 4366} {"train_loss": -7.144682884216309, "global_step": 183410, "epoch": 4366} {"train_loss": -7.132575988769531, "global_step": 183411, "epoch": 4366} {"train_loss": -7.028611660003662, "global_step": 183412, "epoch": 4366} {"train_loss": -7.159111897150676, "global_step": 183413, "epoch": 4366, "val_loss": 80546.3984375} {"train_loss": -7.103168487548828, "global_step": 183414, "epoch": 4367} {"train_loss": -7.208009719848633, "global_step": 183415, "epoch": 4367} {"train_loss": -7.145464897155762, "global_step": 183416, "epoch": 4367} {"train_loss": -7.108651161193848, "global_step": 183417, "epoch": 4367} {"train_loss": -7.156566619873047, "global_step": 183418, "epoch": 4367} {"train_loss": -7.079658508300781, "global_step": 183419, "epoch": 4367} {"train_loss": -7.176119327545166, "global_step": 183420, "epoch": 4367} {"train_loss": -7.116180419921875, "global_step": 183421, "epoch": 4367} {"train_loss": -7.1466145515441895, "global_step": 183422, "epoch": 4367} {"train_loss": -7.2407002449035645, "global_step": 183423, "epoch": 4367} {"train_loss": -7.235722541809082, "global_step": 183424, "epoch": 4367} {"train_loss": -7.25477933883667, "global_step": 183425, "epoch": 4367} {"train_loss": -7.128312587738037, "global_step": 183426, "epoch": 4367} {"train_loss": -7.202394485473633, "global_step": 183427, "epoch": 4367} {"train_loss": -7.254842758178711, "global_step": 183428, "epoch": 4367} {"train_loss": -7.099453449249268, "global_step": 183429, "epoch": 4367} {"train_loss": -7.263165473937988, "global_step": 183430, "epoch": 4367} {"train_loss": -7.299921035766602, "global_step": 183431, "epoch": 4367} {"train_loss": -7.156033992767334, "global_step": 183432, "epoch": 4367} {"train_loss": -7.1673583984375, "global_step": 183433, "epoch": 4367} {"train_loss": -7.200117588043213, "global_step": 183434, "epoch": 4367} {"train_loss": -7.201887607574463, "global_step": 183435, "epoch": 4367} {"train_loss": -7.202946662902832, "global_step": 183436, "epoch": 4367} {"train_loss": -7.1675238609313965, "global_step": 183437, "epoch": 4367} {"train_loss": -7.250953674316406, "global_step": 183438, "epoch": 4367} {"train_loss": -7.10021448135376, "global_step": 183439, "epoch": 4367} {"train_loss": -7.189825534820557, "global_step": 183440, "epoch": 4367} {"train_loss": -7.224925994873047, "global_step": 183441, "epoch": 4367} {"train_loss": -7.099379062652588, "global_step": 183442, "epoch": 4367} {"train_loss": -7.141927242279053, "global_step": 183443, "epoch": 4367} {"train_loss": -7.046277046203613, "global_step": 183444, "epoch": 4367} {"train_loss": -7.11595344543457, "global_step": 183445, "epoch": 4367} {"train_loss": -7.114086151123047, "global_step": 183446, "epoch": 4367} {"train_loss": -7.1046247482299805, "global_step": 183447, "epoch": 4367} {"train_loss": -6.976455211639404, "global_step": 183448, "epoch": 4367} {"train_loss": -7.266597747802734, "global_step": 183449, "epoch": 4367} {"train_loss": -7.108173370361328, "global_step": 183450, "epoch": 4367} {"train_loss": -7.082056999206543, "global_step": 183451, "epoch": 4367} {"train_loss": -7.1219401359558105, "global_step": 183452, "epoch": 4367} {"train_loss": -7.167509078979492, "global_step": 183453, "epoch": 4367} {"train_loss": -6.970580101013184, "global_step": 183454, "epoch": 4367} {"train_loss": -7.157551504316784, "global_step": 183455, "epoch": 4367, "val_loss": 80804.5546875} {"train_loss": -7.019099235534668, "global_step": 183456, "epoch": 4368} {"train_loss": -7.007028579711914, "global_step": 183457, "epoch": 4368} {"train_loss": -7.232031345367432, "global_step": 183458, "epoch": 4368} {"train_loss": -7.0146894454956055, "global_step": 183459, "epoch": 4368} {"train_loss": -7.000709056854248, "global_step": 183460, "epoch": 4368} {"train_loss": -7.195160865783691, "global_step": 183461, "epoch": 4368} {"train_loss": -7.111621379852295, "global_step": 183462, "epoch": 4368} {"train_loss": -7.114763259887695, "global_step": 183463, "epoch": 4368} {"train_loss": -7.018993377685547, "global_step": 183464, "epoch": 4368} {"train_loss": -7.067232131958008, "global_step": 183465, "epoch": 4368} {"train_loss": -7.158507347106934, "global_step": 183466, "epoch": 4368} {"train_loss": -6.94948673248291, "global_step": 183467, "epoch": 4368} {"train_loss": -7.126187324523926, "global_step": 183468, "epoch": 4368} {"train_loss": -7.056609153747559, "global_step": 183469, "epoch": 4368} {"train_loss": -7.088189125061035, "global_step": 183470, "epoch": 4368} {"train_loss": -7.231019973754883, "global_step": 183471, "epoch": 4368} {"train_loss": -7.238916397094727, "global_step": 183472, "epoch": 4368} {"train_loss": -7.024731159210205, "global_step": 183473, "epoch": 4368} {"train_loss": -7.112004280090332, "global_step": 183474, "epoch": 4368} {"train_loss": -7.147916793823242, "global_step": 183475, "epoch": 4368} {"train_loss": -6.9583001136779785, "global_step": 183476, "epoch": 4368} {"train_loss": -7.199376583099365, "global_step": 183477, "epoch": 4368} {"train_loss": -7.071635723114014, "global_step": 183478, "epoch": 4368} {"train_loss": -6.984421730041504, "global_step": 183479, "epoch": 4368} {"train_loss": -7.100332736968994, "global_step": 183480, "epoch": 4368} {"train_loss": -6.966965675354004, "global_step": 183481, "epoch": 4368} {"train_loss": -7.107064723968506, "global_step": 183482, "epoch": 4368} {"train_loss": -7.171658515930176, "global_step": 183483, "epoch": 4368} {"train_loss": -7.009550094604492, "global_step": 183484, "epoch": 4368} {"train_loss": -7.228127479553223, "global_step": 183485, "epoch": 4368} {"train_loss": -7.013164520263672, "global_step": 183486, "epoch": 4368} {"train_loss": -6.891124725341797, "global_step": 183487, "epoch": 4368} {"train_loss": -7.120750427246094, "global_step": 183488, "epoch": 4368} {"train_loss": -7.062662124633789, "global_step": 183489, "epoch": 4368} {"train_loss": -7.14950704574585, "global_step": 183490, "epoch": 4368} {"train_loss": -7.0567779541015625, "global_step": 183491, "epoch": 4368} {"train_loss": -7.067173957824707, "global_step": 183492, "epoch": 4368} {"train_loss": -7.112554550170898, "global_step": 183493, "epoch": 4368} {"train_loss": -6.990437984466553, "global_step": 183494, "epoch": 4368} {"train_loss": -7.230175018310547, "global_step": 183495, "epoch": 4368} {"train_loss": -6.921895980834961, "global_step": 183496, "epoch": 4368} {"train_loss": -7.080049707776024, "global_step": 183497, "epoch": 4368, "val_loss": 80358.9453125} {"train_loss": -7.016977787017822, "global_step": 183498, "epoch": 4369} {"train_loss": -7.139889717102051, "global_step": 183499, "epoch": 4369} {"train_loss": -7.121670722961426, "global_step": 183500, "epoch": 4369} {"train_loss": -7.13430118560791, "global_step": 183501, "epoch": 4369} {"train_loss": -7.188455581665039, "global_step": 183502, "epoch": 4369} {"train_loss": -7.00705623626709, "global_step": 183503, "epoch": 4369} {"train_loss": -7.148202896118164, "global_step": 183504, "epoch": 4369} {"train_loss": -7.138702392578125, "global_step": 183505, "epoch": 4369} {"train_loss": -7.142075538635254, "global_step": 183506, "epoch": 4369} {"train_loss": -7.141072750091553, "global_step": 183507, "epoch": 4369} {"train_loss": -7.116950035095215, "global_step": 183508, "epoch": 4369} {"train_loss": -7.2186384201049805, "global_step": 183509, "epoch": 4369} {"train_loss": -6.968932628631592, "global_step": 183510, "epoch": 4369} {"train_loss": -7.20298957824707, "global_step": 183511, "epoch": 4369} {"train_loss": -7.079675674438477, "global_step": 183512, "epoch": 4369} {"train_loss": -7.104702472686768, "global_step": 183513, "epoch": 4369} {"train_loss": -7.232234001159668, "global_step": 183514, "epoch": 4369} {"train_loss": -7.2462358474731445, "global_step": 183515, "epoch": 4369} {"train_loss": -7.181687355041504, "global_step": 183516, "epoch": 4369} {"train_loss": -7.219331741333008, "global_step": 183517, "epoch": 4369} {"train_loss": -7.194169044494629, "global_step": 183518, "epoch": 4369} {"train_loss": -7.194375038146973, "global_step": 183519, "epoch": 4369} {"train_loss": -7.300038814544678, "global_step": 183520, "epoch": 4369} {"train_loss": -7.182190418243408, "global_step": 183521, "epoch": 4369} {"train_loss": -7.112104415893555, "global_step": 183522, "epoch": 4369} {"train_loss": -7.2625956535339355, "global_step": 183523, "epoch": 4369} {"train_loss": -7.147029876708984, "global_step": 183524, "epoch": 4369} {"train_loss": -7.188148021697998, "global_step": 183525, "epoch": 4369} {"train_loss": -7.249939918518066, "global_step": 183526, "epoch": 4369} {"train_loss": -7.2343220710754395, "global_step": 183527, "epoch": 4369} {"train_loss": -7.109944820404053, "global_step": 183528, "epoch": 4369} {"train_loss": -7.268317222595215, "global_step": 183529, "epoch": 4369} {"train_loss": -7.176647186279297, "global_step": 183530, "epoch": 4369} {"train_loss": -7.234289169311523, "global_step": 183531, "epoch": 4369} {"train_loss": -7.204639434814453, "global_step": 183532, "epoch": 4369} {"train_loss": -7.147245407104492, "global_step": 183533, "epoch": 4369} {"train_loss": -7.143750190734863, "global_step": 183534, "epoch": 4369} {"train_loss": -7.183023452758789, "global_step": 183535, "epoch": 4369} {"train_loss": -7.100799083709717, "global_step": 183536, "epoch": 4369} {"train_loss": -7.119452953338623, "global_step": 183537, "epoch": 4369} {"train_loss": -7.1189680099487305, "global_step": 183538, "epoch": 4369} {"train_loss": -7.160754453568232, "global_step": 183539, "epoch": 4369, "val_loss": 80749.1640625} {"train_loss": -7.1522955894470215, "global_step": 183540, "epoch": 4370} {"train_loss": -7.225327014923096, "global_step": 183541, "epoch": 4370} {"train_loss": -7.221317291259766, "global_step": 183542, "epoch": 4370} {"train_loss": -7.039519786834717, "global_step": 183543, "epoch": 4370} {"train_loss": -7.2216949462890625, "global_step": 183544, "epoch": 4370} {"train_loss": -7.142997741699219, "global_step": 183545, "epoch": 4370} {"train_loss": -7.195394992828369, "global_step": 183546, "epoch": 4370} {"train_loss": -7.091100692749023, "global_step": 183547, "epoch": 4370} {"train_loss": -7.176163673400879, "global_step": 183548, "epoch": 4370} {"train_loss": -7.211573600769043, "global_step": 183549, "epoch": 4370} {"train_loss": -7.1680145263671875, "global_step": 183550, "epoch": 4370} {"train_loss": -7.166952133178711, "global_step": 183551, "epoch": 4370} {"train_loss": -7.1584320068359375, "global_step": 183552, "epoch": 4370} {"train_loss": -7.094822883605957, "global_step": 183553, "epoch": 4370} {"train_loss": -7.22702169418335, "global_step": 183554, "epoch": 4370} {"train_loss": -7.049106121063232, "global_step": 183555, "epoch": 4370} {"train_loss": -7.149413108825684, "global_step": 183556, "epoch": 4370} {"train_loss": -7.186285495758057, "global_step": 183557, "epoch": 4370} {"train_loss": -7.133387565612793, "global_step": 183558, "epoch": 4370} {"train_loss": -7.230804920196533, "global_step": 183559, "epoch": 4370} {"train_loss": -7.027776718139648, "global_step": 183560, "epoch": 4370} {"train_loss": -7.188990592956543, "global_step": 183561, "epoch": 4370} {"train_loss": -7.177607536315918, "global_step": 183562, "epoch": 4370} {"train_loss": -7.171318531036377, "global_step": 183563, "epoch": 4370} {"train_loss": -7.2792863845825195, "global_step": 183564, "epoch": 4370} {"train_loss": -7.087133884429932, "global_step": 183565, "epoch": 4370} {"train_loss": -7.156060218811035, "global_step": 183566, "epoch": 4370} {"train_loss": -7.352621555328369, "global_step": 183567, "epoch": 4370} {"train_loss": -7.248133659362793, "global_step": 183568, "epoch": 4370} {"train_loss": -7.315251350402832, "global_step": 183569, "epoch": 4370} {"train_loss": -7.275669574737549, "global_step": 183570, "epoch": 4370} {"train_loss": -7.224842071533203, "global_step": 183571, "epoch": 4370} {"train_loss": -7.126262664794922, "global_step": 183572, "epoch": 4370} {"train_loss": -7.184731483459473, "global_step": 183573, "epoch": 4370} {"train_loss": -7.157297611236572, "global_step": 183574, "epoch": 4370} {"train_loss": -7.282467842102051, "global_step": 183575, "epoch": 4370} {"train_loss": -7.315105438232422, "global_step": 183576, "epoch": 4370} {"train_loss": -7.185586452484131, "global_step": 183577, "epoch": 4370} {"train_loss": -7.32882022857666, "global_step": 183578, "epoch": 4370} {"train_loss": -7.254785060882568, "global_step": 183579, "epoch": 4370} {"train_loss": -7.317873001098633, "global_step": 183580, "epoch": 4370} {"train_loss": -7.19188506262643, "global_step": 183581, "epoch": 4370, "val_loss": 80529.5625} {"train_loss": -7.247375965118408, "global_step": 183582, "epoch": 4371} {"train_loss": -7.076240539550781, "global_step": 183583, "epoch": 4371} {"train_loss": -7.193987846374512, "global_step": 183584, "epoch": 4371} {"train_loss": -7.072110176086426, "global_step": 183585, "epoch": 4371} {"train_loss": -7.164544105529785, "global_step": 183586, "epoch": 4371} {"train_loss": -7.182655334472656, "global_step": 183587, "epoch": 4371} {"train_loss": -7.053307056427002, "global_step": 183588, "epoch": 4371} {"train_loss": -7.1640119552612305, "global_step": 183589, "epoch": 4371} {"train_loss": -7.218585014343262, "global_step": 183590, "epoch": 4371} {"train_loss": -7.216821670532227, "global_step": 183591, "epoch": 4371} {"train_loss": -7.170629024505615, "global_step": 183592, "epoch": 4371} {"train_loss": -7.086807727813721, "global_step": 183593, "epoch": 4371} {"train_loss": -7.282567024230957, "global_step": 183594, "epoch": 4371} {"train_loss": -7.091212272644043, "global_step": 183595, "epoch": 4371} {"train_loss": -7.043287754058838, "global_step": 183596, "epoch": 4371} {"train_loss": -7.089169502258301, "global_step": 183597, "epoch": 4371} {"train_loss": -7.1448163986206055, "global_step": 183598, "epoch": 4371} {"train_loss": -7.208244323730469, "global_step": 183599, "epoch": 4371} {"train_loss": -7.211376190185547, "global_step": 183600, "epoch": 4371} {"train_loss": -7.126782417297363, "global_step": 183601, "epoch": 4371} {"train_loss": -7.1439619064331055, "global_step": 183602, "epoch": 4371} {"train_loss": -7.19850492477417, "global_step": 183603, "epoch": 4371} {"train_loss": -7.083412170410156, "global_step": 183604, "epoch": 4371} {"train_loss": -7.198528289794922, "global_step": 183605, "epoch": 4371} {"train_loss": -7.142180919647217, "global_step": 183606, "epoch": 4371} {"train_loss": -7.152650833129883, "global_step": 183607, "epoch": 4371} {"train_loss": -7.264009952545166, "global_step": 183608, "epoch": 4371} {"train_loss": -7.202062606811523, "global_step": 183609, "epoch": 4371} {"train_loss": -7.164044380187988, "global_step": 183610, "epoch": 4371} {"train_loss": -7.183978080749512, "global_step": 183611, "epoch": 4371} {"train_loss": -7.272642612457275, "global_step": 183612, "epoch": 4371} {"train_loss": -7.240711688995361, "global_step": 183613, "epoch": 4371} {"train_loss": -7.01048469543457, "global_step": 183614, "epoch": 4371} {"train_loss": -7.308544158935547, "global_step": 183615, "epoch": 4371} {"train_loss": -7.23723840713501, "global_step": 183616, "epoch": 4371} {"train_loss": -7.089095115661621, "global_step": 183617, "epoch": 4371} {"train_loss": -7.054777145385742, "global_step": 183618, "epoch": 4371} {"train_loss": -7.154677867889404, "global_step": 183619, "epoch": 4371} {"train_loss": -7.2113728523254395, "global_step": 183620, "epoch": 4371} {"train_loss": -7.249063491821289, "global_step": 183621, "epoch": 4371} {"train_loss": -7.191061496734619, "global_step": 183622, "epoch": 4371} {"train_loss": -7.165286291213262, "global_step": 183623, "epoch": 4371, "val_loss": 80583.1875} {"train_loss": -7.18889045715332, "global_step": 183624, "epoch": 4372} {"train_loss": -7.222947120666504, "global_step": 183625, "epoch": 4372} {"train_loss": -7.3030595779418945, "global_step": 183626, "epoch": 4372} {"train_loss": -7.181888580322266, "global_step": 183627, "epoch": 4372} {"train_loss": -7.249577522277832, "global_step": 183628, "epoch": 4372} {"train_loss": -7.212891101837158, "global_step": 183629, "epoch": 4372} {"train_loss": -7.16790771484375, "global_step": 183630, "epoch": 4372} {"train_loss": -7.12650203704834, "global_step": 183631, "epoch": 4372} {"train_loss": -7.245963096618652, "global_step": 183632, "epoch": 4372} {"train_loss": -7.0947675704956055, "global_step": 183633, "epoch": 4372} {"train_loss": -6.89992618560791, "global_step": 183634, "epoch": 4372} {"train_loss": -7.141617774963379, "global_step": 183635, "epoch": 4372} {"train_loss": -6.923313140869141, "global_step": 183636, "epoch": 4372} {"train_loss": -7.017735004425049, "global_step": 183637, "epoch": 4372} {"train_loss": -6.95390510559082, "global_step": 183638, "epoch": 4372} {"train_loss": -6.9755144119262695, "global_step": 183639, "epoch": 4372} {"train_loss": -7.034945011138916, "global_step": 183640, "epoch": 4372} {"train_loss": -7.00990104675293, "global_step": 183641, "epoch": 4372} {"train_loss": -6.964796543121338, "global_step": 183642, "epoch": 4372} {"train_loss": -7.13576078414917, "global_step": 183643, "epoch": 4372} {"train_loss": -7.078402519226074, "global_step": 183644, "epoch": 4372} {"train_loss": -6.939177989959717, "global_step": 183645, "epoch": 4372} {"train_loss": -7.130856513977051, "global_step": 183646, "epoch": 4372} {"train_loss": -7.148007869720459, "global_step": 183647, "epoch": 4372} {"train_loss": -7.108211517333984, "global_step": 183648, "epoch": 4372} {"train_loss": -7.0803375244140625, "global_step": 183649, "epoch": 4372} {"train_loss": -7.150701522827148, "global_step": 183650, "epoch": 4372} {"train_loss": -7.099339485168457, "global_step": 183651, "epoch": 4372} {"train_loss": -7.082353591918945, "global_step": 183652, "epoch": 4372} {"train_loss": -7.127891540527344, "global_step": 183653, "epoch": 4372} {"train_loss": -7.291941165924072, "global_step": 183654, "epoch": 4372} {"train_loss": -7.095564842224121, "global_step": 183655, "epoch": 4372} {"train_loss": -7.206249713897705, "global_step": 183656, "epoch": 4372} {"train_loss": -7.130253791809082, "global_step": 183657, "epoch": 4372} {"train_loss": -7.1945414543151855, "global_step": 183658, "epoch": 4372} {"train_loss": -7.114386558532715, "global_step": 183659, "epoch": 4372} {"train_loss": -7.0892767906188965, "global_step": 183660, "epoch": 4372} {"train_loss": -7.2455220222473145, "global_step": 183661, "epoch": 4372} {"train_loss": -7.106701850891113, "global_step": 183662, "epoch": 4372} {"train_loss": -7.148141860961914, "global_step": 183663, "epoch": 4372} {"train_loss": -7.1382951736450195, "global_step": 183664, "epoch": 4372} {"train_loss": -7.115333057585216, "global_step": 183665, "epoch": 4372, "val_loss": 80635.109375} {"train_loss": -7.2835164070129395, "global_step": 183666, "epoch": 4373} {"train_loss": -7.107802391052246, "global_step": 183667, "epoch": 4373} {"train_loss": -7.264720916748047, "global_step": 183668, "epoch": 4373} {"train_loss": -7.219944953918457, "global_step": 183669, "epoch": 4373} {"train_loss": -7.238292694091797, "global_step": 183670, "epoch": 4373} {"train_loss": -7.158310413360596, "global_step": 183671, "epoch": 4373} {"train_loss": -7.146388053894043, "global_step": 183672, "epoch": 4373} {"train_loss": -7.156715393066406, "global_step": 183673, "epoch": 4373} {"train_loss": -7.063238620758057, "global_step": 183674, "epoch": 4373} {"train_loss": -7.197285175323486, "global_step": 183675, "epoch": 4373} {"train_loss": -7.3411054611206055, "global_step": 183676, "epoch": 4373} {"train_loss": -7.216727256774902, "global_step": 183677, "epoch": 4373} {"train_loss": -7.169196605682373, "global_step": 183678, "epoch": 4373} {"train_loss": -7.219972133636475, "global_step": 183679, "epoch": 4373} {"train_loss": -7.199460983276367, "global_step": 183680, "epoch": 4373} {"train_loss": -7.062952518463135, "global_step": 183681, "epoch": 4373} {"train_loss": -7.2671966552734375, "global_step": 183682, "epoch": 4373} {"train_loss": -7.231738090515137, "global_step": 183683, "epoch": 4373} {"train_loss": -7.246506214141846, "global_step": 183684, "epoch": 4373} {"train_loss": -7.324471473693848, "global_step": 183685, "epoch": 4373} {"train_loss": -7.189828872680664, "global_step": 183686, "epoch": 4373} {"train_loss": -7.184901237487793, "global_step": 183687, "epoch": 4373} {"train_loss": -7.161657810211182, "global_step": 183688, "epoch": 4373} {"train_loss": -7.211094856262207, "global_step": 183689, "epoch": 4373} {"train_loss": -7.056304931640625, "global_step": 183690, "epoch": 4373} {"train_loss": -7.17008113861084, "global_step": 183691, "epoch": 4373} {"train_loss": -7.194812774658203, "global_step": 183692, "epoch": 4373} {"train_loss": -7.13857364654541, "global_step": 183693, "epoch": 4373} {"train_loss": -7.178371906280518, "global_step": 183694, "epoch": 4373} {"train_loss": -7.062945365905762, "global_step": 183695, "epoch": 4373} {"train_loss": -7.2075581550598145, "global_step": 183696, "epoch": 4373} {"train_loss": -7.121497631072998, "global_step": 183697, "epoch": 4373} {"train_loss": -7.1538472175598145, "global_step": 183698, "epoch": 4373} {"train_loss": -7.06788444519043, "global_step": 183699, "epoch": 4373} {"train_loss": -7.080031394958496, "global_step": 183700, "epoch": 4373} {"train_loss": -7.08300256729126, "global_step": 183701, "epoch": 4373} {"train_loss": -7.206674575805664, "global_step": 183702, "epoch": 4373} {"train_loss": -7.026767730712891, "global_step": 183703, "epoch": 4373} {"train_loss": -7.10251522064209, "global_step": 183704, "epoch": 4373} {"train_loss": -7.042452812194824, "global_step": 183705, "epoch": 4373} {"train_loss": -7.112790107727051, "global_step": 183706, "epoch": 4373} {"train_loss": -7.165718158086141, "global_step": 183707, "epoch": 4373, "val_loss": 80713.4140625} {"train_loss": -7.161360740661621, "global_step": 183708, "epoch": 4374} {"train_loss": -7.131566047668457, "global_step": 183709, "epoch": 4374} {"train_loss": -7.218177795410156, "global_step": 183710, "epoch": 4374} {"train_loss": -7.154153823852539, "global_step": 183711, "epoch": 4374} {"train_loss": -6.991290092468262, "global_step": 183712, "epoch": 4374} {"train_loss": -7.196876525878906, "global_step": 183713, "epoch": 4374} {"train_loss": -7.009019374847412, "global_step": 183714, "epoch": 4374} {"train_loss": -7.209267616271973, "global_step": 183715, "epoch": 4374} {"train_loss": -7.086817741394043, "global_step": 183716, "epoch": 4374} {"train_loss": -7.061866283416748, "global_step": 183717, "epoch": 4374} {"train_loss": -7.026548385620117, "global_step": 183718, "epoch": 4374} {"train_loss": -7.087319374084473, "global_step": 183719, "epoch": 4374} {"train_loss": -7.220301628112793, "global_step": 183720, "epoch": 4374} {"train_loss": -6.999234676361084, "global_step": 183721, "epoch": 4374} {"train_loss": -7.146288871765137, "global_step": 183722, "epoch": 4374} {"train_loss": -7.136849403381348, "global_step": 183723, "epoch": 4374} {"train_loss": -7.161989212036133, "global_step": 183724, "epoch": 4374} {"train_loss": -7.235964775085449, "global_step": 183725, "epoch": 4374} {"train_loss": -7.2717180252075195, "global_step": 183726, "epoch": 4374} {"train_loss": -7.154882431030273, "global_step": 183727, "epoch": 4374} {"train_loss": -7.2043890953063965, "global_step": 183728, "epoch": 4374} {"train_loss": -7.259817600250244, "global_step": 183729, "epoch": 4374} {"train_loss": -7.21849250793457, "global_step": 183730, "epoch": 4374} {"train_loss": -7.27554988861084, "global_step": 183731, "epoch": 4374} {"train_loss": -7.289881706237793, "global_step": 183732, "epoch": 4374} {"train_loss": -7.252618789672852, "global_step": 183733, "epoch": 4374} {"train_loss": -7.307318687438965, "global_step": 183734, "epoch": 4374} {"train_loss": -7.137234210968018, "global_step": 183735, "epoch": 4374} {"train_loss": -7.168813228607178, "global_step": 183736, "epoch": 4374} {"train_loss": -7.2537055015563965, "global_step": 183737, "epoch": 4374} {"train_loss": -7.167575836181641, "global_step": 183738, "epoch": 4374} {"train_loss": -7.236595153808594, "global_step": 183739, "epoch": 4374} {"train_loss": -7.046670913696289, "global_step": 183740, "epoch": 4374} {"train_loss": -7.026337623596191, "global_step": 183741, "epoch": 4374} {"train_loss": -7.222749710083008, "global_step": 183742, "epoch": 4374} {"train_loss": -7.133975982666016, "global_step": 183743, "epoch": 4374} {"train_loss": -7.2268218994140625, "global_step": 183744, "epoch": 4374} {"train_loss": -7.20725154876709, "global_step": 183745, "epoch": 4374} {"train_loss": -7.023184776306152, "global_step": 183746, "epoch": 4374} {"train_loss": -7.115621566772461, "global_step": 183747, "epoch": 4374} {"train_loss": -7.164388656616211, "global_step": 183748, "epoch": 4374} {"train_loss": -7.161250443685622, "global_step": 183749, "epoch": 4374, "val_loss": 80644.421875} {"train_loss": -7.273301124572754, "global_step": 183750, "epoch": 4375} {"train_loss": -7.147486209869385, "global_step": 183751, "epoch": 4375} {"train_loss": -7.273456573486328, "global_step": 183752, "epoch": 4375} {"train_loss": -7.27774715423584, "global_step": 183753, "epoch": 4375} {"train_loss": -7.20642614364624, "global_step": 183754, "epoch": 4375} {"train_loss": -7.18773078918457, "global_step": 183755, "epoch": 4375} {"train_loss": -7.150852680206299, "global_step": 183756, "epoch": 4375} {"train_loss": -7.039650917053223, "global_step": 183757, "epoch": 4375} {"train_loss": -7.149042129516602, "global_step": 183758, "epoch": 4375} {"train_loss": -7.180392265319824, "global_step": 183759, "epoch": 4375} {"train_loss": -7.142068386077881, "global_step": 183760, "epoch": 4375} {"train_loss": -7.1178998947143555, "global_step": 183761, "epoch": 4375} {"train_loss": -7.193903923034668, "global_step": 183762, "epoch": 4375} {"train_loss": -7.103332996368408, "global_step": 183763, "epoch": 4375} {"train_loss": -7.144950866699219, "global_step": 183764, "epoch": 4375} {"train_loss": -7.214122772216797, "global_step": 183765, "epoch": 4375} {"train_loss": -7.054648399353027, "global_step": 183766, "epoch": 4375} {"train_loss": -6.996438980102539, "global_step": 183767, "epoch": 4375} {"train_loss": -7.066814422607422, "global_step": 183768, "epoch": 4375} {"train_loss": -7.275815963745117, "global_step": 183769, "epoch": 4375} {"train_loss": -7.110747814178467, "global_step": 183770, "epoch": 4375} {"train_loss": -6.934666633605957, "global_step": 183771, "epoch": 4375} {"train_loss": -7.155083179473877, "global_step": 183772, "epoch": 4375} {"train_loss": -7.138901233673096, "global_step": 183773, "epoch": 4375} {"train_loss": -7.041065216064453, "global_step": 183774, "epoch": 4375} {"train_loss": -7.183199882507324, "global_step": 183775, "epoch": 4375} {"train_loss": -6.942938804626465, "global_step": 183776, "epoch": 4375} {"train_loss": -7.21953010559082, "global_step": 183777, "epoch": 4375} {"train_loss": -7.075911045074463, "global_step": 183778, "epoch": 4375} {"train_loss": -7.155860900878906, "global_step": 183779, "epoch": 4375} {"train_loss": -6.986401557922363, "global_step": 183780, "epoch": 4375} {"train_loss": -6.934155464172363, "global_step": 183781, "epoch": 4375} {"train_loss": -7.088772773742676, "global_step": 183782, "epoch": 4375} {"train_loss": -6.986116886138916, "global_step": 183783, "epoch": 4375} {"train_loss": -7.139505386352539, "global_step": 183784, "epoch": 4375} {"train_loss": -6.970775604248047, "global_step": 183785, "epoch": 4375} {"train_loss": -7.015873908996582, "global_step": 183786, "epoch": 4375} {"train_loss": -6.913804054260254, "global_step": 183787, "epoch": 4375} {"train_loss": -7.111249923706055, "global_step": 183788, "epoch": 4375} {"train_loss": -6.967684745788574, "global_step": 183789, "epoch": 4375} {"train_loss": -6.940428256988525, "global_step": 183790, "epoch": 4375} {"train_loss": -7.098901056108021, "global_step": 183791, "epoch": 4375, "val_loss": 80835.125} {"train_loss": -6.9167680740356445, "global_step": 183792, "epoch": 4376} {"train_loss": -7.07194709777832, "global_step": 183793, "epoch": 4376} {"train_loss": -7.070800304412842, "global_step": 183794, "epoch": 4376} {"train_loss": -7.024292469024658, "global_step": 183795, "epoch": 4376} {"train_loss": -7.004231929779053, "global_step": 183796, "epoch": 4376} {"train_loss": -7.178753852844238, "global_step": 183797, "epoch": 4376} {"train_loss": -7.027713775634766, "global_step": 183798, "epoch": 4376} {"train_loss": -7.090177536010742, "global_step": 183799, "epoch": 4376} {"train_loss": -7.076652526855469, "global_step": 183800, "epoch": 4376} {"train_loss": -7.069915771484375, "global_step": 183801, "epoch": 4376} {"train_loss": -6.981996059417725, "global_step": 183802, "epoch": 4376} {"train_loss": -7.225826740264893, "global_step": 183803, "epoch": 4376} {"train_loss": -7.072333335876465, "global_step": 183804, "epoch": 4376} {"train_loss": -7.177802562713623, "global_step": 183805, "epoch": 4376} {"train_loss": -7.113802909851074, "global_step": 183806, "epoch": 4376} {"train_loss": -7.254878044128418, "global_step": 183807, "epoch": 4376} {"train_loss": -7.151575088500977, "global_step": 183808, "epoch": 4376} {"train_loss": -7.169886112213135, "global_step": 183809, "epoch": 4376} {"train_loss": -7.152276039123535, "global_step": 183810, "epoch": 4376} {"train_loss": -7.124243259429932, "global_step": 183811, "epoch": 4376} {"train_loss": -7.175598621368408, "global_step": 183812, "epoch": 4376} {"train_loss": -7.316621780395508, "global_step": 183813, "epoch": 4376} {"train_loss": -7.218925476074219, "global_step": 183814, "epoch": 4376} {"train_loss": -7.101184844970703, "global_step": 183815, "epoch": 4376} {"train_loss": -7.150417327880859, "global_step": 183816, "epoch": 4376} {"train_loss": -7.1256608963012695, "global_step": 183817, "epoch": 4376} {"train_loss": -7.188272476196289, "global_step": 183818, "epoch": 4376} {"train_loss": -7.313590049743652, "global_step": 183819, "epoch": 4376} {"train_loss": -7.19894552230835, "global_step": 183820, "epoch": 4376} {"train_loss": -7.139680862426758, "global_step": 183821, "epoch": 4376} {"train_loss": -7.1389617919921875, "global_step": 183822, "epoch": 4376} {"train_loss": -7.137698173522949, "global_step": 183823, "epoch": 4376} {"train_loss": -7.120533466339111, "global_step": 183824, "epoch": 4376} {"train_loss": -7.269770622253418, "global_step": 183825, "epoch": 4376} {"train_loss": -7.108022689819336, "global_step": 183826, "epoch": 4376} {"train_loss": -7.1558308601379395, "global_step": 183827, "epoch": 4376} {"train_loss": -7.208327293395996, "global_step": 183828, "epoch": 4376} {"train_loss": -7.233355522155762, "global_step": 183829, "epoch": 4376} {"train_loss": -7.278897285461426, "global_step": 183830, "epoch": 4376} {"train_loss": -7.099301338195801, "global_step": 183831, "epoch": 4376} {"train_loss": -7.078386306762695, "global_step": 183832, "epoch": 4376} {"train_loss": -7.139812844140189, "global_step": 183833, "epoch": 4376, "val_loss": 80705.9921875} {"train_loss": -7.1661577224731445, "global_step": 183834, "epoch": 4377} {"train_loss": -7.266668319702148, "global_step": 183835, "epoch": 4377} {"train_loss": -7.1608476638793945, "global_step": 183836, "epoch": 4377} {"train_loss": -7.1549072265625, "global_step": 183837, "epoch": 4377} {"train_loss": -7.1760711669921875, "global_step": 183838, "epoch": 4377} {"train_loss": -7.172259330749512, "global_step": 183839, "epoch": 4377} {"train_loss": -7.085737228393555, "global_step": 183840, "epoch": 4377} {"train_loss": -7.273326873779297, "global_step": 183841, "epoch": 4377} {"train_loss": -7.106278419494629, "global_step": 183842, "epoch": 4377} {"train_loss": -7.249135971069336, "global_step": 183843, "epoch": 4377} {"train_loss": -7.21182918548584, "global_step": 183844, "epoch": 4377} {"train_loss": -7.142193794250488, "global_step": 183845, "epoch": 4377} {"train_loss": -7.213481903076172, "global_step": 183846, "epoch": 4377} {"train_loss": -7.25999116897583, "global_step": 183847, "epoch": 4377} {"train_loss": -7.11286735534668, "global_step": 183848, "epoch": 4377} {"train_loss": -7.187945365905762, "global_step": 183849, "epoch": 4377} {"train_loss": -7.2313761711120605, "global_step": 183850, "epoch": 4377} {"train_loss": -7.1929931640625, "global_step": 183851, "epoch": 4377} {"train_loss": -7.23963737487793, "global_step": 183852, "epoch": 4377} {"train_loss": -7.236408710479736, "global_step": 183853, "epoch": 4377} {"train_loss": -7.156888961791992, "global_step": 183854, "epoch": 4377} {"train_loss": -7.125086784362793, "global_step": 183855, "epoch": 4377} {"train_loss": -7.264203071594238, "global_step": 183856, "epoch": 4377} {"train_loss": -7.162072658538818, "global_step": 183857, "epoch": 4377} {"train_loss": -7.272075176239014, "global_step": 183858, "epoch": 4377} {"train_loss": -7.1599531173706055, "global_step": 183859, "epoch": 4377} {"train_loss": -7.255077362060547, "global_step": 183860, "epoch": 4377} {"train_loss": -7.0375542640686035, "global_step": 183861, "epoch": 4377} {"train_loss": -7.186161041259766, "global_step": 183862, "epoch": 4377} {"train_loss": -7.166045188903809, "global_step": 183863, "epoch": 4377} {"train_loss": -7.15805196762085, "global_step": 183864, "epoch": 4377} {"train_loss": -7.170103073120117, "global_step": 183865, "epoch": 4377} {"train_loss": -7.16377592086792, "global_step": 183866, "epoch": 4377} {"train_loss": -7.094074249267578, "global_step": 183867, "epoch": 4377} {"train_loss": -7.222907066345215, "global_step": 183868, "epoch": 4377} {"train_loss": -7.226376533508301, "global_step": 183869, "epoch": 4377} {"train_loss": -7.14198112487793, "global_step": 183870, "epoch": 4377} {"train_loss": -7.1291584968566895, "global_step": 183871, "epoch": 4377} {"train_loss": -7.054349899291992, "global_step": 183872, "epoch": 4377} {"train_loss": -7.236840724945068, "global_step": 183873, "epoch": 4377} {"train_loss": -7.0021209716796875, "global_step": 183874, "epoch": 4377} {"train_loss": -7.174773011888776, "global_step": 183875, "epoch": 4377, "val_loss": 80589.5390625} {"train_loss": -7.206419944763184, "global_step": 183876, "epoch": 4378} {"train_loss": -7.156098365783691, "global_step": 183877, "epoch": 4378} {"train_loss": -7.129657745361328, "global_step": 183878, "epoch": 4378} {"train_loss": -7.147015571594238, "global_step": 183879, "epoch": 4378} {"train_loss": -7.113449573516846, "global_step": 183880, "epoch": 4378} {"train_loss": -7.229389667510986, "global_step": 183881, "epoch": 4378} {"train_loss": -7.119560718536377, "global_step": 183882, "epoch": 4378} {"train_loss": -7.260124206542969, "global_step": 183883, "epoch": 4378} {"train_loss": -7.132101058959961, "global_step": 183884, "epoch": 4378} {"train_loss": -7.168513298034668, "global_step": 183885, "epoch": 4378} {"train_loss": -7.164895057678223, "global_step": 183886, "epoch": 4378} {"train_loss": -7.257943153381348, "global_step": 183887, "epoch": 4378} {"train_loss": -7.245893478393555, "global_step": 183888, "epoch": 4378} {"train_loss": -7.217778205871582, "global_step": 183889, "epoch": 4378} {"train_loss": -7.234101295471191, "global_step": 183890, "epoch": 4378} {"train_loss": -7.1541643142700195, "global_step": 183891, "epoch": 4378} {"train_loss": -7.192909240722656, "global_step": 183892, "epoch": 4378} {"train_loss": -7.309853553771973, "global_step": 183893, "epoch": 4378} {"train_loss": -7.232937812805176, "global_step": 183894, "epoch": 4378} {"train_loss": -7.286598205566406, "global_step": 183895, "epoch": 4378} {"train_loss": -7.142168998718262, "global_step": 183896, "epoch": 4378} {"train_loss": -7.123773574829102, "global_step": 183897, "epoch": 4378} {"train_loss": -7.204717636108398, "global_step": 183898, "epoch": 4378} {"train_loss": -7.173712253570557, "global_step": 183899, "epoch": 4378} {"train_loss": -7.180268287658691, "global_step": 183900, "epoch": 4378} {"train_loss": -7.1346211433410645, "global_step": 183901, "epoch": 4378} {"train_loss": -7.211857318878174, "global_step": 183902, "epoch": 4378} {"train_loss": -7.147119998931885, "global_step": 183903, "epoch": 4378} {"train_loss": -7.211609840393066, "global_step": 183904, "epoch": 4378} {"train_loss": -7.103489875793457, "global_step": 183905, "epoch": 4378} {"train_loss": -7.105727195739746, "global_step": 183906, "epoch": 4378} {"train_loss": -7.223575592041016, "global_step": 183907, "epoch": 4378} {"train_loss": -7.1436357498168945, "global_step": 183908, "epoch": 4378} {"train_loss": -7.163432598114014, "global_step": 183909, "epoch": 4378} {"train_loss": -7.2376322746276855, "global_step": 183910, "epoch": 4378} {"train_loss": -7.091676235198975, "global_step": 183911, "epoch": 4378} {"train_loss": -7.2030463218688965, "global_step": 183912, "epoch": 4378} {"train_loss": -7.2675933837890625, "global_step": 183913, "epoch": 4378} {"train_loss": -7.056131362915039, "global_step": 183914, "epoch": 4378} {"train_loss": -7.20925235748291, "global_step": 183915, "epoch": 4378} {"train_loss": -7.171844959259033, "global_step": 183916, "epoch": 4378} {"train_loss": -7.181049346923828, "global_step": 183917, "epoch": 4378, "val_loss": 80578.0390625} {"train_loss": -7.201230049133301, "global_step": 183918, "epoch": 4379} {"train_loss": -7.343782424926758, "global_step": 183919, "epoch": 4379} {"train_loss": -7.128870010375977, "global_step": 183920, "epoch": 4379} {"train_loss": -7.180451393127441, "global_step": 183921, "epoch": 4379} {"train_loss": -7.102745056152344, "global_step": 183922, "epoch": 4379} {"train_loss": -7.164703369140625, "global_step": 183923, "epoch": 4379} {"train_loss": -7.2681779861450195, "global_step": 183924, "epoch": 4379} {"train_loss": -7.193732738494873, "global_step": 183925, "epoch": 4379} {"train_loss": -7.212892532348633, "global_step": 183926, "epoch": 4379} {"train_loss": -7.234921455383301, "global_step": 183927, "epoch": 4379} {"train_loss": -7.1793293952941895, "global_step": 183928, "epoch": 4379} {"train_loss": -7.195195198059082, "global_step": 183929, "epoch": 4379} {"train_loss": -7.1085920333862305, "global_step": 183930, "epoch": 4379} {"train_loss": -7.092700958251953, "global_step": 183931, "epoch": 4379} {"train_loss": -7.23837947845459, "global_step": 183932, "epoch": 4379} {"train_loss": -7.103669166564941, "global_step": 183933, "epoch": 4379} {"train_loss": -7.199735641479492, "global_step": 183934, "epoch": 4379} {"train_loss": -7.190793037414551, "global_step": 183935, "epoch": 4379} {"train_loss": -7.153088092803955, "global_step": 183936, "epoch": 4379} {"train_loss": -7.146608829498291, "global_step": 183937, "epoch": 4379} {"train_loss": -7.218328952789307, "global_step": 183938, "epoch": 4379} {"train_loss": -6.879871368408203, "global_step": 183939, "epoch": 4379} {"train_loss": -7.179901123046875, "global_step": 183940, "epoch": 4379} {"train_loss": -7.173233985900879, "global_step": 183941, "epoch": 4379} {"train_loss": -7.108768939971924, "global_step": 183942, "epoch": 4379} {"train_loss": -7.209026336669922, "global_step": 183943, "epoch": 4379} {"train_loss": -7.116485595703125, "global_step": 183944, "epoch": 4379} {"train_loss": -7.0753679275512695, "global_step": 183945, "epoch": 4379} {"train_loss": -7.141557216644287, "global_step": 183946, "epoch": 4379} {"train_loss": -7.123560905456543, "global_step": 183947, "epoch": 4379} {"train_loss": -7.0779008865356445, "global_step": 183948, "epoch": 4379} {"train_loss": -6.896234512329102, "global_step": 183949, "epoch": 4379} {"train_loss": -7.104658603668213, "global_step": 183950, "epoch": 4379} {"train_loss": -6.9272871017456055, "global_step": 183951, "epoch": 4379} {"train_loss": -6.878928184509277, "global_step": 183952, "epoch": 4379} {"train_loss": -6.929144382476807, "global_step": 183953, "epoch": 4379} {"train_loss": -6.846179962158203, "global_step": 183954, "epoch": 4379} {"train_loss": -7.217890739440918, "global_step": 183955, "epoch": 4379} {"train_loss": -6.992395401000977, "global_step": 183956, "epoch": 4379} {"train_loss": -7.180517673492432, "global_step": 183957, "epoch": 4379} {"train_loss": -7.024477005004883, "global_step": 183958, "epoch": 4379} {"train_loss": -7.119955710002354, "global_step": 183959, "epoch": 4379, "val_loss": 80767.078125} {"train_loss": -7.097904205322266, "global_step": 183960, "epoch": 4380} {"train_loss": -7.120245933532715, "global_step": 183961, "epoch": 4380} {"train_loss": -7.128793716430664, "global_step": 183962, "epoch": 4380} {"train_loss": -6.96019172668457, "global_step": 183963, "epoch": 4380} {"train_loss": -7.111450672149658, "global_step": 183964, "epoch": 4380} {"train_loss": -6.990785598754883, "global_step": 183965, "epoch": 4380} {"train_loss": -7.238999843597412, "global_step": 183966, "epoch": 4380} {"train_loss": -6.899375915527344, "global_step": 183967, "epoch": 4380} {"train_loss": -7.058258056640625, "global_step": 183968, "epoch": 4380} {"train_loss": -6.983529567718506, "global_step": 183969, "epoch": 4380} {"train_loss": -7.077476978302002, "global_step": 183970, "epoch": 4380} {"train_loss": -7.056936740875244, "global_step": 183971, "epoch": 4380} {"train_loss": -7.042938232421875, "global_step": 183972, "epoch": 4380} {"train_loss": -7.2063140869140625, "global_step": 183973, "epoch": 4380} {"train_loss": -7.016331195831299, "global_step": 183974, "epoch": 4380} {"train_loss": -7.062690734863281, "global_step": 183975, "epoch": 4380} {"train_loss": -7.116745948791504, "global_step": 183976, "epoch": 4380} {"train_loss": -6.979351043701172, "global_step": 183977, "epoch": 4380} {"train_loss": -7.053069114685059, "global_step": 183978, "epoch": 4380} {"train_loss": -7.070143222808838, "global_step": 183979, "epoch": 4380} {"train_loss": -7.021777153015137, "global_step": 183980, "epoch": 4380} {"train_loss": -7.034946441650391, "global_step": 183981, "epoch": 4380} {"train_loss": -6.822445869445801, "global_step": 183982, "epoch": 4380} {"train_loss": -7.19109582901001, "global_step": 183983, "epoch": 4380} {"train_loss": -6.985888481140137, "global_step": 183984, "epoch": 4380} {"train_loss": -6.95481014251709, "global_step": 183985, "epoch": 4380} {"train_loss": -7.117428779602051, "global_step": 183986, "epoch": 4380} {"train_loss": -6.749647617340088, "global_step": 183987, "epoch": 4380} {"train_loss": -7.158027648925781, "global_step": 183988, "epoch": 4380} {"train_loss": -6.908454895019531, "global_step": 183989, "epoch": 4380} {"train_loss": -7.015057563781738, "global_step": 183990, "epoch": 4380} {"train_loss": -7.075777530670166, "global_step": 183991, "epoch": 4380} {"train_loss": -7.0144195556640625, "global_step": 183992, "epoch": 4380} {"train_loss": -6.994540214538574, "global_step": 183993, "epoch": 4380} {"train_loss": -7.148110389709473, "global_step": 183994, "epoch": 4380} {"train_loss": -7.007157325744629, "global_step": 183995, "epoch": 4380} {"train_loss": -7.103508472442627, "global_step": 183996, "epoch": 4380} {"train_loss": -7.143528938293457, "global_step": 183997, "epoch": 4380} {"train_loss": -7.067957401275635, "global_step": 183998, "epoch": 4380} {"train_loss": -7.105160713195801, "global_step": 183999, "epoch": 4380} {"train_loss": -6.985926151275635, "global_step": 184000, "epoch": 4380} {"train_loss": -7.049022436141968, "global_step": 184001, "epoch": 4380, "val_loss": 80813.9453125} {"train_loss": -7.125027656555176, "global_step": 184002, "epoch": 4381} {"train_loss": -7.095677375793457, "global_step": 184003, "epoch": 4381} {"train_loss": -7.145276069641113, "global_step": 184004, "epoch": 4381} {"train_loss": -7.227472305297852, "global_step": 184005, "epoch": 4381} {"train_loss": -7.084103584289551, "global_step": 184006, "epoch": 4381} {"train_loss": -7.206887245178223, "global_step": 184007, "epoch": 4381} {"train_loss": -7.1403093338012695, "global_step": 184008, "epoch": 4381} {"train_loss": -7.132284641265869, "global_step": 184009, "epoch": 4381} {"train_loss": -7.148628234863281, "global_step": 184010, "epoch": 4381} {"train_loss": -7.123657703399658, "global_step": 184011, "epoch": 4381} {"train_loss": -7.2545247077941895, "global_step": 184012, "epoch": 4381} {"train_loss": -7.049625396728516, "global_step": 184013, "epoch": 4381} {"train_loss": -7.116397857666016, "global_step": 184014, "epoch": 4381} {"train_loss": -7.121445655822754, "global_step": 184015, "epoch": 4381} {"train_loss": -7.120604991912842, "global_step": 184016, "epoch": 4381} {"train_loss": -7.0883002281188965, "global_step": 184017, "epoch": 4381} {"train_loss": -7.046596527099609, "global_step": 184018, "epoch": 4381} {"train_loss": -7.160552978515625, "global_step": 184019, "epoch": 4381} {"train_loss": -7.2822980880737305, "global_step": 184020, "epoch": 4381} {"train_loss": -7.092202663421631, "global_step": 184021, "epoch": 4381} {"train_loss": -7.110088348388672, "global_step": 184022, "epoch": 4381} {"train_loss": -7.211561679840088, "global_step": 184023, "epoch": 4381} {"train_loss": -7.221419334411621, "global_step": 184024, "epoch": 4381} {"train_loss": -7.072955131530762, "global_step": 184025, "epoch": 4381} {"train_loss": -7.117288589477539, "global_step": 184026, "epoch": 4381} {"train_loss": -7.159657001495361, "global_step": 184027, "epoch": 4381} {"train_loss": -7.196523189544678, "global_step": 184028, "epoch": 4381} {"train_loss": -7.197474479675293, "global_step": 184029, "epoch": 4381} {"train_loss": -7.129118919372559, "global_step": 184030, "epoch": 4381} {"train_loss": -7.139782905578613, "global_step": 184031, "epoch": 4381} {"train_loss": -7.076582908630371, "global_step": 184032, "epoch": 4381} {"train_loss": -7.241103172302246, "global_step": 184033, "epoch": 4381} {"train_loss": -7.224061012268066, "global_step": 184034, "epoch": 4381} {"train_loss": -7.215896129608154, "global_step": 184035, "epoch": 4381} {"train_loss": -7.221671104431152, "global_step": 184036, "epoch": 4381} {"train_loss": -7.208824634552002, "global_step": 184037, "epoch": 4381} {"train_loss": -7.151144027709961, "global_step": 184038, "epoch": 4381} {"train_loss": -7.084207057952881, "global_step": 184039, "epoch": 4381} {"train_loss": -7.202291488647461, "global_step": 184040, "epoch": 4381} {"train_loss": -7.050886154174805, "global_step": 184041, "epoch": 4381} {"train_loss": -7.18290376663208, "global_step": 184042, "epoch": 4381} {"train_loss": -7.150786592846825, "global_step": 184043, "epoch": 4381, "val_loss": 80477.2734375} {"train_loss": -7.1983842849731445, "global_step": 184044, "epoch": 4382} {"train_loss": -7.144112586975098, "global_step": 184045, "epoch": 4382} {"train_loss": -7.146026134490967, "global_step": 184046, "epoch": 4382} {"train_loss": -7.2258501052856445, "global_step": 184047, "epoch": 4382} {"train_loss": -7.188684463500977, "global_step": 184048, "epoch": 4382} {"train_loss": -7.18611478805542, "global_step": 184049, "epoch": 4382} {"train_loss": -7.135796070098877, "global_step": 184050, "epoch": 4382} {"train_loss": -7.195962905883789, "global_step": 184051, "epoch": 4382} {"train_loss": -7.194461345672607, "global_step": 184052, "epoch": 4382} {"train_loss": -7.164360046386719, "global_step": 184053, "epoch": 4382} {"train_loss": -7.256705284118652, "global_step": 184054, "epoch": 4382} {"train_loss": -7.248776435852051, "global_step": 184055, "epoch": 4382} {"train_loss": -7.217623710632324, "global_step": 184056, "epoch": 4382} {"train_loss": -7.235139846801758, "global_step": 184057, "epoch": 4382} {"train_loss": -7.300406455993652, "global_step": 184058, "epoch": 4382} {"train_loss": -7.2344970703125, "global_step": 184059, "epoch": 4382} {"train_loss": -7.212315559387207, "global_step": 184060, "epoch": 4382} {"train_loss": -7.077190399169922, "global_step": 184061, "epoch": 4382} {"train_loss": -7.207846641540527, "global_step": 184062, "epoch": 4382} {"train_loss": -7.131163597106934, "global_step": 184063, "epoch": 4382} {"train_loss": -7.164734840393066, "global_step": 184064, "epoch": 4382} {"train_loss": -7.266098976135254, "global_step": 184065, "epoch": 4382} {"train_loss": -7.183788299560547, "global_step": 184066, "epoch": 4382} {"train_loss": -7.172689437866211, "global_step": 184067, "epoch": 4382} {"train_loss": -7.227738857269287, "global_step": 184068, "epoch": 4382} {"train_loss": -7.1759796142578125, "global_step": 184069, "epoch": 4382} {"train_loss": -7.201842308044434, "global_step": 184070, "epoch": 4382} {"train_loss": -7.3035054206848145, "global_step": 184071, "epoch": 4382} {"train_loss": -7.173332214355469, "global_step": 184072, "epoch": 4382} {"train_loss": -7.106230735778809, "global_step": 184073, "epoch": 4382} {"train_loss": -7.1629958152771, "global_step": 184074, "epoch": 4382} {"train_loss": -7.174783229827881, "global_step": 184075, "epoch": 4382} {"train_loss": -7.1836018562316895, "global_step": 184076, "epoch": 4382} {"train_loss": -7.218452453613281, "global_step": 184077, "epoch": 4382} {"train_loss": -7.235544204711914, "global_step": 184078, "epoch": 4382} {"train_loss": -7.141373634338379, "global_step": 184079, "epoch": 4382} {"train_loss": -7.268505096435547, "global_step": 184080, "epoch": 4382} {"train_loss": -7.271760940551758, "global_step": 184081, "epoch": 4382} {"train_loss": -7.192231178283691, "global_step": 184082, "epoch": 4382} {"train_loss": -7.241281986236572, "global_step": 184083, "epoch": 4382} {"train_loss": -7.257574081420898, "global_step": 184084, "epoch": 4382} {"train_loss": -7.1953999655587335, "global_step": 184085, "epoch": 4382, "val_loss": 80597.4140625} {"train_loss": -7.238128662109375, "global_step": 184086, "epoch": 4383} {"train_loss": -7.182884216308594, "global_step": 184087, "epoch": 4383} {"train_loss": -7.126887321472168, "global_step": 184088, "epoch": 4383} {"train_loss": -7.224328994750977, "global_step": 184089, "epoch": 4383} {"train_loss": -7.204665184020996, "global_step": 184090, "epoch": 4383} {"train_loss": -7.067902565002441, "global_step": 184091, "epoch": 4383} {"train_loss": -7.314282417297363, "global_step": 184092, "epoch": 4383} {"train_loss": -7.281805038452148, "global_step": 184093, "epoch": 4383} {"train_loss": -7.212198734283447, "global_step": 184094, "epoch": 4383} {"train_loss": -7.257246971130371, "global_step": 184095, "epoch": 4383} {"train_loss": -7.173295497894287, "global_step": 184096, "epoch": 4383} {"train_loss": -7.1703386306762695, "global_step": 184097, "epoch": 4383} {"train_loss": -7.171201705932617, "global_step": 184098, "epoch": 4383} {"train_loss": -7.335333347320557, "global_step": 184099, "epoch": 4383} {"train_loss": -7.159575939178467, "global_step": 184100, "epoch": 4383} {"train_loss": -7.261105537414551, "global_step": 184101, "epoch": 4383} {"train_loss": -7.183090686798096, "global_step": 184102, "epoch": 4383} {"train_loss": -7.26421594619751, "global_step": 184103, "epoch": 4383} {"train_loss": -7.072052001953125, "global_step": 184104, "epoch": 4383} {"train_loss": -7.040972709655762, "global_step": 184105, "epoch": 4383} {"train_loss": -7.157122611999512, "global_step": 184106, "epoch": 4383} {"train_loss": -7.171054840087891, "global_step": 184107, "epoch": 4383} {"train_loss": -7.054267883300781, "global_step": 184108, "epoch": 4383} {"train_loss": -7.217184543609619, "global_step": 184109, "epoch": 4383} {"train_loss": -7.076285362243652, "global_step": 184110, "epoch": 4383} {"train_loss": -7.11817741394043, "global_step": 184111, "epoch": 4383} {"train_loss": -7.133863925933838, "global_step": 184112, "epoch": 4383} {"train_loss": -7.182920455932617, "global_step": 184113, "epoch": 4383} {"train_loss": -7.078358173370361, "global_step": 184114, "epoch": 4383} {"train_loss": -7.125478744506836, "global_step": 184115, "epoch": 4383} {"train_loss": -7.259092330932617, "global_step": 184116, "epoch": 4383} {"train_loss": -7.110844135284424, "global_step": 184117, "epoch": 4383} {"train_loss": -7.034543037414551, "global_step": 184118, "epoch": 4383} {"train_loss": -7.205618858337402, "global_step": 184119, "epoch": 4383} {"train_loss": -7.234642028808594, "global_step": 184120, "epoch": 4383} {"train_loss": -7.045464515686035, "global_step": 184121, "epoch": 4383} {"train_loss": -7.213523864746094, "global_step": 184122, "epoch": 4383} {"train_loss": -7.278956890106201, "global_step": 184123, "epoch": 4383} {"train_loss": -7.025330066680908, "global_step": 184124, "epoch": 4383} {"train_loss": -7.0715742111206055, "global_step": 184125, "epoch": 4383} {"train_loss": -7.0720295906066895, "global_step": 184126, "epoch": 4383} {"train_loss": -7.16328087307158, "global_step": 184127, "epoch": 4383, "val_loss": 80976.1328125} {"train_loss": -7.146981716156006, "global_step": 184128, "epoch": 4384} {"train_loss": -7.169567108154297, "global_step": 184129, "epoch": 4384} {"train_loss": -7.149293422698975, "global_step": 184130, "epoch": 4384} {"train_loss": -7.047260284423828, "global_step": 184131, "epoch": 4384} {"train_loss": -7.106357574462891, "global_step": 184132, "epoch": 4384} {"train_loss": -7.062308311462402, "global_step": 184133, "epoch": 4384} {"train_loss": -7.225821495056152, "global_step": 184134, "epoch": 4384} {"train_loss": -7.246939182281494, "global_step": 184135, "epoch": 4384} {"train_loss": -7.153717041015625, "global_step": 184136, "epoch": 4384} {"train_loss": -7.126594543457031, "global_step": 184137, "epoch": 4384} {"train_loss": -7.217833042144775, "global_step": 184138, "epoch": 4384} {"train_loss": -7.215127468109131, "global_step": 184139, "epoch": 4384} {"train_loss": -7.2528228759765625, "global_step": 184140, "epoch": 4384} {"train_loss": -7.104872703552246, "global_step": 184141, "epoch": 4384} {"train_loss": -7.149847030639648, "global_step": 184142, "epoch": 4384} {"train_loss": -7.159455299377441, "global_step": 184143, "epoch": 4384} {"train_loss": -7.003812789916992, "global_step": 184144, "epoch": 4384} {"train_loss": -7.1828460693359375, "global_step": 184145, "epoch": 4384} {"train_loss": -7.086390495300293, "global_step": 184146, "epoch": 4384} {"train_loss": -7.095689296722412, "global_step": 184147, "epoch": 4384} {"train_loss": -7.2300004959106445, "global_step": 184148, "epoch": 4384} {"train_loss": -7.172024726867676, "global_step": 184149, "epoch": 4384} {"train_loss": -7.226558685302734, "global_step": 184150, "epoch": 4384} {"train_loss": -7.146902084350586, "global_step": 184151, "epoch": 4384} {"train_loss": -7.113824367523193, "global_step": 184152, "epoch": 4384} {"train_loss": -7.210354804992676, "global_step": 184153, "epoch": 4384} {"train_loss": -7.133655548095703, "global_step": 184154, "epoch": 4384} {"train_loss": -6.953892707824707, "global_step": 184155, "epoch": 4384} {"train_loss": -7.202960014343262, "global_step": 184156, "epoch": 4384} {"train_loss": -7.215060234069824, "global_step": 184157, "epoch": 4384} {"train_loss": -7.1284003257751465, "global_step": 184158, "epoch": 4384} {"train_loss": -7.161561012268066, "global_step": 184159, "epoch": 4384} {"train_loss": -7.185600280761719, "global_step": 184160, "epoch": 4384} {"train_loss": -7.027130126953125, "global_step": 184161, "epoch": 4384} {"train_loss": -7.108121395111084, "global_step": 184162, "epoch": 4384} {"train_loss": -7.070361137390137, "global_step": 184163, "epoch": 4384} {"train_loss": -7.227710723876953, "global_step": 184164, "epoch": 4384} {"train_loss": -7.154542922973633, "global_step": 184165, "epoch": 4384} {"train_loss": -7.136220455169678, "global_step": 184166, "epoch": 4384} {"train_loss": -7.179781913757324, "global_step": 184167, "epoch": 4384} {"train_loss": -7.176565170288086, "global_step": 184168, "epoch": 4384} {"train_loss": -7.146390267780849, "global_step": 184169, "epoch": 4384, "val_loss": 80896.3125} {"train_loss": -7.158770561218262, "global_step": 184170, "epoch": 4385} {"train_loss": -7.069085121154785, "global_step": 184171, "epoch": 4385} {"train_loss": -7.177955627441406, "global_step": 184172, "epoch": 4385} {"train_loss": -7.012363433837891, "global_step": 184173, "epoch": 4385} {"train_loss": -7.144235134124756, "global_step": 184174, "epoch": 4385} {"train_loss": -7.226967811584473, "global_step": 184175, "epoch": 4385} {"train_loss": -7.210370063781738, "global_step": 184176, "epoch": 4385} {"train_loss": -7.012288570404053, "global_step": 184177, "epoch": 4385} {"train_loss": -7.1041388511657715, "global_step": 184178, "epoch": 4385} {"train_loss": -7.130160808563232, "global_step": 184179, "epoch": 4385} {"train_loss": -7.114727020263672, "global_step": 184180, "epoch": 4385} {"train_loss": -7.099846363067627, "global_step": 184181, "epoch": 4385} {"train_loss": -7.143326759338379, "global_step": 184182, "epoch": 4385} {"train_loss": -7.226159572601318, "global_step": 184183, "epoch": 4385} {"train_loss": -7.1192121505737305, "global_step": 184184, "epoch": 4385} {"train_loss": -7.194139003753662, "global_step": 184185, "epoch": 4385} {"train_loss": -7.219234466552734, "global_step": 184186, "epoch": 4385} {"train_loss": -7.147981643676758, "global_step": 184187, "epoch": 4385} {"train_loss": -7.14674186706543, "global_step": 184188, "epoch": 4385} {"train_loss": -7.131316184997559, "global_step": 184189, "epoch": 4385} {"train_loss": -7.108489990234375, "global_step": 184190, "epoch": 4385} {"train_loss": -7.207685947418213, "global_step": 184191, "epoch": 4385} {"train_loss": -7.160388469696045, "global_step": 184192, "epoch": 4385} {"train_loss": -7.136390686035156, "global_step": 184193, "epoch": 4385} {"train_loss": -7.219377517700195, "global_step": 184194, "epoch": 4385} {"train_loss": -7.076113224029541, "global_step": 184195, "epoch": 4385} {"train_loss": -7.14970588684082, "global_step": 184196, "epoch": 4385} {"train_loss": -7.141812324523926, "global_step": 184197, "epoch": 4385} {"train_loss": -7.131382465362549, "global_step": 184198, "epoch": 4385} {"train_loss": -7.197454929351807, "global_step": 184199, "epoch": 4385} {"train_loss": -7.105266571044922, "global_step": 184200, "epoch": 4385} {"train_loss": -7.134819030761719, "global_step": 184201, "epoch": 4385} {"train_loss": -7.129059314727783, "global_step": 184202, "epoch": 4385} {"train_loss": -7.123128414154053, "global_step": 184203, "epoch": 4385} {"train_loss": -7.2129130363464355, "global_step": 184204, "epoch": 4385} {"train_loss": -7.15695858001709, "global_step": 184205, "epoch": 4385} {"train_loss": -7.200946807861328, "global_step": 184206, "epoch": 4385} {"train_loss": -7.118575096130371, "global_step": 184207, "epoch": 4385} {"train_loss": -7.109206676483154, "global_step": 184208, "epoch": 4385} {"train_loss": -7.264731407165527, "global_step": 184209, "epoch": 4385} {"train_loss": -7.168518543243408, "global_step": 184210, "epoch": 4385} {"train_loss": -7.147769530614217, "global_step": 184211, "epoch": 4385, "val_loss": 80635.3515625} {"train_loss": -6.991391658782959, "global_step": 184212, "epoch": 4386} {"train_loss": -7.1004638671875, "global_step": 184213, "epoch": 4386} {"train_loss": -7.1812639236450195, "global_step": 184214, "epoch": 4386} {"train_loss": -7.0738630294799805, "global_step": 184215, "epoch": 4386} {"train_loss": -7.105550289154053, "global_step": 184216, "epoch": 4386} {"train_loss": -7.1181440353393555, "global_step": 184217, "epoch": 4386} {"train_loss": -7.144289970397949, "global_step": 184218, "epoch": 4386} {"train_loss": -7.101896286010742, "global_step": 184219, "epoch": 4386} {"train_loss": -7.098623275756836, "global_step": 184220, "epoch": 4386} {"train_loss": -7.07756233215332, "global_step": 184221, "epoch": 4386} {"train_loss": -7.122406005859375, "global_step": 184222, "epoch": 4386} {"train_loss": -7.216379165649414, "global_step": 184223, "epoch": 4386} {"train_loss": -7.0371198654174805, "global_step": 184224, "epoch": 4386} {"train_loss": -7.178969383239746, "global_step": 184225, "epoch": 4386} {"train_loss": -7.121955871582031, "global_step": 184226, "epoch": 4386} {"train_loss": -7.095934867858887, "global_step": 184227, "epoch": 4386} {"train_loss": -7.202075004577637, "global_step": 184228, "epoch": 4386} {"train_loss": -7.1887593269348145, "global_step": 184229, "epoch": 4386} {"train_loss": -7.165532112121582, "global_step": 184230, "epoch": 4386} {"train_loss": -7.217128753662109, "global_step": 184231, "epoch": 4386} {"train_loss": -7.129103660583496, "global_step": 184232, "epoch": 4386} {"train_loss": -7.181096076965332, "global_step": 184233, "epoch": 4386} {"train_loss": -7.093927383422852, "global_step": 184234, "epoch": 4386} {"train_loss": -7.141888618469238, "global_step": 184235, "epoch": 4386} {"train_loss": -7.269196033477783, "global_step": 184236, "epoch": 4386} {"train_loss": -7.150812149047852, "global_step": 184237, "epoch": 4386} {"train_loss": -7.2625274658203125, "global_step": 184238, "epoch": 4386} {"train_loss": -7.219673156738281, "global_step": 184239, "epoch": 4386} {"train_loss": -7.205286026000977, "global_step": 184240, "epoch": 4386} {"train_loss": -7.125048637390137, "global_step": 184241, "epoch": 4386} {"train_loss": -7.283718585968018, "global_step": 184242, "epoch": 4386} {"train_loss": -7.233229637145996, "global_step": 184243, "epoch": 4386} {"train_loss": -7.257997512817383, "global_step": 184244, "epoch": 4386} {"train_loss": -7.193337440490723, "global_step": 184245, "epoch": 4386} {"train_loss": -7.262479305267334, "global_step": 184246, "epoch": 4386} {"train_loss": -7.18618631362915, "global_step": 184247, "epoch": 4386} {"train_loss": -7.234066963195801, "global_step": 184248, "epoch": 4386} {"train_loss": -7.306390762329102, "global_step": 184249, "epoch": 4386} {"train_loss": -7.139581203460693, "global_step": 184250, "epoch": 4386} {"train_loss": -7.235353946685791, "global_step": 184251, "epoch": 4386} {"train_loss": -7.145771026611328, "global_step": 184252, "epoch": 4386} {"train_loss": -7.16560655548459, "global_step": 184253, "epoch": 4386, "val_loss": 80764.828125} {"train_loss": -7.255241394042969, "global_step": 184254, "epoch": 4387} {"train_loss": -7.30394983291626, "global_step": 184255, "epoch": 4387} {"train_loss": -7.1241960525512695, "global_step": 184256, "epoch": 4387} {"train_loss": -7.151033401489258, "global_step": 184257, "epoch": 4387} {"train_loss": -7.225635528564453, "global_step": 184258, "epoch": 4387} {"train_loss": -7.2784223556518555, "global_step": 184259, "epoch": 4387} {"train_loss": -7.340831279754639, "global_step": 184260, "epoch": 4387} {"train_loss": -7.051789283752441, "global_step": 184261, "epoch": 4387} {"train_loss": -7.226133346557617, "global_step": 184262, "epoch": 4387} {"train_loss": -7.10678768157959, "global_step": 184263, "epoch": 4387} {"train_loss": -7.181666374206543, "global_step": 184264, "epoch": 4387} {"train_loss": -7.152396202087402, "global_step": 184265, "epoch": 4387} {"train_loss": -7.235261917114258, "global_step": 184266, "epoch": 4387} {"train_loss": -7.148545265197754, "global_step": 184267, "epoch": 4387} {"train_loss": -7.045389175415039, "global_step": 184268, "epoch": 4387} {"train_loss": -7.198667526245117, "global_step": 184269, "epoch": 4387} {"train_loss": -7.151889801025391, "global_step": 184270, "epoch": 4387} {"train_loss": -7.089902877807617, "global_step": 184271, "epoch": 4387} {"train_loss": -7.100345611572266, "global_step": 184272, "epoch": 4387} {"train_loss": -6.98972225189209, "global_step": 184273, "epoch": 4387} {"train_loss": -7.141632080078125, "global_step": 184274, "epoch": 4387} {"train_loss": -7.207531929016113, "global_step": 184275, "epoch": 4387} {"train_loss": -7.153253555297852, "global_step": 184276, "epoch": 4387} {"train_loss": -7.206236839294434, "global_step": 184277, "epoch": 4387} {"train_loss": -7.006800651550293, "global_step": 184278, "epoch": 4387} {"train_loss": -7.145040035247803, "global_step": 184279, "epoch": 4387} {"train_loss": -7.229963302612305, "global_step": 184280, "epoch": 4387} {"train_loss": -7.183932781219482, "global_step": 184281, "epoch": 4387} {"train_loss": -7.201637268066406, "global_step": 184282, "epoch": 4387} {"train_loss": -7.066797733306885, "global_step": 184283, "epoch": 4387} {"train_loss": -7.141945838928223, "global_step": 184284, "epoch": 4387} {"train_loss": -7.2012200355529785, "global_step": 184285, "epoch": 4387} {"train_loss": -7.07077169418335, "global_step": 184286, "epoch": 4387} {"train_loss": -7.05446720123291, "global_step": 184287, "epoch": 4387} {"train_loss": -7.155057430267334, "global_step": 184288, "epoch": 4387} {"train_loss": -7.021871566772461, "global_step": 184289, "epoch": 4387} {"train_loss": -7.199776649475098, "global_step": 184290, "epoch": 4387} {"train_loss": -7.252617835998535, "global_step": 184291, "epoch": 4387} {"train_loss": -7.194461822509766, "global_step": 184292, "epoch": 4387} {"train_loss": -7.06134033203125, "global_step": 184293, "epoch": 4387} {"train_loss": -7.158077716827393, "global_step": 184294, "epoch": 4387} {"train_loss": -7.153769356863839, "global_step": 184295, "epoch": 4387, "val_loss": 80725.3203125} {"train_loss": -7.20815372467041, "global_step": 184296, "epoch": 4388} {"train_loss": -7.221351623535156, "global_step": 184297, "epoch": 4388} {"train_loss": -7.0862531661987305, "global_step": 184298, "epoch": 4388} {"train_loss": -7.179086685180664, "global_step": 184299, "epoch": 4388} {"train_loss": -7.183225631713867, "global_step": 184300, "epoch": 4388} {"train_loss": -7.152597427368164, "global_step": 184301, "epoch": 4388} {"train_loss": -7.2502241134643555, "global_step": 184302, "epoch": 4388} {"train_loss": -7.310864448547363, "global_step": 184303, "epoch": 4388} {"train_loss": -7.209822654724121, "global_step": 184304, "epoch": 4388} {"train_loss": -7.327408790588379, "global_step": 184305, "epoch": 4388} {"train_loss": -7.230274200439453, "global_step": 184306, "epoch": 4388} {"train_loss": -7.292235374450684, "global_step": 184307, "epoch": 4388} {"train_loss": -7.252035140991211, "global_step": 184308, "epoch": 4388} {"train_loss": -7.253726959228516, "global_step": 184309, "epoch": 4388} {"train_loss": -7.262462615966797, "global_step": 184310, "epoch": 4388} {"train_loss": -7.226479530334473, "global_step": 184311, "epoch": 4388} {"train_loss": -7.275331974029541, "global_step": 184312, "epoch": 4388} {"train_loss": -7.124830722808838, "global_step": 184313, "epoch": 4388} {"train_loss": -7.161678314208984, "global_step": 184314, "epoch": 4388} {"train_loss": -7.250017166137695, "global_step": 184315, "epoch": 4388} {"train_loss": -7.208003044128418, "global_step": 184316, "epoch": 4388} {"train_loss": -7.155578136444092, "global_step": 184317, "epoch": 4388} {"train_loss": -7.117377758026123, "global_step": 184318, "epoch": 4388} {"train_loss": -7.128708362579346, "global_step": 184319, "epoch": 4388} {"train_loss": -7.192144393920898, "global_step": 184320, "epoch": 4388} {"train_loss": -7.1586737632751465, "global_step": 184321, "epoch": 4388} {"train_loss": -7.172111511230469, "global_step": 184322, "epoch": 4388} {"train_loss": -7.1484293937683105, "global_step": 184323, "epoch": 4388} {"train_loss": -7.152420997619629, "global_step": 184324, "epoch": 4388} {"train_loss": -7.3050007820129395, "global_step": 184325, "epoch": 4388} {"train_loss": -7.071970462799072, "global_step": 184326, "epoch": 4388} {"train_loss": -7.188142776489258, "global_step": 184327, "epoch": 4388} {"train_loss": -7.237532615661621, "global_step": 184328, "epoch": 4388} {"train_loss": -7.1407670974731445, "global_step": 184329, "epoch": 4388} {"train_loss": -7.183223724365234, "global_step": 184330, "epoch": 4388} {"train_loss": -7.016396999359131, "global_step": 184331, "epoch": 4388} {"train_loss": -7.191874980926514, "global_step": 184332, "epoch": 4388} {"train_loss": -7.157393932342529, "global_step": 184333, "epoch": 4388} {"train_loss": -7.115725994110107, "global_step": 184334, "epoch": 4388} {"train_loss": -7.086692810058594, "global_step": 184335, "epoch": 4388} {"train_loss": -7.129796504974365, "global_step": 184336, "epoch": 4388} {"train_loss": -7.189814238321214, "global_step": 184337, "epoch": 4388, "val_loss": 80571.078125} {"train_loss": -7.086093425750732, "global_step": 184338, "epoch": 4389} {"train_loss": -7.163276672363281, "global_step": 184339, "epoch": 4389} {"train_loss": -7.118556499481201, "global_step": 184340, "epoch": 4389} {"train_loss": -7.241163730621338, "global_step": 184341, "epoch": 4389} {"train_loss": -7.184635162353516, "global_step": 184342, "epoch": 4389} {"train_loss": -7.064792633056641, "global_step": 184343, "epoch": 4389} {"train_loss": -7.1374053955078125, "global_step": 184344, "epoch": 4389} {"train_loss": -7.243148326873779, "global_step": 184345, "epoch": 4389} {"train_loss": -7.142780303955078, "global_step": 184346, "epoch": 4389} {"train_loss": -7.176154136657715, "global_step": 184347, "epoch": 4389} {"train_loss": -7.163616180419922, "global_step": 184348, "epoch": 4389} {"train_loss": -7.163942337036133, "global_step": 184349, "epoch": 4389} {"train_loss": -7.192744255065918, "global_step": 184350, "epoch": 4389} {"train_loss": -7.142304420471191, "global_step": 184351, "epoch": 4389} {"train_loss": -7.124417304992676, "global_step": 184352, "epoch": 4389} {"train_loss": -7.156668186187744, "global_step": 184353, "epoch": 4389} {"train_loss": -7.090005874633789, "global_step": 184354, "epoch": 4389} {"train_loss": -7.112333297729492, "global_step": 184355, "epoch": 4389} {"train_loss": -7.1086931228637695, "global_step": 184356, "epoch": 4389} {"train_loss": -7.080415725708008, "global_step": 184357, "epoch": 4389} {"train_loss": -7.21309232711792, "global_step": 184358, "epoch": 4389} {"train_loss": -7.08671760559082, "global_step": 184359, "epoch": 4389} {"train_loss": -7.167670249938965, "global_step": 184360, "epoch": 4389} {"train_loss": -6.934231758117676, "global_step": 184361, "epoch": 4389} {"train_loss": -7.095561981201172, "global_step": 184362, "epoch": 4389} {"train_loss": -7.05833101272583, "global_step": 184363, "epoch": 4389} {"train_loss": -6.932595729827881, "global_step": 184364, "epoch": 4389} {"train_loss": -7.154329299926758, "global_step": 184365, "epoch": 4389} {"train_loss": -6.927896499633789, "global_step": 184366, "epoch": 4389} {"train_loss": -7.054868698120117, "global_step": 184367, "epoch": 4389} {"train_loss": -7.02187442779541, "global_step": 184368, "epoch": 4389} {"train_loss": -6.962194442749023, "global_step": 184369, "epoch": 4389} {"train_loss": -7.0749616622924805, "global_step": 184370, "epoch": 4389} {"train_loss": -7.169817924499512, "global_step": 184371, "epoch": 4389} {"train_loss": -7.1056694984436035, "global_step": 184372, "epoch": 4389} {"train_loss": -7.19312858581543, "global_step": 184373, "epoch": 4389} {"train_loss": -7.120321273803711, "global_step": 184374, "epoch": 4389} {"train_loss": -7.239917755126953, "global_step": 184375, "epoch": 4389} {"train_loss": -7.043395042419434, "global_step": 184376, "epoch": 4389} {"train_loss": -7.154440879821777, "global_step": 184377, "epoch": 4389} {"train_loss": -7.079229354858398, "global_step": 184378, "epoch": 4389} {"train_loss": -7.112857591538202, "global_step": 184379, "epoch": 4389, "val_loss": 80870.78125} {"train_loss": -7.140507698059082, "global_step": 184380, "epoch": 4390} {"train_loss": -7.184598922729492, "global_step": 184381, "epoch": 4390} {"train_loss": -7.145194053649902, "global_step": 184382, "epoch": 4390} {"train_loss": -7.203803539276123, "global_step": 184383, "epoch": 4390} {"train_loss": -7.0951409339904785, "global_step": 184384, "epoch": 4390} {"train_loss": -7.202043533325195, "global_step": 184385, "epoch": 4390} {"train_loss": -7.1537370681762695, "global_step": 184386, "epoch": 4390} {"train_loss": -7.094902515411377, "global_step": 184387, "epoch": 4390} {"train_loss": -7.2264204025268555, "global_step": 184388, "epoch": 4390} {"train_loss": -7.131224632263184, "global_step": 184389, "epoch": 4390} {"train_loss": -7.137127876281738, "global_step": 184390, "epoch": 4390} {"train_loss": -7.226423263549805, "global_step": 184391, "epoch": 4390} {"train_loss": -7.198207855224609, "global_step": 184392, "epoch": 4390} {"train_loss": -7.118923664093018, "global_step": 184393, "epoch": 4390} {"train_loss": -7.057049751281738, "global_step": 184394, "epoch": 4390} {"train_loss": -7.178110122680664, "global_step": 184395, "epoch": 4390} {"train_loss": -7.135326862335205, "global_step": 184396, "epoch": 4390} {"train_loss": -7.055355072021484, "global_step": 184397, "epoch": 4390} {"train_loss": -7.145224571228027, "global_step": 184398, "epoch": 4390} {"train_loss": -7.2011847496032715, "global_step": 184399, "epoch": 4390} {"train_loss": -7.000235557556152, "global_step": 184400, "epoch": 4390} {"train_loss": -7.100285053253174, "global_step": 184401, "epoch": 4390} {"train_loss": -7.115335464477539, "global_step": 184402, "epoch": 4390} {"train_loss": -7.135128021240234, "global_step": 184403, "epoch": 4390} {"train_loss": -7.284262657165527, "global_step": 184404, "epoch": 4390} {"train_loss": -7.152042388916016, "global_step": 184405, "epoch": 4390} {"train_loss": -7.18251895904541, "global_step": 184406, "epoch": 4390} {"train_loss": -7.227022171020508, "global_step": 184407, "epoch": 4390} {"train_loss": -7.205757141113281, "global_step": 184408, "epoch": 4390} {"train_loss": -7.105329990386963, "global_step": 184409, "epoch": 4390} {"train_loss": -7.222408294677734, "global_step": 184410, "epoch": 4390} {"train_loss": -7.1999053955078125, "global_step": 184411, "epoch": 4390} {"train_loss": -7.070084095001221, "global_step": 184412, "epoch": 4390} {"train_loss": -7.231956481933594, "global_step": 184413, "epoch": 4390} {"train_loss": -7.229315280914307, "global_step": 184414, "epoch": 4390} {"train_loss": -7.014588356018066, "global_step": 184415, "epoch": 4390} {"train_loss": -7.10256814956665, "global_step": 184416, "epoch": 4390} {"train_loss": -7.176555156707764, "global_step": 184417, "epoch": 4390} {"train_loss": -7.059783935546875, "global_step": 184418, "epoch": 4390} {"train_loss": -7.162094593048096, "global_step": 184419, "epoch": 4390} {"train_loss": -7.199184417724609, "global_step": 184420, "epoch": 4390} {"train_loss": -7.15348516191755, "global_step": 184421, "epoch": 4390, "val_loss": 80772.4609375} {"train_loss": -7.171348571777344, "global_step": 184422, "epoch": 4391} {"train_loss": -7.213009834289551, "global_step": 184423, "epoch": 4391} {"train_loss": -7.205466270446777, "global_step": 184424, "epoch": 4391} {"train_loss": -7.282174587249756, "global_step": 184425, "epoch": 4391} {"train_loss": -7.236019134521484, "global_step": 184426, "epoch": 4391} {"train_loss": -7.144111633300781, "global_step": 184427, "epoch": 4391} {"train_loss": -7.190940856933594, "global_step": 184428, "epoch": 4391} {"train_loss": -7.187603950500488, "global_step": 184429, "epoch": 4391} {"train_loss": -7.216916084289551, "global_step": 184430, "epoch": 4391} {"train_loss": -7.156074523925781, "global_step": 184431, "epoch": 4391} {"train_loss": -7.063714504241943, "global_step": 184432, "epoch": 4391} {"train_loss": -7.031073570251465, "global_step": 184433, "epoch": 4391} {"train_loss": -7.097707748413086, "global_step": 184434, "epoch": 4391} {"train_loss": -7.124075889587402, "global_step": 184435, "epoch": 4391} {"train_loss": -7.081212043762207, "global_step": 184436, "epoch": 4391} {"train_loss": -7.199036598205566, "global_step": 184437, "epoch": 4391} {"train_loss": -7.171257972717285, "global_step": 184438, "epoch": 4391} {"train_loss": -7.010044097900391, "global_step": 184439, "epoch": 4391} {"train_loss": -7.096527099609375, "global_step": 184440, "epoch": 4391} {"train_loss": -7.061483383178711, "global_step": 184441, "epoch": 4391} {"train_loss": -7.0438408851623535, "global_step": 184442, "epoch": 4391} {"train_loss": -7.02851676940918, "global_step": 184443, "epoch": 4391} {"train_loss": -6.928793430328369, "global_step": 184444, "epoch": 4391} {"train_loss": -7.154427528381348, "global_step": 184445, "epoch": 4391} {"train_loss": -6.950125217437744, "global_step": 184446, "epoch": 4391} {"train_loss": -7.034061431884766, "global_step": 184447, "epoch": 4391} {"train_loss": -7.066982269287109, "global_step": 184448, "epoch": 4391} {"train_loss": -7.113969326019287, "global_step": 184449, "epoch": 4391} {"train_loss": -6.942090034484863, "global_step": 184450, "epoch": 4391} {"train_loss": -7.093183517456055, "global_step": 184451, "epoch": 4391} {"train_loss": -7.130349636077881, "global_step": 184452, "epoch": 4391} {"train_loss": -7.146820068359375, "global_step": 184453, "epoch": 4391} {"train_loss": -7.181606292724609, "global_step": 184454, "epoch": 4391} {"train_loss": -7.144218444824219, "global_step": 184455, "epoch": 4391} {"train_loss": -7.093582630157471, "global_step": 184456, "epoch": 4391} {"train_loss": -7.183947563171387, "global_step": 184457, "epoch": 4391} {"train_loss": -7.1935505867004395, "global_step": 184458, "epoch": 4391} {"train_loss": -7.058846473693848, "global_step": 184459, "epoch": 4391} {"train_loss": -7.200101375579834, "global_step": 184460, "epoch": 4391} {"train_loss": -7.125988006591797, "global_step": 184461, "epoch": 4391} {"train_loss": -7.150676727294922, "global_step": 184462, "epoch": 4391} {"train_loss": -7.118974265598116, "global_step": 184463, "epoch": 4391, "val_loss": 80491.6328125} {"train_loss": -7.21912956237793, "global_step": 184464, "epoch": 4392} {"train_loss": -7.0105133056640625, "global_step": 184465, "epoch": 4392} {"train_loss": -7.259178161621094, "global_step": 184466, "epoch": 4392} {"train_loss": -7.060295104980469, "global_step": 184467, "epoch": 4392} {"train_loss": -7.103880882263184, "global_step": 184468, "epoch": 4392} {"train_loss": -7.212590217590332, "global_step": 184469, "epoch": 4392} {"train_loss": -7.025279998779297, "global_step": 184470, "epoch": 4392} {"train_loss": -7.134124755859375, "global_step": 184471, "epoch": 4392} {"train_loss": -7.12867546081543, "global_step": 184472, "epoch": 4392} {"train_loss": -7.1299591064453125, "global_step": 184473, "epoch": 4392} {"train_loss": -7.156935691833496, "global_step": 184474, "epoch": 4392} {"train_loss": -7.112660884857178, "global_step": 184475, "epoch": 4392} {"train_loss": -7.166937351226807, "global_step": 184476, "epoch": 4392} {"train_loss": -7.235851287841797, "global_step": 184477, "epoch": 4392} {"train_loss": -7.170938014984131, "global_step": 184478, "epoch": 4392} {"train_loss": -7.21010684967041, "global_step": 184479, "epoch": 4392} {"train_loss": -7.164273262023926, "global_step": 184480, "epoch": 4392} {"train_loss": -7.1465044021606445, "global_step": 184481, "epoch": 4392} {"train_loss": -7.194436073303223, "global_step": 184482, "epoch": 4392} {"train_loss": -7.195706367492676, "global_step": 184483, "epoch": 4392} {"train_loss": -7.274302959442139, "global_step": 184484, "epoch": 4392} {"train_loss": -7.129240036010742, "global_step": 184485, "epoch": 4392} {"train_loss": -7.126631736755371, "global_step": 184486, "epoch": 4392} {"train_loss": -7.123979568481445, "global_step": 184487, "epoch": 4392} {"train_loss": -7.129114151000977, "global_step": 184488, "epoch": 4392} {"train_loss": -7.198192596435547, "global_step": 184489, "epoch": 4392} {"train_loss": -7.190444469451904, "global_step": 184490, "epoch": 4392} {"train_loss": -7.266300678253174, "global_step": 184491, "epoch": 4392} {"train_loss": -7.275332450866699, "global_step": 184492, "epoch": 4392} {"train_loss": -7.2013702392578125, "global_step": 184493, "epoch": 4392} {"train_loss": -7.201211929321289, "global_step": 184494, "epoch": 4392} {"train_loss": -7.263404846191406, "global_step": 184495, "epoch": 4392} {"train_loss": -7.151381492614746, "global_step": 184496, "epoch": 4392} {"train_loss": -7.1892595291137695, "global_step": 184497, "epoch": 4392} {"train_loss": -7.16923189163208, "global_step": 184498, "epoch": 4392} {"train_loss": -7.1004228591918945, "global_step": 184499, "epoch": 4392} {"train_loss": -7.105093002319336, "global_step": 184500, "epoch": 4392} {"train_loss": -7.223677158355713, "global_step": 184501, "epoch": 4392} {"train_loss": -7.071997165679932, "global_step": 184502, "epoch": 4392} {"train_loss": -7.159685134887695, "global_step": 184503, "epoch": 4392} {"train_loss": -7.077543258666992, "global_step": 184504, "epoch": 4392} {"train_loss": -7.164521807716007, "global_step": 184505, "epoch": 4392, "val_loss": 80699.1875} {"train_loss": -7.25347900390625, "global_step": 184506, "epoch": 4393} {"train_loss": -7.138397693634033, "global_step": 184507, "epoch": 4393} {"train_loss": -7.285121917724609, "global_step": 184508, "epoch": 4393} {"train_loss": -7.288689613342285, "global_step": 184509, "epoch": 4393} {"train_loss": -7.14351224899292, "global_step": 184510, "epoch": 4393} {"train_loss": -7.179224014282227, "global_step": 184511, "epoch": 4393} {"train_loss": -7.159467697143555, "global_step": 184512, "epoch": 4393} {"train_loss": -6.937672138214111, "global_step": 184513, "epoch": 4393} {"train_loss": -7.02388334274292, "global_step": 184514, "epoch": 4393} {"train_loss": -7.019729137420654, "global_step": 184515, "epoch": 4393} {"train_loss": -7.027188301086426, "global_step": 184516, "epoch": 4393} {"train_loss": -7.127973556518555, "global_step": 184517, "epoch": 4393} {"train_loss": -7.185858726501465, "global_step": 184518, "epoch": 4393} {"train_loss": -7.077939033508301, "global_step": 184519, "epoch": 4393} {"train_loss": -7.155428886413574, "global_step": 184520, "epoch": 4393} {"train_loss": -7.0026750564575195, "global_step": 184521, "epoch": 4393} {"train_loss": -7.077856063842773, "global_step": 184522, "epoch": 4393} {"train_loss": -7.097958087921143, "global_step": 184523, "epoch": 4393} {"train_loss": -7.042843341827393, "global_step": 184524, "epoch": 4393} {"train_loss": -7.063076019287109, "global_step": 184525, "epoch": 4393} {"train_loss": -7.054248332977295, "global_step": 184526, "epoch": 4393} {"train_loss": -7.1227192878723145, "global_step": 184527, "epoch": 4393} {"train_loss": -7.0749053955078125, "global_step": 184528, "epoch": 4393} {"train_loss": -7.103209495544434, "global_step": 184529, "epoch": 4393} {"train_loss": -7.19371223449707, "global_step": 184530, "epoch": 4393} {"train_loss": -7.187763214111328, "global_step": 184531, "epoch": 4393} {"train_loss": -7.0669846534729, "global_step": 184532, "epoch": 4393} {"train_loss": -7.100888252258301, "global_step": 184533, "epoch": 4393} {"train_loss": -7.159626007080078, "global_step": 184534, "epoch": 4393} {"train_loss": -7.0499587059021, "global_step": 184535, "epoch": 4393} {"train_loss": -7.100133895874023, "global_step": 184536, "epoch": 4393} {"train_loss": -7.144975662231445, "global_step": 184537, "epoch": 4393} {"train_loss": -7.117537498474121, "global_step": 184538, "epoch": 4393} {"train_loss": -7.140771389007568, "global_step": 184539, "epoch": 4393} {"train_loss": -7.143577575683594, "global_step": 184540, "epoch": 4393} {"train_loss": -7.174356937408447, "global_step": 184541, "epoch": 4393} {"train_loss": -7.217099189758301, "global_step": 184542, "epoch": 4393} {"train_loss": -7.180914878845215, "global_step": 184543, "epoch": 4393} {"train_loss": -7.255370140075684, "global_step": 184544, "epoch": 4393} {"train_loss": -7.121114730834961, "global_step": 184545, "epoch": 4393} {"train_loss": -7.1345977783203125, "global_step": 184546, "epoch": 4393} {"train_loss": -7.126279070263817, "global_step": 184547, "epoch": 4393, "val_loss": 80564.0546875} {"train_loss": -7.116507530212402, "global_step": 184548, "epoch": 4394} {"train_loss": -7.28371524810791, "global_step": 184549, "epoch": 4394} {"train_loss": -7.131280899047852, "global_step": 184550, "epoch": 4394} {"train_loss": -7.211308002471924, "global_step": 184551, "epoch": 4394} {"train_loss": -7.0680975914001465, "global_step": 184552, "epoch": 4394} {"train_loss": -7.20923376083374, "global_step": 184553, "epoch": 4394} {"train_loss": -7.169894218444824, "global_step": 184554, "epoch": 4394} {"train_loss": -7.118165493011475, "global_step": 184555, "epoch": 4394} {"train_loss": -7.242987632751465, "global_step": 184556, "epoch": 4394} {"train_loss": -7.118578910827637, "global_step": 184557, "epoch": 4394} {"train_loss": -7.192728519439697, "global_step": 184558, "epoch": 4394} {"train_loss": -7.091263771057129, "global_step": 184559, "epoch": 4394} {"train_loss": -7.236260414123535, "global_step": 184560, "epoch": 4394} {"train_loss": -7.229003429412842, "global_step": 184561, "epoch": 4394} {"train_loss": -7.203204154968262, "global_step": 184562, "epoch": 4394} {"train_loss": -7.242815971374512, "global_step": 184563, "epoch": 4394} {"train_loss": -7.244738578796387, "global_step": 184564, "epoch": 4394} {"train_loss": -7.236620903015137, "global_step": 184565, "epoch": 4394} {"train_loss": -7.1620001792907715, "global_step": 184566, "epoch": 4394} {"train_loss": -7.124398708343506, "global_step": 184567, "epoch": 4394} {"train_loss": -7.206578254699707, "global_step": 184568, "epoch": 4394} {"train_loss": -7.234375476837158, "global_step": 184569, "epoch": 4394} {"train_loss": -7.227679252624512, "global_step": 184570, "epoch": 4394} {"train_loss": -7.168580055236816, "global_step": 184571, "epoch": 4394} {"train_loss": -7.1347761154174805, "global_step": 184572, "epoch": 4394} {"train_loss": -7.2626633644104, "global_step": 184573, "epoch": 4394} {"train_loss": -7.255681037902832, "global_step": 184574, "epoch": 4394} {"train_loss": -7.13625431060791, "global_step": 184575, "epoch": 4394} {"train_loss": -7.2546491622924805, "global_step": 184576, "epoch": 4394} {"train_loss": -7.25975227355957, "global_step": 184577, "epoch": 4394} {"train_loss": -7.28195333480835, "global_step": 184578, "epoch": 4394} {"train_loss": -7.133576393127441, "global_step": 184579, "epoch": 4394} {"train_loss": -7.1981916427612305, "global_step": 184580, "epoch": 4394} {"train_loss": -7.217586517333984, "global_step": 184581, "epoch": 4394} {"train_loss": -7.10218620300293, "global_step": 184582, "epoch": 4394} {"train_loss": -7.232817649841309, "global_step": 184583, "epoch": 4394} {"train_loss": -7.062784194946289, "global_step": 184584, "epoch": 4394} {"train_loss": -7.084847927093506, "global_step": 184585, "epoch": 4394} {"train_loss": -7.171278476715088, "global_step": 184586, "epoch": 4394} {"train_loss": -7.138871192932129, "global_step": 184587, "epoch": 4394} {"train_loss": -7.138246059417725, "global_step": 184588, "epoch": 4394} {"train_loss": -7.184493553070795, "global_step": 184589, "epoch": 4394, "val_loss": 80868.828125} {"train_loss": -7.170045852661133, "global_step": 184590, "epoch": 4395} {"train_loss": -7.2150187492370605, "global_step": 184591, "epoch": 4395} {"train_loss": -7.1518754959106445, "global_step": 184592, "epoch": 4395} {"train_loss": -7.268792152404785, "global_step": 184593, "epoch": 4395} {"train_loss": -7.222002983093262, "global_step": 184594, "epoch": 4395} {"train_loss": -7.151359558105469, "global_step": 184595, "epoch": 4395} {"train_loss": -7.038214683532715, "global_step": 184596, "epoch": 4395} {"train_loss": -7.318779945373535, "global_step": 184597, "epoch": 4395} {"train_loss": -7.093730926513672, "global_step": 184598, "epoch": 4395} {"train_loss": -7.234071731567383, "global_step": 184599, "epoch": 4395} {"train_loss": -7.196196556091309, "global_step": 184600, "epoch": 4395} {"train_loss": -7.127866744995117, "global_step": 184601, "epoch": 4395} {"train_loss": -7.026895046234131, "global_step": 184602, "epoch": 4395} {"train_loss": -7.222023010253906, "global_step": 184603, "epoch": 4395} {"train_loss": -7.134411811828613, "global_step": 184604, "epoch": 4395} {"train_loss": -7.180660724639893, "global_step": 184605, "epoch": 4395} {"train_loss": -7.1692118644714355, "global_step": 184606, "epoch": 4395} {"train_loss": -7.198237895965576, "global_step": 184607, "epoch": 4395} {"train_loss": -7.014559745788574, "global_step": 184608, "epoch": 4395} {"train_loss": -7.1003007888793945, "global_step": 184609, "epoch": 4395} {"train_loss": -7.21224308013916, "global_step": 184610, "epoch": 4395} {"train_loss": -7.17426872253418, "global_step": 184611, "epoch": 4395} {"train_loss": -7.236841201782227, "global_step": 184612, "epoch": 4395} {"train_loss": -7.247698783874512, "global_step": 184613, "epoch": 4395} {"train_loss": -7.230384349822998, "global_step": 184614, "epoch": 4395} {"train_loss": -7.193376064300537, "global_step": 184615, "epoch": 4395} {"train_loss": -7.2187042236328125, "global_step": 184616, "epoch": 4395} {"train_loss": -7.283549785614014, "global_step": 184617, "epoch": 4395} {"train_loss": -7.268461227416992, "global_step": 184618, "epoch": 4395} {"train_loss": -7.105632781982422, "global_step": 184619, "epoch": 4395} {"train_loss": -7.140527725219727, "global_step": 184620, "epoch": 4395} {"train_loss": -7.171784400939941, "global_step": 184621, "epoch": 4395} {"train_loss": -7.1961870193481445, "global_step": 184622, "epoch": 4395} {"train_loss": -7.039289951324463, "global_step": 184623, "epoch": 4395} {"train_loss": -7.09022331237793, "global_step": 184624, "epoch": 4395} {"train_loss": -7.163490295410156, "global_step": 184625, "epoch": 4395} {"train_loss": -7.2183027267456055, "global_step": 184626, "epoch": 4395} {"train_loss": -7.1488494873046875, "global_step": 184627, "epoch": 4395} {"train_loss": -7.170310974121094, "global_step": 184628, "epoch": 4395} {"train_loss": -7.1140594482421875, "global_step": 184629, "epoch": 4395} {"train_loss": -7.241267204284668, "global_step": 184630, "epoch": 4395} {"train_loss": -7.173242557616461, "global_step": 184631, "epoch": 4395, "val_loss": 80703.9375} {"train_loss": -7.270516872406006, "global_step": 184632, "epoch": 4396} {"train_loss": -7.168445110321045, "global_step": 184633, "epoch": 4396} {"train_loss": -7.241015911102295, "global_step": 184634, "epoch": 4396} {"train_loss": -7.202971458435059, "global_step": 184635, "epoch": 4396} {"train_loss": -7.220803260803223, "global_step": 184636, "epoch": 4396} {"train_loss": -7.101240634918213, "global_step": 184637, "epoch": 4396} {"train_loss": -7.229047775268555, "global_step": 184638, "epoch": 4396} {"train_loss": -7.092596054077148, "global_step": 184639, "epoch": 4396} {"train_loss": -7.253225326538086, "global_step": 184640, "epoch": 4396} {"train_loss": -7.215577125549316, "global_step": 184641, "epoch": 4396} {"train_loss": -7.094386577606201, "global_step": 184642, "epoch": 4396} {"train_loss": -7.249429702758789, "global_step": 184643, "epoch": 4396} {"train_loss": -7.176177978515625, "global_step": 184644, "epoch": 4396} {"train_loss": -7.138696193695068, "global_step": 184645, "epoch": 4396} {"train_loss": -7.2438836097717285, "global_step": 184646, "epoch": 4396} {"train_loss": -7.132889747619629, "global_step": 184647, "epoch": 4396} {"train_loss": -7.263009071350098, "global_step": 184648, "epoch": 4396} {"train_loss": -7.279149055480957, "global_step": 184649, "epoch": 4396} {"train_loss": -7.249993801116943, "global_step": 184650, "epoch": 4396} {"train_loss": -7.140562057495117, "global_step": 184651, "epoch": 4396} {"train_loss": -7.170923233032227, "global_step": 184652, "epoch": 4396} {"train_loss": -7.193571090698242, "global_step": 184653, "epoch": 4396} {"train_loss": -7.117443561553955, "global_step": 184654, "epoch": 4396} {"train_loss": -7.184722900390625, "global_step": 184655, "epoch": 4396} {"train_loss": -7.177568435668945, "global_step": 184656, "epoch": 4396} {"train_loss": -7.157508850097656, "global_step": 184657, "epoch": 4396} {"train_loss": -7.234630584716797, "global_step": 184658, "epoch": 4396} {"train_loss": -7.164471626281738, "global_step": 184659, "epoch": 4396} {"train_loss": -7.154784202575684, "global_step": 184660, "epoch": 4396} {"train_loss": -7.209262847900391, "global_step": 184661, "epoch": 4396} {"train_loss": -7.095147132873535, "global_step": 184662, "epoch": 4396} {"train_loss": -7.184381008148193, "global_step": 184663, "epoch": 4396} {"train_loss": -7.160127639770508, "global_step": 184664, "epoch": 4396} {"train_loss": -7.14274787902832, "global_step": 184665, "epoch": 4396} {"train_loss": -7.253912925720215, "global_step": 184666, "epoch": 4396} {"train_loss": -7.264397144317627, "global_step": 184667, "epoch": 4396} {"train_loss": -7.2512664794921875, "global_step": 184668, "epoch": 4396} {"train_loss": -7.112179756164551, "global_step": 184669, "epoch": 4396} {"train_loss": -7.221270561218262, "global_step": 184670, "epoch": 4396} {"train_loss": -7.1511077880859375, "global_step": 184671, "epoch": 4396} {"train_loss": -7.2255144119262695, "global_step": 184672, "epoch": 4396} {"train_loss": -7.1924221856253485, "global_step": 184673, "epoch": 4396, "val_loss": 80605.96875} {"train_loss": -7.238348484039307, "global_step": 184674, "epoch": 4397} {"train_loss": -7.145280361175537, "global_step": 184675, "epoch": 4397} {"train_loss": -7.274392127990723, "global_step": 184676, "epoch": 4397} {"train_loss": -7.192564010620117, "global_step": 184677, "epoch": 4397} {"train_loss": -7.127908706665039, "global_step": 184678, "epoch": 4397} {"train_loss": -7.075977802276611, "global_step": 184679, "epoch": 4397} {"train_loss": -7.21829891204834, "global_step": 184680, "epoch": 4397} {"train_loss": -7.203396320343018, "global_step": 184681, "epoch": 4397} {"train_loss": -7.0358195304870605, "global_step": 184682, "epoch": 4397} {"train_loss": -7.165040493011475, "global_step": 184683, "epoch": 4397} {"train_loss": -7.139436721801758, "global_step": 184684, "epoch": 4397} {"train_loss": -7.096626281738281, "global_step": 184685, "epoch": 4397} {"train_loss": -7.207929611206055, "global_step": 184686, "epoch": 4397} {"train_loss": -7.211888313293457, "global_step": 184687, "epoch": 4397} {"train_loss": -7.195350646972656, "global_step": 184688, "epoch": 4397} {"train_loss": -7.200905799865723, "global_step": 184689, "epoch": 4397} {"train_loss": -7.278441429138184, "global_step": 184690, "epoch": 4397} {"train_loss": -7.19809627532959, "global_step": 184691, "epoch": 4397} {"train_loss": -7.3062896728515625, "global_step": 184692, "epoch": 4397} {"train_loss": -7.140017986297607, "global_step": 184693, "epoch": 4397} {"train_loss": -7.215607643127441, "global_step": 184694, "epoch": 4397} {"train_loss": -7.26218318939209, "global_step": 184695, "epoch": 4397} {"train_loss": -7.240935325622559, "global_step": 184696, "epoch": 4397} {"train_loss": -7.216673851013184, "global_step": 184697, "epoch": 4397} {"train_loss": -7.151508331298828, "global_step": 184698, "epoch": 4397} {"train_loss": -7.176881313323975, "global_step": 184699, "epoch": 4397} {"train_loss": -7.112081527709961, "global_step": 184700, "epoch": 4397} {"train_loss": -7.212455749511719, "global_step": 184701, "epoch": 4397} {"train_loss": -7.114858627319336, "global_step": 184702, "epoch": 4397} {"train_loss": -7.104456901550293, "global_step": 184703, "epoch": 4397} {"train_loss": -7.224989414215088, "global_step": 184704, "epoch": 4397} {"train_loss": -7.247352600097656, "global_step": 184705, "epoch": 4397} {"train_loss": -7.111043930053711, "global_step": 184706, "epoch": 4397} {"train_loss": -7.189183235168457, "global_step": 184707, "epoch": 4397} {"train_loss": -7.072392463684082, "global_step": 184708, "epoch": 4397} {"train_loss": -7.086614608764648, "global_step": 184709, "epoch": 4397} {"train_loss": -7.095048904418945, "global_step": 184710, "epoch": 4397} {"train_loss": -7.125552654266357, "global_step": 184711, "epoch": 4397} {"train_loss": -7.086313247680664, "global_step": 184712, "epoch": 4397} {"train_loss": -7.0463056564331055, "global_step": 184713, "epoch": 4397} {"train_loss": -7.179571151733398, "global_step": 184714, "epoch": 4397} {"train_loss": -7.166903132484073, "global_step": 184715, "epoch": 4397, "val_loss": 80857.6953125} {"train_loss": -7.077936172485352, "global_step": 184716, "epoch": 4398} {"train_loss": -6.938831329345703, "global_step": 184717, "epoch": 4398} {"train_loss": -7.145498275756836, "global_step": 184718, "epoch": 4398} {"train_loss": -7.083468437194824, "global_step": 184719, "epoch": 4398} {"train_loss": -7.109646797180176, "global_step": 184720, "epoch": 4398} {"train_loss": -7.074326515197754, "global_step": 184721, "epoch": 4398} {"train_loss": -7.131135940551758, "global_step": 184722, "epoch": 4398} {"train_loss": -7.036623477935791, "global_step": 184723, "epoch": 4398} {"train_loss": -7.059452056884766, "global_step": 184724, "epoch": 4398} {"train_loss": -7.07681941986084, "global_step": 184725, "epoch": 4398} {"train_loss": -7.107061386108398, "global_step": 184726, "epoch": 4398} {"train_loss": -7.081316947937012, "global_step": 184727, "epoch": 4398} {"train_loss": -7.158960342407227, "global_step": 184728, "epoch": 4398} {"train_loss": -7.140304088592529, "global_step": 184729, "epoch": 4398} {"train_loss": -7.141441345214844, "global_step": 184730, "epoch": 4398} {"train_loss": -7.0717620849609375, "global_step": 184731, "epoch": 4398} {"train_loss": -7.18125057220459, "global_step": 184732, "epoch": 4398} {"train_loss": -7.095800399780273, "global_step": 184733, "epoch": 4398} {"train_loss": -7.109879016876221, "global_step": 184734, "epoch": 4398} {"train_loss": -7.126489639282227, "global_step": 184735, "epoch": 4398} {"train_loss": -7.139060974121094, "global_step": 184736, "epoch": 4398} {"train_loss": -7.165422439575195, "global_step": 184737, "epoch": 4398} {"train_loss": -7.062676429748535, "global_step": 184738, "epoch": 4398} {"train_loss": -7.117987632751465, "global_step": 184739, "epoch": 4398} {"train_loss": -7.137619972229004, "global_step": 184740, "epoch": 4398} {"train_loss": -7.0896430015563965, "global_step": 184741, "epoch": 4398} {"train_loss": -7.1271281242370605, "global_step": 184742, "epoch": 4398} {"train_loss": -7.187197685241699, "global_step": 184743, "epoch": 4398} {"train_loss": -7.204813480377197, "global_step": 184744, "epoch": 4398} {"train_loss": -7.1716437339782715, "global_step": 184745, "epoch": 4398} {"train_loss": -7.121627330780029, "global_step": 184746, "epoch": 4398} {"train_loss": -7.215293884277344, "global_step": 184747, "epoch": 4398} {"train_loss": -7.139839172363281, "global_step": 184748, "epoch": 4398} {"train_loss": -7.163856506347656, "global_step": 184749, "epoch": 4398} {"train_loss": -7.139387607574463, "global_step": 184750, "epoch": 4398} {"train_loss": -7.076078414916992, "global_step": 184751, "epoch": 4398} {"train_loss": -7.18996000289917, "global_step": 184752, "epoch": 4398} {"train_loss": -7.121535778045654, "global_step": 184753, "epoch": 4398} {"train_loss": -7.082462310791016, "global_step": 184754, "epoch": 4398} {"train_loss": -7.1595001220703125, "global_step": 184755, "epoch": 4398} {"train_loss": -7.224157333374023, "global_step": 184756, "epoch": 4398} {"train_loss": -7.118330115363712, "global_step": 184757, "epoch": 4398, "val_loss": 81008.2890625} {"train_loss": -7.051342964172363, "global_step": 184758, "epoch": 4399} {"train_loss": -7.231428146362305, "global_step": 184759, "epoch": 4399} {"train_loss": -7.102020740509033, "global_step": 184760, "epoch": 4399} {"train_loss": -7.092756271362305, "global_step": 184761, "epoch": 4399} {"train_loss": -7.038002014160156, "global_step": 184762, "epoch": 4399} {"train_loss": -7.08565616607666, "global_step": 184763, "epoch": 4399} {"train_loss": -6.999570369720459, "global_step": 184764, "epoch": 4399} {"train_loss": -7.116656303405762, "global_step": 184765, "epoch": 4399} {"train_loss": -7.2686944007873535, "global_step": 184766, "epoch": 4399} {"train_loss": -7.012922763824463, "global_step": 184767, "epoch": 4399} {"train_loss": -7.105109691619873, "global_step": 184768, "epoch": 4399} {"train_loss": -7.103965759277344, "global_step": 184769, "epoch": 4399} {"train_loss": -7.077373504638672, "global_step": 184770, "epoch": 4399} {"train_loss": -7.173986434936523, "global_step": 184771, "epoch": 4399} {"train_loss": -7.2270379066467285, "global_step": 184772, "epoch": 4399} {"train_loss": -7.0416412353515625, "global_step": 184773, "epoch": 4399} {"train_loss": -7.1612548828125, "global_step": 184774, "epoch": 4399} {"train_loss": -7.135554790496826, "global_step": 184775, "epoch": 4399} {"train_loss": -7.101572513580322, "global_step": 184776, "epoch": 4399} {"train_loss": -7.127917766571045, "global_step": 184777, "epoch": 4399} {"train_loss": -7.1546149253845215, "global_step": 184778, "epoch": 4399} {"train_loss": -7.187132835388184, "global_step": 184779, "epoch": 4399} {"train_loss": -7.135516166687012, "global_step": 184780, "epoch": 4399} {"train_loss": -7.118278980255127, "global_step": 184781, "epoch": 4399} {"train_loss": -7.114522933959961, "global_step": 184782, "epoch": 4399} {"train_loss": -7.229617118835449, "global_step": 184783, "epoch": 4399} {"train_loss": -7.098354339599609, "global_step": 184784, "epoch": 4399} {"train_loss": -7.100472927093506, "global_step": 184785, "epoch": 4399} {"train_loss": -7.147499084472656, "global_step": 184786, "epoch": 4399} {"train_loss": -7.195953369140625, "global_step": 184787, "epoch": 4399} {"train_loss": -7.08753776550293, "global_step": 184788, "epoch": 4399} {"train_loss": -7.1652607917785645, "global_step": 184789, "epoch": 4399} {"train_loss": -7.15297794342041, "global_step": 184790, "epoch": 4399} {"train_loss": -7.1388139724731445, "global_step": 184791, "epoch": 4399} {"train_loss": -7.152544021606445, "global_step": 184792, "epoch": 4399} {"train_loss": -7.194025039672852, "global_step": 184793, "epoch": 4399} {"train_loss": -7.162807941436768, "global_step": 184794, "epoch": 4399} {"train_loss": -7.231296539306641, "global_step": 184795, "epoch": 4399} {"train_loss": -7.171448707580566, "global_step": 184796, "epoch": 4399} {"train_loss": -7.260534286499023, "global_step": 184797, "epoch": 4399} {"train_loss": -7.2431511878967285, "global_step": 184798, "epoch": 4399} {"train_loss": -7.139560563223703, "global_step": 184799, "epoch": 4399, "val_loss": 80825.3359375} {"train_loss": -7.129086494445801, "global_step": 184800, "epoch": 4400} {"train_loss": -7.061556816101074, "global_step": 184801, "epoch": 4400} {"train_loss": -7.06500244140625, "global_step": 184802, "epoch": 4400} {"train_loss": -7.152148246765137, "global_step": 184803, "epoch": 4400} {"train_loss": -7.077960968017578, "global_step": 184804, "epoch": 4400} {"train_loss": -7.243967533111572, "global_step": 184805, "epoch": 4400} {"train_loss": -7.197054862976074, "global_step": 184806, "epoch": 4400} {"train_loss": -7.197322368621826, "global_step": 184807, "epoch": 4400} {"train_loss": -7.255638122558594, "global_step": 184808, "epoch": 4400} {"train_loss": -7.179222106933594, "global_step": 184809, "epoch": 4400} {"train_loss": -7.135682106018066, "global_step": 184810, "epoch": 4400} {"train_loss": -7.311478614807129, "global_step": 184811, "epoch": 4400} {"train_loss": -7.152133941650391, "global_step": 184812, "epoch": 4400} {"train_loss": -7.165585041046143, "global_step": 184813, "epoch": 4400} {"train_loss": -7.172797203063965, "global_step": 184814, "epoch": 4400} {"train_loss": -7.077696323394775, "global_step": 184815, "epoch": 4400} {"train_loss": -7.1726484298706055, "global_step": 184816, "epoch": 4400} {"train_loss": -7.166519641876221, "global_step": 184817, "epoch": 4400} {"train_loss": -6.9735188484191895, "global_step": 184818, "epoch": 4400} {"train_loss": -7.129639625549316, "global_step": 184819, "epoch": 4400} {"train_loss": -7.173320770263672, "global_step": 184820, "epoch": 4400} {"train_loss": -7.066523551940918, "global_step": 184821, "epoch": 4400} {"train_loss": -7.161199569702148, "global_step": 184822, "epoch": 4400} {"train_loss": -7.109667778015137, "global_step": 184823, "epoch": 4400} {"train_loss": -7.193160533905029, "global_step": 184824, "epoch": 4400} {"train_loss": -7.177216529846191, "global_step": 184825, "epoch": 4400} {"train_loss": -7.292478084564209, "global_step": 184826, "epoch": 4400} {"train_loss": -7.194498062133789, "global_step": 184827, "epoch": 4400} {"train_loss": -7.191295623779297, "global_step": 184828, "epoch": 4400} {"train_loss": -7.203690528869629, "global_step": 184829, "epoch": 4400} {"train_loss": -7.096762180328369, "global_step": 184830, "epoch": 4400} {"train_loss": -6.991363525390625, "global_step": 184831, "epoch": 4400} {"train_loss": -7.152077674865723, "global_step": 184832, "epoch": 4400} {"train_loss": -7.123288154602051, "global_step": 184833, "epoch": 4400} {"train_loss": -6.968609809875488, "global_step": 184834, "epoch": 4400} {"train_loss": -7.188760280609131, "global_step": 184835, "epoch": 4400} {"train_loss": -7.0316386222839355, "global_step": 184836, "epoch": 4400} {"train_loss": -7.23193359375, "global_step": 184837, "epoch": 4400} {"train_loss": -7.148258209228516, "global_step": 184838, "epoch": 4400} {"train_loss": -7.208719730377197, "global_step": 184839, "epoch": 4400} {"train_loss": -7.168842315673828, "global_step": 184840, "epoch": 4400} {"train_loss": -7.149063337416876, "global_step": 184841, "epoch": 4400, "train/sim_max_reward_0": 0.4219127512073014, "train/sim_max_reward_1": 0.8940427296882196, "train/sim_max_reward_2": 0.573235657456964, "train/sim_max_reward_3": 0.1307198134854566, "train/sim_max_reward_4": 0.9876045274355795, "train/sim_max_reward_5": 0.5747412392840556, "test/sim_max_reward_4500000": 0.9499985269877348, "test/sim_max_reward_4500001": 0.9945268098853306, "test/sim_max_reward_4500002": 0.9037700875171497, "test/sim_max_reward_4500003": 0.6455496934353908, "test/sim_max_reward_4500004": 0.12152095127408169, "test/sim_max_reward_4500005": 0.9204929761406683, "test/sim_max_reward_4500006": 0.9936070028593891, "test/sim_max_reward_4500007": 0.9887029609929368, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.05301379824035588, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.8984083263441027, "test/sim_max_reward_4500012": 0.9663271100242435, "test/sim_max_reward_4500013": 0.006984824858618961, "test/sim_max_reward_4500014": 0.7136362958240614, "test/sim_max_reward_4500015": 0.9167860427240534, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.06344234513644023, "test/sim_max_reward_4500018": 0.7156519384882, "test/sim_max_reward_4500019": 0.9498845905466969, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9853332238247795, "test/sim_max_reward_4500022": 0.9113922767247069, "test/sim_max_reward_4500023": 0.979634659343044, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.7609883438990751, "test/sim_max_reward_4500026": 0.9851889494666709, "test/sim_max_reward_4500027": 0.8453288581227675, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.1316589329094592, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9824503206453977, "test/sim_max_reward_4500034": 0.9010703172373711, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 1.0, "test/sim_max_reward_4500037": 0.9990364062782565, "test/sim_max_reward_4500038": 0.8593310771855605, "test/sim_max_reward_4500039": 0.9809220143754082, "test/sim_max_reward_4500040": 0.9474552302807846, "test/sim_max_reward_4500041": 0.95745153633908, "test/sim_max_reward_4500042": 0.02347475116549851, "test/sim_max_reward_4500043": 0.9712376301173343, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9975032132627116, "test/sim_max_reward_4500046": 0.6868838591978659, "test/sim_max_reward_4500047": 0.0, "test/sim_max_reward_4500048": 0.9960693766431336, "test/sim_max_reward_4500049": 0.9652527727624863, "train/mean_score": 0.5970427864262627, "test/mean_score": 0.6384439827930053, "val_loss": 80846.3125} {"train_loss": -7.13964319229126, "global_step": 184842, "epoch": 4401} {"train_loss": -7.255133152008057, "global_step": 184843, "epoch": 4401} {"train_loss": -7.146804332733154, "global_step": 184844, "epoch": 4401} {"train_loss": -7.271685600280762, "global_step": 184845, "epoch": 4401} {"train_loss": -7.29960823059082, "global_step": 184846, "epoch": 4401} {"train_loss": -7.103153705596924, "global_step": 184847, "epoch": 4401} {"train_loss": -7.254495620727539, "global_step": 184848, "epoch": 4401} {"train_loss": -7.250065803527832, "global_step": 184849, "epoch": 4401} {"train_loss": -7.2822370529174805, "global_step": 184850, "epoch": 4401} {"train_loss": -7.298406600952148, "global_step": 184851, "epoch": 4401} {"train_loss": -7.190682888031006, "global_step": 184852, "epoch": 4401} {"train_loss": -7.241071701049805, "global_step": 184853, "epoch": 4401} {"train_loss": -7.218867778778076, "global_step": 184854, "epoch": 4401} {"train_loss": -7.2173285484313965, "global_step": 184855, "epoch": 4401} {"train_loss": -7.082457542419434, "global_step": 184856, "epoch": 4401} {"train_loss": -7.250850677490234, "global_step": 184857, "epoch": 4401} {"train_loss": -7.058091163635254, "global_step": 184858, "epoch": 4401} {"train_loss": -7.134016036987305, "global_step": 184859, "epoch": 4401} {"train_loss": -7.1180524826049805, "global_step": 184860, "epoch": 4401} {"train_loss": -7.179914474487305, "global_step": 184861, "epoch": 4401} {"train_loss": -7.209336757659912, "global_step": 184862, "epoch": 4401} {"train_loss": -7.165773391723633, "global_step": 184863, "epoch": 4401} {"train_loss": -6.876367568969727, "global_step": 184864, "epoch": 4401} {"train_loss": -7.143047332763672, "global_step": 184865, "epoch": 4401} {"train_loss": -7.059849739074707, "global_step": 184866, "epoch": 4401} {"train_loss": -7.128664970397949, "global_step": 184867, "epoch": 4401} {"train_loss": -7.084613800048828, "global_step": 184868, "epoch": 4401} {"train_loss": -7.143030166625977, "global_step": 184869, "epoch": 4401} {"train_loss": -7.072299003601074, "global_step": 184870, "epoch": 4401} {"train_loss": -7.132256507873535, "global_step": 184871, "epoch": 4401} {"train_loss": -7.1271820068359375, "global_step": 184872, "epoch": 4401} {"train_loss": -7.13191032409668, "global_step": 184873, "epoch": 4401} {"train_loss": -7.189587593078613, "global_step": 184874, "epoch": 4401} {"train_loss": -7.104485511779785, "global_step": 184875, "epoch": 4401} {"train_loss": -7.157177925109863, "global_step": 184876, "epoch": 4401} {"train_loss": -7.24706506729126, "global_step": 184877, "epoch": 4401} {"train_loss": -7.206575393676758, "global_step": 184878, "epoch": 4401} {"train_loss": -7.130532264709473, "global_step": 184879, "epoch": 4401} {"train_loss": -7.191950798034668, "global_step": 184880, "epoch": 4401} {"train_loss": -7.197938919067383, "global_step": 184881, "epoch": 4401} {"train_loss": -7.091418743133545, "global_step": 184882, "epoch": 4401} {"train_loss": -7.166268428166707, "global_step": 184883, "epoch": 4401, "val_loss": 80856.1875} {"train_loss": -7.211916923522949, "global_step": 184884, "epoch": 4402} {"train_loss": -7.188449859619141, "global_step": 184885, "epoch": 4402} {"train_loss": -7.224881172180176, "global_step": 184886, "epoch": 4402} {"train_loss": -7.18170690536499, "global_step": 184887, "epoch": 4402} {"train_loss": -7.163196086883545, "global_step": 184888, "epoch": 4402} {"train_loss": -7.1480536460876465, "global_step": 184889, "epoch": 4402} {"train_loss": -7.182426452636719, "global_step": 184890, "epoch": 4402} {"train_loss": -7.102923393249512, "global_step": 184891, "epoch": 4402} {"train_loss": -7.1976847648620605, "global_step": 184892, "epoch": 4402} {"train_loss": -7.29812479019165, "global_step": 184893, "epoch": 4402} {"train_loss": -7.072261810302734, "global_step": 184894, "epoch": 4402} {"train_loss": -7.205906867980957, "global_step": 184895, "epoch": 4402} {"train_loss": -7.118664264678955, "global_step": 184896, "epoch": 4402} {"train_loss": -7.10293436050415, "global_step": 184897, "epoch": 4402} {"train_loss": -7.122795581817627, "global_step": 184898, "epoch": 4402} {"train_loss": -7.2503228187561035, "global_step": 184899, "epoch": 4402} {"train_loss": -7.223598480224609, "global_step": 184900, "epoch": 4402} {"train_loss": -7.145599365234375, "global_step": 184901, "epoch": 4402} {"train_loss": -7.215242385864258, "global_step": 184902, "epoch": 4402} {"train_loss": -7.2342705726623535, "global_step": 184903, "epoch": 4402} {"train_loss": -7.078670501708984, "global_step": 184904, "epoch": 4402} {"train_loss": -7.117976665496826, "global_step": 184905, "epoch": 4402} {"train_loss": -7.1190667152404785, "global_step": 184906, "epoch": 4402} {"train_loss": -7.090639114379883, "global_step": 184907, "epoch": 4402} {"train_loss": -7.240553855895996, "global_step": 184908, "epoch": 4402} {"train_loss": -7.244634628295898, "global_step": 184909, "epoch": 4402} {"train_loss": -7.266800403594971, "global_step": 184910, "epoch": 4402} {"train_loss": -7.175039768218994, "global_step": 184911, "epoch": 4402} {"train_loss": -7.16366720199585, "global_step": 184912, "epoch": 4402} {"train_loss": -7.206143379211426, "global_step": 184913, "epoch": 4402} {"train_loss": -7.183452606201172, "global_step": 184914, "epoch": 4402} {"train_loss": -7.2426886558532715, "global_step": 184915, "epoch": 4402} {"train_loss": -7.166597366333008, "global_step": 184916, "epoch": 4402} {"train_loss": -7.316062927246094, "global_step": 184917, "epoch": 4402} {"train_loss": -7.190905570983887, "global_step": 184918, "epoch": 4402} {"train_loss": -7.282522201538086, "global_step": 184919, "epoch": 4402} {"train_loss": -7.192889213562012, "global_step": 184920, "epoch": 4402} {"train_loss": -7.188020706176758, "global_step": 184921, "epoch": 4402} {"train_loss": -7.156023979187012, "global_step": 184922, "epoch": 4402} {"train_loss": -7.1953277587890625, "global_step": 184923, "epoch": 4402} {"train_loss": -7.022659778594971, "global_step": 184924, "epoch": 4402} {"train_loss": -7.182677859351749, "global_step": 184925, "epoch": 4402, "val_loss": 80564.109375} {"train_loss": -7.180751323699951, "global_step": 184926, "epoch": 4403} {"train_loss": -7.119051456451416, "global_step": 184927, "epoch": 4403} {"train_loss": -7.169978141784668, "global_step": 184928, "epoch": 4403} {"train_loss": -7.20380973815918, "global_step": 184929, "epoch": 4403} {"train_loss": -7.071577072143555, "global_step": 184930, "epoch": 4403} {"train_loss": -7.141762733459473, "global_step": 184931, "epoch": 4403} {"train_loss": -7.125430583953857, "global_step": 184932, "epoch": 4403} {"train_loss": -7.227296352386475, "global_step": 184933, "epoch": 4403} {"train_loss": -7.1067891120910645, "global_step": 184934, "epoch": 4403} {"train_loss": -7.0108747482299805, "global_step": 184935, "epoch": 4403} {"train_loss": -7.140724182128906, "global_step": 184936, "epoch": 4403} {"train_loss": -7.141103267669678, "global_step": 184937, "epoch": 4403} {"train_loss": -7.15019416809082, "global_step": 184938, "epoch": 4403} {"train_loss": -7.190218925476074, "global_step": 184939, "epoch": 4403} {"train_loss": -7.092385768890381, "global_step": 184940, "epoch": 4403} {"train_loss": -7.106210708618164, "global_step": 184941, "epoch": 4403} {"train_loss": -7.238402366638184, "global_step": 184942, "epoch": 4403} {"train_loss": -7.109163761138916, "global_step": 184943, "epoch": 4403} {"train_loss": -7.101471900939941, "global_step": 184944, "epoch": 4403} {"train_loss": -7.203601837158203, "global_step": 184945, "epoch": 4403} {"train_loss": -7.076759338378906, "global_step": 184946, "epoch": 4403} {"train_loss": -7.173371315002441, "global_step": 184947, "epoch": 4403} {"train_loss": -7.071640491485596, "global_step": 184948, "epoch": 4403} {"train_loss": -7.24929141998291, "global_step": 184949, "epoch": 4403} {"train_loss": -7.2212300300598145, "global_step": 184950, "epoch": 4403} {"train_loss": -7.189279079437256, "global_step": 184951, "epoch": 4403} {"train_loss": -7.2081732749938965, "global_step": 184952, "epoch": 4403} {"train_loss": -7.2080183029174805, "global_step": 184953, "epoch": 4403} {"train_loss": -7.140315055847168, "global_step": 184954, "epoch": 4403} {"train_loss": -7.149565696716309, "global_step": 184955, "epoch": 4403} {"train_loss": -7.195592880249023, "global_step": 184956, "epoch": 4403} {"train_loss": -7.1150407791137695, "global_step": 184957, "epoch": 4403} {"train_loss": -7.299637794494629, "global_step": 184958, "epoch": 4403} {"train_loss": -7.193023681640625, "global_step": 184959, "epoch": 4403} {"train_loss": -7.171487331390381, "global_step": 184960, "epoch": 4403} {"train_loss": -7.218290328979492, "global_step": 184961, "epoch": 4403} {"train_loss": -7.2487335205078125, "global_step": 184962, "epoch": 4403} {"train_loss": -7.203581809997559, "global_step": 184963, "epoch": 4403} {"train_loss": -7.163791656494141, "global_step": 184964, "epoch": 4403} {"train_loss": -7.203540802001953, "global_step": 184965, "epoch": 4403} {"train_loss": -7.2777252197265625, "global_step": 184966, "epoch": 4403} {"train_loss": -7.167799416042509, "global_step": 184967, "epoch": 4403, "val_loss": 80411.578125} {"train_loss": -7.223317623138428, "global_step": 184968, "epoch": 4404} {"train_loss": -7.286498546600342, "global_step": 184969, "epoch": 4404} {"train_loss": -7.179877758026123, "global_step": 184970, "epoch": 4404} {"train_loss": -7.107612609863281, "global_step": 184971, "epoch": 4404} {"train_loss": -7.2195281982421875, "global_step": 184972, "epoch": 4404} {"train_loss": -7.230970859527588, "global_step": 184973, "epoch": 4404} {"train_loss": -7.286982536315918, "global_step": 184974, "epoch": 4404} {"train_loss": -7.151780605316162, "global_step": 184975, "epoch": 4404} {"train_loss": -7.125154972076416, "global_step": 184976, "epoch": 4404} {"train_loss": -7.213106155395508, "global_step": 184977, "epoch": 4404} {"train_loss": -7.313431739807129, "global_step": 184978, "epoch": 4404} {"train_loss": -6.984647750854492, "global_step": 184979, "epoch": 4404} {"train_loss": -7.159730434417725, "global_step": 184980, "epoch": 4404} {"train_loss": -7.167504787445068, "global_step": 184981, "epoch": 4404} {"train_loss": -7.2058024406433105, "global_step": 184982, "epoch": 4404} {"train_loss": -7.19502067565918, "global_step": 184983, "epoch": 4404} {"train_loss": -7.156847953796387, "global_step": 184984, "epoch": 4404} {"train_loss": -7.137650489807129, "global_step": 184985, "epoch": 4404} {"train_loss": -7.127226829528809, "global_step": 184986, "epoch": 4404} {"train_loss": -7.183863639831543, "global_step": 184987, "epoch": 4404} {"train_loss": -7.255157947540283, "global_step": 184988, "epoch": 4404} {"train_loss": -7.287528991699219, "global_step": 184989, "epoch": 4404} {"train_loss": -7.286437511444092, "global_step": 184990, "epoch": 4404} {"train_loss": -7.146265029907227, "global_step": 184991, "epoch": 4404} {"train_loss": -7.174584865570068, "global_step": 184992, "epoch": 4404} {"train_loss": -7.228189468383789, "global_step": 184993, "epoch": 4404} {"train_loss": -7.16930627822876, "global_step": 184994, "epoch": 4404} {"train_loss": -7.176639556884766, "global_step": 184995, "epoch": 4404} {"train_loss": -7.248046875, "global_step": 184996, "epoch": 4404} {"train_loss": -7.230201244354248, "global_step": 184997, "epoch": 4404} {"train_loss": -7.166877269744873, "global_step": 184998, "epoch": 4404} {"train_loss": -7.0950469970703125, "global_step": 184999, "epoch": 4404} {"train_loss": -7.068841934204102, "global_step": 185000, "epoch": 4404} {"train_loss": -7.047453880310059, "global_step": 185001, "epoch": 4404} {"train_loss": -7.202988624572754, "global_step": 185002, "epoch": 4404} {"train_loss": -7.095842361450195, "global_step": 185003, "epoch": 4404} {"train_loss": -7.052506446838379, "global_step": 185004, "epoch": 4404} {"train_loss": -7.185082912445068, "global_step": 185005, "epoch": 4404} {"train_loss": -6.966121673583984, "global_step": 185006, "epoch": 4404} {"train_loss": -6.915399551391602, "global_step": 185007, "epoch": 4404} {"train_loss": -7.006146430969238, "global_step": 185008, "epoch": 4404} {"train_loss": -7.160030569349017, "global_step": 185009, "epoch": 4404, "val_loss": 80678.9140625} {"train_loss": -7.057031154632568, "global_step": 185010, "epoch": 4405} {"train_loss": -6.968640327453613, "global_step": 185011, "epoch": 4405} {"train_loss": -7.146247386932373, "global_step": 185012, "epoch": 4405} {"train_loss": -6.896617889404297, "global_step": 185013, "epoch": 4405} {"train_loss": -6.945980548858643, "global_step": 185014, "epoch": 4405} {"train_loss": -6.991689682006836, "global_step": 185015, "epoch": 4405} {"train_loss": -6.968271255493164, "global_step": 185016, "epoch": 4405} {"train_loss": -7.100777626037598, "global_step": 185017, "epoch": 4405} {"train_loss": -7.095819473266602, "global_step": 185018, "epoch": 4405} {"train_loss": -7.082757949829102, "global_step": 185019, "epoch": 4405} {"train_loss": -7.139340400695801, "global_step": 185020, "epoch": 4405} {"train_loss": -7.0788774490356445, "global_step": 185021, "epoch": 4405} {"train_loss": -7.09781551361084, "global_step": 185022, "epoch": 4405} {"train_loss": -7.164778232574463, "global_step": 185023, "epoch": 4405} {"train_loss": -7.244745254516602, "global_step": 185024, "epoch": 4405} {"train_loss": -7.196343421936035, "global_step": 185025, "epoch": 4405} {"train_loss": -7.067424297332764, "global_step": 185026, "epoch": 4405} {"train_loss": -7.1123046875, "global_step": 185027, "epoch": 4405} {"train_loss": -7.125482559204102, "global_step": 185028, "epoch": 4405} {"train_loss": -7.2316389083862305, "global_step": 185029, "epoch": 4405} {"train_loss": -7.132133960723877, "global_step": 185030, "epoch": 4405} {"train_loss": -7.1794562339782715, "global_step": 185031, "epoch": 4405} {"train_loss": -7.291077613830566, "global_step": 185032, "epoch": 4405} {"train_loss": -7.368408679962158, "global_step": 185033, "epoch": 4405} {"train_loss": -7.146710395812988, "global_step": 185034, "epoch": 4405} {"train_loss": -7.213278770446777, "global_step": 185035, "epoch": 4405} {"train_loss": -7.2299041748046875, "global_step": 185036, "epoch": 4405} {"train_loss": -7.202553749084473, "global_step": 185037, "epoch": 4405} {"train_loss": -7.213431358337402, "global_step": 185038, "epoch": 4405} {"train_loss": -7.174654960632324, "global_step": 185039, "epoch": 4405} {"train_loss": -7.342870712280273, "global_step": 185040, "epoch": 4405} {"train_loss": -7.244839668273926, "global_step": 185041, "epoch": 4405} {"train_loss": -7.136652946472168, "global_step": 185042, "epoch": 4405} {"train_loss": -7.182985305786133, "global_step": 185043, "epoch": 4405} {"train_loss": -7.260456562042236, "global_step": 185044, "epoch": 4405} {"train_loss": -7.207843780517578, "global_step": 185045, "epoch": 4405} {"train_loss": -7.126129150390625, "global_step": 185046, "epoch": 4405} {"train_loss": -7.174097061157227, "global_step": 185047, "epoch": 4405} {"train_loss": -7.32920503616333, "global_step": 185048, "epoch": 4405} {"train_loss": -7.166872978210449, "global_step": 185049, "epoch": 4405} {"train_loss": -7.230164527893066, "global_step": 185050, "epoch": 4405} {"train_loss": -7.1543416522798085, "global_step": 185051, "epoch": 4405, "val_loss": 80565.8046875} {"train_loss": -7.211221694946289, "global_step": 185052, "epoch": 4406} {"train_loss": -7.213868618011475, "global_step": 185053, "epoch": 4406} {"train_loss": -7.269136428833008, "global_step": 185054, "epoch": 4406} {"train_loss": -7.17284631729126, "global_step": 185055, "epoch": 4406} {"train_loss": -7.089312553405762, "global_step": 185056, "epoch": 4406} {"train_loss": -7.265658855438232, "global_step": 185057, "epoch": 4406} {"train_loss": -7.061131000518799, "global_step": 185058, "epoch": 4406} {"train_loss": -7.304888725280762, "global_step": 185059, "epoch": 4406} {"train_loss": -7.2847394943237305, "global_step": 185060, "epoch": 4406} {"train_loss": -7.052585601806641, "global_step": 185061, "epoch": 4406} {"train_loss": -7.151950836181641, "global_step": 185062, "epoch": 4406} {"train_loss": -7.078686714172363, "global_step": 185063, "epoch": 4406} {"train_loss": -7.007773399353027, "global_step": 185064, "epoch": 4406} {"train_loss": -7.1727190017700195, "global_step": 185065, "epoch": 4406} {"train_loss": -7.177641868591309, "global_step": 185066, "epoch": 4406} {"train_loss": -7.062946319580078, "global_step": 185067, "epoch": 4406} {"train_loss": -7.036264419555664, "global_step": 185068, "epoch": 4406} {"train_loss": -7.102755546569824, "global_step": 185069, "epoch": 4406} {"train_loss": -7.203136920928955, "global_step": 185070, "epoch": 4406} {"train_loss": -7.1165385246276855, "global_step": 185071, "epoch": 4406} {"train_loss": -7.099408149719238, "global_step": 185072, "epoch": 4406} {"train_loss": -7.187359809875488, "global_step": 185073, "epoch": 4406} {"train_loss": -7.000087738037109, "global_step": 185074, "epoch": 4406} {"train_loss": -7.131696701049805, "global_step": 185075, "epoch": 4406} {"train_loss": -7.097702980041504, "global_step": 185076, "epoch": 4406} {"train_loss": -6.998588562011719, "global_step": 185077, "epoch": 4406} {"train_loss": -6.9825897216796875, "global_step": 185078, "epoch": 4406} {"train_loss": -7.079283714294434, "global_step": 185079, "epoch": 4406} {"train_loss": -7.043454170227051, "global_step": 185080, "epoch": 4406} {"train_loss": -7.062797546386719, "global_step": 185081, "epoch": 4406} {"train_loss": -7.064484596252441, "global_step": 185082, "epoch": 4406} {"train_loss": -6.911383628845215, "global_step": 185083, "epoch": 4406} {"train_loss": -7.171384811401367, "global_step": 185084, "epoch": 4406} {"train_loss": -7.117724418640137, "global_step": 185085, "epoch": 4406} {"train_loss": -7.038234710693359, "global_step": 185086, "epoch": 4406} {"train_loss": -7.068477630615234, "global_step": 185087, "epoch": 4406} {"train_loss": -6.969391345977783, "global_step": 185088, "epoch": 4406} {"train_loss": -7.14111328125, "global_step": 185089, "epoch": 4406} {"train_loss": -7.114311695098877, "global_step": 185090, "epoch": 4406} {"train_loss": -7.043612480163574, "global_step": 185091, "epoch": 4406} {"train_loss": -7.034381866455078, "global_step": 185092, "epoch": 4406} {"train_loss": -7.1033166363125755, "global_step": 185093, "epoch": 4406, "val_loss": 80931.8671875} {"train_loss": -7.114218711853027, "global_step": 185094, "epoch": 4407} {"train_loss": -6.897494316101074, "global_step": 185095, "epoch": 4407} {"train_loss": -7.178868293762207, "global_step": 185096, "epoch": 4407} {"train_loss": -7.147147178649902, "global_step": 185097, "epoch": 4407} {"train_loss": -7.0774312019348145, "global_step": 185098, "epoch": 4407} {"train_loss": -7.040194511413574, "global_step": 185099, "epoch": 4407} {"train_loss": -7.149348735809326, "global_step": 185100, "epoch": 4407} {"train_loss": -7.055436134338379, "global_step": 185101, "epoch": 4407} {"train_loss": -7.117557525634766, "global_step": 185102, "epoch": 4407} {"train_loss": -7.137790679931641, "global_step": 185103, "epoch": 4407} {"train_loss": -7.0425519943237305, "global_step": 185104, "epoch": 4407} {"train_loss": -7.087994575500488, "global_step": 185105, "epoch": 4407} {"train_loss": -7.160185813903809, "global_step": 185106, "epoch": 4407} {"train_loss": -7.239818096160889, "global_step": 185107, "epoch": 4407} {"train_loss": -7.230988502502441, "global_step": 185108, "epoch": 4407} {"train_loss": -7.24785041809082, "global_step": 185109, "epoch": 4407} {"train_loss": -7.254763603210449, "global_step": 185110, "epoch": 4407} {"train_loss": -7.234138488769531, "global_step": 185111, "epoch": 4407} {"train_loss": -7.0669074058532715, "global_step": 185112, "epoch": 4407} {"train_loss": -7.182835578918457, "global_step": 185113, "epoch": 4407} {"train_loss": -7.122074127197266, "global_step": 185114, "epoch": 4407} {"train_loss": -7.245601654052734, "global_step": 185115, "epoch": 4407} {"train_loss": -7.083857536315918, "global_step": 185116, "epoch": 4407} {"train_loss": -7.0890936851501465, "global_step": 185117, "epoch": 4407} {"train_loss": -7.235443592071533, "global_step": 185118, "epoch": 4407} {"train_loss": -7.113208770751953, "global_step": 185119, "epoch": 4407} {"train_loss": -7.33437967300415, "global_step": 185120, "epoch": 4407} {"train_loss": -7.264969825744629, "global_step": 185121, "epoch": 4407} {"train_loss": -7.087650299072266, "global_step": 185122, "epoch": 4407} {"train_loss": -7.125805377960205, "global_step": 185123, "epoch": 4407} {"train_loss": -7.146551132202148, "global_step": 185124, "epoch": 4407} {"train_loss": -7.155276298522949, "global_step": 185125, "epoch": 4407} {"train_loss": -7.177408218383789, "global_step": 185126, "epoch": 4407} {"train_loss": -7.097156524658203, "global_step": 185127, "epoch": 4407} {"train_loss": -7.149409294128418, "global_step": 185128, "epoch": 4407} {"train_loss": -7.0964155197143555, "global_step": 185129, "epoch": 4407} {"train_loss": -7.058486461639404, "global_step": 185130, "epoch": 4407} {"train_loss": -7.139706611633301, "global_step": 185131, "epoch": 4407} {"train_loss": -7.263591766357422, "global_step": 185132, "epoch": 4407} {"train_loss": -7.147253513336182, "global_step": 185133, "epoch": 4407} {"train_loss": -7.08709716796875, "global_step": 185134, "epoch": 4407} {"train_loss": -7.144749119168236, "global_step": 185135, "epoch": 4407, "val_loss": 80494.5546875} {"train_loss": -7.11369514465332, "global_step": 185136, "epoch": 4408} {"train_loss": -7.191322326660156, "global_step": 185137, "epoch": 4408} {"train_loss": -7.261348724365234, "global_step": 185138, "epoch": 4408} {"train_loss": -7.121780872344971, "global_step": 185139, "epoch": 4408} {"train_loss": -7.1732563972473145, "global_step": 185140, "epoch": 4408} {"train_loss": -7.092447280883789, "global_step": 185141, "epoch": 4408} {"train_loss": -7.249985694885254, "global_step": 185142, "epoch": 4408} {"train_loss": -7.161072731018066, "global_step": 185143, "epoch": 4408} {"train_loss": -7.165142059326172, "global_step": 185144, "epoch": 4408} {"train_loss": -7.199204921722412, "global_step": 185145, "epoch": 4408} {"train_loss": -7.202099800109863, "global_step": 185146, "epoch": 4408} {"train_loss": -7.24631404876709, "global_step": 185147, "epoch": 4408} {"train_loss": -7.1146931648254395, "global_step": 185148, "epoch": 4408} {"train_loss": -7.207414150238037, "global_step": 185149, "epoch": 4408} {"train_loss": -7.189453125, "global_step": 185150, "epoch": 4408} {"train_loss": -6.973979949951172, "global_step": 185151, "epoch": 4408} {"train_loss": -6.983283996582031, "global_step": 185152, "epoch": 4408} {"train_loss": -7.095046043395996, "global_step": 185153, "epoch": 4408} {"train_loss": -7.091534614562988, "global_step": 185154, "epoch": 4408} {"train_loss": -6.922709941864014, "global_step": 185155, "epoch": 4408} {"train_loss": -7.096216201782227, "global_step": 185156, "epoch": 4408} {"train_loss": -6.903675556182861, "global_step": 185157, "epoch": 4408} {"train_loss": -7.026891231536865, "global_step": 185158, "epoch": 4408} {"train_loss": -7.069087028503418, "global_step": 185159, "epoch": 4408} {"train_loss": -7.16903018951416, "global_step": 185160, "epoch": 4408} {"train_loss": -7.135114669799805, "global_step": 185161, "epoch": 4408} {"train_loss": -6.995136260986328, "global_step": 185162, "epoch": 4408} {"train_loss": -7.260133743286133, "global_step": 185163, "epoch": 4408} {"train_loss": -7.163735389709473, "global_step": 185164, "epoch": 4408} {"train_loss": -7.244622230529785, "global_step": 185165, "epoch": 4408} {"train_loss": -7.156556606292725, "global_step": 185166, "epoch": 4408} {"train_loss": -7.163381099700928, "global_step": 185167, "epoch": 4408} {"train_loss": -7.229443550109863, "global_step": 185168, "epoch": 4408} {"train_loss": -7.1067376136779785, "global_step": 185169, "epoch": 4408} {"train_loss": -7.160553932189941, "global_step": 185170, "epoch": 4408} {"train_loss": -7.156302452087402, "global_step": 185171, "epoch": 4408} {"train_loss": -7.236433982849121, "global_step": 185172, "epoch": 4408} {"train_loss": -7.100399017333984, "global_step": 185173, "epoch": 4408} {"train_loss": -7.041485786437988, "global_step": 185174, "epoch": 4408} {"train_loss": -7.195866584777832, "global_step": 185175, "epoch": 4408} {"train_loss": -7.120377063751221, "global_step": 185176, "epoch": 4408} {"train_loss": -7.1381355580829435, "global_step": 185177, "epoch": 4408, "val_loss": 80751.6640625} {"train_loss": -7.284938812255859, "global_step": 185178, "epoch": 4409} {"train_loss": -7.107020378112793, "global_step": 185179, "epoch": 4409} {"train_loss": -7.22821569442749, "global_step": 185180, "epoch": 4409} {"train_loss": -7.0499773025512695, "global_step": 185181, "epoch": 4409} {"train_loss": -7.092074394226074, "global_step": 185182, "epoch": 4409} {"train_loss": -7.091667652130127, "global_step": 185183, "epoch": 4409} {"train_loss": -7.2109375, "global_step": 185184, "epoch": 4409} {"train_loss": -7.0861921310424805, "global_step": 185185, "epoch": 4409} {"train_loss": -7.188227653503418, "global_step": 185186, "epoch": 4409} {"train_loss": -7.136300086975098, "global_step": 185187, "epoch": 4409} {"train_loss": -7.0638604164123535, "global_step": 185188, "epoch": 4409} {"train_loss": -7.224987983703613, "global_step": 185189, "epoch": 4409} {"train_loss": -7.124804496765137, "global_step": 185190, "epoch": 4409} {"train_loss": -7.122158527374268, "global_step": 185191, "epoch": 4409} {"train_loss": -7.208717346191406, "global_step": 185192, "epoch": 4409} {"train_loss": -7.099448204040527, "global_step": 185193, "epoch": 4409} {"train_loss": -7.213983535766602, "global_step": 185194, "epoch": 4409} {"train_loss": -7.198772430419922, "global_step": 185195, "epoch": 4409} {"train_loss": -7.205829620361328, "global_step": 185196, "epoch": 4409} {"train_loss": -7.139703750610352, "global_step": 185197, "epoch": 4409} {"train_loss": -7.219703674316406, "global_step": 185198, "epoch": 4409} {"train_loss": -7.226366996765137, "global_step": 185199, "epoch": 4409} {"train_loss": -7.135919570922852, "global_step": 185200, "epoch": 4409} {"train_loss": -7.207254886627197, "global_step": 185201, "epoch": 4409} {"train_loss": -7.165182590484619, "global_step": 185202, "epoch": 4409} {"train_loss": -7.07914400100708, "global_step": 185203, "epoch": 4409} {"train_loss": -7.210465431213379, "global_step": 185204, "epoch": 4409} {"train_loss": -7.199702262878418, "global_step": 185205, "epoch": 4409} {"train_loss": -7.121737480163574, "global_step": 185206, "epoch": 4409} {"train_loss": -7.182139873504639, "global_step": 185207, "epoch": 4409} {"train_loss": -7.134731292724609, "global_step": 185208, "epoch": 4409} {"train_loss": -7.143348693847656, "global_step": 185209, "epoch": 4409} {"train_loss": -7.197452545166016, "global_step": 185210, "epoch": 4409} {"train_loss": -7.048517227172852, "global_step": 185211, "epoch": 4409} {"train_loss": -7.149672508239746, "global_step": 185212, "epoch": 4409} {"train_loss": -7.143213272094727, "global_step": 185213, "epoch": 4409} {"train_loss": -7.082612037658691, "global_step": 185214, "epoch": 4409} {"train_loss": -7.186017036437988, "global_step": 185215, "epoch": 4409} {"train_loss": -7.050694465637207, "global_step": 185216, "epoch": 4409} {"train_loss": -7.082761764526367, "global_step": 185217, "epoch": 4409} {"train_loss": -6.909152507781982, "global_step": 185218, "epoch": 4409} {"train_loss": -7.141672929128011, "global_step": 185219, "epoch": 4409, "val_loss": 80740.5625} {"train_loss": -7.072209358215332, "global_step": 185220, "epoch": 4410} {"train_loss": -7.025411605834961, "global_step": 185221, "epoch": 4410} {"train_loss": -7.0785932540893555, "global_step": 185222, "epoch": 4410} {"train_loss": -6.981884956359863, "global_step": 185223, "epoch": 4410} {"train_loss": -7.161435127258301, "global_step": 185224, "epoch": 4410} {"train_loss": -7.09811544418335, "global_step": 185225, "epoch": 4410} {"train_loss": -7.1501922607421875, "global_step": 185226, "epoch": 4410} {"train_loss": -7.042499542236328, "global_step": 185227, "epoch": 4410} {"train_loss": -7.237031936645508, "global_step": 185228, "epoch": 4410} {"train_loss": -7.163577079772949, "global_step": 185229, "epoch": 4410} {"train_loss": -7.078254699707031, "global_step": 185230, "epoch": 4410} {"train_loss": -7.185341835021973, "global_step": 185231, "epoch": 4410} {"train_loss": -7.0902605056762695, "global_step": 185232, "epoch": 4410} {"train_loss": -7.13358211517334, "global_step": 185233, "epoch": 4410} {"train_loss": -6.976675987243652, "global_step": 185234, "epoch": 4410} {"train_loss": -7.10787296295166, "global_step": 185235, "epoch": 4410} {"train_loss": -6.973466873168945, "global_step": 185236, "epoch": 4410} {"train_loss": -7.140074253082275, "global_step": 185237, "epoch": 4410} {"train_loss": -7.068282127380371, "global_step": 185238, "epoch": 4410} {"train_loss": -7.126328468322754, "global_step": 185239, "epoch": 4410} {"train_loss": -7.154669761657715, "global_step": 185240, "epoch": 4410} {"train_loss": -7.14001989364624, "global_step": 185241, "epoch": 4410} {"train_loss": -7.156335353851318, "global_step": 185242, "epoch": 4410} {"train_loss": -6.989776134490967, "global_step": 185243, "epoch": 4410} {"train_loss": -7.238009452819824, "global_step": 185244, "epoch": 4410} {"train_loss": -7.034364700317383, "global_step": 185245, "epoch": 4410} {"train_loss": -7.15140438079834, "global_step": 185246, "epoch": 4410} {"train_loss": -6.938791275024414, "global_step": 185247, "epoch": 4410} {"train_loss": -7.135557174682617, "global_step": 185248, "epoch": 4410} {"train_loss": -7.14401912689209, "global_step": 185249, "epoch": 4410} {"train_loss": -6.994567394256592, "global_step": 185250, "epoch": 4410} {"train_loss": -7.116033554077148, "global_step": 185251, "epoch": 4410} {"train_loss": -7.092947006225586, "global_step": 185252, "epoch": 4410} {"train_loss": -7.026245594024658, "global_step": 185253, "epoch": 4410} {"train_loss": -7.067540168762207, "global_step": 185254, "epoch": 4410} {"train_loss": -7.076351165771484, "global_step": 185255, "epoch": 4410} {"train_loss": -6.944610595703125, "global_step": 185256, "epoch": 4410} {"train_loss": -7.023615837097168, "global_step": 185257, "epoch": 4410} {"train_loss": -7.007180213928223, "global_step": 185258, "epoch": 4410} {"train_loss": -7.083556175231934, "global_step": 185259, "epoch": 4410} {"train_loss": -7.070717811584473, "global_step": 185260, "epoch": 4410} {"train_loss": -7.085040875843593, "global_step": 185261, "epoch": 4410, "val_loss": 80890.1796875} {"train_loss": -7.14681339263916, "global_step": 185262, "epoch": 4411} {"train_loss": -7.108766555786133, "global_step": 185263, "epoch": 4411} {"train_loss": -7.16386604309082, "global_step": 185264, "epoch": 4411} {"train_loss": -7.198925018310547, "global_step": 185265, "epoch": 4411} {"train_loss": -7.169548988342285, "global_step": 185266, "epoch": 4411} {"train_loss": -7.252006530761719, "global_step": 185267, "epoch": 4411} {"train_loss": -7.093007564544678, "global_step": 185268, "epoch": 4411} {"train_loss": -7.178846836090088, "global_step": 185269, "epoch": 4411} {"train_loss": -7.046722412109375, "global_step": 185270, "epoch": 4411} {"train_loss": -7.138420581817627, "global_step": 185271, "epoch": 4411} {"train_loss": -7.005563259124756, "global_step": 185272, "epoch": 4411} {"train_loss": -7.218197822570801, "global_step": 185273, "epoch": 4411} {"train_loss": -7.126299858093262, "global_step": 185274, "epoch": 4411} {"train_loss": -7.186789035797119, "global_step": 185275, "epoch": 4411} {"train_loss": -6.992142200469971, "global_step": 185276, "epoch": 4411} {"train_loss": -7.026309967041016, "global_step": 185277, "epoch": 4411} {"train_loss": -7.240198135375977, "global_step": 185278, "epoch": 4411} {"train_loss": -7.068188190460205, "global_step": 185279, "epoch": 4411} {"train_loss": -7.164947032928467, "global_step": 185280, "epoch": 4411} {"train_loss": -7.137972831726074, "global_step": 185281, "epoch": 4411} {"train_loss": -7.046599388122559, "global_step": 185282, "epoch": 4411} {"train_loss": -7.122745990753174, "global_step": 185283, "epoch": 4411} {"train_loss": -7.131964683532715, "global_step": 185284, "epoch": 4411} {"train_loss": -7.1466288566589355, "global_step": 185285, "epoch": 4411} {"train_loss": -7.185942649841309, "global_step": 185286, "epoch": 4411} {"train_loss": -7.1949543952941895, "global_step": 185287, "epoch": 4411} {"train_loss": -7.202914237976074, "global_step": 185288, "epoch": 4411} {"train_loss": -7.248111724853516, "global_step": 185289, "epoch": 4411} {"train_loss": -7.0120649337768555, "global_step": 185290, "epoch": 4411} {"train_loss": -7.087198257446289, "global_step": 185291, "epoch": 4411} {"train_loss": -7.110681056976318, "global_step": 185292, "epoch": 4411} {"train_loss": -7.158141136169434, "global_step": 185293, "epoch": 4411} {"train_loss": -7.050429344177246, "global_step": 185294, "epoch": 4411} {"train_loss": -7.090087890625, "global_step": 185295, "epoch": 4411} {"train_loss": -7.0808258056640625, "global_step": 185296, "epoch": 4411} {"train_loss": -7.084816932678223, "global_step": 185297, "epoch": 4411} {"train_loss": -7.182760238647461, "global_step": 185298, "epoch": 4411} {"train_loss": -7.1255364418029785, "global_step": 185299, "epoch": 4411} {"train_loss": -7.112669944763184, "global_step": 185300, "epoch": 4411} {"train_loss": -7.091494560241699, "global_step": 185301, "epoch": 4411} {"train_loss": -7.206671237945557, "global_step": 185302, "epoch": 4411} {"train_loss": -7.130749236969721, "global_step": 185303, "epoch": 4411, "val_loss": 80758.2890625} {"train_loss": -7.163725852966309, "global_step": 185304, "epoch": 4412} {"train_loss": -7.089916229248047, "global_step": 185305, "epoch": 4412} {"train_loss": -7.220423698425293, "global_step": 185306, "epoch": 4412} {"train_loss": -7.200038909912109, "global_step": 185307, "epoch": 4412} {"train_loss": -7.244697570800781, "global_step": 185308, "epoch": 4412} {"train_loss": -7.188723087310791, "global_step": 185309, "epoch": 4412} {"train_loss": -7.2826385498046875, "global_step": 185310, "epoch": 4412} {"train_loss": -7.294196128845215, "global_step": 185311, "epoch": 4412} {"train_loss": -7.204995155334473, "global_step": 185312, "epoch": 4412} {"train_loss": -7.296204566955566, "global_step": 185313, "epoch": 4412} {"train_loss": -7.217551231384277, "global_step": 185314, "epoch": 4412} {"train_loss": -7.250070095062256, "global_step": 185315, "epoch": 4412} {"train_loss": -7.227956771850586, "global_step": 185316, "epoch": 4412} {"train_loss": -7.099023818969727, "global_step": 185317, "epoch": 4412} {"train_loss": -7.1041436195373535, "global_step": 185318, "epoch": 4412} {"train_loss": -7.160228729248047, "global_step": 185319, "epoch": 4412} {"train_loss": -7.132248878479004, "global_step": 185320, "epoch": 4412} {"train_loss": -7.070401191711426, "global_step": 185321, "epoch": 4412} {"train_loss": -7.166329383850098, "global_step": 185322, "epoch": 4412} {"train_loss": -7.171014785766602, "global_step": 185323, "epoch": 4412} {"train_loss": -7.105051517486572, "global_step": 185324, "epoch": 4412} {"train_loss": -7.187302589416504, "global_step": 185325, "epoch": 4412} {"train_loss": -7.126808166503906, "global_step": 185326, "epoch": 4412} {"train_loss": -7.1237287521362305, "global_step": 185327, "epoch": 4412} {"train_loss": -7.234319686889648, "global_step": 185328, "epoch": 4412} {"train_loss": -7.236412048339844, "global_step": 185329, "epoch": 4412} {"train_loss": -7.245724678039551, "global_step": 185330, "epoch": 4412} {"train_loss": -7.22243595123291, "global_step": 185331, "epoch": 4412} {"train_loss": -7.257131099700928, "global_step": 185332, "epoch": 4412} {"train_loss": -7.251105308532715, "global_step": 185333, "epoch": 4412} {"train_loss": -7.192405700683594, "global_step": 185334, "epoch": 4412} {"train_loss": -7.27121639251709, "global_step": 185335, "epoch": 4412} {"train_loss": -7.193368911743164, "global_step": 185336, "epoch": 4412} {"train_loss": -7.158529758453369, "global_step": 185337, "epoch": 4412} {"train_loss": -7.192842483520508, "global_step": 185338, "epoch": 4412} {"train_loss": -7.2438459396362305, "global_step": 185339, "epoch": 4412} {"train_loss": -7.111424446105957, "global_step": 185340, "epoch": 4412} {"train_loss": -7.230422019958496, "global_step": 185341, "epoch": 4412} {"train_loss": -7.250940799713135, "global_step": 185342, "epoch": 4412} {"train_loss": -7.252839088439941, "global_step": 185343, "epoch": 4412} {"train_loss": -7.314558506011963, "global_step": 185344, "epoch": 4412} {"train_loss": -7.200221549896967, "global_step": 185345, "epoch": 4412, "val_loss": 80779.4375} {"train_loss": -7.1156744956970215, "global_step": 185346, "epoch": 4413} {"train_loss": -7.207335472106934, "global_step": 185347, "epoch": 4413} {"train_loss": -7.2430830001831055, "global_step": 185348, "epoch": 4413} {"train_loss": -7.142640590667725, "global_step": 185349, "epoch": 4413} {"train_loss": -7.290323257446289, "global_step": 185350, "epoch": 4413} {"train_loss": -7.216168403625488, "global_step": 185351, "epoch": 4413} {"train_loss": -7.135668754577637, "global_step": 185352, "epoch": 4413} {"train_loss": -7.231263637542725, "global_step": 185353, "epoch": 4413} {"train_loss": -7.20393180847168, "global_step": 185354, "epoch": 4413} {"train_loss": -7.124242305755615, "global_step": 185355, "epoch": 4413} {"train_loss": -7.222623348236084, "global_step": 185356, "epoch": 4413} {"train_loss": -7.295807838439941, "global_step": 185357, "epoch": 4413} {"train_loss": -7.243153095245361, "global_step": 185358, "epoch": 4413} {"train_loss": -7.126275062561035, "global_step": 185359, "epoch": 4413} {"train_loss": -7.252394676208496, "global_step": 185360, "epoch": 4413} {"train_loss": -7.23324728012085, "global_step": 185361, "epoch": 4413} {"train_loss": -7.11175537109375, "global_step": 185362, "epoch": 4413} {"train_loss": -7.173460960388184, "global_step": 185363, "epoch": 4413} {"train_loss": -7.186404228210449, "global_step": 185364, "epoch": 4413} {"train_loss": -6.970929145812988, "global_step": 185365, "epoch": 4413} {"train_loss": -7.160592079162598, "global_step": 185366, "epoch": 4413} {"train_loss": -7.080137252807617, "global_step": 185367, "epoch": 4413} {"train_loss": -7.138420104980469, "global_step": 185368, "epoch": 4413} {"train_loss": -7.142786026000977, "global_step": 185369, "epoch": 4413} {"train_loss": -7.174363613128662, "global_step": 185370, "epoch": 4413} {"train_loss": -7.172661781311035, "global_step": 185371, "epoch": 4413} {"train_loss": -7.30654764175415, "global_step": 185372, "epoch": 4413} {"train_loss": -7.125101566314697, "global_step": 185373, "epoch": 4413} {"train_loss": -7.155059814453125, "global_step": 185374, "epoch": 4413} {"train_loss": -7.210049152374268, "global_step": 185375, "epoch": 4413} {"train_loss": -7.093145847320557, "global_step": 185376, "epoch": 4413} {"train_loss": -7.263418197631836, "global_step": 185377, "epoch": 4413} {"train_loss": -7.180751800537109, "global_step": 185378, "epoch": 4413} {"train_loss": -7.255016326904297, "global_step": 185379, "epoch": 4413} {"train_loss": -7.163661479949951, "global_step": 185380, "epoch": 4413} {"train_loss": -7.151484489440918, "global_step": 185381, "epoch": 4413} {"train_loss": -7.045192718505859, "global_step": 185382, "epoch": 4413} {"train_loss": -7.210448265075684, "global_step": 185383, "epoch": 4413} {"train_loss": -7.206565856933594, "global_step": 185384, "epoch": 4413} {"train_loss": -7.202668190002441, "global_step": 185385, "epoch": 4413} {"train_loss": -7.235262870788574, "global_step": 185386, "epoch": 4413} {"train_loss": -7.183664480845134, "global_step": 185387, "epoch": 4413, "val_loss": 80699.2421875} {"train_loss": -7.233885765075684, "global_step": 185388, "epoch": 4414} {"train_loss": -7.246979236602783, "global_step": 185389, "epoch": 4414} {"train_loss": -7.196885108947754, "global_step": 185390, "epoch": 4414} {"train_loss": -7.2548112869262695, "global_step": 185391, "epoch": 4414} {"train_loss": -7.173131942749023, "global_step": 185392, "epoch": 4414} {"train_loss": -7.208643913269043, "global_step": 185393, "epoch": 4414} {"train_loss": -7.076363563537598, "global_step": 185394, "epoch": 4414} {"train_loss": -7.198176383972168, "global_step": 185395, "epoch": 4414} {"train_loss": -7.210561752319336, "global_step": 185396, "epoch": 4414} {"train_loss": -7.260281085968018, "global_step": 185397, "epoch": 4414} {"train_loss": -7.143281936645508, "global_step": 185398, "epoch": 4414} {"train_loss": -7.090434551239014, "global_step": 185399, "epoch": 4414} {"train_loss": -7.046473026275635, "global_step": 185400, "epoch": 4414} {"train_loss": -7.163839340209961, "global_step": 185401, "epoch": 4414} {"train_loss": -7.267485618591309, "global_step": 185402, "epoch": 4414} {"train_loss": -7.3309736251831055, "global_step": 185403, "epoch": 4414} {"train_loss": -7.115523815155029, "global_step": 185404, "epoch": 4414} {"train_loss": -7.284200668334961, "global_step": 185405, "epoch": 4414} {"train_loss": -7.188017845153809, "global_step": 185406, "epoch": 4414} {"train_loss": -7.131534576416016, "global_step": 185407, "epoch": 4414} {"train_loss": -7.209403991699219, "global_step": 185408, "epoch": 4414} {"train_loss": -7.126228332519531, "global_step": 185409, "epoch": 4414} {"train_loss": -7.143442153930664, "global_step": 185410, "epoch": 4414} {"train_loss": -7.205968856811523, "global_step": 185411, "epoch": 4414} {"train_loss": -7.122804641723633, "global_step": 185412, "epoch": 4414} {"train_loss": -7.122381210327148, "global_step": 185413, "epoch": 4414} {"train_loss": -7.146875858306885, "global_step": 185414, "epoch": 4414} {"train_loss": -7.100440979003906, "global_step": 185415, "epoch": 4414} {"train_loss": -7.283862590789795, "global_step": 185416, "epoch": 4414} {"train_loss": -7.141819477081299, "global_step": 185417, "epoch": 4414} {"train_loss": -7.185447692871094, "global_step": 185418, "epoch": 4414} {"train_loss": -7.096739292144775, "global_step": 185419, "epoch": 4414} {"train_loss": -7.091859817504883, "global_step": 185420, "epoch": 4414} {"train_loss": -7.104133605957031, "global_step": 185421, "epoch": 4414} {"train_loss": -7.0251264572143555, "global_step": 185422, "epoch": 4414} {"train_loss": -7.223838806152344, "global_step": 185423, "epoch": 4414} {"train_loss": -7.1521196365356445, "global_step": 185424, "epoch": 4414} {"train_loss": -7.123257637023926, "global_step": 185425, "epoch": 4414} {"train_loss": -7.183757781982422, "global_step": 185426, "epoch": 4414} {"train_loss": -7.129281997680664, "global_step": 185427, "epoch": 4414} {"train_loss": -7.074008941650391, "global_step": 185428, "epoch": 4414} {"train_loss": -7.16515208425976, "global_step": 185429, "epoch": 4414, "val_loss": 80707.9453125} {"train_loss": -7.144059658050537, "global_step": 185430, "epoch": 4415} {"train_loss": -7.247779369354248, "global_step": 185431, "epoch": 4415} {"train_loss": -7.183688163757324, "global_step": 185432, "epoch": 4415} {"train_loss": -7.06304931640625, "global_step": 185433, "epoch": 4415} {"train_loss": -7.141179084777832, "global_step": 185434, "epoch": 4415} {"train_loss": -7.193440914154053, "global_step": 185435, "epoch": 4415} {"train_loss": -7.033968448638916, "global_step": 185436, "epoch": 4415} {"train_loss": -7.237637519836426, "global_step": 185437, "epoch": 4415} {"train_loss": -7.112367153167725, "global_step": 185438, "epoch": 4415} {"train_loss": -7.125106334686279, "global_step": 185439, "epoch": 4415} {"train_loss": -7.152866363525391, "global_step": 185440, "epoch": 4415} {"train_loss": -7.146413803100586, "global_step": 185441, "epoch": 4415} {"train_loss": -7.1342878341674805, "global_step": 185442, "epoch": 4415} {"train_loss": -7.262637615203857, "global_step": 185443, "epoch": 4415} {"train_loss": -7.083627700805664, "global_step": 185444, "epoch": 4415} {"train_loss": -7.184261798858643, "global_step": 185445, "epoch": 4415} {"train_loss": -7.11804723739624, "global_step": 185446, "epoch": 4415} {"train_loss": -7.223783493041992, "global_step": 185447, "epoch": 4415} {"train_loss": -7.135451316833496, "global_step": 185448, "epoch": 4415} {"train_loss": -7.146372318267822, "global_step": 185449, "epoch": 4415} {"train_loss": -7.166203498840332, "global_step": 185450, "epoch": 4415} {"train_loss": -7.043898582458496, "global_step": 185451, "epoch": 4415} {"train_loss": -6.962845802307129, "global_step": 185452, "epoch": 4415} {"train_loss": -7.198187828063965, "global_step": 185453, "epoch": 4415} {"train_loss": -7.185877799987793, "global_step": 185454, "epoch": 4415} {"train_loss": -7.14037561416626, "global_step": 185455, "epoch": 4415} {"train_loss": -7.128520965576172, "global_step": 185456, "epoch": 4415} {"train_loss": -7.209933757781982, "global_step": 185457, "epoch": 4415} {"train_loss": -7.164004325866699, "global_step": 185458, "epoch": 4415} {"train_loss": -7.14434814453125, "global_step": 185459, "epoch": 4415} {"train_loss": -7.107151985168457, "global_step": 185460, "epoch": 4415} {"train_loss": -7.232206344604492, "global_step": 185461, "epoch": 4415} {"train_loss": -7.134167671203613, "global_step": 185462, "epoch": 4415} {"train_loss": -7.204827785491943, "global_step": 185463, "epoch": 4415} {"train_loss": -7.15522575378418, "global_step": 185464, "epoch": 4415} {"train_loss": -7.105878829956055, "global_step": 185465, "epoch": 4415} {"train_loss": -7.117598533630371, "global_step": 185466, "epoch": 4415} {"train_loss": -7.183978080749512, "global_step": 185467, "epoch": 4415} {"train_loss": -7.2868876457214355, "global_step": 185468, "epoch": 4415} {"train_loss": -7.282138824462891, "global_step": 185469, "epoch": 4415} {"train_loss": -7.125023365020752, "global_step": 185470, "epoch": 4415} {"train_loss": -7.1561858881087534, "global_step": 185471, "epoch": 4415, "val_loss": 80836.7109375} {"train_loss": -7.207760810852051, "global_step": 185472, "epoch": 4416} {"train_loss": -7.224122524261475, "global_step": 185473, "epoch": 4416} {"train_loss": -7.204418659210205, "global_step": 185474, "epoch": 4416} {"train_loss": -7.19492769241333, "global_step": 185475, "epoch": 4416} {"train_loss": -7.281207084655762, "global_step": 185476, "epoch": 4416} {"train_loss": -7.1598711013793945, "global_step": 185477, "epoch": 4416} {"train_loss": -7.091316223144531, "global_step": 185478, "epoch": 4416} {"train_loss": -7.209024429321289, "global_step": 185479, "epoch": 4416} {"train_loss": -7.216271877288818, "global_step": 185480, "epoch": 4416} {"train_loss": -7.1780009269714355, "global_step": 185481, "epoch": 4416} {"train_loss": -7.274085998535156, "global_step": 185482, "epoch": 4416} {"train_loss": -7.227855682373047, "global_step": 185483, "epoch": 4416} {"train_loss": -7.2397565841674805, "global_step": 185484, "epoch": 4416} {"train_loss": -7.263137340545654, "global_step": 185485, "epoch": 4416} {"train_loss": -7.172440528869629, "global_step": 185486, "epoch": 4416} {"train_loss": -7.162351608276367, "global_step": 185487, "epoch": 4416} {"train_loss": -7.134855270385742, "global_step": 185488, "epoch": 4416} {"train_loss": -7.198522567749023, "global_step": 185489, "epoch": 4416} {"train_loss": -7.207057476043701, "global_step": 185490, "epoch": 4416} {"train_loss": -7.170142650604248, "global_step": 185491, "epoch": 4416} {"train_loss": -7.188583850860596, "global_step": 185492, "epoch": 4416} {"train_loss": -7.192248344421387, "global_step": 185493, "epoch": 4416} {"train_loss": -7.193624019622803, "global_step": 185494, "epoch": 4416} {"train_loss": -7.164150238037109, "global_step": 185495, "epoch": 4416} {"train_loss": -7.135660171508789, "global_step": 185496, "epoch": 4416} {"train_loss": -7.298715591430664, "global_step": 185497, "epoch": 4416} {"train_loss": -7.078248500823975, "global_step": 185498, "epoch": 4416} {"train_loss": -7.206830978393555, "global_step": 185499, "epoch": 4416} {"train_loss": -7.129439353942871, "global_step": 185500, "epoch": 4416} {"train_loss": -7.2305779457092285, "global_step": 185501, "epoch": 4416} {"train_loss": -7.2630391120910645, "global_step": 185502, "epoch": 4416} {"train_loss": -7.214041709899902, "global_step": 185503, "epoch": 4416} {"train_loss": -7.196577072143555, "global_step": 185504, "epoch": 4416} {"train_loss": -7.381659507751465, "global_step": 185505, "epoch": 4416} {"train_loss": -7.172308921813965, "global_step": 185506, "epoch": 4416} {"train_loss": -7.238012313842773, "global_step": 185507, "epoch": 4416} {"train_loss": -7.267120361328125, "global_step": 185508, "epoch": 4416} {"train_loss": -7.161838531494141, "global_step": 185509, "epoch": 4416} {"train_loss": -7.088832378387451, "global_step": 185510, "epoch": 4416} {"train_loss": -7.201747417449951, "global_step": 185511, "epoch": 4416} {"train_loss": -7.1803483963012695, "global_step": 185512, "epoch": 4416} {"train_loss": -7.1959760302589055, "global_step": 185513, "epoch": 4416, "val_loss": 80909.0546875} {"train_loss": -7.072851181030273, "global_step": 185514, "epoch": 4417} {"train_loss": -7.116851806640625, "global_step": 185515, "epoch": 4417} {"train_loss": -7.03068733215332, "global_step": 185516, "epoch": 4417} {"train_loss": -7.008119106292725, "global_step": 185517, "epoch": 4417} {"train_loss": -7.19795036315918, "global_step": 185518, "epoch": 4417} {"train_loss": -7.200301170349121, "global_step": 185519, "epoch": 4417} {"train_loss": -7.075740814208984, "global_step": 185520, "epoch": 4417} {"train_loss": -7.154741287231445, "global_step": 185521, "epoch": 4417} {"train_loss": -7.171056747436523, "global_step": 185522, "epoch": 4417} {"train_loss": -7.097527503967285, "global_step": 185523, "epoch": 4417} {"train_loss": -7.0675740242004395, "global_step": 185524, "epoch": 4417} {"train_loss": -7.177588939666748, "global_step": 185525, "epoch": 4417} {"train_loss": -7.202699661254883, "global_step": 185526, "epoch": 4417} {"train_loss": -7.0631608963012695, "global_step": 185527, "epoch": 4417} {"train_loss": -7.1188812255859375, "global_step": 185528, "epoch": 4417} {"train_loss": -7.22647762298584, "global_step": 185529, "epoch": 4417} {"train_loss": -7.007262229919434, "global_step": 185530, "epoch": 4417} {"train_loss": -7.091135025024414, "global_step": 185531, "epoch": 4417} {"train_loss": -7.173733711242676, "global_step": 185532, "epoch": 4417} {"train_loss": -7.105752944946289, "global_step": 185533, "epoch": 4417} {"train_loss": -7.025639533996582, "global_step": 185534, "epoch": 4417} {"train_loss": -7.08920955657959, "global_step": 185535, "epoch": 4417} {"train_loss": -7.184015274047852, "global_step": 185536, "epoch": 4417} {"train_loss": -7.103670120239258, "global_step": 185537, "epoch": 4417} {"train_loss": -7.071061134338379, "global_step": 185538, "epoch": 4417} {"train_loss": -7.006533145904541, "global_step": 185539, "epoch": 4417} {"train_loss": -6.977303504943848, "global_step": 185540, "epoch": 4417} {"train_loss": -7.1668171882629395, "global_step": 185541, "epoch": 4417} {"train_loss": -7.113245010375977, "global_step": 185542, "epoch": 4417} {"train_loss": -7.198239803314209, "global_step": 185543, "epoch": 4417} {"train_loss": -6.982300758361816, "global_step": 185544, "epoch": 4417} {"train_loss": -7.223882675170898, "global_step": 185545, "epoch": 4417} {"train_loss": -7.111473083496094, "global_step": 185546, "epoch": 4417} {"train_loss": -7.070613861083984, "global_step": 185547, "epoch": 4417} {"train_loss": -7.060065746307373, "global_step": 185548, "epoch": 4417} {"train_loss": -7.135342597961426, "global_step": 185549, "epoch": 4417} {"train_loss": -6.868368148803711, "global_step": 185550, "epoch": 4417} {"train_loss": -7.081019878387451, "global_step": 185551, "epoch": 4417} {"train_loss": -7.052219390869141, "global_step": 185552, "epoch": 4417} {"train_loss": -7.1935014724731445, "global_step": 185553, "epoch": 4417} {"train_loss": -7.007092475891113, "global_step": 185554, "epoch": 4417} {"train_loss": -7.099811905906314, "global_step": 185555, "epoch": 4417, "val_loss": 80595.90625} {"train_loss": -7.031832695007324, "global_step": 185556, "epoch": 4418} {"train_loss": -7.117031574249268, "global_step": 185557, "epoch": 4418} {"train_loss": -7.082764625549316, "global_step": 185558, "epoch": 4418} {"train_loss": -7.013483047485352, "global_step": 185559, "epoch": 4418} {"train_loss": -7.137694358825684, "global_step": 185560, "epoch": 4418} {"train_loss": -7.1050615310668945, "global_step": 185561, "epoch": 4418} {"train_loss": -7.17344856262207, "global_step": 185562, "epoch": 4418} {"train_loss": -7.198957920074463, "global_step": 185563, "epoch": 4418} {"train_loss": -7.135471343994141, "global_step": 185564, "epoch": 4418} {"train_loss": -7.0397539138793945, "global_step": 185565, "epoch": 4418} {"train_loss": -7.297364711761475, "global_step": 185566, "epoch": 4418} {"train_loss": -7.22464656829834, "global_step": 185567, "epoch": 4418} {"train_loss": -7.12468957901001, "global_step": 185568, "epoch": 4418} {"train_loss": -7.183152198791504, "global_step": 185569, "epoch": 4418} {"train_loss": -7.130671501159668, "global_step": 185570, "epoch": 4418} {"train_loss": -7.108279228210449, "global_step": 185571, "epoch": 4418} {"train_loss": -7.147132873535156, "global_step": 185572, "epoch": 4418} {"train_loss": -7.120710849761963, "global_step": 185573, "epoch": 4418} {"train_loss": -7.16584587097168, "global_step": 185574, "epoch": 4418} {"train_loss": -7.187752723693848, "global_step": 185575, "epoch": 4418} {"train_loss": -7.14137077331543, "global_step": 185576, "epoch": 4418} {"train_loss": -7.2427167892456055, "global_step": 185577, "epoch": 4418} {"train_loss": -7.167442321777344, "global_step": 185578, "epoch": 4418} {"train_loss": -7.312726020812988, "global_step": 185579, "epoch": 4418} {"train_loss": -7.313056468963623, "global_step": 185580, "epoch": 4418} {"train_loss": -7.281712532043457, "global_step": 185581, "epoch": 4418} {"train_loss": -7.152870178222656, "global_step": 185582, "epoch": 4418} {"train_loss": -7.2830281257629395, "global_step": 185583, "epoch": 4418} {"train_loss": -7.2002081871032715, "global_step": 185584, "epoch": 4418} {"train_loss": -7.217865943908691, "global_step": 185585, "epoch": 4418} {"train_loss": -7.255400657653809, "global_step": 185586, "epoch": 4418} {"train_loss": -7.275678634643555, "global_step": 185587, "epoch": 4418} {"train_loss": -7.2130842208862305, "global_step": 185588, "epoch": 4418} {"train_loss": -7.205207347869873, "global_step": 185589, "epoch": 4418} {"train_loss": -7.1967453956604, "global_step": 185590, "epoch": 4418} {"train_loss": -7.1540021896362305, "global_step": 185591, "epoch": 4418} {"train_loss": -7.139436721801758, "global_step": 185592, "epoch": 4418} {"train_loss": -7.205349445343018, "global_step": 185593, "epoch": 4418} {"train_loss": -7.274044990539551, "global_step": 185594, "epoch": 4418} {"train_loss": -7.001887798309326, "global_step": 185595, "epoch": 4418} {"train_loss": -7.194855690002441, "global_step": 185596, "epoch": 4418} {"train_loss": -7.176677340552921, "global_step": 185597, "epoch": 4418, "val_loss": 80727.96875} {"train_loss": -7.145984649658203, "global_step": 185598, "epoch": 4419} {"train_loss": -7.249227523803711, "global_step": 185599, "epoch": 4419} {"train_loss": -7.222274303436279, "global_step": 185600, "epoch": 4419} {"train_loss": -7.22755765914917, "global_step": 185601, "epoch": 4419} {"train_loss": -7.179167747497559, "global_step": 185602, "epoch": 4419} {"train_loss": -7.098845481872559, "global_step": 185603, "epoch": 4419} {"train_loss": -7.198336601257324, "global_step": 185604, "epoch": 4419} {"train_loss": -7.154910087585449, "global_step": 185605, "epoch": 4419} {"train_loss": -7.161741256713867, "global_step": 185606, "epoch": 4419} {"train_loss": -7.151829242706299, "global_step": 185607, "epoch": 4419} {"train_loss": -7.187200546264648, "global_step": 185608, "epoch": 4419} {"train_loss": -7.102290153503418, "global_step": 185609, "epoch": 4419} {"train_loss": -7.192141532897949, "global_step": 185610, "epoch": 4419} {"train_loss": -7.162494659423828, "global_step": 185611, "epoch": 4419} {"train_loss": -7.2032880783081055, "global_step": 185612, "epoch": 4419} {"train_loss": -7.283738136291504, "global_step": 185613, "epoch": 4419} {"train_loss": -7.21698522567749, "global_step": 185614, "epoch": 4419} {"train_loss": -7.194491863250732, "global_step": 185615, "epoch": 4419} {"train_loss": -7.127915382385254, "global_step": 185616, "epoch": 4419} {"train_loss": -7.156284809112549, "global_step": 185617, "epoch": 4419} {"train_loss": -7.221614360809326, "global_step": 185618, "epoch": 4419} {"train_loss": -7.201489448547363, "global_step": 185619, "epoch": 4419} {"train_loss": -7.089323997497559, "global_step": 185620, "epoch": 4419} {"train_loss": -7.231001853942871, "global_step": 185621, "epoch": 4419} {"train_loss": -7.10326623916626, "global_step": 185622, "epoch": 4419} {"train_loss": -7.114282131195068, "global_step": 185623, "epoch": 4419} {"train_loss": -7.1554365158081055, "global_step": 185624, "epoch": 4419} {"train_loss": -7.1339874267578125, "global_step": 185625, "epoch": 4419} {"train_loss": -7.212203502655029, "global_step": 185626, "epoch": 4419} {"train_loss": -7.175528526306152, "global_step": 185627, "epoch": 4419} {"train_loss": -7.119690418243408, "global_step": 185628, "epoch": 4419} {"train_loss": -7.241637229919434, "global_step": 185629, "epoch": 4419} {"train_loss": -7.132790565490723, "global_step": 185630, "epoch": 4419} {"train_loss": -7.132115364074707, "global_step": 185631, "epoch": 4419} {"train_loss": -7.049138069152832, "global_step": 185632, "epoch": 4419} {"train_loss": -7.195551872253418, "global_step": 185633, "epoch": 4419} {"train_loss": -7.134708404541016, "global_step": 185634, "epoch": 4419} {"train_loss": -7.252618789672852, "global_step": 185635, "epoch": 4419} {"train_loss": -7.174613952636719, "global_step": 185636, "epoch": 4419} {"train_loss": -7.098204612731934, "global_step": 185637, "epoch": 4419} {"train_loss": -7.173579216003418, "global_step": 185638, "epoch": 4419} {"train_loss": -7.171059233801706, "global_step": 185639, "epoch": 4419, "val_loss": 80721.4921875} {"train_loss": -7.185522556304932, "global_step": 185640, "epoch": 4420} {"train_loss": -7.213599681854248, "global_step": 185641, "epoch": 4420} {"train_loss": -7.188702583312988, "global_step": 185642, "epoch": 4420} {"train_loss": -7.185222625732422, "global_step": 185643, "epoch": 4420} {"train_loss": -7.179889678955078, "global_step": 185644, "epoch": 4420} {"train_loss": -7.198233127593994, "global_step": 185645, "epoch": 4420} {"train_loss": -7.267853260040283, "global_step": 185646, "epoch": 4420} {"train_loss": -7.052453994750977, "global_step": 185647, "epoch": 4420} {"train_loss": -7.225841999053955, "global_step": 185648, "epoch": 4420} {"train_loss": -7.374712944030762, "global_step": 185649, "epoch": 4420} {"train_loss": -7.139322280883789, "global_step": 185650, "epoch": 4420} {"train_loss": -7.218955039978027, "global_step": 185651, "epoch": 4420} {"train_loss": -7.066429615020752, "global_step": 185652, "epoch": 4420} {"train_loss": -7.208322048187256, "global_step": 185653, "epoch": 4420} {"train_loss": -7.250531196594238, "global_step": 185654, "epoch": 4420} {"train_loss": -7.165136337280273, "global_step": 185655, "epoch": 4420} {"train_loss": -7.228733062744141, "global_step": 185656, "epoch": 4420} {"train_loss": -7.185097694396973, "global_step": 185657, "epoch": 4420} {"train_loss": -7.255974769592285, "global_step": 185658, "epoch": 4420} {"train_loss": -7.234934329986572, "global_step": 185659, "epoch": 4420} {"train_loss": -7.068176746368408, "global_step": 185660, "epoch": 4420} {"train_loss": -7.262635231018066, "global_step": 185661, "epoch": 4420} {"train_loss": -7.2621564865112305, "global_step": 185662, "epoch": 4420} {"train_loss": -7.297064781188965, "global_step": 185663, "epoch": 4420} {"train_loss": -7.22750186920166, "global_step": 185664, "epoch": 4420} {"train_loss": -7.178407669067383, "global_step": 185665, "epoch": 4420} {"train_loss": -7.240662097930908, "global_step": 185666, "epoch": 4420} {"train_loss": -7.184967517852783, "global_step": 185667, "epoch": 4420} {"train_loss": -7.127822399139404, "global_step": 185668, "epoch": 4420} {"train_loss": -7.204194068908691, "global_step": 185669, "epoch": 4420} {"train_loss": -7.274715423583984, "global_step": 185670, "epoch": 4420} {"train_loss": -7.191296577453613, "global_step": 185671, "epoch": 4420} {"train_loss": -7.0300493240356445, "global_step": 185672, "epoch": 4420} {"train_loss": -7.17304801940918, "global_step": 185673, "epoch": 4420} {"train_loss": -7.1113128662109375, "global_step": 185674, "epoch": 4420} {"train_loss": -7.113544464111328, "global_step": 185675, "epoch": 4420} {"train_loss": -7.224456310272217, "global_step": 185676, "epoch": 4420} {"train_loss": -7.242953777313232, "global_step": 185677, "epoch": 4420} {"train_loss": -7.122296333312988, "global_step": 185678, "epoch": 4420} {"train_loss": -7.193581581115723, "global_step": 185679, "epoch": 4420} {"train_loss": -7.147054672241211, "global_step": 185680, "epoch": 4420} {"train_loss": -7.190415598097301, "global_step": 185681, "epoch": 4420, "val_loss": 80817.734375} {"train_loss": -7.125170707702637, "global_step": 185682, "epoch": 4421} {"train_loss": -7.201982021331787, "global_step": 185683, "epoch": 4421} {"train_loss": -7.207808971405029, "global_step": 185684, "epoch": 4421} {"train_loss": -7.196165084838867, "global_step": 185685, "epoch": 4421} {"train_loss": -7.204667568206787, "global_step": 185686, "epoch": 4421} {"train_loss": -7.226437568664551, "global_step": 185687, "epoch": 4421} {"train_loss": -7.309857368469238, "global_step": 185688, "epoch": 4421} {"train_loss": -7.133638858795166, "global_step": 185689, "epoch": 4421} {"train_loss": -7.200042724609375, "global_step": 185690, "epoch": 4421} {"train_loss": -7.185351848602295, "global_step": 185691, "epoch": 4421} {"train_loss": -7.126049041748047, "global_step": 185692, "epoch": 4421} {"train_loss": -7.257720947265625, "global_step": 185693, "epoch": 4421} {"train_loss": -7.293785095214844, "global_step": 185694, "epoch": 4421} {"train_loss": -7.185639381408691, "global_step": 185695, "epoch": 4421} {"train_loss": -7.269603729248047, "global_step": 185696, "epoch": 4421} {"train_loss": -7.192705154418945, "global_step": 185697, "epoch": 4421} {"train_loss": -7.113758563995361, "global_step": 185698, "epoch": 4421} {"train_loss": -7.192907333374023, "global_step": 185699, "epoch": 4421} {"train_loss": -7.18171501159668, "global_step": 185700, "epoch": 4421} {"train_loss": -7.212839603424072, "global_step": 185701, "epoch": 4421} {"train_loss": -7.255949974060059, "global_step": 185702, "epoch": 4421} {"train_loss": -7.332274436950684, "global_step": 185703, "epoch": 4421} {"train_loss": -7.146251201629639, "global_step": 185704, "epoch": 4421} {"train_loss": -7.179213523864746, "global_step": 185705, "epoch": 4421} {"train_loss": -7.044041633605957, "global_step": 185706, "epoch": 4421} {"train_loss": -6.966155052185059, "global_step": 185707, "epoch": 4421} {"train_loss": -7.219344139099121, "global_step": 185708, "epoch": 4421} {"train_loss": -7.109740257263184, "global_step": 185709, "epoch": 4421} {"train_loss": -7.087462425231934, "global_step": 185710, "epoch": 4421} {"train_loss": -7.122363090515137, "global_step": 185711, "epoch": 4421} {"train_loss": -7.0862016677856445, "global_step": 185712, "epoch": 4421} {"train_loss": -7.148377418518066, "global_step": 185713, "epoch": 4421} {"train_loss": -7.258960723876953, "global_step": 185714, "epoch": 4421} {"train_loss": -7.1339497566223145, "global_step": 185715, "epoch": 4421} {"train_loss": -7.0308685302734375, "global_step": 185716, "epoch": 4421} {"train_loss": -7.0218000411987305, "global_step": 185717, "epoch": 4421} {"train_loss": -7.23063850402832, "global_step": 185718, "epoch": 4421} {"train_loss": -7.213586807250977, "global_step": 185719, "epoch": 4421} {"train_loss": -7.215977668762207, "global_step": 185720, "epoch": 4421} {"train_loss": -7.04998779296875, "global_step": 185721, "epoch": 4421} {"train_loss": -7.212597370147705, "global_step": 185722, "epoch": 4421} {"train_loss": -7.170605228060768, "global_step": 185723, "epoch": 4421, "val_loss": 80946.03125} {"train_loss": -7.10352897644043, "global_step": 185724, "epoch": 4422} {"train_loss": -7.226649284362793, "global_step": 185725, "epoch": 4422} {"train_loss": -7.171563625335693, "global_step": 185726, "epoch": 4422} {"train_loss": -7.144736289978027, "global_step": 185727, "epoch": 4422} {"train_loss": -7.243261337280273, "global_step": 185728, "epoch": 4422} {"train_loss": -7.217050075531006, "global_step": 185729, "epoch": 4422} {"train_loss": -7.2903242111206055, "global_step": 185730, "epoch": 4422} {"train_loss": -7.120917320251465, "global_step": 185731, "epoch": 4422} {"train_loss": -7.09184455871582, "global_step": 185732, "epoch": 4422} {"train_loss": -7.167591571807861, "global_step": 185733, "epoch": 4422} {"train_loss": -7.189145565032959, "global_step": 185734, "epoch": 4422} {"train_loss": -7.162382125854492, "global_step": 185735, "epoch": 4422} {"train_loss": -7.313190460205078, "global_step": 185736, "epoch": 4422} {"train_loss": -7.1498494148254395, "global_step": 185737, "epoch": 4422} {"train_loss": -7.049078464508057, "global_step": 185738, "epoch": 4422} {"train_loss": -7.151224136352539, "global_step": 185739, "epoch": 4422} {"train_loss": -7.178989410400391, "global_step": 185740, "epoch": 4422} {"train_loss": -7.245125770568848, "global_step": 185741, "epoch": 4422} {"train_loss": -7.0778656005859375, "global_step": 185742, "epoch": 4422} {"train_loss": -7.129203796386719, "global_step": 185743, "epoch": 4422} {"train_loss": -7.087413787841797, "global_step": 185744, "epoch": 4422} {"train_loss": -7.194683074951172, "global_step": 185745, "epoch": 4422} {"train_loss": -7.2483415603637695, "global_step": 185746, "epoch": 4422} {"train_loss": -7.079312801361084, "global_step": 185747, "epoch": 4422} {"train_loss": -7.108013153076172, "global_step": 185748, "epoch": 4422} {"train_loss": -7.123522758483887, "global_step": 185749, "epoch": 4422} {"train_loss": -6.987632751464844, "global_step": 185750, "epoch": 4422} {"train_loss": -7.133082866668701, "global_step": 185751, "epoch": 4422} {"train_loss": -7.029793739318848, "global_step": 185752, "epoch": 4422} {"train_loss": -7.156492710113525, "global_step": 185753, "epoch": 4422} {"train_loss": -7.232102394104004, "global_step": 185754, "epoch": 4422} {"train_loss": -7.08099889755249, "global_step": 185755, "epoch": 4422} {"train_loss": -7.164525985717773, "global_step": 185756, "epoch": 4422} {"train_loss": -7.1777424812316895, "global_step": 185757, "epoch": 4422} {"train_loss": -7.134497165679932, "global_step": 185758, "epoch": 4422} {"train_loss": -7.139815330505371, "global_step": 185759, "epoch": 4422} {"train_loss": -7.111693382263184, "global_step": 185760, "epoch": 4422} {"train_loss": -7.172865867614746, "global_step": 185761, "epoch": 4422} {"train_loss": -7.163567543029785, "global_step": 185762, "epoch": 4422} {"train_loss": -7.277562141418457, "global_step": 185763, "epoch": 4422} {"train_loss": -7.169439315795898, "global_step": 185764, "epoch": 4422} {"train_loss": -7.158226989564442, "global_step": 185765, "epoch": 4422, "val_loss": 80801.6640625} {"train_loss": -7.147069931030273, "global_step": 185766, "epoch": 4423} {"train_loss": -7.089550971984863, "global_step": 185767, "epoch": 4423} {"train_loss": -7.173168182373047, "global_step": 185768, "epoch": 4423} {"train_loss": -7.188516616821289, "global_step": 185769, "epoch": 4423} {"train_loss": -7.189667701721191, "global_step": 185770, "epoch": 4423} {"train_loss": -7.200786590576172, "global_step": 185771, "epoch": 4423} {"train_loss": -7.171826362609863, "global_step": 185772, "epoch": 4423} {"train_loss": -7.225540637969971, "global_step": 185773, "epoch": 4423} {"train_loss": -7.1161017417907715, "global_step": 185774, "epoch": 4423} {"train_loss": -7.140179634094238, "global_step": 185775, "epoch": 4423} {"train_loss": -7.266878604888916, "global_step": 185776, "epoch": 4423} {"train_loss": -7.111697673797607, "global_step": 185777, "epoch": 4423} {"train_loss": -7.250431060791016, "global_step": 185778, "epoch": 4423} {"train_loss": -7.182065010070801, "global_step": 185779, "epoch": 4423} {"train_loss": -7.191699028015137, "global_step": 185780, "epoch": 4423} {"train_loss": -7.196300983428955, "global_step": 185781, "epoch": 4423} {"train_loss": -7.154569149017334, "global_step": 185782, "epoch": 4423} {"train_loss": -7.265013217926025, "global_step": 185783, "epoch": 4423} {"train_loss": -7.099855422973633, "global_step": 185784, "epoch": 4423} {"train_loss": -7.115325927734375, "global_step": 185785, "epoch": 4423} {"train_loss": -7.238471984863281, "global_step": 185786, "epoch": 4423} {"train_loss": -7.072209358215332, "global_step": 185787, "epoch": 4423} {"train_loss": -6.971735954284668, "global_step": 185788, "epoch": 4423} {"train_loss": -7.1293511390686035, "global_step": 185789, "epoch": 4423} {"train_loss": -6.9085693359375, "global_step": 185790, "epoch": 4423} {"train_loss": -7.062543869018555, "global_step": 185791, "epoch": 4423} {"train_loss": -6.9534406661987305, "global_step": 185792, "epoch": 4423} {"train_loss": -6.991935729980469, "global_step": 185793, "epoch": 4423} {"train_loss": -7.0960493087768555, "global_step": 185794, "epoch": 4423} {"train_loss": -6.883455276489258, "global_step": 185795, "epoch": 4423} {"train_loss": -7.150287628173828, "global_step": 185796, "epoch": 4423} {"train_loss": -6.860592842102051, "global_step": 185797, "epoch": 4423} {"train_loss": -7.136239051818848, "global_step": 185798, "epoch": 4423} {"train_loss": -7.0976457595825195, "global_step": 185799, "epoch": 4423} {"train_loss": -7.068384170532227, "global_step": 185800, "epoch": 4423} {"train_loss": -6.91663932800293, "global_step": 185801, "epoch": 4423} {"train_loss": -7.071035861968994, "global_step": 185802, "epoch": 4423} {"train_loss": -7.119190216064453, "global_step": 185803, "epoch": 4423} {"train_loss": -6.8791022300720215, "global_step": 185804, "epoch": 4423} {"train_loss": -7.201393127441406, "global_step": 185805, "epoch": 4423} {"train_loss": -6.921010971069336, "global_step": 185806, "epoch": 4423} {"train_loss": -7.103995811371576, "global_step": 185807, "epoch": 4423, "val_loss": 80543.9453125} {"train_loss": -7.104672908782959, "global_step": 185808, "epoch": 4424} {"train_loss": -7.1693830490112305, "global_step": 185809, "epoch": 4424} {"train_loss": -7.019566059112549, "global_step": 185810, "epoch": 4424} {"train_loss": -7.176342964172363, "global_step": 185811, "epoch": 4424} {"train_loss": -7.0611138343811035, "global_step": 185812, "epoch": 4424} {"train_loss": -7.185794830322266, "global_step": 185813, "epoch": 4424} {"train_loss": -7.0583815574646, "global_step": 185814, "epoch": 4424} {"train_loss": -7.0989227294921875, "global_step": 185815, "epoch": 4424} {"train_loss": -7.027887344360352, "global_step": 185816, "epoch": 4424} {"train_loss": -7.1982221603393555, "global_step": 185817, "epoch": 4424} {"train_loss": -7.093347549438477, "global_step": 185818, "epoch": 4424} {"train_loss": -7.1654157638549805, "global_step": 185819, "epoch": 4424} {"train_loss": -7.245539665222168, "global_step": 185820, "epoch": 4424} {"train_loss": -7.026699066162109, "global_step": 185821, "epoch": 4424} {"train_loss": -7.2084736824035645, "global_step": 185822, "epoch": 4424} {"train_loss": -7.167708873748779, "global_step": 185823, "epoch": 4424} {"train_loss": -7.080146789550781, "global_step": 185824, "epoch": 4424} {"train_loss": -7.194622993469238, "global_step": 185825, "epoch": 4424} {"train_loss": -7.162503242492676, "global_step": 185826, "epoch": 4424} {"train_loss": -7.103606224060059, "global_step": 185827, "epoch": 4424} {"train_loss": -7.214792251586914, "global_step": 185828, "epoch": 4424} {"train_loss": -7.243358135223389, "global_step": 185829, "epoch": 4424} {"train_loss": -7.193885803222656, "global_step": 185830, "epoch": 4424} {"train_loss": -7.173064708709717, "global_step": 185831, "epoch": 4424} {"train_loss": -7.094963073730469, "global_step": 185832, "epoch": 4424} {"train_loss": -7.108170509338379, "global_step": 185833, "epoch": 4424} {"train_loss": -7.107764720916748, "global_step": 185834, "epoch": 4424} {"train_loss": -7.075849533081055, "global_step": 185835, "epoch": 4424} {"train_loss": -7.098851680755615, "global_step": 185836, "epoch": 4424} {"train_loss": -7.072634220123291, "global_step": 185837, "epoch": 4424} {"train_loss": -7.059112548828125, "global_step": 185838, "epoch": 4424} {"train_loss": -7.111800670623779, "global_step": 185839, "epoch": 4424} {"train_loss": -7.040322303771973, "global_step": 185840, "epoch": 4424} {"train_loss": -7.207348823547363, "global_step": 185841, "epoch": 4424} {"train_loss": -7.1872992515563965, "global_step": 185842, "epoch": 4424} {"train_loss": -7.092355728149414, "global_step": 185843, "epoch": 4424} {"train_loss": -7.178306579589844, "global_step": 185844, "epoch": 4424} {"train_loss": -7.245360374450684, "global_step": 185845, "epoch": 4424} {"train_loss": -7.261502265930176, "global_step": 185846, "epoch": 4424} {"train_loss": -7.126086235046387, "global_step": 185847, "epoch": 4424} {"train_loss": -7.242519855499268, "global_step": 185848, "epoch": 4424} {"train_loss": -7.139658780325027, "global_step": 185849, "epoch": 4424, "val_loss": 81031.0} {"train_loss": -7.1539530754089355, "global_step": 185850, "epoch": 4425} {"train_loss": -7.1329193115234375, "global_step": 185851, "epoch": 4425} {"train_loss": -7.1641082763671875, "global_step": 185852, "epoch": 4425} {"train_loss": -7.236723899841309, "global_step": 185853, "epoch": 4425} {"train_loss": -7.204934120178223, "global_step": 185854, "epoch": 4425} {"train_loss": -7.142812728881836, "global_step": 185855, "epoch": 4425} {"train_loss": -7.240594387054443, "global_step": 185856, "epoch": 4425} {"train_loss": -7.167322635650635, "global_step": 185857, "epoch": 4425} {"train_loss": -7.160375595092773, "global_step": 185858, "epoch": 4425} {"train_loss": -7.238403797149658, "global_step": 185859, "epoch": 4425} {"train_loss": -7.220460414886475, "global_step": 185860, "epoch": 4425} {"train_loss": -7.213841438293457, "global_step": 185861, "epoch": 4425} {"train_loss": -7.23567533493042, "global_step": 185862, "epoch": 4425} {"train_loss": -7.208700656890869, "global_step": 185863, "epoch": 4425} {"train_loss": -7.244658946990967, "global_step": 185864, "epoch": 4425} {"train_loss": -7.100214958190918, "global_step": 185865, "epoch": 4425} {"train_loss": -7.247442722320557, "global_step": 185866, "epoch": 4425} {"train_loss": -7.180908679962158, "global_step": 185867, "epoch": 4425} {"train_loss": -7.176595211029053, "global_step": 185868, "epoch": 4425} {"train_loss": -7.372709274291992, "global_step": 185869, "epoch": 4425} {"train_loss": -7.105253219604492, "global_step": 185870, "epoch": 4425} {"train_loss": -7.240949630737305, "global_step": 185871, "epoch": 4425} {"train_loss": -7.248269557952881, "global_step": 185872, "epoch": 4425} {"train_loss": -7.075769424438477, "global_step": 185873, "epoch": 4425} {"train_loss": -7.182613372802734, "global_step": 185874, "epoch": 4425} {"train_loss": -7.245553016662598, "global_step": 185875, "epoch": 4425} {"train_loss": -7.134527206420898, "global_step": 185876, "epoch": 4425} {"train_loss": -7.095060348510742, "global_step": 185877, "epoch": 4425} {"train_loss": -7.276200294494629, "global_step": 185878, "epoch": 4425} {"train_loss": -7.257989883422852, "global_step": 185879, "epoch": 4425} {"train_loss": -7.222048759460449, "global_step": 185880, "epoch": 4425} {"train_loss": -7.215325355529785, "global_step": 185881, "epoch": 4425} {"train_loss": -7.1110124588012695, "global_step": 185882, "epoch": 4425} {"train_loss": -7.082943439483643, "global_step": 185883, "epoch": 4425} {"train_loss": -7.227047920227051, "global_step": 185884, "epoch": 4425} {"train_loss": -7.0290021896362305, "global_step": 185885, "epoch": 4425} {"train_loss": -7.109453201293945, "global_step": 185886, "epoch": 4425} {"train_loss": -7.154745101928711, "global_step": 185887, "epoch": 4425} {"train_loss": -7.090009689331055, "global_step": 185888, "epoch": 4425} {"train_loss": -7.20574951171875, "global_step": 185889, "epoch": 4425} {"train_loss": -7.124067306518555, "global_step": 185890, "epoch": 4425} {"train_loss": -7.180458091554188, "global_step": 185891, "epoch": 4425, "val_loss": 80882.6875} {"train_loss": -7.272534370422363, "global_step": 185892, "epoch": 4426} {"train_loss": -7.251245498657227, "global_step": 185893, "epoch": 4426} {"train_loss": -7.192505359649658, "global_step": 185894, "epoch": 4426} {"train_loss": -7.217280387878418, "global_step": 185895, "epoch": 4426} {"train_loss": -7.327701568603516, "global_step": 185896, "epoch": 4426} {"train_loss": -7.221286773681641, "global_step": 185897, "epoch": 4426} {"train_loss": -7.269618988037109, "global_step": 185898, "epoch": 4426} {"train_loss": -7.152454376220703, "global_step": 185899, "epoch": 4426} {"train_loss": -7.161165714263916, "global_step": 185900, "epoch": 4426} {"train_loss": -7.133461952209473, "global_step": 185901, "epoch": 4426} {"train_loss": -7.279092788696289, "global_step": 185902, "epoch": 4426} {"train_loss": -7.224631309509277, "global_step": 185903, "epoch": 4426} {"train_loss": -7.254510879516602, "global_step": 185904, "epoch": 4426} {"train_loss": -7.26645040512085, "global_step": 185905, "epoch": 4426} {"train_loss": -7.199917793273926, "global_step": 185906, "epoch": 4426} {"train_loss": -7.245689392089844, "global_step": 185907, "epoch": 4426} {"train_loss": -7.293705463409424, "global_step": 185908, "epoch": 4426} {"train_loss": -7.211685657501221, "global_step": 185909, "epoch": 4426} {"train_loss": -7.212180137634277, "global_step": 185910, "epoch": 4426} {"train_loss": -7.1013078689575195, "global_step": 185911, "epoch": 4426} {"train_loss": -7.164314270019531, "global_step": 185912, "epoch": 4426} {"train_loss": -7.223176002502441, "global_step": 185913, "epoch": 4426} {"train_loss": -7.234579563140869, "global_step": 185914, "epoch": 4426} {"train_loss": -7.288536071777344, "global_step": 185915, "epoch": 4426} {"train_loss": -7.265172958374023, "global_step": 185916, "epoch": 4426} {"train_loss": -7.25707483291626, "global_step": 185917, "epoch": 4426} {"train_loss": -7.212100982666016, "global_step": 185918, "epoch": 4426} {"train_loss": -7.123452186584473, "global_step": 185919, "epoch": 4426} {"train_loss": -7.286348342895508, "global_step": 185920, "epoch": 4426} {"train_loss": -7.135987281799316, "global_step": 185921, "epoch": 4426} {"train_loss": -7.166444301605225, "global_step": 185922, "epoch": 4426} {"train_loss": -7.058549880981445, "global_step": 185923, "epoch": 4426} {"train_loss": -7.219520568847656, "global_step": 185924, "epoch": 4426} {"train_loss": -7.262111186981201, "global_step": 185925, "epoch": 4426} {"train_loss": -7.087523460388184, "global_step": 185926, "epoch": 4426} {"train_loss": -7.036340236663818, "global_step": 185927, "epoch": 4426} {"train_loss": -7.185518264770508, "global_step": 185928, "epoch": 4426} {"train_loss": -7.16666316986084, "global_step": 185929, "epoch": 4426} {"train_loss": -7.149400234222412, "global_step": 185930, "epoch": 4426} {"train_loss": -7.105949401855469, "global_step": 185931, "epoch": 4426} {"train_loss": -7.18759822845459, "global_step": 185932, "epoch": 4426} {"train_loss": -7.201662131718227, "global_step": 185933, "epoch": 4426, "val_loss": 80716.21875} {"train_loss": -7.125162601470947, "global_step": 185934, "epoch": 4427} {"train_loss": -7.210201263427734, "global_step": 185935, "epoch": 4427} {"train_loss": -7.254056930541992, "global_step": 185936, "epoch": 4427} {"train_loss": -7.004010200500488, "global_step": 185937, "epoch": 4427} {"train_loss": -7.094303131103516, "global_step": 185938, "epoch": 4427} {"train_loss": -7.2285871505737305, "global_step": 185939, "epoch": 4427} {"train_loss": -7.107118606567383, "global_step": 185940, "epoch": 4427} {"train_loss": -7.198559761047363, "global_step": 185941, "epoch": 4427} {"train_loss": -7.210475921630859, "global_step": 185942, "epoch": 4427} {"train_loss": -7.089236736297607, "global_step": 185943, "epoch": 4427} {"train_loss": -7.157262325286865, "global_step": 185944, "epoch": 4427} {"train_loss": -7.1501617431640625, "global_step": 185945, "epoch": 4427} {"train_loss": -7.206108093261719, "global_step": 185946, "epoch": 4427} {"train_loss": -7.162583351135254, "global_step": 185947, "epoch": 4427} {"train_loss": -7.228894233703613, "global_step": 185948, "epoch": 4427} {"train_loss": -7.197203159332275, "global_step": 185949, "epoch": 4427} {"train_loss": -7.066115856170654, "global_step": 185950, "epoch": 4427} {"train_loss": -7.22603702545166, "global_step": 185951, "epoch": 4427} {"train_loss": -7.078409194946289, "global_step": 185952, "epoch": 4427} {"train_loss": -7.243479251861572, "global_step": 185953, "epoch": 4427} {"train_loss": -7.248411655426025, "global_step": 185954, "epoch": 4427} {"train_loss": -7.183967590332031, "global_step": 185955, "epoch": 4427} {"train_loss": -7.208046913146973, "global_step": 185956, "epoch": 4427} {"train_loss": -7.244593620300293, "global_step": 185957, "epoch": 4427} {"train_loss": -7.23112678527832, "global_step": 185958, "epoch": 4427} {"train_loss": -7.236871719360352, "global_step": 185959, "epoch": 4427} {"train_loss": -7.18106746673584, "global_step": 185960, "epoch": 4427} {"train_loss": -7.177305698394775, "global_step": 185961, "epoch": 4427} {"train_loss": -7.153363227844238, "global_step": 185962, "epoch": 4427} {"train_loss": -7.2676682472229, "global_step": 185963, "epoch": 4427} {"train_loss": -7.262747287750244, "global_step": 185964, "epoch": 4427} {"train_loss": -7.147687911987305, "global_step": 185965, "epoch": 4427} {"train_loss": -7.214864730834961, "global_step": 185966, "epoch": 4427} {"train_loss": -7.162097930908203, "global_step": 185967, "epoch": 4427} {"train_loss": -7.1620612144470215, "global_step": 185968, "epoch": 4427} {"train_loss": -7.119345664978027, "global_step": 185969, "epoch": 4427} {"train_loss": -7.213213920593262, "global_step": 185970, "epoch": 4427} {"train_loss": -7.037159442901611, "global_step": 185971, "epoch": 4427} {"train_loss": -7.1406097412109375, "global_step": 185972, "epoch": 4427} {"train_loss": -7.208617210388184, "global_step": 185973, "epoch": 4427} {"train_loss": -7.144774913787842, "global_step": 185974, "epoch": 4427} {"train_loss": -7.174239147277105, "global_step": 185975, "epoch": 4427, "val_loss": 80882.640625} {"train_loss": -7.132205009460449, "global_step": 185976, "epoch": 4428} {"train_loss": -7.149880409240723, "global_step": 185977, "epoch": 4428} {"train_loss": -7.140114784240723, "global_step": 185978, "epoch": 4428} {"train_loss": -7.256353378295898, "global_step": 185979, "epoch": 4428} {"train_loss": -7.067540168762207, "global_step": 185980, "epoch": 4428} {"train_loss": -7.028186798095703, "global_step": 185981, "epoch": 4428} {"train_loss": -7.279904842376709, "global_step": 185982, "epoch": 4428} {"train_loss": -7.248798370361328, "global_step": 185983, "epoch": 4428} {"train_loss": -7.12711238861084, "global_step": 185984, "epoch": 4428} {"train_loss": -7.232470989227295, "global_step": 185985, "epoch": 4428} {"train_loss": -7.21038293838501, "global_step": 185986, "epoch": 4428} {"train_loss": -7.275723457336426, "global_step": 185987, "epoch": 4428} {"train_loss": -7.084291458129883, "global_step": 185988, "epoch": 4428} {"train_loss": -7.206376075744629, "global_step": 185989, "epoch": 4428} {"train_loss": -7.12635612487793, "global_step": 185990, "epoch": 4428} {"train_loss": -7.081817626953125, "global_step": 185991, "epoch": 4428} {"train_loss": -7.21417236328125, "global_step": 185992, "epoch": 4428} {"train_loss": -7.081516742706299, "global_step": 185993, "epoch": 4428} {"train_loss": -7.075069904327393, "global_step": 185994, "epoch": 4428} {"train_loss": -7.140667915344238, "global_step": 185995, "epoch": 4428} {"train_loss": -7.103114128112793, "global_step": 185996, "epoch": 4428} {"train_loss": -7.237015724182129, "global_step": 185997, "epoch": 4428} {"train_loss": -7.263887405395508, "global_step": 185998, "epoch": 4428} {"train_loss": -7.202319145202637, "global_step": 185999, "epoch": 4428} {"train_loss": -7.137116432189941, "global_step": 186000, "epoch": 4428} {"train_loss": -7.160240173339844, "global_step": 186001, "epoch": 4428} {"train_loss": -7.028533935546875, "global_step": 186002, "epoch": 4428} {"train_loss": -7.184839248657227, "global_step": 186003, "epoch": 4428} {"train_loss": -7.006673812866211, "global_step": 186004, "epoch": 4428} {"train_loss": -7.085367202758789, "global_step": 186005, "epoch": 4428} {"train_loss": -7.268083095550537, "global_step": 186006, "epoch": 4428} {"train_loss": -7.076569080352783, "global_step": 186007, "epoch": 4428} {"train_loss": -7.1643571853637695, "global_step": 186008, "epoch": 4428} {"train_loss": -7.148573875427246, "global_step": 186009, "epoch": 4428} {"train_loss": -7.019490718841553, "global_step": 186010, "epoch": 4428} {"train_loss": -7.126559257507324, "global_step": 186011, "epoch": 4428} {"train_loss": -6.980604648590088, "global_step": 186012, "epoch": 4428} {"train_loss": -7.072602272033691, "global_step": 186013, "epoch": 4428} {"train_loss": -7.111686706542969, "global_step": 186014, "epoch": 4428} {"train_loss": -7.13088321685791, "global_step": 186015, "epoch": 4428} {"train_loss": -7.1071038246154785, "global_step": 186016, "epoch": 4428} {"train_loss": -7.136085521607172, "global_step": 186017, "epoch": 4428, "val_loss": 80837.3203125} {"train_loss": -7.0978288650512695, "global_step": 186018, "epoch": 4429} {"train_loss": -7.039222240447998, "global_step": 186019, "epoch": 4429} {"train_loss": -7.158268928527832, "global_step": 186020, "epoch": 4429} {"train_loss": -6.939510345458984, "global_step": 186021, "epoch": 4429} {"train_loss": -7.139174461364746, "global_step": 186022, "epoch": 4429} {"train_loss": -6.975876808166504, "global_step": 186023, "epoch": 4429} {"train_loss": -7.10539436340332, "global_step": 186024, "epoch": 4429} {"train_loss": -7.236478805541992, "global_step": 186025, "epoch": 4429} {"train_loss": -7.006870269775391, "global_step": 186026, "epoch": 4429} {"train_loss": -7.101511001586914, "global_step": 186027, "epoch": 4429} {"train_loss": -7.019844055175781, "global_step": 186028, "epoch": 4429} {"train_loss": -7.052335262298584, "global_step": 186029, "epoch": 4429} {"train_loss": -7.102898597717285, "global_step": 186030, "epoch": 4429} {"train_loss": -7.117125511169434, "global_step": 186031, "epoch": 4429} {"train_loss": -7.107046127319336, "global_step": 186032, "epoch": 4429} {"train_loss": -7.195599555969238, "global_step": 186033, "epoch": 4429} {"train_loss": -7.280023574829102, "global_step": 186034, "epoch": 4429} {"train_loss": -7.176793098449707, "global_step": 186035, "epoch": 4429} {"train_loss": -7.199337005615234, "global_step": 186036, "epoch": 4429} {"train_loss": -7.243571758270264, "global_step": 186037, "epoch": 4429} {"train_loss": -7.239419460296631, "global_step": 186038, "epoch": 4429} {"train_loss": -7.190825462341309, "global_step": 186039, "epoch": 4429} {"train_loss": -7.211790084838867, "global_step": 186040, "epoch": 4429} {"train_loss": -7.115790367126465, "global_step": 186041, "epoch": 4429} {"train_loss": -7.223766326904297, "global_step": 186042, "epoch": 4429} {"train_loss": -7.261148929595947, "global_step": 186043, "epoch": 4429} {"train_loss": -7.1960320472717285, "global_step": 186044, "epoch": 4429} {"train_loss": -7.188413143157959, "global_step": 186045, "epoch": 4429} {"train_loss": -7.217729568481445, "global_step": 186046, "epoch": 4429} {"train_loss": -7.30301570892334, "global_step": 186047, "epoch": 4429} {"train_loss": -7.263093948364258, "global_step": 186048, "epoch": 4429} {"train_loss": -7.176811218261719, "global_step": 186049, "epoch": 4429} {"train_loss": -7.213377952575684, "global_step": 186050, "epoch": 4429} {"train_loss": -7.193552494049072, "global_step": 186051, "epoch": 4429} {"train_loss": -7.2305145263671875, "global_step": 186052, "epoch": 4429} {"train_loss": -7.217589855194092, "global_step": 186053, "epoch": 4429} {"train_loss": -7.16752290725708, "global_step": 186054, "epoch": 4429} {"train_loss": -7.2237653732299805, "global_step": 186055, "epoch": 4429} {"train_loss": -7.192836284637451, "global_step": 186056, "epoch": 4429} {"train_loss": -7.250170707702637, "global_step": 186057, "epoch": 4429} {"train_loss": -7.11055326461792, "global_step": 186058, "epoch": 4429} {"train_loss": -7.164503733317058, "global_step": 186059, "epoch": 4429, "val_loss": 81046.1328125} {"train_loss": -7.093429088592529, "global_step": 186060, "epoch": 4430} {"train_loss": -7.1183905601501465, "global_step": 186061, "epoch": 4430} {"train_loss": -7.1592254638671875, "global_step": 186062, "epoch": 4430} {"train_loss": -7.027525901794434, "global_step": 186063, "epoch": 4430} {"train_loss": -7.1696929931640625, "global_step": 186064, "epoch": 4430} {"train_loss": -7.148299217224121, "global_step": 186065, "epoch": 4430} {"train_loss": -7.087898254394531, "global_step": 186066, "epoch": 4430} {"train_loss": -7.231625556945801, "global_step": 186067, "epoch": 4430} {"train_loss": -7.075628757476807, "global_step": 186068, "epoch": 4430} {"train_loss": -7.007985591888428, "global_step": 186069, "epoch": 4430} {"train_loss": -7.182289123535156, "global_step": 186070, "epoch": 4430} {"train_loss": -7.062658786773682, "global_step": 186071, "epoch": 4430} {"train_loss": -7.23338508605957, "global_step": 186072, "epoch": 4430} {"train_loss": -7.075445175170898, "global_step": 186073, "epoch": 4430} {"train_loss": -7.103573799133301, "global_step": 186074, "epoch": 4430} {"train_loss": -7.198954105377197, "global_step": 186075, "epoch": 4430} {"train_loss": -7.186095237731934, "global_step": 186076, "epoch": 4430} {"train_loss": -7.253902435302734, "global_step": 186077, "epoch": 4430} {"train_loss": -7.161037445068359, "global_step": 186078, "epoch": 4430} {"train_loss": -7.177778244018555, "global_step": 186079, "epoch": 4430} {"train_loss": -7.205014228820801, "global_step": 186080, "epoch": 4430} {"train_loss": -7.114822864532471, "global_step": 186081, "epoch": 4430} {"train_loss": -7.324699401855469, "global_step": 186082, "epoch": 4430} {"train_loss": -7.197792053222656, "global_step": 186083, "epoch": 4430} {"train_loss": -7.2110090255737305, "global_step": 186084, "epoch": 4430} {"train_loss": -7.141767501831055, "global_step": 186085, "epoch": 4430} {"train_loss": -7.22799015045166, "global_step": 186086, "epoch": 4430} {"train_loss": -7.272747993469238, "global_step": 186087, "epoch": 4430} {"train_loss": -7.271712779998779, "global_step": 186088, "epoch": 4430} {"train_loss": -7.186153888702393, "global_step": 186089, "epoch": 4430} {"train_loss": -7.188755989074707, "global_step": 186090, "epoch": 4430} {"train_loss": -7.273972511291504, "global_step": 186091, "epoch": 4430} {"train_loss": -7.203640937805176, "global_step": 186092, "epoch": 4430} {"train_loss": -7.306069374084473, "global_step": 186093, "epoch": 4430} {"train_loss": -7.274114608764648, "global_step": 186094, "epoch": 4430} {"train_loss": -7.321626663208008, "global_step": 186095, "epoch": 4430} {"train_loss": -7.155362606048584, "global_step": 186096, "epoch": 4430} {"train_loss": -7.263184547424316, "global_step": 186097, "epoch": 4430} {"train_loss": -7.257479190826416, "global_step": 186098, "epoch": 4430} {"train_loss": -7.1520280838012695, "global_step": 186099, "epoch": 4430} {"train_loss": -7.269073486328125, "global_step": 186100, "epoch": 4430} {"train_loss": -7.187127567472912, "global_step": 186101, "epoch": 4430, "val_loss": 80602.3984375} {"train_loss": -7.269776344299316, "global_step": 186102, "epoch": 4431} {"train_loss": -7.234209060668945, "global_step": 186103, "epoch": 4431} {"train_loss": -7.313138961791992, "global_step": 186104, "epoch": 4431} {"train_loss": -7.1831769943237305, "global_step": 186105, "epoch": 4431} {"train_loss": -7.182685852050781, "global_step": 186106, "epoch": 4431} {"train_loss": -7.080596923828125, "global_step": 186107, "epoch": 4431} {"train_loss": -7.187416076660156, "global_step": 186108, "epoch": 4431} {"train_loss": -7.213425636291504, "global_step": 186109, "epoch": 4431} {"train_loss": -7.126152992248535, "global_step": 186110, "epoch": 4431} {"train_loss": -7.182521820068359, "global_step": 186111, "epoch": 4431} {"train_loss": -7.145551681518555, "global_step": 186112, "epoch": 4431} {"train_loss": -7.03544807434082, "global_step": 186113, "epoch": 4431} {"train_loss": -7.219837188720703, "global_step": 186114, "epoch": 4431} {"train_loss": -7.1983489990234375, "global_step": 186115, "epoch": 4431} {"train_loss": -7.052486419677734, "global_step": 186116, "epoch": 4431} {"train_loss": -7.168008804321289, "global_step": 186117, "epoch": 4431} {"train_loss": -7.145041465759277, "global_step": 186118, "epoch": 4431} {"train_loss": -7.043312072753906, "global_step": 186119, "epoch": 4431} {"train_loss": -7.256486415863037, "global_step": 186120, "epoch": 4431} {"train_loss": -6.903210639953613, "global_step": 186121, "epoch": 4431} {"train_loss": -6.9478349685668945, "global_step": 186122, "epoch": 4431} {"train_loss": -7.033082962036133, "global_step": 186123, "epoch": 4431} {"train_loss": -7.081433296203613, "global_step": 186124, "epoch": 4431} {"train_loss": -7.010442733764648, "global_step": 186125, "epoch": 4431} {"train_loss": -6.942925453186035, "global_step": 186126, "epoch": 4431} {"train_loss": -7.092130661010742, "global_step": 186127, "epoch": 4431} {"train_loss": -7.127725601196289, "global_step": 186128, "epoch": 4431} {"train_loss": -6.988414287567139, "global_step": 186129, "epoch": 4431} {"train_loss": -7.207447052001953, "global_step": 186130, "epoch": 4431} {"train_loss": -7.19936466217041, "global_step": 186131, "epoch": 4431} {"train_loss": -7.10801887512207, "global_step": 186132, "epoch": 4431} {"train_loss": -7.200407028198242, "global_step": 186133, "epoch": 4431} {"train_loss": -7.076674938201904, "global_step": 186134, "epoch": 4431} {"train_loss": -7.0180134773254395, "global_step": 186135, "epoch": 4431} {"train_loss": -7.084794044494629, "global_step": 186136, "epoch": 4431} {"train_loss": -7.0552659034729, "global_step": 186137, "epoch": 4431} {"train_loss": -7.076586723327637, "global_step": 186138, "epoch": 4431} {"train_loss": -7.251758575439453, "global_step": 186139, "epoch": 4431} {"train_loss": -7.090744972229004, "global_step": 186140, "epoch": 4431} {"train_loss": -7.190460205078125, "global_step": 186141, "epoch": 4431} {"train_loss": -7.134443283081055, "global_step": 186142, "epoch": 4431} {"train_loss": -7.125799894332886, "global_step": 186143, "epoch": 4431, "val_loss": 80635.1875} {"train_loss": -7.133920669555664, "global_step": 186144, "epoch": 4432} {"train_loss": -7.203927040100098, "global_step": 186145, "epoch": 4432} {"train_loss": -7.263856887817383, "global_step": 186146, "epoch": 4432} {"train_loss": -7.106753826141357, "global_step": 186147, "epoch": 4432} {"train_loss": -7.241506576538086, "global_step": 186148, "epoch": 4432} {"train_loss": -7.149805545806885, "global_step": 186149, "epoch": 4432} {"train_loss": -7.0152177810668945, "global_step": 186150, "epoch": 4432} {"train_loss": -7.280494689941406, "global_step": 186151, "epoch": 4432} {"train_loss": -7.202450752258301, "global_step": 186152, "epoch": 4432} {"train_loss": -7.155228614807129, "global_step": 186153, "epoch": 4432} {"train_loss": -7.251706123352051, "global_step": 186154, "epoch": 4432} {"train_loss": -7.086621284484863, "global_step": 186155, "epoch": 4432} {"train_loss": -7.317356586456299, "global_step": 186156, "epoch": 4432} {"train_loss": -7.235462665557861, "global_step": 186157, "epoch": 4432} {"train_loss": -7.3754377365112305, "global_step": 186158, "epoch": 4432} {"train_loss": -7.256953716278076, "global_step": 186159, "epoch": 4432} {"train_loss": -7.328453063964844, "global_step": 186160, "epoch": 4432} {"train_loss": -7.2177557945251465, "global_step": 186161, "epoch": 4432} {"train_loss": -7.196451187133789, "global_step": 186162, "epoch": 4432} {"train_loss": -7.240978240966797, "global_step": 186163, "epoch": 4432} {"train_loss": -7.2709245681762695, "global_step": 186164, "epoch": 4432} {"train_loss": -7.291501045227051, "global_step": 186165, "epoch": 4432} {"train_loss": -7.039039134979248, "global_step": 186166, "epoch": 4432} {"train_loss": -7.174889087677002, "global_step": 186167, "epoch": 4432} {"train_loss": -7.289147853851318, "global_step": 186168, "epoch": 4432} {"train_loss": -7.205604553222656, "global_step": 186169, "epoch": 4432} {"train_loss": -7.169932842254639, "global_step": 186170, "epoch": 4432} {"train_loss": -7.16817569732666, "global_step": 186171, "epoch": 4432} {"train_loss": -7.117449760437012, "global_step": 186172, "epoch": 4432} {"train_loss": -7.113541603088379, "global_step": 186173, "epoch": 4432} {"train_loss": -7.092138290405273, "global_step": 186174, "epoch": 4432} {"train_loss": -7.206869125366211, "global_step": 186175, "epoch": 4432} {"train_loss": -7.219120979309082, "global_step": 186176, "epoch": 4432} {"train_loss": -7.22183084487915, "global_step": 186177, "epoch": 4432} {"train_loss": -7.165039539337158, "global_step": 186178, "epoch": 4432} {"train_loss": -7.206370830535889, "global_step": 186179, "epoch": 4432} {"train_loss": -7.16327428817749, "global_step": 186180, "epoch": 4432} {"train_loss": -7.160490989685059, "global_step": 186181, "epoch": 4432} {"train_loss": -7.151968955993652, "global_step": 186182, "epoch": 4432} {"train_loss": -7.0816216468811035, "global_step": 186183, "epoch": 4432} {"train_loss": -7.155844688415527, "global_step": 186184, "epoch": 4432} {"train_loss": -7.1948137283325195, "global_step": 186185, "epoch": 4432, "val_loss": 80805.4140625} {"train_loss": -7.101205348968506, "global_step": 186186, "epoch": 4433} {"train_loss": -7.1535797119140625, "global_step": 186187, "epoch": 4433} {"train_loss": -7.302035808563232, "global_step": 186188, "epoch": 4433} {"train_loss": -7.186971664428711, "global_step": 186189, "epoch": 4433} {"train_loss": -7.106316566467285, "global_step": 186190, "epoch": 4433} {"train_loss": -7.202911376953125, "global_step": 186191, "epoch": 4433} {"train_loss": -7.16910982131958, "global_step": 186192, "epoch": 4433} {"train_loss": -7.168307781219482, "global_step": 186193, "epoch": 4433} {"train_loss": -7.265786170959473, "global_step": 186194, "epoch": 4433} {"train_loss": -7.210095405578613, "global_step": 186195, "epoch": 4433} {"train_loss": -7.118378639221191, "global_step": 186196, "epoch": 4433} {"train_loss": -7.2829694747924805, "global_step": 186197, "epoch": 4433} {"train_loss": -7.172550201416016, "global_step": 186198, "epoch": 4433} {"train_loss": -7.0662431716918945, "global_step": 186199, "epoch": 4433} {"train_loss": -7.136251449584961, "global_step": 186200, "epoch": 4433} {"train_loss": -7.220941066741943, "global_step": 186201, "epoch": 4433} {"train_loss": -6.876351356506348, "global_step": 186202, "epoch": 4433} {"train_loss": -7.0838775634765625, "global_step": 186203, "epoch": 4433} {"train_loss": -7.1199798583984375, "global_step": 186204, "epoch": 4433} {"train_loss": -7.154909610748291, "global_step": 186205, "epoch": 4433} {"train_loss": -7.116583347320557, "global_step": 186206, "epoch": 4433} {"train_loss": -7.14184045791626, "global_step": 186207, "epoch": 4433} {"train_loss": -7.128752708435059, "global_step": 186208, "epoch": 4433} {"train_loss": -7.218694686889648, "global_step": 186209, "epoch": 4433} {"train_loss": -7.1916656494140625, "global_step": 186210, "epoch": 4433} {"train_loss": -7.186094284057617, "global_step": 186211, "epoch": 4433} {"train_loss": -7.098723888397217, "global_step": 186212, "epoch": 4433} {"train_loss": -7.170446395874023, "global_step": 186213, "epoch": 4433} {"train_loss": -7.273709297180176, "global_step": 186214, "epoch": 4433} {"train_loss": -7.184836387634277, "global_step": 186215, "epoch": 4433} {"train_loss": -7.163303375244141, "global_step": 186216, "epoch": 4433} {"train_loss": -7.220333576202393, "global_step": 186217, "epoch": 4433} {"train_loss": -7.177735328674316, "global_step": 186218, "epoch": 4433} {"train_loss": -7.262177467346191, "global_step": 186219, "epoch": 4433} {"train_loss": -7.174381256103516, "global_step": 186220, "epoch": 4433} {"train_loss": -7.223641395568848, "global_step": 186221, "epoch": 4433} {"train_loss": -7.273749351501465, "global_step": 186222, "epoch": 4433} {"train_loss": -7.241858005523682, "global_step": 186223, "epoch": 4433} {"train_loss": -7.229632377624512, "global_step": 186224, "epoch": 4433} {"train_loss": -7.283049583435059, "global_step": 186225, "epoch": 4433} {"train_loss": -7.3122477531433105, "global_step": 186226, "epoch": 4433} {"train_loss": -7.180615356990269, "global_step": 186227, "epoch": 4433, "val_loss": 80644.609375} {"train_loss": -7.2672200202941895, "global_step": 186228, "epoch": 4434} {"train_loss": -7.295370578765869, "global_step": 186229, "epoch": 4434} {"train_loss": -7.19682502746582, "global_step": 186230, "epoch": 4434} {"train_loss": -7.201545715332031, "global_step": 186231, "epoch": 4434} {"train_loss": -7.234683990478516, "global_step": 186232, "epoch": 4434} {"train_loss": -7.260770320892334, "global_step": 186233, "epoch": 4434} {"train_loss": -7.2761430740356445, "global_step": 186234, "epoch": 4434} {"train_loss": -7.262949466705322, "global_step": 186235, "epoch": 4434} {"train_loss": -7.088560581207275, "global_step": 186236, "epoch": 4434} {"train_loss": -7.195594787597656, "global_step": 186237, "epoch": 4434} {"train_loss": -7.201915264129639, "global_step": 186238, "epoch": 4434} {"train_loss": -7.187854766845703, "global_step": 186239, "epoch": 4434} {"train_loss": -7.351130962371826, "global_step": 186240, "epoch": 4434} {"train_loss": -7.201785087585449, "global_step": 186241, "epoch": 4434} {"train_loss": -7.198089599609375, "global_step": 186242, "epoch": 4434} {"train_loss": -7.202571868896484, "global_step": 186243, "epoch": 4434} {"train_loss": -7.222784042358398, "global_step": 186244, "epoch": 4434} {"train_loss": -7.2308349609375, "global_step": 186245, "epoch": 4434} {"train_loss": -7.234133243560791, "global_step": 186246, "epoch": 4434} {"train_loss": -7.206086158752441, "global_step": 186247, "epoch": 4434} {"train_loss": -7.177196979522705, "global_step": 186248, "epoch": 4434} {"train_loss": -7.1320085525512695, "global_step": 186249, "epoch": 4434} {"train_loss": -7.342301368713379, "global_step": 186250, "epoch": 4434} {"train_loss": -7.2636871337890625, "global_step": 186251, "epoch": 4434} {"train_loss": -7.204061508178711, "global_step": 186252, "epoch": 4434} {"train_loss": -7.165227890014648, "global_step": 186253, "epoch": 4434} {"train_loss": -7.246603012084961, "global_step": 186254, "epoch": 4434} {"train_loss": -7.156096458435059, "global_step": 186255, "epoch": 4434} {"train_loss": -7.237760543823242, "global_step": 186256, "epoch": 4434} {"train_loss": -7.238663673400879, "global_step": 186257, "epoch": 4434} {"train_loss": -7.063250541687012, "global_step": 186258, "epoch": 4434} {"train_loss": -7.155419826507568, "global_step": 186259, "epoch": 4434} {"train_loss": -7.043489456176758, "global_step": 186260, "epoch": 4434} {"train_loss": -7.082085609436035, "global_step": 186261, "epoch": 4434} {"train_loss": -7.122494697570801, "global_step": 186262, "epoch": 4434} {"train_loss": -7.09323787689209, "global_step": 186263, "epoch": 4434} {"train_loss": -7.191420078277588, "global_step": 186264, "epoch": 4434} {"train_loss": -7.183481216430664, "global_step": 186265, "epoch": 4434} {"train_loss": -7.073765754699707, "global_step": 186266, "epoch": 4434} {"train_loss": -6.978156089782715, "global_step": 186267, "epoch": 4434} {"train_loss": -6.879674434661865, "global_step": 186268, "epoch": 4434} {"train_loss": -7.183364266440982, "global_step": 186269, "epoch": 4434, "val_loss": 80829.453125} {"train_loss": -7.03662109375, "global_step": 186270, "epoch": 4435} {"train_loss": -7.0364298820495605, "global_step": 186271, "epoch": 4435} {"train_loss": -7.177705764770508, "global_step": 186272, "epoch": 4435} {"train_loss": -6.944413661956787, "global_step": 186273, "epoch": 4435} {"train_loss": -7.07630729675293, "global_step": 186274, "epoch": 4435} {"train_loss": -6.940783500671387, "global_step": 186275, "epoch": 4435} {"train_loss": -6.975311279296875, "global_step": 186276, "epoch": 4435} {"train_loss": -7.053645133972168, "global_step": 186277, "epoch": 4435} {"train_loss": -6.867499351501465, "global_step": 186278, "epoch": 4435} {"train_loss": -7.126331806182861, "global_step": 186279, "epoch": 4435} {"train_loss": -7.098191261291504, "global_step": 186280, "epoch": 4435} {"train_loss": -7.026451587677002, "global_step": 186281, "epoch": 4435} {"train_loss": -6.966181755065918, "global_step": 186282, "epoch": 4435} {"train_loss": -7.02664852142334, "global_step": 186283, "epoch": 4435} {"train_loss": -7.123378276824951, "global_step": 186284, "epoch": 4435} {"train_loss": -7.080959320068359, "global_step": 186285, "epoch": 4435} {"train_loss": -7.086941719055176, "global_step": 186286, "epoch": 4435} {"train_loss": -7.059721946716309, "global_step": 186287, "epoch": 4435} {"train_loss": -7.007142543792725, "global_step": 186288, "epoch": 4435} {"train_loss": -7.101907730102539, "global_step": 186289, "epoch": 4435} {"train_loss": -7.216698169708252, "global_step": 186290, "epoch": 4435} {"train_loss": -7.119354248046875, "global_step": 186291, "epoch": 4435} {"train_loss": -7.192471027374268, "global_step": 186292, "epoch": 4435} {"train_loss": -7.133759498596191, "global_step": 186293, "epoch": 4435} {"train_loss": -7.055584907531738, "global_step": 186294, "epoch": 4435} {"train_loss": -7.215623378753662, "global_step": 186295, "epoch": 4435} {"train_loss": -7.1582512855529785, "global_step": 186296, "epoch": 4435} {"train_loss": -7.181094646453857, "global_step": 186297, "epoch": 4435} {"train_loss": -7.15322732925415, "global_step": 186298, "epoch": 4435} {"train_loss": -7.074872016906738, "global_step": 186299, "epoch": 4435} {"train_loss": -7.191811561584473, "global_step": 186300, "epoch": 4435} {"train_loss": -7.149483680725098, "global_step": 186301, "epoch": 4435} {"train_loss": -7.0903120040893555, "global_step": 186302, "epoch": 4435} {"train_loss": -7.1991987228393555, "global_step": 186303, "epoch": 4435} {"train_loss": -7.128931045532227, "global_step": 186304, "epoch": 4435} {"train_loss": -7.213797569274902, "global_step": 186305, "epoch": 4435} {"train_loss": -7.101876735687256, "global_step": 186306, "epoch": 4435} {"train_loss": -7.153602123260498, "global_step": 186307, "epoch": 4435} {"train_loss": -7.1404128074646, "global_step": 186308, "epoch": 4435} {"train_loss": -7.038631439208984, "global_step": 186309, "epoch": 4435} {"train_loss": -7.174933433532715, "global_step": 186310, "epoch": 4435} {"train_loss": -7.096163352330525, "global_step": 186311, "epoch": 4435, "val_loss": 80826.6484375} {"train_loss": -7.316779136657715, "global_step": 186312, "epoch": 4436} {"train_loss": -7.127529144287109, "global_step": 186313, "epoch": 4436} {"train_loss": -7.169836044311523, "global_step": 186314, "epoch": 4436} {"train_loss": -7.211208343505859, "global_step": 186315, "epoch": 4436} {"train_loss": -7.189345359802246, "global_step": 186316, "epoch": 4436} {"train_loss": -7.237817764282227, "global_step": 186317, "epoch": 4436} {"train_loss": -7.199692726135254, "global_step": 186318, "epoch": 4436} {"train_loss": -7.216770172119141, "global_step": 186319, "epoch": 4436} {"train_loss": -7.159787178039551, "global_step": 186320, "epoch": 4436} {"train_loss": -7.156531810760498, "global_step": 186321, "epoch": 4436} {"train_loss": -7.169620037078857, "global_step": 186322, "epoch": 4436} {"train_loss": -7.0378737449646, "global_step": 186323, "epoch": 4436} {"train_loss": -7.203002452850342, "global_step": 186324, "epoch": 4436} {"train_loss": -7.045083999633789, "global_step": 186325, "epoch": 4436} {"train_loss": -7.043149471282959, "global_step": 186326, "epoch": 4436} {"train_loss": -7.2516984939575195, "global_step": 186327, "epoch": 4436} {"train_loss": -7.046848297119141, "global_step": 186328, "epoch": 4436} {"train_loss": -7.099365234375, "global_step": 186329, "epoch": 4436} {"train_loss": -7.202945232391357, "global_step": 186330, "epoch": 4436} {"train_loss": -7.0611042976379395, "global_step": 186331, "epoch": 4436} {"train_loss": -7.191529273986816, "global_step": 186332, "epoch": 4436} {"train_loss": -7.090496063232422, "global_step": 186333, "epoch": 4436} {"train_loss": -6.971400260925293, "global_step": 186334, "epoch": 4436} {"train_loss": -7.1399993896484375, "global_step": 186335, "epoch": 4436} {"train_loss": -7.125816345214844, "global_step": 186336, "epoch": 4436} {"train_loss": -7.110334396362305, "global_step": 186337, "epoch": 4436} {"train_loss": -7.105960845947266, "global_step": 186338, "epoch": 4436} {"train_loss": -7.038777828216553, "global_step": 186339, "epoch": 4436} {"train_loss": -7.183605194091797, "global_step": 186340, "epoch": 4436} {"train_loss": -7.069055080413818, "global_step": 186341, "epoch": 4436} {"train_loss": -7.14171028137207, "global_step": 186342, "epoch": 4436} {"train_loss": -7.141822338104248, "global_step": 186343, "epoch": 4436} {"train_loss": -7.080395698547363, "global_step": 186344, "epoch": 4436} {"train_loss": -7.197428226470947, "global_step": 186345, "epoch": 4436} {"train_loss": -7.151571273803711, "global_step": 186346, "epoch": 4436} {"train_loss": -7.255515098571777, "global_step": 186347, "epoch": 4436} {"train_loss": -7.122650146484375, "global_step": 186348, "epoch": 4436} {"train_loss": -7.177936553955078, "global_step": 186349, "epoch": 4436} {"train_loss": -7.084586143493652, "global_step": 186350, "epoch": 4436} {"train_loss": -7.123476982116699, "global_step": 186351, "epoch": 4436} {"train_loss": -7.156306266784668, "global_step": 186352, "epoch": 4436} {"train_loss": -7.143101431074596, "global_step": 186353, "epoch": 4436, "val_loss": 80711.28125} {"train_loss": -7.024021148681641, "global_step": 186354, "epoch": 4437} {"train_loss": -7.252886772155762, "global_step": 186355, "epoch": 4437} {"train_loss": -7.144382953643799, "global_step": 186356, "epoch": 4437} {"train_loss": -7.177068710327148, "global_step": 186357, "epoch": 4437} {"train_loss": -7.320106506347656, "global_step": 186358, "epoch": 4437} {"train_loss": -7.091577529907227, "global_step": 186359, "epoch": 4437} {"train_loss": -7.103343486785889, "global_step": 186360, "epoch": 4437} {"train_loss": -7.165665149688721, "global_step": 186361, "epoch": 4437} {"train_loss": -7.131435394287109, "global_step": 186362, "epoch": 4437} {"train_loss": -7.177106857299805, "global_step": 186363, "epoch": 4437} {"train_loss": -7.227408409118652, "global_step": 186364, "epoch": 4437} {"train_loss": -7.232334136962891, "global_step": 186365, "epoch": 4437} {"train_loss": -7.157289981842041, "global_step": 186366, "epoch": 4437} {"train_loss": -7.071323871612549, "global_step": 186367, "epoch": 4437} {"train_loss": -7.274872779846191, "global_step": 186368, "epoch": 4437} {"train_loss": -7.226773262023926, "global_step": 186369, "epoch": 4437} {"train_loss": -7.050817489624023, "global_step": 186370, "epoch": 4437} {"train_loss": -7.249682903289795, "global_step": 186371, "epoch": 4437} {"train_loss": -7.194806098937988, "global_step": 186372, "epoch": 4437} {"train_loss": -7.224517822265625, "global_step": 186373, "epoch": 4437} {"train_loss": -7.218211650848389, "global_step": 186374, "epoch": 4437} {"train_loss": -7.230836868286133, "global_step": 186375, "epoch": 4437} {"train_loss": -7.093445777893066, "global_step": 186376, "epoch": 4437} {"train_loss": -7.118902683258057, "global_step": 186377, "epoch": 4437} {"train_loss": -7.201509475708008, "global_step": 186378, "epoch": 4437} {"train_loss": -7.081094741821289, "global_step": 186379, "epoch": 4437} {"train_loss": -7.0905303955078125, "global_step": 186380, "epoch": 4437} {"train_loss": -6.975292205810547, "global_step": 186381, "epoch": 4437} {"train_loss": -6.909660339355469, "global_step": 186382, "epoch": 4437} {"train_loss": -6.9117584228515625, "global_step": 186383, "epoch": 4437} {"train_loss": -7.125966548919678, "global_step": 186384, "epoch": 4437} {"train_loss": -6.8456220626831055, "global_step": 186385, "epoch": 4437} {"train_loss": -6.996866226196289, "global_step": 186386, "epoch": 4437} {"train_loss": -6.885929584503174, "global_step": 186387, "epoch": 4437} {"train_loss": -6.891387939453125, "global_step": 186388, "epoch": 4437} {"train_loss": -6.996406555175781, "global_step": 186389, "epoch": 4437} {"train_loss": -7.017213821411133, "global_step": 186390, "epoch": 4437} {"train_loss": -7.077644348144531, "global_step": 186391, "epoch": 4437} {"train_loss": -7.161099910736084, "global_step": 186392, "epoch": 4437} {"train_loss": -7.135211944580078, "global_step": 186393, "epoch": 4437} {"train_loss": -6.936417102813721, "global_step": 186394, "epoch": 4437} {"train_loss": -7.105651946294875, "global_step": 186395, "epoch": 4437, "val_loss": 81012.734375} {"train_loss": -7.17105770111084, "global_step": 186396, "epoch": 4438} {"train_loss": -7.002872467041016, "global_step": 186397, "epoch": 4438} {"train_loss": -7.082212924957275, "global_step": 186398, "epoch": 4438} {"train_loss": -6.998775959014893, "global_step": 186399, "epoch": 4438} {"train_loss": -7.027406692504883, "global_step": 186400, "epoch": 4438} {"train_loss": -7.188005447387695, "global_step": 186401, "epoch": 4438} {"train_loss": -7.146778106689453, "global_step": 186402, "epoch": 4438} {"train_loss": -7.208520889282227, "global_step": 186403, "epoch": 4438} {"train_loss": -7.156403064727783, "global_step": 186404, "epoch": 4438} {"train_loss": -7.120194911956787, "global_step": 186405, "epoch": 4438} {"train_loss": -7.145479202270508, "global_step": 186406, "epoch": 4438} {"train_loss": -7.12555456161499, "global_step": 186407, "epoch": 4438} {"train_loss": -7.174620628356934, "global_step": 186408, "epoch": 4438} {"train_loss": -7.094973087310791, "global_step": 186409, "epoch": 4438} {"train_loss": -7.247289657592773, "global_step": 186410, "epoch": 4438} {"train_loss": -7.132080078125, "global_step": 186411, "epoch": 4438} {"train_loss": -7.183318138122559, "global_step": 186412, "epoch": 4438} {"train_loss": -7.191740036010742, "global_step": 186413, "epoch": 4438} {"train_loss": -7.203865051269531, "global_step": 186414, "epoch": 4438} {"train_loss": -7.268378734588623, "global_step": 186415, "epoch": 4438} {"train_loss": -7.189772605895996, "global_step": 186416, "epoch": 4438} {"train_loss": -7.175553798675537, "global_step": 186417, "epoch": 4438} {"train_loss": -7.200709342956543, "global_step": 186418, "epoch": 4438} {"train_loss": -7.118891716003418, "global_step": 186419, "epoch": 4438} {"train_loss": -7.297124862670898, "global_step": 186420, "epoch": 4438} {"train_loss": -7.223152160644531, "global_step": 186421, "epoch": 4438} {"train_loss": -7.212428092956543, "global_step": 186422, "epoch": 4438} {"train_loss": -7.099626541137695, "global_step": 186423, "epoch": 4438} {"train_loss": -7.203168869018555, "global_step": 186424, "epoch": 4438} {"train_loss": -7.172239303588867, "global_step": 186425, "epoch": 4438} {"train_loss": -7.260169982910156, "global_step": 186426, "epoch": 4438} {"train_loss": -7.137847423553467, "global_step": 186427, "epoch": 4438} {"train_loss": -7.034187316894531, "global_step": 186428, "epoch": 4438} {"train_loss": -7.211195945739746, "global_step": 186429, "epoch": 4438} {"train_loss": -7.063260555267334, "global_step": 186430, "epoch": 4438} {"train_loss": -7.070211410522461, "global_step": 186431, "epoch": 4438} {"train_loss": -7.232953071594238, "global_step": 186432, "epoch": 4438} {"train_loss": -7.127313613891602, "global_step": 186433, "epoch": 4438} {"train_loss": -7.148340702056885, "global_step": 186434, "epoch": 4438} {"train_loss": -7.199474811553955, "global_step": 186435, "epoch": 4438} {"train_loss": -7.270462989807129, "global_step": 186436, "epoch": 4438} {"train_loss": -7.158987885429745, "global_step": 186437, "epoch": 4438, "val_loss": 80746.5546875} {"train_loss": -7.0979509353637695, "global_step": 186438, "epoch": 4439} {"train_loss": -7.057686805725098, "global_step": 186439, "epoch": 4439} {"train_loss": -7.186348915100098, "global_step": 186440, "epoch": 4439} {"train_loss": -7.174255847930908, "global_step": 186441, "epoch": 4439} {"train_loss": -7.220209121704102, "global_step": 186442, "epoch": 4439} {"train_loss": -7.192023754119873, "global_step": 186443, "epoch": 4439} {"train_loss": -7.212344169616699, "global_step": 186444, "epoch": 4439} {"train_loss": -7.261723518371582, "global_step": 186445, "epoch": 4439} {"train_loss": -7.177957534790039, "global_step": 186446, "epoch": 4439} {"train_loss": -7.250088214874268, "global_step": 186447, "epoch": 4439} {"train_loss": -7.3532280921936035, "global_step": 186448, "epoch": 4439} {"train_loss": -7.2547478675842285, "global_step": 186449, "epoch": 4439} {"train_loss": -7.201464653015137, "global_step": 186450, "epoch": 4439} {"train_loss": -7.350029945373535, "global_step": 186451, "epoch": 4439} {"train_loss": -7.281365871429443, "global_step": 186452, "epoch": 4439} {"train_loss": -7.245577812194824, "global_step": 186453, "epoch": 4439} {"train_loss": -7.245737075805664, "global_step": 186454, "epoch": 4439} {"train_loss": -7.1310715675354, "global_step": 186455, "epoch": 4439} {"train_loss": -7.198123931884766, "global_step": 186456, "epoch": 4439} {"train_loss": -7.296282768249512, "global_step": 186457, "epoch": 4439} {"train_loss": -7.247261047363281, "global_step": 186458, "epoch": 4439} {"train_loss": -7.347658157348633, "global_step": 186459, "epoch": 4439} {"train_loss": -7.1544294357299805, "global_step": 186460, "epoch": 4439} {"train_loss": -7.242665767669678, "global_step": 186461, "epoch": 4439} {"train_loss": -7.28260612487793, "global_step": 186462, "epoch": 4439} {"train_loss": -7.227405548095703, "global_step": 186463, "epoch": 4439} {"train_loss": -7.286249160766602, "global_step": 186464, "epoch": 4439} {"train_loss": -7.162341117858887, "global_step": 186465, "epoch": 4439} {"train_loss": -7.235624313354492, "global_step": 186466, "epoch": 4439} {"train_loss": -7.157374382019043, "global_step": 186467, "epoch": 4439} {"train_loss": -7.2685546875, "global_step": 186468, "epoch": 4439} {"train_loss": -7.081708908081055, "global_step": 186469, "epoch": 4439} {"train_loss": -7.086811065673828, "global_step": 186470, "epoch": 4439} {"train_loss": -7.158152103424072, "global_step": 186471, "epoch": 4439} {"train_loss": -7.141136169433594, "global_step": 186472, "epoch": 4439} {"train_loss": -7.047647953033447, "global_step": 186473, "epoch": 4439} {"train_loss": -7.146456718444824, "global_step": 186474, "epoch": 4439} {"train_loss": -7.042967796325684, "global_step": 186475, "epoch": 4439} {"train_loss": -7.150937557220459, "global_step": 186476, "epoch": 4439} {"train_loss": -7.03378438949585, "global_step": 186477, "epoch": 4439} {"train_loss": -7.1990180015563965, "global_step": 186478, "epoch": 4439} {"train_loss": -7.194551422482445, "global_step": 186479, "epoch": 4439, "val_loss": 80796.921875} {"train_loss": -7.203265190124512, "global_step": 186480, "epoch": 4440} {"train_loss": -7.213974952697754, "global_step": 186481, "epoch": 4440} {"train_loss": -7.170214653015137, "global_step": 186482, "epoch": 4440} {"train_loss": -7.104272842407227, "global_step": 186483, "epoch": 4440} {"train_loss": -7.121111869812012, "global_step": 186484, "epoch": 4440} {"train_loss": -7.2454681396484375, "global_step": 186485, "epoch": 4440} {"train_loss": -7.219407558441162, "global_step": 186486, "epoch": 4440} {"train_loss": -7.124499797821045, "global_step": 186487, "epoch": 4440} {"train_loss": -7.182792663574219, "global_step": 186488, "epoch": 4440} {"train_loss": -7.222841262817383, "global_step": 186489, "epoch": 4440} {"train_loss": -7.129729270935059, "global_step": 186490, "epoch": 4440} {"train_loss": -7.182035446166992, "global_step": 186491, "epoch": 4440} {"train_loss": -7.150779724121094, "global_step": 186492, "epoch": 4440} {"train_loss": -7.217909812927246, "global_step": 186493, "epoch": 4440} {"train_loss": -7.132794380187988, "global_step": 186494, "epoch": 4440} {"train_loss": -7.267673492431641, "global_step": 186495, "epoch": 4440} {"train_loss": -7.133044242858887, "global_step": 186496, "epoch": 4440} {"train_loss": -7.061556339263916, "global_step": 186497, "epoch": 4440} {"train_loss": -7.327118873596191, "global_step": 186498, "epoch": 4440} {"train_loss": -7.220318794250488, "global_step": 186499, "epoch": 4440} {"train_loss": -7.2905964851379395, "global_step": 186500, "epoch": 4440} {"train_loss": -7.103399276733398, "global_step": 186501, "epoch": 4440} {"train_loss": -7.148972511291504, "global_step": 186502, "epoch": 4440} {"train_loss": -7.250575065612793, "global_step": 186503, "epoch": 4440} {"train_loss": -7.223702430725098, "global_step": 186504, "epoch": 4440} {"train_loss": -7.1852946281433105, "global_step": 186505, "epoch": 4440} {"train_loss": -7.179909706115723, "global_step": 186506, "epoch": 4440} {"train_loss": -7.249741077423096, "global_step": 186507, "epoch": 4440} {"train_loss": -7.241787910461426, "global_step": 186508, "epoch": 4440} {"train_loss": -7.328441619873047, "global_step": 186509, "epoch": 4440} {"train_loss": -7.298789978027344, "global_step": 186510, "epoch": 4440} {"train_loss": -7.260795593261719, "global_step": 186511, "epoch": 4440} {"train_loss": -7.210564613342285, "global_step": 186512, "epoch": 4440} {"train_loss": -7.210604667663574, "global_step": 186513, "epoch": 4440} {"train_loss": -7.159930229187012, "global_step": 186514, "epoch": 4440} {"train_loss": -7.266523838043213, "global_step": 186515, "epoch": 4440} {"train_loss": -7.1107177734375, "global_step": 186516, "epoch": 4440} {"train_loss": -7.14732551574707, "global_step": 186517, "epoch": 4440} {"train_loss": -7.150649547576904, "global_step": 186518, "epoch": 4440} {"train_loss": -7.197098731994629, "global_step": 186519, "epoch": 4440} {"train_loss": -7.1637115478515625, "global_step": 186520, "epoch": 4440} {"train_loss": -7.196609417597453, "global_step": 186521, "epoch": 4440, "val_loss": 81097.53125} {"train_loss": -7.068431854248047, "global_step": 186522, "epoch": 4441} {"train_loss": -7.111383438110352, "global_step": 186523, "epoch": 4441} {"train_loss": -7.104877948760986, "global_step": 186524, "epoch": 4441} {"train_loss": -7.139313697814941, "global_step": 186525, "epoch": 4441} {"train_loss": -7.239305019378662, "global_step": 186526, "epoch": 4441} {"train_loss": -7.142782688140869, "global_step": 186527, "epoch": 4441} {"train_loss": -7.196719169616699, "global_step": 186528, "epoch": 4441} {"train_loss": -7.069365978240967, "global_step": 186529, "epoch": 4441} {"train_loss": -7.154362678527832, "global_step": 186530, "epoch": 4441} {"train_loss": -7.299099922180176, "global_step": 186531, "epoch": 4441} {"train_loss": -7.133678436279297, "global_step": 186532, "epoch": 4441} {"train_loss": -7.248164176940918, "global_step": 186533, "epoch": 4441} {"train_loss": -7.230842590332031, "global_step": 186534, "epoch": 4441} {"train_loss": -7.241861343383789, "global_step": 186535, "epoch": 4441} {"train_loss": -7.215048789978027, "global_step": 186536, "epoch": 4441} {"train_loss": -7.205636024475098, "global_step": 186537, "epoch": 4441} {"train_loss": -7.15098237991333, "global_step": 186538, "epoch": 4441} {"train_loss": -7.126307487487793, "global_step": 186539, "epoch": 4441} {"train_loss": -7.154077529907227, "global_step": 186540, "epoch": 4441} {"train_loss": -7.16237735748291, "global_step": 186541, "epoch": 4441} {"train_loss": -7.209942817687988, "global_step": 186542, "epoch": 4441} {"train_loss": -7.214763641357422, "global_step": 186543, "epoch": 4441} {"train_loss": -7.16350793838501, "global_step": 186544, "epoch": 4441} {"train_loss": -7.243266582489014, "global_step": 186545, "epoch": 4441} {"train_loss": -7.218402862548828, "global_step": 186546, "epoch": 4441} {"train_loss": -7.088230133056641, "global_step": 186547, "epoch": 4441} {"train_loss": -7.152531623840332, "global_step": 186548, "epoch": 4441} {"train_loss": -7.088284492492676, "global_step": 186549, "epoch": 4441} {"train_loss": -7.095439434051514, "global_step": 186550, "epoch": 4441} {"train_loss": -7.106951713562012, "global_step": 186551, "epoch": 4441} {"train_loss": -7.000586032867432, "global_step": 186552, "epoch": 4441} {"train_loss": -7.1224751472473145, "global_step": 186553, "epoch": 4441} {"train_loss": -7.2315521240234375, "global_step": 186554, "epoch": 4441} {"train_loss": -7.21073055267334, "global_step": 186555, "epoch": 4441} {"train_loss": -7.110179424285889, "global_step": 186556, "epoch": 4441} {"train_loss": -7.125479698181152, "global_step": 186557, "epoch": 4441} {"train_loss": -7.244347095489502, "global_step": 186558, "epoch": 4441} {"train_loss": -7.2021613121032715, "global_step": 186559, "epoch": 4441} {"train_loss": -7.229475498199463, "global_step": 186560, "epoch": 4441} {"train_loss": -7.150177478790283, "global_step": 186561, "epoch": 4441} {"train_loss": -7.242794036865234, "global_step": 186562, "epoch": 4441} {"train_loss": -7.167258705411639, "global_step": 186563, "epoch": 4441, "val_loss": 81146.7578125} {"train_loss": -7.22635555267334, "global_step": 186564, "epoch": 4442} {"train_loss": -7.269801139831543, "global_step": 186565, "epoch": 4442} {"train_loss": -7.166897773742676, "global_step": 186566, "epoch": 4442} {"train_loss": -7.22291374206543, "global_step": 186567, "epoch": 4442} {"train_loss": -7.19236946105957, "global_step": 186568, "epoch": 4442} {"train_loss": -7.11680793762207, "global_step": 186569, "epoch": 4442} {"train_loss": -7.198709487915039, "global_step": 186570, "epoch": 4442} {"train_loss": -7.164767265319824, "global_step": 186571, "epoch": 4442} {"train_loss": -7.23488712310791, "global_step": 186572, "epoch": 4442} {"train_loss": -7.21696138381958, "global_step": 186573, "epoch": 4442} {"train_loss": -7.207851409912109, "global_step": 186574, "epoch": 4442} {"train_loss": -7.1809892654418945, "global_step": 186575, "epoch": 4442} {"train_loss": -7.152755260467529, "global_step": 186576, "epoch": 4442} {"train_loss": -7.088227272033691, "global_step": 186577, "epoch": 4442} {"train_loss": -7.25372314453125, "global_step": 186578, "epoch": 4442} {"train_loss": -7.148184299468994, "global_step": 186579, "epoch": 4442} {"train_loss": -7.187068939208984, "global_step": 186580, "epoch": 4442} {"train_loss": -7.211704254150391, "global_step": 186581, "epoch": 4442} {"train_loss": -7.25054931640625, "global_step": 186582, "epoch": 4442} {"train_loss": -7.221532344818115, "global_step": 186583, "epoch": 4442} {"train_loss": -7.1930975914001465, "global_step": 186584, "epoch": 4442} {"train_loss": -7.162639617919922, "global_step": 186585, "epoch": 4442} {"train_loss": -7.328408241271973, "global_step": 186586, "epoch": 4442} {"train_loss": -7.228025436401367, "global_step": 186587, "epoch": 4442} {"train_loss": -7.296124458312988, "global_step": 186588, "epoch": 4442} {"train_loss": -7.209556579589844, "global_step": 186589, "epoch": 4442} {"train_loss": -7.315900802612305, "global_step": 186590, "epoch": 4442} {"train_loss": -7.229074478149414, "global_step": 186591, "epoch": 4442} {"train_loss": -7.356289386749268, "global_step": 186592, "epoch": 4442} {"train_loss": -7.3588480949401855, "global_step": 186593, "epoch": 4442} {"train_loss": -7.133199691772461, "global_step": 186594, "epoch": 4442} {"train_loss": -7.270159721374512, "global_step": 186595, "epoch": 4442} {"train_loss": -7.29401969909668, "global_step": 186596, "epoch": 4442} {"train_loss": -7.245190143585205, "global_step": 186597, "epoch": 4442} {"train_loss": -7.320071220397949, "global_step": 186598, "epoch": 4442} {"train_loss": -7.13368034362793, "global_step": 186599, "epoch": 4442} {"train_loss": -7.225980281829834, "global_step": 186600, "epoch": 4442} {"train_loss": -7.140632629394531, "global_step": 186601, "epoch": 4442} {"train_loss": -7.210319995880127, "global_step": 186602, "epoch": 4442} {"train_loss": -7.157026290893555, "global_step": 186603, "epoch": 4442} {"train_loss": -7.103215217590332, "global_step": 186604, "epoch": 4442} {"train_loss": -7.215327489943731, "global_step": 186605, "epoch": 4442, "val_loss": 80909.5078125} {"train_loss": -7.091377258300781, "global_step": 186606, "epoch": 4443} {"train_loss": -7.117947578430176, "global_step": 186607, "epoch": 4443} {"train_loss": -7.191458702087402, "global_step": 186608, "epoch": 4443} {"train_loss": -7.130297660827637, "global_step": 186609, "epoch": 4443} {"train_loss": -7.189473628997803, "global_step": 186610, "epoch": 4443} {"train_loss": -7.20387077331543, "global_step": 186611, "epoch": 4443} {"train_loss": -7.1574602127075195, "global_step": 186612, "epoch": 4443} {"train_loss": -7.227939605712891, "global_step": 186613, "epoch": 4443} {"train_loss": -7.137216567993164, "global_step": 186614, "epoch": 4443} {"train_loss": -7.009117126464844, "global_step": 186615, "epoch": 4443} {"train_loss": -7.166647911071777, "global_step": 186616, "epoch": 4443} {"train_loss": -7.105978012084961, "global_step": 186617, "epoch": 4443} {"train_loss": -7.000457286834717, "global_step": 186618, "epoch": 4443} {"train_loss": -7.131818771362305, "global_step": 186619, "epoch": 4443} {"train_loss": -7.123868942260742, "global_step": 186620, "epoch": 4443} {"train_loss": -7.24153995513916, "global_step": 186621, "epoch": 4443} {"train_loss": -7.055605411529541, "global_step": 186622, "epoch": 4443} {"train_loss": -7.036823749542236, "global_step": 186623, "epoch": 4443} {"train_loss": -7.0834736824035645, "global_step": 186624, "epoch": 4443} {"train_loss": -7.119147777557373, "global_step": 186625, "epoch": 4443} {"train_loss": -7.022873878479004, "global_step": 186626, "epoch": 4443} {"train_loss": -7.092028617858887, "global_step": 186627, "epoch": 4443} {"train_loss": -7.1908464431762695, "global_step": 186628, "epoch": 4443} {"train_loss": -7.13685417175293, "global_step": 186629, "epoch": 4443} {"train_loss": -7.060546875, "global_step": 186630, "epoch": 4443} {"train_loss": -7.153408527374268, "global_step": 186631, "epoch": 4443} {"train_loss": -7.351372718811035, "global_step": 186632, "epoch": 4443} {"train_loss": -7.0319108963012695, "global_step": 186633, "epoch": 4443} {"train_loss": -7.129339218139648, "global_step": 186634, "epoch": 4443} {"train_loss": -7.150289535522461, "global_step": 186635, "epoch": 4443} {"train_loss": -7.032426357269287, "global_step": 186636, "epoch": 4443} {"train_loss": -7.22648811340332, "global_step": 186637, "epoch": 4443} {"train_loss": -7.148917198181152, "global_step": 186638, "epoch": 4443} {"train_loss": -7.020485877990723, "global_step": 186639, "epoch": 4443} {"train_loss": -7.079288959503174, "global_step": 186640, "epoch": 4443} {"train_loss": -7.146391868591309, "global_step": 186641, "epoch": 4443} {"train_loss": -7.042879104614258, "global_step": 186642, "epoch": 4443} {"train_loss": -7.097706317901611, "global_step": 186643, "epoch": 4443} {"train_loss": -7.144258975982666, "global_step": 186644, "epoch": 4443} {"train_loss": -7.025777816772461, "global_step": 186645, "epoch": 4443} {"train_loss": -7.14194393157959, "global_step": 186646, "epoch": 4443} {"train_loss": -7.122541393552508, "global_step": 186647, "epoch": 4443, "val_loss": 81029.328125} {"train_loss": -7.1191864013671875, "global_step": 186648, "epoch": 4444} {"train_loss": -7.061014175415039, "global_step": 186649, "epoch": 4444} {"train_loss": -7.304660797119141, "global_step": 186650, "epoch": 4444} {"train_loss": -7.151194095611572, "global_step": 186651, "epoch": 4444} {"train_loss": -7.100803375244141, "global_step": 186652, "epoch": 4444} {"train_loss": -7.2466936111450195, "global_step": 186653, "epoch": 4444} {"train_loss": -7.134016036987305, "global_step": 186654, "epoch": 4444} {"train_loss": -7.119779586791992, "global_step": 186655, "epoch": 4444} {"train_loss": -7.191301345825195, "global_step": 186656, "epoch": 4444} {"train_loss": -7.168436050415039, "global_step": 186657, "epoch": 4444} {"train_loss": -7.233733654022217, "global_step": 186658, "epoch": 4444} {"train_loss": -7.249207496643066, "global_step": 186659, "epoch": 4444} {"train_loss": -7.235508918762207, "global_step": 186660, "epoch": 4444} {"train_loss": -7.262132167816162, "global_step": 186661, "epoch": 4444} {"train_loss": -7.235320568084717, "global_step": 186662, "epoch": 4444} {"train_loss": -7.277914047241211, "global_step": 186663, "epoch": 4444} {"train_loss": -7.243142127990723, "global_step": 186664, "epoch": 4444} {"train_loss": -7.062474727630615, "global_step": 186665, "epoch": 4444} {"train_loss": -7.146797180175781, "global_step": 186666, "epoch": 4444} {"train_loss": -7.200814247131348, "global_step": 186667, "epoch": 4444} {"train_loss": -7.093764305114746, "global_step": 186668, "epoch": 4444} {"train_loss": -7.004027843475342, "global_step": 186669, "epoch": 4444} {"train_loss": -7.246952056884766, "global_step": 186670, "epoch": 4444} {"train_loss": -7.132209777832031, "global_step": 186671, "epoch": 4444} {"train_loss": -7.2026166915893555, "global_step": 186672, "epoch": 4444} {"train_loss": -7.273838043212891, "global_step": 186673, "epoch": 4444} {"train_loss": -7.1613874435424805, "global_step": 186674, "epoch": 4444} {"train_loss": -7.23390007019043, "global_step": 186675, "epoch": 4444} {"train_loss": -7.247196197509766, "global_step": 186676, "epoch": 4444} {"train_loss": -7.215095520019531, "global_step": 186677, "epoch": 4444} {"train_loss": -7.2275896072387695, "global_step": 186678, "epoch": 4444} {"train_loss": -7.172039985656738, "global_step": 186679, "epoch": 4444} {"train_loss": -7.279247283935547, "global_step": 186680, "epoch": 4444} {"train_loss": -7.208049774169922, "global_step": 186681, "epoch": 4444} {"train_loss": -7.199333190917969, "global_step": 186682, "epoch": 4444} {"train_loss": -7.216640949249268, "global_step": 186683, "epoch": 4444} {"train_loss": -7.1231608390808105, "global_step": 186684, "epoch": 4444} {"train_loss": -7.334463119506836, "global_step": 186685, "epoch": 4444} {"train_loss": -7.18649435043335, "global_step": 186686, "epoch": 4444} {"train_loss": -7.226605415344238, "global_step": 186687, "epoch": 4444} {"train_loss": -7.348024368286133, "global_step": 186688, "epoch": 4444} {"train_loss": -7.195603995096116, "global_step": 186689, "epoch": 4444, "val_loss": 80727.2265625} {"train_loss": -7.096019744873047, "global_step": 186690, "epoch": 4445} {"train_loss": -7.217205047607422, "global_step": 186691, "epoch": 4445} {"train_loss": -7.230453014373779, "global_step": 186692, "epoch": 4445} {"train_loss": -7.343545436859131, "global_step": 186693, "epoch": 4445} {"train_loss": -7.2379961013793945, "global_step": 186694, "epoch": 4445} {"train_loss": -7.26981258392334, "global_step": 186695, "epoch": 4445} {"train_loss": -7.181417465209961, "global_step": 186696, "epoch": 4445} {"train_loss": -7.291230201721191, "global_step": 186697, "epoch": 4445} {"train_loss": -7.205852508544922, "global_step": 186698, "epoch": 4445} {"train_loss": -7.070253849029541, "global_step": 186699, "epoch": 4445} {"train_loss": -7.222343921661377, "global_step": 186700, "epoch": 4445} {"train_loss": -7.187143325805664, "global_step": 186701, "epoch": 4445} {"train_loss": -7.105319976806641, "global_step": 186702, "epoch": 4445} {"train_loss": -7.254078388214111, "global_step": 186703, "epoch": 4445} {"train_loss": -7.250602722167969, "global_step": 186704, "epoch": 4445} {"train_loss": -7.2512335777282715, "global_step": 186705, "epoch": 4445} {"train_loss": -7.060147285461426, "global_step": 186706, "epoch": 4445} {"train_loss": -7.159428596496582, "global_step": 186707, "epoch": 4445} {"train_loss": -7.172026634216309, "global_step": 186708, "epoch": 4445} {"train_loss": -7.147677421569824, "global_step": 186709, "epoch": 4445} {"train_loss": -7.12540340423584, "global_step": 186710, "epoch": 4445} {"train_loss": -7.126128673553467, "global_step": 186711, "epoch": 4445} {"train_loss": -7.135569095611572, "global_step": 186712, "epoch": 4445} {"train_loss": -7.218297004699707, "global_step": 186713, "epoch": 4445} {"train_loss": -7.157586097717285, "global_step": 186714, "epoch": 4445} {"train_loss": -7.12166690826416, "global_step": 186715, "epoch": 4445} {"train_loss": -7.190738677978516, "global_step": 186716, "epoch": 4445} {"train_loss": -7.181851863861084, "global_step": 186717, "epoch": 4445} {"train_loss": -7.20412015914917, "global_step": 186718, "epoch": 4445} {"train_loss": -7.028868198394775, "global_step": 186719, "epoch": 4445} {"train_loss": -7.121425628662109, "global_step": 186720, "epoch": 4445} {"train_loss": -7.153164863586426, "global_step": 186721, "epoch": 4445} {"train_loss": -7.09072208404541, "global_step": 186722, "epoch": 4445} {"train_loss": -7.206223487854004, "global_step": 186723, "epoch": 4445} {"train_loss": -7.205034255981445, "global_step": 186724, "epoch": 4445} {"train_loss": -7.234713554382324, "global_step": 186725, "epoch": 4445} {"train_loss": -7.262796401977539, "global_step": 186726, "epoch": 4445} {"train_loss": -7.1610612869262695, "global_step": 186727, "epoch": 4445} {"train_loss": -7.123443126678467, "global_step": 186728, "epoch": 4445} {"train_loss": -7.304027080535889, "global_step": 186729, "epoch": 4445} {"train_loss": -7.1158246994018555, "global_step": 186730, "epoch": 4445} {"train_loss": -7.178298870722453, "global_step": 186731, "epoch": 4445, "val_loss": 80680.046875} {"train_loss": -7.160600662231445, "global_step": 186732, "epoch": 4446} {"train_loss": -7.10256290435791, "global_step": 186733, "epoch": 4446} {"train_loss": -7.269491195678711, "global_step": 186734, "epoch": 4446} {"train_loss": -7.111252307891846, "global_step": 186735, "epoch": 4446} {"train_loss": -6.976292610168457, "global_step": 186736, "epoch": 4446} {"train_loss": -7.185798168182373, "global_step": 186737, "epoch": 4446} {"train_loss": -7.267383575439453, "global_step": 186738, "epoch": 4446} {"train_loss": -7.08928918838501, "global_step": 186739, "epoch": 4446} {"train_loss": -7.150810241699219, "global_step": 186740, "epoch": 4446} {"train_loss": -6.983129024505615, "global_step": 186741, "epoch": 4446} {"train_loss": -6.9540791511535645, "global_step": 186742, "epoch": 4446} {"train_loss": -7.177340507507324, "global_step": 186743, "epoch": 4446} {"train_loss": -7.016520977020264, "global_step": 186744, "epoch": 4446} {"train_loss": -7.1214141845703125, "global_step": 186745, "epoch": 4446} {"train_loss": -6.8394775390625, "global_step": 186746, "epoch": 4446} {"train_loss": -7.201748371124268, "global_step": 186747, "epoch": 4446} {"train_loss": -7.048465251922607, "global_step": 186748, "epoch": 4446} {"train_loss": -7.2542266845703125, "global_step": 186749, "epoch": 4446} {"train_loss": -6.926146507263184, "global_step": 186750, "epoch": 4446} {"train_loss": -7.123711585998535, "global_step": 186751, "epoch": 4446} {"train_loss": -7.024486064910889, "global_step": 186752, "epoch": 4446} {"train_loss": -7.136048793792725, "global_step": 186753, "epoch": 4446} {"train_loss": -6.988048076629639, "global_step": 186754, "epoch": 4446} {"train_loss": -7.151088714599609, "global_step": 186755, "epoch": 4446} {"train_loss": -7.03489875793457, "global_step": 186756, "epoch": 4446} {"train_loss": -7.171885967254639, "global_step": 186757, "epoch": 4446} {"train_loss": -7.011665344238281, "global_step": 186758, "epoch": 4446} {"train_loss": -6.992771148681641, "global_step": 186759, "epoch": 4446} {"train_loss": -7.1016387939453125, "global_step": 186760, "epoch": 4446} {"train_loss": -6.947527885437012, "global_step": 186761, "epoch": 4446} {"train_loss": -7.130161285400391, "global_step": 186762, "epoch": 4446} {"train_loss": -7.178131580352783, "global_step": 186763, "epoch": 4446} {"train_loss": -6.969204425811768, "global_step": 186764, "epoch": 4446} {"train_loss": -6.988880157470703, "global_step": 186765, "epoch": 4446} {"train_loss": -7.23435115814209, "global_step": 186766, "epoch": 4446} {"train_loss": -7.098817348480225, "global_step": 186767, "epoch": 4446} {"train_loss": -7.179088592529297, "global_step": 186768, "epoch": 4446} {"train_loss": -7.1752824783325195, "global_step": 186769, "epoch": 4446} {"train_loss": -7.189294815063477, "global_step": 186770, "epoch": 4446} {"train_loss": -7.078678607940674, "global_step": 186771, "epoch": 4446} {"train_loss": -7.207040786743164, "global_step": 186772, "epoch": 4446} {"train_loss": -7.0945212841033936, "global_step": 186773, "epoch": 4446, "val_loss": 80789.40625} {"train_loss": -7.177403450012207, "global_step": 186774, "epoch": 4447} {"train_loss": -7.022258758544922, "global_step": 186775, "epoch": 4447} {"train_loss": -7.070469856262207, "global_step": 186776, "epoch": 4447} {"train_loss": -7.106117248535156, "global_step": 186777, "epoch": 4447} {"train_loss": -7.082533836364746, "global_step": 186778, "epoch": 4447} {"train_loss": -7.157650947570801, "global_step": 186779, "epoch": 4447} {"train_loss": -7.216794490814209, "global_step": 186780, "epoch": 4447} {"train_loss": -7.115350246429443, "global_step": 186781, "epoch": 4447} {"train_loss": -7.1165666580200195, "global_step": 186782, "epoch": 4447} {"train_loss": -7.029283046722412, "global_step": 186783, "epoch": 4447} {"train_loss": -7.228228569030762, "global_step": 186784, "epoch": 4447} {"train_loss": -7.1352152824401855, "global_step": 186785, "epoch": 4447} {"train_loss": -7.167426586151123, "global_step": 186786, "epoch": 4447} {"train_loss": -7.208595275878906, "global_step": 186787, "epoch": 4447} {"train_loss": -7.089567184448242, "global_step": 186788, "epoch": 4447} {"train_loss": -7.172530174255371, "global_step": 186789, "epoch": 4447} {"train_loss": -7.082440376281738, "global_step": 186790, "epoch": 4447} {"train_loss": -7.178619384765625, "global_step": 186791, "epoch": 4447} {"train_loss": -7.193268775939941, "global_step": 186792, "epoch": 4447} {"train_loss": -7.086610317230225, "global_step": 186793, "epoch": 4447} {"train_loss": -7.2430219650268555, "global_step": 186794, "epoch": 4447} {"train_loss": -7.09759521484375, "global_step": 186795, "epoch": 4447} {"train_loss": -7.259744167327881, "global_step": 186796, "epoch": 4447} {"train_loss": -7.105599403381348, "global_step": 186797, "epoch": 4447} {"train_loss": -7.164958477020264, "global_step": 186798, "epoch": 4447} {"train_loss": -7.1145100593566895, "global_step": 186799, "epoch": 4447} {"train_loss": -7.255926132202148, "global_step": 186800, "epoch": 4447} {"train_loss": -7.19815731048584, "global_step": 186801, "epoch": 4447} {"train_loss": -7.1834821701049805, "global_step": 186802, "epoch": 4447} {"train_loss": -7.223348617553711, "global_step": 186803, "epoch": 4447} {"train_loss": -7.1449174880981445, "global_step": 186804, "epoch": 4447} {"train_loss": -7.206439018249512, "global_step": 186805, "epoch": 4447} {"train_loss": -7.18870210647583, "global_step": 186806, "epoch": 4447} {"train_loss": -7.159173965454102, "global_step": 186807, "epoch": 4447} {"train_loss": -7.222891807556152, "global_step": 186808, "epoch": 4447} {"train_loss": -7.285346984863281, "global_step": 186809, "epoch": 4447} {"train_loss": -7.1063551902771, "global_step": 186810, "epoch": 4447} {"train_loss": -7.2368268966674805, "global_step": 186811, "epoch": 4447} {"train_loss": -7.29733943939209, "global_step": 186812, "epoch": 4447} {"train_loss": -7.188360214233398, "global_step": 186813, "epoch": 4447} {"train_loss": -7.228362083435059, "global_step": 186814, "epoch": 4447} {"train_loss": -7.166159266517276, "global_step": 186815, "epoch": 4447, "val_loss": 80723.0} {"train_loss": -7.1405205726623535, "global_step": 186816, "epoch": 4448} {"train_loss": -7.27622127532959, "global_step": 186817, "epoch": 4448} {"train_loss": -7.298557281494141, "global_step": 186818, "epoch": 4448} {"train_loss": -7.126199245452881, "global_step": 186819, "epoch": 4448} {"train_loss": -7.286418914794922, "global_step": 186820, "epoch": 4448} {"train_loss": -7.222197532653809, "global_step": 186821, "epoch": 4448} {"train_loss": -7.25270414352417, "global_step": 186822, "epoch": 4448} {"train_loss": -7.1375651359558105, "global_step": 186823, "epoch": 4448} {"train_loss": -7.233071327209473, "global_step": 186824, "epoch": 4448} {"train_loss": -7.196005821228027, "global_step": 186825, "epoch": 4448} {"train_loss": -7.24674129486084, "global_step": 186826, "epoch": 4448} {"train_loss": -7.210526466369629, "global_step": 186827, "epoch": 4448} {"train_loss": -7.301421165466309, "global_step": 186828, "epoch": 4448} {"train_loss": -7.206151008605957, "global_step": 186829, "epoch": 4448} {"train_loss": -7.294495582580566, "global_step": 186830, "epoch": 4448} {"train_loss": -7.254488945007324, "global_step": 186831, "epoch": 4448} {"train_loss": -7.247845649719238, "global_step": 186832, "epoch": 4448} {"train_loss": -7.19539737701416, "global_step": 186833, "epoch": 4448} {"train_loss": -7.241878986358643, "global_step": 186834, "epoch": 4448} {"train_loss": -7.3067450523376465, "global_step": 186835, "epoch": 4448} {"train_loss": -7.338980674743652, "global_step": 186836, "epoch": 4448} {"train_loss": -7.274058818817139, "global_step": 186837, "epoch": 4448} {"train_loss": -7.224917888641357, "global_step": 186838, "epoch": 4448} {"train_loss": -7.260128498077393, "global_step": 186839, "epoch": 4448} {"train_loss": -7.289364814758301, "global_step": 186840, "epoch": 4448} {"train_loss": -7.2996721267700195, "global_step": 186841, "epoch": 4448} {"train_loss": -7.267801284790039, "global_step": 186842, "epoch": 4448} {"train_loss": -7.2984819412231445, "global_step": 186843, "epoch": 4448} {"train_loss": -7.232707977294922, "global_step": 186844, "epoch": 4448} {"train_loss": -7.306723117828369, "global_step": 186845, "epoch": 4448} {"train_loss": -7.132350444793701, "global_step": 186846, "epoch": 4448} {"train_loss": -7.132610321044922, "global_step": 186847, "epoch": 4448} {"train_loss": -7.18698787689209, "global_step": 186848, "epoch": 4448} {"train_loss": -7.209609031677246, "global_step": 186849, "epoch": 4448} {"train_loss": -7.256959915161133, "global_step": 186850, "epoch": 4448} {"train_loss": -7.11403226852417, "global_step": 186851, "epoch": 4448} {"train_loss": -7.23889684677124, "global_step": 186852, "epoch": 4448} {"train_loss": -7.121455669403076, "global_step": 186853, "epoch": 4448} {"train_loss": -7.181750774383545, "global_step": 186854, "epoch": 4448} {"train_loss": -7.107168197631836, "global_step": 186855, "epoch": 4448} {"train_loss": -7.040610313415527, "global_step": 186856, "epoch": 4448} {"train_loss": -7.224796227046421, "global_step": 186857, "epoch": 4448, "val_loss": 80881.546875} {"train_loss": -7.1740264892578125, "global_step": 186858, "epoch": 4449} {"train_loss": -7.073855400085449, "global_step": 186859, "epoch": 4449} {"train_loss": -7.179728984832764, "global_step": 186860, "epoch": 4449} {"train_loss": -7.232005596160889, "global_step": 186861, "epoch": 4449} {"train_loss": -7.218367576599121, "global_step": 186862, "epoch": 4449} {"train_loss": -7.182368278503418, "global_step": 186863, "epoch": 4449} {"train_loss": -7.255975723266602, "global_step": 186864, "epoch": 4449} {"train_loss": -7.288066864013672, "global_step": 186865, "epoch": 4449} {"train_loss": -7.143165111541748, "global_step": 186866, "epoch": 4449} {"train_loss": -7.1576738357543945, "global_step": 186867, "epoch": 4449} {"train_loss": -7.299820423126221, "global_step": 186868, "epoch": 4449} {"train_loss": -7.176527976989746, "global_step": 186869, "epoch": 4449} {"train_loss": -7.207335948944092, "global_step": 186870, "epoch": 4449} {"train_loss": -7.148739814758301, "global_step": 186871, "epoch": 4449} {"train_loss": -7.1882123947143555, "global_step": 186872, "epoch": 4449} {"train_loss": -7.083771228790283, "global_step": 186873, "epoch": 4449} {"train_loss": -7.137479782104492, "global_step": 186874, "epoch": 4449} {"train_loss": -7.176303863525391, "global_step": 186875, "epoch": 4449} {"train_loss": -7.095843315124512, "global_step": 186876, "epoch": 4449} {"train_loss": -7.122544288635254, "global_step": 186877, "epoch": 4449} {"train_loss": -7.181039810180664, "global_step": 186878, "epoch": 4449} {"train_loss": -7.1743011474609375, "global_step": 186879, "epoch": 4449} {"train_loss": -6.943940162658691, "global_step": 186880, "epoch": 4449} {"train_loss": -7.157184600830078, "global_step": 186881, "epoch": 4449} {"train_loss": -7.194244384765625, "global_step": 186882, "epoch": 4449} {"train_loss": -7.156527519226074, "global_step": 186883, "epoch": 4449} {"train_loss": -7.178118705749512, "global_step": 186884, "epoch": 4449} {"train_loss": -7.129156112670898, "global_step": 186885, "epoch": 4449} {"train_loss": -7.041983604431152, "global_step": 186886, "epoch": 4449} {"train_loss": -7.090075492858887, "global_step": 186887, "epoch": 4449} {"train_loss": -7.078058242797852, "global_step": 186888, "epoch": 4449} {"train_loss": -7.093898296356201, "global_step": 186889, "epoch": 4449} {"train_loss": -7.1284685134887695, "global_step": 186890, "epoch": 4449} {"train_loss": -7.092221260070801, "global_step": 186891, "epoch": 4449} {"train_loss": -7.144717216491699, "global_step": 186892, "epoch": 4449} {"train_loss": -7.04705810546875, "global_step": 186893, "epoch": 4449} {"train_loss": -7.118005752563477, "global_step": 186894, "epoch": 4449} {"train_loss": -7.276332855224609, "global_step": 186895, "epoch": 4449} {"train_loss": -7.02754020690918, "global_step": 186896, "epoch": 4449} {"train_loss": -7.211406707763672, "global_step": 186897, "epoch": 4449} {"train_loss": -7.20102071762085, "global_step": 186898, "epoch": 4449} {"train_loss": -7.15055911881583, "global_step": 186899, "epoch": 4449, "val_loss": 80777.8125} {"train_loss": -7.199626922607422, "global_step": 186900, "epoch": 4450} {"train_loss": -7.174055099487305, "global_step": 186901, "epoch": 4450} {"train_loss": -7.130678176879883, "global_step": 186902, "epoch": 4450} {"train_loss": -7.111863136291504, "global_step": 186903, "epoch": 4450} {"train_loss": -7.1554765701293945, "global_step": 186904, "epoch": 4450} {"train_loss": -7.070749282836914, "global_step": 186905, "epoch": 4450} {"train_loss": -7.165778160095215, "global_step": 186906, "epoch": 4450} {"train_loss": -7.247295379638672, "global_step": 186907, "epoch": 4450} {"train_loss": -7.158316612243652, "global_step": 186908, "epoch": 4450} {"train_loss": -7.196800708770752, "global_step": 186909, "epoch": 4450} {"train_loss": -7.1596784591674805, "global_step": 186910, "epoch": 4450} {"train_loss": -7.173543453216553, "global_step": 186911, "epoch": 4450} {"train_loss": -7.114223957061768, "global_step": 186912, "epoch": 4450} {"train_loss": -7.104920387268066, "global_step": 186913, "epoch": 4450} {"train_loss": -7.204885482788086, "global_step": 186914, "epoch": 4450} {"train_loss": -7.1637983322143555, "global_step": 186915, "epoch": 4450} {"train_loss": -7.245632171630859, "global_step": 186916, "epoch": 4450} {"train_loss": -7.231448173522949, "global_step": 186917, "epoch": 4450} {"train_loss": -7.261133193969727, "global_step": 186918, "epoch": 4450} {"train_loss": -7.087510585784912, "global_step": 186919, "epoch": 4450} {"train_loss": -7.125344276428223, "global_step": 186920, "epoch": 4450} {"train_loss": -7.236026763916016, "global_step": 186921, "epoch": 4450} {"train_loss": -7.17095947265625, "global_step": 186922, "epoch": 4450} {"train_loss": -7.255857944488525, "global_step": 186923, "epoch": 4450} {"train_loss": -7.21473503112793, "global_step": 186924, "epoch": 4450} {"train_loss": -7.156454086303711, "global_step": 186925, "epoch": 4450} {"train_loss": -7.232419967651367, "global_step": 186926, "epoch": 4450} {"train_loss": -7.149809837341309, "global_step": 186927, "epoch": 4450} {"train_loss": -7.232369422912598, "global_step": 186928, "epoch": 4450} {"train_loss": -7.213353633880615, "global_step": 186929, "epoch": 4450} {"train_loss": -7.1952104568481445, "global_step": 186930, "epoch": 4450} {"train_loss": -7.289425849914551, "global_step": 186931, "epoch": 4450} {"train_loss": -7.3112335205078125, "global_step": 186932, "epoch": 4450} {"train_loss": -7.189511299133301, "global_step": 186933, "epoch": 4450} {"train_loss": -7.323263168334961, "global_step": 186934, "epoch": 4450} {"train_loss": -7.205401420593262, "global_step": 186935, "epoch": 4450} {"train_loss": -7.154877185821533, "global_step": 186936, "epoch": 4450} {"train_loss": -7.183082580566406, "global_step": 186937, "epoch": 4450} {"train_loss": -7.169311046600342, "global_step": 186938, "epoch": 4450} {"train_loss": -7.1896562576293945, "global_step": 186939, "epoch": 4450} {"train_loss": -7.226008415222168, "global_step": 186940, "epoch": 4450} {"train_loss": -7.188730762118385, "global_step": 186941, "epoch": 4450, "train/sim_max_reward_0": 0.9133320138114007, "train/sim_max_reward_1": 0.9870185395999823, "train/sim_max_reward_2": 0.4647298386578739, "train/sim_max_reward_3": 0.5715663653461739, "train/sim_max_reward_4": 0.8863130512743271, "train/sim_max_reward_5": 0.5825549369815849, "test/sim_max_reward_4500000": 0.9794342546870153, "test/sim_max_reward_4500001": 0.9814792547443499, "test/sim_max_reward_4500002": 0.9852619086395121, "test/sim_max_reward_4500003": 0.16612352843893619, "test/sim_max_reward_4500004": 0.11021855472620881, "test/sim_max_reward_4500005": 0.48343328096792043, "test/sim_max_reward_4500006": 0.9609285662857632, "test/sim_max_reward_4500007": 0.9270713516605376, "test/sim_max_reward_4500008": 0.9906589486916179, "test/sim_max_reward_4500009": 0.05333894837771452, "test/sim_max_reward_4500010": 0.08493073273961133, "test/sim_max_reward_4500011": 0.9326868069243434, "test/sim_max_reward_4500012": 0.9654033437175887, "test/sim_max_reward_4500013": 0.006852391729544142, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.9503275860424824, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.017473235069328043, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.9529606327016632, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 1.0, "test/sim_max_reward_4500022": 0.4340541490112706, "test/sim_max_reward_4500023": 0.635001799126707, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9191101836930274, "test/sim_max_reward_4500026": 0.8053198858303555, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.05083789017917047, "test/sim_max_reward_4500030": 0.9902732382911751, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9943929985913591, "test/sim_max_reward_4500034": 0.9538933810430051, "test/sim_max_reward_4500035": 0.9801243215522291, "test/sim_max_reward_4500036": 0.9142594665948673, "test/sim_max_reward_4500037": 0.7972173523947577, "test/sim_max_reward_4500038": 0.32590587388182013, "test/sim_max_reward_4500039": 1.0, "test/sim_max_reward_4500040": 0.965595747364882, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.054824192968281046, "test/sim_max_reward_4500043": 0.6592228589713929, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9461429562518882, "test/sim_max_reward_4500046": 0.18331113643139585, "test/sim_max_reward_4500047": 0.9460128060443717, "test/sim_max_reward_4500048": 1.0, "test/sim_max_reward_4500049": 0.8897097541680798, "train/mean_score": 0.7342524576118904, "test/mean_score": 0.6249204885424718, "val_loss": 80720.59375} {"train_loss": -7.142034530639648, "global_step": 186942, "epoch": 4451} {"train_loss": -7.170544147491455, "global_step": 186943, "epoch": 4451} {"train_loss": -7.207535743713379, "global_step": 186944, "epoch": 4451} {"train_loss": -7.2567548751831055, "global_step": 186945, "epoch": 4451} {"train_loss": -7.198699951171875, "global_step": 186946, "epoch": 4451} {"train_loss": -7.287441730499268, "global_step": 186947, "epoch": 4451} {"train_loss": -7.16745662689209, "global_step": 186948, "epoch": 4451} {"train_loss": -7.145235061645508, "global_step": 186949, "epoch": 4451} {"train_loss": -7.127647399902344, "global_step": 186950, "epoch": 4451} {"train_loss": -7.269697189331055, "global_step": 186951, "epoch": 4451} {"train_loss": -7.254768371582031, "global_step": 186952, "epoch": 4451} {"train_loss": -7.123478889465332, "global_step": 186953, "epoch": 4451} {"train_loss": -7.100944995880127, "global_step": 186954, "epoch": 4451} {"train_loss": -6.99827766418457, "global_step": 186955, "epoch": 4451} {"train_loss": -7.191625595092773, "global_step": 186956, "epoch": 4451} {"train_loss": -7.183426856994629, "global_step": 186957, "epoch": 4451} {"train_loss": -7.128169536590576, "global_step": 186958, "epoch": 4451} {"train_loss": -7.184165954589844, "global_step": 186959, "epoch": 4451} {"train_loss": -7.065811634063721, "global_step": 186960, "epoch": 4451} {"train_loss": -7.097386360168457, "global_step": 186961, "epoch": 4451} {"train_loss": -7.049542427062988, "global_step": 186962, "epoch": 4451} {"train_loss": -7.14022159576416, "global_step": 186963, "epoch": 4451} {"train_loss": -7.238566875457764, "global_step": 186964, "epoch": 4451} {"train_loss": -7.093626976013184, "global_step": 186965, "epoch": 4451} {"train_loss": -7.157695770263672, "global_step": 186966, "epoch": 4451} {"train_loss": -7.123777389526367, "global_step": 186967, "epoch": 4451} {"train_loss": -7.132791996002197, "global_step": 186968, "epoch": 4451} {"train_loss": -7.183435440063477, "global_step": 186969, "epoch": 4451} {"train_loss": -7.081398963928223, "global_step": 186970, "epoch": 4451} {"train_loss": -7.130609512329102, "global_step": 186971, "epoch": 4451} {"train_loss": -7.02941370010376, "global_step": 186972, "epoch": 4451} {"train_loss": -7.0642595291137695, "global_step": 186973, "epoch": 4451} {"train_loss": -7.139960289001465, "global_step": 186974, "epoch": 4451} {"train_loss": -7.184473991394043, "global_step": 186975, "epoch": 4451} {"train_loss": -7.134632110595703, "global_step": 186976, "epoch": 4451} {"train_loss": -7.138053894042969, "global_step": 186977, "epoch": 4451} {"train_loss": -7.248196601867676, "global_step": 186978, "epoch": 4451} {"train_loss": -7.117640495300293, "global_step": 186979, "epoch": 4451} {"train_loss": -7.062685489654541, "global_step": 186980, "epoch": 4451} {"train_loss": -7.229452133178711, "global_step": 186981, "epoch": 4451} {"train_loss": -7.010660171508789, "global_step": 186982, "epoch": 4451} {"train_loss": -7.1466250987279984, "global_step": 186983, "epoch": 4451, "val_loss": 80937.9609375} {"train_loss": -7.048101425170898, "global_step": 186984, "epoch": 4452} {"train_loss": -7.144235610961914, "global_step": 186985, "epoch": 4452} {"train_loss": -7.106315612792969, "global_step": 186986, "epoch": 4452} {"train_loss": -7.17744255065918, "global_step": 186987, "epoch": 4452} {"train_loss": -7.135617256164551, "global_step": 186988, "epoch": 4452} {"train_loss": -7.127462863922119, "global_step": 186989, "epoch": 4452} {"train_loss": -7.257685661315918, "global_step": 186990, "epoch": 4452} {"train_loss": -7.231057167053223, "global_step": 186991, "epoch": 4452} {"train_loss": -7.231878757476807, "global_step": 186992, "epoch": 4452} {"train_loss": -7.159878730773926, "global_step": 186993, "epoch": 4452} {"train_loss": -7.217272758483887, "global_step": 186994, "epoch": 4452} {"train_loss": -7.093760013580322, "global_step": 186995, "epoch": 4452} {"train_loss": -7.213174819946289, "global_step": 186996, "epoch": 4452} {"train_loss": -7.187133312225342, "global_step": 186997, "epoch": 4452} {"train_loss": -7.112883567810059, "global_step": 186998, "epoch": 4452} {"train_loss": -7.307432174682617, "global_step": 186999, "epoch": 4452} {"train_loss": -7.250521659851074, "global_step": 187000, "epoch": 4452} {"train_loss": -7.077863693237305, "global_step": 187001, "epoch": 4452} {"train_loss": -7.239467144012451, "global_step": 187002, "epoch": 4452} {"train_loss": -7.22169303894043, "global_step": 187003, "epoch": 4452} {"train_loss": -7.2030839920043945, "global_step": 187004, "epoch": 4452} {"train_loss": -7.277576923370361, "global_step": 187005, "epoch": 4452} {"train_loss": -7.274662971496582, "global_step": 187006, "epoch": 4452} {"train_loss": -7.194990158081055, "global_step": 187007, "epoch": 4452} {"train_loss": -7.283997535705566, "global_step": 187008, "epoch": 4452} {"train_loss": -7.325624465942383, "global_step": 187009, "epoch": 4452} {"train_loss": -7.276055335998535, "global_step": 187010, "epoch": 4452} {"train_loss": -7.112483501434326, "global_step": 187011, "epoch": 4452} {"train_loss": -7.13157320022583, "global_step": 187012, "epoch": 4452} {"train_loss": -7.2419633865356445, "global_step": 187013, "epoch": 4452} {"train_loss": -7.254860877990723, "global_step": 187014, "epoch": 4452} {"train_loss": -7.216582298278809, "global_step": 187015, "epoch": 4452} {"train_loss": -7.229351997375488, "global_step": 187016, "epoch": 4452} {"train_loss": -7.2627668380737305, "global_step": 187017, "epoch": 4452} {"train_loss": -7.210076332092285, "global_step": 187018, "epoch": 4452} {"train_loss": -7.237822532653809, "global_step": 187019, "epoch": 4452} {"train_loss": -7.209785461425781, "global_step": 187020, "epoch": 4452} {"train_loss": -7.160862922668457, "global_step": 187021, "epoch": 4452} {"train_loss": -7.0557098388671875, "global_step": 187022, "epoch": 4452} {"train_loss": -7.188255310058594, "global_step": 187023, "epoch": 4452} {"train_loss": -7.262984752655029, "global_step": 187024, "epoch": 4452} {"train_loss": -7.19974110240028, "global_step": 187025, "epoch": 4452, "val_loss": 80862.78125} {"train_loss": -7.265661239624023, "global_step": 187026, "epoch": 4453} {"train_loss": -7.2717156410217285, "global_step": 187027, "epoch": 4453} {"train_loss": -7.269864082336426, "global_step": 187028, "epoch": 4453} {"train_loss": -7.254539489746094, "global_step": 187029, "epoch": 4453} {"train_loss": -7.2259321212768555, "global_step": 187030, "epoch": 4453} {"train_loss": -7.237053871154785, "global_step": 187031, "epoch": 4453} {"train_loss": -7.424416542053223, "global_step": 187032, "epoch": 4453} {"train_loss": -7.226372241973877, "global_step": 187033, "epoch": 4453} {"train_loss": -7.221222877502441, "global_step": 187034, "epoch": 4453} {"train_loss": -7.263241767883301, "global_step": 187035, "epoch": 4453} {"train_loss": -7.238096237182617, "global_step": 187036, "epoch": 4453} {"train_loss": -7.234971046447754, "global_step": 187037, "epoch": 4453} {"train_loss": -7.2500152587890625, "global_step": 187038, "epoch": 4453} {"train_loss": -7.236629962921143, "global_step": 187039, "epoch": 4453} {"train_loss": -7.239996910095215, "global_step": 187040, "epoch": 4453} {"train_loss": -7.275091171264648, "global_step": 187041, "epoch": 4453} {"train_loss": -7.2746782302856445, "global_step": 187042, "epoch": 4453} {"train_loss": -7.178482532501221, "global_step": 187043, "epoch": 4453} {"train_loss": -7.207070827484131, "global_step": 187044, "epoch": 4453} {"train_loss": -7.207424640655518, "global_step": 187045, "epoch": 4453} {"train_loss": -7.188621997833252, "global_step": 187046, "epoch": 4453} {"train_loss": -7.242259502410889, "global_step": 187047, "epoch": 4453} {"train_loss": -7.258297920227051, "global_step": 187048, "epoch": 4453} {"train_loss": -7.416472434997559, "global_step": 187049, "epoch": 4453} {"train_loss": -7.1978607177734375, "global_step": 187050, "epoch": 4453} {"train_loss": -7.2313947677612305, "global_step": 187051, "epoch": 4453} {"train_loss": -7.133731365203857, "global_step": 187052, "epoch": 4453} {"train_loss": -7.231893062591553, "global_step": 187053, "epoch": 4453} {"train_loss": -7.22676944732666, "global_step": 187054, "epoch": 4453} {"train_loss": -7.207921981811523, "global_step": 187055, "epoch": 4453} {"train_loss": -7.248327732086182, "global_step": 187056, "epoch": 4453} {"train_loss": -7.202620983123779, "global_step": 187057, "epoch": 4453} {"train_loss": -7.067376613616943, "global_step": 187058, "epoch": 4453} {"train_loss": -7.12729024887085, "global_step": 187059, "epoch": 4453} {"train_loss": -7.288804531097412, "global_step": 187060, "epoch": 4453} {"train_loss": -7.240781307220459, "global_step": 187061, "epoch": 4453} {"train_loss": -7.243015766143799, "global_step": 187062, "epoch": 4453} {"train_loss": -7.326967716217041, "global_step": 187063, "epoch": 4453} {"train_loss": -7.192560195922852, "global_step": 187064, "epoch": 4453} {"train_loss": -7.236105918884277, "global_step": 187065, "epoch": 4453} {"train_loss": -7.271081924438477, "global_step": 187066, "epoch": 4453} {"train_loss": -7.237451031094506, "global_step": 187067, "epoch": 4453, "val_loss": 81014.0} {"train_loss": -7.273396015167236, "global_step": 187068, "epoch": 4454} {"train_loss": -7.2719855308532715, "global_step": 187069, "epoch": 4454} {"train_loss": -7.264842987060547, "global_step": 187070, "epoch": 4454} {"train_loss": -7.30314826965332, "global_step": 187071, "epoch": 4454} {"train_loss": -7.374120235443115, "global_step": 187072, "epoch": 4454} {"train_loss": -7.071394920349121, "global_step": 187073, "epoch": 4454} {"train_loss": -7.106064796447754, "global_step": 187074, "epoch": 4454} {"train_loss": -7.10939884185791, "global_step": 187075, "epoch": 4454} {"train_loss": -7.073662281036377, "global_step": 187076, "epoch": 4454} {"train_loss": -7.145695686340332, "global_step": 187077, "epoch": 4454} {"train_loss": -7.176119804382324, "global_step": 187078, "epoch": 4454} {"train_loss": -7.17017936706543, "global_step": 187079, "epoch": 4454} {"train_loss": -7.10695743560791, "global_step": 187080, "epoch": 4454} {"train_loss": -7.223018169403076, "global_step": 187081, "epoch": 4454} {"train_loss": -7.15778923034668, "global_step": 187082, "epoch": 4454} {"train_loss": -7.10234260559082, "global_step": 187083, "epoch": 4454} {"train_loss": -7.2291975021362305, "global_step": 187084, "epoch": 4454} {"train_loss": -7.107027053833008, "global_step": 187085, "epoch": 4454} {"train_loss": -7.25269889831543, "global_step": 187086, "epoch": 4454} {"train_loss": -7.196780204772949, "global_step": 187087, "epoch": 4454} {"train_loss": -7.184925079345703, "global_step": 187088, "epoch": 4454} {"train_loss": -7.157253265380859, "global_step": 187089, "epoch": 4454} {"train_loss": -7.253288269042969, "global_step": 187090, "epoch": 4454} {"train_loss": -7.212817192077637, "global_step": 187091, "epoch": 4454} {"train_loss": -7.1236066818237305, "global_step": 187092, "epoch": 4454} {"train_loss": -7.109711647033691, "global_step": 187093, "epoch": 4454} {"train_loss": -7.1924591064453125, "global_step": 187094, "epoch": 4454} {"train_loss": -7.240755081176758, "global_step": 187095, "epoch": 4454} {"train_loss": -7.184636116027832, "global_step": 187096, "epoch": 4454} {"train_loss": -7.011600494384766, "global_step": 187097, "epoch": 4454} {"train_loss": -7.166604995727539, "global_step": 187098, "epoch": 4454} {"train_loss": -7.137067794799805, "global_step": 187099, "epoch": 4454} {"train_loss": -7.1629204750061035, "global_step": 187100, "epoch": 4454} {"train_loss": -7.150974273681641, "global_step": 187101, "epoch": 4454} {"train_loss": -7.164766311645508, "global_step": 187102, "epoch": 4454} {"train_loss": -7.213624477386475, "global_step": 187103, "epoch": 4454} {"train_loss": -7.063370704650879, "global_step": 187104, "epoch": 4454} {"train_loss": -7.188852310180664, "global_step": 187105, "epoch": 4454} {"train_loss": -7.164769172668457, "global_step": 187106, "epoch": 4454} {"train_loss": -7.190627098083496, "global_step": 187107, "epoch": 4454} {"train_loss": -7.1433820724487305, "global_step": 187108, "epoch": 4454} {"train_loss": -7.172871759959629, "global_step": 187109, "epoch": 4454, "val_loss": 81015.09375} {"train_loss": -7.1694464683532715, "global_step": 187110, "epoch": 4455} {"train_loss": -7.212416172027588, "global_step": 187111, "epoch": 4455} {"train_loss": -7.175601959228516, "global_step": 187112, "epoch": 4455} {"train_loss": -7.166265487670898, "global_step": 187113, "epoch": 4455} {"train_loss": -7.229889869689941, "global_step": 187114, "epoch": 4455} {"train_loss": -7.166924476623535, "global_step": 187115, "epoch": 4455} {"train_loss": -7.08345890045166, "global_step": 187116, "epoch": 4455} {"train_loss": -7.2742109298706055, "global_step": 187117, "epoch": 4455} {"train_loss": -7.2588605880737305, "global_step": 187118, "epoch": 4455} {"train_loss": -7.131437301635742, "global_step": 187119, "epoch": 4455} {"train_loss": -7.236935138702393, "global_step": 187120, "epoch": 4455} {"train_loss": -7.094654083251953, "global_step": 187121, "epoch": 4455} {"train_loss": -7.168530464172363, "global_step": 187122, "epoch": 4455} {"train_loss": -7.174973487854004, "global_step": 187123, "epoch": 4455} {"train_loss": -7.202767372131348, "global_step": 187124, "epoch": 4455} {"train_loss": -7.1277337074279785, "global_step": 187125, "epoch": 4455} {"train_loss": -7.129289627075195, "global_step": 187126, "epoch": 4455} {"train_loss": -7.1736345291137695, "global_step": 187127, "epoch": 4455} {"train_loss": -7.107254505157471, "global_step": 187128, "epoch": 4455} {"train_loss": -7.159653663635254, "global_step": 187129, "epoch": 4455} {"train_loss": -7.148859024047852, "global_step": 187130, "epoch": 4455} {"train_loss": -7.117746353149414, "global_step": 187131, "epoch": 4455} {"train_loss": -7.109746932983398, "global_step": 187132, "epoch": 4455} {"train_loss": -7.172539234161377, "global_step": 187133, "epoch": 4455} {"train_loss": -7.141824245452881, "global_step": 187134, "epoch": 4455} {"train_loss": -7.126178741455078, "global_step": 187135, "epoch": 4455} {"train_loss": -7.183507919311523, "global_step": 187136, "epoch": 4455} {"train_loss": -7.058450698852539, "global_step": 187137, "epoch": 4455} {"train_loss": -7.164167404174805, "global_step": 187138, "epoch": 4455} {"train_loss": -7.081508636474609, "global_step": 187139, "epoch": 4455} {"train_loss": -7.179036617279053, "global_step": 187140, "epoch": 4455} {"train_loss": -7.136948585510254, "global_step": 187141, "epoch": 4455} {"train_loss": -7.087026596069336, "global_step": 187142, "epoch": 4455} {"train_loss": -7.119868278503418, "global_step": 187143, "epoch": 4455} {"train_loss": -7.2137451171875, "global_step": 187144, "epoch": 4455} {"train_loss": -7.052492141723633, "global_step": 187145, "epoch": 4455} {"train_loss": -7.132382392883301, "global_step": 187146, "epoch": 4455} {"train_loss": -7.156220436096191, "global_step": 187147, "epoch": 4455} {"train_loss": -7.262030124664307, "global_step": 187148, "epoch": 4455} {"train_loss": -7.215916633605957, "global_step": 187149, "epoch": 4455} {"train_loss": -7.152366638183594, "global_step": 187150, "epoch": 4455} {"train_loss": -7.158006565911429, "global_step": 187151, "epoch": 4455, "val_loss": 80933.1015625} {"train_loss": -7.211013317108154, "global_step": 187152, "epoch": 4456} {"train_loss": -7.2107744216918945, "global_step": 187153, "epoch": 4456} {"train_loss": -7.188631534576416, "global_step": 187154, "epoch": 4456} {"train_loss": -7.172484397888184, "global_step": 187155, "epoch": 4456} {"train_loss": -7.209112167358398, "global_step": 187156, "epoch": 4456} {"train_loss": -7.131816864013672, "global_step": 187157, "epoch": 4456} {"train_loss": -7.194582939147949, "global_step": 187158, "epoch": 4456} {"train_loss": -7.187492370605469, "global_step": 187159, "epoch": 4456} {"train_loss": -7.120722770690918, "global_step": 187160, "epoch": 4456} {"train_loss": -7.077338695526123, "global_step": 187161, "epoch": 4456} {"train_loss": -7.199179649353027, "global_step": 187162, "epoch": 4456} {"train_loss": -7.18983268737793, "global_step": 187163, "epoch": 4456} {"train_loss": -7.250670433044434, "global_step": 187164, "epoch": 4456} {"train_loss": -7.280210971832275, "global_step": 187165, "epoch": 4456} {"train_loss": -7.211381435394287, "global_step": 187166, "epoch": 4456} {"train_loss": -7.258161544799805, "global_step": 187167, "epoch": 4456} {"train_loss": -7.107928276062012, "global_step": 187168, "epoch": 4456} {"train_loss": -7.183948516845703, "global_step": 187169, "epoch": 4456} {"train_loss": -7.183164596557617, "global_step": 187170, "epoch": 4456} {"train_loss": -7.153439044952393, "global_step": 187171, "epoch": 4456} {"train_loss": -7.253993988037109, "global_step": 187172, "epoch": 4456} {"train_loss": -7.2939558029174805, "global_step": 187173, "epoch": 4456} {"train_loss": -7.1578450202941895, "global_step": 187174, "epoch": 4456} {"train_loss": -7.251901626586914, "global_step": 187175, "epoch": 4456} {"train_loss": -7.1921515464782715, "global_step": 187176, "epoch": 4456} {"train_loss": -7.14351749420166, "global_step": 187177, "epoch": 4456} {"train_loss": -7.312335014343262, "global_step": 187178, "epoch": 4456} {"train_loss": -7.186281681060791, "global_step": 187179, "epoch": 4456} {"train_loss": -7.2324981689453125, "global_step": 187180, "epoch": 4456} {"train_loss": -7.2086286544799805, "global_step": 187181, "epoch": 4456} {"train_loss": -7.229618072509766, "global_step": 187182, "epoch": 4456} {"train_loss": -7.184602737426758, "global_step": 187183, "epoch": 4456} {"train_loss": -7.104203224182129, "global_step": 187184, "epoch": 4456} {"train_loss": -7.170657157897949, "global_step": 187185, "epoch": 4456} {"train_loss": -7.194775104522705, "global_step": 187186, "epoch": 4456} {"train_loss": -7.163180828094482, "global_step": 187187, "epoch": 4456} {"train_loss": -7.201205253601074, "global_step": 187188, "epoch": 4456} {"train_loss": -7.298041343688965, "global_step": 187189, "epoch": 4456} {"train_loss": -7.094743728637695, "global_step": 187190, "epoch": 4456} {"train_loss": -7.260371208190918, "global_step": 187191, "epoch": 4456} {"train_loss": -7.299539566040039, "global_step": 187192, "epoch": 4456} {"train_loss": -7.196534917468116, "global_step": 187193, "epoch": 4456, "val_loss": 81035.6953125} {"train_loss": -7.273667812347412, "global_step": 187194, "epoch": 4457} {"train_loss": -7.16860818862915, "global_step": 187195, "epoch": 4457} {"train_loss": -7.253450870513916, "global_step": 187196, "epoch": 4457} {"train_loss": -7.184210300445557, "global_step": 187197, "epoch": 4457} {"train_loss": -7.3622636795043945, "global_step": 187198, "epoch": 4457} {"train_loss": -7.281989097595215, "global_step": 187199, "epoch": 4457} {"train_loss": -7.2445244789123535, "global_step": 187200, "epoch": 4457} {"train_loss": -7.348211288452148, "global_step": 187201, "epoch": 4457} {"train_loss": -7.282681941986084, "global_step": 187202, "epoch": 4457} {"train_loss": -7.089289665222168, "global_step": 187203, "epoch": 4457} {"train_loss": -7.222278594970703, "global_step": 187204, "epoch": 4457} {"train_loss": -7.176113605499268, "global_step": 187205, "epoch": 4457} {"train_loss": -6.996624946594238, "global_step": 187206, "epoch": 4457} {"train_loss": -7.182250022888184, "global_step": 187207, "epoch": 4457} {"train_loss": -7.274670600891113, "global_step": 187208, "epoch": 4457} {"train_loss": -6.989101409912109, "global_step": 187209, "epoch": 4457} {"train_loss": -7.220001220703125, "global_step": 187210, "epoch": 4457} {"train_loss": -7.187183380126953, "global_step": 187211, "epoch": 4457} {"train_loss": -6.992779731750488, "global_step": 187212, "epoch": 4457} {"train_loss": -7.079187393188477, "global_step": 187213, "epoch": 4457} {"train_loss": -7.206470489501953, "global_step": 187214, "epoch": 4457} {"train_loss": -7.160065650939941, "global_step": 187215, "epoch": 4457} {"train_loss": -7.067228317260742, "global_step": 187216, "epoch": 4457} {"train_loss": -7.094550132751465, "global_step": 187217, "epoch": 4457} {"train_loss": -6.942197799682617, "global_step": 187218, "epoch": 4457} {"train_loss": -6.9361467361450195, "global_step": 187219, "epoch": 4457} {"train_loss": -7.121044158935547, "global_step": 187220, "epoch": 4457} {"train_loss": -7.009644508361816, "global_step": 187221, "epoch": 4457} {"train_loss": -7.106802463531494, "global_step": 187222, "epoch": 4457} {"train_loss": -6.986579418182373, "global_step": 187223, "epoch": 4457} {"train_loss": -6.906909942626953, "global_step": 187224, "epoch": 4457} {"train_loss": -7.10522985458374, "global_step": 187225, "epoch": 4457} {"train_loss": -6.970331192016602, "global_step": 187226, "epoch": 4457} {"train_loss": -6.962529182434082, "global_step": 187227, "epoch": 4457} {"train_loss": -6.973766326904297, "global_step": 187228, "epoch": 4457} {"train_loss": -7.121050834655762, "global_step": 187229, "epoch": 4457} {"train_loss": -6.861185073852539, "global_step": 187230, "epoch": 4457} {"train_loss": -7.264065742492676, "global_step": 187231, "epoch": 4457} {"train_loss": -6.860231399536133, "global_step": 187232, "epoch": 4457} {"train_loss": -7.093225479125977, "global_step": 187233, "epoch": 4457} {"train_loss": -6.9457197189331055, "global_step": 187234, "epoch": 4457} {"train_loss": -7.110409191676548, "global_step": 187235, "epoch": 4457, "val_loss": 80717.0625} {"train_loss": -7.138416290283203, "global_step": 187236, "epoch": 4458} {"train_loss": -7.09815788269043, "global_step": 187237, "epoch": 4458} {"train_loss": -7.137929916381836, "global_step": 187238, "epoch": 4458} {"train_loss": -7.1380157470703125, "global_step": 187239, "epoch": 4458} {"train_loss": -7.088549613952637, "global_step": 187240, "epoch": 4458} {"train_loss": -7.0609130859375, "global_step": 187241, "epoch": 4458} {"train_loss": -7.068380355834961, "global_step": 187242, "epoch": 4458} {"train_loss": -7.169810771942139, "global_step": 187243, "epoch": 4458} {"train_loss": -7.0793633460998535, "global_step": 187244, "epoch": 4458} {"train_loss": -7.284067153930664, "global_step": 187245, "epoch": 4458} {"train_loss": -7.222066402435303, "global_step": 187246, "epoch": 4458} {"train_loss": -7.237531661987305, "global_step": 187247, "epoch": 4458} {"train_loss": -7.059909820556641, "global_step": 187248, "epoch": 4458} {"train_loss": -7.096234321594238, "global_step": 187249, "epoch": 4458} {"train_loss": -7.123247146606445, "global_step": 187250, "epoch": 4458} {"train_loss": -7.042330265045166, "global_step": 187251, "epoch": 4458} {"train_loss": -7.145169258117676, "global_step": 187252, "epoch": 4458} {"train_loss": -7.10819673538208, "global_step": 187253, "epoch": 4458} {"train_loss": -7.114292144775391, "global_step": 187254, "epoch": 4458} {"train_loss": -7.149338722229004, "global_step": 187255, "epoch": 4458} {"train_loss": -7.036791801452637, "global_step": 187256, "epoch": 4458} {"train_loss": -6.951727867126465, "global_step": 187257, "epoch": 4458} {"train_loss": -7.160723686218262, "global_step": 187258, "epoch": 4458} {"train_loss": -7.143801689147949, "global_step": 187259, "epoch": 4458} {"train_loss": -7.027942657470703, "global_step": 187260, "epoch": 4458} {"train_loss": -7.1942362785339355, "global_step": 187261, "epoch": 4458} {"train_loss": -7.101893424987793, "global_step": 187262, "epoch": 4458} {"train_loss": -7.166543960571289, "global_step": 187263, "epoch": 4458} {"train_loss": -7.173459053039551, "global_step": 187264, "epoch": 4458} {"train_loss": -7.051357746124268, "global_step": 187265, "epoch": 4458} {"train_loss": -7.20340633392334, "global_step": 187266, "epoch": 4458} {"train_loss": -7.135475158691406, "global_step": 187267, "epoch": 4458} {"train_loss": -7.098595142364502, "global_step": 187268, "epoch": 4458} {"train_loss": -7.104591369628906, "global_step": 187269, "epoch": 4458} {"train_loss": -7.081699371337891, "global_step": 187270, "epoch": 4458} {"train_loss": -7.023495197296143, "global_step": 187271, "epoch": 4458} {"train_loss": -7.024036407470703, "global_step": 187272, "epoch": 4458} {"train_loss": -7.148588180541992, "global_step": 187273, "epoch": 4458} {"train_loss": -7.0704545974731445, "global_step": 187274, "epoch": 4458} {"train_loss": -7.0737104415893555, "global_step": 187275, "epoch": 4458} {"train_loss": -7.150942802429199, "global_step": 187276, "epoch": 4458} {"train_loss": -7.112843581608364, "global_step": 187277, "epoch": 4458, "val_loss": 80882.46875} {"train_loss": -7.1295695304870605, "global_step": 187278, "epoch": 4459} {"train_loss": -7.048384189605713, "global_step": 187279, "epoch": 4459} {"train_loss": -7.067405700683594, "global_step": 187280, "epoch": 4459} {"train_loss": -7.039643287658691, "global_step": 187281, "epoch": 4459} {"train_loss": -7.094856262207031, "global_step": 187282, "epoch": 4459} {"train_loss": -7.216787338256836, "global_step": 187283, "epoch": 4459} {"train_loss": -6.9665021896362305, "global_step": 187284, "epoch": 4459} {"train_loss": -7.001522064208984, "global_step": 187285, "epoch": 4459} {"train_loss": -7.1273908615112305, "global_step": 187286, "epoch": 4459} {"train_loss": -7.157464504241943, "global_step": 187287, "epoch": 4459} {"train_loss": -7.110899925231934, "global_step": 187288, "epoch": 4459} {"train_loss": -7.195365905761719, "global_step": 187289, "epoch": 4459} {"train_loss": -7.111202239990234, "global_step": 187290, "epoch": 4459} {"train_loss": -7.161172866821289, "global_step": 187291, "epoch": 4459} {"train_loss": -7.138606548309326, "global_step": 187292, "epoch": 4459} {"train_loss": -7.118000030517578, "global_step": 187293, "epoch": 4459} {"train_loss": -7.182770252227783, "global_step": 187294, "epoch": 4459} {"train_loss": -7.174703598022461, "global_step": 187295, "epoch": 4459} {"train_loss": -7.246370315551758, "global_step": 187296, "epoch": 4459} {"train_loss": -7.201452732086182, "global_step": 187297, "epoch": 4459} {"train_loss": -7.189155578613281, "global_step": 187298, "epoch": 4459} {"train_loss": -7.238269805908203, "global_step": 187299, "epoch": 4459} {"train_loss": -7.254158020019531, "global_step": 187300, "epoch": 4459} {"train_loss": -7.198355674743652, "global_step": 187301, "epoch": 4459} {"train_loss": -7.076224327087402, "global_step": 187302, "epoch": 4459} {"train_loss": -7.203183174133301, "global_step": 187303, "epoch": 4459} {"train_loss": -7.303137302398682, "global_step": 187304, "epoch": 4459} {"train_loss": -7.211454391479492, "global_step": 187305, "epoch": 4459} {"train_loss": -7.254511833190918, "global_step": 187306, "epoch": 4459} {"train_loss": -7.301552772521973, "global_step": 187307, "epoch": 4459} {"train_loss": -7.1890974044799805, "global_step": 187308, "epoch": 4459} {"train_loss": -7.303046226501465, "global_step": 187309, "epoch": 4459} {"train_loss": -7.269355773925781, "global_step": 187310, "epoch": 4459} {"train_loss": -7.214823246002197, "global_step": 187311, "epoch": 4459} {"train_loss": -7.208281517028809, "global_step": 187312, "epoch": 4459} {"train_loss": -7.192085266113281, "global_step": 187313, "epoch": 4459} {"train_loss": -7.220493316650391, "global_step": 187314, "epoch": 4459} {"train_loss": -7.253202438354492, "global_step": 187315, "epoch": 4459} {"train_loss": -7.262454032897949, "global_step": 187316, "epoch": 4459} {"train_loss": -7.182953834533691, "global_step": 187317, "epoch": 4459} {"train_loss": -7.292527675628662, "global_step": 187318, "epoch": 4459} {"train_loss": -7.180585724966867, "global_step": 187319, "epoch": 4459, "val_loss": 80654.6640625} {"train_loss": -7.313129901885986, "global_step": 187320, "epoch": 4460} {"train_loss": -7.188570976257324, "global_step": 187321, "epoch": 4460} {"train_loss": -7.248138427734375, "global_step": 187322, "epoch": 4460} {"train_loss": -7.396759033203125, "global_step": 187323, "epoch": 4460} {"train_loss": -7.316753387451172, "global_step": 187324, "epoch": 4460} {"train_loss": -7.271095275878906, "global_step": 187325, "epoch": 4460} {"train_loss": -7.395869731903076, "global_step": 187326, "epoch": 4460} {"train_loss": -7.187127113342285, "global_step": 187327, "epoch": 4460} {"train_loss": -7.124755859375, "global_step": 187328, "epoch": 4460} {"train_loss": -7.159952163696289, "global_step": 187329, "epoch": 4460} {"train_loss": -7.199296951293945, "global_step": 187330, "epoch": 4460} {"train_loss": -7.375942230224609, "global_step": 187331, "epoch": 4460} {"train_loss": -7.046631813049316, "global_step": 187332, "epoch": 4460} {"train_loss": -7.1817169189453125, "global_step": 187333, "epoch": 4460} {"train_loss": -7.109094619750977, "global_step": 187334, "epoch": 4460} {"train_loss": -7.181995391845703, "global_step": 187335, "epoch": 4460} {"train_loss": -7.283468246459961, "global_step": 187336, "epoch": 4460} {"train_loss": -7.129975318908691, "global_step": 187337, "epoch": 4460} {"train_loss": -7.354061603546143, "global_step": 187338, "epoch": 4460} {"train_loss": -7.187746047973633, "global_step": 187339, "epoch": 4460} {"train_loss": -7.156988143920898, "global_step": 187340, "epoch": 4460} {"train_loss": -7.079207420349121, "global_step": 187341, "epoch": 4460} {"train_loss": -7.2369890213012695, "global_step": 187342, "epoch": 4460} {"train_loss": -7.254979133605957, "global_step": 187343, "epoch": 4460} {"train_loss": -7.1675615310668945, "global_step": 187344, "epoch": 4460} {"train_loss": -7.248945236206055, "global_step": 187345, "epoch": 4460} {"train_loss": -7.20977258682251, "global_step": 187346, "epoch": 4460} {"train_loss": -7.214208602905273, "global_step": 187347, "epoch": 4460} {"train_loss": -7.220873832702637, "global_step": 187348, "epoch": 4460} {"train_loss": -7.209920883178711, "global_step": 187349, "epoch": 4460} {"train_loss": -7.172970771789551, "global_step": 187350, "epoch": 4460} {"train_loss": -7.325615882873535, "global_step": 187351, "epoch": 4460} {"train_loss": -7.109084606170654, "global_step": 187352, "epoch": 4460} {"train_loss": -7.266406536102295, "global_step": 187353, "epoch": 4460} {"train_loss": -7.1384968757629395, "global_step": 187354, "epoch": 4460} {"train_loss": -7.2554168701171875, "global_step": 187355, "epoch": 4460} {"train_loss": -7.326841831207275, "global_step": 187356, "epoch": 4460} {"train_loss": -7.196500778198242, "global_step": 187357, "epoch": 4460} {"train_loss": -7.205631256103516, "global_step": 187358, "epoch": 4460} {"train_loss": -7.250418663024902, "global_step": 187359, "epoch": 4460} {"train_loss": -7.022693634033203, "global_step": 187360, "epoch": 4460} {"train_loss": -7.2178222224825905, "global_step": 187361, "epoch": 4460, "val_loss": 80482.046875} {"train_loss": -7.281430244445801, "global_step": 187362, "epoch": 4461} {"train_loss": -7.132072448730469, "global_step": 187363, "epoch": 4461} {"train_loss": -7.194126129150391, "global_step": 187364, "epoch": 4461} {"train_loss": -7.23750638961792, "global_step": 187365, "epoch": 4461} {"train_loss": -7.172486305236816, "global_step": 187366, "epoch": 4461} {"train_loss": -7.269197463989258, "global_step": 187367, "epoch": 4461} {"train_loss": -7.217097282409668, "global_step": 187368, "epoch": 4461} {"train_loss": -7.093877792358398, "global_step": 187369, "epoch": 4461} {"train_loss": -7.095543384552002, "global_step": 187370, "epoch": 4461} {"train_loss": -7.202445983886719, "global_step": 187371, "epoch": 4461} {"train_loss": -7.207093238830566, "global_step": 187372, "epoch": 4461} {"train_loss": -7.057208061218262, "global_step": 187373, "epoch": 4461} {"train_loss": -7.211653709411621, "global_step": 187374, "epoch": 4461} {"train_loss": -7.164915084838867, "global_step": 187375, "epoch": 4461} {"train_loss": -7.012220859527588, "global_step": 187376, "epoch": 4461} {"train_loss": -7.169628143310547, "global_step": 187377, "epoch": 4461} {"train_loss": -7.178758144378662, "global_step": 187378, "epoch": 4461} {"train_loss": -7.241498947143555, "global_step": 187379, "epoch": 4461} {"train_loss": -7.178256988525391, "global_step": 187380, "epoch": 4461} {"train_loss": -7.2275495529174805, "global_step": 187381, "epoch": 4461} {"train_loss": -7.294709205627441, "global_step": 187382, "epoch": 4461} {"train_loss": -7.254211902618408, "global_step": 187383, "epoch": 4461} {"train_loss": -7.277554988861084, "global_step": 187384, "epoch": 4461} {"train_loss": -7.124473571777344, "global_step": 187385, "epoch": 4461} {"train_loss": -7.347138404846191, "global_step": 187386, "epoch": 4461} {"train_loss": -7.22486686706543, "global_step": 187387, "epoch": 4461} {"train_loss": -7.232808589935303, "global_step": 187388, "epoch": 4461} {"train_loss": -7.28012752532959, "global_step": 187389, "epoch": 4461} {"train_loss": -7.246729850769043, "global_step": 187390, "epoch": 4461} {"train_loss": -7.294927597045898, "global_step": 187391, "epoch": 4461} {"train_loss": -7.207254409790039, "global_step": 187392, "epoch": 4461} {"train_loss": -7.276126861572266, "global_step": 187393, "epoch": 4461} {"train_loss": -7.130173683166504, "global_step": 187394, "epoch": 4461} {"train_loss": -7.206177711486816, "global_step": 187395, "epoch": 4461} {"train_loss": -7.212465286254883, "global_step": 187396, "epoch": 4461} {"train_loss": -7.2512617111206055, "global_step": 187397, "epoch": 4461} {"train_loss": -7.2751874923706055, "global_step": 187398, "epoch": 4461} {"train_loss": -7.147616386413574, "global_step": 187399, "epoch": 4461} {"train_loss": -7.107661247253418, "global_step": 187400, "epoch": 4461} {"train_loss": -7.150814533233643, "global_step": 187401, "epoch": 4461} {"train_loss": -7.233577728271484, "global_step": 187402, "epoch": 4461} {"train_loss": -7.202752011162894, "global_step": 187403, "epoch": 4461, "val_loss": 81005.140625} {"train_loss": -7.166746139526367, "global_step": 187404, "epoch": 4462} {"train_loss": -7.137141227722168, "global_step": 187405, "epoch": 4462} {"train_loss": -7.248245716094971, "global_step": 187406, "epoch": 4462} {"train_loss": -7.199203014373779, "global_step": 187407, "epoch": 4462} {"train_loss": -7.1890082359313965, "global_step": 187408, "epoch": 4462} {"train_loss": -6.921994686126709, "global_step": 187409, "epoch": 4462} {"train_loss": -7.026076793670654, "global_step": 187410, "epoch": 4462} {"train_loss": -7.13195276260376, "global_step": 187411, "epoch": 4462} {"train_loss": -7.168089866638184, "global_step": 187412, "epoch": 4462} {"train_loss": -7.159167289733887, "global_step": 187413, "epoch": 4462} {"train_loss": -7.195895671844482, "global_step": 187414, "epoch": 4462} {"train_loss": -7.156748294830322, "global_step": 187415, "epoch": 4462} {"train_loss": -7.15907096862793, "global_step": 187416, "epoch": 4462} {"train_loss": -7.199827194213867, "global_step": 187417, "epoch": 4462} {"train_loss": -7.159120559692383, "global_step": 187418, "epoch": 4462} {"train_loss": -7.1498823165893555, "global_step": 187419, "epoch": 4462} {"train_loss": -7.19154167175293, "global_step": 187420, "epoch": 4462} {"train_loss": -7.094852924346924, "global_step": 187421, "epoch": 4462} {"train_loss": -7.115639686584473, "global_step": 187422, "epoch": 4462} {"train_loss": -7.141780853271484, "global_step": 187423, "epoch": 4462} {"train_loss": -7.160539627075195, "global_step": 187424, "epoch": 4462} {"train_loss": -7.2022528648376465, "global_step": 187425, "epoch": 4462} {"train_loss": -7.305736064910889, "global_step": 187426, "epoch": 4462} {"train_loss": -7.04542350769043, "global_step": 187427, "epoch": 4462} {"train_loss": -7.119634628295898, "global_step": 187428, "epoch": 4462} {"train_loss": -7.186034202575684, "global_step": 187429, "epoch": 4462} {"train_loss": -7.239784240722656, "global_step": 187430, "epoch": 4462} {"train_loss": -7.2024946212768555, "global_step": 187431, "epoch": 4462} {"train_loss": -7.247436046600342, "global_step": 187432, "epoch": 4462} {"train_loss": -7.218121528625488, "global_step": 187433, "epoch": 4462} {"train_loss": -7.2492756843566895, "global_step": 187434, "epoch": 4462} {"train_loss": -7.144458770751953, "global_step": 187435, "epoch": 4462} {"train_loss": -7.2477707862854, "global_step": 187436, "epoch": 4462} {"train_loss": -7.198497772216797, "global_step": 187437, "epoch": 4462} {"train_loss": -7.150750160217285, "global_step": 187438, "epoch": 4462} {"train_loss": -7.296817302703857, "global_step": 187439, "epoch": 4462} {"train_loss": -7.088658332824707, "global_step": 187440, "epoch": 4462} {"train_loss": -7.05647087097168, "global_step": 187441, "epoch": 4462} {"train_loss": -7.135359764099121, "global_step": 187442, "epoch": 4462} {"train_loss": -7.166479110717773, "global_step": 187443, "epoch": 4462} {"train_loss": -7.101504802703857, "global_step": 187444, "epoch": 4462} {"train_loss": -7.164374839691889, "global_step": 187445, "epoch": 4462, "val_loss": 80936.3359375} {"train_loss": -7.227415084838867, "global_step": 187446, "epoch": 4463} {"train_loss": -7.056623935699463, "global_step": 187447, "epoch": 4463} {"train_loss": -7.17192268371582, "global_step": 187448, "epoch": 4463} {"train_loss": -7.1103410720825195, "global_step": 187449, "epoch": 4463} {"train_loss": -7.208009719848633, "global_step": 187450, "epoch": 4463} {"train_loss": -7.196502685546875, "global_step": 187451, "epoch": 4463} {"train_loss": -7.168907165527344, "global_step": 187452, "epoch": 4463} {"train_loss": -7.133665084838867, "global_step": 187453, "epoch": 4463} {"train_loss": -7.146981239318848, "global_step": 187454, "epoch": 4463} {"train_loss": -7.166500091552734, "global_step": 187455, "epoch": 4463} {"train_loss": -7.06076717376709, "global_step": 187456, "epoch": 4463} {"train_loss": -6.998378276824951, "global_step": 187457, "epoch": 4463} {"train_loss": -7.179687976837158, "global_step": 187458, "epoch": 4463} {"train_loss": -6.9543256759643555, "global_step": 187459, "epoch": 4463} {"train_loss": -7.182555198669434, "global_step": 187460, "epoch": 4463} {"train_loss": -7.123295783996582, "global_step": 187461, "epoch": 4463} {"train_loss": -7.128599166870117, "global_step": 187462, "epoch": 4463} {"train_loss": -7.108631610870361, "global_step": 187463, "epoch": 4463} {"train_loss": -6.962713241577148, "global_step": 187464, "epoch": 4463} {"train_loss": -7.219547271728516, "global_step": 187465, "epoch": 4463} {"train_loss": -7.0698442459106445, "global_step": 187466, "epoch": 4463} {"train_loss": -7.196463108062744, "global_step": 187467, "epoch": 4463} {"train_loss": -7.064298629760742, "global_step": 187468, "epoch": 4463} {"train_loss": -7.118879318237305, "global_step": 187469, "epoch": 4463} {"train_loss": -7.135405540466309, "global_step": 187470, "epoch": 4463} {"train_loss": -7.0980072021484375, "global_step": 187471, "epoch": 4463} {"train_loss": -7.049312591552734, "global_step": 187472, "epoch": 4463} {"train_loss": -7.154448986053467, "global_step": 187473, "epoch": 4463} {"train_loss": -7.082334995269775, "global_step": 187474, "epoch": 4463} {"train_loss": -7.184120178222656, "global_step": 187475, "epoch": 4463} {"train_loss": -7.095828056335449, "global_step": 187476, "epoch": 4463} {"train_loss": -7.168996810913086, "global_step": 187477, "epoch": 4463} {"train_loss": -7.247562408447266, "global_step": 187478, "epoch": 4463} {"train_loss": -7.123405456542969, "global_step": 187479, "epoch": 4463} {"train_loss": -7.245265960693359, "global_step": 187480, "epoch": 4463} {"train_loss": -7.103359222412109, "global_step": 187481, "epoch": 4463} {"train_loss": -7.0864152908325195, "global_step": 187482, "epoch": 4463} {"train_loss": -7.244960308074951, "global_step": 187483, "epoch": 4463} {"train_loss": -7.267879486083984, "global_step": 187484, "epoch": 4463} {"train_loss": -7.295353889465332, "global_step": 187485, "epoch": 4463} {"train_loss": -7.179248809814453, "global_step": 187486, "epoch": 4463} {"train_loss": -7.140020790554228, "global_step": 187487, "epoch": 4463, "val_loss": 80880.359375} {"train_loss": -7.111873149871826, "global_step": 187488, "epoch": 4464} {"train_loss": -7.239098072052002, "global_step": 187489, "epoch": 4464} {"train_loss": -7.190794944763184, "global_step": 187490, "epoch": 4464} {"train_loss": -7.053564071655273, "global_step": 187491, "epoch": 4464} {"train_loss": -7.194232940673828, "global_step": 187492, "epoch": 4464} {"train_loss": -7.217702865600586, "global_step": 187493, "epoch": 4464} {"train_loss": -7.15919303894043, "global_step": 187494, "epoch": 4464} {"train_loss": -7.293741226196289, "global_step": 187495, "epoch": 4464} {"train_loss": -7.057132720947266, "global_step": 187496, "epoch": 4464} {"train_loss": -7.271389961242676, "global_step": 187497, "epoch": 4464} {"train_loss": -7.103602886199951, "global_step": 187498, "epoch": 4464} {"train_loss": -7.141156196594238, "global_step": 187499, "epoch": 4464} {"train_loss": -7.18363094329834, "global_step": 187500, "epoch": 4464} {"train_loss": -7.288168907165527, "global_step": 187501, "epoch": 4464} {"train_loss": -7.039679527282715, "global_step": 187502, "epoch": 4464} {"train_loss": -7.118010520935059, "global_step": 187503, "epoch": 4464} {"train_loss": -7.138350486755371, "global_step": 187504, "epoch": 4464} {"train_loss": -7.281289100646973, "global_step": 187505, "epoch": 4464} {"train_loss": -7.190680503845215, "global_step": 187506, "epoch": 4464} {"train_loss": -7.261959075927734, "global_step": 187507, "epoch": 4464} {"train_loss": -7.309836387634277, "global_step": 187508, "epoch": 4464} {"train_loss": -7.152524948120117, "global_step": 187509, "epoch": 4464} {"train_loss": -7.211983680725098, "global_step": 187510, "epoch": 4464} {"train_loss": -7.1454291343688965, "global_step": 187511, "epoch": 4464} {"train_loss": -7.146051406860352, "global_step": 187512, "epoch": 4464} {"train_loss": -7.182362079620361, "global_step": 187513, "epoch": 4464} {"train_loss": -7.06492280960083, "global_step": 187514, "epoch": 4464} {"train_loss": -7.2297163009643555, "global_step": 187515, "epoch": 4464} {"train_loss": -7.114987850189209, "global_step": 187516, "epoch": 4464} {"train_loss": -7.029376029968262, "global_step": 187517, "epoch": 4464} {"train_loss": -7.200008392333984, "global_step": 187518, "epoch": 4464} {"train_loss": -7.064521789550781, "global_step": 187519, "epoch": 4464} {"train_loss": -7.2053351402282715, "global_step": 187520, "epoch": 4464} {"train_loss": -7.160345077514648, "global_step": 187521, "epoch": 4464} {"train_loss": -7.002372741699219, "global_step": 187522, "epoch": 4464} {"train_loss": -7.1815290451049805, "global_step": 187523, "epoch": 4464} {"train_loss": -7.022966384887695, "global_step": 187524, "epoch": 4464} {"train_loss": -7.171378135681152, "global_step": 187525, "epoch": 4464} {"train_loss": -7.182717323303223, "global_step": 187526, "epoch": 4464} {"train_loss": -7.061390399932861, "global_step": 187527, "epoch": 4464} {"train_loss": -7.081695556640625, "global_step": 187528, "epoch": 4464} {"train_loss": -7.157238210950579, "global_step": 187529, "epoch": 4464, "val_loss": 80910.8046875} {"train_loss": -7.280279636383057, "global_step": 187530, "epoch": 4465} {"train_loss": -7.186929702758789, "global_step": 187531, "epoch": 4465} {"train_loss": -7.111532211303711, "global_step": 187532, "epoch": 4465} {"train_loss": -7.15829610824585, "global_step": 187533, "epoch": 4465} {"train_loss": -7.0852155685424805, "global_step": 187534, "epoch": 4465} {"train_loss": -7.236295700073242, "global_step": 187535, "epoch": 4465} {"train_loss": -7.178263187408447, "global_step": 187536, "epoch": 4465} {"train_loss": -7.130555152893066, "global_step": 187537, "epoch": 4465} {"train_loss": -7.1465654373168945, "global_step": 187538, "epoch": 4465} {"train_loss": -7.123044013977051, "global_step": 187539, "epoch": 4465} {"train_loss": -7.1537275314331055, "global_step": 187540, "epoch": 4465} {"train_loss": -7.158374786376953, "global_step": 187541, "epoch": 4465} {"train_loss": -7.152673244476318, "global_step": 187542, "epoch": 4465} {"train_loss": -7.126559257507324, "global_step": 187543, "epoch": 4465} {"train_loss": -7.199333667755127, "global_step": 187544, "epoch": 4465} {"train_loss": -7.182526111602783, "global_step": 187545, "epoch": 4465} {"train_loss": -7.163289546966553, "global_step": 187546, "epoch": 4465} {"train_loss": -7.294363498687744, "global_step": 187547, "epoch": 4465} {"train_loss": -7.214729309082031, "global_step": 187548, "epoch": 4465} {"train_loss": -7.27964448928833, "global_step": 187549, "epoch": 4465} {"train_loss": -7.213143348693848, "global_step": 187550, "epoch": 4465} {"train_loss": -7.301400184631348, "global_step": 187551, "epoch": 4465} {"train_loss": -7.274845123291016, "global_step": 187552, "epoch": 4465} {"train_loss": -7.191790580749512, "global_step": 187553, "epoch": 4465} {"train_loss": -7.159235954284668, "global_step": 187554, "epoch": 4465} {"train_loss": -7.151467323303223, "global_step": 187555, "epoch": 4465} {"train_loss": -7.137253284454346, "global_step": 187556, "epoch": 4465} {"train_loss": -7.172872543334961, "global_step": 187557, "epoch": 4465} {"train_loss": -7.268795013427734, "global_step": 187558, "epoch": 4465} {"train_loss": -7.213628768920898, "global_step": 187559, "epoch": 4465} {"train_loss": -7.288237571716309, "global_step": 187560, "epoch": 4465} {"train_loss": -7.183322429656982, "global_step": 187561, "epoch": 4465} {"train_loss": -7.101146697998047, "global_step": 187562, "epoch": 4465} {"train_loss": -7.212285041809082, "global_step": 187563, "epoch": 4465} {"train_loss": -7.13666296005249, "global_step": 187564, "epoch": 4465} {"train_loss": -7.219304084777832, "global_step": 187565, "epoch": 4465} {"train_loss": -7.1585798263549805, "global_step": 187566, "epoch": 4465} {"train_loss": -7.186733245849609, "global_step": 187567, "epoch": 4465} {"train_loss": -7.1802191734313965, "global_step": 187568, "epoch": 4465} {"train_loss": -7.278451919555664, "global_step": 187569, "epoch": 4465} {"train_loss": -7.236634254455566, "global_step": 187570, "epoch": 4465} {"train_loss": -7.190397364752633, "global_step": 187571, "epoch": 4465, "val_loss": 80592.59375} {"train_loss": -7.140165328979492, "global_step": 187572, "epoch": 4466} {"train_loss": -7.2173871994018555, "global_step": 187573, "epoch": 4466} {"train_loss": -7.298077583312988, "global_step": 187574, "epoch": 4466} {"train_loss": -7.320503234863281, "global_step": 187575, "epoch": 4466} {"train_loss": -7.111794471740723, "global_step": 187576, "epoch": 4466} {"train_loss": -7.2621002197265625, "global_step": 187577, "epoch": 4466} {"train_loss": -7.331778526306152, "global_step": 187578, "epoch": 4466} {"train_loss": -7.397856712341309, "global_step": 187579, "epoch": 4466} {"train_loss": -7.1950764656066895, "global_step": 187580, "epoch": 4466} {"train_loss": -7.34063720703125, "global_step": 187581, "epoch": 4466} {"train_loss": -7.20528507232666, "global_step": 187582, "epoch": 4466} {"train_loss": -7.224636077880859, "global_step": 187583, "epoch": 4466} {"train_loss": -7.220122814178467, "global_step": 187584, "epoch": 4466} {"train_loss": -7.245107650756836, "global_step": 187585, "epoch": 4466} {"train_loss": -7.181718349456787, "global_step": 187586, "epoch": 4466} {"train_loss": -7.060546875, "global_step": 187587, "epoch": 4466} {"train_loss": -7.103236675262451, "global_step": 187588, "epoch": 4466} {"train_loss": -7.082553863525391, "global_step": 187589, "epoch": 4466} {"train_loss": -6.964800834655762, "global_step": 187590, "epoch": 4466} {"train_loss": -7.148504257202148, "global_step": 187591, "epoch": 4466} {"train_loss": -7.1325578689575195, "global_step": 187592, "epoch": 4466} {"train_loss": -6.897531032562256, "global_step": 187593, "epoch": 4466} {"train_loss": -7.052588939666748, "global_step": 187594, "epoch": 4466} {"train_loss": -7.0499267578125, "global_step": 187595, "epoch": 4466} {"train_loss": -6.971896171569824, "global_step": 187596, "epoch": 4466} {"train_loss": -7.143155097961426, "global_step": 187597, "epoch": 4466} {"train_loss": -7.07840633392334, "global_step": 187598, "epoch": 4466} {"train_loss": -7.139510154724121, "global_step": 187599, "epoch": 4466} {"train_loss": -7.194540023803711, "global_step": 187600, "epoch": 4466} {"train_loss": -7.128987789154053, "global_step": 187601, "epoch": 4466} {"train_loss": -7.115160942077637, "global_step": 187602, "epoch": 4466} {"train_loss": -7.179165840148926, "global_step": 187603, "epoch": 4466} {"train_loss": -7.173715591430664, "global_step": 187604, "epoch": 4466} {"train_loss": -7.137250900268555, "global_step": 187605, "epoch": 4466} {"train_loss": -7.130691051483154, "global_step": 187606, "epoch": 4466} {"train_loss": -7.140933990478516, "global_step": 187607, "epoch": 4466} {"train_loss": -7.168513298034668, "global_step": 187608, "epoch": 4466} {"train_loss": -6.933260917663574, "global_step": 187609, "epoch": 4466} {"train_loss": -7.211741924285889, "global_step": 187610, "epoch": 4466} {"train_loss": -7.177491188049316, "global_step": 187611, "epoch": 4466} {"train_loss": -7.240185260772705, "global_step": 187612, "epoch": 4466} {"train_loss": -7.157993748074486, "global_step": 187613, "epoch": 4466, "val_loss": 80993.1015625} {"train_loss": -7.145762920379639, "global_step": 187614, "epoch": 4467} {"train_loss": -7.170191764831543, "global_step": 187615, "epoch": 4467} {"train_loss": -7.242520332336426, "global_step": 187616, "epoch": 4467} {"train_loss": -7.256272315979004, "global_step": 187617, "epoch": 4467} {"train_loss": -7.23979377746582, "global_step": 187618, "epoch": 4467} {"train_loss": -7.284122467041016, "global_step": 187619, "epoch": 4467} {"train_loss": -7.246304035186768, "global_step": 187620, "epoch": 4467} {"train_loss": -7.223734378814697, "global_step": 187621, "epoch": 4467} {"train_loss": -7.310747146606445, "global_step": 187622, "epoch": 4467} {"train_loss": -7.286005020141602, "global_step": 187623, "epoch": 4467} {"train_loss": -7.261203765869141, "global_step": 187624, "epoch": 4467} {"train_loss": -7.292896747589111, "global_step": 187625, "epoch": 4467} {"train_loss": -7.142364501953125, "global_step": 187626, "epoch": 4467} {"train_loss": -7.1247124671936035, "global_step": 187627, "epoch": 4467} {"train_loss": -7.19293212890625, "global_step": 187628, "epoch": 4467} {"train_loss": -7.1659135818481445, "global_step": 187629, "epoch": 4467} {"train_loss": -7.163869857788086, "global_step": 187630, "epoch": 4467} {"train_loss": -7.2532548904418945, "global_step": 187631, "epoch": 4467} {"train_loss": -7.145910739898682, "global_step": 187632, "epoch": 4467} {"train_loss": -7.16592264175415, "global_step": 187633, "epoch": 4467} {"train_loss": -7.191255569458008, "global_step": 187634, "epoch": 4467} {"train_loss": -7.146062850952148, "global_step": 187635, "epoch": 4467} {"train_loss": -7.236059188842773, "global_step": 187636, "epoch": 4467} {"train_loss": -7.176930904388428, "global_step": 187637, "epoch": 4467} {"train_loss": -7.302034854888916, "global_step": 187638, "epoch": 4467} {"train_loss": -7.184093475341797, "global_step": 187639, "epoch": 4467} {"train_loss": -7.190303325653076, "global_step": 187640, "epoch": 4467} {"train_loss": -7.328128337860107, "global_step": 187641, "epoch": 4467} {"train_loss": -7.1664228439331055, "global_step": 187642, "epoch": 4467} {"train_loss": -7.255919933319092, "global_step": 187643, "epoch": 4467} {"train_loss": -7.172187805175781, "global_step": 187644, "epoch": 4467} {"train_loss": -7.1718926429748535, "global_step": 187645, "epoch": 4467} {"train_loss": -7.256156921386719, "global_step": 187646, "epoch": 4467} {"train_loss": -7.180458068847656, "global_step": 187647, "epoch": 4467} {"train_loss": -7.144070148468018, "global_step": 187648, "epoch": 4467} {"train_loss": -7.319183349609375, "global_step": 187649, "epoch": 4467} {"train_loss": -7.081779479980469, "global_step": 187650, "epoch": 4467} {"train_loss": -7.206137657165527, "global_step": 187651, "epoch": 4467} {"train_loss": -6.997103691101074, "global_step": 187652, "epoch": 4467} {"train_loss": -7.132090091705322, "global_step": 187653, "epoch": 4467} {"train_loss": -7.138895034790039, "global_step": 187654, "epoch": 4467} {"train_loss": -7.2033234891437345, "global_step": 187655, "epoch": 4467, "val_loss": 80947.0859375} {"train_loss": -7.151876449584961, "global_step": 187656, "epoch": 4468} {"train_loss": -7.190032958984375, "global_step": 187657, "epoch": 4468} {"train_loss": -7.210773944854736, "global_step": 187658, "epoch": 4468} {"train_loss": -7.170426845550537, "global_step": 187659, "epoch": 4468} {"train_loss": -7.205554008483887, "global_step": 187660, "epoch": 4468} {"train_loss": -7.277740478515625, "global_step": 187661, "epoch": 4468} {"train_loss": -7.247093200683594, "global_step": 187662, "epoch": 4468} {"train_loss": -7.066335678100586, "global_step": 187663, "epoch": 4468} {"train_loss": -7.142317771911621, "global_step": 187664, "epoch": 4468} {"train_loss": -7.146358489990234, "global_step": 187665, "epoch": 4468} {"train_loss": -7.150056838989258, "global_step": 187666, "epoch": 4468} {"train_loss": -7.184478759765625, "global_step": 187667, "epoch": 4468} {"train_loss": -7.160491466522217, "global_step": 187668, "epoch": 4468} {"train_loss": -7.146345138549805, "global_step": 187669, "epoch": 4468} {"train_loss": -7.182730674743652, "global_step": 187670, "epoch": 4468} {"train_loss": -7.240409851074219, "global_step": 187671, "epoch": 4468} {"train_loss": -7.141113758087158, "global_step": 187672, "epoch": 4468} {"train_loss": -7.289917945861816, "global_step": 187673, "epoch": 4468} {"train_loss": -7.200974941253662, "global_step": 187674, "epoch": 4468} {"train_loss": -7.22364616394043, "global_step": 187675, "epoch": 4468} {"train_loss": -7.173007965087891, "global_step": 187676, "epoch": 4468} {"train_loss": -7.190160274505615, "global_step": 187677, "epoch": 4468} {"train_loss": -7.287909507751465, "global_step": 187678, "epoch": 4468} {"train_loss": -7.187709808349609, "global_step": 187679, "epoch": 4468} {"train_loss": -7.2798285484313965, "global_step": 187680, "epoch": 4468} {"train_loss": -7.204370498657227, "global_step": 187681, "epoch": 4468} {"train_loss": -7.2223711013793945, "global_step": 187682, "epoch": 4468} {"train_loss": -7.1581315994262695, "global_step": 187683, "epoch": 4468} {"train_loss": -7.124450206756592, "global_step": 187684, "epoch": 4468} {"train_loss": -7.173988342285156, "global_step": 187685, "epoch": 4468} {"train_loss": -7.136065483093262, "global_step": 187686, "epoch": 4468} {"train_loss": -7.0867156982421875, "global_step": 187687, "epoch": 4468} {"train_loss": -7.098532676696777, "global_step": 187688, "epoch": 4468} {"train_loss": -7.17573881149292, "global_step": 187689, "epoch": 4468} {"train_loss": -7.119610786437988, "global_step": 187690, "epoch": 4468} {"train_loss": -6.988396644592285, "global_step": 187691, "epoch": 4468} {"train_loss": -7.210430145263672, "global_step": 187692, "epoch": 4468} {"train_loss": -7.200677871704102, "global_step": 187693, "epoch": 4468} {"train_loss": -7.1070332527160645, "global_step": 187694, "epoch": 4468} {"train_loss": -7.183745384216309, "global_step": 187695, "epoch": 4468} {"train_loss": -7.098345756530762, "global_step": 187696, "epoch": 4468} {"train_loss": -7.172091643015544, "global_step": 187697, "epoch": 4468, "val_loss": 81078.546875} {"train_loss": -6.9086103439331055, "global_step": 187698, "epoch": 4469} {"train_loss": -7.251856803894043, "global_step": 187699, "epoch": 4469} {"train_loss": -7.13134765625, "global_step": 187700, "epoch": 4469} {"train_loss": -7.069796562194824, "global_step": 187701, "epoch": 4469} {"train_loss": -7.104198455810547, "global_step": 187702, "epoch": 4469} {"train_loss": -7.127673149108887, "global_step": 187703, "epoch": 4469} {"train_loss": -7.290427207946777, "global_step": 187704, "epoch": 4469} {"train_loss": -6.996615409851074, "global_step": 187705, "epoch": 4469} {"train_loss": -7.185003280639648, "global_step": 187706, "epoch": 4469} {"train_loss": -7.121821880340576, "global_step": 187707, "epoch": 4469} {"train_loss": -7.029335975646973, "global_step": 187708, "epoch": 4469} {"train_loss": -7.126791000366211, "global_step": 187709, "epoch": 4469} {"train_loss": -7.091896057128906, "global_step": 187710, "epoch": 4469} {"train_loss": -7.101134300231934, "global_step": 187711, "epoch": 4469} {"train_loss": -7.217475891113281, "global_step": 187712, "epoch": 4469} {"train_loss": -7.2591776847839355, "global_step": 187713, "epoch": 4469} {"train_loss": -7.112554550170898, "global_step": 187714, "epoch": 4469} {"train_loss": -7.186494827270508, "global_step": 187715, "epoch": 4469} {"train_loss": -7.243501663208008, "global_step": 187716, "epoch": 4469} {"train_loss": -7.097690105438232, "global_step": 187717, "epoch": 4469} {"train_loss": -7.14796257019043, "global_step": 187718, "epoch": 4469} {"train_loss": -7.105212211608887, "global_step": 187719, "epoch": 4469} {"train_loss": -7.039677619934082, "global_step": 187720, "epoch": 4469} {"train_loss": -7.12808895111084, "global_step": 187721, "epoch": 4469} {"train_loss": -7.273290157318115, "global_step": 187722, "epoch": 4469} {"train_loss": -7.109167098999023, "global_step": 187723, "epoch": 4469} {"train_loss": -7.184269428253174, "global_step": 187724, "epoch": 4469} {"train_loss": -7.105027198791504, "global_step": 187725, "epoch": 4469} {"train_loss": -7.151933670043945, "global_step": 187726, "epoch": 4469} {"train_loss": -7.211615562438965, "global_step": 187727, "epoch": 4469} {"train_loss": -7.102451324462891, "global_step": 187728, "epoch": 4469} {"train_loss": -7.241560459136963, "global_step": 187729, "epoch": 4469} {"train_loss": -7.2460551261901855, "global_step": 187730, "epoch": 4469} {"train_loss": -7.066869258880615, "global_step": 187731, "epoch": 4469} {"train_loss": -7.223465919494629, "global_step": 187732, "epoch": 4469} {"train_loss": -7.148342609405518, "global_step": 187733, "epoch": 4469} {"train_loss": -7.137948036193848, "global_step": 187734, "epoch": 4469} {"train_loss": -7.086313724517822, "global_step": 187735, "epoch": 4469} {"train_loss": -7.274269104003906, "global_step": 187736, "epoch": 4469} {"train_loss": -7.140661716461182, "global_step": 187737, "epoch": 4469} {"train_loss": -7.258382797241211, "global_step": 187738, "epoch": 4469} {"train_loss": -7.147144578752064, "global_step": 187739, "epoch": 4469, "val_loss": 81021.4453125} {"train_loss": -7.002345561981201, "global_step": 187740, "epoch": 4470} {"train_loss": -7.2484283447265625, "global_step": 187741, "epoch": 4470} {"train_loss": -7.073220252990723, "global_step": 187742, "epoch": 4470} {"train_loss": -7.0895233154296875, "global_step": 187743, "epoch": 4470} {"train_loss": -7.218384742736816, "global_step": 187744, "epoch": 4470} {"train_loss": -7.1091084480285645, "global_step": 187745, "epoch": 4470} {"train_loss": -7.186636447906494, "global_step": 187746, "epoch": 4470} {"train_loss": -7.057116508483887, "global_step": 187747, "epoch": 4470} {"train_loss": -7.232070446014404, "global_step": 187748, "epoch": 4470} {"train_loss": -7.243898391723633, "global_step": 187749, "epoch": 4470} {"train_loss": -7.143520355224609, "global_step": 187750, "epoch": 4470} {"train_loss": -7.240121841430664, "global_step": 187751, "epoch": 4470} {"train_loss": -7.2434844970703125, "global_step": 187752, "epoch": 4470} {"train_loss": -7.14747428894043, "global_step": 187753, "epoch": 4470} {"train_loss": -7.1893768310546875, "global_step": 187754, "epoch": 4470} {"train_loss": -7.244427680969238, "global_step": 187755, "epoch": 4470} {"train_loss": -7.280919075012207, "global_step": 187756, "epoch": 4470} {"train_loss": -7.221141815185547, "global_step": 187757, "epoch": 4470} {"train_loss": -7.26704740524292, "global_step": 187758, "epoch": 4470} {"train_loss": -7.134519577026367, "global_step": 187759, "epoch": 4470} {"train_loss": -7.158091068267822, "global_step": 187760, "epoch": 4470} {"train_loss": -7.296667098999023, "global_step": 187761, "epoch": 4470} {"train_loss": -7.187659740447998, "global_step": 187762, "epoch": 4470} {"train_loss": -7.211639404296875, "global_step": 187763, "epoch": 4470} {"train_loss": -7.285333633422852, "global_step": 187764, "epoch": 4470} {"train_loss": -7.193376064300537, "global_step": 187765, "epoch": 4470} {"train_loss": -7.20646333694458, "global_step": 187766, "epoch": 4470} {"train_loss": -7.204094886779785, "global_step": 187767, "epoch": 4470} {"train_loss": -7.284104824066162, "global_step": 187768, "epoch": 4470} {"train_loss": -7.240655899047852, "global_step": 187769, "epoch": 4470} {"train_loss": -7.328704833984375, "global_step": 187770, "epoch": 4470} {"train_loss": -7.193682670593262, "global_step": 187771, "epoch": 4470} {"train_loss": -7.256680488586426, "global_step": 187772, "epoch": 4470} {"train_loss": -7.32591438293457, "global_step": 187773, "epoch": 4470} {"train_loss": -7.271827697753906, "global_step": 187774, "epoch": 4470} {"train_loss": -7.23922872543335, "global_step": 187775, "epoch": 4470} {"train_loss": -7.2294816970825195, "global_step": 187776, "epoch": 4470} {"train_loss": -7.225200653076172, "global_step": 187777, "epoch": 4470} {"train_loss": -7.195585250854492, "global_step": 187778, "epoch": 4470} {"train_loss": -7.189004898071289, "global_step": 187779, "epoch": 4470} {"train_loss": -7.172173500061035, "global_step": 187780, "epoch": 4470} {"train_loss": -7.207556815374465, "global_step": 187781, "epoch": 4470, "val_loss": 80694.1015625} {"train_loss": -7.260012149810791, "global_step": 187782, "epoch": 4471} {"train_loss": -7.153942108154297, "global_step": 187783, "epoch": 4471} {"train_loss": -7.2422590255737305, "global_step": 187784, "epoch": 4471} {"train_loss": -7.142436981201172, "global_step": 187785, "epoch": 4471} {"train_loss": -7.203711032867432, "global_step": 187786, "epoch": 4471} {"train_loss": -7.280263900756836, "global_step": 187787, "epoch": 4471} {"train_loss": -7.225038051605225, "global_step": 187788, "epoch": 4471} {"train_loss": -7.205133438110352, "global_step": 187789, "epoch": 4471} {"train_loss": -7.320959091186523, "global_step": 187790, "epoch": 4471} {"train_loss": -7.197345733642578, "global_step": 187791, "epoch": 4471} {"train_loss": -7.3177337646484375, "global_step": 187792, "epoch": 4471} {"train_loss": -7.148283958435059, "global_step": 187793, "epoch": 4471} {"train_loss": -7.2640862464904785, "global_step": 187794, "epoch": 4471} {"train_loss": -7.30538272857666, "global_step": 187795, "epoch": 4471} {"train_loss": -7.2386627197265625, "global_step": 187796, "epoch": 4471} {"train_loss": -7.239401817321777, "global_step": 187797, "epoch": 4471} {"train_loss": -7.3191752433776855, "global_step": 187798, "epoch": 4471} {"train_loss": -7.167893409729004, "global_step": 187799, "epoch": 4471} {"train_loss": -7.29075813293457, "global_step": 187800, "epoch": 4471} {"train_loss": -7.171516418457031, "global_step": 187801, "epoch": 4471} {"train_loss": -7.264360427856445, "global_step": 187802, "epoch": 4471} {"train_loss": -7.171450614929199, "global_step": 187803, "epoch": 4471} {"train_loss": -7.215075969696045, "global_step": 187804, "epoch": 4471} {"train_loss": -7.1572771072387695, "global_step": 187805, "epoch": 4471} {"train_loss": -7.209179401397705, "global_step": 187806, "epoch": 4471} {"train_loss": -7.1672163009643555, "global_step": 187807, "epoch": 4471} {"train_loss": -7.025264263153076, "global_step": 187808, "epoch": 4471} {"train_loss": -7.277612686157227, "global_step": 187809, "epoch": 4471} {"train_loss": -7.217074394226074, "global_step": 187810, "epoch": 4471} {"train_loss": -7.2501983642578125, "global_step": 187811, "epoch": 4471} {"train_loss": -7.153626441955566, "global_step": 187812, "epoch": 4471} {"train_loss": -7.135320663452148, "global_step": 187813, "epoch": 4471} {"train_loss": -7.172889709472656, "global_step": 187814, "epoch": 4471} {"train_loss": -7.236396789550781, "global_step": 187815, "epoch": 4471} {"train_loss": -7.158840179443359, "global_step": 187816, "epoch": 4471} {"train_loss": -7.209929466247559, "global_step": 187817, "epoch": 4471} {"train_loss": -7.188475608825684, "global_step": 187818, "epoch": 4471} {"train_loss": -7.077076435089111, "global_step": 187819, "epoch": 4471} {"train_loss": -7.225870132446289, "global_step": 187820, "epoch": 4471} {"train_loss": -7.21699333190918, "global_step": 187821, "epoch": 4471} {"train_loss": -6.9860758781433105, "global_step": 187822, "epoch": 4471} {"train_loss": -7.203773566654751, "global_step": 187823, "epoch": 4471, "val_loss": 81003.6484375} {"train_loss": -7.237274169921875, "global_step": 187824, "epoch": 4472} {"train_loss": -7.245276927947998, "global_step": 187825, "epoch": 4472} {"train_loss": -7.029736518859863, "global_step": 187826, "epoch": 4472} {"train_loss": -7.1652679443359375, "global_step": 187827, "epoch": 4472} {"train_loss": -7.0747880935668945, "global_step": 187828, "epoch": 4472} {"train_loss": -7.2283501625061035, "global_step": 187829, "epoch": 4472} {"train_loss": -7.128874778747559, "global_step": 187830, "epoch": 4472} {"train_loss": -7.267481803894043, "global_step": 187831, "epoch": 4472} {"train_loss": -7.226494312286377, "global_step": 187832, "epoch": 4472} {"train_loss": -7.169989109039307, "global_step": 187833, "epoch": 4472} {"train_loss": -7.183651924133301, "global_step": 187834, "epoch": 4472} {"train_loss": -7.165975093841553, "global_step": 187835, "epoch": 4472} {"train_loss": -7.138383388519287, "global_step": 187836, "epoch": 4472} {"train_loss": -7.212284088134766, "global_step": 187837, "epoch": 4472} {"train_loss": -7.097344398498535, "global_step": 187838, "epoch": 4472} {"train_loss": -7.17678689956665, "global_step": 187839, "epoch": 4472} {"train_loss": -7.232587814331055, "global_step": 187840, "epoch": 4472} {"train_loss": -7.102667808532715, "global_step": 187841, "epoch": 4472} {"train_loss": -7.1185784339904785, "global_step": 187842, "epoch": 4472} {"train_loss": -7.201883316040039, "global_step": 187843, "epoch": 4472} {"train_loss": -7.315191268920898, "global_step": 187844, "epoch": 4472} {"train_loss": -7.101312637329102, "global_step": 187845, "epoch": 4472} {"train_loss": -7.196225166320801, "global_step": 187846, "epoch": 4472} {"train_loss": -7.264951705932617, "global_step": 187847, "epoch": 4472} {"train_loss": -7.342232704162598, "global_step": 187848, "epoch": 4472} {"train_loss": -7.275643825531006, "global_step": 187849, "epoch": 4472} {"train_loss": -7.114961624145508, "global_step": 187850, "epoch": 4472} {"train_loss": -7.223574638366699, "global_step": 187851, "epoch": 4472} {"train_loss": -7.124520301818848, "global_step": 187852, "epoch": 4472} {"train_loss": -7.248599529266357, "global_step": 187853, "epoch": 4472} {"train_loss": -7.262204170227051, "global_step": 187854, "epoch": 4472} {"train_loss": -7.279487133026123, "global_step": 187855, "epoch": 4472} {"train_loss": -7.23388671875, "global_step": 187856, "epoch": 4472} {"train_loss": -7.195781707763672, "global_step": 187857, "epoch": 4472} {"train_loss": -7.101145267486572, "global_step": 187858, "epoch": 4472} {"train_loss": -7.2098588943481445, "global_step": 187859, "epoch": 4472} {"train_loss": -7.1983232498168945, "global_step": 187860, "epoch": 4472} {"train_loss": -7.251265525817871, "global_step": 187861, "epoch": 4472} {"train_loss": -7.273105621337891, "global_step": 187862, "epoch": 4472} {"train_loss": -7.258135795593262, "global_step": 187863, "epoch": 4472} {"train_loss": -7.189058303833008, "global_step": 187864, "epoch": 4472} {"train_loss": -7.1990319320133755, "global_step": 187865, "epoch": 4472, "val_loss": 80819.0} {"train_loss": -7.11224889755249, "global_step": 187866, "epoch": 4473} {"train_loss": -7.121865749359131, "global_step": 187867, "epoch": 4473} {"train_loss": -7.0262346267700195, "global_step": 187868, "epoch": 4473} {"train_loss": -7.176902770996094, "global_step": 187869, "epoch": 4473} {"train_loss": -7.199272155761719, "global_step": 187870, "epoch": 4473} {"train_loss": -7.078078269958496, "global_step": 187871, "epoch": 4473} {"train_loss": -7.342511177062988, "global_step": 187872, "epoch": 4473} {"train_loss": -7.212790012359619, "global_step": 187873, "epoch": 4473} {"train_loss": -7.186025142669678, "global_step": 187874, "epoch": 4473} {"train_loss": -7.2147979736328125, "global_step": 187875, "epoch": 4473} {"train_loss": -7.112361907958984, "global_step": 187876, "epoch": 4473} {"train_loss": -7.196954250335693, "global_step": 187877, "epoch": 4473} {"train_loss": -7.196311950683594, "global_step": 187878, "epoch": 4473} {"train_loss": -7.127900123596191, "global_step": 187879, "epoch": 4473} {"train_loss": -7.295370101928711, "global_step": 187880, "epoch": 4473} {"train_loss": -7.1712870597839355, "global_step": 187881, "epoch": 4473} {"train_loss": -7.248075485229492, "global_step": 187882, "epoch": 4473} {"train_loss": -7.127711296081543, "global_step": 187883, "epoch": 4473} {"train_loss": -7.236300468444824, "global_step": 187884, "epoch": 4473} {"train_loss": -7.1631693840026855, "global_step": 187885, "epoch": 4473} {"train_loss": -7.1488494873046875, "global_step": 187886, "epoch": 4473} {"train_loss": -7.181465148925781, "global_step": 187887, "epoch": 4473} {"train_loss": -7.286797046661377, "global_step": 187888, "epoch": 4473} {"train_loss": -7.232699394226074, "global_step": 187889, "epoch": 4473} {"train_loss": -7.215900421142578, "global_step": 187890, "epoch": 4473} {"train_loss": -7.1356658935546875, "global_step": 187891, "epoch": 4473} {"train_loss": -7.180810451507568, "global_step": 187892, "epoch": 4473} {"train_loss": -7.113629341125488, "global_step": 187893, "epoch": 4473} {"train_loss": -7.147204399108887, "global_step": 187894, "epoch": 4473} {"train_loss": -7.342239856719971, "global_step": 187895, "epoch": 4473} {"train_loss": -6.940516471862793, "global_step": 187896, "epoch": 4473} {"train_loss": -7.147078037261963, "global_step": 187897, "epoch": 4473} {"train_loss": -7.260808944702148, "global_step": 187898, "epoch": 4473} {"train_loss": -7.019604206085205, "global_step": 187899, "epoch": 4473} {"train_loss": -7.132510185241699, "global_step": 187900, "epoch": 4473} {"train_loss": -7.270144939422607, "global_step": 187901, "epoch": 4473} {"train_loss": -7.023656845092773, "global_step": 187902, "epoch": 4473} {"train_loss": -7.143425941467285, "global_step": 187903, "epoch": 4473} {"train_loss": -7.109549522399902, "global_step": 187904, "epoch": 4473} {"train_loss": -7.059981346130371, "global_step": 187905, "epoch": 4473} {"train_loss": -7.1954474449157715, "global_step": 187906, "epoch": 4473} {"train_loss": -7.167848689215524, "global_step": 187907, "epoch": 4473, "val_loss": 81163.3671875} {"train_loss": -7.167162895202637, "global_step": 187908, "epoch": 4474} {"train_loss": -7.26004695892334, "global_step": 187909, "epoch": 4474} {"train_loss": -7.169201850891113, "global_step": 187910, "epoch": 4474} {"train_loss": -7.093245506286621, "global_step": 187911, "epoch": 4474} {"train_loss": -7.156793117523193, "global_step": 187912, "epoch": 4474} {"train_loss": -7.074100494384766, "global_step": 187913, "epoch": 4474} {"train_loss": -7.311408996582031, "global_step": 187914, "epoch": 4474} {"train_loss": -7.0277099609375, "global_step": 187915, "epoch": 4474} {"train_loss": -7.206995487213135, "global_step": 187916, "epoch": 4474} {"train_loss": -7.176119804382324, "global_step": 187917, "epoch": 4474} {"train_loss": -7.2189531326293945, "global_step": 187918, "epoch": 4474} {"train_loss": -7.206103324890137, "global_step": 187919, "epoch": 4474} {"train_loss": -7.164433479309082, "global_step": 187920, "epoch": 4474} {"train_loss": -7.176633358001709, "global_step": 187921, "epoch": 4474} {"train_loss": -7.1618146896362305, "global_step": 187922, "epoch": 4474} {"train_loss": -7.12089729309082, "global_step": 187923, "epoch": 4474} {"train_loss": -7.229887962341309, "global_step": 187924, "epoch": 4474} {"train_loss": -7.084268569946289, "global_step": 187925, "epoch": 4474} {"train_loss": -7.141094207763672, "global_step": 187926, "epoch": 4474} {"train_loss": -7.102178573608398, "global_step": 187927, "epoch": 4474} {"train_loss": -7.136999130249023, "global_step": 187928, "epoch": 4474} {"train_loss": -7.205606937408447, "global_step": 187929, "epoch": 4474} {"train_loss": -7.058351516723633, "global_step": 187930, "epoch": 4474} {"train_loss": -7.188140869140625, "global_step": 187931, "epoch": 4474} {"train_loss": -7.131888389587402, "global_step": 187932, "epoch": 4474} {"train_loss": -7.206088542938232, "global_step": 187933, "epoch": 4474} {"train_loss": -7.188746452331543, "global_step": 187934, "epoch": 4474} {"train_loss": -7.201212406158447, "global_step": 187935, "epoch": 4474} {"train_loss": -7.131076812744141, "global_step": 187936, "epoch": 4474} {"train_loss": -7.084559917449951, "global_step": 187937, "epoch": 4474} {"train_loss": -7.207118034362793, "global_step": 187938, "epoch": 4474} {"train_loss": -7.159036636352539, "global_step": 187939, "epoch": 4474} {"train_loss": -7.0613813400268555, "global_step": 187940, "epoch": 4474} {"train_loss": -7.20952033996582, "global_step": 187941, "epoch": 4474} {"train_loss": -7.232564926147461, "global_step": 187942, "epoch": 4474} {"train_loss": -7.152871131896973, "global_step": 187943, "epoch": 4474} {"train_loss": -7.185024261474609, "global_step": 187944, "epoch": 4474} {"train_loss": -7.230502128601074, "global_step": 187945, "epoch": 4474} {"train_loss": -7.098084449768066, "global_step": 187946, "epoch": 4474} {"train_loss": -7.250358581542969, "global_step": 187947, "epoch": 4474} {"train_loss": -7.1081390380859375, "global_step": 187948, "epoch": 4474} {"train_loss": -7.164680855614798, "global_step": 187949, "epoch": 4474, "val_loss": 80901.5625} {"train_loss": -7.141007423400879, "global_step": 187950, "epoch": 4475} {"train_loss": -7.033938407897949, "global_step": 187951, "epoch": 4475} {"train_loss": -6.929604530334473, "global_step": 187952, "epoch": 4475} {"train_loss": -7.168835163116455, "global_step": 187953, "epoch": 4475} {"train_loss": -7.020592212677002, "global_step": 187954, "epoch": 4475} {"train_loss": -7.186707496643066, "global_step": 187955, "epoch": 4475} {"train_loss": -7.011753082275391, "global_step": 187956, "epoch": 4475} {"train_loss": -7.179001808166504, "global_step": 187957, "epoch": 4475} {"train_loss": -7.21565055847168, "global_step": 187958, "epoch": 4475} {"train_loss": -6.956916332244873, "global_step": 187959, "epoch": 4475} {"train_loss": -7.044372081756592, "global_step": 187960, "epoch": 4475} {"train_loss": -7.089868068695068, "global_step": 187961, "epoch": 4475} {"train_loss": -7.061520576477051, "global_step": 187962, "epoch": 4475} {"train_loss": -7.011669158935547, "global_step": 187963, "epoch": 4475} {"train_loss": -7.329439163208008, "global_step": 187964, "epoch": 4475} {"train_loss": -7.050075531005859, "global_step": 187965, "epoch": 4475} {"train_loss": -7.269613265991211, "global_step": 187966, "epoch": 4475} {"train_loss": -7.043022155761719, "global_step": 187967, "epoch": 4475} {"train_loss": -7.1188788414001465, "global_step": 187968, "epoch": 4475} {"train_loss": -7.112824440002441, "global_step": 187969, "epoch": 4475} {"train_loss": -7.145342826843262, "global_step": 187970, "epoch": 4475} {"train_loss": -7.074746608734131, "global_step": 187971, "epoch": 4475} {"train_loss": -7.22266960144043, "global_step": 187972, "epoch": 4475} {"train_loss": -7.021764755249023, "global_step": 187973, "epoch": 4475} {"train_loss": -7.255982875823975, "global_step": 187974, "epoch": 4475} {"train_loss": -7.120785236358643, "global_step": 187975, "epoch": 4475} {"train_loss": -6.9143877029418945, "global_step": 187976, "epoch": 4475} {"train_loss": -6.988531112670898, "global_step": 187977, "epoch": 4475} {"train_loss": -7.141516208648682, "global_step": 187978, "epoch": 4475} {"train_loss": -7.111952781677246, "global_step": 187979, "epoch": 4475} {"train_loss": -7.0133256912231445, "global_step": 187980, "epoch": 4475} {"train_loss": -7.146457672119141, "global_step": 187981, "epoch": 4475} {"train_loss": -7.144899368286133, "global_step": 187982, "epoch": 4475} {"train_loss": -7.270059585571289, "global_step": 187983, "epoch": 4475} {"train_loss": -7.12887716293335, "global_step": 187984, "epoch": 4475} {"train_loss": -7.219336986541748, "global_step": 187985, "epoch": 4475} {"train_loss": -7.077425956726074, "global_step": 187986, "epoch": 4475} {"train_loss": -7.185628890991211, "global_step": 187987, "epoch": 4475} {"train_loss": -7.116254806518555, "global_step": 187988, "epoch": 4475} {"train_loss": -7.214010238647461, "global_step": 187989, "epoch": 4475} {"train_loss": -7.195903778076172, "global_step": 187990, "epoch": 4475} {"train_loss": -7.116517259961083, "global_step": 187991, "epoch": 4475, "val_loss": 80722.6796875} {"train_loss": -7.172794342041016, "global_step": 187992, "epoch": 4476} {"train_loss": -7.161526203155518, "global_step": 187993, "epoch": 4476} {"train_loss": -7.180814266204834, "global_step": 187994, "epoch": 4476} {"train_loss": -7.154529571533203, "global_step": 187995, "epoch": 4476} {"train_loss": -7.251962661743164, "global_step": 187996, "epoch": 4476} {"train_loss": -7.225620269775391, "global_step": 187997, "epoch": 4476} {"train_loss": -7.220520496368408, "global_step": 187998, "epoch": 4476} {"train_loss": -7.205558776855469, "global_step": 187999, "epoch": 4476} {"train_loss": -7.153223037719727, "global_step": 188000, "epoch": 4476} {"train_loss": -7.167020797729492, "global_step": 188001, "epoch": 4476} {"train_loss": -7.275638580322266, "global_step": 188002, "epoch": 4476} {"train_loss": -7.271624565124512, "global_step": 188003, "epoch": 4476} {"train_loss": -7.232936859130859, "global_step": 188004, "epoch": 4476} {"train_loss": -7.190686225891113, "global_step": 188005, "epoch": 4476} {"train_loss": -7.2109055519104, "global_step": 188006, "epoch": 4476} {"train_loss": -7.246318817138672, "global_step": 188007, "epoch": 4476} {"train_loss": -7.131145000457764, "global_step": 188008, "epoch": 4476} {"train_loss": -7.185651779174805, "global_step": 188009, "epoch": 4476} {"train_loss": -7.254367828369141, "global_step": 188010, "epoch": 4476} {"train_loss": -7.175138473510742, "global_step": 188011, "epoch": 4476} {"train_loss": -7.201516151428223, "global_step": 188012, "epoch": 4476} {"train_loss": -7.264606475830078, "global_step": 188013, "epoch": 4476} {"train_loss": -7.185070991516113, "global_step": 188014, "epoch": 4476} {"train_loss": -7.009838581085205, "global_step": 188015, "epoch": 4476} {"train_loss": -7.195201396942139, "global_step": 188016, "epoch": 4476} {"train_loss": -7.275848388671875, "global_step": 188017, "epoch": 4476} {"train_loss": -7.0540266036987305, "global_step": 188018, "epoch": 4476} {"train_loss": -7.237318992614746, "global_step": 188019, "epoch": 4476} {"train_loss": -7.158080101013184, "global_step": 188020, "epoch": 4476} {"train_loss": -7.155848026275635, "global_step": 188021, "epoch": 4476} {"train_loss": -7.175716400146484, "global_step": 188022, "epoch": 4476} {"train_loss": -7.283720016479492, "global_step": 188023, "epoch": 4476} {"train_loss": -7.1138176918029785, "global_step": 188024, "epoch": 4476} {"train_loss": -7.145538330078125, "global_step": 188025, "epoch": 4476} {"train_loss": -7.167243957519531, "global_step": 188026, "epoch": 4476} {"train_loss": -7.179276466369629, "global_step": 188027, "epoch": 4476} {"train_loss": -7.180785179138184, "global_step": 188028, "epoch": 4476} {"train_loss": -7.264479637145996, "global_step": 188029, "epoch": 4476} {"train_loss": -7.108307838439941, "global_step": 188030, "epoch": 4476} {"train_loss": -7.149669647216797, "global_step": 188031, "epoch": 4476} {"train_loss": -7.205832481384277, "global_step": 188032, "epoch": 4476} {"train_loss": -7.188628548667545, "global_step": 188033, "epoch": 4476, "val_loss": 81176.1484375} {"train_loss": -7.185418128967285, "global_step": 188034, "epoch": 4477} {"train_loss": -7.258117198944092, "global_step": 188035, "epoch": 4477} {"train_loss": -7.204875469207764, "global_step": 188036, "epoch": 4477} {"train_loss": -7.152948379516602, "global_step": 188037, "epoch": 4477} {"train_loss": -7.363496780395508, "global_step": 188038, "epoch": 4477} {"train_loss": -7.255578994750977, "global_step": 188039, "epoch": 4477} {"train_loss": -7.111722946166992, "global_step": 188040, "epoch": 4477} {"train_loss": -7.245433330535889, "global_step": 188041, "epoch": 4477} {"train_loss": -7.187197208404541, "global_step": 188042, "epoch": 4477} {"train_loss": -7.16541051864624, "global_step": 188043, "epoch": 4477} {"train_loss": -7.018647193908691, "global_step": 188044, "epoch": 4477} {"train_loss": -7.05470085144043, "global_step": 188045, "epoch": 4477} {"train_loss": -7.29727840423584, "global_step": 188046, "epoch": 4477} {"train_loss": -7.143177032470703, "global_step": 188047, "epoch": 4477} {"train_loss": -7.207843780517578, "global_step": 188048, "epoch": 4477} {"train_loss": -7.205225944519043, "global_step": 188049, "epoch": 4477} {"train_loss": -7.182866096496582, "global_step": 188050, "epoch": 4477} {"train_loss": -7.1754302978515625, "global_step": 188051, "epoch": 4477} {"train_loss": -7.21510648727417, "global_step": 188052, "epoch": 4477} {"train_loss": -7.2304368019104, "global_step": 188053, "epoch": 4477} {"train_loss": -7.094757080078125, "global_step": 188054, "epoch": 4477} {"train_loss": -7.1912922859191895, "global_step": 188055, "epoch": 4477} {"train_loss": -7.186348915100098, "global_step": 188056, "epoch": 4477} {"train_loss": -7.066637992858887, "global_step": 188057, "epoch": 4477} {"train_loss": -7.198570251464844, "global_step": 188058, "epoch": 4477} {"train_loss": -7.309010982513428, "global_step": 188059, "epoch": 4477} {"train_loss": -7.174410343170166, "global_step": 188060, "epoch": 4477} {"train_loss": -7.296229839324951, "global_step": 188061, "epoch": 4477} {"train_loss": -7.176953315734863, "global_step": 188062, "epoch": 4477} {"train_loss": -7.294595718383789, "global_step": 188063, "epoch": 4477} {"train_loss": -7.218019962310791, "global_step": 188064, "epoch": 4477} {"train_loss": -7.237967491149902, "global_step": 188065, "epoch": 4477} {"train_loss": -7.303460121154785, "global_step": 188066, "epoch": 4477} {"train_loss": -7.166333198547363, "global_step": 188067, "epoch": 4477} {"train_loss": -7.269101619720459, "global_step": 188068, "epoch": 4477} {"train_loss": -7.261863708496094, "global_step": 188069, "epoch": 4477} {"train_loss": -7.236750602722168, "global_step": 188070, "epoch": 4477} {"train_loss": -7.212900161743164, "global_step": 188071, "epoch": 4477} {"train_loss": -7.162596702575684, "global_step": 188072, "epoch": 4477} {"train_loss": -7.2953033447265625, "global_step": 188073, "epoch": 4477} {"train_loss": -7.188506126403809, "global_step": 188074, "epoch": 4477} {"train_loss": -7.206210011527652, "global_step": 188075, "epoch": 4477, "val_loss": 80889.8125} {"train_loss": -7.256888389587402, "global_step": 188076, "epoch": 4478} {"train_loss": -7.273541450500488, "global_step": 188077, "epoch": 4478} {"train_loss": -7.239588737487793, "global_step": 188078, "epoch": 4478} {"train_loss": -7.101933479309082, "global_step": 188079, "epoch": 4478} {"train_loss": -7.270493984222412, "global_step": 188080, "epoch": 4478} {"train_loss": -7.360881328582764, "global_step": 188081, "epoch": 4478} {"train_loss": -7.144870758056641, "global_step": 188082, "epoch": 4478} {"train_loss": -7.174872875213623, "global_step": 188083, "epoch": 4478} {"train_loss": -7.250744819641113, "global_step": 188084, "epoch": 4478} {"train_loss": -7.218456268310547, "global_step": 188085, "epoch": 4478} {"train_loss": -7.167434215545654, "global_step": 188086, "epoch": 4478} {"train_loss": -7.107228755950928, "global_step": 188087, "epoch": 4478} {"train_loss": -7.063695430755615, "global_step": 188088, "epoch": 4478} {"train_loss": -6.973530292510986, "global_step": 188089, "epoch": 4478} {"train_loss": -7.14003849029541, "global_step": 188090, "epoch": 4478} {"train_loss": -6.857903480529785, "global_step": 188091, "epoch": 4478} {"train_loss": -7.0425848960876465, "global_step": 188092, "epoch": 4478} {"train_loss": -6.9983320236206055, "global_step": 188093, "epoch": 4478} {"train_loss": -6.933610439300537, "global_step": 188094, "epoch": 4478} {"train_loss": -7.114204406738281, "global_step": 188095, "epoch": 4478} {"train_loss": -7.116033554077148, "global_step": 188096, "epoch": 4478} {"train_loss": -7.088685989379883, "global_step": 188097, "epoch": 4478} {"train_loss": -7.028499126434326, "global_step": 188098, "epoch": 4478} {"train_loss": -7.17793083190918, "global_step": 188099, "epoch": 4478} {"train_loss": -7.108039855957031, "global_step": 188100, "epoch": 4478} {"train_loss": -7.231439590454102, "global_step": 188101, "epoch": 4478} {"train_loss": -6.9805989265441895, "global_step": 188102, "epoch": 4478} {"train_loss": -7.130763053894043, "global_step": 188103, "epoch": 4478} {"train_loss": -7.095633506774902, "global_step": 188104, "epoch": 4478} {"train_loss": -7.067198753356934, "global_step": 188105, "epoch": 4478} {"train_loss": -7.073410511016846, "global_step": 188106, "epoch": 4478} {"train_loss": -7.068964004516602, "global_step": 188107, "epoch": 4478} {"train_loss": -7.167690277099609, "global_step": 188108, "epoch": 4478} {"train_loss": -7.102008819580078, "global_step": 188109, "epoch": 4478} {"train_loss": -7.170974254608154, "global_step": 188110, "epoch": 4478} {"train_loss": -7.004171371459961, "global_step": 188111, "epoch": 4478} {"train_loss": -7.04897403717041, "global_step": 188112, "epoch": 4478} {"train_loss": -7.105837821960449, "global_step": 188113, "epoch": 4478} {"train_loss": -7.057289123535156, "global_step": 188114, "epoch": 4478} {"train_loss": -7.177698135375977, "global_step": 188115, "epoch": 4478} {"train_loss": -7.105974197387695, "global_step": 188116, "epoch": 4478} {"train_loss": -7.118660677047003, "global_step": 188117, "epoch": 4478, "val_loss": 80992.1875} {"train_loss": -7.236303806304932, "global_step": 188118, "epoch": 4479} {"train_loss": -7.177689552307129, "global_step": 188119, "epoch": 4479} {"train_loss": -7.3149003982543945, "global_step": 188120, "epoch": 4479} {"train_loss": -7.202503204345703, "global_step": 188121, "epoch": 4479} {"train_loss": -7.205511569976807, "global_step": 188122, "epoch": 4479} {"train_loss": -7.16918420791626, "global_step": 188123, "epoch": 4479} {"train_loss": -7.193886756896973, "global_step": 188124, "epoch": 4479} {"train_loss": -7.218172073364258, "global_step": 188125, "epoch": 4479} {"train_loss": -7.2492876052856445, "global_step": 188126, "epoch": 4479} {"train_loss": -7.21242094039917, "global_step": 188127, "epoch": 4479} {"train_loss": -7.21790075302124, "global_step": 188128, "epoch": 4479} {"train_loss": -7.195222854614258, "global_step": 188129, "epoch": 4479} {"train_loss": -7.280672073364258, "global_step": 188130, "epoch": 4479} {"train_loss": -7.277071475982666, "global_step": 188131, "epoch": 4479} {"train_loss": -7.202479362487793, "global_step": 188132, "epoch": 4479} {"train_loss": -7.246960163116455, "global_step": 188133, "epoch": 4479} {"train_loss": -7.295375347137451, "global_step": 188134, "epoch": 4479} {"train_loss": -7.19096565246582, "global_step": 188135, "epoch": 4479} {"train_loss": -7.196999549865723, "global_step": 188136, "epoch": 4479} {"train_loss": -7.309202194213867, "global_step": 188137, "epoch": 4479} {"train_loss": -7.20582389831543, "global_step": 188138, "epoch": 4479} {"train_loss": -7.099366664886475, "global_step": 188139, "epoch": 4479} {"train_loss": -7.324868202209473, "global_step": 188140, "epoch": 4479} {"train_loss": -7.132361888885498, "global_step": 188141, "epoch": 4479} {"train_loss": -7.047863960266113, "global_step": 188142, "epoch": 4479} {"train_loss": -7.304867744445801, "global_step": 188143, "epoch": 4479} {"train_loss": -7.215455055236816, "global_step": 188144, "epoch": 4479} {"train_loss": -7.146892070770264, "global_step": 188145, "epoch": 4479} {"train_loss": -7.184013366699219, "global_step": 188146, "epoch": 4479} {"train_loss": -7.197258949279785, "global_step": 188147, "epoch": 4479} {"train_loss": -7.100797653198242, "global_step": 188148, "epoch": 4479} {"train_loss": -7.26593542098999, "global_step": 188149, "epoch": 4479} {"train_loss": -7.202223777770996, "global_step": 188150, "epoch": 4479} {"train_loss": -7.195014953613281, "global_step": 188151, "epoch": 4479} {"train_loss": -7.283764839172363, "global_step": 188152, "epoch": 4479} {"train_loss": -7.214580535888672, "global_step": 188153, "epoch": 4479} {"train_loss": -7.249106407165527, "global_step": 188154, "epoch": 4479} {"train_loss": -7.18568229675293, "global_step": 188155, "epoch": 4479} {"train_loss": -7.257030010223389, "global_step": 188156, "epoch": 4479} {"train_loss": -7.133193492889404, "global_step": 188157, "epoch": 4479} {"train_loss": -7.240331172943115, "global_step": 188158, "epoch": 4479} {"train_loss": -7.213933161326817, "global_step": 188159, "epoch": 4479, "val_loss": 80966.734375} {"train_loss": -7.237552165985107, "global_step": 188160, "epoch": 4480} {"train_loss": -7.209399223327637, "global_step": 188161, "epoch": 4480} {"train_loss": -7.1396355628967285, "global_step": 188162, "epoch": 4480} {"train_loss": -7.151569843292236, "global_step": 188163, "epoch": 4480} {"train_loss": -7.219121932983398, "global_step": 188164, "epoch": 4480} {"train_loss": -7.2071733474731445, "global_step": 188165, "epoch": 4480} {"train_loss": -7.247778415679932, "global_step": 188166, "epoch": 4480} {"train_loss": -7.308656692504883, "global_step": 188167, "epoch": 4480} {"train_loss": -7.214077472686768, "global_step": 188168, "epoch": 4480} {"train_loss": -7.264479637145996, "global_step": 188169, "epoch": 4480} {"train_loss": -7.343287467956543, "global_step": 188170, "epoch": 4480} {"train_loss": -7.042478561401367, "global_step": 188171, "epoch": 4480} {"train_loss": -7.20114803314209, "global_step": 188172, "epoch": 4480} {"train_loss": -7.185581207275391, "global_step": 188173, "epoch": 4480} {"train_loss": -7.134772300720215, "global_step": 188174, "epoch": 4480} {"train_loss": -7.293344020843506, "global_step": 188175, "epoch": 4480} {"train_loss": -7.237696647644043, "global_step": 188176, "epoch": 4480} {"train_loss": -7.217322826385498, "global_step": 188177, "epoch": 4480} {"train_loss": -7.183812618255615, "global_step": 188178, "epoch": 4480} {"train_loss": -7.2195725440979, "global_step": 188179, "epoch": 4480} {"train_loss": -7.3054938316345215, "global_step": 188180, "epoch": 4480} {"train_loss": -7.170419216156006, "global_step": 188181, "epoch": 4480} {"train_loss": -7.1164679527282715, "global_step": 188182, "epoch": 4480} {"train_loss": -7.313149452209473, "global_step": 188183, "epoch": 4480} {"train_loss": -7.10936164855957, "global_step": 188184, "epoch": 4480} {"train_loss": -7.207492828369141, "global_step": 188185, "epoch": 4480} {"train_loss": -7.050573348999023, "global_step": 188186, "epoch": 4480} {"train_loss": -7.120121955871582, "global_step": 188187, "epoch": 4480} {"train_loss": -7.251102924346924, "global_step": 188188, "epoch": 4480} {"train_loss": -6.955207824707031, "global_step": 188189, "epoch": 4480} {"train_loss": -7.088555335998535, "global_step": 188190, "epoch": 4480} {"train_loss": -7.198844909667969, "global_step": 188191, "epoch": 4480} {"train_loss": -6.971199989318848, "global_step": 188192, "epoch": 4480} {"train_loss": -7.105957508087158, "global_step": 188193, "epoch": 4480} {"train_loss": -7.079864025115967, "global_step": 188194, "epoch": 4480} {"train_loss": -7.092964172363281, "global_step": 188195, "epoch": 4480} {"train_loss": -7.126346588134766, "global_step": 188196, "epoch": 4480} {"train_loss": -7.113147735595703, "global_step": 188197, "epoch": 4480} {"train_loss": -7.178471565246582, "global_step": 188198, "epoch": 4480} {"train_loss": -6.985454559326172, "global_step": 188199, "epoch": 4480} {"train_loss": -7.179684638977051, "global_step": 188200, "epoch": 4480} {"train_loss": -7.16577749025254, "global_step": 188201, "epoch": 4480, "val_loss": 80823.6953125} {"train_loss": -7.172009468078613, "global_step": 188202, "epoch": 4481} {"train_loss": -7.060358047485352, "global_step": 188203, "epoch": 4481} {"train_loss": -7.160679817199707, "global_step": 188204, "epoch": 4481} {"train_loss": -7.07048225402832, "global_step": 188205, "epoch": 4481} {"train_loss": -7.059643745422363, "global_step": 188206, "epoch": 4481} {"train_loss": -7.19981050491333, "global_step": 188207, "epoch": 4481} {"train_loss": -7.1724419593811035, "global_step": 188208, "epoch": 4481} {"train_loss": -7.033802509307861, "global_step": 188209, "epoch": 4481} {"train_loss": -7.171464443206787, "global_step": 188210, "epoch": 4481} {"train_loss": -7.121029853820801, "global_step": 188211, "epoch": 4481} {"train_loss": -7.084177017211914, "global_step": 188212, "epoch": 4481} {"train_loss": -7.167285919189453, "global_step": 188213, "epoch": 4481} {"train_loss": -7.034743785858154, "global_step": 188214, "epoch": 4481} {"train_loss": -7.210021018981934, "global_step": 188215, "epoch": 4481} {"train_loss": -7.146955490112305, "global_step": 188216, "epoch": 4481} {"train_loss": -7.184720039367676, "global_step": 188217, "epoch": 4481} {"train_loss": -7.185686111450195, "global_step": 188218, "epoch": 4481} {"train_loss": -7.18610954284668, "global_step": 188219, "epoch": 4481} {"train_loss": -7.1379218101501465, "global_step": 188220, "epoch": 4481} {"train_loss": -7.254794120788574, "global_step": 188221, "epoch": 4481} {"train_loss": -7.294294834136963, "global_step": 188222, "epoch": 4481} {"train_loss": -7.194924354553223, "global_step": 188223, "epoch": 4481} {"train_loss": -7.232731819152832, "global_step": 188224, "epoch": 4481} {"train_loss": -7.165205001831055, "global_step": 188225, "epoch": 4481} {"train_loss": -7.317839622497559, "global_step": 188226, "epoch": 4481} {"train_loss": -7.225232124328613, "global_step": 188227, "epoch": 4481} {"train_loss": -7.203121185302734, "global_step": 188228, "epoch": 4481} {"train_loss": -7.277912139892578, "global_step": 188229, "epoch": 4481} {"train_loss": -7.174996852874756, "global_step": 188230, "epoch": 4481} {"train_loss": -7.202107906341553, "global_step": 188231, "epoch": 4481} {"train_loss": -7.208847999572754, "global_step": 188232, "epoch": 4481} {"train_loss": -7.377343654632568, "global_step": 188233, "epoch": 4481} {"train_loss": -7.251126289367676, "global_step": 188234, "epoch": 4481} {"train_loss": -7.255002021789551, "global_step": 188235, "epoch": 4481} {"train_loss": -7.2051472663879395, "global_step": 188236, "epoch": 4481} {"train_loss": -7.292934417724609, "global_step": 188237, "epoch": 4481} {"train_loss": -7.236015319824219, "global_step": 188238, "epoch": 4481} {"train_loss": -7.30657958984375, "global_step": 188239, "epoch": 4481} {"train_loss": -7.180701732635498, "global_step": 188240, "epoch": 4481} {"train_loss": -7.256255149841309, "global_step": 188241, "epoch": 4481} {"train_loss": -7.250062465667725, "global_step": 188242, "epoch": 4481} {"train_loss": -7.1953738530476885, "global_step": 188243, "epoch": 4481, "val_loss": 80759.125} {"train_loss": -7.240442276000977, "global_step": 188244, "epoch": 4482} {"train_loss": -7.270645618438721, "global_step": 188245, "epoch": 4482} {"train_loss": -7.2159600257873535, "global_step": 188246, "epoch": 4482} {"train_loss": -7.326659202575684, "global_step": 188247, "epoch": 4482} {"train_loss": -7.248196601867676, "global_step": 188248, "epoch": 4482} {"train_loss": -7.206694602966309, "global_step": 188249, "epoch": 4482} {"train_loss": -7.241943359375, "global_step": 188250, "epoch": 4482} {"train_loss": -7.203672409057617, "global_step": 188251, "epoch": 4482} {"train_loss": -7.235396385192871, "global_step": 188252, "epoch": 4482} {"train_loss": -7.2579665184021, "global_step": 188253, "epoch": 4482} {"train_loss": -7.149113178253174, "global_step": 188254, "epoch": 4482} {"train_loss": -7.253868103027344, "global_step": 188255, "epoch": 4482} {"train_loss": -7.320614814758301, "global_step": 188256, "epoch": 4482} {"train_loss": -7.286861419677734, "global_step": 188257, "epoch": 4482} {"train_loss": -7.096487045288086, "global_step": 188258, "epoch": 4482} {"train_loss": -7.158397674560547, "global_step": 188259, "epoch": 4482} {"train_loss": -7.151724815368652, "global_step": 188260, "epoch": 4482} {"train_loss": -7.160231590270996, "global_step": 188261, "epoch": 4482} {"train_loss": -7.241884231567383, "global_step": 188262, "epoch": 4482} {"train_loss": -7.365260124206543, "global_step": 188263, "epoch": 4482} {"train_loss": -7.219693183898926, "global_step": 188264, "epoch": 4482} {"train_loss": -7.220060348510742, "global_step": 188265, "epoch": 4482} {"train_loss": -7.296833038330078, "global_step": 188266, "epoch": 4482} {"train_loss": -7.257783889770508, "global_step": 188267, "epoch": 4482} {"train_loss": -7.243295192718506, "global_step": 188268, "epoch": 4482} {"train_loss": -7.207546234130859, "global_step": 188269, "epoch": 4482} {"train_loss": -7.231897354125977, "global_step": 188270, "epoch": 4482} {"train_loss": -7.247903823852539, "global_step": 188271, "epoch": 4482} {"train_loss": -7.196030616760254, "global_step": 188272, "epoch": 4482} {"train_loss": -7.254151344299316, "global_step": 188273, "epoch": 4482} {"train_loss": -7.253445625305176, "global_step": 188274, "epoch": 4482} {"train_loss": -7.315465927124023, "global_step": 188275, "epoch": 4482} {"train_loss": -7.252973556518555, "global_step": 188276, "epoch": 4482} {"train_loss": -7.228365898132324, "global_step": 188277, "epoch": 4482} {"train_loss": -7.183382034301758, "global_step": 188278, "epoch": 4482} {"train_loss": -7.237082481384277, "global_step": 188279, "epoch": 4482} {"train_loss": -7.2709856033325195, "global_step": 188280, "epoch": 4482} {"train_loss": -7.210538864135742, "global_step": 188281, "epoch": 4482} {"train_loss": -7.295830726623535, "global_step": 188282, "epoch": 4482} {"train_loss": -7.2872209548950195, "global_step": 188283, "epoch": 4482} {"train_loss": -7.161773681640625, "global_step": 188284, "epoch": 4482} {"train_loss": -7.235799766722179, "global_step": 188285, "epoch": 4482, "val_loss": 80996.921875} {"train_loss": -7.165478706359863, "global_step": 188286, "epoch": 4483} {"train_loss": -7.283233165740967, "global_step": 188287, "epoch": 4483} {"train_loss": -7.254408836364746, "global_step": 188288, "epoch": 4483} {"train_loss": -7.215749263763428, "global_step": 188289, "epoch": 4483} {"train_loss": -7.227825164794922, "global_step": 188290, "epoch": 4483} {"train_loss": -7.234875679016113, "global_step": 188291, "epoch": 4483} {"train_loss": -7.192886829376221, "global_step": 188292, "epoch": 4483} {"train_loss": -7.133266925811768, "global_step": 188293, "epoch": 4483} {"train_loss": -7.289795875549316, "global_step": 188294, "epoch": 4483} {"train_loss": -7.2518768310546875, "global_step": 188295, "epoch": 4483} {"train_loss": -7.18696928024292, "global_step": 188296, "epoch": 4483} {"train_loss": -7.257918834686279, "global_step": 188297, "epoch": 4483} {"train_loss": -7.27717399597168, "global_step": 188298, "epoch": 4483} {"train_loss": -7.324065685272217, "global_step": 188299, "epoch": 4483} {"train_loss": -7.295282363891602, "global_step": 188300, "epoch": 4483} {"train_loss": -7.22613525390625, "global_step": 188301, "epoch": 4483} {"train_loss": -7.332870960235596, "global_step": 188302, "epoch": 4483} {"train_loss": -7.213841438293457, "global_step": 188303, "epoch": 4483} {"train_loss": -7.229885578155518, "global_step": 188304, "epoch": 4483} {"train_loss": -7.231785774230957, "global_step": 188305, "epoch": 4483} {"train_loss": -7.2494916915893555, "global_step": 188306, "epoch": 4483} {"train_loss": -7.1955461502075195, "global_step": 188307, "epoch": 4483} {"train_loss": -7.208251953125, "global_step": 188308, "epoch": 4483} {"train_loss": -7.029423236846924, "global_step": 188309, "epoch": 4483} {"train_loss": -7.136645317077637, "global_step": 188310, "epoch": 4483} {"train_loss": -7.1523284912109375, "global_step": 188311, "epoch": 4483} {"train_loss": -7.073488235473633, "global_step": 188312, "epoch": 4483} {"train_loss": -6.931687831878662, "global_step": 188313, "epoch": 4483} {"train_loss": -7.0426788330078125, "global_step": 188314, "epoch": 4483} {"train_loss": -6.890312194824219, "global_step": 188315, "epoch": 4483} {"train_loss": -6.877720832824707, "global_step": 188316, "epoch": 4483} {"train_loss": -6.994142532348633, "global_step": 188317, "epoch": 4483} {"train_loss": -6.729157447814941, "global_step": 188318, "epoch": 4483} {"train_loss": -6.892154693603516, "global_step": 188319, "epoch": 4483} {"train_loss": -6.957688331604004, "global_step": 188320, "epoch": 4483} {"train_loss": -6.847703456878662, "global_step": 188321, "epoch": 4483} {"train_loss": -7.029636383056641, "global_step": 188322, "epoch": 4483} {"train_loss": -6.866988182067871, "global_step": 188323, "epoch": 4483} {"train_loss": -6.908134937286377, "global_step": 188324, "epoch": 4483} {"train_loss": -7.078198432922363, "global_step": 188325, "epoch": 4483} {"train_loss": -6.909090995788574, "global_step": 188326, "epoch": 4483} {"train_loss": -7.111335561389015, "global_step": 188327, "epoch": 4483, "val_loss": 81209.8046875} {"train_loss": -7.055761337280273, "global_step": 188328, "epoch": 4484} {"train_loss": -6.972812652587891, "global_step": 188329, "epoch": 4484} {"train_loss": -6.854593276977539, "global_step": 188330, "epoch": 4484} {"train_loss": -6.942165851593018, "global_step": 188331, "epoch": 4484} {"train_loss": -7.046148300170898, "global_step": 188332, "epoch": 4484} {"train_loss": -6.92589807510376, "global_step": 188333, "epoch": 4484} {"train_loss": -7.016452789306641, "global_step": 188334, "epoch": 4484} {"train_loss": -7.028782844543457, "global_step": 188335, "epoch": 4484} {"train_loss": -6.971209526062012, "global_step": 188336, "epoch": 4484} {"train_loss": -7.059648513793945, "global_step": 188337, "epoch": 4484} {"train_loss": -7.076441764831543, "global_step": 188338, "epoch": 4484} {"train_loss": -7.064239978790283, "global_step": 188339, "epoch": 4484} {"train_loss": -7.110212326049805, "global_step": 188340, "epoch": 4484} {"train_loss": -7.1232123374938965, "global_step": 188341, "epoch": 4484} {"train_loss": -7.046465873718262, "global_step": 188342, "epoch": 4484} {"train_loss": -7.073880195617676, "global_step": 188343, "epoch": 4484} {"train_loss": -7.192634105682373, "global_step": 188344, "epoch": 4484} {"train_loss": -7.06768274307251, "global_step": 188345, "epoch": 4484} {"train_loss": -7.248475551605225, "global_step": 188346, "epoch": 4484} {"train_loss": -7.1115336418151855, "global_step": 188347, "epoch": 4484} {"train_loss": -7.236478328704834, "global_step": 188348, "epoch": 4484} {"train_loss": -7.154938697814941, "global_step": 188349, "epoch": 4484} {"train_loss": -7.186562538146973, "global_step": 188350, "epoch": 4484} {"train_loss": -7.092486381530762, "global_step": 188351, "epoch": 4484} {"train_loss": -7.204137802124023, "global_step": 188352, "epoch": 4484} {"train_loss": -7.353156089782715, "global_step": 188353, "epoch": 4484} {"train_loss": -7.1287431716918945, "global_step": 188354, "epoch": 4484} {"train_loss": -7.239765167236328, "global_step": 188355, "epoch": 4484} {"train_loss": -7.242966651916504, "global_step": 188356, "epoch": 4484} {"train_loss": -7.206404685974121, "global_step": 188357, "epoch": 4484} {"train_loss": -7.128749847412109, "global_step": 188358, "epoch": 4484} {"train_loss": -7.384849548339844, "global_step": 188359, "epoch": 4484} {"train_loss": -7.3733367919921875, "global_step": 188360, "epoch": 4484} {"train_loss": -7.264359474182129, "global_step": 188361, "epoch": 4484} {"train_loss": -7.111607551574707, "global_step": 188362, "epoch": 4484} {"train_loss": -7.257610321044922, "global_step": 188363, "epoch": 4484} {"train_loss": -7.275512218475342, "global_step": 188364, "epoch": 4484} {"train_loss": -7.109503746032715, "global_step": 188365, "epoch": 4484} {"train_loss": -7.320146560668945, "global_step": 188366, "epoch": 4484} {"train_loss": -7.267266750335693, "global_step": 188367, "epoch": 4484} {"train_loss": -7.184363842010498, "global_step": 188368, "epoch": 4484} {"train_loss": -7.14424272945949, "global_step": 188369, "epoch": 4484, "val_loss": 80909.1640625} {"train_loss": -7.266786575317383, "global_step": 188370, "epoch": 4485} {"train_loss": -7.193739891052246, "global_step": 188371, "epoch": 4485} {"train_loss": -7.19755744934082, "global_step": 188372, "epoch": 4485} {"train_loss": -7.2290496826171875, "global_step": 188373, "epoch": 4485} {"train_loss": -7.14503288269043, "global_step": 188374, "epoch": 4485} {"train_loss": -7.175396919250488, "global_step": 188375, "epoch": 4485} {"train_loss": -7.30880880355835, "global_step": 188376, "epoch": 4485} {"train_loss": -7.145600318908691, "global_step": 188377, "epoch": 4485} {"train_loss": -7.243833541870117, "global_step": 188378, "epoch": 4485} {"train_loss": -7.392608165740967, "global_step": 188379, "epoch": 4485} {"train_loss": -7.141534805297852, "global_step": 188380, "epoch": 4485} {"train_loss": -7.138439655303955, "global_step": 188381, "epoch": 4485} {"train_loss": -7.223923206329346, "global_step": 188382, "epoch": 4485} {"train_loss": -7.078230857849121, "global_step": 188383, "epoch": 4485} {"train_loss": -7.15360689163208, "global_step": 188384, "epoch": 4485} {"train_loss": -7.105623245239258, "global_step": 188385, "epoch": 4485} {"train_loss": -7.140181064605713, "global_step": 188386, "epoch": 4485} {"train_loss": -7.098360061645508, "global_step": 188387, "epoch": 4485} {"train_loss": -7.10493803024292, "global_step": 188388, "epoch": 4485} {"train_loss": -7.0613298416137695, "global_step": 188389, "epoch": 4485} {"train_loss": -7.226840972900391, "global_step": 188390, "epoch": 4485} {"train_loss": -7.092909812927246, "global_step": 188391, "epoch": 4485} {"train_loss": -7.13783597946167, "global_step": 188392, "epoch": 4485} {"train_loss": -7.198662757873535, "global_step": 188393, "epoch": 4485} {"train_loss": -7.227484703063965, "global_step": 188394, "epoch": 4485} {"train_loss": -7.183226108551025, "global_step": 188395, "epoch": 4485} {"train_loss": -7.228206634521484, "global_step": 188396, "epoch": 4485} {"train_loss": -7.2278151512146, "global_step": 188397, "epoch": 4485} {"train_loss": -7.23383903503418, "global_step": 188398, "epoch": 4485} {"train_loss": -7.184932708740234, "global_step": 188399, "epoch": 4485} {"train_loss": -7.171150207519531, "global_step": 188400, "epoch": 4485} {"train_loss": -7.153260707855225, "global_step": 188401, "epoch": 4485} {"train_loss": -7.24407958984375, "global_step": 188402, "epoch": 4485} {"train_loss": -7.390697479248047, "global_step": 188403, "epoch": 4485} {"train_loss": -7.1717119216918945, "global_step": 188404, "epoch": 4485} {"train_loss": -7.095048904418945, "global_step": 188405, "epoch": 4485} {"train_loss": -7.187715530395508, "global_step": 188406, "epoch": 4485} {"train_loss": -7.20737361907959, "global_step": 188407, "epoch": 4485} {"train_loss": -7.138365745544434, "global_step": 188408, "epoch": 4485} {"train_loss": -7.274566650390625, "global_step": 188409, "epoch": 4485} {"train_loss": -7.100605010986328, "global_step": 188410, "epoch": 4485} {"train_loss": -7.1853740101768855, "global_step": 188411, "epoch": 4485, "val_loss": 80872.390625} {"train_loss": -7.282146453857422, "global_step": 188412, "epoch": 4486} {"train_loss": -7.220203399658203, "global_step": 188413, "epoch": 4486} {"train_loss": -7.134164810180664, "global_step": 188414, "epoch": 4486} {"train_loss": -7.210777282714844, "global_step": 188415, "epoch": 4486} {"train_loss": -7.2584733963012695, "global_step": 188416, "epoch": 4486} {"train_loss": -7.22266960144043, "global_step": 188417, "epoch": 4486} {"train_loss": -7.2462615966796875, "global_step": 188418, "epoch": 4486} {"train_loss": -7.246159553527832, "global_step": 188419, "epoch": 4486} {"train_loss": -7.195377349853516, "global_step": 188420, "epoch": 4486} {"train_loss": -7.185988426208496, "global_step": 188421, "epoch": 4486} {"train_loss": -7.153068542480469, "global_step": 188422, "epoch": 4486} {"train_loss": -7.279321670532227, "global_step": 188423, "epoch": 4486} {"train_loss": -7.342688083648682, "global_step": 188424, "epoch": 4486} {"train_loss": -7.218018531799316, "global_step": 188425, "epoch": 4486} {"train_loss": -7.356131553649902, "global_step": 188426, "epoch": 4486} {"train_loss": -7.1487884521484375, "global_step": 188427, "epoch": 4486} {"train_loss": -7.172080993652344, "global_step": 188428, "epoch": 4486} {"train_loss": -7.239386558532715, "global_step": 188429, "epoch": 4486} {"train_loss": -7.249890327453613, "global_step": 188430, "epoch": 4486} {"train_loss": -7.2118072509765625, "global_step": 188431, "epoch": 4486} {"train_loss": -7.295792579650879, "global_step": 188432, "epoch": 4486} {"train_loss": -7.295656204223633, "global_step": 188433, "epoch": 4486} {"train_loss": -7.2400617599487305, "global_step": 188434, "epoch": 4486} {"train_loss": -7.2048187255859375, "global_step": 188435, "epoch": 4486} {"train_loss": -7.169395446777344, "global_step": 188436, "epoch": 4486} {"train_loss": -7.186858177185059, "global_step": 188437, "epoch": 4486} {"train_loss": -7.224740505218506, "global_step": 188438, "epoch": 4486} {"train_loss": -7.2957539558410645, "global_step": 188439, "epoch": 4486} {"train_loss": -7.165367126464844, "global_step": 188440, "epoch": 4486} {"train_loss": -7.261950492858887, "global_step": 188441, "epoch": 4486} {"train_loss": -7.243278980255127, "global_step": 188442, "epoch": 4486} {"train_loss": -7.296704292297363, "global_step": 188443, "epoch": 4486} {"train_loss": -7.238037109375, "global_step": 188444, "epoch": 4486} {"train_loss": -7.197127342224121, "global_step": 188445, "epoch": 4486} {"train_loss": -7.256311416625977, "global_step": 188446, "epoch": 4486} {"train_loss": -7.086889266967773, "global_step": 188447, "epoch": 4486} {"train_loss": -7.286215305328369, "global_step": 188448, "epoch": 4486} {"train_loss": -7.289396286010742, "global_step": 188449, "epoch": 4486} {"train_loss": -7.179694652557373, "global_step": 188450, "epoch": 4486} {"train_loss": -7.227591514587402, "global_step": 188451, "epoch": 4486} {"train_loss": -7.243676662445068, "global_step": 188452, "epoch": 4486} {"train_loss": -7.232703265689668, "global_step": 188453, "epoch": 4486, "val_loss": 80764.40625} {"train_loss": -7.30238151550293, "global_step": 188454, "epoch": 4487} {"train_loss": -7.285625457763672, "global_step": 188455, "epoch": 4487} {"train_loss": -7.285070419311523, "global_step": 188456, "epoch": 4487} {"train_loss": -7.269822120666504, "global_step": 188457, "epoch": 4487} {"train_loss": -7.229615688323975, "global_step": 188458, "epoch": 4487} {"train_loss": -7.246513366699219, "global_step": 188459, "epoch": 4487} {"train_loss": -7.1886887550354, "global_step": 188460, "epoch": 4487} {"train_loss": -7.3935370445251465, "global_step": 188461, "epoch": 4487} {"train_loss": -7.168917179107666, "global_step": 188462, "epoch": 4487} {"train_loss": -7.286056995391846, "global_step": 188463, "epoch": 4487} {"train_loss": -7.128478527069092, "global_step": 188464, "epoch": 4487} {"train_loss": -7.13505744934082, "global_step": 188465, "epoch": 4487} {"train_loss": -7.268795967102051, "global_step": 188466, "epoch": 4487} {"train_loss": -7.122025489807129, "global_step": 188467, "epoch": 4487} {"train_loss": -7.322755813598633, "global_step": 188468, "epoch": 4487} {"train_loss": -7.241018772125244, "global_step": 188469, "epoch": 4487} {"train_loss": -7.189937591552734, "global_step": 188470, "epoch": 4487} {"train_loss": -7.236081600189209, "global_step": 188471, "epoch": 4487} {"train_loss": -7.254918098449707, "global_step": 188472, "epoch": 4487} {"train_loss": -7.126705169677734, "global_step": 188473, "epoch": 4487} {"train_loss": -7.099394798278809, "global_step": 188474, "epoch": 4487} {"train_loss": -7.097803592681885, "global_step": 188475, "epoch": 4487} {"train_loss": -7.176910400390625, "global_step": 188476, "epoch": 4487} {"train_loss": -7.202375411987305, "global_step": 188477, "epoch": 4487} {"train_loss": -7.068607807159424, "global_step": 188478, "epoch": 4487} {"train_loss": -7.128114700317383, "global_step": 188479, "epoch": 4487} {"train_loss": -7.166099548339844, "global_step": 188480, "epoch": 4487} {"train_loss": -7.1403961181640625, "global_step": 188481, "epoch": 4487} {"train_loss": -7.109770774841309, "global_step": 188482, "epoch": 4487} {"train_loss": -7.0246171951293945, "global_step": 188483, "epoch": 4487} {"train_loss": -7.19419002532959, "global_step": 188484, "epoch": 4487} {"train_loss": -7.199300765991211, "global_step": 188485, "epoch": 4487} {"train_loss": -7.131241321563721, "global_step": 188486, "epoch": 4487} {"train_loss": -7.226388454437256, "global_step": 188487, "epoch": 4487} {"train_loss": -7.27671480178833, "global_step": 188488, "epoch": 4487} {"train_loss": -7.244232177734375, "global_step": 188489, "epoch": 4487} {"train_loss": -7.152674674987793, "global_step": 188490, "epoch": 4487} {"train_loss": -7.003155708312988, "global_step": 188491, "epoch": 4487} {"train_loss": -7.250577449798584, "global_step": 188492, "epoch": 4487} {"train_loss": -7.115677356719971, "global_step": 188493, "epoch": 4487} {"train_loss": -6.978662490844727, "global_step": 188494, "epoch": 4487} {"train_loss": -7.187471037819272, "global_step": 188495, "epoch": 4487, "val_loss": 81161.3671875} {"train_loss": -7.0511474609375, "global_step": 188496, "epoch": 4488} {"train_loss": -7.24638032913208, "global_step": 188497, "epoch": 4488} {"train_loss": -7.084060192108154, "global_step": 188498, "epoch": 4488} {"train_loss": -7.11703634262085, "global_step": 188499, "epoch": 4488} {"train_loss": -7.128035068511963, "global_step": 188500, "epoch": 4488} {"train_loss": -7.160545349121094, "global_step": 188501, "epoch": 4488} {"train_loss": -7.114635944366455, "global_step": 188502, "epoch": 4488} {"train_loss": -7.196527481079102, "global_step": 188503, "epoch": 4488} {"train_loss": -7.174072742462158, "global_step": 188504, "epoch": 4488} {"train_loss": -7.214247703552246, "global_step": 188505, "epoch": 4488} {"train_loss": -7.4069600105285645, "global_step": 188506, "epoch": 4488} {"train_loss": -7.240863800048828, "global_step": 188507, "epoch": 4488} {"train_loss": -7.233354568481445, "global_step": 188508, "epoch": 4488} {"train_loss": -7.185989856719971, "global_step": 188509, "epoch": 4488} {"train_loss": -7.2207722663879395, "global_step": 188510, "epoch": 4488} {"train_loss": -7.189352989196777, "global_step": 188511, "epoch": 4488} {"train_loss": -7.19942045211792, "global_step": 188512, "epoch": 4488} {"train_loss": -7.283663749694824, "global_step": 188513, "epoch": 4488} {"train_loss": -7.193694591522217, "global_step": 188514, "epoch": 4488} {"train_loss": -7.33912992477417, "global_step": 188515, "epoch": 4488} {"train_loss": -7.241338729858398, "global_step": 188516, "epoch": 4488} {"train_loss": -7.184739589691162, "global_step": 188517, "epoch": 4488} {"train_loss": -7.250618934631348, "global_step": 188518, "epoch": 4488} {"train_loss": -7.211405277252197, "global_step": 188519, "epoch": 4488} {"train_loss": -6.988768577575684, "global_step": 188520, "epoch": 4488} {"train_loss": -7.187849998474121, "global_step": 188521, "epoch": 4488} {"train_loss": -7.120194435119629, "global_step": 188522, "epoch": 4488} {"train_loss": -7.115383148193359, "global_step": 188523, "epoch": 4488} {"train_loss": -7.333855628967285, "global_step": 188524, "epoch": 4488} {"train_loss": -7.164929389953613, "global_step": 188525, "epoch": 4488} {"train_loss": -7.22089958190918, "global_step": 188526, "epoch": 4488} {"train_loss": -7.159487724304199, "global_step": 188527, "epoch": 4488} {"train_loss": -7.248716354370117, "global_step": 188528, "epoch": 4488} {"train_loss": -7.250876426696777, "global_step": 188529, "epoch": 4488} {"train_loss": -7.181111812591553, "global_step": 188530, "epoch": 4488} {"train_loss": -7.204153060913086, "global_step": 188531, "epoch": 4488} {"train_loss": -7.260191917419434, "global_step": 188532, "epoch": 4488} {"train_loss": -7.110943794250488, "global_step": 188533, "epoch": 4488} {"train_loss": -7.248867034912109, "global_step": 188534, "epoch": 4488} {"train_loss": -7.067148208618164, "global_step": 188535, "epoch": 4488} {"train_loss": -7.108841419219971, "global_step": 188536, "epoch": 4488} {"train_loss": -7.1926295303163075, "global_step": 188537, "epoch": 4488, "val_loss": 81150.2109375} {"train_loss": -7.096418380737305, "global_step": 188538, "epoch": 4489} {"train_loss": -7.20007848739624, "global_step": 188539, "epoch": 4489} {"train_loss": -7.185385704040527, "global_step": 188540, "epoch": 4489} {"train_loss": -7.101269721984863, "global_step": 188541, "epoch": 4489} {"train_loss": -7.297862529754639, "global_step": 188542, "epoch": 4489} {"train_loss": -7.07427978515625, "global_step": 188543, "epoch": 4489} {"train_loss": -7.114143371582031, "global_step": 188544, "epoch": 4489} {"train_loss": -7.052279949188232, "global_step": 188545, "epoch": 4489} {"train_loss": -7.068653106689453, "global_step": 188546, "epoch": 4489} {"train_loss": -7.2469940185546875, "global_step": 188547, "epoch": 4489} {"train_loss": -7.2084641456604, "global_step": 188548, "epoch": 4489} {"train_loss": -7.0914812088012695, "global_step": 188549, "epoch": 4489} {"train_loss": -7.202077865600586, "global_step": 188550, "epoch": 4489} {"train_loss": -7.085717678070068, "global_step": 188551, "epoch": 4489} {"train_loss": -7.266303539276123, "global_step": 188552, "epoch": 4489} {"train_loss": -7.043926239013672, "global_step": 188553, "epoch": 4489} {"train_loss": -7.201259613037109, "global_step": 188554, "epoch": 4489} {"train_loss": -7.06483793258667, "global_step": 188555, "epoch": 4489} {"train_loss": -7.233147621154785, "global_step": 188556, "epoch": 4489} {"train_loss": -7.212564945220947, "global_step": 188557, "epoch": 4489} {"train_loss": -7.21946382522583, "global_step": 188558, "epoch": 4489} {"train_loss": -7.226462364196777, "global_step": 188559, "epoch": 4489} {"train_loss": -7.202737808227539, "global_step": 188560, "epoch": 4489} {"train_loss": -7.196511268615723, "global_step": 188561, "epoch": 4489} {"train_loss": -7.130543231964111, "global_step": 188562, "epoch": 4489} {"train_loss": -7.240431308746338, "global_step": 188563, "epoch": 4489} {"train_loss": -7.1949849128723145, "global_step": 188564, "epoch": 4489} {"train_loss": -7.225613594055176, "global_step": 188565, "epoch": 4489} {"train_loss": -7.268904685974121, "global_step": 188566, "epoch": 4489} {"train_loss": -7.239569187164307, "global_step": 188567, "epoch": 4489} {"train_loss": -7.185556888580322, "global_step": 188568, "epoch": 4489} {"train_loss": -7.258187770843506, "global_step": 188569, "epoch": 4489} {"train_loss": -7.218429088592529, "global_step": 188570, "epoch": 4489} {"train_loss": -7.156473159790039, "global_step": 188571, "epoch": 4489} {"train_loss": -7.280342102050781, "global_step": 188572, "epoch": 4489} {"train_loss": -7.148117542266846, "global_step": 188573, "epoch": 4489} {"train_loss": -7.156075954437256, "global_step": 188574, "epoch": 4489} {"train_loss": -7.0972723960876465, "global_step": 188575, "epoch": 4489} {"train_loss": -7.16893196105957, "global_step": 188576, "epoch": 4489} {"train_loss": -7.137894630432129, "global_step": 188577, "epoch": 4489} {"train_loss": -7.129143714904785, "global_step": 188578, "epoch": 4489} {"train_loss": -7.172153597786313, "global_step": 188579, "epoch": 4489, "val_loss": 80902.4375} {"train_loss": -7.122994422912598, "global_step": 188580, "epoch": 4490} {"train_loss": -7.111813545227051, "global_step": 188581, "epoch": 4490} {"train_loss": -7.168994903564453, "global_step": 188582, "epoch": 4490} {"train_loss": -7.022660255432129, "global_step": 188583, "epoch": 4490} {"train_loss": -7.233198165893555, "global_step": 188584, "epoch": 4490} {"train_loss": -7.252052307128906, "global_step": 188585, "epoch": 4490} {"train_loss": -7.124259948730469, "global_step": 188586, "epoch": 4490} {"train_loss": -7.226332664489746, "global_step": 188587, "epoch": 4490} {"train_loss": -7.064631462097168, "global_step": 188588, "epoch": 4490} {"train_loss": -7.0930495262146, "global_step": 188589, "epoch": 4490} {"train_loss": -7.218135833740234, "global_step": 188590, "epoch": 4490} {"train_loss": -7.076709270477295, "global_step": 188591, "epoch": 4490} {"train_loss": -7.05421257019043, "global_step": 188592, "epoch": 4490} {"train_loss": -7.045422077178955, "global_step": 188593, "epoch": 4490} {"train_loss": -7.22119140625, "global_step": 188594, "epoch": 4490} {"train_loss": -7.023060321807861, "global_step": 188595, "epoch": 4490} {"train_loss": -7.228372097015381, "global_step": 188596, "epoch": 4490} {"train_loss": -6.948653221130371, "global_step": 188597, "epoch": 4490} {"train_loss": -7.119040012359619, "global_step": 188598, "epoch": 4490} {"train_loss": -6.963054656982422, "global_step": 188599, "epoch": 4490} {"train_loss": -7.118463516235352, "global_step": 188600, "epoch": 4490} {"train_loss": -7.168806076049805, "global_step": 188601, "epoch": 4490} {"train_loss": -7.100573539733887, "global_step": 188602, "epoch": 4490} {"train_loss": -7.050615310668945, "global_step": 188603, "epoch": 4490} {"train_loss": -7.047720909118652, "global_step": 188604, "epoch": 4490} {"train_loss": -7.177765846252441, "global_step": 188605, "epoch": 4490} {"train_loss": -7.1108717918396, "global_step": 188606, "epoch": 4490} {"train_loss": -7.215055465698242, "global_step": 188607, "epoch": 4490} {"train_loss": -7.017674446105957, "global_step": 188608, "epoch": 4490} {"train_loss": -7.147971153259277, "global_step": 188609, "epoch": 4490} {"train_loss": -7.1170806884765625, "global_step": 188610, "epoch": 4490} {"train_loss": -7.129067897796631, "global_step": 188611, "epoch": 4490} {"train_loss": -7.225517272949219, "global_step": 188612, "epoch": 4490} {"train_loss": -7.123065948486328, "global_step": 188613, "epoch": 4490} {"train_loss": -7.224057197570801, "global_step": 188614, "epoch": 4490} {"train_loss": -7.154171943664551, "global_step": 188615, "epoch": 4490} {"train_loss": -7.142108917236328, "global_step": 188616, "epoch": 4490} {"train_loss": -7.210132598876953, "global_step": 188617, "epoch": 4490} {"train_loss": -7.328596591949463, "global_step": 188618, "epoch": 4490} {"train_loss": -7.14854097366333, "global_step": 188619, "epoch": 4490} {"train_loss": -7.223692893981934, "global_step": 188620, "epoch": 4490} {"train_loss": -7.136076018923805, "global_step": 188621, "epoch": 4490, "val_loss": 81002.8515625} {"train_loss": -7.239224910736084, "global_step": 188622, "epoch": 4491} {"train_loss": -7.202415466308594, "global_step": 188623, "epoch": 4491} {"train_loss": -7.23548698425293, "global_step": 188624, "epoch": 4491} {"train_loss": -7.32414436340332, "global_step": 188625, "epoch": 4491} {"train_loss": -7.215065002441406, "global_step": 188626, "epoch": 4491} {"train_loss": -7.149452209472656, "global_step": 188627, "epoch": 4491} {"train_loss": -7.292612552642822, "global_step": 188628, "epoch": 4491} {"train_loss": -7.337965965270996, "global_step": 188629, "epoch": 4491} {"train_loss": -7.141375541687012, "global_step": 188630, "epoch": 4491} {"train_loss": -7.229238510131836, "global_step": 188631, "epoch": 4491} {"train_loss": -7.280104637145996, "global_step": 188632, "epoch": 4491} {"train_loss": -7.457126617431641, "global_step": 188633, "epoch": 4491} {"train_loss": -7.27375602722168, "global_step": 188634, "epoch": 4491} {"train_loss": -7.266628742218018, "global_step": 188635, "epoch": 4491} {"train_loss": -7.295313358306885, "global_step": 188636, "epoch": 4491} {"train_loss": -7.23101282119751, "global_step": 188637, "epoch": 4491} {"train_loss": -7.335577964782715, "global_step": 188638, "epoch": 4491} {"train_loss": -7.099633693695068, "global_step": 188639, "epoch": 4491} {"train_loss": -7.388815879821777, "global_step": 188640, "epoch": 4491} {"train_loss": -7.273970127105713, "global_step": 188641, "epoch": 4491} {"train_loss": -7.183901786804199, "global_step": 188642, "epoch": 4491} {"train_loss": -7.113211631774902, "global_step": 188643, "epoch": 4491} {"train_loss": -7.243584156036377, "global_step": 188644, "epoch": 4491} {"train_loss": -7.269872188568115, "global_step": 188645, "epoch": 4491} {"train_loss": -7.165136337280273, "global_step": 188646, "epoch": 4491} {"train_loss": -7.204490661621094, "global_step": 188647, "epoch": 4491} {"train_loss": -7.200389862060547, "global_step": 188648, "epoch": 4491} {"train_loss": -7.197416305541992, "global_step": 188649, "epoch": 4491} {"train_loss": -7.255592346191406, "global_step": 188650, "epoch": 4491} {"train_loss": -7.217907428741455, "global_step": 188651, "epoch": 4491} {"train_loss": -7.2509660720825195, "global_step": 188652, "epoch": 4491} {"train_loss": -7.248917579650879, "global_step": 188653, "epoch": 4491} {"train_loss": -7.175110816955566, "global_step": 188654, "epoch": 4491} {"train_loss": -7.286487579345703, "global_step": 188655, "epoch": 4491} {"train_loss": -7.271896839141846, "global_step": 188656, "epoch": 4491} {"train_loss": -7.1512651443481445, "global_step": 188657, "epoch": 4491} {"train_loss": -7.285836219787598, "global_step": 188658, "epoch": 4491} {"train_loss": -7.181454658508301, "global_step": 188659, "epoch": 4491} {"train_loss": -7.256983757019043, "global_step": 188660, "epoch": 4491} {"train_loss": -7.335847854614258, "global_step": 188661, "epoch": 4491} {"train_loss": -7.3041229248046875, "global_step": 188662, "epoch": 4491} {"train_loss": -7.242767549696422, "global_step": 188663, "epoch": 4491, "val_loss": 80807.4375} {"train_loss": -7.306910991668701, "global_step": 188664, "epoch": 4492} {"train_loss": -7.178981781005859, "global_step": 188665, "epoch": 4492} {"train_loss": -7.2409257888793945, "global_step": 188666, "epoch": 4492} {"train_loss": -7.32014799118042, "global_step": 188667, "epoch": 4492} {"train_loss": -7.19562292098999, "global_step": 188668, "epoch": 4492} {"train_loss": -7.018513202667236, "global_step": 188669, "epoch": 4492} {"train_loss": -7.130152702331543, "global_step": 188670, "epoch": 4492} {"train_loss": -7.061501502990723, "global_step": 188671, "epoch": 4492} {"train_loss": -7.175755500793457, "global_step": 188672, "epoch": 4492} {"train_loss": -7.247875690460205, "global_step": 188673, "epoch": 4492} {"train_loss": -7.098114967346191, "global_step": 188674, "epoch": 4492} {"train_loss": -7.131397247314453, "global_step": 188675, "epoch": 4492} {"train_loss": -7.245551586151123, "global_step": 188676, "epoch": 4492} {"train_loss": -7.155839920043945, "global_step": 188677, "epoch": 4492} {"train_loss": -7.206228256225586, "global_step": 188678, "epoch": 4492} {"train_loss": -7.152578353881836, "global_step": 188679, "epoch": 4492} {"train_loss": -7.225822925567627, "global_step": 188680, "epoch": 4492} {"train_loss": -7.295502662658691, "global_step": 188681, "epoch": 4492} {"train_loss": -7.150460243225098, "global_step": 188682, "epoch": 4492} {"train_loss": -7.162251949310303, "global_step": 188683, "epoch": 4492} {"train_loss": -7.151827335357666, "global_step": 188684, "epoch": 4492} {"train_loss": -7.141057014465332, "global_step": 188685, "epoch": 4492} {"train_loss": -7.158351898193359, "global_step": 188686, "epoch": 4492} {"train_loss": -7.194957733154297, "global_step": 188687, "epoch": 4492} {"train_loss": -7.161778926849365, "global_step": 188688, "epoch": 4492} {"train_loss": -7.188383102416992, "global_step": 188689, "epoch": 4492} {"train_loss": -7.17666482925415, "global_step": 188690, "epoch": 4492} {"train_loss": -7.153535842895508, "global_step": 188691, "epoch": 4492} {"train_loss": -7.292903423309326, "global_step": 188692, "epoch": 4492} {"train_loss": -7.175278663635254, "global_step": 188693, "epoch": 4492} {"train_loss": -7.162310600280762, "global_step": 188694, "epoch": 4492} {"train_loss": -7.174989700317383, "global_step": 188695, "epoch": 4492} {"train_loss": -7.167259216308594, "global_step": 188696, "epoch": 4492} {"train_loss": -7.180534362792969, "global_step": 188697, "epoch": 4492} {"train_loss": -7.228500843048096, "global_step": 188698, "epoch": 4492} {"train_loss": -7.104981422424316, "global_step": 188699, "epoch": 4492} {"train_loss": -7.155916213989258, "global_step": 188700, "epoch": 4492} {"train_loss": -7.196351528167725, "global_step": 188701, "epoch": 4492} {"train_loss": -6.98438024520874, "global_step": 188702, "epoch": 4492} {"train_loss": -7.270442485809326, "global_step": 188703, "epoch": 4492} {"train_loss": -7.247181415557861, "global_step": 188704, "epoch": 4492} {"train_loss": -7.183841410137358, "global_step": 188705, "epoch": 4492, "val_loss": 80930.046875} {"train_loss": -7.216213226318359, "global_step": 188706, "epoch": 4493} {"train_loss": -7.307861328125, "global_step": 188707, "epoch": 4493} {"train_loss": -7.33962345123291, "global_step": 188708, "epoch": 4493} {"train_loss": -7.231990337371826, "global_step": 188709, "epoch": 4493} {"train_loss": -7.115025043487549, "global_step": 188710, "epoch": 4493} {"train_loss": -7.249541282653809, "global_step": 188711, "epoch": 4493} {"train_loss": -7.191420555114746, "global_step": 188712, "epoch": 4493} {"train_loss": -7.2349090576171875, "global_step": 188713, "epoch": 4493} {"train_loss": -7.211092948913574, "global_step": 188714, "epoch": 4493} {"train_loss": -7.233598709106445, "global_step": 188715, "epoch": 4493} {"train_loss": -7.153810977935791, "global_step": 188716, "epoch": 4493} {"train_loss": -7.235600471496582, "global_step": 188717, "epoch": 4493} {"train_loss": -7.213918685913086, "global_step": 188718, "epoch": 4493} {"train_loss": -7.284769058227539, "global_step": 188719, "epoch": 4493} {"train_loss": -7.195913314819336, "global_step": 188720, "epoch": 4493} {"train_loss": -7.269581317901611, "global_step": 188721, "epoch": 4493} {"train_loss": -7.200084686279297, "global_step": 188722, "epoch": 4493} {"train_loss": -7.286245346069336, "global_step": 188723, "epoch": 4493} {"train_loss": -7.1501922607421875, "global_step": 188724, "epoch": 4493} {"train_loss": -7.167763710021973, "global_step": 188725, "epoch": 4493} {"train_loss": -7.261977195739746, "global_step": 188726, "epoch": 4493} {"train_loss": -7.122258186340332, "global_step": 188727, "epoch": 4493} {"train_loss": -7.340636253356934, "global_step": 188728, "epoch": 4493} {"train_loss": -7.297817707061768, "global_step": 188729, "epoch": 4493} {"train_loss": -7.228089332580566, "global_step": 188730, "epoch": 4493} {"train_loss": -7.1454949378967285, "global_step": 188731, "epoch": 4493} {"train_loss": -7.261185169219971, "global_step": 188732, "epoch": 4493} {"train_loss": -7.160228729248047, "global_step": 188733, "epoch": 4493} {"train_loss": -7.082106590270996, "global_step": 188734, "epoch": 4493} {"train_loss": -7.151022911071777, "global_step": 188735, "epoch": 4493} {"train_loss": -7.279496192932129, "global_step": 188736, "epoch": 4493} {"train_loss": -7.2781782150268555, "global_step": 188737, "epoch": 4493} {"train_loss": -7.186178207397461, "global_step": 188738, "epoch": 4493} {"train_loss": -7.16939640045166, "global_step": 188739, "epoch": 4493} {"train_loss": -7.24819278717041, "global_step": 188740, "epoch": 4493} {"train_loss": -7.172050476074219, "global_step": 188741, "epoch": 4493} {"train_loss": -7.140443801879883, "global_step": 188742, "epoch": 4493} {"train_loss": -7.279866695404053, "global_step": 188743, "epoch": 4493} {"train_loss": -7.191204071044922, "global_step": 188744, "epoch": 4493} {"train_loss": -7.211176872253418, "global_step": 188745, "epoch": 4493} {"train_loss": -7.23721170425415, "global_step": 188746, "epoch": 4493} {"train_loss": -7.217554762249901, "global_step": 188747, "epoch": 4493, "val_loss": 81144.7109375} {"train_loss": -7.174420356750488, "global_step": 188748, "epoch": 4494} {"train_loss": -7.2234907150268555, "global_step": 188749, "epoch": 4494} {"train_loss": -7.261615753173828, "global_step": 188750, "epoch": 4494} {"train_loss": -7.306343078613281, "global_step": 188751, "epoch": 4494} {"train_loss": -7.298344135284424, "global_step": 188752, "epoch": 4494} {"train_loss": -7.209441184997559, "global_step": 188753, "epoch": 4494} {"train_loss": -7.369383811950684, "global_step": 188754, "epoch": 4494} {"train_loss": -7.373697280883789, "global_step": 188755, "epoch": 4494} {"train_loss": -7.313734531402588, "global_step": 188756, "epoch": 4494} {"train_loss": -7.3143229484558105, "global_step": 188757, "epoch": 4494} {"train_loss": -7.340489864349365, "global_step": 188758, "epoch": 4494} {"train_loss": -7.358821392059326, "global_step": 188759, "epoch": 4494} {"train_loss": -7.366689682006836, "global_step": 188760, "epoch": 4494} {"train_loss": -7.330418586730957, "global_step": 188761, "epoch": 4494} {"train_loss": -7.35170316696167, "global_step": 188762, "epoch": 4494} {"train_loss": -7.292248725891113, "global_step": 188763, "epoch": 4494} {"train_loss": -7.249730587005615, "global_step": 188764, "epoch": 4494} {"train_loss": -7.28141450881958, "global_step": 188765, "epoch": 4494} {"train_loss": -7.326248645782471, "global_step": 188766, "epoch": 4494} {"train_loss": -7.247988700866699, "global_step": 188767, "epoch": 4494} {"train_loss": -7.291295051574707, "global_step": 188768, "epoch": 4494} {"train_loss": -7.208615303039551, "global_step": 188769, "epoch": 4494} {"train_loss": -7.234706878662109, "global_step": 188770, "epoch": 4494} {"train_loss": -7.186159133911133, "global_step": 188771, "epoch": 4494} {"train_loss": -7.2264204025268555, "global_step": 188772, "epoch": 4494} {"train_loss": -7.2938337326049805, "global_step": 188773, "epoch": 4494} {"train_loss": -7.24107027053833, "global_step": 188774, "epoch": 4494} {"train_loss": -7.2568511962890625, "global_step": 188775, "epoch": 4494} {"train_loss": -7.199458122253418, "global_step": 188776, "epoch": 4494} {"train_loss": -7.24677038192749, "global_step": 188777, "epoch": 4494} {"train_loss": -7.257389068603516, "global_step": 188778, "epoch": 4494} {"train_loss": -7.200603008270264, "global_step": 188779, "epoch": 4494} {"train_loss": -7.2865095138549805, "global_step": 188780, "epoch": 4494} {"train_loss": -7.201113224029541, "global_step": 188781, "epoch": 4494} {"train_loss": -7.076136112213135, "global_step": 188782, "epoch": 4494} {"train_loss": -7.135906219482422, "global_step": 188783, "epoch": 4494} {"train_loss": -7.1715497970581055, "global_step": 188784, "epoch": 4494} {"train_loss": -7.039853096008301, "global_step": 188785, "epoch": 4494} {"train_loss": -7.042179584503174, "global_step": 188786, "epoch": 4494} {"train_loss": -7.238503456115723, "global_step": 188787, "epoch": 4494} {"train_loss": -6.909449100494385, "global_step": 188788, "epoch": 4494} {"train_loss": -7.241411765416463, "global_step": 188789, "epoch": 4494, "val_loss": 81204.859375} {"train_loss": -7.042660236358643, "global_step": 188790, "epoch": 4495} {"train_loss": -7.075740337371826, "global_step": 188791, "epoch": 4495} {"train_loss": -7.041985511779785, "global_step": 188792, "epoch": 4495} {"train_loss": -7.03563928604126, "global_step": 188793, "epoch": 4495} {"train_loss": -6.972123146057129, "global_step": 188794, "epoch": 4495} {"train_loss": -7.097563743591309, "global_step": 188795, "epoch": 4495} {"train_loss": -7.183377265930176, "global_step": 188796, "epoch": 4495} {"train_loss": -7.209787368774414, "global_step": 188797, "epoch": 4495} {"train_loss": -7.172012805938721, "global_step": 188798, "epoch": 4495} {"train_loss": -7.1083784103393555, "global_step": 188799, "epoch": 4495} {"train_loss": -7.195337295532227, "global_step": 188800, "epoch": 4495} {"train_loss": -7.111955642700195, "global_step": 188801, "epoch": 4495} {"train_loss": -7.218102931976318, "global_step": 188802, "epoch": 4495} {"train_loss": -7.203853130340576, "global_step": 188803, "epoch": 4495} {"train_loss": -7.115655899047852, "global_step": 188804, "epoch": 4495} {"train_loss": -7.265251636505127, "global_step": 188805, "epoch": 4495} {"train_loss": -7.115842819213867, "global_step": 188806, "epoch": 4495} {"train_loss": -7.305798530578613, "global_step": 188807, "epoch": 4495} {"train_loss": -7.240866661071777, "global_step": 188808, "epoch": 4495} {"train_loss": -7.273677825927734, "global_step": 188809, "epoch": 4495} {"train_loss": -7.370574951171875, "global_step": 188810, "epoch": 4495} {"train_loss": -7.263430595397949, "global_step": 188811, "epoch": 4495} {"train_loss": -7.209629058837891, "global_step": 188812, "epoch": 4495} {"train_loss": -7.238692760467529, "global_step": 188813, "epoch": 4495} {"train_loss": -7.230524063110352, "global_step": 188814, "epoch": 4495} {"train_loss": -7.227675437927246, "global_step": 188815, "epoch": 4495} {"train_loss": -7.226230621337891, "global_step": 188816, "epoch": 4495} {"train_loss": -7.179941654205322, "global_step": 188817, "epoch": 4495} {"train_loss": -7.392569541931152, "global_step": 188818, "epoch": 4495} {"train_loss": -7.278890609741211, "global_step": 188819, "epoch": 4495} {"train_loss": -7.168646335601807, "global_step": 188820, "epoch": 4495} {"train_loss": -7.229162216186523, "global_step": 188821, "epoch": 4495} {"train_loss": -7.182720184326172, "global_step": 188822, "epoch": 4495} {"train_loss": -7.3067946434021, "global_step": 188823, "epoch": 4495} {"train_loss": -7.240050315856934, "global_step": 188824, "epoch": 4495} {"train_loss": -7.2521562576293945, "global_step": 188825, "epoch": 4495} {"train_loss": -7.252891540527344, "global_step": 188826, "epoch": 4495} {"train_loss": -7.128105163574219, "global_step": 188827, "epoch": 4495} {"train_loss": -7.226872444152832, "global_step": 188828, "epoch": 4495} {"train_loss": -7.296234607696533, "global_step": 188829, "epoch": 4495} {"train_loss": -7.209468841552734, "global_step": 188830, "epoch": 4495} {"train_loss": -7.196168967655727, "global_step": 188831, "epoch": 4495, "val_loss": 81021.1953125} {"train_loss": -7.21856689453125, "global_step": 188832, "epoch": 4496} {"train_loss": -7.251981258392334, "global_step": 188833, "epoch": 4496} {"train_loss": -7.214047431945801, "global_step": 188834, "epoch": 4496} {"train_loss": -7.294514179229736, "global_step": 188835, "epoch": 4496} {"train_loss": -7.1591596603393555, "global_step": 188836, "epoch": 4496} {"train_loss": -7.291991233825684, "global_step": 188837, "epoch": 4496} {"train_loss": -7.352041244506836, "global_step": 188838, "epoch": 4496} {"train_loss": -7.210020065307617, "global_step": 188839, "epoch": 4496} {"train_loss": -7.220674514770508, "global_step": 188840, "epoch": 4496} {"train_loss": -7.138937473297119, "global_step": 188841, "epoch": 4496} {"train_loss": -7.235679626464844, "global_step": 188842, "epoch": 4496} {"train_loss": -7.349575519561768, "global_step": 188843, "epoch": 4496} {"train_loss": -7.24885368347168, "global_step": 188844, "epoch": 4496} {"train_loss": -7.149331569671631, "global_step": 188845, "epoch": 4496} {"train_loss": -7.373849391937256, "global_step": 188846, "epoch": 4496} {"train_loss": -7.292257308959961, "global_step": 188847, "epoch": 4496} {"train_loss": -7.404623031616211, "global_step": 188848, "epoch": 4496} {"train_loss": -7.226381301879883, "global_step": 188849, "epoch": 4496} {"train_loss": -7.296753883361816, "global_step": 188850, "epoch": 4496} {"train_loss": -7.190989971160889, "global_step": 188851, "epoch": 4496} {"train_loss": -7.33007287979126, "global_step": 188852, "epoch": 4496} {"train_loss": -7.214948654174805, "global_step": 188853, "epoch": 4496} {"train_loss": -7.260615348815918, "global_step": 188854, "epoch": 4496} {"train_loss": -7.243938446044922, "global_step": 188855, "epoch": 4496} {"train_loss": -7.269346237182617, "global_step": 188856, "epoch": 4496} {"train_loss": -7.1876935958862305, "global_step": 188857, "epoch": 4496} {"train_loss": -7.182698726654053, "global_step": 188858, "epoch": 4496} {"train_loss": -7.279630184173584, "global_step": 188859, "epoch": 4496} {"train_loss": -7.071120262145996, "global_step": 188860, "epoch": 4496} {"train_loss": -7.06865119934082, "global_step": 188861, "epoch": 4496} {"train_loss": -7.246207237243652, "global_step": 188862, "epoch": 4496} {"train_loss": -7.144956588745117, "global_step": 188863, "epoch": 4496} {"train_loss": -7.237881660461426, "global_step": 188864, "epoch": 4496} {"train_loss": -7.3019022941589355, "global_step": 188865, "epoch": 4496} {"train_loss": -7.146769046783447, "global_step": 188866, "epoch": 4496} {"train_loss": -7.207796096801758, "global_step": 188867, "epoch": 4496} {"train_loss": -7.212695121765137, "global_step": 188868, "epoch": 4496} {"train_loss": -7.073564529418945, "global_step": 188869, "epoch": 4496} {"train_loss": -7.188393592834473, "global_step": 188870, "epoch": 4496} {"train_loss": -7.170463562011719, "global_step": 188871, "epoch": 4496} {"train_loss": -7.113911151885986, "global_step": 188872, "epoch": 4496} {"train_loss": -7.225067479269845, "global_step": 188873, "epoch": 4496, "val_loss": 80865.3125} {"train_loss": -7.250676155090332, "global_step": 188874, "epoch": 4497} {"train_loss": -7.165811538696289, "global_step": 188875, "epoch": 4497} {"train_loss": -7.144250869750977, "global_step": 188876, "epoch": 4497} {"train_loss": -7.292522430419922, "global_step": 188877, "epoch": 4497} {"train_loss": -7.201468467712402, "global_step": 188878, "epoch": 4497} {"train_loss": -7.311717987060547, "global_step": 188879, "epoch": 4497} {"train_loss": -7.2784929275512695, "global_step": 188880, "epoch": 4497} {"train_loss": -7.226768493652344, "global_step": 188881, "epoch": 4497} {"train_loss": -7.24397087097168, "global_step": 188882, "epoch": 4497} {"train_loss": -7.228947639465332, "global_step": 188883, "epoch": 4497} {"train_loss": -7.247134208679199, "global_step": 188884, "epoch": 4497} {"train_loss": -7.195632457733154, "global_step": 188885, "epoch": 4497} {"train_loss": -7.27262020111084, "global_step": 188886, "epoch": 4497} {"train_loss": -7.246869087219238, "global_step": 188887, "epoch": 4497} {"train_loss": -7.14178991317749, "global_step": 188888, "epoch": 4497} {"train_loss": -7.177394866943359, "global_step": 188889, "epoch": 4497} {"train_loss": -7.171780109405518, "global_step": 188890, "epoch": 4497} {"train_loss": -7.22893762588501, "global_step": 188891, "epoch": 4497} {"train_loss": -7.186572074890137, "global_step": 188892, "epoch": 4497} {"train_loss": -7.165838718414307, "global_step": 188893, "epoch": 4497} {"train_loss": -7.248184680938721, "global_step": 188894, "epoch": 4497} {"train_loss": -7.118192672729492, "global_step": 188895, "epoch": 4497} {"train_loss": -7.221551418304443, "global_step": 188896, "epoch": 4497} {"train_loss": -7.229635238647461, "global_step": 188897, "epoch": 4497} {"train_loss": -7.1368818283081055, "global_step": 188898, "epoch": 4497} {"train_loss": -7.199338436126709, "global_step": 188899, "epoch": 4497} {"train_loss": -7.183860778808594, "global_step": 188900, "epoch": 4497} {"train_loss": -7.226475238800049, "global_step": 188901, "epoch": 4497} {"train_loss": -7.287853240966797, "global_step": 188902, "epoch": 4497} {"train_loss": -7.263859748840332, "global_step": 188903, "epoch": 4497} {"train_loss": -7.229950904846191, "global_step": 188904, "epoch": 4497} {"train_loss": -7.268240451812744, "global_step": 188905, "epoch": 4497} {"train_loss": -7.133886814117432, "global_step": 188906, "epoch": 4497} {"train_loss": -7.194404602050781, "global_step": 188907, "epoch": 4497} {"train_loss": -7.1983418464660645, "global_step": 188908, "epoch": 4497} {"train_loss": -7.083142280578613, "global_step": 188909, "epoch": 4497} {"train_loss": -7.233933448791504, "global_step": 188910, "epoch": 4497} {"train_loss": -7.235867023468018, "global_step": 188911, "epoch": 4497} {"train_loss": -7.196690559387207, "global_step": 188912, "epoch": 4497} {"train_loss": -7.079593658447266, "global_step": 188913, "epoch": 4497} {"train_loss": -7.148005962371826, "global_step": 188914, "epoch": 4497} {"train_loss": -7.210461537043254, "global_step": 188915, "epoch": 4497, "val_loss": 81192.734375} {"train_loss": -7.156079292297363, "global_step": 188916, "epoch": 4498} {"train_loss": -7.09627103805542, "global_step": 188917, "epoch": 4498} {"train_loss": -7.260665416717529, "global_step": 188918, "epoch": 4498} {"train_loss": -7.12398099899292, "global_step": 188919, "epoch": 4498} {"train_loss": -7.064022064208984, "global_step": 188920, "epoch": 4498} {"train_loss": -7.162086486816406, "global_step": 188921, "epoch": 4498} {"train_loss": -7.195635795593262, "global_step": 188922, "epoch": 4498} {"train_loss": -7.13109016418457, "global_step": 188923, "epoch": 4498} {"train_loss": -7.217076301574707, "global_step": 188924, "epoch": 4498} {"train_loss": -7.28860330581665, "global_step": 188925, "epoch": 4498} {"train_loss": -7.231966018676758, "global_step": 188926, "epoch": 4498} {"train_loss": -7.227057933807373, "global_step": 188927, "epoch": 4498} {"train_loss": -7.2106828689575195, "global_step": 188928, "epoch": 4498} {"train_loss": -7.1108717918396, "global_step": 188929, "epoch": 4498} {"train_loss": -7.271756172180176, "global_step": 188930, "epoch": 4498} {"train_loss": -7.158779144287109, "global_step": 188931, "epoch": 4498} {"train_loss": -7.2083659172058105, "global_step": 188932, "epoch": 4498} {"train_loss": -7.235038757324219, "global_step": 188933, "epoch": 4498} {"train_loss": -7.199588775634766, "global_step": 188934, "epoch": 4498} {"train_loss": -7.229884147644043, "global_step": 188935, "epoch": 4498} {"train_loss": -7.149881839752197, "global_step": 188936, "epoch": 4498} {"train_loss": -7.283113956451416, "global_step": 188937, "epoch": 4498} {"train_loss": -7.20339298248291, "global_step": 188938, "epoch": 4498} {"train_loss": -7.110136032104492, "global_step": 188939, "epoch": 4498} {"train_loss": -7.168127059936523, "global_step": 188940, "epoch": 4498} {"train_loss": -7.0744709968566895, "global_step": 188941, "epoch": 4498} {"train_loss": -7.287569046020508, "global_step": 188942, "epoch": 4498} {"train_loss": -7.278133869171143, "global_step": 188943, "epoch": 4498} {"train_loss": -7.224034309387207, "global_step": 188944, "epoch": 4498} {"train_loss": -7.186149597167969, "global_step": 188945, "epoch": 4498} {"train_loss": -7.210102081298828, "global_step": 188946, "epoch": 4498} {"train_loss": -7.227097034454346, "global_step": 188947, "epoch": 4498} {"train_loss": -7.1690826416015625, "global_step": 188948, "epoch": 4498} {"train_loss": -7.197877407073975, "global_step": 188949, "epoch": 4498} {"train_loss": -7.344773292541504, "global_step": 188950, "epoch": 4498} {"train_loss": -7.2949299812316895, "global_step": 188951, "epoch": 4498} {"train_loss": -7.231975555419922, "global_step": 188952, "epoch": 4498} {"train_loss": -7.30219030380249, "global_step": 188953, "epoch": 4498} {"train_loss": -7.244572639465332, "global_step": 188954, "epoch": 4498} {"train_loss": -7.144349098205566, "global_step": 188955, "epoch": 4498} {"train_loss": -7.191578388214111, "global_step": 188956, "epoch": 4498} {"train_loss": -7.203261647905622, "global_step": 188957, "epoch": 4498, "val_loss": 81018.359375} {"train_loss": -7.151150703430176, "global_step": 188958, "epoch": 4499} {"train_loss": -7.132912635803223, "global_step": 188959, "epoch": 4499} {"train_loss": -7.332355499267578, "global_step": 188960, "epoch": 4499} {"train_loss": -7.127171039581299, "global_step": 188961, "epoch": 4499} {"train_loss": -7.129072189331055, "global_step": 188962, "epoch": 4499} {"train_loss": -7.234331130981445, "global_step": 188963, "epoch": 4499} {"train_loss": -7.052394866943359, "global_step": 188964, "epoch": 4499} {"train_loss": -7.117918014526367, "global_step": 188965, "epoch": 4499} {"train_loss": -7.200450897216797, "global_step": 188966, "epoch": 4499} {"train_loss": -7.1057515144348145, "global_step": 188967, "epoch": 4499} {"train_loss": -7.31248664855957, "global_step": 188968, "epoch": 4499} {"train_loss": -7.101158142089844, "global_step": 188969, "epoch": 4499} {"train_loss": -7.1779375076293945, "global_step": 188970, "epoch": 4499} {"train_loss": -7.124599933624268, "global_step": 188971, "epoch": 4499} {"train_loss": -7.104654312133789, "global_step": 188972, "epoch": 4499} {"train_loss": -7.063772678375244, "global_step": 188973, "epoch": 4499} {"train_loss": -7.20050048828125, "global_step": 188974, "epoch": 4499} {"train_loss": -7.213590621948242, "global_step": 188975, "epoch": 4499} {"train_loss": -7.107677459716797, "global_step": 188976, "epoch": 4499} {"train_loss": -7.183992385864258, "global_step": 188977, "epoch": 4499} {"train_loss": -7.1547698974609375, "global_step": 188978, "epoch": 4499} {"train_loss": -7.114704608917236, "global_step": 188979, "epoch": 4499} {"train_loss": -7.028189659118652, "global_step": 188980, "epoch": 4499} {"train_loss": -7.015748023986816, "global_step": 188981, "epoch": 4499} {"train_loss": -6.882364749908447, "global_step": 188982, "epoch": 4499} {"train_loss": -6.875877380371094, "global_step": 188983, "epoch": 4499} {"train_loss": -7.02878475189209, "global_step": 188984, "epoch": 4499} {"train_loss": -6.996783256530762, "global_step": 188985, "epoch": 4499} {"train_loss": -7.025609970092773, "global_step": 188986, "epoch": 4499} {"train_loss": -6.986695289611816, "global_step": 188987, "epoch": 4499} {"train_loss": -6.949869155883789, "global_step": 188988, "epoch": 4499} {"train_loss": -7.081136703491211, "global_step": 188989, "epoch": 4499} {"train_loss": -7.011563777923584, "global_step": 188990, "epoch": 4499} {"train_loss": -7.225882053375244, "global_step": 188991, "epoch": 4499} {"train_loss": -7.053328990936279, "global_step": 188992, "epoch": 4499} {"train_loss": -7.015715599060059, "global_step": 188993, "epoch": 4499} {"train_loss": -7.0918169021606445, "global_step": 188994, "epoch": 4499} {"train_loss": -7.112288475036621, "global_step": 188995, "epoch": 4499} {"train_loss": -7.037625312805176, "global_step": 188996, "epoch": 4499} {"train_loss": -7.1403961181640625, "global_step": 188997, "epoch": 4499} {"train_loss": -7.134332656860352, "global_step": 188998, "epoch": 4499} {"train_loss": -7.1017440387180875, "global_step": 188999, "epoch": 4499, "val_loss": 81226.7890625} {"train_loss": -7.168405532836914, "global_step": 189000, "epoch": 4500} {"train_loss": -7.199848175048828, "global_step": 189001, "epoch": 4500} {"train_loss": -7.191949367523193, "global_step": 189002, "epoch": 4500} {"train_loss": -7.251300811767578, "global_step": 189003, "epoch": 4500} {"train_loss": -7.221707820892334, "global_step": 189004, "epoch": 4500} {"train_loss": -7.218236923217773, "global_step": 189005, "epoch": 4500} {"train_loss": -7.090314865112305, "global_step": 189006, "epoch": 4500} {"train_loss": -7.216483116149902, "global_step": 189007, "epoch": 4500} {"train_loss": -7.235064506530762, "global_step": 189008, "epoch": 4500} {"train_loss": -7.305756568908691, "global_step": 189009, "epoch": 4500} {"train_loss": -7.197906970977783, "global_step": 189010, "epoch": 4500} {"train_loss": -7.279273986816406, "global_step": 189011, "epoch": 4500} {"train_loss": -7.284932613372803, "global_step": 189012, "epoch": 4500} {"train_loss": -7.235300064086914, "global_step": 189013, "epoch": 4500} {"train_loss": -7.328404426574707, "global_step": 189014, "epoch": 4500} {"train_loss": -7.18237829208374, "global_step": 189015, "epoch": 4500} {"train_loss": -7.2902398109436035, "global_step": 189016, "epoch": 4500} {"train_loss": -7.1074090003967285, "global_step": 189017, "epoch": 4500} {"train_loss": -7.257139205932617, "global_step": 189018, "epoch": 4500} {"train_loss": -7.1644816398620605, "global_step": 189019, "epoch": 4500} {"train_loss": -7.25640869140625, "global_step": 189020, "epoch": 4500} {"train_loss": -7.264284133911133, "global_step": 189021, "epoch": 4500} {"train_loss": -7.157101631164551, "global_step": 189022, "epoch": 4500} {"train_loss": -7.199492454528809, "global_step": 189023, "epoch": 4500} {"train_loss": -7.346165657043457, "global_step": 189024, "epoch": 4500} {"train_loss": -7.153136730194092, "global_step": 189025, "epoch": 4500} {"train_loss": -7.260478973388672, "global_step": 189026, "epoch": 4500} {"train_loss": -7.260209083557129, "global_step": 189027, "epoch": 4500} {"train_loss": -7.289697647094727, "global_step": 189028, "epoch": 4500} {"train_loss": -7.250952243804932, "global_step": 189029, "epoch": 4500} {"train_loss": -7.326321601867676, "global_step": 189030, "epoch": 4500} {"train_loss": -7.251711368560791, "global_step": 189031, "epoch": 4500} {"train_loss": -7.2888689041137695, "global_step": 189032, "epoch": 4500} {"train_loss": -7.249198913574219, "global_step": 189033, "epoch": 4500} {"train_loss": -7.2190775871276855, "global_step": 189034, "epoch": 4500} {"train_loss": -7.200795650482178, "global_step": 189035, "epoch": 4500} {"train_loss": -7.2605390548706055, "global_step": 189036, "epoch": 4500} {"train_loss": -7.225826740264893, "global_step": 189037, "epoch": 4500} {"train_loss": -7.15765380859375, "global_step": 189038, "epoch": 4500} {"train_loss": -7.237558364868164, "global_step": 189039, "epoch": 4500} {"train_loss": -7.187211036682129, "global_step": 189040, "epoch": 4500} {"train_loss": -7.230357681001935, "global_step": 189041, "epoch": 4500, "train/sim_max_reward_0": 0.8997659983535161, "train/sim_max_reward_1": 0.9441795640768597, "train/sim_max_reward_2": 0.43925121181062493, "train/sim_max_reward_3": 0.13056039451560375, "train/sim_max_reward_4": 0.9550788436671029, "train/sim_max_reward_5": 0.6772025430872686, "test/sim_max_reward_4500000": 0.9174849100469831, "test/sim_max_reward_4500001": 0.7724933254632281, "test/sim_max_reward_4500002": 0.9274559378866373, "test/sim_max_reward_4500003": 0.5279362527292178, "test/sim_max_reward_4500004": 0.22502353369932307, "test/sim_max_reward_4500005": 0.35485528044755804, "test/sim_max_reward_4500006": 0.9373639566090859, "test/sim_max_reward_4500007": 0.780747729384071, "test/sim_max_reward_4500008": 0.3482278656645282, "test/sim_max_reward_4500009": 0.918160507674513, "test/sim_max_reward_4500010": 0.03323826414288851, "test/sim_max_reward_4500011": 0.4495196058234032, "test/sim_max_reward_4500012": 0.9109540208684228, "test/sim_max_reward_4500013": 0.004839149899348276, "test/sim_max_reward_4500014": 0.9940492513605804, "test/sim_max_reward_4500015": 0.9806846307122845, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.037746717495214854, "test/sim_max_reward_4500018": 0.4319194398810529, "test/sim_max_reward_4500019": 0.9857855645111263, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9311222080591658, "test/sim_max_reward_4500022": 0.9397474168707256, "test/sim_max_reward_4500023": 0.8796973890174089, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8188180232314098, "test/sim_max_reward_4500026": 0.862532814201021, "test/sim_max_reward_4500027": 0.9936001087293644, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.06121053259108276, "test/sim_max_reward_4500030": 0.9997702709818301, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 1.0, "test/sim_max_reward_4500034": 0.9326021750006519, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 0.9539637453779686, "test/sim_max_reward_4500037": 0.8745043362730478, "test/sim_max_reward_4500038": 0.33127383514090586, "test/sim_max_reward_4500039": 1.0, "test/sim_max_reward_4500040": 0.9987059623595068, "test/sim_max_reward_4500041": 0.8916426669338937, "test/sim_max_reward_4500042": 0.04134424616855581, "test/sim_max_reward_4500043": 0.5006518401249355, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9453824464987951, "test/sim_max_reward_4500046": 0.24633829608411056, "test/sim_max_reward_4500047": 0.9512410220524369, "test/sim_max_reward_4500048": 0.8754838606077958, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.6743397592518293, "test/mean_score": 0.5968557979540718, "val_loss": 81050.171875} {"train_loss": -7.176827907562256, "global_step": 189042, "epoch": 4501} {"train_loss": -7.401955604553223, "global_step": 189043, "epoch": 4501} {"train_loss": -7.17212438583374, "global_step": 189044, "epoch": 4501} {"train_loss": -6.990608215332031, "global_step": 189045, "epoch": 4501} {"train_loss": -7.238134384155273, "global_step": 189046, "epoch": 4501} {"train_loss": -7.098550796508789, "global_step": 189047, "epoch": 4501} {"train_loss": -7.203351974487305, "global_step": 189048, "epoch": 4501} {"train_loss": -7.175816535949707, "global_step": 189049, "epoch": 4501} {"train_loss": -7.1872148513793945, "global_step": 189050, "epoch": 4501} {"train_loss": -7.203790664672852, "global_step": 189051, "epoch": 4501} {"train_loss": -7.138567924499512, "global_step": 189052, "epoch": 4501} {"train_loss": -7.179747581481934, "global_step": 189053, "epoch": 4501} {"train_loss": -7.198698997497559, "global_step": 189054, "epoch": 4501} {"train_loss": -7.104177474975586, "global_step": 189055, "epoch": 4501} {"train_loss": -7.210756301879883, "global_step": 189056, "epoch": 4501} {"train_loss": -7.213994026184082, "global_step": 189057, "epoch": 4501} {"train_loss": -7.18928861618042, "global_step": 189058, "epoch": 4501} {"train_loss": -7.302069664001465, "global_step": 189059, "epoch": 4501} {"train_loss": -7.16961145401001, "global_step": 189060, "epoch": 4501} {"train_loss": -7.283257961273193, "global_step": 189061, "epoch": 4501} {"train_loss": -7.169835090637207, "global_step": 189062, "epoch": 4501} {"train_loss": -7.269775390625, "global_step": 189063, "epoch": 4501} {"train_loss": -7.2425217628479, "global_step": 189064, "epoch": 4501} {"train_loss": -7.188607692718506, "global_step": 189065, "epoch": 4501} {"train_loss": -7.262226581573486, "global_step": 189066, "epoch": 4501} {"train_loss": -7.164028167724609, "global_step": 189067, "epoch": 4501} {"train_loss": -7.282772064208984, "global_step": 189068, "epoch": 4501} {"train_loss": -7.277754783630371, "global_step": 189069, "epoch": 4501} {"train_loss": -7.203667640686035, "global_step": 189070, "epoch": 4501} {"train_loss": -7.294933319091797, "global_step": 189071, "epoch": 4501} {"train_loss": -7.219013214111328, "global_step": 189072, "epoch": 4501} {"train_loss": -7.254554271697998, "global_step": 189073, "epoch": 4501} {"train_loss": -7.260887145996094, "global_step": 189074, "epoch": 4501} {"train_loss": -7.221463680267334, "global_step": 189075, "epoch": 4501} {"train_loss": -7.268474578857422, "global_step": 189076, "epoch": 4501} {"train_loss": -7.29971981048584, "global_step": 189077, "epoch": 4501} {"train_loss": -7.175952911376953, "global_step": 189078, "epoch": 4501} {"train_loss": -7.311469078063965, "global_step": 189079, "epoch": 4501} {"train_loss": -7.340360641479492, "global_step": 189080, "epoch": 4501} {"train_loss": -7.184142112731934, "global_step": 189081, "epoch": 4501} {"train_loss": -7.291682243347168, "global_step": 189082, "epoch": 4501} {"train_loss": -7.220843156178792, "global_step": 189083, "epoch": 4501, "val_loss": 80888.5625} {"train_loss": -7.192656517028809, "global_step": 189084, "epoch": 4502} {"train_loss": -7.346616744995117, "global_step": 189085, "epoch": 4502} {"train_loss": -7.171921730041504, "global_step": 189086, "epoch": 4502} {"train_loss": -7.131363868713379, "global_step": 189087, "epoch": 4502} {"train_loss": -7.146055221557617, "global_step": 189088, "epoch": 4502} {"train_loss": -7.251248836517334, "global_step": 189089, "epoch": 4502} {"train_loss": -7.085559844970703, "global_step": 189090, "epoch": 4502} {"train_loss": -7.133736610412598, "global_step": 189091, "epoch": 4502} {"train_loss": -7.214519500732422, "global_step": 189092, "epoch": 4502} {"train_loss": -7.094611167907715, "global_step": 189093, "epoch": 4502} {"train_loss": -7.206282615661621, "global_step": 189094, "epoch": 4502} {"train_loss": -7.244509696960449, "global_step": 189095, "epoch": 4502} {"train_loss": -7.058229923248291, "global_step": 189096, "epoch": 4502} {"train_loss": -7.2115159034729, "global_step": 189097, "epoch": 4502} {"train_loss": -7.042904376983643, "global_step": 189098, "epoch": 4502} {"train_loss": -7.166510581970215, "global_step": 189099, "epoch": 4502} {"train_loss": -7.187167167663574, "global_step": 189100, "epoch": 4502} {"train_loss": -7.063991546630859, "global_step": 189101, "epoch": 4502} {"train_loss": -7.2000861167907715, "global_step": 189102, "epoch": 4502} {"train_loss": -7.162594318389893, "global_step": 189103, "epoch": 4502} {"train_loss": -7.22157621383667, "global_step": 189104, "epoch": 4502} {"train_loss": -7.236016750335693, "global_step": 189105, "epoch": 4502} {"train_loss": -7.261955261230469, "global_step": 189106, "epoch": 4502} {"train_loss": -7.197887420654297, "global_step": 189107, "epoch": 4502} {"train_loss": -7.215740203857422, "global_step": 189108, "epoch": 4502} {"train_loss": -7.263967990875244, "global_step": 189109, "epoch": 4502} {"train_loss": -7.176809310913086, "global_step": 189110, "epoch": 4502} {"train_loss": -7.129733562469482, "global_step": 189111, "epoch": 4502} {"train_loss": -7.209709167480469, "global_step": 189112, "epoch": 4502} {"train_loss": -7.133162498474121, "global_step": 189113, "epoch": 4502} {"train_loss": -7.281201362609863, "global_step": 189114, "epoch": 4502} {"train_loss": -7.23922872543335, "global_step": 189115, "epoch": 4502} {"train_loss": -7.187077045440674, "global_step": 189116, "epoch": 4502} {"train_loss": -7.134190559387207, "global_step": 189117, "epoch": 4502} {"train_loss": -7.273369312286377, "global_step": 189118, "epoch": 4502} {"train_loss": -7.069099426269531, "global_step": 189119, "epoch": 4502} {"train_loss": -7.273921012878418, "global_step": 189120, "epoch": 4502} {"train_loss": -7.166894912719727, "global_step": 189121, "epoch": 4502} {"train_loss": -7.263042449951172, "global_step": 189122, "epoch": 4502} {"train_loss": -7.12777042388916, "global_step": 189123, "epoch": 4502} {"train_loss": -7.0294189453125, "global_step": 189124, "epoch": 4502} {"train_loss": -7.179847036089216, "global_step": 189125, "epoch": 4502, "val_loss": 81326.8125} {"train_loss": -7.023268222808838, "global_step": 189126, "epoch": 4503} {"train_loss": -7.136816024780273, "global_step": 189127, "epoch": 4503} {"train_loss": -7.108386039733887, "global_step": 189128, "epoch": 4503} {"train_loss": -7.1490936279296875, "global_step": 189129, "epoch": 4503} {"train_loss": -7.1947736740112305, "global_step": 189130, "epoch": 4503} {"train_loss": -7.08497428894043, "global_step": 189131, "epoch": 4503} {"train_loss": -7.087549209594727, "global_step": 189132, "epoch": 4503} {"train_loss": -6.976953506469727, "global_step": 189133, "epoch": 4503} {"train_loss": -7.221085548400879, "global_step": 189134, "epoch": 4503} {"train_loss": -7.205606460571289, "global_step": 189135, "epoch": 4503} {"train_loss": -7.133425712585449, "global_step": 189136, "epoch": 4503} {"train_loss": -7.26825475692749, "global_step": 189137, "epoch": 4503} {"train_loss": -7.169368743896484, "global_step": 189138, "epoch": 4503} {"train_loss": -7.135031700134277, "global_step": 189139, "epoch": 4503} {"train_loss": -7.1357197761535645, "global_step": 189140, "epoch": 4503} {"train_loss": -7.101377010345459, "global_step": 189141, "epoch": 4503} {"train_loss": -7.131410121917725, "global_step": 189142, "epoch": 4503} {"train_loss": -7.180488586425781, "global_step": 189143, "epoch": 4503} {"train_loss": -7.094392776489258, "global_step": 189144, "epoch": 4503} {"train_loss": -7.198213577270508, "global_step": 189145, "epoch": 4503} {"train_loss": -7.198520660400391, "global_step": 189146, "epoch": 4503} {"train_loss": -7.227115631103516, "global_step": 189147, "epoch": 4503} {"train_loss": -7.0880937576293945, "global_step": 189148, "epoch": 4503} {"train_loss": -7.101024627685547, "global_step": 189149, "epoch": 4503} {"train_loss": -7.231987953186035, "global_step": 189150, "epoch": 4503} {"train_loss": -7.192200660705566, "global_step": 189151, "epoch": 4503} {"train_loss": -7.225038528442383, "global_step": 189152, "epoch": 4503} {"train_loss": -7.2983245849609375, "global_step": 189153, "epoch": 4503} {"train_loss": -7.216763019561768, "global_step": 189154, "epoch": 4503} {"train_loss": -7.111438751220703, "global_step": 189155, "epoch": 4503} {"train_loss": -7.163901329040527, "global_step": 189156, "epoch": 4503} {"train_loss": -7.07135534286499, "global_step": 189157, "epoch": 4503} {"train_loss": -6.892186164855957, "global_step": 189158, "epoch": 4503} {"train_loss": -7.247903823852539, "global_step": 189159, "epoch": 4503} {"train_loss": -7.043205738067627, "global_step": 189160, "epoch": 4503} {"train_loss": -7.054492950439453, "global_step": 189161, "epoch": 4503} {"train_loss": -7.130313873291016, "global_step": 189162, "epoch": 4503} {"train_loss": -7.1375274658203125, "global_step": 189163, "epoch": 4503} {"train_loss": -7.116137504577637, "global_step": 189164, "epoch": 4503} {"train_loss": -7.087496280670166, "global_step": 189165, "epoch": 4503} {"train_loss": -7.002613067626953, "global_step": 189166, "epoch": 4503} {"train_loss": -7.136544363839286, "global_step": 189167, "epoch": 4503, "val_loss": 80946.7890625} {"train_loss": -7.0781755447387695, "global_step": 189168, "epoch": 4504} {"train_loss": -7.139870643615723, "global_step": 189169, "epoch": 4504} {"train_loss": -7.20540714263916, "global_step": 189170, "epoch": 4504} {"train_loss": -7.331942558288574, "global_step": 189171, "epoch": 4504} {"train_loss": -7.166213512420654, "global_step": 189172, "epoch": 4504} {"train_loss": -7.304156303405762, "global_step": 189173, "epoch": 4504} {"train_loss": -7.131897926330566, "global_step": 189174, "epoch": 4504} {"train_loss": -7.273863792419434, "global_step": 189175, "epoch": 4504} {"train_loss": -7.3346967697143555, "global_step": 189176, "epoch": 4504} {"train_loss": -7.339995384216309, "global_step": 189177, "epoch": 4504} {"train_loss": -7.160175323486328, "global_step": 189178, "epoch": 4504} {"train_loss": -7.1476640701293945, "global_step": 189179, "epoch": 4504} {"train_loss": -7.167353630065918, "global_step": 189180, "epoch": 4504} {"train_loss": -7.428372383117676, "global_step": 189181, "epoch": 4504} {"train_loss": -7.182250499725342, "global_step": 189182, "epoch": 4504} {"train_loss": -7.159723281860352, "global_step": 189183, "epoch": 4504} {"train_loss": -7.162939071655273, "global_step": 189184, "epoch": 4504} {"train_loss": -7.251856327056885, "global_step": 189185, "epoch": 4504} {"train_loss": -7.257754325866699, "global_step": 189186, "epoch": 4504} {"train_loss": -7.276895999908447, "global_step": 189187, "epoch": 4504} {"train_loss": -7.179525852203369, "global_step": 189188, "epoch": 4504} {"train_loss": -7.162165641784668, "global_step": 189189, "epoch": 4504} {"train_loss": -7.362173080444336, "global_step": 189190, "epoch": 4504} {"train_loss": -7.177977561950684, "global_step": 189191, "epoch": 4504} {"train_loss": -7.202032089233398, "global_step": 189192, "epoch": 4504} {"train_loss": -7.284294128417969, "global_step": 189193, "epoch": 4504} {"train_loss": -7.26512336730957, "global_step": 189194, "epoch": 4504} {"train_loss": -7.254171371459961, "global_step": 189195, "epoch": 4504} {"train_loss": -7.216867446899414, "global_step": 189196, "epoch": 4504} {"train_loss": -7.201810836791992, "global_step": 189197, "epoch": 4504} {"train_loss": -7.32266902923584, "global_step": 189198, "epoch": 4504} {"train_loss": -7.194794178009033, "global_step": 189199, "epoch": 4504} {"train_loss": -7.2173871994018555, "global_step": 189200, "epoch": 4504} {"train_loss": -7.171768665313721, "global_step": 189201, "epoch": 4504} {"train_loss": -7.196459770202637, "global_step": 189202, "epoch": 4504} {"train_loss": -7.264565467834473, "global_step": 189203, "epoch": 4504} {"train_loss": -7.193567276000977, "global_step": 189204, "epoch": 4504} {"train_loss": -7.1412811279296875, "global_step": 189205, "epoch": 4504} {"train_loss": -7.13032865524292, "global_step": 189206, "epoch": 4504} {"train_loss": -7.127871513366699, "global_step": 189207, "epoch": 4504} {"train_loss": -7.330817699432373, "global_step": 189208, "epoch": 4504} {"train_loss": -7.220521847407023, "global_step": 189209, "epoch": 4504, "val_loss": 80867.8984375} {"train_loss": -7.258086681365967, "global_step": 189210, "epoch": 4505} {"train_loss": -7.2125139236450195, "global_step": 189211, "epoch": 4505} {"train_loss": -7.262971878051758, "global_step": 189212, "epoch": 4505} {"train_loss": -7.26359748840332, "global_step": 189213, "epoch": 4505} {"train_loss": -7.146385669708252, "global_step": 189214, "epoch": 4505} {"train_loss": -7.300325393676758, "global_step": 189215, "epoch": 4505} {"train_loss": -7.170929908752441, "global_step": 189216, "epoch": 4505} {"train_loss": -7.215818405151367, "global_step": 189217, "epoch": 4505} {"train_loss": -7.274587154388428, "global_step": 189218, "epoch": 4505} {"train_loss": -7.077676773071289, "global_step": 189219, "epoch": 4505} {"train_loss": -7.141955852508545, "global_step": 189220, "epoch": 4505} {"train_loss": -7.270108222961426, "global_step": 189221, "epoch": 4505} {"train_loss": -7.154862403869629, "global_step": 189222, "epoch": 4505} {"train_loss": -7.226759910583496, "global_step": 189223, "epoch": 4505} {"train_loss": -7.2770094871521, "global_step": 189224, "epoch": 4505} {"train_loss": -7.122679233551025, "global_step": 189225, "epoch": 4505} {"train_loss": -7.272571563720703, "global_step": 189226, "epoch": 4505} {"train_loss": -7.0701189041137695, "global_step": 189227, "epoch": 4505} {"train_loss": -7.152460098266602, "global_step": 189228, "epoch": 4505} {"train_loss": -7.143056869506836, "global_step": 189229, "epoch": 4505} {"train_loss": -7.155734062194824, "global_step": 189230, "epoch": 4505} {"train_loss": -7.144707679748535, "global_step": 189231, "epoch": 4505} {"train_loss": -7.059659481048584, "global_step": 189232, "epoch": 4505} {"train_loss": -6.944478511810303, "global_step": 189233, "epoch": 4505} {"train_loss": -7.179752349853516, "global_step": 189234, "epoch": 4505} {"train_loss": -7.0348310470581055, "global_step": 189235, "epoch": 4505} {"train_loss": -6.983179092407227, "global_step": 189236, "epoch": 4505} {"train_loss": -7.096654891967773, "global_step": 189237, "epoch": 4505} {"train_loss": -7.085309982299805, "global_step": 189238, "epoch": 4505} {"train_loss": -7.10488224029541, "global_step": 189239, "epoch": 4505} {"train_loss": -7.231470108032227, "global_step": 189240, "epoch": 4505} {"train_loss": -7.114317893981934, "global_step": 189241, "epoch": 4505} {"train_loss": -7.137228012084961, "global_step": 189242, "epoch": 4505} {"train_loss": -7.179419994354248, "global_step": 189243, "epoch": 4505} {"train_loss": -7.207510948181152, "global_step": 189244, "epoch": 4505} {"train_loss": -7.2373046875, "global_step": 189245, "epoch": 4505} {"train_loss": -7.196422576904297, "global_step": 189246, "epoch": 4505} {"train_loss": -7.235856056213379, "global_step": 189247, "epoch": 4505} {"train_loss": -7.300647735595703, "global_step": 189248, "epoch": 4505} {"train_loss": -7.142740249633789, "global_step": 189249, "epoch": 4505} {"train_loss": -7.241842269897461, "global_step": 189250, "epoch": 4505} {"train_loss": -7.172912347884405, "global_step": 189251, "epoch": 4505, "val_loss": 80763.953125} {"train_loss": -7.326342582702637, "global_step": 189252, "epoch": 4506} {"train_loss": -7.199212074279785, "global_step": 189253, "epoch": 4506} {"train_loss": -7.2289934158325195, "global_step": 189254, "epoch": 4506} {"train_loss": -7.258658409118652, "global_step": 189255, "epoch": 4506} {"train_loss": -7.210235595703125, "global_step": 189256, "epoch": 4506} {"train_loss": -7.267352104187012, "global_step": 189257, "epoch": 4506} {"train_loss": -7.1594557762146, "global_step": 189258, "epoch": 4506} {"train_loss": -7.0453901290893555, "global_step": 189259, "epoch": 4506} {"train_loss": -7.284156799316406, "global_step": 189260, "epoch": 4506} {"train_loss": -7.247357368469238, "global_step": 189261, "epoch": 4506} {"train_loss": -7.105416297912598, "global_step": 189262, "epoch": 4506} {"train_loss": -7.196128845214844, "global_step": 189263, "epoch": 4506} {"train_loss": -7.237154006958008, "global_step": 189264, "epoch": 4506} {"train_loss": -7.075788497924805, "global_step": 189265, "epoch": 4506} {"train_loss": -7.180673122406006, "global_step": 189266, "epoch": 4506} {"train_loss": -7.131731033325195, "global_step": 189267, "epoch": 4506} {"train_loss": -7.259466648101807, "global_step": 189268, "epoch": 4506} {"train_loss": -7.042808532714844, "global_step": 189269, "epoch": 4506} {"train_loss": -7.156088352203369, "global_step": 189270, "epoch": 4506} {"train_loss": -7.25844669342041, "global_step": 189271, "epoch": 4506} {"train_loss": -7.142270088195801, "global_step": 189272, "epoch": 4506} {"train_loss": -7.21654748916626, "global_step": 189273, "epoch": 4506} {"train_loss": -7.1252031326293945, "global_step": 189274, "epoch": 4506} {"train_loss": -7.148166656494141, "global_step": 189275, "epoch": 4506} {"train_loss": -7.1975908279418945, "global_step": 189276, "epoch": 4506} {"train_loss": -7.099189758300781, "global_step": 189277, "epoch": 4506} {"train_loss": -7.089045524597168, "global_step": 189278, "epoch": 4506} {"train_loss": -7.093408584594727, "global_step": 189279, "epoch": 4506} {"train_loss": -7.076469898223877, "global_step": 189280, "epoch": 4506} {"train_loss": -7.1107635498046875, "global_step": 189281, "epoch": 4506} {"train_loss": -7.111453533172607, "global_step": 189282, "epoch": 4506} {"train_loss": -7.167356967926025, "global_step": 189283, "epoch": 4506} {"train_loss": -7.100307464599609, "global_step": 189284, "epoch": 4506} {"train_loss": -7.098680019378662, "global_step": 189285, "epoch": 4506} {"train_loss": -7.039946556091309, "global_step": 189286, "epoch": 4506} {"train_loss": -7.086936950683594, "global_step": 189287, "epoch": 4506} {"train_loss": -7.092429161071777, "global_step": 189288, "epoch": 4506} {"train_loss": -7.032678604125977, "global_step": 189289, "epoch": 4506} {"train_loss": -7.112451076507568, "global_step": 189290, "epoch": 4506} {"train_loss": -7.137561321258545, "global_step": 189291, "epoch": 4506} {"train_loss": -7.185900688171387, "global_step": 189292, "epoch": 4506} {"train_loss": -7.154140256700062, "global_step": 189293, "epoch": 4506, "val_loss": 80958.234375} {"train_loss": -7.203328609466553, "global_step": 189294, "epoch": 4507} {"train_loss": -7.043524742126465, "global_step": 189295, "epoch": 4507} {"train_loss": -7.1222076416015625, "global_step": 189296, "epoch": 4507} {"train_loss": -7.112812519073486, "global_step": 189297, "epoch": 4507} {"train_loss": -7.145788192749023, "global_step": 189298, "epoch": 4507} {"train_loss": -7.174506187438965, "global_step": 189299, "epoch": 4507} {"train_loss": -7.21249532699585, "global_step": 189300, "epoch": 4507} {"train_loss": -7.184770584106445, "global_step": 189301, "epoch": 4507} {"train_loss": -7.225714683532715, "global_step": 189302, "epoch": 4507} {"train_loss": -7.2500691413879395, "global_step": 189303, "epoch": 4507} {"train_loss": -7.258444786071777, "global_step": 189304, "epoch": 4507} {"train_loss": -7.333800315856934, "global_step": 189305, "epoch": 4507} {"train_loss": -7.255313873291016, "global_step": 189306, "epoch": 4507} {"train_loss": -7.257168769836426, "global_step": 189307, "epoch": 4507} {"train_loss": -7.2117815017700195, "global_step": 189308, "epoch": 4507} {"train_loss": -7.284813404083252, "global_step": 189309, "epoch": 4507} {"train_loss": -7.2218828201293945, "global_step": 189310, "epoch": 4507} {"train_loss": -7.352399826049805, "global_step": 189311, "epoch": 4507} {"train_loss": -7.26865291595459, "global_step": 189312, "epoch": 4507} {"train_loss": -7.138091087341309, "global_step": 189313, "epoch": 4507} {"train_loss": -7.209974765777588, "global_step": 189314, "epoch": 4507} {"train_loss": -7.191070556640625, "global_step": 189315, "epoch": 4507} {"train_loss": -7.315426826477051, "global_step": 189316, "epoch": 4507} {"train_loss": -7.288901329040527, "global_step": 189317, "epoch": 4507} {"train_loss": -7.3336687088012695, "global_step": 189318, "epoch": 4507} {"train_loss": -7.26763916015625, "global_step": 189319, "epoch": 4507} {"train_loss": -7.2661919593811035, "global_step": 189320, "epoch": 4507} {"train_loss": -7.203726291656494, "global_step": 189321, "epoch": 4507} {"train_loss": -7.197731018066406, "global_step": 189322, "epoch": 4507} {"train_loss": -7.305095672607422, "global_step": 189323, "epoch": 4507} {"train_loss": -7.219057083129883, "global_step": 189324, "epoch": 4507} {"train_loss": -7.245791435241699, "global_step": 189325, "epoch": 4507} {"train_loss": -7.191801071166992, "global_step": 189326, "epoch": 4507} {"train_loss": -7.314711570739746, "global_step": 189327, "epoch": 4507} {"train_loss": -7.353298187255859, "global_step": 189328, "epoch": 4507} {"train_loss": -7.205019474029541, "global_step": 189329, "epoch": 4507} {"train_loss": -7.183150768280029, "global_step": 189330, "epoch": 4507} {"train_loss": -7.206455230712891, "global_step": 189331, "epoch": 4507} {"train_loss": -7.346667289733887, "global_step": 189332, "epoch": 4507} {"train_loss": -7.331831932067871, "global_step": 189333, "epoch": 4507} {"train_loss": -7.286202430725098, "global_step": 189334, "epoch": 4507} {"train_loss": -7.23873325756618, "global_step": 189335, "epoch": 4507, "val_loss": 80892.2734375} {"train_loss": -7.279607772827148, "global_step": 189336, "epoch": 4508} {"train_loss": -7.28228759765625, "global_step": 189337, "epoch": 4508} {"train_loss": -7.404224395751953, "global_step": 189338, "epoch": 4508} {"train_loss": -7.294036865234375, "global_step": 189339, "epoch": 4508} {"train_loss": -7.289002418518066, "global_step": 189340, "epoch": 4508} {"train_loss": -7.240334510803223, "global_step": 189341, "epoch": 4508} {"train_loss": -7.286869049072266, "global_step": 189342, "epoch": 4508} {"train_loss": -7.332780838012695, "global_step": 189343, "epoch": 4508} {"train_loss": -7.266125679016113, "global_step": 189344, "epoch": 4508} {"train_loss": -7.334659099578857, "global_step": 189345, "epoch": 4508} {"train_loss": -7.379456520080566, "global_step": 189346, "epoch": 4508} {"train_loss": -7.315280914306641, "global_step": 189347, "epoch": 4508} {"train_loss": -7.317961692810059, "global_step": 189348, "epoch": 4508} {"train_loss": -7.211884498596191, "global_step": 189349, "epoch": 4508} {"train_loss": -7.203444480895996, "global_step": 189350, "epoch": 4508} {"train_loss": -7.2931227684021, "global_step": 189351, "epoch": 4508} {"train_loss": -7.089358806610107, "global_step": 189352, "epoch": 4508} {"train_loss": -7.1116180419921875, "global_step": 189353, "epoch": 4508} {"train_loss": -7.216799736022949, "global_step": 189354, "epoch": 4508} {"train_loss": -7.251519203186035, "global_step": 189355, "epoch": 4508} {"train_loss": -7.145752429962158, "global_step": 189356, "epoch": 4508} {"train_loss": -7.239190101623535, "global_step": 189357, "epoch": 4508} {"train_loss": -7.1722211837768555, "global_step": 189358, "epoch": 4508} {"train_loss": -7.216747283935547, "global_step": 189359, "epoch": 4508} {"train_loss": -7.11929988861084, "global_step": 189360, "epoch": 4508} {"train_loss": -7.232835292816162, "global_step": 189361, "epoch": 4508} {"train_loss": -7.1353654861450195, "global_step": 189362, "epoch": 4508} {"train_loss": -7.167207717895508, "global_step": 189363, "epoch": 4508} {"train_loss": -7.234870910644531, "global_step": 189364, "epoch": 4508} {"train_loss": -7.245847702026367, "global_step": 189365, "epoch": 4508} {"train_loss": -7.21572732925415, "global_step": 189366, "epoch": 4508} {"train_loss": -7.15274715423584, "global_step": 189367, "epoch": 4508} {"train_loss": -7.238056182861328, "global_step": 189368, "epoch": 4508} {"train_loss": -7.1351118087768555, "global_step": 189369, "epoch": 4508} {"train_loss": -7.243521690368652, "global_step": 189370, "epoch": 4508} {"train_loss": -7.16942024230957, "global_step": 189371, "epoch": 4508} {"train_loss": -7.217548370361328, "global_step": 189372, "epoch": 4508} {"train_loss": -7.23376989364624, "global_step": 189373, "epoch": 4508} {"train_loss": -7.0917229652404785, "global_step": 189374, "epoch": 4508} {"train_loss": -7.192898750305176, "global_step": 189375, "epoch": 4508} {"train_loss": -7.164338111877441, "global_step": 189376, "epoch": 4508} {"train_loss": -7.225028003965106, "global_step": 189377, "epoch": 4508, "val_loss": 81324.0} {"train_loss": -7.076591968536377, "global_step": 189378, "epoch": 4509} {"train_loss": -7.254323959350586, "global_step": 189379, "epoch": 4509} {"train_loss": -7.021008491516113, "global_step": 189380, "epoch": 4509} {"train_loss": -7.09618616104126, "global_step": 189381, "epoch": 4509} {"train_loss": -7.141061782836914, "global_step": 189382, "epoch": 4509} {"train_loss": -7.016279697418213, "global_step": 189383, "epoch": 4509} {"train_loss": -7.167170524597168, "global_step": 189384, "epoch": 4509} {"train_loss": -7.16779088973999, "global_step": 189385, "epoch": 4509} {"train_loss": -7.108633995056152, "global_step": 189386, "epoch": 4509} {"train_loss": -7.19432258605957, "global_step": 189387, "epoch": 4509} {"train_loss": -7.222641944885254, "global_step": 189388, "epoch": 4509} {"train_loss": -7.1162309646606445, "global_step": 189389, "epoch": 4509} {"train_loss": -7.104245662689209, "global_step": 189390, "epoch": 4509} {"train_loss": -7.210761070251465, "global_step": 189391, "epoch": 4509} {"train_loss": -7.261275291442871, "global_step": 189392, "epoch": 4509} {"train_loss": -7.103329181671143, "global_step": 189393, "epoch": 4509} {"train_loss": -7.143582344055176, "global_step": 189394, "epoch": 4509} {"train_loss": -7.235081672668457, "global_step": 189395, "epoch": 4509} {"train_loss": -7.07612419128418, "global_step": 189396, "epoch": 4509} {"train_loss": -7.125641822814941, "global_step": 189397, "epoch": 4509} {"train_loss": -7.21726131439209, "global_step": 189398, "epoch": 4509} {"train_loss": -7.154136657714844, "global_step": 189399, "epoch": 4509} {"train_loss": -7.173061847686768, "global_step": 189400, "epoch": 4509} {"train_loss": -7.117390155792236, "global_step": 189401, "epoch": 4509} {"train_loss": -7.121849060058594, "global_step": 189402, "epoch": 4509} {"train_loss": -7.236889839172363, "global_step": 189403, "epoch": 4509} {"train_loss": -7.149252414703369, "global_step": 189404, "epoch": 4509} {"train_loss": -7.180211544036865, "global_step": 189405, "epoch": 4509} {"train_loss": -7.373126029968262, "global_step": 189406, "epoch": 4509} {"train_loss": -7.211296558380127, "global_step": 189407, "epoch": 4509} {"train_loss": -7.139594078063965, "global_step": 189408, "epoch": 4509} {"train_loss": -7.147496223449707, "global_step": 189409, "epoch": 4509} {"train_loss": -7.137096405029297, "global_step": 189410, "epoch": 4509} {"train_loss": -7.129741668701172, "global_step": 189411, "epoch": 4509} {"train_loss": -7.158230781555176, "global_step": 189412, "epoch": 4509} {"train_loss": -7.259514808654785, "global_step": 189413, "epoch": 4509} {"train_loss": -7.250367641448975, "global_step": 189414, "epoch": 4509} {"train_loss": -7.188925743103027, "global_step": 189415, "epoch": 4509} {"train_loss": -7.224719047546387, "global_step": 189416, "epoch": 4509} {"train_loss": -7.1870880126953125, "global_step": 189417, "epoch": 4509} {"train_loss": -7.231091022491455, "global_step": 189418, "epoch": 4509} {"train_loss": -7.1639594577607655, "global_step": 189419, "epoch": 4509, "val_loss": 80691.828125} {"train_loss": -7.182909965515137, "global_step": 189420, "epoch": 4510} {"train_loss": -7.167852401733398, "global_step": 189421, "epoch": 4510} {"train_loss": -7.249088287353516, "global_step": 189422, "epoch": 4510} {"train_loss": -7.173580169677734, "global_step": 189423, "epoch": 4510} {"train_loss": -7.199490070343018, "global_step": 189424, "epoch": 4510} {"train_loss": -7.221092700958252, "global_step": 189425, "epoch": 4510} {"train_loss": -7.116148948669434, "global_step": 189426, "epoch": 4510} {"train_loss": -7.135422706604004, "global_step": 189427, "epoch": 4510} {"train_loss": -7.199325084686279, "global_step": 189428, "epoch": 4510} {"train_loss": -7.151327133178711, "global_step": 189429, "epoch": 4510} {"train_loss": -7.255539894104004, "global_step": 189430, "epoch": 4510} {"train_loss": -7.156050682067871, "global_step": 189431, "epoch": 4510} {"train_loss": -7.22000789642334, "global_step": 189432, "epoch": 4510} {"train_loss": -7.214423179626465, "global_step": 189433, "epoch": 4510} {"train_loss": -7.235738277435303, "global_step": 189434, "epoch": 4510} {"train_loss": -7.1109819412231445, "global_step": 189435, "epoch": 4510} {"train_loss": -7.04987096786499, "global_step": 189436, "epoch": 4510} {"train_loss": -7.085208892822266, "global_step": 189437, "epoch": 4510} {"train_loss": -7.049350738525391, "global_step": 189438, "epoch": 4510} {"train_loss": -7.188687324523926, "global_step": 189439, "epoch": 4510} {"train_loss": -7.0872650146484375, "global_step": 189440, "epoch": 4510} {"train_loss": -7.016191482543945, "global_step": 189441, "epoch": 4510} {"train_loss": -7.111379146575928, "global_step": 189442, "epoch": 4510} {"train_loss": -6.96229887008667, "global_step": 189443, "epoch": 4510} {"train_loss": -7.252283096313477, "global_step": 189444, "epoch": 4510} {"train_loss": -7.106839656829834, "global_step": 189445, "epoch": 4510} {"train_loss": -7.223381042480469, "global_step": 189446, "epoch": 4510} {"train_loss": -7.130889415740967, "global_step": 189447, "epoch": 4510} {"train_loss": -7.0068769454956055, "global_step": 189448, "epoch": 4510} {"train_loss": -7.026432991027832, "global_step": 189449, "epoch": 4510} {"train_loss": -6.988189697265625, "global_step": 189450, "epoch": 4510} {"train_loss": -7.273383140563965, "global_step": 189451, "epoch": 4510} {"train_loss": -7.064206123352051, "global_step": 189452, "epoch": 4510} {"train_loss": -7.184026718139648, "global_step": 189453, "epoch": 4510} {"train_loss": -7.096834659576416, "global_step": 189454, "epoch": 4510} {"train_loss": -7.109642505645752, "global_step": 189455, "epoch": 4510} {"train_loss": -6.978634357452393, "global_step": 189456, "epoch": 4510} {"train_loss": -7.21663761138916, "global_step": 189457, "epoch": 4510} {"train_loss": -7.155797958374023, "global_step": 189458, "epoch": 4510} {"train_loss": -7.13026237487793, "global_step": 189459, "epoch": 4510} {"train_loss": -7.183555603027344, "global_step": 189460, "epoch": 4510} {"train_loss": -7.138958965029035, "global_step": 189461, "epoch": 4510, "val_loss": 80952.015625} {"train_loss": -7.09899377822876, "global_step": 189462, "epoch": 4511} {"train_loss": -7.114108562469482, "global_step": 189463, "epoch": 4511} {"train_loss": -7.206011772155762, "global_step": 189464, "epoch": 4511} {"train_loss": -7.247576713562012, "global_step": 189465, "epoch": 4511} {"train_loss": -6.907364845275879, "global_step": 189466, "epoch": 4511} {"train_loss": -6.803661346435547, "global_step": 189467, "epoch": 4511} {"train_loss": -7.155962944030762, "global_step": 189468, "epoch": 4511} {"train_loss": -7.122238636016846, "global_step": 189469, "epoch": 4511} {"train_loss": -7.107841491699219, "global_step": 189470, "epoch": 4511} {"train_loss": -7.115871906280518, "global_step": 189471, "epoch": 4511} {"train_loss": -7.143885612487793, "global_step": 189472, "epoch": 4511} {"train_loss": -7.150992393493652, "global_step": 189473, "epoch": 4511} {"train_loss": -7.154388904571533, "global_step": 189474, "epoch": 4511} {"train_loss": -6.963926315307617, "global_step": 189475, "epoch": 4511} {"train_loss": -7.197835922241211, "global_step": 189476, "epoch": 4511} {"train_loss": -7.062253475189209, "global_step": 189477, "epoch": 4511} {"train_loss": -6.983363628387451, "global_step": 189478, "epoch": 4511} {"train_loss": -7.227892875671387, "global_step": 189479, "epoch": 4511} {"train_loss": -7.024048805236816, "global_step": 189480, "epoch": 4511} {"train_loss": -7.065370082855225, "global_step": 189481, "epoch": 4511} {"train_loss": -7.104403495788574, "global_step": 189482, "epoch": 4511} {"train_loss": -7.074605941772461, "global_step": 189483, "epoch": 4511} {"train_loss": -7.111598968505859, "global_step": 189484, "epoch": 4511} {"train_loss": -7.053064823150635, "global_step": 189485, "epoch": 4511} {"train_loss": -7.203913688659668, "global_step": 189486, "epoch": 4511} {"train_loss": -7.075352668762207, "global_step": 189487, "epoch": 4511} {"train_loss": -7.1254706382751465, "global_step": 189488, "epoch": 4511} {"train_loss": -7.184399604797363, "global_step": 189489, "epoch": 4511} {"train_loss": -7.095146179199219, "global_step": 189490, "epoch": 4511} {"train_loss": -7.121976852416992, "global_step": 189491, "epoch": 4511} {"train_loss": -7.178054332733154, "global_step": 189492, "epoch": 4511} {"train_loss": -7.167680740356445, "global_step": 189493, "epoch": 4511} {"train_loss": -7.109851837158203, "global_step": 189494, "epoch": 4511} {"train_loss": -7.107387542724609, "global_step": 189495, "epoch": 4511} {"train_loss": -7.213181018829346, "global_step": 189496, "epoch": 4511} {"train_loss": -7.114332675933838, "global_step": 189497, "epoch": 4511} {"train_loss": -7.187432289123535, "global_step": 189498, "epoch": 4511} {"train_loss": -7.11737060546875, "global_step": 189499, "epoch": 4511} {"train_loss": -7.1962056159973145, "global_step": 189500, "epoch": 4511} {"train_loss": -7.189752578735352, "global_step": 189501, "epoch": 4511} {"train_loss": -7.143214225769043, "global_step": 189502, "epoch": 4511} {"train_loss": -7.113064141500564, "global_step": 189503, "epoch": 4511, "val_loss": 80804.078125} {"train_loss": -7.264986038208008, "global_step": 189504, "epoch": 4512} {"train_loss": -7.152157783508301, "global_step": 189505, "epoch": 4512} {"train_loss": -7.2897562980651855, "global_step": 189506, "epoch": 4512} {"train_loss": -7.073013782501221, "global_step": 189507, "epoch": 4512} {"train_loss": -7.270768642425537, "global_step": 189508, "epoch": 4512} {"train_loss": -7.262503623962402, "global_step": 189509, "epoch": 4512} {"train_loss": -7.270720958709717, "global_step": 189510, "epoch": 4512} {"train_loss": -7.205459117889404, "global_step": 189511, "epoch": 4512} {"train_loss": -7.172173500061035, "global_step": 189512, "epoch": 4512} {"train_loss": -7.166902542114258, "global_step": 189513, "epoch": 4512} {"train_loss": -7.100357532501221, "global_step": 189514, "epoch": 4512} {"train_loss": -7.155529975891113, "global_step": 189515, "epoch": 4512} {"train_loss": -7.335866928100586, "global_step": 189516, "epoch": 4512} {"train_loss": -7.217336177825928, "global_step": 189517, "epoch": 4512} {"train_loss": -7.156255722045898, "global_step": 189518, "epoch": 4512} {"train_loss": -7.3137311935424805, "global_step": 189519, "epoch": 4512} {"train_loss": -7.178005218505859, "global_step": 189520, "epoch": 4512} {"train_loss": -7.240344047546387, "global_step": 189521, "epoch": 4512} {"train_loss": -7.266705513000488, "global_step": 189522, "epoch": 4512} {"train_loss": -7.199206829071045, "global_step": 189523, "epoch": 4512} {"train_loss": -7.356059551239014, "global_step": 189524, "epoch": 4512} {"train_loss": -7.301065444946289, "global_step": 189525, "epoch": 4512} {"train_loss": -7.28928804397583, "global_step": 189526, "epoch": 4512} {"train_loss": -7.206305503845215, "global_step": 189527, "epoch": 4512} {"train_loss": -7.253314971923828, "global_step": 189528, "epoch": 4512} {"train_loss": -7.307159900665283, "global_step": 189529, "epoch": 4512} {"train_loss": -7.19733190536499, "global_step": 189530, "epoch": 4512} {"train_loss": -7.180010795593262, "global_step": 189531, "epoch": 4512} {"train_loss": -7.184191703796387, "global_step": 189532, "epoch": 4512} {"train_loss": -7.166102886199951, "global_step": 189533, "epoch": 4512} {"train_loss": -7.2761945724487305, "global_step": 189534, "epoch": 4512} {"train_loss": -7.188604354858398, "global_step": 189535, "epoch": 4512} {"train_loss": -7.249689102172852, "global_step": 189536, "epoch": 4512} {"train_loss": -7.137936115264893, "global_step": 189537, "epoch": 4512} {"train_loss": -7.225533485412598, "global_step": 189538, "epoch": 4512} {"train_loss": -7.133855819702148, "global_step": 189539, "epoch": 4512} {"train_loss": -7.311007499694824, "global_step": 189540, "epoch": 4512} {"train_loss": -7.257083892822266, "global_step": 189541, "epoch": 4512} {"train_loss": -7.280923843383789, "global_step": 189542, "epoch": 4512} {"train_loss": -7.258011817932129, "global_step": 189543, "epoch": 4512} {"train_loss": -7.233175277709961, "global_step": 189544, "epoch": 4512} {"train_loss": -7.227840877714611, "global_step": 189545, "epoch": 4512, "val_loss": 80966.125} {"train_loss": -7.316946983337402, "global_step": 189546, "epoch": 4513} {"train_loss": -7.183749198913574, "global_step": 189547, "epoch": 4513} {"train_loss": -7.157803058624268, "global_step": 189548, "epoch": 4513} {"train_loss": -7.24064826965332, "global_step": 189549, "epoch": 4513} {"train_loss": -7.253620147705078, "global_step": 189550, "epoch": 4513} {"train_loss": -7.1883769035339355, "global_step": 189551, "epoch": 4513} {"train_loss": -7.082067012786865, "global_step": 189552, "epoch": 4513} {"train_loss": -7.226261138916016, "global_step": 189553, "epoch": 4513} {"train_loss": -7.189840316772461, "global_step": 189554, "epoch": 4513} {"train_loss": -7.105656623840332, "global_step": 189555, "epoch": 4513} {"train_loss": -7.034273147583008, "global_step": 189556, "epoch": 4513} {"train_loss": -6.9944868087768555, "global_step": 189557, "epoch": 4513} {"train_loss": -7.127197265625, "global_step": 189558, "epoch": 4513} {"train_loss": -6.990678787231445, "global_step": 189559, "epoch": 4513} {"train_loss": -7.018740653991699, "global_step": 189560, "epoch": 4513} {"train_loss": -7.081385612487793, "global_step": 189561, "epoch": 4513} {"train_loss": -7.013260841369629, "global_step": 189562, "epoch": 4513} {"train_loss": -7.005694389343262, "global_step": 189563, "epoch": 4513} {"train_loss": -7.110622406005859, "global_step": 189564, "epoch": 4513} {"train_loss": -7.01461935043335, "global_step": 189565, "epoch": 4513} {"train_loss": -7.164085865020752, "global_step": 189566, "epoch": 4513} {"train_loss": -7.070178031921387, "global_step": 189567, "epoch": 4513} {"train_loss": -7.212834358215332, "global_step": 189568, "epoch": 4513} {"train_loss": -7.063088893890381, "global_step": 189569, "epoch": 4513} {"train_loss": -7.073165416717529, "global_step": 189570, "epoch": 4513} {"train_loss": -7.130427360534668, "global_step": 189571, "epoch": 4513} {"train_loss": -7.112865447998047, "global_step": 189572, "epoch": 4513} {"train_loss": -7.005159854888916, "global_step": 189573, "epoch": 4513} {"train_loss": -7.125751495361328, "global_step": 189574, "epoch": 4513} {"train_loss": -6.971124172210693, "global_step": 189575, "epoch": 4513} {"train_loss": -7.117275238037109, "global_step": 189576, "epoch": 4513} {"train_loss": -7.039135456085205, "global_step": 189577, "epoch": 4513} {"train_loss": -7.131363868713379, "global_step": 189578, "epoch": 4513} {"train_loss": -7.063743591308594, "global_step": 189579, "epoch": 4513} {"train_loss": -7.176281929016113, "global_step": 189580, "epoch": 4513} {"train_loss": -6.948468208312988, "global_step": 189581, "epoch": 4513} {"train_loss": -7.073790550231934, "global_step": 189582, "epoch": 4513} {"train_loss": -7.037142753601074, "global_step": 189583, "epoch": 4513} {"train_loss": -7.041003227233887, "global_step": 189584, "epoch": 4513} {"train_loss": -7.151365280151367, "global_step": 189585, "epoch": 4513} {"train_loss": -7.036078453063965, "global_step": 189586, "epoch": 4513} {"train_loss": -7.101678621201288, "global_step": 189587, "epoch": 4513, "val_loss": 81204.9140625} {"train_loss": -7.213122367858887, "global_step": 189588, "epoch": 4514} {"train_loss": -7.07874870300293, "global_step": 189589, "epoch": 4514} {"train_loss": -7.079187393188477, "global_step": 189590, "epoch": 4514} {"train_loss": -7.0946044921875, "global_step": 189591, "epoch": 4514} {"train_loss": -7.305645942687988, "global_step": 189592, "epoch": 4514} {"train_loss": -7.099127769470215, "global_step": 189593, "epoch": 4514} {"train_loss": -7.210503578186035, "global_step": 189594, "epoch": 4514} {"train_loss": -7.271457672119141, "global_step": 189595, "epoch": 4514} {"train_loss": -7.22652530670166, "global_step": 189596, "epoch": 4514} {"train_loss": -7.187813758850098, "global_step": 189597, "epoch": 4514} {"train_loss": -7.141241073608398, "global_step": 189598, "epoch": 4514} {"train_loss": -7.2945709228515625, "global_step": 189599, "epoch": 4514} {"train_loss": -7.261861801147461, "global_step": 189600, "epoch": 4514} {"train_loss": -7.128956317901611, "global_step": 189601, "epoch": 4514} {"train_loss": -7.177164554595947, "global_step": 189602, "epoch": 4514} {"train_loss": -7.299368858337402, "global_step": 189603, "epoch": 4514} {"train_loss": -7.178430557250977, "global_step": 189604, "epoch": 4514} {"train_loss": -7.352725028991699, "global_step": 189605, "epoch": 4514} {"train_loss": -7.295231819152832, "global_step": 189606, "epoch": 4514} {"train_loss": -7.21727180480957, "global_step": 189607, "epoch": 4514} {"train_loss": -7.181349754333496, "global_step": 189608, "epoch": 4514} {"train_loss": -7.167398929595947, "global_step": 189609, "epoch": 4514} {"train_loss": -7.199045181274414, "global_step": 189610, "epoch": 4514} {"train_loss": -7.245573043823242, "global_step": 189611, "epoch": 4514} {"train_loss": -7.133520603179932, "global_step": 189612, "epoch": 4514} {"train_loss": -7.190974235534668, "global_step": 189613, "epoch": 4514} {"train_loss": -7.261268615722656, "global_step": 189614, "epoch": 4514} {"train_loss": -7.120499610900879, "global_step": 189615, "epoch": 4514} {"train_loss": -7.0868425369262695, "global_step": 189616, "epoch": 4514} {"train_loss": -7.241856575012207, "global_step": 189617, "epoch": 4514} {"train_loss": -7.073467254638672, "global_step": 189618, "epoch": 4514} {"train_loss": -7.300684452056885, "global_step": 189619, "epoch": 4514} {"train_loss": -7.007542610168457, "global_step": 189620, "epoch": 4514} {"train_loss": -7.2470927238464355, "global_step": 189621, "epoch": 4514} {"train_loss": -7.023873329162598, "global_step": 189622, "epoch": 4514} {"train_loss": -7.26578950881958, "global_step": 189623, "epoch": 4514} {"train_loss": -7.152221202850342, "global_step": 189624, "epoch": 4514} {"train_loss": -7.188302040100098, "global_step": 189625, "epoch": 4514} {"train_loss": -7.1554718017578125, "global_step": 189626, "epoch": 4514} {"train_loss": -7.143013000488281, "global_step": 189627, "epoch": 4514} {"train_loss": -7.2957916259765625, "global_step": 189628, "epoch": 4514} {"train_loss": -7.191275642031715, "global_step": 189629, "epoch": 4514, "val_loss": 80924.9921875} {"train_loss": -7.208053112030029, "global_step": 189630, "epoch": 4515} {"train_loss": -7.141031742095947, "global_step": 189631, "epoch": 4515} {"train_loss": -7.329185485839844, "global_step": 189632, "epoch": 4515} {"train_loss": -7.187475681304932, "global_step": 189633, "epoch": 4515} {"train_loss": -7.184665679931641, "global_step": 189634, "epoch": 4515} {"train_loss": -7.2196550369262695, "global_step": 189635, "epoch": 4515} {"train_loss": -7.144233703613281, "global_step": 189636, "epoch": 4515} {"train_loss": -7.160071849822998, "global_step": 189637, "epoch": 4515} {"train_loss": -7.261770248413086, "global_step": 189638, "epoch": 4515} {"train_loss": -7.16702127456665, "global_step": 189639, "epoch": 4515} {"train_loss": -7.184906959533691, "global_step": 189640, "epoch": 4515} {"train_loss": -7.080331802368164, "global_step": 189641, "epoch": 4515} {"train_loss": -7.198124885559082, "global_step": 189642, "epoch": 4515} {"train_loss": -7.152015209197998, "global_step": 189643, "epoch": 4515} {"train_loss": -7.099253177642822, "global_step": 189644, "epoch": 4515} {"train_loss": -7.152278423309326, "global_step": 189645, "epoch": 4515} {"train_loss": -7.13175106048584, "global_step": 189646, "epoch": 4515} {"train_loss": -7.215416431427002, "global_step": 189647, "epoch": 4515} {"train_loss": -7.2677459716796875, "global_step": 189648, "epoch": 4515} {"train_loss": -7.35372257232666, "global_step": 189649, "epoch": 4515} {"train_loss": -7.271363735198975, "global_step": 189650, "epoch": 4515} {"train_loss": -7.163163661956787, "global_step": 189651, "epoch": 4515} {"train_loss": -7.246068000793457, "global_step": 189652, "epoch": 4515} {"train_loss": -7.199598789215088, "global_step": 189653, "epoch": 4515} {"train_loss": -7.205816268920898, "global_step": 189654, "epoch": 4515} {"train_loss": -7.28182315826416, "global_step": 189655, "epoch": 4515} {"train_loss": -7.158977508544922, "global_step": 189656, "epoch": 4515} {"train_loss": -7.075617790222168, "global_step": 189657, "epoch": 4515} {"train_loss": -7.215788841247559, "global_step": 189658, "epoch": 4515} {"train_loss": -7.225391387939453, "global_step": 189659, "epoch": 4515} {"train_loss": -7.176907539367676, "global_step": 189660, "epoch": 4515} {"train_loss": -7.177394866943359, "global_step": 189661, "epoch": 4515} {"train_loss": -7.127354621887207, "global_step": 189662, "epoch": 4515} {"train_loss": -7.204540729522705, "global_step": 189663, "epoch": 4515} {"train_loss": -7.3409295082092285, "global_step": 189664, "epoch": 4515} {"train_loss": -7.1148576736450195, "global_step": 189665, "epoch": 4515} {"train_loss": -7.276678085327148, "global_step": 189666, "epoch": 4515} {"train_loss": -7.3236589431762695, "global_step": 189667, "epoch": 4515} {"train_loss": -7.256507873535156, "global_step": 189668, "epoch": 4515} {"train_loss": -7.098511695861816, "global_step": 189669, "epoch": 4515} {"train_loss": -7.171807765960693, "global_step": 189670, "epoch": 4515} {"train_loss": -7.19804699080331, "global_step": 189671, "epoch": 4515, "val_loss": 81189.984375} {"train_loss": -6.898534297943115, "global_step": 189672, "epoch": 4516} {"train_loss": -7.197959899902344, "global_step": 189673, "epoch": 4516} {"train_loss": -7.254733085632324, "global_step": 189674, "epoch": 4516} {"train_loss": -6.940515518188477, "global_step": 189675, "epoch": 4516} {"train_loss": -7.059581756591797, "global_step": 189676, "epoch": 4516} {"train_loss": -7.213523864746094, "global_step": 189677, "epoch": 4516} {"train_loss": -7.127001762390137, "global_step": 189678, "epoch": 4516} {"train_loss": -7.065607070922852, "global_step": 189679, "epoch": 4516} {"train_loss": -7.306134223937988, "global_step": 189680, "epoch": 4516} {"train_loss": -7.116396903991699, "global_step": 189681, "epoch": 4516} {"train_loss": -7.186210632324219, "global_step": 189682, "epoch": 4516} {"train_loss": -7.199162483215332, "global_step": 189683, "epoch": 4516} {"train_loss": -7.189852714538574, "global_step": 189684, "epoch": 4516} {"train_loss": -7.192388534545898, "global_step": 189685, "epoch": 4516} {"train_loss": -7.058108806610107, "global_step": 189686, "epoch": 4516} {"train_loss": -7.202519416809082, "global_step": 189687, "epoch": 4516} {"train_loss": -7.166262626647949, "global_step": 189688, "epoch": 4516} {"train_loss": -7.132706165313721, "global_step": 189689, "epoch": 4516} {"train_loss": -7.271327018737793, "global_step": 189690, "epoch": 4516} {"train_loss": -7.2608642578125, "global_step": 189691, "epoch": 4516} {"train_loss": -7.222206115722656, "global_step": 189692, "epoch": 4516} {"train_loss": -7.366158485412598, "global_step": 189693, "epoch": 4516} {"train_loss": -7.267546653747559, "global_step": 189694, "epoch": 4516} {"train_loss": -7.234816551208496, "global_step": 189695, "epoch": 4516} {"train_loss": -7.224316596984863, "global_step": 189696, "epoch": 4516} {"train_loss": -7.259746551513672, "global_step": 189697, "epoch": 4516} {"train_loss": -7.2592363357543945, "global_step": 189698, "epoch": 4516} {"train_loss": -7.352137565612793, "global_step": 189699, "epoch": 4516} {"train_loss": -7.232120513916016, "global_step": 189700, "epoch": 4516} {"train_loss": -7.192866325378418, "global_step": 189701, "epoch": 4516} {"train_loss": -7.357668876647949, "global_step": 189702, "epoch": 4516} {"train_loss": -7.262764930725098, "global_step": 189703, "epoch": 4516} {"train_loss": -7.222507953643799, "global_step": 189704, "epoch": 4516} {"train_loss": -7.342348098754883, "global_step": 189705, "epoch": 4516} {"train_loss": -7.208806991577148, "global_step": 189706, "epoch": 4516} {"train_loss": -7.202665328979492, "global_step": 189707, "epoch": 4516} {"train_loss": -7.286896228790283, "global_step": 189708, "epoch": 4516} {"train_loss": -7.412037372589111, "global_step": 189709, "epoch": 4516} {"train_loss": -7.069151401519775, "global_step": 189710, "epoch": 4516} {"train_loss": -7.286672592163086, "global_step": 189711, "epoch": 4516} {"train_loss": -7.147433280944824, "global_step": 189712, "epoch": 4516} {"train_loss": -7.2028054509844095, "global_step": 189713, "epoch": 4516, "val_loss": 81037.28125} {"train_loss": -7.195873260498047, "global_step": 189714, "epoch": 4517} {"train_loss": -7.332518577575684, "global_step": 189715, "epoch": 4517} {"train_loss": -7.24019718170166, "global_step": 189716, "epoch": 4517} {"train_loss": -7.189382553100586, "global_step": 189717, "epoch": 4517} {"train_loss": -7.192211627960205, "global_step": 189718, "epoch": 4517} {"train_loss": -7.068144798278809, "global_step": 189719, "epoch": 4517} {"train_loss": -7.2581024169921875, "global_step": 189720, "epoch": 4517} {"train_loss": -7.095088958740234, "global_step": 189721, "epoch": 4517} {"train_loss": -7.220038414001465, "global_step": 189722, "epoch": 4517} {"train_loss": -7.323829174041748, "global_step": 189723, "epoch": 4517} {"train_loss": -7.081984519958496, "global_step": 189724, "epoch": 4517} {"train_loss": -7.133368492126465, "global_step": 189725, "epoch": 4517} {"train_loss": -7.150412559509277, "global_step": 189726, "epoch": 4517} {"train_loss": -7.150267601013184, "global_step": 189727, "epoch": 4517} {"train_loss": -7.04200553894043, "global_step": 189728, "epoch": 4517} {"train_loss": -7.116878509521484, "global_step": 189729, "epoch": 4517} {"train_loss": -7.314153671264648, "global_step": 189730, "epoch": 4517} {"train_loss": -7.211848258972168, "global_step": 189731, "epoch": 4517} {"train_loss": -7.185710906982422, "global_step": 189732, "epoch": 4517} {"train_loss": -7.183511734008789, "global_step": 189733, "epoch": 4517} {"train_loss": -7.258853435516357, "global_step": 189734, "epoch": 4517} {"train_loss": -7.223910331726074, "global_step": 189735, "epoch": 4517} {"train_loss": -7.297597885131836, "global_step": 189736, "epoch": 4517} {"train_loss": -7.217820167541504, "global_step": 189737, "epoch": 4517} {"train_loss": -7.381709098815918, "global_step": 189738, "epoch": 4517} {"train_loss": -7.184551239013672, "global_step": 189739, "epoch": 4517} {"train_loss": -7.313255310058594, "global_step": 189740, "epoch": 4517} {"train_loss": -7.271628379821777, "global_step": 189741, "epoch": 4517} {"train_loss": -7.252098083496094, "global_step": 189742, "epoch": 4517} {"train_loss": -7.181846618652344, "global_step": 189743, "epoch": 4517} {"train_loss": -7.334360122680664, "global_step": 189744, "epoch": 4517} {"train_loss": -7.300458908081055, "global_step": 189745, "epoch": 4517} {"train_loss": -7.304391860961914, "global_step": 189746, "epoch": 4517} {"train_loss": -7.238332748413086, "global_step": 189747, "epoch": 4517} {"train_loss": -7.303836822509766, "global_step": 189748, "epoch": 4517} {"train_loss": -7.265527725219727, "global_step": 189749, "epoch": 4517} {"train_loss": -7.226794719696045, "global_step": 189750, "epoch": 4517} {"train_loss": -7.1924004554748535, "global_step": 189751, "epoch": 4517} {"train_loss": -7.215795516967773, "global_step": 189752, "epoch": 4517} {"train_loss": -7.177455902099609, "global_step": 189753, "epoch": 4517} {"train_loss": -7.32840633392334, "global_step": 189754, "epoch": 4517} {"train_loss": -7.2246526309422086, "global_step": 189755, "epoch": 4517, "val_loss": 80948.484375} {"train_loss": -7.118232727050781, "global_step": 189756, "epoch": 4518} {"train_loss": -7.117657661437988, "global_step": 189757, "epoch": 4518} {"train_loss": -7.345155239105225, "global_step": 189758, "epoch": 4518} {"train_loss": -7.069680690765381, "global_step": 189759, "epoch": 4518} {"train_loss": -7.155134201049805, "global_step": 189760, "epoch": 4518} {"train_loss": -7.382956027984619, "global_step": 189761, "epoch": 4518} {"train_loss": -7.237950325012207, "global_step": 189762, "epoch": 4518} {"train_loss": -7.257823944091797, "global_step": 189763, "epoch": 4518} {"train_loss": -7.238590240478516, "global_step": 189764, "epoch": 4518} {"train_loss": -7.288524627685547, "global_step": 189765, "epoch": 4518} {"train_loss": -7.249834060668945, "global_step": 189766, "epoch": 4518} {"train_loss": -7.271025657653809, "global_step": 189767, "epoch": 4518} {"train_loss": -7.371779441833496, "global_step": 189768, "epoch": 4518} {"train_loss": -7.278984546661377, "global_step": 189769, "epoch": 4518} {"train_loss": -7.368997573852539, "global_step": 189770, "epoch": 4518} {"train_loss": -7.246448040008545, "global_step": 189771, "epoch": 4518} {"train_loss": -7.155991554260254, "global_step": 189772, "epoch": 4518} {"train_loss": -7.288559436798096, "global_step": 189773, "epoch": 4518} {"train_loss": -7.280612945556641, "global_step": 189774, "epoch": 4518} {"train_loss": -7.303018569946289, "global_step": 189775, "epoch": 4518} {"train_loss": -7.279916763305664, "global_step": 189776, "epoch": 4518} {"train_loss": -7.263896465301514, "global_step": 189777, "epoch": 4518} {"train_loss": -7.159336090087891, "global_step": 189778, "epoch": 4518} {"train_loss": -7.392088890075684, "global_step": 189779, "epoch": 4518} {"train_loss": -7.2617950439453125, "global_step": 189780, "epoch": 4518} {"train_loss": -7.17087984085083, "global_step": 189781, "epoch": 4518} {"train_loss": -7.198753356933594, "global_step": 189782, "epoch": 4518} {"train_loss": -7.227047920227051, "global_step": 189783, "epoch": 4518} {"train_loss": -7.178735733032227, "global_step": 189784, "epoch": 4518} {"train_loss": -7.153800010681152, "global_step": 189785, "epoch": 4518} {"train_loss": -7.292189598083496, "global_step": 189786, "epoch": 4518} {"train_loss": -7.256574630737305, "global_step": 189787, "epoch": 4518} {"train_loss": -7.171600341796875, "global_step": 189788, "epoch": 4518} {"train_loss": -7.272714614868164, "global_step": 189789, "epoch": 4518} {"train_loss": -7.169939994812012, "global_step": 189790, "epoch": 4518} {"train_loss": -7.120566368103027, "global_step": 189791, "epoch": 4518} {"train_loss": -7.214201927185059, "global_step": 189792, "epoch": 4518} {"train_loss": -7.307250022888184, "global_step": 189793, "epoch": 4518} {"train_loss": -7.173471450805664, "global_step": 189794, "epoch": 4518} {"train_loss": -7.217384338378906, "global_step": 189795, "epoch": 4518} {"train_loss": -7.214021682739258, "global_step": 189796, "epoch": 4518} {"train_loss": -7.2338813827151345, "global_step": 189797, "epoch": 4518, "val_loss": 80939.921875} {"train_loss": -7.2622599601745605, "global_step": 189798, "epoch": 4519} {"train_loss": -7.266596794128418, "global_step": 189799, "epoch": 4519} {"train_loss": -7.1429123878479, "global_step": 189800, "epoch": 4519} {"train_loss": -7.206908226013184, "global_step": 189801, "epoch": 4519} {"train_loss": -7.182697296142578, "global_step": 189802, "epoch": 4519} {"train_loss": -7.2259321212768555, "global_step": 189803, "epoch": 4519} {"train_loss": -7.289419651031494, "global_step": 189804, "epoch": 4519} {"train_loss": -7.284175395965576, "global_step": 189805, "epoch": 4519} {"train_loss": -7.156607627868652, "global_step": 189806, "epoch": 4519} {"train_loss": -7.155019283294678, "global_step": 189807, "epoch": 4519} {"train_loss": -7.418642044067383, "global_step": 189808, "epoch": 4519} {"train_loss": -7.24490213394165, "global_step": 189809, "epoch": 4519} {"train_loss": -7.151151180267334, "global_step": 189810, "epoch": 4519} {"train_loss": -7.298397064208984, "global_step": 189811, "epoch": 4519} {"train_loss": -7.165226459503174, "global_step": 189812, "epoch": 4519} {"train_loss": -7.3680830001831055, "global_step": 189813, "epoch": 4519} {"train_loss": -7.372879981994629, "global_step": 189814, "epoch": 4519} {"train_loss": -7.233258247375488, "global_step": 189815, "epoch": 4519} {"train_loss": -7.338462829589844, "global_step": 189816, "epoch": 4519} {"train_loss": -7.2208428382873535, "global_step": 189817, "epoch": 4519} {"train_loss": -7.221920013427734, "global_step": 189818, "epoch": 4519} {"train_loss": -7.267120361328125, "global_step": 189819, "epoch": 4519} {"train_loss": -7.238755226135254, "global_step": 189820, "epoch": 4519} {"train_loss": -7.165566444396973, "global_step": 189821, "epoch": 4519} {"train_loss": -7.166236400604248, "global_step": 189822, "epoch": 4519} {"train_loss": -7.33779239654541, "global_step": 189823, "epoch": 4519} {"train_loss": -7.154584884643555, "global_step": 189824, "epoch": 4519} {"train_loss": -7.233394145965576, "global_step": 189825, "epoch": 4519} {"train_loss": -7.299988746643066, "global_step": 189826, "epoch": 4519} {"train_loss": -7.204224586486816, "global_step": 189827, "epoch": 4519} {"train_loss": -7.083634376525879, "global_step": 189828, "epoch": 4519} {"train_loss": -7.1046013832092285, "global_step": 189829, "epoch": 4519} {"train_loss": -7.134482383728027, "global_step": 189830, "epoch": 4519} {"train_loss": -7.295170783996582, "global_step": 189831, "epoch": 4519} {"train_loss": -7.189015865325928, "global_step": 189832, "epoch": 4519} {"train_loss": -7.305551528930664, "global_step": 189833, "epoch": 4519} {"train_loss": -7.200525760650635, "global_step": 189834, "epoch": 4519} {"train_loss": -7.204504013061523, "global_step": 189835, "epoch": 4519} {"train_loss": -7.191196918487549, "global_step": 189836, "epoch": 4519} {"train_loss": -7.164775848388672, "global_step": 189837, "epoch": 4519} {"train_loss": -7.13304328918457, "global_step": 189838, "epoch": 4519} {"train_loss": -7.227819987705776, "global_step": 189839, "epoch": 4519, "val_loss": 81026.2578125} {"train_loss": -7.209539413452148, "global_step": 189840, "epoch": 4520} {"train_loss": -7.116896629333496, "global_step": 189841, "epoch": 4520} {"train_loss": -7.277943134307861, "global_step": 189842, "epoch": 4520} {"train_loss": -7.318154811859131, "global_step": 189843, "epoch": 4520} {"train_loss": -7.1154985427856445, "global_step": 189844, "epoch": 4520} {"train_loss": -7.255152702331543, "global_step": 189845, "epoch": 4520} {"train_loss": -7.205679893493652, "global_step": 189846, "epoch": 4520} {"train_loss": -7.21788215637207, "global_step": 189847, "epoch": 4520} {"train_loss": -7.244852066040039, "global_step": 189848, "epoch": 4520} {"train_loss": -7.242232322692871, "global_step": 189849, "epoch": 4520} {"train_loss": -7.188739776611328, "global_step": 189850, "epoch": 4520} {"train_loss": -7.214882850646973, "global_step": 189851, "epoch": 4520} {"train_loss": -7.231173038482666, "global_step": 189852, "epoch": 4520} {"train_loss": -7.207162857055664, "global_step": 189853, "epoch": 4520} {"train_loss": -7.2400665283203125, "global_step": 189854, "epoch": 4520} {"train_loss": -7.228003978729248, "global_step": 189855, "epoch": 4520} {"train_loss": -7.299890518188477, "global_step": 189856, "epoch": 4520} {"train_loss": -7.170939922332764, "global_step": 189857, "epoch": 4520} {"train_loss": -7.248983383178711, "global_step": 189858, "epoch": 4520} {"train_loss": -7.258268356323242, "global_step": 189859, "epoch": 4520} {"train_loss": -7.217700958251953, "global_step": 189860, "epoch": 4520} {"train_loss": -7.314485549926758, "global_step": 189861, "epoch": 4520} {"train_loss": -7.323245048522949, "global_step": 189862, "epoch": 4520} {"train_loss": -7.231493949890137, "global_step": 189863, "epoch": 4520} {"train_loss": -7.235860824584961, "global_step": 189864, "epoch": 4520} {"train_loss": -7.294401168823242, "global_step": 189865, "epoch": 4520} {"train_loss": -7.192082405090332, "global_step": 189866, "epoch": 4520} {"train_loss": -7.237493515014648, "global_step": 189867, "epoch": 4520} {"train_loss": -7.2243547439575195, "global_step": 189868, "epoch": 4520} {"train_loss": -7.2680206298828125, "global_step": 189869, "epoch": 4520} {"train_loss": -7.264644622802734, "global_step": 189870, "epoch": 4520} {"train_loss": -7.236445426940918, "global_step": 189871, "epoch": 4520} {"train_loss": -7.248453617095947, "global_step": 189872, "epoch": 4520} {"train_loss": -7.336544990539551, "global_step": 189873, "epoch": 4520} {"train_loss": -7.333959579467773, "global_step": 189874, "epoch": 4520} {"train_loss": -7.15811824798584, "global_step": 189875, "epoch": 4520} {"train_loss": -7.249740123748779, "global_step": 189876, "epoch": 4520} {"train_loss": -7.236416816711426, "global_step": 189877, "epoch": 4520} {"train_loss": -7.314959526062012, "global_step": 189878, "epoch": 4520} {"train_loss": -7.133049488067627, "global_step": 189879, "epoch": 4520} {"train_loss": -7.2722883224487305, "global_step": 189880, "epoch": 4520} {"train_loss": -7.239400488989694, "global_step": 189881, "epoch": 4520, "val_loss": 80996.953125} {"train_loss": -7.365687370300293, "global_step": 189882, "epoch": 4521} {"train_loss": -7.242127418518066, "global_step": 189883, "epoch": 4521} {"train_loss": -7.343060493469238, "global_step": 189884, "epoch": 4521} {"train_loss": -7.223779678344727, "global_step": 189885, "epoch": 4521} {"train_loss": -7.236074924468994, "global_step": 189886, "epoch": 4521} {"train_loss": -7.253151893615723, "global_step": 189887, "epoch": 4521} {"train_loss": -7.30363130569458, "global_step": 189888, "epoch": 4521} {"train_loss": -7.27754545211792, "global_step": 189889, "epoch": 4521} {"train_loss": -7.108791351318359, "global_step": 189890, "epoch": 4521} {"train_loss": -7.12176513671875, "global_step": 189891, "epoch": 4521} {"train_loss": -7.274297714233398, "global_step": 189892, "epoch": 4521} {"train_loss": -7.185667037963867, "global_step": 189893, "epoch": 4521} {"train_loss": -7.109039306640625, "global_step": 189894, "epoch": 4521} {"train_loss": -7.168726921081543, "global_step": 189895, "epoch": 4521} {"train_loss": -7.144287109375, "global_step": 189896, "epoch": 4521} {"train_loss": -7.163059234619141, "global_step": 189897, "epoch": 4521} {"train_loss": -7.131686687469482, "global_step": 189898, "epoch": 4521} {"train_loss": -7.125836372375488, "global_step": 189899, "epoch": 4521} {"train_loss": -7.113887786865234, "global_step": 189900, "epoch": 4521} {"train_loss": -6.937542915344238, "global_step": 189901, "epoch": 4521} {"train_loss": -7.18337345123291, "global_step": 189902, "epoch": 4521} {"train_loss": -7.1821208000183105, "global_step": 189903, "epoch": 4521} {"train_loss": -7.090966701507568, "global_step": 189904, "epoch": 4521} {"train_loss": -7.120169639587402, "global_step": 189905, "epoch": 4521} {"train_loss": -7.058045387268066, "global_step": 189906, "epoch": 4521} {"train_loss": -7.070219039916992, "global_step": 189907, "epoch": 4521} {"train_loss": -7.030547618865967, "global_step": 189908, "epoch": 4521} {"train_loss": -7.262620449066162, "global_step": 189909, "epoch": 4521} {"train_loss": -6.9889140129089355, "global_step": 189910, "epoch": 4521} {"train_loss": -7.136519908905029, "global_step": 189911, "epoch": 4521} {"train_loss": -7.149294853210449, "global_step": 189912, "epoch": 4521} {"train_loss": -7.204093933105469, "global_step": 189913, "epoch": 4521} {"train_loss": -7.15565299987793, "global_step": 189914, "epoch": 4521} {"train_loss": -7.135605335235596, "global_step": 189915, "epoch": 4521} {"train_loss": -7.217230796813965, "global_step": 189916, "epoch": 4521} {"train_loss": -7.176797866821289, "global_step": 189917, "epoch": 4521} {"train_loss": -7.146592140197754, "global_step": 189918, "epoch": 4521} {"train_loss": -7.123356819152832, "global_step": 189919, "epoch": 4521} {"train_loss": -7.168972492218018, "global_step": 189920, "epoch": 4521} {"train_loss": -7.0170087814331055, "global_step": 189921, "epoch": 4521} {"train_loss": -7.192121982574463, "global_step": 189922, "epoch": 4521} {"train_loss": -7.162597667603266, "global_step": 189923, "epoch": 4521, "val_loss": 81108.7109375} {"train_loss": -7.326011657714844, "global_step": 189924, "epoch": 4522} {"train_loss": -7.186185836791992, "global_step": 189925, "epoch": 4522} {"train_loss": -7.195006370544434, "global_step": 189926, "epoch": 4522} {"train_loss": -7.192954063415527, "global_step": 189927, "epoch": 4522} {"train_loss": -7.178462982177734, "global_step": 189928, "epoch": 4522} {"train_loss": -7.212957382202148, "global_step": 189929, "epoch": 4522} {"train_loss": -7.213879585266113, "global_step": 189930, "epoch": 4522} {"train_loss": -7.211675643920898, "global_step": 189931, "epoch": 4522} {"train_loss": -7.216573715209961, "global_step": 189932, "epoch": 4522} {"train_loss": -7.235010147094727, "global_step": 189933, "epoch": 4522} {"train_loss": -7.315385341644287, "global_step": 189934, "epoch": 4522} {"train_loss": -7.210173606872559, "global_step": 189935, "epoch": 4522} {"train_loss": -7.414467811584473, "global_step": 189936, "epoch": 4522} {"train_loss": -7.207141399383545, "global_step": 189937, "epoch": 4522} {"train_loss": -7.08782958984375, "global_step": 189938, "epoch": 4522} {"train_loss": -7.312758445739746, "global_step": 189939, "epoch": 4522} {"train_loss": -7.166688919067383, "global_step": 189940, "epoch": 4522} {"train_loss": -7.2453155517578125, "global_step": 189941, "epoch": 4522} {"train_loss": -7.272009372711182, "global_step": 189942, "epoch": 4522} {"train_loss": -7.255231857299805, "global_step": 189943, "epoch": 4522} {"train_loss": -7.27449893951416, "global_step": 189944, "epoch": 4522} {"train_loss": -7.261446952819824, "global_step": 189945, "epoch": 4522} {"train_loss": -7.280602931976318, "global_step": 189946, "epoch": 4522} {"train_loss": -7.226761341094971, "global_step": 189947, "epoch": 4522} {"train_loss": -7.251246452331543, "global_step": 189948, "epoch": 4522} {"train_loss": -7.24289083480835, "global_step": 189949, "epoch": 4522} {"train_loss": -7.246084213256836, "global_step": 189950, "epoch": 4522} {"train_loss": -7.18809700012207, "global_step": 189951, "epoch": 4522} {"train_loss": -7.088691711425781, "global_step": 189952, "epoch": 4522} {"train_loss": -7.1967997550964355, "global_step": 189953, "epoch": 4522} {"train_loss": -7.261356353759766, "global_step": 189954, "epoch": 4522} {"train_loss": -7.176156997680664, "global_step": 189955, "epoch": 4522} {"train_loss": -7.1762237548828125, "global_step": 189956, "epoch": 4522} {"train_loss": -7.159560203552246, "global_step": 189957, "epoch": 4522} {"train_loss": -7.2551422119140625, "global_step": 189958, "epoch": 4522} {"train_loss": -7.222443580627441, "global_step": 189959, "epoch": 4522} {"train_loss": -7.095436096191406, "global_step": 189960, "epoch": 4522} {"train_loss": -7.214944839477539, "global_step": 189961, "epoch": 4522} {"train_loss": -7.168682098388672, "global_step": 189962, "epoch": 4522} {"train_loss": -7.14599084854126, "global_step": 189963, "epoch": 4522} {"train_loss": -7.266542911529541, "global_step": 189964, "epoch": 4522} {"train_loss": -7.219604526247297, "global_step": 189965, "epoch": 4522, "val_loss": 81112.828125} {"train_loss": -7.207162857055664, "global_step": 189966, "epoch": 4523} {"train_loss": -7.22821044921875, "global_step": 189967, "epoch": 4523} {"train_loss": -7.223699569702148, "global_step": 189968, "epoch": 4523} {"train_loss": -7.203883171081543, "global_step": 189969, "epoch": 4523} {"train_loss": -7.243189811706543, "global_step": 189970, "epoch": 4523} {"train_loss": -7.290095329284668, "global_step": 189971, "epoch": 4523} {"train_loss": -7.265140533447266, "global_step": 189972, "epoch": 4523} {"train_loss": -7.24617862701416, "global_step": 189973, "epoch": 4523} {"train_loss": -7.151556968688965, "global_step": 189974, "epoch": 4523} {"train_loss": -7.239426612854004, "global_step": 189975, "epoch": 4523} {"train_loss": -7.226872444152832, "global_step": 189976, "epoch": 4523} {"train_loss": -7.155559539794922, "global_step": 189977, "epoch": 4523} {"train_loss": -7.261132717132568, "global_step": 189978, "epoch": 4523} {"train_loss": -7.172915458679199, "global_step": 189979, "epoch": 4523} {"train_loss": -7.191446781158447, "global_step": 189980, "epoch": 4523} {"train_loss": -7.2275285720825195, "global_step": 189981, "epoch": 4523} {"train_loss": -7.276338577270508, "global_step": 189982, "epoch": 4523} {"train_loss": -7.195006370544434, "global_step": 189983, "epoch": 4523} {"train_loss": -7.12168025970459, "global_step": 189984, "epoch": 4523} {"train_loss": -7.2431440353393555, "global_step": 189985, "epoch": 4523} {"train_loss": -7.291555881500244, "global_step": 189986, "epoch": 4523} {"train_loss": -7.308652877807617, "global_step": 189987, "epoch": 4523} {"train_loss": -7.084375381469727, "global_step": 189988, "epoch": 4523} {"train_loss": -7.153910160064697, "global_step": 189989, "epoch": 4523} {"train_loss": -7.25642204284668, "global_step": 189990, "epoch": 4523} {"train_loss": -7.16755485534668, "global_step": 189991, "epoch": 4523} {"train_loss": -7.422357082366943, "global_step": 189992, "epoch": 4523} {"train_loss": -7.203474521636963, "global_step": 189993, "epoch": 4523} {"train_loss": -7.326653480529785, "global_step": 189994, "epoch": 4523} {"train_loss": -7.31741189956665, "global_step": 189995, "epoch": 4523} {"train_loss": -7.139976978302002, "global_step": 189996, "epoch": 4523} {"train_loss": -7.238101959228516, "global_step": 189997, "epoch": 4523} {"train_loss": -7.299694538116455, "global_step": 189998, "epoch": 4523} {"train_loss": -7.279608726501465, "global_step": 189999, "epoch": 4523} {"train_loss": -7.210885047912598, "global_step": 190000, "epoch": 4523} {"train_loss": -7.312664031982422, "global_step": 190001, "epoch": 4523} {"train_loss": -7.246356964111328, "global_step": 190002, "epoch": 4523} {"train_loss": -7.265854835510254, "global_step": 190003, "epoch": 4523} {"train_loss": -7.312080383300781, "global_step": 190004, "epoch": 4523} {"train_loss": -7.274096488952637, "global_step": 190005, "epoch": 4523} {"train_loss": -7.226604461669922, "global_step": 190006, "epoch": 4523} {"train_loss": -7.236325536455427, "global_step": 190007, "epoch": 4523, "val_loss": 80958.5078125} {"train_loss": -7.218366622924805, "global_step": 190008, "epoch": 4524} {"train_loss": -7.186090469360352, "global_step": 190009, "epoch": 4524} {"train_loss": -7.213841438293457, "global_step": 190010, "epoch": 4524} {"train_loss": -7.2580742835998535, "global_step": 190011, "epoch": 4524} {"train_loss": -7.253231048583984, "global_step": 190012, "epoch": 4524} {"train_loss": -7.3075666427612305, "global_step": 190013, "epoch": 4524} {"train_loss": -7.320944786071777, "global_step": 190014, "epoch": 4524} {"train_loss": -7.333578586578369, "global_step": 190015, "epoch": 4524} {"train_loss": -7.304986000061035, "global_step": 190016, "epoch": 4524} {"train_loss": -7.404421806335449, "global_step": 190017, "epoch": 4524} {"train_loss": -7.204349040985107, "global_step": 190018, "epoch": 4524} {"train_loss": -7.24326229095459, "global_step": 190019, "epoch": 4524} {"train_loss": -7.252897262573242, "global_step": 190020, "epoch": 4524} {"train_loss": -7.175388813018799, "global_step": 190021, "epoch": 4524} {"train_loss": -7.253426551818848, "global_step": 190022, "epoch": 4524} {"train_loss": -7.193423271179199, "global_step": 190023, "epoch": 4524} {"train_loss": -7.348415851593018, "global_step": 190024, "epoch": 4524} {"train_loss": -7.235594272613525, "global_step": 190025, "epoch": 4524} {"train_loss": -7.349887847900391, "global_step": 190026, "epoch": 4524} {"train_loss": -7.24024772644043, "global_step": 190027, "epoch": 4524} {"train_loss": -7.104670524597168, "global_step": 190028, "epoch": 4524} {"train_loss": -7.310481071472168, "global_step": 190029, "epoch": 4524} {"train_loss": -7.199872016906738, "global_step": 190030, "epoch": 4524} {"train_loss": -7.304245948791504, "global_step": 190031, "epoch": 4524} {"train_loss": -7.125998020172119, "global_step": 190032, "epoch": 4524} {"train_loss": -7.320652008056641, "global_step": 190033, "epoch": 4524} {"train_loss": -7.195810317993164, "global_step": 190034, "epoch": 4524} {"train_loss": -7.258729934692383, "global_step": 190035, "epoch": 4524} {"train_loss": -7.183005332946777, "global_step": 190036, "epoch": 4524} {"train_loss": -7.23500919342041, "global_step": 190037, "epoch": 4524} {"train_loss": -7.194341659545898, "global_step": 190038, "epoch": 4524} {"train_loss": -7.230309009552002, "global_step": 190039, "epoch": 4524} {"train_loss": -7.322266578674316, "global_step": 190040, "epoch": 4524} {"train_loss": -7.156736373901367, "global_step": 190041, "epoch": 4524} {"train_loss": -7.176231384277344, "global_step": 190042, "epoch": 4524} {"train_loss": -7.352422714233398, "global_step": 190043, "epoch": 4524} {"train_loss": -7.179405212402344, "global_step": 190044, "epoch": 4524} {"train_loss": -7.294428825378418, "global_step": 190045, "epoch": 4524} {"train_loss": -7.205644130706787, "global_step": 190046, "epoch": 4524} {"train_loss": -7.152965545654297, "global_step": 190047, "epoch": 4524} {"train_loss": -7.243634223937988, "global_step": 190048, "epoch": 4524} {"train_loss": -7.244586842400687, "global_step": 190049, "epoch": 4524, "val_loss": 80849.6796875} {"train_loss": -7.175364971160889, "global_step": 190050, "epoch": 4525} {"train_loss": -7.251169681549072, "global_step": 190051, "epoch": 4525} {"train_loss": -7.315934181213379, "global_step": 190052, "epoch": 4525} {"train_loss": -7.14042854309082, "global_step": 190053, "epoch": 4525} {"train_loss": -7.12178897857666, "global_step": 190054, "epoch": 4525} {"train_loss": -7.263175010681152, "global_step": 190055, "epoch": 4525} {"train_loss": -6.987394332885742, "global_step": 190056, "epoch": 4525} {"train_loss": -7.090862274169922, "global_step": 190057, "epoch": 4525} {"train_loss": -7.125982284545898, "global_step": 190058, "epoch": 4525} {"train_loss": -7.050122261047363, "global_step": 190059, "epoch": 4525} {"train_loss": -7.182389736175537, "global_step": 190060, "epoch": 4525} {"train_loss": -7.068650245666504, "global_step": 190061, "epoch": 4525} {"train_loss": -7.013946533203125, "global_step": 190062, "epoch": 4525} {"train_loss": -7.168416976928711, "global_step": 190063, "epoch": 4525} {"train_loss": -7.1293721199035645, "global_step": 190064, "epoch": 4525} {"train_loss": -7.03336238861084, "global_step": 190065, "epoch": 4525} {"train_loss": -7.17311954498291, "global_step": 190066, "epoch": 4525} {"train_loss": -7.179417610168457, "global_step": 190067, "epoch": 4525} {"train_loss": -7.180977821350098, "global_step": 190068, "epoch": 4525} {"train_loss": -7.204873561859131, "global_step": 190069, "epoch": 4525} {"train_loss": -7.190381050109863, "global_step": 190070, "epoch": 4525} {"train_loss": -7.243666648864746, "global_step": 190071, "epoch": 4525} {"train_loss": -7.151165962219238, "global_step": 190072, "epoch": 4525} {"train_loss": -7.1643595695495605, "global_step": 190073, "epoch": 4525} {"train_loss": -7.24778938293457, "global_step": 190074, "epoch": 4525} {"train_loss": -7.145961761474609, "global_step": 190075, "epoch": 4525} {"train_loss": -7.147336483001709, "global_step": 190076, "epoch": 4525} {"train_loss": -7.203502655029297, "global_step": 190077, "epoch": 4525} {"train_loss": -7.207374572753906, "global_step": 190078, "epoch": 4525} {"train_loss": -7.246284008026123, "global_step": 190079, "epoch": 4525} {"train_loss": -7.015664577484131, "global_step": 190080, "epoch": 4525} {"train_loss": -7.249096870422363, "global_step": 190081, "epoch": 4525} {"train_loss": -7.163465976715088, "global_step": 190082, "epoch": 4525} {"train_loss": -7.184046745300293, "global_step": 190083, "epoch": 4525} {"train_loss": -7.1483635902404785, "global_step": 190084, "epoch": 4525} {"train_loss": -7.29443359375, "global_step": 190085, "epoch": 4525} {"train_loss": -7.1988725662231445, "global_step": 190086, "epoch": 4525} {"train_loss": -7.156745910644531, "global_step": 190087, "epoch": 4525} {"train_loss": -7.09849214553833, "global_step": 190088, "epoch": 4525} {"train_loss": -7.095015525817871, "global_step": 190089, "epoch": 4525} {"train_loss": -7.133670806884766, "global_step": 190090, "epoch": 4525} {"train_loss": -7.154404549371629, "global_step": 190091, "epoch": 4525, "val_loss": 80742.8515625} {"train_loss": -7.131721019744873, "global_step": 190092, "epoch": 4526} {"train_loss": -6.983150482177734, "global_step": 190093, "epoch": 4526} {"train_loss": -7.164862632751465, "global_step": 190094, "epoch": 4526} {"train_loss": -7.060027122497559, "global_step": 190095, "epoch": 4526} {"train_loss": -7.0714430809021, "global_step": 190096, "epoch": 4526} {"train_loss": -7.1809401512146, "global_step": 190097, "epoch": 4526} {"train_loss": -7.083313941955566, "global_step": 190098, "epoch": 4526} {"train_loss": -7.146235466003418, "global_step": 190099, "epoch": 4526} {"train_loss": -7.079317092895508, "global_step": 190100, "epoch": 4526} {"train_loss": -6.973446846008301, "global_step": 190101, "epoch": 4526} {"train_loss": -7.101691246032715, "global_step": 190102, "epoch": 4526} {"train_loss": -7.094296455383301, "global_step": 190103, "epoch": 4526} {"train_loss": -7.088134765625, "global_step": 190104, "epoch": 4526} {"train_loss": -7.1240129470825195, "global_step": 190105, "epoch": 4526} {"train_loss": -7.221930980682373, "global_step": 190106, "epoch": 4526} {"train_loss": -7.169817924499512, "global_step": 190107, "epoch": 4526} {"train_loss": -7.2996649742126465, "global_step": 190108, "epoch": 4526} {"train_loss": -7.253813743591309, "global_step": 190109, "epoch": 4526} {"train_loss": -7.235926151275635, "global_step": 190110, "epoch": 4526} {"train_loss": -7.169262409210205, "global_step": 190111, "epoch": 4526} {"train_loss": -7.2943525314331055, "global_step": 190112, "epoch": 4526} {"train_loss": -7.1816487312316895, "global_step": 190113, "epoch": 4526} {"train_loss": -7.238282203674316, "global_step": 190114, "epoch": 4526} {"train_loss": -7.190769195556641, "global_step": 190115, "epoch": 4526} {"train_loss": -7.233666896820068, "global_step": 190116, "epoch": 4526} {"train_loss": -7.177676677703857, "global_step": 190117, "epoch": 4526} {"train_loss": -7.21458625793457, "global_step": 190118, "epoch": 4526} {"train_loss": -7.137547016143799, "global_step": 190119, "epoch": 4526} {"train_loss": -7.147663116455078, "global_step": 190120, "epoch": 4526} {"train_loss": -7.216885566711426, "global_step": 190121, "epoch": 4526} {"train_loss": -7.297783851623535, "global_step": 190122, "epoch": 4526} {"train_loss": -7.170866012573242, "global_step": 190123, "epoch": 4526} {"train_loss": -7.251811981201172, "global_step": 190124, "epoch": 4526} {"train_loss": -7.281390190124512, "global_step": 190125, "epoch": 4526} {"train_loss": -7.352220058441162, "global_step": 190126, "epoch": 4526} {"train_loss": -7.147704124450684, "global_step": 190127, "epoch": 4526} {"train_loss": -7.234166145324707, "global_step": 190128, "epoch": 4526} {"train_loss": -7.252636432647705, "global_step": 190129, "epoch": 4526} {"train_loss": -7.194568634033203, "global_step": 190130, "epoch": 4526} {"train_loss": -7.169345855712891, "global_step": 190131, "epoch": 4526} {"train_loss": -7.232414722442627, "global_step": 190132, "epoch": 4526} {"train_loss": -7.178063415345692, "global_step": 190133, "epoch": 4526, "val_loss": 80904.2421875} {"train_loss": -7.362200736999512, "global_step": 190134, "epoch": 4527} {"train_loss": -7.173563003540039, "global_step": 190135, "epoch": 4527} {"train_loss": -7.308999061584473, "global_step": 190136, "epoch": 4527} {"train_loss": -7.169217109680176, "global_step": 190137, "epoch": 4527} {"train_loss": -7.168038845062256, "global_step": 190138, "epoch": 4527} {"train_loss": -7.1545610427856445, "global_step": 190139, "epoch": 4527} {"train_loss": -7.198601245880127, "global_step": 190140, "epoch": 4527} {"train_loss": -7.193734645843506, "global_step": 190141, "epoch": 4527} {"train_loss": -7.204848766326904, "global_step": 190142, "epoch": 4527} {"train_loss": -7.268450736999512, "global_step": 190143, "epoch": 4527} {"train_loss": -7.157758712768555, "global_step": 190144, "epoch": 4527} {"train_loss": -7.301155090332031, "global_step": 190145, "epoch": 4527} {"train_loss": -7.341809272766113, "global_step": 190146, "epoch": 4527} {"train_loss": -7.224941730499268, "global_step": 190147, "epoch": 4527} {"train_loss": -7.247195720672607, "global_step": 190148, "epoch": 4527} {"train_loss": -7.229557991027832, "global_step": 190149, "epoch": 4527} {"train_loss": -7.26096773147583, "global_step": 190150, "epoch": 4527} {"train_loss": -7.2349138259887695, "global_step": 190151, "epoch": 4527} {"train_loss": -7.2345685958862305, "global_step": 190152, "epoch": 4527} {"train_loss": -7.287522315979004, "global_step": 190153, "epoch": 4527} {"train_loss": -7.346804618835449, "global_step": 190154, "epoch": 4527} {"train_loss": -7.271284580230713, "global_step": 190155, "epoch": 4527} {"train_loss": -7.185147762298584, "global_step": 190156, "epoch": 4527} {"train_loss": -7.330673694610596, "global_step": 190157, "epoch": 4527} {"train_loss": -7.34696102142334, "global_step": 190158, "epoch": 4527} {"train_loss": -7.291094779968262, "global_step": 190159, "epoch": 4527} {"train_loss": -7.311427116394043, "global_step": 190160, "epoch": 4527} {"train_loss": -7.191980361938477, "global_step": 190161, "epoch": 4527} {"train_loss": -7.262171745300293, "global_step": 190162, "epoch": 4527} {"train_loss": -7.132821083068848, "global_step": 190163, "epoch": 4527} {"train_loss": -7.170938491821289, "global_step": 190164, "epoch": 4527} {"train_loss": -7.089931964874268, "global_step": 190165, "epoch": 4527} {"train_loss": -7.321065425872803, "global_step": 190166, "epoch": 4527} {"train_loss": -7.2479047775268555, "global_step": 190167, "epoch": 4527} {"train_loss": -7.258581161499023, "global_step": 190168, "epoch": 4527} {"train_loss": -7.295971870422363, "global_step": 190169, "epoch": 4527} {"train_loss": -7.33641242980957, "global_step": 190170, "epoch": 4527} {"train_loss": -7.264133453369141, "global_step": 190171, "epoch": 4527} {"train_loss": -7.167158126831055, "global_step": 190172, "epoch": 4527} {"train_loss": -7.272971153259277, "global_step": 190173, "epoch": 4527} {"train_loss": -7.237451553344727, "global_step": 190174, "epoch": 4527} {"train_loss": -7.2443208921523325, "global_step": 190175, "epoch": 4527, "val_loss": 81088.921875} {"train_loss": -7.2111663818359375, "global_step": 190176, "epoch": 4528} {"train_loss": -7.32033109664917, "global_step": 190177, "epoch": 4528} {"train_loss": -7.1572465896606445, "global_step": 190178, "epoch": 4528} {"train_loss": -7.212131500244141, "global_step": 190179, "epoch": 4528} {"train_loss": -7.25136661529541, "global_step": 190180, "epoch": 4528} {"train_loss": -7.259848594665527, "global_step": 190181, "epoch": 4528} {"train_loss": -7.269015312194824, "global_step": 190182, "epoch": 4528} {"train_loss": -7.283274173736572, "global_step": 190183, "epoch": 4528} {"train_loss": -7.207137584686279, "global_step": 190184, "epoch": 4528} {"train_loss": -7.284052848815918, "global_step": 190185, "epoch": 4528} {"train_loss": -7.289865493774414, "global_step": 190186, "epoch": 4528} {"train_loss": -7.198946952819824, "global_step": 190187, "epoch": 4528} {"train_loss": -7.2351531982421875, "global_step": 190188, "epoch": 4528} {"train_loss": -7.265608787536621, "global_step": 190189, "epoch": 4528} {"train_loss": -7.236878871917725, "global_step": 190190, "epoch": 4528} {"train_loss": -7.260530471801758, "global_step": 190191, "epoch": 4528} {"train_loss": -7.237098693847656, "global_step": 190192, "epoch": 4528} {"train_loss": -7.206658363342285, "global_step": 190193, "epoch": 4528} {"train_loss": -7.278304576873779, "global_step": 190194, "epoch": 4528} {"train_loss": -7.194461822509766, "global_step": 190195, "epoch": 4528} {"train_loss": -7.074013710021973, "global_step": 190196, "epoch": 4528} {"train_loss": -7.192787170410156, "global_step": 190197, "epoch": 4528} {"train_loss": -7.237678527832031, "global_step": 190198, "epoch": 4528} {"train_loss": -7.031556606292725, "global_step": 190199, "epoch": 4528} {"train_loss": -7.248354434967041, "global_step": 190200, "epoch": 4528} {"train_loss": -7.193799018859863, "global_step": 190201, "epoch": 4528} {"train_loss": -7.209184169769287, "global_step": 190202, "epoch": 4528} {"train_loss": -7.245471000671387, "global_step": 190203, "epoch": 4528} {"train_loss": -7.028799533843994, "global_step": 190204, "epoch": 4528} {"train_loss": -7.262944221496582, "global_step": 190205, "epoch": 4528} {"train_loss": -7.284734725952148, "global_step": 190206, "epoch": 4528} {"train_loss": -7.021728515625, "global_step": 190207, "epoch": 4528} {"train_loss": -7.187281608581543, "global_step": 190208, "epoch": 4528} {"train_loss": -7.178013801574707, "global_step": 190209, "epoch": 4528} {"train_loss": -7.291043281555176, "global_step": 190210, "epoch": 4528} {"train_loss": -7.157151222229004, "global_step": 190211, "epoch": 4528} {"train_loss": -7.130054473876953, "global_step": 190212, "epoch": 4528} {"train_loss": -7.11241340637207, "global_step": 190213, "epoch": 4528} {"train_loss": -7.10257625579834, "global_step": 190214, "epoch": 4528} {"train_loss": -7.235467910766602, "global_step": 190215, "epoch": 4528} {"train_loss": -7.173923492431641, "global_step": 190216, "epoch": 4528} {"train_loss": -7.205960126150222, "global_step": 190217, "epoch": 4528, "val_loss": 80817.7890625} {"train_loss": -7.295421600341797, "global_step": 190218, "epoch": 4529} {"train_loss": -7.121774196624756, "global_step": 190219, "epoch": 4529} {"train_loss": -7.158290863037109, "global_step": 190220, "epoch": 4529} {"train_loss": -7.135679244995117, "global_step": 190221, "epoch": 4529} {"train_loss": -7.176020622253418, "global_step": 190222, "epoch": 4529} {"train_loss": -7.211082458496094, "global_step": 190223, "epoch": 4529} {"train_loss": -7.138642311096191, "global_step": 190224, "epoch": 4529} {"train_loss": -7.066920280456543, "global_step": 190225, "epoch": 4529} {"train_loss": -7.134238243103027, "global_step": 190226, "epoch": 4529} {"train_loss": -7.207937717437744, "global_step": 190227, "epoch": 4529} {"train_loss": -6.825545310974121, "global_step": 190228, "epoch": 4529} {"train_loss": -7.027299880981445, "global_step": 190229, "epoch": 4529} {"train_loss": -7.074151992797852, "global_step": 190230, "epoch": 4529} {"train_loss": -7.082274436950684, "global_step": 190231, "epoch": 4529} {"train_loss": -7.125280857086182, "global_step": 190232, "epoch": 4529} {"train_loss": -7.032422065734863, "global_step": 190233, "epoch": 4529} {"train_loss": -7.13705587387085, "global_step": 190234, "epoch": 4529} {"train_loss": -7.091220855712891, "global_step": 190235, "epoch": 4529} {"train_loss": -7.111341953277588, "global_step": 190236, "epoch": 4529} {"train_loss": -7.076789855957031, "global_step": 190237, "epoch": 4529} {"train_loss": -7.1444091796875, "global_step": 190238, "epoch": 4529} {"train_loss": -7.024935722351074, "global_step": 190239, "epoch": 4529} {"train_loss": -7.207512855529785, "global_step": 190240, "epoch": 4529} {"train_loss": -7.028275489807129, "global_step": 190241, "epoch": 4529} {"train_loss": -7.160199165344238, "global_step": 190242, "epoch": 4529} {"train_loss": -7.042657375335693, "global_step": 190243, "epoch": 4529} {"train_loss": -7.169373512268066, "global_step": 190244, "epoch": 4529} {"train_loss": -7.121461391448975, "global_step": 190245, "epoch": 4529} {"train_loss": -7.024236679077148, "global_step": 190246, "epoch": 4529} {"train_loss": -7.125279903411865, "global_step": 190247, "epoch": 4529} {"train_loss": -7.057381629943848, "global_step": 190248, "epoch": 4529} {"train_loss": -7.1340532302856445, "global_step": 190249, "epoch": 4529} {"train_loss": -7.076325416564941, "global_step": 190250, "epoch": 4529} {"train_loss": -7.187912940979004, "global_step": 190251, "epoch": 4529} {"train_loss": -7.078563690185547, "global_step": 190252, "epoch": 4529} {"train_loss": -7.117944240570068, "global_step": 190253, "epoch": 4529} {"train_loss": -7.006549835205078, "global_step": 190254, "epoch": 4529} {"train_loss": -7.075312614440918, "global_step": 190255, "epoch": 4529} {"train_loss": -7.058402061462402, "global_step": 190256, "epoch": 4529} {"train_loss": -7.185290336608887, "global_step": 190257, "epoch": 4529} {"train_loss": -7.129535675048828, "global_step": 190258, "epoch": 4529} {"train_loss": -7.108523187183199, "global_step": 190259, "epoch": 4529, "val_loss": 81067.1640625} {"train_loss": -7.194312572479248, "global_step": 190260, "epoch": 4530} {"train_loss": -7.063076019287109, "global_step": 190261, "epoch": 4530} {"train_loss": -7.292247772216797, "global_step": 190262, "epoch": 4530} {"train_loss": -7.11197566986084, "global_step": 190263, "epoch": 4530} {"train_loss": -7.0794477462768555, "global_step": 190264, "epoch": 4530} {"train_loss": -7.1057305335998535, "global_step": 190265, "epoch": 4530} {"train_loss": -7.194916725158691, "global_step": 190266, "epoch": 4530} {"train_loss": -7.165701866149902, "global_step": 190267, "epoch": 4530} {"train_loss": -7.103603363037109, "global_step": 190268, "epoch": 4530} {"train_loss": -7.081713676452637, "global_step": 190269, "epoch": 4530} {"train_loss": -7.235064506530762, "global_step": 190270, "epoch": 4530} {"train_loss": -7.107639312744141, "global_step": 190271, "epoch": 4530} {"train_loss": -7.308692932128906, "global_step": 190272, "epoch": 4530} {"train_loss": -7.148013114929199, "global_step": 190273, "epoch": 4530} {"train_loss": -7.203033447265625, "global_step": 190274, "epoch": 4530} {"train_loss": -7.101868629455566, "global_step": 190275, "epoch": 4530} {"train_loss": -7.2848711013793945, "global_step": 190276, "epoch": 4530} {"train_loss": -7.020377159118652, "global_step": 190277, "epoch": 4530} {"train_loss": -7.027063369750977, "global_step": 190278, "epoch": 4530} {"train_loss": -7.176851749420166, "global_step": 190279, "epoch": 4530} {"train_loss": -7.208239555358887, "global_step": 190280, "epoch": 4530} {"train_loss": -7.152921676635742, "global_step": 190281, "epoch": 4530} {"train_loss": -7.1419677734375, "global_step": 190282, "epoch": 4530} {"train_loss": -7.058708190917969, "global_step": 190283, "epoch": 4530} {"train_loss": -7.128827095031738, "global_step": 190284, "epoch": 4530} {"train_loss": -7.2389020919799805, "global_step": 190285, "epoch": 4530} {"train_loss": -7.225937843322754, "global_step": 190286, "epoch": 4530} {"train_loss": -7.164466857910156, "global_step": 190287, "epoch": 4530} {"train_loss": -7.20249080657959, "global_step": 190288, "epoch": 4530} {"train_loss": -7.207716941833496, "global_step": 190289, "epoch": 4530} {"train_loss": -7.123737335205078, "global_step": 190290, "epoch": 4530} {"train_loss": -7.196192741394043, "global_step": 190291, "epoch": 4530} {"train_loss": -7.132526397705078, "global_step": 190292, "epoch": 4530} {"train_loss": -7.259646415710449, "global_step": 190293, "epoch": 4530} {"train_loss": -7.177840232849121, "global_step": 190294, "epoch": 4530} {"train_loss": -7.213801383972168, "global_step": 190295, "epoch": 4530} {"train_loss": -7.296169281005859, "global_step": 190296, "epoch": 4530} {"train_loss": -7.212099552154541, "global_step": 190297, "epoch": 4530} {"train_loss": -7.222932815551758, "global_step": 190298, "epoch": 4530} {"train_loss": -7.136721134185791, "global_step": 190299, "epoch": 4530} {"train_loss": -7.257840633392334, "global_step": 190300, "epoch": 4530} {"train_loss": -7.1684223129635765, "global_step": 190301, "epoch": 4530, "val_loss": 81079.6953125} {"train_loss": -7.259674072265625, "global_step": 190302, "epoch": 4531} {"train_loss": -7.308297634124756, "global_step": 190303, "epoch": 4531} {"train_loss": -7.290339469909668, "global_step": 190304, "epoch": 4531} {"train_loss": -7.180638313293457, "global_step": 190305, "epoch": 4531} {"train_loss": -7.308643817901611, "global_step": 190306, "epoch": 4531} {"train_loss": -7.225929260253906, "global_step": 190307, "epoch": 4531} {"train_loss": -7.229346752166748, "global_step": 190308, "epoch": 4531} {"train_loss": -7.280368804931641, "global_step": 190309, "epoch": 4531} {"train_loss": -7.1677141189575195, "global_step": 190310, "epoch": 4531} {"train_loss": -7.169872283935547, "global_step": 190311, "epoch": 4531} {"train_loss": -7.184535503387451, "global_step": 190312, "epoch": 4531} {"train_loss": -7.278852939605713, "global_step": 190313, "epoch": 4531} {"train_loss": -7.2702836990356445, "global_step": 190314, "epoch": 4531} {"train_loss": -7.367042541503906, "global_step": 190315, "epoch": 4531} {"train_loss": -7.211954116821289, "global_step": 190316, "epoch": 4531} {"train_loss": -7.244907379150391, "global_step": 190317, "epoch": 4531} {"train_loss": -7.320786952972412, "global_step": 190318, "epoch": 4531} {"train_loss": -7.175807476043701, "global_step": 190319, "epoch": 4531} {"train_loss": -7.136653900146484, "global_step": 190320, "epoch": 4531} {"train_loss": -7.282087326049805, "global_step": 190321, "epoch": 4531} {"train_loss": -7.269923686981201, "global_step": 190322, "epoch": 4531} {"train_loss": -7.103151321411133, "global_step": 190323, "epoch": 4531} {"train_loss": -7.1922688484191895, "global_step": 190324, "epoch": 4531} {"train_loss": -7.238461017608643, "global_step": 190325, "epoch": 4531} {"train_loss": -7.314950942993164, "global_step": 190326, "epoch": 4531} {"train_loss": -7.375903606414795, "global_step": 190327, "epoch": 4531} {"train_loss": -7.255071640014648, "global_step": 190328, "epoch": 4531} {"train_loss": -7.181816101074219, "global_step": 190329, "epoch": 4531} {"train_loss": -7.321581840515137, "global_step": 190330, "epoch": 4531} {"train_loss": -7.1649274826049805, "global_step": 190331, "epoch": 4531} {"train_loss": -7.365670204162598, "global_step": 190332, "epoch": 4531} {"train_loss": -7.327426433563232, "global_step": 190333, "epoch": 4531} {"train_loss": -7.096653938293457, "global_step": 190334, "epoch": 4531} {"train_loss": -7.209061622619629, "global_step": 190335, "epoch": 4531} {"train_loss": -7.117328643798828, "global_step": 190336, "epoch": 4531} {"train_loss": -7.196183681488037, "global_step": 190337, "epoch": 4531} {"train_loss": -7.3087873458862305, "global_step": 190338, "epoch": 4531} {"train_loss": -7.179711818695068, "global_step": 190339, "epoch": 4531} {"train_loss": -7.140316009521484, "global_step": 190340, "epoch": 4531} {"train_loss": -7.169658184051514, "global_step": 190341, "epoch": 4531} {"train_loss": -7.140969276428223, "global_step": 190342, "epoch": 4531} {"train_loss": -7.230771655128116, "global_step": 190343, "epoch": 4531, "val_loss": 80801.9140625} {"train_loss": -7.198424339294434, "global_step": 190344, "epoch": 4532} {"train_loss": -7.132627487182617, "global_step": 190345, "epoch": 4532} {"train_loss": -7.269935607910156, "global_step": 190346, "epoch": 4532} {"train_loss": -7.046843528747559, "global_step": 190347, "epoch": 4532} {"train_loss": -7.206031799316406, "global_step": 190348, "epoch": 4532} {"train_loss": -7.252992630004883, "global_step": 190349, "epoch": 4532} {"train_loss": -7.185891151428223, "global_step": 190350, "epoch": 4532} {"train_loss": -7.170843124389648, "global_step": 190351, "epoch": 4532} {"train_loss": -7.128504753112793, "global_step": 190352, "epoch": 4532} {"train_loss": -7.286890983581543, "global_step": 190353, "epoch": 4532} {"train_loss": -7.288558006286621, "global_step": 190354, "epoch": 4532} {"train_loss": -7.022572994232178, "global_step": 190355, "epoch": 4532} {"train_loss": -7.216324329376221, "global_step": 190356, "epoch": 4532} {"train_loss": -7.18928337097168, "global_step": 190357, "epoch": 4532} {"train_loss": -7.189937591552734, "global_step": 190358, "epoch": 4532} {"train_loss": -7.242868423461914, "global_step": 190359, "epoch": 4532} {"train_loss": -7.2561492919921875, "global_step": 190360, "epoch": 4532} {"train_loss": -7.231070518493652, "global_step": 190361, "epoch": 4532} {"train_loss": -7.165129661560059, "global_step": 190362, "epoch": 4532} {"train_loss": -7.210714340209961, "global_step": 190363, "epoch": 4532} {"train_loss": -7.241701126098633, "global_step": 190364, "epoch": 4532} {"train_loss": -7.011479377746582, "global_step": 190365, "epoch": 4532} {"train_loss": -7.155487060546875, "global_step": 190366, "epoch": 4532} {"train_loss": -7.206297874450684, "global_step": 190367, "epoch": 4532} {"train_loss": -7.220460891723633, "global_step": 190368, "epoch": 4532} {"train_loss": -7.273507118225098, "global_step": 190369, "epoch": 4532} {"train_loss": -7.169577121734619, "global_step": 190370, "epoch": 4532} {"train_loss": -7.252774238586426, "global_step": 190371, "epoch": 4532} {"train_loss": -7.243136405944824, "global_step": 190372, "epoch": 4532} {"train_loss": -7.212703704833984, "global_step": 190373, "epoch": 4532} {"train_loss": -7.186862468719482, "global_step": 190374, "epoch": 4532} {"train_loss": -7.230063438415527, "global_step": 190375, "epoch": 4532} {"train_loss": -7.172928810119629, "global_step": 190376, "epoch": 4532} {"train_loss": -7.212740421295166, "global_step": 190377, "epoch": 4532} {"train_loss": -7.249005317687988, "global_step": 190378, "epoch": 4532} {"train_loss": -7.206489562988281, "global_step": 190379, "epoch": 4532} {"train_loss": -7.262209892272949, "global_step": 190380, "epoch": 4532} {"train_loss": -7.229629039764404, "global_step": 190381, "epoch": 4532} {"train_loss": -7.225542068481445, "global_step": 190382, "epoch": 4532} {"train_loss": -7.214590549468994, "global_step": 190383, "epoch": 4532} {"train_loss": -7.043381214141846, "global_step": 190384, "epoch": 4532} {"train_loss": -7.198597431182861, "global_step": 190385, "epoch": 4532, "val_loss": 80884.4375} {"train_loss": -7.059506416320801, "global_step": 190386, "epoch": 4533} {"train_loss": -7.204106330871582, "global_step": 190387, "epoch": 4533} {"train_loss": -7.2537994384765625, "global_step": 190388, "epoch": 4533} {"train_loss": -7.291210651397705, "global_step": 190389, "epoch": 4533} {"train_loss": -7.231574058532715, "global_step": 190390, "epoch": 4533} {"train_loss": -7.109007835388184, "global_step": 190391, "epoch": 4533} {"train_loss": -7.224344253540039, "global_step": 190392, "epoch": 4533} {"train_loss": -7.334054946899414, "global_step": 190393, "epoch": 4533} {"train_loss": -7.298535346984863, "global_step": 190394, "epoch": 4533} {"train_loss": -7.28127384185791, "global_step": 190395, "epoch": 4533} {"train_loss": -7.291059494018555, "global_step": 190396, "epoch": 4533} {"train_loss": -7.300346374511719, "global_step": 190397, "epoch": 4533} {"train_loss": -7.356939315795898, "global_step": 190398, "epoch": 4533} {"train_loss": -7.323351860046387, "global_step": 190399, "epoch": 4533} {"train_loss": -7.284066200256348, "global_step": 190400, "epoch": 4533} {"train_loss": -7.207723140716553, "global_step": 190401, "epoch": 4533} {"train_loss": -7.235241889953613, "global_step": 190402, "epoch": 4533} {"train_loss": -7.263847827911377, "global_step": 190403, "epoch": 4533} {"train_loss": -7.159934043884277, "global_step": 190404, "epoch": 4533} {"train_loss": -7.21311092376709, "global_step": 190405, "epoch": 4533} {"train_loss": -7.299996376037598, "global_step": 190406, "epoch": 4533} {"train_loss": -7.245363235473633, "global_step": 190407, "epoch": 4533} {"train_loss": -7.24568510055542, "global_step": 190408, "epoch": 4533} {"train_loss": -7.25380802154541, "global_step": 190409, "epoch": 4533} {"train_loss": -7.151027679443359, "global_step": 190410, "epoch": 4533} {"train_loss": -7.11937141418457, "global_step": 190411, "epoch": 4533} {"train_loss": -7.350240707397461, "global_step": 190412, "epoch": 4533} {"train_loss": -7.2160468101501465, "global_step": 190413, "epoch": 4533} {"train_loss": -7.2178754806518555, "global_step": 190414, "epoch": 4533} {"train_loss": -7.212759017944336, "global_step": 190415, "epoch": 4533} {"train_loss": -7.226473808288574, "global_step": 190416, "epoch": 4533} {"train_loss": -7.203705787658691, "global_step": 190417, "epoch": 4533} {"train_loss": -7.231197357177734, "global_step": 190418, "epoch": 4533} {"train_loss": -7.205065727233887, "global_step": 190419, "epoch": 4533} {"train_loss": -7.117802619934082, "global_step": 190420, "epoch": 4533} {"train_loss": -7.116156101226807, "global_step": 190421, "epoch": 4533} {"train_loss": -7.016049385070801, "global_step": 190422, "epoch": 4533} {"train_loss": -7.2938232421875, "global_step": 190423, "epoch": 4533} {"train_loss": -7.2659711837768555, "global_step": 190424, "epoch": 4533} {"train_loss": -7.219425201416016, "global_step": 190425, "epoch": 4533} {"train_loss": -7.257512092590332, "global_step": 190426, "epoch": 4533} {"train_loss": -7.227574961526053, "global_step": 190427, "epoch": 4533, "val_loss": 80946.90625} {"train_loss": -7.231507301330566, "global_step": 190428, "epoch": 4534} {"train_loss": -7.24716854095459, "global_step": 190429, "epoch": 4534} {"train_loss": -7.17673397064209, "global_step": 190430, "epoch": 4534} {"train_loss": -7.247107982635498, "global_step": 190431, "epoch": 4534} {"train_loss": -7.2899980545043945, "global_step": 190432, "epoch": 4534} {"train_loss": -7.23570442199707, "global_step": 190433, "epoch": 4534} {"train_loss": -7.189281463623047, "global_step": 190434, "epoch": 4534} {"train_loss": -7.210284233093262, "global_step": 190435, "epoch": 4534} {"train_loss": -7.206042289733887, "global_step": 190436, "epoch": 4534} {"train_loss": -7.332430839538574, "global_step": 190437, "epoch": 4534} {"train_loss": -7.196831703186035, "global_step": 190438, "epoch": 4534} {"train_loss": -7.036369800567627, "global_step": 190439, "epoch": 4534} {"train_loss": -7.291204929351807, "global_step": 190440, "epoch": 4534} {"train_loss": -7.087149620056152, "global_step": 190441, "epoch": 4534} {"train_loss": -7.1006760597229, "global_step": 190442, "epoch": 4534} {"train_loss": -7.211069107055664, "global_step": 190443, "epoch": 4534} {"train_loss": -7.143171787261963, "global_step": 190444, "epoch": 4534} {"train_loss": -7.01992130279541, "global_step": 190445, "epoch": 4534} {"train_loss": -7.139009952545166, "global_step": 190446, "epoch": 4534} {"train_loss": -7.222438812255859, "global_step": 190447, "epoch": 4534} {"train_loss": -7.102747917175293, "global_step": 190448, "epoch": 4534} {"train_loss": -7.211867332458496, "global_step": 190449, "epoch": 4534} {"train_loss": -7.212364196777344, "global_step": 190450, "epoch": 4534} {"train_loss": -7.281023979187012, "global_step": 190451, "epoch": 4534} {"train_loss": -7.194818019866943, "global_step": 190452, "epoch": 4534} {"train_loss": -7.149116039276123, "global_step": 190453, "epoch": 4534} {"train_loss": -7.104874610900879, "global_step": 190454, "epoch": 4534} {"train_loss": -7.160346031188965, "global_step": 190455, "epoch": 4534} {"train_loss": -7.118060111999512, "global_step": 190456, "epoch": 4534} {"train_loss": -7.160481929779053, "global_step": 190457, "epoch": 4534} {"train_loss": -7.113869667053223, "global_step": 190458, "epoch": 4534} {"train_loss": -7.156282424926758, "global_step": 190459, "epoch": 4534} {"train_loss": -7.346933841705322, "global_step": 190460, "epoch": 4534} {"train_loss": -7.2726263999938965, "global_step": 190461, "epoch": 4534} {"train_loss": -7.260440826416016, "global_step": 190462, "epoch": 4534} {"train_loss": -7.203115463256836, "global_step": 190463, "epoch": 4534} {"train_loss": -7.162374973297119, "global_step": 190464, "epoch": 4534} {"train_loss": -7.171485900878906, "global_step": 190465, "epoch": 4534} {"train_loss": -7.243166923522949, "global_step": 190466, "epoch": 4534} {"train_loss": -7.1724677085876465, "global_step": 190467, "epoch": 4534} {"train_loss": -7.300717353820801, "global_step": 190468, "epoch": 4534} {"train_loss": -7.1945105620792935, "global_step": 190469, "epoch": 4534, "val_loss": 81156.984375} {"train_loss": -7.084709167480469, "global_step": 190470, "epoch": 4535} {"train_loss": -7.396821975708008, "global_step": 190471, "epoch": 4535} {"train_loss": -7.27680778503418, "global_step": 190472, "epoch": 4535} {"train_loss": -7.113760948181152, "global_step": 190473, "epoch": 4535} {"train_loss": -7.140660762786865, "global_step": 190474, "epoch": 4535} {"train_loss": -7.252593994140625, "global_step": 190475, "epoch": 4535} {"train_loss": -7.1116132736206055, "global_step": 190476, "epoch": 4535} {"train_loss": -7.308550834655762, "global_step": 190477, "epoch": 4535} {"train_loss": -7.012266635894775, "global_step": 190478, "epoch": 4535} {"train_loss": -7.186799049377441, "global_step": 190479, "epoch": 4535} {"train_loss": -7.23306941986084, "global_step": 190480, "epoch": 4535} {"train_loss": -7.147111892700195, "global_step": 190481, "epoch": 4535} {"train_loss": -7.273816108703613, "global_step": 190482, "epoch": 4535} {"train_loss": -7.225149154663086, "global_step": 190483, "epoch": 4535} {"train_loss": -7.263543605804443, "global_step": 190484, "epoch": 4535} {"train_loss": -7.073087692260742, "global_step": 190485, "epoch": 4535} {"train_loss": -7.387975692749023, "global_step": 190486, "epoch": 4535} {"train_loss": -7.1527252197265625, "global_step": 190487, "epoch": 4535} {"train_loss": -7.2022294998168945, "global_step": 190488, "epoch": 4535} {"train_loss": -7.202886581420898, "global_step": 190489, "epoch": 4535} {"train_loss": -7.1295576095581055, "global_step": 190490, "epoch": 4535} {"train_loss": -7.169441223144531, "global_step": 190491, "epoch": 4535} {"train_loss": -7.284948348999023, "global_step": 190492, "epoch": 4535} {"train_loss": -7.004150867462158, "global_step": 190493, "epoch": 4535} {"train_loss": -7.163600444793701, "global_step": 190494, "epoch": 4535} {"train_loss": -7.1318464279174805, "global_step": 190495, "epoch": 4535} {"train_loss": -7.145607948303223, "global_step": 190496, "epoch": 4535} {"train_loss": -7.0739946365356445, "global_step": 190497, "epoch": 4535} {"train_loss": -7.2431864738464355, "global_step": 190498, "epoch": 4535} {"train_loss": -7.195040225982666, "global_step": 190499, "epoch": 4535} {"train_loss": -7.073246002197266, "global_step": 190500, "epoch": 4535} {"train_loss": -7.270998001098633, "global_step": 190501, "epoch": 4535} {"train_loss": -7.276204586029053, "global_step": 190502, "epoch": 4535} {"train_loss": -7.247920036315918, "global_step": 190503, "epoch": 4535} {"train_loss": -7.117170810699463, "global_step": 190504, "epoch": 4535} {"train_loss": -7.173183441162109, "global_step": 190505, "epoch": 4535} {"train_loss": -7.284275054931641, "global_step": 190506, "epoch": 4535} {"train_loss": -7.2115020751953125, "global_step": 190507, "epoch": 4535} {"train_loss": -7.043229103088379, "global_step": 190508, "epoch": 4535} {"train_loss": -7.095728874206543, "global_step": 190509, "epoch": 4535} {"train_loss": -7.244647979736328, "global_step": 190510, "epoch": 4535} {"train_loss": -7.1876561641693115, "global_step": 190511, "epoch": 4535, "val_loss": 81056.390625} {"train_loss": -7.201602458953857, "global_step": 190512, "epoch": 4536} {"train_loss": -7.241105079650879, "global_step": 190513, "epoch": 4536} {"train_loss": -7.228727340698242, "global_step": 190514, "epoch": 4536} {"train_loss": -7.222487449645996, "global_step": 190515, "epoch": 4536} {"train_loss": -7.172586917877197, "global_step": 190516, "epoch": 4536} {"train_loss": -7.184390544891357, "global_step": 190517, "epoch": 4536} {"train_loss": -7.303123474121094, "global_step": 190518, "epoch": 4536} {"train_loss": -7.2924933433532715, "global_step": 190519, "epoch": 4536} {"train_loss": -7.277588844299316, "global_step": 190520, "epoch": 4536} {"train_loss": -7.255875587463379, "global_step": 190521, "epoch": 4536} {"train_loss": -7.233320236206055, "global_step": 190522, "epoch": 4536} {"train_loss": -7.144836902618408, "global_step": 190523, "epoch": 4536} {"train_loss": -7.222288131713867, "global_step": 190524, "epoch": 4536} {"train_loss": -7.221887111663818, "global_step": 190525, "epoch": 4536} {"train_loss": -7.266425609588623, "global_step": 190526, "epoch": 4536} {"train_loss": -7.242910385131836, "global_step": 190527, "epoch": 4536} {"train_loss": -7.171372890472412, "global_step": 190528, "epoch": 4536} {"train_loss": -7.197805404663086, "global_step": 190529, "epoch": 4536} {"train_loss": -7.237244606018066, "global_step": 190530, "epoch": 4536} {"train_loss": -7.132805347442627, "global_step": 190531, "epoch": 4536} {"train_loss": -7.212175369262695, "global_step": 190532, "epoch": 4536} {"train_loss": -7.2989091873168945, "global_step": 190533, "epoch": 4536} {"train_loss": -7.140438079833984, "global_step": 190534, "epoch": 4536} {"train_loss": -7.351266860961914, "global_step": 190535, "epoch": 4536} {"train_loss": -7.215181350708008, "global_step": 190536, "epoch": 4536} {"train_loss": -7.336845397949219, "global_step": 190537, "epoch": 4536} {"train_loss": -7.204658508300781, "global_step": 190538, "epoch": 4536} {"train_loss": -7.2989115715026855, "global_step": 190539, "epoch": 4536} {"train_loss": -7.155423164367676, "global_step": 190540, "epoch": 4536} {"train_loss": -7.1675825119018555, "global_step": 190541, "epoch": 4536} {"train_loss": -7.2363362312316895, "global_step": 190542, "epoch": 4536} {"train_loss": -7.277370452880859, "global_step": 190543, "epoch": 4536} {"train_loss": -7.210158824920654, "global_step": 190544, "epoch": 4536} {"train_loss": -7.197081565856934, "global_step": 190545, "epoch": 4536} {"train_loss": -7.384614944458008, "global_step": 190546, "epoch": 4536} {"train_loss": -7.1408796310424805, "global_step": 190547, "epoch": 4536} {"train_loss": -7.231179237365723, "global_step": 190548, "epoch": 4536} {"train_loss": -7.2225799560546875, "global_step": 190549, "epoch": 4536} {"train_loss": -7.208524703979492, "global_step": 190550, "epoch": 4536} {"train_loss": -7.1419878005981445, "global_step": 190551, "epoch": 4536} {"train_loss": -7.205005168914795, "global_step": 190552, "epoch": 4536} {"train_loss": -7.226289340427944, "global_step": 190553, "epoch": 4536, "val_loss": 81252.4375} {"train_loss": -7.20271635055542, "global_step": 190554, "epoch": 4537} {"train_loss": -7.25962495803833, "global_step": 190555, "epoch": 4537} {"train_loss": -7.196516036987305, "global_step": 190556, "epoch": 4537} {"train_loss": -7.271735191345215, "global_step": 190557, "epoch": 4537} {"train_loss": -7.111660957336426, "global_step": 190558, "epoch": 4537} {"train_loss": -7.229875564575195, "global_step": 190559, "epoch": 4537} {"train_loss": -7.160076141357422, "global_step": 190560, "epoch": 4537} {"train_loss": -7.18892240524292, "global_step": 190561, "epoch": 4537} {"train_loss": -7.244251251220703, "global_step": 190562, "epoch": 4537} {"train_loss": -7.2726593017578125, "global_step": 190563, "epoch": 4537} {"train_loss": -7.116008758544922, "global_step": 190564, "epoch": 4537} {"train_loss": -7.319729804992676, "global_step": 190565, "epoch": 4537} {"train_loss": -6.988753318786621, "global_step": 190566, "epoch": 4537} {"train_loss": -7.217714786529541, "global_step": 190567, "epoch": 4537} {"train_loss": -7.217076301574707, "global_step": 190568, "epoch": 4537} {"train_loss": -7.221668720245361, "global_step": 190569, "epoch": 4537} {"train_loss": -7.253183841705322, "global_step": 190570, "epoch": 4537} {"train_loss": -7.2609758377075195, "global_step": 190571, "epoch": 4537} {"train_loss": -7.197109222412109, "global_step": 190572, "epoch": 4537} {"train_loss": -7.2233099937438965, "global_step": 190573, "epoch": 4537} {"train_loss": -7.269970893859863, "global_step": 190574, "epoch": 4537} {"train_loss": -7.223657608032227, "global_step": 190575, "epoch": 4537} {"train_loss": -7.309868812561035, "global_step": 190576, "epoch": 4537} {"train_loss": -7.310667514801025, "global_step": 190577, "epoch": 4537} {"train_loss": -7.220802307128906, "global_step": 190578, "epoch": 4537} {"train_loss": -7.246438026428223, "global_step": 190579, "epoch": 4537} {"train_loss": -7.250834941864014, "global_step": 190580, "epoch": 4537} {"train_loss": -7.2557268142700195, "global_step": 190581, "epoch": 4537} {"train_loss": -7.280790328979492, "global_step": 190582, "epoch": 4537} {"train_loss": -7.149280548095703, "global_step": 190583, "epoch": 4537} {"train_loss": -7.225063323974609, "global_step": 190584, "epoch": 4537} {"train_loss": -7.317254066467285, "global_step": 190585, "epoch": 4537} {"train_loss": -7.260647773742676, "global_step": 190586, "epoch": 4537} {"train_loss": -7.274198532104492, "global_step": 190587, "epoch": 4537} {"train_loss": -7.25523567199707, "global_step": 190588, "epoch": 4537} {"train_loss": -7.295533657073975, "global_step": 190589, "epoch": 4537} {"train_loss": -7.295144081115723, "global_step": 190590, "epoch": 4537} {"train_loss": -7.3349833488464355, "global_step": 190591, "epoch": 4537} {"train_loss": -7.39867639541626, "global_step": 190592, "epoch": 4537} {"train_loss": -7.296253204345703, "global_step": 190593, "epoch": 4537} {"train_loss": -7.053784370422363, "global_step": 190594, "epoch": 4537} {"train_loss": -7.238373597462972, "global_step": 190595, "epoch": 4537, "val_loss": 81074.671875} {"train_loss": -7.3082427978515625, "global_step": 190596, "epoch": 4538} {"train_loss": -7.3777594566345215, "global_step": 190597, "epoch": 4538} {"train_loss": -7.252725601196289, "global_step": 190598, "epoch": 4538} {"train_loss": -7.238707065582275, "global_step": 190599, "epoch": 4538} {"train_loss": -7.269387722015381, "global_step": 190600, "epoch": 4538} {"train_loss": -7.229434967041016, "global_step": 190601, "epoch": 4538} {"train_loss": -7.205539703369141, "global_step": 190602, "epoch": 4538} {"train_loss": -7.16546630859375, "global_step": 190603, "epoch": 4538} {"train_loss": -7.169760704040527, "global_step": 190604, "epoch": 4538} {"train_loss": -7.231685161590576, "global_step": 190605, "epoch": 4538} {"train_loss": -7.241117477416992, "global_step": 190606, "epoch": 4538} {"train_loss": -7.299181938171387, "global_step": 190607, "epoch": 4538} {"train_loss": -7.233295440673828, "global_step": 190608, "epoch": 4538} {"train_loss": -7.2645263671875, "global_step": 190609, "epoch": 4538} {"train_loss": -7.244851112365723, "global_step": 190610, "epoch": 4538} {"train_loss": -7.2655744552612305, "global_step": 190611, "epoch": 4538} {"train_loss": -7.095990180969238, "global_step": 190612, "epoch": 4538} {"train_loss": -7.248856544494629, "global_step": 190613, "epoch": 4538} {"train_loss": -7.103725433349609, "global_step": 190614, "epoch": 4538} {"train_loss": -7.1895904541015625, "global_step": 190615, "epoch": 4538} {"train_loss": -7.216155052185059, "global_step": 190616, "epoch": 4538} {"train_loss": -7.288187503814697, "global_step": 190617, "epoch": 4538} {"train_loss": -7.24803352355957, "global_step": 190618, "epoch": 4538} {"train_loss": -7.405263423919678, "global_step": 190619, "epoch": 4538} {"train_loss": -7.356046676635742, "global_step": 190620, "epoch": 4538} {"train_loss": -7.23859977722168, "global_step": 190621, "epoch": 4538} {"train_loss": -7.284567832946777, "global_step": 190622, "epoch": 4538} {"train_loss": -7.211574554443359, "global_step": 190623, "epoch": 4538} {"train_loss": -7.202475070953369, "global_step": 190624, "epoch": 4538} {"train_loss": -7.27152156829834, "global_step": 190625, "epoch": 4538} {"train_loss": -7.3058319091796875, "global_step": 190626, "epoch": 4538} {"train_loss": -7.263241291046143, "global_step": 190627, "epoch": 4538} {"train_loss": -7.363290786743164, "global_step": 190628, "epoch": 4538} {"train_loss": -7.2443928718566895, "global_step": 190629, "epoch": 4538} {"train_loss": -7.318782806396484, "global_step": 190630, "epoch": 4538} {"train_loss": -7.312460899353027, "global_step": 190631, "epoch": 4538} {"train_loss": -7.246289253234863, "global_step": 190632, "epoch": 4538} {"train_loss": -7.229139804840088, "global_step": 190633, "epoch": 4538} {"train_loss": -7.292366981506348, "global_step": 190634, "epoch": 4538} {"train_loss": -7.2096428871154785, "global_step": 190635, "epoch": 4538} {"train_loss": -7.208284854888916, "global_step": 190636, "epoch": 4538} {"train_loss": -7.252732254209972, "global_step": 190637, "epoch": 4538, "val_loss": 80914.46875} {"train_loss": -7.255119323730469, "global_step": 190638, "epoch": 4539} {"train_loss": -7.2716779708862305, "global_step": 190639, "epoch": 4539} {"train_loss": -7.18087911605835, "global_step": 190640, "epoch": 4539} {"train_loss": -7.231639862060547, "global_step": 190641, "epoch": 4539} {"train_loss": -7.192134380340576, "global_step": 190642, "epoch": 4539} {"train_loss": -7.133139610290527, "global_step": 190643, "epoch": 4539} {"train_loss": -7.283829689025879, "global_step": 190644, "epoch": 4539} {"train_loss": -7.296477317810059, "global_step": 190645, "epoch": 4539} {"train_loss": -7.203413963317871, "global_step": 190646, "epoch": 4539} {"train_loss": -7.2226243019104, "global_step": 190647, "epoch": 4539} {"train_loss": -7.166920185089111, "global_step": 190648, "epoch": 4539} {"train_loss": -7.2159624099731445, "global_step": 190649, "epoch": 4539} {"train_loss": -7.143202304840088, "global_step": 190650, "epoch": 4539} {"train_loss": -7.217707633972168, "global_step": 190651, "epoch": 4539} {"train_loss": -7.238187313079834, "global_step": 190652, "epoch": 4539} {"train_loss": -7.240256309509277, "global_step": 190653, "epoch": 4539} {"train_loss": -7.2424468994140625, "global_step": 190654, "epoch": 4539} {"train_loss": -7.199765205383301, "global_step": 190655, "epoch": 4539} {"train_loss": -7.332727432250977, "global_step": 190656, "epoch": 4539} {"train_loss": -7.207147121429443, "global_step": 190657, "epoch": 4539} {"train_loss": -7.280343055725098, "global_step": 190658, "epoch": 4539} {"train_loss": -7.299283027648926, "global_step": 190659, "epoch": 4539} {"train_loss": -7.235133171081543, "global_step": 190660, "epoch": 4539} {"train_loss": -7.232048034667969, "global_step": 190661, "epoch": 4539} {"train_loss": -7.284820079803467, "global_step": 190662, "epoch": 4539} {"train_loss": -7.289250373840332, "global_step": 190663, "epoch": 4539} {"train_loss": -7.357667922973633, "global_step": 190664, "epoch": 4539} {"train_loss": -7.269436836242676, "global_step": 190665, "epoch": 4539} {"train_loss": -7.183694839477539, "global_step": 190666, "epoch": 4539} {"train_loss": -7.371558666229248, "global_step": 190667, "epoch": 4539} {"train_loss": -7.239640235900879, "global_step": 190668, "epoch": 4539} {"train_loss": -7.353774547576904, "global_step": 190669, "epoch": 4539} {"train_loss": -7.29026985168457, "global_step": 190670, "epoch": 4539} {"train_loss": -7.3241868019104, "global_step": 190671, "epoch": 4539} {"train_loss": -7.164616584777832, "global_step": 190672, "epoch": 4539} {"train_loss": -7.2528839111328125, "global_step": 190673, "epoch": 4539} {"train_loss": -7.271456241607666, "global_step": 190674, "epoch": 4539} {"train_loss": -7.318558692932129, "global_step": 190675, "epoch": 4539} {"train_loss": -7.298556327819824, "global_step": 190676, "epoch": 4539} {"train_loss": -7.162937641143799, "global_step": 190677, "epoch": 4539} {"train_loss": -7.134449005126953, "global_step": 190678, "epoch": 4539} {"train_loss": -7.248649722053891, "global_step": 190679, "epoch": 4539, "val_loss": 81037.515625} {"train_loss": -7.264667510986328, "global_step": 190680, "epoch": 4540} {"train_loss": -7.306278705596924, "global_step": 190681, "epoch": 4540} {"train_loss": -7.341331481933594, "global_step": 190682, "epoch": 4540} {"train_loss": -7.257369041442871, "global_step": 190683, "epoch": 4540} {"train_loss": -7.358554840087891, "global_step": 190684, "epoch": 4540} {"train_loss": -7.270796298980713, "global_step": 190685, "epoch": 4540} {"train_loss": -7.217967987060547, "global_step": 190686, "epoch": 4540} {"train_loss": -7.274672508239746, "global_step": 190687, "epoch": 4540} {"train_loss": -7.360589027404785, "global_step": 190688, "epoch": 4540} {"train_loss": -7.280091285705566, "global_step": 190689, "epoch": 4540} {"train_loss": -7.2929558753967285, "global_step": 190690, "epoch": 4540} {"train_loss": -7.370361328125, "global_step": 190691, "epoch": 4540} {"train_loss": -7.249446392059326, "global_step": 190692, "epoch": 4540} {"train_loss": -7.290218353271484, "global_step": 190693, "epoch": 4540} {"train_loss": -7.337331771850586, "global_step": 190694, "epoch": 4540} {"train_loss": -7.244051933288574, "global_step": 190695, "epoch": 4540} {"train_loss": -7.426893711090088, "global_step": 190696, "epoch": 4540} {"train_loss": -7.325222969055176, "global_step": 190697, "epoch": 4540} {"train_loss": -7.186332702636719, "global_step": 190698, "epoch": 4540} {"train_loss": -7.248639106750488, "global_step": 190699, "epoch": 4540} {"train_loss": -7.2784857749938965, "global_step": 190700, "epoch": 4540} {"train_loss": -7.334271430969238, "global_step": 190701, "epoch": 4540} {"train_loss": -7.214417934417725, "global_step": 190702, "epoch": 4540} {"train_loss": -7.310894012451172, "global_step": 190703, "epoch": 4540} {"train_loss": -7.289858818054199, "global_step": 190704, "epoch": 4540} {"train_loss": -7.289260387420654, "global_step": 190705, "epoch": 4540} {"train_loss": -7.177809238433838, "global_step": 190706, "epoch": 4540} {"train_loss": -7.3165459632873535, "global_step": 190707, "epoch": 4540} {"train_loss": -7.380803108215332, "global_step": 190708, "epoch": 4540} {"train_loss": -7.2076826095581055, "global_step": 190709, "epoch": 4540} {"train_loss": -7.340951919555664, "global_step": 190710, "epoch": 4540} {"train_loss": -7.29078483581543, "global_step": 190711, "epoch": 4540} {"train_loss": -7.3604326248168945, "global_step": 190712, "epoch": 4540} {"train_loss": -7.3256988525390625, "global_step": 190713, "epoch": 4540} {"train_loss": -7.337296485900879, "global_step": 190714, "epoch": 4540} {"train_loss": -7.343687057495117, "global_step": 190715, "epoch": 4540} {"train_loss": -7.263113021850586, "global_step": 190716, "epoch": 4540} {"train_loss": -7.210315704345703, "global_step": 190717, "epoch": 4540} {"train_loss": -7.080977916717529, "global_step": 190718, "epoch": 4540} {"train_loss": -7.1581597328186035, "global_step": 190719, "epoch": 4540} {"train_loss": -7.271340847015381, "global_step": 190720, "epoch": 4540} {"train_loss": -7.284077281043643, "global_step": 190721, "epoch": 4540, "val_loss": 80907.8671875} {"train_loss": -7.024324417114258, "global_step": 190722, "epoch": 4541} {"train_loss": -7.2325663566589355, "global_step": 190723, "epoch": 4541} {"train_loss": -7.194020748138428, "global_step": 190724, "epoch": 4541} {"train_loss": -6.887376308441162, "global_step": 190725, "epoch": 4541} {"train_loss": -7.139430999755859, "global_step": 190726, "epoch": 4541} {"train_loss": -7.081414222717285, "global_step": 190727, "epoch": 4541} {"train_loss": -6.972509384155273, "global_step": 190728, "epoch": 4541} {"train_loss": -7.204626560211182, "global_step": 190729, "epoch": 4541} {"train_loss": -7.099903106689453, "global_step": 190730, "epoch": 4541} {"train_loss": -7.188024520874023, "global_step": 190731, "epoch": 4541} {"train_loss": -7.112796783447266, "global_step": 190732, "epoch": 4541} {"train_loss": -7.209987640380859, "global_step": 190733, "epoch": 4541} {"train_loss": -7.160161972045898, "global_step": 190734, "epoch": 4541} {"train_loss": -7.055356979370117, "global_step": 190735, "epoch": 4541} {"train_loss": -7.076148986816406, "global_step": 190736, "epoch": 4541} {"train_loss": -7.182929039001465, "global_step": 190737, "epoch": 4541} {"train_loss": -7.173339366912842, "global_step": 190738, "epoch": 4541} {"train_loss": -7.108726501464844, "global_step": 190739, "epoch": 4541} {"train_loss": -7.196481227874756, "global_step": 190740, "epoch": 4541} {"train_loss": -6.992772102355957, "global_step": 190741, "epoch": 4541} {"train_loss": -7.131748676300049, "global_step": 190742, "epoch": 4541} {"train_loss": -7.1885223388671875, "global_step": 190743, "epoch": 4541} {"train_loss": -7.034595966339111, "global_step": 190744, "epoch": 4541} {"train_loss": -7.075985908508301, "global_step": 190745, "epoch": 4541} {"train_loss": -7.226600646972656, "global_step": 190746, "epoch": 4541} {"train_loss": -7.147629261016846, "global_step": 190747, "epoch": 4541} {"train_loss": -7.134624481201172, "global_step": 190748, "epoch": 4541} {"train_loss": -7.080038070678711, "global_step": 190749, "epoch": 4541} {"train_loss": -7.214758396148682, "global_step": 190750, "epoch": 4541} {"train_loss": -7.301315784454346, "global_step": 190751, "epoch": 4541} {"train_loss": -7.1608991622924805, "global_step": 190752, "epoch": 4541} {"train_loss": -7.139266014099121, "global_step": 190753, "epoch": 4541} {"train_loss": -7.092142105102539, "global_step": 190754, "epoch": 4541} {"train_loss": -7.134444713592529, "global_step": 190755, "epoch": 4541} {"train_loss": -7.305956840515137, "global_step": 190756, "epoch": 4541} {"train_loss": -7.137508869171143, "global_step": 190757, "epoch": 4541} {"train_loss": -7.295100212097168, "global_step": 190758, "epoch": 4541} {"train_loss": -7.186820983886719, "global_step": 190759, "epoch": 4541} {"train_loss": -7.170889377593994, "global_step": 190760, "epoch": 4541} {"train_loss": -7.1912126541137695, "global_step": 190761, "epoch": 4541} {"train_loss": -7.145296096801758, "global_step": 190762, "epoch": 4541} {"train_loss": -7.140775192351568, "global_step": 190763, "epoch": 4541, "val_loss": 80952.5859375} {"train_loss": -7.263998031616211, "global_step": 190764, "epoch": 4542} {"train_loss": -7.204278945922852, "global_step": 190765, "epoch": 4542} {"train_loss": -7.197237014770508, "global_step": 190766, "epoch": 4542} {"train_loss": -7.104901313781738, "global_step": 190767, "epoch": 4542} {"train_loss": -7.175893783569336, "global_step": 190768, "epoch": 4542} {"train_loss": -7.1491289138793945, "global_step": 190769, "epoch": 4542} {"train_loss": -7.027864456176758, "global_step": 190770, "epoch": 4542} {"train_loss": -7.171166896820068, "global_step": 190771, "epoch": 4542} {"train_loss": -7.185507297515869, "global_step": 190772, "epoch": 4542} {"train_loss": -7.065468788146973, "global_step": 190773, "epoch": 4542} {"train_loss": -7.287042617797852, "global_step": 190774, "epoch": 4542} {"train_loss": -7.159276008605957, "global_step": 190775, "epoch": 4542} {"train_loss": -7.0471391677856445, "global_step": 190776, "epoch": 4542} {"train_loss": -7.250692367553711, "global_step": 190777, "epoch": 4542} {"train_loss": -7.213513374328613, "global_step": 190778, "epoch": 4542} {"train_loss": -7.122170448303223, "global_step": 190779, "epoch": 4542} {"train_loss": -7.1335039138793945, "global_step": 190780, "epoch": 4542} {"train_loss": -7.213252544403076, "global_step": 190781, "epoch": 4542} {"train_loss": -7.101498603820801, "global_step": 190782, "epoch": 4542} {"train_loss": -7.103704929351807, "global_step": 190783, "epoch": 4542} {"train_loss": -7.185046195983887, "global_step": 190784, "epoch": 4542} {"train_loss": -7.027843475341797, "global_step": 190785, "epoch": 4542} {"train_loss": -7.214534759521484, "global_step": 190786, "epoch": 4542} {"train_loss": -7.106555938720703, "global_step": 190787, "epoch": 4542} {"train_loss": -7.2154622077941895, "global_step": 190788, "epoch": 4542} {"train_loss": -7.191006660461426, "global_step": 190789, "epoch": 4542} {"train_loss": -7.005071640014648, "global_step": 190790, "epoch": 4542} {"train_loss": -7.288097381591797, "global_step": 190791, "epoch": 4542} {"train_loss": -7.136090278625488, "global_step": 190792, "epoch": 4542} {"train_loss": -7.159755706787109, "global_step": 190793, "epoch": 4542} {"train_loss": -7.186041355133057, "global_step": 190794, "epoch": 4542} {"train_loss": -7.170921325683594, "global_step": 190795, "epoch": 4542} {"train_loss": -7.2435760498046875, "global_step": 190796, "epoch": 4542} {"train_loss": -7.180916786193848, "global_step": 190797, "epoch": 4542} {"train_loss": -7.171169757843018, "global_step": 190798, "epoch": 4542} {"train_loss": -7.105210304260254, "global_step": 190799, "epoch": 4542} {"train_loss": -7.309416770935059, "global_step": 190800, "epoch": 4542} {"train_loss": -7.181051254272461, "global_step": 190801, "epoch": 4542} {"train_loss": -7.174922466278076, "global_step": 190802, "epoch": 4542} {"train_loss": -7.106987953186035, "global_step": 190803, "epoch": 4542} {"train_loss": -7.280828475952148, "global_step": 190804, "epoch": 4542} {"train_loss": -7.168194464274815, "global_step": 190805, "epoch": 4542, "val_loss": 80900.8125} {"train_loss": -7.253029823303223, "global_step": 190806, "epoch": 4543} {"train_loss": -7.29559850692749, "global_step": 190807, "epoch": 4543} {"train_loss": -7.323334217071533, "global_step": 190808, "epoch": 4543} {"train_loss": -7.340418338775635, "global_step": 190809, "epoch": 4543} {"train_loss": -7.2655439376831055, "global_step": 190810, "epoch": 4543} {"train_loss": -7.318506240844727, "global_step": 190811, "epoch": 4543} {"train_loss": -7.34766960144043, "global_step": 190812, "epoch": 4543} {"train_loss": -7.3097333908081055, "global_step": 190813, "epoch": 4543} {"train_loss": -7.322541236877441, "global_step": 190814, "epoch": 4543} {"train_loss": -7.150979042053223, "global_step": 190815, "epoch": 4543} {"train_loss": -7.340853691101074, "global_step": 190816, "epoch": 4543} {"train_loss": -7.235023498535156, "global_step": 190817, "epoch": 4543} {"train_loss": -7.31541633605957, "global_step": 190818, "epoch": 4543} {"train_loss": -7.3216705322265625, "global_step": 190819, "epoch": 4543} {"train_loss": -7.248321533203125, "global_step": 190820, "epoch": 4543} {"train_loss": -7.2855963706970215, "global_step": 190821, "epoch": 4543} {"train_loss": -7.280508041381836, "global_step": 190822, "epoch": 4543} {"train_loss": -7.094484329223633, "global_step": 190823, "epoch": 4543} {"train_loss": -7.25478458404541, "global_step": 190824, "epoch": 4543} {"train_loss": -7.158372402191162, "global_step": 190825, "epoch": 4543} {"train_loss": -7.303173542022705, "global_step": 190826, "epoch": 4543} {"train_loss": -7.133440971374512, "global_step": 190827, "epoch": 4543} {"train_loss": -7.280082702636719, "global_step": 190828, "epoch": 4543} {"train_loss": -7.146915435791016, "global_step": 190829, "epoch": 4543} {"train_loss": -7.334531307220459, "global_step": 190830, "epoch": 4543} {"train_loss": -7.226043701171875, "global_step": 190831, "epoch": 4543} {"train_loss": -7.184459686279297, "global_step": 190832, "epoch": 4543} {"train_loss": -7.308497905731201, "global_step": 190833, "epoch": 4543} {"train_loss": -7.185816764831543, "global_step": 190834, "epoch": 4543} {"train_loss": -7.150064468383789, "global_step": 190835, "epoch": 4543} {"train_loss": -7.082632064819336, "global_step": 190836, "epoch": 4543} {"train_loss": -7.124412536621094, "global_step": 190837, "epoch": 4543} {"train_loss": -7.217324733734131, "global_step": 190838, "epoch": 4543} {"train_loss": -7.073490142822266, "global_step": 190839, "epoch": 4543} {"train_loss": -7.139169692993164, "global_step": 190840, "epoch": 4543} {"train_loss": -7.280319690704346, "global_step": 190841, "epoch": 4543} {"train_loss": -7.261409282684326, "global_step": 190842, "epoch": 4543} {"train_loss": -7.100429058074951, "global_step": 190843, "epoch": 4543} {"train_loss": -7.252760887145996, "global_step": 190844, "epoch": 4543} {"train_loss": -7.136926651000977, "global_step": 190845, "epoch": 4543} {"train_loss": -7.298890113830566, "global_step": 190846, "epoch": 4543} {"train_loss": -7.235801026934669, "global_step": 190847, "epoch": 4543, "val_loss": 81127.859375} {"train_loss": -7.254027366638184, "global_step": 190848, "epoch": 4544} {"train_loss": -7.234852313995361, "global_step": 190849, "epoch": 4544} {"train_loss": -7.261809349060059, "global_step": 190850, "epoch": 4544} {"train_loss": -7.186053276062012, "global_step": 190851, "epoch": 4544} {"train_loss": -7.139307022094727, "global_step": 190852, "epoch": 4544} {"train_loss": -7.234826564788818, "global_step": 190853, "epoch": 4544} {"train_loss": -7.251492500305176, "global_step": 190854, "epoch": 4544} {"train_loss": -7.223898887634277, "global_step": 190855, "epoch": 4544} {"train_loss": -7.147105693817139, "global_step": 190856, "epoch": 4544} {"train_loss": -7.212040901184082, "global_step": 190857, "epoch": 4544} {"train_loss": -7.300501823425293, "global_step": 190858, "epoch": 4544} {"train_loss": -7.286669731140137, "global_step": 190859, "epoch": 4544} {"train_loss": -7.257593631744385, "global_step": 190860, "epoch": 4544} {"train_loss": -7.2164106369018555, "global_step": 190861, "epoch": 4544} {"train_loss": -7.233808994293213, "global_step": 190862, "epoch": 4544} {"train_loss": -7.191736221313477, "global_step": 190863, "epoch": 4544} {"train_loss": -7.213740825653076, "global_step": 190864, "epoch": 4544} {"train_loss": -7.246572017669678, "global_step": 190865, "epoch": 4544} {"train_loss": -7.206737041473389, "global_step": 190866, "epoch": 4544} {"train_loss": -7.183571815490723, "global_step": 190867, "epoch": 4544} {"train_loss": -7.256564140319824, "global_step": 190868, "epoch": 4544} {"train_loss": -7.198792457580566, "global_step": 190869, "epoch": 4544} {"train_loss": -7.169939041137695, "global_step": 190870, "epoch": 4544} {"train_loss": -7.284310817718506, "global_step": 190871, "epoch": 4544} {"train_loss": -7.322222709655762, "global_step": 190872, "epoch": 4544} {"train_loss": -7.153757095336914, "global_step": 190873, "epoch": 4544} {"train_loss": -7.348926544189453, "global_step": 190874, "epoch": 4544} {"train_loss": -7.255543231964111, "global_step": 190875, "epoch": 4544} {"train_loss": -7.281084060668945, "global_step": 190876, "epoch": 4544} {"train_loss": -7.250097274780273, "global_step": 190877, "epoch": 4544} {"train_loss": -7.214079856872559, "global_step": 190878, "epoch": 4544} {"train_loss": -7.171253204345703, "global_step": 190879, "epoch": 4544} {"train_loss": -7.1765923500061035, "global_step": 190880, "epoch": 4544} {"train_loss": -7.2799272537231445, "global_step": 190881, "epoch": 4544} {"train_loss": -7.310558795928955, "global_step": 190882, "epoch": 4544} {"train_loss": -7.148109436035156, "global_step": 190883, "epoch": 4544} {"train_loss": -7.176788330078125, "global_step": 190884, "epoch": 4544} {"train_loss": -7.291591167449951, "global_step": 190885, "epoch": 4544} {"train_loss": -7.1205902099609375, "global_step": 190886, "epoch": 4544} {"train_loss": -7.191679954528809, "global_step": 190887, "epoch": 4544} {"train_loss": -7.197788238525391, "global_step": 190888, "epoch": 4544} {"train_loss": -7.226343983695621, "global_step": 190889, "epoch": 4544, "val_loss": 81194.046875} {"train_loss": -7.292690753936768, "global_step": 190890, "epoch": 4545} {"train_loss": -7.176183700561523, "global_step": 190891, "epoch": 4545} {"train_loss": -7.070809841156006, "global_step": 190892, "epoch": 4545} {"train_loss": -7.197705268859863, "global_step": 190893, "epoch": 4545} {"train_loss": -7.216282367706299, "global_step": 190894, "epoch": 4545} {"train_loss": -7.118180751800537, "global_step": 190895, "epoch": 4545} {"train_loss": -7.138365745544434, "global_step": 190896, "epoch": 4545} {"train_loss": -7.237914562225342, "global_step": 190897, "epoch": 4545} {"train_loss": -7.2415595054626465, "global_step": 190898, "epoch": 4545} {"train_loss": -7.215940475463867, "global_step": 190899, "epoch": 4545} {"train_loss": -7.344777584075928, "global_step": 190900, "epoch": 4545} {"train_loss": -7.2201128005981445, "global_step": 190901, "epoch": 4545} {"train_loss": -7.219974040985107, "global_step": 190902, "epoch": 4545} {"train_loss": -7.275748252868652, "global_step": 190903, "epoch": 4545} {"train_loss": -7.165903568267822, "global_step": 190904, "epoch": 4545} {"train_loss": -7.21257209777832, "global_step": 190905, "epoch": 4545} {"train_loss": -7.186308860778809, "global_step": 190906, "epoch": 4545} {"train_loss": -7.183025360107422, "global_step": 190907, "epoch": 4545} {"train_loss": -7.282744884490967, "global_step": 190908, "epoch": 4545} {"train_loss": -7.182959079742432, "global_step": 190909, "epoch": 4545} {"train_loss": -7.331124305725098, "global_step": 190910, "epoch": 4545} {"train_loss": -7.291778564453125, "global_step": 190911, "epoch": 4545} {"train_loss": -7.096009731292725, "global_step": 190912, "epoch": 4545} {"train_loss": -7.115150451660156, "global_step": 190913, "epoch": 4545} {"train_loss": -7.220594882965088, "global_step": 190914, "epoch": 4545} {"train_loss": -7.204488754272461, "global_step": 190915, "epoch": 4545} {"train_loss": -7.18747615814209, "global_step": 190916, "epoch": 4545} {"train_loss": -7.250003814697266, "global_step": 190917, "epoch": 4545} {"train_loss": -7.256977081298828, "global_step": 190918, "epoch": 4545} {"train_loss": -7.244880676269531, "global_step": 190919, "epoch": 4545} {"train_loss": -7.265607833862305, "global_step": 190920, "epoch": 4545} {"train_loss": -7.216996669769287, "global_step": 190921, "epoch": 4545} {"train_loss": -7.242938995361328, "global_step": 190922, "epoch": 4545} {"train_loss": -7.23614501953125, "global_step": 190923, "epoch": 4545} {"train_loss": -7.109261512756348, "global_step": 190924, "epoch": 4545} {"train_loss": -7.280209541320801, "global_step": 190925, "epoch": 4545} {"train_loss": -7.005213737487793, "global_step": 190926, "epoch": 4545} {"train_loss": -7.168515682220459, "global_step": 190927, "epoch": 4545} {"train_loss": -7.265226364135742, "global_step": 190928, "epoch": 4545} {"train_loss": -7.178488254547119, "global_step": 190929, "epoch": 4545} {"train_loss": -7.214288711547852, "global_step": 190930, "epoch": 4545} {"train_loss": -7.203977823257446, "global_step": 190931, "epoch": 4545, "val_loss": 81072.9140625} {"train_loss": -7.276954650878906, "global_step": 190932, "epoch": 4546} {"train_loss": -7.1998748779296875, "global_step": 190933, "epoch": 4546} {"train_loss": -7.127037048339844, "global_step": 190934, "epoch": 4546} {"train_loss": -7.223903656005859, "global_step": 190935, "epoch": 4546} {"train_loss": -7.29252815246582, "global_step": 190936, "epoch": 4546} {"train_loss": -7.289642333984375, "global_step": 190937, "epoch": 4546} {"train_loss": -7.198702335357666, "global_step": 190938, "epoch": 4546} {"train_loss": -7.106341361999512, "global_step": 190939, "epoch": 4546} {"train_loss": -7.1903886795043945, "global_step": 190940, "epoch": 4546} {"train_loss": -7.137058258056641, "global_step": 190941, "epoch": 4546} {"train_loss": -7.095782279968262, "global_step": 190942, "epoch": 4546} {"train_loss": -7.212942600250244, "global_step": 190943, "epoch": 4546} {"train_loss": -7.263036727905273, "global_step": 190944, "epoch": 4546} {"train_loss": -7.134797096252441, "global_step": 190945, "epoch": 4546} {"train_loss": -7.188878059387207, "global_step": 190946, "epoch": 4546} {"train_loss": -7.148313045501709, "global_step": 190947, "epoch": 4546} {"train_loss": -7.125114440917969, "global_step": 190948, "epoch": 4546} {"train_loss": -7.166128635406494, "global_step": 190949, "epoch": 4546} {"train_loss": -7.277576923370361, "global_step": 190950, "epoch": 4546} {"train_loss": -7.171895980834961, "global_step": 190951, "epoch": 4546} {"train_loss": -7.305537223815918, "global_step": 190952, "epoch": 4546} {"train_loss": -7.20166540145874, "global_step": 190953, "epoch": 4546} {"train_loss": -7.2711381912231445, "global_step": 190954, "epoch": 4546} {"train_loss": -7.283714294433594, "global_step": 190955, "epoch": 4546} {"train_loss": -7.3142900466918945, "global_step": 190956, "epoch": 4546} {"train_loss": -7.2957611083984375, "global_step": 190957, "epoch": 4546} {"train_loss": -7.389023780822754, "global_step": 190958, "epoch": 4546} {"train_loss": -7.2631731033325195, "global_step": 190959, "epoch": 4546} {"train_loss": -7.336067199707031, "global_step": 190960, "epoch": 4546} {"train_loss": -7.197988986968994, "global_step": 190961, "epoch": 4546} {"train_loss": -7.31185245513916, "global_step": 190962, "epoch": 4546} {"train_loss": -7.24517822265625, "global_step": 190963, "epoch": 4546} {"train_loss": -7.277251243591309, "global_step": 190964, "epoch": 4546} {"train_loss": -7.277475357055664, "global_step": 190965, "epoch": 4546} {"train_loss": -7.1653594970703125, "global_step": 190966, "epoch": 4546} {"train_loss": -7.2536725997924805, "global_step": 190967, "epoch": 4546} {"train_loss": -7.132452011108398, "global_step": 190968, "epoch": 4546} {"train_loss": -7.167513370513916, "global_step": 190969, "epoch": 4546} {"train_loss": -7.162615776062012, "global_step": 190970, "epoch": 4546} {"train_loss": -7.306879043579102, "global_step": 190971, "epoch": 4546} {"train_loss": -7.2804412841796875, "global_step": 190972, "epoch": 4546} {"train_loss": -7.226132233937581, "global_step": 190973, "epoch": 4546, "val_loss": 81094.4609375} {"train_loss": -7.2272138595581055, "global_step": 190974, "epoch": 4547} {"train_loss": -7.269366264343262, "global_step": 190975, "epoch": 4547} {"train_loss": -7.2405595779418945, "global_step": 190976, "epoch": 4547} {"train_loss": -7.22541618347168, "global_step": 190977, "epoch": 4547} {"train_loss": -7.185997009277344, "global_step": 190978, "epoch": 4547} {"train_loss": -7.370614051818848, "global_step": 190979, "epoch": 4547} {"train_loss": -7.157724380493164, "global_step": 190980, "epoch": 4547} {"train_loss": -7.289707183837891, "global_step": 190981, "epoch": 4547} {"train_loss": -7.210646629333496, "global_step": 190982, "epoch": 4547} {"train_loss": -7.171133995056152, "global_step": 190983, "epoch": 4547} {"train_loss": -7.171411991119385, "global_step": 190984, "epoch": 4547} {"train_loss": -7.272579669952393, "global_step": 190985, "epoch": 4547} {"train_loss": -7.2575883865356445, "global_step": 190986, "epoch": 4547} {"train_loss": -7.082885265350342, "global_step": 190987, "epoch": 4547} {"train_loss": -7.1067094802856445, "global_step": 190988, "epoch": 4547} {"train_loss": -7.177219390869141, "global_step": 190989, "epoch": 4547} {"train_loss": -7.094130516052246, "global_step": 190990, "epoch": 4547} {"train_loss": -7.046168804168701, "global_step": 190991, "epoch": 4547} {"train_loss": -7.164318084716797, "global_step": 190992, "epoch": 4547} {"train_loss": -7.17747688293457, "global_step": 190993, "epoch": 4547} {"train_loss": -7.216174602508545, "global_step": 190994, "epoch": 4547} {"train_loss": -7.080784797668457, "global_step": 190995, "epoch": 4547} {"train_loss": -7.199733257293701, "global_step": 190996, "epoch": 4547} {"train_loss": -7.134144306182861, "global_step": 190997, "epoch": 4547} {"train_loss": -7.225074768066406, "global_step": 190998, "epoch": 4547} {"train_loss": -7.212449073791504, "global_step": 190999, "epoch": 4547} {"train_loss": -7.202845573425293, "global_step": 191000, "epoch": 4547} {"train_loss": -7.263365268707275, "global_step": 191001, "epoch": 4547} {"train_loss": -7.210127830505371, "global_step": 191002, "epoch": 4547} {"train_loss": -7.308818817138672, "global_step": 191003, "epoch": 4547} {"train_loss": -7.285983085632324, "global_step": 191004, "epoch": 4547} {"train_loss": -7.217440605163574, "global_step": 191005, "epoch": 4547} {"train_loss": -7.210803508758545, "global_step": 191006, "epoch": 4547} {"train_loss": -7.135532379150391, "global_step": 191007, "epoch": 4547} {"train_loss": -7.2892656326293945, "global_step": 191008, "epoch": 4547} {"train_loss": -7.179757118225098, "global_step": 191009, "epoch": 4547} {"train_loss": -7.349946022033691, "global_step": 191010, "epoch": 4547} {"train_loss": -7.115277290344238, "global_step": 191011, "epoch": 4547} {"train_loss": -7.162441253662109, "global_step": 191012, "epoch": 4547} {"train_loss": -7.319077968597412, "global_step": 191013, "epoch": 4547} {"train_loss": -7.134346008300781, "global_step": 191014, "epoch": 4547} {"train_loss": -7.202826965422857, "global_step": 191015, "epoch": 4547, "val_loss": 81178.28125} {"train_loss": -7.309288024902344, "global_step": 191016, "epoch": 4548} {"train_loss": -7.11429500579834, "global_step": 191017, "epoch": 4548} {"train_loss": -6.969006538391113, "global_step": 191018, "epoch": 4548} {"train_loss": -7.274254322052002, "global_step": 191019, "epoch": 4548} {"train_loss": -7.1402506828308105, "global_step": 191020, "epoch": 4548} {"train_loss": -7.044058799743652, "global_step": 191021, "epoch": 4548} {"train_loss": -7.299200057983398, "global_step": 191022, "epoch": 4548} {"train_loss": -6.997316360473633, "global_step": 191023, "epoch": 4548} {"train_loss": -7.1665496826171875, "global_step": 191024, "epoch": 4548} {"train_loss": -7.155001640319824, "global_step": 191025, "epoch": 4548} {"train_loss": -7.039813995361328, "global_step": 191026, "epoch": 4548} {"train_loss": -7.230671405792236, "global_step": 191027, "epoch": 4548} {"train_loss": -7.153478622436523, "global_step": 191028, "epoch": 4548} {"train_loss": -7.276227951049805, "global_step": 191029, "epoch": 4548} {"train_loss": -7.2593913078308105, "global_step": 191030, "epoch": 4548} {"train_loss": -7.196504592895508, "global_step": 191031, "epoch": 4548} {"train_loss": -7.2347846031188965, "global_step": 191032, "epoch": 4548} {"train_loss": -7.214172840118408, "global_step": 191033, "epoch": 4548} {"train_loss": -7.270555019378662, "global_step": 191034, "epoch": 4548} {"train_loss": -7.248291015625, "global_step": 191035, "epoch": 4548} {"train_loss": -7.149267673492432, "global_step": 191036, "epoch": 4548} {"train_loss": -7.216305732727051, "global_step": 191037, "epoch": 4548} {"train_loss": -7.144190788269043, "global_step": 191038, "epoch": 4548} {"train_loss": -7.181192874908447, "global_step": 191039, "epoch": 4548} {"train_loss": -7.209436416625977, "global_step": 191040, "epoch": 4548} {"train_loss": -7.291222095489502, "global_step": 191041, "epoch": 4548} {"train_loss": -7.140047073364258, "global_step": 191042, "epoch": 4548} {"train_loss": -7.2209954261779785, "global_step": 191043, "epoch": 4548} {"train_loss": -7.211816310882568, "global_step": 191044, "epoch": 4548} {"train_loss": -7.214999675750732, "global_step": 191045, "epoch": 4548} {"train_loss": -7.251405715942383, "global_step": 191046, "epoch": 4548} {"train_loss": -7.077633857727051, "global_step": 191047, "epoch": 4548} {"train_loss": -7.23722505569458, "global_step": 191048, "epoch": 4548} {"train_loss": -7.118951797485352, "global_step": 191049, "epoch": 4548} {"train_loss": -7.225383758544922, "global_step": 191050, "epoch": 4548} {"train_loss": -7.166257858276367, "global_step": 191051, "epoch": 4548} {"train_loss": -7.1692609786987305, "global_step": 191052, "epoch": 4548} {"train_loss": -7.175510883331299, "global_step": 191053, "epoch": 4548} {"train_loss": -7.103464603424072, "global_step": 191054, "epoch": 4548} {"train_loss": -7.201281547546387, "global_step": 191055, "epoch": 4548} {"train_loss": -7.247398853302002, "global_step": 191056, "epoch": 4548} {"train_loss": -7.183773540315174, "global_step": 191057, "epoch": 4548, "val_loss": 80944.0} {"train_loss": -7.268994331359863, "global_step": 191058, "epoch": 4549} {"train_loss": -7.246106147766113, "global_step": 191059, "epoch": 4549} {"train_loss": -7.178861141204834, "global_step": 191060, "epoch": 4549} {"train_loss": -7.252796649932861, "global_step": 191061, "epoch": 4549} {"train_loss": -7.223156929016113, "global_step": 191062, "epoch": 4549} {"train_loss": -7.198032379150391, "global_step": 191063, "epoch": 4549} {"train_loss": -7.3041605949401855, "global_step": 191064, "epoch": 4549} {"train_loss": -7.223296642303467, "global_step": 191065, "epoch": 4549} {"train_loss": -7.243319511413574, "global_step": 191066, "epoch": 4549} {"train_loss": -7.2018585205078125, "global_step": 191067, "epoch": 4549} {"train_loss": -7.312457084655762, "global_step": 191068, "epoch": 4549} {"train_loss": -7.155630111694336, "global_step": 191069, "epoch": 4549} {"train_loss": -7.354734420776367, "global_step": 191070, "epoch": 4549} {"train_loss": -7.097916603088379, "global_step": 191071, "epoch": 4549} {"train_loss": -7.155840873718262, "global_step": 191072, "epoch": 4549} {"train_loss": -7.295675277709961, "global_step": 191073, "epoch": 4549} {"train_loss": -7.170807838439941, "global_step": 191074, "epoch": 4549} {"train_loss": -7.2717695236206055, "global_step": 191075, "epoch": 4549} {"train_loss": -7.211971282958984, "global_step": 191076, "epoch": 4549} {"train_loss": -7.234431743621826, "global_step": 191077, "epoch": 4549} {"train_loss": -7.302289009094238, "global_step": 191078, "epoch": 4549} {"train_loss": -7.291799545288086, "global_step": 191079, "epoch": 4549} {"train_loss": -7.187380790710449, "global_step": 191080, "epoch": 4549} {"train_loss": -7.15052604675293, "global_step": 191081, "epoch": 4549} {"train_loss": -7.27156400680542, "global_step": 191082, "epoch": 4549} {"train_loss": -7.238785266876221, "global_step": 191083, "epoch": 4549} {"train_loss": -7.182367324829102, "global_step": 191084, "epoch": 4549} {"train_loss": -7.258153915405273, "global_step": 191085, "epoch": 4549} {"train_loss": -7.310981750488281, "global_step": 191086, "epoch": 4549} {"train_loss": -7.201044082641602, "global_step": 191087, "epoch": 4549} {"train_loss": -7.2265849113464355, "global_step": 191088, "epoch": 4549} {"train_loss": -7.269537925720215, "global_step": 191089, "epoch": 4549} {"train_loss": -7.214641571044922, "global_step": 191090, "epoch": 4549} {"train_loss": -7.168145179748535, "global_step": 191091, "epoch": 4549} {"train_loss": -7.253203392028809, "global_step": 191092, "epoch": 4549} {"train_loss": -7.346034526824951, "global_step": 191093, "epoch": 4549} {"train_loss": -7.316460609436035, "global_step": 191094, "epoch": 4549} {"train_loss": -7.222736358642578, "global_step": 191095, "epoch": 4549} {"train_loss": -7.252758026123047, "global_step": 191096, "epoch": 4549} {"train_loss": -7.322319030761719, "global_step": 191097, "epoch": 4549} {"train_loss": -7.160364151000977, "global_step": 191098, "epoch": 4549} {"train_loss": -7.237535431271508, "global_step": 191099, "epoch": 4549, "val_loss": 80957.6875} {"train_loss": -7.116471290588379, "global_step": 191100, "epoch": 4550} {"train_loss": -7.209510803222656, "global_step": 191101, "epoch": 4550} {"train_loss": -7.289176940917969, "global_step": 191102, "epoch": 4550} {"train_loss": -7.284453392028809, "global_step": 191103, "epoch": 4550} {"train_loss": -7.331040382385254, "global_step": 191104, "epoch": 4550} {"train_loss": -7.242728233337402, "global_step": 191105, "epoch": 4550} {"train_loss": -7.205691814422607, "global_step": 191106, "epoch": 4550} {"train_loss": -7.16942024230957, "global_step": 191107, "epoch": 4550} {"train_loss": -7.154353141784668, "global_step": 191108, "epoch": 4550} {"train_loss": -7.210290908813477, "global_step": 191109, "epoch": 4550} {"train_loss": -7.131017684936523, "global_step": 191110, "epoch": 4550} {"train_loss": -7.234931945800781, "global_step": 191111, "epoch": 4550} {"train_loss": -7.235013484954834, "global_step": 191112, "epoch": 4550} {"train_loss": -7.2154364585876465, "global_step": 191113, "epoch": 4550} {"train_loss": -7.187461853027344, "global_step": 191114, "epoch": 4550} {"train_loss": -7.16365909576416, "global_step": 191115, "epoch": 4550} {"train_loss": -7.095816135406494, "global_step": 191116, "epoch": 4550} {"train_loss": -7.030401229858398, "global_step": 191117, "epoch": 4550} {"train_loss": -7.1515092849731445, "global_step": 191118, "epoch": 4550} {"train_loss": -7.167707443237305, "global_step": 191119, "epoch": 4550} {"train_loss": -7.275871276855469, "global_step": 191120, "epoch": 4550} {"train_loss": -7.206717491149902, "global_step": 191121, "epoch": 4550} {"train_loss": -7.195746421813965, "global_step": 191122, "epoch": 4550} {"train_loss": -7.156494140625, "global_step": 191123, "epoch": 4550} {"train_loss": -7.258386611938477, "global_step": 191124, "epoch": 4550} {"train_loss": -7.296263217926025, "global_step": 191125, "epoch": 4550} {"train_loss": -7.216168403625488, "global_step": 191126, "epoch": 4550} {"train_loss": -7.280255317687988, "global_step": 191127, "epoch": 4550} {"train_loss": -7.25123405456543, "global_step": 191128, "epoch": 4550} {"train_loss": -7.130542755126953, "global_step": 191129, "epoch": 4550} {"train_loss": -7.236029624938965, "global_step": 191130, "epoch": 4550} {"train_loss": -7.295375823974609, "global_step": 191131, "epoch": 4550} {"train_loss": -7.210038185119629, "global_step": 191132, "epoch": 4550} {"train_loss": -7.1834211349487305, "global_step": 191133, "epoch": 4550} {"train_loss": -7.230069637298584, "global_step": 191134, "epoch": 4550} {"train_loss": -7.2204718589782715, "global_step": 191135, "epoch": 4550} {"train_loss": -7.191488742828369, "global_step": 191136, "epoch": 4550} {"train_loss": -7.215320110321045, "global_step": 191137, "epoch": 4550} {"train_loss": -7.214590072631836, "global_step": 191138, "epoch": 4550} {"train_loss": -7.070706844329834, "global_step": 191139, "epoch": 4550} {"train_loss": -7.193813323974609, "global_step": 191140, "epoch": 4550} {"train_loss": -7.202801500047956, "global_step": 191141, "epoch": 4550, "train/sim_max_reward_0": 0.4078263769078436, "train/sim_max_reward_1": 0.9383990187846459, "train/sim_max_reward_2": 0.3070723604953713, "train/sim_max_reward_3": 0.13797175922161822, "train/sim_max_reward_4": 0.8864037773554776, "train/sim_max_reward_5": 0.5895545387610241, "test/sim_max_reward_4500000": 0.3480561567655976, "test/sim_max_reward_4500001": 0.977677821980938, "test/sim_max_reward_4500002": 0.9067369240156266, "test/sim_max_reward_4500003": 0.8558796350189634, "test/sim_max_reward_4500004": 0.18638635279550883, "test/sim_max_reward_4500005": 0.8681573020095873, "test/sim_max_reward_4500006": 0.8863754340253485, "test/sim_max_reward_4500007": 0.8938820052879477, "test/sim_max_reward_4500008": 0.15081807382718018, "test/sim_max_reward_4500009": 0.052967403546343675, "test/sim_max_reward_4500010": 0.14036283103900915, "test/sim_max_reward_4500011": 0.4939915891331505, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.007315157209564955, "test/sim_max_reward_4500014": 0.49503053952920645, "test/sim_max_reward_4500015": 0.9774243760456247, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.10340629426335375, "test/sim_max_reward_4500018": 0.9495421336822688, "test/sim_max_reward_4500019": 1.0, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.997017550081177, "test/sim_max_reward_4500022": 0.8940470561285252, "test/sim_max_reward_4500023": 0.8297874830825626, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9953112534538877, "test/sim_max_reward_4500026": 1.0, "test/sim_max_reward_4500027": 0.973629229338409, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.08502604006903408, "test/sim_max_reward_4500030": 0.9866417938473644, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.7235199736995366, "test/sim_max_reward_4500034": 0.6156381901467235, "test/sim_max_reward_4500035": 0.8020828687155709, "test/sim_max_reward_4500036": 0.9653173429897111, "test/sim_max_reward_4500037": 0.9161171716899154, "test/sim_max_reward_4500038": 0.328338488245423, "test/sim_max_reward_4500039": 0.9131565915314883, "test/sim_max_reward_4500040": 0.91890247233202, "test/sim_max_reward_4500041": 0.3482861551426226, "test/sim_max_reward_4500042": 0.06353791089118752, "test/sim_max_reward_4500043": 0.38554005839881617, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.2736807877213186, "test/sim_max_reward_4500046": 0.17757733231948236, "test/sim_max_reward_4500047": 0.8777357394558106, "test/sim_max_reward_4500048": 0.0, "test/sim_max_reward_4500049": 0.9465855707524954, "train/mean_score": 0.5445379719209967, "test/mean_score": 0.5512743639759543, "val_loss": 80864.890625} {"train_loss": -7.043334007263184, "global_step": 191142, "epoch": 4551} {"train_loss": -7.2139387130737305, "global_step": 191143, "epoch": 4551} {"train_loss": -7.25450325012207, "global_step": 191144, "epoch": 4551} {"train_loss": -7.2070393562316895, "global_step": 191145, "epoch": 4551} {"train_loss": -7.360217094421387, "global_step": 191146, "epoch": 4551} {"train_loss": -7.083250522613525, "global_step": 191147, "epoch": 4551} {"train_loss": -7.165012359619141, "global_step": 191148, "epoch": 4551} {"train_loss": -7.15459680557251, "global_step": 191149, "epoch": 4551} {"train_loss": -7.116508483886719, "global_step": 191150, "epoch": 4551} {"train_loss": -7.107601165771484, "global_step": 191151, "epoch": 4551} {"train_loss": -7.139671325683594, "global_step": 191152, "epoch": 4551} {"train_loss": -7.249053955078125, "global_step": 191153, "epoch": 4551} {"train_loss": -7.242284297943115, "global_step": 191154, "epoch": 4551} {"train_loss": -7.099759101867676, "global_step": 191155, "epoch": 4551} {"train_loss": -7.206226825714111, "global_step": 191156, "epoch": 4551} {"train_loss": -7.121227264404297, "global_step": 191157, "epoch": 4551} {"train_loss": -7.2056684494018555, "global_step": 191158, "epoch": 4551} {"train_loss": -7.137363433837891, "global_step": 191159, "epoch": 4551} {"train_loss": -7.186498641967773, "global_step": 191160, "epoch": 4551} {"train_loss": -7.217284679412842, "global_step": 191161, "epoch": 4551} {"train_loss": -7.2588911056518555, "global_step": 191162, "epoch": 4551} {"train_loss": -7.170834541320801, "global_step": 191163, "epoch": 4551} {"train_loss": -7.1677093505859375, "global_step": 191164, "epoch": 4551} {"train_loss": -7.232929229736328, "global_step": 191165, "epoch": 4551} {"train_loss": -7.176069259643555, "global_step": 191166, "epoch": 4551} {"train_loss": -7.228427886962891, "global_step": 191167, "epoch": 4551} {"train_loss": -7.262711524963379, "global_step": 191168, "epoch": 4551} {"train_loss": -7.35257625579834, "global_step": 191169, "epoch": 4551} {"train_loss": -7.21013069152832, "global_step": 191170, "epoch": 4551} {"train_loss": -7.304093837738037, "global_step": 191171, "epoch": 4551} {"train_loss": -7.23969030380249, "global_step": 191172, "epoch": 4551} {"train_loss": -7.244568824768066, "global_step": 191173, "epoch": 4551} {"train_loss": -7.256093502044678, "global_step": 191174, "epoch": 4551} {"train_loss": -7.267366409301758, "global_step": 191175, "epoch": 4551} {"train_loss": -7.189179420471191, "global_step": 191176, "epoch": 4551} {"train_loss": -7.16960334777832, "global_step": 191177, "epoch": 4551} {"train_loss": -7.3219499588012695, "global_step": 191178, "epoch": 4551} {"train_loss": -7.255739688873291, "global_step": 191179, "epoch": 4551} {"train_loss": -7.292299747467041, "global_step": 191180, "epoch": 4551} {"train_loss": -7.313234329223633, "global_step": 191181, "epoch": 4551} {"train_loss": -7.185997486114502, "global_step": 191182, "epoch": 4551} {"train_loss": -7.211372420901344, "global_step": 191183, "epoch": 4551, "val_loss": 80987.5546875} {"train_loss": -7.23703670501709, "global_step": 191184, "epoch": 4552} {"train_loss": -7.217430114746094, "global_step": 191185, "epoch": 4552} {"train_loss": -7.227828025817871, "global_step": 191186, "epoch": 4552} {"train_loss": -7.115365982055664, "global_step": 191187, "epoch": 4552} {"train_loss": -7.213035583496094, "global_step": 191188, "epoch": 4552} {"train_loss": -7.224893569946289, "global_step": 191189, "epoch": 4552} {"train_loss": -7.329710960388184, "global_step": 191190, "epoch": 4552} {"train_loss": -7.430552005767822, "global_step": 191191, "epoch": 4552} {"train_loss": -7.3068060874938965, "global_step": 191192, "epoch": 4552} {"train_loss": -7.11082649230957, "global_step": 191193, "epoch": 4552} {"train_loss": -7.225868225097656, "global_step": 191194, "epoch": 4552} {"train_loss": -7.215790748596191, "global_step": 191195, "epoch": 4552} {"train_loss": -7.277256011962891, "global_step": 191196, "epoch": 4552} {"train_loss": -7.198114395141602, "global_step": 191197, "epoch": 4552} {"train_loss": -7.184744834899902, "global_step": 191198, "epoch": 4552} {"train_loss": -7.228490352630615, "global_step": 191199, "epoch": 4552} {"train_loss": -7.221424102783203, "global_step": 191200, "epoch": 4552} {"train_loss": -7.231770992279053, "global_step": 191201, "epoch": 4552} {"train_loss": -7.210132598876953, "global_step": 191202, "epoch": 4552} {"train_loss": -7.240300178527832, "global_step": 191203, "epoch": 4552} {"train_loss": -7.17214298248291, "global_step": 191204, "epoch": 4552} {"train_loss": -7.184333324432373, "global_step": 191205, "epoch": 4552} {"train_loss": -7.173226356506348, "global_step": 191206, "epoch": 4552} {"train_loss": -7.294716835021973, "global_step": 191207, "epoch": 4552} {"train_loss": -7.201192855834961, "global_step": 191208, "epoch": 4552} {"train_loss": -7.118865966796875, "global_step": 191209, "epoch": 4552} {"train_loss": -7.268823623657227, "global_step": 191210, "epoch": 4552} {"train_loss": -7.1875, "global_step": 191211, "epoch": 4552} {"train_loss": -7.206022262573242, "global_step": 191212, "epoch": 4552} {"train_loss": -7.245582580566406, "global_step": 191213, "epoch": 4552} {"train_loss": -7.253963947296143, "global_step": 191214, "epoch": 4552} {"train_loss": -7.157937526702881, "global_step": 191215, "epoch": 4552} {"train_loss": -7.066423416137695, "global_step": 191216, "epoch": 4552} {"train_loss": -7.187034606933594, "global_step": 191217, "epoch": 4552} {"train_loss": -7.127214431762695, "global_step": 191218, "epoch": 4552} {"train_loss": -7.2001471519470215, "global_step": 191219, "epoch": 4552} {"train_loss": -7.286415100097656, "global_step": 191220, "epoch": 4552} {"train_loss": -7.1461687088012695, "global_step": 191221, "epoch": 4552} {"train_loss": -7.355250835418701, "global_step": 191222, "epoch": 4552} {"train_loss": -7.047684669494629, "global_step": 191223, "epoch": 4552} {"train_loss": -7.0841965675354, "global_step": 191224, "epoch": 4552} {"train_loss": -7.209594647089641, "global_step": 191225, "epoch": 4552, "val_loss": 81175.640625} {"train_loss": -7.143852233886719, "global_step": 191226, "epoch": 4553} {"train_loss": -7.060825347900391, "global_step": 191227, "epoch": 4553} {"train_loss": -7.089615821838379, "global_step": 191228, "epoch": 4553} {"train_loss": -6.853991508483887, "global_step": 191229, "epoch": 4553} {"train_loss": -7.124471187591553, "global_step": 191230, "epoch": 4553} {"train_loss": -6.990027904510498, "global_step": 191231, "epoch": 4553} {"train_loss": -7.056212425231934, "global_step": 191232, "epoch": 4553} {"train_loss": -7.028202056884766, "global_step": 191233, "epoch": 4553} {"train_loss": -7.023462295532227, "global_step": 191234, "epoch": 4553} {"train_loss": -7.033766746520996, "global_step": 191235, "epoch": 4553} {"train_loss": -7.108708381652832, "global_step": 191236, "epoch": 4553} {"train_loss": -7.03994083404541, "global_step": 191237, "epoch": 4553} {"train_loss": -7.1176252365112305, "global_step": 191238, "epoch": 4553} {"train_loss": -7.110980987548828, "global_step": 191239, "epoch": 4553} {"train_loss": -7.087005615234375, "global_step": 191240, "epoch": 4553} {"train_loss": -7.242463111877441, "global_step": 191241, "epoch": 4553} {"train_loss": -7.195528030395508, "global_step": 191242, "epoch": 4553} {"train_loss": -7.051845550537109, "global_step": 191243, "epoch": 4553} {"train_loss": -7.085252285003662, "global_step": 191244, "epoch": 4553} {"train_loss": -7.154642105102539, "global_step": 191245, "epoch": 4553} {"train_loss": -7.172807693481445, "global_step": 191246, "epoch": 4553} {"train_loss": -7.082334995269775, "global_step": 191247, "epoch": 4553} {"train_loss": -7.150328159332275, "global_step": 191248, "epoch": 4553} {"train_loss": -7.128147125244141, "global_step": 191249, "epoch": 4553} {"train_loss": -7.151885032653809, "global_step": 191250, "epoch": 4553} {"train_loss": -7.065554141998291, "global_step": 191251, "epoch": 4553} {"train_loss": -7.216907501220703, "global_step": 191252, "epoch": 4553} {"train_loss": -7.1003828048706055, "global_step": 191253, "epoch": 4553} {"train_loss": -7.13249397277832, "global_step": 191254, "epoch": 4553} {"train_loss": -7.218519687652588, "global_step": 191255, "epoch": 4553} {"train_loss": -7.234819412231445, "global_step": 191256, "epoch": 4553} {"train_loss": -7.272829532623291, "global_step": 191257, "epoch": 4553} {"train_loss": -7.194128036499023, "global_step": 191258, "epoch": 4553} {"train_loss": -7.283230781555176, "global_step": 191259, "epoch": 4553} {"train_loss": -7.164031505584717, "global_step": 191260, "epoch": 4553} {"train_loss": -7.309449195861816, "global_step": 191261, "epoch": 4553} {"train_loss": -7.309701919555664, "global_step": 191262, "epoch": 4553} {"train_loss": -7.3594489097595215, "global_step": 191263, "epoch": 4553} {"train_loss": -7.302199840545654, "global_step": 191264, "epoch": 4553} {"train_loss": -7.390803337097168, "global_step": 191265, "epoch": 4553} {"train_loss": -7.27128791809082, "global_step": 191266, "epoch": 4553} {"train_loss": -7.15319097609747, "global_step": 191267, "epoch": 4553, "val_loss": 80954.03125} {"train_loss": -7.228044509887695, "global_step": 191268, "epoch": 4554} {"train_loss": -7.245288372039795, "global_step": 191269, "epoch": 4554} {"train_loss": -7.261844635009766, "global_step": 191270, "epoch": 4554} {"train_loss": -7.368308067321777, "global_step": 191271, "epoch": 4554} {"train_loss": -7.197372913360596, "global_step": 191272, "epoch": 4554} {"train_loss": -7.2684431076049805, "global_step": 191273, "epoch": 4554} {"train_loss": -7.204922199249268, "global_step": 191274, "epoch": 4554} {"train_loss": -7.234053611755371, "global_step": 191275, "epoch": 4554} {"train_loss": -7.264329433441162, "global_step": 191276, "epoch": 4554} {"train_loss": -7.1524505615234375, "global_step": 191277, "epoch": 4554} {"train_loss": -7.126394271850586, "global_step": 191278, "epoch": 4554} {"train_loss": -7.142064571380615, "global_step": 191279, "epoch": 4554} {"train_loss": -7.13906192779541, "global_step": 191280, "epoch": 4554} {"train_loss": -7.075608253479004, "global_step": 191281, "epoch": 4554} {"train_loss": -7.157027244567871, "global_step": 191282, "epoch": 4554} {"train_loss": -7.12816858291626, "global_step": 191283, "epoch": 4554} {"train_loss": -7.016199111938477, "global_step": 191284, "epoch": 4554} {"train_loss": -7.206371307373047, "global_step": 191285, "epoch": 4554} {"train_loss": -7.17495059967041, "global_step": 191286, "epoch": 4554} {"train_loss": -7.117223739624023, "global_step": 191287, "epoch": 4554} {"train_loss": -7.282395839691162, "global_step": 191288, "epoch": 4554} {"train_loss": -7.234364032745361, "global_step": 191289, "epoch": 4554} {"train_loss": -7.314221382141113, "global_step": 191290, "epoch": 4554} {"train_loss": -7.2213921546936035, "global_step": 191291, "epoch": 4554} {"train_loss": -7.256689548492432, "global_step": 191292, "epoch": 4554} {"train_loss": -7.205320358276367, "global_step": 191293, "epoch": 4554} {"train_loss": -7.18656063079834, "global_step": 191294, "epoch": 4554} {"train_loss": -7.232264041900635, "global_step": 191295, "epoch": 4554} {"train_loss": -7.2647857666015625, "global_step": 191296, "epoch": 4554} {"train_loss": -7.129545211791992, "global_step": 191297, "epoch": 4554} {"train_loss": -7.367997169494629, "global_step": 191298, "epoch": 4554} {"train_loss": -7.288524627685547, "global_step": 191299, "epoch": 4554} {"train_loss": -7.239284992218018, "global_step": 191300, "epoch": 4554} {"train_loss": -7.189462661743164, "global_step": 191301, "epoch": 4554} {"train_loss": -7.296151638031006, "global_step": 191302, "epoch": 4554} {"train_loss": -7.26678466796875, "global_step": 191303, "epoch": 4554} {"train_loss": -7.206173896789551, "global_step": 191304, "epoch": 4554} {"train_loss": -7.309161186218262, "global_step": 191305, "epoch": 4554} {"train_loss": -7.178723335266113, "global_step": 191306, "epoch": 4554} {"train_loss": -7.2878217697143555, "global_step": 191307, "epoch": 4554} {"train_loss": -7.313055038452148, "global_step": 191308, "epoch": 4554} {"train_loss": -7.217870871225993, "global_step": 191309, "epoch": 4554, "val_loss": 80909.265625} {"train_loss": -7.185127258300781, "global_step": 191310, "epoch": 4555} {"train_loss": -7.304462432861328, "global_step": 191311, "epoch": 4555} {"train_loss": -7.067014694213867, "global_step": 191312, "epoch": 4555} {"train_loss": -7.192401885986328, "global_step": 191313, "epoch": 4555} {"train_loss": -7.234042167663574, "global_step": 191314, "epoch": 4555} {"train_loss": -7.267773151397705, "global_step": 191315, "epoch": 4555} {"train_loss": -7.308808326721191, "global_step": 191316, "epoch": 4555} {"train_loss": -7.262407302856445, "global_step": 191317, "epoch": 4555} {"train_loss": -7.153445243835449, "global_step": 191318, "epoch": 4555} {"train_loss": -7.332546234130859, "global_step": 191319, "epoch": 4555} {"train_loss": -7.0521016120910645, "global_step": 191320, "epoch": 4555} {"train_loss": -7.0772624015808105, "global_step": 191321, "epoch": 4555} {"train_loss": -7.201730251312256, "global_step": 191322, "epoch": 4555} {"train_loss": -7.162574768066406, "global_step": 191323, "epoch": 4555} {"train_loss": -7.280774116516113, "global_step": 191324, "epoch": 4555} {"train_loss": -7.172475814819336, "global_step": 191325, "epoch": 4555} {"train_loss": -7.267093658447266, "global_step": 191326, "epoch": 4555} {"train_loss": -7.215962886810303, "global_step": 191327, "epoch": 4555} {"train_loss": -7.219779968261719, "global_step": 191328, "epoch": 4555} {"train_loss": -7.211162567138672, "global_step": 191329, "epoch": 4555} {"train_loss": -7.020853042602539, "global_step": 191330, "epoch": 4555} {"train_loss": -7.200728416442871, "global_step": 191331, "epoch": 4555} {"train_loss": -7.203971862792969, "global_step": 191332, "epoch": 4555} {"train_loss": -7.112326622009277, "global_step": 191333, "epoch": 4555} {"train_loss": -7.225606918334961, "global_step": 191334, "epoch": 4555} {"train_loss": -7.12867546081543, "global_step": 191335, "epoch": 4555} {"train_loss": -7.120128631591797, "global_step": 191336, "epoch": 4555} {"train_loss": -7.121265888214111, "global_step": 191337, "epoch": 4555} {"train_loss": -7.179571151733398, "global_step": 191338, "epoch": 4555} {"train_loss": -7.041720390319824, "global_step": 191339, "epoch": 4555} {"train_loss": -7.2420244216918945, "global_step": 191340, "epoch": 4555} {"train_loss": -7.199118614196777, "global_step": 191341, "epoch": 4555} {"train_loss": -7.164003849029541, "global_step": 191342, "epoch": 4555} {"train_loss": -7.170679092407227, "global_step": 191343, "epoch": 4555} {"train_loss": -7.025474548339844, "global_step": 191344, "epoch": 4555} {"train_loss": -7.2211408615112305, "global_step": 191345, "epoch": 4555} {"train_loss": -7.1991071701049805, "global_step": 191346, "epoch": 4555} {"train_loss": -7.191913604736328, "global_step": 191347, "epoch": 4555} {"train_loss": -7.22752046585083, "global_step": 191348, "epoch": 4555} {"train_loss": -7.116586685180664, "global_step": 191349, "epoch": 4555} {"train_loss": -7.216914176940918, "global_step": 191350, "epoch": 4555} {"train_loss": -7.183143400010609, "global_step": 191351, "epoch": 4555, "val_loss": 81068.46875} {"train_loss": -7.193951606750488, "global_step": 191352, "epoch": 4556} {"train_loss": -7.115217208862305, "global_step": 191353, "epoch": 4556} {"train_loss": -7.274988651275635, "global_step": 191354, "epoch": 4556} {"train_loss": -7.093698501586914, "global_step": 191355, "epoch": 4556} {"train_loss": -7.246059417724609, "global_step": 191356, "epoch": 4556} {"train_loss": -7.274848937988281, "global_step": 191357, "epoch": 4556} {"train_loss": -7.135278224945068, "global_step": 191358, "epoch": 4556} {"train_loss": -7.154018402099609, "global_step": 191359, "epoch": 4556} {"train_loss": -7.255190372467041, "global_step": 191360, "epoch": 4556} {"train_loss": -7.260849952697754, "global_step": 191361, "epoch": 4556} {"train_loss": -7.178856372833252, "global_step": 191362, "epoch": 4556} {"train_loss": -7.268560886383057, "global_step": 191363, "epoch": 4556} {"train_loss": -7.244607448577881, "global_step": 191364, "epoch": 4556} {"train_loss": -7.299596786499023, "global_step": 191365, "epoch": 4556} {"train_loss": -7.0752410888671875, "global_step": 191366, "epoch": 4556} {"train_loss": -7.300276279449463, "global_step": 191367, "epoch": 4556} {"train_loss": -7.307796478271484, "global_step": 191368, "epoch": 4556} {"train_loss": -7.127246856689453, "global_step": 191369, "epoch": 4556} {"train_loss": -7.225994110107422, "global_step": 191370, "epoch": 4556} {"train_loss": -7.226262092590332, "global_step": 191371, "epoch": 4556} {"train_loss": -7.181290626525879, "global_step": 191372, "epoch": 4556} {"train_loss": -7.200300216674805, "global_step": 191373, "epoch": 4556} {"train_loss": -7.235156536102295, "global_step": 191374, "epoch": 4556} {"train_loss": -7.176832675933838, "global_step": 191375, "epoch": 4556} {"train_loss": -7.268078804016113, "global_step": 191376, "epoch": 4556} {"train_loss": -7.297176361083984, "global_step": 191377, "epoch": 4556} {"train_loss": -7.180174350738525, "global_step": 191378, "epoch": 4556} {"train_loss": -7.278532981872559, "global_step": 191379, "epoch": 4556} {"train_loss": -7.256035804748535, "global_step": 191380, "epoch": 4556} {"train_loss": -7.188802719116211, "global_step": 191381, "epoch": 4556} {"train_loss": -7.136857986450195, "global_step": 191382, "epoch": 4556} {"train_loss": -7.287679195404053, "global_step": 191383, "epoch": 4556} {"train_loss": -7.332904815673828, "global_step": 191384, "epoch": 4556} {"train_loss": -7.291311264038086, "global_step": 191385, "epoch": 4556} {"train_loss": -7.2357683181762695, "global_step": 191386, "epoch": 4556} {"train_loss": -7.360930442810059, "global_step": 191387, "epoch": 4556} {"train_loss": -7.342801570892334, "global_step": 191388, "epoch": 4556} {"train_loss": -7.234575271606445, "global_step": 191389, "epoch": 4556} {"train_loss": -7.2370710372924805, "global_step": 191390, "epoch": 4556} {"train_loss": -7.281541347503662, "global_step": 191391, "epoch": 4556} {"train_loss": -7.314260482788086, "global_step": 191392, "epoch": 4556} {"train_loss": -7.232218288239979, "global_step": 191393, "epoch": 4556, "val_loss": 81202.3359375} {"train_loss": -7.305401802062988, "global_step": 191394, "epoch": 4557} {"train_loss": -7.436148643493652, "global_step": 191395, "epoch": 4557} {"train_loss": -7.290797233581543, "global_step": 191396, "epoch": 4557} {"train_loss": -7.301227569580078, "global_step": 191397, "epoch": 4557} {"train_loss": -7.276259422302246, "global_step": 191398, "epoch": 4557} {"train_loss": -7.2437543869018555, "global_step": 191399, "epoch": 4557} {"train_loss": -7.244231224060059, "global_step": 191400, "epoch": 4557} {"train_loss": -7.29049015045166, "global_step": 191401, "epoch": 4557} {"train_loss": -7.128232002258301, "global_step": 191402, "epoch": 4557} {"train_loss": -7.13828182220459, "global_step": 191403, "epoch": 4557} {"train_loss": -7.289155006408691, "global_step": 191404, "epoch": 4557} {"train_loss": -7.16511869430542, "global_step": 191405, "epoch": 4557} {"train_loss": -7.218879699707031, "global_step": 191406, "epoch": 4557} {"train_loss": -7.231729507446289, "global_step": 191407, "epoch": 4557} {"train_loss": -7.183974742889404, "global_step": 191408, "epoch": 4557} {"train_loss": -7.224775314331055, "global_step": 191409, "epoch": 4557} {"train_loss": -7.244483470916748, "global_step": 191410, "epoch": 4557} {"train_loss": -7.1611785888671875, "global_step": 191411, "epoch": 4557} {"train_loss": -7.113556861877441, "global_step": 191412, "epoch": 4557} {"train_loss": -7.170283317565918, "global_step": 191413, "epoch": 4557} {"train_loss": -7.1529436111450195, "global_step": 191414, "epoch": 4557} {"train_loss": -7.057898998260498, "global_step": 191415, "epoch": 4557} {"train_loss": -7.2179412841796875, "global_step": 191416, "epoch": 4557} {"train_loss": -7.036757469177246, "global_step": 191417, "epoch": 4557} {"train_loss": -7.110883712768555, "global_step": 191418, "epoch": 4557} {"train_loss": -7.1343464851379395, "global_step": 191419, "epoch": 4557} {"train_loss": -7.11414909362793, "global_step": 191420, "epoch": 4557} {"train_loss": -7.112525939941406, "global_step": 191421, "epoch": 4557} {"train_loss": -7.1125640869140625, "global_step": 191422, "epoch": 4557} {"train_loss": -7.1637115478515625, "global_step": 191423, "epoch": 4557} {"train_loss": -6.964499473571777, "global_step": 191424, "epoch": 4557} {"train_loss": -7.254733085632324, "global_step": 191425, "epoch": 4557} {"train_loss": -7.214504241943359, "global_step": 191426, "epoch": 4557} {"train_loss": -7.198219299316406, "global_step": 191427, "epoch": 4557} {"train_loss": -7.137642860412598, "global_step": 191428, "epoch": 4557} {"train_loss": -7.201294898986816, "global_step": 191429, "epoch": 4557} {"train_loss": -7.179471015930176, "global_step": 191430, "epoch": 4557} {"train_loss": -7.232937812805176, "global_step": 191431, "epoch": 4557} {"train_loss": -7.175561904907227, "global_step": 191432, "epoch": 4557} {"train_loss": -7.2121195793151855, "global_step": 191433, "epoch": 4557} {"train_loss": -7.2580437660217285, "global_step": 191434, "epoch": 4557} {"train_loss": -7.194128819874355, "global_step": 191435, "epoch": 4557, "val_loss": 81012.46875} {"train_loss": -7.13939094543457, "global_step": 191436, "epoch": 4558} {"train_loss": -7.155033111572266, "global_step": 191437, "epoch": 4558} {"train_loss": -7.149314880371094, "global_step": 191438, "epoch": 4558} {"train_loss": -7.0827531814575195, "global_step": 191439, "epoch": 4558} {"train_loss": -7.1892852783203125, "global_step": 191440, "epoch": 4558} {"train_loss": -7.098721504211426, "global_step": 191441, "epoch": 4558} {"train_loss": -7.2044854164123535, "global_step": 191442, "epoch": 4558} {"train_loss": -7.181855201721191, "global_step": 191443, "epoch": 4558} {"train_loss": -7.027632713317871, "global_step": 191444, "epoch": 4558} {"train_loss": -7.28023099899292, "global_step": 191445, "epoch": 4558} {"train_loss": -7.205733299255371, "global_step": 191446, "epoch": 4558} {"train_loss": -7.124711513519287, "global_step": 191447, "epoch": 4558} {"train_loss": -7.265295028686523, "global_step": 191448, "epoch": 4558} {"train_loss": -7.3433709144592285, "global_step": 191449, "epoch": 4558} {"train_loss": -7.057662010192871, "global_step": 191450, "epoch": 4558} {"train_loss": -7.247844696044922, "global_step": 191451, "epoch": 4558} {"train_loss": -7.1175856590271, "global_step": 191452, "epoch": 4558} {"train_loss": -7.082156658172607, "global_step": 191453, "epoch": 4558} {"train_loss": -7.3133320808410645, "global_step": 191454, "epoch": 4558} {"train_loss": -7.20322847366333, "global_step": 191455, "epoch": 4558} {"train_loss": -7.222022533416748, "global_step": 191456, "epoch": 4558} {"train_loss": -7.13437032699585, "global_step": 191457, "epoch": 4558} {"train_loss": -7.110422611236572, "global_step": 191458, "epoch": 4558} {"train_loss": -7.262383937835693, "global_step": 191459, "epoch": 4558} {"train_loss": -7.2045087814331055, "global_step": 191460, "epoch": 4558} {"train_loss": -7.137169361114502, "global_step": 191461, "epoch": 4558} {"train_loss": -7.1626386642456055, "global_step": 191462, "epoch": 4558} {"train_loss": -7.107682228088379, "global_step": 191463, "epoch": 4558} {"train_loss": -7.146032810211182, "global_step": 191464, "epoch": 4558} {"train_loss": -7.268265724182129, "global_step": 191465, "epoch": 4558} {"train_loss": -7.213033676147461, "global_step": 191466, "epoch": 4558} {"train_loss": -7.258891582489014, "global_step": 191467, "epoch": 4558} {"train_loss": -7.253875732421875, "global_step": 191468, "epoch": 4558} {"train_loss": -7.237523078918457, "global_step": 191469, "epoch": 4558} {"train_loss": -7.344914436340332, "global_step": 191470, "epoch": 4558} {"train_loss": -7.240583896636963, "global_step": 191471, "epoch": 4558} {"train_loss": -7.3194684982299805, "global_step": 191472, "epoch": 4558} {"train_loss": -7.352744102478027, "global_step": 191473, "epoch": 4558} {"train_loss": -7.265222549438477, "global_step": 191474, "epoch": 4558} {"train_loss": -7.232044219970703, "global_step": 191475, "epoch": 4558} {"train_loss": -7.075732231140137, "global_step": 191476, "epoch": 4558} {"train_loss": -7.19676609266372, "global_step": 191477, "epoch": 4558, "val_loss": 80991.9453125} {"train_loss": -7.2849884033203125, "global_step": 191478, "epoch": 4559} {"train_loss": -7.2032270431518555, "global_step": 191479, "epoch": 4559} {"train_loss": -7.241025924682617, "global_step": 191480, "epoch": 4559} {"train_loss": -7.314235687255859, "global_step": 191481, "epoch": 4559} {"train_loss": -7.129670143127441, "global_step": 191482, "epoch": 4559} {"train_loss": -7.2227783203125, "global_step": 191483, "epoch": 4559} {"train_loss": -7.208881378173828, "global_step": 191484, "epoch": 4559} {"train_loss": -7.316384315490723, "global_step": 191485, "epoch": 4559} {"train_loss": -7.137554168701172, "global_step": 191486, "epoch": 4559} {"train_loss": -7.270751953125, "global_step": 191487, "epoch": 4559} {"train_loss": -7.267985820770264, "global_step": 191488, "epoch": 4559} {"train_loss": -7.114994525909424, "global_step": 191489, "epoch": 4559} {"train_loss": -7.161628723144531, "global_step": 191490, "epoch": 4559} {"train_loss": -7.13273286819458, "global_step": 191491, "epoch": 4559} {"train_loss": -7.148004055023193, "global_step": 191492, "epoch": 4559} {"train_loss": -7.002864360809326, "global_step": 191493, "epoch": 4559} {"train_loss": -7.209810256958008, "global_step": 191494, "epoch": 4559} {"train_loss": -7.179680824279785, "global_step": 191495, "epoch": 4559} {"train_loss": -6.99189567565918, "global_step": 191496, "epoch": 4559} {"train_loss": -7.170405387878418, "global_step": 191497, "epoch": 4559} {"train_loss": -7.064217567443848, "global_step": 191498, "epoch": 4559} {"train_loss": -7.139670372009277, "global_step": 191499, "epoch": 4559} {"train_loss": -7.1715593338012695, "global_step": 191500, "epoch": 4559} {"train_loss": -7.144725799560547, "global_step": 191501, "epoch": 4559} {"train_loss": -7.185903549194336, "global_step": 191502, "epoch": 4559} {"train_loss": -7.127751350402832, "global_step": 191503, "epoch": 4559} {"train_loss": -7.161664009094238, "global_step": 191504, "epoch": 4559} {"train_loss": -7.301939010620117, "global_step": 191505, "epoch": 4559} {"train_loss": -7.170624256134033, "global_step": 191506, "epoch": 4559} {"train_loss": -7.29442024230957, "global_step": 191507, "epoch": 4559} {"train_loss": -7.159604072570801, "global_step": 191508, "epoch": 4559} {"train_loss": -7.14876651763916, "global_step": 191509, "epoch": 4559} {"train_loss": -7.248795509338379, "global_step": 191510, "epoch": 4559} {"train_loss": -7.2348127365112305, "global_step": 191511, "epoch": 4559} {"train_loss": -7.172605037689209, "global_step": 191512, "epoch": 4559} {"train_loss": -7.15516471862793, "global_step": 191513, "epoch": 4559} {"train_loss": -7.2400383949279785, "global_step": 191514, "epoch": 4559} {"train_loss": -7.268819808959961, "global_step": 191515, "epoch": 4559} {"train_loss": -7.1866912841796875, "global_step": 191516, "epoch": 4559} {"train_loss": -7.147979736328125, "global_step": 191517, "epoch": 4559} {"train_loss": -7.053443908691406, "global_step": 191518, "epoch": 4559} {"train_loss": -7.182161524182274, "global_step": 191519, "epoch": 4559, "val_loss": 80884.8046875} {"train_loss": -7.22966194152832, "global_step": 191520, "epoch": 4560} {"train_loss": -7.135840892791748, "global_step": 191521, "epoch": 4560} {"train_loss": -7.297508239746094, "global_step": 191522, "epoch": 4560} {"train_loss": -7.271999359130859, "global_step": 191523, "epoch": 4560} {"train_loss": -7.160989761352539, "global_step": 191524, "epoch": 4560} {"train_loss": -7.203129291534424, "global_step": 191525, "epoch": 4560} {"train_loss": -7.129918098449707, "global_step": 191526, "epoch": 4560} {"train_loss": -7.202380180358887, "global_step": 191527, "epoch": 4560} {"train_loss": -7.262071132659912, "global_step": 191528, "epoch": 4560} {"train_loss": -7.245856761932373, "global_step": 191529, "epoch": 4560} {"train_loss": -7.169224262237549, "global_step": 191530, "epoch": 4560} {"train_loss": -7.167271137237549, "global_step": 191531, "epoch": 4560} {"train_loss": -7.273454666137695, "global_step": 191532, "epoch": 4560} {"train_loss": -7.225120544433594, "global_step": 191533, "epoch": 4560} {"train_loss": -7.20862340927124, "global_step": 191534, "epoch": 4560} {"train_loss": -7.182575702667236, "global_step": 191535, "epoch": 4560} {"train_loss": -7.0384416580200195, "global_step": 191536, "epoch": 4560} {"train_loss": -7.316666126251221, "global_step": 191537, "epoch": 4560} {"train_loss": -7.213772296905518, "global_step": 191538, "epoch": 4560} {"train_loss": -7.217247009277344, "global_step": 191539, "epoch": 4560} {"train_loss": -7.285434722900391, "global_step": 191540, "epoch": 4560} {"train_loss": -7.018651962280273, "global_step": 191541, "epoch": 4560} {"train_loss": -7.182595252990723, "global_step": 191542, "epoch": 4560} {"train_loss": -7.149197578430176, "global_step": 191543, "epoch": 4560} {"train_loss": -7.157232761383057, "global_step": 191544, "epoch": 4560} {"train_loss": -7.105323791503906, "global_step": 191545, "epoch": 4560} {"train_loss": -7.203128814697266, "global_step": 191546, "epoch": 4560} {"train_loss": -7.03049373626709, "global_step": 191547, "epoch": 4560} {"train_loss": -7.288098335266113, "global_step": 191548, "epoch": 4560} {"train_loss": -7.131520748138428, "global_step": 191549, "epoch": 4560} {"train_loss": -7.152883052825928, "global_step": 191550, "epoch": 4560} {"train_loss": -7.190280914306641, "global_step": 191551, "epoch": 4560} {"train_loss": -7.139727592468262, "global_step": 191552, "epoch": 4560} {"train_loss": -7.116642951965332, "global_step": 191553, "epoch": 4560} {"train_loss": -7.0091986656188965, "global_step": 191554, "epoch": 4560} {"train_loss": -7.17136287689209, "global_step": 191555, "epoch": 4560} {"train_loss": -7.123312950134277, "global_step": 191556, "epoch": 4560} {"train_loss": -7.1433000564575195, "global_step": 191557, "epoch": 4560} {"train_loss": -7.114440441131592, "global_step": 191558, "epoch": 4560} {"train_loss": -7.270212173461914, "global_step": 191559, "epoch": 4560} {"train_loss": -7.2932891845703125, "global_step": 191560, "epoch": 4560} {"train_loss": -7.181995017187936, "global_step": 191561, "epoch": 4560, "val_loss": 81170.8046875} {"train_loss": -7.144265174865723, "global_step": 191562, "epoch": 4561} {"train_loss": -7.173978805541992, "global_step": 191563, "epoch": 4561} {"train_loss": -7.369144439697266, "global_step": 191564, "epoch": 4561} {"train_loss": -7.244237899780273, "global_step": 191565, "epoch": 4561} {"train_loss": -7.263323783874512, "global_step": 191566, "epoch": 4561} {"train_loss": -7.245089530944824, "global_step": 191567, "epoch": 4561} {"train_loss": -7.296597480773926, "global_step": 191568, "epoch": 4561} {"train_loss": -7.236835479736328, "global_step": 191569, "epoch": 4561} {"train_loss": -7.249558925628662, "global_step": 191570, "epoch": 4561} {"train_loss": -7.19647216796875, "global_step": 191571, "epoch": 4561} {"train_loss": -7.313891410827637, "global_step": 191572, "epoch": 4561} {"train_loss": -7.304366111755371, "global_step": 191573, "epoch": 4561} {"train_loss": -7.298803329467773, "global_step": 191574, "epoch": 4561} {"train_loss": -7.34883451461792, "global_step": 191575, "epoch": 4561} {"train_loss": -7.221787452697754, "global_step": 191576, "epoch": 4561} {"train_loss": -7.157138347625732, "global_step": 191577, "epoch": 4561} {"train_loss": -7.279752731323242, "global_step": 191578, "epoch": 4561} {"train_loss": -7.3271589279174805, "global_step": 191579, "epoch": 4561} {"train_loss": -7.343623161315918, "global_step": 191580, "epoch": 4561} {"train_loss": -7.27765417098999, "global_step": 191581, "epoch": 4561} {"train_loss": -7.30429220199585, "global_step": 191582, "epoch": 4561} {"train_loss": -7.239625930786133, "global_step": 191583, "epoch": 4561} {"train_loss": -7.357656002044678, "global_step": 191584, "epoch": 4561} {"train_loss": -7.271145820617676, "global_step": 191585, "epoch": 4561} {"train_loss": -7.148013114929199, "global_step": 191586, "epoch": 4561} {"train_loss": -7.317744255065918, "global_step": 191587, "epoch": 4561} {"train_loss": -7.318939208984375, "global_step": 191588, "epoch": 4561} {"train_loss": -7.21512508392334, "global_step": 191589, "epoch": 4561} {"train_loss": -7.123332977294922, "global_step": 191590, "epoch": 4561} {"train_loss": -7.289793014526367, "global_step": 191591, "epoch": 4561} {"train_loss": -7.2038164138793945, "global_step": 191592, "epoch": 4561} {"train_loss": -7.2841668128967285, "global_step": 191593, "epoch": 4561} {"train_loss": -7.208139419555664, "global_step": 191594, "epoch": 4561} {"train_loss": -7.209531784057617, "global_step": 191595, "epoch": 4561} {"train_loss": -7.337520122528076, "global_step": 191596, "epoch": 4561} {"train_loss": -7.253596782684326, "global_step": 191597, "epoch": 4561} {"train_loss": -7.266010761260986, "global_step": 191598, "epoch": 4561} {"train_loss": -7.2035980224609375, "global_step": 191599, "epoch": 4561} {"train_loss": -7.327598571777344, "global_step": 191600, "epoch": 4561} {"train_loss": -7.254883766174316, "global_step": 191601, "epoch": 4561} {"train_loss": -7.20555305480957, "global_step": 191602, "epoch": 4561} {"train_loss": -7.261257875533331, "global_step": 191603, "epoch": 4561, "val_loss": 81177.390625} {"train_loss": -7.233042240142822, "global_step": 191604, "epoch": 4562} {"train_loss": -7.313703536987305, "global_step": 191605, "epoch": 4562} {"train_loss": -7.2760162353515625, "global_step": 191606, "epoch": 4562} {"train_loss": -7.231729507446289, "global_step": 191607, "epoch": 4562} {"train_loss": -7.293061256408691, "global_step": 191608, "epoch": 4562} {"train_loss": -7.181346893310547, "global_step": 191609, "epoch": 4562} {"train_loss": -7.239084243774414, "global_step": 191610, "epoch": 4562} {"train_loss": -7.219209671020508, "global_step": 191611, "epoch": 4562} {"train_loss": -7.303966999053955, "global_step": 191612, "epoch": 4562} {"train_loss": -7.315708160400391, "global_step": 191613, "epoch": 4562} {"train_loss": -7.240900993347168, "global_step": 191614, "epoch": 4562} {"train_loss": -7.204137325286865, "global_step": 191615, "epoch": 4562} {"train_loss": -7.26910400390625, "global_step": 191616, "epoch": 4562} {"train_loss": -7.330526351928711, "global_step": 191617, "epoch": 4562} {"train_loss": -7.3240556716918945, "global_step": 191618, "epoch": 4562} {"train_loss": -7.258715629577637, "global_step": 191619, "epoch": 4562} {"train_loss": -7.254235744476318, "global_step": 191620, "epoch": 4562} {"train_loss": -7.280839920043945, "global_step": 191621, "epoch": 4562} {"train_loss": -7.282254219055176, "global_step": 191622, "epoch": 4562} {"train_loss": -7.006333351135254, "global_step": 191623, "epoch": 4562} {"train_loss": -7.193286895751953, "global_step": 191624, "epoch": 4562} {"train_loss": -7.222241401672363, "global_step": 191625, "epoch": 4562} {"train_loss": -7.140714645385742, "global_step": 191626, "epoch": 4562} {"train_loss": -7.230185508728027, "global_step": 191627, "epoch": 4562} {"train_loss": -7.288580894470215, "global_step": 191628, "epoch": 4562} {"train_loss": -7.236936092376709, "global_step": 191629, "epoch": 4562} {"train_loss": -7.272968292236328, "global_step": 191630, "epoch": 4562} {"train_loss": -7.203850746154785, "global_step": 191631, "epoch": 4562} {"train_loss": -7.215655326843262, "global_step": 191632, "epoch": 4562} {"train_loss": -7.234523773193359, "global_step": 191633, "epoch": 4562} {"train_loss": -7.190122604370117, "global_step": 191634, "epoch": 4562} {"train_loss": -7.358553409576416, "global_step": 191635, "epoch": 4562} {"train_loss": -7.245453834533691, "global_step": 191636, "epoch": 4562} {"train_loss": -7.244152069091797, "global_step": 191637, "epoch": 4562} {"train_loss": -7.333649635314941, "global_step": 191638, "epoch": 4562} {"train_loss": -7.239875793457031, "global_step": 191639, "epoch": 4562} {"train_loss": -7.165510177612305, "global_step": 191640, "epoch": 4562} {"train_loss": -7.262967109680176, "global_step": 191641, "epoch": 4562} {"train_loss": -7.170716285705566, "global_step": 191642, "epoch": 4562} {"train_loss": -7.1335320472717285, "global_step": 191643, "epoch": 4562} {"train_loss": -7.133352756500244, "global_step": 191644, "epoch": 4562} {"train_loss": -7.234294085275559, "global_step": 191645, "epoch": 4562, "val_loss": 81042.9375} {"train_loss": -7.116800785064697, "global_step": 191646, "epoch": 4563} {"train_loss": -7.143623352050781, "global_step": 191647, "epoch": 4563} {"train_loss": -7.188937187194824, "global_step": 191648, "epoch": 4563} {"train_loss": -7.226173400878906, "global_step": 191649, "epoch": 4563} {"train_loss": -7.188156604766846, "global_step": 191650, "epoch": 4563} {"train_loss": -7.180887222290039, "global_step": 191651, "epoch": 4563} {"train_loss": -7.290858268737793, "global_step": 191652, "epoch": 4563} {"train_loss": -7.049162864685059, "global_step": 191653, "epoch": 4563} {"train_loss": -7.206728935241699, "global_step": 191654, "epoch": 4563} {"train_loss": -7.32570743560791, "global_step": 191655, "epoch": 4563} {"train_loss": -7.160567283630371, "global_step": 191656, "epoch": 4563} {"train_loss": -7.12544584274292, "global_step": 191657, "epoch": 4563} {"train_loss": -7.139923095703125, "global_step": 191658, "epoch": 4563} {"train_loss": -7.190576553344727, "global_step": 191659, "epoch": 4563} {"train_loss": -7.23639440536499, "global_step": 191660, "epoch": 4563} {"train_loss": -7.20628023147583, "global_step": 191661, "epoch": 4563} {"train_loss": -7.146270751953125, "global_step": 191662, "epoch": 4563} {"train_loss": -7.173544883728027, "global_step": 191663, "epoch": 4563} {"train_loss": -7.236523628234863, "global_step": 191664, "epoch": 4563} {"train_loss": -7.318119049072266, "global_step": 191665, "epoch": 4563} {"train_loss": -7.281461238861084, "global_step": 191666, "epoch": 4563} {"train_loss": -7.234424114227295, "global_step": 191667, "epoch": 4563} {"train_loss": -7.1738739013671875, "global_step": 191668, "epoch": 4563} {"train_loss": -7.2267656326293945, "global_step": 191669, "epoch": 4563} {"train_loss": -7.372119903564453, "global_step": 191670, "epoch": 4563} {"train_loss": -7.281153678894043, "global_step": 191671, "epoch": 4563} {"train_loss": -7.0736165046691895, "global_step": 191672, "epoch": 4563} {"train_loss": -7.090051174163818, "global_step": 191673, "epoch": 4563} {"train_loss": -7.277596473693848, "global_step": 191674, "epoch": 4563} {"train_loss": -7.205915451049805, "global_step": 191675, "epoch": 4563} {"train_loss": -7.3781538009643555, "global_step": 191676, "epoch": 4563} {"train_loss": -7.158612251281738, "global_step": 191677, "epoch": 4563} {"train_loss": -7.132370948791504, "global_step": 191678, "epoch": 4563} {"train_loss": -7.146020889282227, "global_step": 191679, "epoch": 4563} {"train_loss": -7.159527778625488, "global_step": 191680, "epoch": 4563} {"train_loss": -7.141720771789551, "global_step": 191681, "epoch": 4563} {"train_loss": -7.243429183959961, "global_step": 191682, "epoch": 4563} {"train_loss": -7.232276439666748, "global_step": 191683, "epoch": 4563} {"train_loss": -7.240223407745361, "global_step": 191684, "epoch": 4563} {"train_loss": -7.298511505126953, "global_step": 191685, "epoch": 4563} {"train_loss": -7.288483619689941, "global_step": 191686, "epoch": 4563} {"train_loss": -7.210143554778326, "global_step": 191687, "epoch": 4563, "val_loss": 81106.109375} {"train_loss": -7.23967170715332, "global_step": 191688, "epoch": 4564} {"train_loss": -7.237342834472656, "global_step": 191689, "epoch": 4564} {"train_loss": -7.258889198303223, "global_step": 191690, "epoch": 4564} {"train_loss": -7.2286176681518555, "global_step": 191691, "epoch": 4564} {"train_loss": -7.364560604095459, "global_step": 191692, "epoch": 4564} {"train_loss": -7.229592800140381, "global_step": 191693, "epoch": 4564} {"train_loss": -7.255575656890869, "global_step": 191694, "epoch": 4564} {"train_loss": -7.194511413574219, "global_step": 191695, "epoch": 4564} {"train_loss": -7.287796974182129, "global_step": 191696, "epoch": 4564} {"train_loss": -7.3344292640686035, "global_step": 191697, "epoch": 4564} {"train_loss": -7.3046112060546875, "global_step": 191698, "epoch": 4564} {"train_loss": -7.284692764282227, "global_step": 191699, "epoch": 4564} {"train_loss": -7.331208229064941, "global_step": 191700, "epoch": 4564} {"train_loss": -7.193864822387695, "global_step": 191701, "epoch": 4564} {"train_loss": -7.215590953826904, "global_step": 191702, "epoch": 4564} {"train_loss": -7.386056423187256, "global_step": 191703, "epoch": 4564} {"train_loss": -7.2021026611328125, "global_step": 191704, "epoch": 4564} {"train_loss": -7.092735290527344, "global_step": 191705, "epoch": 4564} {"train_loss": -7.221249580383301, "global_step": 191706, "epoch": 4564} {"train_loss": -7.332552433013916, "global_step": 191707, "epoch": 4564} {"train_loss": -7.1949238777160645, "global_step": 191708, "epoch": 4564} {"train_loss": -7.050274848937988, "global_step": 191709, "epoch": 4564} {"train_loss": -7.246748447418213, "global_step": 191710, "epoch": 4564} {"train_loss": -7.138163089752197, "global_step": 191711, "epoch": 4564} {"train_loss": -7.269611358642578, "global_step": 191712, "epoch": 4564} {"train_loss": -7.284109115600586, "global_step": 191713, "epoch": 4564} {"train_loss": -7.124902248382568, "global_step": 191714, "epoch": 4564} {"train_loss": -7.246413230895996, "global_step": 191715, "epoch": 4564} {"train_loss": -7.250614166259766, "global_step": 191716, "epoch": 4564} {"train_loss": -7.224853515625, "global_step": 191717, "epoch": 4564} {"train_loss": -7.11998176574707, "global_step": 191718, "epoch": 4564} {"train_loss": -7.230711936950684, "global_step": 191719, "epoch": 4564} {"train_loss": -7.168187618255615, "global_step": 191720, "epoch": 4564} {"train_loss": -7.350545883178711, "global_step": 191721, "epoch": 4564} {"train_loss": -7.22477388381958, "global_step": 191722, "epoch": 4564} {"train_loss": -7.075756072998047, "global_step": 191723, "epoch": 4564} {"train_loss": -7.26600980758667, "global_step": 191724, "epoch": 4564} {"train_loss": -7.164894104003906, "global_step": 191725, "epoch": 4564} {"train_loss": -7.168727397918701, "global_step": 191726, "epoch": 4564} {"train_loss": -7.209179401397705, "global_step": 191727, "epoch": 4564} {"train_loss": -7.074776649475098, "global_step": 191728, "epoch": 4564} {"train_loss": -7.226136968249366, "global_step": 191729, "epoch": 4564, "val_loss": 81014.828125} {"train_loss": -7.313632011413574, "global_step": 191730, "epoch": 4565} {"train_loss": -7.129565715789795, "global_step": 191731, "epoch": 4565} {"train_loss": -7.256073951721191, "global_step": 191732, "epoch": 4565} {"train_loss": -7.058441162109375, "global_step": 191733, "epoch": 4565} {"train_loss": -7.1738200187683105, "global_step": 191734, "epoch": 4565} {"train_loss": -7.269423961639404, "global_step": 191735, "epoch": 4565} {"train_loss": -7.159578800201416, "global_step": 191736, "epoch": 4565} {"train_loss": -7.118044376373291, "global_step": 191737, "epoch": 4565} {"train_loss": -7.199257850646973, "global_step": 191738, "epoch": 4565} {"train_loss": -7.25075626373291, "global_step": 191739, "epoch": 4565} {"train_loss": -7.239519119262695, "global_step": 191740, "epoch": 4565} {"train_loss": -7.301892280578613, "global_step": 191741, "epoch": 4565} {"train_loss": -7.380605697631836, "global_step": 191742, "epoch": 4565} {"train_loss": -7.312621593475342, "global_step": 191743, "epoch": 4565} {"train_loss": -7.326803207397461, "global_step": 191744, "epoch": 4565} {"train_loss": -7.342111587524414, "global_step": 191745, "epoch": 4565} {"train_loss": -7.357998847961426, "global_step": 191746, "epoch": 4565} {"train_loss": -7.188908576965332, "global_step": 191747, "epoch": 4565} {"train_loss": -7.305475234985352, "global_step": 191748, "epoch": 4565} {"train_loss": -7.139070510864258, "global_step": 191749, "epoch": 4565} {"train_loss": -7.262361526489258, "global_step": 191750, "epoch": 4565} {"train_loss": -7.375718116760254, "global_step": 191751, "epoch": 4565} {"train_loss": -7.252705097198486, "global_step": 191752, "epoch": 4565} {"train_loss": -7.2857255935668945, "global_step": 191753, "epoch": 4565} {"train_loss": -7.266529083251953, "global_step": 191754, "epoch": 4565} {"train_loss": -7.173558712005615, "global_step": 191755, "epoch": 4565} {"train_loss": -7.196609020233154, "global_step": 191756, "epoch": 4565} {"train_loss": -7.339622974395752, "global_step": 191757, "epoch": 4565} {"train_loss": -7.271234035491943, "global_step": 191758, "epoch": 4565} {"train_loss": -7.164884090423584, "global_step": 191759, "epoch": 4565} {"train_loss": -7.267369747161865, "global_step": 191760, "epoch": 4565} {"train_loss": -7.202220439910889, "global_step": 191761, "epoch": 4565} {"train_loss": -7.229328632354736, "global_step": 191762, "epoch": 4565} {"train_loss": -7.331418991088867, "global_step": 191763, "epoch": 4565} {"train_loss": -7.095884323120117, "global_step": 191764, "epoch": 4565} {"train_loss": -7.13658332824707, "global_step": 191765, "epoch": 4565} {"train_loss": -7.200315475463867, "global_step": 191766, "epoch": 4565} {"train_loss": -7.1456780433654785, "global_step": 191767, "epoch": 4565} {"train_loss": -7.189554214477539, "global_step": 191768, "epoch": 4565} {"train_loss": -7.332954406738281, "global_step": 191769, "epoch": 4565} {"train_loss": -7.157409191131592, "global_step": 191770, "epoch": 4565} {"train_loss": -7.2381842249915715, "global_step": 191771, "epoch": 4565, "val_loss": 81217.859375} {"train_loss": -7.351929664611816, "global_step": 191772, "epoch": 4566} {"train_loss": -7.217787265777588, "global_step": 191773, "epoch": 4566} {"train_loss": -7.197678565979004, "global_step": 191774, "epoch": 4566} {"train_loss": -7.225094318389893, "global_step": 191775, "epoch": 4566} {"train_loss": -7.2607927322387695, "global_step": 191776, "epoch": 4566} {"train_loss": -7.3317975997924805, "global_step": 191777, "epoch": 4566} {"train_loss": -7.277783393859863, "global_step": 191778, "epoch": 4566} {"train_loss": -7.212204933166504, "global_step": 191779, "epoch": 4566} {"train_loss": -7.376506805419922, "global_step": 191780, "epoch": 4566} {"train_loss": -7.202421188354492, "global_step": 191781, "epoch": 4566} {"train_loss": -7.278046607971191, "global_step": 191782, "epoch": 4566} {"train_loss": -7.247598648071289, "global_step": 191783, "epoch": 4566} {"train_loss": -7.196259498596191, "global_step": 191784, "epoch": 4566} {"train_loss": -7.171241283416748, "global_step": 191785, "epoch": 4566} {"train_loss": -7.078714370727539, "global_step": 191786, "epoch": 4566} {"train_loss": -7.173608303070068, "global_step": 191787, "epoch": 4566} {"train_loss": -7.19140625, "global_step": 191788, "epoch": 4566} {"train_loss": -7.058259010314941, "global_step": 191789, "epoch": 4566} {"train_loss": -7.182785987854004, "global_step": 191790, "epoch": 4566} {"train_loss": -7.1504974365234375, "global_step": 191791, "epoch": 4566} {"train_loss": -7.166177749633789, "global_step": 191792, "epoch": 4566} {"train_loss": -7.272787094116211, "global_step": 191793, "epoch": 4566} {"train_loss": -7.218955993652344, "global_step": 191794, "epoch": 4566} {"train_loss": -7.019824028015137, "global_step": 191795, "epoch": 4566} {"train_loss": -7.1288251876831055, "global_step": 191796, "epoch": 4566} {"train_loss": -7.039822101593018, "global_step": 191797, "epoch": 4566} {"train_loss": -7.100202560424805, "global_step": 191798, "epoch": 4566} {"train_loss": -7.075932502746582, "global_step": 191799, "epoch": 4566} {"train_loss": -7.039738655090332, "global_step": 191800, "epoch": 4566} {"train_loss": -7.062911510467529, "global_step": 191801, "epoch": 4566} {"train_loss": -7.077564239501953, "global_step": 191802, "epoch": 4566} {"train_loss": -7.018620491027832, "global_step": 191803, "epoch": 4566} {"train_loss": -7.205103874206543, "global_step": 191804, "epoch": 4566} {"train_loss": -7.107111930847168, "global_step": 191805, "epoch": 4566} {"train_loss": -6.987797737121582, "global_step": 191806, "epoch": 4566} {"train_loss": -7.1304473876953125, "global_step": 191807, "epoch": 4566} {"train_loss": -7.092228889465332, "global_step": 191808, "epoch": 4566} {"train_loss": -7.14863920211792, "global_step": 191809, "epoch": 4566} {"train_loss": -7.116667747497559, "global_step": 191810, "epoch": 4566} {"train_loss": -7.1376471519470215, "global_step": 191811, "epoch": 4566} {"train_loss": -7.139430999755859, "global_step": 191812, "epoch": 4566} {"train_loss": -7.162631591161092, "global_step": 191813, "epoch": 4566, "val_loss": 81100.21875} {"train_loss": -7.071171760559082, "global_step": 191814, "epoch": 4567} {"train_loss": -7.185399055480957, "global_step": 191815, "epoch": 4567} {"train_loss": -7.272832870483398, "global_step": 191816, "epoch": 4567} {"train_loss": -7.186556816101074, "global_step": 191817, "epoch": 4567} {"train_loss": -7.110837459564209, "global_step": 191818, "epoch": 4567} {"train_loss": -7.136122703552246, "global_step": 191819, "epoch": 4567} {"train_loss": -7.218829154968262, "global_step": 191820, "epoch": 4567} {"train_loss": -7.25046443939209, "global_step": 191821, "epoch": 4567} {"train_loss": -7.3112382888793945, "global_step": 191822, "epoch": 4567} {"train_loss": -7.169436931610107, "global_step": 191823, "epoch": 4567} {"train_loss": -7.255453109741211, "global_step": 191824, "epoch": 4567} {"train_loss": -7.172407150268555, "global_step": 191825, "epoch": 4567} {"train_loss": -7.163137435913086, "global_step": 191826, "epoch": 4567} {"train_loss": -7.270872592926025, "global_step": 191827, "epoch": 4567} {"train_loss": -7.1497697830200195, "global_step": 191828, "epoch": 4567} {"train_loss": -7.43054723739624, "global_step": 191829, "epoch": 4567} {"train_loss": -7.326398849487305, "global_step": 191830, "epoch": 4567} {"train_loss": -7.260343551635742, "global_step": 191831, "epoch": 4567} {"train_loss": -7.30145263671875, "global_step": 191832, "epoch": 4567} {"train_loss": -7.270145416259766, "global_step": 191833, "epoch": 4567} {"train_loss": -7.2879557609558105, "global_step": 191834, "epoch": 4567} {"train_loss": -7.239066123962402, "global_step": 191835, "epoch": 4567} {"train_loss": -7.245882511138916, "global_step": 191836, "epoch": 4567} {"train_loss": -7.332162857055664, "global_step": 191837, "epoch": 4567} {"train_loss": -7.162985801696777, "global_step": 191838, "epoch": 4567} {"train_loss": -7.183687210083008, "global_step": 191839, "epoch": 4567} {"train_loss": -7.150073528289795, "global_step": 191840, "epoch": 4567} {"train_loss": -7.3472065925598145, "global_step": 191841, "epoch": 4567} {"train_loss": -7.200437068939209, "global_step": 191842, "epoch": 4567} {"train_loss": -7.313900947570801, "global_step": 191843, "epoch": 4567} {"train_loss": -7.321192264556885, "global_step": 191844, "epoch": 4567} {"train_loss": -7.171998500823975, "global_step": 191845, "epoch": 4567} {"train_loss": -7.342860698699951, "global_step": 191846, "epoch": 4567} {"train_loss": -7.392820358276367, "global_step": 191847, "epoch": 4567} {"train_loss": -7.259210586547852, "global_step": 191848, "epoch": 4567} {"train_loss": -7.290140628814697, "global_step": 191849, "epoch": 4567} {"train_loss": -7.2105302810668945, "global_step": 191850, "epoch": 4567} {"train_loss": -7.2690019607543945, "global_step": 191851, "epoch": 4567} {"train_loss": -7.135684967041016, "global_step": 191852, "epoch": 4567} {"train_loss": -7.321340084075928, "global_step": 191853, "epoch": 4567} {"train_loss": -7.292690277099609, "global_step": 191854, "epoch": 4567} {"train_loss": -7.243086042858305, "global_step": 191855, "epoch": 4567, "val_loss": 81174.59375} {"train_loss": -7.235507011413574, "global_step": 191856, "epoch": 4568} {"train_loss": -7.28182315826416, "global_step": 191857, "epoch": 4568} {"train_loss": -7.323630332946777, "global_step": 191858, "epoch": 4568} {"train_loss": -7.2633161544799805, "global_step": 191859, "epoch": 4568} {"train_loss": -7.305671691894531, "global_step": 191860, "epoch": 4568} {"train_loss": -7.292026042938232, "global_step": 191861, "epoch": 4568} {"train_loss": -7.188241958618164, "global_step": 191862, "epoch": 4568} {"train_loss": -7.237837791442871, "global_step": 191863, "epoch": 4568} {"train_loss": -7.393261909484863, "global_step": 191864, "epoch": 4568} {"train_loss": -7.294771194458008, "global_step": 191865, "epoch": 4568} {"train_loss": -7.218357563018799, "global_step": 191866, "epoch": 4568} {"train_loss": -7.271007061004639, "global_step": 191867, "epoch": 4568} {"train_loss": -7.371107578277588, "global_step": 191868, "epoch": 4568} {"train_loss": -7.202597618103027, "global_step": 191869, "epoch": 4568} {"train_loss": -7.332043647766113, "global_step": 191870, "epoch": 4568} {"train_loss": -7.108929634094238, "global_step": 191871, "epoch": 4568} {"train_loss": -7.210303783416748, "global_step": 191872, "epoch": 4568} {"train_loss": -7.211996078491211, "global_step": 191873, "epoch": 4568} {"train_loss": -7.233489990234375, "global_step": 191874, "epoch": 4568} {"train_loss": -7.051184177398682, "global_step": 191875, "epoch": 4568} {"train_loss": -7.281356334686279, "global_step": 191876, "epoch": 4568} {"train_loss": -7.091168403625488, "global_step": 191877, "epoch": 4568} {"train_loss": -7.143800735473633, "global_step": 191878, "epoch": 4568} {"train_loss": -7.217790126800537, "global_step": 191879, "epoch": 4568} {"train_loss": -7.172366142272949, "global_step": 191880, "epoch": 4568} {"train_loss": -7.115909099578857, "global_step": 191881, "epoch": 4568} {"train_loss": -7.091475963592529, "global_step": 191882, "epoch": 4568} {"train_loss": -7.153775691986084, "global_step": 191883, "epoch": 4568} {"train_loss": -7.125920295715332, "global_step": 191884, "epoch": 4568} {"train_loss": -7.293303966522217, "global_step": 191885, "epoch": 4568} {"train_loss": -7.120507717132568, "global_step": 191886, "epoch": 4568} {"train_loss": -7.234305381774902, "global_step": 191887, "epoch": 4568} {"train_loss": -7.171687126159668, "global_step": 191888, "epoch": 4568} {"train_loss": -7.2104644775390625, "global_step": 191889, "epoch": 4568} {"train_loss": -7.103482246398926, "global_step": 191890, "epoch": 4568} {"train_loss": -7.173122882843018, "global_step": 191891, "epoch": 4568} {"train_loss": -7.185070991516113, "global_step": 191892, "epoch": 4568} {"train_loss": -7.16526985168457, "global_step": 191893, "epoch": 4568} {"train_loss": -7.231758117675781, "global_step": 191894, "epoch": 4568} {"train_loss": -7.2747602462768555, "global_step": 191895, "epoch": 4568} {"train_loss": -7.174248218536377, "global_step": 191896, "epoch": 4568} {"train_loss": -7.215486174538022, "global_step": 191897, "epoch": 4568, "val_loss": 80861.265625} {"train_loss": -7.089931488037109, "global_step": 191898, "epoch": 4569} {"train_loss": -7.270715236663818, "global_step": 191899, "epoch": 4569} {"train_loss": -7.141737461090088, "global_step": 191900, "epoch": 4569} {"train_loss": -7.17500114440918, "global_step": 191901, "epoch": 4569} {"train_loss": -7.183300495147705, "global_step": 191902, "epoch": 4569} {"train_loss": -7.245359420776367, "global_step": 191903, "epoch": 4569} {"train_loss": -7.316446304321289, "global_step": 191904, "epoch": 4569} {"train_loss": -7.177911758422852, "global_step": 191905, "epoch": 4569} {"train_loss": -7.355249404907227, "global_step": 191906, "epoch": 4569} {"train_loss": -7.398589611053467, "global_step": 191907, "epoch": 4569} {"train_loss": -7.24254846572876, "global_step": 191908, "epoch": 4569} {"train_loss": -7.298834800720215, "global_step": 191909, "epoch": 4569} {"train_loss": -7.260725975036621, "global_step": 191910, "epoch": 4569} {"train_loss": -7.183840274810791, "global_step": 191911, "epoch": 4569} {"train_loss": -7.178584098815918, "global_step": 191912, "epoch": 4569} {"train_loss": -7.192941665649414, "global_step": 191913, "epoch": 4569} {"train_loss": -7.265578269958496, "global_step": 191914, "epoch": 4569} {"train_loss": -7.241199970245361, "global_step": 191915, "epoch": 4569} {"train_loss": -7.262105464935303, "global_step": 191916, "epoch": 4569} {"train_loss": -7.1882123947143555, "global_step": 191917, "epoch": 4569} {"train_loss": -7.305992126464844, "global_step": 191918, "epoch": 4569} {"train_loss": -7.258105278015137, "global_step": 191919, "epoch": 4569} {"train_loss": -7.202500343322754, "global_step": 191920, "epoch": 4569} {"train_loss": -7.160688877105713, "global_step": 191921, "epoch": 4569} {"train_loss": -7.2284932136535645, "global_step": 191922, "epoch": 4569} {"train_loss": -7.414083480834961, "global_step": 191923, "epoch": 4569} {"train_loss": -7.30706787109375, "global_step": 191924, "epoch": 4569} {"train_loss": -7.338834762573242, "global_step": 191925, "epoch": 4569} {"train_loss": -7.239639759063721, "global_step": 191926, "epoch": 4569} {"train_loss": -7.290388107299805, "global_step": 191927, "epoch": 4569} {"train_loss": -7.318666934967041, "global_step": 191928, "epoch": 4569} {"train_loss": -7.249374866485596, "global_step": 191929, "epoch": 4569} {"train_loss": -7.2663164138793945, "global_step": 191930, "epoch": 4569} {"train_loss": -7.126795768737793, "global_step": 191931, "epoch": 4569} {"train_loss": -7.23674201965332, "global_step": 191932, "epoch": 4569} {"train_loss": -7.093767166137695, "global_step": 191933, "epoch": 4569} {"train_loss": -7.151636123657227, "global_step": 191934, "epoch": 4569} {"train_loss": -7.2098307609558105, "global_step": 191935, "epoch": 4569} {"train_loss": -7.185268402099609, "global_step": 191936, "epoch": 4569} {"train_loss": -7.080539226531982, "global_step": 191937, "epoch": 4569} {"train_loss": -7.284473419189453, "global_step": 191938, "epoch": 4569} {"train_loss": -7.232608079910278, "global_step": 191939, "epoch": 4569, "val_loss": 81196.6953125} {"train_loss": -7.230778694152832, "global_step": 191940, "epoch": 4570} {"train_loss": -7.10283088684082, "global_step": 191941, "epoch": 4570} {"train_loss": -7.2275824546813965, "global_step": 191942, "epoch": 4570} {"train_loss": -7.323012828826904, "global_step": 191943, "epoch": 4570} {"train_loss": -7.078317642211914, "global_step": 191944, "epoch": 4570} {"train_loss": -7.193117141723633, "global_step": 191945, "epoch": 4570} {"train_loss": -7.079860687255859, "global_step": 191946, "epoch": 4570} {"train_loss": -7.26982307434082, "global_step": 191947, "epoch": 4570} {"train_loss": -7.094273567199707, "global_step": 191948, "epoch": 4570} {"train_loss": -7.165884494781494, "global_step": 191949, "epoch": 4570} {"train_loss": -7.145938873291016, "global_step": 191950, "epoch": 4570} {"train_loss": -7.167863845825195, "global_step": 191951, "epoch": 4570} {"train_loss": -7.131061553955078, "global_step": 191952, "epoch": 4570} {"train_loss": -7.22145938873291, "global_step": 191953, "epoch": 4570} {"train_loss": -7.233996391296387, "global_step": 191954, "epoch": 4570} {"train_loss": -7.266162395477295, "global_step": 191955, "epoch": 4570} {"train_loss": -7.247638702392578, "global_step": 191956, "epoch": 4570} {"train_loss": -7.273688793182373, "global_step": 191957, "epoch": 4570} {"train_loss": -7.206445693969727, "global_step": 191958, "epoch": 4570} {"train_loss": -7.239079475402832, "global_step": 191959, "epoch": 4570} {"train_loss": -7.22932243347168, "global_step": 191960, "epoch": 4570} {"train_loss": -7.276679039001465, "global_step": 191961, "epoch": 4570} {"train_loss": -7.321842193603516, "global_step": 191962, "epoch": 4570} {"train_loss": -7.2496819496154785, "global_step": 191963, "epoch": 4570} {"train_loss": -7.242592811584473, "global_step": 191964, "epoch": 4570} {"train_loss": -7.275589942932129, "global_step": 191965, "epoch": 4570} {"train_loss": -7.268564224243164, "global_step": 191966, "epoch": 4570} {"train_loss": -7.122117519378662, "global_step": 191967, "epoch": 4570} {"train_loss": -7.166037559509277, "global_step": 191968, "epoch": 4570} {"train_loss": -7.174455642700195, "global_step": 191969, "epoch": 4570} {"train_loss": -7.378634452819824, "global_step": 191970, "epoch": 4570} {"train_loss": -7.212728977203369, "global_step": 191971, "epoch": 4570} {"train_loss": -7.305859088897705, "global_step": 191972, "epoch": 4570} {"train_loss": -7.2583537101745605, "global_step": 191973, "epoch": 4570} {"train_loss": -7.173137664794922, "global_step": 191974, "epoch": 4570} {"train_loss": -7.121819496154785, "global_step": 191975, "epoch": 4570} {"train_loss": -7.165299415588379, "global_step": 191976, "epoch": 4570} {"train_loss": -7.250791549682617, "global_step": 191977, "epoch": 4570} {"train_loss": -7.147525787353516, "global_step": 191978, "epoch": 4570} {"train_loss": -7.206015586853027, "global_step": 191979, "epoch": 4570} {"train_loss": -7.271579742431641, "global_step": 191980, "epoch": 4570} {"train_loss": -7.209954693203881, "global_step": 191981, "epoch": 4570, "val_loss": 81085.8359375} {"train_loss": -7.247337341308594, "global_step": 191982, "epoch": 4571} {"train_loss": -7.268917083740234, "global_step": 191983, "epoch": 4571} {"train_loss": -7.252808570861816, "global_step": 191984, "epoch": 4571} {"train_loss": -7.134438991546631, "global_step": 191985, "epoch": 4571} {"train_loss": -7.219605922698975, "global_step": 191986, "epoch": 4571} {"train_loss": -7.1644439697265625, "global_step": 191987, "epoch": 4571} {"train_loss": -7.309408187866211, "global_step": 191988, "epoch": 4571} {"train_loss": -7.197901725769043, "global_step": 191989, "epoch": 4571} {"train_loss": -7.148464202880859, "global_step": 191990, "epoch": 4571} {"train_loss": -7.1611175537109375, "global_step": 191991, "epoch": 4571} {"train_loss": -7.176414966583252, "global_step": 191992, "epoch": 4571} {"train_loss": -7.158577919006348, "global_step": 191993, "epoch": 4571} {"train_loss": -7.237828254699707, "global_step": 191994, "epoch": 4571} {"train_loss": -7.282031536102295, "global_step": 191995, "epoch": 4571} {"train_loss": -7.278114318847656, "global_step": 191996, "epoch": 4571} {"train_loss": -7.316013336181641, "global_step": 191997, "epoch": 4571} {"train_loss": -7.135422229766846, "global_step": 191998, "epoch": 4571} {"train_loss": -7.3068389892578125, "global_step": 191999, "epoch": 4571} {"train_loss": -7.343802452087402, "global_step": 192000, "epoch": 4571} {"train_loss": -7.133449554443359, "global_step": 192001, "epoch": 4571} {"train_loss": -7.270114421844482, "global_step": 192002, "epoch": 4571} {"train_loss": -7.23178768157959, "global_step": 192003, "epoch": 4571} {"train_loss": -7.164921760559082, "global_step": 192004, "epoch": 4571} {"train_loss": -7.212946891784668, "global_step": 192005, "epoch": 4571} {"train_loss": -7.234160423278809, "global_step": 192006, "epoch": 4571} {"train_loss": -7.151236057281494, "global_step": 192007, "epoch": 4571} {"train_loss": -7.277370452880859, "global_step": 192008, "epoch": 4571} {"train_loss": -7.246273040771484, "global_step": 192009, "epoch": 4571} {"train_loss": -7.17624568939209, "global_step": 192010, "epoch": 4571} {"train_loss": -7.198574542999268, "global_step": 192011, "epoch": 4571} {"train_loss": -7.126552104949951, "global_step": 192012, "epoch": 4571} {"train_loss": -7.227373123168945, "global_step": 192013, "epoch": 4571} {"train_loss": -7.285489082336426, "global_step": 192014, "epoch": 4571} {"train_loss": -7.1141357421875, "global_step": 192015, "epoch": 4571} {"train_loss": -7.16775369644165, "global_step": 192016, "epoch": 4571} {"train_loss": -7.169200897216797, "global_step": 192017, "epoch": 4571} {"train_loss": -7.281526565551758, "global_step": 192018, "epoch": 4571} {"train_loss": -7.243483066558838, "global_step": 192019, "epoch": 4571} {"train_loss": -7.3003387451171875, "global_step": 192020, "epoch": 4571} {"train_loss": -7.198047637939453, "global_step": 192021, "epoch": 4571} {"train_loss": -7.262502670288086, "global_step": 192022, "epoch": 4571} {"train_loss": -7.218278566996257, "global_step": 192023, "epoch": 4571, "val_loss": 81026.1640625} {"train_loss": -7.3044257164001465, "global_step": 192024, "epoch": 4572} {"train_loss": -7.225597381591797, "global_step": 192025, "epoch": 4572} {"train_loss": -7.3039984703063965, "global_step": 192026, "epoch": 4572} {"train_loss": -7.140587329864502, "global_step": 192027, "epoch": 4572} {"train_loss": -7.253483772277832, "global_step": 192028, "epoch": 4572} {"train_loss": -7.226800918579102, "global_step": 192029, "epoch": 4572} {"train_loss": -7.076513767242432, "global_step": 192030, "epoch": 4572} {"train_loss": -7.2008562088012695, "global_step": 192031, "epoch": 4572} {"train_loss": -7.167283058166504, "global_step": 192032, "epoch": 4572} {"train_loss": -7.324217796325684, "global_step": 192033, "epoch": 4572} {"train_loss": -7.118507385253906, "global_step": 192034, "epoch": 4572} {"train_loss": -7.171107292175293, "global_step": 192035, "epoch": 4572} {"train_loss": -7.211434364318848, "global_step": 192036, "epoch": 4572} {"train_loss": -7.168308734893799, "global_step": 192037, "epoch": 4572} {"train_loss": -7.196310520172119, "global_step": 192038, "epoch": 4572} {"train_loss": -7.210912227630615, "global_step": 192039, "epoch": 4572} {"train_loss": -7.082067489624023, "global_step": 192040, "epoch": 4572} {"train_loss": -7.290685176849365, "global_step": 192041, "epoch": 4572} {"train_loss": -7.225671768188477, "global_step": 192042, "epoch": 4572} {"train_loss": -7.243495464324951, "global_step": 192043, "epoch": 4572} {"train_loss": -7.28727912902832, "global_step": 192044, "epoch": 4572} {"train_loss": -7.2202301025390625, "global_step": 192045, "epoch": 4572} {"train_loss": -7.249018669128418, "global_step": 192046, "epoch": 4572} {"train_loss": -7.227421760559082, "global_step": 192047, "epoch": 4572} {"train_loss": -7.220917701721191, "global_step": 192048, "epoch": 4572} {"train_loss": -7.210572242736816, "global_step": 192049, "epoch": 4572} {"train_loss": -7.206193923950195, "global_step": 192050, "epoch": 4572} {"train_loss": -7.24029541015625, "global_step": 192051, "epoch": 4572} {"train_loss": -7.289441108703613, "global_step": 192052, "epoch": 4572} {"train_loss": -7.380998134613037, "global_step": 192053, "epoch": 4572} {"train_loss": -7.273221969604492, "global_step": 192054, "epoch": 4572} {"train_loss": -7.343363285064697, "global_step": 192055, "epoch": 4572} {"train_loss": -7.1986236572265625, "global_step": 192056, "epoch": 4572} {"train_loss": -7.221532344818115, "global_step": 192057, "epoch": 4572} {"train_loss": -7.376585006713867, "global_step": 192058, "epoch": 4572} {"train_loss": -7.371161460876465, "global_step": 192059, "epoch": 4572} {"train_loss": -7.2505364418029785, "global_step": 192060, "epoch": 4572} {"train_loss": -7.219322681427002, "global_step": 192061, "epoch": 4572} {"train_loss": -7.347577095031738, "global_step": 192062, "epoch": 4572} {"train_loss": -7.22832727432251, "global_step": 192063, "epoch": 4572} {"train_loss": -7.168997764587402, "global_step": 192064, "epoch": 4572} {"train_loss": -7.233467011224656, "global_step": 192065, "epoch": 4572, "val_loss": 81148.609375} {"train_loss": -7.277569770812988, "global_step": 192066, "epoch": 4573} {"train_loss": -7.113343238830566, "global_step": 192067, "epoch": 4573} {"train_loss": -7.155735969543457, "global_step": 192068, "epoch": 4573} {"train_loss": -7.279988765716553, "global_step": 192069, "epoch": 4573} {"train_loss": -7.2342400550842285, "global_step": 192070, "epoch": 4573} {"train_loss": -7.066559314727783, "global_step": 192071, "epoch": 4573} {"train_loss": -7.18472957611084, "global_step": 192072, "epoch": 4573} {"train_loss": -7.166315078735352, "global_step": 192073, "epoch": 4573} {"train_loss": -7.010111331939697, "global_step": 192074, "epoch": 4573} {"train_loss": -7.218686103820801, "global_step": 192075, "epoch": 4573} {"train_loss": -6.962681293487549, "global_step": 192076, "epoch": 4573} {"train_loss": -6.994458198547363, "global_step": 192077, "epoch": 4573} {"train_loss": -7.1063714027404785, "global_step": 192078, "epoch": 4573} {"train_loss": -6.938652038574219, "global_step": 192079, "epoch": 4573} {"train_loss": -7.1861419677734375, "global_step": 192080, "epoch": 4573} {"train_loss": -7.043156623840332, "global_step": 192081, "epoch": 4573} {"train_loss": -7.1167216300964355, "global_step": 192082, "epoch": 4573} {"train_loss": -7.085871696472168, "global_step": 192083, "epoch": 4573} {"train_loss": -7.056158542633057, "global_step": 192084, "epoch": 4573} {"train_loss": -7.250495910644531, "global_step": 192085, "epoch": 4573} {"train_loss": -7.052864074707031, "global_step": 192086, "epoch": 4573} {"train_loss": -7.253131866455078, "global_step": 192087, "epoch": 4573} {"train_loss": -7.256956577301025, "global_step": 192088, "epoch": 4573} {"train_loss": -7.216343879699707, "global_step": 192089, "epoch": 4573} {"train_loss": -7.228332996368408, "global_step": 192090, "epoch": 4573} {"train_loss": -7.06461238861084, "global_step": 192091, "epoch": 4573} {"train_loss": -7.113656520843506, "global_step": 192092, "epoch": 4573} {"train_loss": -7.005528450012207, "global_step": 192093, "epoch": 4573} {"train_loss": -7.1190595626831055, "global_step": 192094, "epoch": 4573} {"train_loss": -7.072142601013184, "global_step": 192095, "epoch": 4573} {"train_loss": -7.1366682052612305, "global_step": 192096, "epoch": 4573} {"train_loss": -7.2421159744262695, "global_step": 192097, "epoch": 4573} {"train_loss": -7.156694412231445, "global_step": 192098, "epoch": 4573} {"train_loss": -7.241947174072266, "global_step": 192099, "epoch": 4573} {"train_loss": -7.1510443687438965, "global_step": 192100, "epoch": 4573} {"train_loss": -7.241294860839844, "global_step": 192101, "epoch": 4573} {"train_loss": -7.194436073303223, "global_step": 192102, "epoch": 4573} {"train_loss": -7.213448524475098, "global_step": 192103, "epoch": 4573} {"train_loss": -7.320412635803223, "global_step": 192104, "epoch": 4573} {"train_loss": -7.266915798187256, "global_step": 192105, "epoch": 4573} {"train_loss": -7.0970563888549805, "global_step": 192106, "epoch": 4573} {"train_loss": -7.149710291907901, "global_step": 192107, "epoch": 4573, "val_loss": 80871.1875} {"train_loss": -7.255307197570801, "global_step": 192108, "epoch": 4574} {"train_loss": -7.211012840270996, "global_step": 192109, "epoch": 4574} {"train_loss": -7.260397911071777, "global_step": 192110, "epoch": 4574} {"train_loss": -7.261770248413086, "global_step": 192111, "epoch": 4574} {"train_loss": -7.28568172454834, "global_step": 192112, "epoch": 4574} {"train_loss": -7.28177547454834, "global_step": 192113, "epoch": 4574} {"train_loss": -7.186417102813721, "global_step": 192114, "epoch": 4574} {"train_loss": -7.290029525756836, "global_step": 192115, "epoch": 4574} {"train_loss": -7.300536632537842, "global_step": 192116, "epoch": 4574} {"train_loss": -7.198721885681152, "global_step": 192117, "epoch": 4574} {"train_loss": -7.267538547515869, "global_step": 192118, "epoch": 4574} {"train_loss": -7.305958271026611, "global_step": 192119, "epoch": 4574} {"train_loss": -7.254734039306641, "global_step": 192120, "epoch": 4574} {"train_loss": -7.3864641189575195, "global_step": 192121, "epoch": 4574} {"train_loss": -7.415493011474609, "global_step": 192122, "epoch": 4574} {"train_loss": -7.304862976074219, "global_step": 192123, "epoch": 4574} {"train_loss": -7.194294452667236, "global_step": 192124, "epoch": 4574} {"train_loss": -7.316493988037109, "global_step": 192125, "epoch": 4574} {"train_loss": -7.182701110839844, "global_step": 192126, "epoch": 4574} {"train_loss": -7.212558269500732, "global_step": 192127, "epoch": 4574} {"train_loss": -7.2259345054626465, "global_step": 192128, "epoch": 4574} {"train_loss": -7.138145446777344, "global_step": 192129, "epoch": 4574} {"train_loss": -7.047122955322266, "global_step": 192130, "epoch": 4574} {"train_loss": -7.127924919128418, "global_step": 192131, "epoch": 4574} {"train_loss": -7.116718769073486, "global_step": 192132, "epoch": 4574} {"train_loss": -7.155442237854004, "global_step": 192133, "epoch": 4574} {"train_loss": -7.057155132293701, "global_step": 192134, "epoch": 4574} {"train_loss": -7.083271503448486, "global_step": 192135, "epoch": 4574} {"train_loss": -7.277033805847168, "global_step": 192136, "epoch": 4574} {"train_loss": -7.218429088592529, "global_step": 192137, "epoch": 4574} {"train_loss": -7.201016902923584, "global_step": 192138, "epoch": 4574} {"train_loss": -7.165233612060547, "global_step": 192139, "epoch": 4574} {"train_loss": -7.21945858001709, "global_step": 192140, "epoch": 4574} {"train_loss": -7.219286918640137, "global_step": 192141, "epoch": 4574} {"train_loss": -7.216328144073486, "global_step": 192142, "epoch": 4574} {"train_loss": -7.2405290603637695, "global_step": 192143, "epoch": 4574} {"train_loss": -7.167482376098633, "global_step": 192144, "epoch": 4574} {"train_loss": -7.250366687774658, "global_step": 192145, "epoch": 4574} {"train_loss": -7.233198642730713, "global_step": 192146, "epoch": 4574} {"train_loss": -7.242552757263184, "global_step": 192147, "epoch": 4574} {"train_loss": -7.118167877197266, "global_step": 192148, "epoch": 4574} {"train_loss": -7.2205365271795365, "global_step": 192149, "epoch": 4574, "val_loss": 81087.90625} {"train_loss": -7.100403308868408, "global_step": 192150, "epoch": 4575} {"train_loss": -7.194523334503174, "global_step": 192151, "epoch": 4575} {"train_loss": -7.044379234313965, "global_step": 192152, "epoch": 4575} {"train_loss": -7.111808776855469, "global_step": 192153, "epoch": 4575} {"train_loss": -7.160226821899414, "global_step": 192154, "epoch": 4575} {"train_loss": -6.8826398849487305, "global_step": 192155, "epoch": 4575} {"train_loss": -7.177059650421143, "global_step": 192156, "epoch": 4575} {"train_loss": -6.868897438049316, "global_step": 192157, "epoch": 4575} {"train_loss": -7.025208950042725, "global_step": 192158, "epoch": 4575} {"train_loss": -7.244786262512207, "global_step": 192159, "epoch": 4575} {"train_loss": -6.9323225021362305, "global_step": 192160, "epoch": 4575} {"train_loss": -7.064981460571289, "global_step": 192161, "epoch": 4575} {"train_loss": -7.117422103881836, "global_step": 192162, "epoch": 4575} {"train_loss": -7.130313873291016, "global_step": 192163, "epoch": 4575} {"train_loss": -7.072905540466309, "global_step": 192164, "epoch": 4575} {"train_loss": -7.191795349121094, "global_step": 192165, "epoch": 4575} {"train_loss": -6.986166000366211, "global_step": 192166, "epoch": 4575} {"train_loss": -7.162773132324219, "global_step": 192167, "epoch": 4575} {"train_loss": -7.232922554016113, "global_step": 192168, "epoch": 4575} {"train_loss": -7.182229995727539, "global_step": 192169, "epoch": 4575} {"train_loss": -7.116921901702881, "global_step": 192170, "epoch": 4575} {"train_loss": -7.132803440093994, "global_step": 192171, "epoch": 4575} {"train_loss": -7.200873851776123, "global_step": 192172, "epoch": 4575} {"train_loss": -7.2176289558410645, "global_step": 192173, "epoch": 4575} {"train_loss": -7.121628284454346, "global_step": 192174, "epoch": 4575} {"train_loss": -7.225745677947998, "global_step": 192175, "epoch": 4575} {"train_loss": -7.095418930053711, "global_step": 192176, "epoch": 4575} {"train_loss": -7.110257625579834, "global_step": 192177, "epoch": 4575} {"train_loss": -7.187614917755127, "global_step": 192178, "epoch": 4575} {"train_loss": -7.217077255249023, "global_step": 192179, "epoch": 4575} {"train_loss": -7.1476969718933105, "global_step": 192180, "epoch": 4575} {"train_loss": -7.266776084899902, "global_step": 192181, "epoch": 4575} {"train_loss": -7.128113746643066, "global_step": 192182, "epoch": 4575} {"train_loss": -7.335623741149902, "global_step": 192183, "epoch": 4575} {"train_loss": -7.146928310394287, "global_step": 192184, "epoch": 4575} {"train_loss": -7.245948791503906, "global_step": 192185, "epoch": 4575} {"train_loss": -7.1756463050842285, "global_step": 192186, "epoch": 4575} {"train_loss": -7.249085903167725, "global_step": 192187, "epoch": 4575} {"train_loss": -7.255263328552246, "global_step": 192188, "epoch": 4575} {"train_loss": -7.268110275268555, "global_step": 192189, "epoch": 4575} {"train_loss": -7.295923233032227, "global_step": 192190, "epoch": 4575} {"train_loss": -7.150132065727597, "global_step": 192191, "epoch": 4575, "val_loss": 81278.453125} {"train_loss": -7.200529098510742, "global_step": 192192, "epoch": 4576} {"train_loss": -7.242368221282959, "global_step": 192193, "epoch": 4576} {"train_loss": -7.236744403839111, "global_step": 192194, "epoch": 4576} {"train_loss": -7.07572078704834, "global_step": 192195, "epoch": 4576} {"train_loss": -7.208392143249512, "global_step": 192196, "epoch": 4576} {"train_loss": -7.237858772277832, "global_step": 192197, "epoch": 4576} {"train_loss": -7.285576343536377, "global_step": 192198, "epoch": 4576} {"train_loss": -7.233405113220215, "global_step": 192199, "epoch": 4576} {"train_loss": -7.053059101104736, "global_step": 192200, "epoch": 4576} {"train_loss": -7.192187786102295, "global_step": 192201, "epoch": 4576} {"train_loss": -7.089084625244141, "global_step": 192202, "epoch": 4576} {"train_loss": -7.350537300109863, "global_step": 192203, "epoch": 4576} {"train_loss": -7.209023475646973, "global_step": 192204, "epoch": 4576} {"train_loss": -7.112434387207031, "global_step": 192205, "epoch": 4576} {"train_loss": -7.237807273864746, "global_step": 192206, "epoch": 4576} {"train_loss": -7.158097267150879, "global_step": 192207, "epoch": 4576} {"train_loss": -7.278338432312012, "global_step": 192208, "epoch": 4576} {"train_loss": -7.229344844818115, "global_step": 192209, "epoch": 4576} {"train_loss": -7.203973770141602, "global_step": 192210, "epoch": 4576} {"train_loss": -7.216089248657227, "global_step": 192211, "epoch": 4576} {"train_loss": -7.037792682647705, "global_step": 192212, "epoch": 4576} {"train_loss": -7.280085563659668, "global_step": 192213, "epoch": 4576} {"train_loss": -7.176126003265381, "global_step": 192214, "epoch": 4576} {"train_loss": -7.161552429199219, "global_step": 192215, "epoch": 4576} {"train_loss": -7.255457878112793, "global_step": 192216, "epoch": 4576} {"train_loss": -7.1752824783325195, "global_step": 192217, "epoch": 4576} {"train_loss": -7.374915599822998, "global_step": 192218, "epoch": 4576} {"train_loss": -7.1045002937316895, "global_step": 192219, "epoch": 4576} {"train_loss": -7.223697662353516, "global_step": 192220, "epoch": 4576} {"train_loss": -7.1366868019104, "global_step": 192221, "epoch": 4576} {"train_loss": -7.2839508056640625, "global_step": 192222, "epoch": 4576} {"train_loss": -7.162906646728516, "global_step": 192223, "epoch": 4576} {"train_loss": -7.1902947425842285, "global_step": 192224, "epoch": 4576} {"train_loss": -7.117666244506836, "global_step": 192225, "epoch": 4576} {"train_loss": -7.191242694854736, "global_step": 192226, "epoch": 4576} {"train_loss": -7.413606643676758, "global_step": 192227, "epoch": 4576} {"train_loss": -7.224637985229492, "global_step": 192228, "epoch": 4576} {"train_loss": -7.2137346267700195, "global_step": 192229, "epoch": 4576} {"train_loss": -7.290013313293457, "global_step": 192230, "epoch": 4576} {"train_loss": -7.2195234298706055, "global_step": 192231, "epoch": 4576} {"train_loss": -7.325852394104004, "global_step": 192232, "epoch": 4576} {"train_loss": -7.211690403166271, "global_step": 192233, "epoch": 4576, "val_loss": 81254.53125} {"train_loss": -7.314774990081787, "global_step": 192234, "epoch": 4577} {"train_loss": -7.18428897857666, "global_step": 192235, "epoch": 4577} {"train_loss": -7.26054573059082, "global_step": 192236, "epoch": 4577} {"train_loss": -7.277609825134277, "global_step": 192237, "epoch": 4577} {"train_loss": -7.102053642272949, "global_step": 192238, "epoch": 4577} {"train_loss": -7.304316997528076, "global_step": 192239, "epoch": 4577} {"train_loss": -7.214591026306152, "global_step": 192240, "epoch": 4577} {"train_loss": -7.261773109436035, "global_step": 192241, "epoch": 4577} {"train_loss": -7.272472858428955, "global_step": 192242, "epoch": 4577} {"train_loss": -7.3149800300598145, "global_step": 192243, "epoch": 4577} {"train_loss": -7.287891864776611, "global_step": 192244, "epoch": 4577} {"train_loss": -7.314560890197754, "global_step": 192245, "epoch": 4577} {"train_loss": -7.286559104919434, "global_step": 192246, "epoch": 4577} {"train_loss": -7.415914535522461, "global_step": 192247, "epoch": 4577} {"train_loss": -7.2765655517578125, "global_step": 192248, "epoch": 4577} {"train_loss": -7.325117588043213, "global_step": 192249, "epoch": 4577} {"train_loss": -7.345598220825195, "global_step": 192250, "epoch": 4577} {"train_loss": -7.361268520355225, "global_step": 192251, "epoch": 4577} {"train_loss": -7.332794189453125, "global_step": 192252, "epoch": 4577} {"train_loss": -7.253602504730225, "global_step": 192253, "epoch": 4577} {"train_loss": -7.204701900482178, "global_step": 192254, "epoch": 4577} {"train_loss": -7.300073623657227, "global_step": 192255, "epoch": 4577} {"train_loss": -7.29312801361084, "global_step": 192256, "epoch": 4577} {"train_loss": -7.259792327880859, "global_step": 192257, "epoch": 4577} {"train_loss": -7.357942581176758, "global_step": 192258, "epoch": 4577} {"train_loss": -7.3267412185668945, "global_step": 192259, "epoch": 4577} {"train_loss": -7.307247161865234, "global_step": 192260, "epoch": 4577} {"train_loss": -7.168839931488037, "global_step": 192261, "epoch": 4577} {"train_loss": -7.178139686584473, "global_step": 192262, "epoch": 4577} {"train_loss": -7.336825370788574, "global_step": 192263, "epoch": 4577} {"train_loss": -7.176499366760254, "global_step": 192264, "epoch": 4577} {"train_loss": -7.116192817687988, "global_step": 192265, "epoch": 4577} {"train_loss": -7.170646667480469, "global_step": 192266, "epoch": 4577} {"train_loss": -7.228928089141846, "global_step": 192267, "epoch": 4577} {"train_loss": -7.249086856842041, "global_step": 192268, "epoch": 4577} {"train_loss": -7.185542106628418, "global_step": 192269, "epoch": 4577} {"train_loss": -7.229391098022461, "global_step": 192270, "epoch": 4577} {"train_loss": -7.2886552810668945, "global_step": 192271, "epoch": 4577} {"train_loss": -7.072757720947266, "global_step": 192272, "epoch": 4577} {"train_loss": -7.276712894439697, "global_step": 192273, "epoch": 4577} {"train_loss": -7.224156379699707, "global_step": 192274, "epoch": 4577} {"train_loss": -7.257069383348737, "global_step": 192275, "epoch": 4577, "val_loss": 81164.4921875} {"train_loss": -7.174581527709961, "global_step": 192276, "epoch": 4578} {"train_loss": -7.068016052246094, "global_step": 192277, "epoch": 4578} {"train_loss": -7.066876411437988, "global_step": 192278, "epoch": 4578} {"train_loss": -7.2310872077941895, "global_step": 192279, "epoch": 4578} {"train_loss": -7.104021072387695, "global_step": 192280, "epoch": 4578} {"train_loss": -7.132905006408691, "global_step": 192281, "epoch": 4578} {"train_loss": -7.153049945831299, "global_step": 192282, "epoch": 4578} {"train_loss": -7.271997451782227, "global_step": 192283, "epoch": 4578} {"train_loss": -7.08287239074707, "global_step": 192284, "epoch": 4578} {"train_loss": -7.171794891357422, "global_step": 192285, "epoch": 4578} {"train_loss": -7.1433515548706055, "global_step": 192286, "epoch": 4578} {"train_loss": -7.257497787475586, "global_step": 192287, "epoch": 4578} {"train_loss": -7.204866886138916, "global_step": 192288, "epoch": 4578} {"train_loss": -7.257358551025391, "global_step": 192289, "epoch": 4578} {"train_loss": -7.194087982177734, "global_step": 192290, "epoch": 4578} {"train_loss": -7.2391510009765625, "global_step": 192291, "epoch": 4578} {"train_loss": -7.258975505828857, "global_step": 192292, "epoch": 4578} {"train_loss": -7.277799606323242, "global_step": 192293, "epoch": 4578} {"train_loss": -7.170838832855225, "global_step": 192294, "epoch": 4578} {"train_loss": -7.173733234405518, "global_step": 192295, "epoch": 4578} {"train_loss": -7.181524753570557, "global_step": 192296, "epoch": 4578} {"train_loss": -7.2371826171875, "global_step": 192297, "epoch": 4578} {"train_loss": -7.209752559661865, "global_step": 192298, "epoch": 4578} {"train_loss": -7.270166873931885, "global_step": 192299, "epoch": 4578} {"train_loss": -7.258816719055176, "global_step": 192300, "epoch": 4578} {"train_loss": -7.158454418182373, "global_step": 192301, "epoch": 4578} {"train_loss": -7.1906561851501465, "global_step": 192302, "epoch": 4578} {"train_loss": -7.256915092468262, "global_step": 192303, "epoch": 4578} {"train_loss": -7.096632480621338, "global_step": 192304, "epoch": 4578} {"train_loss": -7.119743347167969, "global_step": 192305, "epoch": 4578} {"train_loss": -7.144644737243652, "global_step": 192306, "epoch": 4578} {"train_loss": -7.1668524742126465, "global_step": 192307, "epoch": 4578} {"train_loss": -7.392975807189941, "global_step": 192308, "epoch": 4578} {"train_loss": -7.197786331176758, "global_step": 192309, "epoch": 4578} {"train_loss": -7.163348197937012, "global_step": 192310, "epoch": 4578} {"train_loss": -7.248720169067383, "global_step": 192311, "epoch": 4578} {"train_loss": -7.123122692108154, "global_step": 192312, "epoch": 4578} {"train_loss": -7.263095855712891, "global_step": 192313, "epoch": 4578} {"train_loss": -7.073653697967529, "global_step": 192314, "epoch": 4578} {"train_loss": -7.112002849578857, "global_step": 192315, "epoch": 4578} {"train_loss": -7.090487480163574, "global_step": 192316, "epoch": 4578} {"train_loss": -7.181979168029058, "global_step": 192317, "epoch": 4578, "val_loss": 80977.90625} {"train_loss": -7.067949295043945, "global_step": 192318, "epoch": 4579} {"train_loss": -7.070145606994629, "global_step": 192319, "epoch": 4579} {"train_loss": -7.134958267211914, "global_step": 192320, "epoch": 4579} {"train_loss": -7.1655707359313965, "global_step": 192321, "epoch": 4579} {"train_loss": -7.267847061157227, "global_step": 192322, "epoch": 4579} {"train_loss": -7.192474365234375, "global_step": 192323, "epoch": 4579} {"train_loss": -7.198904514312744, "global_step": 192324, "epoch": 4579} {"train_loss": -7.190168380737305, "global_step": 192325, "epoch": 4579} {"train_loss": -7.238799571990967, "global_step": 192326, "epoch": 4579} {"train_loss": -7.2605791091918945, "global_step": 192327, "epoch": 4579} {"train_loss": -7.238397598266602, "global_step": 192328, "epoch": 4579} {"train_loss": -7.234071254730225, "global_step": 192329, "epoch": 4579} {"train_loss": -7.350918769836426, "global_step": 192330, "epoch": 4579} {"train_loss": -7.257915019989014, "global_step": 192331, "epoch": 4579} {"train_loss": -7.177022457122803, "global_step": 192332, "epoch": 4579} {"train_loss": -7.09291934967041, "global_step": 192333, "epoch": 4579} {"train_loss": -7.169213771820068, "global_step": 192334, "epoch": 4579} {"train_loss": -7.246164321899414, "global_step": 192335, "epoch": 4579} {"train_loss": -7.188972473144531, "global_step": 192336, "epoch": 4579} {"train_loss": -7.226562976837158, "global_step": 192337, "epoch": 4579} {"train_loss": -7.292670249938965, "global_step": 192338, "epoch": 4579} {"train_loss": -7.262619972229004, "global_step": 192339, "epoch": 4579} {"train_loss": -7.276185989379883, "global_step": 192340, "epoch": 4579} {"train_loss": -7.324145793914795, "global_step": 192341, "epoch": 4579} {"train_loss": -7.292346954345703, "global_step": 192342, "epoch": 4579} {"train_loss": -7.291049957275391, "global_step": 192343, "epoch": 4579} {"train_loss": -7.19473934173584, "global_step": 192344, "epoch": 4579} {"train_loss": -7.330820083618164, "global_step": 192345, "epoch": 4579} {"train_loss": -7.239867210388184, "global_step": 192346, "epoch": 4579} {"train_loss": -7.340724468231201, "global_step": 192347, "epoch": 4579} {"train_loss": -7.1414079666137695, "global_step": 192348, "epoch": 4579} {"train_loss": -7.311507225036621, "global_step": 192349, "epoch": 4579} {"train_loss": -7.22091007232666, "global_step": 192350, "epoch": 4579} {"train_loss": -7.18428897857666, "global_step": 192351, "epoch": 4579} {"train_loss": -7.313606262207031, "global_step": 192352, "epoch": 4579} {"train_loss": -7.245870590209961, "global_step": 192353, "epoch": 4579} {"train_loss": -7.23655891418457, "global_step": 192354, "epoch": 4579} {"train_loss": -7.268489837646484, "global_step": 192355, "epoch": 4579} {"train_loss": -7.3091888427734375, "global_step": 192356, "epoch": 4579} {"train_loss": -7.208375930786133, "global_step": 192357, "epoch": 4579} {"train_loss": -7.2533955574035645, "global_step": 192358, "epoch": 4579} {"train_loss": -7.230148394902547, "global_step": 192359, "epoch": 4579, "val_loss": 81149.921875} {"train_loss": -7.304570198059082, "global_step": 192360, "epoch": 4580} {"train_loss": -7.260077476501465, "global_step": 192361, "epoch": 4580} {"train_loss": -7.218871116638184, "global_step": 192362, "epoch": 4580} {"train_loss": -7.305920600891113, "global_step": 192363, "epoch": 4580} {"train_loss": -7.182013511657715, "global_step": 192364, "epoch": 4580} {"train_loss": -7.226353645324707, "global_step": 192365, "epoch": 4580} {"train_loss": -7.182682991027832, "global_step": 192366, "epoch": 4580} {"train_loss": -7.137810707092285, "global_step": 192367, "epoch": 4580} {"train_loss": -7.1923933029174805, "global_step": 192368, "epoch": 4580} {"train_loss": -7.208217620849609, "global_step": 192369, "epoch": 4580} {"train_loss": -7.248578071594238, "global_step": 192370, "epoch": 4580} {"train_loss": -7.158558368682861, "global_step": 192371, "epoch": 4580} {"train_loss": -7.069997787475586, "global_step": 192372, "epoch": 4580} {"train_loss": -7.120903491973877, "global_step": 192373, "epoch": 4580} {"train_loss": -7.272438049316406, "global_step": 192374, "epoch": 4580} {"train_loss": -7.125008583068848, "global_step": 192375, "epoch": 4580} {"train_loss": -7.323792934417725, "global_step": 192376, "epoch": 4580} {"train_loss": -7.268382549285889, "global_step": 192377, "epoch": 4580} {"train_loss": -7.153185844421387, "global_step": 192378, "epoch": 4580} {"train_loss": -7.213343620300293, "global_step": 192379, "epoch": 4580} {"train_loss": -7.2506842613220215, "global_step": 192380, "epoch": 4580} {"train_loss": -7.174970626831055, "global_step": 192381, "epoch": 4580} {"train_loss": -7.163655757904053, "global_step": 192382, "epoch": 4580} {"train_loss": -7.2360124588012695, "global_step": 192383, "epoch": 4580} {"train_loss": -7.164297103881836, "global_step": 192384, "epoch": 4580} {"train_loss": -7.24472188949585, "global_step": 192385, "epoch": 4580} {"train_loss": -7.269960880279541, "global_step": 192386, "epoch": 4580} {"train_loss": -7.2107391357421875, "global_step": 192387, "epoch": 4580} {"train_loss": -7.274926662445068, "global_step": 192388, "epoch": 4580} {"train_loss": -7.2175421714782715, "global_step": 192389, "epoch": 4580} {"train_loss": -7.17244291305542, "global_step": 192390, "epoch": 4580} {"train_loss": -7.1410136222839355, "global_step": 192391, "epoch": 4580} {"train_loss": -7.275118350982666, "global_step": 192392, "epoch": 4580} {"train_loss": -7.236263275146484, "global_step": 192393, "epoch": 4580} {"train_loss": -7.224188804626465, "global_step": 192394, "epoch": 4580} {"train_loss": -7.2453718185424805, "global_step": 192395, "epoch": 4580} {"train_loss": -7.220193862915039, "global_step": 192396, "epoch": 4580} {"train_loss": -7.279285430908203, "global_step": 192397, "epoch": 4580} {"train_loss": -7.2241082191467285, "global_step": 192398, "epoch": 4580} {"train_loss": -7.240146636962891, "global_step": 192399, "epoch": 4580} {"train_loss": -7.1656341552734375, "global_step": 192400, "epoch": 4580} {"train_loss": -7.214343627293904, "global_step": 192401, "epoch": 4580, "val_loss": 81047.2734375} {"train_loss": -7.201983451843262, "global_step": 192402, "epoch": 4581} {"train_loss": -7.237301826477051, "global_step": 192403, "epoch": 4581} {"train_loss": -7.280068874359131, "global_step": 192404, "epoch": 4581} {"train_loss": -7.336485385894775, "global_step": 192405, "epoch": 4581} {"train_loss": -7.243582248687744, "global_step": 192406, "epoch": 4581} {"train_loss": -7.128620624542236, "global_step": 192407, "epoch": 4581} {"train_loss": -7.225883483886719, "global_step": 192408, "epoch": 4581} {"train_loss": -7.232203960418701, "global_step": 192409, "epoch": 4581} {"train_loss": -7.286689758300781, "global_step": 192410, "epoch": 4581} {"train_loss": -7.181667804718018, "global_step": 192411, "epoch": 4581} {"train_loss": -7.086342811584473, "global_step": 192412, "epoch": 4581} {"train_loss": -7.190218448638916, "global_step": 192413, "epoch": 4581} {"train_loss": -7.1644439697265625, "global_step": 192414, "epoch": 4581} {"train_loss": -7.22269344329834, "global_step": 192415, "epoch": 4581} {"train_loss": -7.324389457702637, "global_step": 192416, "epoch": 4581} {"train_loss": -7.150986671447754, "global_step": 192417, "epoch": 4581} {"train_loss": -7.303283214569092, "global_step": 192418, "epoch": 4581} {"train_loss": -7.264225959777832, "global_step": 192419, "epoch": 4581} {"train_loss": -7.186715126037598, "global_step": 192420, "epoch": 4581} {"train_loss": -7.202372074127197, "global_step": 192421, "epoch": 4581} {"train_loss": -7.244853973388672, "global_step": 192422, "epoch": 4581} {"train_loss": -7.257894515991211, "global_step": 192423, "epoch": 4581} {"train_loss": -7.2619428634643555, "global_step": 192424, "epoch": 4581} {"train_loss": -7.21646785736084, "global_step": 192425, "epoch": 4581} {"train_loss": -7.209304332733154, "global_step": 192426, "epoch": 4581} {"train_loss": -7.350417137145996, "global_step": 192427, "epoch": 4581} {"train_loss": -7.157719135284424, "global_step": 192428, "epoch": 4581} {"train_loss": -7.3286237716674805, "global_step": 192429, "epoch": 4581} {"train_loss": -7.3136749267578125, "global_step": 192430, "epoch": 4581} {"train_loss": -7.230991363525391, "global_step": 192431, "epoch": 4581} {"train_loss": -7.255622863769531, "global_step": 192432, "epoch": 4581} {"train_loss": -7.217576026916504, "global_step": 192433, "epoch": 4581} {"train_loss": -7.329318523406982, "global_step": 192434, "epoch": 4581} {"train_loss": -7.312632083892822, "global_step": 192435, "epoch": 4581} {"train_loss": -7.1800031661987305, "global_step": 192436, "epoch": 4581} {"train_loss": -7.166252136230469, "global_step": 192437, "epoch": 4581} {"train_loss": -7.342206001281738, "global_step": 192438, "epoch": 4581} {"train_loss": -7.231684684753418, "global_step": 192439, "epoch": 4581} {"train_loss": -7.291024208068848, "global_step": 192440, "epoch": 4581} {"train_loss": -7.217770099639893, "global_step": 192441, "epoch": 4581} {"train_loss": -7.24494743347168, "global_step": 192442, "epoch": 4581} {"train_loss": -7.237886769430978, "global_step": 192443, "epoch": 4581, "val_loss": 81272.9375} {"train_loss": -7.2460126876831055, "global_step": 192444, "epoch": 4582} {"train_loss": -7.216056823730469, "global_step": 192445, "epoch": 4582} {"train_loss": -7.151011943817139, "global_step": 192446, "epoch": 4582} {"train_loss": -7.168068885803223, "global_step": 192447, "epoch": 4582} {"train_loss": -7.256627082824707, "global_step": 192448, "epoch": 4582} {"train_loss": -7.104612827301025, "global_step": 192449, "epoch": 4582} {"train_loss": -7.248318195343018, "global_step": 192450, "epoch": 4582} {"train_loss": -7.046980381011963, "global_step": 192451, "epoch": 4582} {"train_loss": -6.9381208419799805, "global_step": 192452, "epoch": 4582} {"train_loss": -7.134560585021973, "global_step": 192453, "epoch": 4582} {"train_loss": -7.237939834594727, "global_step": 192454, "epoch": 4582} {"train_loss": -7.2334065437316895, "global_step": 192455, "epoch": 4582} {"train_loss": -7.073084354400635, "global_step": 192456, "epoch": 4582} {"train_loss": -7.209299087524414, "global_step": 192457, "epoch": 4582} {"train_loss": -7.253713607788086, "global_step": 192458, "epoch": 4582} {"train_loss": -7.145299911499023, "global_step": 192459, "epoch": 4582} {"train_loss": -7.235169410705566, "global_step": 192460, "epoch": 4582} {"train_loss": -7.1653852462768555, "global_step": 192461, "epoch": 4582} {"train_loss": -7.320150852203369, "global_step": 192462, "epoch": 4582} {"train_loss": -7.274128437042236, "global_step": 192463, "epoch": 4582} {"train_loss": -7.192831993103027, "global_step": 192464, "epoch": 4582} {"train_loss": -7.257637977600098, "global_step": 192465, "epoch": 4582} {"train_loss": -7.190767765045166, "global_step": 192466, "epoch": 4582} {"train_loss": -7.239300727844238, "global_step": 192467, "epoch": 4582} {"train_loss": -7.212818622589111, "global_step": 192468, "epoch": 4582} {"train_loss": -7.325249671936035, "global_step": 192469, "epoch": 4582} {"train_loss": -7.307971477508545, "global_step": 192470, "epoch": 4582} {"train_loss": -7.277383804321289, "global_step": 192471, "epoch": 4582} {"train_loss": -7.208931922912598, "global_step": 192472, "epoch": 4582} {"train_loss": -7.204156875610352, "global_step": 192473, "epoch": 4582} {"train_loss": -7.2948222160339355, "global_step": 192474, "epoch": 4582} {"train_loss": -7.341261386871338, "global_step": 192475, "epoch": 4582} {"train_loss": -7.249727725982666, "global_step": 192476, "epoch": 4582} {"train_loss": -7.374879837036133, "global_step": 192477, "epoch": 4582} {"train_loss": -7.141880989074707, "global_step": 192478, "epoch": 4582} {"train_loss": -7.2113566398620605, "global_step": 192479, "epoch": 4582} {"train_loss": -7.067569732666016, "global_step": 192480, "epoch": 4582} {"train_loss": -7.199472904205322, "global_step": 192481, "epoch": 4582} {"train_loss": -7.190051078796387, "global_step": 192482, "epoch": 4582} {"train_loss": -7.1335344314575195, "global_step": 192483, "epoch": 4582} {"train_loss": -7.1905107498168945, "global_step": 192484, "epoch": 4582} {"train_loss": -7.205282495135353, "global_step": 192485, "epoch": 4582, "val_loss": 81458.9609375} {"train_loss": -7.1794514656066895, "global_step": 192486, "epoch": 4583} {"train_loss": -7.283435821533203, "global_step": 192487, "epoch": 4583} {"train_loss": -7.159979820251465, "global_step": 192488, "epoch": 4583} {"train_loss": -7.105133533477783, "global_step": 192489, "epoch": 4583} {"train_loss": -7.145814895629883, "global_step": 192490, "epoch": 4583} {"train_loss": -7.187923431396484, "global_step": 192491, "epoch": 4583} {"train_loss": -7.193220138549805, "global_step": 192492, "epoch": 4583} {"train_loss": -7.219391345977783, "global_step": 192493, "epoch": 4583} {"train_loss": -7.271119117736816, "global_step": 192494, "epoch": 4583} {"train_loss": -7.092394828796387, "global_step": 192495, "epoch": 4583} {"train_loss": -7.138640403747559, "global_step": 192496, "epoch": 4583} {"train_loss": -6.916064262390137, "global_step": 192497, "epoch": 4583} {"train_loss": -7.205966472625732, "global_step": 192498, "epoch": 4583} {"train_loss": -7.174734592437744, "global_step": 192499, "epoch": 4583} {"train_loss": -7.055561065673828, "global_step": 192500, "epoch": 4583} {"train_loss": -7.234872817993164, "global_step": 192501, "epoch": 4583} {"train_loss": -7.0139479637146, "global_step": 192502, "epoch": 4583} {"train_loss": -7.199731826782227, "global_step": 192503, "epoch": 4583} {"train_loss": -7.176021575927734, "global_step": 192504, "epoch": 4583} {"train_loss": -7.060871124267578, "global_step": 192505, "epoch": 4583} {"train_loss": -7.054256916046143, "global_step": 192506, "epoch": 4583} {"train_loss": -7.137696266174316, "global_step": 192507, "epoch": 4583} {"train_loss": -7.09305477142334, "global_step": 192508, "epoch": 4583} {"train_loss": -7.032750129699707, "global_step": 192509, "epoch": 4583} {"train_loss": -7.283828258514404, "global_step": 192510, "epoch": 4583} {"train_loss": -7.1684160232543945, "global_step": 192511, "epoch": 4583} {"train_loss": -7.314164638519287, "global_step": 192512, "epoch": 4583} {"train_loss": -7.147827625274658, "global_step": 192513, "epoch": 4583} {"train_loss": -7.170539379119873, "global_step": 192514, "epoch": 4583} {"train_loss": -7.304440021514893, "global_step": 192515, "epoch": 4583} {"train_loss": -7.176380157470703, "global_step": 192516, "epoch": 4583} {"train_loss": -7.174625396728516, "global_step": 192517, "epoch": 4583} {"train_loss": -7.150704860687256, "global_step": 192518, "epoch": 4583} {"train_loss": -7.239621162414551, "global_step": 192519, "epoch": 4583} {"train_loss": -7.181723117828369, "global_step": 192520, "epoch": 4583} {"train_loss": -7.225645065307617, "global_step": 192521, "epoch": 4583} {"train_loss": -7.18816614151001, "global_step": 192522, "epoch": 4583} {"train_loss": -7.2580461502075195, "global_step": 192523, "epoch": 4583} {"train_loss": -7.168403625488281, "global_step": 192524, "epoch": 4583} {"train_loss": -7.224501609802246, "global_step": 192525, "epoch": 4583} {"train_loss": -7.074943542480469, "global_step": 192526, "epoch": 4583} {"train_loss": -7.1644174825577505, "global_step": 192527, "epoch": 4583, "val_loss": 81269.0078125} {"train_loss": -7.119304180145264, "global_step": 192528, "epoch": 4584} {"train_loss": -7.229849338531494, "global_step": 192529, "epoch": 4584} {"train_loss": -7.151492595672607, "global_step": 192530, "epoch": 4584} {"train_loss": -7.260944366455078, "global_step": 192531, "epoch": 4584} {"train_loss": -7.276175022125244, "global_step": 192532, "epoch": 4584} {"train_loss": -7.061060428619385, "global_step": 192533, "epoch": 4584} {"train_loss": -7.382752418518066, "global_step": 192534, "epoch": 4584} {"train_loss": -7.146413803100586, "global_step": 192535, "epoch": 4584} {"train_loss": -7.314831256866455, "global_step": 192536, "epoch": 4584} {"train_loss": -7.127982139587402, "global_step": 192537, "epoch": 4584} {"train_loss": -7.306276321411133, "global_step": 192538, "epoch": 4584} {"train_loss": -7.179223537445068, "global_step": 192539, "epoch": 4584} {"train_loss": -7.282985687255859, "global_step": 192540, "epoch": 4584} {"train_loss": -7.311959266662598, "global_step": 192541, "epoch": 4584} {"train_loss": -7.232814788818359, "global_step": 192542, "epoch": 4584} {"train_loss": -7.230038642883301, "global_step": 192543, "epoch": 4584} {"train_loss": -7.274314880371094, "global_step": 192544, "epoch": 4584} {"train_loss": -7.252877235412598, "global_step": 192545, "epoch": 4584} {"train_loss": -7.241223335266113, "global_step": 192546, "epoch": 4584} {"train_loss": -7.31876277923584, "global_step": 192547, "epoch": 4584} {"train_loss": -7.162665367126465, "global_step": 192548, "epoch": 4584} {"train_loss": -7.302770137786865, "global_step": 192549, "epoch": 4584} {"train_loss": -7.224855422973633, "global_step": 192550, "epoch": 4584} {"train_loss": -7.321345329284668, "global_step": 192551, "epoch": 4584} {"train_loss": -7.223379611968994, "global_step": 192552, "epoch": 4584} {"train_loss": -7.372198104858398, "global_step": 192553, "epoch": 4584} {"train_loss": -7.132837295532227, "global_step": 192554, "epoch": 4584} {"train_loss": -7.282943248748779, "global_step": 192555, "epoch": 4584} {"train_loss": -7.2265729904174805, "global_step": 192556, "epoch": 4584} {"train_loss": -7.199257850646973, "global_step": 192557, "epoch": 4584} {"train_loss": -7.2742815017700195, "global_step": 192558, "epoch": 4584} {"train_loss": -7.241214752197266, "global_step": 192559, "epoch": 4584} {"train_loss": -7.288227558135986, "global_step": 192560, "epoch": 4584} {"train_loss": -7.095885276794434, "global_step": 192561, "epoch": 4584} {"train_loss": -7.13702392578125, "global_step": 192562, "epoch": 4584} {"train_loss": -7.309447288513184, "global_step": 192563, "epoch": 4584} {"train_loss": -7.175869941711426, "global_step": 192564, "epoch": 4584} {"train_loss": -7.277132987976074, "global_step": 192565, "epoch": 4584} {"train_loss": -7.291303634643555, "global_step": 192566, "epoch": 4584} {"train_loss": -7.257550239562988, "global_step": 192567, "epoch": 4584} {"train_loss": -7.219655990600586, "global_step": 192568, "epoch": 4584} {"train_loss": -7.236091182345436, "global_step": 192569, "epoch": 4584, "val_loss": 80985.9453125} {"train_loss": -7.3187947273254395, "global_step": 192570, "epoch": 4585} {"train_loss": -7.266094207763672, "global_step": 192571, "epoch": 4585} {"train_loss": -7.271884918212891, "global_step": 192572, "epoch": 4585} {"train_loss": -7.269044399261475, "global_step": 192573, "epoch": 4585} {"train_loss": -7.283214092254639, "global_step": 192574, "epoch": 4585} {"train_loss": -7.323507308959961, "global_step": 192575, "epoch": 4585} {"train_loss": -7.195777416229248, "global_step": 192576, "epoch": 4585} {"train_loss": -7.1623640060424805, "global_step": 192577, "epoch": 4585} {"train_loss": -7.253047466278076, "global_step": 192578, "epoch": 4585} {"train_loss": -7.369549751281738, "global_step": 192579, "epoch": 4585} {"train_loss": -7.343543529510498, "global_step": 192580, "epoch": 4585} {"train_loss": -7.228577613830566, "global_step": 192581, "epoch": 4585} {"train_loss": -7.2537841796875, "global_step": 192582, "epoch": 4585} {"train_loss": -7.2821044921875, "global_step": 192583, "epoch": 4585} {"train_loss": -7.171059608459473, "global_step": 192584, "epoch": 4585} {"train_loss": -7.060900688171387, "global_step": 192585, "epoch": 4585} {"train_loss": -7.277582168579102, "global_step": 192586, "epoch": 4585} {"train_loss": -7.189200401306152, "global_step": 192587, "epoch": 4585} {"train_loss": -7.100908279418945, "global_step": 192588, "epoch": 4585} {"train_loss": -7.227334976196289, "global_step": 192589, "epoch": 4585} {"train_loss": -7.112506866455078, "global_step": 192590, "epoch": 4585} {"train_loss": -7.023224830627441, "global_step": 192591, "epoch": 4585} {"train_loss": -7.268280982971191, "global_step": 192592, "epoch": 4585} {"train_loss": -7.161871910095215, "global_step": 192593, "epoch": 4585} {"train_loss": -7.076005458831787, "global_step": 192594, "epoch": 4585} {"train_loss": -7.260489463806152, "global_step": 192595, "epoch": 4585} {"train_loss": -7.2328290939331055, "global_step": 192596, "epoch": 4585} {"train_loss": -7.221731185913086, "global_step": 192597, "epoch": 4585} {"train_loss": -7.320539474487305, "global_step": 192598, "epoch": 4585} {"train_loss": -7.115148544311523, "global_step": 192599, "epoch": 4585} {"train_loss": -7.26652717590332, "global_step": 192600, "epoch": 4585} {"train_loss": -7.275153160095215, "global_step": 192601, "epoch": 4585} {"train_loss": -7.225856781005859, "global_step": 192602, "epoch": 4585} {"train_loss": -7.204867839813232, "global_step": 192603, "epoch": 4585} {"train_loss": -7.212202072143555, "global_step": 192604, "epoch": 4585} {"train_loss": -7.302013397216797, "global_step": 192605, "epoch": 4585} {"train_loss": -7.237349987030029, "global_step": 192606, "epoch": 4585} {"train_loss": -7.28516960144043, "global_step": 192607, "epoch": 4585} {"train_loss": -7.166045188903809, "global_step": 192608, "epoch": 4585} {"train_loss": -7.237534523010254, "global_step": 192609, "epoch": 4585} {"train_loss": -7.198128700256348, "global_step": 192610, "epoch": 4585} {"train_loss": -7.224828663326445, "global_step": 192611, "epoch": 4585, "val_loss": 81420.421875} {"train_loss": -7.127102851867676, "global_step": 192612, "epoch": 4586} {"train_loss": -7.30996561050415, "global_step": 192613, "epoch": 4586} {"train_loss": -7.161636829376221, "global_step": 192614, "epoch": 4586} {"train_loss": -7.264777183532715, "global_step": 192615, "epoch": 4586} {"train_loss": -7.260514259338379, "global_step": 192616, "epoch": 4586} {"train_loss": -7.208078384399414, "global_step": 192617, "epoch": 4586} {"train_loss": -7.195944786071777, "global_step": 192618, "epoch": 4586} {"train_loss": -7.188724517822266, "global_step": 192619, "epoch": 4586} {"train_loss": -7.262630462646484, "global_step": 192620, "epoch": 4586} {"train_loss": -7.272828102111816, "global_step": 192621, "epoch": 4586} {"train_loss": -7.293895721435547, "global_step": 192622, "epoch": 4586} {"train_loss": -7.2648515701293945, "global_step": 192623, "epoch": 4586} {"train_loss": -7.261878967285156, "global_step": 192624, "epoch": 4586} {"train_loss": -7.172028541564941, "global_step": 192625, "epoch": 4586} {"train_loss": -7.218291282653809, "global_step": 192626, "epoch": 4586} {"train_loss": -7.376748085021973, "global_step": 192627, "epoch": 4586} {"train_loss": -7.307316780090332, "global_step": 192628, "epoch": 4586} {"train_loss": -7.238208770751953, "global_step": 192629, "epoch": 4586} {"train_loss": -7.264893531799316, "global_step": 192630, "epoch": 4586} {"train_loss": -7.423215389251709, "global_step": 192631, "epoch": 4586} {"train_loss": -7.261102676391602, "global_step": 192632, "epoch": 4586} {"train_loss": -7.2487688064575195, "global_step": 192633, "epoch": 4586} {"train_loss": -7.244542598724365, "global_step": 192634, "epoch": 4586} {"train_loss": -7.224287033081055, "global_step": 192635, "epoch": 4586} {"train_loss": -7.323695182800293, "global_step": 192636, "epoch": 4586} {"train_loss": -7.259249687194824, "global_step": 192637, "epoch": 4586} {"train_loss": -7.25090217590332, "global_step": 192638, "epoch": 4586} {"train_loss": -7.315008163452148, "global_step": 192639, "epoch": 4586} {"train_loss": -7.268988609313965, "global_step": 192640, "epoch": 4586} {"train_loss": -7.297177314758301, "global_step": 192641, "epoch": 4586} {"train_loss": -7.299211025238037, "global_step": 192642, "epoch": 4586} {"train_loss": -7.3547515869140625, "global_step": 192643, "epoch": 4586} {"train_loss": -7.250181674957275, "global_step": 192644, "epoch": 4586} {"train_loss": -7.346416473388672, "global_step": 192645, "epoch": 4586} {"train_loss": -7.336291313171387, "global_step": 192646, "epoch": 4586} {"train_loss": -7.23689603805542, "global_step": 192647, "epoch": 4586} {"train_loss": -7.2673139572143555, "global_step": 192648, "epoch": 4586} {"train_loss": -7.237709999084473, "global_step": 192649, "epoch": 4586} {"train_loss": -7.322094440460205, "global_step": 192650, "epoch": 4586} {"train_loss": -7.348250865936279, "global_step": 192651, "epoch": 4586} {"train_loss": -7.203171253204346, "global_step": 192652, "epoch": 4586} {"train_loss": -7.266308909370785, "global_step": 192653, "epoch": 4586, "val_loss": 81045.9140625} {"train_loss": -7.370091438293457, "global_step": 192654, "epoch": 4587} {"train_loss": -7.384021759033203, "global_step": 192655, "epoch": 4587} {"train_loss": -7.2937331199646, "global_step": 192656, "epoch": 4587} {"train_loss": -7.277805328369141, "global_step": 192657, "epoch": 4587} {"train_loss": -7.228402137756348, "global_step": 192658, "epoch": 4587} {"train_loss": -7.305329322814941, "global_step": 192659, "epoch": 4587} {"train_loss": -7.267204284667969, "global_step": 192660, "epoch": 4587} {"train_loss": -7.407684326171875, "global_step": 192661, "epoch": 4587} {"train_loss": -7.281506538391113, "global_step": 192662, "epoch": 4587} {"train_loss": -7.316216468811035, "global_step": 192663, "epoch": 4587} {"train_loss": -7.333959579467773, "global_step": 192664, "epoch": 4587} {"train_loss": -7.222116947174072, "global_step": 192665, "epoch": 4587} {"train_loss": -7.266145706176758, "global_step": 192666, "epoch": 4587} {"train_loss": -7.284107208251953, "global_step": 192667, "epoch": 4587} {"train_loss": -7.2621002197265625, "global_step": 192668, "epoch": 4587} {"train_loss": -7.393795967102051, "global_step": 192669, "epoch": 4587} {"train_loss": -7.30435848236084, "global_step": 192670, "epoch": 4587} {"train_loss": -7.233511924743652, "global_step": 192671, "epoch": 4587} {"train_loss": -7.28971004486084, "global_step": 192672, "epoch": 4587} {"train_loss": -7.356419563293457, "global_step": 192673, "epoch": 4587} {"train_loss": -7.203871726989746, "global_step": 192674, "epoch": 4587} {"train_loss": -7.25586462020874, "global_step": 192675, "epoch": 4587} {"train_loss": -7.257742881774902, "global_step": 192676, "epoch": 4587} {"train_loss": -7.286658763885498, "global_step": 192677, "epoch": 4587} {"train_loss": -7.338474750518799, "global_step": 192678, "epoch": 4587} {"train_loss": -7.372703552246094, "global_step": 192679, "epoch": 4587} {"train_loss": -7.293490409851074, "global_step": 192680, "epoch": 4587} {"train_loss": -7.240004539489746, "global_step": 192681, "epoch": 4587} {"train_loss": -7.352161407470703, "global_step": 192682, "epoch": 4587} {"train_loss": -7.25253438949585, "global_step": 192683, "epoch": 4587} {"train_loss": -7.277935028076172, "global_step": 192684, "epoch": 4587} {"train_loss": -7.162467002868652, "global_step": 192685, "epoch": 4587} {"train_loss": -7.3957037925720215, "global_step": 192686, "epoch": 4587} {"train_loss": -7.28891658782959, "global_step": 192687, "epoch": 4587} {"train_loss": -7.172420024871826, "global_step": 192688, "epoch": 4587} {"train_loss": -7.1816301345825195, "global_step": 192689, "epoch": 4587} {"train_loss": -7.208527565002441, "global_step": 192690, "epoch": 4587} {"train_loss": -7.165175437927246, "global_step": 192691, "epoch": 4587} {"train_loss": -7.167871475219727, "global_step": 192692, "epoch": 4587} {"train_loss": -7.20355224609375, "global_step": 192693, "epoch": 4587} {"train_loss": -7.032872200012207, "global_step": 192694, "epoch": 4587} {"train_loss": -7.267080170767648, "global_step": 192695, "epoch": 4587, "val_loss": 81236.53125} {"train_loss": -7.1779937744140625, "global_step": 192696, "epoch": 4588} {"train_loss": -7.064169883728027, "global_step": 192697, "epoch": 4588} {"train_loss": -7.110805511474609, "global_step": 192698, "epoch": 4588} {"train_loss": -7.030308723449707, "global_step": 192699, "epoch": 4588} {"train_loss": -6.969664573669434, "global_step": 192700, "epoch": 4588} {"train_loss": -7.205781936645508, "global_step": 192701, "epoch": 4588} {"train_loss": -6.919795989990234, "global_step": 192702, "epoch": 4588} {"train_loss": -7.140382289886475, "global_step": 192703, "epoch": 4588} {"train_loss": -6.959680557250977, "global_step": 192704, "epoch": 4588} {"train_loss": -7.153685569763184, "global_step": 192705, "epoch": 4588} {"train_loss": -7.16497802734375, "global_step": 192706, "epoch": 4588} {"train_loss": -7.068706035614014, "global_step": 192707, "epoch": 4588} {"train_loss": -7.161267280578613, "global_step": 192708, "epoch": 4588} {"train_loss": -7.033029556274414, "global_step": 192709, "epoch": 4588} {"train_loss": -7.263741493225098, "global_step": 192710, "epoch": 4588} {"train_loss": -7.189822196960449, "global_step": 192711, "epoch": 4588} {"train_loss": -7.15694522857666, "global_step": 192712, "epoch": 4588} {"train_loss": -7.162303924560547, "global_step": 192713, "epoch": 4588} {"train_loss": -7.250576496124268, "global_step": 192714, "epoch": 4588} {"train_loss": -7.206804275512695, "global_step": 192715, "epoch": 4588} {"train_loss": -7.177522659301758, "global_step": 192716, "epoch": 4588} {"train_loss": -7.189113140106201, "global_step": 192717, "epoch": 4588} {"train_loss": -7.185266971588135, "global_step": 192718, "epoch": 4588} {"train_loss": -7.245744228363037, "global_step": 192719, "epoch": 4588} {"train_loss": -7.290044784545898, "global_step": 192720, "epoch": 4588} {"train_loss": -7.2516703605651855, "global_step": 192721, "epoch": 4588} {"train_loss": -7.215069770812988, "global_step": 192722, "epoch": 4588} {"train_loss": -7.234063148498535, "global_step": 192723, "epoch": 4588} {"train_loss": -7.200940132141113, "global_step": 192724, "epoch": 4588} {"train_loss": -7.2510247230529785, "global_step": 192725, "epoch": 4588} {"train_loss": -7.222211837768555, "global_step": 192726, "epoch": 4588} {"train_loss": -7.234450340270996, "global_step": 192727, "epoch": 4588} {"train_loss": -7.290271759033203, "global_step": 192728, "epoch": 4588} {"train_loss": -7.132095813751221, "global_step": 192729, "epoch": 4588} {"train_loss": -7.2046966552734375, "global_step": 192730, "epoch": 4588} {"train_loss": -7.277254581451416, "global_step": 192731, "epoch": 4588} {"train_loss": -7.218064308166504, "global_step": 192732, "epoch": 4588} {"train_loss": -7.239536285400391, "global_step": 192733, "epoch": 4588} {"train_loss": -7.268942832946777, "global_step": 192734, "epoch": 4588} {"train_loss": -7.295351982116699, "global_step": 192735, "epoch": 4588} {"train_loss": -7.309917449951172, "global_step": 192736, "epoch": 4588} {"train_loss": -7.180166562398274, "global_step": 192737, "epoch": 4588, "val_loss": 81169.890625} {"train_loss": -7.298314571380615, "global_step": 192738, "epoch": 4589} {"train_loss": -7.404397487640381, "global_step": 192739, "epoch": 4589} {"train_loss": -7.300246238708496, "global_step": 192740, "epoch": 4589} {"train_loss": -7.371664047241211, "global_step": 192741, "epoch": 4589} {"train_loss": -7.299853324890137, "global_step": 192742, "epoch": 4589} {"train_loss": -7.251047611236572, "global_step": 192743, "epoch": 4589} {"train_loss": -7.258580207824707, "global_step": 192744, "epoch": 4589} {"train_loss": -7.278221607208252, "global_step": 192745, "epoch": 4589} {"train_loss": -7.339566230773926, "global_step": 192746, "epoch": 4589} {"train_loss": -7.207935333251953, "global_step": 192747, "epoch": 4589} {"train_loss": -7.201641082763672, "global_step": 192748, "epoch": 4589} {"train_loss": -7.224298477172852, "global_step": 192749, "epoch": 4589} {"train_loss": -7.180383682250977, "global_step": 192750, "epoch": 4589} {"train_loss": -7.112836837768555, "global_step": 192751, "epoch": 4589} {"train_loss": -7.16074275970459, "global_step": 192752, "epoch": 4589} {"train_loss": -7.014501094818115, "global_step": 192753, "epoch": 4589} {"train_loss": -7.055609703063965, "global_step": 192754, "epoch": 4589} {"train_loss": -7.085031509399414, "global_step": 192755, "epoch": 4589} {"train_loss": -7.115588188171387, "global_step": 192756, "epoch": 4589} {"train_loss": -7.033912658691406, "global_step": 192757, "epoch": 4589} {"train_loss": -7.141890525817871, "global_step": 192758, "epoch": 4589} {"train_loss": -6.973505973815918, "global_step": 192759, "epoch": 4589} {"train_loss": -7.176972389221191, "global_step": 192760, "epoch": 4589} {"train_loss": -6.993528366088867, "global_step": 192761, "epoch": 4589} {"train_loss": -7.058427810668945, "global_step": 192762, "epoch": 4589} {"train_loss": -7.00468635559082, "global_step": 192763, "epoch": 4589} {"train_loss": -7.145318984985352, "global_step": 192764, "epoch": 4589} {"train_loss": -7.0599870681762695, "global_step": 192765, "epoch": 4589} {"train_loss": -7.189970016479492, "global_step": 192766, "epoch": 4589} {"train_loss": -7.114768028259277, "global_step": 192767, "epoch": 4589} {"train_loss": -7.138727188110352, "global_step": 192768, "epoch": 4589} {"train_loss": -7.176621437072754, "global_step": 192769, "epoch": 4589} {"train_loss": -7.179498672485352, "global_step": 192770, "epoch": 4589} {"train_loss": -7.176772594451904, "global_step": 192771, "epoch": 4589} {"train_loss": -7.154146194458008, "global_step": 192772, "epoch": 4589} {"train_loss": -7.194271564483643, "global_step": 192773, "epoch": 4589} {"train_loss": -7.14289665222168, "global_step": 192774, "epoch": 4589} {"train_loss": -7.195328235626221, "global_step": 192775, "epoch": 4589} {"train_loss": -7.286892890930176, "global_step": 192776, "epoch": 4589} {"train_loss": -7.198317527770996, "global_step": 192777, "epoch": 4589} {"train_loss": -7.19356632232666, "global_step": 192778, "epoch": 4589} {"train_loss": -7.1753194105057485, "global_step": 192779, "epoch": 4589, "val_loss": 81155.03125} {"train_loss": -7.272339344024658, "global_step": 192780, "epoch": 4590} {"train_loss": -7.187652587890625, "global_step": 192781, "epoch": 4590} {"train_loss": -7.307052135467529, "global_step": 192782, "epoch": 4590} {"train_loss": -7.273972511291504, "global_step": 192783, "epoch": 4590} {"train_loss": -7.278114318847656, "global_step": 192784, "epoch": 4590} {"train_loss": -7.337213516235352, "global_step": 192785, "epoch": 4590} {"train_loss": -7.215250015258789, "global_step": 192786, "epoch": 4590} {"train_loss": -7.221515655517578, "global_step": 192787, "epoch": 4590} {"train_loss": -7.104958534240723, "global_step": 192788, "epoch": 4590} {"train_loss": -7.208892822265625, "global_step": 192789, "epoch": 4590} {"train_loss": -7.225951194763184, "global_step": 192790, "epoch": 4590} {"train_loss": -7.209774971008301, "global_step": 192791, "epoch": 4590} {"train_loss": -7.3106207847595215, "global_step": 192792, "epoch": 4590} {"train_loss": -7.266927242279053, "global_step": 192793, "epoch": 4590} {"train_loss": -7.243551731109619, "global_step": 192794, "epoch": 4590} {"train_loss": -7.219509124755859, "global_step": 192795, "epoch": 4590} {"train_loss": -7.233662128448486, "global_step": 192796, "epoch": 4590} {"train_loss": -7.276053428649902, "global_step": 192797, "epoch": 4590} {"train_loss": -7.2367143630981445, "global_step": 192798, "epoch": 4590} {"train_loss": -7.303318977355957, "global_step": 192799, "epoch": 4590} {"train_loss": -7.3275675773620605, "global_step": 192800, "epoch": 4590} {"train_loss": -7.231977462768555, "global_step": 192801, "epoch": 4590} {"train_loss": -7.121950149536133, "global_step": 192802, "epoch": 4590} {"train_loss": -7.199248790740967, "global_step": 192803, "epoch": 4590} {"train_loss": -7.232404708862305, "global_step": 192804, "epoch": 4590} {"train_loss": -7.247548580169678, "global_step": 192805, "epoch": 4590} {"train_loss": -7.247262954711914, "global_step": 192806, "epoch": 4590} {"train_loss": -7.305948257446289, "global_step": 192807, "epoch": 4590} {"train_loss": -7.065402507781982, "global_step": 192808, "epoch": 4590} {"train_loss": -7.112916469573975, "global_step": 192809, "epoch": 4590} {"train_loss": -7.1986823081970215, "global_step": 192810, "epoch": 4590} {"train_loss": -7.097198486328125, "global_step": 192811, "epoch": 4590} {"train_loss": -7.244146347045898, "global_step": 192812, "epoch": 4590} {"train_loss": -7.211052417755127, "global_step": 192813, "epoch": 4590} {"train_loss": -7.148896217346191, "global_step": 192814, "epoch": 4590} {"train_loss": -7.217867851257324, "global_step": 192815, "epoch": 4590} {"train_loss": -7.182787895202637, "global_step": 192816, "epoch": 4590} {"train_loss": -7.170986175537109, "global_step": 192817, "epoch": 4590} {"train_loss": -7.296966552734375, "global_step": 192818, "epoch": 4590} {"train_loss": -7.154451847076416, "global_step": 192819, "epoch": 4590} {"train_loss": -7.225553035736084, "global_step": 192820, "epoch": 4590} {"train_loss": -7.223427511396862, "global_step": 192821, "epoch": 4590, "val_loss": 80988.9921875} {"train_loss": -7.216371536254883, "global_step": 192822, "epoch": 4591} {"train_loss": -7.170595169067383, "global_step": 192823, "epoch": 4591} {"train_loss": -7.17610502243042, "global_step": 192824, "epoch": 4591} {"train_loss": -7.213074207305908, "global_step": 192825, "epoch": 4591} {"train_loss": -7.195889472961426, "global_step": 192826, "epoch": 4591} {"train_loss": -7.242796897888184, "global_step": 192827, "epoch": 4591} {"train_loss": -7.125197410583496, "global_step": 192828, "epoch": 4591} {"train_loss": -7.0514421463012695, "global_step": 192829, "epoch": 4591} {"train_loss": -7.191436767578125, "global_step": 192830, "epoch": 4591} {"train_loss": -7.1717681884765625, "global_step": 192831, "epoch": 4591} {"train_loss": -7.196409702301025, "global_step": 192832, "epoch": 4591} {"train_loss": -7.088451385498047, "global_step": 192833, "epoch": 4591} {"train_loss": -7.237307071685791, "global_step": 192834, "epoch": 4591} {"train_loss": -7.2383012771606445, "global_step": 192835, "epoch": 4591} {"train_loss": -7.251148223876953, "global_step": 192836, "epoch": 4591} {"train_loss": -7.175817012786865, "global_step": 192837, "epoch": 4591} {"train_loss": -7.280595302581787, "global_step": 192838, "epoch": 4591} {"train_loss": -7.0798444747924805, "global_step": 192839, "epoch": 4591} {"train_loss": -7.281209468841553, "global_step": 192840, "epoch": 4591} {"train_loss": -7.234435081481934, "global_step": 192841, "epoch": 4591} {"train_loss": -7.073513984680176, "global_step": 192842, "epoch": 4591} {"train_loss": -7.2797956466674805, "global_step": 192843, "epoch": 4591} {"train_loss": -7.223316192626953, "global_step": 192844, "epoch": 4591} {"train_loss": -7.264222145080566, "global_step": 192845, "epoch": 4591} {"train_loss": -7.103344917297363, "global_step": 192846, "epoch": 4591} {"train_loss": -7.222965717315674, "global_step": 192847, "epoch": 4591} {"train_loss": -7.165151596069336, "global_step": 192848, "epoch": 4591} {"train_loss": -7.176254749298096, "global_step": 192849, "epoch": 4591} {"train_loss": -7.252301216125488, "global_step": 192850, "epoch": 4591} {"train_loss": -7.244678497314453, "global_step": 192851, "epoch": 4591} {"train_loss": -7.264362812042236, "global_step": 192852, "epoch": 4591} {"train_loss": -7.23045015335083, "global_step": 192853, "epoch": 4591} {"train_loss": -7.2225799560546875, "global_step": 192854, "epoch": 4591} {"train_loss": -7.152751922607422, "global_step": 192855, "epoch": 4591} {"train_loss": -7.1826910972595215, "global_step": 192856, "epoch": 4591} {"train_loss": -7.362074851989746, "global_step": 192857, "epoch": 4591} {"train_loss": -7.180327415466309, "global_step": 192858, "epoch": 4591} {"train_loss": -7.1098785400390625, "global_step": 192859, "epoch": 4591} {"train_loss": -7.233523845672607, "global_step": 192860, "epoch": 4591} {"train_loss": -7.1549577713012695, "global_step": 192861, "epoch": 4591} {"train_loss": -7.135790824890137, "global_step": 192862, "epoch": 4591} {"train_loss": -7.19607899302528, "global_step": 192863, "epoch": 4591, "val_loss": 81315.7265625} {"train_loss": -7.198122024536133, "global_step": 192864, "epoch": 4592} {"train_loss": -7.25861120223999, "global_step": 192865, "epoch": 4592} {"train_loss": -7.321076393127441, "global_step": 192866, "epoch": 4592} {"train_loss": -7.226907730102539, "global_step": 192867, "epoch": 4592} {"train_loss": -7.3363494873046875, "global_step": 192868, "epoch": 4592} {"train_loss": -7.322804927825928, "global_step": 192869, "epoch": 4592} {"train_loss": -7.241325855255127, "global_step": 192870, "epoch": 4592} {"train_loss": -7.29301643371582, "global_step": 192871, "epoch": 4592} {"train_loss": -7.325647354125977, "global_step": 192872, "epoch": 4592} {"train_loss": -7.263832092285156, "global_step": 192873, "epoch": 4592} {"train_loss": -7.25192928314209, "global_step": 192874, "epoch": 4592} {"train_loss": -7.1836748123168945, "global_step": 192875, "epoch": 4592} {"train_loss": -7.264809608459473, "global_step": 192876, "epoch": 4592} {"train_loss": -7.160101890563965, "global_step": 192877, "epoch": 4592} {"train_loss": -7.207333564758301, "global_step": 192878, "epoch": 4592} {"train_loss": -7.125733375549316, "global_step": 192879, "epoch": 4592} {"train_loss": -7.052962303161621, "global_step": 192880, "epoch": 4592} {"train_loss": -7.068394660949707, "global_step": 192881, "epoch": 4592} {"train_loss": -7.235160827636719, "global_step": 192882, "epoch": 4592} {"train_loss": -7.0718512535095215, "global_step": 192883, "epoch": 4592} {"train_loss": -7.166769981384277, "global_step": 192884, "epoch": 4592} {"train_loss": -7.177877902984619, "global_step": 192885, "epoch": 4592} {"train_loss": -7.133415222167969, "global_step": 192886, "epoch": 4592} {"train_loss": -7.165872573852539, "global_step": 192887, "epoch": 4592} {"train_loss": -7.321600437164307, "global_step": 192888, "epoch": 4592} {"train_loss": -7.2463698387146, "global_step": 192889, "epoch": 4592} {"train_loss": -7.141707420349121, "global_step": 192890, "epoch": 4592} {"train_loss": -7.218077659606934, "global_step": 192891, "epoch": 4592} {"train_loss": -7.32836389541626, "global_step": 192892, "epoch": 4592} {"train_loss": -7.03233003616333, "global_step": 192893, "epoch": 4592} {"train_loss": -7.195981025695801, "global_step": 192894, "epoch": 4592} {"train_loss": -7.281429767608643, "global_step": 192895, "epoch": 4592} {"train_loss": -7.178408622741699, "global_step": 192896, "epoch": 4592} {"train_loss": -7.248118877410889, "global_step": 192897, "epoch": 4592} {"train_loss": -7.130819797515869, "global_step": 192898, "epoch": 4592} {"train_loss": -7.271428108215332, "global_step": 192899, "epoch": 4592} {"train_loss": -7.232016086578369, "global_step": 192900, "epoch": 4592} {"train_loss": -7.197322845458984, "global_step": 192901, "epoch": 4592} {"train_loss": -7.210172653198242, "global_step": 192902, "epoch": 4592} {"train_loss": -7.240530014038086, "global_step": 192903, "epoch": 4592} {"train_loss": -7.294316291809082, "global_step": 192904, "epoch": 4592} {"train_loss": -7.214761972427368, "global_step": 192905, "epoch": 4592, "val_loss": 81171.5390625} {"train_loss": -7.255023956298828, "global_step": 192906, "epoch": 4593} {"train_loss": -7.218052864074707, "global_step": 192907, "epoch": 4593} {"train_loss": -7.269669532775879, "global_step": 192908, "epoch": 4593} {"train_loss": -7.242133617401123, "global_step": 192909, "epoch": 4593} {"train_loss": -7.257988929748535, "global_step": 192910, "epoch": 4593} {"train_loss": -7.257623672485352, "global_step": 192911, "epoch": 4593} {"train_loss": -7.266077041625977, "global_step": 192912, "epoch": 4593} {"train_loss": -7.309253692626953, "global_step": 192913, "epoch": 4593} {"train_loss": -7.18588924407959, "global_step": 192914, "epoch": 4593} {"train_loss": -7.186748027801514, "global_step": 192915, "epoch": 4593} {"train_loss": -7.139957427978516, "global_step": 192916, "epoch": 4593} {"train_loss": -7.315954208374023, "global_step": 192917, "epoch": 4593} {"train_loss": -7.323035717010498, "global_step": 192918, "epoch": 4593} {"train_loss": -7.267435550689697, "global_step": 192919, "epoch": 4593} {"train_loss": -7.241837978363037, "global_step": 192920, "epoch": 4593} {"train_loss": -7.311380386352539, "global_step": 192921, "epoch": 4593} {"train_loss": -7.259857654571533, "global_step": 192922, "epoch": 4593} {"train_loss": -7.187043190002441, "global_step": 192923, "epoch": 4593} {"train_loss": -7.186615943908691, "global_step": 192924, "epoch": 4593} {"train_loss": -7.1780924797058105, "global_step": 192925, "epoch": 4593} {"train_loss": -7.258790016174316, "global_step": 192926, "epoch": 4593} {"train_loss": -7.132404327392578, "global_step": 192927, "epoch": 4593} {"train_loss": -7.267663955688477, "global_step": 192928, "epoch": 4593} {"train_loss": -7.182791709899902, "global_step": 192929, "epoch": 4593} {"train_loss": -7.302723407745361, "global_step": 192930, "epoch": 4593} {"train_loss": -7.203963279724121, "global_step": 192931, "epoch": 4593} {"train_loss": -7.256381034851074, "global_step": 192932, "epoch": 4593} {"train_loss": -7.270861625671387, "global_step": 192933, "epoch": 4593} {"train_loss": -7.216019630432129, "global_step": 192934, "epoch": 4593} {"train_loss": -7.284465789794922, "global_step": 192935, "epoch": 4593} {"train_loss": -7.172513008117676, "global_step": 192936, "epoch": 4593} {"train_loss": -7.339019775390625, "global_step": 192937, "epoch": 4593} {"train_loss": -7.325129985809326, "global_step": 192938, "epoch": 4593} {"train_loss": -7.204059600830078, "global_step": 192939, "epoch": 4593} {"train_loss": -7.132543563842773, "global_step": 192940, "epoch": 4593} {"train_loss": -7.297692775726318, "global_step": 192941, "epoch": 4593} {"train_loss": -7.284870147705078, "global_step": 192942, "epoch": 4593} {"train_loss": -7.312858581542969, "global_step": 192943, "epoch": 4593} {"train_loss": -7.367505073547363, "global_step": 192944, "epoch": 4593} {"train_loss": -7.175938129425049, "global_step": 192945, "epoch": 4593} {"train_loss": -7.2575764656066895, "global_step": 192946, "epoch": 4593} {"train_loss": -7.244366373334612, "global_step": 192947, "epoch": 4593, "val_loss": 80947.015625} {"train_loss": -7.285398483276367, "global_step": 192948, "epoch": 4594} {"train_loss": -7.313177108764648, "global_step": 192949, "epoch": 4594} {"train_loss": -7.24329948425293, "global_step": 192950, "epoch": 4594} {"train_loss": -7.235529899597168, "global_step": 192951, "epoch": 4594} {"train_loss": -7.160776138305664, "global_step": 192952, "epoch": 4594} {"train_loss": -7.322352409362793, "global_step": 192953, "epoch": 4594} {"train_loss": -7.10244083404541, "global_step": 192954, "epoch": 4594} {"train_loss": -7.196075439453125, "global_step": 192955, "epoch": 4594} {"train_loss": -7.2023162841796875, "global_step": 192956, "epoch": 4594} {"train_loss": -7.2261481285095215, "global_step": 192957, "epoch": 4594} {"train_loss": -7.145575046539307, "global_step": 192958, "epoch": 4594} {"train_loss": -7.126341342926025, "global_step": 192959, "epoch": 4594} {"train_loss": -7.264389991760254, "global_step": 192960, "epoch": 4594} {"train_loss": -7.243804931640625, "global_step": 192961, "epoch": 4594} {"train_loss": -7.166404724121094, "global_step": 192962, "epoch": 4594} {"train_loss": -7.291567325592041, "global_step": 192963, "epoch": 4594} {"train_loss": -7.2392578125, "global_step": 192964, "epoch": 4594} {"train_loss": -7.204833030700684, "global_step": 192965, "epoch": 4594} {"train_loss": -7.126440048217773, "global_step": 192966, "epoch": 4594} {"train_loss": -7.175602912902832, "global_step": 192967, "epoch": 4594} {"train_loss": -7.328098297119141, "global_step": 192968, "epoch": 4594} {"train_loss": -7.1902971267700195, "global_step": 192969, "epoch": 4594} {"train_loss": -7.242919445037842, "global_step": 192970, "epoch": 4594} {"train_loss": -7.256505966186523, "global_step": 192971, "epoch": 4594} {"train_loss": -7.171921253204346, "global_step": 192972, "epoch": 4594} {"train_loss": -7.247503757476807, "global_step": 192973, "epoch": 4594} {"train_loss": -7.318431377410889, "global_step": 192974, "epoch": 4594} {"train_loss": -7.240457534790039, "global_step": 192975, "epoch": 4594} {"train_loss": -7.2756147384643555, "global_step": 192976, "epoch": 4594} {"train_loss": -7.2284135818481445, "global_step": 192977, "epoch": 4594} {"train_loss": -7.220424652099609, "global_step": 192978, "epoch": 4594} {"train_loss": -7.173740863800049, "global_step": 192979, "epoch": 4594} {"train_loss": -7.437342643737793, "global_step": 192980, "epoch": 4594} {"train_loss": -7.205965042114258, "global_step": 192981, "epoch": 4594} {"train_loss": -7.34239387512207, "global_step": 192982, "epoch": 4594} {"train_loss": -7.25372314453125, "global_step": 192983, "epoch": 4594} {"train_loss": -7.36895751953125, "global_step": 192984, "epoch": 4594} {"train_loss": -7.290930271148682, "global_step": 192985, "epoch": 4594} {"train_loss": -7.301619052886963, "global_step": 192986, "epoch": 4594} {"train_loss": -7.250694274902344, "global_step": 192987, "epoch": 4594} {"train_loss": -7.404502868652344, "global_step": 192988, "epoch": 4594} {"train_loss": -7.245282479694912, "global_step": 192989, "epoch": 4594, "val_loss": 81084.4453125} {"train_loss": -7.269049644470215, "global_step": 192990, "epoch": 4595} {"train_loss": -7.2957868576049805, "global_step": 192991, "epoch": 4595} {"train_loss": -7.314937114715576, "global_step": 192992, "epoch": 4595} {"train_loss": -7.290518760681152, "global_step": 192993, "epoch": 4595} {"train_loss": -7.271471977233887, "global_step": 192994, "epoch": 4595} {"train_loss": -7.253639221191406, "global_step": 192995, "epoch": 4595} {"train_loss": -7.2993927001953125, "global_step": 192996, "epoch": 4595} {"train_loss": -7.177241325378418, "global_step": 192997, "epoch": 4595} {"train_loss": -7.272068023681641, "global_step": 192998, "epoch": 4595} {"train_loss": -7.325003623962402, "global_step": 192999, "epoch": 4595} {"train_loss": -7.315591812133789, "global_step": 193000, "epoch": 4595} {"train_loss": -7.216899871826172, "global_step": 193001, "epoch": 4595} {"train_loss": -7.277194023132324, "global_step": 193002, "epoch": 4595} {"train_loss": -7.220015525817871, "global_step": 193003, "epoch": 4595} {"train_loss": -7.271877288818359, "global_step": 193004, "epoch": 4595} {"train_loss": -7.194499492645264, "global_step": 193005, "epoch": 4595} {"train_loss": -7.164634704589844, "global_step": 193006, "epoch": 4595} {"train_loss": -7.2596940994262695, "global_step": 193007, "epoch": 4595} {"train_loss": -7.173879623413086, "global_step": 193008, "epoch": 4595} {"train_loss": -7.313305854797363, "global_step": 193009, "epoch": 4595} {"train_loss": -7.158825874328613, "global_step": 193010, "epoch": 4595} {"train_loss": -7.315937042236328, "global_step": 193011, "epoch": 4595} {"train_loss": -7.39848518371582, "global_step": 193012, "epoch": 4595} {"train_loss": -7.2715229988098145, "global_step": 193013, "epoch": 4595} {"train_loss": -7.133662223815918, "global_step": 193014, "epoch": 4595} {"train_loss": -7.294402122497559, "global_step": 193015, "epoch": 4595} {"train_loss": -7.159826278686523, "global_step": 193016, "epoch": 4595} {"train_loss": -7.0740766525268555, "global_step": 193017, "epoch": 4595} {"train_loss": -7.171586990356445, "global_step": 193018, "epoch": 4595} {"train_loss": -7.164850234985352, "global_step": 193019, "epoch": 4595} {"train_loss": -7.138425827026367, "global_step": 193020, "epoch": 4595} {"train_loss": -7.073264122009277, "global_step": 193021, "epoch": 4595} {"train_loss": -7.090034008026123, "global_step": 193022, "epoch": 4595} {"train_loss": -7.069343566894531, "global_step": 193023, "epoch": 4595} {"train_loss": -7.045374870300293, "global_step": 193024, "epoch": 4595} {"train_loss": -7.1368818283081055, "global_step": 193025, "epoch": 4595} {"train_loss": -7.2032246589660645, "global_step": 193026, "epoch": 4595} {"train_loss": -7.1830339431762695, "global_step": 193027, "epoch": 4595} {"train_loss": -7.2219343185424805, "global_step": 193028, "epoch": 4595} {"train_loss": -7.242042541503906, "global_step": 193029, "epoch": 4595} {"train_loss": -7.124243259429932, "global_step": 193030, "epoch": 4595} {"train_loss": -7.215044407617478, "global_step": 193031, "epoch": 4595, "val_loss": 81034.1875} {"train_loss": -7.024576187133789, "global_step": 193032, "epoch": 4596} {"train_loss": -7.241197109222412, "global_step": 193033, "epoch": 4596} {"train_loss": -7.125629425048828, "global_step": 193034, "epoch": 4596} {"train_loss": -7.131110191345215, "global_step": 193035, "epoch": 4596} {"train_loss": -7.306885719299316, "global_step": 193036, "epoch": 4596} {"train_loss": -7.031894683837891, "global_step": 193037, "epoch": 4596} {"train_loss": -7.197761535644531, "global_step": 193038, "epoch": 4596} {"train_loss": -7.213854789733887, "global_step": 193039, "epoch": 4596} {"train_loss": -7.105727195739746, "global_step": 193040, "epoch": 4596} {"train_loss": -7.323454856872559, "global_step": 193041, "epoch": 4596} {"train_loss": -7.1989946365356445, "global_step": 193042, "epoch": 4596} {"train_loss": -7.273625373840332, "global_step": 193043, "epoch": 4596} {"train_loss": -7.234775543212891, "global_step": 193044, "epoch": 4596} {"train_loss": -7.270522117614746, "global_step": 193045, "epoch": 4596} {"train_loss": -7.210496425628662, "global_step": 193046, "epoch": 4596} {"train_loss": -7.194675922393799, "global_step": 193047, "epoch": 4596} {"train_loss": -7.197583198547363, "global_step": 193048, "epoch": 4596} {"train_loss": -7.153717994689941, "global_step": 193049, "epoch": 4596} {"train_loss": -7.13414192199707, "global_step": 193050, "epoch": 4596} {"train_loss": -7.228914260864258, "global_step": 193051, "epoch": 4596} {"train_loss": -7.2657790184021, "global_step": 193052, "epoch": 4596} {"train_loss": -7.23818826675415, "global_step": 193053, "epoch": 4596} {"train_loss": -7.244651794433594, "global_step": 193054, "epoch": 4596} {"train_loss": -7.260524749755859, "global_step": 193055, "epoch": 4596} {"train_loss": -7.130559921264648, "global_step": 193056, "epoch": 4596} {"train_loss": -7.137414932250977, "global_step": 193057, "epoch": 4596} {"train_loss": -7.267977714538574, "global_step": 193058, "epoch": 4596} {"train_loss": -7.139969348907471, "global_step": 193059, "epoch": 4596} {"train_loss": -7.263886451721191, "global_step": 193060, "epoch": 4596} {"train_loss": -7.1198320388793945, "global_step": 193061, "epoch": 4596} {"train_loss": -7.242660999298096, "global_step": 193062, "epoch": 4596} {"train_loss": -7.259611129760742, "global_step": 193063, "epoch": 4596} {"train_loss": -7.301641464233398, "global_step": 193064, "epoch": 4596} {"train_loss": -7.237524032592773, "global_step": 193065, "epoch": 4596} {"train_loss": -7.253460884094238, "global_step": 193066, "epoch": 4596} {"train_loss": -7.198110580444336, "global_step": 193067, "epoch": 4596} {"train_loss": -7.28741455078125, "global_step": 193068, "epoch": 4596} {"train_loss": -7.250717639923096, "global_step": 193069, "epoch": 4596} {"train_loss": -7.317933559417725, "global_step": 193070, "epoch": 4596} {"train_loss": -7.232308864593506, "global_step": 193071, "epoch": 4596} {"train_loss": -7.168184757232666, "global_step": 193072, "epoch": 4596} {"train_loss": -7.213221050444103, "global_step": 193073, "epoch": 4596, "val_loss": 81319.109375} {"train_loss": -7.274330139160156, "global_step": 193074, "epoch": 4597} {"train_loss": -7.234529495239258, "global_step": 193075, "epoch": 4597} {"train_loss": -7.139941692352295, "global_step": 193076, "epoch": 4597} {"train_loss": -7.315674781799316, "global_step": 193077, "epoch": 4597} {"train_loss": -7.235907554626465, "global_step": 193078, "epoch": 4597} {"train_loss": -7.332465648651123, "global_step": 193079, "epoch": 4597} {"train_loss": -7.188345909118652, "global_step": 193080, "epoch": 4597} {"train_loss": -7.163052558898926, "global_step": 193081, "epoch": 4597} {"train_loss": -7.152215957641602, "global_step": 193082, "epoch": 4597} {"train_loss": -7.201274871826172, "global_step": 193083, "epoch": 4597} {"train_loss": -7.183431625366211, "global_step": 193084, "epoch": 4597} {"train_loss": -7.186642646789551, "global_step": 193085, "epoch": 4597} {"train_loss": -7.292655944824219, "global_step": 193086, "epoch": 4597} {"train_loss": -7.212219715118408, "global_step": 193087, "epoch": 4597} {"train_loss": -7.196576118469238, "global_step": 193088, "epoch": 4597} {"train_loss": -7.200102806091309, "global_step": 193089, "epoch": 4597} {"train_loss": -7.192795753479004, "global_step": 193090, "epoch": 4597} {"train_loss": -7.225679874420166, "global_step": 193091, "epoch": 4597} {"train_loss": -7.086051940917969, "global_step": 193092, "epoch": 4597} {"train_loss": -7.165228843688965, "global_step": 193093, "epoch": 4597} {"train_loss": -7.138950347900391, "global_step": 193094, "epoch": 4597} {"train_loss": -7.212612152099609, "global_step": 193095, "epoch": 4597} {"train_loss": -7.211728096008301, "global_step": 193096, "epoch": 4597} {"train_loss": -7.292236804962158, "global_step": 193097, "epoch": 4597} {"train_loss": -7.165191650390625, "global_step": 193098, "epoch": 4597} {"train_loss": -7.227954864501953, "global_step": 193099, "epoch": 4597} {"train_loss": -7.13604736328125, "global_step": 193100, "epoch": 4597} {"train_loss": -7.310563087463379, "global_step": 193101, "epoch": 4597} {"train_loss": -7.159984588623047, "global_step": 193102, "epoch": 4597} {"train_loss": -7.156368732452393, "global_step": 193103, "epoch": 4597} {"train_loss": -7.260158538818359, "global_step": 193104, "epoch": 4597} {"train_loss": -7.164855003356934, "global_step": 193105, "epoch": 4597} {"train_loss": -7.17317008972168, "global_step": 193106, "epoch": 4597} {"train_loss": -7.237792491912842, "global_step": 193107, "epoch": 4597} {"train_loss": -7.174712657928467, "global_step": 193108, "epoch": 4597} {"train_loss": -7.301329135894775, "global_step": 193109, "epoch": 4597} {"train_loss": -7.111337661743164, "global_step": 193110, "epoch": 4597} {"train_loss": -7.354528427124023, "global_step": 193111, "epoch": 4597} {"train_loss": -7.124722480773926, "global_step": 193112, "epoch": 4597} {"train_loss": -7.220121383666992, "global_step": 193113, "epoch": 4597} {"train_loss": -7.272113800048828, "global_step": 193114, "epoch": 4597} {"train_loss": -7.206960723513649, "global_step": 193115, "epoch": 4597, "val_loss": 81253.3125} {"train_loss": -7.245236873626709, "global_step": 193116, "epoch": 4598} {"train_loss": -7.182571887969971, "global_step": 193117, "epoch": 4598} {"train_loss": -7.073593616485596, "global_step": 193118, "epoch": 4598} {"train_loss": -7.118023872375488, "global_step": 193119, "epoch": 4598} {"train_loss": -7.069538116455078, "global_step": 193120, "epoch": 4598} {"train_loss": -7.169608116149902, "global_step": 193121, "epoch": 4598} {"train_loss": -7.11367130279541, "global_step": 193122, "epoch": 4598} {"train_loss": -7.111858367919922, "global_step": 193123, "epoch": 4598} {"train_loss": -7.209257125854492, "global_step": 193124, "epoch": 4598} {"train_loss": -7.148409843444824, "global_step": 193125, "epoch": 4598} {"train_loss": -7.265096664428711, "global_step": 193126, "epoch": 4598} {"train_loss": -7.043163299560547, "global_step": 193127, "epoch": 4598} {"train_loss": -7.110754013061523, "global_step": 193128, "epoch": 4598} {"train_loss": -7.0514326095581055, "global_step": 193129, "epoch": 4598} {"train_loss": -7.133974075317383, "global_step": 193130, "epoch": 4598} {"train_loss": -7.039138317108154, "global_step": 193131, "epoch": 4598} {"train_loss": -7.094817161560059, "global_step": 193132, "epoch": 4598} {"train_loss": -7.010679721832275, "global_step": 193133, "epoch": 4598} {"train_loss": -7.13997745513916, "global_step": 193134, "epoch": 4598} {"train_loss": -7.052534103393555, "global_step": 193135, "epoch": 4598} {"train_loss": -7.096736907958984, "global_step": 193136, "epoch": 4598} {"train_loss": -7.156113624572754, "global_step": 193137, "epoch": 4598} {"train_loss": -7.100285053253174, "global_step": 193138, "epoch": 4598} {"train_loss": -7.274143218994141, "global_step": 193139, "epoch": 4598} {"train_loss": -7.097405433654785, "global_step": 193140, "epoch": 4598} {"train_loss": -7.224748611450195, "global_step": 193141, "epoch": 4598} {"train_loss": -7.209837913513184, "global_step": 193142, "epoch": 4598} {"train_loss": -7.343024730682373, "global_step": 193143, "epoch": 4598} {"train_loss": -7.238303184509277, "global_step": 193144, "epoch": 4598} {"train_loss": -7.251780033111572, "global_step": 193145, "epoch": 4598} {"train_loss": -7.123797416687012, "global_step": 193146, "epoch": 4598} {"train_loss": -7.25472354888916, "global_step": 193147, "epoch": 4598} {"train_loss": -7.093749523162842, "global_step": 193148, "epoch": 4598} {"train_loss": -7.218594074249268, "global_step": 193149, "epoch": 4598} {"train_loss": -7.202021598815918, "global_step": 193150, "epoch": 4598} {"train_loss": -7.081005096435547, "global_step": 193151, "epoch": 4598} {"train_loss": -7.291228294372559, "global_step": 193152, "epoch": 4598} {"train_loss": -7.228788375854492, "global_step": 193153, "epoch": 4598} {"train_loss": -7.166416168212891, "global_step": 193154, "epoch": 4598} {"train_loss": -7.095463752746582, "global_step": 193155, "epoch": 4598} {"train_loss": -7.275800704956055, "global_step": 193156, "epoch": 4598} {"train_loss": -7.159217289515904, "global_step": 193157, "epoch": 4598, "val_loss": 81158.140625} {"train_loss": -7.22091007232666, "global_step": 193158, "epoch": 4599} {"train_loss": -7.258332252502441, "global_step": 193159, "epoch": 4599} {"train_loss": -7.184998512268066, "global_step": 193160, "epoch": 4599} {"train_loss": -7.237683296203613, "global_step": 193161, "epoch": 4599} {"train_loss": -7.256319522857666, "global_step": 193162, "epoch": 4599} {"train_loss": -7.28122615814209, "global_step": 193163, "epoch": 4599} {"train_loss": -7.309995174407959, "global_step": 193164, "epoch": 4599} {"train_loss": -7.339616775512695, "global_step": 193165, "epoch": 4599} {"train_loss": -7.258315086364746, "global_step": 193166, "epoch": 4599} {"train_loss": -7.306814193725586, "global_step": 193167, "epoch": 4599} {"train_loss": -7.310042858123779, "global_step": 193168, "epoch": 4599} {"train_loss": -7.219161033630371, "global_step": 193169, "epoch": 4599} {"train_loss": -7.2213029861450195, "global_step": 193170, "epoch": 4599} {"train_loss": -7.2232561111450195, "global_step": 193171, "epoch": 4599} {"train_loss": -7.13337516784668, "global_step": 193172, "epoch": 4599} {"train_loss": -7.322021961212158, "global_step": 193173, "epoch": 4599} {"train_loss": -7.303046703338623, "global_step": 193174, "epoch": 4599} {"train_loss": -7.32778263092041, "global_step": 193175, "epoch": 4599} {"train_loss": -7.360158920288086, "global_step": 193176, "epoch": 4599} {"train_loss": -7.274269104003906, "global_step": 193177, "epoch": 4599} {"train_loss": -7.293854713439941, "global_step": 193178, "epoch": 4599} {"train_loss": -7.2322187423706055, "global_step": 193179, "epoch": 4599} {"train_loss": -7.121461868286133, "global_step": 193180, "epoch": 4599} {"train_loss": -7.240052223205566, "global_step": 193181, "epoch": 4599} {"train_loss": -7.228579044342041, "global_step": 193182, "epoch": 4599} {"train_loss": -7.100376129150391, "global_step": 193183, "epoch": 4599} {"train_loss": -7.235684871673584, "global_step": 193184, "epoch": 4599} {"train_loss": -7.2691192626953125, "global_step": 193185, "epoch": 4599} {"train_loss": -7.329078674316406, "global_step": 193186, "epoch": 4599} {"train_loss": -7.247920036315918, "global_step": 193187, "epoch": 4599} {"train_loss": -7.238617897033691, "global_step": 193188, "epoch": 4599} {"train_loss": -7.174431324005127, "global_step": 193189, "epoch": 4599} {"train_loss": -7.236819267272949, "global_step": 193190, "epoch": 4599} {"train_loss": -7.210406303405762, "global_step": 193191, "epoch": 4599} {"train_loss": -7.172943115234375, "global_step": 193192, "epoch": 4599} {"train_loss": -7.299542427062988, "global_step": 193193, "epoch": 4599} {"train_loss": -7.1697235107421875, "global_step": 193194, "epoch": 4599} {"train_loss": -7.183510780334473, "global_step": 193195, "epoch": 4599} {"train_loss": -7.356451988220215, "global_step": 193196, "epoch": 4599} {"train_loss": -7.266712188720703, "global_step": 193197, "epoch": 4599} {"train_loss": -7.199986457824707, "global_step": 193198, "epoch": 4599} {"train_loss": -7.249867223557972, "global_step": 193199, "epoch": 4599, "val_loss": 80931.9609375} {"train_loss": -7.239685535430908, "global_step": 193200, "epoch": 4600} {"train_loss": -7.357174396514893, "global_step": 193201, "epoch": 4600} {"train_loss": -7.305685043334961, "global_step": 193202, "epoch": 4600} {"train_loss": -7.302573204040527, "global_step": 193203, "epoch": 4600} {"train_loss": -7.318913459777832, "global_step": 193204, "epoch": 4600} {"train_loss": -7.2798614501953125, "global_step": 193205, "epoch": 4600} {"train_loss": -7.2662506103515625, "global_step": 193206, "epoch": 4600} {"train_loss": -7.237968444824219, "global_step": 193207, "epoch": 4600} {"train_loss": -7.1853179931640625, "global_step": 193208, "epoch": 4600} {"train_loss": -7.265229225158691, "global_step": 193209, "epoch": 4600} {"train_loss": -7.196646690368652, "global_step": 193210, "epoch": 4600} {"train_loss": -7.283160209655762, "global_step": 193211, "epoch": 4600} {"train_loss": -7.294699668884277, "global_step": 193212, "epoch": 4600} {"train_loss": -7.110630035400391, "global_step": 193213, "epoch": 4600} {"train_loss": -7.37912130355835, "global_step": 193214, "epoch": 4600} {"train_loss": -7.14879035949707, "global_step": 193215, "epoch": 4600} {"train_loss": -7.192670822143555, "global_step": 193216, "epoch": 4600} {"train_loss": -7.324533462524414, "global_step": 193217, "epoch": 4600} {"train_loss": -7.24252462387085, "global_step": 193218, "epoch": 4600} {"train_loss": -7.323816299438477, "global_step": 193219, "epoch": 4600} {"train_loss": -7.235197067260742, "global_step": 193220, "epoch": 4600} {"train_loss": -7.095873832702637, "global_step": 193221, "epoch": 4600} {"train_loss": -7.24668550491333, "global_step": 193222, "epoch": 4600} {"train_loss": -7.127040863037109, "global_step": 193223, "epoch": 4600} {"train_loss": -7.146760940551758, "global_step": 193224, "epoch": 4600} {"train_loss": -7.0562744140625, "global_step": 193225, "epoch": 4600} {"train_loss": -7.1319355964660645, "global_step": 193226, "epoch": 4600} {"train_loss": -7.186890602111816, "global_step": 193227, "epoch": 4600} {"train_loss": -7.148852825164795, "global_step": 193228, "epoch": 4600} {"train_loss": -7.177469253540039, "global_step": 193229, "epoch": 4600} {"train_loss": -7.111464500427246, "global_step": 193230, "epoch": 4600} {"train_loss": -7.138728618621826, "global_step": 193231, "epoch": 4600} {"train_loss": -7.320441246032715, "global_step": 193232, "epoch": 4600} {"train_loss": -7.178060531616211, "global_step": 193233, "epoch": 4600} {"train_loss": -7.219963073730469, "global_step": 193234, "epoch": 4600} {"train_loss": -7.097745418548584, "global_step": 193235, "epoch": 4600} {"train_loss": -7.133550643920898, "global_step": 193236, "epoch": 4600} {"train_loss": -6.999755859375, "global_step": 193237, "epoch": 4600} {"train_loss": -7.122980117797852, "global_step": 193238, "epoch": 4600} {"train_loss": -7.238246917724609, "global_step": 193239, "epoch": 4600} {"train_loss": -7.200934410095215, "global_step": 193240, "epoch": 4600} {"train_loss": -7.207926466351464, "global_step": 193241, "epoch": 4600, "train/sim_max_reward_0": 0.5017991833272539, "train/sim_max_reward_1": 0.7106338955259192, "train/sim_max_reward_2": 0.5122482440568913, "train/sim_max_reward_3": 0.1362678944558133, "train/sim_max_reward_4": 1.0, "train/sim_max_reward_5": 0.975524132918064, "test/sim_max_reward_4500000": 0.37192661149125367, "test/sim_max_reward_4500001": 0.9435504128705329, "test/sim_max_reward_4500002": 0.9634524552144909, "test/sim_max_reward_4500003": 0.9427789675330486, "test/sim_max_reward_4500004": 0.20308516807882263, "test/sim_max_reward_4500005": 0.17436120472981093, "test/sim_max_reward_4500006": 0.9042456455966873, "test/sim_max_reward_4500007": 0.9713444498326547, "test/sim_max_reward_4500008": 0.9225659782860072, "test/sim_max_reward_4500009": 0.053182315160357374, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.43400709619542505, "test/sim_max_reward_4500012": 0.9723238156218611, "test/sim_max_reward_4500013": 0.26796798049549747, "test/sim_max_reward_4500014": 0.9594149265987569, "test/sim_max_reward_4500015": 1.0, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.09842194963596465, "test/sim_max_reward_4500018": 1.0, "test/sim_max_reward_4500019": 0.9338051070828236, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.921802255275553, "test/sim_max_reward_4500022": 0.42110228453272736, "test/sim_max_reward_4500023": 0.922646877495783, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.3952017711033147, "test/sim_max_reward_4500026": 0.4192420123810004, "test/sim_max_reward_4500027": 0.995839801354743, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.12595940515176277, "test/sim_max_reward_4500030": 0.9748937621615903, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.3412502329153079, "test/sim_max_reward_4500034": 0.929593950107148, "test/sim_max_reward_4500035": 0.996805088785498, "test/sim_max_reward_4500036": 0.9873529121172363, "test/sim_max_reward_4500037": 0.9864703958393096, "test/sim_max_reward_4500038": 0.9756021335644794, "test/sim_max_reward_4500039": 0.7781226276674283, "test/sim_max_reward_4500040": 0.967162818986668, "test/sim_max_reward_4500041": 0.9313936444386205, "test/sim_max_reward_4500042": 0.04699949104198542, "test/sim_max_reward_4500043": 0.8989000470184125, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9432197632751249, "test/sim_max_reward_4500046": 0.10409775925873906, "test/sim_max_reward_4500047": 0.9789815913408547, "test/sim_max_reward_4500048": 0.8865723120418889, "test/sim_max_reward_4500049": 0.7962881185237307, "train/mean_score": 0.6394122250473236, "test/mean_score": 0.6018833249878464, "val_loss": 81242.6875} {"train_loss": -7.2267656326293945, "global_step": 193242, "epoch": 4601} {"train_loss": -7.259868621826172, "global_step": 193243, "epoch": 4601} {"train_loss": -7.249916076660156, "global_step": 193244, "epoch": 4601} {"train_loss": -7.167367935180664, "global_step": 193245, "epoch": 4601} {"train_loss": -7.280200481414795, "global_step": 193246, "epoch": 4601} {"train_loss": -7.291294574737549, "global_step": 193247, "epoch": 4601} {"train_loss": -7.220816135406494, "global_step": 193248, "epoch": 4601} {"train_loss": -7.238953590393066, "global_step": 193249, "epoch": 4601} {"train_loss": -7.258739948272705, "global_step": 193250, "epoch": 4601} {"train_loss": -7.2454304695129395, "global_step": 193251, "epoch": 4601} {"train_loss": -7.17903470993042, "global_step": 193252, "epoch": 4601} {"train_loss": -7.356706619262695, "global_step": 193253, "epoch": 4601} {"train_loss": -7.196259021759033, "global_step": 193254, "epoch": 4601} {"train_loss": -7.296953201293945, "global_step": 193255, "epoch": 4601} {"train_loss": -7.2638092041015625, "global_step": 193256, "epoch": 4601} {"train_loss": -7.236407279968262, "global_step": 193257, "epoch": 4601} {"train_loss": -7.203882217407227, "global_step": 193258, "epoch": 4601} {"train_loss": -7.287785053253174, "global_step": 193259, "epoch": 4601} {"train_loss": -7.235047817230225, "global_step": 193260, "epoch": 4601} {"train_loss": -7.253247261047363, "global_step": 193261, "epoch": 4601} {"train_loss": -7.2085771560668945, "global_step": 193262, "epoch": 4601} {"train_loss": -7.265034198760986, "global_step": 193263, "epoch": 4601} {"train_loss": -7.251463890075684, "global_step": 193264, "epoch": 4601} {"train_loss": -7.109315395355225, "global_step": 193265, "epoch": 4601} {"train_loss": -7.256426811218262, "global_step": 193266, "epoch": 4601} {"train_loss": -7.264353275299072, "global_step": 193267, "epoch": 4601} {"train_loss": -7.157144069671631, "global_step": 193268, "epoch": 4601} {"train_loss": -7.302386283874512, "global_step": 193269, "epoch": 4601} {"train_loss": -7.140758514404297, "global_step": 193270, "epoch": 4601} {"train_loss": -7.099149703979492, "global_step": 193271, "epoch": 4601} {"train_loss": -7.187498092651367, "global_step": 193272, "epoch": 4601} {"train_loss": -7.11220645904541, "global_step": 193273, "epoch": 4601} {"train_loss": -7.064121723175049, "global_step": 193274, "epoch": 4601} {"train_loss": -7.056380271911621, "global_step": 193275, "epoch": 4601} {"train_loss": -7.03139066696167, "global_step": 193276, "epoch": 4601} {"train_loss": -7.00745964050293, "global_step": 193277, "epoch": 4601} {"train_loss": -7.228678226470947, "global_step": 193278, "epoch": 4601} {"train_loss": -7.150371074676514, "global_step": 193279, "epoch": 4601} {"train_loss": -7.158590316772461, "global_step": 193280, "epoch": 4601} {"train_loss": -7.124549388885498, "global_step": 193281, "epoch": 4601} {"train_loss": -7.050608158111572, "global_step": 193282, "epoch": 4601} {"train_loss": -7.196767511821928, "global_step": 193283, "epoch": 4601, "val_loss": 81386.359375} {"train_loss": -7.1304121017456055, "global_step": 193284, "epoch": 4602} {"train_loss": -7.111391067504883, "global_step": 193285, "epoch": 4602} {"train_loss": -7.133818626403809, "global_step": 193286, "epoch": 4602} {"train_loss": -7.169855117797852, "global_step": 193287, "epoch": 4602} {"train_loss": -7.196427345275879, "global_step": 193288, "epoch": 4602} {"train_loss": -7.166759490966797, "global_step": 193289, "epoch": 4602} {"train_loss": -7.134829998016357, "global_step": 193290, "epoch": 4602} {"train_loss": -7.153875350952148, "global_step": 193291, "epoch": 4602} {"train_loss": -7.191636562347412, "global_step": 193292, "epoch": 4602} {"train_loss": -7.2539286613464355, "global_step": 193293, "epoch": 4602} {"train_loss": -7.102672576904297, "global_step": 193294, "epoch": 4602} {"train_loss": -7.132851600646973, "global_step": 193295, "epoch": 4602} {"train_loss": -7.126712799072266, "global_step": 193296, "epoch": 4602} {"train_loss": -7.237303733825684, "global_step": 193297, "epoch": 4602} {"train_loss": -7.145580768585205, "global_step": 193298, "epoch": 4602} {"train_loss": -7.262198448181152, "global_step": 193299, "epoch": 4602} {"train_loss": -7.238198280334473, "global_step": 193300, "epoch": 4602} {"train_loss": -7.228706359863281, "global_step": 193301, "epoch": 4602} {"train_loss": -7.228614807128906, "global_step": 193302, "epoch": 4602} {"train_loss": -7.235116481781006, "global_step": 193303, "epoch": 4602} {"train_loss": -7.32064151763916, "global_step": 193304, "epoch": 4602} {"train_loss": -7.211541175842285, "global_step": 193305, "epoch": 4602} {"train_loss": -7.16600227355957, "global_step": 193306, "epoch": 4602} {"train_loss": -7.253531455993652, "global_step": 193307, "epoch": 4602} {"train_loss": -7.117902755737305, "global_step": 193308, "epoch": 4602} {"train_loss": -7.219773292541504, "global_step": 193309, "epoch": 4602} {"train_loss": -7.14362907409668, "global_step": 193310, "epoch": 4602} {"train_loss": -7.254167556762695, "global_step": 193311, "epoch": 4602} {"train_loss": -7.170984745025635, "global_step": 193312, "epoch": 4602} {"train_loss": -7.222163200378418, "global_step": 193313, "epoch": 4602} {"train_loss": -7.283312797546387, "global_step": 193314, "epoch": 4602} {"train_loss": -7.1951141357421875, "global_step": 193315, "epoch": 4602} {"train_loss": -7.307535171508789, "global_step": 193316, "epoch": 4602} {"train_loss": -7.094270706176758, "global_step": 193317, "epoch": 4602} {"train_loss": -7.200613498687744, "global_step": 193318, "epoch": 4602} {"train_loss": -7.260841369628906, "global_step": 193319, "epoch": 4602} {"train_loss": -7.163064956665039, "global_step": 193320, "epoch": 4602} {"train_loss": -7.286931991577148, "global_step": 193321, "epoch": 4602} {"train_loss": -7.234475135803223, "global_step": 193322, "epoch": 4602} {"train_loss": -7.229610443115234, "global_step": 193323, "epoch": 4602} {"train_loss": -7.307678699493408, "global_step": 193324, "epoch": 4602} {"train_loss": -7.199336188180106, "global_step": 193325, "epoch": 4602, "val_loss": 81012.640625} {"train_loss": -7.25737190246582, "global_step": 193326, "epoch": 4603} {"train_loss": -7.346465110778809, "global_step": 193327, "epoch": 4603} {"train_loss": -7.208627700805664, "global_step": 193328, "epoch": 4603} {"train_loss": -7.171591758728027, "global_step": 193329, "epoch": 4603} {"train_loss": -7.043524742126465, "global_step": 193330, "epoch": 4603} {"train_loss": -7.187105655670166, "global_step": 193331, "epoch": 4603} {"train_loss": -7.226077079772949, "global_step": 193332, "epoch": 4603} {"train_loss": -7.149332046508789, "global_step": 193333, "epoch": 4603} {"train_loss": -7.350019454956055, "global_step": 193334, "epoch": 4603} {"train_loss": -7.1939826011657715, "global_step": 193335, "epoch": 4603} {"train_loss": -7.2653422355651855, "global_step": 193336, "epoch": 4603} {"train_loss": -7.237807273864746, "global_step": 193337, "epoch": 4603} {"train_loss": -7.3755106925964355, "global_step": 193338, "epoch": 4603} {"train_loss": -7.206700325012207, "global_step": 193339, "epoch": 4603} {"train_loss": -7.207333564758301, "global_step": 193340, "epoch": 4603} {"train_loss": -7.23503303527832, "global_step": 193341, "epoch": 4603} {"train_loss": -7.269946575164795, "global_step": 193342, "epoch": 4603} {"train_loss": -7.271360874176025, "global_step": 193343, "epoch": 4603} {"train_loss": -7.247159004211426, "global_step": 193344, "epoch": 4603} {"train_loss": -7.256133079528809, "global_step": 193345, "epoch": 4603} {"train_loss": -7.280218601226807, "global_step": 193346, "epoch": 4603} {"train_loss": -7.301074504852295, "global_step": 193347, "epoch": 4603} {"train_loss": -7.298912048339844, "global_step": 193348, "epoch": 4603} {"train_loss": -7.280359268188477, "global_step": 193349, "epoch": 4603} {"train_loss": -7.229135513305664, "global_step": 193350, "epoch": 4603} {"train_loss": -7.205599784851074, "global_step": 193351, "epoch": 4603} {"train_loss": -7.087063789367676, "global_step": 193352, "epoch": 4603} {"train_loss": -7.186426162719727, "global_step": 193353, "epoch": 4603} {"train_loss": -7.170421123504639, "global_step": 193354, "epoch": 4603} {"train_loss": -6.9765424728393555, "global_step": 193355, "epoch": 4603} {"train_loss": -7.206427097320557, "global_step": 193356, "epoch": 4603} {"train_loss": -7.059267997741699, "global_step": 193357, "epoch": 4603} {"train_loss": -7.15950870513916, "global_step": 193358, "epoch": 4603} {"train_loss": -7.094122409820557, "global_step": 193359, "epoch": 4603} {"train_loss": -7.140104293823242, "global_step": 193360, "epoch": 4603} {"train_loss": -7.1747727394104, "global_step": 193361, "epoch": 4603} {"train_loss": -6.9855875968933105, "global_step": 193362, "epoch": 4603} {"train_loss": -7.110115051269531, "global_step": 193363, "epoch": 4603} {"train_loss": -6.967329502105713, "global_step": 193364, "epoch": 4603} {"train_loss": -7.206716537475586, "global_step": 193365, "epoch": 4603} {"train_loss": -7.013669967651367, "global_step": 193366, "epoch": 4603} {"train_loss": -7.187379768916538, "global_step": 193367, "epoch": 4603, "val_loss": 81279.1953125} {"train_loss": -7.185021877288818, "global_step": 193368, "epoch": 4604} {"train_loss": -7.071434020996094, "global_step": 193369, "epoch": 4604} {"train_loss": -7.094950199127197, "global_step": 193370, "epoch": 4604} {"train_loss": -7.12342643737793, "global_step": 193371, "epoch": 4604} {"train_loss": -7.283771991729736, "global_step": 193372, "epoch": 4604} {"train_loss": -7.175968170166016, "global_step": 193373, "epoch": 4604} {"train_loss": -7.1103925704956055, "global_step": 193374, "epoch": 4604} {"train_loss": -7.150875091552734, "global_step": 193375, "epoch": 4604} {"train_loss": -7.179056644439697, "global_step": 193376, "epoch": 4604} {"train_loss": -7.168606758117676, "global_step": 193377, "epoch": 4604} {"train_loss": -7.215874671936035, "global_step": 193378, "epoch": 4604} {"train_loss": -7.223703861236572, "global_step": 193379, "epoch": 4604} {"train_loss": -7.202449798583984, "global_step": 193380, "epoch": 4604} {"train_loss": -7.253542900085449, "global_step": 193381, "epoch": 4604} {"train_loss": -7.1214189529418945, "global_step": 193382, "epoch": 4604} {"train_loss": -7.192384719848633, "global_step": 193383, "epoch": 4604} {"train_loss": -7.209616661071777, "global_step": 193384, "epoch": 4604} {"train_loss": -7.25893497467041, "global_step": 193385, "epoch": 4604} {"train_loss": -7.158185958862305, "global_step": 193386, "epoch": 4604} {"train_loss": -7.267316818237305, "global_step": 193387, "epoch": 4604} {"train_loss": -7.238439559936523, "global_step": 193388, "epoch": 4604} {"train_loss": -7.325063705444336, "global_step": 193389, "epoch": 4604} {"train_loss": -7.215932846069336, "global_step": 193390, "epoch": 4604} {"train_loss": -7.333223342895508, "global_step": 193391, "epoch": 4604} {"train_loss": -7.332311153411865, "global_step": 193392, "epoch": 4604} {"train_loss": -7.311889171600342, "global_step": 193393, "epoch": 4604} {"train_loss": -7.269244194030762, "global_step": 193394, "epoch": 4604} {"train_loss": -7.313403129577637, "global_step": 193395, "epoch": 4604} {"train_loss": -7.155762672424316, "global_step": 193396, "epoch": 4604} {"train_loss": -7.245636463165283, "global_step": 193397, "epoch": 4604} {"train_loss": -7.348611831665039, "global_step": 193398, "epoch": 4604} {"train_loss": -7.145650863647461, "global_step": 193399, "epoch": 4604} {"train_loss": -7.281830787658691, "global_step": 193400, "epoch": 4604} {"train_loss": -7.331315040588379, "global_step": 193401, "epoch": 4604} {"train_loss": -7.377994537353516, "global_step": 193402, "epoch": 4604} {"train_loss": -7.332767486572266, "global_step": 193403, "epoch": 4604} {"train_loss": -7.286197662353516, "global_step": 193404, "epoch": 4604} {"train_loss": -7.248226642608643, "global_step": 193405, "epoch": 4604} {"train_loss": -7.328588485717773, "global_step": 193406, "epoch": 4604} {"train_loss": -7.284436225891113, "global_step": 193407, "epoch": 4604} {"train_loss": -7.192404747009277, "global_step": 193408, "epoch": 4604} {"train_loss": -7.233853181203206, "global_step": 193409, "epoch": 4604, "val_loss": 81432.53125} {"train_loss": -7.275909423828125, "global_step": 193410, "epoch": 4605} {"train_loss": -7.249048233032227, "global_step": 193411, "epoch": 4605} {"train_loss": -7.295172691345215, "global_step": 193412, "epoch": 4605} {"train_loss": -7.3492631912231445, "global_step": 193413, "epoch": 4605} {"train_loss": -7.284488677978516, "global_step": 193414, "epoch": 4605} {"train_loss": -7.277755260467529, "global_step": 193415, "epoch": 4605} {"train_loss": -7.241340160369873, "global_step": 193416, "epoch": 4605} {"train_loss": -7.208195686340332, "global_step": 193417, "epoch": 4605} {"train_loss": -7.233927249908447, "global_step": 193418, "epoch": 4605} {"train_loss": -7.408349514007568, "global_step": 193419, "epoch": 4605} {"train_loss": -7.221926689147949, "global_step": 193420, "epoch": 4605} {"train_loss": -7.175939559936523, "global_step": 193421, "epoch": 4605} {"train_loss": -7.307807445526123, "global_step": 193422, "epoch": 4605} {"train_loss": -7.0826826095581055, "global_step": 193423, "epoch": 4605} {"train_loss": -7.174703121185303, "global_step": 193424, "epoch": 4605} {"train_loss": -7.285081386566162, "global_step": 193425, "epoch": 4605} {"train_loss": -7.01326847076416, "global_step": 193426, "epoch": 4605} {"train_loss": -7.303512096405029, "global_step": 193427, "epoch": 4605} {"train_loss": -7.318280220031738, "global_step": 193428, "epoch": 4605} {"train_loss": -7.232417106628418, "global_step": 193429, "epoch": 4605} {"train_loss": -7.362565040588379, "global_step": 193430, "epoch": 4605} {"train_loss": -7.199594497680664, "global_step": 193431, "epoch": 4605} {"train_loss": -7.272806167602539, "global_step": 193432, "epoch": 4605} {"train_loss": -7.2730913162231445, "global_step": 193433, "epoch": 4605} {"train_loss": -7.199208736419678, "global_step": 193434, "epoch": 4605} {"train_loss": -7.242122650146484, "global_step": 193435, "epoch": 4605} {"train_loss": -7.380893707275391, "global_step": 193436, "epoch": 4605} {"train_loss": -7.265497207641602, "global_step": 193437, "epoch": 4605} {"train_loss": -7.233222961425781, "global_step": 193438, "epoch": 4605} {"train_loss": -7.257204055786133, "global_step": 193439, "epoch": 4605} {"train_loss": -7.2321648597717285, "global_step": 193440, "epoch": 4605} {"train_loss": -7.374855995178223, "global_step": 193441, "epoch": 4605} {"train_loss": -7.263864040374756, "global_step": 193442, "epoch": 4605} {"train_loss": -7.284860134124756, "global_step": 193443, "epoch": 4605} {"train_loss": -7.251421928405762, "global_step": 193444, "epoch": 4605} {"train_loss": -7.258805274963379, "global_step": 193445, "epoch": 4605} {"train_loss": -7.385924816131592, "global_step": 193446, "epoch": 4605} {"train_loss": -7.217879295349121, "global_step": 193447, "epoch": 4605} {"train_loss": -7.404812812805176, "global_step": 193448, "epoch": 4605} {"train_loss": -7.3612284660339355, "global_step": 193449, "epoch": 4605} {"train_loss": -7.271542549133301, "global_step": 193450, "epoch": 4605} {"train_loss": -7.264548574175153, "global_step": 193451, "epoch": 4605, "val_loss": 81121.6328125} {"train_loss": -7.249171257019043, "global_step": 193452, "epoch": 4606} {"train_loss": -7.314927577972412, "global_step": 193453, "epoch": 4606} {"train_loss": -7.342952728271484, "global_step": 193454, "epoch": 4606} {"train_loss": -7.39475154876709, "global_step": 193455, "epoch": 4606} {"train_loss": -7.27324104309082, "global_step": 193456, "epoch": 4606} {"train_loss": -7.207747459411621, "global_step": 193457, "epoch": 4606} {"train_loss": -7.393941879272461, "global_step": 193458, "epoch": 4606} {"train_loss": -7.247873783111572, "global_step": 193459, "epoch": 4606} {"train_loss": -7.139169692993164, "global_step": 193460, "epoch": 4606} {"train_loss": -7.17189884185791, "global_step": 193461, "epoch": 4606} {"train_loss": -7.173573017120361, "global_step": 193462, "epoch": 4606} {"train_loss": -7.084234237670898, "global_step": 193463, "epoch": 4606} {"train_loss": -7.128103256225586, "global_step": 193464, "epoch": 4606} {"train_loss": -7.066585540771484, "global_step": 193465, "epoch": 4606} {"train_loss": -6.915319442749023, "global_step": 193466, "epoch": 4606} {"train_loss": -7.204596519470215, "global_step": 193467, "epoch": 4606} {"train_loss": -7.0507893562316895, "global_step": 193468, "epoch": 4606} {"train_loss": -7.111778259277344, "global_step": 193469, "epoch": 4606} {"train_loss": -7.127463340759277, "global_step": 193470, "epoch": 4606} {"train_loss": -7.024836540222168, "global_step": 193471, "epoch": 4606} {"train_loss": -7.107362270355225, "global_step": 193472, "epoch": 4606} {"train_loss": -6.896178722381592, "global_step": 193473, "epoch": 4606} {"train_loss": -7.092522621154785, "global_step": 193474, "epoch": 4606} {"train_loss": -7.03336238861084, "global_step": 193475, "epoch": 4606} {"train_loss": -7.097986221313477, "global_step": 193476, "epoch": 4606} {"train_loss": -7.111758232116699, "global_step": 193477, "epoch": 4606} {"train_loss": -7.148895263671875, "global_step": 193478, "epoch": 4606} {"train_loss": -7.087119102478027, "global_step": 193479, "epoch": 4606} {"train_loss": -7.139509201049805, "global_step": 193480, "epoch": 4606} {"train_loss": -7.16689920425415, "global_step": 193481, "epoch": 4606} {"train_loss": -7.205419540405273, "global_step": 193482, "epoch": 4606} {"train_loss": -7.068418502807617, "global_step": 193483, "epoch": 4606} {"train_loss": -7.067102432250977, "global_step": 193484, "epoch": 4606} {"train_loss": -7.095314979553223, "global_step": 193485, "epoch": 4606} {"train_loss": -7.141921520233154, "global_step": 193486, "epoch": 4606} {"train_loss": -7.217480182647705, "global_step": 193487, "epoch": 4606} {"train_loss": -7.165294647216797, "global_step": 193488, "epoch": 4606} {"train_loss": -7.139327049255371, "global_step": 193489, "epoch": 4606} {"train_loss": -7.108985900878906, "global_step": 193490, "epoch": 4606} {"train_loss": -7.14674186706543, "global_step": 193491, "epoch": 4606} {"train_loss": -7.137921333312988, "global_step": 193492, "epoch": 4606} {"train_loss": -7.149585451398577, "global_step": 193493, "epoch": 4606, "val_loss": 81170.09375} {"train_loss": -7.225845813751221, "global_step": 193494, "epoch": 4607} {"train_loss": -7.160463809967041, "global_step": 193495, "epoch": 4607} {"train_loss": -7.219992637634277, "global_step": 193496, "epoch": 4607} {"train_loss": -7.3216962814331055, "global_step": 193497, "epoch": 4607} {"train_loss": -7.241955280303955, "global_step": 193498, "epoch": 4607} {"train_loss": -7.273285865783691, "global_step": 193499, "epoch": 4607} {"train_loss": -7.283536434173584, "global_step": 193500, "epoch": 4607} {"train_loss": -7.2259521484375, "global_step": 193501, "epoch": 4607} {"train_loss": -7.358312606811523, "global_step": 193502, "epoch": 4607} {"train_loss": -7.282419204711914, "global_step": 193503, "epoch": 4607} {"train_loss": -7.381600379943848, "global_step": 193504, "epoch": 4607} {"train_loss": -7.272153854370117, "global_step": 193505, "epoch": 4607} {"train_loss": -7.3761305809021, "global_step": 193506, "epoch": 4607} {"train_loss": -7.287697792053223, "global_step": 193507, "epoch": 4607} {"train_loss": -7.2018280029296875, "global_step": 193508, "epoch": 4607} {"train_loss": -7.206046104431152, "global_step": 193509, "epoch": 4607} {"train_loss": -7.2691521644592285, "global_step": 193510, "epoch": 4607} {"train_loss": -7.228186130523682, "global_step": 193511, "epoch": 4607} {"train_loss": -7.219308853149414, "global_step": 193512, "epoch": 4607} {"train_loss": -7.208922386169434, "global_step": 193513, "epoch": 4607} {"train_loss": -7.231309413909912, "global_step": 193514, "epoch": 4607} {"train_loss": -7.261458396911621, "global_step": 193515, "epoch": 4607} {"train_loss": -7.224674701690674, "global_step": 193516, "epoch": 4607} {"train_loss": -7.284173011779785, "global_step": 193517, "epoch": 4607} {"train_loss": -7.22231388092041, "global_step": 193518, "epoch": 4607} {"train_loss": -7.08144474029541, "global_step": 193519, "epoch": 4607} {"train_loss": -7.1515278816223145, "global_step": 193520, "epoch": 4607} {"train_loss": -7.138538360595703, "global_step": 193521, "epoch": 4607} {"train_loss": -7.143865585327148, "global_step": 193522, "epoch": 4607} {"train_loss": -7.106602668762207, "global_step": 193523, "epoch": 4607} {"train_loss": -7.110991954803467, "global_step": 193524, "epoch": 4607} {"train_loss": -7.3790974617004395, "global_step": 193525, "epoch": 4607} {"train_loss": -7.06291389465332, "global_step": 193526, "epoch": 4607} {"train_loss": -7.259364128112793, "global_step": 193527, "epoch": 4607} {"train_loss": -7.365877151489258, "global_step": 193528, "epoch": 4607} {"train_loss": -7.19251823425293, "global_step": 193529, "epoch": 4607} {"train_loss": -7.200573921203613, "global_step": 193530, "epoch": 4607} {"train_loss": -7.253698825836182, "global_step": 193531, "epoch": 4607} {"train_loss": -7.212170600891113, "global_step": 193532, "epoch": 4607} {"train_loss": -7.1516852378845215, "global_step": 193533, "epoch": 4607} {"train_loss": -7.225144386291504, "global_step": 193534, "epoch": 4607} {"train_loss": -7.234365781148274, "global_step": 193535, "epoch": 4607, "val_loss": 81134.6015625} {"train_loss": -7.31134033203125, "global_step": 193536, "epoch": 4608} {"train_loss": -7.282532691955566, "global_step": 193537, "epoch": 4608} {"train_loss": -7.231563568115234, "global_step": 193538, "epoch": 4608} {"train_loss": -7.305720806121826, "global_step": 193539, "epoch": 4608} {"train_loss": -7.24559211730957, "global_step": 193540, "epoch": 4608} {"train_loss": -7.319732666015625, "global_step": 193541, "epoch": 4608} {"train_loss": -7.324846267700195, "global_step": 193542, "epoch": 4608} {"train_loss": -7.293071746826172, "global_step": 193543, "epoch": 4608} {"train_loss": -7.232275009155273, "global_step": 193544, "epoch": 4608} {"train_loss": -7.460539817810059, "global_step": 193545, "epoch": 4608} {"train_loss": -7.314332008361816, "global_step": 193546, "epoch": 4608} {"train_loss": -7.296205997467041, "global_step": 193547, "epoch": 4608} {"train_loss": -7.332543849945068, "global_step": 193548, "epoch": 4608} {"train_loss": -7.24830436706543, "global_step": 193549, "epoch": 4608} {"train_loss": -7.237922668457031, "global_step": 193550, "epoch": 4608} {"train_loss": -7.2647223472595215, "global_step": 193551, "epoch": 4608} {"train_loss": -7.258796691894531, "global_step": 193552, "epoch": 4608} {"train_loss": -7.318955421447754, "global_step": 193553, "epoch": 4608} {"train_loss": -7.1975507736206055, "global_step": 193554, "epoch": 4608} {"train_loss": -7.395051002502441, "global_step": 193555, "epoch": 4608} {"train_loss": -7.256347179412842, "global_step": 193556, "epoch": 4608} {"train_loss": -7.324031352996826, "global_step": 193557, "epoch": 4608} {"train_loss": -7.339334487915039, "global_step": 193558, "epoch": 4608} {"train_loss": -7.359332084655762, "global_step": 193559, "epoch": 4608} {"train_loss": -7.2585649490356445, "global_step": 193560, "epoch": 4608} {"train_loss": -7.2628374099731445, "global_step": 193561, "epoch": 4608} {"train_loss": -7.171177864074707, "global_step": 193562, "epoch": 4608} {"train_loss": -7.359189510345459, "global_step": 193563, "epoch": 4608} {"train_loss": -7.1882171630859375, "global_step": 193564, "epoch": 4608} {"train_loss": -7.264446258544922, "global_step": 193565, "epoch": 4608} {"train_loss": -7.274040222167969, "global_step": 193566, "epoch": 4608} {"train_loss": -7.396754264831543, "global_step": 193567, "epoch": 4608} {"train_loss": -7.226472854614258, "global_step": 193568, "epoch": 4608} {"train_loss": -7.403623580932617, "global_step": 193569, "epoch": 4608} {"train_loss": -7.287344932556152, "global_step": 193570, "epoch": 4608} {"train_loss": -7.248244285583496, "global_step": 193571, "epoch": 4608} {"train_loss": -7.232414245605469, "global_step": 193572, "epoch": 4608} {"train_loss": -7.310843467712402, "global_step": 193573, "epoch": 4608} {"train_loss": -7.2896599769592285, "global_step": 193574, "epoch": 4608} {"train_loss": -7.468034744262695, "global_step": 193575, "epoch": 4608} {"train_loss": -7.190373420715332, "global_step": 193576, "epoch": 4608} {"train_loss": -7.291680279232207, "global_step": 193577, "epoch": 4608, "val_loss": 81173.6484375} {"train_loss": -7.3069562911987305, "global_step": 193578, "epoch": 4609} {"train_loss": -7.389470100402832, "global_step": 193579, "epoch": 4609} {"train_loss": -7.325407981872559, "global_step": 193580, "epoch": 4609} {"train_loss": -7.363953113555908, "global_step": 193581, "epoch": 4609} {"train_loss": -7.285895347595215, "global_step": 193582, "epoch": 4609} {"train_loss": -7.282888889312744, "global_step": 193583, "epoch": 4609} {"train_loss": -7.330941200256348, "global_step": 193584, "epoch": 4609} {"train_loss": -7.403789520263672, "global_step": 193585, "epoch": 4609} {"train_loss": -7.129719257354736, "global_step": 193586, "epoch": 4609} {"train_loss": -7.253993988037109, "global_step": 193587, "epoch": 4609} {"train_loss": -7.3722357749938965, "global_step": 193588, "epoch": 4609} {"train_loss": -7.20517635345459, "global_step": 193589, "epoch": 4609} {"train_loss": -7.302682399749756, "global_step": 193590, "epoch": 4609} {"train_loss": -7.267091751098633, "global_step": 193591, "epoch": 4609} {"train_loss": -7.154140472412109, "global_step": 193592, "epoch": 4609} {"train_loss": -7.235549449920654, "global_step": 193593, "epoch": 4609} {"train_loss": -7.205652236938477, "global_step": 193594, "epoch": 4609} {"train_loss": -7.291278839111328, "global_step": 193595, "epoch": 4609} {"train_loss": -7.194494247436523, "global_step": 193596, "epoch": 4609} {"train_loss": -7.212158679962158, "global_step": 193597, "epoch": 4609} {"train_loss": -7.171928405761719, "global_step": 193598, "epoch": 4609} {"train_loss": -7.2606635093688965, "global_step": 193599, "epoch": 4609} {"train_loss": -7.096166610717773, "global_step": 193600, "epoch": 4609} {"train_loss": -7.292741298675537, "global_step": 193601, "epoch": 4609} {"train_loss": -7.227799892425537, "global_step": 193602, "epoch": 4609} {"train_loss": -7.189445972442627, "global_step": 193603, "epoch": 4609} {"train_loss": -7.0841474533081055, "global_step": 193604, "epoch": 4609} {"train_loss": -7.145937919616699, "global_step": 193605, "epoch": 4609} {"train_loss": -7.226747035980225, "global_step": 193606, "epoch": 4609} {"train_loss": -7.156631946563721, "global_step": 193607, "epoch": 4609} {"train_loss": -7.201610565185547, "global_step": 193608, "epoch": 4609} {"train_loss": -7.108708381652832, "global_step": 193609, "epoch": 4609} {"train_loss": -7.097140312194824, "global_step": 193610, "epoch": 4609} {"train_loss": -7.1992506980896, "global_step": 193611, "epoch": 4609} {"train_loss": -7.2938761711120605, "global_step": 193612, "epoch": 4609} {"train_loss": -7.154249668121338, "global_step": 193613, "epoch": 4609} {"train_loss": -7.114326477050781, "global_step": 193614, "epoch": 4609} {"train_loss": -7.195740222930908, "global_step": 193615, "epoch": 4609} {"train_loss": -7.166630268096924, "global_step": 193616, "epoch": 4609} {"train_loss": -7.11795711517334, "global_step": 193617, "epoch": 4609} {"train_loss": -7.141768455505371, "global_step": 193618, "epoch": 4609} {"train_loss": -7.21838363011678, "global_step": 193619, "epoch": 4609, "val_loss": 81046.2890625} {"train_loss": -7.020184516906738, "global_step": 193620, "epoch": 4610} {"train_loss": -7.081658363342285, "global_step": 193621, "epoch": 4610} {"train_loss": -6.994102954864502, "global_step": 193622, "epoch": 4610} {"train_loss": -7.087300777435303, "global_step": 193623, "epoch": 4610} {"train_loss": -7.039788246154785, "global_step": 193624, "epoch": 4610} {"train_loss": -7.154599189758301, "global_step": 193625, "epoch": 4610} {"train_loss": -7.040587425231934, "global_step": 193626, "epoch": 4610} {"train_loss": -6.978214263916016, "global_step": 193627, "epoch": 4610} {"train_loss": -7.174050331115723, "global_step": 193628, "epoch": 4610} {"train_loss": -6.933140754699707, "global_step": 193629, "epoch": 4610} {"train_loss": -7.17746639251709, "global_step": 193630, "epoch": 4610} {"train_loss": -7.083779811859131, "global_step": 193631, "epoch": 4610} {"train_loss": -7.060090065002441, "global_step": 193632, "epoch": 4610} {"train_loss": -7.056529998779297, "global_step": 193633, "epoch": 4610} {"train_loss": -7.093484401702881, "global_step": 193634, "epoch": 4610} {"train_loss": -7.231376647949219, "global_step": 193635, "epoch": 4610} {"train_loss": -7.145268440246582, "global_step": 193636, "epoch": 4610} {"train_loss": -7.172939777374268, "global_step": 193637, "epoch": 4610} {"train_loss": -6.993599891662598, "global_step": 193638, "epoch": 4610} {"train_loss": -7.154254913330078, "global_step": 193639, "epoch": 4610} {"train_loss": -7.152838706970215, "global_step": 193640, "epoch": 4610} {"train_loss": -7.2060956954956055, "global_step": 193641, "epoch": 4610} {"train_loss": -7.119776725769043, "global_step": 193642, "epoch": 4610} {"train_loss": -7.301700592041016, "global_step": 193643, "epoch": 4610} {"train_loss": -7.129631996154785, "global_step": 193644, "epoch": 4610} {"train_loss": -7.232065677642822, "global_step": 193645, "epoch": 4610} {"train_loss": -7.213523864746094, "global_step": 193646, "epoch": 4610} {"train_loss": -7.199775695800781, "global_step": 193647, "epoch": 4610} {"train_loss": -7.277326583862305, "global_step": 193648, "epoch": 4610} {"train_loss": -7.229251384735107, "global_step": 193649, "epoch": 4610} {"train_loss": -7.176607131958008, "global_step": 193650, "epoch": 4610} {"train_loss": -7.151608467102051, "global_step": 193651, "epoch": 4610} {"train_loss": -7.277901649475098, "global_step": 193652, "epoch": 4610} {"train_loss": -7.325672149658203, "global_step": 193653, "epoch": 4610} {"train_loss": -7.260401725769043, "global_step": 193654, "epoch": 4610} {"train_loss": -7.28541898727417, "global_step": 193655, "epoch": 4610} {"train_loss": -7.315980911254883, "global_step": 193656, "epoch": 4610} {"train_loss": -7.280368804931641, "global_step": 193657, "epoch": 4610} {"train_loss": -7.3160905838012695, "global_step": 193658, "epoch": 4610} {"train_loss": -7.227352142333984, "global_step": 193659, "epoch": 4610} {"train_loss": -7.300396919250488, "global_step": 193660, "epoch": 4610} {"train_loss": -7.164018188204084, "global_step": 193661, "epoch": 4610, "val_loss": 80946.2265625} {"train_loss": -7.274420261383057, "global_step": 193662, "epoch": 4611} {"train_loss": -7.296792984008789, "global_step": 193663, "epoch": 4611} {"train_loss": -7.278728008270264, "global_step": 193664, "epoch": 4611} {"train_loss": -7.319929122924805, "global_step": 193665, "epoch": 4611} {"train_loss": -7.262993335723877, "global_step": 193666, "epoch": 4611} {"train_loss": -7.266603469848633, "global_step": 193667, "epoch": 4611} {"train_loss": -7.240351676940918, "global_step": 193668, "epoch": 4611} {"train_loss": -7.33950662612915, "global_step": 193669, "epoch": 4611} {"train_loss": -7.292430877685547, "global_step": 193670, "epoch": 4611} {"train_loss": -7.221123695373535, "global_step": 193671, "epoch": 4611} {"train_loss": -7.233852386474609, "global_step": 193672, "epoch": 4611} {"train_loss": -7.373991012573242, "global_step": 193673, "epoch": 4611} {"train_loss": -7.3163957595825195, "global_step": 193674, "epoch": 4611} {"train_loss": -7.236539363861084, "global_step": 193675, "epoch": 4611} {"train_loss": -7.262392044067383, "global_step": 193676, "epoch": 4611} {"train_loss": -7.321827411651611, "global_step": 193677, "epoch": 4611} {"train_loss": -7.3696208000183105, "global_step": 193678, "epoch": 4611} {"train_loss": -7.370006084442139, "global_step": 193679, "epoch": 4611} {"train_loss": -7.292292594909668, "global_step": 193680, "epoch": 4611} {"train_loss": -7.329984188079834, "global_step": 193681, "epoch": 4611} {"train_loss": -7.335007190704346, "global_step": 193682, "epoch": 4611} {"train_loss": -7.26271915435791, "global_step": 193683, "epoch": 4611} {"train_loss": -7.317776203155518, "global_step": 193684, "epoch": 4611} {"train_loss": -7.356658935546875, "global_step": 193685, "epoch": 4611} {"train_loss": -7.266161918640137, "global_step": 193686, "epoch": 4611} {"train_loss": -7.282710075378418, "global_step": 193687, "epoch": 4611} {"train_loss": -7.3238115310668945, "global_step": 193688, "epoch": 4611} {"train_loss": -7.412222385406494, "global_step": 193689, "epoch": 4611} {"train_loss": -7.351707458496094, "global_step": 193690, "epoch": 4611} {"train_loss": -7.345928192138672, "global_step": 193691, "epoch": 4611} {"train_loss": -7.33510160446167, "global_step": 193692, "epoch": 4611} {"train_loss": -7.256364822387695, "global_step": 193693, "epoch": 4611} {"train_loss": -7.280597686767578, "global_step": 193694, "epoch": 4611} {"train_loss": -7.319887161254883, "global_step": 193695, "epoch": 4611} {"train_loss": -7.309731960296631, "global_step": 193696, "epoch": 4611} {"train_loss": -7.291659355163574, "global_step": 193697, "epoch": 4611} {"train_loss": -7.238463878631592, "global_step": 193698, "epoch": 4611} {"train_loss": -7.250523567199707, "global_step": 193699, "epoch": 4611} {"train_loss": -7.309676647186279, "global_step": 193700, "epoch": 4611} {"train_loss": -7.227880477905273, "global_step": 193701, "epoch": 4611} {"train_loss": -7.305215358734131, "global_step": 193702, "epoch": 4611} {"train_loss": -7.299940359024775, "global_step": 193703, "epoch": 4611, "val_loss": 81233.53125} {"train_loss": -7.319677829742432, "global_step": 193704, "epoch": 4612} {"train_loss": -7.364085674285889, "global_step": 193705, "epoch": 4612} {"train_loss": -7.096596717834473, "global_step": 193706, "epoch": 4612} {"train_loss": -7.210509300231934, "global_step": 193707, "epoch": 4612} {"train_loss": -7.3950605392456055, "global_step": 193708, "epoch": 4612} {"train_loss": -7.088351726531982, "global_step": 193709, "epoch": 4612} {"train_loss": -7.295123100280762, "global_step": 193710, "epoch": 4612} {"train_loss": -7.343436241149902, "global_step": 193711, "epoch": 4612} {"train_loss": -7.176809310913086, "global_step": 193712, "epoch": 4612} {"train_loss": -7.250153541564941, "global_step": 193713, "epoch": 4612} {"train_loss": -7.207224369049072, "global_step": 193714, "epoch": 4612} {"train_loss": -7.046982288360596, "global_step": 193715, "epoch": 4612} {"train_loss": -7.231450080871582, "global_step": 193716, "epoch": 4612} {"train_loss": -7.169432640075684, "global_step": 193717, "epoch": 4612} {"train_loss": -7.205034255981445, "global_step": 193718, "epoch": 4612} {"train_loss": -7.3495612144470215, "global_step": 193719, "epoch": 4612} {"train_loss": -7.317770957946777, "global_step": 193720, "epoch": 4612} {"train_loss": -7.275903224945068, "global_step": 193721, "epoch": 4612} {"train_loss": -7.263363838195801, "global_step": 193722, "epoch": 4612} {"train_loss": -7.246994495391846, "global_step": 193723, "epoch": 4612} {"train_loss": -7.292786598205566, "global_step": 193724, "epoch": 4612} {"train_loss": -7.209874153137207, "global_step": 193725, "epoch": 4612} {"train_loss": -7.351408958435059, "global_step": 193726, "epoch": 4612} {"train_loss": -7.250594139099121, "global_step": 193727, "epoch": 4612} {"train_loss": -7.3057379722595215, "global_step": 193728, "epoch": 4612} {"train_loss": -7.15500545501709, "global_step": 193729, "epoch": 4612} {"train_loss": -7.25922966003418, "global_step": 193730, "epoch": 4612} {"train_loss": -7.202248573303223, "global_step": 193731, "epoch": 4612} {"train_loss": -7.204958438873291, "global_step": 193732, "epoch": 4612} {"train_loss": -7.274680137634277, "global_step": 193733, "epoch": 4612} {"train_loss": -7.301889419555664, "global_step": 193734, "epoch": 4612} {"train_loss": -7.239132404327393, "global_step": 193735, "epoch": 4612} {"train_loss": -7.326235294342041, "global_step": 193736, "epoch": 4612} {"train_loss": -7.2956085205078125, "global_step": 193737, "epoch": 4612} {"train_loss": -7.178849220275879, "global_step": 193738, "epoch": 4612} {"train_loss": -7.301308631896973, "global_step": 193739, "epoch": 4612} {"train_loss": -7.2423624992370605, "global_step": 193740, "epoch": 4612} {"train_loss": -7.334914684295654, "global_step": 193741, "epoch": 4612} {"train_loss": -7.296952247619629, "global_step": 193742, "epoch": 4612} {"train_loss": -7.334936618804932, "global_step": 193743, "epoch": 4612} {"train_loss": -7.3027873039245605, "global_step": 193744, "epoch": 4612} {"train_loss": -7.256243092673166, "global_step": 193745, "epoch": 4612, "val_loss": 81239.2421875} {"train_loss": -7.2985124588012695, "global_step": 193746, "epoch": 4613} {"train_loss": -7.321074485778809, "global_step": 193747, "epoch": 4613} {"train_loss": -7.365496635437012, "global_step": 193748, "epoch": 4613} {"train_loss": -7.287626266479492, "global_step": 193749, "epoch": 4613} {"train_loss": -7.2901811599731445, "global_step": 193750, "epoch": 4613} {"train_loss": -7.283571243286133, "global_step": 193751, "epoch": 4613} {"train_loss": -7.32268762588501, "global_step": 193752, "epoch": 4613} {"train_loss": -7.342775344848633, "global_step": 193753, "epoch": 4613} {"train_loss": -7.358384132385254, "global_step": 193754, "epoch": 4613} {"train_loss": -7.224308013916016, "global_step": 193755, "epoch": 4613} {"train_loss": -7.245975017547607, "global_step": 193756, "epoch": 4613} {"train_loss": -7.269323348999023, "global_step": 193757, "epoch": 4613} {"train_loss": -7.397688865661621, "global_step": 193758, "epoch": 4613} {"train_loss": -7.190979957580566, "global_step": 193759, "epoch": 4613} {"train_loss": -7.215943336486816, "global_step": 193760, "epoch": 4613} {"train_loss": -7.180248737335205, "global_step": 193761, "epoch": 4613} {"train_loss": -7.164094924926758, "global_step": 193762, "epoch": 4613} {"train_loss": -7.290154457092285, "global_step": 193763, "epoch": 4613} {"train_loss": -7.079311370849609, "global_step": 193764, "epoch": 4613} {"train_loss": -7.09896993637085, "global_step": 193765, "epoch": 4613} {"train_loss": -6.981346130371094, "global_step": 193766, "epoch": 4613} {"train_loss": -7.150945663452148, "global_step": 193767, "epoch": 4613} {"train_loss": -6.978049278259277, "global_step": 193768, "epoch": 4613} {"train_loss": -6.9775543212890625, "global_step": 193769, "epoch": 4613} {"train_loss": -7.038448333740234, "global_step": 193770, "epoch": 4613} {"train_loss": -7.119758605957031, "global_step": 193771, "epoch": 4613} {"train_loss": -6.934842109680176, "global_step": 193772, "epoch": 4613} {"train_loss": -7.159121513366699, "global_step": 193773, "epoch": 4613} {"train_loss": -6.9086456298828125, "global_step": 193774, "epoch": 4613} {"train_loss": -7.024393081665039, "global_step": 193775, "epoch": 4613} {"train_loss": -6.961587429046631, "global_step": 193776, "epoch": 4613} {"train_loss": -7.144186019897461, "global_step": 193777, "epoch": 4613} {"train_loss": -7.104084491729736, "global_step": 193778, "epoch": 4613} {"train_loss": -7.083276271820068, "global_step": 193779, "epoch": 4613} {"train_loss": -7.162230014801025, "global_step": 193780, "epoch": 4613} {"train_loss": -7.028642654418945, "global_step": 193781, "epoch": 4613} {"train_loss": -7.143704414367676, "global_step": 193782, "epoch": 4613} {"train_loss": -7.073060035705566, "global_step": 193783, "epoch": 4613} {"train_loss": -7.131374359130859, "global_step": 193784, "epoch": 4613} {"train_loss": -7.172338485717773, "global_step": 193785, "epoch": 4613} {"train_loss": -7.0351152420043945, "global_step": 193786, "epoch": 4613} {"train_loss": -7.15948672521682, "global_step": 193787, "epoch": 4613, "val_loss": 81384.5859375} {"train_loss": -7.124052047729492, "global_step": 193788, "epoch": 4614} {"train_loss": -7.2720232009887695, "global_step": 193789, "epoch": 4614} {"train_loss": -7.1958208084106445, "global_step": 193790, "epoch": 4614} {"train_loss": -7.291133403778076, "global_step": 193791, "epoch": 4614} {"train_loss": -7.210118293762207, "global_step": 193792, "epoch": 4614} {"train_loss": -7.21340274810791, "global_step": 193793, "epoch": 4614} {"train_loss": -7.226921081542969, "global_step": 193794, "epoch": 4614} {"train_loss": -7.27171516418457, "global_step": 193795, "epoch": 4614} {"train_loss": -7.220478057861328, "global_step": 193796, "epoch": 4614} {"train_loss": -7.335844039916992, "global_step": 193797, "epoch": 4614} {"train_loss": -7.294079303741455, "global_step": 193798, "epoch": 4614} {"train_loss": -7.231910705566406, "global_step": 193799, "epoch": 4614} {"train_loss": -7.262686729431152, "global_step": 193800, "epoch": 4614} {"train_loss": -7.280881881713867, "global_step": 193801, "epoch": 4614} {"train_loss": -7.323709011077881, "global_step": 193802, "epoch": 4614} {"train_loss": -7.260679244995117, "global_step": 193803, "epoch": 4614} {"train_loss": -7.338338375091553, "global_step": 193804, "epoch": 4614} {"train_loss": -7.302861213684082, "global_step": 193805, "epoch": 4614} {"train_loss": -7.251137733459473, "global_step": 193806, "epoch": 4614} {"train_loss": -7.335178375244141, "global_step": 193807, "epoch": 4614} {"train_loss": -7.330119609832764, "global_step": 193808, "epoch": 4614} {"train_loss": -7.296572208404541, "global_step": 193809, "epoch": 4614} {"train_loss": -7.248706817626953, "global_step": 193810, "epoch": 4614} {"train_loss": -7.246151924133301, "global_step": 193811, "epoch": 4614} {"train_loss": -7.351781368255615, "global_step": 193812, "epoch": 4614} {"train_loss": -7.299701690673828, "global_step": 193813, "epoch": 4614} {"train_loss": -7.254271030426025, "global_step": 193814, "epoch": 4614} {"train_loss": -7.280932426452637, "global_step": 193815, "epoch": 4614} {"train_loss": -7.189764976501465, "global_step": 193816, "epoch": 4614} {"train_loss": -7.3699951171875, "global_step": 193817, "epoch": 4614} {"train_loss": -7.4214277267456055, "global_step": 193818, "epoch": 4614} {"train_loss": -7.219123840332031, "global_step": 193819, "epoch": 4614} {"train_loss": -7.291043758392334, "global_step": 193820, "epoch": 4614} {"train_loss": -7.259921550750732, "global_step": 193821, "epoch": 4614} {"train_loss": -7.282546043395996, "global_step": 193822, "epoch": 4614} {"train_loss": -7.368566989898682, "global_step": 193823, "epoch": 4614} {"train_loss": -7.2085347175598145, "global_step": 193824, "epoch": 4614} {"train_loss": -7.256522178649902, "global_step": 193825, "epoch": 4614} {"train_loss": -7.261656284332275, "global_step": 193826, "epoch": 4614} {"train_loss": -7.311203956604004, "global_step": 193827, "epoch": 4614} {"train_loss": -7.203792572021484, "global_step": 193828, "epoch": 4614} {"train_loss": -7.274270750227428, "global_step": 193829, "epoch": 4614, "val_loss": 80953.734375} {"train_loss": -7.244614124298096, "global_step": 193830, "epoch": 4615} {"train_loss": -7.310552597045898, "global_step": 193831, "epoch": 4615} {"train_loss": -7.235598564147949, "global_step": 193832, "epoch": 4615} {"train_loss": -7.334170341491699, "global_step": 193833, "epoch": 4615} {"train_loss": -7.3618011474609375, "global_step": 193834, "epoch": 4615} {"train_loss": -7.322540283203125, "global_step": 193835, "epoch": 4615} {"train_loss": -7.325251579284668, "global_step": 193836, "epoch": 4615} {"train_loss": -7.229877471923828, "global_step": 193837, "epoch": 4615} {"train_loss": -7.2091264724731445, "global_step": 193838, "epoch": 4615} {"train_loss": -7.309776782989502, "global_step": 193839, "epoch": 4615} {"train_loss": -7.242883682250977, "global_step": 193840, "epoch": 4615} {"train_loss": -7.277497291564941, "global_step": 193841, "epoch": 4615} {"train_loss": -7.157841682434082, "global_step": 193842, "epoch": 4615} {"train_loss": -7.229848861694336, "global_step": 193843, "epoch": 4615} {"train_loss": -7.160287380218506, "global_step": 193844, "epoch": 4615} {"train_loss": -7.256946086883545, "global_step": 193845, "epoch": 4615} {"train_loss": -7.266341209411621, "global_step": 193846, "epoch": 4615} {"train_loss": -7.082579612731934, "global_step": 193847, "epoch": 4615} {"train_loss": -7.283483982086182, "global_step": 193848, "epoch": 4615} {"train_loss": -7.392468452453613, "global_step": 193849, "epoch": 4615} {"train_loss": -7.122203826904297, "global_step": 193850, "epoch": 4615} {"train_loss": -7.226241111755371, "global_step": 193851, "epoch": 4615} {"train_loss": -7.1727423667907715, "global_step": 193852, "epoch": 4615} {"train_loss": -7.04396915435791, "global_step": 193853, "epoch": 4615} {"train_loss": -7.316861152648926, "global_step": 193854, "epoch": 4615} {"train_loss": -7.2386980056762695, "global_step": 193855, "epoch": 4615} {"train_loss": -7.202846527099609, "global_step": 193856, "epoch": 4615} {"train_loss": -7.249478340148926, "global_step": 193857, "epoch": 4615} {"train_loss": -7.16950798034668, "global_step": 193858, "epoch": 4615} {"train_loss": -7.289793968200684, "global_step": 193859, "epoch": 4615} {"train_loss": -7.293720245361328, "global_step": 193860, "epoch": 4615} {"train_loss": -7.153581619262695, "global_step": 193861, "epoch": 4615} {"train_loss": -7.221506595611572, "global_step": 193862, "epoch": 4615} {"train_loss": -7.220725059509277, "global_step": 193863, "epoch": 4615} {"train_loss": -7.203292369842529, "global_step": 193864, "epoch": 4615} {"train_loss": -7.219903469085693, "global_step": 193865, "epoch": 4615} {"train_loss": -7.148083686828613, "global_step": 193866, "epoch": 4615} {"train_loss": -7.337028503417969, "global_step": 193867, "epoch": 4615} {"train_loss": -7.171093940734863, "global_step": 193868, "epoch": 4615} {"train_loss": -7.2050886154174805, "global_step": 193869, "epoch": 4615} {"train_loss": -7.238254547119141, "global_step": 193870, "epoch": 4615} {"train_loss": -7.236727260407948, "global_step": 193871, "epoch": 4615, "val_loss": 81043.3046875} {"train_loss": -7.313676834106445, "global_step": 193872, "epoch": 4616} {"train_loss": -7.190752029418945, "global_step": 193873, "epoch": 4616} {"train_loss": -7.257020950317383, "global_step": 193874, "epoch": 4616} {"train_loss": -7.282357692718506, "global_step": 193875, "epoch": 4616} {"train_loss": -7.214484214782715, "global_step": 193876, "epoch": 4616} {"train_loss": -7.381030559539795, "global_step": 193877, "epoch": 4616} {"train_loss": -7.193753719329834, "global_step": 193878, "epoch": 4616} {"train_loss": -7.274753570556641, "global_step": 193879, "epoch": 4616} {"train_loss": -7.2369279861450195, "global_step": 193880, "epoch": 4616} {"train_loss": -7.26158332824707, "global_step": 193881, "epoch": 4616} {"train_loss": -7.2123703956604, "global_step": 193882, "epoch": 4616} {"train_loss": -7.316219329833984, "global_step": 193883, "epoch": 4616} {"train_loss": -7.220074653625488, "global_step": 193884, "epoch": 4616} {"train_loss": -7.255718231201172, "global_step": 193885, "epoch": 4616} {"train_loss": -7.360377311706543, "global_step": 193886, "epoch": 4616} {"train_loss": -7.290520668029785, "global_step": 193887, "epoch": 4616} {"train_loss": -7.23707389831543, "global_step": 193888, "epoch": 4616} {"train_loss": -7.2944231033325195, "global_step": 193889, "epoch": 4616} {"train_loss": -7.168524742126465, "global_step": 193890, "epoch": 4616} {"train_loss": -7.063036918640137, "global_step": 193891, "epoch": 4616} {"train_loss": -7.3076171875, "global_step": 193892, "epoch": 4616} {"train_loss": -7.306626319885254, "global_step": 193893, "epoch": 4616} {"train_loss": -7.235099792480469, "global_step": 193894, "epoch": 4616} {"train_loss": -7.128568172454834, "global_step": 193895, "epoch": 4616} {"train_loss": -7.129071235656738, "global_step": 193896, "epoch": 4616} {"train_loss": -7.285830497741699, "global_step": 193897, "epoch": 4616} {"train_loss": -7.2044267654418945, "global_step": 193898, "epoch": 4616} {"train_loss": -7.279126167297363, "global_step": 193899, "epoch": 4616} {"train_loss": -7.267557144165039, "global_step": 193900, "epoch": 4616} {"train_loss": -7.247513771057129, "global_step": 193901, "epoch": 4616} {"train_loss": -7.219055652618408, "global_step": 193902, "epoch": 4616} {"train_loss": -7.316341400146484, "global_step": 193903, "epoch": 4616} {"train_loss": -7.224688529968262, "global_step": 193904, "epoch": 4616} {"train_loss": -7.245549201965332, "global_step": 193905, "epoch": 4616} {"train_loss": -7.189313888549805, "global_step": 193906, "epoch": 4616} {"train_loss": -7.155035018920898, "global_step": 193907, "epoch": 4616} {"train_loss": -7.24492883682251, "global_step": 193908, "epoch": 4616} {"train_loss": -7.231319904327393, "global_step": 193909, "epoch": 4616} {"train_loss": -7.337119102478027, "global_step": 193910, "epoch": 4616} {"train_loss": -7.232354164123535, "global_step": 193911, "epoch": 4616} {"train_loss": -7.280508995056152, "global_step": 193912, "epoch": 4616} {"train_loss": -7.248034454527355, "global_step": 193913, "epoch": 4616, "val_loss": 80975.140625} {"train_loss": -7.239140033721924, "global_step": 193914, "epoch": 4617} {"train_loss": -7.184520721435547, "global_step": 193915, "epoch": 4617} {"train_loss": -7.077741622924805, "global_step": 193916, "epoch": 4617} {"train_loss": -7.174415588378906, "global_step": 193917, "epoch": 4617} {"train_loss": -7.189930438995361, "global_step": 193918, "epoch": 4617} {"train_loss": -7.244711875915527, "global_step": 193919, "epoch": 4617} {"train_loss": -7.223127365112305, "global_step": 193920, "epoch": 4617} {"train_loss": -7.2437849044799805, "global_step": 193921, "epoch": 4617} {"train_loss": -7.296589374542236, "global_step": 193922, "epoch": 4617} {"train_loss": -7.138469219207764, "global_step": 193923, "epoch": 4617} {"train_loss": -7.249377250671387, "global_step": 193924, "epoch": 4617} {"train_loss": -7.182605266571045, "global_step": 193925, "epoch": 4617} {"train_loss": -7.285896301269531, "global_step": 193926, "epoch": 4617} {"train_loss": -7.174905776977539, "global_step": 193927, "epoch": 4617} {"train_loss": -7.1993207931518555, "global_step": 193928, "epoch": 4617} {"train_loss": -7.081637382507324, "global_step": 193929, "epoch": 4617} {"train_loss": -7.200042247772217, "global_step": 193930, "epoch": 4617} {"train_loss": -7.160749912261963, "global_step": 193931, "epoch": 4617} {"train_loss": -7.090921401977539, "global_step": 193932, "epoch": 4617} {"train_loss": -7.260424613952637, "global_step": 193933, "epoch": 4617} {"train_loss": -7.205765724182129, "global_step": 193934, "epoch": 4617} {"train_loss": -7.165731430053711, "global_step": 193935, "epoch": 4617} {"train_loss": -7.134875297546387, "global_step": 193936, "epoch": 4617} {"train_loss": -7.043020248413086, "global_step": 193937, "epoch": 4617} {"train_loss": -7.196885108947754, "global_step": 193938, "epoch": 4617} {"train_loss": -6.938538551330566, "global_step": 193939, "epoch": 4617} {"train_loss": -7.241959571838379, "global_step": 193940, "epoch": 4617} {"train_loss": -7.069713592529297, "global_step": 193941, "epoch": 4617} {"train_loss": -6.820782661437988, "global_step": 193942, "epoch": 4617} {"train_loss": -7.116119384765625, "global_step": 193943, "epoch": 4617} {"train_loss": -6.875178337097168, "global_step": 193944, "epoch": 4617} {"train_loss": -6.965829849243164, "global_step": 193945, "epoch": 4617} {"train_loss": -7.115878105163574, "global_step": 193946, "epoch": 4617} {"train_loss": -7.177067279815674, "global_step": 193947, "epoch": 4617} {"train_loss": -7.109251022338867, "global_step": 193948, "epoch": 4617} {"train_loss": -7.070867538452148, "global_step": 193949, "epoch": 4617} {"train_loss": -7.118521690368652, "global_step": 193950, "epoch": 4617} {"train_loss": -7.151073455810547, "global_step": 193951, "epoch": 4617} {"train_loss": -7.156398296356201, "global_step": 193952, "epoch": 4617} {"train_loss": -7.126839637756348, "global_step": 193953, "epoch": 4617} {"train_loss": -7.1337690353393555, "global_step": 193954, "epoch": 4617} {"train_loss": -7.141843296232677, "global_step": 193955, "epoch": 4617, "val_loss": 80899.8359375} {"train_loss": -7.217380523681641, "global_step": 193956, "epoch": 4618} {"train_loss": -7.054378509521484, "global_step": 193957, "epoch": 4618} {"train_loss": -7.205095291137695, "global_step": 193958, "epoch": 4618} {"train_loss": -7.142934799194336, "global_step": 193959, "epoch": 4618} {"train_loss": -7.192502021789551, "global_step": 193960, "epoch": 4618} {"train_loss": -7.128193378448486, "global_step": 193961, "epoch": 4618} {"train_loss": -7.143101215362549, "global_step": 193962, "epoch": 4618} {"train_loss": -7.300374984741211, "global_step": 193963, "epoch": 4618} {"train_loss": -7.2355875968933105, "global_step": 193964, "epoch": 4618} {"train_loss": -7.271296501159668, "global_step": 193965, "epoch": 4618} {"train_loss": -7.294595718383789, "global_step": 193966, "epoch": 4618} {"train_loss": -7.2042717933654785, "global_step": 193967, "epoch": 4618} {"train_loss": -7.235560417175293, "global_step": 193968, "epoch": 4618} {"train_loss": -7.3369646072387695, "global_step": 193969, "epoch": 4618} {"train_loss": -7.221403121948242, "global_step": 193970, "epoch": 4618} {"train_loss": -7.263608932495117, "global_step": 193971, "epoch": 4618} {"train_loss": -7.284134864807129, "global_step": 193972, "epoch": 4618} {"train_loss": -7.24908447265625, "global_step": 193973, "epoch": 4618} {"train_loss": -7.192144393920898, "global_step": 193974, "epoch": 4618} {"train_loss": -7.2600884437561035, "global_step": 193975, "epoch": 4618} {"train_loss": -7.133620262145996, "global_step": 193976, "epoch": 4618} {"train_loss": -7.151281356811523, "global_step": 193977, "epoch": 4618} {"train_loss": -7.173578262329102, "global_step": 193978, "epoch": 4618} {"train_loss": -7.06348991394043, "global_step": 193979, "epoch": 4618} {"train_loss": -7.06959342956543, "global_step": 193980, "epoch": 4618} {"train_loss": -7.1030049324035645, "global_step": 193981, "epoch": 4618} {"train_loss": -7.051876544952393, "global_step": 193982, "epoch": 4618} {"train_loss": -7.090027332305908, "global_step": 193983, "epoch": 4618} {"train_loss": -6.979589462280273, "global_step": 193984, "epoch": 4618} {"train_loss": -7.098639965057373, "global_step": 193985, "epoch": 4618} {"train_loss": -7.000493049621582, "global_step": 193986, "epoch": 4618} {"train_loss": -7.226882457733154, "global_step": 193987, "epoch": 4618} {"train_loss": -6.983062744140625, "global_step": 193988, "epoch": 4618} {"train_loss": -7.081206321716309, "global_step": 193989, "epoch": 4618} {"train_loss": -6.9976582527160645, "global_step": 193990, "epoch": 4618} {"train_loss": -7.0366621017456055, "global_step": 193991, "epoch": 4618} {"train_loss": -7.059297561645508, "global_step": 193992, "epoch": 4618} {"train_loss": -7.050388813018799, "global_step": 193993, "epoch": 4618} {"train_loss": -7.02257776260376, "global_step": 193994, "epoch": 4618} {"train_loss": -7.110872745513916, "global_step": 193995, "epoch": 4618} {"train_loss": -7.089509010314941, "global_step": 193996, "epoch": 4618} {"train_loss": -7.144498302823021, "global_step": 193997, "epoch": 4618, "val_loss": 81508.2734375} {"train_loss": -7.130627632141113, "global_step": 193998, "epoch": 4619} {"train_loss": -7.0526251792907715, "global_step": 193999, "epoch": 4619} {"train_loss": -7.161803245544434, "global_step": 194000, "epoch": 4619} {"train_loss": -7.120515823364258, "global_step": 194001, "epoch": 4619} {"train_loss": -7.265771865844727, "global_step": 194002, "epoch": 4619} {"train_loss": -7.200841903686523, "global_step": 194003, "epoch": 4619} {"train_loss": -7.239053249359131, "global_step": 194004, "epoch": 4619} {"train_loss": -7.201331615447998, "global_step": 194005, "epoch": 4619} {"train_loss": -7.228078365325928, "global_step": 194006, "epoch": 4619} {"train_loss": -7.2349042892456055, "global_step": 194007, "epoch": 4619} {"train_loss": -7.188128471374512, "global_step": 194008, "epoch": 4619} {"train_loss": -7.153221130371094, "global_step": 194009, "epoch": 4619} {"train_loss": -7.187859058380127, "global_step": 194010, "epoch": 4619} {"train_loss": -7.2045698165893555, "global_step": 194011, "epoch": 4619} {"train_loss": -7.179141998291016, "global_step": 194012, "epoch": 4619} {"train_loss": -7.167675495147705, "global_step": 194013, "epoch": 4619} {"train_loss": -7.099891662597656, "global_step": 194014, "epoch": 4619} {"train_loss": -7.176252365112305, "global_step": 194015, "epoch": 4619} {"train_loss": -7.246671676635742, "global_step": 194016, "epoch": 4619} {"train_loss": -7.273221015930176, "global_step": 194017, "epoch": 4619} {"train_loss": -7.135041236877441, "global_step": 194018, "epoch": 4619} {"train_loss": -7.232670783996582, "global_step": 194019, "epoch": 4619} {"train_loss": -7.298616409301758, "global_step": 194020, "epoch": 4619} {"train_loss": -7.283576965332031, "global_step": 194021, "epoch": 4619} {"train_loss": -7.347671985626221, "global_step": 194022, "epoch": 4619} {"train_loss": -7.370176315307617, "global_step": 194023, "epoch": 4619} {"train_loss": -7.222347259521484, "global_step": 194024, "epoch": 4619} {"train_loss": -7.3178181648254395, "global_step": 194025, "epoch": 4619} {"train_loss": -7.2908101081848145, "global_step": 194026, "epoch": 4619} {"train_loss": -7.1835174560546875, "global_step": 194027, "epoch": 4619} {"train_loss": -7.296947479248047, "global_step": 194028, "epoch": 4619} {"train_loss": -7.352858066558838, "global_step": 194029, "epoch": 4619} {"train_loss": -7.295947551727295, "global_step": 194030, "epoch": 4619} {"train_loss": -7.181894302368164, "global_step": 194031, "epoch": 4619} {"train_loss": -7.226929187774658, "global_step": 194032, "epoch": 4619} {"train_loss": -7.436079978942871, "global_step": 194033, "epoch": 4619} {"train_loss": -7.284919738769531, "global_step": 194034, "epoch": 4619} {"train_loss": -7.400115013122559, "global_step": 194035, "epoch": 4619} {"train_loss": -7.287540435791016, "global_step": 194036, "epoch": 4619} {"train_loss": -7.365633487701416, "global_step": 194037, "epoch": 4619} {"train_loss": -7.362367630004883, "global_step": 194038, "epoch": 4619} {"train_loss": -7.242687906537737, "global_step": 194039, "epoch": 4619, "val_loss": 81297.546875} {"train_loss": -7.220609664916992, "global_step": 194040, "epoch": 4620} {"train_loss": -7.261968612670898, "global_step": 194041, "epoch": 4620} {"train_loss": -7.328899383544922, "global_step": 194042, "epoch": 4620} {"train_loss": -7.306455612182617, "global_step": 194043, "epoch": 4620} {"train_loss": -7.287741184234619, "global_step": 194044, "epoch": 4620} {"train_loss": -7.307671546936035, "global_step": 194045, "epoch": 4620} {"train_loss": -7.28516149520874, "global_step": 194046, "epoch": 4620} {"train_loss": -7.274495601654053, "global_step": 194047, "epoch": 4620} {"train_loss": -7.3487067222595215, "global_step": 194048, "epoch": 4620} {"train_loss": -7.168810844421387, "global_step": 194049, "epoch": 4620} {"train_loss": -7.307847499847412, "global_step": 194050, "epoch": 4620} {"train_loss": -7.106160640716553, "global_step": 194051, "epoch": 4620} {"train_loss": -7.2452239990234375, "global_step": 194052, "epoch": 4620} {"train_loss": -7.254909515380859, "global_step": 194053, "epoch": 4620} {"train_loss": -7.251103401184082, "global_step": 194054, "epoch": 4620} {"train_loss": -7.334778785705566, "global_step": 194055, "epoch": 4620} {"train_loss": -7.363951206207275, "global_step": 194056, "epoch": 4620} {"train_loss": -7.210667610168457, "global_step": 194057, "epoch": 4620} {"train_loss": -7.250432968139648, "global_step": 194058, "epoch": 4620} {"train_loss": -7.200915336608887, "global_step": 194059, "epoch": 4620} {"train_loss": -7.148900985717773, "global_step": 194060, "epoch": 4620} {"train_loss": -7.136919021606445, "global_step": 194061, "epoch": 4620} {"train_loss": -7.231925010681152, "global_step": 194062, "epoch": 4620} {"train_loss": -7.3101701736450195, "global_step": 194063, "epoch": 4620} {"train_loss": -7.147274017333984, "global_step": 194064, "epoch": 4620} {"train_loss": -6.989938259124756, "global_step": 194065, "epoch": 4620} {"train_loss": -7.367011070251465, "global_step": 194066, "epoch": 4620} {"train_loss": -7.137148380279541, "global_step": 194067, "epoch": 4620} {"train_loss": -7.079319953918457, "global_step": 194068, "epoch": 4620} {"train_loss": -7.208038330078125, "global_step": 194069, "epoch": 4620} {"train_loss": -7.325011253356934, "global_step": 194070, "epoch": 4620} {"train_loss": -7.219836235046387, "global_step": 194071, "epoch": 4620} {"train_loss": -7.2614569664001465, "global_step": 194072, "epoch": 4620} {"train_loss": -7.27819299697876, "global_step": 194073, "epoch": 4620} {"train_loss": -7.316736221313477, "global_step": 194074, "epoch": 4620} {"train_loss": -7.318515777587891, "global_step": 194075, "epoch": 4620} {"train_loss": -7.269576072692871, "global_step": 194076, "epoch": 4620} {"train_loss": -7.323209762573242, "global_step": 194077, "epoch": 4620} {"train_loss": -7.242018699645996, "global_step": 194078, "epoch": 4620} {"train_loss": -7.239058017730713, "global_step": 194079, "epoch": 4620} {"train_loss": -7.402298927307129, "global_step": 194080, "epoch": 4620} {"train_loss": -7.251390525272915, "global_step": 194081, "epoch": 4620, "val_loss": 81244.5} {"train_loss": -7.35768985748291, "global_step": 194082, "epoch": 4621} {"train_loss": -7.272727012634277, "global_step": 194083, "epoch": 4621} {"train_loss": -7.28127908706665, "global_step": 194084, "epoch": 4621} {"train_loss": -7.351837158203125, "global_step": 194085, "epoch": 4621} {"train_loss": -7.468052387237549, "global_step": 194086, "epoch": 4621} {"train_loss": -7.340535640716553, "global_step": 194087, "epoch": 4621} {"train_loss": -7.315647125244141, "global_step": 194088, "epoch": 4621} {"train_loss": -7.3148112297058105, "global_step": 194089, "epoch": 4621} {"train_loss": -7.225566387176514, "global_step": 194090, "epoch": 4621} {"train_loss": -7.283387660980225, "global_step": 194091, "epoch": 4621} {"train_loss": -7.26181697845459, "global_step": 194092, "epoch": 4621} {"train_loss": -7.250243186950684, "global_step": 194093, "epoch": 4621} {"train_loss": -7.3649067878723145, "global_step": 194094, "epoch": 4621} {"train_loss": -7.299966335296631, "global_step": 194095, "epoch": 4621} {"train_loss": -7.220393657684326, "global_step": 194096, "epoch": 4621} {"train_loss": -7.293184280395508, "global_step": 194097, "epoch": 4621} {"train_loss": -7.233051776885986, "global_step": 194098, "epoch": 4621} {"train_loss": -7.3061981201171875, "global_step": 194099, "epoch": 4621} {"train_loss": -7.316859245300293, "global_step": 194100, "epoch": 4621} {"train_loss": -7.225676536560059, "global_step": 194101, "epoch": 4621} {"train_loss": -7.230033874511719, "global_step": 194102, "epoch": 4621} {"train_loss": -7.173137664794922, "global_step": 194103, "epoch": 4621} {"train_loss": -7.2813615798950195, "global_step": 194104, "epoch": 4621} {"train_loss": -7.306156158447266, "global_step": 194105, "epoch": 4621} {"train_loss": -7.089458465576172, "global_step": 194106, "epoch": 4621} {"train_loss": -7.157107353210449, "global_step": 194107, "epoch": 4621} {"train_loss": -7.239278793334961, "global_step": 194108, "epoch": 4621} {"train_loss": -7.260457992553711, "global_step": 194109, "epoch": 4621} {"train_loss": -7.152864933013916, "global_step": 194110, "epoch": 4621} {"train_loss": -7.292309284210205, "global_step": 194111, "epoch": 4621} {"train_loss": -7.318010330200195, "global_step": 194112, "epoch": 4621} {"train_loss": -7.197035789489746, "global_step": 194113, "epoch": 4621} {"train_loss": -7.244502067565918, "global_step": 194114, "epoch": 4621} {"train_loss": -7.2029547691345215, "global_step": 194115, "epoch": 4621} {"train_loss": -7.010305404663086, "global_step": 194116, "epoch": 4621} {"train_loss": -7.177087783813477, "global_step": 194117, "epoch": 4621} {"train_loss": -7.189827919006348, "global_step": 194118, "epoch": 4621} {"train_loss": -7.239891052246094, "global_step": 194119, "epoch": 4621} {"train_loss": -7.224875450134277, "global_step": 194120, "epoch": 4621} {"train_loss": -7.103571891784668, "global_step": 194121, "epoch": 4621} {"train_loss": -7.193153381347656, "global_step": 194122, "epoch": 4621} {"train_loss": -7.249843892597017, "global_step": 194123, "epoch": 4621, "val_loss": 81296.90625} {"train_loss": -7.313921928405762, "global_step": 194124, "epoch": 4622} {"train_loss": -7.223069190979004, "global_step": 194125, "epoch": 4622} {"train_loss": -7.273612976074219, "global_step": 194126, "epoch": 4622} {"train_loss": -7.129976749420166, "global_step": 194127, "epoch": 4622} {"train_loss": -7.1299967765808105, "global_step": 194128, "epoch": 4622} {"train_loss": -7.246269226074219, "global_step": 194129, "epoch": 4622} {"train_loss": -7.1631364822387695, "global_step": 194130, "epoch": 4622} {"train_loss": -7.267467498779297, "global_step": 194131, "epoch": 4622} {"train_loss": -7.188246726989746, "global_step": 194132, "epoch": 4622} {"train_loss": -7.269510269165039, "global_step": 194133, "epoch": 4622} {"train_loss": -7.3286638259887695, "global_step": 194134, "epoch": 4622} {"train_loss": -7.273797512054443, "global_step": 194135, "epoch": 4622} {"train_loss": -7.3117170333862305, "global_step": 194136, "epoch": 4622} {"train_loss": -7.38075065612793, "global_step": 194137, "epoch": 4622} {"train_loss": -7.256307125091553, "global_step": 194138, "epoch": 4622} {"train_loss": -7.230480194091797, "global_step": 194139, "epoch": 4622} {"train_loss": -7.352581977844238, "global_step": 194140, "epoch": 4622} {"train_loss": -7.315914154052734, "global_step": 194141, "epoch": 4622} {"train_loss": -7.312786102294922, "global_step": 194142, "epoch": 4622} {"train_loss": -7.339947700500488, "global_step": 194143, "epoch": 4622} {"train_loss": -7.376018524169922, "global_step": 194144, "epoch": 4622} {"train_loss": -7.296853065490723, "global_step": 194145, "epoch": 4622} {"train_loss": -7.342034816741943, "global_step": 194146, "epoch": 4622} {"train_loss": -7.361310958862305, "global_step": 194147, "epoch": 4622} {"train_loss": -7.298407554626465, "global_step": 194148, "epoch": 4622} {"train_loss": -7.367290019989014, "global_step": 194149, "epoch": 4622} {"train_loss": -7.255041122436523, "global_step": 194150, "epoch": 4622} {"train_loss": -7.362180709838867, "global_step": 194151, "epoch": 4622} {"train_loss": -7.266422748565674, "global_step": 194152, "epoch": 4622} {"train_loss": -7.421483516693115, "global_step": 194153, "epoch": 4622} {"train_loss": -7.241119861602783, "global_step": 194154, "epoch": 4622} {"train_loss": -7.125771522521973, "global_step": 194155, "epoch": 4622} {"train_loss": -7.287781715393066, "global_step": 194156, "epoch": 4622} {"train_loss": -7.2466230392456055, "global_step": 194157, "epoch": 4622} {"train_loss": -7.119131088256836, "global_step": 194158, "epoch": 4622} {"train_loss": -7.263875484466553, "global_step": 194159, "epoch": 4622} {"train_loss": -7.302512168884277, "global_step": 194160, "epoch": 4622} {"train_loss": -7.225586891174316, "global_step": 194161, "epoch": 4622} {"train_loss": -7.279602527618408, "global_step": 194162, "epoch": 4622} {"train_loss": -7.231827259063721, "global_step": 194163, "epoch": 4622} {"train_loss": -7.157384872436523, "global_step": 194164, "epoch": 4622} {"train_loss": -7.270828723907471, "global_step": 194165, "epoch": 4622, "val_loss": 81258.2890625} {"train_loss": -7.311807632446289, "global_step": 194166, "epoch": 4623} {"train_loss": -7.209919452667236, "global_step": 194167, "epoch": 4623} {"train_loss": -7.202518939971924, "global_step": 194168, "epoch": 4623} {"train_loss": -7.313882827758789, "global_step": 194169, "epoch": 4623} {"train_loss": -7.233044624328613, "global_step": 194170, "epoch": 4623} {"train_loss": -7.171714782714844, "global_step": 194171, "epoch": 4623} {"train_loss": -7.267665863037109, "global_step": 194172, "epoch": 4623} {"train_loss": -7.2547149658203125, "global_step": 194173, "epoch": 4623} {"train_loss": -7.199069023132324, "global_step": 194174, "epoch": 4623} {"train_loss": -7.321124076843262, "global_step": 194175, "epoch": 4623} {"train_loss": -7.266756534576416, "global_step": 194176, "epoch": 4623} {"train_loss": -7.163387298583984, "global_step": 194177, "epoch": 4623} {"train_loss": -7.246511459350586, "global_step": 194178, "epoch": 4623} {"train_loss": -7.294063091278076, "global_step": 194179, "epoch": 4623} {"train_loss": -7.29896354675293, "global_step": 194180, "epoch": 4623} {"train_loss": -7.225411415100098, "global_step": 194181, "epoch": 4623} {"train_loss": -7.244406700134277, "global_step": 194182, "epoch": 4623} {"train_loss": -7.385193824768066, "global_step": 194183, "epoch": 4623} {"train_loss": -7.310776710510254, "global_step": 194184, "epoch": 4623} {"train_loss": -7.352511405944824, "global_step": 194185, "epoch": 4623} {"train_loss": -7.359927177429199, "global_step": 194186, "epoch": 4623} {"train_loss": -7.286293983459473, "global_step": 194187, "epoch": 4623} {"train_loss": -7.2293782234191895, "global_step": 194188, "epoch": 4623} {"train_loss": -7.3462018966674805, "global_step": 194189, "epoch": 4623} {"train_loss": -7.263797760009766, "global_step": 194190, "epoch": 4623} {"train_loss": -7.245296478271484, "global_step": 194191, "epoch": 4623} {"train_loss": -7.436716079711914, "global_step": 194192, "epoch": 4623} {"train_loss": -7.291303634643555, "global_step": 194193, "epoch": 4623} {"train_loss": -7.359215259552002, "global_step": 194194, "epoch": 4623} {"train_loss": -7.259659767150879, "global_step": 194195, "epoch": 4623} {"train_loss": -7.28985595703125, "global_step": 194196, "epoch": 4623} {"train_loss": -7.317845821380615, "global_step": 194197, "epoch": 4623} {"train_loss": -7.248528480529785, "global_step": 194198, "epoch": 4623} {"train_loss": -7.305832862854004, "global_step": 194199, "epoch": 4623} {"train_loss": -7.219794273376465, "global_step": 194200, "epoch": 4623} {"train_loss": -7.270928382873535, "global_step": 194201, "epoch": 4623} {"train_loss": -7.217752933502197, "global_step": 194202, "epoch": 4623} {"train_loss": -7.250716209411621, "global_step": 194203, "epoch": 4623} {"train_loss": -7.271965980529785, "global_step": 194204, "epoch": 4623} {"train_loss": -7.218526840209961, "global_step": 194205, "epoch": 4623} {"train_loss": -7.316429138183594, "global_step": 194206, "epoch": 4623} {"train_loss": -7.273689644677298, "global_step": 194207, "epoch": 4623, "val_loss": 81348.015625} {"train_loss": -7.131335258483887, "global_step": 194208, "epoch": 4624} {"train_loss": -7.241578102111816, "global_step": 194209, "epoch": 4624} {"train_loss": -7.2528910636901855, "global_step": 194210, "epoch": 4624} {"train_loss": -7.129645824432373, "global_step": 194211, "epoch": 4624} {"train_loss": -7.238996505737305, "global_step": 194212, "epoch": 4624} {"train_loss": -7.16890287399292, "global_step": 194213, "epoch": 4624} {"train_loss": -7.302639961242676, "global_step": 194214, "epoch": 4624} {"train_loss": -7.151052951812744, "global_step": 194215, "epoch": 4624} {"train_loss": -7.28110933303833, "global_step": 194216, "epoch": 4624} {"train_loss": -7.188019752502441, "global_step": 194217, "epoch": 4624} {"train_loss": -7.2608642578125, "global_step": 194218, "epoch": 4624} {"train_loss": -7.332934379577637, "global_step": 194219, "epoch": 4624} {"train_loss": -7.166583061218262, "global_step": 194220, "epoch": 4624} {"train_loss": -7.266132354736328, "global_step": 194221, "epoch": 4624} {"train_loss": -7.218329429626465, "global_step": 194222, "epoch": 4624} {"train_loss": -7.1381635665893555, "global_step": 194223, "epoch": 4624} {"train_loss": -7.28773307800293, "global_step": 194224, "epoch": 4624} {"train_loss": -7.24687385559082, "global_step": 194225, "epoch": 4624} {"train_loss": -7.286694526672363, "global_step": 194226, "epoch": 4624} {"train_loss": -7.29418420791626, "global_step": 194227, "epoch": 4624} {"train_loss": -7.229404449462891, "global_step": 194228, "epoch": 4624} {"train_loss": -7.296201229095459, "global_step": 194229, "epoch": 4624} {"train_loss": -7.202352523803711, "global_step": 194230, "epoch": 4624} {"train_loss": -7.261206150054932, "global_step": 194231, "epoch": 4624} {"train_loss": -7.127467632293701, "global_step": 194232, "epoch": 4624} {"train_loss": -7.365323066711426, "global_step": 194233, "epoch": 4624} {"train_loss": -7.251171112060547, "global_step": 194234, "epoch": 4624} {"train_loss": -7.2660627365112305, "global_step": 194235, "epoch": 4624} {"train_loss": -7.21512508392334, "global_step": 194236, "epoch": 4624} {"train_loss": -7.1804022789001465, "global_step": 194237, "epoch": 4624} {"train_loss": -7.233941078186035, "global_step": 194238, "epoch": 4624} {"train_loss": -7.09446907043457, "global_step": 194239, "epoch": 4624} {"train_loss": -7.266437530517578, "global_step": 194240, "epoch": 4624} {"train_loss": -7.148444652557373, "global_step": 194241, "epoch": 4624} {"train_loss": -7.25734806060791, "global_step": 194242, "epoch": 4624} {"train_loss": -7.197021007537842, "global_step": 194243, "epoch": 4624} {"train_loss": -7.280610084533691, "global_step": 194244, "epoch": 4624} {"train_loss": -7.214188575744629, "global_step": 194245, "epoch": 4624} {"train_loss": -7.13638162612915, "global_step": 194246, "epoch": 4624} {"train_loss": -7.308762550354004, "global_step": 194247, "epoch": 4624} {"train_loss": -7.2055439949035645, "global_step": 194248, "epoch": 4624} {"train_loss": -7.227733771006267, "global_step": 194249, "epoch": 4624, "val_loss": 81335.1796875} {"train_loss": -7.102217197418213, "global_step": 194250, "epoch": 4625} {"train_loss": -7.209004878997803, "global_step": 194251, "epoch": 4625} {"train_loss": -7.274613857269287, "global_step": 194252, "epoch": 4625} {"train_loss": -7.227569103240967, "global_step": 194253, "epoch": 4625} {"train_loss": -7.24801778793335, "global_step": 194254, "epoch": 4625} {"train_loss": -7.083929061889648, "global_step": 194255, "epoch": 4625} {"train_loss": -7.294826507568359, "global_step": 194256, "epoch": 4625} {"train_loss": -7.2715911865234375, "global_step": 194257, "epoch": 4625} {"train_loss": -7.230802536010742, "global_step": 194258, "epoch": 4625} {"train_loss": -7.309111595153809, "global_step": 194259, "epoch": 4625} {"train_loss": -7.261525630950928, "global_step": 194260, "epoch": 4625} {"train_loss": -7.344057083129883, "global_step": 194261, "epoch": 4625} {"train_loss": -7.184201240539551, "global_step": 194262, "epoch": 4625} {"train_loss": -7.1230926513671875, "global_step": 194263, "epoch": 4625} {"train_loss": -7.317131042480469, "global_step": 194264, "epoch": 4625} {"train_loss": -7.034455299377441, "global_step": 194265, "epoch": 4625} {"train_loss": -7.214662551879883, "global_step": 194266, "epoch": 4625} {"train_loss": -7.342361927032471, "global_step": 194267, "epoch": 4625} {"train_loss": -7.264575004577637, "global_step": 194268, "epoch": 4625} {"train_loss": -7.273182392120361, "global_step": 194269, "epoch": 4625} {"train_loss": -7.3575334548950195, "global_step": 194270, "epoch": 4625} {"train_loss": -7.137737274169922, "global_step": 194271, "epoch": 4625} {"train_loss": -7.351737022399902, "global_step": 194272, "epoch": 4625} {"train_loss": -7.363705635070801, "global_step": 194273, "epoch": 4625} {"train_loss": -7.236922264099121, "global_step": 194274, "epoch": 4625} {"train_loss": -7.171728134155273, "global_step": 194275, "epoch": 4625} {"train_loss": -7.321399688720703, "global_step": 194276, "epoch": 4625} {"train_loss": -7.336159706115723, "global_step": 194277, "epoch": 4625} {"train_loss": -7.272006034851074, "global_step": 194278, "epoch": 4625} {"train_loss": -7.2384934425354, "global_step": 194279, "epoch": 4625} {"train_loss": -7.19069242477417, "global_step": 194280, "epoch": 4625} {"train_loss": -7.260114669799805, "global_step": 194281, "epoch": 4625} {"train_loss": -7.320121765136719, "global_step": 194282, "epoch": 4625} {"train_loss": -7.354700088500977, "global_step": 194283, "epoch": 4625} {"train_loss": -7.077996730804443, "global_step": 194284, "epoch": 4625} {"train_loss": -7.30335807800293, "global_step": 194285, "epoch": 4625} {"train_loss": -7.2111663818359375, "global_step": 194286, "epoch": 4625} {"train_loss": -7.20082950592041, "global_step": 194287, "epoch": 4625} {"train_loss": -7.211637020111084, "global_step": 194288, "epoch": 4625} {"train_loss": -7.333668231964111, "global_step": 194289, "epoch": 4625} {"train_loss": -7.342517852783203, "global_step": 194290, "epoch": 4625} {"train_loss": -7.248226018179031, "global_step": 194291, "epoch": 4625, "val_loss": 80997.921875} {"train_loss": -7.330229759216309, "global_step": 194292, "epoch": 4626} {"train_loss": -7.264645099639893, "global_step": 194293, "epoch": 4626} {"train_loss": -7.29765510559082, "global_step": 194294, "epoch": 4626} {"train_loss": -7.247962951660156, "global_step": 194295, "epoch": 4626} {"train_loss": -7.300285816192627, "global_step": 194296, "epoch": 4626} {"train_loss": -7.2440690994262695, "global_step": 194297, "epoch": 4626} {"train_loss": -7.20147705078125, "global_step": 194298, "epoch": 4626} {"train_loss": -7.244524002075195, "global_step": 194299, "epoch": 4626} {"train_loss": -7.3856520652771, "global_step": 194300, "epoch": 4626} {"train_loss": -7.332406044006348, "global_step": 194301, "epoch": 4626} {"train_loss": -7.382145881652832, "global_step": 194302, "epoch": 4626} {"train_loss": -7.172464370727539, "global_step": 194303, "epoch": 4626} {"train_loss": -7.265921592712402, "global_step": 194304, "epoch": 4626} {"train_loss": -7.243844985961914, "global_step": 194305, "epoch": 4626} {"train_loss": -7.224470138549805, "global_step": 194306, "epoch": 4626} {"train_loss": -7.222041130065918, "global_step": 194307, "epoch": 4626} {"train_loss": -7.307978630065918, "global_step": 194308, "epoch": 4626} {"train_loss": -7.285671710968018, "global_step": 194309, "epoch": 4626} {"train_loss": -6.996589183807373, "global_step": 194310, "epoch": 4626} {"train_loss": -7.223170280456543, "global_step": 194311, "epoch": 4626} {"train_loss": -7.171947479248047, "global_step": 194312, "epoch": 4626} {"train_loss": -7.133669853210449, "global_step": 194313, "epoch": 4626} {"train_loss": -7.361147880554199, "global_step": 194314, "epoch": 4626} {"train_loss": -7.017806053161621, "global_step": 194315, "epoch": 4626} {"train_loss": -7.09531307220459, "global_step": 194316, "epoch": 4626} {"train_loss": -7.181519985198975, "global_step": 194317, "epoch": 4626} {"train_loss": -6.9743733406066895, "global_step": 194318, "epoch": 4626} {"train_loss": -7.108829498291016, "global_step": 194319, "epoch": 4626} {"train_loss": -7.19529390335083, "global_step": 194320, "epoch": 4626} {"train_loss": -6.962760925292969, "global_step": 194321, "epoch": 4626} {"train_loss": -7.1704206466674805, "global_step": 194322, "epoch": 4626} {"train_loss": -7.040016174316406, "global_step": 194323, "epoch": 4626} {"train_loss": -7.115820407867432, "global_step": 194324, "epoch": 4626} {"train_loss": -7.215216159820557, "global_step": 194325, "epoch": 4626} {"train_loss": -7.158780097961426, "global_step": 194326, "epoch": 4626} {"train_loss": -7.15325927734375, "global_step": 194327, "epoch": 4626} {"train_loss": -7.266932487487793, "global_step": 194328, "epoch": 4626} {"train_loss": -7.152799129486084, "global_step": 194329, "epoch": 4626} {"train_loss": -7.230237007141113, "global_step": 194330, "epoch": 4626} {"train_loss": -7.116736888885498, "global_step": 194331, "epoch": 4626} {"train_loss": -7.257314205169678, "global_step": 194332, "epoch": 4626} {"train_loss": -7.201857623599825, "global_step": 194333, "epoch": 4626, "val_loss": 81170.2265625} {"train_loss": -7.218033790588379, "global_step": 194334, "epoch": 4627} {"train_loss": -7.212738037109375, "global_step": 194335, "epoch": 4627} {"train_loss": -7.271617412567139, "global_step": 194336, "epoch": 4627} {"train_loss": -7.1581926345825195, "global_step": 194337, "epoch": 4627} {"train_loss": -7.347621440887451, "global_step": 194338, "epoch": 4627} {"train_loss": -7.291866302490234, "global_step": 194339, "epoch": 4627} {"train_loss": -7.270143508911133, "global_step": 194340, "epoch": 4627} {"train_loss": -7.235565662384033, "global_step": 194341, "epoch": 4627} {"train_loss": -7.282430648803711, "global_step": 194342, "epoch": 4627} {"train_loss": -7.285067081451416, "global_step": 194343, "epoch": 4627} {"train_loss": -7.198660850524902, "global_step": 194344, "epoch": 4627} {"train_loss": -7.154085159301758, "global_step": 194345, "epoch": 4627} {"train_loss": -7.107687950134277, "global_step": 194346, "epoch": 4627} {"train_loss": -7.191584587097168, "global_step": 194347, "epoch": 4627} {"train_loss": -7.173352241516113, "global_step": 194348, "epoch": 4627} {"train_loss": -7.2082133293151855, "global_step": 194349, "epoch": 4627} {"train_loss": -7.211269378662109, "global_step": 194350, "epoch": 4627} {"train_loss": -7.194087505340576, "global_step": 194351, "epoch": 4627} {"train_loss": -7.153969764709473, "global_step": 194352, "epoch": 4627} {"train_loss": -7.167159080505371, "global_step": 194353, "epoch": 4627} {"train_loss": -7.167581081390381, "global_step": 194354, "epoch": 4627} {"train_loss": -7.229958534240723, "global_step": 194355, "epoch": 4627} {"train_loss": -7.214071750640869, "global_step": 194356, "epoch": 4627} {"train_loss": -7.271000862121582, "global_step": 194357, "epoch": 4627} {"train_loss": -7.2895989418029785, "global_step": 194358, "epoch": 4627} {"train_loss": -7.245138168334961, "global_step": 194359, "epoch": 4627} {"train_loss": -7.326661109924316, "global_step": 194360, "epoch": 4627} {"train_loss": -7.417313098907471, "global_step": 194361, "epoch": 4627} {"train_loss": -7.281373977661133, "global_step": 194362, "epoch": 4627} {"train_loss": -7.2624311447143555, "global_step": 194363, "epoch": 4627} {"train_loss": -7.332706451416016, "global_step": 194364, "epoch": 4627} {"train_loss": -7.352288246154785, "global_step": 194365, "epoch": 4627} {"train_loss": -7.259537220001221, "global_step": 194366, "epoch": 4627} {"train_loss": -7.309103012084961, "global_step": 194367, "epoch": 4627} {"train_loss": -7.143956661224365, "global_step": 194368, "epoch": 4627} {"train_loss": -7.337791442871094, "global_step": 194369, "epoch": 4627} {"train_loss": -7.383105278015137, "global_step": 194370, "epoch": 4627} {"train_loss": -7.317782878875732, "global_step": 194371, "epoch": 4627} {"train_loss": -7.300689697265625, "global_step": 194372, "epoch": 4627} {"train_loss": -7.250907897949219, "global_step": 194373, "epoch": 4627} {"train_loss": -7.315469264984131, "global_step": 194374, "epoch": 4627} {"train_loss": -7.253683510280791, "global_step": 194375, "epoch": 4627, "val_loss": 81234.234375} {"train_loss": -7.2960286140441895, "global_step": 194376, "epoch": 4628} {"train_loss": -7.346681118011475, "global_step": 194377, "epoch": 4628} {"train_loss": -7.245414733886719, "global_step": 194378, "epoch": 4628} {"train_loss": -7.3233113288879395, "global_step": 194379, "epoch": 4628} {"train_loss": -7.393683433532715, "global_step": 194380, "epoch": 4628} {"train_loss": -7.394691467285156, "global_step": 194381, "epoch": 4628} {"train_loss": -7.2147216796875, "global_step": 194382, "epoch": 4628} {"train_loss": -7.386441230773926, "global_step": 194383, "epoch": 4628} {"train_loss": -7.21607780456543, "global_step": 194384, "epoch": 4628} {"train_loss": -7.354140281677246, "global_step": 194385, "epoch": 4628} {"train_loss": -7.189369201660156, "global_step": 194386, "epoch": 4628} {"train_loss": -7.286243438720703, "global_step": 194387, "epoch": 4628} {"train_loss": -7.310064315795898, "global_step": 194388, "epoch": 4628} {"train_loss": -7.276200294494629, "global_step": 194389, "epoch": 4628} {"train_loss": -7.242177963256836, "global_step": 194390, "epoch": 4628} {"train_loss": -7.390102863311768, "global_step": 194391, "epoch": 4628} {"train_loss": -7.263976097106934, "global_step": 194392, "epoch": 4628} {"train_loss": -7.321268081665039, "global_step": 194393, "epoch": 4628} {"train_loss": -7.258553504943848, "global_step": 194394, "epoch": 4628} {"train_loss": -7.226685047149658, "global_step": 194395, "epoch": 4628} {"train_loss": -7.412839889526367, "global_step": 194396, "epoch": 4628} {"train_loss": -7.2031965255737305, "global_step": 194397, "epoch": 4628} {"train_loss": -7.321172714233398, "global_step": 194398, "epoch": 4628} {"train_loss": -7.336305618286133, "global_step": 194399, "epoch": 4628} {"train_loss": -7.299482822418213, "global_step": 194400, "epoch": 4628} {"train_loss": -7.265694618225098, "global_step": 194401, "epoch": 4628} {"train_loss": -7.232991695404053, "global_step": 194402, "epoch": 4628} {"train_loss": -7.362668991088867, "global_step": 194403, "epoch": 4628} {"train_loss": -7.283799648284912, "global_step": 194404, "epoch": 4628} {"train_loss": -7.294270992279053, "global_step": 194405, "epoch": 4628} {"train_loss": -7.346294403076172, "global_step": 194406, "epoch": 4628} {"train_loss": -7.151736259460449, "global_step": 194407, "epoch": 4628} {"train_loss": -7.332371711730957, "global_step": 194408, "epoch": 4628} {"train_loss": -7.273151397705078, "global_step": 194409, "epoch": 4628} {"train_loss": -7.357639312744141, "global_step": 194410, "epoch": 4628} {"train_loss": -7.268618583679199, "global_step": 194411, "epoch": 4628} {"train_loss": -7.35356330871582, "global_step": 194412, "epoch": 4628} {"train_loss": -7.244657516479492, "global_step": 194413, "epoch": 4628} {"train_loss": -7.319255828857422, "global_step": 194414, "epoch": 4628} {"train_loss": -7.252084732055664, "global_step": 194415, "epoch": 4628} {"train_loss": -7.34226655960083, "global_step": 194416, "epoch": 4628} {"train_loss": -7.295580625534058, "global_step": 194417, "epoch": 4628, "val_loss": 81294.8203125} {"train_loss": -7.319525718688965, "global_step": 194418, "epoch": 4629} {"train_loss": -7.399968147277832, "global_step": 194419, "epoch": 4629} {"train_loss": -7.164737701416016, "global_step": 194420, "epoch": 4629} {"train_loss": -7.331694602966309, "global_step": 194421, "epoch": 4629} {"train_loss": -7.380711078643799, "global_step": 194422, "epoch": 4629} {"train_loss": -7.206622123718262, "global_step": 194423, "epoch": 4629} {"train_loss": -7.2671403884887695, "global_step": 194424, "epoch": 4629} {"train_loss": -7.227414131164551, "global_step": 194425, "epoch": 4629} {"train_loss": -7.14005184173584, "global_step": 194426, "epoch": 4629} {"train_loss": -7.273751258850098, "global_step": 194427, "epoch": 4629} {"train_loss": -7.259273529052734, "global_step": 194428, "epoch": 4629} {"train_loss": -7.21579647064209, "global_step": 194429, "epoch": 4629} {"train_loss": -7.124082565307617, "global_step": 194430, "epoch": 4629} {"train_loss": -7.207729816436768, "global_step": 194431, "epoch": 4629} {"train_loss": -7.224020957946777, "global_step": 194432, "epoch": 4629} {"train_loss": -7.242879867553711, "global_step": 194433, "epoch": 4629} {"train_loss": -7.063046932220459, "global_step": 194434, "epoch": 4629} {"train_loss": -7.222866535186768, "global_step": 194435, "epoch": 4629} {"train_loss": -7.171104431152344, "global_step": 194436, "epoch": 4629} {"train_loss": -7.282680511474609, "global_step": 194437, "epoch": 4629} {"train_loss": -7.215555191040039, "global_step": 194438, "epoch": 4629} {"train_loss": -7.153482437133789, "global_step": 194439, "epoch": 4629} {"train_loss": -7.126277446746826, "global_step": 194440, "epoch": 4629} {"train_loss": -7.2118706703186035, "global_step": 194441, "epoch": 4629} {"train_loss": -7.244841575622559, "global_step": 194442, "epoch": 4629} {"train_loss": -7.278835773468018, "global_step": 194443, "epoch": 4629} {"train_loss": -7.31658411026001, "global_step": 194444, "epoch": 4629} {"train_loss": -7.364947319030762, "global_step": 194445, "epoch": 4629} {"train_loss": -7.354855537414551, "global_step": 194446, "epoch": 4629} {"train_loss": -7.319701671600342, "global_step": 194447, "epoch": 4629} {"train_loss": -7.309051036834717, "global_step": 194448, "epoch": 4629} {"train_loss": -7.305665016174316, "global_step": 194449, "epoch": 4629} {"train_loss": -7.305530548095703, "global_step": 194450, "epoch": 4629} {"train_loss": -7.455691814422607, "global_step": 194451, "epoch": 4629} {"train_loss": -7.283904552459717, "global_step": 194452, "epoch": 4629} {"train_loss": -7.346796989440918, "global_step": 194453, "epoch": 4629} {"train_loss": -7.326110363006592, "global_step": 194454, "epoch": 4629} {"train_loss": -7.312170028686523, "global_step": 194455, "epoch": 4629} {"train_loss": -7.441842079162598, "global_step": 194456, "epoch": 4629} {"train_loss": -7.340208053588867, "global_step": 194457, "epoch": 4629} {"train_loss": -7.435953140258789, "global_step": 194458, "epoch": 4629} {"train_loss": -7.271569944563366, "global_step": 194459, "epoch": 4629, "val_loss": 81128.71875} {"train_loss": -7.349787712097168, "global_step": 194460, "epoch": 4630} {"train_loss": -7.296576499938965, "global_step": 194461, "epoch": 4630} {"train_loss": -7.329004764556885, "global_step": 194462, "epoch": 4630} {"train_loss": -7.081008434295654, "global_step": 194463, "epoch": 4630} {"train_loss": -7.163343906402588, "global_step": 194464, "epoch": 4630} {"train_loss": -7.388045787811279, "global_step": 194465, "epoch": 4630} {"train_loss": -7.272209167480469, "global_step": 194466, "epoch": 4630} {"train_loss": -7.2101287841796875, "global_step": 194467, "epoch": 4630} {"train_loss": -7.082853317260742, "global_step": 194468, "epoch": 4630} {"train_loss": -7.314722061157227, "global_step": 194469, "epoch": 4630} {"train_loss": -7.005014419555664, "global_step": 194470, "epoch": 4630} {"train_loss": -7.068479537963867, "global_step": 194471, "epoch": 4630} {"train_loss": -7.195126056671143, "global_step": 194472, "epoch": 4630} {"train_loss": -7.21408748626709, "global_step": 194473, "epoch": 4630} {"train_loss": -7.093860149383545, "global_step": 194474, "epoch": 4630} {"train_loss": -7.204596042633057, "global_step": 194475, "epoch": 4630} {"train_loss": -7.090548515319824, "global_step": 194476, "epoch": 4630} {"train_loss": -7.175711631774902, "global_step": 194477, "epoch": 4630} {"train_loss": -7.186927795410156, "global_step": 194478, "epoch": 4630} {"train_loss": -7.013934135437012, "global_step": 194479, "epoch": 4630} {"train_loss": -7.199980735778809, "global_step": 194480, "epoch": 4630} {"train_loss": -7.04203987121582, "global_step": 194481, "epoch": 4630} {"train_loss": -7.115627765655518, "global_step": 194482, "epoch": 4630} {"train_loss": -7.035640716552734, "global_step": 194483, "epoch": 4630} {"train_loss": -6.964025974273682, "global_step": 194484, "epoch": 4630} {"train_loss": -7.07535457611084, "global_step": 194485, "epoch": 4630} {"train_loss": -6.892873764038086, "global_step": 194486, "epoch": 4630} {"train_loss": -7.183906555175781, "global_step": 194487, "epoch": 4630} {"train_loss": -7.064522743225098, "global_step": 194488, "epoch": 4630} {"train_loss": -7.188441276550293, "global_step": 194489, "epoch": 4630} {"train_loss": -7.083438396453857, "global_step": 194490, "epoch": 4630} {"train_loss": -7.185975074768066, "global_step": 194491, "epoch": 4630} {"train_loss": -7.077523231506348, "global_step": 194492, "epoch": 4630} {"train_loss": -7.001070976257324, "global_step": 194493, "epoch": 4630} {"train_loss": -7.257694244384766, "global_step": 194494, "epoch": 4630} {"train_loss": -7.075186729431152, "global_step": 194495, "epoch": 4630} {"train_loss": -7.237087249755859, "global_step": 194496, "epoch": 4630} {"train_loss": -7.135893821716309, "global_step": 194497, "epoch": 4630} {"train_loss": -7.256183624267578, "global_step": 194498, "epoch": 4630} {"train_loss": -7.188048839569092, "global_step": 194499, "epoch": 4630} {"train_loss": -7.252900123596191, "global_step": 194500, "epoch": 4630} {"train_loss": -7.153465566181001, "global_step": 194501, "epoch": 4630, "val_loss": 81156.5859375} {"train_loss": -7.210878372192383, "global_step": 194502, "epoch": 4631} {"train_loss": -7.36710262298584, "global_step": 194503, "epoch": 4631} {"train_loss": -7.120326519012451, "global_step": 194504, "epoch": 4631} {"train_loss": -7.255288124084473, "global_step": 194505, "epoch": 4631} {"train_loss": -7.30673885345459, "global_step": 194506, "epoch": 4631} {"train_loss": -7.136775493621826, "global_step": 194507, "epoch": 4631} {"train_loss": -7.113643646240234, "global_step": 194508, "epoch": 4631} {"train_loss": -7.414690971374512, "global_step": 194509, "epoch": 4631} {"train_loss": -7.270552158355713, "global_step": 194510, "epoch": 4631} {"train_loss": -7.3897576332092285, "global_step": 194511, "epoch": 4631} {"train_loss": -7.2363457679748535, "global_step": 194512, "epoch": 4631} {"train_loss": -7.288482666015625, "global_step": 194513, "epoch": 4631} {"train_loss": -7.231886863708496, "global_step": 194514, "epoch": 4631} {"train_loss": -7.275232791900635, "global_step": 194515, "epoch": 4631} {"train_loss": -7.300543785095215, "global_step": 194516, "epoch": 4631} {"train_loss": -7.340505599975586, "global_step": 194517, "epoch": 4631} {"train_loss": -7.364219665527344, "global_step": 194518, "epoch": 4631} {"train_loss": -7.278996467590332, "global_step": 194519, "epoch": 4631} {"train_loss": -7.3754682540893555, "global_step": 194520, "epoch": 4631} {"train_loss": -7.232835292816162, "global_step": 194521, "epoch": 4631} {"train_loss": -7.268170356750488, "global_step": 194522, "epoch": 4631} {"train_loss": -7.269240856170654, "global_step": 194523, "epoch": 4631} {"train_loss": -7.118382453918457, "global_step": 194524, "epoch": 4631} {"train_loss": -7.256326675415039, "global_step": 194525, "epoch": 4631} {"train_loss": -7.188920974731445, "global_step": 194526, "epoch": 4631} {"train_loss": -7.145784378051758, "global_step": 194527, "epoch": 4631} {"train_loss": -7.296044826507568, "global_step": 194528, "epoch": 4631} {"train_loss": -7.125380039215088, "global_step": 194529, "epoch": 4631} {"train_loss": -7.076744079589844, "global_step": 194530, "epoch": 4631} {"train_loss": -7.1108598709106445, "global_step": 194531, "epoch": 4631} {"train_loss": -7.072269439697266, "global_step": 194532, "epoch": 4631} {"train_loss": -7.098862648010254, "global_step": 194533, "epoch": 4631} {"train_loss": -7.187690734863281, "global_step": 194534, "epoch": 4631} {"train_loss": -7.1123199462890625, "global_step": 194535, "epoch": 4631} {"train_loss": -7.102063179016113, "global_step": 194536, "epoch": 4631} {"train_loss": -7.234507083892822, "global_step": 194537, "epoch": 4631} {"train_loss": -7.114485740661621, "global_step": 194538, "epoch": 4631} {"train_loss": -7.206271171569824, "global_step": 194539, "epoch": 4631} {"train_loss": -7.178330898284912, "global_step": 194540, "epoch": 4631} {"train_loss": -7.224773406982422, "global_step": 194541, "epoch": 4631} {"train_loss": -7.233955383300781, "global_step": 194542, "epoch": 4631} {"train_loss": -7.2203092348007925, "global_step": 194543, "epoch": 4631, "val_loss": 81160.1875} {"train_loss": -7.231919288635254, "global_step": 194544, "epoch": 4632} {"train_loss": -7.2855448722839355, "global_step": 194545, "epoch": 4632} {"train_loss": -7.246730804443359, "global_step": 194546, "epoch": 4632} {"train_loss": -7.226862907409668, "global_step": 194547, "epoch": 4632} {"train_loss": -7.2257280349731445, "global_step": 194548, "epoch": 4632} {"train_loss": -7.215115547180176, "global_step": 194549, "epoch": 4632} {"train_loss": -7.33498477935791, "global_step": 194550, "epoch": 4632} {"train_loss": -7.302346229553223, "global_step": 194551, "epoch": 4632} {"train_loss": -7.32539176940918, "global_step": 194552, "epoch": 4632} {"train_loss": -7.282680988311768, "global_step": 194553, "epoch": 4632} {"train_loss": -7.269792556762695, "global_step": 194554, "epoch": 4632} {"train_loss": -7.2227783203125, "global_step": 194555, "epoch": 4632} {"train_loss": -7.272907733917236, "global_step": 194556, "epoch": 4632} {"train_loss": -7.318177223205566, "global_step": 194557, "epoch": 4632} {"train_loss": -7.201136112213135, "global_step": 194558, "epoch": 4632} {"train_loss": -7.321335315704346, "global_step": 194559, "epoch": 4632} {"train_loss": -7.382484436035156, "global_step": 194560, "epoch": 4632} {"train_loss": -7.262763977050781, "global_step": 194561, "epoch": 4632} {"train_loss": -7.3050689697265625, "global_step": 194562, "epoch": 4632} {"train_loss": -7.396516799926758, "global_step": 194563, "epoch": 4632} {"train_loss": -7.321441650390625, "global_step": 194564, "epoch": 4632} {"train_loss": -7.284902572631836, "global_step": 194565, "epoch": 4632} {"train_loss": -7.25257682800293, "global_step": 194566, "epoch": 4632} {"train_loss": -7.306974411010742, "global_step": 194567, "epoch": 4632} {"train_loss": -7.31911039352417, "global_step": 194568, "epoch": 4632} {"train_loss": -7.325069427490234, "global_step": 194569, "epoch": 4632} {"train_loss": -7.312042236328125, "global_step": 194570, "epoch": 4632} {"train_loss": -7.316616058349609, "global_step": 194571, "epoch": 4632} {"train_loss": -7.373364448547363, "global_step": 194572, "epoch": 4632} {"train_loss": -7.297004699707031, "global_step": 194573, "epoch": 4632} {"train_loss": -7.230070114135742, "global_step": 194574, "epoch": 4632} {"train_loss": -7.221367359161377, "global_step": 194575, "epoch": 4632} {"train_loss": -7.361583232879639, "global_step": 194576, "epoch": 4632} {"train_loss": -7.360315322875977, "global_step": 194577, "epoch": 4632} {"train_loss": -7.205883979797363, "global_step": 194578, "epoch": 4632} {"train_loss": -7.19711971282959, "global_step": 194579, "epoch": 4632} {"train_loss": -7.335223197937012, "global_step": 194580, "epoch": 4632} {"train_loss": -7.219121932983398, "global_step": 194581, "epoch": 4632} {"train_loss": -7.376659393310547, "global_step": 194582, "epoch": 4632} {"train_loss": -7.369553565979004, "global_step": 194583, "epoch": 4632} {"train_loss": -7.3767170906066895, "global_step": 194584, "epoch": 4632} {"train_loss": -7.29422604470026, "global_step": 194585, "epoch": 4632, "val_loss": 81197.671875} {"train_loss": -7.329263210296631, "global_step": 194586, "epoch": 4633} {"train_loss": -7.314913749694824, "global_step": 194587, "epoch": 4633} {"train_loss": -7.408548355102539, "global_step": 194588, "epoch": 4633} {"train_loss": -7.428003311157227, "global_step": 194589, "epoch": 4633} {"train_loss": -7.293907165527344, "global_step": 194590, "epoch": 4633} {"train_loss": -7.3117852210998535, "global_step": 194591, "epoch": 4633} {"train_loss": -7.346560478210449, "global_step": 194592, "epoch": 4633} {"train_loss": -7.249440670013428, "global_step": 194593, "epoch": 4633} {"train_loss": -7.3030314445495605, "global_step": 194594, "epoch": 4633} {"train_loss": -7.402640342712402, "global_step": 194595, "epoch": 4633} {"train_loss": -7.209954261779785, "global_step": 194596, "epoch": 4633} {"train_loss": -7.234309196472168, "global_step": 194597, "epoch": 4633} {"train_loss": -7.084404945373535, "global_step": 194598, "epoch": 4633} {"train_loss": -7.1983795166015625, "global_step": 194599, "epoch": 4633} {"train_loss": -7.27708625793457, "global_step": 194600, "epoch": 4633} {"train_loss": -7.165604591369629, "global_step": 194601, "epoch": 4633} {"train_loss": -7.257174968719482, "global_step": 194602, "epoch": 4633} {"train_loss": -7.196112632751465, "global_step": 194603, "epoch": 4633} {"train_loss": -7.237098217010498, "global_step": 194604, "epoch": 4633} {"train_loss": -7.270133018493652, "global_step": 194605, "epoch": 4633} {"train_loss": -7.20111608505249, "global_step": 194606, "epoch": 4633} {"train_loss": -7.096869468688965, "global_step": 194607, "epoch": 4633} {"train_loss": -7.264752388000488, "global_step": 194608, "epoch": 4633} {"train_loss": -7.281937599182129, "global_step": 194609, "epoch": 4633} {"train_loss": -7.199848175048828, "global_step": 194610, "epoch": 4633} {"train_loss": -7.14439582824707, "global_step": 194611, "epoch": 4633} {"train_loss": -7.217015266418457, "global_step": 194612, "epoch": 4633} {"train_loss": -7.153398513793945, "global_step": 194613, "epoch": 4633} {"train_loss": -7.102558135986328, "global_step": 194614, "epoch": 4633} {"train_loss": -7.12619686126709, "global_step": 194615, "epoch": 4633} {"train_loss": -7.060079097747803, "global_step": 194616, "epoch": 4633} {"train_loss": -7.23001766204834, "global_step": 194617, "epoch": 4633} {"train_loss": -7.114768981933594, "global_step": 194618, "epoch": 4633} {"train_loss": -7.224333763122559, "global_step": 194619, "epoch": 4633} {"train_loss": -7.1122236251831055, "global_step": 194620, "epoch": 4633} {"train_loss": -7.166301727294922, "global_step": 194621, "epoch": 4633} {"train_loss": -7.141632080078125, "global_step": 194622, "epoch": 4633} {"train_loss": -7.237484931945801, "global_step": 194623, "epoch": 4633} {"train_loss": -7.066109657287598, "global_step": 194624, "epoch": 4633} {"train_loss": -7.301478385925293, "global_step": 194625, "epoch": 4633} {"train_loss": -7.077390670776367, "global_step": 194626, "epoch": 4633} {"train_loss": -7.219889674867902, "global_step": 194627, "epoch": 4633, "val_loss": 81285.09375} {"train_loss": -7.185844421386719, "global_step": 194628, "epoch": 4634} {"train_loss": -7.297711372375488, "global_step": 194629, "epoch": 4634} {"train_loss": -7.247109413146973, "global_step": 194630, "epoch": 4634} {"train_loss": -7.245620250701904, "global_step": 194631, "epoch": 4634} {"train_loss": -7.254289150238037, "global_step": 194632, "epoch": 4634} {"train_loss": -7.100035667419434, "global_step": 194633, "epoch": 4634} {"train_loss": -7.16041898727417, "global_step": 194634, "epoch": 4634} {"train_loss": -7.137788772583008, "global_step": 194635, "epoch": 4634} {"train_loss": -7.186008453369141, "global_step": 194636, "epoch": 4634} {"train_loss": -7.285202980041504, "global_step": 194637, "epoch": 4634} {"train_loss": -7.198888301849365, "global_step": 194638, "epoch": 4634} {"train_loss": -7.252250671386719, "global_step": 194639, "epoch": 4634} {"train_loss": -7.190725326538086, "global_step": 194640, "epoch": 4634} {"train_loss": -7.287379264831543, "global_step": 194641, "epoch": 4634} {"train_loss": -7.226006984710693, "global_step": 194642, "epoch": 4634} {"train_loss": -7.110957145690918, "global_step": 194643, "epoch": 4634} {"train_loss": -7.271524906158447, "global_step": 194644, "epoch": 4634} {"train_loss": -7.307260513305664, "global_step": 194645, "epoch": 4634} {"train_loss": -7.389556884765625, "global_step": 194646, "epoch": 4634} {"train_loss": -7.325469493865967, "global_step": 194647, "epoch": 4634} {"train_loss": -7.221806526184082, "global_step": 194648, "epoch": 4634} {"train_loss": -7.305721282958984, "global_step": 194649, "epoch": 4634} {"train_loss": -7.238469123840332, "global_step": 194650, "epoch": 4634} {"train_loss": -7.223323822021484, "global_step": 194651, "epoch": 4634} {"train_loss": -7.2982282638549805, "global_step": 194652, "epoch": 4634} {"train_loss": -7.189242362976074, "global_step": 194653, "epoch": 4634} {"train_loss": -7.238317489624023, "global_step": 194654, "epoch": 4634} {"train_loss": -7.318634986877441, "global_step": 194655, "epoch": 4634} {"train_loss": -7.292354583740234, "global_step": 194656, "epoch": 4634} {"train_loss": -7.238282203674316, "global_step": 194657, "epoch": 4634} {"train_loss": -7.352877616882324, "global_step": 194658, "epoch": 4634} {"train_loss": -7.227956771850586, "global_step": 194659, "epoch": 4634} {"train_loss": -7.24216365814209, "global_step": 194660, "epoch": 4634} {"train_loss": -7.2939300537109375, "global_step": 194661, "epoch": 4634} {"train_loss": -7.177649974822998, "global_step": 194662, "epoch": 4634} {"train_loss": -7.2626423835754395, "global_step": 194663, "epoch": 4634} {"train_loss": -7.2798848152160645, "global_step": 194664, "epoch": 4634} {"train_loss": -7.270073890686035, "global_step": 194665, "epoch": 4634} {"train_loss": -7.3072710037231445, "global_step": 194666, "epoch": 4634} {"train_loss": -7.238171577453613, "global_step": 194667, "epoch": 4634} {"train_loss": -7.249399185180664, "global_step": 194668, "epoch": 4634} {"train_loss": -7.248777366819835, "global_step": 194669, "epoch": 4634, "val_loss": 81160.1484375} {"train_loss": -7.300958633422852, "global_step": 194670, "epoch": 4635} {"train_loss": -7.26273250579834, "global_step": 194671, "epoch": 4635} {"train_loss": -7.25590705871582, "global_step": 194672, "epoch": 4635} {"train_loss": -7.3153862953186035, "global_step": 194673, "epoch": 4635} {"train_loss": -7.3113508224487305, "global_step": 194674, "epoch": 4635} {"train_loss": -7.281367301940918, "global_step": 194675, "epoch": 4635} {"train_loss": -7.27957820892334, "global_step": 194676, "epoch": 4635} {"train_loss": -7.355120658874512, "global_step": 194677, "epoch": 4635} {"train_loss": -7.296607971191406, "global_step": 194678, "epoch": 4635} {"train_loss": -7.320824146270752, "global_step": 194679, "epoch": 4635} {"train_loss": -7.312602996826172, "global_step": 194680, "epoch": 4635} {"train_loss": -7.396626949310303, "global_step": 194681, "epoch": 4635} {"train_loss": -7.2288103103637695, "global_step": 194682, "epoch": 4635} {"train_loss": -7.200288772583008, "global_step": 194683, "epoch": 4635} {"train_loss": -7.203613758087158, "global_step": 194684, "epoch": 4635} {"train_loss": -7.239195823669434, "global_step": 194685, "epoch": 4635} {"train_loss": -7.240111351013184, "global_step": 194686, "epoch": 4635} {"train_loss": -7.31102180480957, "global_step": 194687, "epoch": 4635} {"train_loss": -7.366876602172852, "global_step": 194688, "epoch": 4635} {"train_loss": -7.064421653747559, "global_step": 194689, "epoch": 4635} {"train_loss": -7.172036170959473, "global_step": 194690, "epoch": 4635} {"train_loss": -7.116333961486816, "global_step": 194691, "epoch": 4635} {"train_loss": -7.2285661697387695, "global_step": 194692, "epoch": 4635} {"train_loss": -7.246387481689453, "global_step": 194693, "epoch": 4635} {"train_loss": -7.201238632202148, "global_step": 194694, "epoch": 4635} {"train_loss": -7.095867156982422, "global_step": 194695, "epoch": 4635} {"train_loss": -7.187541484832764, "global_step": 194696, "epoch": 4635} {"train_loss": -7.198150634765625, "global_step": 194697, "epoch": 4635} {"train_loss": -7.259481906890869, "global_step": 194698, "epoch": 4635} {"train_loss": -7.263552665710449, "global_step": 194699, "epoch": 4635} {"train_loss": -7.156340599060059, "global_step": 194700, "epoch": 4635} {"train_loss": -7.252838134765625, "global_step": 194701, "epoch": 4635} {"train_loss": -7.219256401062012, "global_step": 194702, "epoch": 4635} {"train_loss": -7.312122344970703, "global_step": 194703, "epoch": 4635} {"train_loss": -7.290127754211426, "global_step": 194704, "epoch": 4635} {"train_loss": -7.351280212402344, "global_step": 194705, "epoch": 4635} {"train_loss": -7.2956438064575195, "global_step": 194706, "epoch": 4635} {"train_loss": -7.2250471115112305, "global_step": 194707, "epoch": 4635} {"train_loss": -7.302214622497559, "global_step": 194708, "epoch": 4635} {"train_loss": -7.222907066345215, "global_step": 194709, "epoch": 4635} {"train_loss": -7.218868255615234, "global_step": 194710, "epoch": 4635} {"train_loss": -7.249803781509399, "global_step": 194711, "epoch": 4635, "val_loss": 81127.0859375} {"train_loss": -7.145200252532959, "global_step": 194712, "epoch": 4636} {"train_loss": -7.214649677276611, "global_step": 194713, "epoch": 4636} {"train_loss": -7.178808689117432, "global_step": 194714, "epoch": 4636} {"train_loss": -7.169619560241699, "global_step": 194715, "epoch": 4636} {"train_loss": -7.230425834655762, "global_step": 194716, "epoch": 4636} {"train_loss": -7.151060104370117, "global_step": 194717, "epoch": 4636} {"train_loss": -7.326537132263184, "global_step": 194718, "epoch": 4636} {"train_loss": -7.183830261230469, "global_step": 194719, "epoch": 4636} {"train_loss": -7.268833160400391, "global_step": 194720, "epoch": 4636} {"train_loss": -7.307805061340332, "global_step": 194721, "epoch": 4636} {"train_loss": -7.300207138061523, "global_step": 194722, "epoch": 4636} {"train_loss": -7.307293891906738, "global_step": 194723, "epoch": 4636} {"train_loss": -7.201290130615234, "global_step": 194724, "epoch": 4636} {"train_loss": -7.227980613708496, "global_step": 194725, "epoch": 4636} {"train_loss": -7.203398704528809, "global_step": 194726, "epoch": 4636} {"train_loss": -7.098270416259766, "global_step": 194727, "epoch": 4636} {"train_loss": -7.019279479980469, "global_step": 194728, "epoch": 4636} {"train_loss": -7.077732086181641, "global_step": 194729, "epoch": 4636} {"train_loss": -7.304573059082031, "global_step": 194730, "epoch": 4636} {"train_loss": -7.1082916259765625, "global_step": 194731, "epoch": 4636} {"train_loss": -7.07816743850708, "global_step": 194732, "epoch": 4636} {"train_loss": -7.135082244873047, "global_step": 194733, "epoch": 4636} {"train_loss": -7.160792350769043, "global_step": 194734, "epoch": 4636} {"train_loss": -7.185630798339844, "global_step": 194735, "epoch": 4636} {"train_loss": -7.240420818328857, "global_step": 194736, "epoch": 4636} {"train_loss": -7.21455192565918, "global_step": 194737, "epoch": 4636} {"train_loss": -7.221718788146973, "global_step": 194738, "epoch": 4636} {"train_loss": -7.162287712097168, "global_step": 194739, "epoch": 4636} {"train_loss": -7.360352516174316, "global_step": 194740, "epoch": 4636} {"train_loss": -7.070700168609619, "global_step": 194741, "epoch": 4636} {"train_loss": -7.204627513885498, "global_step": 194742, "epoch": 4636} {"train_loss": -7.180850028991699, "global_step": 194743, "epoch": 4636} {"train_loss": -7.142582893371582, "global_step": 194744, "epoch": 4636} {"train_loss": -7.294814109802246, "global_step": 194745, "epoch": 4636} {"train_loss": -7.1818437576293945, "global_step": 194746, "epoch": 4636} {"train_loss": -7.16457462310791, "global_step": 194747, "epoch": 4636} {"train_loss": -7.274646282196045, "global_step": 194748, "epoch": 4636} {"train_loss": -7.1424102783203125, "global_step": 194749, "epoch": 4636} {"train_loss": -7.281051158905029, "global_step": 194750, "epoch": 4636} {"train_loss": -7.262147426605225, "global_step": 194751, "epoch": 4636} {"train_loss": -7.147765636444092, "global_step": 194752, "epoch": 4636} {"train_loss": -7.196806839534214, "global_step": 194753, "epoch": 4636, "val_loss": 81431.953125} {"train_loss": -7.166819095611572, "global_step": 194754, "epoch": 4637} {"train_loss": -7.189436912536621, "global_step": 194755, "epoch": 4637} {"train_loss": -7.180152893066406, "global_step": 194756, "epoch": 4637} {"train_loss": -7.219919204711914, "global_step": 194757, "epoch": 4637} {"train_loss": -7.176939010620117, "global_step": 194758, "epoch": 4637} {"train_loss": -7.207982063293457, "global_step": 194759, "epoch": 4637} {"train_loss": -7.372220993041992, "global_step": 194760, "epoch": 4637} {"train_loss": -7.2314043045043945, "global_step": 194761, "epoch": 4637} {"train_loss": -7.15215539932251, "global_step": 194762, "epoch": 4637} {"train_loss": -7.302062034606934, "global_step": 194763, "epoch": 4637} {"train_loss": -7.2902021408081055, "global_step": 194764, "epoch": 4637} {"train_loss": -7.233450889587402, "global_step": 194765, "epoch": 4637} {"train_loss": -7.297562122344971, "global_step": 194766, "epoch": 4637} {"train_loss": -7.272261619567871, "global_step": 194767, "epoch": 4637} {"train_loss": -7.339108467102051, "global_step": 194768, "epoch": 4637} {"train_loss": -7.266034126281738, "global_step": 194769, "epoch": 4637} {"train_loss": -7.254334449768066, "global_step": 194770, "epoch": 4637} {"train_loss": -7.292147159576416, "global_step": 194771, "epoch": 4637} {"train_loss": -7.228172302246094, "global_step": 194772, "epoch": 4637} {"train_loss": -7.319910526275635, "global_step": 194773, "epoch": 4637} {"train_loss": -7.167694091796875, "global_step": 194774, "epoch": 4637} {"train_loss": -7.247740745544434, "global_step": 194775, "epoch": 4637} {"train_loss": -7.254048824310303, "global_step": 194776, "epoch": 4637} {"train_loss": -7.190406799316406, "global_step": 194777, "epoch": 4637} {"train_loss": -7.311899662017822, "global_step": 194778, "epoch": 4637} {"train_loss": -7.131551265716553, "global_step": 194779, "epoch": 4637} {"train_loss": -7.195718288421631, "global_step": 194780, "epoch": 4637} {"train_loss": -7.250706672668457, "global_step": 194781, "epoch": 4637} {"train_loss": -7.320888519287109, "global_step": 194782, "epoch": 4637} {"train_loss": -7.395368576049805, "global_step": 194783, "epoch": 4637} {"train_loss": -7.24080753326416, "global_step": 194784, "epoch": 4637} {"train_loss": -7.237669944763184, "global_step": 194785, "epoch": 4637} {"train_loss": -7.327754020690918, "global_step": 194786, "epoch": 4637} {"train_loss": -7.273868560791016, "global_step": 194787, "epoch": 4637} {"train_loss": -7.19340705871582, "global_step": 194788, "epoch": 4637} {"train_loss": -7.158899307250977, "global_step": 194789, "epoch": 4637} {"train_loss": -7.259040355682373, "global_step": 194790, "epoch": 4637} {"train_loss": -7.298513412475586, "global_step": 194791, "epoch": 4637} {"train_loss": -7.274240493774414, "global_step": 194792, "epoch": 4637} {"train_loss": -7.196521759033203, "global_step": 194793, "epoch": 4637} {"train_loss": -7.266401290893555, "global_step": 194794, "epoch": 4637} {"train_loss": -7.2476832412538075, "global_step": 194795, "epoch": 4637, "val_loss": 81226.0625} {"train_loss": -7.185882568359375, "global_step": 194796, "epoch": 4638} {"train_loss": -7.173179626464844, "global_step": 194797, "epoch": 4638} {"train_loss": -7.092444896697998, "global_step": 194798, "epoch": 4638} {"train_loss": -7.164870738983154, "global_step": 194799, "epoch": 4638} {"train_loss": -7.104340076446533, "global_step": 194800, "epoch": 4638} {"train_loss": -7.119233131408691, "global_step": 194801, "epoch": 4638} {"train_loss": -7.2061848640441895, "global_step": 194802, "epoch": 4638} {"train_loss": -7.178805351257324, "global_step": 194803, "epoch": 4638} {"train_loss": -7.088663101196289, "global_step": 194804, "epoch": 4638} {"train_loss": -7.155570030212402, "global_step": 194805, "epoch": 4638} {"train_loss": -7.149709224700928, "global_step": 194806, "epoch": 4638} {"train_loss": -7.358640670776367, "global_step": 194807, "epoch": 4638} {"train_loss": -7.147148132324219, "global_step": 194808, "epoch": 4638} {"train_loss": -7.231181621551514, "global_step": 194809, "epoch": 4638} {"train_loss": -7.195425987243652, "global_step": 194810, "epoch": 4638} {"train_loss": -7.1852874755859375, "global_step": 194811, "epoch": 4638} {"train_loss": -7.179324150085449, "global_step": 194812, "epoch": 4638} {"train_loss": -7.059483528137207, "global_step": 194813, "epoch": 4638} {"train_loss": -7.245577335357666, "global_step": 194814, "epoch": 4638} {"train_loss": -7.113088130950928, "global_step": 194815, "epoch": 4638} {"train_loss": -7.246481895446777, "global_step": 194816, "epoch": 4638} {"train_loss": -7.186736583709717, "global_step": 194817, "epoch": 4638} {"train_loss": -7.227446556091309, "global_step": 194818, "epoch": 4638} {"train_loss": -7.086966514587402, "global_step": 194819, "epoch": 4638} {"train_loss": -7.216980934143066, "global_step": 194820, "epoch": 4638} {"train_loss": -7.226140975952148, "global_step": 194821, "epoch": 4638} {"train_loss": -7.143448829650879, "global_step": 194822, "epoch": 4638} {"train_loss": -7.185347557067871, "global_step": 194823, "epoch": 4638} {"train_loss": -7.122648239135742, "global_step": 194824, "epoch": 4638} {"train_loss": -7.282181739807129, "global_step": 194825, "epoch": 4638} {"train_loss": -7.230592727661133, "global_step": 194826, "epoch": 4638} {"train_loss": -7.2138214111328125, "global_step": 194827, "epoch": 4638} {"train_loss": -7.152976989746094, "global_step": 194828, "epoch": 4638} {"train_loss": -7.218569755554199, "global_step": 194829, "epoch": 4638} {"train_loss": -7.171679496765137, "global_step": 194830, "epoch": 4638} {"train_loss": -7.290007591247559, "global_step": 194831, "epoch": 4638} {"train_loss": -7.233579158782959, "global_step": 194832, "epoch": 4638} {"train_loss": -7.1900715827941895, "global_step": 194833, "epoch": 4638} {"train_loss": -7.330508232116699, "global_step": 194834, "epoch": 4638} {"train_loss": -7.235043048858643, "global_step": 194835, "epoch": 4638} {"train_loss": -7.267635345458984, "global_step": 194836, "epoch": 4638} {"train_loss": -7.192547344026112, "global_step": 194837, "epoch": 4638, "val_loss": 81322.7109375} {"train_loss": -7.323237419128418, "global_step": 194838, "epoch": 4639} {"train_loss": -7.371013641357422, "global_step": 194839, "epoch": 4639} {"train_loss": -7.210631847381592, "global_step": 194840, "epoch": 4639} {"train_loss": -7.365440368652344, "global_step": 194841, "epoch": 4639} {"train_loss": -7.292600631713867, "global_step": 194842, "epoch": 4639} {"train_loss": -7.203962802886963, "global_step": 194843, "epoch": 4639} {"train_loss": -7.219761848449707, "global_step": 194844, "epoch": 4639} {"train_loss": -7.183224678039551, "global_step": 194845, "epoch": 4639} {"train_loss": -7.331122398376465, "global_step": 194846, "epoch": 4639} {"train_loss": -7.35602331161499, "global_step": 194847, "epoch": 4639} {"train_loss": -7.174358367919922, "global_step": 194848, "epoch": 4639} {"train_loss": -7.3075642585754395, "global_step": 194849, "epoch": 4639} {"train_loss": -7.370038986206055, "global_step": 194850, "epoch": 4639} {"train_loss": -7.226215362548828, "global_step": 194851, "epoch": 4639} {"train_loss": -7.272260665893555, "global_step": 194852, "epoch": 4639} {"train_loss": -7.416741847991943, "global_step": 194853, "epoch": 4639} {"train_loss": -7.285820007324219, "global_step": 194854, "epoch": 4639} {"train_loss": -7.245930194854736, "global_step": 194855, "epoch": 4639} {"train_loss": -7.31226921081543, "global_step": 194856, "epoch": 4639} {"train_loss": -7.237118721008301, "global_step": 194857, "epoch": 4639} {"train_loss": -7.3381195068359375, "global_step": 194858, "epoch": 4639} {"train_loss": -7.19802188873291, "global_step": 194859, "epoch": 4639} {"train_loss": -7.314265251159668, "global_step": 194860, "epoch": 4639} {"train_loss": -7.347432613372803, "global_step": 194861, "epoch": 4639} {"train_loss": -7.1512041091918945, "global_step": 194862, "epoch": 4639} {"train_loss": -7.166897773742676, "global_step": 194863, "epoch": 4639} {"train_loss": -7.232558250427246, "global_step": 194864, "epoch": 4639} {"train_loss": -7.259791374206543, "global_step": 194865, "epoch": 4639} {"train_loss": -7.284640789031982, "global_step": 194866, "epoch": 4639} {"train_loss": -7.275833606719971, "global_step": 194867, "epoch": 4639} {"train_loss": -7.2714409828186035, "global_step": 194868, "epoch": 4639} {"train_loss": -7.335028648376465, "global_step": 194869, "epoch": 4639} {"train_loss": -7.289919376373291, "global_step": 194870, "epoch": 4639} {"train_loss": -7.349000930786133, "global_step": 194871, "epoch": 4639} {"train_loss": -7.432756423950195, "global_step": 194872, "epoch": 4639} {"train_loss": -7.408914089202881, "global_step": 194873, "epoch": 4639} {"train_loss": -7.223860740661621, "global_step": 194874, "epoch": 4639} {"train_loss": -7.328648567199707, "global_step": 194875, "epoch": 4639} {"train_loss": -7.189418315887451, "global_step": 194876, "epoch": 4639} {"train_loss": -7.124914169311523, "global_step": 194877, "epoch": 4639} {"train_loss": -7.281913757324219, "global_step": 194878, "epoch": 4639} {"train_loss": -7.280272199994042, "global_step": 194879, "epoch": 4639, "val_loss": 81424.4375} {"train_loss": -7.294180870056152, "global_step": 194880, "epoch": 4640} {"train_loss": -7.2477898597717285, "global_step": 194881, "epoch": 4640} {"train_loss": -7.185760498046875, "global_step": 194882, "epoch": 4640} {"train_loss": -7.120333671569824, "global_step": 194883, "epoch": 4640} {"train_loss": -7.193319320678711, "global_step": 194884, "epoch": 4640} {"train_loss": -7.195707321166992, "global_step": 194885, "epoch": 4640} {"train_loss": -7.101633071899414, "global_step": 194886, "epoch": 4640} {"train_loss": -7.278462886810303, "global_step": 194887, "epoch": 4640} {"train_loss": -6.992123603820801, "global_step": 194888, "epoch": 4640} {"train_loss": -6.986428260803223, "global_step": 194889, "epoch": 4640} {"train_loss": -7.160933971405029, "global_step": 194890, "epoch": 4640} {"train_loss": -6.967769145965576, "global_step": 194891, "epoch": 4640} {"train_loss": -7.162078857421875, "global_step": 194892, "epoch": 4640} {"train_loss": -7.218805313110352, "global_step": 194893, "epoch": 4640} {"train_loss": -7.036449432373047, "global_step": 194894, "epoch": 4640} {"train_loss": -7.187150001525879, "global_step": 194895, "epoch": 4640} {"train_loss": -7.094344615936279, "global_step": 194896, "epoch": 4640} {"train_loss": -7.169989109039307, "global_step": 194897, "epoch": 4640} {"train_loss": -7.1337456703186035, "global_step": 194898, "epoch": 4640} {"train_loss": -7.107274532318115, "global_step": 194899, "epoch": 4640} {"train_loss": -7.160832405090332, "global_step": 194900, "epoch": 4640} {"train_loss": -7.204309940338135, "global_step": 194901, "epoch": 4640} {"train_loss": -7.219018936157227, "global_step": 194902, "epoch": 4640} {"train_loss": -7.194008827209473, "global_step": 194903, "epoch": 4640} {"train_loss": -7.2047929763793945, "global_step": 194904, "epoch": 4640} {"train_loss": -7.1924357414245605, "global_step": 194905, "epoch": 4640} {"train_loss": -7.343791484832764, "global_step": 194906, "epoch": 4640} {"train_loss": -7.2771806716918945, "global_step": 194907, "epoch": 4640} {"train_loss": -7.219475746154785, "global_step": 194908, "epoch": 4640} {"train_loss": -7.212523460388184, "global_step": 194909, "epoch": 4640} {"train_loss": -7.232327938079834, "global_step": 194910, "epoch": 4640} {"train_loss": -7.319295883178711, "global_step": 194911, "epoch": 4640} {"train_loss": -7.337387561798096, "global_step": 194912, "epoch": 4640} {"train_loss": -7.291589736938477, "global_step": 194913, "epoch": 4640} {"train_loss": -7.275933265686035, "global_step": 194914, "epoch": 4640} {"train_loss": -7.373878479003906, "global_step": 194915, "epoch": 4640} {"train_loss": -7.301954746246338, "global_step": 194916, "epoch": 4640} {"train_loss": -7.380346298217773, "global_step": 194917, "epoch": 4640} {"train_loss": -7.3598222732543945, "global_step": 194918, "epoch": 4640} {"train_loss": -7.341407775878906, "global_step": 194919, "epoch": 4640} {"train_loss": -7.270288467407227, "global_step": 194920, "epoch": 4640} {"train_loss": -7.211353915078299, "global_step": 194921, "epoch": 4640, "val_loss": 81206.375} {"train_loss": -7.388321876525879, "global_step": 194922, "epoch": 4641} {"train_loss": -7.361123561859131, "global_step": 194923, "epoch": 4641} {"train_loss": -7.253908634185791, "global_step": 194924, "epoch": 4641} {"train_loss": -7.249294281005859, "global_step": 194925, "epoch": 4641} {"train_loss": -7.298762321472168, "global_step": 194926, "epoch": 4641} {"train_loss": -7.263607978820801, "global_step": 194927, "epoch": 4641} {"train_loss": -7.386837482452393, "global_step": 194928, "epoch": 4641} {"train_loss": -7.199573516845703, "global_step": 194929, "epoch": 4641} {"train_loss": -7.366828918457031, "global_step": 194930, "epoch": 4641} {"train_loss": -7.384055137634277, "global_step": 194931, "epoch": 4641} {"train_loss": -7.270442962646484, "global_step": 194932, "epoch": 4641} {"train_loss": -7.340047836303711, "global_step": 194933, "epoch": 4641} {"train_loss": -7.292824745178223, "global_step": 194934, "epoch": 4641} {"train_loss": -7.434739589691162, "global_step": 194935, "epoch": 4641} {"train_loss": -7.286600589752197, "global_step": 194936, "epoch": 4641} {"train_loss": -7.304010391235352, "global_step": 194937, "epoch": 4641} {"train_loss": -7.2875776290893555, "global_step": 194938, "epoch": 4641} {"train_loss": -7.331714630126953, "global_step": 194939, "epoch": 4641} {"train_loss": -7.408504486083984, "global_step": 194940, "epoch": 4641} {"train_loss": -7.349678039550781, "global_step": 194941, "epoch": 4641} {"train_loss": -7.304307460784912, "global_step": 194942, "epoch": 4641} {"train_loss": -7.4650774002075195, "global_step": 194943, "epoch": 4641} {"train_loss": -7.25184440612793, "global_step": 194944, "epoch": 4641} {"train_loss": -7.26544189453125, "global_step": 194945, "epoch": 4641} {"train_loss": -7.333822727203369, "global_step": 194946, "epoch": 4641} {"train_loss": -7.336454391479492, "global_step": 194947, "epoch": 4641} {"train_loss": -7.272278308868408, "global_step": 194948, "epoch": 4641} {"train_loss": -7.321469306945801, "global_step": 194949, "epoch": 4641} {"train_loss": -7.247466087341309, "global_step": 194950, "epoch": 4641} {"train_loss": -7.2989912033081055, "global_step": 194951, "epoch": 4641} {"train_loss": -7.231619358062744, "global_step": 194952, "epoch": 4641} {"train_loss": -7.204071044921875, "global_step": 194953, "epoch": 4641} {"train_loss": -7.277629852294922, "global_step": 194954, "epoch": 4641} {"train_loss": -6.834488868713379, "global_step": 194955, "epoch": 4641} {"train_loss": -7.095501899719238, "global_step": 194956, "epoch": 4641} {"train_loss": -7.180928707122803, "global_step": 194957, "epoch": 4641} {"train_loss": -7.067746162414551, "global_step": 194958, "epoch": 4641} {"train_loss": -7.184528827667236, "global_step": 194959, "epoch": 4641} {"train_loss": -7.294632434844971, "global_step": 194960, "epoch": 4641} {"train_loss": -7.1659626960754395, "global_step": 194961, "epoch": 4641} {"train_loss": -7.166306972503662, "global_step": 194962, "epoch": 4641} {"train_loss": -7.269456375212896, "global_step": 194963, "epoch": 4641, "val_loss": 81156.859375} {"train_loss": -7.043709754943848, "global_step": 194964, "epoch": 4642} {"train_loss": -7.261413097381592, "global_step": 194965, "epoch": 4642} {"train_loss": -7.1941070556640625, "global_step": 194966, "epoch": 4642} {"train_loss": -7.068264484405518, "global_step": 194967, "epoch": 4642} {"train_loss": -7.144063472747803, "global_step": 194968, "epoch": 4642} {"train_loss": -7.229442596435547, "global_step": 194969, "epoch": 4642} {"train_loss": -7.204151153564453, "global_step": 194970, "epoch": 4642} {"train_loss": -7.028378486633301, "global_step": 194971, "epoch": 4642} {"train_loss": -7.215182781219482, "global_step": 194972, "epoch": 4642} {"train_loss": -7.200942516326904, "global_step": 194973, "epoch": 4642} {"train_loss": -7.1752424240112305, "global_step": 194974, "epoch": 4642} {"train_loss": -7.207257270812988, "global_step": 194975, "epoch": 4642} {"train_loss": -7.225715637207031, "global_step": 194976, "epoch": 4642} {"train_loss": -7.232455253601074, "global_step": 194977, "epoch": 4642} {"train_loss": -7.210345268249512, "global_step": 194978, "epoch": 4642} {"train_loss": -7.232346534729004, "global_step": 194979, "epoch": 4642} {"train_loss": -7.11207914352417, "global_step": 194980, "epoch": 4642} {"train_loss": -7.266810417175293, "global_step": 194981, "epoch": 4642} {"train_loss": -7.14862060546875, "global_step": 194982, "epoch": 4642} {"train_loss": -7.185735702514648, "global_step": 194983, "epoch": 4642} {"train_loss": -7.096521377563477, "global_step": 194984, "epoch": 4642} {"train_loss": -7.191408157348633, "global_step": 194985, "epoch": 4642} {"train_loss": -7.278617858886719, "global_step": 194986, "epoch": 4642} {"train_loss": -7.187484264373779, "global_step": 194987, "epoch": 4642} {"train_loss": -7.282398700714111, "global_step": 194988, "epoch": 4642} {"train_loss": -7.203454971313477, "global_step": 194989, "epoch": 4642} {"train_loss": -7.204484462738037, "global_step": 194990, "epoch": 4642} {"train_loss": -7.251002311706543, "global_step": 194991, "epoch": 4642} {"train_loss": -7.200080871582031, "global_step": 194992, "epoch": 4642} {"train_loss": -7.294581413269043, "global_step": 194993, "epoch": 4642} {"train_loss": -7.246525764465332, "global_step": 194994, "epoch": 4642} {"train_loss": -7.222943305969238, "global_step": 194995, "epoch": 4642} {"train_loss": -7.312538146972656, "global_step": 194996, "epoch": 4642} {"train_loss": -7.204113960266113, "global_step": 194997, "epoch": 4642} {"train_loss": -7.270340919494629, "global_step": 194998, "epoch": 4642} {"train_loss": -7.39492130279541, "global_step": 194999, "epoch": 4642} {"train_loss": -7.238667964935303, "global_step": 195000, "epoch": 4642} {"train_loss": -7.257501602172852, "global_step": 195001, "epoch": 4642} {"train_loss": -7.32889461517334, "global_step": 195002, "epoch": 4642} {"train_loss": -7.226679801940918, "global_step": 195003, "epoch": 4642} {"train_loss": -7.224326133728027, "global_step": 195004, "epoch": 4642} {"train_loss": -7.213831231707618, "global_step": 195005, "epoch": 4642, "val_loss": 80944.171875} {"train_loss": -7.211294174194336, "global_step": 195006, "epoch": 4643} {"train_loss": -7.342165470123291, "global_step": 195007, "epoch": 4643} {"train_loss": -7.276966571807861, "global_step": 195008, "epoch": 4643} {"train_loss": -7.303470134735107, "global_step": 195009, "epoch": 4643} {"train_loss": -7.185498237609863, "global_step": 195010, "epoch": 4643} {"train_loss": -7.394079208374023, "global_step": 195011, "epoch": 4643} {"train_loss": -7.217698097229004, "global_step": 195012, "epoch": 4643} {"train_loss": -7.360012054443359, "global_step": 195013, "epoch": 4643} {"train_loss": -7.234547138214111, "global_step": 195014, "epoch": 4643} {"train_loss": -7.132134437561035, "global_step": 195015, "epoch": 4643} {"train_loss": -7.218941688537598, "global_step": 195016, "epoch": 4643} {"train_loss": -7.171509742736816, "global_step": 195017, "epoch": 4643} {"train_loss": -7.251120567321777, "global_step": 195018, "epoch": 4643} {"train_loss": -7.125080108642578, "global_step": 195019, "epoch": 4643} {"train_loss": -7.121796607971191, "global_step": 195020, "epoch": 4643} {"train_loss": -7.31165885925293, "global_step": 195021, "epoch": 4643} {"train_loss": -7.188248634338379, "global_step": 195022, "epoch": 4643} {"train_loss": -7.181843280792236, "global_step": 195023, "epoch": 4643} {"train_loss": -7.201099872589111, "global_step": 195024, "epoch": 4643} {"train_loss": -7.228672981262207, "global_step": 195025, "epoch": 4643} {"train_loss": -7.256134510040283, "global_step": 195026, "epoch": 4643} {"train_loss": -7.298095703125, "global_step": 195027, "epoch": 4643} {"train_loss": -7.248425006866455, "global_step": 195028, "epoch": 4643} {"train_loss": -7.355670928955078, "global_step": 195029, "epoch": 4643} {"train_loss": -7.136538505554199, "global_step": 195030, "epoch": 4643} {"train_loss": -7.255385398864746, "global_step": 195031, "epoch": 4643} {"train_loss": -7.225231647491455, "global_step": 195032, "epoch": 4643} {"train_loss": -7.335156440734863, "global_step": 195033, "epoch": 4643} {"train_loss": -7.27992582321167, "global_step": 195034, "epoch": 4643} {"train_loss": -7.24367618560791, "global_step": 195035, "epoch": 4643} {"train_loss": -7.225854873657227, "global_step": 195036, "epoch": 4643} {"train_loss": -7.235527515411377, "global_step": 195037, "epoch": 4643} {"train_loss": -7.391458988189697, "global_step": 195038, "epoch": 4643} {"train_loss": -7.265841960906982, "global_step": 195039, "epoch": 4643} {"train_loss": -7.422486305236816, "global_step": 195040, "epoch": 4643} {"train_loss": -7.307028293609619, "global_step": 195041, "epoch": 4643} {"train_loss": -7.280521392822266, "global_step": 195042, "epoch": 4643} {"train_loss": -7.332034111022949, "global_step": 195043, "epoch": 4643} {"train_loss": -7.330869674682617, "global_step": 195044, "epoch": 4643} {"train_loss": -7.375906467437744, "global_step": 195045, "epoch": 4643} {"train_loss": -7.3441243171691895, "global_step": 195046, "epoch": 4643} {"train_loss": -7.264512890861148, "global_step": 195047, "epoch": 4643, "val_loss": 81154.8203125} {"train_loss": -7.342329025268555, "global_step": 195048, "epoch": 4644} {"train_loss": -7.274410247802734, "global_step": 195049, "epoch": 4644} {"train_loss": -7.262001037597656, "global_step": 195050, "epoch": 4644} {"train_loss": -7.286881446838379, "global_step": 195051, "epoch": 4644} {"train_loss": -7.216836452484131, "global_step": 195052, "epoch": 4644} {"train_loss": -7.326881408691406, "global_step": 195053, "epoch": 4644} {"train_loss": -7.32058572769165, "global_step": 195054, "epoch": 4644} {"train_loss": -7.326013088226318, "global_step": 195055, "epoch": 4644} {"train_loss": -7.402398586273193, "global_step": 195056, "epoch": 4644} {"train_loss": -7.208599090576172, "global_step": 195057, "epoch": 4644} {"train_loss": -7.2634477615356445, "global_step": 195058, "epoch": 4644} {"train_loss": -7.23053503036499, "global_step": 195059, "epoch": 4644} {"train_loss": -7.228964805603027, "global_step": 195060, "epoch": 4644} {"train_loss": -7.200958728790283, "global_step": 195061, "epoch": 4644} {"train_loss": -7.301793098449707, "global_step": 195062, "epoch": 4644} {"train_loss": -7.300918102264404, "global_step": 195063, "epoch": 4644} {"train_loss": -7.2852783203125, "global_step": 195064, "epoch": 4644} {"train_loss": -7.206303596496582, "global_step": 195065, "epoch": 4644} {"train_loss": -7.19551944732666, "global_step": 195066, "epoch": 4644} {"train_loss": -7.152066230773926, "global_step": 195067, "epoch": 4644} {"train_loss": -7.222111701965332, "global_step": 195068, "epoch": 4644} {"train_loss": -7.381196975708008, "global_step": 195069, "epoch": 4644} {"train_loss": -7.18212366104126, "global_step": 195070, "epoch": 4644} {"train_loss": -7.230682373046875, "global_step": 195071, "epoch": 4644} {"train_loss": -7.30694580078125, "global_step": 195072, "epoch": 4644} {"train_loss": -7.196799278259277, "global_step": 195073, "epoch": 4644} {"train_loss": -7.243321895599365, "global_step": 195074, "epoch": 4644} {"train_loss": -7.105459690093994, "global_step": 195075, "epoch": 4644} {"train_loss": -7.238866806030273, "global_step": 195076, "epoch": 4644} {"train_loss": -7.234020233154297, "global_step": 195077, "epoch": 4644} {"train_loss": -7.255578517913818, "global_step": 195078, "epoch": 4644} {"train_loss": -7.168940544128418, "global_step": 195079, "epoch": 4644} {"train_loss": -7.071646690368652, "global_step": 195080, "epoch": 4644} {"train_loss": -7.290668487548828, "global_step": 195081, "epoch": 4644} {"train_loss": -7.13111686706543, "global_step": 195082, "epoch": 4644} {"train_loss": -7.364719390869141, "global_step": 195083, "epoch": 4644} {"train_loss": -7.195704936981201, "global_step": 195084, "epoch": 4644} {"train_loss": -7.274530410766602, "global_step": 195085, "epoch": 4644} {"train_loss": -7.219367504119873, "global_step": 195086, "epoch": 4644} {"train_loss": -7.226929664611816, "global_step": 195087, "epoch": 4644} {"train_loss": -7.283198356628418, "global_step": 195088, "epoch": 4644} {"train_loss": -7.246213685898554, "global_step": 195089, "epoch": 4644, "val_loss": 81247.59375} {"train_loss": -7.310693740844727, "global_step": 195090, "epoch": 4645} {"train_loss": -7.1421661376953125, "global_step": 195091, "epoch": 4645} {"train_loss": -7.246466159820557, "global_step": 195092, "epoch": 4645} {"train_loss": -7.279060363769531, "global_step": 195093, "epoch": 4645} {"train_loss": -7.355306148529053, "global_step": 195094, "epoch": 4645} {"train_loss": -7.243432998657227, "global_step": 195095, "epoch": 4645} {"train_loss": -7.300878524780273, "global_step": 195096, "epoch": 4645} {"train_loss": -7.269776821136475, "global_step": 195097, "epoch": 4645} {"train_loss": -7.277984142303467, "global_step": 195098, "epoch": 4645} {"train_loss": -7.172061443328857, "global_step": 195099, "epoch": 4645} {"train_loss": -7.332773685455322, "global_step": 195100, "epoch": 4645} {"train_loss": -7.333538055419922, "global_step": 195101, "epoch": 4645} {"train_loss": -7.28675651550293, "global_step": 195102, "epoch": 4645} {"train_loss": -7.2373433113098145, "global_step": 195103, "epoch": 4645} {"train_loss": -7.26389741897583, "global_step": 195104, "epoch": 4645} {"train_loss": -7.352994918823242, "global_step": 195105, "epoch": 4645} {"train_loss": -7.197061061859131, "global_step": 195106, "epoch": 4645} {"train_loss": -7.20821475982666, "global_step": 195107, "epoch": 4645} {"train_loss": -7.164972305297852, "global_step": 195108, "epoch": 4645} {"train_loss": -7.229034423828125, "global_step": 195109, "epoch": 4645} {"train_loss": -7.236053943634033, "global_step": 195110, "epoch": 4645} {"train_loss": -7.034787178039551, "global_step": 195111, "epoch": 4645} {"train_loss": -7.184456825256348, "global_step": 195112, "epoch": 4645} {"train_loss": -7.2400407791137695, "global_step": 195113, "epoch": 4645} {"train_loss": -7.066598415374756, "global_step": 195114, "epoch": 4645} {"train_loss": -7.082297325134277, "global_step": 195115, "epoch": 4645} {"train_loss": -7.152125358581543, "global_step": 195116, "epoch": 4645} {"train_loss": -7.156808853149414, "global_step": 195117, "epoch": 4645} {"train_loss": -7.153432369232178, "global_step": 195118, "epoch": 4645} {"train_loss": -7.011877059936523, "global_step": 195119, "epoch": 4645} {"train_loss": -7.000732898712158, "global_step": 195120, "epoch": 4645} {"train_loss": -7.323760032653809, "global_step": 195121, "epoch": 4645} {"train_loss": -7.1867523193359375, "global_step": 195122, "epoch": 4645} {"train_loss": -7.218249797821045, "global_step": 195123, "epoch": 4645} {"train_loss": -7.165189266204834, "global_step": 195124, "epoch": 4645} {"train_loss": -7.214883804321289, "global_step": 195125, "epoch": 4645} {"train_loss": -7.2401885986328125, "global_step": 195126, "epoch": 4645} {"train_loss": -7.281308174133301, "global_step": 195127, "epoch": 4645} {"train_loss": -7.150202751159668, "global_step": 195128, "epoch": 4645} {"train_loss": -7.131576061248779, "global_step": 195129, "epoch": 4645} {"train_loss": -7.151132583618164, "global_step": 195130, "epoch": 4645} {"train_loss": -7.20841417993818, "global_step": 195131, "epoch": 4645, "val_loss": 81169.3203125} {"train_loss": -7.241154670715332, "global_step": 195132, "epoch": 4646} {"train_loss": -7.138209819793701, "global_step": 195133, "epoch": 4646} {"train_loss": -7.374090671539307, "global_step": 195134, "epoch": 4646} {"train_loss": -7.236286640167236, "global_step": 195135, "epoch": 4646} {"train_loss": -7.16966438293457, "global_step": 195136, "epoch": 4646} {"train_loss": -7.190696716308594, "global_step": 195137, "epoch": 4646} {"train_loss": -7.202771186828613, "global_step": 195138, "epoch": 4646} {"train_loss": -7.158321380615234, "global_step": 195139, "epoch": 4646} {"train_loss": -7.2886199951171875, "global_step": 195140, "epoch": 4646} {"train_loss": -7.217094421386719, "global_step": 195141, "epoch": 4646} {"train_loss": -7.162126541137695, "global_step": 195142, "epoch": 4646} {"train_loss": -7.246410846710205, "global_step": 195143, "epoch": 4646} {"train_loss": -7.20822286605835, "global_step": 195144, "epoch": 4646} {"train_loss": -7.314295291900635, "global_step": 195145, "epoch": 4646} {"train_loss": -7.230603218078613, "global_step": 195146, "epoch": 4646} {"train_loss": -7.267237663269043, "global_step": 195147, "epoch": 4646} {"train_loss": -7.293255805969238, "global_step": 195148, "epoch": 4646} {"train_loss": -7.265260696411133, "global_step": 195149, "epoch": 4646} {"train_loss": -7.2998552322387695, "global_step": 195150, "epoch": 4646} {"train_loss": -7.310087203979492, "global_step": 195151, "epoch": 4646} {"train_loss": -7.260226249694824, "global_step": 195152, "epoch": 4646} {"train_loss": -7.234352111816406, "global_step": 195153, "epoch": 4646} {"train_loss": -7.21611213684082, "global_step": 195154, "epoch": 4646} {"train_loss": -7.258625507354736, "global_step": 195155, "epoch": 4646} {"train_loss": -7.270029544830322, "global_step": 195156, "epoch": 4646} {"train_loss": -7.148756980895996, "global_step": 195157, "epoch": 4646} {"train_loss": -7.102243423461914, "global_step": 195158, "epoch": 4646} {"train_loss": -7.265322208404541, "global_step": 195159, "epoch": 4646} {"train_loss": -6.961515426635742, "global_step": 195160, "epoch": 4646} {"train_loss": -7.276250839233398, "global_step": 195161, "epoch": 4646} {"train_loss": -7.0683674812316895, "global_step": 195162, "epoch": 4646} {"train_loss": -6.985280990600586, "global_step": 195163, "epoch": 4646} {"train_loss": -7.309767723083496, "global_step": 195164, "epoch": 4646} {"train_loss": -7.123991966247559, "global_step": 195165, "epoch": 4646} {"train_loss": -7.162202835083008, "global_step": 195166, "epoch": 4646} {"train_loss": -7.16337776184082, "global_step": 195167, "epoch": 4646} {"train_loss": -7.175686836242676, "global_step": 195168, "epoch": 4646} {"train_loss": -7.34530782699585, "global_step": 195169, "epoch": 4646} {"train_loss": -7.247978210449219, "global_step": 195170, "epoch": 4646} {"train_loss": -7.208553314208984, "global_step": 195171, "epoch": 4646} {"train_loss": -7.084451675415039, "global_step": 195172, "epoch": 4646} {"train_loss": -7.213578644252959, "global_step": 195173, "epoch": 4646, "val_loss": 81320.71875} {"train_loss": -7.0519609451293945, "global_step": 195174, "epoch": 4647} {"train_loss": -7.225170135498047, "global_step": 195175, "epoch": 4647} {"train_loss": -7.275317192077637, "global_step": 195176, "epoch": 4647} {"train_loss": -7.28025484085083, "global_step": 195177, "epoch": 4647} {"train_loss": -7.228601932525635, "global_step": 195178, "epoch": 4647} {"train_loss": -7.230950355529785, "global_step": 195179, "epoch": 4647} {"train_loss": -7.240163803100586, "global_step": 195180, "epoch": 4647} {"train_loss": -7.231293678283691, "global_step": 195181, "epoch": 4647} {"train_loss": -7.299229145050049, "global_step": 195182, "epoch": 4647} {"train_loss": -7.229335308074951, "global_step": 195183, "epoch": 4647} {"train_loss": -7.344173431396484, "global_step": 195184, "epoch": 4647} {"train_loss": -7.251554489135742, "global_step": 195185, "epoch": 4647} {"train_loss": -7.3359375, "global_step": 195186, "epoch": 4647} {"train_loss": -7.399921417236328, "global_step": 195187, "epoch": 4647} {"train_loss": -7.234616756439209, "global_step": 195188, "epoch": 4647} {"train_loss": -7.27238655090332, "global_step": 195189, "epoch": 4647} {"train_loss": -7.333729267120361, "global_step": 195190, "epoch": 4647} {"train_loss": -7.143394470214844, "global_step": 195191, "epoch": 4647} {"train_loss": -7.199489593505859, "global_step": 195192, "epoch": 4647} {"train_loss": -7.228176116943359, "global_step": 195193, "epoch": 4647} {"train_loss": -7.131652355194092, "global_step": 195194, "epoch": 4647} {"train_loss": -7.221102714538574, "global_step": 195195, "epoch": 4647} {"train_loss": -7.349448204040527, "global_step": 195196, "epoch": 4647} {"train_loss": -7.2032856941223145, "global_step": 195197, "epoch": 4647} {"train_loss": -7.295567512512207, "global_step": 195198, "epoch": 4647} {"train_loss": -7.335015773773193, "global_step": 195199, "epoch": 4647} {"train_loss": -7.149375915527344, "global_step": 195200, "epoch": 4647} {"train_loss": -7.19011116027832, "global_step": 195201, "epoch": 4647} {"train_loss": -7.216825485229492, "global_step": 195202, "epoch": 4647} {"train_loss": -7.065515995025635, "global_step": 195203, "epoch": 4647} {"train_loss": -7.218929290771484, "global_step": 195204, "epoch": 4647} {"train_loss": -7.277188777923584, "global_step": 195205, "epoch": 4647} {"train_loss": -7.227236747741699, "global_step": 195206, "epoch": 4647} {"train_loss": -7.348167896270752, "global_step": 195207, "epoch": 4647} {"train_loss": -7.231040000915527, "global_step": 195208, "epoch": 4647} {"train_loss": -7.208075523376465, "global_step": 195209, "epoch": 4647} {"train_loss": -7.358701705932617, "global_step": 195210, "epoch": 4647} {"train_loss": -7.239556789398193, "global_step": 195211, "epoch": 4647} {"train_loss": -7.112636089324951, "global_step": 195212, "epoch": 4647} {"train_loss": -7.29146146774292, "global_step": 195213, "epoch": 4647} {"train_loss": -7.24416446685791, "global_step": 195214, "epoch": 4647} {"train_loss": -7.240751879555838, "global_step": 195215, "epoch": 4647, "val_loss": 81131.6640625} {"train_loss": -7.29714298248291, "global_step": 195216, "epoch": 4648} {"train_loss": -7.166772365570068, "global_step": 195217, "epoch": 4648} {"train_loss": -7.211023807525635, "global_step": 195218, "epoch": 4648} {"train_loss": -7.208935260772705, "global_step": 195219, "epoch": 4648} {"train_loss": -7.217129707336426, "global_step": 195220, "epoch": 4648} {"train_loss": -7.224373817443848, "global_step": 195221, "epoch": 4648} {"train_loss": -7.234348773956299, "global_step": 195222, "epoch": 4648} {"train_loss": -7.2011003494262695, "global_step": 195223, "epoch": 4648} {"train_loss": -7.347019195556641, "global_step": 195224, "epoch": 4648} {"train_loss": -7.229837417602539, "global_step": 195225, "epoch": 4648} {"train_loss": -7.179632186889648, "global_step": 195226, "epoch": 4648} {"train_loss": -7.229646682739258, "global_step": 195227, "epoch": 4648} {"train_loss": -7.254908561706543, "global_step": 195228, "epoch": 4648} {"train_loss": -7.258340835571289, "global_step": 195229, "epoch": 4648} {"train_loss": -7.100931167602539, "global_step": 195230, "epoch": 4648} {"train_loss": -7.1845383644104, "global_step": 195231, "epoch": 4648} {"train_loss": -7.117392539978027, "global_step": 195232, "epoch": 4648} {"train_loss": -7.29219913482666, "global_step": 195233, "epoch": 4648} {"train_loss": -7.297771453857422, "global_step": 195234, "epoch": 4648} {"train_loss": -7.195889949798584, "global_step": 195235, "epoch": 4648} {"train_loss": -7.236617565155029, "global_step": 195236, "epoch": 4648} {"train_loss": -7.129647254943848, "global_step": 195237, "epoch": 4648} {"train_loss": -7.217680931091309, "global_step": 195238, "epoch": 4648} {"train_loss": -7.23604679107666, "global_step": 195239, "epoch": 4648} {"train_loss": -7.235276699066162, "global_step": 195240, "epoch": 4648} {"train_loss": -7.180025100708008, "global_step": 195241, "epoch": 4648} {"train_loss": -7.208439826965332, "global_step": 195242, "epoch": 4648} {"train_loss": -7.253131866455078, "global_step": 195243, "epoch": 4648} {"train_loss": -7.215738296508789, "global_step": 195244, "epoch": 4648} {"train_loss": -7.221981048583984, "global_step": 195245, "epoch": 4648} {"train_loss": -7.185693264007568, "global_step": 195246, "epoch": 4648} {"train_loss": -7.240884304046631, "global_step": 195247, "epoch": 4648} {"train_loss": -7.116060256958008, "global_step": 195248, "epoch": 4648} {"train_loss": -7.1846818923950195, "global_step": 195249, "epoch": 4648} {"train_loss": -7.326167583465576, "global_step": 195250, "epoch": 4648} {"train_loss": -7.2907514572143555, "global_step": 195251, "epoch": 4648} {"train_loss": -7.287200927734375, "global_step": 195252, "epoch": 4648} {"train_loss": -7.18938684463501, "global_step": 195253, "epoch": 4648} {"train_loss": -7.302642822265625, "global_step": 195254, "epoch": 4648} {"train_loss": -7.194334983825684, "global_step": 195255, "epoch": 4648} {"train_loss": -7.207034111022949, "global_step": 195256, "epoch": 4648} {"train_loss": -7.223176729111445, "global_step": 195257, "epoch": 4648, "val_loss": 81168.046875} {"train_loss": -7.252104759216309, "global_step": 195258, "epoch": 4649} {"train_loss": -7.228172779083252, "global_step": 195259, "epoch": 4649} {"train_loss": -7.308009147644043, "global_step": 195260, "epoch": 4649} {"train_loss": -7.342117786407471, "global_step": 195261, "epoch": 4649} {"train_loss": -7.290961265563965, "global_step": 195262, "epoch": 4649} {"train_loss": -7.286891937255859, "global_step": 195263, "epoch": 4649} {"train_loss": -7.354521751403809, "global_step": 195264, "epoch": 4649} {"train_loss": -7.396757125854492, "global_step": 195265, "epoch": 4649} {"train_loss": -7.210402488708496, "global_step": 195266, "epoch": 4649} {"train_loss": -7.263786315917969, "global_step": 195267, "epoch": 4649} {"train_loss": -7.2467732429504395, "global_step": 195268, "epoch": 4649} {"train_loss": -7.263408660888672, "global_step": 195269, "epoch": 4649} {"train_loss": -7.447798728942871, "global_step": 195270, "epoch": 4649} {"train_loss": -7.26020622253418, "global_step": 195271, "epoch": 4649} {"train_loss": -7.281264781951904, "global_step": 195272, "epoch": 4649} {"train_loss": -7.388671875, "global_step": 195273, "epoch": 4649} {"train_loss": -7.374736785888672, "global_step": 195274, "epoch": 4649} {"train_loss": -7.429443836212158, "global_step": 195275, "epoch": 4649} {"train_loss": -7.416811943054199, "global_step": 195276, "epoch": 4649} {"train_loss": -7.164687633514404, "global_step": 195277, "epoch": 4649} {"train_loss": -7.314836025238037, "global_step": 195278, "epoch": 4649} {"train_loss": -7.2591142654418945, "global_step": 195279, "epoch": 4649} {"train_loss": -7.222095489501953, "global_step": 195280, "epoch": 4649} {"train_loss": -7.325529098510742, "global_step": 195281, "epoch": 4649} {"train_loss": -7.283211708068848, "global_step": 195282, "epoch": 4649} {"train_loss": -7.268126964569092, "global_step": 195283, "epoch": 4649} {"train_loss": -7.273797035217285, "global_step": 195284, "epoch": 4649} {"train_loss": -7.317800045013428, "global_step": 195285, "epoch": 4649} {"train_loss": -7.266119956970215, "global_step": 195286, "epoch": 4649} {"train_loss": -7.179137229919434, "global_step": 195287, "epoch": 4649} {"train_loss": -7.358665943145752, "global_step": 195288, "epoch": 4649} {"train_loss": -7.272457599639893, "global_step": 195289, "epoch": 4649} {"train_loss": -7.269796371459961, "global_step": 195290, "epoch": 4649} {"train_loss": -7.33528995513916, "global_step": 195291, "epoch": 4649} {"train_loss": -7.059869766235352, "global_step": 195292, "epoch": 4649} {"train_loss": -7.048401832580566, "global_step": 195293, "epoch": 4649} {"train_loss": -7.107738494873047, "global_step": 195294, "epoch": 4649} {"train_loss": -7.200625896453857, "global_step": 195295, "epoch": 4649} {"train_loss": -7.102558612823486, "global_step": 195296, "epoch": 4649} {"train_loss": -7.090510368347168, "global_step": 195297, "epoch": 4649} {"train_loss": -7.093331336975098, "global_step": 195298, "epoch": 4649} {"train_loss": -7.2613472030276345, "global_step": 195299, "epoch": 4649, "val_loss": 81249.265625} {"train_loss": -7.2916789054870605, "global_step": 195300, "epoch": 4650} {"train_loss": -7.172878742218018, "global_step": 195301, "epoch": 4650} {"train_loss": -7.266047477722168, "global_step": 195302, "epoch": 4650} {"train_loss": -7.29514217376709, "global_step": 195303, "epoch": 4650} {"train_loss": -7.191096305847168, "global_step": 195304, "epoch": 4650} {"train_loss": -7.220334529876709, "global_step": 195305, "epoch": 4650} {"train_loss": -7.299983501434326, "global_step": 195306, "epoch": 4650} {"train_loss": -7.209549903869629, "global_step": 195307, "epoch": 4650} {"train_loss": -7.256831645965576, "global_step": 195308, "epoch": 4650} {"train_loss": -7.289532661437988, "global_step": 195309, "epoch": 4650} {"train_loss": -7.1583170890808105, "global_step": 195310, "epoch": 4650} {"train_loss": -7.337660789489746, "global_step": 195311, "epoch": 4650} {"train_loss": -7.2489423751831055, "global_step": 195312, "epoch": 4650} {"train_loss": -7.323687553405762, "global_step": 195313, "epoch": 4650} {"train_loss": -7.311910629272461, "global_step": 195314, "epoch": 4650} {"train_loss": -7.166929244995117, "global_step": 195315, "epoch": 4650} {"train_loss": -7.385880470275879, "global_step": 195316, "epoch": 4650} {"train_loss": -7.273664474487305, "global_step": 195317, "epoch": 4650} {"train_loss": -7.162487506866455, "global_step": 195318, "epoch": 4650} {"train_loss": -7.315669059753418, "global_step": 195319, "epoch": 4650} {"train_loss": -7.2224555015563965, "global_step": 195320, "epoch": 4650} {"train_loss": -7.169034957885742, "global_step": 195321, "epoch": 4650} {"train_loss": -7.363654613494873, "global_step": 195322, "epoch": 4650} {"train_loss": -7.336375713348389, "global_step": 195323, "epoch": 4650} {"train_loss": -7.171167373657227, "global_step": 195324, "epoch": 4650} {"train_loss": -7.251649856567383, "global_step": 195325, "epoch": 4650} {"train_loss": -7.193848609924316, "global_step": 195326, "epoch": 4650} {"train_loss": -7.2852888107299805, "global_step": 195327, "epoch": 4650} {"train_loss": -7.315325736999512, "global_step": 195328, "epoch": 4650} {"train_loss": -7.221189498901367, "global_step": 195329, "epoch": 4650} {"train_loss": -7.299566745758057, "global_step": 195330, "epoch": 4650} {"train_loss": -7.120207786560059, "global_step": 195331, "epoch": 4650} {"train_loss": -7.205296039581299, "global_step": 195332, "epoch": 4650} {"train_loss": -7.141600608825684, "global_step": 195333, "epoch": 4650} {"train_loss": -7.047791004180908, "global_step": 195334, "epoch": 4650} {"train_loss": -7.372500419616699, "global_step": 195335, "epoch": 4650} {"train_loss": -7.276716709136963, "global_step": 195336, "epoch": 4650} {"train_loss": -7.1702375411987305, "global_step": 195337, "epoch": 4650} {"train_loss": -7.232892990112305, "global_step": 195338, "epoch": 4650} {"train_loss": -7.099147796630859, "global_step": 195339, "epoch": 4650} {"train_loss": -7.194606781005859, "global_step": 195340, "epoch": 4650} {"train_loss": -7.239089772814796, "global_step": 195341, "epoch": 4650, "train/sim_max_reward_0": 0.2659995079822289, "train/sim_max_reward_1": 0.9533969026247155, "train/sim_max_reward_2": 0.3102972038394684, "train/sim_max_reward_3": 0.1482811445909901, "train/sim_max_reward_4": 0.41903291016078487, "train/sim_max_reward_5": 0.9625997949915539, "test/sim_max_reward_4500000": 0.9447997695177197, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9532792970334786, "test/sim_max_reward_4500004": 0.15902842435853043, "test/sim_max_reward_4500005": 0.18493997166469406, "test/sim_max_reward_4500006": 0.8733814293141853, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.14774863886302964, "test/sim_max_reward_4500009": 0.05304639352128416, "test/sim_max_reward_4500010": 0.11933189353453136, "test/sim_max_reward_4500011": 0.059829530371475606, "test/sim_max_reward_4500012": 1.0, "test/sim_max_reward_4500013": 0.42665618803510647, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.9955973307887043, "test/sim_max_reward_4500016": 0.016961657281076407, "test/sim_max_reward_4500017": 0.05895488550163935, "test/sim_max_reward_4500018": 0.7420929518003577, "test/sim_max_reward_4500019": 0.9910350928273123, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.4713447608814831, "test/sim_max_reward_4500022": 0.9571007831888836, "test/sim_max_reward_4500023": 0.9405253808029891, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8721789468988639, "test/sim_max_reward_4500026": 0.23735430279179118, "test/sim_max_reward_4500027": 0.8946298222227351, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.06940379861651115, "test/sim_max_reward_4500030": 0.9086023162135574, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.7482921892705903, "test/sim_max_reward_4500034": 0.8772152970229959, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 0.9836249840919004, "test/sim_max_reward_4500037": 0.969259898249763, "test/sim_max_reward_4500038": 0.8703197201775944, "test/sim_max_reward_4500039": 0.9963850629474879, "test/sim_max_reward_4500040": 0.9732726054321239, "test/sim_max_reward_4500041": 0.9889834660461093, "test/sim_max_reward_4500042": 0.036974246717543444, "test/sim_max_reward_4500043": 0.4710482792682415, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.3896725041282857, "test/sim_max_reward_4500046": 0.3745055827176852, "test/sim_max_reward_4500047": 0.8407134594745921, "test/sim_max_reward_4500048": 0.9224107267360335, "test/sim_max_reward_4500049": 0.022439648510091094, "train/mean_score": 0.509934577364957, "test/mean_score": 0.555552563746916, "val_loss": 80992.984375} {"train_loss": -7.204031944274902, "global_step": 195342, "epoch": 4651} {"train_loss": -7.2081074714660645, "global_step": 195343, "epoch": 4651} {"train_loss": -7.237054347991943, "global_step": 195344, "epoch": 4651} {"train_loss": -7.162103176116943, "global_step": 195345, "epoch": 4651} {"train_loss": -7.223809242248535, "global_step": 195346, "epoch": 4651} {"train_loss": -7.110220909118652, "global_step": 195347, "epoch": 4651} {"train_loss": -7.079298973083496, "global_step": 195348, "epoch": 4651} {"train_loss": -7.268067359924316, "global_step": 195349, "epoch": 4651} {"train_loss": -7.137021064758301, "global_step": 195350, "epoch": 4651} {"train_loss": -7.149591445922852, "global_step": 195351, "epoch": 4651} {"train_loss": -7.172482013702393, "global_step": 195352, "epoch": 4651} {"train_loss": -7.20770263671875, "global_step": 195353, "epoch": 4651} {"train_loss": -7.303439140319824, "global_step": 195354, "epoch": 4651} {"train_loss": -7.080554962158203, "global_step": 195355, "epoch": 4651} {"train_loss": -7.261567115783691, "global_step": 195356, "epoch": 4651} {"train_loss": -7.029791831970215, "global_step": 195357, "epoch": 4651} {"train_loss": -7.160801887512207, "global_step": 195358, "epoch": 4651} {"train_loss": -7.264536380767822, "global_step": 195359, "epoch": 4651} {"train_loss": -7.073418617248535, "global_step": 195360, "epoch": 4651} {"train_loss": -7.161238193511963, "global_step": 195361, "epoch": 4651} {"train_loss": -7.065238952636719, "global_step": 195362, "epoch": 4651} {"train_loss": -7.1434807777404785, "global_step": 195363, "epoch": 4651} {"train_loss": -7.176623344421387, "global_step": 195364, "epoch": 4651} {"train_loss": -7.171444892883301, "global_step": 195365, "epoch": 4651} {"train_loss": -7.115042209625244, "global_step": 195366, "epoch": 4651} {"train_loss": -7.208258628845215, "global_step": 195367, "epoch": 4651} {"train_loss": -7.179010391235352, "global_step": 195368, "epoch": 4651} {"train_loss": -7.1710100173950195, "global_step": 195369, "epoch": 4651} {"train_loss": -7.137442588806152, "global_step": 195370, "epoch": 4651} {"train_loss": -7.2300825119018555, "global_step": 195371, "epoch": 4651} {"train_loss": -7.184349060058594, "global_step": 195372, "epoch": 4651} {"train_loss": -7.108155250549316, "global_step": 195373, "epoch": 4651} {"train_loss": -7.132014751434326, "global_step": 195374, "epoch": 4651} {"train_loss": -7.238026142120361, "global_step": 195375, "epoch": 4651} {"train_loss": -7.312647819519043, "global_step": 195376, "epoch": 4651} {"train_loss": -7.249467372894287, "global_step": 195377, "epoch": 4651} {"train_loss": -7.162911415100098, "global_step": 195378, "epoch": 4651} {"train_loss": -7.202789306640625, "global_step": 195379, "epoch": 4651} {"train_loss": -7.1964545249938965, "global_step": 195380, "epoch": 4651} {"train_loss": -7.128544807434082, "global_step": 195381, "epoch": 4651} {"train_loss": -7.126012802124023, "global_step": 195382, "epoch": 4651} {"train_loss": -7.1753224191211515, "global_step": 195383, "epoch": 4651, "val_loss": 81372.140625} {"train_loss": -7.135036945343018, "global_step": 195384, "epoch": 4652} {"train_loss": -7.1479692459106445, "global_step": 195385, "epoch": 4652} {"train_loss": -7.180840492248535, "global_step": 195386, "epoch": 4652} {"train_loss": -7.185240745544434, "global_step": 195387, "epoch": 4652} {"train_loss": -7.297746658325195, "global_step": 195388, "epoch": 4652} {"train_loss": -7.2900800704956055, "global_step": 195389, "epoch": 4652} {"train_loss": -7.334829330444336, "global_step": 195390, "epoch": 4652} {"train_loss": -7.156678199768066, "global_step": 195391, "epoch": 4652} {"train_loss": -7.378987789154053, "global_step": 195392, "epoch": 4652} {"train_loss": -7.335563659667969, "global_step": 195393, "epoch": 4652} {"train_loss": -7.1551513671875, "global_step": 195394, "epoch": 4652} {"train_loss": -7.271350860595703, "global_step": 195395, "epoch": 4652} {"train_loss": -7.299505233764648, "global_step": 195396, "epoch": 4652} {"train_loss": -7.145293235778809, "global_step": 195397, "epoch": 4652} {"train_loss": -7.2886128425598145, "global_step": 195398, "epoch": 4652} {"train_loss": -7.354084014892578, "global_step": 195399, "epoch": 4652} {"train_loss": -7.220086097717285, "global_step": 195400, "epoch": 4652} {"train_loss": -7.2744293212890625, "global_step": 195401, "epoch": 4652} {"train_loss": -7.333630561828613, "global_step": 195402, "epoch": 4652} {"train_loss": -7.362494468688965, "global_step": 195403, "epoch": 4652} {"train_loss": -7.43333625793457, "global_step": 195404, "epoch": 4652} {"train_loss": -7.349116325378418, "global_step": 195405, "epoch": 4652} {"train_loss": -7.361240863800049, "global_step": 195406, "epoch": 4652} {"train_loss": -7.343278408050537, "global_step": 195407, "epoch": 4652} {"train_loss": -7.1798810958862305, "global_step": 195408, "epoch": 4652} {"train_loss": -7.218560695648193, "global_step": 195409, "epoch": 4652} {"train_loss": -7.269463539123535, "global_step": 195410, "epoch": 4652} {"train_loss": -7.386375904083252, "global_step": 195411, "epoch": 4652} {"train_loss": -7.27537727355957, "global_step": 195412, "epoch": 4652} {"train_loss": -7.274713039398193, "global_step": 195413, "epoch": 4652} {"train_loss": -7.235934257507324, "global_step": 195414, "epoch": 4652} {"train_loss": -7.204232692718506, "global_step": 195415, "epoch": 4652} {"train_loss": -7.421802520751953, "global_step": 195416, "epoch": 4652} {"train_loss": -7.212774753570557, "global_step": 195417, "epoch": 4652} {"train_loss": -7.258347511291504, "global_step": 195418, "epoch": 4652} {"train_loss": -7.21380615234375, "global_step": 195419, "epoch": 4652} {"train_loss": -7.266887664794922, "global_step": 195420, "epoch": 4652} {"train_loss": -7.273448467254639, "global_step": 195421, "epoch": 4652} {"train_loss": -7.146154403686523, "global_step": 195422, "epoch": 4652} {"train_loss": -7.107330322265625, "global_step": 195423, "epoch": 4652} {"train_loss": -7.174895286560059, "global_step": 195424, "epoch": 4652} {"train_loss": -7.260545934949603, "global_step": 195425, "epoch": 4652, "val_loss": 81104.375} {"train_loss": -7.107714653015137, "global_step": 195426, "epoch": 4653} {"train_loss": -7.233325481414795, "global_step": 195427, "epoch": 4653} {"train_loss": -7.237722396850586, "global_step": 195428, "epoch": 4653} {"train_loss": -7.1605987548828125, "global_step": 195429, "epoch": 4653} {"train_loss": -7.258519172668457, "global_step": 195430, "epoch": 4653} {"train_loss": -7.138858318328857, "global_step": 195431, "epoch": 4653} {"train_loss": -7.315028667449951, "global_step": 195432, "epoch": 4653} {"train_loss": -7.158495903015137, "global_step": 195433, "epoch": 4653} {"train_loss": -7.23242712020874, "global_step": 195434, "epoch": 4653} {"train_loss": -7.223793029785156, "global_step": 195435, "epoch": 4653} {"train_loss": -7.290373802185059, "global_step": 195436, "epoch": 4653} {"train_loss": -7.2349629402160645, "global_step": 195437, "epoch": 4653} {"train_loss": -7.257584095001221, "global_step": 195438, "epoch": 4653} {"train_loss": -7.368228912353516, "global_step": 195439, "epoch": 4653} {"train_loss": -7.2441887855529785, "global_step": 195440, "epoch": 4653} {"train_loss": -7.273526191711426, "global_step": 195441, "epoch": 4653} {"train_loss": -7.249926567077637, "global_step": 195442, "epoch": 4653} {"train_loss": -7.1714887619018555, "global_step": 195443, "epoch": 4653} {"train_loss": -7.2192792892456055, "global_step": 195444, "epoch": 4653} {"train_loss": -7.228572368621826, "global_step": 195445, "epoch": 4653} {"train_loss": -7.445598602294922, "global_step": 195446, "epoch": 4653} {"train_loss": -7.2905168533325195, "global_step": 195447, "epoch": 4653} {"train_loss": -7.321866989135742, "global_step": 195448, "epoch": 4653} {"train_loss": -7.036579132080078, "global_step": 195449, "epoch": 4653} {"train_loss": -7.068736553192139, "global_step": 195450, "epoch": 4653} {"train_loss": -7.307576656341553, "global_step": 195451, "epoch": 4653} {"train_loss": -7.150254249572754, "global_step": 195452, "epoch": 4653} {"train_loss": -7.1818342208862305, "global_step": 195453, "epoch": 4653} {"train_loss": -7.130001068115234, "global_step": 195454, "epoch": 4653} {"train_loss": -7.151863098144531, "global_step": 195455, "epoch": 4653} {"train_loss": -7.192410469055176, "global_step": 195456, "epoch": 4653} {"train_loss": -7.167173862457275, "global_step": 195457, "epoch": 4653} {"train_loss": -7.252246856689453, "global_step": 195458, "epoch": 4653} {"train_loss": -7.194873332977295, "global_step": 195459, "epoch": 4653} {"train_loss": -7.069589614868164, "global_step": 195460, "epoch": 4653} {"train_loss": -7.157329082489014, "global_step": 195461, "epoch": 4653} {"train_loss": -7.141263008117676, "global_step": 195462, "epoch": 4653} {"train_loss": -7.221042633056641, "global_step": 195463, "epoch": 4653} {"train_loss": -7.209633827209473, "global_step": 195464, "epoch": 4653} {"train_loss": -7.273953914642334, "global_step": 195465, "epoch": 4653} {"train_loss": -7.083752632141113, "global_step": 195466, "epoch": 4653} {"train_loss": -7.212412641161964, "global_step": 195467, "epoch": 4653, "val_loss": 81294.7578125} {"train_loss": -7.162322998046875, "global_step": 195468, "epoch": 4654} {"train_loss": -7.18875789642334, "global_step": 195469, "epoch": 4654} {"train_loss": -7.251113414764404, "global_step": 195470, "epoch": 4654} {"train_loss": -7.226403713226318, "global_step": 195471, "epoch": 4654} {"train_loss": -7.221279144287109, "global_step": 195472, "epoch": 4654} {"train_loss": -7.295164108276367, "global_step": 195473, "epoch": 4654} {"train_loss": -7.21877908706665, "global_step": 195474, "epoch": 4654} {"train_loss": -7.184831619262695, "global_step": 195475, "epoch": 4654} {"train_loss": -7.288785934448242, "global_step": 195476, "epoch": 4654} {"train_loss": -7.356095314025879, "global_step": 195477, "epoch": 4654} {"train_loss": -7.287117958068848, "global_step": 195478, "epoch": 4654} {"train_loss": -7.256923198699951, "global_step": 195479, "epoch": 4654} {"train_loss": -7.336123466491699, "global_step": 195480, "epoch": 4654} {"train_loss": -7.218939781188965, "global_step": 195481, "epoch": 4654} {"train_loss": -7.241208076477051, "global_step": 195482, "epoch": 4654} {"train_loss": -7.193406105041504, "global_step": 195483, "epoch": 4654} {"train_loss": -7.144372940063477, "global_step": 195484, "epoch": 4654} {"train_loss": -7.135115623474121, "global_step": 195485, "epoch": 4654} {"train_loss": -7.236452579498291, "global_step": 195486, "epoch": 4654} {"train_loss": -7.173424243927002, "global_step": 195487, "epoch": 4654} {"train_loss": -7.239215850830078, "global_step": 195488, "epoch": 4654} {"train_loss": -7.150493621826172, "global_step": 195489, "epoch": 4654} {"train_loss": -7.196206092834473, "global_step": 195490, "epoch": 4654} {"train_loss": -7.074771881103516, "global_step": 195491, "epoch": 4654} {"train_loss": -7.141180992126465, "global_step": 195492, "epoch": 4654} {"train_loss": -7.217815399169922, "global_step": 195493, "epoch": 4654} {"train_loss": -7.2722578048706055, "global_step": 195494, "epoch": 4654} {"train_loss": -7.17410945892334, "global_step": 195495, "epoch": 4654} {"train_loss": -7.226685523986816, "global_step": 195496, "epoch": 4654} {"train_loss": -7.211194038391113, "global_step": 195497, "epoch": 4654} {"train_loss": -7.248393535614014, "global_step": 195498, "epoch": 4654} {"train_loss": -7.176654815673828, "global_step": 195499, "epoch": 4654} {"train_loss": -7.229098796844482, "global_step": 195500, "epoch": 4654} {"train_loss": -7.222409248352051, "global_step": 195501, "epoch": 4654} {"train_loss": -7.34854793548584, "global_step": 195502, "epoch": 4654} {"train_loss": -7.215396881103516, "global_step": 195503, "epoch": 4654} {"train_loss": -7.200525283813477, "global_step": 195504, "epoch": 4654} {"train_loss": -7.325098991394043, "global_step": 195505, "epoch": 4654} {"train_loss": -7.281470775604248, "global_step": 195506, "epoch": 4654} {"train_loss": -7.266454696655273, "global_step": 195507, "epoch": 4654} {"train_loss": -7.271454811096191, "global_step": 195508, "epoch": 4654} {"train_loss": -7.230356375376384, "global_step": 195509, "epoch": 4654, "val_loss": 81276.3671875} {"train_loss": -7.372463226318359, "global_step": 195510, "epoch": 4655} {"train_loss": -7.255265235900879, "global_step": 195511, "epoch": 4655} {"train_loss": -7.330535411834717, "global_step": 195512, "epoch": 4655} {"train_loss": -7.288419723510742, "global_step": 195513, "epoch": 4655} {"train_loss": -7.294464588165283, "global_step": 195514, "epoch": 4655} {"train_loss": -7.329949378967285, "global_step": 195515, "epoch": 4655} {"train_loss": -7.302445411682129, "global_step": 195516, "epoch": 4655} {"train_loss": -7.250204086303711, "global_step": 195517, "epoch": 4655} {"train_loss": -7.305270195007324, "global_step": 195518, "epoch": 4655} {"train_loss": -7.317474365234375, "global_step": 195519, "epoch": 4655} {"train_loss": -7.316604137420654, "global_step": 195520, "epoch": 4655} {"train_loss": -7.325629234313965, "global_step": 195521, "epoch": 4655} {"train_loss": -7.229262351989746, "global_step": 195522, "epoch": 4655} {"train_loss": -7.231230735778809, "global_step": 195523, "epoch": 4655} {"train_loss": -7.3321943283081055, "global_step": 195524, "epoch": 4655} {"train_loss": -7.353872776031494, "global_step": 195525, "epoch": 4655} {"train_loss": -7.275877475738525, "global_step": 195526, "epoch": 4655} {"train_loss": -7.373798370361328, "global_step": 195527, "epoch": 4655} {"train_loss": -7.289144515991211, "global_step": 195528, "epoch": 4655} {"train_loss": -7.399574279785156, "global_step": 195529, "epoch": 4655} {"train_loss": -7.221245765686035, "global_step": 195530, "epoch": 4655} {"train_loss": -7.457103729248047, "global_step": 195531, "epoch": 4655} {"train_loss": -7.330628871917725, "global_step": 195532, "epoch": 4655} {"train_loss": -7.3814377784729, "global_step": 195533, "epoch": 4655} {"train_loss": -7.301318168640137, "global_step": 195534, "epoch": 4655} {"train_loss": -7.356173515319824, "global_step": 195535, "epoch": 4655} {"train_loss": -7.351043701171875, "global_step": 195536, "epoch": 4655} {"train_loss": -7.24711799621582, "global_step": 195537, "epoch": 4655} {"train_loss": -7.264835357666016, "global_step": 195538, "epoch": 4655} {"train_loss": -7.412757396697998, "global_step": 195539, "epoch": 4655} {"train_loss": -7.296677589416504, "global_step": 195540, "epoch": 4655} {"train_loss": -7.228386878967285, "global_step": 195541, "epoch": 4655} {"train_loss": -7.297525405883789, "global_step": 195542, "epoch": 4655} {"train_loss": -7.219435691833496, "global_step": 195543, "epoch": 4655} {"train_loss": -7.376324653625488, "global_step": 195544, "epoch": 4655} {"train_loss": -7.278947830200195, "global_step": 195545, "epoch": 4655} {"train_loss": -7.292364597320557, "global_step": 195546, "epoch": 4655} {"train_loss": -7.280160427093506, "global_step": 195547, "epoch": 4655} {"train_loss": -7.321554183959961, "global_step": 195548, "epoch": 4655} {"train_loss": -7.227901458740234, "global_step": 195549, "epoch": 4655} {"train_loss": -7.381660461425781, "global_step": 195550, "epoch": 4655} {"train_loss": -7.310420592625936, "global_step": 195551, "epoch": 4655, "val_loss": 81223.859375} {"train_loss": -7.2499003410339355, "global_step": 195552, "epoch": 4656} {"train_loss": -7.295160293579102, "global_step": 195553, "epoch": 4656} {"train_loss": -7.314846992492676, "global_step": 195554, "epoch": 4656} {"train_loss": -7.332047939300537, "global_step": 195555, "epoch": 4656} {"train_loss": -7.266088962554932, "global_step": 195556, "epoch": 4656} {"train_loss": -7.418217182159424, "global_step": 195557, "epoch": 4656} {"train_loss": -7.28780460357666, "global_step": 195558, "epoch": 4656} {"train_loss": -7.312016487121582, "global_step": 195559, "epoch": 4656} {"train_loss": -7.326472282409668, "global_step": 195560, "epoch": 4656} {"train_loss": -7.280141830444336, "global_step": 195561, "epoch": 4656} {"train_loss": -7.2346296310424805, "global_step": 195562, "epoch": 4656} {"train_loss": -7.242664337158203, "global_step": 195563, "epoch": 4656} {"train_loss": -7.324360370635986, "global_step": 195564, "epoch": 4656} {"train_loss": -7.221675872802734, "global_step": 195565, "epoch": 4656} {"train_loss": -7.277952194213867, "global_step": 195566, "epoch": 4656} {"train_loss": -7.285134792327881, "global_step": 195567, "epoch": 4656} {"train_loss": -7.230907440185547, "global_step": 195568, "epoch": 4656} {"train_loss": -7.308441638946533, "global_step": 195569, "epoch": 4656} {"train_loss": -7.191629409790039, "global_step": 195570, "epoch": 4656} {"train_loss": -7.263553619384766, "global_step": 195571, "epoch": 4656} {"train_loss": -7.15681791305542, "global_step": 195572, "epoch": 4656} {"train_loss": -7.139925956726074, "global_step": 195573, "epoch": 4656} {"train_loss": -7.299500465393066, "global_step": 195574, "epoch": 4656} {"train_loss": -7.243298530578613, "global_step": 195575, "epoch": 4656} {"train_loss": -7.311629295349121, "global_step": 195576, "epoch": 4656} {"train_loss": -7.309410095214844, "global_step": 195577, "epoch": 4656} {"train_loss": -7.211329936981201, "global_step": 195578, "epoch": 4656} {"train_loss": -7.3047194480896, "global_step": 195579, "epoch": 4656} {"train_loss": -7.306817054748535, "global_step": 195580, "epoch": 4656} {"train_loss": -7.219847202301025, "global_step": 195581, "epoch": 4656} {"train_loss": -7.311237335205078, "global_step": 195582, "epoch": 4656} {"train_loss": -7.222128868103027, "global_step": 195583, "epoch": 4656} {"train_loss": -7.344261169433594, "global_step": 195584, "epoch": 4656} {"train_loss": -7.157482624053955, "global_step": 195585, "epoch": 4656} {"train_loss": -7.287622451782227, "global_step": 195586, "epoch": 4656} {"train_loss": -7.196196556091309, "global_step": 195587, "epoch": 4656} {"train_loss": -7.290241718292236, "global_step": 195588, "epoch": 4656} {"train_loss": -7.123963356018066, "global_step": 195589, "epoch": 4656} {"train_loss": -7.210379600524902, "global_step": 195590, "epoch": 4656} {"train_loss": -7.237704277038574, "global_step": 195591, "epoch": 4656} {"train_loss": -7.109596252441406, "global_step": 195592, "epoch": 4656} {"train_loss": -7.257778326670329, "global_step": 195593, "epoch": 4656, "val_loss": 81478.8125} {"train_loss": -7.171799659729004, "global_step": 195594, "epoch": 4657} {"train_loss": -7.0634613037109375, "global_step": 195595, "epoch": 4657} {"train_loss": -7.333941459655762, "global_step": 195596, "epoch": 4657} {"train_loss": -7.253141403198242, "global_step": 195597, "epoch": 4657} {"train_loss": -7.176319122314453, "global_step": 195598, "epoch": 4657} {"train_loss": -7.365357398986816, "global_step": 195599, "epoch": 4657} {"train_loss": -7.292229652404785, "global_step": 195600, "epoch": 4657} {"train_loss": -7.2954301834106445, "global_step": 195601, "epoch": 4657} {"train_loss": -7.276268005371094, "global_step": 195602, "epoch": 4657} {"train_loss": -7.284856796264648, "global_step": 195603, "epoch": 4657} {"train_loss": -7.309844017028809, "global_step": 195604, "epoch": 4657} {"train_loss": -7.318597793579102, "global_step": 195605, "epoch": 4657} {"train_loss": -7.2837066650390625, "global_step": 195606, "epoch": 4657} {"train_loss": -7.299659729003906, "global_step": 195607, "epoch": 4657} {"train_loss": -7.363792419433594, "global_step": 195608, "epoch": 4657} {"train_loss": -7.458950996398926, "global_step": 195609, "epoch": 4657} {"train_loss": -7.319827556610107, "global_step": 195610, "epoch": 4657} {"train_loss": -7.350155830383301, "global_step": 195611, "epoch": 4657} {"train_loss": -7.360601425170898, "global_step": 195612, "epoch": 4657} {"train_loss": -7.250139236450195, "global_step": 195613, "epoch": 4657} {"train_loss": -7.158306121826172, "global_step": 195614, "epoch": 4657} {"train_loss": -7.278253555297852, "global_step": 195615, "epoch": 4657} {"train_loss": -7.208276748657227, "global_step": 195616, "epoch": 4657} {"train_loss": -7.299503326416016, "global_step": 195617, "epoch": 4657} {"train_loss": -7.150473117828369, "global_step": 195618, "epoch": 4657} {"train_loss": -7.367962837219238, "global_step": 195619, "epoch": 4657} {"train_loss": -7.301372051239014, "global_step": 195620, "epoch": 4657} {"train_loss": -7.29485559463501, "global_step": 195621, "epoch": 4657} {"train_loss": -7.285505294799805, "global_step": 195622, "epoch": 4657} {"train_loss": -7.356127738952637, "global_step": 195623, "epoch": 4657} {"train_loss": -7.130383491516113, "global_step": 195624, "epoch": 4657} {"train_loss": -7.159976005554199, "global_step": 195625, "epoch": 4657} {"train_loss": -7.289229869842529, "global_step": 195626, "epoch": 4657} {"train_loss": -7.328071117401123, "global_step": 195627, "epoch": 4657} {"train_loss": -7.257033348083496, "global_step": 195628, "epoch": 4657} {"train_loss": -7.3180341720581055, "global_step": 195629, "epoch": 4657} {"train_loss": -7.157980442047119, "global_step": 195630, "epoch": 4657} {"train_loss": -7.279921054840088, "global_step": 195631, "epoch": 4657} {"train_loss": -7.368622779846191, "global_step": 195632, "epoch": 4657} {"train_loss": -7.285955429077148, "global_step": 195633, "epoch": 4657} {"train_loss": -7.299539566040039, "global_step": 195634, "epoch": 4657} {"train_loss": -7.278724568230765, "global_step": 195635, "epoch": 4657, "val_loss": 81357.7265625} {"train_loss": -7.198906421661377, "global_step": 195636, "epoch": 4658} {"train_loss": -7.266452789306641, "global_step": 195637, "epoch": 4658} {"train_loss": -7.342392921447754, "global_step": 195638, "epoch": 4658} {"train_loss": -7.312971115112305, "global_step": 195639, "epoch": 4658} {"train_loss": -7.265911102294922, "global_step": 195640, "epoch": 4658} {"train_loss": -7.29117488861084, "global_step": 195641, "epoch": 4658} {"train_loss": -7.1652936935424805, "global_step": 195642, "epoch": 4658} {"train_loss": -7.3716630935668945, "global_step": 195643, "epoch": 4658} {"train_loss": -7.315591812133789, "global_step": 195644, "epoch": 4658} {"train_loss": -7.33000373840332, "global_step": 195645, "epoch": 4658} {"train_loss": -7.247722625732422, "global_step": 195646, "epoch": 4658} {"train_loss": -7.262116432189941, "global_step": 195647, "epoch": 4658} {"train_loss": -7.361185073852539, "global_step": 195648, "epoch": 4658} {"train_loss": -7.37370491027832, "global_step": 195649, "epoch": 4658} {"train_loss": -7.281313896179199, "global_step": 195650, "epoch": 4658} {"train_loss": -7.174717903137207, "global_step": 195651, "epoch": 4658} {"train_loss": -7.2259111404418945, "global_step": 195652, "epoch": 4658} {"train_loss": -7.31194543838501, "global_step": 195653, "epoch": 4658} {"train_loss": -7.266567230224609, "global_step": 195654, "epoch": 4658} {"train_loss": -7.143328666687012, "global_step": 195655, "epoch": 4658} {"train_loss": -7.144455909729004, "global_step": 195656, "epoch": 4658} {"train_loss": -7.341452121734619, "global_step": 195657, "epoch": 4658} {"train_loss": -7.185900688171387, "global_step": 195658, "epoch": 4658} {"train_loss": -6.9030585289001465, "global_step": 195659, "epoch": 4658} {"train_loss": -7.265069961547852, "global_step": 195660, "epoch": 4658} {"train_loss": -7.122340679168701, "global_step": 195661, "epoch": 4658} {"train_loss": -6.972650527954102, "global_step": 195662, "epoch": 4658} {"train_loss": -7.23684024810791, "global_step": 195663, "epoch": 4658} {"train_loss": -7.187864303588867, "global_step": 195664, "epoch": 4658} {"train_loss": -7.07304573059082, "global_step": 195665, "epoch": 4658} {"train_loss": -7.133640289306641, "global_step": 195666, "epoch": 4658} {"train_loss": -7.272339820861816, "global_step": 195667, "epoch": 4658} {"train_loss": -7.0613789558410645, "global_step": 195668, "epoch": 4658} {"train_loss": -7.240864276885986, "global_step": 195669, "epoch": 4658} {"train_loss": -7.130494594573975, "global_step": 195670, "epoch": 4658} {"train_loss": -7.169978618621826, "global_step": 195671, "epoch": 4658} {"train_loss": -7.290154457092285, "global_step": 195672, "epoch": 4658} {"train_loss": -7.233416557312012, "global_step": 195673, "epoch": 4658} {"train_loss": -7.196990489959717, "global_step": 195674, "epoch": 4658} {"train_loss": -7.056462287902832, "global_step": 195675, "epoch": 4658} {"train_loss": -7.217679977416992, "global_step": 195676, "epoch": 4658} {"train_loss": -7.21552898770287, "global_step": 195677, "epoch": 4658, "val_loss": 81402.0859375} {"train_loss": -7.204694747924805, "global_step": 195678, "epoch": 4659} {"train_loss": -7.209226608276367, "global_step": 195679, "epoch": 4659} {"train_loss": -7.08748722076416, "global_step": 195680, "epoch": 4659} {"train_loss": -7.1443305015563965, "global_step": 195681, "epoch": 4659} {"train_loss": -7.267401218414307, "global_step": 195682, "epoch": 4659} {"train_loss": -7.233778953552246, "global_step": 195683, "epoch": 4659} {"train_loss": -7.269758224487305, "global_step": 195684, "epoch": 4659} {"train_loss": -7.221490383148193, "global_step": 195685, "epoch": 4659} {"train_loss": -7.323695182800293, "global_step": 195686, "epoch": 4659} {"train_loss": -7.155025482177734, "global_step": 195687, "epoch": 4659} {"train_loss": -7.337589740753174, "global_step": 195688, "epoch": 4659} {"train_loss": -7.186628818511963, "global_step": 195689, "epoch": 4659} {"train_loss": -7.11277437210083, "global_step": 195690, "epoch": 4659} {"train_loss": -7.125452041625977, "global_step": 195691, "epoch": 4659} {"train_loss": -7.128904819488525, "global_step": 195692, "epoch": 4659} {"train_loss": -7.147286415100098, "global_step": 195693, "epoch": 4659} {"train_loss": -7.214040279388428, "global_step": 195694, "epoch": 4659} {"train_loss": -7.187553405761719, "global_step": 195695, "epoch": 4659} {"train_loss": -7.169460296630859, "global_step": 195696, "epoch": 4659} {"train_loss": -7.244278907775879, "global_step": 195697, "epoch": 4659} {"train_loss": -7.186490058898926, "global_step": 195698, "epoch": 4659} {"train_loss": -7.226284027099609, "global_step": 195699, "epoch": 4659} {"train_loss": -7.192130088806152, "global_step": 195700, "epoch": 4659} {"train_loss": -7.130382537841797, "global_step": 195701, "epoch": 4659} {"train_loss": -7.265419006347656, "global_step": 195702, "epoch": 4659} {"train_loss": -7.1494550704956055, "global_step": 195703, "epoch": 4659} {"train_loss": -7.150322437286377, "global_step": 195704, "epoch": 4659} {"train_loss": -7.217820167541504, "global_step": 195705, "epoch": 4659} {"train_loss": -7.093442916870117, "global_step": 195706, "epoch": 4659} {"train_loss": -7.3270134925842285, "global_step": 195707, "epoch": 4659} {"train_loss": -7.143508434295654, "global_step": 195708, "epoch": 4659} {"train_loss": -7.175401210784912, "global_step": 195709, "epoch": 4659} {"train_loss": -7.274303436279297, "global_step": 195710, "epoch": 4659} {"train_loss": -7.311953544616699, "global_step": 195711, "epoch": 4659} {"train_loss": -7.266434669494629, "global_step": 195712, "epoch": 4659} {"train_loss": -7.304268836975098, "global_step": 195713, "epoch": 4659} {"train_loss": -7.28729248046875, "global_step": 195714, "epoch": 4659} {"train_loss": -7.392402648925781, "global_step": 195715, "epoch": 4659} {"train_loss": -7.31125020980835, "global_step": 195716, "epoch": 4659} {"train_loss": -7.486775875091553, "global_step": 195717, "epoch": 4659} {"train_loss": -7.326794147491455, "global_step": 195718, "epoch": 4659} {"train_loss": -7.2257113343193415, "global_step": 195719, "epoch": 4659, "val_loss": 81257.3203125} {"train_loss": -7.32762336730957, "global_step": 195720, "epoch": 4660} {"train_loss": -7.38077449798584, "global_step": 195721, "epoch": 4660} {"train_loss": -7.340314865112305, "global_step": 195722, "epoch": 4660} {"train_loss": -7.3251800537109375, "global_step": 195723, "epoch": 4660} {"train_loss": -7.306720733642578, "global_step": 195724, "epoch": 4660} {"train_loss": -7.280041217803955, "global_step": 195725, "epoch": 4660} {"train_loss": -7.2928619384765625, "global_step": 195726, "epoch": 4660} {"train_loss": -7.180224895477295, "global_step": 195727, "epoch": 4660} {"train_loss": -7.324795722961426, "global_step": 195728, "epoch": 4660} {"train_loss": -7.315328598022461, "global_step": 195729, "epoch": 4660} {"train_loss": -7.305113792419434, "global_step": 195730, "epoch": 4660} {"train_loss": -7.231975555419922, "global_step": 195731, "epoch": 4660} {"train_loss": -7.171683311462402, "global_step": 195732, "epoch": 4660} {"train_loss": -7.157776355743408, "global_step": 195733, "epoch": 4660} {"train_loss": -7.257483005523682, "global_step": 195734, "epoch": 4660} {"train_loss": -7.294478893280029, "global_step": 195735, "epoch": 4660} {"train_loss": -7.154457092285156, "global_step": 195736, "epoch": 4660} {"train_loss": -7.244944095611572, "global_step": 195737, "epoch": 4660} {"train_loss": -7.114021301269531, "global_step": 195738, "epoch": 4660} {"train_loss": -7.189111709594727, "global_step": 195739, "epoch": 4660} {"train_loss": -7.2342400550842285, "global_step": 195740, "epoch": 4660} {"train_loss": -7.122085094451904, "global_step": 195741, "epoch": 4660} {"train_loss": -7.221189975738525, "global_step": 195742, "epoch": 4660} {"train_loss": -7.02884578704834, "global_step": 195743, "epoch": 4660} {"train_loss": -7.139458656311035, "global_step": 195744, "epoch": 4660} {"train_loss": -7.102583408355713, "global_step": 195745, "epoch": 4660} {"train_loss": -7.202765464782715, "global_step": 195746, "epoch": 4660} {"train_loss": -7.221899032592773, "global_step": 195747, "epoch": 4660} {"train_loss": -7.170934200286865, "global_step": 195748, "epoch": 4660} {"train_loss": -7.116894721984863, "global_step": 195749, "epoch": 4660} {"train_loss": -7.032085418701172, "global_step": 195750, "epoch": 4660} {"train_loss": -7.1731438636779785, "global_step": 195751, "epoch": 4660} {"train_loss": -7.149117946624756, "global_step": 195752, "epoch": 4660} {"train_loss": -7.156736373901367, "global_step": 195753, "epoch": 4660} {"train_loss": -7.232430458068848, "global_step": 195754, "epoch": 4660} {"train_loss": -7.041070938110352, "global_step": 195755, "epoch": 4660} {"train_loss": -7.198596954345703, "global_step": 195756, "epoch": 4660} {"train_loss": -7.0869293212890625, "global_step": 195757, "epoch": 4660} {"train_loss": -7.064426422119141, "global_step": 195758, "epoch": 4660} {"train_loss": -7.152475357055664, "global_step": 195759, "epoch": 4660} {"train_loss": -7.279528617858887, "global_step": 195760, "epoch": 4660} {"train_loss": -7.2029147034599665, "global_step": 195761, "epoch": 4660, "val_loss": 81366.1328125} {"train_loss": -7.220365524291992, "global_step": 195762, "epoch": 4661} {"train_loss": -7.33442497253418, "global_step": 195763, "epoch": 4661} {"train_loss": -7.244505405426025, "global_step": 195764, "epoch": 4661} {"train_loss": -7.241067409515381, "global_step": 195765, "epoch": 4661} {"train_loss": -7.275106430053711, "global_step": 195766, "epoch": 4661} {"train_loss": -7.268711566925049, "global_step": 195767, "epoch": 4661} {"train_loss": -7.288390159606934, "global_step": 195768, "epoch": 4661} {"train_loss": -7.271451473236084, "global_step": 195769, "epoch": 4661} {"train_loss": -7.297760486602783, "global_step": 195770, "epoch": 4661} {"train_loss": -7.307213306427002, "global_step": 195771, "epoch": 4661} {"train_loss": -7.256204605102539, "global_step": 195772, "epoch": 4661} {"train_loss": -7.255407810211182, "global_step": 195773, "epoch": 4661} {"train_loss": -7.288476943969727, "global_step": 195774, "epoch": 4661} {"train_loss": -7.248752593994141, "global_step": 195775, "epoch": 4661} {"train_loss": -7.380852699279785, "global_step": 195776, "epoch": 4661} {"train_loss": -7.257815361022949, "global_step": 195777, "epoch": 4661} {"train_loss": -7.276111125946045, "global_step": 195778, "epoch": 4661} {"train_loss": -7.302835464477539, "global_step": 195779, "epoch": 4661} {"train_loss": -7.267152786254883, "global_step": 195780, "epoch": 4661} {"train_loss": -7.226465225219727, "global_step": 195781, "epoch": 4661} {"train_loss": -7.296176433563232, "global_step": 195782, "epoch": 4661} {"train_loss": -7.288928031921387, "global_step": 195783, "epoch": 4661} {"train_loss": -7.311087131500244, "global_step": 195784, "epoch": 4661} {"train_loss": -7.361821174621582, "global_step": 195785, "epoch": 4661} {"train_loss": -7.332280158996582, "global_step": 195786, "epoch": 4661} {"train_loss": -7.358552932739258, "global_step": 195787, "epoch": 4661} {"train_loss": -7.31711483001709, "global_step": 195788, "epoch": 4661} {"train_loss": -7.316440105438232, "global_step": 195789, "epoch": 4661} {"train_loss": -7.310118198394775, "global_step": 195790, "epoch": 4661} {"train_loss": -7.466989517211914, "global_step": 195791, "epoch": 4661} {"train_loss": -7.354518890380859, "global_step": 195792, "epoch": 4661} {"train_loss": -7.225172996520996, "global_step": 195793, "epoch": 4661} {"train_loss": -7.362596035003662, "global_step": 195794, "epoch": 4661} {"train_loss": -7.265826225280762, "global_step": 195795, "epoch": 4661} {"train_loss": -7.216287612915039, "global_step": 195796, "epoch": 4661} {"train_loss": -7.407428741455078, "global_step": 195797, "epoch": 4661} {"train_loss": -7.3627400398254395, "global_step": 195798, "epoch": 4661} {"train_loss": -7.3458571434021, "global_step": 195799, "epoch": 4661} {"train_loss": -7.230484962463379, "global_step": 195800, "epoch": 4661} {"train_loss": -7.291343688964844, "global_step": 195801, "epoch": 4661} {"train_loss": -7.298763751983643, "global_step": 195802, "epoch": 4661} {"train_loss": -7.298036881855556, "global_step": 195803, "epoch": 4661, "val_loss": 81265.2109375} {"train_loss": -7.407837867736816, "global_step": 195804, "epoch": 4662} {"train_loss": -7.256551742553711, "global_step": 195805, "epoch": 4662} {"train_loss": -7.402743816375732, "global_step": 195806, "epoch": 4662} {"train_loss": -7.1645097732543945, "global_step": 195807, "epoch": 4662} {"train_loss": -7.2765679359436035, "global_step": 195808, "epoch": 4662} {"train_loss": -7.416537284851074, "global_step": 195809, "epoch": 4662} {"train_loss": -7.271003246307373, "global_step": 195810, "epoch": 4662} {"train_loss": -7.301202774047852, "global_step": 195811, "epoch": 4662} {"train_loss": -7.243630409240723, "global_step": 195812, "epoch": 4662} {"train_loss": -7.181982040405273, "global_step": 195813, "epoch": 4662} {"train_loss": -7.143160343170166, "global_step": 195814, "epoch": 4662} {"train_loss": -6.980251312255859, "global_step": 195815, "epoch": 4662} {"train_loss": -7.156610488891602, "global_step": 195816, "epoch": 4662} {"train_loss": -7.10045051574707, "global_step": 195817, "epoch": 4662} {"train_loss": -6.917415142059326, "global_step": 195818, "epoch": 4662} {"train_loss": -7.0391035079956055, "global_step": 195819, "epoch": 4662} {"train_loss": -7.15274715423584, "global_step": 195820, "epoch": 4662} {"train_loss": -6.968719482421875, "global_step": 195821, "epoch": 4662} {"train_loss": -7.114310264587402, "global_step": 195822, "epoch": 4662} {"train_loss": -7.0504679679870605, "global_step": 195823, "epoch": 4662} {"train_loss": -7.008289813995361, "global_step": 195824, "epoch": 4662} {"train_loss": -6.996817588806152, "global_step": 195825, "epoch": 4662} {"train_loss": -7.02244758605957, "global_step": 195826, "epoch": 4662} {"train_loss": -7.024921417236328, "global_step": 195827, "epoch": 4662} {"train_loss": -6.987009048461914, "global_step": 195828, "epoch": 4662} {"train_loss": -6.933452606201172, "global_step": 195829, "epoch": 4662} {"train_loss": -7.062360763549805, "global_step": 195830, "epoch": 4662} {"train_loss": -7.065333366394043, "global_step": 195831, "epoch": 4662} {"train_loss": -7.062270164489746, "global_step": 195832, "epoch": 4662} {"train_loss": -6.932191848754883, "global_step": 195833, "epoch": 4662} {"train_loss": -7.211879253387451, "global_step": 195834, "epoch": 4662} {"train_loss": -7.082095146179199, "global_step": 195835, "epoch": 4662} {"train_loss": -7.137206077575684, "global_step": 195836, "epoch": 4662} {"train_loss": -7.097942352294922, "global_step": 195837, "epoch": 4662} {"train_loss": -7.178471565246582, "global_step": 195838, "epoch": 4662} {"train_loss": -7.0791473388671875, "global_step": 195839, "epoch": 4662} {"train_loss": -7.12052059173584, "global_step": 195840, "epoch": 4662} {"train_loss": -7.0322418212890625, "global_step": 195841, "epoch": 4662} {"train_loss": -7.078466415405273, "global_step": 195842, "epoch": 4662} {"train_loss": -7.111908912658691, "global_step": 195843, "epoch": 4662} {"train_loss": -7.14440393447876, "global_step": 195844, "epoch": 4662} {"train_loss": -7.122208799634661, "global_step": 195845, "epoch": 4662, "val_loss": 81420.4921875} {"train_loss": -7.327179431915283, "global_step": 195846, "epoch": 4663} {"train_loss": -7.191622734069824, "global_step": 195847, "epoch": 4663} {"train_loss": -7.193940162658691, "global_step": 195848, "epoch": 4663} {"train_loss": -7.155494689941406, "global_step": 195849, "epoch": 4663} {"train_loss": -7.326563835144043, "global_step": 195850, "epoch": 4663} {"train_loss": -7.20289945602417, "global_step": 195851, "epoch": 4663} {"train_loss": -7.1633710861206055, "global_step": 195852, "epoch": 4663} {"train_loss": -7.298293113708496, "global_step": 195853, "epoch": 4663} {"train_loss": -7.233057975769043, "global_step": 195854, "epoch": 4663} {"train_loss": -7.177585601806641, "global_step": 195855, "epoch": 4663} {"train_loss": -7.19251823425293, "global_step": 195856, "epoch": 4663} {"train_loss": -7.203205108642578, "global_step": 195857, "epoch": 4663} {"train_loss": -7.273149490356445, "global_step": 195858, "epoch": 4663} {"train_loss": -7.235030174255371, "global_step": 195859, "epoch": 4663} {"train_loss": -7.282888412475586, "global_step": 195860, "epoch": 4663} {"train_loss": -7.2441229820251465, "global_step": 195861, "epoch": 4663} {"train_loss": -7.224602222442627, "global_step": 195862, "epoch": 4663} {"train_loss": -7.251494407653809, "global_step": 195863, "epoch": 4663} {"train_loss": -7.260708808898926, "global_step": 195864, "epoch": 4663} {"train_loss": -7.22785758972168, "global_step": 195865, "epoch": 4663} {"train_loss": -7.301975727081299, "global_step": 195866, "epoch": 4663} {"train_loss": -7.268943786621094, "global_step": 195867, "epoch": 4663} {"train_loss": -7.216243743896484, "global_step": 195868, "epoch": 4663} {"train_loss": -7.2184343338012695, "global_step": 195869, "epoch": 4663} {"train_loss": -7.238553524017334, "global_step": 195870, "epoch": 4663} {"train_loss": -7.304122447967529, "global_step": 195871, "epoch": 4663} {"train_loss": -7.211967468261719, "global_step": 195872, "epoch": 4663} {"train_loss": -7.275440216064453, "global_step": 195873, "epoch": 4663} {"train_loss": -7.264636993408203, "global_step": 195874, "epoch": 4663} {"train_loss": -7.227058410644531, "global_step": 195875, "epoch": 4663} {"train_loss": -7.37745475769043, "global_step": 195876, "epoch": 4663} {"train_loss": -7.31225061416626, "global_step": 195877, "epoch": 4663} {"train_loss": -7.2604193687438965, "global_step": 195878, "epoch": 4663} {"train_loss": -7.216755390167236, "global_step": 195879, "epoch": 4663} {"train_loss": -7.314687728881836, "global_step": 195880, "epoch": 4663} {"train_loss": -7.233414649963379, "global_step": 195881, "epoch": 4663} {"train_loss": -7.310423851013184, "global_step": 195882, "epoch": 4663} {"train_loss": -7.386164665222168, "global_step": 195883, "epoch": 4663} {"train_loss": -7.201703071594238, "global_step": 195884, "epoch": 4663} {"train_loss": -7.308245658874512, "global_step": 195885, "epoch": 4663} {"train_loss": -7.28525447845459, "global_step": 195886, "epoch": 4663} {"train_loss": -7.252321061633882, "global_step": 195887, "epoch": 4663, "val_loss": 81372.3203125} {"train_loss": -7.249983310699463, "global_step": 195888, "epoch": 4664} {"train_loss": -7.287949085235596, "global_step": 195889, "epoch": 4664} {"train_loss": -7.19989013671875, "global_step": 195890, "epoch": 4664} {"train_loss": -7.304361343383789, "global_step": 195891, "epoch": 4664} {"train_loss": -7.165405750274658, "global_step": 195892, "epoch": 4664} {"train_loss": -7.253558158874512, "global_step": 195893, "epoch": 4664} {"train_loss": -7.2578535079956055, "global_step": 195894, "epoch": 4664} {"train_loss": -7.219137191772461, "global_step": 195895, "epoch": 4664} {"train_loss": -7.1700239181518555, "global_step": 195896, "epoch": 4664} {"train_loss": -7.197771072387695, "global_step": 195897, "epoch": 4664} {"train_loss": -7.216014385223389, "global_step": 195898, "epoch": 4664} {"train_loss": -7.15928316116333, "global_step": 195899, "epoch": 4664} {"train_loss": -7.203037261962891, "global_step": 195900, "epoch": 4664} {"train_loss": -7.154583930969238, "global_step": 195901, "epoch": 4664} {"train_loss": -7.227842330932617, "global_step": 195902, "epoch": 4664} {"train_loss": -7.258783340454102, "global_step": 195903, "epoch": 4664} {"train_loss": -7.124451637268066, "global_step": 195904, "epoch": 4664} {"train_loss": -7.2385149002075195, "global_step": 195905, "epoch": 4664} {"train_loss": -7.224755764007568, "global_step": 195906, "epoch": 4664} {"train_loss": -7.009776592254639, "global_step": 195907, "epoch": 4664} {"train_loss": -7.211204528808594, "global_step": 195908, "epoch": 4664} {"train_loss": -7.176801681518555, "global_step": 195909, "epoch": 4664} {"train_loss": -7.199106216430664, "global_step": 195910, "epoch": 4664} {"train_loss": -7.026473522186279, "global_step": 195911, "epoch": 4664} {"train_loss": -7.155951976776123, "global_step": 195912, "epoch": 4664} {"train_loss": -7.137913227081299, "global_step": 195913, "epoch": 4664} {"train_loss": -7.24903678894043, "global_step": 195914, "epoch": 4664} {"train_loss": -7.143196105957031, "global_step": 195915, "epoch": 4664} {"train_loss": -7.341709136962891, "global_step": 195916, "epoch": 4664} {"train_loss": -7.124448776245117, "global_step": 195917, "epoch": 4664} {"train_loss": -7.166487216949463, "global_step": 195918, "epoch": 4664} {"train_loss": -7.287502765655518, "global_step": 195919, "epoch": 4664} {"train_loss": -7.174253940582275, "global_step": 195920, "epoch": 4664} {"train_loss": -7.23786735534668, "global_step": 195921, "epoch": 4664} {"train_loss": -7.228150844573975, "global_step": 195922, "epoch": 4664} {"train_loss": -7.2954912185668945, "global_step": 195923, "epoch": 4664} {"train_loss": -7.2574872970581055, "global_step": 195924, "epoch": 4664} {"train_loss": -7.283292770385742, "global_step": 195925, "epoch": 4664} {"train_loss": -7.279880523681641, "global_step": 195926, "epoch": 4664} {"train_loss": -7.219381809234619, "global_step": 195927, "epoch": 4664} {"train_loss": -7.2313995361328125, "global_step": 195928, "epoch": 4664} {"train_loss": -7.21248934382484, "global_step": 195929, "epoch": 4664, "val_loss": 81236.171875} {"train_loss": -7.309907913208008, "global_step": 195930, "epoch": 4665} {"train_loss": -7.29954719543457, "global_step": 195931, "epoch": 4665} {"train_loss": -7.345001220703125, "global_step": 195932, "epoch": 4665} {"train_loss": -7.24753999710083, "global_step": 195933, "epoch": 4665} {"train_loss": -7.282400608062744, "global_step": 195934, "epoch": 4665} {"train_loss": -7.348746299743652, "global_step": 195935, "epoch": 4665} {"train_loss": -7.164708137512207, "global_step": 195936, "epoch": 4665} {"train_loss": -7.251051902770996, "global_step": 195937, "epoch": 4665} {"train_loss": -7.373047828674316, "global_step": 195938, "epoch": 4665} {"train_loss": -7.330483436584473, "global_step": 195939, "epoch": 4665} {"train_loss": -7.332623481750488, "global_step": 195940, "epoch": 4665} {"train_loss": -7.253093242645264, "global_step": 195941, "epoch": 4665} {"train_loss": -7.340102195739746, "global_step": 195942, "epoch": 4665} {"train_loss": -7.269313812255859, "global_step": 195943, "epoch": 4665} {"train_loss": -7.271614074707031, "global_step": 195944, "epoch": 4665} {"train_loss": -7.288439750671387, "global_step": 195945, "epoch": 4665} {"train_loss": -7.296780586242676, "global_step": 195946, "epoch": 4665} {"train_loss": -7.232248306274414, "global_step": 195947, "epoch": 4665} {"train_loss": -7.166800498962402, "global_step": 195948, "epoch": 4665} {"train_loss": -7.284039497375488, "global_step": 195949, "epoch": 4665} {"train_loss": -7.256343841552734, "global_step": 195950, "epoch": 4665} {"train_loss": -7.314721584320068, "global_step": 195951, "epoch": 4665} {"train_loss": -7.349207878112793, "global_step": 195952, "epoch": 4665} {"train_loss": -7.255982875823975, "global_step": 195953, "epoch": 4665} {"train_loss": -7.407896995544434, "global_step": 195954, "epoch": 4665} {"train_loss": -7.290785789489746, "global_step": 195955, "epoch": 4665} {"train_loss": -7.270307540893555, "global_step": 195956, "epoch": 4665} {"train_loss": -7.315300941467285, "global_step": 195957, "epoch": 4665} {"train_loss": -7.193597793579102, "global_step": 195958, "epoch": 4665} {"train_loss": -7.268491744995117, "global_step": 195959, "epoch": 4665} {"train_loss": -7.315742492675781, "global_step": 195960, "epoch": 4665} {"train_loss": -7.381641387939453, "global_step": 195961, "epoch": 4665} {"train_loss": -7.314026355743408, "global_step": 195962, "epoch": 4665} {"train_loss": -7.333610534667969, "global_step": 195963, "epoch": 4665} {"train_loss": -7.378020286560059, "global_step": 195964, "epoch": 4665} {"train_loss": -7.354859352111816, "global_step": 195965, "epoch": 4665} {"train_loss": -7.3160295486450195, "global_step": 195966, "epoch": 4665} {"train_loss": -7.288687229156494, "global_step": 195967, "epoch": 4665} {"train_loss": -7.256852149963379, "global_step": 195968, "epoch": 4665} {"train_loss": -7.448074817657471, "global_step": 195969, "epoch": 4665} {"train_loss": -7.18762731552124, "global_step": 195970, "epoch": 4665} {"train_loss": -7.29749702271961, "global_step": 195971, "epoch": 4665, "val_loss": 81279.109375} {"train_loss": -7.440031051635742, "global_step": 195972, "epoch": 4666} {"train_loss": -7.33876895904541, "global_step": 195973, "epoch": 4666} {"train_loss": -7.30567741394043, "global_step": 195974, "epoch": 4666} {"train_loss": -7.2430524826049805, "global_step": 195975, "epoch": 4666} {"train_loss": -7.510565757751465, "global_step": 195976, "epoch": 4666} {"train_loss": -7.233277320861816, "global_step": 195977, "epoch": 4666} {"train_loss": -7.182069778442383, "global_step": 195978, "epoch": 4666} {"train_loss": -7.339961051940918, "global_step": 195979, "epoch": 4666} {"train_loss": -7.358491897583008, "global_step": 195980, "epoch": 4666} {"train_loss": -7.2882890701293945, "global_step": 195981, "epoch": 4666} {"train_loss": -7.174687385559082, "global_step": 195982, "epoch": 4666} {"train_loss": -7.18976354598999, "global_step": 195983, "epoch": 4666} {"train_loss": -7.041454315185547, "global_step": 195984, "epoch": 4666} {"train_loss": -7.120189189910889, "global_step": 195985, "epoch": 4666} {"train_loss": -7.254274845123291, "global_step": 195986, "epoch": 4666} {"train_loss": -7.113104820251465, "global_step": 195987, "epoch": 4666} {"train_loss": -7.129422187805176, "global_step": 195988, "epoch": 4666} {"train_loss": -6.9885454177856445, "global_step": 195989, "epoch": 4666} {"train_loss": -6.939579010009766, "global_step": 195990, "epoch": 4666} {"train_loss": -6.993769645690918, "global_step": 195991, "epoch": 4666} {"train_loss": -7.083009243011475, "global_step": 195992, "epoch": 4666} {"train_loss": -7.002060890197754, "global_step": 195993, "epoch": 4666} {"train_loss": -7.013980865478516, "global_step": 195994, "epoch": 4666} {"train_loss": -7.176653861999512, "global_step": 195995, "epoch": 4666} {"train_loss": -6.960937023162842, "global_step": 195996, "epoch": 4666} {"train_loss": -7.118233680725098, "global_step": 195997, "epoch": 4666} {"train_loss": -7.064994812011719, "global_step": 195998, "epoch": 4666} {"train_loss": -7.066073417663574, "global_step": 195999, "epoch": 4666} {"train_loss": -7.125794887542725, "global_step": 196000, "epoch": 4666} {"train_loss": -6.979674339294434, "global_step": 196001, "epoch": 4666} {"train_loss": -7.114431858062744, "global_step": 196002, "epoch": 4666} {"train_loss": -7.005919456481934, "global_step": 196003, "epoch": 4666} {"train_loss": -7.140024662017822, "global_step": 196004, "epoch": 4666} {"train_loss": -7.053153991699219, "global_step": 196005, "epoch": 4666} {"train_loss": -6.934588432312012, "global_step": 196006, "epoch": 4666} {"train_loss": -7.16288948059082, "global_step": 196007, "epoch": 4666} {"train_loss": -7.113361358642578, "global_step": 196008, "epoch": 4666} {"train_loss": -7.021600246429443, "global_step": 196009, "epoch": 4666} {"train_loss": -7.197755813598633, "global_step": 196010, "epoch": 4666} {"train_loss": -7.13957405090332, "global_step": 196011, "epoch": 4666} {"train_loss": -7.138032913208008, "global_step": 196012, "epoch": 4666} {"train_loss": -7.140099377859206, "global_step": 196013, "epoch": 4666, "val_loss": 81663.6015625} {"train_loss": -7.129539489746094, "global_step": 196014, "epoch": 4667} {"train_loss": -7.146562576293945, "global_step": 196015, "epoch": 4667} {"train_loss": -7.179663181304932, "global_step": 196016, "epoch": 4667} {"train_loss": -7.119584083557129, "global_step": 196017, "epoch": 4667} {"train_loss": -7.268272399902344, "global_step": 196018, "epoch": 4667} {"train_loss": -7.152353286743164, "global_step": 196019, "epoch": 4667} {"train_loss": -7.216374397277832, "global_step": 196020, "epoch": 4667} {"train_loss": -7.267524242401123, "global_step": 196021, "epoch": 4667} {"train_loss": -7.217155456542969, "global_step": 196022, "epoch": 4667} {"train_loss": -7.167043209075928, "global_step": 196023, "epoch": 4667} {"train_loss": -7.202847957611084, "global_step": 196024, "epoch": 4667} {"train_loss": -7.333325386047363, "global_step": 196025, "epoch": 4667} {"train_loss": -7.30793571472168, "global_step": 196026, "epoch": 4667} {"train_loss": -7.2505998611450195, "global_step": 196027, "epoch": 4667} {"train_loss": -7.31637716293335, "global_step": 196028, "epoch": 4667} {"train_loss": -7.224222183227539, "global_step": 196029, "epoch": 4667} {"train_loss": -7.2909393310546875, "global_step": 196030, "epoch": 4667} {"train_loss": -7.167577743530273, "global_step": 196031, "epoch": 4667} {"train_loss": -7.16309928894043, "global_step": 196032, "epoch": 4667} {"train_loss": -7.232810974121094, "global_step": 196033, "epoch": 4667} {"train_loss": -7.2076215744018555, "global_step": 196034, "epoch": 4667} {"train_loss": -7.225949287414551, "global_step": 196035, "epoch": 4667} {"train_loss": -7.167751312255859, "global_step": 196036, "epoch": 4667} {"train_loss": -7.32305908203125, "global_step": 196037, "epoch": 4667} {"train_loss": -7.250185966491699, "global_step": 196038, "epoch": 4667} {"train_loss": -7.287769317626953, "global_step": 196039, "epoch": 4667} {"train_loss": -7.224899768829346, "global_step": 196040, "epoch": 4667} {"train_loss": -7.206681251525879, "global_step": 196041, "epoch": 4667} {"train_loss": -7.301482200622559, "global_step": 196042, "epoch": 4667} {"train_loss": -7.209873676300049, "global_step": 196043, "epoch": 4667} {"train_loss": -7.219757080078125, "global_step": 196044, "epoch": 4667} {"train_loss": -7.2030930519104, "global_step": 196045, "epoch": 4667} {"train_loss": -7.3590288162231445, "global_step": 196046, "epoch": 4667} {"train_loss": -7.148392200469971, "global_step": 196047, "epoch": 4667} {"train_loss": -7.2073869705200195, "global_step": 196048, "epoch": 4667} {"train_loss": -7.241511344909668, "global_step": 196049, "epoch": 4667} {"train_loss": -7.077108383178711, "global_step": 196050, "epoch": 4667} {"train_loss": -7.234577178955078, "global_step": 196051, "epoch": 4667} {"train_loss": -7.226393699645996, "global_step": 196052, "epoch": 4667} {"train_loss": -7.219122409820557, "global_step": 196053, "epoch": 4667} {"train_loss": -7.291096210479736, "global_step": 196054, "epoch": 4667} {"train_loss": -7.2214349792117165, "global_step": 196055, "epoch": 4667, "val_loss": 81534.6640625} {"train_loss": -7.204177379608154, "global_step": 196056, "epoch": 4668} {"train_loss": -7.3041510581970215, "global_step": 196057, "epoch": 4668} {"train_loss": -7.163256645202637, "global_step": 196058, "epoch": 4668} {"train_loss": -7.2488579750061035, "global_step": 196059, "epoch": 4668} {"train_loss": -7.1815266609191895, "global_step": 196060, "epoch": 4668} {"train_loss": -7.289529800415039, "global_step": 196061, "epoch": 4668} {"train_loss": -7.191315174102783, "global_step": 196062, "epoch": 4668} {"train_loss": -7.151646614074707, "global_step": 196063, "epoch": 4668} {"train_loss": -7.3005571365356445, "global_step": 196064, "epoch": 4668} {"train_loss": -7.211706638336182, "global_step": 196065, "epoch": 4668} {"train_loss": -7.1904401779174805, "global_step": 196066, "epoch": 4668} {"train_loss": -7.2427778244018555, "global_step": 196067, "epoch": 4668} {"train_loss": -7.306074142456055, "global_step": 196068, "epoch": 4668} {"train_loss": -7.175537109375, "global_step": 196069, "epoch": 4668} {"train_loss": -7.080077171325684, "global_step": 196070, "epoch": 4668} {"train_loss": -7.267423152923584, "global_step": 196071, "epoch": 4668} {"train_loss": -7.314088821411133, "global_step": 196072, "epoch": 4668} {"train_loss": -7.232125282287598, "global_step": 196073, "epoch": 4668} {"train_loss": -7.303974151611328, "global_step": 196074, "epoch": 4668} {"train_loss": -7.2815704345703125, "global_step": 196075, "epoch": 4668} {"train_loss": -7.313891887664795, "global_step": 196076, "epoch": 4668} {"train_loss": -7.252931594848633, "global_step": 196077, "epoch": 4668} {"train_loss": -7.22325325012207, "global_step": 196078, "epoch": 4668} {"train_loss": -7.131632328033447, "global_step": 196079, "epoch": 4668} {"train_loss": -7.315573692321777, "global_step": 196080, "epoch": 4668} {"train_loss": -7.129039764404297, "global_step": 196081, "epoch": 4668} {"train_loss": -7.338278770446777, "global_step": 196082, "epoch": 4668} {"train_loss": -7.240248203277588, "global_step": 196083, "epoch": 4668} {"train_loss": -7.281844139099121, "global_step": 196084, "epoch": 4668} {"train_loss": -7.2288818359375, "global_step": 196085, "epoch": 4668} {"train_loss": -7.039900302886963, "global_step": 196086, "epoch": 4668} {"train_loss": -7.307365417480469, "global_step": 196087, "epoch": 4668} {"train_loss": -7.300697326660156, "global_step": 196088, "epoch": 4668} {"train_loss": -7.240251541137695, "global_step": 196089, "epoch": 4668} {"train_loss": -7.2606401443481445, "global_step": 196090, "epoch": 4668} {"train_loss": -7.181576728820801, "global_step": 196091, "epoch": 4668} {"train_loss": -7.182619571685791, "global_step": 196092, "epoch": 4668} {"train_loss": -7.208968162536621, "global_step": 196093, "epoch": 4668} {"train_loss": -7.190284729003906, "global_step": 196094, "epoch": 4668} {"train_loss": -7.2499494552612305, "global_step": 196095, "epoch": 4668} {"train_loss": -7.195038318634033, "global_step": 196096, "epoch": 4668} {"train_loss": -7.23007625625247, "global_step": 196097, "epoch": 4668, "val_loss": 81267.7890625} {"train_loss": -7.187310695648193, "global_step": 196098, "epoch": 4669} {"train_loss": -7.120682716369629, "global_step": 196099, "epoch": 4669} {"train_loss": -7.327153205871582, "global_step": 196100, "epoch": 4669} {"train_loss": -7.2055206298828125, "global_step": 196101, "epoch": 4669} {"train_loss": -7.070374965667725, "global_step": 196102, "epoch": 4669} {"train_loss": -7.131772041320801, "global_step": 196103, "epoch": 4669} {"train_loss": -7.194705963134766, "global_step": 196104, "epoch": 4669} {"train_loss": -7.260133743286133, "global_step": 196105, "epoch": 4669} {"train_loss": -7.185348987579346, "global_step": 196106, "epoch": 4669} {"train_loss": -7.282853126525879, "global_step": 196107, "epoch": 4669} {"train_loss": -7.361328125, "global_step": 196108, "epoch": 4669} {"train_loss": -7.126626968383789, "global_step": 196109, "epoch": 4669} {"train_loss": -7.309825420379639, "global_step": 196110, "epoch": 4669} {"train_loss": -7.339717388153076, "global_step": 196111, "epoch": 4669} {"train_loss": -7.344083309173584, "global_step": 196112, "epoch": 4669} {"train_loss": -7.219358444213867, "global_step": 196113, "epoch": 4669} {"train_loss": -7.276726722717285, "global_step": 196114, "epoch": 4669} {"train_loss": -7.37060546875, "global_step": 196115, "epoch": 4669} {"train_loss": -7.292633533477783, "global_step": 196116, "epoch": 4669} {"train_loss": -7.285061836242676, "global_step": 196117, "epoch": 4669} {"train_loss": -7.339221000671387, "global_step": 196118, "epoch": 4669} {"train_loss": -7.386655807495117, "global_step": 196119, "epoch": 4669} {"train_loss": -7.355465888977051, "global_step": 196120, "epoch": 4669} {"train_loss": -7.302281379699707, "global_step": 196121, "epoch": 4669} {"train_loss": -7.236877918243408, "global_step": 196122, "epoch": 4669} {"train_loss": -7.319897651672363, "global_step": 196123, "epoch": 4669} {"train_loss": -7.343029022216797, "global_step": 196124, "epoch": 4669} {"train_loss": -7.3521809577941895, "global_step": 196125, "epoch": 4669} {"train_loss": -7.2908735275268555, "global_step": 196126, "epoch": 4669} {"train_loss": -7.317663192749023, "global_step": 196127, "epoch": 4669} {"train_loss": -7.265927791595459, "global_step": 196128, "epoch": 4669} {"train_loss": -7.401362895965576, "global_step": 196129, "epoch": 4669} {"train_loss": -7.359423637390137, "global_step": 196130, "epoch": 4669} {"train_loss": -7.310384750366211, "global_step": 196131, "epoch": 4669} {"train_loss": -7.271552085876465, "global_step": 196132, "epoch": 4669} {"train_loss": -7.405541896820068, "global_step": 196133, "epoch": 4669} {"train_loss": -7.273524761199951, "global_step": 196134, "epoch": 4669} {"train_loss": -7.301968574523926, "global_step": 196135, "epoch": 4669} {"train_loss": -7.3575592041015625, "global_step": 196136, "epoch": 4669} {"train_loss": -7.348471164703369, "global_step": 196137, "epoch": 4669} {"train_loss": -7.414283752441406, "global_step": 196138, "epoch": 4669} {"train_loss": -7.289961848940168, "global_step": 196139, "epoch": 4669, "val_loss": 81174.015625} {"train_loss": -7.419475555419922, "global_step": 196140, "epoch": 4670} {"train_loss": -7.391962051391602, "global_step": 196141, "epoch": 4670} {"train_loss": -7.306271553039551, "global_step": 196142, "epoch": 4670} {"train_loss": -7.2994704246521, "global_step": 196143, "epoch": 4670} {"train_loss": -7.25049352645874, "global_step": 196144, "epoch": 4670} {"train_loss": -7.362085819244385, "global_step": 196145, "epoch": 4670} {"train_loss": -7.300771713256836, "global_step": 196146, "epoch": 4670} {"train_loss": -7.3670806884765625, "global_step": 196147, "epoch": 4670} {"train_loss": -7.219752788543701, "global_step": 196148, "epoch": 4670} {"train_loss": -7.25506591796875, "global_step": 196149, "epoch": 4670} {"train_loss": -7.223082065582275, "global_step": 196150, "epoch": 4670} {"train_loss": -7.150091171264648, "global_step": 196151, "epoch": 4670} {"train_loss": -7.1680402755737305, "global_step": 196152, "epoch": 4670} {"train_loss": -7.277222633361816, "global_step": 196153, "epoch": 4670} {"train_loss": -6.993526458740234, "global_step": 196154, "epoch": 4670} {"train_loss": -7.1529107093811035, "global_step": 196155, "epoch": 4670} {"train_loss": -7.194526672363281, "global_step": 196156, "epoch": 4670} {"train_loss": -7.01303768157959, "global_step": 196157, "epoch": 4670} {"train_loss": -7.331046104431152, "global_step": 196158, "epoch": 4670} {"train_loss": -7.171470642089844, "global_step": 196159, "epoch": 4670} {"train_loss": -7.137932777404785, "global_step": 196160, "epoch": 4670} {"train_loss": -7.225951194763184, "global_step": 196161, "epoch": 4670} {"train_loss": -7.044977188110352, "global_step": 196162, "epoch": 4670} {"train_loss": -7.211447715759277, "global_step": 196163, "epoch": 4670} {"train_loss": -7.222746849060059, "global_step": 196164, "epoch": 4670} {"train_loss": -7.222665786743164, "global_step": 196165, "epoch": 4670} {"train_loss": -7.227714538574219, "global_step": 196166, "epoch": 4670} {"train_loss": -7.183070659637451, "global_step": 196167, "epoch": 4670} {"train_loss": -7.278248310089111, "global_step": 196168, "epoch": 4670} {"train_loss": -7.256260871887207, "global_step": 196169, "epoch": 4670} {"train_loss": -7.317526817321777, "global_step": 196170, "epoch": 4670} {"train_loss": -7.224649429321289, "global_step": 196171, "epoch": 4670} {"train_loss": -7.34517765045166, "global_step": 196172, "epoch": 4670} {"train_loss": -7.2391676902771, "global_step": 196173, "epoch": 4670} {"train_loss": -7.341708183288574, "global_step": 196174, "epoch": 4670} {"train_loss": -7.280239105224609, "global_step": 196175, "epoch": 4670} {"train_loss": -7.1355085372924805, "global_step": 196176, "epoch": 4670} {"train_loss": -7.348174095153809, "global_step": 196177, "epoch": 4670} {"train_loss": -7.206189155578613, "global_step": 196178, "epoch": 4670} {"train_loss": -7.316227436065674, "global_step": 196179, "epoch": 4670} {"train_loss": -7.197386264801025, "global_step": 196180, "epoch": 4670} {"train_loss": -7.242041360764277, "global_step": 196181, "epoch": 4670, "val_loss": 81359.2890625} {"train_loss": -7.240077018737793, "global_step": 196182, "epoch": 4671} {"train_loss": -7.268440246582031, "global_step": 196183, "epoch": 4671} {"train_loss": -7.221783638000488, "global_step": 196184, "epoch": 4671} {"train_loss": -7.126276969909668, "global_step": 196185, "epoch": 4671} {"train_loss": -7.19743537902832, "global_step": 196186, "epoch": 4671} {"train_loss": -7.175542831420898, "global_step": 196187, "epoch": 4671} {"train_loss": -7.095746994018555, "global_step": 196188, "epoch": 4671} {"train_loss": -7.33486270904541, "global_step": 196189, "epoch": 4671} {"train_loss": -7.020377159118652, "global_step": 196190, "epoch": 4671} {"train_loss": -7.1197404861450195, "global_step": 196191, "epoch": 4671} {"train_loss": -7.330774307250977, "global_step": 196192, "epoch": 4671} {"train_loss": -7.326146125793457, "global_step": 196193, "epoch": 4671} {"train_loss": -7.322649955749512, "global_step": 196194, "epoch": 4671} {"train_loss": -7.207049369812012, "global_step": 196195, "epoch": 4671} {"train_loss": -7.1645731925964355, "global_step": 196196, "epoch": 4671} {"train_loss": -7.277090072631836, "global_step": 196197, "epoch": 4671} {"train_loss": -7.241185188293457, "global_step": 196198, "epoch": 4671} {"train_loss": -7.357527732849121, "global_step": 196199, "epoch": 4671} {"train_loss": -7.32692813873291, "global_step": 196200, "epoch": 4671} {"train_loss": -7.3494157791137695, "global_step": 196201, "epoch": 4671} {"train_loss": -7.30598258972168, "global_step": 196202, "epoch": 4671} {"train_loss": -7.398415565490723, "global_step": 196203, "epoch": 4671} {"train_loss": -7.350711345672607, "global_step": 196204, "epoch": 4671} {"train_loss": -7.419316291809082, "global_step": 196205, "epoch": 4671} {"train_loss": -7.312565803527832, "global_step": 196206, "epoch": 4671} {"train_loss": -7.288390636444092, "global_step": 196207, "epoch": 4671} {"train_loss": -7.296358108520508, "global_step": 196208, "epoch": 4671} {"train_loss": -7.339670658111572, "global_step": 196209, "epoch": 4671} {"train_loss": -7.305225849151611, "global_step": 196210, "epoch": 4671} {"train_loss": -7.280307769775391, "global_step": 196211, "epoch": 4671} {"train_loss": -7.277474880218506, "global_step": 196212, "epoch": 4671} {"train_loss": -7.231473922729492, "global_step": 196213, "epoch": 4671} {"train_loss": -7.324429988861084, "global_step": 196214, "epoch": 4671} {"train_loss": -7.350952625274658, "global_step": 196215, "epoch": 4671} {"train_loss": -7.427790641784668, "global_step": 196216, "epoch": 4671} {"train_loss": -7.3772783279418945, "global_step": 196217, "epoch": 4671} {"train_loss": -7.386264324188232, "global_step": 196218, "epoch": 4671} {"train_loss": -7.321091175079346, "global_step": 196219, "epoch": 4671} {"train_loss": -7.383993148803711, "global_step": 196220, "epoch": 4671} {"train_loss": -7.3511643409729, "global_step": 196221, "epoch": 4671} {"train_loss": -7.4027204513549805, "global_step": 196222, "epoch": 4671} {"train_loss": -7.287420499892462, "global_step": 196223, "epoch": 4671, "val_loss": 81179.71875} {"train_loss": -7.224731922149658, "global_step": 196224, "epoch": 4672} {"train_loss": -7.117511749267578, "global_step": 196225, "epoch": 4672} {"train_loss": -7.33637809753418, "global_step": 196226, "epoch": 4672} {"train_loss": -7.236301422119141, "global_step": 196227, "epoch": 4672} {"train_loss": -7.320029258728027, "global_step": 196228, "epoch": 4672} {"train_loss": -7.198777198791504, "global_step": 196229, "epoch": 4672} {"train_loss": -7.152786731719971, "global_step": 196230, "epoch": 4672} {"train_loss": -7.126729488372803, "global_step": 196231, "epoch": 4672} {"train_loss": -7.331000328063965, "global_step": 196232, "epoch": 4672} {"train_loss": -7.26651668548584, "global_step": 196233, "epoch": 4672} {"train_loss": -7.219046592712402, "global_step": 196234, "epoch": 4672} {"train_loss": -7.367071628570557, "global_step": 196235, "epoch": 4672} {"train_loss": -7.238650798797607, "global_step": 196236, "epoch": 4672} {"train_loss": -7.2464447021484375, "global_step": 196237, "epoch": 4672} {"train_loss": -7.303659439086914, "global_step": 196238, "epoch": 4672} {"train_loss": -7.310364723205566, "global_step": 196239, "epoch": 4672} {"train_loss": -7.335213661193848, "global_step": 196240, "epoch": 4672} {"train_loss": -7.31080436706543, "global_step": 196241, "epoch": 4672} {"train_loss": -7.314518928527832, "global_step": 196242, "epoch": 4672} {"train_loss": -7.283344268798828, "global_step": 196243, "epoch": 4672} {"train_loss": -7.210351943969727, "global_step": 196244, "epoch": 4672} {"train_loss": -7.247680187225342, "global_step": 196245, "epoch": 4672} {"train_loss": -7.268637657165527, "global_step": 196246, "epoch": 4672} {"train_loss": -7.230788230895996, "global_step": 196247, "epoch": 4672} {"train_loss": -7.2626118659973145, "global_step": 196248, "epoch": 4672} {"train_loss": -7.19409704208374, "global_step": 196249, "epoch": 4672} {"train_loss": -7.166869163513184, "global_step": 196250, "epoch": 4672} {"train_loss": -7.3251953125, "global_step": 196251, "epoch": 4672} {"train_loss": -7.201385021209717, "global_step": 196252, "epoch": 4672} {"train_loss": -7.246262550354004, "global_step": 196253, "epoch": 4672} {"train_loss": -7.263811111450195, "global_step": 196254, "epoch": 4672} {"train_loss": -7.21147346496582, "global_step": 196255, "epoch": 4672} {"train_loss": -7.192383766174316, "global_step": 196256, "epoch": 4672} {"train_loss": -7.191015243530273, "global_step": 196257, "epoch": 4672} {"train_loss": -7.2890472412109375, "global_step": 196258, "epoch": 4672} {"train_loss": -7.258125305175781, "global_step": 196259, "epoch": 4672} {"train_loss": -7.219634056091309, "global_step": 196260, "epoch": 4672} {"train_loss": -7.268046855926514, "global_step": 196261, "epoch": 4672} {"train_loss": -7.226926326751709, "global_step": 196262, "epoch": 4672} {"train_loss": -7.198779106140137, "global_step": 196263, "epoch": 4672} {"train_loss": -7.245570182800293, "global_step": 196264, "epoch": 4672} {"train_loss": -7.2484321026575, "global_step": 196265, "epoch": 4672, "val_loss": 81129.9921875} {"train_loss": -7.2727274894714355, "global_step": 196266, "epoch": 4673} {"train_loss": -7.299821853637695, "global_step": 196267, "epoch": 4673} {"train_loss": -7.290724754333496, "global_step": 196268, "epoch": 4673} {"train_loss": -7.252789497375488, "global_step": 196269, "epoch": 4673} {"train_loss": -7.268570899963379, "global_step": 196270, "epoch": 4673} {"train_loss": -7.109635829925537, "global_step": 196271, "epoch": 4673} {"train_loss": -7.256623268127441, "global_step": 196272, "epoch": 4673} {"train_loss": -7.350278377532959, "global_step": 196273, "epoch": 4673} {"train_loss": -7.146424293518066, "global_step": 196274, "epoch": 4673} {"train_loss": -7.312628269195557, "global_step": 196275, "epoch": 4673} {"train_loss": -7.293882369995117, "global_step": 196276, "epoch": 4673} {"train_loss": -7.215104103088379, "global_step": 196277, "epoch": 4673} {"train_loss": -7.26767635345459, "global_step": 196278, "epoch": 4673} {"train_loss": -7.378687858581543, "global_step": 196279, "epoch": 4673} {"train_loss": -7.30640172958374, "global_step": 196280, "epoch": 4673} {"train_loss": -7.277453422546387, "global_step": 196281, "epoch": 4673} {"train_loss": -7.373706817626953, "global_step": 196282, "epoch": 4673} {"train_loss": -7.343612194061279, "global_step": 196283, "epoch": 4673} {"train_loss": -7.239548683166504, "global_step": 196284, "epoch": 4673} {"train_loss": -7.349166393280029, "global_step": 196285, "epoch": 4673} {"train_loss": -7.203459739685059, "global_step": 196286, "epoch": 4673} {"train_loss": -7.203168869018555, "global_step": 196287, "epoch": 4673} {"train_loss": -7.339325904846191, "global_step": 196288, "epoch": 4673} {"train_loss": -7.307199478149414, "global_step": 196289, "epoch": 4673} {"train_loss": -7.264348983764648, "global_step": 196290, "epoch": 4673} {"train_loss": -7.165733814239502, "global_step": 196291, "epoch": 4673} {"train_loss": -7.410400390625, "global_step": 196292, "epoch": 4673} {"train_loss": -7.163389682769775, "global_step": 196293, "epoch": 4673} {"train_loss": -7.116130828857422, "global_step": 196294, "epoch": 4673} {"train_loss": -7.2478861808776855, "global_step": 196295, "epoch": 4673} {"train_loss": -7.238089561462402, "global_step": 196296, "epoch": 4673} {"train_loss": -7.238251209259033, "global_step": 196297, "epoch": 4673} {"train_loss": -7.231212615966797, "global_step": 196298, "epoch": 4673} {"train_loss": -7.2499566078186035, "global_step": 196299, "epoch": 4673} {"train_loss": -7.2431135177612305, "global_step": 196300, "epoch": 4673} {"train_loss": -7.095129013061523, "global_step": 196301, "epoch": 4673} {"train_loss": -7.230537414550781, "global_step": 196302, "epoch": 4673} {"train_loss": -7.338962078094482, "global_step": 196303, "epoch": 4673} {"train_loss": -7.1495161056518555, "global_step": 196304, "epoch": 4673} {"train_loss": -7.214946746826172, "global_step": 196305, "epoch": 4673} {"train_loss": -7.301860809326172, "global_step": 196306, "epoch": 4673} {"train_loss": -7.2570050330389115, "global_step": 196307, "epoch": 4673, "val_loss": 81033.015625} {"train_loss": -7.157857418060303, "global_step": 196308, "epoch": 4674} {"train_loss": -7.314247131347656, "global_step": 196309, "epoch": 4674} {"train_loss": -7.1697306632995605, "global_step": 196310, "epoch": 4674} {"train_loss": -7.419629096984863, "global_step": 196311, "epoch": 4674} {"train_loss": -7.255596160888672, "global_step": 196312, "epoch": 4674} {"train_loss": -7.181447505950928, "global_step": 196313, "epoch": 4674} {"train_loss": -7.0643391609191895, "global_step": 196314, "epoch": 4674} {"train_loss": -7.151610374450684, "global_step": 196315, "epoch": 4674} {"train_loss": -7.292098045349121, "global_step": 196316, "epoch": 4674} {"train_loss": -7.205948829650879, "global_step": 196317, "epoch": 4674} {"train_loss": -7.1601457595825195, "global_step": 196318, "epoch": 4674} {"train_loss": -7.31166410446167, "global_step": 196319, "epoch": 4674} {"train_loss": -7.292902946472168, "global_step": 196320, "epoch": 4674} {"train_loss": -7.333288192749023, "global_step": 196321, "epoch": 4674} {"train_loss": -7.215747833251953, "global_step": 196322, "epoch": 4674} {"train_loss": -7.327261924743652, "global_step": 196323, "epoch": 4674} {"train_loss": -7.267088890075684, "global_step": 196324, "epoch": 4674} {"train_loss": -7.2466325759887695, "global_step": 196325, "epoch": 4674} {"train_loss": -7.115242958068848, "global_step": 196326, "epoch": 4674} {"train_loss": -7.384661674499512, "global_step": 196327, "epoch": 4674} {"train_loss": -7.244447708129883, "global_step": 196328, "epoch": 4674} {"train_loss": -7.29971981048584, "global_step": 196329, "epoch": 4674} {"train_loss": -7.387074947357178, "global_step": 196330, "epoch": 4674} {"train_loss": -7.3728766441345215, "global_step": 196331, "epoch": 4674} {"train_loss": -7.363238334655762, "global_step": 196332, "epoch": 4674} {"train_loss": -7.211103439331055, "global_step": 196333, "epoch": 4674} {"train_loss": -7.332716941833496, "global_step": 196334, "epoch": 4674} {"train_loss": -7.341352462768555, "global_step": 196335, "epoch": 4674} {"train_loss": -7.380411148071289, "global_step": 196336, "epoch": 4674} {"train_loss": -7.273780345916748, "global_step": 196337, "epoch": 4674} {"train_loss": -7.368433952331543, "global_step": 196338, "epoch": 4674} {"train_loss": -7.391814231872559, "global_step": 196339, "epoch": 4674} {"train_loss": -7.25953483581543, "global_step": 196340, "epoch": 4674} {"train_loss": -7.349142074584961, "global_step": 196341, "epoch": 4674} {"train_loss": -7.317150592803955, "global_step": 196342, "epoch": 4674} {"train_loss": -7.305695533752441, "global_step": 196343, "epoch": 4674} {"train_loss": -7.374810695648193, "global_step": 196344, "epoch": 4674} {"train_loss": -7.27069091796875, "global_step": 196345, "epoch": 4674} {"train_loss": -7.377746105194092, "global_step": 196346, "epoch": 4674} {"train_loss": -7.319085121154785, "global_step": 196347, "epoch": 4674} {"train_loss": -7.199243545532227, "global_step": 196348, "epoch": 4674} {"train_loss": -7.282680454708281, "global_step": 196349, "epoch": 4674, "val_loss": 81357.5546875} {"train_loss": -7.3518171310424805, "global_step": 196350, "epoch": 4675} {"train_loss": -7.196016788482666, "global_step": 196351, "epoch": 4675} {"train_loss": -7.243292808532715, "global_step": 196352, "epoch": 4675} {"train_loss": -7.272198677062988, "global_step": 196353, "epoch": 4675} {"train_loss": -7.271258354187012, "global_step": 196354, "epoch": 4675} {"train_loss": -7.391536712646484, "global_step": 196355, "epoch": 4675} {"train_loss": -7.280557632446289, "global_step": 196356, "epoch": 4675} {"train_loss": -7.2039995193481445, "global_step": 196357, "epoch": 4675} {"train_loss": -7.397943496704102, "global_step": 196358, "epoch": 4675} {"train_loss": -7.186161041259766, "global_step": 196359, "epoch": 4675} {"train_loss": -7.322044372558594, "global_step": 196360, "epoch": 4675} {"train_loss": -7.2615766525268555, "global_step": 196361, "epoch": 4675} {"train_loss": -7.27406644821167, "global_step": 196362, "epoch": 4675} {"train_loss": -7.30802059173584, "global_step": 196363, "epoch": 4675} {"train_loss": -7.317813873291016, "global_step": 196364, "epoch": 4675} {"train_loss": -7.336681365966797, "global_step": 196365, "epoch": 4675} {"train_loss": -7.364077568054199, "global_step": 196366, "epoch": 4675} {"train_loss": -7.361854076385498, "global_step": 196367, "epoch": 4675} {"train_loss": -7.220694541931152, "global_step": 196368, "epoch": 4675} {"train_loss": -7.172818660736084, "global_step": 196369, "epoch": 4675} {"train_loss": -7.149396896362305, "global_step": 196370, "epoch": 4675} {"train_loss": -7.227776527404785, "global_step": 196371, "epoch": 4675} {"train_loss": -7.3108930587768555, "global_step": 196372, "epoch": 4675} {"train_loss": -7.2057929039001465, "global_step": 196373, "epoch": 4675} {"train_loss": -7.134757041931152, "global_step": 196374, "epoch": 4675} {"train_loss": -7.2942376136779785, "global_step": 196375, "epoch": 4675} {"train_loss": -7.2277398109436035, "global_step": 196376, "epoch": 4675} {"train_loss": -7.152492523193359, "global_step": 196377, "epoch": 4675} {"train_loss": -7.315523147583008, "global_step": 196378, "epoch": 4675} {"train_loss": -7.269183158874512, "global_step": 196379, "epoch": 4675} {"train_loss": -7.198624134063721, "global_step": 196380, "epoch": 4675} {"train_loss": -7.13167667388916, "global_step": 196381, "epoch": 4675} {"train_loss": -7.242611885070801, "global_step": 196382, "epoch": 4675} {"train_loss": -7.128225326538086, "global_step": 196383, "epoch": 4675} {"train_loss": -7.3498759269714355, "global_step": 196384, "epoch": 4675} {"train_loss": -7.214935779571533, "global_step": 196385, "epoch": 4675} {"train_loss": -7.139856338500977, "global_step": 196386, "epoch": 4675} {"train_loss": -7.2743330001831055, "global_step": 196387, "epoch": 4675} {"train_loss": -7.087963581085205, "global_step": 196388, "epoch": 4675} {"train_loss": -7.250540256500244, "global_step": 196389, "epoch": 4675} {"train_loss": -7.238209247589111, "global_step": 196390, "epoch": 4675} {"train_loss": -7.250930229822795, "global_step": 196391, "epoch": 4675, "val_loss": 81292.6484375} {"train_loss": -7.334819316864014, "global_step": 196392, "epoch": 4676} {"train_loss": -7.185643196105957, "global_step": 196393, "epoch": 4676} {"train_loss": -7.276846885681152, "global_step": 196394, "epoch": 4676} {"train_loss": -7.202821254730225, "global_step": 196395, "epoch": 4676} {"train_loss": -7.1969099044799805, "global_step": 196396, "epoch": 4676} {"train_loss": -7.286497592926025, "global_step": 196397, "epoch": 4676} {"train_loss": -7.265200138092041, "global_step": 196398, "epoch": 4676} {"train_loss": -7.3534088134765625, "global_step": 196399, "epoch": 4676} {"train_loss": -7.268791198730469, "global_step": 196400, "epoch": 4676} {"train_loss": -7.281172752380371, "global_step": 196401, "epoch": 4676} {"train_loss": -7.260046005249023, "global_step": 196402, "epoch": 4676} {"train_loss": -7.2379560470581055, "global_step": 196403, "epoch": 4676} {"train_loss": -7.151288032531738, "global_step": 196404, "epoch": 4676} {"train_loss": -7.257025718688965, "global_step": 196405, "epoch": 4676} {"train_loss": -7.368946075439453, "global_step": 196406, "epoch": 4676} {"train_loss": -7.312288284301758, "global_step": 196407, "epoch": 4676} {"train_loss": -7.3305158615112305, "global_step": 196408, "epoch": 4676} {"train_loss": -7.346321105957031, "global_step": 196409, "epoch": 4676} {"train_loss": -7.200078010559082, "global_step": 196410, "epoch": 4676} {"train_loss": -7.235169410705566, "global_step": 196411, "epoch": 4676} {"train_loss": -7.209003448486328, "global_step": 196412, "epoch": 4676} {"train_loss": -7.381630897521973, "global_step": 196413, "epoch": 4676} {"train_loss": -7.193521499633789, "global_step": 196414, "epoch": 4676} {"train_loss": -7.306557655334473, "global_step": 196415, "epoch": 4676} {"train_loss": -7.189652442932129, "global_step": 196416, "epoch": 4676} {"train_loss": -7.14623498916626, "global_step": 196417, "epoch": 4676} {"train_loss": -7.258717060089111, "global_step": 196418, "epoch": 4676} {"train_loss": -7.168970108032227, "global_step": 196419, "epoch": 4676} {"train_loss": -7.15565299987793, "global_step": 196420, "epoch": 4676} {"train_loss": -7.24340295791626, "global_step": 196421, "epoch": 4676} {"train_loss": -7.211752891540527, "global_step": 196422, "epoch": 4676} {"train_loss": -7.203227996826172, "global_step": 196423, "epoch": 4676} {"train_loss": -7.304191589355469, "global_step": 196424, "epoch": 4676} {"train_loss": -7.392326831817627, "global_step": 196425, "epoch": 4676} {"train_loss": -7.168430328369141, "global_step": 196426, "epoch": 4676} {"train_loss": -7.2071638107299805, "global_step": 196427, "epoch": 4676} {"train_loss": -7.28564453125, "global_step": 196428, "epoch": 4676} {"train_loss": -7.080416679382324, "global_step": 196429, "epoch": 4676} {"train_loss": -7.2223029136657715, "global_step": 196430, "epoch": 4676} {"train_loss": -7.18864631652832, "global_step": 196431, "epoch": 4676} {"train_loss": -7.1906561851501465, "global_step": 196432, "epoch": 4676} {"train_loss": -7.244488261994862, "global_step": 196433, "epoch": 4676, "val_loss": 81101.8515625} {"train_loss": -7.365604400634766, "global_step": 196434, "epoch": 4677} {"train_loss": -7.230273246765137, "global_step": 196435, "epoch": 4677} {"train_loss": -7.13254451751709, "global_step": 196436, "epoch": 4677} {"train_loss": -7.407853126525879, "global_step": 196437, "epoch": 4677} {"train_loss": -7.272442817687988, "global_step": 196438, "epoch": 4677} {"train_loss": -7.2251482009887695, "global_step": 196439, "epoch": 4677} {"train_loss": -7.165909290313721, "global_step": 196440, "epoch": 4677} {"train_loss": -7.189024925231934, "global_step": 196441, "epoch": 4677} {"train_loss": -7.30586051940918, "global_step": 196442, "epoch": 4677} {"train_loss": -7.2516069412231445, "global_step": 196443, "epoch": 4677} {"train_loss": -7.201392650604248, "global_step": 196444, "epoch": 4677} {"train_loss": -7.322643280029297, "global_step": 196445, "epoch": 4677} {"train_loss": -7.194025993347168, "global_step": 196446, "epoch": 4677} {"train_loss": -7.22169303894043, "global_step": 196447, "epoch": 4677} {"train_loss": -7.288389205932617, "global_step": 196448, "epoch": 4677} {"train_loss": -7.222203731536865, "global_step": 196449, "epoch": 4677} {"train_loss": -7.1704912185668945, "global_step": 196450, "epoch": 4677} {"train_loss": -7.279117584228516, "global_step": 196451, "epoch": 4677} {"train_loss": -7.039267539978027, "global_step": 196452, "epoch": 4677} {"train_loss": -7.229610443115234, "global_step": 196453, "epoch": 4677} {"train_loss": -7.350341796875, "global_step": 196454, "epoch": 4677} {"train_loss": -7.246476173400879, "global_step": 196455, "epoch": 4677} {"train_loss": -7.282776355743408, "global_step": 196456, "epoch": 4677} {"train_loss": -7.231655120849609, "global_step": 196457, "epoch": 4677} {"train_loss": -7.273353576660156, "global_step": 196458, "epoch": 4677} {"train_loss": -7.28807258605957, "global_step": 196459, "epoch": 4677} {"train_loss": -7.211954116821289, "global_step": 196460, "epoch": 4677} {"train_loss": -7.280555725097656, "global_step": 196461, "epoch": 4677} {"train_loss": -7.132312774658203, "global_step": 196462, "epoch": 4677} {"train_loss": -7.244489669799805, "global_step": 196463, "epoch": 4677} {"train_loss": -7.279430389404297, "global_step": 196464, "epoch": 4677} {"train_loss": -7.136731147766113, "global_step": 196465, "epoch": 4677} {"train_loss": -7.137941360473633, "global_step": 196466, "epoch": 4677} {"train_loss": -7.314883232116699, "global_step": 196467, "epoch": 4677} {"train_loss": -7.304718971252441, "global_step": 196468, "epoch": 4677} {"train_loss": -7.191695690155029, "global_step": 196469, "epoch": 4677} {"train_loss": -7.287808418273926, "global_step": 196470, "epoch": 4677} {"train_loss": -7.176033973693848, "global_step": 196471, "epoch": 4677} {"train_loss": -7.260384559631348, "global_step": 196472, "epoch": 4677} {"train_loss": -7.106095790863037, "global_step": 196473, "epoch": 4677} {"train_loss": -7.217697620391846, "global_step": 196474, "epoch": 4677} {"train_loss": -7.236671197982061, "global_step": 196475, "epoch": 4677, "val_loss": 81159.8671875} {"train_loss": -7.1430816650390625, "global_step": 196476, "epoch": 4678} {"train_loss": -7.425361633300781, "global_step": 196477, "epoch": 4678} {"train_loss": -7.0590925216674805, "global_step": 196478, "epoch": 4678} {"train_loss": -7.1463775634765625, "global_step": 196479, "epoch": 4678} {"train_loss": -7.254762649536133, "global_step": 196480, "epoch": 4678} {"train_loss": -7.199652671813965, "global_step": 196481, "epoch": 4678} {"train_loss": -7.139552593231201, "global_step": 196482, "epoch": 4678} {"train_loss": -7.276820659637451, "global_step": 196483, "epoch": 4678} {"train_loss": -7.179343223571777, "global_step": 196484, "epoch": 4678} {"train_loss": -7.34859561920166, "global_step": 196485, "epoch": 4678} {"train_loss": -7.320131301879883, "global_step": 196486, "epoch": 4678} {"train_loss": -7.252528190612793, "global_step": 196487, "epoch": 4678} {"train_loss": -7.26030158996582, "global_step": 196488, "epoch": 4678} {"train_loss": -7.242636203765869, "global_step": 196489, "epoch": 4678} {"train_loss": -7.243276596069336, "global_step": 196490, "epoch": 4678} {"train_loss": -7.1776604652404785, "global_step": 196491, "epoch": 4678} {"train_loss": -7.193264007568359, "global_step": 196492, "epoch": 4678} {"train_loss": -7.2813720703125, "global_step": 196493, "epoch": 4678} {"train_loss": -7.170570373535156, "global_step": 196494, "epoch": 4678} {"train_loss": -7.2458600997924805, "global_step": 196495, "epoch": 4678} {"train_loss": -7.30104923248291, "global_step": 196496, "epoch": 4678} {"train_loss": -7.298824310302734, "global_step": 196497, "epoch": 4678} {"train_loss": -7.203927516937256, "global_step": 196498, "epoch": 4678} {"train_loss": -7.236783027648926, "global_step": 196499, "epoch": 4678} {"train_loss": -7.331980228424072, "global_step": 196500, "epoch": 4678} {"train_loss": -7.222708225250244, "global_step": 196501, "epoch": 4678} {"train_loss": -7.24044132232666, "global_step": 196502, "epoch": 4678} {"train_loss": -7.311899185180664, "global_step": 196503, "epoch": 4678} {"train_loss": -7.29634952545166, "global_step": 196504, "epoch": 4678} {"train_loss": -7.479099273681641, "global_step": 196505, "epoch": 4678} {"train_loss": -7.311367034912109, "global_step": 196506, "epoch": 4678} {"train_loss": -7.29686164855957, "global_step": 196507, "epoch": 4678} {"train_loss": -7.314914703369141, "global_step": 196508, "epoch": 4678} {"train_loss": -7.1874542236328125, "global_step": 196509, "epoch": 4678} {"train_loss": -7.154241561889648, "global_step": 196510, "epoch": 4678} {"train_loss": -7.296629428863525, "global_step": 196511, "epoch": 4678} {"train_loss": -7.310530662536621, "global_step": 196512, "epoch": 4678} {"train_loss": -7.03851842880249, "global_step": 196513, "epoch": 4678} {"train_loss": -7.0934295654296875, "global_step": 196514, "epoch": 4678} {"train_loss": -7.325740337371826, "global_step": 196515, "epoch": 4678} {"train_loss": -7.318029403686523, "global_step": 196516, "epoch": 4678} {"train_loss": -7.245472442536127, "global_step": 196517, "epoch": 4678, "val_loss": 81456.2109375} {"train_loss": -7.305667877197266, "global_step": 196518, "epoch": 4679} {"train_loss": -7.108912467956543, "global_step": 196519, "epoch": 4679} {"train_loss": -7.238381862640381, "global_step": 196520, "epoch": 4679} {"train_loss": -7.444888114929199, "global_step": 196521, "epoch": 4679} {"train_loss": -7.218699932098389, "global_step": 196522, "epoch": 4679} {"train_loss": -7.222728729248047, "global_step": 196523, "epoch": 4679} {"train_loss": -7.219534873962402, "global_step": 196524, "epoch": 4679} {"train_loss": -7.140053749084473, "global_step": 196525, "epoch": 4679} {"train_loss": -7.191915512084961, "global_step": 196526, "epoch": 4679} {"train_loss": -7.2287187576293945, "global_step": 196527, "epoch": 4679} {"train_loss": -7.174865245819092, "global_step": 196528, "epoch": 4679} {"train_loss": -7.280162334442139, "global_step": 196529, "epoch": 4679} {"train_loss": -7.314703941345215, "global_step": 196530, "epoch": 4679} {"train_loss": -7.32758092880249, "global_step": 196531, "epoch": 4679} {"train_loss": -7.277019500732422, "global_step": 196532, "epoch": 4679} {"train_loss": -7.176947593688965, "global_step": 196533, "epoch": 4679} {"train_loss": -7.217557907104492, "global_step": 196534, "epoch": 4679} {"train_loss": -7.279416084289551, "global_step": 196535, "epoch": 4679} {"train_loss": -7.40323543548584, "global_step": 196536, "epoch": 4679} {"train_loss": -7.146609306335449, "global_step": 196537, "epoch": 4679} {"train_loss": -7.255130767822266, "global_step": 196538, "epoch": 4679} {"train_loss": -7.120288848876953, "global_step": 196539, "epoch": 4679} {"train_loss": -7.215718746185303, "global_step": 196540, "epoch": 4679} {"train_loss": -7.272562026977539, "global_step": 196541, "epoch": 4679} {"train_loss": -7.283019065856934, "global_step": 196542, "epoch": 4679} {"train_loss": -7.085229873657227, "global_step": 196543, "epoch": 4679} {"train_loss": -7.2661871910095215, "global_step": 196544, "epoch": 4679} {"train_loss": -7.32088565826416, "global_step": 196545, "epoch": 4679} {"train_loss": -7.241921901702881, "global_step": 196546, "epoch": 4679} {"train_loss": -7.243564605712891, "global_step": 196547, "epoch": 4679} {"train_loss": -7.101241111755371, "global_step": 196548, "epoch": 4679} {"train_loss": -7.231661796569824, "global_step": 196549, "epoch": 4679} {"train_loss": -7.126308441162109, "global_step": 196550, "epoch": 4679} {"train_loss": -7.185876846313477, "global_step": 196551, "epoch": 4679} {"train_loss": -7.209250450134277, "global_step": 196552, "epoch": 4679} {"train_loss": -7.174177169799805, "global_step": 196553, "epoch": 4679} {"train_loss": -7.220611572265625, "global_step": 196554, "epoch": 4679} {"train_loss": -7.16006326675415, "global_step": 196555, "epoch": 4679} {"train_loss": -7.117946624755859, "global_step": 196556, "epoch": 4679} {"train_loss": -7.2074689865112305, "global_step": 196557, "epoch": 4679} {"train_loss": -7.150263786315918, "global_step": 196558, "epoch": 4679} {"train_loss": -7.22252691359747, "global_step": 196559, "epoch": 4679, "val_loss": 81307.625} {"train_loss": -7.221031188964844, "global_step": 196560, "epoch": 4680} {"train_loss": -7.122095584869385, "global_step": 196561, "epoch": 4680} {"train_loss": -7.112345218658447, "global_step": 196562, "epoch": 4680} {"train_loss": -7.362770080566406, "global_step": 196563, "epoch": 4680} {"train_loss": -7.2763848304748535, "global_step": 196564, "epoch": 4680} {"train_loss": -7.269512176513672, "global_step": 196565, "epoch": 4680} {"train_loss": -7.373046398162842, "global_step": 196566, "epoch": 4680} {"train_loss": -7.194610118865967, "global_step": 196567, "epoch": 4680} {"train_loss": -7.344765663146973, "global_step": 196568, "epoch": 4680} {"train_loss": -7.227132797241211, "global_step": 196569, "epoch": 4680} {"train_loss": -7.394259452819824, "global_step": 196570, "epoch": 4680} {"train_loss": -7.345237731933594, "global_step": 196571, "epoch": 4680} {"train_loss": -7.219328880310059, "global_step": 196572, "epoch": 4680} {"train_loss": -7.2680840492248535, "global_step": 196573, "epoch": 4680} {"train_loss": -7.351099014282227, "global_step": 196574, "epoch": 4680} {"train_loss": -7.225345134735107, "global_step": 196575, "epoch": 4680} {"train_loss": -7.276710510253906, "global_step": 196576, "epoch": 4680} {"train_loss": -7.300254821777344, "global_step": 196577, "epoch": 4680} {"train_loss": -7.204775810241699, "global_step": 196578, "epoch": 4680} {"train_loss": -7.32356071472168, "global_step": 196579, "epoch": 4680} {"train_loss": -7.35100793838501, "global_step": 196580, "epoch": 4680} {"train_loss": -7.252770900726318, "global_step": 196581, "epoch": 4680} {"train_loss": -7.231395244598389, "global_step": 196582, "epoch": 4680} {"train_loss": -7.292941093444824, "global_step": 196583, "epoch": 4680} {"train_loss": -7.162609100341797, "global_step": 196584, "epoch": 4680} {"train_loss": -7.152407646179199, "global_step": 196585, "epoch": 4680} {"train_loss": -7.215278625488281, "global_step": 196586, "epoch": 4680} {"train_loss": -7.1427202224731445, "global_step": 196587, "epoch": 4680} {"train_loss": -7.198750972747803, "global_step": 196588, "epoch": 4680} {"train_loss": -7.284213066101074, "global_step": 196589, "epoch": 4680} {"train_loss": -7.206118583679199, "global_step": 196590, "epoch": 4680} {"train_loss": -7.211697578430176, "global_step": 196591, "epoch": 4680} {"train_loss": -7.242566108703613, "global_step": 196592, "epoch": 4680} {"train_loss": -7.201948642730713, "global_step": 196593, "epoch": 4680} {"train_loss": -7.289084434509277, "global_step": 196594, "epoch": 4680} {"train_loss": -7.271723747253418, "global_step": 196595, "epoch": 4680} {"train_loss": -7.26774787902832, "global_step": 196596, "epoch": 4680} {"train_loss": -7.249575614929199, "global_step": 196597, "epoch": 4680} {"train_loss": -7.257157802581787, "global_step": 196598, "epoch": 4680} {"train_loss": -7.263050079345703, "global_step": 196599, "epoch": 4680} {"train_loss": -7.360457897186279, "global_step": 196600, "epoch": 4680} {"train_loss": -7.257278680801392, "global_step": 196601, "epoch": 4680, "val_loss": 81213.2890625} {"train_loss": -7.22372579574585, "global_step": 196602, "epoch": 4681} {"train_loss": -7.336539268493652, "global_step": 196603, "epoch": 4681} {"train_loss": -7.311404228210449, "global_step": 196604, "epoch": 4681} {"train_loss": -7.291882514953613, "global_step": 196605, "epoch": 4681} {"train_loss": -7.320121765136719, "global_step": 196606, "epoch": 4681} {"train_loss": -7.385342121124268, "global_step": 196607, "epoch": 4681} {"train_loss": -7.371925354003906, "global_step": 196608, "epoch": 4681} {"train_loss": -7.353547096252441, "global_step": 196609, "epoch": 4681} {"train_loss": -7.384933948516846, "global_step": 196610, "epoch": 4681} {"train_loss": -7.174152851104736, "global_step": 196611, "epoch": 4681} {"train_loss": -7.329714298248291, "global_step": 196612, "epoch": 4681} {"train_loss": -7.248161315917969, "global_step": 196613, "epoch": 4681} {"train_loss": -7.334094047546387, "global_step": 196614, "epoch": 4681} {"train_loss": -7.3911542892456055, "global_step": 196615, "epoch": 4681} {"train_loss": -7.285707473754883, "global_step": 196616, "epoch": 4681} {"train_loss": -7.369688034057617, "global_step": 196617, "epoch": 4681} {"train_loss": -7.172649383544922, "global_step": 196618, "epoch": 4681} {"train_loss": -7.383482933044434, "global_step": 196619, "epoch": 4681} {"train_loss": -7.328535079956055, "global_step": 196620, "epoch": 4681} {"train_loss": -7.2097578048706055, "global_step": 196621, "epoch": 4681} {"train_loss": -7.256871223449707, "global_step": 196622, "epoch": 4681} {"train_loss": -7.187161445617676, "global_step": 196623, "epoch": 4681} {"train_loss": -7.1448750495910645, "global_step": 196624, "epoch": 4681} {"train_loss": -7.125598907470703, "global_step": 196625, "epoch": 4681} {"train_loss": -7.234682083129883, "global_step": 196626, "epoch": 4681} {"train_loss": -7.259381294250488, "global_step": 196627, "epoch": 4681} {"train_loss": -7.1279296875, "global_step": 196628, "epoch": 4681} {"train_loss": -7.168017864227295, "global_step": 196629, "epoch": 4681} {"train_loss": -7.138406753540039, "global_step": 196630, "epoch": 4681} {"train_loss": -7.236401081085205, "global_step": 196631, "epoch": 4681} {"train_loss": -7.211325645446777, "global_step": 196632, "epoch": 4681} {"train_loss": -7.30063533782959, "global_step": 196633, "epoch": 4681} {"train_loss": -7.153772830963135, "global_step": 196634, "epoch": 4681} {"train_loss": -7.204653739929199, "global_step": 196635, "epoch": 4681} {"train_loss": -7.256315231323242, "global_step": 196636, "epoch": 4681} {"train_loss": -7.1616315841674805, "global_step": 196637, "epoch": 4681} {"train_loss": -7.172858238220215, "global_step": 196638, "epoch": 4681} {"train_loss": -7.2591047286987305, "global_step": 196639, "epoch": 4681} {"train_loss": -7.129773139953613, "global_step": 196640, "epoch": 4681} {"train_loss": -7.217618942260742, "global_step": 196641, "epoch": 4681} {"train_loss": -7.0748748779296875, "global_step": 196642, "epoch": 4681} {"train_loss": -7.245545705159505, "global_step": 196643, "epoch": 4681, "val_loss": 81483.0390625} {"train_loss": -7.194723129272461, "global_step": 196644, "epoch": 4682} {"train_loss": -7.1207427978515625, "global_step": 196645, "epoch": 4682} {"train_loss": -7.159296035766602, "global_step": 196646, "epoch": 4682} {"train_loss": -7.094681262969971, "global_step": 196647, "epoch": 4682} {"train_loss": -7.3730878829956055, "global_step": 196648, "epoch": 4682} {"train_loss": -7.151431083679199, "global_step": 196649, "epoch": 4682} {"train_loss": -7.126043796539307, "global_step": 196650, "epoch": 4682} {"train_loss": -7.35987663269043, "global_step": 196651, "epoch": 4682} {"train_loss": -7.162352561950684, "global_step": 196652, "epoch": 4682} {"train_loss": -7.266294002532959, "global_step": 196653, "epoch": 4682} {"train_loss": -7.283576965332031, "global_step": 196654, "epoch": 4682} {"train_loss": -7.201812744140625, "global_step": 196655, "epoch": 4682} {"train_loss": -7.330896854400635, "global_step": 196656, "epoch": 4682} {"train_loss": -7.170834541320801, "global_step": 196657, "epoch": 4682} {"train_loss": -7.323188781738281, "global_step": 196658, "epoch": 4682} {"train_loss": -7.215579032897949, "global_step": 196659, "epoch": 4682} {"train_loss": -7.203970909118652, "global_step": 196660, "epoch": 4682} {"train_loss": -7.275439739227295, "global_step": 196661, "epoch": 4682} {"train_loss": -7.278692245483398, "global_step": 196662, "epoch": 4682} {"train_loss": -7.280346870422363, "global_step": 196663, "epoch": 4682} {"train_loss": -7.244791030883789, "global_step": 196664, "epoch": 4682} {"train_loss": -7.262079238891602, "global_step": 196665, "epoch": 4682} {"train_loss": -7.3990864753723145, "global_step": 196666, "epoch": 4682} {"train_loss": -7.214780807495117, "global_step": 196667, "epoch": 4682} {"train_loss": -7.302660942077637, "global_step": 196668, "epoch": 4682} {"train_loss": -7.265133857727051, "global_step": 196669, "epoch": 4682} {"train_loss": -7.240010738372803, "global_step": 196670, "epoch": 4682} {"train_loss": -7.38136100769043, "global_step": 196671, "epoch": 4682} {"train_loss": -7.3055596351623535, "global_step": 196672, "epoch": 4682} {"train_loss": -7.322516441345215, "global_step": 196673, "epoch": 4682} {"train_loss": -7.285506725311279, "global_step": 196674, "epoch": 4682} {"train_loss": -7.228937149047852, "global_step": 196675, "epoch": 4682} {"train_loss": -7.284939765930176, "global_step": 196676, "epoch": 4682} {"train_loss": -7.279654502868652, "global_step": 196677, "epoch": 4682} {"train_loss": -7.312223434448242, "global_step": 196678, "epoch": 4682} {"train_loss": -7.259467124938965, "global_step": 196679, "epoch": 4682} {"train_loss": -7.274052619934082, "global_step": 196680, "epoch": 4682} {"train_loss": -7.2972211837768555, "global_step": 196681, "epoch": 4682} {"train_loss": -7.238110542297363, "global_step": 196682, "epoch": 4682} {"train_loss": -7.223656177520752, "global_step": 196683, "epoch": 4682} {"train_loss": -7.396599769592285, "global_step": 196684, "epoch": 4682} {"train_loss": -7.259041400182815, "global_step": 196685, "epoch": 4682, "val_loss": 81108.3203125} {"train_loss": -7.342532157897949, "global_step": 196686, "epoch": 4683} {"train_loss": -7.214048385620117, "global_step": 196687, "epoch": 4683} {"train_loss": -7.285489082336426, "global_step": 196688, "epoch": 4683} {"train_loss": -7.208423614501953, "global_step": 196689, "epoch": 4683} {"train_loss": -7.274275779724121, "global_step": 196690, "epoch": 4683} {"train_loss": -7.097978591918945, "global_step": 196691, "epoch": 4683} {"train_loss": -7.204801559448242, "global_step": 196692, "epoch": 4683} {"train_loss": -7.204502105712891, "global_step": 196693, "epoch": 4683} {"train_loss": -7.201672077178955, "global_step": 196694, "epoch": 4683} {"train_loss": -7.223341941833496, "global_step": 196695, "epoch": 4683} {"train_loss": -7.197589874267578, "global_step": 196696, "epoch": 4683} {"train_loss": -7.216659069061279, "global_step": 196697, "epoch": 4683} {"train_loss": -7.239463806152344, "global_step": 196698, "epoch": 4683} {"train_loss": -7.218334674835205, "global_step": 196699, "epoch": 4683} {"train_loss": -7.222062110900879, "global_step": 196700, "epoch": 4683} {"train_loss": -7.2926177978515625, "global_step": 196701, "epoch": 4683} {"train_loss": -7.247710227966309, "global_step": 196702, "epoch": 4683} {"train_loss": -7.285094261169434, "global_step": 196703, "epoch": 4683} {"train_loss": -7.190829277038574, "global_step": 196704, "epoch": 4683} {"train_loss": -7.1843647956848145, "global_step": 196705, "epoch": 4683} {"train_loss": -7.130062103271484, "global_step": 196706, "epoch": 4683} {"train_loss": -7.211148262023926, "global_step": 196707, "epoch": 4683} {"train_loss": -7.240042686462402, "global_step": 196708, "epoch": 4683} {"train_loss": -7.302748680114746, "global_step": 196709, "epoch": 4683} {"train_loss": -7.230185031890869, "global_step": 196710, "epoch": 4683} {"train_loss": -7.160792827606201, "global_step": 196711, "epoch": 4683} {"train_loss": -7.144264221191406, "global_step": 196712, "epoch": 4683} {"train_loss": -7.168345928192139, "global_step": 196713, "epoch": 4683} {"train_loss": -7.208332061767578, "global_step": 196714, "epoch": 4683} {"train_loss": -7.089245796203613, "global_step": 196715, "epoch": 4683} {"train_loss": -7.203541278839111, "global_step": 196716, "epoch": 4683} {"train_loss": -7.257396697998047, "global_step": 196717, "epoch": 4683} {"train_loss": -7.18873929977417, "global_step": 196718, "epoch": 4683} {"train_loss": -7.175707817077637, "global_step": 196719, "epoch": 4683} {"train_loss": -7.21706485748291, "global_step": 196720, "epoch": 4683} {"train_loss": -7.199586868286133, "global_step": 196721, "epoch": 4683} {"train_loss": -7.200677394866943, "global_step": 196722, "epoch": 4683} {"train_loss": -7.198736190795898, "global_step": 196723, "epoch": 4683} {"train_loss": -7.188896179199219, "global_step": 196724, "epoch": 4683} {"train_loss": -7.18760347366333, "global_step": 196725, "epoch": 4683} {"train_loss": -7.183444976806641, "global_step": 196726, "epoch": 4683} {"train_loss": -7.213803790864491, "global_step": 196727, "epoch": 4683, "val_loss": 81354.1640625} {"train_loss": -7.324761867523193, "global_step": 196728, "epoch": 4684} {"train_loss": -7.133519649505615, "global_step": 196729, "epoch": 4684} {"train_loss": -7.2873616218566895, "global_step": 196730, "epoch": 4684} {"train_loss": -7.237906455993652, "global_step": 196731, "epoch": 4684} {"train_loss": -7.328183174133301, "global_step": 196732, "epoch": 4684} {"train_loss": -7.26322078704834, "global_step": 196733, "epoch": 4684} {"train_loss": -7.213286399841309, "global_step": 196734, "epoch": 4684} {"train_loss": -7.271132469177246, "global_step": 196735, "epoch": 4684} {"train_loss": -7.280551910400391, "global_step": 196736, "epoch": 4684} {"train_loss": -7.438167572021484, "global_step": 196737, "epoch": 4684} {"train_loss": -7.207188606262207, "global_step": 196738, "epoch": 4684} {"train_loss": -7.200187683105469, "global_step": 196739, "epoch": 4684} {"train_loss": -7.2716498374938965, "global_step": 196740, "epoch": 4684} {"train_loss": -7.2660722732543945, "global_step": 196741, "epoch": 4684} {"train_loss": -7.264566898345947, "global_step": 196742, "epoch": 4684} {"train_loss": -7.17366886138916, "global_step": 196743, "epoch": 4684} {"train_loss": -7.262303352355957, "global_step": 196744, "epoch": 4684} {"train_loss": -7.211779594421387, "global_step": 196745, "epoch": 4684} {"train_loss": -7.189590930938721, "global_step": 196746, "epoch": 4684} {"train_loss": -7.166659355163574, "global_step": 196747, "epoch": 4684} {"train_loss": -7.272902488708496, "global_step": 196748, "epoch": 4684} {"train_loss": -7.2935380935668945, "global_step": 196749, "epoch": 4684} {"train_loss": -7.201958179473877, "global_step": 196750, "epoch": 4684} {"train_loss": -7.314048767089844, "global_step": 196751, "epoch": 4684} {"train_loss": -7.406565189361572, "global_step": 196752, "epoch": 4684} {"train_loss": -7.362710952758789, "global_step": 196753, "epoch": 4684} {"train_loss": -7.363440990447998, "global_step": 196754, "epoch": 4684} {"train_loss": -7.1657938957214355, "global_step": 196755, "epoch": 4684} {"train_loss": -7.258380889892578, "global_step": 196756, "epoch": 4684} {"train_loss": -7.338133811950684, "global_step": 196757, "epoch": 4684} {"train_loss": -7.154749870300293, "global_step": 196758, "epoch": 4684} {"train_loss": -7.2898640632629395, "global_step": 196759, "epoch": 4684} {"train_loss": -7.181868553161621, "global_step": 196760, "epoch": 4684} {"train_loss": -7.288417339324951, "global_step": 196761, "epoch": 4684} {"train_loss": -7.191740989685059, "global_step": 196762, "epoch": 4684} {"train_loss": -7.267939567565918, "global_step": 196763, "epoch": 4684} {"train_loss": -7.203710079193115, "global_step": 196764, "epoch": 4684} {"train_loss": -7.304699897766113, "global_step": 196765, "epoch": 4684} {"train_loss": -7.295544624328613, "global_step": 196766, "epoch": 4684} {"train_loss": -7.2942352294921875, "global_step": 196767, "epoch": 4684} {"train_loss": -7.2672119140625, "global_step": 196768, "epoch": 4684} {"train_loss": -7.262241465704782, "global_step": 196769, "epoch": 4684, "val_loss": 81406.21875} {"train_loss": -7.261056900024414, "global_step": 196770, "epoch": 4685} {"train_loss": -7.181496620178223, "global_step": 196771, "epoch": 4685} {"train_loss": -7.2697296142578125, "global_step": 196772, "epoch": 4685} {"train_loss": -7.2390289306640625, "global_step": 196773, "epoch": 4685} {"train_loss": -7.260496139526367, "global_step": 196774, "epoch": 4685} {"train_loss": -7.237773895263672, "global_step": 196775, "epoch": 4685} {"train_loss": -7.073138236999512, "global_step": 196776, "epoch": 4685} {"train_loss": -7.1475114822387695, "global_step": 196777, "epoch": 4685} {"train_loss": -7.285989761352539, "global_step": 196778, "epoch": 4685} {"train_loss": -7.106826305389404, "global_step": 196779, "epoch": 4685} {"train_loss": -7.093005657196045, "global_step": 196780, "epoch": 4685} {"train_loss": -7.2010087966918945, "global_step": 196781, "epoch": 4685} {"train_loss": -7.143709659576416, "global_step": 196782, "epoch": 4685} {"train_loss": -7.230029106140137, "global_step": 196783, "epoch": 4685} {"train_loss": -7.096782684326172, "global_step": 196784, "epoch": 4685} {"train_loss": -7.213753700256348, "global_step": 196785, "epoch": 4685} {"train_loss": -7.231845378875732, "global_step": 196786, "epoch": 4685} {"train_loss": -7.077395439147949, "global_step": 196787, "epoch": 4685} {"train_loss": -7.1010308265686035, "global_step": 196788, "epoch": 4685} {"train_loss": -7.092223167419434, "global_step": 196789, "epoch": 4685} {"train_loss": -7.105381488800049, "global_step": 196790, "epoch": 4685} {"train_loss": -7.160160064697266, "global_step": 196791, "epoch": 4685} {"train_loss": -7.179320335388184, "global_step": 196792, "epoch": 4685} {"train_loss": -7.14531135559082, "global_step": 196793, "epoch": 4685} {"train_loss": -7.056023597717285, "global_step": 196794, "epoch": 4685} {"train_loss": -7.134258270263672, "global_step": 196795, "epoch": 4685} {"train_loss": -7.05409049987793, "global_step": 196796, "epoch": 4685} {"train_loss": -7.221646785736084, "global_step": 196797, "epoch": 4685} {"train_loss": -7.162168979644775, "global_step": 196798, "epoch": 4685} {"train_loss": -7.086315155029297, "global_step": 196799, "epoch": 4685} {"train_loss": -7.2747039794921875, "global_step": 196800, "epoch": 4685} {"train_loss": -7.210789203643799, "global_step": 196801, "epoch": 4685} {"train_loss": -7.217964172363281, "global_step": 196802, "epoch": 4685} {"train_loss": -7.252826690673828, "global_step": 196803, "epoch": 4685} {"train_loss": -7.197728633880615, "global_step": 196804, "epoch": 4685} {"train_loss": -7.23391056060791, "global_step": 196805, "epoch": 4685} {"train_loss": -7.191470146179199, "global_step": 196806, "epoch": 4685} {"train_loss": -7.224140167236328, "global_step": 196807, "epoch": 4685} {"train_loss": -7.204521179199219, "global_step": 196808, "epoch": 4685} {"train_loss": -7.214338302612305, "global_step": 196809, "epoch": 4685} {"train_loss": -7.160404205322266, "global_step": 196810, "epoch": 4685} {"train_loss": -7.180710962840489, "global_step": 196811, "epoch": 4685, "val_loss": 81156.2265625} {"train_loss": -7.196842670440674, "global_step": 196812, "epoch": 4686} {"train_loss": -7.238376140594482, "global_step": 196813, "epoch": 4686} {"train_loss": -7.297728538513184, "global_step": 196814, "epoch": 4686} {"train_loss": -7.317910671234131, "global_step": 196815, "epoch": 4686} {"train_loss": -7.330841064453125, "global_step": 196816, "epoch": 4686} {"train_loss": -7.258270263671875, "global_step": 196817, "epoch": 4686} {"train_loss": -7.355066776275635, "global_step": 196818, "epoch": 4686} {"train_loss": -7.418995380401611, "global_step": 196819, "epoch": 4686} {"train_loss": -7.374438285827637, "global_step": 196820, "epoch": 4686} {"train_loss": -7.355288505554199, "global_step": 196821, "epoch": 4686} {"train_loss": -7.32088565826416, "global_step": 196822, "epoch": 4686} {"train_loss": -7.4686760902404785, "global_step": 196823, "epoch": 4686} {"train_loss": -7.307480812072754, "global_step": 196824, "epoch": 4686} {"train_loss": -7.276803016662598, "global_step": 196825, "epoch": 4686} {"train_loss": -7.416507720947266, "global_step": 196826, "epoch": 4686} {"train_loss": -7.368154525756836, "global_step": 196827, "epoch": 4686} {"train_loss": -7.244720458984375, "global_step": 196828, "epoch": 4686} {"train_loss": -7.313976287841797, "global_step": 196829, "epoch": 4686} {"train_loss": -7.281266689300537, "global_step": 196830, "epoch": 4686} {"train_loss": -7.17289400100708, "global_step": 196831, "epoch": 4686} {"train_loss": -7.282040119171143, "global_step": 196832, "epoch": 4686} {"train_loss": -7.283914089202881, "global_step": 196833, "epoch": 4686} {"train_loss": -7.217822074890137, "global_step": 196834, "epoch": 4686} {"train_loss": -7.3038740158081055, "global_step": 196835, "epoch": 4686} {"train_loss": -7.280472755432129, "global_step": 196836, "epoch": 4686} {"train_loss": -7.194175720214844, "global_step": 196837, "epoch": 4686} {"train_loss": -7.3385515213012695, "global_step": 196838, "epoch": 4686} {"train_loss": -7.223170280456543, "global_step": 196839, "epoch": 4686} {"train_loss": -7.122828483581543, "global_step": 196840, "epoch": 4686} {"train_loss": -7.355870246887207, "global_step": 196841, "epoch": 4686} {"train_loss": -7.117060661315918, "global_step": 196842, "epoch": 4686} {"train_loss": -7.233971118927002, "global_step": 196843, "epoch": 4686} {"train_loss": -7.448206901550293, "global_step": 196844, "epoch": 4686} {"train_loss": -7.112793922424316, "global_step": 196845, "epoch": 4686} {"train_loss": -7.239620208740234, "global_step": 196846, "epoch": 4686} {"train_loss": -7.256519794464111, "global_step": 196847, "epoch": 4686} {"train_loss": -7.264012336730957, "global_step": 196848, "epoch": 4686} {"train_loss": -7.314611911773682, "global_step": 196849, "epoch": 4686} {"train_loss": -7.239607334136963, "global_step": 196850, "epoch": 4686} {"train_loss": -7.231660842895508, "global_step": 196851, "epoch": 4686} {"train_loss": -7.332524299621582, "global_step": 196852, "epoch": 4686} {"train_loss": -7.283164217358544, "global_step": 196853, "epoch": 4686, "val_loss": 81400.3203125} {"train_loss": -7.3100385665893555, "global_step": 196854, "epoch": 4687} {"train_loss": -7.287935256958008, "global_step": 196855, "epoch": 4687} {"train_loss": -7.259510517120361, "global_step": 196856, "epoch": 4687} {"train_loss": -7.315223693847656, "global_step": 196857, "epoch": 4687} {"train_loss": -7.350135803222656, "global_step": 196858, "epoch": 4687} {"train_loss": -7.231132507324219, "global_step": 196859, "epoch": 4687} {"train_loss": -7.27370548248291, "global_step": 196860, "epoch": 4687} {"train_loss": -7.358719825744629, "global_step": 196861, "epoch": 4687} {"train_loss": -7.299600601196289, "global_step": 196862, "epoch": 4687} {"train_loss": -7.44239616394043, "global_step": 196863, "epoch": 4687} {"train_loss": -7.178809642791748, "global_step": 196864, "epoch": 4687} {"train_loss": -7.22808837890625, "global_step": 196865, "epoch": 4687} {"train_loss": -7.228342056274414, "global_step": 196866, "epoch": 4687} {"train_loss": -7.240006446838379, "global_step": 196867, "epoch": 4687} {"train_loss": -7.3685455322265625, "global_step": 196868, "epoch": 4687} {"train_loss": -7.384669780731201, "global_step": 196869, "epoch": 4687} {"train_loss": -7.190214157104492, "global_step": 196870, "epoch": 4687} {"train_loss": -7.276363372802734, "global_step": 196871, "epoch": 4687} {"train_loss": -7.362284183502197, "global_step": 196872, "epoch": 4687} {"train_loss": -7.2030839920043945, "global_step": 196873, "epoch": 4687} {"train_loss": -7.2083258628845215, "global_step": 196874, "epoch": 4687} {"train_loss": -7.340019226074219, "global_step": 196875, "epoch": 4687} {"train_loss": -7.263439178466797, "global_step": 196876, "epoch": 4687} {"train_loss": -7.203850269317627, "global_step": 196877, "epoch": 4687} {"train_loss": -7.32087516784668, "global_step": 196878, "epoch": 4687} {"train_loss": -7.147043228149414, "global_step": 196879, "epoch": 4687} {"train_loss": -7.114872932434082, "global_step": 196880, "epoch": 4687} {"train_loss": -7.221002578735352, "global_step": 196881, "epoch": 4687} {"train_loss": -7.123047828674316, "global_step": 196882, "epoch": 4687} {"train_loss": -7.303683280944824, "global_step": 196883, "epoch": 4687} {"train_loss": -7.232005596160889, "global_step": 196884, "epoch": 4687} {"train_loss": -7.2038068771362305, "global_step": 196885, "epoch": 4687} {"train_loss": -7.206383228302002, "global_step": 196886, "epoch": 4687} {"train_loss": -7.343116283416748, "global_step": 196887, "epoch": 4687} {"train_loss": -7.1952290534973145, "global_step": 196888, "epoch": 4687} {"train_loss": -7.270202159881592, "global_step": 196889, "epoch": 4687} {"train_loss": -7.1540751457214355, "global_step": 196890, "epoch": 4687} {"train_loss": -7.151505470275879, "global_step": 196891, "epoch": 4687} {"train_loss": -7.125700950622559, "global_step": 196892, "epoch": 4687} {"train_loss": -7.223624229431152, "global_step": 196893, "epoch": 4687} {"train_loss": -7.123539447784424, "global_step": 196894, "epoch": 4687} {"train_loss": -7.24980430375962, "global_step": 196895, "epoch": 4687, "val_loss": 81293.1484375} {"train_loss": -7.140777587890625, "global_step": 196896, "epoch": 4688} {"train_loss": -7.285515308380127, "global_step": 196897, "epoch": 4688} {"train_loss": -7.239383220672607, "global_step": 196898, "epoch": 4688} {"train_loss": -7.297628402709961, "global_step": 196899, "epoch": 4688} {"train_loss": -7.251828193664551, "global_step": 196900, "epoch": 4688} {"train_loss": -7.2905778884887695, "global_step": 196901, "epoch": 4688} {"train_loss": -7.181379318237305, "global_step": 196902, "epoch": 4688} {"train_loss": -7.327384948730469, "global_step": 196903, "epoch": 4688} {"train_loss": -7.347353935241699, "global_step": 196904, "epoch": 4688} {"train_loss": -7.311785697937012, "global_step": 196905, "epoch": 4688} {"train_loss": -7.349963188171387, "global_step": 196906, "epoch": 4688} {"train_loss": -7.241086006164551, "global_step": 196907, "epoch": 4688} {"train_loss": -7.283895969390869, "global_step": 196908, "epoch": 4688} {"train_loss": -7.3177947998046875, "global_step": 196909, "epoch": 4688} {"train_loss": -7.359195232391357, "global_step": 196910, "epoch": 4688} {"train_loss": -7.3064961433410645, "global_step": 196911, "epoch": 4688} {"train_loss": -7.332529067993164, "global_step": 196912, "epoch": 4688} {"train_loss": -7.259756565093994, "global_step": 196913, "epoch": 4688} {"train_loss": -7.305065155029297, "global_step": 196914, "epoch": 4688} {"train_loss": -7.318762302398682, "global_step": 196915, "epoch": 4688} {"train_loss": -7.357177257537842, "global_step": 196916, "epoch": 4688} {"train_loss": -7.352289199829102, "global_step": 196917, "epoch": 4688} {"train_loss": -7.418553352355957, "global_step": 196918, "epoch": 4688} {"train_loss": -7.204504013061523, "global_step": 196919, "epoch": 4688} {"train_loss": -7.285498142242432, "global_step": 196920, "epoch": 4688} {"train_loss": -7.299323081970215, "global_step": 196921, "epoch": 4688} {"train_loss": -7.267822742462158, "global_step": 196922, "epoch": 4688} {"train_loss": -7.243837833404541, "global_step": 196923, "epoch": 4688} {"train_loss": -7.387284278869629, "global_step": 196924, "epoch": 4688} {"train_loss": -7.321276664733887, "global_step": 196925, "epoch": 4688} {"train_loss": -7.216217041015625, "global_step": 196926, "epoch": 4688} {"train_loss": -7.211612701416016, "global_step": 196927, "epoch": 4688} {"train_loss": -7.258264541625977, "global_step": 196928, "epoch": 4688} {"train_loss": -7.209611892700195, "global_step": 196929, "epoch": 4688} {"train_loss": -7.284854888916016, "global_step": 196930, "epoch": 4688} {"train_loss": -7.308913230895996, "global_step": 196931, "epoch": 4688} {"train_loss": -7.154840469360352, "global_step": 196932, "epoch": 4688} {"train_loss": -7.243244171142578, "global_step": 196933, "epoch": 4688} {"train_loss": -7.1967010498046875, "global_step": 196934, "epoch": 4688} {"train_loss": -7.294778823852539, "global_step": 196935, "epoch": 4688} {"train_loss": -7.2362518310546875, "global_step": 196936, "epoch": 4688} {"train_loss": -7.282470612298875, "global_step": 196937, "epoch": 4688, "val_loss": 81271.90625} {"train_loss": -7.355780601501465, "global_step": 196938, "epoch": 4689} {"train_loss": -7.278804302215576, "global_step": 196939, "epoch": 4689} {"train_loss": -7.208096027374268, "global_step": 196940, "epoch": 4689} {"train_loss": -7.300617694854736, "global_step": 196941, "epoch": 4689} {"train_loss": -7.235752105712891, "global_step": 196942, "epoch": 4689} {"train_loss": -7.123918056488037, "global_step": 196943, "epoch": 4689} {"train_loss": -7.300396919250488, "global_step": 196944, "epoch": 4689} {"train_loss": -7.250993728637695, "global_step": 196945, "epoch": 4689} {"train_loss": -7.234485626220703, "global_step": 196946, "epoch": 4689} {"train_loss": -7.111288070678711, "global_step": 196947, "epoch": 4689} {"train_loss": -7.204217433929443, "global_step": 196948, "epoch": 4689} {"train_loss": -7.193892478942871, "global_step": 196949, "epoch": 4689} {"train_loss": -7.237894058227539, "global_step": 196950, "epoch": 4689} {"train_loss": -7.280484676361084, "global_step": 196951, "epoch": 4689} {"train_loss": -7.216758728027344, "global_step": 196952, "epoch": 4689} {"train_loss": -7.274239540100098, "global_step": 196953, "epoch": 4689} {"train_loss": -7.238994598388672, "global_step": 196954, "epoch": 4689} {"train_loss": -7.348113059997559, "global_step": 196955, "epoch": 4689} {"train_loss": -7.325989723205566, "global_step": 196956, "epoch": 4689} {"train_loss": -7.152029991149902, "global_step": 196957, "epoch": 4689} {"train_loss": -7.317174434661865, "global_step": 196958, "epoch": 4689} {"train_loss": -7.2714457511901855, "global_step": 196959, "epoch": 4689} {"train_loss": -7.185989856719971, "global_step": 196960, "epoch": 4689} {"train_loss": -7.249968528747559, "global_step": 196961, "epoch": 4689} {"train_loss": -7.284339427947998, "global_step": 196962, "epoch": 4689} {"train_loss": -7.292366027832031, "global_step": 196963, "epoch": 4689} {"train_loss": -7.2161760330200195, "global_step": 196964, "epoch": 4689} {"train_loss": -7.207668781280518, "global_step": 196965, "epoch": 4689} {"train_loss": -7.308866500854492, "global_step": 196966, "epoch": 4689} {"train_loss": -7.248018264770508, "global_step": 196967, "epoch": 4689} {"train_loss": -7.331260681152344, "global_step": 196968, "epoch": 4689} {"train_loss": -7.336062431335449, "global_step": 196969, "epoch": 4689} {"train_loss": -7.240720748901367, "global_step": 196970, "epoch": 4689} {"train_loss": -7.323517322540283, "global_step": 196971, "epoch": 4689} {"train_loss": -7.315135478973389, "global_step": 196972, "epoch": 4689} {"train_loss": -7.289683818817139, "global_step": 196973, "epoch": 4689} {"train_loss": -7.237365245819092, "global_step": 196974, "epoch": 4689} {"train_loss": -7.135478496551514, "global_step": 196975, "epoch": 4689} {"train_loss": -7.261857032775879, "global_step": 196976, "epoch": 4689} {"train_loss": -7.1662750244140625, "global_step": 196977, "epoch": 4689} {"train_loss": -7.305507659912109, "global_step": 196978, "epoch": 4689} {"train_loss": -7.251435359319051, "global_step": 196979, "epoch": 4689, "val_loss": 81374.5} {"train_loss": -7.357824325561523, "global_step": 196980, "epoch": 4690} {"train_loss": -7.0147294998168945, "global_step": 196981, "epoch": 4690} {"train_loss": -7.1427693367004395, "global_step": 196982, "epoch": 4690} {"train_loss": -7.099423408508301, "global_step": 196983, "epoch": 4690} {"train_loss": -7.279792785644531, "global_step": 196984, "epoch": 4690} {"train_loss": -7.239696979522705, "global_step": 196985, "epoch": 4690} {"train_loss": -7.319409370422363, "global_step": 196986, "epoch": 4690} {"train_loss": -7.29510498046875, "global_step": 196987, "epoch": 4690} {"train_loss": -7.231581687927246, "global_step": 196988, "epoch": 4690} {"train_loss": -7.284641265869141, "global_step": 196989, "epoch": 4690} {"train_loss": -7.3262434005737305, "global_step": 196990, "epoch": 4690} {"train_loss": -7.366283416748047, "global_step": 196991, "epoch": 4690} {"train_loss": -7.200628757476807, "global_step": 196992, "epoch": 4690} {"train_loss": -7.252602577209473, "global_step": 196993, "epoch": 4690} {"train_loss": -7.320426940917969, "global_step": 196994, "epoch": 4690} {"train_loss": -7.17735481262207, "global_step": 196995, "epoch": 4690} {"train_loss": -7.316239356994629, "global_step": 196996, "epoch": 4690} {"train_loss": -7.215917587280273, "global_step": 196997, "epoch": 4690} {"train_loss": -7.316003799438477, "global_step": 196998, "epoch": 4690} {"train_loss": -7.138394355773926, "global_step": 196999, "epoch": 4690} {"train_loss": -7.263759613037109, "global_step": 197000, "epoch": 4690} {"train_loss": -7.284003734588623, "global_step": 197001, "epoch": 4690} {"train_loss": -7.215795040130615, "global_step": 197002, "epoch": 4690} {"train_loss": -7.199881553649902, "global_step": 197003, "epoch": 4690} {"train_loss": -7.249642848968506, "global_step": 197004, "epoch": 4690} {"train_loss": -7.212428092956543, "global_step": 197005, "epoch": 4690} {"train_loss": -7.248903274536133, "global_step": 197006, "epoch": 4690} {"train_loss": -7.28049373626709, "global_step": 197007, "epoch": 4690} {"train_loss": -7.21668004989624, "global_step": 197008, "epoch": 4690} {"train_loss": -7.17527961730957, "global_step": 197009, "epoch": 4690} {"train_loss": -7.240169525146484, "global_step": 197010, "epoch": 4690} {"train_loss": -7.2355499267578125, "global_step": 197011, "epoch": 4690} {"train_loss": -7.244104385375977, "global_step": 197012, "epoch": 4690} {"train_loss": -7.109940528869629, "global_step": 197013, "epoch": 4690} {"train_loss": -6.983617305755615, "global_step": 197014, "epoch": 4690} {"train_loss": -7.196622848510742, "global_step": 197015, "epoch": 4690} {"train_loss": -7.078127861022949, "global_step": 197016, "epoch": 4690} {"train_loss": -7.306735038757324, "global_step": 197017, "epoch": 4690} {"train_loss": -7.101650238037109, "global_step": 197018, "epoch": 4690} {"train_loss": -7.173250198364258, "global_step": 197019, "epoch": 4690} {"train_loss": -7.204173564910889, "global_step": 197020, "epoch": 4690} {"train_loss": -7.2205591315314885, "global_step": 197021, "epoch": 4690, "val_loss": 81378.09375} {"train_loss": -7.266364097595215, "global_step": 197022, "epoch": 4691} {"train_loss": -7.048914432525635, "global_step": 197023, "epoch": 4691} {"train_loss": -7.113108158111572, "global_step": 197024, "epoch": 4691} {"train_loss": -7.178070068359375, "global_step": 197025, "epoch": 4691} {"train_loss": -7.190757751464844, "global_step": 197026, "epoch": 4691} {"train_loss": -7.088970184326172, "global_step": 197027, "epoch": 4691} {"train_loss": -7.148524761199951, "global_step": 197028, "epoch": 4691} {"train_loss": -7.120702743530273, "global_step": 197029, "epoch": 4691} {"train_loss": -7.174328327178955, "global_step": 197030, "epoch": 4691} {"train_loss": -7.241042137145996, "global_step": 197031, "epoch": 4691} {"train_loss": -7.151350975036621, "global_step": 197032, "epoch": 4691} {"train_loss": -7.253089904785156, "global_step": 197033, "epoch": 4691} {"train_loss": -7.255839824676514, "global_step": 197034, "epoch": 4691} {"train_loss": -7.249265670776367, "global_step": 197035, "epoch": 4691} {"train_loss": -7.227665901184082, "global_step": 197036, "epoch": 4691} {"train_loss": -7.244957447052002, "global_step": 197037, "epoch": 4691} {"train_loss": -7.282824516296387, "global_step": 197038, "epoch": 4691} {"train_loss": -7.105973243713379, "global_step": 197039, "epoch": 4691} {"train_loss": -7.195235252380371, "global_step": 197040, "epoch": 4691} {"train_loss": -7.315124988555908, "global_step": 197041, "epoch": 4691} {"train_loss": -7.282808303833008, "global_step": 197042, "epoch": 4691} {"train_loss": -7.311297416687012, "global_step": 197043, "epoch": 4691} {"train_loss": -7.309624671936035, "global_step": 197044, "epoch": 4691} {"train_loss": -7.178492546081543, "global_step": 197045, "epoch": 4691} {"train_loss": -7.240318775177002, "global_step": 197046, "epoch": 4691} {"train_loss": -7.337272644042969, "global_step": 197047, "epoch": 4691} {"train_loss": -7.205897331237793, "global_step": 197048, "epoch": 4691} {"train_loss": -7.2054595947265625, "global_step": 197049, "epoch": 4691} {"train_loss": -7.151203155517578, "global_step": 197050, "epoch": 4691} {"train_loss": -7.13191032409668, "global_step": 197051, "epoch": 4691} {"train_loss": -7.284797668457031, "global_step": 197052, "epoch": 4691} {"train_loss": -7.357047080993652, "global_step": 197053, "epoch": 4691} {"train_loss": -7.245898246765137, "global_step": 197054, "epoch": 4691} {"train_loss": -7.322009086608887, "global_step": 197055, "epoch": 4691} {"train_loss": -7.282773971557617, "global_step": 197056, "epoch": 4691} {"train_loss": -7.224390029907227, "global_step": 197057, "epoch": 4691} {"train_loss": -7.329537391662598, "global_step": 197058, "epoch": 4691} {"train_loss": -7.231125831604004, "global_step": 197059, "epoch": 4691} {"train_loss": -7.144898414611816, "global_step": 197060, "epoch": 4691} {"train_loss": -7.181841850280762, "global_step": 197061, "epoch": 4691} {"train_loss": -7.330854415893555, "global_step": 197062, "epoch": 4691} {"train_loss": -7.222787652696882, "global_step": 197063, "epoch": 4691, "val_loss": 81341.1796875} {"train_loss": -7.297415733337402, "global_step": 197064, "epoch": 4692} {"train_loss": -7.3131561279296875, "global_step": 197065, "epoch": 4692} {"train_loss": -7.261799335479736, "global_step": 197066, "epoch": 4692} {"train_loss": -7.316755294799805, "global_step": 197067, "epoch": 4692} {"train_loss": -7.292065620422363, "global_step": 197068, "epoch": 4692} {"train_loss": -7.261575698852539, "global_step": 197069, "epoch": 4692} {"train_loss": -7.291753768920898, "global_step": 197070, "epoch": 4692} {"train_loss": -7.334521293640137, "global_step": 197071, "epoch": 4692} {"train_loss": -7.248928070068359, "global_step": 197072, "epoch": 4692} {"train_loss": -7.197208881378174, "global_step": 197073, "epoch": 4692} {"train_loss": -7.251941680908203, "global_step": 197074, "epoch": 4692} {"train_loss": -7.3217854499816895, "global_step": 197075, "epoch": 4692} {"train_loss": -7.291634559631348, "global_step": 197076, "epoch": 4692} {"train_loss": -7.2270636558532715, "global_step": 197077, "epoch": 4692} {"train_loss": -7.28098201751709, "global_step": 197078, "epoch": 4692} {"train_loss": -7.3118896484375, "global_step": 197079, "epoch": 4692} {"train_loss": -7.24631404876709, "global_step": 197080, "epoch": 4692} {"train_loss": -7.301414966583252, "global_step": 197081, "epoch": 4692} {"train_loss": -7.375574111938477, "global_step": 197082, "epoch": 4692} {"train_loss": -7.336215019226074, "global_step": 197083, "epoch": 4692} {"train_loss": -7.329050064086914, "global_step": 197084, "epoch": 4692} {"train_loss": -7.232787132263184, "global_step": 197085, "epoch": 4692} {"train_loss": -7.2754225730896, "global_step": 197086, "epoch": 4692} {"train_loss": -7.420568466186523, "global_step": 197087, "epoch": 4692} {"train_loss": -7.278944492340088, "global_step": 197088, "epoch": 4692} {"train_loss": -7.308272361755371, "global_step": 197089, "epoch": 4692} {"train_loss": -7.334019660949707, "global_step": 197090, "epoch": 4692} {"train_loss": -7.2342071533203125, "global_step": 197091, "epoch": 4692} {"train_loss": -7.277169227600098, "global_step": 197092, "epoch": 4692} {"train_loss": -7.2656073570251465, "global_step": 197093, "epoch": 4692} {"train_loss": -7.207417964935303, "global_step": 197094, "epoch": 4692} {"train_loss": -7.308351039886475, "global_step": 197095, "epoch": 4692} {"train_loss": -7.419818878173828, "global_step": 197096, "epoch": 4692} {"train_loss": -7.177992820739746, "global_step": 197097, "epoch": 4692} {"train_loss": -7.280420303344727, "global_step": 197098, "epoch": 4692} {"train_loss": -7.348602771759033, "global_step": 197099, "epoch": 4692} {"train_loss": -7.213623046875, "global_step": 197100, "epoch": 4692} {"train_loss": -7.318990707397461, "global_step": 197101, "epoch": 4692} {"train_loss": -7.266345024108887, "global_step": 197102, "epoch": 4692} {"train_loss": -7.1790361404418945, "global_step": 197103, "epoch": 4692} {"train_loss": -7.340151786804199, "global_step": 197104, "epoch": 4692} {"train_loss": -7.278535184406099, "global_step": 197105, "epoch": 4692, "val_loss": 81424.8515625} {"train_loss": -7.127549648284912, "global_step": 197106, "epoch": 4693} {"train_loss": -7.3193769454956055, "global_step": 197107, "epoch": 4693} {"train_loss": -7.086384296417236, "global_step": 197108, "epoch": 4693} {"train_loss": -7.226206302642822, "global_step": 197109, "epoch": 4693} {"train_loss": -7.321297645568848, "global_step": 197110, "epoch": 4693} {"train_loss": -7.2366766929626465, "global_step": 197111, "epoch": 4693} {"train_loss": -7.27152156829834, "global_step": 197112, "epoch": 4693} {"train_loss": -7.209921836853027, "global_step": 197113, "epoch": 4693} {"train_loss": -7.279910564422607, "global_step": 197114, "epoch": 4693} {"train_loss": -7.156322002410889, "global_step": 197115, "epoch": 4693} {"train_loss": -7.26798152923584, "global_step": 197116, "epoch": 4693} {"train_loss": -7.182559013366699, "global_step": 197117, "epoch": 4693} {"train_loss": -7.255176544189453, "global_step": 197118, "epoch": 4693} {"train_loss": -7.209551811218262, "global_step": 197119, "epoch": 4693} {"train_loss": -7.246755599975586, "global_step": 197120, "epoch": 4693} {"train_loss": -7.403809070587158, "global_step": 197121, "epoch": 4693} {"train_loss": -7.199792861938477, "global_step": 197122, "epoch": 4693} {"train_loss": -7.320797443389893, "global_step": 197123, "epoch": 4693} {"train_loss": -7.219410419464111, "global_step": 197124, "epoch": 4693} {"train_loss": -7.256102085113525, "global_step": 197125, "epoch": 4693} {"train_loss": -7.250373840332031, "global_step": 197126, "epoch": 4693} {"train_loss": -7.22718620300293, "global_step": 197127, "epoch": 4693} {"train_loss": -7.169905662536621, "global_step": 197128, "epoch": 4693} {"train_loss": -7.294264316558838, "global_step": 197129, "epoch": 4693} {"train_loss": -7.161879539489746, "global_step": 197130, "epoch": 4693} {"train_loss": -7.305936813354492, "global_step": 197131, "epoch": 4693} {"train_loss": -7.181465148925781, "global_step": 197132, "epoch": 4693} {"train_loss": -7.25040340423584, "global_step": 197133, "epoch": 4693} {"train_loss": -7.085764408111572, "global_step": 197134, "epoch": 4693} {"train_loss": -7.222368240356445, "global_step": 197135, "epoch": 4693} {"train_loss": -7.230314254760742, "global_step": 197136, "epoch": 4693} {"train_loss": -7.200130462646484, "global_step": 197137, "epoch": 4693} {"train_loss": -7.242047309875488, "global_step": 197138, "epoch": 4693} {"train_loss": -7.184737205505371, "global_step": 197139, "epoch": 4693} {"train_loss": -7.298367500305176, "global_step": 197140, "epoch": 4693} {"train_loss": -7.185457229614258, "global_step": 197141, "epoch": 4693} {"train_loss": -7.1954569816589355, "global_step": 197142, "epoch": 4693} {"train_loss": -7.288283348083496, "global_step": 197143, "epoch": 4693} {"train_loss": -7.336058616638184, "global_step": 197144, "epoch": 4693} {"train_loss": -7.30938720703125, "global_step": 197145, "epoch": 4693} {"train_loss": -7.306087493896484, "global_step": 197146, "epoch": 4693} {"train_loss": -7.237387066795712, "global_step": 197147, "epoch": 4693, "val_loss": 81190.3203125} {"train_loss": -7.362305641174316, "global_step": 197148, "epoch": 4694} {"train_loss": -7.327225685119629, "global_step": 197149, "epoch": 4694} {"train_loss": -7.344449996948242, "global_step": 197150, "epoch": 4694} {"train_loss": -7.140179634094238, "global_step": 197151, "epoch": 4694} {"train_loss": -7.26646089553833, "global_step": 197152, "epoch": 4694} {"train_loss": -7.350461006164551, "global_step": 197153, "epoch": 4694} {"train_loss": -7.191362380981445, "global_step": 197154, "epoch": 4694} {"train_loss": -7.386441230773926, "global_step": 197155, "epoch": 4694} {"train_loss": -7.239721298217773, "global_step": 197156, "epoch": 4694} {"train_loss": -7.192371368408203, "global_step": 197157, "epoch": 4694} {"train_loss": -7.289977550506592, "global_step": 197158, "epoch": 4694} {"train_loss": -7.305448055267334, "global_step": 197159, "epoch": 4694} {"train_loss": -7.354249000549316, "global_step": 197160, "epoch": 4694} {"train_loss": -7.301968097686768, "global_step": 197161, "epoch": 4694} {"train_loss": -7.234790802001953, "global_step": 197162, "epoch": 4694} {"train_loss": -7.22291374206543, "global_step": 197163, "epoch": 4694} {"train_loss": -7.308620452880859, "global_step": 197164, "epoch": 4694} {"train_loss": -7.232126235961914, "global_step": 197165, "epoch": 4694} {"train_loss": -7.252411842346191, "global_step": 197166, "epoch": 4694} {"train_loss": -7.377586364746094, "global_step": 197167, "epoch": 4694} {"train_loss": -7.249776840209961, "global_step": 197168, "epoch": 4694} {"train_loss": -7.330264091491699, "global_step": 197169, "epoch": 4694} {"train_loss": -7.369300842285156, "global_step": 197170, "epoch": 4694} {"train_loss": -7.227598190307617, "global_step": 197171, "epoch": 4694} {"train_loss": -7.24361515045166, "global_step": 197172, "epoch": 4694} {"train_loss": -7.166046619415283, "global_step": 197173, "epoch": 4694} {"train_loss": -7.268218040466309, "global_step": 197174, "epoch": 4694} {"train_loss": -7.35780143737793, "global_step": 197175, "epoch": 4694} {"train_loss": -7.2013397216796875, "global_step": 197176, "epoch": 4694} {"train_loss": -7.3683624267578125, "global_step": 197177, "epoch": 4694} {"train_loss": -7.274850845336914, "global_step": 197178, "epoch": 4694} {"train_loss": -7.345497131347656, "global_step": 197179, "epoch": 4694} {"train_loss": -7.218076705932617, "global_step": 197180, "epoch": 4694} {"train_loss": -7.323814392089844, "global_step": 197181, "epoch": 4694} {"train_loss": -7.299205780029297, "global_step": 197182, "epoch": 4694} {"train_loss": -7.466700077056885, "global_step": 197183, "epoch": 4694} {"train_loss": -7.340415000915527, "global_step": 197184, "epoch": 4694} {"train_loss": -7.259162902832031, "global_step": 197185, "epoch": 4694} {"train_loss": -7.266631603240967, "global_step": 197186, "epoch": 4694} {"train_loss": -7.247701168060303, "global_step": 197187, "epoch": 4694} {"train_loss": -7.335383892059326, "global_step": 197188, "epoch": 4694} {"train_loss": -7.289470683960688, "global_step": 197189, "epoch": 4694, "val_loss": 81161.6015625} {"train_loss": -7.218321800231934, "global_step": 197190, "epoch": 4695} {"train_loss": -7.460409164428711, "global_step": 197191, "epoch": 4695} {"train_loss": -7.360833168029785, "global_step": 197192, "epoch": 4695} {"train_loss": -7.23063850402832, "global_step": 197193, "epoch": 4695} {"train_loss": -7.288430690765381, "global_step": 197194, "epoch": 4695} {"train_loss": -7.1851301193237305, "global_step": 197195, "epoch": 4695} {"train_loss": -7.268723487854004, "global_step": 197196, "epoch": 4695} {"train_loss": -7.28303337097168, "global_step": 197197, "epoch": 4695} {"train_loss": -7.318282127380371, "global_step": 197198, "epoch": 4695} {"train_loss": -7.288027763366699, "global_step": 197199, "epoch": 4695} {"train_loss": -7.3620285987854, "global_step": 197200, "epoch": 4695} {"train_loss": -7.296366214752197, "global_step": 197201, "epoch": 4695} {"train_loss": -7.378314971923828, "global_step": 197202, "epoch": 4695} {"train_loss": -7.301939964294434, "global_step": 197203, "epoch": 4695} {"train_loss": -7.3204665184021, "global_step": 197204, "epoch": 4695} {"train_loss": -7.302440643310547, "global_step": 197205, "epoch": 4695} {"train_loss": -7.259035587310791, "global_step": 197206, "epoch": 4695} {"train_loss": -7.329168319702148, "global_step": 197207, "epoch": 4695} {"train_loss": -7.346426010131836, "global_step": 197208, "epoch": 4695} {"train_loss": -7.27988338470459, "global_step": 197209, "epoch": 4695} {"train_loss": -7.362862586975098, "global_step": 197210, "epoch": 4695} {"train_loss": -7.30557107925415, "global_step": 197211, "epoch": 4695} {"train_loss": -7.342147350311279, "global_step": 197212, "epoch": 4695} {"train_loss": -7.251607894897461, "global_step": 197213, "epoch": 4695} {"train_loss": -7.327572822570801, "global_step": 197214, "epoch": 4695} {"train_loss": -7.250026226043701, "global_step": 197215, "epoch": 4695} {"train_loss": -7.3703460693359375, "global_step": 197216, "epoch": 4695} {"train_loss": -7.295729637145996, "global_step": 197217, "epoch": 4695} {"train_loss": -7.297046184539795, "global_step": 197218, "epoch": 4695} {"train_loss": -7.232337951660156, "global_step": 197219, "epoch": 4695} {"train_loss": -7.120254039764404, "global_step": 197220, "epoch": 4695} {"train_loss": -7.3240647315979, "global_step": 197221, "epoch": 4695} {"train_loss": -7.272176742553711, "global_step": 197222, "epoch": 4695} {"train_loss": -7.251051425933838, "global_step": 197223, "epoch": 4695} {"train_loss": -7.279112815856934, "global_step": 197224, "epoch": 4695} {"train_loss": -7.132604598999023, "global_step": 197225, "epoch": 4695} {"train_loss": -7.115020751953125, "global_step": 197226, "epoch": 4695} {"train_loss": -7.125588417053223, "global_step": 197227, "epoch": 4695} {"train_loss": -7.058135032653809, "global_step": 197228, "epoch": 4695} {"train_loss": -7.090993404388428, "global_step": 197229, "epoch": 4695} {"train_loss": -7.144177436828613, "global_step": 197230, "epoch": 4695} {"train_loss": -7.266526244935536, "global_step": 197231, "epoch": 4695, "val_loss": 81365.828125} {"train_loss": -7.10752010345459, "global_step": 197232, "epoch": 4696} {"train_loss": -7.039029598236084, "global_step": 197233, "epoch": 4696} {"train_loss": -7.09221076965332, "global_step": 197234, "epoch": 4696} {"train_loss": -7.2123284339904785, "global_step": 197235, "epoch": 4696} {"train_loss": -6.954338073730469, "global_step": 197236, "epoch": 4696} {"train_loss": -7.126422882080078, "global_step": 197237, "epoch": 4696} {"train_loss": -7.157448768615723, "global_step": 197238, "epoch": 4696} {"train_loss": -7.267412185668945, "global_step": 197239, "epoch": 4696} {"train_loss": -7.2374587059021, "global_step": 197240, "epoch": 4696} {"train_loss": -7.185266494750977, "global_step": 197241, "epoch": 4696} {"train_loss": -7.175179958343506, "global_step": 197242, "epoch": 4696} {"train_loss": -7.1346659660339355, "global_step": 197243, "epoch": 4696} {"train_loss": -7.157597541809082, "global_step": 197244, "epoch": 4696} {"train_loss": -7.291652202606201, "global_step": 197245, "epoch": 4696} {"train_loss": -7.280993461608887, "global_step": 197246, "epoch": 4696} {"train_loss": -7.204267978668213, "global_step": 197247, "epoch": 4696} {"train_loss": -7.197804927825928, "global_step": 197248, "epoch": 4696} {"train_loss": -7.163434028625488, "global_step": 197249, "epoch": 4696} {"train_loss": -7.288819313049316, "global_step": 197250, "epoch": 4696} {"train_loss": -7.262940883636475, "global_step": 197251, "epoch": 4696} {"train_loss": -7.2430500984191895, "global_step": 197252, "epoch": 4696} {"train_loss": -7.2685346603393555, "global_step": 197253, "epoch": 4696} {"train_loss": -7.355221748352051, "global_step": 197254, "epoch": 4696} {"train_loss": -7.217571258544922, "global_step": 197255, "epoch": 4696} {"train_loss": -7.36022424697876, "global_step": 197256, "epoch": 4696} {"train_loss": -7.295691967010498, "global_step": 197257, "epoch": 4696} {"train_loss": -7.376920700073242, "global_step": 197258, "epoch": 4696} {"train_loss": -7.341654300689697, "global_step": 197259, "epoch": 4696} {"train_loss": -7.300251007080078, "global_step": 197260, "epoch": 4696} {"train_loss": -7.214565277099609, "global_step": 197261, "epoch": 4696} {"train_loss": -7.351633071899414, "global_step": 197262, "epoch": 4696} {"train_loss": -7.272237300872803, "global_step": 197263, "epoch": 4696} {"train_loss": -7.312475204467773, "global_step": 197264, "epoch": 4696} {"train_loss": -7.265896797180176, "global_step": 197265, "epoch": 4696} {"train_loss": -7.37519645690918, "global_step": 197266, "epoch": 4696} {"train_loss": -7.273599624633789, "global_step": 197267, "epoch": 4696} {"train_loss": -7.327239036560059, "global_step": 197268, "epoch": 4696} {"train_loss": -7.412732124328613, "global_step": 197269, "epoch": 4696} {"train_loss": -7.273399353027344, "global_step": 197270, "epoch": 4696} {"train_loss": -7.276202201843262, "global_step": 197271, "epoch": 4696} {"train_loss": -7.388943195343018, "global_step": 197272, "epoch": 4696} {"train_loss": -7.246884016763596, "global_step": 197273, "epoch": 4696, "val_loss": 81241.7421875} {"train_loss": -7.364516258239746, "global_step": 197274, "epoch": 4697} {"train_loss": -7.289355754852295, "global_step": 197275, "epoch": 4697} {"train_loss": -7.1363019943237305, "global_step": 197276, "epoch": 4697} {"train_loss": -7.247570514678955, "global_step": 197277, "epoch": 4697} {"train_loss": -7.375147819519043, "global_step": 197278, "epoch": 4697} {"train_loss": -7.224079132080078, "global_step": 197279, "epoch": 4697} {"train_loss": -7.434128761291504, "global_step": 197280, "epoch": 4697} {"train_loss": -7.3802361488342285, "global_step": 197281, "epoch": 4697} {"train_loss": -7.13485050201416, "global_step": 197282, "epoch": 4697} {"train_loss": -7.364745140075684, "global_step": 197283, "epoch": 4697} {"train_loss": -7.290899276733398, "global_step": 197284, "epoch": 4697} {"train_loss": -7.4303178787231445, "global_step": 197285, "epoch": 4697} {"train_loss": -7.381694316864014, "global_step": 197286, "epoch": 4697} {"train_loss": -7.199785232543945, "global_step": 197287, "epoch": 4697} {"train_loss": -7.3416314125061035, "global_step": 197288, "epoch": 4697} {"train_loss": -7.309605598449707, "global_step": 197289, "epoch": 4697} {"train_loss": -7.383824825286865, "global_step": 197290, "epoch": 4697} {"train_loss": -7.314375877380371, "global_step": 197291, "epoch": 4697} {"train_loss": -7.403968334197998, "global_step": 197292, "epoch": 4697} {"train_loss": -7.311441898345947, "global_step": 197293, "epoch": 4697} {"train_loss": -7.389186859130859, "global_step": 197294, "epoch": 4697} {"train_loss": -7.061197280883789, "global_step": 197295, "epoch": 4697} {"train_loss": -7.2433929443359375, "global_step": 197296, "epoch": 4697} {"train_loss": -7.300500869750977, "global_step": 197297, "epoch": 4697} {"train_loss": -7.418117523193359, "global_step": 197298, "epoch": 4697} {"train_loss": -7.3692216873168945, "global_step": 197299, "epoch": 4697} {"train_loss": -7.300614833831787, "global_step": 197300, "epoch": 4697} {"train_loss": -7.291345596313477, "global_step": 197301, "epoch": 4697} {"train_loss": -7.211544513702393, "global_step": 197302, "epoch": 4697} {"train_loss": -7.305007457733154, "global_step": 197303, "epoch": 4697} {"train_loss": -7.244826316833496, "global_step": 197304, "epoch": 4697} {"train_loss": -7.315842628479004, "global_step": 197305, "epoch": 4697} {"train_loss": -7.347749710083008, "global_step": 197306, "epoch": 4697} {"train_loss": -7.224237442016602, "global_step": 197307, "epoch": 4697} {"train_loss": -7.188083648681641, "global_step": 197308, "epoch": 4697} {"train_loss": -7.3471856117248535, "global_step": 197309, "epoch": 4697} {"train_loss": -7.2510175704956055, "global_step": 197310, "epoch": 4697} {"train_loss": -7.291119575500488, "global_step": 197311, "epoch": 4697} {"train_loss": -7.258960723876953, "global_step": 197312, "epoch": 4697} {"train_loss": -7.219874382019043, "global_step": 197313, "epoch": 4697} {"train_loss": -7.251081943511963, "global_step": 197314, "epoch": 4697} {"train_loss": -7.29523846081325, "global_step": 197315, "epoch": 4697, "val_loss": 81776.171875} {"train_loss": -7.198012351989746, "global_step": 197316, "epoch": 4698} {"train_loss": -7.3508806228637695, "global_step": 197317, "epoch": 4698} {"train_loss": -7.166224479675293, "global_step": 197318, "epoch": 4698} {"train_loss": -7.189358711242676, "global_step": 197319, "epoch": 4698} {"train_loss": -7.232535362243652, "global_step": 197320, "epoch": 4698} {"train_loss": -7.275514602661133, "global_step": 197321, "epoch": 4698} {"train_loss": -7.2832231521606445, "global_step": 197322, "epoch": 4698} {"train_loss": -7.262069225311279, "global_step": 197323, "epoch": 4698} {"train_loss": -7.213772773742676, "global_step": 197324, "epoch": 4698} {"train_loss": -7.246582984924316, "global_step": 197325, "epoch": 4698} {"train_loss": -7.243148326873779, "global_step": 197326, "epoch": 4698} {"train_loss": -7.227204322814941, "global_step": 197327, "epoch": 4698} {"train_loss": -7.18358850479126, "global_step": 197328, "epoch": 4698} {"train_loss": -7.312616348266602, "global_step": 197329, "epoch": 4698} {"train_loss": -7.284554481506348, "global_step": 197330, "epoch": 4698} {"train_loss": -7.31667947769165, "global_step": 197331, "epoch": 4698} {"train_loss": -7.296919822692871, "global_step": 197332, "epoch": 4698} {"train_loss": -7.281594276428223, "global_step": 197333, "epoch": 4698} {"train_loss": -7.229881286621094, "global_step": 197334, "epoch": 4698} {"train_loss": -7.187785625457764, "global_step": 197335, "epoch": 4698} {"train_loss": -7.320786476135254, "global_step": 197336, "epoch": 4698} {"train_loss": -7.3438310623168945, "global_step": 197337, "epoch": 4698} {"train_loss": -7.225991249084473, "global_step": 197338, "epoch": 4698} {"train_loss": -7.261800289154053, "global_step": 197339, "epoch": 4698} {"train_loss": -7.209468364715576, "global_step": 197340, "epoch": 4698} {"train_loss": -7.339333534240723, "global_step": 197341, "epoch": 4698} {"train_loss": -7.245627403259277, "global_step": 197342, "epoch": 4698} {"train_loss": -7.209987640380859, "global_step": 197343, "epoch": 4698} {"train_loss": -7.363524436950684, "global_step": 197344, "epoch": 4698} {"train_loss": -7.237789630889893, "global_step": 197345, "epoch": 4698} {"train_loss": -7.429327487945557, "global_step": 197346, "epoch": 4698} {"train_loss": -7.361958980560303, "global_step": 197347, "epoch": 4698} {"train_loss": -7.269007205963135, "global_step": 197348, "epoch": 4698} {"train_loss": -7.258707046508789, "global_step": 197349, "epoch": 4698} {"train_loss": -7.374223709106445, "global_step": 197350, "epoch": 4698} {"train_loss": -7.222224235534668, "global_step": 197351, "epoch": 4698} {"train_loss": -7.256561279296875, "global_step": 197352, "epoch": 4698} {"train_loss": -7.24013614654541, "global_step": 197353, "epoch": 4698} {"train_loss": -7.355042457580566, "global_step": 197354, "epoch": 4698} {"train_loss": -7.346623420715332, "global_step": 197355, "epoch": 4698} {"train_loss": -7.39230489730835, "global_step": 197356, "epoch": 4698} {"train_loss": -7.276466256096249, "global_step": 197357, "epoch": 4698, "val_loss": 81425.1875} {"train_loss": -7.207688331604004, "global_step": 197358, "epoch": 4699} {"train_loss": -7.258394241333008, "global_step": 197359, "epoch": 4699} {"train_loss": -7.343592643737793, "global_step": 197360, "epoch": 4699} {"train_loss": -7.296497344970703, "global_step": 197361, "epoch": 4699} {"train_loss": -7.403348922729492, "global_step": 197362, "epoch": 4699} {"train_loss": -7.245302200317383, "global_step": 197363, "epoch": 4699} {"train_loss": -7.258754730224609, "global_step": 197364, "epoch": 4699} {"train_loss": -7.377263069152832, "global_step": 197365, "epoch": 4699} {"train_loss": -7.257045745849609, "global_step": 197366, "epoch": 4699} {"train_loss": -7.187597274780273, "global_step": 197367, "epoch": 4699} {"train_loss": -7.229389667510986, "global_step": 197368, "epoch": 4699} {"train_loss": -7.218226432800293, "global_step": 197369, "epoch": 4699} {"train_loss": -7.301795482635498, "global_step": 197370, "epoch": 4699} {"train_loss": -7.323089599609375, "global_step": 197371, "epoch": 4699} {"train_loss": -7.342688083648682, "global_step": 197372, "epoch": 4699} {"train_loss": -7.339317321777344, "global_step": 197373, "epoch": 4699} {"train_loss": -7.347270965576172, "global_step": 197374, "epoch": 4699} {"train_loss": -7.249478340148926, "global_step": 197375, "epoch": 4699} {"train_loss": -7.492926597595215, "global_step": 197376, "epoch": 4699} {"train_loss": -7.3075480461120605, "global_step": 197377, "epoch": 4699} {"train_loss": -7.398587226867676, "global_step": 197378, "epoch": 4699} {"train_loss": -7.280796051025391, "global_step": 197379, "epoch": 4699} {"train_loss": -7.31905460357666, "global_step": 197380, "epoch": 4699} {"train_loss": -7.443665504455566, "global_step": 197381, "epoch": 4699} {"train_loss": -7.3414483070373535, "global_step": 197382, "epoch": 4699} {"train_loss": -7.294912815093994, "global_step": 197383, "epoch": 4699} {"train_loss": -7.316266059875488, "global_step": 197384, "epoch": 4699} {"train_loss": -7.186019420623779, "global_step": 197385, "epoch": 4699} {"train_loss": -7.172597408294678, "global_step": 197386, "epoch": 4699} {"train_loss": -7.258908271789551, "global_step": 197387, "epoch": 4699} {"train_loss": -7.170882701873779, "global_step": 197388, "epoch": 4699} {"train_loss": -7.121565818786621, "global_step": 197389, "epoch": 4699} {"train_loss": -7.056939125061035, "global_step": 197390, "epoch": 4699} {"train_loss": -7.244687080383301, "global_step": 197391, "epoch": 4699} {"train_loss": -7.006343841552734, "global_step": 197392, "epoch": 4699} {"train_loss": -7.175078392028809, "global_step": 197393, "epoch": 4699} {"train_loss": -7.268640518188477, "global_step": 197394, "epoch": 4699} {"train_loss": -7.014429092407227, "global_step": 197395, "epoch": 4699} {"train_loss": -7.283100605010986, "global_step": 197396, "epoch": 4699} {"train_loss": -7.146566390991211, "global_step": 197397, "epoch": 4699} {"train_loss": -7.210141181945801, "global_step": 197398, "epoch": 4699} {"train_loss": -7.256721190043858, "global_step": 197399, "epoch": 4699, "val_loss": 81072.1015625} {"train_loss": -7.268912315368652, "global_step": 197400, "epoch": 4700} {"train_loss": -7.246172904968262, "global_step": 197401, "epoch": 4700} {"train_loss": -7.26246452331543, "global_step": 197402, "epoch": 4700} {"train_loss": -7.235051155090332, "global_step": 197403, "epoch": 4700} {"train_loss": -7.192478179931641, "global_step": 197404, "epoch": 4700} {"train_loss": -7.245790958404541, "global_step": 197405, "epoch": 4700} {"train_loss": -7.1607160568237305, "global_step": 197406, "epoch": 4700} {"train_loss": -7.308854103088379, "global_step": 197407, "epoch": 4700} {"train_loss": -7.144166946411133, "global_step": 197408, "epoch": 4700} {"train_loss": -7.290798187255859, "global_step": 197409, "epoch": 4700} {"train_loss": -7.202391624450684, "global_step": 197410, "epoch": 4700} {"train_loss": -7.173093318939209, "global_step": 197411, "epoch": 4700} {"train_loss": -7.231006622314453, "global_step": 197412, "epoch": 4700} {"train_loss": -7.231006622314453, "global_step": 197413, "epoch": 4700} {"train_loss": -7.251360893249512, "global_step": 197414, "epoch": 4700} {"train_loss": -7.214942932128906, "global_step": 197415, "epoch": 4700} {"train_loss": -7.172894477844238, "global_step": 197416, "epoch": 4700} {"train_loss": -7.292202949523926, "global_step": 197417, "epoch": 4700} {"train_loss": -7.357954502105713, "global_step": 197418, "epoch": 4700} {"train_loss": -7.265451908111572, "global_step": 197419, "epoch": 4700} {"train_loss": -7.282828330993652, "global_step": 197420, "epoch": 4700} {"train_loss": -7.3395490646362305, "global_step": 197421, "epoch": 4700} {"train_loss": -7.2432990074157715, "global_step": 197422, "epoch": 4700} {"train_loss": -7.340267658233643, "global_step": 197423, "epoch": 4700} {"train_loss": -7.256981372833252, "global_step": 197424, "epoch": 4700} {"train_loss": -7.0777482986450195, "global_step": 197425, "epoch": 4700} {"train_loss": -7.1638994216918945, "global_step": 197426, "epoch": 4700} {"train_loss": -7.318310737609863, "global_step": 197427, "epoch": 4700} {"train_loss": -7.281162261962891, "global_step": 197428, "epoch": 4700} {"train_loss": -7.230022430419922, "global_step": 197429, "epoch": 4700} {"train_loss": -7.2414140701293945, "global_step": 197430, "epoch": 4700} {"train_loss": -7.262055397033691, "global_step": 197431, "epoch": 4700} {"train_loss": -7.174780368804932, "global_step": 197432, "epoch": 4700} {"train_loss": -7.207010746002197, "global_step": 197433, "epoch": 4700} {"train_loss": -7.240422248840332, "global_step": 197434, "epoch": 4700} {"train_loss": -7.166594505310059, "global_step": 197435, "epoch": 4700} {"train_loss": -7.330883979797363, "global_step": 197436, "epoch": 4700} {"train_loss": -7.134232044219971, "global_step": 197437, "epoch": 4700} {"train_loss": -7.2190141677856445, "global_step": 197438, "epoch": 4700} {"train_loss": -7.297762393951416, "global_step": 197439, "epoch": 4700} {"train_loss": -7.2819671630859375, "global_step": 197440, "epoch": 4700} {"train_loss": -7.24089655422029, "global_step": 197441, "epoch": 4700, "train/sim_max_reward_0": 0.9390059336134285, "train/sim_max_reward_1": 0.9926160418671807, "train/sim_max_reward_2": 0.9413096031276087, "train/sim_max_reward_3": 0.5902376693520164, "train/sim_max_reward_4": 0.9772936114088024, "train/sim_max_reward_5": 0.5584560073382493, "test/sim_max_reward_4500000": 0.9717518012231318, "test/sim_max_reward_4500001": 0.9679950611174314, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9725275107514039, "test/sim_max_reward_4500004": 0.8638716227557339, "test/sim_max_reward_4500005": 0.8690247433531284, "test/sim_max_reward_4500006": 0.8936039890891485, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.8963857126554097, "test/sim_max_reward_4500009": 0.05298192361653667, "test/sim_max_reward_4500010": 0.0, "test/sim_max_reward_4500011": 0.997336193917166, "test/sim_max_reward_4500012": 0.9765099187064783, "test/sim_max_reward_4500013": 0.0037660753292844628, "test/sim_max_reward_4500014": 0.9738484188007378, "test/sim_max_reward_4500015": 0.9920928514489844, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.1207609822229729, "test/sim_max_reward_4500018": 0.485621851334807, "test/sim_max_reward_4500019": 0.9837963089510305, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8686296166749847, "test/sim_max_reward_4500022": 1.0, "test/sim_max_reward_4500023": 0.886324679586528, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.5248263253796593, "test/sim_max_reward_4500026": 0.9803840756359438, "test/sim_max_reward_4500027": 0.9035948386479414, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.052033154518069294, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.7871420894511506, "test/sim_max_reward_4500034": 0.8864945388024513, "test/sim_max_reward_4500035": 0.8892016663961956, "test/sim_max_reward_4500036": 0.9460374649209354, "test/sim_max_reward_4500037": 0.8951939150519204, "test/sim_max_reward_4500038": 0.32511365474194154, "test/sim_max_reward_4500039": 0.9488724145667912, "test/sim_max_reward_4500040": 0.9083209702666362, "test/sim_max_reward_4500041": 0.9886174103522357, "test/sim_max_reward_4500042": 0.04245474262337596, "test/sim_max_reward_4500043": 0.9909525023000723, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.39420560702158586, "test/sim_max_reward_4500046": 0.21093231843249652, "test/sim_max_reward_4500047": 0.9577736375855787, "test/sim_max_reward_4500048": 0.8729646007165537, "test/sim_max_reward_4500049": 0.9758410879121422, "train/mean_score": 0.8331531444512144, "test/mean_score": 0.6502003477089597, "val_loss": 81337.640625} {"train_loss": -7.22548246383667, "global_step": 197442, "epoch": 4701} {"train_loss": -7.337420463562012, "global_step": 197443, "epoch": 4701} {"train_loss": -7.245078086853027, "global_step": 197444, "epoch": 4701} {"train_loss": -7.106195449829102, "global_step": 197445, "epoch": 4701} {"train_loss": -7.3360419273376465, "global_step": 197446, "epoch": 4701} {"train_loss": -7.274101257324219, "global_step": 197447, "epoch": 4701} {"train_loss": -7.1743059158325195, "global_step": 197448, "epoch": 4701} {"train_loss": -7.120791435241699, "global_step": 197449, "epoch": 4701} {"train_loss": -7.227655410766602, "global_step": 197450, "epoch": 4701} {"train_loss": -7.277368068695068, "global_step": 197451, "epoch": 4701} {"train_loss": -7.250606536865234, "global_step": 197452, "epoch": 4701} {"train_loss": -7.353174209594727, "global_step": 197453, "epoch": 4701} {"train_loss": -7.318648815155029, "global_step": 197454, "epoch": 4701} {"train_loss": -7.323502540588379, "global_step": 197455, "epoch": 4701} {"train_loss": -7.302001953125, "global_step": 197456, "epoch": 4701} {"train_loss": -7.347753047943115, "global_step": 197457, "epoch": 4701} {"train_loss": -7.35499906539917, "global_step": 197458, "epoch": 4701} {"train_loss": -7.383496284484863, "global_step": 197459, "epoch": 4701} {"train_loss": -7.316656589508057, "global_step": 197460, "epoch": 4701} {"train_loss": -7.29324197769165, "global_step": 197461, "epoch": 4701} {"train_loss": -7.3989458084106445, "global_step": 197462, "epoch": 4701} {"train_loss": -7.33390474319458, "global_step": 197463, "epoch": 4701} {"train_loss": -7.30804443359375, "global_step": 197464, "epoch": 4701} {"train_loss": -7.351740837097168, "global_step": 197465, "epoch": 4701} {"train_loss": -7.355429649353027, "global_step": 197466, "epoch": 4701} {"train_loss": -7.328512191772461, "global_step": 197467, "epoch": 4701} {"train_loss": -7.2871785163879395, "global_step": 197468, "epoch": 4701} {"train_loss": -7.473682403564453, "global_step": 197469, "epoch": 4701} {"train_loss": -7.302020072937012, "global_step": 197470, "epoch": 4701} {"train_loss": -7.319086074829102, "global_step": 197471, "epoch": 4701} {"train_loss": -7.354682922363281, "global_step": 197472, "epoch": 4701} {"train_loss": -7.412471771240234, "global_step": 197473, "epoch": 4701} {"train_loss": -7.313254356384277, "global_step": 197474, "epoch": 4701} {"train_loss": -7.339993953704834, "global_step": 197475, "epoch": 4701} {"train_loss": -7.3962554931640625, "global_step": 197476, "epoch": 4701} {"train_loss": -7.291998386383057, "global_step": 197477, "epoch": 4701} {"train_loss": -7.368003845214844, "global_step": 197478, "epoch": 4701} {"train_loss": -7.409528732299805, "global_step": 197479, "epoch": 4701} {"train_loss": -7.300662994384766, "global_step": 197480, "epoch": 4701} {"train_loss": -7.3002848625183105, "global_step": 197481, "epoch": 4701} {"train_loss": -7.320141315460205, "global_step": 197482, "epoch": 4701} {"train_loss": -7.314899103982108, "global_step": 197483, "epoch": 4701, "val_loss": 81326.453125} {"train_loss": -7.352313041687012, "global_step": 197484, "epoch": 4702} {"train_loss": -7.3232526779174805, "global_step": 197485, "epoch": 4702} {"train_loss": -7.353330135345459, "global_step": 197486, "epoch": 4702} {"train_loss": -7.444423675537109, "global_step": 197487, "epoch": 4702} {"train_loss": -7.291297912597656, "global_step": 197488, "epoch": 4702} {"train_loss": -7.340250015258789, "global_step": 197489, "epoch": 4702} {"train_loss": -7.319496154785156, "global_step": 197490, "epoch": 4702} {"train_loss": -7.262192726135254, "global_step": 197491, "epoch": 4702} {"train_loss": -7.237549781799316, "global_step": 197492, "epoch": 4702} {"train_loss": -7.305933952331543, "global_step": 197493, "epoch": 4702} {"train_loss": -7.270689010620117, "global_step": 197494, "epoch": 4702} {"train_loss": -7.394035816192627, "global_step": 197495, "epoch": 4702} {"train_loss": -7.379042625427246, "global_step": 197496, "epoch": 4702} {"train_loss": -7.305068492889404, "global_step": 197497, "epoch": 4702} {"train_loss": -7.330214023590088, "global_step": 197498, "epoch": 4702} {"train_loss": -7.0295562744140625, "global_step": 197499, "epoch": 4702} {"train_loss": -7.061211585998535, "global_step": 197500, "epoch": 4702} {"train_loss": -7.292537689208984, "global_step": 197501, "epoch": 4702} {"train_loss": -6.96585750579834, "global_step": 197502, "epoch": 4702} {"train_loss": -7.226065158843994, "global_step": 197503, "epoch": 4702} {"train_loss": -6.935823440551758, "global_step": 197504, "epoch": 4702} {"train_loss": -7.009641647338867, "global_step": 197505, "epoch": 4702} {"train_loss": -7.087569236755371, "global_step": 197506, "epoch": 4702} {"train_loss": -7.030495643615723, "global_step": 197507, "epoch": 4702} {"train_loss": -7.147851943969727, "global_step": 197508, "epoch": 4702} {"train_loss": -7.061306953430176, "global_step": 197509, "epoch": 4702} {"train_loss": -7.259778022766113, "global_step": 197510, "epoch": 4702} {"train_loss": -7.311751365661621, "global_step": 197511, "epoch": 4702} {"train_loss": -7.226462364196777, "global_step": 197512, "epoch": 4702} {"train_loss": -7.260200500488281, "global_step": 197513, "epoch": 4702} {"train_loss": -7.110180377960205, "global_step": 197514, "epoch": 4702} {"train_loss": -7.265413284301758, "global_step": 197515, "epoch": 4702} {"train_loss": -7.126738548278809, "global_step": 197516, "epoch": 4702} {"train_loss": -7.231236457824707, "global_step": 197517, "epoch": 4702} {"train_loss": -7.25626277923584, "global_step": 197518, "epoch": 4702} {"train_loss": -7.066824913024902, "global_step": 197519, "epoch": 4702} {"train_loss": -7.296598434448242, "global_step": 197520, "epoch": 4702} {"train_loss": -7.106738090515137, "global_step": 197521, "epoch": 4702} {"train_loss": -7.2741007804870605, "global_step": 197522, "epoch": 4702} {"train_loss": -7.181363105773926, "global_step": 197523, "epoch": 4702} {"train_loss": -7.220057487487793, "global_step": 197524, "epoch": 4702} {"train_loss": -7.216530243555705, "global_step": 197525, "epoch": 4702, "val_loss": 81631.59375} {"train_loss": -7.245107173919678, "global_step": 197526, "epoch": 4703} {"train_loss": -7.270622253417969, "global_step": 197527, "epoch": 4703} {"train_loss": -7.259213447570801, "global_step": 197528, "epoch": 4703} {"train_loss": -7.144750595092773, "global_step": 197529, "epoch": 4703} {"train_loss": -7.160336494445801, "global_step": 197530, "epoch": 4703} {"train_loss": -7.206563949584961, "global_step": 197531, "epoch": 4703} {"train_loss": -7.25811767578125, "global_step": 197532, "epoch": 4703} {"train_loss": -7.331863880157471, "global_step": 197533, "epoch": 4703} {"train_loss": -7.199837684631348, "global_step": 197534, "epoch": 4703} {"train_loss": -7.197079658508301, "global_step": 197535, "epoch": 4703} {"train_loss": -7.25521993637085, "global_step": 197536, "epoch": 4703} {"train_loss": -7.225795745849609, "global_step": 197537, "epoch": 4703} {"train_loss": -7.279838562011719, "global_step": 197538, "epoch": 4703} {"train_loss": -7.3263773918151855, "global_step": 197539, "epoch": 4703} {"train_loss": -7.113178253173828, "global_step": 197540, "epoch": 4703} {"train_loss": -7.1946563720703125, "global_step": 197541, "epoch": 4703} {"train_loss": -7.11815071105957, "global_step": 197542, "epoch": 4703} {"train_loss": -7.363021373748779, "global_step": 197543, "epoch": 4703} {"train_loss": -7.25241231918335, "global_step": 197544, "epoch": 4703} {"train_loss": -7.2043256759643555, "global_step": 197545, "epoch": 4703} {"train_loss": -7.290399074554443, "global_step": 197546, "epoch": 4703} {"train_loss": -7.256802082061768, "global_step": 197547, "epoch": 4703} {"train_loss": -7.171440124511719, "global_step": 197548, "epoch": 4703} {"train_loss": -7.399878978729248, "global_step": 197549, "epoch": 4703} {"train_loss": -7.30042028427124, "global_step": 197550, "epoch": 4703} {"train_loss": -7.326087951660156, "global_step": 197551, "epoch": 4703} {"train_loss": -7.312891006469727, "global_step": 197552, "epoch": 4703} {"train_loss": -7.292978286743164, "global_step": 197553, "epoch": 4703} {"train_loss": -7.379767417907715, "global_step": 197554, "epoch": 4703} {"train_loss": -7.349672317504883, "global_step": 197555, "epoch": 4703} {"train_loss": -7.355273723602295, "global_step": 197556, "epoch": 4703} {"train_loss": -7.322845935821533, "global_step": 197557, "epoch": 4703} {"train_loss": -7.246821880340576, "global_step": 197558, "epoch": 4703} {"train_loss": -7.262054920196533, "global_step": 197559, "epoch": 4703} {"train_loss": -7.227819442749023, "global_step": 197560, "epoch": 4703} {"train_loss": -7.331180572509766, "global_step": 197561, "epoch": 4703} {"train_loss": -7.266092777252197, "global_step": 197562, "epoch": 4703} {"train_loss": -7.3387861251831055, "global_step": 197563, "epoch": 4703} {"train_loss": -7.330093860626221, "global_step": 197564, "epoch": 4703} {"train_loss": -7.300868511199951, "global_step": 197565, "epoch": 4703} {"train_loss": -7.408256530761719, "global_step": 197566, "epoch": 4703} {"train_loss": -7.269718045280094, "global_step": 197567, "epoch": 4703, "val_loss": 81430.3984375} {"train_loss": -7.347832679748535, "global_step": 197568, "epoch": 4704} {"train_loss": -7.333615303039551, "global_step": 197569, "epoch": 4704} {"train_loss": -7.389062881469727, "global_step": 197570, "epoch": 4704} {"train_loss": -7.346351146697998, "global_step": 197571, "epoch": 4704} {"train_loss": -7.329315662384033, "global_step": 197572, "epoch": 4704} {"train_loss": -7.37542724609375, "global_step": 197573, "epoch": 4704} {"train_loss": -7.248257160186768, "global_step": 197574, "epoch": 4704} {"train_loss": -7.481085777282715, "global_step": 197575, "epoch": 4704} {"train_loss": -7.2299604415893555, "global_step": 197576, "epoch": 4704} {"train_loss": -7.211058616638184, "global_step": 197577, "epoch": 4704} {"train_loss": -7.293939590454102, "global_step": 197578, "epoch": 4704} {"train_loss": -7.343480110168457, "global_step": 197579, "epoch": 4704} {"train_loss": -7.205061435699463, "global_step": 197580, "epoch": 4704} {"train_loss": -7.238012313842773, "global_step": 197581, "epoch": 4704} {"train_loss": -7.322049140930176, "global_step": 197582, "epoch": 4704} {"train_loss": -7.161251544952393, "global_step": 197583, "epoch": 4704} {"train_loss": -7.265595436096191, "global_step": 197584, "epoch": 4704} {"train_loss": -7.332803726196289, "global_step": 197585, "epoch": 4704} {"train_loss": -7.329933166503906, "global_step": 197586, "epoch": 4704} {"train_loss": -7.128440856933594, "global_step": 197587, "epoch": 4704} {"train_loss": -7.168710231781006, "global_step": 197588, "epoch": 4704} {"train_loss": -7.278382301330566, "global_step": 197589, "epoch": 4704} {"train_loss": -7.248990058898926, "global_step": 197590, "epoch": 4704} {"train_loss": -7.2011613845825195, "global_step": 197591, "epoch": 4704} {"train_loss": -7.262325286865234, "global_step": 197592, "epoch": 4704} {"train_loss": -7.234217166900635, "global_step": 197593, "epoch": 4704} {"train_loss": -7.233885765075684, "global_step": 197594, "epoch": 4704} {"train_loss": -7.308194637298584, "global_step": 197595, "epoch": 4704} {"train_loss": -7.105240821838379, "global_step": 197596, "epoch": 4704} {"train_loss": -7.213336944580078, "global_step": 197597, "epoch": 4704} {"train_loss": -7.219013214111328, "global_step": 197598, "epoch": 4704} {"train_loss": -7.2119855880737305, "global_step": 197599, "epoch": 4704} {"train_loss": -7.2601165771484375, "global_step": 197600, "epoch": 4704} {"train_loss": -7.275041580200195, "global_step": 197601, "epoch": 4704} {"train_loss": -7.16978645324707, "global_step": 197602, "epoch": 4704} {"train_loss": -7.297298431396484, "global_step": 197603, "epoch": 4704} {"train_loss": -7.331937789916992, "global_step": 197604, "epoch": 4704} {"train_loss": -7.2355546951293945, "global_step": 197605, "epoch": 4704} {"train_loss": -7.285368919372559, "global_step": 197606, "epoch": 4704} {"train_loss": -7.207134246826172, "global_step": 197607, "epoch": 4704} {"train_loss": -7.1929612159729, "global_step": 197608, "epoch": 4704} {"train_loss": -7.266409715016683, "global_step": 197609, "epoch": 4704, "val_loss": 81248.2265625} {"train_loss": -7.274676322937012, "global_step": 197610, "epoch": 4705} {"train_loss": -7.322605609893799, "global_step": 197611, "epoch": 4705} {"train_loss": -7.274179458618164, "global_step": 197612, "epoch": 4705} {"train_loss": -7.3228888511657715, "global_step": 197613, "epoch": 4705} {"train_loss": -7.212604522705078, "global_step": 197614, "epoch": 4705} {"train_loss": -7.277070045471191, "global_step": 197615, "epoch": 4705} {"train_loss": -7.375296592712402, "global_step": 197616, "epoch": 4705} {"train_loss": -7.359574317932129, "global_step": 197617, "epoch": 4705} {"train_loss": -7.3150224685668945, "global_step": 197618, "epoch": 4705} {"train_loss": -7.289875030517578, "global_step": 197619, "epoch": 4705} {"train_loss": -7.267807960510254, "global_step": 197620, "epoch": 4705} {"train_loss": -7.286760330200195, "global_step": 197621, "epoch": 4705} {"train_loss": -7.358945369720459, "global_step": 197622, "epoch": 4705} {"train_loss": -7.39684534072876, "global_step": 197623, "epoch": 4705} {"train_loss": -7.297898292541504, "global_step": 197624, "epoch": 4705} {"train_loss": -7.214452266693115, "global_step": 197625, "epoch": 4705} {"train_loss": -7.372110843658447, "global_step": 197626, "epoch": 4705} {"train_loss": -7.355759620666504, "global_step": 197627, "epoch": 4705} {"train_loss": -7.314357757568359, "global_step": 197628, "epoch": 4705} {"train_loss": -7.3087921142578125, "global_step": 197629, "epoch": 4705} {"train_loss": -7.259688377380371, "global_step": 197630, "epoch": 4705} {"train_loss": -7.174984455108643, "global_step": 197631, "epoch": 4705} {"train_loss": -7.344684600830078, "global_step": 197632, "epoch": 4705} {"train_loss": -7.18178653717041, "global_step": 197633, "epoch": 4705} {"train_loss": -7.2239670753479, "global_step": 197634, "epoch": 4705} {"train_loss": -7.368196487426758, "global_step": 197635, "epoch": 4705} {"train_loss": -7.250949382781982, "global_step": 197636, "epoch": 4705} {"train_loss": -7.237729072570801, "global_step": 197637, "epoch": 4705} {"train_loss": -7.276098251342773, "global_step": 197638, "epoch": 4705} {"train_loss": -7.277365684509277, "global_step": 197639, "epoch": 4705} {"train_loss": -7.378230571746826, "global_step": 197640, "epoch": 4705} {"train_loss": -7.2926177978515625, "global_step": 197641, "epoch": 4705} {"train_loss": -7.383790969848633, "global_step": 197642, "epoch": 4705} {"train_loss": -7.307302474975586, "global_step": 197643, "epoch": 4705} {"train_loss": -7.425539970397949, "global_step": 197644, "epoch": 4705} {"train_loss": -7.391839981079102, "global_step": 197645, "epoch": 4705} {"train_loss": -7.248252868652344, "global_step": 197646, "epoch": 4705} {"train_loss": -7.410523414611816, "global_step": 197647, "epoch": 4705} {"train_loss": -7.3041582107543945, "global_step": 197648, "epoch": 4705} {"train_loss": -7.261555194854736, "global_step": 197649, "epoch": 4705} {"train_loss": -7.342644691467285, "global_step": 197650, "epoch": 4705} {"train_loss": -7.305908986500332, "global_step": 197651, "epoch": 4705, "val_loss": 81376.953125} {"train_loss": -7.255056381225586, "global_step": 197652, "epoch": 4706} {"train_loss": -7.412703990936279, "global_step": 197653, "epoch": 4706} {"train_loss": -7.2763872146606445, "global_step": 197654, "epoch": 4706} {"train_loss": -7.174576282501221, "global_step": 197655, "epoch": 4706} {"train_loss": -7.161499500274658, "global_step": 197656, "epoch": 4706} {"train_loss": -7.226001739501953, "global_step": 197657, "epoch": 4706} {"train_loss": -7.14257287979126, "global_step": 197658, "epoch": 4706} {"train_loss": -7.299345016479492, "global_step": 197659, "epoch": 4706} {"train_loss": -7.352052688598633, "global_step": 197660, "epoch": 4706} {"train_loss": -7.23759126663208, "global_step": 197661, "epoch": 4706} {"train_loss": -7.216871738433838, "global_step": 197662, "epoch": 4706} {"train_loss": -7.26521110534668, "global_step": 197663, "epoch": 4706} {"train_loss": -7.277437210083008, "global_step": 197664, "epoch": 4706} {"train_loss": -7.280715465545654, "global_step": 197665, "epoch": 4706} {"train_loss": -7.349274635314941, "global_step": 197666, "epoch": 4706} {"train_loss": -7.247501373291016, "global_step": 197667, "epoch": 4706} {"train_loss": -7.186776161193848, "global_step": 197668, "epoch": 4706} {"train_loss": -7.222345352172852, "global_step": 197669, "epoch": 4706} {"train_loss": -7.358499526977539, "global_step": 197670, "epoch": 4706} {"train_loss": -7.214861869812012, "global_step": 197671, "epoch": 4706} {"train_loss": -7.2298431396484375, "global_step": 197672, "epoch": 4706} {"train_loss": -7.287806510925293, "global_step": 197673, "epoch": 4706} {"train_loss": -7.294060230255127, "global_step": 197674, "epoch": 4706} {"train_loss": -7.2403130531311035, "global_step": 197675, "epoch": 4706} {"train_loss": -7.295528411865234, "global_step": 197676, "epoch": 4706} {"train_loss": -7.273453235626221, "global_step": 197677, "epoch": 4706} {"train_loss": -7.200277328491211, "global_step": 197678, "epoch": 4706} {"train_loss": -7.257594108581543, "global_step": 197679, "epoch": 4706} {"train_loss": -7.309242248535156, "global_step": 197680, "epoch": 4706} {"train_loss": -7.191769123077393, "global_step": 197681, "epoch": 4706} {"train_loss": -7.3068742752075195, "global_step": 197682, "epoch": 4706} {"train_loss": -7.364498138427734, "global_step": 197683, "epoch": 4706} {"train_loss": -7.230809211730957, "global_step": 197684, "epoch": 4706} {"train_loss": -7.231986999511719, "global_step": 197685, "epoch": 4706} {"train_loss": -7.207094192504883, "global_step": 197686, "epoch": 4706} {"train_loss": -7.170469284057617, "global_step": 197687, "epoch": 4706} {"train_loss": -7.432961463928223, "global_step": 197688, "epoch": 4706} {"train_loss": -7.085982322692871, "global_step": 197689, "epoch": 4706} {"train_loss": -7.14411735534668, "global_step": 197690, "epoch": 4706} {"train_loss": -7.292353630065918, "global_step": 197691, "epoch": 4706} {"train_loss": -7.195483207702637, "global_step": 197692, "epoch": 4706} {"train_loss": -7.255487271717617, "global_step": 197693, "epoch": 4706, "val_loss": 81220.1328125} {"train_loss": -7.25272274017334, "global_step": 197694, "epoch": 4707} {"train_loss": -7.257631301879883, "global_step": 197695, "epoch": 4707} {"train_loss": -7.281961441040039, "global_step": 197696, "epoch": 4707} {"train_loss": -7.098296165466309, "global_step": 197697, "epoch": 4707} {"train_loss": -7.246599197387695, "global_step": 197698, "epoch": 4707} {"train_loss": -7.2043304443359375, "global_step": 197699, "epoch": 4707} {"train_loss": -7.199357032775879, "global_step": 197700, "epoch": 4707} {"train_loss": -7.323976516723633, "global_step": 197701, "epoch": 4707} {"train_loss": -7.182281494140625, "global_step": 197702, "epoch": 4707} {"train_loss": -7.212526798248291, "global_step": 197703, "epoch": 4707} {"train_loss": -7.232621192932129, "global_step": 197704, "epoch": 4707} {"train_loss": -7.28013801574707, "global_step": 197705, "epoch": 4707} {"train_loss": -7.333316802978516, "global_step": 197706, "epoch": 4707} {"train_loss": -7.227629661560059, "global_step": 197707, "epoch": 4707} {"train_loss": -7.134869575500488, "global_step": 197708, "epoch": 4707} {"train_loss": -7.251062393188477, "global_step": 197709, "epoch": 4707} {"train_loss": -7.271994590759277, "global_step": 197710, "epoch": 4707} {"train_loss": -7.350948333740234, "global_step": 197711, "epoch": 4707} {"train_loss": -7.318132400512695, "global_step": 197712, "epoch": 4707} {"train_loss": -7.230409622192383, "global_step": 197713, "epoch": 4707} {"train_loss": -7.207648277282715, "global_step": 197714, "epoch": 4707} {"train_loss": -7.29050350189209, "global_step": 197715, "epoch": 4707} {"train_loss": -7.220742225646973, "global_step": 197716, "epoch": 4707} {"train_loss": -7.124369144439697, "global_step": 197717, "epoch": 4707} {"train_loss": -7.234292030334473, "global_step": 197718, "epoch": 4707} {"train_loss": -7.21173095703125, "global_step": 197719, "epoch": 4707} {"train_loss": -7.103271007537842, "global_step": 197720, "epoch": 4707} {"train_loss": -7.387275695800781, "global_step": 197721, "epoch": 4707} {"train_loss": -7.190848350524902, "global_step": 197722, "epoch": 4707} {"train_loss": -7.216582775115967, "global_step": 197723, "epoch": 4707} {"train_loss": -7.29036283493042, "global_step": 197724, "epoch": 4707} {"train_loss": -7.241955280303955, "global_step": 197725, "epoch": 4707} {"train_loss": -7.386020660400391, "global_step": 197726, "epoch": 4707} {"train_loss": -7.234823226928711, "global_step": 197727, "epoch": 4707} {"train_loss": -7.347167491912842, "global_step": 197728, "epoch": 4707} {"train_loss": -7.110468864440918, "global_step": 197729, "epoch": 4707} {"train_loss": -7.300358772277832, "global_step": 197730, "epoch": 4707} {"train_loss": -7.36854362487793, "global_step": 197731, "epoch": 4707} {"train_loss": -7.35664176940918, "global_step": 197732, "epoch": 4707} {"train_loss": -7.27811336517334, "global_step": 197733, "epoch": 4707} {"train_loss": -7.344526290893555, "global_step": 197734, "epoch": 4707} {"train_loss": -7.2533352602095835, "global_step": 197735, "epoch": 4707, "val_loss": 81425.5078125} {"train_loss": -7.372280120849609, "global_step": 197736, "epoch": 4708} {"train_loss": -7.394770622253418, "global_step": 197737, "epoch": 4708} {"train_loss": -7.287461757659912, "global_step": 197738, "epoch": 4708} {"train_loss": -7.325384140014648, "global_step": 197739, "epoch": 4708} {"train_loss": -7.288851737976074, "global_step": 197740, "epoch": 4708} {"train_loss": -7.286141872406006, "global_step": 197741, "epoch": 4708} {"train_loss": -7.240816116333008, "global_step": 197742, "epoch": 4708} {"train_loss": -7.320878982543945, "global_step": 197743, "epoch": 4708} {"train_loss": -7.355975151062012, "global_step": 197744, "epoch": 4708} {"train_loss": -7.28743839263916, "global_step": 197745, "epoch": 4708} {"train_loss": -7.299839973449707, "global_step": 197746, "epoch": 4708} {"train_loss": -7.317614555358887, "global_step": 197747, "epoch": 4708} {"train_loss": -7.350980758666992, "global_step": 197748, "epoch": 4708} {"train_loss": -7.255245208740234, "global_step": 197749, "epoch": 4708} {"train_loss": -7.224178314208984, "global_step": 197750, "epoch": 4708} {"train_loss": -7.094087600708008, "global_step": 197751, "epoch": 4708} {"train_loss": -7.349338531494141, "global_step": 197752, "epoch": 4708} {"train_loss": -7.242753505706787, "global_step": 197753, "epoch": 4708} {"train_loss": -7.238798141479492, "global_step": 197754, "epoch": 4708} {"train_loss": -7.248004913330078, "global_step": 197755, "epoch": 4708} {"train_loss": -7.121552467346191, "global_step": 197756, "epoch": 4708} {"train_loss": -7.205834865570068, "global_step": 197757, "epoch": 4708} {"train_loss": -7.229024887084961, "global_step": 197758, "epoch": 4708} {"train_loss": -7.169476509094238, "global_step": 197759, "epoch": 4708} {"train_loss": -7.258985996246338, "global_step": 197760, "epoch": 4708} {"train_loss": -7.226865768432617, "global_step": 197761, "epoch": 4708} {"train_loss": -7.37091064453125, "global_step": 197762, "epoch": 4708} {"train_loss": -7.061547756195068, "global_step": 197763, "epoch": 4708} {"train_loss": -7.260433197021484, "global_step": 197764, "epoch": 4708} {"train_loss": -7.286781311035156, "global_step": 197765, "epoch": 4708} {"train_loss": -7.160218715667725, "global_step": 197766, "epoch": 4708} {"train_loss": -7.236070156097412, "global_step": 197767, "epoch": 4708} {"train_loss": -7.219095230102539, "global_step": 197768, "epoch": 4708} {"train_loss": -7.188938140869141, "global_step": 197769, "epoch": 4708} {"train_loss": -7.2527360916137695, "global_step": 197770, "epoch": 4708} {"train_loss": -7.15180778503418, "global_step": 197771, "epoch": 4708} {"train_loss": -7.232821464538574, "global_step": 197772, "epoch": 4708} {"train_loss": -7.316008567810059, "global_step": 197773, "epoch": 4708} {"train_loss": -7.3040547370910645, "global_step": 197774, "epoch": 4708} {"train_loss": -7.241105556488037, "global_step": 197775, "epoch": 4708} {"train_loss": -7.305386543273926, "global_step": 197776, "epoch": 4708} {"train_loss": -7.255080098197574, "global_step": 197777, "epoch": 4708, "val_loss": 81318.0} {"train_loss": -7.164156913757324, "global_step": 197778, "epoch": 4709} {"train_loss": -7.192792892456055, "global_step": 197779, "epoch": 4709} {"train_loss": -7.042446613311768, "global_step": 197780, "epoch": 4709} {"train_loss": -7.315147399902344, "global_step": 197781, "epoch": 4709} {"train_loss": -7.301504135131836, "global_step": 197782, "epoch": 4709} {"train_loss": -7.426836013793945, "global_step": 197783, "epoch": 4709} {"train_loss": -7.333164691925049, "global_step": 197784, "epoch": 4709} {"train_loss": -7.237723350524902, "global_step": 197785, "epoch": 4709} {"train_loss": -7.272034168243408, "global_step": 197786, "epoch": 4709} {"train_loss": -7.336173057556152, "global_step": 197787, "epoch": 4709} {"train_loss": -7.257284164428711, "global_step": 197788, "epoch": 4709} {"train_loss": -7.325339317321777, "global_step": 197789, "epoch": 4709} {"train_loss": -7.272796630859375, "global_step": 197790, "epoch": 4709} {"train_loss": -7.363192558288574, "global_step": 197791, "epoch": 4709} {"train_loss": -7.3497538566589355, "global_step": 197792, "epoch": 4709} {"train_loss": -7.275277137756348, "global_step": 197793, "epoch": 4709} {"train_loss": -7.250687599182129, "global_step": 197794, "epoch": 4709} {"train_loss": -7.361641883850098, "global_step": 197795, "epoch": 4709} {"train_loss": -7.320704460144043, "global_step": 197796, "epoch": 4709} {"train_loss": -7.311224937438965, "global_step": 197797, "epoch": 4709} {"train_loss": -7.225414276123047, "global_step": 197798, "epoch": 4709} {"train_loss": -7.40255069732666, "global_step": 197799, "epoch": 4709} {"train_loss": -7.355496406555176, "global_step": 197800, "epoch": 4709} {"train_loss": -7.279127597808838, "global_step": 197801, "epoch": 4709} {"train_loss": -7.3720831871032715, "global_step": 197802, "epoch": 4709} {"train_loss": -7.18442440032959, "global_step": 197803, "epoch": 4709} {"train_loss": -7.345673561096191, "global_step": 197804, "epoch": 4709} {"train_loss": -7.2597455978393555, "global_step": 197805, "epoch": 4709} {"train_loss": -7.299793243408203, "global_step": 197806, "epoch": 4709} {"train_loss": -7.328676223754883, "global_step": 197807, "epoch": 4709} {"train_loss": -7.24555778503418, "global_step": 197808, "epoch": 4709} {"train_loss": -7.286862373352051, "global_step": 197809, "epoch": 4709} {"train_loss": -7.352077484130859, "global_step": 197810, "epoch": 4709} {"train_loss": -7.3902812004089355, "global_step": 197811, "epoch": 4709} {"train_loss": -7.32694149017334, "global_step": 197812, "epoch": 4709} {"train_loss": -7.061098098754883, "global_step": 197813, "epoch": 4709} {"train_loss": -7.2643632888793945, "global_step": 197814, "epoch": 4709} {"train_loss": -7.186611652374268, "global_step": 197815, "epoch": 4709} {"train_loss": -7.274037837982178, "global_step": 197816, "epoch": 4709} {"train_loss": -7.2526774406433105, "global_step": 197817, "epoch": 4709} {"train_loss": -7.211973667144775, "global_step": 197818, "epoch": 4709} {"train_loss": -7.280551751454671, "global_step": 197819, "epoch": 4709, "val_loss": 81399.921875} {"train_loss": -7.174471855163574, "global_step": 197820, "epoch": 4710} {"train_loss": -7.3917741775512695, "global_step": 197821, "epoch": 4710} {"train_loss": -7.139825820922852, "global_step": 197822, "epoch": 4710} {"train_loss": -7.348648548126221, "global_step": 197823, "epoch": 4710} {"train_loss": -7.2430219650268555, "global_step": 197824, "epoch": 4710} {"train_loss": -7.16680383682251, "global_step": 197825, "epoch": 4710} {"train_loss": -7.288790702819824, "global_step": 197826, "epoch": 4710} {"train_loss": -7.234209060668945, "global_step": 197827, "epoch": 4710} {"train_loss": -7.266194820404053, "global_step": 197828, "epoch": 4710} {"train_loss": -7.238761901855469, "global_step": 197829, "epoch": 4710} {"train_loss": -7.324758529663086, "global_step": 197830, "epoch": 4710} {"train_loss": -7.20663595199585, "global_step": 197831, "epoch": 4710} {"train_loss": -7.245868682861328, "global_step": 197832, "epoch": 4710} {"train_loss": -7.191900253295898, "global_step": 197833, "epoch": 4710} {"train_loss": -7.248309135437012, "global_step": 197834, "epoch": 4710} {"train_loss": -7.215704917907715, "global_step": 197835, "epoch": 4710} {"train_loss": -7.337803363800049, "global_step": 197836, "epoch": 4710} {"train_loss": -7.233647346496582, "global_step": 197837, "epoch": 4710} {"train_loss": -7.342453479766846, "global_step": 197838, "epoch": 4710} {"train_loss": -7.351428031921387, "global_step": 197839, "epoch": 4710} {"train_loss": -7.321922779083252, "global_step": 197840, "epoch": 4710} {"train_loss": -7.346737861633301, "global_step": 197841, "epoch": 4710} {"train_loss": -7.296876907348633, "global_step": 197842, "epoch": 4710} {"train_loss": -7.290871620178223, "global_step": 197843, "epoch": 4710} {"train_loss": -7.450835227966309, "global_step": 197844, "epoch": 4710} {"train_loss": -7.228362083435059, "global_step": 197845, "epoch": 4710} {"train_loss": -7.285886764526367, "global_step": 197846, "epoch": 4710} {"train_loss": -7.268734455108643, "global_step": 197847, "epoch": 4710} {"train_loss": -7.3738932609558105, "global_step": 197848, "epoch": 4710} {"train_loss": -7.359243869781494, "global_step": 197849, "epoch": 4710} {"train_loss": -7.288972854614258, "global_step": 197850, "epoch": 4710} {"train_loss": -7.3243560791015625, "global_step": 197851, "epoch": 4710} {"train_loss": -7.32959508895874, "global_step": 197852, "epoch": 4710} {"train_loss": -7.204658508300781, "global_step": 197853, "epoch": 4710} {"train_loss": -7.292801856994629, "global_step": 197854, "epoch": 4710} {"train_loss": -7.3868818283081055, "global_step": 197855, "epoch": 4710} {"train_loss": -7.29371452331543, "global_step": 197856, "epoch": 4710} {"train_loss": -7.163477420806885, "global_step": 197857, "epoch": 4710} {"train_loss": -7.266170501708984, "global_step": 197858, "epoch": 4710} {"train_loss": -7.136133193969727, "global_step": 197859, "epoch": 4710} {"train_loss": -7.323667526245117, "global_step": 197860, "epoch": 4710} {"train_loss": -7.276649577277047, "global_step": 197861, "epoch": 4710, "val_loss": 81479.7109375} {"train_loss": -7.187490463256836, "global_step": 197862, "epoch": 4711} {"train_loss": -7.360536575317383, "global_step": 197863, "epoch": 4711} {"train_loss": -7.172380447387695, "global_step": 197864, "epoch": 4711} {"train_loss": -7.197719573974609, "global_step": 197865, "epoch": 4711} {"train_loss": -7.244133949279785, "global_step": 197866, "epoch": 4711} {"train_loss": -7.1454010009765625, "global_step": 197867, "epoch": 4711} {"train_loss": -7.310364723205566, "global_step": 197868, "epoch": 4711} {"train_loss": -7.166180610656738, "global_step": 197869, "epoch": 4711} {"train_loss": -7.269125938415527, "global_step": 197870, "epoch": 4711} {"train_loss": -7.181127071380615, "global_step": 197871, "epoch": 4711} {"train_loss": -7.207231521606445, "global_step": 197872, "epoch": 4711} {"train_loss": -7.1772074699401855, "global_step": 197873, "epoch": 4711} {"train_loss": -7.063492298126221, "global_step": 197874, "epoch": 4711} {"train_loss": -7.2183837890625, "global_step": 197875, "epoch": 4711} {"train_loss": -7.051057815551758, "global_step": 197876, "epoch": 4711} {"train_loss": -7.153067588806152, "global_step": 197877, "epoch": 4711} {"train_loss": -7.066187858581543, "global_step": 197878, "epoch": 4711} {"train_loss": -7.089992523193359, "global_step": 197879, "epoch": 4711} {"train_loss": -7.1060943603515625, "global_step": 197880, "epoch": 4711} {"train_loss": -7.162214279174805, "global_step": 197881, "epoch": 4711} {"train_loss": -7.108274459838867, "global_step": 197882, "epoch": 4711} {"train_loss": -7.100743293762207, "global_step": 197883, "epoch": 4711} {"train_loss": -7.114903926849365, "global_step": 197884, "epoch": 4711} {"train_loss": -7.221593856811523, "global_step": 197885, "epoch": 4711} {"train_loss": -7.168483734130859, "global_step": 197886, "epoch": 4711} {"train_loss": -7.150234699249268, "global_step": 197887, "epoch": 4711} {"train_loss": -7.135195732116699, "global_step": 197888, "epoch": 4711} {"train_loss": -7.315258979797363, "global_step": 197889, "epoch": 4711} {"train_loss": -7.1422200202941895, "global_step": 197890, "epoch": 4711} {"train_loss": -7.206910133361816, "global_step": 197891, "epoch": 4711} {"train_loss": -7.1477837562561035, "global_step": 197892, "epoch": 4711} {"train_loss": -7.264000415802002, "global_step": 197893, "epoch": 4711} {"train_loss": -7.223878383636475, "global_step": 197894, "epoch": 4711} {"train_loss": -7.216458797454834, "global_step": 197895, "epoch": 4711} {"train_loss": -7.217592239379883, "global_step": 197896, "epoch": 4711} {"train_loss": -7.359325408935547, "global_step": 197897, "epoch": 4711} {"train_loss": -7.070943355560303, "global_step": 197898, "epoch": 4711} {"train_loss": -7.365915298461914, "global_step": 197899, "epoch": 4711} {"train_loss": -7.095675468444824, "global_step": 197900, "epoch": 4711} {"train_loss": -7.236823081970215, "global_step": 197901, "epoch": 4711} {"train_loss": -7.047637462615967, "global_step": 197902, "epoch": 4711} {"train_loss": -7.185457411266508, "global_step": 197903, "epoch": 4711, "val_loss": 81528.4453125} {"train_loss": -7.114070892333984, "global_step": 197904, "epoch": 4712} {"train_loss": -7.179989814758301, "global_step": 197905, "epoch": 4712} {"train_loss": -7.067575454711914, "global_step": 197906, "epoch": 4712} {"train_loss": -7.236173629760742, "global_step": 197907, "epoch": 4712} {"train_loss": -7.141387939453125, "global_step": 197908, "epoch": 4712} {"train_loss": -7.194772720336914, "global_step": 197909, "epoch": 4712} {"train_loss": -7.2162017822265625, "global_step": 197910, "epoch": 4712} {"train_loss": -7.144371032714844, "global_step": 197911, "epoch": 4712} {"train_loss": -7.166259765625, "global_step": 197912, "epoch": 4712} {"train_loss": -7.1829142570495605, "global_step": 197913, "epoch": 4712} {"train_loss": -7.315549850463867, "global_step": 197914, "epoch": 4712} {"train_loss": -7.244504928588867, "global_step": 197915, "epoch": 4712} {"train_loss": -7.243614673614502, "global_step": 197916, "epoch": 4712} {"train_loss": -7.245824813842773, "global_step": 197917, "epoch": 4712} {"train_loss": -7.219587326049805, "global_step": 197918, "epoch": 4712} {"train_loss": -7.381017684936523, "global_step": 197919, "epoch": 4712} {"train_loss": -7.353979587554932, "global_step": 197920, "epoch": 4712} {"train_loss": -7.265694618225098, "global_step": 197921, "epoch": 4712} {"train_loss": -7.236441612243652, "global_step": 197922, "epoch": 4712} {"train_loss": -7.301950454711914, "global_step": 197923, "epoch": 4712} {"train_loss": -7.303157806396484, "global_step": 197924, "epoch": 4712} {"train_loss": -7.340578079223633, "global_step": 197925, "epoch": 4712} {"train_loss": -7.31458854675293, "global_step": 197926, "epoch": 4712} {"train_loss": -7.300955772399902, "global_step": 197927, "epoch": 4712} {"train_loss": -7.298415184020996, "global_step": 197928, "epoch": 4712} {"train_loss": -7.4037184715271, "global_step": 197929, "epoch": 4712} {"train_loss": -7.239137649536133, "global_step": 197930, "epoch": 4712} {"train_loss": -7.210766792297363, "global_step": 197931, "epoch": 4712} {"train_loss": -7.292978763580322, "global_step": 197932, "epoch": 4712} {"train_loss": -7.2476983070373535, "global_step": 197933, "epoch": 4712} {"train_loss": -7.395203590393066, "global_step": 197934, "epoch": 4712} {"train_loss": -7.2356367111206055, "global_step": 197935, "epoch": 4712} {"train_loss": -7.403908729553223, "global_step": 197936, "epoch": 4712} {"train_loss": -7.219670295715332, "global_step": 197937, "epoch": 4712} {"train_loss": -7.247847080230713, "global_step": 197938, "epoch": 4712} {"train_loss": -7.399245262145996, "global_step": 197939, "epoch": 4712} {"train_loss": -7.323212623596191, "global_step": 197940, "epoch": 4712} {"train_loss": -7.322220802307129, "global_step": 197941, "epoch": 4712} {"train_loss": -7.2757649421691895, "global_step": 197942, "epoch": 4712} {"train_loss": -7.242896556854248, "global_step": 197943, "epoch": 4712} {"train_loss": -7.358706951141357, "global_step": 197944, "epoch": 4712} {"train_loss": -7.2639105433509465, "global_step": 197945, "epoch": 4712, "val_loss": 81324.125} {"train_loss": -7.3337321281433105, "global_step": 197946, "epoch": 4713} {"train_loss": -7.152702331542969, "global_step": 197947, "epoch": 4713} {"train_loss": -7.298152446746826, "global_step": 197948, "epoch": 4713} {"train_loss": -7.2564778327941895, "global_step": 197949, "epoch": 4713} {"train_loss": -7.224796295166016, "global_step": 197950, "epoch": 4713} {"train_loss": -7.283803462982178, "global_step": 197951, "epoch": 4713} {"train_loss": -7.209893226623535, "global_step": 197952, "epoch": 4713} {"train_loss": -7.3346028327941895, "global_step": 197953, "epoch": 4713} {"train_loss": -7.270350456237793, "global_step": 197954, "epoch": 4713} {"train_loss": -7.313860893249512, "global_step": 197955, "epoch": 4713} {"train_loss": -7.342503547668457, "global_step": 197956, "epoch": 4713} {"train_loss": -7.245020866394043, "global_step": 197957, "epoch": 4713} {"train_loss": -7.129115104675293, "global_step": 197958, "epoch": 4713} {"train_loss": -7.266332149505615, "global_step": 197959, "epoch": 4713} {"train_loss": -7.359269142150879, "global_step": 197960, "epoch": 4713} {"train_loss": -7.326559066772461, "global_step": 197961, "epoch": 4713} {"train_loss": -7.138552665710449, "global_step": 197962, "epoch": 4713} {"train_loss": -7.271774768829346, "global_step": 197963, "epoch": 4713} {"train_loss": -7.219021797180176, "global_step": 197964, "epoch": 4713} {"train_loss": -7.216583728790283, "global_step": 197965, "epoch": 4713} {"train_loss": -7.181738376617432, "global_step": 197966, "epoch": 4713} {"train_loss": -7.199219703674316, "global_step": 197967, "epoch": 4713} {"train_loss": -7.234763145446777, "global_step": 197968, "epoch": 4713} {"train_loss": -7.105312347412109, "global_step": 197969, "epoch": 4713} {"train_loss": -7.361042022705078, "global_step": 197970, "epoch": 4713} {"train_loss": -7.159816741943359, "global_step": 197971, "epoch": 4713} {"train_loss": -7.283809185028076, "global_step": 197972, "epoch": 4713} {"train_loss": -7.278912544250488, "global_step": 197973, "epoch": 4713} {"train_loss": -7.325400352478027, "global_step": 197974, "epoch": 4713} {"train_loss": -7.292801856994629, "global_step": 197975, "epoch": 4713} {"train_loss": -7.328041076660156, "global_step": 197976, "epoch": 4713} {"train_loss": -7.29394006729126, "global_step": 197977, "epoch": 4713} {"train_loss": -7.186464309692383, "global_step": 197978, "epoch": 4713} {"train_loss": -7.2730302810668945, "global_step": 197979, "epoch": 4713} {"train_loss": -7.289977550506592, "global_step": 197980, "epoch": 4713} {"train_loss": -7.288786888122559, "global_step": 197981, "epoch": 4713} {"train_loss": -7.2069501876831055, "global_step": 197982, "epoch": 4713} {"train_loss": -7.364711761474609, "global_step": 197983, "epoch": 4713} {"train_loss": -7.157441139221191, "global_step": 197984, "epoch": 4713} {"train_loss": -7.306094169616699, "global_step": 197985, "epoch": 4713} {"train_loss": -7.236724853515625, "global_step": 197986, "epoch": 4713} {"train_loss": -7.254255907876151, "global_step": 197987, "epoch": 4713, "val_loss": 81343.359375} {"train_loss": -7.17427921295166, "global_step": 197988, "epoch": 4714} {"train_loss": -7.304747581481934, "global_step": 197989, "epoch": 4714} {"train_loss": -7.127912998199463, "global_step": 197990, "epoch": 4714} {"train_loss": -7.1876301765441895, "global_step": 197991, "epoch": 4714} {"train_loss": -7.316669464111328, "global_step": 197992, "epoch": 4714} {"train_loss": -7.336225509643555, "global_step": 197993, "epoch": 4714} {"train_loss": -7.202391624450684, "global_step": 197994, "epoch": 4714} {"train_loss": -7.213201999664307, "global_step": 197995, "epoch": 4714} {"train_loss": -7.242438316345215, "global_step": 197996, "epoch": 4714} {"train_loss": -7.286920547485352, "global_step": 197997, "epoch": 4714} {"train_loss": -7.307825088500977, "global_step": 197998, "epoch": 4714} {"train_loss": -7.271265029907227, "global_step": 197999, "epoch": 4714} {"train_loss": -7.223320960998535, "global_step": 198000, "epoch": 4714} {"train_loss": -7.206416130065918, "global_step": 198001, "epoch": 4714} {"train_loss": -7.463785648345947, "global_step": 198002, "epoch": 4714} {"train_loss": -7.3724260330200195, "global_step": 198003, "epoch": 4714} {"train_loss": -7.284517288208008, "global_step": 198004, "epoch": 4714} {"train_loss": -7.284727573394775, "global_step": 198005, "epoch": 4714} {"train_loss": -7.162153244018555, "global_step": 198006, "epoch": 4714} {"train_loss": -7.385893821716309, "global_step": 198007, "epoch": 4714} {"train_loss": -7.196595191955566, "global_step": 198008, "epoch": 4714} {"train_loss": -7.3222174644470215, "global_step": 198009, "epoch": 4714} {"train_loss": -7.338610649108887, "global_step": 198010, "epoch": 4714} {"train_loss": -7.225963592529297, "global_step": 198011, "epoch": 4714} {"train_loss": -7.305532455444336, "global_step": 198012, "epoch": 4714} {"train_loss": -7.293654441833496, "global_step": 198013, "epoch": 4714} {"train_loss": -7.292777061462402, "global_step": 198014, "epoch": 4714} {"train_loss": -7.2759833335876465, "global_step": 198015, "epoch": 4714} {"train_loss": -7.385623931884766, "global_step": 198016, "epoch": 4714} {"train_loss": -7.265358924865723, "global_step": 198017, "epoch": 4714} {"train_loss": -7.259620666503906, "global_step": 198018, "epoch": 4714} {"train_loss": -7.180219650268555, "global_step": 198019, "epoch": 4714} {"train_loss": -7.273960113525391, "global_step": 198020, "epoch": 4714} {"train_loss": -7.328438758850098, "global_step": 198021, "epoch": 4714} {"train_loss": -7.232611656188965, "global_step": 198022, "epoch": 4714} {"train_loss": -6.949245452880859, "global_step": 198023, "epoch": 4714} {"train_loss": -7.038969039916992, "global_step": 198024, "epoch": 4714} {"train_loss": -7.180605888366699, "global_step": 198025, "epoch": 4714} {"train_loss": -7.207793235778809, "global_step": 198026, "epoch": 4714} {"train_loss": -7.070594787597656, "global_step": 198027, "epoch": 4714} {"train_loss": -7.339698791503906, "global_step": 198028, "epoch": 4714} {"train_loss": -7.252917766571045, "global_step": 198029, "epoch": 4714, "val_loss": 81507.9375} {"train_loss": -7.261336326599121, "global_step": 198030, "epoch": 4715} {"train_loss": -7.21649169921875, "global_step": 198031, "epoch": 4715} {"train_loss": -7.17331075668335, "global_step": 198032, "epoch": 4715} {"train_loss": -7.254752159118652, "global_step": 198033, "epoch": 4715} {"train_loss": -7.294157028198242, "global_step": 198034, "epoch": 4715} {"train_loss": -7.21980619430542, "global_step": 198035, "epoch": 4715} {"train_loss": -7.253796577453613, "global_step": 198036, "epoch": 4715} {"train_loss": -7.161397457122803, "global_step": 198037, "epoch": 4715} {"train_loss": -7.221310615539551, "global_step": 198038, "epoch": 4715} {"train_loss": -7.256021499633789, "global_step": 198039, "epoch": 4715} {"train_loss": -7.259800910949707, "global_step": 198040, "epoch": 4715} {"train_loss": -7.179270267486572, "global_step": 198041, "epoch": 4715} {"train_loss": -7.308193683624268, "global_step": 198042, "epoch": 4715} {"train_loss": -7.282596111297607, "global_step": 198043, "epoch": 4715} {"train_loss": -7.324202537536621, "global_step": 198044, "epoch": 4715} {"train_loss": -7.239335060119629, "global_step": 198045, "epoch": 4715} {"train_loss": -7.2448649406433105, "global_step": 198046, "epoch": 4715} {"train_loss": -7.2027130126953125, "global_step": 198047, "epoch": 4715} {"train_loss": -7.299635887145996, "global_step": 198048, "epoch": 4715} {"train_loss": -7.326840877532959, "global_step": 198049, "epoch": 4715} {"train_loss": -7.186532020568848, "global_step": 198050, "epoch": 4715} {"train_loss": -7.196502685546875, "global_step": 198051, "epoch": 4715} {"train_loss": -7.292417049407959, "global_step": 198052, "epoch": 4715} {"train_loss": -7.160035610198975, "global_step": 198053, "epoch": 4715} {"train_loss": -7.455698013305664, "global_step": 198054, "epoch": 4715} {"train_loss": -7.1973066329956055, "global_step": 198055, "epoch": 4715} {"train_loss": -7.259138584136963, "global_step": 198056, "epoch": 4715} {"train_loss": -7.323931694030762, "global_step": 198057, "epoch": 4715} {"train_loss": -7.335445404052734, "global_step": 198058, "epoch": 4715} {"train_loss": -7.280008792877197, "global_step": 198059, "epoch": 4715} {"train_loss": -7.3142991065979, "global_step": 198060, "epoch": 4715} {"train_loss": -7.297499656677246, "global_step": 198061, "epoch": 4715} {"train_loss": -7.336773872375488, "global_step": 198062, "epoch": 4715} {"train_loss": -7.239497184753418, "global_step": 198063, "epoch": 4715} {"train_loss": -7.249241352081299, "global_step": 198064, "epoch": 4715} {"train_loss": -7.303893089294434, "global_step": 198065, "epoch": 4715} {"train_loss": -7.072774887084961, "global_step": 198066, "epoch": 4715} {"train_loss": -7.2461771965026855, "global_step": 198067, "epoch": 4715} {"train_loss": -7.284160614013672, "global_step": 198068, "epoch": 4715} {"train_loss": -7.1175150871276855, "global_step": 198069, "epoch": 4715} {"train_loss": -7.260921478271484, "global_step": 198070, "epoch": 4715} {"train_loss": -7.252707015900385, "global_step": 198071, "epoch": 4715, "val_loss": 81229.984375} {"train_loss": -7.069051742553711, "global_step": 198072, "epoch": 4716} {"train_loss": -7.227880001068115, "global_step": 198073, "epoch": 4716} {"train_loss": -6.9815874099731445, "global_step": 198074, "epoch": 4716} {"train_loss": -7.3275604248046875, "global_step": 198075, "epoch": 4716} {"train_loss": -7.256747245788574, "global_step": 198076, "epoch": 4716} {"train_loss": -7.2008137702941895, "global_step": 198077, "epoch": 4716} {"train_loss": -7.296258926391602, "global_step": 198078, "epoch": 4716} {"train_loss": -7.147479057312012, "global_step": 198079, "epoch": 4716} {"train_loss": -7.226007461547852, "global_step": 198080, "epoch": 4716} {"train_loss": -7.1931233406066895, "global_step": 198081, "epoch": 4716} {"train_loss": -7.28297233581543, "global_step": 198082, "epoch": 4716} {"train_loss": -7.304945468902588, "global_step": 198083, "epoch": 4716} {"train_loss": -7.312216758728027, "global_step": 198084, "epoch": 4716} {"train_loss": -7.253934860229492, "global_step": 198085, "epoch": 4716} {"train_loss": -7.320802688598633, "global_step": 198086, "epoch": 4716} {"train_loss": -7.3291521072387695, "global_step": 198087, "epoch": 4716} {"train_loss": -7.35048770904541, "global_step": 198088, "epoch": 4716} {"train_loss": -7.22871208190918, "global_step": 198089, "epoch": 4716} {"train_loss": -7.231404781341553, "global_step": 198090, "epoch": 4716} {"train_loss": -7.377756118774414, "global_step": 198091, "epoch": 4716} {"train_loss": -7.291661262512207, "global_step": 198092, "epoch": 4716} {"train_loss": -7.266679763793945, "global_step": 198093, "epoch": 4716} {"train_loss": -7.219978332519531, "global_step": 198094, "epoch": 4716} {"train_loss": -7.269290924072266, "global_step": 198095, "epoch": 4716} {"train_loss": -7.227404594421387, "global_step": 198096, "epoch": 4716} {"train_loss": -7.267030715942383, "global_step": 198097, "epoch": 4716} {"train_loss": -7.231411933898926, "global_step": 198098, "epoch": 4716} {"train_loss": -7.262219429016113, "global_step": 198099, "epoch": 4716} {"train_loss": -7.377319812774658, "global_step": 198100, "epoch": 4716} {"train_loss": -7.324261665344238, "global_step": 198101, "epoch": 4716} {"train_loss": -7.290539741516113, "global_step": 198102, "epoch": 4716} {"train_loss": -7.239984512329102, "global_step": 198103, "epoch": 4716} {"train_loss": -7.074650764465332, "global_step": 198104, "epoch": 4716} {"train_loss": -7.306183815002441, "global_step": 198105, "epoch": 4716} {"train_loss": -7.148262977600098, "global_step": 198106, "epoch": 4716} {"train_loss": -7.250322341918945, "global_step": 198107, "epoch": 4716} {"train_loss": -7.166947841644287, "global_step": 198108, "epoch": 4716} {"train_loss": -7.18673038482666, "global_step": 198109, "epoch": 4716} {"train_loss": -7.184296607971191, "global_step": 198110, "epoch": 4716} {"train_loss": -7.2483696937561035, "global_step": 198111, "epoch": 4716} {"train_loss": -7.448309898376465, "global_step": 198112, "epoch": 4716} {"train_loss": -7.24851823988415, "global_step": 198113, "epoch": 4716, "val_loss": 81449.5078125} {"train_loss": -7.308753967285156, "global_step": 198114, "epoch": 4717} {"train_loss": -7.399705410003662, "global_step": 198115, "epoch": 4717} {"train_loss": -7.283952236175537, "global_step": 198116, "epoch": 4717} {"train_loss": -7.263080596923828, "global_step": 198117, "epoch": 4717} {"train_loss": -7.23614501953125, "global_step": 198118, "epoch": 4717} {"train_loss": -7.3068013191223145, "global_step": 198119, "epoch": 4717} {"train_loss": -7.2217698097229, "global_step": 198120, "epoch": 4717} {"train_loss": -7.244649887084961, "global_step": 198121, "epoch": 4717} {"train_loss": -7.274847030639648, "global_step": 198122, "epoch": 4717} {"train_loss": -7.194581508636475, "global_step": 198123, "epoch": 4717} {"train_loss": -7.114657402038574, "global_step": 198124, "epoch": 4717} {"train_loss": -7.169371604919434, "global_step": 198125, "epoch": 4717} {"train_loss": -7.301019668579102, "global_step": 198126, "epoch": 4717} {"train_loss": -7.166115760803223, "global_step": 198127, "epoch": 4717} {"train_loss": -7.149806976318359, "global_step": 198128, "epoch": 4717} {"train_loss": -7.272470474243164, "global_step": 198129, "epoch": 4717} {"train_loss": -7.24428653717041, "global_step": 198130, "epoch": 4717} {"train_loss": -7.211674213409424, "global_step": 198131, "epoch": 4717} {"train_loss": -6.995129585266113, "global_step": 198132, "epoch": 4717} {"train_loss": -7.178654670715332, "global_step": 198133, "epoch": 4717} {"train_loss": -7.233769416809082, "global_step": 198134, "epoch": 4717} {"train_loss": -7.2755022048950195, "global_step": 198135, "epoch": 4717} {"train_loss": -7.216413497924805, "global_step": 198136, "epoch": 4717} {"train_loss": -7.273151397705078, "global_step": 198137, "epoch": 4717} {"train_loss": -7.179256439208984, "global_step": 198138, "epoch": 4717} {"train_loss": -7.322905540466309, "global_step": 198139, "epoch": 4717} {"train_loss": -7.26469087600708, "global_step": 198140, "epoch": 4717} {"train_loss": -7.321305274963379, "global_step": 198141, "epoch": 4717} {"train_loss": -7.362900733947754, "global_step": 198142, "epoch": 4717} {"train_loss": -7.337436676025391, "global_step": 198143, "epoch": 4717} {"train_loss": -7.28068208694458, "global_step": 198144, "epoch": 4717} {"train_loss": -7.236793041229248, "global_step": 198145, "epoch": 4717} {"train_loss": -7.3129730224609375, "global_step": 198146, "epoch": 4717} {"train_loss": -7.264003276824951, "global_step": 198147, "epoch": 4717} {"train_loss": -7.296655654907227, "global_step": 198148, "epoch": 4717} {"train_loss": -7.341283798217773, "global_step": 198149, "epoch": 4717} {"train_loss": -7.23916482925415, "global_step": 198150, "epoch": 4717} {"train_loss": -7.2397260665893555, "global_step": 198151, "epoch": 4717} {"train_loss": -7.352910995483398, "global_step": 198152, "epoch": 4717} {"train_loss": -7.293551921844482, "global_step": 198153, "epoch": 4717} {"train_loss": -7.463654518127441, "global_step": 198154, "epoch": 4717} {"train_loss": -7.261710348583403, "global_step": 198155, "epoch": 4717, "val_loss": 81366.890625} {"train_loss": -7.387919902801514, "global_step": 198156, "epoch": 4718} {"train_loss": -7.416901588439941, "global_step": 198157, "epoch": 4718} {"train_loss": -7.34126615524292, "global_step": 198158, "epoch": 4718} {"train_loss": -7.39504337310791, "global_step": 198159, "epoch": 4718} {"train_loss": -7.3931379318237305, "global_step": 198160, "epoch": 4718} {"train_loss": -7.425128936767578, "global_step": 198161, "epoch": 4718} {"train_loss": -7.362275123596191, "global_step": 198162, "epoch": 4718} {"train_loss": -7.266567707061768, "global_step": 198163, "epoch": 4718} {"train_loss": -7.302392482757568, "global_step": 198164, "epoch": 4718} {"train_loss": -7.362250328063965, "global_step": 198165, "epoch": 4718} {"train_loss": -7.360063552856445, "global_step": 198166, "epoch": 4718} {"train_loss": -7.364912509918213, "global_step": 198167, "epoch": 4718} {"train_loss": -7.325690746307373, "global_step": 198168, "epoch": 4718} {"train_loss": -7.299805641174316, "global_step": 198169, "epoch": 4718} {"train_loss": -7.347858428955078, "global_step": 198170, "epoch": 4718} {"train_loss": -7.2535014152526855, "global_step": 198171, "epoch": 4718} {"train_loss": -7.2464599609375, "global_step": 198172, "epoch": 4718} {"train_loss": -7.3295183181762695, "global_step": 198173, "epoch": 4718} {"train_loss": -7.250215530395508, "global_step": 198174, "epoch": 4718} {"train_loss": -7.251433372497559, "global_step": 198175, "epoch": 4718} {"train_loss": -7.238312244415283, "global_step": 198176, "epoch": 4718} {"train_loss": -7.117403030395508, "global_step": 198177, "epoch": 4718} {"train_loss": -7.189645767211914, "global_step": 198178, "epoch": 4718} {"train_loss": -7.316851615905762, "global_step": 198179, "epoch": 4718} {"train_loss": -7.131698131561279, "global_step": 198180, "epoch": 4718} {"train_loss": -7.235475063323975, "global_step": 198181, "epoch": 4718} {"train_loss": -7.323488712310791, "global_step": 198182, "epoch": 4718} {"train_loss": -7.170445919036865, "global_step": 198183, "epoch": 4718} {"train_loss": -7.305426120758057, "global_step": 198184, "epoch": 4718} {"train_loss": -7.29217529296875, "global_step": 198185, "epoch": 4718} {"train_loss": -7.241523742675781, "global_step": 198186, "epoch": 4718} {"train_loss": -7.27619743347168, "global_step": 198187, "epoch": 4718} {"train_loss": -7.215665817260742, "global_step": 198188, "epoch": 4718} {"train_loss": -7.189570426940918, "global_step": 198189, "epoch": 4718} {"train_loss": -7.242074966430664, "global_step": 198190, "epoch": 4718} {"train_loss": -7.121359825134277, "global_step": 198191, "epoch": 4718} {"train_loss": -7.261897087097168, "global_step": 198192, "epoch": 4718} {"train_loss": -7.293751239776611, "global_step": 198193, "epoch": 4718} {"train_loss": -7.195484638214111, "global_step": 198194, "epoch": 4718} {"train_loss": -7.354397773742676, "global_step": 198195, "epoch": 4718} {"train_loss": -7.299261093139648, "global_step": 198196, "epoch": 4718} {"train_loss": -7.284882295699346, "global_step": 198197, "epoch": 4718, "val_loss": 81362.5859375} {"train_loss": -7.205646514892578, "global_step": 198198, "epoch": 4719} {"train_loss": -7.300538063049316, "global_step": 198199, "epoch": 4719} {"train_loss": -7.242478847503662, "global_step": 198200, "epoch": 4719} {"train_loss": -7.2877726554870605, "global_step": 198201, "epoch": 4719} {"train_loss": -7.284999847412109, "global_step": 198202, "epoch": 4719} {"train_loss": -7.301453590393066, "global_step": 198203, "epoch": 4719} {"train_loss": -7.3530097007751465, "global_step": 198204, "epoch": 4719} {"train_loss": -7.2034759521484375, "global_step": 198205, "epoch": 4719} {"train_loss": -7.321065902709961, "global_step": 198206, "epoch": 4719} {"train_loss": -7.19076681137085, "global_step": 198207, "epoch": 4719} {"train_loss": -7.228600025177002, "global_step": 198208, "epoch": 4719} {"train_loss": -7.249599933624268, "global_step": 198209, "epoch": 4719} {"train_loss": -7.142366409301758, "global_step": 198210, "epoch": 4719} {"train_loss": -7.247427940368652, "global_step": 198211, "epoch": 4719} {"train_loss": -7.208956241607666, "global_step": 198212, "epoch": 4719} {"train_loss": -7.145364284515381, "global_step": 198213, "epoch": 4719} {"train_loss": -7.237945079803467, "global_step": 198214, "epoch": 4719} {"train_loss": -7.31682014465332, "global_step": 198215, "epoch": 4719} {"train_loss": -7.269106388092041, "global_step": 198216, "epoch": 4719} {"train_loss": -7.274875640869141, "global_step": 198217, "epoch": 4719} {"train_loss": -7.394218921661377, "global_step": 198218, "epoch": 4719} {"train_loss": -7.326475143432617, "global_step": 198219, "epoch": 4719} {"train_loss": -7.263940811157227, "global_step": 198220, "epoch": 4719} {"train_loss": -7.356518268585205, "global_step": 198221, "epoch": 4719} {"train_loss": -7.171098709106445, "global_step": 198222, "epoch": 4719} {"train_loss": -7.364164352416992, "global_step": 198223, "epoch": 4719} {"train_loss": -7.379181385040283, "global_step": 198224, "epoch": 4719} {"train_loss": -7.204197883605957, "global_step": 198225, "epoch": 4719} {"train_loss": -7.2683610916137695, "global_step": 198226, "epoch": 4719} {"train_loss": -7.248547077178955, "global_step": 198227, "epoch": 4719} {"train_loss": -7.084912300109863, "global_step": 198228, "epoch": 4719} {"train_loss": -7.245120048522949, "global_step": 198229, "epoch": 4719} {"train_loss": -7.317791938781738, "global_step": 198230, "epoch": 4719} {"train_loss": -7.3041887283325195, "global_step": 198231, "epoch": 4719} {"train_loss": -7.182790756225586, "global_step": 198232, "epoch": 4719} {"train_loss": -7.155247211456299, "global_step": 198233, "epoch": 4719} {"train_loss": -7.188600063323975, "global_step": 198234, "epoch": 4719} {"train_loss": -7.41294527053833, "global_step": 198235, "epoch": 4719} {"train_loss": -7.074295520782471, "global_step": 198236, "epoch": 4719} {"train_loss": -7.2306342124938965, "global_step": 198237, "epoch": 4719} {"train_loss": -7.2441606521606445, "global_step": 198238, "epoch": 4719} {"train_loss": -7.252557663690476, "global_step": 198239, "epoch": 4719, "val_loss": 81408.3203125} {"train_loss": -7.268239498138428, "global_step": 198240, "epoch": 4720} {"train_loss": -7.0910491943359375, "global_step": 198241, "epoch": 4720} {"train_loss": -7.232832908630371, "global_step": 198242, "epoch": 4720} {"train_loss": -7.251922607421875, "global_step": 198243, "epoch": 4720} {"train_loss": -7.265280246734619, "global_step": 198244, "epoch": 4720} {"train_loss": -7.277234077453613, "global_step": 198245, "epoch": 4720} {"train_loss": -7.2428388595581055, "global_step": 198246, "epoch": 4720} {"train_loss": -7.25228214263916, "global_step": 198247, "epoch": 4720} {"train_loss": -7.3135762214660645, "global_step": 198248, "epoch": 4720} {"train_loss": -7.236536026000977, "global_step": 198249, "epoch": 4720} {"train_loss": -7.260868072509766, "global_step": 198250, "epoch": 4720} {"train_loss": -7.268430233001709, "global_step": 198251, "epoch": 4720} {"train_loss": -7.207533836364746, "global_step": 198252, "epoch": 4720} {"train_loss": -7.237267971038818, "global_step": 198253, "epoch": 4720} {"train_loss": -7.224781036376953, "global_step": 198254, "epoch": 4720} {"train_loss": -7.138226509094238, "global_step": 198255, "epoch": 4720} {"train_loss": -7.2078704833984375, "global_step": 198256, "epoch": 4720} {"train_loss": -7.33317232131958, "global_step": 198257, "epoch": 4720} {"train_loss": -7.251741409301758, "global_step": 198258, "epoch": 4720} {"train_loss": -7.2159576416015625, "global_step": 198259, "epoch": 4720} {"train_loss": -7.261144161224365, "global_step": 198260, "epoch": 4720} {"train_loss": -7.268698692321777, "global_step": 198261, "epoch": 4720} {"train_loss": -7.129429340362549, "global_step": 198262, "epoch": 4720} {"train_loss": -7.018518447875977, "global_step": 198263, "epoch": 4720} {"train_loss": -7.21281623840332, "global_step": 198264, "epoch": 4720} {"train_loss": -7.176286697387695, "global_step": 198265, "epoch": 4720} {"train_loss": -7.206419944763184, "global_step": 198266, "epoch": 4720} {"train_loss": -7.317844390869141, "global_step": 198267, "epoch": 4720} {"train_loss": -7.19144344329834, "global_step": 198268, "epoch": 4720} {"train_loss": -7.202224254608154, "global_step": 198269, "epoch": 4720} {"train_loss": -7.294736862182617, "global_step": 198270, "epoch": 4720} {"train_loss": -7.247730731964111, "global_step": 198271, "epoch": 4720} {"train_loss": -7.1730852127075195, "global_step": 198272, "epoch": 4720} {"train_loss": -7.3131422996521, "global_step": 198273, "epoch": 4720} {"train_loss": -7.299352645874023, "global_step": 198274, "epoch": 4720} {"train_loss": -7.297732830047607, "global_step": 198275, "epoch": 4720} {"train_loss": -7.274267196655273, "global_step": 198276, "epoch": 4720} {"train_loss": -7.354186058044434, "global_step": 198277, "epoch": 4720} {"train_loss": -7.349214553833008, "global_step": 198278, "epoch": 4720} {"train_loss": -7.211404800415039, "global_step": 198279, "epoch": 4720} {"train_loss": -7.191506385803223, "global_step": 198280, "epoch": 4720} {"train_loss": -7.239970434279669, "global_step": 198281, "epoch": 4720, "val_loss": 81258.5859375} {"train_loss": -7.2901811599731445, "global_step": 198282, "epoch": 4721} {"train_loss": -7.327150344848633, "global_step": 198283, "epoch": 4721} {"train_loss": -7.34208345413208, "global_step": 198284, "epoch": 4721} {"train_loss": -7.396819591522217, "global_step": 198285, "epoch": 4721} {"train_loss": -7.211633205413818, "global_step": 198286, "epoch": 4721} {"train_loss": -7.2656965255737305, "global_step": 198287, "epoch": 4721} {"train_loss": -7.249930381774902, "global_step": 198288, "epoch": 4721} {"train_loss": -7.375004291534424, "global_step": 198289, "epoch": 4721} {"train_loss": -7.2357635498046875, "global_step": 198290, "epoch": 4721} {"train_loss": -7.318552017211914, "global_step": 198291, "epoch": 4721} {"train_loss": -7.331530570983887, "global_step": 198292, "epoch": 4721} {"train_loss": -7.301295280456543, "global_step": 198293, "epoch": 4721} {"train_loss": -7.36746883392334, "global_step": 198294, "epoch": 4721} {"train_loss": -7.2536492347717285, "global_step": 198295, "epoch": 4721} {"train_loss": -7.293450355529785, "global_step": 198296, "epoch": 4721} {"train_loss": -7.351670265197754, "global_step": 198297, "epoch": 4721} {"train_loss": -7.301503658294678, "global_step": 198298, "epoch": 4721} {"train_loss": -7.077981472015381, "global_step": 198299, "epoch": 4721} {"train_loss": -7.0779571533203125, "global_step": 198300, "epoch": 4721} {"train_loss": -7.290362358093262, "global_step": 198301, "epoch": 4721} {"train_loss": -7.21577787399292, "global_step": 198302, "epoch": 4721} {"train_loss": -7.097245216369629, "global_step": 198303, "epoch": 4721} {"train_loss": -7.274836540222168, "global_step": 198304, "epoch": 4721} {"train_loss": -7.126348972320557, "global_step": 198305, "epoch": 4721} {"train_loss": -7.192927837371826, "global_step": 198306, "epoch": 4721} {"train_loss": -7.391037940979004, "global_step": 198307, "epoch": 4721} {"train_loss": -7.242434501647949, "global_step": 198308, "epoch": 4721} {"train_loss": -7.20353889465332, "global_step": 198309, "epoch": 4721} {"train_loss": -7.18460750579834, "global_step": 198310, "epoch": 4721} {"train_loss": -7.117648601531982, "global_step": 198311, "epoch": 4721} {"train_loss": -7.212752342224121, "global_step": 198312, "epoch": 4721} {"train_loss": -7.207080841064453, "global_step": 198313, "epoch": 4721} {"train_loss": -7.1704487800598145, "global_step": 198314, "epoch": 4721} {"train_loss": -7.208264350891113, "global_step": 198315, "epoch": 4721} {"train_loss": -7.261675834655762, "global_step": 198316, "epoch": 4721} {"train_loss": -7.164859771728516, "global_step": 198317, "epoch": 4721} {"train_loss": -7.183925628662109, "global_step": 198318, "epoch": 4721} {"train_loss": -7.259234428405762, "global_step": 198319, "epoch": 4721} {"train_loss": -7.1678667068481445, "global_step": 198320, "epoch": 4721} {"train_loss": -7.315605163574219, "global_step": 198321, "epoch": 4721} {"train_loss": -7.256590843200684, "global_step": 198322, "epoch": 4721} {"train_loss": -7.244479326974778, "global_step": 198323, "epoch": 4721, "val_loss": 81261.40625} {"train_loss": -7.166416168212891, "global_step": 198324, "epoch": 4722} {"train_loss": -7.29953670501709, "global_step": 198325, "epoch": 4722} {"train_loss": -7.298508644104004, "global_step": 198326, "epoch": 4722} {"train_loss": -7.280172348022461, "global_step": 198327, "epoch": 4722} {"train_loss": -7.256647109985352, "global_step": 198328, "epoch": 4722} {"train_loss": -7.28325891494751, "global_step": 198329, "epoch": 4722} {"train_loss": -7.316679000854492, "global_step": 198330, "epoch": 4722} {"train_loss": -7.383291244506836, "global_step": 198331, "epoch": 4722} {"train_loss": -7.228372573852539, "global_step": 198332, "epoch": 4722} {"train_loss": -7.341569423675537, "global_step": 198333, "epoch": 4722} {"train_loss": -7.314451217651367, "global_step": 198334, "epoch": 4722} {"train_loss": -7.333364009857178, "global_step": 198335, "epoch": 4722} {"train_loss": -7.174813747406006, "global_step": 198336, "epoch": 4722} {"train_loss": -7.270852088928223, "global_step": 198337, "epoch": 4722} {"train_loss": -7.1810760498046875, "global_step": 198338, "epoch": 4722} {"train_loss": -7.2447357177734375, "global_step": 198339, "epoch": 4722} {"train_loss": -7.313381671905518, "global_step": 198340, "epoch": 4722} {"train_loss": -7.282217979431152, "global_step": 198341, "epoch": 4722} {"train_loss": -7.262214183807373, "global_step": 198342, "epoch": 4722} {"train_loss": -7.077388763427734, "global_step": 198343, "epoch": 4722} {"train_loss": -7.077691078186035, "global_step": 198344, "epoch": 4722} {"train_loss": -7.32272481918335, "global_step": 198345, "epoch": 4722} {"train_loss": -7.182886123657227, "global_step": 198346, "epoch": 4722} {"train_loss": -7.14077091217041, "global_step": 198347, "epoch": 4722} {"train_loss": -7.242887496948242, "global_step": 198348, "epoch": 4722} {"train_loss": -7.247100830078125, "global_step": 198349, "epoch": 4722} {"train_loss": -7.178438186645508, "global_step": 198350, "epoch": 4722} {"train_loss": -7.205266952514648, "global_step": 198351, "epoch": 4722} {"train_loss": -7.268184185028076, "global_step": 198352, "epoch": 4722} {"train_loss": -7.183756351470947, "global_step": 198353, "epoch": 4722} {"train_loss": -7.268884658813477, "global_step": 198354, "epoch": 4722} {"train_loss": -7.289414405822754, "global_step": 198355, "epoch": 4722} {"train_loss": -7.17080020904541, "global_step": 198356, "epoch": 4722} {"train_loss": -7.230401992797852, "global_step": 198357, "epoch": 4722} {"train_loss": -7.301288604736328, "global_step": 198358, "epoch": 4722} {"train_loss": -7.286346435546875, "global_step": 198359, "epoch": 4722} {"train_loss": -7.1964592933654785, "global_step": 198360, "epoch": 4722} {"train_loss": -7.237570762634277, "global_step": 198361, "epoch": 4722} {"train_loss": -7.141885757446289, "global_step": 198362, "epoch": 4722} {"train_loss": -7.283245086669922, "global_step": 198363, "epoch": 4722} {"train_loss": -7.235451698303223, "global_step": 198364, "epoch": 4722} {"train_loss": -7.245734453201294, "global_step": 198365, "epoch": 4722, "val_loss": 81395.0859375} {"train_loss": -7.2881622314453125, "global_step": 198366, "epoch": 4723} {"train_loss": -7.28635311126709, "global_step": 198367, "epoch": 4723} {"train_loss": -7.278618812561035, "global_step": 198368, "epoch": 4723} {"train_loss": -7.321819305419922, "global_step": 198369, "epoch": 4723} {"train_loss": -7.299201011657715, "global_step": 198370, "epoch": 4723} {"train_loss": -7.383845329284668, "global_step": 198371, "epoch": 4723} {"train_loss": -7.2756571769714355, "global_step": 198372, "epoch": 4723} {"train_loss": -7.267838954925537, "global_step": 198373, "epoch": 4723} {"train_loss": -7.390734672546387, "global_step": 198374, "epoch": 4723} {"train_loss": -7.29685640335083, "global_step": 198375, "epoch": 4723} {"train_loss": -7.369513988494873, "global_step": 198376, "epoch": 4723} {"train_loss": -7.289248466491699, "global_step": 198377, "epoch": 4723} {"train_loss": -7.298139572143555, "global_step": 198378, "epoch": 4723} {"train_loss": -7.324814796447754, "global_step": 198379, "epoch": 4723} {"train_loss": -7.292569160461426, "global_step": 198380, "epoch": 4723} {"train_loss": -7.396634578704834, "global_step": 198381, "epoch": 4723} {"train_loss": -7.3081817626953125, "global_step": 198382, "epoch": 4723} {"train_loss": -7.369335174560547, "global_step": 198383, "epoch": 4723} {"train_loss": -7.304620265960693, "global_step": 198384, "epoch": 4723} {"train_loss": -7.324156761169434, "global_step": 198385, "epoch": 4723} {"train_loss": -7.282780170440674, "global_step": 198386, "epoch": 4723} {"train_loss": -7.3566389083862305, "global_step": 198387, "epoch": 4723} {"train_loss": -7.285919189453125, "global_step": 198388, "epoch": 4723} {"train_loss": -7.358019828796387, "global_step": 198389, "epoch": 4723} {"train_loss": -7.258240222930908, "global_step": 198390, "epoch": 4723} {"train_loss": -7.235283374786377, "global_step": 198391, "epoch": 4723} {"train_loss": -7.34256649017334, "global_step": 198392, "epoch": 4723} {"train_loss": -7.306262016296387, "global_step": 198393, "epoch": 4723} {"train_loss": -7.255742073059082, "global_step": 198394, "epoch": 4723} {"train_loss": -7.233094692230225, "global_step": 198395, "epoch": 4723} {"train_loss": -7.200840950012207, "global_step": 198396, "epoch": 4723} {"train_loss": -7.215818881988525, "global_step": 198397, "epoch": 4723} {"train_loss": -7.29599666595459, "global_step": 198398, "epoch": 4723} {"train_loss": -7.346532821655273, "global_step": 198399, "epoch": 4723} {"train_loss": -7.2670440673828125, "global_step": 198400, "epoch": 4723} {"train_loss": -7.253994941711426, "global_step": 198401, "epoch": 4723} {"train_loss": -7.260292053222656, "global_step": 198402, "epoch": 4723} {"train_loss": -7.270256996154785, "global_step": 198403, "epoch": 4723} {"train_loss": -7.2613677978515625, "global_step": 198404, "epoch": 4723} {"train_loss": -7.151708126068115, "global_step": 198405, "epoch": 4723} {"train_loss": -7.180880069732666, "global_step": 198406, "epoch": 4723} {"train_loss": -7.2922129063379195, "global_step": 198407, "epoch": 4723, "val_loss": 81331.3359375} {"train_loss": -7.339713096618652, "global_step": 198408, "epoch": 4724} {"train_loss": -7.266854286193848, "global_step": 198409, "epoch": 4724} {"train_loss": -7.17385721206665, "global_step": 198410, "epoch": 4724} {"train_loss": -7.2543535232543945, "global_step": 198411, "epoch": 4724} {"train_loss": -7.143889427185059, "global_step": 198412, "epoch": 4724} {"train_loss": -7.268747329711914, "global_step": 198413, "epoch": 4724} {"train_loss": -7.329793930053711, "global_step": 198414, "epoch": 4724} {"train_loss": -7.198544025421143, "global_step": 198415, "epoch": 4724} {"train_loss": -7.193755149841309, "global_step": 198416, "epoch": 4724} {"train_loss": -7.224123477935791, "global_step": 198417, "epoch": 4724} {"train_loss": -7.217032432556152, "global_step": 198418, "epoch": 4724} {"train_loss": -7.229184150695801, "global_step": 198419, "epoch": 4724} {"train_loss": -7.235801696777344, "global_step": 198420, "epoch": 4724} {"train_loss": -7.262071132659912, "global_step": 198421, "epoch": 4724} {"train_loss": -7.302903175354004, "global_step": 198422, "epoch": 4724} {"train_loss": -7.346863746643066, "global_step": 198423, "epoch": 4724} {"train_loss": -7.301461219787598, "global_step": 198424, "epoch": 4724} {"train_loss": -7.315739631652832, "global_step": 198425, "epoch": 4724} {"train_loss": -7.2062883377075195, "global_step": 198426, "epoch": 4724} {"train_loss": -7.287083625793457, "global_step": 198427, "epoch": 4724} {"train_loss": -7.273226737976074, "global_step": 198428, "epoch": 4724} {"train_loss": -7.1579437255859375, "global_step": 198429, "epoch": 4724} {"train_loss": -7.187856674194336, "global_step": 198430, "epoch": 4724} {"train_loss": -7.2207489013671875, "global_step": 198431, "epoch": 4724} {"train_loss": -7.278473854064941, "global_step": 198432, "epoch": 4724} {"train_loss": -7.132748603820801, "global_step": 198433, "epoch": 4724} {"train_loss": -7.237878799438477, "global_step": 198434, "epoch": 4724} {"train_loss": -7.305692672729492, "global_step": 198435, "epoch": 4724} {"train_loss": -7.211798667907715, "global_step": 198436, "epoch": 4724} {"train_loss": -7.261267185211182, "global_step": 198437, "epoch": 4724} {"train_loss": -7.1538591384887695, "global_step": 198438, "epoch": 4724} {"train_loss": -7.379036903381348, "global_step": 198439, "epoch": 4724} {"train_loss": -7.35994815826416, "global_step": 198440, "epoch": 4724} {"train_loss": -7.301409721374512, "global_step": 198441, "epoch": 4724} {"train_loss": -7.2210893630981445, "global_step": 198442, "epoch": 4724} {"train_loss": -7.292782783508301, "global_step": 198443, "epoch": 4724} {"train_loss": -7.3182244300842285, "global_step": 198444, "epoch": 4724} {"train_loss": -7.337081432342529, "global_step": 198445, "epoch": 4724} {"train_loss": -7.295886516571045, "global_step": 198446, "epoch": 4724} {"train_loss": -7.254642009735107, "global_step": 198447, "epoch": 4724} {"train_loss": -7.312360763549805, "global_step": 198448, "epoch": 4724} {"train_loss": -7.2586252348763605, "global_step": 198449, "epoch": 4724, "val_loss": 81530.5} {"train_loss": -7.273004055023193, "global_step": 198450, "epoch": 4725} {"train_loss": -7.273427963256836, "global_step": 198451, "epoch": 4725} {"train_loss": -7.257051467895508, "global_step": 198452, "epoch": 4725} {"train_loss": -7.330709457397461, "global_step": 198453, "epoch": 4725} {"train_loss": -7.284772872924805, "global_step": 198454, "epoch": 4725} {"train_loss": -7.271865367889404, "global_step": 198455, "epoch": 4725} {"train_loss": -7.253174781799316, "global_step": 198456, "epoch": 4725} {"train_loss": -7.3767499923706055, "global_step": 198457, "epoch": 4725} {"train_loss": -7.159601211547852, "global_step": 198458, "epoch": 4725} {"train_loss": -7.163721084594727, "global_step": 198459, "epoch": 4725} {"train_loss": -7.1231184005737305, "global_step": 198460, "epoch": 4725} {"train_loss": -7.253784656524658, "global_step": 198461, "epoch": 4725} {"train_loss": -7.014364242553711, "global_step": 198462, "epoch": 4725} {"train_loss": -7.1066484451293945, "global_step": 198463, "epoch": 4725} {"train_loss": -7.210193634033203, "global_step": 198464, "epoch": 4725} {"train_loss": -6.938714027404785, "global_step": 198465, "epoch": 4725} {"train_loss": -7.251704216003418, "global_step": 198466, "epoch": 4725} {"train_loss": -7.098854064941406, "global_step": 198467, "epoch": 4725} {"train_loss": -6.993415832519531, "global_step": 198468, "epoch": 4725} {"train_loss": -7.2323150634765625, "global_step": 198469, "epoch": 4725} {"train_loss": -7.190206527709961, "global_step": 198470, "epoch": 4725} {"train_loss": -7.164321422576904, "global_step": 198471, "epoch": 4725} {"train_loss": -7.149479866027832, "global_step": 198472, "epoch": 4725} {"train_loss": -7.2744035720825195, "global_step": 198473, "epoch": 4725} {"train_loss": -7.177309989929199, "global_step": 198474, "epoch": 4725} {"train_loss": -7.126325607299805, "global_step": 198475, "epoch": 4725} {"train_loss": -7.302713394165039, "global_step": 198476, "epoch": 4725} {"train_loss": -7.204100608825684, "global_step": 198477, "epoch": 4725} {"train_loss": -7.2729315757751465, "global_step": 198478, "epoch": 4725} {"train_loss": -7.291260242462158, "global_step": 198479, "epoch": 4725} {"train_loss": -7.213064193725586, "global_step": 198480, "epoch": 4725} {"train_loss": -7.061222076416016, "global_step": 198481, "epoch": 4725} {"train_loss": -7.29979133605957, "global_step": 198482, "epoch": 4725} {"train_loss": -7.1781005859375, "global_step": 198483, "epoch": 4725} {"train_loss": -7.198104381561279, "global_step": 198484, "epoch": 4725} {"train_loss": -7.203142166137695, "global_step": 198485, "epoch": 4725} {"train_loss": -7.292778491973877, "global_step": 198486, "epoch": 4725} {"train_loss": -7.18452262878418, "global_step": 198487, "epoch": 4725} {"train_loss": -7.302166938781738, "global_step": 198488, "epoch": 4725} {"train_loss": -7.188253402709961, "global_step": 198489, "epoch": 4725} {"train_loss": -7.352071762084961, "global_step": 198490, "epoch": 4725} {"train_loss": -7.206127598172142, "global_step": 198491, "epoch": 4725, "val_loss": 81278.640625} {"train_loss": -7.290656089782715, "global_step": 198492, "epoch": 4726} {"train_loss": -7.284955024719238, "global_step": 198493, "epoch": 4726} {"train_loss": -7.296607971191406, "global_step": 198494, "epoch": 4726} {"train_loss": -7.311039447784424, "global_step": 198495, "epoch": 4726} {"train_loss": -7.256577968597412, "global_step": 198496, "epoch": 4726} {"train_loss": -7.339316368103027, "global_step": 198497, "epoch": 4726} {"train_loss": -7.2762956619262695, "global_step": 198498, "epoch": 4726} {"train_loss": -7.333656311035156, "global_step": 198499, "epoch": 4726} {"train_loss": -7.202478408813477, "global_step": 198500, "epoch": 4726} {"train_loss": -7.301664352416992, "global_step": 198501, "epoch": 4726} {"train_loss": -7.361532211303711, "global_step": 198502, "epoch": 4726} {"train_loss": -7.25956916809082, "global_step": 198503, "epoch": 4726} {"train_loss": -7.3751654624938965, "global_step": 198504, "epoch": 4726} {"train_loss": -7.430743217468262, "global_step": 198505, "epoch": 4726} {"train_loss": -7.290570259094238, "global_step": 198506, "epoch": 4726} {"train_loss": -7.280327796936035, "global_step": 198507, "epoch": 4726} {"train_loss": -7.323716163635254, "global_step": 198508, "epoch": 4726} {"train_loss": -7.300628662109375, "global_step": 198509, "epoch": 4726} {"train_loss": -7.323328018188477, "global_step": 198510, "epoch": 4726} {"train_loss": -7.367554187774658, "global_step": 198511, "epoch": 4726} {"train_loss": -7.362838268280029, "global_step": 198512, "epoch": 4726} {"train_loss": -7.282487869262695, "global_step": 198513, "epoch": 4726} {"train_loss": -7.2826738357543945, "global_step": 198514, "epoch": 4726} {"train_loss": -7.462116241455078, "global_step": 198515, "epoch": 4726} {"train_loss": -7.329392433166504, "global_step": 198516, "epoch": 4726} {"train_loss": -7.33668327331543, "global_step": 198517, "epoch": 4726} {"train_loss": -7.291337490081787, "global_step": 198518, "epoch": 4726} {"train_loss": -7.36623477935791, "global_step": 198519, "epoch": 4726} {"train_loss": -7.143851280212402, "global_step": 198520, "epoch": 4726} {"train_loss": -7.301999568939209, "global_step": 198521, "epoch": 4726} {"train_loss": -7.348278522491455, "global_step": 198522, "epoch": 4726} {"train_loss": -7.253076076507568, "global_step": 198523, "epoch": 4726} {"train_loss": -7.27957820892334, "global_step": 198524, "epoch": 4726} {"train_loss": -7.374080181121826, "global_step": 198525, "epoch": 4726} {"train_loss": -7.3449296951293945, "global_step": 198526, "epoch": 4726} {"train_loss": -7.382254600524902, "global_step": 198527, "epoch": 4726} {"train_loss": -7.341111183166504, "global_step": 198528, "epoch": 4726} {"train_loss": -7.235202789306641, "global_step": 198529, "epoch": 4726} {"train_loss": -7.32392692565918, "global_step": 198530, "epoch": 4726} {"train_loss": -7.367722511291504, "global_step": 198531, "epoch": 4726} {"train_loss": -7.329890251159668, "global_step": 198532, "epoch": 4726} {"train_loss": -7.314826885859172, "global_step": 198533, "epoch": 4726, "val_loss": 81426.640625} {"train_loss": -7.275962829589844, "global_step": 198534, "epoch": 4727} {"train_loss": -7.277898788452148, "global_step": 198535, "epoch": 4727} {"train_loss": -7.383296966552734, "global_step": 198536, "epoch": 4727} {"train_loss": -7.212188720703125, "global_step": 198537, "epoch": 4727} {"train_loss": -7.31258487701416, "global_step": 198538, "epoch": 4727} {"train_loss": -7.322046279907227, "global_step": 198539, "epoch": 4727} {"train_loss": -7.268481254577637, "global_step": 198540, "epoch": 4727} {"train_loss": -7.036129951477051, "global_step": 198541, "epoch": 4727} {"train_loss": -7.198224067687988, "global_step": 198542, "epoch": 4727} {"train_loss": -7.188449382781982, "global_step": 198543, "epoch": 4727} {"train_loss": -7.092532634735107, "global_step": 198544, "epoch": 4727} {"train_loss": -7.282236099243164, "global_step": 198545, "epoch": 4727} {"train_loss": -7.134768486022949, "global_step": 198546, "epoch": 4727} {"train_loss": -7.1742634773254395, "global_step": 198547, "epoch": 4727} {"train_loss": -7.2255778312683105, "global_step": 198548, "epoch": 4727} {"train_loss": -7.178650379180908, "global_step": 198549, "epoch": 4727} {"train_loss": -7.205300331115723, "global_step": 198550, "epoch": 4727} {"train_loss": -7.2667412757873535, "global_step": 198551, "epoch": 4727} {"train_loss": -7.187615394592285, "global_step": 198552, "epoch": 4727} {"train_loss": -7.3203535079956055, "global_step": 198553, "epoch": 4727} {"train_loss": -7.192968845367432, "global_step": 198554, "epoch": 4727} {"train_loss": -7.216696739196777, "global_step": 198555, "epoch": 4727} {"train_loss": -7.3052897453308105, "global_step": 198556, "epoch": 4727} {"train_loss": -7.295312881469727, "global_step": 198557, "epoch": 4727} {"train_loss": -7.417027473449707, "global_step": 198558, "epoch": 4727} {"train_loss": -7.276845932006836, "global_step": 198559, "epoch": 4727} {"train_loss": -7.275243759155273, "global_step": 198560, "epoch": 4727} {"train_loss": -7.330796241760254, "global_step": 198561, "epoch": 4727} {"train_loss": -7.250880718231201, "global_step": 198562, "epoch": 4727} {"train_loss": -7.256941318511963, "global_step": 198563, "epoch": 4727} {"train_loss": -7.321958541870117, "global_step": 198564, "epoch": 4727} {"train_loss": -7.326231956481934, "global_step": 198565, "epoch": 4727} {"train_loss": -7.117553234100342, "global_step": 198566, "epoch": 4727} {"train_loss": -7.209259510040283, "global_step": 198567, "epoch": 4727} {"train_loss": -7.30135440826416, "global_step": 198568, "epoch": 4727} {"train_loss": -7.146934509277344, "global_step": 198569, "epoch": 4727} {"train_loss": -7.266212463378906, "global_step": 198570, "epoch": 4727} {"train_loss": -7.205256938934326, "global_step": 198571, "epoch": 4727} {"train_loss": -7.242970943450928, "global_step": 198572, "epoch": 4727} {"train_loss": -7.153514862060547, "global_step": 198573, "epoch": 4727} {"train_loss": -7.137368202209473, "global_step": 198574, "epoch": 4727} {"train_loss": -7.24051554997762, "global_step": 198575, "epoch": 4727, "val_loss": 81414.6015625} {"train_loss": -7.17158317565918, "global_step": 198576, "epoch": 4728} {"train_loss": -7.220073223114014, "global_step": 198577, "epoch": 4728} {"train_loss": -7.225452423095703, "global_step": 198578, "epoch": 4728} {"train_loss": -7.197955131530762, "global_step": 198579, "epoch": 4728} {"train_loss": -7.242832660675049, "global_step": 198580, "epoch": 4728} {"train_loss": -7.219913482666016, "global_step": 198581, "epoch": 4728} {"train_loss": -7.204344749450684, "global_step": 198582, "epoch": 4728} {"train_loss": -7.281350135803223, "global_step": 198583, "epoch": 4728} {"train_loss": -7.211569786071777, "global_step": 198584, "epoch": 4728} {"train_loss": -7.3018293380737305, "global_step": 198585, "epoch": 4728} {"train_loss": -7.238948822021484, "global_step": 198586, "epoch": 4728} {"train_loss": -7.2426066398620605, "global_step": 198587, "epoch": 4728} {"train_loss": -7.273441791534424, "global_step": 198588, "epoch": 4728} {"train_loss": -7.1998443603515625, "global_step": 198589, "epoch": 4728} {"train_loss": -7.145683288574219, "global_step": 198590, "epoch": 4728} {"train_loss": -7.359498977661133, "global_step": 198591, "epoch": 4728} {"train_loss": -7.338356018066406, "global_step": 198592, "epoch": 4728} {"train_loss": -7.390201568603516, "global_step": 198593, "epoch": 4728} {"train_loss": -7.119178771972656, "global_step": 198594, "epoch": 4728} {"train_loss": -7.264796257019043, "global_step": 198595, "epoch": 4728} {"train_loss": -7.425029754638672, "global_step": 198596, "epoch": 4728} {"train_loss": -7.206108570098877, "global_step": 198597, "epoch": 4728} {"train_loss": -7.19675350189209, "global_step": 198598, "epoch": 4728} {"train_loss": -7.1736016273498535, "global_step": 198599, "epoch": 4728} {"train_loss": -7.270601272583008, "global_step": 198600, "epoch": 4728} {"train_loss": -7.332063674926758, "global_step": 198601, "epoch": 4728} {"train_loss": -7.252785682678223, "global_step": 198602, "epoch": 4728} {"train_loss": -7.382632732391357, "global_step": 198603, "epoch": 4728} {"train_loss": -7.207043647766113, "global_step": 198604, "epoch": 4728} {"train_loss": -7.326927185058594, "global_step": 198605, "epoch": 4728} {"train_loss": -7.33925199508667, "global_step": 198606, "epoch": 4728} {"train_loss": -7.370474338531494, "global_step": 198607, "epoch": 4728} {"train_loss": -7.33113431930542, "global_step": 198608, "epoch": 4728} {"train_loss": -7.291464328765869, "global_step": 198609, "epoch": 4728} {"train_loss": -7.2788920402526855, "global_step": 198610, "epoch": 4728} {"train_loss": -7.397531509399414, "global_step": 198611, "epoch": 4728} {"train_loss": -7.218954086303711, "global_step": 198612, "epoch": 4728} {"train_loss": -7.293963432312012, "global_step": 198613, "epoch": 4728} {"train_loss": -7.3570709228515625, "global_step": 198614, "epoch": 4728} {"train_loss": -7.331878662109375, "global_step": 198615, "epoch": 4728} {"train_loss": -7.326231002807617, "global_step": 198616, "epoch": 4728} {"train_loss": -7.27235373996553, "global_step": 198617, "epoch": 4728, "val_loss": 81402.4375} {"train_loss": -7.328939914703369, "global_step": 198618, "epoch": 4729} {"train_loss": -7.202045440673828, "global_step": 198619, "epoch": 4729} {"train_loss": -7.30263614654541, "global_step": 198620, "epoch": 4729} {"train_loss": -7.283572673797607, "global_step": 198621, "epoch": 4729} {"train_loss": -7.419010162353516, "global_step": 198622, "epoch": 4729} {"train_loss": -7.323890686035156, "global_step": 198623, "epoch": 4729} {"train_loss": -7.335199356079102, "global_step": 198624, "epoch": 4729} {"train_loss": -7.534168243408203, "global_step": 198625, "epoch": 4729} {"train_loss": -7.338253974914551, "global_step": 198626, "epoch": 4729} {"train_loss": -7.340487957000732, "global_step": 198627, "epoch": 4729} {"train_loss": -7.327582359313965, "global_step": 198628, "epoch": 4729} {"train_loss": -7.437008857727051, "global_step": 198629, "epoch": 4729} {"train_loss": -7.370668411254883, "global_step": 198630, "epoch": 4729} {"train_loss": -7.372072219848633, "global_step": 198631, "epoch": 4729} {"train_loss": -7.372645378112793, "global_step": 198632, "epoch": 4729} {"train_loss": -7.257172584533691, "global_step": 198633, "epoch": 4729} {"train_loss": -7.3315043449401855, "global_step": 198634, "epoch": 4729} {"train_loss": -7.37213659286499, "global_step": 198635, "epoch": 4729} {"train_loss": -7.354727745056152, "global_step": 198636, "epoch": 4729} {"train_loss": -7.347405433654785, "global_step": 198637, "epoch": 4729} {"train_loss": -7.322976112365723, "global_step": 198638, "epoch": 4729} {"train_loss": -7.453616142272949, "global_step": 198639, "epoch": 4729} {"train_loss": -7.444920063018799, "global_step": 198640, "epoch": 4729} {"train_loss": -7.24450159072876, "global_step": 198641, "epoch": 4729} {"train_loss": -7.383858680725098, "global_step": 198642, "epoch": 4729} {"train_loss": -7.424180030822754, "global_step": 198643, "epoch": 4729} {"train_loss": -7.2205352783203125, "global_step": 198644, "epoch": 4729} {"train_loss": -7.352077484130859, "global_step": 198645, "epoch": 4729} {"train_loss": -7.319945335388184, "global_step": 198646, "epoch": 4729} {"train_loss": -7.256278038024902, "global_step": 198647, "epoch": 4729} {"train_loss": -7.214188575744629, "global_step": 198648, "epoch": 4729} {"train_loss": -7.2794108390808105, "global_step": 198649, "epoch": 4729} {"train_loss": -7.28300666809082, "global_step": 198650, "epoch": 4729} {"train_loss": -7.275750160217285, "global_step": 198651, "epoch": 4729} {"train_loss": -7.355395793914795, "global_step": 198652, "epoch": 4729} {"train_loss": -7.266785144805908, "global_step": 198653, "epoch": 4729} {"train_loss": -7.309760093688965, "global_step": 198654, "epoch": 4729} {"train_loss": -7.275625705718994, "global_step": 198655, "epoch": 4729} {"train_loss": -7.173200607299805, "global_step": 198656, "epoch": 4729} {"train_loss": -7.3163838386535645, "global_step": 198657, "epoch": 4729} {"train_loss": -7.247513771057129, "global_step": 198658, "epoch": 4729} {"train_loss": -7.323692446663266, "global_step": 198659, "epoch": 4729, "val_loss": 81307.046875} {"train_loss": -7.303122520446777, "global_step": 198660, "epoch": 4730} {"train_loss": -7.228099346160889, "global_step": 198661, "epoch": 4730} {"train_loss": -7.257699012756348, "global_step": 198662, "epoch": 4730} {"train_loss": -7.347900390625, "global_step": 198663, "epoch": 4730} {"train_loss": -7.378628730773926, "global_step": 198664, "epoch": 4730} {"train_loss": -7.321332931518555, "global_step": 198665, "epoch": 4730} {"train_loss": -7.376214504241943, "global_step": 198666, "epoch": 4730} {"train_loss": -7.369926452636719, "global_step": 198667, "epoch": 4730} {"train_loss": -7.202261924743652, "global_step": 198668, "epoch": 4730} {"train_loss": -7.358137130737305, "global_step": 198669, "epoch": 4730} {"train_loss": -7.194487571716309, "global_step": 198670, "epoch": 4730} {"train_loss": -7.117669105529785, "global_step": 198671, "epoch": 4730} {"train_loss": -7.311227798461914, "global_step": 198672, "epoch": 4730} {"train_loss": -7.1072492599487305, "global_step": 198673, "epoch": 4730} {"train_loss": -7.319468975067139, "global_step": 198674, "epoch": 4730} {"train_loss": -7.288733005523682, "global_step": 198675, "epoch": 4730} {"train_loss": -7.125432014465332, "global_step": 198676, "epoch": 4730} {"train_loss": -7.232590675354004, "global_step": 198677, "epoch": 4730} {"train_loss": -7.218891143798828, "global_step": 198678, "epoch": 4730} {"train_loss": -7.1375651359558105, "global_step": 198679, "epoch": 4730} {"train_loss": -7.074272155761719, "global_step": 198680, "epoch": 4730} {"train_loss": -7.037776470184326, "global_step": 198681, "epoch": 4730} {"train_loss": -7.12490177154541, "global_step": 198682, "epoch": 4730} {"train_loss": -7.062413215637207, "global_step": 198683, "epoch": 4730} {"train_loss": -7.153773307800293, "global_step": 198684, "epoch": 4730} {"train_loss": -6.962834358215332, "global_step": 198685, "epoch": 4730} {"train_loss": -7.2599053382873535, "global_step": 198686, "epoch": 4730} {"train_loss": -6.966196060180664, "global_step": 198687, "epoch": 4730} {"train_loss": -7.242278099060059, "global_step": 198688, "epoch": 4730} {"train_loss": -7.233127593994141, "global_step": 198689, "epoch": 4730} {"train_loss": -7.143758296966553, "global_step": 198690, "epoch": 4730} {"train_loss": -7.230166435241699, "global_step": 198691, "epoch": 4730} {"train_loss": -7.242136478424072, "global_step": 198692, "epoch": 4730} {"train_loss": -7.053940773010254, "global_step": 198693, "epoch": 4730} {"train_loss": -7.1732659339904785, "global_step": 198694, "epoch": 4730} {"train_loss": -6.995029449462891, "global_step": 198695, "epoch": 4730} {"train_loss": -7.134103775024414, "global_step": 198696, "epoch": 4730} {"train_loss": -7.131606101989746, "global_step": 198697, "epoch": 4730} {"train_loss": -7.177715301513672, "global_step": 198698, "epoch": 4730} {"train_loss": -7.078893661499023, "global_step": 198699, "epoch": 4730} {"train_loss": -7.263957977294922, "global_step": 198700, "epoch": 4730} {"train_loss": -7.1915763559795565, "global_step": 198701, "epoch": 4730, "val_loss": 81177.8515625} {"train_loss": -7.280638694763184, "global_step": 198702, "epoch": 4731} {"train_loss": -7.236713409423828, "global_step": 198703, "epoch": 4731} {"train_loss": -7.2031450271606445, "global_step": 198704, "epoch": 4731} {"train_loss": -7.217293739318848, "global_step": 198705, "epoch": 4731} {"train_loss": -7.078408241271973, "global_step": 198706, "epoch": 4731} {"train_loss": -7.273723602294922, "global_step": 198707, "epoch": 4731} {"train_loss": -7.105045795440674, "global_step": 198708, "epoch": 4731} {"train_loss": -7.1651411056518555, "global_step": 198709, "epoch": 4731} {"train_loss": -7.184118270874023, "global_step": 198710, "epoch": 4731} {"train_loss": -7.194504737854004, "global_step": 198711, "epoch": 4731} {"train_loss": -7.125526428222656, "global_step": 198712, "epoch": 4731} {"train_loss": -7.151623725891113, "global_step": 198713, "epoch": 4731} {"train_loss": -7.286536693572998, "global_step": 198714, "epoch": 4731} {"train_loss": -6.993344306945801, "global_step": 198715, "epoch": 4731} {"train_loss": -7.314764022827148, "global_step": 198716, "epoch": 4731} {"train_loss": -7.099567890167236, "global_step": 198717, "epoch": 4731} {"train_loss": -7.219566345214844, "global_step": 198718, "epoch": 4731} {"train_loss": -7.18533182144165, "global_step": 198719, "epoch": 4731} {"train_loss": -7.212896347045898, "global_step": 198720, "epoch": 4731} {"train_loss": -7.147425651550293, "global_step": 198721, "epoch": 4731} {"train_loss": -7.178117752075195, "global_step": 198722, "epoch": 4731} {"train_loss": -7.166212558746338, "global_step": 198723, "epoch": 4731} {"train_loss": -7.19718599319458, "global_step": 198724, "epoch": 4731} {"train_loss": -7.245640277862549, "global_step": 198725, "epoch": 4731} {"train_loss": -7.232143402099609, "global_step": 198726, "epoch": 4731} {"train_loss": -7.285799503326416, "global_step": 198727, "epoch": 4731} {"train_loss": -7.253705978393555, "global_step": 198728, "epoch": 4731} {"train_loss": -7.175520896911621, "global_step": 198729, "epoch": 4731} {"train_loss": -7.194090366363525, "global_step": 198730, "epoch": 4731} {"train_loss": -7.313835144042969, "global_step": 198731, "epoch": 4731} {"train_loss": -7.189208030700684, "global_step": 198732, "epoch": 4731} {"train_loss": -7.127017021179199, "global_step": 198733, "epoch": 4731} {"train_loss": -7.212440013885498, "global_step": 198734, "epoch": 4731} {"train_loss": -7.182514190673828, "global_step": 198735, "epoch": 4731} {"train_loss": -7.235968589782715, "global_step": 198736, "epoch": 4731} {"train_loss": -7.205309867858887, "global_step": 198737, "epoch": 4731} {"train_loss": -7.153867721557617, "global_step": 198738, "epoch": 4731} {"train_loss": -7.297430038452148, "global_step": 198739, "epoch": 4731} {"train_loss": -7.260422706604004, "global_step": 198740, "epoch": 4731} {"train_loss": -7.178125381469727, "global_step": 198741, "epoch": 4731} {"train_loss": -7.208935737609863, "global_step": 198742, "epoch": 4731} {"train_loss": -7.19989123798552, "global_step": 198743, "epoch": 4731, "val_loss": 81248.7421875} {"train_loss": -7.224672317504883, "global_step": 198744, "epoch": 4732} {"train_loss": -7.181960105895996, "global_step": 198745, "epoch": 4732} {"train_loss": -7.243093490600586, "global_step": 198746, "epoch": 4732} {"train_loss": -7.29499626159668, "global_step": 198747, "epoch": 4732} {"train_loss": -7.236029624938965, "global_step": 198748, "epoch": 4732} {"train_loss": -7.163798809051514, "global_step": 198749, "epoch": 4732} {"train_loss": -7.291310787200928, "global_step": 198750, "epoch": 4732} {"train_loss": -7.425230979919434, "global_step": 198751, "epoch": 4732} {"train_loss": -7.170454978942871, "global_step": 198752, "epoch": 4732} {"train_loss": -7.243599891662598, "global_step": 198753, "epoch": 4732} {"train_loss": -7.24122428894043, "global_step": 198754, "epoch": 4732} {"train_loss": -7.214520454406738, "global_step": 198755, "epoch": 4732} {"train_loss": -7.328036308288574, "global_step": 198756, "epoch": 4732} {"train_loss": -7.26157283782959, "global_step": 198757, "epoch": 4732} {"train_loss": -7.230199813842773, "global_step": 198758, "epoch": 4732} {"train_loss": -7.309027194976807, "global_step": 198759, "epoch": 4732} {"train_loss": -7.2916178703308105, "global_step": 198760, "epoch": 4732} {"train_loss": -7.32626485824585, "global_step": 198761, "epoch": 4732} {"train_loss": -7.32181453704834, "global_step": 198762, "epoch": 4732} {"train_loss": -7.342485427856445, "global_step": 198763, "epoch": 4732} {"train_loss": -7.228607177734375, "global_step": 198764, "epoch": 4732} {"train_loss": -7.286478519439697, "global_step": 198765, "epoch": 4732} {"train_loss": -7.2705607414245605, "global_step": 198766, "epoch": 4732} {"train_loss": -7.1438703536987305, "global_step": 198767, "epoch": 4732} {"train_loss": -7.409257411956787, "global_step": 198768, "epoch": 4732} {"train_loss": -7.260077476501465, "global_step": 198769, "epoch": 4732} {"train_loss": -7.251859664916992, "global_step": 198770, "epoch": 4732} {"train_loss": -7.2359418869018555, "global_step": 198771, "epoch": 4732} {"train_loss": -7.167154788970947, "global_step": 198772, "epoch": 4732} {"train_loss": -6.990764617919922, "global_step": 198773, "epoch": 4732} {"train_loss": -7.19268798828125, "global_step": 198774, "epoch": 4732} {"train_loss": -7.178449630737305, "global_step": 198775, "epoch": 4732} {"train_loss": -7.1316633224487305, "global_step": 198776, "epoch": 4732} {"train_loss": -7.310484886169434, "global_step": 198777, "epoch": 4732} {"train_loss": -7.175134658813477, "global_step": 198778, "epoch": 4732} {"train_loss": -7.037944316864014, "global_step": 198779, "epoch": 4732} {"train_loss": -7.272347450256348, "global_step": 198780, "epoch": 4732} {"train_loss": -7.126923084259033, "global_step": 198781, "epoch": 4732} {"train_loss": -7.2849884033203125, "global_step": 198782, "epoch": 4732} {"train_loss": -7.0881171226501465, "global_step": 198783, "epoch": 4732} {"train_loss": -7.289262294769287, "global_step": 198784, "epoch": 4732} {"train_loss": -7.233913353511265, "global_step": 198785, "epoch": 4732, "val_loss": 81400.1328125} {"train_loss": -7.151049613952637, "global_step": 198786, "epoch": 4733} {"train_loss": -7.23682165145874, "global_step": 198787, "epoch": 4733} {"train_loss": -7.211455345153809, "global_step": 198788, "epoch": 4733} {"train_loss": -7.288507461547852, "global_step": 198789, "epoch": 4733} {"train_loss": -7.334722995758057, "global_step": 198790, "epoch": 4733} {"train_loss": -7.296822547912598, "global_step": 198791, "epoch": 4733} {"train_loss": -7.278426170349121, "global_step": 198792, "epoch": 4733} {"train_loss": -7.227470397949219, "global_step": 198793, "epoch": 4733} {"train_loss": -7.376126766204834, "global_step": 198794, "epoch": 4733} {"train_loss": -7.24659538269043, "global_step": 198795, "epoch": 4733} {"train_loss": -7.3849687576293945, "global_step": 198796, "epoch": 4733} {"train_loss": -7.2412872314453125, "global_step": 198797, "epoch": 4733} {"train_loss": -7.389998912811279, "global_step": 198798, "epoch": 4733} {"train_loss": -7.267735004425049, "global_step": 198799, "epoch": 4733} {"train_loss": -7.2473955154418945, "global_step": 198800, "epoch": 4733} {"train_loss": -7.339482307434082, "global_step": 198801, "epoch": 4733} {"train_loss": -7.218236923217773, "global_step": 198802, "epoch": 4733} {"train_loss": -7.236878395080566, "global_step": 198803, "epoch": 4733} {"train_loss": -7.2591352462768555, "global_step": 198804, "epoch": 4733} {"train_loss": -7.268165588378906, "global_step": 198805, "epoch": 4733} {"train_loss": -7.487786769866943, "global_step": 198806, "epoch": 4733} {"train_loss": -7.390478134155273, "global_step": 198807, "epoch": 4733} {"train_loss": -7.2145233154296875, "global_step": 198808, "epoch": 4733} {"train_loss": -7.26193904876709, "global_step": 198809, "epoch": 4733} {"train_loss": -7.251139163970947, "global_step": 198810, "epoch": 4733} {"train_loss": -7.288572311401367, "global_step": 198811, "epoch": 4733} {"train_loss": -7.223862648010254, "global_step": 198812, "epoch": 4733} {"train_loss": -7.29106330871582, "global_step": 198813, "epoch": 4733} {"train_loss": -7.358712196350098, "global_step": 198814, "epoch": 4733} {"train_loss": -7.2822265625, "global_step": 198815, "epoch": 4733} {"train_loss": -7.328853130340576, "global_step": 198816, "epoch": 4733} {"train_loss": -7.251897811889648, "global_step": 198817, "epoch": 4733} {"train_loss": -7.189621925354004, "global_step": 198818, "epoch": 4733} {"train_loss": -7.2929534912109375, "global_step": 198819, "epoch": 4733} {"train_loss": -7.14435338973999, "global_step": 198820, "epoch": 4733} {"train_loss": -7.304354667663574, "global_step": 198821, "epoch": 4733} {"train_loss": -7.167420387268066, "global_step": 198822, "epoch": 4733} {"train_loss": -7.419482231140137, "global_step": 198823, "epoch": 4733} {"train_loss": -7.331969261169434, "global_step": 198824, "epoch": 4733} {"train_loss": -7.2799973487854, "global_step": 198825, "epoch": 4733} {"train_loss": -7.227548599243164, "global_step": 198826, "epoch": 4733} {"train_loss": -7.278434174401419, "global_step": 198827, "epoch": 4733, "val_loss": 81372.8203125} {"train_loss": -7.162788391113281, "global_step": 198828, "epoch": 4734} {"train_loss": -7.201180458068848, "global_step": 198829, "epoch": 4734} {"train_loss": -7.2631449699401855, "global_step": 198830, "epoch": 4734} {"train_loss": -7.270321369171143, "global_step": 198831, "epoch": 4734} {"train_loss": -7.228322982788086, "global_step": 198832, "epoch": 4734} {"train_loss": -7.287624359130859, "global_step": 198833, "epoch": 4734} {"train_loss": -7.24947452545166, "global_step": 198834, "epoch": 4734} {"train_loss": -7.287789821624756, "global_step": 198835, "epoch": 4734} {"train_loss": -7.300631523132324, "global_step": 198836, "epoch": 4734} {"train_loss": -7.322232246398926, "global_step": 198837, "epoch": 4734} {"train_loss": -7.200544357299805, "global_step": 198838, "epoch": 4734} {"train_loss": -7.18910026550293, "global_step": 198839, "epoch": 4734} {"train_loss": -7.1821513175964355, "global_step": 198840, "epoch": 4734} {"train_loss": -7.157120704650879, "global_step": 198841, "epoch": 4734} {"train_loss": -7.3336405754089355, "global_step": 198842, "epoch": 4734} {"train_loss": -7.233062744140625, "global_step": 198843, "epoch": 4734} {"train_loss": -7.082451820373535, "global_step": 198844, "epoch": 4734} {"train_loss": -7.21793794631958, "global_step": 198845, "epoch": 4734} {"train_loss": -7.207908630371094, "global_step": 198846, "epoch": 4734} {"train_loss": -7.247550964355469, "global_step": 198847, "epoch": 4734} {"train_loss": -7.289664268493652, "global_step": 198848, "epoch": 4734} {"train_loss": -7.238884925842285, "global_step": 198849, "epoch": 4734} {"train_loss": -7.208687782287598, "global_step": 198850, "epoch": 4734} {"train_loss": -7.340533256530762, "global_step": 198851, "epoch": 4734} {"train_loss": -7.161309719085693, "global_step": 198852, "epoch": 4734} {"train_loss": -7.246009826660156, "global_step": 198853, "epoch": 4734} {"train_loss": -7.210194110870361, "global_step": 198854, "epoch": 4734} {"train_loss": -7.172323226928711, "global_step": 198855, "epoch": 4734} {"train_loss": -7.2824554443359375, "global_step": 198856, "epoch": 4734} {"train_loss": -7.1178178787231445, "global_step": 198857, "epoch": 4734} {"train_loss": -7.183165073394775, "global_step": 198858, "epoch": 4734} {"train_loss": -7.3001251220703125, "global_step": 198859, "epoch": 4734} {"train_loss": -7.20780611038208, "global_step": 198860, "epoch": 4734} {"train_loss": -7.329575538635254, "global_step": 198861, "epoch": 4734} {"train_loss": -7.227565765380859, "global_step": 198862, "epoch": 4734} {"train_loss": -7.236161231994629, "global_step": 198863, "epoch": 4734} {"train_loss": -7.328108787536621, "global_step": 198864, "epoch": 4734} {"train_loss": -7.223173141479492, "global_step": 198865, "epoch": 4734} {"train_loss": -7.3297905921936035, "global_step": 198866, "epoch": 4734} {"train_loss": -7.161904335021973, "global_step": 198867, "epoch": 4734} {"train_loss": -7.2075042724609375, "global_step": 198868, "epoch": 4734} {"train_loss": -7.235512597220285, "global_step": 198869, "epoch": 4734, "val_loss": 81460.0546875} {"train_loss": -7.357748031616211, "global_step": 198870, "epoch": 4735} {"train_loss": -7.341610908508301, "global_step": 198871, "epoch": 4735} {"train_loss": -7.345090389251709, "global_step": 198872, "epoch": 4735} {"train_loss": -7.262007713317871, "global_step": 198873, "epoch": 4735} {"train_loss": -7.173935890197754, "global_step": 198874, "epoch": 4735} {"train_loss": -7.356106758117676, "global_step": 198875, "epoch": 4735} {"train_loss": -7.289027690887451, "global_step": 198876, "epoch": 4735} {"train_loss": -7.249391078948975, "global_step": 198877, "epoch": 4735} {"train_loss": -7.36678409576416, "global_step": 198878, "epoch": 4735} {"train_loss": -7.38078498840332, "global_step": 198879, "epoch": 4735} {"train_loss": -7.357824325561523, "global_step": 198880, "epoch": 4735} {"train_loss": -7.195446968078613, "global_step": 198881, "epoch": 4735} {"train_loss": -7.369968414306641, "global_step": 198882, "epoch": 4735} {"train_loss": -7.159226417541504, "global_step": 198883, "epoch": 4735} {"train_loss": -7.339456558227539, "global_step": 198884, "epoch": 4735} {"train_loss": -7.328697681427002, "global_step": 198885, "epoch": 4735} {"train_loss": -7.312104225158691, "global_step": 198886, "epoch": 4735} {"train_loss": -7.257122993469238, "global_step": 198887, "epoch": 4735} {"train_loss": -7.26560640335083, "global_step": 198888, "epoch": 4735} {"train_loss": -7.2551374435424805, "global_step": 198889, "epoch": 4735} {"train_loss": -7.37235164642334, "global_step": 198890, "epoch": 4735} {"train_loss": -7.249098777770996, "global_step": 198891, "epoch": 4735} {"train_loss": -7.338504791259766, "global_step": 198892, "epoch": 4735} {"train_loss": -7.346027851104736, "global_step": 198893, "epoch": 4735} {"train_loss": -7.2853240966796875, "global_step": 198894, "epoch": 4735} {"train_loss": -7.394557476043701, "global_step": 198895, "epoch": 4735} {"train_loss": -7.380385875701904, "global_step": 198896, "epoch": 4735} {"train_loss": -7.175415992736816, "global_step": 198897, "epoch": 4735} {"train_loss": -7.320742607116699, "global_step": 198898, "epoch": 4735} {"train_loss": -7.32442045211792, "global_step": 198899, "epoch": 4735} {"train_loss": -7.2018818855285645, "global_step": 198900, "epoch": 4735} {"train_loss": -7.362508296966553, "global_step": 198901, "epoch": 4735} {"train_loss": -7.130160331726074, "global_step": 198902, "epoch": 4735} {"train_loss": -7.331302642822266, "global_step": 198903, "epoch": 4735} {"train_loss": -7.230773448944092, "global_step": 198904, "epoch": 4735} {"train_loss": -7.236034393310547, "global_step": 198905, "epoch": 4735} {"train_loss": -7.380890846252441, "global_step": 198906, "epoch": 4735} {"train_loss": -7.370119571685791, "global_step": 198907, "epoch": 4735} {"train_loss": -7.34993839263916, "global_step": 198908, "epoch": 4735} {"train_loss": -7.320751190185547, "global_step": 198909, "epoch": 4735} {"train_loss": -7.344827651977539, "global_step": 198910, "epoch": 4735} {"train_loss": -7.302496228899274, "global_step": 198911, "epoch": 4735, "val_loss": 81385.9140625} {"train_loss": -7.454189300537109, "global_step": 198912, "epoch": 4736} {"train_loss": -7.205485820770264, "global_step": 198913, "epoch": 4736} {"train_loss": -7.350077152252197, "global_step": 198914, "epoch": 4736} {"train_loss": -7.312520980834961, "global_step": 198915, "epoch": 4736} {"train_loss": -7.231435775756836, "global_step": 198916, "epoch": 4736} {"train_loss": -7.25299072265625, "global_step": 198917, "epoch": 4736} {"train_loss": -7.207529067993164, "global_step": 198918, "epoch": 4736} {"train_loss": -7.313763618469238, "global_step": 198919, "epoch": 4736} {"train_loss": -7.319252967834473, "global_step": 198920, "epoch": 4736} {"train_loss": -7.295523643493652, "global_step": 198921, "epoch": 4736} {"train_loss": -7.161157608032227, "global_step": 198922, "epoch": 4736} {"train_loss": -7.297961235046387, "global_step": 198923, "epoch": 4736} {"train_loss": -7.256524085998535, "global_step": 198924, "epoch": 4736} {"train_loss": -7.12149715423584, "global_step": 198925, "epoch": 4736} {"train_loss": -7.164825439453125, "global_step": 198926, "epoch": 4736} {"train_loss": -7.162010192871094, "global_step": 198927, "epoch": 4736} {"train_loss": -7.309542655944824, "global_step": 198928, "epoch": 4736} {"train_loss": -7.270512580871582, "global_step": 198929, "epoch": 4736} {"train_loss": -7.293834686279297, "global_step": 198930, "epoch": 4736} {"train_loss": -7.128255367279053, "global_step": 198931, "epoch": 4736} {"train_loss": -7.360248565673828, "global_step": 198932, "epoch": 4736} {"train_loss": -7.238279819488525, "global_step": 198933, "epoch": 4736} {"train_loss": -7.281771183013916, "global_step": 198934, "epoch": 4736} {"train_loss": -7.250705718994141, "global_step": 198935, "epoch": 4736} {"train_loss": -7.233465671539307, "global_step": 198936, "epoch": 4736} {"train_loss": -7.337810516357422, "global_step": 198937, "epoch": 4736} {"train_loss": -7.309168815612793, "global_step": 198938, "epoch": 4736} {"train_loss": -7.2900309562683105, "global_step": 198939, "epoch": 4736} {"train_loss": -7.244020462036133, "global_step": 198940, "epoch": 4736} {"train_loss": -7.192464828491211, "global_step": 198941, "epoch": 4736} {"train_loss": -7.228379726409912, "global_step": 198942, "epoch": 4736} {"train_loss": -7.135393142700195, "global_step": 198943, "epoch": 4736} {"train_loss": -7.2026190757751465, "global_step": 198944, "epoch": 4736} {"train_loss": -7.305773735046387, "global_step": 198945, "epoch": 4736} {"train_loss": -7.205348014831543, "global_step": 198946, "epoch": 4736} {"train_loss": -7.2457427978515625, "global_step": 198947, "epoch": 4736} {"train_loss": -7.117323875427246, "global_step": 198948, "epoch": 4736} {"train_loss": -7.24599552154541, "global_step": 198949, "epoch": 4736} {"train_loss": -7.0605669021606445, "global_step": 198950, "epoch": 4736} {"train_loss": -7.279948711395264, "global_step": 198951, "epoch": 4736} {"train_loss": -7.294253349304199, "global_step": 198952, "epoch": 4736} {"train_loss": -7.243831759407406, "global_step": 198953, "epoch": 4736, "val_loss": 81624.921875} {"train_loss": -7.132528305053711, "global_step": 198954, "epoch": 4737} {"train_loss": -7.0469889640808105, "global_step": 198955, "epoch": 4737} {"train_loss": -7.194274425506592, "global_step": 198956, "epoch": 4737} {"train_loss": -7.104794025421143, "global_step": 198957, "epoch": 4737} {"train_loss": -7.147016525268555, "global_step": 198958, "epoch": 4737} {"train_loss": -7.2614216804504395, "global_step": 198959, "epoch": 4737} {"train_loss": -7.188975811004639, "global_step": 198960, "epoch": 4737} {"train_loss": -7.20506477355957, "global_step": 198961, "epoch": 4737} {"train_loss": -7.206587791442871, "global_step": 198962, "epoch": 4737} {"train_loss": -7.275118350982666, "global_step": 198963, "epoch": 4737} {"train_loss": -7.230965614318848, "global_step": 198964, "epoch": 4737} {"train_loss": -7.27242374420166, "global_step": 198965, "epoch": 4737} {"train_loss": -7.230863571166992, "global_step": 198966, "epoch": 4737} {"train_loss": -7.095520973205566, "global_step": 198967, "epoch": 4737} {"train_loss": -7.161282062530518, "global_step": 198968, "epoch": 4737} {"train_loss": -7.166794300079346, "global_step": 198969, "epoch": 4737} {"train_loss": -7.212880611419678, "global_step": 198970, "epoch": 4737} {"train_loss": -7.110008716583252, "global_step": 198971, "epoch": 4737} {"train_loss": -7.194102764129639, "global_step": 198972, "epoch": 4737} {"train_loss": -7.23690938949585, "global_step": 198973, "epoch": 4737} {"train_loss": -7.264192581176758, "global_step": 198974, "epoch": 4737} {"train_loss": -7.202117919921875, "global_step": 198975, "epoch": 4737} {"train_loss": -7.2440643310546875, "global_step": 198976, "epoch": 4737} {"train_loss": -7.163717269897461, "global_step": 198977, "epoch": 4737} {"train_loss": -7.201040267944336, "global_step": 198978, "epoch": 4737} {"train_loss": -7.250137805938721, "global_step": 198979, "epoch": 4737} {"train_loss": -7.25532341003418, "global_step": 198980, "epoch": 4737} {"train_loss": -7.250177383422852, "global_step": 198981, "epoch": 4737} {"train_loss": -7.313626289367676, "global_step": 198982, "epoch": 4737} {"train_loss": -7.278352737426758, "global_step": 198983, "epoch": 4737} {"train_loss": -7.131824493408203, "global_step": 198984, "epoch": 4737} {"train_loss": -7.195626735687256, "global_step": 198985, "epoch": 4737} {"train_loss": -7.130451679229736, "global_step": 198986, "epoch": 4737} {"train_loss": -7.294551849365234, "global_step": 198987, "epoch": 4737} {"train_loss": -7.326216697692871, "global_step": 198988, "epoch": 4737} {"train_loss": -7.313556671142578, "global_step": 198989, "epoch": 4737} {"train_loss": -7.193701267242432, "global_step": 198990, "epoch": 4737} {"train_loss": -7.378595352172852, "global_step": 198991, "epoch": 4737} {"train_loss": -7.313779830932617, "global_step": 198992, "epoch": 4737} {"train_loss": -7.3535847663879395, "global_step": 198993, "epoch": 4737} {"train_loss": -7.282146453857422, "global_step": 198994, "epoch": 4737} {"train_loss": -7.221534581411452, "global_step": 198995, "epoch": 4737, "val_loss": 81295.078125} {"train_loss": -7.386499881744385, "global_step": 198996, "epoch": 4738} {"train_loss": -7.350395202636719, "global_step": 198997, "epoch": 4738} {"train_loss": -7.29043436050415, "global_step": 198998, "epoch": 4738} {"train_loss": -7.290087699890137, "global_step": 198999, "epoch": 4738} {"train_loss": -7.315366744995117, "global_step": 199000, "epoch": 4738} {"train_loss": -7.228930473327637, "global_step": 199001, "epoch": 4738} {"train_loss": -7.273058891296387, "global_step": 199002, "epoch": 4738} {"train_loss": -7.416143417358398, "global_step": 199003, "epoch": 4738} {"train_loss": -7.3467254638671875, "global_step": 199004, "epoch": 4738} {"train_loss": -7.253742694854736, "global_step": 199005, "epoch": 4738} {"train_loss": -7.247529029846191, "global_step": 199006, "epoch": 4738} {"train_loss": -7.436855792999268, "global_step": 199007, "epoch": 4738} {"train_loss": -7.404665946960449, "global_step": 199008, "epoch": 4738} {"train_loss": -7.175753593444824, "global_step": 199009, "epoch": 4738} {"train_loss": -7.271482467651367, "global_step": 199010, "epoch": 4738} {"train_loss": -7.216315269470215, "global_step": 199011, "epoch": 4738} {"train_loss": -7.30478572845459, "global_step": 199012, "epoch": 4738} {"train_loss": -7.269765853881836, "global_step": 199013, "epoch": 4738} {"train_loss": -7.316652297973633, "global_step": 199014, "epoch": 4738} {"train_loss": -7.2870917320251465, "global_step": 199015, "epoch": 4738} {"train_loss": -7.244933605194092, "global_step": 199016, "epoch": 4738} {"train_loss": -7.33996057510376, "global_step": 199017, "epoch": 4738} {"train_loss": -7.142645359039307, "global_step": 199018, "epoch": 4738} {"train_loss": -7.174327373504639, "global_step": 199019, "epoch": 4738} {"train_loss": -7.200692176818848, "global_step": 199020, "epoch": 4738} {"train_loss": -7.022644996643066, "global_step": 199021, "epoch": 4738} {"train_loss": -7.228316307067871, "global_step": 199022, "epoch": 4738} {"train_loss": -7.145082950592041, "global_step": 199023, "epoch": 4738} {"train_loss": -7.215171813964844, "global_step": 199024, "epoch": 4738} {"train_loss": -7.192354202270508, "global_step": 199025, "epoch": 4738} {"train_loss": -7.11360502243042, "global_step": 199026, "epoch": 4738} {"train_loss": -7.276087760925293, "global_step": 199027, "epoch": 4738} {"train_loss": -7.234348297119141, "global_step": 199028, "epoch": 4738} {"train_loss": -7.143912315368652, "global_step": 199029, "epoch": 4738} {"train_loss": -7.246959686279297, "global_step": 199030, "epoch": 4738} {"train_loss": -7.305941104888916, "global_step": 199031, "epoch": 4738} {"train_loss": -7.233452796936035, "global_step": 199032, "epoch": 4738} {"train_loss": -7.159664154052734, "global_step": 199033, "epoch": 4738} {"train_loss": -7.2876482009887695, "global_step": 199034, "epoch": 4738} {"train_loss": -7.3335466384887695, "global_step": 199035, "epoch": 4738} {"train_loss": -7.202181339263916, "global_step": 199036, "epoch": 4738} {"train_loss": -7.255289327530634, "global_step": 199037, "epoch": 4738, "val_loss": 81488.3984375} {"train_loss": -7.348116397857666, "global_step": 199038, "epoch": 4739} {"train_loss": -7.401180267333984, "global_step": 199039, "epoch": 4739} {"train_loss": -7.304640769958496, "global_step": 199040, "epoch": 4739} {"train_loss": -7.241785049438477, "global_step": 199041, "epoch": 4739} {"train_loss": -7.239019393920898, "global_step": 199042, "epoch": 4739} {"train_loss": -7.284321308135986, "global_step": 199043, "epoch": 4739} {"train_loss": -7.321146488189697, "global_step": 199044, "epoch": 4739} {"train_loss": -7.3055009841918945, "global_step": 199045, "epoch": 4739} {"train_loss": -7.369968891143799, "global_step": 199046, "epoch": 4739} {"train_loss": -7.389342308044434, "global_step": 199047, "epoch": 4739} {"train_loss": -7.1716766357421875, "global_step": 199048, "epoch": 4739} {"train_loss": -7.271529197692871, "global_step": 199049, "epoch": 4739} {"train_loss": -7.304113388061523, "global_step": 199050, "epoch": 4739} {"train_loss": -7.330775260925293, "global_step": 199051, "epoch": 4739} {"train_loss": -7.040870666503906, "global_step": 199052, "epoch": 4739} {"train_loss": -7.224387168884277, "global_step": 199053, "epoch": 4739} {"train_loss": -7.377657890319824, "global_step": 199054, "epoch": 4739} {"train_loss": -7.246944427490234, "global_step": 199055, "epoch": 4739} {"train_loss": -7.361804008483887, "global_step": 199056, "epoch": 4739} {"train_loss": -7.270230293273926, "global_step": 199057, "epoch": 4739} {"train_loss": -7.30461311340332, "global_step": 199058, "epoch": 4739} {"train_loss": -7.3780927658081055, "global_step": 199059, "epoch": 4739} {"train_loss": -7.236757278442383, "global_step": 199060, "epoch": 4739} {"train_loss": -7.388988971710205, "global_step": 199061, "epoch": 4739} {"train_loss": -7.260659694671631, "global_step": 199062, "epoch": 4739} {"train_loss": -7.198646545410156, "global_step": 199063, "epoch": 4739} {"train_loss": -7.164559841156006, "global_step": 199064, "epoch": 4739} {"train_loss": -7.20144510269165, "global_step": 199065, "epoch": 4739} {"train_loss": -7.198294162750244, "global_step": 199066, "epoch": 4739} {"train_loss": -7.220268249511719, "global_step": 199067, "epoch": 4739} {"train_loss": -7.29282283782959, "global_step": 199068, "epoch": 4739} {"train_loss": -7.3313493728637695, "global_step": 199069, "epoch": 4739} {"train_loss": -7.298956871032715, "global_step": 199070, "epoch": 4739} {"train_loss": -7.32227897644043, "global_step": 199071, "epoch": 4739} {"train_loss": -7.383492469787598, "global_step": 199072, "epoch": 4739} {"train_loss": -7.357220649719238, "global_step": 199073, "epoch": 4739} {"train_loss": -7.409348011016846, "global_step": 199074, "epoch": 4739} {"train_loss": -7.3382768630981445, "global_step": 199075, "epoch": 4739} {"train_loss": -7.393325328826904, "global_step": 199076, "epoch": 4739} {"train_loss": -7.337907791137695, "global_step": 199077, "epoch": 4739} {"train_loss": -7.180953025817871, "global_step": 199078, "epoch": 4739} {"train_loss": -7.292601732980637, "global_step": 199079, "epoch": 4739, "val_loss": 81432.3984375} {"train_loss": -7.302225112915039, "global_step": 199080, "epoch": 4740} {"train_loss": -7.248027801513672, "global_step": 199081, "epoch": 4740} {"train_loss": -7.337275505065918, "global_step": 199082, "epoch": 4740} {"train_loss": -7.2967939376831055, "global_step": 199083, "epoch": 4740} {"train_loss": -7.2477216720581055, "global_step": 199084, "epoch": 4740} {"train_loss": -7.317269325256348, "global_step": 199085, "epoch": 4740} {"train_loss": -7.2606611251831055, "global_step": 199086, "epoch": 4740} {"train_loss": -7.317584991455078, "global_step": 199087, "epoch": 4740} {"train_loss": -7.389988422393799, "global_step": 199088, "epoch": 4740} {"train_loss": -7.237095355987549, "global_step": 199089, "epoch": 4740} {"train_loss": -7.381129741668701, "global_step": 199090, "epoch": 4740} {"train_loss": -7.294586658477783, "global_step": 199091, "epoch": 4740} {"train_loss": -7.335681915283203, "global_step": 199092, "epoch": 4740} {"train_loss": -7.349155426025391, "global_step": 199093, "epoch": 4740} {"train_loss": -7.304459571838379, "global_step": 199094, "epoch": 4740} {"train_loss": -7.2339091300964355, "global_step": 199095, "epoch": 4740} {"train_loss": -7.227417469024658, "global_step": 199096, "epoch": 4740} {"train_loss": -7.343353271484375, "global_step": 199097, "epoch": 4740} {"train_loss": -7.310357570648193, "global_step": 199098, "epoch": 4740} {"train_loss": -7.339512825012207, "global_step": 199099, "epoch": 4740} {"train_loss": -7.2423176765441895, "global_step": 199100, "epoch": 4740} {"train_loss": -7.297323703765869, "global_step": 199101, "epoch": 4740} {"train_loss": -7.331820964813232, "global_step": 199102, "epoch": 4740} {"train_loss": -7.190187931060791, "global_step": 199103, "epoch": 4740} {"train_loss": -7.3430328369140625, "global_step": 199104, "epoch": 4740} {"train_loss": -7.303993225097656, "global_step": 199105, "epoch": 4740} {"train_loss": -7.250070571899414, "global_step": 199106, "epoch": 4740} {"train_loss": -7.189482688903809, "global_step": 199107, "epoch": 4740} {"train_loss": -7.371291160583496, "global_step": 199108, "epoch": 4740} {"train_loss": -7.224173069000244, "global_step": 199109, "epoch": 4740} {"train_loss": -7.286465167999268, "global_step": 199110, "epoch": 4740} {"train_loss": -7.346230506896973, "global_step": 199111, "epoch": 4740} {"train_loss": -7.232109546661377, "global_step": 199112, "epoch": 4740} {"train_loss": -7.353994846343994, "global_step": 199113, "epoch": 4740} {"train_loss": -7.220501899719238, "global_step": 199114, "epoch": 4740} {"train_loss": -7.318141937255859, "global_step": 199115, "epoch": 4740} {"train_loss": -7.409102439880371, "global_step": 199116, "epoch": 4740} {"train_loss": -7.322775840759277, "global_step": 199117, "epoch": 4740} {"train_loss": -7.342817306518555, "global_step": 199118, "epoch": 4740} {"train_loss": -7.377229690551758, "global_step": 199119, "epoch": 4740} {"train_loss": -7.355566024780273, "global_step": 199120, "epoch": 4740} {"train_loss": -7.303205501465571, "global_step": 199121, "epoch": 4740, "val_loss": 81427.8125} {"train_loss": -7.333595275878906, "global_step": 199122, "epoch": 4741} {"train_loss": -7.203876495361328, "global_step": 199123, "epoch": 4741} {"train_loss": -7.229043960571289, "global_step": 199124, "epoch": 4741} {"train_loss": -7.086568832397461, "global_step": 199125, "epoch": 4741} {"train_loss": -7.170339584350586, "global_step": 199126, "epoch": 4741} {"train_loss": -7.224205017089844, "global_step": 199127, "epoch": 4741} {"train_loss": -6.940057754516602, "global_step": 199128, "epoch": 4741} {"train_loss": -7.215543746948242, "global_step": 199129, "epoch": 4741} {"train_loss": -6.951407432556152, "global_step": 199130, "epoch": 4741} {"train_loss": -7.103358745574951, "global_step": 199131, "epoch": 4741} {"train_loss": -7.049624443054199, "global_step": 199132, "epoch": 4741} {"train_loss": -7.034833908081055, "global_step": 199133, "epoch": 4741} {"train_loss": -7.180418968200684, "global_step": 199134, "epoch": 4741} {"train_loss": -7.060515880584717, "global_step": 199135, "epoch": 4741} {"train_loss": -7.187989711761475, "global_step": 199136, "epoch": 4741} {"train_loss": -7.142597198486328, "global_step": 199137, "epoch": 4741} {"train_loss": -7.268899917602539, "global_step": 199138, "epoch": 4741} {"train_loss": -7.100266456604004, "global_step": 199139, "epoch": 4741} {"train_loss": -7.1679792404174805, "global_step": 199140, "epoch": 4741} {"train_loss": -7.153726577758789, "global_step": 199141, "epoch": 4741} {"train_loss": -7.173735618591309, "global_step": 199142, "epoch": 4741} {"train_loss": -7.226642608642578, "global_step": 199143, "epoch": 4741} {"train_loss": -7.270162105560303, "global_step": 199144, "epoch": 4741} {"train_loss": -7.222675323486328, "global_step": 199145, "epoch": 4741} {"train_loss": -7.21826171875, "global_step": 199146, "epoch": 4741} {"train_loss": -7.209529876708984, "global_step": 199147, "epoch": 4741} {"train_loss": -7.326214790344238, "global_step": 199148, "epoch": 4741} {"train_loss": -7.275768280029297, "global_step": 199149, "epoch": 4741} {"train_loss": -7.116683006286621, "global_step": 199150, "epoch": 4741} {"train_loss": -7.35914421081543, "global_step": 199151, "epoch": 4741} {"train_loss": -7.215939044952393, "global_step": 199152, "epoch": 4741} {"train_loss": -7.321495532989502, "global_step": 199153, "epoch": 4741} {"train_loss": -7.107065677642822, "global_step": 199154, "epoch": 4741} {"train_loss": -7.371248245239258, "global_step": 199155, "epoch": 4741} {"train_loss": -7.266139030456543, "global_step": 199156, "epoch": 4741} {"train_loss": -7.236780166625977, "global_step": 199157, "epoch": 4741} {"train_loss": -7.335207462310791, "global_step": 199158, "epoch": 4741} {"train_loss": -7.333520889282227, "global_step": 199159, "epoch": 4741} {"train_loss": -7.294992923736572, "global_step": 199160, "epoch": 4741} {"train_loss": -7.31425142288208, "global_step": 199161, "epoch": 4741} {"train_loss": -7.2924580574035645, "global_step": 199162, "epoch": 4741} {"train_loss": -7.205346118836176, "global_step": 199163, "epoch": 4741, "val_loss": 81365.046875} {"train_loss": -7.288024425506592, "global_step": 199164, "epoch": 4742} {"train_loss": -7.293282508850098, "global_step": 199165, "epoch": 4742} {"train_loss": -7.385313510894775, "global_step": 199166, "epoch": 4742} {"train_loss": -7.334987640380859, "global_step": 199167, "epoch": 4742} {"train_loss": -7.327746391296387, "global_step": 199168, "epoch": 4742} {"train_loss": -7.384902000427246, "global_step": 199169, "epoch": 4742} {"train_loss": -7.391900539398193, "global_step": 199170, "epoch": 4742} {"train_loss": -7.369707107543945, "global_step": 199171, "epoch": 4742} {"train_loss": -7.4118547439575195, "global_step": 199172, "epoch": 4742} {"train_loss": -7.43436336517334, "global_step": 199173, "epoch": 4742} {"train_loss": -7.406363487243652, "global_step": 199174, "epoch": 4742} {"train_loss": -7.306839942932129, "global_step": 199175, "epoch": 4742} {"train_loss": -7.42407751083374, "global_step": 199176, "epoch": 4742} {"train_loss": -7.383155345916748, "global_step": 199177, "epoch": 4742} {"train_loss": -7.358572959899902, "global_step": 199178, "epoch": 4742} {"train_loss": -7.201960563659668, "global_step": 199179, "epoch": 4742} {"train_loss": -7.315340042114258, "global_step": 199180, "epoch": 4742} {"train_loss": -7.287814140319824, "global_step": 199181, "epoch": 4742} {"train_loss": -7.179085731506348, "global_step": 199182, "epoch": 4742} {"train_loss": -7.314648628234863, "global_step": 199183, "epoch": 4742} {"train_loss": -7.234939098358154, "global_step": 199184, "epoch": 4742} {"train_loss": -7.303226470947266, "global_step": 199185, "epoch": 4742} {"train_loss": -7.302947521209717, "global_step": 199186, "epoch": 4742} {"train_loss": -7.228764533996582, "global_step": 199187, "epoch": 4742} {"train_loss": -7.175017833709717, "global_step": 199188, "epoch": 4742} {"train_loss": -7.2295074462890625, "global_step": 199189, "epoch": 4742} {"train_loss": -7.360173225402832, "global_step": 199190, "epoch": 4742} {"train_loss": -7.310159206390381, "global_step": 199191, "epoch": 4742} {"train_loss": -7.224255084991455, "global_step": 199192, "epoch": 4742} {"train_loss": -7.225865364074707, "global_step": 199193, "epoch": 4742} {"train_loss": -7.222655773162842, "global_step": 199194, "epoch": 4742} {"train_loss": -7.270346164703369, "global_step": 199195, "epoch": 4742} {"train_loss": -7.270351409912109, "global_step": 199196, "epoch": 4742} {"train_loss": -7.246263027191162, "global_step": 199197, "epoch": 4742} {"train_loss": -7.31129789352417, "global_step": 199198, "epoch": 4742} {"train_loss": -7.204181671142578, "global_step": 199199, "epoch": 4742} {"train_loss": -7.293911933898926, "global_step": 199200, "epoch": 4742} {"train_loss": -7.257172107696533, "global_step": 199201, "epoch": 4742} {"train_loss": -7.269619464874268, "global_step": 199202, "epoch": 4742} {"train_loss": -7.1450300216674805, "global_step": 199203, "epoch": 4742} {"train_loss": -7.353584289550781, "global_step": 199204, "epoch": 4742} {"train_loss": -7.297026838575091, "global_step": 199205, "epoch": 4742, "val_loss": 81434.9140625} {"train_loss": -7.251716136932373, "global_step": 199206, "epoch": 4743} {"train_loss": -7.389129638671875, "global_step": 199207, "epoch": 4743} {"train_loss": -7.31704044342041, "global_step": 199208, "epoch": 4743} {"train_loss": -7.181917190551758, "global_step": 199209, "epoch": 4743} {"train_loss": -7.295526504516602, "global_step": 199210, "epoch": 4743} {"train_loss": -7.277806282043457, "global_step": 199211, "epoch": 4743} {"train_loss": -7.236478805541992, "global_step": 199212, "epoch": 4743} {"train_loss": -7.164356708526611, "global_step": 199213, "epoch": 4743} {"train_loss": -7.2632246017456055, "global_step": 199214, "epoch": 4743} {"train_loss": -7.119345188140869, "global_step": 199215, "epoch": 4743} {"train_loss": -7.338441371917725, "global_step": 199216, "epoch": 4743} {"train_loss": -7.188806056976318, "global_step": 199217, "epoch": 4743} {"train_loss": -7.364212512969971, "global_step": 199218, "epoch": 4743} {"train_loss": -7.117992877960205, "global_step": 199219, "epoch": 4743} {"train_loss": -7.310009956359863, "global_step": 199220, "epoch": 4743} {"train_loss": -7.221034526824951, "global_step": 199221, "epoch": 4743} {"train_loss": -7.350679397583008, "global_step": 199222, "epoch": 4743} {"train_loss": -7.324051856994629, "global_step": 199223, "epoch": 4743} {"train_loss": -7.330152988433838, "global_step": 199224, "epoch": 4743} {"train_loss": -7.283278465270996, "global_step": 199225, "epoch": 4743} {"train_loss": -7.165385723114014, "global_step": 199226, "epoch": 4743} {"train_loss": -7.391456127166748, "global_step": 199227, "epoch": 4743} {"train_loss": -7.279019355773926, "global_step": 199228, "epoch": 4743} {"train_loss": -7.335087776184082, "global_step": 199229, "epoch": 4743} {"train_loss": -7.168747901916504, "global_step": 199230, "epoch": 4743} {"train_loss": -7.270320892333984, "global_step": 199231, "epoch": 4743} {"train_loss": -7.357569694519043, "global_step": 199232, "epoch": 4743} {"train_loss": -7.2883734703063965, "global_step": 199233, "epoch": 4743} {"train_loss": -7.2830400466918945, "global_step": 199234, "epoch": 4743} {"train_loss": -7.417111396789551, "global_step": 199235, "epoch": 4743} {"train_loss": -7.278990268707275, "global_step": 199236, "epoch": 4743} {"train_loss": -7.307397365570068, "global_step": 199237, "epoch": 4743} {"train_loss": -7.301214694976807, "global_step": 199238, "epoch": 4743} {"train_loss": -7.300786972045898, "global_step": 199239, "epoch": 4743} {"train_loss": -7.264980316162109, "global_step": 199240, "epoch": 4743} {"train_loss": -7.299177169799805, "global_step": 199241, "epoch": 4743} {"train_loss": -7.292996406555176, "global_step": 199242, "epoch": 4743} {"train_loss": -7.2230939865112305, "global_step": 199243, "epoch": 4743} {"train_loss": -7.299121856689453, "global_step": 199244, "epoch": 4743} {"train_loss": -7.270885944366455, "global_step": 199245, "epoch": 4743} {"train_loss": -7.24684476852417, "global_step": 199246, "epoch": 4743} {"train_loss": -7.275012186595371, "global_step": 199247, "epoch": 4743, "val_loss": 81258.265625} {"train_loss": -7.262202739715576, "global_step": 199248, "epoch": 4744} {"train_loss": -7.386968612670898, "global_step": 199249, "epoch": 4744} {"train_loss": -7.232767105102539, "global_step": 199250, "epoch": 4744} {"train_loss": -7.33223819732666, "global_step": 199251, "epoch": 4744} {"train_loss": -7.273624420166016, "global_step": 199252, "epoch": 4744} {"train_loss": -7.323417663574219, "global_step": 199253, "epoch": 4744} {"train_loss": -7.389674186706543, "global_step": 199254, "epoch": 4744} {"train_loss": -7.406704902648926, "global_step": 199255, "epoch": 4744} {"train_loss": -7.367283821105957, "global_step": 199256, "epoch": 4744} {"train_loss": -7.229171276092529, "global_step": 199257, "epoch": 4744} {"train_loss": -7.26910400390625, "global_step": 199258, "epoch": 4744} {"train_loss": -7.26624870300293, "global_step": 199259, "epoch": 4744} {"train_loss": -7.32442045211792, "global_step": 199260, "epoch": 4744} {"train_loss": -7.207482814788818, "global_step": 199261, "epoch": 4744} {"train_loss": -7.222375869750977, "global_step": 199262, "epoch": 4744} {"train_loss": -7.125912189483643, "global_step": 199263, "epoch": 4744} {"train_loss": -7.220611572265625, "global_step": 199264, "epoch": 4744} {"train_loss": -7.350744724273682, "global_step": 199265, "epoch": 4744} {"train_loss": -7.1667094230651855, "global_step": 199266, "epoch": 4744} {"train_loss": -7.1916608810424805, "global_step": 199267, "epoch": 4744} {"train_loss": -7.343510150909424, "global_step": 199268, "epoch": 4744} {"train_loss": -7.168010711669922, "global_step": 199269, "epoch": 4744} {"train_loss": -7.306458473205566, "global_step": 199270, "epoch": 4744} {"train_loss": -7.302732467651367, "global_step": 199271, "epoch": 4744} {"train_loss": -7.205974102020264, "global_step": 199272, "epoch": 4744} {"train_loss": -7.3338117599487305, "global_step": 199273, "epoch": 4744} {"train_loss": -7.27742862701416, "global_step": 199274, "epoch": 4744} {"train_loss": -7.326218605041504, "global_step": 199275, "epoch": 4744} {"train_loss": -7.256874084472656, "global_step": 199276, "epoch": 4744} {"train_loss": -7.293590545654297, "global_step": 199277, "epoch": 4744} {"train_loss": -7.28587532043457, "global_step": 199278, "epoch": 4744} {"train_loss": -7.306653022766113, "global_step": 199279, "epoch": 4744} {"train_loss": -7.318016052246094, "global_step": 199280, "epoch": 4744} {"train_loss": -7.408868789672852, "global_step": 199281, "epoch": 4744} {"train_loss": -7.371469020843506, "global_step": 199282, "epoch": 4744} {"train_loss": -7.279603481292725, "global_step": 199283, "epoch": 4744} {"train_loss": -7.335902214050293, "global_step": 199284, "epoch": 4744} {"train_loss": -7.325650215148926, "global_step": 199285, "epoch": 4744} {"train_loss": -7.219817638397217, "global_step": 199286, "epoch": 4744} {"train_loss": -7.300016403198242, "global_step": 199287, "epoch": 4744} {"train_loss": -7.311160564422607, "global_step": 199288, "epoch": 4744} {"train_loss": -7.289533660525367, "global_step": 199289, "epoch": 4744, "val_loss": 81427.734375} {"train_loss": -7.322979927062988, "global_step": 199290, "epoch": 4745} {"train_loss": -7.347542762756348, "global_step": 199291, "epoch": 4745} {"train_loss": -7.335273742675781, "global_step": 199292, "epoch": 4745} {"train_loss": -7.359509468078613, "global_step": 199293, "epoch": 4745} {"train_loss": -7.291800498962402, "global_step": 199294, "epoch": 4745} {"train_loss": -7.426539897918701, "global_step": 199295, "epoch": 4745} {"train_loss": -7.372600555419922, "global_step": 199296, "epoch": 4745} {"train_loss": -7.29949951171875, "global_step": 199297, "epoch": 4745} {"train_loss": -7.461578369140625, "global_step": 199298, "epoch": 4745} {"train_loss": -7.369562149047852, "global_step": 199299, "epoch": 4745} {"train_loss": -7.422295570373535, "global_step": 199300, "epoch": 4745} {"train_loss": -7.392188549041748, "global_step": 199301, "epoch": 4745} {"train_loss": -7.424809455871582, "global_step": 199302, "epoch": 4745} {"train_loss": -7.4676947593688965, "global_step": 199303, "epoch": 4745} {"train_loss": -7.337852478027344, "global_step": 199304, "epoch": 4745} {"train_loss": -7.407934188842773, "global_step": 199305, "epoch": 4745} {"train_loss": -7.403087615966797, "global_step": 199306, "epoch": 4745} {"train_loss": -7.462815761566162, "global_step": 199307, "epoch": 4745} {"train_loss": -7.385840892791748, "global_step": 199308, "epoch": 4745} {"train_loss": -7.431597709655762, "global_step": 199309, "epoch": 4745} {"train_loss": -7.343462944030762, "global_step": 199310, "epoch": 4745} {"train_loss": -7.455938816070557, "global_step": 199311, "epoch": 4745} {"train_loss": -7.390567302703857, "global_step": 199312, "epoch": 4745} {"train_loss": -7.377274990081787, "global_step": 199313, "epoch": 4745} {"train_loss": -7.285472869873047, "global_step": 199314, "epoch": 4745} {"train_loss": -7.311089515686035, "global_step": 199315, "epoch": 4745} {"train_loss": -7.210379600524902, "global_step": 199316, "epoch": 4745} {"train_loss": -7.22586727142334, "global_step": 199317, "epoch": 4745} {"train_loss": -7.229427337646484, "global_step": 199318, "epoch": 4745} {"train_loss": -7.180003643035889, "global_step": 199319, "epoch": 4745} {"train_loss": -7.0967206954956055, "global_step": 199320, "epoch": 4745} {"train_loss": -7.10406494140625, "global_step": 199321, "epoch": 4745} {"train_loss": -7.17454195022583, "global_step": 199322, "epoch": 4745} {"train_loss": -7.126035690307617, "global_step": 199323, "epoch": 4745} {"train_loss": -7.126489639282227, "global_step": 199324, "epoch": 4745} {"train_loss": -7.173484802246094, "global_step": 199325, "epoch": 4745} {"train_loss": -7.09755802154541, "global_step": 199326, "epoch": 4745} {"train_loss": -7.232944011688232, "global_step": 199327, "epoch": 4745} {"train_loss": -7.083327293395996, "global_step": 199328, "epoch": 4745} {"train_loss": -7.14838171005249, "global_step": 199329, "epoch": 4745} {"train_loss": -7.210969924926758, "global_step": 199330, "epoch": 4745} {"train_loss": -7.296349309739613, "global_step": 199331, "epoch": 4745, "val_loss": 81466.9453125} {"train_loss": -7.189213752746582, "global_step": 199332, "epoch": 4746} {"train_loss": -7.106398582458496, "global_step": 199333, "epoch": 4746} {"train_loss": -7.120541572570801, "global_step": 199334, "epoch": 4746} {"train_loss": -7.214768886566162, "global_step": 199335, "epoch": 4746} {"train_loss": -7.276788711547852, "global_step": 199336, "epoch": 4746} {"train_loss": -7.152502059936523, "global_step": 199337, "epoch": 4746} {"train_loss": -7.195074081420898, "global_step": 199338, "epoch": 4746} {"train_loss": -7.222930908203125, "global_step": 199339, "epoch": 4746} {"train_loss": -7.195905685424805, "global_step": 199340, "epoch": 4746} {"train_loss": -7.144308090209961, "global_step": 199341, "epoch": 4746} {"train_loss": -7.219776153564453, "global_step": 199342, "epoch": 4746} {"train_loss": -7.170232772827148, "global_step": 199343, "epoch": 4746} {"train_loss": -7.239410400390625, "global_step": 199344, "epoch": 4746} {"train_loss": -7.117572784423828, "global_step": 199345, "epoch": 4746} {"train_loss": -7.180464744567871, "global_step": 199346, "epoch": 4746} {"train_loss": -7.175036430358887, "global_step": 199347, "epoch": 4746} {"train_loss": -7.1721930503845215, "global_step": 199348, "epoch": 4746} {"train_loss": -7.229995250701904, "global_step": 199349, "epoch": 4746} {"train_loss": -7.241085052490234, "global_step": 199350, "epoch": 4746} {"train_loss": -7.175137519836426, "global_step": 199351, "epoch": 4746} {"train_loss": -7.1730451583862305, "global_step": 199352, "epoch": 4746} {"train_loss": -7.229107856750488, "global_step": 199353, "epoch": 4746} {"train_loss": -7.219419479370117, "global_step": 199354, "epoch": 4746} {"train_loss": -7.224028587341309, "global_step": 199355, "epoch": 4746} {"train_loss": -7.277112007141113, "global_step": 199356, "epoch": 4746} {"train_loss": -7.157347679138184, "global_step": 199357, "epoch": 4746} {"train_loss": -7.182683944702148, "global_step": 199358, "epoch": 4746} {"train_loss": -7.261017799377441, "global_step": 199359, "epoch": 4746} {"train_loss": -7.2180609703063965, "global_step": 199360, "epoch": 4746} {"train_loss": -7.215000629425049, "global_step": 199361, "epoch": 4746} {"train_loss": -7.282458782196045, "global_step": 199362, "epoch": 4746} {"train_loss": -7.246905326843262, "global_step": 199363, "epoch": 4746} {"train_loss": -7.252590656280518, "global_step": 199364, "epoch": 4746} {"train_loss": -7.29595947265625, "global_step": 199365, "epoch": 4746} {"train_loss": -7.200265884399414, "global_step": 199366, "epoch": 4746} {"train_loss": -7.264294624328613, "global_step": 199367, "epoch": 4746} {"train_loss": -7.157478332519531, "global_step": 199368, "epoch": 4746} {"train_loss": -7.321907043457031, "global_step": 199369, "epoch": 4746} {"train_loss": -7.300310134887695, "global_step": 199370, "epoch": 4746} {"train_loss": -7.268345832824707, "global_step": 199371, "epoch": 4746} {"train_loss": -7.315753936767578, "global_step": 199372, "epoch": 4746} {"train_loss": -7.21776008605957, "global_step": 199373, "epoch": 4746, "val_loss": 81691.1875} {"train_loss": -7.329394340515137, "global_step": 199374, "epoch": 4747} {"train_loss": -7.4009528160095215, "global_step": 199375, "epoch": 4747} {"train_loss": -7.378871917724609, "global_step": 199376, "epoch": 4747} {"train_loss": -7.431225776672363, "global_step": 199377, "epoch": 4747} {"train_loss": -7.283289909362793, "global_step": 199378, "epoch": 4747} {"train_loss": -7.360620498657227, "global_step": 199379, "epoch": 4747} {"train_loss": -7.326639175415039, "global_step": 199380, "epoch": 4747} {"train_loss": -7.4217681884765625, "global_step": 199381, "epoch": 4747} {"train_loss": -7.338296890258789, "global_step": 199382, "epoch": 4747} {"train_loss": -7.388472557067871, "global_step": 199383, "epoch": 4747} {"train_loss": -7.426703453063965, "global_step": 199384, "epoch": 4747} {"train_loss": -7.368740558624268, "global_step": 199385, "epoch": 4747} {"train_loss": -7.235348701477051, "global_step": 199386, "epoch": 4747} {"train_loss": -7.375417709350586, "global_step": 199387, "epoch": 4747} {"train_loss": -7.295106887817383, "global_step": 199388, "epoch": 4747} {"train_loss": -7.410881042480469, "global_step": 199389, "epoch": 4747} {"train_loss": -7.295167922973633, "global_step": 199390, "epoch": 4747} {"train_loss": -7.38284969329834, "global_step": 199391, "epoch": 4747} {"train_loss": -7.295233726501465, "global_step": 199392, "epoch": 4747} {"train_loss": -7.377965927124023, "global_step": 199393, "epoch": 4747} {"train_loss": -7.362070560455322, "global_step": 199394, "epoch": 4747} {"train_loss": -7.345364570617676, "global_step": 199395, "epoch": 4747} {"train_loss": -7.409476280212402, "global_step": 199396, "epoch": 4747} {"train_loss": -7.463253021240234, "global_step": 199397, "epoch": 4747} {"train_loss": -7.3127546310424805, "global_step": 199398, "epoch": 4747} {"train_loss": -7.421220779418945, "global_step": 199399, "epoch": 4747} {"train_loss": -7.398780822753906, "global_step": 199400, "epoch": 4747} {"train_loss": -7.343493461608887, "global_step": 199401, "epoch": 4747} {"train_loss": -7.401665687561035, "global_step": 199402, "epoch": 4747} {"train_loss": -7.297060966491699, "global_step": 199403, "epoch": 4747} {"train_loss": -7.296658515930176, "global_step": 199404, "epoch": 4747} {"train_loss": -7.262663841247559, "global_step": 199405, "epoch": 4747} {"train_loss": -7.343570709228516, "global_step": 199406, "epoch": 4747} {"train_loss": -7.441411972045898, "global_step": 199407, "epoch": 4747} {"train_loss": -7.328238487243652, "global_step": 199408, "epoch": 4747} {"train_loss": -7.31587553024292, "global_step": 199409, "epoch": 4747} {"train_loss": -7.386492729187012, "global_step": 199410, "epoch": 4747} {"train_loss": -7.21451997756958, "global_step": 199411, "epoch": 4747} {"train_loss": -7.286559104919434, "global_step": 199412, "epoch": 4747} {"train_loss": -7.3382487297058105, "global_step": 199413, "epoch": 4747} {"train_loss": -7.412947654724121, "global_step": 199414, "epoch": 4747} {"train_loss": -7.3519746121906095, "global_step": 199415, "epoch": 4747, "val_loss": 81521.6328125} {"train_loss": -7.330897331237793, "global_step": 199416, "epoch": 4748} {"train_loss": -7.332890510559082, "global_step": 199417, "epoch": 4748} {"train_loss": -7.361266136169434, "global_step": 199418, "epoch": 4748} {"train_loss": -7.371020317077637, "global_step": 199419, "epoch": 4748} {"train_loss": -7.326806545257568, "global_step": 199420, "epoch": 4748} {"train_loss": -7.349725723266602, "global_step": 199421, "epoch": 4748} {"train_loss": -7.512457370758057, "global_step": 199422, "epoch": 4748} {"train_loss": -7.333325386047363, "global_step": 199423, "epoch": 4748} {"train_loss": -7.281588554382324, "global_step": 199424, "epoch": 4748} {"train_loss": -7.375917434692383, "global_step": 199425, "epoch": 4748} {"train_loss": -7.409946441650391, "global_step": 199426, "epoch": 4748} {"train_loss": -7.339395046234131, "global_step": 199427, "epoch": 4748} {"train_loss": -7.393756866455078, "global_step": 199428, "epoch": 4748} {"train_loss": -7.221213340759277, "global_step": 199429, "epoch": 4748} {"train_loss": -7.3139801025390625, "global_step": 199430, "epoch": 4748} {"train_loss": -7.40673828125, "global_step": 199431, "epoch": 4748} {"train_loss": -7.424158096313477, "global_step": 199432, "epoch": 4748} {"train_loss": -7.278354167938232, "global_step": 199433, "epoch": 4748} {"train_loss": -7.295057773590088, "global_step": 199434, "epoch": 4748} {"train_loss": -7.076424598693848, "global_step": 199435, "epoch": 4748} {"train_loss": -7.334692001342773, "global_step": 199436, "epoch": 4748} {"train_loss": -7.330875396728516, "global_step": 199437, "epoch": 4748} {"train_loss": -7.2990922927856445, "global_step": 199438, "epoch": 4748} {"train_loss": -7.355892181396484, "global_step": 199439, "epoch": 4748} {"train_loss": -7.279494285583496, "global_step": 199440, "epoch": 4748} {"train_loss": -7.291272163391113, "global_step": 199441, "epoch": 4748} {"train_loss": -7.115880012512207, "global_step": 199442, "epoch": 4748} {"train_loss": -7.29526424407959, "global_step": 199443, "epoch": 4748} {"train_loss": -7.0923566818237305, "global_step": 199444, "epoch": 4748} {"train_loss": -7.046878814697266, "global_step": 199445, "epoch": 4748} {"train_loss": -7.264102935791016, "global_step": 199446, "epoch": 4748} {"train_loss": -7.163963317871094, "global_step": 199447, "epoch": 4748} {"train_loss": -7.258942604064941, "global_step": 199448, "epoch": 4748} {"train_loss": -7.354795455932617, "global_step": 199449, "epoch": 4748} {"train_loss": -7.18436336517334, "global_step": 199450, "epoch": 4748} {"train_loss": -7.1967267990112305, "global_step": 199451, "epoch": 4748} {"train_loss": -7.182238578796387, "global_step": 199452, "epoch": 4748} {"train_loss": -7.136504173278809, "global_step": 199453, "epoch": 4748} {"train_loss": -7.165233135223389, "global_step": 199454, "epoch": 4748} {"train_loss": -7.182856559753418, "global_step": 199455, "epoch": 4748} {"train_loss": -7.177365303039551, "global_step": 199456, "epoch": 4748} {"train_loss": -7.276109082358224, "global_step": 199457, "epoch": 4748, "val_loss": 81713.2421875} {"train_loss": -7.2160234451293945, "global_step": 199458, "epoch": 4749} {"train_loss": -7.0707316398620605, "global_step": 199459, "epoch": 4749} {"train_loss": -7.274798393249512, "global_step": 199460, "epoch": 4749} {"train_loss": -7.144303321838379, "global_step": 199461, "epoch": 4749} {"train_loss": -7.201127052307129, "global_step": 199462, "epoch": 4749} {"train_loss": -7.1472272872924805, "global_step": 199463, "epoch": 4749} {"train_loss": -7.2194108963012695, "global_step": 199464, "epoch": 4749} {"train_loss": -7.1213459968566895, "global_step": 199465, "epoch": 4749} {"train_loss": -7.1705803871154785, "global_step": 199466, "epoch": 4749} {"train_loss": -7.194511413574219, "global_step": 199467, "epoch": 4749} {"train_loss": -7.283899784088135, "global_step": 199468, "epoch": 4749} {"train_loss": -7.181556701660156, "global_step": 199469, "epoch": 4749} {"train_loss": -7.111710071563721, "global_step": 199470, "epoch": 4749} {"train_loss": -7.223977565765381, "global_step": 199471, "epoch": 4749} {"train_loss": -7.247411727905273, "global_step": 199472, "epoch": 4749} {"train_loss": -7.15320348739624, "global_step": 199473, "epoch": 4749} {"train_loss": -7.19630241394043, "global_step": 199474, "epoch": 4749} {"train_loss": -7.245020389556885, "global_step": 199475, "epoch": 4749} {"train_loss": -7.1101884841918945, "global_step": 199476, "epoch": 4749} {"train_loss": -7.258550643920898, "global_step": 199477, "epoch": 4749} {"train_loss": -7.215012550354004, "global_step": 199478, "epoch": 4749} {"train_loss": -7.188923358917236, "global_step": 199479, "epoch": 4749} {"train_loss": -7.182847023010254, "global_step": 199480, "epoch": 4749} {"train_loss": -7.248401165008545, "global_step": 199481, "epoch": 4749} {"train_loss": -7.353699684143066, "global_step": 199482, "epoch": 4749} {"train_loss": -7.2767767906188965, "global_step": 199483, "epoch": 4749} {"train_loss": -7.2962965965271, "global_step": 199484, "epoch": 4749} {"train_loss": -7.2729268074035645, "global_step": 199485, "epoch": 4749} {"train_loss": -7.32041597366333, "global_step": 199486, "epoch": 4749} {"train_loss": -7.248893737792969, "global_step": 199487, "epoch": 4749} {"train_loss": -7.21097469329834, "global_step": 199488, "epoch": 4749} {"train_loss": -7.218847274780273, "global_step": 199489, "epoch": 4749} {"train_loss": -7.148134708404541, "global_step": 199490, "epoch": 4749} {"train_loss": -7.379809379577637, "global_step": 199491, "epoch": 4749} {"train_loss": -7.375724792480469, "global_step": 199492, "epoch": 4749} {"train_loss": -7.224888801574707, "global_step": 199493, "epoch": 4749} {"train_loss": -7.322005271911621, "global_step": 199494, "epoch": 4749} {"train_loss": -7.339013576507568, "global_step": 199495, "epoch": 4749} {"train_loss": -7.258367538452148, "global_step": 199496, "epoch": 4749} {"train_loss": -7.405208587646484, "global_step": 199497, "epoch": 4749} {"train_loss": -7.27125358581543, "global_step": 199498, "epoch": 4749} {"train_loss": -7.234014783586774, "global_step": 199499, "epoch": 4749, "val_loss": 81581.3984375} {"train_loss": -7.388574600219727, "global_step": 199500, "epoch": 4750} {"train_loss": -7.258876800537109, "global_step": 199501, "epoch": 4750} {"train_loss": -7.3055009841918945, "global_step": 199502, "epoch": 4750} {"train_loss": -7.185870170593262, "global_step": 199503, "epoch": 4750} {"train_loss": -7.373392105102539, "global_step": 199504, "epoch": 4750} {"train_loss": -7.288002014160156, "global_step": 199505, "epoch": 4750} {"train_loss": -7.148871421813965, "global_step": 199506, "epoch": 4750} {"train_loss": -7.156528472900391, "global_step": 199507, "epoch": 4750} {"train_loss": -7.1835713386535645, "global_step": 199508, "epoch": 4750} {"train_loss": -7.321654319763184, "global_step": 199509, "epoch": 4750} {"train_loss": -7.156036376953125, "global_step": 199510, "epoch": 4750} {"train_loss": -7.2789306640625, "global_step": 199511, "epoch": 4750} {"train_loss": -7.200333595275879, "global_step": 199512, "epoch": 4750} {"train_loss": -7.3585429191589355, "global_step": 199513, "epoch": 4750} {"train_loss": -7.310313701629639, "global_step": 199514, "epoch": 4750} {"train_loss": -7.304220199584961, "global_step": 199515, "epoch": 4750} {"train_loss": -7.373714923858643, "global_step": 199516, "epoch": 4750} {"train_loss": -7.162802696228027, "global_step": 199517, "epoch": 4750} {"train_loss": -7.27901554107666, "global_step": 199518, "epoch": 4750} {"train_loss": -7.413595199584961, "global_step": 199519, "epoch": 4750} {"train_loss": -7.225214004516602, "global_step": 199520, "epoch": 4750} {"train_loss": -7.324371814727783, "global_step": 199521, "epoch": 4750} {"train_loss": -7.297202110290527, "global_step": 199522, "epoch": 4750} {"train_loss": -7.260769367218018, "global_step": 199523, "epoch": 4750} {"train_loss": -7.439997673034668, "global_step": 199524, "epoch": 4750} {"train_loss": -7.2974677085876465, "global_step": 199525, "epoch": 4750} {"train_loss": -7.544055938720703, "global_step": 199526, "epoch": 4750} {"train_loss": -7.325803756713867, "global_step": 199527, "epoch": 4750} {"train_loss": -7.231513023376465, "global_step": 199528, "epoch": 4750} {"train_loss": -7.347256660461426, "global_step": 199529, "epoch": 4750} {"train_loss": -7.327312469482422, "global_step": 199530, "epoch": 4750} {"train_loss": -7.34741735458374, "global_step": 199531, "epoch": 4750} {"train_loss": -7.3561625480651855, "global_step": 199532, "epoch": 4750} {"train_loss": -7.3681511878967285, "global_step": 199533, "epoch": 4750} {"train_loss": -7.23716926574707, "global_step": 199534, "epoch": 4750} {"train_loss": -7.352100849151611, "global_step": 199535, "epoch": 4750} {"train_loss": -7.317880630493164, "global_step": 199536, "epoch": 4750} {"train_loss": -7.199390411376953, "global_step": 199537, "epoch": 4750} {"train_loss": -7.343441009521484, "global_step": 199538, "epoch": 4750} {"train_loss": -7.184950828552246, "global_step": 199539, "epoch": 4750} {"train_loss": -7.095011234283447, "global_step": 199540, "epoch": 4750} {"train_loss": -7.290569736844017, "global_step": 199541, "epoch": 4750, "train/sim_max_reward_0": 0.8645707081937891, "train/sim_max_reward_1": 0.930688606779014, "train/sim_max_reward_2": 0.5609442667941031, "train/sim_max_reward_3": 0.13994860686849805, "train/sim_max_reward_4": 0.9559989645898872, "train/sim_max_reward_5": 0.9172916993802589, "test/sim_max_reward_4500000": 0.974456752780346, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9635476967289617, "test/sim_max_reward_4500003": 0.8873890781148277, "test/sim_max_reward_4500004": 0.1826798888534296, "test/sim_max_reward_4500005": 0.5522212746925484, "test/sim_max_reward_4500006": 0.9085088996809749, "test/sim_max_reward_4500007": 0.9803533879748758, "test/sim_max_reward_4500008": 0.9625424771411956, "test/sim_max_reward_4500009": 0.05294220505031562, "test/sim_max_reward_4500010": 0.05052232504826654, "test/sim_max_reward_4500011": 0.8612290281602639, "test/sim_max_reward_4500012": 0.9904328954022679, "test/sim_max_reward_4500013": 0.003016451101395865, "test/sim_max_reward_4500014": 0.3878263682326698, "test/sim_max_reward_4500015": 0.08894209007762723, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.0997637664714099, "test/sim_max_reward_4500018": 0.5388233581156786, "test/sim_max_reward_4500019": 0.9736949398853331, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.4558578551431223, "test/sim_max_reward_4500022": 0.9474753186715235, "test/sim_max_reward_4500023": 0.8867823457680616, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8864951416013008, "test/sim_max_reward_4500026": 0.9118792822374838, "test/sim_max_reward_4500027": 0.8533541651794456, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.08191246403158337, "test/sim_max_reward_4500030": 1.0, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.00012312537725908565, "test/sim_max_reward_4500034": 0.8966097388634643, "test/sim_max_reward_4500035": 0.8916231349896969, "test/sim_max_reward_4500036": 0.9969000396216808, "test/sim_max_reward_4500037": 0.9003050186908531, "test/sim_max_reward_4500038": 0.3127599507861583, "test/sim_max_reward_4500039": 0.9038803443369594, "test/sim_max_reward_4500040": 0.9535765058346131, "test/sim_max_reward_4500041": 0.8863580495460328, "test/sim_max_reward_4500042": 0.05291827093105188, "test/sim_max_reward_4500043": 0.48511226784508327, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 1.0, "test/sim_max_reward_4500046": 0.0, "test/sim_max_reward_4500047": 0.9786896784959391, "test/sim_max_reward_4500048": 0.9235502158527364, "test/sim_max_reward_4500049": 0.9925958661844245, "train/mean_score": 0.7282404754342585, "test/mean_score": 0.5581976554418054, "val_loss": 81463.265625} {"train_loss": -7.349137306213379, "global_step": 199542, "epoch": 4751} {"train_loss": -7.236575126647949, "global_step": 199543, "epoch": 4751} {"train_loss": -7.264050483703613, "global_step": 199544, "epoch": 4751} {"train_loss": -7.1635661125183105, "global_step": 199545, "epoch": 4751} {"train_loss": -7.441431999206543, "global_step": 199546, "epoch": 4751} {"train_loss": -7.361221790313721, "global_step": 199547, "epoch": 4751} {"train_loss": -7.414549827575684, "global_step": 199548, "epoch": 4751} {"train_loss": -7.220938682556152, "global_step": 199549, "epoch": 4751} {"train_loss": -7.3367600440979, "global_step": 199550, "epoch": 4751} {"train_loss": -7.375553131103516, "global_step": 199551, "epoch": 4751} {"train_loss": -7.401252746582031, "global_step": 199552, "epoch": 4751} {"train_loss": -7.288614273071289, "global_step": 199553, "epoch": 4751} {"train_loss": -7.286569595336914, "global_step": 199554, "epoch": 4751} {"train_loss": -7.296341896057129, "global_step": 199555, "epoch": 4751} {"train_loss": -7.3589887619018555, "global_step": 199556, "epoch": 4751} {"train_loss": -7.408584117889404, "global_step": 199557, "epoch": 4751} {"train_loss": -7.398484230041504, "global_step": 199558, "epoch": 4751} {"train_loss": -7.356596946716309, "global_step": 199559, "epoch": 4751} {"train_loss": -7.353847503662109, "global_step": 199560, "epoch": 4751} {"train_loss": -7.271664142608643, "global_step": 199561, "epoch": 4751} {"train_loss": -7.2906012535095215, "global_step": 199562, "epoch": 4751} {"train_loss": -7.279268264770508, "global_step": 199563, "epoch": 4751} {"train_loss": -7.406654357910156, "global_step": 199564, "epoch": 4751} {"train_loss": -7.368205547332764, "global_step": 199565, "epoch": 4751} {"train_loss": -7.275341033935547, "global_step": 199566, "epoch": 4751} {"train_loss": -7.206028938293457, "global_step": 199567, "epoch": 4751} {"train_loss": -7.177907943725586, "global_step": 199568, "epoch": 4751} {"train_loss": -7.304470062255859, "global_step": 199569, "epoch": 4751} {"train_loss": -7.281784534454346, "global_step": 199570, "epoch": 4751} {"train_loss": -7.271394729614258, "global_step": 199571, "epoch": 4751} {"train_loss": -7.226692199707031, "global_step": 199572, "epoch": 4751} {"train_loss": -7.159183502197266, "global_step": 199573, "epoch": 4751} {"train_loss": -7.3608574867248535, "global_step": 199574, "epoch": 4751} {"train_loss": -7.20989465713501, "global_step": 199575, "epoch": 4751} {"train_loss": -7.22285795211792, "global_step": 199576, "epoch": 4751} {"train_loss": -7.2927398681640625, "global_step": 199577, "epoch": 4751} {"train_loss": -7.210751533508301, "global_step": 199578, "epoch": 4751} {"train_loss": -7.141780376434326, "global_step": 199579, "epoch": 4751} {"train_loss": -7.126119613647461, "global_step": 199580, "epoch": 4751} {"train_loss": -7.170169830322266, "global_step": 199581, "epoch": 4751} {"train_loss": -7.189065933227539, "global_step": 199582, "epoch": 4751} {"train_loss": -7.282983189537411, "global_step": 199583, "epoch": 4751, "val_loss": 81498.671875} {"train_loss": -7.146384239196777, "global_step": 199584, "epoch": 4752} {"train_loss": -7.162253379821777, "global_step": 199585, "epoch": 4752} {"train_loss": -7.104738235473633, "global_step": 199586, "epoch": 4752} {"train_loss": -7.288578033447266, "global_step": 199587, "epoch": 4752} {"train_loss": -7.177128791809082, "global_step": 199588, "epoch": 4752} {"train_loss": -7.247533321380615, "global_step": 199589, "epoch": 4752} {"train_loss": -7.223873138427734, "global_step": 199590, "epoch": 4752} {"train_loss": -7.205420017242432, "global_step": 199591, "epoch": 4752} {"train_loss": -7.156217575073242, "global_step": 199592, "epoch": 4752} {"train_loss": -7.387297630310059, "global_step": 199593, "epoch": 4752} {"train_loss": -7.33299446105957, "global_step": 199594, "epoch": 4752} {"train_loss": -7.291637420654297, "global_step": 199595, "epoch": 4752} {"train_loss": -7.28200101852417, "global_step": 199596, "epoch": 4752} {"train_loss": -7.195852279663086, "global_step": 199597, "epoch": 4752} {"train_loss": -7.270443916320801, "global_step": 199598, "epoch": 4752} {"train_loss": -7.271432876586914, "global_step": 199599, "epoch": 4752} {"train_loss": -7.372881889343262, "global_step": 199600, "epoch": 4752} {"train_loss": -7.136131286621094, "global_step": 199601, "epoch": 4752} {"train_loss": -7.289419174194336, "global_step": 199602, "epoch": 4752} {"train_loss": -7.326398849487305, "global_step": 199603, "epoch": 4752} {"train_loss": -7.310384750366211, "global_step": 199604, "epoch": 4752} {"train_loss": -7.229240417480469, "global_step": 199605, "epoch": 4752} {"train_loss": -7.217041969299316, "global_step": 199606, "epoch": 4752} {"train_loss": -7.366199493408203, "global_step": 199607, "epoch": 4752} {"train_loss": -7.3078155517578125, "global_step": 199608, "epoch": 4752} {"train_loss": -7.105323791503906, "global_step": 199609, "epoch": 4752} {"train_loss": -7.405107498168945, "global_step": 199610, "epoch": 4752} {"train_loss": -7.1987810134887695, "global_step": 199611, "epoch": 4752} {"train_loss": -7.3185930252075195, "global_step": 199612, "epoch": 4752} {"train_loss": -7.286466121673584, "global_step": 199613, "epoch": 4752} {"train_loss": -7.178123474121094, "global_step": 199614, "epoch": 4752} {"train_loss": -7.305504322052002, "global_step": 199615, "epoch": 4752} {"train_loss": -7.2571868896484375, "global_step": 199616, "epoch": 4752} {"train_loss": -7.3379740715026855, "global_step": 199617, "epoch": 4752} {"train_loss": -7.171611785888672, "global_step": 199618, "epoch": 4752} {"train_loss": -7.3348612785339355, "global_step": 199619, "epoch": 4752} {"train_loss": -7.2466583251953125, "global_step": 199620, "epoch": 4752} {"train_loss": -7.3257551193237305, "global_step": 199621, "epoch": 4752} {"train_loss": -7.244837760925293, "global_step": 199622, "epoch": 4752} {"train_loss": -7.294485092163086, "global_step": 199623, "epoch": 4752} {"train_loss": -7.224091529846191, "global_step": 199624, "epoch": 4752} {"train_loss": -7.258374089286441, "global_step": 199625, "epoch": 4752, "val_loss": 81600.1484375} {"train_loss": -7.353806972503662, "global_step": 199626, "epoch": 4753} {"train_loss": -7.354925155639648, "global_step": 199627, "epoch": 4753} {"train_loss": -7.339644908905029, "global_step": 199628, "epoch": 4753} {"train_loss": -7.189493656158447, "global_step": 199629, "epoch": 4753} {"train_loss": -7.300896644592285, "global_step": 199630, "epoch": 4753} {"train_loss": -7.27955436706543, "global_step": 199631, "epoch": 4753} {"train_loss": -7.385204792022705, "global_step": 199632, "epoch": 4753} {"train_loss": -7.314697742462158, "global_step": 199633, "epoch": 4753} {"train_loss": -7.31517219543457, "global_step": 199634, "epoch": 4753} {"train_loss": -7.328508377075195, "global_step": 199635, "epoch": 4753} {"train_loss": -7.2957763671875, "global_step": 199636, "epoch": 4753} {"train_loss": -7.3689727783203125, "global_step": 199637, "epoch": 4753} {"train_loss": -7.247976303100586, "global_step": 199638, "epoch": 4753} {"train_loss": -7.392484188079834, "global_step": 199639, "epoch": 4753} {"train_loss": -7.32986307144165, "global_step": 199640, "epoch": 4753} {"train_loss": -7.4636735916137695, "global_step": 199641, "epoch": 4753} {"train_loss": -7.338659286499023, "global_step": 199642, "epoch": 4753} {"train_loss": -7.4151177406311035, "global_step": 199643, "epoch": 4753} {"train_loss": -7.333146095275879, "global_step": 199644, "epoch": 4753} {"train_loss": -7.2183027267456055, "global_step": 199645, "epoch": 4753} {"train_loss": -7.28593111038208, "global_step": 199646, "epoch": 4753} {"train_loss": -7.284332275390625, "global_step": 199647, "epoch": 4753} {"train_loss": -7.148673057556152, "global_step": 199648, "epoch": 4753} {"train_loss": -7.244877815246582, "global_step": 199649, "epoch": 4753} {"train_loss": -7.192257881164551, "global_step": 199650, "epoch": 4753} {"train_loss": -7.382509231567383, "global_step": 199651, "epoch": 4753} {"train_loss": -7.302929401397705, "global_step": 199652, "epoch": 4753} {"train_loss": -7.341996669769287, "global_step": 199653, "epoch": 4753} {"train_loss": -7.250857353210449, "global_step": 199654, "epoch": 4753} {"train_loss": -7.174653053283691, "global_step": 199655, "epoch": 4753} {"train_loss": -7.233400344848633, "global_step": 199656, "epoch": 4753} {"train_loss": -7.213939666748047, "global_step": 199657, "epoch": 4753} {"train_loss": -7.289685249328613, "global_step": 199658, "epoch": 4753} {"train_loss": -7.235520362854004, "global_step": 199659, "epoch": 4753} {"train_loss": -7.21244478225708, "global_step": 199660, "epoch": 4753} {"train_loss": -7.0495758056640625, "global_step": 199661, "epoch": 4753} {"train_loss": -7.320865631103516, "global_step": 199662, "epoch": 4753} {"train_loss": -7.144804954528809, "global_step": 199663, "epoch": 4753} {"train_loss": -7.239850044250488, "global_step": 199664, "epoch": 4753} {"train_loss": -7.2804155349731445, "global_step": 199665, "epoch": 4753} {"train_loss": -7.253605842590332, "global_step": 199666, "epoch": 4753} {"train_loss": -7.283223299753098, "global_step": 199667, "epoch": 4753, "val_loss": 81434.9375} {"train_loss": -7.17894983291626, "global_step": 199668, "epoch": 4754} {"train_loss": -7.3193511962890625, "global_step": 199669, "epoch": 4754} {"train_loss": -7.261940956115723, "global_step": 199670, "epoch": 4754} {"train_loss": -7.222630977630615, "global_step": 199671, "epoch": 4754} {"train_loss": -7.2946367263793945, "global_step": 199672, "epoch": 4754} {"train_loss": -7.317803382873535, "global_step": 199673, "epoch": 4754} {"train_loss": -7.310540199279785, "global_step": 199674, "epoch": 4754} {"train_loss": -7.324740886688232, "global_step": 199675, "epoch": 4754} {"train_loss": -7.288849353790283, "global_step": 199676, "epoch": 4754} {"train_loss": -7.390407562255859, "global_step": 199677, "epoch": 4754} {"train_loss": -7.392367839813232, "global_step": 199678, "epoch": 4754} {"train_loss": -7.265119552612305, "global_step": 199679, "epoch": 4754} {"train_loss": -7.213209629058838, "global_step": 199680, "epoch": 4754} {"train_loss": -7.277410507202148, "global_step": 199681, "epoch": 4754} {"train_loss": -7.39532995223999, "global_step": 199682, "epoch": 4754} {"train_loss": -7.418654441833496, "global_step": 199683, "epoch": 4754} {"train_loss": -7.357090950012207, "global_step": 199684, "epoch": 4754} {"train_loss": -7.333757400512695, "global_step": 199685, "epoch": 4754} {"train_loss": -7.2897844314575195, "global_step": 199686, "epoch": 4754} {"train_loss": -7.286159515380859, "global_step": 199687, "epoch": 4754} {"train_loss": -7.425833702087402, "global_step": 199688, "epoch": 4754} {"train_loss": -7.319536209106445, "global_step": 199689, "epoch": 4754} {"train_loss": -7.274954795837402, "global_step": 199690, "epoch": 4754} {"train_loss": -7.529151916503906, "global_step": 199691, "epoch": 4754} {"train_loss": -7.390976905822754, "global_step": 199692, "epoch": 4754} {"train_loss": -7.462907791137695, "global_step": 199693, "epoch": 4754} {"train_loss": -7.344875335693359, "global_step": 199694, "epoch": 4754} {"train_loss": -7.398141384124756, "global_step": 199695, "epoch": 4754} {"train_loss": -7.312646865844727, "global_step": 199696, "epoch": 4754} {"train_loss": -7.414532661437988, "global_step": 199697, "epoch": 4754} {"train_loss": -7.354578018188477, "global_step": 199698, "epoch": 4754} {"train_loss": -7.445509910583496, "global_step": 199699, "epoch": 4754} {"train_loss": -7.285867691040039, "global_step": 199700, "epoch": 4754} {"train_loss": -7.371030807495117, "global_step": 199701, "epoch": 4754} {"train_loss": -7.412284851074219, "global_step": 199702, "epoch": 4754} {"train_loss": -7.229568958282471, "global_step": 199703, "epoch": 4754} {"train_loss": -7.279242515563965, "global_step": 199704, "epoch": 4754} {"train_loss": -7.374045372009277, "global_step": 199705, "epoch": 4754} {"train_loss": -7.385482311248779, "global_step": 199706, "epoch": 4754} {"train_loss": -7.241976261138916, "global_step": 199707, "epoch": 4754} {"train_loss": -7.216559410095215, "global_step": 199708, "epoch": 4754} {"train_loss": -7.332787820271084, "global_step": 199709, "epoch": 4754, "val_loss": 81324.2109375} {"train_loss": -7.295066833496094, "global_step": 199710, "epoch": 4755} {"train_loss": -7.209301948547363, "global_step": 199711, "epoch": 4755} {"train_loss": -7.421445846557617, "global_step": 199712, "epoch": 4755} {"train_loss": -7.149964332580566, "global_step": 199713, "epoch": 4755} {"train_loss": -7.275001525878906, "global_step": 199714, "epoch": 4755} {"train_loss": -7.251395225524902, "global_step": 199715, "epoch": 4755} {"train_loss": -7.293676853179932, "global_step": 199716, "epoch": 4755} {"train_loss": -7.289987564086914, "global_step": 199717, "epoch": 4755} {"train_loss": -7.361021518707275, "global_step": 199718, "epoch": 4755} {"train_loss": -7.320558071136475, "global_step": 199719, "epoch": 4755} {"train_loss": -7.288527011871338, "global_step": 199720, "epoch": 4755} {"train_loss": -7.322207450866699, "global_step": 199721, "epoch": 4755} {"train_loss": -7.189104080200195, "global_step": 199722, "epoch": 4755} {"train_loss": -7.31845235824585, "global_step": 199723, "epoch": 4755} {"train_loss": -7.356532096862793, "global_step": 199724, "epoch": 4755} {"train_loss": -7.235569953918457, "global_step": 199725, "epoch": 4755} {"train_loss": -7.2943925857543945, "global_step": 199726, "epoch": 4755} {"train_loss": -7.296582221984863, "global_step": 199727, "epoch": 4755} {"train_loss": -7.087798118591309, "global_step": 199728, "epoch": 4755} {"train_loss": -7.2849531173706055, "global_step": 199729, "epoch": 4755} {"train_loss": -7.337719917297363, "global_step": 199730, "epoch": 4755} {"train_loss": -7.248116493225098, "global_step": 199731, "epoch": 4755} {"train_loss": -7.367039203643799, "global_step": 199732, "epoch": 4755} {"train_loss": -7.319074630737305, "global_step": 199733, "epoch": 4755} {"train_loss": -7.421823501586914, "global_step": 199734, "epoch": 4755} {"train_loss": -7.32315731048584, "global_step": 199735, "epoch": 4755} {"train_loss": -7.267334461212158, "global_step": 199736, "epoch": 4755} {"train_loss": -7.395370960235596, "global_step": 199737, "epoch": 4755} {"train_loss": -7.3371171951293945, "global_step": 199738, "epoch": 4755} {"train_loss": -7.332655906677246, "global_step": 199739, "epoch": 4755} {"train_loss": -7.187292098999023, "global_step": 199740, "epoch": 4755} {"train_loss": -7.146732330322266, "global_step": 199741, "epoch": 4755} {"train_loss": -7.248373508453369, "global_step": 199742, "epoch": 4755} {"train_loss": -7.33790397644043, "global_step": 199743, "epoch": 4755} {"train_loss": -7.262327671051025, "global_step": 199744, "epoch": 4755} {"train_loss": -7.220486640930176, "global_step": 199745, "epoch": 4755} {"train_loss": -7.331175804138184, "global_step": 199746, "epoch": 4755} {"train_loss": -7.35366678237915, "global_step": 199747, "epoch": 4755} {"train_loss": -7.272256851196289, "global_step": 199748, "epoch": 4755} {"train_loss": -7.316261291503906, "global_step": 199749, "epoch": 4755} {"train_loss": -7.222055435180664, "global_step": 199750, "epoch": 4755} {"train_loss": -7.288164343152728, "global_step": 199751, "epoch": 4755, "val_loss": 81441.0625} {"train_loss": -7.267285346984863, "global_step": 199752, "epoch": 4756} {"train_loss": -7.315519332885742, "global_step": 199753, "epoch": 4756} {"train_loss": -7.284435272216797, "global_step": 199754, "epoch": 4756} {"train_loss": -7.368292331695557, "global_step": 199755, "epoch": 4756} {"train_loss": -7.154685974121094, "global_step": 199756, "epoch": 4756} {"train_loss": -7.280698776245117, "global_step": 199757, "epoch": 4756} {"train_loss": -7.364886283874512, "global_step": 199758, "epoch": 4756} {"train_loss": -7.311290740966797, "global_step": 199759, "epoch": 4756} {"train_loss": -7.38466215133667, "global_step": 199760, "epoch": 4756} {"train_loss": -7.270129203796387, "global_step": 199761, "epoch": 4756} {"train_loss": -7.259669303894043, "global_step": 199762, "epoch": 4756} {"train_loss": -7.355610370635986, "global_step": 199763, "epoch": 4756} {"train_loss": -7.225316524505615, "global_step": 199764, "epoch": 4756} {"train_loss": -7.426886081695557, "global_step": 199765, "epoch": 4756} {"train_loss": -7.250480651855469, "global_step": 199766, "epoch": 4756} {"train_loss": -7.2639384269714355, "global_step": 199767, "epoch": 4756} {"train_loss": -7.2838640213012695, "global_step": 199768, "epoch": 4756} {"train_loss": -7.271871566772461, "global_step": 199769, "epoch": 4756} {"train_loss": -7.223559379577637, "global_step": 199770, "epoch": 4756} {"train_loss": -7.160045623779297, "global_step": 199771, "epoch": 4756} {"train_loss": -7.219820022583008, "global_step": 199772, "epoch": 4756} {"train_loss": -7.346381187438965, "global_step": 199773, "epoch": 4756} {"train_loss": -7.405712127685547, "global_step": 199774, "epoch": 4756} {"train_loss": -7.187628746032715, "global_step": 199775, "epoch": 4756} {"train_loss": -7.162805557250977, "global_step": 199776, "epoch": 4756} {"train_loss": -7.2108001708984375, "global_step": 199777, "epoch": 4756} {"train_loss": -7.266308307647705, "global_step": 199778, "epoch": 4756} {"train_loss": -7.3098344802856445, "global_step": 199779, "epoch": 4756} {"train_loss": -7.325616836547852, "global_step": 199780, "epoch": 4756} {"train_loss": -7.37984561920166, "global_step": 199781, "epoch": 4756} {"train_loss": -7.28448486328125, "global_step": 199782, "epoch": 4756} {"train_loss": -7.303027629852295, "global_step": 199783, "epoch": 4756} {"train_loss": -7.294064521789551, "global_step": 199784, "epoch": 4756} {"train_loss": -7.304896354675293, "global_step": 199785, "epoch": 4756} {"train_loss": -7.250688552856445, "global_step": 199786, "epoch": 4756} {"train_loss": -7.203839302062988, "global_step": 199787, "epoch": 4756} {"train_loss": -7.1694464683532715, "global_step": 199788, "epoch": 4756} {"train_loss": -7.251341819763184, "global_step": 199789, "epoch": 4756} {"train_loss": -7.0758466720581055, "global_step": 199790, "epoch": 4756} {"train_loss": -7.318628787994385, "global_step": 199791, "epoch": 4756} {"train_loss": -7.184978485107422, "global_step": 199792, "epoch": 4756} {"train_loss": -7.27325389498756, "global_step": 199793, "epoch": 4756, "val_loss": 81634.2734375} {"train_loss": -7.314847946166992, "global_step": 199794, "epoch": 4757} {"train_loss": -7.237612247467041, "global_step": 199795, "epoch": 4757} {"train_loss": -7.266837120056152, "global_step": 199796, "epoch": 4757} {"train_loss": -7.159182548522949, "global_step": 199797, "epoch": 4757} {"train_loss": -7.134028434753418, "global_step": 199798, "epoch": 4757} {"train_loss": -7.293551921844482, "global_step": 199799, "epoch": 4757} {"train_loss": -7.142932415008545, "global_step": 199800, "epoch": 4757} {"train_loss": -7.030987739562988, "global_step": 199801, "epoch": 4757} {"train_loss": -7.30768346786499, "global_step": 199802, "epoch": 4757} {"train_loss": -7.039116382598877, "global_step": 199803, "epoch": 4757} {"train_loss": -7.272417068481445, "global_step": 199804, "epoch": 4757} {"train_loss": -7.046807765960693, "global_step": 199805, "epoch": 4757} {"train_loss": -7.141151428222656, "global_step": 199806, "epoch": 4757} {"train_loss": -7.179953575134277, "global_step": 199807, "epoch": 4757} {"train_loss": -7.253357887268066, "global_step": 199808, "epoch": 4757} {"train_loss": -7.294661521911621, "global_step": 199809, "epoch": 4757} {"train_loss": -7.253952980041504, "global_step": 199810, "epoch": 4757} {"train_loss": -7.235156059265137, "global_step": 199811, "epoch": 4757} {"train_loss": -7.245544910430908, "global_step": 199812, "epoch": 4757} {"train_loss": -7.2391533851623535, "global_step": 199813, "epoch": 4757} {"train_loss": -7.259166717529297, "global_step": 199814, "epoch": 4757} {"train_loss": -7.308346271514893, "global_step": 199815, "epoch": 4757} {"train_loss": -7.206696510314941, "global_step": 199816, "epoch": 4757} {"train_loss": -7.176481246948242, "global_step": 199817, "epoch": 4757} {"train_loss": -7.371468544006348, "global_step": 199818, "epoch": 4757} {"train_loss": -7.23197603225708, "global_step": 199819, "epoch": 4757} {"train_loss": -7.350655555725098, "global_step": 199820, "epoch": 4757} {"train_loss": -7.271914005279541, "global_step": 199821, "epoch": 4757} {"train_loss": -7.262244701385498, "global_step": 199822, "epoch": 4757} {"train_loss": -7.387454986572266, "global_step": 199823, "epoch": 4757} {"train_loss": -7.1953959465026855, "global_step": 199824, "epoch": 4757} {"train_loss": -7.349823951721191, "global_step": 199825, "epoch": 4757} {"train_loss": -7.322563171386719, "global_step": 199826, "epoch": 4757} {"train_loss": -7.334561347961426, "global_step": 199827, "epoch": 4757} {"train_loss": -7.294417381286621, "global_step": 199828, "epoch": 4757} {"train_loss": -7.414520263671875, "global_step": 199829, "epoch": 4757} {"train_loss": -7.357349395751953, "global_step": 199830, "epoch": 4757} {"train_loss": -7.296444892883301, "global_step": 199831, "epoch": 4757} {"train_loss": -7.279364585876465, "global_step": 199832, "epoch": 4757} {"train_loss": -7.3643035888671875, "global_step": 199833, "epoch": 4757} {"train_loss": -7.195823669433594, "global_step": 199834, "epoch": 4757} {"train_loss": -7.25195186478751, "global_step": 199835, "epoch": 4757, "val_loss": 81373.96875} {"train_loss": -7.337480545043945, "global_step": 199836, "epoch": 4758} {"train_loss": -7.355844497680664, "global_step": 199837, "epoch": 4758} {"train_loss": -7.490816116333008, "global_step": 199838, "epoch": 4758} {"train_loss": -7.2333502769470215, "global_step": 199839, "epoch": 4758} {"train_loss": -7.424370765686035, "global_step": 199840, "epoch": 4758} {"train_loss": -7.367707252502441, "global_step": 199841, "epoch": 4758} {"train_loss": -7.2517499923706055, "global_step": 199842, "epoch": 4758} {"train_loss": -7.407883167266846, "global_step": 199843, "epoch": 4758} {"train_loss": -7.309757232666016, "global_step": 199844, "epoch": 4758} {"train_loss": -7.30489444732666, "global_step": 199845, "epoch": 4758} {"train_loss": -7.291939735412598, "global_step": 199846, "epoch": 4758} {"train_loss": -7.248567581176758, "global_step": 199847, "epoch": 4758} {"train_loss": -7.258642196655273, "global_step": 199848, "epoch": 4758} {"train_loss": -7.296847343444824, "global_step": 199849, "epoch": 4758} {"train_loss": -7.309141159057617, "global_step": 199850, "epoch": 4758} {"train_loss": -7.334396839141846, "global_step": 199851, "epoch": 4758} {"train_loss": -7.287563323974609, "global_step": 199852, "epoch": 4758} {"train_loss": -7.322712421417236, "global_step": 199853, "epoch": 4758} {"train_loss": -7.370244979858398, "global_step": 199854, "epoch": 4758} {"train_loss": -7.324955940246582, "global_step": 199855, "epoch": 4758} {"train_loss": -7.256901741027832, "global_step": 199856, "epoch": 4758} {"train_loss": -7.386817932128906, "global_step": 199857, "epoch": 4758} {"train_loss": -7.428801536560059, "global_step": 199858, "epoch": 4758} {"train_loss": -7.342823028564453, "global_step": 199859, "epoch": 4758} {"train_loss": -7.318419933319092, "global_step": 199860, "epoch": 4758} {"train_loss": -7.3628716468811035, "global_step": 199861, "epoch": 4758} {"train_loss": -7.388419151306152, "global_step": 199862, "epoch": 4758} {"train_loss": -7.35076904296875, "global_step": 199863, "epoch": 4758} {"train_loss": -7.369004726409912, "global_step": 199864, "epoch": 4758} {"train_loss": -7.259120941162109, "global_step": 199865, "epoch": 4758} {"train_loss": -7.298900604248047, "global_step": 199866, "epoch": 4758} {"train_loss": -7.333259105682373, "global_step": 199867, "epoch": 4758} {"train_loss": -7.42091178894043, "global_step": 199868, "epoch": 4758} {"train_loss": -7.285440444946289, "global_step": 199869, "epoch": 4758} {"train_loss": -7.354548931121826, "global_step": 199870, "epoch": 4758} {"train_loss": -7.363964080810547, "global_step": 199871, "epoch": 4758} {"train_loss": -7.205311298370361, "global_step": 199872, "epoch": 4758} {"train_loss": -7.126577854156494, "global_step": 199873, "epoch": 4758} {"train_loss": -7.182769775390625, "global_step": 199874, "epoch": 4758} {"train_loss": -7.208629608154297, "global_step": 199875, "epoch": 4758} {"train_loss": -7.0211944580078125, "global_step": 199876, "epoch": 4758} {"train_loss": -7.307104950859433, "global_step": 199877, "epoch": 4758, "val_loss": 81503.171875} {"train_loss": -7.1178693771362305, "global_step": 199878, "epoch": 4759} {"train_loss": -6.863337516784668, "global_step": 199879, "epoch": 4759} {"train_loss": -7.278594970703125, "global_step": 199880, "epoch": 4759} {"train_loss": -7.1378631591796875, "global_step": 199881, "epoch": 4759} {"train_loss": -7.080745697021484, "global_step": 199882, "epoch": 4759} {"train_loss": -7.27172327041626, "global_step": 199883, "epoch": 4759} {"train_loss": -7.181609630584717, "global_step": 199884, "epoch": 4759} {"train_loss": -7.2743821144104, "global_step": 199885, "epoch": 4759} {"train_loss": -7.251210689544678, "global_step": 199886, "epoch": 4759} {"train_loss": -7.231378555297852, "global_step": 199887, "epoch": 4759} {"train_loss": -7.247962951660156, "global_step": 199888, "epoch": 4759} {"train_loss": -7.192901134490967, "global_step": 199889, "epoch": 4759} {"train_loss": -7.296679496765137, "global_step": 199890, "epoch": 4759} {"train_loss": -7.225825786590576, "global_step": 199891, "epoch": 4759} {"train_loss": -7.402032375335693, "global_step": 199892, "epoch": 4759} {"train_loss": -7.231750965118408, "global_step": 199893, "epoch": 4759} {"train_loss": -7.409191608428955, "global_step": 199894, "epoch": 4759} {"train_loss": -7.296050071716309, "global_step": 199895, "epoch": 4759} {"train_loss": -7.3007354736328125, "global_step": 199896, "epoch": 4759} {"train_loss": -7.338921546936035, "global_step": 199897, "epoch": 4759} {"train_loss": -7.3053436279296875, "global_step": 199898, "epoch": 4759} {"train_loss": -7.172781944274902, "global_step": 199899, "epoch": 4759} {"train_loss": -7.287941932678223, "global_step": 199900, "epoch": 4759} {"train_loss": -7.126760959625244, "global_step": 199901, "epoch": 4759} {"train_loss": -7.327334880828857, "global_step": 199902, "epoch": 4759} {"train_loss": -7.102972984313965, "global_step": 199903, "epoch": 4759} {"train_loss": -7.255188465118408, "global_step": 199904, "epoch": 4759} {"train_loss": -7.073273658752441, "global_step": 199905, "epoch": 4759} {"train_loss": -7.245412349700928, "global_step": 199906, "epoch": 4759} {"train_loss": -7.135858535766602, "global_step": 199907, "epoch": 4759} {"train_loss": -7.1890435218811035, "global_step": 199908, "epoch": 4759} {"train_loss": -7.126735687255859, "global_step": 199909, "epoch": 4759} {"train_loss": -7.281636714935303, "global_step": 199910, "epoch": 4759} {"train_loss": -7.170897006988525, "global_step": 199911, "epoch": 4759} {"train_loss": -7.171632766723633, "global_step": 199912, "epoch": 4759} {"train_loss": -7.320908546447754, "global_step": 199913, "epoch": 4759} {"train_loss": -7.193014621734619, "global_step": 199914, "epoch": 4759} {"train_loss": -7.210559368133545, "global_step": 199915, "epoch": 4759} {"train_loss": -7.139617919921875, "global_step": 199916, "epoch": 4759} {"train_loss": -7.261814594268799, "global_step": 199917, "epoch": 4759} {"train_loss": -7.350644588470459, "global_step": 199918, "epoch": 4759} {"train_loss": -7.221380301884243, "global_step": 199919, "epoch": 4759, "val_loss": 81581.8671875} {"train_loss": -7.259438514709473, "global_step": 199920, "epoch": 4760} {"train_loss": -7.220468521118164, "global_step": 199921, "epoch": 4760} {"train_loss": -7.2215704917907715, "global_step": 199922, "epoch": 4760} {"train_loss": -7.169738292694092, "global_step": 199923, "epoch": 4760} {"train_loss": -7.341179370880127, "global_step": 199924, "epoch": 4760} {"train_loss": -7.266654968261719, "global_step": 199925, "epoch": 4760} {"train_loss": -7.219438552856445, "global_step": 199926, "epoch": 4760} {"train_loss": -7.27077579498291, "global_step": 199927, "epoch": 4760} {"train_loss": -7.159958839416504, "global_step": 199928, "epoch": 4760} {"train_loss": -7.368809700012207, "global_step": 199929, "epoch": 4760} {"train_loss": -7.264253616333008, "global_step": 199930, "epoch": 4760} {"train_loss": -7.254137992858887, "global_step": 199931, "epoch": 4760} {"train_loss": -7.289056777954102, "global_step": 199932, "epoch": 4760} {"train_loss": -7.276819229125977, "global_step": 199933, "epoch": 4760} {"train_loss": -7.329461097717285, "global_step": 199934, "epoch": 4760} {"train_loss": -7.203432559967041, "global_step": 199935, "epoch": 4760} {"train_loss": -7.42765474319458, "global_step": 199936, "epoch": 4760} {"train_loss": -7.316910266876221, "global_step": 199937, "epoch": 4760} {"train_loss": -7.339925765991211, "global_step": 199938, "epoch": 4760} {"train_loss": -7.344983100891113, "global_step": 199939, "epoch": 4760} {"train_loss": -7.330495834350586, "global_step": 199940, "epoch": 4760} {"train_loss": -7.359307765960693, "global_step": 199941, "epoch": 4760} {"train_loss": -7.3143157958984375, "global_step": 199942, "epoch": 4760} {"train_loss": -7.351188659667969, "global_step": 199943, "epoch": 4760} {"train_loss": -7.454118728637695, "global_step": 199944, "epoch": 4760} {"train_loss": -7.333260536193848, "global_step": 199945, "epoch": 4760} {"train_loss": -7.324878215789795, "global_step": 199946, "epoch": 4760} {"train_loss": -7.326574802398682, "global_step": 199947, "epoch": 4760} {"train_loss": -7.208291530609131, "global_step": 199948, "epoch": 4760} {"train_loss": -7.3566694259643555, "global_step": 199949, "epoch": 4760} {"train_loss": -7.274600505828857, "global_step": 199950, "epoch": 4760} {"train_loss": -7.436182022094727, "global_step": 199951, "epoch": 4760} {"train_loss": -7.32939338684082, "global_step": 199952, "epoch": 4760} {"train_loss": -7.390265941619873, "global_step": 199953, "epoch": 4760} {"train_loss": -7.329176425933838, "global_step": 199954, "epoch": 4760} {"train_loss": -7.345200538635254, "global_step": 199955, "epoch": 4760} {"train_loss": -7.411110877990723, "global_step": 199956, "epoch": 4760} {"train_loss": -7.378693580627441, "global_step": 199957, "epoch": 4760} {"train_loss": -7.23441219329834, "global_step": 199958, "epoch": 4760} {"train_loss": -7.307244777679443, "global_step": 199959, "epoch": 4760} {"train_loss": -7.340649604797363, "global_step": 199960, "epoch": 4760} {"train_loss": -7.309561059588478, "global_step": 199961, "epoch": 4760, "val_loss": 81514.1328125} {"train_loss": -7.415431976318359, "global_step": 199962, "epoch": 4761} {"train_loss": -7.388240814208984, "global_step": 199963, "epoch": 4761} {"train_loss": -7.321952819824219, "global_step": 199964, "epoch": 4761} {"train_loss": -7.370601654052734, "global_step": 199965, "epoch": 4761} {"train_loss": -7.352890968322754, "global_step": 199966, "epoch": 4761} {"train_loss": -7.28127384185791, "global_step": 199967, "epoch": 4761} {"train_loss": -7.235387802124023, "global_step": 199968, "epoch": 4761} {"train_loss": -7.393096446990967, "global_step": 199969, "epoch": 4761} {"train_loss": -7.392599582672119, "global_step": 199970, "epoch": 4761} {"train_loss": -7.2175188064575195, "global_step": 199971, "epoch": 4761} {"train_loss": -7.374274253845215, "global_step": 199972, "epoch": 4761} {"train_loss": -7.254101753234863, "global_step": 199973, "epoch": 4761} {"train_loss": -7.179999351501465, "global_step": 199974, "epoch": 4761} {"train_loss": -7.2470197677612305, "global_step": 199975, "epoch": 4761} {"train_loss": -7.343632698059082, "global_step": 199976, "epoch": 4761} {"train_loss": -7.195696830749512, "global_step": 199977, "epoch": 4761} {"train_loss": -7.304559230804443, "global_step": 199978, "epoch": 4761} {"train_loss": -7.147171974182129, "global_step": 199979, "epoch": 4761} {"train_loss": -7.17509651184082, "global_step": 199980, "epoch": 4761} {"train_loss": -7.265872478485107, "global_step": 199981, "epoch": 4761} {"train_loss": -7.250536918640137, "global_step": 199982, "epoch": 4761} {"train_loss": -7.26725959777832, "global_step": 199983, "epoch": 4761} {"train_loss": -7.227011680603027, "global_step": 199984, "epoch": 4761} {"train_loss": -7.14248514175415, "global_step": 199985, "epoch": 4761} {"train_loss": -7.213964939117432, "global_step": 199986, "epoch": 4761} {"train_loss": -7.1621809005737305, "global_step": 199987, "epoch": 4761} {"train_loss": -7.045170783996582, "global_step": 199988, "epoch": 4761} {"train_loss": -7.204336643218994, "global_step": 199989, "epoch": 4761} {"train_loss": -7.244097709655762, "global_step": 199990, "epoch": 4761} {"train_loss": -7.240246295928955, "global_step": 199991, "epoch": 4761} {"train_loss": -7.293956756591797, "global_step": 199992, "epoch": 4761} {"train_loss": -7.271728992462158, "global_step": 199993, "epoch": 4761} {"train_loss": -7.248353004455566, "global_step": 199994, "epoch": 4761} {"train_loss": -7.0340986251831055, "global_step": 199995, "epoch": 4761} {"train_loss": -7.187848091125488, "global_step": 199996, "epoch": 4761} {"train_loss": -7.235694408416748, "global_step": 199997, "epoch": 4761} {"train_loss": -7.237639427185059, "global_step": 199998, "epoch": 4761} {"train_loss": -7.311728477478027, "global_step": 199999, "epoch": 4761} {"train_loss": -7.277487754821777, "global_step": 200000, "epoch": 4761} {"train_loss": -7.314792633056641, "global_step": 200001, "epoch": 4761} {"train_loss": -7.310264587402344, "global_step": 200002, "epoch": 4761} {"train_loss": -7.261123134976342, "global_step": 200003, "epoch": 4761, "val_loss": 81520.328125} {"train_loss": -7.392084121704102, "global_step": 200004, "epoch": 4762} {"train_loss": -7.343900203704834, "global_step": 200005, "epoch": 4762} {"train_loss": -7.438342094421387, "global_step": 200006, "epoch": 4762} {"train_loss": -7.47023344039917, "global_step": 200007, "epoch": 4762} {"train_loss": -7.329713821411133, "global_step": 200008, "epoch": 4762} {"train_loss": -7.369109153747559, "global_step": 200009, "epoch": 4762} {"train_loss": -7.283714294433594, "global_step": 200010, "epoch": 4762} {"train_loss": -7.188963413238525, "global_step": 200011, "epoch": 4762} {"train_loss": -7.345857620239258, "global_step": 200012, "epoch": 4762} {"train_loss": -7.296473503112793, "global_step": 200013, "epoch": 4762} {"train_loss": -7.329944610595703, "global_step": 200014, "epoch": 4762} {"train_loss": -7.293324947357178, "global_step": 200015, "epoch": 4762} {"train_loss": -7.186488628387451, "global_step": 200016, "epoch": 4762} {"train_loss": -7.385215759277344, "global_step": 200017, "epoch": 4762} {"train_loss": -7.266121864318848, "global_step": 200018, "epoch": 4762} {"train_loss": -7.235750675201416, "global_step": 200019, "epoch": 4762} {"train_loss": -7.237959861755371, "global_step": 200020, "epoch": 4762} {"train_loss": -7.38429594039917, "global_step": 200021, "epoch": 4762} {"train_loss": -7.2015838623046875, "global_step": 200022, "epoch": 4762} {"train_loss": -7.338122367858887, "global_step": 200023, "epoch": 4762} {"train_loss": -7.180695533752441, "global_step": 200024, "epoch": 4762} {"train_loss": -7.080624580383301, "global_step": 200025, "epoch": 4762} {"train_loss": -7.2935872077941895, "global_step": 200026, "epoch": 4762} {"train_loss": -7.216914176940918, "global_step": 200027, "epoch": 4762} {"train_loss": -7.264925956726074, "global_step": 200028, "epoch": 4762} {"train_loss": -7.220523834228516, "global_step": 200029, "epoch": 4762} {"train_loss": -7.048741817474365, "global_step": 200030, "epoch": 4762} {"train_loss": -7.2319841384887695, "global_step": 200031, "epoch": 4762} {"train_loss": -7.094052314758301, "global_step": 200032, "epoch": 4762} {"train_loss": -7.082812309265137, "global_step": 200033, "epoch": 4762} {"train_loss": -7.214756011962891, "global_step": 200034, "epoch": 4762} {"train_loss": -7.195589065551758, "global_step": 200035, "epoch": 4762} {"train_loss": -7.225846767425537, "global_step": 200036, "epoch": 4762} {"train_loss": -7.208849906921387, "global_step": 200037, "epoch": 4762} {"train_loss": -7.1647257804870605, "global_step": 200038, "epoch": 4762} {"train_loss": -7.171458721160889, "global_step": 200039, "epoch": 4762} {"train_loss": -7.137945175170898, "global_step": 200040, "epoch": 4762} {"train_loss": -7.166988372802734, "global_step": 200041, "epoch": 4762} {"train_loss": -7.18366003036499, "global_step": 200042, "epoch": 4762} {"train_loss": -7.037954330444336, "global_step": 200043, "epoch": 4762} {"train_loss": -7.058811187744141, "global_step": 200044, "epoch": 4762} {"train_loss": -7.239572911035447, "global_step": 200045, "epoch": 4762, "val_loss": 81614.4609375} {"train_loss": -7.180962562561035, "global_step": 200046, "epoch": 4763} {"train_loss": -7.331936836242676, "global_step": 200047, "epoch": 4763} {"train_loss": -7.160066604614258, "global_step": 200048, "epoch": 4763} {"train_loss": -7.301376819610596, "global_step": 200049, "epoch": 4763} {"train_loss": -7.261938095092773, "global_step": 200050, "epoch": 4763} {"train_loss": -7.272346019744873, "global_step": 200051, "epoch": 4763} {"train_loss": -7.267144680023193, "global_step": 200052, "epoch": 4763} {"train_loss": -7.097268104553223, "global_step": 200053, "epoch": 4763} {"train_loss": -7.256916046142578, "global_step": 200054, "epoch": 4763} {"train_loss": -7.063052177429199, "global_step": 200055, "epoch": 4763} {"train_loss": -7.293463706970215, "global_step": 200056, "epoch": 4763} {"train_loss": -7.299441337585449, "global_step": 200057, "epoch": 4763} {"train_loss": -7.139932632446289, "global_step": 200058, "epoch": 4763} {"train_loss": -7.347634315490723, "global_step": 200059, "epoch": 4763} {"train_loss": -7.2430620193481445, "global_step": 200060, "epoch": 4763} {"train_loss": -7.189516067504883, "global_step": 200061, "epoch": 4763} {"train_loss": -7.291975975036621, "global_step": 200062, "epoch": 4763} {"train_loss": -7.043128967285156, "global_step": 200063, "epoch": 4763} {"train_loss": -7.235228061676025, "global_step": 200064, "epoch": 4763} {"train_loss": -7.133517742156982, "global_step": 200065, "epoch": 4763} {"train_loss": -7.248453140258789, "global_step": 200066, "epoch": 4763} {"train_loss": -7.169613361358643, "global_step": 200067, "epoch": 4763} {"train_loss": -7.228227615356445, "global_step": 200068, "epoch": 4763} {"train_loss": -7.234955787658691, "global_step": 200069, "epoch": 4763} {"train_loss": -7.268581390380859, "global_step": 200070, "epoch": 4763} {"train_loss": -7.212372779846191, "global_step": 200071, "epoch": 4763} {"train_loss": -7.360716342926025, "global_step": 200072, "epoch": 4763} {"train_loss": -7.317549705505371, "global_step": 200073, "epoch": 4763} {"train_loss": -7.210000514984131, "global_step": 200074, "epoch": 4763} {"train_loss": -7.3269758224487305, "global_step": 200075, "epoch": 4763} {"train_loss": -7.194568157196045, "global_step": 200076, "epoch": 4763} {"train_loss": -7.316126823425293, "global_step": 200077, "epoch": 4763} {"train_loss": -7.338153839111328, "global_step": 200078, "epoch": 4763} {"train_loss": -7.252003192901611, "global_step": 200079, "epoch": 4763} {"train_loss": -7.33338737487793, "global_step": 200080, "epoch": 4763} {"train_loss": -7.229239463806152, "global_step": 200081, "epoch": 4763} {"train_loss": -7.247905254364014, "global_step": 200082, "epoch": 4763} {"train_loss": -7.219542980194092, "global_step": 200083, "epoch": 4763} {"train_loss": -7.242196083068848, "global_step": 200084, "epoch": 4763} {"train_loss": -7.292798042297363, "global_step": 200085, "epoch": 4763} {"train_loss": -7.118373394012451, "global_step": 200086, "epoch": 4763} {"train_loss": -7.23885592960176, "global_step": 200087, "epoch": 4763, "val_loss": 81374.953125} {"train_loss": -7.205854415893555, "global_step": 200088, "epoch": 4764} {"train_loss": -7.297983169555664, "global_step": 200089, "epoch": 4764} {"train_loss": -7.356766700744629, "global_step": 200090, "epoch": 4764} {"train_loss": -7.350132942199707, "global_step": 200091, "epoch": 4764} {"train_loss": -7.298878192901611, "global_step": 200092, "epoch": 4764} {"train_loss": -7.133955001831055, "global_step": 200093, "epoch": 4764} {"train_loss": -7.274371147155762, "global_step": 200094, "epoch": 4764} {"train_loss": -7.389077186584473, "global_step": 200095, "epoch": 4764} {"train_loss": -7.351313591003418, "global_step": 200096, "epoch": 4764} {"train_loss": -7.2608747482299805, "global_step": 200097, "epoch": 4764} {"train_loss": -7.339070796966553, "global_step": 200098, "epoch": 4764} {"train_loss": -7.3483452796936035, "global_step": 200099, "epoch": 4764} {"train_loss": -7.362149238586426, "global_step": 200100, "epoch": 4764} {"train_loss": -7.314006805419922, "global_step": 200101, "epoch": 4764} {"train_loss": -7.240849494934082, "global_step": 200102, "epoch": 4764} {"train_loss": -7.410223007202148, "global_step": 200103, "epoch": 4764} {"train_loss": -7.183500289916992, "global_step": 200104, "epoch": 4764} {"train_loss": -7.295631408691406, "global_step": 200105, "epoch": 4764} {"train_loss": -7.298116683959961, "global_step": 200106, "epoch": 4764} {"train_loss": -7.231671333312988, "global_step": 200107, "epoch": 4764} {"train_loss": -7.337190628051758, "global_step": 200108, "epoch": 4764} {"train_loss": -7.304330825805664, "global_step": 200109, "epoch": 4764} {"train_loss": -7.401514053344727, "global_step": 200110, "epoch": 4764} {"train_loss": -7.312569618225098, "global_step": 200111, "epoch": 4764} {"train_loss": -7.323972702026367, "global_step": 200112, "epoch": 4764} {"train_loss": -7.307077407836914, "global_step": 200113, "epoch": 4764} {"train_loss": -7.369867324829102, "global_step": 200114, "epoch": 4764} {"train_loss": -7.315181732177734, "global_step": 200115, "epoch": 4764} {"train_loss": -7.217739582061768, "global_step": 200116, "epoch": 4764} {"train_loss": -7.2712626457214355, "global_step": 200117, "epoch": 4764} {"train_loss": -7.375790596008301, "global_step": 200118, "epoch": 4764} {"train_loss": -7.263047218322754, "global_step": 200119, "epoch": 4764} {"train_loss": -7.3420634269714355, "global_step": 200120, "epoch": 4764} {"train_loss": -7.310441970825195, "global_step": 200121, "epoch": 4764} {"train_loss": -7.281686782836914, "global_step": 200122, "epoch": 4764} {"train_loss": -7.238210201263428, "global_step": 200123, "epoch": 4764} {"train_loss": -7.282668113708496, "global_step": 200124, "epoch": 4764} {"train_loss": -7.1212615966796875, "global_step": 200125, "epoch": 4764} {"train_loss": -7.3740763664245605, "global_step": 200126, "epoch": 4764} {"train_loss": -7.342001914978027, "global_step": 200127, "epoch": 4764} {"train_loss": -7.315543174743652, "global_step": 200128, "epoch": 4764} {"train_loss": -7.3014425323123024, "global_step": 200129, "epoch": 4764, "val_loss": 81639.9453125} {"train_loss": -7.281249046325684, "global_step": 200130, "epoch": 4765} {"train_loss": -7.228175163269043, "global_step": 200131, "epoch": 4765} {"train_loss": -7.313873291015625, "global_step": 200132, "epoch": 4765} {"train_loss": -7.31887149810791, "global_step": 200133, "epoch": 4765} {"train_loss": -7.361347198486328, "global_step": 200134, "epoch": 4765} {"train_loss": -7.251197814941406, "global_step": 200135, "epoch": 4765} {"train_loss": -7.345611572265625, "global_step": 200136, "epoch": 4765} {"train_loss": -7.3517608642578125, "global_step": 200137, "epoch": 4765} {"train_loss": -7.370681285858154, "global_step": 200138, "epoch": 4765} {"train_loss": -7.448245048522949, "global_step": 200139, "epoch": 4765} {"train_loss": -7.397150039672852, "global_step": 200140, "epoch": 4765} {"train_loss": -7.385293960571289, "global_step": 200141, "epoch": 4765} {"train_loss": -7.342525482177734, "global_step": 200142, "epoch": 4765} {"train_loss": -7.418756008148193, "global_step": 200143, "epoch": 4765} {"train_loss": -7.247556209564209, "global_step": 200144, "epoch": 4765} {"train_loss": -7.343679904937744, "global_step": 200145, "epoch": 4765} {"train_loss": -7.366758346557617, "global_step": 200146, "epoch": 4765} {"train_loss": -7.295791149139404, "global_step": 200147, "epoch": 4765} {"train_loss": -7.302557468414307, "global_step": 200148, "epoch": 4765} {"train_loss": -7.311578750610352, "global_step": 200149, "epoch": 4765} {"train_loss": -7.36336612701416, "global_step": 200150, "epoch": 4765} {"train_loss": -7.419210433959961, "global_step": 200151, "epoch": 4765} {"train_loss": -7.384340286254883, "global_step": 200152, "epoch": 4765} {"train_loss": -7.26969575881958, "global_step": 200153, "epoch": 4765} {"train_loss": -7.318960666656494, "global_step": 200154, "epoch": 4765} {"train_loss": -7.278210163116455, "global_step": 200155, "epoch": 4765} {"train_loss": -7.389794826507568, "global_step": 200156, "epoch": 4765} {"train_loss": -7.412986755371094, "global_step": 200157, "epoch": 4765} {"train_loss": -7.346133232116699, "global_step": 200158, "epoch": 4765} {"train_loss": -7.3430376052856445, "global_step": 200159, "epoch": 4765} {"train_loss": -7.378094673156738, "global_step": 200160, "epoch": 4765} {"train_loss": -7.461298942565918, "global_step": 200161, "epoch": 4765} {"train_loss": -7.284618377685547, "global_step": 200162, "epoch": 4765} {"train_loss": -7.3177642822265625, "global_step": 200163, "epoch": 4765} {"train_loss": -7.255659580230713, "global_step": 200164, "epoch": 4765} {"train_loss": -7.295915126800537, "global_step": 200165, "epoch": 4765} {"train_loss": -7.312349319458008, "global_step": 200166, "epoch": 4765} {"train_loss": -7.17300271987915, "global_step": 200167, "epoch": 4765} {"train_loss": -7.223873138427734, "global_step": 200168, "epoch": 4765} {"train_loss": -7.3193254470825195, "global_step": 200169, "epoch": 4765} {"train_loss": -7.2011613845825195, "global_step": 200170, "epoch": 4765} {"train_loss": -7.324791794731503, "global_step": 200171, "epoch": 4765, "val_loss": 81679.4921875} {"train_loss": -7.367727279663086, "global_step": 200172, "epoch": 4766} {"train_loss": -7.0904107093811035, "global_step": 200173, "epoch": 4766} {"train_loss": -7.3246331214904785, "global_step": 200174, "epoch": 4766} {"train_loss": -7.147880554199219, "global_step": 200175, "epoch": 4766} {"train_loss": -7.258177757263184, "global_step": 200176, "epoch": 4766} {"train_loss": -7.227384567260742, "global_step": 200177, "epoch": 4766} {"train_loss": -6.887468338012695, "global_step": 200178, "epoch": 4766} {"train_loss": -7.252463340759277, "global_step": 200179, "epoch": 4766} {"train_loss": -7.205653190612793, "global_step": 200180, "epoch": 4766} {"train_loss": -7.183550834655762, "global_step": 200181, "epoch": 4766} {"train_loss": -7.277106761932373, "global_step": 200182, "epoch": 4766} {"train_loss": -7.135069847106934, "global_step": 200183, "epoch": 4766} {"train_loss": -7.289929389953613, "global_step": 200184, "epoch": 4766} {"train_loss": -7.224163055419922, "global_step": 200185, "epoch": 4766} {"train_loss": -7.16811466217041, "global_step": 200186, "epoch": 4766} {"train_loss": -7.322900772094727, "global_step": 200187, "epoch": 4766} {"train_loss": -7.261331558227539, "global_step": 200188, "epoch": 4766} {"train_loss": -7.155948638916016, "global_step": 200189, "epoch": 4766} {"train_loss": -7.1220903396606445, "global_step": 200190, "epoch": 4766} {"train_loss": -7.266356468200684, "global_step": 200191, "epoch": 4766} {"train_loss": -7.286750793457031, "global_step": 200192, "epoch": 4766} {"train_loss": -7.263675212860107, "global_step": 200193, "epoch": 4766} {"train_loss": -7.166750907897949, "global_step": 200194, "epoch": 4766} {"train_loss": -7.310417175292969, "global_step": 200195, "epoch": 4766} {"train_loss": -6.986180305480957, "global_step": 200196, "epoch": 4766} {"train_loss": -7.365018844604492, "global_step": 200197, "epoch": 4766} {"train_loss": -7.284382343292236, "global_step": 200198, "epoch": 4766} {"train_loss": -7.3320465087890625, "global_step": 200199, "epoch": 4766} {"train_loss": -7.358037948608398, "global_step": 200200, "epoch": 4766} {"train_loss": -7.270142555236816, "global_step": 200201, "epoch": 4766} {"train_loss": -7.257097244262695, "global_step": 200202, "epoch": 4766} {"train_loss": -7.332257270812988, "global_step": 200203, "epoch": 4766} {"train_loss": -7.36204719543457, "global_step": 200204, "epoch": 4766} {"train_loss": -7.328847408294678, "global_step": 200205, "epoch": 4766} {"train_loss": -7.348085403442383, "global_step": 200206, "epoch": 4766} {"train_loss": -7.256458282470703, "global_step": 200207, "epoch": 4766} {"train_loss": -7.290511131286621, "global_step": 200208, "epoch": 4766} {"train_loss": -7.3393964767456055, "global_step": 200209, "epoch": 4766} {"train_loss": -7.266040802001953, "global_step": 200210, "epoch": 4766} {"train_loss": -7.208706855773926, "global_step": 200211, "epoch": 4766} {"train_loss": -7.303421497344971, "global_step": 200212, "epoch": 4766} {"train_loss": -7.247465451558431, "global_step": 200213, "epoch": 4766, "val_loss": 81579.71875} {"train_loss": -7.275277137756348, "global_step": 200214, "epoch": 4767} {"train_loss": -7.309573173522949, "global_step": 200215, "epoch": 4767} {"train_loss": -7.360262870788574, "global_step": 200216, "epoch": 4767} {"train_loss": -7.290146827697754, "global_step": 200217, "epoch": 4767} {"train_loss": -7.267673492431641, "global_step": 200218, "epoch": 4767} {"train_loss": -7.430912017822266, "global_step": 200219, "epoch": 4767} {"train_loss": -7.211256504058838, "global_step": 200220, "epoch": 4767} {"train_loss": -7.287868499755859, "global_step": 200221, "epoch": 4767} {"train_loss": -7.22457218170166, "global_step": 200222, "epoch": 4767} {"train_loss": -7.246190071105957, "global_step": 200223, "epoch": 4767} {"train_loss": -7.388263702392578, "global_step": 200224, "epoch": 4767} {"train_loss": -7.287969589233398, "global_step": 200225, "epoch": 4767} {"train_loss": -7.3329877853393555, "global_step": 200226, "epoch": 4767} {"train_loss": -7.286078453063965, "global_step": 200227, "epoch": 4767} {"train_loss": -7.363491058349609, "global_step": 200228, "epoch": 4767} {"train_loss": -7.351179122924805, "global_step": 200229, "epoch": 4767} {"train_loss": -7.225523471832275, "global_step": 200230, "epoch": 4767} {"train_loss": -7.241922378540039, "global_step": 200231, "epoch": 4767} {"train_loss": -7.303884506225586, "global_step": 200232, "epoch": 4767} {"train_loss": -7.283738613128662, "global_step": 200233, "epoch": 4767} {"train_loss": -7.23396635055542, "global_step": 200234, "epoch": 4767} {"train_loss": -7.35554313659668, "global_step": 200235, "epoch": 4767} {"train_loss": -7.373583793640137, "global_step": 200236, "epoch": 4767} {"train_loss": -7.369225978851318, "global_step": 200237, "epoch": 4767} {"train_loss": -7.2762556076049805, "global_step": 200238, "epoch": 4767} {"train_loss": -7.217433929443359, "global_step": 200239, "epoch": 4767} {"train_loss": -7.322173118591309, "global_step": 200240, "epoch": 4767} {"train_loss": -7.203872203826904, "global_step": 200241, "epoch": 4767} {"train_loss": -7.250574111938477, "global_step": 200242, "epoch": 4767} {"train_loss": -7.2380051612854, "global_step": 200243, "epoch": 4767} {"train_loss": -7.265197277069092, "global_step": 200244, "epoch": 4767} {"train_loss": -7.292354583740234, "global_step": 200245, "epoch": 4767} {"train_loss": -7.217451095581055, "global_step": 200246, "epoch": 4767} {"train_loss": -7.314811706542969, "global_step": 200247, "epoch": 4767} {"train_loss": -7.267539978027344, "global_step": 200248, "epoch": 4767} {"train_loss": -7.24442195892334, "global_step": 200249, "epoch": 4767} {"train_loss": -7.243372917175293, "global_step": 200250, "epoch": 4767} {"train_loss": -7.3309831619262695, "global_step": 200251, "epoch": 4767} {"train_loss": -7.257681369781494, "global_step": 200252, "epoch": 4767} {"train_loss": -7.224715232849121, "global_step": 200253, "epoch": 4767} {"train_loss": -7.1931304931640625, "global_step": 200254, "epoch": 4767} {"train_loss": -7.286275818234398, "global_step": 200255, "epoch": 4767, "val_loss": 81474.6796875} {"train_loss": -7.278750419616699, "global_step": 200256, "epoch": 4768} {"train_loss": -7.273312568664551, "global_step": 200257, "epoch": 4768} {"train_loss": -7.4318952560424805, "global_step": 200258, "epoch": 4768} {"train_loss": -7.304566860198975, "global_step": 200259, "epoch": 4768} {"train_loss": -7.268987655639648, "global_step": 200260, "epoch": 4768} {"train_loss": -7.4241533279418945, "global_step": 200261, "epoch": 4768} {"train_loss": -7.304983139038086, "global_step": 200262, "epoch": 4768} {"train_loss": -7.44607400894165, "global_step": 200263, "epoch": 4768} {"train_loss": -7.356050968170166, "global_step": 200264, "epoch": 4768} {"train_loss": -7.235866546630859, "global_step": 200265, "epoch": 4768} {"train_loss": -7.271951198577881, "global_step": 200266, "epoch": 4768} {"train_loss": -7.356019973754883, "global_step": 200267, "epoch": 4768} {"train_loss": -7.239208698272705, "global_step": 200268, "epoch": 4768} {"train_loss": -7.295262336730957, "global_step": 200269, "epoch": 4768} {"train_loss": -7.29270076751709, "global_step": 200270, "epoch": 4768} {"train_loss": -7.297405242919922, "global_step": 200271, "epoch": 4768} {"train_loss": -7.366565704345703, "global_step": 200272, "epoch": 4768} {"train_loss": -7.276730537414551, "global_step": 200273, "epoch": 4768} {"train_loss": -7.359157562255859, "global_step": 200274, "epoch": 4768} {"train_loss": -7.203276634216309, "global_step": 200275, "epoch": 4768} {"train_loss": -7.083202838897705, "global_step": 200276, "epoch": 4768} {"train_loss": -7.259079456329346, "global_step": 200277, "epoch": 4768} {"train_loss": -7.2370147705078125, "global_step": 200278, "epoch": 4768} {"train_loss": -7.318994998931885, "global_step": 200279, "epoch": 4768} {"train_loss": -7.033888816833496, "global_step": 200280, "epoch": 4768} {"train_loss": -7.189687252044678, "global_step": 200281, "epoch": 4768} {"train_loss": -7.146295070648193, "global_step": 200282, "epoch": 4768} {"train_loss": -7.190746307373047, "global_step": 200283, "epoch": 4768} {"train_loss": -7.293323516845703, "global_step": 200284, "epoch": 4768} {"train_loss": -7.273728370666504, "global_step": 200285, "epoch": 4768} {"train_loss": -7.168647766113281, "global_step": 200286, "epoch": 4768} {"train_loss": -7.1965131759643555, "global_step": 200287, "epoch": 4768} {"train_loss": -7.278006553649902, "global_step": 200288, "epoch": 4768} {"train_loss": -7.1874098777771, "global_step": 200289, "epoch": 4768} {"train_loss": -7.092039585113525, "global_step": 200290, "epoch": 4768} {"train_loss": -7.091535568237305, "global_step": 200291, "epoch": 4768} {"train_loss": -7.211740493774414, "global_step": 200292, "epoch": 4768} {"train_loss": -7.168951988220215, "global_step": 200293, "epoch": 4768} {"train_loss": -7.303905010223389, "global_step": 200294, "epoch": 4768} {"train_loss": -7.224482536315918, "global_step": 200295, "epoch": 4768} {"train_loss": -7.253276348114014, "global_step": 200296, "epoch": 4768} {"train_loss": -7.251914523896717, "global_step": 200297, "epoch": 4768, "val_loss": 81297.984375} {"train_loss": -7.22333288192749, "global_step": 200298, "epoch": 4769} {"train_loss": -7.233377933502197, "global_step": 200299, "epoch": 4769} {"train_loss": -7.246176719665527, "global_step": 200300, "epoch": 4769} {"train_loss": -7.453401565551758, "global_step": 200301, "epoch": 4769} {"train_loss": -7.386831760406494, "global_step": 200302, "epoch": 4769} {"train_loss": -7.284250736236572, "global_step": 200303, "epoch": 4769} {"train_loss": -7.269145488739014, "global_step": 200304, "epoch": 4769} {"train_loss": -7.290888786315918, "global_step": 200305, "epoch": 4769} {"train_loss": -7.320995807647705, "global_step": 200306, "epoch": 4769} {"train_loss": -7.283751487731934, "global_step": 200307, "epoch": 4769} {"train_loss": -7.204792499542236, "global_step": 200308, "epoch": 4769} {"train_loss": -7.388552665710449, "global_step": 200309, "epoch": 4769} {"train_loss": -7.268868446350098, "global_step": 200310, "epoch": 4769} {"train_loss": -7.271324157714844, "global_step": 200311, "epoch": 4769} {"train_loss": -7.296299934387207, "global_step": 200312, "epoch": 4769} {"train_loss": -7.15779447555542, "global_step": 200313, "epoch": 4769} {"train_loss": -7.328237056732178, "global_step": 200314, "epoch": 4769} {"train_loss": -7.194732666015625, "global_step": 200315, "epoch": 4769} {"train_loss": -7.328333854675293, "global_step": 200316, "epoch": 4769} {"train_loss": -7.16581392288208, "global_step": 200317, "epoch": 4769} {"train_loss": -7.319110870361328, "global_step": 200318, "epoch": 4769} {"train_loss": -7.170343399047852, "global_step": 200319, "epoch": 4769} {"train_loss": -7.077844619750977, "global_step": 200320, "epoch": 4769} {"train_loss": -7.361903667449951, "global_step": 200321, "epoch": 4769} {"train_loss": -7.260102272033691, "global_step": 200322, "epoch": 4769} {"train_loss": -7.257810115814209, "global_step": 200323, "epoch": 4769} {"train_loss": -7.178613662719727, "global_step": 200324, "epoch": 4769} {"train_loss": -7.194581985473633, "global_step": 200325, "epoch": 4769} {"train_loss": -7.200701713562012, "global_step": 200326, "epoch": 4769} {"train_loss": -7.211591720581055, "global_step": 200327, "epoch": 4769} {"train_loss": -7.309269905090332, "global_step": 200328, "epoch": 4769} {"train_loss": -7.280288219451904, "global_step": 200329, "epoch": 4769} {"train_loss": -7.462070941925049, "global_step": 200330, "epoch": 4769} {"train_loss": -7.351064682006836, "global_step": 200331, "epoch": 4769} {"train_loss": -7.356709957122803, "global_step": 200332, "epoch": 4769} {"train_loss": -7.278682708740234, "global_step": 200333, "epoch": 4769} {"train_loss": -7.249791145324707, "global_step": 200334, "epoch": 4769} {"train_loss": -7.286177158355713, "global_step": 200335, "epoch": 4769} {"train_loss": -7.500176429748535, "global_step": 200336, "epoch": 4769} {"train_loss": -7.347264289855957, "global_step": 200337, "epoch": 4769} {"train_loss": -7.233808994293213, "global_step": 200338, "epoch": 4769} {"train_loss": -7.280813194456554, "global_step": 200339, "epoch": 4769, "val_loss": 81434.4140625} {"train_loss": -7.366757392883301, "global_step": 200340, "epoch": 4770} {"train_loss": -7.338361740112305, "global_step": 200341, "epoch": 4770} {"train_loss": -7.2846150398254395, "global_step": 200342, "epoch": 4770} {"train_loss": -7.10963249206543, "global_step": 200343, "epoch": 4770} {"train_loss": -7.209169387817383, "global_step": 200344, "epoch": 4770} {"train_loss": -7.307642936706543, "global_step": 200345, "epoch": 4770} {"train_loss": -7.160289287567139, "global_step": 200346, "epoch": 4770} {"train_loss": -7.311382293701172, "global_step": 200347, "epoch": 4770} {"train_loss": -7.2143449783325195, "global_step": 200348, "epoch": 4770} {"train_loss": -7.0972089767456055, "global_step": 200349, "epoch": 4770} {"train_loss": -7.244047164916992, "global_step": 200350, "epoch": 4770} {"train_loss": -7.305755138397217, "global_step": 200351, "epoch": 4770} {"train_loss": -7.222339630126953, "global_step": 200352, "epoch": 4770} {"train_loss": -7.320330619812012, "global_step": 200353, "epoch": 4770} {"train_loss": -7.215893745422363, "global_step": 200354, "epoch": 4770} {"train_loss": -7.233092308044434, "global_step": 200355, "epoch": 4770} {"train_loss": -7.272505760192871, "global_step": 200356, "epoch": 4770} {"train_loss": -7.257822036743164, "global_step": 200357, "epoch": 4770} {"train_loss": -7.374100685119629, "global_step": 200358, "epoch": 4770} {"train_loss": -7.284605979919434, "global_step": 200359, "epoch": 4770} {"train_loss": -7.289867401123047, "global_step": 200360, "epoch": 4770} {"train_loss": -7.2957611083984375, "global_step": 200361, "epoch": 4770} {"train_loss": -7.237926959991455, "global_step": 200362, "epoch": 4770} {"train_loss": -7.392055511474609, "global_step": 200363, "epoch": 4770} {"train_loss": -7.238345146179199, "global_step": 200364, "epoch": 4770} {"train_loss": -7.239471435546875, "global_step": 200365, "epoch": 4770} {"train_loss": -7.2973952293396, "global_step": 200366, "epoch": 4770} {"train_loss": -7.281622886657715, "global_step": 200367, "epoch": 4770} {"train_loss": -7.147205352783203, "global_step": 200368, "epoch": 4770} {"train_loss": -7.282224655151367, "global_step": 200369, "epoch": 4770} {"train_loss": -7.289401054382324, "global_step": 200370, "epoch": 4770} {"train_loss": -7.326178073883057, "global_step": 200371, "epoch": 4770} {"train_loss": -7.115603446960449, "global_step": 200372, "epoch": 4770} {"train_loss": -7.283990859985352, "global_step": 200373, "epoch": 4770} {"train_loss": -7.2728424072265625, "global_step": 200374, "epoch": 4770} {"train_loss": -7.258573532104492, "global_step": 200375, "epoch": 4770} {"train_loss": -7.280811309814453, "global_step": 200376, "epoch": 4770} {"train_loss": -7.291879177093506, "global_step": 200377, "epoch": 4770} {"train_loss": -7.287847518920898, "global_step": 200378, "epoch": 4770} {"train_loss": -7.222797393798828, "global_step": 200379, "epoch": 4770} {"train_loss": -7.236546993255615, "global_step": 200380, "epoch": 4770} {"train_loss": -7.26048477490743, "global_step": 200381, "epoch": 4770, "val_loss": 81552.359375} {"train_loss": -7.279145240783691, "global_step": 200382, "epoch": 4771} {"train_loss": -7.317791938781738, "global_step": 200383, "epoch": 4771} {"train_loss": -7.213273525238037, "global_step": 200384, "epoch": 4771} {"train_loss": -7.351356506347656, "global_step": 200385, "epoch": 4771} {"train_loss": -7.202601909637451, "global_step": 200386, "epoch": 4771} {"train_loss": -7.289562702178955, "global_step": 200387, "epoch": 4771} {"train_loss": -7.285843849182129, "global_step": 200388, "epoch": 4771} {"train_loss": -7.275634288787842, "global_step": 200389, "epoch": 4771} {"train_loss": -7.324618816375732, "global_step": 200390, "epoch": 4771} {"train_loss": -7.305757522583008, "global_step": 200391, "epoch": 4771} {"train_loss": -7.121516227722168, "global_step": 200392, "epoch": 4771} {"train_loss": -7.377987861633301, "global_step": 200393, "epoch": 4771} {"train_loss": -7.256233215332031, "global_step": 200394, "epoch": 4771} {"train_loss": -7.127937316894531, "global_step": 200395, "epoch": 4771} {"train_loss": -7.171651840209961, "global_step": 200396, "epoch": 4771} {"train_loss": -7.2273054122924805, "global_step": 200397, "epoch": 4771} {"train_loss": -7.2143354415893555, "global_step": 200398, "epoch": 4771} {"train_loss": -7.311484336853027, "global_step": 200399, "epoch": 4771} {"train_loss": -7.079765796661377, "global_step": 200400, "epoch": 4771} {"train_loss": -7.1924662590026855, "global_step": 200401, "epoch": 4771} {"train_loss": -7.236824989318848, "global_step": 200402, "epoch": 4771} {"train_loss": -7.285785675048828, "global_step": 200403, "epoch": 4771} {"train_loss": -7.231303691864014, "global_step": 200404, "epoch": 4771} {"train_loss": -7.1081223487854, "global_step": 200405, "epoch": 4771} {"train_loss": -7.220480918884277, "global_step": 200406, "epoch": 4771} {"train_loss": -7.3760857582092285, "global_step": 200407, "epoch": 4771} {"train_loss": -7.253154277801514, "global_step": 200408, "epoch": 4771} {"train_loss": -7.318697929382324, "global_step": 200409, "epoch": 4771} {"train_loss": -7.270058631896973, "global_step": 200410, "epoch": 4771} {"train_loss": -7.339550018310547, "global_step": 200411, "epoch": 4771} {"train_loss": -7.35444974899292, "global_step": 200412, "epoch": 4771} {"train_loss": -7.360480308532715, "global_step": 200413, "epoch": 4771} {"train_loss": -7.379558563232422, "global_step": 200414, "epoch": 4771} {"train_loss": -7.369302749633789, "global_step": 200415, "epoch": 4771} {"train_loss": -7.2601213455200195, "global_step": 200416, "epoch": 4771} {"train_loss": -7.347959518432617, "global_step": 200417, "epoch": 4771} {"train_loss": -7.231301784515381, "global_step": 200418, "epoch": 4771} {"train_loss": -7.41942834854126, "global_step": 200419, "epoch": 4771} {"train_loss": -7.312272071838379, "global_step": 200420, "epoch": 4771} {"train_loss": -7.488458633422852, "global_step": 200421, "epoch": 4771} {"train_loss": -7.40091609954834, "global_step": 200422, "epoch": 4771} {"train_loss": -7.2815770989372615, "global_step": 200423, "epoch": 4771, "val_loss": 81495.234375} {"train_loss": -7.368101119995117, "global_step": 200424, "epoch": 4772} {"train_loss": -7.3674798011779785, "global_step": 200425, "epoch": 4772} {"train_loss": -7.325925827026367, "global_step": 200426, "epoch": 4772} {"train_loss": -7.3738861083984375, "global_step": 200427, "epoch": 4772} {"train_loss": -7.42622184753418, "global_step": 200428, "epoch": 4772} {"train_loss": -7.401327610015869, "global_step": 200429, "epoch": 4772} {"train_loss": -7.369123458862305, "global_step": 200430, "epoch": 4772} {"train_loss": -7.543396472930908, "global_step": 200431, "epoch": 4772} {"train_loss": -7.351513862609863, "global_step": 200432, "epoch": 4772} {"train_loss": -7.411448001861572, "global_step": 200433, "epoch": 4772} {"train_loss": -7.463202953338623, "global_step": 200434, "epoch": 4772} {"train_loss": -7.398737907409668, "global_step": 200435, "epoch": 4772} {"train_loss": -7.328433036804199, "global_step": 200436, "epoch": 4772} {"train_loss": -7.397672653198242, "global_step": 200437, "epoch": 4772} {"train_loss": -7.432551860809326, "global_step": 200438, "epoch": 4772} {"train_loss": -7.441488742828369, "global_step": 200439, "epoch": 4772} {"train_loss": -7.359793663024902, "global_step": 200440, "epoch": 4772} {"train_loss": -7.449277877807617, "global_step": 200441, "epoch": 4772} {"train_loss": -7.452198505401611, "global_step": 200442, "epoch": 4772} {"train_loss": -7.380037784576416, "global_step": 200443, "epoch": 4772} {"train_loss": -7.354777812957764, "global_step": 200444, "epoch": 4772} {"train_loss": -7.5263447761535645, "global_step": 200445, "epoch": 4772} {"train_loss": -7.33553409576416, "global_step": 200446, "epoch": 4772} {"train_loss": -7.375663757324219, "global_step": 200447, "epoch": 4772} {"train_loss": -7.276350021362305, "global_step": 200448, "epoch": 4772} {"train_loss": -7.356646537780762, "global_step": 200449, "epoch": 4772} {"train_loss": -7.364211082458496, "global_step": 200450, "epoch": 4772} {"train_loss": -7.313817977905273, "global_step": 200451, "epoch": 4772} {"train_loss": -7.4001665115356445, "global_step": 200452, "epoch": 4772} {"train_loss": -7.32834529876709, "global_step": 200453, "epoch": 4772} {"train_loss": -7.325653076171875, "global_step": 200454, "epoch": 4772} {"train_loss": -7.335702896118164, "global_step": 200455, "epoch": 4772} {"train_loss": -7.299070835113525, "global_step": 200456, "epoch": 4772} {"train_loss": -7.235902786254883, "global_step": 200457, "epoch": 4772} {"train_loss": -7.363626480102539, "global_step": 200458, "epoch": 4772} {"train_loss": -7.271924018859863, "global_step": 200459, "epoch": 4772} {"train_loss": -7.199969291687012, "global_step": 200460, "epoch": 4772} {"train_loss": -7.296133995056152, "global_step": 200461, "epoch": 4772} {"train_loss": -7.339409828186035, "global_step": 200462, "epoch": 4772} {"train_loss": -7.16568660736084, "global_step": 200463, "epoch": 4772} {"train_loss": -7.2522172927856445, "global_step": 200464, "epoch": 4772} {"train_loss": -7.3540333566211515, "global_step": 200465, "epoch": 4772, "val_loss": 81444.2109375} {"train_loss": -7.245049476623535, "global_step": 200466, "epoch": 4773} {"train_loss": -7.019384384155273, "global_step": 200467, "epoch": 4773} {"train_loss": -7.046212196350098, "global_step": 200468, "epoch": 4773} {"train_loss": -7.163928508758545, "global_step": 200469, "epoch": 4773} {"train_loss": -6.978528022766113, "global_step": 200470, "epoch": 4773} {"train_loss": -7.153440475463867, "global_step": 200471, "epoch": 4773} {"train_loss": -7.0572404861450195, "global_step": 200472, "epoch": 4773} {"train_loss": -7.175054550170898, "global_step": 200473, "epoch": 4773} {"train_loss": -7.110020637512207, "global_step": 200474, "epoch": 4773} {"train_loss": -7.0684123039245605, "global_step": 200475, "epoch": 4773} {"train_loss": -7.1844611167907715, "global_step": 200476, "epoch": 4773} {"train_loss": -7.013044357299805, "global_step": 200477, "epoch": 4773} {"train_loss": -7.192073822021484, "global_step": 200478, "epoch": 4773} {"train_loss": -7.100776672363281, "global_step": 200479, "epoch": 4773} {"train_loss": -7.149327754974365, "global_step": 200480, "epoch": 4773} {"train_loss": -7.0952558517456055, "global_step": 200481, "epoch": 4773} {"train_loss": -7.239707946777344, "global_step": 200482, "epoch": 4773} {"train_loss": -7.178310394287109, "global_step": 200483, "epoch": 4773} {"train_loss": -7.21928596496582, "global_step": 200484, "epoch": 4773} {"train_loss": -7.262228965759277, "global_step": 200485, "epoch": 4773} {"train_loss": -7.099604606628418, "global_step": 200486, "epoch": 4773} {"train_loss": -7.255701541900635, "global_step": 200487, "epoch": 4773} {"train_loss": -7.313158988952637, "global_step": 200488, "epoch": 4773} {"train_loss": -7.170680999755859, "global_step": 200489, "epoch": 4773} {"train_loss": -7.085115909576416, "global_step": 200490, "epoch": 4773} {"train_loss": -7.3175435066223145, "global_step": 200491, "epoch": 4773} {"train_loss": -7.249551773071289, "global_step": 200492, "epoch": 4773} {"train_loss": -7.236865520477295, "global_step": 200493, "epoch": 4773} {"train_loss": -7.245819091796875, "global_step": 200494, "epoch": 4773} {"train_loss": -7.202661037445068, "global_step": 200495, "epoch": 4773} {"train_loss": -7.324736595153809, "global_step": 200496, "epoch": 4773} {"train_loss": -7.242082595825195, "global_step": 200497, "epoch": 4773} {"train_loss": -7.300366401672363, "global_step": 200498, "epoch": 4773} {"train_loss": -7.302353858947754, "global_step": 200499, "epoch": 4773} {"train_loss": -7.186305046081543, "global_step": 200500, "epoch": 4773} {"train_loss": -7.252846717834473, "global_step": 200501, "epoch": 4773} {"train_loss": -7.332728385925293, "global_step": 200502, "epoch": 4773} {"train_loss": -7.314280986785889, "global_step": 200503, "epoch": 4773} {"train_loss": -7.3140788078308105, "global_step": 200504, "epoch": 4773} {"train_loss": -7.141902446746826, "global_step": 200505, "epoch": 4773} {"train_loss": -7.32304573059082, "global_step": 200506, "epoch": 4773} {"train_loss": -7.192122800009591, "global_step": 200507, "epoch": 4773, "val_loss": 81419.6328125} {"train_loss": -6.978957176208496, "global_step": 200508, "epoch": 4774} {"train_loss": -7.26551628112793, "global_step": 200509, "epoch": 4774} {"train_loss": -7.345677375793457, "global_step": 200510, "epoch": 4774} {"train_loss": -7.084834098815918, "global_step": 200511, "epoch": 4774} {"train_loss": -7.303933143615723, "global_step": 200512, "epoch": 4774} {"train_loss": -7.200489044189453, "global_step": 200513, "epoch": 4774} {"train_loss": -7.205352783203125, "global_step": 200514, "epoch": 4774} {"train_loss": -7.133113861083984, "global_step": 200515, "epoch": 4774} {"train_loss": -7.234475135803223, "global_step": 200516, "epoch": 4774} {"train_loss": -7.219443321228027, "global_step": 200517, "epoch": 4774} {"train_loss": -7.190119743347168, "global_step": 200518, "epoch": 4774} {"train_loss": -7.19287109375, "global_step": 200519, "epoch": 4774} {"train_loss": -7.1443634033203125, "global_step": 200520, "epoch": 4774} {"train_loss": -7.249332427978516, "global_step": 200521, "epoch": 4774} {"train_loss": -7.073660850524902, "global_step": 200522, "epoch": 4774} {"train_loss": -7.315717697143555, "global_step": 200523, "epoch": 4774} {"train_loss": -7.2745137214660645, "global_step": 200524, "epoch": 4774} {"train_loss": -7.2536396980285645, "global_step": 200525, "epoch": 4774} {"train_loss": -7.354288101196289, "global_step": 200526, "epoch": 4774} {"train_loss": -7.128509521484375, "global_step": 200527, "epoch": 4774} {"train_loss": -7.274035930633545, "global_step": 200528, "epoch": 4774} {"train_loss": -7.324430465698242, "global_step": 200529, "epoch": 4774} {"train_loss": -7.255222320556641, "global_step": 200530, "epoch": 4774} {"train_loss": -7.3123321533203125, "global_step": 200531, "epoch": 4774} {"train_loss": -7.345752239227295, "global_step": 200532, "epoch": 4774} {"train_loss": -7.366733551025391, "global_step": 200533, "epoch": 4774} {"train_loss": -7.279452800750732, "global_step": 200534, "epoch": 4774} {"train_loss": -7.324970722198486, "global_step": 200535, "epoch": 4774} {"train_loss": -7.378695011138916, "global_step": 200536, "epoch": 4774} {"train_loss": -7.294775009155273, "global_step": 200537, "epoch": 4774} {"train_loss": -7.420403003692627, "global_step": 200538, "epoch": 4774} {"train_loss": -7.251223564147949, "global_step": 200539, "epoch": 4774} {"train_loss": -7.342984676361084, "global_step": 200540, "epoch": 4774} {"train_loss": -7.383271217346191, "global_step": 200541, "epoch": 4774} {"train_loss": -7.295851707458496, "global_step": 200542, "epoch": 4774} {"train_loss": -7.318323612213135, "global_step": 200543, "epoch": 4774} {"train_loss": -7.147341728210449, "global_step": 200544, "epoch": 4774} {"train_loss": -7.269903659820557, "global_step": 200545, "epoch": 4774} {"train_loss": -7.299938678741455, "global_step": 200546, "epoch": 4774} {"train_loss": -7.266855239868164, "global_step": 200547, "epoch": 4774} {"train_loss": -7.227764129638672, "global_step": 200548, "epoch": 4774} {"train_loss": -7.258341925484793, "global_step": 200549, "epoch": 4774, "val_loss": 81720.578125} {"train_loss": -7.209868431091309, "global_step": 200550, "epoch": 4775} {"train_loss": -7.2975969314575195, "global_step": 200551, "epoch": 4775} {"train_loss": -7.294599533081055, "global_step": 200552, "epoch": 4775} {"train_loss": -7.377128601074219, "global_step": 200553, "epoch": 4775} {"train_loss": -7.3850932121276855, "global_step": 200554, "epoch": 4775} {"train_loss": -7.29757022857666, "global_step": 200555, "epoch": 4775} {"train_loss": -7.285141468048096, "global_step": 200556, "epoch": 4775} {"train_loss": -7.345414161682129, "global_step": 200557, "epoch": 4775} {"train_loss": -7.340644836425781, "global_step": 200558, "epoch": 4775} {"train_loss": -7.279306411743164, "global_step": 200559, "epoch": 4775} {"train_loss": -7.269820213317871, "global_step": 200560, "epoch": 4775} {"train_loss": -7.411651611328125, "global_step": 200561, "epoch": 4775} {"train_loss": -7.40336799621582, "global_step": 200562, "epoch": 4775} {"train_loss": -7.425358772277832, "global_step": 200563, "epoch": 4775} {"train_loss": -7.3628034591674805, "global_step": 200564, "epoch": 4775} {"train_loss": -7.221225261688232, "global_step": 200565, "epoch": 4775} {"train_loss": -7.228065490722656, "global_step": 200566, "epoch": 4775} {"train_loss": -7.107203483581543, "global_step": 200567, "epoch": 4775} {"train_loss": -7.226973533630371, "global_step": 200568, "epoch": 4775} {"train_loss": -7.3375701904296875, "global_step": 200569, "epoch": 4775} {"train_loss": -7.126481533050537, "global_step": 200570, "epoch": 4775} {"train_loss": -7.2382659912109375, "global_step": 200571, "epoch": 4775} {"train_loss": -7.051867485046387, "global_step": 200572, "epoch": 4775} {"train_loss": -7.187110424041748, "global_step": 200573, "epoch": 4775} {"train_loss": -7.222726821899414, "global_step": 200574, "epoch": 4775} {"train_loss": -6.993438243865967, "global_step": 200575, "epoch": 4775} {"train_loss": -7.2144775390625, "global_step": 200576, "epoch": 4775} {"train_loss": -7.107635021209717, "global_step": 200577, "epoch": 4775} {"train_loss": -7.302489280700684, "global_step": 200578, "epoch": 4775} {"train_loss": -7.137404441833496, "global_step": 200579, "epoch": 4775} {"train_loss": -7.330445766448975, "global_step": 200580, "epoch": 4775} {"train_loss": -7.258185863494873, "global_step": 200581, "epoch": 4775} {"train_loss": -7.311892509460449, "global_step": 200582, "epoch": 4775} {"train_loss": -7.1468424797058105, "global_step": 200583, "epoch": 4775} {"train_loss": -7.369626998901367, "global_step": 200584, "epoch": 4775} {"train_loss": -7.226731777191162, "global_step": 200585, "epoch": 4775} {"train_loss": -7.361554145812988, "global_step": 200586, "epoch": 4775} {"train_loss": -7.312361717224121, "global_step": 200587, "epoch": 4775} {"train_loss": -7.291313171386719, "global_step": 200588, "epoch": 4775} {"train_loss": -7.211307525634766, "global_step": 200589, "epoch": 4775} {"train_loss": -7.306098937988281, "global_step": 200590, "epoch": 4775} {"train_loss": -7.262711615789504, "global_step": 200591, "epoch": 4775, "val_loss": 81485.4609375} {"train_loss": -7.287303447723389, "global_step": 200592, "epoch": 4776} {"train_loss": -7.299384117126465, "global_step": 200593, "epoch": 4776} {"train_loss": -7.161312103271484, "global_step": 200594, "epoch": 4776} {"train_loss": -7.4181928634643555, "global_step": 200595, "epoch": 4776} {"train_loss": -7.202281951904297, "global_step": 200596, "epoch": 4776} {"train_loss": -7.197821617126465, "global_step": 200597, "epoch": 4776} {"train_loss": -7.3103227615356445, "global_step": 200598, "epoch": 4776} {"train_loss": -7.308577537536621, "global_step": 200599, "epoch": 4776} {"train_loss": -7.2549638748168945, "global_step": 200600, "epoch": 4776} {"train_loss": -7.289547443389893, "global_step": 200601, "epoch": 4776} {"train_loss": -7.24249267578125, "global_step": 200602, "epoch": 4776} {"train_loss": -7.188702583312988, "global_step": 200603, "epoch": 4776} {"train_loss": -7.2587995529174805, "global_step": 200604, "epoch": 4776} {"train_loss": -7.270839691162109, "global_step": 200605, "epoch": 4776} {"train_loss": -7.29033899307251, "global_step": 200606, "epoch": 4776} {"train_loss": -7.424679279327393, "global_step": 200607, "epoch": 4776} {"train_loss": -7.19569206237793, "global_step": 200608, "epoch": 4776} {"train_loss": -7.309246063232422, "global_step": 200609, "epoch": 4776} {"train_loss": -7.348328590393066, "global_step": 200610, "epoch": 4776} {"train_loss": -7.332035064697266, "global_step": 200611, "epoch": 4776} {"train_loss": -7.243414402008057, "global_step": 200612, "epoch": 4776} {"train_loss": -7.267601013183594, "global_step": 200613, "epoch": 4776} {"train_loss": -7.392783164978027, "global_step": 200614, "epoch": 4776} {"train_loss": -7.285253047943115, "global_step": 200615, "epoch": 4776} {"train_loss": -7.224719524383545, "global_step": 200616, "epoch": 4776} {"train_loss": -7.3256096839904785, "global_step": 200617, "epoch": 4776} {"train_loss": -7.324808120727539, "global_step": 200618, "epoch": 4776} {"train_loss": -7.353394508361816, "global_step": 200619, "epoch": 4776} {"train_loss": -7.321392059326172, "global_step": 200620, "epoch": 4776} {"train_loss": -7.310964584350586, "global_step": 200621, "epoch": 4776} {"train_loss": -7.329892158508301, "global_step": 200622, "epoch": 4776} {"train_loss": -7.322793006896973, "global_step": 200623, "epoch": 4776} {"train_loss": -7.225324630737305, "global_step": 200624, "epoch": 4776} {"train_loss": -7.337896347045898, "global_step": 200625, "epoch": 4776} {"train_loss": -7.332353115081787, "global_step": 200626, "epoch": 4776} {"train_loss": -7.187403678894043, "global_step": 200627, "epoch": 4776} {"train_loss": -7.442671775817871, "global_step": 200628, "epoch": 4776} {"train_loss": -7.271214008331299, "global_step": 200629, "epoch": 4776} {"train_loss": -7.276049613952637, "global_step": 200630, "epoch": 4776} {"train_loss": -7.273280620574951, "global_step": 200631, "epoch": 4776} {"train_loss": -7.412275314331055, "global_step": 200632, "epoch": 4776} {"train_loss": -7.294215111505418, "global_step": 200633, "epoch": 4776, "val_loss": 81404.03125} {"train_loss": -7.235274314880371, "global_step": 200634, "epoch": 4777} {"train_loss": -7.4173994064331055, "global_step": 200635, "epoch": 4777} {"train_loss": -7.3806281089782715, "global_step": 200636, "epoch": 4777} {"train_loss": -7.346839904785156, "global_step": 200637, "epoch": 4777} {"train_loss": -7.308515548706055, "global_step": 200638, "epoch": 4777} {"train_loss": -7.255867004394531, "global_step": 200639, "epoch": 4777} {"train_loss": -7.183191776275635, "global_step": 200640, "epoch": 4777} {"train_loss": -7.362504959106445, "global_step": 200641, "epoch": 4777} {"train_loss": -7.3372697830200195, "global_step": 200642, "epoch": 4777} {"train_loss": -7.434217929840088, "global_step": 200643, "epoch": 4777} {"train_loss": -7.328512191772461, "global_step": 200644, "epoch": 4777} {"train_loss": -7.418801307678223, "global_step": 200645, "epoch": 4777} {"train_loss": -7.385930061340332, "global_step": 200646, "epoch": 4777} {"train_loss": -7.249534606933594, "global_step": 200647, "epoch": 4777} {"train_loss": -7.436320781707764, "global_step": 200648, "epoch": 4777} {"train_loss": -7.416752815246582, "global_step": 200649, "epoch": 4777} {"train_loss": -7.324357032775879, "global_step": 200650, "epoch": 4777} {"train_loss": -7.422852039337158, "global_step": 200651, "epoch": 4777} {"train_loss": -7.462267875671387, "global_step": 200652, "epoch": 4777} {"train_loss": -7.302722454071045, "global_step": 200653, "epoch": 4777} {"train_loss": -7.368283748626709, "global_step": 200654, "epoch": 4777} {"train_loss": -7.385382175445557, "global_step": 200655, "epoch": 4777} {"train_loss": -7.387808322906494, "global_step": 200656, "epoch": 4777} {"train_loss": -7.3162031173706055, "global_step": 200657, "epoch": 4777} {"train_loss": -7.204866409301758, "global_step": 200658, "epoch": 4777} {"train_loss": -7.2989888191223145, "global_step": 200659, "epoch": 4777} {"train_loss": -7.377744674682617, "global_step": 200660, "epoch": 4777} {"train_loss": -7.392784595489502, "global_step": 200661, "epoch": 4777} {"train_loss": -7.238324165344238, "global_step": 200662, "epoch": 4777} {"train_loss": -7.238719463348389, "global_step": 200663, "epoch": 4777} {"train_loss": -7.364408016204834, "global_step": 200664, "epoch": 4777} {"train_loss": -7.386603355407715, "global_step": 200665, "epoch": 4777} {"train_loss": -7.186763763427734, "global_step": 200666, "epoch": 4777} {"train_loss": -7.241707801818848, "global_step": 200667, "epoch": 4777} {"train_loss": -7.2568230628967285, "global_step": 200668, "epoch": 4777} {"train_loss": -7.338451862335205, "global_step": 200669, "epoch": 4777} {"train_loss": -7.336820125579834, "global_step": 200670, "epoch": 4777} {"train_loss": -7.410798072814941, "global_step": 200671, "epoch": 4777} {"train_loss": -7.293344497680664, "global_step": 200672, "epoch": 4777} {"train_loss": -7.210987091064453, "global_step": 200673, "epoch": 4777} {"train_loss": -7.312470436096191, "global_step": 200674, "epoch": 4777} {"train_loss": -7.330041737783523, "global_step": 200675, "epoch": 4777, "val_loss": 81331.6875} {"train_loss": -7.318645477294922, "global_step": 200676, "epoch": 4778} {"train_loss": -7.247830867767334, "global_step": 200677, "epoch": 4778} {"train_loss": -7.237444877624512, "global_step": 200678, "epoch": 4778} {"train_loss": -7.264163494110107, "global_step": 200679, "epoch": 4778} {"train_loss": -7.211492538452148, "global_step": 200680, "epoch": 4778} {"train_loss": -7.393240451812744, "global_step": 200681, "epoch": 4778} {"train_loss": -7.24480676651001, "global_step": 200682, "epoch": 4778} {"train_loss": -7.305488109588623, "global_step": 200683, "epoch": 4778} {"train_loss": -7.407212257385254, "global_step": 200684, "epoch": 4778} {"train_loss": -7.1525163650512695, "global_step": 200685, "epoch": 4778} {"train_loss": -7.0719099044799805, "global_step": 200686, "epoch": 4778} {"train_loss": -7.299220085144043, "global_step": 200687, "epoch": 4778} {"train_loss": -7.288171768188477, "global_step": 200688, "epoch": 4778} {"train_loss": -7.226871013641357, "global_step": 200689, "epoch": 4778} {"train_loss": -7.30860710144043, "global_step": 200690, "epoch": 4778} {"train_loss": -7.4044060707092285, "global_step": 200691, "epoch": 4778} {"train_loss": -7.307985305786133, "global_step": 200692, "epoch": 4778} {"train_loss": -7.346170425415039, "global_step": 200693, "epoch": 4778} {"train_loss": -7.258670806884766, "global_step": 200694, "epoch": 4778} {"train_loss": -7.382915496826172, "global_step": 200695, "epoch": 4778} {"train_loss": -7.132539749145508, "global_step": 200696, "epoch": 4778} {"train_loss": -7.286393165588379, "global_step": 200697, "epoch": 4778} {"train_loss": -7.243563175201416, "global_step": 200698, "epoch": 4778} {"train_loss": -7.259289264678955, "global_step": 200699, "epoch": 4778} {"train_loss": -7.224484443664551, "global_step": 200700, "epoch": 4778} {"train_loss": -7.21589469909668, "global_step": 200701, "epoch": 4778} {"train_loss": -7.2809553146362305, "global_step": 200702, "epoch": 4778} {"train_loss": -7.289966106414795, "global_step": 200703, "epoch": 4778} {"train_loss": -7.3174238204956055, "global_step": 200704, "epoch": 4778} {"train_loss": -7.326347351074219, "global_step": 200705, "epoch": 4778} {"train_loss": -7.172076225280762, "global_step": 200706, "epoch": 4778} {"train_loss": -7.363704681396484, "global_step": 200707, "epoch": 4778} {"train_loss": -7.20672607421875, "global_step": 200708, "epoch": 4778} {"train_loss": -7.192964553833008, "global_step": 200709, "epoch": 4778} {"train_loss": -7.25097131729126, "global_step": 200710, "epoch": 4778} {"train_loss": -7.266844272613525, "global_step": 200711, "epoch": 4778} {"train_loss": -7.341991424560547, "global_step": 200712, "epoch": 4778} {"train_loss": -7.311471939086914, "global_step": 200713, "epoch": 4778} {"train_loss": -7.286954879760742, "global_step": 200714, "epoch": 4778} {"train_loss": -7.173830032348633, "global_step": 200715, "epoch": 4778} {"train_loss": -7.237389087677002, "global_step": 200716, "epoch": 4778} {"train_loss": -7.2663817292168025, "global_step": 200717, "epoch": 4778, "val_loss": 81339.890625} {"train_loss": -7.169522285461426, "global_step": 200718, "epoch": 4779} {"train_loss": -7.142499923706055, "global_step": 200719, "epoch": 4779} {"train_loss": -7.260049819946289, "global_step": 200720, "epoch": 4779} {"train_loss": -7.199902534484863, "global_step": 200721, "epoch": 4779} {"train_loss": -6.925271511077881, "global_step": 200722, "epoch": 4779} {"train_loss": -7.308864116668701, "global_step": 200723, "epoch": 4779} {"train_loss": -6.929056167602539, "global_step": 200724, "epoch": 4779} {"train_loss": -7.164921760559082, "global_step": 200725, "epoch": 4779} {"train_loss": -7.140987396240234, "global_step": 200726, "epoch": 4779} {"train_loss": -7.247308731079102, "global_step": 200727, "epoch": 4779} {"train_loss": -7.0358686447143555, "global_step": 200728, "epoch": 4779} {"train_loss": -7.28751277923584, "global_step": 200729, "epoch": 4779} {"train_loss": -7.161466598510742, "global_step": 200730, "epoch": 4779} {"train_loss": -7.3202972412109375, "global_step": 200731, "epoch": 4779} {"train_loss": -7.223005771636963, "global_step": 200732, "epoch": 4779} {"train_loss": -7.231513023376465, "global_step": 200733, "epoch": 4779} {"train_loss": -7.318248748779297, "global_step": 200734, "epoch": 4779} {"train_loss": -7.330580711364746, "global_step": 200735, "epoch": 4779} {"train_loss": -7.376978874206543, "global_step": 200736, "epoch": 4779} {"train_loss": -7.335293769836426, "global_step": 200737, "epoch": 4779} {"train_loss": -7.30926513671875, "global_step": 200738, "epoch": 4779} {"train_loss": -7.3321428298950195, "global_step": 200739, "epoch": 4779} {"train_loss": -7.18280553817749, "global_step": 200740, "epoch": 4779} {"train_loss": -7.271003246307373, "global_step": 200741, "epoch": 4779} {"train_loss": -7.348928451538086, "global_step": 200742, "epoch": 4779} {"train_loss": -7.334095001220703, "global_step": 200743, "epoch": 4779} {"train_loss": -7.365560531616211, "global_step": 200744, "epoch": 4779} {"train_loss": -7.302735328674316, "global_step": 200745, "epoch": 4779} {"train_loss": -7.414498805999756, "global_step": 200746, "epoch": 4779} {"train_loss": -7.300978183746338, "global_step": 200747, "epoch": 4779} {"train_loss": -7.323666095733643, "global_step": 200748, "epoch": 4779} {"train_loss": -7.306916236877441, "global_step": 200749, "epoch": 4779} {"train_loss": -7.304112434387207, "global_step": 200750, "epoch": 4779} {"train_loss": -7.302113056182861, "global_step": 200751, "epoch": 4779} {"train_loss": -7.323946952819824, "global_step": 200752, "epoch": 4779} {"train_loss": -7.266356468200684, "global_step": 200753, "epoch": 4779} {"train_loss": -7.218508720397949, "global_step": 200754, "epoch": 4779} {"train_loss": -7.202290058135986, "global_step": 200755, "epoch": 4779} {"train_loss": -7.3709187507629395, "global_step": 200756, "epoch": 4779} {"train_loss": -7.234162330627441, "global_step": 200757, "epoch": 4779} {"train_loss": -7.317444801330566, "global_step": 200758, "epoch": 4779} {"train_loss": -7.253108558200655, "global_step": 200759, "epoch": 4779, "val_loss": 81666.921875} {"train_loss": -7.099273681640625, "global_step": 200760, "epoch": 4780} {"train_loss": -7.309528350830078, "global_step": 200761, "epoch": 4780} {"train_loss": -7.258801460266113, "global_step": 200762, "epoch": 4780} {"train_loss": -7.286506175994873, "global_step": 200763, "epoch": 4780} {"train_loss": -7.313370704650879, "global_step": 200764, "epoch": 4780} {"train_loss": -7.314488410949707, "global_step": 200765, "epoch": 4780} {"train_loss": -7.240537643432617, "global_step": 200766, "epoch": 4780} {"train_loss": -7.232154846191406, "global_step": 200767, "epoch": 4780} {"train_loss": -7.252964973449707, "global_step": 200768, "epoch": 4780} {"train_loss": -7.177127361297607, "global_step": 200769, "epoch": 4780} {"train_loss": -7.185352325439453, "global_step": 200770, "epoch": 4780} {"train_loss": -7.271088600158691, "global_step": 200771, "epoch": 4780} {"train_loss": -7.206329822540283, "global_step": 200772, "epoch": 4780} {"train_loss": -7.227699279785156, "global_step": 200773, "epoch": 4780} {"train_loss": -7.274724006652832, "global_step": 200774, "epoch": 4780} {"train_loss": -7.3762712478637695, "global_step": 200775, "epoch": 4780} {"train_loss": -7.179277420043945, "global_step": 200776, "epoch": 4780} {"train_loss": -7.308653831481934, "global_step": 200777, "epoch": 4780} {"train_loss": -7.2795000076293945, "global_step": 200778, "epoch": 4780} {"train_loss": -7.344444274902344, "global_step": 200779, "epoch": 4780} {"train_loss": -7.200628280639648, "global_step": 200780, "epoch": 4780} {"train_loss": -7.212774753570557, "global_step": 200781, "epoch": 4780} {"train_loss": -7.198843955993652, "global_step": 200782, "epoch": 4780} {"train_loss": -7.128440856933594, "global_step": 200783, "epoch": 4780} {"train_loss": -7.095398902893066, "global_step": 200784, "epoch": 4780} {"train_loss": -7.122213363647461, "global_step": 200785, "epoch": 4780} {"train_loss": -7.177755355834961, "global_step": 200786, "epoch": 4780} {"train_loss": -7.28043270111084, "global_step": 200787, "epoch": 4780} {"train_loss": -7.179690361022949, "global_step": 200788, "epoch": 4780} {"train_loss": -7.212713241577148, "global_step": 200789, "epoch": 4780} {"train_loss": -7.079057693481445, "global_step": 200790, "epoch": 4780} {"train_loss": -7.175638198852539, "global_step": 200791, "epoch": 4780} {"train_loss": -7.156590461730957, "global_step": 200792, "epoch": 4780} {"train_loss": -7.139181137084961, "global_step": 200793, "epoch": 4780} {"train_loss": -7.156310081481934, "global_step": 200794, "epoch": 4780} {"train_loss": -7.249583721160889, "global_step": 200795, "epoch": 4780} {"train_loss": -7.137693405151367, "global_step": 200796, "epoch": 4780} {"train_loss": -7.079957962036133, "global_step": 200797, "epoch": 4780} {"train_loss": -7.2552008628845215, "global_step": 200798, "epoch": 4780} {"train_loss": -7.138185501098633, "global_step": 200799, "epoch": 4780} {"train_loss": -7.205760955810547, "global_step": 200800, "epoch": 4780} {"train_loss": -7.215133825937907, "global_step": 200801, "epoch": 4780, "val_loss": 81760.0390625} {"train_loss": -7.045698165893555, "global_step": 200802, "epoch": 4781} {"train_loss": -7.208115100860596, "global_step": 200803, "epoch": 4781} {"train_loss": -7.314598083496094, "global_step": 200804, "epoch": 4781} {"train_loss": -7.290966987609863, "global_step": 200805, "epoch": 4781} {"train_loss": -7.251049995422363, "global_step": 200806, "epoch": 4781} {"train_loss": -7.2960100173950195, "global_step": 200807, "epoch": 4781} {"train_loss": -7.390357494354248, "global_step": 200808, "epoch": 4781} {"train_loss": -7.376461982727051, "global_step": 200809, "epoch": 4781} {"train_loss": -7.378040313720703, "global_step": 200810, "epoch": 4781} {"train_loss": -7.266336441040039, "global_step": 200811, "epoch": 4781} {"train_loss": -7.3984246253967285, "global_step": 200812, "epoch": 4781} {"train_loss": -7.2214460372924805, "global_step": 200813, "epoch": 4781} {"train_loss": -7.318256378173828, "global_step": 200814, "epoch": 4781} {"train_loss": -7.334237098693848, "global_step": 200815, "epoch": 4781} {"train_loss": -7.251441955566406, "global_step": 200816, "epoch": 4781} {"train_loss": -7.231216907501221, "global_step": 200817, "epoch": 4781} {"train_loss": -7.297091007232666, "global_step": 200818, "epoch": 4781} {"train_loss": -7.26872444152832, "global_step": 200819, "epoch": 4781} {"train_loss": -7.321562767028809, "global_step": 200820, "epoch": 4781} {"train_loss": -7.307060241699219, "global_step": 200821, "epoch": 4781} {"train_loss": -7.219522476196289, "global_step": 200822, "epoch": 4781} {"train_loss": -7.260965347290039, "global_step": 200823, "epoch": 4781} {"train_loss": -7.25730037689209, "global_step": 200824, "epoch": 4781} {"train_loss": -7.221615314483643, "global_step": 200825, "epoch": 4781} {"train_loss": -7.163677215576172, "global_step": 200826, "epoch": 4781} {"train_loss": -7.268938064575195, "global_step": 200827, "epoch": 4781} {"train_loss": -7.00321626663208, "global_step": 200828, "epoch": 4781} {"train_loss": -7.1533637046813965, "global_step": 200829, "epoch": 4781} {"train_loss": -7.3286638259887695, "global_step": 200830, "epoch": 4781} {"train_loss": -7.1517415046691895, "global_step": 200831, "epoch": 4781} {"train_loss": -7.298372268676758, "global_step": 200832, "epoch": 4781} {"train_loss": -7.230374336242676, "global_step": 200833, "epoch": 4781} {"train_loss": -7.149134159088135, "global_step": 200834, "epoch": 4781} {"train_loss": -7.266209125518799, "global_step": 200835, "epoch": 4781} {"train_loss": -7.198606491088867, "global_step": 200836, "epoch": 4781} {"train_loss": -7.28050422668457, "global_step": 200837, "epoch": 4781} {"train_loss": -7.1082258224487305, "global_step": 200838, "epoch": 4781} {"train_loss": -7.173381328582764, "global_step": 200839, "epoch": 4781} {"train_loss": -7.280632972717285, "global_step": 200840, "epoch": 4781} {"train_loss": -7.16726016998291, "global_step": 200841, "epoch": 4781} {"train_loss": -7.250699996948242, "global_step": 200842, "epoch": 4781} {"train_loss": -7.246420985176449, "global_step": 200843, "epoch": 4781, "val_loss": 81475.03125} {"train_loss": -7.219554424285889, "global_step": 200844, "epoch": 4782} {"train_loss": -7.259875774383545, "global_step": 200845, "epoch": 4782} {"train_loss": -7.160363674163818, "global_step": 200846, "epoch": 4782} {"train_loss": -7.295377254486084, "global_step": 200847, "epoch": 4782} {"train_loss": -7.264085292816162, "global_step": 200848, "epoch": 4782} {"train_loss": -7.269401550292969, "global_step": 200849, "epoch": 4782} {"train_loss": -7.320268630981445, "global_step": 200850, "epoch": 4782} {"train_loss": -7.213953018188477, "global_step": 200851, "epoch": 4782} {"train_loss": -7.386297225952148, "global_step": 200852, "epoch": 4782} {"train_loss": -7.343677520751953, "global_step": 200853, "epoch": 4782} {"train_loss": -7.230565071105957, "global_step": 200854, "epoch": 4782} {"train_loss": -7.228210926055908, "global_step": 200855, "epoch": 4782} {"train_loss": -7.373716354370117, "global_step": 200856, "epoch": 4782} {"train_loss": -7.322024345397949, "global_step": 200857, "epoch": 4782} {"train_loss": -7.286314964294434, "global_step": 200858, "epoch": 4782} {"train_loss": -7.339043617248535, "global_step": 200859, "epoch": 4782} {"train_loss": -7.386810302734375, "global_step": 200860, "epoch": 4782} {"train_loss": -7.209086894989014, "global_step": 200861, "epoch": 4782} {"train_loss": -7.3153886795043945, "global_step": 200862, "epoch": 4782} {"train_loss": -7.341498374938965, "global_step": 200863, "epoch": 4782} {"train_loss": -7.306423187255859, "global_step": 200864, "epoch": 4782} {"train_loss": -7.315459728240967, "global_step": 200865, "epoch": 4782} {"train_loss": -7.295233726501465, "global_step": 200866, "epoch": 4782} {"train_loss": -7.320100784301758, "global_step": 200867, "epoch": 4782} {"train_loss": -7.330241680145264, "global_step": 200868, "epoch": 4782} {"train_loss": -7.331170082092285, "global_step": 200869, "epoch": 4782} {"train_loss": -7.273516654968262, "global_step": 200870, "epoch": 4782} {"train_loss": -7.252518653869629, "global_step": 200871, "epoch": 4782} {"train_loss": -7.263425350189209, "global_step": 200872, "epoch": 4782} {"train_loss": -7.3311285972595215, "global_step": 200873, "epoch": 4782} {"train_loss": -7.274304389953613, "global_step": 200874, "epoch": 4782} {"train_loss": -7.249704360961914, "global_step": 200875, "epoch": 4782} {"train_loss": -7.261841773986816, "global_step": 200876, "epoch": 4782} {"train_loss": -7.25660514831543, "global_step": 200877, "epoch": 4782} {"train_loss": -7.302296161651611, "global_step": 200878, "epoch": 4782} {"train_loss": -7.2386369705200195, "global_step": 200879, "epoch": 4782} {"train_loss": -7.389150619506836, "global_step": 200880, "epoch": 4782} {"train_loss": -7.327485084533691, "global_step": 200881, "epoch": 4782} {"train_loss": -7.402676582336426, "global_step": 200882, "epoch": 4782} {"train_loss": -7.495366096496582, "global_step": 200883, "epoch": 4782} {"train_loss": -7.386768341064453, "global_step": 200884, "epoch": 4782} {"train_loss": -7.305149055662609, "global_step": 200885, "epoch": 4782, "val_loss": 81691.6640625} {"train_loss": -7.334565162658691, "global_step": 200886, "epoch": 4783} {"train_loss": -7.309487342834473, "global_step": 200887, "epoch": 4783} {"train_loss": -7.403110980987549, "global_step": 200888, "epoch": 4783} {"train_loss": -7.346811294555664, "global_step": 200889, "epoch": 4783} {"train_loss": -7.371058464050293, "global_step": 200890, "epoch": 4783} {"train_loss": -7.278841972351074, "global_step": 200891, "epoch": 4783} {"train_loss": -7.224360466003418, "global_step": 200892, "epoch": 4783} {"train_loss": -7.328031539916992, "global_step": 200893, "epoch": 4783} {"train_loss": -7.326409339904785, "global_step": 200894, "epoch": 4783} {"train_loss": -7.302865028381348, "global_step": 200895, "epoch": 4783} {"train_loss": -7.2245378494262695, "global_step": 200896, "epoch": 4783} {"train_loss": -7.327384948730469, "global_step": 200897, "epoch": 4783} {"train_loss": -7.372468948364258, "global_step": 200898, "epoch": 4783} {"train_loss": -7.368011474609375, "global_step": 200899, "epoch": 4783} {"train_loss": -7.3076300621032715, "global_step": 200900, "epoch": 4783} {"train_loss": -7.429738998413086, "global_step": 200901, "epoch": 4783} {"train_loss": -7.350038528442383, "global_step": 200902, "epoch": 4783} {"train_loss": -7.386937141418457, "global_step": 200903, "epoch": 4783} {"train_loss": -7.387749195098877, "global_step": 200904, "epoch": 4783} {"train_loss": -7.523047924041748, "global_step": 200905, "epoch": 4783} {"train_loss": -7.2686967849731445, "global_step": 200906, "epoch": 4783} {"train_loss": -7.51447057723999, "global_step": 200907, "epoch": 4783} {"train_loss": -7.330803871154785, "global_step": 200908, "epoch": 4783} {"train_loss": -7.319039344787598, "global_step": 200909, "epoch": 4783} {"train_loss": -7.45212459564209, "global_step": 200910, "epoch": 4783} {"train_loss": -7.352151870727539, "global_step": 200911, "epoch": 4783} {"train_loss": -7.302139759063721, "global_step": 200912, "epoch": 4783} {"train_loss": -7.361029624938965, "global_step": 200913, "epoch": 4783} {"train_loss": -7.387209892272949, "global_step": 200914, "epoch": 4783} {"train_loss": -7.2274017333984375, "global_step": 200915, "epoch": 4783} {"train_loss": -7.194886684417725, "global_step": 200916, "epoch": 4783} {"train_loss": -7.185685634613037, "global_step": 200917, "epoch": 4783} {"train_loss": -7.420546531677246, "global_step": 200918, "epoch": 4783} {"train_loss": -7.193886756896973, "global_step": 200919, "epoch": 4783} {"train_loss": -7.284961700439453, "global_step": 200920, "epoch": 4783} {"train_loss": -7.451581954956055, "global_step": 200921, "epoch": 4783} {"train_loss": -7.234855651855469, "global_step": 200922, "epoch": 4783} {"train_loss": -7.239530086517334, "global_step": 200923, "epoch": 4783} {"train_loss": -7.3193359375, "global_step": 200924, "epoch": 4783} {"train_loss": -7.207231521606445, "global_step": 200925, "epoch": 4783} {"train_loss": -7.167593002319336, "global_step": 200926, "epoch": 4783} {"train_loss": -7.323462929044451, "global_step": 200927, "epoch": 4783, "val_loss": 81532.078125} {"train_loss": -7.185656547546387, "global_step": 200928, "epoch": 4784} {"train_loss": -7.2378458976745605, "global_step": 200929, "epoch": 4784} {"train_loss": -7.262897491455078, "global_step": 200930, "epoch": 4784} {"train_loss": -7.3313188552856445, "global_step": 200931, "epoch": 4784} {"train_loss": -7.252547264099121, "global_step": 200932, "epoch": 4784} {"train_loss": -7.142266273498535, "global_step": 200933, "epoch": 4784} {"train_loss": -7.364551544189453, "global_step": 200934, "epoch": 4784} {"train_loss": -7.211299896240234, "global_step": 200935, "epoch": 4784} {"train_loss": -7.230448246002197, "global_step": 200936, "epoch": 4784} {"train_loss": -7.187270164489746, "global_step": 200937, "epoch": 4784} {"train_loss": -7.163159370422363, "global_step": 200938, "epoch": 4784} {"train_loss": -7.1988677978515625, "global_step": 200939, "epoch": 4784} {"train_loss": -7.377815246582031, "global_step": 200940, "epoch": 4784} {"train_loss": -7.25918436050415, "global_step": 200941, "epoch": 4784} {"train_loss": -7.192063331604004, "global_step": 200942, "epoch": 4784} {"train_loss": -7.120330810546875, "global_step": 200943, "epoch": 4784} {"train_loss": -7.298855304718018, "global_step": 200944, "epoch": 4784} {"train_loss": -7.238981246948242, "global_step": 200945, "epoch": 4784} {"train_loss": -7.260418891906738, "global_step": 200946, "epoch": 4784} {"train_loss": -7.186810493469238, "global_step": 200947, "epoch": 4784} {"train_loss": -7.33835506439209, "global_step": 200948, "epoch": 4784} {"train_loss": -7.3290934562683105, "global_step": 200949, "epoch": 4784} {"train_loss": -7.288293838500977, "global_step": 200950, "epoch": 4784} {"train_loss": -7.295206069946289, "global_step": 200951, "epoch": 4784} {"train_loss": -7.301270484924316, "global_step": 200952, "epoch": 4784} {"train_loss": -7.247603416442871, "global_step": 200953, "epoch": 4784} {"train_loss": -7.309045791625977, "global_step": 200954, "epoch": 4784} {"train_loss": -7.246667861938477, "global_step": 200955, "epoch": 4784} {"train_loss": -7.33709716796875, "global_step": 200956, "epoch": 4784} {"train_loss": -7.332181930541992, "global_step": 200957, "epoch": 4784} {"train_loss": -7.345128059387207, "global_step": 200958, "epoch": 4784} {"train_loss": -7.339715957641602, "global_step": 200959, "epoch": 4784} {"train_loss": -7.2073140144348145, "global_step": 200960, "epoch": 4784} {"train_loss": -7.26717472076416, "global_step": 200961, "epoch": 4784} {"train_loss": -7.269245624542236, "global_step": 200962, "epoch": 4784} {"train_loss": -7.30189323425293, "global_step": 200963, "epoch": 4784} {"train_loss": -7.364501953125, "global_step": 200964, "epoch": 4784} {"train_loss": -7.200020790100098, "global_step": 200965, "epoch": 4784} {"train_loss": -7.391514778137207, "global_step": 200966, "epoch": 4784} {"train_loss": -7.4154157638549805, "global_step": 200967, "epoch": 4784} {"train_loss": -7.3199052810668945, "global_step": 200968, "epoch": 4784} {"train_loss": -7.27423864319211, "global_step": 200969, "epoch": 4784, "val_loss": 81580.7734375} {"train_loss": -7.346051216125488, "global_step": 200970, "epoch": 4785} {"train_loss": -7.365569114685059, "global_step": 200971, "epoch": 4785} {"train_loss": -7.352376937866211, "global_step": 200972, "epoch": 4785} {"train_loss": -7.453801155090332, "global_step": 200973, "epoch": 4785} {"train_loss": -7.409150123596191, "global_step": 200974, "epoch": 4785} {"train_loss": -7.386295318603516, "global_step": 200975, "epoch": 4785} {"train_loss": -7.420090675354004, "global_step": 200976, "epoch": 4785} {"train_loss": -7.384052276611328, "global_step": 200977, "epoch": 4785} {"train_loss": -7.384936332702637, "global_step": 200978, "epoch": 4785} {"train_loss": -7.352165222167969, "global_step": 200979, "epoch": 4785} {"train_loss": -7.329856872558594, "global_step": 200980, "epoch": 4785} {"train_loss": -7.245912551879883, "global_step": 200981, "epoch": 4785} {"train_loss": -7.399472236633301, "global_step": 200982, "epoch": 4785} {"train_loss": -7.281686305999756, "global_step": 200983, "epoch": 4785} {"train_loss": -7.3531494140625, "global_step": 200984, "epoch": 4785} {"train_loss": -7.230096817016602, "global_step": 200985, "epoch": 4785} {"train_loss": -7.2801127433776855, "global_step": 200986, "epoch": 4785} {"train_loss": -7.347228050231934, "global_step": 200987, "epoch": 4785} {"train_loss": -7.395877838134766, "global_step": 200988, "epoch": 4785} {"train_loss": -7.329639434814453, "global_step": 200989, "epoch": 4785} {"train_loss": -7.271766662597656, "global_step": 200990, "epoch": 4785} {"train_loss": -7.2554755210876465, "global_step": 200991, "epoch": 4785} {"train_loss": -7.3370513916015625, "global_step": 200992, "epoch": 4785} {"train_loss": -7.304512023925781, "global_step": 200993, "epoch": 4785} {"train_loss": -7.347294807434082, "global_step": 200994, "epoch": 4785} {"train_loss": -7.324626922607422, "global_step": 200995, "epoch": 4785} {"train_loss": -7.263272285461426, "global_step": 200996, "epoch": 4785} {"train_loss": -7.1787333488464355, "global_step": 200997, "epoch": 4785} {"train_loss": -7.197047233581543, "global_step": 200998, "epoch": 4785} {"train_loss": -7.311707496643066, "global_step": 200999, "epoch": 4785} {"train_loss": -7.323876857757568, "global_step": 201000, "epoch": 4785} {"train_loss": -7.240187644958496, "global_step": 201001, "epoch": 4785} {"train_loss": -7.352017879486084, "global_step": 201002, "epoch": 4785} {"train_loss": -7.374102592468262, "global_step": 201003, "epoch": 4785} {"train_loss": -7.345651626586914, "global_step": 201004, "epoch": 4785} {"train_loss": -7.251126766204834, "global_step": 201005, "epoch": 4785} {"train_loss": -7.384912490844727, "global_step": 201006, "epoch": 4785} {"train_loss": -7.281372547149658, "global_step": 201007, "epoch": 4785} {"train_loss": -7.291263580322266, "global_step": 201008, "epoch": 4785} {"train_loss": -7.227002143859863, "global_step": 201009, "epoch": 4785} {"train_loss": -7.196259498596191, "global_step": 201010, "epoch": 4785} {"train_loss": -7.320825077238537, "global_step": 201011, "epoch": 4785, "val_loss": 81363.1796875} {"train_loss": -7.404533863067627, "global_step": 201012, "epoch": 4786} {"train_loss": -7.379015922546387, "global_step": 201013, "epoch": 4786} {"train_loss": -7.347869396209717, "global_step": 201014, "epoch": 4786} {"train_loss": -7.336215972900391, "global_step": 201015, "epoch": 4786} {"train_loss": -7.430147171020508, "global_step": 201016, "epoch": 4786} {"train_loss": -7.384989261627197, "global_step": 201017, "epoch": 4786} {"train_loss": -7.302981376647949, "global_step": 201018, "epoch": 4786} {"train_loss": -7.33635950088501, "global_step": 201019, "epoch": 4786} {"train_loss": -7.240018844604492, "global_step": 201020, "epoch": 4786} {"train_loss": -7.285499572753906, "global_step": 201021, "epoch": 4786} {"train_loss": -7.378230094909668, "global_step": 201022, "epoch": 4786} {"train_loss": -7.309340476989746, "global_step": 201023, "epoch": 4786} {"train_loss": -7.305398464202881, "global_step": 201024, "epoch": 4786} {"train_loss": -7.358180999755859, "global_step": 201025, "epoch": 4786} {"train_loss": -7.413588047027588, "global_step": 201026, "epoch": 4786} {"train_loss": -7.21297550201416, "global_step": 201027, "epoch": 4786} {"train_loss": -7.307748794555664, "global_step": 201028, "epoch": 4786} {"train_loss": -7.179856300354004, "global_step": 201029, "epoch": 4786} {"train_loss": -7.306537628173828, "global_step": 201030, "epoch": 4786} {"train_loss": -7.307699680328369, "global_step": 201031, "epoch": 4786} {"train_loss": -7.233906269073486, "global_step": 201032, "epoch": 4786} {"train_loss": -7.152497291564941, "global_step": 201033, "epoch": 4786} {"train_loss": -7.293595314025879, "global_step": 201034, "epoch": 4786} {"train_loss": -7.269007205963135, "global_step": 201035, "epoch": 4786} {"train_loss": -7.312483787536621, "global_step": 201036, "epoch": 4786} {"train_loss": -7.214103698730469, "global_step": 201037, "epoch": 4786} {"train_loss": -7.244223594665527, "global_step": 201038, "epoch": 4786} {"train_loss": -7.322429180145264, "global_step": 201039, "epoch": 4786} {"train_loss": -7.2959771156311035, "global_step": 201040, "epoch": 4786} {"train_loss": -7.321496486663818, "global_step": 201041, "epoch": 4786} {"train_loss": -7.250135898590088, "global_step": 201042, "epoch": 4786} {"train_loss": -7.222437858581543, "global_step": 201043, "epoch": 4786} {"train_loss": -7.198436260223389, "global_step": 201044, "epoch": 4786} {"train_loss": -7.188676834106445, "global_step": 201045, "epoch": 4786} {"train_loss": -7.31004524230957, "global_step": 201046, "epoch": 4786} {"train_loss": -7.355471611022949, "global_step": 201047, "epoch": 4786} {"train_loss": -7.363555908203125, "global_step": 201048, "epoch": 4786} {"train_loss": -7.321413993835449, "global_step": 201049, "epoch": 4786} {"train_loss": -7.288468360900879, "global_step": 201050, "epoch": 4786} {"train_loss": -7.217617988586426, "global_step": 201051, "epoch": 4786} {"train_loss": -7.244264602661133, "global_step": 201052, "epoch": 4786} {"train_loss": -7.295869588851929, "global_step": 201053, "epoch": 4786, "val_loss": 81453.46875} {"train_loss": -7.315896987915039, "global_step": 201054, "epoch": 4787} {"train_loss": -7.230345726013184, "global_step": 201055, "epoch": 4787} {"train_loss": -7.282859802246094, "global_step": 201056, "epoch": 4787} {"train_loss": -7.242238521575928, "global_step": 201057, "epoch": 4787} {"train_loss": -7.338705062866211, "global_step": 201058, "epoch": 4787} {"train_loss": -7.24755859375, "global_step": 201059, "epoch": 4787} {"train_loss": -7.211671829223633, "global_step": 201060, "epoch": 4787} {"train_loss": -7.330629348754883, "global_step": 201061, "epoch": 4787} {"train_loss": -7.254075050354004, "global_step": 201062, "epoch": 4787} {"train_loss": -7.331901550292969, "global_step": 201063, "epoch": 4787} {"train_loss": -7.393118858337402, "global_step": 201064, "epoch": 4787} {"train_loss": -7.2279462814331055, "global_step": 201065, "epoch": 4787} {"train_loss": -7.384199142456055, "global_step": 201066, "epoch": 4787} {"train_loss": -7.368455410003662, "global_step": 201067, "epoch": 4787} {"train_loss": -7.293889045715332, "global_step": 201068, "epoch": 4787} {"train_loss": -7.341824531555176, "global_step": 201069, "epoch": 4787} {"train_loss": -7.255189895629883, "global_step": 201070, "epoch": 4787} {"train_loss": -7.154934883117676, "global_step": 201071, "epoch": 4787} {"train_loss": -7.26061487197876, "global_step": 201072, "epoch": 4787} {"train_loss": -7.245159149169922, "global_step": 201073, "epoch": 4787} {"train_loss": -7.242694854736328, "global_step": 201074, "epoch": 4787} {"train_loss": -7.301758766174316, "global_step": 201075, "epoch": 4787} {"train_loss": -7.16030740737915, "global_step": 201076, "epoch": 4787} {"train_loss": -7.317078590393066, "global_step": 201077, "epoch": 4787} {"train_loss": -7.222782135009766, "global_step": 201078, "epoch": 4787} {"train_loss": -7.274545192718506, "global_step": 201079, "epoch": 4787} {"train_loss": -7.345713138580322, "global_step": 201080, "epoch": 4787} {"train_loss": -7.306010723114014, "global_step": 201081, "epoch": 4787} {"train_loss": -7.137835502624512, "global_step": 201082, "epoch": 4787} {"train_loss": -7.27280330657959, "global_step": 201083, "epoch": 4787} {"train_loss": -7.2618818283081055, "global_step": 201084, "epoch": 4787} {"train_loss": -7.243109703063965, "global_step": 201085, "epoch": 4787} {"train_loss": -7.282317161560059, "global_step": 201086, "epoch": 4787} {"train_loss": -7.373085975646973, "global_step": 201087, "epoch": 4787} {"train_loss": -7.315628528594971, "global_step": 201088, "epoch": 4787} {"train_loss": -7.288546085357666, "global_step": 201089, "epoch": 4787} {"train_loss": -7.334064483642578, "global_step": 201090, "epoch": 4787} {"train_loss": -7.391035079956055, "global_step": 201091, "epoch": 4787} {"train_loss": -7.185688495635986, "global_step": 201092, "epoch": 4787} {"train_loss": -7.287615776062012, "global_step": 201093, "epoch": 4787} {"train_loss": -7.42515754699707, "global_step": 201094, "epoch": 4787} {"train_loss": -7.281943150929043, "global_step": 201095, "epoch": 4787, "val_loss": 81777.6640625} {"train_loss": -7.354328155517578, "global_step": 201096, "epoch": 4788} {"train_loss": -7.323932647705078, "global_step": 201097, "epoch": 4788} {"train_loss": -7.233213424682617, "global_step": 201098, "epoch": 4788} {"train_loss": -7.3249616622924805, "global_step": 201099, "epoch": 4788} {"train_loss": -7.27834415435791, "global_step": 201100, "epoch": 4788} {"train_loss": -7.382153511047363, "global_step": 201101, "epoch": 4788} {"train_loss": -7.284003734588623, "global_step": 201102, "epoch": 4788} {"train_loss": -7.204960823059082, "global_step": 201103, "epoch": 4788} {"train_loss": -7.369287014007568, "global_step": 201104, "epoch": 4788} {"train_loss": -7.184568405151367, "global_step": 201105, "epoch": 4788} {"train_loss": -7.445113182067871, "global_step": 201106, "epoch": 4788} {"train_loss": -7.342637062072754, "global_step": 201107, "epoch": 4788} {"train_loss": -7.387580871582031, "global_step": 201108, "epoch": 4788} {"train_loss": -7.30271577835083, "global_step": 201109, "epoch": 4788} {"train_loss": -7.369964599609375, "global_step": 201110, "epoch": 4788} {"train_loss": -7.265758991241455, "global_step": 201111, "epoch": 4788} {"train_loss": -7.373989582061768, "global_step": 201112, "epoch": 4788} {"train_loss": -7.265556812286377, "global_step": 201113, "epoch": 4788} {"train_loss": -7.388235092163086, "global_step": 201114, "epoch": 4788} {"train_loss": -7.29096794128418, "global_step": 201115, "epoch": 4788} {"train_loss": -7.223962306976318, "global_step": 201116, "epoch": 4788} {"train_loss": -7.296852111816406, "global_step": 201117, "epoch": 4788} {"train_loss": -7.235013008117676, "global_step": 201118, "epoch": 4788} {"train_loss": -7.141972541809082, "global_step": 201119, "epoch": 4788} {"train_loss": -7.355552673339844, "global_step": 201120, "epoch": 4788} {"train_loss": -7.306643486022949, "global_step": 201121, "epoch": 4788} {"train_loss": -7.355900287628174, "global_step": 201122, "epoch": 4788} {"train_loss": -7.3022918701171875, "global_step": 201123, "epoch": 4788} {"train_loss": -7.3090033531188965, "global_step": 201124, "epoch": 4788} {"train_loss": -7.346920013427734, "global_step": 201125, "epoch": 4788} {"train_loss": -7.349550247192383, "global_step": 201126, "epoch": 4788} {"train_loss": -7.150965690612793, "global_step": 201127, "epoch": 4788} {"train_loss": -7.3387250900268555, "global_step": 201128, "epoch": 4788} {"train_loss": -7.346416473388672, "global_step": 201129, "epoch": 4788} {"train_loss": -7.242585182189941, "global_step": 201130, "epoch": 4788} {"train_loss": -7.245860576629639, "global_step": 201131, "epoch": 4788} {"train_loss": -7.2514777183532715, "global_step": 201132, "epoch": 4788} {"train_loss": -7.234379768371582, "global_step": 201133, "epoch": 4788} {"train_loss": -7.33726167678833, "global_step": 201134, "epoch": 4788} {"train_loss": -7.333615303039551, "global_step": 201135, "epoch": 4788} {"train_loss": -7.3309855461120605, "global_step": 201136, "epoch": 4788} {"train_loss": -7.30353856086731, "global_step": 201137, "epoch": 4788, "val_loss": 81572.2265625} {"train_loss": -7.329681873321533, "global_step": 201138, "epoch": 4789} {"train_loss": -7.385181427001953, "global_step": 201139, "epoch": 4789} {"train_loss": -7.2089643478393555, "global_step": 201140, "epoch": 4789} {"train_loss": -7.229609966278076, "global_step": 201141, "epoch": 4789} {"train_loss": -7.342918872833252, "global_step": 201142, "epoch": 4789} {"train_loss": -7.289123058319092, "global_step": 201143, "epoch": 4789} {"train_loss": -7.444293975830078, "global_step": 201144, "epoch": 4789} {"train_loss": -7.300018787384033, "global_step": 201145, "epoch": 4789} {"train_loss": -7.255349636077881, "global_step": 201146, "epoch": 4789} {"train_loss": -7.20185661315918, "global_step": 201147, "epoch": 4789} {"train_loss": -7.130013942718506, "global_step": 201148, "epoch": 4789} {"train_loss": -7.294629096984863, "global_step": 201149, "epoch": 4789} {"train_loss": -7.2850847244262695, "global_step": 201150, "epoch": 4789} {"train_loss": -7.176874160766602, "global_step": 201151, "epoch": 4789} {"train_loss": -7.260440826416016, "global_step": 201152, "epoch": 4789} {"train_loss": -7.198977470397949, "global_step": 201153, "epoch": 4789} {"train_loss": -7.184215545654297, "global_step": 201154, "epoch": 4789} {"train_loss": -7.24418830871582, "global_step": 201155, "epoch": 4789} {"train_loss": -7.252951145172119, "global_step": 201156, "epoch": 4789} {"train_loss": -7.40053653717041, "global_step": 201157, "epoch": 4789} {"train_loss": -7.28558349609375, "global_step": 201158, "epoch": 4789} {"train_loss": -7.314598083496094, "global_step": 201159, "epoch": 4789} {"train_loss": -7.377726078033447, "global_step": 201160, "epoch": 4789} {"train_loss": -7.242885589599609, "global_step": 201161, "epoch": 4789} {"train_loss": -7.295479774475098, "global_step": 201162, "epoch": 4789} {"train_loss": -7.238527297973633, "global_step": 201163, "epoch": 4789} {"train_loss": -7.161111354827881, "global_step": 201164, "epoch": 4789} {"train_loss": -7.33796501159668, "global_step": 201165, "epoch": 4789} {"train_loss": -7.224404335021973, "global_step": 201166, "epoch": 4789} {"train_loss": -7.27843713760376, "global_step": 201167, "epoch": 4789} {"train_loss": -7.266617298126221, "global_step": 201168, "epoch": 4789} {"train_loss": -7.319524765014648, "global_step": 201169, "epoch": 4789} {"train_loss": -7.360391616821289, "global_step": 201170, "epoch": 4789} {"train_loss": -7.242033958435059, "global_step": 201171, "epoch": 4789} {"train_loss": -7.2246551513671875, "global_step": 201172, "epoch": 4789} {"train_loss": -7.360493183135986, "global_step": 201173, "epoch": 4789} {"train_loss": -7.300517559051514, "global_step": 201174, "epoch": 4789} {"train_loss": -7.416369915008545, "global_step": 201175, "epoch": 4789} {"train_loss": -7.325667381286621, "global_step": 201176, "epoch": 4789} {"train_loss": -7.327256202697754, "global_step": 201177, "epoch": 4789} {"train_loss": -7.242315292358398, "global_step": 201178, "epoch": 4789} {"train_loss": -7.281629993802025, "global_step": 201179, "epoch": 4789, "val_loss": 81685.6640625} {"train_loss": -7.338287353515625, "global_step": 201180, "epoch": 4790} {"train_loss": -7.164881706237793, "global_step": 201181, "epoch": 4790} {"train_loss": -7.3369855880737305, "global_step": 201182, "epoch": 4790} {"train_loss": -7.385641098022461, "global_step": 201183, "epoch": 4790} {"train_loss": -7.364956855773926, "global_step": 201184, "epoch": 4790} {"train_loss": -7.297481536865234, "global_step": 201185, "epoch": 4790} {"train_loss": -7.275712013244629, "global_step": 201186, "epoch": 4790} {"train_loss": -7.215544700622559, "global_step": 201187, "epoch": 4790} {"train_loss": -7.342222213745117, "global_step": 201188, "epoch": 4790} {"train_loss": -7.382441997528076, "global_step": 201189, "epoch": 4790} {"train_loss": -7.322155475616455, "global_step": 201190, "epoch": 4790} {"train_loss": -7.3089280128479, "global_step": 201191, "epoch": 4790} {"train_loss": -7.497007369995117, "global_step": 201192, "epoch": 4790} {"train_loss": -7.35333251953125, "global_step": 201193, "epoch": 4790} {"train_loss": -7.440995216369629, "global_step": 201194, "epoch": 4790} {"train_loss": -7.176069259643555, "global_step": 201195, "epoch": 4790} {"train_loss": -7.246001720428467, "global_step": 201196, "epoch": 4790} {"train_loss": -7.278507709503174, "global_step": 201197, "epoch": 4790} {"train_loss": -7.2195587158203125, "global_step": 201198, "epoch": 4790} {"train_loss": -7.233905792236328, "global_step": 201199, "epoch": 4790} {"train_loss": -7.310635089874268, "global_step": 201200, "epoch": 4790} {"train_loss": -7.229147911071777, "global_step": 201201, "epoch": 4790} {"train_loss": -7.2049641609191895, "global_step": 201202, "epoch": 4790} {"train_loss": -7.294857025146484, "global_step": 201203, "epoch": 4790} {"train_loss": -7.077313423156738, "global_step": 201204, "epoch": 4790} {"train_loss": -7.363727569580078, "global_step": 201205, "epoch": 4790} {"train_loss": -7.479562282562256, "global_step": 201206, "epoch": 4790} {"train_loss": -7.348813056945801, "global_step": 201207, "epoch": 4790} {"train_loss": -7.244357109069824, "global_step": 201208, "epoch": 4790} {"train_loss": -7.348538875579834, "global_step": 201209, "epoch": 4790} {"train_loss": -7.095035552978516, "global_step": 201210, "epoch": 4790} {"train_loss": -7.251673698425293, "global_step": 201211, "epoch": 4790} {"train_loss": -7.216155052185059, "global_step": 201212, "epoch": 4790} {"train_loss": -7.200818061828613, "global_step": 201213, "epoch": 4790} {"train_loss": -7.203946113586426, "global_step": 201214, "epoch": 4790} {"train_loss": -7.174324989318848, "global_step": 201215, "epoch": 4790} {"train_loss": -7.1725754737854, "global_step": 201216, "epoch": 4790} {"train_loss": -7.081783294677734, "global_step": 201217, "epoch": 4790} {"train_loss": -7.149651050567627, "global_step": 201218, "epoch": 4790} {"train_loss": -7.178197860717773, "global_step": 201219, "epoch": 4790} {"train_loss": -7.25723934173584, "global_step": 201220, "epoch": 4790} {"train_loss": -7.266011260804676, "global_step": 201221, "epoch": 4790, "val_loss": 81423.71875} {"train_loss": -7.189278602600098, "global_step": 201222, "epoch": 4791} {"train_loss": -7.148366451263428, "global_step": 201223, "epoch": 4791} {"train_loss": -7.232955455780029, "global_step": 201224, "epoch": 4791} {"train_loss": -7.08966064453125, "global_step": 201225, "epoch": 4791} {"train_loss": -7.252422332763672, "global_step": 201226, "epoch": 4791} {"train_loss": -7.215277671813965, "global_step": 201227, "epoch": 4791} {"train_loss": -7.2216081619262695, "global_step": 201228, "epoch": 4791} {"train_loss": -7.228621482849121, "global_step": 201229, "epoch": 4791} {"train_loss": -7.2608842849731445, "global_step": 201230, "epoch": 4791} {"train_loss": -7.3304524421691895, "global_step": 201231, "epoch": 4791} {"train_loss": -7.294294357299805, "global_step": 201232, "epoch": 4791} {"train_loss": -7.213093280792236, "global_step": 201233, "epoch": 4791} {"train_loss": -7.295441627502441, "global_step": 201234, "epoch": 4791} {"train_loss": -7.212882041931152, "global_step": 201235, "epoch": 4791} {"train_loss": -7.345391273498535, "global_step": 201236, "epoch": 4791} {"train_loss": -7.272680282592773, "global_step": 201237, "epoch": 4791} {"train_loss": -7.184779167175293, "global_step": 201238, "epoch": 4791} {"train_loss": -7.266138553619385, "global_step": 201239, "epoch": 4791} {"train_loss": -7.244585990905762, "global_step": 201240, "epoch": 4791} {"train_loss": -7.2479166984558105, "global_step": 201241, "epoch": 4791} {"train_loss": -7.253972053527832, "global_step": 201242, "epoch": 4791} {"train_loss": -7.325319766998291, "global_step": 201243, "epoch": 4791} {"train_loss": -7.257697582244873, "global_step": 201244, "epoch": 4791} {"train_loss": -7.312577247619629, "global_step": 201245, "epoch": 4791} {"train_loss": -7.2469282150268555, "global_step": 201246, "epoch": 4791} {"train_loss": -7.1858744621276855, "global_step": 201247, "epoch": 4791} {"train_loss": -7.241242408752441, "global_step": 201248, "epoch": 4791} {"train_loss": -7.188709735870361, "global_step": 201249, "epoch": 4791} {"train_loss": -7.265965938568115, "global_step": 201250, "epoch": 4791} {"train_loss": -7.292992115020752, "global_step": 201251, "epoch": 4791} {"train_loss": -7.335608959197998, "global_step": 201252, "epoch": 4791} {"train_loss": -7.355297088623047, "global_step": 201253, "epoch": 4791} {"train_loss": -7.189563751220703, "global_step": 201254, "epoch": 4791} {"train_loss": -7.358486652374268, "global_step": 201255, "epoch": 4791} {"train_loss": -7.3548479080200195, "global_step": 201256, "epoch": 4791} {"train_loss": -7.3238677978515625, "global_step": 201257, "epoch": 4791} {"train_loss": -7.308112144470215, "global_step": 201258, "epoch": 4791} {"train_loss": -7.326319694519043, "global_step": 201259, "epoch": 4791} {"train_loss": -7.308454513549805, "global_step": 201260, "epoch": 4791} {"train_loss": -7.354687690734863, "global_step": 201261, "epoch": 4791} {"train_loss": -7.293319225311279, "global_step": 201262, "epoch": 4791} {"train_loss": -7.267671267191569, "global_step": 201263, "epoch": 4791, "val_loss": 81444.890625} {"train_loss": -7.408262729644775, "global_step": 201264, "epoch": 4792} {"train_loss": -7.322739601135254, "global_step": 201265, "epoch": 4792} {"train_loss": -7.2939348220825195, "global_step": 201266, "epoch": 4792} {"train_loss": -7.285972595214844, "global_step": 201267, "epoch": 4792} {"train_loss": -7.296544551849365, "global_step": 201268, "epoch": 4792} {"train_loss": -7.250814914703369, "global_step": 201269, "epoch": 4792} {"train_loss": -7.204686164855957, "global_step": 201270, "epoch": 4792} {"train_loss": -7.21323823928833, "global_step": 201271, "epoch": 4792} {"train_loss": -7.2183332443237305, "global_step": 201272, "epoch": 4792} {"train_loss": -7.232630729675293, "global_step": 201273, "epoch": 4792} {"train_loss": -7.358915328979492, "global_step": 201274, "epoch": 4792} {"train_loss": -7.380369186401367, "global_step": 201275, "epoch": 4792} {"train_loss": -7.108717918395996, "global_step": 201276, "epoch": 4792} {"train_loss": -7.259140968322754, "global_step": 201277, "epoch": 4792} {"train_loss": -7.276721477508545, "global_step": 201278, "epoch": 4792} {"train_loss": -7.176883220672607, "global_step": 201279, "epoch": 4792} {"train_loss": -7.3314690589904785, "global_step": 201280, "epoch": 4792} {"train_loss": -7.2680158615112305, "global_step": 201281, "epoch": 4792} {"train_loss": -7.371013641357422, "global_step": 201282, "epoch": 4792} {"train_loss": -7.241510391235352, "global_step": 201283, "epoch": 4792} {"train_loss": -7.228427886962891, "global_step": 201284, "epoch": 4792} {"train_loss": -7.280006408691406, "global_step": 201285, "epoch": 4792} {"train_loss": -7.3900251388549805, "global_step": 201286, "epoch": 4792} {"train_loss": -7.1623616218566895, "global_step": 201287, "epoch": 4792} {"train_loss": -7.169790267944336, "global_step": 201288, "epoch": 4792} {"train_loss": -7.128674507141113, "global_step": 201289, "epoch": 4792} {"train_loss": -7.344192981719971, "global_step": 201290, "epoch": 4792} {"train_loss": -7.213176727294922, "global_step": 201291, "epoch": 4792} {"train_loss": -7.3423261642456055, "global_step": 201292, "epoch": 4792} {"train_loss": -7.268105506896973, "global_step": 201293, "epoch": 4792} {"train_loss": -7.39561128616333, "global_step": 201294, "epoch": 4792} {"train_loss": -7.351287841796875, "global_step": 201295, "epoch": 4792} {"train_loss": -7.418826103210449, "global_step": 201296, "epoch": 4792} {"train_loss": -7.388806343078613, "global_step": 201297, "epoch": 4792} {"train_loss": -7.255321025848389, "global_step": 201298, "epoch": 4792} {"train_loss": -7.2892165184021, "global_step": 201299, "epoch": 4792} {"train_loss": -7.383515357971191, "global_step": 201300, "epoch": 4792} {"train_loss": -7.274456977844238, "global_step": 201301, "epoch": 4792} {"train_loss": -7.238389015197754, "global_step": 201302, "epoch": 4792} {"train_loss": -7.370463848114014, "global_step": 201303, "epoch": 4792} {"train_loss": -7.2902350425720215, "global_step": 201304, "epoch": 4792} {"train_loss": -7.286440803891137, "global_step": 201305, "epoch": 4792, "val_loss": 81384.2734375} {"train_loss": -7.389871120452881, "global_step": 201306, "epoch": 4793} {"train_loss": -7.312534809112549, "global_step": 201307, "epoch": 4793} {"train_loss": -7.426356315612793, "global_step": 201308, "epoch": 4793} {"train_loss": -7.299801826477051, "global_step": 201309, "epoch": 4793} {"train_loss": -7.3424882888793945, "global_step": 201310, "epoch": 4793} {"train_loss": -7.382195949554443, "global_step": 201311, "epoch": 4793} {"train_loss": -7.336503505706787, "global_step": 201312, "epoch": 4793} {"train_loss": -7.345726013183594, "global_step": 201313, "epoch": 4793} {"train_loss": -7.365055561065674, "global_step": 201314, "epoch": 4793} {"train_loss": -7.343775749206543, "global_step": 201315, "epoch": 4793} {"train_loss": -7.333160400390625, "global_step": 201316, "epoch": 4793} {"train_loss": -7.37017297744751, "global_step": 201317, "epoch": 4793} {"train_loss": -7.279712677001953, "global_step": 201318, "epoch": 4793} {"train_loss": -7.424996852874756, "global_step": 201319, "epoch": 4793} {"train_loss": -7.230521202087402, "global_step": 201320, "epoch": 4793} {"train_loss": -7.328682899475098, "global_step": 201321, "epoch": 4793} {"train_loss": -7.19676399230957, "global_step": 201322, "epoch": 4793} {"train_loss": -7.339778900146484, "global_step": 201323, "epoch": 4793} {"train_loss": -7.404886722564697, "global_step": 201324, "epoch": 4793} {"train_loss": -7.2130537033081055, "global_step": 201325, "epoch": 4793} {"train_loss": -7.298111915588379, "global_step": 201326, "epoch": 4793} {"train_loss": -7.280490398406982, "global_step": 201327, "epoch": 4793} {"train_loss": -7.240041732788086, "global_step": 201328, "epoch": 4793} {"train_loss": -7.30143928527832, "global_step": 201329, "epoch": 4793} {"train_loss": -7.389671325683594, "global_step": 201330, "epoch": 4793} {"train_loss": -7.333643913269043, "global_step": 201331, "epoch": 4793} {"train_loss": -7.206727981567383, "global_step": 201332, "epoch": 4793} {"train_loss": -7.3049821853637695, "global_step": 201333, "epoch": 4793} {"train_loss": -7.19899845123291, "global_step": 201334, "epoch": 4793} {"train_loss": -7.302371978759766, "global_step": 201335, "epoch": 4793} {"train_loss": -7.2918853759765625, "global_step": 201336, "epoch": 4793} {"train_loss": -7.340636253356934, "global_step": 201337, "epoch": 4793} {"train_loss": -7.27889347076416, "global_step": 201338, "epoch": 4793} {"train_loss": -7.322176933288574, "global_step": 201339, "epoch": 4793} {"train_loss": -7.3321027755737305, "global_step": 201340, "epoch": 4793} {"train_loss": -7.390043258666992, "global_step": 201341, "epoch": 4793} {"train_loss": -7.21923303604126, "global_step": 201342, "epoch": 4793} {"train_loss": -7.25356388092041, "global_step": 201343, "epoch": 4793} {"train_loss": -7.332961082458496, "global_step": 201344, "epoch": 4793} {"train_loss": -7.278307914733887, "global_step": 201345, "epoch": 4793} {"train_loss": -7.386351585388184, "global_step": 201346, "epoch": 4793} {"train_loss": -7.318244934082031, "global_step": 201347, "epoch": 4793, "val_loss": 81449.5078125} {"train_loss": -7.34682559967041, "global_step": 201348, "epoch": 4794} {"train_loss": -7.368358135223389, "global_step": 201349, "epoch": 4794} {"train_loss": -7.259183883666992, "global_step": 201350, "epoch": 4794} {"train_loss": -7.288605690002441, "global_step": 201351, "epoch": 4794} {"train_loss": -7.366422653198242, "global_step": 201352, "epoch": 4794} {"train_loss": -7.338605880737305, "global_step": 201353, "epoch": 4794} {"train_loss": -7.410588264465332, "global_step": 201354, "epoch": 4794} {"train_loss": -7.445898056030273, "global_step": 201355, "epoch": 4794} {"train_loss": -7.383223533630371, "global_step": 201356, "epoch": 4794} {"train_loss": -7.435634613037109, "global_step": 201357, "epoch": 4794} {"train_loss": -7.3393049240112305, "global_step": 201358, "epoch": 4794} {"train_loss": -7.455310821533203, "global_step": 201359, "epoch": 4794} {"train_loss": -7.433506011962891, "global_step": 201360, "epoch": 4794} {"train_loss": -7.344771385192871, "global_step": 201361, "epoch": 4794} {"train_loss": -7.465827941894531, "global_step": 201362, "epoch": 4794} {"train_loss": -7.2918925285339355, "global_step": 201363, "epoch": 4794} {"train_loss": -7.393693923950195, "global_step": 201364, "epoch": 4794} {"train_loss": -7.299681186676025, "global_step": 201365, "epoch": 4794} {"train_loss": -7.368650913238525, "global_step": 201366, "epoch": 4794} {"train_loss": -7.378357410430908, "global_step": 201367, "epoch": 4794} {"train_loss": -7.415034294128418, "global_step": 201368, "epoch": 4794} {"train_loss": -7.279479026794434, "global_step": 201369, "epoch": 4794} {"train_loss": -7.285019874572754, "global_step": 201370, "epoch": 4794} {"train_loss": -7.394983291625977, "global_step": 201371, "epoch": 4794} {"train_loss": -7.29116153717041, "global_step": 201372, "epoch": 4794} {"train_loss": -7.343136787414551, "global_step": 201373, "epoch": 4794} {"train_loss": -7.299338340759277, "global_step": 201374, "epoch": 4794} {"train_loss": -7.321390151977539, "global_step": 201375, "epoch": 4794} {"train_loss": -7.41172981262207, "global_step": 201376, "epoch": 4794} {"train_loss": -7.286199569702148, "global_step": 201377, "epoch": 4794} {"train_loss": -7.228357315063477, "global_step": 201378, "epoch": 4794} {"train_loss": -7.261228561401367, "global_step": 201379, "epoch": 4794} {"train_loss": -7.376953125, "global_step": 201380, "epoch": 4794} {"train_loss": -7.403609752655029, "global_step": 201381, "epoch": 4794} {"train_loss": -7.362273216247559, "global_step": 201382, "epoch": 4794} {"train_loss": -7.300403118133545, "global_step": 201383, "epoch": 4794} {"train_loss": -7.219076156616211, "global_step": 201384, "epoch": 4794} {"train_loss": -7.276035308837891, "global_step": 201385, "epoch": 4794} {"train_loss": -7.372641086578369, "global_step": 201386, "epoch": 4794} {"train_loss": -7.492501258850098, "global_step": 201387, "epoch": 4794} {"train_loss": -7.241281032562256, "global_step": 201388, "epoch": 4794} {"train_loss": -7.348281576519921, "global_step": 201389, "epoch": 4794, "val_loss": 81623.890625} {"train_loss": -7.206132888793945, "global_step": 201390, "epoch": 4795} {"train_loss": -7.358819007873535, "global_step": 201391, "epoch": 4795} {"train_loss": -7.28731107711792, "global_step": 201392, "epoch": 4795} {"train_loss": -7.139192581176758, "global_step": 201393, "epoch": 4795} {"train_loss": -7.283167839050293, "global_step": 201394, "epoch": 4795} {"train_loss": -7.206586837768555, "global_step": 201395, "epoch": 4795} {"train_loss": -7.158483505249023, "global_step": 201396, "epoch": 4795} {"train_loss": -7.263120651245117, "global_step": 201397, "epoch": 4795} {"train_loss": -7.392668724060059, "global_step": 201398, "epoch": 4795} {"train_loss": -7.196392059326172, "global_step": 201399, "epoch": 4795} {"train_loss": -7.289053916931152, "global_step": 201400, "epoch": 4795} {"train_loss": -7.275357246398926, "global_step": 201401, "epoch": 4795} {"train_loss": -7.302826404571533, "global_step": 201402, "epoch": 4795} {"train_loss": -7.273468971252441, "global_step": 201403, "epoch": 4795} {"train_loss": -7.218043327331543, "global_step": 201404, "epoch": 4795} {"train_loss": -7.382676124572754, "global_step": 201405, "epoch": 4795} {"train_loss": -7.34945011138916, "global_step": 201406, "epoch": 4795} {"train_loss": -7.227542877197266, "global_step": 201407, "epoch": 4795} {"train_loss": -7.187370300292969, "global_step": 201408, "epoch": 4795} {"train_loss": -7.202112197875977, "global_step": 201409, "epoch": 4795} {"train_loss": -7.321054935455322, "global_step": 201410, "epoch": 4795} {"train_loss": -7.163389682769775, "global_step": 201411, "epoch": 4795} {"train_loss": -7.247169494628906, "global_step": 201412, "epoch": 4795} {"train_loss": -7.25637674331665, "global_step": 201413, "epoch": 4795} {"train_loss": -7.207564353942871, "global_step": 201414, "epoch": 4795} {"train_loss": -7.200878143310547, "global_step": 201415, "epoch": 4795} {"train_loss": -7.052227020263672, "global_step": 201416, "epoch": 4795} {"train_loss": -7.20596981048584, "global_step": 201417, "epoch": 4795} {"train_loss": -7.200037956237793, "global_step": 201418, "epoch": 4795} {"train_loss": -7.231400012969971, "global_step": 201419, "epoch": 4795} {"train_loss": -7.258644104003906, "global_step": 201420, "epoch": 4795} {"train_loss": -7.193998336791992, "global_step": 201421, "epoch": 4795} {"train_loss": -7.168428421020508, "global_step": 201422, "epoch": 4795} {"train_loss": -7.2972869873046875, "global_step": 201423, "epoch": 4795} {"train_loss": -7.186066627502441, "global_step": 201424, "epoch": 4795} {"train_loss": -7.152836322784424, "global_step": 201425, "epoch": 4795} {"train_loss": -7.281383991241455, "global_step": 201426, "epoch": 4795} {"train_loss": -7.1678009033203125, "global_step": 201427, "epoch": 4795} {"train_loss": -7.2063188552856445, "global_step": 201428, "epoch": 4795} {"train_loss": -7.235274314880371, "global_step": 201429, "epoch": 4795} {"train_loss": -7.261772155761719, "global_step": 201430, "epoch": 4795} {"train_loss": -7.237031482514881, "global_step": 201431, "epoch": 4795, "val_loss": 81476.2890625} {"train_loss": -7.255673408508301, "global_step": 201432, "epoch": 4796} {"train_loss": -7.355373382568359, "global_step": 201433, "epoch": 4796} {"train_loss": -7.310428619384766, "global_step": 201434, "epoch": 4796} {"train_loss": -7.2786407470703125, "global_step": 201435, "epoch": 4796} {"train_loss": -7.380984783172607, "global_step": 201436, "epoch": 4796} {"train_loss": -7.314620494842529, "global_step": 201437, "epoch": 4796} {"train_loss": -7.297434329986572, "global_step": 201438, "epoch": 4796} {"train_loss": -7.394416809082031, "global_step": 201439, "epoch": 4796} {"train_loss": -7.199192047119141, "global_step": 201440, "epoch": 4796} {"train_loss": -7.2606940269470215, "global_step": 201441, "epoch": 4796} {"train_loss": -7.158577919006348, "global_step": 201442, "epoch": 4796} {"train_loss": -7.098696708679199, "global_step": 201443, "epoch": 4796} {"train_loss": -7.17962646484375, "global_step": 201444, "epoch": 4796} {"train_loss": -7.331437110900879, "global_step": 201445, "epoch": 4796} {"train_loss": -7.152896881103516, "global_step": 201446, "epoch": 4796} {"train_loss": -7.07578706741333, "global_step": 201447, "epoch": 4796} {"train_loss": -7.125048637390137, "global_step": 201448, "epoch": 4796} {"train_loss": -7.035700798034668, "global_step": 201449, "epoch": 4796} {"train_loss": -7.250563144683838, "global_step": 201450, "epoch": 4796} {"train_loss": -6.8268232345581055, "global_step": 201451, "epoch": 4796} {"train_loss": -7.080601692199707, "global_step": 201452, "epoch": 4796} {"train_loss": -7.287359237670898, "global_step": 201453, "epoch": 4796} {"train_loss": -7.172689914703369, "global_step": 201454, "epoch": 4796} {"train_loss": -6.997229099273682, "global_step": 201455, "epoch": 4796} {"train_loss": -7.158178329467773, "global_step": 201456, "epoch": 4796} {"train_loss": -7.110803127288818, "global_step": 201457, "epoch": 4796} {"train_loss": -7.111747741699219, "global_step": 201458, "epoch": 4796} {"train_loss": -7.26834774017334, "global_step": 201459, "epoch": 4796} {"train_loss": -7.163179397583008, "global_step": 201460, "epoch": 4796} {"train_loss": -7.310407638549805, "global_step": 201461, "epoch": 4796} {"train_loss": -7.157454013824463, "global_step": 201462, "epoch": 4796} {"train_loss": -7.16648006439209, "global_step": 201463, "epoch": 4796} {"train_loss": -7.2310686111450195, "global_step": 201464, "epoch": 4796} {"train_loss": -7.194484710693359, "global_step": 201465, "epoch": 4796} {"train_loss": -7.2852702140808105, "global_step": 201466, "epoch": 4796} {"train_loss": -7.142065048217773, "global_step": 201467, "epoch": 4796} {"train_loss": -7.404881477355957, "global_step": 201468, "epoch": 4796} {"train_loss": -7.310724258422852, "global_step": 201469, "epoch": 4796} {"train_loss": -7.295792579650879, "global_step": 201470, "epoch": 4796} {"train_loss": -7.307643413543701, "global_step": 201471, "epoch": 4796} {"train_loss": -7.3010149002075195, "global_step": 201472, "epoch": 4796} {"train_loss": -7.214892296564011, "global_step": 201473, "epoch": 4796, "val_loss": 81433.5546875} {"train_loss": -7.134183406829834, "global_step": 201474, "epoch": 4797} {"train_loss": -7.371891975402832, "global_step": 201475, "epoch": 4797} {"train_loss": -7.236340045928955, "global_step": 201476, "epoch": 4797} {"train_loss": -7.173370361328125, "global_step": 201477, "epoch": 4797} {"train_loss": -7.438847541809082, "global_step": 201478, "epoch": 4797} {"train_loss": -7.113821983337402, "global_step": 201479, "epoch": 4797} {"train_loss": -7.319094657897949, "global_step": 201480, "epoch": 4797} {"train_loss": -7.24285888671875, "global_step": 201481, "epoch": 4797} {"train_loss": -7.330136299133301, "global_step": 201482, "epoch": 4797} {"train_loss": -7.211108207702637, "global_step": 201483, "epoch": 4797} {"train_loss": -7.1983137130737305, "global_step": 201484, "epoch": 4797} {"train_loss": -7.2418670654296875, "global_step": 201485, "epoch": 4797} {"train_loss": -7.249420166015625, "global_step": 201486, "epoch": 4797} {"train_loss": -7.26960563659668, "global_step": 201487, "epoch": 4797} {"train_loss": -7.217985153198242, "global_step": 201488, "epoch": 4797} {"train_loss": -7.3094587326049805, "global_step": 201489, "epoch": 4797} {"train_loss": -7.337240219116211, "global_step": 201490, "epoch": 4797} {"train_loss": -7.34697961807251, "global_step": 201491, "epoch": 4797} {"train_loss": -7.378724098205566, "global_step": 201492, "epoch": 4797} {"train_loss": -7.293169021606445, "global_step": 201493, "epoch": 4797} {"train_loss": -7.346657752990723, "global_step": 201494, "epoch": 4797} {"train_loss": -7.178327560424805, "global_step": 201495, "epoch": 4797} {"train_loss": -7.227314472198486, "global_step": 201496, "epoch": 4797} {"train_loss": -7.183825969696045, "global_step": 201497, "epoch": 4797} {"train_loss": -7.3983564376831055, "global_step": 201498, "epoch": 4797} {"train_loss": -7.214168548583984, "global_step": 201499, "epoch": 4797} {"train_loss": -7.116862773895264, "global_step": 201500, "epoch": 4797} {"train_loss": -7.2697296142578125, "global_step": 201501, "epoch": 4797} {"train_loss": -7.098982810974121, "global_step": 201502, "epoch": 4797} {"train_loss": -7.269988059997559, "global_step": 201503, "epoch": 4797} {"train_loss": -7.2006940841674805, "global_step": 201504, "epoch": 4797} {"train_loss": -7.14536190032959, "global_step": 201505, "epoch": 4797} {"train_loss": -7.234520435333252, "global_step": 201506, "epoch": 4797} {"train_loss": -7.179860591888428, "global_step": 201507, "epoch": 4797} {"train_loss": -7.407138347625732, "global_step": 201508, "epoch": 4797} {"train_loss": -7.271252155303955, "global_step": 201509, "epoch": 4797} {"train_loss": -7.331962585449219, "global_step": 201510, "epoch": 4797} {"train_loss": -7.3274149894714355, "global_step": 201511, "epoch": 4797} {"train_loss": -7.330837249755859, "global_step": 201512, "epoch": 4797} {"train_loss": -7.28617525100708, "global_step": 201513, "epoch": 4797} {"train_loss": -7.27031135559082, "global_step": 201514, "epoch": 4797} {"train_loss": -7.261790309633527, "global_step": 201515, "epoch": 4797, "val_loss": 81403.7265625} {"train_loss": -7.256189346313477, "global_step": 201516, "epoch": 4798} {"train_loss": -7.344597339630127, "global_step": 201517, "epoch": 4798} {"train_loss": -7.296706199645996, "global_step": 201518, "epoch": 4798} {"train_loss": -7.313732147216797, "global_step": 201519, "epoch": 4798} {"train_loss": -7.320481777191162, "global_step": 201520, "epoch": 4798} {"train_loss": -7.320807933807373, "global_step": 201521, "epoch": 4798} {"train_loss": -7.328426361083984, "global_step": 201522, "epoch": 4798} {"train_loss": -7.350732803344727, "global_step": 201523, "epoch": 4798} {"train_loss": -7.412351131439209, "global_step": 201524, "epoch": 4798} {"train_loss": -7.413007736206055, "global_step": 201525, "epoch": 4798} {"train_loss": -7.325014591217041, "global_step": 201526, "epoch": 4798} {"train_loss": -7.279196739196777, "global_step": 201527, "epoch": 4798} {"train_loss": -7.395514488220215, "global_step": 201528, "epoch": 4798} {"train_loss": -7.345179080963135, "global_step": 201529, "epoch": 4798} {"train_loss": -7.497910499572754, "global_step": 201530, "epoch": 4798} {"train_loss": -7.322548866271973, "global_step": 201531, "epoch": 4798} {"train_loss": -7.3801679611206055, "global_step": 201532, "epoch": 4798} {"train_loss": -7.335881233215332, "global_step": 201533, "epoch": 4798} {"train_loss": -7.469566822052002, "global_step": 201534, "epoch": 4798} {"train_loss": -7.313345909118652, "global_step": 201535, "epoch": 4798} {"train_loss": -7.271227836608887, "global_step": 201536, "epoch": 4798} {"train_loss": -7.380459785461426, "global_step": 201537, "epoch": 4798} {"train_loss": -7.199650287628174, "global_step": 201538, "epoch": 4798} {"train_loss": -7.372269630432129, "global_step": 201539, "epoch": 4798} {"train_loss": -7.433704376220703, "global_step": 201540, "epoch": 4798} {"train_loss": -7.2740797996521, "global_step": 201541, "epoch": 4798} {"train_loss": -7.166880130767822, "global_step": 201542, "epoch": 4798} {"train_loss": -7.304351806640625, "global_step": 201543, "epoch": 4798} {"train_loss": -7.3955278396606445, "global_step": 201544, "epoch": 4798} {"train_loss": -7.256694316864014, "global_step": 201545, "epoch": 4798} {"train_loss": -7.243849754333496, "global_step": 201546, "epoch": 4798} {"train_loss": -7.350281715393066, "global_step": 201547, "epoch": 4798} {"train_loss": -7.394013404846191, "global_step": 201548, "epoch": 4798} {"train_loss": -7.330147743225098, "global_step": 201549, "epoch": 4798} {"train_loss": -7.261463165283203, "global_step": 201550, "epoch": 4798} {"train_loss": -7.140645980834961, "global_step": 201551, "epoch": 4798} {"train_loss": -7.301116943359375, "global_step": 201552, "epoch": 4798} {"train_loss": -7.325852870941162, "global_step": 201553, "epoch": 4798} {"train_loss": -7.285892486572266, "global_step": 201554, "epoch": 4798} {"train_loss": -7.249916076660156, "global_step": 201555, "epoch": 4798} {"train_loss": -7.30876350402832, "global_step": 201556, "epoch": 4798} {"train_loss": -7.324425254549299, "global_step": 201557, "epoch": 4798, "val_loss": 81763.7421875} {"train_loss": -7.3129730224609375, "global_step": 201558, "epoch": 4799} {"train_loss": -7.330466270446777, "global_step": 201559, "epoch": 4799} {"train_loss": -7.421369552612305, "global_step": 201560, "epoch": 4799} {"train_loss": -7.339485168457031, "global_step": 201561, "epoch": 4799} {"train_loss": -7.2983717918396, "global_step": 201562, "epoch": 4799} {"train_loss": -7.337606430053711, "global_step": 201563, "epoch": 4799} {"train_loss": -7.327084541320801, "global_step": 201564, "epoch": 4799} {"train_loss": -7.2705512046813965, "global_step": 201565, "epoch": 4799} {"train_loss": -7.351019859313965, "global_step": 201566, "epoch": 4799} {"train_loss": -7.3819732666015625, "global_step": 201567, "epoch": 4799} {"train_loss": -7.322212219238281, "global_step": 201568, "epoch": 4799} {"train_loss": -7.309908866882324, "global_step": 201569, "epoch": 4799} {"train_loss": -7.460190773010254, "global_step": 201570, "epoch": 4799} {"train_loss": -7.2674078941345215, "global_step": 201571, "epoch": 4799} {"train_loss": -7.373383522033691, "global_step": 201572, "epoch": 4799} {"train_loss": -7.354921340942383, "global_step": 201573, "epoch": 4799} {"train_loss": -7.222315788269043, "global_step": 201574, "epoch": 4799} {"train_loss": -7.334478378295898, "global_step": 201575, "epoch": 4799} {"train_loss": -7.317078590393066, "global_step": 201576, "epoch": 4799} {"train_loss": -7.321652412414551, "global_step": 201577, "epoch": 4799} {"train_loss": -7.322968482971191, "global_step": 201578, "epoch": 4799} {"train_loss": -7.299661636352539, "global_step": 201579, "epoch": 4799} {"train_loss": -7.252135276794434, "global_step": 201580, "epoch": 4799} {"train_loss": -7.284285545349121, "global_step": 201581, "epoch": 4799} {"train_loss": -7.281680583953857, "global_step": 201582, "epoch": 4799} {"train_loss": -7.231349945068359, "global_step": 201583, "epoch": 4799} {"train_loss": -7.1269330978393555, "global_step": 201584, "epoch": 4799} {"train_loss": -7.302276134490967, "global_step": 201585, "epoch": 4799} {"train_loss": -7.304956912994385, "global_step": 201586, "epoch": 4799} {"train_loss": -7.164165019989014, "global_step": 201587, "epoch": 4799} {"train_loss": -7.308013439178467, "global_step": 201588, "epoch": 4799} {"train_loss": -7.159267425537109, "global_step": 201589, "epoch": 4799} {"train_loss": -7.268747329711914, "global_step": 201590, "epoch": 4799} {"train_loss": -7.325593948364258, "global_step": 201591, "epoch": 4799} {"train_loss": -7.314352035522461, "global_step": 201592, "epoch": 4799} {"train_loss": -7.267645835876465, "global_step": 201593, "epoch": 4799} {"train_loss": -7.342832088470459, "global_step": 201594, "epoch": 4799} {"train_loss": -7.280546188354492, "global_step": 201595, "epoch": 4799} {"train_loss": -7.202892303466797, "global_step": 201596, "epoch": 4799} {"train_loss": -7.304704189300537, "global_step": 201597, "epoch": 4799} {"train_loss": -7.283504486083984, "global_step": 201598, "epoch": 4799} {"train_loss": -7.301648968742008, "global_step": 201599, "epoch": 4799, "val_loss": 81562.71875} {"train_loss": -7.406728744506836, "global_step": 201600, "epoch": 4800} {"train_loss": -7.358497619628906, "global_step": 201601, "epoch": 4800} {"train_loss": -7.297233581542969, "global_step": 201602, "epoch": 4800} {"train_loss": -7.373072624206543, "global_step": 201603, "epoch": 4800} {"train_loss": -7.236780166625977, "global_step": 201604, "epoch": 4800} {"train_loss": -7.376640796661377, "global_step": 201605, "epoch": 4800} {"train_loss": -7.262142181396484, "global_step": 201606, "epoch": 4800} {"train_loss": -7.388745307922363, "global_step": 201607, "epoch": 4800} {"train_loss": -7.409130573272705, "global_step": 201608, "epoch": 4800} {"train_loss": -7.38681697845459, "global_step": 201609, "epoch": 4800} {"train_loss": -7.37541389465332, "global_step": 201610, "epoch": 4800} {"train_loss": -7.193464756011963, "global_step": 201611, "epoch": 4800} {"train_loss": -7.43697452545166, "global_step": 201612, "epoch": 4800} {"train_loss": -7.355733871459961, "global_step": 201613, "epoch": 4800} {"train_loss": -7.31112813949585, "global_step": 201614, "epoch": 4800} {"train_loss": -7.4124884605407715, "global_step": 201615, "epoch": 4800} {"train_loss": -7.43983268737793, "global_step": 201616, "epoch": 4800} {"train_loss": -7.4426960945129395, "global_step": 201617, "epoch": 4800} {"train_loss": -7.286111354827881, "global_step": 201618, "epoch": 4800} {"train_loss": -7.401134014129639, "global_step": 201619, "epoch": 4800} {"train_loss": -7.402915954589844, "global_step": 201620, "epoch": 4800} {"train_loss": -7.401365280151367, "global_step": 201621, "epoch": 4800} {"train_loss": -7.319307327270508, "global_step": 201622, "epoch": 4800} {"train_loss": -7.399813652038574, "global_step": 201623, "epoch": 4800} {"train_loss": -7.31911563873291, "global_step": 201624, "epoch": 4800} {"train_loss": -7.330558776855469, "global_step": 201625, "epoch": 4800} {"train_loss": -7.309363842010498, "global_step": 201626, "epoch": 4800} {"train_loss": -7.472866535186768, "global_step": 201627, "epoch": 4800} {"train_loss": -7.483625411987305, "global_step": 201628, "epoch": 4800} {"train_loss": -7.352784156799316, "global_step": 201629, "epoch": 4800} {"train_loss": -7.4206862449646, "global_step": 201630, "epoch": 4800} {"train_loss": -7.426945686340332, "global_step": 201631, "epoch": 4800} {"train_loss": -7.228672981262207, "global_step": 201632, "epoch": 4800} {"train_loss": -7.338582992553711, "global_step": 201633, "epoch": 4800} {"train_loss": -7.39618444442749, "global_step": 201634, "epoch": 4800} {"train_loss": -7.372722625732422, "global_step": 201635, "epoch": 4800} {"train_loss": -7.322854995727539, "global_step": 201636, "epoch": 4800} {"train_loss": -7.254919528961182, "global_step": 201637, "epoch": 4800} {"train_loss": -7.36897087097168, "global_step": 201638, "epoch": 4800} {"train_loss": -7.3618011474609375, "global_step": 201639, "epoch": 4800} {"train_loss": -7.384437561035156, "global_step": 201640, "epoch": 4800} {"train_loss": -7.358082442056565, "global_step": 201641, "epoch": 4800, "train/sim_max_reward_0": 0.9696317129768456, "train/sim_max_reward_1": 0.9087170734830315, "train/sim_max_reward_2": 0.47454700557783597, "train/sim_max_reward_3": 0.13695616958569892, "train/sim_max_reward_4": 0.9498861953500644, "train/sim_max_reward_5": 0.5598484543865002, "test/sim_max_reward_4500000": 0.9646965779231914, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 0.9454670959876055, "test/sim_max_reward_4500003": 0.9354318945039504, "test/sim_max_reward_4500004": 0.20141849828801914, "test/sim_max_reward_4500005": 0.2669545394879116, "test/sim_max_reward_4500006": 1.0, "test/sim_max_reward_4500007": 1.0, "test/sim_max_reward_4500008": 0.3501821821006952, "test/sim_max_reward_4500009": 0.0529392574676389, "test/sim_max_reward_4500010": 0.15098076422496098, "test/sim_max_reward_4500011": 0.9612394819866639, "test/sim_max_reward_4500012": 0.9685230738390724, "test/sim_max_reward_4500013": 0.008670985692138741, "test/sim_max_reward_4500014": 0.9567557328138115, "test/sim_max_reward_4500015": 0.98364535592589, "test/sim_max_reward_4500016": 0.016252761917270736, "test/sim_max_reward_4500017": 0.07608321371389098, "test/sim_max_reward_4500018": 0.9426455696515441, "test/sim_max_reward_4500019": 0.866255145467881, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8783157144582749, "test/sim_max_reward_4500022": 0.905922294680108, "test/sim_max_reward_4500023": 0.9514118106652465, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.4556044922326755, "test/sim_max_reward_4500026": 0.8159815710404308, "test/sim_max_reward_4500027": 0.9982724059596434, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.06958262596901314, "test/sim_max_reward_4500030": 0.9959339571702986, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.7191571410912253, "test/sim_max_reward_4500034": 0.9360902212460888, "test/sim_max_reward_4500035": 0.8993092515330225, "test/sim_max_reward_4500036": 0.47730774950038235, "test/sim_max_reward_4500037": 1.0, "test/sim_max_reward_4500038": 0.32012188764258687, "test/sim_max_reward_4500039": 0.9117296702283157, "test/sim_max_reward_4500040": 1.0, "test/sim_max_reward_4500041": 0.9829707925299203, "test/sim_max_reward_4500042": 0.04356416171679369, "test/sim_max_reward_4500043": 0.9662224894065073, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.8927500583510277, "test/sim_max_reward_4500046": 0.08194161144966647, "test/sim_max_reward_4500047": 0.19420338457400735, "test/sim_max_reward_4500048": 0.9988263235741713, "test/sim_max_reward_4500049": 0.8294891900870776, "train/mean_score": 0.6665977685599961, "test/mean_score": 0.584150757732469, "val_loss": 81570.1328125} {"train_loss": -7.373814582824707, "global_step": 201642, "epoch": 4801} {"train_loss": -7.3527936935424805, "global_step": 201643, "epoch": 4801} {"train_loss": -7.439055442810059, "global_step": 201644, "epoch": 4801} {"train_loss": -7.388099670410156, "global_step": 201645, "epoch": 4801} {"train_loss": -7.316531181335449, "global_step": 201646, "epoch": 4801} {"train_loss": -7.380080223083496, "global_step": 201647, "epoch": 4801} {"train_loss": -7.3116536140441895, "global_step": 201648, "epoch": 4801} {"train_loss": -7.377925872802734, "global_step": 201649, "epoch": 4801} {"train_loss": -7.253992557525635, "global_step": 201650, "epoch": 4801} {"train_loss": -7.241903781890869, "global_step": 201651, "epoch": 4801} {"train_loss": -7.187261581420898, "global_step": 201652, "epoch": 4801} {"train_loss": -7.2361226081848145, "global_step": 201653, "epoch": 4801} {"train_loss": -7.294346809387207, "global_step": 201654, "epoch": 4801} {"train_loss": -7.244542121887207, "global_step": 201655, "epoch": 4801} {"train_loss": -7.210270881652832, "global_step": 201656, "epoch": 4801} {"train_loss": -7.260915756225586, "global_step": 201657, "epoch": 4801} {"train_loss": -7.24421501159668, "global_step": 201658, "epoch": 4801} {"train_loss": -7.353055477142334, "global_step": 201659, "epoch": 4801} {"train_loss": -7.1715850830078125, "global_step": 201660, "epoch": 4801} {"train_loss": -7.238604545593262, "global_step": 201661, "epoch": 4801} {"train_loss": -7.2724738121032715, "global_step": 201662, "epoch": 4801} {"train_loss": -7.311192989349365, "global_step": 201663, "epoch": 4801} {"train_loss": -7.258995056152344, "global_step": 201664, "epoch": 4801} {"train_loss": -7.229188919067383, "global_step": 201665, "epoch": 4801} {"train_loss": -7.35140323638916, "global_step": 201666, "epoch": 4801} {"train_loss": -7.203713893890381, "global_step": 201667, "epoch": 4801} {"train_loss": -7.31317663192749, "global_step": 201668, "epoch": 4801} {"train_loss": -7.278138160705566, "global_step": 201669, "epoch": 4801} {"train_loss": -7.240264892578125, "global_step": 201670, "epoch": 4801} {"train_loss": -7.255095481872559, "global_step": 201671, "epoch": 4801} {"train_loss": -7.1761250495910645, "global_step": 201672, "epoch": 4801} {"train_loss": -7.324281692504883, "global_step": 201673, "epoch": 4801} {"train_loss": -7.30306339263916, "global_step": 201674, "epoch": 4801} {"train_loss": -7.140022277832031, "global_step": 201675, "epoch": 4801} {"train_loss": -7.178170680999756, "global_step": 201676, "epoch": 4801} {"train_loss": -7.245042324066162, "global_step": 201677, "epoch": 4801} {"train_loss": -7.191059112548828, "global_step": 201678, "epoch": 4801} {"train_loss": -7.3224053382873535, "global_step": 201679, "epoch": 4801} {"train_loss": -7.214805603027344, "global_step": 201680, "epoch": 4801} {"train_loss": -7.261473655700684, "global_step": 201681, "epoch": 4801} {"train_loss": -7.347892761230469, "global_step": 201682, "epoch": 4801} {"train_loss": -7.272426752817063, "global_step": 201683, "epoch": 4801, "val_loss": 81685.1953125} {"train_loss": -7.251544952392578, "global_step": 201684, "epoch": 4802} {"train_loss": -7.147035598754883, "global_step": 201685, "epoch": 4802} {"train_loss": -7.289638519287109, "global_step": 201686, "epoch": 4802} {"train_loss": -7.310661315917969, "global_step": 201687, "epoch": 4802} {"train_loss": -7.150960922241211, "global_step": 201688, "epoch": 4802} {"train_loss": -7.394868850708008, "global_step": 201689, "epoch": 4802} {"train_loss": -7.228000640869141, "global_step": 201690, "epoch": 4802} {"train_loss": -7.210902214050293, "global_step": 201691, "epoch": 4802} {"train_loss": -7.258647441864014, "global_step": 201692, "epoch": 4802} {"train_loss": -7.30097770690918, "global_step": 201693, "epoch": 4802} {"train_loss": -7.325442790985107, "global_step": 201694, "epoch": 4802} {"train_loss": -7.19160270690918, "global_step": 201695, "epoch": 4802} {"train_loss": -7.191755294799805, "global_step": 201696, "epoch": 4802} {"train_loss": -7.299731254577637, "global_step": 201697, "epoch": 4802} {"train_loss": -7.256885528564453, "global_step": 201698, "epoch": 4802} {"train_loss": -7.236204624176025, "global_step": 201699, "epoch": 4802} {"train_loss": -7.384425163269043, "global_step": 201700, "epoch": 4802} {"train_loss": -7.293307304382324, "global_step": 201701, "epoch": 4802} {"train_loss": -7.365686416625977, "global_step": 201702, "epoch": 4802} {"train_loss": -7.174777507781982, "global_step": 201703, "epoch": 4802} {"train_loss": -7.230719089508057, "global_step": 201704, "epoch": 4802} {"train_loss": -7.333436965942383, "global_step": 201705, "epoch": 4802} {"train_loss": -7.315334320068359, "global_step": 201706, "epoch": 4802} {"train_loss": -7.25364351272583, "global_step": 201707, "epoch": 4802} {"train_loss": -7.262880802154541, "global_step": 201708, "epoch": 4802} {"train_loss": -7.294556140899658, "global_step": 201709, "epoch": 4802} {"train_loss": -7.275481224060059, "global_step": 201710, "epoch": 4802} {"train_loss": -7.277852535247803, "global_step": 201711, "epoch": 4802} {"train_loss": -7.264001369476318, "global_step": 201712, "epoch": 4802} {"train_loss": -7.258955001831055, "global_step": 201713, "epoch": 4802} {"train_loss": -7.40739631652832, "global_step": 201714, "epoch": 4802} {"train_loss": -7.274628639221191, "global_step": 201715, "epoch": 4802} {"train_loss": -7.3248066902160645, "global_step": 201716, "epoch": 4802} {"train_loss": -7.361659049987793, "global_step": 201717, "epoch": 4802} {"train_loss": -7.338611125946045, "global_step": 201718, "epoch": 4802} {"train_loss": -7.1632490158081055, "global_step": 201719, "epoch": 4802} {"train_loss": -7.394002914428711, "global_step": 201720, "epoch": 4802} {"train_loss": -7.292083740234375, "global_step": 201721, "epoch": 4802} {"train_loss": -7.364095687866211, "global_step": 201722, "epoch": 4802} {"train_loss": -7.233794212341309, "global_step": 201723, "epoch": 4802} {"train_loss": -7.197779655456543, "global_step": 201724, "epoch": 4802} {"train_loss": -7.276680912290301, "global_step": 201725, "epoch": 4802, "val_loss": 81510.5859375} {"train_loss": -7.207252502441406, "global_step": 201726, "epoch": 4803} {"train_loss": -7.0357465744018555, "global_step": 201727, "epoch": 4803} {"train_loss": -7.268239498138428, "global_step": 201728, "epoch": 4803} {"train_loss": -7.156310081481934, "global_step": 201729, "epoch": 4803} {"train_loss": -7.070374965667725, "global_step": 201730, "epoch": 4803} {"train_loss": -7.260406017303467, "global_step": 201731, "epoch": 4803} {"train_loss": -7.07526969909668, "global_step": 201732, "epoch": 4803} {"train_loss": -7.196776866912842, "global_step": 201733, "epoch": 4803} {"train_loss": -7.160536766052246, "global_step": 201734, "epoch": 4803} {"train_loss": -7.15854549407959, "global_step": 201735, "epoch": 4803} {"train_loss": -7.075090408325195, "global_step": 201736, "epoch": 4803} {"train_loss": -7.155078887939453, "global_step": 201737, "epoch": 4803} {"train_loss": -7.239555358886719, "global_step": 201738, "epoch": 4803} {"train_loss": -7.019556045532227, "global_step": 201739, "epoch": 4803} {"train_loss": -7.3386664390563965, "global_step": 201740, "epoch": 4803} {"train_loss": -7.145092964172363, "global_step": 201741, "epoch": 4803} {"train_loss": -7.2327752113342285, "global_step": 201742, "epoch": 4803} {"train_loss": -7.159518241882324, "global_step": 201743, "epoch": 4803} {"train_loss": -7.282589912414551, "global_step": 201744, "epoch": 4803} {"train_loss": -7.239152908325195, "global_step": 201745, "epoch": 4803} {"train_loss": -7.206752777099609, "global_step": 201746, "epoch": 4803} {"train_loss": -7.098000526428223, "global_step": 201747, "epoch": 4803} {"train_loss": -7.223455905914307, "global_step": 201748, "epoch": 4803} {"train_loss": -7.295582294464111, "global_step": 201749, "epoch": 4803} {"train_loss": -7.386989116668701, "global_step": 201750, "epoch": 4803} {"train_loss": -7.172366142272949, "global_step": 201751, "epoch": 4803} {"train_loss": -7.184252738952637, "global_step": 201752, "epoch": 4803} {"train_loss": -7.148907661437988, "global_step": 201753, "epoch": 4803} {"train_loss": -7.091608047485352, "global_step": 201754, "epoch": 4803} {"train_loss": -7.291570663452148, "global_step": 201755, "epoch": 4803} {"train_loss": -7.258164405822754, "global_step": 201756, "epoch": 4803} {"train_loss": -7.306689262390137, "global_step": 201757, "epoch": 4803} {"train_loss": -7.226925373077393, "global_step": 201758, "epoch": 4803} {"train_loss": -7.219712257385254, "global_step": 201759, "epoch": 4803} {"train_loss": -7.211182594299316, "global_step": 201760, "epoch": 4803} {"train_loss": -7.275388717651367, "global_step": 201761, "epoch": 4803} {"train_loss": -7.3496246337890625, "global_step": 201762, "epoch": 4803} {"train_loss": -7.178896903991699, "global_step": 201763, "epoch": 4803} {"train_loss": -7.270773887634277, "global_step": 201764, "epoch": 4803} {"train_loss": -7.254087448120117, "global_step": 201765, "epoch": 4803} {"train_loss": -7.260775089263916, "global_step": 201766, "epoch": 4803} {"train_loss": -7.204875469207764, "global_step": 201767, "epoch": 4803, "val_loss": 81333.6328125} {"train_loss": -7.367834568023682, "global_step": 201768, "epoch": 4804} {"train_loss": -7.093922138214111, "global_step": 201769, "epoch": 4804} {"train_loss": -7.2810564041137695, "global_step": 201770, "epoch": 4804} {"train_loss": -7.169532299041748, "global_step": 201771, "epoch": 4804} {"train_loss": -7.222708702087402, "global_step": 201772, "epoch": 4804} {"train_loss": -7.302734375, "global_step": 201773, "epoch": 4804} {"train_loss": -7.139888763427734, "global_step": 201774, "epoch": 4804} {"train_loss": -7.334347724914551, "global_step": 201775, "epoch": 4804} {"train_loss": -7.197414875030518, "global_step": 201776, "epoch": 4804} {"train_loss": -7.173746585845947, "global_step": 201777, "epoch": 4804} {"train_loss": -7.326870918273926, "global_step": 201778, "epoch": 4804} {"train_loss": -7.113886833190918, "global_step": 201779, "epoch": 4804} {"train_loss": -7.1704277992248535, "global_step": 201780, "epoch": 4804} {"train_loss": -7.245424270629883, "global_step": 201781, "epoch": 4804} {"train_loss": -7.054427146911621, "global_step": 201782, "epoch": 4804} {"train_loss": -7.248334884643555, "global_step": 201783, "epoch": 4804} {"train_loss": -7.101160526275635, "global_step": 201784, "epoch": 4804} {"train_loss": -7.312920570373535, "global_step": 201785, "epoch": 4804} {"train_loss": -7.177875995635986, "global_step": 201786, "epoch": 4804} {"train_loss": -7.2596049308776855, "global_step": 201787, "epoch": 4804} {"train_loss": -7.232813358306885, "global_step": 201788, "epoch": 4804} {"train_loss": -7.236937999725342, "global_step": 201789, "epoch": 4804} {"train_loss": -7.224664688110352, "global_step": 201790, "epoch": 4804} {"train_loss": -7.167330741882324, "global_step": 201791, "epoch": 4804} {"train_loss": -7.302491664886475, "global_step": 201792, "epoch": 4804} {"train_loss": -7.126071929931641, "global_step": 201793, "epoch": 4804} {"train_loss": -7.331428527832031, "global_step": 201794, "epoch": 4804} {"train_loss": -7.210903644561768, "global_step": 201795, "epoch": 4804} {"train_loss": -7.204883575439453, "global_step": 201796, "epoch": 4804} {"train_loss": -7.132382392883301, "global_step": 201797, "epoch": 4804} {"train_loss": -7.320361137390137, "global_step": 201798, "epoch": 4804} {"train_loss": -7.207859039306641, "global_step": 201799, "epoch": 4804} {"train_loss": -7.3593034744262695, "global_step": 201800, "epoch": 4804} {"train_loss": -7.263575553894043, "global_step": 201801, "epoch": 4804} {"train_loss": -7.208776950836182, "global_step": 201802, "epoch": 4804} {"train_loss": -7.269659042358398, "global_step": 201803, "epoch": 4804} {"train_loss": -7.27918815612793, "global_step": 201804, "epoch": 4804} {"train_loss": -7.236372947692871, "global_step": 201805, "epoch": 4804} {"train_loss": -7.285716533660889, "global_step": 201806, "epoch": 4804} {"train_loss": -7.286113262176514, "global_step": 201807, "epoch": 4804} {"train_loss": -7.186057090759277, "global_step": 201808, "epoch": 4804} {"train_loss": -7.232608658926828, "global_step": 201809, "epoch": 4804, "val_loss": 81697.6015625} {"train_loss": -7.1494646072387695, "global_step": 201810, "epoch": 4805} {"train_loss": -7.314218521118164, "global_step": 201811, "epoch": 4805} {"train_loss": -7.155921936035156, "global_step": 201812, "epoch": 4805} {"train_loss": -7.10179328918457, "global_step": 201813, "epoch": 4805} {"train_loss": -7.3181962966918945, "global_step": 201814, "epoch": 4805} {"train_loss": -7.089872360229492, "global_step": 201815, "epoch": 4805} {"train_loss": -7.345402717590332, "global_step": 201816, "epoch": 4805} {"train_loss": -7.140939712524414, "global_step": 201817, "epoch": 4805} {"train_loss": -7.1104230880737305, "global_step": 201818, "epoch": 4805} {"train_loss": -7.297696113586426, "global_step": 201819, "epoch": 4805} {"train_loss": -7.058590888977051, "global_step": 201820, "epoch": 4805} {"train_loss": -7.157849311828613, "global_step": 201821, "epoch": 4805} {"train_loss": -7.1368632316589355, "global_step": 201822, "epoch": 4805} {"train_loss": -7.190199851989746, "global_step": 201823, "epoch": 4805} {"train_loss": -7.174726486206055, "global_step": 201824, "epoch": 4805} {"train_loss": -7.181763648986816, "global_step": 201825, "epoch": 4805} {"train_loss": -7.224208831787109, "global_step": 201826, "epoch": 4805} {"train_loss": -7.28115701675415, "global_step": 201827, "epoch": 4805} {"train_loss": -7.134676933288574, "global_step": 201828, "epoch": 4805} {"train_loss": -7.2856926918029785, "global_step": 201829, "epoch": 4805} {"train_loss": -7.2449846267700195, "global_step": 201830, "epoch": 4805} {"train_loss": -7.172423362731934, "global_step": 201831, "epoch": 4805} {"train_loss": -7.209136009216309, "global_step": 201832, "epoch": 4805} {"train_loss": -7.229357719421387, "global_step": 201833, "epoch": 4805} {"train_loss": -7.189737319946289, "global_step": 201834, "epoch": 4805} {"train_loss": -7.202373027801514, "global_step": 201835, "epoch": 4805} {"train_loss": -7.215033531188965, "global_step": 201836, "epoch": 4805} {"train_loss": -7.276442527770996, "global_step": 201837, "epoch": 4805} {"train_loss": -7.205594062805176, "global_step": 201838, "epoch": 4805} {"train_loss": -7.362339496612549, "global_step": 201839, "epoch": 4805} {"train_loss": -7.2705078125, "global_step": 201840, "epoch": 4805} {"train_loss": -7.251810073852539, "global_step": 201841, "epoch": 4805} {"train_loss": -7.351935863494873, "global_step": 201842, "epoch": 4805} {"train_loss": -7.2522664070129395, "global_step": 201843, "epoch": 4805} {"train_loss": -7.156625747680664, "global_step": 201844, "epoch": 4805} {"train_loss": -7.2705841064453125, "global_step": 201845, "epoch": 4805} {"train_loss": -7.343266010284424, "global_step": 201846, "epoch": 4805} {"train_loss": -7.262167930603027, "global_step": 201847, "epoch": 4805} {"train_loss": -7.32182502746582, "global_step": 201848, "epoch": 4805} {"train_loss": -7.322783470153809, "global_step": 201849, "epoch": 4805} {"train_loss": -7.354911804199219, "global_step": 201850, "epoch": 4805} {"train_loss": -7.229932660148258, "global_step": 201851, "epoch": 4805, "val_loss": 81562.78125} {"train_loss": -7.358699321746826, "global_step": 201852, "epoch": 4806} {"train_loss": -7.3749895095825195, "global_step": 201853, "epoch": 4806} {"train_loss": -7.2850446701049805, "global_step": 201854, "epoch": 4806} {"train_loss": -7.3301215171813965, "global_step": 201855, "epoch": 4806} {"train_loss": -7.338131904602051, "global_step": 201856, "epoch": 4806} {"train_loss": -7.399949550628662, "global_step": 201857, "epoch": 4806} {"train_loss": -7.322419166564941, "global_step": 201858, "epoch": 4806} {"train_loss": -7.258808135986328, "global_step": 201859, "epoch": 4806} {"train_loss": -7.275500774383545, "global_step": 201860, "epoch": 4806} {"train_loss": -7.454638957977295, "global_step": 201861, "epoch": 4806} {"train_loss": -7.308090686798096, "global_step": 201862, "epoch": 4806} {"train_loss": -7.425788402557373, "global_step": 201863, "epoch": 4806} {"train_loss": -7.333540916442871, "global_step": 201864, "epoch": 4806} {"train_loss": -7.441789627075195, "global_step": 201865, "epoch": 4806} {"train_loss": -7.428595542907715, "global_step": 201866, "epoch": 4806} {"train_loss": -7.251620292663574, "global_step": 201867, "epoch": 4806} {"train_loss": -7.382942199707031, "global_step": 201868, "epoch": 4806} {"train_loss": -7.315551280975342, "global_step": 201869, "epoch": 4806} {"train_loss": -7.287450790405273, "global_step": 201870, "epoch": 4806} {"train_loss": -7.4044952392578125, "global_step": 201871, "epoch": 4806} {"train_loss": -7.347850799560547, "global_step": 201872, "epoch": 4806} {"train_loss": -7.2674336433410645, "global_step": 201873, "epoch": 4806} {"train_loss": -7.281947135925293, "global_step": 201874, "epoch": 4806} {"train_loss": -7.27419900894165, "global_step": 201875, "epoch": 4806} {"train_loss": -7.355893611907959, "global_step": 201876, "epoch": 4806} {"train_loss": -7.330404758453369, "global_step": 201877, "epoch": 4806} {"train_loss": -7.18403434753418, "global_step": 201878, "epoch": 4806} {"train_loss": -7.279353618621826, "global_step": 201879, "epoch": 4806} {"train_loss": -7.23398494720459, "global_step": 201880, "epoch": 4806} {"train_loss": -7.297940254211426, "global_step": 201881, "epoch": 4806} {"train_loss": -7.184402942657471, "global_step": 201882, "epoch": 4806} {"train_loss": -7.24513053894043, "global_step": 201883, "epoch": 4806} {"train_loss": -7.214112281799316, "global_step": 201884, "epoch": 4806} {"train_loss": -7.351147651672363, "global_step": 201885, "epoch": 4806} {"train_loss": -7.248408317565918, "global_step": 201886, "epoch": 4806} {"train_loss": -7.178323268890381, "global_step": 201887, "epoch": 4806} {"train_loss": -7.325328350067139, "global_step": 201888, "epoch": 4806} {"train_loss": -7.148287773132324, "global_step": 201889, "epoch": 4806} {"train_loss": -7.242305755615234, "global_step": 201890, "epoch": 4806} {"train_loss": -7.297830581665039, "global_step": 201891, "epoch": 4806} {"train_loss": -7.2164835929870605, "global_step": 201892, "epoch": 4806} {"train_loss": -7.3012333029792424, "global_step": 201893, "epoch": 4806, "val_loss": 81647.6875} {"train_loss": -7.171236991882324, "global_step": 201894, "epoch": 4807} {"train_loss": -7.5076518058776855, "global_step": 201895, "epoch": 4807} {"train_loss": -7.295920372009277, "global_step": 201896, "epoch": 4807} {"train_loss": -7.276025295257568, "global_step": 201897, "epoch": 4807} {"train_loss": -7.285314559936523, "global_step": 201898, "epoch": 4807} {"train_loss": -7.283926486968994, "global_step": 201899, "epoch": 4807} {"train_loss": -7.312600612640381, "global_step": 201900, "epoch": 4807} {"train_loss": -7.307550430297852, "global_step": 201901, "epoch": 4807} {"train_loss": -7.295458793640137, "global_step": 201902, "epoch": 4807} {"train_loss": -7.277894973754883, "global_step": 201903, "epoch": 4807} {"train_loss": -7.374883651733398, "global_step": 201904, "epoch": 4807} {"train_loss": -7.174740791320801, "global_step": 201905, "epoch": 4807} {"train_loss": -7.026905059814453, "global_step": 201906, "epoch": 4807} {"train_loss": -7.195897102355957, "global_step": 201907, "epoch": 4807} {"train_loss": -7.128179550170898, "global_step": 201908, "epoch": 4807} {"train_loss": -7.188207626342773, "global_step": 201909, "epoch": 4807} {"train_loss": -7.174158096313477, "global_step": 201910, "epoch": 4807} {"train_loss": -7.161628723144531, "global_step": 201911, "epoch": 4807} {"train_loss": -7.193118572235107, "global_step": 201912, "epoch": 4807} {"train_loss": -7.268922805786133, "global_step": 201913, "epoch": 4807} {"train_loss": -7.238824844360352, "global_step": 201914, "epoch": 4807} {"train_loss": -7.269857406616211, "global_step": 201915, "epoch": 4807} {"train_loss": -7.279361724853516, "global_step": 201916, "epoch": 4807} {"train_loss": -7.231690406799316, "global_step": 201917, "epoch": 4807} {"train_loss": -7.2176713943481445, "global_step": 201918, "epoch": 4807} {"train_loss": -7.284435272216797, "global_step": 201919, "epoch": 4807} {"train_loss": -7.240576267242432, "global_step": 201920, "epoch": 4807} {"train_loss": -7.314663887023926, "global_step": 201921, "epoch": 4807} {"train_loss": -7.244810581207275, "global_step": 201922, "epoch": 4807} {"train_loss": -7.2257843017578125, "global_step": 201923, "epoch": 4807} {"train_loss": -7.285409927368164, "global_step": 201924, "epoch": 4807} {"train_loss": -7.24634313583374, "global_step": 201925, "epoch": 4807} {"train_loss": -7.407054901123047, "global_step": 201926, "epoch": 4807} {"train_loss": -7.341154098510742, "global_step": 201927, "epoch": 4807} {"train_loss": -7.262053489685059, "global_step": 201928, "epoch": 4807} {"train_loss": -7.312777996063232, "global_step": 201929, "epoch": 4807} {"train_loss": -7.241412162780762, "global_step": 201930, "epoch": 4807} {"train_loss": -7.284150123596191, "global_step": 201931, "epoch": 4807} {"train_loss": -7.259038925170898, "global_step": 201932, "epoch": 4807} {"train_loss": -7.37164306640625, "global_step": 201933, "epoch": 4807} {"train_loss": -7.411787033081055, "global_step": 201934, "epoch": 4807} {"train_loss": -7.265996160961333, "global_step": 201935, "epoch": 4807, "val_loss": 81619.1328125} {"train_loss": -7.225135326385498, "global_step": 201936, "epoch": 4808} {"train_loss": -7.293991565704346, "global_step": 201937, "epoch": 4808} {"train_loss": -7.326349258422852, "global_step": 201938, "epoch": 4808} {"train_loss": -7.287464141845703, "global_step": 201939, "epoch": 4808} {"train_loss": -7.333566188812256, "global_step": 201940, "epoch": 4808} {"train_loss": -7.324765682220459, "global_step": 201941, "epoch": 4808} {"train_loss": -7.345014572143555, "global_step": 201942, "epoch": 4808} {"train_loss": -7.262800216674805, "global_step": 201943, "epoch": 4808} {"train_loss": -7.284125804901123, "global_step": 201944, "epoch": 4808} {"train_loss": -7.199954032897949, "global_step": 201945, "epoch": 4808} {"train_loss": -7.410505294799805, "global_step": 201946, "epoch": 4808} {"train_loss": -7.396257400512695, "global_step": 201947, "epoch": 4808} {"train_loss": -7.425929069519043, "global_step": 201948, "epoch": 4808} {"train_loss": -7.342741966247559, "global_step": 201949, "epoch": 4808} {"train_loss": -7.307447910308838, "global_step": 201950, "epoch": 4808} {"train_loss": -7.388660907745361, "global_step": 201951, "epoch": 4808} {"train_loss": -7.271976470947266, "global_step": 201952, "epoch": 4808} {"train_loss": -7.386081695556641, "global_step": 201953, "epoch": 4808} {"train_loss": -7.3087053298950195, "global_step": 201954, "epoch": 4808} {"train_loss": -7.289676666259766, "global_step": 201955, "epoch": 4808} {"train_loss": -7.369658470153809, "global_step": 201956, "epoch": 4808} {"train_loss": -7.300936698913574, "global_step": 201957, "epoch": 4808} {"train_loss": -7.279233932495117, "global_step": 201958, "epoch": 4808} {"train_loss": -7.448298454284668, "global_step": 201959, "epoch": 4808} {"train_loss": -7.329527854919434, "global_step": 201960, "epoch": 4808} {"train_loss": -7.2936553955078125, "global_step": 201961, "epoch": 4808} {"train_loss": -7.339290618896484, "global_step": 201962, "epoch": 4808} {"train_loss": -7.40683650970459, "global_step": 201963, "epoch": 4808} {"train_loss": -7.3218560218811035, "global_step": 201964, "epoch": 4808} {"train_loss": -7.356697082519531, "global_step": 201965, "epoch": 4808} {"train_loss": -7.372927188873291, "global_step": 201966, "epoch": 4808} {"train_loss": -7.304594039916992, "global_step": 201967, "epoch": 4808} {"train_loss": -7.283065319061279, "global_step": 201968, "epoch": 4808} {"train_loss": -7.184186935424805, "global_step": 201969, "epoch": 4808} {"train_loss": -7.293242454528809, "global_step": 201970, "epoch": 4808} {"train_loss": -7.292479515075684, "global_step": 201971, "epoch": 4808} {"train_loss": -7.244744300842285, "global_step": 201972, "epoch": 4808} {"train_loss": -7.408473968505859, "global_step": 201973, "epoch": 4808} {"train_loss": -7.344085693359375, "global_step": 201974, "epoch": 4808} {"train_loss": -7.287730693817139, "global_step": 201975, "epoch": 4808} {"train_loss": -7.293460369110107, "global_step": 201976, "epoch": 4808} {"train_loss": -7.320793583279564, "global_step": 201977, "epoch": 4808, "val_loss": 81578.609375} {"train_loss": -7.271397590637207, "global_step": 201978, "epoch": 4809} {"train_loss": -7.344217300415039, "global_step": 201979, "epoch": 4809} {"train_loss": -7.278116226196289, "global_step": 201980, "epoch": 4809} {"train_loss": -7.310057640075684, "global_step": 201981, "epoch": 4809} {"train_loss": -7.505623817443848, "global_step": 201982, "epoch": 4809} {"train_loss": -7.423124313354492, "global_step": 201983, "epoch": 4809} {"train_loss": -7.3951263427734375, "global_step": 201984, "epoch": 4809} {"train_loss": -7.37148380279541, "global_step": 201985, "epoch": 4809} {"train_loss": -7.398066997528076, "global_step": 201986, "epoch": 4809} {"train_loss": -7.360085487365723, "global_step": 201987, "epoch": 4809} {"train_loss": -7.36054801940918, "global_step": 201988, "epoch": 4809} {"train_loss": -7.3260674476623535, "global_step": 201989, "epoch": 4809} {"train_loss": -7.361907005310059, "global_step": 201990, "epoch": 4809} {"train_loss": -7.415056228637695, "global_step": 201991, "epoch": 4809} {"train_loss": -7.252470970153809, "global_step": 201992, "epoch": 4809} {"train_loss": -7.37465763092041, "global_step": 201993, "epoch": 4809} {"train_loss": -7.286048412322998, "global_step": 201994, "epoch": 4809} {"train_loss": -7.268210411071777, "global_step": 201995, "epoch": 4809} {"train_loss": -7.271963119506836, "global_step": 201996, "epoch": 4809} {"train_loss": -7.246664524078369, "global_step": 201997, "epoch": 4809} {"train_loss": -7.223311424255371, "global_step": 201998, "epoch": 4809} {"train_loss": -7.320890426635742, "global_step": 201999, "epoch": 4809} {"train_loss": -7.308998107910156, "global_step": 202000, "epoch": 4809} {"train_loss": -7.290184020996094, "global_step": 202001, "epoch": 4809} {"train_loss": -7.378469467163086, "global_step": 202002, "epoch": 4809} {"train_loss": -7.330832481384277, "global_step": 202003, "epoch": 4809} {"train_loss": -7.329659461975098, "global_step": 202004, "epoch": 4809} {"train_loss": -7.291814804077148, "global_step": 202005, "epoch": 4809} {"train_loss": -7.410868167877197, "global_step": 202006, "epoch": 4809} {"train_loss": -7.344953536987305, "global_step": 202007, "epoch": 4809} {"train_loss": -7.304059982299805, "global_step": 202008, "epoch": 4809} {"train_loss": -7.291412830352783, "global_step": 202009, "epoch": 4809} {"train_loss": -7.254359722137451, "global_step": 202010, "epoch": 4809} {"train_loss": -7.241793632507324, "global_step": 202011, "epoch": 4809} {"train_loss": -7.234907150268555, "global_step": 202012, "epoch": 4809} {"train_loss": -7.342984199523926, "global_step": 202013, "epoch": 4809} {"train_loss": -7.383511543273926, "global_step": 202014, "epoch": 4809} {"train_loss": -7.2137861251831055, "global_step": 202015, "epoch": 4809} {"train_loss": -7.176520347595215, "global_step": 202016, "epoch": 4809} {"train_loss": -7.374195098876953, "global_step": 202017, "epoch": 4809} {"train_loss": -7.33918571472168, "global_step": 202018, "epoch": 4809} {"train_loss": -7.320549624306815, "global_step": 202019, "epoch": 4809, "val_loss": 81300.4140625} {"train_loss": -7.299149513244629, "global_step": 202020, "epoch": 4810} {"train_loss": -7.226256370544434, "global_step": 202021, "epoch": 4810} {"train_loss": -7.303355693817139, "global_step": 202022, "epoch": 4810} {"train_loss": -7.414398193359375, "global_step": 202023, "epoch": 4810} {"train_loss": -7.282912254333496, "global_step": 202024, "epoch": 4810} {"train_loss": -7.1966023445129395, "global_step": 202025, "epoch": 4810} {"train_loss": -7.257410049438477, "global_step": 202026, "epoch": 4810} {"train_loss": -7.262058734893799, "global_step": 202027, "epoch": 4810} {"train_loss": -7.365256309509277, "global_step": 202028, "epoch": 4810} {"train_loss": -7.306175231933594, "global_step": 202029, "epoch": 4810} {"train_loss": -7.254265785217285, "global_step": 202030, "epoch": 4810} {"train_loss": -7.252247333526611, "global_step": 202031, "epoch": 4810} {"train_loss": -7.248556613922119, "global_step": 202032, "epoch": 4810} {"train_loss": -7.339946746826172, "global_step": 202033, "epoch": 4810} {"train_loss": -7.323400020599365, "global_step": 202034, "epoch": 4810} {"train_loss": -7.2615742683410645, "global_step": 202035, "epoch": 4810} {"train_loss": -7.2996826171875, "global_step": 202036, "epoch": 4810} {"train_loss": -7.2399373054504395, "global_step": 202037, "epoch": 4810} {"train_loss": -7.433570861816406, "global_step": 202038, "epoch": 4810} {"train_loss": -7.319052219390869, "global_step": 202039, "epoch": 4810} {"train_loss": -7.3120880126953125, "global_step": 202040, "epoch": 4810} {"train_loss": -7.291987895965576, "global_step": 202041, "epoch": 4810} {"train_loss": -7.356927871704102, "global_step": 202042, "epoch": 4810} {"train_loss": -7.3748860359191895, "global_step": 202043, "epoch": 4810} {"train_loss": -7.430930137634277, "global_step": 202044, "epoch": 4810} {"train_loss": -7.3134660720825195, "global_step": 202045, "epoch": 4810} {"train_loss": -7.154441833496094, "global_step": 202046, "epoch": 4810} {"train_loss": -7.287330627441406, "global_step": 202047, "epoch": 4810} {"train_loss": -7.127723693847656, "global_step": 202048, "epoch": 4810} {"train_loss": -7.354308128356934, "global_step": 202049, "epoch": 4810} {"train_loss": -7.300350189208984, "global_step": 202050, "epoch": 4810} {"train_loss": -7.008679389953613, "global_step": 202051, "epoch": 4810} {"train_loss": -7.332316875457764, "global_step": 202052, "epoch": 4810} {"train_loss": -7.436816692352295, "global_step": 202053, "epoch": 4810} {"train_loss": -7.3087310791015625, "global_step": 202054, "epoch": 4810} {"train_loss": -7.275471210479736, "global_step": 202055, "epoch": 4810} {"train_loss": -7.351907730102539, "global_step": 202056, "epoch": 4810} {"train_loss": -7.28422737121582, "global_step": 202057, "epoch": 4810} {"train_loss": -7.165024757385254, "global_step": 202058, "epoch": 4810} {"train_loss": -7.305499076843262, "global_step": 202059, "epoch": 4810} {"train_loss": -7.250039100646973, "global_step": 202060, "epoch": 4810} {"train_loss": -7.291011991954985, "global_step": 202061, "epoch": 4810, "val_loss": 81642.6484375} {"train_loss": -7.2795939445495605, "global_step": 202062, "epoch": 4811} {"train_loss": -7.230222702026367, "global_step": 202063, "epoch": 4811} {"train_loss": -7.308717727661133, "global_step": 202064, "epoch": 4811} {"train_loss": -7.268111228942871, "global_step": 202065, "epoch": 4811} {"train_loss": -7.409132957458496, "global_step": 202066, "epoch": 4811} {"train_loss": -7.23222541809082, "global_step": 202067, "epoch": 4811} {"train_loss": -7.298388957977295, "global_step": 202068, "epoch": 4811} {"train_loss": -7.353146076202393, "global_step": 202069, "epoch": 4811} {"train_loss": -7.196713924407959, "global_step": 202070, "epoch": 4811} {"train_loss": -7.296189308166504, "global_step": 202071, "epoch": 4811} {"train_loss": -7.367834568023682, "global_step": 202072, "epoch": 4811} {"train_loss": -7.209931373596191, "global_step": 202073, "epoch": 4811} {"train_loss": -7.275554656982422, "global_step": 202074, "epoch": 4811} {"train_loss": -7.278613567352295, "global_step": 202075, "epoch": 4811} {"train_loss": -7.254110813140869, "global_step": 202076, "epoch": 4811} {"train_loss": -7.245636940002441, "global_step": 202077, "epoch": 4811} {"train_loss": -7.314249515533447, "global_step": 202078, "epoch": 4811} {"train_loss": -7.2961931228637695, "global_step": 202079, "epoch": 4811} {"train_loss": -7.34157657623291, "global_step": 202080, "epoch": 4811} {"train_loss": -7.246614456176758, "global_step": 202081, "epoch": 4811} {"train_loss": -7.296741485595703, "global_step": 202082, "epoch": 4811} {"train_loss": -7.237174987792969, "global_step": 202083, "epoch": 4811} {"train_loss": -7.336254119873047, "global_step": 202084, "epoch": 4811} {"train_loss": -7.349637031555176, "global_step": 202085, "epoch": 4811} {"train_loss": -7.389442443847656, "global_step": 202086, "epoch": 4811} {"train_loss": -7.346079349517822, "global_step": 202087, "epoch": 4811} {"train_loss": -7.34188175201416, "global_step": 202088, "epoch": 4811} {"train_loss": -7.328856468200684, "global_step": 202089, "epoch": 4811} {"train_loss": -7.373620986938477, "global_step": 202090, "epoch": 4811} {"train_loss": -7.178656578063965, "global_step": 202091, "epoch": 4811} {"train_loss": -7.34599494934082, "global_step": 202092, "epoch": 4811} {"train_loss": -7.445148468017578, "global_step": 202093, "epoch": 4811} {"train_loss": -7.426443576812744, "global_step": 202094, "epoch": 4811} {"train_loss": -7.273432731628418, "global_step": 202095, "epoch": 4811} {"train_loss": -7.258942127227783, "global_step": 202096, "epoch": 4811} {"train_loss": -7.342588424682617, "global_step": 202097, "epoch": 4811} {"train_loss": -7.237809181213379, "global_step": 202098, "epoch": 4811} {"train_loss": -7.413635730743408, "global_step": 202099, "epoch": 4811} {"train_loss": -7.249482154846191, "global_step": 202100, "epoch": 4811} {"train_loss": -7.243525505065918, "global_step": 202101, "epoch": 4811} {"train_loss": -7.3508148193359375, "global_step": 202102, "epoch": 4811} {"train_loss": -7.304329134169079, "global_step": 202103, "epoch": 4811, "val_loss": 81826.578125} {"train_loss": -7.302884578704834, "global_step": 202104, "epoch": 4812} {"train_loss": -7.294546604156494, "global_step": 202105, "epoch": 4812} {"train_loss": -7.262789249420166, "global_step": 202106, "epoch": 4812} {"train_loss": -7.267399787902832, "global_step": 202107, "epoch": 4812} {"train_loss": -7.306244373321533, "global_step": 202108, "epoch": 4812} {"train_loss": -7.054948806762695, "global_step": 202109, "epoch": 4812} {"train_loss": -7.281513690948486, "global_step": 202110, "epoch": 4812} {"train_loss": -7.243461608886719, "global_step": 202111, "epoch": 4812} {"train_loss": -7.427184581756592, "global_step": 202112, "epoch": 4812} {"train_loss": -7.243456840515137, "global_step": 202113, "epoch": 4812} {"train_loss": -7.310290336608887, "global_step": 202114, "epoch": 4812} {"train_loss": -7.372900485992432, "global_step": 202115, "epoch": 4812} {"train_loss": -7.238804340362549, "global_step": 202116, "epoch": 4812} {"train_loss": -7.246193885803223, "global_step": 202117, "epoch": 4812} {"train_loss": -7.321678161621094, "global_step": 202118, "epoch": 4812} {"train_loss": -7.144315242767334, "global_step": 202119, "epoch": 4812} {"train_loss": -7.234133243560791, "global_step": 202120, "epoch": 4812} {"train_loss": -7.31204891204834, "global_step": 202121, "epoch": 4812} {"train_loss": -6.995505332946777, "global_step": 202122, "epoch": 4812} {"train_loss": -7.328310489654541, "global_step": 202123, "epoch": 4812} {"train_loss": -7.264813423156738, "global_step": 202124, "epoch": 4812} {"train_loss": -7.363836288452148, "global_step": 202125, "epoch": 4812} {"train_loss": -7.39400577545166, "global_step": 202126, "epoch": 4812} {"train_loss": -7.380572319030762, "global_step": 202127, "epoch": 4812} {"train_loss": -7.391298294067383, "global_step": 202128, "epoch": 4812} {"train_loss": -7.354459762573242, "global_step": 202129, "epoch": 4812} {"train_loss": -7.321773052215576, "global_step": 202130, "epoch": 4812} {"train_loss": -7.324408531188965, "global_step": 202131, "epoch": 4812} {"train_loss": -7.301023483276367, "global_step": 202132, "epoch": 4812} {"train_loss": -7.340299606323242, "global_step": 202133, "epoch": 4812} {"train_loss": -7.397155284881592, "global_step": 202134, "epoch": 4812} {"train_loss": -7.453274726867676, "global_step": 202135, "epoch": 4812} {"train_loss": -7.36231803894043, "global_step": 202136, "epoch": 4812} {"train_loss": -7.439210891723633, "global_step": 202137, "epoch": 4812} {"train_loss": -7.469922065734863, "global_step": 202138, "epoch": 4812} {"train_loss": -7.33571195602417, "global_step": 202139, "epoch": 4812} {"train_loss": -7.397297382354736, "global_step": 202140, "epoch": 4812} {"train_loss": -7.38017463684082, "global_step": 202141, "epoch": 4812} {"train_loss": -7.444230079650879, "global_step": 202142, "epoch": 4812} {"train_loss": -7.260218620300293, "global_step": 202143, "epoch": 4812} {"train_loss": -7.324613094329834, "global_step": 202144, "epoch": 4812} {"train_loss": -7.313540663037982, "global_step": 202145, "epoch": 4812, "val_loss": 81617.7890625} {"train_loss": -7.45257043838501, "global_step": 202146, "epoch": 4813} {"train_loss": -7.247917175292969, "global_step": 202147, "epoch": 4813} {"train_loss": -7.253016471862793, "global_step": 202148, "epoch": 4813} {"train_loss": -7.392947196960449, "global_step": 202149, "epoch": 4813} {"train_loss": -7.243575096130371, "global_step": 202150, "epoch": 4813} {"train_loss": -7.369110107421875, "global_step": 202151, "epoch": 4813} {"train_loss": -7.22991943359375, "global_step": 202152, "epoch": 4813} {"train_loss": -7.1595354080200195, "global_step": 202153, "epoch": 4813} {"train_loss": -7.300702095031738, "global_step": 202154, "epoch": 4813} {"train_loss": -7.247703552246094, "global_step": 202155, "epoch": 4813} {"train_loss": -7.177296161651611, "global_step": 202156, "epoch": 4813} {"train_loss": -7.2271647453308105, "global_step": 202157, "epoch": 4813} {"train_loss": -7.326948165893555, "global_step": 202158, "epoch": 4813} {"train_loss": -7.068195343017578, "global_step": 202159, "epoch": 4813} {"train_loss": -7.262801647186279, "global_step": 202160, "epoch": 4813} {"train_loss": -7.189115524291992, "global_step": 202161, "epoch": 4813} {"train_loss": -7.272979736328125, "global_step": 202162, "epoch": 4813} {"train_loss": -7.216012001037598, "global_step": 202163, "epoch": 4813} {"train_loss": -7.14159631729126, "global_step": 202164, "epoch": 4813} {"train_loss": -7.155508518218994, "global_step": 202165, "epoch": 4813} {"train_loss": -7.189206123352051, "global_step": 202166, "epoch": 4813} {"train_loss": -7.331355094909668, "global_step": 202167, "epoch": 4813} {"train_loss": -7.240569114685059, "global_step": 202168, "epoch": 4813} {"train_loss": -7.164209365844727, "global_step": 202169, "epoch": 4813} {"train_loss": -7.351845741271973, "global_step": 202170, "epoch": 4813} {"train_loss": -7.33328914642334, "global_step": 202171, "epoch": 4813} {"train_loss": -7.25493860244751, "global_step": 202172, "epoch": 4813} {"train_loss": -7.400353908538818, "global_step": 202173, "epoch": 4813} {"train_loss": -7.2581658363342285, "global_step": 202174, "epoch": 4813} {"train_loss": -7.267839431762695, "global_step": 202175, "epoch": 4813} {"train_loss": -7.182649612426758, "global_step": 202176, "epoch": 4813} {"train_loss": -7.344936370849609, "global_step": 202177, "epoch": 4813} {"train_loss": -7.369646072387695, "global_step": 202178, "epoch": 4813} {"train_loss": -7.21769380569458, "global_step": 202179, "epoch": 4813} {"train_loss": -7.354879379272461, "global_step": 202180, "epoch": 4813} {"train_loss": -7.277260780334473, "global_step": 202181, "epoch": 4813} {"train_loss": -7.386222839355469, "global_step": 202182, "epoch": 4813} {"train_loss": -7.28752326965332, "global_step": 202183, "epoch": 4813} {"train_loss": -7.288207054138184, "global_step": 202184, "epoch": 4813} {"train_loss": -7.321228504180908, "global_step": 202185, "epoch": 4813} {"train_loss": -7.291684627532959, "global_step": 202186, "epoch": 4813} {"train_loss": -7.26992468606858, "global_step": 202187, "epoch": 4813, "val_loss": 81603.6796875} {"train_loss": -7.341506004333496, "global_step": 202188, "epoch": 4814} {"train_loss": -7.152414321899414, "global_step": 202189, "epoch": 4814} {"train_loss": -7.144800186157227, "global_step": 202190, "epoch": 4814} {"train_loss": -7.304302215576172, "global_step": 202191, "epoch": 4814} {"train_loss": -7.275812149047852, "global_step": 202192, "epoch": 4814} {"train_loss": -7.205368518829346, "global_step": 202193, "epoch": 4814} {"train_loss": -7.172817707061768, "global_step": 202194, "epoch": 4814} {"train_loss": -7.258803367614746, "global_step": 202195, "epoch": 4814} {"train_loss": -7.090152740478516, "global_step": 202196, "epoch": 4814} {"train_loss": -7.28282356262207, "global_step": 202197, "epoch": 4814} {"train_loss": -7.322473049163818, "global_step": 202198, "epoch": 4814} {"train_loss": -7.137094020843506, "global_step": 202199, "epoch": 4814} {"train_loss": -7.199134826660156, "global_step": 202200, "epoch": 4814} {"train_loss": -7.1870880126953125, "global_step": 202201, "epoch": 4814} {"train_loss": -7.219920635223389, "global_step": 202202, "epoch": 4814} {"train_loss": -7.353280067443848, "global_step": 202203, "epoch": 4814} {"train_loss": -7.301695823669434, "global_step": 202204, "epoch": 4814} {"train_loss": -7.219821929931641, "global_step": 202205, "epoch": 4814} {"train_loss": -7.243850231170654, "global_step": 202206, "epoch": 4814} {"train_loss": -7.242100238800049, "global_step": 202207, "epoch": 4814} {"train_loss": -7.336569786071777, "global_step": 202208, "epoch": 4814} {"train_loss": -7.269227981567383, "global_step": 202209, "epoch": 4814} {"train_loss": -7.413514137268066, "global_step": 202210, "epoch": 4814} {"train_loss": -7.368603706359863, "global_step": 202211, "epoch": 4814} {"train_loss": -7.161322593688965, "global_step": 202212, "epoch": 4814} {"train_loss": -7.3549346923828125, "global_step": 202213, "epoch": 4814} {"train_loss": -7.150142669677734, "global_step": 202214, "epoch": 4814} {"train_loss": -7.099736213684082, "global_step": 202215, "epoch": 4814} {"train_loss": -7.192770004272461, "global_step": 202216, "epoch": 4814} {"train_loss": -7.168584823608398, "global_step": 202217, "epoch": 4814} {"train_loss": -7.112488746643066, "global_step": 202218, "epoch": 4814} {"train_loss": -7.272085189819336, "global_step": 202219, "epoch": 4814} {"train_loss": -7.185593605041504, "global_step": 202220, "epoch": 4814} {"train_loss": -7.333255767822266, "global_step": 202221, "epoch": 4814} {"train_loss": -7.335973262786865, "global_step": 202222, "epoch": 4814} {"train_loss": -7.229074001312256, "global_step": 202223, "epoch": 4814} {"train_loss": -7.291818618774414, "global_step": 202224, "epoch": 4814} {"train_loss": -7.302692413330078, "global_step": 202225, "epoch": 4814} {"train_loss": -7.198771953582764, "global_step": 202226, "epoch": 4814} {"train_loss": -7.320184707641602, "global_step": 202227, "epoch": 4814} {"train_loss": -7.253910064697266, "global_step": 202228, "epoch": 4814} {"train_loss": -7.244208994365874, "global_step": 202229, "epoch": 4814, "val_loss": 81515.59375} {"train_loss": -7.241825103759766, "global_step": 202230, "epoch": 4815} {"train_loss": -7.158386707305908, "global_step": 202231, "epoch": 4815} {"train_loss": -7.256214141845703, "global_step": 202232, "epoch": 4815} {"train_loss": -7.212488174438477, "global_step": 202233, "epoch": 4815} {"train_loss": -7.298501968383789, "global_step": 202234, "epoch": 4815} {"train_loss": -7.263493537902832, "global_step": 202235, "epoch": 4815} {"train_loss": -7.20744514465332, "global_step": 202236, "epoch": 4815} {"train_loss": -7.1941070556640625, "global_step": 202237, "epoch": 4815} {"train_loss": -7.193011283874512, "global_step": 202238, "epoch": 4815} {"train_loss": -7.341968536376953, "global_step": 202239, "epoch": 4815} {"train_loss": -7.200508117675781, "global_step": 202240, "epoch": 4815} {"train_loss": -7.115316390991211, "global_step": 202241, "epoch": 4815} {"train_loss": -7.398429870605469, "global_step": 202242, "epoch": 4815} {"train_loss": -7.30438232421875, "global_step": 202243, "epoch": 4815} {"train_loss": -7.3141350746154785, "global_step": 202244, "epoch": 4815} {"train_loss": -7.298424243927002, "global_step": 202245, "epoch": 4815} {"train_loss": -7.221490383148193, "global_step": 202246, "epoch": 4815} {"train_loss": -7.341984748840332, "global_step": 202247, "epoch": 4815} {"train_loss": -7.261898040771484, "global_step": 202248, "epoch": 4815} {"train_loss": -7.347869396209717, "global_step": 202249, "epoch": 4815} {"train_loss": -7.21909236907959, "global_step": 202250, "epoch": 4815} {"train_loss": -7.31927490234375, "global_step": 202251, "epoch": 4815} {"train_loss": -7.29624605178833, "global_step": 202252, "epoch": 4815} {"train_loss": -7.264793395996094, "global_step": 202253, "epoch": 4815} {"train_loss": -7.2285919189453125, "global_step": 202254, "epoch": 4815} {"train_loss": -7.24988317489624, "global_step": 202255, "epoch": 4815} {"train_loss": -7.428267478942871, "global_step": 202256, "epoch": 4815} {"train_loss": -7.215757846832275, "global_step": 202257, "epoch": 4815} {"train_loss": -7.307310581207275, "global_step": 202258, "epoch": 4815} {"train_loss": -7.470015525817871, "global_step": 202259, "epoch": 4815} {"train_loss": -7.330843448638916, "global_step": 202260, "epoch": 4815} {"train_loss": -7.309803485870361, "global_step": 202261, "epoch": 4815} {"train_loss": -7.395473480224609, "global_step": 202262, "epoch": 4815} {"train_loss": -7.343808650970459, "global_step": 202263, "epoch": 4815} {"train_loss": -7.217029094696045, "global_step": 202264, "epoch": 4815} {"train_loss": -7.381925106048584, "global_step": 202265, "epoch": 4815} {"train_loss": -7.298590660095215, "global_step": 202266, "epoch": 4815} {"train_loss": -7.243653297424316, "global_step": 202267, "epoch": 4815} {"train_loss": -7.391988754272461, "global_step": 202268, "epoch": 4815} {"train_loss": -7.329560279846191, "global_step": 202269, "epoch": 4815} {"train_loss": -7.341939926147461, "global_step": 202270, "epoch": 4815} {"train_loss": -7.287047125044323, "global_step": 202271, "epoch": 4815, "val_loss": 81699.375} {"train_loss": -7.287034034729004, "global_step": 202272, "epoch": 4816} {"train_loss": -7.298805236816406, "global_step": 202273, "epoch": 4816} {"train_loss": -7.404214382171631, "global_step": 202274, "epoch": 4816} {"train_loss": -7.31161642074585, "global_step": 202275, "epoch": 4816} {"train_loss": -7.1747331619262695, "global_step": 202276, "epoch": 4816} {"train_loss": -7.388455867767334, "global_step": 202277, "epoch": 4816} {"train_loss": -7.368552207946777, "global_step": 202278, "epoch": 4816} {"train_loss": -7.272441387176514, "global_step": 202279, "epoch": 4816} {"train_loss": -7.355829238891602, "global_step": 202280, "epoch": 4816} {"train_loss": -7.380983352661133, "global_step": 202281, "epoch": 4816} {"train_loss": -7.271296501159668, "global_step": 202282, "epoch": 4816} {"train_loss": -7.320908069610596, "global_step": 202283, "epoch": 4816} {"train_loss": -7.389573097229004, "global_step": 202284, "epoch": 4816} {"train_loss": -7.257477760314941, "global_step": 202285, "epoch": 4816} {"train_loss": -7.347260475158691, "global_step": 202286, "epoch": 4816} {"train_loss": -7.253155708312988, "global_step": 202287, "epoch": 4816} {"train_loss": -7.405787944793701, "global_step": 202288, "epoch": 4816} {"train_loss": -7.100374221801758, "global_step": 202289, "epoch": 4816} {"train_loss": -7.242062568664551, "global_step": 202290, "epoch": 4816} {"train_loss": -7.3021674156188965, "global_step": 202291, "epoch": 4816} {"train_loss": -7.241846084594727, "global_step": 202292, "epoch": 4816} {"train_loss": -7.226733207702637, "global_step": 202293, "epoch": 4816} {"train_loss": -7.268280506134033, "global_step": 202294, "epoch": 4816} {"train_loss": -7.206303119659424, "global_step": 202295, "epoch": 4816} {"train_loss": -7.202718257904053, "global_step": 202296, "epoch": 4816} {"train_loss": -7.198311805725098, "global_step": 202297, "epoch": 4816} {"train_loss": -7.310292720794678, "global_step": 202298, "epoch": 4816} {"train_loss": -7.266959190368652, "global_step": 202299, "epoch": 4816} {"train_loss": -7.400518417358398, "global_step": 202300, "epoch": 4816} {"train_loss": -7.304394721984863, "global_step": 202301, "epoch": 4816} {"train_loss": -7.423305034637451, "global_step": 202302, "epoch": 4816} {"train_loss": -7.128565788269043, "global_step": 202303, "epoch": 4816} {"train_loss": -7.230475425720215, "global_step": 202304, "epoch": 4816} {"train_loss": -7.340770721435547, "global_step": 202305, "epoch": 4816} {"train_loss": -7.185805320739746, "global_step": 202306, "epoch": 4816} {"train_loss": -7.180654048919678, "global_step": 202307, "epoch": 4816} {"train_loss": -7.299556255340576, "global_step": 202308, "epoch": 4816} {"train_loss": -7.428182601928711, "global_step": 202309, "epoch": 4816} {"train_loss": -7.3213210105896, "global_step": 202310, "epoch": 4816} {"train_loss": -7.324003219604492, "global_step": 202311, "epoch": 4816} {"train_loss": -7.351704120635986, "global_step": 202312, "epoch": 4816} {"train_loss": -7.292684725352696, "global_step": 202313, "epoch": 4816, "val_loss": 81544.5390625} {"train_loss": -7.355138301849365, "global_step": 202314, "epoch": 4817} {"train_loss": -7.292061805725098, "global_step": 202315, "epoch": 4817} {"train_loss": -7.32375431060791, "global_step": 202316, "epoch": 4817} {"train_loss": -7.331155776977539, "global_step": 202317, "epoch": 4817} {"train_loss": -7.436956882476807, "global_step": 202318, "epoch": 4817} {"train_loss": -7.25325870513916, "global_step": 202319, "epoch": 4817} {"train_loss": -7.363407135009766, "global_step": 202320, "epoch": 4817} {"train_loss": -7.31044864654541, "global_step": 202321, "epoch": 4817} {"train_loss": -7.370438575744629, "global_step": 202322, "epoch": 4817} {"train_loss": -7.310209274291992, "global_step": 202323, "epoch": 4817} {"train_loss": -7.390857696533203, "global_step": 202324, "epoch": 4817} {"train_loss": -7.382229328155518, "global_step": 202325, "epoch": 4817} {"train_loss": -7.340527534484863, "global_step": 202326, "epoch": 4817} {"train_loss": -7.361641883850098, "global_step": 202327, "epoch": 4817} {"train_loss": -7.33744478225708, "global_step": 202328, "epoch": 4817} {"train_loss": -7.34945011138916, "global_step": 202329, "epoch": 4817} {"train_loss": -7.30142068862915, "global_step": 202330, "epoch": 4817} {"train_loss": -7.442939758300781, "global_step": 202331, "epoch": 4817} {"train_loss": -7.250749588012695, "global_step": 202332, "epoch": 4817} {"train_loss": -7.376720428466797, "global_step": 202333, "epoch": 4817} {"train_loss": -7.293536186218262, "global_step": 202334, "epoch": 4817} {"train_loss": -7.279611110687256, "global_step": 202335, "epoch": 4817} {"train_loss": -7.346863269805908, "global_step": 202336, "epoch": 4817} {"train_loss": -7.227389812469482, "global_step": 202337, "epoch": 4817} {"train_loss": -7.296062469482422, "global_step": 202338, "epoch": 4817} {"train_loss": -7.08620023727417, "global_step": 202339, "epoch": 4817} {"train_loss": -7.326471328735352, "global_step": 202340, "epoch": 4817} {"train_loss": -7.337867259979248, "global_step": 202341, "epoch": 4817} {"train_loss": -7.286877632141113, "global_step": 202342, "epoch": 4817} {"train_loss": -7.352705001831055, "global_step": 202343, "epoch": 4817} {"train_loss": -7.2524261474609375, "global_step": 202344, "epoch": 4817} {"train_loss": -7.231104373931885, "global_step": 202345, "epoch": 4817} {"train_loss": -7.304147720336914, "global_step": 202346, "epoch": 4817} {"train_loss": -7.373321056365967, "global_step": 202347, "epoch": 4817} {"train_loss": -7.319610118865967, "global_step": 202348, "epoch": 4817} {"train_loss": -7.372226715087891, "global_step": 202349, "epoch": 4817} {"train_loss": -7.413361549377441, "global_step": 202350, "epoch": 4817} {"train_loss": -7.373522758483887, "global_step": 202351, "epoch": 4817} {"train_loss": -7.363295555114746, "global_step": 202352, "epoch": 4817} {"train_loss": -7.271527290344238, "global_step": 202353, "epoch": 4817} {"train_loss": -7.243512153625488, "global_step": 202354, "epoch": 4817} {"train_loss": -7.323486907141549, "global_step": 202355, "epoch": 4817, "val_loss": 81530.4375} {"train_loss": -7.268685817718506, "global_step": 202356, "epoch": 4818} {"train_loss": -7.317758560180664, "global_step": 202357, "epoch": 4818} {"train_loss": -7.313169479370117, "global_step": 202358, "epoch": 4818} {"train_loss": -7.510902404785156, "global_step": 202359, "epoch": 4818} {"train_loss": -7.343111038208008, "global_step": 202360, "epoch": 4818} {"train_loss": -7.230250358581543, "global_step": 202361, "epoch": 4818} {"train_loss": -7.433346748352051, "global_step": 202362, "epoch": 4818} {"train_loss": -7.3056817054748535, "global_step": 202363, "epoch": 4818} {"train_loss": -7.386153221130371, "global_step": 202364, "epoch": 4818} {"train_loss": -7.443521022796631, "global_step": 202365, "epoch": 4818} {"train_loss": -7.344976902008057, "global_step": 202366, "epoch": 4818} {"train_loss": -7.393826484680176, "global_step": 202367, "epoch": 4818} {"train_loss": -7.301362037658691, "global_step": 202368, "epoch": 4818} {"train_loss": -7.392188549041748, "global_step": 202369, "epoch": 4818} {"train_loss": -7.344876289367676, "global_step": 202370, "epoch": 4818} {"train_loss": -7.378669738769531, "global_step": 202371, "epoch": 4818} {"train_loss": -7.3587493896484375, "global_step": 202372, "epoch": 4818} {"train_loss": -7.335611343383789, "global_step": 202373, "epoch": 4818} {"train_loss": -7.400035858154297, "global_step": 202374, "epoch": 4818} {"train_loss": -7.316226005554199, "global_step": 202375, "epoch": 4818} {"train_loss": -7.293978691101074, "global_step": 202376, "epoch": 4818} {"train_loss": -7.329567909240723, "global_step": 202377, "epoch": 4818} {"train_loss": -7.364197731018066, "global_step": 202378, "epoch": 4818} {"train_loss": -7.404928684234619, "global_step": 202379, "epoch": 4818} {"train_loss": -7.31290864944458, "global_step": 202380, "epoch": 4818} {"train_loss": -7.315280914306641, "global_step": 202381, "epoch": 4818} {"train_loss": -7.2420654296875, "global_step": 202382, "epoch": 4818} {"train_loss": -7.421820163726807, "global_step": 202383, "epoch": 4818} {"train_loss": -7.120302677154541, "global_step": 202384, "epoch": 4818} {"train_loss": -7.213245391845703, "global_step": 202385, "epoch": 4818} {"train_loss": -7.340358734130859, "global_step": 202386, "epoch": 4818} {"train_loss": -7.371849060058594, "global_step": 202387, "epoch": 4818} {"train_loss": -7.2954559326171875, "global_step": 202388, "epoch": 4818} {"train_loss": -7.351849555969238, "global_step": 202389, "epoch": 4818} {"train_loss": -7.237529277801514, "global_step": 202390, "epoch": 4818} {"train_loss": -7.290589332580566, "global_step": 202391, "epoch": 4818} {"train_loss": -7.330015659332275, "global_step": 202392, "epoch": 4818} {"train_loss": -7.363130569458008, "global_step": 202393, "epoch": 4818} {"train_loss": -7.330431938171387, "global_step": 202394, "epoch": 4818} {"train_loss": -7.27137565612793, "global_step": 202395, "epoch": 4818} {"train_loss": -7.35659122467041, "global_step": 202396, "epoch": 4818} {"train_loss": -7.3311846142723445, "global_step": 202397, "epoch": 4818, "val_loss": 81389.234375} {"train_loss": -7.384917259216309, "global_step": 202398, "epoch": 4819} {"train_loss": -7.262580871582031, "global_step": 202399, "epoch": 4819} {"train_loss": -7.346147537231445, "global_step": 202400, "epoch": 4819} {"train_loss": -7.293380260467529, "global_step": 202401, "epoch": 4819} {"train_loss": -7.358095169067383, "global_step": 202402, "epoch": 4819} {"train_loss": -7.284051895141602, "global_step": 202403, "epoch": 4819} {"train_loss": -7.311219215393066, "global_step": 202404, "epoch": 4819} {"train_loss": -7.387192726135254, "global_step": 202405, "epoch": 4819} {"train_loss": -7.346219062805176, "global_step": 202406, "epoch": 4819} {"train_loss": -7.259369850158691, "global_step": 202407, "epoch": 4819} {"train_loss": -7.318533420562744, "global_step": 202408, "epoch": 4819} {"train_loss": -7.36428165435791, "global_step": 202409, "epoch": 4819} {"train_loss": -7.369429111480713, "global_step": 202410, "epoch": 4819} {"train_loss": -7.3361663818359375, "global_step": 202411, "epoch": 4819} {"train_loss": -7.3098626136779785, "global_step": 202412, "epoch": 4819} {"train_loss": -7.349909782409668, "global_step": 202413, "epoch": 4819} {"train_loss": -7.32520866394043, "global_step": 202414, "epoch": 4819} {"train_loss": -7.395666122436523, "global_step": 202415, "epoch": 4819} {"train_loss": -7.366920471191406, "global_step": 202416, "epoch": 4819} {"train_loss": -7.250424861907959, "global_step": 202417, "epoch": 4819} {"train_loss": -7.176418781280518, "global_step": 202418, "epoch": 4819} {"train_loss": -7.284233570098877, "global_step": 202419, "epoch": 4819} {"train_loss": -7.307521820068359, "global_step": 202420, "epoch": 4819} {"train_loss": -7.391735553741455, "global_step": 202421, "epoch": 4819} {"train_loss": -7.348666667938232, "global_step": 202422, "epoch": 4819} {"train_loss": -7.386284828186035, "global_step": 202423, "epoch": 4819} {"train_loss": -7.333400249481201, "global_step": 202424, "epoch": 4819} {"train_loss": -7.345071792602539, "global_step": 202425, "epoch": 4819} {"train_loss": -7.207524299621582, "global_step": 202426, "epoch": 4819} {"train_loss": -7.312148094177246, "global_step": 202427, "epoch": 4819} {"train_loss": -7.349177837371826, "global_step": 202428, "epoch": 4819} {"train_loss": -7.297109603881836, "global_step": 202429, "epoch": 4819} {"train_loss": -7.354795455932617, "global_step": 202430, "epoch": 4819} {"train_loss": -7.334746360778809, "global_step": 202431, "epoch": 4819} {"train_loss": -7.3222761154174805, "global_step": 202432, "epoch": 4819} {"train_loss": -7.339229106903076, "global_step": 202433, "epoch": 4819} {"train_loss": -7.399359703063965, "global_step": 202434, "epoch": 4819} {"train_loss": -7.227244853973389, "global_step": 202435, "epoch": 4819} {"train_loss": -7.233854293823242, "global_step": 202436, "epoch": 4819} {"train_loss": -7.198446273803711, "global_step": 202437, "epoch": 4819} {"train_loss": -7.309824466705322, "global_step": 202438, "epoch": 4819} {"train_loss": -7.318267686026437, "global_step": 202439, "epoch": 4819, "val_loss": 81798.2421875} {"train_loss": -7.279336929321289, "global_step": 202440, "epoch": 4820} {"train_loss": -7.191620826721191, "global_step": 202441, "epoch": 4820} {"train_loss": -7.392775535583496, "global_step": 202442, "epoch": 4820} {"train_loss": -7.318312644958496, "global_step": 202443, "epoch": 4820} {"train_loss": -7.191037178039551, "global_step": 202444, "epoch": 4820} {"train_loss": -7.297975540161133, "global_step": 202445, "epoch": 4820} {"train_loss": -7.19005012512207, "global_step": 202446, "epoch": 4820} {"train_loss": -7.369686126708984, "global_step": 202447, "epoch": 4820} {"train_loss": -7.296443462371826, "global_step": 202448, "epoch": 4820} {"train_loss": -7.349876403808594, "global_step": 202449, "epoch": 4820} {"train_loss": -7.262877464294434, "global_step": 202450, "epoch": 4820} {"train_loss": -7.374948501586914, "global_step": 202451, "epoch": 4820} {"train_loss": -7.249711513519287, "global_step": 202452, "epoch": 4820} {"train_loss": -7.41988468170166, "global_step": 202453, "epoch": 4820} {"train_loss": -7.365555763244629, "global_step": 202454, "epoch": 4820} {"train_loss": -7.288366794586182, "global_step": 202455, "epoch": 4820} {"train_loss": -7.3201189041137695, "global_step": 202456, "epoch": 4820} {"train_loss": -7.189539909362793, "global_step": 202457, "epoch": 4820} {"train_loss": -7.281199932098389, "global_step": 202458, "epoch": 4820} {"train_loss": -7.405343055725098, "global_step": 202459, "epoch": 4820} {"train_loss": -7.353043556213379, "global_step": 202460, "epoch": 4820} {"train_loss": -7.290938377380371, "global_step": 202461, "epoch": 4820} {"train_loss": -7.381917476654053, "global_step": 202462, "epoch": 4820} {"train_loss": -7.353907108306885, "global_step": 202463, "epoch": 4820} {"train_loss": -7.380879878997803, "global_step": 202464, "epoch": 4820} {"train_loss": -7.217012405395508, "global_step": 202465, "epoch": 4820} {"train_loss": -7.310993194580078, "global_step": 202466, "epoch": 4820} {"train_loss": -7.23261833190918, "global_step": 202467, "epoch": 4820} {"train_loss": -7.141948223114014, "global_step": 202468, "epoch": 4820} {"train_loss": -7.308343887329102, "global_step": 202469, "epoch": 4820} {"train_loss": -7.297063827514648, "global_step": 202470, "epoch": 4820} {"train_loss": -7.1202216148376465, "global_step": 202471, "epoch": 4820} {"train_loss": -7.229123592376709, "global_step": 202472, "epoch": 4820} {"train_loss": -7.171721458435059, "global_step": 202473, "epoch": 4820} {"train_loss": -7.329505920410156, "global_step": 202474, "epoch": 4820} {"train_loss": -7.2745866775512695, "global_step": 202475, "epoch": 4820} {"train_loss": -7.217731475830078, "global_step": 202476, "epoch": 4820} {"train_loss": -7.362748622894287, "global_step": 202477, "epoch": 4820} {"train_loss": -7.181080341339111, "global_step": 202478, "epoch": 4820} {"train_loss": -7.362871170043945, "global_step": 202479, "epoch": 4820} {"train_loss": -7.300112247467041, "global_step": 202480, "epoch": 4820} {"train_loss": -7.28862038112822, "global_step": 202481, "epoch": 4820, "val_loss": 81629.328125} {"train_loss": -7.2736663818359375, "global_step": 202482, "epoch": 4821} {"train_loss": -7.322249412536621, "global_step": 202483, "epoch": 4821} {"train_loss": -7.237357139587402, "global_step": 202484, "epoch": 4821} {"train_loss": -7.353877544403076, "global_step": 202485, "epoch": 4821} {"train_loss": -7.255646228790283, "global_step": 202486, "epoch": 4821} {"train_loss": -7.222357749938965, "global_step": 202487, "epoch": 4821} {"train_loss": -7.363801002502441, "global_step": 202488, "epoch": 4821} {"train_loss": -7.345234394073486, "global_step": 202489, "epoch": 4821} {"train_loss": -7.162633895874023, "global_step": 202490, "epoch": 4821} {"train_loss": -7.207642555236816, "global_step": 202491, "epoch": 4821} {"train_loss": -7.3275299072265625, "global_step": 202492, "epoch": 4821} {"train_loss": -7.26547908782959, "global_step": 202493, "epoch": 4821} {"train_loss": -7.235866546630859, "global_step": 202494, "epoch": 4821} {"train_loss": -7.376955986022949, "global_step": 202495, "epoch": 4821} {"train_loss": -7.114412784576416, "global_step": 202496, "epoch": 4821} {"train_loss": -7.195491790771484, "global_step": 202497, "epoch": 4821} {"train_loss": -7.261778354644775, "global_step": 202498, "epoch": 4821} {"train_loss": -7.194041728973389, "global_step": 202499, "epoch": 4821} {"train_loss": -7.227293968200684, "global_step": 202500, "epoch": 4821} {"train_loss": -7.183547019958496, "global_step": 202501, "epoch": 4821} {"train_loss": -7.189835548400879, "global_step": 202502, "epoch": 4821} {"train_loss": -7.257717132568359, "global_step": 202503, "epoch": 4821} {"train_loss": -7.219595909118652, "global_step": 202504, "epoch": 4821} {"train_loss": -7.240682601928711, "global_step": 202505, "epoch": 4821} {"train_loss": -7.353908061981201, "global_step": 202506, "epoch": 4821} {"train_loss": -7.240972995758057, "global_step": 202507, "epoch": 4821} {"train_loss": -7.28459358215332, "global_step": 202508, "epoch": 4821} {"train_loss": -7.396090507507324, "global_step": 202509, "epoch": 4821} {"train_loss": -7.223026752471924, "global_step": 202510, "epoch": 4821} {"train_loss": -7.202902793884277, "global_step": 202511, "epoch": 4821} {"train_loss": -7.390181541442871, "global_step": 202512, "epoch": 4821} {"train_loss": -7.366065502166748, "global_step": 202513, "epoch": 4821} {"train_loss": -7.41858434677124, "global_step": 202514, "epoch": 4821} {"train_loss": -7.381704330444336, "global_step": 202515, "epoch": 4821} {"train_loss": -7.359589099884033, "global_step": 202516, "epoch": 4821} {"train_loss": -7.29774284362793, "global_step": 202517, "epoch": 4821} {"train_loss": -7.229388236999512, "global_step": 202518, "epoch": 4821} {"train_loss": -7.199761390686035, "global_step": 202519, "epoch": 4821} {"train_loss": -7.350091934204102, "global_step": 202520, "epoch": 4821} {"train_loss": -7.147587776184082, "global_step": 202521, "epoch": 4821} {"train_loss": -7.244081974029541, "global_step": 202522, "epoch": 4821} {"train_loss": -7.271614347185407, "global_step": 202523, "epoch": 4821, "val_loss": 81871.4140625} {"train_loss": -7.283591270446777, "global_step": 202524, "epoch": 4822} {"train_loss": -7.123130798339844, "global_step": 202525, "epoch": 4822} {"train_loss": -7.211452960968018, "global_step": 202526, "epoch": 4822} {"train_loss": -7.107616424560547, "global_step": 202527, "epoch": 4822} {"train_loss": -7.328012943267822, "global_step": 202528, "epoch": 4822} {"train_loss": -7.151166915893555, "global_step": 202529, "epoch": 4822} {"train_loss": -7.172234535217285, "global_step": 202530, "epoch": 4822} {"train_loss": -7.285017490386963, "global_step": 202531, "epoch": 4822} {"train_loss": -7.362679481506348, "global_step": 202532, "epoch": 4822} {"train_loss": -7.272646427154541, "global_step": 202533, "epoch": 4822} {"train_loss": -7.352658271789551, "global_step": 202534, "epoch": 4822} {"train_loss": -7.327805519104004, "global_step": 202535, "epoch": 4822} {"train_loss": -7.302599906921387, "global_step": 202536, "epoch": 4822} {"train_loss": -7.337824821472168, "global_step": 202537, "epoch": 4822} {"train_loss": -7.271024227142334, "global_step": 202538, "epoch": 4822} {"train_loss": -7.284835338592529, "global_step": 202539, "epoch": 4822} {"train_loss": -7.355042457580566, "global_step": 202540, "epoch": 4822} {"train_loss": -7.314373016357422, "global_step": 202541, "epoch": 4822} {"train_loss": -7.314079284667969, "global_step": 202542, "epoch": 4822} {"train_loss": -7.318921089172363, "global_step": 202543, "epoch": 4822} {"train_loss": -7.313699722290039, "global_step": 202544, "epoch": 4822} {"train_loss": -7.279303073883057, "global_step": 202545, "epoch": 4822} {"train_loss": -7.310746669769287, "global_step": 202546, "epoch": 4822} {"train_loss": -7.2747087478637695, "global_step": 202547, "epoch": 4822} {"train_loss": -7.26104736328125, "global_step": 202548, "epoch": 4822} {"train_loss": -7.401969909667969, "global_step": 202549, "epoch": 4822} {"train_loss": -7.331476211547852, "global_step": 202550, "epoch": 4822} {"train_loss": -7.235333442687988, "global_step": 202551, "epoch": 4822} {"train_loss": -7.329143524169922, "global_step": 202552, "epoch": 4822} {"train_loss": -7.259622573852539, "global_step": 202553, "epoch": 4822} {"train_loss": -7.332037448883057, "global_step": 202554, "epoch": 4822} {"train_loss": -7.289910316467285, "global_step": 202555, "epoch": 4822} {"train_loss": -7.204037666320801, "global_step": 202556, "epoch": 4822} {"train_loss": -7.260662078857422, "global_step": 202557, "epoch": 4822} {"train_loss": -7.317452430725098, "global_step": 202558, "epoch": 4822} {"train_loss": -7.081240653991699, "global_step": 202559, "epoch": 4822} {"train_loss": -7.4060211181640625, "global_step": 202560, "epoch": 4822} {"train_loss": -7.254886627197266, "global_step": 202561, "epoch": 4822} {"train_loss": -7.310328483581543, "global_step": 202562, "epoch": 4822} {"train_loss": -7.253170967102051, "global_step": 202563, "epoch": 4822} {"train_loss": -7.165476322174072, "global_step": 202564, "epoch": 4822} {"train_loss": -7.27751594498044, "global_step": 202565, "epoch": 4822, "val_loss": 81654.96875} {"train_loss": -7.263918399810791, "global_step": 202566, "epoch": 4823} {"train_loss": -7.188035011291504, "global_step": 202567, "epoch": 4823} {"train_loss": -7.3459062576293945, "global_step": 202568, "epoch": 4823} {"train_loss": -7.18289852142334, "global_step": 202569, "epoch": 4823} {"train_loss": -7.3394670486450195, "global_step": 202570, "epoch": 4823} {"train_loss": -7.324704170227051, "global_step": 202571, "epoch": 4823} {"train_loss": -7.219002723693848, "global_step": 202572, "epoch": 4823} {"train_loss": -7.342607021331787, "global_step": 202573, "epoch": 4823} {"train_loss": -7.328225135803223, "global_step": 202574, "epoch": 4823} {"train_loss": -7.174391746520996, "global_step": 202575, "epoch": 4823} {"train_loss": -7.279191970825195, "global_step": 202576, "epoch": 4823} {"train_loss": -7.272639751434326, "global_step": 202577, "epoch": 4823} {"train_loss": -7.325601100921631, "global_step": 202578, "epoch": 4823} {"train_loss": -7.304629325866699, "global_step": 202579, "epoch": 4823} {"train_loss": -7.230600833892822, "global_step": 202580, "epoch": 4823} {"train_loss": -7.216089725494385, "global_step": 202581, "epoch": 4823} {"train_loss": -7.157732009887695, "global_step": 202582, "epoch": 4823} {"train_loss": -7.327662944793701, "global_step": 202583, "epoch": 4823} {"train_loss": -7.257773399353027, "global_step": 202584, "epoch": 4823} {"train_loss": -7.37955379486084, "global_step": 202585, "epoch": 4823} {"train_loss": -7.367266654968262, "global_step": 202586, "epoch": 4823} {"train_loss": -7.355840682983398, "global_step": 202587, "epoch": 4823} {"train_loss": -7.3447113037109375, "global_step": 202588, "epoch": 4823} {"train_loss": -7.274485111236572, "global_step": 202589, "epoch": 4823} {"train_loss": -7.242708206176758, "global_step": 202590, "epoch": 4823} {"train_loss": -7.403409004211426, "global_step": 202591, "epoch": 4823} {"train_loss": -7.25766134262085, "global_step": 202592, "epoch": 4823} {"train_loss": -7.291791915893555, "global_step": 202593, "epoch": 4823} {"train_loss": -7.410094261169434, "global_step": 202594, "epoch": 4823} {"train_loss": -7.304274082183838, "global_step": 202595, "epoch": 4823} {"train_loss": -7.322301387786865, "global_step": 202596, "epoch": 4823} {"train_loss": -7.2299418449401855, "global_step": 202597, "epoch": 4823} {"train_loss": -7.290867328643799, "global_step": 202598, "epoch": 4823} {"train_loss": -7.319791316986084, "global_step": 202599, "epoch": 4823} {"train_loss": -7.372295379638672, "global_step": 202600, "epoch": 4823} {"train_loss": -7.394138813018799, "global_step": 202601, "epoch": 4823} {"train_loss": -7.406020164489746, "global_step": 202602, "epoch": 4823} {"train_loss": -7.339603900909424, "global_step": 202603, "epoch": 4823} {"train_loss": -7.396617889404297, "global_step": 202604, "epoch": 4823} {"train_loss": -7.378705024719238, "global_step": 202605, "epoch": 4823} {"train_loss": -7.394306182861328, "global_step": 202606, "epoch": 4823} {"train_loss": -7.308811630521502, "global_step": 202607, "epoch": 4823, "val_loss": 81651.9609375} {"train_loss": -7.391134262084961, "global_step": 202608, "epoch": 4824} {"train_loss": -7.38795280456543, "global_step": 202609, "epoch": 4824} {"train_loss": -7.338745594024658, "global_step": 202610, "epoch": 4824} {"train_loss": -7.4203081130981445, "global_step": 202611, "epoch": 4824} {"train_loss": -7.311653137207031, "global_step": 202612, "epoch": 4824} {"train_loss": -7.495306015014648, "global_step": 202613, "epoch": 4824} {"train_loss": -7.276140213012695, "global_step": 202614, "epoch": 4824} {"train_loss": -7.26432466506958, "global_step": 202615, "epoch": 4824} {"train_loss": -7.164469242095947, "global_step": 202616, "epoch": 4824} {"train_loss": -7.273196220397949, "global_step": 202617, "epoch": 4824} {"train_loss": -7.194060325622559, "global_step": 202618, "epoch": 4824} {"train_loss": -7.288763523101807, "global_step": 202619, "epoch": 4824} {"train_loss": -7.213850021362305, "global_step": 202620, "epoch": 4824} {"train_loss": -7.393746852874756, "global_step": 202621, "epoch": 4824} {"train_loss": -7.381780624389648, "global_step": 202622, "epoch": 4824} {"train_loss": -7.307233810424805, "global_step": 202623, "epoch": 4824} {"train_loss": -7.281292915344238, "global_step": 202624, "epoch": 4824} {"train_loss": -7.167891025543213, "global_step": 202625, "epoch": 4824} {"train_loss": -7.253634452819824, "global_step": 202626, "epoch": 4824} {"train_loss": -7.3261027336120605, "global_step": 202627, "epoch": 4824} {"train_loss": -7.1613264083862305, "global_step": 202628, "epoch": 4824} {"train_loss": -7.158062934875488, "global_step": 202629, "epoch": 4824} {"train_loss": -7.234465599060059, "global_step": 202630, "epoch": 4824} {"train_loss": -7.236685752868652, "global_step": 202631, "epoch": 4824} {"train_loss": -7.234231948852539, "global_step": 202632, "epoch": 4824} {"train_loss": -7.222978591918945, "global_step": 202633, "epoch": 4824} {"train_loss": -7.191037654876709, "global_step": 202634, "epoch": 4824} {"train_loss": -7.130033016204834, "global_step": 202635, "epoch": 4824} {"train_loss": -7.186789512634277, "global_step": 202636, "epoch": 4824} {"train_loss": -7.272428512573242, "global_step": 202637, "epoch": 4824} {"train_loss": -7.295135498046875, "global_step": 202638, "epoch": 4824} {"train_loss": -7.423159599304199, "global_step": 202639, "epoch": 4824} {"train_loss": -7.247497081756592, "global_step": 202640, "epoch": 4824} {"train_loss": -7.247881889343262, "global_step": 202641, "epoch": 4824} {"train_loss": -7.310735702514648, "global_step": 202642, "epoch": 4824} {"train_loss": -7.360797882080078, "global_step": 202643, "epoch": 4824} {"train_loss": -7.2525482177734375, "global_step": 202644, "epoch": 4824} {"train_loss": -7.401264190673828, "global_step": 202645, "epoch": 4824} {"train_loss": -7.427123069763184, "global_step": 202646, "epoch": 4824} {"train_loss": -7.3020830154418945, "global_step": 202647, "epoch": 4824} {"train_loss": -7.35520601272583, "global_step": 202648, "epoch": 4824} {"train_loss": -7.2897941612062, "global_step": 202649, "epoch": 4824, "val_loss": 81614.3671875} {"train_loss": -7.3581132888793945, "global_step": 202650, "epoch": 4825} {"train_loss": -7.284075736999512, "global_step": 202651, "epoch": 4825} {"train_loss": -7.327651500701904, "global_step": 202652, "epoch": 4825} {"train_loss": -7.331241607666016, "global_step": 202653, "epoch": 4825} {"train_loss": -7.420976638793945, "global_step": 202654, "epoch": 4825} {"train_loss": -7.381340026855469, "global_step": 202655, "epoch": 4825} {"train_loss": -7.280777931213379, "global_step": 202656, "epoch": 4825} {"train_loss": -7.377771854400635, "global_step": 202657, "epoch": 4825} {"train_loss": -7.425863265991211, "global_step": 202658, "epoch": 4825} {"train_loss": -7.358281135559082, "global_step": 202659, "epoch": 4825} {"train_loss": -7.347589492797852, "global_step": 202660, "epoch": 4825} {"train_loss": -7.2703094482421875, "global_step": 202661, "epoch": 4825} {"train_loss": -7.23264217376709, "global_step": 202662, "epoch": 4825} {"train_loss": -7.215845584869385, "global_step": 202663, "epoch": 4825} {"train_loss": -7.34418249130249, "global_step": 202664, "epoch": 4825} {"train_loss": -7.4166765213012695, "global_step": 202665, "epoch": 4825} {"train_loss": -7.457505226135254, "global_step": 202666, "epoch": 4825} {"train_loss": -7.360868453979492, "global_step": 202667, "epoch": 4825} {"train_loss": -7.274625301361084, "global_step": 202668, "epoch": 4825} {"train_loss": -7.390122413635254, "global_step": 202669, "epoch": 4825} {"train_loss": -7.319080352783203, "global_step": 202670, "epoch": 4825} {"train_loss": -7.385374546051025, "global_step": 202671, "epoch": 4825} {"train_loss": -7.314906120300293, "global_step": 202672, "epoch": 4825} {"train_loss": -7.4868364334106445, "global_step": 202673, "epoch": 4825} {"train_loss": -7.292768955230713, "global_step": 202674, "epoch": 4825} {"train_loss": -7.341383457183838, "global_step": 202675, "epoch": 4825} {"train_loss": -7.338924407958984, "global_step": 202676, "epoch": 4825} {"train_loss": -7.353989601135254, "global_step": 202677, "epoch": 4825} {"train_loss": -7.387951374053955, "global_step": 202678, "epoch": 4825} {"train_loss": -7.316745281219482, "global_step": 202679, "epoch": 4825} {"train_loss": -7.421334266662598, "global_step": 202680, "epoch": 4825} {"train_loss": -7.2706708908081055, "global_step": 202681, "epoch": 4825} {"train_loss": -7.20949649810791, "global_step": 202682, "epoch": 4825} {"train_loss": -7.086548805236816, "global_step": 202683, "epoch": 4825} {"train_loss": -7.300988674163818, "global_step": 202684, "epoch": 4825} {"train_loss": -7.243100643157959, "global_step": 202685, "epoch": 4825} {"train_loss": -7.048396110534668, "global_step": 202686, "epoch": 4825} {"train_loss": -7.227687835693359, "global_step": 202687, "epoch": 4825} {"train_loss": -7.195179462432861, "global_step": 202688, "epoch": 4825} {"train_loss": -7.324538230895996, "global_step": 202689, "epoch": 4825} {"train_loss": -7.251887798309326, "global_step": 202690, "epoch": 4825} {"train_loss": -7.3139512198311945, "global_step": 202691, "epoch": 4825, "val_loss": 81803.0625} {"train_loss": -7.206737995147705, "global_step": 202692, "epoch": 4826} {"train_loss": -7.19407844543457, "global_step": 202693, "epoch": 4826} {"train_loss": -7.284182548522949, "global_step": 202694, "epoch": 4826} {"train_loss": -7.248233795166016, "global_step": 202695, "epoch": 4826} {"train_loss": -7.393261909484863, "global_step": 202696, "epoch": 4826} {"train_loss": -7.21173620223999, "global_step": 202697, "epoch": 4826} {"train_loss": -7.268924713134766, "global_step": 202698, "epoch": 4826} {"train_loss": -7.340534210205078, "global_step": 202699, "epoch": 4826} {"train_loss": -7.217063903808594, "global_step": 202700, "epoch": 4826} {"train_loss": -7.214381217956543, "global_step": 202701, "epoch": 4826} {"train_loss": -7.05307149887085, "global_step": 202702, "epoch": 4826} {"train_loss": -7.225600719451904, "global_step": 202703, "epoch": 4826} {"train_loss": -7.162817001342773, "global_step": 202704, "epoch": 4826} {"train_loss": -7.264673233032227, "global_step": 202705, "epoch": 4826} {"train_loss": -7.416046619415283, "global_step": 202706, "epoch": 4826} {"train_loss": -7.182783603668213, "global_step": 202707, "epoch": 4826} {"train_loss": -7.215385437011719, "global_step": 202708, "epoch": 4826} {"train_loss": -7.1567487716674805, "global_step": 202709, "epoch": 4826} {"train_loss": -7.199150085449219, "global_step": 202710, "epoch": 4826} {"train_loss": -7.3029985427856445, "global_step": 202711, "epoch": 4826} {"train_loss": -7.285429954528809, "global_step": 202712, "epoch": 4826} {"train_loss": -7.394804000854492, "global_step": 202713, "epoch": 4826} {"train_loss": -7.286356449127197, "global_step": 202714, "epoch": 4826} {"train_loss": -7.297544002532959, "global_step": 202715, "epoch": 4826} {"train_loss": -7.339601516723633, "global_step": 202716, "epoch": 4826} {"train_loss": -7.1790385246276855, "global_step": 202717, "epoch": 4826} {"train_loss": -7.333397388458252, "global_step": 202718, "epoch": 4826} {"train_loss": -7.306114196777344, "global_step": 202719, "epoch": 4826} {"train_loss": -7.30219030380249, "global_step": 202720, "epoch": 4826} {"train_loss": -7.414578437805176, "global_step": 202721, "epoch": 4826} {"train_loss": -7.259429931640625, "global_step": 202722, "epoch": 4826} {"train_loss": -7.431079864501953, "global_step": 202723, "epoch": 4826} {"train_loss": -7.419558048248291, "global_step": 202724, "epoch": 4826} {"train_loss": -7.355319499969482, "global_step": 202725, "epoch": 4826} {"train_loss": -7.3857831954956055, "global_step": 202726, "epoch": 4826} {"train_loss": -7.449340343475342, "global_step": 202727, "epoch": 4826} {"train_loss": -7.424424171447754, "global_step": 202728, "epoch": 4826} {"train_loss": -7.426802635192871, "global_step": 202729, "epoch": 4826} {"train_loss": -7.298960208892822, "global_step": 202730, "epoch": 4826} {"train_loss": -7.437220573425293, "global_step": 202731, "epoch": 4826} {"train_loss": -7.296706199645996, "global_step": 202732, "epoch": 4826} {"train_loss": -7.297309046699887, "global_step": 202733, "epoch": 4826, "val_loss": 81460.1484375} {"train_loss": -7.329100131988525, "global_step": 202734, "epoch": 4827} {"train_loss": -7.362613201141357, "global_step": 202735, "epoch": 4827} {"train_loss": -7.37819766998291, "global_step": 202736, "epoch": 4827} {"train_loss": -7.344659805297852, "global_step": 202737, "epoch": 4827} {"train_loss": -7.243062973022461, "global_step": 202738, "epoch": 4827} {"train_loss": -7.225861072540283, "global_step": 202739, "epoch": 4827} {"train_loss": -7.380002975463867, "global_step": 202740, "epoch": 4827} {"train_loss": -7.310091972351074, "global_step": 202741, "epoch": 4827} {"train_loss": -7.3005595207214355, "global_step": 202742, "epoch": 4827} {"train_loss": -7.360321998596191, "global_step": 202743, "epoch": 4827} {"train_loss": -7.289927005767822, "global_step": 202744, "epoch": 4827} {"train_loss": -7.318093776702881, "global_step": 202745, "epoch": 4827} {"train_loss": -7.370950222015381, "global_step": 202746, "epoch": 4827} {"train_loss": -7.3374924659729, "global_step": 202747, "epoch": 4827} {"train_loss": -7.249442100524902, "global_step": 202748, "epoch": 4827} {"train_loss": -7.323588848114014, "global_step": 202749, "epoch": 4827} {"train_loss": -7.335735321044922, "global_step": 202750, "epoch": 4827} {"train_loss": -7.284450531005859, "global_step": 202751, "epoch": 4827} {"train_loss": -7.409737586975098, "global_step": 202752, "epoch": 4827} {"train_loss": -7.285405158996582, "global_step": 202753, "epoch": 4827} {"train_loss": -7.151335716247559, "global_step": 202754, "epoch": 4827} {"train_loss": -7.344355583190918, "global_step": 202755, "epoch": 4827} {"train_loss": -7.307755470275879, "global_step": 202756, "epoch": 4827} {"train_loss": -7.3119401931762695, "global_step": 202757, "epoch": 4827} {"train_loss": -7.316617488861084, "global_step": 202758, "epoch": 4827} {"train_loss": -7.322819709777832, "global_step": 202759, "epoch": 4827} {"train_loss": -7.337145805358887, "global_step": 202760, "epoch": 4827} {"train_loss": -7.371723175048828, "global_step": 202761, "epoch": 4827} {"train_loss": -7.302927017211914, "global_step": 202762, "epoch": 4827} {"train_loss": -7.304076671600342, "global_step": 202763, "epoch": 4827} {"train_loss": -7.234460353851318, "global_step": 202764, "epoch": 4827} {"train_loss": -7.321908473968506, "global_step": 202765, "epoch": 4827} {"train_loss": -7.165740013122559, "global_step": 202766, "epoch": 4827} {"train_loss": -7.284268379211426, "global_step": 202767, "epoch": 4827} {"train_loss": -7.410554885864258, "global_step": 202768, "epoch": 4827} {"train_loss": -7.233338832855225, "global_step": 202769, "epoch": 4827} {"train_loss": -7.1674580574035645, "global_step": 202770, "epoch": 4827} {"train_loss": -7.252022743225098, "global_step": 202771, "epoch": 4827} {"train_loss": -7.315778732299805, "global_step": 202772, "epoch": 4827} {"train_loss": -7.336875915527344, "global_step": 202773, "epoch": 4827} {"train_loss": -7.24515438079834, "global_step": 202774, "epoch": 4827} {"train_loss": -7.303543749309721, "global_step": 202775, "epoch": 4827, "val_loss": 81613.6953125} {"train_loss": -7.375576496124268, "global_step": 202776, "epoch": 4828} {"train_loss": -7.249046325683594, "global_step": 202777, "epoch": 4828} {"train_loss": -7.275325775146484, "global_step": 202778, "epoch": 4828} {"train_loss": -7.331508636474609, "global_step": 202779, "epoch": 4828} {"train_loss": -7.272336959838867, "global_step": 202780, "epoch": 4828} {"train_loss": -7.345871448516846, "global_step": 202781, "epoch": 4828} {"train_loss": -7.3003435134887695, "global_step": 202782, "epoch": 4828} {"train_loss": -7.319119930267334, "global_step": 202783, "epoch": 4828} {"train_loss": -7.3587799072265625, "global_step": 202784, "epoch": 4828} {"train_loss": -7.376378536224365, "global_step": 202785, "epoch": 4828} {"train_loss": -7.435210227966309, "global_step": 202786, "epoch": 4828} {"train_loss": -7.348662853240967, "global_step": 202787, "epoch": 4828} {"train_loss": -7.269224166870117, "global_step": 202788, "epoch": 4828} {"train_loss": -7.302026271820068, "global_step": 202789, "epoch": 4828} {"train_loss": -7.226403713226318, "global_step": 202790, "epoch": 4828} {"train_loss": -7.3725199699401855, "global_step": 202791, "epoch": 4828} {"train_loss": -7.320969581604004, "global_step": 202792, "epoch": 4828} {"train_loss": -7.189656734466553, "global_step": 202793, "epoch": 4828} {"train_loss": -7.357018947601318, "global_step": 202794, "epoch": 4828} {"train_loss": -7.322405815124512, "global_step": 202795, "epoch": 4828} {"train_loss": -7.3572001457214355, "global_step": 202796, "epoch": 4828} {"train_loss": -7.325381278991699, "global_step": 202797, "epoch": 4828} {"train_loss": -7.321970462799072, "global_step": 202798, "epoch": 4828} {"train_loss": -7.255165100097656, "global_step": 202799, "epoch": 4828} {"train_loss": -7.215167045593262, "global_step": 202800, "epoch": 4828} {"train_loss": -7.4186296463012695, "global_step": 202801, "epoch": 4828} {"train_loss": -7.3322343826293945, "global_step": 202802, "epoch": 4828} {"train_loss": -7.232008934020996, "global_step": 202803, "epoch": 4828} {"train_loss": -7.3365631103515625, "global_step": 202804, "epoch": 4828} {"train_loss": -7.34471321105957, "global_step": 202805, "epoch": 4828} {"train_loss": -7.261529922485352, "global_step": 202806, "epoch": 4828} {"train_loss": -7.3003692626953125, "global_step": 202807, "epoch": 4828} {"train_loss": -7.356607437133789, "global_step": 202808, "epoch": 4828} {"train_loss": -7.165306091308594, "global_step": 202809, "epoch": 4828} {"train_loss": -7.297380447387695, "global_step": 202810, "epoch": 4828} {"train_loss": -7.137603759765625, "global_step": 202811, "epoch": 4828} {"train_loss": -7.267433166503906, "global_step": 202812, "epoch": 4828} {"train_loss": -7.4149861335754395, "global_step": 202813, "epoch": 4828} {"train_loss": -7.132965087890625, "global_step": 202814, "epoch": 4828} {"train_loss": -7.294024467468262, "global_step": 202815, "epoch": 4828} {"train_loss": -7.056332588195801, "global_step": 202816, "epoch": 4828} {"train_loss": -7.297355402083624, "global_step": 202817, "epoch": 4828, "val_loss": 81721.515625} {"train_loss": -7.3513641357421875, "global_step": 202818, "epoch": 4829} {"train_loss": -7.267010688781738, "global_step": 202819, "epoch": 4829} {"train_loss": -7.3969831466674805, "global_step": 202820, "epoch": 4829} {"train_loss": -7.3558430671691895, "global_step": 202821, "epoch": 4829} {"train_loss": -7.313138008117676, "global_step": 202822, "epoch": 4829} {"train_loss": -7.301352500915527, "global_step": 202823, "epoch": 4829} {"train_loss": -7.2548322677612305, "global_step": 202824, "epoch": 4829} {"train_loss": -7.258256912231445, "global_step": 202825, "epoch": 4829} {"train_loss": -7.265929698944092, "global_step": 202826, "epoch": 4829} {"train_loss": -7.214461326599121, "global_step": 202827, "epoch": 4829} {"train_loss": -7.304805278778076, "global_step": 202828, "epoch": 4829} {"train_loss": -7.295327663421631, "global_step": 202829, "epoch": 4829} {"train_loss": -7.397254467010498, "global_step": 202830, "epoch": 4829} {"train_loss": -7.300592422485352, "global_step": 202831, "epoch": 4829} {"train_loss": -7.270374298095703, "global_step": 202832, "epoch": 4829} {"train_loss": -7.346775054931641, "global_step": 202833, "epoch": 4829} {"train_loss": -7.338259696960449, "global_step": 202834, "epoch": 4829} {"train_loss": -7.3546037673950195, "global_step": 202835, "epoch": 4829} {"train_loss": -7.272794246673584, "global_step": 202836, "epoch": 4829} {"train_loss": -7.352624893188477, "global_step": 202837, "epoch": 4829} {"train_loss": -7.312772750854492, "global_step": 202838, "epoch": 4829} {"train_loss": -7.374242305755615, "global_step": 202839, "epoch": 4829} {"train_loss": -7.360941410064697, "global_step": 202840, "epoch": 4829} {"train_loss": -7.529317855834961, "global_step": 202841, "epoch": 4829} {"train_loss": -7.291938781738281, "global_step": 202842, "epoch": 4829} {"train_loss": -7.289473533630371, "global_step": 202843, "epoch": 4829} {"train_loss": -7.296696186065674, "global_step": 202844, "epoch": 4829} {"train_loss": -7.4433913230896, "global_step": 202845, "epoch": 4829} {"train_loss": -7.299300670623779, "global_step": 202846, "epoch": 4829} {"train_loss": -7.3309006690979, "global_step": 202847, "epoch": 4829} {"train_loss": -7.299039840698242, "global_step": 202848, "epoch": 4829} {"train_loss": -7.360482215881348, "global_step": 202849, "epoch": 4829} {"train_loss": -7.311395645141602, "global_step": 202850, "epoch": 4829} {"train_loss": -7.354124546051025, "global_step": 202851, "epoch": 4829} {"train_loss": -7.308267593383789, "global_step": 202852, "epoch": 4829} {"train_loss": -7.192019462585449, "global_step": 202853, "epoch": 4829} {"train_loss": -7.33314323425293, "global_step": 202854, "epoch": 4829} {"train_loss": -7.404933929443359, "global_step": 202855, "epoch": 4829} {"train_loss": -7.302665710449219, "global_step": 202856, "epoch": 4829} {"train_loss": -7.206508636474609, "global_step": 202857, "epoch": 4829} {"train_loss": -7.250011444091797, "global_step": 202858, "epoch": 4829} {"train_loss": -7.3184214773632235, "global_step": 202859, "epoch": 4829, "val_loss": 81746.0859375} {"train_loss": -7.279746055603027, "global_step": 202860, "epoch": 4830} {"train_loss": -7.22054386138916, "global_step": 202861, "epoch": 4830} {"train_loss": -7.406374454498291, "global_step": 202862, "epoch": 4830} {"train_loss": -7.355554580688477, "global_step": 202863, "epoch": 4830} {"train_loss": -7.266265392303467, "global_step": 202864, "epoch": 4830} {"train_loss": -7.325272560119629, "global_step": 202865, "epoch": 4830} {"train_loss": -7.258851528167725, "global_step": 202866, "epoch": 4830} {"train_loss": -7.141337871551514, "global_step": 202867, "epoch": 4830} {"train_loss": -7.293806076049805, "global_step": 202868, "epoch": 4830} {"train_loss": -7.308465003967285, "global_step": 202869, "epoch": 4830} {"train_loss": -7.397455215454102, "global_step": 202870, "epoch": 4830} {"train_loss": -7.3688530921936035, "global_step": 202871, "epoch": 4830} {"train_loss": -7.3150835037231445, "global_step": 202872, "epoch": 4830} {"train_loss": -7.452024459838867, "global_step": 202873, "epoch": 4830} {"train_loss": -7.332434177398682, "global_step": 202874, "epoch": 4830} {"train_loss": -7.295334815979004, "global_step": 202875, "epoch": 4830} {"train_loss": -7.309908390045166, "global_step": 202876, "epoch": 4830} {"train_loss": -7.407975196838379, "global_step": 202877, "epoch": 4830} {"train_loss": -7.24995231628418, "global_step": 202878, "epoch": 4830} {"train_loss": -7.240617275238037, "global_step": 202879, "epoch": 4830} {"train_loss": -7.161477088928223, "global_step": 202880, "epoch": 4830} {"train_loss": -7.376831531524658, "global_step": 202881, "epoch": 4830} {"train_loss": -7.2123942375183105, "global_step": 202882, "epoch": 4830} {"train_loss": -7.146742820739746, "global_step": 202883, "epoch": 4830} {"train_loss": -7.350991249084473, "global_step": 202884, "epoch": 4830} {"train_loss": -7.148050308227539, "global_step": 202885, "epoch": 4830} {"train_loss": -7.256355285644531, "global_step": 202886, "epoch": 4830} {"train_loss": -7.242306709289551, "global_step": 202887, "epoch": 4830} {"train_loss": -7.196868896484375, "global_step": 202888, "epoch": 4830} {"train_loss": -7.217555046081543, "global_step": 202889, "epoch": 4830} {"train_loss": -7.301681041717529, "global_step": 202890, "epoch": 4830} {"train_loss": -7.2669901847839355, "global_step": 202891, "epoch": 4830} {"train_loss": -7.202384948730469, "global_step": 202892, "epoch": 4830} {"train_loss": -7.140924453735352, "global_step": 202893, "epoch": 4830} {"train_loss": -7.267529487609863, "global_step": 202894, "epoch": 4830} {"train_loss": -7.286490440368652, "global_step": 202895, "epoch": 4830} {"train_loss": -7.283881187438965, "global_step": 202896, "epoch": 4830} {"train_loss": -7.310202121734619, "global_step": 202897, "epoch": 4830} {"train_loss": -7.363731861114502, "global_step": 202898, "epoch": 4830} {"train_loss": -7.277246475219727, "global_step": 202899, "epoch": 4830} {"train_loss": -7.212629795074463, "global_step": 202900, "epoch": 4830} {"train_loss": -7.278858956836519, "global_step": 202901, "epoch": 4830, "val_loss": 81625.421875} {"train_loss": -7.254878997802734, "global_step": 202902, "epoch": 4831} {"train_loss": -7.362122535705566, "global_step": 202903, "epoch": 4831} {"train_loss": -7.33787727355957, "global_step": 202904, "epoch": 4831} {"train_loss": -7.246335506439209, "global_step": 202905, "epoch": 4831} {"train_loss": -7.400032997131348, "global_step": 202906, "epoch": 4831} {"train_loss": -7.438529968261719, "global_step": 202907, "epoch": 4831} {"train_loss": -7.331352233886719, "global_step": 202908, "epoch": 4831} {"train_loss": -7.325782775878906, "global_step": 202909, "epoch": 4831} {"train_loss": -7.269681930541992, "global_step": 202910, "epoch": 4831} {"train_loss": -7.272176265716553, "global_step": 202911, "epoch": 4831} {"train_loss": -7.173943519592285, "global_step": 202912, "epoch": 4831} {"train_loss": -7.257007122039795, "global_step": 202913, "epoch": 4831} {"train_loss": -7.3928728103637695, "global_step": 202914, "epoch": 4831} {"train_loss": -7.340278148651123, "global_step": 202915, "epoch": 4831} {"train_loss": -7.312856674194336, "global_step": 202916, "epoch": 4831} {"train_loss": -7.490575313568115, "global_step": 202917, "epoch": 4831} {"train_loss": -7.342489242553711, "global_step": 202918, "epoch": 4831} {"train_loss": -7.241338729858398, "global_step": 202919, "epoch": 4831} {"train_loss": -7.296905517578125, "global_step": 202920, "epoch": 4831} {"train_loss": -7.454780101776123, "global_step": 202921, "epoch": 4831} {"train_loss": -7.17160701751709, "global_step": 202922, "epoch": 4831} {"train_loss": -7.2404303550720215, "global_step": 202923, "epoch": 4831} {"train_loss": -7.278924942016602, "global_step": 202924, "epoch": 4831} {"train_loss": -7.2134599685668945, "global_step": 202925, "epoch": 4831} {"train_loss": -7.283552646636963, "global_step": 202926, "epoch": 4831} {"train_loss": -7.098452091217041, "global_step": 202927, "epoch": 4831} {"train_loss": -7.232881546020508, "global_step": 202928, "epoch": 4831} {"train_loss": -7.274706840515137, "global_step": 202929, "epoch": 4831} {"train_loss": -7.27737283706665, "global_step": 202930, "epoch": 4831} {"train_loss": -7.15388298034668, "global_step": 202931, "epoch": 4831} {"train_loss": -7.37531852722168, "global_step": 202932, "epoch": 4831} {"train_loss": -7.244555950164795, "global_step": 202933, "epoch": 4831} {"train_loss": -7.327032089233398, "global_step": 202934, "epoch": 4831} {"train_loss": -7.388149261474609, "global_step": 202935, "epoch": 4831} {"train_loss": -7.319858074188232, "global_step": 202936, "epoch": 4831} {"train_loss": -7.232152938842773, "global_step": 202937, "epoch": 4831} {"train_loss": -7.141284465789795, "global_step": 202938, "epoch": 4831} {"train_loss": -7.222314834594727, "global_step": 202939, "epoch": 4831} {"train_loss": -7.12042236328125, "global_step": 202940, "epoch": 4831} {"train_loss": -7.263578414916992, "global_step": 202941, "epoch": 4831} {"train_loss": -7.153163909912109, "global_step": 202942, "epoch": 4831} {"train_loss": -7.282221044812884, "global_step": 202943, "epoch": 4831, "val_loss": 81729.7734375} {"train_loss": -7.271237373352051, "global_step": 202944, "epoch": 4832} {"train_loss": -7.1616530418396, "global_step": 202945, "epoch": 4832} {"train_loss": -7.215873718261719, "global_step": 202946, "epoch": 4832} {"train_loss": -7.21366024017334, "global_step": 202947, "epoch": 4832} {"train_loss": -7.370902061462402, "global_step": 202948, "epoch": 4832} {"train_loss": -7.240189552307129, "global_step": 202949, "epoch": 4832} {"train_loss": -7.242753028869629, "global_step": 202950, "epoch": 4832} {"train_loss": -7.302150249481201, "global_step": 202951, "epoch": 4832} {"train_loss": -7.2676777839660645, "global_step": 202952, "epoch": 4832} {"train_loss": -7.332359313964844, "global_step": 202953, "epoch": 4832} {"train_loss": -7.209972381591797, "global_step": 202954, "epoch": 4832} {"train_loss": -7.245277404785156, "global_step": 202955, "epoch": 4832} {"train_loss": -7.241588592529297, "global_step": 202956, "epoch": 4832} {"train_loss": -7.263038635253906, "global_step": 202957, "epoch": 4832} {"train_loss": -7.330202102661133, "global_step": 202958, "epoch": 4832} {"train_loss": -7.213488578796387, "global_step": 202959, "epoch": 4832} {"train_loss": -7.358950614929199, "global_step": 202960, "epoch": 4832} {"train_loss": -7.278098106384277, "global_step": 202961, "epoch": 4832} {"train_loss": -7.211210250854492, "global_step": 202962, "epoch": 4832} {"train_loss": -7.330348014831543, "global_step": 202963, "epoch": 4832} {"train_loss": -7.216971397399902, "global_step": 202964, "epoch": 4832} {"train_loss": -7.29276180267334, "global_step": 202965, "epoch": 4832} {"train_loss": -7.347511291503906, "global_step": 202966, "epoch": 4832} {"train_loss": -7.348977088928223, "global_step": 202967, "epoch": 4832} {"train_loss": -7.207538604736328, "global_step": 202968, "epoch": 4832} {"train_loss": -7.295291900634766, "global_step": 202969, "epoch": 4832} {"train_loss": -7.286205291748047, "global_step": 202970, "epoch": 4832} {"train_loss": -7.224819183349609, "global_step": 202971, "epoch": 4832} {"train_loss": -7.318033218383789, "global_step": 202972, "epoch": 4832} {"train_loss": -7.393897533416748, "global_step": 202973, "epoch": 4832} {"train_loss": -7.356788635253906, "global_step": 202974, "epoch": 4832} {"train_loss": -7.3128252029418945, "global_step": 202975, "epoch": 4832} {"train_loss": -7.245721817016602, "global_step": 202976, "epoch": 4832} {"train_loss": -7.346187591552734, "global_step": 202977, "epoch": 4832} {"train_loss": -7.3425140380859375, "global_step": 202978, "epoch": 4832} {"train_loss": -7.233851432800293, "global_step": 202979, "epoch": 4832} {"train_loss": -7.268860340118408, "global_step": 202980, "epoch": 4832} {"train_loss": -7.285370826721191, "global_step": 202981, "epoch": 4832} {"train_loss": -7.2873125076293945, "global_step": 202982, "epoch": 4832} {"train_loss": -7.331253528594971, "global_step": 202983, "epoch": 4832} {"train_loss": -7.433748245239258, "global_step": 202984, "epoch": 4832} {"train_loss": -7.2876411733173185, "global_step": 202985, "epoch": 4832, "val_loss": 81502.6484375} {"train_loss": -7.329442977905273, "global_step": 202986, "epoch": 4833} {"train_loss": -7.310210227966309, "global_step": 202987, "epoch": 4833} {"train_loss": -7.3953537940979, "global_step": 202988, "epoch": 4833} {"train_loss": -7.190404415130615, "global_step": 202989, "epoch": 4833} {"train_loss": -7.358087539672852, "global_step": 202990, "epoch": 4833} {"train_loss": -7.382078647613525, "global_step": 202991, "epoch": 4833} {"train_loss": -7.4052324295043945, "global_step": 202992, "epoch": 4833} {"train_loss": -7.368317127227783, "global_step": 202993, "epoch": 4833} {"train_loss": -7.362423419952393, "global_step": 202994, "epoch": 4833} {"train_loss": -7.479465484619141, "global_step": 202995, "epoch": 4833} {"train_loss": -7.287299633026123, "global_step": 202996, "epoch": 4833} {"train_loss": -7.369539260864258, "global_step": 202997, "epoch": 4833} {"train_loss": -7.303333282470703, "global_step": 202998, "epoch": 4833} {"train_loss": -7.373271942138672, "global_step": 202999, "epoch": 4833} {"train_loss": -7.340859889984131, "global_step": 203000, "epoch": 4833} {"train_loss": -7.486394882202148, "global_step": 203001, "epoch": 4833} {"train_loss": -7.399596691131592, "global_step": 203002, "epoch": 4833} {"train_loss": -7.26357889175415, "global_step": 203003, "epoch": 4833} {"train_loss": -7.307607650756836, "global_step": 203004, "epoch": 4833} {"train_loss": -7.43759822845459, "global_step": 203005, "epoch": 4833} {"train_loss": -7.409717559814453, "global_step": 203006, "epoch": 4833} {"train_loss": -7.326641082763672, "global_step": 203007, "epoch": 4833} {"train_loss": -7.323734283447266, "global_step": 203008, "epoch": 4833} {"train_loss": -7.343513488769531, "global_step": 203009, "epoch": 4833} {"train_loss": -7.322610855102539, "global_step": 203010, "epoch": 4833} {"train_loss": -7.3078389167785645, "global_step": 203011, "epoch": 4833} {"train_loss": -7.40292501449585, "global_step": 203012, "epoch": 4833} {"train_loss": -7.325164794921875, "global_step": 203013, "epoch": 4833} {"train_loss": -7.3266143798828125, "global_step": 203014, "epoch": 4833} {"train_loss": -7.293853759765625, "global_step": 203015, "epoch": 4833} {"train_loss": -7.305818557739258, "global_step": 203016, "epoch": 4833} {"train_loss": -7.386553764343262, "global_step": 203017, "epoch": 4833} {"train_loss": -7.3538336753845215, "global_step": 203018, "epoch": 4833} {"train_loss": -7.31810188293457, "global_step": 203019, "epoch": 4833} {"train_loss": -7.27720308303833, "global_step": 203020, "epoch": 4833} {"train_loss": -7.387251853942871, "global_step": 203021, "epoch": 4833} {"train_loss": -7.3293633460998535, "global_step": 203022, "epoch": 4833} {"train_loss": -7.210043907165527, "global_step": 203023, "epoch": 4833} {"train_loss": -7.337313652038574, "global_step": 203024, "epoch": 4833} {"train_loss": -7.1643266677856445, "global_step": 203025, "epoch": 4833} {"train_loss": -7.348047256469727, "global_step": 203026, "epoch": 4833} {"train_loss": -7.332730508985973, "global_step": 203027, "epoch": 4833, "val_loss": 81870.0546875} {"train_loss": -7.1971330642700195, "global_step": 203028, "epoch": 4834} {"train_loss": -7.2314534187316895, "global_step": 203029, "epoch": 4834} {"train_loss": -7.0423583984375, "global_step": 203030, "epoch": 4834} {"train_loss": -7.247314453125, "global_step": 203031, "epoch": 4834} {"train_loss": -7.041214942932129, "global_step": 203032, "epoch": 4834} {"train_loss": -7.087389945983887, "global_step": 203033, "epoch": 4834} {"train_loss": -7.072822570800781, "global_step": 203034, "epoch": 4834} {"train_loss": -7.060872554779053, "global_step": 203035, "epoch": 4834} {"train_loss": -7.034664154052734, "global_step": 203036, "epoch": 4834} {"train_loss": -7.169958114624023, "global_step": 203037, "epoch": 4834} {"train_loss": -7.257343292236328, "global_step": 203038, "epoch": 4834} {"train_loss": -7.073768615722656, "global_step": 203039, "epoch": 4834} {"train_loss": -7.206550598144531, "global_step": 203040, "epoch": 4834} {"train_loss": -7.168521881103516, "global_step": 203041, "epoch": 4834} {"train_loss": -7.159297466278076, "global_step": 203042, "epoch": 4834} {"train_loss": -7.2808637619018555, "global_step": 203043, "epoch": 4834} {"train_loss": -7.302112579345703, "global_step": 203044, "epoch": 4834} {"train_loss": -7.2603302001953125, "global_step": 203045, "epoch": 4834} {"train_loss": -7.301735877990723, "global_step": 203046, "epoch": 4834} {"train_loss": -7.201519966125488, "global_step": 203047, "epoch": 4834} {"train_loss": -7.26140022277832, "global_step": 203048, "epoch": 4834} {"train_loss": -7.2549028396606445, "global_step": 203049, "epoch": 4834} {"train_loss": -7.16038179397583, "global_step": 203050, "epoch": 4834} {"train_loss": -7.245359897613525, "global_step": 203051, "epoch": 4834} {"train_loss": -7.319801330566406, "global_step": 203052, "epoch": 4834} {"train_loss": -7.270623207092285, "global_step": 203053, "epoch": 4834} {"train_loss": -7.111336708068848, "global_step": 203054, "epoch": 4834} {"train_loss": -7.214941501617432, "global_step": 203055, "epoch": 4834} {"train_loss": -7.104190349578857, "global_step": 203056, "epoch": 4834} {"train_loss": -7.060318470001221, "global_step": 203057, "epoch": 4834} {"train_loss": -7.2543463706970215, "global_step": 203058, "epoch": 4834} {"train_loss": -7.126309394836426, "global_step": 203059, "epoch": 4834} {"train_loss": -7.194328308105469, "global_step": 203060, "epoch": 4834} {"train_loss": -7.228638648986816, "global_step": 203061, "epoch": 4834} {"train_loss": -7.2455010414123535, "global_step": 203062, "epoch": 4834} {"train_loss": -7.356560230255127, "global_step": 203063, "epoch": 4834} {"train_loss": -7.198486328125, "global_step": 203064, "epoch": 4834} {"train_loss": -7.196062088012695, "global_step": 203065, "epoch": 4834} {"train_loss": -7.1779985427856445, "global_step": 203066, "epoch": 4834} {"train_loss": -7.2928056716918945, "global_step": 203067, "epoch": 4834} {"train_loss": -7.253946304321289, "global_step": 203068, "epoch": 4834} {"train_loss": -7.19592547416687, "global_step": 203069, "epoch": 4834, "val_loss": 81661.4921875} {"train_loss": -7.358489990234375, "global_step": 203070, "epoch": 4835} {"train_loss": -7.300846099853516, "global_step": 203071, "epoch": 4835} {"train_loss": -7.2655839920043945, "global_step": 203072, "epoch": 4835} {"train_loss": -7.267996788024902, "global_step": 203073, "epoch": 4835} {"train_loss": -7.314719200134277, "global_step": 203074, "epoch": 4835} {"train_loss": -7.3322038650512695, "global_step": 203075, "epoch": 4835} {"train_loss": -7.47266960144043, "global_step": 203076, "epoch": 4835} {"train_loss": -7.304725646972656, "global_step": 203077, "epoch": 4835} {"train_loss": -7.280412673950195, "global_step": 203078, "epoch": 4835} {"train_loss": -7.441167831420898, "global_step": 203079, "epoch": 4835} {"train_loss": -7.302993297576904, "global_step": 203080, "epoch": 4835} {"train_loss": -7.338875770568848, "global_step": 203081, "epoch": 4835} {"train_loss": -7.43192195892334, "global_step": 203082, "epoch": 4835} {"train_loss": -7.359443664550781, "global_step": 203083, "epoch": 4835} {"train_loss": -7.337707996368408, "global_step": 203084, "epoch": 4835} {"train_loss": -7.408305644989014, "global_step": 203085, "epoch": 4835} {"train_loss": -7.401486873626709, "global_step": 203086, "epoch": 4835} {"train_loss": -7.3094611167907715, "global_step": 203087, "epoch": 4835} {"train_loss": -7.397612571716309, "global_step": 203088, "epoch": 4835} {"train_loss": -7.3738017082214355, "global_step": 203089, "epoch": 4835} {"train_loss": -7.38576602935791, "global_step": 203090, "epoch": 4835} {"train_loss": -7.3997673988342285, "global_step": 203091, "epoch": 4835} {"train_loss": -7.412034034729004, "global_step": 203092, "epoch": 4835} {"train_loss": -7.448741436004639, "global_step": 203093, "epoch": 4835} {"train_loss": -7.347053527832031, "global_step": 203094, "epoch": 4835} {"train_loss": -7.318328380584717, "global_step": 203095, "epoch": 4835} {"train_loss": -7.409964084625244, "global_step": 203096, "epoch": 4835} {"train_loss": -7.3986406326293945, "global_step": 203097, "epoch": 4835} {"train_loss": -7.354648590087891, "global_step": 203098, "epoch": 4835} {"train_loss": -7.323029041290283, "global_step": 203099, "epoch": 4835} {"train_loss": -7.4167561531066895, "global_step": 203100, "epoch": 4835} {"train_loss": -7.373452186584473, "global_step": 203101, "epoch": 4835} {"train_loss": -7.418698787689209, "global_step": 203102, "epoch": 4835} {"train_loss": -7.287575721740723, "global_step": 203103, "epoch": 4835} {"train_loss": -7.449456214904785, "global_step": 203104, "epoch": 4835} {"train_loss": -7.319284439086914, "global_step": 203105, "epoch": 4835} {"train_loss": -7.324010848999023, "global_step": 203106, "epoch": 4835} {"train_loss": -7.36836051940918, "global_step": 203107, "epoch": 4835} {"train_loss": -7.405470848083496, "global_step": 203108, "epoch": 4835} {"train_loss": -7.3051252365112305, "global_step": 203109, "epoch": 4835} {"train_loss": -7.3595051765441895, "global_step": 203110, "epoch": 4835} {"train_loss": -7.360711824326288, "global_step": 203111, "epoch": 4835, "val_loss": 81671.125} {"train_loss": -7.2157182693481445, "global_step": 203112, "epoch": 4836} {"train_loss": -7.331319808959961, "global_step": 203113, "epoch": 4836} {"train_loss": -7.300868988037109, "global_step": 203114, "epoch": 4836} {"train_loss": -7.251399993896484, "global_step": 203115, "epoch": 4836} {"train_loss": -7.1944684982299805, "global_step": 203116, "epoch": 4836} {"train_loss": -7.316723823547363, "global_step": 203117, "epoch": 4836} {"train_loss": -7.292745113372803, "global_step": 203118, "epoch": 4836} {"train_loss": -7.361832618713379, "global_step": 203119, "epoch": 4836} {"train_loss": -7.253495693206787, "global_step": 203120, "epoch": 4836} {"train_loss": -7.240665435791016, "global_step": 203121, "epoch": 4836} {"train_loss": -7.331541061401367, "global_step": 203122, "epoch": 4836} {"train_loss": -7.22933292388916, "global_step": 203123, "epoch": 4836} {"train_loss": -7.306873321533203, "global_step": 203124, "epoch": 4836} {"train_loss": -7.27236270904541, "global_step": 203125, "epoch": 4836} {"train_loss": -7.260437488555908, "global_step": 203126, "epoch": 4836} {"train_loss": -7.3664960861206055, "global_step": 203127, "epoch": 4836} {"train_loss": -7.327652931213379, "global_step": 203128, "epoch": 4836} {"train_loss": -7.373863697052002, "global_step": 203129, "epoch": 4836} {"train_loss": -7.344266891479492, "global_step": 203130, "epoch": 4836} {"train_loss": -7.39218282699585, "global_step": 203131, "epoch": 4836} {"train_loss": -7.265398979187012, "global_step": 203132, "epoch": 4836} {"train_loss": -7.2910637855529785, "global_step": 203133, "epoch": 4836} {"train_loss": -7.2858147621154785, "global_step": 203134, "epoch": 4836} {"train_loss": -7.214604377746582, "global_step": 203135, "epoch": 4836} {"train_loss": -7.371068954467773, "global_step": 203136, "epoch": 4836} {"train_loss": -7.337123870849609, "global_step": 203137, "epoch": 4836} {"train_loss": -7.341872215270996, "global_step": 203138, "epoch": 4836} {"train_loss": -7.423644065856934, "global_step": 203139, "epoch": 4836} {"train_loss": -7.23744010925293, "global_step": 203140, "epoch": 4836} {"train_loss": -7.303844451904297, "global_step": 203141, "epoch": 4836} {"train_loss": -7.394414901733398, "global_step": 203142, "epoch": 4836} {"train_loss": -7.190853595733643, "global_step": 203143, "epoch": 4836} {"train_loss": -7.1649370193481445, "global_step": 203144, "epoch": 4836} {"train_loss": -7.421124458312988, "global_step": 203145, "epoch": 4836} {"train_loss": -7.403112411499023, "global_step": 203146, "epoch": 4836} {"train_loss": -7.1122002601623535, "global_step": 203147, "epoch": 4836} {"train_loss": -7.2088422775268555, "global_step": 203148, "epoch": 4836} {"train_loss": -7.18182373046875, "global_step": 203149, "epoch": 4836} {"train_loss": -7.177168846130371, "global_step": 203150, "epoch": 4836} {"train_loss": -7.195116996765137, "global_step": 203151, "epoch": 4836} {"train_loss": -7.37574577331543, "global_step": 203152, "epoch": 4836} {"train_loss": -7.288173175993419, "global_step": 203153, "epoch": 4836, "val_loss": 81788.09375} {"train_loss": -7.258917808532715, "global_step": 203154, "epoch": 4837} {"train_loss": -7.250606060028076, "global_step": 203155, "epoch": 4837} {"train_loss": -7.264492988586426, "global_step": 203156, "epoch": 4837} {"train_loss": -7.240860939025879, "global_step": 203157, "epoch": 4837} {"train_loss": -7.302746772766113, "global_step": 203158, "epoch": 4837} {"train_loss": -7.278446674346924, "global_step": 203159, "epoch": 4837} {"train_loss": -7.328943252563477, "global_step": 203160, "epoch": 4837} {"train_loss": -7.287377834320068, "global_step": 203161, "epoch": 4837} {"train_loss": -7.289698600769043, "global_step": 203162, "epoch": 4837} {"train_loss": -7.306285858154297, "global_step": 203163, "epoch": 4837} {"train_loss": -7.377216815948486, "global_step": 203164, "epoch": 4837} {"train_loss": -7.3459014892578125, "global_step": 203165, "epoch": 4837} {"train_loss": -7.274982452392578, "global_step": 203166, "epoch": 4837} {"train_loss": -7.3730034828186035, "global_step": 203167, "epoch": 4837} {"train_loss": -7.192002296447754, "global_step": 203168, "epoch": 4837} {"train_loss": -7.376779556274414, "global_step": 203169, "epoch": 4837} {"train_loss": -7.32071590423584, "global_step": 203170, "epoch": 4837} {"train_loss": -7.306160926818848, "global_step": 203171, "epoch": 4837} {"train_loss": -7.332672595977783, "global_step": 203172, "epoch": 4837} {"train_loss": -7.3854451179504395, "global_step": 203173, "epoch": 4837} {"train_loss": -7.374929428100586, "global_step": 203174, "epoch": 4837} {"train_loss": -7.193055152893066, "global_step": 203175, "epoch": 4837} {"train_loss": -7.304088115692139, "global_step": 203176, "epoch": 4837} {"train_loss": -7.2868804931640625, "global_step": 203177, "epoch": 4837} {"train_loss": -7.27200984954834, "global_step": 203178, "epoch": 4837} {"train_loss": -7.361710071563721, "global_step": 203179, "epoch": 4837} {"train_loss": -7.378576278686523, "global_step": 203180, "epoch": 4837} {"train_loss": -7.257156848907471, "global_step": 203181, "epoch": 4837} {"train_loss": -7.186139106750488, "global_step": 203182, "epoch": 4837} {"train_loss": -7.27554988861084, "global_step": 203183, "epoch": 4837} {"train_loss": -7.321645736694336, "global_step": 203184, "epoch": 4837} {"train_loss": -7.26253080368042, "global_step": 203185, "epoch": 4837} {"train_loss": -7.257383346557617, "global_step": 203186, "epoch": 4837} {"train_loss": -7.364436626434326, "global_step": 203187, "epoch": 4837} {"train_loss": -7.3023295402526855, "global_step": 203188, "epoch": 4837} {"train_loss": -7.361889839172363, "global_step": 203189, "epoch": 4837} {"train_loss": -7.269558429718018, "global_step": 203190, "epoch": 4837} {"train_loss": -7.3524627685546875, "global_step": 203191, "epoch": 4837} {"train_loss": -7.352993965148926, "global_step": 203192, "epoch": 4837} {"train_loss": -7.269309997558594, "global_step": 203193, "epoch": 4837} {"train_loss": -7.344564914703369, "global_step": 203194, "epoch": 4837} {"train_loss": -7.301544337045579, "global_step": 203195, "epoch": 4837, "val_loss": 81653.859375} {"train_loss": -7.3897905349731445, "global_step": 203196, "epoch": 4838} {"train_loss": -7.429317474365234, "global_step": 203197, "epoch": 4838} {"train_loss": -7.254679203033447, "global_step": 203198, "epoch": 4838} {"train_loss": -7.265154838562012, "global_step": 203199, "epoch": 4838} {"train_loss": -7.36641788482666, "global_step": 203200, "epoch": 4838} {"train_loss": -7.32474422454834, "global_step": 203201, "epoch": 4838} {"train_loss": -7.413100242614746, "global_step": 203202, "epoch": 4838} {"train_loss": -7.390646457672119, "global_step": 203203, "epoch": 4838} {"train_loss": -7.378690719604492, "global_step": 203204, "epoch": 4838} {"train_loss": -7.33113956451416, "global_step": 203205, "epoch": 4838} {"train_loss": -7.475285053253174, "global_step": 203206, "epoch": 4838} {"train_loss": -7.419440746307373, "global_step": 203207, "epoch": 4838} {"train_loss": -7.428023338317871, "global_step": 203208, "epoch": 4838} {"train_loss": -7.286703586578369, "global_step": 203209, "epoch": 4838} {"train_loss": -7.382628917694092, "global_step": 203210, "epoch": 4838} {"train_loss": -7.44560432434082, "global_step": 203211, "epoch": 4838} {"train_loss": -7.265859603881836, "global_step": 203212, "epoch": 4838} {"train_loss": -7.373772144317627, "global_step": 203213, "epoch": 4838} {"train_loss": -7.4005327224731445, "global_step": 203214, "epoch": 4838} {"train_loss": -7.402308464050293, "global_step": 203215, "epoch": 4838} {"train_loss": -7.391659259796143, "global_step": 203216, "epoch": 4838} {"train_loss": -7.324033737182617, "global_step": 203217, "epoch": 4838} {"train_loss": -7.292910099029541, "global_step": 203218, "epoch": 4838} {"train_loss": -7.437573432922363, "global_step": 203219, "epoch": 4838} {"train_loss": -7.428661823272705, "global_step": 203220, "epoch": 4838} {"train_loss": -7.183818817138672, "global_step": 203221, "epoch": 4838} {"train_loss": -7.258667945861816, "global_step": 203222, "epoch": 4838} {"train_loss": -7.305143356323242, "global_step": 203223, "epoch": 4838} {"train_loss": -7.089499473571777, "global_step": 203224, "epoch": 4838} {"train_loss": -7.287042140960693, "global_step": 203225, "epoch": 4838} {"train_loss": -7.2559099197387695, "global_step": 203226, "epoch": 4838} {"train_loss": -7.038461685180664, "global_step": 203227, "epoch": 4838} {"train_loss": -7.156838417053223, "global_step": 203228, "epoch": 4838} {"train_loss": -7.083457946777344, "global_step": 203229, "epoch": 4838} {"train_loss": -7.158649444580078, "global_step": 203230, "epoch": 4838} {"train_loss": -7.302525520324707, "global_step": 203231, "epoch": 4838} {"train_loss": -7.265463829040527, "global_step": 203232, "epoch": 4838} {"train_loss": -7.320951461791992, "global_step": 203233, "epoch": 4838} {"train_loss": -7.242347240447998, "global_step": 203234, "epoch": 4838} {"train_loss": -7.288477420806885, "global_step": 203235, "epoch": 4838} {"train_loss": -7.208755970001221, "global_step": 203236, "epoch": 4838} {"train_loss": -7.3106131326584585, "global_step": 203237, "epoch": 4838, "val_loss": 81738.6796875} {"train_loss": -7.230241775512695, "global_step": 203238, "epoch": 4839} {"train_loss": -7.278288841247559, "global_step": 203239, "epoch": 4839} {"train_loss": -7.275484561920166, "global_step": 203240, "epoch": 4839} {"train_loss": -7.343774318695068, "global_step": 203241, "epoch": 4839} {"train_loss": -7.109010696411133, "global_step": 203242, "epoch": 4839} {"train_loss": -7.180044651031494, "global_step": 203243, "epoch": 4839} {"train_loss": -7.286503791809082, "global_step": 203244, "epoch": 4839} {"train_loss": -7.223563194274902, "global_step": 203245, "epoch": 4839} {"train_loss": -7.253880977630615, "global_step": 203246, "epoch": 4839} {"train_loss": -7.181053161621094, "global_step": 203247, "epoch": 4839} {"train_loss": -7.219053268432617, "global_step": 203248, "epoch": 4839} {"train_loss": -7.154253959655762, "global_step": 203249, "epoch": 4839} {"train_loss": -7.298779487609863, "global_step": 203250, "epoch": 4839} {"train_loss": -7.225820064544678, "global_step": 203251, "epoch": 4839} {"train_loss": -7.269680976867676, "global_step": 203252, "epoch": 4839} {"train_loss": -7.3765363693237305, "global_step": 203253, "epoch": 4839} {"train_loss": -7.247128486633301, "global_step": 203254, "epoch": 4839} {"train_loss": -7.280074119567871, "global_step": 203255, "epoch": 4839} {"train_loss": -7.34310245513916, "global_step": 203256, "epoch": 4839} {"train_loss": -7.166067123413086, "global_step": 203257, "epoch": 4839} {"train_loss": -7.178971290588379, "global_step": 203258, "epoch": 4839} {"train_loss": -7.236657619476318, "global_step": 203259, "epoch": 4839} {"train_loss": -7.32413387298584, "global_step": 203260, "epoch": 4839} {"train_loss": -7.3057637214660645, "global_step": 203261, "epoch": 4839} {"train_loss": -7.3321332931518555, "global_step": 203262, "epoch": 4839} {"train_loss": -7.248898983001709, "global_step": 203263, "epoch": 4839} {"train_loss": -7.177286148071289, "global_step": 203264, "epoch": 4839} {"train_loss": -7.226693153381348, "global_step": 203265, "epoch": 4839} {"train_loss": -7.191555976867676, "global_step": 203266, "epoch": 4839} {"train_loss": -7.295891761779785, "global_step": 203267, "epoch": 4839} {"train_loss": -7.2931413650512695, "global_step": 203268, "epoch": 4839} {"train_loss": -7.253227233886719, "global_step": 203269, "epoch": 4839} {"train_loss": -7.272249221801758, "global_step": 203270, "epoch": 4839} {"train_loss": -7.2541728019714355, "global_step": 203271, "epoch": 4839} {"train_loss": -7.345183372497559, "global_step": 203272, "epoch": 4839} {"train_loss": -7.339604377746582, "global_step": 203273, "epoch": 4839} {"train_loss": -7.304665565490723, "global_step": 203274, "epoch": 4839} {"train_loss": -7.368257999420166, "global_step": 203275, "epoch": 4839} {"train_loss": -7.257357597351074, "global_step": 203276, "epoch": 4839} {"train_loss": -7.3179168701171875, "global_step": 203277, "epoch": 4839} {"train_loss": -7.287259578704834, "global_step": 203278, "epoch": 4839} {"train_loss": -7.26309187071664, "global_step": 203279, "epoch": 4839, "val_loss": 81517.7890625} {"train_loss": -7.267373085021973, "global_step": 203280, "epoch": 4840} {"train_loss": -7.122425079345703, "global_step": 203281, "epoch": 4840} {"train_loss": -7.419322967529297, "global_step": 203282, "epoch": 4840} {"train_loss": -7.255422115325928, "global_step": 203283, "epoch": 4840} {"train_loss": -7.306905269622803, "global_step": 203284, "epoch": 4840} {"train_loss": -7.315023422241211, "global_step": 203285, "epoch": 4840} {"train_loss": -7.273601055145264, "global_step": 203286, "epoch": 4840} {"train_loss": -7.301833152770996, "global_step": 203287, "epoch": 4840} {"train_loss": -7.297379016876221, "global_step": 203288, "epoch": 4840} {"train_loss": -7.318560600280762, "global_step": 203289, "epoch": 4840} {"train_loss": -7.4001359939575195, "global_step": 203290, "epoch": 4840} {"train_loss": -7.360938549041748, "global_step": 203291, "epoch": 4840} {"train_loss": -7.277878284454346, "global_step": 203292, "epoch": 4840} {"train_loss": -7.326297760009766, "global_step": 203293, "epoch": 4840} {"train_loss": -7.229014873504639, "global_step": 203294, "epoch": 4840} {"train_loss": -7.153509140014648, "global_step": 203295, "epoch": 4840} {"train_loss": -7.377195358276367, "global_step": 203296, "epoch": 4840} {"train_loss": -7.34306001663208, "global_step": 203297, "epoch": 4840} {"train_loss": -7.2665557861328125, "global_step": 203298, "epoch": 4840} {"train_loss": -7.401190757751465, "global_step": 203299, "epoch": 4840} {"train_loss": -7.2987518310546875, "global_step": 203300, "epoch": 4840} {"train_loss": -7.331184387207031, "global_step": 203301, "epoch": 4840} {"train_loss": -7.2660698890686035, "global_step": 203302, "epoch": 4840} {"train_loss": -7.229237079620361, "global_step": 203303, "epoch": 4840} {"train_loss": -7.285257816314697, "global_step": 203304, "epoch": 4840} {"train_loss": -7.2770280838012695, "global_step": 203305, "epoch": 4840} {"train_loss": -7.384387969970703, "global_step": 203306, "epoch": 4840} {"train_loss": -7.376416206359863, "global_step": 203307, "epoch": 4840} {"train_loss": -7.205564975738525, "global_step": 203308, "epoch": 4840} {"train_loss": -7.267024040222168, "global_step": 203309, "epoch": 4840} {"train_loss": -7.389037132263184, "global_step": 203310, "epoch": 4840} {"train_loss": -7.231558322906494, "global_step": 203311, "epoch": 4840} {"train_loss": -7.281229019165039, "global_step": 203312, "epoch": 4840} {"train_loss": -7.221924781799316, "global_step": 203313, "epoch": 4840} {"train_loss": -7.285412788391113, "global_step": 203314, "epoch": 4840} {"train_loss": -7.31113338470459, "global_step": 203315, "epoch": 4840} {"train_loss": -7.347614288330078, "global_step": 203316, "epoch": 4840} {"train_loss": -7.169025421142578, "global_step": 203317, "epoch": 4840} {"train_loss": -7.248726844787598, "global_step": 203318, "epoch": 4840} {"train_loss": -7.228329658508301, "global_step": 203319, "epoch": 4840} {"train_loss": -7.352297782897949, "global_step": 203320, "epoch": 4840} {"train_loss": -7.293328069505238, "global_step": 203321, "epoch": 4840, "val_loss": 81696.3984375} {"train_loss": -7.4237060546875, "global_step": 203322, "epoch": 4841} {"train_loss": -7.3000054359436035, "global_step": 203323, "epoch": 4841} {"train_loss": -7.377610206604004, "global_step": 203324, "epoch": 4841} {"train_loss": -7.334468841552734, "global_step": 203325, "epoch": 4841} {"train_loss": -7.385799407958984, "global_step": 203326, "epoch": 4841} {"train_loss": -7.328268051147461, "global_step": 203327, "epoch": 4841} {"train_loss": -7.36456298828125, "global_step": 203328, "epoch": 4841} {"train_loss": -7.363640308380127, "global_step": 203329, "epoch": 4841} {"train_loss": -7.429800987243652, "global_step": 203330, "epoch": 4841} {"train_loss": -7.302205562591553, "global_step": 203331, "epoch": 4841} {"train_loss": -7.302082538604736, "global_step": 203332, "epoch": 4841} {"train_loss": -7.41193962097168, "global_step": 203333, "epoch": 4841} {"train_loss": -7.34680700302124, "global_step": 203334, "epoch": 4841} {"train_loss": -7.255836486816406, "global_step": 203335, "epoch": 4841} {"train_loss": -7.354454040527344, "global_step": 203336, "epoch": 4841} {"train_loss": -7.305595397949219, "global_step": 203337, "epoch": 4841} {"train_loss": -7.238768577575684, "global_step": 203338, "epoch": 4841} {"train_loss": -7.264130115509033, "global_step": 203339, "epoch": 4841} {"train_loss": -7.357371807098389, "global_step": 203340, "epoch": 4841} {"train_loss": -7.244777202606201, "global_step": 203341, "epoch": 4841} {"train_loss": -7.272065162658691, "global_step": 203342, "epoch": 4841} {"train_loss": -7.28771448135376, "global_step": 203343, "epoch": 4841} {"train_loss": -7.298128128051758, "global_step": 203344, "epoch": 4841} {"train_loss": -7.310710906982422, "global_step": 203345, "epoch": 4841} {"train_loss": -7.291951656341553, "global_step": 203346, "epoch": 4841} {"train_loss": -7.276933670043945, "global_step": 203347, "epoch": 4841} {"train_loss": -7.381608009338379, "global_step": 203348, "epoch": 4841} {"train_loss": -7.2349066734313965, "global_step": 203349, "epoch": 4841} {"train_loss": -7.119841575622559, "global_step": 203350, "epoch": 4841} {"train_loss": -7.346443176269531, "global_step": 203351, "epoch": 4841} {"train_loss": -7.370568752288818, "global_step": 203352, "epoch": 4841} {"train_loss": -7.317851543426514, "global_step": 203353, "epoch": 4841} {"train_loss": -7.295985698699951, "global_step": 203354, "epoch": 4841} {"train_loss": -7.258998870849609, "global_step": 203355, "epoch": 4841} {"train_loss": -7.23165225982666, "global_step": 203356, "epoch": 4841} {"train_loss": -7.264121055603027, "global_step": 203357, "epoch": 4841} {"train_loss": -7.217703819274902, "global_step": 203358, "epoch": 4841} {"train_loss": -7.302977085113525, "global_step": 203359, "epoch": 4841} {"train_loss": -7.321065902709961, "global_step": 203360, "epoch": 4841} {"train_loss": -7.317359447479248, "global_step": 203361, "epoch": 4841} {"train_loss": -7.2069244384765625, "global_step": 203362, "epoch": 4841} {"train_loss": -7.306763399214971, "global_step": 203363, "epoch": 4841, "val_loss": 81601.671875} {"train_loss": -7.266361236572266, "global_step": 203364, "epoch": 4842} {"train_loss": -7.199906349182129, "global_step": 203365, "epoch": 4842} {"train_loss": -7.253045082092285, "global_step": 203366, "epoch": 4842} {"train_loss": -7.331549167633057, "global_step": 203367, "epoch": 4842} {"train_loss": -7.268756866455078, "global_step": 203368, "epoch": 4842} {"train_loss": -7.335046768188477, "global_step": 203369, "epoch": 4842} {"train_loss": -7.338283538818359, "global_step": 203370, "epoch": 4842} {"train_loss": -7.296506881713867, "global_step": 203371, "epoch": 4842} {"train_loss": -7.417717456817627, "global_step": 203372, "epoch": 4842} {"train_loss": -7.196008682250977, "global_step": 203373, "epoch": 4842} {"train_loss": -7.251511573791504, "global_step": 203374, "epoch": 4842} {"train_loss": -7.123597621917725, "global_step": 203375, "epoch": 4842} {"train_loss": -7.462599754333496, "global_step": 203376, "epoch": 4842} {"train_loss": -7.19843864440918, "global_step": 203377, "epoch": 4842} {"train_loss": -7.306214809417725, "global_step": 203378, "epoch": 4842} {"train_loss": -7.274631500244141, "global_step": 203379, "epoch": 4842} {"train_loss": -7.235991477966309, "global_step": 203380, "epoch": 4842} {"train_loss": -7.218845367431641, "global_step": 203381, "epoch": 4842} {"train_loss": -7.118009090423584, "global_step": 203382, "epoch": 4842} {"train_loss": -7.2462358474731445, "global_step": 203383, "epoch": 4842} {"train_loss": -7.299777030944824, "global_step": 203384, "epoch": 4842} {"train_loss": -7.236973762512207, "global_step": 203385, "epoch": 4842} {"train_loss": -7.341019630432129, "global_step": 203386, "epoch": 4842} {"train_loss": -7.29547119140625, "global_step": 203387, "epoch": 4842} {"train_loss": -7.252535820007324, "global_step": 203388, "epoch": 4842} {"train_loss": -7.256402969360352, "global_step": 203389, "epoch": 4842} {"train_loss": -7.316167831420898, "global_step": 203390, "epoch": 4842} {"train_loss": -7.317644119262695, "global_step": 203391, "epoch": 4842} {"train_loss": -7.224646091461182, "global_step": 203392, "epoch": 4842} {"train_loss": -7.371049880981445, "global_step": 203393, "epoch": 4842} {"train_loss": -7.216464042663574, "global_step": 203394, "epoch": 4842} {"train_loss": -7.395606517791748, "global_step": 203395, "epoch": 4842} {"train_loss": -7.320584297180176, "global_step": 203396, "epoch": 4842} {"train_loss": -7.196749687194824, "global_step": 203397, "epoch": 4842} {"train_loss": -7.284079074859619, "global_step": 203398, "epoch": 4842} {"train_loss": -7.223443031311035, "global_step": 203399, "epoch": 4842} {"train_loss": -7.195122718811035, "global_step": 203400, "epoch": 4842} {"train_loss": -7.122440814971924, "global_step": 203401, "epoch": 4842} {"train_loss": -7.061690807342529, "global_step": 203402, "epoch": 4842} {"train_loss": -7.194863796234131, "global_step": 203403, "epoch": 4842} {"train_loss": -7.226787567138672, "global_step": 203404, "epoch": 4842} {"train_loss": -7.258251315071469, "global_step": 203405, "epoch": 4842, "val_loss": 81960.7265625} {"train_loss": -7.315026760101318, "global_step": 203406, "epoch": 4843} {"train_loss": -7.30600643157959, "global_step": 203407, "epoch": 4843} {"train_loss": -7.307541847229004, "global_step": 203408, "epoch": 4843} {"train_loss": -7.241193771362305, "global_step": 203409, "epoch": 4843} {"train_loss": -7.321691036224365, "global_step": 203410, "epoch": 4843} {"train_loss": -7.3341875076293945, "global_step": 203411, "epoch": 4843} {"train_loss": -7.332363128662109, "global_step": 203412, "epoch": 4843} {"train_loss": -7.186279773712158, "global_step": 203413, "epoch": 4843} {"train_loss": -7.320094108581543, "global_step": 203414, "epoch": 4843} {"train_loss": -7.289071083068848, "global_step": 203415, "epoch": 4843} {"train_loss": -7.3514533042907715, "global_step": 203416, "epoch": 4843} {"train_loss": -7.344180583953857, "global_step": 203417, "epoch": 4843} {"train_loss": -7.3379411697387695, "global_step": 203418, "epoch": 4843} {"train_loss": -7.279616832733154, "global_step": 203419, "epoch": 4843} {"train_loss": -7.374555587768555, "global_step": 203420, "epoch": 4843} {"train_loss": -7.2315802574157715, "global_step": 203421, "epoch": 4843} {"train_loss": -7.1896891593933105, "global_step": 203422, "epoch": 4843} {"train_loss": -7.2818603515625, "global_step": 203423, "epoch": 4843} {"train_loss": -7.202124118804932, "global_step": 203424, "epoch": 4843} {"train_loss": -7.315556526184082, "global_step": 203425, "epoch": 4843} {"train_loss": -7.352029323577881, "global_step": 203426, "epoch": 4843} {"train_loss": -7.346038818359375, "global_step": 203427, "epoch": 4843} {"train_loss": -7.346369743347168, "global_step": 203428, "epoch": 4843} {"train_loss": -7.234720706939697, "global_step": 203429, "epoch": 4843} {"train_loss": -7.301200866699219, "global_step": 203430, "epoch": 4843} {"train_loss": -7.312628746032715, "global_step": 203431, "epoch": 4843} {"train_loss": -7.21286153793335, "global_step": 203432, "epoch": 4843} {"train_loss": -7.237196922302246, "global_step": 203433, "epoch": 4843} {"train_loss": -7.234146595001221, "global_step": 203434, "epoch": 4843} {"train_loss": -7.18104362487793, "global_step": 203435, "epoch": 4843} {"train_loss": -7.409576416015625, "global_step": 203436, "epoch": 4843} {"train_loss": -7.1142449378967285, "global_step": 203437, "epoch": 4843} {"train_loss": -7.320126533508301, "global_step": 203438, "epoch": 4843} {"train_loss": -7.242622375488281, "global_step": 203439, "epoch": 4843} {"train_loss": -7.228307247161865, "global_step": 203440, "epoch": 4843} {"train_loss": -7.231588363647461, "global_step": 203441, "epoch": 4843} {"train_loss": -7.29877233505249, "global_step": 203442, "epoch": 4843} {"train_loss": -7.214503765106201, "global_step": 203443, "epoch": 4843} {"train_loss": -7.357242584228516, "global_step": 203444, "epoch": 4843} {"train_loss": -7.241145133972168, "global_step": 203445, "epoch": 4843} {"train_loss": -7.2353339195251465, "global_step": 203446, "epoch": 4843} {"train_loss": -7.27822056270781, "global_step": 203447, "epoch": 4843, "val_loss": 81495.9453125} {"train_loss": -7.289865970611572, "global_step": 203448, "epoch": 4844} {"train_loss": -7.39626407623291, "global_step": 203449, "epoch": 4844} {"train_loss": -7.269434928894043, "global_step": 203450, "epoch": 4844} {"train_loss": -7.3817033767700195, "global_step": 203451, "epoch": 4844} {"train_loss": -7.270190238952637, "global_step": 203452, "epoch": 4844} {"train_loss": -7.3326263427734375, "global_step": 203453, "epoch": 4844} {"train_loss": -7.429409027099609, "global_step": 203454, "epoch": 4844} {"train_loss": -7.333974838256836, "global_step": 203455, "epoch": 4844} {"train_loss": -7.3667497634887695, "global_step": 203456, "epoch": 4844} {"train_loss": -7.341119289398193, "global_step": 203457, "epoch": 4844} {"train_loss": -7.425963401794434, "global_step": 203458, "epoch": 4844} {"train_loss": -7.295249938964844, "global_step": 203459, "epoch": 4844} {"train_loss": -7.398043155670166, "global_step": 203460, "epoch": 4844} {"train_loss": -7.5250725746154785, "global_step": 203461, "epoch": 4844} {"train_loss": -7.2963409423828125, "global_step": 203462, "epoch": 4844} {"train_loss": -7.441272735595703, "global_step": 203463, "epoch": 4844} {"train_loss": -7.4052534103393555, "global_step": 203464, "epoch": 4844} {"train_loss": -7.384483814239502, "global_step": 203465, "epoch": 4844} {"train_loss": -7.317766189575195, "global_step": 203466, "epoch": 4844} {"train_loss": -7.330568313598633, "global_step": 203467, "epoch": 4844} {"train_loss": -7.316707134246826, "global_step": 203468, "epoch": 4844} {"train_loss": -7.345052719116211, "global_step": 203469, "epoch": 4844} {"train_loss": -7.352314472198486, "global_step": 203470, "epoch": 4844} {"train_loss": -7.3816680908203125, "global_step": 203471, "epoch": 4844} {"train_loss": -7.364636421203613, "global_step": 203472, "epoch": 4844} {"train_loss": -7.444059371948242, "global_step": 203473, "epoch": 4844} {"train_loss": -7.348039627075195, "global_step": 203474, "epoch": 4844} {"train_loss": -7.373076438903809, "global_step": 203475, "epoch": 4844} {"train_loss": -7.344776153564453, "global_step": 203476, "epoch": 4844} {"train_loss": -7.303929328918457, "global_step": 203477, "epoch": 4844} {"train_loss": -7.383324146270752, "global_step": 203478, "epoch": 4844} {"train_loss": -7.4193010330200195, "global_step": 203479, "epoch": 4844} {"train_loss": -7.334664344787598, "global_step": 203480, "epoch": 4844} {"train_loss": -7.41016960144043, "global_step": 203481, "epoch": 4844} {"train_loss": -7.200409889221191, "global_step": 203482, "epoch": 4844} {"train_loss": -7.3663811683654785, "global_step": 203483, "epoch": 4844} {"train_loss": -7.333493232727051, "global_step": 203484, "epoch": 4844} {"train_loss": -7.225259304046631, "global_step": 203485, "epoch": 4844} {"train_loss": -7.230798721313477, "global_step": 203486, "epoch": 4844} {"train_loss": -7.30978536605835, "global_step": 203487, "epoch": 4844} {"train_loss": -7.3214569091796875, "global_step": 203488, "epoch": 4844} {"train_loss": -7.349317789077759, "global_step": 203489, "epoch": 4844, "val_loss": 81515.8984375} {"train_loss": -7.315333366394043, "global_step": 203490, "epoch": 4845} {"train_loss": -7.242425441741943, "global_step": 203491, "epoch": 4845} {"train_loss": -7.323202133178711, "global_step": 203492, "epoch": 4845} {"train_loss": -7.23012638092041, "global_step": 203493, "epoch": 4845} {"train_loss": -7.374622821807861, "global_step": 203494, "epoch": 4845} {"train_loss": -7.295851707458496, "global_step": 203495, "epoch": 4845} {"train_loss": -7.240878105163574, "global_step": 203496, "epoch": 4845} {"train_loss": -7.353603363037109, "global_step": 203497, "epoch": 4845} {"train_loss": -7.362524509429932, "global_step": 203498, "epoch": 4845} {"train_loss": -7.195333480834961, "global_step": 203499, "epoch": 4845} {"train_loss": -7.337592124938965, "global_step": 203500, "epoch": 4845} {"train_loss": -7.384212493896484, "global_step": 203501, "epoch": 4845} {"train_loss": -7.2972869873046875, "global_step": 203502, "epoch": 4845} {"train_loss": -7.364272594451904, "global_step": 203503, "epoch": 4845} {"train_loss": -7.284757614135742, "global_step": 203504, "epoch": 4845} {"train_loss": -7.368387222290039, "global_step": 203505, "epoch": 4845} {"train_loss": -7.26326847076416, "global_step": 203506, "epoch": 4845} {"train_loss": -7.342233657836914, "global_step": 203507, "epoch": 4845} {"train_loss": -7.359068870544434, "global_step": 203508, "epoch": 4845} {"train_loss": -7.288699626922607, "global_step": 203509, "epoch": 4845} {"train_loss": -7.499790191650391, "global_step": 203510, "epoch": 4845} {"train_loss": -7.2507829666137695, "global_step": 203511, "epoch": 4845} {"train_loss": -7.261348724365234, "global_step": 203512, "epoch": 4845} {"train_loss": -7.326262474060059, "global_step": 203513, "epoch": 4845} {"train_loss": -7.178615570068359, "global_step": 203514, "epoch": 4845} {"train_loss": -7.38432502746582, "global_step": 203515, "epoch": 4845} {"train_loss": -7.236776351928711, "global_step": 203516, "epoch": 4845} {"train_loss": -7.174145221710205, "global_step": 203517, "epoch": 4845} {"train_loss": -7.520389080047607, "global_step": 203518, "epoch": 4845} {"train_loss": -7.194602966308594, "global_step": 203519, "epoch": 4845} {"train_loss": -7.388590335845947, "global_step": 203520, "epoch": 4845} {"train_loss": -7.37795352935791, "global_step": 203521, "epoch": 4845} {"train_loss": -7.37744140625, "global_step": 203522, "epoch": 4845} {"train_loss": -7.366847991943359, "global_step": 203523, "epoch": 4845} {"train_loss": -7.259724140167236, "global_step": 203524, "epoch": 4845} {"train_loss": -7.330114364624023, "global_step": 203525, "epoch": 4845} {"train_loss": -7.296586990356445, "global_step": 203526, "epoch": 4845} {"train_loss": -7.296658515930176, "global_step": 203527, "epoch": 4845} {"train_loss": -7.383176326751709, "global_step": 203528, "epoch": 4845} {"train_loss": -7.1412763595581055, "global_step": 203529, "epoch": 4845} {"train_loss": -7.240567207336426, "global_step": 203530, "epoch": 4845} {"train_loss": -7.3084236326671785, "global_step": 203531, "epoch": 4845, "val_loss": 81620.453125} {"train_loss": -7.227124214172363, "global_step": 203532, "epoch": 4846} {"train_loss": -7.254146575927734, "global_step": 203533, "epoch": 4846} {"train_loss": -7.365136623382568, "global_step": 203534, "epoch": 4846} {"train_loss": -7.2647833824157715, "global_step": 203535, "epoch": 4846} {"train_loss": -7.3136491775512695, "global_step": 203536, "epoch": 4846} {"train_loss": -7.414301872253418, "global_step": 203537, "epoch": 4846} {"train_loss": -7.454775810241699, "global_step": 203538, "epoch": 4846} {"train_loss": -7.327576637268066, "global_step": 203539, "epoch": 4846} {"train_loss": -7.378726959228516, "global_step": 203540, "epoch": 4846} {"train_loss": -7.394181251525879, "global_step": 203541, "epoch": 4846} {"train_loss": -7.476475238800049, "global_step": 203542, "epoch": 4846} {"train_loss": -7.321584701538086, "global_step": 203543, "epoch": 4846} {"train_loss": -7.305225849151611, "global_step": 203544, "epoch": 4846} {"train_loss": -7.347725868225098, "global_step": 203545, "epoch": 4846} {"train_loss": -7.320901870727539, "global_step": 203546, "epoch": 4846} {"train_loss": -7.193990707397461, "global_step": 203547, "epoch": 4846} {"train_loss": -7.41840934753418, "global_step": 203548, "epoch": 4846} {"train_loss": -7.359584331512451, "global_step": 203549, "epoch": 4846} {"train_loss": -7.289819240570068, "global_step": 203550, "epoch": 4846} {"train_loss": -7.384360313415527, "global_step": 203551, "epoch": 4846} {"train_loss": -7.217992305755615, "global_step": 203552, "epoch": 4846} {"train_loss": -7.470733642578125, "global_step": 203553, "epoch": 4846} {"train_loss": -7.108782768249512, "global_step": 203554, "epoch": 4846} {"train_loss": -7.329671859741211, "global_step": 203555, "epoch": 4846} {"train_loss": -7.1598615646362305, "global_step": 203556, "epoch": 4846} {"train_loss": -7.208758354187012, "global_step": 203557, "epoch": 4846} {"train_loss": -7.271028518676758, "global_step": 203558, "epoch": 4846} {"train_loss": -7.126792907714844, "global_step": 203559, "epoch": 4846} {"train_loss": -7.257514953613281, "global_step": 203560, "epoch": 4846} {"train_loss": -6.949573516845703, "global_step": 203561, "epoch": 4846} {"train_loss": -7.221733093261719, "global_step": 203562, "epoch": 4846} {"train_loss": -7.317922592163086, "global_step": 203563, "epoch": 4846} {"train_loss": -7.169260025024414, "global_step": 203564, "epoch": 4846} {"train_loss": -7.377683639526367, "global_step": 203565, "epoch": 4846} {"train_loss": -7.249050140380859, "global_step": 203566, "epoch": 4846} {"train_loss": -7.286168098449707, "global_step": 203567, "epoch": 4846} {"train_loss": -7.193121910095215, "global_step": 203568, "epoch": 4846} {"train_loss": -7.242654800415039, "global_step": 203569, "epoch": 4846} {"train_loss": -7.4275712966918945, "global_step": 203570, "epoch": 4846} {"train_loss": -7.215539932250977, "global_step": 203571, "epoch": 4846} {"train_loss": -7.31336784362793, "global_step": 203572, "epoch": 4846} {"train_loss": -7.2903763680231, "global_step": 203573, "epoch": 4846, "val_loss": 81641.078125} {"train_loss": -7.432343482971191, "global_step": 203574, "epoch": 4847} {"train_loss": -7.365530967712402, "global_step": 203575, "epoch": 4847} {"train_loss": -7.295965194702148, "global_step": 203576, "epoch": 4847} {"train_loss": -7.332808971405029, "global_step": 203577, "epoch": 4847} {"train_loss": -7.29775333404541, "global_step": 203578, "epoch": 4847} {"train_loss": -7.34432315826416, "global_step": 203579, "epoch": 4847} {"train_loss": -7.353151321411133, "global_step": 203580, "epoch": 4847} {"train_loss": -7.39143180847168, "global_step": 203581, "epoch": 4847} {"train_loss": -7.338594436645508, "global_step": 203582, "epoch": 4847} {"train_loss": -7.450085639953613, "global_step": 203583, "epoch": 4847} {"train_loss": -7.414092063903809, "global_step": 203584, "epoch": 4847} {"train_loss": -7.357572555541992, "global_step": 203585, "epoch": 4847} {"train_loss": -7.248172760009766, "global_step": 203586, "epoch": 4847} {"train_loss": -7.387191295623779, "global_step": 203587, "epoch": 4847} {"train_loss": -7.248948097229004, "global_step": 203588, "epoch": 4847} {"train_loss": -7.405128002166748, "global_step": 203589, "epoch": 4847} {"train_loss": -7.422556400299072, "global_step": 203590, "epoch": 4847} {"train_loss": -7.3810882568359375, "global_step": 203591, "epoch": 4847} {"train_loss": -7.515362739562988, "global_step": 203592, "epoch": 4847} {"train_loss": -7.322200775146484, "global_step": 203593, "epoch": 4847} {"train_loss": -7.36644172668457, "global_step": 203594, "epoch": 4847} {"train_loss": -7.365848541259766, "global_step": 203595, "epoch": 4847} {"train_loss": -7.396578311920166, "global_step": 203596, "epoch": 4847} {"train_loss": -7.449043273925781, "global_step": 203597, "epoch": 4847} {"train_loss": -7.452627658843994, "global_step": 203598, "epoch": 4847} {"train_loss": -7.361466407775879, "global_step": 203599, "epoch": 4847} {"train_loss": -7.289013385772705, "global_step": 203600, "epoch": 4847} {"train_loss": -7.410588264465332, "global_step": 203601, "epoch": 4847} {"train_loss": -7.21101188659668, "global_step": 203602, "epoch": 4847} {"train_loss": -7.281005382537842, "global_step": 203603, "epoch": 4847} {"train_loss": -7.369758605957031, "global_step": 203604, "epoch": 4847} {"train_loss": -7.247175693511963, "global_step": 203605, "epoch": 4847} {"train_loss": -7.3871283531188965, "global_step": 203606, "epoch": 4847} {"train_loss": -7.290185928344727, "global_step": 203607, "epoch": 4847} {"train_loss": -7.274866104125977, "global_step": 203608, "epoch": 4847} {"train_loss": -7.248647689819336, "global_step": 203609, "epoch": 4847} {"train_loss": -7.360346794128418, "global_step": 203610, "epoch": 4847} {"train_loss": -7.393407821655273, "global_step": 203611, "epoch": 4847} {"train_loss": -7.321849822998047, "global_step": 203612, "epoch": 4847} {"train_loss": -7.217994689941406, "global_step": 203613, "epoch": 4847} {"train_loss": -7.309840679168701, "global_step": 203614, "epoch": 4847} {"train_loss": -7.3501894019898915, "global_step": 203615, "epoch": 4847, "val_loss": 81675.5546875} {"train_loss": -7.389996528625488, "global_step": 203616, "epoch": 4848} {"train_loss": -7.297156810760498, "global_step": 203617, "epoch": 4848} {"train_loss": -7.344600200653076, "global_step": 203618, "epoch": 4848} {"train_loss": -7.36777925491333, "global_step": 203619, "epoch": 4848} {"train_loss": -7.309785842895508, "global_step": 203620, "epoch": 4848} {"train_loss": -7.300407409667969, "global_step": 203621, "epoch": 4848} {"train_loss": -7.342108726501465, "global_step": 203622, "epoch": 4848} {"train_loss": -7.486417293548584, "global_step": 203623, "epoch": 4848} {"train_loss": -7.29514741897583, "global_step": 203624, "epoch": 4848} {"train_loss": -7.285247802734375, "global_step": 203625, "epoch": 4848} {"train_loss": -7.322856426239014, "global_step": 203626, "epoch": 4848} {"train_loss": -7.344714641571045, "global_step": 203627, "epoch": 4848} {"train_loss": -7.341303825378418, "global_step": 203628, "epoch": 4848} {"train_loss": -7.322659492492676, "global_step": 203629, "epoch": 4848} {"train_loss": -7.323141098022461, "global_step": 203630, "epoch": 4848} {"train_loss": -7.385133266448975, "global_step": 203631, "epoch": 4848} {"train_loss": -7.370528697967529, "global_step": 203632, "epoch": 4848} {"train_loss": -7.316557884216309, "global_step": 203633, "epoch": 4848} {"train_loss": -7.298123359680176, "global_step": 203634, "epoch": 4848} {"train_loss": -7.431001663208008, "global_step": 203635, "epoch": 4848} {"train_loss": -7.239444732666016, "global_step": 203636, "epoch": 4848} {"train_loss": -7.2372050285339355, "global_step": 203637, "epoch": 4848} {"train_loss": -7.312957286834717, "global_step": 203638, "epoch": 4848} {"train_loss": -7.3292412757873535, "global_step": 203639, "epoch": 4848} {"train_loss": -7.343201637268066, "global_step": 203640, "epoch": 4848} {"train_loss": -7.2275567054748535, "global_step": 203641, "epoch": 4848} {"train_loss": -7.2163591384887695, "global_step": 203642, "epoch": 4848} {"train_loss": -7.307697772979736, "global_step": 203643, "epoch": 4848} {"train_loss": -7.304713249206543, "global_step": 203644, "epoch": 4848} {"train_loss": -7.193000793457031, "global_step": 203645, "epoch": 4848} {"train_loss": -7.299637794494629, "global_step": 203646, "epoch": 4848} {"train_loss": -7.326133728027344, "global_step": 203647, "epoch": 4848} {"train_loss": -7.247566223144531, "global_step": 203648, "epoch": 4848} {"train_loss": -7.361011505126953, "global_step": 203649, "epoch": 4848} {"train_loss": -7.234821319580078, "global_step": 203650, "epoch": 4848} {"train_loss": -7.279090881347656, "global_step": 203651, "epoch": 4848} {"train_loss": -7.377161026000977, "global_step": 203652, "epoch": 4848} {"train_loss": -7.2274699211120605, "global_step": 203653, "epoch": 4848} {"train_loss": -7.370580673217773, "global_step": 203654, "epoch": 4848} {"train_loss": -7.363488674163818, "global_step": 203655, "epoch": 4848} {"train_loss": -7.458630561828613, "global_step": 203656, "epoch": 4848} {"train_loss": -7.32131502741859, "global_step": 203657, "epoch": 4848, "val_loss": 81745.7421875} {"train_loss": -7.3898725509643555, "global_step": 203658, "epoch": 4849} {"train_loss": -7.316780090332031, "global_step": 203659, "epoch": 4849} {"train_loss": -7.439262390136719, "global_step": 203660, "epoch": 4849} {"train_loss": -7.404046058654785, "global_step": 203661, "epoch": 4849} {"train_loss": -7.36327600479126, "global_step": 203662, "epoch": 4849} {"train_loss": -7.366231441497803, "global_step": 203663, "epoch": 4849} {"train_loss": -7.397615432739258, "global_step": 203664, "epoch": 4849} {"train_loss": -7.29746675491333, "global_step": 203665, "epoch": 4849} {"train_loss": -7.242275238037109, "global_step": 203666, "epoch": 4849} {"train_loss": -7.372124671936035, "global_step": 203667, "epoch": 4849} {"train_loss": -7.323686122894287, "global_step": 203668, "epoch": 4849} {"train_loss": -7.261897563934326, "global_step": 203669, "epoch": 4849} {"train_loss": -7.278002738952637, "global_step": 203670, "epoch": 4849} {"train_loss": -7.31585168838501, "global_step": 203671, "epoch": 4849} {"train_loss": -7.328134536743164, "global_step": 203672, "epoch": 4849} {"train_loss": -7.298949241638184, "global_step": 203673, "epoch": 4849} {"train_loss": -7.299435615539551, "global_step": 203674, "epoch": 4849} {"train_loss": -7.251143455505371, "global_step": 203675, "epoch": 4849} {"train_loss": -7.309540748596191, "global_step": 203676, "epoch": 4849} {"train_loss": -7.159887313842773, "global_step": 203677, "epoch": 4849} {"train_loss": -7.258807182312012, "global_step": 203678, "epoch": 4849} {"train_loss": -7.367380142211914, "global_step": 203679, "epoch": 4849} {"train_loss": -7.003627777099609, "global_step": 203680, "epoch": 4849} {"train_loss": -7.187224388122559, "global_step": 203681, "epoch": 4849} {"train_loss": -7.123316764831543, "global_step": 203682, "epoch": 4849} {"train_loss": -7.188914775848389, "global_step": 203683, "epoch": 4849} {"train_loss": -7.165366172790527, "global_step": 203684, "epoch": 4849} {"train_loss": -7.027618408203125, "global_step": 203685, "epoch": 4849} {"train_loss": -7.242687225341797, "global_step": 203686, "epoch": 4849} {"train_loss": -7.1200761795043945, "global_step": 203687, "epoch": 4849} {"train_loss": -7.267721652984619, "global_step": 203688, "epoch": 4849} {"train_loss": -7.239983081817627, "global_step": 203689, "epoch": 4849} {"train_loss": -7.282975196838379, "global_step": 203690, "epoch": 4849} {"train_loss": -7.06559944152832, "global_step": 203691, "epoch": 4849} {"train_loss": -7.265417575836182, "global_step": 203692, "epoch": 4849} {"train_loss": -7.249911308288574, "global_step": 203693, "epoch": 4849} {"train_loss": -7.237340927124023, "global_step": 203694, "epoch": 4849} {"train_loss": -7.201601505279541, "global_step": 203695, "epoch": 4849} {"train_loss": -7.331056594848633, "global_step": 203696, "epoch": 4849} {"train_loss": -7.335360527038574, "global_step": 203697, "epoch": 4849} {"train_loss": -7.2826995849609375, "global_step": 203698, "epoch": 4849} {"train_loss": -7.263094527380807, "global_step": 203699, "epoch": 4849, "val_loss": 81632.125} {"train_loss": -7.272967338562012, "global_step": 203700, "epoch": 4850} {"train_loss": -7.245462417602539, "global_step": 203701, "epoch": 4850} {"train_loss": -7.265527725219727, "global_step": 203702, "epoch": 4850} {"train_loss": -7.282168865203857, "global_step": 203703, "epoch": 4850} {"train_loss": -7.333918571472168, "global_step": 203704, "epoch": 4850} {"train_loss": -7.363008975982666, "global_step": 203705, "epoch": 4850} {"train_loss": -7.349608421325684, "global_step": 203706, "epoch": 4850} {"train_loss": -7.313049793243408, "global_step": 203707, "epoch": 4850} {"train_loss": -7.314316272735596, "global_step": 203708, "epoch": 4850} {"train_loss": -7.427191734313965, "global_step": 203709, "epoch": 4850} {"train_loss": -7.304999351501465, "global_step": 203710, "epoch": 4850} {"train_loss": -7.363776683807373, "global_step": 203711, "epoch": 4850} {"train_loss": -7.251056671142578, "global_step": 203712, "epoch": 4850} {"train_loss": -7.433017253875732, "global_step": 203713, "epoch": 4850} {"train_loss": -7.366265296936035, "global_step": 203714, "epoch": 4850} {"train_loss": -7.354404449462891, "global_step": 203715, "epoch": 4850} {"train_loss": -7.417980194091797, "global_step": 203716, "epoch": 4850} {"train_loss": -7.303802013397217, "global_step": 203717, "epoch": 4850} {"train_loss": -7.350640296936035, "global_step": 203718, "epoch": 4850} {"train_loss": -7.396585464477539, "global_step": 203719, "epoch": 4850} {"train_loss": -7.4054460525512695, "global_step": 203720, "epoch": 4850} {"train_loss": -7.3324432373046875, "global_step": 203721, "epoch": 4850} {"train_loss": -7.403054714202881, "global_step": 203722, "epoch": 4850} {"train_loss": -7.303361892700195, "global_step": 203723, "epoch": 4850} {"train_loss": -7.504505157470703, "global_step": 203724, "epoch": 4850} {"train_loss": -7.366150379180908, "global_step": 203725, "epoch": 4850} {"train_loss": -7.238861083984375, "global_step": 203726, "epoch": 4850} {"train_loss": -7.315877437591553, "global_step": 203727, "epoch": 4850} {"train_loss": -7.4108991622924805, "global_step": 203728, "epoch": 4850} {"train_loss": -7.497204303741455, "global_step": 203729, "epoch": 4850} {"train_loss": -7.304738998413086, "global_step": 203730, "epoch": 4850} {"train_loss": -7.324020862579346, "global_step": 203731, "epoch": 4850} {"train_loss": -7.366079330444336, "global_step": 203732, "epoch": 4850} {"train_loss": -7.312709331512451, "global_step": 203733, "epoch": 4850} {"train_loss": -7.28978157043457, "global_step": 203734, "epoch": 4850} {"train_loss": -7.265561103820801, "global_step": 203735, "epoch": 4850} {"train_loss": -7.382343292236328, "global_step": 203736, "epoch": 4850} {"train_loss": -7.290798187255859, "global_step": 203737, "epoch": 4850} {"train_loss": -7.329908847808838, "global_step": 203738, "epoch": 4850} {"train_loss": -7.340519905090332, "global_step": 203739, "epoch": 4850} {"train_loss": -7.331890106201172, "global_step": 203740, "epoch": 4850} {"train_loss": -7.342802127202352, "global_step": 203741, "epoch": 4850, "train/sim_max_reward_0": 0.19029749660605202, "train/sim_max_reward_1": 0.8598899861265553, "train/sim_max_reward_2": 0.34424340298032907, "train/sim_max_reward_3": 0.14529206005638912, "train/sim_max_reward_4": 0.5488397904897722, "train/sim_max_reward_5": 0.5631585724827122, "test/sim_max_reward_4500000": 0.4317290370468022, "test/sim_max_reward_4500001": 0.0, "test/sim_max_reward_4500002": 1.0, "test/sim_max_reward_4500003": 0.9342532027244959, "test/sim_max_reward_4500004": 0.08969914005977433, "test/sim_max_reward_4500005": 0.9364671280747466, "test/sim_max_reward_4500006": 0.8944806511628673, "test/sim_max_reward_4500007": 0.8725581417698361, "test/sim_max_reward_4500008": 0.0, "test/sim_max_reward_4500009": 0.05295262889345519, "test/sim_max_reward_4500010": 0.11110615384947994, "test/sim_max_reward_4500011": 0.9846427863434454, "test/sim_max_reward_4500012": 0.9925652485354461, "test/sim_max_reward_4500013": 0.005775420846401406, "test/sim_max_reward_4500014": 0.9841488083986062, "test/sim_max_reward_4500015": 0.9342951096777837, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.014927022836406534, "test/sim_max_reward_4500018": 0.9213473128910779, "test/sim_max_reward_4500019": 0.8780905798949308, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.8740151224705888, "test/sim_max_reward_4500022": 0.8979648085383936, "test/sim_max_reward_4500023": 1.0, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8744621475042014, "test/sim_max_reward_4500026": 0.3372198108730914, "test/sim_max_reward_4500027": 1.0, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.08325370435973072, "test/sim_max_reward_4500030": 0.8584178680471046, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.928306896843157, "test/sim_max_reward_4500034": 0.996566347501855, "test/sim_max_reward_4500035": 0.9858588247734681, "test/sim_max_reward_4500036": 0.9875485804280196, "test/sim_max_reward_4500037": 0.9178728946770847, "test/sim_max_reward_4500038": 0.3394000274782444, "test/sim_max_reward_4500039": 0.9305645477001203, "test/sim_max_reward_4500040": 0.9614145820336827, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.045820138013469215, "test/sim_max_reward_4500043": 0.5425362980495535, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.9378282582654947, "test/sim_max_reward_4500046": 0.18645253346500476, "test/sim_max_reward_4500047": 0.9791629582095228, "test/sim_max_reward_4500048": 0.9908437845768656, "test/sim_max_reward_4500049": 0.9466134872091175, "train/mean_score": 0.44195355145696835, "test/mean_score": 0.5978678620522547, "val_loss": 81750.4921875} {"train_loss": -7.406373500823975, "global_step": 203742, "epoch": 4851} {"train_loss": -7.302178382873535, "global_step": 203743, "epoch": 4851} {"train_loss": -7.43427848815918, "global_step": 203744, "epoch": 4851} {"train_loss": -7.333614826202393, "global_step": 203745, "epoch": 4851} {"train_loss": -7.300102710723877, "global_step": 203746, "epoch": 4851} {"train_loss": -7.4202399253845215, "global_step": 203747, "epoch": 4851} {"train_loss": -7.353721618652344, "global_step": 203748, "epoch": 4851} {"train_loss": -7.402131080627441, "global_step": 203749, "epoch": 4851} {"train_loss": -7.412774085998535, "global_step": 203750, "epoch": 4851} {"train_loss": -7.404395580291748, "global_step": 203751, "epoch": 4851} {"train_loss": -7.292978286743164, "global_step": 203752, "epoch": 4851} {"train_loss": -7.418481826782227, "global_step": 203753, "epoch": 4851} {"train_loss": -7.432600021362305, "global_step": 203754, "epoch": 4851} {"train_loss": -7.432648658752441, "global_step": 203755, "epoch": 4851} {"train_loss": -7.380898475646973, "global_step": 203756, "epoch": 4851} {"train_loss": -7.403731346130371, "global_step": 203757, "epoch": 4851} {"train_loss": -7.388485908508301, "global_step": 203758, "epoch": 4851} {"train_loss": -7.424005031585693, "global_step": 203759, "epoch": 4851} {"train_loss": -7.455563545227051, "global_step": 203760, "epoch": 4851} {"train_loss": -7.45635461807251, "global_step": 203761, "epoch": 4851} {"train_loss": -7.385219573974609, "global_step": 203762, "epoch": 4851} {"train_loss": -7.342479228973389, "global_step": 203763, "epoch": 4851} {"train_loss": -7.41096830368042, "global_step": 203764, "epoch": 4851} {"train_loss": -7.403437614440918, "global_step": 203765, "epoch": 4851} {"train_loss": -7.36515998840332, "global_step": 203766, "epoch": 4851} {"train_loss": -7.360291004180908, "global_step": 203767, "epoch": 4851} {"train_loss": -7.355498313903809, "global_step": 203768, "epoch": 4851} {"train_loss": -7.272279739379883, "global_step": 203769, "epoch": 4851} {"train_loss": -7.286487102508545, "global_step": 203770, "epoch": 4851} {"train_loss": -7.236198425292969, "global_step": 203771, "epoch": 4851} {"train_loss": -7.321946144104004, "global_step": 203772, "epoch": 4851} {"train_loss": -7.280889511108398, "global_step": 203773, "epoch": 4851} {"train_loss": -7.324577331542969, "global_step": 203774, "epoch": 4851} {"train_loss": -7.339118957519531, "global_step": 203775, "epoch": 4851} {"train_loss": -7.306199073791504, "global_step": 203776, "epoch": 4851} {"train_loss": -7.229741096496582, "global_step": 203777, "epoch": 4851} {"train_loss": -7.1683197021484375, "global_step": 203778, "epoch": 4851} {"train_loss": -7.182212829589844, "global_step": 203779, "epoch": 4851} {"train_loss": -7.31277322769165, "global_step": 203780, "epoch": 4851} {"train_loss": -7.360259532928467, "global_step": 203781, "epoch": 4851} {"train_loss": -7.255281925201416, "global_step": 203782, "epoch": 4851} {"train_loss": -7.347741263253348, "global_step": 203783, "epoch": 4851, "val_loss": 81446.78125} {"train_loss": -7.237851142883301, "global_step": 203784, "epoch": 4852} {"train_loss": -7.356771469116211, "global_step": 203785, "epoch": 4852} {"train_loss": -7.301851749420166, "global_step": 203786, "epoch": 4852} {"train_loss": -7.337092399597168, "global_step": 203787, "epoch": 4852} {"train_loss": -7.315973281860352, "global_step": 203788, "epoch": 4852} {"train_loss": -7.181924819946289, "global_step": 203789, "epoch": 4852} {"train_loss": -7.374299049377441, "global_step": 203790, "epoch": 4852} {"train_loss": -7.347681999206543, "global_step": 203791, "epoch": 4852} {"train_loss": -7.356309413909912, "global_step": 203792, "epoch": 4852} {"train_loss": -7.359811782836914, "global_step": 203793, "epoch": 4852} {"train_loss": -7.312793731689453, "global_step": 203794, "epoch": 4852} {"train_loss": -7.349710464477539, "global_step": 203795, "epoch": 4852} {"train_loss": -7.361523628234863, "global_step": 203796, "epoch": 4852} {"train_loss": -7.198996543884277, "global_step": 203797, "epoch": 4852} {"train_loss": -7.175107002258301, "global_step": 203798, "epoch": 4852} {"train_loss": -7.2248215675354, "global_step": 203799, "epoch": 4852} {"train_loss": -7.275565147399902, "global_step": 203800, "epoch": 4852} {"train_loss": -7.349700927734375, "global_step": 203801, "epoch": 4852} {"train_loss": -7.312893390655518, "global_step": 203802, "epoch": 4852} {"train_loss": -7.285255432128906, "global_step": 203803, "epoch": 4852} {"train_loss": -7.265689849853516, "global_step": 203804, "epoch": 4852} {"train_loss": -7.273897171020508, "global_step": 203805, "epoch": 4852} {"train_loss": -7.26627254486084, "global_step": 203806, "epoch": 4852} {"train_loss": -7.34427547454834, "global_step": 203807, "epoch": 4852} {"train_loss": -7.273396968841553, "global_step": 203808, "epoch": 4852} {"train_loss": -7.345835208892822, "global_step": 203809, "epoch": 4852} {"train_loss": -7.201951026916504, "global_step": 203810, "epoch": 4852} {"train_loss": -7.359193801879883, "global_step": 203811, "epoch": 4852} {"train_loss": -7.271371841430664, "global_step": 203812, "epoch": 4852} {"train_loss": -7.26768684387207, "global_step": 203813, "epoch": 4852} {"train_loss": -7.431203842163086, "global_step": 203814, "epoch": 4852} {"train_loss": -7.167901992797852, "global_step": 203815, "epoch": 4852} {"train_loss": -7.296399116516113, "global_step": 203816, "epoch": 4852} {"train_loss": -7.306041717529297, "global_step": 203817, "epoch": 4852} {"train_loss": -7.330953598022461, "global_step": 203818, "epoch": 4852} {"train_loss": -7.267415523529053, "global_step": 203819, "epoch": 4852} {"train_loss": -7.347260475158691, "global_step": 203820, "epoch": 4852} {"train_loss": -7.3316802978515625, "global_step": 203821, "epoch": 4852} {"train_loss": -7.212001323699951, "global_step": 203822, "epoch": 4852} {"train_loss": -7.387125015258789, "global_step": 203823, "epoch": 4852} {"train_loss": -7.335188865661621, "global_step": 203824, "epoch": 4852} {"train_loss": -7.3026330925169445, "global_step": 203825, "epoch": 4852, "val_loss": 81674.734375} {"train_loss": -7.206211090087891, "global_step": 203826, "epoch": 4853} {"train_loss": -7.365324020385742, "global_step": 203827, "epoch": 4853} {"train_loss": -7.432893753051758, "global_step": 203828, "epoch": 4853} {"train_loss": -7.3626508712768555, "global_step": 203829, "epoch": 4853} {"train_loss": -7.377516269683838, "global_step": 203830, "epoch": 4853} {"train_loss": -7.3973002433776855, "global_step": 203831, "epoch": 4853} {"train_loss": -7.386033058166504, "global_step": 203832, "epoch": 4853} {"train_loss": -7.4176554679870605, "global_step": 203833, "epoch": 4853} {"train_loss": -7.37244176864624, "global_step": 203834, "epoch": 4853} {"train_loss": -7.397406101226807, "global_step": 203835, "epoch": 4853} {"train_loss": -7.372399806976318, "global_step": 203836, "epoch": 4853} {"train_loss": -7.194438457489014, "global_step": 203837, "epoch": 4853} {"train_loss": -7.275854110717773, "global_step": 203838, "epoch": 4853} {"train_loss": -7.266112327575684, "global_step": 203839, "epoch": 4853} {"train_loss": -7.191896438598633, "global_step": 203840, "epoch": 4853} {"train_loss": -7.228856563568115, "global_step": 203841, "epoch": 4853} {"train_loss": -7.372101783752441, "global_step": 203842, "epoch": 4853} {"train_loss": -7.285682678222656, "global_step": 203843, "epoch": 4853} {"train_loss": -7.1705732345581055, "global_step": 203844, "epoch": 4853} {"train_loss": -7.326100826263428, "global_step": 203845, "epoch": 4853} {"train_loss": -7.138820648193359, "global_step": 203846, "epoch": 4853} {"train_loss": -7.226982116699219, "global_step": 203847, "epoch": 4853} {"train_loss": -7.158365249633789, "global_step": 203848, "epoch": 4853} {"train_loss": -7.090590000152588, "global_step": 203849, "epoch": 4853} {"train_loss": -7.347345352172852, "global_step": 203850, "epoch": 4853} {"train_loss": -7.219635009765625, "global_step": 203851, "epoch": 4853} {"train_loss": -7.126530647277832, "global_step": 203852, "epoch": 4853} {"train_loss": -7.106865882873535, "global_step": 203853, "epoch": 4853} {"train_loss": -7.21486759185791, "global_step": 203854, "epoch": 4853} {"train_loss": -7.173644542694092, "global_step": 203855, "epoch": 4853} {"train_loss": -7.150808811187744, "global_step": 203856, "epoch": 4853} {"train_loss": -7.35328483581543, "global_step": 203857, "epoch": 4853} {"train_loss": -7.285483360290527, "global_step": 203858, "epoch": 4853} {"train_loss": -7.283390522003174, "global_step": 203859, "epoch": 4853} {"train_loss": -7.318878173828125, "global_step": 203860, "epoch": 4853} {"train_loss": -7.331544876098633, "global_step": 203861, "epoch": 4853} {"train_loss": -7.27025032043457, "global_step": 203862, "epoch": 4853} {"train_loss": -7.33586311340332, "global_step": 203863, "epoch": 4853} {"train_loss": -7.286012649536133, "global_step": 203864, "epoch": 4853} {"train_loss": -7.3090386390686035, "global_step": 203865, "epoch": 4853} {"train_loss": -7.3336992263793945, "global_step": 203866, "epoch": 4853} {"train_loss": -7.281157822836013, "global_step": 203867, "epoch": 4853, "val_loss": 81824.9140625} {"train_loss": -7.308114051818848, "global_step": 203868, "epoch": 4854} {"train_loss": -7.330491542816162, "global_step": 203869, "epoch": 4854} {"train_loss": -7.236339092254639, "global_step": 203870, "epoch": 4854} {"train_loss": -7.46743106842041, "global_step": 203871, "epoch": 4854} {"train_loss": -7.414752006530762, "global_step": 203872, "epoch": 4854} {"train_loss": -7.2118120193481445, "global_step": 203873, "epoch": 4854} {"train_loss": -7.161700248718262, "global_step": 203874, "epoch": 4854} {"train_loss": -7.386222839355469, "global_step": 203875, "epoch": 4854} {"train_loss": -7.2504448890686035, "global_step": 203876, "epoch": 4854} {"train_loss": -7.46354341506958, "global_step": 203877, "epoch": 4854} {"train_loss": -7.281712532043457, "global_step": 203878, "epoch": 4854} {"train_loss": -7.252470970153809, "global_step": 203879, "epoch": 4854} {"train_loss": -7.405795097351074, "global_step": 203880, "epoch": 4854} {"train_loss": -7.305650234222412, "global_step": 203881, "epoch": 4854} {"train_loss": -7.266818523406982, "global_step": 203882, "epoch": 4854} {"train_loss": -7.429657936096191, "global_step": 203883, "epoch": 4854} {"train_loss": -7.331989288330078, "global_step": 203884, "epoch": 4854} {"train_loss": -7.212360382080078, "global_step": 203885, "epoch": 4854} {"train_loss": -7.382931232452393, "global_step": 203886, "epoch": 4854} {"train_loss": -7.320344924926758, "global_step": 203887, "epoch": 4854} {"train_loss": -7.329163074493408, "global_step": 203888, "epoch": 4854} {"train_loss": -7.308714866638184, "global_step": 203889, "epoch": 4854} {"train_loss": -7.312191009521484, "global_step": 203890, "epoch": 4854} {"train_loss": -7.4024858474731445, "global_step": 203891, "epoch": 4854} {"train_loss": -7.356522560119629, "global_step": 203892, "epoch": 4854} {"train_loss": -7.186977386474609, "global_step": 203893, "epoch": 4854} {"train_loss": -7.338802814483643, "global_step": 203894, "epoch": 4854} {"train_loss": -7.360654354095459, "global_step": 203895, "epoch": 4854} {"train_loss": -7.35918664932251, "global_step": 203896, "epoch": 4854} {"train_loss": -7.331839561462402, "global_step": 203897, "epoch": 4854} {"train_loss": -7.156911849975586, "global_step": 203898, "epoch": 4854} {"train_loss": -7.227770805358887, "global_step": 203899, "epoch": 4854} {"train_loss": -7.333416938781738, "global_step": 203900, "epoch": 4854} {"train_loss": -7.266146659851074, "global_step": 203901, "epoch": 4854} {"train_loss": -7.296669006347656, "global_step": 203902, "epoch": 4854} {"train_loss": -7.211616516113281, "global_step": 203903, "epoch": 4854} {"train_loss": -7.1274285316467285, "global_step": 203904, "epoch": 4854} {"train_loss": -7.437361717224121, "global_step": 203905, "epoch": 4854} {"train_loss": -7.322235107421875, "global_step": 203906, "epoch": 4854} {"train_loss": -7.223865032196045, "global_step": 203907, "epoch": 4854} {"train_loss": -7.176122188568115, "global_step": 203908, "epoch": 4854} {"train_loss": -7.303814649581909, "global_step": 203909, "epoch": 4854, "val_loss": 81634.0546875} {"train_loss": -7.32795524597168, "global_step": 203910, "epoch": 4855} {"train_loss": -7.287723064422607, "global_step": 203911, "epoch": 4855} {"train_loss": -7.200056076049805, "global_step": 203912, "epoch": 4855} {"train_loss": -7.149895668029785, "global_step": 203913, "epoch": 4855} {"train_loss": -7.309337139129639, "global_step": 203914, "epoch": 4855} {"train_loss": -7.321552753448486, "global_step": 203915, "epoch": 4855} {"train_loss": -7.340216636657715, "global_step": 203916, "epoch": 4855} {"train_loss": -7.380650520324707, "global_step": 203917, "epoch": 4855} {"train_loss": -7.284483909606934, "global_step": 203918, "epoch": 4855} {"train_loss": -7.388902187347412, "global_step": 203919, "epoch": 4855} {"train_loss": -7.252958297729492, "global_step": 203920, "epoch": 4855} {"train_loss": -7.232761383056641, "global_step": 203921, "epoch": 4855} {"train_loss": -7.432913780212402, "global_step": 203922, "epoch": 4855} {"train_loss": -7.260066509246826, "global_step": 203923, "epoch": 4855} {"train_loss": -7.395725727081299, "global_step": 203924, "epoch": 4855} {"train_loss": -7.306413650512695, "global_step": 203925, "epoch": 4855} {"train_loss": -7.313107490539551, "global_step": 203926, "epoch": 4855} {"train_loss": -7.396721363067627, "global_step": 203927, "epoch": 4855} {"train_loss": -7.3144850730896, "global_step": 203928, "epoch": 4855} {"train_loss": -7.255081653594971, "global_step": 203929, "epoch": 4855} {"train_loss": -7.326196670532227, "global_step": 203930, "epoch": 4855} {"train_loss": -7.277663230895996, "global_step": 203931, "epoch": 4855} {"train_loss": -7.385977745056152, "global_step": 203932, "epoch": 4855} {"train_loss": -7.303189754486084, "global_step": 203933, "epoch": 4855} {"train_loss": -7.389369964599609, "global_step": 203934, "epoch": 4855} {"train_loss": -7.355397701263428, "global_step": 203935, "epoch": 4855} {"train_loss": -7.307609558105469, "global_step": 203936, "epoch": 4855} {"train_loss": -7.358654975891113, "global_step": 203937, "epoch": 4855} {"train_loss": -7.356130599975586, "global_step": 203938, "epoch": 4855} {"train_loss": -7.493313789367676, "global_step": 203939, "epoch": 4855} {"train_loss": -7.406668186187744, "global_step": 203940, "epoch": 4855} {"train_loss": -7.274755954742432, "global_step": 203941, "epoch": 4855} {"train_loss": -7.342981338500977, "global_step": 203942, "epoch": 4855} {"train_loss": -7.33588981628418, "global_step": 203943, "epoch": 4855} {"train_loss": -7.418906211853027, "global_step": 203944, "epoch": 4855} {"train_loss": -7.3261613845825195, "global_step": 203945, "epoch": 4855} {"train_loss": -7.440230369567871, "global_step": 203946, "epoch": 4855} {"train_loss": -7.255667686462402, "global_step": 203947, "epoch": 4855} {"train_loss": -7.344689846038818, "global_step": 203948, "epoch": 4855} {"train_loss": -7.308437824249268, "global_step": 203949, "epoch": 4855} {"train_loss": -7.33050537109375, "global_step": 203950, "epoch": 4855} {"train_loss": -7.327127309072585, "global_step": 203951, "epoch": 4855, "val_loss": 81818.5625} {"train_loss": -7.301605224609375, "global_step": 203952, "epoch": 4856} {"train_loss": -7.267337799072266, "global_step": 203953, "epoch": 4856} {"train_loss": -7.153819561004639, "global_step": 203954, "epoch": 4856} {"train_loss": -7.323521614074707, "global_step": 203955, "epoch": 4856} {"train_loss": -7.222312927246094, "global_step": 203956, "epoch": 4856} {"train_loss": -7.1002960205078125, "global_step": 203957, "epoch": 4856} {"train_loss": -7.226789474487305, "global_step": 203958, "epoch": 4856} {"train_loss": -7.120689392089844, "global_step": 203959, "epoch": 4856} {"train_loss": -7.199048042297363, "global_step": 203960, "epoch": 4856} {"train_loss": -7.292389392852783, "global_step": 203961, "epoch": 4856} {"train_loss": -7.128607273101807, "global_step": 203962, "epoch": 4856} {"train_loss": -7.314112663269043, "global_step": 203963, "epoch": 4856} {"train_loss": -7.183994770050049, "global_step": 203964, "epoch": 4856} {"train_loss": -7.329126358032227, "global_step": 203965, "epoch": 4856} {"train_loss": -7.192165851593018, "global_step": 203966, "epoch": 4856} {"train_loss": -7.222519874572754, "global_step": 203967, "epoch": 4856} {"train_loss": -7.155166149139404, "global_step": 203968, "epoch": 4856} {"train_loss": -7.271173477172852, "global_step": 203969, "epoch": 4856} {"train_loss": -7.399833679199219, "global_step": 203970, "epoch": 4856} {"train_loss": -7.284177780151367, "global_step": 203971, "epoch": 4856} {"train_loss": -7.306743621826172, "global_step": 203972, "epoch": 4856} {"train_loss": -7.255941867828369, "global_step": 203973, "epoch": 4856} {"train_loss": -7.224799156188965, "global_step": 203974, "epoch": 4856} {"train_loss": -7.327215194702148, "global_step": 203975, "epoch": 4856} {"train_loss": -7.280750274658203, "global_step": 203976, "epoch": 4856} {"train_loss": -7.182515621185303, "global_step": 203977, "epoch": 4856} {"train_loss": -7.26214075088501, "global_step": 203978, "epoch": 4856} {"train_loss": -7.270829200744629, "global_step": 203979, "epoch": 4856} {"train_loss": -7.2583513259887695, "global_step": 203980, "epoch": 4856} {"train_loss": -7.246119022369385, "global_step": 203981, "epoch": 4856} {"train_loss": -7.389078140258789, "global_step": 203982, "epoch": 4856} {"train_loss": -7.33134126663208, "global_step": 203983, "epoch": 4856} {"train_loss": -7.342080593109131, "global_step": 203984, "epoch": 4856} {"train_loss": -7.321471214294434, "global_step": 203985, "epoch": 4856} {"train_loss": -7.222054481506348, "global_step": 203986, "epoch": 4856} {"train_loss": -7.252694606781006, "global_step": 203987, "epoch": 4856} {"train_loss": -7.302835464477539, "global_step": 203988, "epoch": 4856} {"train_loss": -7.306138515472412, "global_step": 203989, "epoch": 4856} {"train_loss": -7.251728057861328, "global_step": 203990, "epoch": 4856} {"train_loss": -7.240948677062988, "global_step": 203991, "epoch": 4856} {"train_loss": -7.170774459838867, "global_step": 203992, "epoch": 4856} {"train_loss": -7.258148624783471, "global_step": 203993, "epoch": 4856, "val_loss": 81650.1015625} {"train_loss": -7.33226203918457, "global_step": 203994, "epoch": 4857} {"train_loss": -7.135977745056152, "global_step": 203995, "epoch": 4857} {"train_loss": -7.203118801116943, "global_step": 203996, "epoch": 4857} {"train_loss": -7.257113456726074, "global_step": 203997, "epoch": 4857} {"train_loss": -7.049340724945068, "global_step": 203998, "epoch": 4857} {"train_loss": -7.234392166137695, "global_step": 203999, "epoch": 4857} {"train_loss": -7.302787780761719, "global_step": 204000, "epoch": 4857} {"train_loss": -7.215242385864258, "global_step": 204001, "epoch": 4857} {"train_loss": -7.198676109313965, "global_step": 204002, "epoch": 4857} {"train_loss": -7.355031967163086, "global_step": 204003, "epoch": 4857} {"train_loss": -7.185384750366211, "global_step": 204004, "epoch": 4857} {"train_loss": -7.213204383850098, "global_step": 204005, "epoch": 4857} {"train_loss": -7.341168403625488, "global_step": 204006, "epoch": 4857} {"train_loss": -7.303033828735352, "global_step": 204007, "epoch": 4857} {"train_loss": -7.222448348999023, "global_step": 204008, "epoch": 4857} {"train_loss": -7.211877346038818, "global_step": 204009, "epoch": 4857} {"train_loss": -7.270829200744629, "global_step": 204010, "epoch": 4857} {"train_loss": -7.242866039276123, "global_step": 204011, "epoch": 4857} {"train_loss": -7.300720691680908, "global_step": 204012, "epoch": 4857} {"train_loss": -7.344797134399414, "global_step": 204013, "epoch": 4857} {"train_loss": -7.393795490264893, "global_step": 204014, "epoch": 4857} {"train_loss": -7.375273704528809, "global_step": 204015, "epoch": 4857} {"train_loss": -7.331128120422363, "global_step": 204016, "epoch": 4857} {"train_loss": -7.36451530456543, "global_step": 204017, "epoch": 4857} {"train_loss": -7.251827239990234, "global_step": 204018, "epoch": 4857} {"train_loss": -7.333268165588379, "global_step": 204019, "epoch": 4857} {"train_loss": -7.214022636413574, "global_step": 204020, "epoch": 4857} {"train_loss": -7.220965385437012, "global_step": 204021, "epoch": 4857} {"train_loss": -7.431584358215332, "global_step": 204022, "epoch": 4857} {"train_loss": -7.295250415802002, "global_step": 204023, "epoch": 4857} {"train_loss": -7.369474411010742, "global_step": 204024, "epoch": 4857} {"train_loss": -7.173626899719238, "global_step": 204025, "epoch": 4857} {"train_loss": -7.3624348640441895, "global_step": 204026, "epoch": 4857} {"train_loss": -7.37476921081543, "global_step": 204027, "epoch": 4857} {"train_loss": -7.324841499328613, "global_step": 204028, "epoch": 4857} {"train_loss": -7.374635696411133, "global_step": 204029, "epoch": 4857} {"train_loss": -7.370579719543457, "global_step": 204030, "epoch": 4857} {"train_loss": -7.376090049743652, "global_step": 204031, "epoch": 4857} {"train_loss": -7.431478500366211, "global_step": 204032, "epoch": 4857} {"train_loss": -7.327983379364014, "global_step": 204033, "epoch": 4857} {"train_loss": -7.355316162109375, "global_step": 204034, "epoch": 4857} {"train_loss": -7.2923165162404375, "global_step": 204035, "epoch": 4857, "val_loss": 81416.2734375} {"train_loss": -7.354543685913086, "global_step": 204036, "epoch": 4858} {"train_loss": -7.494659900665283, "global_step": 204037, "epoch": 4858} {"train_loss": -7.338604927062988, "global_step": 204038, "epoch": 4858} {"train_loss": -7.408787250518799, "global_step": 204039, "epoch": 4858} {"train_loss": -7.425430774688721, "global_step": 204040, "epoch": 4858} {"train_loss": -7.398813247680664, "global_step": 204041, "epoch": 4858} {"train_loss": -7.350365161895752, "global_step": 204042, "epoch": 4858} {"train_loss": -7.354966163635254, "global_step": 204043, "epoch": 4858} {"train_loss": -7.382137298583984, "global_step": 204044, "epoch": 4858} {"train_loss": -7.41862678527832, "global_step": 204045, "epoch": 4858} {"train_loss": -7.300976753234863, "global_step": 204046, "epoch": 4858} {"train_loss": -7.442517280578613, "global_step": 204047, "epoch": 4858} {"train_loss": -7.324929714202881, "global_step": 204048, "epoch": 4858} {"train_loss": -7.37868595123291, "global_step": 204049, "epoch": 4858} {"train_loss": -7.3298845291137695, "global_step": 204050, "epoch": 4858} {"train_loss": -7.274869918823242, "global_step": 204051, "epoch": 4858} {"train_loss": -7.450509071350098, "global_step": 204052, "epoch": 4858} {"train_loss": -7.319777488708496, "global_step": 204053, "epoch": 4858} {"train_loss": -7.228228569030762, "global_step": 204054, "epoch": 4858} {"train_loss": -7.203616142272949, "global_step": 204055, "epoch": 4858} {"train_loss": -7.337906837463379, "global_step": 204056, "epoch": 4858} {"train_loss": -7.300686836242676, "global_step": 204057, "epoch": 4858} {"train_loss": -7.3419084548950195, "global_step": 204058, "epoch": 4858} {"train_loss": -7.423525810241699, "global_step": 204059, "epoch": 4858} {"train_loss": -7.342023849487305, "global_step": 204060, "epoch": 4858} {"train_loss": -7.353315353393555, "global_step": 204061, "epoch": 4858} {"train_loss": -7.263062953948975, "global_step": 204062, "epoch": 4858} {"train_loss": -7.356925964355469, "global_step": 204063, "epoch": 4858} {"train_loss": -7.362762451171875, "global_step": 204064, "epoch": 4858} {"train_loss": -7.233925819396973, "global_step": 204065, "epoch": 4858} {"train_loss": -7.148592472076416, "global_step": 204066, "epoch": 4858} {"train_loss": -7.25567102432251, "global_step": 204067, "epoch": 4858} {"train_loss": -7.248644828796387, "global_step": 204068, "epoch": 4858} {"train_loss": -7.233394622802734, "global_step": 204069, "epoch": 4858} {"train_loss": -7.146357536315918, "global_step": 204070, "epoch": 4858} {"train_loss": -7.344691276550293, "global_step": 204071, "epoch": 4858} {"train_loss": -7.252307415008545, "global_step": 204072, "epoch": 4858} {"train_loss": -7.1547346115112305, "global_step": 204073, "epoch": 4858} {"train_loss": -7.175492763519287, "global_step": 204074, "epoch": 4858} {"train_loss": -7.234560012817383, "global_step": 204075, "epoch": 4858} {"train_loss": -7.383534908294678, "global_step": 204076, "epoch": 4858} {"train_loss": -7.319124142328898, "global_step": 204077, "epoch": 4858, "val_loss": 81802.1328125} {"train_loss": -7.359455108642578, "global_step": 204078, "epoch": 4859} {"train_loss": -7.331898212432861, "global_step": 204079, "epoch": 4859} {"train_loss": -7.3359527587890625, "global_step": 204080, "epoch": 4859} {"train_loss": -7.399935722351074, "global_step": 204081, "epoch": 4859} {"train_loss": -7.308241844177246, "global_step": 204082, "epoch": 4859} {"train_loss": -7.3904523849487305, "global_step": 204083, "epoch": 4859} {"train_loss": -7.272257328033447, "global_step": 204084, "epoch": 4859} {"train_loss": -7.155387878417969, "global_step": 204085, "epoch": 4859} {"train_loss": -7.382521152496338, "global_step": 204086, "epoch": 4859} {"train_loss": -7.308468818664551, "global_step": 204087, "epoch": 4859} {"train_loss": -7.179403781890869, "global_step": 204088, "epoch": 4859} {"train_loss": -7.257180213928223, "global_step": 204089, "epoch": 4859} {"train_loss": -7.013948917388916, "global_step": 204090, "epoch": 4859} {"train_loss": -7.426741600036621, "global_step": 204091, "epoch": 4859} {"train_loss": -7.138337135314941, "global_step": 204092, "epoch": 4859} {"train_loss": -7.136398792266846, "global_step": 204093, "epoch": 4859} {"train_loss": -7.27578592300415, "global_step": 204094, "epoch": 4859} {"train_loss": -7.123589515686035, "global_step": 204095, "epoch": 4859} {"train_loss": -7.196678638458252, "global_step": 204096, "epoch": 4859} {"train_loss": -7.290435791015625, "global_step": 204097, "epoch": 4859} {"train_loss": -7.239974498748779, "global_step": 204098, "epoch": 4859} {"train_loss": -7.1683149337768555, "global_step": 204099, "epoch": 4859} {"train_loss": -7.234204292297363, "global_step": 204100, "epoch": 4859} {"train_loss": -7.254485607147217, "global_step": 204101, "epoch": 4859} {"train_loss": -7.23764181137085, "global_step": 204102, "epoch": 4859} {"train_loss": -7.206310272216797, "global_step": 204103, "epoch": 4859} {"train_loss": -7.341056823730469, "global_step": 204104, "epoch": 4859} {"train_loss": -7.353613376617432, "global_step": 204105, "epoch": 4859} {"train_loss": -7.353721618652344, "global_step": 204106, "epoch": 4859} {"train_loss": -7.282557487487793, "global_step": 204107, "epoch": 4859} {"train_loss": -7.140384674072266, "global_step": 204108, "epoch": 4859} {"train_loss": -7.3616862297058105, "global_step": 204109, "epoch": 4859} {"train_loss": -7.4346442222595215, "global_step": 204110, "epoch": 4859} {"train_loss": -7.244713306427002, "global_step": 204111, "epoch": 4859} {"train_loss": -7.301898002624512, "global_step": 204112, "epoch": 4859} {"train_loss": -7.300357818603516, "global_step": 204113, "epoch": 4859} {"train_loss": -7.324855804443359, "global_step": 204114, "epoch": 4859} {"train_loss": -7.340481758117676, "global_step": 204115, "epoch": 4859} {"train_loss": -7.290256023406982, "global_step": 204116, "epoch": 4859} {"train_loss": -7.23525333404541, "global_step": 204117, "epoch": 4859} {"train_loss": -7.266125679016113, "global_step": 204118, "epoch": 4859} {"train_loss": -7.275214320137387, "global_step": 204119, "epoch": 4859, "val_loss": 81640.171875} {"train_loss": -7.189833641052246, "global_step": 204120, "epoch": 4860} {"train_loss": -7.4740071296691895, "global_step": 204121, "epoch": 4860} {"train_loss": -7.288788795471191, "global_step": 204122, "epoch": 4860} {"train_loss": -7.357824325561523, "global_step": 204123, "epoch": 4860} {"train_loss": -7.342868804931641, "global_step": 204124, "epoch": 4860} {"train_loss": -7.329267501831055, "global_step": 204125, "epoch": 4860} {"train_loss": -7.367819786071777, "global_step": 204126, "epoch": 4860} {"train_loss": -7.421465873718262, "global_step": 204127, "epoch": 4860} {"train_loss": -7.404209136962891, "global_step": 204128, "epoch": 4860} {"train_loss": -7.404836654663086, "global_step": 204129, "epoch": 4860} {"train_loss": -7.326967716217041, "global_step": 204130, "epoch": 4860} {"train_loss": -7.351615905761719, "global_step": 204131, "epoch": 4860} {"train_loss": -7.461611747741699, "global_step": 204132, "epoch": 4860} {"train_loss": -7.399932861328125, "global_step": 204133, "epoch": 4860} {"train_loss": -7.422432899475098, "global_step": 204134, "epoch": 4860} {"train_loss": -7.3402204513549805, "global_step": 204135, "epoch": 4860} {"train_loss": -7.401534080505371, "global_step": 204136, "epoch": 4860} {"train_loss": -7.408677577972412, "global_step": 204137, "epoch": 4860} {"train_loss": -7.363800048828125, "global_step": 204138, "epoch": 4860} {"train_loss": -7.437949180603027, "global_step": 204139, "epoch": 4860} {"train_loss": -7.267450332641602, "global_step": 204140, "epoch": 4860} {"train_loss": -7.323177337646484, "global_step": 204141, "epoch": 4860} {"train_loss": -7.372772216796875, "global_step": 204142, "epoch": 4860} {"train_loss": -7.399240016937256, "global_step": 204143, "epoch": 4860} {"train_loss": -7.4028706550598145, "global_step": 204144, "epoch": 4860} {"train_loss": -7.4016828536987305, "global_step": 204145, "epoch": 4860} {"train_loss": -7.30983829498291, "global_step": 204146, "epoch": 4860} {"train_loss": -7.392634391784668, "global_step": 204147, "epoch": 4860} {"train_loss": -7.343351364135742, "global_step": 204148, "epoch": 4860} {"train_loss": -7.359858512878418, "global_step": 204149, "epoch": 4860} {"train_loss": -7.345099449157715, "global_step": 204150, "epoch": 4860} {"train_loss": -7.383069038391113, "global_step": 204151, "epoch": 4860} {"train_loss": -7.390069961547852, "global_step": 204152, "epoch": 4860} {"train_loss": -7.318973064422607, "global_step": 204153, "epoch": 4860} {"train_loss": -7.185455799102783, "global_step": 204154, "epoch": 4860} {"train_loss": -7.275869846343994, "global_step": 204155, "epoch": 4860} {"train_loss": -7.1896281242370605, "global_step": 204156, "epoch": 4860} {"train_loss": -7.285431385040283, "global_step": 204157, "epoch": 4860} {"train_loss": -7.152114391326904, "global_step": 204158, "epoch": 4860} {"train_loss": -7.3118109703063965, "global_step": 204159, "epoch": 4860} {"train_loss": -7.163150787353516, "global_step": 204160, "epoch": 4860} {"train_loss": -7.3428330307915095, "global_step": 204161, "epoch": 4860, "val_loss": 81605.484375} {"train_loss": -7.1655778884887695, "global_step": 204162, "epoch": 4861} {"train_loss": -7.147561073303223, "global_step": 204163, "epoch": 4861} {"train_loss": -7.305257797241211, "global_step": 204164, "epoch": 4861} {"train_loss": -7.141298294067383, "global_step": 204165, "epoch": 4861} {"train_loss": -7.185083389282227, "global_step": 204166, "epoch": 4861} {"train_loss": -7.348862171173096, "global_step": 204167, "epoch": 4861} {"train_loss": -7.168467998504639, "global_step": 204168, "epoch": 4861} {"train_loss": -7.290985584259033, "global_step": 204169, "epoch": 4861} {"train_loss": -7.255424499511719, "global_step": 204170, "epoch": 4861} {"train_loss": -7.212526321411133, "global_step": 204171, "epoch": 4861} {"train_loss": -7.255866527557373, "global_step": 204172, "epoch": 4861} {"train_loss": -7.30433464050293, "global_step": 204173, "epoch": 4861} {"train_loss": -7.445618629455566, "global_step": 204174, "epoch": 4861} {"train_loss": -7.267467498779297, "global_step": 204175, "epoch": 4861} {"train_loss": -7.350373268127441, "global_step": 204176, "epoch": 4861} {"train_loss": -7.2322797775268555, "global_step": 204177, "epoch": 4861} {"train_loss": -7.349761486053467, "global_step": 204178, "epoch": 4861} {"train_loss": -7.396676540374756, "global_step": 204179, "epoch": 4861} {"train_loss": -7.376035213470459, "global_step": 204180, "epoch": 4861} {"train_loss": -7.3167009353637695, "global_step": 204181, "epoch": 4861} {"train_loss": -7.387263298034668, "global_step": 204182, "epoch": 4861} {"train_loss": -7.3658952713012695, "global_step": 204183, "epoch": 4861} {"train_loss": -7.354907035827637, "global_step": 204184, "epoch": 4861} {"train_loss": -7.347311973571777, "global_step": 204185, "epoch": 4861} {"train_loss": -7.3524980545043945, "global_step": 204186, "epoch": 4861} {"train_loss": -7.285181045532227, "global_step": 204187, "epoch": 4861} {"train_loss": -7.312930583953857, "global_step": 204188, "epoch": 4861} {"train_loss": -7.357297897338867, "global_step": 204189, "epoch": 4861} {"train_loss": -7.405150413513184, "global_step": 204190, "epoch": 4861} {"train_loss": -7.259350299835205, "global_step": 204191, "epoch": 4861} {"train_loss": -7.403058052062988, "global_step": 204192, "epoch": 4861} {"train_loss": -7.408393383026123, "global_step": 204193, "epoch": 4861} {"train_loss": -7.378486633300781, "global_step": 204194, "epoch": 4861} {"train_loss": -7.324952125549316, "global_step": 204195, "epoch": 4861} {"train_loss": -7.339107990264893, "global_step": 204196, "epoch": 4861} {"train_loss": -7.368487358093262, "global_step": 204197, "epoch": 4861} {"train_loss": -7.377998352050781, "global_step": 204198, "epoch": 4861} {"train_loss": -7.303280830383301, "global_step": 204199, "epoch": 4861} {"train_loss": -7.236767768859863, "global_step": 204200, "epoch": 4861} {"train_loss": -7.296011924743652, "global_step": 204201, "epoch": 4861} {"train_loss": -7.296077728271484, "global_step": 204202, "epoch": 4861} {"train_loss": -7.3093948023659845, "global_step": 204203, "epoch": 4861, "val_loss": 81750.0859375} {"train_loss": -7.436504364013672, "global_step": 204204, "epoch": 4862} {"train_loss": -7.253567695617676, "global_step": 204205, "epoch": 4862} {"train_loss": -7.361419677734375, "global_step": 204206, "epoch": 4862} {"train_loss": -7.293232440948486, "global_step": 204207, "epoch": 4862} {"train_loss": -7.354608058929443, "global_step": 204208, "epoch": 4862} {"train_loss": -7.410383224487305, "global_step": 204209, "epoch": 4862} {"train_loss": -7.290992736816406, "global_step": 204210, "epoch": 4862} {"train_loss": -7.3556413650512695, "global_step": 204211, "epoch": 4862} {"train_loss": -7.249732494354248, "global_step": 204212, "epoch": 4862} {"train_loss": -7.321911811828613, "global_step": 204213, "epoch": 4862} {"train_loss": -7.396651268005371, "global_step": 204214, "epoch": 4862} {"train_loss": -7.253902435302734, "global_step": 204215, "epoch": 4862} {"train_loss": -7.351946830749512, "global_step": 204216, "epoch": 4862} {"train_loss": -7.376601219177246, "global_step": 204217, "epoch": 4862} {"train_loss": -7.281890869140625, "global_step": 204218, "epoch": 4862} {"train_loss": -7.347535133361816, "global_step": 204219, "epoch": 4862} {"train_loss": -7.231870174407959, "global_step": 204220, "epoch": 4862} {"train_loss": -7.225290775299072, "global_step": 204221, "epoch": 4862} {"train_loss": -7.3379716873168945, "global_step": 204222, "epoch": 4862} {"train_loss": -7.349137306213379, "global_step": 204223, "epoch": 4862} {"train_loss": -7.390707015991211, "global_step": 204224, "epoch": 4862} {"train_loss": -7.370934009552002, "global_step": 204225, "epoch": 4862} {"train_loss": -7.256942272186279, "global_step": 204226, "epoch": 4862} {"train_loss": -7.441071510314941, "global_step": 204227, "epoch": 4862} {"train_loss": -7.24782657623291, "global_step": 204228, "epoch": 4862} {"train_loss": -7.371669769287109, "global_step": 204229, "epoch": 4862} {"train_loss": -7.2225823402404785, "global_step": 204230, "epoch": 4862} {"train_loss": -7.284157752990723, "global_step": 204231, "epoch": 4862} {"train_loss": -7.4184112548828125, "global_step": 204232, "epoch": 4862} {"train_loss": -7.422907829284668, "global_step": 204233, "epoch": 4862} {"train_loss": -7.309554100036621, "global_step": 204234, "epoch": 4862} {"train_loss": -7.343987464904785, "global_step": 204235, "epoch": 4862} {"train_loss": -7.2378034591674805, "global_step": 204236, "epoch": 4862} {"train_loss": -7.342548370361328, "global_step": 204237, "epoch": 4862} {"train_loss": -7.4636712074279785, "global_step": 204238, "epoch": 4862} {"train_loss": -7.375869274139404, "global_step": 204239, "epoch": 4862} {"train_loss": -7.321137428283691, "global_step": 204240, "epoch": 4862} {"train_loss": -7.266351222991943, "global_step": 204241, "epoch": 4862} {"train_loss": -7.351751804351807, "global_step": 204242, "epoch": 4862} {"train_loss": -7.285652160644531, "global_step": 204243, "epoch": 4862} {"train_loss": -7.35176944732666, "global_step": 204244, "epoch": 4862} {"train_loss": -7.329370839255197, "global_step": 204245, "epoch": 4862, "val_loss": 81578.9609375} {"train_loss": -7.403213977813721, "global_step": 204246, "epoch": 4863} {"train_loss": -7.439961910247803, "global_step": 204247, "epoch": 4863} {"train_loss": -7.333258628845215, "global_step": 204248, "epoch": 4863} {"train_loss": -7.151176452636719, "global_step": 204249, "epoch": 4863} {"train_loss": -7.352781772613525, "global_step": 204250, "epoch": 4863} {"train_loss": -7.311912536621094, "global_step": 204251, "epoch": 4863} {"train_loss": -7.417102813720703, "global_step": 204252, "epoch": 4863} {"train_loss": -7.338075160980225, "global_step": 204253, "epoch": 4863} {"train_loss": -7.209029197692871, "global_step": 204254, "epoch": 4863} {"train_loss": -7.367611885070801, "global_step": 204255, "epoch": 4863} {"train_loss": -7.325229167938232, "global_step": 204256, "epoch": 4863} {"train_loss": -7.241311550140381, "global_step": 204257, "epoch": 4863} {"train_loss": -7.361629009246826, "global_step": 204258, "epoch": 4863} {"train_loss": -7.230947494506836, "global_step": 204259, "epoch": 4863} {"train_loss": -7.298624515533447, "global_step": 204260, "epoch": 4863} {"train_loss": -7.268882751464844, "global_step": 204261, "epoch": 4863} {"train_loss": -7.233322620391846, "global_step": 204262, "epoch": 4863} {"train_loss": -7.3616719245910645, "global_step": 204263, "epoch": 4863} {"train_loss": -7.251233100891113, "global_step": 204264, "epoch": 4863} {"train_loss": -7.445204734802246, "global_step": 204265, "epoch": 4863} {"train_loss": -7.34768009185791, "global_step": 204266, "epoch": 4863} {"train_loss": -7.384603500366211, "global_step": 204267, "epoch": 4863} {"train_loss": -7.256440162658691, "global_step": 204268, "epoch": 4863} {"train_loss": -7.426305770874023, "global_step": 204269, "epoch": 4863} {"train_loss": -7.336688995361328, "global_step": 204270, "epoch": 4863} {"train_loss": -7.225831985473633, "global_step": 204271, "epoch": 4863} {"train_loss": -7.386196613311768, "global_step": 204272, "epoch": 4863} {"train_loss": -7.268482208251953, "global_step": 204273, "epoch": 4863} {"train_loss": -7.277787208557129, "global_step": 204274, "epoch": 4863} {"train_loss": -7.268303871154785, "global_step": 204275, "epoch": 4863} {"train_loss": -7.234781265258789, "global_step": 204276, "epoch": 4863} {"train_loss": -7.372267723083496, "global_step": 204277, "epoch": 4863} {"train_loss": -7.3473052978515625, "global_step": 204278, "epoch": 4863} {"train_loss": -7.339940547943115, "global_step": 204279, "epoch": 4863} {"train_loss": -7.241883277893066, "global_step": 204280, "epoch": 4863} {"train_loss": -7.284450531005859, "global_step": 204281, "epoch": 4863} {"train_loss": -7.2534966468811035, "global_step": 204282, "epoch": 4863} {"train_loss": -7.224766254425049, "global_step": 204283, "epoch": 4863} {"train_loss": -7.141456604003906, "global_step": 204284, "epoch": 4863} {"train_loss": -7.302696228027344, "global_step": 204285, "epoch": 4863} {"train_loss": -7.157549858093262, "global_step": 204286, "epoch": 4863} {"train_loss": -7.299887589045933, "global_step": 204287, "epoch": 4863, "val_loss": 81662.265625} {"train_loss": -7.234694004058838, "global_step": 204288, "epoch": 4864} {"train_loss": -7.248782634735107, "global_step": 204289, "epoch": 4864} {"train_loss": -7.214158058166504, "global_step": 204290, "epoch": 4864} {"train_loss": -7.156446933746338, "global_step": 204291, "epoch": 4864} {"train_loss": -7.2637457847595215, "global_step": 204292, "epoch": 4864} {"train_loss": -7.190018177032471, "global_step": 204293, "epoch": 4864} {"train_loss": -7.192487716674805, "global_step": 204294, "epoch": 4864} {"train_loss": -7.200876235961914, "global_step": 204295, "epoch": 4864} {"train_loss": -7.067967891693115, "global_step": 204296, "epoch": 4864} {"train_loss": -7.218634128570557, "global_step": 204297, "epoch": 4864} {"train_loss": -7.117800712585449, "global_step": 204298, "epoch": 4864} {"train_loss": -7.0959625244140625, "global_step": 204299, "epoch": 4864} {"train_loss": -7.20743989944458, "global_step": 204300, "epoch": 4864} {"train_loss": -7.0375871658325195, "global_step": 204301, "epoch": 4864} {"train_loss": -7.348875999450684, "global_step": 204302, "epoch": 4864} {"train_loss": -7.066119194030762, "global_step": 204303, "epoch": 4864} {"train_loss": -7.292128562927246, "global_step": 204304, "epoch": 4864} {"train_loss": -7.218001842498779, "global_step": 204305, "epoch": 4864} {"train_loss": -7.184811115264893, "global_step": 204306, "epoch": 4864} {"train_loss": -7.155850887298584, "global_step": 204307, "epoch": 4864} {"train_loss": -7.322141647338867, "global_step": 204308, "epoch": 4864} {"train_loss": -7.168520927429199, "global_step": 204309, "epoch": 4864} {"train_loss": -7.246609687805176, "global_step": 204310, "epoch": 4864} {"train_loss": -7.354423522949219, "global_step": 204311, "epoch": 4864} {"train_loss": -7.259665489196777, "global_step": 204312, "epoch": 4864} {"train_loss": -7.4068403244018555, "global_step": 204313, "epoch": 4864} {"train_loss": -7.286028861999512, "global_step": 204314, "epoch": 4864} {"train_loss": -7.227780818939209, "global_step": 204315, "epoch": 4864} {"train_loss": -7.184869766235352, "global_step": 204316, "epoch": 4864} {"train_loss": -7.2414445877075195, "global_step": 204317, "epoch": 4864} {"train_loss": -7.21543550491333, "global_step": 204318, "epoch": 4864} {"train_loss": -7.455575466156006, "global_step": 204319, "epoch": 4864} {"train_loss": -7.252352714538574, "global_step": 204320, "epoch": 4864} {"train_loss": -7.452671051025391, "global_step": 204321, "epoch": 4864} {"train_loss": -7.341088771820068, "global_step": 204322, "epoch": 4864} {"train_loss": -7.278291702270508, "global_step": 204323, "epoch": 4864} {"train_loss": -7.4081573486328125, "global_step": 204324, "epoch": 4864} {"train_loss": -7.400479316711426, "global_step": 204325, "epoch": 4864} {"train_loss": -7.4021759033203125, "global_step": 204326, "epoch": 4864} {"train_loss": -7.3531341552734375, "global_step": 204327, "epoch": 4864} {"train_loss": -7.356942176818848, "global_step": 204328, "epoch": 4864} {"train_loss": -7.254596585319156, "global_step": 204329, "epoch": 4864, "val_loss": 81591.7109375} {"train_loss": -7.418758392333984, "global_step": 204330, "epoch": 4865} {"train_loss": -7.4065351486206055, "global_step": 204331, "epoch": 4865} {"train_loss": -7.372261047363281, "global_step": 204332, "epoch": 4865} {"train_loss": -7.339587211608887, "global_step": 204333, "epoch": 4865} {"train_loss": -7.407964706420898, "global_step": 204334, "epoch": 4865} {"train_loss": -7.4154510498046875, "global_step": 204335, "epoch": 4865} {"train_loss": -7.272661209106445, "global_step": 204336, "epoch": 4865} {"train_loss": -7.430629730224609, "global_step": 204337, "epoch": 4865} {"train_loss": -7.387622833251953, "global_step": 204338, "epoch": 4865} {"train_loss": -7.246741771697998, "global_step": 204339, "epoch": 4865} {"train_loss": -7.286471366882324, "global_step": 204340, "epoch": 4865} {"train_loss": -7.4067230224609375, "global_step": 204341, "epoch": 4865} {"train_loss": -7.415927410125732, "global_step": 204342, "epoch": 4865} {"train_loss": -7.36152458190918, "global_step": 204343, "epoch": 4865} {"train_loss": -7.349540710449219, "global_step": 204344, "epoch": 4865} {"train_loss": -7.463141441345215, "global_step": 204345, "epoch": 4865} {"train_loss": -7.436089515686035, "global_step": 204346, "epoch": 4865} {"train_loss": -7.3969831466674805, "global_step": 204347, "epoch": 4865} {"train_loss": -7.3049468994140625, "global_step": 204348, "epoch": 4865} {"train_loss": -7.3525309562683105, "global_step": 204349, "epoch": 4865} {"train_loss": -7.14686918258667, "global_step": 204350, "epoch": 4865} {"train_loss": -7.176109313964844, "global_step": 204351, "epoch": 4865} {"train_loss": -7.408210754394531, "global_step": 204352, "epoch": 4865} {"train_loss": -7.396838188171387, "global_step": 204353, "epoch": 4865} {"train_loss": -7.29292631149292, "global_step": 204354, "epoch": 4865} {"train_loss": -7.365594863891602, "global_step": 204355, "epoch": 4865} {"train_loss": -7.22719144821167, "global_step": 204356, "epoch": 4865} {"train_loss": -7.264766693115234, "global_step": 204357, "epoch": 4865} {"train_loss": -7.403568744659424, "global_step": 204358, "epoch": 4865} {"train_loss": -7.2971038818359375, "global_step": 204359, "epoch": 4865} {"train_loss": -7.323703765869141, "global_step": 204360, "epoch": 4865} {"train_loss": -7.088422775268555, "global_step": 204361, "epoch": 4865} {"train_loss": -7.331302642822266, "global_step": 204362, "epoch": 4865} {"train_loss": -7.178365707397461, "global_step": 204363, "epoch": 4865} {"train_loss": -7.201568126678467, "global_step": 204364, "epoch": 4865} {"train_loss": -7.205776214599609, "global_step": 204365, "epoch": 4865} {"train_loss": -7.161383628845215, "global_step": 204366, "epoch": 4865} {"train_loss": -7.266049385070801, "global_step": 204367, "epoch": 4865} {"train_loss": -7.107382774353027, "global_step": 204368, "epoch": 4865} {"train_loss": -7.136528015136719, "global_step": 204369, "epoch": 4865} {"train_loss": -7.12477970123291, "global_step": 204370, "epoch": 4865} {"train_loss": -7.307651054291498, "global_step": 204371, "epoch": 4865, "val_loss": 81826.890625} {"train_loss": -7.113106727600098, "global_step": 204372, "epoch": 4866} {"train_loss": -7.267004489898682, "global_step": 204373, "epoch": 4866} {"train_loss": -7.187967300415039, "global_step": 204374, "epoch": 4866} {"train_loss": -7.280441761016846, "global_step": 204375, "epoch": 4866} {"train_loss": -7.310445785522461, "global_step": 204376, "epoch": 4866} {"train_loss": -7.3623948097229, "global_step": 204377, "epoch": 4866} {"train_loss": -7.280555725097656, "global_step": 204378, "epoch": 4866} {"train_loss": -7.263739585876465, "global_step": 204379, "epoch": 4866} {"train_loss": -7.2544846534729, "global_step": 204380, "epoch": 4866} {"train_loss": -7.240701198577881, "global_step": 204381, "epoch": 4866} {"train_loss": -7.359717845916748, "global_step": 204382, "epoch": 4866} {"train_loss": -7.342316627502441, "global_step": 204383, "epoch": 4866} {"train_loss": -7.375993251800537, "global_step": 204384, "epoch": 4866} {"train_loss": -7.312703609466553, "global_step": 204385, "epoch": 4866} {"train_loss": -7.253362655639648, "global_step": 204386, "epoch": 4866} {"train_loss": -7.33949089050293, "global_step": 204387, "epoch": 4866} {"train_loss": -7.246655464172363, "global_step": 204388, "epoch": 4866} {"train_loss": -7.296339988708496, "global_step": 204389, "epoch": 4866} {"train_loss": -7.260515213012695, "global_step": 204390, "epoch": 4866} {"train_loss": -7.259212493896484, "global_step": 204391, "epoch": 4866} {"train_loss": -7.22269868850708, "global_step": 204392, "epoch": 4866} {"train_loss": -7.400595664978027, "global_step": 204393, "epoch": 4866} {"train_loss": -7.2580060958862305, "global_step": 204394, "epoch": 4866} {"train_loss": -7.309463024139404, "global_step": 204395, "epoch": 4866} {"train_loss": -7.336328029632568, "global_step": 204396, "epoch": 4866} {"train_loss": -7.259244918823242, "global_step": 204397, "epoch": 4866} {"train_loss": -7.409733772277832, "global_step": 204398, "epoch": 4866} {"train_loss": -7.388099193572998, "global_step": 204399, "epoch": 4866} {"train_loss": -7.28437614440918, "global_step": 204400, "epoch": 4866} {"train_loss": -7.321468353271484, "global_step": 204401, "epoch": 4866} {"train_loss": -7.253200531005859, "global_step": 204402, "epoch": 4866} {"train_loss": -7.145241737365723, "global_step": 204403, "epoch": 4866} {"train_loss": -7.371333122253418, "global_step": 204404, "epoch": 4866} {"train_loss": -7.276761054992676, "global_step": 204405, "epoch": 4866} {"train_loss": -7.378818511962891, "global_step": 204406, "epoch": 4866} {"train_loss": -7.3026227951049805, "global_step": 204407, "epoch": 4866} {"train_loss": -7.325201511383057, "global_step": 204408, "epoch": 4866} {"train_loss": -7.347205638885498, "global_step": 204409, "epoch": 4866} {"train_loss": -7.324143886566162, "global_step": 204410, "epoch": 4866} {"train_loss": -7.302927017211914, "global_step": 204411, "epoch": 4866} {"train_loss": -7.283536911010742, "global_step": 204412, "epoch": 4866} {"train_loss": -7.294869752157302, "global_step": 204413, "epoch": 4866, "val_loss": 81728.53125} {"train_loss": -7.280403137207031, "global_step": 204414, "epoch": 4867} {"train_loss": -7.463160991668701, "global_step": 204415, "epoch": 4867} {"train_loss": -7.415834426879883, "global_step": 204416, "epoch": 4867} {"train_loss": -7.368879318237305, "global_step": 204417, "epoch": 4867} {"train_loss": -7.306150436401367, "global_step": 204418, "epoch": 4867} {"train_loss": -7.316710472106934, "global_step": 204419, "epoch": 4867} {"train_loss": -7.338349342346191, "global_step": 204420, "epoch": 4867} {"train_loss": -7.278919219970703, "global_step": 204421, "epoch": 4867} {"train_loss": -7.380330562591553, "global_step": 204422, "epoch": 4867} {"train_loss": -7.372707366943359, "global_step": 204423, "epoch": 4867} {"train_loss": -7.282199859619141, "global_step": 204424, "epoch": 4867} {"train_loss": -7.219297409057617, "global_step": 204425, "epoch": 4867} {"train_loss": -7.209458827972412, "global_step": 204426, "epoch": 4867} {"train_loss": -7.296151161193848, "global_step": 204427, "epoch": 4867} {"train_loss": -7.1896257400512695, "global_step": 204428, "epoch": 4867} {"train_loss": -7.451809883117676, "global_step": 204429, "epoch": 4867} {"train_loss": -7.459245681762695, "global_step": 204430, "epoch": 4867} {"train_loss": -7.256522178649902, "global_step": 204431, "epoch": 4867} {"train_loss": -7.343371391296387, "global_step": 204432, "epoch": 4867} {"train_loss": -7.386501312255859, "global_step": 204433, "epoch": 4867} {"train_loss": -7.216429233551025, "global_step": 204434, "epoch": 4867} {"train_loss": -7.375317573547363, "global_step": 204435, "epoch": 4867} {"train_loss": -7.319108009338379, "global_step": 204436, "epoch": 4867} {"train_loss": -7.302270889282227, "global_step": 204437, "epoch": 4867} {"train_loss": -7.4148969650268555, "global_step": 204438, "epoch": 4867} {"train_loss": -7.156194686889648, "global_step": 204439, "epoch": 4867} {"train_loss": -7.24936580657959, "global_step": 204440, "epoch": 4867} {"train_loss": -7.3176679611206055, "global_step": 204441, "epoch": 4867} {"train_loss": -7.299825668334961, "global_step": 204442, "epoch": 4867} {"train_loss": -7.281467437744141, "global_step": 204443, "epoch": 4867} {"train_loss": -7.2732954025268555, "global_step": 204444, "epoch": 4867} {"train_loss": -7.270377159118652, "global_step": 204445, "epoch": 4867} {"train_loss": -7.22599983215332, "global_step": 204446, "epoch": 4867} {"train_loss": -7.281477451324463, "global_step": 204447, "epoch": 4867} {"train_loss": -7.159347057342529, "global_step": 204448, "epoch": 4867} {"train_loss": -7.362793445587158, "global_step": 204449, "epoch": 4867} {"train_loss": -7.305452346801758, "global_step": 204450, "epoch": 4867} {"train_loss": -7.313473701477051, "global_step": 204451, "epoch": 4867} {"train_loss": -7.240841388702393, "global_step": 204452, "epoch": 4867} {"train_loss": -7.2579345703125, "global_step": 204453, "epoch": 4867} {"train_loss": -7.3280229568481445, "global_step": 204454, "epoch": 4867} {"train_loss": -7.306839931578863, "global_step": 204455, "epoch": 4867, "val_loss": 81736.484375} {"train_loss": -7.143832206726074, "global_step": 204456, "epoch": 4868} {"train_loss": -7.216907501220703, "global_step": 204457, "epoch": 4868} {"train_loss": -7.306758880615234, "global_step": 204458, "epoch": 4868} {"train_loss": -7.303123474121094, "global_step": 204459, "epoch": 4868} {"train_loss": -7.242098331451416, "global_step": 204460, "epoch": 4868} {"train_loss": -7.271010875701904, "global_step": 204461, "epoch": 4868} {"train_loss": -7.291542053222656, "global_step": 204462, "epoch": 4868} {"train_loss": -7.334535598754883, "global_step": 204463, "epoch": 4868} {"train_loss": -7.3886566162109375, "global_step": 204464, "epoch": 4868} {"train_loss": -7.28255558013916, "global_step": 204465, "epoch": 4868} {"train_loss": -7.274428844451904, "global_step": 204466, "epoch": 4868} {"train_loss": -7.331910133361816, "global_step": 204467, "epoch": 4868} {"train_loss": -7.391308784484863, "global_step": 204468, "epoch": 4868} {"train_loss": -7.240592002868652, "global_step": 204469, "epoch": 4868} {"train_loss": -7.334842681884766, "global_step": 204470, "epoch": 4868} {"train_loss": -7.348937034606934, "global_step": 204471, "epoch": 4868} {"train_loss": -7.252378463745117, "global_step": 204472, "epoch": 4868} {"train_loss": -7.306619644165039, "global_step": 204473, "epoch": 4868} {"train_loss": -7.355092525482178, "global_step": 204474, "epoch": 4868} {"train_loss": -7.282540321350098, "global_step": 204475, "epoch": 4868} {"train_loss": -7.244186878204346, "global_step": 204476, "epoch": 4868} {"train_loss": -7.363520622253418, "global_step": 204477, "epoch": 4868} {"train_loss": -7.261099815368652, "global_step": 204478, "epoch": 4868} {"train_loss": -7.289065837860107, "global_step": 204479, "epoch": 4868} {"train_loss": -7.324311256408691, "global_step": 204480, "epoch": 4868} {"train_loss": -7.160331726074219, "global_step": 204481, "epoch": 4868} {"train_loss": -7.313844680786133, "global_step": 204482, "epoch": 4868} {"train_loss": -7.311252593994141, "global_step": 204483, "epoch": 4868} {"train_loss": -7.2563862800598145, "global_step": 204484, "epoch": 4868} {"train_loss": -7.3868184089660645, "global_step": 204485, "epoch": 4868} {"train_loss": -7.263565540313721, "global_step": 204486, "epoch": 4868} {"train_loss": -7.256715774536133, "global_step": 204487, "epoch": 4868} {"train_loss": -7.280689239501953, "global_step": 204488, "epoch": 4868} {"train_loss": -7.255802154541016, "global_step": 204489, "epoch": 4868} {"train_loss": -7.31279182434082, "global_step": 204490, "epoch": 4868} {"train_loss": -7.444814682006836, "global_step": 204491, "epoch": 4868} {"train_loss": -7.312023162841797, "global_step": 204492, "epoch": 4868} {"train_loss": -7.328979015350342, "global_step": 204493, "epoch": 4868} {"train_loss": -7.305391311645508, "global_step": 204494, "epoch": 4868} {"train_loss": -7.263980865478516, "global_step": 204495, "epoch": 4868} {"train_loss": -7.407762050628662, "global_step": 204496, "epoch": 4868} {"train_loss": -7.297694830667405, "global_step": 204497, "epoch": 4868, "val_loss": 81498.71875} {"train_loss": -7.318181037902832, "global_step": 204498, "epoch": 4869} {"train_loss": -7.3248162269592285, "global_step": 204499, "epoch": 4869} {"train_loss": -7.222841262817383, "global_step": 204500, "epoch": 4869} {"train_loss": -7.218255043029785, "global_step": 204501, "epoch": 4869} {"train_loss": -7.347108840942383, "global_step": 204502, "epoch": 4869} {"train_loss": -7.3524909019470215, "global_step": 204503, "epoch": 4869} {"train_loss": -7.345336437225342, "global_step": 204504, "epoch": 4869} {"train_loss": -7.387235641479492, "global_step": 204505, "epoch": 4869} {"train_loss": -7.370230674743652, "global_step": 204506, "epoch": 4869} {"train_loss": -7.342576026916504, "global_step": 204507, "epoch": 4869} {"train_loss": -7.41074800491333, "global_step": 204508, "epoch": 4869} {"train_loss": -7.399338722229004, "global_step": 204509, "epoch": 4869} {"train_loss": -7.424459457397461, "global_step": 204510, "epoch": 4869} {"train_loss": -7.354734420776367, "global_step": 204511, "epoch": 4869} {"train_loss": -7.413917541503906, "global_step": 204512, "epoch": 4869} {"train_loss": -7.400815010070801, "global_step": 204513, "epoch": 4869} {"train_loss": -7.2993998527526855, "global_step": 204514, "epoch": 4869} {"train_loss": -7.415536880493164, "global_step": 204515, "epoch": 4869} {"train_loss": -7.255531311035156, "global_step": 204516, "epoch": 4869} {"train_loss": -7.307300567626953, "global_step": 204517, "epoch": 4869} {"train_loss": -7.352252960205078, "global_step": 204518, "epoch": 4869} {"train_loss": -7.384721279144287, "global_step": 204519, "epoch": 4869} {"train_loss": -7.3170576095581055, "global_step": 204520, "epoch": 4869} {"train_loss": -7.319620609283447, "global_step": 204521, "epoch": 4869} {"train_loss": -7.179619312286377, "global_step": 204522, "epoch": 4869} {"train_loss": -7.29594612121582, "global_step": 204523, "epoch": 4869} {"train_loss": -7.355621337890625, "global_step": 204524, "epoch": 4869} {"train_loss": -7.097066402435303, "global_step": 204525, "epoch": 4869} {"train_loss": -7.3189544677734375, "global_step": 204526, "epoch": 4869} {"train_loss": -7.372302055358887, "global_step": 204527, "epoch": 4869} {"train_loss": -7.287492752075195, "global_step": 204528, "epoch": 4869} {"train_loss": -7.344324111938477, "global_step": 204529, "epoch": 4869} {"train_loss": -7.131139755249023, "global_step": 204530, "epoch": 4869} {"train_loss": -7.296194076538086, "global_step": 204531, "epoch": 4869} {"train_loss": -7.239672660827637, "global_step": 204532, "epoch": 4869} {"train_loss": -7.313981056213379, "global_step": 204533, "epoch": 4869} {"train_loss": -7.261584758758545, "global_step": 204534, "epoch": 4869} {"train_loss": -7.314008712768555, "global_step": 204535, "epoch": 4869} {"train_loss": -7.300930976867676, "global_step": 204536, "epoch": 4869} {"train_loss": -7.326897621154785, "global_step": 204537, "epoch": 4869} {"train_loss": -7.245691776275635, "global_step": 204538, "epoch": 4869} {"train_loss": -7.311485256467547, "global_step": 204539, "epoch": 4869, "val_loss": 81890.625} {"train_loss": -7.291973114013672, "global_step": 204540, "epoch": 4870} {"train_loss": -7.472171783447266, "global_step": 204541, "epoch": 4870} {"train_loss": -7.26536750793457, "global_step": 204542, "epoch": 4870} {"train_loss": -7.278927803039551, "global_step": 204543, "epoch": 4870} {"train_loss": -7.456934452056885, "global_step": 204544, "epoch": 4870} {"train_loss": -7.35040807723999, "global_step": 204545, "epoch": 4870} {"train_loss": -7.338040351867676, "global_step": 204546, "epoch": 4870} {"train_loss": -7.408060073852539, "global_step": 204547, "epoch": 4870} {"train_loss": -7.377223014831543, "global_step": 204548, "epoch": 4870} {"train_loss": -7.381180763244629, "global_step": 204549, "epoch": 4870} {"train_loss": -7.3613810539245605, "global_step": 204550, "epoch": 4870} {"train_loss": -7.396214008331299, "global_step": 204551, "epoch": 4870} {"train_loss": -7.424478054046631, "global_step": 204552, "epoch": 4870} {"train_loss": -7.313808441162109, "global_step": 204553, "epoch": 4870} {"train_loss": -7.406357765197754, "global_step": 204554, "epoch": 4870} {"train_loss": -7.375709533691406, "global_step": 204555, "epoch": 4870} {"train_loss": -7.283619403839111, "global_step": 204556, "epoch": 4870} {"train_loss": -7.4861345291137695, "global_step": 204557, "epoch": 4870} {"train_loss": -7.327625274658203, "global_step": 204558, "epoch": 4870} {"train_loss": -7.338239669799805, "global_step": 204559, "epoch": 4870} {"train_loss": -7.263176441192627, "global_step": 204560, "epoch": 4870} {"train_loss": -7.356380462646484, "global_step": 204561, "epoch": 4870} {"train_loss": -7.365435600280762, "global_step": 204562, "epoch": 4870} {"train_loss": -7.41668701171875, "global_step": 204563, "epoch": 4870} {"train_loss": -7.3169684410095215, "global_step": 204564, "epoch": 4870} {"train_loss": -7.211040019989014, "global_step": 204565, "epoch": 4870} {"train_loss": -7.324806213378906, "global_step": 204566, "epoch": 4870} {"train_loss": -7.413422584533691, "global_step": 204567, "epoch": 4870} {"train_loss": -7.350671291351318, "global_step": 204568, "epoch": 4870} {"train_loss": -7.319366455078125, "global_step": 204569, "epoch": 4870} {"train_loss": -7.331215858459473, "global_step": 204570, "epoch": 4870} {"train_loss": -7.273834228515625, "global_step": 204571, "epoch": 4870} {"train_loss": -7.296147346496582, "global_step": 204572, "epoch": 4870} {"train_loss": -7.3821001052856445, "global_step": 204573, "epoch": 4870} {"train_loss": -7.349831581115723, "global_step": 204574, "epoch": 4870} {"train_loss": -7.344714164733887, "global_step": 204575, "epoch": 4870} {"train_loss": -7.3335089683532715, "global_step": 204576, "epoch": 4870} {"train_loss": -7.247824192047119, "global_step": 204577, "epoch": 4870} {"train_loss": -7.316847801208496, "global_step": 204578, "epoch": 4870} {"train_loss": -7.463591575622559, "global_step": 204579, "epoch": 4870} {"train_loss": -7.4313859939575195, "global_step": 204580, "epoch": 4870} {"train_loss": -7.3534281594412665, "global_step": 204581, "epoch": 4870, "val_loss": 81829.375} {"train_loss": -7.374087333679199, "global_step": 204582, "epoch": 4871} {"train_loss": -7.282855033874512, "global_step": 204583, "epoch": 4871} {"train_loss": -7.35943603515625, "global_step": 204584, "epoch": 4871} {"train_loss": -7.407634258270264, "global_step": 204585, "epoch": 4871} {"train_loss": -7.429498672485352, "global_step": 204586, "epoch": 4871} {"train_loss": -7.347866058349609, "global_step": 204587, "epoch": 4871} {"train_loss": -7.391829967498779, "global_step": 204588, "epoch": 4871} {"train_loss": -7.411659240722656, "global_step": 204589, "epoch": 4871} {"train_loss": -7.236844062805176, "global_step": 204590, "epoch": 4871} {"train_loss": -7.304328441619873, "global_step": 204591, "epoch": 4871} {"train_loss": -7.4188761711120605, "global_step": 204592, "epoch": 4871} {"train_loss": -7.412525177001953, "global_step": 204593, "epoch": 4871} {"train_loss": -7.412879943847656, "global_step": 204594, "epoch": 4871} {"train_loss": -7.349843502044678, "global_step": 204595, "epoch": 4871} {"train_loss": -7.402519226074219, "global_step": 204596, "epoch": 4871} {"train_loss": -7.312019348144531, "global_step": 204597, "epoch": 4871} {"train_loss": -7.476070404052734, "global_step": 204598, "epoch": 4871} {"train_loss": -7.332627296447754, "global_step": 204599, "epoch": 4871} {"train_loss": -7.501683712005615, "global_step": 204600, "epoch": 4871} {"train_loss": -7.474935531616211, "global_step": 204601, "epoch": 4871} {"train_loss": -7.352479934692383, "global_step": 204602, "epoch": 4871} {"train_loss": -7.371164798736572, "global_step": 204603, "epoch": 4871} {"train_loss": -7.3779449462890625, "global_step": 204604, "epoch": 4871} {"train_loss": -7.449268341064453, "global_step": 204605, "epoch": 4871} {"train_loss": -7.391730308532715, "global_step": 204606, "epoch": 4871} {"train_loss": -7.4173994064331055, "global_step": 204607, "epoch": 4871} {"train_loss": -7.311339855194092, "global_step": 204608, "epoch": 4871} {"train_loss": -7.319612503051758, "global_step": 204609, "epoch": 4871} {"train_loss": -7.343697547912598, "global_step": 204610, "epoch": 4871} {"train_loss": -7.408876419067383, "global_step": 204611, "epoch": 4871} {"train_loss": -7.216314315795898, "global_step": 204612, "epoch": 4871} {"train_loss": -7.1715521812438965, "global_step": 204613, "epoch": 4871} {"train_loss": -7.250746726989746, "global_step": 204614, "epoch": 4871} {"train_loss": -7.280459880828857, "global_step": 204615, "epoch": 4871} {"train_loss": -7.223971366882324, "global_step": 204616, "epoch": 4871} {"train_loss": -7.138888359069824, "global_step": 204617, "epoch": 4871} {"train_loss": -7.1860761642456055, "global_step": 204618, "epoch": 4871} {"train_loss": -7.204665184020996, "global_step": 204619, "epoch": 4871} {"train_loss": -7.079887866973877, "global_step": 204620, "epoch": 4871} {"train_loss": -7.114404678344727, "global_step": 204621, "epoch": 4871} {"train_loss": -7.119656085968018, "global_step": 204622, "epoch": 4871} {"train_loss": -7.316717806316557, "global_step": 204623, "epoch": 4871, "val_loss": 81765.78125} {"train_loss": -7.253066539764404, "global_step": 204624, "epoch": 4872} {"train_loss": -7.008358955383301, "global_step": 204625, "epoch": 4872} {"train_loss": -7.275567531585693, "global_step": 204626, "epoch": 4872} {"train_loss": -7.082721710205078, "global_step": 204627, "epoch": 4872} {"train_loss": -7.1802473068237305, "global_step": 204628, "epoch": 4872} {"train_loss": -7.127504825592041, "global_step": 204629, "epoch": 4872} {"train_loss": -7.055829048156738, "global_step": 204630, "epoch": 4872} {"train_loss": -7.11906623840332, "global_step": 204631, "epoch": 4872} {"train_loss": -7.263083457946777, "global_step": 204632, "epoch": 4872} {"train_loss": -7.237153053283691, "global_step": 204633, "epoch": 4872} {"train_loss": -7.053669452667236, "global_step": 204634, "epoch": 4872} {"train_loss": -7.195137977600098, "global_step": 204635, "epoch": 4872} {"train_loss": -7.19571590423584, "global_step": 204636, "epoch": 4872} {"train_loss": -7.238254547119141, "global_step": 204637, "epoch": 4872} {"train_loss": -7.100400924682617, "global_step": 204638, "epoch": 4872} {"train_loss": -7.285933971405029, "global_step": 204639, "epoch": 4872} {"train_loss": -7.286183834075928, "global_step": 204640, "epoch": 4872} {"train_loss": -7.334979057312012, "global_step": 204641, "epoch": 4872} {"train_loss": -7.3234148025512695, "global_step": 204642, "epoch": 4872} {"train_loss": -7.348902702331543, "global_step": 204643, "epoch": 4872} {"train_loss": -7.36357307434082, "global_step": 204644, "epoch": 4872} {"train_loss": -7.393289566040039, "global_step": 204645, "epoch": 4872} {"train_loss": -7.357052326202393, "global_step": 204646, "epoch": 4872} {"train_loss": -7.3257551193237305, "global_step": 204647, "epoch": 4872} {"train_loss": -7.390109539031982, "global_step": 204648, "epoch": 4872} {"train_loss": -7.340667724609375, "global_step": 204649, "epoch": 4872} {"train_loss": -7.396188735961914, "global_step": 204650, "epoch": 4872} {"train_loss": -7.331455230712891, "global_step": 204651, "epoch": 4872} {"train_loss": -7.27797794342041, "global_step": 204652, "epoch": 4872} {"train_loss": -7.399184226989746, "global_step": 204653, "epoch": 4872} {"train_loss": -7.299815654754639, "global_step": 204654, "epoch": 4872} {"train_loss": -7.3817458152771, "global_step": 204655, "epoch": 4872} {"train_loss": -7.562976837158203, "global_step": 204656, "epoch": 4872} {"train_loss": -7.366168022155762, "global_step": 204657, "epoch": 4872} {"train_loss": -7.439934253692627, "global_step": 204658, "epoch": 4872} {"train_loss": -7.418744087219238, "global_step": 204659, "epoch": 4872} {"train_loss": -7.335429668426514, "global_step": 204660, "epoch": 4872} {"train_loss": -7.354842662811279, "global_step": 204661, "epoch": 4872} {"train_loss": -7.398468017578125, "global_step": 204662, "epoch": 4872} {"train_loss": -7.432183265686035, "global_step": 204663, "epoch": 4872} {"train_loss": -7.447283744812012, "global_step": 204664, "epoch": 4872} {"train_loss": -7.2956046376909525, "global_step": 204665, "epoch": 4872, "val_loss": 81614.3515625} {"train_loss": -7.345640182495117, "global_step": 204666, "epoch": 4873} {"train_loss": -7.432251930236816, "global_step": 204667, "epoch": 4873} {"train_loss": -7.424770355224609, "global_step": 204668, "epoch": 4873} {"train_loss": -7.4552531242370605, "global_step": 204669, "epoch": 4873} {"train_loss": -7.416774749755859, "global_step": 204670, "epoch": 4873} {"train_loss": -7.337498664855957, "global_step": 204671, "epoch": 4873} {"train_loss": -7.414035797119141, "global_step": 204672, "epoch": 4873} {"train_loss": -7.271657943725586, "global_step": 204673, "epoch": 4873} {"train_loss": -7.424986839294434, "global_step": 204674, "epoch": 4873} {"train_loss": -7.370183944702148, "global_step": 204675, "epoch": 4873} {"train_loss": -7.367419719696045, "global_step": 204676, "epoch": 4873} {"train_loss": -7.355481147766113, "global_step": 204677, "epoch": 4873} {"train_loss": -7.356692790985107, "global_step": 204678, "epoch": 4873} {"train_loss": -7.351510047912598, "global_step": 204679, "epoch": 4873} {"train_loss": -7.240574359893799, "global_step": 204680, "epoch": 4873} {"train_loss": -7.176446437835693, "global_step": 204681, "epoch": 4873} {"train_loss": -7.185854434967041, "global_step": 204682, "epoch": 4873} {"train_loss": -7.30317497253418, "global_step": 204683, "epoch": 4873} {"train_loss": -7.325109481811523, "global_step": 204684, "epoch": 4873} {"train_loss": -7.437083721160889, "global_step": 204685, "epoch": 4873} {"train_loss": -7.375852584838867, "global_step": 204686, "epoch": 4873} {"train_loss": -7.439553737640381, "global_step": 204687, "epoch": 4873} {"train_loss": -7.357969760894775, "global_step": 204688, "epoch": 4873} {"train_loss": -7.352916717529297, "global_step": 204689, "epoch": 4873} {"train_loss": -7.340595245361328, "global_step": 204690, "epoch": 4873} {"train_loss": -7.368335723876953, "global_step": 204691, "epoch": 4873} {"train_loss": -7.337533950805664, "global_step": 204692, "epoch": 4873} {"train_loss": -7.351546287536621, "global_step": 204693, "epoch": 4873} {"train_loss": -7.391787528991699, "global_step": 204694, "epoch": 4873} {"train_loss": -7.309877395629883, "global_step": 204695, "epoch": 4873} {"train_loss": -7.380031585693359, "global_step": 204696, "epoch": 4873} {"train_loss": -7.372875213623047, "global_step": 204697, "epoch": 4873} {"train_loss": -7.245419502258301, "global_step": 204698, "epoch": 4873} {"train_loss": -7.222251892089844, "global_step": 204699, "epoch": 4873} {"train_loss": -7.233259201049805, "global_step": 204700, "epoch": 4873} {"train_loss": -7.038299560546875, "global_step": 204701, "epoch": 4873} {"train_loss": -7.349086761474609, "global_step": 204702, "epoch": 4873} {"train_loss": -7.008298397064209, "global_step": 204703, "epoch": 4873} {"train_loss": -7.26765251159668, "global_step": 204704, "epoch": 4873} {"train_loss": -7.201953887939453, "global_step": 204705, "epoch": 4873} {"train_loss": -7.155215263366699, "global_step": 204706, "epoch": 4873} {"train_loss": -7.31792798496428, "global_step": 204707, "epoch": 4873, "val_loss": 82067.890625} {"train_loss": -7.1421003341674805, "global_step": 204708, "epoch": 4874} {"train_loss": -7.321340560913086, "global_step": 204709, "epoch": 4874} {"train_loss": -7.2331695556640625, "global_step": 204710, "epoch": 4874} {"train_loss": -7.203737258911133, "global_step": 204711, "epoch": 4874} {"train_loss": -7.218523979187012, "global_step": 204712, "epoch": 4874} {"train_loss": -7.175248146057129, "global_step": 204713, "epoch": 4874} {"train_loss": -7.288829326629639, "global_step": 204714, "epoch": 4874} {"train_loss": -7.1927571296691895, "global_step": 204715, "epoch": 4874} {"train_loss": -7.240151882171631, "global_step": 204716, "epoch": 4874} {"train_loss": -7.2942609786987305, "global_step": 204717, "epoch": 4874} {"train_loss": -7.2082600593566895, "global_step": 204718, "epoch": 4874} {"train_loss": -7.157620906829834, "global_step": 204719, "epoch": 4874} {"train_loss": -7.33537483215332, "global_step": 204720, "epoch": 4874} {"train_loss": -7.093182563781738, "global_step": 204721, "epoch": 4874} {"train_loss": -7.395796298980713, "global_step": 204722, "epoch": 4874} {"train_loss": -7.243705749511719, "global_step": 204723, "epoch": 4874} {"train_loss": -7.294032096862793, "global_step": 204724, "epoch": 4874} {"train_loss": -7.234557151794434, "global_step": 204725, "epoch": 4874} {"train_loss": -7.1660284996032715, "global_step": 204726, "epoch": 4874} {"train_loss": -7.237356185913086, "global_step": 204727, "epoch": 4874} {"train_loss": -7.233519554138184, "global_step": 204728, "epoch": 4874} {"train_loss": -7.1793365478515625, "global_step": 204729, "epoch": 4874} {"train_loss": -7.265078544616699, "global_step": 204730, "epoch": 4874} {"train_loss": -7.2567315101623535, "global_step": 204731, "epoch": 4874} {"train_loss": -7.1630988121032715, "global_step": 204732, "epoch": 4874} {"train_loss": -7.290985107421875, "global_step": 204733, "epoch": 4874} {"train_loss": -7.208946704864502, "global_step": 204734, "epoch": 4874} {"train_loss": -7.307319641113281, "global_step": 204735, "epoch": 4874} {"train_loss": -7.26279878616333, "global_step": 204736, "epoch": 4874} {"train_loss": -7.200296401977539, "global_step": 204737, "epoch": 4874} {"train_loss": -7.232778072357178, "global_step": 204738, "epoch": 4874} {"train_loss": -7.229671478271484, "global_step": 204739, "epoch": 4874} {"train_loss": -7.282458782196045, "global_step": 204740, "epoch": 4874} {"train_loss": -7.349884986877441, "global_step": 204741, "epoch": 4874} {"train_loss": -7.229754447937012, "global_step": 204742, "epoch": 4874} {"train_loss": -7.3272504806518555, "global_step": 204743, "epoch": 4874} {"train_loss": -7.315828323364258, "global_step": 204744, "epoch": 4874} {"train_loss": -7.220120429992676, "global_step": 204745, "epoch": 4874} {"train_loss": -7.257845878601074, "global_step": 204746, "epoch": 4874} {"train_loss": -7.201735496520996, "global_step": 204747, "epoch": 4874} {"train_loss": -7.312227249145508, "global_step": 204748, "epoch": 4874} {"train_loss": -7.247008902685983, "global_step": 204749, "epoch": 4874, "val_loss": 81597.0390625} {"train_loss": -7.175905704498291, "global_step": 204750, "epoch": 4875} {"train_loss": -7.330583572387695, "global_step": 204751, "epoch": 4875} {"train_loss": -7.275457859039307, "global_step": 204752, "epoch": 4875} {"train_loss": -7.317806243896484, "global_step": 204753, "epoch": 4875} {"train_loss": -7.407540321350098, "global_step": 204754, "epoch": 4875} {"train_loss": -7.270086288452148, "global_step": 204755, "epoch": 4875} {"train_loss": -7.41722297668457, "global_step": 204756, "epoch": 4875} {"train_loss": -7.392821788787842, "global_step": 204757, "epoch": 4875} {"train_loss": -7.331709861755371, "global_step": 204758, "epoch": 4875} {"train_loss": -7.402204990386963, "global_step": 204759, "epoch": 4875} {"train_loss": -7.202553749084473, "global_step": 204760, "epoch": 4875} {"train_loss": -7.360810279846191, "global_step": 204761, "epoch": 4875} {"train_loss": -7.317387580871582, "global_step": 204762, "epoch": 4875} {"train_loss": -7.346165180206299, "global_step": 204763, "epoch": 4875} {"train_loss": -7.3590545654296875, "global_step": 204764, "epoch": 4875} {"train_loss": -7.345081329345703, "global_step": 204765, "epoch": 4875} {"train_loss": -7.4594550132751465, "global_step": 204766, "epoch": 4875} {"train_loss": -7.349411964416504, "global_step": 204767, "epoch": 4875} {"train_loss": -7.351977825164795, "global_step": 204768, "epoch": 4875} {"train_loss": -7.427546501159668, "global_step": 204769, "epoch": 4875} {"train_loss": -7.323813438415527, "global_step": 204770, "epoch": 4875} {"train_loss": -7.339690685272217, "global_step": 204771, "epoch": 4875} {"train_loss": -7.415932655334473, "global_step": 204772, "epoch": 4875} {"train_loss": -7.332313537597656, "global_step": 204773, "epoch": 4875} {"train_loss": -7.278425216674805, "global_step": 204774, "epoch": 4875} {"train_loss": -7.32393741607666, "global_step": 204775, "epoch": 4875} {"train_loss": -7.338441371917725, "global_step": 204776, "epoch": 4875} {"train_loss": -7.318508148193359, "global_step": 204777, "epoch": 4875} {"train_loss": -7.083841323852539, "global_step": 204778, "epoch": 4875} {"train_loss": -7.3125104904174805, "global_step": 204779, "epoch": 4875} {"train_loss": -7.276727676391602, "global_step": 204780, "epoch": 4875} {"train_loss": -7.292904853820801, "global_step": 204781, "epoch": 4875} {"train_loss": -7.333435535430908, "global_step": 204782, "epoch": 4875} {"train_loss": -7.422534942626953, "global_step": 204783, "epoch": 4875} {"train_loss": -7.28799295425415, "global_step": 204784, "epoch": 4875} {"train_loss": -7.312821865081787, "global_step": 204785, "epoch": 4875} {"train_loss": -7.331618309020996, "global_step": 204786, "epoch": 4875} {"train_loss": -7.320939064025879, "global_step": 204787, "epoch": 4875} {"train_loss": -7.356978416442871, "global_step": 204788, "epoch": 4875} {"train_loss": -7.2871246337890625, "global_step": 204789, "epoch": 4875} {"train_loss": -7.3472089767456055, "global_step": 204790, "epoch": 4875} {"train_loss": -7.3264787424178355, "global_step": 204791, "epoch": 4875, "val_loss": 81546.7890625} {"train_loss": -7.275242805480957, "global_step": 204792, "epoch": 4876} {"train_loss": -7.3890380859375, "global_step": 204793, "epoch": 4876} {"train_loss": -7.270102500915527, "global_step": 204794, "epoch": 4876} {"train_loss": -7.321897506713867, "global_step": 204795, "epoch": 4876} {"train_loss": -7.243373870849609, "global_step": 204796, "epoch": 4876} {"train_loss": -7.199812412261963, "global_step": 204797, "epoch": 4876} {"train_loss": -7.341433525085449, "global_step": 204798, "epoch": 4876} {"train_loss": -7.357437610626221, "global_step": 204799, "epoch": 4876} {"train_loss": -7.316874980926514, "global_step": 204800, "epoch": 4876} {"train_loss": -7.357030868530273, "global_step": 204801, "epoch": 4876} {"train_loss": -7.276893138885498, "global_step": 204802, "epoch": 4876} {"train_loss": -7.283110618591309, "global_step": 204803, "epoch": 4876} {"train_loss": -7.333923816680908, "global_step": 204804, "epoch": 4876} {"train_loss": -7.253478050231934, "global_step": 204805, "epoch": 4876} {"train_loss": -7.3553924560546875, "global_step": 204806, "epoch": 4876} {"train_loss": -7.433620452880859, "global_step": 204807, "epoch": 4876} {"train_loss": -7.249545574188232, "global_step": 204808, "epoch": 4876} {"train_loss": -7.354111194610596, "global_step": 204809, "epoch": 4876} {"train_loss": -7.257197380065918, "global_step": 204810, "epoch": 4876} {"train_loss": -7.309185981750488, "global_step": 204811, "epoch": 4876} {"train_loss": -7.437285900115967, "global_step": 204812, "epoch": 4876} {"train_loss": -7.306767463684082, "global_step": 204813, "epoch": 4876} {"train_loss": -7.271299362182617, "global_step": 204814, "epoch": 4876} {"train_loss": -7.257891654968262, "global_step": 204815, "epoch": 4876} {"train_loss": -7.4052019119262695, "global_step": 204816, "epoch": 4876} {"train_loss": -7.212730884552002, "global_step": 204817, "epoch": 4876} {"train_loss": -7.31693172454834, "global_step": 204818, "epoch": 4876} {"train_loss": -7.2492995262146, "global_step": 204819, "epoch": 4876} {"train_loss": -7.366607189178467, "global_step": 204820, "epoch": 4876} {"train_loss": -7.385272979736328, "global_step": 204821, "epoch": 4876} {"train_loss": -7.339381217956543, "global_step": 204822, "epoch": 4876} {"train_loss": -7.306236267089844, "global_step": 204823, "epoch": 4876} {"train_loss": -7.207937240600586, "global_step": 204824, "epoch": 4876} {"train_loss": -7.410327911376953, "global_step": 204825, "epoch": 4876} {"train_loss": -7.3088483810424805, "global_step": 204826, "epoch": 4876} {"train_loss": -7.289553642272949, "global_step": 204827, "epoch": 4876} {"train_loss": -7.425793170928955, "global_step": 204828, "epoch": 4876} {"train_loss": -7.303271770477295, "global_step": 204829, "epoch": 4876} {"train_loss": -7.386795520782471, "global_step": 204830, "epoch": 4876} {"train_loss": -7.405814170837402, "global_step": 204831, "epoch": 4876} {"train_loss": -7.38084602355957, "global_step": 204832, "epoch": 4876} {"train_loss": -7.31826358749753, "global_step": 204833, "epoch": 4876, "val_loss": 81952.8203125} {"train_loss": -7.341373920440674, "global_step": 204834, "epoch": 4877} {"train_loss": -7.3627753257751465, "global_step": 204835, "epoch": 4877} {"train_loss": -7.407174587249756, "global_step": 204836, "epoch": 4877} {"train_loss": -7.3973708152771, "global_step": 204837, "epoch": 4877} {"train_loss": -7.359094619750977, "global_step": 204838, "epoch": 4877} {"train_loss": -7.2540669441223145, "global_step": 204839, "epoch": 4877} {"train_loss": -7.395205020904541, "global_step": 204840, "epoch": 4877} {"train_loss": -7.332427978515625, "global_step": 204841, "epoch": 4877} {"train_loss": -7.285987377166748, "global_step": 204842, "epoch": 4877} {"train_loss": -7.325405597686768, "global_step": 204843, "epoch": 4877} {"train_loss": -7.26707124710083, "global_step": 204844, "epoch": 4877} {"train_loss": -7.412774085998535, "global_step": 204845, "epoch": 4877} {"train_loss": -7.280834197998047, "global_step": 204846, "epoch": 4877} {"train_loss": -7.179600715637207, "global_step": 204847, "epoch": 4877} {"train_loss": -7.436261177062988, "global_step": 204848, "epoch": 4877} {"train_loss": -7.296710968017578, "global_step": 204849, "epoch": 4877} {"train_loss": -7.2808732986450195, "global_step": 204850, "epoch": 4877} {"train_loss": -7.306456565856934, "global_step": 204851, "epoch": 4877} {"train_loss": -7.329000949859619, "global_step": 204852, "epoch": 4877} {"train_loss": -7.314530372619629, "global_step": 204853, "epoch": 4877} {"train_loss": -7.322292804718018, "global_step": 204854, "epoch": 4877} {"train_loss": -7.4207587242126465, "global_step": 204855, "epoch": 4877} {"train_loss": -7.278899192810059, "global_step": 204856, "epoch": 4877} {"train_loss": -7.379467964172363, "global_step": 204857, "epoch": 4877} {"train_loss": -7.313107490539551, "global_step": 204858, "epoch": 4877} {"train_loss": -7.312836647033691, "global_step": 204859, "epoch": 4877} {"train_loss": -7.413642883300781, "global_step": 204860, "epoch": 4877} {"train_loss": -7.336358070373535, "global_step": 204861, "epoch": 4877} {"train_loss": -7.430019378662109, "global_step": 204862, "epoch": 4877} {"train_loss": -7.283987522125244, "global_step": 204863, "epoch": 4877} {"train_loss": -7.308315277099609, "global_step": 204864, "epoch": 4877} {"train_loss": -7.429560661315918, "global_step": 204865, "epoch": 4877} {"train_loss": -7.390481472015381, "global_step": 204866, "epoch": 4877} {"train_loss": -7.322224140167236, "global_step": 204867, "epoch": 4877} {"train_loss": -7.34766960144043, "global_step": 204868, "epoch": 4877} {"train_loss": -7.342099189758301, "global_step": 204869, "epoch": 4877} {"train_loss": -7.329019546508789, "global_step": 204870, "epoch": 4877} {"train_loss": -7.351265907287598, "global_step": 204871, "epoch": 4877} {"train_loss": -7.297213077545166, "global_step": 204872, "epoch": 4877} {"train_loss": -7.1954145431518555, "global_step": 204873, "epoch": 4877} {"train_loss": -7.2998456954956055, "global_step": 204874, "epoch": 4877} {"train_loss": -7.330615872428531, "global_step": 204875, "epoch": 4877, "val_loss": 81884.8671875} {"train_loss": -7.395720481872559, "global_step": 204876, "epoch": 4878} {"train_loss": -7.189027309417725, "global_step": 204877, "epoch": 4878} {"train_loss": -7.111034393310547, "global_step": 204878, "epoch": 4878} {"train_loss": -7.352725982666016, "global_step": 204879, "epoch": 4878} {"train_loss": -7.251859188079834, "global_step": 204880, "epoch": 4878} {"train_loss": -7.296303749084473, "global_step": 204881, "epoch": 4878} {"train_loss": -7.290686130523682, "global_step": 204882, "epoch": 4878} {"train_loss": -7.227600574493408, "global_step": 204883, "epoch": 4878} {"train_loss": -7.2349677085876465, "global_step": 204884, "epoch": 4878} {"train_loss": -7.303986072540283, "global_step": 204885, "epoch": 4878} {"train_loss": -7.285800457000732, "global_step": 204886, "epoch": 4878} {"train_loss": -7.268886089324951, "global_step": 204887, "epoch": 4878} {"train_loss": -7.160513401031494, "global_step": 204888, "epoch": 4878} {"train_loss": -7.233500957489014, "global_step": 204889, "epoch": 4878} {"train_loss": -7.2277679443359375, "global_step": 204890, "epoch": 4878} {"train_loss": -7.155942916870117, "global_step": 204891, "epoch": 4878} {"train_loss": -7.0682830810546875, "global_step": 204892, "epoch": 4878} {"train_loss": -7.230679512023926, "global_step": 204893, "epoch": 4878} {"train_loss": -7.135781764984131, "global_step": 204894, "epoch": 4878} {"train_loss": -7.149306297302246, "global_step": 204895, "epoch": 4878} {"train_loss": -7.080709934234619, "global_step": 204896, "epoch": 4878} {"train_loss": -7.399697303771973, "global_step": 204897, "epoch": 4878} {"train_loss": -7.156649589538574, "global_step": 204898, "epoch": 4878} {"train_loss": -7.243412017822266, "global_step": 204899, "epoch": 4878} {"train_loss": -7.191804885864258, "global_step": 204900, "epoch": 4878} {"train_loss": -7.280213356018066, "global_step": 204901, "epoch": 4878} {"train_loss": -7.251308917999268, "global_step": 204902, "epoch": 4878} {"train_loss": -7.193782329559326, "global_step": 204903, "epoch": 4878} {"train_loss": -7.256907939910889, "global_step": 204904, "epoch": 4878} {"train_loss": -7.313940048217773, "global_step": 204905, "epoch": 4878} {"train_loss": -7.379071235656738, "global_step": 204906, "epoch": 4878} {"train_loss": -7.21882438659668, "global_step": 204907, "epoch": 4878} {"train_loss": -7.398862361907959, "global_step": 204908, "epoch": 4878} {"train_loss": -7.434051990509033, "global_step": 204909, "epoch": 4878} {"train_loss": -7.336148262023926, "global_step": 204910, "epoch": 4878} {"train_loss": -7.3420867919921875, "global_step": 204911, "epoch": 4878} {"train_loss": -7.3660664558410645, "global_step": 204912, "epoch": 4878} {"train_loss": -7.327522277832031, "global_step": 204913, "epoch": 4878} {"train_loss": -7.360806465148926, "global_step": 204914, "epoch": 4878} {"train_loss": -7.419045448303223, "global_step": 204915, "epoch": 4878} {"train_loss": -7.326292991638184, "global_step": 204916, "epoch": 4878} {"train_loss": -7.26693514415196, "global_step": 204917, "epoch": 4878, "val_loss": 81622.375} {"train_loss": -7.289250373840332, "global_step": 204918, "epoch": 4879} {"train_loss": -7.331761837005615, "global_step": 204919, "epoch": 4879} {"train_loss": -7.389100074768066, "global_step": 204920, "epoch": 4879} {"train_loss": -7.307867050170898, "global_step": 204921, "epoch": 4879} {"train_loss": -7.383432865142822, "global_step": 204922, "epoch": 4879} {"train_loss": -7.354970932006836, "global_step": 204923, "epoch": 4879} {"train_loss": -7.294269561767578, "global_step": 204924, "epoch": 4879} {"train_loss": -7.430600166320801, "global_step": 204925, "epoch": 4879} {"train_loss": -7.507234573364258, "global_step": 204926, "epoch": 4879} {"train_loss": -7.483917236328125, "global_step": 204927, "epoch": 4879} {"train_loss": -7.548017501831055, "global_step": 204928, "epoch": 4879} {"train_loss": -7.364098072052002, "global_step": 204929, "epoch": 4879} {"train_loss": -7.3302083015441895, "global_step": 204930, "epoch": 4879} {"train_loss": -7.337186813354492, "global_step": 204931, "epoch": 4879} {"train_loss": -7.345221042633057, "global_step": 204932, "epoch": 4879} {"train_loss": -7.326155662536621, "global_step": 204933, "epoch": 4879} {"train_loss": -7.375916481018066, "global_step": 204934, "epoch": 4879} {"train_loss": -7.403647422790527, "global_step": 204935, "epoch": 4879} {"train_loss": -7.335005760192871, "global_step": 204936, "epoch": 4879} {"train_loss": -7.3510422706604, "global_step": 204937, "epoch": 4879} {"train_loss": -7.282687187194824, "global_step": 204938, "epoch": 4879} {"train_loss": -7.431349754333496, "global_step": 204939, "epoch": 4879} {"train_loss": -7.415238380432129, "global_step": 204940, "epoch": 4879} {"train_loss": -7.413753986358643, "global_step": 204941, "epoch": 4879} {"train_loss": -7.308274745941162, "global_step": 204942, "epoch": 4879} {"train_loss": -7.418338775634766, "global_step": 204943, "epoch": 4879} {"train_loss": -7.269626617431641, "global_step": 204944, "epoch": 4879} {"train_loss": -7.334911346435547, "global_step": 204945, "epoch": 4879} {"train_loss": -7.402369499206543, "global_step": 204946, "epoch": 4879} {"train_loss": -7.408683776855469, "global_step": 204947, "epoch": 4879} {"train_loss": -7.37293004989624, "global_step": 204948, "epoch": 4879} {"train_loss": -7.308882713317871, "global_step": 204949, "epoch": 4879} {"train_loss": -7.333800792694092, "global_step": 204950, "epoch": 4879} {"train_loss": -7.3483171463012695, "global_step": 204951, "epoch": 4879} {"train_loss": -7.367156505584717, "global_step": 204952, "epoch": 4879} {"train_loss": -7.397185802459717, "global_step": 204953, "epoch": 4879} {"train_loss": -7.330057144165039, "global_step": 204954, "epoch": 4879} {"train_loss": -7.401486873626709, "global_step": 204955, "epoch": 4879} {"train_loss": -7.28399658203125, "global_step": 204956, "epoch": 4879} {"train_loss": -7.09637451171875, "global_step": 204957, "epoch": 4879} {"train_loss": -7.402769565582275, "global_step": 204958, "epoch": 4879} {"train_loss": -7.359065634863717, "global_step": 204959, "epoch": 4879, "val_loss": 81731.765625} {"train_loss": -7.245212078094482, "global_step": 204960, "epoch": 4880} {"train_loss": -7.316524982452393, "global_step": 204961, "epoch": 4880} {"train_loss": -7.210484504699707, "global_step": 204962, "epoch": 4880} {"train_loss": -7.164039611816406, "global_step": 204963, "epoch": 4880} {"train_loss": -7.0345458984375, "global_step": 204964, "epoch": 4880} {"train_loss": -7.0598039627075195, "global_step": 204965, "epoch": 4880} {"train_loss": -7.095681190490723, "global_step": 204966, "epoch": 4880} {"train_loss": -7.076108932495117, "global_step": 204967, "epoch": 4880} {"train_loss": -7.210736274719238, "global_step": 204968, "epoch": 4880} {"train_loss": -7.19140100479126, "global_step": 204969, "epoch": 4880} {"train_loss": -7.022884845733643, "global_step": 204970, "epoch": 4880} {"train_loss": -7.28817892074585, "global_step": 204971, "epoch": 4880} {"train_loss": -7.10526704788208, "global_step": 204972, "epoch": 4880} {"train_loss": -7.200922012329102, "global_step": 204973, "epoch": 4880} {"train_loss": -7.186158657073975, "global_step": 204974, "epoch": 4880} {"train_loss": -7.1436262130737305, "global_step": 204975, "epoch": 4880} {"train_loss": -7.19657039642334, "global_step": 204976, "epoch": 4880} {"train_loss": -7.295380592346191, "global_step": 204977, "epoch": 4880} {"train_loss": -7.210298538208008, "global_step": 204978, "epoch": 4880} {"train_loss": -7.265929222106934, "global_step": 204979, "epoch": 4880} {"train_loss": -7.107106685638428, "global_step": 204980, "epoch": 4880} {"train_loss": -7.0569634437561035, "global_step": 204981, "epoch": 4880} {"train_loss": -7.1376214027404785, "global_step": 204982, "epoch": 4880} {"train_loss": -7.1190505027771, "global_step": 204983, "epoch": 4880} {"train_loss": -7.231710910797119, "global_step": 204984, "epoch": 4880} {"train_loss": -7.164172172546387, "global_step": 204985, "epoch": 4880} {"train_loss": -7.151493072509766, "global_step": 204986, "epoch": 4880} {"train_loss": -7.223069190979004, "global_step": 204987, "epoch": 4880} {"train_loss": -7.14629602432251, "global_step": 204988, "epoch": 4880} {"train_loss": -7.264141082763672, "global_step": 204989, "epoch": 4880} {"train_loss": -7.185986518859863, "global_step": 204990, "epoch": 4880} {"train_loss": -7.154099464416504, "global_step": 204991, "epoch": 4880} {"train_loss": -7.205389022827148, "global_step": 204992, "epoch": 4880} {"train_loss": -7.208474159240723, "global_step": 204993, "epoch": 4880} {"train_loss": -7.166904449462891, "global_step": 204994, "epoch": 4880} {"train_loss": -7.32073450088501, "global_step": 204995, "epoch": 4880} {"train_loss": -7.346667766571045, "global_step": 204996, "epoch": 4880} {"train_loss": -7.254651069641113, "global_step": 204997, "epoch": 4880} {"train_loss": -7.220947742462158, "global_step": 204998, "epoch": 4880} {"train_loss": -7.351188659667969, "global_step": 204999, "epoch": 4880} {"train_loss": -7.329374313354492, "global_step": 205000, "epoch": 4880} {"train_loss": -7.191097566059658, "global_step": 205001, "epoch": 4880, "val_loss": 81789.5625} {"train_loss": -7.374497413635254, "global_step": 205002, "epoch": 4881} {"train_loss": -7.313982009887695, "global_step": 205003, "epoch": 4881} {"train_loss": -7.29619026184082, "global_step": 205004, "epoch": 4881} {"train_loss": -7.148153305053711, "global_step": 205005, "epoch": 4881} {"train_loss": -7.311749458312988, "global_step": 205006, "epoch": 4881} {"train_loss": -7.305211067199707, "global_step": 205007, "epoch": 4881} {"train_loss": -7.355568885803223, "global_step": 205008, "epoch": 4881} {"train_loss": -7.282596111297607, "global_step": 205009, "epoch": 4881} {"train_loss": -7.2407426834106445, "global_step": 205010, "epoch": 4881} {"train_loss": -7.383121490478516, "global_step": 205011, "epoch": 4881} {"train_loss": -7.2322845458984375, "global_step": 205012, "epoch": 4881} {"train_loss": -7.28782844543457, "global_step": 205013, "epoch": 4881} {"train_loss": -7.236359119415283, "global_step": 205014, "epoch": 4881} {"train_loss": -7.223397254943848, "global_step": 205015, "epoch": 4881} {"train_loss": -7.241786479949951, "global_step": 205016, "epoch": 4881} {"train_loss": -7.17909049987793, "global_step": 205017, "epoch": 4881} {"train_loss": -7.266977787017822, "global_step": 205018, "epoch": 4881} {"train_loss": -7.1542558670043945, "global_step": 205019, "epoch": 4881} {"train_loss": -7.364472389221191, "global_step": 205020, "epoch": 4881} {"train_loss": -7.200992584228516, "global_step": 205021, "epoch": 4881} {"train_loss": -7.263491630554199, "global_step": 205022, "epoch": 4881} {"train_loss": -7.368870258331299, "global_step": 205023, "epoch": 4881} {"train_loss": -7.186316013336182, "global_step": 205024, "epoch": 4881} {"train_loss": -7.345811367034912, "global_step": 205025, "epoch": 4881} {"train_loss": -7.28004264831543, "global_step": 205026, "epoch": 4881} {"train_loss": -7.244110107421875, "global_step": 205027, "epoch": 4881} {"train_loss": -7.175127029418945, "global_step": 205028, "epoch": 4881} {"train_loss": -7.306371688842773, "global_step": 205029, "epoch": 4881} {"train_loss": -7.396995544433594, "global_step": 205030, "epoch": 4881} {"train_loss": -7.294548034667969, "global_step": 205031, "epoch": 4881} {"train_loss": -7.237520694732666, "global_step": 205032, "epoch": 4881} {"train_loss": -7.302865028381348, "global_step": 205033, "epoch": 4881} {"train_loss": -7.285590648651123, "global_step": 205034, "epoch": 4881} {"train_loss": -7.303165435791016, "global_step": 205035, "epoch": 4881} {"train_loss": -7.352516174316406, "global_step": 205036, "epoch": 4881} {"train_loss": -7.374665260314941, "global_step": 205037, "epoch": 4881} {"train_loss": -7.319468021392822, "global_step": 205038, "epoch": 4881} {"train_loss": -7.418257713317871, "global_step": 205039, "epoch": 4881} {"train_loss": -7.306334495544434, "global_step": 205040, "epoch": 4881} {"train_loss": -7.320863723754883, "global_step": 205041, "epoch": 4881} {"train_loss": -7.254062652587891, "global_step": 205042, "epoch": 4881} {"train_loss": -7.286238318397885, "global_step": 205043, "epoch": 4881, "val_loss": 81877.5078125} {"train_loss": -7.344616413116455, "global_step": 205044, "epoch": 4882} {"train_loss": -7.379417419433594, "global_step": 205045, "epoch": 4882} {"train_loss": -7.287014007568359, "global_step": 205046, "epoch": 4882} {"train_loss": -7.325359344482422, "global_step": 205047, "epoch": 4882} {"train_loss": -7.397214889526367, "global_step": 205048, "epoch": 4882} {"train_loss": -7.379133701324463, "global_step": 205049, "epoch": 4882} {"train_loss": -7.312833786010742, "global_step": 205050, "epoch": 4882} {"train_loss": -7.378113746643066, "global_step": 205051, "epoch": 4882} {"train_loss": -7.199511528015137, "global_step": 205052, "epoch": 4882} {"train_loss": -7.235194206237793, "global_step": 205053, "epoch": 4882} {"train_loss": -7.36363410949707, "global_step": 205054, "epoch": 4882} {"train_loss": -7.190977573394775, "global_step": 205055, "epoch": 4882} {"train_loss": -7.2975873947143555, "global_step": 205056, "epoch": 4882} {"train_loss": -7.301226615905762, "global_step": 205057, "epoch": 4882} {"train_loss": -7.203643798828125, "global_step": 205058, "epoch": 4882} {"train_loss": -7.276546001434326, "global_step": 205059, "epoch": 4882} {"train_loss": -7.315434455871582, "global_step": 205060, "epoch": 4882} {"train_loss": -7.141078948974609, "global_step": 205061, "epoch": 4882} {"train_loss": -7.40927791595459, "global_step": 205062, "epoch": 4882} {"train_loss": -7.096864700317383, "global_step": 205063, "epoch": 4882} {"train_loss": -7.394981861114502, "global_step": 205064, "epoch": 4882} {"train_loss": -7.411781311035156, "global_step": 205065, "epoch": 4882} {"train_loss": -7.314919471740723, "global_step": 205066, "epoch": 4882} {"train_loss": -7.3441667556762695, "global_step": 205067, "epoch": 4882} {"train_loss": -7.201203346252441, "global_step": 205068, "epoch": 4882} {"train_loss": -7.335544109344482, "global_step": 205069, "epoch": 4882} {"train_loss": -7.277597427368164, "global_step": 205070, "epoch": 4882} {"train_loss": -7.322342872619629, "global_step": 205071, "epoch": 4882} {"train_loss": -7.251105308532715, "global_step": 205072, "epoch": 4882} {"train_loss": -7.163962364196777, "global_step": 205073, "epoch": 4882} {"train_loss": -7.235539436340332, "global_step": 205074, "epoch": 4882} {"train_loss": -7.166134834289551, "global_step": 205075, "epoch": 4882} {"train_loss": -7.34724760055542, "global_step": 205076, "epoch": 4882} {"train_loss": -7.133157730102539, "global_step": 205077, "epoch": 4882} {"train_loss": -7.26915168762207, "global_step": 205078, "epoch": 4882} {"train_loss": -7.129871368408203, "global_step": 205079, "epoch": 4882} {"train_loss": -7.349389553070068, "global_step": 205080, "epoch": 4882} {"train_loss": -7.087544918060303, "global_step": 205081, "epoch": 4882} {"train_loss": -7.354981422424316, "global_step": 205082, "epoch": 4882} {"train_loss": -7.219512462615967, "global_step": 205083, "epoch": 4882} {"train_loss": -7.225218296051025, "global_step": 205084, "epoch": 4882} {"train_loss": -7.274124554225376, "global_step": 205085, "epoch": 4882, "val_loss": 82155.8671875} {"train_loss": -7.208595275878906, "global_step": 205086, "epoch": 4883} {"train_loss": -7.1844072341918945, "global_step": 205087, "epoch": 4883} {"train_loss": -7.282360076904297, "global_step": 205088, "epoch": 4883} {"train_loss": -7.13739013671875, "global_step": 205089, "epoch": 4883} {"train_loss": -7.305905342102051, "global_step": 205090, "epoch": 4883} {"train_loss": -7.33791446685791, "global_step": 205091, "epoch": 4883} {"train_loss": -7.308928489685059, "global_step": 205092, "epoch": 4883} {"train_loss": -7.263021945953369, "global_step": 205093, "epoch": 4883} {"train_loss": -7.301965713500977, "global_step": 205094, "epoch": 4883} {"train_loss": -7.356256484985352, "global_step": 205095, "epoch": 4883} {"train_loss": -7.298246383666992, "global_step": 205096, "epoch": 4883} {"train_loss": -7.336692810058594, "global_step": 205097, "epoch": 4883} {"train_loss": -7.530643939971924, "global_step": 205098, "epoch": 4883} {"train_loss": -7.344270706176758, "global_step": 205099, "epoch": 4883} {"train_loss": -7.360965728759766, "global_step": 205100, "epoch": 4883} {"train_loss": -7.323188781738281, "global_step": 205101, "epoch": 4883} {"train_loss": -7.262627124786377, "global_step": 205102, "epoch": 4883} {"train_loss": -7.342520713806152, "global_step": 205103, "epoch": 4883} {"train_loss": -7.336734771728516, "global_step": 205104, "epoch": 4883} {"train_loss": -7.403043746948242, "global_step": 205105, "epoch": 4883} {"train_loss": -7.250182151794434, "global_step": 205106, "epoch": 4883} {"train_loss": -7.320047378540039, "global_step": 205107, "epoch": 4883} {"train_loss": -7.318908214569092, "global_step": 205108, "epoch": 4883} {"train_loss": -7.279541969299316, "global_step": 205109, "epoch": 4883} {"train_loss": -7.3007097244262695, "global_step": 205110, "epoch": 4883} {"train_loss": -7.296676158905029, "global_step": 205111, "epoch": 4883} {"train_loss": -7.430594444274902, "global_step": 205112, "epoch": 4883} {"train_loss": -7.342560768127441, "global_step": 205113, "epoch": 4883} {"train_loss": -7.329309940338135, "global_step": 205114, "epoch": 4883} {"train_loss": -7.375253200531006, "global_step": 205115, "epoch": 4883} {"train_loss": -7.290218353271484, "global_step": 205116, "epoch": 4883} {"train_loss": -7.3744916915893555, "global_step": 205117, "epoch": 4883} {"train_loss": -7.189144611358643, "global_step": 205118, "epoch": 4883} {"train_loss": -7.376304626464844, "global_step": 205119, "epoch": 4883} {"train_loss": -7.289115905761719, "global_step": 205120, "epoch": 4883} {"train_loss": -7.2466044425964355, "global_step": 205121, "epoch": 4883} {"train_loss": -7.348076820373535, "global_step": 205122, "epoch": 4883} {"train_loss": -7.309314727783203, "global_step": 205123, "epoch": 4883} {"train_loss": -7.245664119720459, "global_step": 205124, "epoch": 4883} {"train_loss": -7.276375770568848, "global_step": 205125, "epoch": 4883} {"train_loss": -7.345542907714844, "global_step": 205126, "epoch": 4883} {"train_loss": -7.311639831179664, "global_step": 205127, "epoch": 4883, "val_loss": 81744.2421875} {"train_loss": -7.378218650817871, "global_step": 205128, "epoch": 4884} {"train_loss": -7.408190727233887, "global_step": 205129, "epoch": 4884} {"train_loss": -7.268478870391846, "global_step": 205130, "epoch": 4884} {"train_loss": -7.243138313293457, "global_step": 205131, "epoch": 4884} {"train_loss": -7.372330188751221, "global_step": 205132, "epoch": 4884} {"train_loss": -7.2804999351501465, "global_step": 205133, "epoch": 4884} {"train_loss": -7.228419303894043, "global_step": 205134, "epoch": 4884} {"train_loss": -7.292194366455078, "global_step": 205135, "epoch": 4884} {"train_loss": -7.306952476501465, "global_step": 205136, "epoch": 4884} {"train_loss": -7.393257141113281, "global_step": 205137, "epoch": 4884} {"train_loss": -7.347390651702881, "global_step": 205138, "epoch": 4884} {"train_loss": -7.2668986320495605, "global_step": 205139, "epoch": 4884} {"train_loss": -7.2829999923706055, "global_step": 205140, "epoch": 4884} {"train_loss": -7.39323091506958, "global_step": 205141, "epoch": 4884} {"train_loss": -7.375761032104492, "global_step": 205142, "epoch": 4884} {"train_loss": -7.358555793762207, "global_step": 205143, "epoch": 4884} {"train_loss": -7.322758197784424, "global_step": 205144, "epoch": 4884} {"train_loss": -7.302448272705078, "global_step": 205145, "epoch": 4884} {"train_loss": -7.413425445556641, "global_step": 205146, "epoch": 4884} {"train_loss": -7.35059118270874, "global_step": 205147, "epoch": 4884} {"train_loss": -7.349440097808838, "global_step": 205148, "epoch": 4884} {"train_loss": -7.428169250488281, "global_step": 205149, "epoch": 4884} {"train_loss": -7.35645866394043, "global_step": 205150, "epoch": 4884} {"train_loss": -7.371400833129883, "global_step": 205151, "epoch": 4884} {"train_loss": -7.428187370300293, "global_step": 205152, "epoch": 4884} {"train_loss": -7.387309551239014, "global_step": 205153, "epoch": 4884} {"train_loss": -7.280119895935059, "global_step": 205154, "epoch": 4884} {"train_loss": -7.43499755859375, "global_step": 205155, "epoch": 4884} {"train_loss": -7.438098430633545, "global_step": 205156, "epoch": 4884} {"train_loss": -7.3431196212768555, "global_step": 205157, "epoch": 4884} {"train_loss": -7.523096084594727, "global_step": 205158, "epoch": 4884} {"train_loss": -7.433516502380371, "global_step": 205159, "epoch": 4884} {"train_loss": -7.33881950378418, "global_step": 205160, "epoch": 4884} {"train_loss": -7.214754104614258, "global_step": 205161, "epoch": 4884} {"train_loss": -7.3644609451293945, "global_step": 205162, "epoch": 4884} {"train_loss": -7.1895904541015625, "global_step": 205163, "epoch": 4884} {"train_loss": -7.2074456214904785, "global_step": 205164, "epoch": 4884} {"train_loss": -7.296313285827637, "global_step": 205165, "epoch": 4884} {"train_loss": -7.298864841461182, "global_step": 205166, "epoch": 4884} {"train_loss": -7.171375274658203, "global_step": 205167, "epoch": 4884} {"train_loss": -7.370298385620117, "global_step": 205168, "epoch": 4884} {"train_loss": -7.335176967439198, "global_step": 205169, "epoch": 4884, "val_loss": 81697.8359375} {"train_loss": -7.288962364196777, "global_step": 205170, "epoch": 4885} {"train_loss": -7.296396255493164, "global_step": 205171, "epoch": 4885} {"train_loss": -7.2550225257873535, "global_step": 205172, "epoch": 4885} {"train_loss": -7.230893611907959, "global_step": 205173, "epoch": 4885} {"train_loss": -7.265535354614258, "global_step": 205174, "epoch": 4885} {"train_loss": -7.323627471923828, "global_step": 205175, "epoch": 4885} {"train_loss": -7.246445178985596, "global_step": 205176, "epoch": 4885} {"train_loss": -7.320699691772461, "global_step": 205177, "epoch": 4885} {"train_loss": -7.394114017486572, "global_step": 205178, "epoch": 4885} {"train_loss": -7.408837795257568, "global_step": 205179, "epoch": 4885} {"train_loss": -7.357309341430664, "global_step": 205180, "epoch": 4885} {"train_loss": -7.2965593338012695, "global_step": 205181, "epoch": 4885} {"train_loss": -7.323330879211426, "global_step": 205182, "epoch": 4885} {"train_loss": -7.454608917236328, "global_step": 205183, "epoch": 4885} {"train_loss": -7.286588668823242, "global_step": 205184, "epoch": 4885} {"train_loss": -7.226336479187012, "global_step": 205185, "epoch": 4885} {"train_loss": -7.443653106689453, "global_step": 205186, "epoch": 4885} {"train_loss": -7.35590934753418, "global_step": 205187, "epoch": 4885} {"train_loss": -7.357603073120117, "global_step": 205188, "epoch": 4885} {"train_loss": -7.29442834854126, "global_step": 205189, "epoch": 4885} {"train_loss": -7.266496181488037, "global_step": 205190, "epoch": 4885} {"train_loss": -7.489461898803711, "global_step": 205191, "epoch": 4885} {"train_loss": -7.344325065612793, "global_step": 205192, "epoch": 4885} {"train_loss": -7.240464210510254, "global_step": 205193, "epoch": 4885} {"train_loss": -7.4336256980896, "global_step": 205194, "epoch": 4885} {"train_loss": -7.318390846252441, "global_step": 205195, "epoch": 4885} {"train_loss": -7.356816291809082, "global_step": 205196, "epoch": 4885} {"train_loss": -7.2207746505737305, "global_step": 205197, "epoch": 4885} {"train_loss": -7.316521644592285, "global_step": 205198, "epoch": 4885} {"train_loss": -7.39434814453125, "global_step": 205199, "epoch": 4885} {"train_loss": -7.30756950378418, "global_step": 205200, "epoch": 4885} {"train_loss": -7.3297014236450195, "global_step": 205201, "epoch": 4885} {"train_loss": -7.371785640716553, "global_step": 205202, "epoch": 4885} {"train_loss": -7.226736068725586, "global_step": 205203, "epoch": 4885} {"train_loss": -7.327444076538086, "global_step": 205204, "epoch": 4885} {"train_loss": -7.20992374420166, "global_step": 205205, "epoch": 4885} {"train_loss": -7.3664350509643555, "global_step": 205206, "epoch": 4885} {"train_loss": -7.19409704208374, "global_step": 205207, "epoch": 4885} {"train_loss": -7.188977241516113, "global_step": 205208, "epoch": 4885} {"train_loss": -7.325416564941406, "global_step": 205209, "epoch": 4885} {"train_loss": -7.150275230407715, "global_step": 205210, "epoch": 4885} {"train_loss": -7.3103068215506415, "global_step": 205211, "epoch": 4885, "val_loss": 82029.6328125} {"train_loss": -7.2019734382629395, "global_step": 205212, "epoch": 4886} {"train_loss": -7.267743110656738, "global_step": 205213, "epoch": 4886} {"train_loss": -7.264266490936279, "global_step": 205214, "epoch": 4886} {"train_loss": -7.287370681762695, "global_step": 205215, "epoch": 4886} {"train_loss": -7.347003936767578, "global_step": 205216, "epoch": 4886} {"train_loss": -7.303755283355713, "global_step": 205217, "epoch": 4886} {"train_loss": -7.333542346954346, "global_step": 205218, "epoch": 4886} {"train_loss": -7.3109283447265625, "global_step": 205219, "epoch": 4886} {"train_loss": -7.2498064041137695, "global_step": 205220, "epoch": 4886} {"train_loss": -7.382900238037109, "global_step": 205221, "epoch": 4886} {"train_loss": -7.4118499755859375, "global_step": 205222, "epoch": 4886} {"train_loss": -7.265296936035156, "global_step": 205223, "epoch": 4886} {"train_loss": -7.226570129394531, "global_step": 205224, "epoch": 4886} {"train_loss": -7.3429765701293945, "global_step": 205225, "epoch": 4886} {"train_loss": -7.373443603515625, "global_step": 205226, "epoch": 4886} {"train_loss": -7.335623741149902, "global_step": 205227, "epoch": 4886} {"train_loss": -7.257833003997803, "global_step": 205228, "epoch": 4886} {"train_loss": -7.456185340881348, "global_step": 205229, "epoch": 4886} {"train_loss": -7.412431716918945, "global_step": 205230, "epoch": 4886} {"train_loss": -7.369800567626953, "global_step": 205231, "epoch": 4886} {"train_loss": -7.313769340515137, "global_step": 205232, "epoch": 4886} {"train_loss": -7.366395950317383, "global_step": 205233, "epoch": 4886} {"train_loss": -7.2688140869140625, "global_step": 205234, "epoch": 4886} {"train_loss": -7.324544906616211, "global_step": 205235, "epoch": 4886} {"train_loss": -7.367749214172363, "global_step": 205236, "epoch": 4886} {"train_loss": -7.312287330627441, "global_step": 205237, "epoch": 4886} {"train_loss": -7.459088325500488, "global_step": 205238, "epoch": 4886} {"train_loss": -7.301360130310059, "global_step": 205239, "epoch": 4886} {"train_loss": -7.253952980041504, "global_step": 205240, "epoch": 4886} {"train_loss": -7.233615875244141, "global_step": 205241, "epoch": 4886} {"train_loss": -7.163476943969727, "global_step": 205242, "epoch": 4886} {"train_loss": -7.14887809753418, "global_step": 205243, "epoch": 4886} {"train_loss": -7.166697978973389, "global_step": 205244, "epoch": 4886} {"train_loss": -7.43239688873291, "global_step": 205245, "epoch": 4886} {"train_loss": -7.1678996086120605, "global_step": 205246, "epoch": 4886} {"train_loss": -7.347846031188965, "global_step": 205247, "epoch": 4886} {"train_loss": -7.21579647064209, "global_step": 205248, "epoch": 4886} {"train_loss": -7.330409526824951, "global_step": 205249, "epoch": 4886} {"train_loss": -7.193491458892822, "global_step": 205250, "epoch": 4886} {"train_loss": -7.340551853179932, "global_step": 205251, "epoch": 4886} {"train_loss": -7.284496307373047, "global_step": 205252, "epoch": 4886} {"train_loss": -7.301560242970784, "global_step": 205253, "epoch": 4886, "val_loss": 81500.9921875} {"train_loss": -7.2558746337890625, "global_step": 205254, "epoch": 4887} {"train_loss": -7.224366188049316, "global_step": 205255, "epoch": 4887} {"train_loss": -7.319575786590576, "global_step": 205256, "epoch": 4887} {"train_loss": -7.367921829223633, "global_step": 205257, "epoch": 4887} {"train_loss": -7.322548866271973, "global_step": 205258, "epoch": 4887} {"train_loss": -7.321362495422363, "global_step": 205259, "epoch": 4887} {"train_loss": -7.359125137329102, "global_step": 205260, "epoch": 4887} {"train_loss": -7.3783464431762695, "global_step": 205261, "epoch": 4887} {"train_loss": -7.383018493652344, "global_step": 205262, "epoch": 4887} {"train_loss": -7.26354455947876, "global_step": 205263, "epoch": 4887} {"train_loss": -7.339601516723633, "global_step": 205264, "epoch": 4887} {"train_loss": -7.3682661056518555, "global_step": 205265, "epoch": 4887} {"train_loss": -7.304316520690918, "global_step": 205266, "epoch": 4887} {"train_loss": -7.363938808441162, "global_step": 205267, "epoch": 4887} {"train_loss": -7.3213725090026855, "global_step": 205268, "epoch": 4887} {"train_loss": -7.346385955810547, "global_step": 205269, "epoch": 4887} {"train_loss": -7.383065700531006, "global_step": 205270, "epoch": 4887} {"train_loss": -7.232774257659912, "global_step": 205271, "epoch": 4887} {"train_loss": -7.311076641082764, "global_step": 205272, "epoch": 4887} {"train_loss": -7.435439109802246, "global_step": 205273, "epoch": 4887} {"train_loss": -7.327250003814697, "global_step": 205274, "epoch": 4887} {"train_loss": -7.316176891326904, "global_step": 205275, "epoch": 4887} {"train_loss": -7.271726608276367, "global_step": 205276, "epoch": 4887} {"train_loss": -7.241368293762207, "global_step": 205277, "epoch": 4887} {"train_loss": -7.370495319366455, "global_step": 205278, "epoch": 4887} {"train_loss": -7.3512468338012695, "global_step": 205279, "epoch": 4887} {"train_loss": -7.291559219360352, "global_step": 205280, "epoch": 4887} {"train_loss": -7.4151716232299805, "global_step": 205281, "epoch": 4887} {"train_loss": -7.383464813232422, "global_step": 205282, "epoch": 4887} {"train_loss": -7.293622970581055, "global_step": 205283, "epoch": 4887} {"train_loss": -7.362082481384277, "global_step": 205284, "epoch": 4887} {"train_loss": -7.343993186950684, "global_step": 205285, "epoch": 4887} {"train_loss": -7.415909767150879, "global_step": 205286, "epoch": 4887} {"train_loss": -7.385045528411865, "global_step": 205287, "epoch": 4887} {"train_loss": -7.324566841125488, "global_step": 205288, "epoch": 4887} {"train_loss": -7.4239373207092285, "global_step": 205289, "epoch": 4887} {"train_loss": -7.402832508087158, "global_step": 205290, "epoch": 4887} {"train_loss": -7.433277606964111, "global_step": 205291, "epoch": 4887} {"train_loss": -7.376301288604736, "global_step": 205292, "epoch": 4887} {"train_loss": -7.510737895965576, "global_step": 205293, "epoch": 4887} {"train_loss": -7.349985599517822, "global_step": 205294, "epoch": 4887} {"train_loss": -7.348290761311849, "global_step": 205295, "epoch": 4887, "val_loss": 81769.453125} {"train_loss": -7.350836277008057, "global_step": 205296, "epoch": 4888} {"train_loss": -7.424525260925293, "global_step": 205297, "epoch": 4888} {"train_loss": -7.2491021156311035, "global_step": 205298, "epoch": 4888} {"train_loss": -7.300519943237305, "global_step": 205299, "epoch": 4888} {"train_loss": -7.238279342651367, "global_step": 205300, "epoch": 4888} {"train_loss": -7.320143699645996, "global_step": 205301, "epoch": 4888} {"train_loss": -7.36539363861084, "global_step": 205302, "epoch": 4888} {"train_loss": -7.379267692565918, "global_step": 205303, "epoch": 4888} {"train_loss": -7.406999111175537, "global_step": 205304, "epoch": 4888} {"train_loss": -7.320633411407471, "global_step": 205305, "epoch": 4888} {"train_loss": -7.239591598510742, "global_step": 205306, "epoch": 4888} {"train_loss": -7.353428840637207, "global_step": 205307, "epoch": 4888} {"train_loss": -7.34605598449707, "global_step": 205308, "epoch": 4888} {"train_loss": -7.292386531829834, "global_step": 205309, "epoch": 4888} {"train_loss": -7.3409104347229, "global_step": 205310, "epoch": 4888} {"train_loss": -7.297355651855469, "global_step": 205311, "epoch": 4888} {"train_loss": -7.281955242156982, "global_step": 205312, "epoch": 4888} {"train_loss": -7.2307233810424805, "global_step": 205313, "epoch": 4888} {"train_loss": -7.237464904785156, "global_step": 205314, "epoch": 4888} {"train_loss": -7.291247367858887, "global_step": 205315, "epoch": 4888} {"train_loss": -7.319271087646484, "global_step": 205316, "epoch": 4888} {"train_loss": -7.297435760498047, "global_step": 205317, "epoch": 4888} {"train_loss": -7.3016204833984375, "global_step": 205318, "epoch": 4888} {"train_loss": -7.211134910583496, "global_step": 205319, "epoch": 4888} {"train_loss": -7.391161918640137, "global_step": 205320, "epoch": 4888} {"train_loss": -7.360164165496826, "global_step": 205321, "epoch": 4888} {"train_loss": -7.303807258605957, "global_step": 205322, "epoch": 4888} {"train_loss": -7.328611850738525, "global_step": 205323, "epoch": 4888} {"train_loss": -7.321404933929443, "global_step": 205324, "epoch": 4888} {"train_loss": -7.408138275146484, "global_step": 205325, "epoch": 4888} {"train_loss": -7.2873687744140625, "global_step": 205326, "epoch": 4888} {"train_loss": -7.430919647216797, "global_step": 205327, "epoch": 4888} {"train_loss": -7.381311416625977, "global_step": 205328, "epoch": 4888} {"train_loss": -7.462629318237305, "global_step": 205329, "epoch": 4888} {"train_loss": -7.494894981384277, "global_step": 205330, "epoch": 4888} {"train_loss": -7.360066890716553, "global_step": 205331, "epoch": 4888} {"train_loss": -7.5123090744018555, "global_step": 205332, "epoch": 4888} {"train_loss": -7.448535442352295, "global_step": 205333, "epoch": 4888} {"train_loss": -7.334021091461182, "global_step": 205334, "epoch": 4888} {"train_loss": -7.352066993713379, "global_step": 205335, "epoch": 4888} {"train_loss": -7.261610984802246, "global_step": 205336, "epoch": 4888} {"train_loss": -7.3378410793486095, "global_step": 205337, "epoch": 4888, "val_loss": 81814.46875} {"train_loss": -7.307517051696777, "global_step": 205338, "epoch": 4889} {"train_loss": -7.442726135253906, "global_step": 205339, "epoch": 4889} {"train_loss": -7.424402713775635, "global_step": 205340, "epoch": 4889} {"train_loss": -7.409751892089844, "global_step": 205341, "epoch": 4889} {"train_loss": -7.3461809158325195, "global_step": 205342, "epoch": 4889} {"train_loss": -7.423211097717285, "global_step": 205343, "epoch": 4889} {"train_loss": -7.368997573852539, "global_step": 205344, "epoch": 4889} {"train_loss": -7.29409122467041, "global_step": 205345, "epoch": 4889} {"train_loss": -7.429835319519043, "global_step": 205346, "epoch": 4889} {"train_loss": -7.342913627624512, "global_step": 205347, "epoch": 4889} {"train_loss": -7.233647346496582, "global_step": 205348, "epoch": 4889} {"train_loss": -7.209278583526611, "global_step": 205349, "epoch": 4889} {"train_loss": -7.359203815460205, "global_step": 205350, "epoch": 4889} {"train_loss": -7.231860637664795, "global_step": 205351, "epoch": 4889} {"train_loss": -7.111929893493652, "global_step": 205352, "epoch": 4889} {"train_loss": -7.356013774871826, "global_step": 205353, "epoch": 4889} {"train_loss": -7.090850830078125, "global_step": 205354, "epoch": 4889} {"train_loss": -7.139950275421143, "global_step": 205355, "epoch": 4889} {"train_loss": -7.325063705444336, "global_step": 205356, "epoch": 4889} {"train_loss": -7.021625518798828, "global_step": 205357, "epoch": 4889} {"train_loss": -7.316289901733398, "global_step": 205358, "epoch": 4889} {"train_loss": -7.250194549560547, "global_step": 205359, "epoch": 4889} {"train_loss": -7.2594709396362305, "global_step": 205360, "epoch": 4889} {"train_loss": -7.272195816040039, "global_step": 205361, "epoch": 4889} {"train_loss": -7.357621669769287, "global_step": 205362, "epoch": 4889} {"train_loss": -7.266208171844482, "global_step": 205363, "epoch": 4889} {"train_loss": -7.419480800628662, "global_step": 205364, "epoch": 4889} {"train_loss": -7.389643669128418, "global_step": 205365, "epoch": 4889} {"train_loss": -7.247689723968506, "global_step": 205366, "epoch": 4889} {"train_loss": -7.317813873291016, "global_step": 205367, "epoch": 4889} {"train_loss": -7.297245025634766, "global_step": 205368, "epoch": 4889} {"train_loss": -7.2689008712768555, "global_step": 205369, "epoch": 4889} {"train_loss": -7.247992038726807, "global_step": 205370, "epoch": 4889} {"train_loss": -7.314274787902832, "global_step": 205371, "epoch": 4889} {"train_loss": -7.343832492828369, "global_step": 205372, "epoch": 4889} {"train_loss": -7.250470161437988, "global_step": 205373, "epoch": 4889} {"train_loss": -7.324939727783203, "global_step": 205374, "epoch": 4889} {"train_loss": -7.28083610534668, "global_step": 205375, "epoch": 4889} {"train_loss": -7.253358840942383, "global_step": 205376, "epoch": 4889} {"train_loss": -7.334638595581055, "global_step": 205377, "epoch": 4889} {"train_loss": -7.334019184112549, "global_step": 205378, "epoch": 4889} {"train_loss": -7.298277014777774, "global_step": 205379, "epoch": 4889, "val_loss": 81801.359375} {"train_loss": -7.377081871032715, "global_step": 205380, "epoch": 4890} {"train_loss": -7.354943752288818, "global_step": 205381, "epoch": 4890} {"train_loss": -7.261551380157471, "global_step": 205382, "epoch": 4890} {"train_loss": -7.290615558624268, "global_step": 205383, "epoch": 4890} {"train_loss": -7.332211494445801, "global_step": 205384, "epoch": 4890} {"train_loss": -7.3281073570251465, "global_step": 205385, "epoch": 4890} {"train_loss": -7.370915412902832, "global_step": 205386, "epoch": 4890} {"train_loss": -7.32427978515625, "global_step": 205387, "epoch": 4890} {"train_loss": -7.327880382537842, "global_step": 205388, "epoch": 4890} {"train_loss": -7.408477783203125, "global_step": 205389, "epoch": 4890} {"train_loss": -7.251628875732422, "global_step": 205390, "epoch": 4890} {"train_loss": -7.374590873718262, "global_step": 205391, "epoch": 4890} {"train_loss": -7.333400249481201, "global_step": 205392, "epoch": 4890} {"train_loss": -7.331472396850586, "global_step": 205393, "epoch": 4890} {"train_loss": -7.195608139038086, "global_step": 205394, "epoch": 4890} {"train_loss": -7.160329818725586, "global_step": 205395, "epoch": 4890} {"train_loss": -7.287178993225098, "global_step": 205396, "epoch": 4890} {"train_loss": -7.181095123291016, "global_step": 205397, "epoch": 4890} {"train_loss": -7.256337642669678, "global_step": 205398, "epoch": 4890} {"train_loss": -7.234257698059082, "global_step": 205399, "epoch": 4890} {"train_loss": -7.055795669555664, "global_step": 205400, "epoch": 4890} {"train_loss": -7.112697124481201, "global_step": 205401, "epoch": 4890} {"train_loss": -7.094945907592773, "global_step": 205402, "epoch": 4890} {"train_loss": -7.111789703369141, "global_step": 205403, "epoch": 4890} {"train_loss": -7.303372859954834, "global_step": 205404, "epoch": 4890} {"train_loss": -7.083669185638428, "global_step": 205405, "epoch": 4890} {"train_loss": -7.178869247436523, "global_step": 205406, "epoch": 4890} {"train_loss": -7.21709680557251, "global_step": 205407, "epoch": 4890} {"train_loss": -7.211363315582275, "global_step": 205408, "epoch": 4890} {"train_loss": -7.1011199951171875, "global_step": 205409, "epoch": 4890} {"train_loss": -7.331103801727295, "global_step": 205410, "epoch": 4890} {"train_loss": -7.212082862854004, "global_step": 205411, "epoch": 4890} {"train_loss": -7.2026824951171875, "global_step": 205412, "epoch": 4890} {"train_loss": -7.322257041931152, "global_step": 205413, "epoch": 4890} {"train_loss": -7.099798202514648, "global_step": 205414, "epoch": 4890} {"train_loss": -7.30180025100708, "global_step": 205415, "epoch": 4890} {"train_loss": -7.23666524887085, "global_step": 205416, "epoch": 4890} {"train_loss": -7.22590446472168, "global_step": 205417, "epoch": 4890} {"train_loss": -7.237857341766357, "global_step": 205418, "epoch": 4890} {"train_loss": -7.279728889465332, "global_step": 205419, "epoch": 4890} {"train_loss": -7.204904556274414, "global_step": 205420, "epoch": 4890} {"train_loss": -7.246428205853417, "global_step": 205421, "epoch": 4890, "val_loss": 81846.5078125} {"train_loss": -7.306478500366211, "global_step": 205422, "epoch": 4891} {"train_loss": -7.366624355316162, "global_step": 205423, "epoch": 4891} {"train_loss": -7.403824806213379, "global_step": 205424, "epoch": 4891} {"train_loss": -7.234045505523682, "global_step": 205425, "epoch": 4891} {"train_loss": -7.356456756591797, "global_step": 205426, "epoch": 4891} {"train_loss": -7.289672374725342, "global_step": 205427, "epoch": 4891} {"train_loss": -7.2943878173828125, "global_step": 205428, "epoch": 4891} {"train_loss": -7.333147048950195, "global_step": 205429, "epoch": 4891} {"train_loss": -7.358494758605957, "global_step": 205430, "epoch": 4891} {"train_loss": -7.266776084899902, "global_step": 205431, "epoch": 4891} {"train_loss": -7.347499370574951, "global_step": 205432, "epoch": 4891} {"train_loss": -7.306880950927734, "global_step": 205433, "epoch": 4891} {"train_loss": -7.388165473937988, "global_step": 205434, "epoch": 4891} {"train_loss": -7.301246166229248, "global_step": 205435, "epoch": 4891} {"train_loss": -7.479739189147949, "global_step": 205436, "epoch": 4891} {"train_loss": -7.340242862701416, "global_step": 205437, "epoch": 4891} {"train_loss": -7.36030387878418, "global_step": 205438, "epoch": 4891} {"train_loss": -7.24906063079834, "global_step": 205439, "epoch": 4891} {"train_loss": -7.331343650817871, "global_step": 205440, "epoch": 4891} {"train_loss": -7.371576309204102, "global_step": 205441, "epoch": 4891} {"train_loss": -7.226771831512451, "global_step": 205442, "epoch": 4891} {"train_loss": -7.192957878112793, "global_step": 205443, "epoch": 4891} {"train_loss": -7.360655307769775, "global_step": 205444, "epoch": 4891} {"train_loss": -7.314453125, "global_step": 205445, "epoch": 4891} {"train_loss": -7.391138076782227, "global_step": 205446, "epoch": 4891} {"train_loss": -7.402674674987793, "global_step": 205447, "epoch": 4891} {"train_loss": -7.380862236022949, "global_step": 205448, "epoch": 4891} {"train_loss": -7.351926326751709, "global_step": 205449, "epoch": 4891} {"train_loss": -7.287229537963867, "global_step": 205450, "epoch": 4891} {"train_loss": -7.426419734954834, "global_step": 205451, "epoch": 4891} {"train_loss": -7.352535247802734, "global_step": 205452, "epoch": 4891} {"train_loss": -7.320870399475098, "global_step": 205453, "epoch": 4891} {"train_loss": -7.274137496948242, "global_step": 205454, "epoch": 4891} {"train_loss": -7.281461715698242, "global_step": 205455, "epoch": 4891} {"train_loss": -7.2433390617370605, "global_step": 205456, "epoch": 4891} {"train_loss": -7.369126796722412, "global_step": 205457, "epoch": 4891} {"train_loss": -7.428062438964844, "global_step": 205458, "epoch": 4891} {"train_loss": -7.25375509262085, "global_step": 205459, "epoch": 4891} {"train_loss": -7.33095645904541, "global_step": 205460, "epoch": 4891} {"train_loss": -7.261429786682129, "global_step": 205461, "epoch": 4891} {"train_loss": -7.31199836730957, "global_step": 205462, "epoch": 4891} {"train_loss": -7.327772299448649, "global_step": 205463, "epoch": 4891, "val_loss": 81918.6640625} {"train_loss": -7.16549015045166, "global_step": 205464, "epoch": 4892} {"train_loss": -7.3278303146362305, "global_step": 205465, "epoch": 4892} {"train_loss": -7.279664993286133, "global_step": 205466, "epoch": 4892} {"train_loss": -7.259198188781738, "global_step": 205467, "epoch": 4892} {"train_loss": -7.304307460784912, "global_step": 205468, "epoch": 4892} {"train_loss": -7.339169502258301, "global_step": 205469, "epoch": 4892} {"train_loss": -7.343983173370361, "global_step": 205470, "epoch": 4892} {"train_loss": -7.23134708404541, "global_step": 205471, "epoch": 4892} {"train_loss": -7.232789039611816, "global_step": 205472, "epoch": 4892} {"train_loss": -7.372507095336914, "global_step": 205473, "epoch": 4892} {"train_loss": -7.219936847686768, "global_step": 205474, "epoch": 4892} {"train_loss": -7.453927040100098, "global_step": 205475, "epoch": 4892} {"train_loss": -7.201070785522461, "global_step": 205476, "epoch": 4892} {"train_loss": -7.267947196960449, "global_step": 205477, "epoch": 4892} {"train_loss": -7.333392143249512, "global_step": 205478, "epoch": 4892} {"train_loss": -7.266424179077148, "global_step": 205479, "epoch": 4892} {"train_loss": -7.285233497619629, "global_step": 205480, "epoch": 4892} {"train_loss": -7.223940372467041, "global_step": 205481, "epoch": 4892} {"train_loss": -7.371694564819336, "global_step": 205482, "epoch": 4892} {"train_loss": -7.166238307952881, "global_step": 205483, "epoch": 4892} {"train_loss": -7.224315643310547, "global_step": 205484, "epoch": 4892} {"train_loss": -7.211176872253418, "global_step": 205485, "epoch": 4892} {"train_loss": -7.336325645446777, "global_step": 205486, "epoch": 4892} {"train_loss": -7.21989107131958, "global_step": 205487, "epoch": 4892} {"train_loss": -7.346137046813965, "global_step": 205488, "epoch": 4892} {"train_loss": -7.338587760925293, "global_step": 205489, "epoch": 4892} {"train_loss": -7.255239486694336, "global_step": 205490, "epoch": 4892} {"train_loss": -7.296298980712891, "global_step": 205491, "epoch": 4892} {"train_loss": -7.321002006530762, "global_step": 205492, "epoch": 4892} {"train_loss": -7.454220771789551, "global_step": 205493, "epoch": 4892} {"train_loss": -7.406278610229492, "global_step": 205494, "epoch": 4892} {"train_loss": -7.273159980773926, "global_step": 205495, "epoch": 4892} {"train_loss": -7.215160369873047, "global_step": 205496, "epoch": 4892} {"train_loss": -7.302656173706055, "global_step": 205497, "epoch": 4892} {"train_loss": -7.297765731811523, "global_step": 205498, "epoch": 4892} {"train_loss": -7.344662189483643, "global_step": 205499, "epoch": 4892} {"train_loss": -7.26114559173584, "global_step": 205500, "epoch": 4892} {"train_loss": -7.448670864105225, "global_step": 205501, "epoch": 4892} {"train_loss": -7.279841423034668, "global_step": 205502, "epoch": 4892} {"train_loss": -7.277400016784668, "global_step": 205503, "epoch": 4892} {"train_loss": -7.327401638031006, "global_step": 205504, "epoch": 4892} {"train_loss": -7.293023370561146, "global_step": 205505, "epoch": 4892, "val_loss": 81874.6015625} {"train_loss": -7.340569496154785, "global_step": 205506, "epoch": 4893} {"train_loss": -7.258938312530518, "global_step": 205507, "epoch": 4893} {"train_loss": -7.287800312042236, "global_step": 205508, "epoch": 4893} {"train_loss": -7.354384422302246, "global_step": 205509, "epoch": 4893} {"train_loss": -7.352749824523926, "global_step": 205510, "epoch": 4893} {"train_loss": -7.41225528717041, "global_step": 205511, "epoch": 4893} {"train_loss": -7.329736232757568, "global_step": 205512, "epoch": 4893} {"train_loss": -7.279821872711182, "global_step": 205513, "epoch": 4893} {"train_loss": -7.368450164794922, "global_step": 205514, "epoch": 4893} {"train_loss": -7.281715393066406, "global_step": 205515, "epoch": 4893} {"train_loss": -7.395916938781738, "global_step": 205516, "epoch": 4893} {"train_loss": -7.337460517883301, "global_step": 205517, "epoch": 4893} {"train_loss": -7.331354141235352, "global_step": 205518, "epoch": 4893} {"train_loss": -7.471561908721924, "global_step": 205519, "epoch": 4893} {"train_loss": -7.363582611083984, "global_step": 205520, "epoch": 4893} {"train_loss": -7.484710693359375, "global_step": 205521, "epoch": 4893} {"train_loss": -7.356005668640137, "global_step": 205522, "epoch": 4893} {"train_loss": -7.37169075012207, "global_step": 205523, "epoch": 4893} {"train_loss": -7.350270748138428, "global_step": 205524, "epoch": 4893} {"train_loss": -7.35795783996582, "global_step": 205525, "epoch": 4893} {"train_loss": -7.409849166870117, "global_step": 205526, "epoch": 4893} {"train_loss": -7.383859157562256, "global_step": 205527, "epoch": 4893} {"train_loss": -7.286591529846191, "global_step": 205528, "epoch": 4893} {"train_loss": -7.409877777099609, "global_step": 205529, "epoch": 4893} {"train_loss": -7.455044269561768, "global_step": 205530, "epoch": 4893} {"train_loss": -7.224008083343506, "global_step": 205531, "epoch": 4893} {"train_loss": -7.415971755981445, "global_step": 205532, "epoch": 4893} {"train_loss": -7.347390174865723, "global_step": 205533, "epoch": 4893} {"train_loss": -7.29973840713501, "global_step": 205534, "epoch": 4893} {"train_loss": -7.3119659423828125, "global_step": 205535, "epoch": 4893} {"train_loss": -7.23598575592041, "global_step": 205536, "epoch": 4893} {"train_loss": -7.435307502746582, "global_step": 205537, "epoch": 4893} {"train_loss": -7.266836166381836, "global_step": 205538, "epoch": 4893} {"train_loss": -7.367979049682617, "global_step": 205539, "epoch": 4893} {"train_loss": -7.365455150604248, "global_step": 205540, "epoch": 4893} {"train_loss": -7.484874725341797, "global_step": 205541, "epoch": 4893} {"train_loss": -7.468204021453857, "global_step": 205542, "epoch": 4893} {"train_loss": -7.463644981384277, "global_step": 205543, "epoch": 4893} {"train_loss": -7.316681385040283, "global_step": 205544, "epoch": 4893} {"train_loss": -7.31970739364624, "global_step": 205545, "epoch": 4893} {"train_loss": -7.224573135375977, "global_step": 205546, "epoch": 4893} {"train_loss": -7.358009281612578, "global_step": 205547, "epoch": 4893, "val_loss": 81791.28125} {"train_loss": -7.390427589416504, "global_step": 205548, "epoch": 4894} {"train_loss": -7.502260684967041, "global_step": 205549, "epoch": 4894} {"train_loss": -7.376326560974121, "global_step": 205550, "epoch": 4894} {"train_loss": -7.361691951751709, "global_step": 205551, "epoch": 4894} {"train_loss": -7.415802955627441, "global_step": 205552, "epoch": 4894} {"train_loss": -7.365909099578857, "global_step": 205553, "epoch": 4894} {"train_loss": -7.3043975830078125, "global_step": 205554, "epoch": 4894} {"train_loss": -7.438319683074951, "global_step": 205555, "epoch": 4894} {"train_loss": -7.304689884185791, "global_step": 205556, "epoch": 4894} {"train_loss": -7.247904300689697, "global_step": 205557, "epoch": 4894} {"train_loss": -7.403632164001465, "global_step": 205558, "epoch": 4894} {"train_loss": -7.385149955749512, "global_step": 205559, "epoch": 4894} {"train_loss": -7.43033504486084, "global_step": 205560, "epoch": 4894} {"train_loss": -7.237754821777344, "global_step": 205561, "epoch": 4894} {"train_loss": -7.364844799041748, "global_step": 205562, "epoch": 4894} {"train_loss": -7.355698108673096, "global_step": 205563, "epoch": 4894} {"train_loss": -7.315234184265137, "global_step": 205564, "epoch": 4894} {"train_loss": -7.296990871429443, "global_step": 205565, "epoch": 4894} {"train_loss": -7.283120155334473, "global_step": 205566, "epoch": 4894} {"train_loss": -7.199904441833496, "global_step": 205567, "epoch": 4894} {"train_loss": -7.390923500061035, "global_step": 205568, "epoch": 4894} {"train_loss": -7.364224910736084, "global_step": 205569, "epoch": 4894} {"train_loss": -7.292616367340088, "global_step": 205570, "epoch": 4894} {"train_loss": -7.283116340637207, "global_step": 205571, "epoch": 4894} {"train_loss": -7.381180286407471, "global_step": 205572, "epoch": 4894} {"train_loss": -7.452295303344727, "global_step": 205573, "epoch": 4894} {"train_loss": -7.258517742156982, "global_step": 205574, "epoch": 4894} {"train_loss": -7.379388332366943, "global_step": 205575, "epoch": 4894} {"train_loss": -7.345510482788086, "global_step": 205576, "epoch": 4894} {"train_loss": -7.32521915435791, "global_step": 205577, "epoch": 4894} {"train_loss": -7.113250732421875, "global_step": 205578, "epoch": 4894} {"train_loss": -7.192623138427734, "global_step": 205579, "epoch": 4894} {"train_loss": -7.226115703582764, "global_step": 205580, "epoch": 4894} {"train_loss": -7.231440544128418, "global_step": 205581, "epoch": 4894} {"train_loss": -7.279938697814941, "global_step": 205582, "epoch": 4894} {"train_loss": -7.23883056640625, "global_step": 205583, "epoch": 4894} {"train_loss": -7.093376159667969, "global_step": 205584, "epoch": 4894} {"train_loss": -7.3697309494018555, "global_step": 205585, "epoch": 4894} {"train_loss": -7.300991058349609, "global_step": 205586, "epoch": 4894} {"train_loss": -7.269822120666504, "global_step": 205587, "epoch": 4894} {"train_loss": -7.2014994621276855, "global_step": 205588, "epoch": 4894} {"train_loss": -7.31335465113322, "global_step": 205589, "epoch": 4894, "val_loss": 81778.984375} {"train_loss": -7.271432876586914, "global_step": 205590, "epoch": 4895} {"train_loss": -7.237382888793945, "global_step": 205591, "epoch": 4895} {"train_loss": -7.290739059448242, "global_step": 205592, "epoch": 4895} {"train_loss": -7.142524719238281, "global_step": 205593, "epoch": 4895} {"train_loss": -7.270755290985107, "global_step": 205594, "epoch": 4895} {"train_loss": -7.224582672119141, "global_step": 205595, "epoch": 4895} {"train_loss": -7.328408241271973, "global_step": 205596, "epoch": 4895} {"train_loss": -7.226000785827637, "global_step": 205597, "epoch": 4895} {"train_loss": -7.37934684753418, "global_step": 205598, "epoch": 4895} {"train_loss": -7.387155532836914, "global_step": 205599, "epoch": 4895} {"train_loss": -7.20841646194458, "global_step": 205600, "epoch": 4895} {"train_loss": -7.396236419677734, "global_step": 205601, "epoch": 4895} {"train_loss": -7.237231731414795, "global_step": 205602, "epoch": 4895} {"train_loss": -7.430560111999512, "global_step": 205603, "epoch": 4895} {"train_loss": -7.288045883178711, "global_step": 205604, "epoch": 4895} {"train_loss": -7.38918399810791, "global_step": 205605, "epoch": 4895} {"train_loss": -7.217334747314453, "global_step": 205606, "epoch": 4895} {"train_loss": -7.338184833526611, "global_step": 205607, "epoch": 4895} {"train_loss": -7.37851619720459, "global_step": 205608, "epoch": 4895} {"train_loss": -7.230729103088379, "global_step": 205609, "epoch": 4895} {"train_loss": -7.279018878936768, "global_step": 205610, "epoch": 4895} {"train_loss": -7.318642616271973, "global_step": 205611, "epoch": 4895} {"train_loss": -7.232234001159668, "global_step": 205612, "epoch": 4895} {"train_loss": -7.461024284362793, "global_step": 205613, "epoch": 4895} {"train_loss": -7.244516372680664, "global_step": 205614, "epoch": 4895} {"train_loss": -7.371943473815918, "global_step": 205615, "epoch": 4895} {"train_loss": -7.338367462158203, "global_step": 205616, "epoch": 4895} {"train_loss": -7.306499481201172, "global_step": 205617, "epoch": 4895} {"train_loss": -7.36749792098999, "global_step": 205618, "epoch": 4895} {"train_loss": -7.363140106201172, "global_step": 205619, "epoch": 4895} {"train_loss": -7.348726272583008, "global_step": 205620, "epoch": 4895} {"train_loss": -7.414800643920898, "global_step": 205621, "epoch": 4895} {"train_loss": -7.36598014831543, "global_step": 205622, "epoch": 4895} {"train_loss": -7.293970108032227, "global_step": 205623, "epoch": 4895} {"train_loss": -7.365781784057617, "global_step": 205624, "epoch": 4895} {"train_loss": -7.361748695373535, "global_step": 205625, "epoch": 4895} {"train_loss": -7.38692045211792, "global_step": 205626, "epoch": 4895} {"train_loss": -7.366120338439941, "global_step": 205627, "epoch": 4895} {"train_loss": -7.360592842102051, "global_step": 205628, "epoch": 4895} {"train_loss": -7.314226150512695, "global_step": 205629, "epoch": 4895} {"train_loss": -7.36501407623291, "global_step": 205630, "epoch": 4895} {"train_loss": -7.3189293429965065, "global_step": 205631, "epoch": 4895, "val_loss": 81604.9609375} {"train_loss": -7.358927249908447, "global_step": 205632, "epoch": 4896} {"train_loss": -7.382179260253906, "global_step": 205633, "epoch": 4896} {"train_loss": -7.456794738769531, "global_step": 205634, "epoch": 4896} {"train_loss": -7.4546895027160645, "global_step": 205635, "epoch": 4896} {"train_loss": -7.39033842086792, "global_step": 205636, "epoch": 4896} {"train_loss": -7.3665008544921875, "global_step": 205637, "epoch": 4896} {"train_loss": -7.410618782043457, "global_step": 205638, "epoch": 4896} {"train_loss": -7.353395938873291, "global_step": 205639, "epoch": 4896} {"train_loss": -7.4313740730285645, "global_step": 205640, "epoch": 4896} {"train_loss": -7.400053024291992, "global_step": 205641, "epoch": 4896} {"train_loss": -7.300472259521484, "global_step": 205642, "epoch": 4896} {"train_loss": -7.302577018737793, "global_step": 205643, "epoch": 4896} {"train_loss": -7.360167503356934, "global_step": 205644, "epoch": 4896} {"train_loss": -7.338239669799805, "global_step": 205645, "epoch": 4896} {"train_loss": -7.3795905113220215, "global_step": 205646, "epoch": 4896} {"train_loss": -7.327425956726074, "global_step": 205647, "epoch": 4896} {"train_loss": -7.3992156982421875, "global_step": 205648, "epoch": 4896} {"train_loss": -7.349455833435059, "global_step": 205649, "epoch": 4896} {"train_loss": -7.252594947814941, "global_step": 205650, "epoch": 4896} {"train_loss": -7.2969279289245605, "global_step": 205651, "epoch": 4896} {"train_loss": -7.3372087478637695, "global_step": 205652, "epoch": 4896} {"train_loss": -7.2664690017700195, "global_step": 205653, "epoch": 4896} {"train_loss": -7.22075891494751, "global_step": 205654, "epoch": 4896} {"train_loss": -7.324963569641113, "global_step": 205655, "epoch": 4896} {"train_loss": -7.375186920166016, "global_step": 205656, "epoch": 4896} {"train_loss": -7.406410217285156, "global_step": 205657, "epoch": 4896} {"train_loss": -7.298205852508545, "global_step": 205658, "epoch": 4896} {"train_loss": -7.323734283447266, "global_step": 205659, "epoch": 4896} {"train_loss": -7.326648712158203, "global_step": 205660, "epoch": 4896} {"train_loss": -7.360448360443115, "global_step": 205661, "epoch": 4896} {"train_loss": -7.330400466918945, "global_step": 205662, "epoch": 4896} {"train_loss": -7.375640869140625, "global_step": 205663, "epoch": 4896} {"train_loss": -7.351620674133301, "global_step": 205664, "epoch": 4896} {"train_loss": -7.342872619628906, "global_step": 205665, "epoch": 4896} {"train_loss": -7.339916229248047, "global_step": 205666, "epoch": 4896} {"train_loss": -7.339601993560791, "global_step": 205667, "epoch": 4896} {"train_loss": -7.386849403381348, "global_step": 205668, "epoch": 4896} {"train_loss": -7.406357765197754, "global_step": 205669, "epoch": 4896} {"train_loss": -7.498812675476074, "global_step": 205670, "epoch": 4896} {"train_loss": -7.355443954467773, "global_step": 205671, "epoch": 4896} {"train_loss": -7.437108039855957, "global_step": 205672, "epoch": 4896} {"train_loss": -7.360882963453021, "global_step": 205673, "epoch": 4896, "val_loss": 81745.2890625} {"train_loss": -7.458222389221191, "global_step": 205674, "epoch": 4897} {"train_loss": -7.442798614501953, "global_step": 205675, "epoch": 4897} {"train_loss": -7.3873748779296875, "global_step": 205676, "epoch": 4897} {"train_loss": -7.4105730056762695, "global_step": 205677, "epoch": 4897} {"train_loss": -7.467219829559326, "global_step": 205678, "epoch": 4897} {"train_loss": -7.296191215515137, "global_step": 205679, "epoch": 4897} {"train_loss": -7.320744514465332, "global_step": 205680, "epoch": 4897} {"train_loss": -7.481742858886719, "global_step": 205681, "epoch": 4897} {"train_loss": -7.393637657165527, "global_step": 205682, "epoch": 4897} {"train_loss": -7.393523216247559, "global_step": 205683, "epoch": 4897} {"train_loss": -7.445066452026367, "global_step": 205684, "epoch": 4897} {"train_loss": -7.3032732009887695, "global_step": 205685, "epoch": 4897} {"train_loss": -7.443385601043701, "global_step": 205686, "epoch": 4897} {"train_loss": -7.412359714508057, "global_step": 205687, "epoch": 4897} {"train_loss": -7.369028091430664, "global_step": 205688, "epoch": 4897} {"train_loss": -7.482715606689453, "global_step": 205689, "epoch": 4897} {"train_loss": -7.3688554763793945, "global_step": 205690, "epoch": 4897} {"train_loss": -7.434759140014648, "global_step": 205691, "epoch": 4897} {"train_loss": -7.40224552154541, "global_step": 205692, "epoch": 4897} {"train_loss": -7.402183532714844, "global_step": 205693, "epoch": 4897} {"train_loss": -7.319986820220947, "global_step": 205694, "epoch": 4897} {"train_loss": -7.422659873962402, "global_step": 205695, "epoch": 4897} {"train_loss": -7.181682586669922, "global_step": 205696, "epoch": 4897} {"train_loss": -7.353326797485352, "global_step": 205697, "epoch": 4897} {"train_loss": -7.362114429473877, "global_step": 205698, "epoch": 4897} {"train_loss": -7.141684055328369, "global_step": 205699, "epoch": 4897} {"train_loss": -7.2338972091674805, "global_step": 205700, "epoch": 4897} {"train_loss": -7.271209716796875, "global_step": 205701, "epoch": 4897} {"train_loss": -7.124917984008789, "global_step": 205702, "epoch": 4897} {"train_loss": -7.290541172027588, "global_step": 205703, "epoch": 4897} {"train_loss": -7.230843544006348, "global_step": 205704, "epoch": 4897} {"train_loss": -7.220367908477783, "global_step": 205705, "epoch": 4897} {"train_loss": -7.265206336975098, "global_step": 205706, "epoch": 4897} {"train_loss": -7.299102783203125, "global_step": 205707, "epoch": 4897} {"train_loss": -7.1449480056762695, "global_step": 205708, "epoch": 4897} {"train_loss": -7.310347557067871, "global_step": 205709, "epoch": 4897} {"train_loss": -7.195830345153809, "global_step": 205710, "epoch": 4897} {"train_loss": -7.261662006378174, "global_step": 205711, "epoch": 4897} {"train_loss": -7.219588279724121, "global_step": 205712, "epoch": 4897} {"train_loss": -7.140589237213135, "global_step": 205713, "epoch": 4897} {"train_loss": -7.251466274261475, "global_step": 205714, "epoch": 4897} {"train_loss": -7.323062488010952, "global_step": 205715, "epoch": 4897, "val_loss": 81811.9609375} {"train_loss": -7.384794235229492, "global_step": 205716, "epoch": 4898} {"train_loss": -7.28182315826416, "global_step": 205717, "epoch": 4898} {"train_loss": -7.214755535125732, "global_step": 205718, "epoch": 4898} {"train_loss": -7.249225616455078, "global_step": 205719, "epoch": 4898} {"train_loss": -7.074104309082031, "global_step": 205720, "epoch": 4898} {"train_loss": -7.154251575469971, "global_step": 205721, "epoch": 4898} {"train_loss": -7.174840927124023, "global_step": 205722, "epoch": 4898} {"train_loss": -7.206597328186035, "global_step": 205723, "epoch": 4898} {"train_loss": -7.310279846191406, "global_step": 205724, "epoch": 4898} {"train_loss": -7.219252586364746, "global_step": 205725, "epoch": 4898} {"train_loss": -7.240871906280518, "global_step": 205726, "epoch": 4898} {"train_loss": -7.145565509796143, "global_step": 205727, "epoch": 4898} {"train_loss": -7.296414852142334, "global_step": 205728, "epoch": 4898} {"train_loss": -7.231165885925293, "global_step": 205729, "epoch": 4898} {"train_loss": -7.311071872711182, "global_step": 205730, "epoch": 4898} {"train_loss": -7.261563777923584, "global_step": 205731, "epoch": 4898} {"train_loss": -7.218502044677734, "global_step": 205732, "epoch": 4898} {"train_loss": -7.145023345947266, "global_step": 205733, "epoch": 4898} {"train_loss": -7.284921646118164, "global_step": 205734, "epoch": 4898} {"train_loss": -7.245978832244873, "global_step": 205735, "epoch": 4898} {"train_loss": -7.194100856781006, "global_step": 205736, "epoch": 4898} {"train_loss": -7.243460655212402, "global_step": 205737, "epoch": 4898} {"train_loss": -7.035341262817383, "global_step": 205738, "epoch": 4898} {"train_loss": -7.280477046966553, "global_step": 205739, "epoch": 4898} {"train_loss": -7.148447036743164, "global_step": 205740, "epoch": 4898} {"train_loss": -7.341091156005859, "global_step": 205741, "epoch": 4898} {"train_loss": -7.136722087860107, "global_step": 205742, "epoch": 4898} {"train_loss": -7.270439624786377, "global_step": 205743, "epoch": 4898} {"train_loss": -7.178475856781006, "global_step": 205744, "epoch": 4898} {"train_loss": -7.393205642700195, "global_step": 205745, "epoch": 4898} {"train_loss": -7.25263786315918, "global_step": 205746, "epoch": 4898} {"train_loss": -7.414768218994141, "global_step": 205747, "epoch": 4898} {"train_loss": -7.370943546295166, "global_step": 205748, "epoch": 4898} {"train_loss": -7.2955098152160645, "global_step": 205749, "epoch": 4898} {"train_loss": -7.3654069900512695, "global_step": 205750, "epoch": 4898} {"train_loss": -7.440293312072754, "global_step": 205751, "epoch": 4898} {"train_loss": -7.208667278289795, "global_step": 205752, "epoch": 4898} {"train_loss": -7.325669765472412, "global_step": 205753, "epoch": 4898} {"train_loss": -7.217259407043457, "global_step": 205754, "epoch": 4898} {"train_loss": -7.208416938781738, "global_step": 205755, "epoch": 4898} {"train_loss": -7.248043060302734, "global_step": 205756, "epoch": 4898} {"train_loss": -7.247643947601318, "global_step": 205757, "epoch": 4898, "val_loss": 81671.921875} {"train_loss": -7.234012126922607, "global_step": 205758, "epoch": 4899} {"train_loss": -7.262557029724121, "global_step": 205759, "epoch": 4899} {"train_loss": -7.315394401550293, "global_step": 205760, "epoch": 4899} {"train_loss": -7.323557376861572, "global_step": 205761, "epoch": 4899} {"train_loss": -7.320698261260986, "global_step": 205762, "epoch": 4899} {"train_loss": -7.314784049987793, "global_step": 205763, "epoch": 4899} {"train_loss": -7.388607978820801, "global_step": 205764, "epoch": 4899} {"train_loss": -7.224316596984863, "global_step": 205765, "epoch": 4899} {"train_loss": -7.235146999359131, "global_step": 205766, "epoch": 4899} {"train_loss": -7.306460380554199, "global_step": 205767, "epoch": 4899} {"train_loss": -7.298419952392578, "global_step": 205768, "epoch": 4899} {"train_loss": -7.458813667297363, "global_step": 205769, "epoch": 4899} {"train_loss": -7.322995662689209, "global_step": 205770, "epoch": 4899} {"train_loss": -7.307690620422363, "global_step": 205771, "epoch": 4899} {"train_loss": -7.395478248596191, "global_step": 205772, "epoch": 4899} {"train_loss": -7.439502716064453, "global_step": 205773, "epoch": 4899} {"train_loss": -7.355298042297363, "global_step": 205774, "epoch": 4899} {"train_loss": -7.294688701629639, "global_step": 205775, "epoch": 4899} {"train_loss": -7.333536624908447, "global_step": 205776, "epoch": 4899} {"train_loss": -7.4154229164123535, "global_step": 205777, "epoch": 4899} {"train_loss": -7.3092169761657715, "global_step": 205778, "epoch": 4899} {"train_loss": -7.3892059326171875, "global_step": 205779, "epoch": 4899} {"train_loss": -7.252748489379883, "global_step": 205780, "epoch": 4899} {"train_loss": -7.350647926330566, "global_step": 205781, "epoch": 4899} {"train_loss": -7.280878067016602, "global_step": 205782, "epoch": 4899} {"train_loss": -7.386900901794434, "global_step": 205783, "epoch": 4899} {"train_loss": -7.427431106567383, "global_step": 205784, "epoch": 4899} {"train_loss": -7.046936988830566, "global_step": 205785, "epoch": 4899} {"train_loss": -7.441450119018555, "global_step": 205786, "epoch": 4899} {"train_loss": -7.116886138916016, "global_step": 205787, "epoch": 4899} {"train_loss": -7.184893608093262, "global_step": 205788, "epoch": 4899} {"train_loss": -7.254940032958984, "global_step": 205789, "epoch": 4899} {"train_loss": -7.233994960784912, "global_step": 205790, "epoch": 4899} {"train_loss": -7.252119064331055, "global_step": 205791, "epoch": 4899} {"train_loss": -7.328125476837158, "global_step": 205792, "epoch": 4899} {"train_loss": -7.259523391723633, "global_step": 205793, "epoch": 4899} {"train_loss": -7.2381978034973145, "global_step": 205794, "epoch": 4899} {"train_loss": -7.251386642456055, "global_step": 205795, "epoch": 4899} {"train_loss": -7.25174617767334, "global_step": 205796, "epoch": 4899} {"train_loss": -7.238813877105713, "global_step": 205797, "epoch": 4899} {"train_loss": -7.307149410247803, "global_step": 205798, "epoch": 4899} {"train_loss": -7.302751552490961, "global_step": 205799, "epoch": 4899, "val_loss": 82043.625} {"train_loss": -7.297746658325195, "global_step": 205800, "epoch": 4900} {"train_loss": -7.309117794036865, "global_step": 205801, "epoch": 4900} {"train_loss": -7.32051944732666, "global_step": 205802, "epoch": 4900} {"train_loss": -7.374170303344727, "global_step": 205803, "epoch": 4900} {"train_loss": -7.250941753387451, "global_step": 205804, "epoch": 4900} {"train_loss": -7.351463317871094, "global_step": 205805, "epoch": 4900} {"train_loss": -7.252828121185303, "global_step": 205806, "epoch": 4900} {"train_loss": -7.400757789611816, "global_step": 205807, "epoch": 4900} {"train_loss": -7.473736763000488, "global_step": 205808, "epoch": 4900} {"train_loss": -7.347287178039551, "global_step": 205809, "epoch": 4900} {"train_loss": -7.39859676361084, "global_step": 205810, "epoch": 4900} {"train_loss": -7.391549110412598, "global_step": 205811, "epoch": 4900} {"train_loss": -7.369142532348633, "global_step": 205812, "epoch": 4900} {"train_loss": -7.367683410644531, "global_step": 205813, "epoch": 4900} {"train_loss": -7.350595951080322, "global_step": 205814, "epoch": 4900} {"train_loss": -7.307423114776611, "global_step": 205815, "epoch": 4900} {"train_loss": -7.268424034118652, "global_step": 205816, "epoch": 4900} {"train_loss": -7.4288787841796875, "global_step": 205817, "epoch": 4900} {"train_loss": -7.362898826599121, "global_step": 205818, "epoch": 4900} {"train_loss": -7.437700271606445, "global_step": 205819, "epoch": 4900} {"train_loss": -7.393237113952637, "global_step": 205820, "epoch": 4900} {"train_loss": -7.396329879760742, "global_step": 205821, "epoch": 4900} {"train_loss": -7.49507474899292, "global_step": 205822, "epoch": 4900} {"train_loss": -7.320580005645752, "global_step": 205823, "epoch": 4900} {"train_loss": -7.3540825843811035, "global_step": 205824, "epoch": 4900} {"train_loss": -7.483542442321777, "global_step": 205825, "epoch": 4900} {"train_loss": -7.404059410095215, "global_step": 205826, "epoch": 4900} {"train_loss": -7.366295337677002, "global_step": 205827, "epoch": 4900} {"train_loss": -7.462250232696533, "global_step": 205828, "epoch": 4900} {"train_loss": -7.491346836090088, "global_step": 205829, "epoch": 4900} {"train_loss": -7.335366725921631, "global_step": 205830, "epoch": 4900} {"train_loss": -7.423566818237305, "global_step": 205831, "epoch": 4900} {"train_loss": -7.377688884735107, "global_step": 205832, "epoch": 4900} {"train_loss": -7.534960746765137, "global_step": 205833, "epoch": 4900} {"train_loss": -7.38385534286499, "global_step": 205834, "epoch": 4900} {"train_loss": -7.245004177093506, "global_step": 205835, "epoch": 4900} {"train_loss": -7.39755916595459, "global_step": 205836, "epoch": 4900} {"train_loss": -7.378958702087402, "global_step": 205837, "epoch": 4900} {"train_loss": -7.368376731872559, "global_step": 205838, "epoch": 4900} {"train_loss": -7.463014125823975, "global_step": 205839, "epoch": 4900} {"train_loss": -7.301278114318848, "global_step": 205840, "epoch": 4900} {"train_loss": -7.3780401320684526, "global_step": 205841, "epoch": 4900, "train/sim_max_reward_0": 0.8371802354129116, "train/sim_max_reward_1": 0.9941680848574708, "train/sim_max_reward_2": 0.2797859528829556, "train/sim_max_reward_3": 0.13233432909872656, "train/sim_max_reward_4": 0.9261143771448339, "train/sim_max_reward_5": 0.9638942631646873, "test/sim_max_reward_4500000": 0.5263022326459051, "test/sim_max_reward_4500001": 0.9475455871996474, "test/sim_max_reward_4500002": 0.9359925467954668, "test/sim_max_reward_4500003": 0.9787374303476241, "test/sim_max_reward_4500004": 0.18757638000150076, "test/sim_max_reward_4500005": 0.9487374791750264, "test/sim_max_reward_4500006": 0.9626620586704341, "test/sim_max_reward_4500007": 0.8632734986467491, "test/sim_max_reward_4500008": 0.3699385937225379, "test/sim_max_reward_4500009": 0.05302239584619528, "test/sim_max_reward_4500010": 0.16880287623528764, "test/sim_max_reward_4500011": 0.9756015246868219, "test/sim_max_reward_4500012": 0.9377059784537498, "test/sim_max_reward_4500013": 0.006127839829602635, "test/sim_max_reward_4500014": 1.0, "test/sim_max_reward_4500015": 0.9754689935652332, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.02721924640463034, "test/sim_max_reward_4500018": 0.37065588343175687, "test/sim_max_reward_4500019": 0.9996637991975098, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9088890469837803, "test/sim_max_reward_4500022": 0.951094460539745, "test/sim_max_reward_4500023": 0.5108158164113898, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.9753006157402788, "test/sim_max_reward_4500026": 0.8479577821961123, "test/sim_max_reward_4500027": 0.9963094898255151, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.06047079564908578, "test/sim_max_reward_4500030": 0.9893158268982539, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.997730713579621, "test/sim_max_reward_4500034": 0.9291765472327993, "test/sim_max_reward_4500035": 1.0, "test/sim_max_reward_4500036": 1.0, "test/sim_max_reward_4500037": 0.8992857134759179, "test/sim_max_reward_4500038": 0.6715378437259876, "test/sim_max_reward_4500039": 0.9536644307711598, "test/sim_max_reward_4500040": 0.9914975093427527, "test/sim_max_reward_4500041": 0.9722676934040279, "test/sim_max_reward_4500042": 0.0, "test/sim_max_reward_4500043": 0.6396114173949543, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 0.4341216274432133, "test/sim_max_reward_4500046": 0.20486877471299184, "test/sim_max_reward_4500047": 1.0, "test/sim_max_reward_4500048": 0.9599853383603243, "test/sim_max_reward_4500049": 0.5276512596786685, "train/mean_score": 0.6889128737602643, "test/mean_score": 0.6181763631362336, "val_loss": 81735.21875} {"train_loss": -7.385597229003906, "global_step": 205842, "epoch": 4901} {"train_loss": -7.457441806793213, "global_step": 205843, "epoch": 4901} {"train_loss": -7.478811740875244, "global_step": 205844, "epoch": 4901} {"train_loss": -7.349795341491699, "global_step": 205845, "epoch": 4901} {"train_loss": -7.361983299255371, "global_step": 205846, "epoch": 4901} {"train_loss": -7.383872985839844, "global_step": 205847, "epoch": 4901} {"train_loss": -7.403475761413574, "global_step": 205848, "epoch": 4901} {"train_loss": -7.374608993530273, "global_step": 205849, "epoch": 4901} {"train_loss": -7.379056453704834, "global_step": 205850, "epoch": 4901} {"train_loss": -7.204537868499756, "global_step": 205851, "epoch": 4901} {"train_loss": -7.322280406951904, "global_step": 205852, "epoch": 4901} {"train_loss": -7.341129302978516, "global_step": 205853, "epoch": 4901} {"train_loss": -7.226081848144531, "global_step": 205854, "epoch": 4901} {"train_loss": -7.424818992614746, "global_step": 205855, "epoch": 4901} {"train_loss": -7.293746471405029, "global_step": 205856, "epoch": 4901} {"train_loss": -7.39011287689209, "global_step": 205857, "epoch": 4901} {"train_loss": -7.260254859924316, "global_step": 205858, "epoch": 4901} {"train_loss": -7.288471698760986, "global_step": 205859, "epoch": 4901} {"train_loss": -7.336544513702393, "global_step": 205860, "epoch": 4901} {"train_loss": -7.389880657196045, "global_step": 205861, "epoch": 4901} {"train_loss": -7.510823726654053, "global_step": 205862, "epoch": 4901} {"train_loss": -7.385102272033691, "global_step": 205863, "epoch": 4901} {"train_loss": -7.464750289916992, "global_step": 205864, "epoch": 4901} {"train_loss": -7.303001403808594, "global_step": 205865, "epoch": 4901} {"train_loss": -7.4753594398498535, "global_step": 205866, "epoch": 4901} {"train_loss": -7.33182430267334, "global_step": 205867, "epoch": 4901} {"train_loss": -7.377547264099121, "global_step": 205868, "epoch": 4901} {"train_loss": -7.418499946594238, "global_step": 205869, "epoch": 4901} {"train_loss": -7.293384552001953, "global_step": 205870, "epoch": 4901} {"train_loss": -7.262251853942871, "global_step": 205871, "epoch": 4901} {"train_loss": -7.427304267883301, "global_step": 205872, "epoch": 4901} {"train_loss": -7.3233184814453125, "global_step": 205873, "epoch": 4901} {"train_loss": -7.286672592163086, "global_step": 205874, "epoch": 4901} {"train_loss": -7.401615142822266, "global_step": 205875, "epoch": 4901} {"train_loss": -7.279682159423828, "global_step": 205876, "epoch": 4901} {"train_loss": -7.347182273864746, "global_step": 205877, "epoch": 4901} {"train_loss": -7.352828025817871, "global_step": 205878, "epoch": 4901} {"train_loss": -7.327880859375, "global_step": 205879, "epoch": 4901} {"train_loss": -7.251270771026611, "global_step": 205880, "epoch": 4901} {"train_loss": -7.325549125671387, "global_step": 205881, "epoch": 4901} {"train_loss": -7.2966766357421875, "global_step": 205882, "epoch": 4901} {"train_loss": -7.352544478007725, "global_step": 205883, "epoch": 4901, "val_loss": 81878.890625} {"train_loss": -7.400973320007324, "global_step": 205884, "epoch": 4902} {"train_loss": -7.245131015777588, "global_step": 205885, "epoch": 4902} {"train_loss": -7.401054859161377, "global_step": 205886, "epoch": 4902} {"train_loss": -7.210332870483398, "global_step": 205887, "epoch": 4902} {"train_loss": -7.49146842956543, "global_step": 205888, "epoch": 4902} {"train_loss": -7.377641677856445, "global_step": 205889, "epoch": 4902} {"train_loss": -7.338283061981201, "global_step": 205890, "epoch": 4902} {"train_loss": -7.366782188415527, "global_step": 205891, "epoch": 4902} {"train_loss": -7.304502487182617, "global_step": 205892, "epoch": 4902} {"train_loss": -7.3486857414245605, "global_step": 205893, "epoch": 4902} {"train_loss": -7.260634422302246, "global_step": 205894, "epoch": 4902} {"train_loss": -7.306838035583496, "global_step": 205895, "epoch": 4902} {"train_loss": -7.408998012542725, "global_step": 205896, "epoch": 4902} {"train_loss": -7.349419116973877, "global_step": 205897, "epoch": 4902} {"train_loss": -7.306170463562012, "global_step": 205898, "epoch": 4902} {"train_loss": -7.366946220397949, "global_step": 205899, "epoch": 4902} {"train_loss": -7.313368797302246, "global_step": 205900, "epoch": 4902} {"train_loss": -7.3183746337890625, "global_step": 205901, "epoch": 4902} {"train_loss": -7.2260212898254395, "global_step": 205902, "epoch": 4902} {"train_loss": -7.367758750915527, "global_step": 205903, "epoch": 4902} {"train_loss": -7.429278373718262, "global_step": 205904, "epoch": 4902} {"train_loss": -7.293086051940918, "global_step": 205905, "epoch": 4902} {"train_loss": -7.440770626068115, "global_step": 205906, "epoch": 4902} {"train_loss": -7.187924861907959, "global_step": 205907, "epoch": 4902} {"train_loss": -7.330050468444824, "global_step": 205908, "epoch": 4902} {"train_loss": -7.266523361206055, "global_step": 205909, "epoch": 4902} {"train_loss": -7.354540824890137, "global_step": 205910, "epoch": 4902} {"train_loss": -7.389145374298096, "global_step": 205911, "epoch": 4902} {"train_loss": -7.272189617156982, "global_step": 205912, "epoch": 4902} {"train_loss": -7.454037666320801, "global_step": 205913, "epoch": 4902} {"train_loss": -7.341543197631836, "global_step": 205914, "epoch": 4902} {"train_loss": -7.357728958129883, "global_step": 205915, "epoch": 4902} {"train_loss": -7.3849616050720215, "global_step": 205916, "epoch": 4902} {"train_loss": -7.418454170227051, "global_step": 205917, "epoch": 4902} {"train_loss": -7.461239337921143, "global_step": 205918, "epoch": 4902} {"train_loss": -7.234833240509033, "global_step": 205919, "epoch": 4902} {"train_loss": -7.368322372436523, "global_step": 205920, "epoch": 4902} {"train_loss": -7.311164855957031, "global_step": 205921, "epoch": 4902} {"train_loss": -7.343410015106201, "global_step": 205922, "epoch": 4902} {"train_loss": -7.413728713989258, "global_step": 205923, "epoch": 4902} {"train_loss": -7.3138837814331055, "global_step": 205924, "epoch": 4902} {"train_loss": -7.343731494176955, "global_step": 205925, "epoch": 4902, "val_loss": 81640.890625} {"train_loss": -7.417452812194824, "global_step": 205926, "epoch": 4903} {"train_loss": -7.358645915985107, "global_step": 205927, "epoch": 4903} {"train_loss": -7.291557312011719, "global_step": 205928, "epoch": 4903} {"train_loss": -7.418111801147461, "global_step": 205929, "epoch": 4903} {"train_loss": -7.302492618560791, "global_step": 205930, "epoch": 4903} {"train_loss": -7.446319580078125, "global_step": 205931, "epoch": 4903} {"train_loss": -7.430293083190918, "global_step": 205932, "epoch": 4903} {"train_loss": -7.338749885559082, "global_step": 205933, "epoch": 4903} {"train_loss": -7.353122711181641, "global_step": 205934, "epoch": 4903} {"train_loss": -7.36308479309082, "global_step": 205935, "epoch": 4903} {"train_loss": -7.430616855621338, "global_step": 205936, "epoch": 4903} {"train_loss": -7.429353713989258, "global_step": 205937, "epoch": 4903} {"train_loss": -7.323385715484619, "global_step": 205938, "epoch": 4903} {"train_loss": -7.366389751434326, "global_step": 205939, "epoch": 4903} {"train_loss": -7.379069805145264, "global_step": 205940, "epoch": 4903} {"train_loss": -7.329517841339111, "global_step": 205941, "epoch": 4903} {"train_loss": -7.389002323150635, "global_step": 205942, "epoch": 4903} {"train_loss": -7.3582539558410645, "global_step": 205943, "epoch": 4903} {"train_loss": -7.2994842529296875, "global_step": 205944, "epoch": 4903} {"train_loss": -7.441197872161865, "global_step": 205945, "epoch": 4903} {"train_loss": -7.413853645324707, "global_step": 205946, "epoch": 4903} {"train_loss": -7.294918537139893, "global_step": 205947, "epoch": 4903} {"train_loss": -7.317330360412598, "global_step": 205948, "epoch": 4903} {"train_loss": -7.353294372558594, "global_step": 205949, "epoch": 4903} {"train_loss": -7.3079514503479, "global_step": 205950, "epoch": 4903} {"train_loss": -7.313899993896484, "global_step": 205951, "epoch": 4903} {"train_loss": -7.3046770095825195, "global_step": 205952, "epoch": 4903} {"train_loss": -7.513566017150879, "global_step": 205953, "epoch": 4903} {"train_loss": -7.189874172210693, "global_step": 205954, "epoch": 4903} {"train_loss": -7.328801155090332, "global_step": 205955, "epoch": 4903} {"train_loss": -7.26338005065918, "global_step": 205956, "epoch": 4903} {"train_loss": -7.300070285797119, "global_step": 205957, "epoch": 4903} {"train_loss": -7.2593278884887695, "global_step": 205958, "epoch": 4903} {"train_loss": -7.176219940185547, "global_step": 205959, "epoch": 4903} {"train_loss": -7.305215358734131, "global_step": 205960, "epoch": 4903} {"train_loss": -7.416769027709961, "global_step": 205961, "epoch": 4903} {"train_loss": -7.236021995544434, "global_step": 205962, "epoch": 4903} {"train_loss": -7.280823707580566, "global_step": 205963, "epoch": 4903} {"train_loss": -7.453902721405029, "global_step": 205964, "epoch": 4903} {"train_loss": -7.177314281463623, "global_step": 205965, "epoch": 4903} {"train_loss": -7.427492141723633, "global_step": 205966, "epoch": 4903} {"train_loss": -7.344429470243908, "global_step": 205967, "epoch": 4903, "val_loss": 81702.1328125} {"train_loss": -7.317934036254883, "global_step": 205968, "epoch": 4904} {"train_loss": -7.424098968505859, "global_step": 205969, "epoch": 4904} {"train_loss": -7.3667120933532715, "global_step": 205970, "epoch": 4904} {"train_loss": -7.510941505432129, "global_step": 205971, "epoch": 4904} {"train_loss": -7.375778675079346, "global_step": 205972, "epoch": 4904} {"train_loss": -7.4843058586120605, "global_step": 205973, "epoch": 4904} {"train_loss": -7.458698749542236, "global_step": 205974, "epoch": 4904} {"train_loss": -7.337920665740967, "global_step": 205975, "epoch": 4904} {"train_loss": -7.448393821716309, "global_step": 205976, "epoch": 4904} {"train_loss": -7.315086364746094, "global_step": 205977, "epoch": 4904} {"train_loss": -7.507702827453613, "global_step": 205978, "epoch": 4904} {"train_loss": -7.435509204864502, "global_step": 205979, "epoch": 4904} {"train_loss": -7.34144926071167, "global_step": 205980, "epoch": 4904} {"train_loss": -7.391292572021484, "global_step": 205981, "epoch": 4904} {"train_loss": -7.386224746704102, "global_step": 205982, "epoch": 4904} {"train_loss": -7.318800449371338, "global_step": 205983, "epoch": 4904} {"train_loss": -7.376321792602539, "global_step": 205984, "epoch": 4904} {"train_loss": -7.251213073730469, "global_step": 205985, "epoch": 4904} {"train_loss": -7.293179512023926, "global_step": 205986, "epoch": 4904} {"train_loss": -7.290863990783691, "global_step": 205987, "epoch": 4904} {"train_loss": -7.349599838256836, "global_step": 205988, "epoch": 4904} {"train_loss": -7.284949779510498, "global_step": 205989, "epoch": 4904} {"train_loss": -7.201417922973633, "global_step": 205990, "epoch": 4904} {"train_loss": -7.297482490539551, "global_step": 205991, "epoch": 4904} {"train_loss": -7.235518455505371, "global_step": 205992, "epoch": 4904} {"train_loss": -7.270270347595215, "global_step": 205993, "epoch": 4904} {"train_loss": -7.374143600463867, "global_step": 205994, "epoch": 4904} {"train_loss": -7.14616584777832, "global_step": 205995, "epoch": 4904} {"train_loss": -7.291614532470703, "global_step": 205996, "epoch": 4904} {"train_loss": -7.3014726638793945, "global_step": 205997, "epoch": 4904} {"train_loss": -7.291543960571289, "global_step": 205998, "epoch": 4904} {"train_loss": -7.292909622192383, "global_step": 205999, "epoch": 4904} {"train_loss": -7.407126426696777, "global_step": 206000, "epoch": 4904} {"train_loss": -7.151131629943848, "global_step": 206001, "epoch": 4904} {"train_loss": -7.358720779418945, "global_step": 206002, "epoch": 4904} {"train_loss": -7.253257751464844, "global_step": 206003, "epoch": 4904} {"train_loss": -7.399893760681152, "global_step": 206004, "epoch": 4904} {"train_loss": -7.349815368652344, "global_step": 206005, "epoch": 4904} {"train_loss": -7.2876386642456055, "global_step": 206006, "epoch": 4904} {"train_loss": -7.265568733215332, "global_step": 206007, "epoch": 4904} {"train_loss": -7.0961594581604, "global_step": 206008, "epoch": 4904} {"train_loss": -7.328584160123553, "global_step": 206009, "epoch": 4904, "val_loss": 82162.1015625} {"train_loss": -7.346452236175537, "global_step": 206010, "epoch": 4905} {"train_loss": -7.285122871398926, "global_step": 206011, "epoch": 4905} {"train_loss": -7.415818214416504, "global_step": 206012, "epoch": 4905} {"train_loss": -7.324540138244629, "global_step": 206013, "epoch": 4905} {"train_loss": -7.312129974365234, "global_step": 206014, "epoch": 4905} {"train_loss": -7.324547290802002, "global_step": 206015, "epoch": 4905} {"train_loss": -7.110236167907715, "global_step": 206016, "epoch": 4905} {"train_loss": -7.33489465713501, "global_step": 206017, "epoch": 4905} {"train_loss": -7.25050163269043, "global_step": 206018, "epoch": 4905} {"train_loss": -7.218120574951172, "global_step": 206019, "epoch": 4905} {"train_loss": -7.278180122375488, "global_step": 206020, "epoch": 4905} {"train_loss": -7.243002414703369, "global_step": 206021, "epoch": 4905} {"train_loss": -7.354978084564209, "global_step": 206022, "epoch": 4905} {"train_loss": -7.290257453918457, "global_step": 206023, "epoch": 4905} {"train_loss": -7.223263263702393, "global_step": 206024, "epoch": 4905} {"train_loss": -7.2799177169799805, "global_step": 206025, "epoch": 4905} {"train_loss": -7.113431453704834, "global_step": 206026, "epoch": 4905} {"train_loss": -7.3695478439331055, "global_step": 206027, "epoch": 4905} {"train_loss": -7.256134986877441, "global_step": 206028, "epoch": 4905} {"train_loss": -7.317848205566406, "global_step": 206029, "epoch": 4905} {"train_loss": -7.336456298828125, "global_step": 206030, "epoch": 4905} {"train_loss": -7.287422180175781, "global_step": 206031, "epoch": 4905} {"train_loss": -7.302117347717285, "global_step": 206032, "epoch": 4905} {"train_loss": -7.290559768676758, "global_step": 206033, "epoch": 4905} {"train_loss": -7.429678916931152, "global_step": 206034, "epoch": 4905} {"train_loss": -7.285800933837891, "global_step": 206035, "epoch": 4905} {"train_loss": -7.303787708282471, "global_step": 206036, "epoch": 4905} {"train_loss": -7.345790863037109, "global_step": 206037, "epoch": 4905} {"train_loss": -7.3497314453125, "global_step": 206038, "epoch": 4905} {"train_loss": -7.2983174324035645, "global_step": 206039, "epoch": 4905} {"train_loss": -7.349567890167236, "global_step": 206040, "epoch": 4905} {"train_loss": -7.411981105804443, "global_step": 206041, "epoch": 4905} {"train_loss": -7.474130630493164, "global_step": 206042, "epoch": 4905} {"train_loss": -7.350775718688965, "global_step": 206043, "epoch": 4905} {"train_loss": -7.337803840637207, "global_step": 206044, "epoch": 4905} {"train_loss": -7.3936662673950195, "global_step": 206045, "epoch": 4905} {"train_loss": -7.343512535095215, "global_step": 206046, "epoch": 4905} {"train_loss": -7.415952682495117, "global_step": 206047, "epoch": 4905} {"train_loss": -7.36762809753418, "global_step": 206048, "epoch": 4905} {"train_loss": -7.298541069030762, "global_step": 206049, "epoch": 4905} {"train_loss": -7.316918849945068, "global_step": 206050, "epoch": 4905} {"train_loss": -7.313954080854144, "global_step": 206051, "epoch": 4905, "val_loss": 82026.5859375} {"train_loss": -7.354952812194824, "global_step": 206052, "epoch": 4906} {"train_loss": -7.319320201873779, "global_step": 206053, "epoch": 4906} {"train_loss": -7.375796794891357, "global_step": 206054, "epoch": 4906} {"train_loss": -7.2941107749938965, "global_step": 206055, "epoch": 4906} {"train_loss": -7.322800636291504, "global_step": 206056, "epoch": 4906} {"train_loss": -7.28516960144043, "global_step": 206057, "epoch": 4906} {"train_loss": -7.297245025634766, "global_step": 206058, "epoch": 4906} {"train_loss": -7.2920331954956055, "global_step": 206059, "epoch": 4906} {"train_loss": -7.204217433929443, "global_step": 206060, "epoch": 4906} {"train_loss": -7.2741289138793945, "global_step": 206061, "epoch": 4906} {"train_loss": -7.2892866134643555, "global_step": 206062, "epoch": 4906} {"train_loss": -7.310186386108398, "global_step": 206063, "epoch": 4906} {"train_loss": -7.287473678588867, "global_step": 206064, "epoch": 4906} {"train_loss": -7.302529335021973, "global_step": 206065, "epoch": 4906} {"train_loss": -7.361551284790039, "global_step": 206066, "epoch": 4906} {"train_loss": -7.3490309715271, "global_step": 206067, "epoch": 4906} {"train_loss": -7.313333988189697, "global_step": 206068, "epoch": 4906} {"train_loss": -7.204539775848389, "global_step": 206069, "epoch": 4906} {"train_loss": -7.249847412109375, "global_step": 206070, "epoch": 4906} {"train_loss": -7.390751361846924, "global_step": 206071, "epoch": 4906} {"train_loss": -7.341466426849365, "global_step": 206072, "epoch": 4906} {"train_loss": -7.358471870422363, "global_step": 206073, "epoch": 4906} {"train_loss": -7.372396945953369, "global_step": 206074, "epoch": 4906} {"train_loss": -7.346183776855469, "global_step": 206075, "epoch": 4906} {"train_loss": -7.33174991607666, "global_step": 206076, "epoch": 4906} {"train_loss": -7.3794450759887695, "global_step": 206077, "epoch": 4906} {"train_loss": -7.312180042266846, "global_step": 206078, "epoch": 4906} {"train_loss": -7.499744415283203, "global_step": 206079, "epoch": 4906} {"train_loss": -7.386788845062256, "global_step": 206080, "epoch": 4906} {"train_loss": -7.317502021789551, "global_step": 206081, "epoch": 4906} {"train_loss": -7.327828407287598, "global_step": 206082, "epoch": 4906} {"train_loss": -7.346920013427734, "global_step": 206083, "epoch": 4906} {"train_loss": -7.436979293823242, "global_step": 206084, "epoch": 4906} {"train_loss": -7.480847358703613, "global_step": 206085, "epoch": 4906} {"train_loss": -7.3406219482421875, "global_step": 206086, "epoch": 4906} {"train_loss": -7.442893981933594, "global_step": 206087, "epoch": 4906} {"train_loss": -7.309924602508545, "global_step": 206088, "epoch": 4906} {"train_loss": -7.333836078643799, "global_step": 206089, "epoch": 4906} {"train_loss": -7.3893327713012695, "global_step": 206090, "epoch": 4906} {"train_loss": -7.3989057540893555, "global_step": 206091, "epoch": 4906} {"train_loss": -7.243736267089844, "global_step": 206092, "epoch": 4906} {"train_loss": -7.339204776854742, "global_step": 206093, "epoch": 4906, "val_loss": 81691.328125} {"train_loss": -7.404442310333252, "global_step": 206094, "epoch": 4907} {"train_loss": -7.340526580810547, "global_step": 206095, "epoch": 4907} {"train_loss": -7.457078456878662, "global_step": 206096, "epoch": 4907} {"train_loss": -7.386112213134766, "global_step": 206097, "epoch": 4907} {"train_loss": -7.5290117263793945, "global_step": 206098, "epoch": 4907} {"train_loss": -7.320736885070801, "global_step": 206099, "epoch": 4907} {"train_loss": -7.429316520690918, "global_step": 206100, "epoch": 4907} {"train_loss": -7.482522010803223, "global_step": 206101, "epoch": 4907} {"train_loss": -7.285565376281738, "global_step": 206102, "epoch": 4907} {"train_loss": -7.276547908782959, "global_step": 206103, "epoch": 4907} {"train_loss": -7.391515254974365, "global_step": 206104, "epoch": 4907} {"train_loss": -7.452919960021973, "global_step": 206105, "epoch": 4907} {"train_loss": -7.446063041687012, "global_step": 206106, "epoch": 4907} {"train_loss": -7.311210632324219, "global_step": 206107, "epoch": 4907} {"train_loss": -7.4008564949035645, "global_step": 206108, "epoch": 4907} {"train_loss": -7.457350730895996, "global_step": 206109, "epoch": 4907} {"train_loss": -7.4062676429748535, "global_step": 206110, "epoch": 4907} {"train_loss": -7.4340009689331055, "global_step": 206111, "epoch": 4907} {"train_loss": -7.528326034545898, "global_step": 206112, "epoch": 4907} {"train_loss": -7.459595203399658, "global_step": 206113, "epoch": 4907} {"train_loss": -7.345588684082031, "global_step": 206114, "epoch": 4907} {"train_loss": -7.382341384887695, "global_step": 206115, "epoch": 4907} {"train_loss": -7.392886161804199, "global_step": 206116, "epoch": 4907} {"train_loss": -7.415796279907227, "global_step": 206117, "epoch": 4907} {"train_loss": -7.349717140197754, "global_step": 206118, "epoch": 4907} {"train_loss": -7.404879570007324, "global_step": 206119, "epoch": 4907} {"train_loss": -7.371845245361328, "global_step": 206120, "epoch": 4907} {"train_loss": -7.348719596862793, "global_step": 206121, "epoch": 4907} {"train_loss": -7.254563331604004, "global_step": 206122, "epoch": 4907} {"train_loss": -7.200974464416504, "global_step": 206123, "epoch": 4907} {"train_loss": -7.218721389770508, "global_step": 206124, "epoch": 4907} {"train_loss": -7.178982734680176, "global_step": 206125, "epoch": 4907} {"train_loss": -7.164227485656738, "global_step": 206126, "epoch": 4907} {"train_loss": -7.1392693519592285, "global_step": 206127, "epoch": 4907} {"train_loss": -7.355721473693848, "global_step": 206128, "epoch": 4907} {"train_loss": -7.117633819580078, "global_step": 206129, "epoch": 4907} {"train_loss": -7.299504280090332, "global_step": 206130, "epoch": 4907} {"train_loss": -7.227146625518799, "global_step": 206131, "epoch": 4907} {"train_loss": -7.314702987670898, "global_step": 206132, "epoch": 4907} {"train_loss": -7.313514709472656, "global_step": 206133, "epoch": 4907} {"train_loss": -7.142411231994629, "global_step": 206134, "epoch": 4907} {"train_loss": -7.343465453102475, "global_step": 206135, "epoch": 4907, "val_loss": 81678.2734375} {"train_loss": -7.108244895935059, "global_step": 206136, "epoch": 4908} {"train_loss": -7.314817428588867, "global_step": 206137, "epoch": 4908} {"train_loss": -7.188930511474609, "global_step": 206138, "epoch": 4908} {"train_loss": -7.295323371887207, "global_step": 206139, "epoch": 4908} {"train_loss": -7.3021979331970215, "global_step": 206140, "epoch": 4908} {"train_loss": -7.230121612548828, "global_step": 206141, "epoch": 4908} {"train_loss": -7.327654838562012, "global_step": 206142, "epoch": 4908} {"train_loss": -7.1633501052856445, "global_step": 206143, "epoch": 4908} {"train_loss": -7.270363807678223, "global_step": 206144, "epoch": 4908} {"train_loss": -7.226539611816406, "global_step": 206145, "epoch": 4908} {"train_loss": -7.426538467407227, "global_step": 206146, "epoch": 4908} {"train_loss": -7.145054817199707, "global_step": 206147, "epoch": 4908} {"train_loss": -7.211405277252197, "global_step": 206148, "epoch": 4908} {"train_loss": -7.1283278465271, "global_step": 206149, "epoch": 4908} {"train_loss": -7.470362186431885, "global_step": 206150, "epoch": 4908} {"train_loss": -7.152705192565918, "global_step": 206151, "epoch": 4908} {"train_loss": -7.278774261474609, "global_step": 206152, "epoch": 4908} {"train_loss": -7.241869926452637, "global_step": 206153, "epoch": 4908} {"train_loss": -7.258873462677002, "global_step": 206154, "epoch": 4908} {"train_loss": -7.221857070922852, "global_step": 206155, "epoch": 4908} {"train_loss": -7.185062408447266, "global_step": 206156, "epoch": 4908} {"train_loss": -7.149243354797363, "global_step": 206157, "epoch": 4908} {"train_loss": -7.339153289794922, "global_step": 206158, "epoch": 4908} {"train_loss": -7.291524887084961, "global_step": 206159, "epoch": 4908} {"train_loss": -7.1552228927612305, "global_step": 206160, "epoch": 4908} {"train_loss": -7.318039417266846, "global_step": 206161, "epoch": 4908} {"train_loss": -7.203090190887451, "global_step": 206162, "epoch": 4908} {"train_loss": -7.358021259307861, "global_step": 206163, "epoch": 4908} {"train_loss": -7.281939506530762, "global_step": 206164, "epoch": 4908} {"train_loss": -7.347392559051514, "global_step": 206165, "epoch": 4908} {"train_loss": -7.337091445922852, "global_step": 206166, "epoch": 4908} {"train_loss": -7.389508247375488, "global_step": 206167, "epoch": 4908} {"train_loss": -7.349315166473389, "global_step": 206168, "epoch": 4908} {"train_loss": -7.27215576171875, "global_step": 206169, "epoch": 4908} {"train_loss": -7.295260429382324, "global_step": 206170, "epoch": 4908} {"train_loss": -7.213994979858398, "global_step": 206171, "epoch": 4908} {"train_loss": -7.291504859924316, "global_step": 206172, "epoch": 4908} {"train_loss": -7.318918228149414, "global_step": 206173, "epoch": 4908} {"train_loss": -7.292214870452881, "global_step": 206174, "epoch": 4908} {"train_loss": -7.207879543304443, "global_step": 206175, "epoch": 4908} {"train_loss": -7.195255756378174, "global_step": 206176, "epoch": 4908} {"train_loss": -7.264641409828549, "global_step": 206177, "epoch": 4908, "val_loss": 82035.5625} {"train_loss": -7.221968650817871, "global_step": 206178, "epoch": 4909} {"train_loss": -7.3054938316345215, "global_step": 206179, "epoch": 4909} {"train_loss": -7.3312907218933105, "global_step": 206180, "epoch": 4909} {"train_loss": -7.4127302169799805, "global_step": 206181, "epoch": 4909} {"train_loss": -7.398309707641602, "global_step": 206182, "epoch": 4909} {"train_loss": -7.11941385269165, "global_step": 206183, "epoch": 4909} {"train_loss": -7.382709503173828, "global_step": 206184, "epoch": 4909} {"train_loss": -7.315661430358887, "global_step": 206185, "epoch": 4909} {"train_loss": -7.333169937133789, "global_step": 206186, "epoch": 4909} {"train_loss": -7.311247825622559, "global_step": 206187, "epoch": 4909} {"train_loss": -7.389735221862793, "global_step": 206188, "epoch": 4909} {"train_loss": -7.332427024841309, "global_step": 206189, "epoch": 4909} {"train_loss": -7.308313369750977, "global_step": 206190, "epoch": 4909} {"train_loss": -7.391667366027832, "global_step": 206191, "epoch": 4909} {"train_loss": -7.236980438232422, "global_step": 206192, "epoch": 4909} {"train_loss": -7.453431606292725, "global_step": 206193, "epoch": 4909} {"train_loss": -7.337705612182617, "global_step": 206194, "epoch": 4909} {"train_loss": -7.361468315124512, "global_step": 206195, "epoch": 4909} {"train_loss": -7.459722995758057, "global_step": 206196, "epoch": 4909} {"train_loss": -7.403213024139404, "global_step": 206197, "epoch": 4909} {"train_loss": -7.295763969421387, "global_step": 206198, "epoch": 4909} {"train_loss": -7.37208890914917, "global_step": 206199, "epoch": 4909} {"train_loss": -7.368553161621094, "global_step": 206200, "epoch": 4909} {"train_loss": -7.398867130279541, "global_step": 206201, "epoch": 4909} {"train_loss": -7.438300132751465, "global_step": 206202, "epoch": 4909} {"train_loss": -7.237401962280273, "global_step": 206203, "epoch": 4909} {"train_loss": -7.357822895050049, "global_step": 206204, "epoch": 4909} {"train_loss": -7.374911308288574, "global_step": 206205, "epoch": 4909} {"train_loss": -7.224540710449219, "global_step": 206206, "epoch": 4909} {"train_loss": -7.252513885498047, "global_step": 206207, "epoch": 4909} {"train_loss": -7.46474552154541, "global_step": 206208, "epoch": 4909} {"train_loss": -7.28657341003418, "global_step": 206209, "epoch": 4909} {"train_loss": -7.329700469970703, "global_step": 206210, "epoch": 4909} {"train_loss": -7.446271896362305, "global_step": 206211, "epoch": 4909} {"train_loss": -7.3122453689575195, "global_step": 206212, "epoch": 4909} {"train_loss": -7.334331512451172, "global_step": 206213, "epoch": 4909} {"train_loss": -7.358669281005859, "global_step": 206214, "epoch": 4909} {"train_loss": -7.274394512176514, "global_step": 206215, "epoch": 4909} {"train_loss": -7.372954368591309, "global_step": 206216, "epoch": 4909} {"train_loss": -7.337688446044922, "global_step": 206217, "epoch": 4909} {"train_loss": -7.4225568771362305, "global_step": 206218, "epoch": 4909} {"train_loss": -7.34337904339745, "global_step": 206219, "epoch": 4909, "val_loss": 81764.03125} {"train_loss": -7.443416595458984, "global_step": 206220, "epoch": 4910} {"train_loss": -7.400983810424805, "global_step": 206221, "epoch": 4910} {"train_loss": -7.393797397613525, "global_step": 206222, "epoch": 4910} {"train_loss": -7.481802940368652, "global_step": 206223, "epoch": 4910} {"train_loss": -7.3715434074401855, "global_step": 206224, "epoch": 4910} {"train_loss": -7.501123428344727, "global_step": 206225, "epoch": 4910} {"train_loss": -7.404916763305664, "global_step": 206226, "epoch": 4910} {"train_loss": -7.378195285797119, "global_step": 206227, "epoch": 4910} {"train_loss": -7.303002834320068, "global_step": 206228, "epoch": 4910} {"train_loss": -7.305850028991699, "global_step": 206229, "epoch": 4910} {"train_loss": -7.414844989776611, "global_step": 206230, "epoch": 4910} {"train_loss": -7.3853349685668945, "global_step": 206231, "epoch": 4910} {"train_loss": -7.307600021362305, "global_step": 206232, "epoch": 4910} {"train_loss": -7.308358669281006, "global_step": 206233, "epoch": 4910} {"train_loss": -7.330752372741699, "global_step": 206234, "epoch": 4910} {"train_loss": -7.46558952331543, "global_step": 206235, "epoch": 4910} {"train_loss": -7.366966247558594, "global_step": 206236, "epoch": 4910} {"train_loss": -7.228540897369385, "global_step": 206237, "epoch": 4910} {"train_loss": -7.395940780639648, "global_step": 206238, "epoch": 4910} {"train_loss": -7.410974502563477, "global_step": 206239, "epoch": 4910} {"train_loss": -7.468008041381836, "global_step": 206240, "epoch": 4910} {"train_loss": -7.354259490966797, "global_step": 206241, "epoch": 4910} {"train_loss": -7.2838945388793945, "global_step": 206242, "epoch": 4910} {"train_loss": -7.409467697143555, "global_step": 206243, "epoch": 4910} {"train_loss": -7.388810634613037, "global_step": 206244, "epoch": 4910} {"train_loss": -7.342382431030273, "global_step": 206245, "epoch": 4910} {"train_loss": -7.383455276489258, "global_step": 206246, "epoch": 4910} {"train_loss": -7.419349193572998, "global_step": 206247, "epoch": 4910} {"train_loss": -7.4638824462890625, "global_step": 206248, "epoch": 4910} {"train_loss": -7.3211517333984375, "global_step": 206249, "epoch": 4910} {"train_loss": -7.411192893981934, "global_step": 206250, "epoch": 4910} {"train_loss": -7.393256187438965, "global_step": 206251, "epoch": 4910} {"train_loss": -7.436431407928467, "global_step": 206252, "epoch": 4910} {"train_loss": -7.443763732910156, "global_step": 206253, "epoch": 4910} {"train_loss": -7.318471431732178, "global_step": 206254, "epoch": 4910} {"train_loss": -7.450430393218994, "global_step": 206255, "epoch": 4910} {"train_loss": -7.351977348327637, "global_step": 206256, "epoch": 4910} {"train_loss": -7.227964401245117, "global_step": 206257, "epoch": 4910} {"train_loss": -7.317473411560059, "global_step": 206258, "epoch": 4910} {"train_loss": -7.359278678894043, "global_step": 206259, "epoch": 4910} {"train_loss": -7.3118672370910645, "global_step": 206260, "epoch": 4910} {"train_loss": -7.374864101409912, "global_step": 206261, "epoch": 4910, "val_loss": 81751.6640625} {"train_loss": -7.337414741516113, "global_step": 206262, "epoch": 4911} {"train_loss": -7.225437164306641, "global_step": 206263, "epoch": 4911} {"train_loss": -7.314215660095215, "global_step": 206264, "epoch": 4911} {"train_loss": -7.270455837249756, "global_step": 206265, "epoch": 4911} {"train_loss": -7.243229866027832, "global_step": 206266, "epoch": 4911} {"train_loss": -7.412998199462891, "global_step": 206267, "epoch": 4911} {"train_loss": -7.274905204772949, "global_step": 206268, "epoch": 4911} {"train_loss": -7.132349491119385, "global_step": 206269, "epoch": 4911} {"train_loss": -7.436599254608154, "global_step": 206270, "epoch": 4911} {"train_loss": -7.189248561859131, "global_step": 206271, "epoch": 4911} {"train_loss": -7.273828029632568, "global_step": 206272, "epoch": 4911} {"train_loss": -7.229089736938477, "global_step": 206273, "epoch": 4911} {"train_loss": -7.192927837371826, "global_step": 206274, "epoch": 4911} {"train_loss": -7.339437007904053, "global_step": 206275, "epoch": 4911} {"train_loss": -7.372983455657959, "global_step": 206276, "epoch": 4911} {"train_loss": -7.319755554199219, "global_step": 206277, "epoch": 4911} {"train_loss": -7.298415184020996, "global_step": 206278, "epoch": 4911} {"train_loss": -7.379429817199707, "global_step": 206279, "epoch": 4911} {"train_loss": -7.339694976806641, "global_step": 206280, "epoch": 4911} {"train_loss": -7.2805376052856445, "global_step": 206281, "epoch": 4911} {"train_loss": -7.362297534942627, "global_step": 206282, "epoch": 4911} {"train_loss": -7.18422794342041, "global_step": 206283, "epoch": 4911} {"train_loss": -7.407925605773926, "global_step": 206284, "epoch": 4911} {"train_loss": -7.316854953765869, "global_step": 206285, "epoch": 4911} {"train_loss": -7.287495136260986, "global_step": 206286, "epoch": 4911} {"train_loss": -7.329821586608887, "global_step": 206287, "epoch": 4911} {"train_loss": -7.273904800415039, "global_step": 206288, "epoch": 4911} {"train_loss": -7.4145894050598145, "global_step": 206289, "epoch": 4911} {"train_loss": -7.397622585296631, "global_step": 206290, "epoch": 4911} {"train_loss": -7.2291412353515625, "global_step": 206291, "epoch": 4911} {"train_loss": -7.393127918243408, "global_step": 206292, "epoch": 4911} {"train_loss": -7.36275577545166, "global_step": 206293, "epoch": 4911} {"train_loss": -7.357102394104004, "global_step": 206294, "epoch": 4911} {"train_loss": -7.4036545753479, "global_step": 206295, "epoch": 4911} {"train_loss": -7.331272125244141, "global_step": 206296, "epoch": 4911} {"train_loss": -7.312097072601318, "global_step": 206297, "epoch": 4911} {"train_loss": -7.342911243438721, "global_step": 206298, "epoch": 4911} {"train_loss": -7.412542343139648, "global_step": 206299, "epoch": 4911} {"train_loss": -7.243934154510498, "global_step": 206300, "epoch": 4911} {"train_loss": -7.312020778656006, "global_step": 206301, "epoch": 4911} {"train_loss": -7.249543190002441, "global_step": 206302, "epoch": 4911} {"train_loss": -7.313717762629191, "global_step": 206303, "epoch": 4911, "val_loss": 81710.03125} {"train_loss": -7.436049461364746, "global_step": 206304, "epoch": 4912} {"train_loss": -7.2340826988220215, "global_step": 206305, "epoch": 4912} {"train_loss": -7.366367816925049, "global_step": 206306, "epoch": 4912} {"train_loss": -7.344454288482666, "global_step": 206307, "epoch": 4912} {"train_loss": -7.3200788497924805, "global_step": 206308, "epoch": 4912} {"train_loss": -7.359647750854492, "global_step": 206309, "epoch": 4912} {"train_loss": -7.205939292907715, "global_step": 206310, "epoch": 4912} {"train_loss": -7.394495010375977, "global_step": 206311, "epoch": 4912} {"train_loss": -7.319625377655029, "global_step": 206312, "epoch": 4912} {"train_loss": -7.404507637023926, "global_step": 206313, "epoch": 4912} {"train_loss": -7.351864814758301, "global_step": 206314, "epoch": 4912} {"train_loss": -7.333158493041992, "global_step": 206315, "epoch": 4912} {"train_loss": -7.453305244445801, "global_step": 206316, "epoch": 4912} {"train_loss": -7.362052917480469, "global_step": 206317, "epoch": 4912} {"train_loss": -7.297638893127441, "global_step": 206318, "epoch": 4912} {"train_loss": -7.363528251647949, "global_step": 206319, "epoch": 4912} {"train_loss": -7.313279628753662, "global_step": 206320, "epoch": 4912} {"train_loss": -7.328093528747559, "global_step": 206321, "epoch": 4912} {"train_loss": -7.417197227478027, "global_step": 206322, "epoch": 4912} {"train_loss": -7.345486164093018, "global_step": 206323, "epoch": 4912} {"train_loss": -7.288556098937988, "global_step": 206324, "epoch": 4912} {"train_loss": -7.325541973114014, "global_step": 206325, "epoch": 4912} {"train_loss": -7.259894371032715, "global_step": 206326, "epoch": 4912} {"train_loss": -7.217608451843262, "global_step": 206327, "epoch": 4912} {"train_loss": -7.301148414611816, "global_step": 206328, "epoch": 4912} {"train_loss": -7.1977996826171875, "global_step": 206329, "epoch": 4912} {"train_loss": -7.332684516906738, "global_step": 206330, "epoch": 4912} {"train_loss": -7.178012371063232, "global_step": 206331, "epoch": 4912} {"train_loss": -7.191761493682861, "global_step": 206332, "epoch": 4912} {"train_loss": -7.297707557678223, "global_step": 206333, "epoch": 4912} {"train_loss": -7.25697135925293, "global_step": 206334, "epoch": 4912} {"train_loss": -7.352513313293457, "global_step": 206335, "epoch": 4912} {"train_loss": -7.35143518447876, "global_step": 206336, "epoch": 4912} {"train_loss": -7.216310024261475, "global_step": 206337, "epoch": 4912} {"train_loss": -7.247516632080078, "global_step": 206338, "epoch": 4912} {"train_loss": -7.237461566925049, "global_step": 206339, "epoch": 4912} {"train_loss": -7.361021041870117, "global_step": 206340, "epoch": 4912} {"train_loss": -7.255349159240723, "global_step": 206341, "epoch": 4912} {"train_loss": -7.249533176422119, "global_step": 206342, "epoch": 4912} {"train_loss": -7.30068826675415, "global_step": 206343, "epoch": 4912} {"train_loss": -7.36588191986084, "global_step": 206344, "epoch": 4912} {"train_loss": -7.309850113732474, "global_step": 206345, "epoch": 4912, "val_loss": 82068.3125} {"train_loss": -7.141670227050781, "global_step": 206346, "epoch": 4913} {"train_loss": -7.355009078979492, "global_step": 206347, "epoch": 4913} {"train_loss": -7.479432106018066, "global_step": 206348, "epoch": 4913} {"train_loss": -7.266676902770996, "global_step": 206349, "epoch": 4913} {"train_loss": -7.4337873458862305, "global_step": 206350, "epoch": 4913} {"train_loss": -7.308618545532227, "global_step": 206351, "epoch": 4913} {"train_loss": -7.3096466064453125, "global_step": 206352, "epoch": 4913} {"train_loss": -7.2637786865234375, "global_step": 206353, "epoch": 4913} {"train_loss": -7.193154335021973, "global_step": 206354, "epoch": 4913} {"train_loss": -7.301619529724121, "global_step": 206355, "epoch": 4913} {"train_loss": -7.376392364501953, "global_step": 206356, "epoch": 4913} {"train_loss": -7.297362327575684, "global_step": 206357, "epoch": 4913} {"train_loss": -7.30186653137207, "global_step": 206358, "epoch": 4913} {"train_loss": -7.3148698806762695, "global_step": 206359, "epoch": 4913} {"train_loss": -7.239741325378418, "global_step": 206360, "epoch": 4913} {"train_loss": -7.331928253173828, "global_step": 206361, "epoch": 4913} {"train_loss": -7.304967880249023, "global_step": 206362, "epoch": 4913} {"train_loss": -7.34249210357666, "global_step": 206363, "epoch": 4913} {"train_loss": -7.133627891540527, "global_step": 206364, "epoch": 4913} {"train_loss": -7.198993682861328, "global_step": 206365, "epoch": 4913} {"train_loss": -7.326564311981201, "global_step": 206366, "epoch": 4913} {"train_loss": -7.1458001136779785, "global_step": 206367, "epoch": 4913} {"train_loss": -7.295994281768799, "global_step": 206368, "epoch": 4913} {"train_loss": -7.206960678100586, "global_step": 206369, "epoch": 4913} {"train_loss": -7.357728958129883, "global_step": 206370, "epoch": 4913} {"train_loss": -7.270771026611328, "global_step": 206371, "epoch": 4913} {"train_loss": -7.28256368637085, "global_step": 206372, "epoch": 4913} {"train_loss": -7.232341289520264, "global_step": 206373, "epoch": 4913} {"train_loss": -7.188631534576416, "global_step": 206374, "epoch": 4913} {"train_loss": -7.3136138916015625, "global_step": 206375, "epoch": 4913} {"train_loss": -7.326964855194092, "global_step": 206376, "epoch": 4913} {"train_loss": -7.41490364074707, "global_step": 206377, "epoch": 4913} {"train_loss": -7.239799976348877, "global_step": 206378, "epoch": 4913} {"train_loss": -7.2760396003723145, "global_step": 206379, "epoch": 4913} {"train_loss": -7.298142433166504, "global_step": 206380, "epoch": 4913} {"train_loss": -7.267683982849121, "global_step": 206381, "epoch": 4913} {"train_loss": -7.430793285369873, "global_step": 206382, "epoch": 4913} {"train_loss": -7.204422473907471, "global_step": 206383, "epoch": 4913} {"train_loss": -7.194531440734863, "global_step": 206384, "epoch": 4913} {"train_loss": -7.24260139465332, "global_step": 206385, "epoch": 4913} {"train_loss": -7.268680572509766, "global_step": 206386, "epoch": 4913} {"train_loss": -7.2837005115690685, "global_step": 206387, "epoch": 4913, "val_loss": 81585.3125} {"train_loss": -7.23165225982666, "global_step": 206388, "epoch": 4914} {"train_loss": -7.209600925445557, "global_step": 206389, "epoch": 4914} {"train_loss": -7.274360656738281, "global_step": 206390, "epoch": 4914} {"train_loss": -7.297604560852051, "global_step": 206391, "epoch": 4914} {"train_loss": -7.182835578918457, "global_step": 206392, "epoch": 4914} {"train_loss": -7.2460408210754395, "global_step": 206393, "epoch": 4914} {"train_loss": -7.452113628387451, "global_step": 206394, "epoch": 4914} {"train_loss": -7.172033786773682, "global_step": 206395, "epoch": 4914} {"train_loss": -7.30054235458374, "global_step": 206396, "epoch": 4914} {"train_loss": -7.285693168640137, "global_step": 206397, "epoch": 4914} {"train_loss": -7.254558563232422, "global_step": 206398, "epoch": 4914} {"train_loss": -7.269036293029785, "global_step": 206399, "epoch": 4914} {"train_loss": -7.26664924621582, "global_step": 206400, "epoch": 4914} {"train_loss": -7.087194919586182, "global_step": 206401, "epoch": 4914} {"train_loss": -7.297431468963623, "global_step": 206402, "epoch": 4914} {"train_loss": -7.313253879547119, "global_step": 206403, "epoch": 4914} {"train_loss": -7.297255992889404, "global_step": 206404, "epoch": 4914} {"train_loss": -7.31442928314209, "global_step": 206405, "epoch": 4914} {"train_loss": -7.326613426208496, "global_step": 206406, "epoch": 4914} {"train_loss": -7.345073699951172, "global_step": 206407, "epoch": 4914} {"train_loss": -7.273205757141113, "global_step": 206408, "epoch": 4914} {"train_loss": -7.375706672668457, "global_step": 206409, "epoch": 4914} {"train_loss": -7.389814376831055, "global_step": 206410, "epoch": 4914} {"train_loss": -7.312997817993164, "global_step": 206411, "epoch": 4914} {"train_loss": -7.289834976196289, "global_step": 206412, "epoch": 4914} {"train_loss": -7.305774211883545, "global_step": 206413, "epoch": 4914} {"train_loss": -7.381466865539551, "global_step": 206414, "epoch": 4914} {"train_loss": -7.300319671630859, "global_step": 206415, "epoch": 4914} {"train_loss": -7.394294738769531, "global_step": 206416, "epoch": 4914} {"train_loss": -7.398856163024902, "global_step": 206417, "epoch": 4914} {"train_loss": -7.281435966491699, "global_step": 206418, "epoch": 4914} {"train_loss": -7.392362117767334, "global_step": 206419, "epoch": 4914} {"train_loss": -7.308615207672119, "global_step": 206420, "epoch": 4914} {"train_loss": -7.377826690673828, "global_step": 206421, "epoch": 4914} {"train_loss": -7.423600196838379, "global_step": 206422, "epoch": 4914} {"train_loss": -7.310949325561523, "global_step": 206423, "epoch": 4914} {"train_loss": -7.420227527618408, "global_step": 206424, "epoch": 4914} {"train_loss": -7.40564489364624, "global_step": 206425, "epoch": 4914} {"train_loss": -7.337521553039551, "global_step": 206426, "epoch": 4914} {"train_loss": -7.3441386222839355, "global_step": 206427, "epoch": 4914} {"train_loss": -7.265384674072266, "global_step": 206428, "epoch": 4914} {"train_loss": -7.312556664148967, "global_step": 206429, "epoch": 4914, "val_loss": 81840.875} {"train_loss": -7.473457336425781, "global_step": 206430, "epoch": 4915} {"train_loss": -7.521842002868652, "global_step": 206431, "epoch": 4915} {"train_loss": -7.421614646911621, "global_step": 206432, "epoch": 4915} {"train_loss": -7.485299110412598, "global_step": 206433, "epoch": 4915} {"train_loss": -7.492090702056885, "global_step": 206434, "epoch": 4915} {"train_loss": -7.4075236320495605, "global_step": 206435, "epoch": 4915} {"train_loss": -7.482467174530029, "global_step": 206436, "epoch": 4915} {"train_loss": -7.435802459716797, "global_step": 206437, "epoch": 4915} {"train_loss": -7.452610015869141, "global_step": 206438, "epoch": 4915} {"train_loss": -7.49576473236084, "global_step": 206439, "epoch": 4915} {"train_loss": -7.488950729370117, "global_step": 206440, "epoch": 4915} {"train_loss": -7.377946853637695, "global_step": 206441, "epoch": 4915} {"train_loss": -7.408699989318848, "global_step": 206442, "epoch": 4915} {"train_loss": -7.444249153137207, "global_step": 206443, "epoch": 4915} {"train_loss": -7.462746620178223, "global_step": 206444, "epoch": 4915} {"train_loss": -7.484185218811035, "global_step": 206445, "epoch": 4915} {"train_loss": -7.362601280212402, "global_step": 206446, "epoch": 4915} {"train_loss": -7.427249908447266, "global_step": 206447, "epoch": 4915} {"train_loss": -7.2438483238220215, "global_step": 206448, "epoch": 4915} {"train_loss": -7.43873929977417, "global_step": 206449, "epoch": 4915} {"train_loss": -7.400462627410889, "global_step": 206450, "epoch": 4915} {"train_loss": -7.312026500701904, "global_step": 206451, "epoch": 4915} {"train_loss": -7.401589393615723, "global_step": 206452, "epoch": 4915} {"train_loss": -7.350269317626953, "global_step": 206453, "epoch": 4915} {"train_loss": -7.18858528137207, "global_step": 206454, "epoch": 4915} {"train_loss": -7.462177276611328, "global_step": 206455, "epoch": 4915} {"train_loss": -7.437803268432617, "global_step": 206456, "epoch": 4915} {"train_loss": -7.340967178344727, "global_step": 206457, "epoch": 4915} {"train_loss": -7.39180850982666, "global_step": 206458, "epoch": 4915} {"train_loss": -7.192024230957031, "global_step": 206459, "epoch": 4915} {"train_loss": -7.370162010192871, "global_step": 206460, "epoch": 4915} {"train_loss": -7.476668357849121, "global_step": 206461, "epoch": 4915} {"train_loss": -7.239825248718262, "global_step": 206462, "epoch": 4915} {"train_loss": -7.322049140930176, "global_step": 206463, "epoch": 4915} {"train_loss": -7.3856048583984375, "global_step": 206464, "epoch": 4915} {"train_loss": -7.386850357055664, "global_step": 206465, "epoch": 4915} {"train_loss": -7.377352714538574, "global_step": 206466, "epoch": 4915} {"train_loss": -7.460735321044922, "global_step": 206467, "epoch": 4915} {"train_loss": -7.26836633682251, "global_step": 206468, "epoch": 4915} {"train_loss": -7.399606704711914, "global_step": 206469, "epoch": 4915} {"train_loss": -7.278105735778809, "global_step": 206470, "epoch": 4915} {"train_loss": -7.3948948837461925, "global_step": 206471, "epoch": 4915, "val_loss": 81891.28125} {"train_loss": -7.410143852233887, "global_step": 206472, "epoch": 4916} {"train_loss": -7.354561805725098, "global_step": 206473, "epoch": 4916} {"train_loss": -7.431385040283203, "global_step": 206474, "epoch": 4916} {"train_loss": -7.406228065490723, "global_step": 206475, "epoch": 4916} {"train_loss": -7.377107620239258, "global_step": 206476, "epoch": 4916} {"train_loss": -7.314064025878906, "global_step": 206477, "epoch": 4916} {"train_loss": -7.40203332901001, "global_step": 206478, "epoch": 4916} {"train_loss": -7.418063163757324, "global_step": 206479, "epoch": 4916} {"train_loss": -7.390674591064453, "global_step": 206480, "epoch": 4916} {"train_loss": -7.448173522949219, "global_step": 206481, "epoch": 4916} {"train_loss": -7.538661956787109, "global_step": 206482, "epoch": 4916} {"train_loss": -7.283818244934082, "global_step": 206483, "epoch": 4916} {"train_loss": -7.5520853996276855, "global_step": 206484, "epoch": 4916} {"train_loss": -7.440848350524902, "global_step": 206485, "epoch": 4916} {"train_loss": -7.460726737976074, "global_step": 206486, "epoch": 4916} {"train_loss": -7.3840460777282715, "global_step": 206487, "epoch": 4916} {"train_loss": -7.342509746551514, "global_step": 206488, "epoch": 4916} {"train_loss": -7.474174499511719, "global_step": 206489, "epoch": 4916} {"train_loss": -7.388802528381348, "global_step": 206490, "epoch": 4916} {"train_loss": -7.441381454467773, "global_step": 206491, "epoch": 4916} {"train_loss": -7.245736122131348, "global_step": 206492, "epoch": 4916} {"train_loss": -7.398937702178955, "global_step": 206493, "epoch": 4916} {"train_loss": -7.301425933837891, "global_step": 206494, "epoch": 4916} {"train_loss": -7.325839996337891, "global_step": 206495, "epoch": 4916} {"train_loss": -7.435508728027344, "global_step": 206496, "epoch": 4916} {"train_loss": -7.332257270812988, "global_step": 206497, "epoch": 4916} {"train_loss": -7.449768543243408, "global_step": 206498, "epoch": 4916} {"train_loss": -7.26654052734375, "global_step": 206499, "epoch": 4916} {"train_loss": -7.410163879394531, "global_step": 206500, "epoch": 4916} {"train_loss": -7.309291839599609, "global_step": 206501, "epoch": 4916} {"train_loss": -7.2423906326293945, "global_step": 206502, "epoch": 4916} {"train_loss": -7.428264141082764, "global_step": 206503, "epoch": 4916} {"train_loss": -7.26157283782959, "global_step": 206504, "epoch": 4916} {"train_loss": -7.061759948730469, "global_step": 206505, "epoch": 4916} {"train_loss": -7.4216413497924805, "global_step": 206506, "epoch": 4916} {"train_loss": -7.251701354980469, "global_step": 206507, "epoch": 4916} {"train_loss": -7.2359161376953125, "global_step": 206508, "epoch": 4916} {"train_loss": -7.447979927062988, "global_step": 206509, "epoch": 4916} {"train_loss": -7.256567001342773, "global_step": 206510, "epoch": 4916} {"train_loss": -7.331012725830078, "global_step": 206511, "epoch": 4916} {"train_loss": -7.299050331115723, "global_step": 206512, "epoch": 4916} {"train_loss": -7.3621613298143656, "global_step": 206513, "epoch": 4916, "val_loss": 81631.2265625} {"train_loss": -7.28727912902832, "global_step": 206514, "epoch": 4917} {"train_loss": -7.258258819580078, "global_step": 206515, "epoch": 4917} {"train_loss": -7.239894390106201, "global_step": 206516, "epoch": 4917} {"train_loss": -7.36865234375, "global_step": 206517, "epoch": 4917} {"train_loss": -7.274805545806885, "global_step": 206518, "epoch": 4917} {"train_loss": -7.249683380126953, "global_step": 206519, "epoch": 4917} {"train_loss": -7.274932384490967, "global_step": 206520, "epoch": 4917} {"train_loss": -7.29270076751709, "global_step": 206521, "epoch": 4917} {"train_loss": -7.194576263427734, "global_step": 206522, "epoch": 4917} {"train_loss": -7.279362678527832, "global_step": 206523, "epoch": 4917} {"train_loss": -7.201696395874023, "global_step": 206524, "epoch": 4917} {"train_loss": -7.2952375411987305, "global_step": 206525, "epoch": 4917} {"train_loss": -7.254213333129883, "global_step": 206526, "epoch": 4917} {"train_loss": -7.363547325134277, "global_step": 206527, "epoch": 4917} {"train_loss": -7.258510589599609, "global_step": 206528, "epoch": 4917} {"train_loss": -7.235817909240723, "global_step": 206529, "epoch": 4917} {"train_loss": -7.3260908126831055, "global_step": 206530, "epoch": 4917} {"train_loss": -7.357455253601074, "global_step": 206531, "epoch": 4917} {"train_loss": -7.3556318283081055, "global_step": 206532, "epoch": 4917} {"train_loss": -7.269275665283203, "global_step": 206533, "epoch": 4917} {"train_loss": -7.324464797973633, "global_step": 206534, "epoch": 4917} {"train_loss": -7.358044147491455, "global_step": 206535, "epoch": 4917} {"train_loss": -7.351400852203369, "global_step": 206536, "epoch": 4917} {"train_loss": -7.372849464416504, "global_step": 206537, "epoch": 4917} {"train_loss": -7.3498430252075195, "global_step": 206538, "epoch": 4917} {"train_loss": -7.261347770690918, "global_step": 206539, "epoch": 4917} {"train_loss": -7.378681182861328, "global_step": 206540, "epoch": 4917} {"train_loss": -7.183850288391113, "global_step": 206541, "epoch": 4917} {"train_loss": -7.258655548095703, "global_step": 206542, "epoch": 4917} {"train_loss": -7.3121185302734375, "global_step": 206543, "epoch": 4917} {"train_loss": -7.169112682342529, "global_step": 206544, "epoch": 4917} {"train_loss": -7.441592216491699, "global_step": 206545, "epoch": 4917} {"train_loss": -7.253385066986084, "global_step": 206546, "epoch": 4917} {"train_loss": -7.342518329620361, "global_step": 206547, "epoch": 4917} {"train_loss": -7.291242599487305, "global_step": 206548, "epoch": 4917} {"train_loss": -7.228982448577881, "global_step": 206549, "epoch": 4917} {"train_loss": -7.334474563598633, "global_step": 206550, "epoch": 4917} {"train_loss": -7.396461486816406, "global_step": 206551, "epoch": 4917} {"train_loss": -7.223252296447754, "global_step": 206552, "epoch": 4917} {"train_loss": -7.26186466217041, "global_step": 206553, "epoch": 4917} {"train_loss": -7.260711669921875, "global_step": 206554, "epoch": 4917} {"train_loss": -7.294011524745396, "global_step": 206555, "epoch": 4917, "val_loss": 81726.2265625} {"train_loss": -7.096489906311035, "global_step": 206556, "epoch": 4918} {"train_loss": -7.3252763748168945, "global_step": 206557, "epoch": 4918} {"train_loss": -7.099386215209961, "global_step": 206558, "epoch": 4918} {"train_loss": -7.356363296508789, "global_step": 206559, "epoch": 4918} {"train_loss": -7.270960807800293, "global_step": 206560, "epoch": 4918} {"train_loss": -7.251953601837158, "global_step": 206561, "epoch": 4918} {"train_loss": -7.324862957000732, "global_step": 206562, "epoch": 4918} {"train_loss": -7.173689842224121, "global_step": 206563, "epoch": 4918} {"train_loss": -7.294410705566406, "global_step": 206564, "epoch": 4918} {"train_loss": -7.343118190765381, "global_step": 206565, "epoch": 4918} {"train_loss": -7.1678466796875, "global_step": 206566, "epoch": 4918} {"train_loss": -7.187925338745117, "global_step": 206567, "epoch": 4918} {"train_loss": -7.288707733154297, "global_step": 206568, "epoch": 4918} {"train_loss": -7.169089317321777, "global_step": 206569, "epoch": 4918} {"train_loss": -7.234536647796631, "global_step": 206570, "epoch": 4918} {"train_loss": -7.322548866271973, "global_step": 206571, "epoch": 4918} {"train_loss": -7.2980780601501465, "global_step": 206572, "epoch": 4918} {"train_loss": -7.264858722686768, "global_step": 206573, "epoch": 4918} {"train_loss": -7.190483093261719, "global_step": 206574, "epoch": 4918} {"train_loss": -7.346267223358154, "global_step": 206575, "epoch": 4918} {"train_loss": -7.321023941040039, "global_step": 206576, "epoch": 4918} {"train_loss": -7.153733253479004, "global_step": 206577, "epoch": 4918} {"train_loss": -7.334554195404053, "global_step": 206578, "epoch": 4918} {"train_loss": -7.296109199523926, "global_step": 206579, "epoch": 4918} {"train_loss": -7.28631591796875, "global_step": 206580, "epoch": 4918} {"train_loss": -7.294619560241699, "global_step": 206581, "epoch": 4918} {"train_loss": -7.322887420654297, "global_step": 206582, "epoch": 4918} {"train_loss": -7.34989070892334, "global_step": 206583, "epoch": 4918} {"train_loss": -7.386590957641602, "global_step": 206584, "epoch": 4918} {"train_loss": -7.309398651123047, "global_step": 206585, "epoch": 4918} {"train_loss": -7.421418190002441, "global_step": 206586, "epoch": 4918} {"train_loss": -7.43564510345459, "global_step": 206587, "epoch": 4918} {"train_loss": -7.2935638427734375, "global_step": 206588, "epoch": 4918} {"train_loss": -7.406083106994629, "global_step": 206589, "epoch": 4918} {"train_loss": -7.40366268157959, "global_step": 206590, "epoch": 4918} {"train_loss": -7.269680023193359, "global_step": 206591, "epoch": 4918} {"train_loss": -7.44273042678833, "global_step": 206592, "epoch": 4918} {"train_loss": -7.410599708557129, "global_step": 206593, "epoch": 4918} {"train_loss": -7.506566047668457, "global_step": 206594, "epoch": 4918} {"train_loss": -7.403755187988281, "global_step": 206595, "epoch": 4918} {"train_loss": -7.342909812927246, "global_step": 206596, "epoch": 4918} {"train_loss": -7.303114153089977, "global_step": 206597, "epoch": 4918, "val_loss": 81991.0546875} {"train_loss": -7.309004306793213, "global_step": 206598, "epoch": 4919} {"train_loss": -7.345266342163086, "global_step": 206599, "epoch": 4919} {"train_loss": -7.3106160163879395, "global_step": 206600, "epoch": 4919} {"train_loss": -7.38291072845459, "global_step": 206601, "epoch": 4919} {"train_loss": -7.450774192810059, "global_step": 206602, "epoch": 4919} {"train_loss": -7.407597064971924, "global_step": 206603, "epoch": 4919} {"train_loss": -7.417144298553467, "global_step": 206604, "epoch": 4919} {"train_loss": -7.401216506958008, "global_step": 206605, "epoch": 4919} {"train_loss": -7.426033020019531, "global_step": 206606, "epoch": 4919} {"train_loss": -7.4073896408081055, "global_step": 206607, "epoch": 4919} {"train_loss": -7.3274688720703125, "global_step": 206608, "epoch": 4919} {"train_loss": -7.410841464996338, "global_step": 206609, "epoch": 4919} {"train_loss": -7.337093353271484, "global_step": 206610, "epoch": 4919} {"train_loss": -7.301969051361084, "global_step": 206611, "epoch": 4919} {"train_loss": -7.3261942863464355, "global_step": 206612, "epoch": 4919} {"train_loss": -7.309251308441162, "global_step": 206613, "epoch": 4919} {"train_loss": -7.32720422744751, "global_step": 206614, "epoch": 4919} {"train_loss": -7.410557270050049, "global_step": 206615, "epoch": 4919} {"train_loss": -7.256999969482422, "global_step": 206616, "epoch": 4919} {"train_loss": -7.368537425994873, "global_step": 206617, "epoch": 4919} {"train_loss": -7.295633316040039, "global_step": 206618, "epoch": 4919} {"train_loss": -7.326563835144043, "global_step": 206619, "epoch": 4919} {"train_loss": -7.3357954025268555, "global_step": 206620, "epoch": 4919} {"train_loss": -7.388814926147461, "global_step": 206621, "epoch": 4919} {"train_loss": -7.330109596252441, "global_step": 206622, "epoch": 4919} {"train_loss": -7.409493923187256, "global_step": 206623, "epoch": 4919} {"train_loss": -7.304648399353027, "global_step": 206624, "epoch": 4919} {"train_loss": -7.457343578338623, "global_step": 206625, "epoch": 4919} {"train_loss": -7.404078483581543, "global_step": 206626, "epoch": 4919} {"train_loss": -7.294824123382568, "global_step": 206627, "epoch": 4919} {"train_loss": -7.39218807220459, "global_step": 206628, "epoch": 4919} {"train_loss": -7.46602725982666, "global_step": 206629, "epoch": 4919} {"train_loss": -7.271125793457031, "global_step": 206630, "epoch": 4919} {"train_loss": -7.392560958862305, "global_step": 206631, "epoch": 4919} {"train_loss": -7.293453693389893, "global_step": 206632, "epoch": 4919} {"train_loss": -7.3840436935424805, "global_step": 206633, "epoch": 4919} {"train_loss": -7.462059020996094, "global_step": 206634, "epoch": 4919} {"train_loss": -7.294425010681152, "global_step": 206635, "epoch": 4919} {"train_loss": -7.311557769775391, "global_step": 206636, "epoch": 4919} {"train_loss": -7.385726451873779, "global_step": 206637, "epoch": 4919} {"train_loss": -7.37447452545166, "global_step": 206638, "epoch": 4919} {"train_loss": -7.362904037748065, "global_step": 206639, "epoch": 4919, "val_loss": 82020.515625} {"train_loss": -7.4257893562316895, "global_step": 206640, "epoch": 4920} {"train_loss": -7.224689960479736, "global_step": 206641, "epoch": 4920} {"train_loss": -7.1725006103515625, "global_step": 206642, "epoch": 4920} {"train_loss": -7.208196640014648, "global_step": 206643, "epoch": 4920} {"train_loss": -7.333719253540039, "global_step": 206644, "epoch": 4920} {"train_loss": -7.3659820556640625, "global_step": 206645, "epoch": 4920} {"train_loss": -7.323326110839844, "global_step": 206646, "epoch": 4920} {"train_loss": -7.29400110244751, "global_step": 206647, "epoch": 4920} {"train_loss": -7.337041854858398, "global_step": 206648, "epoch": 4920} {"train_loss": -7.113523483276367, "global_step": 206649, "epoch": 4920} {"train_loss": -7.268087863922119, "global_step": 206650, "epoch": 4920} {"train_loss": -7.28892707824707, "global_step": 206651, "epoch": 4920} {"train_loss": -7.065443992614746, "global_step": 206652, "epoch": 4920} {"train_loss": -7.24808931350708, "global_step": 206653, "epoch": 4920} {"train_loss": -7.166637897491455, "global_step": 206654, "epoch": 4920} {"train_loss": -7.074780464172363, "global_step": 206655, "epoch": 4920} {"train_loss": -7.242047309875488, "global_step": 206656, "epoch": 4920} {"train_loss": -7.21829891204834, "global_step": 206657, "epoch": 4920} {"train_loss": -7.203292369842529, "global_step": 206658, "epoch": 4920} {"train_loss": -7.240777015686035, "global_step": 206659, "epoch": 4920} {"train_loss": -7.307034492492676, "global_step": 206660, "epoch": 4920} {"train_loss": -7.146504878997803, "global_step": 206661, "epoch": 4920} {"train_loss": -7.223424434661865, "global_step": 206662, "epoch": 4920} {"train_loss": -7.227721214294434, "global_step": 206663, "epoch": 4920} {"train_loss": -7.302162170410156, "global_step": 206664, "epoch": 4920} {"train_loss": -7.309831619262695, "global_step": 206665, "epoch": 4920} {"train_loss": -7.32035493850708, "global_step": 206666, "epoch": 4920} {"train_loss": -7.146904945373535, "global_step": 206667, "epoch": 4920} {"train_loss": -7.292558670043945, "global_step": 206668, "epoch": 4920} {"train_loss": -7.275016784667969, "global_step": 206669, "epoch": 4920} {"train_loss": -7.255823612213135, "global_step": 206670, "epoch": 4920} {"train_loss": -7.1257219314575195, "global_step": 206671, "epoch": 4920} {"train_loss": -7.325267791748047, "global_step": 206672, "epoch": 4920} {"train_loss": -7.333280086517334, "global_step": 206673, "epoch": 4920} {"train_loss": -7.340382099151611, "global_step": 206674, "epoch": 4920} {"train_loss": -7.375128746032715, "global_step": 206675, "epoch": 4920} {"train_loss": -7.360387325286865, "global_step": 206676, "epoch": 4920} {"train_loss": -7.416995048522949, "global_step": 206677, "epoch": 4920} {"train_loss": -7.3394389152526855, "global_step": 206678, "epoch": 4920} {"train_loss": -7.329473972320557, "global_step": 206679, "epoch": 4920} {"train_loss": -7.328094482421875, "global_step": 206680, "epoch": 4920} {"train_loss": -7.26893112772987, "global_step": 206681, "epoch": 4920, "val_loss": 82041.1796875} {"train_loss": -7.281092643737793, "global_step": 206682, "epoch": 4921} {"train_loss": -7.2808966636657715, "global_step": 206683, "epoch": 4921} {"train_loss": -7.245931148529053, "global_step": 206684, "epoch": 4921} {"train_loss": -7.3208136558532715, "global_step": 206685, "epoch": 4921} {"train_loss": -7.338106155395508, "global_step": 206686, "epoch": 4921} {"train_loss": -7.348021507263184, "global_step": 206687, "epoch": 4921} {"train_loss": -7.243119239807129, "global_step": 206688, "epoch": 4921} {"train_loss": -7.2270402908325195, "global_step": 206689, "epoch": 4921} {"train_loss": -7.349327087402344, "global_step": 206690, "epoch": 4921} {"train_loss": -7.149144172668457, "global_step": 206691, "epoch": 4921} {"train_loss": -7.134958267211914, "global_step": 206692, "epoch": 4921} {"train_loss": -7.329171180725098, "global_step": 206693, "epoch": 4921} {"train_loss": -7.227386474609375, "global_step": 206694, "epoch": 4921} {"train_loss": -7.329307556152344, "global_step": 206695, "epoch": 4921} {"train_loss": -7.202592372894287, "global_step": 206696, "epoch": 4921} {"train_loss": -7.207617282867432, "global_step": 206697, "epoch": 4921} {"train_loss": -7.1918535232543945, "global_step": 206698, "epoch": 4921} {"train_loss": -7.196991920471191, "global_step": 206699, "epoch": 4921} {"train_loss": -7.336139678955078, "global_step": 206700, "epoch": 4921} {"train_loss": -7.281406879425049, "global_step": 206701, "epoch": 4921} {"train_loss": -7.203200340270996, "global_step": 206702, "epoch": 4921} {"train_loss": -7.267312049865723, "global_step": 206703, "epoch": 4921} {"train_loss": -7.349834442138672, "global_step": 206704, "epoch": 4921} {"train_loss": -7.2562360763549805, "global_step": 206705, "epoch": 4921} {"train_loss": -7.319126129150391, "global_step": 206706, "epoch": 4921} {"train_loss": -7.331997871398926, "global_step": 206707, "epoch": 4921} {"train_loss": -7.248616695404053, "global_step": 206708, "epoch": 4921} {"train_loss": -7.428893089294434, "global_step": 206709, "epoch": 4921} {"train_loss": -7.279074192047119, "global_step": 206710, "epoch": 4921} {"train_loss": -7.394138813018799, "global_step": 206711, "epoch": 4921} {"train_loss": -7.445612907409668, "global_step": 206712, "epoch": 4921} {"train_loss": -7.220244407653809, "global_step": 206713, "epoch": 4921} {"train_loss": -7.4223151206970215, "global_step": 206714, "epoch": 4921} {"train_loss": -7.3320465087890625, "global_step": 206715, "epoch": 4921} {"train_loss": -7.44862174987793, "global_step": 206716, "epoch": 4921} {"train_loss": -7.375607967376709, "global_step": 206717, "epoch": 4921} {"train_loss": -7.390782356262207, "global_step": 206718, "epoch": 4921} {"train_loss": -7.445923805236816, "global_step": 206719, "epoch": 4921} {"train_loss": -7.169917106628418, "global_step": 206720, "epoch": 4921} {"train_loss": -7.423582077026367, "global_step": 206721, "epoch": 4921} {"train_loss": -7.307470798492432, "global_step": 206722, "epoch": 4921} {"train_loss": -7.298907790865217, "global_step": 206723, "epoch": 4921, "val_loss": 81613.9609375} {"train_loss": -7.389493942260742, "global_step": 206724, "epoch": 4922} {"train_loss": -7.28236198425293, "global_step": 206725, "epoch": 4922} {"train_loss": -7.364752292633057, "global_step": 206726, "epoch": 4922} {"train_loss": -7.298081874847412, "global_step": 206727, "epoch": 4922} {"train_loss": -7.348876476287842, "global_step": 206728, "epoch": 4922} {"train_loss": -7.345386028289795, "global_step": 206729, "epoch": 4922} {"train_loss": -7.254180908203125, "global_step": 206730, "epoch": 4922} {"train_loss": -7.3257246017456055, "global_step": 206731, "epoch": 4922} {"train_loss": -7.409404277801514, "global_step": 206732, "epoch": 4922} {"train_loss": -7.3593831062316895, "global_step": 206733, "epoch": 4922} {"train_loss": -7.380898475646973, "global_step": 206734, "epoch": 4922} {"train_loss": -7.4352264404296875, "global_step": 206735, "epoch": 4922} {"train_loss": -7.458491802215576, "global_step": 206736, "epoch": 4922} {"train_loss": -7.330575942993164, "global_step": 206737, "epoch": 4922} {"train_loss": -7.413562774658203, "global_step": 206738, "epoch": 4922} {"train_loss": -7.420501708984375, "global_step": 206739, "epoch": 4922} {"train_loss": -7.273358345031738, "global_step": 206740, "epoch": 4922} {"train_loss": -7.411890506744385, "global_step": 206741, "epoch": 4922} {"train_loss": -7.362900733947754, "global_step": 206742, "epoch": 4922} {"train_loss": -7.361414909362793, "global_step": 206743, "epoch": 4922} {"train_loss": -7.3103346824646, "global_step": 206744, "epoch": 4922} {"train_loss": -7.2981085777282715, "global_step": 206745, "epoch": 4922} {"train_loss": -7.387325286865234, "global_step": 206746, "epoch": 4922} {"train_loss": -7.334622859954834, "global_step": 206747, "epoch": 4922} {"train_loss": -7.331662178039551, "global_step": 206748, "epoch": 4922} {"train_loss": -7.274081230163574, "global_step": 206749, "epoch": 4922} {"train_loss": -7.359637260437012, "global_step": 206750, "epoch": 4922} {"train_loss": -7.271344184875488, "global_step": 206751, "epoch": 4922} {"train_loss": -7.295172691345215, "global_step": 206752, "epoch": 4922} {"train_loss": -7.352474689483643, "global_step": 206753, "epoch": 4922} {"train_loss": -7.3387980461120605, "global_step": 206754, "epoch": 4922} {"train_loss": -7.255688667297363, "global_step": 206755, "epoch": 4922} {"train_loss": -7.292479991912842, "global_step": 206756, "epoch": 4922} {"train_loss": -7.4507737159729, "global_step": 206757, "epoch": 4922} {"train_loss": -7.210765361785889, "global_step": 206758, "epoch": 4922} {"train_loss": -7.368520736694336, "global_step": 206759, "epoch": 4922} {"train_loss": -7.289084434509277, "global_step": 206760, "epoch": 4922} {"train_loss": -7.387760639190674, "global_step": 206761, "epoch": 4922} {"train_loss": -7.3049845695495605, "global_step": 206762, "epoch": 4922} {"train_loss": -7.3355560302734375, "global_step": 206763, "epoch": 4922} {"train_loss": -7.234189510345459, "global_step": 206764, "epoch": 4922} {"train_loss": -7.338436308361235, "global_step": 206765, "epoch": 4922, "val_loss": 81797.265625} {"train_loss": -7.452614784240723, "global_step": 206766, "epoch": 4923} {"train_loss": -7.171555042266846, "global_step": 206767, "epoch": 4923} {"train_loss": -7.2320637702941895, "global_step": 206768, "epoch": 4923} {"train_loss": -7.303164482116699, "global_step": 206769, "epoch": 4923} {"train_loss": -7.137930393218994, "global_step": 206770, "epoch": 4923} {"train_loss": -7.386113166809082, "global_step": 206771, "epoch": 4923} {"train_loss": -7.13745641708374, "global_step": 206772, "epoch": 4923} {"train_loss": -7.275336265563965, "global_step": 206773, "epoch": 4923} {"train_loss": -7.316536903381348, "global_step": 206774, "epoch": 4923} {"train_loss": -7.188850402832031, "global_step": 206775, "epoch": 4923} {"train_loss": -7.257824897766113, "global_step": 206776, "epoch": 4923} {"train_loss": -7.165960311889648, "global_step": 206777, "epoch": 4923} {"train_loss": -7.207890510559082, "global_step": 206778, "epoch": 4923} {"train_loss": -7.121808052062988, "global_step": 206779, "epoch": 4923} {"train_loss": -7.093960285186768, "global_step": 206780, "epoch": 4923} {"train_loss": -7.244182586669922, "global_step": 206781, "epoch": 4923} {"train_loss": -7.124843597412109, "global_step": 206782, "epoch": 4923} {"train_loss": -7.222005844116211, "global_step": 206783, "epoch": 4923} {"train_loss": -7.207221031188965, "global_step": 206784, "epoch": 4923} {"train_loss": -7.174690246582031, "global_step": 206785, "epoch": 4923} {"train_loss": -7.272995948791504, "global_step": 206786, "epoch": 4923} {"train_loss": -7.227758407592773, "global_step": 206787, "epoch": 4923} {"train_loss": -7.3106889724731445, "global_step": 206788, "epoch": 4923} {"train_loss": -7.135529518127441, "global_step": 206789, "epoch": 4923} {"train_loss": -7.371252059936523, "global_step": 206790, "epoch": 4923} {"train_loss": -7.293057918548584, "global_step": 206791, "epoch": 4923} {"train_loss": -7.322772026062012, "global_step": 206792, "epoch": 4923} {"train_loss": -7.3606462478637695, "global_step": 206793, "epoch": 4923} {"train_loss": -7.270998954772949, "global_step": 206794, "epoch": 4923} {"train_loss": -7.1182966232299805, "global_step": 206795, "epoch": 4923} {"train_loss": -7.395840167999268, "global_step": 206796, "epoch": 4923} {"train_loss": -7.270140171051025, "global_step": 206797, "epoch": 4923} {"train_loss": -7.38768196105957, "global_step": 206798, "epoch": 4923} {"train_loss": -7.304159641265869, "global_step": 206799, "epoch": 4923} {"train_loss": -7.2909650802612305, "global_step": 206800, "epoch": 4923} {"train_loss": -7.360082149505615, "global_step": 206801, "epoch": 4923} {"train_loss": -7.2510986328125, "global_step": 206802, "epoch": 4923} {"train_loss": -7.399086952209473, "global_step": 206803, "epoch": 4923} {"train_loss": -7.372361660003662, "global_step": 206804, "epoch": 4923} {"train_loss": -7.478672981262207, "global_step": 206805, "epoch": 4923} {"train_loss": -7.356797218322754, "global_step": 206806, "epoch": 4923} {"train_loss": -7.271879593531291, "global_step": 206807, "epoch": 4923, "val_loss": 81976.71875} {"train_loss": -7.433777809143066, "global_step": 206808, "epoch": 4924} {"train_loss": -7.310461521148682, "global_step": 206809, "epoch": 4924} {"train_loss": -7.306313514709473, "global_step": 206810, "epoch": 4924} {"train_loss": -7.346548080444336, "global_step": 206811, "epoch": 4924} {"train_loss": -7.531676292419434, "global_step": 206812, "epoch": 4924} {"train_loss": -7.407952308654785, "global_step": 206813, "epoch": 4924} {"train_loss": -7.441801071166992, "global_step": 206814, "epoch": 4924} {"train_loss": -7.501443862915039, "global_step": 206815, "epoch": 4924} {"train_loss": -7.406859874725342, "global_step": 206816, "epoch": 4924} {"train_loss": -7.3471574783325195, "global_step": 206817, "epoch": 4924} {"train_loss": -7.458199977874756, "global_step": 206818, "epoch": 4924} {"train_loss": -7.3098554611206055, "global_step": 206819, "epoch": 4924} {"train_loss": -7.322234153747559, "global_step": 206820, "epoch": 4924} {"train_loss": -7.433696746826172, "global_step": 206821, "epoch": 4924} {"train_loss": -7.459506511688232, "global_step": 206822, "epoch": 4924} {"train_loss": -7.433393955230713, "global_step": 206823, "epoch": 4924} {"train_loss": -7.365777969360352, "global_step": 206824, "epoch": 4924} {"train_loss": -7.482359409332275, "global_step": 206825, "epoch": 4924} {"train_loss": -7.432801723480225, "global_step": 206826, "epoch": 4924} {"train_loss": -7.434016227722168, "global_step": 206827, "epoch": 4924} {"train_loss": -7.470516204833984, "global_step": 206828, "epoch": 4924} {"train_loss": -7.376247406005859, "global_step": 206829, "epoch": 4924} {"train_loss": -7.376291751861572, "global_step": 206830, "epoch": 4924} {"train_loss": -7.37322473526001, "global_step": 206831, "epoch": 4924} {"train_loss": -7.373246669769287, "global_step": 206832, "epoch": 4924} {"train_loss": -7.29265022277832, "global_step": 206833, "epoch": 4924} {"train_loss": -7.244917869567871, "global_step": 206834, "epoch": 4924} {"train_loss": -7.220947265625, "global_step": 206835, "epoch": 4924} {"train_loss": -7.299055099487305, "global_step": 206836, "epoch": 4924} {"train_loss": -7.10872745513916, "global_step": 206837, "epoch": 4924} {"train_loss": -7.15944766998291, "global_step": 206838, "epoch": 4924} {"train_loss": -7.23211669921875, "global_step": 206839, "epoch": 4924} {"train_loss": -7.124657154083252, "global_step": 206840, "epoch": 4924} {"train_loss": -7.245708465576172, "global_step": 206841, "epoch": 4924} {"train_loss": -7.177059173583984, "global_step": 206842, "epoch": 4924} {"train_loss": -7.146727561950684, "global_step": 206843, "epoch": 4924} {"train_loss": -7.25562858581543, "global_step": 206844, "epoch": 4924} {"train_loss": -7.088842868804932, "global_step": 206845, "epoch": 4924} {"train_loss": -7.192546844482422, "global_step": 206846, "epoch": 4924} {"train_loss": -7.144869804382324, "global_step": 206847, "epoch": 4924} {"train_loss": -7.340134620666504, "global_step": 206848, "epoch": 4924} {"train_loss": -7.325071278072539, "global_step": 206849, "epoch": 4924, "val_loss": 82259.2890625} {"train_loss": -7.259550094604492, "global_step": 206850, "epoch": 4925} {"train_loss": -7.206757545471191, "global_step": 206851, "epoch": 4925} {"train_loss": -7.366856575012207, "global_step": 206852, "epoch": 4925} {"train_loss": -7.299112319946289, "global_step": 206853, "epoch": 4925} {"train_loss": -7.264403343200684, "global_step": 206854, "epoch": 4925} {"train_loss": -7.1449127197265625, "global_step": 206855, "epoch": 4925} {"train_loss": -7.2343549728393555, "global_step": 206856, "epoch": 4925} {"train_loss": -7.254371166229248, "global_step": 206857, "epoch": 4925} {"train_loss": -7.363507270812988, "global_step": 206858, "epoch": 4925} {"train_loss": -7.205344200134277, "global_step": 206859, "epoch": 4925} {"train_loss": -7.255663871765137, "global_step": 206860, "epoch": 4925} {"train_loss": -7.32238245010376, "global_step": 206861, "epoch": 4925} {"train_loss": -7.384786128997803, "global_step": 206862, "epoch": 4925} {"train_loss": -7.243170738220215, "global_step": 206863, "epoch": 4925} {"train_loss": -7.348732948303223, "global_step": 206864, "epoch": 4925} {"train_loss": -7.429281234741211, "global_step": 206865, "epoch": 4925} {"train_loss": -7.25118350982666, "global_step": 206866, "epoch": 4925} {"train_loss": -7.45651388168335, "global_step": 206867, "epoch": 4925} {"train_loss": -7.387706756591797, "global_step": 206868, "epoch": 4925} {"train_loss": -7.415292739868164, "global_step": 206869, "epoch": 4925} {"train_loss": -7.460093975067139, "global_step": 206870, "epoch": 4925} {"train_loss": -7.299056529998779, "global_step": 206871, "epoch": 4925} {"train_loss": -7.2690229415893555, "global_step": 206872, "epoch": 4925} {"train_loss": -7.267712116241455, "global_step": 206873, "epoch": 4925} {"train_loss": -7.34770393371582, "global_step": 206874, "epoch": 4925} {"train_loss": -7.415700912475586, "global_step": 206875, "epoch": 4925} {"train_loss": -7.362493515014648, "global_step": 206876, "epoch": 4925} {"train_loss": -7.283223628997803, "global_step": 206877, "epoch": 4925} {"train_loss": -7.360761642456055, "global_step": 206878, "epoch": 4925} {"train_loss": -7.300583839416504, "global_step": 206879, "epoch": 4925} {"train_loss": -7.3954267501831055, "global_step": 206880, "epoch": 4925} {"train_loss": -7.325716018676758, "global_step": 206881, "epoch": 4925} {"train_loss": -7.416226387023926, "global_step": 206882, "epoch": 4925} {"train_loss": -7.37933349609375, "global_step": 206883, "epoch": 4925} {"train_loss": -7.261751174926758, "global_step": 206884, "epoch": 4925} {"train_loss": -7.15181827545166, "global_step": 206885, "epoch": 4925} {"train_loss": -7.40618896484375, "global_step": 206886, "epoch": 4925} {"train_loss": -7.335729122161865, "global_step": 206887, "epoch": 4925} {"train_loss": -7.283285140991211, "global_step": 206888, "epoch": 4925} {"train_loss": -7.275143623352051, "global_step": 206889, "epoch": 4925} {"train_loss": -7.2256035804748535, "global_step": 206890, "epoch": 4925} {"train_loss": -7.313634100414458, "global_step": 206891, "epoch": 4925, "val_loss": 82175.6015625} {"train_loss": -7.156164646148682, "global_step": 206892, "epoch": 4926} {"train_loss": -7.280991554260254, "global_step": 206893, "epoch": 4926} {"train_loss": -7.043185234069824, "global_step": 206894, "epoch": 4926} {"train_loss": -7.2205095291137695, "global_step": 206895, "epoch": 4926} {"train_loss": -7.2344512939453125, "global_step": 206896, "epoch": 4926} {"train_loss": -7.338235855102539, "global_step": 206897, "epoch": 4926} {"train_loss": -7.161757469177246, "global_step": 206898, "epoch": 4926} {"train_loss": -7.333199977874756, "global_step": 206899, "epoch": 4926} {"train_loss": -7.188140869140625, "global_step": 206900, "epoch": 4926} {"train_loss": -7.268426895141602, "global_step": 206901, "epoch": 4926} {"train_loss": -7.259504795074463, "global_step": 206902, "epoch": 4926} {"train_loss": -7.330887794494629, "global_step": 206903, "epoch": 4926} {"train_loss": -7.260900020599365, "global_step": 206904, "epoch": 4926} {"train_loss": -7.219927787780762, "global_step": 206905, "epoch": 4926} {"train_loss": -7.248485088348389, "global_step": 206906, "epoch": 4926} {"train_loss": -7.36027717590332, "global_step": 206907, "epoch": 4926} {"train_loss": -7.265377998352051, "global_step": 206908, "epoch": 4926} {"train_loss": -7.314432144165039, "global_step": 206909, "epoch": 4926} {"train_loss": -7.2736639976501465, "global_step": 206910, "epoch": 4926} {"train_loss": -7.32562255859375, "global_step": 206911, "epoch": 4926} {"train_loss": -7.295951843261719, "global_step": 206912, "epoch": 4926} {"train_loss": -7.343199729919434, "global_step": 206913, "epoch": 4926} {"train_loss": -7.348717212677002, "global_step": 206914, "epoch": 4926} {"train_loss": -7.287543296813965, "global_step": 206915, "epoch": 4926} {"train_loss": -7.260078430175781, "global_step": 206916, "epoch": 4926} {"train_loss": -7.310858249664307, "global_step": 206917, "epoch": 4926} {"train_loss": -7.274587631225586, "global_step": 206918, "epoch": 4926} {"train_loss": -7.514150619506836, "global_step": 206919, "epoch": 4926} {"train_loss": -7.355573654174805, "global_step": 206920, "epoch": 4926} {"train_loss": -7.361132621765137, "global_step": 206921, "epoch": 4926} {"train_loss": -7.414254188537598, "global_step": 206922, "epoch": 4926} {"train_loss": -7.258785724639893, "global_step": 206923, "epoch": 4926} {"train_loss": -7.395731449127197, "global_step": 206924, "epoch": 4926} {"train_loss": -7.372707366943359, "global_step": 206925, "epoch": 4926} {"train_loss": -7.372837543487549, "global_step": 206926, "epoch": 4926} {"train_loss": -7.344346046447754, "global_step": 206927, "epoch": 4926} {"train_loss": -7.430764198303223, "global_step": 206928, "epoch": 4926} {"train_loss": -7.469692230224609, "global_step": 206929, "epoch": 4926} {"train_loss": -7.316336154937744, "global_step": 206930, "epoch": 4926} {"train_loss": -7.493100166320801, "global_step": 206931, "epoch": 4926} {"train_loss": -7.382918357849121, "global_step": 206932, "epoch": 4926} {"train_loss": -7.310473555610294, "global_step": 206933, "epoch": 4926, "val_loss": 81919.734375} {"train_loss": -7.304836273193359, "global_step": 206934, "epoch": 4927} {"train_loss": -7.411807060241699, "global_step": 206935, "epoch": 4927} {"train_loss": -7.325035095214844, "global_step": 206936, "epoch": 4927} {"train_loss": -7.260171890258789, "global_step": 206937, "epoch": 4927} {"train_loss": -7.358843803405762, "global_step": 206938, "epoch": 4927} {"train_loss": -7.185221195220947, "global_step": 206939, "epoch": 4927} {"train_loss": -7.2368927001953125, "global_step": 206940, "epoch": 4927} {"train_loss": -7.395452499389648, "global_step": 206941, "epoch": 4927} {"train_loss": -7.267816543579102, "global_step": 206942, "epoch": 4927} {"train_loss": -7.235358238220215, "global_step": 206943, "epoch": 4927} {"train_loss": -7.248630523681641, "global_step": 206944, "epoch": 4927} {"train_loss": -7.242309093475342, "global_step": 206945, "epoch": 4927} {"train_loss": -7.320600509643555, "global_step": 206946, "epoch": 4927} {"train_loss": -7.351001262664795, "global_step": 206947, "epoch": 4927} {"train_loss": -7.308385848999023, "global_step": 206948, "epoch": 4927} {"train_loss": -7.2411088943481445, "global_step": 206949, "epoch": 4927} {"train_loss": -7.2697906494140625, "global_step": 206950, "epoch": 4927} {"train_loss": -7.265961170196533, "global_step": 206951, "epoch": 4927} {"train_loss": -7.2024431228637695, "global_step": 206952, "epoch": 4927} {"train_loss": -7.330153942108154, "global_step": 206953, "epoch": 4927} {"train_loss": -7.288920879364014, "global_step": 206954, "epoch": 4927} {"train_loss": -7.378941059112549, "global_step": 206955, "epoch": 4927} {"train_loss": -7.3867082595825195, "global_step": 206956, "epoch": 4927} {"train_loss": -7.328763961791992, "global_step": 206957, "epoch": 4927} {"train_loss": -7.193817138671875, "global_step": 206958, "epoch": 4927} {"train_loss": -7.170600414276123, "global_step": 206959, "epoch": 4927} {"train_loss": -7.356398582458496, "global_step": 206960, "epoch": 4927} {"train_loss": -7.242935657501221, "global_step": 206961, "epoch": 4927} {"train_loss": -7.339351177215576, "global_step": 206962, "epoch": 4927} {"train_loss": -7.357174873352051, "global_step": 206963, "epoch": 4927} {"train_loss": -7.354608535766602, "global_step": 206964, "epoch": 4927} {"train_loss": -7.288313865661621, "global_step": 206965, "epoch": 4927} {"train_loss": -7.378064155578613, "global_step": 206966, "epoch": 4927} {"train_loss": -7.369527816772461, "global_step": 206967, "epoch": 4927} {"train_loss": -7.412841796875, "global_step": 206968, "epoch": 4927} {"train_loss": -7.299599647521973, "global_step": 206969, "epoch": 4927} {"train_loss": -7.282159805297852, "global_step": 206970, "epoch": 4927} {"train_loss": -7.365114688873291, "global_step": 206971, "epoch": 4927} {"train_loss": -7.264308929443359, "global_step": 206972, "epoch": 4927} {"train_loss": -7.376674652099609, "global_step": 206973, "epoch": 4927} {"train_loss": -7.4060821533203125, "global_step": 206974, "epoch": 4927} {"train_loss": -7.30745283762614, "global_step": 206975, "epoch": 4927, "val_loss": 81812.2265625} {"train_loss": -7.380938529968262, "global_step": 206976, "epoch": 4928} {"train_loss": -7.243893623352051, "global_step": 206977, "epoch": 4928} {"train_loss": -7.386791229248047, "global_step": 206978, "epoch": 4928} {"train_loss": -7.315847396850586, "global_step": 206979, "epoch": 4928} {"train_loss": -7.381592273712158, "global_step": 206980, "epoch": 4928} {"train_loss": -7.336345672607422, "global_step": 206981, "epoch": 4928} {"train_loss": -7.290698051452637, "global_step": 206982, "epoch": 4928} {"train_loss": -7.367894172668457, "global_step": 206983, "epoch": 4928} {"train_loss": -7.268754005432129, "global_step": 206984, "epoch": 4928} {"train_loss": -7.409221649169922, "global_step": 206985, "epoch": 4928} {"train_loss": -7.256796836853027, "global_step": 206986, "epoch": 4928} {"train_loss": -7.234278202056885, "global_step": 206987, "epoch": 4928} {"train_loss": -7.3688507080078125, "global_step": 206988, "epoch": 4928} {"train_loss": -7.327378273010254, "global_step": 206989, "epoch": 4928} {"train_loss": -7.403386116027832, "global_step": 206990, "epoch": 4928} {"train_loss": -7.498355865478516, "global_step": 206991, "epoch": 4928} {"train_loss": -7.276469707489014, "global_step": 206992, "epoch": 4928} {"train_loss": -7.360971450805664, "global_step": 206993, "epoch": 4928} {"train_loss": -7.377992630004883, "global_step": 206994, "epoch": 4928} {"train_loss": -7.224508285522461, "global_step": 206995, "epoch": 4928} {"train_loss": -7.268826961517334, "global_step": 206996, "epoch": 4928} {"train_loss": -7.224224090576172, "global_step": 206997, "epoch": 4928} {"train_loss": -7.249202728271484, "global_step": 206998, "epoch": 4928} {"train_loss": -7.254653453826904, "global_step": 206999, "epoch": 4928} {"train_loss": -7.327170372009277, "global_step": 207000, "epoch": 4928} {"train_loss": -7.330491542816162, "global_step": 207001, "epoch": 4928} {"train_loss": -7.20822811126709, "global_step": 207002, "epoch": 4928} {"train_loss": -7.411516189575195, "global_step": 207003, "epoch": 4928} {"train_loss": -7.200679302215576, "global_step": 207004, "epoch": 4928} {"train_loss": -7.332947731018066, "global_step": 207005, "epoch": 4928} {"train_loss": -7.304684638977051, "global_step": 207006, "epoch": 4928} {"train_loss": -7.1920599937438965, "global_step": 207007, "epoch": 4928} {"train_loss": -7.316659450531006, "global_step": 207008, "epoch": 4928} {"train_loss": -7.32139778137207, "global_step": 207009, "epoch": 4928} {"train_loss": -7.414099216461182, "global_step": 207010, "epoch": 4928} {"train_loss": -7.284842014312744, "global_step": 207011, "epoch": 4928} {"train_loss": -7.3166913986206055, "global_step": 207012, "epoch": 4928} {"train_loss": -7.461084365844727, "global_step": 207013, "epoch": 4928} {"train_loss": -7.281436920166016, "global_step": 207014, "epoch": 4928} {"train_loss": -7.404486656188965, "global_step": 207015, "epoch": 4928} {"train_loss": -7.364409446716309, "global_step": 207016, "epoch": 4928} {"train_loss": -7.3195366859436035, "global_step": 207017, "epoch": 4928, "val_loss": 81880.78125} {"train_loss": -7.2761125564575195, "global_step": 207018, "epoch": 4929} {"train_loss": -7.183701038360596, "global_step": 207019, "epoch": 4929} {"train_loss": -7.34871768951416, "global_step": 207020, "epoch": 4929} {"train_loss": -7.193756103515625, "global_step": 207021, "epoch": 4929} {"train_loss": -7.296484470367432, "global_step": 207022, "epoch": 4929} {"train_loss": -7.171669006347656, "global_step": 207023, "epoch": 4929} {"train_loss": -7.17431640625, "global_step": 207024, "epoch": 4929} {"train_loss": -7.3008623123168945, "global_step": 207025, "epoch": 4929} {"train_loss": -7.079768180847168, "global_step": 207026, "epoch": 4929} {"train_loss": -7.279916286468506, "global_step": 207027, "epoch": 4929} {"train_loss": -7.054254055023193, "global_step": 207028, "epoch": 4929} {"train_loss": -7.205788612365723, "global_step": 207029, "epoch": 4929} {"train_loss": -7.106963157653809, "global_step": 207030, "epoch": 4929} {"train_loss": -7.16196870803833, "global_step": 207031, "epoch": 4929} {"train_loss": -7.174709796905518, "global_step": 207032, "epoch": 4929} {"train_loss": -7.139616966247559, "global_step": 207033, "epoch": 4929} {"train_loss": -7.283629894256592, "global_step": 207034, "epoch": 4929} {"train_loss": -7.32382869720459, "global_step": 207035, "epoch": 4929} {"train_loss": -7.290655612945557, "global_step": 207036, "epoch": 4929} {"train_loss": -7.137515544891357, "global_step": 207037, "epoch": 4929} {"train_loss": -7.202773094177246, "global_step": 207038, "epoch": 4929} {"train_loss": -7.171234130859375, "global_step": 207039, "epoch": 4929} {"train_loss": -7.2253875732421875, "global_step": 207040, "epoch": 4929} {"train_loss": -7.275135040283203, "global_step": 207041, "epoch": 4929} {"train_loss": -7.281806468963623, "global_step": 207042, "epoch": 4929} {"train_loss": -7.302166938781738, "global_step": 207043, "epoch": 4929} {"train_loss": -7.3647918701171875, "global_step": 207044, "epoch": 4929} {"train_loss": -7.312539577484131, "global_step": 207045, "epoch": 4929} {"train_loss": -7.404042720794678, "global_step": 207046, "epoch": 4929} {"train_loss": -7.416256904602051, "global_step": 207047, "epoch": 4929} {"train_loss": -7.380543231964111, "global_step": 207048, "epoch": 4929} {"train_loss": -7.3262739181518555, "global_step": 207049, "epoch": 4929} {"train_loss": -7.346793174743652, "global_step": 207050, "epoch": 4929} {"train_loss": -7.237500190734863, "global_step": 207051, "epoch": 4929} {"train_loss": -7.456615924835205, "global_step": 207052, "epoch": 4929} {"train_loss": -7.36331844329834, "global_step": 207053, "epoch": 4929} {"train_loss": -7.311846733093262, "global_step": 207054, "epoch": 4929} {"train_loss": -7.410940170288086, "global_step": 207055, "epoch": 4929} {"train_loss": -7.383639335632324, "global_step": 207056, "epoch": 4929} {"train_loss": -7.475442409515381, "global_step": 207057, "epoch": 4929} {"train_loss": -7.29250431060791, "global_step": 207058, "epoch": 4929} {"train_loss": -7.274943113327026, "global_step": 207059, "epoch": 4929, "val_loss": 81772.5078125} {"train_loss": -7.413856029510498, "global_step": 207060, "epoch": 4930} {"train_loss": -7.311062812805176, "global_step": 207061, "epoch": 4930} {"train_loss": -7.377171039581299, "global_step": 207062, "epoch": 4930} {"train_loss": -7.3100786209106445, "global_step": 207063, "epoch": 4930} {"train_loss": -7.4049882888793945, "global_step": 207064, "epoch": 4930} {"train_loss": -7.290786266326904, "global_step": 207065, "epoch": 4930} {"train_loss": -7.372819900512695, "global_step": 207066, "epoch": 4930} {"train_loss": -7.362773895263672, "global_step": 207067, "epoch": 4930} {"train_loss": -7.292893886566162, "global_step": 207068, "epoch": 4930} {"train_loss": -7.331012725830078, "global_step": 207069, "epoch": 4930} {"train_loss": -7.374834060668945, "global_step": 207070, "epoch": 4930} {"train_loss": -7.108474254608154, "global_step": 207071, "epoch": 4930} {"train_loss": -7.350948810577393, "global_step": 207072, "epoch": 4930} {"train_loss": -7.298694133758545, "global_step": 207073, "epoch": 4930} {"train_loss": -7.299285411834717, "global_step": 207074, "epoch": 4930} {"train_loss": -7.269716262817383, "global_step": 207075, "epoch": 4930} {"train_loss": -7.13901948928833, "global_step": 207076, "epoch": 4930} {"train_loss": -7.44572639465332, "global_step": 207077, "epoch": 4930} {"train_loss": -7.128066062927246, "global_step": 207078, "epoch": 4930} {"train_loss": -7.318539142608643, "global_step": 207079, "epoch": 4930} {"train_loss": -7.130125045776367, "global_step": 207080, "epoch": 4930} {"train_loss": -7.337360858917236, "global_step": 207081, "epoch": 4930} {"train_loss": -7.353964328765869, "global_step": 207082, "epoch": 4930} {"train_loss": -7.167274475097656, "global_step": 207083, "epoch": 4930} {"train_loss": -7.3247575759887695, "global_step": 207084, "epoch": 4930} {"train_loss": -7.242735862731934, "global_step": 207085, "epoch": 4930} {"train_loss": -7.243668079376221, "global_step": 207086, "epoch": 4930} {"train_loss": -7.2804975509643555, "global_step": 207087, "epoch": 4930} {"train_loss": -7.239413261413574, "global_step": 207088, "epoch": 4930} {"train_loss": -7.209707260131836, "global_step": 207089, "epoch": 4930} {"train_loss": -7.330329418182373, "global_step": 207090, "epoch": 4930} {"train_loss": -7.279291152954102, "global_step": 207091, "epoch": 4930} {"train_loss": -7.373722553253174, "global_step": 207092, "epoch": 4930} {"train_loss": -7.383758068084717, "global_step": 207093, "epoch": 4930} {"train_loss": -7.302262783050537, "global_step": 207094, "epoch": 4930} {"train_loss": -7.279388427734375, "global_step": 207095, "epoch": 4930} {"train_loss": -7.317368507385254, "global_step": 207096, "epoch": 4930} {"train_loss": -7.241254806518555, "global_step": 207097, "epoch": 4930} {"train_loss": -7.145256042480469, "global_step": 207098, "epoch": 4930} {"train_loss": -7.189352989196777, "global_step": 207099, "epoch": 4930} {"train_loss": -7.229432106018066, "global_step": 207100, "epoch": 4930} {"train_loss": -7.291347026824951, "global_step": 207101, "epoch": 4930, "val_loss": 81954.1015625} {"train_loss": -7.2868428230285645, "global_step": 207102, "epoch": 4931} {"train_loss": -7.476304054260254, "global_step": 207103, "epoch": 4931} {"train_loss": -7.332500457763672, "global_step": 207104, "epoch": 4931} {"train_loss": -7.282812118530273, "global_step": 207105, "epoch": 4931} {"train_loss": -7.38515567779541, "global_step": 207106, "epoch": 4931} {"train_loss": -7.283147811889648, "global_step": 207107, "epoch": 4931} {"train_loss": -7.416717052459717, "global_step": 207108, "epoch": 4931} {"train_loss": -7.4135847091674805, "global_step": 207109, "epoch": 4931} {"train_loss": -7.201353073120117, "global_step": 207110, "epoch": 4931} {"train_loss": -7.212571144104004, "global_step": 207111, "epoch": 4931} {"train_loss": -7.355295181274414, "global_step": 207112, "epoch": 4931} {"train_loss": -7.194029331207275, "global_step": 207113, "epoch": 4931} {"train_loss": -7.365664005279541, "global_step": 207114, "epoch": 4931} {"train_loss": -7.282403945922852, "global_step": 207115, "epoch": 4931} {"train_loss": -7.294219017028809, "global_step": 207116, "epoch": 4931} {"train_loss": -7.414451599121094, "global_step": 207117, "epoch": 4931} {"train_loss": -7.345597743988037, "global_step": 207118, "epoch": 4931} {"train_loss": -7.197281837463379, "global_step": 207119, "epoch": 4931} {"train_loss": -7.325264930725098, "global_step": 207120, "epoch": 4931} {"train_loss": -7.409196853637695, "global_step": 207121, "epoch": 4931} {"train_loss": -7.330630779266357, "global_step": 207122, "epoch": 4931} {"train_loss": -7.344656467437744, "global_step": 207123, "epoch": 4931} {"train_loss": -7.29585075378418, "global_step": 207124, "epoch": 4931} {"train_loss": -7.342554092407227, "global_step": 207125, "epoch": 4931} {"train_loss": -7.316125869750977, "global_step": 207126, "epoch": 4931} {"train_loss": -7.405590057373047, "global_step": 207127, "epoch": 4931} {"train_loss": -7.30438756942749, "global_step": 207128, "epoch": 4931} {"train_loss": -7.3311357498168945, "global_step": 207129, "epoch": 4931} {"train_loss": -7.337759971618652, "global_step": 207130, "epoch": 4931} {"train_loss": -7.298320770263672, "global_step": 207131, "epoch": 4931} {"train_loss": -7.421769142150879, "global_step": 207132, "epoch": 4931} {"train_loss": -7.302422523498535, "global_step": 207133, "epoch": 4931} {"train_loss": -7.321407318115234, "global_step": 207134, "epoch": 4931} {"train_loss": -7.408724308013916, "global_step": 207135, "epoch": 4931} {"train_loss": -7.304296970367432, "global_step": 207136, "epoch": 4931} {"train_loss": -7.40146541595459, "global_step": 207137, "epoch": 4931} {"train_loss": -7.380551815032959, "global_step": 207138, "epoch": 4931} {"train_loss": -7.298596382141113, "global_step": 207139, "epoch": 4931} {"train_loss": -7.36221170425415, "global_step": 207140, "epoch": 4931} {"train_loss": -7.317006587982178, "global_step": 207141, "epoch": 4931} {"train_loss": -7.298088073730469, "global_step": 207142, "epoch": 4931} {"train_loss": -7.331174714224679, "global_step": 207143, "epoch": 4931, "val_loss": 82128.546875} {"train_loss": -7.220187187194824, "global_step": 207144, "epoch": 4932} {"train_loss": -7.323380947113037, "global_step": 207145, "epoch": 4932} {"train_loss": -7.324628829956055, "global_step": 207146, "epoch": 4932} {"train_loss": -7.39194393157959, "global_step": 207147, "epoch": 4932} {"train_loss": -7.319234848022461, "global_step": 207148, "epoch": 4932} {"train_loss": -7.30183219909668, "global_step": 207149, "epoch": 4932} {"train_loss": -7.378917217254639, "global_step": 207150, "epoch": 4932} {"train_loss": -7.343854904174805, "global_step": 207151, "epoch": 4932} {"train_loss": -7.505120754241943, "global_step": 207152, "epoch": 4932} {"train_loss": -7.272663116455078, "global_step": 207153, "epoch": 4932} {"train_loss": -7.442288875579834, "global_step": 207154, "epoch": 4932} {"train_loss": -7.356971740722656, "global_step": 207155, "epoch": 4932} {"train_loss": -7.283308982849121, "global_step": 207156, "epoch": 4932} {"train_loss": -7.295869827270508, "global_step": 207157, "epoch": 4932} {"train_loss": -7.424130439758301, "global_step": 207158, "epoch": 4932} {"train_loss": -7.321035385131836, "global_step": 207159, "epoch": 4932} {"train_loss": -7.247803688049316, "global_step": 207160, "epoch": 4932} {"train_loss": -7.407986640930176, "global_step": 207161, "epoch": 4932} {"train_loss": -7.350215911865234, "global_step": 207162, "epoch": 4932} {"train_loss": -7.28884220123291, "global_step": 207163, "epoch": 4932} {"train_loss": -7.3797407150268555, "global_step": 207164, "epoch": 4932} {"train_loss": -7.40341854095459, "global_step": 207165, "epoch": 4932} {"train_loss": -7.460279941558838, "global_step": 207166, "epoch": 4932} {"train_loss": -7.3902106285095215, "global_step": 207167, "epoch": 4932} {"train_loss": -7.506201267242432, "global_step": 207168, "epoch": 4932} {"train_loss": -7.46833610534668, "global_step": 207169, "epoch": 4932} {"train_loss": -7.393986701965332, "global_step": 207170, "epoch": 4932} {"train_loss": -7.486264705657959, "global_step": 207171, "epoch": 4932} {"train_loss": -7.3626484870910645, "global_step": 207172, "epoch": 4932} {"train_loss": -7.413155555725098, "global_step": 207173, "epoch": 4932} {"train_loss": -7.329420566558838, "global_step": 207174, "epoch": 4932} {"train_loss": -7.470059394836426, "global_step": 207175, "epoch": 4932} {"train_loss": -7.379834175109863, "global_step": 207176, "epoch": 4932} {"train_loss": -7.4770426750183105, "global_step": 207177, "epoch": 4932} {"train_loss": -7.391836166381836, "global_step": 207178, "epoch": 4932} {"train_loss": -7.443207740783691, "global_step": 207179, "epoch": 4932} {"train_loss": -7.388184070587158, "global_step": 207180, "epoch": 4932} {"train_loss": -7.404027938842773, "global_step": 207181, "epoch": 4932} {"train_loss": -7.280917644500732, "global_step": 207182, "epoch": 4932} {"train_loss": -7.290960311889648, "global_step": 207183, "epoch": 4932} {"train_loss": -7.273334503173828, "global_step": 207184, "epoch": 4932} {"train_loss": -7.371111869812012, "global_step": 207185, "epoch": 4932, "val_loss": 81834.46875} {"train_loss": -7.285721778869629, "global_step": 207186, "epoch": 4933} {"train_loss": -7.408577919006348, "global_step": 207187, "epoch": 4933} {"train_loss": -7.2742085456848145, "global_step": 207188, "epoch": 4933} {"train_loss": -7.289187908172607, "global_step": 207189, "epoch": 4933} {"train_loss": -7.431964874267578, "global_step": 207190, "epoch": 4933} {"train_loss": -7.369219779968262, "global_step": 207191, "epoch": 4933} {"train_loss": -7.51249885559082, "global_step": 207192, "epoch": 4933} {"train_loss": -7.429332733154297, "global_step": 207193, "epoch": 4933} {"train_loss": -7.460073471069336, "global_step": 207194, "epoch": 4933} {"train_loss": -7.401456832885742, "global_step": 207195, "epoch": 4933} {"train_loss": -7.370693206787109, "global_step": 207196, "epoch": 4933} {"train_loss": -7.4712677001953125, "global_step": 207197, "epoch": 4933} {"train_loss": -7.421176910400391, "global_step": 207198, "epoch": 4933} {"train_loss": -7.378230094909668, "global_step": 207199, "epoch": 4933} {"train_loss": -7.508546352386475, "global_step": 207200, "epoch": 4933} {"train_loss": -7.495265007019043, "global_step": 207201, "epoch": 4933} {"train_loss": -7.48792839050293, "global_step": 207202, "epoch": 4933} {"train_loss": -7.408851623535156, "global_step": 207203, "epoch": 4933} {"train_loss": -7.469269752502441, "global_step": 207204, "epoch": 4933} {"train_loss": -7.5846171379089355, "global_step": 207205, "epoch": 4933} {"train_loss": -7.321307182312012, "global_step": 207206, "epoch": 4933} {"train_loss": -7.533542633056641, "global_step": 207207, "epoch": 4933} {"train_loss": -7.432149887084961, "global_step": 207208, "epoch": 4933} {"train_loss": -7.404163360595703, "global_step": 207209, "epoch": 4933} {"train_loss": -7.287599563598633, "global_step": 207210, "epoch": 4933} {"train_loss": -7.376420497894287, "global_step": 207211, "epoch": 4933} {"train_loss": -7.369336128234863, "global_step": 207212, "epoch": 4933} {"train_loss": -7.35700798034668, "global_step": 207213, "epoch": 4933} {"train_loss": -7.403842926025391, "global_step": 207214, "epoch": 4933} {"train_loss": -7.336982727050781, "global_step": 207215, "epoch": 4933} {"train_loss": -7.403341293334961, "global_step": 207216, "epoch": 4933} {"train_loss": -7.288799285888672, "global_step": 207217, "epoch": 4933} {"train_loss": -7.489103317260742, "global_step": 207218, "epoch": 4933} {"train_loss": -7.442193984985352, "global_step": 207219, "epoch": 4933} {"train_loss": -7.371476173400879, "global_step": 207220, "epoch": 4933} {"train_loss": -7.352655410766602, "global_step": 207221, "epoch": 4933} {"train_loss": -7.328929901123047, "global_step": 207222, "epoch": 4933} {"train_loss": -7.2902421951293945, "global_step": 207223, "epoch": 4933} {"train_loss": -7.337252616882324, "global_step": 207224, "epoch": 4933} {"train_loss": -7.344987392425537, "global_step": 207225, "epoch": 4933} {"train_loss": -7.067917823791504, "global_step": 207226, "epoch": 4933} {"train_loss": -7.387372016906738, "global_step": 207227, "epoch": 4933, "val_loss": 82087.1796875} {"train_loss": -7.227490425109863, "global_step": 207228, "epoch": 4934} {"train_loss": -7.045679092407227, "global_step": 207229, "epoch": 4934} {"train_loss": -7.282279968261719, "global_step": 207230, "epoch": 4934} {"train_loss": -7.319018363952637, "global_step": 207231, "epoch": 4934} {"train_loss": -7.233841896057129, "global_step": 207232, "epoch": 4934} {"train_loss": -7.348615646362305, "global_step": 207233, "epoch": 4934} {"train_loss": -7.233148574829102, "global_step": 207234, "epoch": 4934} {"train_loss": -7.282938480377197, "global_step": 207235, "epoch": 4934} {"train_loss": -7.194467544555664, "global_step": 207236, "epoch": 4934} {"train_loss": -7.3591628074646, "global_step": 207237, "epoch": 4934} {"train_loss": -7.403021335601807, "global_step": 207238, "epoch": 4934} {"train_loss": -7.272495269775391, "global_step": 207239, "epoch": 4934} {"train_loss": -7.473658084869385, "global_step": 207240, "epoch": 4934} {"train_loss": -7.318512439727783, "global_step": 207241, "epoch": 4934} {"train_loss": -7.314805030822754, "global_step": 207242, "epoch": 4934} {"train_loss": -7.319875240325928, "global_step": 207243, "epoch": 4934} {"train_loss": -7.362513542175293, "global_step": 207244, "epoch": 4934} {"train_loss": -7.4001359939575195, "global_step": 207245, "epoch": 4934} {"train_loss": -7.314115524291992, "global_step": 207246, "epoch": 4934} {"train_loss": -7.373958587646484, "global_step": 207247, "epoch": 4934} {"train_loss": -7.404822826385498, "global_step": 207248, "epoch": 4934} {"train_loss": -7.353099822998047, "global_step": 207249, "epoch": 4934} {"train_loss": -7.336399078369141, "global_step": 207250, "epoch": 4934} {"train_loss": -7.467558860778809, "global_step": 207251, "epoch": 4934} {"train_loss": -7.360140800476074, "global_step": 207252, "epoch": 4934} {"train_loss": -7.369885444641113, "global_step": 207253, "epoch": 4934} {"train_loss": -7.384690284729004, "global_step": 207254, "epoch": 4934} {"train_loss": -7.353888511657715, "global_step": 207255, "epoch": 4934} {"train_loss": -7.37776517868042, "global_step": 207256, "epoch": 4934} {"train_loss": -7.253993988037109, "global_step": 207257, "epoch": 4934} {"train_loss": -7.285764694213867, "global_step": 207258, "epoch": 4934} {"train_loss": -7.279352188110352, "global_step": 207259, "epoch": 4934} {"train_loss": -7.474158763885498, "global_step": 207260, "epoch": 4934} {"train_loss": -7.462214469909668, "global_step": 207261, "epoch": 4934} {"train_loss": -7.421977996826172, "global_step": 207262, "epoch": 4934} {"train_loss": -7.405097007751465, "global_step": 207263, "epoch": 4934} {"train_loss": -7.269919395446777, "global_step": 207264, "epoch": 4934} {"train_loss": -7.424525260925293, "global_step": 207265, "epoch": 4934} {"train_loss": -7.364149570465088, "global_step": 207266, "epoch": 4934} {"train_loss": -7.4009552001953125, "global_step": 207267, "epoch": 4934} {"train_loss": -7.298652648925781, "global_step": 207268, "epoch": 4934} {"train_loss": -7.335274946121943, "global_step": 207269, "epoch": 4934, "val_loss": 81799.078125} {"train_loss": -7.406400680541992, "global_step": 207270, "epoch": 4935} {"train_loss": -7.371136665344238, "global_step": 207271, "epoch": 4935} {"train_loss": -7.368517875671387, "global_step": 207272, "epoch": 4935} {"train_loss": -7.342995643615723, "global_step": 207273, "epoch": 4935} {"train_loss": -7.3132243156433105, "global_step": 207274, "epoch": 4935} {"train_loss": -7.352365016937256, "global_step": 207275, "epoch": 4935} {"train_loss": -7.262075424194336, "global_step": 207276, "epoch": 4935} {"train_loss": -7.3561110496521, "global_step": 207277, "epoch": 4935} {"train_loss": -7.39023494720459, "global_step": 207278, "epoch": 4935} {"train_loss": -7.276978015899658, "global_step": 207279, "epoch": 4935} {"train_loss": -7.341879367828369, "global_step": 207280, "epoch": 4935} {"train_loss": -7.381685733795166, "global_step": 207281, "epoch": 4935} {"train_loss": -7.327239036560059, "global_step": 207282, "epoch": 4935} {"train_loss": -7.369208335876465, "global_step": 207283, "epoch": 4935} {"train_loss": -7.36052131652832, "global_step": 207284, "epoch": 4935} {"train_loss": -7.423126220703125, "global_step": 207285, "epoch": 4935} {"train_loss": -7.297224521636963, "global_step": 207286, "epoch": 4935} {"train_loss": -7.3513054847717285, "global_step": 207287, "epoch": 4935} {"train_loss": -7.388104438781738, "global_step": 207288, "epoch": 4935} {"train_loss": -7.30824613571167, "global_step": 207289, "epoch": 4935} {"train_loss": -7.250816822052002, "global_step": 207290, "epoch": 4935} {"train_loss": -7.284597396850586, "global_step": 207291, "epoch": 4935} {"train_loss": -7.311435699462891, "global_step": 207292, "epoch": 4935} {"train_loss": -7.392823219299316, "global_step": 207293, "epoch": 4935} {"train_loss": -7.358138084411621, "global_step": 207294, "epoch": 4935} {"train_loss": -7.311337471008301, "global_step": 207295, "epoch": 4935} {"train_loss": -7.410962104797363, "global_step": 207296, "epoch": 4935} {"train_loss": -7.337116718292236, "global_step": 207297, "epoch": 4935} {"train_loss": -7.236537933349609, "global_step": 207298, "epoch": 4935} {"train_loss": -7.337120056152344, "global_step": 207299, "epoch": 4935} {"train_loss": -7.377533912658691, "global_step": 207300, "epoch": 4935} {"train_loss": -7.327037811279297, "global_step": 207301, "epoch": 4935} {"train_loss": -7.379971504211426, "global_step": 207302, "epoch": 4935} {"train_loss": -7.424224853515625, "global_step": 207303, "epoch": 4935} {"train_loss": -7.414070129394531, "global_step": 207304, "epoch": 4935} {"train_loss": -7.332975387573242, "global_step": 207305, "epoch": 4935} {"train_loss": -7.4096808433532715, "global_step": 207306, "epoch": 4935} {"train_loss": -7.385863304138184, "global_step": 207307, "epoch": 4935} {"train_loss": -7.2774434089660645, "global_step": 207308, "epoch": 4935} {"train_loss": -7.372275352478027, "global_step": 207309, "epoch": 4935} {"train_loss": -7.341423988342285, "global_step": 207310, "epoch": 4935} {"train_loss": -7.34912245614188, "global_step": 207311, "epoch": 4935, "val_loss": 82036.375} {"train_loss": -7.332895278930664, "global_step": 207312, "epoch": 4936} {"train_loss": -7.292535305023193, "global_step": 207313, "epoch": 4936} {"train_loss": -7.426433563232422, "global_step": 207314, "epoch": 4936} {"train_loss": -7.378771781921387, "global_step": 207315, "epoch": 4936} {"train_loss": -7.500990867614746, "global_step": 207316, "epoch": 4936} {"train_loss": -7.292111396789551, "global_step": 207317, "epoch": 4936} {"train_loss": -7.390186786651611, "global_step": 207318, "epoch": 4936} {"train_loss": -7.442277908325195, "global_step": 207319, "epoch": 4936} {"train_loss": -7.3069000244140625, "global_step": 207320, "epoch": 4936} {"train_loss": -7.424674987792969, "global_step": 207321, "epoch": 4936} {"train_loss": -7.47248649597168, "global_step": 207322, "epoch": 4936} {"train_loss": -7.413939952850342, "global_step": 207323, "epoch": 4936} {"train_loss": -7.479131698608398, "global_step": 207324, "epoch": 4936} {"train_loss": -7.442166328430176, "global_step": 207325, "epoch": 4936} {"train_loss": -7.306952476501465, "global_step": 207326, "epoch": 4936} {"train_loss": -7.434549331665039, "global_step": 207327, "epoch": 4936} {"train_loss": -7.319011211395264, "global_step": 207328, "epoch": 4936} {"train_loss": -7.3705735206604, "global_step": 207329, "epoch": 4936} {"train_loss": -7.4594526290893555, "global_step": 207330, "epoch": 4936} {"train_loss": -7.341306686401367, "global_step": 207331, "epoch": 4936} {"train_loss": -7.422935485839844, "global_step": 207332, "epoch": 4936} {"train_loss": -7.409235954284668, "global_step": 207333, "epoch": 4936} {"train_loss": -7.485351085662842, "global_step": 207334, "epoch": 4936} {"train_loss": -7.305891990661621, "global_step": 207335, "epoch": 4936} {"train_loss": -7.3337249755859375, "global_step": 207336, "epoch": 4936} {"train_loss": -7.412468433380127, "global_step": 207337, "epoch": 4936} {"train_loss": -7.436681270599365, "global_step": 207338, "epoch": 4936} {"train_loss": -7.360965728759766, "global_step": 207339, "epoch": 4936} {"train_loss": -7.431537628173828, "global_step": 207340, "epoch": 4936} {"train_loss": -7.3144965171813965, "global_step": 207341, "epoch": 4936} {"train_loss": -7.3416290283203125, "global_step": 207342, "epoch": 4936} {"train_loss": -7.462499618530273, "global_step": 207343, "epoch": 4936} {"train_loss": -7.439483642578125, "global_step": 207344, "epoch": 4936} {"train_loss": -7.338747024536133, "global_step": 207345, "epoch": 4936} {"train_loss": -7.361682891845703, "global_step": 207346, "epoch": 4936} {"train_loss": -7.194701671600342, "global_step": 207347, "epoch": 4936} {"train_loss": -7.306478500366211, "global_step": 207348, "epoch": 4936} {"train_loss": -7.274535179138184, "global_step": 207349, "epoch": 4936} {"train_loss": -7.383939743041992, "global_step": 207350, "epoch": 4936} {"train_loss": -7.34595251083374, "global_step": 207351, "epoch": 4936} {"train_loss": -7.367811679840088, "global_step": 207352, "epoch": 4936} {"train_loss": -7.375135137921288, "global_step": 207353, "epoch": 4936, "val_loss": 81999.171875} {"train_loss": -7.427331447601318, "global_step": 207354, "epoch": 4937} {"train_loss": -7.2905778884887695, "global_step": 207355, "epoch": 4937} {"train_loss": -7.338711261749268, "global_step": 207356, "epoch": 4937} {"train_loss": -7.225995063781738, "global_step": 207357, "epoch": 4937} {"train_loss": -7.19378662109375, "global_step": 207358, "epoch": 4937} {"train_loss": -7.3386125564575195, "global_step": 207359, "epoch": 4937} {"train_loss": -7.28425407409668, "global_step": 207360, "epoch": 4937} {"train_loss": -7.258758544921875, "global_step": 207361, "epoch": 4937} {"train_loss": -7.332098007202148, "global_step": 207362, "epoch": 4937} {"train_loss": -7.404801368713379, "global_step": 207363, "epoch": 4937} {"train_loss": -7.250235557556152, "global_step": 207364, "epoch": 4937} {"train_loss": -7.398229122161865, "global_step": 207365, "epoch": 4937} {"train_loss": -7.2352118492126465, "global_step": 207366, "epoch": 4937} {"train_loss": -7.507376670837402, "global_step": 207367, "epoch": 4937} {"train_loss": -7.249743461608887, "global_step": 207368, "epoch": 4937} {"train_loss": -7.342745780944824, "global_step": 207369, "epoch": 4937} {"train_loss": -7.268688201904297, "global_step": 207370, "epoch": 4937} {"train_loss": -7.28442907333374, "global_step": 207371, "epoch": 4937} {"train_loss": -7.367372035980225, "global_step": 207372, "epoch": 4937} {"train_loss": -7.362407684326172, "global_step": 207373, "epoch": 4937} {"train_loss": -7.419782638549805, "global_step": 207374, "epoch": 4937} {"train_loss": -7.301335334777832, "global_step": 207375, "epoch": 4937} {"train_loss": -7.260486602783203, "global_step": 207376, "epoch": 4937} {"train_loss": -7.4020094871521, "global_step": 207377, "epoch": 4937} {"train_loss": -7.33876371383667, "global_step": 207378, "epoch": 4937} {"train_loss": -7.263424873352051, "global_step": 207379, "epoch": 4937} {"train_loss": -7.302951335906982, "global_step": 207380, "epoch": 4937} {"train_loss": -7.335413932800293, "global_step": 207381, "epoch": 4937} {"train_loss": -7.307833194732666, "global_step": 207382, "epoch": 4937} {"train_loss": -7.370297431945801, "global_step": 207383, "epoch": 4937} {"train_loss": -7.241757392883301, "global_step": 207384, "epoch": 4937} {"train_loss": -7.305503845214844, "global_step": 207385, "epoch": 4937} {"train_loss": -7.470256805419922, "global_step": 207386, "epoch": 4937} {"train_loss": -7.3292436599731445, "global_step": 207387, "epoch": 4937} {"train_loss": -7.377780914306641, "global_step": 207388, "epoch": 4937} {"train_loss": -7.388952255249023, "global_step": 207389, "epoch": 4937} {"train_loss": -7.486783027648926, "global_step": 207390, "epoch": 4937} {"train_loss": -7.275792121887207, "global_step": 207391, "epoch": 4937} {"train_loss": -7.43972110748291, "global_step": 207392, "epoch": 4937} {"train_loss": -7.428792953491211, "global_step": 207393, "epoch": 4937} {"train_loss": -7.347569465637207, "global_step": 207394, "epoch": 4937} {"train_loss": -7.336304414839971, "global_step": 207395, "epoch": 4937, "val_loss": 81968.7265625} {"train_loss": -7.369422912597656, "global_step": 207396, "epoch": 4938} {"train_loss": -7.413725852966309, "global_step": 207397, "epoch": 4938} {"train_loss": -7.357189655303955, "global_step": 207398, "epoch": 4938} {"train_loss": -7.3905816078186035, "global_step": 207399, "epoch": 4938} {"train_loss": -7.449915885925293, "global_step": 207400, "epoch": 4938} {"train_loss": -7.472702980041504, "global_step": 207401, "epoch": 4938} {"train_loss": -7.480060577392578, "global_step": 207402, "epoch": 4938} {"train_loss": -7.427323341369629, "global_step": 207403, "epoch": 4938} {"train_loss": -7.443215370178223, "global_step": 207404, "epoch": 4938} {"train_loss": -7.401561260223389, "global_step": 207405, "epoch": 4938} {"train_loss": -7.476302146911621, "global_step": 207406, "epoch": 4938} {"train_loss": -7.33985710144043, "global_step": 207407, "epoch": 4938} {"train_loss": -7.290684223175049, "global_step": 207408, "epoch": 4938} {"train_loss": -7.340167045593262, "global_step": 207409, "epoch": 4938} {"train_loss": -7.36911678314209, "global_step": 207410, "epoch": 4938} {"train_loss": -7.392868995666504, "global_step": 207411, "epoch": 4938} {"train_loss": -7.421763896942139, "global_step": 207412, "epoch": 4938} {"train_loss": -7.392066478729248, "global_step": 207413, "epoch": 4938} {"train_loss": -7.421754360198975, "global_step": 207414, "epoch": 4938} {"train_loss": -7.457718849182129, "global_step": 207415, "epoch": 4938} {"train_loss": -7.486327171325684, "global_step": 207416, "epoch": 4938} {"train_loss": -7.454442024230957, "global_step": 207417, "epoch": 4938} {"train_loss": -7.4280853271484375, "global_step": 207418, "epoch": 4938} {"train_loss": -7.440572738647461, "global_step": 207419, "epoch": 4938} {"train_loss": -7.29259729385376, "global_step": 207420, "epoch": 4938} {"train_loss": -7.255331039428711, "global_step": 207421, "epoch": 4938} {"train_loss": -7.355216979980469, "global_step": 207422, "epoch": 4938} {"train_loss": -7.488157749176025, "global_step": 207423, "epoch": 4938} {"train_loss": -7.343280792236328, "global_step": 207424, "epoch": 4938} {"train_loss": -7.468940734863281, "global_step": 207425, "epoch": 4938} {"train_loss": -7.286320686340332, "global_step": 207426, "epoch": 4938} {"train_loss": -7.361088752746582, "global_step": 207427, "epoch": 4938} {"train_loss": -7.372732639312744, "global_step": 207428, "epoch": 4938} {"train_loss": -7.300462245941162, "global_step": 207429, "epoch": 4938} {"train_loss": -7.325613975524902, "global_step": 207430, "epoch": 4938} {"train_loss": -7.372659206390381, "global_step": 207431, "epoch": 4938} {"train_loss": -7.461118698120117, "global_step": 207432, "epoch": 4938} {"train_loss": -7.21050500869751, "global_step": 207433, "epoch": 4938} {"train_loss": -7.342436790466309, "global_step": 207434, "epoch": 4938} {"train_loss": -7.358057975769043, "global_step": 207435, "epoch": 4938} {"train_loss": -7.364696025848389, "global_step": 207436, "epoch": 4938} {"train_loss": -7.388878050304594, "global_step": 207437, "epoch": 4938, "val_loss": 81871.6015625} {"train_loss": -7.372983455657959, "global_step": 207438, "epoch": 4939} {"train_loss": -7.283371448516846, "global_step": 207439, "epoch": 4939} {"train_loss": -7.3401594161987305, "global_step": 207440, "epoch": 4939} {"train_loss": -7.396892547607422, "global_step": 207441, "epoch": 4939} {"train_loss": -7.200563907623291, "global_step": 207442, "epoch": 4939} {"train_loss": -7.370560646057129, "global_step": 207443, "epoch": 4939} {"train_loss": -7.363826751708984, "global_step": 207444, "epoch": 4939} {"train_loss": -7.269304275512695, "global_step": 207445, "epoch": 4939} {"train_loss": -7.313424110412598, "global_step": 207446, "epoch": 4939} {"train_loss": -7.335597991943359, "global_step": 207447, "epoch": 4939} {"train_loss": -7.20107364654541, "global_step": 207448, "epoch": 4939} {"train_loss": -7.3135271072387695, "global_step": 207449, "epoch": 4939} {"train_loss": -7.197329521179199, "global_step": 207450, "epoch": 4939} {"train_loss": -7.420864105224609, "global_step": 207451, "epoch": 4939} {"train_loss": -7.223391532897949, "global_step": 207452, "epoch": 4939} {"train_loss": -7.142956733703613, "global_step": 207453, "epoch": 4939} {"train_loss": -7.321444511413574, "global_step": 207454, "epoch": 4939} {"train_loss": -7.290306568145752, "global_step": 207455, "epoch": 4939} {"train_loss": -7.273821830749512, "global_step": 207456, "epoch": 4939} {"train_loss": -7.341541290283203, "global_step": 207457, "epoch": 4939} {"train_loss": -7.335176944732666, "global_step": 207458, "epoch": 4939} {"train_loss": -7.365988731384277, "global_step": 207459, "epoch": 4939} {"train_loss": -7.270049095153809, "global_step": 207460, "epoch": 4939} {"train_loss": -7.278279781341553, "global_step": 207461, "epoch": 4939} {"train_loss": -7.32211446762085, "global_step": 207462, "epoch": 4939} {"train_loss": -7.3768391609191895, "global_step": 207463, "epoch": 4939} {"train_loss": -7.505064010620117, "global_step": 207464, "epoch": 4939} {"train_loss": -7.282410144805908, "global_step": 207465, "epoch": 4939} {"train_loss": -7.2583231925964355, "global_step": 207466, "epoch": 4939} {"train_loss": -7.39321231842041, "global_step": 207467, "epoch": 4939} {"train_loss": -7.450153350830078, "global_step": 207468, "epoch": 4939} {"train_loss": -7.317903995513916, "global_step": 207469, "epoch": 4939} {"train_loss": -7.435840606689453, "global_step": 207470, "epoch": 4939} {"train_loss": -7.3030195236206055, "global_step": 207471, "epoch": 4939} {"train_loss": -7.319303512573242, "global_step": 207472, "epoch": 4939} {"train_loss": -7.347691535949707, "global_step": 207473, "epoch": 4939} {"train_loss": -7.493356704711914, "global_step": 207474, "epoch": 4939} {"train_loss": -7.349453926086426, "global_step": 207475, "epoch": 4939} {"train_loss": -7.359066009521484, "global_step": 207476, "epoch": 4939} {"train_loss": -7.360172271728516, "global_step": 207477, "epoch": 4939} {"train_loss": -7.329299449920654, "global_step": 207478, "epoch": 4939} {"train_loss": -7.328835192180815, "global_step": 207479, "epoch": 4939, "val_loss": 81835.2890625} {"train_loss": -7.353701591491699, "global_step": 207480, "epoch": 4940} {"train_loss": -7.265710830688477, "global_step": 207481, "epoch": 4940} {"train_loss": -7.355706691741943, "global_step": 207482, "epoch": 4940} {"train_loss": -7.279445648193359, "global_step": 207483, "epoch": 4940} {"train_loss": -7.392282485961914, "global_step": 207484, "epoch": 4940} {"train_loss": -7.455224990844727, "global_step": 207485, "epoch": 4940} {"train_loss": -7.204184532165527, "global_step": 207486, "epoch": 4940} {"train_loss": -7.452913284301758, "global_step": 207487, "epoch": 4940} {"train_loss": -7.437984943389893, "global_step": 207488, "epoch": 4940} {"train_loss": -7.331077575683594, "global_step": 207489, "epoch": 4940} {"train_loss": -7.2730326652526855, "global_step": 207490, "epoch": 4940} {"train_loss": -7.328643798828125, "global_step": 207491, "epoch": 4940} {"train_loss": -7.326415538787842, "global_step": 207492, "epoch": 4940} {"train_loss": -7.420952796936035, "global_step": 207493, "epoch": 4940} {"train_loss": -7.3981146812438965, "global_step": 207494, "epoch": 4940} {"train_loss": -7.39858865737915, "global_step": 207495, "epoch": 4940} {"train_loss": -7.328353404998779, "global_step": 207496, "epoch": 4940} {"train_loss": -7.3133087158203125, "global_step": 207497, "epoch": 4940} {"train_loss": -7.493546485900879, "global_step": 207498, "epoch": 4940} {"train_loss": -7.350688934326172, "global_step": 207499, "epoch": 4940} {"train_loss": -7.427975654602051, "global_step": 207500, "epoch": 4940} {"train_loss": -7.277969837188721, "global_step": 207501, "epoch": 4940} {"train_loss": -7.30015754699707, "global_step": 207502, "epoch": 4940} {"train_loss": -7.381109237670898, "global_step": 207503, "epoch": 4940} {"train_loss": -7.293441295623779, "global_step": 207504, "epoch": 4940} {"train_loss": -7.457297325134277, "global_step": 207505, "epoch": 4940} {"train_loss": -7.313016891479492, "global_step": 207506, "epoch": 4940} {"train_loss": -7.199692249298096, "global_step": 207507, "epoch": 4940} {"train_loss": -7.437808990478516, "global_step": 207508, "epoch": 4940} {"train_loss": -7.400531768798828, "global_step": 207509, "epoch": 4940} {"train_loss": -7.3871893882751465, "global_step": 207510, "epoch": 4940} {"train_loss": -7.312112331390381, "global_step": 207511, "epoch": 4940} {"train_loss": -7.3471832275390625, "global_step": 207512, "epoch": 4940} {"train_loss": -7.296348571777344, "global_step": 207513, "epoch": 4940} {"train_loss": -7.424870491027832, "global_step": 207514, "epoch": 4940} {"train_loss": -7.323183059692383, "global_step": 207515, "epoch": 4940} {"train_loss": -7.503302574157715, "global_step": 207516, "epoch": 4940} {"train_loss": -7.335891246795654, "global_step": 207517, "epoch": 4940} {"train_loss": -7.31804895401001, "global_step": 207518, "epoch": 4940} {"train_loss": -7.373129844665527, "global_step": 207519, "epoch": 4940} {"train_loss": -7.2707366943359375, "global_step": 207520, "epoch": 4940} {"train_loss": -7.353170996620541, "global_step": 207521, "epoch": 4940, "val_loss": 81917.5078125} {"train_loss": -7.519459247589111, "global_step": 207522, "epoch": 4941} {"train_loss": -7.3154497146606445, "global_step": 207523, "epoch": 4941} {"train_loss": -7.3809895515441895, "global_step": 207524, "epoch": 4941} {"train_loss": -7.355406284332275, "global_step": 207525, "epoch": 4941} {"train_loss": -7.393415927886963, "global_step": 207526, "epoch": 4941} {"train_loss": -7.396210193634033, "global_step": 207527, "epoch": 4941} {"train_loss": -7.355269908905029, "global_step": 207528, "epoch": 4941} {"train_loss": -7.4151835441589355, "global_step": 207529, "epoch": 4941} {"train_loss": -7.313368797302246, "global_step": 207530, "epoch": 4941} {"train_loss": -7.361690998077393, "global_step": 207531, "epoch": 4941} {"train_loss": -7.398324489593506, "global_step": 207532, "epoch": 4941} {"train_loss": -7.3775634765625, "global_step": 207533, "epoch": 4941} {"train_loss": -7.435138702392578, "global_step": 207534, "epoch": 4941} {"train_loss": -7.493616580963135, "global_step": 207535, "epoch": 4941} {"train_loss": -7.329662799835205, "global_step": 207536, "epoch": 4941} {"train_loss": -7.436834335327148, "global_step": 207537, "epoch": 4941} {"train_loss": -7.449227333068848, "global_step": 207538, "epoch": 4941} {"train_loss": -7.447484016418457, "global_step": 207539, "epoch": 4941} {"train_loss": -7.42304801940918, "global_step": 207540, "epoch": 4941} {"train_loss": -7.334726810455322, "global_step": 207541, "epoch": 4941} {"train_loss": -7.475553512573242, "global_step": 207542, "epoch": 4941} {"train_loss": -7.472496032714844, "global_step": 207543, "epoch": 4941} {"train_loss": -7.25516414642334, "global_step": 207544, "epoch": 4941} {"train_loss": -7.458794593811035, "global_step": 207545, "epoch": 4941} {"train_loss": -7.37467622756958, "global_step": 207546, "epoch": 4941} {"train_loss": -7.447500228881836, "global_step": 207547, "epoch": 4941} {"train_loss": -7.345353126525879, "global_step": 207548, "epoch": 4941} {"train_loss": -7.334991455078125, "global_step": 207549, "epoch": 4941} {"train_loss": -7.384631156921387, "global_step": 207550, "epoch": 4941} {"train_loss": -7.298274517059326, "global_step": 207551, "epoch": 4941} {"train_loss": -7.285787582397461, "global_step": 207552, "epoch": 4941} {"train_loss": -7.225533485412598, "global_step": 207553, "epoch": 4941} {"train_loss": -7.3201799392700195, "global_step": 207554, "epoch": 4941} {"train_loss": -7.485227108001709, "global_step": 207555, "epoch": 4941} {"train_loss": -7.405245780944824, "global_step": 207556, "epoch": 4941} {"train_loss": -7.263186454772949, "global_step": 207557, "epoch": 4941} {"train_loss": -7.377915382385254, "global_step": 207558, "epoch": 4941} {"train_loss": -7.192830562591553, "global_step": 207559, "epoch": 4941} {"train_loss": -7.3541669845581055, "global_step": 207560, "epoch": 4941} {"train_loss": -7.267179012298584, "global_step": 207561, "epoch": 4941} {"train_loss": -7.362123489379883, "global_step": 207562, "epoch": 4941} {"train_loss": -7.37348290852138, "global_step": 207563, "epoch": 4941, "val_loss": 81931.6640625} {"train_loss": -7.290759563446045, "global_step": 207564, "epoch": 4942} {"train_loss": -7.3591532707214355, "global_step": 207565, "epoch": 4942} {"train_loss": -7.302066802978516, "global_step": 207566, "epoch": 4942} {"train_loss": -7.354082107543945, "global_step": 207567, "epoch": 4942} {"train_loss": -7.356807708740234, "global_step": 207568, "epoch": 4942} {"train_loss": -7.292398452758789, "global_step": 207569, "epoch": 4942} {"train_loss": -7.395334720611572, "global_step": 207570, "epoch": 4942} {"train_loss": -7.365928649902344, "global_step": 207571, "epoch": 4942} {"train_loss": -7.39483642578125, "global_step": 207572, "epoch": 4942} {"train_loss": -7.325558662414551, "global_step": 207573, "epoch": 4942} {"train_loss": -7.300576686859131, "global_step": 207574, "epoch": 4942} {"train_loss": -7.272373199462891, "global_step": 207575, "epoch": 4942} {"train_loss": -7.441115379333496, "global_step": 207576, "epoch": 4942} {"train_loss": -7.260293960571289, "global_step": 207577, "epoch": 4942} {"train_loss": -7.3034987449646, "global_step": 207578, "epoch": 4942} {"train_loss": -7.387838363647461, "global_step": 207579, "epoch": 4942} {"train_loss": -7.191445350646973, "global_step": 207580, "epoch": 4942} {"train_loss": -7.254897117614746, "global_step": 207581, "epoch": 4942} {"train_loss": -7.437506675720215, "global_step": 207582, "epoch": 4942} {"train_loss": -7.302443981170654, "global_step": 207583, "epoch": 4942} {"train_loss": -7.347919464111328, "global_step": 207584, "epoch": 4942} {"train_loss": -7.323863983154297, "global_step": 207585, "epoch": 4942} {"train_loss": -7.211844444274902, "global_step": 207586, "epoch": 4942} {"train_loss": -7.226461887359619, "global_step": 207587, "epoch": 4942} {"train_loss": -7.297449111938477, "global_step": 207588, "epoch": 4942} {"train_loss": -7.240421295166016, "global_step": 207589, "epoch": 4942} {"train_loss": -7.149560928344727, "global_step": 207590, "epoch": 4942} {"train_loss": -7.254416465759277, "global_step": 207591, "epoch": 4942} {"train_loss": -7.274805068969727, "global_step": 207592, "epoch": 4942} {"train_loss": -7.20572566986084, "global_step": 207593, "epoch": 4942} {"train_loss": -7.375251770019531, "global_step": 207594, "epoch": 4942} {"train_loss": -7.1215105056762695, "global_step": 207595, "epoch": 4942} {"train_loss": -7.338276386260986, "global_step": 207596, "epoch": 4942} {"train_loss": -7.112278461456299, "global_step": 207597, "epoch": 4942} {"train_loss": -7.286843299865723, "global_step": 207598, "epoch": 4942} {"train_loss": -7.215908050537109, "global_step": 207599, "epoch": 4942} {"train_loss": -7.308191776275635, "global_step": 207600, "epoch": 4942} {"train_loss": -7.271794319152832, "global_step": 207601, "epoch": 4942} {"train_loss": -7.282423973083496, "global_step": 207602, "epoch": 4942} {"train_loss": -7.3058552742004395, "global_step": 207603, "epoch": 4942} {"train_loss": -7.257233142852783, "global_step": 207604, "epoch": 4942} {"train_loss": -7.2929026399339945, "global_step": 207605, "epoch": 4942, "val_loss": 81758.375} {"train_loss": -7.366404056549072, "global_step": 207606, "epoch": 4943} {"train_loss": -7.307033538818359, "global_step": 207607, "epoch": 4943} {"train_loss": -7.2645745277404785, "global_step": 207608, "epoch": 4943} {"train_loss": -7.428516387939453, "global_step": 207609, "epoch": 4943} {"train_loss": -7.268315315246582, "global_step": 207610, "epoch": 4943} {"train_loss": -7.389087677001953, "global_step": 207611, "epoch": 4943} {"train_loss": -7.370428085327148, "global_step": 207612, "epoch": 4943} {"train_loss": -7.270578384399414, "global_step": 207613, "epoch": 4943} {"train_loss": -7.386258602142334, "global_step": 207614, "epoch": 4943} {"train_loss": -7.404518127441406, "global_step": 207615, "epoch": 4943} {"train_loss": -7.37175989151001, "global_step": 207616, "epoch": 4943} {"train_loss": -7.347848892211914, "global_step": 207617, "epoch": 4943} {"train_loss": -7.403182029724121, "global_step": 207618, "epoch": 4943} {"train_loss": -7.404149055480957, "global_step": 207619, "epoch": 4943} {"train_loss": -7.4740471839904785, "global_step": 207620, "epoch": 4943} {"train_loss": -7.361330986022949, "global_step": 207621, "epoch": 4943} {"train_loss": -7.316161155700684, "global_step": 207622, "epoch": 4943} {"train_loss": -7.234055519104004, "global_step": 207623, "epoch": 4943} {"train_loss": -7.296003341674805, "global_step": 207624, "epoch": 4943} {"train_loss": -7.324275493621826, "global_step": 207625, "epoch": 4943} {"train_loss": -7.28400993347168, "global_step": 207626, "epoch": 4943} {"train_loss": -7.211367607116699, "global_step": 207627, "epoch": 4943} {"train_loss": -7.359129905700684, "global_step": 207628, "epoch": 4943} {"train_loss": -7.325057029724121, "global_step": 207629, "epoch": 4943} {"train_loss": -7.228791236877441, "global_step": 207630, "epoch": 4943} {"train_loss": -7.326066017150879, "global_step": 207631, "epoch": 4943} {"train_loss": -7.297939300537109, "global_step": 207632, "epoch": 4943} {"train_loss": -7.453797340393066, "global_step": 207633, "epoch": 4943} {"train_loss": -7.344113826751709, "global_step": 207634, "epoch": 4943} {"train_loss": -7.396362781524658, "global_step": 207635, "epoch": 4943} {"train_loss": -7.389642715454102, "global_step": 207636, "epoch": 4943} {"train_loss": -7.371615409851074, "global_step": 207637, "epoch": 4943} {"train_loss": -7.462981700897217, "global_step": 207638, "epoch": 4943} {"train_loss": -7.3596343994140625, "global_step": 207639, "epoch": 4943} {"train_loss": -7.441011428833008, "global_step": 207640, "epoch": 4943} {"train_loss": -7.436460018157959, "global_step": 207641, "epoch": 4943} {"train_loss": -7.425273895263672, "global_step": 207642, "epoch": 4943} {"train_loss": -7.436871528625488, "global_step": 207643, "epoch": 4943} {"train_loss": -7.3941521644592285, "global_step": 207644, "epoch": 4943} {"train_loss": -7.419641494750977, "global_step": 207645, "epoch": 4943} {"train_loss": -7.479735374450684, "global_step": 207646, "epoch": 4943} {"train_loss": -7.36141468229748, "global_step": 207647, "epoch": 4943, "val_loss": 81865.546875} {"train_loss": -7.395881652832031, "global_step": 207648, "epoch": 4944} {"train_loss": -7.490267753601074, "global_step": 207649, "epoch": 4944} {"train_loss": -7.473940849304199, "global_step": 207650, "epoch": 4944} {"train_loss": -7.373636245727539, "global_step": 207651, "epoch": 4944} {"train_loss": -7.372468948364258, "global_step": 207652, "epoch": 4944} {"train_loss": -7.470776557922363, "global_step": 207653, "epoch": 4944} {"train_loss": -7.4705963134765625, "global_step": 207654, "epoch": 4944} {"train_loss": -7.434390068054199, "global_step": 207655, "epoch": 4944} {"train_loss": -7.351426124572754, "global_step": 207656, "epoch": 4944} {"train_loss": -7.314939498901367, "global_step": 207657, "epoch": 4944} {"train_loss": -7.418966293334961, "global_step": 207658, "epoch": 4944} {"train_loss": -7.159335136413574, "global_step": 207659, "epoch": 4944} {"train_loss": -7.232093811035156, "global_step": 207660, "epoch": 4944} {"train_loss": -7.435924053192139, "global_step": 207661, "epoch": 4944} {"train_loss": -7.374878883361816, "global_step": 207662, "epoch": 4944} {"train_loss": -6.983244895935059, "global_step": 207663, "epoch": 4944} {"train_loss": -7.213365077972412, "global_step": 207664, "epoch": 4944} {"train_loss": -7.314859390258789, "global_step": 207665, "epoch": 4944} {"train_loss": -7.083125114440918, "global_step": 207666, "epoch": 4944} {"train_loss": -7.220701217651367, "global_step": 207667, "epoch": 4944} {"train_loss": -7.148310661315918, "global_step": 207668, "epoch": 4944} {"train_loss": -7.140031814575195, "global_step": 207669, "epoch": 4944} {"train_loss": -7.22718620300293, "global_step": 207670, "epoch": 4944} {"train_loss": -7.099399566650391, "global_step": 207671, "epoch": 4944} {"train_loss": -7.20734977722168, "global_step": 207672, "epoch": 4944} {"train_loss": -7.117342948913574, "global_step": 207673, "epoch": 4944} {"train_loss": -7.248317718505859, "global_step": 207674, "epoch": 4944} {"train_loss": -7.289750099182129, "global_step": 207675, "epoch": 4944} {"train_loss": -7.233591079711914, "global_step": 207676, "epoch": 4944} {"train_loss": -7.219167709350586, "global_step": 207677, "epoch": 4944} {"train_loss": -7.193168640136719, "global_step": 207678, "epoch": 4944} {"train_loss": -7.201441764831543, "global_step": 207679, "epoch": 4944} {"train_loss": -7.265233993530273, "global_step": 207680, "epoch": 4944} {"train_loss": -7.18796443939209, "global_step": 207681, "epoch": 4944} {"train_loss": -7.262016296386719, "global_step": 207682, "epoch": 4944} {"train_loss": -7.226119041442871, "global_step": 207683, "epoch": 4944} {"train_loss": -7.17116641998291, "global_step": 207684, "epoch": 4944} {"train_loss": -7.268298625946045, "global_step": 207685, "epoch": 4944} {"train_loss": -7.319635391235352, "global_step": 207686, "epoch": 4944} {"train_loss": -7.230188369750977, "global_step": 207687, "epoch": 4944} {"train_loss": -7.166329383850098, "global_step": 207688, "epoch": 4944} {"train_loss": -7.268661317371187, "global_step": 207689, "epoch": 4944, "val_loss": 81865.8203125} {"train_loss": -7.269863128662109, "global_step": 207690, "epoch": 4945} {"train_loss": -7.344049453735352, "global_step": 207691, "epoch": 4945} {"train_loss": -7.290804862976074, "global_step": 207692, "epoch": 4945} {"train_loss": -7.388341903686523, "global_step": 207693, "epoch": 4945} {"train_loss": -7.408417701721191, "global_step": 207694, "epoch": 4945} {"train_loss": -7.33553409576416, "global_step": 207695, "epoch": 4945} {"train_loss": -7.308056354522705, "global_step": 207696, "epoch": 4945} {"train_loss": -7.296272277832031, "global_step": 207697, "epoch": 4945} {"train_loss": -7.3645920753479, "global_step": 207698, "epoch": 4945} {"train_loss": -7.3600897789001465, "global_step": 207699, "epoch": 4945} {"train_loss": -7.251914024353027, "global_step": 207700, "epoch": 4945} {"train_loss": -7.270479202270508, "global_step": 207701, "epoch": 4945} {"train_loss": -7.39675235748291, "global_step": 207702, "epoch": 4945} {"train_loss": -7.345776081085205, "global_step": 207703, "epoch": 4945} {"train_loss": -7.353711128234863, "global_step": 207704, "epoch": 4945} {"train_loss": -7.4782209396362305, "global_step": 207705, "epoch": 4945} {"train_loss": -7.356175422668457, "global_step": 207706, "epoch": 4945} {"train_loss": -7.329308032989502, "global_step": 207707, "epoch": 4945} {"train_loss": -7.2654571533203125, "global_step": 207708, "epoch": 4945} {"train_loss": -7.33380651473999, "global_step": 207709, "epoch": 4945} {"train_loss": -7.406246185302734, "global_step": 207710, "epoch": 4945} {"train_loss": -7.30613899230957, "global_step": 207711, "epoch": 4945} {"train_loss": -7.339564323425293, "global_step": 207712, "epoch": 4945} {"train_loss": -7.380219459533691, "global_step": 207713, "epoch": 4945} {"train_loss": -7.317582130432129, "global_step": 207714, "epoch": 4945} {"train_loss": -7.386699199676514, "global_step": 207715, "epoch": 4945} {"train_loss": -7.325214385986328, "global_step": 207716, "epoch": 4945} {"train_loss": -7.306663513183594, "global_step": 207717, "epoch": 4945} {"train_loss": -7.354145050048828, "global_step": 207718, "epoch": 4945} {"train_loss": -7.342574119567871, "global_step": 207719, "epoch": 4945} {"train_loss": -7.307163238525391, "global_step": 207720, "epoch": 4945} {"train_loss": -7.489048480987549, "global_step": 207721, "epoch": 4945} {"train_loss": -7.429625511169434, "global_step": 207722, "epoch": 4945} {"train_loss": -7.368811130523682, "global_step": 207723, "epoch": 4945} {"train_loss": -7.3784284591674805, "global_step": 207724, "epoch": 4945} {"train_loss": -7.381280422210693, "global_step": 207725, "epoch": 4945} {"train_loss": -7.301277160644531, "global_step": 207726, "epoch": 4945} {"train_loss": -7.392331123352051, "global_step": 207727, "epoch": 4945} {"train_loss": -7.247373104095459, "global_step": 207728, "epoch": 4945} {"train_loss": -7.342552185058594, "global_step": 207729, "epoch": 4945} {"train_loss": -7.397282600402832, "global_step": 207730, "epoch": 4945} {"train_loss": -7.347346317200434, "global_step": 207731, "epoch": 4945, "val_loss": 82206.3046875} {"train_loss": -7.438508987426758, "global_step": 207732, "epoch": 4946} {"train_loss": -7.384486198425293, "global_step": 207733, "epoch": 4946} {"train_loss": -7.25771427154541, "global_step": 207734, "epoch": 4946} {"train_loss": -7.379828453063965, "global_step": 207735, "epoch": 4946} {"train_loss": -7.395795822143555, "global_step": 207736, "epoch": 4946} {"train_loss": -7.356877326965332, "global_step": 207737, "epoch": 4946} {"train_loss": -7.4972429275512695, "global_step": 207738, "epoch": 4946} {"train_loss": -7.330493927001953, "global_step": 207739, "epoch": 4946} {"train_loss": -7.412444114685059, "global_step": 207740, "epoch": 4946} {"train_loss": -7.298110485076904, "global_step": 207741, "epoch": 4946} {"train_loss": -7.37326192855835, "global_step": 207742, "epoch": 4946} {"train_loss": -7.397321701049805, "global_step": 207743, "epoch": 4946} {"train_loss": -7.180233955383301, "global_step": 207744, "epoch": 4946} {"train_loss": -7.191296577453613, "global_step": 207745, "epoch": 4946} {"train_loss": -7.376768112182617, "global_step": 207746, "epoch": 4946} {"train_loss": -7.309825897216797, "global_step": 207747, "epoch": 4946} {"train_loss": -7.257434368133545, "global_step": 207748, "epoch": 4946} {"train_loss": -7.389045715332031, "global_step": 207749, "epoch": 4946} {"train_loss": -7.201696872711182, "global_step": 207750, "epoch": 4946} {"train_loss": -7.3333611488342285, "global_step": 207751, "epoch": 4946} {"train_loss": -7.310889720916748, "global_step": 207752, "epoch": 4946} {"train_loss": -7.333826065063477, "global_step": 207753, "epoch": 4946} {"train_loss": -7.326821327209473, "global_step": 207754, "epoch": 4946} {"train_loss": -7.241212844848633, "global_step": 207755, "epoch": 4946} {"train_loss": -7.212810516357422, "global_step": 207756, "epoch": 4946} {"train_loss": -7.268540382385254, "global_step": 207757, "epoch": 4946} {"train_loss": -7.304472923278809, "global_step": 207758, "epoch": 4946} {"train_loss": -7.269068241119385, "global_step": 207759, "epoch": 4946} {"train_loss": -7.393321990966797, "global_step": 207760, "epoch": 4946} {"train_loss": -7.293759346008301, "global_step": 207761, "epoch": 4946} {"train_loss": -7.506141662597656, "global_step": 207762, "epoch": 4946} {"train_loss": -7.332869529724121, "global_step": 207763, "epoch": 4946} {"train_loss": -7.318673133850098, "global_step": 207764, "epoch": 4946} {"train_loss": -7.281017303466797, "global_step": 207765, "epoch": 4946} {"train_loss": -7.243265628814697, "global_step": 207766, "epoch": 4946} {"train_loss": -7.291635990142822, "global_step": 207767, "epoch": 4946} {"train_loss": -7.324634075164795, "global_step": 207768, "epoch": 4946} {"train_loss": -7.2918500900268555, "global_step": 207769, "epoch": 4946} {"train_loss": -7.286561012268066, "global_step": 207770, "epoch": 4946} {"train_loss": -7.387884616851807, "global_step": 207771, "epoch": 4946} {"train_loss": -7.26877498626709, "global_step": 207772, "epoch": 4946} {"train_loss": -7.321999231974284, "global_step": 207773, "epoch": 4946, "val_loss": 81745.9609375} {"train_loss": -7.2968621253967285, "global_step": 207774, "epoch": 4947} {"train_loss": -7.227971076965332, "global_step": 207775, "epoch": 4947} {"train_loss": -7.336548805236816, "global_step": 207776, "epoch": 4947} {"train_loss": -7.25216007232666, "global_step": 207777, "epoch": 4947} {"train_loss": -7.220162391662598, "global_step": 207778, "epoch": 4947} {"train_loss": -7.1467390060424805, "global_step": 207779, "epoch": 4947} {"train_loss": -7.125637054443359, "global_step": 207780, "epoch": 4947} {"train_loss": -7.419085502624512, "global_step": 207781, "epoch": 4947} {"train_loss": -7.206429958343506, "global_step": 207782, "epoch": 4947} {"train_loss": -7.429305553436279, "global_step": 207783, "epoch": 4947} {"train_loss": -7.289967060089111, "global_step": 207784, "epoch": 4947} {"train_loss": -7.335575103759766, "global_step": 207785, "epoch": 4947} {"train_loss": -7.286664962768555, "global_step": 207786, "epoch": 4947} {"train_loss": -7.256419658660889, "global_step": 207787, "epoch": 4947} {"train_loss": -7.357425212860107, "global_step": 207788, "epoch": 4947} {"train_loss": -7.166363716125488, "global_step": 207789, "epoch": 4947} {"train_loss": -7.366583824157715, "global_step": 207790, "epoch": 4947} {"train_loss": -7.225318908691406, "global_step": 207791, "epoch": 4947} {"train_loss": -7.1859941482543945, "global_step": 207792, "epoch": 4947} {"train_loss": -7.171059608459473, "global_step": 207793, "epoch": 4947} {"train_loss": -7.207040786743164, "global_step": 207794, "epoch": 4947} {"train_loss": -7.3233537673950195, "global_step": 207795, "epoch": 4947} {"train_loss": -7.388430595397949, "global_step": 207796, "epoch": 4947} {"train_loss": -7.243900299072266, "global_step": 207797, "epoch": 4947} {"train_loss": -7.293517112731934, "global_step": 207798, "epoch": 4947} {"train_loss": -7.248205184936523, "global_step": 207799, "epoch": 4947} {"train_loss": -7.277519702911377, "global_step": 207800, "epoch": 4947} {"train_loss": -7.245656967163086, "global_step": 207801, "epoch": 4947} {"train_loss": -7.2538557052612305, "global_step": 207802, "epoch": 4947} {"train_loss": -7.288518905639648, "global_step": 207803, "epoch": 4947} {"train_loss": -7.355654239654541, "global_step": 207804, "epoch": 4947} {"train_loss": -7.341168403625488, "global_step": 207805, "epoch": 4947} {"train_loss": -7.372525215148926, "global_step": 207806, "epoch": 4947} {"train_loss": -7.30034065246582, "global_step": 207807, "epoch": 4947} {"train_loss": -7.3329339027404785, "global_step": 207808, "epoch": 4947} {"train_loss": -7.291082382202148, "global_step": 207809, "epoch": 4947} {"train_loss": -7.255339622497559, "global_step": 207810, "epoch": 4947} {"train_loss": -7.312488079071045, "global_step": 207811, "epoch": 4947} {"train_loss": -7.334071636199951, "global_step": 207812, "epoch": 4947} {"train_loss": -7.425003528594971, "global_step": 207813, "epoch": 4947} {"train_loss": -7.279307842254639, "global_step": 207814, "epoch": 4947} {"train_loss": -7.286877711613973, "global_step": 207815, "epoch": 4947, "val_loss": 81824.1484375} {"train_loss": -7.368514060974121, "global_step": 207816, "epoch": 4948} {"train_loss": -7.347771644592285, "global_step": 207817, "epoch": 4948} {"train_loss": -7.390985488891602, "global_step": 207818, "epoch": 4948} {"train_loss": -7.4271650314331055, "global_step": 207819, "epoch": 4948} {"train_loss": -7.312599182128906, "global_step": 207820, "epoch": 4948} {"train_loss": -7.241516590118408, "global_step": 207821, "epoch": 4948} {"train_loss": -7.340272903442383, "global_step": 207822, "epoch": 4948} {"train_loss": -7.2501325607299805, "global_step": 207823, "epoch": 4948} {"train_loss": -7.4763994216918945, "global_step": 207824, "epoch": 4948} {"train_loss": -7.368721961975098, "global_step": 207825, "epoch": 4948} {"train_loss": -7.3570356369018555, "global_step": 207826, "epoch": 4948} {"train_loss": -7.373940944671631, "global_step": 207827, "epoch": 4948} {"train_loss": -7.344033241271973, "global_step": 207828, "epoch": 4948} {"train_loss": -7.458454132080078, "global_step": 207829, "epoch": 4948} {"train_loss": -7.380465507507324, "global_step": 207830, "epoch": 4948} {"train_loss": -7.294208526611328, "global_step": 207831, "epoch": 4948} {"train_loss": -7.399160385131836, "global_step": 207832, "epoch": 4948} {"train_loss": -7.444199562072754, "global_step": 207833, "epoch": 4948} {"train_loss": -7.329822063446045, "global_step": 207834, "epoch": 4948} {"train_loss": -7.335089683532715, "global_step": 207835, "epoch": 4948} {"train_loss": -7.4149274826049805, "global_step": 207836, "epoch": 4948} {"train_loss": -7.339545726776123, "global_step": 207837, "epoch": 4948} {"train_loss": -7.3474249839782715, "global_step": 207838, "epoch": 4948} {"train_loss": -7.374164581298828, "global_step": 207839, "epoch": 4948} {"train_loss": -7.321931838989258, "global_step": 207840, "epoch": 4948} {"train_loss": -7.427555561065674, "global_step": 207841, "epoch": 4948} {"train_loss": -7.448861598968506, "global_step": 207842, "epoch": 4948} {"train_loss": -7.368627548217773, "global_step": 207843, "epoch": 4948} {"train_loss": -7.26266622543335, "global_step": 207844, "epoch": 4948} {"train_loss": -7.26611328125, "global_step": 207845, "epoch": 4948} {"train_loss": -7.329848766326904, "global_step": 207846, "epoch": 4948} {"train_loss": -7.320570945739746, "global_step": 207847, "epoch": 4948} {"train_loss": -7.29007625579834, "global_step": 207848, "epoch": 4948} {"train_loss": -7.3670454025268555, "global_step": 207849, "epoch": 4948} {"train_loss": -7.247941017150879, "global_step": 207850, "epoch": 4948} {"train_loss": -7.342238426208496, "global_step": 207851, "epoch": 4948} {"train_loss": -7.415909767150879, "global_step": 207852, "epoch": 4948} {"train_loss": -7.420711040496826, "global_step": 207853, "epoch": 4948} {"train_loss": -7.444799423217773, "global_step": 207854, "epoch": 4948} {"train_loss": -7.360660552978516, "global_step": 207855, "epoch": 4948} {"train_loss": -7.413127899169922, "global_step": 207856, "epoch": 4948} {"train_loss": -7.358718724477859, "global_step": 207857, "epoch": 4948, "val_loss": 81878.625} {"train_loss": -7.439488887786865, "global_step": 207858, "epoch": 4949} {"train_loss": -7.3877692222595215, "global_step": 207859, "epoch": 4949} {"train_loss": -7.38264274597168, "global_step": 207860, "epoch": 4949} {"train_loss": -7.375368118286133, "global_step": 207861, "epoch": 4949} {"train_loss": -7.295185565948486, "global_step": 207862, "epoch": 4949} {"train_loss": -7.379270076751709, "global_step": 207863, "epoch": 4949} {"train_loss": -7.462101936340332, "global_step": 207864, "epoch": 4949} {"train_loss": -7.313867568969727, "global_step": 207865, "epoch": 4949} {"train_loss": -7.363633155822754, "global_step": 207866, "epoch": 4949} {"train_loss": -7.383331298828125, "global_step": 207867, "epoch": 4949} {"train_loss": -7.35386848449707, "global_step": 207868, "epoch": 4949} {"train_loss": -7.304259300231934, "global_step": 207869, "epoch": 4949} {"train_loss": -7.428812503814697, "global_step": 207870, "epoch": 4949} {"train_loss": -7.242395401000977, "global_step": 207871, "epoch": 4949} {"train_loss": -7.319730758666992, "global_step": 207872, "epoch": 4949} {"train_loss": -7.413323402404785, "global_step": 207873, "epoch": 4949} {"train_loss": -7.359092712402344, "global_step": 207874, "epoch": 4949} {"train_loss": -7.23198127746582, "global_step": 207875, "epoch": 4949} {"train_loss": -7.325695991516113, "global_step": 207876, "epoch": 4949} {"train_loss": -7.3341217041015625, "global_step": 207877, "epoch": 4949} {"train_loss": -7.363300800323486, "global_step": 207878, "epoch": 4949} {"train_loss": -7.3096418380737305, "global_step": 207879, "epoch": 4949} {"train_loss": -7.445982933044434, "global_step": 207880, "epoch": 4949} {"train_loss": -7.334941864013672, "global_step": 207881, "epoch": 4949} {"train_loss": -7.3422017097473145, "global_step": 207882, "epoch": 4949} {"train_loss": -7.276556015014648, "global_step": 207883, "epoch": 4949} {"train_loss": -7.297881603240967, "global_step": 207884, "epoch": 4949} {"train_loss": -7.479299545288086, "global_step": 207885, "epoch": 4949} {"train_loss": -7.274392604827881, "global_step": 207886, "epoch": 4949} {"train_loss": -7.358124732971191, "global_step": 207887, "epoch": 4949} {"train_loss": -7.295200824737549, "global_step": 207888, "epoch": 4949} {"train_loss": -7.458095550537109, "global_step": 207889, "epoch": 4949} {"train_loss": -7.305410385131836, "global_step": 207890, "epoch": 4949} {"train_loss": -7.422294616699219, "global_step": 207891, "epoch": 4949} {"train_loss": -7.375914573669434, "global_step": 207892, "epoch": 4949} {"train_loss": -7.364292144775391, "global_step": 207893, "epoch": 4949} {"train_loss": -7.432107448577881, "global_step": 207894, "epoch": 4949} {"train_loss": -7.308970928192139, "global_step": 207895, "epoch": 4949} {"train_loss": -7.21263313293457, "global_step": 207896, "epoch": 4949} {"train_loss": -7.3422956466674805, "global_step": 207897, "epoch": 4949} {"train_loss": -7.374084949493408, "global_step": 207898, "epoch": 4949} {"train_loss": -7.351096164612543, "global_step": 207899, "epoch": 4949, "val_loss": 82005.015625} {"train_loss": -7.427521705627441, "global_step": 207900, "epoch": 4950} {"train_loss": -7.328363418579102, "global_step": 207901, "epoch": 4950} {"train_loss": -7.272318363189697, "global_step": 207902, "epoch": 4950} {"train_loss": -7.314026832580566, "global_step": 207903, "epoch": 4950} {"train_loss": -7.334940433502197, "global_step": 207904, "epoch": 4950} {"train_loss": -7.237153053283691, "global_step": 207905, "epoch": 4950} {"train_loss": -7.315912246704102, "global_step": 207906, "epoch": 4950} {"train_loss": -7.279985427856445, "global_step": 207907, "epoch": 4950} {"train_loss": -7.217747211456299, "global_step": 207908, "epoch": 4950} {"train_loss": -7.428116321563721, "global_step": 207909, "epoch": 4950} {"train_loss": -7.300597190856934, "global_step": 207910, "epoch": 4950} {"train_loss": -7.347662448883057, "global_step": 207911, "epoch": 4950} {"train_loss": -7.432883262634277, "global_step": 207912, "epoch": 4950} {"train_loss": -7.316657543182373, "global_step": 207913, "epoch": 4950} {"train_loss": -7.433551788330078, "global_step": 207914, "epoch": 4950} {"train_loss": -7.41598653793335, "global_step": 207915, "epoch": 4950} {"train_loss": -7.4242844581604, "global_step": 207916, "epoch": 4950} {"train_loss": -7.367242813110352, "global_step": 207917, "epoch": 4950} {"train_loss": -7.353804111480713, "global_step": 207918, "epoch": 4950} {"train_loss": -7.323582172393799, "global_step": 207919, "epoch": 4950} {"train_loss": -7.357900142669678, "global_step": 207920, "epoch": 4950} {"train_loss": -7.439133644104004, "global_step": 207921, "epoch": 4950} {"train_loss": -7.262923717498779, "global_step": 207922, "epoch": 4950} {"train_loss": -7.43642520904541, "global_step": 207923, "epoch": 4950} {"train_loss": -7.417263031005859, "global_step": 207924, "epoch": 4950} {"train_loss": -7.2342529296875, "global_step": 207925, "epoch": 4950} {"train_loss": -7.390602111816406, "global_step": 207926, "epoch": 4950} {"train_loss": -7.295820236206055, "global_step": 207927, "epoch": 4950} {"train_loss": -7.2181077003479, "global_step": 207928, "epoch": 4950} {"train_loss": -7.363278865814209, "global_step": 207929, "epoch": 4950} {"train_loss": -7.242206573486328, "global_step": 207930, "epoch": 4950} {"train_loss": -7.299142360687256, "global_step": 207931, "epoch": 4950} {"train_loss": -7.308721542358398, "global_step": 207932, "epoch": 4950} {"train_loss": -7.210563659667969, "global_step": 207933, "epoch": 4950} {"train_loss": -7.423172950744629, "global_step": 207934, "epoch": 4950} {"train_loss": -7.311567306518555, "global_step": 207935, "epoch": 4950} {"train_loss": -7.244195938110352, "global_step": 207936, "epoch": 4950} {"train_loss": -7.306012153625488, "global_step": 207937, "epoch": 4950} {"train_loss": -7.2664031982421875, "global_step": 207938, "epoch": 4950} {"train_loss": -7.275324821472168, "global_step": 207939, "epoch": 4950} {"train_loss": -7.362536430358887, "global_step": 207940, "epoch": 4950} {"train_loss": -7.3309270313807895, "global_step": 207941, "epoch": 4950, "train/sim_max_reward_0": 0.1905104938906, "train/sim_max_reward_1": 0.9083375916979083, "train/sim_max_reward_2": 0.5264512785997834, "train/sim_max_reward_3": 0.14533194940352992, "train/sim_max_reward_4": 0.3270886950890841, "train/sim_max_reward_5": 0.5668167726930615, "test/sim_max_reward_4500000": 0.9536303136718136, "test/sim_max_reward_4500001": 0.9856130144843711, "test/sim_max_reward_4500002": 0.8980345073870555, "test/sim_max_reward_4500003": 0.5266326977209215, "test/sim_max_reward_4500004": 0.20537403392707204, "test/sim_max_reward_4500005": 0.26545889107990484, "test/sim_max_reward_4500006": 0.9742887385740234, "test/sim_max_reward_4500007": 0.8795821532091409, "test/sim_max_reward_4500008": 0.9615895287887206, "test/sim_max_reward_4500009": 0.052827203313027184, "test/sim_max_reward_4500010": 0.05509668741796519, "test/sim_max_reward_4500011": 0.6644589721295443, "test/sim_max_reward_4500012": 0.8965788740810233, "test/sim_max_reward_4500013": 0.6679528517253565, "test/sim_max_reward_4500014": 0.9510439848044566, "test/sim_max_reward_4500015": 0.11174920754337812, "test/sim_max_reward_4500016": 0.017544158064586216, "test/sim_max_reward_4500017": 0.024085394241361722, "test/sim_max_reward_4500018": 0.7289861175835134, "test/sim_max_reward_4500019": 0.810568333165018, "test/sim_max_reward_4500020": 0.0, "test/sim_max_reward_4500021": 0.9454696963445238, "test/sim_max_reward_4500022": 0.9487881538370673, "test/sim_max_reward_4500023": 0.55826565570725, "test/sim_max_reward_4500024": 0.0, "test/sim_max_reward_4500025": 0.8674480428226063, "test/sim_max_reward_4500026": 0.9986575991009318, "test/sim_max_reward_4500027": 0.8880037542364873, "test/sim_max_reward_4500028": 0.18817745937666963, "test/sim_max_reward_4500029": 0.05553856612451496, "test/sim_max_reward_4500030": 0.9087685025429842, "test/sim_max_reward_4500031": 0.0, "test/sim_max_reward_4500032": 0.0465094911481587, "test/sim_max_reward_4500033": 0.9440798116341833, "test/sim_max_reward_4500034": 0.9567262946815202, "test/sim_max_reward_4500035": 0.9550707197060097, "test/sim_max_reward_4500036": 0.3817969684039973, "test/sim_max_reward_4500037": 0.980466691707678, "test/sim_max_reward_4500038": 0.9970491220960469, "test/sim_max_reward_4500039": 0.8964471115140646, "test/sim_max_reward_4500040": 0.9758034701696181, "test/sim_max_reward_4500041": 1.0, "test/sim_max_reward_4500042": 0.05162330342567991, "test/sim_max_reward_4500043": 0.8147541290740508, "test/sim_max_reward_4500044": 0.0, "test/sim_max_reward_4500045": 1.0, "test/sim_max_reward_4500046": 0.19399364633971627, "test/sim_max_reward_4500047": 0.9150886165239094, "test/sim_max_reward_4500048": 0.9712490276983791, "test/sim_max_reward_4500049": 0.8417479740723317, "train/mean_score": 0.44408946356232787, "test/mean_score": 0.6182523894240127, "val_loss": 81907.71875} {"train_loss": -7.48534631729126, "global_step": 207942, "epoch": 4951} {"train_loss": -7.1934099197387695, "global_step": 207943, "epoch": 4951} {"train_loss": -7.327055931091309, "global_step": 207944, "epoch": 4951} {"train_loss": -7.137637138366699, "global_step": 207945, "epoch": 4951} {"train_loss": -7.281255722045898, "global_step": 207946, "epoch": 4951} {"train_loss": -7.275365829467773, "global_step": 207947, "epoch": 4951} {"train_loss": -7.291813373565674, "global_step": 207948, "epoch": 4951} {"train_loss": -7.285207271575928, "global_step": 207949, "epoch": 4951} {"train_loss": -7.34136962890625, "global_step": 207950, "epoch": 4951} {"train_loss": -7.283105850219727, "global_step": 207951, "epoch": 4951} {"train_loss": -7.262140274047852, "global_step": 207952, "epoch": 4951} {"train_loss": -7.365292549133301, "global_step": 207953, "epoch": 4951} {"train_loss": -7.4340314865112305, "global_step": 207954, "epoch": 4951} {"train_loss": -7.298471450805664, "global_step": 207955, "epoch": 4951} {"train_loss": -7.427950859069824, "global_step": 207956, "epoch": 4951} {"train_loss": -7.450970649719238, "global_step": 207957, "epoch": 4951} {"train_loss": -7.303305625915527, "global_step": 207958, "epoch": 4951} {"train_loss": -7.384599208831787, "global_step": 207959, "epoch": 4951} {"train_loss": -7.327667236328125, "global_step": 207960, "epoch": 4951} {"train_loss": -7.434003829956055, "global_step": 207961, "epoch": 4951} {"train_loss": -7.382582187652588, "global_step": 207962, "epoch": 4951} {"train_loss": -7.299314022064209, "global_step": 207963, "epoch": 4951} {"train_loss": -7.3777971267700195, "global_step": 207964, "epoch": 4951} {"train_loss": -7.442837715148926, "global_step": 207965, "epoch": 4951} {"train_loss": -7.350010395050049, "global_step": 207966, "epoch": 4951} {"train_loss": -7.330729007720947, "global_step": 207967, "epoch": 4951} {"train_loss": -7.328588485717773, "global_step": 207968, "epoch": 4951} {"train_loss": -7.295501232147217, "global_step": 207969, "epoch": 4951} {"train_loss": -7.373197555541992, "global_step": 207970, "epoch": 4951} {"train_loss": -7.344114780426025, "global_step": 207971, "epoch": 4951} {"train_loss": -7.314239501953125, "global_step": 207972, "epoch": 4951} {"train_loss": -7.321846961975098, "global_step": 207973, "epoch": 4951} {"train_loss": -7.243595123291016, "global_step": 207974, "epoch": 4951} {"train_loss": -7.32895565032959, "global_step": 207975, "epoch": 4951} {"train_loss": -7.247596740722656, "global_step": 207976, "epoch": 4951} {"train_loss": -7.236641883850098, "global_step": 207977, "epoch": 4951} {"train_loss": -7.438162803649902, "global_step": 207978, "epoch": 4951} {"train_loss": -7.377770900726318, "global_step": 207979, "epoch": 4951} {"train_loss": -7.35810661315918, "global_step": 207980, "epoch": 4951} {"train_loss": -7.430580139160156, "global_step": 207981, "epoch": 4951} {"train_loss": -7.330297470092773, "global_step": 207982, "epoch": 4951} {"train_loss": -7.336872452781314, "global_step": 207983, "epoch": 4951, "val_loss": 81853.1015625} {"train_loss": -7.459281921386719, "global_step": 207984, "epoch": 4952} {"train_loss": -7.419459342956543, "global_step": 207985, "epoch": 4952} {"train_loss": -7.468377113342285, "global_step": 207986, "epoch": 4952} {"train_loss": -7.401619911193848, "global_step": 207987, "epoch": 4952} {"train_loss": -7.36234712600708, "global_step": 207988, "epoch": 4952} {"train_loss": -7.32459831237793, "global_step": 207989, "epoch": 4952} {"train_loss": -7.274377822875977, "global_step": 207990, "epoch": 4952} {"train_loss": -7.434313774108887, "global_step": 207991, "epoch": 4952} {"train_loss": -7.331171035766602, "global_step": 207992, "epoch": 4952} {"train_loss": -7.3756232261657715, "global_step": 207993, "epoch": 4952} {"train_loss": -7.391508102416992, "global_step": 207994, "epoch": 4952} {"train_loss": -7.306964874267578, "global_step": 207995, "epoch": 4952} {"train_loss": -7.374796390533447, "global_step": 207996, "epoch": 4952} {"train_loss": -7.44603157043457, "global_step": 207997, "epoch": 4952} {"train_loss": -7.331671714782715, "global_step": 207998, "epoch": 4952} {"train_loss": -7.385164260864258, "global_step": 207999, "epoch": 4952} {"train_loss": -7.416482448577881, "global_step": 208000, "epoch": 4952} {"train_loss": -7.368144989013672, "global_step": 208001, "epoch": 4952} {"train_loss": -7.4071946144104, "global_step": 208002, "epoch": 4952} {"train_loss": -7.348758220672607, "global_step": 208003, "epoch": 4952} {"train_loss": -7.442523956298828, "global_step": 208004, "epoch": 4952} {"train_loss": -7.355245590209961, "global_step": 208005, "epoch": 4952} {"train_loss": -7.400907516479492, "global_step": 208006, "epoch": 4952} {"train_loss": -7.313922882080078, "global_step": 208007, "epoch": 4952} {"train_loss": -7.439525127410889, "global_step": 208008, "epoch": 4952} {"train_loss": -7.3531694412231445, "global_step": 208009, "epoch": 4952} {"train_loss": -7.320990085601807, "global_step": 208010, "epoch": 4952} {"train_loss": -7.275230407714844, "global_step": 208011, "epoch": 4952} {"train_loss": -7.427072525024414, "global_step": 208012, "epoch": 4952} {"train_loss": -7.26138973236084, "global_step": 208013, "epoch": 4952} {"train_loss": -7.363726615905762, "global_step": 208014, "epoch": 4952} {"train_loss": -7.342226028442383, "global_step": 208015, "epoch": 4952} {"train_loss": -7.404755115509033, "global_step": 208016, "epoch": 4952} {"train_loss": -7.350127220153809, "global_step": 208017, "epoch": 4952} {"train_loss": -7.481934547424316, "global_step": 208018, "epoch": 4952} {"train_loss": -7.454049110412598, "global_step": 208019, "epoch": 4952} {"train_loss": -7.291750907897949, "global_step": 208020, "epoch": 4952} {"train_loss": -7.360610008239746, "global_step": 208021, "epoch": 4952} {"train_loss": -7.369483947753906, "global_step": 208022, "epoch": 4952} {"train_loss": -7.32004451751709, "global_step": 208023, "epoch": 4952} {"train_loss": -7.3805670738220215, "global_step": 208024, "epoch": 4952} {"train_loss": -7.375251270475841, "global_step": 208025, "epoch": 4952, "val_loss": 82065.3671875} {"train_loss": -7.432948112487793, "global_step": 208026, "epoch": 4953} {"train_loss": -7.468621730804443, "global_step": 208027, "epoch": 4953} {"train_loss": -7.375496864318848, "global_step": 208028, "epoch": 4953} {"train_loss": -7.21588134765625, "global_step": 208029, "epoch": 4953} {"train_loss": -7.343404769897461, "global_step": 208030, "epoch": 4953} {"train_loss": -7.367135047912598, "global_step": 208031, "epoch": 4953} {"train_loss": -7.357610702514648, "global_step": 208032, "epoch": 4953} {"train_loss": -7.399614334106445, "global_step": 208033, "epoch": 4953} {"train_loss": -7.281191825866699, "global_step": 208034, "epoch": 4953} {"train_loss": -7.264214038848877, "global_step": 208035, "epoch": 4953} {"train_loss": -7.360705375671387, "global_step": 208036, "epoch": 4953} {"train_loss": -7.357512474060059, "global_step": 208037, "epoch": 4953} {"train_loss": -7.3861846923828125, "global_step": 208038, "epoch": 4953} {"train_loss": -7.317198753356934, "global_step": 208039, "epoch": 4953} {"train_loss": -7.3816237449646, "global_step": 208040, "epoch": 4953} {"train_loss": -7.398561477661133, "global_step": 208041, "epoch": 4953} {"train_loss": -7.4896745681762695, "global_step": 208042, "epoch": 4953} {"train_loss": -7.308379173278809, "global_step": 208043, "epoch": 4953} {"train_loss": -7.382470607757568, "global_step": 208044, "epoch": 4953} {"train_loss": -7.468580722808838, "global_step": 208045, "epoch": 4953} {"train_loss": -7.422743797302246, "global_step": 208046, "epoch": 4953} {"train_loss": -7.328856468200684, "global_step": 208047, "epoch": 4953} {"train_loss": -7.316980361938477, "global_step": 208048, "epoch": 4953} {"train_loss": -7.386301517486572, "global_step": 208049, "epoch": 4953} {"train_loss": -7.3614959716796875, "global_step": 208050, "epoch": 4953} {"train_loss": -7.120654106140137, "global_step": 208051, "epoch": 4953} {"train_loss": -7.212673664093018, "global_step": 208052, "epoch": 4953} {"train_loss": -7.43133544921875, "global_step": 208053, "epoch": 4953} {"train_loss": -7.208148956298828, "global_step": 208054, "epoch": 4953} {"train_loss": -7.054498195648193, "global_step": 208055, "epoch": 4953} {"train_loss": -7.281544208526611, "global_step": 208056, "epoch": 4953} {"train_loss": -7.272162437438965, "global_step": 208057, "epoch": 4953} {"train_loss": -7.16787576675415, "global_step": 208058, "epoch": 4953} {"train_loss": -7.341767311096191, "global_step": 208059, "epoch": 4953} {"train_loss": -7.262313365936279, "global_step": 208060, "epoch": 4953} {"train_loss": -7.039433002471924, "global_step": 208061, "epoch": 4953} {"train_loss": -7.220559597015381, "global_step": 208062, "epoch": 4953} {"train_loss": -7.246217727661133, "global_step": 208063, "epoch": 4953} {"train_loss": -7.078458786010742, "global_step": 208064, "epoch": 4953} {"train_loss": -7.245253562927246, "global_step": 208065, "epoch": 4953} {"train_loss": -7.194258689880371, "global_step": 208066, "epoch": 4953} {"train_loss": -7.306981801986694, "global_step": 208067, "epoch": 4953, "val_loss": 82092.109375} {"train_loss": -7.275374412536621, "global_step": 208068, "epoch": 4954} {"train_loss": -7.176846504211426, "global_step": 208069, "epoch": 4954} {"train_loss": -7.327197074890137, "global_step": 208070, "epoch": 4954} {"train_loss": -7.308619976043701, "global_step": 208071, "epoch": 4954} {"train_loss": -7.333268165588379, "global_step": 208072, "epoch": 4954} {"train_loss": -7.431562900543213, "global_step": 208073, "epoch": 4954} {"train_loss": -7.259154796600342, "global_step": 208074, "epoch": 4954} {"train_loss": -7.281665802001953, "global_step": 208075, "epoch": 4954} {"train_loss": -7.317332744598389, "global_step": 208076, "epoch": 4954} {"train_loss": -7.239096641540527, "global_step": 208077, "epoch": 4954} {"train_loss": -7.370196342468262, "global_step": 208078, "epoch": 4954} {"train_loss": -7.323295593261719, "global_step": 208079, "epoch": 4954} {"train_loss": -7.397430419921875, "global_step": 208080, "epoch": 4954} {"train_loss": -7.425427436828613, "global_step": 208081, "epoch": 4954} {"train_loss": -7.361485004425049, "global_step": 208082, "epoch": 4954} {"train_loss": -7.378462791442871, "global_step": 208083, "epoch": 4954} {"train_loss": -7.259328842163086, "global_step": 208084, "epoch": 4954} {"train_loss": -7.444215774536133, "global_step": 208085, "epoch": 4954} {"train_loss": -7.356733322143555, "global_step": 208086, "epoch": 4954} {"train_loss": -7.354762077331543, "global_step": 208087, "epoch": 4954} {"train_loss": -7.490435600280762, "global_step": 208088, "epoch": 4954} {"train_loss": -7.452272415161133, "global_step": 208089, "epoch": 4954} {"train_loss": -7.341129302978516, "global_step": 208090, "epoch": 4954} {"train_loss": -7.2848992347717285, "global_step": 208091, "epoch": 4954} {"train_loss": -7.420289993286133, "global_step": 208092, "epoch": 4954} {"train_loss": -7.31583309173584, "global_step": 208093, "epoch": 4954} {"train_loss": -7.338895797729492, "global_step": 208094, "epoch": 4954} {"train_loss": -7.43714714050293, "global_step": 208095, "epoch": 4954} {"train_loss": -7.442732334136963, "global_step": 208096, "epoch": 4954} {"train_loss": -7.358379364013672, "global_step": 208097, "epoch": 4954} {"train_loss": -7.356263160705566, "global_step": 208098, "epoch": 4954} {"train_loss": -7.324984550476074, "global_step": 208099, "epoch": 4954} {"train_loss": -7.365764617919922, "global_step": 208100, "epoch": 4954} {"train_loss": -7.261480331420898, "global_step": 208101, "epoch": 4954} {"train_loss": -7.273033142089844, "global_step": 208102, "epoch": 4954} {"train_loss": -7.376955509185791, "global_step": 208103, "epoch": 4954} {"train_loss": -7.246739864349365, "global_step": 208104, "epoch": 4954} {"train_loss": -7.2220048904418945, "global_step": 208105, "epoch": 4954} {"train_loss": -7.305220603942871, "global_step": 208106, "epoch": 4954} {"train_loss": -7.18670654296875, "global_step": 208107, "epoch": 4954} {"train_loss": -7.2388410568237305, "global_step": 208108, "epoch": 4954} {"train_loss": -7.33079777445112, "global_step": 208109, "epoch": 4954, "val_loss": 81878.53125} {"train_loss": -7.316954612731934, "global_step": 208110, "epoch": 4955} {"train_loss": -7.292103290557861, "global_step": 208111, "epoch": 4955} {"train_loss": -7.318201065063477, "global_step": 208112, "epoch": 4955} {"train_loss": -7.21439266204834, "global_step": 208113, "epoch": 4955} {"train_loss": -7.199911117553711, "global_step": 208114, "epoch": 4955} {"train_loss": -7.233734130859375, "global_step": 208115, "epoch": 4955} {"train_loss": -7.391727924346924, "global_step": 208116, "epoch": 4955} {"train_loss": -7.126128196716309, "global_step": 208117, "epoch": 4955} {"train_loss": -7.305105209350586, "global_step": 208118, "epoch": 4955} {"train_loss": -7.282912254333496, "global_step": 208119, "epoch": 4955} {"train_loss": -7.127452373504639, "global_step": 208120, "epoch": 4955} {"train_loss": -7.2321367263793945, "global_step": 208121, "epoch": 4955} {"train_loss": -7.132016181945801, "global_step": 208122, "epoch": 4955} {"train_loss": -7.2548933029174805, "global_step": 208123, "epoch": 4955} {"train_loss": -7.270694255828857, "global_step": 208124, "epoch": 4955} {"train_loss": -7.405680179595947, "global_step": 208125, "epoch": 4955} {"train_loss": -7.15884256362915, "global_step": 208126, "epoch": 4955} {"train_loss": -7.219477653503418, "global_step": 208127, "epoch": 4955} {"train_loss": -7.217593193054199, "global_step": 208128, "epoch": 4955} {"train_loss": -7.380069255828857, "global_step": 208129, "epoch": 4955} {"train_loss": -7.310523509979248, "global_step": 208130, "epoch": 4955} {"train_loss": -7.358617305755615, "global_step": 208131, "epoch": 4955} {"train_loss": -7.347509384155273, "global_step": 208132, "epoch": 4955} {"train_loss": -7.291635990142822, "global_step": 208133, "epoch": 4955} {"train_loss": -7.3387451171875, "global_step": 208134, "epoch": 4955} {"train_loss": -7.281491279602051, "global_step": 208135, "epoch": 4955} {"train_loss": -7.417693138122559, "global_step": 208136, "epoch": 4955} {"train_loss": -7.273993492126465, "global_step": 208137, "epoch": 4955} {"train_loss": -7.355189323425293, "global_step": 208138, "epoch": 4955} {"train_loss": -7.332057952880859, "global_step": 208139, "epoch": 4955} {"train_loss": -7.304869651794434, "global_step": 208140, "epoch": 4955} {"train_loss": -7.389564514160156, "global_step": 208141, "epoch": 4955} {"train_loss": -7.4365949630737305, "global_step": 208142, "epoch": 4955} {"train_loss": -7.249001979827881, "global_step": 208143, "epoch": 4955} {"train_loss": -7.276601791381836, "global_step": 208144, "epoch": 4955} {"train_loss": -7.4092912673950195, "global_step": 208145, "epoch": 4955} {"train_loss": -7.4237165451049805, "global_step": 208146, "epoch": 4955} {"train_loss": -7.37300443649292, "global_step": 208147, "epoch": 4955} {"train_loss": -7.346052646636963, "global_step": 208148, "epoch": 4955} {"train_loss": -7.394879341125488, "global_step": 208149, "epoch": 4955} {"train_loss": -7.303403377532959, "global_step": 208150, "epoch": 4955} {"train_loss": -7.300074736277263, "global_step": 208151, "epoch": 4955, "val_loss": 81826.375} {"train_loss": -7.302187442779541, "global_step": 208152, "epoch": 4956} {"train_loss": -7.318458557128906, "global_step": 208153, "epoch": 4956} {"train_loss": -7.349180221557617, "global_step": 208154, "epoch": 4956} {"train_loss": -7.475594520568848, "global_step": 208155, "epoch": 4956} {"train_loss": -7.427567958831787, "global_step": 208156, "epoch": 4956} {"train_loss": -7.33111047744751, "global_step": 208157, "epoch": 4956} {"train_loss": -7.335189342498779, "global_step": 208158, "epoch": 4956} {"train_loss": -7.350707054138184, "global_step": 208159, "epoch": 4956} {"train_loss": -7.283169746398926, "global_step": 208160, "epoch": 4956} {"train_loss": -7.345616817474365, "global_step": 208161, "epoch": 4956} {"train_loss": -7.3762054443359375, "global_step": 208162, "epoch": 4956} {"train_loss": -7.176479816436768, "global_step": 208163, "epoch": 4956} {"train_loss": -7.470634937286377, "global_step": 208164, "epoch": 4956} {"train_loss": -7.3032331466674805, "global_step": 208165, "epoch": 4956} {"train_loss": -7.356071472167969, "global_step": 208166, "epoch": 4956} {"train_loss": -7.262527942657471, "global_step": 208167, "epoch": 4956} {"train_loss": -7.287814140319824, "global_step": 208168, "epoch": 4956} {"train_loss": -7.210817337036133, "global_step": 208169, "epoch": 4956} {"train_loss": -7.334365367889404, "global_step": 208170, "epoch": 4956} {"train_loss": -7.290349960327148, "global_step": 208171, "epoch": 4956} {"train_loss": -7.33913516998291, "global_step": 208172, "epoch": 4956} {"train_loss": -7.3183441162109375, "global_step": 208173, "epoch": 4956} {"train_loss": -7.274383544921875, "global_step": 208174, "epoch": 4956} {"train_loss": -7.2720136642456055, "global_step": 208175, "epoch": 4956} {"train_loss": -7.382513046264648, "global_step": 208176, "epoch": 4956} {"train_loss": -7.342006683349609, "global_step": 208177, "epoch": 4956} {"train_loss": -7.371860980987549, "global_step": 208178, "epoch": 4956} {"train_loss": -7.345492362976074, "global_step": 208179, "epoch": 4956} {"train_loss": -7.364860534667969, "global_step": 208180, "epoch": 4956} {"train_loss": -7.353747367858887, "global_step": 208181, "epoch": 4956} {"train_loss": -7.4686760902404785, "global_step": 208182, "epoch": 4956} {"train_loss": -7.395653247833252, "global_step": 208183, "epoch": 4956} {"train_loss": -7.355863094329834, "global_step": 208184, "epoch": 4956} {"train_loss": -7.303448677062988, "global_step": 208185, "epoch": 4956} {"train_loss": -7.461762428283691, "global_step": 208186, "epoch": 4956} {"train_loss": -7.463550567626953, "global_step": 208187, "epoch": 4956} {"train_loss": -7.410816192626953, "global_step": 208188, "epoch": 4956} {"train_loss": -7.436882972717285, "global_step": 208189, "epoch": 4956} {"train_loss": -7.382440090179443, "global_step": 208190, "epoch": 4956} {"train_loss": -7.403896331787109, "global_step": 208191, "epoch": 4956} {"train_loss": -7.463901519775391, "global_step": 208192, "epoch": 4956} {"train_loss": -7.353823457445417, "global_step": 208193, "epoch": 4956, "val_loss": 81895.5} {"train_loss": -7.333311080932617, "global_step": 208194, "epoch": 4957} {"train_loss": -7.206335544586182, "global_step": 208195, "epoch": 4957} {"train_loss": -7.376312255859375, "global_step": 208196, "epoch": 4957} {"train_loss": -7.295673370361328, "global_step": 208197, "epoch": 4957} {"train_loss": -7.395756244659424, "global_step": 208198, "epoch": 4957} {"train_loss": -7.359195232391357, "global_step": 208199, "epoch": 4957} {"train_loss": -7.286495208740234, "global_step": 208200, "epoch": 4957} {"train_loss": -7.357244491577148, "global_step": 208201, "epoch": 4957} {"train_loss": -7.27531623840332, "global_step": 208202, "epoch": 4957} {"train_loss": -7.3448166847229, "global_step": 208203, "epoch": 4957} {"train_loss": -7.413580417633057, "global_step": 208204, "epoch": 4957} {"train_loss": -7.343015670776367, "global_step": 208205, "epoch": 4957} {"train_loss": -7.4163312911987305, "global_step": 208206, "epoch": 4957} {"train_loss": -7.304039001464844, "global_step": 208207, "epoch": 4957} {"train_loss": -7.3512420654296875, "global_step": 208208, "epoch": 4957} {"train_loss": -7.333003520965576, "global_step": 208209, "epoch": 4957} {"train_loss": -7.332637310028076, "global_step": 208210, "epoch": 4957} {"train_loss": -7.243343353271484, "global_step": 208211, "epoch": 4957} {"train_loss": -7.356337547302246, "global_step": 208212, "epoch": 4957} {"train_loss": -7.379720211029053, "global_step": 208213, "epoch": 4957} {"train_loss": -7.263228416442871, "global_step": 208214, "epoch": 4957} {"train_loss": -7.377373218536377, "global_step": 208215, "epoch": 4957} {"train_loss": -7.4276533126831055, "global_step": 208216, "epoch": 4957} {"train_loss": -7.324224948883057, "global_step": 208217, "epoch": 4957} {"train_loss": -7.3275604248046875, "global_step": 208218, "epoch": 4957} {"train_loss": -7.444729804992676, "global_step": 208219, "epoch": 4957} {"train_loss": -7.243552207946777, "global_step": 208220, "epoch": 4957} {"train_loss": -7.259878158569336, "global_step": 208221, "epoch": 4957} {"train_loss": -7.349320888519287, "global_step": 208222, "epoch": 4957} {"train_loss": -7.060988426208496, "global_step": 208223, "epoch": 4957} {"train_loss": -7.361128807067871, "global_step": 208224, "epoch": 4957} {"train_loss": -7.31594181060791, "global_step": 208225, "epoch": 4957} {"train_loss": -7.2803239822387695, "global_step": 208226, "epoch": 4957} {"train_loss": -7.402304649353027, "global_step": 208227, "epoch": 4957} {"train_loss": -7.202191352844238, "global_step": 208228, "epoch": 4957} {"train_loss": -7.347480297088623, "global_step": 208229, "epoch": 4957} {"train_loss": -7.23106575012207, "global_step": 208230, "epoch": 4957} {"train_loss": -7.375953674316406, "global_step": 208231, "epoch": 4957} {"train_loss": -7.1838274002075195, "global_step": 208232, "epoch": 4957} {"train_loss": -7.309971809387207, "global_step": 208233, "epoch": 4957} {"train_loss": -7.209738731384277, "global_step": 208234, "epoch": 4957} {"train_loss": -7.316425925209408, "global_step": 208235, "epoch": 4957, "val_loss": 81840.7265625} {"train_loss": -7.341405391693115, "global_step": 208236, "epoch": 4958} {"train_loss": -7.2402119636535645, "global_step": 208237, "epoch": 4958} {"train_loss": -7.271191596984863, "global_step": 208238, "epoch": 4958} {"train_loss": -7.305177688598633, "global_step": 208239, "epoch": 4958} {"train_loss": -7.251206398010254, "global_step": 208240, "epoch": 4958} {"train_loss": -7.296523094177246, "global_step": 208241, "epoch": 4958} {"train_loss": -7.3310651779174805, "global_step": 208242, "epoch": 4958} {"train_loss": -7.131065368652344, "global_step": 208243, "epoch": 4958} {"train_loss": -7.290897369384766, "global_step": 208244, "epoch": 4958} {"train_loss": -7.29960823059082, "global_step": 208245, "epoch": 4958} {"train_loss": -7.204334259033203, "global_step": 208246, "epoch": 4958} {"train_loss": -7.298055648803711, "global_step": 208247, "epoch": 4958} {"train_loss": -7.244871139526367, "global_step": 208248, "epoch": 4958} {"train_loss": -7.254846572875977, "global_step": 208249, "epoch": 4958} {"train_loss": -7.368738651275635, "global_step": 208250, "epoch": 4958} {"train_loss": -7.267281532287598, "global_step": 208251, "epoch": 4958} {"train_loss": -7.342185020446777, "global_step": 208252, "epoch": 4958} {"train_loss": -7.315799713134766, "global_step": 208253, "epoch": 4958} {"train_loss": -7.290782451629639, "global_step": 208254, "epoch": 4958} {"train_loss": -7.326287746429443, "global_step": 208255, "epoch": 4958} {"train_loss": -7.272425651550293, "global_step": 208256, "epoch": 4958} {"train_loss": -7.262228488922119, "global_step": 208257, "epoch": 4958} {"train_loss": -7.36064338684082, "global_step": 208258, "epoch": 4958} {"train_loss": -7.280816078186035, "global_step": 208259, "epoch": 4958} {"train_loss": -7.326007843017578, "global_step": 208260, "epoch": 4958} {"train_loss": -7.255341529846191, "global_step": 208261, "epoch": 4958} {"train_loss": -7.425066947937012, "global_step": 208262, "epoch": 4958} {"train_loss": -7.3936614990234375, "global_step": 208263, "epoch": 4958} {"train_loss": -7.340666770935059, "global_step": 208264, "epoch": 4958} {"train_loss": -7.413987159729004, "global_step": 208265, "epoch": 4958} {"train_loss": -7.363187789916992, "global_step": 208266, "epoch": 4958} {"train_loss": -7.336329936981201, "global_step": 208267, "epoch": 4958} {"train_loss": -7.466047286987305, "global_step": 208268, "epoch": 4958} {"train_loss": -7.38901424407959, "global_step": 208269, "epoch": 4958} {"train_loss": -7.2809014320373535, "global_step": 208270, "epoch": 4958} {"train_loss": -7.249755859375, "global_step": 208271, "epoch": 4958} {"train_loss": -7.430720329284668, "global_step": 208272, "epoch": 4958} {"train_loss": -7.3184003829956055, "global_step": 208273, "epoch": 4958} {"train_loss": -7.410592079162598, "global_step": 208274, "epoch": 4958} {"train_loss": -7.398284912109375, "global_step": 208275, "epoch": 4958} {"train_loss": -7.246433258056641, "global_step": 208276, "epoch": 4958} {"train_loss": -7.3167190324692495, "global_step": 208277, "epoch": 4958, "val_loss": 81703.359375} {"train_loss": -7.336570739746094, "global_step": 208278, "epoch": 4959} {"train_loss": -7.3992204666137695, "global_step": 208279, "epoch": 4959} {"train_loss": -7.384221076965332, "global_step": 208280, "epoch": 4959} {"train_loss": -7.43851900100708, "global_step": 208281, "epoch": 4959} {"train_loss": -7.4304094314575195, "global_step": 208282, "epoch": 4959} {"train_loss": -7.415410995483398, "global_step": 208283, "epoch": 4959} {"train_loss": -7.339349746704102, "global_step": 208284, "epoch": 4959} {"train_loss": -7.358152389526367, "global_step": 208285, "epoch": 4959} {"train_loss": -7.429709434509277, "global_step": 208286, "epoch": 4959} {"train_loss": -7.42318058013916, "global_step": 208287, "epoch": 4959} {"train_loss": -7.287332534790039, "global_step": 208288, "epoch": 4959} {"train_loss": -7.424399375915527, "global_step": 208289, "epoch": 4959} {"train_loss": -7.395820617675781, "global_step": 208290, "epoch": 4959} {"train_loss": -7.38060188293457, "global_step": 208291, "epoch": 4959} {"train_loss": -7.386506080627441, "global_step": 208292, "epoch": 4959} {"train_loss": -7.298871040344238, "global_step": 208293, "epoch": 4959} {"train_loss": -7.327942848205566, "global_step": 208294, "epoch": 4959} {"train_loss": -7.388961315155029, "global_step": 208295, "epoch": 4959} {"train_loss": -7.326328754425049, "global_step": 208296, "epoch": 4959} {"train_loss": -7.3543572425842285, "global_step": 208297, "epoch": 4959} {"train_loss": -7.313961982727051, "global_step": 208298, "epoch": 4959} {"train_loss": -7.311761856079102, "global_step": 208299, "epoch": 4959} {"train_loss": -7.451843738555908, "global_step": 208300, "epoch": 4959} {"train_loss": -7.391844749450684, "global_step": 208301, "epoch": 4959} {"train_loss": -7.400702476501465, "global_step": 208302, "epoch": 4959} {"train_loss": -7.345953464508057, "global_step": 208303, "epoch": 4959} {"train_loss": -7.410794258117676, "global_step": 208304, "epoch": 4959} {"train_loss": -7.348343372344971, "global_step": 208305, "epoch": 4959} {"train_loss": -7.348861217498779, "global_step": 208306, "epoch": 4959} {"train_loss": -7.472926139831543, "global_step": 208307, "epoch": 4959} {"train_loss": -7.2646484375, "global_step": 208308, "epoch": 4959} {"train_loss": -7.3794026374816895, "global_step": 208309, "epoch": 4959} {"train_loss": -7.41851806640625, "global_step": 208310, "epoch": 4959} {"train_loss": -7.234999656677246, "global_step": 208311, "epoch": 4959} {"train_loss": -7.325082302093506, "global_step": 208312, "epoch": 4959} {"train_loss": -7.328107833862305, "global_step": 208313, "epoch": 4959} {"train_loss": -7.315871238708496, "global_step": 208314, "epoch": 4959} {"train_loss": -7.474970817565918, "global_step": 208315, "epoch": 4959} {"train_loss": -7.369844913482666, "global_step": 208316, "epoch": 4959} {"train_loss": -7.323720455169678, "global_step": 208317, "epoch": 4959} {"train_loss": -7.3814520835876465, "global_step": 208318, "epoch": 4959} {"train_loss": -7.37067030725025, "global_step": 208319, "epoch": 4959, "val_loss": 81871.0390625} {"train_loss": -7.360408782958984, "global_step": 208320, "epoch": 4960} {"train_loss": -7.366207122802734, "global_step": 208321, "epoch": 4960} {"train_loss": -7.471739292144775, "global_step": 208322, "epoch": 4960} {"train_loss": -7.322301864624023, "global_step": 208323, "epoch": 4960} {"train_loss": -7.410782814025879, "global_step": 208324, "epoch": 4960} {"train_loss": -7.452376365661621, "global_step": 208325, "epoch": 4960} {"train_loss": -7.4606804847717285, "global_step": 208326, "epoch": 4960} {"train_loss": -7.279678821563721, "global_step": 208327, "epoch": 4960} {"train_loss": -7.352275371551514, "global_step": 208328, "epoch": 4960} {"train_loss": -7.253989219665527, "global_step": 208329, "epoch": 4960} {"train_loss": -7.231377124786377, "global_step": 208330, "epoch": 4960} {"train_loss": -7.434762001037598, "global_step": 208331, "epoch": 4960} {"train_loss": -7.26739501953125, "global_step": 208332, "epoch": 4960} {"train_loss": -7.2313079833984375, "global_step": 208333, "epoch": 4960} {"train_loss": -7.405771255493164, "global_step": 208334, "epoch": 4960} {"train_loss": -7.331604957580566, "global_step": 208335, "epoch": 4960} {"train_loss": -7.419541358947754, "global_step": 208336, "epoch": 4960} {"train_loss": -7.411031723022461, "global_step": 208337, "epoch": 4960} {"train_loss": -7.345373153686523, "global_step": 208338, "epoch": 4960} {"train_loss": -7.350612163543701, "global_step": 208339, "epoch": 4960} {"train_loss": -7.447141647338867, "global_step": 208340, "epoch": 4960} {"train_loss": -7.284904479980469, "global_step": 208341, "epoch": 4960} {"train_loss": -7.310924530029297, "global_step": 208342, "epoch": 4960} {"train_loss": -7.288877964019775, "global_step": 208343, "epoch": 4960} {"train_loss": -7.391085624694824, "global_step": 208344, "epoch": 4960} {"train_loss": -7.411722183227539, "global_step": 208345, "epoch": 4960} {"train_loss": -7.400714874267578, "global_step": 208346, "epoch": 4960} {"train_loss": -7.416367530822754, "global_step": 208347, "epoch": 4960} {"train_loss": -7.401919364929199, "global_step": 208348, "epoch": 4960} {"train_loss": -7.414340019226074, "global_step": 208349, "epoch": 4960} {"train_loss": -7.4461669921875, "global_step": 208350, "epoch": 4960} {"train_loss": -7.398070812225342, "global_step": 208351, "epoch": 4960} {"train_loss": -7.262871742248535, "global_step": 208352, "epoch": 4960} {"train_loss": -7.431585311889648, "global_step": 208353, "epoch": 4960} {"train_loss": -7.368022918701172, "global_step": 208354, "epoch": 4960} {"train_loss": -7.323007583618164, "global_step": 208355, "epoch": 4960} {"train_loss": -7.484548568725586, "global_step": 208356, "epoch": 4960} {"train_loss": -7.428098201751709, "global_step": 208357, "epoch": 4960} {"train_loss": -7.486885070800781, "global_step": 208358, "epoch": 4960} {"train_loss": -7.379809379577637, "global_step": 208359, "epoch": 4960} {"train_loss": -7.4007368087768555, "global_step": 208360, "epoch": 4960} {"train_loss": -7.3751456169855025, "global_step": 208361, "epoch": 4960, "val_loss": 82018.3203125} {"train_loss": -7.496122360229492, "global_step": 208362, "epoch": 4961} {"train_loss": -7.470966339111328, "global_step": 208363, "epoch": 4961} {"train_loss": -7.452230453491211, "global_step": 208364, "epoch": 4961} {"train_loss": -7.329092025756836, "global_step": 208365, "epoch": 4961} {"train_loss": -7.365811347961426, "global_step": 208366, "epoch": 4961} {"train_loss": -7.423369407653809, "global_step": 208367, "epoch": 4961} {"train_loss": -7.369758605957031, "global_step": 208368, "epoch": 4961} {"train_loss": -7.516873359680176, "global_step": 208369, "epoch": 4961} {"train_loss": -7.322761535644531, "global_step": 208370, "epoch": 4961} {"train_loss": -7.35501766204834, "global_step": 208371, "epoch": 4961} {"train_loss": -7.2979326248168945, "global_step": 208372, "epoch": 4961} {"train_loss": -7.297933578491211, "global_step": 208373, "epoch": 4961} {"train_loss": -7.317779064178467, "global_step": 208374, "epoch": 4961} {"train_loss": -7.387273788452148, "global_step": 208375, "epoch": 4961} {"train_loss": -7.435639381408691, "global_step": 208376, "epoch": 4961} {"train_loss": -7.459270000457764, "global_step": 208377, "epoch": 4961} {"train_loss": -7.400882720947266, "global_step": 208378, "epoch": 4961} {"train_loss": -7.413041114807129, "global_step": 208379, "epoch": 4961} {"train_loss": -7.396903038024902, "global_step": 208380, "epoch": 4961} {"train_loss": -7.427282333374023, "global_step": 208381, "epoch": 4961} {"train_loss": -7.5158185958862305, "global_step": 208382, "epoch": 4961} {"train_loss": -7.5819854736328125, "global_step": 208383, "epoch": 4961} {"train_loss": -7.299438953399658, "global_step": 208384, "epoch": 4961} {"train_loss": -7.451326370239258, "global_step": 208385, "epoch": 4961} {"train_loss": -7.4922871589660645, "global_step": 208386, "epoch": 4961} {"train_loss": -7.435732841491699, "global_step": 208387, "epoch": 4961} {"train_loss": -7.368051528930664, "global_step": 208388, "epoch": 4961} {"train_loss": -7.460521221160889, "global_step": 208389, "epoch": 4961} {"train_loss": -7.340084552764893, "global_step": 208390, "epoch": 4961} {"train_loss": -7.386476516723633, "global_step": 208391, "epoch": 4961} {"train_loss": -7.391787528991699, "global_step": 208392, "epoch": 4961} {"train_loss": -7.316352844238281, "global_step": 208393, "epoch": 4961} {"train_loss": -7.3553266525268555, "global_step": 208394, "epoch": 4961} {"train_loss": -7.235086441040039, "global_step": 208395, "epoch": 4961} {"train_loss": -7.165363311767578, "global_step": 208396, "epoch": 4961} {"train_loss": -7.175490856170654, "global_step": 208397, "epoch": 4961} {"train_loss": -7.329625606536865, "global_step": 208398, "epoch": 4961} {"train_loss": -7.24787712097168, "global_step": 208399, "epoch": 4961} {"train_loss": -7.186942100524902, "global_step": 208400, "epoch": 4961} {"train_loss": -7.042452812194824, "global_step": 208401, "epoch": 4961} {"train_loss": -7.13586950302124, "global_step": 208402, "epoch": 4961} {"train_loss": -7.35290036882673, "global_step": 208403, "epoch": 4961, "val_loss": 82148.28125} {"train_loss": -7.230319976806641, "global_step": 208404, "epoch": 4962} {"train_loss": -7.251278400421143, "global_step": 208405, "epoch": 4962} {"train_loss": -7.09426212310791, "global_step": 208406, "epoch": 4962} {"train_loss": -7.119444847106934, "global_step": 208407, "epoch": 4962} {"train_loss": -7.172297477722168, "global_step": 208408, "epoch": 4962} {"train_loss": -7.2437591552734375, "global_step": 208409, "epoch": 4962} {"train_loss": -7.215994358062744, "global_step": 208410, "epoch": 4962} {"train_loss": -7.301752090454102, "global_step": 208411, "epoch": 4962} {"train_loss": -7.0603108406066895, "global_step": 208412, "epoch": 4962} {"train_loss": -7.320806503295898, "global_step": 208413, "epoch": 4962} {"train_loss": -7.252167224884033, "global_step": 208414, "epoch": 4962} {"train_loss": -7.304710388183594, "global_step": 208415, "epoch": 4962} {"train_loss": -7.278028964996338, "global_step": 208416, "epoch": 4962} {"train_loss": -7.2141618728637695, "global_step": 208417, "epoch": 4962} {"train_loss": -7.405289173126221, "global_step": 208418, "epoch": 4962} {"train_loss": -7.291443824768066, "global_step": 208419, "epoch": 4962} {"train_loss": -7.323838233947754, "global_step": 208420, "epoch": 4962} {"train_loss": -7.287456512451172, "global_step": 208421, "epoch": 4962} {"train_loss": -7.409367561340332, "global_step": 208422, "epoch": 4962} {"train_loss": -7.318889617919922, "global_step": 208423, "epoch": 4962} {"train_loss": -7.341867446899414, "global_step": 208424, "epoch": 4962} {"train_loss": -7.447329044342041, "global_step": 208425, "epoch": 4962} {"train_loss": -7.356712818145752, "global_step": 208426, "epoch": 4962} {"train_loss": -7.3599114418029785, "global_step": 208427, "epoch": 4962} {"train_loss": -7.419899940490723, "global_step": 208428, "epoch": 4962} {"train_loss": -7.374159336090088, "global_step": 208429, "epoch": 4962} {"train_loss": -7.357048034667969, "global_step": 208430, "epoch": 4962} {"train_loss": -7.359955787658691, "global_step": 208431, "epoch": 4962} {"train_loss": -7.503076553344727, "global_step": 208432, "epoch": 4962} {"train_loss": -7.402398586273193, "global_step": 208433, "epoch": 4962} {"train_loss": -7.393107891082764, "global_step": 208434, "epoch": 4962} {"train_loss": -7.467566013336182, "global_step": 208435, "epoch": 4962} {"train_loss": -7.333674430847168, "global_step": 208436, "epoch": 4962} {"train_loss": -7.380981922149658, "global_step": 208437, "epoch": 4962} {"train_loss": -7.419867515563965, "global_step": 208438, "epoch": 4962} {"train_loss": -7.3729023933410645, "global_step": 208439, "epoch": 4962} {"train_loss": -7.400409698486328, "global_step": 208440, "epoch": 4962} {"train_loss": -7.306568145751953, "global_step": 208441, "epoch": 4962} {"train_loss": -7.336627006530762, "global_step": 208442, "epoch": 4962} {"train_loss": -7.384936809539795, "global_step": 208443, "epoch": 4962} {"train_loss": -7.4333696365356445, "global_step": 208444, "epoch": 4962} {"train_loss": -7.323864221572876, "global_step": 208445, "epoch": 4962, "val_loss": 82087.828125} {"train_loss": -7.29305362701416, "global_step": 208446, "epoch": 4963} {"train_loss": -7.395833492279053, "global_step": 208447, "epoch": 4963} {"train_loss": -7.42696475982666, "global_step": 208448, "epoch": 4963} {"train_loss": -7.259451866149902, "global_step": 208449, "epoch": 4963} {"train_loss": -7.237520694732666, "global_step": 208450, "epoch": 4963} {"train_loss": -7.259376525878906, "global_step": 208451, "epoch": 4963} {"train_loss": -7.232048988342285, "global_step": 208452, "epoch": 4963} {"train_loss": -7.344771862030029, "global_step": 208453, "epoch": 4963} {"train_loss": -7.422905921936035, "global_step": 208454, "epoch": 4963} {"train_loss": -7.311546802520752, "global_step": 208455, "epoch": 4963} {"train_loss": -7.3124237060546875, "global_step": 208456, "epoch": 4963} {"train_loss": -7.2293596267700195, "global_step": 208457, "epoch": 4963} {"train_loss": -7.310471534729004, "global_step": 208458, "epoch": 4963} {"train_loss": -7.406532287597656, "global_step": 208459, "epoch": 4963} {"train_loss": -7.234749794006348, "global_step": 208460, "epoch": 4963} {"train_loss": -7.358397006988525, "global_step": 208461, "epoch": 4963} {"train_loss": -7.370846748352051, "global_step": 208462, "epoch": 4963} {"train_loss": -7.333185195922852, "global_step": 208463, "epoch": 4963} {"train_loss": -7.175069808959961, "global_step": 208464, "epoch": 4963} {"train_loss": -7.407361030578613, "global_step": 208465, "epoch": 4963} {"train_loss": -7.345198154449463, "global_step": 208466, "epoch": 4963} {"train_loss": -7.260838985443115, "global_step": 208467, "epoch": 4963} {"train_loss": -7.250252723693848, "global_step": 208468, "epoch": 4963} {"train_loss": -7.307670593261719, "global_step": 208469, "epoch": 4963} {"train_loss": -7.129910469055176, "global_step": 208470, "epoch": 4963} {"train_loss": -7.289289474487305, "global_step": 208471, "epoch": 4963} {"train_loss": -7.140599250793457, "global_step": 208472, "epoch": 4963} {"train_loss": -7.209738731384277, "global_step": 208473, "epoch": 4963} {"train_loss": -7.202568054199219, "global_step": 208474, "epoch": 4963} {"train_loss": -7.0740132331848145, "global_step": 208475, "epoch": 4963} {"train_loss": -7.159184455871582, "global_step": 208476, "epoch": 4963} {"train_loss": -7.05280876159668, "global_step": 208477, "epoch": 4963} {"train_loss": -7.188065528869629, "global_step": 208478, "epoch": 4963} {"train_loss": -7.115368843078613, "global_step": 208479, "epoch": 4963} {"train_loss": -7.134771347045898, "global_step": 208480, "epoch": 4963} {"train_loss": -7.092845916748047, "global_step": 208481, "epoch": 4963} {"train_loss": -7.073488235473633, "global_step": 208482, "epoch": 4963} {"train_loss": -7.29882287979126, "global_step": 208483, "epoch": 4963} {"train_loss": -7.06538200378418, "global_step": 208484, "epoch": 4963} {"train_loss": -7.230204105377197, "global_step": 208485, "epoch": 4963} {"train_loss": -7.069345474243164, "global_step": 208486, "epoch": 4963} {"train_loss": -7.243152005331857, "global_step": 208487, "epoch": 4963, "val_loss": 81623.71875} {"train_loss": -7.165863990783691, "global_step": 208488, "epoch": 4964} {"train_loss": -7.226919174194336, "global_step": 208489, "epoch": 4964} {"train_loss": -7.118066787719727, "global_step": 208490, "epoch": 4964} {"train_loss": -7.1838836669921875, "global_step": 208491, "epoch": 4964} {"train_loss": -7.235565185546875, "global_step": 208492, "epoch": 4964} {"train_loss": -7.126582145690918, "global_step": 208493, "epoch": 4964} {"train_loss": -7.22333288192749, "global_step": 208494, "epoch": 4964} {"train_loss": -7.037142753601074, "global_step": 208495, "epoch": 4964} {"train_loss": -7.213713645935059, "global_step": 208496, "epoch": 4964} {"train_loss": -7.177955627441406, "global_step": 208497, "epoch": 4964} {"train_loss": -7.314088821411133, "global_step": 208498, "epoch": 4964} {"train_loss": -7.224172592163086, "global_step": 208499, "epoch": 4964} {"train_loss": -7.306013107299805, "global_step": 208500, "epoch": 4964} {"train_loss": -7.2606120109558105, "global_step": 208501, "epoch": 4964} {"train_loss": -7.3606672286987305, "global_step": 208502, "epoch": 4964} {"train_loss": -7.266966819763184, "global_step": 208503, "epoch": 4964} {"train_loss": -7.293200969696045, "global_step": 208504, "epoch": 4964} {"train_loss": -7.361360549926758, "global_step": 208505, "epoch": 4964} {"train_loss": -7.315678596496582, "global_step": 208506, "epoch": 4964} {"train_loss": -7.372540473937988, "global_step": 208507, "epoch": 4964} {"train_loss": -7.337637424468994, "global_step": 208508, "epoch": 4964} {"train_loss": -7.299874305725098, "global_step": 208509, "epoch": 4964} {"train_loss": -7.388757705688477, "global_step": 208510, "epoch": 4964} {"train_loss": -7.352238655090332, "global_step": 208511, "epoch": 4964} {"train_loss": -7.369701385498047, "global_step": 208512, "epoch": 4964} {"train_loss": -7.316531181335449, "global_step": 208513, "epoch": 4964} {"train_loss": -7.410861968994141, "global_step": 208514, "epoch": 4964} {"train_loss": -7.3438310623168945, "global_step": 208515, "epoch": 4964} {"train_loss": -7.372796535491943, "global_step": 208516, "epoch": 4964} {"train_loss": -7.463037490844727, "global_step": 208517, "epoch": 4964} {"train_loss": -7.5375871658325195, "global_step": 208518, "epoch": 4964} {"train_loss": -7.513723373413086, "global_step": 208519, "epoch": 4964} {"train_loss": -7.47859525680542, "global_step": 208520, "epoch": 4964} {"train_loss": -7.396337032318115, "global_step": 208521, "epoch": 4964} {"train_loss": -7.382386207580566, "global_step": 208522, "epoch": 4964} {"train_loss": -7.4180755615234375, "global_step": 208523, "epoch": 4964} {"train_loss": -7.521777153015137, "global_step": 208524, "epoch": 4964} {"train_loss": -7.416563987731934, "global_step": 208525, "epoch": 4964} {"train_loss": -7.412902355194092, "global_step": 208526, "epoch": 4964} {"train_loss": -7.4990105628967285, "global_step": 208527, "epoch": 4964} {"train_loss": -7.467512607574463, "global_step": 208528, "epoch": 4964} {"train_loss": -7.331160340990339, "global_step": 208529, "epoch": 4964, "val_loss": 81860.265625} {"train_loss": -7.422236442565918, "global_step": 208530, "epoch": 4965} {"train_loss": -7.5330400466918945, "global_step": 208531, "epoch": 4965} {"train_loss": -7.337576866149902, "global_step": 208532, "epoch": 4965} {"train_loss": -7.332151412963867, "global_step": 208533, "epoch": 4965} {"train_loss": -7.487366676330566, "global_step": 208534, "epoch": 4965} {"train_loss": -7.222837924957275, "global_step": 208535, "epoch": 4965} {"train_loss": -7.320756912231445, "global_step": 208536, "epoch": 4965} {"train_loss": -7.27036190032959, "global_step": 208537, "epoch": 4965} {"train_loss": -7.152788162231445, "global_step": 208538, "epoch": 4965} {"train_loss": -7.404413223266602, "global_step": 208539, "epoch": 4965} {"train_loss": -7.371908187866211, "global_step": 208540, "epoch": 4965} {"train_loss": -7.291020393371582, "global_step": 208541, "epoch": 4965} {"train_loss": -7.321421146392822, "global_step": 208542, "epoch": 4965} {"train_loss": -7.2060980796813965, "global_step": 208543, "epoch": 4965} {"train_loss": -7.439303398132324, "global_step": 208544, "epoch": 4965} {"train_loss": -7.354281425476074, "global_step": 208545, "epoch": 4965} {"train_loss": -7.413707733154297, "global_step": 208546, "epoch": 4965} {"train_loss": -7.314699172973633, "global_step": 208547, "epoch": 4965} {"train_loss": -7.383748531341553, "global_step": 208548, "epoch": 4965} {"train_loss": -7.166308879852295, "global_step": 208549, "epoch": 4965} {"train_loss": -7.2453532218933105, "global_step": 208550, "epoch": 4965} {"train_loss": -7.346324443817139, "global_step": 208551, "epoch": 4965} {"train_loss": -7.268538475036621, "global_step": 208552, "epoch": 4965} {"train_loss": -7.2368855476379395, "global_step": 208553, "epoch": 4965} {"train_loss": -7.308189392089844, "global_step": 208554, "epoch": 4965} {"train_loss": -7.183200836181641, "global_step": 208555, "epoch": 4965} {"train_loss": -7.272184371948242, "global_step": 208556, "epoch": 4965} {"train_loss": -7.211580276489258, "global_step": 208557, "epoch": 4965} {"train_loss": -7.213812828063965, "global_step": 208558, "epoch": 4965} {"train_loss": -7.3033976554870605, "global_step": 208559, "epoch": 4965} {"train_loss": -7.288283348083496, "global_step": 208560, "epoch": 4965} {"train_loss": -7.308280944824219, "global_step": 208561, "epoch": 4965} {"train_loss": -7.4057817459106445, "global_step": 208562, "epoch": 4965} {"train_loss": -7.3564276695251465, "global_step": 208563, "epoch": 4965} {"train_loss": -7.326685428619385, "global_step": 208564, "epoch": 4965} {"train_loss": -7.288313865661621, "global_step": 208565, "epoch": 4965} {"train_loss": -7.278122901916504, "global_step": 208566, "epoch": 4965} {"train_loss": -7.382400989532471, "global_step": 208567, "epoch": 4965} {"train_loss": -7.394472122192383, "global_step": 208568, "epoch": 4965} {"train_loss": -7.480866432189941, "global_step": 208569, "epoch": 4965} {"train_loss": -7.207966327667236, "global_step": 208570, "epoch": 4965} {"train_loss": -7.317114285060337, "global_step": 208571, "epoch": 4965, "val_loss": 81969.6875} {"train_loss": -7.358860969543457, "global_step": 208572, "epoch": 4966} {"train_loss": -7.312058448791504, "global_step": 208573, "epoch": 4966} {"train_loss": -7.375421524047852, "global_step": 208574, "epoch": 4966} {"train_loss": -7.331515312194824, "global_step": 208575, "epoch": 4966} {"train_loss": -7.262939453125, "global_step": 208576, "epoch": 4966} {"train_loss": -7.415482044219971, "global_step": 208577, "epoch": 4966} {"train_loss": -7.411290168762207, "global_step": 208578, "epoch": 4966} {"train_loss": -7.3619303703308105, "global_step": 208579, "epoch": 4966} {"train_loss": -7.326481819152832, "global_step": 208580, "epoch": 4966} {"train_loss": -7.316555023193359, "global_step": 208581, "epoch": 4966} {"train_loss": -7.346528053283691, "global_step": 208582, "epoch": 4966} {"train_loss": -7.37123966217041, "global_step": 208583, "epoch": 4966} {"train_loss": -7.201358795166016, "global_step": 208584, "epoch": 4966} {"train_loss": -7.281113624572754, "global_step": 208585, "epoch": 4966} {"train_loss": -7.385504722595215, "global_step": 208586, "epoch": 4966} {"train_loss": -7.282276630401611, "global_step": 208587, "epoch": 4966} {"train_loss": -7.274255752563477, "global_step": 208588, "epoch": 4966} {"train_loss": -7.402500152587891, "global_step": 208589, "epoch": 4966} {"train_loss": -7.361323356628418, "global_step": 208590, "epoch": 4966} {"train_loss": -7.327886581420898, "global_step": 208591, "epoch": 4966} {"train_loss": -7.3353352546691895, "global_step": 208592, "epoch": 4966} {"train_loss": -7.359477996826172, "global_step": 208593, "epoch": 4966} {"train_loss": -7.303232192993164, "global_step": 208594, "epoch": 4966} {"train_loss": -7.532291412353516, "global_step": 208595, "epoch": 4966} {"train_loss": -7.318710803985596, "global_step": 208596, "epoch": 4966} {"train_loss": -7.322563648223877, "global_step": 208597, "epoch": 4966} {"train_loss": -7.4506940841674805, "global_step": 208598, "epoch": 4966} {"train_loss": -7.419888496398926, "global_step": 208599, "epoch": 4966} {"train_loss": -7.425026893615723, "global_step": 208600, "epoch": 4966} {"train_loss": -7.374902725219727, "global_step": 208601, "epoch": 4966} {"train_loss": -7.406888961791992, "global_step": 208602, "epoch": 4966} {"train_loss": -7.318502426147461, "global_step": 208603, "epoch": 4966} {"train_loss": -7.534399032592773, "global_step": 208604, "epoch": 4966} {"train_loss": -7.272891998291016, "global_step": 208605, "epoch": 4966} {"train_loss": -7.291952133178711, "global_step": 208606, "epoch": 4966} {"train_loss": -7.408160209655762, "global_step": 208607, "epoch": 4966} {"train_loss": -7.293529033660889, "global_step": 208608, "epoch": 4966} {"train_loss": -7.3415632247924805, "global_step": 208609, "epoch": 4966} {"train_loss": -7.354616165161133, "global_step": 208610, "epoch": 4966} {"train_loss": -7.249251365661621, "global_step": 208611, "epoch": 4966} {"train_loss": -7.372405529022217, "global_step": 208612, "epoch": 4966} {"train_loss": -7.355252583821614, "global_step": 208613, "epoch": 4966, "val_loss": 81998.375} {"train_loss": -7.40616512298584, "global_step": 208614, "epoch": 4967} {"train_loss": -7.384212017059326, "global_step": 208615, "epoch": 4967} {"train_loss": -7.463703155517578, "global_step": 208616, "epoch": 4967} {"train_loss": -7.368501663208008, "global_step": 208617, "epoch": 4967} {"train_loss": -7.262521743774414, "global_step": 208618, "epoch": 4967} {"train_loss": -7.39756965637207, "global_step": 208619, "epoch": 4967} {"train_loss": -7.463942527770996, "global_step": 208620, "epoch": 4967} {"train_loss": -7.352256774902344, "global_step": 208621, "epoch": 4967} {"train_loss": -7.45933198928833, "global_step": 208622, "epoch": 4967} {"train_loss": -7.31596040725708, "global_step": 208623, "epoch": 4967} {"train_loss": -7.615666389465332, "global_step": 208624, "epoch": 4967} {"train_loss": -7.45847749710083, "global_step": 208625, "epoch": 4967} {"train_loss": -7.442807197570801, "global_step": 208626, "epoch": 4967} {"train_loss": -7.482856750488281, "global_step": 208627, "epoch": 4967} {"train_loss": -7.461099624633789, "global_step": 208628, "epoch": 4967} {"train_loss": -7.370981693267822, "global_step": 208629, "epoch": 4967} {"train_loss": -7.451271057128906, "global_step": 208630, "epoch": 4967} {"train_loss": -7.471523284912109, "global_step": 208631, "epoch": 4967} {"train_loss": -7.334146022796631, "global_step": 208632, "epoch": 4967} {"train_loss": -7.487514495849609, "global_step": 208633, "epoch": 4967} {"train_loss": -7.448642730712891, "global_step": 208634, "epoch": 4967} {"train_loss": -7.341905117034912, "global_step": 208635, "epoch": 4967} {"train_loss": -7.401589393615723, "global_step": 208636, "epoch": 4967} {"train_loss": -7.440845489501953, "global_step": 208637, "epoch": 4967} {"train_loss": -7.440969467163086, "global_step": 208638, "epoch": 4967} {"train_loss": -7.255521774291992, "global_step": 208639, "epoch": 4967} {"train_loss": -7.40037202835083, "global_step": 208640, "epoch": 4967} {"train_loss": -7.357542037963867, "global_step": 208641, "epoch": 4967} {"train_loss": -7.258099555969238, "global_step": 208642, "epoch": 4967} {"train_loss": -7.2682037353515625, "global_step": 208643, "epoch": 4967} {"train_loss": -7.314432144165039, "global_step": 208644, "epoch": 4967} {"train_loss": -7.293130874633789, "global_step": 208645, "epoch": 4967} {"train_loss": -7.344813823699951, "global_step": 208646, "epoch": 4967} {"train_loss": -7.288416862487793, "global_step": 208647, "epoch": 4967} {"train_loss": -7.377488136291504, "global_step": 208648, "epoch": 4967} {"train_loss": -7.231249809265137, "global_step": 208649, "epoch": 4967} {"train_loss": -7.319484710693359, "global_step": 208650, "epoch": 4967} {"train_loss": -7.334840297698975, "global_step": 208651, "epoch": 4967} {"train_loss": -7.320923328399658, "global_step": 208652, "epoch": 4967} {"train_loss": -7.332563400268555, "global_step": 208653, "epoch": 4967} {"train_loss": -7.319392204284668, "global_step": 208654, "epoch": 4967} {"train_loss": -7.378347351437523, "global_step": 208655, "epoch": 4967, "val_loss": 82000.453125} {"train_loss": -7.4094414710998535, "global_step": 208656, "epoch": 4968} {"train_loss": -7.395580768585205, "global_step": 208657, "epoch": 4968} {"train_loss": -7.382009506225586, "global_step": 208658, "epoch": 4968} {"train_loss": -7.350320816040039, "global_step": 208659, "epoch": 4968} {"train_loss": -7.279928207397461, "global_step": 208660, "epoch": 4968} {"train_loss": -7.286657333374023, "global_step": 208661, "epoch": 4968} {"train_loss": -7.488472938537598, "global_step": 208662, "epoch": 4968} {"train_loss": -7.351713180541992, "global_step": 208663, "epoch": 4968} {"train_loss": -7.31641960144043, "global_step": 208664, "epoch": 4968} {"train_loss": -7.4827470779418945, "global_step": 208665, "epoch": 4968} {"train_loss": -7.441084384918213, "global_step": 208666, "epoch": 4968} {"train_loss": -7.426004886627197, "global_step": 208667, "epoch": 4968} {"train_loss": -7.359477996826172, "global_step": 208668, "epoch": 4968} {"train_loss": -7.171197414398193, "global_step": 208669, "epoch": 4968} {"train_loss": -7.253793716430664, "global_step": 208670, "epoch": 4968} {"train_loss": -7.285853862762451, "global_step": 208671, "epoch": 4968} {"train_loss": -7.236042022705078, "global_step": 208672, "epoch": 4968} {"train_loss": -7.312353134155273, "global_step": 208673, "epoch": 4968} {"train_loss": -7.237923622131348, "global_step": 208674, "epoch": 4968} {"train_loss": -7.227449417114258, "global_step": 208675, "epoch": 4968} {"train_loss": -7.354837417602539, "global_step": 208676, "epoch": 4968} {"train_loss": -7.229353904724121, "global_step": 208677, "epoch": 4968} {"train_loss": -7.216462135314941, "global_step": 208678, "epoch": 4968} {"train_loss": -7.373699188232422, "global_step": 208679, "epoch": 4968} {"train_loss": -7.185559272766113, "global_step": 208680, "epoch": 4968} {"train_loss": -7.404274940490723, "global_step": 208681, "epoch": 4968} {"train_loss": -7.252269744873047, "global_step": 208682, "epoch": 4968} {"train_loss": -7.30176305770874, "global_step": 208683, "epoch": 4968} {"train_loss": -7.308531761169434, "global_step": 208684, "epoch": 4968} {"train_loss": -7.33510684967041, "global_step": 208685, "epoch": 4968} {"train_loss": -7.245401382446289, "global_step": 208686, "epoch": 4968} {"train_loss": -7.211504936218262, "global_step": 208687, "epoch": 4968} {"train_loss": -7.337296485900879, "global_step": 208688, "epoch": 4968} {"train_loss": -7.302041530609131, "global_step": 208689, "epoch": 4968} {"train_loss": -7.221149444580078, "global_step": 208690, "epoch": 4968} {"train_loss": -7.1645402908325195, "global_step": 208691, "epoch": 4968} {"train_loss": -7.198383808135986, "global_step": 208692, "epoch": 4968} {"train_loss": -7.149405002593994, "global_step": 208693, "epoch": 4968} {"train_loss": -7.282625198364258, "global_step": 208694, "epoch": 4968} {"train_loss": -7.01026725769043, "global_step": 208695, "epoch": 4968} {"train_loss": -7.135281085968018, "global_step": 208696, "epoch": 4968} {"train_loss": -7.290019375937326, "global_step": 208697, "epoch": 4968, "val_loss": 81920.359375} {"train_loss": -7.15962028503418, "global_step": 208698, "epoch": 4969} {"train_loss": -7.260259628295898, "global_step": 208699, "epoch": 4969} {"train_loss": -7.143167495727539, "global_step": 208700, "epoch": 4969} {"train_loss": -7.113663673400879, "global_step": 208701, "epoch": 4969} {"train_loss": -7.221835136413574, "global_step": 208702, "epoch": 4969} {"train_loss": -7.048208713531494, "global_step": 208703, "epoch": 4969} {"train_loss": -7.254327774047852, "global_step": 208704, "epoch": 4969} {"train_loss": -7.258320331573486, "global_step": 208705, "epoch": 4969} {"train_loss": -7.222855567932129, "global_step": 208706, "epoch": 4969} {"train_loss": -7.304566860198975, "global_step": 208707, "epoch": 4969} {"train_loss": -7.193808555603027, "global_step": 208708, "epoch": 4969} {"train_loss": -7.219331741333008, "global_step": 208709, "epoch": 4969} {"train_loss": -7.17525577545166, "global_step": 208710, "epoch": 4969} {"train_loss": -7.336236953735352, "global_step": 208711, "epoch": 4969} {"train_loss": -7.097303867340088, "global_step": 208712, "epoch": 4969} {"train_loss": -7.298187255859375, "global_step": 208713, "epoch": 4969} {"train_loss": -7.27845573425293, "global_step": 208714, "epoch": 4969} {"train_loss": -7.273999214172363, "global_step": 208715, "epoch": 4969} {"train_loss": -7.320955276489258, "global_step": 208716, "epoch": 4969} {"train_loss": -7.369874000549316, "global_step": 208717, "epoch": 4969} {"train_loss": -7.271791458129883, "global_step": 208718, "epoch": 4969} {"train_loss": -7.289037227630615, "global_step": 208719, "epoch": 4969} {"train_loss": -7.2935638427734375, "global_step": 208720, "epoch": 4969} {"train_loss": -7.392372131347656, "global_step": 208721, "epoch": 4969} {"train_loss": -7.341800689697266, "global_step": 208722, "epoch": 4969} {"train_loss": -7.273201942443848, "global_step": 208723, "epoch": 4969} {"train_loss": -7.3301849365234375, "global_step": 208724, "epoch": 4969} {"train_loss": -7.320255756378174, "global_step": 208725, "epoch": 4969} {"train_loss": -7.328317642211914, "global_step": 208726, "epoch": 4969} {"train_loss": -7.262956619262695, "global_step": 208727, "epoch": 4969} {"train_loss": -7.344423770904541, "global_step": 208728, "epoch": 4969} {"train_loss": -7.345947742462158, "global_step": 208729, "epoch": 4969} {"train_loss": -7.53839111328125, "global_step": 208730, "epoch": 4969} {"train_loss": -7.40054988861084, "global_step": 208731, "epoch": 4969} {"train_loss": -7.2982072830200195, "global_step": 208732, "epoch": 4969} {"train_loss": -7.3169755935668945, "global_step": 208733, "epoch": 4969} {"train_loss": -7.469429969787598, "global_step": 208734, "epoch": 4969} {"train_loss": -7.4591593742370605, "global_step": 208735, "epoch": 4969} {"train_loss": -7.336619853973389, "global_step": 208736, "epoch": 4969} {"train_loss": -7.361364841461182, "global_step": 208737, "epoch": 4969} {"train_loss": -7.331892013549805, "global_step": 208738, "epoch": 4969} {"train_loss": -7.290590411140805, "global_step": 208739, "epoch": 4969, "val_loss": 82001.984375} {"train_loss": -7.338645935058594, "global_step": 208740, "epoch": 4970} {"train_loss": -7.477916717529297, "global_step": 208741, "epoch": 4970} {"train_loss": -7.436724662780762, "global_step": 208742, "epoch": 4970} {"train_loss": -7.352884292602539, "global_step": 208743, "epoch": 4970} {"train_loss": -7.3654961585998535, "global_step": 208744, "epoch": 4970} {"train_loss": -7.363545894622803, "global_step": 208745, "epoch": 4970} {"train_loss": -7.447864532470703, "global_step": 208746, "epoch": 4970} {"train_loss": -7.2240376472473145, "global_step": 208747, "epoch": 4970} {"train_loss": -7.461805820465088, "global_step": 208748, "epoch": 4970} {"train_loss": -7.437906265258789, "global_step": 208749, "epoch": 4970} {"train_loss": -7.3360819816589355, "global_step": 208750, "epoch": 4970} {"train_loss": -7.274456024169922, "global_step": 208751, "epoch": 4970} {"train_loss": -7.218268871307373, "global_step": 208752, "epoch": 4970} {"train_loss": -7.260725021362305, "global_step": 208753, "epoch": 4970} {"train_loss": -7.293444633483887, "global_step": 208754, "epoch": 4970} {"train_loss": -7.234838008880615, "global_step": 208755, "epoch": 4970} {"train_loss": -7.32952880859375, "global_step": 208756, "epoch": 4970} {"train_loss": -7.256190299987793, "global_step": 208757, "epoch": 4970} {"train_loss": -7.334199905395508, "global_step": 208758, "epoch": 4970} {"train_loss": -7.256412029266357, "global_step": 208759, "epoch": 4970} {"train_loss": -7.325896263122559, "global_step": 208760, "epoch": 4970} {"train_loss": -7.351844310760498, "global_step": 208761, "epoch": 4970} {"train_loss": -7.368699073791504, "global_step": 208762, "epoch": 4970} {"train_loss": -7.16851282119751, "global_step": 208763, "epoch": 4970} {"train_loss": -7.310586929321289, "global_step": 208764, "epoch": 4970} {"train_loss": -7.317770957946777, "global_step": 208765, "epoch": 4970} {"train_loss": -7.197122573852539, "global_step": 208766, "epoch": 4970} {"train_loss": -7.2529296875, "global_step": 208767, "epoch": 4970} {"train_loss": -7.296820640563965, "global_step": 208768, "epoch": 4970} {"train_loss": -7.2867889404296875, "global_step": 208769, "epoch": 4970} {"train_loss": -7.373741626739502, "global_step": 208770, "epoch": 4970} {"train_loss": -7.40789270401001, "global_step": 208771, "epoch": 4970} {"train_loss": -7.408745288848877, "global_step": 208772, "epoch": 4970} {"train_loss": -7.400935649871826, "global_step": 208773, "epoch": 4970} {"train_loss": -7.337522506713867, "global_step": 208774, "epoch": 4970} {"train_loss": -7.181692123413086, "global_step": 208775, "epoch": 4970} {"train_loss": -7.31908655166626, "global_step": 208776, "epoch": 4970} {"train_loss": -7.305070877075195, "global_step": 208777, "epoch": 4970} {"train_loss": -7.480099201202393, "global_step": 208778, "epoch": 4970} {"train_loss": -7.265181541442871, "global_step": 208779, "epoch": 4970} {"train_loss": -7.226374626159668, "global_step": 208780, "epoch": 4970} {"train_loss": -7.325941710245042, "global_step": 208781, "epoch": 4970, "val_loss": 81932.765625} {"train_loss": -7.431718349456787, "global_step": 208782, "epoch": 4971} {"train_loss": -7.254934310913086, "global_step": 208783, "epoch": 4971} {"train_loss": -7.231877326965332, "global_step": 208784, "epoch": 4971} {"train_loss": -7.371054172515869, "global_step": 208785, "epoch": 4971} {"train_loss": -7.347650527954102, "global_step": 208786, "epoch": 4971} {"train_loss": -7.424664497375488, "global_step": 208787, "epoch": 4971} {"train_loss": -7.345422744750977, "global_step": 208788, "epoch": 4971} {"train_loss": -7.386369705200195, "global_step": 208789, "epoch": 4971} {"train_loss": -7.288341522216797, "global_step": 208790, "epoch": 4971} {"train_loss": -7.299712181091309, "global_step": 208791, "epoch": 4971} {"train_loss": -7.279243469238281, "global_step": 208792, "epoch": 4971} {"train_loss": -7.3567094802856445, "global_step": 208793, "epoch": 4971} {"train_loss": -7.272428512573242, "global_step": 208794, "epoch": 4971} {"train_loss": -7.342235565185547, "global_step": 208795, "epoch": 4971} {"train_loss": -7.320603370666504, "global_step": 208796, "epoch": 4971} {"train_loss": -7.285757064819336, "global_step": 208797, "epoch": 4971} {"train_loss": -7.437268257141113, "global_step": 208798, "epoch": 4971} {"train_loss": -7.407837867736816, "global_step": 208799, "epoch": 4971} {"train_loss": -7.346518516540527, "global_step": 208800, "epoch": 4971} {"train_loss": -7.399541854858398, "global_step": 208801, "epoch": 4971} {"train_loss": -7.325443267822266, "global_step": 208802, "epoch": 4971} {"train_loss": -7.279124736785889, "global_step": 208803, "epoch": 4971} {"train_loss": -7.507268905639648, "global_step": 208804, "epoch": 4971} {"train_loss": -7.390618801116943, "global_step": 208805, "epoch": 4971} {"train_loss": -7.359848976135254, "global_step": 208806, "epoch": 4971} {"train_loss": -7.376648902893066, "global_step": 208807, "epoch": 4971} {"train_loss": -7.3443498611450195, "global_step": 208808, "epoch": 4971} {"train_loss": -7.36167049407959, "global_step": 208809, "epoch": 4971} {"train_loss": -7.472834587097168, "global_step": 208810, "epoch": 4971} {"train_loss": -7.364656448364258, "global_step": 208811, "epoch": 4971} {"train_loss": -7.404414176940918, "global_step": 208812, "epoch": 4971} {"train_loss": -7.405113220214844, "global_step": 208813, "epoch": 4971} {"train_loss": -7.403216361999512, "global_step": 208814, "epoch": 4971} {"train_loss": -7.3284406661987305, "global_step": 208815, "epoch": 4971} {"train_loss": -7.4393415451049805, "global_step": 208816, "epoch": 4971} {"train_loss": -7.313261032104492, "global_step": 208817, "epoch": 4971} {"train_loss": -7.27855920791626, "global_step": 208818, "epoch": 4971} {"train_loss": -7.427680969238281, "global_step": 208819, "epoch": 4971} {"train_loss": -7.323735237121582, "global_step": 208820, "epoch": 4971} {"train_loss": -7.302097320556641, "global_step": 208821, "epoch": 4971} {"train_loss": -7.419981002807617, "global_step": 208822, "epoch": 4971} {"train_loss": -7.3567563238598055, "global_step": 208823, "epoch": 4971, "val_loss": 81987.0546875} {"train_loss": -7.378053188323975, "global_step": 208824, "epoch": 4972} {"train_loss": -7.398416519165039, "global_step": 208825, "epoch": 4972} {"train_loss": -7.2352752685546875, "global_step": 208826, "epoch": 4972} {"train_loss": -7.30881929397583, "global_step": 208827, "epoch": 4972} {"train_loss": -7.329441070556641, "global_step": 208828, "epoch": 4972} {"train_loss": -7.3234357833862305, "global_step": 208829, "epoch": 4972} {"train_loss": -7.342024326324463, "global_step": 208830, "epoch": 4972} {"train_loss": -7.456812858581543, "global_step": 208831, "epoch": 4972} {"train_loss": -7.3718767166137695, "global_step": 208832, "epoch": 4972} {"train_loss": -7.357119560241699, "global_step": 208833, "epoch": 4972} {"train_loss": -7.482200622558594, "global_step": 208834, "epoch": 4972} {"train_loss": -7.282201766967773, "global_step": 208835, "epoch": 4972} {"train_loss": -7.409945487976074, "global_step": 208836, "epoch": 4972} {"train_loss": -7.4800262451171875, "global_step": 208837, "epoch": 4972} {"train_loss": -7.273439407348633, "global_step": 208838, "epoch": 4972} {"train_loss": -7.366572380065918, "global_step": 208839, "epoch": 4972} {"train_loss": -7.404270172119141, "global_step": 208840, "epoch": 4972} {"train_loss": -7.3654561042785645, "global_step": 208841, "epoch": 4972} {"train_loss": -7.376246452331543, "global_step": 208842, "epoch": 4972} {"train_loss": -7.4499430656433105, "global_step": 208843, "epoch": 4972} {"train_loss": -7.474684715270996, "global_step": 208844, "epoch": 4972} {"train_loss": -7.436306953430176, "global_step": 208845, "epoch": 4972} {"train_loss": -7.366809368133545, "global_step": 208846, "epoch": 4972} {"train_loss": -7.446110725402832, "global_step": 208847, "epoch": 4972} {"train_loss": -7.291272163391113, "global_step": 208848, "epoch": 4972} {"train_loss": -7.4571919441223145, "global_step": 208849, "epoch": 4972} {"train_loss": -7.464491367340088, "global_step": 208850, "epoch": 4972} {"train_loss": -7.396533966064453, "global_step": 208851, "epoch": 4972} {"train_loss": -7.390255451202393, "global_step": 208852, "epoch": 4972} {"train_loss": -7.2815446853637695, "global_step": 208853, "epoch": 4972} {"train_loss": -7.260969161987305, "global_step": 208854, "epoch": 4972} {"train_loss": -7.457781791687012, "global_step": 208855, "epoch": 4972} {"train_loss": -7.421147346496582, "global_step": 208856, "epoch": 4972} {"train_loss": -7.390145301818848, "global_step": 208857, "epoch": 4972} {"train_loss": -7.306424140930176, "global_step": 208858, "epoch": 4972} {"train_loss": -7.294358253479004, "global_step": 208859, "epoch": 4972} {"train_loss": -7.461605072021484, "global_step": 208860, "epoch": 4972} {"train_loss": -7.268001556396484, "global_step": 208861, "epoch": 4972} {"train_loss": -7.319491386413574, "global_step": 208862, "epoch": 4972} {"train_loss": -7.488746643066406, "global_step": 208863, "epoch": 4972} {"train_loss": -7.32631778717041, "global_step": 208864, "epoch": 4972} {"train_loss": -7.375916481018066, "global_step": 208865, "epoch": 4972, "val_loss": 81985.921875} {"train_loss": -7.253147125244141, "global_step": 208866, "epoch": 4973} {"train_loss": -7.371830940246582, "global_step": 208867, "epoch": 4973} {"train_loss": -7.368462562561035, "global_step": 208868, "epoch": 4973} {"train_loss": -7.424528121948242, "global_step": 208869, "epoch": 4973} {"train_loss": -7.427542686462402, "global_step": 208870, "epoch": 4973} {"train_loss": -7.362316131591797, "global_step": 208871, "epoch": 4973} {"train_loss": -7.407121658325195, "global_step": 208872, "epoch": 4973} {"train_loss": -7.525588035583496, "global_step": 208873, "epoch": 4973} {"train_loss": -7.365673542022705, "global_step": 208874, "epoch": 4973} {"train_loss": -7.383123874664307, "global_step": 208875, "epoch": 4973} {"train_loss": -7.443537712097168, "global_step": 208876, "epoch": 4973} {"train_loss": -7.480491638183594, "global_step": 208877, "epoch": 4973} {"train_loss": -7.416341781616211, "global_step": 208878, "epoch": 4973} {"train_loss": -7.35078239440918, "global_step": 208879, "epoch": 4973} {"train_loss": -7.477831840515137, "global_step": 208880, "epoch": 4973} {"train_loss": -7.405961036682129, "global_step": 208881, "epoch": 4973} {"train_loss": -7.404256343841553, "global_step": 208882, "epoch": 4973} {"train_loss": -7.292884349822998, "global_step": 208883, "epoch": 4973} {"train_loss": -7.233499526977539, "global_step": 208884, "epoch": 4973} {"train_loss": -7.448191165924072, "global_step": 208885, "epoch": 4973} {"train_loss": -7.318241596221924, "global_step": 208886, "epoch": 4973} {"train_loss": -7.297542572021484, "global_step": 208887, "epoch": 4973} {"train_loss": -7.4052839279174805, "global_step": 208888, "epoch": 4973} {"train_loss": -7.390209674835205, "global_step": 208889, "epoch": 4973} {"train_loss": -7.372664928436279, "global_step": 208890, "epoch": 4973} {"train_loss": -7.439289569854736, "global_step": 208891, "epoch": 4973} {"train_loss": -7.298789024353027, "global_step": 208892, "epoch": 4973} {"train_loss": -7.382920265197754, "global_step": 208893, "epoch": 4973} {"train_loss": -7.311257362365723, "global_step": 208894, "epoch": 4973} {"train_loss": -7.293900489807129, "global_step": 208895, "epoch": 4973} {"train_loss": -7.3769097328186035, "global_step": 208896, "epoch": 4973} {"train_loss": -7.311201572418213, "global_step": 208897, "epoch": 4973} {"train_loss": -7.360261917114258, "global_step": 208898, "epoch": 4973} {"train_loss": -7.428731918334961, "global_step": 208899, "epoch": 4973} {"train_loss": -7.325322151184082, "global_step": 208900, "epoch": 4973} {"train_loss": -7.216943740844727, "global_step": 208901, "epoch": 4973} {"train_loss": -7.299416542053223, "global_step": 208902, "epoch": 4973} {"train_loss": -7.408508777618408, "global_step": 208903, "epoch": 4973} {"train_loss": -7.3974409103393555, "global_step": 208904, "epoch": 4973} {"train_loss": -7.380285739898682, "global_step": 208905, "epoch": 4973} {"train_loss": -7.317681789398193, "global_step": 208906, "epoch": 4973} {"train_loss": -7.370012464977446, "global_step": 208907, "epoch": 4973, "val_loss": 82168.3125} {"train_loss": -7.365965366363525, "global_step": 208908, "epoch": 4974} {"train_loss": -7.246364116668701, "global_step": 208909, "epoch": 4974} {"train_loss": -7.321906566619873, "global_step": 208910, "epoch": 4974} {"train_loss": -7.360445976257324, "global_step": 208911, "epoch": 4974} {"train_loss": -7.277153015136719, "global_step": 208912, "epoch": 4974} {"train_loss": -7.264186859130859, "global_step": 208913, "epoch": 4974} {"train_loss": -7.336286544799805, "global_step": 208914, "epoch": 4974} {"train_loss": -7.299691200256348, "global_step": 208915, "epoch": 4974} {"train_loss": -7.101223945617676, "global_step": 208916, "epoch": 4974} {"train_loss": -7.3476362228393555, "global_step": 208917, "epoch": 4974} {"train_loss": -7.398413181304932, "global_step": 208918, "epoch": 4974} {"train_loss": -7.324112892150879, "global_step": 208919, "epoch": 4974} {"train_loss": -7.3259501457214355, "global_step": 208920, "epoch": 4974} {"train_loss": -7.343662261962891, "global_step": 208921, "epoch": 4974} {"train_loss": -7.2950439453125, "global_step": 208922, "epoch": 4974} {"train_loss": -7.399951934814453, "global_step": 208923, "epoch": 4974} {"train_loss": -7.397612571716309, "global_step": 208924, "epoch": 4974} {"train_loss": -7.437211036682129, "global_step": 208925, "epoch": 4974} {"train_loss": -7.29820442199707, "global_step": 208926, "epoch": 4974} {"train_loss": -7.333556652069092, "global_step": 208927, "epoch": 4974} {"train_loss": -7.233236789703369, "global_step": 208928, "epoch": 4974} {"train_loss": -7.305093288421631, "global_step": 208929, "epoch": 4974} {"train_loss": -7.399346351623535, "global_step": 208930, "epoch": 4974} {"train_loss": -7.273232460021973, "global_step": 208931, "epoch": 4974} {"train_loss": -7.41359806060791, "global_step": 208932, "epoch": 4974} {"train_loss": -7.383937835693359, "global_step": 208933, "epoch": 4974} {"train_loss": -7.346762180328369, "global_step": 208934, "epoch": 4974} {"train_loss": -7.415400981903076, "global_step": 208935, "epoch": 4974} {"train_loss": -7.520090103149414, "global_step": 208936, "epoch": 4974} {"train_loss": -7.390303134918213, "global_step": 208937, "epoch": 4974} {"train_loss": -7.353005409240723, "global_step": 208938, "epoch": 4974} {"train_loss": -7.4539971351623535, "global_step": 208939, "epoch": 4974} {"train_loss": -7.240825653076172, "global_step": 208940, "epoch": 4974} {"train_loss": -7.3704071044921875, "global_step": 208941, "epoch": 4974} {"train_loss": -7.269023895263672, "global_step": 208942, "epoch": 4974} {"train_loss": -7.442127704620361, "global_step": 208943, "epoch": 4974} {"train_loss": -7.422033786773682, "global_step": 208944, "epoch": 4974} {"train_loss": -7.455160140991211, "global_step": 208945, "epoch": 4974} {"train_loss": -7.3647356033325195, "global_step": 208946, "epoch": 4974} {"train_loss": -7.286031723022461, "global_step": 208947, "epoch": 4974} {"train_loss": -7.454769134521484, "global_step": 208948, "epoch": 4974} {"train_loss": -7.349254426502046, "global_step": 208949, "epoch": 4974, "val_loss": 82012.9921875} {"train_loss": -7.443416118621826, "global_step": 208950, "epoch": 4975} {"train_loss": -7.380121231079102, "global_step": 208951, "epoch": 4975} {"train_loss": -7.348649024963379, "global_step": 208952, "epoch": 4975} {"train_loss": -7.337563991546631, "global_step": 208953, "epoch": 4975} {"train_loss": -7.35294771194458, "global_step": 208954, "epoch": 4975} {"train_loss": -7.3236083984375, "global_step": 208955, "epoch": 4975} {"train_loss": -7.434981346130371, "global_step": 208956, "epoch": 4975} {"train_loss": -7.419630527496338, "global_step": 208957, "epoch": 4975} {"train_loss": -7.352426528930664, "global_step": 208958, "epoch": 4975} {"train_loss": -7.32550048828125, "global_step": 208959, "epoch": 4975} {"train_loss": -7.410536766052246, "global_step": 208960, "epoch": 4975} {"train_loss": -7.406132221221924, "global_step": 208961, "epoch": 4975} {"train_loss": -7.418102741241455, "global_step": 208962, "epoch": 4975} {"train_loss": -7.212887763977051, "global_step": 208963, "epoch": 4975} {"train_loss": -7.264407157897949, "global_step": 208964, "epoch": 4975} {"train_loss": -7.29306697845459, "global_step": 208965, "epoch": 4975} {"train_loss": -7.26057243347168, "global_step": 208966, "epoch": 4975} {"train_loss": -7.396725654602051, "global_step": 208967, "epoch": 4975} {"train_loss": -7.235103607177734, "global_step": 208968, "epoch": 4975} {"train_loss": -7.281558990478516, "global_step": 208969, "epoch": 4975} {"train_loss": -7.367941379547119, "global_step": 208970, "epoch": 4975} {"train_loss": -7.226562023162842, "global_step": 208971, "epoch": 4975} {"train_loss": -7.356241226196289, "global_step": 208972, "epoch": 4975} {"train_loss": -7.092341423034668, "global_step": 208973, "epoch": 4975} {"train_loss": -7.179041385650635, "global_step": 208974, "epoch": 4975} {"train_loss": -7.2729082107543945, "global_step": 208975, "epoch": 4975} {"train_loss": -7.463329315185547, "global_step": 208976, "epoch": 4975} {"train_loss": -7.271862030029297, "global_step": 208977, "epoch": 4975} {"train_loss": -7.205616474151611, "global_step": 208978, "epoch": 4975} {"train_loss": -7.328932762145996, "global_step": 208979, "epoch": 4975} {"train_loss": -7.216386318206787, "global_step": 208980, "epoch": 4975} {"train_loss": -7.342741012573242, "global_step": 208981, "epoch": 4975} {"train_loss": -7.216455936431885, "global_step": 208982, "epoch": 4975} {"train_loss": -7.323904991149902, "global_step": 208983, "epoch": 4975} {"train_loss": -7.353748321533203, "global_step": 208984, "epoch": 4975} {"train_loss": -7.346983909606934, "global_step": 208985, "epoch": 4975} {"train_loss": -7.359086990356445, "global_step": 208986, "epoch": 4975} {"train_loss": -7.315116882324219, "global_step": 208987, "epoch": 4975} {"train_loss": -7.401251792907715, "global_step": 208988, "epoch": 4975} {"train_loss": -7.345080375671387, "global_step": 208989, "epoch": 4975} {"train_loss": -7.225266933441162, "global_step": 208990, "epoch": 4975} {"train_loss": -7.320299602690197, "global_step": 208991, "epoch": 4975, "val_loss": 82278.4609375} {"train_loss": -7.266071796417236, "global_step": 208992, "epoch": 4976} {"train_loss": -7.359377861022949, "global_step": 208993, "epoch": 4976} {"train_loss": -7.292642593383789, "global_step": 208994, "epoch": 4976} {"train_loss": -7.3371782302856445, "global_step": 208995, "epoch": 4976} {"train_loss": -7.392575263977051, "global_step": 208996, "epoch": 4976} {"train_loss": -7.3555474281311035, "global_step": 208997, "epoch": 4976} {"train_loss": -7.290803909301758, "global_step": 208998, "epoch": 4976} {"train_loss": -7.3459930419921875, "global_step": 208999, "epoch": 4976} {"train_loss": -7.403380870819092, "global_step": 209000, "epoch": 4976} {"train_loss": -7.265634536743164, "global_step": 209001, "epoch": 4976} {"train_loss": -7.341877460479736, "global_step": 209002, "epoch": 4976} {"train_loss": -7.315539836883545, "global_step": 209003, "epoch": 4976} {"train_loss": -7.308590888977051, "global_step": 209004, "epoch": 4976} {"train_loss": -7.373384475708008, "global_step": 209005, "epoch": 4976} {"train_loss": -7.422215938568115, "global_step": 209006, "epoch": 4976} {"train_loss": -7.296113967895508, "global_step": 209007, "epoch": 4976} {"train_loss": -7.220641136169434, "global_step": 209008, "epoch": 4976} {"train_loss": -7.448758602142334, "global_step": 209009, "epoch": 4976} {"train_loss": -7.352860450744629, "global_step": 209010, "epoch": 4976} {"train_loss": -7.273207187652588, "global_step": 209011, "epoch": 4976} {"train_loss": -7.434159278869629, "global_step": 209012, "epoch": 4976} {"train_loss": -7.172244071960449, "global_step": 209013, "epoch": 4976} {"train_loss": -7.38160514831543, "global_step": 209014, "epoch": 4976} {"train_loss": -7.482260704040527, "global_step": 209015, "epoch": 4976} {"train_loss": -7.216897010803223, "global_step": 209016, "epoch": 4976} {"train_loss": -7.270748138427734, "global_step": 209017, "epoch": 4976} {"train_loss": -7.383993148803711, "global_step": 209018, "epoch": 4976} {"train_loss": -7.28676700592041, "global_step": 209019, "epoch": 4976} {"train_loss": -7.280230522155762, "global_step": 209020, "epoch": 4976} {"train_loss": -7.294747352600098, "global_step": 209021, "epoch": 4976} {"train_loss": -7.371387481689453, "global_step": 209022, "epoch": 4976} {"train_loss": -7.330438613891602, "global_step": 209023, "epoch": 4976} {"train_loss": -7.398415565490723, "global_step": 209024, "epoch": 4976} {"train_loss": -7.367876052856445, "global_step": 209025, "epoch": 4976} {"train_loss": -7.352588653564453, "global_step": 209026, "epoch": 4976} {"train_loss": -7.400705337524414, "global_step": 209027, "epoch": 4976} {"train_loss": -7.228969573974609, "global_step": 209028, "epoch": 4976} {"train_loss": -7.475067615509033, "global_step": 209029, "epoch": 4976} {"train_loss": -7.3437700271606445, "global_step": 209030, "epoch": 4976} {"train_loss": -7.4435014724731445, "global_step": 209031, "epoch": 4976} {"train_loss": -7.290825843811035, "global_step": 209032, "epoch": 4976} {"train_loss": -7.341073195139567, "global_step": 209033, "epoch": 4976, "val_loss": 82234.375} {"train_loss": -7.330959796905518, "global_step": 209034, "epoch": 4977} {"train_loss": -7.339634418487549, "global_step": 209035, "epoch": 4977} {"train_loss": -7.368377208709717, "global_step": 209036, "epoch": 4977} {"train_loss": -7.424861907958984, "global_step": 209037, "epoch": 4977} {"train_loss": -7.283411979675293, "global_step": 209038, "epoch": 4977} {"train_loss": -7.343083381652832, "global_step": 209039, "epoch": 4977} {"train_loss": -7.348334789276123, "global_step": 209040, "epoch": 4977} {"train_loss": -7.318082332611084, "global_step": 209041, "epoch": 4977} {"train_loss": -7.363324165344238, "global_step": 209042, "epoch": 4977} {"train_loss": -7.432345867156982, "global_step": 209043, "epoch": 4977} {"train_loss": -7.388713359832764, "global_step": 209044, "epoch": 4977} {"train_loss": -7.461416244506836, "global_step": 209045, "epoch": 4977} {"train_loss": -7.441549301147461, "global_step": 209046, "epoch": 4977} {"train_loss": -7.361913204193115, "global_step": 209047, "epoch": 4977} {"train_loss": -7.303439617156982, "global_step": 209048, "epoch": 4977} {"train_loss": -7.371473789215088, "global_step": 209049, "epoch": 4977} {"train_loss": -7.341347694396973, "global_step": 209050, "epoch": 4977} {"train_loss": -7.351215362548828, "global_step": 209051, "epoch": 4977} {"train_loss": -7.378334999084473, "global_step": 209052, "epoch": 4977} {"train_loss": -7.344448089599609, "global_step": 209053, "epoch": 4977} {"train_loss": -7.408093452453613, "global_step": 209054, "epoch": 4977} {"train_loss": -7.253294944763184, "global_step": 209055, "epoch": 4977} {"train_loss": -7.330345153808594, "global_step": 209056, "epoch": 4977} {"train_loss": -7.270169258117676, "global_step": 209057, "epoch": 4977} {"train_loss": -7.331457138061523, "global_step": 209058, "epoch": 4977} {"train_loss": -7.363881587982178, "global_step": 209059, "epoch": 4977} {"train_loss": -7.241710662841797, "global_step": 209060, "epoch": 4977} {"train_loss": -7.36379861831665, "global_step": 209061, "epoch": 4977} {"train_loss": -7.173321723937988, "global_step": 209062, "epoch": 4977} {"train_loss": -7.370149612426758, "global_step": 209063, "epoch": 4977} {"train_loss": -7.339753150939941, "global_step": 209064, "epoch": 4977} {"train_loss": -7.265965938568115, "global_step": 209065, "epoch": 4977} {"train_loss": -7.312900543212891, "global_step": 209066, "epoch": 4977} {"train_loss": -7.374222278594971, "global_step": 209067, "epoch": 4977} {"train_loss": -7.333250999450684, "global_step": 209068, "epoch": 4977} {"train_loss": -7.421945571899414, "global_step": 209069, "epoch": 4977} {"train_loss": -7.253998756408691, "global_step": 209070, "epoch": 4977} {"train_loss": -7.250777721405029, "global_step": 209071, "epoch": 4977} {"train_loss": -7.315141677856445, "global_step": 209072, "epoch": 4977} {"train_loss": -7.238666534423828, "global_step": 209073, "epoch": 4977} {"train_loss": -7.291970252990723, "global_step": 209074, "epoch": 4977} {"train_loss": -7.336590210596721, "global_step": 209075, "epoch": 4977, "val_loss": 81832.578125} {"train_loss": -7.297557353973389, "global_step": 209076, "epoch": 4978} {"train_loss": -7.331658363342285, "global_step": 209077, "epoch": 4978} {"train_loss": -7.427680015563965, "global_step": 209078, "epoch": 4978} {"train_loss": -7.36366081237793, "global_step": 209079, "epoch": 4978} {"train_loss": -7.365274429321289, "global_step": 209080, "epoch": 4978} {"train_loss": -7.262163162231445, "global_step": 209081, "epoch": 4978} {"train_loss": -7.374238967895508, "global_step": 209082, "epoch": 4978} {"train_loss": -7.327716827392578, "global_step": 209083, "epoch": 4978} {"train_loss": -7.327666282653809, "global_step": 209084, "epoch": 4978} {"train_loss": -7.340179443359375, "global_step": 209085, "epoch": 4978} {"train_loss": -7.414714813232422, "global_step": 209086, "epoch": 4978} {"train_loss": -7.354267597198486, "global_step": 209087, "epoch": 4978} {"train_loss": -7.317635536193848, "global_step": 209088, "epoch": 4978} {"train_loss": -7.47589111328125, "global_step": 209089, "epoch": 4978} {"train_loss": -7.285439491271973, "global_step": 209090, "epoch": 4978} {"train_loss": -7.296221733093262, "global_step": 209091, "epoch": 4978} {"train_loss": -7.289947032928467, "global_step": 209092, "epoch": 4978} {"train_loss": -7.344618797302246, "global_step": 209093, "epoch": 4978} {"train_loss": -7.388636112213135, "global_step": 209094, "epoch": 4978} {"train_loss": -7.469367027282715, "global_step": 209095, "epoch": 4978} {"train_loss": -7.352713584899902, "global_step": 209096, "epoch": 4978} {"train_loss": -7.390848159790039, "global_step": 209097, "epoch": 4978} {"train_loss": -7.417125701904297, "global_step": 209098, "epoch": 4978} {"train_loss": -7.408611297607422, "global_step": 209099, "epoch": 4978} {"train_loss": -7.413414001464844, "global_step": 209100, "epoch": 4978} {"train_loss": -7.428950786590576, "global_step": 209101, "epoch": 4978} {"train_loss": -7.4353227615356445, "global_step": 209102, "epoch": 4978} {"train_loss": -7.46427059173584, "global_step": 209103, "epoch": 4978} {"train_loss": -7.401976108551025, "global_step": 209104, "epoch": 4978} {"train_loss": -7.352349758148193, "global_step": 209105, "epoch": 4978} {"train_loss": -7.455455780029297, "global_step": 209106, "epoch": 4978} {"train_loss": -7.312952041625977, "global_step": 209107, "epoch": 4978} {"train_loss": -7.335268020629883, "global_step": 209108, "epoch": 4978} {"train_loss": -7.418340682983398, "global_step": 209109, "epoch": 4978} {"train_loss": -7.427915573120117, "global_step": 209110, "epoch": 4978} {"train_loss": -7.4827423095703125, "global_step": 209111, "epoch": 4978} {"train_loss": -7.268009185791016, "global_step": 209112, "epoch": 4978} {"train_loss": -7.348603248596191, "global_step": 209113, "epoch": 4978} {"train_loss": -7.322583198547363, "global_step": 209114, "epoch": 4978} {"train_loss": -7.273428916931152, "global_step": 209115, "epoch": 4978} {"train_loss": -7.326964378356934, "global_step": 209116, "epoch": 4978} {"train_loss": -7.36548173995245, "global_step": 209117, "epoch": 4978, "val_loss": 81829.5546875} {"train_loss": -7.430376052856445, "global_step": 209118, "epoch": 4979} {"train_loss": -7.4208269119262695, "global_step": 209119, "epoch": 4979} {"train_loss": -7.4253363609313965, "global_step": 209120, "epoch": 4979} {"train_loss": -7.394778251647949, "global_step": 209121, "epoch": 4979} {"train_loss": -7.309731483459473, "global_step": 209122, "epoch": 4979} {"train_loss": -7.277352333068848, "global_step": 209123, "epoch": 4979} {"train_loss": -7.342944622039795, "global_step": 209124, "epoch": 4979} {"train_loss": -7.3375701904296875, "global_step": 209125, "epoch": 4979} {"train_loss": -7.375371932983398, "global_step": 209126, "epoch": 4979} {"train_loss": -7.2516279220581055, "global_step": 209127, "epoch": 4979} {"train_loss": -7.373044013977051, "global_step": 209128, "epoch": 4979} {"train_loss": -7.458178520202637, "global_step": 209129, "epoch": 4979} {"train_loss": -7.266277313232422, "global_step": 209130, "epoch": 4979} {"train_loss": -7.3660054206848145, "global_step": 209131, "epoch": 4979} {"train_loss": -7.35433292388916, "global_step": 209132, "epoch": 4979} {"train_loss": -7.255581378936768, "global_step": 209133, "epoch": 4979} {"train_loss": -7.4770965576171875, "global_step": 209134, "epoch": 4979} {"train_loss": -7.4748945236206055, "global_step": 209135, "epoch": 4979} {"train_loss": -7.439718723297119, "global_step": 209136, "epoch": 4979} {"train_loss": -7.455380439758301, "global_step": 209137, "epoch": 4979} {"train_loss": -7.4200968742370605, "global_step": 209138, "epoch": 4979} {"train_loss": -7.369434356689453, "global_step": 209139, "epoch": 4979} {"train_loss": -7.388667106628418, "global_step": 209140, "epoch": 4979} {"train_loss": -7.370452880859375, "global_step": 209141, "epoch": 4979} {"train_loss": -7.357616901397705, "global_step": 209142, "epoch": 4979} {"train_loss": -7.4786481857299805, "global_step": 209143, "epoch": 4979} {"train_loss": -7.328299522399902, "global_step": 209144, "epoch": 4979} {"train_loss": -7.307748794555664, "global_step": 209145, "epoch": 4979} {"train_loss": -7.299979209899902, "global_step": 209146, "epoch": 4979} {"train_loss": -7.277693271636963, "global_step": 209147, "epoch": 4979} {"train_loss": -7.416965007781982, "global_step": 209148, "epoch": 4979} {"train_loss": -7.44167423248291, "global_step": 209149, "epoch": 4979} {"train_loss": -7.440445423126221, "global_step": 209150, "epoch": 4979} {"train_loss": -7.421875476837158, "global_step": 209151, "epoch": 4979} {"train_loss": -7.368386268615723, "global_step": 209152, "epoch": 4979} {"train_loss": -7.371371269226074, "global_step": 209153, "epoch": 4979} {"train_loss": -7.32697057723999, "global_step": 209154, "epoch": 4979} {"train_loss": -7.492820739746094, "global_step": 209155, "epoch": 4979} {"train_loss": -7.355454444885254, "global_step": 209156, "epoch": 4979} {"train_loss": -7.3104047775268555, "global_step": 209157, "epoch": 4979} {"train_loss": -7.415843963623047, "global_step": 209158, "epoch": 4979} {"train_loss": -7.3756321384793235, "global_step": 209159, "epoch": 4979, "val_loss": 81968.0078125} {"train_loss": -7.295228481292725, "global_step": 209160, "epoch": 4980} {"train_loss": -7.452705383300781, "global_step": 209161, "epoch": 4980} {"train_loss": -7.44135856628418, "global_step": 209162, "epoch": 4980} {"train_loss": -7.293636322021484, "global_step": 209163, "epoch": 4980} {"train_loss": -7.271205425262451, "global_step": 209164, "epoch": 4980} {"train_loss": -7.363408088684082, "global_step": 209165, "epoch": 4980} {"train_loss": -7.29091739654541, "global_step": 209166, "epoch": 4980} {"train_loss": -7.324743270874023, "global_step": 209167, "epoch": 4980} {"train_loss": -7.3873291015625, "global_step": 209168, "epoch": 4980} {"train_loss": -7.433474540710449, "global_step": 209169, "epoch": 4980} {"train_loss": -7.352447509765625, "global_step": 209170, "epoch": 4980} {"train_loss": -7.312615394592285, "global_step": 209171, "epoch": 4980} {"train_loss": -7.402966499328613, "global_step": 209172, "epoch": 4980} {"train_loss": -7.348756790161133, "global_step": 209173, "epoch": 4980} {"train_loss": -7.398144721984863, "global_step": 209174, "epoch": 4980} {"train_loss": -7.27951717376709, "global_step": 209175, "epoch": 4980} {"train_loss": -7.335621356964111, "global_step": 209176, "epoch": 4980} {"train_loss": -7.242671012878418, "global_step": 209177, "epoch": 4980} {"train_loss": -7.445716381072998, "global_step": 209178, "epoch": 4980} {"train_loss": -7.409792900085449, "global_step": 209179, "epoch": 4980} {"train_loss": -7.259160041809082, "global_step": 209180, "epoch": 4980} {"train_loss": -7.516378402709961, "global_step": 209181, "epoch": 4980} {"train_loss": -7.24505615234375, "global_step": 209182, "epoch": 4980} {"train_loss": -7.269702911376953, "global_step": 209183, "epoch": 4980} {"train_loss": -7.362745761871338, "global_step": 209184, "epoch": 4980} {"train_loss": -7.17286491394043, "global_step": 209185, "epoch": 4980} {"train_loss": -7.308490753173828, "global_step": 209186, "epoch": 4980} {"train_loss": -7.276080131530762, "global_step": 209187, "epoch": 4980} {"train_loss": -7.302072525024414, "global_step": 209188, "epoch": 4980} {"train_loss": -7.411268711090088, "global_step": 209189, "epoch": 4980} {"train_loss": -7.376276016235352, "global_step": 209190, "epoch": 4980} {"train_loss": -7.1593523025512695, "global_step": 209191, "epoch": 4980} {"train_loss": -7.380426406860352, "global_step": 209192, "epoch": 4980} {"train_loss": -7.389341354370117, "global_step": 209193, "epoch": 4980} {"train_loss": -7.171818733215332, "global_step": 209194, "epoch": 4980} {"train_loss": -7.426352500915527, "global_step": 209195, "epoch": 4980} {"train_loss": -7.235759258270264, "global_step": 209196, "epoch": 4980} {"train_loss": -7.279719352722168, "global_step": 209197, "epoch": 4980} {"train_loss": -7.3287811279296875, "global_step": 209198, "epoch": 4980} {"train_loss": -7.313839435577393, "global_step": 209199, "epoch": 4980} {"train_loss": -7.211559772491455, "global_step": 209200, "epoch": 4980} {"train_loss": -7.3273478008451915, "global_step": 209201, "epoch": 4980, "val_loss": 82014.40625} {"train_loss": -7.332246780395508, "global_step": 209202, "epoch": 4981} {"train_loss": -7.135610580444336, "global_step": 209203, "epoch": 4981} {"train_loss": -7.393726348876953, "global_step": 209204, "epoch": 4981} {"train_loss": -7.228770732879639, "global_step": 209205, "epoch": 4981} {"train_loss": -7.352317810058594, "global_step": 209206, "epoch": 4981} {"train_loss": -7.29881477355957, "global_step": 209207, "epoch": 4981} {"train_loss": -7.213201522827148, "global_step": 209208, "epoch": 4981} {"train_loss": -7.401473045349121, "global_step": 209209, "epoch": 4981} {"train_loss": -7.315971374511719, "global_step": 209210, "epoch": 4981} {"train_loss": -7.299560070037842, "global_step": 209211, "epoch": 4981} {"train_loss": -7.3387041091918945, "global_step": 209212, "epoch": 4981} {"train_loss": -7.286341667175293, "global_step": 209213, "epoch": 4981} {"train_loss": -7.42970085144043, "global_step": 209214, "epoch": 4981} {"train_loss": -7.295813083648682, "global_step": 209215, "epoch": 4981} {"train_loss": -7.334073543548584, "global_step": 209216, "epoch": 4981} {"train_loss": -7.361508369445801, "global_step": 209217, "epoch": 4981} {"train_loss": -7.4171247482299805, "global_step": 209218, "epoch": 4981} {"train_loss": -7.381464004516602, "global_step": 209219, "epoch": 4981} {"train_loss": -7.292627334594727, "global_step": 209220, "epoch": 4981} {"train_loss": -7.448368072509766, "global_step": 209221, "epoch": 4981} {"train_loss": -7.264532089233398, "global_step": 209222, "epoch": 4981} {"train_loss": -7.254951477050781, "global_step": 209223, "epoch": 4981} {"train_loss": -7.437877655029297, "global_step": 209224, "epoch": 4981} {"train_loss": -7.390155792236328, "global_step": 209225, "epoch": 4981} {"train_loss": -7.464594841003418, "global_step": 209226, "epoch": 4981} {"train_loss": -7.407709121704102, "global_step": 209227, "epoch": 4981} {"train_loss": -7.394936561584473, "global_step": 209228, "epoch": 4981} {"train_loss": -7.264510154724121, "global_step": 209229, "epoch": 4981} {"train_loss": -7.32369327545166, "global_step": 209230, "epoch": 4981} {"train_loss": -7.261524200439453, "global_step": 209231, "epoch": 4981} {"train_loss": -7.211251258850098, "global_step": 209232, "epoch": 4981} {"train_loss": -7.333220481872559, "global_step": 209233, "epoch": 4981} {"train_loss": -7.329967975616455, "global_step": 209234, "epoch": 4981} {"train_loss": -7.266043663024902, "global_step": 209235, "epoch": 4981} {"train_loss": -7.25331974029541, "global_step": 209236, "epoch": 4981} {"train_loss": -7.332028388977051, "global_step": 209237, "epoch": 4981} {"train_loss": -7.204503536224365, "global_step": 209238, "epoch": 4981} {"train_loss": -7.244651794433594, "global_step": 209239, "epoch": 4981} {"train_loss": -7.319367408752441, "global_step": 209240, "epoch": 4981} {"train_loss": -7.185626983642578, "global_step": 209241, "epoch": 4981} {"train_loss": -7.462873458862305, "global_step": 209242, "epoch": 4981} {"train_loss": -7.321337881542387, "global_step": 209243, "epoch": 4981, "val_loss": 82096.1953125} {"train_loss": -7.409822463989258, "global_step": 209244, "epoch": 4982} {"train_loss": -7.415097236633301, "global_step": 209245, "epoch": 4982} {"train_loss": -7.388775825500488, "global_step": 209246, "epoch": 4982} {"train_loss": -7.39475679397583, "global_step": 209247, "epoch": 4982} {"train_loss": -7.318713188171387, "global_step": 209248, "epoch": 4982} {"train_loss": -7.4015398025512695, "global_step": 209249, "epoch": 4982} {"train_loss": -7.443096160888672, "global_step": 209250, "epoch": 4982} {"train_loss": -7.277555465698242, "global_step": 209251, "epoch": 4982} {"train_loss": -7.457039833068848, "global_step": 209252, "epoch": 4982} {"train_loss": -7.351329803466797, "global_step": 209253, "epoch": 4982} {"train_loss": -7.278251647949219, "global_step": 209254, "epoch": 4982} {"train_loss": -7.471433639526367, "global_step": 209255, "epoch": 4982} {"train_loss": -7.354949951171875, "global_step": 209256, "epoch": 4982} {"train_loss": -7.345611572265625, "global_step": 209257, "epoch": 4982} {"train_loss": -7.454063415527344, "global_step": 209258, "epoch": 4982} {"train_loss": -7.4023518562316895, "global_step": 209259, "epoch": 4982} {"train_loss": -7.402417182922363, "global_step": 209260, "epoch": 4982} {"train_loss": -7.548473834991455, "global_step": 209261, "epoch": 4982} {"train_loss": -7.371304035186768, "global_step": 209262, "epoch": 4982} {"train_loss": -7.364320755004883, "global_step": 209263, "epoch": 4982} {"train_loss": -7.257769584655762, "global_step": 209264, "epoch": 4982} {"train_loss": -7.45896053314209, "global_step": 209265, "epoch": 4982} {"train_loss": -7.352302551269531, "global_step": 209266, "epoch": 4982} {"train_loss": -7.387420654296875, "global_step": 209267, "epoch": 4982} {"train_loss": -7.4189958572387695, "global_step": 209268, "epoch": 4982} {"train_loss": -7.306836128234863, "global_step": 209269, "epoch": 4982} {"train_loss": -7.448436737060547, "global_step": 209270, "epoch": 4982} {"train_loss": -7.407602787017822, "global_step": 209271, "epoch": 4982} {"train_loss": -7.406856536865234, "global_step": 209272, "epoch": 4982} {"train_loss": -7.40672492980957, "global_step": 209273, "epoch": 4982} {"train_loss": -7.412288665771484, "global_step": 209274, "epoch": 4982} {"train_loss": -7.326718330383301, "global_step": 209275, "epoch": 4982} {"train_loss": -7.3453369140625, "global_step": 209276, "epoch": 4982} {"train_loss": -7.425954818725586, "global_step": 209277, "epoch": 4982} {"train_loss": -7.3350982666015625, "global_step": 209278, "epoch": 4982} {"train_loss": -7.373431205749512, "global_step": 209279, "epoch": 4982} {"train_loss": -7.385382652282715, "global_step": 209280, "epoch": 4982} {"train_loss": -7.286528587341309, "global_step": 209281, "epoch": 4982} {"train_loss": -7.335427284240723, "global_step": 209282, "epoch": 4982} {"train_loss": -7.388721466064453, "global_step": 209283, "epoch": 4982} {"train_loss": -7.309572696685791, "global_step": 209284, "epoch": 4982} {"train_loss": -7.37733701297215, "global_step": 209285, "epoch": 4982, "val_loss": 81917.640625} {"train_loss": -7.240331172943115, "global_step": 209286, "epoch": 4983} {"train_loss": -7.411547660827637, "global_step": 209287, "epoch": 4983} {"train_loss": -7.331792831420898, "global_step": 209288, "epoch": 4983} {"train_loss": -7.336767196655273, "global_step": 209289, "epoch": 4983} {"train_loss": -7.272985935211182, "global_step": 209290, "epoch": 4983} {"train_loss": -7.319445610046387, "global_step": 209291, "epoch": 4983} {"train_loss": -7.414333343505859, "global_step": 209292, "epoch": 4983} {"train_loss": -7.251427173614502, "global_step": 209293, "epoch": 4983} {"train_loss": -7.450578689575195, "global_step": 209294, "epoch": 4983} {"train_loss": -7.360517978668213, "global_step": 209295, "epoch": 4983} {"train_loss": -7.405706882476807, "global_step": 209296, "epoch": 4983} {"train_loss": -7.341991901397705, "global_step": 209297, "epoch": 4983} {"train_loss": -7.338749408721924, "global_step": 209298, "epoch": 4983} {"train_loss": -7.363704681396484, "global_step": 209299, "epoch": 4983} {"train_loss": -7.417689323425293, "global_step": 209300, "epoch": 4983} {"train_loss": -7.205117702484131, "global_step": 209301, "epoch": 4983} {"train_loss": -7.422259330749512, "global_step": 209302, "epoch": 4983} {"train_loss": -7.236989974975586, "global_step": 209303, "epoch": 4983} {"train_loss": -7.3497314453125, "global_step": 209304, "epoch": 4983} {"train_loss": -7.440274715423584, "global_step": 209305, "epoch": 4983} {"train_loss": -7.356054306030273, "global_step": 209306, "epoch": 4983} {"train_loss": -7.255806922912598, "global_step": 209307, "epoch": 4983} {"train_loss": -7.370829105377197, "global_step": 209308, "epoch": 4983} {"train_loss": -7.298000335693359, "global_step": 209309, "epoch": 4983} {"train_loss": -7.3141374588012695, "global_step": 209310, "epoch": 4983} {"train_loss": -7.214105606079102, "global_step": 209311, "epoch": 4983} {"train_loss": -7.3222150802612305, "global_step": 209312, "epoch": 4983} {"train_loss": -7.378306865692139, "global_step": 209313, "epoch": 4983} {"train_loss": -7.4889068603515625, "global_step": 209314, "epoch": 4983} {"train_loss": -7.282055854797363, "global_step": 209315, "epoch": 4983} {"train_loss": -7.453734874725342, "global_step": 209316, "epoch": 4983} {"train_loss": -7.270829200744629, "global_step": 209317, "epoch": 4983} {"train_loss": -7.387202262878418, "global_step": 209318, "epoch": 4983} {"train_loss": -7.356832504272461, "global_step": 209319, "epoch": 4983} {"train_loss": -7.353728294372559, "global_step": 209320, "epoch": 4983} {"train_loss": -7.307272911071777, "global_step": 209321, "epoch": 4983} {"train_loss": -7.300743103027344, "global_step": 209322, "epoch": 4983} {"train_loss": -7.318112373352051, "global_step": 209323, "epoch": 4983} {"train_loss": -7.278817176818848, "global_step": 209324, "epoch": 4983} {"train_loss": -7.230554580688477, "global_step": 209325, "epoch": 4983} {"train_loss": -7.147238731384277, "global_step": 209326, "epoch": 4983} {"train_loss": -7.331896566209339, "global_step": 209327, "epoch": 4983, "val_loss": 82214.4609375} {"train_loss": -7.158419609069824, "global_step": 209328, "epoch": 4984} {"train_loss": -7.301719665527344, "global_step": 209329, "epoch": 4984} {"train_loss": -7.32442045211792, "global_step": 209330, "epoch": 4984} {"train_loss": -7.292992115020752, "global_step": 209331, "epoch": 4984} {"train_loss": -7.277562618255615, "global_step": 209332, "epoch": 4984} {"train_loss": -7.3551530838012695, "global_step": 209333, "epoch": 4984} {"train_loss": -7.258482933044434, "global_step": 209334, "epoch": 4984} {"train_loss": -7.307570457458496, "global_step": 209335, "epoch": 4984} {"train_loss": -7.295647621154785, "global_step": 209336, "epoch": 4984} {"train_loss": -7.276360511779785, "global_step": 209337, "epoch": 4984} {"train_loss": -7.294636249542236, "global_step": 209338, "epoch": 4984} {"train_loss": -7.321530342102051, "global_step": 209339, "epoch": 4984} {"train_loss": -7.40012264251709, "global_step": 209340, "epoch": 4984} {"train_loss": -7.370588302612305, "global_step": 209341, "epoch": 4984} {"train_loss": -7.275389194488525, "global_step": 209342, "epoch": 4984} {"train_loss": -7.336606979370117, "global_step": 209343, "epoch": 4984} {"train_loss": -7.292341232299805, "global_step": 209344, "epoch": 4984} {"train_loss": -7.3357319831848145, "global_step": 209345, "epoch": 4984} {"train_loss": -7.407324314117432, "global_step": 209346, "epoch": 4984} {"train_loss": -7.257669448852539, "global_step": 209347, "epoch": 4984} {"train_loss": -7.312168121337891, "global_step": 209348, "epoch": 4984} {"train_loss": -7.346050262451172, "global_step": 209349, "epoch": 4984} {"train_loss": -7.281411647796631, "global_step": 209350, "epoch": 4984} {"train_loss": -7.217526435852051, "global_step": 209351, "epoch": 4984} {"train_loss": -7.229745388031006, "global_step": 209352, "epoch": 4984} {"train_loss": -7.3387651443481445, "global_step": 209353, "epoch": 4984} {"train_loss": -7.351748466491699, "global_step": 209354, "epoch": 4984} {"train_loss": -7.262179851531982, "global_step": 209355, "epoch": 4984} {"train_loss": -7.199085235595703, "global_step": 209356, "epoch": 4984} {"train_loss": -7.386549949645996, "global_step": 209357, "epoch": 4984} {"train_loss": -7.388887405395508, "global_step": 209358, "epoch": 4984} {"train_loss": -7.222686290740967, "global_step": 209359, "epoch": 4984} {"train_loss": -7.324995994567871, "global_step": 209360, "epoch": 4984} {"train_loss": -7.352883338928223, "global_step": 209361, "epoch": 4984} {"train_loss": -7.364547252655029, "global_step": 209362, "epoch": 4984} {"train_loss": -7.289681434631348, "global_step": 209363, "epoch": 4984} {"train_loss": -7.335714817047119, "global_step": 209364, "epoch": 4984} {"train_loss": -7.353542327880859, "global_step": 209365, "epoch": 4984} {"train_loss": -7.380419731140137, "global_step": 209366, "epoch": 4984} {"train_loss": -7.379924774169922, "global_step": 209367, "epoch": 4984} {"train_loss": -7.449522495269775, "global_step": 209368, "epoch": 4984} {"train_loss": -7.312937566212246, "global_step": 209369, "epoch": 4984, "val_loss": 81985.6796875} {"train_loss": -7.3670501708984375, "global_step": 209370, "epoch": 4985} {"train_loss": -7.5087504386901855, "global_step": 209371, "epoch": 4985} {"train_loss": -7.376428604125977, "global_step": 209372, "epoch": 4985} {"train_loss": -7.300717353820801, "global_step": 209373, "epoch": 4985} {"train_loss": -7.564474105834961, "global_step": 209374, "epoch": 4985} {"train_loss": -7.326763153076172, "global_step": 209375, "epoch": 4985} {"train_loss": -7.435050010681152, "global_step": 209376, "epoch": 4985} {"train_loss": -7.355634689331055, "global_step": 209377, "epoch": 4985} {"train_loss": -7.348250865936279, "global_step": 209378, "epoch": 4985} {"train_loss": -7.39406156539917, "global_step": 209379, "epoch": 4985} {"train_loss": -7.429569721221924, "global_step": 209380, "epoch": 4985} {"train_loss": -7.346741676330566, "global_step": 209381, "epoch": 4985} {"train_loss": -7.408936023712158, "global_step": 209382, "epoch": 4985} {"train_loss": -7.3581438064575195, "global_step": 209383, "epoch": 4985} {"train_loss": -7.363778114318848, "global_step": 209384, "epoch": 4985} {"train_loss": -7.426080703735352, "global_step": 209385, "epoch": 4985} {"train_loss": -7.421980857849121, "global_step": 209386, "epoch": 4985} {"train_loss": -7.393429756164551, "global_step": 209387, "epoch": 4985} {"train_loss": -7.453329086303711, "global_step": 209388, "epoch": 4985} {"train_loss": -7.468963623046875, "global_step": 209389, "epoch": 4985} {"train_loss": -7.451416492462158, "global_step": 209390, "epoch": 4985} {"train_loss": -7.392251968383789, "global_step": 209391, "epoch": 4985} {"train_loss": -7.427694320678711, "global_step": 209392, "epoch": 4985} {"train_loss": -7.459522247314453, "global_step": 209393, "epoch": 4985} {"train_loss": -7.335040092468262, "global_step": 209394, "epoch": 4985} {"train_loss": -7.441887855529785, "global_step": 209395, "epoch": 4985} {"train_loss": -7.430487632751465, "global_step": 209396, "epoch": 4985} {"train_loss": -7.356807231903076, "global_step": 209397, "epoch": 4985} {"train_loss": -7.378148078918457, "global_step": 209398, "epoch": 4985} {"train_loss": -7.465528964996338, "global_step": 209399, "epoch": 4985} {"train_loss": -7.190173625946045, "global_step": 209400, "epoch": 4985} {"train_loss": -7.260665416717529, "global_step": 209401, "epoch": 4985} {"train_loss": -7.413282871246338, "global_step": 209402, "epoch": 4985} {"train_loss": -7.332717418670654, "global_step": 209403, "epoch": 4985} {"train_loss": -7.281542778015137, "global_step": 209404, "epoch": 4985} {"train_loss": -7.327442169189453, "global_step": 209405, "epoch": 4985} {"train_loss": -7.3458123207092285, "global_step": 209406, "epoch": 4985} {"train_loss": -7.235499858856201, "global_step": 209407, "epoch": 4985} {"train_loss": -7.42083740234375, "global_step": 209408, "epoch": 4985} {"train_loss": -7.396003723144531, "global_step": 209409, "epoch": 4985} {"train_loss": -7.171568870544434, "global_step": 209410, "epoch": 4985} {"train_loss": -7.378086805343628, "global_step": 209411, "epoch": 4985, "val_loss": 82257.265625} {"train_loss": -7.407130241394043, "global_step": 209412, "epoch": 4986} {"train_loss": -7.154717445373535, "global_step": 209413, "epoch": 4986} {"train_loss": -7.2893476486206055, "global_step": 209414, "epoch": 4986} {"train_loss": -7.324667453765869, "global_step": 209415, "epoch": 4986} {"train_loss": -7.233878135681152, "global_step": 209416, "epoch": 4986} {"train_loss": -7.222593784332275, "global_step": 209417, "epoch": 4986} {"train_loss": -7.365311622619629, "global_step": 209418, "epoch": 4986} {"train_loss": -7.206520080566406, "global_step": 209419, "epoch": 4986} {"train_loss": -7.214658260345459, "global_step": 209420, "epoch": 4986} {"train_loss": -7.270261764526367, "global_step": 209421, "epoch": 4986} {"train_loss": -7.24034309387207, "global_step": 209422, "epoch": 4986} {"train_loss": -7.297673225402832, "global_step": 209423, "epoch": 4986} {"train_loss": -7.238034725189209, "global_step": 209424, "epoch": 4986} {"train_loss": -7.363499641418457, "global_step": 209425, "epoch": 4986} {"train_loss": -7.1987481117248535, "global_step": 209426, "epoch": 4986} {"train_loss": -7.283747673034668, "global_step": 209427, "epoch": 4986} {"train_loss": -7.2671918869018555, "global_step": 209428, "epoch": 4986} {"train_loss": -7.369830131530762, "global_step": 209429, "epoch": 4986} {"train_loss": -7.32712459564209, "global_step": 209430, "epoch": 4986} {"train_loss": -7.257816314697266, "global_step": 209431, "epoch": 4986} {"train_loss": -7.171855926513672, "global_step": 209432, "epoch": 4986} {"train_loss": -7.184385299682617, "global_step": 209433, "epoch": 4986} {"train_loss": -7.3664045333862305, "global_step": 209434, "epoch": 4986} {"train_loss": -7.326164245605469, "global_step": 209435, "epoch": 4986} {"train_loss": -7.295449733734131, "global_step": 209436, "epoch": 4986} {"train_loss": -7.288882255554199, "global_step": 209437, "epoch": 4986} {"train_loss": -7.314234256744385, "global_step": 209438, "epoch": 4986} {"train_loss": -7.36464786529541, "global_step": 209439, "epoch": 4986} {"train_loss": -7.369309902191162, "global_step": 209440, "epoch": 4986} {"train_loss": -7.291430473327637, "global_step": 209441, "epoch": 4986} {"train_loss": -7.289546012878418, "global_step": 209442, "epoch": 4986} {"train_loss": -7.169191360473633, "global_step": 209443, "epoch": 4986} {"train_loss": -7.237420082092285, "global_step": 209444, "epoch": 4986} {"train_loss": -7.298618316650391, "global_step": 209445, "epoch": 4986} {"train_loss": -7.413276195526123, "global_step": 209446, "epoch": 4986} {"train_loss": -7.328119277954102, "global_step": 209447, "epoch": 4986} {"train_loss": -7.373631477355957, "global_step": 209448, "epoch": 4986} {"train_loss": -7.428712368011475, "global_step": 209449, "epoch": 4986} {"train_loss": -7.379661560058594, "global_step": 209450, "epoch": 4986} {"train_loss": -7.297441005706787, "global_step": 209451, "epoch": 4986} {"train_loss": -7.342576026916504, "global_step": 209452, "epoch": 4986} {"train_loss": -7.29579496383667, "global_step": 209453, "epoch": 4986, "val_loss": 81904.7890625} {"train_loss": -7.4976701736450195, "global_step": 209454, "epoch": 4987} {"train_loss": -7.445988655090332, "global_step": 209455, "epoch": 4987} {"train_loss": -7.4513092041015625, "global_step": 209456, "epoch": 4987} {"train_loss": -7.277578830718994, "global_step": 209457, "epoch": 4987} {"train_loss": -7.32429313659668, "global_step": 209458, "epoch": 4987} {"train_loss": -7.501086235046387, "global_step": 209459, "epoch": 4987} {"train_loss": -7.360384464263916, "global_step": 209460, "epoch": 4987} {"train_loss": -7.30838680267334, "global_step": 209461, "epoch": 4987} {"train_loss": -7.438486576080322, "global_step": 209462, "epoch": 4987} {"train_loss": -7.478808403015137, "global_step": 209463, "epoch": 4987} {"train_loss": -7.412130355834961, "global_step": 209464, "epoch": 4987} {"train_loss": -7.559963226318359, "global_step": 209465, "epoch": 4987} {"train_loss": -7.429686069488525, "global_step": 209466, "epoch": 4987} {"train_loss": -7.4460248947143555, "global_step": 209467, "epoch": 4987} {"train_loss": -7.4513373374938965, "global_step": 209468, "epoch": 4987} {"train_loss": -7.418482303619385, "global_step": 209469, "epoch": 4987} {"train_loss": -7.626148223876953, "global_step": 209470, "epoch": 4987} {"train_loss": -7.503359317779541, "global_step": 209471, "epoch": 4987} {"train_loss": -7.485650062561035, "global_step": 209472, "epoch": 4987} {"train_loss": -7.423908233642578, "global_step": 209473, "epoch": 4987} {"train_loss": -7.458093643188477, "global_step": 209474, "epoch": 4987} {"train_loss": -7.493250370025635, "global_step": 209475, "epoch": 4987} {"train_loss": -7.347350597381592, "global_step": 209476, "epoch": 4987} {"train_loss": -7.29076623916626, "global_step": 209477, "epoch": 4987} {"train_loss": -7.458860397338867, "global_step": 209478, "epoch": 4987} {"train_loss": -7.385426998138428, "global_step": 209479, "epoch": 4987} {"train_loss": -7.395270347595215, "global_step": 209480, "epoch": 4987} {"train_loss": -7.348212242126465, "global_step": 209481, "epoch": 4987} {"train_loss": -7.265616416931152, "global_step": 209482, "epoch": 4987} {"train_loss": -7.335672855377197, "global_step": 209483, "epoch": 4987} {"train_loss": -7.27394962310791, "global_step": 209484, "epoch": 4987} {"train_loss": -7.257053375244141, "global_step": 209485, "epoch": 4987} {"train_loss": -7.392207145690918, "global_step": 209486, "epoch": 4987} {"train_loss": -7.338253974914551, "global_step": 209487, "epoch": 4987} {"train_loss": -7.259757041931152, "global_step": 209488, "epoch": 4987} {"train_loss": -7.427799224853516, "global_step": 209489, "epoch": 4987} {"train_loss": -7.24615478515625, "global_step": 209490, "epoch": 4987} {"train_loss": -7.366371154785156, "global_step": 209491, "epoch": 4987} {"train_loss": -7.354053497314453, "global_step": 209492, "epoch": 4987} {"train_loss": -7.476037502288818, "global_step": 209493, "epoch": 4987} {"train_loss": -7.326680660247803, "global_step": 209494, "epoch": 4987} {"train_loss": -7.397632996241252, "global_step": 209495, "epoch": 4987, "val_loss": 82006.6796875} {"train_loss": -7.438857555389404, "global_step": 209496, "epoch": 4988} {"train_loss": -7.31489372253418, "global_step": 209497, "epoch": 4988} {"train_loss": -7.351815223693848, "global_step": 209498, "epoch": 4988} {"train_loss": -7.250721454620361, "global_step": 209499, "epoch": 4988} {"train_loss": -7.273826599121094, "global_step": 209500, "epoch": 4988} {"train_loss": -7.340505123138428, "global_step": 209501, "epoch": 4988} {"train_loss": -7.35209321975708, "global_step": 209502, "epoch": 4988} {"train_loss": -7.272721290588379, "global_step": 209503, "epoch": 4988} {"train_loss": -7.389181137084961, "global_step": 209504, "epoch": 4988} {"train_loss": -7.2644758224487305, "global_step": 209505, "epoch": 4988} {"train_loss": -7.232728958129883, "global_step": 209506, "epoch": 4988} {"train_loss": -7.142745018005371, "global_step": 209507, "epoch": 4988} {"train_loss": -7.186814308166504, "global_step": 209508, "epoch": 4988} {"train_loss": -7.2254838943481445, "global_step": 209509, "epoch": 4988} {"train_loss": -7.366815567016602, "global_step": 209510, "epoch": 4988} {"train_loss": -7.2639007568359375, "global_step": 209511, "epoch": 4988} {"train_loss": -7.415793418884277, "global_step": 209512, "epoch": 4988} {"train_loss": -7.214409828186035, "global_step": 209513, "epoch": 4988} {"train_loss": -7.291287422180176, "global_step": 209514, "epoch": 4988} {"train_loss": -7.434465408325195, "global_step": 209515, "epoch": 4988} {"train_loss": -7.234006881713867, "global_step": 209516, "epoch": 4988} {"train_loss": -7.322910785675049, "global_step": 209517, "epoch": 4988} {"train_loss": -7.328643798828125, "global_step": 209518, "epoch": 4988} {"train_loss": -7.359279632568359, "global_step": 209519, "epoch": 4988} {"train_loss": -7.428900718688965, "global_step": 209520, "epoch": 4988} {"train_loss": -7.360896587371826, "global_step": 209521, "epoch": 4988} {"train_loss": -7.243204116821289, "global_step": 209522, "epoch": 4988} {"train_loss": -7.237586975097656, "global_step": 209523, "epoch": 4988} {"train_loss": -7.243152618408203, "global_step": 209524, "epoch": 4988} {"train_loss": -7.425637722015381, "global_step": 209525, "epoch": 4988} {"train_loss": -7.306197643280029, "global_step": 209526, "epoch": 4988} {"train_loss": -7.381834983825684, "global_step": 209527, "epoch": 4988} {"train_loss": -7.500555038452148, "global_step": 209528, "epoch": 4988} {"train_loss": -7.3466033935546875, "global_step": 209529, "epoch": 4988} {"train_loss": -7.393697738647461, "global_step": 209530, "epoch": 4988} {"train_loss": -7.520476818084717, "global_step": 209531, "epoch": 4988} {"train_loss": -7.444993495941162, "global_step": 209532, "epoch": 4988} {"train_loss": -7.442983627319336, "global_step": 209533, "epoch": 4988} {"train_loss": -7.3918962478637695, "global_step": 209534, "epoch": 4988} {"train_loss": -7.413212299346924, "global_step": 209535, "epoch": 4988} {"train_loss": -7.494830131530762, "global_step": 209536, "epoch": 4988} {"train_loss": -7.340087754385812, "global_step": 209537, "epoch": 4988, "val_loss": 81842.3125} {"train_loss": -7.43194580078125, "global_step": 209538, "epoch": 4989} {"train_loss": -7.368276596069336, "global_step": 209539, "epoch": 4989} {"train_loss": -7.272318363189697, "global_step": 209540, "epoch": 4989} {"train_loss": -7.312463760375977, "global_step": 209541, "epoch": 4989} {"train_loss": -7.432657718658447, "global_step": 209542, "epoch": 4989} {"train_loss": -7.342507839202881, "global_step": 209543, "epoch": 4989} {"train_loss": -7.30685567855835, "global_step": 209544, "epoch": 4989} {"train_loss": -7.220053672790527, "global_step": 209545, "epoch": 4989} {"train_loss": -7.2126383781433105, "global_step": 209546, "epoch": 4989} {"train_loss": -7.340673446655273, "global_step": 209547, "epoch": 4989} {"train_loss": -7.355598449707031, "global_step": 209548, "epoch": 4989} {"train_loss": -7.351593971252441, "global_step": 209549, "epoch": 4989} {"train_loss": -7.3474273681640625, "global_step": 209550, "epoch": 4989} {"train_loss": -7.429117679595947, "global_step": 209551, "epoch": 4989} {"train_loss": -7.317716121673584, "global_step": 209552, "epoch": 4989} {"train_loss": -7.321684837341309, "global_step": 209553, "epoch": 4989} {"train_loss": -7.282049655914307, "global_step": 209554, "epoch": 4989} {"train_loss": -7.403757572174072, "global_step": 209555, "epoch": 4989} {"train_loss": -7.26368522644043, "global_step": 209556, "epoch": 4989} {"train_loss": -7.319454669952393, "global_step": 209557, "epoch": 4989} {"train_loss": -7.311495780944824, "global_step": 209558, "epoch": 4989} {"train_loss": -7.318140029907227, "global_step": 209559, "epoch": 4989} {"train_loss": -7.4427385330200195, "global_step": 209560, "epoch": 4989} {"train_loss": -7.361560821533203, "global_step": 209561, "epoch": 4989} {"train_loss": -7.335251331329346, "global_step": 209562, "epoch": 4989} {"train_loss": -7.375010013580322, "global_step": 209563, "epoch": 4989} {"train_loss": -7.3169660568237305, "global_step": 209564, "epoch": 4989} {"train_loss": -7.343909740447998, "global_step": 209565, "epoch": 4989} {"train_loss": -7.323565483093262, "global_step": 209566, "epoch": 4989} {"train_loss": -7.29736852645874, "global_step": 209567, "epoch": 4989} {"train_loss": -7.259257793426514, "global_step": 209568, "epoch": 4989} {"train_loss": -7.245898246765137, "global_step": 209569, "epoch": 4989} {"train_loss": -7.42392110824585, "global_step": 209570, "epoch": 4989} {"train_loss": -7.406153202056885, "global_step": 209571, "epoch": 4989} {"train_loss": -7.400661468505859, "global_step": 209572, "epoch": 4989} {"train_loss": -7.397197723388672, "global_step": 209573, "epoch": 4989} {"train_loss": -7.3758087158203125, "global_step": 209574, "epoch": 4989} {"train_loss": -7.316765785217285, "global_step": 209575, "epoch": 4989} {"train_loss": -7.47214412689209, "global_step": 209576, "epoch": 4989} {"train_loss": -7.3643412590026855, "global_step": 209577, "epoch": 4989} {"train_loss": -7.359681129455566, "global_step": 209578, "epoch": 4989} {"train_loss": -7.343911375318255, "global_step": 209579, "epoch": 4989, "val_loss": 81973.109375} {"train_loss": -7.405671119689941, "global_step": 209580, "epoch": 4990} {"train_loss": -7.316682815551758, "global_step": 209581, "epoch": 4990} {"train_loss": -7.3271331787109375, "global_step": 209582, "epoch": 4990} {"train_loss": -7.440911769866943, "global_step": 209583, "epoch": 4990} {"train_loss": -7.42067289352417, "global_step": 209584, "epoch": 4990} {"train_loss": -7.543041229248047, "global_step": 209585, "epoch": 4990} {"train_loss": -7.343345642089844, "global_step": 209586, "epoch": 4990} {"train_loss": -7.267380714416504, "global_step": 209587, "epoch": 4990} {"train_loss": -7.357999801635742, "global_step": 209588, "epoch": 4990} {"train_loss": -7.323300838470459, "global_step": 209589, "epoch": 4990} {"train_loss": -7.289702892303467, "global_step": 209590, "epoch": 4990} {"train_loss": -7.384109020233154, "global_step": 209591, "epoch": 4990} {"train_loss": -7.383220672607422, "global_step": 209592, "epoch": 4990} {"train_loss": -7.388453006744385, "global_step": 209593, "epoch": 4990} {"train_loss": -7.493592262268066, "global_step": 209594, "epoch": 4990} {"train_loss": -7.399774551391602, "global_step": 209595, "epoch": 4990} {"train_loss": -7.3882036209106445, "global_step": 209596, "epoch": 4990} {"train_loss": -7.4231743812561035, "global_step": 209597, "epoch": 4990} {"train_loss": -7.370939254760742, "global_step": 209598, "epoch": 4990} {"train_loss": -7.395596027374268, "global_step": 209599, "epoch": 4990} {"train_loss": -7.354928016662598, "global_step": 209600, "epoch": 4990} {"train_loss": -7.437590599060059, "global_step": 209601, "epoch": 4990} {"train_loss": -7.402597904205322, "global_step": 209602, "epoch": 4990} {"train_loss": -7.381993293762207, "global_step": 209603, "epoch": 4990} {"train_loss": -7.328075885772705, "global_step": 209604, "epoch": 4990} {"train_loss": -7.505771636962891, "global_step": 209605, "epoch": 4990} {"train_loss": -7.232725143432617, "global_step": 209606, "epoch": 4990} {"train_loss": -7.497047424316406, "global_step": 209607, "epoch": 4990} {"train_loss": -7.43399715423584, "global_step": 209608, "epoch": 4990} {"train_loss": -7.3582587242126465, "global_step": 209609, "epoch": 4990} {"train_loss": -7.456924915313721, "global_step": 209610, "epoch": 4990} {"train_loss": -7.405503273010254, "global_step": 209611, "epoch": 4990} {"train_loss": -7.386863708496094, "global_step": 209612, "epoch": 4990} {"train_loss": -7.530735492706299, "global_step": 209613, "epoch": 4990} {"train_loss": -7.402223587036133, "global_step": 209614, "epoch": 4990} {"train_loss": -7.391654968261719, "global_step": 209615, "epoch": 4990} {"train_loss": -7.331718921661377, "global_step": 209616, "epoch": 4990} {"train_loss": -7.377664566040039, "global_step": 209617, "epoch": 4990} {"train_loss": -7.318093299865723, "global_step": 209618, "epoch": 4990} {"train_loss": -7.384391784667969, "global_step": 209619, "epoch": 4990} {"train_loss": -7.2691545486450195, "global_step": 209620, "epoch": 4990} {"train_loss": -7.385768186478388, "global_step": 209621, "epoch": 4990, "val_loss": 82177.6953125} {"train_loss": -7.353842258453369, "global_step": 209622, "epoch": 4991} {"train_loss": -7.312929153442383, "global_step": 209623, "epoch": 4991} {"train_loss": -7.341203689575195, "global_step": 209624, "epoch": 4991} {"train_loss": -7.353137016296387, "global_step": 209625, "epoch": 4991} {"train_loss": -7.365949630737305, "global_step": 209626, "epoch": 4991} {"train_loss": -7.34817361831665, "global_step": 209627, "epoch": 4991} {"train_loss": -7.4314141273498535, "global_step": 209628, "epoch": 4991} {"train_loss": -7.221515655517578, "global_step": 209629, "epoch": 4991} {"train_loss": -7.3243255615234375, "global_step": 209630, "epoch": 4991} {"train_loss": -7.397019386291504, "global_step": 209631, "epoch": 4991} {"train_loss": -7.2276997566223145, "global_step": 209632, "epoch": 4991} {"train_loss": -7.400180816650391, "global_step": 209633, "epoch": 4991} {"train_loss": -7.253255844116211, "global_step": 209634, "epoch": 4991} {"train_loss": -7.343837738037109, "global_step": 209635, "epoch": 4991} {"train_loss": -7.371949195861816, "global_step": 209636, "epoch": 4991} {"train_loss": -7.394144535064697, "global_step": 209637, "epoch": 4991} {"train_loss": -7.382469177246094, "global_step": 209638, "epoch": 4991} {"train_loss": -7.328986167907715, "global_step": 209639, "epoch": 4991} {"train_loss": -7.341282844543457, "global_step": 209640, "epoch": 4991} {"train_loss": -7.276640892028809, "global_step": 209641, "epoch": 4991} {"train_loss": -7.371540069580078, "global_step": 209642, "epoch": 4991} {"train_loss": -7.312938690185547, "global_step": 209643, "epoch": 4991} {"train_loss": -7.359135627746582, "global_step": 209644, "epoch": 4991} {"train_loss": -7.428205490112305, "global_step": 209645, "epoch": 4991} {"train_loss": -7.287791728973389, "global_step": 209646, "epoch": 4991} {"train_loss": -7.286749839782715, "global_step": 209647, "epoch": 4991} {"train_loss": -7.21291971206665, "global_step": 209648, "epoch": 4991} {"train_loss": -7.217535972595215, "global_step": 209649, "epoch": 4991} {"train_loss": -7.353387832641602, "global_step": 209650, "epoch": 4991} {"train_loss": -7.265139579772949, "global_step": 209651, "epoch": 4991} {"train_loss": -7.220717906951904, "global_step": 209652, "epoch": 4991} {"train_loss": -7.275844573974609, "global_step": 209653, "epoch": 4991} {"train_loss": -7.047929763793945, "global_step": 209654, "epoch": 4991} {"train_loss": -7.234382629394531, "global_step": 209655, "epoch": 4991} {"train_loss": -7.004312515258789, "global_step": 209656, "epoch": 4991} {"train_loss": -7.274345397949219, "global_step": 209657, "epoch": 4991} {"train_loss": -7.08189058303833, "global_step": 209658, "epoch": 4991} {"train_loss": -7.283510208129883, "global_step": 209659, "epoch": 4991} {"train_loss": -7.162064075469971, "global_step": 209660, "epoch": 4991} {"train_loss": -7.057334899902344, "global_step": 209661, "epoch": 4991} {"train_loss": -7.220757484436035, "global_step": 209662, "epoch": 4991} {"train_loss": -7.283658243360973, "global_step": 209663, "epoch": 4991, "val_loss": 81917.0546875} {"train_loss": -7.281156539916992, "global_step": 209664, "epoch": 4992} {"train_loss": -7.214159965515137, "global_step": 209665, "epoch": 4992} {"train_loss": -7.2988505363464355, "global_step": 209666, "epoch": 4992} {"train_loss": -7.384130477905273, "global_step": 209667, "epoch": 4992} {"train_loss": -7.2768988609313965, "global_step": 209668, "epoch": 4992} {"train_loss": -7.234979629516602, "global_step": 209669, "epoch": 4992} {"train_loss": -7.236476898193359, "global_step": 209670, "epoch": 4992} {"train_loss": -7.370842933654785, "global_step": 209671, "epoch": 4992} {"train_loss": -7.2541704177856445, "global_step": 209672, "epoch": 4992} {"train_loss": -7.281362533569336, "global_step": 209673, "epoch": 4992} {"train_loss": -7.310395240783691, "global_step": 209674, "epoch": 4992} {"train_loss": -7.275139808654785, "global_step": 209675, "epoch": 4992} {"train_loss": -7.265614986419678, "global_step": 209676, "epoch": 4992} {"train_loss": -7.399065971374512, "global_step": 209677, "epoch": 4992} {"train_loss": -7.452486038208008, "global_step": 209678, "epoch": 4992} {"train_loss": -7.3431525230407715, "global_step": 209679, "epoch": 4992} {"train_loss": -7.390931129455566, "global_step": 209680, "epoch": 4992} {"train_loss": -7.2955121994018555, "global_step": 209681, "epoch": 4992} {"train_loss": -7.34298849105835, "global_step": 209682, "epoch": 4992} {"train_loss": -7.361380577087402, "global_step": 209683, "epoch": 4992} {"train_loss": -7.336132049560547, "global_step": 209684, "epoch": 4992} {"train_loss": -7.511919975280762, "global_step": 209685, "epoch": 4992} {"train_loss": -7.381956100463867, "global_step": 209686, "epoch": 4992} {"train_loss": -7.419198036193848, "global_step": 209687, "epoch": 4992} {"train_loss": -7.382854461669922, "global_step": 209688, "epoch": 4992} {"train_loss": -7.332230567932129, "global_step": 209689, "epoch": 4992} {"train_loss": -7.3181843757629395, "global_step": 209690, "epoch": 4992} {"train_loss": -7.253293037414551, "global_step": 209691, "epoch": 4992} {"train_loss": -7.285024642944336, "global_step": 209692, "epoch": 4992} {"train_loss": -7.356085777282715, "global_step": 209693, "epoch": 4992} {"train_loss": -7.262668609619141, "global_step": 209694, "epoch": 4992} {"train_loss": -7.352055549621582, "global_step": 209695, "epoch": 4992} {"train_loss": -7.275285243988037, "global_step": 209696, "epoch": 4992} {"train_loss": -7.361089706420898, "global_step": 209697, "epoch": 4992} {"train_loss": -7.218442916870117, "global_step": 209698, "epoch": 4992} {"train_loss": -7.290218353271484, "global_step": 209699, "epoch": 4992} {"train_loss": -7.401185512542725, "global_step": 209700, "epoch": 4992} {"train_loss": -7.2360968589782715, "global_step": 209701, "epoch": 4992} {"train_loss": -7.422842025756836, "global_step": 209702, "epoch": 4992} {"train_loss": -7.315509796142578, "global_step": 209703, "epoch": 4992} {"train_loss": -7.334367752075195, "global_step": 209704, "epoch": 4992} {"train_loss": -7.328153769175212, "global_step": 209705, "epoch": 4992, "val_loss": 81878.625} {"train_loss": -7.394430160522461, "global_step": 209706, "epoch": 4993} {"train_loss": -7.334742546081543, "global_step": 209707, "epoch": 4993} {"train_loss": -7.4134650230407715, "global_step": 209708, "epoch": 4993} {"train_loss": -7.401241302490234, "global_step": 209709, "epoch": 4993} {"train_loss": -7.274811744689941, "global_step": 209710, "epoch": 4993} {"train_loss": -7.373045921325684, "global_step": 209711, "epoch": 4993} {"train_loss": -7.358084678649902, "global_step": 209712, "epoch": 4993} {"train_loss": -7.3127546310424805, "global_step": 209713, "epoch": 4993} {"train_loss": -7.3950958251953125, "global_step": 209714, "epoch": 4993} {"train_loss": -7.233382225036621, "global_step": 209715, "epoch": 4993} {"train_loss": -7.267926216125488, "global_step": 209716, "epoch": 4993} {"train_loss": -7.382786273956299, "global_step": 209717, "epoch": 4993} {"train_loss": -7.359901428222656, "global_step": 209718, "epoch": 4993} {"train_loss": -7.235318183898926, "global_step": 209719, "epoch": 4993} {"train_loss": -7.328338623046875, "global_step": 209720, "epoch": 4993} {"train_loss": -7.456132411956787, "global_step": 209721, "epoch": 4993} {"train_loss": -7.398995876312256, "global_step": 209722, "epoch": 4993} {"train_loss": -7.395780563354492, "global_step": 209723, "epoch": 4993} {"train_loss": -7.439492225646973, "global_step": 209724, "epoch": 4993} {"train_loss": -7.377538681030273, "global_step": 209725, "epoch": 4993} {"train_loss": -7.461203098297119, "global_step": 209726, "epoch": 4993} {"train_loss": -7.4545722007751465, "global_step": 209727, "epoch": 4993} {"train_loss": -7.339452743530273, "global_step": 209728, "epoch": 4993} {"train_loss": -7.542363166809082, "global_step": 209729, "epoch": 4993} {"train_loss": -7.450170516967773, "global_step": 209730, "epoch": 4993} {"train_loss": -7.390622138977051, "global_step": 209731, "epoch": 4993} {"train_loss": -7.346368789672852, "global_step": 209732, "epoch": 4993} {"train_loss": -7.367932319641113, "global_step": 209733, "epoch": 4993} {"train_loss": -7.525331020355225, "global_step": 209734, "epoch": 4993} {"train_loss": -7.484457015991211, "global_step": 209735, "epoch": 4993} {"train_loss": -7.331987380981445, "global_step": 209736, "epoch": 4993} {"train_loss": -7.544092178344727, "global_step": 209737, "epoch": 4993} {"train_loss": -7.309629917144775, "global_step": 209738, "epoch": 4993} {"train_loss": -7.50114631652832, "global_step": 209739, "epoch": 4993} {"train_loss": -7.357762813568115, "global_step": 209740, "epoch": 4993} {"train_loss": -7.418082237243652, "global_step": 209741, "epoch": 4993} {"train_loss": -7.432025909423828, "global_step": 209742, "epoch": 4993} {"train_loss": -7.388588905334473, "global_step": 209743, "epoch": 4993} {"train_loss": -7.407295227050781, "global_step": 209744, "epoch": 4993} {"train_loss": -7.495724678039551, "global_step": 209745, "epoch": 4993} {"train_loss": -7.496883392333984, "global_step": 209746, "epoch": 4993} {"train_loss": -7.396824552899315, "global_step": 209747, "epoch": 4993, "val_loss": 82383.78125} {"train_loss": -7.398309707641602, "global_step": 209748, "epoch": 4994} {"train_loss": -7.500543594360352, "global_step": 209749, "epoch": 4994} {"train_loss": -7.37404727935791, "global_step": 209750, "epoch": 4994} {"train_loss": -7.225553512573242, "global_step": 209751, "epoch": 4994} {"train_loss": -7.402644157409668, "global_step": 209752, "epoch": 4994} {"train_loss": -7.445245742797852, "global_step": 209753, "epoch": 4994} {"train_loss": -7.005951881408691, "global_step": 209754, "epoch": 4994} {"train_loss": -7.229806900024414, "global_step": 209755, "epoch": 4994} {"train_loss": -7.497760772705078, "global_step": 209756, "epoch": 4994} {"train_loss": -6.889410972595215, "global_step": 209757, "epoch": 4994} {"train_loss": -6.828747749328613, "global_step": 209758, "epoch": 4994} {"train_loss": -7.3095598220825195, "global_step": 209759, "epoch": 4994} {"train_loss": -6.928820610046387, "global_step": 209760, "epoch": 4994} {"train_loss": -7.21596097946167, "global_step": 209761, "epoch": 4994} {"train_loss": -7.024996757507324, "global_step": 209762, "epoch": 4994} {"train_loss": -7.216529846191406, "global_step": 209763, "epoch": 4994} {"train_loss": -7.199712753295898, "global_step": 209764, "epoch": 4994} {"train_loss": -7.176088333129883, "global_step": 209765, "epoch": 4994} {"train_loss": -7.239026069641113, "global_step": 209766, "epoch": 4994} {"train_loss": -7.176469802856445, "global_step": 209767, "epoch": 4994} {"train_loss": -7.144132614135742, "global_step": 209768, "epoch": 4994} {"train_loss": -7.241911888122559, "global_step": 209769, "epoch": 4994} {"train_loss": -7.269649505615234, "global_step": 209770, "epoch": 4994} {"train_loss": -7.1971755027771, "global_step": 209771, "epoch": 4994} {"train_loss": -7.231392860412598, "global_step": 209772, "epoch": 4994} {"train_loss": -7.21112060546875, "global_step": 209773, "epoch": 4994} {"train_loss": -7.23854923248291, "global_step": 209774, "epoch": 4994} {"train_loss": -7.322849273681641, "global_step": 209775, "epoch": 4994} {"train_loss": -7.216819763183594, "global_step": 209776, "epoch": 4994} {"train_loss": -7.393562316894531, "global_step": 209777, "epoch": 4994} {"train_loss": -7.370610237121582, "global_step": 209778, "epoch": 4994} {"train_loss": -7.2857794761657715, "global_step": 209779, "epoch": 4994} {"train_loss": -7.404472351074219, "global_step": 209780, "epoch": 4994} {"train_loss": -7.283923149108887, "global_step": 209781, "epoch": 4994} {"train_loss": -7.33681058883667, "global_step": 209782, "epoch": 4994} {"train_loss": -7.377304553985596, "global_step": 209783, "epoch": 4994} {"train_loss": -7.337338924407959, "global_step": 209784, "epoch": 4994} {"train_loss": -7.450457572937012, "global_step": 209785, "epoch": 4994} {"train_loss": -7.367180824279785, "global_step": 209786, "epoch": 4994} {"train_loss": -7.368684768676758, "global_step": 209787, "epoch": 4994} {"train_loss": -7.423916816711426, "global_step": 209788, "epoch": 4994} {"train_loss": -7.2648160344078425, "global_step": 209789, "epoch": 4994, "val_loss": 81942.6328125} {"train_loss": -7.402478218078613, "global_step": 209790, "epoch": 4995} {"train_loss": -7.384485244750977, "global_step": 209791, "epoch": 4995} {"train_loss": -7.340677261352539, "global_step": 209792, "epoch": 4995} {"train_loss": -7.4671950340271, "global_step": 209793, "epoch": 4995} {"train_loss": -7.1878767013549805, "global_step": 209794, "epoch": 4995} {"train_loss": -7.361971855163574, "global_step": 209795, "epoch": 4995} {"train_loss": -7.3719940185546875, "global_step": 209796, "epoch": 4995} {"train_loss": -7.05023193359375, "global_step": 209797, "epoch": 4995} {"train_loss": -7.388526916503906, "global_step": 209798, "epoch": 4995} {"train_loss": -7.336647033691406, "global_step": 209799, "epoch": 4995} {"train_loss": -7.4245405197143555, "global_step": 209800, "epoch": 4995} {"train_loss": -7.395665645599365, "global_step": 209801, "epoch": 4995} {"train_loss": -7.394318103790283, "global_step": 209802, "epoch": 4995} {"train_loss": -7.351540565490723, "global_step": 209803, "epoch": 4995} {"train_loss": -7.394273281097412, "global_step": 209804, "epoch": 4995} {"train_loss": -7.306428909301758, "global_step": 209805, "epoch": 4995} {"train_loss": -7.3791680335998535, "global_step": 209806, "epoch": 4995} {"train_loss": -7.395843029022217, "global_step": 209807, "epoch": 4995} {"train_loss": -7.403585910797119, "global_step": 209808, "epoch": 4995} {"train_loss": -7.3300065994262695, "global_step": 209809, "epoch": 4995} {"train_loss": -7.291661262512207, "global_step": 209810, "epoch": 4995} {"train_loss": -7.4013190269470215, "global_step": 209811, "epoch": 4995} {"train_loss": -7.356490135192871, "global_step": 209812, "epoch": 4995} {"train_loss": -7.517810821533203, "global_step": 209813, "epoch": 4995} {"train_loss": -7.366946220397949, "global_step": 209814, "epoch": 4995} {"train_loss": -7.285744667053223, "global_step": 209815, "epoch": 4995} {"train_loss": -7.407616138458252, "global_step": 209816, "epoch": 4995} {"train_loss": -7.319890975952148, "global_step": 209817, "epoch": 4995} {"train_loss": -7.311034679412842, "global_step": 209818, "epoch": 4995} {"train_loss": -7.320369720458984, "global_step": 209819, "epoch": 4995} {"train_loss": -7.3131184577941895, "global_step": 209820, "epoch": 4995} {"train_loss": -7.299613952636719, "global_step": 209821, "epoch": 4995} {"train_loss": -7.325632095336914, "global_step": 209822, "epoch": 4995} {"train_loss": -7.214607238769531, "global_step": 209823, "epoch": 4995} {"train_loss": -7.311611652374268, "global_step": 209824, "epoch": 4995} {"train_loss": -7.369015216827393, "global_step": 209825, "epoch": 4995} {"train_loss": -7.256227493286133, "global_step": 209826, "epoch": 4995} {"train_loss": -7.339180946350098, "global_step": 209827, "epoch": 4995} {"train_loss": -7.322649955749512, "global_step": 209828, "epoch": 4995} {"train_loss": -7.357434272766113, "global_step": 209829, "epoch": 4995} {"train_loss": -7.334571361541748, "global_step": 209830, "epoch": 4995} {"train_loss": -7.34607762382144, "global_step": 209831, "epoch": 4995, "val_loss": 81994.1015625} {"train_loss": -7.476624488830566, "global_step": 209832, "epoch": 4996} {"train_loss": -7.375146865844727, "global_step": 209833, "epoch": 4996} {"train_loss": -7.425837993621826, "global_step": 209834, "epoch": 4996} {"train_loss": -7.49177360534668, "global_step": 209835, "epoch": 4996} {"train_loss": -7.293608665466309, "global_step": 209836, "epoch": 4996} {"train_loss": -7.359071731567383, "global_step": 209837, "epoch": 4996} {"train_loss": -7.384237289428711, "global_step": 209838, "epoch": 4996} {"train_loss": -7.417478084564209, "global_step": 209839, "epoch": 4996} {"train_loss": -7.409562587738037, "global_step": 209840, "epoch": 4996} {"train_loss": -7.563011169433594, "global_step": 209841, "epoch": 4996} {"train_loss": -7.321002006530762, "global_step": 209842, "epoch": 4996} {"train_loss": -7.398764610290527, "global_step": 209843, "epoch": 4996} {"train_loss": -7.38419771194458, "global_step": 209844, "epoch": 4996} {"train_loss": -7.363185405731201, "global_step": 209845, "epoch": 4996} {"train_loss": -7.429774284362793, "global_step": 209846, "epoch": 4996} {"train_loss": -7.387678146362305, "global_step": 209847, "epoch": 4996} {"train_loss": -7.422338485717773, "global_step": 209848, "epoch": 4996} {"train_loss": -7.407332420349121, "global_step": 209849, "epoch": 4996} {"train_loss": -7.4953293800354, "global_step": 209850, "epoch": 4996} {"train_loss": -7.534966945648193, "global_step": 209851, "epoch": 4996} {"train_loss": -7.426684856414795, "global_step": 209852, "epoch": 4996} {"train_loss": -7.349259853363037, "global_step": 209853, "epoch": 4996} {"train_loss": -7.401487350463867, "global_step": 209854, "epoch": 4996} {"train_loss": -7.521914005279541, "global_step": 209855, "epoch": 4996} {"train_loss": -7.410855770111084, "global_step": 209856, "epoch": 4996} {"train_loss": -7.3086771965026855, "global_step": 209857, "epoch": 4996} {"train_loss": -7.4247283935546875, "global_step": 209858, "epoch": 4996} {"train_loss": -7.404353618621826, "global_step": 209859, "epoch": 4996} {"train_loss": -7.374551773071289, "global_step": 209860, "epoch": 4996} {"train_loss": -7.570682525634766, "global_step": 209861, "epoch": 4996} {"train_loss": -7.4339070320129395, "global_step": 209862, "epoch": 4996} {"train_loss": -7.3895721435546875, "global_step": 209863, "epoch": 4996} {"train_loss": -7.328285217285156, "global_step": 209864, "epoch": 4996} {"train_loss": -7.4111785888671875, "global_step": 209865, "epoch": 4996} {"train_loss": -7.329162120819092, "global_step": 209866, "epoch": 4996} {"train_loss": -7.39630126953125, "global_step": 209867, "epoch": 4996} {"train_loss": -7.3548102378845215, "global_step": 209868, "epoch": 4996} {"train_loss": -7.462953567504883, "global_step": 209869, "epoch": 4996} {"train_loss": -7.3119330406188965, "global_step": 209870, "epoch": 4996} {"train_loss": -7.316914081573486, "global_step": 209871, "epoch": 4996} {"train_loss": -7.371147632598877, "global_step": 209872, "epoch": 4996} {"train_loss": -7.407703252065749, "global_step": 209873, "epoch": 4996, "val_loss": 81996.734375} {"train_loss": -7.402207374572754, "global_step": 209874, "epoch": 4997} {"train_loss": -7.3581438064575195, "global_step": 209875, "epoch": 4997} {"train_loss": -7.414994239807129, "global_step": 209876, "epoch": 4997} {"train_loss": -7.430603981018066, "global_step": 209877, "epoch": 4997} {"train_loss": -7.4061126708984375, "global_step": 209878, "epoch": 4997} {"train_loss": -7.310359001159668, "global_step": 209879, "epoch": 4997} {"train_loss": -7.318376541137695, "global_step": 209880, "epoch": 4997} {"train_loss": -7.379993438720703, "global_step": 209881, "epoch": 4997} {"train_loss": -7.304085731506348, "global_step": 209882, "epoch": 4997} {"train_loss": -7.318307876586914, "global_step": 209883, "epoch": 4997} {"train_loss": -7.344657897949219, "global_step": 209884, "epoch": 4997} {"train_loss": -7.263089179992676, "global_step": 209885, "epoch": 4997} {"train_loss": -7.36368465423584, "global_step": 209886, "epoch": 4997} {"train_loss": -7.406530380249023, "global_step": 209887, "epoch": 4997} {"train_loss": -7.3360700607299805, "global_step": 209888, "epoch": 4997} {"train_loss": -7.466128826141357, "global_step": 209889, "epoch": 4997} {"train_loss": -7.431068420410156, "global_step": 209890, "epoch": 4997} {"train_loss": -7.343268871307373, "global_step": 209891, "epoch": 4997} {"train_loss": -7.310704231262207, "global_step": 209892, "epoch": 4997} {"train_loss": -7.38871955871582, "global_step": 209893, "epoch": 4997} {"train_loss": -7.271355628967285, "global_step": 209894, "epoch": 4997} {"train_loss": -7.42789888381958, "global_step": 209895, "epoch": 4997} {"train_loss": -7.297878265380859, "global_step": 209896, "epoch": 4997} {"train_loss": -7.429290294647217, "global_step": 209897, "epoch": 4997} {"train_loss": -7.366283416748047, "global_step": 209898, "epoch": 4997} {"train_loss": -7.333995819091797, "global_step": 209899, "epoch": 4997} {"train_loss": -7.32987642288208, "global_step": 209900, "epoch": 4997} {"train_loss": -7.235355377197266, "global_step": 209901, "epoch": 4997} {"train_loss": -7.386836528778076, "global_step": 209902, "epoch": 4997} {"train_loss": -7.309082508087158, "global_step": 209903, "epoch": 4997} {"train_loss": -7.281914710998535, "global_step": 209904, "epoch": 4997} {"train_loss": -7.401939392089844, "global_step": 209905, "epoch": 4997} {"train_loss": -7.456498146057129, "global_step": 209906, "epoch": 4997} {"train_loss": -7.297473430633545, "global_step": 209907, "epoch": 4997} {"train_loss": -7.389881134033203, "global_step": 209908, "epoch": 4997} {"train_loss": -7.347713947296143, "global_step": 209909, "epoch": 4997} {"train_loss": -7.314574241638184, "global_step": 209910, "epoch": 4997} {"train_loss": -7.387930870056152, "global_step": 209911, "epoch": 4997} {"train_loss": -7.288829326629639, "global_step": 209912, "epoch": 4997} {"train_loss": -7.3235368728637695, "global_step": 209913, "epoch": 4997} {"train_loss": -7.260770320892334, "global_step": 209914, "epoch": 4997} {"train_loss": -7.352724393208821, "global_step": 209915, "epoch": 4997, "val_loss": 82282.0078125} {"train_loss": -7.390125274658203, "global_step": 209916, "epoch": 4998} {"train_loss": -7.350214958190918, "global_step": 209917, "epoch": 4998} {"train_loss": -7.327394962310791, "global_step": 209918, "epoch": 4998} {"train_loss": -7.454774856567383, "global_step": 209919, "epoch": 4998} {"train_loss": -7.216359615325928, "global_step": 209920, "epoch": 4998} {"train_loss": -7.427977561950684, "global_step": 209921, "epoch": 4998} {"train_loss": -7.35154914855957, "global_step": 209922, "epoch": 4998} {"train_loss": -7.111440658569336, "global_step": 209923, "epoch": 4998} {"train_loss": -7.359311103820801, "global_step": 209924, "epoch": 4998} {"train_loss": -7.042751312255859, "global_step": 209925, "epoch": 4998} {"train_loss": -7.289445877075195, "global_step": 209926, "epoch": 4998} {"train_loss": -7.223545551300049, "global_step": 209927, "epoch": 4998} {"train_loss": -7.356319427490234, "global_step": 209928, "epoch": 4998} {"train_loss": -7.2862701416015625, "global_step": 209929, "epoch": 4998} {"train_loss": -7.2314581871032715, "global_step": 209930, "epoch": 4998} {"train_loss": -7.348343372344971, "global_step": 209931, "epoch": 4998} {"train_loss": -7.120207786560059, "global_step": 209932, "epoch": 4998} {"train_loss": -7.405045509338379, "global_step": 209933, "epoch": 4998} {"train_loss": -7.200713157653809, "global_step": 209934, "epoch": 4998} {"train_loss": -7.287552356719971, "global_step": 209935, "epoch": 4998} {"train_loss": -6.959866046905518, "global_step": 209936, "epoch": 4998} {"train_loss": -7.28287410736084, "global_step": 209937, "epoch": 4998} {"train_loss": -7.268280982971191, "global_step": 209938, "epoch": 4998} {"train_loss": -7.245193004608154, "global_step": 209939, "epoch": 4998} {"train_loss": -7.308836460113525, "global_step": 209940, "epoch": 4998} {"train_loss": -7.177195072174072, "global_step": 209941, "epoch": 4998} {"train_loss": -7.368440628051758, "global_step": 209942, "epoch": 4998} {"train_loss": -7.116248607635498, "global_step": 209943, "epoch": 4998} {"train_loss": -7.36423921585083, "global_step": 209944, "epoch": 4998} {"train_loss": -7.1767473220825195, "global_step": 209945, "epoch": 4998} {"train_loss": -7.320437431335449, "global_step": 209946, "epoch": 4998} {"train_loss": -7.300689697265625, "global_step": 209947, "epoch": 4998} {"train_loss": -7.314865589141846, "global_step": 209948, "epoch": 4998} {"train_loss": -7.245956897735596, "global_step": 209949, "epoch": 4998} {"train_loss": -7.288848876953125, "global_step": 209950, "epoch": 4998} {"train_loss": -7.273464202880859, "global_step": 209951, "epoch": 4998} {"train_loss": -7.299441337585449, "global_step": 209952, "epoch": 4998} {"train_loss": -7.278501510620117, "global_step": 209953, "epoch": 4998} {"train_loss": -7.276881217956543, "global_step": 209954, "epoch": 4998} {"train_loss": -7.33526611328125, "global_step": 209955, "epoch": 4998} {"train_loss": -7.368034839630127, "global_step": 209956, "epoch": 4998} {"train_loss": -7.278191044217064, "global_step": 209957, "epoch": 4998, "val_loss": 82073.4609375} {"train_loss": -7.325643539428711, "global_step": 209958, "epoch": 4999} {"train_loss": -7.301533222198486, "global_step": 209959, "epoch": 4999} {"train_loss": -7.405252933502197, "global_step": 209960, "epoch": 4999} {"train_loss": -7.24941873550415, "global_step": 209961, "epoch": 4999} {"train_loss": -7.368300914764404, "global_step": 209962, "epoch": 4999} {"train_loss": -7.359782695770264, "global_step": 209963, "epoch": 4999} {"train_loss": -7.408699035644531, "global_step": 209964, "epoch": 4999} {"train_loss": -7.3634490966796875, "global_step": 209965, "epoch": 4999} {"train_loss": -7.3726372718811035, "global_step": 209966, "epoch": 4999} {"train_loss": -7.393246650695801, "global_step": 209967, "epoch": 4999} {"train_loss": -7.40981388092041, "global_step": 209968, "epoch": 4999} {"train_loss": -7.339987754821777, "global_step": 209969, "epoch": 4999} {"train_loss": -7.3495612144470215, "global_step": 209970, "epoch": 4999} {"train_loss": -7.446623802185059, "global_step": 209971, "epoch": 4999} {"train_loss": -7.315500736236572, "global_step": 209972, "epoch": 4999} {"train_loss": -7.307216167449951, "global_step": 209973, "epoch": 4999} {"train_loss": -7.374838829040527, "global_step": 209974, "epoch": 4999} {"train_loss": -7.366707801818848, "global_step": 209975, "epoch": 4999} {"train_loss": -7.362350940704346, "global_step": 209976, "epoch": 4999} {"train_loss": -7.225435256958008, "global_step": 209977, "epoch": 4999} {"train_loss": -7.539346218109131, "global_step": 209978, "epoch": 4999} {"train_loss": -7.396572113037109, "global_step": 209979, "epoch": 4999} {"train_loss": -7.350925445556641, "global_step": 209980, "epoch": 4999} {"train_loss": -7.352876663208008, "global_step": 209981, "epoch": 4999} {"train_loss": -7.261261463165283, "global_step": 209982, "epoch": 4999} {"train_loss": -7.39262580871582, "global_step": 209983, "epoch": 4999} {"train_loss": -7.440587043762207, "global_step": 209984, "epoch": 4999} {"train_loss": -7.303606986999512, "global_step": 209985, "epoch": 4999} {"train_loss": -7.423496246337891, "global_step": 209986, "epoch": 4999} {"train_loss": -7.428041934967041, "global_step": 209987, "epoch": 4999} {"train_loss": -7.3788347244262695, "global_step": 209988, "epoch": 4999} {"train_loss": -7.393436431884766, "global_step": 209989, "epoch": 4999} {"train_loss": -7.361635208129883, "global_step": 209990, "epoch": 4999} {"train_loss": -7.419245719909668, "global_step": 209991, "epoch": 4999} {"train_loss": -7.398272514343262, "global_step": 209992, "epoch": 4999} {"train_loss": -7.308721542358398, "global_step": 209993, "epoch": 4999} {"train_loss": -7.421009540557861, "global_step": 209994, "epoch": 4999} {"train_loss": -7.483498573303223, "global_step": 209995, "epoch": 4999} {"train_loss": -7.488296985626221, "global_step": 209996, "epoch": 4999} {"train_loss": -7.507359504699707, "global_step": 209997, "epoch": 4999} {"train_loss": -7.536870956420898, "global_step": 209998, "epoch": 4999} {"train_loss": -7.381417251768566, "global_step": 209999, "epoch": 4999, "val_loss": 81992.28125}